{"train_loss": 5.245512008666992, "global_step": 0, "epoch": 0} {"train_loss": 5.216174602508545, "global_step": 1, "epoch": 0} {"train_loss": 5.165977954864502, "global_step": 2, "epoch": 0} {"train_loss": 5.119240760803223, "global_step": 3, "epoch": 0} {"train_loss": 5.038236141204834, "global_step": 4, "epoch": 0} {"train_loss": 5.039923191070557, "global_step": 5, "epoch": 0} {"train_loss": 4.861958980560303, "global_step": 6, "epoch": 0} {"train_loss": 4.779827117919922, "global_step": 7, "epoch": 0} {"train_loss": 4.673827648162842, "global_step": 8, "epoch": 0} {"train_loss": 4.565244197845459, "global_step": 9, "epoch": 0} {"train_loss": 4.288028240203857, "global_step": 10, "epoch": 0} {"train_loss": 3.997525930404663, "global_step": 11, "epoch": 0} {"train_loss": 3.8203341960906982, "global_step": 12, "epoch": 0} {"train_loss": 3.438037633895874, "global_step": 13, "epoch": 0} {"train_loss": 2.9988937377929688, "global_step": 14, "epoch": 0} {"train_loss": 2.6685614585876465, "global_step": 15, "epoch": 0} {"train_loss": 1.782003402709961, "global_step": 16, "epoch": 0} {"train_loss": 1.0069551467895508, "global_step": 17, "epoch": 0} {"train_loss": 0.5781152248382568, "global_step": 18, "epoch": 0} {"train_loss": 0.5304433107376099, "global_step": 19, "epoch": 0} {"train_loss": -0.29140692949295044, "global_step": 20, "epoch": 0} {"train_loss": 0.0547107569873333, "global_step": 21, "epoch": 0} {"train_loss": -0.9246325492858887, "global_step": 22, "epoch": 0} {"train_loss": -0.26391321420669556, "global_step": 23, "epoch": 0} {"train_loss": -0.8291072249412537, "global_step": 24, "epoch": 0} {"train_loss": -1.1796470880508423, "global_step": 25, "epoch": 0} {"train_loss": -1.2078667879104614, "global_step": 26, "epoch": 0} {"train_loss": -1.1229580640792847, "global_step": 27, "epoch": 0} {"train_loss": -1.7455257177352905, "global_step": 28, "epoch": 0} {"train_loss": -1.7795099020004272, "global_step": 29, "epoch": 0} {"train_loss": -1.5415457487106323, "global_step": 30, "epoch": 0} {"train_loss": -1.6935399770736694, "global_step": 31, "epoch": 0} {"train_loss": -2.1126229763031006, "global_step": 32, "epoch": 0} {"train_loss": -2.0508646965026855, "global_step": 33, "epoch": 0} {"train_loss": -1.4859851598739624, "global_step": 34, "epoch": 0} {"train_loss": -1.8105487823486328, "global_step": 35, "epoch": 0} {"train_loss": -2.5565450191497803, "global_step": 36, "epoch": 0} {"train_loss": -2.157252550125122, "global_step": 37, "epoch": 0} {"train_loss": -2.6192429065704346, "global_step": 38, "epoch": 0} {"train_loss": -2.912889003753662, "global_step": 39, "epoch": 0} {"train_loss": -2.0447003841400146, "global_step": 40, "epoch": 0} {"train_loss": -2.9704113006591797, "global_step": 41, "epoch": 0} {"train_loss": -2.814883232116699, "global_step": 42, "epoch": 0} {"train_loss": -2.8723630905151367, "global_step": 43, "epoch": 0} {"train_loss": -2.802328586578369, "global_step": 44, "epoch": 0} {"train_loss": -2.9571120738983154, "global_step": 45, "epoch": 0} {"train_loss": -3.0627427101135254, "global_step": 46, "epoch": 0} {"train_loss": -2.7316958904266357, "global_step": 47, "epoch": 0} {"train_loss": -3.1905853748321533, "global_step": 48, "epoch": 0} {"train_loss": -2.932184934616089, "global_step": 49, "epoch": 0} {"train_loss": -3.356826066970825, "global_step": 50, "epoch": 0} {"train_loss": -3.1329681873321533, "global_step": 51, "epoch": 0} {"train_loss": -3.305799961090088, "global_step": 52, "epoch": 0} {"train_loss": -3.496124744415283, "global_step": 53, "epoch": 0} {"train_loss": -3.566418170928955, "global_step": 54, "epoch": 0} {"train_loss": -3.942418336868286, "global_step": 55, "epoch": 0} {"train_loss": -3.803619384765625, "global_step": 56, "epoch": 0} {"train_loss": -4.168084144592285, "global_step": 57, "epoch": 0} {"train_loss": -3.749927282333374, "global_step": 58, "epoch": 0} {"train_loss": -4.511647701263428, "global_step": 59, "epoch": 0} {"train_loss": -3.8649659156799316, "global_step": 60, "epoch": 0} {"train_loss": -4.555920600891113, "global_step": 61, "epoch": 0} {"train_loss": -4.736410617828369, "global_step": 62, "epoch": 0} {"train_loss": -4.7277092933654785, "global_step": 63, "epoch": 0} {"train_loss": -3.4428393840789795, "global_step": 64, "epoch": 0} {"train_loss": -4.400698661804199, "global_step": 65, "epoch": 0} {"train_loss": -4.569958686828613, "global_step": 66, "epoch": 0} {"train_loss": -4.76687479019165, "global_step": 67, "epoch": 0} {"train_loss": -4.665919780731201, "global_step": 68, "epoch": 0} {"train_loss": -5.37419319152832, "global_step": 69, "epoch": 0} {"train_loss": -5.024474620819092, "global_step": 70, "epoch": 0} {"train_loss": -5.562669277191162, "global_step": 71, "epoch": 0} {"train_loss": -4.945154666900635, "global_step": 72, "epoch": 0} {"train_loss": -5.131469249725342, "global_step": 73, "epoch": 0} {"train_loss": -5.288149356842041, "global_step": 74, "epoch": 0} {"train_loss": -5.0538482666015625, "global_step": 75, "epoch": 0} {"train_loss": -5.218358516693115, "global_step": 76, "epoch": 0} {"train_loss": -5.388396739959717, "global_step": 77, "epoch": 0} {"train_loss": -5.820241451263428, "global_step": 78, "epoch": 0} {"train_loss": -5.990048885345459, "global_step": 79, "epoch": 0} {"train_loss": -5.582648754119873, "global_step": 80, "epoch": 0} {"train_loss": -5.922059535980225, "global_step": 81, "epoch": 0} {"train_loss": -6.226694583892822, "global_step": 82, "epoch": 0} {"train_loss": -6.610739231109619, "global_step": 83, "epoch": 0} {"train_loss": -6.8632402420043945, "global_step": 84, "epoch": 0} {"train_loss": -6.935177803039551, "global_step": 85, "epoch": 0} {"train_loss": -6.7501749992370605, "global_step": 86, "epoch": 0} {"train_loss": -6.373882293701172, "global_step": 87, "epoch": 0} {"train_loss": -6.921577453613281, "global_step": 88, "epoch": 0} {"train_loss": -6.9070658683776855, "global_step": 89, "epoch": 0} {"train_loss": -7.093145847320557, "global_step": 90, "epoch": 0} {"train_loss": -7.484864711761475, "global_step": 91, "epoch": 0} {"train_loss": -7.679051876068115, "global_step": 92, "epoch": 0} {"train_loss": -8.388981819152832, "global_step": 93, "epoch": 0} {"train_loss": -7.82161283493042, "global_step": 94, "epoch": 0} {"train_loss": -8.001472473144531, "global_step": 95, "epoch": 0} {"train_loss": -8.001627922058105, "global_step": 96, "epoch": 0} {"train_loss": -7.207015514373779, "global_step": 97, "epoch": 0} {"train_loss": -4.3467278480529785, "global_step": 98, "epoch": 0} {"train_loss": -6.609555721282959, "global_step": 99, "epoch": 0} {"train_loss": -4.937417030334473, "global_step": 100, "epoch": 0} {"train_loss": -5.272505283355713, "global_step": 101, "epoch": 0} {"train_loss": -5.4913482666015625, "global_step": 102, "epoch": 0} {"train_loss": -6.113648414611816, "global_step": 103, "epoch": 0} {"train_loss": -6.225246906280518, "global_step": 104, "epoch": 0} {"train_loss": -6.929944038391113, "global_step": 105, "epoch": 0} {"train_loss": -6.457409858703613, "global_step": 106, "epoch": 0} {"train_loss": -7.016042232513428, "global_step": 107, "epoch": 0} {"train_loss": -6.955513000488281, "global_step": 108, "epoch": 0} {"train_loss": -7.114160060882568, "global_step": 109, "epoch": 0} {"train_loss": -7.321218967437744, "global_step": 110, "epoch": 0} {"train_loss": -7.70978307723999, "global_step": 111, "epoch": 0} {"train_loss": -7.883523464202881, "global_step": 112, "epoch": 0} {"train_loss": -8.52136516571045, "global_step": 113, "epoch": 0} {"train_loss": -8.846437454223633, "global_step": 114, "epoch": 0} {"train_loss": -8.821410179138184, "global_step": 115, "epoch": 0} {"train_loss": -8.33342456817627, "global_step": 116, "epoch": 0} {"train_loss": -9.524922370910645, "global_step": 117, "epoch": 0} {"train_loss": -9.120080947875977, "global_step": 118, "epoch": 0} {"train_loss": -5.270740032196045, "global_step": 119, "epoch": 0} {"train_loss": -3.2265975952210013, "global_step": 120, "epoch": 0, "train/sim_max_reward_0": 0.0, "train/sim_max_reward_1": 0.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 0.0, "test/sim_max_reward_4400000": 0.0, "test/sim_max_reward_4400001": 0.0, "test/sim_max_reward_4400002": 0.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 0.0, "test/sim_max_reward_4400005": 0.0, "test/sim_max_reward_4400006": 0.0, "test/sim_max_reward_4400007": 0.0, "test/sim_max_reward_4400008": 0.0, "test/sim_max_reward_4400009": 0.0, "test/sim_max_reward_4400010": 0.0, "test/sim_max_reward_4400011": 0.0, "test/sim_max_reward_4400012": 0.0, "test/sim_max_reward_4400013": 0.0, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 0.0, "test/sim_max_reward_4400017": 0.0, "test/sim_max_reward_4400018": 0.0, "test/sim_max_reward_4400019": 0.0, "test/sim_max_reward_4400020": 0.0, "test/sim_max_reward_4400021": 0.0, "train/mean_score": 0.0, "test/mean_score": 0.0, "val_loss": 8788441.0} {"train_loss": 2.7548699378967285, "global_step": 121, "epoch": 1} {"train_loss": -4.972243309020996, "global_step": 122, "epoch": 1} {"train_loss": -5.852839946746826, "global_step": 123, "epoch": 1} {"train_loss": -2.153432607650757, "global_step": 124, "epoch": 1} {"train_loss": -6.090178966522217, "global_step": 125, "epoch": 1} {"train_loss": -9.111366271972656, "global_step": 126, "epoch": 1} {"train_loss": -9.698451042175293, "global_step": 127, "epoch": 1} {"train_loss": -9.331888198852539, "global_step": 128, "epoch": 1} {"train_loss": -8.577170372009277, "global_step": 129, "epoch": 1} {"train_loss": -8.753166198730469, "global_step": 130, "epoch": 1} {"train_loss": -8.826827049255371, "global_step": 131, "epoch": 1} {"train_loss": -8.498664855957031, "global_step": 132, "epoch": 1} {"train_loss": -8.939112663269043, "global_step": 133, "epoch": 1} {"train_loss": -9.053790092468262, "global_step": 134, "epoch": 1} {"train_loss": -9.29614543914795, "global_step": 135, "epoch": 1} {"train_loss": -8.901843070983887, "global_step": 136, "epoch": 1} {"train_loss": -9.613512992858887, "global_step": 137, "epoch": 1} {"train_loss": -9.469267845153809, "global_step": 138, "epoch": 1} {"train_loss": -9.509981155395508, "global_step": 139, "epoch": 1} {"train_loss": -9.530204772949219, "global_step": 140, "epoch": 1} {"train_loss": -9.489378929138184, "global_step": 141, "epoch": 1} {"train_loss": -9.73423957824707, "global_step": 142, "epoch": 1} {"train_loss": -9.807096481323242, "global_step": 143, "epoch": 1} {"train_loss": -10.228545188903809, "global_step": 144, "epoch": 1} {"train_loss": -9.87352180480957, "global_step": 145, "epoch": 1} {"train_loss": -9.969945907592773, "global_step": 146, "epoch": 1} {"train_loss": -10.134292602539062, "global_step": 147, "epoch": 1} {"train_loss": -10.093125343322754, "global_step": 148, "epoch": 1} {"train_loss": -10.396719932556152, "global_step": 149, "epoch": 1} {"train_loss": -10.28016185760498, "global_step": 150, "epoch": 1} {"train_loss": -10.458134651184082, "global_step": 151, "epoch": 1} {"train_loss": -10.283945083618164, "global_step": 152, "epoch": 1} {"train_loss": -10.2960205078125, "global_step": 153, "epoch": 1} {"train_loss": -10.689621925354004, "global_step": 154, "epoch": 1} {"train_loss": -10.609402656555176, "global_step": 155, "epoch": 1} {"train_loss": -10.838580131530762, "global_step": 156, "epoch": 1} {"train_loss": -10.22038459777832, "global_step": 157, "epoch": 1} {"train_loss": -10.454747200012207, "global_step": 158, "epoch": 1} {"train_loss": -9.964111328125, "global_step": 159, "epoch": 1} {"train_loss": -10.776410102844238, "global_step": 160, "epoch": 1} {"train_loss": -10.18616771697998, "global_step": 161, "epoch": 1} {"train_loss": -10.427148818969727, "global_step": 162, "epoch": 1} {"train_loss": -10.82169246673584, "global_step": 163, "epoch": 1} {"train_loss": -10.505488395690918, "global_step": 164, "epoch": 1} {"train_loss": -11.158037185668945, "global_step": 165, "epoch": 1} {"train_loss": -11.265959739685059, "global_step": 166, "epoch": 1} {"train_loss": -10.833340644836426, "global_step": 167, "epoch": 1} {"train_loss": -10.898344993591309, "global_step": 168, "epoch": 1} {"train_loss": -10.98055362701416, "global_step": 169, "epoch": 1} {"train_loss": -10.86864948272705, "global_step": 170, "epoch": 1} {"train_loss": -11.12414836883545, "global_step": 171, "epoch": 1} {"train_loss": -11.271780967712402, "global_step": 172, "epoch": 1} {"train_loss": -11.12507152557373, "global_step": 173, "epoch": 1} {"train_loss": -11.183897972106934, "global_step": 174, "epoch": 1} {"train_loss": -11.313044548034668, "global_step": 175, "epoch": 1} {"train_loss": -11.423430442810059, "global_step": 176, "epoch": 1} {"train_loss": -11.500227928161621, "global_step": 177, "epoch": 1} {"train_loss": -10.99695873260498, "global_step": 178, "epoch": 1} {"train_loss": -11.671087265014648, "global_step": 179, "epoch": 1} {"train_loss": -11.23581600189209, "global_step": 180, "epoch": 1} {"train_loss": -11.657737731933594, "global_step": 181, "epoch": 1} {"train_loss": -11.45948600769043, "global_step": 182, "epoch": 1} {"train_loss": -11.394511222839355, "global_step": 183, "epoch": 1} {"train_loss": -11.775721549987793, "global_step": 184, "epoch": 1} {"train_loss": -11.478259086608887, "global_step": 185, "epoch": 1} {"train_loss": -12.065655708312988, "global_step": 186, "epoch": 1} {"train_loss": -11.729682922363281, "global_step": 187, "epoch": 1} {"train_loss": -12.051997184753418, "global_step": 188, "epoch": 1} {"train_loss": -11.56024169921875, "global_step": 189, "epoch": 1} {"train_loss": -11.857400894165039, "global_step": 190, "epoch": 1} {"train_loss": -11.851592063903809, "global_step": 191, "epoch": 1} {"train_loss": -12.263969421386719, "global_step": 192, "epoch": 1} {"train_loss": -11.697077751159668, "global_step": 193, "epoch": 1} {"train_loss": -12.021956443786621, "global_step": 194, "epoch": 1} {"train_loss": -12.131392478942871, "global_step": 195, "epoch": 1} {"train_loss": -12.304661750793457, "global_step": 196, "epoch": 1} {"train_loss": -12.342368125915527, "global_step": 197, "epoch": 1} {"train_loss": -12.19609546661377, "global_step": 198, "epoch": 1} {"train_loss": -12.441695213317871, "global_step": 199, "epoch": 1} {"train_loss": -11.906401634216309, "global_step": 200, "epoch": 1} {"train_loss": -12.48228645324707, "global_step": 201, "epoch": 1} {"train_loss": -12.205780982971191, "global_step": 202, "epoch": 1} {"train_loss": -12.263285636901855, "global_step": 203, "epoch": 1} {"train_loss": -12.394255638122559, "global_step": 204, "epoch": 1} {"train_loss": -12.547406196594238, "global_step": 205, "epoch": 1} {"train_loss": -12.079960823059082, "global_step": 206, "epoch": 1} {"train_loss": -12.244409561157227, "global_step": 207, "epoch": 1} {"train_loss": -12.314249992370605, "global_step": 208, "epoch": 1} {"train_loss": -12.299749374389648, "global_step": 209, "epoch": 1} {"train_loss": -11.856268882751465, "global_step": 210, "epoch": 1} {"train_loss": -12.273955345153809, "global_step": 211, "epoch": 1} {"train_loss": -12.758848190307617, "global_step": 212, "epoch": 1} {"train_loss": -12.594317436218262, "global_step": 213, "epoch": 1} {"train_loss": -12.572794914245605, "global_step": 214, "epoch": 1} {"train_loss": -12.67763900756836, "global_step": 215, "epoch": 1} {"train_loss": -12.851725578308105, "global_step": 216, "epoch": 1} {"train_loss": -12.717781066894531, "global_step": 217, "epoch": 1} {"train_loss": -12.780112266540527, "global_step": 218, "epoch": 1} {"train_loss": -12.612235069274902, "global_step": 219, "epoch": 1} {"train_loss": -12.99249267578125, "global_step": 220, "epoch": 1} {"train_loss": -12.868826866149902, "global_step": 221, "epoch": 1} {"train_loss": -12.581875801086426, "global_step": 222, "epoch": 1} {"train_loss": -13.124300956726074, "global_step": 223, "epoch": 1} {"train_loss": -12.594465255737305, "global_step": 224, "epoch": 1} {"train_loss": -12.493731498718262, "global_step": 225, "epoch": 1} {"train_loss": -12.170502662658691, "global_step": 226, "epoch": 1} {"train_loss": -12.929333686828613, "global_step": 227, "epoch": 1} {"train_loss": -12.391629219055176, "global_step": 228, "epoch": 1} {"train_loss": -13.22002124786377, "global_step": 229, "epoch": 1} {"train_loss": -12.80163288116455, "global_step": 230, "epoch": 1} {"train_loss": -13.280755996704102, "global_step": 231, "epoch": 1} {"train_loss": -13.074409484863281, "global_step": 232, "epoch": 1} {"train_loss": -13.1708402633667, "global_step": 233, "epoch": 1} {"train_loss": -13.319567680358887, "global_step": 234, "epoch": 1} {"train_loss": -13.246983528137207, "global_step": 235, "epoch": 1} {"train_loss": -13.232678413391113, "global_step": 236, "epoch": 1} {"train_loss": -13.127385139465332, "global_step": 237, "epoch": 1} {"train_loss": -13.623297691345215, "global_step": 238, "epoch": 1} {"train_loss": -13.114073753356934, "global_step": 239, "epoch": 1} {"train_loss": -13.400588989257812, "global_step": 240, "epoch": 1} {"train_loss": -11.071855807107342, "global_step": 241, "epoch": 1, "val_loss": 7737783.5} {"train_loss": -13.318102836608887, "global_step": 242, "epoch": 2} {"train_loss": -13.420554161071777, "global_step": 243, "epoch": 2} {"train_loss": -13.505942344665527, "global_step": 244, "epoch": 2} {"train_loss": -13.590489387512207, "global_step": 245, "epoch": 2} {"train_loss": -13.641426086425781, "global_step": 246, "epoch": 2} {"train_loss": -13.637377738952637, "global_step": 247, "epoch": 2} {"train_loss": -13.282025337219238, "global_step": 248, "epoch": 2} {"train_loss": -13.104205131530762, "global_step": 249, "epoch": 2} {"train_loss": -12.232099533081055, "global_step": 250, "epoch": 2} {"train_loss": -11.807371139526367, "global_step": 251, "epoch": 2} {"train_loss": -13.148917198181152, "global_step": 252, "epoch": 2} {"train_loss": -12.411685943603516, "global_step": 253, "epoch": 2} {"train_loss": -13.233139038085938, "global_step": 254, "epoch": 2} {"train_loss": -12.16739273071289, "global_step": 255, "epoch": 2} {"train_loss": -13.31963062286377, "global_step": 256, "epoch": 2} {"train_loss": -13.446560859680176, "global_step": 257, "epoch": 2} {"train_loss": -13.061210632324219, "global_step": 258, "epoch": 2} {"train_loss": -12.741141319274902, "global_step": 259, "epoch": 2} {"train_loss": -12.953102111816406, "global_step": 260, "epoch": 2} {"train_loss": -13.202624320983887, "global_step": 261, "epoch": 2} {"train_loss": -12.811816215515137, "global_step": 262, "epoch": 2} {"train_loss": -13.282889366149902, "global_step": 263, "epoch": 2} {"train_loss": -13.231352806091309, "global_step": 264, "epoch": 2} {"train_loss": -13.227624893188477, "global_step": 265, "epoch": 2} {"train_loss": -12.94571590423584, "global_step": 266, "epoch": 2} {"train_loss": -13.27507495880127, "global_step": 267, "epoch": 2} {"train_loss": -12.961163520812988, "global_step": 268, "epoch": 2} {"train_loss": -13.104220390319824, "global_step": 269, "epoch": 2} {"train_loss": -13.076628684997559, "global_step": 270, "epoch": 2} {"train_loss": -13.268463134765625, "global_step": 271, "epoch": 2} {"train_loss": -13.039810180664062, "global_step": 272, "epoch": 2} {"train_loss": -13.56571102142334, "global_step": 273, "epoch": 2} {"train_loss": -13.550668716430664, "global_step": 274, "epoch": 2} {"train_loss": -13.8095064163208, "global_step": 275, "epoch": 2} {"train_loss": -13.829968452453613, "global_step": 276, "epoch": 2} {"train_loss": -13.23357105255127, "global_step": 277, "epoch": 2} {"train_loss": -13.385775566101074, "global_step": 278, "epoch": 2} {"train_loss": -13.702143669128418, "global_step": 279, "epoch": 2} {"train_loss": -13.496728897094727, "global_step": 280, "epoch": 2} {"train_loss": -13.601208686828613, "global_step": 281, "epoch": 2} {"train_loss": -13.692730903625488, "global_step": 282, "epoch": 2} {"train_loss": -13.642041206359863, "global_step": 283, "epoch": 2} {"train_loss": -13.333498001098633, "global_step": 284, "epoch": 2} {"train_loss": -13.780364036560059, "global_step": 285, "epoch": 2} {"train_loss": -13.104159355163574, "global_step": 286, "epoch": 2} {"train_loss": -12.773329734802246, "global_step": 287, "epoch": 2} {"train_loss": -13.8267183303833, "global_step": 288, "epoch": 2} {"train_loss": -12.817631721496582, "global_step": 289, "epoch": 2} {"train_loss": -12.852679252624512, "global_step": 290, "epoch": 2} {"train_loss": -13.497448921203613, "global_step": 291, "epoch": 2} {"train_loss": -12.441817283630371, "global_step": 292, "epoch": 2} {"train_loss": -13.512763023376465, "global_step": 293, "epoch": 2} {"train_loss": -12.894533157348633, "global_step": 294, "epoch": 2} {"train_loss": -13.342299461364746, "global_step": 295, "epoch": 2} {"train_loss": -13.457803726196289, "global_step": 296, "epoch": 2} {"train_loss": -13.217241287231445, "global_step": 297, "epoch": 2} {"train_loss": -13.8313627243042, "global_step": 298, "epoch": 2} {"train_loss": -13.238382339477539, "global_step": 299, "epoch": 2} {"train_loss": -13.36164379119873, "global_step": 300, "epoch": 2} {"train_loss": -13.178210258483887, "global_step": 301, "epoch": 2} {"train_loss": -13.224334716796875, "global_step": 302, "epoch": 2} {"train_loss": -13.885171890258789, "global_step": 303, "epoch": 2} {"train_loss": -12.943611145019531, "global_step": 304, "epoch": 2} {"train_loss": -13.562830924987793, "global_step": 305, "epoch": 2} {"train_loss": -13.372952461242676, "global_step": 306, "epoch": 2} {"train_loss": -13.175392150878906, "global_step": 307, "epoch": 2} {"train_loss": -13.173715591430664, "global_step": 308, "epoch": 2} {"train_loss": -13.509726524353027, "global_step": 309, "epoch": 2} {"train_loss": -13.558316230773926, "global_step": 310, "epoch": 2} {"train_loss": -13.674899101257324, "global_step": 311, "epoch": 2} {"train_loss": -13.733589172363281, "global_step": 312, "epoch": 2} {"train_loss": -13.441168785095215, "global_step": 313, "epoch": 2} {"train_loss": -13.778474807739258, "global_step": 314, "epoch": 2} {"train_loss": -13.48380184173584, "global_step": 315, "epoch": 2} {"train_loss": -13.945940017700195, "global_step": 316, "epoch": 2} {"train_loss": -13.580679893493652, "global_step": 317, "epoch": 2} {"train_loss": -13.778765678405762, "global_step": 318, "epoch": 2} {"train_loss": -14.07501220703125, "global_step": 319, "epoch": 2} {"train_loss": -13.795099258422852, "global_step": 320, "epoch": 2} {"train_loss": -14.021075248718262, "global_step": 321, "epoch": 2} {"train_loss": -13.858453750610352, "global_step": 322, "epoch": 2} {"train_loss": -13.700156211853027, "global_step": 323, "epoch": 2} {"train_loss": -13.852897644042969, "global_step": 324, "epoch": 2} {"train_loss": -14.166699409484863, "global_step": 325, "epoch": 2} {"train_loss": -14.071657180786133, "global_step": 326, "epoch": 2} {"train_loss": -13.697369575500488, "global_step": 327, "epoch": 2} {"train_loss": -13.996563911437988, "global_step": 328, "epoch": 2} {"train_loss": -13.45318603515625, "global_step": 329, "epoch": 2} {"train_loss": -14.073138236999512, "global_step": 330, "epoch": 2} {"train_loss": -13.745819091796875, "global_step": 331, "epoch": 2} {"train_loss": -13.707391738891602, "global_step": 332, "epoch": 2} {"train_loss": -13.851678848266602, "global_step": 333, "epoch": 2} {"train_loss": -14.101816177368164, "global_step": 334, "epoch": 2} {"train_loss": -13.966229438781738, "global_step": 335, "epoch": 2} {"train_loss": -13.643460273742676, "global_step": 336, "epoch": 2} {"train_loss": -14.066192626953125, "global_step": 337, "epoch": 2} {"train_loss": -13.565821647644043, "global_step": 338, "epoch": 2} {"train_loss": -13.888710021972656, "global_step": 339, "epoch": 2} {"train_loss": -14.298338890075684, "global_step": 340, "epoch": 2} {"train_loss": -14.198298454284668, "global_step": 341, "epoch": 2} {"train_loss": -13.877931594848633, "global_step": 342, "epoch": 2} {"train_loss": -13.80212688446045, "global_step": 343, "epoch": 2} {"train_loss": -14.086860656738281, "global_step": 344, "epoch": 2} {"train_loss": -13.991838455200195, "global_step": 345, "epoch": 2} {"train_loss": -13.85893726348877, "global_step": 346, "epoch": 2} {"train_loss": -14.232782363891602, "global_step": 347, "epoch": 2} {"train_loss": -14.124234199523926, "global_step": 348, "epoch": 2} {"train_loss": -14.272948265075684, "global_step": 349, "epoch": 2} {"train_loss": -13.630075454711914, "global_step": 350, "epoch": 2} {"train_loss": -13.961546897888184, "global_step": 351, "epoch": 2} {"train_loss": -14.398581504821777, "global_step": 352, "epoch": 2} {"train_loss": -14.267654418945312, "global_step": 353, "epoch": 2} {"train_loss": -14.60172176361084, "global_step": 354, "epoch": 2} {"train_loss": -14.455451965332031, "global_step": 355, "epoch": 2} {"train_loss": -14.461504936218262, "global_step": 356, "epoch": 2} {"train_loss": -14.629195213317871, "global_step": 357, "epoch": 2} {"train_loss": -14.462233543395996, "global_step": 358, "epoch": 2} {"train_loss": -13.962160110473633, "global_step": 359, "epoch": 2} {"train_loss": -14.08313274383545, "global_step": 360, "epoch": 2} {"train_loss": -14.747912406921387, "global_step": 361, "epoch": 2} {"train_loss": -13.564069503595022, "global_step": 362, "epoch": 2, "val_loss": 7490262.5} {"train_loss": -14.058276176452637, "global_step": 363, "epoch": 3} {"train_loss": -14.100485801696777, "global_step": 364, "epoch": 3} {"train_loss": -14.105173110961914, "global_step": 365, "epoch": 3} {"train_loss": -14.551287651062012, "global_step": 366, "epoch": 3} {"train_loss": -14.64818000793457, "global_step": 367, "epoch": 3} {"train_loss": -14.376176834106445, "global_step": 368, "epoch": 3} {"train_loss": -13.990580558776855, "global_step": 369, "epoch": 3} {"train_loss": -14.187487602233887, "global_step": 370, "epoch": 3} {"train_loss": -14.416058540344238, "global_step": 371, "epoch": 3} {"train_loss": -14.045244216918945, "global_step": 372, "epoch": 3} {"train_loss": -14.083098411560059, "global_step": 373, "epoch": 3} {"train_loss": -14.968317031860352, "global_step": 374, "epoch": 3} {"train_loss": -14.220492362976074, "global_step": 375, "epoch": 3} {"train_loss": -14.403039932250977, "global_step": 376, "epoch": 3} {"train_loss": -14.411003112792969, "global_step": 377, "epoch": 3} {"train_loss": -14.085494041442871, "global_step": 378, "epoch": 3} {"train_loss": -14.026434898376465, "global_step": 379, "epoch": 3} {"train_loss": -14.4833984375, "global_step": 380, "epoch": 3} {"train_loss": -14.016125679016113, "global_step": 381, "epoch": 3} {"train_loss": -14.712915420532227, "global_step": 382, "epoch": 3} {"train_loss": -13.8670072555542, "global_step": 383, "epoch": 3} {"train_loss": -14.569548606872559, "global_step": 384, "epoch": 3} {"train_loss": -14.213457107543945, "global_step": 385, "epoch": 3} {"train_loss": -13.32182502746582, "global_step": 386, "epoch": 3} {"train_loss": -14.319681167602539, "global_step": 387, "epoch": 3} {"train_loss": -13.808722496032715, "global_step": 388, "epoch": 3} {"train_loss": -14.422186851501465, "global_step": 389, "epoch": 3} {"train_loss": -13.604876518249512, "global_step": 390, "epoch": 3} {"train_loss": -14.435210227966309, "global_step": 391, "epoch": 3} {"train_loss": -13.991644859313965, "global_step": 392, "epoch": 3} {"train_loss": -14.388030052185059, "global_step": 393, "epoch": 3} {"train_loss": -13.608932495117188, "global_step": 394, "epoch": 3} {"train_loss": -13.891632080078125, "global_step": 395, "epoch": 3} {"train_loss": -14.335789680480957, "global_step": 396, "epoch": 3} {"train_loss": -13.836051940917969, "global_step": 397, "epoch": 3} {"train_loss": -14.462678909301758, "global_step": 398, "epoch": 3} {"train_loss": -14.420672416687012, "global_step": 399, "epoch": 3} {"train_loss": -14.422119140625, "global_step": 400, "epoch": 3} {"train_loss": -14.396713256835938, "global_step": 401, "epoch": 3} {"train_loss": -14.093974113464355, "global_step": 402, "epoch": 3} {"train_loss": -14.25858211517334, "global_step": 403, "epoch": 3} {"train_loss": -14.693849563598633, "global_step": 404, "epoch": 3} {"train_loss": -14.323389053344727, "global_step": 405, "epoch": 3} {"train_loss": -14.600821495056152, "global_step": 406, "epoch": 3} {"train_loss": -14.503146171569824, "global_step": 407, "epoch": 3} {"train_loss": -14.871759414672852, "global_step": 408, "epoch": 3} {"train_loss": -14.298189163208008, "global_step": 409, "epoch": 3} {"train_loss": -14.481839179992676, "global_step": 410, "epoch": 3} {"train_loss": -14.786604881286621, "global_step": 411, "epoch": 3} {"train_loss": -14.807098388671875, "global_step": 412, "epoch": 3} {"train_loss": -14.580621719360352, "global_step": 413, "epoch": 3} {"train_loss": -14.696341514587402, "global_step": 414, "epoch": 3} {"train_loss": -14.5614595413208, "global_step": 415, "epoch": 3} {"train_loss": -14.699795722961426, "global_step": 416, "epoch": 3} {"train_loss": -14.769049644470215, "global_step": 417, "epoch": 3} {"train_loss": -14.631865501403809, "global_step": 418, "epoch": 3} {"train_loss": -14.55157470703125, "global_step": 419, "epoch": 3} {"train_loss": -14.133959770202637, "global_step": 420, "epoch": 3} {"train_loss": -14.39306354522705, "global_step": 421, "epoch": 3} {"train_loss": -14.777259826660156, "global_step": 422, "epoch": 3} {"train_loss": -14.616966247558594, "global_step": 423, "epoch": 3} {"train_loss": -14.846658706665039, "global_step": 424, "epoch": 3} {"train_loss": -14.735074043273926, "global_step": 425, "epoch": 3} {"train_loss": -14.902658462524414, "global_step": 426, "epoch": 3} {"train_loss": -14.159889221191406, "global_step": 427, "epoch": 3} {"train_loss": -14.598523139953613, "global_step": 428, "epoch": 3} {"train_loss": -14.925463676452637, "global_step": 429, "epoch": 3} {"train_loss": -14.816235542297363, "global_step": 430, "epoch": 3} {"train_loss": -14.62894344329834, "global_step": 431, "epoch": 3} {"train_loss": -14.663583755493164, "global_step": 432, "epoch": 3} {"train_loss": -14.675936698913574, "global_step": 433, "epoch": 3} {"train_loss": -14.767895698547363, "global_step": 434, "epoch": 3} {"train_loss": -14.756845474243164, "global_step": 435, "epoch": 3} {"train_loss": -14.881909370422363, "global_step": 436, "epoch": 3} {"train_loss": -14.954068183898926, "global_step": 437, "epoch": 3} {"train_loss": -14.501864433288574, "global_step": 438, "epoch": 3} {"train_loss": -15.049239158630371, "global_step": 439, "epoch": 3} {"train_loss": -15.263620376586914, "global_step": 440, "epoch": 3} {"train_loss": -14.790979385375977, "global_step": 441, "epoch": 3} {"train_loss": -15.090802192687988, "global_step": 442, "epoch": 3} {"train_loss": -14.774518013000488, "global_step": 443, "epoch": 3} {"train_loss": -14.915310859680176, "global_step": 444, "epoch": 3} {"train_loss": -14.604277610778809, "global_step": 445, "epoch": 3} {"train_loss": -14.833101272583008, "global_step": 446, "epoch": 3} {"train_loss": -15.032096862792969, "global_step": 447, "epoch": 3} {"train_loss": -14.797404289245605, "global_step": 448, "epoch": 3} {"train_loss": -14.488598823547363, "global_step": 449, "epoch": 3} {"train_loss": -14.880279541015625, "global_step": 450, "epoch": 3} {"train_loss": -14.783343315124512, "global_step": 451, "epoch": 3} {"train_loss": -14.941824913024902, "global_step": 452, "epoch": 3} {"train_loss": -14.876322746276855, "global_step": 453, "epoch": 3} {"train_loss": -14.748751640319824, "global_step": 454, "epoch": 3} {"train_loss": -13.738540649414062, "global_step": 455, "epoch": 3} {"train_loss": -14.385406494140625, "global_step": 456, "epoch": 3} {"train_loss": -14.791682243347168, "global_step": 457, "epoch": 3} {"train_loss": -14.496963500976562, "global_step": 458, "epoch": 3} {"train_loss": -14.752812385559082, "global_step": 459, "epoch": 3} {"train_loss": -14.982858657836914, "global_step": 460, "epoch": 3} {"train_loss": -14.961215019226074, "global_step": 461, "epoch": 3} {"train_loss": -14.854578018188477, "global_step": 462, "epoch": 3} {"train_loss": -14.590718269348145, "global_step": 463, "epoch": 3} {"train_loss": -15.015731811523438, "global_step": 464, "epoch": 3} {"train_loss": -14.719720840454102, "global_step": 465, "epoch": 3} {"train_loss": -15.0530424118042, "global_step": 466, "epoch": 3} {"train_loss": -14.801745414733887, "global_step": 467, "epoch": 3} {"train_loss": -14.558051109313965, "global_step": 468, "epoch": 3} {"train_loss": -14.635968208312988, "global_step": 469, "epoch": 3} {"train_loss": -14.631851196289062, "global_step": 470, "epoch": 3} {"train_loss": -14.607245445251465, "global_step": 471, "epoch": 3} {"train_loss": -14.740968704223633, "global_step": 472, "epoch": 3} {"train_loss": -13.711511611938477, "global_step": 473, "epoch": 3} {"train_loss": -14.657111167907715, "global_step": 474, "epoch": 3} {"train_loss": -14.792686462402344, "global_step": 475, "epoch": 3} {"train_loss": -14.482294082641602, "global_step": 476, "epoch": 3} {"train_loss": -14.778056144714355, "global_step": 477, "epoch": 3} {"train_loss": -14.501635551452637, "global_step": 478, "epoch": 3} {"train_loss": -15.143275260925293, "global_step": 479, "epoch": 3} {"train_loss": -14.238763809204102, "global_step": 480, "epoch": 3} {"train_loss": -15.112375259399414, "global_step": 481, "epoch": 3} {"train_loss": -14.787826538085938, "global_step": 482, "epoch": 3} {"train_loss": -14.535705227497196, "global_step": 483, "epoch": 3, "val_loss": 5531136.0} {"train_loss": -14.655145645141602, "global_step": 484, "epoch": 4} {"train_loss": -15.19111156463623, "global_step": 485, "epoch": 4} {"train_loss": -14.860974311828613, "global_step": 486, "epoch": 4} {"train_loss": -15.202258110046387, "global_step": 487, "epoch": 4} {"train_loss": -15.152239799499512, "global_step": 488, "epoch": 4} {"train_loss": -15.298590660095215, "global_step": 489, "epoch": 4} {"train_loss": -15.0960111618042, "global_step": 490, "epoch": 4} {"train_loss": -15.273640632629395, "global_step": 491, "epoch": 4} {"train_loss": -15.061180114746094, "global_step": 492, "epoch": 4} {"train_loss": -14.88425350189209, "global_step": 493, "epoch": 4} {"train_loss": -14.83580207824707, "global_step": 494, "epoch": 4} {"train_loss": -14.868059158325195, "global_step": 495, "epoch": 4} {"train_loss": -15.367456436157227, "global_step": 496, "epoch": 4} {"train_loss": -14.963900566101074, "global_step": 497, "epoch": 4} {"train_loss": -15.06480884552002, "global_step": 498, "epoch": 4} {"train_loss": -15.025118827819824, "global_step": 499, "epoch": 4} {"train_loss": -15.077006340026855, "global_step": 500, "epoch": 4} {"train_loss": -14.917546272277832, "global_step": 501, "epoch": 4} {"train_loss": -15.619765281677246, "global_step": 502, "epoch": 4} {"train_loss": -15.234625816345215, "global_step": 503, "epoch": 4} {"train_loss": -14.77637767791748, "global_step": 504, "epoch": 4} {"train_loss": -14.961468696594238, "global_step": 505, "epoch": 4} {"train_loss": -15.248605728149414, "global_step": 506, "epoch": 4} {"train_loss": -15.165507316589355, "global_step": 507, "epoch": 4} {"train_loss": -15.060455322265625, "global_step": 508, "epoch": 4} {"train_loss": -14.821810722351074, "global_step": 509, "epoch": 4} {"train_loss": -14.793708801269531, "global_step": 510, "epoch": 4} {"train_loss": -14.931197166442871, "global_step": 511, "epoch": 4} {"train_loss": -14.92230224609375, "global_step": 512, "epoch": 4} {"train_loss": -14.713106155395508, "global_step": 513, "epoch": 4} {"train_loss": -14.597460746765137, "global_step": 514, "epoch": 4} {"train_loss": -15.019177436828613, "global_step": 515, "epoch": 4} {"train_loss": -14.971900939941406, "global_step": 516, "epoch": 4} {"train_loss": -14.352569580078125, "global_step": 517, "epoch": 4} {"train_loss": -15.314764976501465, "global_step": 518, "epoch": 4} {"train_loss": -14.922914505004883, "global_step": 519, "epoch": 4} {"train_loss": -14.523241996765137, "global_step": 520, "epoch": 4} {"train_loss": -15.549598693847656, "global_step": 521, "epoch": 4} {"train_loss": -14.995002746582031, "global_step": 522, "epoch": 4} {"train_loss": -15.494157791137695, "global_step": 523, "epoch": 4} {"train_loss": -15.20682430267334, "global_step": 524, "epoch": 4} {"train_loss": -15.09995174407959, "global_step": 525, "epoch": 4} {"train_loss": -15.102747917175293, "global_step": 526, "epoch": 4} {"train_loss": -15.007957458496094, "global_step": 527, "epoch": 4} {"train_loss": -15.236117362976074, "global_step": 528, "epoch": 4} {"train_loss": -14.911044120788574, "global_step": 529, "epoch": 4} {"train_loss": -15.19024658203125, "global_step": 530, "epoch": 4} {"train_loss": -15.414694786071777, "global_step": 531, "epoch": 4} {"train_loss": -14.52537727355957, "global_step": 532, "epoch": 4} {"train_loss": -15.29443645477295, "global_step": 533, "epoch": 4} {"train_loss": -14.940912246704102, "global_step": 534, "epoch": 4} {"train_loss": -15.358960151672363, "global_step": 535, "epoch": 4} {"train_loss": -14.522831916809082, "global_step": 536, "epoch": 4} {"train_loss": -15.345282554626465, "global_step": 537, "epoch": 4} {"train_loss": -15.011517524719238, "global_step": 538, "epoch": 4} {"train_loss": -15.13037109375, "global_step": 539, "epoch": 4} {"train_loss": -15.266324043273926, "global_step": 540, "epoch": 4} {"train_loss": -15.167281150817871, "global_step": 541, "epoch": 4} {"train_loss": -15.245955467224121, "global_step": 542, "epoch": 4} {"train_loss": -15.624541282653809, "global_step": 543, "epoch": 4} {"train_loss": -14.80059814453125, "global_step": 544, "epoch": 4} {"train_loss": -15.289801597595215, "global_step": 545, "epoch": 4} {"train_loss": -15.220343589782715, "global_step": 546, "epoch": 4} {"train_loss": -15.005602836608887, "global_step": 547, "epoch": 4} {"train_loss": -15.193216323852539, "global_step": 548, "epoch": 4} {"train_loss": -15.191354751586914, "global_step": 549, "epoch": 4} {"train_loss": -15.20993709564209, "global_step": 550, "epoch": 4} {"train_loss": -15.634050369262695, "global_step": 551, "epoch": 4} {"train_loss": -15.330668449401855, "global_step": 552, "epoch": 4} {"train_loss": -15.498059272766113, "global_step": 553, "epoch": 4} {"train_loss": -15.322748184204102, "global_step": 554, "epoch": 4} {"train_loss": -15.310348510742188, "global_step": 555, "epoch": 4} {"train_loss": -15.192639350891113, "global_step": 556, "epoch": 4} {"train_loss": -15.704272270202637, "global_step": 557, "epoch": 4} {"train_loss": -15.565524101257324, "global_step": 558, "epoch": 4} {"train_loss": -14.821463584899902, "global_step": 559, "epoch": 4} {"train_loss": -15.249542236328125, "global_step": 560, "epoch": 4} {"train_loss": -15.251385688781738, "global_step": 561, "epoch": 4} {"train_loss": -15.060864448547363, "global_step": 562, "epoch": 4} {"train_loss": -15.510528564453125, "global_step": 563, "epoch": 4} {"train_loss": -15.76159381866455, "global_step": 564, "epoch": 4} {"train_loss": -15.219347953796387, "global_step": 565, "epoch": 4} {"train_loss": -15.63737678527832, "global_step": 566, "epoch": 4} {"train_loss": -15.154647827148438, "global_step": 567, "epoch": 4} {"train_loss": -15.370190620422363, "global_step": 568, "epoch": 4} {"train_loss": -15.478248596191406, "global_step": 569, "epoch": 4} {"train_loss": -15.429022789001465, "global_step": 570, "epoch": 4} {"train_loss": -15.388031005859375, "global_step": 571, "epoch": 4} {"train_loss": -15.822043418884277, "global_step": 572, "epoch": 4} {"train_loss": -15.005462646484375, "global_step": 573, "epoch": 4} {"train_loss": -14.91614055633545, "global_step": 574, "epoch": 4} {"train_loss": -14.821866035461426, "global_step": 575, "epoch": 4} {"train_loss": -15.657076835632324, "global_step": 576, "epoch": 4} {"train_loss": -15.551012992858887, "global_step": 577, "epoch": 4} {"train_loss": -15.280062675476074, "global_step": 578, "epoch": 4} {"train_loss": -15.22120189666748, "global_step": 579, "epoch": 4} {"train_loss": -15.305070877075195, "global_step": 580, "epoch": 4} {"train_loss": -15.075225830078125, "global_step": 581, "epoch": 4} {"train_loss": -15.107828140258789, "global_step": 582, "epoch": 4} {"train_loss": -14.7912015914917, "global_step": 583, "epoch": 4} {"train_loss": -15.143994331359863, "global_step": 584, "epoch": 4} {"train_loss": -15.114425659179688, "global_step": 585, "epoch": 4} {"train_loss": -15.029304504394531, "global_step": 586, "epoch": 4} {"train_loss": -14.869882583618164, "global_step": 587, "epoch": 4} {"train_loss": -15.144183158874512, "global_step": 588, "epoch": 4} {"train_loss": -15.20744800567627, "global_step": 589, "epoch": 4} {"train_loss": -14.701918601989746, "global_step": 590, "epoch": 4} {"train_loss": -15.224527359008789, "global_step": 591, "epoch": 4} {"train_loss": -15.199075698852539, "global_step": 592, "epoch": 4} {"train_loss": -15.328219413757324, "global_step": 593, "epoch": 4} {"train_loss": -15.261102676391602, "global_step": 594, "epoch": 4} {"train_loss": -15.238776206970215, "global_step": 595, "epoch": 4} {"train_loss": -15.347447395324707, "global_step": 596, "epoch": 4} {"train_loss": -15.182413101196289, "global_step": 597, "epoch": 4} {"train_loss": -15.20167064666748, "global_step": 598, "epoch": 4} {"train_loss": -15.010968208312988, "global_step": 599, "epoch": 4} {"train_loss": -14.935896873474121, "global_step": 600, "epoch": 4} {"train_loss": -15.3850736618042, "global_step": 601, "epoch": 4} {"train_loss": -14.537367820739746, "global_step": 602, "epoch": 4} {"train_loss": -15.136154174804688, "global_step": 603, "epoch": 4} {"train_loss": -15.139979803857724, "global_step": 604, "epoch": 4, "val_loss": 3939266.25} {"train_loss": -14.946313858032227, "global_step": 605, "epoch": 5} {"train_loss": -14.955514907836914, "global_step": 606, "epoch": 5} {"train_loss": -15.229843139648438, "global_step": 607, "epoch": 5} {"train_loss": -15.17639446258545, "global_step": 608, "epoch": 5} {"train_loss": -15.217439651489258, "global_step": 609, "epoch": 5} {"train_loss": -15.529268264770508, "global_step": 610, "epoch": 5} {"train_loss": -14.998756408691406, "global_step": 611, "epoch": 5} {"train_loss": -15.546317100524902, "global_step": 612, "epoch": 5} {"train_loss": -15.228471755981445, "global_step": 613, "epoch": 5} {"train_loss": -15.556802749633789, "global_step": 614, "epoch": 5} {"train_loss": -15.309332847595215, "global_step": 615, "epoch": 5} {"train_loss": -15.366000175476074, "global_step": 616, "epoch": 5} {"train_loss": -15.46146297454834, "global_step": 617, "epoch": 5} {"train_loss": -15.122637748718262, "global_step": 618, "epoch": 5} {"train_loss": -15.193527221679688, "global_step": 619, "epoch": 5} {"train_loss": -15.787701606750488, "global_step": 620, "epoch": 5} {"train_loss": -15.706400871276855, "global_step": 621, "epoch": 5} {"train_loss": -14.85636043548584, "global_step": 622, "epoch": 5} {"train_loss": -15.311233520507812, "global_step": 623, "epoch": 5} {"train_loss": -15.713920593261719, "global_step": 624, "epoch": 5} {"train_loss": -15.168693542480469, "global_step": 625, "epoch": 5} {"train_loss": -13.943316459655762, "global_step": 626, "epoch": 5} {"train_loss": -12.544902801513672, "global_step": 627, "epoch": 5} {"train_loss": -13.766730308532715, "global_step": 628, "epoch": 5} {"train_loss": -15.051971435546875, "global_step": 629, "epoch": 5} {"train_loss": -14.998553276062012, "global_step": 630, "epoch": 5} {"train_loss": -13.874399185180664, "global_step": 631, "epoch": 5} {"train_loss": -14.733369827270508, "global_step": 632, "epoch": 5} {"train_loss": -15.411849975585938, "global_step": 633, "epoch": 5} {"train_loss": -14.733120918273926, "global_step": 634, "epoch": 5} {"train_loss": -14.629547119140625, "global_step": 635, "epoch": 5} {"train_loss": -14.696413040161133, "global_step": 636, "epoch": 5} {"train_loss": -14.591781616210938, "global_step": 637, "epoch": 5} {"train_loss": -14.73498249053955, "global_step": 638, "epoch": 5} {"train_loss": -14.556258201599121, "global_step": 639, "epoch": 5} {"train_loss": -14.804797172546387, "global_step": 640, "epoch": 5} {"train_loss": -14.705408096313477, "global_step": 641, "epoch": 5} {"train_loss": -14.681431770324707, "global_step": 642, "epoch": 5} {"train_loss": -14.655890464782715, "global_step": 643, "epoch": 5} {"train_loss": -14.885223388671875, "global_step": 644, "epoch": 5} {"train_loss": -15.248214721679688, "global_step": 645, "epoch": 5} {"train_loss": -15.132669448852539, "global_step": 646, "epoch": 5} {"train_loss": -14.970221519470215, "global_step": 647, "epoch": 5} {"train_loss": -15.01941967010498, "global_step": 648, "epoch": 5} {"train_loss": -14.799646377563477, "global_step": 649, "epoch": 5} {"train_loss": -15.02696418762207, "global_step": 650, "epoch": 5} {"train_loss": -15.024243354797363, "global_step": 651, "epoch": 5} {"train_loss": -14.485359191894531, "global_step": 652, "epoch": 5} {"train_loss": -15.116497993469238, "global_step": 653, "epoch": 5} {"train_loss": -15.201828002929688, "global_step": 654, "epoch": 5} {"train_loss": -14.885340690612793, "global_step": 655, "epoch": 5} {"train_loss": -15.223971366882324, "global_step": 656, "epoch": 5} {"train_loss": -15.437458992004395, "global_step": 657, "epoch": 5} {"train_loss": -15.162284851074219, "global_step": 658, "epoch": 5} {"train_loss": -15.292734146118164, "global_step": 659, "epoch": 5} {"train_loss": -15.418431282043457, "global_step": 660, "epoch": 5} {"train_loss": -15.37717342376709, "global_step": 661, "epoch": 5} {"train_loss": -15.697131156921387, "global_step": 662, "epoch": 5} {"train_loss": -15.324225425720215, "global_step": 663, "epoch": 5} {"train_loss": -15.27685260772705, "global_step": 664, "epoch": 5} {"train_loss": -15.728639602661133, "global_step": 665, "epoch": 5} {"train_loss": -15.566256523132324, "global_step": 666, "epoch": 5} {"train_loss": -15.810652732849121, "global_step": 667, "epoch": 5} {"train_loss": -15.40778636932373, "global_step": 668, "epoch": 5} {"train_loss": -15.689126968383789, "global_step": 669, "epoch": 5} {"train_loss": -15.629385948181152, "global_step": 670, "epoch": 5} {"train_loss": -15.395285606384277, "global_step": 671, "epoch": 5} {"train_loss": -15.665796279907227, "global_step": 672, "epoch": 5} {"train_loss": -15.663657188415527, "global_step": 673, "epoch": 5} {"train_loss": -15.33592700958252, "global_step": 674, "epoch": 5} {"train_loss": -15.607437133789062, "global_step": 675, "epoch": 5} {"train_loss": -15.381820678710938, "global_step": 676, "epoch": 5} {"train_loss": -15.688898086547852, "global_step": 677, "epoch": 5} {"train_loss": -15.157648086547852, "global_step": 678, "epoch": 5} {"train_loss": -15.538416862487793, "global_step": 679, "epoch": 5} {"train_loss": -15.430567741394043, "global_step": 680, "epoch": 5} {"train_loss": -15.101938247680664, "global_step": 681, "epoch": 5} {"train_loss": -14.441118240356445, "global_step": 682, "epoch": 5} {"train_loss": -15.805729866027832, "global_step": 683, "epoch": 5} {"train_loss": -14.869089126586914, "global_step": 684, "epoch": 5} {"train_loss": -15.519350051879883, "global_step": 685, "epoch": 5} {"train_loss": -14.761240005493164, "global_step": 686, "epoch": 5} {"train_loss": -15.2303466796875, "global_step": 687, "epoch": 5} {"train_loss": -14.765151023864746, "global_step": 688, "epoch": 5} {"train_loss": -15.168070793151855, "global_step": 689, "epoch": 5} {"train_loss": -14.6012544631958, "global_step": 690, "epoch": 5} {"train_loss": -15.139439582824707, "global_step": 691, "epoch": 5} {"train_loss": -15.03299617767334, "global_step": 692, "epoch": 5} {"train_loss": -15.696955680847168, "global_step": 693, "epoch": 5} {"train_loss": -14.89263916015625, "global_step": 694, "epoch": 5} {"train_loss": -15.32489013671875, "global_step": 695, "epoch": 5} {"train_loss": -15.274703025817871, "global_step": 696, "epoch": 5} {"train_loss": -14.882670402526855, "global_step": 697, "epoch": 5} {"train_loss": -15.254440307617188, "global_step": 698, "epoch": 5} {"train_loss": -15.202771186828613, "global_step": 699, "epoch": 5} {"train_loss": -15.210497856140137, "global_step": 700, "epoch": 5} {"train_loss": -14.806937217712402, "global_step": 701, "epoch": 5} {"train_loss": -15.270051956176758, "global_step": 702, "epoch": 5} {"train_loss": -15.042258262634277, "global_step": 703, "epoch": 5} {"train_loss": -14.961786270141602, "global_step": 704, "epoch": 5} {"train_loss": -15.580090522766113, "global_step": 705, "epoch": 5} {"train_loss": -15.493997573852539, "global_step": 706, "epoch": 5} {"train_loss": -15.215319633483887, "global_step": 707, "epoch": 5} {"train_loss": -15.121859550476074, "global_step": 708, "epoch": 5} {"train_loss": -15.375299453735352, "global_step": 709, "epoch": 5} {"train_loss": -15.371319770812988, "global_step": 710, "epoch": 5} {"train_loss": -15.440093994140625, "global_step": 711, "epoch": 5} {"train_loss": -15.585023880004883, "global_step": 712, "epoch": 5} {"train_loss": -15.509623527526855, "global_step": 713, "epoch": 5} {"train_loss": -15.480181694030762, "global_step": 714, "epoch": 5} {"train_loss": -15.329347610473633, "global_step": 715, "epoch": 5} {"train_loss": -16.060285568237305, "global_step": 716, "epoch": 5} {"train_loss": -15.65952205657959, "global_step": 717, "epoch": 5} {"train_loss": -15.8676176071167, "global_step": 718, "epoch": 5} {"train_loss": -15.603438377380371, "global_step": 719, "epoch": 5} {"train_loss": -15.541539192199707, "global_step": 720, "epoch": 5} {"train_loss": -15.32244873046875, "global_step": 721, "epoch": 5} {"train_loss": -15.287027359008789, "global_step": 722, "epoch": 5} {"train_loss": -14.977435111999512, "global_step": 723, "epoch": 5} {"train_loss": -15.571341514587402, "global_step": 724, "epoch": 5} {"train_loss": -15.176913891942048, "global_step": 725, "epoch": 5, "val_loss": 4117326.0} {"train_loss": -15.185681343078613, "global_step": 726, "epoch": 6} {"train_loss": -15.543505668640137, "global_step": 727, "epoch": 6} {"train_loss": -15.721572875976562, "global_step": 728, "epoch": 6} {"train_loss": -15.6647310256958, "global_step": 729, "epoch": 6} {"train_loss": -15.720410346984863, "global_step": 730, "epoch": 6} {"train_loss": -16.08785057067871, "global_step": 731, "epoch": 6} {"train_loss": -15.72984790802002, "global_step": 732, "epoch": 6} {"train_loss": -15.674405097961426, "global_step": 733, "epoch": 6} {"train_loss": -15.339850425720215, "global_step": 734, "epoch": 6} {"train_loss": -15.545618057250977, "global_step": 735, "epoch": 6} {"train_loss": -16.03592872619629, "global_step": 736, "epoch": 6} {"train_loss": -15.557415962219238, "global_step": 737, "epoch": 6} {"train_loss": -15.851025581359863, "global_step": 738, "epoch": 6} {"train_loss": -15.601153373718262, "global_step": 739, "epoch": 6} {"train_loss": -15.653363227844238, "global_step": 740, "epoch": 6} {"train_loss": -15.610849380493164, "global_step": 741, "epoch": 6} {"train_loss": -15.275436401367188, "global_step": 742, "epoch": 6} {"train_loss": -14.779818534851074, "global_step": 743, "epoch": 6} {"train_loss": -14.800475120544434, "global_step": 744, "epoch": 6} {"train_loss": -15.019418716430664, "global_step": 745, "epoch": 6} {"train_loss": -15.261032104492188, "global_step": 746, "epoch": 6} {"train_loss": -15.305343627929688, "global_step": 747, "epoch": 6} {"train_loss": -15.357220649719238, "global_step": 748, "epoch": 6} {"train_loss": -15.27225399017334, "global_step": 749, "epoch": 6} {"train_loss": -15.335128784179688, "global_step": 750, "epoch": 6} {"train_loss": -15.416089057922363, "global_step": 751, "epoch": 6} {"train_loss": -15.685739517211914, "global_step": 752, "epoch": 6} {"train_loss": -15.257420539855957, "global_step": 753, "epoch": 6} {"train_loss": -15.447222709655762, "global_step": 754, "epoch": 6} {"train_loss": -15.607192039489746, "global_step": 755, "epoch": 6} {"train_loss": -15.379953384399414, "global_step": 756, "epoch": 6} {"train_loss": -15.638348579406738, "global_step": 757, "epoch": 6} {"train_loss": -15.52519702911377, "global_step": 758, "epoch": 6} {"train_loss": -15.338526725769043, "global_step": 759, "epoch": 6} {"train_loss": -15.3309907913208, "global_step": 760, "epoch": 6} {"train_loss": -15.877652168273926, "global_step": 761, "epoch": 6} {"train_loss": -15.560388565063477, "global_step": 762, "epoch": 6} {"train_loss": -16.1546688079834, "global_step": 763, "epoch": 6} {"train_loss": -15.379422187805176, "global_step": 764, "epoch": 6} {"train_loss": -15.622550964355469, "global_step": 765, "epoch": 6} {"train_loss": -15.43145751953125, "global_step": 766, "epoch": 6} {"train_loss": -15.603230476379395, "global_step": 767, "epoch": 6} {"train_loss": -15.800175666809082, "global_step": 768, "epoch": 6} {"train_loss": -15.891092300415039, "global_step": 769, "epoch": 6} {"train_loss": -15.591066360473633, "global_step": 770, "epoch": 6} {"train_loss": -15.905369758605957, "global_step": 771, "epoch": 6} {"train_loss": -15.297284126281738, "global_step": 772, "epoch": 6} {"train_loss": -15.473498344421387, "global_step": 773, "epoch": 6} {"train_loss": -15.651593208312988, "global_step": 774, "epoch": 6} {"train_loss": -16.06269645690918, "global_step": 775, "epoch": 6} {"train_loss": -15.105978965759277, "global_step": 776, "epoch": 6} {"train_loss": -15.970118522644043, "global_step": 777, "epoch": 6} {"train_loss": -15.442941665649414, "global_step": 778, "epoch": 6} {"train_loss": -15.423415184020996, "global_step": 779, "epoch": 6} {"train_loss": -15.44427490234375, "global_step": 780, "epoch": 6} {"train_loss": -15.551651000976562, "global_step": 781, "epoch": 6} {"train_loss": -16.029739379882812, "global_step": 782, "epoch": 6} {"train_loss": -15.478912353515625, "global_step": 783, "epoch": 6} {"train_loss": -15.6526517868042, "global_step": 784, "epoch": 6} {"train_loss": -15.650555610656738, "global_step": 785, "epoch": 6} {"train_loss": -15.972762107849121, "global_step": 786, "epoch": 6} {"train_loss": -15.954401016235352, "global_step": 787, "epoch": 6} {"train_loss": -15.189061164855957, "global_step": 788, "epoch": 6} {"train_loss": -15.959115982055664, "global_step": 789, "epoch": 6} {"train_loss": -15.889025688171387, "global_step": 790, "epoch": 6} {"train_loss": -15.986703872680664, "global_step": 791, "epoch": 6} {"train_loss": -15.647418022155762, "global_step": 792, "epoch": 6} {"train_loss": -15.549837112426758, "global_step": 793, "epoch": 6} {"train_loss": -15.658090591430664, "global_step": 794, "epoch": 6} {"train_loss": -15.553753852844238, "global_step": 795, "epoch": 6} {"train_loss": -15.557977676391602, "global_step": 796, "epoch": 6} {"train_loss": -15.563563346862793, "global_step": 797, "epoch": 6} {"train_loss": -15.156111717224121, "global_step": 798, "epoch": 6} {"train_loss": -15.230738639831543, "global_step": 799, "epoch": 6} {"train_loss": -15.446365356445312, "global_step": 800, "epoch": 6} {"train_loss": -15.211450576782227, "global_step": 801, "epoch": 6} {"train_loss": -16.25246238708496, "global_step": 802, "epoch": 6} {"train_loss": -15.210543632507324, "global_step": 803, "epoch": 6} {"train_loss": -15.911662101745605, "global_step": 804, "epoch": 6} {"train_loss": -15.612048149108887, "global_step": 805, "epoch": 6} {"train_loss": -15.761795043945312, "global_step": 806, "epoch": 6} {"train_loss": -15.428573608398438, "global_step": 807, "epoch": 6} {"train_loss": -15.40838623046875, "global_step": 808, "epoch": 6} {"train_loss": -15.498163223266602, "global_step": 809, "epoch": 6} {"train_loss": -15.412741661071777, "global_step": 810, "epoch": 6} {"train_loss": -14.95053768157959, "global_step": 811, "epoch": 6} {"train_loss": -15.62094783782959, "global_step": 812, "epoch": 6} {"train_loss": -15.23491096496582, "global_step": 813, "epoch": 6} {"train_loss": -15.654471397399902, "global_step": 814, "epoch": 6} {"train_loss": -15.217429161071777, "global_step": 815, "epoch": 6} {"train_loss": -15.497639656066895, "global_step": 816, "epoch": 6} {"train_loss": -15.579730033874512, "global_step": 817, "epoch": 6} {"train_loss": -15.438931465148926, "global_step": 818, "epoch": 6} {"train_loss": -15.596285820007324, "global_step": 819, "epoch": 6} {"train_loss": -15.4456148147583, "global_step": 820, "epoch": 6} {"train_loss": -15.317438125610352, "global_step": 821, "epoch": 6} {"train_loss": -16.172779083251953, "global_step": 822, "epoch": 6} {"train_loss": -15.666033744812012, "global_step": 823, "epoch": 6} {"train_loss": -15.633963584899902, "global_step": 824, "epoch": 6} {"train_loss": -15.966049194335938, "global_step": 825, "epoch": 6} {"train_loss": -15.33978271484375, "global_step": 826, "epoch": 6} {"train_loss": -15.28455638885498, "global_step": 827, "epoch": 6} {"train_loss": -15.531964302062988, "global_step": 828, "epoch": 6} {"train_loss": -15.750521659851074, "global_step": 829, "epoch": 6} {"train_loss": -15.724575996398926, "global_step": 830, "epoch": 6} {"train_loss": -16.23125648498535, "global_step": 831, "epoch": 6} {"train_loss": -15.29038143157959, "global_step": 832, "epoch": 6} {"train_loss": -15.607234001159668, "global_step": 833, "epoch": 6} {"train_loss": -15.96196174621582, "global_step": 834, "epoch": 6} {"train_loss": -15.375686645507812, "global_step": 835, "epoch": 6} {"train_loss": -16.038766860961914, "global_step": 836, "epoch": 6} {"train_loss": -15.777017593383789, "global_step": 837, "epoch": 6} {"train_loss": -15.811838150024414, "global_step": 838, "epoch": 6} {"train_loss": -15.664125442504883, "global_step": 839, "epoch": 6} {"train_loss": -15.893683433532715, "global_step": 840, "epoch": 6} {"train_loss": -16.088775634765625, "global_step": 841, "epoch": 6} {"train_loss": -15.747557640075684, "global_step": 842, "epoch": 6} {"train_loss": -16.483224868774414, "global_step": 843, "epoch": 6} {"train_loss": -16.16341209411621, "global_step": 844, "epoch": 6} {"train_loss": -14.969952583312988, "global_step": 845, "epoch": 6} {"train_loss": -15.588845725887078, "global_step": 846, "epoch": 6, "val_loss": 3427327.75} {"train_loss": -15.570854187011719, "global_step": 847, "epoch": 7} {"train_loss": -15.807550430297852, "global_step": 848, "epoch": 7} {"train_loss": -16.009159088134766, "global_step": 849, "epoch": 7} {"train_loss": -15.35456371307373, "global_step": 850, "epoch": 7} {"train_loss": -16.165313720703125, "global_step": 851, "epoch": 7} {"train_loss": -15.727668762207031, "global_step": 852, "epoch": 7} {"train_loss": -15.884714126586914, "global_step": 853, "epoch": 7} {"train_loss": -15.952288627624512, "global_step": 854, "epoch": 7} {"train_loss": -15.986136436462402, "global_step": 855, "epoch": 7} {"train_loss": -16.058794021606445, "global_step": 856, "epoch": 7} {"train_loss": -16.26318359375, "global_step": 857, "epoch": 7} {"train_loss": -15.650313377380371, "global_step": 858, "epoch": 7} {"train_loss": -16.00019645690918, "global_step": 859, "epoch": 7} {"train_loss": -15.745094299316406, "global_step": 860, "epoch": 7} {"train_loss": -16.08640480041504, "global_step": 861, "epoch": 7} {"train_loss": -15.964967727661133, "global_step": 862, "epoch": 7} {"train_loss": -15.954437255859375, "global_step": 863, "epoch": 7} {"train_loss": -15.63751220703125, "global_step": 864, "epoch": 7} {"train_loss": -15.466452598571777, "global_step": 865, "epoch": 7} {"train_loss": -15.765658378601074, "global_step": 866, "epoch": 7} {"train_loss": -14.399492263793945, "global_step": 867, "epoch": 7} {"train_loss": -15.47339916229248, "global_step": 868, "epoch": 7} {"train_loss": -15.068671226501465, "global_step": 869, "epoch": 7} {"train_loss": -15.741540908813477, "global_step": 870, "epoch": 7} {"train_loss": -15.168474197387695, "global_step": 871, "epoch": 7} {"train_loss": -16.18926429748535, "global_step": 872, "epoch": 7} {"train_loss": -16.254575729370117, "global_step": 873, "epoch": 7} {"train_loss": -15.169870376586914, "global_step": 874, "epoch": 7} {"train_loss": -14.982942581176758, "global_step": 875, "epoch": 7} {"train_loss": -16.102685928344727, "global_step": 876, "epoch": 7} {"train_loss": -15.440768241882324, "global_step": 877, "epoch": 7} {"train_loss": -15.803214073181152, "global_step": 878, "epoch": 7} {"train_loss": -15.583296775817871, "global_step": 879, "epoch": 7} {"train_loss": -15.610997200012207, "global_step": 880, "epoch": 7} {"train_loss": -15.913912773132324, "global_step": 881, "epoch": 7} {"train_loss": -15.78024959564209, "global_step": 882, "epoch": 7} {"train_loss": -15.608209609985352, "global_step": 883, "epoch": 7} {"train_loss": -15.57114315032959, "global_step": 884, "epoch": 7} {"train_loss": -15.82624340057373, "global_step": 885, "epoch": 7} {"train_loss": -15.250703811645508, "global_step": 886, "epoch": 7} {"train_loss": -15.626581192016602, "global_step": 887, "epoch": 7} {"train_loss": -15.640533447265625, "global_step": 888, "epoch": 7} {"train_loss": -15.443145751953125, "global_step": 889, "epoch": 7} {"train_loss": -15.35892391204834, "global_step": 890, "epoch": 7} {"train_loss": -15.907119750976562, "global_step": 891, "epoch": 7} {"train_loss": -15.96801471710205, "global_step": 892, "epoch": 7} {"train_loss": -16.116968154907227, "global_step": 893, "epoch": 7} {"train_loss": -16.042713165283203, "global_step": 894, "epoch": 7} {"train_loss": -15.664484977722168, "global_step": 895, "epoch": 7} {"train_loss": -16.196807861328125, "global_step": 896, "epoch": 7} {"train_loss": -15.733612060546875, "global_step": 897, "epoch": 7} {"train_loss": -16.07265281677246, "global_step": 898, "epoch": 7} {"train_loss": -16.40750503540039, "global_step": 899, "epoch": 7} {"train_loss": -16.31572151184082, "global_step": 900, "epoch": 7} {"train_loss": -16.410295486450195, "global_step": 901, "epoch": 7} {"train_loss": -15.960771560668945, "global_step": 902, "epoch": 7} {"train_loss": -16.16823387145996, "global_step": 903, "epoch": 7} {"train_loss": -16.436567306518555, "global_step": 904, "epoch": 7} {"train_loss": -16.341548919677734, "global_step": 905, "epoch": 7} {"train_loss": -15.594433784484863, "global_step": 906, "epoch": 7} {"train_loss": -15.421673774719238, "global_step": 907, "epoch": 7} {"train_loss": -16.066661834716797, "global_step": 908, "epoch": 7} {"train_loss": -16.063003540039062, "global_step": 909, "epoch": 7} {"train_loss": -14.22607707977295, "global_step": 910, "epoch": 7} {"train_loss": -15.748214721679688, "global_step": 911, "epoch": 7} {"train_loss": -15.554498672485352, "global_step": 912, "epoch": 7} {"train_loss": -15.425236701965332, "global_step": 913, "epoch": 7} {"train_loss": -15.453036308288574, "global_step": 914, "epoch": 7} {"train_loss": -16.168914794921875, "global_step": 915, "epoch": 7} {"train_loss": -15.766194343566895, "global_step": 916, "epoch": 7} {"train_loss": -15.905242919921875, "global_step": 917, "epoch": 7} {"train_loss": -15.85227108001709, "global_step": 918, "epoch": 7} {"train_loss": -15.745755195617676, "global_step": 919, "epoch": 7} {"train_loss": -15.702249526977539, "global_step": 920, "epoch": 7} {"train_loss": -15.844698905944824, "global_step": 921, "epoch": 7} {"train_loss": -16.214048385620117, "global_step": 922, "epoch": 7} {"train_loss": -16.078519821166992, "global_step": 923, "epoch": 7} {"train_loss": -15.938549995422363, "global_step": 924, "epoch": 7} {"train_loss": -16.16734504699707, "global_step": 925, "epoch": 7} {"train_loss": -16.06369400024414, "global_step": 926, "epoch": 7} {"train_loss": -15.700540542602539, "global_step": 927, "epoch": 7} {"train_loss": -15.571130752563477, "global_step": 928, "epoch": 7} {"train_loss": -15.638580322265625, "global_step": 929, "epoch": 7} {"train_loss": -16.133716583251953, "global_step": 930, "epoch": 7} {"train_loss": -15.431708335876465, "global_step": 931, "epoch": 7} {"train_loss": -16.206497192382812, "global_step": 932, "epoch": 7} {"train_loss": -15.509112358093262, "global_step": 933, "epoch": 7} {"train_loss": -16.3685302734375, "global_step": 934, "epoch": 7} {"train_loss": -16.028623580932617, "global_step": 935, "epoch": 7} {"train_loss": -15.243799209594727, "global_step": 936, "epoch": 7} {"train_loss": -15.815350532531738, "global_step": 937, "epoch": 7} {"train_loss": -15.955836296081543, "global_step": 938, "epoch": 7} {"train_loss": -15.861227989196777, "global_step": 939, "epoch": 7} {"train_loss": -15.616168022155762, "global_step": 940, "epoch": 7} {"train_loss": -15.623583793640137, "global_step": 941, "epoch": 7} {"train_loss": -16.03450584411621, "global_step": 942, "epoch": 7} {"train_loss": -16.05488395690918, "global_step": 943, "epoch": 7} {"train_loss": -16.13283920288086, "global_step": 944, "epoch": 7} {"train_loss": -15.821818351745605, "global_step": 945, "epoch": 7} {"train_loss": -16.155977249145508, "global_step": 946, "epoch": 7} {"train_loss": -15.981989860534668, "global_step": 947, "epoch": 7} {"train_loss": -16.04617691040039, "global_step": 948, "epoch": 7} {"train_loss": -16.0920352935791, "global_step": 949, "epoch": 7} {"train_loss": -15.958330154418945, "global_step": 950, "epoch": 7} {"train_loss": -15.927577018737793, "global_step": 951, "epoch": 7} {"train_loss": -15.791732788085938, "global_step": 952, "epoch": 7} {"train_loss": -16.17091178894043, "global_step": 953, "epoch": 7} {"train_loss": -15.97113037109375, "global_step": 954, "epoch": 7} {"train_loss": -16.415388107299805, "global_step": 955, "epoch": 7} {"train_loss": -15.951308250427246, "global_step": 956, "epoch": 7} {"train_loss": -16.373931884765625, "global_step": 957, "epoch": 7} {"train_loss": -15.933540344238281, "global_step": 958, "epoch": 7} {"train_loss": -16.287668228149414, "global_step": 959, "epoch": 7} {"train_loss": -15.865435600280762, "global_step": 960, "epoch": 7} {"train_loss": -16.104022979736328, "global_step": 961, "epoch": 7} {"train_loss": -16.08776092529297, "global_step": 962, "epoch": 7} {"train_loss": -16.506019592285156, "global_step": 963, "epoch": 7} {"train_loss": -16.40021324157715, "global_step": 964, "epoch": 7} {"train_loss": -16.257034301757812, "global_step": 965, "epoch": 7} {"train_loss": -16.24373435974121, "global_step": 966, "epoch": 7} {"train_loss": -15.852588566866787, "global_step": 967, "epoch": 7, "val_loss": 3613933.0} {"train_loss": -15.87145709991455, "global_step": 968, "epoch": 8} {"train_loss": -16.8450984954834, "global_step": 969, "epoch": 8} {"train_loss": -16.493642807006836, "global_step": 970, "epoch": 8} {"train_loss": -15.891595840454102, "global_step": 971, "epoch": 8} {"train_loss": -16.567625045776367, "global_step": 972, "epoch": 8} {"train_loss": -16.692916870117188, "global_step": 973, "epoch": 8} {"train_loss": -15.992851257324219, "global_step": 974, "epoch": 8} {"train_loss": -16.615447998046875, "global_step": 975, "epoch": 8} {"train_loss": -16.19072151184082, "global_step": 976, "epoch": 8} {"train_loss": -16.43686294555664, "global_step": 977, "epoch": 8} {"train_loss": -16.22962760925293, "global_step": 978, "epoch": 8} {"train_loss": -16.351747512817383, "global_step": 979, "epoch": 8} {"train_loss": -15.835395812988281, "global_step": 980, "epoch": 8} {"train_loss": -16.28537368774414, "global_step": 981, "epoch": 8} {"train_loss": -15.96005916595459, "global_step": 982, "epoch": 8} {"train_loss": -15.697694778442383, "global_step": 983, "epoch": 8} {"train_loss": -16.40652847290039, "global_step": 984, "epoch": 8} {"train_loss": -15.587538719177246, "global_step": 985, "epoch": 8} {"train_loss": -16.661346435546875, "global_step": 986, "epoch": 8} {"train_loss": -16.019012451171875, "global_step": 987, "epoch": 8} {"train_loss": -15.569815635681152, "global_step": 988, "epoch": 8} {"train_loss": -15.811456680297852, "global_step": 989, "epoch": 8} {"train_loss": -15.731900215148926, "global_step": 990, "epoch": 8} {"train_loss": -15.833465576171875, "global_step": 991, "epoch": 8} {"train_loss": -14.825411796569824, "global_step": 992, "epoch": 8} {"train_loss": -16.078575134277344, "global_step": 993, "epoch": 8} {"train_loss": -15.842726707458496, "global_step": 994, "epoch": 8} {"train_loss": -15.71020221710205, "global_step": 995, "epoch": 8} {"train_loss": -16.18866539001465, "global_step": 996, "epoch": 8} {"train_loss": -15.936144828796387, "global_step": 997, "epoch": 8} {"train_loss": -16.14667320251465, "global_step": 998, "epoch": 8} {"train_loss": -16.25785255432129, "global_step": 999, "epoch": 8} {"train_loss": -16.19696617126465, "global_step": 1000, "epoch": 8} {"train_loss": -16.328487396240234, "global_step": 1001, "epoch": 8} {"train_loss": -16.121625900268555, "global_step": 1002, "epoch": 8} {"train_loss": -16.135129928588867, "global_step": 1003, "epoch": 8} {"train_loss": -16.37373161315918, "global_step": 1004, "epoch": 8} {"train_loss": -16.640579223632812, "global_step": 1005, "epoch": 8} {"train_loss": -16.553319931030273, "global_step": 1006, "epoch": 8} {"train_loss": -16.27396583557129, "global_step": 1007, "epoch": 8} {"train_loss": -16.12286376953125, "global_step": 1008, "epoch": 8} {"train_loss": -15.713549613952637, "global_step": 1009, "epoch": 8} {"train_loss": -16.31378173828125, "global_step": 1010, "epoch": 8} {"train_loss": -16.066743850708008, "global_step": 1011, "epoch": 8} {"train_loss": -16.027515411376953, "global_step": 1012, "epoch": 8} {"train_loss": -15.30608081817627, "global_step": 1013, "epoch": 8} {"train_loss": -15.52546215057373, "global_step": 1014, "epoch": 8} {"train_loss": -15.818338394165039, "global_step": 1015, "epoch": 8} {"train_loss": -16.076751708984375, "global_step": 1016, "epoch": 8} {"train_loss": -15.582893371582031, "global_step": 1017, "epoch": 8} {"train_loss": -16.332059860229492, "global_step": 1018, "epoch": 8} {"train_loss": -15.558862686157227, "global_step": 1019, "epoch": 8} {"train_loss": -15.802411079406738, "global_step": 1020, "epoch": 8} {"train_loss": -16.135339736938477, "global_step": 1021, "epoch": 8} {"train_loss": -15.933844566345215, "global_step": 1022, "epoch": 8} {"train_loss": -16.056184768676758, "global_step": 1023, "epoch": 8} {"train_loss": -15.926668167114258, "global_step": 1024, "epoch": 8} {"train_loss": -16.2923641204834, "global_step": 1025, "epoch": 8} {"train_loss": -16.292604446411133, "global_step": 1026, "epoch": 8} {"train_loss": -16.111927032470703, "global_step": 1027, "epoch": 8} {"train_loss": -16.07362174987793, "global_step": 1028, "epoch": 8} {"train_loss": -16.373395919799805, "global_step": 1029, "epoch": 8} {"train_loss": -16.3447322845459, "global_step": 1030, "epoch": 8} {"train_loss": -16.06886863708496, "global_step": 1031, "epoch": 8} {"train_loss": -16.555580139160156, "global_step": 1032, "epoch": 8} {"train_loss": -15.81641674041748, "global_step": 1033, "epoch": 8} {"train_loss": -16.298315048217773, "global_step": 1034, "epoch": 8} {"train_loss": -16.322641372680664, "global_step": 1035, "epoch": 8} {"train_loss": -16.58243179321289, "global_step": 1036, "epoch": 8} {"train_loss": -15.843971252441406, "global_step": 1037, "epoch": 8} {"train_loss": -16.2712345123291, "global_step": 1038, "epoch": 8} {"train_loss": -16.172256469726562, "global_step": 1039, "epoch": 8} {"train_loss": -15.875887870788574, "global_step": 1040, "epoch": 8} {"train_loss": -16.57904624938965, "global_step": 1041, "epoch": 8} {"train_loss": -16.423603057861328, "global_step": 1042, "epoch": 8} {"train_loss": -16.905105590820312, "global_step": 1043, "epoch": 8} {"train_loss": -16.16118049621582, "global_step": 1044, "epoch": 8} {"train_loss": -16.392614364624023, "global_step": 1045, "epoch": 8} {"train_loss": -16.73927879333496, "global_step": 1046, "epoch": 8} {"train_loss": -16.613468170166016, "global_step": 1047, "epoch": 8} {"train_loss": -16.480731964111328, "global_step": 1048, "epoch": 8} {"train_loss": -15.774431228637695, "global_step": 1049, "epoch": 8} {"train_loss": -16.012971878051758, "global_step": 1050, "epoch": 8} {"train_loss": -16.08642578125, "global_step": 1051, "epoch": 8} {"train_loss": -16.610509872436523, "global_step": 1052, "epoch": 8} {"train_loss": -16.436277389526367, "global_step": 1053, "epoch": 8} {"train_loss": -16.303647994995117, "global_step": 1054, "epoch": 8} {"train_loss": -16.369600296020508, "global_step": 1055, "epoch": 8} {"train_loss": -16.400178909301758, "global_step": 1056, "epoch": 8} {"train_loss": -16.452102661132812, "global_step": 1057, "epoch": 8} {"train_loss": -16.2001895904541, "global_step": 1058, "epoch": 8} {"train_loss": -16.12019920349121, "global_step": 1059, "epoch": 8} {"train_loss": -16.6148681640625, "global_step": 1060, "epoch": 8} {"train_loss": -16.506229400634766, "global_step": 1061, "epoch": 8} {"train_loss": -16.492895126342773, "global_step": 1062, "epoch": 8} {"train_loss": -16.66167640686035, "global_step": 1063, "epoch": 8} {"train_loss": -16.08429527282715, "global_step": 1064, "epoch": 8} {"train_loss": -15.858545303344727, "global_step": 1065, "epoch": 8} {"train_loss": -16.4732608795166, "global_step": 1066, "epoch": 8} {"train_loss": -16.19754981994629, "global_step": 1067, "epoch": 8} {"train_loss": -16.230464935302734, "global_step": 1068, "epoch": 8} {"train_loss": -16.66238784790039, "global_step": 1069, "epoch": 8} {"train_loss": -17.003820419311523, "global_step": 1070, "epoch": 8} {"train_loss": -16.420785903930664, "global_step": 1071, "epoch": 8} {"train_loss": -16.49234962463379, "global_step": 1072, "epoch": 8} {"train_loss": -16.563491821289062, "global_step": 1073, "epoch": 8} {"train_loss": -17.03542137145996, "global_step": 1074, "epoch": 8} {"train_loss": -16.70599365234375, "global_step": 1075, "epoch": 8} {"train_loss": -15.80632495880127, "global_step": 1076, "epoch": 8} {"train_loss": -16.90283966064453, "global_step": 1077, "epoch": 8} {"train_loss": -16.47163963317871, "global_step": 1078, "epoch": 8} {"train_loss": -16.6341609954834, "global_step": 1079, "epoch": 8} {"train_loss": -16.6982421875, "global_step": 1080, "epoch": 8} {"train_loss": -16.31574821472168, "global_step": 1081, "epoch": 8} {"train_loss": -17.10075569152832, "global_step": 1082, "epoch": 8} {"train_loss": -16.980670928955078, "global_step": 1083, "epoch": 8} {"train_loss": -16.163747787475586, "global_step": 1084, "epoch": 8} {"train_loss": -15.929282188415527, "global_step": 1085, "epoch": 8} {"train_loss": -16.72212791442871, "global_step": 1086, "epoch": 8} {"train_loss": -16.86032485961914, "global_step": 1087, "epoch": 8} {"train_loss": -16.234954408377654, "global_step": 1088, "epoch": 8, "val_loss": 3662878.75} {"train_loss": -16.974260330200195, "global_step": 1089, "epoch": 9} {"train_loss": -15.97400188446045, "global_step": 1090, "epoch": 9} {"train_loss": -16.8249568939209, "global_step": 1091, "epoch": 9} {"train_loss": -16.719940185546875, "global_step": 1092, "epoch": 9} {"train_loss": -16.37177848815918, "global_step": 1093, "epoch": 9} {"train_loss": -15.999430656433105, "global_step": 1094, "epoch": 9} {"train_loss": -16.841501235961914, "global_step": 1095, "epoch": 9} {"train_loss": -16.242507934570312, "global_step": 1096, "epoch": 9} {"train_loss": -16.405017852783203, "global_step": 1097, "epoch": 9} {"train_loss": -16.3144474029541, "global_step": 1098, "epoch": 9} {"train_loss": -15.858664512634277, "global_step": 1099, "epoch": 9} {"train_loss": -17.02392578125, "global_step": 1100, "epoch": 9} {"train_loss": -15.781163215637207, "global_step": 1101, "epoch": 9} {"train_loss": -16.458637237548828, "global_step": 1102, "epoch": 9} {"train_loss": -16.277353286743164, "global_step": 1103, "epoch": 9} {"train_loss": -16.693817138671875, "global_step": 1104, "epoch": 9} {"train_loss": -16.620960235595703, "global_step": 1105, "epoch": 9} {"train_loss": -16.511198043823242, "global_step": 1106, "epoch": 9} {"train_loss": -16.75311851501465, "global_step": 1107, "epoch": 9} {"train_loss": -16.44049072265625, "global_step": 1108, "epoch": 9} {"train_loss": -16.54265022277832, "global_step": 1109, "epoch": 9} {"train_loss": -16.338369369506836, "global_step": 1110, "epoch": 9} {"train_loss": -16.267580032348633, "global_step": 1111, "epoch": 9} {"train_loss": -16.58429527282715, "global_step": 1112, "epoch": 9} {"train_loss": -16.359737396240234, "global_step": 1113, "epoch": 9} {"train_loss": -16.83087158203125, "global_step": 1114, "epoch": 9} {"train_loss": -16.13503074645996, "global_step": 1115, "epoch": 9} {"train_loss": -16.73145866394043, "global_step": 1116, "epoch": 9} {"train_loss": -16.17722511291504, "global_step": 1117, "epoch": 9} {"train_loss": -16.071475982666016, "global_step": 1118, "epoch": 9} {"train_loss": -16.353363037109375, "global_step": 1119, "epoch": 9} {"train_loss": -16.91249656677246, "global_step": 1120, "epoch": 9} {"train_loss": -16.580764770507812, "global_step": 1121, "epoch": 9} {"train_loss": -16.98634147644043, "global_step": 1122, "epoch": 9} {"train_loss": -16.668527603149414, "global_step": 1123, "epoch": 9} {"train_loss": -16.436487197875977, "global_step": 1124, "epoch": 9} {"train_loss": -16.791059494018555, "global_step": 1125, "epoch": 9} {"train_loss": -16.937387466430664, "global_step": 1126, "epoch": 9} {"train_loss": -16.705547332763672, "global_step": 1127, "epoch": 9} {"train_loss": -16.4859676361084, "global_step": 1128, "epoch": 9} {"train_loss": -16.660959243774414, "global_step": 1129, "epoch": 9} {"train_loss": -16.368375778198242, "global_step": 1130, "epoch": 9} {"train_loss": -16.450002670288086, "global_step": 1131, "epoch": 9} {"train_loss": -16.54502296447754, "global_step": 1132, "epoch": 9} {"train_loss": -16.1298828125, "global_step": 1133, "epoch": 9} {"train_loss": -16.674299240112305, "global_step": 1134, "epoch": 9} {"train_loss": -16.063547134399414, "global_step": 1135, "epoch": 9} {"train_loss": -16.97706413269043, "global_step": 1136, "epoch": 9} {"train_loss": -16.77487564086914, "global_step": 1137, "epoch": 9} {"train_loss": -16.63093376159668, "global_step": 1138, "epoch": 9} {"train_loss": -16.88222312927246, "global_step": 1139, "epoch": 9} {"train_loss": -17.148731231689453, "global_step": 1140, "epoch": 9} {"train_loss": -16.483373641967773, "global_step": 1141, "epoch": 9} {"train_loss": -16.332826614379883, "global_step": 1142, "epoch": 9} {"train_loss": -16.588882446289062, "global_step": 1143, "epoch": 9} {"train_loss": -16.84036636352539, "global_step": 1144, "epoch": 9} {"train_loss": -15.990493774414062, "global_step": 1145, "epoch": 9} {"train_loss": -16.805252075195312, "global_step": 1146, "epoch": 9} {"train_loss": -16.074047088623047, "global_step": 1147, "epoch": 9} {"train_loss": -16.88388442993164, "global_step": 1148, "epoch": 9} {"train_loss": -16.907068252563477, "global_step": 1149, "epoch": 9} {"train_loss": -16.899211883544922, "global_step": 1150, "epoch": 9} {"train_loss": -16.997867584228516, "global_step": 1151, "epoch": 9} {"train_loss": -16.523176193237305, "global_step": 1152, "epoch": 9} {"train_loss": -16.120698928833008, "global_step": 1153, "epoch": 9} {"train_loss": -16.90534782409668, "global_step": 1154, "epoch": 9} {"train_loss": -16.71491813659668, "global_step": 1155, "epoch": 9} {"train_loss": -16.499645233154297, "global_step": 1156, "epoch": 9} {"train_loss": -16.4877986907959, "global_step": 1157, "epoch": 9} {"train_loss": -16.6252498626709, "global_step": 1158, "epoch": 9} {"train_loss": -16.860136032104492, "global_step": 1159, "epoch": 9} {"train_loss": -16.991575241088867, "global_step": 1160, "epoch": 9} {"train_loss": -16.730825424194336, "global_step": 1161, "epoch": 9} {"train_loss": -16.87971305847168, "global_step": 1162, "epoch": 9} {"train_loss": -16.828231811523438, "global_step": 1163, "epoch": 9} {"train_loss": -16.92104148864746, "global_step": 1164, "epoch": 9} {"train_loss": -16.944168090820312, "global_step": 1165, "epoch": 9} {"train_loss": -17.1066837310791, "global_step": 1166, "epoch": 9} {"train_loss": -16.76114273071289, "global_step": 1167, "epoch": 9} {"train_loss": -16.74225616455078, "global_step": 1168, "epoch": 9} {"train_loss": -17.326013565063477, "global_step": 1169, "epoch": 9} {"train_loss": -16.558610916137695, "global_step": 1170, "epoch": 9} {"train_loss": -17.168577194213867, "global_step": 1171, "epoch": 9} {"train_loss": -16.836713790893555, "global_step": 1172, "epoch": 9} {"train_loss": -17.134511947631836, "global_step": 1173, "epoch": 9} {"train_loss": -16.70660972595215, "global_step": 1174, "epoch": 9} {"train_loss": -16.45503807067871, "global_step": 1175, "epoch": 9} {"train_loss": -16.662336349487305, "global_step": 1176, "epoch": 9} {"train_loss": -16.5161190032959, "global_step": 1177, "epoch": 9} {"train_loss": -16.89145278930664, "global_step": 1178, "epoch": 9} {"train_loss": -16.781064987182617, "global_step": 1179, "epoch": 9} {"train_loss": -16.87094497680664, "global_step": 1180, "epoch": 9} {"train_loss": -16.726165771484375, "global_step": 1181, "epoch": 9} {"train_loss": -16.996671676635742, "global_step": 1182, "epoch": 9} {"train_loss": -16.369314193725586, "global_step": 1183, "epoch": 9} {"train_loss": -16.90193748474121, "global_step": 1184, "epoch": 9} {"train_loss": -16.86000633239746, "global_step": 1185, "epoch": 9} {"train_loss": -16.727474212646484, "global_step": 1186, "epoch": 9} {"train_loss": -16.62569808959961, "global_step": 1187, "epoch": 9} {"train_loss": -16.45351219177246, "global_step": 1188, "epoch": 9} {"train_loss": -16.711441040039062, "global_step": 1189, "epoch": 9} {"train_loss": -16.781667709350586, "global_step": 1190, "epoch": 9} {"train_loss": -16.062498092651367, "global_step": 1191, "epoch": 9} {"train_loss": -15.729657173156738, "global_step": 1192, "epoch": 9} {"train_loss": -16.394399642944336, "global_step": 1193, "epoch": 9} {"train_loss": -16.142946243286133, "global_step": 1194, "epoch": 9} {"train_loss": -16.428863525390625, "global_step": 1195, "epoch": 9} {"train_loss": -16.783273696899414, "global_step": 1196, "epoch": 9} {"train_loss": -16.035518646240234, "global_step": 1197, "epoch": 9} {"train_loss": -17.04072380065918, "global_step": 1198, "epoch": 9} {"train_loss": -16.621458053588867, "global_step": 1199, "epoch": 9} {"train_loss": -16.46992301940918, "global_step": 1200, "epoch": 9} {"train_loss": -16.83362579345703, "global_step": 1201, "epoch": 9} {"train_loss": -16.880847930908203, "global_step": 1202, "epoch": 9} {"train_loss": -16.634496688842773, "global_step": 1203, "epoch": 9} {"train_loss": -17.097627639770508, "global_step": 1204, "epoch": 9} {"train_loss": -16.874414443969727, "global_step": 1205, "epoch": 9} {"train_loss": -16.468915939331055, "global_step": 1206, "epoch": 9} {"train_loss": -16.593841552734375, "global_step": 1207, "epoch": 9} {"train_loss": -16.608009338378906, "global_step": 1208, "epoch": 9} {"train_loss": -16.611177609971733, "global_step": 1209, "epoch": 9, "val_loss": 3298248.75} {"train_loss": -16.79059600830078, "global_step": 1210, "epoch": 10} {"train_loss": -16.660297393798828, "global_step": 1211, "epoch": 10} {"train_loss": -16.8780574798584, "global_step": 1212, "epoch": 10} {"train_loss": -16.6669921875, "global_step": 1213, "epoch": 10} {"train_loss": -16.694013595581055, "global_step": 1214, "epoch": 10} {"train_loss": -16.66770362854004, "global_step": 1215, "epoch": 10} {"train_loss": -16.689834594726562, "global_step": 1216, "epoch": 10} {"train_loss": -16.570913314819336, "global_step": 1217, "epoch": 10} {"train_loss": -16.92535400390625, "global_step": 1218, "epoch": 10} {"train_loss": -16.952634811401367, "global_step": 1219, "epoch": 10} {"train_loss": -16.699995040893555, "global_step": 1220, "epoch": 10} {"train_loss": -16.808847427368164, "global_step": 1221, "epoch": 10} {"train_loss": -17.215322494506836, "global_step": 1222, "epoch": 10} {"train_loss": -16.461027145385742, "global_step": 1223, "epoch": 10} {"train_loss": -16.379718780517578, "global_step": 1224, "epoch": 10} {"train_loss": -16.923599243164062, "global_step": 1225, "epoch": 10} {"train_loss": -16.890033721923828, "global_step": 1226, "epoch": 10} {"train_loss": -16.908367156982422, "global_step": 1227, "epoch": 10} {"train_loss": -16.824914932250977, "global_step": 1228, "epoch": 10} {"train_loss": -16.641796112060547, "global_step": 1229, "epoch": 10} {"train_loss": -16.717538833618164, "global_step": 1230, "epoch": 10} {"train_loss": -16.399860382080078, "global_step": 1231, "epoch": 10} {"train_loss": -16.71485710144043, "global_step": 1232, "epoch": 10} {"train_loss": -16.270755767822266, "global_step": 1233, "epoch": 10} {"train_loss": -16.42825698852539, "global_step": 1234, "epoch": 10} {"train_loss": -16.191843032836914, "global_step": 1235, "epoch": 10} {"train_loss": -16.598846435546875, "global_step": 1236, "epoch": 10} {"train_loss": -16.13410758972168, "global_step": 1237, "epoch": 10} {"train_loss": -16.56354522705078, "global_step": 1238, "epoch": 10} {"train_loss": -16.34257698059082, "global_step": 1239, "epoch": 10} {"train_loss": -17.25657081604004, "global_step": 1240, "epoch": 10} {"train_loss": -15.966734886169434, "global_step": 1241, "epoch": 10} {"train_loss": -16.9952392578125, "global_step": 1242, "epoch": 10} {"train_loss": -16.769424438476562, "global_step": 1243, "epoch": 10} {"train_loss": -17.17093276977539, "global_step": 1244, "epoch": 10} {"train_loss": -16.907079696655273, "global_step": 1245, "epoch": 10} {"train_loss": -16.81378173828125, "global_step": 1246, "epoch": 10} {"train_loss": -16.463674545288086, "global_step": 1247, "epoch": 10} {"train_loss": -16.900135040283203, "global_step": 1248, "epoch": 10} {"train_loss": -16.66152000427246, "global_step": 1249, "epoch": 10} {"train_loss": -16.496984481811523, "global_step": 1250, "epoch": 10} {"train_loss": -16.735090255737305, "global_step": 1251, "epoch": 10} {"train_loss": -17.245885848999023, "global_step": 1252, "epoch": 10} {"train_loss": -16.792936325073242, "global_step": 1253, "epoch": 10} {"train_loss": -16.737430572509766, "global_step": 1254, "epoch": 10} {"train_loss": -16.990982055664062, "global_step": 1255, "epoch": 10} {"train_loss": -16.973522186279297, "global_step": 1256, "epoch": 10} {"train_loss": -16.936094284057617, "global_step": 1257, "epoch": 10} {"train_loss": -17.043527603149414, "global_step": 1258, "epoch": 10} {"train_loss": -17.459274291992188, "global_step": 1259, "epoch": 10} {"train_loss": -16.621633529663086, "global_step": 1260, "epoch": 10} {"train_loss": -16.793954849243164, "global_step": 1261, "epoch": 10} {"train_loss": -16.999372482299805, "global_step": 1262, "epoch": 10} {"train_loss": -16.942426681518555, "global_step": 1263, "epoch": 10} {"train_loss": -17.093231201171875, "global_step": 1264, "epoch": 10} {"train_loss": -17.533477783203125, "global_step": 1265, "epoch": 10} {"train_loss": -16.948909759521484, "global_step": 1266, "epoch": 10} {"train_loss": -17.13594627380371, "global_step": 1267, "epoch": 10} {"train_loss": -16.708467483520508, "global_step": 1268, "epoch": 10} {"train_loss": -17.152517318725586, "global_step": 1269, "epoch": 10} {"train_loss": -16.21940040588379, "global_step": 1270, "epoch": 10} {"train_loss": -16.646808624267578, "global_step": 1271, "epoch": 10} {"train_loss": -16.462270736694336, "global_step": 1272, "epoch": 10} {"train_loss": -16.468732833862305, "global_step": 1273, "epoch": 10} {"train_loss": -17.016681671142578, "global_step": 1274, "epoch": 10} {"train_loss": -16.608366012573242, "global_step": 1275, "epoch": 10} {"train_loss": -17.05983543395996, "global_step": 1276, "epoch": 10} {"train_loss": -17.054811477661133, "global_step": 1277, "epoch": 10} {"train_loss": -16.26346206665039, "global_step": 1278, "epoch": 10} {"train_loss": -16.755998611450195, "global_step": 1279, "epoch": 10} {"train_loss": -16.96254539489746, "global_step": 1280, "epoch": 10} {"train_loss": -16.723072052001953, "global_step": 1281, "epoch": 10} {"train_loss": -17.287498474121094, "global_step": 1282, "epoch": 10} {"train_loss": -16.789901733398438, "global_step": 1283, "epoch": 10} {"train_loss": -16.906570434570312, "global_step": 1284, "epoch": 10} {"train_loss": -17.172725677490234, "global_step": 1285, "epoch": 10} {"train_loss": -17.13545799255371, "global_step": 1286, "epoch": 10} {"train_loss": -16.965694427490234, "global_step": 1287, "epoch": 10} {"train_loss": -17.18233871459961, "global_step": 1288, "epoch": 10} {"train_loss": -17.035795211791992, "global_step": 1289, "epoch": 10} {"train_loss": -16.521564483642578, "global_step": 1290, "epoch": 10} {"train_loss": -16.981271743774414, "global_step": 1291, "epoch": 10} {"train_loss": -16.67173194885254, "global_step": 1292, "epoch": 10} {"train_loss": -17.11183738708496, "global_step": 1293, "epoch": 10} {"train_loss": -17.177579879760742, "global_step": 1294, "epoch": 10} {"train_loss": -16.921703338623047, "global_step": 1295, "epoch": 10} {"train_loss": -17.071496963500977, "global_step": 1296, "epoch": 10} {"train_loss": -16.72318458557129, "global_step": 1297, "epoch": 10} {"train_loss": -16.742290496826172, "global_step": 1298, "epoch": 10} {"train_loss": -17.1630916595459, "global_step": 1299, "epoch": 10} {"train_loss": -16.797719955444336, "global_step": 1300, "epoch": 10} {"train_loss": -16.235666275024414, "global_step": 1301, "epoch": 10} {"train_loss": -16.63457679748535, "global_step": 1302, "epoch": 10} {"train_loss": -16.25105857849121, "global_step": 1303, "epoch": 10} {"train_loss": -16.59116554260254, "global_step": 1304, "epoch": 10} {"train_loss": -16.307283401489258, "global_step": 1305, "epoch": 10} {"train_loss": -16.73311424255371, "global_step": 1306, "epoch": 10} {"train_loss": -17.111480712890625, "global_step": 1307, "epoch": 10} {"train_loss": -16.711145401000977, "global_step": 1308, "epoch": 10} {"train_loss": -16.74314308166504, "global_step": 1309, "epoch": 10} {"train_loss": -16.663663864135742, "global_step": 1310, "epoch": 10} {"train_loss": -16.423568725585938, "global_step": 1311, "epoch": 10} {"train_loss": -17.47873306274414, "global_step": 1312, "epoch": 10} {"train_loss": -17.210651397705078, "global_step": 1313, "epoch": 10} {"train_loss": -16.799413681030273, "global_step": 1314, "epoch": 10} {"train_loss": -16.20072364807129, "global_step": 1315, "epoch": 10} {"train_loss": -16.3791561126709, "global_step": 1316, "epoch": 10} {"train_loss": -16.617237091064453, "global_step": 1317, "epoch": 10} {"train_loss": -16.205778121948242, "global_step": 1318, "epoch": 10} {"train_loss": -16.89472007751465, "global_step": 1319, "epoch": 10} {"train_loss": -16.55068588256836, "global_step": 1320, "epoch": 10} {"train_loss": -16.166898727416992, "global_step": 1321, "epoch": 10} {"train_loss": -16.50893783569336, "global_step": 1322, "epoch": 10} {"train_loss": -15.837793350219727, "global_step": 1323, "epoch": 10} {"train_loss": -16.63007926940918, "global_step": 1324, "epoch": 10} {"train_loss": -16.049808502197266, "global_step": 1325, "epoch": 10} {"train_loss": -16.538244247436523, "global_step": 1326, "epoch": 10} {"train_loss": -16.185632705688477, "global_step": 1327, "epoch": 10} {"train_loss": -16.334753036499023, "global_step": 1328, "epoch": 10} {"train_loss": -16.503101348876953, "global_step": 1329, "epoch": 10} {"train_loss": -16.741107081578782, "global_step": 1330, "epoch": 10, "val_loss": 3404170.75} {"train_loss": -16.44879722595215, "global_step": 1331, "epoch": 11} {"train_loss": -16.134801864624023, "global_step": 1332, "epoch": 11} {"train_loss": -16.858753204345703, "global_step": 1333, "epoch": 11} {"train_loss": -16.610136032104492, "global_step": 1334, "epoch": 11} {"train_loss": -16.48020362854004, "global_step": 1335, "epoch": 11} {"train_loss": -16.44289207458496, "global_step": 1336, "epoch": 11} {"train_loss": -16.892887115478516, "global_step": 1337, "epoch": 11} {"train_loss": -16.946195602416992, "global_step": 1338, "epoch": 11} {"train_loss": -16.590829849243164, "global_step": 1339, "epoch": 11} {"train_loss": -16.584030151367188, "global_step": 1340, "epoch": 11} {"train_loss": -16.493696212768555, "global_step": 1341, "epoch": 11} {"train_loss": -16.752716064453125, "global_step": 1342, "epoch": 11} {"train_loss": -16.974966049194336, "global_step": 1343, "epoch": 11} {"train_loss": -16.409507751464844, "global_step": 1344, "epoch": 11} {"train_loss": -16.497007369995117, "global_step": 1345, "epoch": 11} {"train_loss": -16.17791748046875, "global_step": 1346, "epoch": 11} {"train_loss": -17.018220901489258, "global_step": 1347, "epoch": 11} {"train_loss": -16.25397300720215, "global_step": 1348, "epoch": 11} {"train_loss": -16.978805541992188, "global_step": 1349, "epoch": 11} {"train_loss": -16.590036392211914, "global_step": 1350, "epoch": 11} {"train_loss": -16.769376754760742, "global_step": 1351, "epoch": 11} {"train_loss": -16.673297882080078, "global_step": 1352, "epoch": 11} {"train_loss": -16.63237190246582, "global_step": 1353, "epoch": 11} {"train_loss": -17.00925636291504, "global_step": 1354, "epoch": 11} {"train_loss": -17.25243377685547, "global_step": 1355, "epoch": 11} {"train_loss": -16.764291763305664, "global_step": 1356, "epoch": 11} {"train_loss": -16.58989906311035, "global_step": 1357, "epoch": 11} {"train_loss": -16.570226669311523, "global_step": 1358, "epoch": 11} {"train_loss": -16.951499938964844, "global_step": 1359, "epoch": 11} {"train_loss": -16.86659049987793, "global_step": 1360, "epoch": 11} {"train_loss": -17.04618263244629, "global_step": 1361, "epoch": 11} {"train_loss": -16.31777000427246, "global_step": 1362, "epoch": 11} {"train_loss": -16.75593376159668, "global_step": 1363, "epoch": 11} {"train_loss": -15.966937065124512, "global_step": 1364, "epoch": 11} {"train_loss": -17.02457618713379, "global_step": 1365, "epoch": 11} {"train_loss": -16.753509521484375, "global_step": 1366, "epoch": 11} {"train_loss": -17.415576934814453, "global_step": 1367, "epoch": 11} {"train_loss": -17.151077270507812, "global_step": 1368, "epoch": 11} {"train_loss": -16.642478942871094, "global_step": 1369, "epoch": 11} {"train_loss": -16.907873153686523, "global_step": 1370, "epoch": 11} {"train_loss": -16.601865768432617, "global_step": 1371, "epoch": 11} {"train_loss": -17.003767013549805, "global_step": 1372, "epoch": 11} {"train_loss": -17.144498825073242, "global_step": 1373, "epoch": 11} {"train_loss": -17.6092586517334, "global_step": 1374, "epoch": 11} {"train_loss": -17.34300422668457, "global_step": 1375, "epoch": 11} {"train_loss": -16.805334091186523, "global_step": 1376, "epoch": 11} {"train_loss": -17.433101654052734, "global_step": 1377, "epoch": 11} {"train_loss": -16.99871826171875, "global_step": 1378, "epoch": 11} {"train_loss": -17.312231063842773, "global_step": 1379, "epoch": 11} {"train_loss": -16.83053207397461, "global_step": 1380, "epoch": 11} {"train_loss": -17.011201858520508, "global_step": 1381, "epoch": 11} {"train_loss": -17.1787166595459, "global_step": 1382, "epoch": 11} {"train_loss": -16.492008209228516, "global_step": 1383, "epoch": 11} {"train_loss": -17.071773529052734, "global_step": 1384, "epoch": 11} {"train_loss": -16.933795928955078, "global_step": 1385, "epoch": 11} {"train_loss": -16.455862045288086, "global_step": 1386, "epoch": 11} {"train_loss": -16.543699264526367, "global_step": 1387, "epoch": 11} {"train_loss": -16.710371017456055, "global_step": 1388, "epoch": 11} {"train_loss": -17.206735610961914, "global_step": 1389, "epoch": 11} {"train_loss": -16.52447509765625, "global_step": 1390, "epoch": 11} {"train_loss": -17.070655822753906, "global_step": 1391, "epoch": 11} {"train_loss": -17.323781967163086, "global_step": 1392, "epoch": 11} {"train_loss": -16.62897300720215, "global_step": 1393, "epoch": 11} {"train_loss": -16.5753231048584, "global_step": 1394, "epoch": 11} {"train_loss": -17.025104522705078, "global_step": 1395, "epoch": 11} {"train_loss": -17.1120662689209, "global_step": 1396, "epoch": 11} {"train_loss": -16.796695709228516, "global_step": 1397, "epoch": 11} {"train_loss": -17.284011840820312, "global_step": 1398, "epoch": 11} {"train_loss": -17.431232452392578, "global_step": 1399, "epoch": 11} {"train_loss": -16.59290885925293, "global_step": 1400, "epoch": 11} {"train_loss": -16.92574119567871, "global_step": 1401, "epoch": 11} {"train_loss": -16.954477310180664, "global_step": 1402, "epoch": 11} {"train_loss": -17.13649559020996, "global_step": 1403, "epoch": 11} {"train_loss": -17.1549015045166, "global_step": 1404, "epoch": 11} {"train_loss": -17.09050941467285, "global_step": 1405, "epoch": 11} {"train_loss": -17.01791763305664, "global_step": 1406, "epoch": 11} {"train_loss": -17.174619674682617, "global_step": 1407, "epoch": 11} {"train_loss": -17.435958862304688, "global_step": 1408, "epoch": 11} {"train_loss": -16.801294326782227, "global_step": 1409, "epoch": 11} {"train_loss": -16.728294372558594, "global_step": 1410, "epoch": 11} {"train_loss": -16.671579360961914, "global_step": 1411, "epoch": 11} {"train_loss": -17.510757446289062, "global_step": 1412, "epoch": 11} {"train_loss": -16.723636627197266, "global_step": 1413, "epoch": 11} {"train_loss": -16.9241886138916, "global_step": 1414, "epoch": 11} {"train_loss": -16.89425277709961, "global_step": 1415, "epoch": 11} {"train_loss": -17.097761154174805, "global_step": 1416, "epoch": 11} {"train_loss": -16.771068572998047, "global_step": 1417, "epoch": 11} {"train_loss": -17.00215721130371, "global_step": 1418, "epoch": 11} {"train_loss": -17.442337036132812, "global_step": 1419, "epoch": 11} {"train_loss": -16.6204891204834, "global_step": 1420, "epoch": 11} {"train_loss": -16.9918270111084, "global_step": 1421, "epoch": 11} {"train_loss": -16.930784225463867, "global_step": 1422, "epoch": 11} {"train_loss": -16.799129486083984, "global_step": 1423, "epoch": 11} {"train_loss": -17.40406608581543, "global_step": 1424, "epoch": 11} {"train_loss": -17.039710998535156, "global_step": 1425, "epoch": 11} {"train_loss": -16.975732803344727, "global_step": 1426, "epoch": 11} {"train_loss": -16.99969482421875, "global_step": 1427, "epoch": 11} {"train_loss": -17.02571678161621, "global_step": 1428, "epoch": 11} {"train_loss": -17.042591094970703, "global_step": 1429, "epoch": 11} {"train_loss": -16.929616928100586, "global_step": 1430, "epoch": 11} {"train_loss": -17.054931640625, "global_step": 1431, "epoch": 11} {"train_loss": -16.06532096862793, "global_step": 1432, "epoch": 11} {"train_loss": -17.052793502807617, "global_step": 1433, "epoch": 11} {"train_loss": -16.37563133239746, "global_step": 1434, "epoch": 11} {"train_loss": -16.983659744262695, "global_step": 1435, "epoch": 11} {"train_loss": -16.707340240478516, "global_step": 1436, "epoch": 11} {"train_loss": -17.20960807800293, "global_step": 1437, "epoch": 11} {"train_loss": -17.130558013916016, "global_step": 1438, "epoch": 11} {"train_loss": -16.75899314880371, "global_step": 1439, "epoch": 11} {"train_loss": -17.314525604248047, "global_step": 1440, "epoch": 11} {"train_loss": -15.968347549438477, "global_step": 1441, "epoch": 11} {"train_loss": -17.065837860107422, "global_step": 1442, "epoch": 11} {"train_loss": -16.396455764770508, "global_step": 1443, "epoch": 11} {"train_loss": -16.726125717163086, "global_step": 1444, "epoch": 11} {"train_loss": -17.06117057800293, "global_step": 1445, "epoch": 11} {"train_loss": -17.028831481933594, "global_step": 1446, "epoch": 11} {"train_loss": -17.28272247314453, "global_step": 1447, "epoch": 11} {"train_loss": -17.183969497680664, "global_step": 1448, "epoch": 11} {"train_loss": -16.78374671936035, "global_step": 1449, "epoch": 11} {"train_loss": -16.87135887145996, "global_step": 1450, "epoch": 11} {"train_loss": -16.87051724993493, "global_step": 1451, "epoch": 11, "val_loss": 3054448.75} {"train_loss": -17.143238067626953, "global_step": 1452, "epoch": 12} {"train_loss": -16.934446334838867, "global_step": 1453, "epoch": 12} {"train_loss": -16.376506805419922, "global_step": 1454, "epoch": 12} {"train_loss": -17.046905517578125, "global_step": 1455, "epoch": 12} {"train_loss": -16.830537796020508, "global_step": 1456, "epoch": 12} {"train_loss": -16.417892456054688, "global_step": 1457, "epoch": 12} {"train_loss": -17.11263656616211, "global_step": 1458, "epoch": 12} {"train_loss": -17.04084587097168, "global_step": 1459, "epoch": 12} {"train_loss": -16.92720603942871, "global_step": 1460, "epoch": 12} {"train_loss": -17.071372985839844, "global_step": 1461, "epoch": 12} {"train_loss": -16.880399703979492, "global_step": 1462, "epoch": 12} {"train_loss": -16.701557159423828, "global_step": 1463, "epoch": 12} {"train_loss": -16.734983444213867, "global_step": 1464, "epoch": 12} {"train_loss": -16.18764877319336, "global_step": 1465, "epoch": 12} {"train_loss": -16.60567283630371, "global_step": 1466, "epoch": 12} {"train_loss": -16.687238693237305, "global_step": 1467, "epoch": 12} {"train_loss": -15.743788719177246, "global_step": 1468, "epoch": 12} {"train_loss": -16.479066848754883, "global_step": 1469, "epoch": 12} {"train_loss": -16.22887420654297, "global_step": 1470, "epoch": 12} {"train_loss": -16.617420196533203, "global_step": 1471, "epoch": 12} {"train_loss": -16.31583023071289, "global_step": 1472, "epoch": 12} {"train_loss": -16.84661865234375, "global_step": 1473, "epoch": 12} {"train_loss": -17.141164779663086, "global_step": 1474, "epoch": 12} {"train_loss": -16.95132827758789, "global_step": 1475, "epoch": 12} {"train_loss": -16.8282470703125, "global_step": 1476, "epoch": 12} {"train_loss": -17.247289657592773, "global_step": 1477, "epoch": 12} {"train_loss": -17.00687026977539, "global_step": 1478, "epoch": 12} {"train_loss": -17.100330352783203, "global_step": 1479, "epoch": 12} {"train_loss": -17.067171096801758, "global_step": 1480, "epoch": 12} {"train_loss": -16.716686248779297, "global_step": 1481, "epoch": 12} {"train_loss": -16.79624366760254, "global_step": 1482, "epoch": 12} {"train_loss": -17.38620376586914, "global_step": 1483, "epoch": 12} {"train_loss": -16.99212074279785, "global_step": 1484, "epoch": 12} {"train_loss": -17.1272029876709, "global_step": 1485, "epoch": 12} {"train_loss": -17.39979362487793, "global_step": 1486, "epoch": 12} {"train_loss": -16.863157272338867, "global_step": 1487, "epoch": 12} {"train_loss": -17.224105834960938, "global_step": 1488, "epoch": 12} {"train_loss": -17.054529190063477, "global_step": 1489, "epoch": 12} {"train_loss": -17.028188705444336, "global_step": 1490, "epoch": 12} {"train_loss": -16.486862182617188, "global_step": 1491, "epoch": 12} {"train_loss": -16.90007972717285, "global_step": 1492, "epoch": 12} {"train_loss": -17.309682846069336, "global_step": 1493, "epoch": 12} {"train_loss": -17.050016403198242, "global_step": 1494, "epoch": 12} {"train_loss": -17.360586166381836, "global_step": 1495, "epoch": 12} {"train_loss": -17.192705154418945, "global_step": 1496, "epoch": 12} {"train_loss": -17.354949951171875, "global_step": 1497, "epoch": 12} {"train_loss": -16.736509323120117, "global_step": 1498, "epoch": 12} {"train_loss": -16.899492263793945, "global_step": 1499, "epoch": 12} {"train_loss": -16.412965774536133, "global_step": 1500, "epoch": 12} {"train_loss": -16.574148178100586, "global_step": 1501, "epoch": 12} {"train_loss": -16.605268478393555, "global_step": 1502, "epoch": 12} {"train_loss": -16.723453521728516, "global_step": 1503, "epoch": 12} {"train_loss": -17.167030334472656, "global_step": 1504, "epoch": 12} {"train_loss": -17.068130493164062, "global_step": 1505, "epoch": 12} {"train_loss": -16.885183334350586, "global_step": 1506, "epoch": 12} {"train_loss": -17.11858558654785, "global_step": 1507, "epoch": 12} {"train_loss": -17.3370304107666, "global_step": 1508, "epoch": 12} {"train_loss": -17.095911026000977, "global_step": 1509, "epoch": 12} {"train_loss": -16.929658889770508, "global_step": 1510, "epoch": 12} {"train_loss": -16.801715850830078, "global_step": 1511, "epoch": 12} {"train_loss": -17.40515899658203, "global_step": 1512, "epoch": 12} {"train_loss": -16.58112907409668, "global_step": 1513, "epoch": 12} {"train_loss": -17.298749923706055, "global_step": 1514, "epoch": 12} {"train_loss": -16.01494598388672, "global_step": 1515, "epoch": 12} {"train_loss": -17.179594039916992, "global_step": 1516, "epoch": 12} {"train_loss": -16.789976119995117, "global_step": 1517, "epoch": 12} {"train_loss": -16.83043098449707, "global_step": 1518, "epoch": 12} {"train_loss": -16.72002601623535, "global_step": 1519, "epoch": 12} {"train_loss": -16.69611930847168, "global_step": 1520, "epoch": 12} {"train_loss": -17.4544677734375, "global_step": 1521, "epoch": 12} {"train_loss": -17.596162796020508, "global_step": 1522, "epoch": 12} {"train_loss": -17.142629623413086, "global_step": 1523, "epoch": 12} {"train_loss": -17.00998306274414, "global_step": 1524, "epoch": 12} {"train_loss": -17.181272506713867, "global_step": 1525, "epoch": 12} {"train_loss": -17.477054595947266, "global_step": 1526, "epoch": 12} {"train_loss": -16.826902389526367, "global_step": 1527, "epoch": 12} {"train_loss": -17.2989501953125, "global_step": 1528, "epoch": 12} {"train_loss": -16.86865234375, "global_step": 1529, "epoch": 12} {"train_loss": -17.23369789123535, "global_step": 1530, "epoch": 12} {"train_loss": -17.8067684173584, "global_step": 1531, "epoch": 12} {"train_loss": -16.614484786987305, "global_step": 1532, "epoch": 12} {"train_loss": -17.452486038208008, "global_step": 1533, "epoch": 12} {"train_loss": -16.83014488220215, "global_step": 1534, "epoch": 12} {"train_loss": -17.39697265625, "global_step": 1535, "epoch": 12} {"train_loss": -16.75873374938965, "global_step": 1536, "epoch": 12} {"train_loss": -17.08112335205078, "global_step": 1537, "epoch": 12} {"train_loss": -16.30660057067871, "global_step": 1538, "epoch": 12} {"train_loss": -17.58440589904785, "global_step": 1539, "epoch": 12} {"train_loss": -17.371259689331055, "global_step": 1540, "epoch": 12} {"train_loss": -16.911893844604492, "global_step": 1541, "epoch": 12} {"train_loss": -16.406829833984375, "global_step": 1542, "epoch": 12} {"train_loss": -16.995731353759766, "global_step": 1543, "epoch": 12} {"train_loss": -16.871170043945312, "global_step": 1544, "epoch": 12} {"train_loss": -16.731903076171875, "global_step": 1545, "epoch": 12} {"train_loss": -17.403091430664062, "global_step": 1546, "epoch": 12} {"train_loss": -16.90422821044922, "global_step": 1547, "epoch": 12} {"train_loss": -17.551645278930664, "global_step": 1548, "epoch": 12} {"train_loss": -16.955087661743164, "global_step": 1549, "epoch": 12} {"train_loss": -17.20389175415039, "global_step": 1550, "epoch": 12} {"train_loss": -16.841257095336914, "global_step": 1551, "epoch": 12} {"train_loss": -16.491376876831055, "global_step": 1552, "epoch": 12} {"train_loss": -17.01447105407715, "global_step": 1553, "epoch": 12} {"train_loss": -16.81654930114746, "global_step": 1554, "epoch": 12} {"train_loss": -17.35926628112793, "global_step": 1555, "epoch": 12} {"train_loss": -16.529052734375, "global_step": 1556, "epoch": 12} {"train_loss": -16.999866485595703, "global_step": 1557, "epoch": 12} {"train_loss": -17.255590438842773, "global_step": 1558, "epoch": 12} {"train_loss": -16.7196044921875, "global_step": 1559, "epoch": 12} {"train_loss": -17.394330978393555, "global_step": 1560, "epoch": 12} {"train_loss": -16.918994903564453, "global_step": 1561, "epoch": 12} {"train_loss": -16.438425064086914, "global_step": 1562, "epoch": 12} {"train_loss": -17.198274612426758, "global_step": 1563, "epoch": 12} {"train_loss": -16.748701095581055, "global_step": 1564, "epoch": 12} {"train_loss": -17.238693237304688, "global_step": 1565, "epoch": 12} {"train_loss": -17.163984298706055, "global_step": 1566, "epoch": 12} {"train_loss": -17.257699966430664, "global_step": 1567, "epoch": 12} {"train_loss": -17.020700454711914, "global_step": 1568, "epoch": 12} {"train_loss": -16.973119735717773, "global_step": 1569, "epoch": 12} {"train_loss": -17.015588760375977, "global_step": 1570, "epoch": 12} {"train_loss": -16.501434326171875, "global_step": 1571, "epoch": 12} {"train_loss": -16.94660720352299, "global_step": 1572, "epoch": 12, "val_loss": 3194981.0} {"train_loss": -17.118562698364258, "global_step": 1573, "epoch": 13} {"train_loss": -16.898990631103516, "global_step": 1574, "epoch": 13} {"train_loss": -17.24260711669922, "global_step": 1575, "epoch": 13} {"train_loss": -16.785852432250977, "global_step": 1576, "epoch": 13} {"train_loss": -17.392637252807617, "global_step": 1577, "epoch": 13} {"train_loss": -16.3022518157959, "global_step": 1578, "epoch": 13} {"train_loss": -17.402305603027344, "global_step": 1579, "epoch": 13} {"train_loss": -16.703411102294922, "global_step": 1580, "epoch": 13} {"train_loss": -16.914493560791016, "global_step": 1581, "epoch": 13} {"train_loss": -17.70539665222168, "global_step": 1582, "epoch": 13} {"train_loss": -16.765689849853516, "global_step": 1583, "epoch": 13} {"train_loss": -17.424728393554688, "global_step": 1584, "epoch": 13} {"train_loss": -16.778608322143555, "global_step": 1585, "epoch": 13} {"train_loss": -17.160873413085938, "global_step": 1586, "epoch": 13} {"train_loss": -17.648876190185547, "global_step": 1587, "epoch": 13} {"train_loss": -17.259353637695312, "global_step": 1588, "epoch": 13} {"train_loss": -16.885828018188477, "global_step": 1589, "epoch": 13} {"train_loss": -17.622695922851562, "global_step": 1590, "epoch": 13} {"train_loss": -17.06818962097168, "global_step": 1591, "epoch": 13} {"train_loss": -17.12741470336914, "global_step": 1592, "epoch": 13} {"train_loss": -16.897294998168945, "global_step": 1593, "epoch": 13} {"train_loss": -17.20524024963379, "global_step": 1594, "epoch": 13} {"train_loss": -17.125524520874023, "global_step": 1595, "epoch": 13} {"train_loss": -17.18246841430664, "global_step": 1596, "epoch": 13} {"train_loss": -17.205293655395508, "global_step": 1597, "epoch": 13} {"train_loss": -16.7023868560791, "global_step": 1598, "epoch": 13} {"train_loss": -17.296106338500977, "global_step": 1599, "epoch": 13} {"train_loss": -16.954898834228516, "global_step": 1600, "epoch": 13} {"train_loss": -16.786176681518555, "global_step": 1601, "epoch": 13} {"train_loss": -16.820114135742188, "global_step": 1602, "epoch": 13} {"train_loss": -16.94761848449707, "global_step": 1603, "epoch": 13} {"train_loss": -17.105070114135742, "global_step": 1604, "epoch": 13} {"train_loss": -17.364418029785156, "global_step": 1605, "epoch": 13} {"train_loss": -17.086069107055664, "global_step": 1606, "epoch": 13} {"train_loss": -17.8925838470459, "global_step": 1607, "epoch": 13} {"train_loss": -16.518888473510742, "global_step": 1608, "epoch": 13} {"train_loss": -16.405954360961914, "global_step": 1609, "epoch": 13} {"train_loss": -16.774465560913086, "global_step": 1610, "epoch": 13} {"train_loss": -17.262529373168945, "global_step": 1611, "epoch": 13} {"train_loss": -16.776517868041992, "global_step": 1612, "epoch": 13} {"train_loss": -17.242918014526367, "global_step": 1613, "epoch": 13} {"train_loss": -17.3742618560791, "global_step": 1614, "epoch": 13} {"train_loss": -16.378170013427734, "global_step": 1615, "epoch": 13} {"train_loss": -17.215063095092773, "global_step": 1616, "epoch": 13} {"train_loss": -16.4735107421875, "global_step": 1617, "epoch": 13} {"train_loss": -16.608034133911133, "global_step": 1618, "epoch": 13} {"train_loss": -16.91410255432129, "global_step": 1619, "epoch": 13} {"train_loss": -16.734106063842773, "global_step": 1620, "epoch": 13} {"train_loss": -16.706743240356445, "global_step": 1621, "epoch": 13} {"train_loss": -16.40241241455078, "global_step": 1622, "epoch": 13} {"train_loss": -16.6248722076416, "global_step": 1623, "epoch": 13} {"train_loss": -16.947423934936523, "global_step": 1624, "epoch": 13} {"train_loss": -16.607572555541992, "global_step": 1625, "epoch": 13} {"train_loss": -16.828441619873047, "global_step": 1626, "epoch": 13} {"train_loss": -16.9980411529541, "global_step": 1627, "epoch": 13} {"train_loss": -16.840179443359375, "global_step": 1628, "epoch": 13} {"train_loss": -17.358165740966797, "global_step": 1629, "epoch": 13} {"train_loss": -16.916913986206055, "global_step": 1630, "epoch": 13} {"train_loss": -17.282432556152344, "global_step": 1631, "epoch": 13} {"train_loss": -16.625240325927734, "global_step": 1632, "epoch": 13} {"train_loss": -16.757179260253906, "global_step": 1633, "epoch": 13} {"train_loss": -16.944711685180664, "global_step": 1634, "epoch": 13} {"train_loss": -16.818344116210938, "global_step": 1635, "epoch": 13} {"train_loss": -17.031782150268555, "global_step": 1636, "epoch": 13} {"train_loss": -17.204771041870117, "global_step": 1637, "epoch": 13} {"train_loss": -16.691753387451172, "global_step": 1638, "epoch": 13} {"train_loss": -17.181913375854492, "global_step": 1639, "epoch": 13} {"train_loss": -16.96736717224121, "global_step": 1640, "epoch": 13} {"train_loss": -17.018720626831055, "global_step": 1641, "epoch": 13} {"train_loss": -16.9964599609375, "global_step": 1642, "epoch": 13} {"train_loss": -17.488258361816406, "global_step": 1643, "epoch": 13} {"train_loss": -17.0512752532959, "global_step": 1644, "epoch": 13} {"train_loss": -17.241586685180664, "global_step": 1645, "epoch": 13} {"train_loss": -17.141565322875977, "global_step": 1646, "epoch": 13} {"train_loss": -17.238536834716797, "global_step": 1647, "epoch": 13} {"train_loss": -17.30945587158203, "global_step": 1648, "epoch": 13} {"train_loss": -17.26047134399414, "global_step": 1649, "epoch": 13} {"train_loss": -16.92188835144043, "global_step": 1650, "epoch": 13} {"train_loss": -17.227554321289062, "global_step": 1651, "epoch": 13} {"train_loss": -17.345935821533203, "global_step": 1652, "epoch": 13} {"train_loss": -17.32217788696289, "global_step": 1653, "epoch": 13} {"train_loss": -17.588871002197266, "global_step": 1654, "epoch": 13} {"train_loss": -17.223758697509766, "global_step": 1655, "epoch": 13} {"train_loss": -16.98627471923828, "global_step": 1656, "epoch": 13} {"train_loss": -17.335500717163086, "global_step": 1657, "epoch": 13} {"train_loss": -16.41240882873535, "global_step": 1658, "epoch": 13} {"train_loss": -17.725452423095703, "global_step": 1659, "epoch": 13} {"train_loss": -16.002981185913086, "global_step": 1660, "epoch": 13} {"train_loss": -16.75539207458496, "global_step": 1661, "epoch": 13} {"train_loss": -17.04131317138672, "global_step": 1662, "epoch": 13} {"train_loss": -16.64255714416504, "global_step": 1663, "epoch": 13} {"train_loss": -17.009550094604492, "global_step": 1664, "epoch": 13} {"train_loss": -17.18202018737793, "global_step": 1665, "epoch": 13} {"train_loss": -17.053333282470703, "global_step": 1666, "epoch": 13} {"train_loss": -17.477380752563477, "global_step": 1667, "epoch": 13} {"train_loss": -17.257463455200195, "global_step": 1668, "epoch": 13} {"train_loss": -17.194616317749023, "global_step": 1669, "epoch": 13} {"train_loss": -17.065067291259766, "global_step": 1670, "epoch": 13} {"train_loss": -17.392122268676758, "global_step": 1671, "epoch": 13} {"train_loss": -17.653553009033203, "global_step": 1672, "epoch": 13} {"train_loss": -17.51967430114746, "global_step": 1673, "epoch": 13} {"train_loss": -16.966415405273438, "global_step": 1674, "epoch": 13} {"train_loss": -17.080419540405273, "global_step": 1675, "epoch": 13} {"train_loss": -17.133142471313477, "global_step": 1676, "epoch": 13} {"train_loss": -17.330245971679688, "global_step": 1677, "epoch": 13} {"train_loss": -17.975610733032227, "global_step": 1678, "epoch": 13} {"train_loss": -17.328584671020508, "global_step": 1679, "epoch": 13} {"train_loss": -17.479995727539062, "global_step": 1680, "epoch": 13} {"train_loss": -17.266996383666992, "global_step": 1681, "epoch": 13} {"train_loss": -17.03032875061035, "global_step": 1682, "epoch": 13} {"train_loss": -17.411970138549805, "global_step": 1683, "epoch": 13} {"train_loss": -17.551435470581055, "global_step": 1684, "epoch": 13} {"train_loss": -16.592388153076172, "global_step": 1685, "epoch": 13} {"train_loss": -17.14280128479004, "global_step": 1686, "epoch": 13} {"train_loss": -17.104328155517578, "global_step": 1687, "epoch": 13} {"train_loss": -17.277128219604492, "global_step": 1688, "epoch": 13} {"train_loss": -17.26282501220703, "global_step": 1689, "epoch": 13} {"train_loss": -17.057493209838867, "global_step": 1690, "epoch": 13} {"train_loss": -16.79402732849121, "global_step": 1691, "epoch": 13} {"train_loss": -17.48380470275879, "global_step": 1692, "epoch": 13} {"train_loss": -17.067930300373675, "global_step": 1693, "epoch": 13, "val_loss": 3151266.25} {"train_loss": -16.842016220092773, "global_step": 1694, "epoch": 14} {"train_loss": -17.262304306030273, "global_step": 1695, "epoch": 14} {"train_loss": -17.057096481323242, "global_step": 1696, "epoch": 14} {"train_loss": -17.130931854248047, "global_step": 1697, "epoch": 14} {"train_loss": -17.37335968017578, "global_step": 1698, "epoch": 14} {"train_loss": -16.8621768951416, "global_step": 1699, "epoch": 14} {"train_loss": -17.412084579467773, "global_step": 1700, "epoch": 14} {"train_loss": -17.528587341308594, "global_step": 1701, "epoch": 14} {"train_loss": -17.32063865661621, "global_step": 1702, "epoch": 14} {"train_loss": -16.98948860168457, "global_step": 1703, "epoch": 14} {"train_loss": -17.395771026611328, "global_step": 1704, "epoch": 14} {"train_loss": -16.97652816772461, "global_step": 1705, "epoch": 14} {"train_loss": -17.068241119384766, "global_step": 1706, "epoch": 14} {"train_loss": -17.094297409057617, "global_step": 1707, "epoch": 14} {"train_loss": -17.37969970703125, "global_step": 1708, "epoch": 14} {"train_loss": -17.32576560974121, "global_step": 1709, "epoch": 14} {"train_loss": -17.090368270874023, "global_step": 1710, "epoch": 14} {"train_loss": -17.647138595581055, "global_step": 1711, "epoch": 14} {"train_loss": -17.396154403686523, "global_step": 1712, "epoch": 14} {"train_loss": -16.918500900268555, "global_step": 1713, "epoch": 14} {"train_loss": -16.84967041015625, "global_step": 1714, "epoch": 14} {"train_loss": -17.297021865844727, "global_step": 1715, "epoch": 14} {"train_loss": -17.140151977539062, "global_step": 1716, "epoch": 14} {"train_loss": -17.690664291381836, "global_step": 1717, "epoch": 14} {"train_loss": -17.2275333404541, "global_step": 1718, "epoch": 14} {"train_loss": -17.597972869873047, "global_step": 1719, "epoch": 14} {"train_loss": -17.52324104309082, "global_step": 1720, "epoch": 14} {"train_loss": -17.63154411315918, "global_step": 1721, "epoch": 14} {"train_loss": -17.603506088256836, "global_step": 1722, "epoch": 14} {"train_loss": -17.491750717163086, "global_step": 1723, "epoch": 14} {"train_loss": -17.30128288269043, "global_step": 1724, "epoch": 14} {"train_loss": -17.423437118530273, "global_step": 1725, "epoch": 14} {"train_loss": -17.44904136657715, "global_step": 1726, "epoch": 14} {"train_loss": -17.141162872314453, "global_step": 1727, "epoch": 14} {"train_loss": -17.15794563293457, "global_step": 1728, "epoch": 14} {"train_loss": -17.31017303466797, "global_step": 1729, "epoch": 14} {"train_loss": -17.050825119018555, "global_step": 1730, "epoch": 14} {"train_loss": -17.445953369140625, "global_step": 1731, "epoch": 14} {"train_loss": -16.887704849243164, "global_step": 1732, "epoch": 14} {"train_loss": -17.46051597595215, "global_step": 1733, "epoch": 14} {"train_loss": -17.126319885253906, "global_step": 1734, "epoch": 14} {"train_loss": -17.30925178527832, "global_step": 1735, "epoch": 14} {"train_loss": -17.574905395507812, "global_step": 1736, "epoch": 14} {"train_loss": -17.03944969177246, "global_step": 1737, "epoch": 14} {"train_loss": -17.64484214782715, "global_step": 1738, "epoch": 14} {"train_loss": -17.510883331298828, "global_step": 1739, "epoch": 14} {"train_loss": -17.566722869873047, "global_step": 1740, "epoch": 14} {"train_loss": -17.215749740600586, "global_step": 1741, "epoch": 14} {"train_loss": -16.97150993347168, "global_step": 1742, "epoch": 14} {"train_loss": -17.593297958374023, "global_step": 1743, "epoch": 14} {"train_loss": -16.471332550048828, "global_step": 1744, "epoch": 14} {"train_loss": -17.6727294921875, "global_step": 1745, "epoch": 14} {"train_loss": -16.903120040893555, "global_step": 1746, "epoch": 14} {"train_loss": -16.94402503967285, "global_step": 1747, "epoch": 14} {"train_loss": -17.598426818847656, "global_step": 1748, "epoch": 14} {"train_loss": -17.25922966003418, "global_step": 1749, "epoch": 14} {"train_loss": -17.362239837646484, "global_step": 1750, "epoch": 14} {"train_loss": -17.378217697143555, "global_step": 1751, "epoch": 14} {"train_loss": -17.849384307861328, "global_step": 1752, "epoch": 14} {"train_loss": -16.825878143310547, "global_step": 1753, "epoch": 14} {"train_loss": -17.16495704650879, "global_step": 1754, "epoch": 14} {"train_loss": -17.45415687561035, "global_step": 1755, "epoch": 14} {"train_loss": -17.098915100097656, "global_step": 1756, "epoch": 14} {"train_loss": -16.809356689453125, "global_step": 1757, "epoch": 14} {"train_loss": -17.120115280151367, "global_step": 1758, "epoch": 14} {"train_loss": -17.223134994506836, "global_step": 1759, "epoch": 14} {"train_loss": -17.531814575195312, "global_step": 1760, "epoch": 14} {"train_loss": -17.510156631469727, "global_step": 1761, "epoch": 14} {"train_loss": -17.414567947387695, "global_step": 1762, "epoch": 14} {"train_loss": -17.4716854095459, "global_step": 1763, "epoch": 14} {"train_loss": -17.914783477783203, "global_step": 1764, "epoch": 14} {"train_loss": -17.113536834716797, "global_step": 1765, "epoch": 14} {"train_loss": -17.4974422454834, "global_step": 1766, "epoch": 14} {"train_loss": -17.388822555541992, "global_step": 1767, "epoch": 14} {"train_loss": -16.892236709594727, "global_step": 1768, "epoch": 14} {"train_loss": -17.32673454284668, "global_step": 1769, "epoch": 14} {"train_loss": -17.608734130859375, "global_step": 1770, "epoch": 14} {"train_loss": -17.496994018554688, "global_step": 1771, "epoch": 14} {"train_loss": -17.689905166625977, "global_step": 1772, "epoch": 14} {"train_loss": -17.017133712768555, "global_step": 1773, "epoch": 14} {"train_loss": -17.264728546142578, "global_step": 1774, "epoch": 14} {"train_loss": -17.64812660217285, "global_step": 1775, "epoch": 14} {"train_loss": -17.242448806762695, "global_step": 1776, "epoch": 14} {"train_loss": -17.35078239440918, "global_step": 1777, "epoch": 14} {"train_loss": -16.650691986083984, "global_step": 1778, "epoch": 14} {"train_loss": -17.31978988647461, "global_step": 1779, "epoch": 14} {"train_loss": -17.251028060913086, "global_step": 1780, "epoch": 14} {"train_loss": -17.395008087158203, "global_step": 1781, "epoch": 14} {"train_loss": -17.603927612304688, "global_step": 1782, "epoch": 14} {"train_loss": -17.19074821472168, "global_step": 1783, "epoch": 14} {"train_loss": -17.702899932861328, "global_step": 1784, "epoch": 14} {"train_loss": -17.505863189697266, "global_step": 1785, "epoch": 14} {"train_loss": -17.302330017089844, "global_step": 1786, "epoch": 14} {"train_loss": -17.06236457824707, "global_step": 1787, "epoch": 14} {"train_loss": -17.6955509185791, "global_step": 1788, "epoch": 14} {"train_loss": -17.070648193359375, "global_step": 1789, "epoch": 14} {"train_loss": -16.971067428588867, "global_step": 1790, "epoch": 14} {"train_loss": -16.990034103393555, "global_step": 1791, "epoch": 14} {"train_loss": -17.5574893951416, "global_step": 1792, "epoch": 14} {"train_loss": -17.529401779174805, "global_step": 1793, "epoch": 14} {"train_loss": -17.669191360473633, "global_step": 1794, "epoch": 14} {"train_loss": -17.18134117126465, "global_step": 1795, "epoch": 14} {"train_loss": -17.842042922973633, "global_step": 1796, "epoch": 14} {"train_loss": -17.17975425720215, "global_step": 1797, "epoch": 14} {"train_loss": -17.33465576171875, "global_step": 1798, "epoch": 14} {"train_loss": -17.503080368041992, "global_step": 1799, "epoch": 14} {"train_loss": -17.494369506835938, "global_step": 1800, "epoch": 14} {"train_loss": -17.638757705688477, "global_step": 1801, "epoch": 14} {"train_loss": -17.345186233520508, "global_step": 1802, "epoch": 14} {"train_loss": -17.35541343688965, "global_step": 1803, "epoch": 14} {"train_loss": -17.11085319519043, "global_step": 1804, "epoch": 14} {"train_loss": -17.479101181030273, "global_step": 1805, "epoch": 14} {"train_loss": -17.52139663696289, "global_step": 1806, "epoch": 14} {"train_loss": -17.745601654052734, "global_step": 1807, "epoch": 14} {"train_loss": -16.675968170166016, "global_step": 1808, "epoch": 14} {"train_loss": -17.360366821289062, "global_step": 1809, "epoch": 14} {"train_loss": -17.184051513671875, "global_step": 1810, "epoch": 14} {"train_loss": -16.77631187438965, "global_step": 1811, "epoch": 14} {"train_loss": -17.957685470581055, "global_step": 1812, "epoch": 14} {"train_loss": -17.116626739501953, "global_step": 1813, "epoch": 14} {"train_loss": -17.31139282352668, "global_step": 1814, "epoch": 14, "val_loss": 3127068.25} {"train_loss": -16.658628463745117, "global_step": 1815, "epoch": 15} {"train_loss": -17.579984664916992, "global_step": 1816, "epoch": 15} {"train_loss": -17.64866065979004, "global_step": 1817, "epoch": 15} {"train_loss": -17.21175765991211, "global_step": 1818, "epoch": 15} {"train_loss": -18.03839874267578, "global_step": 1819, "epoch": 15} {"train_loss": -17.68187713623047, "global_step": 1820, "epoch": 15} {"train_loss": -17.3089656829834, "global_step": 1821, "epoch": 15} {"train_loss": -17.372068405151367, "global_step": 1822, "epoch": 15} {"train_loss": -17.306737899780273, "global_step": 1823, "epoch": 15} {"train_loss": -17.5463924407959, "global_step": 1824, "epoch": 15} {"train_loss": -17.469593048095703, "global_step": 1825, "epoch": 15} {"train_loss": -17.59271812438965, "global_step": 1826, "epoch": 15} {"train_loss": -17.139265060424805, "global_step": 1827, "epoch": 15} {"train_loss": -16.850072860717773, "global_step": 1828, "epoch": 15} {"train_loss": -17.72165870666504, "global_step": 1829, "epoch": 15} {"train_loss": -17.603057861328125, "global_step": 1830, "epoch": 15} {"train_loss": -17.671133041381836, "global_step": 1831, "epoch": 15} {"train_loss": -17.63960075378418, "global_step": 1832, "epoch": 15} {"train_loss": -17.168386459350586, "global_step": 1833, "epoch": 15} {"train_loss": -17.394853591918945, "global_step": 1834, "epoch": 15} {"train_loss": -17.43583106994629, "global_step": 1835, "epoch": 15} {"train_loss": -17.77301597595215, "global_step": 1836, "epoch": 15} {"train_loss": -17.609210968017578, "global_step": 1837, "epoch": 15} {"train_loss": -17.57320213317871, "global_step": 1838, "epoch": 15} {"train_loss": -17.649211883544922, "global_step": 1839, "epoch": 15} {"train_loss": -17.79692840576172, "global_step": 1840, "epoch": 15} {"train_loss": -17.476091384887695, "global_step": 1841, "epoch": 15} {"train_loss": -17.853940963745117, "global_step": 1842, "epoch": 15} {"train_loss": -17.584257125854492, "global_step": 1843, "epoch": 15} {"train_loss": -17.848806381225586, "global_step": 1844, "epoch": 15} {"train_loss": -17.487064361572266, "global_step": 1845, "epoch": 15} {"train_loss": -17.677753448486328, "global_step": 1846, "epoch": 15} {"train_loss": -17.214242935180664, "global_step": 1847, "epoch": 15} {"train_loss": -16.801931381225586, "global_step": 1848, "epoch": 15} {"train_loss": -17.73276710510254, "global_step": 1849, "epoch": 15} {"train_loss": -17.336095809936523, "global_step": 1850, "epoch": 15} {"train_loss": -17.627628326416016, "global_step": 1851, "epoch": 15} {"train_loss": -17.67266082763672, "global_step": 1852, "epoch": 15} {"train_loss": -17.458751678466797, "global_step": 1853, "epoch": 15} {"train_loss": -17.667715072631836, "global_step": 1854, "epoch": 15} {"train_loss": -17.45960807800293, "global_step": 1855, "epoch": 15} {"train_loss": -17.786725997924805, "global_step": 1856, "epoch": 15} {"train_loss": -17.720794677734375, "global_step": 1857, "epoch": 15} {"train_loss": -17.606943130493164, "global_step": 1858, "epoch": 15} {"train_loss": -17.872098922729492, "global_step": 1859, "epoch": 15} {"train_loss": -17.315717697143555, "global_step": 1860, "epoch": 15} {"train_loss": -18.08991813659668, "global_step": 1861, "epoch": 15} {"train_loss": -17.353496551513672, "global_step": 1862, "epoch": 15} {"train_loss": -17.446334838867188, "global_step": 1863, "epoch": 15} {"train_loss": -17.546918869018555, "global_step": 1864, "epoch": 15} {"train_loss": -17.63583755493164, "global_step": 1865, "epoch": 15} {"train_loss": -17.286108016967773, "global_step": 1866, "epoch": 15} {"train_loss": -17.657943725585938, "global_step": 1867, "epoch": 15} {"train_loss": -17.932069778442383, "global_step": 1868, "epoch": 15} {"train_loss": -17.594676971435547, "global_step": 1869, "epoch": 15} {"train_loss": -17.04151725769043, "global_step": 1870, "epoch": 15} {"train_loss": -17.233800888061523, "global_step": 1871, "epoch": 15} {"train_loss": -18.032276153564453, "global_step": 1872, "epoch": 15} {"train_loss": -17.54053497314453, "global_step": 1873, "epoch": 15} {"train_loss": -17.878768920898438, "global_step": 1874, "epoch": 15} {"train_loss": -17.113937377929688, "global_step": 1875, "epoch": 15} {"train_loss": -17.30645179748535, "global_step": 1876, "epoch": 15} {"train_loss": -17.608753204345703, "global_step": 1877, "epoch": 15} {"train_loss": -17.26240348815918, "global_step": 1878, "epoch": 15} {"train_loss": -17.16462516784668, "global_step": 1879, "epoch": 15} {"train_loss": -17.298734664916992, "global_step": 1880, "epoch": 15} {"train_loss": -16.74654197692871, "global_step": 1881, "epoch": 15} {"train_loss": -17.12708854675293, "global_step": 1882, "epoch": 15} {"train_loss": -17.26530647277832, "global_step": 1883, "epoch": 15} {"train_loss": -17.180997848510742, "global_step": 1884, "epoch": 15} {"train_loss": -17.1157169342041, "global_step": 1885, "epoch": 15} {"train_loss": -17.650354385375977, "global_step": 1886, "epoch": 15} {"train_loss": -17.39803123474121, "global_step": 1887, "epoch": 15} {"train_loss": -17.51601219177246, "global_step": 1888, "epoch": 15} {"train_loss": -17.515913009643555, "global_step": 1889, "epoch": 15} {"train_loss": -16.967641830444336, "global_step": 1890, "epoch": 15} {"train_loss": -17.61815071105957, "global_step": 1891, "epoch": 15} {"train_loss": -17.738821029663086, "global_step": 1892, "epoch": 15} {"train_loss": -17.363731384277344, "global_step": 1893, "epoch": 15} {"train_loss": -17.4506778717041, "global_step": 1894, "epoch": 15} {"train_loss": -17.634382247924805, "global_step": 1895, "epoch": 15} {"train_loss": -17.105581283569336, "global_step": 1896, "epoch": 15} {"train_loss": -17.730243682861328, "global_step": 1897, "epoch": 15} {"train_loss": -18.121444702148438, "global_step": 1898, "epoch": 15} {"train_loss": -17.409841537475586, "global_step": 1899, "epoch": 15} {"train_loss": -17.723590850830078, "global_step": 1900, "epoch": 15} {"train_loss": -17.537343978881836, "global_step": 1901, "epoch": 15} {"train_loss": -17.407794952392578, "global_step": 1902, "epoch": 15} {"train_loss": -17.448095321655273, "global_step": 1903, "epoch": 15} {"train_loss": -17.77872085571289, "global_step": 1904, "epoch": 15} {"train_loss": -17.61531639099121, "global_step": 1905, "epoch": 15} {"train_loss": -17.82942771911621, "global_step": 1906, "epoch": 15} {"train_loss": -17.749570846557617, "global_step": 1907, "epoch": 15} {"train_loss": -17.371322631835938, "global_step": 1908, "epoch": 15} {"train_loss": -17.53369140625, "global_step": 1909, "epoch": 15} {"train_loss": -17.825275421142578, "global_step": 1910, "epoch": 15} {"train_loss": -17.291929244995117, "global_step": 1911, "epoch": 15} {"train_loss": -17.648550033569336, "global_step": 1912, "epoch": 15} {"train_loss": -16.81756591796875, "global_step": 1913, "epoch": 15} {"train_loss": -17.507015228271484, "global_step": 1914, "epoch": 15} {"train_loss": -17.028297424316406, "global_step": 1915, "epoch": 15} {"train_loss": -17.114437103271484, "global_step": 1916, "epoch": 15} {"train_loss": -17.483041763305664, "global_step": 1917, "epoch": 15} {"train_loss": -16.79298210144043, "global_step": 1918, "epoch": 15} {"train_loss": -17.7015380859375, "global_step": 1919, "epoch": 15} {"train_loss": -17.45069122314453, "global_step": 1920, "epoch": 15} {"train_loss": -17.23512077331543, "global_step": 1921, "epoch": 15} {"train_loss": -17.545928955078125, "global_step": 1922, "epoch": 15} {"train_loss": -16.72407341003418, "global_step": 1923, "epoch": 15} {"train_loss": -17.738636016845703, "global_step": 1924, "epoch": 15} {"train_loss": -17.677255630493164, "global_step": 1925, "epoch": 15} {"train_loss": -17.32062339782715, "global_step": 1926, "epoch": 15} {"train_loss": -17.528961181640625, "global_step": 1927, "epoch": 15} {"train_loss": -16.939176559448242, "global_step": 1928, "epoch": 15} {"train_loss": -17.538427352905273, "global_step": 1929, "epoch": 15} {"train_loss": -17.52228355407715, "global_step": 1930, "epoch": 15} {"train_loss": -17.32893943786621, "global_step": 1931, "epoch": 15} {"train_loss": -17.467426300048828, "global_step": 1932, "epoch": 15} {"train_loss": -17.595178604125977, "global_step": 1933, "epoch": 15} {"train_loss": -17.913969039916992, "global_step": 1934, "epoch": 15} {"train_loss": -17.47297889141997, "global_step": 1935, "epoch": 15, "val_loss": 3259945.0} {"train_loss": -18.040298461914062, "global_step": 1936, "epoch": 16} {"train_loss": -17.972293853759766, "global_step": 1937, "epoch": 16} {"train_loss": -17.32953453063965, "global_step": 1938, "epoch": 16} {"train_loss": -17.749099731445312, "global_step": 1939, "epoch": 16} {"train_loss": -17.151020050048828, "global_step": 1940, "epoch": 16} {"train_loss": -17.71440315246582, "global_step": 1941, "epoch": 16} {"train_loss": -16.897329330444336, "global_step": 1942, "epoch": 16} {"train_loss": -17.08017349243164, "global_step": 1943, "epoch": 16} {"train_loss": -17.247705459594727, "global_step": 1944, "epoch": 16} {"train_loss": -17.441787719726562, "global_step": 1945, "epoch": 16} {"train_loss": -17.268653869628906, "global_step": 1946, "epoch": 16} {"train_loss": -17.601041793823242, "global_step": 1947, "epoch": 16} {"train_loss": -16.957401275634766, "global_step": 1948, "epoch": 16} {"train_loss": -17.726999282836914, "global_step": 1949, "epoch": 16} {"train_loss": -17.027999877929688, "global_step": 1950, "epoch": 16} {"train_loss": -17.14705467224121, "global_step": 1951, "epoch": 16} {"train_loss": -17.411762237548828, "global_step": 1952, "epoch": 16} {"train_loss": -17.18794059753418, "global_step": 1953, "epoch": 16} {"train_loss": -16.847015380859375, "global_step": 1954, "epoch": 16} {"train_loss": -16.968900680541992, "global_step": 1955, "epoch": 16} {"train_loss": -17.401098251342773, "global_step": 1956, "epoch": 16} {"train_loss": -16.597915649414062, "global_step": 1957, "epoch": 16} {"train_loss": -17.434507369995117, "global_step": 1958, "epoch": 16} {"train_loss": -17.709882736206055, "global_step": 1959, "epoch": 16} {"train_loss": -17.311803817749023, "global_step": 1960, "epoch": 16} {"train_loss": -17.28127098083496, "global_step": 1961, "epoch": 16} {"train_loss": -17.078439712524414, "global_step": 1962, "epoch": 16} {"train_loss": -17.22193145751953, "global_step": 1963, "epoch": 16} {"train_loss": -17.222095489501953, "global_step": 1964, "epoch": 16} {"train_loss": -17.398054122924805, "global_step": 1965, "epoch": 16} {"train_loss": -17.353145599365234, "global_step": 1966, "epoch": 16} {"train_loss": -17.392362594604492, "global_step": 1967, "epoch": 16} {"train_loss": -17.323223114013672, "global_step": 1968, "epoch": 16} {"train_loss": -17.373754501342773, "global_step": 1969, "epoch": 16} {"train_loss": -16.53249740600586, "global_step": 1970, "epoch": 16} {"train_loss": -17.64134407043457, "global_step": 1971, "epoch": 16} {"train_loss": -17.54266357421875, "global_step": 1972, "epoch": 16} {"train_loss": -17.997434616088867, "global_step": 1973, "epoch": 16} {"train_loss": -17.822660446166992, "global_step": 1974, "epoch": 16} {"train_loss": -17.436779022216797, "global_step": 1975, "epoch": 16} {"train_loss": -17.473485946655273, "global_step": 1976, "epoch": 16} {"train_loss": -17.258743286132812, "global_step": 1977, "epoch": 16} {"train_loss": -17.76323890686035, "global_step": 1978, "epoch": 16} {"train_loss": -16.089941024780273, "global_step": 1979, "epoch": 16} {"train_loss": -17.153905868530273, "global_step": 1980, "epoch": 16} {"train_loss": -17.457372665405273, "global_step": 1981, "epoch": 16} {"train_loss": -17.56110191345215, "global_step": 1982, "epoch": 16} {"train_loss": -17.267364501953125, "global_step": 1983, "epoch": 16} {"train_loss": -17.91281509399414, "global_step": 1984, "epoch": 16} {"train_loss": -18.02241325378418, "global_step": 1985, "epoch": 16} {"train_loss": -17.417869567871094, "global_step": 1986, "epoch": 16} {"train_loss": -17.74199867248535, "global_step": 1987, "epoch": 16} {"train_loss": -17.668521881103516, "global_step": 1988, "epoch": 16} {"train_loss": -17.687795639038086, "global_step": 1989, "epoch": 16} {"train_loss": -17.961124420166016, "global_step": 1990, "epoch": 16} {"train_loss": -17.718711853027344, "global_step": 1991, "epoch": 16} {"train_loss": -18.084903717041016, "global_step": 1992, "epoch": 16} {"train_loss": -17.519031524658203, "global_step": 1993, "epoch": 16} {"train_loss": -17.338010787963867, "global_step": 1994, "epoch": 16} {"train_loss": -17.724313735961914, "global_step": 1995, "epoch": 16} {"train_loss": -17.57712745666504, "global_step": 1996, "epoch": 16} {"train_loss": -17.57391929626465, "global_step": 1997, "epoch": 16} {"train_loss": -17.958463668823242, "global_step": 1998, "epoch": 16} {"train_loss": -17.553274154663086, "global_step": 1999, "epoch": 16} {"train_loss": -17.796979904174805, "global_step": 2000, "epoch": 16} {"train_loss": -17.5338191986084, "global_step": 2001, "epoch": 16} {"train_loss": -16.9372501373291, "global_step": 2002, "epoch": 16} {"train_loss": -17.40143394470215, "global_step": 2003, "epoch": 16} {"train_loss": -17.172943115234375, "global_step": 2004, "epoch": 16} {"train_loss": -17.896665573120117, "global_step": 2005, "epoch": 16} {"train_loss": -16.96302604675293, "global_step": 2006, "epoch": 16} {"train_loss": -17.177553176879883, "global_step": 2007, "epoch": 16} {"train_loss": -17.27412223815918, "global_step": 2008, "epoch": 16} {"train_loss": -17.439224243164062, "global_step": 2009, "epoch": 16} {"train_loss": -17.647319793701172, "global_step": 2010, "epoch": 16} {"train_loss": -17.64015769958496, "global_step": 2011, "epoch": 16} {"train_loss": -17.54129981994629, "global_step": 2012, "epoch": 16} {"train_loss": -17.881521224975586, "global_step": 2013, "epoch": 16} {"train_loss": -17.655160903930664, "global_step": 2014, "epoch": 16} {"train_loss": -17.668195724487305, "global_step": 2015, "epoch": 16} {"train_loss": -17.393625259399414, "global_step": 2016, "epoch": 16} {"train_loss": -17.764196395874023, "global_step": 2017, "epoch": 16} {"train_loss": -17.997900009155273, "global_step": 2018, "epoch": 16} {"train_loss": -18.125951766967773, "global_step": 2019, "epoch": 16} {"train_loss": -17.894657135009766, "global_step": 2020, "epoch": 16} {"train_loss": -17.9354305267334, "global_step": 2021, "epoch": 16} {"train_loss": -17.456872940063477, "global_step": 2022, "epoch": 16} {"train_loss": -18.132614135742188, "global_step": 2023, "epoch": 16} {"train_loss": -18.242721557617188, "global_step": 2024, "epoch": 16} {"train_loss": -17.831342697143555, "global_step": 2025, "epoch": 16} {"train_loss": -18.13892936706543, "global_step": 2026, "epoch": 16} {"train_loss": -17.509004592895508, "global_step": 2027, "epoch": 16} {"train_loss": -17.761350631713867, "global_step": 2028, "epoch": 16} {"train_loss": -17.674985885620117, "global_step": 2029, "epoch": 16} {"train_loss": -17.580642700195312, "global_step": 2030, "epoch": 16} {"train_loss": -18.120729446411133, "global_step": 2031, "epoch": 16} {"train_loss": -17.13528823852539, "global_step": 2032, "epoch": 16} {"train_loss": -17.95184898376465, "global_step": 2033, "epoch": 16} {"train_loss": -16.91789436340332, "global_step": 2034, "epoch": 16} {"train_loss": -17.972919464111328, "global_step": 2035, "epoch": 16} {"train_loss": -17.08953285217285, "global_step": 2036, "epoch": 16} {"train_loss": -16.77347755432129, "global_step": 2037, "epoch": 16} {"train_loss": -17.402551651000977, "global_step": 2038, "epoch": 16} {"train_loss": -16.54994010925293, "global_step": 2039, "epoch": 16} {"train_loss": -16.788511276245117, "global_step": 2040, "epoch": 16} {"train_loss": -16.63010597229004, "global_step": 2041, "epoch": 16} {"train_loss": -17.30085563659668, "global_step": 2042, "epoch": 16} {"train_loss": -16.778905868530273, "global_step": 2043, "epoch": 16} {"train_loss": -16.92609214782715, "global_step": 2044, "epoch": 16} {"train_loss": -17.35623550415039, "global_step": 2045, "epoch": 16} {"train_loss": -17.115598678588867, "global_step": 2046, "epoch": 16} {"train_loss": -17.158403396606445, "global_step": 2047, "epoch": 16} {"train_loss": -16.87432289123535, "global_step": 2048, "epoch": 16} {"train_loss": -17.328590393066406, "global_step": 2049, "epoch": 16} {"train_loss": -17.45356559753418, "global_step": 2050, "epoch": 16} {"train_loss": -17.672767639160156, "global_step": 2051, "epoch": 16} {"train_loss": -17.668725967407227, "global_step": 2052, "epoch": 16} {"train_loss": -17.85784912109375, "global_step": 2053, "epoch": 16} {"train_loss": -17.534406661987305, "global_step": 2054, "epoch": 16} {"train_loss": -17.80110740661621, "global_step": 2055, "epoch": 16} {"train_loss": -17.455398953650608, "global_step": 2056, "epoch": 16, "val_loss": 2696188.25} {"train_loss": -17.31788444519043, "global_step": 2057, "epoch": 17} {"train_loss": -17.772085189819336, "global_step": 2058, "epoch": 17} {"train_loss": -17.84510612487793, "global_step": 2059, "epoch": 17} {"train_loss": -17.712284088134766, "global_step": 2060, "epoch": 17} {"train_loss": -17.857694625854492, "global_step": 2061, "epoch": 17} {"train_loss": -17.450037002563477, "global_step": 2062, "epoch": 17} {"train_loss": -17.674386978149414, "global_step": 2063, "epoch": 17} {"train_loss": -17.95384407043457, "global_step": 2064, "epoch": 17} {"train_loss": -17.695959091186523, "global_step": 2065, "epoch": 17} {"train_loss": -17.086156845092773, "global_step": 2066, "epoch": 17} {"train_loss": -18.06070899963379, "global_step": 2067, "epoch": 17} {"train_loss": -17.263286590576172, "global_step": 2068, "epoch": 17} {"train_loss": -17.373798370361328, "global_step": 2069, "epoch": 17} {"train_loss": -17.41714096069336, "global_step": 2070, "epoch": 17} {"train_loss": -17.459613800048828, "global_step": 2071, "epoch": 17} {"train_loss": -16.200414657592773, "global_step": 2072, "epoch": 17} {"train_loss": -18.361358642578125, "global_step": 2073, "epoch": 17} {"train_loss": -16.8151912689209, "global_step": 2074, "epoch": 17} {"train_loss": -17.359182357788086, "global_step": 2075, "epoch": 17} {"train_loss": -17.351240158081055, "global_step": 2076, "epoch": 17} {"train_loss": -17.61880874633789, "global_step": 2077, "epoch": 17} {"train_loss": -17.35807228088379, "global_step": 2078, "epoch": 17} {"train_loss": -17.20477867126465, "global_step": 2079, "epoch": 17} {"train_loss": -17.84010887145996, "global_step": 2080, "epoch": 17} {"train_loss": -17.794771194458008, "global_step": 2081, "epoch": 17} {"train_loss": -17.204456329345703, "global_step": 2082, "epoch": 17} {"train_loss": -17.6677188873291, "global_step": 2083, "epoch": 17} {"train_loss": -17.06836700439453, "global_step": 2084, "epoch": 17} {"train_loss": -17.777498245239258, "global_step": 2085, "epoch": 17} {"train_loss": -17.39784812927246, "global_step": 2086, "epoch": 17} {"train_loss": -17.502058029174805, "global_step": 2087, "epoch": 17} {"train_loss": -17.69661521911621, "global_step": 2088, "epoch": 17} {"train_loss": -17.456388473510742, "global_step": 2089, "epoch": 17} {"train_loss": -18.060853958129883, "global_step": 2090, "epoch": 17} {"train_loss": -17.563148498535156, "global_step": 2091, "epoch": 17} {"train_loss": -17.86628532409668, "global_step": 2092, "epoch": 17} {"train_loss": -18.037734985351562, "global_step": 2093, "epoch": 17} {"train_loss": -17.438261032104492, "global_step": 2094, "epoch": 17} {"train_loss": -18.144853591918945, "global_step": 2095, "epoch": 17} {"train_loss": -16.961620330810547, "global_step": 2096, "epoch": 17} {"train_loss": -17.431894302368164, "global_step": 2097, "epoch": 17} {"train_loss": -17.239553451538086, "global_step": 2098, "epoch": 17} {"train_loss": -17.525842666625977, "global_step": 2099, "epoch": 17} {"train_loss": -17.59913444519043, "global_step": 2100, "epoch": 17} {"train_loss": -17.414798736572266, "global_step": 2101, "epoch": 17} {"train_loss": -17.2946720123291, "global_step": 2102, "epoch": 17} {"train_loss": -18.02363395690918, "global_step": 2103, "epoch": 17} {"train_loss": -17.432783126831055, "global_step": 2104, "epoch": 17} {"train_loss": -17.886903762817383, "global_step": 2105, "epoch": 17} {"train_loss": -17.07770347595215, "global_step": 2106, "epoch": 17} {"train_loss": -17.316476821899414, "global_step": 2107, "epoch": 17} {"train_loss": -17.363401412963867, "global_step": 2108, "epoch": 17} {"train_loss": -17.051054000854492, "global_step": 2109, "epoch": 17} {"train_loss": -17.493343353271484, "global_step": 2110, "epoch": 17} {"train_loss": -17.107532501220703, "global_step": 2111, "epoch": 17} {"train_loss": -17.638233184814453, "global_step": 2112, "epoch": 17} {"train_loss": -16.7647762298584, "global_step": 2113, "epoch": 17} {"train_loss": -17.22842788696289, "global_step": 2114, "epoch": 17} {"train_loss": -17.681259155273438, "global_step": 2115, "epoch": 17} {"train_loss": -17.036832809448242, "global_step": 2116, "epoch": 17} {"train_loss": -17.83949089050293, "global_step": 2117, "epoch": 17} {"train_loss": -17.573436737060547, "global_step": 2118, "epoch": 17} {"train_loss": -17.00300407409668, "global_step": 2119, "epoch": 17} {"train_loss": -17.969663619995117, "global_step": 2120, "epoch": 17} {"train_loss": -17.53680419921875, "global_step": 2121, "epoch": 17} {"train_loss": -17.15900230407715, "global_step": 2122, "epoch": 17} {"train_loss": -17.678739547729492, "global_step": 2123, "epoch": 17} {"train_loss": -17.58920669555664, "global_step": 2124, "epoch": 17} {"train_loss": -16.830036163330078, "global_step": 2125, "epoch": 17} {"train_loss": -17.226518630981445, "global_step": 2126, "epoch": 17} {"train_loss": -17.54990005493164, "global_step": 2127, "epoch": 17} {"train_loss": -16.977651596069336, "global_step": 2128, "epoch": 17} {"train_loss": -17.24144744873047, "global_step": 2129, "epoch": 17} {"train_loss": -17.38300895690918, "global_step": 2130, "epoch": 17} {"train_loss": -17.6629581451416, "global_step": 2131, "epoch": 17} {"train_loss": -17.569856643676758, "global_step": 2132, "epoch": 17} {"train_loss": -17.2683048248291, "global_step": 2133, "epoch": 17} {"train_loss": -17.416501998901367, "global_step": 2134, "epoch": 17} {"train_loss": -17.297239303588867, "global_step": 2135, "epoch": 17} {"train_loss": -17.905658721923828, "global_step": 2136, "epoch": 17} {"train_loss": -17.24380874633789, "global_step": 2137, "epoch": 17} {"train_loss": -17.453659057617188, "global_step": 2138, "epoch": 17} {"train_loss": -17.807409286499023, "global_step": 2139, "epoch": 17} {"train_loss": -17.863574981689453, "global_step": 2140, "epoch": 17} {"train_loss": -17.460712432861328, "global_step": 2141, "epoch": 17} {"train_loss": -17.4577579498291, "global_step": 2142, "epoch": 17} {"train_loss": -17.492725372314453, "global_step": 2143, "epoch": 17} {"train_loss": -17.326305389404297, "global_step": 2144, "epoch": 17} {"train_loss": -17.555992126464844, "global_step": 2145, "epoch": 17} {"train_loss": -17.401432037353516, "global_step": 2146, "epoch": 17} {"train_loss": -17.241376876831055, "global_step": 2147, "epoch": 17} {"train_loss": -17.389572143554688, "global_step": 2148, "epoch": 17} {"train_loss": -17.37002944946289, "global_step": 2149, "epoch": 17} {"train_loss": -17.178909301757812, "global_step": 2150, "epoch": 17} {"train_loss": -17.9779109954834, "global_step": 2151, "epoch": 17} {"train_loss": -17.3027400970459, "global_step": 2152, "epoch": 17} {"train_loss": -17.80487060546875, "global_step": 2153, "epoch": 17} {"train_loss": -16.772682189941406, "global_step": 2154, "epoch": 17} {"train_loss": -17.66570281982422, "global_step": 2155, "epoch": 17} {"train_loss": -16.751399993896484, "global_step": 2156, "epoch": 17} {"train_loss": -17.52381706237793, "global_step": 2157, "epoch": 17} {"train_loss": -17.78213119506836, "global_step": 2158, "epoch": 17} {"train_loss": -18.209768295288086, "global_step": 2159, "epoch": 17} {"train_loss": -17.12330436706543, "global_step": 2160, "epoch": 17} {"train_loss": -17.79932975769043, "global_step": 2161, "epoch": 17} {"train_loss": -17.39857292175293, "global_step": 2162, "epoch": 17} {"train_loss": -17.648826599121094, "global_step": 2163, "epoch": 17} {"train_loss": -17.904813766479492, "global_step": 2164, "epoch": 17} {"train_loss": -17.870849609375, "global_step": 2165, "epoch": 17} {"train_loss": -17.62162208557129, "global_step": 2166, "epoch": 17} {"train_loss": -17.54568862915039, "global_step": 2167, "epoch": 17} {"train_loss": -17.824926376342773, "global_step": 2168, "epoch": 17} {"train_loss": -17.938467025756836, "global_step": 2169, "epoch": 17} {"train_loss": -17.9686279296875, "global_step": 2170, "epoch": 17} {"train_loss": -17.609392166137695, "global_step": 2171, "epoch": 17} {"train_loss": -17.952951431274414, "global_step": 2172, "epoch": 17} {"train_loss": -17.716901779174805, "global_step": 2173, "epoch": 17} {"train_loss": -18.02480125427246, "global_step": 2174, "epoch": 17} {"train_loss": -17.51301383972168, "global_step": 2175, "epoch": 17} {"train_loss": -17.88619613647461, "global_step": 2176, "epoch": 17} {"train_loss": -17.5091094813071, "global_step": 2177, "epoch": 17, "val_loss": 3147168.75} {"train_loss": -17.716894149780273, "global_step": 2178, "epoch": 18} {"train_loss": -17.16375732421875, "global_step": 2179, "epoch": 18} {"train_loss": -17.601823806762695, "global_step": 2180, "epoch": 18} {"train_loss": -17.659360885620117, "global_step": 2181, "epoch": 18} {"train_loss": -17.18752098083496, "global_step": 2182, "epoch": 18} {"train_loss": -17.875526428222656, "global_step": 2183, "epoch": 18} {"train_loss": -17.7168025970459, "global_step": 2184, "epoch": 18} {"train_loss": -17.470741271972656, "global_step": 2185, "epoch": 18} {"train_loss": -18.066452026367188, "global_step": 2186, "epoch": 18} {"train_loss": -17.6779842376709, "global_step": 2187, "epoch": 18} {"train_loss": -17.727249145507812, "global_step": 2188, "epoch": 18} {"train_loss": -17.623512268066406, "global_step": 2189, "epoch": 18} {"train_loss": -17.800983428955078, "global_step": 2190, "epoch": 18} {"train_loss": -17.577024459838867, "global_step": 2191, "epoch": 18} {"train_loss": -18.199140548706055, "global_step": 2192, "epoch": 18} {"train_loss": -17.68984031677246, "global_step": 2193, "epoch": 18} {"train_loss": -17.45832633972168, "global_step": 2194, "epoch": 18} {"train_loss": -18.34406089782715, "global_step": 2195, "epoch": 18} {"train_loss": -17.985288619995117, "global_step": 2196, "epoch": 18} {"train_loss": -18.22779655456543, "global_step": 2197, "epoch": 18} {"train_loss": -17.634449005126953, "global_step": 2198, "epoch": 18} {"train_loss": -17.81427001953125, "global_step": 2199, "epoch": 18} {"train_loss": -17.2355899810791, "global_step": 2200, "epoch": 18} {"train_loss": -18.3714656829834, "global_step": 2201, "epoch": 18} {"train_loss": -17.891029357910156, "global_step": 2202, "epoch": 18} {"train_loss": -17.458921432495117, "global_step": 2203, "epoch": 18} {"train_loss": -17.690948486328125, "global_step": 2204, "epoch": 18} {"train_loss": -17.248613357543945, "global_step": 2205, "epoch": 18} {"train_loss": -17.4942626953125, "global_step": 2206, "epoch": 18} {"train_loss": -16.72170639038086, "global_step": 2207, "epoch": 18} {"train_loss": -17.75171661376953, "global_step": 2208, "epoch": 18} {"train_loss": -17.40937614440918, "global_step": 2209, "epoch": 18} {"train_loss": -17.20814323425293, "global_step": 2210, "epoch": 18} {"train_loss": -17.822612762451172, "global_step": 2211, "epoch": 18} {"train_loss": -17.78504180908203, "global_step": 2212, "epoch": 18} {"train_loss": -17.359405517578125, "global_step": 2213, "epoch": 18} {"train_loss": -17.076791763305664, "global_step": 2214, "epoch": 18} {"train_loss": -17.327762603759766, "global_step": 2215, "epoch": 18} {"train_loss": -17.20307159423828, "global_step": 2216, "epoch": 18} {"train_loss": -16.541357040405273, "global_step": 2217, "epoch": 18} {"train_loss": -17.564260482788086, "global_step": 2218, "epoch": 18} {"train_loss": -17.351736068725586, "global_step": 2219, "epoch": 18} {"train_loss": -16.73616600036621, "global_step": 2220, "epoch": 18} {"train_loss": -17.462406158447266, "global_step": 2221, "epoch": 18} {"train_loss": -17.334177017211914, "global_step": 2222, "epoch": 18} {"train_loss": -17.46708106994629, "global_step": 2223, "epoch": 18} {"train_loss": -17.418004989624023, "global_step": 2224, "epoch": 18} {"train_loss": -17.482227325439453, "global_step": 2225, "epoch": 18} {"train_loss": -17.43495750427246, "global_step": 2226, "epoch": 18} {"train_loss": -17.751544952392578, "global_step": 2227, "epoch": 18} {"train_loss": -17.649892807006836, "global_step": 2228, "epoch": 18} {"train_loss": -17.37620735168457, "global_step": 2229, "epoch": 18} {"train_loss": -17.757326126098633, "global_step": 2230, "epoch": 18} {"train_loss": -17.718503952026367, "global_step": 2231, "epoch": 18} {"train_loss": -17.61652946472168, "global_step": 2232, "epoch": 18} {"train_loss": -17.61292266845703, "global_step": 2233, "epoch": 18} {"train_loss": -17.54144287109375, "global_step": 2234, "epoch": 18} {"train_loss": -17.40485191345215, "global_step": 2235, "epoch": 18} {"train_loss": -17.458656311035156, "global_step": 2236, "epoch": 18} {"train_loss": -17.82398796081543, "global_step": 2237, "epoch": 18} {"train_loss": -17.457738876342773, "global_step": 2238, "epoch": 18} {"train_loss": -17.484323501586914, "global_step": 2239, "epoch": 18} {"train_loss": -17.77056312561035, "global_step": 2240, "epoch": 18} {"train_loss": -16.985326766967773, "global_step": 2241, "epoch": 18} {"train_loss": -16.993633270263672, "global_step": 2242, "epoch": 18} {"train_loss": -17.1507625579834, "global_step": 2243, "epoch": 18} {"train_loss": -16.919546127319336, "global_step": 2244, "epoch": 18} {"train_loss": -16.94878387451172, "global_step": 2245, "epoch": 18} {"train_loss": -16.5147762298584, "global_step": 2246, "epoch": 18} {"train_loss": -16.861114501953125, "global_step": 2247, "epoch": 18} {"train_loss": -17.00118064880371, "global_step": 2248, "epoch": 18} {"train_loss": -17.168367385864258, "global_step": 2249, "epoch": 18} {"train_loss": -17.54612159729004, "global_step": 2250, "epoch": 18} {"train_loss": -17.141698837280273, "global_step": 2251, "epoch": 18} {"train_loss": -17.079580307006836, "global_step": 2252, "epoch": 18} {"train_loss": -17.267362594604492, "global_step": 2253, "epoch": 18} {"train_loss": -17.248615264892578, "global_step": 2254, "epoch": 18} {"train_loss": -17.18744659423828, "global_step": 2255, "epoch": 18} {"train_loss": -16.978151321411133, "global_step": 2256, "epoch": 18} {"train_loss": -17.68540382385254, "global_step": 2257, "epoch": 18} {"train_loss": -17.8609676361084, "global_step": 2258, "epoch": 18} {"train_loss": -17.40604591369629, "global_step": 2259, "epoch": 18} {"train_loss": -17.580163955688477, "global_step": 2260, "epoch": 18} {"train_loss": -17.607187271118164, "global_step": 2261, "epoch": 18} {"train_loss": -17.91452407836914, "global_step": 2262, "epoch": 18} {"train_loss": -18.03607177734375, "global_step": 2263, "epoch": 18} {"train_loss": -17.566606521606445, "global_step": 2264, "epoch": 18} {"train_loss": -17.66959571838379, "global_step": 2265, "epoch": 18} {"train_loss": -17.792333602905273, "global_step": 2266, "epoch": 18} {"train_loss": -18.021381378173828, "global_step": 2267, "epoch": 18} {"train_loss": -18.25934410095215, "global_step": 2268, "epoch": 18} {"train_loss": -17.71377944946289, "global_step": 2269, "epoch": 18} {"train_loss": -17.98579216003418, "global_step": 2270, "epoch": 18} {"train_loss": -17.832685470581055, "global_step": 2271, "epoch": 18} {"train_loss": -17.83759117126465, "global_step": 2272, "epoch": 18} {"train_loss": -18.147226333618164, "global_step": 2273, "epoch": 18} {"train_loss": -18.09564781188965, "global_step": 2274, "epoch": 18} {"train_loss": -18.176061630249023, "global_step": 2275, "epoch": 18} {"train_loss": -18.064743041992188, "global_step": 2276, "epoch": 18} {"train_loss": -17.858745574951172, "global_step": 2277, "epoch": 18} {"train_loss": -18.1103515625, "global_step": 2278, "epoch": 18} {"train_loss": -18.201810836791992, "global_step": 2279, "epoch": 18} {"train_loss": -18.12343406677246, "global_step": 2280, "epoch": 18} {"train_loss": -17.76645851135254, "global_step": 2281, "epoch": 18} {"train_loss": -17.928436279296875, "global_step": 2282, "epoch": 18} {"train_loss": -18.087583541870117, "global_step": 2283, "epoch": 18} {"train_loss": -17.88791847229004, "global_step": 2284, "epoch": 18} {"train_loss": -17.646947860717773, "global_step": 2285, "epoch": 18} {"train_loss": -17.794065475463867, "global_step": 2286, "epoch": 18} {"train_loss": -18.339345932006836, "global_step": 2287, "epoch": 18} {"train_loss": -18.172388076782227, "global_step": 2288, "epoch": 18} {"train_loss": -18.432226181030273, "global_step": 2289, "epoch": 18} {"train_loss": -17.43703269958496, "global_step": 2290, "epoch": 18} {"train_loss": -17.50185775756836, "global_step": 2291, "epoch": 18} {"train_loss": -17.5952091217041, "global_step": 2292, "epoch": 18} {"train_loss": -18.252668380737305, "global_step": 2293, "epoch": 18} {"train_loss": -18.30824089050293, "global_step": 2294, "epoch": 18} {"train_loss": -17.54693603515625, "global_step": 2295, "epoch": 18} {"train_loss": -18.30376625061035, "global_step": 2296, "epoch": 18} {"train_loss": -18.119144439697266, "global_step": 2297, "epoch": 18} {"train_loss": -17.62029105572661, "global_step": 2298, "epoch": 18, "val_loss": 2701205.75} {"train_loss": -17.748937606811523, "global_step": 2299, "epoch": 19} {"train_loss": -17.470306396484375, "global_step": 2300, "epoch": 19} {"train_loss": -18.290292739868164, "global_step": 2301, "epoch": 19} {"train_loss": -17.90347671508789, "global_step": 2302, "epoch": 19} {"train_loss": -17.9038143157959, "global_step": 2303, "epoch": 19} {"train_loss": -18.15696907043457, "global_step": 2304, "epoch": 19} {"train_loss": -17.44111442565918, "global_step": 2305, "epoch": 19} {"train_loss": -17.708850860595703, "global_step": 2306, "epoch": 19} {"train_loss": -17.38700294494629, "global_step": 2307, "epoch": 19} {"train_loss": -18.00142478942871, "global_step": 2308, "epoch": 19} {"train_loss": -17.407562255859375, "global_step": 2309, "epoch": 19} {"train_loss": -18.344083786010742, "global_step": 2310, "epoch": 19} {"train_loss": -17.436655044555664, "global_step": 2311, "epoch": 19} {"train_loss": -17.556386947631836, "global_step": 2312, "epoch": 19} {"train_loss": -17.721515655517578, "global_step": 2313, "epoch": 19} {"train_loss": -18.20626449584961, "global_step": 2314, "epoch": 19} {"train_loss": -18.06675148010254, "global_step": 2315, "epoch": 19} {"train_loss": -17.70462989807129, "global_step": 2316, "epoch": 19} {"train_loss": -17.493366241455078, "global_step": 2317, "epoch": 19} {"train_loss": -17.926034927368164, "global_step": 2318, "epoch": 19} {"train_loss": -18.027830123901367, "global_step": 2319, "epoch": 19} {"train_loss": -17.77414321899414, "global_step": 2320, "epoch": 19} {"train_loss": -17.939008712768555, "global_step": 2321, "epoch": 19} {"train_loss": -17.817726135253906, "global_step": 2322, "epoch": 19} {"train_loss": -18.004528045654297, "global_step": 2323, "epoch": 19} {"train_loss": -18.185483932495117, "global_step": 2324, "epoch": 19} {"train_loss": -17.8912410736084, "global_step": 2325, "epoch": 19} {"train_loss": -18.347631454467773, "global_step": 2326, "epoch": 19} {"train_loss": -17.75417709350586, "global_step": 2327, "epoch": 19} {"train_loss": -18.48337745666504, "global_step": 2328, "epoch": 19} {"train_loss": -17.79424476623535, "global_step": 2329, "epoch": 19} {"train_loss": -17.57136344909668, "global_step": 2330, "epoch": 19} {"train_loss": -17.962656021118164, "global_step": 2331, "epoch": 19} {"train_loss": -18.07777214050293, "global_step": 2332, "epoch": 19} {"train_loss": -17.841154098510742, "global_step": 2333, "epoch": 19} {"train_loss": -17.867807388305664, "global_step": 2334, "epoch": 19} {"train_loss": -17.795087814331055, "global_step": 2335, "epoch": 19} {"train_loss": -17.470813751220703, "global_step": 2336, "epoch": 19} {"train_loss": -17.74299430847168, "global_step": 2337, "epoch": 19} {"train_loss": -17.313018798828125, "global_step": 2338, "epoch": 19} {"train_loss": -18.292970657348633, "global_step": 2339, "epoch": 19} {"train_loss": -17.493494033813477, "global_step": 2340, "epoch": 19} {"train_loss": -18.248830795288086, "global_step": 2341, "epoch": 19} {"train_loss": -17.793258666992188, "global_step": 2342, "epoch": 19} {"train_loss": -18.05390739440918, "global_step": 2343, "epoch": 19} {"train_loss": -18.320098876953125, "global_step": 2344, "epoch": 19} {"train_loss": -17.852537155151367, "global_step": 2345, "epoch": 19} {"train_loss": -17.904890060424805, "global_step": 2346, "epoch": 19} {"train_loss": -18.26411247253418, "global_step": 2347, "epoch": 19} {"train_loss": -18.041431427001953, "global_step": 2348, "epoch": 19} {"train_loss": -17.11712074279785, "global_step": 2349, "epoch": 19} {"train_loss": -17.80869483947754, "global_step": 2350, "epoch": 19} {"train_loss": -18.064838409423828, "global_step": 2351, "epoch": 19} {"train_loss": -18.248281478881836, "global_step": 2352, "epoch": 19} {"train_loss": -17.902875900268555, "global_step": 2353, "epoch": 19} {"train_loss": -17.81281280517578, "global_step": 2354, "epoch": 19} {"train_loss": -17.98610496520996, "global_step": 2355, "epoch": 19} {"train_loss": -18.140182495117188, "global_step": 2356, "epoch": 19} {"train_loss": -17.64873695373535, "global_step": 2357, "epoch": 19} {"train_loss": -18.287216186523438, "global_step": 2358, "epoch": 19} {"train_loss": -17.919889450073242, "global_step": 2359, "epoch": 19} {"train_loss": -17.845890045166016, "global_step": 2360, "epoch": 19} {"train_loss": -18.244754791259766, "global_step": 2361, "epoch": 19} {"train_loss": -17.95577049255371, "global_step": 2362, "epoch": 19} {"train_loss": -17.887285232543945, "global_step": 2363, "epoch": 19} {"train_loss": -18.122095108032227, "global_step": 2364, "epoch": 19} {"train_loss": -18.041318893432617, "global_step": 2365, "epoch": 19} {"train_loss": -18.04397964477539, "global_step": 2366, "epoch": 19} {"train_loss": -17.70326042175293, "global_step": 2367, "epoch": 19} {"train_loss": -17.932348251342773, "global_step": 2368, "epoch": 19} {"train_loss": -17.631000518798828, "global_step": 2369, "epoch": 19} {"train_loss": -18.00166130065918, "global_step": 2370, "epoch": 19} {"train_loss": -17.5413761138916, "global_step": 2371, "epoch": 19} {"train_loss": -17.264951705932617, "global_step": 2372, "epoch": 19} {"train_loss": -18.293516159057617, "global_step": 2373, "epoch": 19} {"train_loss": -17.882858276367188, "global_step": 2374, "epoch": 19} {"train_loss": -17.947650909423828, "global_step": 2375, "epoch": 19} {"train_loss": -17.531768798828125, "global_step": 2376, "epoch": 19} {"train_loss": -18.427515029907227, "global_step": 2377, "epoch": 19} {"train_loss": -17.831558227539062, "global_step": 2378, "epoch": 19} {"train_loss": -18.339651107788086, "global_step": 2379, "epoch": 19} {"train_loss": -18.199390411376953, "global_step": 2380, "epoch": 19} {"train_loss": -17.70515251159668, "global_step": 2381, "epoch": 19} {"train_loss": -17.60257339477539, "global_step": 2382, "epoch": 19} {"train_loss": -17.58481216430664, "global_step": 2383, "epoch": 19} {"train_loss": -18.008867263793945, "global_step": 2384, "epoch": 19} {"train_loss": -18.288923263549805, "global_step": 2385, "epoch": 19} {"train_loss": -18.06587028503418, "global_step": 2386, "epoch": 19} {"train_loss": -18.049652099609375, "global_step": 2387, "epoch": 19} {"train_loss": -17.538984298706055, "global_step": 2388, "epoch": 19} {"train_loss": -18.4475154876709, "global_step": 2389, "epoch": 19} {"train_loss": -18.016794204711914, "global_step": 2390, "epoch": 19} {"train_loss": -18.39839744567871, "global_step": 2391, "epoch": 19} {"train_loss": -18.00104331970215, "global_step": 2392, "epoch": 19} {"train_loss": -18.379243850708008, "global_step": 2393, "epoch": 19} {"train_loss": -18.179208755493164, "global_step": 2394, "epoch": 19} {"train_loss": -17.69171142578125, "global_step": 2395, "epoch": 19} {"train_loss": -18.32413101196289, "global_step": 2396, "epoch": 19} {"train_loss": -17.843141555786133, "global_step": 2397, "epoch": 19} {"train_loss": -18.467023849487305, "global_step": 2398, "epoch": 19} {"train_loss": -17.505842208862305, "global_step": 2399, "epoch": 19} {"train_loss": -18.443159103393555, "global_step": 2400, "epoch": 19} {"train_loss": -17.713027954101562, "global_step": 2401, "epoch": 19} {"train_loss": -17.88474464416504, "global_step": 2402, "epoch": 19} {"train_loss": -17.73004150390625, "global_step": 2403, "epoch": 19} {"train_loss": -18.157611846923828, "global_step": 2404, "epoch": 19} {"train_loss": -17.74568748474121, "global_step": 2405, "epoch": 19} {"train_loss": -17.475357055664062, "global_step": 2406, "epoch": 19} {"train_loss": -17.391448974609375, "global_step": 2407, "epoch": 19} {"train_loss": -17.930908203125, "global_step": 2408, "epoch": 19} {"train_loss": -17.336566925048828, "global_step": 2409, "epoch": 19} {"train_loss": -17.759061813354492, "global_step": 2410, "epoch": 19} {"train_loss": -17.550161361694336, "global_step": 2411, "epoch": 19} {"train_loss": -17.873571395874023, "global_step": 2412, "epoch": 19} {"train_loss": -17.6122989654541, "global_step": 2413, "epoch": 19} {"train_loss": -18.23880386352539, "global_step": 2414, "epoch": 19} {"train_loss": -17.766632080078125, "global_step": 2415, "epoch": 19} {"train_loss": -17.57245445251465, "global_step": 2416, "epoch": 19} {"train_loss": -18.07794189453125, "global_step": 2417, "epoch": 19} {"train_loss": -17.856170654296875, "global_step": 2418, "epoch": 19} {"train_loss": -17.893552480650342, "global_step": 2419, "epoch": 19, "val_loss": 2622986.0} {"train_loss": -18.038625717163086, "global_step": 2420, "epoch": 20} {"train_loss": -18.27617835998535, "global_step": 2421, "epoch": 20} {"train_loss": -17.608352661132812, "global_step": 2422, "epoch": 20} {"train_loss": -18.40024185180664, "global_step": 2423, "epoch": 20} {"train_loss": -17.64808464050293, "global_step": 2424, "epoch": 20} {"train_loss": -17.811370849609375, "global_step": 2425, "epoch": 20} {"train_loss": -17.502531051635742, "global_step": 2426, "epoch": 20} {"train_loss": -17.773151397705078, "global_step": 2427, "epoch": 20} {"train_loss": -17.654752731323242, "global_step": 2428, "epoch": 20} {"train_loss": -17.81816291809082, "global_step": 2429, "epoch": 20} {"train_loss": -17.85021209716797, "global_step": 2430, "epoch": 20} {"train_loss": -18.61078453063965, "global_step": 2431, "epoch": 20} {"train_loss": -17.83548355102539, "global_step": 2432, "epoch": 20} {"train_loss": -18.165681838989258, "global_step": 2433, "epoch": 20} {"train_loss": -18.4017391204834, "global_step": 2434, "epoch": 20} {"train_loss": -17.629377365112305, "global_step": 2435, "epoch": 20} {"train_loss": -17.61876678466797, "global_step": 2436, "epoch": 20} {"train_loss": -18.018224716186523, "global_step": 2437, "epoch": 20} {"train_loss": -17.867414474487305, "global_step": 2438, "epoch": 20} {"train_loss": -17.631271362304688, "global_step": 2439, "epoch": 20} {"train_loss": -18.318078994750977, "global_step": 2440, "epoch": 20} {"train_loss": -17.096105575561523, "global_step": 2441, "epoch": 20} {"train_loss": -17.48223876953125, "global_step": 2442, "epoch": 20} {"train_loss": -17.342065811157227, "global_step": 2443, "epoch": 20} {"train_loss": -18.169126510620117, "global_step": 2444, "epoch": 20} {"train_loss": -17.589038848876953, "global_step": 2445, "epoch": 20} {"train_loss": -18.14617919921875, "global_step": 2446, "epoch": 20} {"train_loss": -16.8907413482666, "global_step": 2447, "epoch": 20} {"train_loss": -17.64224624633789, "global_step": 2448, "epoch": 20} {"train_loss": -17.34160614013672, "global_step": 2449, "epoch": 20} {"train_loss": -17.999746322631836, "global_step": 2450, "epoch": 20} {"train_loss": -17.545408248901367, "global_step": 2451, "epoch": 20} {"train_loss": -17.331628799438477, "global_step": 2452, "epoch": 20} {"train_loss": -17.62555694580078, "global_step": 2453, "epoch": 20} {"train_loss": -17.17054557800293, "global_step": 2454, "epoch": 20} {"train_loss": -17.744510650634766, "global_step": 2455, "epoch": 20} {"train_loss": -17.803064346313477, "global_step": 2456, "epoch": 20} {"train_loss": -17.5228271484375, "global_step": 2457, "epoch": 20} {"train_loss": -18.042394638061523, "global_step": 2458, "epoch": 20} {"train_loss": -17.23904800415039, "global_step": 2459, "epoch": 20} {"train_loss": -17.808603286743164, "global_step": 2460, "epoch": 20} {"train_loss": -18.243316650390625, "global_step": 2461, "epoch": 20} {"train_loss": -17.954309463500977, "global_step": 2462, "epoch": 20} {"train_loss": -17.523435592651367, "global_step": 2463, "epoch": 20} {"train_loss": -17.102293014526367, "global_step": 2464, "epoch": 20} {"train_loss": -18.076126098632812, "global_step": 2465, "epoch": 20} {"train_loss": -17.333166122436523, "global_step": 2466, "epoch": 20} {"train_loss": -17.5565128326416, "global_step": 2467, "epoch": 20} {"train_loss": -17.775876998901367, "global_step": 2468, "epoch": 20} {"train_loss": -18.023244857788086, "global_step": 2469, "epoch": 20} {"train_loss": -17.819217681884766, "global_step": 2470, "epoch": 20} {"train_loss": -17.717926025390625, "global_step": 2471, "epoch": 20} {"train_loss": -17.626081466674805, "global_step": 2472, "epoch": 20} {"train_loss": -18.069568634033203, "global_step": 2473, "epoch": 20} {"train_loss": -17.25701904296875, "global_step": 2474, "epoch": 20} {"train_loss": -17.759536743164062, "global_step": 2475, "epoch": 20} {"train_loss": -17.79361915588379, "global_step": 2476, "epoch": 20} {"train_loss": -17.752384185791016, "global_step": 2477, "epoch": 20} {"train_loss": -17.949628829956055, "global_step": 2478, "epoch": 20} {"train_loss": -18.226177215576172, "global_step": 2479, "epoch": 20} {"train_loss": -18.421886444091797, "global_step": 2480, "epoch": 20} {"train_loss": -18.230581283569336, "global_step": 2481, "epoch": 20} {"train_loss": -18.319643020629883, "global_step": 2482, "epoch": 20} {"train_loss": -18.442378997802734, "global_step": 2483, "epoch": 20} {"train_loss": -17.52345848083496, "global_step": 2484, "epoch": 20} {"train_loss": -17.945127487182617, "global_step": 2485, "epoch": 20} {"train_loss": -18.24947166442871, "global_step": 2486, "epoch": 20} {"train_loss": -18.084217071533203, "global_step": 2487, "epoch": 20} {"train_loss": -18.213720321655273, "global_step": 2488, "epoch": 20} {"train_loss": -17.97096824645996, "global_step": 2489, "epoch": 20} {"train_loss": -18.059865951538086, "global_step": 2490, "epoch": 20} {"train_loss": -18.20928192138672, "global_step": 2491, "epoch": 20} {"train_loss": -17.82819938659668, "global_step": 2492, "epoch": 20} {"train_loss": -18.778759002685547, "global_step": 2493, "epoch": 20} {"train_loss": -18.056636810302734, "global_step": 2494, "epoch": 20} {"train_loss": -18.317609786987305, "global_step": 2495, "epoch": 20} {"train_loss": -18.07472038269043, "global_step": 2496, "epoch": 20} {"train_loss": -18.787866592407227, "global_step": 2497, "epoch": 20} {"train_loss": -18.052621841430664, "global_step": 2498, "epoch": 20} {"train_loss": -18.376724243164062, "global_step": 2499, "epoch": 20} {"train_loss": -17.602407455444336, "global_step": 2500, "epoch": 20} {"train_loss": -18.48682975769043, "global_step": 2501, "epoch": 20} {"train_loss": -17.917455673217773, "global_step": 2502, "epoch": 20} {"train_loss": -18.08377456665039, "global_step": 2503, "epoch": 20} {"train_loss": -18.61326789855957, "global_step": 2504, "epoch": 20} {"train_loss": -17.814773559570312, "global_step": 2505, "epoch": 20} {"train_loss": -18.486906051635742, "global_step": 2506, "epoch": 20} {"train_loss": -18.325115203857422, "global_step": 2507, "epoch": 20} {"train_loss": -18.31144905090332, "global_step": 2508, "epoch": 20} {"train_loss": -17.94945526123047, "global_step": 2509, "epoch": 20} {"train_loss": -18.000890731811523, "global_step": 2510, "epoch": 20} {"train_loss": -17.263059616088867, "global_step": 2511, "epoch": 20} {"train_loss": -18.27655601501465, "global_step": 2512, "epoch": 20} {"train_loss": -18.203760147094727, "global_step": 2513, "epoch": 20} {"train_loss": -17.741989135742188, "global_step": 2514, "epoch": 20} {"train_loss": -17.73682975769043, "global_step": 2515, "epoch": 20} {"train_loss": -17.650989532470703, "global_step": 2516, "epoch": 20} {"train_loss": -17.677417755126953, "global_step": 2517, "epoch": 20} {"train_loss": -17.366413116455078, "global_step": 2518, "epoch": 20} {"train_loss": -17.958040237426758, "global_step": 2519, "epoch": 20} {"train_loss": -17.857261657714844, "global_step": 2520, "epoch": 20} {"train_loss": -18.116008758544922, "global_step": 2521, "epoch": 20} {"train_loss": -17.880346298217773, "global_step": 2522, "epoch": 20} {"train_loss": -17.763044357299805, "global_step": 2523, "epoch": 20} {"train_loss": -18.408437728881836, "global_step": 2524, "epoch": 20} {"train_loss": -17.3728084564209, "global_step": 2525, "epoch": 20} {"train_loss": -18.095434188842773, "global_step": 2526, "epoch": 20} {"train_loss": -17.74741554260254, "global_step": 2527, "epoch": 20} {"train_loss": -18.06902503967285, "global_step": 2528, "epoch": 20} {"train_loss": -18.410749435424805, "global_step": 2529, "epoch": 20} {"train_loss": -17.79790496826172, "global_step": 2530, "epoch": 20} {"train_loss": -18.424015045166016, "global_step": 2531, "epoch": 20} {"train_loss": -18.4108943939209, "global_step": 2532, "epoch": 20} {"train_loss": -18.33159828186035, "global_step": 2533, "epoch": 20} {"train_loss": -17.996782302856445, "global_step": 2534, "epoch": 20} {"train_loss": -17.95030403137207, "global_step": 2535, "epoch": 20} {"train_loss": -18.045969009399414, "global_step": 2536, "epoch": 20} {"train_loss": -18.596620559692383, "global_step": 2537, "epoch": 20} {"train_loss": -18.398681640625, "global_step": 2538, "epoch": 20} {"train_loss": -18.424640655517578, "global_step": 2539, "epoch": 20} {"train_loss": -17.929552188589554, "global_step": 2540, "epoch": 20, "val_loss": 2950527.75} {"train_loss": -18.164470672607422, "global_step": 2541, "epoch": 21} {"train_loss": -17.617422103881836, "global_step": 2542, "epoch": 21} {"train_loss": -18.29982566833496, "global_step": 2543, "epoch": 21} {"train_loss": -17.951908111572266, "global_step": 2544, "epoch": 21} {"train_loss": -18.215158462524414, "global_step": 2545, "epoch": 21} {"train_loss": -18.169382095336914, "global_step": 2546, "epoch": 21} {"train_loss": -18.02956771850586, "global_step": 2547, "epoch": 21} {"train_loss": -17.828815460205078, "global_step": 2548, "epoch": 21} {"train_loss": -18.222003936767578, "global_step": 2549, "epoch": 21} {"train_loss": -17.890661239624023, "global_step": 2550, "epoch": 21} {"train_loss": -18.134519577026367, "global_step": 2551, "epoch": 21} {"train_loss": -18.03904151916504, "global_step": 2552, "epoch": 21} {"train_loss": -17.977293014526367, "global_step": 2553, "epoch": 21} {"train_loss": -18.4638671875, "global_step": 2554, "epoch": 21} {"train_loss": -18.055805206298828, "global_step": 2555, "epoch": 21} {"train_loss": -18.415172576904297, "global_step": 2556, "epoch": 21} {"train_loss": -18.154600143432617, "global_step": 2557, "epoch": 21} {"train_loss": -18.433958053588867, "global_step": 2558, "epoch": 21} {"train_loss": -17.98268699645996, "global_step": 2559, "epoch": 21} {"train_loss": -18.42287254333496, "global_step": 2560, "epoch": 21} {"train_loss": -17.966245651245117, "global_step": 2561, "epoch": 21} {"train_loss": -18.59370231628418, "global_step": 2562, "epoch": 21} {"train_loss": -17.74534797668457, "global_step": 2563, "epoch": 21} {"train_loss": -18.330198287963867, "global_step": 2564, "epoch": 21} {"train_loss": -18.455890655517578, "global_step": 2565, "epoch": 21} {"train_loss": -17.989988327026367, "global_step": 2566, "epoch": 21} {"train_loss": -18.19977569580078, "global_step": 2567, "epoch": 21} {"train_loss": -18.237457275390625, "global_step": 2568, "epoch": 21} {"train_loss": -18.22861099243164, "global_step": 2569, "epoch": 21} {"train_loss": -18.231109619140625, "global_step": 2570, "epoch": 21} {"train_loss": -18.130102157592773, "global_step": 2571, "epoch": 21} {"train_loss": -17.77670669555664, "global_step": 2572, "epoch": 21} {"train_loss": -17.84659194946289, "global_step": 2573, "epoch": 21} {"train_loss": -17.691444396972656, "global_step": 2574, "epoch": 21} {"train_loss": -17.990880966186523, "global_step": 2575, "epoch": 21} {"train_loss": -18.186386108398438, "global_step": 2576, "epoch": 21} {"train_loss": -18.33416175842285, "global_step": 2577, "epoch": 21} {"train_loss": -17.89609718322754, "global_step": 2578, "epoch": 21} {"train_loss": -18.48358726501465, "global_step": 2579, "epoch": 21} {"train_loss": -18.627578735351562, "global_step": 2580, "epoch": 21} {"train_loss": -18.336523056030273, "global_step": 2581, "epoch": 21} {"train_loss": -18.15581512451172, "global_step": 2582, "epoch": 21} {"train_loss": -18.2847900390625, "global_step": 2583, "epoch": 21} {"train_loss": -18.086389541625977, "global_step": 2584, "epoch": 21} {"train_loss": -17.67333984375, "global_step": 2585, "epoch": 21} {"train_loss": -17.770158767700195, "global_step": 2586, "epoch": 21} {"train_loss": -18.1483097076416, "global_step": 2587, "epoch": 21} {"train_loss": -17.28218650817871, "global_step": 2588, "epoch": 21} {"train_loss": -18.566181182861328, "global_step": 2589, "epoch": 21} {"train_loss": -17.452272415161133, "global_step": 2590, "epoch": 21} {"train_loss": -18.343759536743164, "global_step": 2591, "epoch": 21} {"train_loss": -17.695926666259766, "global_step": 2592, "epoch": 21} {"train_loss": -18.18112564086914, "global_step": 2593, "epoch": 21} {"train_loss": -17.385265350341797, "global_step": 2594, "epoch": 21} {"train_loss": -18.362796783447266, "global_step": 2595, "epoch": 21} {"train_loss": -18.005935668945312, "global_step": 2596, "epoch": 21} {"train_loss": -18.068822860717773, "global_step": 2597, "epoch": 21} {"train_loss": -17.6234188079834, "global_step": 2598, "epoch": 21} {"train_loss": -18.24349021911621, "global_step": 2599, "epoch": 21} {"train_loss": -18.311132431030273, "global_step": 2600, "epoch": 21} {"train_loss": -17.85795021057129, "global_step": 2601, "epoch": 21} {"train_loss": -18.301315307617188, "global_step": 2602, "epoch": 21} {"train_loss": -18.313095092773438, "global_step": 2603, "epoch": 21} {"train_loss": -17.796096801757812, "global_step": 2604, "epoch": 21} {"train_loss": -18.002277374267578, "global_step": 2605, "epoch": 21} {"train_loss": -17.7667179107666, "global_step": 2606, "epoch": 21} {"train_loss": -18.592187881469727, "global_step": 2607, "epoch": 21} {"train_loss": -18.395780563354492, "global_step": 2608, "epoch": 21} {"train_loss": -18.569061279296875, "global_step": 2609, "epoch": 21} {"train_loss": -17.96307373046875, "global_step": 2610, "epoch": 21} {"train_loss": -18.522846221923828, "global_step": 2611, "epoch": 21} {"train_loss": -18.199462890625, "global_step": 2612, "epoch": 21} {"train_loss": -17.828292846679688, "global_step": 2613, "epoch": 21} {"train_loss": -18.353151321411133, "global_step": 2614, "epoch": 21} {"train_loss": -18.217578887939453, "global_step": 2615, "epoch": 21} {"train_loss": -18.39697265625, "global_step": 2616, "epoch": 21} {"train_loss": -18.197399139404297, "global_step": 2617, "epoch": 21} {"train_loss": -18.37171173095703, "global_step": 2618, "epoch": 21} {"train_loss": -18.517133712768555, "global_step": 2619, "epoch": 21} {"train_loss": -18.24134635925293, "global_step": 2620, "epoch": 21} {"train_loss": -18.116151809692383, "global_step": 2621, "epoch": 21} {"train_loss": -17.705278396606445, "global_step": 2622, "epoch": 21} {"train_loss": -17.680830001831055, "global_step": 2623, "epoch": 21} {"train_loss": -18.311765670776367, "global_step": 2624, "epoch": 21} {"train_loss": -18.39208984375, "global_step": 2625, "epoch": 21} {"train_loss": -18.39323616027832, "global_step": 2626, "epoch": 21} {"train_loss": -18.47369384765625, "global_step": 2627, "epoch": 21} {"train_loss": -18.361005783081055, "global_step": 2628, "epoch": 21} {"train_loss": -18.49356460571289, "global_step": 2629, "epoch": 21} {"train_loss": -17.97962188720703, "global_step": 2630, "epoch": 21} {"train_loss": -18.87826919555664, "global_step": 2631, "epoch": 21} {"train_loss": -18.615890502929688, "global_step": 2632, "epoch": 21} {"train_loss": -18.335140228271484, "global_step": 2633, "epoch": 21} {"train_loss": -18.418853759765625, "global_step": 2634, "epoch": 21} {"train_loss": -18.356403350830078, "global_step": 2635, "epoch": 21} {"train_loss": -18.571176528930664, "global_step": 2636, "epoch": 21} {"train_loss": -17.987886428833008, "global_step": 2637, "epoch": 21} {"train_loss": -18.214750289916992, "global_step": 2638, "epoch": 21} {"train_loss": -18.079153060913086, "global_step": 2639, "epoch": 21} {"train_loss": -18.136606216430664, "global_step": 2640, "epoch": 21} {"train_loss": -18.493560791015625, "global_step": 2641, "epoch": 21} {"train_loss": -18.561670303344727, "global_step": 2642, "epoch": 21} {"train_loss": -18.51861572265625, "global_step": 2643, "epoch": 21} {"train_loss": -18.509109497070312, "global_step": 2644, "epoch": 21} {"train_loss": -18.156875610351562, "global_step": 2645, "epoch": 21} {"train_loss": -18.655609130859375, "global_step": 2646, "epoch": 21} {"train_loss": -17.933364868164062, "global_step": 2647, "epoch": 21} {"train_loss": -18.117223739624023, "global_step": 2648, "epoch": 21} {"train_loss": -18.37158203125, "global_step": 2649, "epoch": 21} {"train_loss": -18.457447052001953, "global_step": 2650, "epoch": 21} {"train_loss": -18.555784225463867, "global_step": 2651, "epoch": 21} {"train_loss": -18.025266647338867, "global_step": 2652, "epoch": 21} {"train_loss": -17.880754470825195, "global_step": 2653, "epoch": 21} {"train_loss": -18.44618797302246, "global_step": 2654, "epoch": 21} {"train_loss": -18.03573226928711, "global_step": 2655, "epoch": 21} {"train_loss": -18.42096710205078, "global_step": 2656, "epoch": 21} {"train_loss": -18.470678329467773, "global_step": 2657, "epoch": 21} {"train_loss": -18.535654067993164, "global_step": 2658, "epoch": 21} {"train_loss": -18.511554718017578, "global_step": 2659, "epoch": 21} {"train_loss": -17.904272079467773, "global_step": 2660, "epoch": 21} {"train_loss": -18.185902398479872, "global_step": 2661, "epoch": 21, "val_loss": 2902490.75} {"train_loss": -18.320405960083008, "global_step": 2662, "epoch": 22} {"train_loss": -18.644079208374023, "global_step": 2663, "epoch": 22} {"train_loss": -18.1319580078125, "global_step": 2664, "epoch": 22} {"train_loss": -18.87183952331543, "global_step": 2665, "epoch": 22} {"train_loss": -18.40474510192871, "global_step": 2666, "epoch": 22} {"train_loss": -18.806480407714844, "global_step": 2667, "epoch": 22} {"train_loss": -18.214101791381836, "global_step": 2668, "epoch": 22} {"train_loss": -18.103622436523438, "global_step": 2669, "epoch": 22} {"train_loss": -18.40370750427246, "global_step": 2670, "epoch": 22} {"train_loss": -18.575183868408203, "global_step": 2671, "epoch": 22} {"train_loss": -18.38326644897461, "global_step": 2672, "epoch": 22} {"train_loss": -18.581825256347656, "global_step": 2673, "epoch": 22} {"train_loss": -18.198694229125977, "global_step": 2674, "epoch": 22} {"train_loss": -18.43450355529785, "global_step": 2675, "epoch": 22} {"train_loss": -18.844783782958984, "global_step": 2676, "epoch": 22} {"train_loss": -18.37371253967285, "global_step": 2677, "epoch": 22} {"train_loss": -18.785429000854492, "global_step": 2678, "epoch": 22} {"train_loss": -17.73885154724121, "global_step": 2679, "epoch": 22} {"train_loss": -17.576749801635742, "global_step": 2680, "epoch": 22} {"train_loss": -17.346078872680664, "global_step": 2681, "epoch": 22} {"train_loss": -18.02968406677246, "global_step": 2682, "epoch": 22} {"train_loss": -17.44767951965332, "global_step": 2683, "epoch": 22} {"train_loss": -18.003816604614258, "global_step": 2684, "epoch": 22} {"train_loss": -17.985410690307617, "global_step": 2685, "epoch": 22} {"train_loss": -17.608379364013672, "global_step": 2686, "epoch": 22} {"train_loss": -18.020029067993164, "global_step": 2687, "epoch": 22} {"train_loss": -17.053234100341797, "global_step": 2688, "epoch": 22} {"train_loss": -17.772701263427734, "global_step": 2689, "epoch": 22} {"train_loss": -18.061986923217773, "global_step": 2690, "epoch": 22} {"train_loss": -18.079191207885742, "global_step": 2691, "epoch": 22} {"train_loss": -18.083154678344727, "global_step": 2692, "epoch": 22} {"train_loss": -17.696340560913086, "global_step": 2693, "epoch": 22} {"train_loss": -18.1001033782959, "global_step": 2694, "epoch": 22} {"train_loss": -18.23990821838379, "global_step": 2695, "epoch": 22} {"train_loss": -17.629018783569336, "global_step": 2696, "epoch": 22} {"train_loss": -18.23201560974121, "global_step": 2697, "epoch": 22} {"train_loss": -18.145687103271484, "global_step": 2698, "epoch": 22} {"train_loss": -17.884254455566406, "global_step": 2699, "epoch": 22} {"train_loss": -18.316162109375, "global_step": 2700, "epoch": 22} {"train_loss": -18.023313522338867, "global_step": 2701, "epoch": 22} {"train_loss": -18.13203239440918, "global_step": 2702, "epoch": 22} {"train_loss": -18.40964126586914, "global_step": 2703, "epoch": 22} {"train_loss": -17.59611701965332, "global_step": 2704, "epoch": 22} {"train_loss": -17.66696548461914, "global_step": 2705, "epoch": 22} {"train_loss": -17.90848159790039, "global_step": 2706, "epoch": 22} {"train_loss": -17.35848045349121, "global_step": 2707, "epoch": 22} {"train_loss": -17.346540451049805, "global_step": 2708, "epoch": 22} {"train_loss": -18.44788932800293, "global_step": 2709, "epoch": 22} {"train_loss": -17.8747615814209, "global_step": 2710, "epoch": 22} {"train_loss": -18.16002655029297, "global_step": 2711, "epoch": 22} {"train_loss": -17.91591453552246, "global_step": 2712, "epoch": 22} {"train_loss": -18.37679100036621, "global_step": 2713, "epoch": 22} {"train_loss": -18.141149520874023, "global_step": 2714, "epoch": 22} {"train_loss": -18.240726470947266, "global_step": 2715, "epoch": 22} {"train_loss": -18.432600021362305, "global_step": 2716, "epoch": 22} {"train_loss": -17.97504997253418, "global_step": 2717, "epoch": 22} {"train_loss": -18.143966674804688, "global_step": 2718, "epoch": 22} {"train_loss": -18.223875045776367, "global_step": 2719, "epoch": 22} {"train_loss": -18.0625, "global_step": 2720, "epoch": 22} {"train_loss": -18.28797721862793, "global_step": 2721, "epoch": 22} {"train_loss": -18.394269943237305, "global_step": 2722, "epoch": 22} {"train_loss": -18.155309677124023, "global_step": 2723, "epoch": 22} {"train_loss": -18.317737579345703, "global_step": 2724, "epoch": 22} {"train_loss": -18.097646713256836, "global_step": 2725, "epoch": 22} {"train_loss": -18.501081466674805, "global_step": 2726, "epoch": 22} {"train_loss": -18.055591583251953, "global_step": 2727, "epoch": 22} {"train_loss": -18.273162841796875, "global_step": 2728, "epoch": 22} {"train_loss": -18.81203269958496, "global_step": 2729, "epoch": 22} {"train_loss": -18.629657745361328, "global_step": 2730, "epoch": 22} {"train_loss": -18.77373695373535, "global_step": 2731, "epoch": 22} {"train_loss": -17.991439819335938, "global_step": 2732, "epoch": 22} {"train_loss": -18.267292022705078, "global_step": 2733, "epoch": 22} {"train_loss": -18.290864944458008, "global_step": 2734, "epoch": 22} {"train_loss": -18.838918685913086, "global_step": 2735, "epoch": 22} {"train_loss": -18.367122650146484, "global_step": 2736, "epoch": 22} {"train_loss": -18.50923728942871, "global_step": 2737, "epoch": 22} {"train_loss": -18.638614654541016, "global_step": 2738, "epoch": 22} {"train_loss": -17.5170955657959, "global_step": 2739, "epoch": 22} {"train_loss": -17.338472366333008, "global_step": 2740, "epoch": 22} {"train_loss": -17.402481079101562, "global_step": 2741, "epoch": 22} {"train_loss": -17.96215057373047, "global_step": 2742, "epoch": 22} {"train_loss": -18.133222579956055, "global_step": 2743, "epoch": 22} {"train_loss": -17.80811309814453, "global_step": 2744, "epoch": 22} {"train_loss": -17.94532585144043, "global_step": 2745, "epoch": 22} {"train_loss": -17.475439071655273, "global_step": 2746, "epoch": 22} {"train_loss": -17.655364990234375, "global_step": 2747, "epoch": 22} {"train_loss": -18.259265899658203, "global_step": 2748, "epoch": 22} {"train_loss": -17.801753997802734, "global_step": 2749, "epoch": 22} {"train_loss": -17.558095932006836, "global_step": 2750, "epoch": 22} {"train_loss": -18.499425888061523, "global_step": 2751, "epoch": 22} {"train_loss": -18.12766456604004, "global_step": 2752, "epoch": 22} {"train_loss": -18.311420440673828, "global_step": 2753, "epoch": 22} {"train_loss": -18.395755767822266, "global_step": 2754, "epoch": 22} {"train_loss": -18.22885513305664, "global_step": 2755, "epoch": 22} {"train_loss": -17.934463500976562, "global_step": 2756, "epoch": 22} {"train_loss": -18.13298988342285, "global_step": 2757, "epoch": 22} {"train_loss": -17.74896240234375, "global_step": 2758, "epoch": 22} {"train_loss": -17.798748016357422, "global_step": 2759, "epoch": 22} {"train_loss": -18.521512985229492, "global_step": 2760, "epoch": 22} {"train_loss": -18.342012405395508, "global_step": 2761, "epoch": 22} {"train_loss": -18.269460678100586, "global_step": 2762, "epoch": 22} {"train_loss": -18.53619956970215, "global_step": 2763, "epoch": 22} {"train_loss": -18.43128776550293, "global_step": 2764, "epoch": 22} {"train_loss": -18.359586715698242, "global_step": 2765, "epoch": 22} {"train_loss": -18.531034469604492, "global_step": 2766, "epoch": 22} {"train_loss": -18.734420776367188, "global_step": 2767, "epoch": 22} {"train_loss": -18.524023056030273, "global_step": 2768, "epoch": 22} {"train_loss": -18.248571395874023, "global_step": 2769, "epoch": 22} {"train_loss": -18.411027908325195, "global_step": 2770, "epoch": 22} {"train_loss": -18.252286911010742, "global_step": 2771, "epoch": 22} {"train_loss": -18.274185180664062, "global_step": 2772, "epoch": 22} {"train_loss": -17.98053550720215, "global_step": 2773, "epoch": 22} {"train_loss": -18.215911865234375, "global_step": 2774, "epoch": 22} {"train_loss": -18.029157638549805, "global_step": 2775, "epoch": 22} {"train_loss": -18.35504722595215, "global_step": 2776, "epoch": 22} {"train_loss": -18.59852409362793, "global_step": 2777, "epoch": 22} {"train_loss": -18.504207611083984, "global_step": 2778, "epoch": 22} {"train_loss": -18.478422164916992, "global_step": 2779, "epoch": 22} {"train_loss": -18.21489906311035, "global_step": 2780, "epoch": 22} {"train_loss": -18.073246002197266, "global_step": 2781, "epoch": 22} {"train_loss": -18.15922035658655, "global_step": 2782, "epoch": 22, "val_loss": 2850214.25} {"train_loss": -18.650737762451172, "global_step": 2783, "epoch": 23} {"train_loss": -18.263277053833008, "global_step": 2784, "epoch": 23} {"train_loss": -18.38128662109375, "global_step": 2785, "epoch": 23} {"train_loss": -18.547317504882812, "global_step": 2786, "epoch": 23} {"train_loss": -18.58660125732422, "global_step": 2787, "epoch": 23} {"train_loss": -18.75072479248047, "global_step": 2788, "epoch": 23} {"train_loss": -18.651165008544922, "global_step": 2789, "epoch": 23} {"train_loss": -18.569351196289062, "global_step": 2790, "epoch": 23} {"train_loss": -18.812171936035156, "global_step": 2791, "epoch": 23} {"train_loss": -19.4898738861084, "global_step": 2792, "epoch": 23} {"train_loss": -18.504545211791992, "global_step": 2793, "epoch": 23} {"train_loss": -18.703725814819336, "global_step": 2794, "epoch": 23} {"train_loss": -18.94916534423828, "global_step": 2795, "epoch": 23} {"train_loss": -18.42681312561035, "global_step": 2796, "epoch": 23} {"train_loss": -18.63764762878418, "global_step": 2797, "epoch": 23} {"train_loss": -18.67816734313965, "global_step": 2798, "epoch": 23} {"train_loss": -18.857276916503906, "global_step": 2799, "epoch": 23} {"train_loss": -18.969993591308594, "global_step": 2800, "epoch": 23} {"train_loss": -18.836978912353516, "global_step": 2801, "epoch": 23} {"train_loss": -18.28679656982422, "global_step": 2802, "epoch": 23} {"train_loss": -17.849567413330078, "global_step": 2803, "epoch": 23} {"train_loss": -18.652332305908203, "global_step": 2804, "epoch": 23} {"train_loss": -18.621362686157227, "global_step": 2805, "epoch": 23} {"train_loss": -18.19962501525879, "global_step": 2806, "epoch": 23} {"train_loss": -18.4814510345459, "global_step": 2807, "epoch": 23} {"train_loss": -18.427814483642578, "global_step": 2808, "epoch": 23} {"train_loss": -18.499561309814453, "global_step": 2809, "epoch": 23} {"train_loss": -18.40563201904297, "global_step": 2810, "epoch": 23} {"train_loss": -18.273563385009766, "global_step": 2811, "epoch": 23} {"train_loss": -18.221834182739258, "global_step": 2812, "epoch": 23} {"train_loss": -18.458744049072266, "global_step": 2813, "epoch": 23} {"train_loss": -17.849002838134766, "global_step": 2814, "epoch": 23} {"train_loss": -18.86444091796875, "global_step": 2815, "epoch": 23} {"train_loss": -18.74880599975586, "global_step": 2816, "epoch": 23} {"train_loss": -19.049163818359375, "global_step": 2817, "epoch": 23} {"train_loss": -17.995817184448242, "global_step": 2818, "epoch": 23} {"train_loss": -18.842737197875977, "global_step": 2819, "epoch": 23} {"train_loss": -18.1637020111084, "global_step": 2820, "epoch": 23} {"train_loss": -18.98682975769043, "global_step": 2821, "epoch": 23} {"train_loss": -18.236644744873047, "global_step": 2822, "epoch": 23} {"train_loss": -18.331533432006836, "global_step": 2823, "epoch": 23} {"train_loss": -18.17774772644043, "global_step": 2824, "epoch": 23} {"train_loss": -18.15938377380371, "global_step": 2825, "epoch": 23} {"train_loss": -18.29300880432129, "global_step": 2826, "epoch": 23} {"train_loss": -18.268878936767578, "global_step": 2827, "epoch": 23} {"train_loss": -18.729473114013672, "global_step": 2828, "epoch": 23} {"train_loss": -18.162311553955078, "global_step": 2829, "epoch": 23} {"train_loss": -18.694913864135742, "global_step": 2830, "epoch": 23} {"train_loss": -18.119970321655273, "global_step": 2831, "epoch": 23} {"train_loss": -18.729520797729492, "global_step": 2832, "epoch": 23} {"train_loss": -18.403152465820312, "global_step": 2833, "epoch": 23} {"train_loss": -18.65711212158203, "global_step": 2834, "epoch": 23} {"train_loss": -18.784521102905273, "global_step": 2835, "epoch": 23} {"train_loss": -18.301244735717773, "global_step": 2836, "epoch": 23} {"train_loss": -18.42705535888672, "global_step": 2837, "epoch": 23} {"train_loss": -17.854230880737305, "global_step": 2838, "epoch": 23} {"train_loss": -18.63007926940918, "global_step": 2839, "epoch": 23} {"train_loss": -18.857269287109375, "global_step": 2840, "epoch": 23} {"train_loss": -18.744232177734375, "global_step": 2841, "epoch": 23} {"train_loss": -18.60418128967285, "global_step": 2842, "epoch": 23} {"train_loss": -18.77065086364746, "global_step": 2843, "epoch": 23} {"train_loss": -18.305845260620117, "global_step": 2844, "epoch": 23} {"train_loss": -18.884130477905273, "global_step": 2845, "epoch": 23} {"train_loss": -18.751585006713867, "global_step": 2846, "epoch": 23} {"train_loss": -18.44605827331543, "global_step": 2847, "epoch": 23} {"train_loss": -19.012863159179688, "global_step": 2848, "epoch": 23} {"train_loss": -18.457002639770508, "global_step": 2849, "epoch": 23} {"train_loss": -18.40467643737793, "global_step": 2850, "epoch": 23} {"train_loss": -18.423635482788086, "global_step": 2851, "epoch": 23} {"train_loss": -18.201826095581055, "global_step": 2852, "epoch": 23} {"train_loss": -18.80280303955078, "global_step": 2853, "epoch": 23} {"train_loss": -17.45477867126465, "global_step": 2854, "epoch": 23} {"train_loss": -18.455781936645508, "global_step": 2855, "epoch": 23} {"train_loss": -18.55549430847168, "global_step": 2856, "epoch": 23} {"train_loss": -19.06510353088379, "global_step": 2857, "epoch": 23} {"train_loss": -18.038053512573242, "global_step": 2858, "epoch": 23} {"train_loss": -17.1807918548584, "global_step": 2859, "epoch": 23} {"train_loss": -18.577978134155273, "global_step": 2860, "epoch": 23} {"train_loss": -17.979969024658203, "global_step": 2861, "epoch": 23} {"train_loss": -18.27948570251465, "global_step": 2862, "epoch": 23} {"train_loss": -18.48818588256836, "global_step": 2863, "epoch": 23} {"train_loss": -18.22913932800293, "global_step": 2864, "epoch": 23} {"train_loss": -18.445322036743164, "global_step": 2865, "epoch": 23} {"train_loss": -18.43881607055664, "global_step": 2866, "epoch": 23} {"train_loss": -18.58413314819336, "global_step": 2867, "epoch": 23} {"train_loss": -18.228946685791016, "global_step": 2868, "epoch": 23} {"train_loss": -18.331525802612305, "global_step": 2869, "epoch": 23} {"train_loss": -17.996912002563477, "global_step": 2870, "epoch": 23} {"train_loss": -18.791357040405273, "global_step": 2871, "epoch": 23} {"train_loss": -18.301151275634766, "global_step": 2872, "epoch": 23} {"train_loss": -18.264476776123047, "global_step": 2873, "epoch": 23} {"train_loss": -18.276596069335938, "global_step": 2874, "epoch": 23} {"train_loss": -18.23485565185547, "global_step": 2875, "epoch": 23} {"train_loss": -18.87033462524414, "global_step": 2876, "epoch": 23} {"train_loss": -18.649023056030273, "global_step": 2877, "epoch": 23} {"train_loss": -18.524066925048828, "global_step": 2878, "epoch": 23} {"train_loss": -18.392539978027344, "global_step": 2879, "epoch": 23} {"train_loss": -18.440420150756836, "global_step": 2880, "epoch": 23} {"train_loss": -17.840845108032227, "global_step": 2881, "epoch": 23} {"train_loss": -18.8717041015625, "global_step": 2882, "epoch": 23} {"train_loss": -18.64753532409668, "global_step": 2883, "epoch": 23} {"train_loss": -18.753751754760742, "global_step": 2884, "epoch": 23} {"train_loss": -17.856706619262695, "global_step": 2885, "epoch": 23} {"train_loss": -18.36337661743164, "global_step": 2886, "epoch": 23} {"train_loss": -18.9755859375, "global_step": 2887, "epoch": 23} {"train_loss": -18.58518409729004, "global_step": 2888, "epoch": 23} {"train_loss": -18.929107666015625, "global_step": 2889, "epoch": 23} {"train_loss": -18.71051025390625, "global_step": 2890, "epoch": 23} {"train_loss": -18.56376075744629, "global_step": 2891, "epoch": 23} {"train_loss": -18.938518524169922, "global_step": 2892, "epoch": 23} {"train_loss": -18.595746994018555, "global_step": 2893, "epoch": 23} {"train_loss": -18.624605178833008, "global_step": 2894, "epoch": 23} {"train_loss": -18.43140411376953, "global_step": 2895, "epoch": 23} {"train_loss": -18.38105583190918, "global_step": 2896, "epoch": 23} {"train_loss": -18.40705680847168, "global_step": 2897, "epoch": 23} {"train_loss": -18.785825729370117, "global_step": 2898, "epoch": 23} {"train_loss": -18.367727279663086, "global_step": 2899, "epoch": 23} {"train_loss": -18.688125610351562, "global_step": 2900, "epoch": 23} {"train_loss": -18.34064483642578, "global_step": 2901, "epoch": 23} {"train_loss": -18.055410385131836, "global_step": 2902, "epoch": 23} {"train_loss": -18.488644497453674, "global_step": 2903, "epoch": 23, "val_loss": 3737364.0} {"train_loss": -18.156206130981445, "global_step": 2904, "epoch": 24} {"train_loss": -18.102163314819336, "global_step": 2905, "epoch": 24} {"train_loss": -18.319576263427734, "global_step": 2906, "epoch": 24} {"train_loss": -18.271142959594727, "global_step": 2907, "epoch": 24} {"train_loss": -17.844223022460938, "global_step": 2908, "epoch": 24} {"train_loss": -18.72494125366211, "global_step": 2909, "epoch": 24} {"train_loss": -18.724218368530273, "global_step": 2910, "epoch": 24} {"train_loss": -18.668066024780273, "global_step": 2911, "epoch": 24} {"train_loss": -18.849456787109375, "global_step": 2912, "epoch": 24} {"train_loss": -18.293243408203125, "global_step": 2913, "epoch": 24} {"train_loss": -18.8442440032959, "global_step": 2914, "epoch": 24} {"train_loss": -18.96999168395996, "global_step": 2915, "epoch": 24} {"train_loss": -18.687009811401367, "global_step": 2916, "epoch": 24} {"train_loss": -18.76458168029785, "global_step": 2917, "epoch": 24} {"train_loss": -18.549957275390625, "global_step": 2918, "epoch": 24} {"train_loss": -18.53516960144043, "global_step": 2919, "epoch": 24} {"train_loss": -18.47333335876465, "global_step": 2920, "epoch": 24} {"train_loss": -19.174285888671875, "global_step": 2921, "epoch": 24} {"train_loss": -18.49091911315918, "global_step": 2922, "epoch": 24} {"train_loss": -18.21874237060547, "global_step": 2923, "epoch": 24} {"train_loss": -18.476856231689453, "global_step": 2924, "epoch": 24} {"train_loss": -18.096174240112305, "global_step": 2925, "epoch": 24} {"train_loss": -17.88525390625, "global_step": 2926, "epoch": 24} {"train_loss": -18.8941650390625, "global_step": 2927, "epoch": 24} {"train_loss": -18.29543113708496, "global_step": 2928, "epoch": 24} {"train_loss": -18.790260314941406, "global_step": 2929, "epoch": 24} {"train_loss": -18.84309959411621, "global_step": 2930, "epoch": 24} {"train_loss": -18.895404815673828, "global_step": 2931, "epoch": 24} {"train_loss": -18.900178909301758, "global_step": 2932, "epoch": 24} {"train_loss": -18.61020278930664, "global_step": 2933, "epoch": 24} {"train_loss": -18.33670425415039, "global_step": 2934, "epoch": 24} {"train_loss": -18.234254837036133, "global_step": 2935, "epoch": 24} {"train_loss": -18.784589767456055, "global_step": 2936, "epoch": 24} {"train_loss": -17.66029930114746, "global_step": 2937, "epoch": 24} {"train_loss": -18.51795768737793, "global_step": 2938, "epoch": 24} {"train_loss": -18.35877799987793, "global_step": 2939, "epoch": 24} {"train_loss": -18.37932777404785, "global_step": 2940, "epoch": 24} {"train_loss": -18.329835891723633, "global_step": 2941, "epoch": 24} {"train_loss": -18.287809371948242, "global_step": 2942, "epoch": 24} {"train_loss": -18.54606056213379, "global_step": 2943, "epoch": 24} {"train_loss": -18.178943634033203, "global_step": 2944, "epoch": 24} {"train_loss": -17.909011840820312, "global_step": 2945, "epoch": 24} {"train_loss": -18.896116256713867, "global_step": 2946, "epoch": 24} {"train_loss": -18.318037033081055, "global_step": 2947, "epoch": 24} {"train_loss": -17.847930908203125, "global_step": 2948, "epoch": 24} {"train_loss": -17.887556076049805, "global_step": 2949, "epoch": 24} {"train_loss": -18.516450881958008, "global_step": 2950, "epoch": 24} {"train_loss": -18.69005584716797, "global_step": 2951, "epoch": 24} {"train_loss": -18.58265495300293, "global_step": 2952, "epoch": 24} {"train_loss": -19.030988693237305, "global_step": 2953, "epoch": 24} {"train_loss": -18.35455894470215, "global_step": 2954, "epoch": 24} {"train_loss": -18.541162490844727, "global_step": 2955, "epoch": 24} {"train_loss": -17.790241241455078, "global_step": 2956, "epoch": 24} {"train_loss": -18.54286003112793, "global_step": 2957, "epoch": 24} {"train_loss": -18.363296508789062, "global_step": 2958, "epoch": 24} {"train_loss": -18.22452735900879, "global_step": 2959, "epoch": 24} {"train_loss": -19.15036392211914, "global_step": 2960, "epoch": 24} {"train_loss": -18.52534294128418, "global_step": 2961, "epoch": 24} {"train_loss": -17.75467300415039, "global_step": 2962, "epoch": 24} {"train_loss": -18.933713912963867, "global_step": 2963, "epoch": 24} {"train_loss": -18.555814743041992, "global_step": 2964, "epoch": 24} {"train_loss": -19.232458114624023, "global_step": 2965, "epoch": 24} {"train_loss": -18.70132827758789, "global_step": 2966, "epoch": 24} {"train_loss": -18.668439865112305, "global_step": 2967, "epoch": 24} {"train_loss": -19.00043296813965, "global_step": 2968, "epoch": 24} {"train_loss": -18.777639389038086, "global_step": 2969, "epoch": 24} {"train_loss": -18.8510799407959, "global_step": 2970, "epoch": 24} {"train_loss": -18.5152530670166, "global_step": 2971, "epoch": 24} {"train_loss": -18.830841064453125, "global_step": 2972, "epoch": 24} {"train_loss": -18.700437545776367, "global_step": 2973, "epoch": 24} {"train_loss": -17.339923858642578, "global_step": 2974, "epoch": 24} {"train_loss": -18.107755661010742, "global_step": 2975, "epoch": 24} {"train_loss": -18.43604850769043, "global_step": 2976, "epoch": 24} {"train_loss": -17.751066207885742, "global_step": 2977, "epoch": 24} {"train_loss": -17.13479232788086, "global_step": 2978, "epoch": 24} {"train_loss": -18.58765983581543, "global_step": 2979, "epoch": 24} {"train_loss": -17.629934310913086, "global_step": 2980, "epoch": 24} {"train_loss": -17.51826286315918, "global_step": 2981, "epoch": 24} {"train_loss": -18.54610252380371, "global_step": 2982, "epoch": 24} {"train_loss": -17.285924911499023, "global_step": 2983, "epoch": 24} {"train_loss": -18.17848777770996, "global_step": 2984, "epoch": 24} {"train_loss": -17.829538345336914, "global_step": 2985, "epoch": 24} {"train_loss": -17.732736587524414, "global_step": 2986, "epoch": 24} {"train_loss": -18.08218765258789, "global_step": 2987, "epoch": 24} {"train_loss": -18.051027297973633, "global_step": 2988, "epoch": 24} {"train_loss": -17.27734375, "global_step": 2989, "epoch": 24} {"train_loss": -18.115829467773438, "global_step": 2990, "epoch": 24} {"train_loss": -18.354995727539062, "global_step": 2991, "epoch": 24} {"train_loss": -18.61737060546875, "global_step": 2992, "epoch": 24} {"train_loss": -18.16120719909668, "global_step": 2993, "epoch": 24} {"train_loss": -18.303936004638672, "global_step": 2994, "epoch": 24} {"train_loss": -18.734731674194336, "global_step": 2995, "epoch": 24} {"train_loss": -18.119667053222656, "global_step": 2996, "epoch": 24} {"train_loss": -17.97782325744629, "global_step": 2997, "epoch": 24} {"train_loss": -18.274072647094727, "global_step": 2998, "epoch": 24} {"train_loss": -17.972671508789062, "global_step": 2999, "epoch": 24} {"train_loss": -17.94782066345215, "global_step": 3000, "epoch": 24} {"train_loss": -18.03081703186035, "global_step": 3001, "epoch": 24} {"train_loss": -18.08856773376465, "global_step": 3002, "epoch": 24} {"train_loss": -18.362462997436523, "global_step": 3003, "epoch": 24} {"train_loss": -18.299880981445312, "global_step": 3004, "epoch": 24} {"train_loss": -18.495100021362305, "global_step": 3005, "epoch": 24} {"train_loss": -19.15435791015625, "global_step": 3006, "epoch": 24} {"train_loss": -18.770063400268555, "global_step": 3007, "epoch": 24} {"train_loss": -18.388776779174805, "global_step": 3008, "epoch": 24} {"train_loss": -18.908493041992188, "global_step": 3009, "epoch": 24} {"train_loss": -18.655080795288086, "global_step": 3010, "epoch": 24} {"train_loss": -18.650409698486328, "global_step": 3011, "epoch": 24} {"train_loss": -18.649343490600586, "global_step": 3012, "epoch": 24} {"train_loss": -18.77425765991211, "global_step": 3013, "epoch": 24} {"train_loss": -18.613792419433594, "global_step": 3014, "epoch": 24} {"train_loss": -18.561864852905273, "global_step": 3015, "epoch": 24} {"train_loss": -18.3797664642334, "global_step": 3016, "epoch": 24} {"train_loss": -18.613067626953125, "global_step": 3017, "epoch": 24} {"train_loss": -17.113401412963867, "global_step": 3018, "epoch": 24} {"train_loss": -18.888742446899414, "global_step": 3019, "epoch": 24} {"train_loss": -17.869251251220703, "global_step": 3020, "epoch": 24} {"train_loss": -18.88050651550293, "global_step": 3021, "epoch": 24} {"train_loss": -18.373579025268555, "global_step": 3022, "epoch": 24} {"train_loss": -18.087024688720703, "global_step": 3023, "epoch": 24} {"train_loss": -18.387391303196427, "global_step": 3024, "epoch": 24, "val_loss": 2674374.75} {"train_loss": -18.625276565551758, "global_step": 3025, "epoch": 25} {"train_loss": -18.78010368347168, "global_step": 3026, "epoch": 25} {"train_loss": -18.346969604492188, "global_step": 3027, "epoch": 25} {"train_loss": -18.558475494384766, "global_step": 3028, "epoch": 25} {"train_loss": -18.876934051513672, "global_step": 3029, "epoch": 25} {"train_loss": -18.83711814880371, "global_step": 3030, "epoch": 25} {"train_loss": -18.958921432495117, "global_step": 3031, "epoch": 25} {"train_loss": -18.9459285736084, "global_step": 3032, "epoch": 25} {"train_loss": -18.6818790435791, "global_step": 3033, "epoch": 25} {"train_loss": -18.611825942993164, "global_step": 3034, "epoch": 25} {"train_loss": -18.75421714782715, "global_step": 3035, "epoch": 25} {"train_loss": -18.607641220092773, "global_step": 3036, "epoch": 25} {"train_loss": -18.994871139526367, "global_step": 3037, "epoch": 25} {"train_loss": -18.31056785583496, "global_step": 3038, "epoch": 25} {"train_loss": -18.236072540283203, "global_step": 3039, "epoch": 25} {"train_loss": -18.26154136657715, "global_step": 3040, "epoch": 25} {"train_loss": -17.6970272064209, "global_step": 3041, "epoch": 25} {"train_loss": -18.498069763183594, "global_step": 3042, "epoch": 25} {"train_loss": -18.559904098510742, "global_step": 3043, "epoch": 25} {"train_loss": -17.84488868713379, "global_step": 3044, "epoch": 25} {"train_loss": -18.407093048095703, "global_step": 3045, "epoch": 25} {"train_loss": -18.037424087524414, "global_step": 3046, "epoch": 25} {"train_loss": -18.91658592224121, "global_step": 3047, "epoch": 25} {"train_loss": -18.360403060913086, "global_step": 3048, "epoch": 25} {"train_loss": -18.436338424682617, "global_step": 3049, "epoch": 25} {"train_loss": -18.528331756591797, "global_step": 3050, "epoch": 25} {"train_loss": -19.061246871948242, "global_step": 3051, "epoch": 25} {"train_loss": -18.98175811767578, "global_step": 3052, "epoch": 25} {"train_loss": -18.23904800415039, "global_step": 3053, "epoch": 25} {"train_loss": -18.413524627685547, "global_step": 3054, "epoch": 25} {"train_loss": -18.00352668762207, "global_step": 3055, "epoch": 25} {"train_loss": -18.660877227783203, "global_step": 3056, "epoch": 25} {"train_loss": -18.599260330200195, "global_step": 3057, "epoch": 25} {"train_loss": -18.413467407226562, "global_step": 3058, "epoch": 25} {"train_loss": -18.66199493408203, "global_step": 3059, "epoch": 25} {"train_loss": -18.709842681884766, "global_step": 3060, "epoch": 25} {"train_loss": -18.208845138549805, "global_step": 3061, "epoch": 25} {"train_loss": -18.377714157104492, "global_step": 3062, "epoch": 25} {"train_loss": -18.74342155456543, "global_step": 3063, "epoch": 25} {"train_loss": -18.743566513061523, "global_step": 3064, "epoch": 25} {"train_loss": -18.920909881591797, "global_step": 3065, "epoch": 25} {"train_loss": -18.623905181884766, "global_step": 3066, "epoch": 25} {"train_loss": -19.330768585205078, "global_step": 3067, "epoch": 25} {"train_loss": -19.07944107055664, "global_step": 3068, "epoch": 25} {"train_loss": -19.212112426757812, "global_step": 3069, "epoch": 25} {"train_loss": -19.67624855041504, "global_step": 3070, "epoch": 25} {"train_loss": -18.74857521057129, "global_step": 3071, "epoch": 25} {"train_loss": -18.43438148498535, "global_step": 3072, "epoch": 25} {"train_loss": -19.277652740478516, "global_step": 3073, "epoch": 25} {"train_loss": -18.103313446044922, "global_step": 3074, "epoch": 25} {"train_loss": -18.8826904296875, "global_step": 3075, "epoch": 25} {"train_loss": -18.446529388427734, "global_step": 3076, "epoch": 25} {"train_loss": -18.707927703857422, "global_step": 3077, "epoch": 25} {"train_loss": -18.661882400512695, "global_step": 3078, "epoch": 25} {"train_loss": -18.281478881835938, "global_step": 3079, "epoch": 25} {"train_loss": -16.67793846130371, "global_step": 3080, "epoch": 25} {"train_loss": -17.296701431274414, "global_step": 3081, "epoch": 25} {"train_loss": -18.04207420349121, "global_step": 3082, "epoch": 25} {"train_loss": -18.092958450317383, "global_step": 3083, "epoch": 25} {"train_loss": -18.025726318359375, "global_step": 3084, "epoch": 25} {"train_loss": -18.64873504638672, "global_step": 3085, "epoch": 25} {"train_loss": -18.016637802124023, "global_step": 3086, "epoch": 25} {"train_loss": -18.63004493713379, "global_step": 3087, "epoch": 25} {"train_loss": -18.63251304626465, "global_step": 3088, "epoch": 25} {"train_loss": -18.758594512939453, "global_step": 3089, "epoch": 25} {"train_loss": -18.52606201171875, "global_step": 3090, "epoch": 25} {"train_loss": -18.139556884765625, "global_step": 3091, "epoch": 25} {"train_loss": -18.37918472290039, "global_step": 3092, "epoch": 25} {"train_loss": -18.305910110473633, "global_step": 3093, "epoch": 25} {"train_loss": -18.048181533813477, "global_step": 3094, "epoch": 25} {"train_loss": -18.362594604492188, "global_step": 3095, "epoch": 25} {"train_loss": -17.9072322845459, "global_step": 3096, "epoch": 25} {"train_loss": -18.565275192260742, "global_step": 3097, "epoch": 25} {"train_loss": -17.60056495666504, "global_step": 3098, "epoch": 25} {"train_loss": -18.502504348754883, "global_step": 3099, "epoch": 25} {"train_loss": -18.426700592041016, "global_step": 3100, "epoch": 25} {"train_loss": -17.915393829345703, "global_step": 3101, "epoch": 25} {"train_loss": -18.565378189086914, "global_step": 3102, "epoch": 25} {"train_loss": -17.900772094726562, "global_step": 3103, "epoch": 25} {"train_loss": -18.053394317626953, "global_step": 3104, "epoch": 25} {"train_loss": -18.426868438720703, "global_step": 3105, "epoch": 25} {"train_loss": -18.667417526245117, "global_step": 3106, "epoch": 25} {"train_loss": -18.38677406311035, "global_step": 3107, "epoch": 25} {"train_loss": -18.711584091186523, "global_step": 3108, "epoch": 25} {"train_loss": -18.28970718383789, "global_step": 3109, "epoch": 25} {"train_loss": -18.710905075073242, "global_step": 3110, "epoch": 25} {"train_loss": -19.040307998657227, "global_step": 3111, "epoch": 25} {"train_loss": -18.816770553588867, "global_step": 3112, "epoch": 25} {"train_loss": -18.83298683166504, "global_step": 3113, "epoch": 25} {"train_loss": -19.03724479675293, "global_step": 3114, "epoch": 25} {"train_loss": -18.696706771850586, "global_step": 3115, "epoch": 25} {"train_loss": -19.122343063354492, "global_step": 3116, "epoch": 25} {"train_loss": -18.473169326782227, "global_step": 3117, "epoch": 25} {"train_loss": -19.192773818969727, "global_step": 3118, "epoch": 25} {"train_loss": -18.933378219604492, "global_step": 3119, "epoch": 25} {"train_loss": -18.904874801635742, "global_step": 3120, "epoch": 25} {"train_loss": -18.215429306030273, "global_step": 3121, "epoch": 25} {"train_loss": -17.291101455688477, "global_step": 3122, "epoch": 25} {"train_loss": -16.59894371032715, "global_step": 3123, "epoch": 25} {"train_loss": -18.067487716674805, "global_step": 3124, "epoch": 25} {"train_loss": -18.324966430664062, "global_step": 3125, "epoch": 25} {"train_loss": -17.703567504882812, "global_step": 3126, "epoch": 25} {"train_loss": -18.19533348083496, "global_step": 3127, "epoch": 25} {"train_loss": -18.331253051757812, "global_step": 3128, "epoch": 25} {"train_loss": -18.314790725708008, "global_step": 3129, "epoch": 25} {"train_loss": -18.058513641357422, "global_step": 3130, "epoch": 25} {"train_loss": -18.632080078125, "global_step": 3131, "epoch": 25} {"train_loss": -18.48687171936035, "global_step": 3132, "epoch": 25} {"train_loss": -16.97612953186035, "global_step": 3133, "epoch": 25} {"train_loss": -18.584156036376953, "global_step": 3134, "epoch": 25} {"train_loss": -17.94965934753418, "global_step": 3135, "epoch": 25} {"train_loss": -18.082473754882812, "global_step": 3136, "epoch": 25} {"train_loss": -18.26050567626953, "global_step": 3137, "epoch": 25} {"train_loss": -17.747648239135742, "global_step": 3138, "epoch": 25} {"train_loss": -18.329566955566406, "global_step": 3139, "epoch": 25} {"train_loss": -18.69886589050293, "global_step": 3140, "epoch": 25} {"train_loss": -18.38675880432129, "global_step": 3141, "epoch": 25} {"train_loss": -18.305377960205078, "global_step": 3142, "epoch": 25} {"train_loss": -18.48793601989746, "global_step": 3143, "epoch": 25} {"train_loss": -18.3104248046875, "global_step": 3144, "epoch": 25} {"train_loss": -18.434457116875766, "global_step": 3145, "epoch": 25, "val_loss": 2483195.5} {"train_loss": -17.818042755126953, "global_step": 3146, "epoch": 26} {"train_loss": -18.4864501953125, "global_step": 3147, "epoch": 26} {"train_loss": -18.135658264160156, "global_step": 3148, "epoch": 26} {"train_loss": -18.817163467407227, "global_step": 3149, "epoch": 26} {"train_loss": -18.201929092407227, "global_step": 3150, "epoch": 26} {"train_loss": -18.611892700195312, "global_step": 3151, "epoch": 26} {"train_loss": -18.22108268737793, "global_step": 3152, "epoch": 26} {"train_loss": -18.877811431884766, "global_step": 3153, "epoch": 26} {"train_loss": -18.440793991088867, "global_step": 3154, "epoch": 26} {"train_loss": -18.880815505981445, "global_step": 3155, "epoch": 26} {"train_loss": -18.74025535583496, "global_step": 3156, "epoch": 26} {"train_loss": -18.755640029907227, "global_step": 3157, "epoch": 26} {"train_loss": -18.719741821289062, "global_step": 3158, "epoch": 26} {"train_loss": -18.6688175201416, "global_step": 3159, "epoch": 26} {"train_loss": -18.767126083374023, "global_step": 3160, "epoch": 26} {"train_loss": -18.69063377380371, "global_step": 3161, "epoch": 26} {"train_loss": -19.120086669921875, "global_step": 3162, "epoch": 26} {"train_loss": -19.353363037109375, "global_step": 3163, "epoch": 26} {"train_loss": -18.774341583251953, "global_step": 3164, "epoch": 26} {"train_loss": -19.149700164794922, "global_step": 3165, "epoch": 26} {"train_loss": -18.60908317565918, "global_step": 3166, "epoch": 26} {"train_loss": -19.182636260986328, "global_step": 3167, "epoch": 26} {"train_loss": -18.584871292114258, "global_step": 3168, "epoch": 26} {"train_loss": -19.094467163085938, "global_step": 3169, "epoch": 26} {"train_loss": -18.92584228515625, "global_step": 3170, "epoch": 26} {"train_loss": -18.96854019165039, "global_step": 3171, "epoch": 26} {"train_loss": -18.399351119995117, "global_step": 3172, "epoch": 26} {"train_loss": -18.430822372436523, "global_step": 3173, "epoch": 26} {"train_loss": -18.92909049987793, "global_step": 3174, "epoch": 26} {"train_loss": -19.12325096130371, "global_step": 3175, "epoch": 26} {"train_loss": -18.73495864868164, "global_step": 3176, "epoch": 26} {"train_loss": -18.762046813964844, "global_step": 3177, "epoch": 26} {"train_loss": -19.383256912231445, "global_step": 3178, "epoch": 26} {"train_loss": -18.625097274780273, "global_step": 3179, "epoch": 26} {"train_loss": -18.32725715637207, "global_step": 3180, "epoch": 26} {"train_loss": -19.19040298461914, "global_step": 3181, "epoch": 26} {"train_loss": -18.902463912963867, "global_step": 3182, "epoch": 26} {"train_loss": -18.73615074157715, "global_step": 3183, "epoch": 26} {"train_loss": -19.330142974853516, "global_step": 3184, "epoch": 26} {"train_loss": -18.9792537689209, "global_step": 3185, "epoch": 26} {"train_loss": -19.137998580932617, "global_step": 3186, "epoch": 26} {"train_loss": -19.162240982055664, "global_step": 3187, "epoch": 26} {"train_loss": -19.31879997253418, "global_step": 3188, "epoch": 26} {"train_loss": -19.04730224609375, "global_step": 3189, "epoch": 26} {"train_loss": -18.559606552124023, "global_step": 3190, "epoch": 26} {"train_loss": -19.259464263916016, "global_step": 3191, "epoch": 26} {"train_loss": -18.705228805541992, "global_step": 3192, "epoch": 26} {"train_loss": -18.82110023498535, "global_step": 3193, "epoch": 26} {"train_loss": -18.32758903503418, "global_step": 3194, "epoch": 26} {"train_loss": -17.851259231567383, "global_step": 3195, "epoch": 26} {"train_loss": -17.96986961364746, "global_step": 3196, "epoch": 26} {"train_loss": -18.706594467163086, "global_step": 3197, "epoch": 26} {"train_loss": -18.536514282226562, "global_step": 3198, "epoch": 26} {"train_loss": -18.52642822265625, "global_step": 3199, "epoch": 26} {"train_loss": -18.548669815063477, "global_step": 3200, "epoch": 26} {"train_loss": -18.70344352722168, "global_step": 3201, "epoch": 26} {"train_loss": -18.419525146484375, "global_step": 3202, "epoch": 26} {"train_loss": -19.205533981323242, "global_step": 3203, "epoch": 26} {"train_loss": -18.752981185913086, "global_step": 3204, "epoch": 26} {"train_loss": -19.00404930114746, "global_step": 3205, "epoch": 26} {"train_loss": -19.096704483032227, "global_step": 3206, "epoch": 26} {"train_loss": -18.840381622314453, "global_step": 3207, "epoch": 26} {"train_loss": -18.808475494384766, "global_step": 3208, "epoch": 26} {"train_loss": -18.863767623901367, "global_step": 3209, "epoch": 26} {"train_loss": -19.116622924804688, "global_step": 3210, "epoch": 26} {"train_loss": -18.875059127807617, "global_step": 3211, "epoch": 26} {"train_loss": -19.039222717285156, "global_step": 3212, "epoch": 26} {"train_loss": -18.435270309448242, "global_step": 3213, "epoch": 26} {"train_loss": -19.39630126953125, "global_step": 3214, "epoch": 26} {"train_loss": -19.08504295349121, "global_step": 3215, "epoch": 26} {"train_loss": -18.68890380859375, "global_step": 3216, "epoch": 26} {"train_loss": -18.742324829101562, "global_step": 3217, "epoch": 26} {"train_loss": -18.596471786499023, "global_step": 3218, "epoch": 26} {"train_loss": -19.446271896362305, "global_step": 3219, "epoch": 26} {"train_loss": -18.150562286376953, "global_step": 3220, "epoch": 26} {"train_loss": -19.117551803588867, "global_step": 3221, "epoch": 26} {"train_loss": -18.348373413085938, "global_step": 3222, "epoch": 26} {"train_loss": -18.65586280822754, "global_step": 3223, "epoch": 26} {"train_loss": -18.960121154785156, "global_step": 3224, "epoch": 26} {"train_loss": -18.023618698120117, "global_step": 3225, "epoch": 26} {"train_loss": -18.41669273376465, "global_step": 3226, "epoch": 26} {"train_loss": -18.161928176879883, "global_step": 3227, "epoch": 26} {"train_loss": -18.034040451049805, "global_step": 3228, "epoch": 26} {"train_loss": -17.9667911529541, "global_step": 3229, "epoch": 26} {"train_loss": -18.27566146850586, "global_step": 3230, "epoch": 26} {"train_loss": -18.319814682006836, "global_step": 3231, "epoch": 26} {"train_loss": -18.61715316772461, "global_step": 3232, "epoch": 26} {"train_loss": -18.665231704711914, "global_step": 3233, "epoch": 26} {"train_loss": -17.711584091186523, "global_step": 3234, "epoch": 26} {"train_loss": -18.571109771728516, "global_step": 3235, "epoch": 26} {"train_loss": -18.325735092163086, "global_step": 3236, "epoch": 26} {"train_loss": -17.975812911987305, "global_step": 3237, "epoch": 26} {"train_loss": -18.809289932250977, "global_step": 3238, "epoch": 26} {"train_loss": -18.324777603149414, "global_step": 3239, "epoch": 26} {"train_loss": -18.34326171875, "global_step": 3240, "epoch": 26} {"train_loss": -18.23358726501465, "global_step": 3241, "epoch": 26} {"train_loss": -18.657875061035156, "global_step": 3242, "epoch": 26} {"train_loss": -18.607343673706055, "global_step": 3243, "epoch": 26} {"train_loss": -18.75379753112793, "global_step": 3244, "epoch": 26} {"train_loss": -18.666393280029297, "global_step": 3245, "epoch": 26} {"train_loss": -18.69659996032715, "global_step": 3246, "epoch": 26} {"train_loss": -19.21638298034668, "global_step": 3247, "epoch": 26} {"train_loss": -18.85453224182129, "global_step": 3248, "epoch": 26} {"train_loss": -19.179861068725586, "global_step": 3249, "epoch": 26} {"train_loss": -19.09280776977539, "global_step": 3250, "epoch": 26} {"train_loss": -18.797622680664062, "global_step": 3251, "epoch": 26} {"train_loss": -18.966575622558594, "global_step": 3252, "epoch": 26} {"train_loss": -19.212890625, "global_step": 3253, "epoch": 26} {"train_loss": -19.601898193359375, "global_step": 3254, "epoch": 26} {"train_loss": -19.31410789489746, "global_step": 3255, "epoch": 26} {"train_loss": -19.457304000854492, "global_step": 3256, "epoch": 26} {"train_loss": -19.192346572875977, "global_step": 3257, "epoch": 26} {"train_loss": -18.529455184936523, "global_step": 3258, "epoch": 26} {"train_loss": -18.903308868408203, "global_step": 3259, "epoch": 26} {"train_loss": -18.16823959350586, "global_step": 3260, "epoch": 26} {"train_loss": -18.493528366088867, "global_step": 3261, "epoch": 26} {"train_loss": -19.05289077758789, "global_step": 3262, "epoch": 26} {"train_loss": -19.49106216430664, "global_step": 3263, "epoch": 26} {"train_loss": -19.13517189025879, "global_step": 3264, "epoch": 26} {"train_loss": -19.24766731262207, "global_step": 3265, "epoch": 26} {"train_loss": -18.743237771278572, "global_step": 3266, "epoch": 26, "val_loss": 2820440.0} {"train_loss": -18.24380874633789, "global_step": 3267, "epoch": 27} {"train_loss": -18.434131622314453, "global_step": 3268, "epoch": 27} {"train_loss": -18.33323860168457, "global_step": 3269, "epoch": 27} {"train_loss": -18.37770652770996, "global_step": 3270, "epoch": 27} {"train_loss": -19.03158950805664, "global_step": 3271, "epoch": 27} {"train_loss": -18.879234313964844, "global_step": 3272, "epoch": 27} {"train_loss": -18.27432632446289, "global_step": 3273, "epoch": 27} {"train_loss": -17.583478927612305, "global_step": 3274, "epoch": 27} {"train_loss": -18.691022872924805, "global_step": 3275, "epoch": 27} {"train_loss": -18.9843692779541, "global_step": 3276, "epoch": 27} {"train_loss": -17.86632537841797, "global_step": 3277, "epoch": 27} {"train_loss": -18.684022903442383, "global_step": 3278, "epoch": 27} {"train_loss": -18.237735748291016, "global_step": 3279, "epoch": 27} {"train_loss": -18.602767944335938, "global_step": 3280, "epoch": 27} {"train_loss": -18.018198013305664, "global_step": 3281, "epoch": 27} {"train_loss": -18.61484146118164, "global_step": 3282, "epoch": 27} {"train_loss": -18.507089614868164, "global_step": 3283, "epoch": 27} {"train_loss": -18.801910400390625, "global_step": 3284, "epoch": 27} {"train_loss": -18.782758712768555, "global_step": 3285, "epoch": 27} {"train_loss": -18.30914306640625, "global_step": 3286, "epoch": 27} {"train_loss": -19.033018112182617, "global_step": 3287, "epoch": 27} {"train_loss": -18.94435691833496, "global_step": 3288, "epoch": 27} {"train_loss": -18.775320053100586, "global_step": 3289, "epoch": 27} {"train_loss": -18.778608322143555, "global_step": 3290, "epoch": 27} {"train_loss": -18.680994033813477, "global_step": 3291, "epoch": 27} {"train_loss": -19.251585006713867, "global_step": 3292, "epoch": 27} {"train_loss": -19.044513702392578, "global_step": 3293, "epoch": 27} {"train_loss": -18.68733024597168, "global_step": 3294, "epoch": 27} {"train_loss": -19.490015029907227, "global_step": 3295, "epoch": 27} {"train_loss": -19.078750610351562, "global_step": 3296, "epoch": 27} {"train_loss": -19.323591232299805, "global_step": 3297, "epoch": 27} {"train_loss": -19.372882843017578, "global_step": 3298, "epoch": 27} {"train_loss": -19.265932083129883, "global_step": 3299, "epoch": 27} {"train_loss": -19.10941505432129, "global_step": 3300, "epoch": 27} {"train_loss": -19.246051788330078, "global_step": 3301, "epoch": 27} {"train_loss": -19.42250633239746, "global_step": 3302, "epoch": 27} {"train_loss": -18.982492446899414, "global_step": 3303, "epoch": 27} {"train_loss": -19.001211166381836, "global_step": 3304, "epoch": 27} {"train_loss": -18.04852294921875, "global_step": 3305, "epoch": 27} {"train_loss": -13.785395622253418, "global_step": 3306, "epoch": 27} {"train_loss": -15.501952171325684, "global_step": 3307, "epoch": 27} {"train_loss": -17.13093376159668, "global_step": 3308, "epoch": 27} {"train_loss": -16.21828842163086, "global_step": 3309, "epoch": 27} {"train_loss": -18.308347702026367, "global_step": 3310, "epoch": 27} {"train_loss": -17.51378631591797, "global_step": 3311, "epoch": 27} {"train_loss": -17.778684616088867, "global_step": 3312, "epoch": 27} {"train_loss": -17.666025161743164, "global_step": 3313, "epoch": 27} {"train_loss": -18.29039192199707, "global_step": 3314, "epoch": 27} {"train_loss": -17.924076080322266, "global_step": 3315, "epoch": 27} {"train_loss": -18.170835494995117, "global_step": 3316, "epoch": 27} {"train_loss": -17.745594024658203, "global_step": 3317, "epoch": 27} {"train_loss": -17.600440979003906, "global_step": 3318, "epoch": 27} {"train_loss": -18.20655632019043, "global_step": 3319, "epoch": 27} {"train_loss": -17.881093978881836, "global_step": 3320, "epoch": 27} {"train_loss": -17.879751205444336, "global_step": 3321, "epoch": 27} {"train_loss": -18.30887794494629, "global_step": 3322, "epoch": 27} {"train_loss": -18.263025283813477, "global_step": 3323, "epoch": 27} {"train_loss": -17.638181686401367, "global_step": 3324, "epoch": 27} {"train_loss": -17.652570724487305, "global_step": 3325, "epoch": 27} {"train_loss": -17.887903213500977, "global_step": 3326, "epoch": 27} {"train_loss": -17.84274673461914, "global_step": 3327, "epoch": 27} {"train_loss": -17.728124618530273, "global_step": 3328, "epoch": 27} {"train_loss": -18.64863395690918, "global_step": 3329, "epoch": 27} {"train_loss": -18.185943603515625, "global_step": 3330, "epoch": 27} {"train_loss": -18.5640811920166, "global_step": 3331, "epoch": 27} {"train_loss": -17.79547119140625, "global_step": 3332, "epoch": 27} {"train_loss": -18.484394073486328, "global_step": 3333, "epoch": 27} {"train_loss": -18.16303253173828, "global_step": 3334, "epoch": 27} {"train_loss": -18.577085494995117, "global_step": 3335, "epoch": 27} {"train_loss": -18.40562629699707, "global_step": 3336, "epoch": 27} {"train_loss": -18.636911392211914, "global_step": 3337, "epoch": 27} {"train_loss": -18.695402145385742, "global_step": 3338, "epoch": 27} {"train_loss": -19.092435836791992, "global_step": 3339, "epoch": 27} {"train_loss": -18.711843490600586, "global_step": 3340, "epoch": 27} {"train_loss": -18.74175453186035, "global_step": 3341, "epoch": 27} {"train_loss": -18.552078247070312, "global_step": 3342, "epoch": 27} {"train_loss": -19.134052276611328, "global_step": 3343, "epoch": 27} {"train_loss": -18.904348373413086, "global_step": 3344, "epoch": 27} {"train_loss": -18.911062240600586, "global_step": 3345, "epoch": 27} {"train_loss": -19.089614868164062, "global_step": 3346, "epoch": 27} {"train_loss": -18.92184829711914, "global_step": 3347, "epoch": 27} {"train_loss": -19.16487693786621, "global_step": 3348, "epoch": 27} {"train_loss": -19.186264038085938, "global_step": 3349, "epoch": 27} {"train_loss": -19.254911422729492, "global_step": 3350, "epoch": 27} {"train_loss": -18.883804321289062, "global_step": 3351, "epoch": 27} {"train_loss": -18.955896377563477, "global_step": 3352, "epoch": 27} {"train_loss": -19.42371940612793, "global_step": 3353, "epoch": 27} {"train_loss": -19.47169303894043, "global_step": 3354, "epoch": 27} {"train_loss": -19.514524459838867, "global_step": 3355, "epoch": 27} {"train_loss": -19.626413345336914, "global_step": 3356, "epoch": 27} {"train_loss": -19.540119171142578, "global_step": 3357, "epoch": 27} {"train_loss": -18.927539825439453, "global_step": 3358, "epoch": 27} {"train_loss": -19.126413345336914, "global_step": 3359, "epoch": 27} {"train_loss": -19.1077938079834, "global_step": 3360, "epoch": 27} {"train_loss": -19.10845375061035, "global_step": 3361, "epoch": 27} {"train_loss": -18.947965621948242, "global_step": 3362, "epoch": 27} {"train_loss": -19.100522994995117, "global_step": 3363, "epoch": 27} {"train_loss": -18.77549171447754, "global_step": 3364, "epoch": 27} {"train_loss": -16.856552124023438, "global_step": 3365, "epoch": 27} {"train_loss": -18.514020919799805, "global_step": 3366, "epoch": 27} {"train_loss": -18.279905319213867, "global_step": 3367, "epoch": 27} {"train_loss": -18.233556747436523, "global_step": 3368, "epoch": 27} {"train_loss": -17.676868438720703, "global_step": 3369, "epoch": 27} {"train_loss": -18.3597469329834, "global_step": 3370, "epoch": 27} {"train_loss": -18.337238311767578, "global_step": 3371, "epoch": 27} {"train_loss": -18.013723373413086, "global_step": 3372, "epoch": 27} {"train_loss": -18.7573184967041, "global_step": 3373, "epoch": 27} {"train_loss": -18.044527053833008, "global_step": 3374, "epoch": 27} {"train_loss": -17.696552276611328, "global_step": 3375, "epoch": 27} {"train_loss": -18.748197555541992, "global_step": 3376, "epoch": 27} {"train_loss": -18.792097091674805, "global_step": 3377, "epoch": 27} {"train_loss": -19.161691665649414, "global_step": 3378, "epoch": 27} {"train_loss": -18.45916175842285, "global_step": 3379, "epoch": 27} {"train_loss": -18.589820861816406, "global_step": 3380, "epoch": 27} {"train_loss": -18.34431266784668, "global_step": 3381, "epoch": 27} {"train_loss": -18.695417404174805, "global_step": 3382, "epoch": 27} {"train_loss": -18.410293579101562, "global_step": 3383, "epoch": 27} {"train_loss": -18.56464958190918, "global_step": 3384, "epoch": 27} {"train_loss": -18.15435218811035, "global_step": 3385, "epoch": 27} {"train_loss": -18.416006088256836, "global_step": 3386, "epoch": 27} {"train_loss": -18.478151431753616, "global_step": 3387, "epoch": 27, "val_loss": 3364543.0} {"train_loss": -19.035451889038086, "global_step": 3388, "epoch": 28} {"train_loss": -18.89957618713379, "global_step": 3389, "epoch": 28} {"train_loss": -19.060152053833008, "global_step": 3390, "epoch": 28} {"train_loss": -18.77104949951172, "global_step": 3391, "epoch": 28} {"train_loss": -18.895793914794922, "global_step": 3392, "epoch": 28} {"train_loss": -19.046634674072266, "global_step": 3393, "epoch": 28} {"train_loss": -19.37964630126953, "global_step": 3394, "epoch": 28} {"train_loss": -18.88720703125, "global_step": 3395, "epoch": 28} {"train_loss": -19.10103416442871, "global_step": 3396, "epoch": 28} {"train_loss": -19.314348220825195, "global_step": 3397, "epoch": 28} {"train_loss": -19.39129638671875, "global_step": 3398, "epoch": 28} {"train_loss": -19.14191436767578, "global_step": 3399, "epoch": 28} {"train_loss": -18.925994873046875, "global_step": 3400, "epoch": 28} {"train_loss": -19.485124588012695, "global_step": 3401, "epoch": 28} {"train_loss": -19.020597457885742, "global_step": 3402, "epoch": 28} {"train_loss": -18.977144241333008, "global_step": 3403, "epoch": 28} {"train_loss": -19.273115158081055, "global_step": 3404, "epoch": 28} {"train_loss": -19.202192306518555, "global_step": 3405, "epoch": 28} {"train_loss": -19.1610107421875, "global_step": 3406, "epoch": 28} {"train_loss": -19.257963180541992, "global_step": 3407, "epoch": 28} {"train_loss": -19.025785446166992, "global_step": 3408, "epoch": 28} {"train_loss": -19.193328857421875, "global_step": 3409, "epoch": 28} {"train_loss": -19.341455459594727, "global_step": 3410, "epoch": 28} {"train_loss": -19.142383575439453, "global_step": 3411, "epoch": 28} {"train_loss": -19.159414291381836, "global_step": 3412, "epoch": 28} {"train_loss": -19.6331729888916, "global_step": 3413, "epoch": 28} {"train_loss": -19.127506256103516, "global_step": 3414, "epoch": 28} {"train_loss": -19.007658004760742, "global_step": 3415, "epoch": 28} {"train_loss": -19.00684928894043, "global_step": 3416, "epoch": 28} {"train_loss": -18.854076385498047, "global_step": 3417, "epoch": 28} {"train_loss": -19.6872501373291, "global_step": 3418, "epoch": 28} {"train_loss": -18.61954116821289, "global_step": 3419, "epoch": 28} {"train_loss": -19.075057983398438, "global_step": 3420, "epoch": 28} {"train_loss": -19.507802963256836, "global_step": 3421, "epoch": 28} {"train_loss": -18.841089248657227, "global_step": 3422, "epoch": 28} {"train_loss": -19.440509796142578, "global_step": 3423, "epoch": 28} {"train_loss": -19.277164459228516, "global_step": 3424, "epoch": 28} {"train_loss": -18.849775314331055, "global_step": 3425, "epoch": 28} {"train_loss": -19.254484176635742, "global_step": 3426, "epoch": 28} {"train_loss": -18.999731063842773, "global_step": 3427, "epoch": 28} {"train_loss": -19.0506649017334, "global_step": 3428, "epoch": 28} {"train_loss": -19.157960891723633, "global_step": 3429, "epoch": 28} {"train_loss": -18.6680850982666, "global_step": 3430, "epoch": 28} {"train_loss": -19.17310905456543, "global_step": 3431, "epoch": 28} {"train_loss": -19.122045516967773, "global_step": 3432, "epoch": 28} {"train_loss": -19.293798446655273, "global_step": 3433, "epoch": 28} {"train_loss": -18.91983413696289, "global_step": 3434, "epoch": 28} {"train_loss": -19.115434646606445, "global_step": 3435, "epoch": 28} {"train_loss": -19.469459533691406, "global_step": 3436, "epoch": 28} {"train_loss": -18.912904739379883, "global_step": 3437, "epoch": 28} {"train_loss": -19.885618209838867, "global_step": 3438, "epoch": 28} {"train_loss": -18.770986557006836, "global_step": 3439, "epoch": 28} {"train_loss": -18.182947158813477, "global_step": 3440, "epoch": 28} {"train_loss": -18.868431091308594, "global_step": 3441, "epoch": 28} {"train_loss": -18.794614791870117, "global_step": 3442, "epoch": 28} {"train_loss": -19.24532127380371, "global_step": 3443, "epoch": 28} {"train_loss": -18.6124210357666, "global_step": 3444, "epoch": 28} {"train_loss": -18.39979362487793, "global_step": 3445, "epoch": 28} {"train_loss": -19.0413761138916, "global_step": 3446, "epoch": 28} {"train_loss": -18.834814071655273, "global_step": 3447, "epoch": 28} {"train_loss": -19.22226333618164, "global_step": 3448, "epoch": 28} {"train_loss": -18.622961044311523, "global_step": 3449, "epoch": 28} {"train_loss": -19.291677474975586, "global_step": 3450, "epoch": 28} {"train_loss": -18.361894607543945, "global_step": 3451, "epoch": 28} {"train_loss": -19.356054306030273, "global_step": 3452, "epoch": 28} {"train_loss": -18.548734664916992, "global_step": 3453, "epoch": 28} {"train_loss": -19.107851028442383, "global_step": 3454, "epoch": 28} {"train_loss": -18.54769515991211, "global_step": 3455, "epoch": 28} {"train_loss": -19.08099365234375, "global_step": 3456, "epoch": 28} {"train_loss": -19.082500457763672, "global_step": 3457, "epoch": 28} {"train_loss": -19.009424209594727, "global_step": 3458, "epoch": 28} {"train_loss": -18.544790267944336, "global_step": 3459, "epoch": 28} {"train_loss": -19.263086318969727, "global_step": 3460, "epoch": 28} {"train_loss": -18.21551513671875, "global_step": 3461, "epoch": 28} {"train_loss": -18.655410766601562, "global_step": 3462, "epoch": 28} {"train_loss": -19.363561630249023, "global_step": 3463, "epoch": 28} {"train_loss": -19.149551391601562, "global_step": 3464, "epoch": 28} {"train_loss": -19.18220329284668, "global_step": 3465, "epoch": 28} {"train_loss": -18.579927444458008, "global_step": 3466, "epoch": 28} {"train_loss": -18.816354751586914, "global_step": 3467, "epoch": 28} {"train_loss": -19.035715103149414, "global_step": 3468, "epoch": 28} {"train_loss": -19.406469345092773, "global_step": 3469, "epoch": 28} {"train_loss": -19.323429107666016, "global_step": 3470, "epoch": 28} {"train_loss": -19.218551635742188, "global_step": 3471, "epoch": 28} {"train_loss": -19.160614013671875, "global_step": 3472, "epoch": 28} {"train_loss": -19.155683517456055, "global_step": 3473, "epoch": 28} {"train_loss": -18.935361862182617, "global_step": 3474, "epoch": 28} {"train_loss": -19.49152183532715, "global_step": 3475, "epoch": 28} {"train_loss": -19.242115020751953, "global_step": 3476, "epoch": 28} {"train_loss": -19.659313201904297, "global_step": 3477, "epoch": 28} {"train_loss": -19.394933700561523, "global_step": 3478, "epoch": 28} {"train_loss": -19.577411651611328, "global_step": 3479, "epoch": 28} {"train_loss": -19.499469757080078, "global_step": 3480, "epoch": 28} {"train_loss": -19.286685943603516, "global_step": 3481, "epoch": 28} {"train_loss": -18.787845611572266, "global_step": 3482, "epoch": 28} {"train_loss": -19.280622482299805, "global_step": 3483, "epoch": 28} {"train_loss": -18.435529708862305, "global_step": 3484, "epoch": 28} {"train_loss": -19.2681827545166, "global_step": 3485, "epoch": 28} {"train_loss": -18.549816131591797, "global_step": 3486, "epoch": 28} {"train_loss": -19.679513931274414, "global_step": 3487, "epoch": 28} {"train_loss": -19.174726486206055, "global_step": 3488, "epoch": 28} {"train_loss": -19.092864990234375, "global_step": 3489, "epoch": 28} {"train_loss": -18.548940658569336, "global_step": 3490, "epoch": 28} {"train_loss": -19.35615348815918, "global_step": 3491, "epoch": 28} {"train_loss": -18.983457565307617, "global_step": 3492, "epoch": 28} {"train_loss": -19.168344497680664, "global_step": 3493, "epoch": 28} {"train_loss": -18.42171287536621, "global_step": 3494, "epoch": 28} {"train_loss": -19.533472061157227, "global_step": 3495, "epoch": 28} {"train_loss": -19.03969383239746, "global_step": 3496, "epoch": 28} {"train_loss": -19.038349151611328, "global_step": 3497, "epoch": 28} {"train_loss": -18.62738037109375, "global_step": 3498, "epoch": 28} {"train_loss": -19.044023513793945, "global_step": 3499, "epoch": 28} {"train_loss": -18.72928810119629, "global_step": 3500, "epoch": 28} {"train_loss": -19.00474739074707, "global_step": 3501, "epoch": 28} {"train_loss": -18.784286499023438, "global_step": 3502, "epoch": 28} {"train_loss": -19.181859970092773, "global_step": 3503, "epoch": 28} {"train_loss": -18.838886260986328, "global_step": 3504, "epoch": 28} {"train_loss": -18.90774917602539, "global_step": 3505, "epoch": 28} {"train_loss": -19.355016708374023, "global_step": 3506, "epoch": 28} {"train_loss": -18.913192749023438, "global_step": 3507, "epoch": 28} {"train_loss": -19.05667186768587, "global_step": 3508, "epoch": 28, "val_loss": 3261648.75} {"train_loss": -18.69830894470215, "global_step": 3509, "epoch": 29} {"train_loss": -19.045001983642578, "global_step": 3510, "epoch": 29} {"train_loss": -19.116809844970703, "global_step": 3511, "epoch": 29} {"train_loss": -19.07111358642578, "global_step": 3512, "epoch": 29} {"train_loss": -19.08648681640625, "global_step": 3513, "epoch": 29} {"train_loss": -19.168872833251953, "global_step": 3514, "epoch": 29} {"train_loss": -19.011157989501953, "global_step": 3515, "epoch": 29} {"train_loss": -19.45228385925293, "global_step": 3516, "epoch": 29} {"train_loss": -18.726791381835938, "global_step": 3517, "epoch": 29} {"train_loss": -19.145889282226562, "global_step": 3518, "epoch": 29} {"train_loss": -19.080175399780273, "global_step": 3519, "epoch": 29} {"train_loss": -18.930776596069336, "global_step": 3520, "epoch": 29} {"train_loss": -18.441333770751953, "global_step": 3521, "epoch": 29} {"train_loss": -19.143835067749023, "global_step": 3522, "epoch": 29} {"train_loss": -19.31505012512207, "global_step": 3523, "epoch": 29} {"train_loss": -18.72612953186035, "global_step": 3524, "epoch": 29} {"train_loss": -19.126663208007812, "global_step": 3525, "epoch": 29} {"train_loss": -18.668928146362305, "global_step": 3526, "epoch": 29} {"train_loss": -19.434423446655273, "global_step": 3527, "epoch": 29} {"train_loss": -19.0956974029541, "global_step": 3528, "epoch": 29} {"train_loss": -19.186115264892578, "global_step": 3529, "epoch": 29} {"train_loss": -19.061248779296875, "global_step": 3530, "epoch": 29} {"train_loss": -18.676380157470703, "global_step": 3531, "epoch": 29} {"train_loss": -19.545995712280273, "global_step": 3532, "epoch": 29} {"train_loss": -19.203672409057617, "global_step": 3533, "epoch": 29} {"train_loss": -19.5768985748291, "global_step": 3534, "epoch": 29} {"train_loss": -18.70142936706543, "global_step": 3535, "epoch": 29} {"train_loss": -19.319477081298828, "global_step": 3536, "epoch": 29} {"train_loss": -19.250478744506836, "global_step": 3537, "epoch": 29} {"train_loss": -19.14350700378418, "global_step": 3538, "epoch": 29} {"train_loss": -19.22462272644043, "global_step": 3539, "epoch": 29} {"train_loss": -19.655000686645508, "global_step": 3540, "epoch": 29} {"train_loss": -18.623910903930664, "global_step": 3541, "epoch": 29} {"train_loss": -19.589099884033203, "global_step": 3542, "epoch": 29} {"train_loss": -19.363449096679688, "global_step": 3543, "epoch": 29} {"train_loss": -19.678762435913086, "global_step": 3544, "epoch": 29} {"train_loss": -19.076215744018555, "global_step": 3545, "epoch": 29} {"train_loss": -19.430505752563477, "global_step": 3546, "epoch": 29} {"train_loss": -18.56722640991211, "global_step": 3547, "epoch": 29} {"train_loss": -19.60609245300293, "global_step": 3548, "epoch": 29} {"train_loss": -19.34943389892578, "global_step": 3549, "epoch": 29} {"train_loss": -19.325483322143555, "global_step": 3550, "epoch": 29} {"train_loss": -18.953004837036133, "global_step": 3551, "epoch": 29} {"train_loss": -19.351953506469727, "global_step": 3552, "epoch": 29} {"train_loss": -18.924196243286133, "global_step": 3553, "epoch": 29} {"train_loss": -19.179311752319336, "global_step": 3554, "epoch": 29} {"train_loss": -19.32844352722168, "global_step": 3555, "epoch": 29} {"train_loss": -19.065723419189453, "global_step": 3556, "epoch": 29} {"train_loss": -19.341693878173828, "global_step": 3557, "epoch": 29} {"train_loss": -19.361391067504883, "global_step": 3558, "epoch": 29} {"train_loss": -19.50522232055664, "global_step": 3559, "epoch": 29} {"train_loss": -18.806276321411133, "global_step": 3560, "epoch": 29} {"train_loss": -18.880430221557617, "global_step": 3561, "epoch": 29} {"train_loss": -18.9571590423584, "global_step": 3562, "epoch": 29} {"train_loss": -19.220232009887695, "global_step": 3563, "epoch": 29} {"train_loss": -18.952850341796875, "global_step": 3564, "epoch": 29} {"train_loss": -18.4310359954834, "global_step": 3565, "epoch": 29} {"train_loss": -19.42986488342285, "global_step": 3566, "epoch": 29} {"train_loss": -19.3660945892334, "global_step": 3567, "epoch": 29} {"train_loss": -19.961240768432617, "global_step": 3568, "epoch": 29} {"train_loss": -19.24176597595215, "global_step": 3569, "epoch": 29} {"train_loss": -19.622108459472656, "global_step": 3570, "epoch": 29} {"train_loss": -19.491994857788086, "global_step": 3571, "epoch": 29} {"train_loss": -19.680755615234375, "global_step": 3572, "epoch": 29} {"train_loss": -19.290124893188477, "global_step": 3573, "epoch": 29} {"train_loss": -19.914180755615234, "global_step": 3574, "epoch": 29} {"train_loss": -19.131174087524414, "global_step": 3575, "epoch": 29} {"train_loss": -19.82565689086914, "global_step": 3576, "epoch": 29} {"train_loss": -19.822540283203125, "global_step": 3577, "epoch": 29} {"train_loss": -19.640810012817383, "global_step": 3578, "epoch": 29} {"train_loss": -19.418413162231445, "global_step": 3579, "epoch": 29} {"train_loss": -19.161069869995117, "global_step": 3580, "epoch": 29} {"train_loss": -19.356840133666992, "global_step": 3581, "epoch": 29} {"train_loss": -19.292238235473633, "global_step": 3582, "epoch": 29} {"train_loss": -19.27869415283203, "global_step": 3583, "epoch": 29} {"train_loss": -19.3017520904541, "global_step": 3584, "epoch": 29} {"train_loss": -20.25070571899414, "global_step": 3585, "epoch": 29} {"train_loss": -18.78687286376953, "global_step": 3586, "epoch": 29} {"train_loss": -19.436969757080078, "global_step": 3587, "epoch": 29} {"train_loss": -19.459684371948242, "global_step": 3588, "epoch": 29} {"train_loss": -19.58771324157715, "global_step": 3589, "epoch": 29} {"train_loss": -18.693851470947266, "global_step": 3590, "epoch": 29} {"train_loss": -19.839519500732422, "global_step": 3591, "epoch": 29} {"train_loss": -19.323810577392578, "global_step": 3592, "epoch": 29} {"train_loss": -19.33868408203125, "global_step": 3593, "epoch": 29} {"train_loss": -19.425947189331055, "global_step": 3594, "epoch": 29} {"train_loss": -19.759368896484375, "global_step": 3595, "epoch": 29} {"train_loss": -19.627214431762695, "global_step": 3596, "epoch": 29} {"train_loss": -19.675865173339844, "global_step": 3597, "epoch": 29} {"train_loss": -19.488910675048828, "global_step": 3598, "epoch": 29} {"train_loss": -19.07206916809082, "global_step": 3599, "epoch": 29} {"train_loss": -19.59921646118164, "global_step": 3600, "epoch": 29} {"train_loss": -19.655858993530273, "global_step": 3601, "epoch": 29} {"train_loss": -18.41001319885254, "global_step": 3602, "epoch": 29} {"train_loss": -17.319538116455078, "global_step": 3603, "epoch": 29} {"train_loss": -19.288501739501953, "global_step": 3604, "epoch": 29} {"train_loss": -18.00954246520996, "global_step": 3605, "epoch": 29} {"train_loss": -19.49068832397461, "global_step": 3606, "epoch": 29} {"train_loss": -18.65004539489746, "global_step": 3607, "epoch": 29} {"train_loss": -18.861352920532227, "global_step": 3608, "epoch": 29} {"train_loss": -19.626691818237305, "global_step": 3609, "epoch": 29} {"train_loss": -18.48795509338379, "global_step": 3610, "epoch": 29} {"train_loss": -19.292865753173828, "global_step": 3611, "epoch": 29} {"train_loss": -19.3135986328125, "global_step": 3612, "epoch": 29} {"train_loss": -19.15838050842285, "global_step": 3613, "epoch": 29} {"train_loss": -19.222627639770508, "global_step": 3614, "epoch": 29} {"train_loss": -19.447654724121094, "global_step": 3615, "epoch": 29} {"train_loss": -18.938526153564453, "global_step": 3616, "epoch": 29} {"train_loss": -18.880264282226562, "global_step": 3617, "epoch": 29} {"train_loss": -19.57991600036621, "global_step": 3618, "epoch": 29} {"train_loss": -19.239652633666992, "global_step": 3619, "epoch": 29} {"train_loss": -18.879684448242188, "global_step": 3620, "epoch": 29} {"train_loss": -19.45768165588379, "global_step": 3621, "epoch": 29} {"train_loss": -19.603296279907227, "global_step": 3622, "epoch": 29} {"train_loss": -19.398902893066406, "global_step": 3623, "epoch": 29} {"train_loss": -19.26372718811035, "global_step": 3624, "epoch": 29} {"train_loss": -19.789417266845703, "global_step": 3625, "epoch": 29} {"train_loss": -19.092527389526367, "global_step": 3626, "epoch": 29} {"train_loss": -19.291433334350586, "global_step": 3627, "epoch": 29} {"train_loss": -19.010135650634766, "global_step": 3628, "epoch": 29} {"train_loss": -19.210533205142692, "global_step": 3629, "epoch": 29, "val_loss": 2894912.0} {"train_loss": -18.47170066833496, "global_step": 3630, "epoch": 30} {"train_loss": -19.43564796447754, "global_step": 3631, "epoch": 30} {"train_loss": -19.321691513061523, "global_step": 3632, "epoch": 30} {"train_loss": -19.073143005371094, "global_step": 3633, "epoch": 30} {"train_loss": -18.7138671875, "global_step": 3634, "epoch": 30} {"train_loss": -19.45701026916504, "global_step": 3635, "epoch": 30} {"train_loss": -18.939870834350586, "global_step": 3636, "epoch": 30} {"train_loss": -19.189725875854492, "global_step": 3637, "epoch": 30} {"train_loss": -18.867734909057617, "global_step": 3638, "epoch": 30} {"train_loss": -19.346548080444336, "global_step": 3639, "epoch": 30} {"train_loss": -18.836578369140625, "global_step": 3640, "epoch": 30} {"train_loss": -20.01399803161621, "global_step": 3641, "epoch": 30} {"train_loss": -19.20319938659668, "global_step": 3642, "epoch": 30} {"train_loss": -19.514450073242188, "global_step": 3643, "epoch": 30} {"train_loss": -19.21898651123047, "global_step": 3644, "epoch": 30} {"train_loss": -19.745220184326172, "global_step": 3645, "epoch": 30} {"train_loss": -19.526473999023438, "global_step": 3646, "epoch": 30} {"train_loss": -19.076475143432617, "global_step": 3647, "epoch": 30} {"train_loss": -19.697099685668945, "global_step": 3648, "epoch": 30} {"train_loss": -19.42706871032715, "global_step": 3649, "epoch": 30} {"train_loss": -19.167665481567383, "global_step": 3650, "epoch": 30} {"train_loss": -19.310697555541992, "global_step": 3651, "epoch": 30} {"train_loss": -19.73170280456543, "global_step": 3652, "epoch": 30} {"train_loss": -19.331212997436523, "global_step": 3653, "epoch": 30} {"train_loss": -19.961700439453125, "global_step": 3654, "epoch": 30} {"train_loss": -19.704885482788086, "global_step": 3655, "epoch": 30} {"train_loss": -19.71877670288086, "global_step": 3656, "epoch": 30} {"train_loss": -19.444669723510742, "global_step": 3657, "epoch": 30} {"train_loss": -18.976041793823242, "global_step": 3658, "epoch": 30} {"train_loss": -19.90313148498535, "global_step": 3659, "epoch": 30} {"train_loss": -19.233539581298828, "global_step": 3660, "epoch": 30} {"train_loss": -18.841978073120117, "global_step": 3661, "epoch": 30} {"train_loss": -20.033309936523438, "global_step": 3662, "epoch": 30} {"train_loss": -18.849597930908203, "global_step": 3663, "epoch": 30} {"train_loss": -19.809438705444336, "global_step": 3664, "epoch": 30} {"train_loss": -19.19269371032715, "global_step": 3665, "epoch": 30} {"train_loss": -19.84021759033203, "global_step": 3666, "epoch": 30} {"train_loss": -18.391794204711914, "global_step": 3667, "epoch": 30} {"train_loss": -18.621959686279297, "global_step": 3668, "epoch": 30} {"train_loss": -19.059459686279297, "global_step": 3669, "epoch": 30} {"train_loss": -19.675113677978516, "global_step": 3670, "epoch": 30} {"train_loss": -18.852296829223633, "global_step": 3671, "epoch": 30} {"train_loss": -18.570398330688477, "global_step": 3672, "epoch": 30} {"train_loss": -19.353116989135742, "global_step": 3673, "epoch": 30} {"train_loss": -19.439733505249023, "global_step": 3674, "epoch": 30} {"train_loss": -19.394683837890625, "global_step": 3675, "epoch": 30} {"train_loss": -19.509801864624023, "global_step": 3676, "epoch": 30} {"train_loss": -18.955167770385742, "global_step": 3677, "epoch": 30} {"train_loss": -19.449939727783203, "global_step": 3678, "epoch": 30} {"train_loss": -19.26856803894043, "global_step": 3679, "epoch": 30} {"train_loss": -19.719818115234375, "global_step": 3680, "epoch": 30} {"train_loss": -19.444746017456055, "global_step": 3681, "epoch": 30} {"train_loss": -19.101037979125977, "global_step": 3682, "epoch": 30} {"train_loss": -19.368423461914062, "global_step": 3683, "epoch": 30} {"train_loss": -19.16860008239746, "global_step": 3684, "epoch": 30} {"train_loss": -19.480531692504883, "global_step": 3685, "epoch": 30} {"train_loss": -19.446149826049805, "global_step": 3686, "epoch": 30} {"train_loss": -19.595544815063477, "global_step": 3687, "epoch": 30} {"train_loss": -19.77100372314453, "global_step": 3688, "epoch": 30} {"train_loss": -19.492481231689453, "global_step": 3689, "epoch": 30} {"train_loss": -19.480924606323242, "global_step": 3690, "epoch": 30} {"train_loss": -19.54311180114746, "global_step": 3691, "epoch": 30} {"train_loss": -19.557098388671875, "global_step": 3692, "epoch": 30} {"train_loss": -19.501760482788086, "global_step": 3693, "epoch": 30} {"train_loss": -19.227827072143555, "global_step": 3694, "epoch": 30} {"train_loss": -19.19137954711914, "global_step": 3695, "epoch": 30} {"train_loss": -18.132251739501953, "global_step": 3696, "epoch": 30} {"train_loss": -19.45660400390625, "global_step": 3697, "epoch": 30} {"train_loss": -19.41231346130371, "global_step": 3698, "epoch": 30} {"train_loss": -19.27899742126465, "global_step": 3699, "epoch": 30} {"train_loss": -19.904434204101562, "global_step": 3700, "epoch": 30} {"train_loss": -19.85154914855957, "global_step": 3701, "epoch": 30} {"train_loss": -19.47500991821289, "global_step": 3702, "epoch": 30} {"train_loss": -19.717695236206055, "global_step": 3703, "epoch": 30} {"train_loss": -19.647092819213867, "global_step": 3704, "epoch": 30} {"train_loss": -19.421245574951172, "global_step": 3705, "epoch": 30} {"train_loss": -19.555795669555664, "global_step": 3706, "epoch": 30} {"train_loss": -19.331525802612305, "global_step": 3707, "epoch": 30} {"train_loss": -19.6199951171875, "global_step": 3708, "epoch": 30} {"train_loss": -19.5372314453125, "global_step": 3709, "epoch": 30} {"train_loss": -19.269399642944336, "global_step": 3710, "epoch": 30} {"train_loss": -19.839109420776367, "global_step": 3711, "epoch": 30} {"train_loss": -19.353322982788086, "global_step": 3712, "epoch": 30} {"train_loss": -18.921247482299805, "global_step": 3713, "epoch": 30} {"train_loss": -17.01649284362793, "global_step": 3714, "epoch": 30} {"train_loss": -19.344125747680664, "global_step": 3715, "epoch": 30} {"train_loss": -19.325496673583984, "global_step": 3716, "epoch": 30} {"train_loss": -19.501415252685547, "global_step": 3717, "epoch": 30} {"train_loss": -19.25705909729004, "global_step": 3718, "epoch": 30} {"train_loss": -19.7432861328125, "global_step": 3719, "epoch": 30} {"train_loss": -18.929428100585938, "global_step": 3720, "epoch": 30} {"train_loss": -19.718847274780273, "global_step": 3721, "epoch": 30} {"train_loss": -18.714797973632812, "global_step": 3722, "epoch": 30} {"train_loss": -18.342029571533203, "global_step": 3723, "epoch": 30} {"train_loss": -19.173532485961914, "global_step": 3724, "epoch": 30} {"train_loss": -19.250417709350586, "global_step": 3725, "epoch": 30} {"train_loss": -19.565814971923828, "global_step": 3726, "epoch": 30} {"train_loss": -19.326322555541992, "global_step": 3727, "epoch": 30} {"train_loss": -19.71982765197754, "global_step": 3728, "epoch": 30} {"train_loss": -19.323780059814453, "global_step": 3729, "epoch": 30} {"train_loss": -19.658740997314453, "global_step": 3730, "epoch": 30} {"train_loss": -19.22587776184082, "global_step": 3731, "epoch": 30} {"train_loss": -19.867380142211914, "global_step": 3732, "epoch": 30} {"train_loss": -19.273054122924805, "global_step": 3733, "epoch": 30} {"train_loss": -19.210840225219727, "global_step": 3734, "epoch": 30} {"train_loss": -19.6119327545166, "global_step": 3735, "epoch": 30} {"train_loss": -19.17002296447754, "global_step": 3736, "epoch": 30} {"train_loss": -19.920425415039062, "global_step": 3737, "epoch": 30} {"train_loss": -19.43055534362793, "global_step": 3738, "epoch": 30} {"train_loss": -19.796716690063477, "global_step": 3739, "epoch": 30} {"train_loss": -19.760149002075195, "global_step": 3740, "epoch": 30} {"train_loss": -19.545461654663086, "global_step": 3741, "epoch": 30} {"train_loss": -19.879436492919922, "global_step": 3742, "epoch": 30} {"train_loss": -19.37410545349121, "global_step": 3743, "epoch": 30} {"train_loss": -19.88649559020996, "global_step": 3744, "epoch": 30} {"train_loss": -19.575374603271484, "global_step": 3745, "epoch": 30} {"train_loss": -20.04495620727539, "global_step": 3746, "epoch": 30} {"train_loss": -18.33833122253418, "global_step": 3747, "epoch": 30} {"train_loss": -17.006288528442383, "global_step": 3748, "epoch": 30} {"train_loss": -17.978832244873047, "global_step": 3749, "epoch": 30} {"train_loss": -19.319863374568214, "global_step": 3750, "epoch": 30, "val_loss": 2792552.0} {"train_loss": -18.54396629333496, "global_step": 3751, "epoch": 31} {"train_loss": -18.414615631103516, "global_step": 3752, "epoch": 31} {"train_loss": -19.650033950805664, "global_step": 3753, "epoch": 31} {"train_loss": -19.123525619506836, "global_step": 3754, "epoch": 31} {"train_loss": -18.666486740112305, "global_step": 3755, "epoch": 31} {"train_loss": -19.34877586364746, "global_step": 3756, "epoch": 31} {"train_loss": -19.234317779541016, "global_step": 3757, "epoch": 31} {"train_loss": -19.42665672302246, "global_step": 3758, "epoch": 31} {"train_loss": -18.948734283447266, "global_step": 3759, "epoch": 31} {"train_loss": -18.196746826171875, "global_step": 3760, "epoch": 31} {"train_loss": -18.783655166625977, "global_step": 3761, "epoch": 31} {"train_loss": -18.76776695251465, "global_step": 3762, "epoch": 31} {"train_loss": -19.163122177124023, "global_step": 3763, "epoch": 31} {"train_loss": -18.465839385986328, "global_step": 3764, "epoch": 31} {"train_loss": -19.15093231201172, "global_step": 3765, "epoch": 31} {"train_loss": -17.70229148864746, "global_step": 3766, "epoch": 31} {"train_loss": -18.979326248168945, "global_step": 3767, "epoch": 31} {"train_loss": -18.854902267456055, "global_step": 3768, "epoch": 31} {"train_loss": -18.938682556152344, "global_step": 3769, "epoch": 31} {"train_loss": -18.872812271118164, "global_step": 3770, "epoch": 31} {"train_loss": -19.27613639831543, "global_step": 3771, "epoch": 31} {"train_loss": -19.079496383666992, "global_step": 3772, "epoch": 31} {"train_loss": -18.948270797729492, "global_step": 3773, "epoch": 31} {"train_loss": -19.639270782470703, "global_step": 3774, "epoch": 31} {"train_loss": -19.103870391845703, "global_step": 3775, "epoch": 31} {"train_loss": -19.092519760131836, "global_step": 3776, "epoch": 31} {"train_loss": -19.40433120727539, "global_step": 3777, "epoch": 31} {"train_loss": -19.141584396362305, "global_step": 3778, "epoch": 31} {"train_loss": -19.313369750976562, "global_step": 3779, "epoch": 31} {"train_loss": -19.949338912963867, "global_step": 3780, "epoch": 31} {"train_loss": -18.900535583496094, "global_step": 3781, "epoch": 31} {"train_loss": -19.8437442779541, "global_step": 3782, "epoch": 31} {"train_loss": -19.674240112304688, "global_step": 3783, "epoch": 31} {"train_loss": -19.579864501953125, "global_step": 3784, "epoch": 31} {"train_loss": -19.410594940185547, "global_step": 3785, "epoch": 31} {"train_loss": -19.68247413635254, "global_step": 3786, "epoch": 31} {"train_loss": -19.759958267211914, "global_step": 3787, "epoch": 31} {"train_loss": -19.732952117919922, "global_step": 3788, "epoch": 31} {"train_loss": -19.0999813079834, "global_step": 3789, "epoch": 31} {"train_loss": -19.317317962646484, "global_step": 3790, "epoch": 31} {"train_loss": -18.639801025390625, "global_step": 3791, "epoch": 31} {"train_loss": -17.40597915649414, "global_step": 3792, "epoch": 31} {"train_loss": -18.242761611938477, "global_step": 3793, "epoch": 31} {"train_loss": -19.61150550842285, "global_step": 3794, "epoch": 31} {"train_loss": -19.162960052490234, "global_step": 3795, "epoch": 31} {"train_loss": -19.417911529541016, "global_step": 3796, "epoch": 31} {"train_loss": -19.2188663482666, "global_step": 3797, "epoch": 31} {"train_loss": -19.584293365478516, "global_step": 3798, "epoch": 31} {"train_loss": -19.5064697265625, "global_step": 3799, "epoch": 31} {"train_loss": -19.687911987304688, "global_step": 3800, "epoch": 31} {"train_loss": -19.819360733032227, "global_step": 3801, "epoch": 31} {"train_loss": -19.39078712463379, "global_step": 3802, "epoch": 31} {"train_loss": -19.1170711517334, "global_step": 3803, "epoch": 31} {"train_loss": -18.936237335205078, "global_step": 3804, "epoch": 31} {"train_loss": -19.86209487915039, "global_step": 3805, "epoch": 31} {"train_loss": -18.779144287109375, "global_step": 3806, "epoch": 31} {"train_loss": -18.550058364868164, "global_step": 3807, "epoch": 31} {"train_loss": -19.678955078125, "global_step": 3808, "epoch": 31} {"train_loss": -19.734615325927734, "global_step": 3809, "epoch": 31} {"train_loss": -19.4080867767334, "global_step": 3810, "epoch": 31} {"train_loss": -19.557519912719727, "global_step": 3811, "epoch": 31} {"train_loss": -18.969913482666016, "global_step": 3812, "epoch": 31} {"train_loss": -19.701997756958008, "global_step": 3813, "epoch": 31} {"train_loss": -19.6031494140625, "global_step": 3814, "epoch": 31} {"train_loss": -19.2242488861084, "global_step": 3815, "epoch": 31} {"train_loss": -19.995023727416992, "global_step": 3816, "epoch": 31} {"train_loss": -18.93251609802246, "global_step": 3817, "epoch": 31} {"train_loss": -19.499719619750977, "global_step": 3818, "epoch": 31} {"train_loss": -19.667957305908203, "global_step": 3819, "epoch": 31} {"train_loss": -19.68326759338379, "global_step": 3820, "epoch": 31} {"train_loss": -18.989532470703125, "global_step": 3821, "epoch": 31} {"train_loss": -19.635452270507812, "global_step": 3822, "epoch": 31} {"train_loss": -19.93210792541504, "global_step": 3823, "epoch": 31} {"train_loss": -19.90363883972168, "global_step": 3824, "epoch": 31} {"train_loss": -18.875507354736328, "global_step": 3825, "epoch": 31} {"train_loss": -19.658430099487305, "global_step": 3826, "epoch": 31} {"train_loss": -19.6445255279541, "global_step": 3827, "epoch": 31} {"train_loss": -19.286916732788086, "global_step": 3828, "epoch": 31} {"train_loss": -19.114988327026367, "global_step": 3829, "epoch": 31} {"train_loss": -18.46833038330078, "global_step": 3830, "epoch": 31} {"train_loss": -17.136953353881836, "global_step": 3831, "epoch": 31} {"train_loss": -18.6411190032959, "global_step": 3832, "epoch": 31} {"train_loss": -19.88553810119629, "global_step": 3833, "epoch": 31} {"train_loss": -19.29758071899414, "global_step": 3834, "epoch": 31} {"train_loss": -19.393484115600586, "global_step": 3835, "epoch": 31} {"train_loss": -19.558908462524414, "global_step": 3836, "epoch": 31} {"train_loss": -18.812515258789062, "global_step": 3837, "epoch": 31} {"train_loss": -19.736846923828125, "global_step": 3838, "epoch": 31} {"train_loss": -18.834609985351562, "global_step": 3839, "epoch": 31} {"train_loss": -19.588348388671875, "global_step": 3840, "epoch": 31} {"train_loss": -19.378028869628906, "global_step": 3841, "epoch": 31} {"train_loss": -18.948801040649414, "global_step": 3842, "epoch": 31} {"train_loss": -19.503992080688477, "global_step": 3843, "epoch": 31} {"train_loss": -19.073535919189453, "global_step": 3844, "epoch": 31} {"train_loss": -19.532377243041992, "global_step": 3845, "epoch": 31} {"train_loss": -18.497678756713867, "global_step": 3846, "epoch": 31} {"train_loss": -19.769079208374023, "global_step": 3847, "epoch": 31} {"train_loss": -18.350950241088867, "global_step": 3848, "epoch": 31} {"train_loss": -19.542224884033203, "global_step": 3849, "epoch": 31} {"train_loss": -18.215627670288086, "global_step": 3850, "epoch": 31} {"train_loss": -20.024351119995117, "global_step": 3851, "epoch": 31} {"train_loss": -19.37511444091797, "global_step": 3852, "epoch": 31} {"train_loss": -19.584871292114258, "global_step": 3853, "epoch": 31} {"train_loss": -18.936555862426758, "global_step": 3854, "epoch": 31} {"train_loss": -19.15860939025879, "global_step": 3855, "epoch": 31} {"train_loss": -19.503616333007812, "global_step": 3856, "epoch": 31} {"train_loss": -19.46856117248535, "global_step": 3857, "epoch": 31} {"train_loss": -19.807830810546875, "global_step": 3858, "epoch": 31} {"train_loss": -20.13431739807129, "global_step": 3859, "epoch": 31} {"train_loss": -19.620452880859375, "global_step": 3860, "epoch": 31} {"train_loss": -19.524620056152344, "global_step": 3861, "epoch": 31} {"train_loss": -19.595523834228516, "global_step": 3862, "epoch": 31} {"train_loss": -19.226118087768555, "global_step": 3863, "epoch": 31} {"train_loss": -19.945968627929688, "global_step": 3864, "epoch": 31} {"train_loss": -19.462499618530273, "global_step": 3865, "epoch": 31} {"train_loss": -18.314498901367188, "global_step": 3866, "epoch": 31} {"train_loss": -19.478166580200195, "global_step": 3867, "epoch": 31} {"train_loss": -19.687589645385742, "global_step": 3868, "epoch": 31} {"train_loss": -19.401567459106445, "global_step": 3869, "epoch": 31} {"train_loss": -20.0568790435791, "global_step": 3870, "epoch": 31} {"train_loss": -19.247879895296965, "global_step": 3871, "epoch": 31, "val_loss": 2720821.0} {"train_loss": -19.846317291259766, "global_step": 3872, "epoch": 32} {"train_loss": -19.866872787475586, "global_step": 3873, "epoch": 32} {"train_loss": -19.570898056030273, "global_step": 3874, "epoch": 32} {"train_loss": -20.08837890625, "global_step": 3875, "epoch": 32} {"train_loss": -20.410057067871094, "global_step": 3876, "epoch": 32} {"train_loss": -20.433979034423828, "global_step": 3877, "epoch": 32} {"train_loss": -19.624670028686523, "global_step": 3878, "epoch": 32} {"train_loss": -19.8316593170166, "global_step": 3879, "epoch": 32} {"train_loss": -19.189727783203125, "global_step": 3880, "epoch": 32} {"train_loss": -18.77570915222168, "global_step": 3881, "epoch": 32} {"train_loss": -18.207895278930664, "global_step": 3882, "epoch": 32} {"train_loss": -18.851110458374023, "global_step": 3883, "epoch": 32} {"train_loss": -19.65254020690918, "global_step": 3884, "epoch": 32} {"train_loss": -19.732189178466797, "global_step": 3885, "epoch": 32} {"train_loss": -19.4061279296875, "global_step": 3886, "epoch": 32} {"train_loss": -19.64210319519043, "global_step": 3887, "epoch": 32} {"train_loss": -19.52019691467285, "global_step": 3888, "epoch": 32} {"train_loss": -19.137304306030273, "global_step": 3889, "epoch": 32} {"train_loss": -19.618040084838867, "global_step": 3890, "epoch": 32} {"train_loss": -18.55150032043457, "global_step": 3891, "epoch": 32} {"train_loss": -19.434463500976562, "global_step": 3892, "epoch": 32} {"train_loss": -19.125967025756836, "global_step": 3893, "epoch": 32} {"train_loss": -18.860586166381836, "global_step": 3894, "epoch": 32} {"train_loss": -18.881811141967773, "global_step": 3895, "epoch": 32} {"train_loss": -19.43214225769043, "global_step": 3896, "epoch": 32} {"train_loss": -19.194997787475586, "global_step": 3897, "epoch": 32} {"train_loss": -19.162967681884766, "global_step": 3898, "epoch": 32} {"train_loss": -18.959224700927734, "global_step": 3899, "epoch": 32} {"train_loss": -18.796680450439453, "global_step": 3900, "epoch": 32} {"train_loss": -19.228958129882812, "global_step": 3901, "epoch": 32} {"train_loss": -18.557432174682617, "global_step": 3902, "epoch": 32} {"train_loss": -19.73248291015625, "global_step": 3903, "epoch": 32} {"train_loss": -19.080656051635742, "global_step": 3904, "epoch": 32} {"train_loss": -18.725189208984375, "global_step": 3905, "epoch": 32} {"train_loss": -19.5341796875, "global_step": 3906, "epoch": 32} {"train_loss": -19.41096305847168, "global_step": 3907, "epoch": 32} {"train_loss": -18.393878936767578, "global_step": 3908, "epoch": 32} {"train_loss": -19.727340698242188, "global_step": 3909, "epoch": 32} {"train_loss": -18.79221534729004, "global_step": 3910, "epoch": 32} {"train_loss": -19.222991943359375, "global_step": 3911, "epoch": 32} {"train_loss": -18.63710594177246, "global_step": 3912, "epoch": 32} {"train_loss": -19.937772750854492, "global_step": 3913, "epoch": 32} {"train_loss": -19.13929557800293, "global_step": 3914, "epoch": 32} {"train_loss": -20.015790939331055, "global_step": 3915, "epoch": 32} {"train_loss": -18.980270385742188, "global_step": 3916, "epoch": 32} {"train_loss": -19.814559936523438, "global_step": 3917, "epoch": 32} {"train_loss": -19.732925415039062, "global_step": 3918, "epoch": 32} {"train_loss": -19.525911331176758, "global_step": 3919, "epoch": 32} {"train_loss": -20.18198013305664, "global_step": 3920, "epoch": 32} {"train_loss": -19.51997947692871, "global_step": 3921, "epoch": 32} {"train_loss": -19.785396575927734, "global_step": 3922, "epoch": 32} {"train_loss": -19.66396141052246, "global_step": 3923, "epoch": 32} {"train_loss": -19.84956169128418, "global_step": 3924, "epoch": 32} {"train_loss": -19.875614166259766, "global_step": 3925, "epoch": 32} {"train_loss": -19.86720848083496, "global_step": 3926, "epoch": 32} {"train_loss": -20.23847007751465, "global_step": 3927, "epoch": 32} {"train_loss": -19.649856567382812, "global_step": 3928, "epoch": 32} {"train_loss": -19.90850830078125, "global_step": 3929, "epoch": 32} {"train_loss": -19.73971176147461, "global_step": 3930, "epoch": 32} {"train_loss": -19.882299423217773, "global_step": 3931, "epoch": 32} {"train_loss": -19.747745513916016, "global_step": 3932, "epoch": 32} {"train_loss": -19.934722900390625, "global_step": 3933, "epoch": 32} {"train_loss": -19.951475143432617, "global_step": 3934, "epoch": 32} {"train_loss": -19.943580627441406, "global_step": 3935, "epoch": 32} {"train_loss": -20.000802993774414, "global_step": 3936, "epoch": 32} {"train_loss": -18.813913345336914, "global_step": 3937, "epoch": 32} {"train_loss": -19.36447525024414, "global_step": 3938, "epoch": 32} {"train_loss": -19.874746322631836, "global_step": 3939, "epoch": 32} {"train_loss": -19.857168197631836, "global_step": 3940, "epoch": 32} {"train_loss": -19.99647331237793, "global_step": 3941, "epoch": 32} {"train_loss": -19.886465072631836, "global_step": 3942, "epoch": 32} {"train_loss": -20.44285011291504, "global_step": 3943, "epoch": 32} {"train_loss": -19.97936248779297, "global_step": 3944, "epoch": 32} {"train_loss": -19.969440460205078, "global_step": 3945, "epoch": 32} {"train_loss": -19.73842430114746, "global_step": 3946, "epoch": 32} {"train_loss": -19.456031799316406, "global_step": 3947, "epoch": 32} {"train_loss": -19.685815811157227, "global_step": 3948, "epoch": 32} {"train_loss": -19.653703689575195, "global_step": 3949, "epoch": 32} {"train_loss": -18.250988006591797, "global_step": 3950, "epoch": 32} {"train_loss": -19.81005096435547, "global_step": 3951, "epoch": 32} {"train_loss": -18.36838722229004, "global_step": 3952, "epoch": 32} {"train_loss": -19.651037216186523, "global_step": 3953, "epoch": 32} {"train_loss": -19.532316207885742, "global_step": 3954, "epoch": 32} {"train_loss": -18.208189010620117, "global_step": 3955, "epoch": 32} {"train_loss": -19.300519943237305, "global_step": 3956, "epoch": 32} {"train_loss": -19.878952026367188, "global_step": 3957, "epoch": 32} {"train_loss": -19.4802303314209, "global_step": 3958, "epoch": 32} {"train_loss": -19.7753963470459, "global_step": 3959, "epoch": 32} {"train_loss": -19.782957077026367, "global_step": 3960, "epoch": 32} {"train_loss": -19.248807907104492, "global_step": 3961, "epoch": 32} {"train_loss": -19.979890823364258, "global_step": 3962, "epoch": 32} {"train_loss": -19.957929611206055, "global_step": 3963, "epoch": 32} {"train_loss": -19.470714569091797, "global_step": 3964, "epoch": 32} {"train_loss": -19.875934600830078, "global_step": 3965, "epoch": 32} {"train_loss": -19.744630813598633, "global_step": 3966, "epoch": 32} {"train_loss": -19.809328079223633, "global_step": 3967, "epoch": 32} {"train_loss": -19.529664993286133, "global_step": 3968, "epoch": 32} {"train_loss": -19.490692138671875, "global_step": 3969, "epoch": 32} {"train_loss": -20.143911361694336, "global_step": 3970, "epoch": 32} {"train_loss": -19.313425064086914, "global_step": 3971, "epoch": 32} {"train_loss": -19.87739372253418, "global_step": 3972, "epoch": 32} {"train_loss": -19.102827072143555, "global_step": 3973, "epoch": 32} {"train_loss": -19.268115997314453, "global_step": 3974, "epoch": 32} {"train_loss": -19.95498275756836, "global_step": 3975, "epoch": 32} {"train_loss": -19.986013412475586, "global_step": 3976, "epoch": 32} {"train_loss": -19.727632522583008, "global_step": 3977, "epoch": 32} {"train_loss": -19.207122802734375, "global_step": 3978, "epoch": 32} {"train_loss": -19.05788230895996, "global_step": 3979, "epoch": 32} {"train_loss": -19.336545944213867, "global_step": 3980, "epoch": 32} {"train_loss": -18.544248580932617, "global_step": 3981, "epoch": 32} {"train_loss": -15.014264106750488, "global_step": 3982, "epoch": 32} {"train_loss": -19.254409790039062, "global_step": 3983, "epoch": 32} {"train_loss": -18.18644142150879, "global_step": 3984, "epoch": 32} {"train_loss": -19.2844181060791, "global_step": 3985, "epoch": 32} {"train_loss": -18.229053497314453, "global_step": 3986, "epoch": 32} {"train_loss": -19.58038330078125, "global_step": 3987, "epoch": 32} {"train_loss": -18.776012420654297, "global_step": 3988, "epoch": 32} {"train_loss": -19.58489990234375, "global_step": 3989, "epoch": 32} {"train_loss": -19.405115127563477, "global_step": 3990, "epoch": 32} {"train_loss": -19.406259536743164, "global_step": 3991, "epoch": 32} {"train_loss": -19.427800887872365, "global_step": 3992, "epoch": 32, "val_loss": 3190185.0} {"train_loss": -18.412857055664062, "global_step": 3993, "epoch": 33} {"train_loss": -19.5269775390625, "global_step": 3994, "epoch": 33} {"train_loss": -18.889009475708008, "global_step": 3995, "epoch": 33} {"train_loss": -19.347694396972656, "global_step": 3996, "epoch": 33} {"train_loss": -19.399417877197266, "global_step": 3997, "epoch": 33} {"train_loss": -18.738046646118164, "global_step": 3998, "epoch": 33} {"train_loss": -19.685274124145508, "global_step": 3999, "epoch": 33} {"train_loss": -19.089841842651367, "global_step": 4000, "epoch": 33} {"train_loss": -19.036813735961914, "global_step": 4001, "epoch": 33} {"train_loss": -19.825796127319336, "global_step": 4002, "epoch": 33} {"train_loss": -18.959941864013672, "global_step": 4003, "epoch": 33} {"train_loss": -19.494245529174805, "global_step": 4004, "epoch": 33} {"train_loss": -18.873132705688477, "global_step": 4005, "epoch": 33} {"train_loss": -19.85981559753418, "global_step": 4006, "epoch": 33} {"train_loss": -19.496179580688477, "global_step": 4007, "epoch": 33} {"train_loss": -18.85920524597168, "global_step": 4008, "epoch": 33} {"train_loss": -19.350400924682617, "global_step": 4009, "epoch": 33} {"train_loss": -19.386213302612305, "global_step": 4010, "epoch": 33} {"train_loss": -19.510889053344727, "global_step": 4011, "epoch": 33} {"train_loss": -19.436378479003906, "global_step": 4012, "epoch": 33} {"train_loss": -19.386001586914062, "global_step": 4013, "epoch": 33} {"train_loss": -19.99463653564453, "global_step": 4014, "epoch": 33} {"train_loss": -19.581361770629883, "global_step": 4015, "epoch": 33} {"train_loss": -19.741552352905273, "global_step": 4016, "epoch": 33} {"train_loss": -19.2233829498291, "global_step": 4017, "epoch": 33} {"train_loss": -19.75095558166504, "global_step": 4018, "epoch": 33} {"train_loss": -19.74089241027832, "global_step": 4019, "epoch": 33} {"train_loss": -19.94878387451172, "global_step": 4020, "epoch": 33} {"train_loss": -19.978103637695312, "global_step": 4021, "epoch": 33} {"train_loss": -19.585325241088867, "global_step": 4022, "epoch": 33} {"train_loss": -20.0321044921875, "global_step": 4023, "epoch": 33} {"train_loss": -19.877187728881836, "global_step": 4024, "epoch": 33} {"train_loss": -19.485158920288086, "global_step": 4025, "epoch": 33} {"train_loss": -20.001184463500977, "global_step": 4026, "epoch": 33} {"train_loss": -19.51181983947754, "global_step": 4027, "epoch": 33} {"train_loss": -19.600675582885742, "global_step": 4028, "epoch": 33} {"train_loss": -18.75627899169922, "global_step": 4029, "epoch": 33} {"train_loss": -16.830900192260742, "global_step": 4030, "epoch": 33} {"train_loss": -18.81879234313965, "global_step": 4031, "epoch": 33} {"train_loss": -19.614299774169922, "global_step": 4032, "epoch": 33} {"train_loss": -19.365808486938477, "global_step": 4033, "epoch": 33} {"train_loss": -19.737281799316406, "global_step": 4034, "epoch": 33} {"train_loss": -19.38481903076172, "global_step": 4035, "epoch": 33} {"train_loss": -20.01377296447754, "global_step": 4036, "epoch": 33} {"train_loss": -19.508377075195312, "global_step": 4037, "epoch": 33} {"train_loss": -20.184146881103516, "global_step": 4038, "epoch": 33} {"train_loss": -19.406457901000977, "global_step": 4039, "epoch": 33} {"train_loss": -20.499282836914062, "global_step": 4040, "epoch": 33} {"train_loss": -19.689788818359375, "global_step": 4041, "epoch": 33} {"train_loss": -19.83820915222168, "global_step": 4042, "epoch": 33} {"train_loss": -19.649625778198242, "global_step": 4043, "epoch": 33} {"train_loss": -19.511499404907227, "global_step": 4044, "epoch": 33} {"train_loss": -20.26356315612793, "global_step": 4045, "epoch": 33} {"train_loss": -19.703800201416016, "global_step": 4046, "epoch": 33} {"train_loss": -20.47527503967285, "global_step": 4047, "epoch": 33} {"train_loss": -19.377084732055664, "global_step": 4048, "epoch": 33} {"train_loss": -18.160608291625977, "global_step": 4049, "epoch": 33} {"train_loss": -18.378673553466797, "global_step": 4050, "epoch": 33} {"train_loss": -19.404356002807617, "global_step": 4051, "epoch": 33} {"train_loss": -18.775146484375, "global_step": 4052, "epoch": 33} {"train_loss": -19.9581356048584, "global_step": 4053, "epoch": 33} {"train_loss": -19.398378372192383, "global_step": 4054, "epoch": 33} {"train_loss": -19.41896629333496, "global_step": 4055, "epoch": 33} {"train_loss": -19.863216400146484, "global_step": 4056, "epoch": 33} {"train_loss": -20.357463836669922, "global_step": 4057, "epoch": 33} {"train_loss": -18.98242950439453, "global_step": 4058, "epoch": 33} {"train_loss": -18.149980545043945, "global_step": 4059, "epoch": 33} {"train_loss": -19.668415069580078, "global_step": 4060, "epoch": 33} {"train_loss": -19.325305938720703, "global_step": 4061, "epoch": 33} {"train_loss": -20.171812057495117, "global_step": 4062, "epoch": 33} {"train_loss": -19.60630989074707, "global_step": 4063, "epoch": 33} {"train_loss": -19.693870544433594, "global_step": 4064, "epoch": 33} {"train_loss": -19.876264572143555, "global_step": 4065, "epoch": 33} {"train_loss": -19.689687728881836, "global_step": 4066, "epoch": 33} {"train_loss": -19.28760528564453, "global_step": 4067, "epoch": 33} {"train_loss": -19.349863052368164, "global_step": 4068, "epoch": 33} {"train_loss": -19.76141357421875, "global_step": 4069, "epoch": 33} {"train_loss": -19.588130950927734, "global_step": 4070, "epoch": 33} {"train_loss": -19.74136734008789, "global_step": 4071, "epoch": 33} {"train_loss": -19.735580444335938, "global_step": 4072, "epoch": 33} {"train_loss": -19.150100708007812, "global_step": 4073, "epoch": 33} {"train_loss": -19.629352569580078, "global_step": 4074, "epoch": 33} {"train_loss": -19.808866500854492, "global_step": 4075, "epoch": 33} {"train_loss": -19.546178817749023, "global_step": 4076, "epoch": 33} {"train_loss": -19.615325927734375, "global_step": 4077, "epoch": 33} {"train_loss": -19.515443801879883, "global_step": 4078, "epoch": 33} {"train_loss": -19.8349609375, "global_step": 4079, "epoch": 33} {"train_loss": -19.915176391601562, "global_step": 4080, "epoch": 33} {"train_loss": -20.089223861694336, "global_step": 4081, "epoch": 33} {"train_loss": -19.984397888183594, "global_step": 4082, "epoch": 33} {"train_loss": -19.838651657104492, "global_step": 4083, "epoch": 33} {"train_loss": -19.916425704956055, "global_step": 4084, "epoch": 33} {"train_loss": -19.95676040649414, "global_step": 4085, "epoch": 33} {"train_loss": -19.465322494506836, "global_step": 4086, "epoch": 33} {"train_loss": -19.879846572875977, "global_step": 4087, "epoch": 33} {"train_loss": -20.081607818603516, "global_step": 4088, "epoch": 33} {"train_loss": -20.196882247924805, "global_step": 4089, "epoch": 33} {"train_loss": -19.98386001586914, "global_step": 4090, "epoch": 33} {"train_loss": -20.424272537231445, "global_step": 4091, "epoch": 33} {"train_loss": -20.015018463134766, "global_step": 4092, "epoch": 33} {"train_loss": -20.652088165283203, "global_step": 4093, "epoch": 33} {"train_loss": -20.317358016967773, "global_step": 4094, "epoch": 33} {"train_loss": -20.048635482788086, "global_step": 4095, "epoch": 33} {"train_loss": -19.520261764526367, "global_step": 4096, "epoch": 33} {"train_loss": -20.082908630371094, "global_step": 4097, "epoch": 33} {"train_loss": -20.126203536987305, "global_step": 4098, "epoch": 33} {"train_loss": -19.61757469177246, "global_step": 4099, "epoch": 33} {"train_loss": -20.036924362182617, "global_step": 4100, "epoch": 33} {"train_loss": -20.189605712890625, "global_step": 4101, "epoch": 33} {"train_loss": -19.84226417541504, "global_step": 4102, "epoch": 33} {"train_loss": -19.326007843017578, "global_step": 4103, "epoch": 33} {"train_loss": -20.221342086791992, "global_step": 4104, "epoch": 33} {"train_loss": -19.9287166595459, "global_step": 4105, "epoch": 33} {"train_loss": -20.193389892578125, "global_step": 4106, "epoch": 33} {"train_loss": -20.27081871032715, "global_step": 4107, "epoch": 33} {"train_loss": -20.5522403717041, "global_step": 4108, "epoch": 33} {"train_loss": -20.384132385253906, "global_step": 4109, "epoch": 33} {"train_loss": -20.32282829284668, "global_step": 4110, "epoch": 33} {"train_loss": -20.371915817260742, "global_step": 4111, "epoch": 33} {"train_loss": -20.353778839111328, "global_step": 4112, "epoch": 33} {"train_loss": -19.644837434626808, "global_step": 4113, "epoch": 33, "val_loss": 3209420.25} {"train_loss": -19.107465744018555, "global_step": 4114, "epoch": 34} {"train_loss": -18.167573928833008, "global_step": 4115, "epoch": 34} {"train_loss": -20.35664939880371, "global_step": 4116, "epoch": 34} {"train_loss": -18.6579532623291, "global_step": 4117, "epoch": 34} {"train_loss": -19.861452102661133, "global_step": 4118, "epoch": 34} {"train_loss": -19.427555084228516, "global_step": 4119, "epoch": 34} {"train_loss": -18.147167205810547, "global_step": 4120, "epoch": 34} {"train_loss": -19.52521324157715, "global_step": 4121, "epoch": 34} {"train_loss": -19.53189468383789, "global_step": 4122, "epoch": 34} {"train_loss": -18.82499122619629, "global_step": 4123, "epoch": 34} {"train_loss": -20.433643341064453, "global_step": 4124, "epoch": 34} {"train_loss": -19.091188430786133, "global_step": 4125, "epoch": 34} {"train_loss": -19.77022361755371, "global_step": 4126, "epoch": 34} {"train_loss": -19.825149536132812, "global_step": 4127, "epoch": 34} {"train_loss": -19.88283348083496, "global_step": 4128, "epoch": 34} {"train_loss": -20.01069450378418, "global_step": 4129, "epoch": 34} {"train_loss": -19.75901222229004, "global_step": 4130, "epoch": 34} {"train_loss": -19.836729049682617, "global_step": 4131, "epoch": 34} {"train_loss": -19.612333297729492, "global_step": 4132, "epoch": 34} {"train_loss": -20.07322883605957, "global_step": 4133, "epoch": 34} {"train_loss": -19.69349479675293, "global_step": 4134, "epoch": 34} {"train_loss": -20.08647346496582, "global_step": 4135, "epoch": 34} {"train_loss": -19.7751407623291, "global_step": 4136, "epoch": 34} {"train_loss": -20.132680892944336, "global_step": 4137, "epoch": 34} {"train_loss": -20.377790451049805, "global_step": 4138, "epoch": 34} {"train_loss": -19.953632354736328, "global_step": 4139, "epoch": 34} {"train_loss": -20.199111938476562, "global_step": 4140, "epoch": 34} {"train_loss": -20.114316940307617, "global_step": 4141, "epoch": 34} {"train_loss": -20.445241928100586, "global_step": 4142, "epoch": 34} {"train_loss": -20.549291610717773, "global_step": 4143, "epoch": 34} {"train_loss": -20.274641036987305, "global_step": 4144, "epoch": 34} {"train_loss": -20.402437210083008, "global_step": 4145, "epoch": 34} {"train_loss": -20.44736099243164, "global_step": 4146, "epoch": 34} {"train_loss": -20.288053512573242, "global_step": 4147, "epoch": 34} {"train_loss": -20.82069969177246, "global_step": 4148, "epoch": 34} {"train_loss": -20.588884353637695, "global_step": 4149, "epoch": 34} {"train_loss": -20.227201461791992, "global_step": 4150, "epoch": 34} {"train_loss": -20.822851181030273, "global_step": 4151, "epoch": 34} {"train_loss": -20.500106811523438, "global_step": 4152, "epoch": 34} {"train_loss": -19.939302444458008, "global_step": 4153, "epoch": 34} {"train_loss": -20.23390007019043, "global_step": 4154, "epoch": 34} {"train_loss": -19.742685317993164, "global_step": 4155, "epoch": 34} {"train_loss": -17.197099685668945, "global_step": 4156, "epoch": 34} {"train_loss": -14.972787857055664, "global_step": 4157, "epoch": 34} {"train_loss": -19.18276596069336, "global_step": 4158, "epoch": 34} {"train_loss": -14.101694107055664, "global_step": 4159, "epoch": 34} {"train_loss": -18.2032527923584, "global_step": 4160, "epoch": 34} {"train_loss": -16.160932540893555, "global_step": 4161, "epoch": 34} {"train_loss": -19.025217056274414, "global_step": 4162, "epoch": 34} {"train_loss": -18.310657501220703, "global_step": 4163, "epoch": 34} {"train_loss": -18.34940528869629, "global_step": 4164, "epoch": 34} {"train_loss": -18.464160919189453, "global_step": 4165, "epoch": 34} {"train_loss": -18.493453979492188, "global_step": 4166, "epoch": 34} {"train_loss": -18.732881546020508, "global_step": 4167, "epoch": 34} {"train_loss": -18.504980087280273, "global_step": 4168, "epoch": 34} {"train_loss": -18.393117904663086, "global_step": 4169, "epoch": 34} {"train_loss": -18.608793258666992, "global_step": 4170, "epoch": 34} {"train_loss": -18.37386703491211, "global_step": 4171, "epoch": 34} {"train_loss": -18.27345085144043, "global_step": 4172, "epoch": 34} {"train_loss": -19.00282859802246, "global_step": 4173, "epoch": 34} {"train_loss": -18.301727294921875, "global_step": 4174, "epoch": 34} {"train_loss": -18.649423599243164, "global_step": 4175, "epoch": 34} {"train_loss": -18.997583389282227, "global_step": 4176, "epoch": 34} {"train_loss": -18.774539947509766, "global_step": 4177, "epoch": 34} {"train_loss": -18.278644561767578, "global_step": 4178, "epoch": 34} {"train_loss": -18.686574935913086, "global_step": 4179, "epoch": 34} {"train_loss": -18.861597061157227, "global_step": 4180, "epoch": 34} {"train_loss": -18.84625244140625, "global_step": 4181, "epoch": 34} {"train_loss": -19.189924240112305, "global_step": 4182, "epoch": 34} {"train_loss": -19.328445434570312, "global_step": 4183, "epoch": 34} {"train_loss": -19.045461654663086, "global_step": 4184, "epoch": 34} {"train_loss": -19.311330795288086, "global_step": 4185, "epoch": 34} {"train_loss": -19.265024185180664, "global_step": 4186, "epoch": 34} {"train_loss": -19.4637451171875, "global_step": 4187, "epoch": 34} {"train_loss": -19.550622940063477, "global_step": 4188, "epoch": 34} {"train_loss": -19.837268829345703, "global_step": 4189, "epoch": 34} {"train_loss": -19.825239181518555, "global_step": 4190, "epoch": 34} {"train_loss": -19.481229782104492, "global_step": 4191, "epoch": 34} {"train_loss": -19.876243591308594, "global_step": 4192, "epoch": 34} {"train_loss": -19.795732498168945, "global_step": 4193, "epoch": 34} {"train_loss": -20.019521713256836, "global_step": 4194, "epoch": 34} {"train_loss": -20.18562126159668, "global_step": 4195, "epoch": 34} {"train_loss": -20.007732391357422, "global_step": 4196, "epoch": 34} {"train_loss": -19.798053741455078, "global_step": 4197, "epoch": 34} {"train_loss": -20.530675888061523, "global_step": 4198, "epoch": 34} {"train_loss": -19.9554500579834, "global_step": 4199, "epoch": 34} {"train_loss": -20.618831634521484, "global_step": 4200, "epoch": 34} {"train_loss": -19.74118423461914, "global_step": 4201, "epoch": 34} {"train_loss": -19.517202377319336, "global_step": 4202, "epoch": 34} {"train_loss": -18.42477035522461, "global_step": 4203, "epoch": 34} {"train_loss": -18.3853759765625, "global_step": 4204, "epoch": 34} {"train_loss": -20.11028480529785, "global_step": 4205, "epoch": 34} {"train_loss": -19.680679321289062, "global_step": 4206, "epoch": 34} {"train_loss": -18.667343139648438, "global_step": 4207, "epoch": 34} {"train_loss": -20.041542053222656, "global_step": 4208, "epoch": 34} {"train_loss": -19.233991622924805, "global_step": 4209, "epoch": 34} {"train_loss": -19.409055709838867, "global_step": 4210, "epoch": 34} {"train_loss": -19.789976119995117, "global_step": 4211, "epoch": 34} {"train_loss": -19.13829803466797, "global_step": 4212, "epoch": 34} {"train_loss": -19.861719131469727, "global_step": 4213, "epoch": 34} {"train_loss": -19.466527938842773, "global_step": 4214, "epoch": 34} {"train_loss": -19.492982864379883, "global_step": 4215, "epoch": 34} {"train_loss": -19.48174285888672, "global_step": 4216, "epoch": 34} {"train_loss": -19.901968002319336, "global_step": 4217, "epoch": 34} {"train_loss": -19.81339454650879, "global_step": 4218, "epoch": 34} {"train_loss": -19.661130905151367, "global_step": 4219, "epoch": 34} {"train_loss": -18.954814910888672, "global_step": 4220, "epoch": 34} {"train_loss": -19.739439010620117, "global_step": 4221, "epoch": 34} {"train_loss": -19.478178024291992, "global_step": 4222, "epoch": 34} {"train_loss": -20.1812744140625, "global_step": 4223, "epoch": 34} {"train_loss": -19.50295066833496, "global_step": 4224, "epoch": 34} {"train_loss": -19.683202743530273, "global_step": 4225, "epoch": 34} {"train_loss": -20.12042999267578, "global_step": 4226, "epoch": 34} {"train_loss": -19.993606567382812, "global_step": 4227, "epoch": 34} {"train_loss": -20.050321578979492, "global_step": 4228, "epoch": 34} {"train_loss": -20.057897567749023, "global_step": 4229, "epoch": 34} {"train_loss": -20.018817901611328, "global_step": 4230, "epoch": 34} {"train_loss": -19.920337677001953, "global_step": 4231, "epoch": 34} {"train_loss": -20.159345626831055, "global_step": 4232, "epoch": 34} {"train_loss": -20.010778427124023, "global_step": 4233, "epoch": 34} {"train_loss": -19.425027074892657, "global_step": 4234, "epoch": 34, "val_loss": 3767777.25} {"train_loss": -20.241819381713867, "global_step": 4235, "epoch": 35} {"train_loss": -19.98514175415039, "global_step": 4236, "epoch": 35} {"train_loss": -20.00407600402832, "global_step": 4237, "epoch": 35} {"train_loss": -19.876920700073242, "global_step": 4238, "epoch": 35} {"train_loss": -20.732309341430664, "global_step": 4239, "epoch": 35} {"train_loss": -20.31068229675293, "global_step": 4240, "epoch": 35} {"train_loss": -20.566938400268555, "global_step": 4241, "epoch": 35} {"train_loss": -20.021207809448242, "global_step": 4242, "epoch": 35} {"train_loss": -20.70798683166504, "global_step": 4243, "epoch": 35} {"train_loss": -19.94313621520996, "global_step": 4244, "epoch": 35} {"train_loss": -19.868610382080078, "global_step": 4245, "epoch": 35} {"train_loss": -20.66098976135254, "global_step": 4246, "epoch": 35} {"train_loss": -20.663467407226562, "global_step": 4247, "epoch": 35} {"train_loss": -20.94119644165039, "global_step": 4248, "epoch": 35} {"train_loss": -20.55792808532715, "global_step": 4249, "epoch": 35} {"train_loss": -20.68694496154785, "global_step": 4250, "epoch": 35} {"train_loss": -20.140039443969727, "global_step": 4251, "epoch": 35} {"train_loss": -19.840198516845703, "global_step": 4252, "epoch": 35} {"train_loss": -19.900283813476562, "global_step": 4253, "epoch": 35} {"train_loss": -19.48225212097168, "global_step": 4254, "epoch": 35} {"train_loss": -21.036893844604492, "global_step": 4255, "epoch": 35} {"train_loss": -19.743051528930664, "global_step": 4256, "epoch": 35} {"train_loss": -20.670604705810547, "global_step": 4257, "epoch": 35} {"train_loss": -20.098255157470703, "global_step": 4258, "epoch": 35} {"train_loss": -20.38998794555664, "global_step": 4259, "epoch": 35} {"train_loss": -20.733205795288086, "global_step": 4260, "epoch": 35} {"train_loss": -20.30861473083496, "global_step": 4261, "epoch": 35} {"train_loss": -20.551496505737305, "global_step": 4262, "epoch": 35} {"train_loss": -20.455705642700195, "global_step": 4263, "epoch": 35} {"train_loss": -20.527530670166016, "global_step": 4264, "epoch": 35} {"train_loss": -20.696531295776367, "global_step": 4265, "epoch": 35} {"train_loss": -20.520376205444336, "global_step": 4266, "epoch": 35} {"train_loss": -20.28120994567871, "global_step": 4267, "epoch": 35} {"train_loss": -19.64657974243164, "global_step": 4268, "epoch": 35} {"train_loss": -20.52274513244629, "global_step": 4269, "epoch": 35} {"train_loss": -20.349191665649414, "global_step": 4270, "epoch": 35} {"train_loss": -20.09556007385254, "global_step": 4271, "epoch": 35} {"train_loss": -20.419540405273438, "global_step": 4272, "epoch": 35} {"train_loss": -19.556184768676758, "global_step": 4273, "epoch": 35} {"train_loss": -20.251541137695312, "global_step": 4274, "epoch": 35} {"train_loss": -19.737028121948242, "global_step": 4275, "epoch": 35} {"train_loss": -20.61863136291504, "global_step": 4276, "epoch": 35} {"train_loss": -20.13128089904785, "global_step": 4277, "epoch": 35} {"train_loss": -20.563955307006836, "global_step": 4278, "epoch": 35} {"train_loss": -20.013525009155273, "global_step": 4279, "epoch": 35} {"train_loss": -17.719318389892578, "global_step": 4280, "epoch": 35} {"train_loss": -18.689794540405273, "global_step": 4281, "epoch": 35} {"train_loss": -20.22762107849121, "global_step": 4282, "epoch": 35} {"train_loss": -19.393463134765625, "global_step": 4283, "epoch": 35} {"train_loss": -19.725845336914062, "global_step": 4284, "epoch": 35} {"train_loss": -19.222307205200195, "global_step": 4285, "epoch": 35} {"train_loss": -20.13047981262207, "global_step": 4286, "epoch": 35} {"train_loss": -19.418371200561523, "global_step": 4287, "epoch": 35} {"train_loss": -19.6262149810791, "global_step": 4288, "epoch": 35} {"train_loss": -20.405088424682617, "global_step": 4289, "epoch": 35} {"train_loss": -20.42475128173828, "global_step": 4290, "epoch": 35} {"train_loss": -19.947912216186523, "global_step": 4291, "epoch": 35} {"train_loss": -20.084081649780273, "global_step": 4292, "epoch": 35} {"train_loss": -19.920703887939453, "global_step": 4293, "epoch": 35} {"train_loss": -20.6190242767334, "global_step": 4294, "epoch": 35} {"train_loss": -19.851049423217773, "global_step": 4295, "epoch": 35} {"train_loss": -19.834754943847656, "global_step": 4296, "epoch": 35} {"train_loss": -20.19515037536621, "global_step": 4297, "epoch": 35} {"train_loss": -20.65018081665039, "global_step": 4298, "epoch": 35} {"train_loss": -20.27955436706543, "global_step": 4299, "epoch": 35} {"train_loss": -20.484296798706055, "global_step": 4300, "epoch": 35} {"train_loss": -20.434036254882812, "global_step": 4301, "epoch": 35} {"train_loss": -20.220823287963867, "global_step": 4302, "epoch": 35} {"train_loss": -19.9668025970459, "global_step": 4303, "epoch": 35} {"train_loss": -20.305686950683594, "global_step": 4304, "epoch": 35} {"train_loss": -20.715457916259766, "global_step": 4305, "epoch": 35} {"train_loss": -20.463470458984375, "global_step": 4306, "epoch": 35} {"train_loss": -20.843210220336914, "global_step": 4307, "epoch": 35} {"train_loss": -19.519580841064453, "global_step": 4308, "epoch": 35} {"train_loss": -19.86336898803711, "global_step": 4309, "epoch": 35} {"train_loss": -20.22403907775879, "global_step": 4310, "epoch": 35} {"train_loss": -19.836637496948242, "global_step": 4311, "epoch": 35} {"train_loss": -20.339679718017578, "global_step": 4312, "epoch": 35} {"train_loss": -18.696115493774414, "global_step": 4313, "epoch": 35} {"train_loss": -20.04151725769043, "global_step": 4314, "epoch": 35} {"train_loss": -19.424293518066406, "global_step": 4315, "epoch": 35} {"train_loss": -20.48300552368164, "global_step": 4316, "epoch": 35} {"train_loss": -19.3775691986084, "global_step": 4317, "epoch": 35} {"train_loss": -20.372915267944336, "global_step": 4318, "epoch": 35} {"train_loss": -20.279247283935547, "global_step": 4319, "epoch": 35} {"train_loss": -20.526962280273438, "global_step": 4320, "epoch": 35} {"train_loss": -20.545896530151367, "global_step": 4321, "epoch": 35} {"train_loss": -20.32455062866211, "global_step": 4322, "epoch": 35} {"train_loss": -20.61231803894043, "global_step": 4323, "epoch": 35} {"train_loss": -20.052324295043945, "global_step": 4324, "epoch": 35} {"train_loss": -20.06171989440918, "global_step": 4325, "epoch": 35} {"train_loss": -20.43080711364746, "global_step": 4326, "epoch": 35} {"train_loss": -20.49952507019043, "global_step": 4327, "epoch": 35} {"train_loss": -19.951736450195312, "global_step": 4328, "epoch": 35} {"train_loss": -20.871610641479492, "global_step": 4329, "epoch": 35} {"train_loss": -20.340620040893555, "global_step": 4330, "epoch": 35} {"train_loss": -20.064254760742188, "global_step": 4331, "epoch": 35} {"train_loss": -20.117055892944336, "global_step": 4332, "epoch": 35} {"train_loss": -20.664852142333984, "global_step": 4333, "epoch": 35} {"train_loss": -20.647062301635742, "global_step": 4334, "epoch": 35} {"train_loss": -20.52650260925293, "global_step": 4335, "epoch": 35} {"train_loss": -20.68926429748535, "global_step": 4336, "epoch": 35} {"train_loss": -20.407453536987305, "global_step": 4337, "epoch": 35} {"train_loss": -20.34003448486328, "global_step": 4338, "epoch": 35} {"train_loss": -20.35164451599121, "global_step": 4339, "epoch": 35} {"train_loss": -20.627872467041016, "global_step": 4340, "epoch": 35} {"train_loss": -20.147403717041016, "global_step": 4341, "epoch": 35} {"train_loss": -20.729150772094727, "global_step": 4342, "epoch": 35} {"train_loss": -20.613996505737305, "global_step": 4343, "epoch": 35} {"train_loss": -20.118139266967773, "global_step": 4344, "epoch": 35} {"train_loss": -20.103979110717773, "global_step": 4345, "epoch": 35} {"train_loss": -20.49669075012207, "global_step": 4346, "epoch": 35} {"train_loss": -20.191009521484375, "global_step": 4347, "epoch": 35} {"train_loss": -20.23862648010254, "global_step": 4348, "epoch": 35} {"train_loss": -20.309858322143555, "global_step": 4349, "epoch": 35} {"train_loss": -20.446094512939453, "global_step": 4350, "epoch": 35} {"train_loss": -20.13409996032715, "global_step": 4351, "epoch": 35} {"train_loss": -20.68913459777832, "global_step": 4352, "epoch": 35} {"train_loss": -20.39312744140625, "global_step": 4353, "epoch": 35} {"train_loss": -20.35112762451172, "global_step": 4354, "epoch": 35} {"train_loss": -20.212952306447935, "global_step": 4355, "epoch": 35, "val_loss": 3596508.75} {"train_loss": -20.0130615234375, "global_step": 4356, "epoch": 36} {"train_loss": -20.2772159576416, "global_step": 4357, "epoch": 36} {"train_loss": -20.87474250793457, "global_step": 4358, "epoch": 36} {"train_loss": -21.01296043395996, "global_step": 4359, "epoch": 36} {"train_loss": -20.675352096557617, "global_step": 4360, "epoch": 36} {"train_loss": -20.74315643310547, "global_step": 4361, "epoch": 36} {"train_loss": -20.947711944580078, "global_step": 4362, "epoch": 36} {"train_loss": -20.3952579498291, "global_step": 4363, "epoch": 36} {"train_loss": -20.8701171875, "global_step": 4364, "epoch": 36} {"train_loss": -21.295236587524414, "global_step": 4365, "epoch": 36} {"train_loss": -20.73273277282715, "global_step": 4366, "epoch": 36} {"train_loss": -20.896703720092773, "global_step": 4367, "epoch": 36} {"train_loss": -20.600454330444336, "global_step": 4368, "epoch": 36} {"train_loss": -20.69784927368164, "global_step": 4369, "epoch": 36} {"train_loss": -20.311880111694336, "global_step": 4370, "epoch": 36} {"train_loss": -19.81709098815918, "global_step": 4371, "epoch": 36} {"train_loss": -19.113452911376953, "global_step": 4372, "epoch": 36} {"train_loss": -18.599124908447266, "global_step": 4373, "epoch": 36} {"train_loss": -20.443021774291992, "global_step": 4374, "epoch": 36} {"train_loss": -19.43405532836914, "global_step": 4375, "epoch": 36} {"train_loss": -20.14295768737793, "global_step": 4376, "epoch": 36} {"train_loss": -20.24325942993164, "global_step": 4377, "epoch": 36} {"train_loss": -19.75038719177246, "global_step": 4378, "epoch": 36} {"train_loss": -20.563568115234375, "global_step": 4379, "epoch": 36} {"train_loss": -20.57276153564453, "global_step": 4380, "epoch": 36} {"train_loss": -20.610090255737305, "global_step": 4381, "epoch": 36} {"train_loss": -20.214229583740234, "global_step": 4382, "epoch": 36} {"train_loss": -20.422895431518555, "global_step": 4383, "epoch": 36} {"train_loss": -20.12140464782715, "global_step": 4384, "epoch": 36} {"train_loss": -19.905139923095703, "global_step": 4385, "epoch": 36} {"train_loss": -20.259742736816406, "global_step": 4386, "epoch": 36} {"train_loss": -20.15622901916504, "global_step": 4387, "epoch": 36} {"train_loss": -19.317020416259766, "global_step": 4388, "epoch": 36} {"train_loss": -20.107791900634766, "global_step": 4389, "epoch": 36} {"train_loss": -20.177026748657227, "global_step": 4390, "epoch": 36} {"train_loss": -19.8489990234375, "global_step": 4391, "epoch": 36} {"train_loss": -20.351070404052734, "global_step": 4392, "epoch": 36} {"train_loss": -19.255725860595703, "global_step": 4393, "epoch": 36} {"train_loss": -20.688003540039062, "global_step": 4394, "epoch": 36} {"train_loss": -18.557117462158203, "global_step": 4395, "epoch": 36} {"train_loss": -20.091917037963867, "global_step": 4396, "epoch": 36} {"train_loss": -18.517942428588867, "global_step": 4397, "epoch": 36} {"train_loss": -17.345508575439453, "global_step": 4398, "epoch": 36} {"train_loss": -17.295421600341797, "global_step": 4399, "epoch": 36} {"train_loss": -19.02330207824707, "global_step": 4400, "epoch": 36} {"train_loss": -18.104856491088867, "global_step": 4401, "epoch": 36} {"train_loss": -19.870691299438477, "global_step": 4402, "epoch": 36} {"train_loss": -19.196941375732422, "global_step": 4403, "epoch": 36} {"train_loss": -19.49054527282715, "global_step": 4404, "epoch": 36} {"train_loss": -19.54791259765625, "global_step": 4405, "epoch": 36} {"train_loss": -19.007627487182617, "global_step": 4406, "epoch": 36} {"train_loss": -19.567556381225586, "global_step": 4407, "epoch": 36} {"train_loss": -19.735204696655273, "global_step": 4408, "epoch": 36} {"train_loss": -19.629972457885742, "global_step": 4409, "epoch": 36} {"train_loss": -19.46171760559082, "global_step": 4410, "epoch": 36} {"train_loss": -19.622207641601562, "global_step": 4411, "epoch": 36} {"train_loss": -19.657634735107422, "global_step": 4412, "epoch": 36} {"train_loss": -19.966630935668945, "global_step": 4413, "epoch": 36} {"train_loss": -19.709739685058594, "global_step": 4414, "epoch": 36} {"train_loss": -19.875234603881836, "global_step": 4415, "epoch": 36} {"train_loss": -19.906740188598633, "global_step": 4416, "epoch": 36} {"train_loss": -19.795791625976562, "global_step": 4417, "epoch": 36} {"train_loss": -20.46335792541504, "global_step": 4418, "epoch": 36} {"train_loss": -19.985048294067383, "global_step": 4419, "epoch": 36} {"train_loss": -19.402833938598633, "global_step": 4420, "epoch": 36} {"train_loss": -19.224889755249023, "global_step": 4421, "epoch": 36} {"train_loss": -19.758018493652344, "global_step": 4422, "epoch": 36} {"train_loss": -19.7392578125, "global_step": 4423, "epoch": 36} {"train_loss": -19.823022842407227, "global_step": 4424, "epoch": 36} {"train_loss": -19.572189331054688, "global_step": 4425, "epoch": 36} {"train_loss": -19.626407623291016, "global_step": 4426, "epoch": 36} {"train_loss": -19.58582878112793, "global_step": 4427, "epoch": 36} {"train_loss": -19.70071792602539, "global_step": 4428, "epoch": 36} {"train_loss": -19.928722381591797, "global_step": 4429, "epoch": 36} {"train_loss": -20.086811065673828, "global_step": 4430, "epoch": 36} {"train_loss": -19.909948348999023, "global_step": 4431, "epoch": 36} {"train_loss": -20.234922409057617, "global_step": 4432, "epoch": 36} {"train_loss": -20.438541412353516, "global_step": 4433, "epoch": 36} {"train_loss": -20.200475692749023, "global_step": 4434, "epoch": 36} {"train_loss": -20.284526824951172, "global_step": 4435, "epoch": 36} {"train_loss": -20.5953426361084, "global_step": 4436, "epoch": 36} {"train_loss": -20.627614974975586, "global_step": 4437, "epoch": 36} {"train_loss": -20.321584701538086, "global_step": 4438, "epoch": 36} {"train_loss": -20.555395126342773, "global_step": 4439, "epoch": 36} {"train_loss": -20.462766647338867, "global_step": 4440, "epoch": 36} {"train_loss": -20.433425903320312, "global_step": 4441, "epoch": 36} {"train_loss": -20.376220703125, "global_step": 4442, "epoch": 36} {"train_loss": -20.25664710998535, "global_step": 4443, "epoch": 36} {"train_loss": -21.131240844726562, "global_step": 4444, "epoch": 36} {"train_loss": -20.413488388061523, "global_step": 4445, "epoch": 36} {"train_loss": -20.934410095214844, "global_step": 4446, "epoch": 36} {"train_loss": -20.955148696899414, "global_step": 4447, "epoch": 36} {"train_loss": -19.341474533081055, "global_step": 4448, "epoch": 36} {"train_loss": -20.64389419555664, "global_step": 4449, "epoch": 36} {"train_loss": -19.999319076538086, "global_step": 4450, "epoch": 36} {"train_loss": -20.309040069580078, "global_step": 4451, "epoch": 36} {"train_loss": -19.63945198059082, "global_step": 4452, "epoch": 36} {"train_loss": -20.168630599975586, "global_step": 4453, "epoch": 36} {"train_loss": -20.222061157226562, "global_step": 4454, "epoch": 36} {"train_loss": -20.328577041625977, "global_step": 4455, "epoch": 36} {"train_loss": -20.299867630004883, "global_step": 4456, "epoch": 36} {"train_loss": -20.414634704589844, "global_step": 4457, "epoch": 36} {"train_loss": -20.66473388671875, "global_step": 4458, "epoch": 36} {"train_loss": -20.16691017150879, "global_step": 4459, "epoch": 36} {"train_loss": -20.65279769897461, "global_step": 4460, "epoch": 36} {"train_loss": -19.67242431640625, "global_step": 4461, "epoch": 36} {"train_loss": -19.99430274963379, "global_step": 4462, "epoch": 36} {"train_loss": -20.75373649597168, "global_step": 4463, "epoch": 36} {"train_loss": -20.51715660095215, "global_step": 4464, "epoch": 36} {"train_loss": -20.409225463867188, "global_step": 4465, "epoch": 36} {"train_loss": -20.598901748657227, "global_step": 4466, "epoch": 36} {"train_loss": -20.442554473876953, "global_step": 4467, "epoch": 36} {"train_loss": -20.47592544555664, "global_step": 4468, "epoch": 36} {"train_loss": -20.990131378173828, "global_step": 4469, "epoch": 36} {"train_loss": -20.653179168701172, "global_step": 4470, "epoch": 36} {"train_loss": -20.123645782470703, "global_step": 4471, "epoch": 36} {"train_loss": -20.727495193481445, "global_step": 4472, "epoch": 36} {"train_loss": -20.61505126953125, "global_step": 4473, "epoch": 36} {"train_loss": -20.914440155029297, "global_step": 4474, "epoch": 36} {"train_loss": -20.73177146911621, "global_step": 4475, "epoch": 36} {"train_loss": -20.07974837437149, "global_step": 4476, "epoch": 36, "val_loss": 3325333.0} {"train_loss": -20.648874282836914, "global_step": 4477, "epoch": 37} {"train_loss": -20.148944854736328, "global_step": 4478, "epoch": 37} {"train_loss": -20.695241928100586, "global_step": 4479, "epoch": 37} {"train_loss": -21.139875411987305, "global_step": 4480, "epoch": 37} {"train_loss": -20.09798240661621, "global_step": 4481, "epoch": 37} {"train_loss": -20.306631088256836, "global_step": 4482, "epoch": 37} {"train_loss": -20.394737243652344, "global_step": 4483, "epoch": 37} {"train_loss": -20.341978073120117, "global_step": 4484, "epoch": 37} {"train_loss": -20.715539932250977, "global_step": 4485, "epoch": 37} {"train_loss": -20.062179565429688, "global_step": 4486, "epoch": 37} {"train_loss": -19.94817543029785, "global_step": 4487, "epoch": 37} {"train_loss": -20.205398559570312, "global_step": 4488, "epoch": 37} {"train_loss": -19.143356323242188, "global_step": 4489, "epoch": 37} {"train_loss": -19.455596923828125, "global_step": 4490, "epoch": 37} {"train_loss": -17.2968692779541, "global_step": 4491, "epoch": 37} {"train_loss": -20.250539779663086, "global_step": 4492, "epoch": 37} {"train_loss": -18.759977340698242, "global_step": 4493, "epoch": 37} {"train_loss": -19.503036499023438, "global_step": 4494, "epoch": 37} {"train_loss": -19.401351928710938, "global_step": 4495, "epoch": 37} {"train_loss": -20.449731826782227, "global_step": 4496, "epoch": 37} {"train_loss": -19.381805419921875, "global_step": 4497, "epoch": 37} {"train_loss": -19.096811294555664, "global_step": 4498, "epoch": 37} {"train_loss": -20.20172119140625, "global_step": 4499, "epoch": 37} {"train_loss": -19.719274520874023, "global_step": 4500, "epoch": 37} {"train_loss": -19.955202102661133, "global_step": 4501, "epoch": 37} {"train_loss": -19.819543838500977, "global_step": 4502, "epoch": 37} {"train_loss": -19.39055061340332, "global_step": 4503, "epoch": 37} {"train_loss": -19.386564254760742, "global_step": 4504, "epoch": 37} {"train_loss": -20.116580963134766, "global_step": 4505, "epoch": 37} {"train_loss": -20.08221435546875, "global_step": 4506, "epoch": 37} {"train_loss": -19.999263763427734, "global_step": 4507, "epoch": 37} {"train_loss": -19.7769775390625, "global_step": 4508, "epoch": 37} {"train_loss": -20.064695358276367, "global_step": 4509, "epoch": 37} {"train_loss": -20.355520248413086, "global_step": 4510, "epoch": 37} {"train_loss": -20.226139068603516, "global_step": 4511, "epoch": 37} {"train_loss": -20.289443969726562, "global_step": 4512, "epoch": 37} {"train_loss": -20.36464500427246, "global_step": 4513, "epoch": 37} {"train_loss": -20.12715721130371, "global_step": 4514, "epoch": 37} {"train_loss": -20.528785705566406, "global_step": 4515, "epoch": 37} {"train_loss": -19.846891403198242, "global_step": 4516, "epoch": 37} {"train_loss": -20.233320236206055, "global_step": 4517, "epoch": 37} {"train_loss": -20.634981155395508, "global_step": 4518, "epoch": 37} {"train_loss": -20.57695770263672, "global_step": 4519, "epoch": 37} {"train_loss": -21.071386337280273, "global_step": 4520, "epoch": 37} {"train_loss": -20.478750228881836, "global_step": 4521, "epoch": 37} {"train_loss": -20.69815444946289, "global_step": 4522, "epoch": 37} {"train_loss": -20.63978385925293, "global_step": 4523, "epoch": 37} {"train_loss": -20.46457862854004, "global_step": 4524, "epoch": 37} {"train_loss": -20.7523250579834, "global_step": 4525, "epoch": 37} {"train_loss": -20.067655563354492, "global_step": 4526, "epoch": 37} {"train_loss": -20.950733184814453, "global_step": 4527, "epoch": 37} {"train_loss": -21.250629425048828, "global_step": 4528, "epoch": 37} {"train_loss": -20.44400978088379, "global_step": 4529, "epoch": 37} {"train_loss": -21.11345863342285, "global_step": 4530, "epoch": 37} {"train_loss": -21.16761589050293, "global_step": 4531, "epoch": 37} {"train_loss": -20.32706069946289, "global_step": 4532, "epoch": 37} {"train_loss": -19.751100540161133, "global_step": 4533, "epoch": 37} {"train_loss": -18.037254333496094, "global_step": 4534, "epoch": 37} {"train_loss": -18.37287712097168, "global_step": 4535, "epoch": 37} {"train_loss": -20.016733169555664, "global_step": 4536, "epoch": 37} {"train_loss": -20.357913970947266, "global_step": 4537, "epoch": 37} {"train_loss": -20.31125259399414, "global_step": 4538, "epoch": 37} {"train_loss": -20.128463745117188, "global_step": 4539, "epoch": 37} {"train_loss": -19.8447208404541, "global_step": 4540, "epoch": 37} {"train_loss": -20.103925704956055, "global_step": 4541, "epoch": 37} {"train_loss": -19.945255279541016, "global_step": 4542, "epoch": 37} {"train_loss": -20.312530517578125, "global_step": 4543, "epoch": 37} {"train_loss": -20.09067153930664, "global_step": 4544, "epoch": 37} {"train_loss": -19.48195457458496, "global_step": 4545, "epoch": 37} {"train_loss": -19.35068702697754, "global_step": 4546, "epoch": 37} {"train_loss": -19.491539001464844, "global_step": 4547, "epoch": 37} {"train_loss": -19.117155075073242, "global_step": 4548, "epoch": 37} {"train_loss": -19.877445220947266, "global_step": 4549, "epoch": 37} {"train_loss": -19.429325103759766, "global_step": 4550, "epoch": 37} {"train_loss": -20.222084045410156, "global_step": 4551, "epoch": 37} {"train_loss": -19.515586853027344, "global_step": 4552, "epoch": 37} {"train_loss": -20.234975814819336, "global_step": 4553, "epoch": 37} {"train_loss": -19.55759620666504, "global_step": 4554, "epoch": 37} {"train_loss": -19.880741119384766, "global_step": 4555, "epoch": 37} {"train_loss": -20.127483367919922, "global_step": 4556, "epoch": 37} {"train_loss": -20.208541870117188, "global_step": 4557, "epoch": 37} {"train_loss": -19.920761108398438, "global_step": 4558, "epoch": 37} {"train_loss": -20.4593505859375, "global_step": 4559, "epoch": 37} {"train_loss": -20.459014892578125, "global_step": 4560, "epoch": 37} {"train_loss": -20.15791893005371, "global_step": 4561, "epoch": 37} {"train_loss": -20.531681060791016, "global_step": 4562, "epoch": 37} {"train_loss": -20.3162784576416, "global_step": 4563, "epoch": 37} {"train_loss": -20.54927635192871, "global_step": 4564, "epoch": 37} {"train_loss": -20.189271926879883, "global_step": 4565, "epoch": 37} {"train_loss": -20.901281356811523, "global_step": 4566, "epoch": 37} {"train_loss": -20.790241241455078, "global_step": 4567, "epoch": 37} {"train_loss": -20.65712547302246, "global_step": 4568, "epoch": 37} {"train_loss": -20.648679733276367, "global_step": 4569, "epoch": 37} {"train_loss": -20.821081161499023, "global_step": 4570, "epoch": 37} {"train_loss": -20.77546501159668, "global_step": 4571, "epoch": 37} {"train_loss": -20.407955169677734, "global_step": 4572, "epoch": 37} {"train_loss": -19.061365127563477, "global_step": 4573, "epoch": 37} {"train_loss": -19.146766662597656, "global_step": 4574, "epoch": 37} {"train_loss": -20.711606979370117, "global_step": 4575, "epoch": 37} {"train_loss": -20.046588897705078, "global_step": 4576, "epoch": 37} {"train_loss": -20.085037231445312, "global_step": 4577, "epoch": 37} {"train_loss": -20.019025802612305, "global_step": 4578, "epoch": 37} {"train_loss": -20.11762046813965, "global_step": 4579, "epoch": 37} {"train_loss": -19.92853546142578, "global_step": 4580, "epoch": 37} {"train_loss": -20.004262924194336, "global_step": 4581, "epoch": 37} {"train_loss": -19.67084312438965, "global_step": 4582, "epoch": 37} {"train_loss": -20.55916404724121, "global_step": 4583, "epoch": 37} {"train_loss": -20.535383224487305, "global_step": 4584, "epoch": 37} {"train_loss": -19.782167434692383, "global_step": 4585, "epoch": 37} {"train_loss": -20.6281681060791, "global_step": 4586, "epoch": 37} {"train_loss": -19.912826538085938, "global_step": 4587, "epoch": 37} {"train_loss": -20.301712036132812, "global_step": 4588, "epoch": 37} {"train_loss": -20.064577102661133, "global_step": 4589, "epoch": 37} {"train_loss": -20.514596939086914, "global_step": 4590, "epoch": 37} {"train_loss": -19.88835906982422, "global_step": 4591, "epoch": 37} {"train_loss": -20.164901733398438, "global_step": 4592, "epoch": 37} {"train_loss": -20.724624633789062, "global_step": 4593, "epoch": 37} {"train_loss": -19.393857955932617, "global_step": 4594, "epoch": 37} {"train_loss": -20.760793685913086, "global_step": 4595, "epoch": 37} {"train_loss": -19.70454216003418, "global_step": 4596, "epoch": 37} {"train_loss": -20.087568409186748, "global_step": 4597, "epoch": 37, "val_loss": 2524457.75} {"train_loss": -19.378097534179688, "global_step": 4598, "epoch": 38} {"train_loss": -20.2922420501709, "global_step": 4599, "epoch": 38} {"train_loss": -19.349124908447266, "global_step": 4600, "epoch": 38} {"train_loss": -19.74677085876465, "global_step": 4601, "epoch": 38} {"train_loss": -18.890012741088867, "global_step": 4602, "epoch": 38} {"train_loss": -20.375701904296875, "global_step": 4603, "epoch": 38} {"train_loss": -19.24195098876953, "global_step": 4604, "epoch": 38} {"train_loss": -19.945560455322266, "global_step": 4605, "epoch": 38} {"train_loss": -19.857303619384766, "global_step": 4606, "epoch": 38} {"train_loss": -19.982154846191406, "global_step": 4607, "epoch": 38} {"train_loss": -20.46797752380371, "global_step": 4608, "epoch": 38} {"train_loss": -20.103750228881836, "global_step": 4609, "epoch": 38} {"train_loss": -20.504995346069336, "global_step": 4610, "epoch": 38} {"train_loss": -20.541839599609375, "global_step": 4611, "epoch": 38} {"train_loss": -20.229074478149414, "global_step": 4612, "epoch": 38} {"train_loss": -20.693174362182617, "global_step": 4613, "epoch": 38} {"train_loss": -20.18214225769043, "global_step": 4614, "epoch": 38} {"train_loss": -20.330244064331055, "global_step": 4615, "epoch": 38} {"train_loss": -20.344663619995117, "global_step": 4616, "epoch": 38} {"train_loss": -20.720556259155273, "global_step": 4617, "epoch": 38} {"train_loss": -20.712980270385742, "global_step": 4618, "epoch": 38} {"train_loss": -20.675512313842773, "global_step": 4619, "epoch": 38} {"train_loss": -21.02501678466797, "global_step": 4620, "epoch": 38} {"train_loss": -21.17617416381836, "global_step": 4621, "epoch": 38} {"train_loss": -20.42414665222168, "global_step": 4622, "epoch": 38} {"train_loss": -19.332305908203125, "global_step": 4623, "epoch": 38} {"train_loss": -17.918188095092773, "global_step": 4624, "epoch": 38} {"train_loss": -15.638412475585938, "global_step": 4625, "epoch": 38} {"train_loss": -17.2049617767334, "global_step": 4626, "epoch": 38} {"train_loss": -14.165300369262695, "global_step": 4627, "epoch": 38} {"train_loss": -10.44982624053955, "global_step": 4628, "epoch": 38} {"train_loss": -16.795034408569336, "global_step": 4629, "epoch": 38} {"train_loss": -19.105009078979492, "global_step": 4630, "epoch": 38} {"train_loss": -16.138154983520508, "global_step": 4631, "epoch": 38} {"train_loss": -15.9884033203125, "global_step": 4632, "epoch": 38} {"train_loss": -18.79483413696289, "global_step": 4633, "epoch": 38} {"train_loss": -18.2951717376709, "global_step": 4634, "epoch": 38} {"train_loss": -19.348739624023438, "global_step": 4635, "epoch": 38} {"train_loss": -19.110393524169922, "global_step": 4636, "epoch": 38} {"train_loss": -18.825563430786133, "global_step": 4637, "epoch": 38} {"train_loss": -18.950170516967773, "global_step": 4638, "epoch": 38} {"train_loss": -18.04156494140625, "global_step": 4639, "epoch": 38} {"train_loss": -17.99067497253418, "global_step": 4640, "epoch": 38} {"train_loss": -17.75810432434082, "global_step": 4641, "epoch": 38} {"train_loss": -18.390827178955078, "global_step": 4642, "epoch": 38} {"train_loss": -18.06339454650879, "global_step": 4643, "epoch": 38} {"train_loss": -18.70747184753418, "global_step": 4644, "epoch": 38} {"train_loss": -18.18703269958496, "global_step": 4645, "epoch": 38} {"train_loss": -18.45491600036621, "global_step": 4646, "epoch": 38} {"train_loss": -17.955480575561523, "global_step": 4647, "epoch": 38} {"train_loss": -18.180227279663086, "global_step": 4648, "epoch": 38} {"train_loss": -18.788633346557617, "global_step": 4649, "epoch": 38} {"train_loss": -19.064802169799805, "global_step": 4650, "epoch": 38} {"train_loss": -18.78029441833496, "global_step": 4651, "epoch": 38} {"train_loss": -18.299476623535156, "global_step": 4652, "epoch": 38} {"train_loss": -18.44028663635254, "global_step": 4653, "epoch": 38} {"train_loss": -17.897390365600586, "global_step": 4654, "epoch": 38} {"train_loss": -18.32179069519043, "global_step": 4655, "epoch": 38} {"train_loss": -18.89473533630371, "global_step": 4656, "epoch": 38} {"train_loss": -18.583324432373047, "global_step": 4657, "epoch": 38} {"train_loss": -18.241004943847656, "global_step": 4658, "epoch": 38} {"train_loss": -18.482580184936523, "global_step": 4659, "epoch": 38} {"train_loss": -18.30341911315918, "global_step": 4660, "epoch": 38} {"train_loss": -18.565202713012695, "global_step": 4661, "epoch": 38} {"train_loss": -19.612165451049805, "global_step": 4662, "epoch": 38} {"train_loss": -19.72136116027832, "global_step": 4663, "epoch": 38} {"train_loss": -19.165239334106445, "global_step": 4664, "epoch": 38} {"train_loss": -19.10650062561035, "global_step": 4665, "epoch": 38} {"train_loss": -18.948511123657227, "global_step": 4666, "epoch": 38} {"train_loss": -19.01183319091797, "global_step": 4667, "epoch": 38} {"train_loss": -19.04047203063965, "global_step": 4668, "epoch": 38} {"train_loss": -19.256454467773438, "global_step": 4669, "epoch": 38} {"train_loss": -19.529804229736328, "global_step": 4670, "epoch": 38} {"train_loss": -19.286245346069336, "global_step": 4671, "epoch": 38} {"train_loss": -19.555463790893555, "global_step": 4672, "epoch": 38} {"train_loss": -19.084535598754883, "global_step": 4673, "epoch": 38} {"train_loss": -19.485794067382812, "global_step": 4674, "epoch": 38} {"train_loss": -19.330615997314453, "global_step": 4675, "epoch": 38} {"train_loss": -19.908660888671875, "global_step": 4676, "epoch": 38} {"train_loss": -19.436620712280273, "global_step": 4677, "epoch": 38} {"train_loss": -19.478384017944336, "global_step": 4678, "epoch": 38} {"train_loss": -19.62796401977539, "global_step": 4679, "epoch": 38} {"train_loss": -19.593687057495117, "global_step": 4680, "epoch": 38} {"train_loss": -19.581357955932617, "global_step": 4681, "epoch": 38} {"train_loss": -19.661434173583984, "global_step": 4682, "epoch": 38} {"train_loss": -20.03502082824707, "global_step": 4683, "epoch": 38} {"train_loss": -20.22686195373535, "global_step": 4684, "epoch": 38} {"train_loss": -20.12529754638672, "global_step": 4685, "epoch": 38} {"train_loss": -19.922714233398438, "global_step": 4686, "epoch": 38} {"train_loss": -19.71320152282715, "global_step": 4687, "epoch": 38} {"train_loss": -19.80757713317871, "global_step": 4688, "epoch": 38} {"train_loss": -19.29927635192871, "global_step": 4689, "epoch": 38} {"train_loss": -19.201223373413086, "global_step": 4690, "epoch": 38} {"train_loss": -20.157001495361328, "global_step": 4691, "epoch": 38} {"train_loss": -20.45265007019043, "global_step": 4692, "epoch": 38} {"train_loss": -20.009204864501953, "global_step": 4693, "epoch": 38} {"train_loss": -19.29395866394043, "global_step": 4694, "epoch": 38} {"train_loss": -19.682958602905273, "global_step": 4695, "epoch": 38} {"train_loss": -18.497434616088867, "global_step": 4696, "epoch": 38} {"train_loss": -18.6106014251709, "global_step": 4697, "epoch": 38} {"train_loss": -18.78557014465332, "global_step": 4698, "epoch": 38} {"train_loss": -19.730436325073242, "global_step": 4699, "epoch": 38} {"train_loss": -18.73406410217285, "global_step": 4700, "epoch": 38} {"train_loss": -19.961984634399414, "global_step": 4701, "epoch": 38} {"train_loss": -19.129369735717773, "global_step": 4702, "epoch": 38} {"train_loss": -18.93307876586914, "global_step": 4703, "epoch": 38} {"train_loss": -19.94452476501465, "global_step": 4704, "epoch": 38} {"train_loss": -19.212284088134766, "global_step": 4705, "epoch": 38} {"train_loss": -19.53473472595215, "global_step": 4706, "epoch": 38} {"train_loss": -19.454946517944336, "global_step": 4707, "epoch": 38} {"train_loss": -19.47115707397461, "global_step": 4708, "epoch": 38} {"train_loss": -20.018583297729492, "global_step": 4709, "epoch": 38} {"train_loss": -19.532201766967773, "global_step": 4710, "epoch": 38} {"train_loss": -19.837909698486328, "global_step": 4711, "epoch": 38} {"train_loss": -20.0515193939209, "global_step": 4712, "epoch": 38} {"train_loss": -20.199005126953125, "global_step": 4713, "epoch": 38} {"train_loss": -19.96767234802246, "global_step": 4714, "epoch": 38} {"train_loss": -19.575407028198242, "global_step": 4715, "epoch": 38} {"train_loss": -19.8945255279541, "global_step": 4716, "epoch": 38} {"train_loss": -20.03836441040039, "global_step": 4717, "epoch": 38} {"train_loss": -19.155825346954597, "global_step": 4718, "epoch": 38, "val_loss": 3453529.75} {"train_loss": -19.797462463378906, "global_step": 4719, "epoch": 39} {"train_loss": -20.243722915649414, "global_step": 4720, "epoch": 39} {"train_loss": -20.420806884765625, "global_step": 4721, "epoch": 39} {"train_loss": -20.373062133789062, "global_step": 4722, "epoch": 39} {"train_loss": -20.62228775024414, "global_step": 4723, "epoch": 39} {"train_loss": -20.271360397338867, "global_step": 4724, "epoch": 39} {"train_loss": -20.724721908569336, "global_step": 4725, "epoch": 39} {"train_loss": -20.777006149291992, "global_step": 4726, "epoch": 39} {"train_loss": -20.77811622619629, "global_step": 4727, "epoch": 39} {"train_loss": -20.632436752319336, "global_step": 4728, "epoch": 39} {"train_loss": -20.911447525024414, "global_step": 4729, "epoch": 39} {"train_loss": -21.45490074157715, "global_step": 4730, "epoch": 39} {"train_loss": -20.740550994873047, "global_step": 4731, "epoch": 39} {"train_loss": -20.76185417175293, "global_step": 4732, "epoch": 39} {"train_loss": -21.151065826416016, "global_step": 4733, "epoch": 39} {"train_loss": -21.29888153076172, "global_step": 4734, "epoch": 39} {"train_loss": -20.976430892944336, "global_step": 4735, "epoch": 39} {"train_loss": -21.157438278198242, "global_step": 4736, "epoch": 39} {"train_loss": -21.084016799926758, "global_step": 4737, "epoch": 39} {"train_loss": -21.50831413269043, "global_step": 4738, "epoch": 39} {"train_loss": -21.297470092773438, "global_step": 4739, "epoch": 39} {"train_loss": -21.661331176757812, "global_step": 4740, "epoch": 39} {"train_loss": -21.781042098999023, "global_step": 4741, "epoch": 39} {"train_loss": -20.9141845703125, "global_step": 4742, "epoch": 39} {"train_loss": -21.341629028320312, "global_step": 4743, "epoch": 39} {"train_loss": -21.191556930541992, "global_step": 4744, "epoch": 39} {"train_loss": -19.857501983642578, "global_step": 4745, "epoch": 39} {"train_loss": -17.367450714111328, "global_step": 4746, "epoch": 39} {"train_loss": -19.28196144104004, "global_step": 4747, "epoch": 39} {"train_loss": -21.26071548461914, "global_step": 4748, "epoch": 39} {"train_loss": -19.309696197509766, "global_step": 4749, "epoch": 39} {"train_loss": -19.98285484313965, "global_step": 4750, "epoch": 39} {"train_loss": -19.780181884765625, "global_step": 4751, "epoch": 39} {"train_loss": -20.89540672302246, "global_step": 4752, "epoch": 39} {"train_loss": -20.532217025756836, "global_step": 4753, "epoch": 39} {"train_loss": -20.871747970581055, "global_step": 4754, "epoch": 39} {"train_loss": -20.346139907836914, "global_step": 4755, "epoch": 39} {"train_loss": -20.25789451599121, "global_step": 4756, "epoch": 39} {"train_loss": -19.851579666137695, "global_step": 4757, "epoch": 39} {"train_loss": -20.04959487915039, "global_step": 4758, "epoch": 39} {"train_loss": -20.196765899658203, "global_step": 4759, "epoch": 39} {"train_loss": -20.055830001831055, "global_step": 4760, "epoch": 39} {"train_loss": -18.62253189086914, "global_step": 4761, "epoch": 39} {"train_loss": -19.839569091796875, "global_step": 4762, "epoch": 39} {"train_loss": -19.906232833862305, "global_step": 4763, "epoch": 39} {"train_loss": -19.70181655883789, "global_step": 4764, "epoch": 39} {"train_loss": -19.65751838684082, "global_step": 4765, "epoch": 39} {"train_loss": -20.658193588256836, "global_step": 4766, "epoch": 39} {"train_loss": -19.958843231201172, "global_step": 4767, "epoch": 39} {"train_loss": -19.71164321899414, "global_step": 4768, "epoch": 39} {"train_loss": -20.565975189208984, "global_step": 4769, "epoch": 39} {"train_loss": -20.276762008666992, "global_step": 4770, "epoch": 39} {"train_loss": -20.493066787719727, "global_step": 4771, "epoch": 39} {"train_loss": -19.977018356323242, "global_step": 4772, "epoch": 39} {"train_loss": -20.724262237548828, "global_step": 4773, "epoch": 39} {"train_loss": -20.449935913085938, "global_step": 4774, "epoch": 39} {"train_loss": -20.596715927124023, "global_step": 4775, "epoch": 39} {"train_loss": -20.855443954467773, "global_step": 4776, "epoch": 39} {"train_loss": -20.743757247924805, "global_step": 4777, "epoch": 39} {"train_loss": -20.68077278137207, "global_step": 4778, "epoch": 39} {"train_loss": -20.385732650756836, "global_step": 4779, "epoch": 39} {"train_loss": -20.706335067749023, "global_step": 4780, "epoch": 39} {"train_loss": -21.046262741088867, "global_step": 4781, "epoch": 39} {"train_loss": -20.277524948120117, "global_step": 4782, "epoch": 39} {"train_loss": -20.472558975219727, "global_step": 4783, "epoch": 39} {"train_loss": -20.884794235229492, "global_step": 4784, "epoch": 39} {"train_loss": -20.559717178344727, "global_step": 4785, "epoch": 39} {"train_loss": -21.144433975219727, "global_step": 4786, "epoch": 39} {"train_loss": -20.31390953063965, "global_step": 4787, "epoch": 39} {"train_loss": -20.86721420288086, "global_step": 4788, "epoch": 39} {"train_loss": -20.4397029876709, "global_step": 4789, "epoch": 39} {"train_loss": -20.827802658081055, "global_step": 4790, "epoch": 39} {"train_loss": -20.556137084960938, "global_step": 4791, "epoch": 39} {"train_loss": -21.12733268737793, "global_step": 4792, "epoch": 39} {"train_loss": -20.298486709594727, "global_step": 4793, "epoch": 39} {"train_loss": -20.986902236938477, "global_step": 4794, "epoch": 39} {"train_loss": -20.40736961364746, "global_step": 4795, "epoch": 39} {"train_loss": -20.90091323852539, "global_step": 4796, "epoch": 39} {"train_loss": -21.183347702026367, "global_step": 4797, "epoch": 39} {"train_loss": -20.704526901245117, "global_step": 4798, "epoch": 39} {"train_loss": -21.174070358276367, "global_step": 4799, "epoch": 39} {"train_loss": -20.68244743347168, "global_step": 4800, "epoch": 39} {"train_loss": -20.5567684173584, "global_step": 4801, "epoch": 39} {"train_loss": -19.906492233276367, "global_step": 4802, "epoch": 39} {"train_loss": -20.916271209716797, "global_step": 4803, "epoch": 39} {"train_loss": -20.88347816467285, "global_step": 4804, "epoch": 39} {"train_loss": -19.635589599609375, "global_step": 4805, "epoch": 39} {"train_loss": -20.94023895263672, "global_step": 4806, "epoch": 39} {"train_loss": -20.064729690551758, "global_step": 4807, "epoch": 39} {"train_loss": -20.46107292175293, "global_step": 4808, "epoch": 39} {"train_loss": -21.295795440673828, "global_step": 4809, "epoch": 39} {"train_loss": -20.761512756347656, "global_step": 4810, "epoch": 39} {"train_loss": -21.11647605895996, "global_step": 4811, "epoch": 39} {"train_loss": -20.985271453857422, "global_step": 4812, "epoch": 39} {"train_loss": -20.957874298095703, "global_step": 4813, "epoch": 39} {"train_loss": -21.127302169799805, "global_step": 4814, "epoch": 39} {"train_loss": -20.211257934570312, "global_step": 4815, "epoch": 39} {"train_loss": -20.735498428344727, "global_step": 4816, "epoch": 39} {"train_loss": -20.785812377929688, "global_step": 4817, "epoch": 39} {"train_loss": -20.324068069458008, "global_step": 4818, "epoch": 39} {"train_loss": -20.566925048828125, "global_step": 4819, "epoch": 39} {"train_loss": -20.790273666381836, "global_step": 4820, "epoch": 39} {"train_loss": -20.7978572845459, "global_step": 4821, "epoch": 39} {"train_loss": -20.69266700744629, "global_step": 4822, "epoch": 39} {"train_loss": -20.790306091308594, "global_step": 4823, "epoch": 39} {"train_loss": -20.695653915405273, "global_step": 4824, "epoch": 39} {"train_loss": -20.924720764160156, "global_step": 4825, "epoch": 39} {"train_loss": -20.809919357299805, "global_step": 4826, "epoch": 39} {"train_loss": -20.334386825561523, "global_step": 4827, "epoch": 39} {"train_loss": -21.382244110107422, "global_step": 4828, "epoch": 39} {"train_loss": -20.708873748779297, "global_step": 4829, "epoch": 39} {"train_loss": -20.48550033569336, "global_step": 4830, "epoch": 39} {"train_loss": -20.445608139038086, "global_step": 4831, "epoch": 39} {"train_loss": -21.240514755249023, "global_step": 4832, "epoch": 39} {"train_loss": -20.589040756225586, "global_step": 4833, "epoch": 39} {"train_loss": -20.401411056518555, "global_step": 4834, "epoch": 39} {"train_loss": -21.471561431884766, "global_step": 4835, "epoch": 39} {"train_loss": -20.636762619018555, "global_step": 4836, "epoch": 39} {"train_loss": -21.057483673095703, "global_step": 4837, "epoch": 39} {"train_loss": -20.786243438720703, "global_step": 4838, "epoch": 39} {"train_loss": -20.588015122847125, "global_step": 4839, "epoch": 39, "val_loss": 2914982.0} {"train_loss": -20.44105339050293, "global_step": 4840, "epoch": 40} {"train_loss": -21.043622970581055, "global_step": 4841, "epoch": 40} {"train_loss": -20.837697982788086, "global_step": 4842, "epoch": 40} {"train_loss": -21.202133178710938, "global_step": 4843, "epoch": 40} {"train_loss": -20.953622817993164, "global_step": 4844, "epoch": 40} {"train_loss": -21.16594123840332, "global_step": 4845, "epoch": 40} {"train_loss": -20.923917770385742, "global_step": 4846, "epoch": 40} {"train_loss": -20.518936157226562, "global_step": 4847, "epoch": 40} {"train_loss": -20.976896286010742, "global_step": 4848, "epoch": 40} {"train_loss": -20.336864471435547, "global_step": 4849, "epoch": 40} {"train_loss": -19.60011863708496, "global_step": 4850, "epoch": 40} {"train_loss": -20.22531509399414, "global_step": 4851, "epoch": 40} {"train_loss": -20.020709991455078, "global_step": 4852, "epoch": 40} {"train_loss": -20.700345993041992, "global_step": 4853, "epoch": 40} {"train_loss": -20.668676376342773, "global_step": 4854, "epoch": 40} {"train_loss": -20.728452682495117, "global_step": 4855, "epoch": 40} {"train_loss": -20.699392318725586, "global_step": 4856, "epoch": 40} {"train_loss": -20.317337036132812, "global_step": 4857, "epoch": 40} {"train_loss": -21.059106826782227, "global_step": 4858, "epoch": 40} {"train_loss": -20.612686157226562, "global_step": 4859, "epoch": 40} {"train_loss": -21.540372848510742, "global_step": 4860, "epoch": 40} {"train_loss": -20.95391273498535, "global_step": 4861, "epoch": 40} {"train_loss": -20.856191635131836, "global_step": 4862, "epoch": 40} {"train_loss": -20.99257469177246, "global_step": 4863, "epoch": 40} {"train_loss": -20.934070587158203, "global_step": 4864, "epoch": 40} {"train_loss": -20.81463050842285, "global_step": 4865, "epoch": 40} {"train_loss": -20.834287643432617, "global_step": 4866, "epoch": 40} {"train_loss": -20.97425651550293, "global_step": 4867, "epoch": 40} {"train_loss": -20.805057525634766, "global_step": 4868, "epoch": 40} {"train_loss": -20.749135971069336, "global_step": 4869, "epoch": 40} {"train_loss": -21.066129684448242, "global_step": 4870, "epoch": 40} {"train_loss": -21.05607032775879, "global_step": 4871, "epoch": 40} {"train_loss": -21.358922958374023, "global_step": 4872, "epoch": 40} {"train_loss": -20.580076217651367, "global_step": 4873, "epoch": 40} {"train_loss": -21.049951553344727, "global_step": 4874, "epoch": 40} {"train_loss": -20.984024047851562, "global_step": 4875, "epoch": 40} {"train_loss": -21.105300903320312, "global_step": 4876, "epoch": 40} {"train_loss": -20.981689453125, "global_step": 4877, "epoch": 40} {"train_loss": -21.12099266052246, "global_step": 4878, "epoch": 40} {"train_loss": -21.086950302124023, "global_step": 4879, "epoch": 40} {"train_loss": -21.079044342041016, "global_step": 4880, "epoch": 40} {"train_loss": -21.428808212280273, "global_step": 4881, "epoch": 40} {"train_loss": -20.993980407714844, "global_step": 4882, "epoch": 40} {"train_loss": -20.765544891357422, "global_step": 4883, "epoch": 40} {"train_loss": -20.919235229492188, "global_step": 4884, "epoch": 40} {"train_loss": -21.923187255859375, "global_step": 4885, "epoch": 40} {"train_loss": -21.02035903930664, "global_step": 4886, "epoch": 40} {"train_loss": -21.020679473876953, "global_step": 4887, "epoch": 40} {"train_loss": -20.430707931518555, "global_step": 4888, "epoch": 40} {"train_loss": -20.139850616455078, "global_step": 4889, "epoch": 40} {"train_loss": -19.1981143951416, "global_step": 4890, "epoch": 40} {"train_loss": -18.756322860717773, "global_step": 4891, "epoch": 40} {"train_loss": -20.254796981811523, "global_step": 4892, "epoch": 40} {"train_loss": -19.030973434448242, "global_step": 4893, "epoch": 40} {"train_loss": -19.275659561157227, "global_step": 4894, "epoch": 40} {"train_loss": -20.73107147216797, "global_step": 4895, "epoch": 40} {"train_loss": -20.859628677368164, "global_step": 4896, "epoch": 40} {"train_loss": -20.548969268798828, "global_step": 4897, "epoch": 40} {"train_loss": -20.57023048400879, "global_step": 4898, "epoch": 40} {"train_loss": -20.822790145874023, "global_step": 4899, "epoch": 40} {"train_loss": -20.551013946533203, "global_step": 4900, "epoch": 40} {"train_loss": -20.795927047729492, "global_step": 4901, "epoch": 40} {"train_loss": -20.646223068237305, "global_step": 4902, "epoch": 40} {"train_loss": -20.443281173706055, "global_step": 4903, "epoch": 40} {"train_loss": -20.922962188720703, "global_step": 4904, "epoch": 40} {"train_loss": -20.68060874938965, "global_step": 4905, "epoch": 40} {"train_loss": -20.53956413269043, "global_step": 4906, "epoch": 40} {"train_loss": -21.1470947265625, "global_step": 4907, "epoch": 40} {"train_loss": -20.681766510009766, "global_step": 4908, "epoch": 40} {"train_loss": -20.906742095947266, "global_step": 4909, "epoch": 40} {"train_loss": -21.449899673461914, "global_step": 4910, "epoch": 40} {"train_loss": -20.623010635375977, "global_step": 4911, "epoch": 40} {"train_loss": -20.70327377319336, "global_step": 4912, "epoch": 40} {"train_loss": -20.81789207458496, "global_step": 4913, "epoch": 40} {"train_loss": -20.892902374267578, "global_step": 4914, "epoch": 40} {"train_loss": -20.517221450805664, "global_step": 4915, "epoch": 40} {"train_loss": -21.233579635620117, "global_step": 4916, "epoch": 40} {"train_loss": -21.363304138183594, "global_step": 4917, "epoch": 40} {"train_loss": -20.879989624023438, "global_step": 4918, "epoch": 40} {"train_loss": -21.262744903564453, "global_step": 4919, "epoch": 40} {"train_loss": -20.644790649414062, "global_step": 4920, "epoch": 40} {"train_loss": -20.940107345581055, "global_step": 4921, "epoch": 40} {"train_loss": -21.56109046936035, "global_step": 4922, "epoch": 40} {"train_loss": -20.91258430480957, "global_step": 4923, "epoch": 40} {"train_loss": -20.91044807434082, "global_step": 4924, "epoch": 40} {"train_loss": -21.036672592163086, "global_step": 4925, "epoch": 40} {"train_loss": -21.345203399658203, "global_step": 4926, "epoch": 40} {"train_loss": -21.40888786315918, "global_step": 4927, "epoch": 40} {"train_loss": -21.175460815429688, "global_step": 4928, "epoch": 40} {"train_loss": -21.25339126586914, "global_step": 4929, "epoch": 40} {"train_loss": -21.635244369506836, "global_step": 4930, "epoch": 40} {"train_loss": -20.957494735717773, "global_step": 4931, "epoch": 40} {"train_loss": -20.924802780151367, "global_step": 4932, "epoch": 40} {"train_loss": -21.068004608154297, "global_step": 4933, "epoch": 40} {"train_loss": -20.768600463867188, "global_step": 4934, "epoch": 40} {"train_loss": -21.402273178100586, "global_step": 4935, "epoch": 40} {"train_loss": -20.62135124206543, "global_step": 4936, "epoch": 40} {"train_loss": -20.005613327026367, "global_step": 4937, "epoch": 40} {"train_loss": -20.881986618041992, "global_step": 4938, "epoch": 40} {"train_loss": -21.271453857421875, "global_step": 4939, "epoch": 40} {"train_loss": -20.37890625, "global_step": 4940, "epoch": 40} {"train_loss": -21.055007934570312, "global_step": 4941, "epoch": 40} {"train_loss": -21.157690048217773, "global_step": 4942, "epoch": 40} {"train_loss": -20.638364791870117, "global_step": 4943, "epoch": 40} {"train_loss": -21.12464141845703, "global_step": 4944, "epoch": 40} {"train_loss": -20.541074752807617, "global_step": 4945, "epoch": 40} {"train_loss": -20.485170364379883, "global_step": 4946, "epoch": 40} {"train_loss": -21.393686294555664, "global_step": 4947, "epoch": 40} {"train_loss": -20.89008140563965, "global_step": 4948, "epoch": 40} {"train_loss": -20.937305450439453, "global_step": 4949, "epoch": 40} {"train_loss": -20.311540603637695, "global_step": 4950, "epoch": 40} {"train_loss": -21.419713973999023, "global_step": 4951, "epoch": 40} {"train_loss": -20.799837112426758, "global_step": 4952, "epoch": 40} {"train_loss": -20.960647583007812, "global_step": 4953, "epoch": 40} {"train_loss": -20.915990829467773, "global_step": 4954, "epoch": 40} {"train_loss": -21.219324111938477, "global_step": 4955, "epoch": 40} {"train_loss": -21.172977447509766, "global_step": 4956, "epoch": 40} {"train_loss": -21.09444808959961, "global_step": 4957, "epoch": 40} {"train_loss": -20.636510848999023, "global_step": 4958, "epoch": 40} {"train_loss": -20.80415153503418, "global_step": 4959, "epoch": 40} {"train_loss": -20.819262764670633, "global_step": 4960, "epoch": 40, "val_loss": 3368211.25} {"train_loss": -20.553836822509766, "global_step": 4961, "epoch": 41} {"train_loss": -21.472003936767578, "global_step": 4962, "epoch": 41} {"train_loss": -21.25257682800293, "global_step": 4963, "epoch": 41} {"train_loss": -21.072139739990234, "global_step": 4964, "epoch": 41} {"train_loss": -20.951589584350586, "global_step": 4965, "epoch": 41} {"train_loss": -21.440353393554688, "global_step": 4966, "epoch": 41} {"train_loss": -20.897321701049805, "global_step": 4967, "epoch": 41} {"train_loss": -20.34569549560547, "global_step": 4968, "epoch": 41} {"train_loss": -20.836149215698242, "global_step": 4969, "epoch": 41} {"train_loss": -19.51453971862793, "global_step": 4970, "epoch": 41} {"train_loss": -20.994531631469727, "global_step": 4971, "epoch": 41} {"train_loss": -20.13172721862793, "global_step": 4972, "epoch": 41} {"train_loss": -20.859411239624023, "global_step": 4973, "epoch": 41} {"train_loss": -20.001493453979492, "global_step": 4974, "epoch": 41} {"train_loss": -21.620811462402344, "global_step": 4975, "epoch": 41} {"train_loss": -21.070510864257812, "global_step": 4976, "epoch": 41} {"train_loss": -21.277082443237305, "global_step": 4977, "epoch": 41} {"train_loss": -20.416948318481445, "global_step": 4978, "epoch": 41} {"train_loss": -21.5490779876709, "global_step": 4979, "epoch": 41} {"train_loss": -21.221668243408203, "global_step": 4980, "epoch": 41} {"train_loss": -20.83662986755371, "global_step": 4981, "epoch": 41} {"train_loss": -20.800901412963867, "global_step": 4982, "epoch": 41} {"train_loss": -19.8403377532959, "global_step": 4983, "epoch": 41} {"train_loss": -20.691425323486328, "global_step": 4984, "epoch": 41} {"train_loss": -20.86077117919922, "global_step": 4985, "epoch": 41} {"train_loss": -21.138158798217773, "global_step": 4986, "epoch": 41} {"train_loss": -20.25136375427246, "global_step": 4987, "epoch": 41} {"train_loss": -21.520750045776367, "global_step": 4988, "epoch": 41} {"train_loss": -19.8752384185791, "global_step": 4989, "epoch": 41} {"train_loss": -18.99445343017578, "global_step": 4990, "epoch": 41} {"train_loss": -17.609745025634766, "global_step": 4991, "epoch": 41} {"train_loss": -21.082077026367188, "global_step": 4992, "epoch": 41} {"train_loss": -18.488134384155273, "global_step": 4993, "epoch": 41} {"train_loss": -20.36614418029785, "global_step": 4994, "epoch": 41} {"train_loss": -20.660985946655273, "global_step": 4995, "epoch": 41} {"train_loss": -20.793994903564453, "global_step": 4996, "epoch": 41} {"train_loss": -20.938629150390625, "global_step": 4997, "epoch": 41} {"train_loss": -21.056177139282227, "global_step": 4998, "epoch": 41} {"train_loss": -20.997089385986328, "global_step": 4999, "epoch": 41} {"train_loss": -21.143817901611328, "global_step": 5000, "epoch": 41} {"train_loss": -20.35893440246582, "global_step": 5001, "epoch": 41} {"train_loss": -20.681249618530273, "global_step": 5002, "epoch": 41} {"train_loss": -20.635910034179688, "global_step": 5003, "epoch": 41} {"train_loss": -20.726112365722656, "global_step": 5004, "epoch": 41} {"train_loss": -21.13816261291504, "global_step": 5005, "epoch": 41} {"train_loss": -21.272008895874023, "global_step": 5006, "epoch": 41} {"train_loss": -20.8442325592041, "global_step": 5007, "epoch": 41} {"train_loss": -20.64512825012207, "global_step": 5008, "epoch": 41} {"train_loss": -20.786741256713867, "global_step": 5009, "epoch": 41} {"train_loss": -20.885711669921875, "global_step": 5010, "epoch": 41} {"train_loss": -20.585603713989258, "global_step": 5011, "epoch": 41} {"train_loss": -20.983352661132812, "global_step": 5012, "epoch": 41} {"train_loss": -21.116424560546875, "global_step": 5013, "epoch": 41} {"train_loss": -20.310131072998047, "global_step": 5014, "epoch": 41} {"train_loss": -20.98294448852539, "global_step": 5015, "epoch": 41} {"train_loss": -20.676000595092773, "global_step": 5016, "epoch": 41} {"train_loss": -20.797666549682617, "global_step": 5017, "epoch": 41} {"train_loss": -21.054054260253906, "global_step": 5018, "epoch": 41} {"train_loss": -20.835256576538086, "global_step": 5019, "epoch": 41} {"train_loss": -21.409526824951172, "global_step": 5020, "epoch": 41} {"train_loss": -20.737140655517578, "global_step": 5021, "epoch": 41} {"train_loss": -21.220991134643555, "global_step": 5022, "epoch": 41} {"train_loss": -21.320053100585938, "global_step": 5023, "epoch": 41} {"train_loss": -21.097793579101562, "global_step": 5024, "epoch": 41} {"train_loss": -21.45267105102539, "global_step": 5025, "epoch": 41} {"train_loss": -21.44814682006836, "global_step": 5026, "epoch": 41} {"train_loss": -21.446456909179688, "global_step": 5027, "epoch": 41} {"train_loss": -21.698808670043945, "global_step": 5028, "epoch": 41} {"train_loss": -21.88187026977539, "global_step": 5029, "epoch": 41} {"train_loss": -21.869247436523438, "global_step": 5030, "epoch": 41} {"train_loss": -21.897624969482422, "global_step": 5031, "epoch": 41} {"train_loss": -21.247528076171875, "global_step": 5032, "epoch": 41} {"train_loss": -21.873701095581055, "global_step": 5033, "epoch": 41} {"train_loss": -21.561660766601562, "global_step": 5034, "epoch": 41} {"train_loss": -21.895002365112305, "global_step": 5035, "epoch": 41} {"train_loss": -22.046354293823242, "global_step": 5036, "epoch": 41} {"train_loss": -21.375289916992188, "global_step": 5037, "epoch": 41} {"train_loss": -21.52669334411621, "global_step": 5038, "epoch": 41} {"train_loss": -21.144514083862305, "global_step": 5039, "epoch": 41} {"train_loss": -21.769424438476562, "global_step": 5040, "epoch": 41} {"train_loss": -21.48479461669922, "global_step": 5041, "epoch": 41} {"train_loss": -21.549360275268555, "global_step": 5042, "epoch": 41} {"train_loss": -19.975046157836914, "global_step": 5043, "epoch": 41} {"train_loss": -20.235197067260742, "global_step": 5044, "epoch": 41} {"train_loss": -19.972579956054688, "global_step": 5045, "epoch": 41} {"train_loss": -19.481332778930664, "global_step": 5046, "epoch": 41} {"train_loss": -21.40912437438965, "global_step": 5047, "epoch": 41} {"train_loss": -20.269346237182617, "global_step": 5048, "epoch": 41} {"train_loss": -18.071744918823242, "global_step": 5049, "epoch": 41} {"train_loss": -20.887022018432617, "global_step": 5050, "epoch": 41} {"train_loss": -19.44183921813965, "global_step": 5051, "epoch": 41} {"train_loss": -20.8287296295166, "global_step": 5052, "epoch": 41} {"train_loss": -19.56137466430664, "global_step": 5053, "epoch": 41} {"train_loss": -21.065807342529297, "global_step": 5054, "epoch": 41} {"train_loss": -20.844938278198242, "global_step": 5055, "epoch": 41} {"train_loss": -19.416608810424805, "global_step": 5056, "epoch": 41} {"train_loss": -20.47340202331543, "global_step": 5057, "epoch": 41} {"train_loss": -21.04707908630371, "global_step": 5058, "epoch": 41} {"train_loss": -20.63759422302246, "global_step": 5059, "epoch": 41} {"train_loss": -20.50580596923828, "global_step": 5060, "epoch": 41} {"train_loss": -20.537622451782227, "global_step": 5061, "epoch": 41} {"train_loss": -20.467729568481445, "global_step": 5062, "epoch": 41} {"train_loss": -20.63752555847168, "global_step": 5063, "epoch": 41} {"train_loss": -20.723438262939453, "global_step": 5064, "epoch": 41} {"train_loss": -20.594663619995117, "global_step": 5065, "epoch": 41} {"train_loss": -21.471454620361328, "global_step": 5066, "epoch": 41} {"train_loss": -20.718122482299805, "global_step": 5067, "epoch": 41} {"train_loss": -20.699918746948242, "global_step": 5068, "epoch": 41} {"train_loss": -20.580015182495117, "global_step": 5069, "epoch": 41} {"train_loss": -20.636716842651367, "global_step": 5070, "epoch": 41} {"train_loss": -21.0235595703125, "global_step": 5071, "epoch": 41} {"train_loss": -20.526296615600586, "global_step": 5072, "epoch": 41} {"train_loss": -20.986900329589844, "global_step": 5073, "epoch": 41} {"train_loss": -20.873315811157227, "global_step": 5074, "epoch": 41} {"train_loss": -20.98907470703125, "global_step": 5075, "epoch": 41} {"train_loss": -21.184955596923828, "global_step": 5076, "epoch": 41} {"train_loss": -20.765850067138672, "global_step": 5077, "epoch": 41} {"train_loss": -20.82137107849121, "global_step": 5078, "epoch": 41} {"train_loss": -20.83869743347168, "global_step": 5079, "epoch": 41} {"train_loss": -20.73615264892578, "global_step": 5080, "epoch": 41} {"train_loss": -20.799475614689598, "global_step": 5081, "epoch": 41, "val_loss": 2996169.75} {"train_loss": -20.994741439819336, "global_step": 5082, "epoch": 42} {"train_loss": -21.089330673217773, "global_step": 5083, "epoch": 42} {"train_loss": -21.150623321533203, "global_step": 5084, "epoch": 42} {"train_loss": -20.596616744995117, "global_step": 5085, "epoch": 42} {"train_loss": -21.053831100463867, "global_step": 5086, "epoch": 42} {"train_loss": -21.336252212524414, "global_step": 5087, "epoch": 42} {"train_loss": -20.92963981628418, "global_step": 5088, "epoch": 42} {"train_loss": -21.440271377563477, "global_step": 5089, "epoch": 42} {"train_loss": -21.28020477294922, "global_step": 5090, "epoch": 42} {"train_loss": -21.46279525756836, "global_step": 5091, "epoch": 42} {"train_loss": -21.422712326049805, "global_step": 5092, "epoch": 42} {"train_loss": -21.38276481628418, "global_step": 5093, "epoch": 42} {"train_loss": -20.953468322753906, "global_step": 5094, "epoch": 42} {"train_loss": -21.352819442749023, "global_step": 5095, "epoch": 42} {"train_loss": -20.911649703979492, "global_step": 5096, "epoch": 42} {"train_loss": -21.299631118774414, "global_step": 5097, "epoch": 42} {"train_loss": -21.03663444519043, "global_step": 5098, "epoch": 42} {"train_loss": -21.0297908782959, "global_step": 5099, "epoch": 42} {"train_loss": -21.284639358520508, "global_step": 5100, "epoch": 42} {"train_loss": -21.320735931396484, "global_step": 5101, "epoch": 42} {"train_loss": -21.375194549560547, "global_step": 5102, "epoch": 42} {"train_loss": -21.694721221923828, "global_step": 5103, "epoch": 42} {"train_loss": -21.999555587768555, "global_step": 5104, "epoch": 42} {"train_loss": -22.171796798706055, "global_step": 5105, "epoch": 42} {"train_loss": -21.715673446655273, "global_step": 5106, "epoch": 42} {"train_loss": -21.409982681274414, "global_step": 5107, "epoch": 42} {"train_loss": -22.038532257080078, "global_step": 5108, "epoch": 42} {"train_loss": -21.000946044921875, "global_step": 5109, "epoch": 42} {"train_loss": -19.316856384277344, "global_step": 5110, "epoch": 42} {"train_loss": -20.21199607849121, "global_step": 5111, "epoch": 42} {"train_loss": -20.567920684814453, "global_step": 5112, "epoch": 42} {"train_loss": -19.263296127319336, "global_step": 5113, "epoch": 42} {"train_loss": -19.041921615600586, "global_step": 5114, "epoch": 42} {"train_loss": -21.468955993652344, "global_step": 5115, "epoch": 42} {"train_loss": -18.968799591064453, "global_step": 5116, "epoch": 42} {"train_loss": -20.675046920776367, "global_step": 5117, "epoch": 42} {"train_loss": -19.58320426940918, "global_step": 5118, "epoch": 42} {"train_loss": -20.334318161010742, "global_step": 5119, "epoch": 42} {"train_loss": -18.990022659301758, "global_step": 5120, "epoch": 42} {"train_loss": -20.819015502929688, "global_step": 5121, "epoch": 42} {"train_loss": -19.677228927612305, "global_step": 5122, "epoch": 42} {"train_loss": -20.985511779785156, "global_step": 5123, "epoch": 42} {"train_loss": -20.633665084838867, "global_step": 5124, "epoch": 42} {"train_loss": -19.8870849609375, "global_step": 5125, "epoch": 42} {"train_loss": -20.539289474487305, "global_step": 5126, "epoch": 42} {"train_loss": -21.100605010986328, "global_step": 5127, "epoch": 42} {"train_loss": -20.643068313598633, "global_step": 5128, "epoch": 42} {"train_loss": -20.0766544342041, "global_step": 5129, "epoch": 42} {"train_loss": -20.6586856842041, "global_step": 5130, "epoch": 42} {"train_loss": -20.71454429626465, "global_step": 5131, "epoch": 42} {"train_loss": -20.052169799804688, "global_step": 5132, "epoch": 42} {"train_loss": -21.13678550720215, "global_step": 5133, "epoch": 42} {"train_loss": -21.176759719848633, "global_step": 5134, "epoch": 42} {"train_loss": -20.53390884399414, "global_step": 5135, "epoch": 42} {"train_loss": -21.09793472290039, "global_step": 5136, "epoch": 42} {"train_loss": -20.847726821899414, "global_step": 5137, "epoch": 42} {"train_loss": -21.084671020507812, "global_step": 5138, "epoch": 42} {"train_loss": -20.627851486206055, "global_step": 5139, "epoch": 42} {"train_loss": -21.0980167388916, "global_step": 5140, "epoch": 42} {"train_loss": -20.321754455566406, "global_step": 5141, "epoch": 42} {"train_loss": -21.179691314697266, "global_step": 5142, "epoch": 42} {"train_loss": -20.625396728515625, "global_step": 5143, "epoch": 42} {"train_loss": -21.2143611907959, "global_step": 5144, "epoch": 42} {"train_loss": -20.780576705932617, "global_step": 5145, "epoch": 42} {"train_loss": -20.472293853759766, "global_step": 5146, "epoch": 42} {"train_loss": -21.129047393798828, "global_step": 5147, "epoch": 42} {"train_loss": -21.2061767578125, "global_step": 5148, "epoch": 42} {"train_loss": -21.197147369384766, "global_step": 5149, "epoch": 42} {"train_loss": -21.098796844482422, "global_step": 5150, "epoch": 42} {"train_loss": -21.05952262878418, "global_step": 5151, "epoch": 42} {"train_loss": -21.339664459228516, "global_step": 5152, "epoch": 42} {"train_loss": -21.32477569580078, "global_step": 5153, "epoch": 42} {"train_loss": -21.35713005065918, "global_step": 5154, "epoch": 42} {"train_loss": -21.23200798034668, "global_step": 5155, "epoch": 42} {"train_loss": -21.451522827148438, "global_step": 5156, "epoch": 42} {"train_loss": -21.314207077026367, "global_step": 5157, "epoch": 42} {"train_loss": -21.234542846679688, "global_step": 5158, "epoch": 42} {"train_loss": -21.77163314819336, "global_step": 5159, "epoch": 42} {"train_loss": -21.7039852142334, "global_step": 5160, "epoch": 42} {"train_loss": -21.44842529296875, "global_step": 5161, "epoch": 42} {"train_loss": -21.48092269897461, "global_step": 5162, "epoch": 42} {"train_loss": -21.032638549804688, "global_step": 5163, "epoch": 42} {"train_loss": -21.458160400390625, "global_step": 5164, "epoch": 42} {"train_loss": -21.278745651245117, "global_step": 5165, "epoch": 42} {"train_loss": -21.268672943115234, "global_step": 5166, "epoch": 42} {"train_loss": -21.39882469177246, "global_step": 5167, "epoch": 42} {"train_loss": -19.928686141967773, "global_step": 5168, "epoch": 42} {"train_loss": -19.33347511291504, "global_step": 5169, "epoch": 42} {"train_loss": -22.075149536132812, "global_step": 5170, "epoch": 42} {"train_loss": -19.76322364807129, "global_step": 5171, "epoch": 42} {"train_loss": -19.953962326049805, "global_step": 5172, "epoch": 42} {"train_loss": -21.136899948120117, "global_step": 5173, "epoch": 42} {"train_loss": -20.467178344726562, "global_step": 5174, "epoch": 42} {"train_loss": -17.479978561401367, "global_step": 5175, "epoch": 42} {"train_loss": -21.448034286499023, "global_step": 5176, "epoch": 42} {"train_loss": -19.698516845703125, "global_step": 5177, "epoch": 42} {"train_loss": -20.42950439453125, "global_step": 5178, "epoch": 42} {"train_loss": -20.624494552612305, "global_step": 5179, "epoch": 42} {"train_loss": -20.70557975769043, "global_step": 5180, "epoch": 42} {"train_loss": -20.620681762695312, "global_step": 5181, "epoch": 42} {"train_loss": -20.8958740234375, "global_step": 5182, "epoch": 42} {"train_loss": -20.854703903198242, "global_step": 5183, "epoch": 42} {"train_loss": -20.824804306030273, "global_step": 5184, "epoch": 42} {"train_loss": -20.57744026184082, "global_step": 5185, "epoch": 42} {"train_loss": -20.93869400024414, "global_step": 5186, "epoch": 42} {"train_loss": -20.876401901245117, "global_step": 5187, "epoch": 42} {"train_loss": -20.910709381103516, "global_step": 5188, "epoch": 42} {"train_loss": -20.842294692993164, "global_step": 5189, "epoch": 42} {"train_loss": -20.580392837524414, "global_step": 5190, "epoch": 42} {"train_loss": -21.08831024169922, "global_step": 5191, "epoch": 42} {"train_loss": -20.69669532775879, "global_step": 5192, "epoch": 42} {"train_loss": -20.864479064941406, "global_step": 5193, "epoch": 42} {"train_loss": -19.864017486572266, "global_step": 5194, "epoch": 42} {"train_loss": -20.539169311523438, "global_step": 5195, "epoch": 42} {"train_loss": -20.749881744384766, "global_step": 5196, "epoch": 42} {"train_loss": -21.27561378479004, "global_step": 5197, "epoch": 42} {"train_loss": -20.713573455810547, "global_step": 5198, "epoch": 42} {"train_loss": -20.92078971862793, "global_step": 5199, "epoch": 42} {"train_loss": -20.690092086791992, "global_step": 5200, "epoch": 42} {"train_loss": -21.457996368408203, "global_step": 5201, "epoch": 42} {"train_loss": -20.84236518607652, "global_step": 5202, "epoch": 42, "val_loss": 2677564.5} {"train_loss": -21.255027770996094, "global_step": 5203, "epoch": 43} {"train_loss": -21.12656021118164, "global_step": 5204, "epoch": 43} {"train_loss": -21.161256790161133, "global_step": 5205, "epoch": 43} {"train_loss": -21.196073532104492, "global_step": 5206, "epoch": 43} {"train_loss": -20.837848663330078, "global_step": 5207, "epoch": 43} {"train_loss": -20.891324996948242, "global_step": 5208, "epoch": 43} {"train_loss": -19.377954483032227, "global_step": 5209, "epoch": 43} {"train_loss": -19.611658096313477, "global_step": 5210, "epoch": 43} {"train_loss": -21.0485782623291, "global_step": 5211, "epoch": 43} {"train_loss": -21.54745864868164, "global_step": 5212, "epoch": 43} {"train_loss": -20.36543083190918, "global_step": 5213, "epoch": 43} {"train_loss": -21.719511032104492, "global_step": 5214, "epoch": 43} {"train_loss": -21.052549362182617, "global_step": 5215, "epoch": 43} {"train_loss": -21.446516036987305, "global_step": 5216, "epoch": 43} {"train_loss": -21.45420265197754, "global_step": 5217, "epoch": 43} {"train_loss": -21.209823608398438, "global_step": 5218, "epoch": 43} {"train_loss": -21.088886260986328, "global_step": 5219, "epoch": 43} {"train_loss": -21.823448181152344, "global_step": 5220, "epoch": 43} {"train_loss": -21.23331642150879, "global_step": 5221, "epoch": 43} {"train_loss": -21.89199447631836, "global_step": 5222, "epoch": 43} {"train_loss": -21.6998348236084, "global_step": 5223, "epoch": 43} {"train_loss": -21.73651695251465, "global_step": 5224, "epoch": 43} {"train_loss": -21.942249298095703, "global_step": 5225, "epoch": 43} {"train_loss": -20.863983154296875, "global_step": 5226, "epoch": 43} {"train_loss": -20.535770416259766, "global_step": 5227, "epoch": 43} {"train_loss": -20.460739135742188, "global_step": 5228, "epoch": 43} {"train_loss": -21.362943649291992, "global_step": 5229, "epoch": 43} {"train_loss": -21.662614822387695, "global_step": 5230, "epoch": 43} {"train_loss": -21.105867385864258, "global_step": 5231, "epoch": 43} {"train_loss": -20.684919357299805, "global_step": 5232, "epoch": 43} {"train_loss": -21.988658905029297, "global_step": 5233, "epoch": 43} {"train_loss": -21.55055809020996, "global_step": 5234, "epoch": 43} {"train_loss": -21.825586318969727, "global_step": 5235, "epoch": 43} {"train_loss": -21.611520767211914, "global_step": 5236, "epoch": 43} {"train_loss": -21.8720760345459, "global_step": 5237, "epoch": 43} {"train_loss": -21.798580169677734, "global_step": 5238, "epoch": 43} {"train_loss": -20.974782943725586, "global_step": 5239, "epoch": 43} {"train_loss": -21.109983444213867, "global_step": 5240, "epoch": 43} {"train_loss": -21.775686264038086, "global_step": 5241, "epoch": 43} {"train_loss": -20.397891998291016, "global_step": 5242, "epoch": 43} {"train_loss": -20.015607833862305, "global_step": 5243, "epoch": 43} {"train_loss": -21.094785690307617, "global_step": 5244, "epoch": 43} {"train_loss": -20.712575912475586, "global_step": 5245, "epoch": 43} {"train_loss": -20.399755477905273, "global_step": 5246, "epoch": 43} {"train_loss": -21.111234664916992, "global_step": 5247, "epoch": 43} {"train_loss": -20.693078994750977, "global_step": 5248, "epoch": 43} {"train_loss": -21.290884017944336, "global_step": 5249, "epoch": 43} {"train_loss": -21.458200454711914, "global_step": 5250, "epoch": 43} {"train_loss": -21.218326568603516, "global_step": 5251, "epoch": 43} {"train_loss": -20.99525260925293, "global_step": 5252, "epoch": 43} {"train_loss": -20.724044799804688, "global_step": 5253, "epoch": 43} {"train_loss": -20.995906829833984, "global_step": 5254, "epoch": 43} {"train_loss": -20.291654586791992, "global_step": 5255, "epoch": 43} {"train_loss": -21.531835556030273, "global_step": 5256, "epoch": 43} {"train_loss": -20.926633834838867, "global_step": 5257, "epoch": 43} {"train_loss": -20.765958786010742, "global_step": 5258, "epoch": 43} {"train_loss": -21.30130958557129, "global_step": 5259, "epoch": 43} {"train_loss": -21.077207565307617, "global_step": 5260, "epoch": 43} {"train_loss": -21.274181365966797, "global_step": 5261, "epoch": 43} {"train_loss": -21.655410766601562, "global_step": 5262, "epoch": 43} {"train_loss": -21.241846084594727, "global_step": 5263, "epoch": 43} {"train_loss": -21.0234432220459, "global_step": 5264, "epoch": 43} {"train_loss": -20.66204833984375, "global_step": 5265, "epoch": 43} {"train_loss": -20.64659309387207, "global_step": 5266, "epoch": 43} {"train_loss": -21.046680450439453, "global_step": 5267, "epoch": 43} {"train_loss": -21.384021759033203, "global_step": 5268, "epoch": 43} {"train_loss": -21.38875389099121, "global_step": 5269, "epoch": 43} {"train_loss": -20.751249313354492, "global_step": 5270, "epoch": 43} {"train_loss": -21.37043571472168, "global_step": 5271, "epoch": 43} {"train_loss": -21.55122947692871, "global_step": 5272, "epoch": 43} {"train_loss": -21.727277755737305, "global_step": 5273, "epoch": 43} {"train_loss": -22.103118896484375, "global_step": 5274, "epoch": 43} {"train_loss": -21.40578269958496, "global_step": 5275, "epoch": 43} {"train_loss": -19.641633987426758, "global_step": 5276, "epoch": 43} {"train_loss": -16.526874542236328, "global_step": 5277, "epoch": 43} {"train_loss": -15.806675910949707, "global_step": 5278, "epoch": 43} {"train_loss": -19.810888290405273, "global_step": 5279, "epoch": 43} {"train_loss": -17.120346069335938, "global_step": 5280, "epoch": 43} {"train_loss": -19.537900924682617, "global_step": 5281, "epoch": 43} {"train_loss": -20.552824020385742, "global_step": 5282, "epoch": 43} {"train_loss": -18.437744140625, "global_step": 5283, "epoch": 43} {"train_loss": -20.133438110351562, "global_step": 5284, "epoch": 43} {"train_loss": -20.54547691345215, "global_step": 5285, "epoch": 43} {"train_loss": -20.90355682373047, "global_step": 5286, "epoch": 43} {"train_loss": -20.6444034576416, "global_step": 5287, "epoch": 43} {"train_loss": -20.462968826293945, "global_step": 5288, "epoch": 43} {"train_loss": -20.090959548950195, "global_step": 5289, "epoch": 43} {"train_loss": -20.594011306762695, "global_step": 5290, "epoch": 43} {"train_loss": -20.235843658447266, "global_step": 5291, "epoch": 43} {"train_loss": -20.296358108520508, "global_step": 5292, "epoch": 43} {"train_loss": -20.7310848236084, "global_step": 5293, "epoch": 43} {"train_loss": -20.449491500854492, "global_step": 5294, "epoch": 43} {"train_loss": -20.553455352783203, "global_step": 5295, "epoch": 43} {"train_loss": -20.267173767089844, "global_step": 5296, "epoch": 43} {"train_loss": -20.984745025634766, "global_step": 5297, "epoch": 43} {"train_loss": -20.248491287231445, "global_step": 5298, "epoch": 43} {"train_loss": -20.77784538269043, "global_step": 5299, "epoch": 43} {"train_loss": -19.823593139648438, "global_step": 5300, "epoch": 43} {"train_loss": -19.866554260253906, "global_step": 5301, "epoch": 43} {"train_loss": -20.90241050720215, "global_step": 5302, "epoch": 43} {"train_loss": -20.62865447998047, "global_step": 5303, "epoch": 43} {"train_loss": -20.346391677856445, "global_step": 5304, "epoch": 43} {"train_loss": -20.181570053100586, "global_step": 5305, "epoch": 43} {"train_loss": -19.609411239624023, "global_step": 5306, "epoch": 43} {"train_loss": -20.2377986907959, "global_step": 5307, "epoch": 43} {"train_loss": -19.898366928100586, "global_step": 5308, "epoch": 43} {"train_loss": -19.29798698425293, "global_step": 5309, "epoch": 43} {"train_loss": -20.063261032104492, "global_step": 5310, "epoch": 43} {"train_loss": -20.06096839904785, "global_step": 5311, "epoch": 43} {"train_loss": -20.386058807373047, "global_step": 5312, "epoch": 43} {"train_loss": -19.866392135620117, "global_step": 5313, "epoch": 43} {"train_loss": -20.62982749938965, "global_step": 5314, "epoch": 43} {"train_loss": -20.518583297729492, "global_step": 5315, "epoch": 43} {"train_loss": -20.261962890625, "global_step": 5316, "epoch": 43} {"train_loss": -20.387968063354492, "global_step": 5317, "epoch": 43} {"train_loss": -20.89466667175293, "global_step": 5318, "epoch": 43} {"train_loss": -20.335084915161133, "global_step": 5319, "epoch": 43} {"train_loss": -20.368486404418945, "global_step": 5320, "epoch": 43} {"train_loss": -20.39019012451172, "global_step": 5321, "epoch": 43} {"train_loss": -20.274734497070312, "global_step": 5322, "epoch": 43} {"train_loss": -20.7080839566948, "global_step": 5323, "epoch": 43, "val_loss": 3382110.0} {"train_loss": -20.261932373046875, "global_step": 5324, "epoch": 44} {"train_loss": -20.44649314880371, "global_step": 5325, "epoch": 44} {"train_loss": -21.379547119140625, "global_step": 5326, "epoch": 44} {"train_loss": -20.4344539642334, "global_step": 5327, "epoch": 44} {"train_loss": -20.38030242919922, "global_step": 5328, "epoch": 44} {"train_loss": -21.158933639526367, "global_step": 5329, "epoch": 44} {"train_loss": -20.8876953125, "global_step": 5330, "epoch": 44} {"train_loss": -21.04523277282715, "global_step": 5331, "epoch": 44} {"train_loss": -21.239171981811523, "global_step": 5332, "epoch": 44} {"train_loss": -21.27874755859375, "global_step": 5333, "epoch": 44} {"train_loss": -21.472061157226562, "global_step": 5334, "epoch": 44} {"train_loss": -20.532255172729492, "global_step": 5335, "epoch": 44} {"train_loss": -20.070096969604492, "global_step": 5336, "epoch": 44} {"train_loss": -21.040699005126953, "global_step": 5337, "epoch": 44} {"train_loss": -21.25372314453125, "global_step": 5338, "epoch": 44} {"train_loss": -19.08970069885254, "global_step": 5339, "epoch": 44} {"train_loss": -20.556550979614258, "global_step": 5340, "epoch": 44} {"train_loss": -20.91398048400879, "global_step": 5341, "epoch": 44} {"train_loss": -19.861967086791992, "global_step": 5342, "epoch": 44} {"train_loss": -21.193321228027344, "global_step": 5343, "epoch": 44} {"train_loss": -20.7584285736084, "global_step": 5344, "epoch": 44} {"train_loss": -21.22439956665039, "global_step": 5345, "epoch": 44} {"train_loss": -21.14454460144043, "global_step": 5346, "epoch": 44} {"train_loss": -21.018922805786133, "global_step": 5347, "epoch": 44} {"train_loss": -21.48223876953125, "global_step": 5348, "epoch": 44} {"train_loss": -21.50128173828125, "global_step": 5349, "epoch": 44} {"train_loss": -21.50091552734375, "global_step": 5350, "epoch": 44} {"train_loss": -20.888368606567383, "global_step": 5351, "epoch": 44} {"train_loss": -21.616424560546875, "global_step": 5352, "epoch": 44} {"train_loss": -21.584075927734375, "global_step": 5353, "epoch": 44} {"train_loss": -21.955007553100586, "global_step": 5354, "epoch": 44} {"train_loss": -21.42780113220215, "global_step": 5355, "epoch": 44} {"train_loss": -22.239120483398438, "global_step": 5356, "epoch": 44} {"train_loss": -21.0201473236084, "global_step": 5357, "epoch": 44} {"train_loss": -21.24241065979004, "global_step": 5358, "epoch": 44} {"train_loss": -21.223188400268555, "global_step": 5359, "epoch": 44} {"train_loss": -21.02094841003418, "global_step": 5360, "epoch": 44} {"train_loss": -21.860342025756836, "global_step": 5361, "epoch": 44} {"train_loss": -21.67873191833496, "global_step": 5362, "epoch": 44} {"train_loss": -21.45870590209961, "global_step": 5363, "epoch": 44} {"train_loss": -21.680944442749023, "global_step": 5364, "epoch": 44} {"train_loss": -21.72325325012207, "global_step": 5365, "epoch": 44} {"train_loss": -21.62517547607422, "global_step": 5366, "epoch": 44} {"train_loss": -21.971820831298828, "global_step": 5367, "epoch": 44} {"train_loss": -22.035436630249023, "global_step": 5368, "epoch": 44} {"train_loss": -22.102724075317383, "global_step": 5369, "epoch": 44} {"train_loss": -21.437759399414062, "global_step": 5370, "epoch": 44} {"train_loss": -20.565839767456055, "global_step": 5371, "epoch": 44} {"train_loss": -20.715513229370117, "global_step": 5372, "epoch": 44} {"train_loss": -21.760665893554688, "global_step": 5373, "epoch": 44} {"train_loss": -20.888242721557617, "global_step": 5374, "epoch": 44} {"train_loss": -20.31769371032715, "global_step": 5375, "epoch": 44} {"train_loss": -20.84347152709961, "global_step": 5376, "epoch": 44} {"train_loss": -18.674898147583008, "global_step": 5377, "epoch": 44} {"train_loss": -19.815488815307617, "global_step": 5378, "epoch": 44} {"train_loss": -20.985919952392578, "global_step": 5379, "epoch": 44} {"train_loss": -20.19336700439453, "global_step": 5380, "epoch": 44} {"train_loss": -21.089548110961914, "global_step": 5381, "epoch": 44} {"train_loss": -21.1417293548584, "global_step": 5382, "epoch": 44} {"train_loss": -20.340534210205078, "global_step": 5383, "epoch": 44} {"train_loss": -20.96663475036621, "global_step": 5384, "epoch": 44} {"train_loss": -21.08183479309082, "global_step": 5385, "epoch": 44} {"train_loss": -20.517915725708008, "global_step": 5386, "epoch": 44} {"train_loss": -21.25385856628418, "global_step": 5387, "epoch": 44} {"train_loss": -21.11460304260254, "global_step": 5388, "epoch": 44} {"train_loss": -20.469907760620117, "global_step": 5389, "epoch": 44} {"train_loss": -20.56398582458496, "global_step": 5390, "epoch": 44} {"train_loss": -21.064847946166992, "global_step": 5391, "epoch": 44} {"train_loss": -19.782732009887695, "global_step": 5392, "epoch": 44} {"train_loss": -20.627986907958984, "global_step": 5393, "epoch": 44} {"train_loss": -21.398649215698242, "global_step": 5394, "epoch": 44} {"train_loss": -20.376590728759766, "global_step": 5395, "epoch": 44} {"train_loss": -20.51554298400879, "global_step": 5396, "epoch": 44} {"train_loss": -20.893482208251953, "global_step": 5397, "epoch": 44} {"train_loss": -21.08734703063965, "global_step": 5398, "epoch": 44} {"train_loss": -21.665298461914062, "global_step": 5399, "epoch": 44} {"train_loss": -21.339406967163086, "global_step": 5400, "epoch": 44} {"train_loss": -21.688161849975586, "global_step": 5401, "epoch": 44} {"train_loss": -21.0277156829834, "global_step": 5402, "epoch": 44} {"train_loss": -21.597503662109375, "global_step": 5403, "epoch": 44} {"train_loss": -21.680496215820312, "global_step": 5404, "epoch": 44} {"train_loss": -21.441518783569336, "global_step": 5405, "epoch": 44} {"train_loss": -21.443645477294922, "global_step": 5406, "epoch": 44} {"train_loss": -21.751005172729492, "global_step": 5407, "epoch": 44} {"train_loss": -21.415653228759766, "global_step": 5408, "epoch": 44} {"train_loss": -21.928680419921875, "global_step": 5409, "epoch": 44} {"train_loss": -22.010498046875, "global_step": 5410, "epoch": 44} {"train_loss": -21.251758575439453, "global_step": 5411, "epoch": 44} {"train_loss": -21.639524459838867, "global_step": 5412, "epoch": 44} {"train_loss": -21.38458824157715, "global_step": 5413, "epoch": 44} {"train_loss": -22.309032440185547, "global_step": 5414, "epoch": 44} {"train_loss": -21.3789119720459, "global_step": 5415, "epoch": 44} {"train_loss": -22.295337677001953, "global_step": 5416, "epoch": 44} {"train_loss": -22.085432052612305, "global_step": 5417, "epoch": 44} {"train_loss": -21.2850399017334, "global_step": 5418, "epoch": 44} {"train_loss": -21.803924560546875, "global_step": 5419, "epoch": 44} {"train_loss": -21.779953002929688, "global_step": 5420, "epoch": 44} {"train_loss": -22.122615814208984, "global_step": 5421, "epoch": 44} {"train_loss": -21.914400100708008, "global_step": 5422, "epoch": 44} {"train_loss": -21.47738265991211, "global_step": 5423, "epoch": 44} {"train_loss": -21.10196304321289, "global_step": 5424, "epoch": 44} {"train_loss": -18.410608291625977, "global_step": 5425, "epoch": 44} {"train_loss": -11.988516807556152, "global_step": 5426, "epoch": 44} {"train_loss": -10.948774337768555, "global_step": 5427, "epoch": 44} {"train_loss": -7.587947845458984, "global_step": 5428, "epoch": 44} {"train_loss": -10.57028865814209, "global_step": 5429, "epoch": 44} {"train_loss": -12.423307418823242, "global_step": 5430, "epoch": 44} {"train_loss": -13.150097846984863, "global_step": 5431, "epoch": 44} {"train_loss": -14.801983833312988, "global_step": 5432, "epoch": 44} {"train_loss": -14.693359375, "global_step": 5433, "epoch": 44} {"train_loss": -15.2367582321167, "global_step": 5434, "epoch": 44} {"train_loss": -15.758641242980957, "global_step": 5435, "epoch": 44} {"train_loss": -15.358230590820312, "global_step": 5436, "epoch": 44} {"train_loss": -16.8720760345459, "global_step": 5437, "epoch": 44} {"train_loss": -17.3991756439209, "global_step": 5438, "epoch": 44} {"train_loss": -16.763004302978516, "global_step": 5439, "epoch": 44} {"train_loss": -17.568323135375977, "global_step": 5440, "epoch": 44} {"train_loss": -17.10519790649414, "global_step": 5441, "epoch": 44} {"train_loss": -17.101430892944336, "global_step": 5442, "epoch": 44} {"train_loss": -17.82023811340332, "global_step": 5443, "epoch": 44} {"train_loss": -20.13453062703787, "global_step": 5444, "epoch": 44, "val_loss": 2976332.0} {"train_loss": -17.999948501586914, "global_step": 5445, "epoch": 45} {"train_loss": -18.37553596496582, "global_step": 5446, "epoch": 45} {"train_loss": -18.928091049194336, "global_step": 5447, "epoch": 45} {"train_loss": -19.0624942779541, "global_step": 5448, "epoch": 45} {"train_loss": -19.534568786621094, "global_step": 5449, "epoch": 45} {"train_loss": -19.340993881225586, "global_step": 5450, "epoch": 45} {"train_loss": -19.55851173400879, "global_step": 5451, "epoch": 45} {"train_loss": -19.870346069335938, "global_step": 5452, "epoch": 45} {"train_loss": -19.842130661010742, "global_step": 5453, "epoch": 45} {"train_loss": -20.311471939086914, "global_step": 5454, "epoch": 45} {"train_loss": -20.000629425048828, "global_step": 5455, "epoch": 45} {"train_loss": -20.293804168701172, "global_step": 5456, "epoch": 45} {"train_loss": -20.36180877685547, "global_step": 5457, "epoch": 45} {"train_loss": -19.737808227539062, "global_step": 5458, "epoch": 45} {"train_loss": -20.215042114257812, "global_step": 5459, "epoch": 45} {"train_loss": -20.790515899658203, "global_step": 5460, "epoch": 45} {"train_loss": -20.66389274597168, "global_step": 5461, "epoch": 45} {"train_loss": -20.430692672729492, "global_step": 5462, "epoch": 45} {"train_loss": -20.62156105041504, "global_step": 5463, "epoch": 45} {"train_loss": -20.959211349487305, "global_step": 5464, "epoch": 45} {"train_loss": -20.42902946472168, "global_step": 5465, "epoch": 45} {"train_loss": -21.08982276916504, "global_step": 5466, "epoch": 45} {"train_loss": -20.604721069335938, "global_step": 5467, "epoch": 45} {"train_loss": -20.577356338500977, "global_step": 5468, "epoch": 45} {"train_loss": -20.15115737915039, "global_step": 5469, "epoch": 45} {"train_loss": -20.365211486816406, "global_step": 5470, "epoch": 45} {"train_loss": -20.54098129272461, "global_step": 5471, "epoch": 45} {"train_loss": -20.596824645996094, "global_step": 5472, "epoch": 45} {"train_loss": -21.153600692749023, "global_step": 5473, "epoch": 45} {"train_loss": -20.310081481933594, "global_step": 5474, "epoch": 45} {"train_loss": -20.752639770507812, "global_step": 5475, "epoch": 45} {"train_loss": -20.85765838623047, "global_step": 5476, "epoch": 45} {"train_loss": -20.47043228149414, "global_step": 5477, "epoch": 45} {"train_loss": -20.055204391479492, "global_step": 5478, "epoch": 45} {"train_loss": -20.659652709960938, "global_step": 5479, "epoch": 45} {"train_loss": -20.921951293945312, "global_step": 5480, "epoch": 45} {"train_loss": -20.212202072143555, "global_step": 5481, "epoch": 45} {"train_loss": -21.2033748626709, "global_step": 5482, "epoch": 45} {"train_loss": -19.618356704711914, "global_step": 5483, "epoch": 45} {"train_loss": -20.790874481201172, "global_step": 5484, "epoch": 45} {"train_loss": -20.538619995117188, "global_step": 5485, "epoch": 45} {"train_loss": -20.074472427368164, "global_step": 5486, "epoch": 45} {"train_loss": -20.19529914855957, "global_step": 5487, "epoch": 45} {"train_loss": -18.9028263092041, "global_step": 5488, "epoch": 45} {"train_loss": -19.32765769958496, "global_step": 5489, "epoch": 45} {"train_loss": -20.64674949645996, "global_step": 5490, "epoch": 45} {"train_loss": -18.15155601501465, "global_step": 5491, "epoch": 45} {"train_loss": -20.077184677124023, "global_step": 5492, "epoch": 45} {"train_loss": -18.990318298339844, "global_step": 5493, "epoch": 45} {"train_loss": -20.94732093811035, "global_step": 5494, "epoch": 45} {"train_loss": -19.748577117919922, "global_step": 5495, "epoch": 45} {"train_loss": -20.68120765686035, "global_step": 5496, "epoch": 45} {"train_loss": -20.25189781188965, "global_step": 5497, "epoch": 45} {"train_loss": -19.570632934570312, "global_step": 5498, "epoch": 45} {"train_loss": -20.533239364624023, "global_step": 5499, "epoch": 45} {"train_loss": -21.03004264831543, "global_step": 5500, "epoch": 45} {"train_loss": -19.98993492126465, "global_step": 5501, "epoch": 45} {"train_loss": -20.415836334228516, "global_step": 5502, "epoch": 45} {"train_loss": -21.299468994140625, "global_step": 5503, "epoch": 45} {"train_loss": -20.45648765563965, "global_step": 5504, "epoch": 45} {"train_loss": -20.864526748657227, "global_step": 5505, "epoch": 45} {"train_loss": -20.920692443847656, "global_step": 5506, "epoch": 45} {"train_loss": -21.029727935791016, "global_step": 5507, "epoch": 45} {"train_loss": -20.69890594482422, "global_step": 5508, "epoch": 45} {"train_loss": -21.00362777709961, "global_step": 5509, "epoch": 45} {"train_loss": -21.02796173095703, "global_step": 5510, "epoch": 45} {"train_loss": -21.09089469909668, "global_step": 5511, "epoch": 45} {"train_loss": -21.351552963256836, "global_step": 5512, "epoch": 45} {"train_loss": -21.232515335083008, "global_step": 5513, "epoch": 45} {"train_loss": -21.11325454711914, "global_step": 5514, "epoch": 45} {"train_loss": -21.173398971557617, "global_step": 5515, "epoch": 45} {"train_loss": -21.502683639526367, "global_step": 5516, "epoch": 45} {"train_loss": -21.551246643066406, "global_step": 5517, "epoch": 45} {"train_loss": -22.08435821533203, "global_step": 5518, "epoch": 45} {"train_loss": -20.949317932128906, "global_step": 5519, "epoch": 45} {"train_loss": -21.606069564819336, "global_step": 5520, "epoch": 45} {"train_loss": -21.457792282104492, "global_step": 5521, "epoch": 45} {"train_loss": -21.997150421142578, "global_step": 5522, "epoch": 45} {"train_loss": -21.985279083251953, "global_step": 5523, "epoch": 45} {"train_loss": -21.741886138916016, "global_step": 5524, "epoch": 45} {"train_loss": -22.09366798400879, "global_step": 5525, "epoch": 45} {"train_loss": -22.187376022338867, "global_step": 5526, "epoch": 45} {"train_loss": -22.062633514404297, "global_step": 5527, "epoch": 45} {"train_loss": -22.186647415161133, "global_step": 5528, "epoch": 45} {"train_loss": -22.256641387939453, "global_step": 5529, "epoch": 45} {"train_loss": -21.594772338867188, "global_step": 5530, "epoch": 45} {"train_loss": -22.2847900390625, "global_step": 5531, "epoch": 45} {"train_loss": -22.137447357177734, "global_step": 5532, "epoch": 45} {"train_loss": -22.088985443115234, "global_step": 5533, "epoch": 45} {"train_loss": -20.781583786010742, "global_step": 5534, "epoch": 45} {"train_loss": -21.317935943603516, "global_step": 5535, "epoch": 45} {"train_loss": -21.980545043945312, "global_step": 5536, "epoch": 45} {"train_loss": -21.69679832458496, "global_step": 5537, "epoch": 45} {"train_loss": -22.139995574951172, "global_step": 5538, "epoch": 45} {"train_loss": -22.02865982055664, "global_step": 5539, "epoch": 45} {"train_loss": -21.912809371948242, "global_step": 5540, "epoch": 45} {"train_loss": -22.3106632232666, "global_step": 5541, "epoch": 45} {"train_loss": -22.411291122436523, "global_step": 5542, "epoch": 45} {"train_loss": -22.40032386779785, "global_step": 5543, "epoch": 45} {"train_loss": -21.3936824798584, "global_step": 5544, "epoch": 45} {"train_loss": -21.610139846801758, "global_step": 5545, "epoch": 45} {"train_loss": -22.397418975830078, "global_step": 5546, "epoch": 45} {"train_loss": -20.669057846069336, "global_step": 5547, "epoch": 45} {"train_loss": -18.426374435424805, "global_step": 5548, "epoch": 45} {"train_loss": -16.358905792236328, "global_step": 5549, "epoch": 45} {"train_loss": -18.355911254882812, "global_step": 5550, "epoch": 45} {"train_loss": -21.368406295776367, "global_step": 5551, "epoch": 45} {"train_loss": -19.40201759338379, "global_step": 5552, "epoch": 45} {"train_loss": -21.047931671142578, "global_step": 5553, "epoch": 45} {"train_loss": -19.649742126464844, "global_step": 5554, "epoch": 45} {"train_loss": -21.02556800842285, "global_step": 5555, "epoch": 45} {"train_loss": -20.895326614379883, "global_step": 5556, "epoch": 45} {"train_loss": -21.14851188659668, "global_step": 5557, "epoch": 45} {"train_loss": -20.617097854614258, "global_step": 5558, "epoch": 45} {"train_loss": -21.31751251220703, "global_step": 5559, "epoch": 45} {"train_loss": -21.136009216308594, "global_step": 5560, "epoch": 45} {"train_loss": -20.598220825195312, "global_step": 5561, "epoch": 45} {"train_loss": -20.912324905395508, "global_step": 5562, "epoch": 45} {"train_loss": -21.337875366210938, "global_step": 5563, "epoch": 45} {"train_loss": -21.052000045776367, "global_step": 5564, "epoch": 45} {"train_loss": -20.71058290654963, "global_step": 5565, "epoch": 45, "val_loss": 3561096.0} {"train_loss": -21.194501876831055, "global_step": 5566, "epoch": 46} {"train_loss": -21.64491081237793, "global_step": 5567, "epoch": 46} {"train_loss": -21.563262939453125, "global_step": 5568, "epoch": 46} {"train_loss": -21.587461471557617, "global_step": 5569, "epoch": 46} {"train_loss": -21.2680606842041, "global_step": 5570, "epoch": 46} {"train_loss": -21.51601219177246, "global_step": 5571, "epoch": 46} {"train_loss": -21.312049865722656, "global_step": 5572, "epoch": 46} {"train_loss": -21.627567291259766, "global_step": 5573, "epoch": 46} {"train_loss": -21.847074508666992, "global_step": 5574, "epoch": 46} {"train_loss": -21.66252326965332, "global_step": 5575, "epoch": 46} {"train_loss": -21.90550422668457, "global_step": 5576, "epoch": 46} {"train_loss": -22.068891525268555, "global_step": 5577, "epoch": 46} {"train_loss": -21.75452995300293, "global_step": 5578, "epoch": 46} {"train_loss": -21.670806884765625, "global_step": 5579, "epoch": 46} {"train_loss": -22.103885650634766, "global_step": 5580, "epoch": 46} {"train_loss": -21.50659942626953, "global_step": 5581, "epoch": 46} {"train_loss": -22.31081199645996, "global_step": 5582, "epoch": 46} {"train_loss": -20.544525146484375, "global_step": 5583, "epoch": 46} {"train_loss": -19.642972946166992, "global_step": 5584, "epoch": 46} {"train_loss": -17.865861892700195, "global_step": 5585, "epoch": 46} {"train_loss": -21.109764099121094, "global_step": 5586, "epoch": 46} {"train_loss": -19.652677536010742, "global_step": 5587, "epoch": 46} {"train_loss": -19.2214412689209, "global_step": 5588, "epoch": 46} {"train_loss": -20.157041549682617, "global_step": 5589, "epoch": 46} {"train_loss": -20.632160186767578, "global_step": 5590, "epoch": 46} {"train_loss": -20.3488826751709, "global_step": 5591, "epoch": 46} {"train_loss": -21.684181213378906, "global_step": 5592, "epoch": 46} {"train_loss": -21.176727294921875, "global_step": 5593, "epoch": 46} {"train_loss": -21.229516983032227, "global_step": 5594, "epoch": 46} {"train_loss": -20.99065589904785, "global_step": 5595, "epoch": 46} {"train_loss": -21.263259887695312, "global_step": 5596, "epoch": 46} {"train_loss": -21.317758560180664, "global_step": 5597, "epoch": 46} {"train_loss": -21.44366455078125, "global_step": 5598, "epoch": 46} {"train_loss": -21.14655876159668, "global_step": 5599, "epoch": 46} {"train_loss": -21.713224411010742, "global_step": 5600, "epoch": 46} {"train_loss": -21.53185272216797, "global_step": 5601, "epoch": 46} {"train_loss": -21.051227569580078, "global_step": 5602, "epoch": 46} {"train_loss": -21.19536781311035, "global_step": 5603, "epoch": 46} {"train_loss": -21.337221145629883, "global_step": 5604, "epoch": 46} {"train_loss": -20.96285057067871, "global_step": 5605, "epoch": 46} {"train_loss": -20.520620346069336, "global_step": 5606, "epoch": 46} {"train_loss": -19.909814834594727, "global_step": 5607, "epoch": 46} {"train_loss": -21.174551010131836, "global_step": 5608, "epoch": 46} {"train_loss": -21.090534210205078, "global_step": 5609, "epoch": 46} {"train_loss": -20.179189682006836, "global_step": 5610, "epoch": 46} {"train_loss": -19.356958389282227, "global_step": 5611, "epoch": 46} {"train_loss": -21.289670944213867, "global_step": 5612, "epoch": 46} {"train_loss": -19.960636138916016, "global_step": 5613, "epoch": 46} {"train_loss": -21.71428871154785, "global_step": 5614, "epoch": 46} {"train_loss": -21.24078941345215, "global_step": 5615, "epoch": 46} {"train_loss": -21.19491958618164, "global_step": 5616, "epoch": 46} {"train_loss": -21.445287704467773, "global_step": 5617, "epoch": 46} {"train_loss": -20.63824462890625, "global_step": 5618, "epoch": 46} {"train_loss": -21.06251335144043, "global_step": 5619, "epoch": 46} {"train_loss": -21.330808639526367, "global_step": 5620, "epoch": 46} {"train_loss": -21.434213638305664, "global_step": 5621, "epoch": 46} {"train_loss": -21.49629020690918, "global_step": 5622, "epoch": 46} {"train_loss": -21.349897384643555, "global_step": 5623, "epoch": 46} {"train_loss": -21.670001983642578, "global_step": 5624, "epoch": 46} {"train_loss": -21.407230377197266, "global_step": 5625, "epoch": 46} {"train_loss": -21.08391761779785, "global_step": 5626, "epoch": 46} {"train_loss": -21.501726150512695, "global_step": 5627, "epoch": 46} {"train_loss": -21.42926025390625, "global_step": 5628, "epoch": 46} {"train_loss": -21.83860206604004, "global_step": 5629, "epoch": 46} {"train_loss": -20.958932876586914, "global_step": 5630, "epoch": 46} {"train_loss": -22.115314483642578, "global_step": 5631, "epoch": 46} {"train_loss": -21.5721378326416, "global_step": 5632, "epoch": 46} {"train_loss": -21.548368453979492, "global_step": 5633, "epoch": 46} {"train_loss": -21.460073471069336, "global_step": 5634, "epoch": 46} {"train_loss": -21.938901901245117, "global_step": 5635, "epoch": 46} {"train_loss": -21.969329833984375, "global_step": 5636, "epoch": 46} {"train_loss": -21.64034652709961, "global_step": 5637, "epoch": 46} {"train_loss": -22.01282501220703, "global_step": 5638, "epoch": 46} {"train_loss": -21.706424713134766, "global_step": 5639, "epoch": 46} {"train_loss": -21.967321395874023, "global_step": 5640, "epoch": 46} {"train_loss": -21.71245002746582, "global_step": 5641, "epoch": 46} {"train_loss": -22.038331985473633, "global_step": 5642, "epoch": 46} {"train_loss": -22.328229904174805, "global_step": 5643, "epoch": 46} {"train_loss": -21.37795066833496, "global_step": 5644, "epoch": 46} {"train_loss": -21.16214370727539, "global_step": 5645, "epoch": 46} {"train_loss": -22.360197067260742, "global_step": 5646, "epoch": 46} {"train_loss": -21.814739227294922, "global_step": 5647, "epoch": 46} {"train_loss": -21.718549728393555, "global_step": 5648, "epoch": 46} {"train_loss": -22.268388748168945, "global_step": 5649, "epoch": 46} {"train_loss": -21.92222023010254, "global_step": 5650, "epoch": 46} {"train_loss": -22.311307907104492, "global_step": 5651, "epoch": 46} {"train_loss": -21.46148109436035, "global_step": 5652, "epoch": 46} {"train_loss": -20.09209632873535, "global_step": 5653, "epoch": 46} {"train_loss": -19.516767501831055, "global_step": 5654, "epoch": 46} {"train_loss": -19.978710174560547, "global_step": 5655, "epoch": 46} {"train_loss": -22.19191551208496, "global_step": 5656, "epoch": 46} {"train_loss": -20.122997283935547, "global_step": 5657, "epoch": 46} {"train_loss": -21.77271270751953, "global_step": 5658, "epoch": 46} {"train_loss": -20.883283615112305, "global_step": 5659, "epoch": 46} {"train_loss": -21.584867477416992, "global_step": 5660, "epoch": 46} {"train_loss": -20.695600509643555, "global_step": 5661, "epoch": 46} {"train_loss": -20.039960861206055, "global_step": 5662, "epoch": 46} {"train_loss": -20.113555908203125, "global_step": 5663, "epoch": 46} {"train_loss": -20.9397029876709, "global_step": 5664, "epoch": 46} {"train_loss": -21.769607543945312, "global_step": 5665, "epoch": 46} {"train_loss": -21.251272201538086, "global_step": 5666, "epoch": 46} {"train_loss": -20.69962501525879, "global_step": 5667, "epoch": 46} {"train_loss": -21.23707389831543, "global_step": 5668, "epoch": 46} {"train_loss": -21.41314125061035, "global_step": 5669, "epoch": 46} {"train_loss": -21.821184158325195, "global_step": 5670, "epoch": 46} {"train_loss": -21.240280151367188, "global_step": 5671, "epoch": 46} {"train_loss": -21.522563934326172, "global_step": 5672, "epoch": 46} {"train_loss": -21.179645538330078, "global_step": 5673, "epoch": 46} {"train_loss": -21.677223205566406, "global_step": 5674, "epoch": 46} {"train_loss": -21.30438995361328, "global_step": 5675, "epoch": 46} {"train_loss": -21.473806381225586, "global_step": 5676, "epoch": 46} {"train_loss": -21.403085708618164, "global_step": 5677, "epoch": 46} {"train_loss": -21.464136123657227, "global_step": 5678, "epoch": 46} {"train_loss": -21.674535751342773, "global_step": 5679, "epoch": 46} {"train_loss": -21.509809494018555, "global_step": 5680, "epoch": 46} {"train_loss": -21.528257369995117, "global_step": 5681, "epoch": 46} {"train_loss": -21.055938720703125, "global_step": 5682, "epoch": 46} {"train_loss": -21.478506088256836, "global_step": 5683, "epoch": 46} {"train_loss": -21.95110511779785, "global_step": 5684, "epoch": 46} {"train_loss": -21.657217025756836, "global_step": 5685, "epoch": 46} {"train_loss": -21.264101627444433, "global_step": 5686, "epoch": 46, "val_loss": 3210622.0} {"train_loss": -22.110715866088867, "global_step": 5687, "epoch": 47} {"train_loss": -22.2615909576416, "global_step": 5688, "epoch": 47} {"train_loss": -22.193042755126953, "global_step": 5689, "epoch": 47} {"train_loss": -21.35205078125, "global_step": 5690, "epoch": 47} {"train_loss": -22.02400779724121, "global_step": 5691, "epoch": 47} {"train_loss": -22.11244010925293, "global_step": 5692, "epoch": 47} {"train_loss": -21.983083724975586, "global_step": 5693, "epoch": 47} {"train_loss": -22.153867721557617, "global_step": 5694, "epoch": 47} {"train_loss": -22.8153076171875, "global_step": 5695, "epoch": 47} {"train_loss": -22.281421661376953, "global_step": 5696, "epoch": 47} {"train_loss": -22.213224411010742, "global_step": 5697, "epoch": 47} {"train_loss": -22.332578659057617, "global_step": 5698, "epoch": 47} {"train_loss": -22.326019287109375, "global_step": 5699, "epoch": 47} {"train_loss": -22.290115356445312, "global_step": 5700, "epoch": 47} {"train_loss": -22.618242263793945, "global_step": 5701, "epoch": 47} {"train_loss": -22.06618309020996, "global_step": 5702, "epoch": 47} {"train_loss": -20.163818359375, "global_step": 5703, "epoch": 47} {"train_loss": -19.408475875854492, "global_step": 5704, "epoch": 47} {"train_loss": -20.572153091430664, "global_step": 5705, "epoch": 47} {"train_loss": -22.373517990112305, "global_step": 5706, "epoch": 47} {"train_loss": -21.297870635986328, "global_step": 5707, "epoch": 47} {"train_loss": -22.179183959960938, "global_step": 5708, "epoch": 47} {"train_loss": -21.451648712158203, "global_step": 5709, "epoch": 47} {"train_loss": -21.617340087890625, "global_step": 5710, "epoch": 47} {"train_loss": -20.30540657043457, "global_step": 5711, "epoch": 47} {"train_loss": -22.025388717651367, "global_step": 5712, "epoch": 47} {"train_loss": -21.734365463256836, "global_step": 5713, "epoch": 47} {"train_loss": -21.6058406829834, "global_step": 5714, "epoch": 47} {"train_loss": -21.018644332885742, "global_step": 5715, "epoch": 47} {"train_loss": -21.520631790161133, "global_step": 5716, "epoch": 47} {"train_loss": -21.86939811706543, "global_step": 5717, "epoch": 47} {"train_loss": -22.46393394470215, "global_step": 5718, "epoch": 47} {"train_loss": -21.95965576171875, "global_step": 5719, "epoch": 47} {"train_loss": -22.066282272338867, "global_step": 5720, "epoch": 47} {"train_loss": -22.010663986206055, "global_step": 5721, "epoch": 47} {"train_loss": -21.559783935546875, "global_step": 5722, "epoch": 47} {"train_loss": -21.732494354248047, "global_step": 5723, "epoch": 47} {"train_loss": -21.093006134033203, "global_step": 5724, "epoch": 47} {"train_loss": -21.28510093688965, "global_step": 5725, "epoch": 47} {"train_loss": -21.41594886779785, "global_step": 5726, "epoch": 47} {"train_loss": -21.116943359375, "global_step": 5727, "epoch": 47} {"train_loss": -21.79364585876465, "global_step": 5728, "epoch": 47} {"train_loss": -20.697956085205078, "global_step": 5729, "epoch": 47} {"train_loss": -20.365537643432617, "global_step": 5730, "epoch": 47} {"train_loss": -21.67384910583496, "global_step": 5731, "epoch": 47} {"train_loss": -21.782169342041016, "global_step": 5732, "epoch": 47} {"train_loss": -21.487150192260742, "global_step": 5733, "epoch": 47} {"train_loss": -21.958908081054688, "global_step": 5734, "epoch": 47} {"train_loss": -21.73016929626465, "global_step": 5735, "epoch": 47} {"train_loss": -21.85938835144043, "global_step": 5736, "epoch": 47} {"train_loss": -21.646034240722656, "global_step": 5737, "epoch": 47} {"train_loss": -21.83066177368164, "global_step": 5738, "epoch": 47} {"train_loss": -21.94413185119629, "global_step": 5739, "epoch": 47} {"train_loss": -21.767351150512695, "global_step": 5740, "epoch": 47} {"train_loss": -21.970699310302734, "global_step": 5741, "epoch": 47} {"train_loss": -21.84845733642578, "global_step": 5742, "epoch": 47} {"train_loss": -22.00681495666504, "global_step": 5743, "epoch": 47} {"train_loss": -22.194074630737305, "global_step": 5744, "epoch": 47} {"train_loss": -21.569734573364258, "global_step": 5745, "epoch": 47} {"train_loss": -22.413089752197266, "global_step": 5746, "epoch": 47} {"train_loss": -21.542316436767578, "global_step": 5747, "epoch": 47} {"train_loss": -21.751453399658203, "global_step": 5748, "epoch": 47} {"train_loss": -22.244054794311523, "global_step": 5749, "epoch": 47} {"train_loss": -22.456817626953125, "global_step": 5750, "epoch": 47} {"train_loss": -22.046510696411133, "global_step": 5751, "epoch": 47} {"train_loss": -22.438739776611328, "global_step": 5752, "epoch": 47} {"train_loss": -22.112241744995117, "global_step": 5753, "epoch": 47} {"train_loss": -21.9693660736084, "global_step": 5754, "epoch": 47} {"train_loss": -22.237287521362305, "global_step": 5755, "epoch": 47} {"train_loss": -22.64499282836914, "global_step": 5756, "epoch": 47} {"train_loss": -22.140766143798828, "global_step": 5757, "epoch": 47} {"train_loss": -22.283588409423828, "global_step": 5758, "epoch": 47} {"train_loss": -22.010366439819336, "global_step": 5759, "epoch": 47} {"train_loss": -21.654142379760742, "global_step": 5760, "epoch": 47} {"train_loss": -21.686491012573242, "global_step": 5761, "epoch": 47} {"train_loss": -21.03400230407715, "global_step": 5762, "epoch": 47} {"train_loss": -21.333576202392578, "global_step": 5763, "epoch": 47} {"train_loss": -20.74562644958496, "global_step": 5764, "epoch": 47} {"train_loss": -21.286901473999023, "global_step": 5765, "epoch": 47} {"train_loss": -21.925405502319336, "global_step": 5766, "epoch": 47} {"train_loss": -21.916522979736328, "global_step": 5767, "epoch": 47} {"train_loss": -21.6765079498291, "global_step": 5768, "epoch": 47} {"train_loss": -21.10675048828125, "global_step": 5769, "epoch": 47} {"train_loss": -22.232553482055664, "global_step": 5770, "epoch": 47} {"train_loss": -20.605703353881836, "global_step": 5771, "epoch": 47} {"train_loss": -20.98583984375, "global_step": 5772, "epoch": 47} {"train_loss": -21.17320442199707, "global_step": 5773, "epoch": 47} {"train_loss": -21.786855697631836, "global_step": 5774, "epoch": 47} {"train_loss": -21.006223678588867, "global_step": 5775, "epoch": 47} {"train_loss": -21.8597412109375, "global_step": 5776, "epoch": 47} {"train_loss": -20.94145965576172, "global_step": 5777, "epoch": 47} {"train_loss": -22.067636489868164, "global_step": 5778, "epoch": 47} {"train_loss": -21.088993072509766, "global_step": 5779, "epoch": 47} {"train_loss": -21.677642822265625, "global_step": 5780, "epoch": 47} {"train_loss": -21.571575164794922, "global_step": 5781, "epoch": 47} {"train_loss": -21.43937110900879, "global_step": 5782, "epoch": 47} {"train_loss": -21.904813766479492, "global_step": 5783, "epoch": 47} {"train_loss": -21.643396377563477, "global_step": 5784, "epoch": 47} {"train_loss": -21.5146427154541, "global_step": 5785, "epoch": 47} {"train_loss": -21.75625228881836, "global_step": 5786, "epoch": 47} {"train_loss": -22.028060913085938, "global_step": 5787, "epoch": 47} {"train_loss": -21.889755249023438, "global_step": 5788, "epoch": 47} {"train_loss": -21.5374755859375, "global_step": 5789, "epoch": 47} {"train_loss": -21.801679611206055, "global_step": 5790, "epoch": 47} {"train_loss": -22.10481071472168, "global_step": 5791, "epoch": 47} {"train_loss": -22.211658477783203, "global_step": 5792, "epoch": 47} {"train_loss": -21.86795425415039, "global_step": 5793, "epoch": 47} {"train_loss": -21.951505661010742, "global_step": 5794, "epoch": 47} {"train_loss": -21.725324630737305, "global_step": 5795, "epoch": 47} {"train_loss": -22.65078353881836, "global_step": 5796, "epoch": 47} {"train_loss": -22.06103515625, "global_step": 5797, "epoch": 47} {"train_loss": -22.389347076416016, "global_step": 5798, "epoch": 47} {"train_loss": -22.216657638549805, "global_step": 5799, "epoch": 47} {"train_loss": -21.319860458374023, "global_step": 5800, "epoch": 47} {"train_loss": -21.136093139648438, "global_step": 5801, "epoch": 47} {"train_loss": -21.34160804748535, "global_step": 5802, "epoch": 47} {"train_loss": -22.276504516601562, "global_step": 5803, "epoch": 47} {"train_loss": -21.258071899414062, "global_step": 5804, "epoch": 47} {"train_loss": -20.97063636779785, "global_step": 5805, "epoch": 47} {"train_loss": -20.244115829467773, "global_step": 5806, "epoch": 47} {"train_loss": -21.71214466252603, "global_step": 5807, "epoch": 47, "val_loss": 2584982.0} {"train_loss": -22.41470718383789, "global_step": 5808, "epoch": 48} {"train_loss": -21.554502487182617, "global_step": 5809, "epoch": 48} {"train_loss": -22.146589279174805, "global_step": 5810, "epoch": 48} {"train_loss": -21.634849548339844, "global_step": 5811, "epoch": 48} {"train_loss": -21.851150512695312, "global_step": 5812, "epoch": 48} {"train_loss": -21.886417388916016, "global_step": 5813, "epoch": 48} {"train_loss": -22.099130630493164, "global_step": 5814, "epoch": 48} {"train_loss": -21.879215240478516, "global_step": 5815, "epoch": 48} {"train_loss": -22.16837501525879, "global_step": 5816, "epoch": 48} {"train_loss": -21.745838165283203, "global_step": 5817, "epoch": 48} {"train_loss": -22.08100700378418, "global_step": 5818, "epoch": 48} {"train_loss": -22.1402587890625, "global_step": 5819, "epoch": 48} {"train_loss": -20.709476470947266, "global_step": 5820, "epoch": 48} {"train_loss": -19.132566452026367, "global_step": 5821, "epoch": 48} {"train_loss": -20.196395874023438, "global_step": 5822, "epoch": 48} {"train_loss": -18.76425552368164, "global_step": 5823, "epoch": 48} {"train_loss": -17.65641212463379, "global_step": 5824, "epoch": 48} {"train_loss": -18.90544319152832, "global_step": 5825, "epoch": 48} {"train_loss": -18.26578140258789, "global_step": 5826, "epoch": 48} {"train_loss": -19.0495662689209, "global_step": 5827, "epoch": 48} {"train_loss": -17.428646087646484, "global_step": 5828, "epoch": 48} {"train_loss": -20.100778579711914, "global_step": 5829, "epoch": 48} {"train_loss": -17.232351303100586, "global_step": 5830, "epoch": 48} {"train_loss": -19.161954879760742, "global_step": 5831, "epoch": 48} {"train_loss": -19.817768096923828, "global_step": 5832, "epoch": 48} {"train_loss": -18.622541427612305, "global_step": 5833, "epoch": 48} {"train_loss": -19.199909210205078, "global_step": 5834, "epoch": 48} {"train_loss": -19.06696319580078, "global_step": 5835, "epoch": 48} {"train_loss": -20.290395736694336, "global_step": 5836, "epoch": 48} {"train_loss": -19.811344146728516, "global_step": 5837, "epoch": 48} {"train_loss": -19.348779678344727, "global_step": 5838, "epoch": 48} {"train_loss": -19.954946517944336, "global_step": 5839, "epoch": 48} {"train_loss": -20.514570236206055, "global_step": 5840, "epoch": 48} {"train_loss": -19.514728546142578, "global_step": 5841, "epoch": 48} {"train_loss": -19.442445755004883, "global_step": 5842, "epoch": 48} {"train_loss": -20.35236358642578, "global_step": 5843, "epoch": 48} {"train_loss": -19.414960861206055, "global_step": 5844, "epoch": 48} {"train_loss": -20.039875030517578, "global_step": 5845, "epoch": 48} {"train_loss": -19.799894332885742, "global_step": 5846, "epoch": 48} {"train_loss": -20.473119735717773, "global_step": 5847, "epoch": 48} {"train_loss": -20.06736183166504, "global_step": 5848, "epoch": 48} {"train_loss": -20.60390281677246, "global_step": 5849, "epoch": 48} {"train_loss": -20.102323532104492, "global_step": 5850, "epoch": 48} {"train_loss": -20.32830810546875, "global_step": 5851, "epoch": 48} {"train_loss": -20.689815521240234, "global_step": 5852, "epoch": 48} {"train_loss": -20.59735107421875, "global_step": 5853, "epoch": 48} {"train_loss": -20.837751388549805, "global_step": 5854, "epoch": 48} {"train_loss": -20.805103302001953, "global_step": 5855, "epoch": 48} {"train_loss": -19.85422134399414, "global_step": 5856, "epoch": 48} {"train_loss": -20.460485458374023, "global_step": 5857, "epoch": 48} {"train_loss": -20.128599166870117, "global_step": 5858, "epoch": 48} {"train_loss": -19.931293487548828, "global_step": 5859, "epoch": 48} {"train_loss": -16.535306930541992, "global_step": 5860, "epoch": 48} {"train_loss": -12.275056838989258, "global_step": 5861, "epoch": 48} {"train_loss": -13.257895469665527, "global_step": 5862, "epoch": 48} {"train_loss": -20.156047821044922, "global_step": 5863, "epoch": 48} {"train_loss": -14.941370010375977, "global_step": 5864, "epoch": 48} {"train_loss": -18.715944290161133, "global_step": 5865, "epoch": 48} {"train_loss": -18.919214248657227, "global_step": 5866, "epoch": 48} {"train_loss": -18.006662368774414, "global_step": 5867, "epoch": 48} {"train_loss": -19.141454696655273, "global_step": 5868, "epoch": 48} {"train_loss": -19.462543487548828, "global_step": 5869, "epoch": 48} {"train_loss": -19.24068260192871, "global_step": 5870, "epoch": 48} {"train_loss": -18.90546989440918, "global_step": 5871, "epoch": 48} {"train_loss": -19.381675720214844, "global_step": 5872, "epoch": 48} {"train_loss": -19.4158878326416, "global_step": 5873, "epoch": 48} {"train_loss": -19.0031795501709, "global_step": 5874, "epoch": 48} {"train_loss": -19.81524658203125, "global_step": 5875, "epoch": 48} {"train_loss": -19.410593032836914, "global_step": 5876, "epoch": 48} {"train_loss": -18.846681594848633, "global_step": 5877, "epoch": 48} {"train_loss": -19.723554611206055, "global_step": 5878, "epoch": 48} {"train_loss": -19.60329818725586, "global_step": 5879, "epoch": 48} {"train_loss": -19.206806182861328, "global_step": 5880, "epoch": 48} {"train_loss": -19.8253231048584, "global_step": 5881, "epoch": 48} {"train_loss": -19.4271240234375, "global_step": 5882, "epoch": 48} {"train_loss": -19.593603134155273, "global_step": 5883, "epoch": 48} {"train_loss": -19.717565536499023, "global_step": 5884, "epoch": 48} {"train_loss": -20.116729736328125, "global_step": 5885, "epoch": 48} {"train_loss": -20.12430763244629, "global_step": 5886, "epoch": 48} {"train_loss": -20.11495018005371, "global_step": 5887, "epoch": 48} {"train_loss": -19.977741241455078, "global_step": 5888, "epoch": 48} {"train_loss": -20.292037963867188, "global_step": 5889, "epoch": 48} {"train_loss": -19.964256286621094, "global_step": 5890, "epoch": 48} {"train_loss": -19.9390869140625, "global_step": 5891, "epoch": 48} {"train_loss": -20.166561126708984, "global_step": 5892, "epoch": 48} {"train_loss": -20.089712142944336, "global_step": 5893, "epoch": 48} {"train_loss": -20.761932373046875, "global_step": 5894, "epoch": 48} {"train_loss": -20.73709487915039, "global_step": 5895, "epoch": 48} {"train_loss": -20.418989181518555, "global_step": 5896, "epoch": 48} {"train_loss": -20.923328399658203, "global_step": 5897, "epoch": 48} {"train_loss": -20.876972198486328, "global_step": 5898, "epoch": 48} {"train_loss": -20.643123626708984, "global_step": 5899, "epoch": 48} {"train_loss": -20.56247901916504, "global_step": 5900, "epoch": 48} {"train_loss": -20.772756576538086, "global_step": 5901, "epoch": 48} {"train_loss": -20.824596405029297, "global_step": 5902, "epoch": 48} {"train_loss": -21.051393508911133, "global_step": 5903, "epoch": 48} {"train_loss": -20.502437591552734, "global_step": 5904, "epoch": 48} {"train_loss": -21.516857147216797, "global_step": 5905, "epoch": 48} {"train_loss": -20.512998580932617, "global_step": 5906, "epoch": 48} {"train_loss": -21.152769088745117, "global_step": 5907, "epoch": 48} {"train_loss": -21.07901382446289, "global_step": 5908, "epoch": 48} {"train_loss": -21.32275390625, "global_step": 5909, "epoch": 48} {"train_loss": -21.084177017211914, "global_step": 5910, "epoch": 48} {"train_loss": -21.095727920532227, "global_step": 5911, "epoch": 48} {"train_loss": -21.651023864746094, "global_step": 5912, "epoch": 48} {"train_loss": -21.387983322143555, "global_step": 5913, "epoch": 48} {"train_loss": -21.803125381469727, "global_step": 5914, "epoch": 48} {"train_loss": -21.820608139038086, "global_step": 5915, "epoch": 48} {"train_loss": -21.378835678100586, "global_step": 5916, "epoch": 48} {"train_loss": -21.122949600219727, "global_step": 5917, "epoch": 48} {"train_loss": -21.6087703704834, "global_step": 5918, "epoch": 48} {"train_loss": -21.141143798828125, "global_step": 5919, "epoch": 48} {"train_loss": -21.28652000427246, "global_step": 5920, "epoch": 48} {"train_loss": -21.527402877807617, "global_step": 5921, "epoch": 48} {"train_loss": -20.474546432495117, "global_step": 5922, "epoch": 48} {"train_loss": -20.884374618530273, "global_step": 5923, "epoch": 48} {"train_loss": -21.21524429321289, "global_step": 5924, "epoch": 48} {"train_loss": -19.67128562927246, "global_step": 5925, "epoch": 48} {"train_loss": -18.026443481445312, "global_step": 5926, "epoch": 48} {"train_loss": -19.575769424438477, "global_step": 5927, "epoch": 48} {"train_loss": -20.03673951487896, "global_step": 5928, "epoch": 48, "val_loss": 2485016.75} {"train_loss": -19.994062423706055, "global_step": 5929, "epoch": 49} {"train_loss": -20.58394432067871, "global_step": 5930, "epoch": 49} {"train_loss": -20.275989532470703, "global_step": 5931, "epoch": 49} {"train_loss": -21.232391357421875, "global_step": 5932, "epoch": 49} {"train_loss": -20.435083389282227, "global_step": 5933, "epoch": 49} {"train_loss": -20.911670684814453, "global_step": 5934, "epoch": 49} {"train_loss": -20.896638870239258, "global_step": 5935, "epoch": 49} {"train_loss": -20.67593765258789, "global_step": 5936, "epoch": 49} {"train_loss": -20.26240348815918, "global_step": 5937, "epoch": 49} {"train_loss": -21.46401023864746, "global_step": 5938, "epoch": 49} {"train_loss": -20.973926544189453, "global_step": 5939, "epoch": 49} {"train_loss": -21.349843978881836, "global_step": 5940, "epoch": 49} {"train_loss": -20.853239059448242, "global_step": 5941, "epoch": 49} {"train_loss": -20.79309844970703, "global_step": 5942, "epoch": 49} {"train_loss": -21.066186904907227, "global_step": 5943, "epoch": 49} {"train_loss": -20.55852699279785, "global_step": 5944, "epoch": 49} {"train_loss": -19.15828514099121, "global_step": 5945, "epoch": 49} {"train_loss": -15.080195426940918, "global_step": 5946, "epoch": 49} {"train_loss": -20.81654167175293, "global_step": 5947, "epoch": 49} {"train_loss": -17.09889030456543, "global_step": 5948, "epoch": 49} {"train_loss": -19.333555221557617, "global_step": 5949, "epoch": 49} {"train_loss": -19.380517959594727, "global_step": 5950, "epoch": 49} {"train_loss": -20.924760818481445, "global_step": 5951, "epoch": 49} {"train_loss": -20.452829360961914, "global_step": 5952, "epoch": 49} {"train_loss": -21.247329711914062, "global_step": 5953, "epoch": 49} {"train_loss": -20.315902709960938, "global_step": 5954, "epoch": 49} {"train_loss": -20.957462310791016, "global_step": 5955, "epoch": 49} {"train_loss": -21.03822135925293, "global_step": 5956, "epoch": 49} {"train_loss": -20.70584487915039, "global_step": 5957, "epoch": 49} {"train_loss": -20.541715621948242, "global_step": 5958, "epoch": 49} {"train_loss": -20.984970092773438, "global_step": 5959, "epoch": 49} {"train_loss": -20.902057647705078, "global_step": 5960, "epoch": 49} {"train_loss": -21.181386947631836, "global_step": 5961, "epoch": 49} {"train_loss": -21.10410499572754, "global_step": 5962, "epoch": 49} {"train_loss": -19.813465118408203, "global_step": 5963, "epoch": 49} {"train_loss": -21.091585159301758, "global_step": 5964, "epoch": 49} {"train_loss": -20.887454986572266, "global_step": 5965, "epoch": 49} {"train_loss": -21.072555541992188, "global_step": 5966, "epoch": 49} {"train_loss": -21.459524154663086, "global_step": 5967, "epoch": 49} {"train_loss": -21.675432205200195, "global_step": 5968, "epoch": 49} {"train_loss": -21.434572219848633, "global_step": 5969, "epoch": 49} {"train_loss": -21.10856819152832, "global_step": 5970, "epoch": 49} {"train_loss": -21.257795333862305, "global_step": 5971, "epoch": 49} {"train_loss": -21.44900894165039, "global_step": 5972, "epoch": 49} {"train_loss": -21.54398536682129, "global_step": 5973, "epoch": 49} {"train_loss": -21.552309036254883, "global_step": 5974, "epoch": 49} {"train_loss": -21.48400115966797, "global_step": 5975, "epoch": 49} {"train_loss": -21.271997451782227, "global_step": 5976, "epoch": 49} {"train_loss": -21.126483917236328, "global_step": 5977, "epoch": 49} {"train_loss": -21.255956649780273, "global_step": 5978, "epoch": 49} {"train_loss": -20.4913387298584, "global_step": 5979, "epoch": 49} {"train_loss": -19.608808517456055, "global_step": 5980, "epoch": 49} {"train_loss": -20.37029457092285, "global_step": 5981, "epoch": 49} {"train_loss": -20.83841896057129, "global_step": 5982, "epoch": 49} {"train_loss": -21.47673988342285, "global_step": 5983, "epoch": 49} {"train_loss": -20.48610496520996, "global_step": 5984, "epoch": 49} {"train_loss": -21.565364837646484, "global_step": 5985, "epoch": 49} {"train_loss": -21.035755157470703, "global_step": 5986, "epoch": 49} {"train_loss": -21.725217819213867, "global_step": 5987, "epoch": 49} {"train_loss": -21.133634567260742, "global_step": 5988, "epoch": 49} {"train_loss": -21.546710968017578, "global_step": 5989, "epoch": 49} {"train_loss": -21.391603469848633, "global_step": 5990, "epoch": 49} {"train_loss": -21.233613967895508, "global_step": 5991, "epoch": 49} {"train_loss": -21.429101943969727, "global_step": 5992, "epoch": 49} {"train_loss": -21.261920928955078, "global_step": 5993, "epoch": 49} {"train_loss": -21.35951805114746, "global_step": 5994, "epoch": 49} {"train_loss": -21.243457794189453, "global_step": 5995, "epoch": 49} {"train_loss": -21.024494171142578, "global_step": 5996, "epoch": 49} {"train_loss": -20.583332061767578, "global_step": 5997, "epoch": 49} {"train_loss": -19.1315975189209, "global_step": 5998, "epoch": 49} {"train_loss": -19.17013168334961, "global_step": 5999, "epoch": 49} {"train_loss": -20.900766372680664, "global_step": 6000, "epoch": 49} {"train_loss": -21.65506362915039, "global_step": 6001, "epoch": 49} {"train_loss": -20.671142578125, "global_step": 6002, "epoch": 49} {"train_loss": -21.582136154174805, "global_step": 6003, "epoch": 49} {"train_loss": -21.886178970336914, "global_step": 6004, "epoch": 49} {"train_loss": -21.823745727539062, "global_step": 6005, "epoch": 49} {"train_loss": -21.995311737060547, "global_step": 6006, "epoch": 49} {"train_loss": -21.419950485229492, "global_step": 6007, "epoch": 49} {"train_loss": -21.11588478088379, "global_step": 6008, "epoch": 49} {"train_loss": -19.140348434448242, "global_step": 6009, "epoch": 49} {"train_loss": -21.298906326293945, "global_step": 6010, "epoch": 49} {"train_loss": -19.88134765625, "global_step": 6011, "epoch": 49} {"train_loss": -21.27047348022461, "global_step": 6012, "epoch": 49} {"train_loss": -21.213764190673828, "global_step": 6013, "epoch": 49} {"train_loss": -21.248437881469727, "global_step": 6014, "epoch": 49} {"train_loss": -21.49985694885254, "global_step": 6015, "epoch": 49} {"train_loss": -21.552263259887695, "global_step": 6016, "epoch": 49} {"train_loss": -21.65839958190918, "global_step": 6017, "epoch": 49} {"train_loss": -21.944753646850586, "global_step": 6018, "epoch": 49} {"train_loss": -21.307361602783203, "global_step": 6019, "epoch": 49} {"train_loss": -21.468015670776367, "global_step": 6020, "epoch": 49} {"train_loss": -20.702665328979492, "global_step": 6021, "epoch": 49} {"train_loss": -21.21648597717285, "global_step": 6022, "epoch": 49} {"train_loss": -20.678804397583008, "global_step": 6023, "epoch": 49} {"train_loss": -21.283655166625977, "global_step": 6024, "epoch": 49} {"train_loss": -21.445457458496094, "global_step": 6025, "epoch": 49} {"train_loss": -22.148324966430664, "global_step": 6026, "epoch": 49} {"train_loss": -21.178842544555664, "global_step": 6027, "epoch": 49} {"train_loss": -20.4533748626709, "global_step": 6028, "epoch": 49} {"train_loss": -21.516637802124023, "global_step": 6029, "epoch": 49} {"train_loss": -21.69622230529785, "global_step": 6030, "epoch": 49} {"train_loss": -20.544422149658203, "global_step": 6031, "epoch": 49} {"train_loss": -21.44083023071289, "global_step": 6032, "epoch": 49} {"train_loss": -20.67837142944336, "global_step": 6033, "epoch": 49} {"train_loss": -20.865877151489258, "global_step": 6034, "epoch": 49} {"train_loss": -19.806705474853516, "global_step": 6035, "epoch": 49} {"train_loss": -21.1153564453125, "global_step": 6036, "epoch": 49} {"train_loss": -20.85233497619629, "global_step": 6037, "epoch": 49} {"train_loss": -21.44780158996582, "global_step": 6038, "epoch": 49} {"train_loss": -20.69660758972168, "global_step": 6039, "epoch": 49} {"train_loss": -21.815021514892578, "global_step": 6040, "epoch": 49} {"train_loss": -21.15425682067871, "global_step": 6041, "epoch": 49} {"train_loss": -21.753768920898438, "global_step": 6042, "epoch": 49} {"train_loss": -21.327932357788086, "global_step": 6043, "epoch": 49} {"train_loss": -22.045211791992188, "global_step": 6044, "epoch": 49} {"train_loss": -21.667264938354492, "global_step": 6045, "epoch": 49} {"train_loss": -21.094228744506836, "global_step": 6046, "epoch": 49} {"train_loss": -21.615604400634766, "global_step": 6047, "epoch": 49} {"train_loss": -21.70918083190918, "global_step": 6048, "epoch": 49} {"train_loss": -20.935787429494304, "global_step": 6049, "epoch": 49, "val_loss": 2217632.5} {"train_loss": -21.80582618713379, "global_step": 6050, "epoch": 50} {"train_loss": -22.27967071533203, "global_step": 6051, "epoch": 50} {"train_loss": -22.11292839050293, "global_step": 6052, "epoch": 50} {"train_loss": -21.673236846923828, "global_step": 6053, "epoch": 50} {"train_loss": -22.17568016052246, "global_step": 6054, "epoch": 50} {"train_loss": -21.631574630737305, "global_step": 6055, "epoch": 50} {"train_loss": -22.149805068969727, "global_step": 6056, "epoch": 50} {"train_loss": -22.335451126098633, "global_step": 6057, "epoch": 50} {"train_loss": -22.272930145263672, "global_step": 6058, "epoch": 50} {"train_loss": -21.984437942504883, "global_step": 6059, "epoch": 50} {"train_loss": -22.261205673217773, "global_step": 6060, "epoch": 50} {"train_loss": -21.7115535736084, "global_step": 6061, "epoch": 50} {"train_loss": -22.035093307495117, "global_step": 6062, "epoch": 50} {"train_loss": -21.76300621032715, "global_step": 6063, "epoch": 50} {"train_loss": -21.960716247558594, "global_step": 6064, "epoch": 50} {"train_loss": -22.572206497192383, "global_step": 6065, "epoch": 50} {"train_loss": -22.87872886657715, "global_step": 6066, "epoch": 50} {"train_loss": -22.08346939086914, "global_step": 6067, "epoch": 50} {"train_loss": -19.39460563659668, "global_step": 6068, "epoch": 50} {"train_loss": -14.141532897949219, "global_step": 6069, "epoch": 50} {"train_loss": -15.151091575622559, "global_step": 6070, "epoch": 50} {"train_loss": -21.286636352539062, "global_step": 6071, "epoch": 50} {"train_loss": -16.3084659576416, "global_step": 6072, "epoch": 50} {"train_loss": -19.703184127807617, "global_step": 6073, "epoch": 50} {"train_loss": -19.760385513305664, "global_step": 6074, "epoch": 50} {"train_loss": -20.062358856201172, "global_step": 6075, "epoch": 50} {"train_loss": -20.067434310913086, "global_step": 6076, "epoch": 50} {"train_loss": -21.204641342163086, "global_step": 6077, "epoch": 50} {"train_loss": -20.171916961669922, "global_step": 6078, "epoch": 50} {"train_loss": -21.307981491088867, "global_step": 6079, "epoch": 50} {"train_loss": -21.374441146850586, "global_step": 6080, "epoch": 50} {"train_loss": -20.562532424926758, "global_step": 6081, "epoch": 50} {"train_loss": -21.191246032714844, "global_step": 6082, "epoch": 50} {"train_loss": -20.301237106323242, "global_step": 6083, "epoch": 50} {"train_loss": -20.699735641479492, "global_step": 6084, "epoch": 50} {"train_loss": -20.4871883392334, "global_step": 6085, "epoch": 50} {"train_loss": -19.4678955078125, "global_step": 6086, "epoch": 50} {"train_loss": -20.98064422607422, "global_step": 6087, "epoch": 50} {"train_loss": -19.56512451171875, "global_step": 6088, "epoch": 50} {"train_loss": -21.265893936157227, "global_step": 6089, "epoch": 50} {"train_loss": -20.60902976989746, "global_step": 6090, "epoch": 50} {"train_loss": -21.044347763061523, "global_step": 6091, "epoch": 50} {"train_loss": -21.26763343811035, "global_step": 6092, "epoch": 50} {"train_loss": -21.116764068603516, "global_step": 6093, "epoch": 50} {"train_loss": -21.15223503112793, "global_step": 6094, "epoch": 50} {"train_loss": -21.26311683654785, "global_step": 6095, "epoch": 50} {"train_loss": -21.2766056060791, "global_step": 6096, "epoch": 50} {"train_loss": -21.461612701416016, "global_step": 6097, "epoch": 50} {"train_loss": -21.406015396118164, "global_step": 6098, "epoch": 50} {"train_loss": -21.614295959472656, "global_step": 6099, "epoch": 50} {"train_loss": -21.72171401977539, "global_step": 6100, "epoch": 50} {"train_loss": -21.49831199645996, "global_step": 6101, "epoch": 50} {"train_loss": -21.36707878112793, "global_step": 6102, "epoch": 50} {"train_loss": -21.530221939086914, "global_step": 6103, "epoch": 50} {"train_loss": -21.658838272094727, "global_step": 6104, "epoch": 50} {"train_loss": -21.716188430786133, "global_step": 6105, "epoch": 50} {"train_loss": -21.808914184570312, "global_step": 6106, "epoch": 50} {"train_loss": -21.261831283569336, "global_step": 6107, "epoch": 50} {"train_loss": -21.730520248413086, "global_step": 6108, "epoch": 50} {"train_loss": -21.532079696655273, "global_step": 6109, "epoch": 50} {"train_loss": -21.611467361450195, "global_step": 6110, "epoch": 50} {"train_loss": -21.796558380126953, "global_step": 6111, "epoch": 50} {"train_loss": -22.05036163330078, "global_step": 6112, "epoch": 50} {"train_loss": -22.00029945373535, "global_step": 6113, "epoch": 50} {"train_loss": -22.096975326538086, "global_step": 6114, "epoch": 50} {"train_loss": -22.237024307250977, "global_step": 6115, "epoch": 50} {"train_loss": -21.914321899414062, "global_step": 6116, "epoch": 50} {"train_loss": -21.9101505279541, "global_step": 6117, "epoch": 50} {"train_loss": -22.2250919342041, "global_step": 6118, "epoch": 50} {"train_loss": -21.99812126159668, "global_step": 6119, "epoch": 50} {"train_loss": -22.545475006103516, "global_step": 6120, "epoch": 50} {"train_loss": -22.48833656311035, "global_step": 6121, "epoch": 50} {"train_loss": -22.626466751098633, "global_step": 6122, "epoch": 50} {"train_loss": -21.980056762695312, "global_step": 6123, "epoch": 50} {"train_loss": -22.41104507446289, "global_step": 6124, "epoch": 50} {"train_loss": -22.466215133666992, "global_step": 6125, "epoch": 50} {"train_loss": -22.561447143554688, "global_step": 6126, "epoch": 50} {"train_loss": -22.611440658569336, "global_step": 6127, "epoch": 50} {"train_loss": -22.55668067932129, "global_step": 6128, "epoch": 50} {"train_loss": -22.666086196899414, "global_step": 6129, "epoch": 50} {"train_loss": -22.86318016052246, "global_step": 6130, "epoch": 50} {"train_loss": -23.2928409576416, "global_step": 6131, "epoch": 50} {"train_loss": -23.03477668762207, "global_step": 6132, "epoch": 50} {"train_loss": -22.617849349975586, "global_step": 6133, "epoch": 50} {"train_loss": -21.547794342041016, "global_step": 6134, "epoch": 50} {"train_loss": -19.02205467224121, "global_step": 6135, "epoch": 50} {"train_loss": -14.41844654083252, "global_step": 6136, "epoch": 50} {"train_loss": -15.62548542022705, "global_step": 6137, "epoch": 50} {"train_loss": -18.964019775390625, "global_step": 6138, "epoch": 50} {"train_loss": -20.041715621948242, "global_step": 6139, "epoch": 50} {"train_loss": -20.154638290405273, "global_step": 6140, "epoch": 50} {"train_loss": -20.13958740234375, "global_step": 6141, "epoch": 50} {"train_loss": -21.850391387939453, "global_step": 6142, "epoch": 50} {"train_loss": -20.532217025756836, "global_step": 6143, "epoch": 50} {"train_loss": -20.131017684936523, "global_step": 6144, "epoch": 50} {"train_loss": -20.476648330688477, "global_step": 6145, "epoch": 50} {"train_loss": -21.670202255249023, "global_step": 6146, "epoch": 50} {"train_loss": -20.81833839416504, "global_step": 6147, "epoch": 50} {"train_loss": -21.063701629638672, "global_step": 6148, "epoch": 50} {"train_loss": -20.64444351196289, "global_step": 6149, "epoch": 50} {"train_loss": -21.31066131591797, "global_step": 6150, "epoch": 50} {"train_loss": -20.420652389526367, "global_step": 6151, "epoch": 50} {"train_loss": -21.01381492614746, "global_step": 6152, "epoch": 50} {"train_loss": -20.53097152709961, "global_step": 6153, "epoch": 50} {"train_loss": -19.99249839782715, "global_step": 6154, "epoch": 50} {"train_loss": -21.563989639282227, "global_step": 6155, "epoch": 50} {"train_loss": -20.676321029663086, "global_step": 6156, "epoch": 50} {"train_loss": -20.56336212158203, "global_step": 6157, "epoch": 50} {"train_loss": -21.20978355407715, "global_step": 6158, "epoch": 50} {"train_loss": -20.926633834838867, "global_step": 6159, "epoch": 50} {"train_loss": -20.82244873046875, "global_step": 6160, "epoch": 50} {"train_loss": -21.01008415222168, "global_step": 6161, "epoch": 50} {"train_loss": -20.7167911529541, "global_step": 6162, "epoch": 50} {"train_loss": -21.241540908813477, "global_step": 6163, "epoch": 50} {"train_loss": -21.29332733154297, "global_step": 6164, "epoch": 50} {"train_loss": -21.215152740478516, "global_step": 6165, "epoch": 50} {"train_loss": -21.481245040893555, "global_step": 6166, "epoch": 50} {"train_loss": -21.786752700805664, "global_step": 6167, "epoch": 50} {"train_loss": -21.367856979370117, "global_step": 6168, "epoch": 50} {"train_loss": -21.714157104492188, "global_step": 6169, "epoch": 50} {"train_loss": -21.128131275334635, "global_step": 6170, "epoch": 50, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 3274971.75} {"train_loss": -21.244977951049805, "global_step": 6171, "epoch": 51} {"train_loss": -21.344404220581055, "global_step": 6172, "epoch": 51} {"train_loss": -21.697795867919922, "global_step": 6173, "epoch": 51} {"train_loss": -21.487699508666992, "global_step": 6174, "epoch": 51} {"train_loss": -21.763416290283203, "global_step": 6175, "epoch": 51} {"train_loss": -22.185089111328125, "global_step": 6176, "epoch": 51} {"train_loss": -21.968244552612305, "global_step": 6177, "epoch": 51} {"train_loss": -21.9542293548584, "global_step": 6178, "epoch": 51} {"train_loss": -21.89259910583496, "global_step": 6179, "epoch": 51} {"train_loss": -21.807580947875977, "global_step": 6180, "epoch": 51} {"train_loss": -22.41783332824707, "global_step": 6181, "epoch": 51} {"train_loss": -21.667932510375977, "global_step": 6182, "epoch": 51} {"train_loss": -22.110368728637695, "global_step": 6183, "epoch": 51} {"train_loss": -22.519672393798828, "global_step": 6184, "epoch": 51} {"train_loss": -21.870075225830078, "global_step": 6185, "epoch": 51} {"train_loss": -22.024961471557617, "global_step": 6186, "epoch": 51} {"train_loss": -21.986419677734375, "global_step": 6187, "epoch": 51} {"train_loss": -21.971832275390625, "global_step": 6188, "epoch": 51} {"train_loss": -22.220401763916016, "global_step": 6189, "epoch": 51} {"train_loss": -22.211679458618164, "global_step": 6190, "epoch": 51} {"train_loss": -22.256994247436523, "global_step": 6191, "epoch": 51} {"train_loss": -21.977075576782227, "global_step": 6192, "epoch": 51} {"train_loss": -21.85158920288086, "global_step": 6193, "epoch": 51} {"train_loss": -22.148046493530273, "global_step": 6194, "epoch": 51} {"train_loss": -21.77393341064453, "global_step": 6195, "epoch": 51} {"train_loss": -22.409589767456055, "global_step": 6196, "epoch": 51} {"train_loss": -22.7543888092041, "global_step": 6197, "epoch": 51} {"train_loss": -22.8695068359375, "global_step": 6198, "epoch": 51} {"train_loss": -22.07223129272461, "global_step": 6199, "epoch": 51} {"train_loss": -22.665760040283203, "global_step": 6200, "epoch": 51} {"train_loss": -22.686790466308594, "global_step": 6201, "epoch": 51} {"train_loss": -21.57216453552246, "global_step": 6202, "epoch": 51} {"train_loss": -23.2490291595459, "global_step": 6203, "epoch": 51} {"train_loss": -22.395458221435547, "global_step": 6204, "epoch": 51} {"train_loss": -22.266891479492188, "global_step": 6205, "epoch": 51} {"train_loss": -22.678647994995117, "global_step": 6206, "epoch": 51} {"train_loss": -22.48396110534668, "global_step": 6207, "epoch": 51} {"train_loss": -22.387304306030273, "global_step": 6208, "epoch": 51} {"train_loss": -22.25096893310547, "global_step": 6209, "epoch": 51} {"train_loss": -22.425552368164062, "global_step": 6210, "epoch": 51} {"train_loss": -22.55696678161621, "global_step": 6211, "epoch": 51} {"train_loss": -22.457265853881836, "global_step": 6212, "epoch": 51} {"train_loss": -22.488937377929688, "global_step": 6213, "epoch": 51} {"train_loss": -22.515209197998047, "global_step": 6214, "epoch": 51} {"train_loss": -22.42963218688965, "global_step": 6215, "epoch": 51} {"train_loss": -22.47891616821289, "global_step": 6216, "epoch": 51} {"train_loss": -22.109161376953125, "global_step": 6217, "epoch": 51} {"train_loss": -22.889345169067383, "global_step": 6218, "epoch": 51} {"train_loss": -22.598834991455078, "global_step": 6219, "epoch": 51} {"train_loss": -21.56271743774414, "global_step": 6220, "epoch": 51} {"train_loss": -22.298120498657227, "global_step": 6221, "epoch": 51} {"train_loss": -22.596237182617188, "global_step": 6222, "epoch": 51} {"train_loss": -22.81903076171875, "global_step": 6223, "epoch": 51} {"train_loss": -22.480350494384766, "global_step": 6224, "epoch": 51} {"train_loss": -22.950101852416992, "global_step": 6225, "epoch": 51} {"train_loss": -22.745512008666992, "global_step": 6226, "epoch": 51} {"train_loss": -22.53359031677246, "global_step": 6227, "epoch": 51} {"train_loss": -22.606678009033203, "global_step": 6228, "epoch": 51} {"train_loss": -22.656906127929688, "global_step": 6229, "epoch": 51} {"train_loss": -22.454763412475586, "global_step": 6230, "epoch": 51} {"train_loss": -22.489532470703125, "global_step": 6231, "epoch": 51} {"train_loss": -22.694461822509766, "global_step": 6232, "epoch": 51} {"train_loss": -22.414121627807617, "global_step": 6233, "epoch": 51} {"train_loss": -23.268686294555664, "global_step": 6234, "epoch": 51} {"train_loss": -22.5755672454834, "global_step": 6235, "epoch": 51} {"train_loss": -23.086851119995117, "global_step": 6236, "epoch": 51} {"train_loss": -22.613208770751953, "global_step": 6237, "epoch": 51} {"train_loss": -21.452320098876953, "global_step": 6238, "epoch": 51} {"train_loss": -21.40480613708496, "global_step": 6239, "epoch": 51} {"train_loss": -22.096111297607422, "global_step": 6240, "epoch": 51} {"train_loss": -20.21049690246582, "global_step": 6241, "epoch": 51} {"train_loss": -22.6795597076416, "global_step": 6242, "epoch": 51} {"train_loss": -21.544605255126953, "global_step": 6243, "epoch": 51} {"train_loss": -21.21156120300293, "global_step": 6244, "epoch": 51} {"train_loss": -22.431127548217773, "global_step": 6245, "epoch": 51} {"train_loss": -21.040313720703125, "global_step": 6246, "epoch": 51} {"train_loss": -22.008243560791016, "global_step": 6247, "epoch": 51} {"train_loss": -22.439105987548828, "global_step": 6248, "epoch": 51} {"train_loss": -21.411643981933594, "global_step": 6249, "epoch": 51} {"train_loss": -22.54115104675293, "global_step": 6250, "epoch": 51} {"train_loss": -21.13275146484375, "global_step": 6251, "epoch": 51} {"train_loss": -22.504764556884766, "global_step": 6252, "epoch": 51} {"train_loss": -21.918609619140625, "global_step": 6253, "epoch": 51} {"train_loss": -22.62564468383789, "global_step": 6254, "epoch": 51} {"train_loss": -22.13032341003418, "global_step": 6255, "epoch": 51} {"train_loss": -21.878311157226562, "global_step": 6256, "epoch": 51} {"train_loss": -22.482934951782227, "global_step": 6257, "epoch": 51} {"train_loss": -22.672346115112305, "global_step": 6258, "epoch": 51} {"train_loss": -22.735414505004883, "global_step": 6259, "epoch": 51} {"train_loss": -22.88765525817871, "global_step": 6260, "epoch": 51} {"train_loss": -22.25025177001953, "global_step": 6261, "epoch": 51} {"train_loss": -22.303619384765625, "global_step": 6262, "epoch": 51} {"train_loss": -22.452030181884766, "global_step": 6263, "epoch": 51} {"train_loss": -22.210084915161133, "global_step": 6264, "epoch": 51} {"train_loss": -22.648666381835938, "global_step": 6265, "epoch": 51} {"train_loss": -22.85059356689453, "global_step": 6266, "epoch": 51} {"train_loss": -22.210905075073242, "global_step": 6267, "epoch": 51} {"train_loss": -22.5584716796875, "global_step": 6268, "epoch": 51} {"train_loss": -22.58049964904785, "global_step": 6269, "epoch": 51} {"train_loss": -22.885986328125, "global_step": 6270, "epoch": 51} {"train_loss": -22.74329948425293, "global_step": 6271, "epoch": 51} {"train_loss": -22.889354705810547, "global_step": 6272, "epoch": 51} {"train_loss": -22.21026611328125, "global_step": 6273, "epoch": 51} {"train_loss": -22.811424255371094, "global_step": 6274, "epoch": 51} {"train_loss": -22.602123260498047, "global_step": 6275, "epoch": 51} {"train_loss": -22.42108154296875, "global_step": 6276, "epoch": 51} {"train_loss": -23.264738082885742, "global_step": 6277, "epoch": 51} {"train_loss": -22.97885513305664, "global_step": 6278, "epoch": 51} {"train_loss": -23.071739196777344, "global_step": 6279, "epoch": 51} {"train_loss": -23.20528793334961, "global_step": 6280, "epoch": 51} {"train_loss": -22.75245475769043, "global_step": 6281, "epoch": 51} {"train_loss": -22.936185836791992, "global_step": 6282, "epoch": 51} {"train_loss": -22.71822166442871, "global_step": 6283, "epoch": 51} {"train_loss": -22.910924911499023, "global_step": 6284, "epoch": 51} {"train_loss": -22.776975631713867, "global_step": 6285, "epoch": 51} {"train_loss": -22.320295333862305, "global_step": 6286, "epoch": 51} {"train_loss": -22.7025089263916, "global_step": 6287, "epoch": 51} {"train_loss": -21.82843589782715, "global_step": 6288, "epoch": 51} {"train_loss": -21.53553581237793, "global_step": 6289, "epoch": 51} {"train_loss": -18.956212997436523, "global_step": 6290, "epoch": 51} {"train_loss": -22.26923208000246, "global_step": 6291, "epoch": 51, "val_loss": 2926661.0} {"train_loss": -21.386005401611328, "global_step": 6292, "epoch": 52} {"train_loss": -22.0548152923584, "global_step": 6293, "epoch": 52} {"train_loss": -21.513654708862305, "global_step": 6294, "epoch": 52} {"train_loss": -22.296781539916992, "global_step": 6295, "epoch": 52} {"train_loss": -21.448631286621094, "global_step": 6296, "epoch": 52} {"train_loss": -22.582887649536133, "global_step": 6297, "epoch": 52} {"train_loss": -22.026161193847656, "global_step": 6298, "epoch": 52} {"train_loss": -22.32643699645996, "global_step": 6299, "epoch": 52} {"train_loss": -22.217575073242188, "global_step": 6300, "epoch": 52} {"train_loss": -21.947553634643555, "global_step": 6301, "epoch": 52} {"train_loss": -21.66892433166504, "global_step": 6302, "epoch": 52} {"train_loss": -22.31361198425293, "global_step": 6303, "epoch": 52} {"train_loss": -22.328245162963867, "global_step": 6304, "epoch": 52} {"train_loss": -22.16375160217285, "global_step": 6305, "epoch": 52} {"train_loss": -22.29376792907715, "global_step": 6306, "epoch": 52} {"train_loss": -22.02029800415039, "global_step": 6307, "epoch": 52} {"train_loss": -22.29371452331543, "global_step": 6308, "epoch": 52} {"train_loss": -22.10269546508789, "global_step": 6309, "epoch": 52} {"train_loss": -22.108251571655273, "global_step": 6310, "epoch": 52} {"train_loss": -22.614185333251953, "global_step": 6311, "epoch": 52} {"train_loss": -22.480201721191406, "global_step": 6312, "epoch": 52} {"train_loss": -22.365680694580078, "global_step": 6313, "epoch": 52} {"train_loss": -22.19901466369629, "global_step": 6314, "epoch": 52} {"train_loss": -22.72823143005371, "global_step": 6315, "epoch": 52} {"train_loss": -21.791370391845703, "global_step": 6316, "epoch": 52} {"train_loss": -22.523242950439453, "global_step": 6317, "epoch": 52} {"train_loss": -22.4128475189209, "global_step": 6318, "epoch": 52} {"train_loss": -22.630325317382812, "global_step": 6319, "epoch": 52} {"train_loss": -22.575916290283203, "global_step": 6320, "epoch": 52} {"train_loss": -22.400114059448242, "global_step": 6321, "epoch": 52} {"train_loss": -22.99800682067871, "global_step": 6322, "epoch": 52} {"train_loss": -22.481992721557617, "global_step": 6323, "epoch": 52} {"train_loss": -22.032651901245117, "global_step": 6324, "epoch": 52} {"train_loss": -22.8489933013916, "global_step": 6325, "epoch": 52} {"train_loss": -22.260168075561523, "global_step": 6326, "epoch": 52} {"train_loss": -21.80609130859375, "global_step": 6327, "epoch": 52} {"train_loss": -20.788532257080078, "global_step": 6328, "epoch": 52} {"train_loss": -21.71187400817871, "global_step": 6329, "epoch": 52} {"train_loss": -22.35800552368164, "global_step": 6330, "epoch": 52} {"train_loss": -22.291748046875, "global_step": 6331, "epoch": 52} {"train_loss": -19.57538604736328, "global_step": 6332, "epoch": 52} {"train_loss": -19.492834091186523, "global_step": 6333, "epoch": 52} {"train_loss": -20.93526268005371, "global_step": 6334, "epoch": 52} {"train_loss": -22.124929428100586, "global_step": 6335, "epoch": 52} {"train_loss": -20.763036727905273, "global_step": 6336, "epoch": 52} {"train_loss": -22.310503005981445, "global_step": 6337, "epoch": 52} {"train_loss": -21.291208267211914, "global_step": 6338, "epoch": 52} {"train_loss": -22.171030044555664, "global_step": 6339, "epoch": 52} {"train_loss": -21.574920654296875, "global_step": 6340, "epoch": 52} {"train_loss": -21.79435157775879, "global_step": 6341, "epoch": 52} {"train_loss": -21.872119903564453, "global_step": 6342, "epoch": 52} {"train_loss": -21.96210479736328, "global_step": 6343, "epoch": 52} {"train_loss": -22.17365837097168, "global_step": 6344, "epoch": 52} {"train_loss": -22.17518424987793, "global_step": 6345, "epoch": 52} {"train_loss": -22.05929946899414, "global_step": 6346, "epoch": 52} {"train_loss": -22.217636108398438, "global_step": 6347, "epoch": 52} {"train_loss": -22.12513542175293, "global_step": 6348, "epoch": 52} {"train_loss": -22.208810806274414, "global_step": 6349, "epoch": 52} {"train_loss": -21.915441513061523, "global_step": 6350, "epoch": 52} {"train_loss": -22.068950653076172, "global_step": 6351, "epoch": 52} {"train_loss": -21.940109252929688, "global_step": 6352, "epoch": 52} {"train_loss": -21.977445602416992, "global_step": 6353, "epoch": 52} {"train_loss": -22.087493896484375, "global_step": 6354, "epoch": 52} {"train_loss": -21.911794662475586, "global_step": 6355, "epoch": 52} {"train_loss": -22.413002014160156, "global_step": 6356, "epoch": 52} {"train_loss": -21.730337142944336, "global_step": 6357, "epoch": 52} {"train_loss": -22.10785484313965, "global_step": 6358, "epoch": 52} {"train_loss": -22.06838035583496, "global_step": 6359, "epoch": 52} {"train_loss": -22.267202377319336, "global_step": 6360, "epoch": 52} {"train_loss": -22.400358200073242, "global_step": 6361, "epoch": 52} {"train_loss": -22.33833122253418, "global_step": 6362, "epoch": 52} {"train_loss": -22.140966415405273, "global_step": 6363, "epoch": 52} {"train_loss": -21.99386215209961, "global_step": 6364, "epoch": 52} {"train_loss": -21.95479393005371, "global_step": 6365, "epoch": 52} {"train_loss": -22.9392147064209, "global_step": 6366, "epoch": 52} {"train_loss": -22.47124481201172, "global_step": 6367, "epoch": 52} {"train_loss": -22.37164306640625, "global_step": 6368, "epoch": 52} {"train_loss": -22.7591495513916, "global_step": 6369, "epoch": 52} {"train_loss": -22.219999313354492, "global_step": 6370, "epoch": 52} {"train_loss": -22.329875946044922, "global_step": 6371, "epoch": 52} {"train_loss": -22.75727653503418, "global_step": 6372, "epoch": 52} {"train_loss": -21.890554428100586, "global_step": 6373, "epoch": 52} {"train_loss": -22.34930992126465, "global_step": 6374, "epoch": 52} {"train_loss": -22.637056350708008, "global_step": 6375, "epoch": 52} {"train_loss": -22.95298194885254, "global_step": 6376, "epoch": 52} {"train_loss": -22.29629898071289, "global_step": 6377, "epoch": 52} {"train_loss": -22.766569137573242, "global_step": 6378, "epoch": 52} {"train_loss": -23.206899642944336, "global_step": 6379, "epoch": 52} {"train_loss": -22.10611343383789, "global_step": 6380, "epoch": 52} {"train_loss": -23.114667892456055, "global_step": 6381, "epoch": 52} {"train_loss": -22.591337203979492, "global_step": 6382, "epoch": 52} {"train_loss": -22.700326919555664, "global_step": 6383, "epoch": 52} {"train_loss": -22.33669090270996, "global_step": 6384, "epoch": 52} {"train_loss": -22.806203842163086, "global_step": 6385, "epoch": 52} {"train_loss": -22.0036678314209, "global_step": 6386, "epoch": 52} {"train_loss": -22.203184127807617, "global_step": 6387, "epoch": 52} {"train_loss": -22.4658203125, "global_step": 6388, "epoch": 52} {"train_loss": -22.220090866088867, "global_step": 6389, "epoch": 52} {"train_loss": -22.437549591064453, "global_step": 6390, "epoch": 52} {"train_loss": -22.607206344604492, "global_step": 6391, "epoch": 52} {"train_loss": -22.391897201538086, "global_step": 6392, "epoch": 52} {"train_loss": -22.06155776977539, "global_step": 6393, "epoch": 52} {"train_loss": -22.686384201049805, "global_step": 6394, "epoch": 52} {"train_loss": -22.05755615234375, "global_step": 6395, "epoch": 52} {"train_loss": -21.66054344177246, "global_step": 6396, "epoch": 52} {"train_loss": -22.138032913208008, "global_step": 6397, "epoch": 52} {"train_loss": -22.657140731811523, "global_step": 6398, "epoch": 52} {"train_loss": -22.652029037475586, "global_step": 6399, "epoch": 52} {"train_loss": -21.76042938232422, "global_step": 6400, "epoch": 52} {"train_loss": -22.2399845123291, "global_step": 6401, "epoch": 52} {"train_loss": -21.861572265625, "global_step": 6402, "epoch": 52} {"train_loss": -21.902236938476562, "global_step": 6403, "epoch": 52} {"train_loss": -20.8553466796875, "global_step": 6404, "epoch": 52} {"train_loss": -21.747106552124023, "global_step": 6405, "epoch": 52} {"train_loss": -22.50887107849121, "global_step": 6406, "epoch": 52} {"train_loss": -21.42830467224121, "global_step": 6407, "epoch": 52} {"train_loss": -21.927661895751953, "global_step": 6408, "epoch": 52} {"train_loss": -22.215932846069336, "global_step": 6409, "epoch": 52} {"train_loss": -22.439809799194336, "global_step": 6410, "epoch": 52} {"train_loss": -22.5648136138916, "global_step": 6411, "epoch": 52} {"train_loss": -22.134424966228895, "global_step": 6412, "epoch": 52, "val_loss": 3553093.25} {"train_loss": -22.27344512939453, "global_step": 6413, "epoch": 53} {"train_loss": -21.962270736694336, "global_step": 6414, "epoch": 53} {"train_loss": -22.371410369873047, "global_step": 6415, "epoch": 53} {"train_loss": -21.6570987701416, "global_step": 6416, "epoch": 53} {"train_loss": -22.40447425842285, "global_step": 6417, "epoch": 53} {"train_loss": -21.5894832611084, "global_step": 6418, "epoch": 53} {"train_loss": -21.911611557006836, "global_step": 6419, "epoch": 53} {"train_loss": -21.965051651000977, "global_step": 6420, "epoch": 53} {"train_loss": -22.310327529907227, "global_step": 6421, "epoch": 53} {"train_loss": -22.558202743530273, "global_step": 6422, "epoch": 53} {"train_loss": -22.468994140625, "global_step": 6423, "epoch": 53} {"train_loss": -22.834857940673828, "global_step": 6424, "epoch": 53} {"train_loss": -22.228437423706055, "global_step": 6425, "epoch": 53} {"train_loss": -22.490110397338867, "global_step": 6426, "epoch": 53} {"train_loss": -22.823932647705078, "global_step": 6427, "epoch": 53} {"train_loss": -22.650733947753906, "global_step": 6428, "epoch": 53} {"train_loss": -22.769943237304688, "global_step": 6429, "epoch": 53} {"train_loss": -22.4637508392334, "global_step": 6430, "epoch": 53} {"train_loss": -22.772930145263672, "global_step": 6431, "epoch": 53} {"train_loss": -22.734914779663086, "global_step": 6432, "epoch": 53} {"train_loss": -22.845144271850586, "global_step": 6433, "epoch": 53} {"train_loss": -23.152114868164062, "global_step": 6434, "epoch": 53} {"train_loss": -22.810073852539062, "global_step": 6435, "epoch": 53} {"train_loss": -23.182209014892578, "global_step": 6436, "epoch": 53} {"train_loss": -22.653087615966797, "global_step": 6437, "epoch": 53} {"train_loss": -23.0736141204834, "global_step": 6438, "epoch": 53} {"train_loss": -23.270700454711914, "global_step": 6439, "epoch": 53} {"train_loss": -23.328733444213867, "global_step": 6440, "epoch": 53} {"train_loss": -22.678085327148438, "global_step": 6441, "epoch": 53} {"train_loss": -21.491125106811523, "global_step": 6442, "epoch": 53} {"train_loss": -21.546396255493164, "global_step": 6443, "epoch": 53} {"train_loss": -22.924957275390625, "global_step": 6444, "epoch": 53} {"train_loss": -23.06270408630371, "global_step": 6445, "epoch": 53} {"train_loss": -21.112064361572266, "global_step": 6446, "epoch": 53} {"train_loss": -22.058502197265625, "global_step": 6447, "epoch": 53} {"train_loss": -22.991119384765625, "global_step": 6448, "epoch": 53} {"train_loss": -22.320072174072266, "global_step": 6449, "epoch": 53} {"train_loss": -23.39372444152832, "global_step": 6450, "epoch": 53} {"train_loss": -22.77446174621582, "global_step": 6451, "epoch": 53} {"train_loss": -23.26563835144043, "global_step": 6452, "epoch": 53} {"train_loss": -21.101205825805664, "global_step": 6453, "epoch": 53} {"train_loss": -20.868854522705078, "global_step": 6454, "epoch": 53} {"train_loss": -22.22547721862793, "global_step": 6455, "epoch": 53} {"train_loss": -22.381839752197266, "global_step": 6456, "epoch": 53} {"train_loss": -21.996259689331055, "global_step": 6457, "epoch": 53} {"train_loss": -22.154447555541992, "global_step": 6458, "epoch": 53} {"train_loss": -22.104299545288086, "global_step": 6459, "epoch": 53} {"train_loss": -22.601409912109375, "global_step": 6460, "epoch": 53} {"train_loss": -21.45002555847168, "global_step": 6461, "epoch": 53} {"train_loss": -22.558210372924805, "global_step": 6462, "epoch": 53} {"train_loss": -22.35426139831543, "global_step": 6463, "epoch": 53} {"train_loss": -21.338918685913086, "global_step": 6464, "epoch": 53} {"train_loss": -21.965051651000977, "global_step": 6465, "epoch": 53} {"train_loss": -21.832839965820312, "global_step": 6466, "epoch": 53} {"train_loss": -22.6442928314209, "global_step": 6467, "epoch": 53} {"train_loss": -22.57713508605957, "global_step": 6468, "epoch": 53} {"train_loss": -21.244047164916992, "global_step": 6469, "epoch": 53} {"train_loss": -21.906604766845703, "global_step": 6470, "epoch": 53} {"train_loss": -21.73162269592285, "global_step": 6471, "epoch": 53} {"train_loss": -21.824556350708008, "global_step": 6472, "epoch": 53} {"train_loss": -21.5757999420166, "global_step": 6473, "epoch": 53} {"train_loss": -22.428281784057617, "global_step": 6474, "epoch": 53} {"train_loss": -22.164226531982422, "global_step": 6475, "epoch": 53} {"train_loss": -21.582887649536133, "global_step": 6476, "epoch": 53} {"train_loss": -22.185426712036133, "global_step": 6477, "epoch": 53} {"train_loss": -22.171039581298828, "global_step": 6478, "epoch": 53} {"train_loss": -22.03528594970703, "global_step": 6479, "epoch": 53} {"train_loss": -21.9310302734375, "global_step": 6480, "epoch": 53} {"train_loss": -22.40015983581543, "global_step": 6481, "epoch": 53} {"train_loss": -22.59747886657715, "global_step": 6482, "epoch": 53} {"train_loss": -22.4373836517334, "global_step": 6483, "epoch": 53} {"train_loss": -22.654850006103516, "global_step": 6484, "epoch": 53} {"train_loss": -22.748577117919922, "global_step": 6485, "epoch": 53} {"train_loss": -22.739906311035156, "global_step": 6486, "epoch": 53} {"train_loss": -22.5102596282959, "global_step": 6487, "epoch": 53} {"train_loss": -22.644895553588867, "global_step": 6488, "epoch": 53} {"train_loss": -23.37490463256836, "global_step": 6489, "epoch": 53} {"train_loss": -23.043073654174805, "global_step": 6490, "epoch": 53} {"train_loss": -23.277830123901367, "global_step": 6491, "epoch": 53} {"train_loss": -22.67224884033203, "global_step": 6492, "epoch": 53} {"train_loss": -22.737295150756836, "global_step": 6493, "epoch": 53} {"train_loss": -23.004928588867188, "global_step": 6494, "epoch": 53} {"train_loss": -23.163217544555664, "global_step": 6495, "epoch": 53} {"train_loss": -22.94430923461914, "global_step": 6496, "epoch": 53} {"train_loss": -22.806766510009766, "global_step": 6497, "epoch": 53} {"train_loss": -22.825153350830078, "global_step": 6498, "epoch": 53} {"train_loss": -22.418949127197266, "global_step": 6499, "epoch": 53} {"train_loss": -22.21790885925293, "global_step": 6500, "epoch": 53} {"train_loss": -23.534433364868164, "global_step": 6501, "epoch": 53} {"train_loss": -23.038976669311523, "global_step": 6502, "epoch": 53} {"train_loss": -23.077041625976562, "global_step": 6503, "epoch": 53} {"train_loss": -22.37715721130371, "global_step": 6504, "epoch": 53} {"train_loss": -22.298995971679688, "global_step": 6505, "epoch": 53} {"train_loss": -22.003751754760742, "global_step": 6506, "epoch": 53} {"train_loss": -21.051645278930664, "global_step": 6507, "epoch": 53} {"train_loss": -17.83846092224121, "global_step": 6508, "epoch": 53} {"train_loss": -20.475555419921875, "global_step": 6509, "epoch": 53} {"train_loss": -22.687347412109375, "global_step": 6510, "epoch": 53} {"train_loss": -20.92989158630371, "global_step": 6511, "epoch": 53} {"train_loss": -22.19462013244629, "global_step": 6512, "epoch": 53} {"train_loss": -20.686002731323242, "global_step": 6513, "epoch": 53} {"train_loss": -22.503524780273438, "global_step": 6514, "epoch": 53} {"train_loss": -20.967483520507812, "global_step": 6515, "epoch": 53} {"train_loss": -22.141138076782227, "global_step": 6516, "epoch": 53} {"train_loss": -22.366113662719727, "global_step": 6517, "epoch": 53} {"train_loss": -21.979806900024414, "global_step": 6518, "epoch": 53} {"train_loss": -22.703954696655273, "global_step": 6519, "epoch": 53} {"train_loss": -22.2609806060791, "global_step": 6520, "epoch": 53} {"train_loss": -22.46270179748535, "global_step": 6521, "epoch": 53} {"train_loss": -22.63897132873535, "global_step": 6522, "epoch": 53} {"train_loss": -22.699565887451172, "global_step": 6523, "epoch": 53} {"train_loss": -22.87544059753418, "global_step": 6524, "epoch": 53} {"train_loss": -21.932846069335938, "global_step": 6525, "epoch": 53} {"train_loss": -22.311079025268555, "global_step": 6526, "epoch": 53} {"train_loss": -22.329442977905273, "global_step": 6527, "epoch": 53} {"train_loss": -22.63138771057129, "global_step": 6528, "epoch": 53} {"train_loss": -22.421857833862305, "global_step": 6529, "epoch": 53} {"train_loss": -22.4379940032959, "global_step": 6530, "epoch": 53} {"train_loss": -22.433950424194336, "global_step": 6531, "epoch": 53} {"train_loss": -22.534564971923828, "global_step": 6532, "epoch": 53} {"train_loss": -22.31769260690232, "global_step": 6533, "epoch": 53, "val_loss": 3846682.0} {"train_loss": -22.31504249572754, "global_step": 6534, "epoch": 54} {"train_loss": -22.85358238220215, "global_step": 6535, "epoch": 54} {"train_loss": -22.529211044311523, "global_step": 6536, "epoch": 54} {"train_loss": -22.15065574645996, "global_step": 6537, "epoch": 54} {"train_loss": -22.523136138916016, "global_step": 6538, "epoch": 54} {"train_loss": -22.62898826599121, "global_step": 6539, "epoch": 54} {"train_loss": -20.789915084838867, "global_step": 6540, "epoch": 54} {"train_loss": -19.994400024414062, "global_step": 6541, "epoch": 54} {"train_loss": -21.08755874633789, "global_step": 6542, "epoch": 54} {"train_loss": -21.816823959350586, "global_step": 6543, "epoch": 54} {"train_loss": -22.12063217163086, "global_step": 6544, "epoch": 54} {"train_loss": -21.633930206298828, "global_step": 6545, "epoch": 54} {"train_loss": -22.537616729736328, "global_step": 6546, "epoch": 54} {"train_loss": -22.2138729095459, "global_step": 6547, "epoch": 54} {"train_loss": -21.929975509643555, "global_step": 6548, "epoch": 54} {"train_loss": -22.60811424255371, "global_step": 6549, "epoch": 54} {"train_loss": -21.97555923461914, "global_step": 6550, "epoch": 54} {"train_loss": -21.749509811401367, "global_step": 6551, "epoch": 54} {"train_loss": -21.830738067626953, "global_step": 6552, "epoch": 54} {"train_loss": -22.778186798095703, "global_step": 6553, "epoch": 54} {"train_loss": -22.17586898803711, "global_step": 6554, "epoch": 54} {"train_loss": -22.365232467651367, "global_step": 6555, "epoch": 54} {"train_loss": -21.865497589111328, "global_step": 6556, "epoch": 54} {"train_loss": -21.750410079956055, "global_step": 6557, "epoch": 54} {"train_loss": -22.33694076538086, "global_step": 6558, "epoch": 54} {"train_loss": -22.745258331298828, "global_step": 6559, "epoch": 54} {"train_loss": -22.3262939453125, "global_step": 6560, "epoch": 54} {"train_loss": -22.191307067871094, "global_step": 6561, "epoch": 54} {"train_loss": -22.45747184753418, "global_step": 6562, "epoch": 54} {"train_loss": -21.782777786254883, "global_step": 6563, "epoch": 54} {"train_loss": -22.71486473083496, "global_step": 6564, "epoch": 54} {"train_loss": -22.990175247192383, "global_step": 6565, "epoch": 54} {"train_loss": -22.050336837768555, "global_step": 6566, "epoch": 54} {"train_loss": -23.11513900756836, "global_step": 6567, "epoch": 54} {"train_loss": -22.83774185180664, "global_step": 6568, "epoch": 54} {"train_loss": -23.219772338867188, "global_step": 6569, "epoch": 54} {"train_loss": -22.782024383544922, "global_step": 6570, "epoch": 54} {"train_loss": -22.888830184936523, "global_step": 6571, "epoch": 54} {"train_loss": -22.931005477905273, "global_step": 6572, "epoch": 54} {"train_loss": -23.1340274810791, "global_step": 6573, "epoch": 54} {"train_loss": -22.736663818359375, "global_step": 6574, "epoch": 54} {"train_loss": -22.64558982849121, "global_step": 6575, "epoch": 54} {"train_loss": -22.695556640625, "global_step": 6576, "epoch": 54} {"train_loss": -22.564289093017578, "global_step": 6577, "epoch": 54} {"train_loss": -21.962133407592773, "global_step": 6578, "epoch": 54} {"train_loss": -18.606767654418945, "global_step": 6579, "epoch": 54} {"train_loss": -17.275569915771484, "global_step": 6580, "epoch": 54} {"train_loss": -20.316625595092773, "global_step": 6581, "epoch": 54} {"train_loss": -22.919940948486328, "global_step": 6582, "epoch": 54} {"train_loss": -21.85866355895996, "global_step": 6583, "epoch": 54} {"train_loss": -21.939128875732422, "global_step": 6584, "epoch": 54} {"train_loss": -22.672849655151367, "global_step": 6585, "epoch": 54} {"train_loss": -21.751220703125, "global_step": 6586, "epoch": 54} {"train_loss": -22.214786529541016, "global_step": 6587, "epoch": 54} {"train_loss": -22.531837463378906, "global_step": 6588, "epoch": 54} {"train_loss": -21.9353084564209, "global_step": 6589, "epoch": 54} {"train_loss": -22.064355850219727, "global_step": 6590, "epoch": 54} {"train_loss": -22.14727210998535, "global_step": 6591, "epoch": 54} {"train_loss": -22.119443893432617, "global_step": 6592, "epoch": 54} {"train_loss": -22.33042335510254, "global_step": 6593, "epoch": 54} {"train_loss": -22.205162048339844, "global_step": 6594, "epoch": 54} {"train_loss": -22.30472183227539, "global_step": 6595, "epoch": 54} {"train_loss": -22.58348274230957, "global_step": 6596, "epoch": 54} {"train_loss": -22.040313720703125, "global_step": 6597, "epoch": 54} {"train_loss": -22.025970458984375, "global_step": 6598, "epoch": 54} {"train_loss": -21.39270782470703, "global_step": 6599, "epoch": 54} {"train_loss": -22.42418670654297, "global_step": 6600, "epoch": 54} {"train_loss": -21.65485954284668, "global_step": 6601, "epoch": 54} {"train_loss": -20.340927124023438, "global_step": 6602, "epoch": 54} {"train_loss": -21.54722785949707, "global_step": 6603, "epoch": 54} {"train_loss": -21.92310333251953, "global_step": 6604, "epoch": 54} {"train_loss": -22.001333236694336, "global_step": 6605, "epoch": 54} {"train_loss": -21.77005958557129, "global_step": 6606, "epoch": 54} {"train_loss": -22.09699058532715, "global_step": 6607, "epoch": 54} {"train_loss": -22.671844482421875, "global_step": 6608, "epoch": 54} {"train_loss": -22.483938217163086, "global_step": 6609, "epoch": 54} {"train_loss": -22.783788681030273, "global_step": 6610, "epoch": 54} {"train_loss": -22.209165573120117, "global_step": 6611, "epoch": 54} {"train_loss": -22.08251953125, "global_step": 6612, "epoch": 54} {"train_loss": -22.800519943237305, "global_step": 6613, "epoch": 54} {"train_loss": -22.345714569091797, "global_step": 6614, "epoch": 54} {"train_loss": -22.732940673828125, "global_step": 6615, "epoch": 54} {"train_loss": -22.258420944213867, "global_step": 6616, "epoch": 54} {"train_loss": -22.14698600769043, "global_step": 6617, "epoch": 54} {"train_loss": -22.89821434020996, "global_step": 6618, "epoch": 54} {"train_loss": -22.723236083984375, "global_step": 6619, "epoch": 54} {"train_loss": -22.864395141601562, "global_step": 6620, "epoch": 54} {"train_loss": -22.317203521728516, "global_step": 6621, "epoch": 54} {"train_loss": -22.907535552978516, "global_step": 6622, "epoch": 54} {"train_loss": -22.01944923400879, "global_step": 6623, "epoch": 54} {"train_loss": -22.666385650634766, "global_step": 6624, "epoch": 54} {"train_loss": -22.81841468811035, "global_step": 6625, "epoch": 54} {"train_loss": -22.219985961914062, "global_step": 6626, "epoch": 54} {"train_loss": -21.75234603881836, "global_step": 6627, "epoch": 54} {"train_loss": -22.194461822509766, "global_step": 6628, "epoch": 54} {"train_loss": -22.7889461517334, "global_step": 6629, "epoch": 54} {"train_loss": -22.778371810913086, "global_step": 6630, "epoch": 54} {"train_loss": -22.73009490966797, "global_step": 6631, "epoch": 54} {"train_loss": -22.447919845581055, "global_step": 6632, "epoch": 54} {"train_loss": -23.595476150512695, "global_step": 6633, "epoch": 54} {"train_loss": -23.089200973510742, "global_step": 6634, "epoch": 54} {"train_loss": -22.959238052368164, "global_step": 6635, "epoch": 54} {"train_loss": -22.675413131713867, "global_step": 6636, "epoch": 54} {"train_loss": -22.97053337097168, "global_step": 6637, "epoch": 54} {"train_loss": -23.151708602905273, "global_step": 6638, "epoch": 54} {"train_loss": -22.880247116088867, "global_step": 6639, "epoch": 54} {"train_loss": -22.07246971130371, "global_step": 6640, "epoch": 54} {"train_loss": -21.47180938720703, "global_step": 6641, "epoch": 54} {"train_loss": -22.66403579711914, "global_step": 6642, "epoch": 54} {"train_loss": -22.46797752380371, "global_step": 6643, "epoch": 54} {"train_loss": -23.135711669921875, "global_step": 6644, "epoch": 54} {"train_loss": -22.617313385009766, "global_step": 6645, "epoch": 54} {"train_loss": -22.764806747436523, "global_step": 6646, "epoch": 54} {"train_loss": -23.316181182861328, "global_step": 6647, "epoch": 54} {"train_loss": -22.66668128967285, "global_step": 6648, "epoch": 54} {"train_loss": -23.154743194580078, "global_step": 6649, "epoch": 54} {"train_loss": -22.533416748046875, "global_step": 6650, "epoch": 54} {"train_loss": -21.856382369995117, "global_step": 6651, "epoch": 54} {"train_loss": -23.171131134033203, "global_step": 6652, "epoch": 54} {"train_loss": -22.479583740234375, "global_step": 6653, "epoch": 54} {"train_loss": -22.280221261268807, "global_step": 6654, "epoch": 54, "val_loss": 3021748.0} {"train_loss": -22.694364547729492, "global_step": 6655, "epoch": 55} {"train_loss": -22.846811294555664, "global_step": 6656, "epoch": 55} {"train_loss": -23.08832359313965, "global_step": 6657, "epoch": 55} {"train_loss": -22.620214462280273, "global_step": 6658, "epoch": 55} {"train_loss": -22.868833541870117, "global_step": 6659, "epoch": 55} {"train_loss": -22.898921966552734, "global_step": 6660, "epoch": 55} {"train_loss": -22.580114364624023, "global_step": 6661, "epoch": 55} {"train_loss": -23.068695068359375, "global_step": 6662, "epoch": 55} {"train_loss": -22.792770385742188, "global_step": 6663, "epoch": 55} {"train_loss": -22.453092575073242, "global_step": 6664, "epoch": 55} {"train_loss": -22.106260299682617, "global_step": 6665, "epoch": 55} {"train_loss": -21.843921661376953, "global_step": 6666, "epoch": 55} {"train_loss": -22.884675979614258, "global_step": 6667, "epoch": 55} {"train_loss": -21.977191925048828, "global_step": 6668, "epoch": 55} {"train_loss": -21.613815307617188, "global_step": 6669, "epoch": 55} {"train_loss": -22.416540145874023, "global_step": 6670, "epoch": 55} {"train_loss": -22.72383689880371, "global_step": 6671, "epoch": 55} {"train_loss": -22.572755813598633, "global_step": 6672, "epoch": 55} {"train_loss": -22.00021743774414, "global_step": 6673, "epoch": 55} {"train_loss": -22.887699127197266, "global_step": 6674, "epoch": 55} {"train_loss": -22.767057418823242, "global_step": 6675, "epoch": 55} {"train_loss": -21.470205307006836, "global_step": 6676, "epoch": 55} {"train_loss": -22.856321334838867, "global_step": 6677, "epoch": 55} {"train_loss": -22.116851806640625, "global_step": 6678, "epoch": 55} {"train_loss": -22.16534996032715, "global_step": 6679, "epoch": 55} {"train_loss": -22.308584213256836, "global_step": 6680, "epoch": 55} {"train_loss": -22.638111114501953, "global_step": 6681, "epoch": 55} {"train_loss": -21.91292381286621, "global_step": 6682, "epoch": 55} {"train_loss": -21.954538345336914, "global_step": 6683, "epoch": 55} {"train_loss": -20.61081314086914, "global_step": 6684, "epoch": 55} {"train_loss": -22.782257080078125, "global_step": 6685, "epoch": 55} {"train_loss": -22.819482803344727, "global_step": 6686, "epoch": 55} {"train_loss": -22.176437377929688, "global_step": 6687, "epoch": 55} {"train_loss": -22.677305221557617, "global_step": 6688, "epoch": 55} {"train_loss": -22.414169311523438, "global_step": 6689, "epoch": 55} {"train_loss": -22.452112197875977, "global_step": 6690, "epoch": 55} {"train_loss": -22.421077728271484, "global_step": 6691, "epoch": 55} {"train_loss": -22.577009201049805, "global_step": 6692, "epoch": 55} {"train_loss": -23.02829933166504, "global_step": 6693, "epoch": 55} {"train_loss": -22.25394058227539, "global_step": 6694, "epoch": 55} {"train_loss": -22.82033920288086, "global_step": 6695, "epoch": 55} {"train_loss": -22.792743682861328, "global_step": 6696, "epoch": 55} {"train_loss": -22.794275283813477, "global_step": 6697, "epoch": 55} {"train_loss": -22.748300552368164, "global_step": 6698, "epoch": 55} {"train_loss": -22.86283302307129, "global_step": 6699, "epoch": 55} {"train_loss": -22.978246688842773, "global_step": 6700, "epoch": 55} {"train_loss": -22.60914421081543, "global_step": 6701, "epoch": 55} {"train_loss": -22.910688400268555, "global_step": 6702, "epoch": 55} {"train_loss": -22.8986873626709, "global_step": 6703, "epoch": 55} {"train_loss": -23.0743350982666, "global_step": 6704, "epoch": 55} {"train_loss": -22.656492233276367, "global_step": 6705, "epoch": 55} {"train_loss": -22.442174911499023, "global_step": 6706, "epoch": 55} {"train_loss": -22.62761116027832, "global_step": 6707, "epoch": 55} {"train_loss": -23.401559829711914, "global_step": 6708, "epoch": 55} {"train_loss": -22.94561195373535, "global_step": 6709, "epoch": 55} {"train_loss": -22.34353256225586, "global_step": 6710, "epoch": 55} {"train_loss": -22.550025939941406, "global_step": 6711, "epoch": 55} {"train_loss": -22.876876831054688, "global_step": 6712, "epoch": 55} {"train_loss": -22.84662437438965, "global_step": 6713, "epoch": 55} {"train_loss": -21.522459030151367, "global_step": 6714, "epoch": 55} {"train_loss": -22.254653930664062, "global_step": 6715, "epoch": 55} {"train_loss": -22.873273849487305, "global_step": 6716, "epoch": 55} {"train_loss": -22.17671012878418, "global_step": 6717, "epoch": 55} {"train_loss": -22.38094139099121, "global_step": 6718, "epoch": 55} {"train_loss": -23.121212005615234, "global_step": 6719, "epoch": 55} {"train_loss": -22.368316650390625, "global_step": 6720, "epoch": 55} {"train_loss": -23.329816818237305, "global_step": 6721, "epoch": 55} {"train_loss": -22.36671257019043, "global_step": 6722, "epoch": 55} {"train_loss": -22.64270782470703, "global_step": 6723, "epoch": 55} {"train_loss": -22.549306869506836, "global_step": 6724, "epoch": 55} {"train_loss": -22.503286361694336, "global_step": 6725, "epoch": 55} {"train_loss": -22.52901268005371, "global_step": 6726, "epoch": 55} {"train_loss": -22.50975227355957, "global_step": 6727, "epoch": 55} {"train_loss": -22.87330436706543, "global_step": 6728, "epoch": 55} {"train_loss": -22.509841918945312, "global_step": 6729, "epoch": 55} {"train_loss": -22.714527130126953, "global_step": 6730, "epoch": 55} {"train_loss": -23.301837921142578, "global_step": 6731, "epoch": 55} {"train_loss": -22.935033798217773, "global_step": 6732, "epoch": 55} {"train_loss": -22.94160270690918, "global_step": 6733, "epoch": 55} {"train_loss": -23.461896896362305, "global_step": 6734, "epoch": 55} {"train_loss": -22.995315551757812, "global_step": 6735, "epoch": 55} {"train_loss": -23.25956153869629, "global_step": 6736, "epoch": 55} {"train_loss": -23.330982208251953, "global_step": 6737, "epoch": 55} {"train_loss": -23.050418853759766, "global_step": 6738, "epoch": 55} {"train_loss": -23.232892990112305, "global_step": 6739, "epoch": 55} {"train_loss": -23.252397537231445, "global_step": 6740, "epoch": 55} {"train_loss": -23.732114791870117, "global_step": 6741, "epoch": 55} {"train_loss": -22.910961151123047, "global_step": 6742, "epoch": 55} {"train_loss": -22.25431251525879, "global_step": 6743, "epoch": 55} {"train_loss": -19.64896583557129, "global_step": 6744, "epoch": 55} {"train_loss": -21.84406852722168, "global_step": 6745, "epoch": 55} {"train_loss": -23.046781539916992, "global_step": 6746, "epoch": 55} {"train_loss": -21.296754837036133, "global_step": 6747, "epoch": 55} {"train_loss": -22.754682540893555, "global_step": 6748, "epoch": 55} {"train_loss": -21.70697593688965, "global_step": 6749, "epoch": 55} {"train_loss": -21.208595275878906, "global_step": 6750, "epoch": 55} {"train_loss": -20.203351974487305, "global_step": 6751, "epoch": 55} {"train_loss": -21.770109176635742, "global_step": 6752, "epoch": 55} {"train_loss": -22.27484703063965, "global_step": 6753, "epoch": 55} {"train_loss": -21.704450607299805, "global_step": 6754, "epoch": 55} {"train_loss": -22.46558952331543, "global_step": 6755, "epoch": 55} {"train_loss": -22.191604614257812, "global_step": 6756, "epoch": 55} {"train_loss": -22.213478088378906, "global_step": 6757, "epoch": 55} {"train_loss": -22.566936492919922, "global_step": 6758, "epoch": 55} {"train_loss": -22.49506187438965, "global_step": 6759, "epoch": 55} {"train_loss": -22.077619552612305, "global_step": 6760, "epoch": 55} {"train_loss": -22.15976333618164, "global_step": 6761, "epoch": 55} {"train_loss": -22.234434127807617, "global_step": 6762, "epoch": 55} {"train_loss": -22.011693954467773, "global_step": 6763, "epoch": 55} {"train_loss": -22.562219619750977, "global_step": 6764, "epoch": 55} {"train_loss": -22.216882705688477, "global_step": 6765, "epoch": 55} {"train_loss": -21.683258056640625, "global_step": 6766, "epoch": 55} {"train_loss": -22.616683959960938, "global_step": 6767, "epoch": 55} {"train_loss": -22.103317260742188, "global_step": 6768, "epoch": 55} {"train_loss": -22.60845375061035, "global_step": 6769, "epoch": 55} {"train_loss": -22.29836082458496, "global_step": 6770, "epoch": 55} {"train_loss": -22.11180305480957, "global_step": 6771, "epoch": 55} {"train_loss": -22.28866958618164, "global_step": 6772, "epoch": 55} {"train_loss": -22.86750602722168, "global_step": 6773, "epoch": 55} {"train_loss": -22.446340560913086, "global_step": 6774, "epoch": 55} {"train_loss": -22.486174370631698, "global_step": 6775, "epoch": 55, "val_loss": 2934046.0} {"train_loss": -22.739490509033203, "global_step": 6776, "epoch": 56} {"train_loss": -22.863784790039062, "global_step": 6777, "epoch": 56} {"train_loss": -22.236804962158203, "global_step": 6778, "epoch": 56} {"train_loss": -22.776823043823242, "global_step": 6779, "epoch": 56} {"train_loss": -22.92495346069336, "global_step": 6780, "epoch": 56} {"train_loss": -22.9804630279541, "global_step": 6781, "epoch": 56} {"train_loss": -23.19168472290039, "global_step": 6782, "epoch": 56} {"train_loss": -23.15801429748535, "global_step": 6783, "epoch": 56} {"train_loss": -22.967992782592773, "global_step": 6784, "epoch": 56} {"train_loss": -23.41583251953125, "global_step": 6785, "epoch": 56} {"train_loss": -23.457212448120117, "global_step": 6786, "epoch": 56} {"train_loss": -23.236873626708984, "global_step": 6787, "epoch": 56} {"train_loss": -23.644115447998047, "global_step": 6788, "epoch": 56} {"train_loss": -23.28462028503418, "global_step": 6789, "epoch": 56} {"train_loss": -23.282453536987305, "global_step": 6790, "epoch": 56} {"train_loss": -23.646528244018555, "global_step": 6791, "epoch": 56} {"train_loss": -23.251272201538086, "global_step": 6792, "epoch": 56} {"train_loss": -23.746519088745117, "global_step": 6793, "epoch": 56} {"train_loss": -23.404315948486328, "global_step": 6794, "epoch": 56} {"train_loss": -23.15530014038086, "global_step": 6795, "epoch": 56} {"train_loss": -22.092744827270508, "global_step": 6796, "epoch": 56} {"train_loss": -20.241445541381836, "global_step": 6797, "epoch": 56} {"train_loss": -20.50594139099121, "global_step": 6798, "epoch": 56} {"train_loss": -22.893810272216797, "global_step": 6799, "epoch": 56} {"train_loss": -23.23516273498535, "global_step": 6800, "epoch": 56} {"train_loss": -22.22934341430664, "global_step": 6801, "epoch": 56} {"train_loss": -23.08925437927246, "global_step": 6802, "epoch": 56} {"train_loss": -22.667734146118164, "global_step": 6803, "epoch": 56} {"train_loss": -23.207324981689453, "global_step": 6804, "epoch": 56} {"train_loss": -21.45541000366211, "global_step": 6805, "epoch": 56} {"train_loss": -20.66385841369629, "global_step": 6806, "epoch": 56} {"train_loss": -21.381988525390625, "global_step": 6807, "epoch": 56} {"train_loss": -22.03380584716797, "global_step": 6808, "epoch": 56} {"train_loss": -21.192304611206055, "global_step": 6809, "epoch": 56} {"train_loss": -22.475385665893555, "global_step": 6810, "epoch": 56} {"train_loss": -22.039567947387695, "global_step": 6811, "epoch": 56} {"train_loss": -22.73908805847168, "global_step": 6812, "epoch": 56} {"train_loss": -22.420841217041016, "global_step": 6813, "epoch": 56} {"train_loss": -22.597148895263672, "global_step": 6814, "epoch": 56} {"train_loss": -22.26866340637207, "global_step": 6815, "epoch": 56} {"train_loss": -23.16806411743164, "global_step": 6816, "epoch": 56} {"train_loss": -22.40006446838379, "global_step": 6817, "epoch": 56} {"train_loss": -22.906816482543945, "global_step": 6818, "epoch": 56} {"train_loss": -22.818323135375977, "global_step": 6819, "epoch": 56} {"train_loss": -22.61979866027832, "global_step": 6820, "epoch": 56} {"train_loss": -22.88150405883789, "global_step": 6821, "epoch": 56} {"train_loss": -22.72000503540039, "global_step": 6822, "epoch": 56} {"train_loss": -22.74677848815918, "global_step": 6823, "epoch": 56} {"train_loss": -22.77239990234375, "global_step": 6824, "epoch": 56} {"train_loss": -23.239233016967773, "global_step": 6825, "epoch": 56} {"train_loss": -23.109800338745117, "global_step": 6826, "epoch": 56} {"train_loss": -22.765989303588867, "global_step": 6827, "epoch": 56} {"train_loss": -22.94489097595215, "global_step": 6828, "epoch": 56} {"train_loss": -22.35541534423828, "global_step": 6829, "epoch": 56} {"train_loss": -22.440977096557617, "global_step": 6830, "epoch": 56} {"train_loss": -22.775928497314453, "global_step": 6831, "epoch": 56} {"train_loss": -22.36675453186035, "global_step": 6832, "epoch": 56} {"train_loss": -21.93408203125, "global_step": 6833, "epoch": 56} {"train_loss": -22.1356201171875, "global_step": 6834, "epoch": 56} {"train_loss": -22.381689071655273, "global_step": 6835, "epoch": 56} {"train_loss": -22.553327560424805, "global_step": 6836, "epoch": 56} {"train_loss": -22.334802627563477, "global_step": 6837, "epoch": 56} {"train_loss": -22.996381759643555, "global_step": 6838, "epoch": 56} {"train_loss": -21.923742294311523, "global_step": 6839, "epoch": 56} {"train_loss": -22.659276962280273, "global_step": 6840, "epoch": 56} {"train_loss": -22.045446395874023, "global_step": 6841, "epoch": 56} {"train_loss": -22.523406982421875, "global_step": 6842, "epoch": 56} {"train_loss": -22.59919548034668, "global_step": 6843, "epoch": 56} {"train_loss": -22.88058853149414, "global_step": 6844, "epoch": 56} {"train_loss": -22.566335678100586, "global_step": 6845, "epoch": 56} {"train_loss": -22.70330238342285, "global_step": 6846, "epoch": 56} {"train_loss": -22.61931800842285, "global_step": 6847, "epoch": 56} {"train_loss": -23.127561569213867, "global_step": 6848, "epoch": 56} {"train_loss": -22.51848793029785, "global_step": 6849, "epoch": 56} {"train_loss": -22.735776901245117, "global_step": 6850, "epoch": 56} {"train_loss": -23.172557830810547, "global_step": 6851, "epoch": 56} {"train_loss": -22.958023071289062, "global_step": 6852, "epoch": 56} {"train_loss": -22.859840393066406, "global_step": 6853, "epoch": 56} {"train_loss": -22.658931732177734, "global_step": 6854, "epoch": 56} {"train_loss": -23.271852493286133, "global_step": 6855, "epoch": 56} {"train_loss": -23.035322189331055, "global_step": 6856, "epoch": 56} {"train_loss": -22.57980728149414, "global_step": 6857, "epoch": 56} {"train_loss": -23.09894561767578, "global_step": 6858, "epoch": 56} {"train_loss": -22.925304412841797, "global_step": 6859, "epoch": 56} {"train_loss": -23.615942001342773, "global_step": 6860, "epoch": 56} {"train_loss": -22.85227394104004, "global_step": 6861, "epoch": 56} {"train_loss": -23.5836181640625, "global_step": 6862, "epoch": 56} {"train_loss": -22.991416931152344, "global_step": 6863, "epoch": 56} {"train_loss": -22.19830322265625, "global_step": 6864, "epoch": 56} {"train_loss": -21.12638282775879, "global_step": 6865, "epoch": 56} {"train_loss": -18.965707778930664, "global_step": 6866, "epoch": 56} {"train_loss": -19.91945457458496, "global_step": 6867, "epoch": 56} {"train_loss": -23.25546646118164, "global_step": 6868, "epoch": 56} {"train_loss": -20.421945571899414, "global_step": 6869, "epoch": 56} {"train_loss": -22.642236709594727, "global_step": 6870, "epoch": 56} {"train_loss": -21.07110595703125, "global_step": 6871, "epoch": 56} {"train_loss": -23.1998348236084, "global_step": 6872, "epoch": 56} {"train_loss": -22.124841690063477, "global_step": 6873, "epoch": 56} {"train_loss": -22.464773178100586, "global_step": 6874, "epoch": 56} {"train_loss": -22.027101516723633, "global_step": 6875, "epoch": 56} {"train_loss": -21.820404052734375, "global_step": 6876, "epoch": 56} {"train_loss": -22.63983154296875, "global_step": 6877, "epoch": 56} {"train_loss": -22.446557998657227, "global_step": 6878, "epoch": 56} {"train_loss": -22.092056274414062, "global_step": 6879, "epoch": 56} {"train_loss": -22.4240779876709, "global_step": 6880, "epoch": 56} {"train_loss": -22.76456069946289, "global_step": 6881, "epoch": 56} {"train_loss": -22.234867095947266, "global_step": 6882, "epoch": 56} {"train_loss": -21.908849716186523, "global_step": 6883, "epoch": 56} {"train_loss": -22.226871490478516, "global_step": 6884, "epoch": 56} {"train_loss": -22.64790916442871, "global_step": 6885, "epoch": 56} {"train_loss": -22.02140998840332, "global_step": 6886, "epoch": 56} {"train_loss": -22.282133102416992, "global_step": 6887, "epoch": 56} {"train_loss": -22.375049591064453, "global_step": 6888, "epoch": 56} {"train_loss": -21.570844650268555, "global_step": 6889, "epoch": 56} {"train_loss": -22.080148696899414, "global_step": 6890, "epoch": 56} {"train_loss": -22.34445571899414, "global_step": 6891, "epoch": 56} {"train_loss": -21.98910140991211, "global_step": 6892, "epoch": 56} {"train_loss": -22.788389205932617, "global_step": 6893, "epoch": 56} {"train_loss": -22.131122589111328, "global_step": 6894, "epoch": 56} {"train_loss": -22.82818603515625, "global_step": 6895, "epoch": 56} {"train_loss": -22.511061361013365, "global_step": 6896, "epoch": 56, "val_loss": 2837852.75} {"train_loss": -22.78134536743164, "global_step": 6897, "epoch": 57} {"train_loss": -22.458471298217773, "global_step": 6898, "epoch": 57} {"train_loss": -23.07783317565918, "global_step": 6899, "epoch": 57} {"train_loss": -22.460126876831055, "global_step": 6900, "epoch": 57} {"train_loss": -22.438724517822266, "global_step": 6901, "epoch": 57} {"train_loss": -22.429304122924805, "global_step": 6902, "epoch": 57} {"train_loss": -22.797466278076172, "global_step": 6903, "epoch": 57} {"train_loss": -22.808298110961914, "global_step": 6904, "epoch": 57} {"train_loss": -23.0810604095459, "global_step": 6905, "epoch": 57} {"train_loss": -23.095489501953125, "global_step": 6906, "epoch": 57} {"train_loss": -23.228574752807617, "global_step": 6907, "epoch": 57} {"train_loss": -22.98193359375, "global_step": 6908, "epoch": 57} {"train_loss": -22.153575897216797, "global_step": 6909, "epoch": 57} {"train_loss": -20.133737564086914, "global_step": 6910, "epoch": 57} {"train_loss": -21.14328956604004, "global_step": 6911, "epoch": 57} {"train_loss": -23.1058349609375, "global_step": 6912, "epoch": 57} {"train_loss": -21.309656143188477, "global_step": 6913, "epoch": 57} {"train_loss": -22.97096061706543, "global_step": 6914, "epoch": 57} {"train_loss": -22.090808868408203, "global_step": 6915, "epoch": 57} {"train_loss": -22.98013687133789, "global_step": 6916, "epoch": 57} {"train_loss": -22.701656341552734, "global_step": 6917, "epoch": 57} {"train_loss": -23.182998657226562, "global_step": 6918, "epoch": 57} {"train_loss": -22.791738510131836, "global_step": 6919, "epoch": 57} {"train_loss": -23.290687561035156, "global_step": 6920, "epoch": 57} {"train_loss": -23.178865432739258, "global_step": 6921, "epoch": 57} {"train_loss": -23.09929656982422, "global_step": 6922, "epoch": 57} {"train_loss": -23.086957931518555, "global_step": 6923, "epoch": 57} {"train_loss": -22.359508514404297, "global_step": 6924, "epoch": 57} {"train_loss": -23.54242515563965, "global_step": 6925, "epoch": 57} {"train_loss": -22.740995407104492, "global_step": 6926, "epoch": 57} {"train_loss": -23.2143497467041, "global_step": 6927, "epoch": 57} {"train_loss": -23.1544246673584, "global_step": 6928, "epoch": 57} {"train_loss": -23.34280776977539, "global_step": 6929, "epoch": 57} {"train_loss": -22.639158248901367, "global_step": 6930, "epoch": 57} {"train_loss": -23.224336624145508, "global_step": 6931, "epoch": 57} {"train_loss": -23.179227828979492, "global_step": 6932, "epoch": 57} {"train_loss": -22.722196578979492, "global_step": 6933, "epoch": 57} {"train_loss": -23.007450103759766, "global_step": 6934, "epoch": 57} {"train_loss": -22.54512596130371, "global_step": 6935, "epoch": 57} {"train_loss": -22.90523338317871, "global_step": 6936, "epoch": 57} {"train_loss": -21.844175338745117, "global_step": 6937, "epoch": 57} {"train_loss": -19.12204933166504, "global_step": 6938, "epoch": 57} {"train_loss": -21.66255760192871, "global_step": 6939, "epoch": 57} {"train_loss": -20.915395736694336, "global_step": 6940, "epoch": 57} {"train_loss": -20.599592208862305, "global_step": 6941, "epoch": 57} {"train_loss": -17.872312545776367, "global_step": 6942, "epoch": 57} {"train_loss": -18.957883834838867, "global_step": 6943, "epoch": 57} {"train_loss": -21.687192916870117, "global_step": 6944, "epoch": 57} {"train_loss": -22.269336700439453, "global_step": 6945, "epoch": 57} {"train_loss": -21.706878662109375, "global_step": 6946, "epoch": 57} {"train_loss": -22.160888671875, "global_step": 6947, "epoch": 57} {"train_loss": -22.424667358398438, "global_step": 6948, "epoch": 57} {"train_loss": -22.307775497436523, "global_step": 6949, "epoch": 57} {"train_loss": -22.6012020111084, "global_step": 6950, "epoch": 57} {"train_loss": -21.666128158569336, "global_step": 6951, "epoch": 57} {"train_loss": -22.417118072509766, "global_step": 6952, "epoch": 57} {"train_loss": -22.417070388793945, "global_step": 6953, "epoch": 57} {"train_loss": -22.621204376220703, "global_step": 6954, "epoch": 57} {"train_loss": -22.383142471313477, "global_step": 6955, "epoch": 57} {"train_loss": -22.58295249938965, "global_step": 6956, "epoch": 57} {"train_loss": -22.471446990966797, "global_step": 6957, "epoch": 57} {"train_loss": -22.48177146911621, "global_step": 6958, "epoch": 57} {"train_loss": -22.687402725219727, "global_step": 6959, "epoch": 57} {"train_loss": -22.093852996826172, "global_step": 6960, "epoch": 57} {"train_loss": -22.1885929107666, "global_step": 6961, "epoch": 57} {"train_loss": -22.76265525817871, "global_step": 6962, "epoch": 57} {"train_loss": -22.767976760864258, "global_step": 6963, "epoch": 57} {"train_loss": -22.538908004760742, "global_step": 6964, "epoch": 57} {"train_loss": -22.929248809814453, "global_step": 6965, "epoch": 57} {"train_loss": -22.881114959716797, "global_step": 6966, "epoch": 57} {"train_loss": -22.822507858276367, "global_step": 6967, "epoch": 57} {"train_loss": -22.472665786743164, "global_step": 6968, "epoch": 57} {"train_loss": -22.4471378326416, "global_step": 6969, "epoch": 57} {"train_loss": -22.684289932250977, "global_step": 6970, "epoch": 57} {"train_loss": -22.940143585205078, "global_step": 6971, "epoch": 57} {"train_loss": -22.833816528320312, "global_step": 6972, "epoch": 57} {"train_loss": -23.152143478393555, "global_step": 6973, "epoch": 57} {"train_loss": -23.320240020751953, "global_step": 6974, "epoch": 57} {"train_loss": -23.033100128173828, "global_step": 6975, "epoch": 57} {"train_loss": -22.726572036743164, "global_step": 6976, "epoch": 57} {"train_loss": -22.523488998413086, "global_step": 6977, "epoch": 57} {"train_loss": -22.799867630004883, "global_step": 6978, "epoch": 57} {"train_loss": -22.915103912353516, "global_step": 6979, "epoch": 57} {"train_loss": -23.439634323120117, "global_step": 6980, "epoch": 57} {"train_loss": -22.993093490600586, "global_step": 6981, "epoch": 57} {"train_loss": -23.180988311767578, "global_step": 6982, "epoch": 57} {"train_loss": -22.884920120239258, "global_step": 6983, "epoch": 57} {"train_loss": -23.380558013916016, "global_step": 6984, "epoch": 57} {"train_loss": -23.357460021972656, "global_step": 6985, "epoch": 57} {"train_loss": -23.014013290405273, "global_step": 6986, "epoch": 57} {"train_loss": -21.6886043548584, "global_step": 6987, "epoch": 57} {"train_loss": -22.67389488220215, "global_step": 6988, "epoch": 57} {"train_loss": -22.970279693603516, "global_step": 6989, "epoch": 57} {"train_loss": -22.891082763671875, "global_step": 6990, "epoch": 57} {"train_loss": -23.35090446472168, "global_step": 6991, "epoch": 57} {"train_loss": -22.35443687438965, "global_step": 6992, "epoch": 57} {"train_loss": -22.93116569519043, "global_step": 6993, "epoch": 57} {"train_loss": -23.098180770874023, "global_step": 6994, "epoch": 57} {"train_loss": -22.385480880737305, "global_step": 6995, "epoch": 57} {"train_loss": -22.982152938842773, "global_step": 6996, "epoch": 57} {"train_loss": -23.300718307495117, "global_step": 6997, "epoch": 57} {"train_loss": -22.625776290893555, "global_step": 6998, "epoch": 57} {"train_loss": -23.29706382751465, "global_step": 6999, "epoch": 57} {"train_loss": -23.207191467285156, "global_step": 7000, "epoch": 57} {"train_loss": -22.768375396728516, "global_step": 7001, "epoch": 57} {"train_loss": -23.471323013305664, "global_step": 7002, "epoch": 57} {"train_loss": -22.593875885009766, "global_step": 7003, "epoch": 57} {"train_loss": -22.0061092376709, "global_step": 7004, "epoch": 57} {"train_loss": -19.773590087890625, "global_step": 7005, "epoch": 57} {"train_loss": -17.30828285217285, "global_step": 7006, "epoch": 57} {"train_loss": -21.6195011138916, "global_step": 7007, "epoch": 57} {"train_loss": -22.870580673217773, "global_step": 7008, "epoch": 57} {"train_loss": -20.98573112487793, "global_step": 7009, "epoch": 57} {"train_loss": -23.038522720336914, "global_step": 7010, "epoch": 57} {"train_loss": -22.3801212310791, "global_step": 7011, "epoch": 57} {"train_loss": -23.068546295166016, "global_step": 7012, "epoch": 57} {"train_loss": -22.34183120727539, "global_step": 7013, "epoch": 57} {"train_loss": -22.026241302490234, "global_step": 7014, "epoch": 57} {"train_loss": -23.27897071838379, "global_step": 7015, "epoch": 57} {"train_loss": -22.358444213867188, "global_step": 7016, "epoch": 57} {"train_loss": -22.471564158920415, "global_step": 7017, "epoch": 57, "val_loss": 3472227.0} {"train_loss": -22.845184326171875, "global_step": 7018, "epoch": 58} {"train_loss": -22.773038864135742, "global_step": 7019, "epoch": 58} {"train_loss": -22.760364532470703, "global_step": 7020, "epoch": 58} {"train_loss": -23.17506217956543, "global_step": 7021, "epoch": 58} {"train_loss": -22.9765625, "global_step": 7022, "epoch": 58} {"train_loss": -22.88619041442871, "global_step": 7023, "epoch": 58} {"train_loss": -22.93421173095703, "global_step": 7024, "epoch": 58} {"train_loss": -23.149703979492188, "global_step": 7025, "epoch": 58} {"train_loss": -22.974746704101562, "global_step": 7026, "epoch": 58} {"train_loss": -22.659215927124023, "global_step": 7027, "epoch": 58} {"train_loss": -22.54728126525879, "global_step": 7028, "epoch": 58} {"train_loss": -22.81674575805664, "global_step": 7029, "epoch": 58} {"train_loss": -23.248443603515625, "global_step": 7030, "epoch": 58} {"train_loss": -23.247467041015625, "global_step": 7031, "epoch": 58} {"train_loss": -22.882505416870117, "global_step": 7032, "epoch": 58} {"train_loss": -21.227558135986328, "global_step": 7033, "epoch": 58} {"train_loss": -20.399696350097656, "global_step": 7034, "epoch": 58} {"train_loss": -20.838815689086914, "global_step": 7035, "epoch": 58} {"train_loss": -23.36286163330078, "global_step": 7036, "epoch": 58} {"train_loss": -21.826875686645508, "global_step": 7037, "epoch": 58} {"train_loss": -22.473228454589844, "global_step": 7038, "epoch": 58} {"train_loss": -21.93410301208496, "global_step": 7039, "epoch": 58} {"train_loss": -23.320863723754883, "global_step": 7040, "epoch": 58} {"train_loss": -22.278249740600586, "global_step": 7041, "epoch": 58} {"train_loss": -22.95415496826172, "global_step": 7042, "epoch": 58} {"train_loss": -22.541730880737305, "global_step": 7043, "epoch": 58} {"train_loss": -22.5975284576416, "global_step": 7044, "epoch": 58} {"train_loss": -22.668684005737305, "global_step": 7045, "epoch": 58} {"train_loss": -22.399707794189453, "global_step": 7046, "epoch": 58} {"train_loss": -22.7347412109375, "global_step": 7047, "epoch": 58} {"train_loss": -21.849945068359375, "global_step": 7048, "epoch": 58} {"train_loss": -22.694957733154297, "global_step": 7049, "epoch": 58} {"train_loss": -23.000865936279297, "global_step": 7050, "epoch": 58} {"train_loss": -23.12932777404785, "global_step": 7051, "epoch": 58} {"train_loss": -22.717016220092773, "global_step": 7052, "epoch": 58} {"train_loss": -23.403715133666992, "global_step": 7053, "epoch": 58} {"train_loss": -23.150964736938477, "global_step": 7054, "epoch": 58} {"train_loss": -22.918716430664062, "global_step": 7055, "epoch": 58} {"train_loss": -21.2170352935791, "global_step": 7056, "epoch": 58} {"train_loss": -19.371963500976562, "global_step": 7057, "epoch": 58} {"train_loss": -20.99342155456543, "global_step": 7058, "epoch": 58} {"train_loss": -23.11847686767578, "global_step": 7059, "epoch": 58} {"train_loss": -22.26468849182129, "global_step": 7060, "epoch": 58} {"train_loss": -22.029170989990234, "global_step": 7061, "epoch": 58} {"train_loss": -22.264860153198242, "global_step": 7062, "epoch": 58} {"train_loss": -22.3868350982666, "global_step": 7063, "epoch": 58} {"train_loss": -22.626371383666992, "global_step": 7064, "epoch": 58} {"train_loss": -22.5997371673584, "global_step": 7065, "epoch": 58} {"train_loss": -22.61907386779785, "global_step": 7066, "epoch": 58} {"train_loss": -22.76734733581543, "global_step": 7067, "epoch": 58} {"train_loss": -22.15854263305664, "global_step": 7068, "epoch": 58} {"train_loss": -22.87037467956543, "global_step": 7069, "epoch": 58} {"train_loss": -22.76140594482422, "global_step": 7070, "epoch": 58} {"train_loss": -21.78505516052246, "global_step": 7071, "epoch": 58} {"train_loss": -21.734439849853516, "global_step": 7072, "epoch": 58} {"train_loss": -21.248498916625977, "global_step": 7073, "epoch": 58} {"train_loss": -21.43413543701172, "global_step": 7074, "epoch": 58} {"train_loss": -22.662824630737305, "global_step": 7075, "epoch": 58} {"train_loss": -23.170700073242188, "global_step": 7076, "epoch": 58} {"train_loss": -22.832218170166016, "global_step": 7077, "epoch": 58} {"train_loss": -22.636457443237305, "global_step": 7078, "epoch": 58} {"train_loss": -22.995691299438477, "global_step": 7079, "epoch": 58} {"train_loss": -23.05176544189453, "global_step": 7080, "epoch": 58} {"train_loss": -22.7778377532959, "global_step": 7081, "epoch": 58} {"train_loss": -23.271533966064453, "global_step": 7082, "epoch": 58} {"train_loss": -23.10039710998535, "global_step": 7083, "epoch": 58} {"train_loss": -23.30397605895996, "global_step": 7084, "epoch": 58} {"train_loss": -23.37727165222168, "global_step": 7085, "epoch": 58} {"train_loss": -23.3343563079834, "global_step": 7086, "epoch": 58} {"train_loss": -23.412662506103516, "global_step": 7087, "epoch": 58} {"train_loss": -23.18647575378418, "global_step": 7088, "epoch": 58} {"train_loss": -23.115537643432617, "global_step": 7089, "epoch": 58} {"train_loss": -23.883588790893555, "global_step": 7090, "epoch": 58} {"train_loss": -22.961349487304688, "global_step": 7091, "epoch": 58} {"train_loss": -23.40875816345215, "global_step": 7092, "epoch": 58} {"train_loss": -22.957674026489258, "global_step": 7093, "epoch": 58} {"train_loss": -23.200220108032227, "global_step": 7094, "epoch": 58} {"train_loss": -21.58473014831543, "global_step": 7095, "epoch": 58} {"train_loss": -21.4385929107666, "global_step": 7096, "epoch": 58} {"train_loss": -20.894306182861328, "global_step": 7097, "epoch": 58} {"train_loss": -20.484817504882812, "global_step": 7098, "epoch": 58} {"train_loss": -22.556608200073242, "global_step": 7099, "epoch": 58} {"train_loss": -22.28244400024414, "global_step": 7100, "epoch": 58} {"train_loss": -22.266735076904297, "global_step": 7101, "epoch": 58} {"train_loss": -22.755598068237305, "global_step": 7102, "epoch": 58} {"train_loss": -22.760515213012695, "global_step": 7103, "epoch": 58} {"train_loss": -22.27556610107422, "global_step": 7104, "epoch": 58} {"train_loss": -23.620059967041016, "global_step": 7105, "epoch": 58} {"train_loss": -22.44378662109375, "global_step": 7106, "epoch": 58} {"train_loss": -23.012371063232422, "global_step": 7107, "epoch": 58} {"train_loss": -22.645401000976562, "global_step": 7108, "epoch": 58} {"train_loss": -22.87908935546875, "global_step": 7109, "epoch": 58} {"train_loss": -22.95020866394043, "global_step": 7110, "epoch": 58} {"train_loss": -23.41242790222168, "global_step": 7111, "epoch": 58} {"train_loss": -22.934396743774414, "global_step": 7112, "epoch": 58} {"train_loss": -22.952268600463867, "global_step": 7113, "epoch": 58} {"train_loss": -22.596588134765625, "global_step": 7114, "epoch": 58} {"train_loss": -23.249990463256836, "global_step": 7115, "epoch": 58} {"train_loss": -23.358068466186523, "global_step": 7116, "epoch": 58} {"train_loss": -22.733259201049805, "global_step": 7117, "epoch": 58} {"train_loss": -22.922544479370117, "global_step": 7118, "epoch": 58} {"train_loss": -23.212093353271484, "global_step": 7119, "epoch": 58} {"train_loss": -22.919998168945312, "global_step": 7120, "epoch": 58} {"train_loss": -22.746671676635742, "global_step": 7121, "epoch": 58} {"train_loss": -23.095773696899414, "global_step": 7122, "epoch": 58} {"train_loss": -23.100645065307617, "global_step": 7123, "epoch": 58} {"train_loss": -22.869577407836914, "global_step": 7124, "epoch": 58} {"train_loss": -22.855554580688477, "global_step": 7125, "epoch": 58} {"train_loss": -23.09054183959961, "global_step": 7126, "epoch": 58} {"train_loss": -23.36016273498535, "global_step": 7127, "epoch": 58} {"train_loss": -23.208921432495117, "global_step": 7128, "epoch": 58} {"train_loss": -22.96500015258789, "global_step": 7129, "epoch": 58} {"train_loss": -23.1231632232666, "global_step": 7130, "epoch": 58} {"train_loss": -22.715171813964844, "global_step": 7131, "epoch": 58} {"train_loss": -23.614301681518555, "global_step": 7132, "epoch": 58} {"train_loss": -23.10390853881836, "global_step": 7133, "epoch": 58} {"train_loss": -23.179147720336914, "global_step": 7134, "epoch": 58} {"train_loss": -23.12704849243164, "global_step": 7135, "epoch": 58} {"train_loss": -22.51827049255371, "global_step": 7136, "epoch": 58} {"train_loss": -22.44594383239746, "global_step": 7137, "epoch": 58} {"train_loss": -22.66371514186386, "global_step": 7138, "epoch": 58, "val_loss": 3026527.0} {"train_loss": -22.56825065612793, "global_step": 7139, "epoch": 59} {"train_loss": -23.388322830200195, "global_step": 7140, "epoch": 59} {"train_loss": -22.67795181274414, "global_step": 7141, "epoch": 59} {"train_loss": -23.184598922729492, "global_step": 7142, "epoch": 59} {"train_loss": -23.234033584594727, "global_step": 7143, "epoch": 59} {"train_loss": -22.967334747314453, "global_step": 7144, "epoch": 59} {"train_loss": -22.957700729370117, "global_step": 7145, "epoch": 59} {"train_loss": -23.7880802154541, "global_step": 7146, "epoch": 59} {"train_loss": -23.838489532470703, "global_step": 7147, "epoch": 59} {"train_loss": -22.966230392456055, "global_step": 7148, "epoch": 59} {"train_loss": -23.176544189453125, "global_step": 7149, "epoch": 59} {"train_loss": -23.087278366088867, "global_step": 7150, "epoch": 59} {"train_loss": -22.865713119506836, "global_step": 7151, "epoch": 59} {"train_loss": -23.343318939208984, "global_step": 7152, "epoch": 59} {"train_loss": -23.447370529174805, "global_step": 7153, "epoch": 59} {"train_loss": -22.988819122314453, "global_step": 7154, "epoch": 59} {"train_loss": -21.889205932617188, "global_step": 7155, "epoch": 59} {"train_loss": -18.226348876953125, "global_step": 7156, "epoch": 59} {"train_loss": -14.523523330688477, "global_step": 7157, "epoch": 59} {"train_loss": -22.579692840576172, "global_step": 7158, "epoch": 59} {"train_loss": -20.31928825378418, "global_step": 7159, "epoch": 59} {"train_loss": -21.326770782470703, "global_step": 7160, "epoch": 59} {"train_loss": -20.756444931030273, "global_step": 7161, "epoch": 59} {"train_loss": -21.766260147094727, "global_step": 7162, "epoch": 59} {"train_loss": -20.09394073486328, "global_step": 7163, "epoch": 59} {"train_loss": -21.433347702026367, "global_step": 7164, "epoch": 59} {"train_loss": -21.12483024597168, "global_step": 7165, "epoch": 59} {"train_loss": -22.406511306762695, "global_step": 7166, "epoch": 59} {"train_loss": -21.263858795166016, "global_step": 7167, "epoch": 59} {"train_loss": -21.918649673461914, "global_step": 7168, "epoch": 59} {"train_loss": -22.18939781188965, "global_step": 7169, "epoch": 59} {"train_loss": -22.17343521118164, "global_step": 7170, "epoch": 59} {"train_loss": -22.252822875976562, "global_step": 7171, "epoch": 59} {"train_loss": -22.222448348999023, "global_step": 7172, "epoch": 59} {"train_loss": -22.081022262573242, "global_step": 7173, "epoch": 59} {"train_loss": -22.54219627380371, "global_step": 7174, "epoch": 59} {"train_loss": -22.171083450317383, "global_step": 7175, "epoch": 59} {"train_loss": -22.63365936279297, "global_step": 7176, "epoch": 59} {"train_loss": -22.270586013793945, "global_step": 7177, "epoch": 59} {"train_loss": -22.69997215270996, "global_step": 7178, "epoch": 59} {"train_loss": -22.29264259338379, "global_step": 7179, "epoch": 59} {"train_loss": -22.27339744567871, "global_step": 7180, "epoch": 59} {"train_loss": -22.3225040435791, "global_step": 7181, "epoch": 59} {"train_loss": -22.891773223876953, "global_step": 7182, "epoch": 59} {"train_loss": -22.67999267578125, "global_step": 7183, "epoch": 59} {"train_loss": -22.81723403930664, "global_step": 7184, "epoch": 59} {"train_loss": -22.688140869140625, "global_step": 7185, "epoch": 59} {"train_loss": -22.67095375061035, "global_step": 7186, "epoch": 59} {"train_loss": -22.82942008972168, "global_step": 7187, "epoch": 59} {"train_loss": -22.628828048706055, "global_step": 7188, "epoch": 59} {"train_loss": -22.66362953186035, "global_step": 7189, "epoch": 59} {"train_loss": -23.108022689819336, "global_step": 7190, "epoch": 59} {"train_loss": -22.613759994506836, "global_step": 7191, "epoch": 59} {"train_loss": -22.91061019897461, "global_step": 7192, "epoch": 59} {"train_loss": -23.02994728088379, "global_step": 7193, "epoch": 59} {"train_loss": -23.096527099609375, "global_step": 7194, "epoch": 59} {"train_loss": -22.585521697998047, "global_step": 7195, "epoch": 59} {"train_loss": -22.41412925720215, "global_step": 7196, "epoch": 59} {"train_loss": -19.80352210998535, "global_step": 7197, "epoch": 59} {"train_loss": -13.249513626098633, "global_step": 7198, "epoch": 59} {"train_loss": -13.707918167114258, "global_step": 7199, "epoch": 59} {"train_loss": -14.332510948181152, "global_step": 7200, "epoch": 59} {"train_loss": -14.005043029785156, "global_step": 7201, "epoch": 59} {"train_loss": -15.251380920410156, "global_step": 7202, "epoch": 59} {"train_loss": -16.609100341796875, "global_step": 7203, "epoch": 59} {"train_loss": -16.327905654907227, "global_step": 7204, "epoch": 59} {"train_loss": -16.816543579101562, "global_step": 7205, "epoch": 59} {"train_loss": -14.82318115234375, "global_step": 7206, "epoch": 59} {"train_loss": -4.193223476409912, "global_step": 7207, "epoch": 59} {"train_loss": -13.317596435546875, "global_step": 7208, "epoch": 59} {"train_loss": -8.830084800720215, "global_step": 7209, "epoch": 59} {"train_loss": -16.59531021118164, "global_step": 7210, "epoch": 59} {"train_loss": -18.05275535583496, "global_step": 7211, "epoch": 59} {"train_loss": -17.203420639038086, "global_step": 7212, "epoch": 59} {"train_loss": -15.509127616882324, "global_step": 7213, "epoch": 59} {"train_loss": -14.144810676574707, "global_step": 7214, "epoch": 59} {"train_loss": -15.317662239074707, "global_step": 7215, "epoch": 59} {"train_loss": -15.982441902160645, "global_step": 7216, "epoch": 59} {"train_loss": -16.7907772064209, "global_step": 7217, "epoch": 59} {"train_loss": -16.94145393371582, "global_step": 7218, "epoch": 59} {"train_loss": -16.692625045776367, "global_step": 7219, "epoch": 59} {"train_loss": -16.731884002685547, "global_step": 7220, "epoch": 59} {"train_loss": -17.332368850708008, "global_step": 7221, "epoch": 59} {"train_loss": -17.073293685913086, "global_step": 7222, "epoch": 59} {"train_loss": -17.129135131835938, "global_step": 7223, "epoch": 59} {"train_loss": -17.557754516601562, "global_step": 7224, "epoch": 59} {"train_loss": -17.462797164916992, "global_step": 7225, "epoch": 59} {"train_loss": -16.5084285736084, "global_step": 7226, "epoch": 59} {"train_loss": -17.618818283081055, "global_step": 7227, "epoch": 59} {"train_loss": -17.83624839782715, "global_step": 7228, "epoch": 59} {"train_loss": -17.680221557617188, "global_step": 7229, "epoch": 59} {"train_loss": -18.023893356323242, "global_step": 7230, "epoch": 59} {"train_loss": -17.570003509521484, "global_step": 7231, "epoch": 59} {"train_loss": -18.296924591064453, "global_step": 7232, "epoch": 59} {"train_loss": -18.26960563659668, "global_step": 7233, "epoch": 59} {"train_loss": -18.034955978393555, "global_step": 7234, "epoch": 59} {"train_loss": -18.82024574279785, "global_step": 7235, "epoch": 59} {"train_loss": -18.310300827026367, "global_step": 7236, "epoch": 59} {"train_loss": -19.166515350341797, "global_step": 7237, "epoch": 59} {"train_loss": -18.896360397338867, "global_step": 7238, "epoch": 59} {"train_loss": -19.07159996032715, "global_step": 7239, "epoch": 59} {"train_loss": -18.59669303894043, "global_step": 7240, "epoch": 59} {"train_loss": -18.882076263427734, "global_step": 7241, "epoch": 59} {"train_loss": -19.157392501831055, "global_step": 7242, "epoch": 59} {"train_loss": -19.201078414916992, "global_step": 7243, "epoch": 59} {"train_loss": -17.826295852661133, "global_step": 7244, "epoch": 59} {"train_loss": -15.795636177062988, "global_step": 7245, "epoch": 59} {"train_loss": -18.483274459838867, "global_step": 7246, "epoch": 59} {"train_loss": -17.677812576293945, "global_step": 7247, "epoch": 59} {"train_loss": -19.632421493530273, "global_step": 7248, "epoch": 59} {"train_loss": -18.91115379333496, "global_step": 7249, "epoch": 59} {"train_loss": -19.266828536987305, "global_step": 7250, "epoch": 59} {"train_loss": -19.41407585144043, "global_step": 7251, "epoch": 59} {"train_loss": -18.052276611328125, "global_step": 7252, "epoch": 59} {"train_loss": -14.206351280212402, "global_step": 7253, "epoch": 59} {"train_loss": -15.826680183410645, "global_step": 7254, "epoch": 59} {"train_loss": -18.532150268554688, "global_step": 7255, "epoch": 59} {"train_loss": -18.18992042541504, "global_step": 7256, "epoch": 59} {"train_loss": -17.67860221862793, "global_step": 7257, "epoch": 59} {"train_loss": -18.742834091186523, "global_step": 7258, "epoch": 59} {"train_loss": -19.47644554090894, "global_step": 7259, "epoch": 59, "val_loss": 2771361.25} {"train_loss": -19.165830612182617, "global_step": 7260, "epoch": 60} {"train_loss": -18.684240341186523, "global_step": 7261, "epoch": 60} {"train_loss": -18.094532012939453, "global_step": 7262, "epoch": 60} {"train_loss": -18.309741973876953, "global_step": 7263, "epoch": 60} {"train_loss": -19.163305282592773, "global_step": 7264, "epoch": 60} {"train_loss": -18.605756759643555, "global_step": 7265, "epoch": 60} {"train_loss": -18.855012893676758, "global_step": 7266, "epoch": 60} {"train_loss": -19.594602584838867, "global_step": 7267, "epoch": 60} {"train_loss": -18.88861656188965, "global_step": 7268, "epoch": 60} {"train_loss": -18.87744140625, "global_step": 7269, "epoch": 60} {"train_loss": -19.345367431640625, "global_step": 7270, "epoch": 60} {"train_loss": -19.268905639648438, "global_step": 7271, "epoch": 60} {"train_loss": -19.03318214416504, "global_step": 7272, "epoch": 60} {"train_loss": -19.903274536132812, "global_step": 7273, "epoch": 60} {"train_loss": -19.482471466064453, "global_step": 7274, "epoch": 60} {"train_loss": -19.259990692138672, "global_step": 7275, "epoch": 60} {"train_loss": -19.54282569885254, "global_step": 7276, "epoch": 60} {"train_loss": -19.801794052124023, "global_step": 7277, "epoch": 60} {"train_loss": -19.991416931152344, "global_step": 7278, "epoch": 60} {"train_loss": -19.34877586364746, "global_step": 7279, "epoch": 60} {"train_loss": -20.1501522064209, "global_step": 7280, "epoch": 60} {"train_loss": -20.320486068725586, "global_step": 7281, "epoch": 60} {"train_loss": -20.76051902770996, "global_step": 7282, "epoch": 60} {"train_loss": -20.81930160522461, "global_step": 7283, "epoch": 60} {"train_loss": -19.992563247680664, "global_step": 7284, "epoch": 60} {"train_loss": -20.500097274780273, "global_step": 7285, "epoch": 60} {"train_loss": -21.5300350189209, "global_step": 7286, "epoch": 60} {"train_loss": -21.05813980102539, "global_step": 7287, "epoch": 60} {"train_loss": -21.566686630249023, "global_step": 7288, "epoch": 60} {"train_loss": -20.900623321533203, "global_step": 7289, "epoch": 60} {"train_loss": -21.1855411529541, "global_step": 7290, "epoch": 60} {"train_loss": -22.387327194213867, "global_step": 7291, "epoch": 60} {"train_loss": -21.61796760559082, "global_step": 7292, "epoch": 60} {"train_loss": -21.865947723388672, "global_step": 7293, "epoch": 60} {"train_loss": -21.86673355102539, "global_step": 7294, "epoch": 60} {"train_loss": -22.270156860351562, "global_step": 7295, "epoch": 60} {"train_loss": -22.378582000732422, "global_step": 7296, "epoch": 60} {"train_loss": -22.042545318603516, "global_step": 7297, "epoch": 60} {"train_loss": -22.44545555114746, "global_step": 7298, "epoch": 60} {"train_loss": -21.977489471435547, "global_step": 7299, "epoch": 60} {"train_loss": -22.82245445251465, "global_step": 7300, "epoch": 60} {"train_loss": -22.67584228515625, "global_step": 7301, "epoch": 60} {"train_loss": -22.92986488342285, "global_step": 7302, "epoch": 60} {"train_loss": -21.905912399291992, "global_step": 7303, "epoch": 60} {"train_loss": -22.037586212158203, "global_step": 7304, "epoch": 60} {"train_loss": -22.606121063232422, "global_step": 7305, "epoch": 60} {"train_loss": -22.007068634033203, "global_step": 7306, "epoch": 60} {"train_loss": -22.77739143371582, "global_step": 7307, "epoch": 60} {"train_loss": -23.014450073242188, "global_step": 7308, "epoch": 60} {"train_loss": -22.598302841186523, "global_step": 7309, "epoch": 60} {"train_loss": -22.866859436035156, "global_step": 7310, "epoch": 60} {"train_loss": -22.823400497436523, "global_step": 7311, "epoch": 60} {"train_loss": -22.859174728393555, "global_step": 7312, "epoch": 60} {"train_loss": -23.248554229736328, "global_step": 7313, "epoch": 60} {"train_loss": -22.84173011779785, "global_step": 7314, "epoch": 60} {"train_loss": -23.43927764892578, "global_step": 7315, "epoch": 60} {"train_loss": -22.879148483276367, "global_step": 7316, "epoch": 60} {"train_loss": -23.36136245727539, "global_step": 7317, "epoch": 60} {"train_loss": -23.086286544799805, "global_step": 7318, "epoch": 60} {"train_loss": -23.448328018188477, "global_step": 7319, "epoch": 60} {"train_loss": -23.089902877807617, "global_step": 7320, "epoch": 60} {"train_loss": -23.41193962097168, "global_step": 7321, "epoch": 60} {"train_loss": -22.473979949951172, "global_step": 7322, "epoch": 60} {"train_loss": -22.99571418762207, "global_step": 7323, "epoch": 60} {"train_loss": -21.235746383666992, "global_step": 7324, "epoch": 60} {"train_loss": -17.78287124633789, "global_step": 7325, "epoch": 60} {"train_loss": -15.072441101074219, "global_step": 7326, "epoch": 60} {"train_loss": -16.176511764526367, "global_step": 7327, "epoch": 60} {"train_loss": -16.949430465698242, "global_step": 7328, "epoch": 60} {"train_loss": -16.954877853393555, "global_step": 7329, "epoch": 60} {"train_loss": -16.418750762939453, "global_step": 7330, "epoch": 60} {"train_loss": -15.974883079528809, "global_step": 7331, "epoch": 60} {"train_loss": -16.669408798217773, "global_step": 7332, "epoch": 60} {"train_loss": -18.216997146606445, "global_step": 7333, "epoch": 60} {"train_loss": -18.620853424072266, "global_step": 7334, "epoch": 60} {"train_loss": -18.961896896362305, "global_step": 7335, "epoch": 60} {"train_loss": -19.721237182617188, "global_step": 7336, "epoch": 60} {"train_loss": -19.567903518676758, "global_step": 7337, "epoch": 60} {"train_loss": -19.929615020751953, "global_step": 7338, "epoch": 60} {"train_loss": -20.684850692749023, "global_step": 7339, "epoch": 60} {"train_loss": -20.323911666870117, "global_step": 7340, "epoch": 60} {"train_loss": -21.295753479003906, "global_step": 7341, "epoch": 60} {"train_loss": -21.046716690063477, "global_step": 7342, "epoch": 60} {"train_loss": -21.713253021240234, "global_step": 7343, "epoch": 60} {"train_loss": -21.26231575012207, "global_step": 7344, "epoch": 60} {"train_loss": -21.019819259643555, "global_step": 7345, "epoch": 60} {"train_loss": -21.35036277770996, "global_step": 7346, "epoch": 60} {"train_loss": -21.81361198425293, "global_step": 7347, "epoch": 60} {"train_loss": -21.75545310974121, "global_step": 7348, "epoch": 60} {"train_loss": -21.811317443847656, "global_step": 7349, "epoch": 60} {"train_loss": -21.821197509765625, "global_step": 7350, "epoch": 60} {"train_loss": -22.165868759155273, "global_step": 7351, "epoch": 60} {"train_loss": -22.146629333496094, "global_step": 7352, "epoch": 60} {"train_loss": -22.49812889099121, "global_step": 7353, "epoch": 60} {"train_loss": -22.24947166442871, "global_step": 7354, "epoch": 60} {"train_loss": -21.989856719970703, "global_step": 7355, "epoch": 60} {"train_loss": -21.71070671081543, "global_step": 7356, "epoch": 60} {"train_loss": -22.552738189697266, "global_step": 7357, "epoch": 60} {"train_loss": -21.144737243652344, "global_step": 7358, "epoch": 60} {"train_loss": -22.60886001586914, "global_step": 7359, "epoch": 60} {"train_loss": -22.13929557800293, "global_step": 7360, "epoch": 60} {"train_loss": -22.6517276763916, "global_step": 7361, "epoch": 60} {"train_loss": -22.69063377380371, "global_step": 7362, "epoch": 60} {"train_loss": -21.884090423583984, "global_step": 7363, "epoch": 60} {"train_loss": -22.25417137145996, "global_step": 7364, "epoch": 60} {"train_loss": -22.287874221801758, "global_step": 7365, "epoch": 60} {"train_loss": -21.751129150390625, "global_step": 7366, "epoch": 60} {"train_loss": -22.1856632232666, "global_step": 7367, "epoch": 60} {"train_loss": -22.777769088745117, "global_step": 7368, "epoch": 60} {"train_loss": -22.8553524017334, "global_step": 7369, "epoch": 60} {"train_loss": -22.53373908996582, "global_step": 7370, "epoch": 60} {"train_loss": -22.581594467163086, "global_step": 7371, "epoch": 60} {"train_loss": -22.958269119262695, "global_step": 7372, "epoch": 60} {"train_loss": -22.833738327026367, "global_step": 7373, "epoch": 60} {"train_loss": -22.533615112304688, "global_step": 7374, "epoch": 60} {"train_loss": -23.24578094482422, "global_step": 7375, "epoch": 60} {"train_loss": -23.07740592956543, "global_step": 7376, "epoch": 60} {"train_loss": -22.87518310546875, "global_step": 7377, "epoch": 60} {"train_loss": -22.839101791381836, "global_step": 7378, "epoch": 60} {"train_loss": -23.402631759643555, "global_step": 7379, "epoch": 60} {"train_loss": -21.13282839719914, "global_step": 7380, "epoch": 60, "val_loss": 2766307.25} {"train_loss": -22.86650276184082, "global_step": 7381, "epoch": 61} {"train_loss": -20.86334800720215, "global_step": 7382, "epoch": 61} {"train_loss": -21.453357696533203, "global_step": 7383, "epoch": 61} {"train_loss": -23.55556297302246, "global_step": 7384, "epoch": 61} {"train_loss": -22.33962631225586, "global_step": 7385, "epoch": 61} {"train_loss": -20.98005485534668, "global_step": 7386, "epoch": 61} {"train_loss": -23.47994613647461, "global_step": 7387, "epoch": 61} {"train_loss": -20.63973045349121, "global_step": 7388, "epoch": 61} {"train_loss": -22.12022590637207, "global_step": 7389, "epoch": 61} {"train_loss": -22.183897018432617, "global_step": 7390, "epoch": 61} {"train_loss": -22.495391845703125, "global_step": 7391, "epoch": 61} {"train_loss": -23.048202514648438, "global_step": 7392, "epoch": 61} {"train_loss": -23.113874435424805, "global_step": 7393, "epoch": 61} {"train_loss": -22.578048706054688, "global_step": 7394, "epoch": 61} {"train_loss": -23.011388778686523, "global_step": 7395, "epoch": 61} {"train_loss": -22.867685317993164, "global_step": 7396, "epoch": 61} {"train_loss": -23.266653060913086, "global_step": 7397, "epoch": 61} {"train_loss": -22.855388641357422, "global_step": 7398, "epoch": 61} {"train_loss": -23.02669906616211, "global_step": 7399, "epoch": 61} {"train_loss": -23.3512020111084, "global_step": 7400, "epoch": 61} {"train_loss": -23.27191162109375, "global_step": 7401, "epoch": 61} {"train_loss": -23.072494506835938, "global_step": 7402, "epoch": 61} {"train_loss": -23.390134811401367, "global_step": 7403, "epoch": 61} {"train_loss": -23.33966636657715, "global_step": 7404, "epoch": 61} {"train_loss": -23.24241828918457, "global_step": 7405, "epoch": 61} {"train_loss": -23.185636520385742, "global_step": 7406, "epoch": 61} {"train_loss": -23.52488136291504, "global_step": 7407, "epoch": 61} {"train_loss": -23.322309494018555, "global_step": 7408, "epoch": 61} {"train_loss": -23.31217384338379, "global_step": 7409, "epoch": 61} {"train_loss": -23.283071517944336, "global_step": 7410, "epoch": 61} {"train_loss": -23.259782791137695, "global_step": 7411, "epoch": 61} {"train_loss": -23.72944450378418, "global_step": 7412, "epoch": 61} {"train_loss": -23.069604873657227, "global_step": 7413, "epoch": 61} {"train_loss": -23.67827796936035, "global_step": 7414, "epoch": 61} {"train_loss": -23.828054428100586, "global_step": 7415, "epoch": 61} {"train_loss": -23.563039779663086, "global_step": 7416, "epoch": 61} {"train_loss": -22.816091537475586, "global_step": 7417, "epoch": 61} {"train_loss": -22.6416015625, "global_step": 7418, "epoch": 61} {"train_loss": -22.65730857849121, "global_step": 7419, "epoch": 61} {"train_loss": -22.99835777282715, "global_step": 7420, "epoch": 61} {"train_loss": -23.38168716430664, "global_step": 7421, "epoch": 61} {"train_loss": -23.25031852722168, "global_step": 7422, "epoch": 61} {"train_loss": -23.663328170776367, "global_step": 7423, "epoch": 61} {"train_loss": -23.23844337463379, "global_step": 7424, "epoch": 61} {"train_loss": -24.219701766967773, "global_step": 7425, "epoch": 61} {"train_loss": -23.6013240814209, "global_step": 7426, "epoch": 61} {"train_loss": -22.55011558532715, "global_step": 7427, "epoch": 61} {"train_loss": -23.033079147338867, "global_step": 7428, "epoch": 61} {"train_loss": -22.349609375, "global_step": 7429, "epoch": 61} {"train_loss": -23.93898582458496, "global_step": 7430, "epoch": 61} {"train_loss": -23.041772842407227, "global_step": 7431, "epoch": 61} {"train_loss": -23.375707626342773, "global_step": 7432, "epoch": 61} {"train_loss": -23.410959243774414, "global_step": 7433, "epoch": 61} {"train_loss": -23.460540771484375, "global_step": 7434, "epoch": 61} {"train_loss": -23.207796096801758, "global_step": 7435, "epoch": 61} {"train_loss": -23.363733291625977, "global_step": 7436, "epoch": 61} {"train_loss": -23.506742477416992, "global_step": 7437, "epoch": 61} {"train_loss": -23.879413604736328, "global_step": 7438, "epoch": 61} {"train_loss": -22.714879989624023, "global_step": 7439, "epoch": 61} {"train_loss": -22.007144927978516, "global_step": 7440, "epoch": 61} {"train_loss": -22.61612319946289, "global_step": 7441, "epoch": 61} {"train_loss": -23.81394386291504, "global_step": 7442, "epoch": 61} {"train_loss": -22.512617111206055, "global_step": 7443, "epoch": 61} {"train_loss": -23.549440383911133, "global_step": 7444, "epoch": 61} {"train_loss": -23.760889053344727, "global_step": 7445, "epoch": 61} {"train_loss": -23.64763641357422, "global_step": 7446, "epoch": 61} {"train_loss": -23.57061195373535, "global_step": 7447, "epoch": 61} {"train_loss": -23.648731231689453, "global_step": 7448, "epoch": 61} {"train_loss": -23.32649040222168, "global_step": 7449, "epoch": 61} {"train_loss": -23.92683982849121, "global_step": 7450, "epoch": 61} {"train_loss": -23.225996017456055, "global_step": 7451, "epoch": 61} {"train_loss": -21.840225219726562, "global_step": 7452, "epoch": 61} {"train_loss": -19.913015365600586, "global_step": 7453, "epoch": 61} {"train_loss": -21.77545166015625, "global_step": 7454, "epoch": 61} {"train_loss": -23.136600494384766, "global_step": 7455, "epoch": 61} {"train_loss": -23.013580322265625, "global_step": 7456, "epoch": 61} {"train_loss": -21.849754333496094, "global_step": 7457, "epoch": 61} {"train_loss": -22.482189178466797, "global_step": 7458, "epoch": 61} {"train_loss": -23.535694122314453, "global_step": 7459, "epoch": 61} {"train_loss": -22.63190269470215, "global_step": 7460, "epoch": 61} {"train_loss": -23.4605770111084, "global_step": 7461, "epoch": 61} {"train_loss": -22.40631103515625, "global_step": 7462, "epoch": 61} {"train_loss": -23.10182762145996, "global_step": 7463, "epoch": 61} {"train_loss": -23.637800216674805, "global_step": 7464, "epoch": 61} {"train_loss": -23.404916763305664, "global_step": 7465, "epoch": 61} {"train_loss": -23.862031936645508, "global_step": 7466, "epoch": 61} {"train_loss": -23.22437858581543, "global_step": 7467, "epoch": 61} {"train_loss": -23.52945327758789, "global_step": 7468, "epoch": 61} {"train_loss": -23.26758575439453, "global_step": 7469, "epoch": 61} {"train_loss": -22.293298721313477, "global_step": 7470, "epoch": 61} {"train_loss": -22.68606948852539, "global_step": 7471, "epoch": 61} {"train_loss": -23.52992057800293, "global_step": 7472, "epoch": 61} {"train_loss": -22.688335418701172, "global_step": 7473, "epoch": 61} {"train_loss": -23.135377883911133, "global_step": 7474, "epoch": 61} {"train_loss": -23.41524314880371, "global_step": 7475, "epoch": 61} {"train_loss": -23.44099235534668, "global_step": 7476, "epoch": 61} {"train_loss": -23.0974178314209, "global_step": 7477, "epoch": 61} {"train_loss": -23.128278732299805, "global_step": 7478, "epoch": 61} {"train_loss": -22.594886779785156, "global_step": 7479, "epoch": 61} {"train_loss": -23.16157341003418, "global_step": 7480, "epoch": 61} {"train_loss": -22.4796085357666, "global_step": 7481, "epoch": 61} {"train_loss": -20.23723793029785, "global_step": 7482, "epoch": 61} {"train_loss": -23.724863052368164, "global_step": 7483, "epoch": 61} {"train_loss": -22.54073143005371, "global_step": 7484, "epoch": 61} {"train_loss": -19.420795440673828, "global_step": 7485, "epoch": 61} {"train_loss": -21.041467666625977, "global_step": 7486, "epoch": 61} {"train_loss": -21.776809692382812, "global_step": 7487, "epoch": 61} {"train_loss": -21.843727111816406, "global_step": 7488, "epoch": 61} {"train_loss": -22.908979415893555, "global_step": 7489, "epoch": 61} {"train_loss": -22.082115173339844, "global_step": 7490, "epoch": 61} {"train_loss": -22.988012313842773, "global_step": 7491, "epoch": 61} {"train_loss": -22.771833419799805, "global_step": 7492, "epoch": 61} {"train_loss": -22.198022842407227, "global_step": 7493, "epoch": 61} {"train_loss": -22.82484245300293, "global_step": 7494, "epoch": 61} {"train_loss": -22.8582820892334, "global_step": 7495, "epoch": 61} {"train_loss": -22.841341018676758, "global_step": 7496, "epoch": 61} {"train_loss": -23.11016273498535, "global_step": 7497, "epoch": 61} {"train_loss": -23.309539794921875, "global_step": 7498, "epoch": 61} {"train_loss": -23.412954330444336, "global_step": 7499, "epoch": 61} {"train_loss": -23.095256805419922, "global_step": 7500, "epoch": 61} {"train_loss": -22.910213643854316, "global_step": 7501, "epoch": 61, "val_loss": 2902210.0} {"train_loss": -23.40825080871582, "global_step": 7502, "epoch": 62} {"train_loss": -23.476699829101562, "global_step": 7503, "epoch": 62} {"train_loss": -23.764965057373047, "global_step": 7504, "epoch": 62} {"train_loss": -23.263900756835938, "global_step": 7505, "epoch": 62} {"train_loss": -23.17677116394043, "global_step": 7506, "epoch": 62} {"train_loss": -23.790712356567383, "global_step": 7507, "epoch": 62} {"train_loss": -23.68069839477539, "global_step": 7508, "epoch": 62} {"train_loss": -23.08014488220215, "global_step": 7509, "epoch": 62} {"train_loss": -23.7095947265625, "global_step": 7510, "epoch": 62} {"train_loss": -23.286544799804688, "global_step": 7511, "epoch": 62} {"train_loss": -23.915603637695312, "global_step": 7512, "epoch": 62} {"train_loss": -23.778165817260742, "global_step": 7513, "epoch": 62} {"train_loss": -23.59942626953125, "global_step": 7514, "epoch": 62} {"train_loss": -24.130937576293945, "global_step": 7515, "epoch": 62} {"train_loss": -23.911497116088867, "global_step": 7516, "epoch": 62} {"train_loss": -23.732563018798828, "global_step": 7517, "epoch": 62} {"train_loss": -23.253604888916016, "global_step": 7518, "epoch": 62} {"train_loss": -23.781217575073242, "global_step": 7519, "epoch": 62} {"train_loss": -22.676918029785156, "global_step": 7520, "epoch": 62} {"train_loss": -23.407642364501953, "global_step": 7521, "epoch": 62} {"train_loss": -23.628477096557617, "global_step": 7522, "epoch": 62} {"train_loss": -22.126724243164062, "global_step": 7523, "epoch": 62} {"train_loss": -22.75735855102539, "global_step": 7524, "epoch": 62} {"train_loss": -23.372779846191406, "global_step": 7525, "epoch": 62} {"train_loss": -21.266956329345703, "global_step": 7526, "epoch": 62} {"train_loss": -23.371068954467773, "global_step": 7527, "epoch": 62} {"train_loss": -22.566625595092773, "global_step": 7528, "epoch": 62} {"train_loss": -22.399927139282227, "global_step": 7529, "epoch": 62} {"train_loss": -23.192991256713867, "global_step": 7530, "epoch": 62} {"train_loss": -21.802953720092773, "global_step": 7531, "epoch": 62} {"train_loss": -21.247943878173828, "global_step": 7532, "epoch": 62} {"train_loss": -19.65399932861328, "global_step": 7533, "epoch": 62} {"train_loss": -21.88251304626465, "global_step": 7534, "epoch": 62} {"train_loss": -20.888591766357422, "global_step": 7535, "epoch": 62} {"train_loss": -21.87051010131836, "global_step": 7536, "epoch": 62} {"train_loss": -22.096668243408203, "global_step": 7537, "epoch": 62} {"train_loss": -20.779998779296875, "global_step": 7538, "epoch": 62} {"train_loss": -22.52071762084961, "global_step": 7539, "epoch": 62} {"train_loss": -21.337186813354492, "global_step": 7540, "epoch": 62} {"train_loss": -22.4746036529541, "global_step": 7541, "epoch": 62} {"train_loss": -21.047353744506836, "global_step": 7542, "epoch": 62} {"train_loss": -22.566679000854492, "global_step": 7543, "epoch": 62} {"train_loss": -22.291555404663086, "global_step": 7544, "epoch": 62} {"train_loss": -23.00594711303711, "global_step": 7545, "epoch": 62} {"train_loss": -22.52044105529785, "global_step": 7546, "epoch": 62} {"train_loss": -22.57251739501953, "global_step": 7547, "epoch": 62} {"train_loss": -22.5192928314209, "global_step": 7548, "epoch": 62} {"train_loss": -22.820653915405273, "global_step": 7549, "epoch": 62} {"train_loss": -22.607187271118164, "global_step": 7550, "epoch": 62} {"train_loss": -22.894577026367188, "global_step": 7551, "epoch": 62} {"train_loss": -22.835617065429688, "global_step": 7552, "epoch": 62} {"train_loss": -22.714651107788086, "global_step": 7553, "epoch": 62} {"train_loss": -22.916189193725586, "global_step": 7554, "epoch": 62} {"train_loss": -22.977750778198242, "global_step": 7555, "epoch": 62} {"train_loss": -23.32249641418457, "global_step": 7556, "epoch": 62} {"train_loss": -23.249706268310547, "global_step": 7557, "epoch": 62} {"train_loss": -23.54227638244629, "global_step": 7558, "epoch": 62} {"train_loss": -23.343868255615234, "global_step": 7559, "epoch": 62} {"train_loss": -23.09856605529785, "global_step": 7560, "epoch": 62} {"train_loss": -23.223350524902344, "global_step": 7561, "epoch": 62} {"train_loss": -22.611656188964844, "global_step": 7562, "epoch": 62} {"train_loss": -22.223447799682617, "global_step": 7563, "epoch": 62} {"train_loss": -21.87074851989746, "global_step": 7564, "epoch": 62} {"train_loss": -20.21254539489746, "global_step": 7565, "epoch": 62} {"train_loss": -21.13285255432129, "global_step": 7566, "epoch": 62} {"train_loss": -22.85044288635254, "global_step": 7567, "epoch": 62} {"train_loss": -23.608264923095703, "global_step": 7568, "epoch": 62} {"train_loss": -22.637975692749023, "global_step": 7569, "epoch": 62} {"train_loss": -22.344852447509766, "global_step": 7570, "epoch": 62} {"train_loss": -23.049955368041992, "global_step": 7571, "epoch": 62} {"train_loss": -22.394412994384766, "global_step": 7572, "epoch": 62} {"train_loss": -23.81244659423828, "global_step": 7573, "epoch": 62} {"train_loss": -23.299190521240234, "global_step": 7574, "epoch": 62} {"train_loss": -23.687612533569336, "global_step": 7575, "epoch": 62} {"train_loss": -23.6195068359375, "global_step": 7576, "epoch": 62} {"train_loss": -23.41010856628418, "global_step": 7577, "epoch": 62} {"train_loss": -23.410261154174805, "global_step": 7578, "epoch": 62} {"train_loss": -23.41518211364746, "global_step": 7579, "epoch": 62} {"train_loss": -24.014490127563477, "global_step": 7580, "epoch": 62} {"train_loss": -23.478715896606445, "global_step": 7581, "epoch": 62} {"train_loss": -23.21772575378418, "global_step": 7582, "epoch": 62} {"train_loss": -23.965957641601562, "global_step": 7583, "epoch": 62} {"train_loss": -23.666540145874023, "global_step": 7584, "epoch": 62} {"train_loss": -23.146757125854492, "global_step": 7585, "epoch": 62} {"train_loss": -23.062633514404297, "global_step": 7586, "epoch": 62} {"train_loss": -23.419099807739258, "global_step": 7587, "epoch": 62} {"train_loss": -23.121726989746094, "global_step": 7588, "epoch": 62} {"train_loss": -22.37019157409668, "global_step": 7589, "epoch": 62} {"train_loss": -21.822431564331055, "global_step": 7590, "epoch": 62} {"train_loss": -22.983484268188477, "global_step": 7591, "epoch": 62} {"train_loss": -22.61672592163086, "global_step": 7592, "epoch": 62} {"train_loss": -22.75800895690918, "global_step": 7593, "epoch": 62} {"train_loss": -23.761157989501953, "global_step": 7594, "epoch": 62} {"train_loss": -23.649765014648438, "global_step": 7595, "epoch": 62} {"train_loss": -23.31456184387207, "global_step": 7596, "epoch": 62} {"train_loss": -23.13082504272461, "global_step": 7597, "epoch": 62} {"train_loss": -23.699064254760742, "global_step": 7598, "epoch": 62} {"train_loss": -23.53317642211914, "global_step": 7599, "epoch": 62} {"train_loss": -23.38724708557129, "global_step": 7600, "epoch": 62} {"train_loss": -23.881580352783203, "global_step": 7601, "epoch": 62} {"train_loss": -23.28662109375, "global_step": 7602, "epoch": 62} {"train_loss": -22.37821388244629, "global_step": 7603, "epoch": 62} {"train_loss": -21.12605094909668, "global_step": 7604, "epoch": 62} {"train_loss": -20.71198081970215, "global_step": 7605, "epoch": 62} {"train_loss": -23.58289909362793, "global_step": 7606, "epoch": 62} {"train_loss": -23.492443084716797, "global_step": 7607, "epoch": 62} {"train_loss": -22.534046173095703, "global_step": 7608, "epoch": 62} {"train_loss": -23.508237838745117, "global_step": 7609, "epoch": 62} {"train_loss": -22.99129295349121, "global_step": 7610, "epoch": 62} {"train_loss": -23.474599838256836, "global_step": 7611, "epoch": 62} {"train_loss": -23.17341423034668, "global_step": 7612, "epoch": 62} {"train_loss": -23.235191345214844, "global_step": 7613, "epoch": 62} {"train_loss": -23.365793228149414, "global_step": 7614, "epoch": 62} {"train_loss": -22.589841842651367, "global_step": 7615, "epoch": 62} {"train_loss": -22.64215660095215, "global_step": 7616, "epoch": 62} {"train_loss": -23.817983627319336, "global_step": 7617, "epoch": 62} {"train_loss": -22.65570640563965, "global_step": 7618, "epoch": 62} {"train_loss": -22.477481842041016, "global_step": 7619, "epoch": 62} {"train_loss": -22.398590087890625, "global_step": 7620, "epoch": 62} {"train_loss": -20.964780807495117, "global_step": 7621, "epoch": 62} {"train_loss": -22.839068594057697, "global_step": 7622, "epoch": 62, "val_loss": 2602591.75} {"train_loss": -22.085845947265625, "global_step": 7623, "epoch": 63} {"train_loss": -19.062164306640625, "global_step": 7624, "epoch": 63} {"train_loss": -22.122610092163086, "global_step": 7625, "epoch": 63} {"train_loss": -23.456758499145508, "global_step": 7626, "epoch": 63} {"train_loss": -21.440900802612305, "global_step": 7627, "epoch": 63} {"train_loss": -20.823928833007812, "global_step": 7628, "epoch": 63} {"train_loss": -22.57880401611328, "global_step": 7629, "epoch": 63} {"train_loss": -22.21257972717285, "global_step": 7630, "epoch": 63} {"train_loss": -21.066320419311523, "global_step": 7631, "epoch": 63} {"train_loss": -21.572431564331055, "global_step": 7632, "epoch": 63} {"train_loss": -21.474842071533203, "global_step": 7633, "epoch": 63} {"train_loss": -22.293087005615234, "global_step": 7634, "epoch": 63} {"train_loss": -22.505325317382812, "global_step": 7635, "epoch": 63} {"train_loss": -22.2362060546875, "global_step": 7636, "epoch": 63} {"train_loss": -22.393348693847656, "global_step": 7637, "epoch": 63} {"train_loss": -21.894638061523438, "global_step": 7638, "epoch": 63} {"train_loss": -22.7413387298584, "global_step": 7639, "epoch": 63} {"train_loss": -22.390317916870117, "global_step": 7640, "epoch": 63} {"train_loss": -22.55899429321289, "global_step": 7641, "epoch": 63} {"train_loss": -22.880416870117188, "global_step": 7642, "epoch": 63} {"train_loss": -22.84627342224121, "global_step": 7643, "epoch": 63} {"train_loss": -23.207836151123047, "global_step": 7644, "epoch": 63} {"train_loss": -22.641454696655273, "global_step": 7645, "epoch": 63} {"train_loss": -22.82884407043457, "global_step": 7646, "epoch": 63} {"train_loss": -23.156593322753906, "global_step": 7647, "epoch": 63} {"train_loss": -22.710037231445312, "global_step": 7648, "epoch": 63} {"train_loss": -22.6225643157959, "global_step": 7649, "epoch": 63} {"train_loss": -23.206342697143555, "global_step": 7650, "epoch": 63} {"train_loss": -23.111600875854492, "global_step": 7651, "epoch": 63} {"train_loss": -23.0585994720459, "global_step": 7652, "epoch": 63} {"train_loss": -22.8752498626709, "global_step": 7653, "epoch": 63} {"train_loss": -22.936582565307617, "global_step": 7654, "epoch": 63} {"train_loss": -22.95224952697754, "global_step": 7655, "epoch": 63} {"train_loss": -22.908315658569336, "global_step": 7656, "epoch": 63} {"train_loss": -22.652389526367188, "global_step": 7657, "epoch": 63} {"train_loss": -22.969087600708008, "global_step": 7658, "epoch": 63} {"train_loss": -23.688169479370117, "global_step": 7659, "epoch": 63} {"train_loss": -22.84970474243164, "global_step": 7660, "epoch": 63} {"train_loss": -22.568286895751953, "global_step": 7661, "epoch": 63} {"train_loss": -22.76496696472168, "global_step": 7662, "epoch": 63} {"train_loss": -22.568283081054688, "global_step": 7663, "epoch": 63} {"train_loss": -23.420576095581055, "global_step": 7664, "epoch": 63} {"train_loss": -23.802490234375, "global_step": 7665, "epoch": 63} {"train_loss": -22.51580238342285, "global_step": 7666, "epoch": 63} {"train_loss": -22.89400291442871, "global_step": 7667, "epoch": 63} {"train_loss": -23.101505279541016, "global_step": 7668, "epoch": 63} {"train_loss": -22.016759872436523, "global_step": 7669, "epoch": 63} {"train_loss": -23.045812606811523, "global_step": 7670, "epoch": 63} {"train_loss": -23.334760665893555, "global_step": 7671, "epoch": 63} {"train_loss": -22.545644760131836, "global_step": 7672, "epoch": 63} {"train_loss": -23.239810943603516, "global_step": 7673, "epoch": 63} {"train_loss": -22.769603729248047, "global_step": 7674, "epoch": 63} {"train_loss": -23.473417282104492, "global_step": 7675, "epoch": 63} {"train_loss": -23.291858673095703, "global_step": 7676, "epoch": 63} {"train_loss": -23.04445457458496, "global_step": 7677, "epoch": 63} {"train_loss": -22.737173080444336, "global_step": 7678, "epoch": 63} {"train_loss": -21.780405044555664, "global_step": 7679, "epoch": 63} {"train_loss": -22.26336097717285, "global_step": 7680, "epoch": 63} {"train_loss": -23.529226303100586, "global_step": 7681, "epoch": 63} {"train_loss": -22.89596939086914, "global_step": 7682, "epoch": 63} {"train_loss": -23.101993560791016, "global_step": 7683, "epoch": 63} {"train_loss": -23.62908935546875, "global_step": 7684, "epoch": 63} {"train_loss": -22.260591506958008, "global_step": 7685, "epoch": 63} {"train_loss": -23.334915161132812, "global_step": 7686, "epoch": 63} {"train_loss": -22.85735511779785, "global_step": 7687, "epoch": 63} {"train_loss": -22.578977584838867, "global_step": 7688, "epoch": 63} {"train_loss": -21.31683921813965, "global_step": 7689, "epoch": 63} {"train_loss": -22.368207931518555, "global_step": 7690, "epoch": 63} {"train_loss": -23.053756713867188, "global_step": 7691, "epoch": 63} {"train_loss": -22.746702194213867, "global_step": 7692, "epoch": 63} {"train_loss": -23.004581451416016, "global_step": 7693, "epoch": 63} {"train_loss": -23.651281356811523, "global_step": 7694, "epoch": 63} {"train_loss": -22.72443199157715, "global_step": 7695, "epoch": 63} {"train_loss": -23.519987106323242, "global_step": 7696, "epoch": 63} {"train_loss": -22.852664947509766, "global_step": 7697, "epoch": 63} {"train_loss": -22.854215621948242, "global_step": 7698, "epoch": 63} {"train_loss": -22.91241455078125, "global_step": 7699, "epoch": 63} {"train_loss": -23.225723266601562, "global_step": 7700, "epoch": 63} {"train_loss": -23.594724655151367, "global_step": 7701, "epoch": 63} {"train_loss": -22.839406967163086, "global_step": 7702, "epoch": 63} {"train_loss": -23.258472442626953, "global_step": 7703, "epoch": 63} {"train_loss": -23.311378479003906, "global_step": 7704, "epoch": 63} {"train_loss": -23.349842071533203, "global_step": 7705, "epoch": 63} {"train_loss": -23.053495407104492, "global_step": 7706, "epoch": 63} {"train_loss": -22.79836654663086, "global_step": 7707, "epoch": 63} {"train_loss": -23.156721115112305, "global_step": 7708, "epoch": 63} {"train_loss": -23.25701904296875, "global_step": 7709, "epoch": 63} {"train_loss": -22.74592399597168, "global_step": 7710, "epoch": 63} {"train_loss": -23.537015914916992, "global_step": 7711, "epoch": 63} {"train_loss": -23.24888038635254, "global_step": 7712, "epoch": 63} {"train_loss": -23.543195724487305, "global_step": 7713, "epoch": 63} {"train_loss": -23.627904891967773, "global_step": 7714, "epoch": 63} {"train_loss": -22.756864547729492, "global_step": 7715, "epoch": 63} {"train_loss": -23.425809860229492, "global_step": 7716, "epoch": 63} {"train_loss": -22.67919158935547, "global_step": 7717, "epoch": 63} {"train_loss": -22.460769653320312, "global_step": 7718, "epoch": 63} {"train_loss": -23.36530113220215, "global_step": 7719, "epoch": 63} {"train_loss": -21.28055191040039, "global_step": 7720, "epoch": 63} {"train_loss": -23.882169723510742, "global_step": 7721, "epoch": 63} {"train_loss": -22.209701538085938, "global_step": 7722, "epoch": 63} {"train_loss": -23.465234756469727, "global_step": 7723, "epoch": 63} {"train_loss": -22.71278953552246, "global_step": 7724, "epoch": 63} {"train_loss": -23.674850463867188, "global_step": 7725, "epoch": 63} {"train_loss": -22.9493465423584, "global_step": 7726, "epoch": 63} {"train_loss": -23.708280563354492, "global_step": 7727, "epoch": 63} {"train_loss": -23.665761947631836, "global_step": 7728, "epoch": 63} {"train_loss": -22.362890243530273, "global_step": 7729, "epoch": 63} {"train_loss": -23.722274780273438, "global_step": 7730, "epoch": 63} {"train_loss": -22.51373863220215, "global_step": 7731, "epoch": 63} {"train_loss": -23.503217697143555, "global_step": 7732, "epoch": 63} {"train_loss": -23.34005355834961, "global_step": 7733, "epoch": 63} {"train_loss": -23.62271499633789, "global_step": 7734, "epoch": 63} {"train_loss": -23.53583335876465, "global_step": 7735, "epoch": 63} {"train_loss": -23.55421257019043, "global_step": 7736, "epoch": 63} {"train_loss": -23.706865310668945, "global_step": 7737, "epoch": 63} {"train_loss": -23.160001754760742, "global_step": 7738, "epoch": 63} {"train_loss": -23.693649291992188, "global_step": 7739, "epoch": 63} {"train_loss": -23.405975341796875, "global_step": 7740, "epoch": 63} {"train_loss": -21.969526290893555, "global_step": 7741, "epoch": 63} {"train_loss": -17.72616958618164, "global_step": 7742, "epoch": 63} {"train_loss": -22.77456797450042, "global_step": 7743, "epoch": 63, "val_loss": 2606395.25} {"train_loss": -14.307830810546875, "global_step": 7744, "epoch": 64} {"train_loss": 4.862091064453125, "global_step": 7745, "epoch": 64} {"train_loss": -0.9119608998298645, "global_step": 7746, "epoch": 64} {"train_loss": -7.113498687744141, "global_step": 7747, "epoch": 64} {"train_loss": -11.243121147155762, "global_step": 7748, "epoch": 64} {"train_loss": -9.368612289428711, "global_step": 7749, "epoch": 64} {"train_loss": -10.252477645874023, "global_step": 7750, "epoch": 64} {"train_loss": -16.06574821472168, "global_step": 7751, "epoch": 64} {"train_loss": -16.55746841430664, "global_step": 7752, "epoch": 64} {"train_loss": -15.127359390258789, "global_step": 7753, "epoch": 64} {"train_loss": -16.75628089904785, "global_step": 7754, "epoch": 64} {"train_loss": -16.324844360351562, "global_step": 7755, "epoch": 64} {"train_loss": -16.884084701538086, "global_step": 7756, "epoch": 64} {"train_loss": -17.689369201660156, "global_step": 7757, "epoch": 64} {"train_loss": -16.994077682495117, "global_step": 7758, "epoch": 64} {"train_loss": -17.88719940185547, "global_step": 7759, "epoch": 64} {"train_loss": -17.793701171875, "global_step": 7760, "epoch": 64} {"train_loss": -17.78773307800293, "global_step": 7761, "epoch": 64} {"train_loss": -18.198558807373047, "global_step": 7762, "epoch": 64} {"train_loss": -18.4761962890625, "global_step": 7763, "epoch": 64} {"train_loss": -18.325946807861328, "global_step": 7764, "epoch": 64} {"train_loss": -18.603227615356445, "global_step": 7765, "epoch": 64} {"train_loss": -18.503332138061523, "global_step": 7766, "epoch": 64} {"train_loss": -18.383190155029297, "global_step": 7767, "epoch": 64} {"train_loss": -18.55655860900879, "global_step": 7768, "epoch": 64} {"train_loss": -18.418598175048828, "global_step": 7769, "epoch": 64} {"train_loss": -18.617406845092773, "global_step": 7770, "epoch": 64} {"train_loss": -18.580951690673828, "global_step": 7771, "epoch": 64} {"train_loss": -19.046632766723633, "global_step": 7772, "epoch": 64} {"train_loss": -18.75819206237793, "global_step": 7773, "epoch": 64} {"train_loss": -19.06721305847168, "global_step": 7774, "epoch": 64} {"train_loss": -19.184755325317383, "global_step": 7775, "epoch": 64} {"train_loss": -18.570444107055664, "global_step": 7776, "epoch": 64} {"train_loss": -19.009733200073242, "global_step": 7777, "epoch": 64} {"train_loss": -19.44942283630371, "global_step": 7778, "epoch": 64} {"train_loss": -19.171533584594727, "global_step": 7779, "epoch": 64} {"train_loss": -19.412124633789062, "global_step": 7780, "epoch": 64} {"train_loss": -20.06046485900879, "global_step": 7781, "epoch": 64} {"train_loss": -20.16626739501953, "global_step": 7782, "epoch": 64} {"train_loss": -19.28141212463379, "global_step": 7783, "epoch": 64} {"train_loss": -20.519794464111328, "global_step": 7784, "epoch": 64} {"train_loss": -20.194839477539062, "global_step": 7785, "epoch": 64} {"train_loss": -20.197248458862305, "global_step": 7786, "epoch": 64} {"train_loss": -20.02351188659668, "global_step": 7787, "epoch": 64} {"train_loss": -19.54086685180664, "global_step": 7788, "epoch": 64} {"train_loss": -20.245817184448242, "global_step": 7789, "epoch": 64} {"train_loss": -20.46772575378418, "global_step": 7790, "epoch": 64} {"train_loss": -20.50830841064453, "global_step": 7791, "epoch": 64} {"train_loss": -20.31179428100586, "global_step": 7792, "epoch": 64} {"train_loss": -20.559049606323242, "global_step": 7793, "epoch": 64} {"train_loss": -19.781639099121094, "global_step": 7794, "epoch": 64} {"train_loss": -20.340970993041992, "global_step": 7795, "epoch": 64} {"train_loss": -21.397781372070312, "global_step": 7796, "epoch": 64} {"train_loss": -20.054716110229492, "global_step": 7797, "epoch": 64} {"train_loss": -20.4735107421875, "global_step": 7798, "epoch": 64} {"train_loss": -19.708768844604492, "global_step": 7799, "epoch": 64} {"train_loss": -20.50613784790039, "global_step": 7800, "epoch": 64} {"train_loss": -20.665552139282227, "global_step": 7801, "epoch": 64} {"train_loss": -20.48291015625, "global_step": 7802, "epoch": 64} {"train_loss": -21.488628387451172, "global_step": 7803, "epoch": 64} {"train_loss": -21.173419952392578, "global_step": 7804, "epoch": 64} {"train_loss": -21.06123924255371, "global_step": 7805, "epoch": 64} {"train_loss": -21.146312713623047, "global_step": 7806, "epoch": 64} {"train_loss": -21.521329879760742, "global_step": 7807, "epoch": 64} {"train_loss": -20.809085845947266, "global_step": 7808, "epoch": 64} {"train_loss": -21.271669387817383, "global_step": 7809, "epoch": 64} {"train_loss": -20.909658432006836, "global_step": 7810, "epoch": 64} {"train_loss": -20.899200439453125, "global_step": 7811, "epoch": 64} {"train_loss": -20.793628692626953, "global_step": 7812, "epoch": 64} {"train_loss": -18.252925872802734, "global_step": 7813, "epoch": 64} {"train_loss": -12.739725112915039, "global_step": 7814, "epoch": 64} {"train_loss": -18.034656524658203, "global_step": 7815, "epoch": 64} {"train_loss": -18.42580223083496, "global_step": 7816, "epoch": 64} {"train_loss": -21.065448760986328, "global_step": 7817, "epoch": 64} {"train_loss": -18.63990020751953, "global_step": 7818, "epoch": 64} {"train_loss": -19.716341018676758, "global_step": 7819, "epoch": 64} {"train_loss": -21.349206924438477, "global_step": 7820, "epoch": 64} {"train_loss": -20.293066024780273, "global_step": 7821, "epoch": 64} {"train_loss": -19.482236862182617, "global_step": 7822, "epoch": 64} {"train_loss": -20.957149505615234, "global_step": 7823, "epoch": 64} {"train_loss": -21.21697235107422, "global_step": 7824, "epoch": 64} {"train_loss": -21.2595157623291, "global_step": 7825, "epoch": 64} {"train_loss": -20.27545738220215, "global_step": 7826, "epoch": 64} {"train_loss": -20.685415267944336, "global_step": 7827, "epoch": 64} {"train_loss": -21.720508575439453, "global_step": 7828, "epoch": 64} {"train_loss": -20.925186157226562, "global_step": 7829, "epoch": 64} {"train_loss": -20.961807250976562, "global_step": 7830, "epoch": 64} {"train_loss": -21.419919967651367, "global_step": 7831, "epoch": 64} {"train_loss": -21.418588638305664, "global_step": 7832, "epoch": 64} {"train_loss": -21.188589096069336, "global_step": 7833, "epoch": 64} {"train_loss": -20.62046241760254, "global_step": 7834, "epoch": 64} {"train_loss": -21.31275749206543, "global_step": 7835, "epoch": 64} {"train_loss": -21.237089157104492, "global_step": 7836, "epoch": 64} {"train_loss": -21.512907028198242, "global_step": 7837, "epoch": 64} {"train_loss": -20.983280181884766, "global_step": 7838, "epoch": 64} {"train_loss": -21.10967445373535, "global_step": 7839, "epoch": 64} {"train_loss": -21.253217697143555, "global_step": 7840, "epoch": 64} {"train_loss": -19.28706932067871, "global_step": 7841, "epoch": 64} {"train_loss": -17.217370986938477, "global_step": 7842, "epoch": 64} {"train_loss": -12.640007972717285, "global_step": 7843, "epoch": 64} {"train_loss": -21.300443649291992, "global_step": 7844, "epoch": 64} {"train_loss": -17.832489013671875, "global_step": 7845, "epoch": 64} {"train_loss": -20.7603702545166, "global_step": 7846, "epoch": 64} {"train_loss": -20.43471336364746, "global_step": 7847, "epoch": 64} {"train_loss": -20.01759910583496, "global_step": 7848, "epoch": 64} {"train_loss": -20.230375289916992, "global_step": 7849, "epoch": 64} {"train_loss": -21.070966720581055, "global_step": 7850, "epoch": 64} {"train_loss": -20.91339683532715, "global_step": 7851, "epoch": 64} {"train_loss": -21.120651245117188, "global_step": 7852, "epoch": 64} {"train_loss": -20.36935806274414, "global_step": 7853, "epoch": 64} {"train_loss": -20.67327880859375, "global_step": 7854, "epoch": 64} {"train_loss": -20.920045852661133, "global_step": 7855, "epoch": 64} {"train_loss": -20.964801788330078, "global_step": 7856, "epoch": 64} {"train_loss": -21.021167755126953, "global_step": 7857, "epoch": 64} {"train_loss": -21.280263900756836, "global_step": 7858, "epoch": 64} {"train_loss": -21.332448959350586, "global_step": 7859, "epoch": 64} {"train_loss": -20.58489990234375, "global_step": 7860, "epoch": 64} {"train_loss": -19.60575294494629, "global_step": 7861, "epoch": 64} {"train_loss": -11.534642219543457, "global_step": 7862, "epoch": 64} {"train_loss": -16.379911422729492, "global_step": 7863, "epoch": 64} {"train_loss": -18.87011893179791, "global_step": 7864, "epoch": 64, "val_loss": 3783878.0} {"train_loss": -18.43482208251953, "global_step": 7865, "epoch": 65} {"train_loss": -21.108652114868164, "global_step": 7866, "epoch": 65} {"train_loss": -19.625349044799805, "global_step": 7867, "epoch": 65} {"train_loss": -20.035858154296875, "global_step": 7868, "epoch": 65} {"train_loss": -20.290708541870117, "global_step": 7869, "epoch": 65} {"train_loss": -20.818828582763672, "global_step": 7870, "epoch": 65} {"train_loss": -20.57745933532715, "global_step": 7871, "epoch": 65} {"train_loss": -19.633285522460938, "global_step": 7872, "epoch": 65} {"train_loss": -20.87493896484375, "global_step": 7873, "epoch": 65} {"train_loss": -20.559696197509766, "global_step": 7874, "epoch": 65} {"train_loss": -20.639705657958984, "global_step": 7875, "epoch": 65} {"train_loss": -20.08485984802246, "global_step": 7876, "epoch": 65} {"train_loss": -20.197052001953125, "global_step": 7877, "epoch": 65} {"train_loss": -20.33183479309082, "global_step": 7878, "epoch": 65} {"train_loss": -20.345630645751953, "global_step": 7879, "epoch": 65} {"train_loss": -20.814430236816406, "global_step": 7880, "epoch": 65} {"train_loss": -20.745574951171875, "global_step": 7881, "epoch": 65} {"train_loss": -21.041717529296875, "global_step": 7882, "epoch": 65} {"train_loss": -21.25628089904785, "global_step": 7883, "epoch": 65} {"train_loss": -21.366455078125, "global_step": 7884, "epoch": 65} {"train_loss": -20.914249420166016, "global_step": 7885, "epoch": 65} {"train_loss": -21.394363403320312, "global_step": 7886, "epoch": 65} {"train_loss": -21.257904052734375, "global_step": 7887, "epoch": 65} {"train_loss": -21.3790340423584, "global_step": 7888, "epoch": 65} {"train_loss": -21.146635055541992, "global_step": 7889, "epoch": 65} {"train_loss": -21.63915252685547, "global_step": 7890, "epoch": 65} {"train_loss": -21.4730224609375, "global_step": 7891, "epoch": 65} {"train_loss": -21.66214942932129, "global_step": 7892, "epoch": 65} {"train_loss": -21.622310638427734, "global_step": 7893, "epoch": 65} {"train_loss": -21.53750991821289, "global_step": 7894, "epoch": 65} {"train_loss": -21.588804244995117, "global_step": 7895, "epoch": 65} {"train_loss": -21.781951904296875, "global_step": 7896, "epoch": 65} {"train_loss": -21.997888565063477, "global_step": 7897, "epoch": 65} {"train_loss": -21.768482208251953, "global_step": 7898, "epoch": 65} {"train_loss": -22.135190963745117, "global_step": 7899, "epoch": 65} {"train_loss": -22.253860473632812, "global_step": 7900, "epoch": 65} {"train_loss": -22.36602210998535, "global_step": 7901, "epoch": 65} {"train_loss": -22.352813720703125, "global_step": 7902, "epoch": 65} {"train_loss": -22.466861724853516, "global_step": 7903, "epoch": 65} {"train_loss": -22.324460983276367, "global_step": 7904, "epoch": 65} {"train_loss": -22.292348861694336, "global_step": 7905, "epoch": 65} {"train_loss": -22.453330993652344, "global_step": 7906, "epoch": 65} {"train_loss": -22.37647819519043, "global_step": 7907, "epoch": 65} {"train_loss": -22.56683921813965, "global_step": 7908, "epoch": 65} {"train_loss": -22.46370506286621, "global_step": 7909, "epoch": 65} {"train_loss": -22.36263084411621, "global_step": 7910, "epoch": 65} {"train_loss": -23.0314998626709, "global_step": 7911, "epoch": 65} {"train_loss": -22.452951431274414, "global_step": 7912, "epoch": 65} {"train_loss": -21.226491928100586, "global_step": 7913, "epoch": 65} {"train_loss": -17.653684616088867, "global_step": 7914, "epoch": 65} {"train_loss": -20.82325553894043, "global_step": 7915, "epoch": 65} {"train_loss": -22.744970321655273, "global_step": 7916, "epoch": 65} {"train_loss": -19.479206085205078, "global_step": 7917, "epoch": 65} {"train_loss": -22.70588493347168, "global_step": 7918, "epoch": 65} {"train_loss": -20.99384117126465, "global_step": 7919, "epoch": 65} {"train_loss": -22.19142723083496, "global_step": 7920, "epoch": 65} {"train_loss": -21.775636672973633, "global_step": 7921, "epoch": 65} {"train_loss": -22.272382736206055, "global_step": 7922, "epoch": 65} {"train_loss": -22.046615600585938, "global_step": 7923, "epoch": 65} {"train_loss": -22.488479614257812, "global_step": 7924, "epoch": 65} {"train_loss": -22.1794376373291, "global_step": 7925, "epoch": 65} {"train_loss": -22.4368839263916, "global_step": 7926, "epoch": 65} {"train_loss": -21.295576095581055, "global_step": 7927, "epoch": 65} {"train_loss": -21.761493682861328, "global_step": 7928, "epoch": 65} {"train_loss": -22.717044830322266, "global_step": 7929, "epoch": 65} {"train_loss": -22.581954956054688, "global_step": 7930, "epoch": 65} {"train_loss": -21.705434799194336, "global_step": 7931, "epoch": 65} {"train_loss": -22.950733184814453, "global_step": 7932, "epoch": 65} {"train_loss": -22.381484985351562, "global_step": 7933, "epoch": 65} {"train_loss": -21.382070541381836, "global_step": 7934, "epoch": 65} {"train_loss": -20.757802963256836, "global_step": 7935, "epoch": 65} {"train_loss": -13.583581924438477, "global_step": 7936, "epoch": 65} {"train_loss": -7.315121650695801, "global_step": 7937, "epoch": 65} {"train_loss": -16.853199005126953, "global_step": 7938, "epoch": 65} {"train_loss": -15.990092277526855, "global_step": 7939, "epoch": 65} {"train_loss": -14.15783405303955, "global_step": 7940, "epoch": 65} {"train_loss": -20.357616424560547, "global_step": 7941, "epoch": 65} {"train_loss": -20.41654396057129, "global_step": 7942, "epoch": 65} {"train_loss": -20.25404930114746, "global_step": 7943, "epoch": 65} {"train_loss": -20.101764678955078, "global_step": 7944, "epoch": 65} {"train_loss": -19.459012985229492, "global_step": 7945, "epoch": 65} {"train_loss": -19.015043258666992, "global_step": 7946, "epoch": 65} {"train_loss": -20.146337509155273, "global_step": 7947, "epoch": 65} {"train_loss": -19.981897354125977, "global_step": 7948, "epoch": 65} {"train_loss": -19.62652015686035, "global_step": 7949, "epoch": 65} {"train_loss": -20.50442886352539, "global_step": 7950, "epoch": 65} {"train_loss": -20.327543258666992, "global_step": 7951, "epoch": 65} {"train_loss": -20.139474868774414, "global_step": 7952, "epoch": 65} {"train_loss": -20.377246856689453, "global_step": 7953, "epoch": 65} {"train_loss": -19.84358787536621, "global_step": 7954, "epoch": 65} {"train_loss": -21.31158447265625, "global_step": 7955, "epoch": 65} {"train_loss": -20.368579864501953, "global_step": 7956, "epoch": 65} {"train_loss": -20.573034286499023, "global_step": 7957, "epoch": 65} {"train_loss": -20.238327026367188, "global_step": 7958, "epoch": 65} {"train_loss": -20.61671257019043, "global_step": 7959, "epoch": 65} {"train_loss": -20.845918655395508, "global_step": 7960, "epoch": 65} {"train_loss": -20.655241012573242, "global_step": 7961, "epoch": 65} {"train_loss": -20.560129165649414, "global_step": 7962, "epoch": 65} {"train_loss": -20.536151885986328, "global_step": 7963, "epoch": 65} {"train_loss": -21.27335548400879, "global_step": 7964, "epoch": 65} {"train_loss": -21.03997230529785, "global_step": 7965, "epoch": 65} {"train_loss": -21.373064041137695, "global_step": 7966, "epoch": 65} {"train_loss": -20.861328125, "global_step": 7967, "epoch": 65} {"train_loss": -21.07698631286621, "global_step": 7968, "epoch": 65} {"train_loss": -20.708019256591797, "global_step": 7969, "epoch": 65} {"train_loss": -21.374269485473633, "global_step": 7970, "epoch": 65} {"train_loss": -21.105361938476562, "global_step": 7971, "epoch": 65} {"train_loss": -21.603681564331055, "global_step": 7972, "epoch": 65} {"train_loss": -20.92635154724121, "global_step": 7973, "epoch": 65} {"train_loss": -21.65608787536621, "global_step": 7974, "epoch": 65} {"train_loss": -21.384061813354492, "global_step": 7975, "epoch": 65} {"train_loss": -22.064268112182617, "global_step": 7976, "epoch": 65} {"train_loss": -21.742944717407227, "global_step": 7977, "epoch": 65} {"train_loss": -21.40680503845215, "global_step": 7978, "epoch": 65} {"train_loss": -21.42986488342285, "global_step": 7979, "epoch": 65} {"train_loss": -21.50398063659668, "global_step": 7980, "epoch": 65} {"train_loss": -21.577640533447266, "global_step": 7981, "epoch": 65} {"train_loss": -21.378925323486328, "global_step": 7982, "epoch": 65} {"train_loss": -21.754596710205078, "global_step": 7983, "epoch": 65} {"train_loss": -21.781972885131836, "global_step": 7984, "epoch": 65} {"train_loss": -20.884262881003135, "global_step": 7985, "epoch": 65, "val_loss": 3017310.25} {"train_loss": -22.292556762695312, "global_step": 7986, "epoch": 66} {"train_loss": -21.875125885009766, "global_step": 7987, "epoch": 66} {"train_loss": -21.861095428466797, "global_step": 7988, "epoch": 66} {"train_loss": -22.025476455688477, "global_step": 7989, "epoch": 66} {"train_loss": -22.321138381958008, "global_step": 7990, "epoch": 66} {"train_loss": -22.069412231445312, "global_step": 7991, "epoch": 66} {"train_loss": -22.047998428344727, "global_step": 7992, "epoch": 66} {"train_loss": -21.73665428161621, "global_step": 7993, "epoch": 66} {"train_loss": -20.880672454833984, "global_step": 7994, "epoch": 66} {"train_loss": -17.671955108642578, "global_step": 7995, "epoch": 66} {"train_loss": -13.452323913574219, "global_step": 7996, "epoch": 66} {"train_loss": -11.69123363494873, "global_step": 7997, "epoch": 66} {"train_loss": -16.732486724853516, "global_step": 7998, "epoch": 66} {"train_loss": -10.13888168334961, "global_step": 7999, "epoch": 66} {"train_loss": -19.041269302368164, "global_step": 8000, "epoch": 66} {"train_loss": -16.452564239501953, "global_step": 8001, "epoch": 66} {"train_loss": -19.927947998046875, "global_step": 8002, "epoch": 66} {"train_loss": -17.201190948486328, "global_step": 8003, "epoch": 66} {"train_loss": -19.82720184326172, "global_step": 8004, "epoch": 66} {"train_loss": -19.743343353271484, "global_step": 8005, "epoch": 66} {"train_loss": -20.136199951171875, "global_step": 8006, "epoch": 66} {"train_loss": -19.680917739868164, "global_step": 8007, "epoch": 66} {"train_loss": -20.076459884643555, "global_step": 8008, "epoch": 66} {"train_loss": -19.617483139038086, "global_step": 8009, "epoch": 66} {"train_loss": -19.8192195892334, "global_step": 8010, "epoch": 66} {"train_loss": -20.22060203552246, "global_step": 8011, "epoch": 66} {"train_loss": -19.883132934570312, "global_step": 8012, "epoch": 66} {"train_loss": -20.442792892456055, "global_step": 8013, "epoch": 66} {"train_loss": -20.374244689941406, "global_step": 8014, "epoch": 66} {"train_loss": -20.183568954467773, "global_step": 8015, "epoch": 66} {"train_loss": -20.135692596435547, "global_step": 8016, "epoch": 66} {"train_loss": -20.25689125061035, "global_step": 8017, "epoch": 66} {"train_loss": -20.34401512145996, "global_step": 8018, "epoch": 66} {"train_loss": -20.407455444335938, "global_step": 8019, "epoch": 66} {"train_loss": -20.452795028686523, "global_step": 8020, "epoch": 66} {"train_loss": -20.050922393798828, "global_step": 8021, "epoch": 66} {"train_loss": -20.267019271850586, "global_step": 8022, "epoch": 66} {"train_loss": -20.147497177124023, "global_step": 8023, "epoch": 66} {"train_loss": -20.52778434753418, "global_step": 8024, "epoch": 66} {"train_loss": -20.936460494995117, "global_step": 8025, "epoch": 66} {"train_loss": -20.28192710876465, "global_step": 8026, "epoch": 66} {"train_loss": -20.276966094970703, "global_step": 8027, "epoch": 66} {"train_loss": -20.591413497924805, "global_step": 8028, "epoch": 66} {"train_loss": -20.7177791595459, "global_step": 8029, "epoch": 66} {"train_loss": -20.363374710083008, "global_step": 8030, "epoch": 66} {"train_loss": -20.79695701599121, "global_step": 8031, "epoch": 66} {"train_loss": -20.702579498291016, "global_step": 8032, "epoch": 66} {"train_loss": -20.84364128112793, "global_step": 8033, "epoch": 66} {"train_loss": -20.928512573242188, "global_step": 8034, "epoch": 66} {"train_loss": -20.922964096069336, "global_step": 8035, "epoch": 66} {"train_loss": -21.279775619506836, "global_step": 8036, "epoch": 66} {"train_loss": -20.837581634521484, "global_step": 8037, "epoch": 66} {"train_loss": -21.25556755065918, "global_step": 8038, "epoch": 66} {"train_loss": -21.442182540893555, "global_step": 8039, "epoch": 66} {"train_loss": -21.098953247070312, "global_step": 8040, "epoch": 66} {"train_loss": -21.276769638061523, "global_step": 8041, "epoch": 66} {"train_loss": -21.496835708618164, "global_step": 8042, "epoch": 66} {"train_loss": -21.414518356323242, "global_step": 8043, "epoch": 66} {"train_loss": -21.338876724243164, "global_step": 8044, "epoch": 66} {"train_loss": -21.16572380065918, "global_step": 8045, "epoch": 66} {"train_loss": -21.5238037109375, "global_step": 8046, "epoch": 66} {"train_loss": -22.116474151611328, "global_step": 8047, "epoch": 66} {"train_loss": -22.005163192749023, "global_step": 8048, "epoch": 66} {"train_loss": -22.022613525390625, "global_step": 8049, "epoch": 66} {"train_loss": -22.286115646362305, "global_step": 8050, "epoch": 66} {"train_loss": -21.784353256225586, "global_step": 8051, "epoch": 66} {"train_loss": -21.94936752319336, "global_step": 8052, "epoch": 66} {"train_loss": -22.03657341003418, "global_step": 8053, "epoch": 66} {"train_loss": -21.766061782836914, "global_step": 8054, "epoch": 66} {"train_loss": -22.19944190979004, "global_step": 8055, "epoch": 66} {"train_loss": -21.705209732055664, "global_step": 8056, "epoch": 66} {"train_loss": -22.01027488708496, "global_step": 8057, "epoch": 66} {"train_loss": -21.518774032592773, "global_step": 8058, "epoch": 66} {"train_loss": -22.268709182739258, "global_step": 8059, "epoch": 66} {"train_loss": -22.8010311126709, "global_step": 8060, "epoch": 66} {"train_loss": -22.076580047607422, "global_step": 8061, "epoch": 66} {"train_loss": -22.257299423217773, "global_step": 8062, "epoch": 66} {"train_loss": -22.18207550048828, "global_step": 8063, "epoch": 66} {"train_loss": -22.416950225830078, "global_step": 8064, "epoch": 66} {"train_loss": -22.560043334960938, "global_step": 8065, "epoch": 66} {"train_loss": -22.513025283813477, "global_step": 8066, "epoch": 66} {"train_loss": -22.24447250366211, "global_step": 8067, "epoch": 66} {"train_loss": -22.571746826171875, "global_step": 8068, "epoch": 66} {"train_loss": -22.54589080810547, "global_step": 8069, "epoch": 66} {"train_loss": -23.089223861694336, "global_step": 8070, "epoch": 66} {"train_loss": -22.815731048583984, "global_step": 8071, "epoch": 66} {"train_loss": -22.923189163208008, "global_step": 8072, "epoch": 66} {"train_loss": -22.676136016845703, "global_step": 8073, "epoch": 66} {"train_loss": -23.121427536010742, "global_step": 8074, "epoch": 66} {"train_loss": -23.28583335876465, "global_step": 8075, "epoch": 66} {"train_loss": -22.88945770263672, "global_step": 8076, "epoch": 66} {"train_loss": -22.999248504638672, "global_step": 8077, "epoch": 66} {"train_loss": -23.059484481811523, "global_step": 8078, "epoch": 66} {"train_loss": -23.2025089263916, "global_step": 8079, "epoch": 66} {"train_loss": -23.070993423461914, "global_step": 8080, "epoch": 66} {"train_loss": -23.49654769897461, "global_step": 8081, "epoch": 66} {"train_loss": -23.15458106994629, "global_step": 8082, "epoch": 66} {"train_loss": -23.547504425048828, "global_step": 8083, "epoch": 66} {"train_loss": -23.424442291259766, "global_step": 8084, "epoch": 66} {"train_loss": -23.234643936157227, "global_step": 8085, "epoch": 66} {"train_loss": -23.082233428955078, "global_step": 8086, "epoch": 66} {"train_loss": -23.418609619140625, "global_step": 8087, "epoch": 66} {"train_loss": -23.496488571166992, "global_step": 8088, "epoch": 66} {"train_loss": -23.788257598876953, "global_step": 8089, "epoch": 66} {"train_loss": -23.648584365844727, "global_step": 8090, "epoch": 66} {"train_loss": -23.576879501342773, "global_step": 8091, "epoch": 66} {"train_loss": -23.866195678710938, "global_step": 8092, "epoch": 66} {"train_loss": -23.599321365356445, "global_step": 8093, "epoch": 66} {"train_loss": -23.49022674560547, "global_step": 8094, "epoch": 66} {"train_loss": -23.709352493286133, "global_step": 8095, "epoch": 66} {"train_loss": -23.004959106445312, "global_step": 8096, "epoch": 66} {"train_loss": -23.309829711914062, "global_step": 8097, "epoch": 66} {"train_loss": -21.438364028930664, "global_step": 8098, "epoch": 66} {"train_loss": -15.05602741241455, "global_step": 8099, "epoch": 66} {"train_loss": -13.423898696899414, "global_step": 8100, "epoch": 66} {"train_loss": -21.3233699798584, "global_step": 8101, "epoch": 66} {"train_loss": -19.366567611694336, "global_step": 8102, "epoch": 66} {"train_loss": -22.5450496673584, "global_step": 8103, "epoch": 66} {"train_loss": -20.11781120300293, "global_step": 8104, "epoch": 66} {"train_loss": -22.8370304107666, "global_step": 8105, "epoch": 66} {"train_loss": -21.184552358201714, "global_step": 8106, "epoch": 66, "val_loss": 3249459.25} {"train_loss": -21.80074119567871, "global_step": 8107, "epoch": 67} {"train_loss": -22.72771644592285, "global_step": 8108, "epoch": 67} {"train_loss": -22.21343994140625, "global_step": 8109, "epoch": 67} {"train_loss": -22.964075088500977, "global_step": 8110, "epoch": 67} {"train_loss": -21.9625301361084, "global_step": 8111, "epoch": 67} {"train_loss": -22.174245834350586, "global_step": 8112, "epoch": 67} {"train_loss": -22.469039916992188, "global_step": 8113, "epoch": 67} {"train_loss": -22.90109634399414, "global_step": 8114, "epoch": 67} {"train_loss": -22.810346603393555, "global_step": 8115, "epoch": 67} {"train_loss": -22.34210777282715, "global_step": 8116, "epoch": 67} {"train_loss": -21.963436126708984, "global_step": 8117, "epoch": 67} {"train_loss": -22.611764907836914, "global_step": 8118, "epoch": 67} {"train_loss": -22.17629051208496, "global_step": 8119, "epoch": 67} {"train_loss": -22.349950790405273, "global_step": 8120, "epoch": 67} {"train_loss": -22.942426681518555, "global_step": 8121, "epoch": 67} {"train_loss": -22.88992691040039, "global_step": 8122, "epoch": 67} {"train_loss": -22.222196578979492, "global_step": 8123, "epoch": 67} {"train_loss": -23.173851013183594, "global_step": 8124, "epoch": 67} {"train_loss": -22.646682739257812, "global_step": 8125, "epoch": 67} {"train_loss": -22.87103843688965, "global_step": 8126, "epoch": 67} {"train_loss": -22.96004295349121, "global_step": 8127, "epoch": 67} {"train_loss": -22.611392974853516, "global_step": 8128, "epoch": 67} {"train_loss": -22.96011734008789, "global_step": 8129, "epoch": 67} {"train_loss": -20.547130584716797, "global_step": 8130, "epoch": 67} {"train_loss": -5.630061626434326, "global_step": 8131, "epoch": 67} {"train_loss": -5.344241619110107, "global_step": 8132, "epoch": 67} {"train_loss": -7.511735439300537, "global_step": 8133, "epoch": 67} {"train_loss": -8.521151542663574, "global_step": 8134, "epoch": 67} {"train_loss": -12.345986366271973, "global_step": 8135, "epoch": 67} {"train_loss": -12.63325023651123, "global_step": 8136, "epoch": 67} {"train_loss": -14.103116035461426, "global_step": 8137, "epoch": 67} {"train_loss": -17.121992111206055, "global_step": 8138, "epoch": 67} {"train_loss": -14.90539836883545, "global_step": 8139, "epoch": 67} {"train_loss": -17.724672317504883, "global_step": 8140, "epoch": 67} {"train_loss": -18.66847038269043, "global_step": 8141, "epoch": 67} {"train_loss": -18.716840744018555, "global_step": 8142, "epoch": 67} {"train_loss": -19.08136558532715, "global_step": 8143, "epoch": 67} {"train_loss": -19.313684463500977, "global_step": 8144, "epoch": 67} {"train_loss": -19.532424926757812, "global_step": 8145, "epoch": 67} {"train_loss": -20.3276309967041, "global_step": 8146, "epoch": 67} {"train_loss": -20.687917709350586, "global_step": 8147, "epoch": 67} {"train_loss": -20.70728874206543, "global_step": 8148, "epoch": 67} {"train_loss": -20.37366485595703, "global_step": 8149, "epoch": 67} {"train_loss": -20.613689422607422, "global_step": 8150, "epoch": 67} {"train_loss": -21.09754753112793, "global_step": 8151, "epoch": 67} {"train_loss": -20.641977310180664, "global_step": 8152, "epoch": 67} {"train_loss": -21.225061416625977, "global_step": 8153, "epoch": 67} {"train_loss": -20.87647819519043, "global_step": 8154, "epoch": 67} {"train_loss": -21.241296768188477, "global_step": 8155, "epoch": 67} {"train_loss": -21.3189754486084, "global_step": 8156, "epoch": 67} {"train_loss": -21.653594970703125, "global_step": 8157, "epoch": 67} {"train_loss": -21.065271377563477, "global_step": 8158, "epoch": 67} {"train_loss": -21.292800903320312, "global_step": 8159, "epoch": 67} {"train_loss": -21.292430877685547, "global_step": 8160, "epoch": 67} {"train_loss": -21.604171752929688, "global_step": 8161, "epoch": 67} {"train_loss": -22.304712295532227, "global_step": 8162, "epoch": 67} {"train_loss": -21.704923629760742, "global_step": 8163, "epoch": 67} {"train_loss": -21.877090454101562, "global_step": 8164, "epoch": 67} {"train_loss": -21.836435317993164, "global_step": 8165, "epoch": 67} {"train_loss": -21.693565368652344, "global_step": 8166, "epoch": 67} {"train_loss": -21.509475708007812, "global_step": 8167, "epoch": 67} {"train_loss": -21.678939819335938, "global_step": 8168, "epoch": 67} {"train_loss": -22.0363712310791, "global_step": 8169, "epoch": 67} {"train_loss": -20.917926788330078, "global_step": 8170, "epoch": 67} {"train_loss": -22.138708114624023, "global_step": 8171, "epoch": 67} {"train_loss": -22.718008041381836, "global_step": 8172, "epoch": 67} {"train_loss": -21.32139778137207, "global_step": 8173, "epoch": 67} {"train_loss": -21.792734146118164, "global_step": 8174, "epoch": 67} {"train_loss": -22.23955726623535, "global_step": 8175, "epoch": 67} {"train_loss": -21.646265029907227, "global_step": 8176, "epoch": 67} {"train_loss": -22.242456436157227, "global_step": 8177, "epoch": 67} {"train_loss": -21.843183517456055, "global_step": 8178, "epoch": 67} {"train_loss": -21.796903610229492, "global_step": 8179, "epoch": 67} {"train_loss": -22.046241760253906, "global_step": 8180, "epoch": 67} {"train_loss": -22.466053009033203, "global_step": 8181, "epoch": 67} {"train_loss": -22.005081176757812, "global_step": 8182, "epoch": 67} {"train_loss": -22.133075714111328, "global_step": 8183, "epoch": 67} {"train_loss": -22.264747619628906, "global_step": 8184, "epoch": 67} {"train_loss": -22.321670532226562, "global_step": 8185, "epoch": 67} {"train_loss": -22.478214263916016, "global_step": 8186, "epoch": 67} {"train_loss": -22.25422477722168, "global_step": 8187, "epoch": 67} {"train_loss": -22.833940505981445, "global_step": 8188, "epoch": 67} {"train_loss": -22.279516220092773, "global_step": 8189, "epoch": 67} {"train_loss": -22.931095123291016, "global_step": 8190, "epoch": 67} {"train_loss": -22.405521392822266, "global_step": 8191, "epoch": 67} {"train_loss": -22.4327449798584, "global_step": 8192, "epoch": 67} {"train_loss": -22.570276260375977, "global_step": 8193, "epoch": 67} {"train_loss": -22.513935089111328, "global_step": 8194, "epoch": 67} {"train_loss": -22.850656509399414, "global_step": 8195, "epoch": 67} {"train_loss": -22.705724716186523, "global_step": 8196, "epoch": 67} {"train_loss": -22.937650680541992, "global_step": 8197, "epoch": 67} {"train_loss": -22.37935447692871, "global_step": 8198, "epoch": 67} {"train_loss": -22.45183753967285, "global_step": 8199, "epoch": 67} {"train_loss": -22.461410522460938, "global_step": 8200, "epoch": 67} {"train_loss": -22.46573829650879, "global_step": 8201, "epoch": 67} {"train_loss": -22.48828125, "global_step": 8202, "epoch": 67} {"train_loss": -23.03761100769043, "global_step": 8203, "epoch": 67} {"train_loss": -23.17587661743164, "global_step": 8204, "epoch": 67} {"train_loss": -22.9534912109375, "global_step": 8205, "epoch": 67} {"train_loss": -22.64536476135254, "global_step": 8206, "epoch": 67} {"train_loss": -22.646129608154297, "global_step": 8207, "epoch": 67} {"train_loss": -23.34098243713379, "global_step": 8208, "epoch": 67} {"train_loss": -22.376296997070312, "global_step": 8209, "epoch": 67} {"train_loss": -22.46946144104004, "global_step": 8210, "epoch": 67} {"train_loss": -23.167713165283203, "global_step": 8211, "epoch": 67} {"train_loss": -23.358610153198242, "global_step": 8212, "epoch": 67} {"train_loss": -22.54874038696289, "global_step": 8213, "epoch": 67} {"train_loss": -22.976428985595703, "global_step": 8214, "epoch": 67} {"train_loss": -23.46870994567871, "global_step": 8215, "epoch": 67} {"train_loss": -22.79486656188965, "global_step": 8216, "epoch": 67} {"train_loss": -22.7089786529541, "global_step": 8217, "epoch": 67} {"train_loss": -23.053869247436523, "global_step": 8218, "epoch": 67} {"train_loss": -22.903095245361328, "global_step": 8219, "epoch": 67} {"train_loss": -23.044923782348633, "global_step": 8220, "epoch": 67} {"train_loss": -22.40806007385254, "global_step": 8221, "epoch": 67} {"train_loss": -21.370986938476562, "global_step": 8222, "epoch": 67} {"train_loss": -14.881964683532715, "global_step": 8223, "epoch": 67} {"train_loss": -5.669286251068115, "global_step": 8224, "epoch": 67} {"train_loss": -6.619897365570068, "global_step": 8225, "epoch": 67} {"train_loss": -7.7234930992126465, "global_step": 8226, "epoch": 67} {"train_loss": -20.63508038481405, "global_step": 8227, "epoch": 67, "val_loss": 5543309.5} {"train_loss": -8.206194877624512, "global_step": 8228, "epoch": 68} {"train_loss": -7.603814601898193, "global_step": 8229, "epoch": 68} {"train_loss": -8.253865242004395, "global_step": 8230, "epoch": 68} {"train_loss": -8.34724235534668, "global_step": 8231, "epoch": 68} {"train_loss": -9.732260704040527, "global_step": 8232, "epoch": 68} {"train_loss": -11.156088829040527, "global_step": 8233, "epoch": 68} {"train_loss": -10.7634916305542, "global_step": 8234, "epoch": 68} {"train_loss": -11.31470775604248, "global_step": 8235, "epoch": 68} {"train_loss": -10.431113243103027, "global_step": 8236, "epoch": 68} {"train_loss": -11.559854507446289, "global_step": 8237, "epoch": 68} {"train_loss": -12.537025451660156, "global_step": 8238, "epoch": 68} {"train_loss": -12.375868797302246, "global_step": 8239, "epoch": 68} {"train_loss": -11.941447257995605, "global_step": 8240, "epoch": 68} {"train_loss": -13.517804145812988, "global_step": 8241, "epoch": 68} {"train_loss": -11.019049644470215, "global_step": 8242, "epoch": 68} {"train_loss": -11.10376262664795, "global_step": 8243, "epoch": 68} {"train_loss": -12.840112686157227, "global_step": 8244, "epoch": 68} {"train_loss": -12.121298789978027, "global_step": 8245, "epoch": 68} {"train_loss": -13.677337646484375, "global_step": 8246, "epoch": 68} {"train_loss": -14.008035659790039, "global_step": 8247, "epoch": 68} {"train_loss": -13.050165176391602, "global_step": 8248, "epoch": 68} {"train_loss": -14.003283500671387, "global_step": 8249, "epoch": 68} {"train_loss": -13.8250150680542, "global_step": 8250, "epoch": 68} {"train_loss": -14.804341316223145, "global_step": 8251, "epoch": 68} {"train_loss": -12.781780242919922, "global_step": 8252, "epoch": 68} {"train_loss": -14.488824844360352, "global_step": 8253, "epoch": 68} {"train_loss": -13.083086967468262, "global_step": 8254, "epoch": 68} {"train_loss": -13.329492568969727, "global_step": 8255, "epoch": 68} {"train_loss": -15.063580513000488, "global_step": 8256, "epoch": 68} {"train_loss": -14.209540367126465, "global_step": 8257, "epoch": 68} {"train_loss": -14.149563789367676, "global_step": 8258, "epoch": 68} {"train_loss": -15.627023696899414, "global_step": 8259, "epoch": 68} {"train_loss": -16.5148983001709, "global_step": 8260, "epoch": 68} {"train_loss": -14.995635986328125, "global_step": 8261, "epoch": 68} {"train_loss": -16.65378761291504, "global_step": 8262, "epoch": 68} {"train_loss": -16.06504249572754, "global_step": 8263, "epoch": 68} {"train_loss": -16.823318481445312, "global_step": 8264, "epoch": 68} {"train_loss": -15.3530912399292, "global_step": 8265, "epoch": 68} {"train_loss": -16.896947860717773, "global_step": 8266, "epoch": 68} {"train_loss": -16.417295455932617, "global_step": 8267, "epoch": 68} {"train_loss": -16.158750534057617, "global_step": 8268, "epoch": 68} {"train_loss": -16.7542667388916, "global_step": 8269, "epoch": 68} {"train_loss": -17.382719039916992, "global_step": 8270, "epoch": 68} {"train_loss": -17.286130905151367, "global_step": 8271, "epoch": 68} {"train_loss": -17.22911262512207, "global_step": 8272, "epoch": 68} {"train_loss": -16.947114944458008, "global_step": 8273, "epoch": 68} {"train_loss": -17.59642219543457, "global_step": 8274, "epoch": 68} {"train_loss": -16.92758560180664, "global_step": 8275, "epoch": 68} {"train_loss": -17.238637924194336, "global_step": 8276, "epoch": 68} {"train_loss": -17.61659049987793, "global_step": 8277, "epoch": 68} {"train_loss": -17.731657028198242, "global_step": 8278, "epoch": 68} {"train_loss": -18.056854248046875, "global_step": 8279, "epoch": 68} {"train_loss": -17.43248176574707, "global_step": 8280, "epoch": 68} {"train_loss": -18.627065658569336, "global_step": 8281, "epoch": 68} {"train_loss": -18.835100173950195, "global_step": 8282, "epoch": 68} {"train_loss": -18.35304069519043, "global_step": 8283, "epoch": 68} {"train_loss": -19.379446029663086, "global_step": 8284, "epoch": 68} {"train_loss": -18.617263793945312, "global_step": 8285, "epoch": 68} {"train_loss": -19.800861358642578, "global_step": 8286, "epoch": 68} {"train_loss": -18.6730899810791, "global_step": 8287, "epoch": 68} {"train_loss": -16.5690975189209, "global_step": 8288, "epoch": 68} {"train_loss": -11.56402587890625, "global_step": 8289, "epoch": 68} {"train_loss": -17.911361694335938, "global_step": 8290, "epoch": 68} {"train_loss": -15.645401000976562, "global_step": 8291, "epoch": 68} {"train_loss": -18.650257110595703, "global_step": 8292, "epoch": 68} {"train_loss": -17.957050323486328, "global_step": 8293, "epoch": 68} {"train_loss": -18.165699005126953, "global_step": 8294, "epoch": 68} {"train_loss": -17.701852798461914, "global_step": 8295, "epoch": 68} {"train_loss": -18.82358169555664, "global_step": 8296, "epoch": 68} {"train_loss": -18.800537109375, "global_step": 8297, "epoch": 68} {"train_loss": -19.175992965698242, "global_step": 8298, "epoch": 68} {"train_loss": -19.06918716430664, "global_step": 8299, "epoch": 68} {"train_loss": -19.397123336791992, "global_step": 8300, "epoch": 68} {"train_loss": -19.3201961517334, "global_step": 8301, "epoch": 68} {"train_loss": -18.61018943786621, "global_step": 8302, "epoch": 68} {"train_loss": -19.6449031829834, "global_step": 8303, "epoch": 68} {"train_loss": -20.110071182250977, "global_step": 8304, "epoch": 68} {"train_loss": -19.977792739868164, "global_step": 8305, "epoch": 68} {"train_loss": -19.90485191345215, "global_step": 8306, "epoch": 68} {"train_loss": -18.6708984375, "global_step": 8307, "epoch": 68} {"train_loss": -17.908462524414062, "global_step": 8308, "epoch": 68} {"train_loss": -12.741209983825684, "global_step": 8309, "epoch": 68} {"train_loss": -15.738662719726562, "global_step": 8310, "epoch": 68} {"train_loss": -17.933683395385742, "global_step": 8311, "epoch": 68} {"train_loss": -20.065401077270508, "global_step": 8312, "epoch": 68} {"train_loss": -17.886518478393555, "global_step": 8313, "epoch": 68} {"train_loss": -18.436708450317383, "global_step": 8314, "epoch": 68} {"train_loss": -20.056638717651367, "global_step": 8315, "epoch": 68} {"train_loss": -19.657535552978516, "global_step": 8316, "epoch": 68} {"train_loss": -20.169673919677734, "global_step": 8317, "epoch": 68} {"train_loss": -19.20461082458496, "global_step": 8318, "epoch": 68} {"train_loss": -19.565105438232422, "global_step": 8319, "epoch": 68} {"train_loss": -18.34299087524414, "global_step": 8320, "epoch": 68} {"train_loss": -19.734729766845703, "global_step": 8321, "epoch": 68} {"train_loss": -19.435152053833008, "global_step": 8322, "epoch": 68} {"train_loss": -19.121469497680664, "global_step": 8323, "epoch": 68} {"train_loss": -19.206087112426758, "global_step": 8324, "epoch": 68} {"train_loss": -20.07730484008789, "global_step": 8325, "epoch": 68} {"train_loss": -19.286880493164062, "global_step": 8326, "epoch": 68} {"train_loss": -20.285253524780273, "global_step": 8327, "epoch": 68} {"train_loss": -19.62397575378418, "global_step": 8328, "epoch": 68} {"train_loss": -19.665245056152344, "global_step": 8329, "epoch": 68} {"train_loss": -19.638113021850586, "global_step": 8330, "epoch": 68} {"train_loss": -19.721193313598633, "global_step": 8331, "epoch": 68} {"train_loss": -20.06918716430664, "global_step": 8332, "epoch": 68} {"train_loss": -19.86147117614746, "global_step": 8333, "epoch": 68} {"train_loss": -19.44612693786621, "global_step": 8334, "epoch": 68} {"train_loss": -19.65015983581543, "global_step": 8335, "epoch": 68} {"train_loss": -20.09016227722168, "global_step": 8336, "epoch": 68} {"train_loss": -20.811798095703125, "global_step": 8337, "epoch": 68} {"train_loss": -20.306169509887695, "global_step": 8338, "epoch": 68} {"train_loss": -19.243581771850586, "global_step": 8339, "epoch": 68} {"train_loss": -20.6323184967041, "global_step": 8340, "epoch": 68} {"train_loss": -20.079498291015625, "global_step": 8341, "epoch": 68} {"train_loss": -20.069416046142578, "global_step": 8342, "epoch": 68} {"train_loss": -20.027048110961914, "global_step": 8343, "epoch": 68} {"train_loss": -20.309673309326172, "global_step": 8344, "epoch": 68} {"train_loss": -20.88893699645996, "global_step": 8345, "epoch": 68} {"train_loss": -20.645313262939453, "global_step": 8346, "epoch": 68} {"train_loss": -20.589033126831055, "global_step": 8347, "epoch": 68} {"train_loss": -16.86551661136722, "global_step": 8348, "epoch": 68, "val_loss": 3606580.75} {"train_loss": -21.11736297607422, "global_step": 8349, "epoch": 69} {"train_loss": -20.820194244384766, "global_step": 8350, "epoch": 69} {"train_loss": -21.181320190429688, "global_step": 8351, "epoch": 69} {"train_loss": -20.871679306030273, "global_step": 8352, "epoch": 69} {"train_loss": -21.16160011291504, "global_step": 8353, "epoch": 69} {"train_loss": -21.03285789489746, "global_step": 8354, "epoch": 69} {"train_loss": -21.432371139526367, "global_step": 8355, "epoch": 69} {"train_loss": -21.789011001586914, "global_step": 8356, "epoch": 69} {"train_loss": -21.508642196655273, "global_step": 8357, "epoch": 69} {"train_loss": -22.225204467773438, "global_step": 8358, "epoch": 69} {"train_loss": -21.8074951171875, "global_step": 8359, "epoch": 69} {"train_loss": -21.850706100463867, "global_step": 8360, "epoch": 69} {"train_loss": -21.382232666015625, "global_step": 8361, "epoch": 69} {"train_loss": -22.173295974731445, "global_step": 8362, "epoch": 69} {"train_loss": -21.801513671875, "global_step": 8363, "epoch": 69} {"train_loss": -22.048248291015625, "global_step": 8364, "epoch": 69} {"train_loss": -21.89314842224121, "global_step": 8365, "epoch": 69} {"train_loss": -21.77437400817871, "global_step": 8366, "epoch": 69} {"train_loss": -22.492738723754883, "global_step": 8367, "epoch": 69} {"train_loss": -22.480588912963867, "global_step": 8368, "epoch": 69} {"train_loss": -22.09285545349121, "global_step": 8369, "epoch": 69} {"train_loss": -22.663833618164062, "global_step": 8370, "epoch": 69} {"train_loss": -22.359220504760742, "global_step": 8371, "epoch": 69} {"train_loss": -22.53360939025879, "global_step": 8372, "epoch": 69} {"train_loss": -22.4330997467041, "global_step": 8373, "epoch": 69} {"train_loss": -22.01825714111328, "global_step": 8374, "epoch": 69} {"train_loss": -17.279314041137695, "global_step": 8375, "epoch": 69} {"train_loss": -8.020517349243164, "global_step": 8376, "epoch": 69} {"train_loss": -19.48386573791504, "global_step": 8377, "epoch": 69} {"train_loss": -17.65546989440918, "global_step": 8378, "epoch": 69} {"train_loss": -20.637435913085938, "global_step": 8379, "epoch": 69} {"train_loss": -20.98788833618164, "global_step": 8380, "epoch": 69} {"train_loss": -19.981487274169922, "global_step": 8381, "epoch": 69} {"train_loss": -19.8953914642334, "global_step": 8382, "epoch": 69} {"train_loss": -20.25423812866211, "global_step": 8383, "epoch": 69} {"train_loss": -21.26650047302246, "global_step": 8384, "epoch": 69} {"train_loss": -21.574689865112305, "global_step": 8385, "epoch": 69} {"train_loss": -21.487180709838867, "global_step": 8386, "epoch": 69} {"train_loss": -21.04169464111328, "global_step": 8387, "epoch": 69} {"train_loss": -20.930078506469727, "global_step": 8388, "epoch": 69} {"train_loss": -21.12604331970215, "global_step": 8389, "epoch": 69} {"train_loss": -21.192049026489258, "global_step": 8390, "epoch": 69} {"train_loss": -20.15411949157715, "global_step": 8391, "epoch": 69} {"train_loss": -20.061084747314453, "global_step": 8392, "epoch": 69} {"train_loss": -20.14093017578125, "global_step": 8393, "epoch": 69} {"train_loss": -20.567218780517578, "global_step": 8394, "epoch": 69} {"train_loss": -21.182531356811523, "global_step": 8395, "epoch": 69} {"train_loss": -21.6262264251709, "global_step": 8396, "epoch": 69} {"train_loss": -21.329919815063477, "global_step": 8397, "epoch": 69} {"train_loss": -21.632062911987305, "global_step": 8398, "epoch": 69} {"train_loss": -20.902685165405273, "global_step": 8399, "epoch": 69} {"train_loss": -21.13434600830078, "global_step": 8400, "epoch": 69} {"train_loss": -21.00180435180664, "global_step": 8401, "epoch": 69} {"train_loss": -21.66343116760254, "global_step": 8402, "epoch": 69} {"train_loss": -21.692495346069336, "global_step": 8403, "epoch": 69} {"train_loss": -21.821678161621094, "global_step": 8404, "epoch": 69} {"train_loss": -21.65049171447754, "global_step": 8405, "epoch": 69} {"train_loss": -21.232019424438477, "global_step": 8406, "epoch": 69} {"train_loss": -21.43787384033203, "global_step": 8407, "epoch": 69} {"train_loss": -20.829824447631836, "global_step": 8408, "epoch": 69} {"train_loss": -21.07794952392578, "global_step": 8409, "epoch": 69} {"train_loss": -21.697477340698242, "global_step": 8410, "epoch": 69} {"train_loss": -21.45710563659668, "global_step": 8411, "epoch": 69} {"train_loss": -21.327939987182617, "global_step": 8412, "epoch": 69} {"train_loss": -22.20897674560547, "global_step": 8413, "epoch": 69} {"train_loss": -21.44869613647461, "global_step": 8414, "epoch": 69} {"train_loss": -21.54068374633789, "global_step": 8415, "epoch": 69} {"train_loss": -21.574865341186523, "global_step": 8416, "epoch": 69} {"train_loss": -21.831478118896484, "global_step": 8417, "epoch": 69} {"train_loss": -22.267074584960938, "global_step": 8418, "epoch": 69} {"train_loss": -20.746191024780273, "global_step": 8419, "epoch": 69} {"train_loss": -21.63217544555664, "global_step": 8420, "epoch": 69} {"train_loss": -21.44253158569336, "global_step": 8421, "epoch": 69} {"train_loss": -21.18466567993164, "global_step": 8422, "epoch": 69} {"train_loss": -21.407764434814453, "global_step": 8423, "epoch": 69} {"train_loss": -21.606245040893555, "global_step": 8424, "epoch": 69} {"train_loss": -22.163982391357422, "global_step": 8425, "epoch": 69} {"train_loss": -21.28633689880371, "global_step": 8426, "epoch": 69} {"train_loss": -21.78304100036621, "global_step": 8427, "epoch": 69} {"train_loss": -20.179067611694336, "global_step": 8428, "epoch": 69} {"train_loss": -17.565961837768555, "global_step": 8429, "epoch": 69} {"train_loss": -16.01955223083496, "global_step": 8430, "epoch": 69} {"train_loss": -17.493436813354492, "global_step": 8431, "epoch": 69} {"train_loss": -18.153106689453125, "global_step": 8432, "epoch": 69} {"train_loss": -20.79774284362793, "global_step": 8433, "epoch": 69} {"train_loss": -20.560832977294922, "global_step": 8434, "epoch": 69} {"train_loss": -20.922624588012695, "global_step": 8435, "epoch": 69} {"train_loss": -20.75221061706543, "global_step": 8436, "epoch": 69} {"train_loss": -20.079866409301758, "global_step": 8437, "epoch": 69} {"train_loss": -20.90463638305664, "global_step": 8438, "epoch": 69} {"train_loss": -20.57270050048828, "global_step": 8439, "epoch": 69} {"train_loss": -20.968311309814453, "global_step": 8440, "epoch": 69} {"train_loss": -21.451223373413086, "global_step": 8441, "epoch": 69} {"train_loss": -21.017850875854492, "global_step": 8442, "epoch": 69} {"train_loss": -21.205556869506836, "global_step": 8443, "epoch": 69} {"train_loss": -21.1054744720459, "global_step": 8444, "epoch": 69} {"train_loss": -21.25750160217285, "global_step": 8445, "epoch": 69} {"train_loss": -21.633604049682617, "global_step": 8446, "epoch": 69} {"train_loss": -21.272628784179688, "global_step": 8447, "epoch": 69} {"train_loss": -21.627988815307617, "global_step": 8448, "epoch": 69} {"train_loss": -21.388364791870117, "global_step": 8449, "epoch": 69} {"train_loss": -21.27492332458496, "global_step": 8450, "epoch": 69} {"train_loss": -21.8580379486084, "global_step": 8451, "epoch": 69} {"train_loss": -21.307523727416992, "global_step": 8452, "epoch": 69} {"train_loss": -21.046979904174805, "global_step": 8453, "epoch": 69} {"train_loss": -21.639324188232422, "global_step": 8454, "epoch": 69} {"train_loss": -21.542333602905273, "global_step": 8455, "epoch": 69} {"train_loss": -21.638090133666992, "global_step": 8456, "epoch": 69} {"train_loss": -21.73359489440918, "global_step": 8457, "epoch": 69} {"train_loss": -21.05043601989746, "global_step": 8458, "epoch": 69} {"train_loss": -21.213972091674805, "global_step": 8459, "epoch": 69} {"train_loss": -22.079015731811523, "global_step": 8460, "epoch": 69} {"train_loss": -21.98044776916504, "global_step": 8461, "epoch": 69} {"train_loss": -21.638395309448242, "global_step": 8462, "epoch": 69} {"train_loss": -22.24471092224121, "global_step": 8463, "epoch": 69} {"train_loss": -22.32029151916504, "global_step": 8464, "epoch": 69} {"train_loss": -22.17194938659668, "global_step": 8465, "epoch": 69} {"train_loss": -22.288925170898438, "global_step": 8466, "epoch": 69} {"train_loss": -22.30733299255371, "global_step": 8467, "epoch": 69} {"train_loss": -22.11518669128418, "global_step": 8468, "epoch": 69} {"train_loss": -21.092468892247222, "global_step": 8469, "epoch": 69, "val_loss": 3413144.25} {"train_loss": -22.597333908081055, "global_step": 8470, "epoch": 70} {"train_loss": -22.292341232299805, "global_step": 8471, "epoch": 70} {"train_loss": -22.525632858276367, "global_step": 8472, "epoch": 70} {"train_loss": -22.3087100982666, "global_step": 8473, "epoch": 70} {"train_loss": -22.26177978515625, "global_step": 8474, "epoch": 70} {"train_loss": -22.17045021057129, "global_step": 8475, "epoch": 70} {"train_loss": -22.75797462463379, "global_step": 8476, "epoch": 70} {"train_loss": -22.530881881713867, "global_step": 8477, "epoch": 70} {"train_loss": -23.338333129882812, "global_step": 8478, "epoch": 70} {"train_loss": -22.335979461669922, "global_step": 8479, "epoch": 70} {"train_loss": -23.367856979370117, "global_step": 8480, "epoch": 70} {"train_loss": -22.94013023376465, "global_step": 8481, "epoch": 70} {"train_loss": -23.354238510131836, "global_step": 8482, "epoch": 70} {"train_loss": -23.39249610900879, "global_step": 8483, "epoch": 70} {"train_loss": -23.153240203857422, "global_step": 8484, "epoch": 70} {"train_loss": -23.67409324645996, "global_step": 8485, "epoch": 70} {"train_loss": -22.953004837036133, "global_step": 8486, "epoch": 70} {"train_loss": -23.589147567749023, "global_step": 8487, "epoch": 70} {"train_loss": -23.324254989624023, "global_step": 8488, "epoch": 70} {"train_loss": -23.49493408203125, "global_step": 8489, "epoch": 70} {"train_loss": -23.64112663269043, "global_step": 8490, "epoch": 70} {"train_loss": -23.132652282714844, "global_step": 8491, "epoch": 70} {"train_loss": -22.759185791015625, "global_step": 8492, "epoch": 70} {"train_loss": -17.28663444519043, "global_step": 8493, "epoch": 70} {"train_loss": 16.3619327545166, "global_step": 8494, "epoch": 70} {"train_loss": 27.318689346313477, "global_step": 8495, "epoch": 70} {"train_loss": -15.455551147460938, "global_step": 8496, "epoch": 70} {"train_loss": -17.00440788269043, "global_step": 8497, "epoch": 70} {"train_loss": -6.488687992095947, "global_step": 8498, "epoch": 70} {"train_loss": -12.387810707092285, "global_step": 8499, "epoch": 70} {"train_loss": -17.600934982299805, "global_step": 8500, "epoch": 70} {"train_loss": -19.58502960205078, "global_step": 8501, "epoch": 70} {"train_loss": -19.983171463012695, "global_step": 8502, "epoch": 70} {"train_loss": -20.01334571838379, "global_step": 8503, "epoch": 70} {"train_loss": -19.330673217773438, "global_step": 8504, "epoch": 70} {"train_loss": -19.135942459106445, "global_step": 8505, "epoch": 70} {"train_loss": -18.69509506225586, "global_step": 8506, "epoch": 70} {"train_loss": -18.48444938659668, "global_step": 8507, "epoch": 70} {"train_loss": -19.474586486816406, "global_step": 8508, "epoch": 70} {"train_loss": -18.8715763092041, "global_step": 8509, "epoch": 70} {"train_loss": -19.424091339111328, "global_step": 8510, "epoch": 70} {"train_loss": -19.61481285095215, "global_step": 8511, "epoch": 70} {"train_loss": -19.62186622619629, "global_step": 8512, "epoch": 70} {"train_loss": -19.287031173706055, "global_step": 8513, "epoch": 70} {"train_loss": -20.0137996673584, "global_step": 8514, "epoch": 70} {"train_loss": -19.973072052001953, "global_step": 8515, "epoch": 70} {"train_loss": -20.164039611816406, "global_step": 8516, "epoch": 70} {"train_loss": -20.141115188598633, "global_step": 8517, "epoch": 70} {"train_loss": -20.49489402770996, "global_step": 8518, "epoch": 70} {"train_loss": -20.05891227722168, "global_step": 8519, "epoch": 70} {"train_loss": -20.78019142150879, "global_step": 8520, "epoch": 70} {"train_loss": -20.126541137695312, "global_step": 8521, "epoch": 70} {"train_loss": -20.212848663330078, "global_step": 8522, "epoch": 70} {"train_loss": -20.310928344726562, "global_step": 8523, "epoch": 70} {"train_loss": -20.904037475585938, "global_step": 8524, "epoch": 70} {"train_loss": -20.548547744750977, "global_step": 8525, "epoch": 70} {"train_loss": -21.012470245361328, "global_step": 8526, "epoch": 70} {"train_loss": -20.585464477539062, "global_step": 8527, "epoch": 70} {"train_loss": -20.741168975830078, "global_step": 8528, "epoch": 70} {"train_loss": -20.434467315673828, "global_step": 8529, "epoch": 70} {"train_loss": -20.983488082885742, "global_step": 8530, "epoch": 70} {"train_loss": -20.60845375061035, "global_step": 8531, "epoch": 70} {"train_loss": -20.874469757080078, "global_step": 8532, "epoch": 70} {"train_loss": -20.936237335205078, "global_step": 8533, "epoch": 70} {"train_loss": -21.016050338745117, "global_step": 8534, "epoch": 70} {"train_loss": -20.50362777709961, "global_step": 8535, "epoch": 70} {"train_loss": -21.328664779663086, "global_step": 8536, "epoch": 70} {"train_loss": -21.443099975585938, "global_step": 8537, "epoch": 70} {"train_loss": -21.930173873901367, "global_step": 8538, "epoch": 70} {"train_loss": -20.320283889770508, "global_step": 8539, "epoch": 70} {"train_loss": -21.697673797607422, "global_step": 8540, "epoch": 70} {"train_loss": -21.061538696289062, "global_step": 8541, "epoch": 70} {"train_loss": -21.205930709838867, "global_step": 8542, "epoch": 70} {"train_loss": -20.879228591918945, "global_step": 8543, "epoch": 70} {"train_loss": -21.26825714111328, "global_step": 8544, "epoch": 70} {"train_loss": -21.04509925842285, "global_step": 8545, "epoch": 70} {"train_loss": -20.594900131225586, "global_step": 8546, "epoch": 70} {"train_loss": -18.614065170288086, "global_step": 8547, "epoch": 70} {"train_loss": -17.30585289001465, "global_step": 8548, "epoch": 70} {"train_loss": -19.930063247680664, "global_step": 8549, "epoch": 70} {"train_loss": -21.383018493652344, "global_step": 8550, "epoch": 70} {"train_loss": -19.85927963256836, "global_step": 8551, "epoch": 70} {"train_loss": -21.51696014404297, "global_step": 8552, "epoch": 70} {"train_loss": -20.573881149291992, "global_step": 8553, "epoch": 70} {"train_loss": -21.399951934814453, "global_step": 8554, "epoch": 70} {"train_loss": -20.17107582092285, "global_step": 8555, "epoch": 70} {"train_loss": -20.785951614379883, "global_step": 8556, "epoch": 70} {"train_loss": -21.146451950073242, "global_step": 8557, "epoch": 70} {"train_loss": -20.29660987854004, "global_step": 8558, "epoch": 70} {"train_loss": -21.12958526611328, "global_step": 8559, "epoch": 70} {"train_loss": -20.922592163085938, "global_step": 8560, "epoch": 70} {"train_loss": -21.008020401000977, "global_step": 8561, "epoch": 70} {"train_loss": -21.194290161132812, "global_step": 8562, "epoch": 70} {"train_loss": -21.60586929321289, "global_step": 8563, "epoch": 70} {"train_loss": -21.039613723754883, "global_step": 8564, "epoch": 70} {"train_loss": -21.075271606445312, "global_step": 8565, "epoch": 70} {"train_loss": -21.15013313293457, "global_step": 8566, "epoch": 70} {"train_loss": -18.629697799682617, "global_step": 8567, "epoch": 70} {"train_loss": -14.990450859069824, "global_step": 8568, "epoch": 70} {"train_loss": -5.793665409088135, "global_step": 8569, "epoch": 70} {"train_loss": -14.920111656188965, "global_step": 8570, "epoch": 70} {"train_loss": -16.2333984375, "global_step": 8571, "epoch": 70} {"train_loss": -21.02642822265625, "global_step": 8572, "epoch": 70} {"train_loss": -16.671960830688477, "global_step": 8573, "epoch": 70} {"train_loss": -16.908105850219727, "global_step": 8574, "epoch": 70} {"train_loss": -19.508045196533203, "global_step": 8575, "epoch": 70} {"train_loss": -20.57052230834961, "global_step": 8576, "epoch": 70} {"train_loss": -20.165781021118164, "global_step": 8577, "epoch": 70} {"train_loss": -19.392539978027344, "global_step": 8578, "epoch": 70} {"train_loss": -19.968870162963867, "global_step": 8579, "epoch": 70} {"train_loss": -19.271360397338867, "global_step": 8580, "epoch": 70} {"train_loss": -19.839872360229492, "global_step": 8581, "epoch": 70} {"train_loss": -19.58448600769043, "global_step": 8582, "epoch": 70} {"train_loss": -19.906110763549805, "global_step": 8583, "epoch": 70} {"train_loss": -20.099515914916992, "global_step": 8584, "epoch": 70} {"train_loss": -19.837671279907227, "global_step": 8585, "epoch": 70} {"train_loss": -20.685129165649414, "global_step": 8586, "epoch": 70} {"train_loss": -20.095218658447266, "global_step": 8587, "epoch": 70} {"train_loss": -19.518592834472656, "global_step": 8588, "epoch": 70} {"train_loss": -19.71567726135254, "global_step": 8589, "epoch": 70} {"train_loss": -19.516534048663683, "global_step": 8590, "epoch": 70, "val_loss": 2796222.25} {"train_loss": -20.473997116088867, "global_step": 8591, "epoch": 71} {"train_loss": -20.134796142578125, "global_step": 8592, "epoch": 71} {"train_loss": -19.879846572875977, "global_step": 8593, "epoch": 71} {"train_loss": -20.394216537475586, "global_step": 8594, "epoch": 71} {"train_loss": -19.712594985961914, "global_step": 8595, "epoch": 71} {"train_loss": -20.890172958374023, "global_step": 8596, "epoch": 71} {"train_loss": -19.828969955444336, "global_step": 8597, "epoch": 71} {"train_loss": -20.62244987487793, "global_step": 8598, "epoch": 71} {"train_loss": -20.661602020263672, "global_step": 8599, "epoch": 71} {"train_loss": -19.767541885375977, "global_step": 8600, "epoch": 71} {"train_loss": -20.759361267089844, "global_step": 8601, "epoch": 71} {"train_loss": -20.308692932128906, "global_step": 8602, "epoch": 71} {"train_loss": -20.738874435424805, "global_step": 8603, "epoch": 71} {"train_loss": -20.939924240112305, "global_step": 8604, "epoch": 71} {"train_loss": -21.241697311401367, "global_step": 8605, "epoch": 71} {"train_loss": -21.0006160736084, "global_step": 8606, "epoch": 71} {"train_loss": -20.03619956970215, "global_step": 8607, "epoch": 71} {"train_loss": -21.009069442749023, "global_step": 8608, "epoch": 71} {"train_loss": -20.339752197265625, "global_step": 8609, "epoch": 71} {"train_loss": -20.837888717651367, "global_step": 8610, "epoch": 71} {"train_loss": -21.181615829467773, "global_step": 8611, "epoch": 71} {"train_loss": -20.591337203979492, "global_step": 8612, "epoch": 71} {"train_loss": -20.892004013061523, "global_step": 8613, "epoch": 71} {"train_loss": -20.63576316833496, "global_step": 8614, "epoch": 71} {"train_loss": -20.985715866088867, "global_step": 8615, "epoch": 71} {"train_loss": -20.754369735717773, "global_step": 8616, "epoch": 71} {"train_loss": -20.232440948486328, "global_step": 8617, "epoch": 71} {"train_loss": -20.42032814025879, "global_step": 8618, "epoch": 71} {"train_loss": -20.036230087280273, "global_step": 8619, "epoch": 71} {"train_loss": -20.80557632446289, "global_step": 8620, "epoch": 71} {"train_loss": -20.661474227905273, "global_step": 8621, "epoch": 71} {"train_loss": -20.89198112487793, "global_step": 8622, "epoch": 71} {"train_loss": -20.94156837463379, "global_step": 8623, "epoch": 71} {"train_loss": -21.100839614868164, "global_step": 8624, "epoch": 71} {"train_loss": -21.421100616455078, "global_step": 8625, "epoch": 71} {"train_loss": -21.289579391479492, "global_step": 8626, "epoch": 71} {"train_loss": -20.600759506225586, "global_step": 8627, "epoch": 71} {"train_loss": -20.836881637573242, "global_step": 8628, "epoch": 71} {"train_loss": -21.76226043701172, "global_step": 8629, "epoch": 71} {"train_loss": -21.313764572143555, "global_step": 8630, "epoch": 71} {"train_loss": -21.2879695892334, "global_step": 8631, "epoch": 71} {"train_loss": -20.9110050201416, "global_step": 8632, "epoch": 71} {"train_loss": -21.421873092651367, "global_step": 8633, "epoch": 71} {"train_loss": -20.946523666381836, "global_step": 8634, "epoch": 71} {"train_loss": -20.253679275512695, "global_step": 8635, "epoch": 71} {"train_loss": -20.590391159057617, "global_step": 8636, "epoch": 71} {"train_loss": -21.11837387084961, "global_step": 8637, "epoch": 71} {"train_loss": -20.61406707763672, "global_step": 8638, "epoch": 71} {"train_loss": -21.029911041259766, "global_step": 8639, "epoch": 71} {"train_loss": -20.329458236694336, "global_step": 8640, "epoch": 71} {"train_loss": -17.997121810913086, "global_step": 8641, "epoch": 71} {"train_loss": -12.538080215454102, "global_step": 8642, "epoch": 71} {"train_loss": -11.406938552856445, "global_step": 8643, "epoch": 71} {"train_loss": -20.59615135192871, "global_step": 8644, "epoch": 71} {"train_loss": -16.751501083374023, "global_step": 8645, "epoch": 71} {"train_loss": -19.684446334838867, "global_step": 8646, "epoch": 71} {"train_loss": -19.899553298950195, "global_step": 8647, "epoch": 71} {"train_loss": -18.855249404907227, "global_step": 8648, "epoch": 71} {"train_loss": -19.77333641052246, "global_step": 8649, "epoch": 71} {"train_loss": -20.475317001342773, "global_step": 8650, "epoch": 71} {"train_loss": -20.806074142456055, "global_step": 8651, "epoch": 71} {"train_loss": -19.83915138244629, "global_step": 8652, "epoch": 71} {"train_loss": -18.92047882080078, "global_step": 8653, "epoch": 71} {"train_loss": -19.920795440673828, "global_step": 8654, "epoch": 71} {"train_loss": -20.417394638061523, "global_step": 8655, "epoch": 71} {"train_loss": -20.8966064453125, "global_step": 8656, "epoch": 71} {"train_loss": -21.122726440429688, "global_step": 8657, "epoch": 71} {"train_loss": -20.76215934753418, "global_step": 8658, "epoch": 71} {"train_loss": -20.448843002319336, "global_step": 8659, "epoch": 71} {"train_loss": -20.000356674194336, "global_step": 8660, "epoch": 71} {"train_loss": -19.867416381835938, "global_step": 8661, "epoch": 71} {"train_loss": -20.976057052612305, "global_step": 8662, "epoch": 71} {"train_loss": -21.052743911743164, "global_step": 8663, "epoch": 71} {"train_loss": -20.70121192932129, "global_step": 8664, "epoch": 71} {"train_loss": -20.358352661132812, "global_step": 8665, "epoch": 71} {"train_loss": -20.019933700561523, "global_step": 8666, "epoch": 71} {"train_loss": -20.907922744750977, "global_step": 8667, "epoch": 71} {"train_loss": -20.896499633789062, "global_step": 8668, "epoch": 71} {"train_loss": -20.936979293823242, "global_step": 8669, "epoch": 71} {"train_loss": -20.845178604125977, "global_step": 8670, "epoch": 71} {"train_loss": -20.39991569519043, "global_step": 8671, "epoch": 71} {"train_loss": -20.380050659179688, "global_step": 8672, "epoch": 71} {"train_loss": -20.25258445739746, "global_step": 8673, "epoch": 71} {"train_loss": -20.70364761352539, "global_step": 8674, "epoch": 71} {"train_loss": -20.75836753845215, "global_step": 8675, "epoch": 71} {"train_loss": -20.405319213867188, "global_step": 8676, "epoch": 71} {"train_loss": -20.9141902923584, "global_step": 8677, "epoch": 71} {"train_loss": -20.372791290283203, "global_step": 8678, "epoch": 71} {"train_loss": -20.82781219482422, "global_step": 8679, "epoch": 71} {"train_loss": -21.186325073242188, "global_step": 8680, "epoch": 71} {"train_loss": -21.525043487548828, "global_step": 8681, "epoch": 71} {"train_loss": -20.423202514648438, "global_step": 8682, "epoch": 71} {"train_loss": -20.498783111572266, "global_step": 8683, "epoch": 71} {"train_loss": -20.912233352661133, "global_step": 8684, "epoch": 71} {"train_loss": -20.60972023010254, "global_step": 8685, "epoch": 71} {"train_loss": -21.458120346069336, "global_step": 8686, "epoch": 71} {"train_loss": -21.373233795166016, "global_step": 8687, "epoch": 71} {"train_loss": -21.484712600708008, "global_step": 8688, "epoch": 71} {"train_loss": -21.732681274414062, "global_step": 8689, "epoch": 71} {"train_loss": -21.787668228149414, "global_step": 8690, "epoch": 71} {"train_loss": -21.79652214050293, "global_step": 8691, "epoch": 71} {"train_loss": -21.295621871948242, "global_step": 8692, "epoch": 71} {"train_loss": -21.294763565063477, "global_step": 8693, "epoch": 71} {"train_loss": -21.415529251098633, "global_step": 8694, "epoch": 71} {"train_loss": -21.777833938598633, "global_step": 8695, "epoch": 71} {"train_loss": -21.949371337890625, "global_step": 8696, "epoch": 71} {"train_loss": -21.91892433166504, "global_step": 8697, "epoch": 71} {"train_loss": -21.89920997619629, "global_step": 8698, "epoch": 71} {"train_loss": -21.950748443603516, "global_step": 8699, "epoch": 71} {"train_loss": -21.868873596191406, "global_step": 8700, "epoch": 71} {"train_loss": -21.847177505493164, "global_step": 8701, "epoch": 71} {"train_loss": -21.194562911987305, "global_step": 8702, "epoch": 71} {"train_loss": -21.556974411010742, "global_step": 8703, "epoch": 71} {"train_loss": -21.78656578063965, "global_step": 8704, "epoch": 71} {"train_loss": -21.761032104492188, "global_step": 8705, "epoch": 71} {"train_loss": -22.024805068969727, "global_step": 8706, "epoch": 71} {"train_loss": -22.031030654907227, "global_step": 8707, "epoch": 71} {"train_loss": -22.321523666381836, "global_step": 8708, "epoch": 71} {"train_loss": -22.067161560058594, "global_step": 8709, "epoch": 71} {"train_loss": -22.37572479248047, "global_step": 8710, "epoch": 71} {"train_loss": -20.655672987630545, "global_step": 8711, "epoch": 71, "val_loss": 2902355.25} {"train_loss": -22.27166748046875, "global_step": 8712, "epoch": 72} {"train_loss": -22.493070602416992, "global_step": 8713, "epoch": 72} {"train_loss": -22.484731674194336, "global_step": 8714, "epoch": 72} {"train_loss": -21.906068801879883, "global_step": 8715, "epoch": 72} {"train_loss": -22.689044952392578, "global_step": 8716, "epoch": 72} {"train_loss": -22.532102584838867, "global_step": 8717, "epoch": 72} {"train_loss": -22.432693481445312, "global_step": 8718, "epoch": 72} {"train_loss": -22.493783950805664, "global_step": 8719, "epoch": 72} {"train_loss": -22.293569564819336, "global_step": 8720, "epoch": 72} {"train_loss": -22.502674102783203, "global_step": 8721, "epoch": 72} {"train_loss": -22.74152183532715, "global_step": 8722, "epoch": 72} {"train_loss": -22.33624267578125, "global_step": 8723, "epoch": 72} {"train_loss": -22.82964515686035, "global_step": 8724, "epoch": 72} {"train_loss": -22.630878448486328, "global_step": 8725, "epoch": 72} {"train_loss": -22.702072143554688, "global_step": 8726, "epoch": 72} {"train_loss": -21.86884117126465, "global_step": 8727, "epoch": 72} {"train_loss": -22.641162872314453, "global_step": 8728, "epoch": 72} {"train_loss": -22.316848754882812, "global_step": 8729, "epoch": 72} {"train_loss": -23.02859878540039, "global_step": 8730, "epoch": 72} {"train_loss": -23.51087188720703, "global_step": 8731, "epoch": 72} {"train_loss": -22.599578857421875, "global_step": 8732, "epoch": 72} {"train_loss": -22.501806259155273, "global_step": 8733, "epoch": 72} {"train_loss": -22.909902572631836, "global_step": 8734, "epoch": 72} {"train_loss": -22.181262969970703, "global_step": 8735, "epoch": 72} {"train_loss": -22.824539184570312, "global_step": 8736, "epoch": 72} {"train_loss": -22.566654205322266, "global_step": 8737, "epoch": 72} {"train_loss": -23.039663314819336, "global_step": 8738, "epoch": 72} {"train_loss": -22.66219139099121, "global_step": 8739, "epoch": 72} {"train_loss": -22.83718490600586, "global_step": 8740, "epoch": 72} {"train_loss": -23.073270797729492, "global_step": 8741, "epoch": 72} {"train_loss": -22.593957901000977, "global_step": 8742, "epoch": 72} {"train_loss": -22.70295524597168, "global_step": 8743, "epoch": 72} {"train_loss": -23.080957412719727, "global_step": 8744, "epoch": 72} {"train_loss": -21.36318016052246, "global_step": 8745, "epoch": 72} {"train_loss": -22.156036376953125, "global_step": 8746, "epoch": 72} {"train_loss": -23.04460906982422, "global_step": 8747, "epoch": 72} {"train_loss": -21.38287925720215, "global_step": 8748, "epoch": 72} {"train_loss": -20.606712341308594, "global_step": 8749, "epoch": 72} {"train_loss": -16.627910614013672, "global_step": 8750, "epoch": 72} {"train_loss": -12.534944534301758, "global_step": 8751, "epoch": 72} {"train_loss": -13.028633117675781, "global_step": 8752, "epoch": 72} {"train_loss": -20.886240005493164, "global_step": 8753, "epoch": 72} {"train_loss": -15.815912246704102, "global_step": 8754, "epoch": 72} {"train_loss": -20.823217391967773, "global_step": 8755, "epoch": 72} {"train_loss": -21.216251373291016, "global_step": 8756, "epoch": 72} {"train_loss": -19.694026947021484, "global_step": 8757, "epoch": 72} {"train_loss": -20.700895309448242, "global_step": 8758, "epoch": 72} {"train_loss": -20.788129806518555, "global_step": 8759, "epoch": 72} {"train_loss": -20.646726608276367, "global_step": 8760, "epoch": 72} {"train_loss": -20.990320205688477, "global_step": 8761, "epoch": 72} {"train_loss": -20.021825790405273, "global_step": 8762, "epoch": 72} {"train_loss": -20.7426815032959, "global_step": 8763, "epoch": 72} {"train_loss": -21.294797897338867, "global_step": 8764, "epoch": 72} {"train_loss": -20.955158233642578, "global_step": 8765, "epoch": 72} {"train_loss": -20.899188995361328, "global_step": 8766, "epoch": 72} {"train_loss": -21.250354766845703, "global_step": 8767, "epoch": 72} {"train_loss": -21.188169479370117, "global_step": 8768, "epoch": 72} {"train_loss": -21.025604248046875, "global_step": 8769, "epoch": 72} {"train_loss": -20.88700294494629, "global_step": 8770, "epoch": 72} {"train_loss": -21.305377960205078, "global_step": 8771, "epoch": 72} {"train_loss": -20.791004180908203, "global_step": 8772, "epoch": 72} {"train_loss": -20.962942123413086, "global_step": 8773, "epoch": 72} {"train_loss": -21.359333038330078, "global_step": 8774, "epoch": 72} {"train_loss": -21.491024017333984, "global_step": 8775, "epoch": 72} {"train_loss": -21.520994186401367, "global_step": 8776, "epoch": 72} {"train_loss": -21.441347122192383, "global_step": 8777, "epoch": 72} {"train_loss": -21.524017333984375, "global_step": 8778, "epoch": 72} {"train_loss": -21.268354415893555, "global_step": 8779, "epoch": 72} {"train_loss": -21.772357940673828, "global_step": 8780, "epoch": 72} {"train_loss": -21.553455352783203, "global_step": 8781, "epoch": 72} {"train_loss": -21.634265899658203, "global_step": 8782, "epoch": 72} {"train_loss": -21.659849166870117, "global_step": 8783, "epoch": 72} {"train_loss": -21.323890686035156, "global_step": 8784, "epoch": 72} {"train_loss": -21.693689346313477, "global_step": 8785, "epoch": 72} {"train_loss": -21.937475204467773, "global_step": 8786, "epoch": 72} {"train_loss": -21.302976608276367, "global_step": 8787, "epoch": 72} {"train_loss": -21.539230346679688, "global_step": 8788, "epoch": 72} {"train_loss": -21.741191864013672, "global_step": 8789, "epoch": 72} {"train_loss": -21.97845458984375, "global_step": 8790, "epoch": 72} {"train_loss": -21.870704650878906, "global_step": 8791, "epoch": 72} {"train_loss": -21.73396873474121, "global_step": 8792, "epoch": 72} {"train_loss": -21.548023223876953, "global_step": 8793, "epoch": 72} {"train_loss": -22.047670364379883, "global_step": 8794, "epoch": 72} {"train_loss": -21.783432006835938, "global_step": 8795, "epoch": 72} {"train_loss": -20.946537017822266, "global_step": 8796, "epoch": 72} {"train_loss": -22.058433532714844, "global_step": 8797, "epoch": 72} {"train_loss": -22.35761833190918, "global_step": 8798, "epoch": 72} {"train_loss": -21.443185806274414, "global_step": 8799, "epoch": 72} {"train_loss": -22.17745018005371, "global_step": 8800, "epoch": 72} {"train_loss": -22.19252586364746, "global_step": 8801, "epoch": 72} {"train_loss": -22.197961807250977, "global_step": 8802, "epoch": 72} {"train_loss": -22.071842193603516, "global_step": 8803, "epoch": 72} {"train_loss": -21.920270919799805, "global_step": 8804, "epoch": 72} {"train_loss": -22.066181182861328, "global_step": 8805, "epoch": 72} {"train_loss": -21.939231872558594, "global_step": 8806, "epoch": 72} {"train_loss": -21.775236129760742, "global_step": 8807, "epoch": 72} {"train_loss": -21.014928817749023, "global_step": 8808, "epoch": 72} {"train_loss": -20.68040657043457, "global_step": 8809, "epoch": 72} {"train_loss": -22.133596420288086, "global_step": 8810, "epoch": 72} {"train_loss": -21.807104110717773, "global_step": 8811, "epoch": 72} {"train_loss": -20.2766170501709, "global_step": 8812, "epoch": 72} {"train_loss": -22.679323196411133, "global_step": 8813, "epoch": 72} {"train_loss": -20.081159591674805, "global_step": 8814, "epoch": 72} {"train_loss": -20.56130027770996, "global_step": 8815, "epoch": 72} {"train_loss": -21.598257064819336, "global_step": 8816, "epoch": 72} {"train_loss": -20.798828125, "global_step": 8817, "epoch": 72} {"train_loss": -21.80768394470215, "global_step": 8818, "epoch": 72} {"train_loss": -21.18798828125, "global_step": 8819, "epoch": 72} {"train_loss": -21.959747314453125, "global_step": 8820, "epoch": 72} {"train_loss": -21.644901275634766, "global_step": 8821, "epoch": 72} {"train_loss": -21.9215087890625, "global_step": 8822, "epoch": 72} {"train_loss": -22.387731552124023, "global_step": 8823, "epoch": 72} {"train_loss": -21.863813400268555, "global_step": 8824, "epoch": 72} {"train_loss": -22.461267471313477, "global_step": 8825, "epoch": 72} {"train_loss": -22.316946029663086, "global_step": 8826, "epoch": 72} {"train_loss": -22.02936363220215, "global_step": 8827, "epoch": 72} {"train_loss": -22.56369972229004, "global_step": 8828, "epoch": 72} {"train_loss": -22.45772933959961, "global_step": 8829, "epoch": 72} {"train_loss": -22.33699607849121, "global_step": 8830, "epoch": 72} {"train_loss": -22.6864070892334, "global_step": 8831, "epoch": 72} {"train_loss": -21.591888017890867, "global_step": 8832, "epoch": 72, "val_loss": 2483930.0} {"train_loss": -22.563356399536133, "global_step": 8833, "epoch": 73} {"train_loss": -22.453296661376953, "global_step": 8834, "epoch": 73} {"train_loss": -23.005834579467773, "global_step": 8835, "epoch": 73} {"train_loss": -22.54313850402832, "global_step": 8836, "epoch": 73} {"train_loss": -22.75593376159668, "global_step": 8837, "epoch": 73} {"train_loss": -22.791139602661133, "global_step": 8838, "epoch": 73} {"train_loss": -22.29714584350586, "global_step": 8839, "epoch": 73} {"train_loss": -22.89476203918457, "global_step": 8840, "epoch": 73} {"train_loss": -22.74134635925293, "global_step": 8841, "epoch": 73} {"train_loss": -22.272397994995117, "global_step": 8842, "epoch": 73} {"train_loss": -22.47023582458496, "global_step": 8843, "epoch": 73} {"train_loss": -23.0726318359375, "global_step": 8844, "epoch": 73} {"train_loss": -23.244237899780273, "global_step": 8845, "epoch": 73} {"train_loss": -23.337575912475586, "global_step": 8846, "epoch": 73} {"train_loss": -22.76936149597168, "global_step": 8847, "epoch": 73} {"train_loss": -22.93194580078125, "global_step": 8848, "epoch": 73} {"train_loss": -23.117490768432617, "global_step": 8849, "epoch": 73} {"train_loss": -23.058439254760742, "global_step": 8850, "epoch": 73} {"train_loss": -23.244138717651367, "global_step": 8851, "epoch": 73} {"train_loss": -22.628341674804688, "global_step": 8852, "epoch": 73} {"train_loss": -23.1376895904541, "global_step": 8853, "epoch": 73} {"train_loss": -23.119144439697266, "global_step": 8854, "epoch": 73} {"train_loss": -22.88934326171875, "global_step": 8855, "epoch": 73} {"train_loss": -23.436277389526367, "global_step": 8856, "epoch": 73} {"train_loss": -23.2918701171875, "global_step": 8857, "epoch": 73} {"train_loss": -23.064546585083008, "global_step": 8858, "epoch": 73} {"train_loss": -23.568069458007812, "global_step": 8859, "epoch": 73} {"train_loss": -23.255735397338867, "global_step": 8860, "epoch": 73} {"train_loss": -23.17586898803711, "global_step": 8861, "epoch": 73} {"train_loss": -23.34934425354004, "global_step": 8862, "epoch": 73} {"train_loss": -22.89751625061035, "global_step": 8863, "epoch": 73} {"train_loss": -23.46827507019043, "global_step": 8864, "epoch": 73} {"train_loss": -23.09980583190918, "global_step": 8865, "epoch": 73} {"train_loss": -23.561721801757812, "global_step": 8866, "epoch": 73} {"train_loss": -23.45167350769043, "global_step": 8867, "epoch": 73} {"train_loss": -23.684263229370117, "global_step": 8868, "epoch": 73} {"train_loss": -23.495925903320312, "global_step": 8869, "epoch": 73} {"train_loss": -23.5329647064209, "global_step": 8870, "epoch": 73} {"train_loss": -23.55046844482422, "global_step": 8871, "epoch": 73} {"train_loss": -23.755043029785156, "global_step": 8872, "epoch": 73} {"train_loss": -23.353139877319336, "global_step": 8873, "epoch": 73} {"train_loss": -23.745540618896484, "global_step": 8874, "epoch": 73} {"train_loss": -23.630651473999023, "global_step": 8875, "epoch": 73} {"train_loss": -23.35721778869629, "global_step": 8876, "epoch": 73} {"train_loss": -23.658554077148438, "global_step": 8877, "epoch": 73} {"train_loss": -23.912784576416016, "global_step": 8878, "epoch": 73} {"train_loss": -23.793193817138672, "global_step": 8879, "epoch": 73} {"train_loss": -23.709545135498047, "global_step": 8880, "epoch": 73} {"train_loss": -23.572397232055664, "global_step": 8881, "epoch": 73} {"train_loss": -23.34162712097168, "global_step": 8882, "epoch": 73} {"train_loss": -23.679147720336914, "global_step": 8883, "epoch": 73} {"train_loss": -22.77688980102539, "global_step": 8884, "epoch": 73} {"train_loss": -21.290700912475586, "global_step": 8885, "epoch": 73} {"train_loss": -18.02387046813965, "global_step": 8886, "epoch": 73} {"train_loss": -10.967318534851074, "global_step": 8887, "epoch": 73} {"train_loss": -4.2258620262146, "global_step": 8888, "epoch": 73} {"train_loss": -22.13923454284668, "global_step": 8889, "epoch": 73} {"train_loss": -14.58415699005127, "global_step": 8890, "epoch": 73} {"train_loss": -19.00789451599121, "global_step": 8891, "epoch": 73} {"train_loss": -22.549161911010742, "global_step": 8892, "epoch": 73} {"train_loss": -20.440170288085938, "global_step": 8893, "epoch": 73} {"train_loss": -20.116043090820312, "global_step": 8894, "epoch": 73} {"train_loss": -21.0795841217041, "global_step": 8895, "epoch": 73} {"train_loss": -21.97730827331543, "global_step": 8896, "epoch": 73} {"train_loss": -21.84918785095215, "global_step": 8897, "epoch": 73} {"train_loss": -22.67572021484375, "global_step": 8898, "epoch": 73} {"train_loss": -22.360883712768555, "global_step": 8899, "epoch": 73} {"train_loss": -21.743427276611328, "global_step": 8900, "epoch": 73} {"train_loss": -21.408756256103516, "global_step": 8901, "epoch": 73} {"train_loss": -21.504621505737305, "global_step": 8902, "epoch": 73} {"train_loss": -21.801095962524414, "global_step": 8903, "epoch": 73} {"train_loss": -21.59041404724121, "global_step": 8904, "epoch": 73} {"train_loss": -21.945480346679688, "global_step": 8905, "epoch": 73} {"train_loss": -22.281599044799805, "global_step": 8906, "epoch": 73} {"train_loss": -21.727554321289062, "global_step": 8907, "epoch": 73} {"train_loss": -22.065004348754883, "global_step": 8908, "epoch": 73} {"train_loss": -21.911401748657227, "global_step": 8909, "epoch": 73} {"train_loss": -22.144315719604492, "global_step": 8910, "epoch": 73} {"train_loss": -22.066068649291992, "global_step": 8911, "epoch": 73} {"train_loss": -22.569211959838867, "global_step": 8912, "epoch": 73} {"train_loss": -22.232101440429688, "global_step": 8913, "epoch": 73} {"train_loss": -21.915937423706055, "global_step": 8914, "epoch": 73} {"train_loss": -22.127656936645508, "global_step": 8915, "epoch": 73} {"train_loss": -22.347097396850586, "global_step": 8916, "epoch": 73} {"train_loss": -21.97077178955078, "global_step": 8917, "epoch": 73} {"train_loss": -22.146162033081055, "global_step": 8918, "epoch": 73} {"train_loss": -22.901418685913086, "global_step": 8919, "epoch": 73} {"train_loss": -22.523298263549805, "global_step": 8920, "epoch": 73} {"train_loss": -22.030597686767578, "global_step": 8921, "epoch": 73} {"train_loss": -22.747589111328125, "global_step": 8922, "epoch": 73} {"train_loss": -22.109861373901367, "global_step": 8923, "epoch": 73} {"train_loss": -22.31446647644043, "global_step": 8924, "epoch": 73} {"train_loss": -21.070453643798828, "global_step": 8925, "epoch": 73} {"train_loss": -22.252843856811523, "global_step": 8926, "epoch": 73} {"train_loss": -22.339136123657227, "global_step": 8927, "epoch": 73} {"train_loss": -21.739683151245117, "global_step": 8928, "epoch": 73} {"train_loss": -20.705720901489258, "global_step": 8929, "epoch": 73} {"train_loss": -22.64235496520996, "global_step": 8930, "epoch": 73} {"train_loss": -22.489789962768555, "global_step": 8931, "epoch": 73} {"train_loss": -21.487380981445312, "global_step": 8932, "epoch": 73} {"train_loss": -22.415836334228516, "global_step": 8933, "epoch": 73} {"train_loss": -21.818740844726562, "global_step": 8934, "epoch": 73} {"train_loss": -21.954452514648438, "global_step": 8935, "epoch": 73} {"train_loss": -21.894241333007812, "global_step": 8936, "epoch": 73} {"train_loss": -22.12590980529785, "global_step": 8937, "epoch": 73} {"train_loss": -21.565431594848633, "global_step": 8938, "epoch": 73} {"train_loss": -21.833372116088867, "global_step": 8939, "epoch": 73} {"train_loss": -21.566665649414062, "global_step": 8940, "epoch": 73} {"train_loss": -21.709089279174805, "global_step": 8941, "epoch": 73} {"train_loss": -22.07549476623535, "global_step": 8942, "epoch": 73} {"train_loss": -20.90520668029785, "global_step": 8943, "epoch": 73} {"train_loss": -21.494356155395508, "global_step": 8944, "epoch": 73} {"train_loss": -21.59855079650879, "global_step": 8945, "epoch": 73} {"train_loss": -17.261259078979492, "global_step": 8946, "epoch": 73} {"train_loss": -21.904272079467773, "global_step": 8947, "epoch": 73} {"train_loss": -21.774322509765625, "global_step": 8948, "epoch": 73} {"train_loss": -22.085691452026367, "global_step": 8949, "epoch": 73} {"train_loss": -21.894155502319336, "global_step": 8950, "epoch": 73} {"train_loss": -22.19074058532715, "global_step": 8951, "epoch": 73} {"train_loss": -21.720596313476562, "global_step": 8952, "epoch": 73} {"train_loss": -22.057528483966166, "global_step": 8953, "epoch": 73, "val_loss": 3707501.25} {"train_loss": -21.799806594848633, "global_step": 8954, "epoch": 74} {"train_loss": -21.1814022064209, "global_step": 8955, "epoch": 74} {"train_loss": -22.10252571105957, "global_step": 8956, "epoch": 74} {"train_loss": -22.086044311523438, "global_step": 8957, "epoch": 74} {"train_loss": -22.06328773498535, "global_step": 8958, "epoch": 74} {"train_loss": -22.042917251586914, "global_step": 8959, "epoch": 74} {"train_loss": -22.102115631103516, "global_step": 8960, "epoch": 74} {"train_loss": -21.959762573242188, "global_step": 8961, "epoch": 74} {"train_loss": -21.941051483154297, "global_step": 8962, "epoch": 74} {"train_loss": -22.134403228759766, "global_step": 8963, "epoch": 74} {"train_loss": -22.254371643066406, "global_step": 8964, "epoch": 74} {"train_loss": -22.23011589050293, "global_step": 8965, "epoch": 74} {"train_loss": -22.549551010131836, "global_step": 8966, "epoch": 74} {"train_loss": -22.01554298400879, "global_step": 8967, "epoch": 74} {"train_loss": -22.010852813720703, "global_step": 8968, "epoch": 74} {"train_loss": -22.546926498413086, "global_step": 8969, "epoch": 74} {"train_loss": -22.82942008972168, "global_step": 8970, "epoch": 74} {"train_loss": -22.584867477416992, "global_step": 8971, "epoch": 74} {"train_loss": -22.114643096923828, "global_step": 8972, "epoch": 74} {"train_loss": -22.552371978759766, "global_step": 8973, "epoch": 74} {"train_loss": -22.823484420776367, "global_step": 8974, "epoch": 74} {"train_loss": -22.729034423828125, "global_step": 8975, "epoch": 74} {"train_loss": -22.823009490966797, "global_step": 8976, "epoch": 74} {"train_loss": -22.571924209594727, "global_step": 8977, "epoch": 74} {"train_loss": -22.8118839263916, "global_step": 8978, "epoch": 74} {"train_loss": -23.075706481933594, "global_step": 8979, "epoch": 74} {"train_loss": -22.340818405151367, "global_step": 8980, "epoch": 74} {"train_loss": -21.95656394958496, "global_step": 8981, "epoch": 74} {"train_loss": -22.91657829284668, "global_step": 8982, "epoch": 74} {"train_loss": -21.701690673828125, "global_step": 8983, "epoch": 74} {"train_loss": -22.512292861938477, "global_step": 8984, "epoch": 74} {"train_loss": -22.038259506225586, "global_step": 8985, "epoch": 74} {"train_loss": -23.00968360900879, "global_step": 8986, "epoch": 74} {"train_loss": -22.43122673034668, "global_step": 8987, "epoch": 74} {"train_loss": -22.23464012145996, "global_step": 8988, "epoch": 74} {"train_loss": -22.701637268066406, "global_step": 8989, "epoch": 74} {"train_loss": -22.71623420715332, "global_step": 8990, "epoch": 74} {"train_loss": -22.830772399902344, "global_step": 8991, "epoch": 74} {"train_loss": -22.955289840698242, "global_step": 8992, "epoch": 74} {"train_loss": -23.292524337768555, "global_step": 8993, "epoch": 74} {"train_loss": -22.72301483154297, "global_step": 8994, "epoch": 74} {"train_loss": -22.98193359375, "global_step": 8995, "epoch": 74} {"train_loss": -23.00288200378418, "global_step": 8996, "epoch": 74} {"train_loss": -23.13544273376465, "global_step": 8997, "epoch": 74} {"train_loss": -23.13514518737793, "global_step": 8998, "epoch": 74} {"train_loss": -23.61993980407715, "global_step": 8999, "epoch": 74} {"train_loss": -23.294239044189453, "global_step": 9000, "epoch": 74} {"train_loss": -23.807050704956055, "global_step": 9001, "epoch": 74} {"train_loss": -23.44722557067871, "global_step": 9002, "epoch": 74} {"train_loss": -23.423526763916016, "global_step": 9003, "epoch": 74} {"train_loss": -23.440584182739258, "global_step": 9004, "epoch": 74} {"train_loss": -22.794109344482422, "global_step": 9005, "epoch": 74} {"train_loss": -23.721967697143555, "global_step": 9006, "epoch": 74} {"train_loss": -23.443044662475586, "global_step": 9007, "epoch": 74} {"train_loss": -23.68411636352539, "global_step": 9008, "epoch": 74} {"train_loss": -22.274555206298828, "global_step": 9009, "epoch": 74} {"train_loss": -22.29741859436035, "global_step": 9010, "epoch": 74} {"train_loss": -23.162948608398438, "global_step": 9011, "epoch": 74} {"train_loss": -21.98185920715332, "global_step": 9012, "epoch": 74} {"train_loss": -23.078556060791016, "global_step": 9013, "epoch": 74} {"train_loss": -23.09883689880371, "global_step": 9014, "epoch": 74} {"train_loss": -23.241071701049805, "global_step": 9015, "epoch": 74} {"train_loss": -23.34686851501465, "global_step": 9016, "epoch": 74} {"train_loss": -23.589994430541992, "global_step": 9017, "epoch": 74} {"train_loss": -23.372953414916992, "global_step": 9018, "epoch": 74} {"train_loss": -23.319671630859375, "global_step": 9019, "epoch": 74} {"train_loss": -23.760679244995117, "global_step": 9020, "epoch": 74} {"train_loss": -23.295202255249023, "global_step": 9021, "epoch": 74} {"train_loss": -23.315046310424805, "global_step": 9022, "epoch": 74} {"train_loss": -23.257719039916992, "global_step": 9023, "epoch": 74} {"train_loss": -22.380746841430664, "global_step": 9024, "epoch": 74} {"train_loss": -20.954627990722656, "global_step": 9025, "epoch": 74} {"train_loss": -19.444223403930664, "global_step": 9026, "epoch": 74} {"train_loss": -19.134918212890625, "global_step": 9027, "epoch": 74} {"train_loss": -22.762617111206055, "global_step": 9028, "epoch": 74} {"train_loss": -21.855215072631836, "global_step": 9029, "epoch": 74} {"train_loss": -19.766271591186523, "global_step": 9030, "epoch": 74} {"train_loss": -23.19759750366211, "global_step": 9031, "epoch": 74} {"train_loss": -20.12822914123535, "global_step": 9032, "epoch": 74} {"train_loss": -23.17036247253418, "global_step": 9033, "epoch": 74} {"train_loss": -22.08190155029297, "global_step": 9034, "epoch": 74} {"train_loss": -23.126972198486328, "global_step": 9035, "epoch": 74} {"train_loss": -21.337080001831055, "global_step": 9036, "epoch": 74} {"train_loss": -22.158172607421875, "global_step": 9037, "epoch": 74} {"train_loss": -21.790685653686523, "global_step": 9038, "epoch": 74} {"train_loss": -23.16571044921875, "global_step": 9039, "epoch": 74} {"train_loss": -21.761096954345703, "global_step": 9040, "epoch": 74} {"train_loss": -22.670455932617188, "global_step": 9041, "epoch": 74} {"train_loss": -22.742597579956055, "global_step": 9042, "epoch": 74} {"train_loss": -22.74885368347168, "global_step": 9043, "epoch": 74} {"train_loss": -22.999935150146484, "global_step": 9044, "epoch": 74} {"train_loss": -22.320180892944336, "global_step": 9045, "epoch": 74} {"train_loss": -23.20454216003418, "global_step": 9046, "epoch": 74} {"train_loss": -23.187026977539062, "global_step": 9047, "epoch": 74} {"train_loss": -23.193723678588867, "global_step": 9048, "epoch": 74} {"train_loss": -23.571531295776367, "global_step": 9049, "epoch": 74} {"train_loss": -23.415054321289062, "global_step": 9050, "epoch": 74} {"train_loss": -22.806753158569336, "global_step": 9051, "epoch": 74} {"train_loss": -23.23834991455078, "global_step": 9052, "epoch": 74} {"train_loss": -23.54256820678711, "global_step": 9053, "epoch": 74} {"train_loss": -23.06747817993164, "global_step": 9054, "epoch": 74} {"train_loss": -23.61489486694336, "global_step": 9055, "epoch": 74} {"train_loss": -23.406835556030273, "global_step": 9056, "epoch": 74} {"train_loss": -23.613693237304688, "global_step": 9057, "epoch": 74} {"train_loss": -23.346094131469727, "global_step": 9058, "epoch": 74} {"train_loss": -23.67889976501465, "global_step": 9059, "epoch": 74} {"train_loss": -23.689712524414062, "global_step": 9060, "epoch": 74} {"train_loss": -23.971866607666016, "global_step": 9061, "epoch": 74} {"train_loss": -23.8348388671875, "global_step": 9062, "epoch": 74} {"train_loss": -23.57780647277832, "global_step": 9063, "epoch": 74} {"train_loss": -23.38271141052246, "global_step": 9064, "epoch": 74} {"train_loss": -24.004058837890625, "global_step": 9065, "epoch": 74} {"train_loss": -23.33563995361328, "global_step": 9066, "epoch": 74} {"train_loss": -23.947715759277344, "global_step": 9067, "epoch": 74} {"train_loss": -23.901992797851562, "global_step": 9068, "epoch": 74} {"train_loss": -23.603723526000977, "global_step": 9069, "epoch": 74} {"train_loss": -24.002391815185547, "global_step": 9070, "epoch": 74} {"train_loss": -23.870973587036133, "global_step": 9071, "epoch": 74} {"train_loss": -23.828245162963867, "global_step": 9072, "epoch": 74} {"train_loss": -23.558012008666992, "global_step": 9073, "epoch": 74} {"train_loss": -22.782995996396405, "global_step": 9074, "epoch": 74, "val_loss": 3609763.75} {"train_loss": -24.204111099243164, "global_step": 9075, "epoch": 75} {"train_loss": -23.51340675354004, "global_step": 9076, "epoch": 75} {"train_loss": -23.52040672302246, "global_step": 9077, "epoch": 75} {"train_loss": -23.51111602783203, "global_step": 9078, "epoch": 75} {"train_loss": -23.61992835998535, "global_step": 9079, "epoch": 75} {"train_loss": -23.255462646484375, "global_step": 9080, "epoch": 75} {"train_loss": -23.8763484954834, "global_step": 9081, "epoch": 75} {"train_loss": -23.965408325195312, "global_step": 9082, "epoch": 75} {"train_loss": -22.533226013183594, "global_step": 9083, "epoch": 75} {"train_loss": -20.959609985351562, "global_step": 9084, "epoch": 75} {"train_loss": -20.915271759033203, "global_step": 9085, "epoch": 75} {"train_loss": -23.64021110534668, "global_step": 9086, "epoch": 75} {"train_loss": -22.619125366210938, "global_step": 9087, "epoch": 75} {"train_loss": -23.291866302490234, "global_step": 9088, "epoch": 75} {"train_loss": -22.718393325805664, "global_step": 9089, "epoch": 75} {"train_loss": -23.444433212280273, "global_step": 9090, "epoch": 75} {"train_loss": -23.102338790893555, "global_step": 9091, "epoch": 75} {"train_loss": -24.05219078063965, "global_step": 9092, "epoch": 75} {"train_loss": -23.299266815185547, "global_step": 9093, "epoch": 75} {"train_loss": -23.678342819213867, "global_step": 9094, "epoch": 75} {"train_loss": -23.269582748413086, "global_step": 9095, "epoch": 75} {"train_loss": -23.412803649902344, "global_step": 9096, "epoch": 75} {"train_loss": -23.963712692260742, "global_step": 9097, "epoch": 75} {"train_loss": -23.35906982421875, "global_step": 9098, "epoch": 75} {"train_loss": -24.23455238342285, "global_step": 9099, "epoch": 75} {"train_loss": -23.472103118896484, "global_step": 9100, "epoch": 75} {"train_loss": -23.622695922851562, "global_step": 9101, "epoch": 75} {"train_loss": -23.368135452270508, "global_step": 9102, "epoch": 75} {"train_loss": -23.547134399414062, "global_step": 9103, "epoch": 75} {"train_loss": -23.74220085144043, "global_step": 9104, "epoch": 75} {"train_loss": -23.956520080566406, "global_step": 9105, "epoch": 75} {"train_loss": -23.507047653198242, "global_step": 9106, "epoch": 75} {"train_loss": -23.477798461914062, "global_step": 9107, "epoch": 75} {"train_loss": -23.977859497070312, "global_step": 9108, "epoch": 75} {"train_loss": -23.72590446472168, "global_step": 9109, "epoch": 75} {"train_loss": -23.63520622253418, "global_step": 9110, "epoch": 75} {"train_loss": -23.459936141967773, "global_step": 9111, "epoch": 75} {"train_loss": -23.447471618652344, "global_step": 9112, "epoch": 75} {"train_loss": -23.595569610595703, "global_step": 9113, "epoch": 75} {"train_loss": -23.385723114013672, "global_step": 9114, "epoch": 75} {"train_loss": -23.464839935302734, "global_step": 9115, "epoch": 75} {"train_loss": -22.97719383239746, "global_step": 9116, "epoch": 75} {"train_loss": -21.907697677612305, "global_step": 9117, "epoch": 75} {"train_loss": -21.141698837280273, "global_step": 9118, "epoch": 75} {"train_loss": -23.01088523864746, "global_step": 9119, "epoch": 75} {"train_loss": -23.509206771850586, "global_step": 9120, "epoch": 75} {"train_loss": -21.37757682800293, "global_step": 9121, "epoch": 75} {"train_loss": -22.413196563720703, "global_step": 9122, "epoch": 75} {"train_loss": -23.399147033691406, "global_step": 9123, "epoch": 75} {"train_loss": -22.097827911376953, "global_step": 9124, "epoch": 75} {"train_loss": -23.208459854125977, "global_step": 9125, "epoch": 75} {"train_loss": -22.144887924194336, "global_step": 9126, "epoch": 75} {"train_loss": -22.78409767150879, "global_step": 9127, "epoch": 75} {"train_loss": -23.670291900634766, "global_step": 9128, "epoch": 75} {"train_loss": -23.09152603149414, "global_step": 9129, "epoch": 75} {"train_loss": -23.632659912109375, "global_step": 9130, "epoch": 75} {"train_loss": -23.394641876220703, "global_step": 9131, "epoch": 75} {"train_loss": -23.298803329467773, "global_step": 9132, "epoch": 75} {"train_loss": -23.0510311126709, "global_step": 9133, "epoch": 75} {"train_loss": -23.96014976501465, "global_step": 9134, "epoch": 75} {"train_loss": -23.348695755004883, "global_step": 9135, "epoch": 75} {"train_loss": -23.389877319335938, "global_step": 9136, "epoch": 75} {"train_loss": -23.888212203979492, "global_step": 9137, "epoch": 75} {"train_loss": -23.870685577392578, "global_step": 9138, "epoch": 75} {"train_loss": -23.603910446166992, "global_step": 9139, "epoch": 75} {"train_loss": -23.80817222595215, "global_step": 9140, "epoch": 75} {"train_loss": -24.001928329467773, "global_step": 9141, "epoch": 75} {"train_loss": -23.953466415405273, "global_step": 9142, "epoch": 75} {"train_loss": -23.516767501831055, "global_step": 9143, "epoch": 75} {"train_loss": -23.776203155517578, "global_step": 9144, "epoch": 75} {"train_loss": -23.717758178710938, "global_step": 9145, "epoch": 75} {"train_loss": -24.027645111083984, "global_step": 9146, "epoch": 75} {"train_loss": -23.66851806640625, "global_step": 9147, "epoch": 75} {"train_loss": -23.5994873046875, "global_step": 9148, "epoch": 75} {"train_loss": -24.085193634033203, "global_step": 9149, "epoch": 75} {"train_loss": -23.817991256713867, "global_step": 9150, "epoch": 75} {"train_loss": -23.80788230895996, "global_step": 9151, "epoch": 75} {"train_loss": -24.341781616210938, "global_step": 9152, "epoch": 75} {"train_loss": -24.089479446411133, "global_step": 9153, "epoch": 75} {"train_loss": -24.16023063659668, "global_step": 9154, "epoch": 75} {"train_loss": -24.2943058013916, "global_step": 9155, "epoch": 75} {"train_loss": -24.32321548461914, "global_step": 9156, "epoch": 75} {"train_loss": -24.233217239379883, "global_step": 9157, "epoch": 75} {"train_loss": -23.967575073242188, "global_step": 9158, "epoch": 75} {"train_loss": -24.285938262939453, "global_step": 9159, "epoch": 75} {"train_loss": -24.432863235473633, "global_step": 9160, "epoch": 75} {"train_loss": -23.9849853515625, "global_step": 9161, "epoch": 75} {"train_loss": -24.2484188079834, "global_step": 9162, "epoch": 75} {"train_loss": -24.354724884033203, "global_step": 9163, "epoch": 75} {"train_loss": -24.39950942993164, "global_step": 9164, "epoch": 75} {"train_loss": -24.305402755737305, "global_step": 9165, "epoch": 75} {"train_loss": -24.621984481811523, "global_step": 9166, "epoch": 75} {"train_loss": -24.8398494720459, "global_step": 9167, "epoch": 75} {"train_loss": -24.407142639160156, "global_step": 9168, "epoch": 75} {"train_loss": -24.433225631713867, "global_step": 9169, "epoch": 75} {"train_loss": -24.6527099609375, "global_step": 9170, "epoch": 75} {"train_loss": -23.58863067626953, "global_step": 9171, "epoch": 75} {"train_loss": -21.581926345825195, "global_step": 9172, "epoch": 75} {"train_loss": -18.98059844970703, "global_step": 9173, "epoch": 75} {"train_loss": -20.16994285583496, "global_step": 9174, "epoch": 75} {"train_loss": -22.83914566040039, "global_step": 9175, "epoch": 75} {"train_loss": -23.349552154541016, "global_step": 9176, "epoch": 75} {"train_loss": -22.367780685424805, "global_step": 9177, "epoch": 75} {"train_loss": -22.80664825439453, "global_step": 9178, "epoch": 75} {"train_loss": -23.243391036987305, "global_step": 9179, "epoch": 75} {"train_loss": -23.745880126953125, "global_step": 9180, "epoch": 75} {"train_loss": -23.05024528503418, "global_step": 9181, "epoch": 75} {"train_loss": -23.34231948852539, "global_step": 9182, "epoch": 75} {"train_loss": -23.634422302246094, "global_step": 9183, "epoch": 75} {"train_loss": -22.81040382385254, "global_step": 9184, "epoch": 75} {"train_loss": -23.61453628540039, "global_step": 9185, "epoch": 75} {"train_loss": -23.91497039794922, "global_step": 9186, "epoch": 75} {"train_loss": -22.332887649536133, "global_step": 9187, "epoch": 75} {"train_loss": -23.153945922851562, "global_step": 9188, "epoch": 75} {"train_loss": -23.813888549804688, "global_step": 9189, "epoch": 75} {"train_loss": -23.143030166625977, "global_step": 9190, "epoch": 75} {"train_loss": -23.715993881225586, "global_step": 9191, "epoch": 75} {"train_loss": -23.383813858032227, "global_step": 9192, "epoch": 75} {"train_loss": -23.42478370666504, "global_step": 9193, "epoch": 75} {"train_loss": -23.631929397583008, "global_step": 9194, "epoch": 75} {"train_loss": -23.415230412128544, "global_step": 9195, "epoch": 75, "val_loss": 3204844.75} {"train_loss": -23.91010856628418, "global_step": 9196, "epoch": 76} {"train_loss": -23.537832260131836, "global_step": 9197, "epoch": 76} {"train_loss": -23.582645416259766, "global_step": 9198, "epoch": 76} {"train_loss": -23.863431930541992, "global_step": 9199, "epoch": 76} {"train_loss": -23.570663452148438, "global_step": 9200, "epoch": 76} {"train_loss": -23.373483657836914, "global_step": 9201, "epoch": 76} {"train_loss": -22.5804500579834, "global_step": 9202, "epoch": 76} {"train_loss": -22.738676071166992, "global_step": 9203, "epoch": 76} {"train_loss": -22.58774185180664, "global_step": 9204, "epoch": 76} {"train_loss": -23.856138229370117, "global_step": 9205, "epoch": 76} {"train_loss": -23.487112045288086, "global_step": 9206, "epoch": 76} {"train_loss": -22.986921310424805, "global_step": 9207, "epoch": 76} {"train_loss": -23.663419723510742, "global_step": 9208, "epoch": 76} {"train_loss": -23.90208625793457, "global_step": 9209, "epoch": 76} {"train_loss": -23.756855010986328, "global_step": 9210, "epoch": 76} {"train_loss": -23.075706481933594, "global_step": 9211, "epoch": 76} {"train_loss": -23.362260818481445, "global_step": 9212, "epoch": 76} {"train_loss": -23.583890914916992, "global_step": 9213, "epoch": 76} {"train_loss": -23.13649559020996, "global_step": 9214, "epoch": 76} {"train_loss": -23.916662216186523, "global_step": 9215, "epoch": 76} {"train_loss": -23.646635055541992, "global_step": 9216, "epoch": 76} {"train_loss": -23.605060577392578, "global_step": 9217, "epoch": 76} {"train_loss": -23.956892013549805, "global_step": 9218, "epoch": 76} {"train_loss": -24.01447105407715, "global_step": 9219, "epoch": 76} {"train_loss": -23.581069946289062, "global_step": 9220, "epoch": 76} {"train_loss": -24.158296585083008, "global_step": 9221, "epoch": 76} {"train_loss": -23.855539321899414, "global_step": 9222, "epoch": 76} {"train_loss": -24.06195831298828, "global_step": 9223, "epoch": 76} {"train_loss": -24.090225219726562, "global_step": 9224, "epoch": 76} {"train_loss": -23.624860763549805, "global_step": 9225, "epoch": 76} {"train_loss": -23.638914108276367, "global_step": 9226, "epoch": 76} {"train_loss": -23.91971206665039, "global_step": 9227, "epoch": 76} {"train_loss": -24.406858444213867, "global_step": 9228, "epoch": 76} {"train_loss": -23.96803855895996, "global_step": 9229, "epoch": 76} {"train_loss": -23.71327781677246, "global_step": 9230, "epoch": 76} {"train_loss": -23.825645446777344, "global_step": 9231, "epoch": 76} {"train_loss": -24.2407169342041, "global_step": 9232, "epoch": 76} {"train_loss": -23.84693717956543, "global_step": 9233, "epoch": 76} {"train_loss": -24.066930770874023, "global_step": 9234, "epoch": 76} {"train_loss": -24.2455997467041, "global_step": 9235, "epoch": 76} {"train_loss": -24.479734420776367, "global_step": 9236, "epoch": 76} {"train_loss": -23.803943634033203, "global_step": 9237, "epoch": 76} {"train_loss": -24.16070556640625, "global_step": 9238, "epoch": 76} {"train_loss": -24.729774475097656, "global_step": 9239, "epoch": 76} {"train_loss": -24.59254264831543, "global_step": 9240, "epoch": 76} {"train_loss": -24.32423973083496, "global_step": 9241, "epoch": 76} {"train_loss": -23.086109161376953, "global_step": 9242, "epoch": 76} {"train_loss": -23.140714645385742, "global_step": 9243, "epoch": 76} {"train_loss": -22.513277053833008, "global_step": 9244, "epoch": 76} {"train_loss": -22.56614112854004, "global_step": 9245, "epoch": 76} {"train_loss": -23.879724502563477, "global_step": 9246, "epoch": 76} {"train_loss": -23.582448959350586, "global_step": 9247, "epoch": 76} {"train_loss": -22.206811904907227, "global_step": 9248, "epoch": 76} {"train_loss": -24.018720626831055, "global_step": 9249, "epoch": 76} {"train_loss": -23.631643295288086, "global_step": 9250, "epoch": 76} {"train_loss": -24.152708053588867, "global_step": 9251, "epoch": 76} {"train_loss": -24.11147117614746, "global_step": 9252, "epoch": 76} {"train_loss": -23.492359161376953, "global_step": 9253, "epoch": 76} {"train_loss": -23.929790496826172, "global_step": 9254, "epoch": 76} {"train_loss": -23.48714256286621, "global_step": 9255, "epoch": 76} {"train_loss": -23.805524826049805, "global_step": 9256, "epoch": 76} {"train_loss": -22.5887508392334, "global_step": 9257, "epoch": 76} {"train_loss": -22.563583374023438, "global_step": 9258, "epoch": 76} {"train_loss": -23.365345001220703, "global_step": 9259, "epoch": 76} {"train_loss": -23.937360763549805, "global_step": 9260, "epoch": 76} {"train_loss": -23.65047264099121, "global_step": 9261, "epoch": 76} {"train_loss": -23.373899459838867, "global_step": 9262, "epoch": 76} {"train_loss": -24.73016357421875, "global_step": 9263, "epoch": 76} {"train_loss": -24.297033309936523, "global_step": 9264, "epoch": 76} {"train_loss": -24.391407012939453, "global_step": 9265, "epoch": 76} {"train_loss": -24.344472885131836, "global_step": 9266, "epoch": 76} {"train_loss": -24.40371322631836, "global_step": 9267, "epoch": 76} {"train_loss": -24.388662338256836, "global_step": 9268, "epoch": 76} {"train_loss": -24.10431480407715, "global_step": 9269, "epoch": 76} {"train_loss": -23.877782821655273, "global_step": 9270, "epoch": 76} {"train_loss": -23.805957794189453, "global_step": 9271, "epoch": 76} {"train_loss": -23.85188102722168, "global_step": 9272, "epoch": 76} {"train_loss": -22.294452667236328, "global_step": 9273, "epoch": 76} {"train_loss": -22.063404083251953, "global_step": 9274, "epoch": 76} {"train_loss": -22.973949432373047, "global_step": 9275, "epoch": 76} {"train_loss": -24.448810577392578, "global_step": 9276, "epoch": 76} {"train_loss": -23.22397804260254, "global_step": 9277, "epoch": 76} {"train_loss": -21.585651397705078, "global_step": 9278, "epoch": 76} {"train_loss": -20.199344635009766, "global_step": 9279, "epoch": 76} {"train_loss": -22.925031661987305, "global_step": 9280, "epoch": 76} {"train_loss": -22.785343170166016, "global_step": 9281, "epoch": 76} {"train_loss": -20.93387794494629, "global_step": 9282, "epoch": 76} {"train_loss": -23.227128982543945, "global_step": 9283, "epoch": 76} {"train_loss": -22.82935333251953, "global_step": 9284, "epoch": 76} {"train_loss": -22.649768829345703, "global_step": 9285, "epoch": 76} {"train_loss": -23.368087768554688, "global_step": 9286, "epoch": 76} {"train_loss": -22.573923110961914, "global_step": 9287, "epoch": 76} {"train_loss": -22.913537979125977, "global_step": 9288, "epoch": 76} {"train_loss": -22.857467651367188, "global_step": 9289, "epoch": 76} {"train_loss": -22.56574058532715, "global_step": 9290, "epoch": 76} {"train_loss": -23.600229263305664, "global_step": 9291, "epoch": 76} {"train_loss": -23.088083267211914, "global_step": 9292, "epoch": 76} {"train_loss": -23.35541343688965, "global_step": 9293, "epoch": 76} {"train_loss": -23.634252548217773, "global_step": 9294, "epoch": 76} {"train_loss": -23.520280838012695, "global_step": 9295, "epoch": 76} {"train_loss": -23.465774536132812, "global_step": 9296, "epoch": 76} {"train_loss": -23.7021427154541, "global_step": 9297, "epoch": 76} {"train_loss": -22.905845642089844, "global_step": 9298, "epoch": 76} {"train_loss": -23.599624633789062, "global_step": 9299, "epoch": 76} {"train_loss": -23.908720016479492, "global_step": 9300, "epoch": 76} {"train_loss": -24.012845993041992, "global_step": 9301, "epoch": 76} {"train_loss": -23.676916122436523, "global_step": 9302, "epoch": 76} {"train_loss": -23.750152587890625, "global_step": 9303, "epoch": 76} {"train_loss": -24.036224365234375, "global_step": 9304, "epoch": 76} {"train_loss": -23.725690841674805, "global_step": 9305, "epoch": 76} {"train_loss": -23.886709213256836, "global_step": 9306, "epoch": 76} {"train_loss": -23.784080505371094, "global_step": 9307, "epoch": 76} {"train_loss": -24.178770065307617, "global_step": 9308, "epoch": 76} {"train_loss": -24.043651580810547, "global_step": 9309, "epoch": 76} {"train_loss": -23.978187561035156, "global_step": 9310, "epoch": 76} {"train_loss": -23.845979690551758, "global_step": 9311, "epoch": 76} {"train_loss": -23.9443416595459, "global_step": 9312, "epoch": 76} {"train_loss": -24.227575302124023, "global_step": 9313, "epoch": 76} {"train_loss": -24.37590789794922, "global_step": 9314, "epoch": 76} {"train_loss": -24.359067916870117, "global_step": 9315, "epoch": 76} {"train_loss": -23.566056070248944, "global_step": 9316, "epoch": 76, "val_loss": 3336292.75} {"train_loss": -23.614877700805664, "global_step": 9317, "epoch": 77} {"train_loss": -23.30401611328125, "global_step": 9318, "epoch": 77} {"train_loss": -23.971290588378906, "global_step": 9319, "epoch": 77} {"train_loss": -23.8456974029541, "global_step": 9320, "epoch": 77} {"train_loss": -23.158660888671875, "global_step": 9321, "epoch": 77} {"train_loss": -22.272037506103516, "global_step": 9322, "epoch": 77} {"train_loss": -22.152658462524414, "global_step": 9323, "epoch": 77} {"train_loss": -22.819032669067383, "global_step": 9324, "epoch": 77} {"train_loss": -24.075361251831055, "global_step": 9325, "epoch": 77} {"train_loss": -23.35769271850586, "global_step": 9326, "epoch": 77} {"train_loss": -20.974590301513672, "global_step": 9327, "epoch": 77} {"train_loss": -21.79312515258789, "global_step": 9328, "epoch": 77} {"train_loss": -23.41884422302246, "global_step": 9329, "epoch": 77} {"train_loss": -23.240522384643555, "global_step": 9330, "epoch": 77} {"train_loss": -22.862228393554688, "global_step": 9331, "epoch": 77} {"train_loss": -24.68887710571289, "global_step": 9332, "epoch": 77} {"train_loss": -22.918577194213867, "global_step": 9333, "epoch": 77} {"train_loss": -23.111148834228516, "global_step": 9334, "epoch": 77} {"train_loss": -24.247716903686523, "global_step": 9335, "epoch": 77} {"train_loss": -23.540552139282227, "global_step": 9336, "epoch": 77} {"train_loss": -24.267126083374023, "global_step": 9337, "epoch": 77} {"train_loss": -23.35787010192871, "global_step": 9338, "epoch": 77} {"train_loss": -23.90496253967285, "global_step": 9339, "epoch": 77} {"train_loss": -23.080032348632812, "global_step": 9340, "epoch": 77} {"train_loss": -23.98189353942871, "global_step": 9341, "epoch": 77} {"train_loss": -23.574440002441406, "global_step": 9342, "epoch": 77} {"train_loss": -24.292205810546875, "global_step": 9343, "epoch": 77} {"train_loss": -23.610477447509766, "global_step": 9344, "epoch": 77} {"train_loss": -23.8552303314209, "global_step": 9345, "epoch": 77} {"train_loss": -23.982341766357422, "global_step": 9346, "epoch": 77} {"train_loss": -24.089794158935547, "global_step": 9347, "epoch": 77} {"train_loss": -24.08331871032715, "global_step": 9348, "epoch": 77} {"train_loss": -23.46776580810547, "global_step": 9349, "epoch": 77} {"train_loss": -24.267253875732422, "global_step": 9350, "epoch": 77} {"train_loss": -23.334592819213867, "global_step": 9351, "epoch": 77} {"train_loss": -24.147462844848633, "global_step": 9352, "epoch": 77} {"train_loss": -24.233352661132812, "global_step": 9353, "epoch": 77} {"train_loss": -23.897756576538086, "global_step": 9354, "epoch": 77} {"train_loss": -23.298555374145508, "global_step": 9355, "epoch": 77} {"train_loss": -24.186777114868164, "global_step": 9356, "epoch": 77} {"train_loss": -23.92959213256836, "global_step": 9357, "epoch": 77} {"train_loss": -24.435842514038086, "global_step": 9358, "epoch": 77} {"train_loss": -24.74113655090332, "global_step": 9359, "epoch": 77} {"train_loss": -24.041372299194336, "global_step": 9360, "epoch": 77} {"train_loss": -24.39505958557129, "global_step": 9361, "epoch": 77} {"train_loss": -24.27949333190918, "global_step": 9362, "epoch": 77} {"train_loss": -24.354631423950195, "global_step": 9363, "epoch": 77} {"train_loss": -24.385879516601562, "global_step": 9364, "epoch": 77} {"train_loss": -23.727523803710938, "global_step": 9365, "epoch": 77} {"train_loss": -24.576812744140625, "global_step": 9366, "epoch": 77} {"train_loss": -23.589099884033203, "global_step": 9367, "epoch": 77} {"train_loss": -24.123380661010742, "global_step": 9368, "epoch": 77} {"train_loss": -23.8880558013916, "global_step": 9369, "epoch": 77} {"train_loss": -23.82723045349121, "global_step": 9370, "epoch": 77} {"train_loss": -23.7692928314209, "global_step": 9371, "epoch": 77} {"train_loss": -24.114728927612305, "global_step": 9372, "epoch": 77} {"train_loss": -23.48292350769043, "global_step": 9373, "epoch": 77} {"train_loss": -24.380155563354492, "global_step": 9374, "epoch": 77} {"train_loss": -23.27939796447754, "global_step": 9375, "epoch": 77} {"train_loss": -22.37278175354004, "global_step": 9376, "epoch": 77} {"train_loss": -22.285886764526367, "global_step": 9377, "epoch": 77} {"train_loss": -22.52670669555664, "global_step": 9378, "epoch": 77} {"train_loss": -22.87860679626465, "global_step": 9379, "epoch": 77} {"train_loss": -22.954130172729492, "global_step": 9380, "epoch": 77} {"train_loss": -23.4790096282959, "global_step": 9381, "epoch": 77} {"train_loss": -23.37904930114746, "global_step": 9382, "epoch": 77} {"train_loss": -23.35443115234375, "global_step": 9383, "epoch": 77} {"train_loss": -23.913232803344727, "global_step": 9384, "epoch": 77} {"train_loss": -23.41742515563965, "global_step": 9385, "epoch": 77} {"train_loss": -23.012800216674805, "global_step": 9386, "epoch": 77} {"train_loss": -23.953857421875, "global_step": 9387, "epoch": 77} {"train_loss": -23.806554794311523, "global_step": 9388, "epoch": 77} {"train_loss": -23.13018798828125, "global_step": 9389, "epoch": 77} {"train_loss": -23.342138290405273, "global_step": 9390, "epoch": 77} {"train_loss": -24.079437255859375, "global_step": 9391, "epoch": 77} {"train_loss": -22.85471534729004, "global_step": 9392, "epoch": 77} {"train_loss": -23.52037811279297, "global_step": 9393, "epoch": 77} {"train_loss": -24.162622451782227, "global_step": 9394, "epoch": 77} {"train_loss": -22.90333366394043, "global_step": 9395, "epoch": 77} {"train_loss": -24.48847770690918, "global_step": 9396, "epoch": 77} {"train_loss": -23.141437530517578, "global_step": 9397, "epoch": 77} {"train_loss": -23.40896987915039, "global_step": 9398, "epoch": 77} {"train_loss": -23.87605094909668, "global_step": 9399, "epoch": 77} {"train_loss": -23.652753829956055, "global_step": 9400, "epoch": 77} {"train_loss": -24.105764389038086, "global_step": 9401, "epoch": 77} {"train_loss": -24.02327537536621, "global_step": 9402, "epoch": 77} {"train_loss": -24.303302764892578, "global_step": 9403, "epoch": 77} {"train_loss": -24.313404083251953, "global_step": 9404, "epoch": 77} {"train_loss": -24.30258560180664, "global_step": 9405, "epoch": 77} {"train_loss": -24.20661163330078, "global_step": 9406, "epoch": 77} {"train_loss": -24.170578002929688, "global_step": 9407, "epoch": 77} {"train_loss": -24.112943649291992, "global_step": 9408, "epoch": 77} {"train_loss": -24.239459991455078, "global_step": 9409, "epoch": 77} {"train_loss": -24.485254287719727, "global_step": 9410, "epoch": 77} {"train_loss": -24.190595626831055, "global_step": 9411, "epoch": 77} {"train_loss": -24.127370834350586, "global_step": 9412, "epoch": 77} {"train_loss": -24.203157424926758, "global_step": 9413, "epoch": 77} {"train_loss": -24.30940818786621, "global_step": 9414, "epoch": 77} {"train_loss": -24.693899154663086, "global_step": 9415, "epoch": 77} {"train_loss": -24.607637405395508, "global_step": 9416, "epoch": 77} {"train_loss": -24.384366989135742, "global_step": 9417, "epoch": 77} {"train_loss": -24.632442474365234, "global_step": 9418, "epoch": 77} {"train_loss": -24.07187843322754, "global_step": 9419, "epoch": 77} {"train_loss": -24.581100463867188, "global_step": 9420, "epoch": 77} {"train_loss": -23.671253204345703, "global_step": 9421, "epoch": 77} {"train_loss": -23.90107536315918, "global_step": 9422, "epoch": 77} {"train_loss": -23.517223358154297, "global_step": 9423, "epoch": 77} {"train_loss": -24.019926071166992, "global_step": 9424, "epoch": 77} {"train_loss": -22.96906852722168, "global_step": 9425, "epoch": 77} {"train_loss": -23.420316696166992, "global_step": 9426, "epoch": 77} {"train_loss": -23.25771713256836, "global_step": 9427, "epoch": 77} {"train_loss": -23.57025718688965, "global_step": 9428, "epoch": 77} {"train_loss": -23.21559715270996, "global_step": 9429, "epoch": 77} {"train_loss": -22.932113647460938, "global_step": 9430, "epoch": 77} {"train_loss": -19.57081413269043, "global_step": 9431, "epoch": 77} {"train_loss": -13.579916954040527, "global_step": 9432, "epoch": 77} {"train_loss": -9.891572952270508, "global_step": 9433, "epoch": 77} {"train_loss": -17.032825469970703, "global_step": 9434, "epoch": 77} {"train_loss": -16.842857360839844, "global_step": 9435, "epoch": 77} {"train_loss": -13.410928726196289, "global_step": 9436, "epoch": 77} {"train_loss": -23.23769954807502, "global_step": 9437, "epoch": 77, "val_loss": 4431702.0} {"train_loss": -17.302448272705078, "global_step": 9438, "epoch": 78} {"train_loss": -20.3792781829834, "global_step": 9439, "epoch": 78} {"train_loss": -18.500965118408203, "global_step": 9440, "epoch": 78} {"train_loss": -19.584802627563477, "global_step": 9441, "epoch": 78} {"train_loss": -19.9193058013916, "global_step": 9442, "epoch": 78} {"train_loss": -20.64594841003418, "global_step": 9443, "epoch": 78} {"train_loss": -20.36174201965332, "global_step": 9444, "epoch": 78} {"train_loss": -20.25083351135254, "global_step": 9445, "epoch": 78} {"train_loss": -21.26766014099121, "global_step": 9446, "epoch": 78} {"train_loss": -20.50248908996582, "global_step": 9447, "epoch": 78} {"train_loss": -20.829809188842773, "global_step": 9448, "epoch": 78} {"train_loss": -20.906143188476562, "global_step": 9449, "epoch": 78} {"train_loss": -20.54124641418457, "global_step": 9450, "epoch": 78} {"train_loss": -21.450397491455078, "global_step": 9451, "epoch": 78} {"train_loss": -21.52879524230957, "global_step": 9452, "epoch": 78} {"train_loss": -20.866016387939453, "global_step": 9453, "epoch": 78} {"train_loss": -21.719207763671875, "global_step": 9454, "epoch": 78} {"train_loss": -21.553756713867188, "global_step": 9455, "epoch": 78} {"train_loss": -21.828350067138672, "global_step": 9456, "epoch": 78} {"train_loss": -21.219205856323242, "global_step": 9457, "epoch": 78} {"train_loss": -21.683212280273438, "global_step": 9458, "epoch": 78} {"train_loss": -21.121030807495117, "global_step": 9459, "epoch": 78} {"train_loss": -22.061609268188477, "global_step": 9460, "epoch": 78} {"train_loss": -21.732421875, "global_step": 9461, "epoch": 78} {"train_loss": -21.253276824951172, "global_step": 9462, "epoch": 78} {"train_loss": -22.688129425048828, "global_step": 9463, "epoch": 78} {"train_loss": -21.02110481262207, "global_step": 9464, "epoch": 78} {"train_loss": -22.724491119384766, "global_step": 9465, "epoch": 78} {"train_loss": -21.80698585510254, "global_step": 9466, "epoch": 78} {"train_loss": -20.946840286254883, "global_step": 9467, "epoch": 78} {"train_loss": -21.7420654296875, "global_step": 9468, "epoch": 78} {"train_loss": -21.90250015258789, "global_step": 9469, "epoch": 78} {"train_loss": -21.972442626953125, "global_step": 9470, "epoch": 78} {"train_loss": -21.359540939331055, "global_step": 9471, "epoch": 78} {"train_loss": -22.0079402923584, "global_step": 9472, "epoch": 78} {"train_loss": -22.491697311401367, "global_step": 9473, "epoch": 78} {"train_loss": -21.985395431518555, "global_step": 9474, "epoch": 78} {"train_loss": -22.879379272460938, "global_step": 9475, "epoch": 78} {"train_loss": -22.081514358520508, "global_step": 9476, "epoch": 78} {"train_loss": -22.13368034362793, "global_step": 9477, "epoch": 78} {"train_loss": -22.85138511657715, "global_step": 9478, "epoch": 78} {"train_loss": -22.55781364440918, "global_step": 9479, "epoch": 78} {"train_loss": -21.96750259399414, "global_step": 9480, "epoch": 78} {"train_loss": -20.349931716918945, "global_step": 9481, "epoch": 78} {"train_loss": -21.207807540893555, "global_step": 9482, "epoch": 78} {"train_loss": -22.441377639770508, "global_step": 9483, "epoch": 78} {"train_loss": -21.26520347595215, "global_step": 9484, "epoch": 78} {"train_loss": -22.791593551635742, "global_step": 9485, "epoch": 78} {"train_loss": -22.31233024597168, "global_step": 9486, "epoch": 78} {"train_loss": -22.411176681518555, "global_step": 9487, "epoch": 78} {"train_loss": -21.713626861572266, "global_step": 9488, "epoch": 78} {"train_loss": -23.089155197143555, "global_step": 9489, "epoch": 78} {"train_loss": -21.938547134399414, "global_step": 9490, "epoch": 78} {"train_loss": -23.004911422729492, "global_step": 9491, "epoch": 78} {"train_loss": -22.544448852539062, "global_step": 9492, "epoch": 78} {"train_loss": -22.547163009643555, "global_step": 9493, "epoch": 78} {"train_loss": -22.94278335571289, "global_step": 9494, "epoch": 78} {"train_loss": -22.87980079650879, "global_step": 9495, "epoch": 78} {"train_loss": -23.139760971069336, "global_step": 9496, "epoch": 78} {"train_loss": -22.92999839782715, "global_step": 9497, "epoch": 78} {"train_loss": -22.514751434326172, "global_step": 9498, "epoch": 78} {"train_loss": -22.96404266357422, "global_step": 9499, "epoch": 78} {"train_loss": -22.711843490600586, "global_step": 9500, "epoch": 78} {"train_loss": -20.98523712158203, "global_step": 9501, "epoch": 78} {"train_loss": -20.30224609375, "global_step": 9502, "epoch": 78} {"train_loss": -23.12952995300293, "global_step": 9503, "epoch": 78} {"train_loss": -22.00916862487793, "global_step": 9504, "epoch": 78} {"train_loss": -21.555612564086914, "global_step": 9505, "epoch": 78} {"train_loss": -22.66484260559082, "global_step": 9506, "epoch": 78} {"train_loss": -21.939777374267578, "global_step": 9507, "epoch": 78} {"train_loss": -22.511194229125977, "global_step": 9508, "epoch": 78} {"train_loss": -22.374832153320312, "global_step": 9509, "epoch": 78} {"train_loss": -22.58558464050293, "global_step": 9510, "epoch": 78} {"train_loss": -23.35538673400879, "global_step": 9511, "epoch": 78} {"train_loss": -22.43631935119629, "global_step": 9512, "epoch": 78} {"train_loss": -23.200040817260742, "global_step": 9513, "epoch": 78} {"train_loss": -23.044036865234375, "global_step": 9514, "epoch": 78} {"train_loss": -23.024444580078125, "global_step": 9515, "epoch": 78} {"train_loss": -23.21986961364746, "global_step": 9516, "epoch": 78} {"train_loss": -23.467594146728516, "global_step": 9517, "epoch": 78} {"train_loss": -23.353029251098633, "global_step": 9518, "epoch": 78} {"train_loss": -22.395910263061523, "global_step": 9519, "epoch": 78} {"train_loss": -23.22208595275879, "global_step": 9520, "epoch": 78} {"train_loss": -22.88903045654297, "global_step": 9521, "epoch": 78} {"train_loss": -22.977100372314453, "global_step": 9522, "epoch": 78} {"train_loss": -23.042640686035156, "global_step": 9523, "epoch": 78} {"train_loss": -23.14191246032715, "global_step": 9524, "epoch": 78} {"train_loss": -23.144989013671875, "global_step": 9525, "epoch": 78} {"train_loss": -23.420063018798828, "global_step": 9526, "epoch": 78} {"train_loss": -22.835601806640625, "global_step": 9527, "epoch": 78} {"train_loss": -23.339237213134766, "global_step": 9528, "epoch": 78} {"train_loss": -22.56031608581543, "global_step": 9529, "epoch": 78} {"train_loss": -21.788150787353516, "global_step": 9530, "epoch": 78} {"train_loss": -22.018823623657227, "global_step": 9531, "epoch": 78} {"train_loss": -18.611486434936523, "global_step": 9532, "epoch": 78} {"train_loss": -16.4710693359375, "global_step": 9533, "epoch": 78} {"train_loss": -16.98756217956543, "global_step": 9534, "epoch": 78} {"train_loss": -23.04534912109375, "global_step": 9535, "epoch": 78} {"train_loss": -19.565113067626953, "global_step": 9536, "epoch": 78} {"train_loss": -22.763778686523438, "global_step": 9537, "epoch": 78} {"train_loss": -20.75408172607422, "global_step": 9538, "epoch": 78} {"train_loss": -22.119548797607422, "global_step": 9539, "epoch": 78} {"train_loss": -21.852497100830078, "global_step": 9540, "epoch": 78} {"train_loss": -21.394901275634766, "global_step": 9541, "epoch": 78} {"train_loss": -22.044660568237305, "global_step": 9542, "epoch": 78} {"train_loss": -22.500308990478516, "global_step": 9543, "epoch": 78} {"train_loss": -22.305234909057617, "global_step": 9544, "epoch": 78} {"train_loss": -22.217090606689453, "global_step": 9545, "epoch": 78} {"train_loss": -22.551864624023438, "global_step": 9546, "epoch": 78} {"train_loss": -22.626850128173828, "global_step": 9547, "epoch": 78} {"train_loss": -22.6237735748291, "global_step": 9548, "epoch": 78} {"train_loss": -22.777156829833984, "global_step": 9549, "epoch": 78} {"train_loss": -22.632715225219727, "global_step": 9550, "epoch": 78} {"train_loss": -22.3494930267334, "global_step": 9551, "epoch": 78} {"train_loss": -23.0423526763916, "global_step": 9552, "epoch": 78} {"train_loss": -23.04937171936035, "global_step": 9553, "epoch": 78} {"train_loss": -22.98723602294922, "global_step": 9554, "epoch": 78} {"train_loss": -22.627853393554688, "global_step": 9555, "epoch": 78} {"train_loss": -22.86556053161621, "global_step": 9556, "epoch": 78} {"train_loss": -22.8007755279541, "global_step": 9557, "epoch": 78} {"train_loss": -21.93611100882538, "global_step": 9558, "epoch": 78, "val_loss": 3655279.75} {"train_loss": -22.502817153930664, "global_step": 9559, "epoch": 79} {"train_loss": -23.137470245361328, "global_step": 9560, "epoch": 79} {"train_loss": -22.87129783630371, "global_step": 9561, "epoch": 79} {"train_loss": -22.507070541381836, "global_step": 9562, "epoch": 79} {"train_loss": -22.693655014038086, "global_step": 9563, "epoch": 79} {"train_loss": -22.823129653930664, "global_step": 9564, "epoch": 79} {"train_loss": -22.90590476989746, "global_step": 9565, "epoch": 79} {"train_loss": -22.96293067932129, "global_step": 9566, "epoch": 79} {"train_loss": -22.95627212524414, "global_step": 9567, "epoch": 79} {"train_loss": -23.123502731323242, "global_step": 9568, "epoch": 79} {"train_loss": -23.010404586791992, "global_step": 9569, "epoch": 79} {"train_loss": -23.60951805114746, "global_step": 9570, "epoch": 79} {"train_loss": -23.07528305053711, "global_step": 9571, "epoch": 79} {"train_loss": -22.6774959564209, "global_step": 9572, "epoch": 79} {"train_loss": -22.67587661743164, "global_step": 9573, "epoch": 79} {"train_loss": -22.95245361328125, "global_step": 9574, "epoch": 79} {"train_loss": -22.117258071899414, "global_step": 9575, "epoch": 79} {"train_loss": -22.251758575439453, "global_step": 9576, "epoch": 79} {"train_loss": -22.717403411865234, "global_step": 9577, "epoch": 79} {"train_loss": -23.231460571289062, "global_step": 9578, "epoch": 79} {"train_loss": -23.582918167114258, "global_step": 9579, "epoch": 79} {"train_loss": -23.194110870361328, "global_step": 9580, "epoch": 79} {"train_loss": -23.356266021728516, "global_step": 9581, "epoch": 79} {"train_loss": -23.67036247253418, "global_step": 9582, "epoch": 79} {"train_loss": -23.674222946166992, "global_step": 9583, "epoch": 79} {"train_loss": -23.33881187438965, "global_step": 9584, "epoch": 79} {"train_loss": -23.067649841308594, "global_step": 9585, "epoch": 79} {"train_loss": -23.38739585876465, "global_step": 9586, "epoch": 79} {"train_loss": -23.558349609375, "global_step": 9587, "epoch": 79} {"train_loss": -23.443885803222656, "global_step": 9588, "epoch": 79} {"train_loss": -23.90677833557129, "global_step": 9589, "epoch": 79} {"train_loss": -23.806997299194336, "global_step": 9590, "epoch": 79} {"train_loss": -23.882474899291992, "global_step": 9591, "epoch": 79} {"train_loss": -23.857641220092773, "global_step": 9592, "epoch": 79} {"train_loss": -23.546735763549805, "global_step": 9593, "epoch": 79} {"train_loss": -23.611997604370117, "global_step": 9594, "epoch": 79} {"train_loss": -23.666114807128906, "global_step": 9595, "epoch": 79} {"train_loss": -23.016616821289062, "global_step": 9596, "epoch": 79} {"train_loss": -22.956098556518555, "global_step": 9597, "epoch": 79} {"train_loss": -22.729597091674805, "global_step": 9598, "epoch": 79} {"train_loss": -22.633146286010742, "global_step": 9599, "epoch": 79} {"train_loss": -22.883495330810547, "global_step": 9600, "epoch": 79} {"train_loss": -23.12360191345215, "global_step": 9601, "epoch": 79} {"train_loss": -23.390531539916992, "global_step": 9602, "epoch": 79} {"train_loss": -23.909255981445312, "global_step": 9603, "epoch": 79} {"train_loss": -24.077890396118164, "global_step": 9604, "epoch": 79} {"train_loss": -23.84767723083496, "global_step": 9605, "epoch": 79} {"train_loss": -23.649717330932617, "global_step": 9606, "epoch": 79} {"train_loss": -23.65625762939453, "global_step": 9607, "epoch": 79} {"train_loss": -23.684619903564453, "global_step": 9608, "epoch": 79} {"train_loss": -23.632549285888672, "global_step": 9609, "epoch": 79} {"train_loss": -24.301055908203125, "global_step": 9610, "epoch": 79} {"train_loss": -23.69817543029785, "global_step": 9611, "epoch": 79} {"train_loss": -23.894683837890625, "global_step": 9612, "epoch": 79} {"train_loss": -23.421802520751953, "global_step": 9613, "epoch": 79} {"train_loss": -23.70237922668457, "global_step": 9614, "epoch": 79} {"train_loss": -24.036325454711914, "global_step": 9615, "epoch": 79} {"train_loss": -23.821901321411133, "global_step": 9616, "epoch": 79} {"train_loss": -23.69891929626465, "global_step": 9617, "epoch": 79} {"train_loss": -23.3887939453125, "global_step": 9618, "epoch": 79} {"train_loss": -23.449636459350586, "global_step": 9619, "epoch": 79} {"train_loss": -23.912294387817383, "global_step": 9620, "epoch": 79} {"train_loss": -23.531225204467773, "global_step": 9621, "epoch": 79} {"train_loss": -23.365407943725586, "global_step": 9622, "epoch": 79} {"train_loss": -22.2497615814209, "global_step": 9623, "epoch": 79} {"train_loss": -22.301847457885742, "global_step": 9624, "epoch": 79} {"train_loss": -19.949447631835938, "global_step": 9625, "epoch": 79} {"train_loss": -20.70577049255371, "global_step": 9626, "epoch": 79} {"train_loss": -20.78974723815918, "global_step": 9627, "epoch": 79} {"train_loss": -17.65921974182129, "global_step": 9628, "epoch": 79} {"train_loss": -23.055402755737305, "global_step": 9629, "epoch": 79} {"train_loss": -21.412145614624023, "global_step": 9630, "epoch": 79} {"train_loss": -22.30479621887207, "global_step": 9631, "epoch": 79} {"train_loss": -22.02044677734375, "global_step": 9632, "epoch": 79} {"train_loss": -22.45627784729004, "global_step": 9633, "epoch": 79} {"train_loss": -23.256338119506836, "global_step": 9634, "epoch": 79} {"train_loss": -22.438337326049805, "global_step": 9635, "epoch": 79} {"train_loss": -22.48079490661621, "global_step": 9636, "epoch": 79} {"train_loss": -23.189315795898438, "global_step": 9637, "epoch": 79} {"train_loss": -22.95989990234375, "global_step": 9638, "epoch": 79} {"train_loss": -22.832921981811523, "global_step": 9639, "epoch": 79} {"train_loss": -23.317731857299805, "global_step": 9640, "epoch": 79} {"train_loss": -23.62432098388672, "global_step": 9641, "epoch": 79} {"train_loss": -23.170434951782227, "global_step": 9642, "epoch": 79} {"train_loss": -22.870176315307617, "global_step": 9643, "epoch": 79} {"train_loss": -22.917051315307617, "global_step": 9644, "epoch": 79} {"train_loss": -23.108844757080078, "global_step": 9645, "epoch": 79} {"train_loss": -23.02497100830078, "global_step": 9646, "epoch": 79} {"train_loss": -23.069913864135742, "global_step": 9647, "epoch": 79} {"train_loss": -23.228656768798828, "global_step": 9648, "epoch": 79} {"train_loss": -23.318830490112305, "global_step": 9649, "epoch": 79} {"train_loss": -23.081308364868164, "global_step": 9650, "epoch": 79} {"train_loss": -23.438018798828125, "global_step": 9651, "epoch": 79} {"train_loss": -23.2935848236084, "global_step": 9652, "epoch": 79} {"train_loss": -22.85035514831543, "global_step": 9653, "epoch": 79} {"train_loss": -23.25243377685547, "global_step": 9654, "epoch": 79} {"train_loss": -23.727603912353516, "global_step": 9655, "epoch": 79} {"train_loss": -23.40148162841797, "global_step": 9656, "epoch": 79} {"train_loss": -22.578317642211914, "global_step": 9657, "epoch": 79} {"train_loss": -21.764524459838867, "global_step": 9658, "epoch": 79} {"train_loss": -23.024314880371094, "global_step": 9659, "epoch": 79} {"train_loss": -23.211170196533203, "global_step": 9660, "epoch": 79} {"train_loss": -23.699234008789062, "global_step": 9661, "epoch": 79} {"train_loss": -23.588125228881836, "global_step": 9662, "epoch": 79} {"train_loss": -23.76050567626953, "global_step": 9663, "epoch": 79} {"train_loss": -23.60004997253418, "global_step": 9664, "epoch": 79} {"train_loss": -23.113893508911133, "global_step": 9665, "epoch": 79} {"train_loss": -22.489789962768555, "global_step": 9666, "epoch": 79} {"train_loss": -23.308805465698242, "global_step": 9667, "epoch": 79} {"train_loss": -24.093900680541992, "global_step": 9668, "epoch": 79} {"train_loss": -22.71726417541504, "global_step": 9669, "epoch": 79} {"train_loss": -21.979337692260742, "global_step": 9670, "epoch": 79} {"train_loss": -22.03663444519043, "global_step": 9671, "epoch": 79} {"train_loss": -22.6151123046875, "global_step": 9672, "epoch": 79} {"train_loss": -23.45059585571289, "global_step": 9673, "epoch": 79} {"train_loss": -23.280933380126953, "global_step": 9674, "epoch": 79} {"train_loss": -22.023910522460938, "global_step": 9675, "epoch": 79} {"train_loss": -22.044612884521484, "global_step": 9676, "epoch": 79} {"train_loss": -23.88650894165039, "global_step": 9677, "epoch": 79} {"train_loss": -22.451154708862305, "global_step": 9678, "epoch": 79} {"train_loss": -23.02353311964303, "global_step": 9679, "epoch": 79, "val_loss": 2397398.25} {"train_loss": -23.866165161132812, "global_step": 9680, "epoch": 80} {"train_loss": -22.59125518798828, "global_step": 9681, "epoch": 80} {"train_loss": -23.340749740600586, "global_step": 9682, "epoch": 80} {"train_loss": -23.517316818237305, "global_step": 9683, "epoch": 80} {"train_loss": -22.8881893157959, "global_step": 9684, "epoch": 80} {"train_loss": -23.194570541381836, "global_step": 9685, "epoch": 80} {"train_loss": -21.835174560546875, "global_step": 9686, "epoch": 80} {"train_loss": -21.860477447509766, "global_step": 9687, "epoch": 80} {"train_loss": -23.24209976196289, "global_step": 9688, "epoch": 80} {"train_loss": -23.365581512451172, "global_step": 9689, "epoch": 80} {"train_loss": -23.52685546875, "global_step": 9690, "epoch": 80} {"train_loss": -23.60953712463379, "global_step": 9691, "epoch": 80} {"train_loss": -23.452041625976562, "global_step": 9692, "epoch": 80} {"train_loss": -23.116159439086914, "global_step": 9693, "epoch": 80} {"train_loss": -23.867328643798828, "global_step": 9694, "epoch": 80} {"train_loss": -23.838638305664062, "global_step": 9695, "epoch": 80} {"train_loss": -23.965085983276367, "global_step": 9696, "epoch": 80} {"train_loss": -23.538537979125977, "global_step": 9697, "epoch": 80} {"train_loss": -23.821754455566406, "global_step": 9698, "epoch": 80} {"train_loss": -23.88222312927246, "global_step": 9699, "epoch": 80} {"train_loss": -24.117956161499023, "global_step": 9700, "epoch": 80} {"train_loss": -24.017765045166016, "global_step": 9701, "epoch": 80} {"train_loss": -23.615299224853516, "global_step": 9702, "epoch": 80} {"train_loss": -23.7160701751709, "global_step": 9703, "epoch": 80} {"train_loss": -23.90814781188965, "global_step": 9704, "epoch": 80} {"train_loss": -23.718948364257812, "global_step": 9705, "epoch": 80} {"train_loss": -23.78327751159668, "global_step": 9706, "epoch": 80} {"train_loss": -23.80460548400879, "global_step": 9707, "epoch": 80} {"train_loss": -23.937536239624023, "global_step": 9708, "epoch": 80} {"train_loss": -23.806188583374023, "global_step": 9709, "epoch": 80} {"train_loss": -24.160415649414062, "global_step": 9710, "epoch": 80} {"train_loss": -24.240924835205078, "global_step": 9711, "epoch": 80} {"train_loss": -23.9234561920166, "global_step": 9712, "epoch": 80} {"train_loss": -24.1986083984375, "global_step": 9713, "epoch": 80} {"train_loss": -24.03704261779785, "global_step": 9714, "epoch": 80} {"train_loss": -24.547300338745117, "global_step": 9715, "epoch": 80} {"train_loss": -24.388622283935547, "global_step": 9716, "epoch": 80} {"train_loss": -24.597225189208984, "global_step": 9717, "epoch": 80} {"train_loss": -24.358856201171875, "global_step": 9718, "epoch": 80} {"train_loss": -24.520498275756836, "global_step": 9719, "epoch": 80} {"train_loss": -23.93594741821289, "global_step": 9720, "epoch": 80} {"train_loss": -24.138813018798828, "global_step": 9721, "epoch": 80} {"train_loss": -24.574010848999023, "global_step": 9722, "epoch": 80} {"train_loss": -24.199329376220703, "global_step": 9723, "epoch": 80} {"train_loss": -24.215978622436523, "global_step": 9724, "epoch": 80} {"train_loss": -24.066862106323242, "global_step": 9725, "epoch": 80} {"train_loss": -23.917814254760742, "global_step": 9726, "epoch": 80} {"train_loss": -23.053739547729492, "global_step": 9727, "epoch": 80} {"train_loss": -23.372730255126953, "global_step": 9728, "epoch": 80} {"train_loss": -22.729721069335938, "global_step": 9729, "epoch": 80} {"train_loss": -23.465497970581055, "global_step": 9730, "epoch": 80} {"train_loss": -24.247516632080078, "global_step": 9731, "epoch": 80} {"train_loss": -24.219755172729492, "global_step": 9732, "epoch": 80} {"train_loss": -23.671384811401367, "global_step": 9733, "epoch": 80} {"train_loss": -21.949020385742188, "global_step": 9734, "epoch": 80} {"train_loss": -15.929183006286621, "global_step": 9735, "epoch": 80} {"train_loss": -8.083002090454102, "global_step": 9736, "epoch": 80} {"train_loss": -6.274803161621094, "global_step": 9737, "epoch": 80} {"train_loss": -21.50941276550293, "global_step": 9738, "epoch": 80} {"train_loss": -18.592985153198242, "global_step": 9739, "epoch": 80} {"train_loss": -19.28192710876465, "global_step": 9740, "epoch": 80} {"train_loss": -21.942594528198242, "global_step": 9741, "epoch": 80} {"train_loss": -20.874786376953125, "global_step": 9742, "epoch": 80} {"train_loss": -20.60918617248535, "global_step": 9743, "epoch": 80} {"train_loss": -20.803434371948242, "global_step": 9744, "epoch": 80} {"train_loss": -21.81639289855957, "global_step": 9745, "epoch": 80} {"train_loss": -20.91200828552246, "global_step": 9746, "epoch": 80} {"train_loss": -21.300403594970703, "global_step": 9747, "epoch": 80} {"train_loss": -21.59393310546875, "global_step": 9748, "epoch": 80} {"train_loss": -22.022846221923828, "global_step": 9749, "epoch": 80} {"train_loss": -21.464969635009766, "global_step": 9750, "epoch": 80} {"train_loss": -22.219083786010742, "global_step": 9751, "epoch": 80} {"train_loss": -22.008970260620117, "global_step": 9752, "epoch": 80} {"train_loss": -21.81640625, "global_step": 9753, "epoch": 80} {"train_loss": -22.30008888244629, "global_step": 9754, "epoch": 80} {"train_loss": -21.92801856994629, "global_step": 9755, "epoch": 80} {"train_loss": -22.13825035095215, "global_step": 9756, "epoch": 80} {"train_loss": -22.169198989868164, "global_step": 9757, "epoch": 80} {"train_loss": -22.28598403930664, "global_step": 9758, "epoch": 80} {"train_loss": -22.483884811401367, "global_step": 9759, "epoch": 80} {"train_loss": -22.36574363708496, "global_step": 9760, "epoch": 80} {"train_loss": -22.877212524414062, "global_step": 9761, "epoch": 80} {"train_loss": -22.816030502319336, "global_step": 9762, "epoch": 80} {"train_loss": -22.487165451049805, "global_step": 9763, "epoch": 80} {"train_loss": -23.06875991821289, "global_step": 9764, "epoch": 80} {"train_loss": -22.7435302734375, "global_step": 9765, "epoch": 80} {"train_loss": -22.545185089111328, "global_step": 9766, "epoch": 80} {"train_loss": -22.397037506103516, "global_step": 9767, "epoch": 80} {"train_loss": -22.847919464111328, "global_step": 9768, "epoch": 80} {"train_loss": -22.834959030151367, "global_step": 9769, "epoch": 80} {"train_loss": -22.94102668762207, "global_step": 9770, "epoch": 80} {"train_loss": -22.752538681030273, "global_step": 9771, "epoch": 80} {"train_loss": -22.887250900268555, "global_step": 9772, "epoch": 80} {"train_loss": -22.88946533203125, "global_step": 9773, "epoch": 80} {"train_loss": -22.974130630493164, "global_step": 9774, "epoch": 80} {"train_loss": -23.1580753326416, "global_step": 9775, "epoch": 80} {"train_loss": -23.272417068481445, "global_step": 9776, "epoch": 80} {"train_loss": -23.316274642944336, "global_step": 9777, "epoch": 80} {"train_loss": -23.280969619750977, "global_step": 9778, "epoch": 80} {"train_loss": -23.140535354614258, "global_step": 9779, "epoch": 80} {"train_loss": -23.306982040405273, "global_step": 9780, "epoch": 80} {"train_loss": -23.194019317626953, "global_step": 9781, "epoch": 80} {"train_loss": -23.422832489013672, "global_step": 9782, "epoch": 80} {"train_loss": -23.165124893188477, "global_step": 9783, "epoch": 80} {"train_loss": -23.59929847717285, "global_step": 9784, "epoch": 80} {"train_loss": -23.266834259033203, "global_step": 9785, "epoch": 80} {"train_loss": -23.20015525817871, "global_step": 9786, "epoch": 80} {"train_loss": -22.731801986694336, "global_step": 9787, "epoch": 80} {"train_loss": -21.473974227905273, "global_step": 9788, "epoch": 80} {"train_loss": -21.001819610595703, "global_step": 9789, "epoch": 80} {"train_loss": -19.978391647338867, "global_step": 9790, "epoch": 80} {"train_loss": -21.1231746673584, "global_step": 9791, "epoch": 80} {"train_loss": -22.998062133789062, "global_step": 9792, "epoch": 80} {"train_loss": -22.325212478637695, "global_step": 9793, "epoch": 80} {"train_loss": -21.67829704284668, "global_step": 9794, "epoch": 80} {"train_loss": -22.932432174682617, "global_step": 9795, "epoch": 80} {"train_loss": -21.23550033569336, "global_step": 9796, "epoch": 80} {"train_loss": -20.55058479309082, "global_step": 9797, "epoch": 80} {"train_loss": -19.64048957824707, "global_step": 9798, "epoch": 80} {"train_loss": -22.834972381591797, "global_step": 9799, "epoch": 80} {"train_loss": -22.55376955300323, "global_step": 9800, "epoch": 80, "val_loss": 2919704.0} {"train_loss": -22.301929473876953, "global_step": 9801, "epoch": 81} {"train_loss": -22.38690185546875, "global_step": 9802, "epoch": 81} {"train_loss": -22.363309860229492, "global_step": 9803, "epoch": 81} {"train_loss": -22.811765670776367, "global_step": 9804, "epoch": 81} {"train_loss": -22.35584831237793, "global_step": 9805, "epoch": 81} {"train_loss": -23.204957962036133, "global_step": 9806, "epoch": 81} {"train_loss": -22.7830753326416, "global_step": 9807, "epoch": 81} {"train_loss": -22.720205307006836, "global_step": 9808, "epoch": 81} {"train_loss": -23.093181610107422, "global_step": 9809, "epoch": 81} {"train_loss": -22.84615135192871, "global_step": 9810, "epoch": 81} {"train_loss": -22.70218276977539, "global_step": 9811, "epoch": 81} {"train_loss": -23.219730377197266, "global_step": 9812, "epoch": 81} {"train_loss": -22.97857093811035, "global_step": 9813, "epoch": 81} {"train_loss": -22.91163444519043, "global_step": 9814, "epoch": 81} {"train_loss": -23.407108306884766, "global_step": 9815, "epoch": 81} {"train_loss": -22.780149459838867, "global_step": 9816, "epoch": 81} {"train_loss": -23.367448806762695, "global_step": 9817, "epoch": 81} {"train_loss": -22.98934555053711, "global_step": 9818, "epoch": 81} {"train_loss": -23.101224899291992, "global_step": 9819, "epoch": 81} {"train_loss": -23.117918014526367, "global_step": 9820, "epoch": 81} {"train_loss": -23.483633041381836, "global_step": 9821, "epoch": 81} {"train_loss": -23.231916427612305, "global_step": 9822, "epoch": 81} {"train_loss": -23.425825119018555, "global_step": 9823, "epoch": 81} {"train_loss": -23.52750015258789, "global_step": 9824, "epoch": 81} {"train_loss": -23.577075958251953, "global_step": 9825, "epoch": 81} {"train_loss": -23.6514892578125, "global_step": 9826, "epoch": 81} {"train_loss": -23.618762969970703, "global_step": 9827, "epoch": 81} {"train_loss": -23.592365264892578, "global_step": 9828, "epoch": 81} {"train_loss": -24.032522201538086, "global_step": 9829, "epoch": 81} {"train_loss": -23.641033172607422, "global_step": 9830, "epoch": 81} {"train_loss": -23.70386505126953, "global_step": 9831, "epoch": 81} {"train_loss": -23.89848518371582, "global_step": 9832, "epoch": 81} {"train_loss": -23.718135833740234, "global_step": 9833, "epoch": 81} {"train_loss": -23.57884407043457, "global_step": 9834, "epoch": 81} {"train_loss": -23.73952293395996, "global_step": 9835, "epoch": 81} {"train_loss": -23.66452980041504, "global_step": 9836, "epoch": 81} {"train_loss": -23.866924285888672, "global_step": 9837, "epoch": 81} {"train_loss": -23.932418823242188, "global_step": 9838, "epoch": 81} {"train_loss": -23.562515258789062, "global_step": 9839, "epoch": 81} {"train_loss": -22.651844024658203, "global_step": 9840, "epoch": 81} {"train_loss": -19.743730545043945, "global_step": 9841, "epoch": 81} {"train_loss": -12.556731224060059, "global_step": 9842, "epoch": 81} {"train_loss": -5.970221996307373, "global_step": 9843, "epoch": 81} {"train_loss": -15.880560874938965, "global_step": 9844, "epoch": 81} {"train_loss": -21.129901885986328, "global_step": 9845, "epoch": 81} {"train_loss": -20.404489517211914, "global_step": 9846, "epoch": 81} {"train_loss": -20.224245071411133, "global_step": 9847, "epoch": 81} {"train_loss": -22.681577682495117, "global_step": 9848, "epoch": 81} {"train_loss": -21.694387435913086, "global_step": 9849, "epoch": 81} {"train_loss": -21.390174865722656, "global_step": 9850, "epoch": 81} {"train_loss": -22.278532028198242, "global_step": 9851, "epoch": 81} {"train_loss": -22.613784790039062, "global_step": 9852, "epoch": 81} {"train_loss": -22.452749252319336, "global_step": 9853, "epoch": 81} {"train_loss": -22.406112670898438, "global_step": 9854, "epoch": 81} {"train_loss": -22.47723960876465, "global_step": 9855, "epoch": 81} {"train_loss": -22.660810470581055, "global_step": 9856, "epoch": 81} {"train_loss": -22.514753341674805, "global_step": 9857, "epoch": 81} {"train_loss": -23.09142303466797, "global_step": 9858, "epoch": 81} {"train_loss": -22.610658645629883, "global_step": 9859, "epoch": 81} {"train_loss": -22.44957733154297, "global_step": 9860, "epoch": 81} {"train_loss": -22.72125244140625, "global_step": 9861, "epoch": 81} {"train_loss": -22.512771606445312, "global_step": 9862, "epoch": 81} {"train_loss": -23.153806686401367, "global_step": 9863, "epoch": 81} {"train_loss": -22.756772994995117, "global_step": 9864, "epoch": 81} {"train_loss": -23.303613662719727, "global_step": 9865, "epoch": 81} {"train_loss": -22.69730567932129, "global_step": 9866, "epoch": 81} {"train_loss": -23.364723205566406, "global_step": 9867, "epoch": 81} {"train_loss": -23.317655563354492, "global_step": 9868, "epoch": 81} {"train_loss": -23.085983276367188, "global_step": 9869, "epoch": 81} {"train_loss": -22.933727264404297, "global_step": 9870, "epoch": 81} {"train_loss": -22.82071876525879, "global_step": 9871, "epoch": 81} {"train_loss": -23.347232818603516, "global_step": 9872, "epoch": 81} {"train_loss": -23.244220733642578, "global_step": 9873, "epoch": 81} {"train_loss": -23.439350128173828, "global_step": 9874, "epoch": 81} {"train_loss": -23.051788330078125, "global_step": 9875, "epoch": 81} {"train_loss": -22.9165096282959, "global_step": 9876, "epoch": 81} {"train_loss": -22.836668014526367, "global_step": 9877, "epoch": 81} {"train_loss": -23.4719295501709, "global_step": 9878, "epoch": 81} {"train_loss": -23.757741928100586, "global_step": 9879, "epoch": 81} {"train_loss": -22.910337448120117, "global_step": 9880, "epoch": 81} {"train_loss": -23.00339698791504, "global_step": 9881, "epoch": 81} {"train_loss": -22.188207626342773, "global_step": 9882, "epoch": 81} {"train_loss": -20.43275260925293, "global_step": 9883, "epoch": 81} {"train_loss": -20.922454833984375, "global_step": 9884, "epoch": 81} {"train_loss": -23.627628326416016, "global_step": 9885, "epoch": 81} {"train_loss": -22.818212509155273, "global_step": 9886, "epoch": 81} {"train_loss": -23.492521286010742, "global_step": 9887, "epoch": 81} {"train_loss": -23.303342819213867, "global_step": 9888, "epoch": 81} {"train_loss": -23.461307525634766, "global_step": 9889, "epoch": 81} {"train_loss": -23.3166446685791, "global_step": 9890, "epoch": 81} {"train_loss": -22.706989288330078, "global_step": 9891, "epoch": 81} {"train_loss": -22.6841983795166, "global_step": 9892, "epoch": 81} {"train_loss": -22.20271873474121, "global_step": 9893, "epoch": 81} {"train_loss": -22.3749942779541, "global_step": 9894, "epoch": 81} {"train_loss": -23.391122817993164, "global_step": 9895, "epoch": 81} {"train_loss": -23.855506896972656, "global_step": 9896, "epoch": 81} {"train_loss": -22.991744995117188, "global_step": 9897, "epoch": 81} {"train_loss": -22.671735763549805, "global_step": 9898, "epoch": 81} {"train_loss": -23.21121597290039, "global_step": 9899, "epoch": 81} {"train_loss": -23.648420333862305, "global_step": 9900, "epoch": 81} {"train_loss": -23.31932830810547, "global_step": 9901, "epoch": 81} {"train_loss": -23.607419967651367, "global_step": 9902, "epoch": 81} {"train_loss": -23.698728561401367, "global_step": 9903, "epoch": 81} {"train_loss": -23.22853660583496, "global_step": 9904, "epoch": 81} {"train_loss": -23.44864845275879, "global_step": 9905, "epoch": 81} {"train_loss": -23.432510375976562, "global_step": 9906, "epoch": 81} {"train_loss": -24.019001007080078, "global_step": 9907, "epoch": 81} {"train_loss": -23.292055130004883, "global_step": 9908, "epoch": 81} {"train_loss": -23.817365646362305, "global_step": 9909, "epoch": 81} {"train_loss": -23.963300704956055, "global_step": 9910, "epoch": 81} {"train_loss": -23.896963119506836, "global_step": 9911, "epoch": 81} {"train_loss": -23.4694881439209, "global_step": 9912, "epoch": 81} {"train_loss": -23.589574813842773, "global_step": 9913, "epoch": 81} {"train_loss": -23.79286003112793, "global_step": 9914, "epoch": 81} {"train_loss": -23.505029678344727, "global_step": 9915, "epoch": 81} {"train_loss": -23.807952880859375, "global_step": 9916, "epoch": 81} {"train_loss": -23.692819595336914, "global_step": 9917, "epoch": 81} {"train_loss": -24.149187088012695, "global_step": 9918, "epoch": 81} {"train_loss": -24.046653747558594, "global_step": 9919, "epoch": 81} {"train_loss": -24.030303955078125, "global_step": 9920, "epoch": 81} {"train_loss": -22.750305187603658, "global_step": 9921, "epoch": 81, "val_loss": 3406995.25} {"train_loss": -24.39532470703125, "global_step": 9922, "epoch": 82} {"train_loss": -24.346704483032227, "global_step": 9923, "epoch": 82} {"train_loss": -24.50203514099121, "global_step": 9924, "epoch": 82} {"train_loss": -24.029706954956055, "global_step": 9925, "epoch": 82} {"train_loss": -24.02796745300293, "global_step": 9926, "epoch": 82} {"train_loss": -24.034086227416992, "global_step": 9927, "epoch": 82} {"train_loss": -23.82111167907715, "global_step": 9928, "epoch": 82} {"train_loss": -23.6452693939209, "global_step": 9929, "epoch": 82} {"train_loss": -24.14446449279785, "global_step": 9930, "epoch": 82} {"train_loss": -23.9416446685791, "global_step": 9931, "epoch": 82} {"train_loss": -23.694734573364258, "global_step": 9932, "epoch": 82} {"train_loss": -23.287443161010742, "global_step": 9933, "epoch": 82} {"train_loss": -23.73573112487793, "global_step": 9934, "epoch": 82} {"train_loss": -24.174545288085938, "global_step": 9935, "epoch": 82} {"train_loss": -24.10573387145996, "global_step": 9936, "epoch": 82} {"train_loss": -23.601490020751953, "global_step": 9937, "epoch": 82} {"train_loss": -24.09308433532715, "global_step": 9938, "epoch": 82} {"train_loss": -24.551706314086914, "global_step": 9939, "epoch": 82} {"train_loss": -24.201675415039062, "global_step": 9940, "epoch": 82} {"train_loss": -24.248085021972656, "global_step": 9941, "epoch": 82} {"train_loss": -24.262052536010742, "global_step": 9942, "epoch": 82} {"train_loss": -24.300334930419922, "global_step": 9943, "epoch": 82} {"train_loss": -24.684391021728516, "global_step": 9944, "epoch": 82} {"train_loss": -24.1674861907959, "global_step": 9945, "epoch": 82} {"train_loss": -23.59513282775879, "global_step": 9946, "epoch": 82} {"train_loss": -24.32488441467285, "global_step": 9947, "epoch": 82} {"train_loss": -23.40790367126465, "global_step": 9948, "epoch": 82} {"train_loss": -22.203857421875, "global_step": 9949, "epoch": 82} {"train_loss": -23.240985870361328, "global_step": 9950, "epoch": 82} {"train_loss": -23.829187393188477, "global_step": 9951, "epoch": 82} {"train_loss": -22.210159301757812, "global_step": 9952, "epoch": 82} {"train_loss": -23.588903427124023, "global_step": 9953, "epoch": 82} {"train_loss": -23.60794448852539, "global_step": 9954, "epoch": 82} {"train_loss": -23.35335922241211, "global_step": 9955, "epoch": 82} {"train_loss": -23.512907028198242, "global_step": 9956, "epoch": 82} {"train_loss": -22.715774536132812, "global_step": 9957, "epoch": 82} {"train_loss": -23.325397491455078, "global_step": 9958, "epoch": 82} {"train_loss": -22.53761100769043, "global_step": 9959, "epoch": 82} {"train_loss": -23.016069412231445, "global_step": 9960, "epoch": 82} {"train_loss": -22.74574089050293, "global_step": 9961, "epoch": 82} {"train_loss": -23.838972091674805, "global_step": 9962, "epoch": 82} {"train_loss": -22.792280197143555, "global_step": 9963, "epoch": 82} {"train_loss": -23.593069076538086, "global_step": 9964, "epoch": 82} {"train_loss": -22.323759078979492, "global_step": 9965, "epoch": 82} {"train_loss": -23.800649642944336, "global_step": 9966, "epoch": 82} {"train_loss": -22.524980545043945, "global_step": 9967, "epoch": 82} {"train_loss": -21.171249389648438, "global_step": 9968, "epoch": 82} {"train_loss": -23.211315155029297, "global_step": 9969, "epoch": 82} {"train_loss": -22.547454833984375, "global_step": 9970, "epoch": 82} {"train_loss": -21.7352352142334, "global_step": 9971, "epoch": 82} {"train_loss": -23.5561466217041, "global_step": 9972, "epoch": 82} {"train_loss": -22.90180015563965, "global_step": 9973, "epoch": 82} {"train_loss": -23.27400016784668, "global_step": 9974, "epoch": 82} {"train_loss": -23.720684051513672, "global_step": 9975, "epoch": 82} {"train_loss": -23.608922958374023, "global_step": 9976, "epoch": 82} {"train_loss": -23.2074031829834, "global_step": 9977, "epoch": 82} {"train_loss": -23.005075454711914, "global_step": 9978, "epoch": 82} {"train_loss": -23.283777236938477, "global_step": 9979, "epoch": 82} {"train_loss": -23.505285263061523, "global_step": 9980, "epoch": 82} {"train_loss": -23.28095817565918, "global_step": 9981, "epoch": 82} {"train_loss": -23.64393424987793, "global_step": 9982, "epoch": 82} {"train_loss": -23.53427505493164, "global_step": 9983, "epoch": 82} {"train_loss": -23.849531173706055, "global_step": 9984, "epoch": 82} {"train_loss": -24.016992568969727, "global_step": 9985, "epoch": 82} {"train_loss": -23.537229537963867, "global_step": 9986, "epoch": 82} {"train_loss": -24.330615997314453, "global_step": 9987, "epoch": 82} {"train_loss": -23.915142059326172, "global_step": 9988, "epoch": 82} {"train_loss": -24.219470977783203, "global_step": 9989, "epoch": 82} {"train_loss": -23.913053512573242, "global_step": 9990, "epoch": 82} {"train_loss": -23.911741256713867, "global_step": 9991, "epoch": 82} {"train_loss": -24.219396591186523, "global_step": 9992, "epoch": 82} {"train_loss": -23.66616439819336, "global_step": 9993, "epoch": 82} {"train_loss": -24.392532348632812, "global_step": 9994, "epoch": 82} {"train_loss": -23.66075897216797, "global_step": 9995, "epoch": 82} {"train_loss": -23.840078353881836, "global_step": 9996, "epoch": 82} {"train_loss": -23.75269889831543, "global_step": 9997, "epoch": 82} {"train_loss": -23.361555099487305, "global_step": 9998, "epoch": 82} {"train_loss": -23.530370712280273, "global_step": 9999, "epoch": 82} {"train_loss": -23.486587524414062, "global_step": 10000, "epoch": 82} {"train_loss": -23.652782440185547, "global_step": 10001, "epoch": 82} {"train_loss": -23.662887573242188, "global_step": 10002, "epoch": 82} {"train_loss": -23.99468231201172, "global_step": 10003, "epoch": 82} {"train_loss": -24.157400131225586, "global_step": 10004, "epoch": 82} {"train_loss": -24.080121994018555, "global_step": 10005, "epoch": 82} {"train_loss": -24.46843147277832, "global_step": 10006, "epoch": 82} {"train_loss": -24.161466598510742, "global_step": 10007, "epoch": 82} {"train_loss": -24.230478286743164, "global_step": 10008, "epoch": 82} {"train_loss": -24.452573776245117, "global_step": 10009, "epoch": 82} {"train_loss": -24.227209091186523, "global_step": 10010, "epoch": 82} {"train_loss": -24.32767105102539, "global_step": 10011, "epoch": 82} {"train_loss": -24.207265853881836, "global_step": 10012, "epoch": 82} {"train_loss": -24.463970184326172, "global_step": 10013, "epoch": 82} {"train_loss": -24.664094924926758, "global_step": 10014, "epoch": 82} {"train_loss": -24.20159912109375, "global_step": 10015, "epoch": 82} {"train_loss": -24.407365798950195, "global_step": 10016, "epoch": 82} {"train_loss": -24.279449462890625, "global_step": 10017, "epoch": 82} {"train_loss": -24.270689010620117, "global_step": 10018, "epoch": 82} {"train_loss": -24.389921188354492, "global_step": 10019, "epoch": 82} {"train_loss": -24.573755264282227, "global_step": 10020, "epoch": 82} {"train_loss": -24.907197952270508, "global_step": 10021, "epoch": 82} {"train_loss": -24.513721466064453, "global_step": 10022, "epoch": 82} {"train_loss": -24.218900680541992, "global_step": 10023, "epoch": 82} {"train_loss": -24.473316192626953, "global_step": 10024, "epoch": 82} {"train_loss": -24.757923126220703, "global_step": 10025, "epoch": 82} {"train_loss": -24.530685424804688, "global_step": 10026, "epoch": 82} {"train_loss": -24.749147415161133, "global_step": 10027, "epoch": 82} {"train_loss": -24.31646728515625, "global_step": 10028, "epoch": 82} {"train_loss": -24.790395736694336, "global_step": 10029, "epoch": 82} {"train_loss": -24.760665893554688, "global_step": 10030, "epoch": 82} {"train_loss": -24.60220718383789, "global_step": 10031, "epoch": 82} {"train_loss": -24.56595802307129, "global_step": 10032, "epoch": 82} {"train_loss": -24.82709312438965, "global_step": 10033, "epoch": 82} {"train_loss": -24.7914981842041, "global_step": 10034, "epoch": 82} {"train_loss": -24.14192008972168, "global_step": 10035, "epoch": 82} {"train_loss": -24.975238800048828, "global_step": 10036, "epoch": 82} {"train_loss": -24.88177490234375, "global_step": 10037, "epoch": 82} {"train_loss": -24.679141998291016, "global_step": 10038, "epoch": 82} {"train_loss": -25.19219207763672, "global_step": 10039, "epoch": 82} {"train_loss": -24.012907028198242, "global_step": 10040, "epoch": 82} {"train_loss": -23.977399826049805, "global_step": 10041, "epoch": 82} {"train_loss": -23.850267489094378, "global_step": 10042, "epoch": 82, "val_loss": 2867166.25} {"train_loss": -21.232126235961914, "global_step": 10043, "epoch": 83} {"train_loss": -22.64540672302246, "global_step": 10044, "epoch": 83} {"train_loss": -24.37021255493164, "global_step": 10045, "epoch": 83} {"train_loss": -22.989608764648438, "global_step": 10046, "epoch": 83} {"train_loss": -22.8016414642334, "global_step": 10047, "epoch": 83} {"train_loss": -23.83668327331543, "global_step": 10048, "epoch": 83} {"train_loss": -23.64208984375, "global_step": 10049, "epoch": 83} {"train_loss": -23.959997177124023, "global_step": 10050, "epoch": 83} {"train_loss": -22.190338134765625, "global_step": 10051, "epoch": 83} {"train_loss": -23.808942794799805, "global_step": 10052, "epoch": 83} {"train_loss": -23.569021224975586, "global_step": 10053, "epoch": 83} {"train_loss": -24.32645034790039, "global_step": 10054, "epoch": 83} {"train_loss": -23.915090560913086, "global_step": 10055, "epoch": 83} {"train_loss": -23.605205535888672, "global_step": 10056, "epoch": 83} {"train_loss": -23.969152450561523, "global_step": 10057, "epoch": 83} {"train_loss": -23.598012924194336, "global_step": 10058, "epoch": 83} {"train_loss": -23.921085357666016, "global_step": 10059, "epoch": 83} {"train_loss": -23.89231300354004, "global_step": 10060, "epoch": 83} {"train_loss": -23.557809829711914, "global_step": 10061, "epoch": 83} {"train_loss": -23.192304611206055, "global_step": 10062, "epoch": 83} {"train_loss": -23.678800582885742, "global_step": 10063, "epoch": 83} {"train_loss": -23.610605239868164, "global_step": 10064, "epoch": 83} {"train_loss": -23.37587547302246, "global_step": 10065, "epoch": 83} {"train_loss": -24.131505966186523, "global_step": 10066, "epoch": 83} {"train_loss": -23.872766494750977, "global_step": 10067, "epoch": 83} {"train_loss": -23.980976104736328, "global_step": 10068, "epoch": 83} {"train_loss": -24.180057525634766, "global_step": 10069, "epoch": 83} {"train_loss": -24.414905548095703, "global_step": 10070, "epoch": 83} {"train_loss": -24.190719604492188, "global_step": 10071, "epoch": 83} {"train_loss": -24.21222496032715, "global_step": 10072, "epoch": 83} {"train_loss": -24.233579635620117, "global_step": 10073, "epoch": 83} {"train_loss": -23.788297653198242, "global_step": 10074, "epoch": 83} {"train_loss": -24.406173706054688, "global_step": 10075, "epoch": 83} {"train_loss": -24.235435485839844, "global_step": 10076, "epoch": 83} {"train_loss": -24.53009605407715, "global_step": 10077, "epoch": 83} {"train_loss": -24.3892822265625, "global_step": 10078, "epoch": 83} {"train_loss": -24.758010864257812, "global_step": 10079, "epoch": 83} {"train_loss": -24.550809860229492, "global_step": 10080, "epoch": 83} {"train_loss": -24.484338760375977, "global_step": 10081, "epoch": 83} {"train_loss": -24.49728775024414, "global_step": 10082, "epoch": 83} {"train_loss": -24.501148223876953, "global_step": 10083, "epoch": 83} {"train_loss": -24.332326889038086, "global_step": 10084, "epoch": 83} {"train_loss": -24.412818908691406, "global_step": 10085, "epoch": 83} {"train_loss": -24.698545455932617, "global_step": 10086, "epoch": 83} {"train_loss": -24.474010467529297, "global_step": 10087, "epoch": 83} {"train_loss": -24.496252059936523, "global_step": 10088, "epoch": 83} {"train_loss": -25.03272819519043, "global_step": 10089, "epoch": 83} {"train_loss": -24.68720054626465, "global_step": 10090, "epoch": 83} {"train_loss": -25.114328384399414, "global_step": 10091, "epoch": 83} {"train_loss": -24.59897804260254, "global_step": 10092, "epoch": 83} {"train_loss": -24.484296798706055, "global_step": 10093, "epoch": 83} {"train_loss": -24.759445190429688, "global_step": 10094, "epoch": 83} {"train_loss": -25.05525779724121, "global_step": 10095, "epoch": 83} {"train_loss": -24.713754653930664, "global_step": 10096, "epoch": 83} {"train_loss": -24.35211753845215, "global_step": 10097, "epoch": 83} {"train_loss": -24.033903121948242, "global_step": 10098, "epoch": 83} {"train_loss": -24.62078094482422, "global_step": 10099, "epoch": 83} {"train_loss": -24.407987594604492, "global_step": 10100, "epoch": 83} {"train_loss": -23.823514938354492, "global_step": 10101, "epoch": 83} {"train_loss": -24.22860336303711, "global_step": 10102, "epoch": 83} {"train_loss": -25.181982040405273, "global_step": 10103, "epoch": 83} {"train_loss": -24.014429092407227, "global_step": 10104, "epoch": 83} {"train_loss": -23.77573585510254, "global_step": 10105, "epoch": 83} {"train_loss": -23.766077041625977, "global_step": 10106, "epoch": 83} {"train_loss": -21.69490623474121, "global_step": 10107, "epoch": 83} {"train_loss": -22.192384719848633, "global_step": 10108, "epoch": 83} {"train_loss": -21.12613868713379, "global_step": 10109, "epoch": 83} {"train_loss": -21.28401756286621, "global_step": 10110, "epoch": 83} {"train_loss": -23.36871337890625, "global_step": 10111, "epoch": 83} {"train_loss": -24.100557327270508, "global_step": 10112, "epoch": 83} {"train_loss": -21.746456146240234, "global_step": 10113, "epoch": 83} {"train_loss": -22.30548667907715, "global_step": 10114, "epoch": 83} {"train_loss": -24.290958404541016, "global_step": 10115, "epoch": 83} {"train_loss": -22.037927627563477, "global_step": 10116, "epoch": 83} {"train_loss": -23.9126033782959, "global_step": 10117, "epoch": 83} {"train_loss": -23.47388458251953, "global_step": 10118, "epoch": 83} {"train_loss": -23.975248336791992, "global_step": 10119, "epoch": 83} {"train_loss": -24.03049087524414, "global_step": 10120, "epoch": 83} {"train_loss": -23.855575561523438, "global_step": 10121, "epoch": 83} {"train_loss": -23.97383689880371, "global_step": 10122, "epoch": 83} {"train_loss": -24.145376205444336, "global_step": 10123, "epoch": 83} {"train_loss": -22.286163330078125, "global_step": 10124, "epoch": 83} {"train_loss": -22.266965866088867, "global_step": 10125, "epoch": 83} {"train_loss": -23.3234920501709, "global_step": 10126, "epoch": 83} {"train_loss": -21.298620223999023, "global_step": 10127, "epoch": 83} {"train_loss": -23.588958740234375, "global_step": 10128, "epoch": 83} {"train_loss": -23.05976676940918, "global_step": 10129, "epoch": 83} {"train_loss": -22.208324432373047, "global_step": 10130, "epoch": 83} {"train_loss": -23.978139877319336, "global_step": 10131, "epoch": 83} {"train_loss": -23.71415138244629, "global_step": 10132, "epoch": 83} {"train_loss": -23.419498443603516, "global_step": 10133, "epoch": 83} {"train_loss": -23.582231521606445, "global_step": 10134, "epoch": 83} {"train_loss": -23.1621150970459, "global_step": 10135, "epoch": 83} {"train_loss": -24.04376220703125, "global_step": 10136, "epoch": 83} {"train_loss": -23.648399353027344, "global_step": 10137, "epoch": 83} {"train_loss": -24.152027130126953, "global_step": 10138, "epoch": 83} {"train_loss": -23.88031005859375, "global_step": 10139, "epoch": 83} {"train_loss": -23.441328048706055, "global_step": 10140, "epoch": 83} {"train_loss": -23.997116088867188, "global_step": 10141, "epoch": 83} {"train_loss": -23.967884063720703, "global_step": 10142, "epoch": 83} {"train_loss": -24.11421012878418, "global_step": 10143, "epoch": 83} {"train_loss": -24.114093780517578, "global_step": 10144, "epoch": 83} {"train_loss": -24.462085723876953, "global_step": 10145, "epoch": 83} {"train_loss": -24.130338668823242, "global_step": 10146, "epoch": 83} {"train_loss": -24.482419967651367, "global_step": 10147, "epoch": 83} {"train_loss": -24.361785888671875, "global_step": 10148, "epoch": 83} {"train_loss": -24.297225952148438, "global_step": 10149, "epoch": 83} {"train_loss": -24.512115478515625, "global_step": 10150, "epoch": 83} {"train_loss": -23.977092742919922, "global_step": 10151, "epoch": 83} {"train_loss": -23.951047897338867, "global_step": 10152, "epoch": 83} {"train_loss": -24.056411743164062, "global_step": 10153, "epoch": 83} {"train_loss": -23.919851303100586, "global_step": 10154, "epoch": 83} {"train_loss": -24.388439178466797, "global_step": 10155, "epoch": 83} {"train_loss": -24.440460205078125, "global_step": 10156, "epoch": 83} {"train_loss": -24.64118003845215, "global_step": 10157, "epoch": 83} {"train_loss": -24.252187728881836, "global_step": 10158, "epoch": 83} {"train_loss": -23.736255645751953, "global_step": 10159, "epoch": 83} {"train_loss": -22.6330509185791, "global_step": 10160, "epoch": 83} {"train_loss": -17.541667938232422, "global_step": 10161, "epoch": 83} {"train_loss": -9.107231140136719, "global_step": 10162, "epoch": 83} {"train_loss": -23.526435268811944, "global_step": 10163, "epoch": 83, "val_loss": 2858676.75} {"train_loss": -24.232126235961914, "global_step": 10164, "epoch": 84} {"train_loss": -18.301410675048828, "global_step": 10165, "epoch": 84} {"train_loss": -21.294652938842773, "global_step": 10166, "epoch": 84} {"train_loss": -23.02753448486328, "global_step": 10167, "epoch": 84} {"train_loss": -20.28947639465332, "global_step": 10168, "epoch": 84} {"train_loss": -21.401565551757812, "global_step": 10169, "epoch": 84} {"train_loss": -22.055456161499023, "global_step": 10170, "epoch": 84} {"train_loss": -23.39636993408203, "global_step": 10171, "epoch": 84} {"train_loss": -22.675884246826172, "global_step": 10172, "epoch": 84} {"train_loss": -22.54169464111328, "global_step": 10173, "epoch": 84} {"train_loss": -22.402963638305664, "global_step": 10174, "epoch": 84} {"train_loss": -22.21040916442871, "global_step": 10175, "epoch": 84} {"train_loss": -22.55010223388672, "global_step": 10176, "epoch": 84} {"train_loss": -22.720104217529297, "global_step": 10177, "epoch": 84} {"train_loss": -23.056732177734375, "global_step": 10178, "epoch": 84} {"train_loss": -23.206132888793945, "global_step": 10179, "epoch": 84} {"train_loss": -22.986331939697266, "global_step": 10180, "epoch": 84} {"train_loss": -23.405221939086914, "global_step": 10181, "epoch": 84} {"train_loss": -23.231014251708984, "global_step": 10182, "epoch": 84} {"train_loss": -23.031476974487305, "global_step": 10183, "epoch": 84} {"train_loss": -23.03371238708496, "global_step": 10184, "epoch": 84} {"train_loss": -23.06792640686035, "global_step": 10185, "epoch": 84} {"train_loss": -23.108013153076172, "global_step": 10186, "epoch": 84} {"train_loss": -22.809385299682617, "global_step": 10187, "epoch": 84} {"train_loss": -23.110952377319336, "global_step": 10188, "epoch": 84} {"train_loss": -22.99976921081543, "global_step": 10189, "epoch": 84} {"train_loss": -23.453954696655273, "global_step": 10190, "epoch": 84} {"train_loss": -23.819581985473633, "global_step": 10191, "epoch": 84} {"train_loss": -23.476713180541992, "global_step": 10192, "epoch": 84} {"train_loss": -23.546499252319336, "global_step": 10193, "epoch": 84} {"train_loss": -23.191307067871094, "global_step": 10194, "epoch": 84} {"train_loss": -23.68157386779785, "global_step": 10195, "epoch": 84} {"train_loss": -23.904586791992188, "global_step": 10196, "epoch": 84} {"train_loss": -23.62253761291504, "global_step": 10197, "epoch": 84} {"train_loss": -23.87174415588379, "global_step": 10198, "epoch": 84} {"train_loss": -23.736732482910156, "global_step": 10199, "epoch": 84} {"train_loss": -23.50398063659668, "global_step": 10200, "epoch": 84} {"train_loss": -23.56031608581543, "global_step": 10201, "epoch": 84} {"train_loss": -23.074186325073242, "global_step": 10202, "epoch": 84} {"train_loss": -23.32466697692871, "global_step": 10203, "epoch": 84} {"train_loss": -23.37379264831543, "global_step": 10204, "epoch": 84} {"train_loss": -23.64796257019043, "global_step": 10205, "epoch": 84} {"train_loss": -22.44180679321289, "global_step": 10206, "epoch": 84} {"train_loss": -23.258493423461914, "global_step": 10207, "epoch": 84} {"train_loss": -23.505023956298828, "global_step": 10208, "epoch": 84} {"train_loss": -22.352460861206055, "global_step": 10209, "epoch": 84} {"train_loss": -23.558073043823242, "global_step": 10210, "epoch": 84} {"train_loss": -23.48427963256836, "global_step": 10211, "epoch": 84} {"train_loss": -22.897321701049805, "global_step": 10212, "epoch": 84} {"train_loss": -23.677961349487305, "global_step": 10213, "epoch": 84} {"train_loss": -23.53363800048828, "global_step": 10214, "epoch": 84} {"train_loss": -23.591650009155273, "global_step": 10215, "epoch": 84} {"train_loss": -23.238983154296875, "global_step": 10216, "epoch": 84} {"train_loss": -23.484359741210938, "global_step": 10217, "epoch": 84} {"train_loss": -23.822824478149414, "global_step": 10218, "epoch": 84} {"train_loss": -24.018531799316406, "global_step": 10219, "epoch": 84} {"train_loss": -23.72015380859375, "global_step": 10220, "epoch": 84} {"train_loss": -23.578704833984375, "global_step": 10221, "epoch": 84} {"train_loss": -22.772205352783203, "global_step": 10222, "epoch": 84} {"train_loss": -22.643095016479492, "global_step": 10223, "epoch": 84} {"train_loss": -22.653722763061523, "global_step": 10224, "epoch": 84} {"train_loss": -22.141998291015625, "global_step": 10225, "epoch": 84} {"train_loss": -21.840665817260742, "global_step": 10226, "epoch": 84} {"train_loss": -22.816020965576172, "global_step": 10227, "epoch": 84} {"train_loss": -24.024478912353516, "global_step": 10228, "epoch": 84} {"train_loss": -23.132627487182617, "global_step": 10229, "epoch": 84} {"train_loss": -22.53384017944336, "global_step": 10230, "epoch": 84} {"train_loss": -23.2581729888916, "global_step": 10231, "epoch": 84} {"train_loss": -23.194978713989258, "global_step": 10232, "epoch": 84} {"train_loss": -23.067127227783203, "global_step": 10233, "epoch": 84} {"train_loss": -23.149343490600586, "global_step": 10234, "epoch": 84} {"train_loss": -23.604055404663086, "global_step": 10235, "epoch": 84} {"train_loss": -23.49564552307129, "global_step": 10236, "epoch": 84} {"train_loss": -23.606050491333008, "global_step": 10237, "epoch": 84} {"train_loss": -24.25406265258789, "global_step": 10238, "epoch": 84} {"train_loss": -23.85898780822754, "global_step": 10239, "epoch": 84} {"train_loss": -24.117908477783203, "global_step": 10240, "epoch": 84} {"train_loss": -23.96483612060547, "global_step": 10241, "epoch": 84} {"train_loss": -23.797657012939453, "global_step": 10242, "epoch": 84} {"train_loss": -23.026220321655273, "global_step": 10243, "epoch": 84} {"train_loss": -23.63777732849121, "global_step": 10244, "epoch": 84} {"train_loss": -23.532108306884766, "global_step": 10245, "epoch": 84} {"train_loss": -23.154949188232422, "global_step": 10246, "epoch": 84} {"train_loss": -23.689682006835938, "global_step": 10247, "epoch": 84} {"train_loss": -23.10757064819336, "global_step": 10248, "epoch": 84} {"train_loss": -23.87997817993164, "global_step": 10249, "epoch": 84} {"train_loss": -24.077863693237305, "global_step": 10250, "epoch": 84} {"train_loss": -23.293170928955078, "global_step": 10251, "epoch": 84} {"train_loss": -23.868633270263672, "global_step": 10252, "epoch": 84} {"train_loss": -23.53212547302246, "global_step": 10253, "epoch": 84} {"train_loss": -23.768945693969727, "global_step": 10254, "epoch": 84} {"train_loss": -23.907197952270508, "global_step": 10255, "epoch": 84} {"train_loss": -23.322961807250977, "global_step": 10256, "epoch": 84} {"train_loss": -23.709945678710938, "global_step": 10257, "epoch": 84} {"train_loss": -23.624608993530273, "global_step": 10258, "epoch": 84} {"train_loss": -23.935766220092773, "global_step": 10259, "epoch": 84} {"train_loss": -23.63678550720215, "global_step": 10260, "epoch": 84} {"train_loss": -24.353961944580078, "global_step": 10261, "epoch": 84} {"train_loss": -23.791379928588867, "global_step": 10262, "epoch": 84} {"train_loss": -23.664859771728516, "global_step": 10263, "epoch": 84} {"train_loss": -24.217243194580078, "global_step": 10264, "epoch": 84} {"train_loss": -23.898452758789062, "global_step": 10265, "epoch": 84} {"train_loss": -24.036775588989258, "global_step": 10266, "epoch": 84} {"train_loss": -23.6653995513916, "global_step": 10267, "epoch": 84} {"train_loss": -23.81960678100586, "global_step": 10268, "epoch": 84} {"train_loss": -23.976299285888672, "global_step": 10269, "epoch": 84} {"train_loss": -23.86142921447754, "global_step": 10270, "epoch": 84} {"train_loss": -24.379940032958984, "global_step": 10271, "epoch": 84} {"train_loss": -23.678983688354492, "global_step": 10272, "epoch": 84} {"train_loss": -24.35099983215332, "global_step": 10273, "epoch": 84} {"train_loss": -24.045001983642578, "global_step": 10274, "epoch": 84} {"train_loss": -24.16470718383789, "global_step": 10275, "epoch": 84} {"train_loss": -24.110626220703125, "global_step": 10276, "epoch": 84} {"train_loss": -24.014888763427734, "global_step": 10277, "epoch": 84} {"train_loss": -24.499717712402344, "global_step": 10278, "epoch": 84} {"train_loss": -24.37803077697754, "global_step": 10279, "epoch": 84} {"train_loss": -23.66141128540039, "global_step": 10280, "epoch": 84} {"train_loss": -20.692373275756836, "global_step": 10281, "epoch": 84} {"train_loss": -22.44327735900879, "global_step": 10282, "epoch": 84} {"train_loss": -23.94260597229004, "global_step": 10283, "epoch": 84} {"train_loss": -23.313384726027813, "global_step": 10284, "epoch": 84, "val_loss": 2965282.25} {"train_loss": -24.242277145385742, "global_step": 10285, "epoch": 85} {"train_loss": -23.990808486938477, "global_step": 10286, "epoch": 85} {"train_loss": -23.338037490844727, "global_step": 10287, "epoch": 85} {"train_loss": -24.118345260620117, "global_step": 10288, "epoch": 85} {"train_loss": -23.881763458251953, "global_step": 10289, "epoch": 85} {"train_loss": -24.550443649291992, "global_step": 10290, "epoch": 85} {"train_loss": -23.9892578125, "global_step": 10291, "epoch": 85} {"train_loss": -24.262767791748047, "global_step": 10292, "epoch": 85} {"train_loss": -23.97260856628418, "global_step": 10293, "epoch": 85} {"train_loss": -24.419153213500977, "global_step": 10294, "epoch": 85} {"train_loss": -23.695819854736328, "global_step": 10295, "epoch": 85} {"train_loss": -24.54830551147461, "global_step": 10296, "epoch": 85} {"train_loss": -24.241003036499023, "global_step": 10297, "epoch": 85} {"train_loss": -24.471420288085938, "global_step": 10298, "epoch": 85} {"train_loss": -24.6358585357666, "global_step": 10299, "epoch": 85} {"train_loss": -24.38555335998535, "global_step": 10300, "epoch": 85} {"train_loss": -24.391082763671875, "global_step": 10301, "epoch": 85} {"train_loss": -24.094593048095703, "global_step": 10302, "epoch": 85} {"train_loss": -24.010622024536133, "global_step": 10303, "epoch": 85} {"train_loss": -24.293020248413086, "global_step": 10304, "epoch": 85} {"train_loss": -24.594038009643555, "global_step": 10305, "epoch": 85} {"train_loss": -23.5861873626709, "global_step": 10306, "epoch": 85} {"train_loss": -24.266813278198242, "global_step": 10307, "epoch": 85} {"train_loss": -24.806190490722656, "global_step": 10308, "epoch": 85} {"train_loss": -24.324037551879883, "global_step": 10309, "epoch": 85} {"train_loss": -24.7067928314209, "global_step": 10310, "epoch": 85} {"train_loss": -24.6284236907959, "global_step": 10311, "epoch": 85} {"train_loss": -24.69160270690918, "global_step": 10312, "epoch": 85} {"train_loss": -24.971195220947266, "global_step": 10313, "epoch": 85} {"train_loss": -24.58144187927246, "global_step": 10314, "epoch": 85} {"train_loss": -24.7613468170166, "global_step": 10315, "epoch": 85} {"train_loss": -24.21011734008789, "global_step": 10316, "epoch": 85} {"train_loss": -24.34248924255371, "global_step": 10317, "epoch": 85} {"train_loss": -24.752334594726562, "global_step": 10318, "epoch": 85} {"train_loss": -24.499454498291016, "global_step": 10319, "epoch": 85} {"train_loss": -24.163427352905273, "global_step": 10320, "epoch": 85} {"train_loss": -24.134395599365234, "global_step": 10321, "epoch": 85} {"train_loss": -24.22056770324707, "global_step": 10322, "epoch": 85} {"train_loss": -24.876737594604492, "global_step": 10323, "epoch": 85} {"train_loss": -24.62360954284668, "global_step": 10324, "epoch": 85} {"train_loss": -24.115598678588867, "global_step": 10325, "epoch": 85} {"train_loss": -23.52374267578125, "global_step": 10326, "epoch": 85} {"train_loss": -24.25079917907715, "global_step": 10327, "epoch": 85} {"train_loss": -24.8122501373291, "global_step": 10328, "epoch": 85} {"train_loss": -24.141353607177734, "global_step": 10329, "epoch": 85} {"train_loss": -24.69000244140625, "global_step": 10330, "epoch": 85} {"train_loss": -24.380155563354492, "global_step": 10331, "epoch": 85} {"train_loss": -24.612037658691406, "global_step": 10332, "epoch": 85} {"train_loss": -24.398130416870117, "global_step": 10333, "epoch": 85} {"train_loss": -23.970890045166016, "global_step": 10334, "epoch": 85} {"train_loss": -24.3309383392334, "global_step": 10335, "epoch": 85} {"train_loss": -24.495195388793945, "global_step": 10336, "epoch": 85} {"train_loss": -24.134418487548828, "global_step": 10337, "epoch": 85} {"train_loss": -24.982084274291992, "global_step": 10338, "epoch": 85} {"train_loss": -24.25972557067871, "global_step": 10339, "epoch": 85} {"train_loss": -24.334442138671875, "global_step": 10340, "epoch": 85} {"train_loss": -24.021902084350586, "global_step": 10341, "epoch": 85} {"train_loss": -23.2331600189209, "global_step": 10342, "epoch": 85} {"train_loss": -24.316274642944336, "global_step": 10343, "epoch": 85} {"train_loss": -25.189334869384766, "global_step": 10344, "epoch": 85} {"train_loss": -24.39069938659668, "global_step": 10345, "epoch": 85} {"train_loss": -23.910730361938477, "global_step": 10346, "epoch": 85} {"train_loss": -23.039005279541016, "global_step": 10347, "epoch": 85} {"train_loss": -22.665674209594727, "global_step": 10348, "epoch": 85} {"train_loss": -23.840158462524414, "global_step": 10349, "epoch": 85} {"train_loss": -24.441007614135742, "global_step": 10350, "epoch": 85} {"train_loss": -24.65091323852539, "global_step": 10351, "epoch": 85} {"train_loss": -23.399158477783203, "global_step": 10352, "epoch": 85} {"train_loss": -24.615877151489258, "global_step": 10353, "epoch": 85} {"train_loss": -24.517011642456055, "global_step": 10354, "epoch": 85} {"train_loss": -23.174564361572266, "global_step": 10355, "epoch": 85} {"train_loss": -24.750394821166992, "global_step": 10356, "epoch": 85} {"train_loss": -23.41096305847168, "global_step": 10357, "epoch": 85} {"train_loss": -24.73415184020996, "global_step": 10358, "epoch": 85} {"train_loss": -24.330490112304688, "global_step": 10359, "epoch": 85} {"train_loss": -24.340011596679688, "global_step": 10360, "epoch": 85} {"train_loss": -24.40252685546875, "global_step": 10361, "epoch": 85} {"train_loss": -24.223278045654297, "global_step": 10362, "epoch": 85} {"train_loss": -23.412982940673828, "global_step": 10363, "epoch": 85} {"train_loss": -23.35248374938965, "global_step": 10364, "epoch": 85} {"train_loss": -23.072160720825195, "global_step": 10365, "epoch": 85} {"train_loss": -23.513660430908203, "global_step": 10366, "epoch": 85} {"train_loss": -23.360998153686523, "global_step": 10367, "epoch": 85} {"train_loss": -24.478620529174805, "global_step": 10368, "epoch": 85} {"train_loss": -24.1314640045166, "global_step": 10369, "epoch": 85} {"train_loss": -24.49106788635254, "global_step": 10370, "epoch": 85} {"train_loss": -24.046682357788086, "global_step": 10371, "epoch": 85} {"train_loss": -24.156448364257812, "global_step": 10372, "epoch": 85} {"train_loss": -24.53208351135254, "global_step": 10373, "epoch": 85} {"train_loss": -24.04707908630371, "global_step": 10374, "epoch": 85} {"train_loss": -24.351974487304688, "global_step": 10375, "epoch": 85} {"train_loss": -24.680322647094727, "global_step": 10376, "epoch": 85} {"train_loss": -24.57020378112793, "global_step": 10377, "epoch": 85} {"train_loss": -24.442195892333984, "global_step": 10378, "epoch": 85} {"train_loss": -23.622268676757812, "global_step": 10379, "epoch": 85} {"train_loss": -24.319660186767578, "global_step": 10380, "epoch": 85} {"train_loss": -24.616247177124023, "global_step": 10381, "epoch": 85} {"train_loss": -24.31064224243164, "global_step": 10382, "epoch": 85} {"train_loss": -24.735645294189453, "global_step": 10383, "epoch": 85} {"train_loss": -24.87505531311035, "global_step": 10384, "epoch": 85} {"train_loss": -24.885744094848633, "global_step": 10385, "epoch": 85} {"train_loss": -24.283998489379883, "global_step": 10386, "epoch": 85} {"train_loss": -24.896154403686523, "global_step": 10387, "epoch": 85} {"train_loss": -23.928817749023438, "global_step": 10388, "epoch": 85} {"train_loss": -24.756866455078125, "global_step": 10389, "epoch": 85} {"train_loss": -24.7823429107666, "global_step": 10390, "epoch": 85} {"train_loss": -24.453311920166016, "global_step": 10391, "epoch": 85} {"train_loss": -24.6787166595459, "global_step": 10392, "epoch": 85} {"train_loss": -24.731306076049805, "global_step": 10393, "epoch": 85} {"train_loss": -25.05470848083496, "global_step": 10394, "epoch": 85} {"train_loss": -24.847946166992188, "global_step": 10395, "epoch": 85} {"train_loss": -24.20829200744629, "global_step": 10396, "epoch": 85} {"train_loss": -24.555118560791016, "global_step": 10397, "epoch": 85} {"train_loss": -24.942527770996094, "global_step": 10398, "epoch": 85} {"train_loss": -24.669525146484375, "global_step": 10399, "epoch": 85} {"train_loss": -25.10519790649414, "global_step": 10400, "epoch": 85} {"train_loss": -24.443145751953125, "global_step": 10401, "epoch": 85} {"train_loss": -25.027528762817383, "global_step": 10402, "epoch": 85} {"train_loss": -23.991769790649414, "global_step": 10403, "epoch": 85} {"train_loss": -23.46945571899414, "global_step": 10404, "epoch": 85} {"train_loss": -24.29116408292912, "global_step": 10405, "epoch": 85, "val_loss": 2785873.0} {"train_loss": -24.34281349182129, "global_step": 10406, "epoch": 86} {"train_loss": -23.923538208007812, "global_step": 10407, "epoch": 86} {"train_loss": -24.515426635742188, "global_step": 10408, "epoch": 86} {"train_loss": -24.215404510498047, "global_step": 10409, "epoch": 86} {"train_loss": -23.858993530273438, "global_step": 10410, "epoch": 86} {"train_loss": -24.778268814086914, "global_step": 10411, "epoch": 86} {"train_loss": -24.445926666259766, "global_step": 10412, "epoch": 86} {"train_loss": -24.393945693969727, "global_step": 10413, "epoch": 86} {"train_loss": -25.037038803100586, "global_step": 10414, "epoch": 86} {"train_loss": -24.58376693725586, "global_step": 10415, "epoch": 86} {"train_loss": -25.09661102294922, "global_step": 10416, "epoch": 86} {"train_loss": -25.008941650390625, "global_step": 10417, "epoch": 86} {"train_loss": -24.81226921081543, "global_step": 10418, "epoch": 86} {"train_loss": -24.509817123413086, "global_step": 10419, "epoch": 86} {"train_loss": -24.977201461791992, "global_step": 10420, "epoch": 86} {"train_loss": -24.622058868408203, "global_step": 10421, "epoch": 86} {"train_loss": -25.17574119567871, "global_step": 10422, "epoch": 86} {"train_loss": -24.73309898376465, "global_step": 10423, "epoch": 86} {"train_loss": -25.30963134765625, "global_step": 10424, "epoch": 86} {"train_loss": -24.896039962768555, "global_step": 10425, "epoch": 86} {"train_loss": -25.30910301208496, "global_step": 10426, "epoch": 86} {"train_loss": -24.77813720703125, "global_step": 10427, "epoch": 86} {"train_loss": -24.79677963256836, "global_step": 10428, "epoch": 86} {"train_loss": -25.181238174438477, "global_step": 10429, "epoch": 86} {"train_loss": -24.10805320739746, "global_step": 10430, "epoch": 86} {"train_loss": -24.964763641357422, "global_step": 10431, "epoch": 86} {"train_loss": -24.971668243408203, "global_step": 10432, "epoch": 86} {"train_loss": -24.7432861328125, "global_step": 10433, "epoch": 86} {"train_loss": -24.881189346313477, "global_step": 10434, "epoch": 86} {"train_loss": -23.906347274780273, "global_step": 10435, "epoch": 86} {"train_loss": -22.228086471557617, "global_step": 10436, "epoch": 86} {"train_loss": -21.10856819152832, "global_step": 10437, "epoch": 86} {"train_loss": -19.15888023376465, "global_step": 10438, "epoch": 86} {"train_loss": -21.747283935546875, "global_step": 10439, "epoch": 86} {"train_loss": -24.94325065612793, "global_step": 10440, "epoch": 86} {"train_loss": -21.849950790405273, "global_step": 10441, "epoch": 86} {"train_loss": -23.34672737121582, "global_step": 10442, "epoch": 86} {"train_loss": -22.754384994506836, "global_step": 10443, "epoch": 86} {"train_loss": -22.509780883789062, "global_step": 10444, "epoch": 86} {"train_loss": -23.166654586791992, "global_step": 10445, "epoch": 86} {"train_loss": -24.415599822998047, "global_step": 10446, "epoch": 86} {"train_loss": -23.6946964263916, "global_step": 10447, "epoch": 86} {"train_loss": -23.762632369995117, "global_step": 10448, "epoch": 86} {"train_loss": -23.365070343017578, "global_step": 10449, "epoch": 86} {"train_loss": -24.58050537109375, "global_step": 10450, "epoch": 86} {"train_loss": -24.291208267211914, "global_step": 10451, "epoch": 86} {"train_loss": -24.22740936279297, "global_step": 10452, "epoch": 86} {"train_loss": -24.537811279296875, "global_step": 10453, "epoch": 86} {"train_loss": -23.974817276000977, "global_step": 10454, "epoch": 86} {"train_loss": -24.643606185913086, "global_step": 10455, "epoch": 86} {"train_loss": -24.565475463867188, "global_step": 10456, "epoch": 86} {"train_loss": -24.62155532836914, "global_step": 10457, "epoch": 86} {"train_loss": -24.128461837768555, "global_step": 10458, "epoch": 86} {"train_loss": -24.73831558227539, "global_step": 10459, "epoch": 86} {"train_loss": -24.199148178100586, "global_step": 10460, "epoch": 86} {"train_loss": -24.15232276916504, "global_step": 10461, "epoch": 86} {"train_loss": -24.627277374267578, "global_step": 10462, "epoch": 86} {"train_loss": -24.684101104736328, "global_step": 10463, "epoch": 86} {"train_loss": -24.548973083496094, "global_step": 10464, "epoch": 86} {"train_loss": -23.90730857849121, "global_step": 10465, "epoch": 86} {"train_loss": -24.67314910888672, "global_step": 10466, "epoch": 86} {"train_loss": -24.52089500427246, "global_step": 10467, "epoch": 86} {"train_loss": -24.331787109375, "global_step": 10468, "epoch": 86} {"train_loss": -24.544921875, "global_step": 10469, "epoch": 86} {"train_loss": -24.719486236572266, "global_step": 10470, "epoch": 86} {"train_loss": -24.85771942138672, "global_step": 10471, "epoch": 86} {"train_loss": -24.596385955810547, "global_step": 10472, "epoch": 86} {"train_loss": -25.036752700805664, "global_step": 10473, "epoch": 86} {"train_loss": -25.19251823425293, "global_step": 10474, "epoch": 86} {"train_loss": -24.685300827026367, "global_step": 10475, "epoch": 86} {"train_loss": -25.130008697509766, "global_step": 10476, "epoch": 86} {"train_loss": -24.63113784790039, "global_step": 10477, "epoch": 86} {"train_loss": -24.68813133239746, "global_step": 10478, "epoch": 86} {"train_loss": -24.787553787231445, "global_step": 10479, "epoch": 86} {"train_loss": -24.716238021850586, "global_step": 10480, "epoch": 86} {"train_loss": -24.701250076293945, "global_step": 10481, "epoch": 86} {"train_loss": -24.66648292541504, "global_step": 10482, "epoch": 86} {"train_loss": -24.55204963684082, "global_step": 10483, "epoch": 86} {"train_loss": -24.96439552307129, "global_step": 10484, "epoch": 86} {"train_loss": -23.903303146362305, "global_step": 10485, "epoch": 86} {"train_loss": -23.206640243530273, "global_step": 10486, "epoch": 86} {"train_loss": -24.26862144470215, "global_step": 10487, "epoch": 86} {"train_loss": -24.748958587646484, "global_step": 10488, "epoch": 86} {"train_loss": -24.426082611083984, "global_step": 10489, "epoch": 86} {"train_loss": -24.43172264099121, "global_step": 10490, "epoch": 86} {"train_loss": -24.65333366394043, "global_step": 10491, "epoch": 86} {"train_loss": -24.4057559967041, "global_step": 10492, "epoch": 86} {"train_loss": -23.84791374206543, "global_step": 10493, "epoch": 86} {"train_loss": -22.798269271850586, "global_step": 10494, "epoch": 86} {"train_loss": -24.328266143798828, "global_step": 10495, "epoch": 86} {"train_loss": -24.323408126831055, "global_step": 10496, "epoch": 86} {"train_loss": -21.79041862487793, "global_step": 10497, "epoch": 86} {"train_loss": -23.73981475830078, "global_step": 10498, "epoch": 86} {"train_loss": -24.040006637573242, "global_step": 10499, "epoch": 86} {"train_loss": -22.272022247314453, "global_step": 10500, "epoch": 86} {"train_loss": -24.38831901550293, "global_step": 10501, "epoch": 86} {"train_loss": -23.460325241088867, "global_step": 10502, "epoch": 86} {"train_loss": -24.1220703125, "global_step": 10503, "epoch": 86} {"train_loss": -23.3227596282959, "global_step": 10504, "epoch": 86} {"train_loss": -23.844409942626953, "global_step": 10505, "epoch": 86} {"train_loss": -23.731552124023438, "global_step": 10506, "epoch": 86} {"train_loss": -23.929609298706055, "global_step": 10507, "epoch": 86} {"train_loss": -24.082866668701172, "global_step": 10508, "epoch": 86} {"train_loss": -23.921152114868164, "global_step": 10509, "epoch": 86} {"train_loss": -23.729536056518555, "global_step": 10510, "epoch": 86} {"train_loss": -24.566986083984375, "global_step": 10511, "epoch": 86} {"train_loss": -23.686445236206055, "global_step": 10512, "epoch": 86} {"train_loss": -23.911046981811523, "global_step": 10513, "epoch": 86} {"train_loss": -24.547210693359375, "global_step": 10514, "epoch": 86} {"train_loss": -23.88787841796875, "global_step": 10515, "epoch": 86} {"train_loss": -24.27834129333496, "global_step": 10516, "epoch": 86} {"train_loss": -24.016876220703125, "global_step": 10517, "epoch": 86} {"train_loss": -23.6377010345459, "global_step": 10518, "epoch": 86} {"train_loss": -24.521615982055664, "global_step": 10519, "epoch": 86} {"train_loss": -23.810836791992188, "global_step": 10520, "epoch": 86} {"train_loss": -24.006977081298828, "global_step": 10521, "epoch": 86} {"train_loss": -24.092529296875, "global_step": 10522, "epoch": 86} {"train_loss": -23.62326431274414, "global_step": 10523, "epoch": 86} {"train_loss": -24.776090621948242, "global_step": 10524, "epoch": 86} {"train_loss": -24.696203231811523, "global_step": 10525, "epoch": 86} {"train_loss": -24.178444728378423, "global_step": 10526, "epoch": 86, "val_loss": 3279066.0} {"train_loss": -23.683887481689453, "global_step": 10527, "epoch": 87} {"train_loss": -24.048513412475586, "global_step": 10528, "epoch": 87} {"train_loss": -23.568689346313477, "global_step": 10529, "epoch": 87} {"train_loss": -23.246566772460938, "global_step": 10530, "epoch": 87} {"train_loss": -22.815994262695312, "global_step": 10531, "epoch": 87} {"train_loss": -22.848657608032227, "global_step": 10532, "epoch": 87} {"train_loss": -24.678821563720703, "global_step": 10533, "epoch": 87} {"train_loss": -23.932355880737305, "global_step": 10534, "epoch": 87} {"train_loss": -23.642688751220703, "global_step": 10535, "epoch": 87} {"train_loss": -23.02890396118164, "global_step": 10536, "epoch": 87} {"train_loss": -24.9163875579834, "global_step": 10537, "epoch": 87} {"train_loss": -23.962682723999023, "global_step": 10538, "epoch": 87} {"train_loss": -23.709810256958008, "global_step": 10539, "epoch": 87} {"train_loss": -23.84925651550293, "global_step": 10540, "epoch": 87} {"train_loss": -23.83346176147461, "global_step": 10541, "epoch": 87} {"train_loss": -24.18269157409668, "global_step": 10542, "epoch": 87} {"train_loss": -24.56559944152832, "global_step": 10543, "epoch": 87} {"train_loss": -24.616247177124023, "global_step": 10544, "epoch": 87} {"train_loss": -24.394107818603516, "global_step": 10545, "epoch": 87} {"train_loss": -24.783889770507812, "global_step": 10546, "epoch": 87} {"train_loss": -24.493244171142578, "global_step": 10547, "epoch": 87} {"train_loss": -24.18772315979004, "global_step": 10548, "epoch": 87} {"train_loss": -24.595739364624023, "global_step": 10549, "epoch": 87} {"train_loss": -24.233137130737305, "global_step": 10550, "epoch": 87} {"train_loss": -24.544469833374023, "global_step": 10551, "epoch": 87} {"train_loss": -24.54869270324707, "global_step": 10552, "epoch": 87} {"train_loss": -24.117780685424805, "global_step": 10553, "epoch": 87} {"train_loss": -25.145198822021484, "global_step": 10554, "epoch": 87} {"train_loss": -24.43669891357422, "global_step": 10555, "epoch": 87} {"train_loss": -24.834745407104492, "global_step": 10556, "epoch": 87} {"train_loss": -24.73807144165039, "global_step": 10557, "epoch": 87} {"train_loss": -24.895036697387695, "global_step": 10558, "epoch": 87} {"train_loss": -24.886289596557617, "global_step": 10559, "epoch": 87} {"train_loss": -24.857723236083984, "global_step": 10560, "epoch": 87} {"train_loss": -25.312936782836914, "global_step": 10561, "epoch": 87} {"train_loss": -25.09667205810547, "global_step": 10562, "epoch": 87} {"train_loss": -25.221115112304688, "global_step": 10563, "epoch": 87} {"train_loss": -25.324949264526367, "global_step": 10564, "epoch": 87} {"train_loss": -24.917661666870117, "global_step": 10565, "epoch": 87} {"train_loss": -24.980436325073242, "global_step": 10566, "epoch": 87} {"train_loss": -25.074514389038086, "global_step": 10567, "epoch": 87} {"train_loss": -24.84916114807129, "global_step": 10568, "epoch": 87} {"train_loss": -25.188722610473633, "global_step": 10569, "epoch": 87} {"train_loss": -25.017126083374023, "global_step": 10570, "epoch": 87} {"train_loss": -25.057775497436523, "global_step": 10571, "epoch": 87} {"train_loss": -25.12259292602539, "global_step": 10572, "epoch": 87} {"train_loss": -25.031740188598633, "global_step": 10573, "epoch": 87} {"train_loss": -24.89935874938965, "global_step": 10574, "epoch": 87} {"train_loss": -25.568206787109375, "global_step": 10575, "epoch": 87} {"train_loss": -25.42183494567871, "global_step": 10576, "epoch": 87} {"train_loss": -25.018274307250977, "global_step": 10577, "epoch": 87} {"train_loss": -25.379562377929688, "global_step": 10578, "epoch": 87} {"train_loss": -24.886356353759766, "global_step": 10579, "epoch": 87} {"train_loss": -25.283327102661133, "global_step": 10580, "epoch": 87} {"train_loss": -23.76527214050293, "global_step": 10581, "epoch": 87} {"train_loss": -20.967761993408203, "global_step": 10582, "epoch": 87} {"train_loss": -19.289457321166992, "global_step": 10583, "epoch": 87} {"train_loss": -22.544469833374023, "global_step": 10584, "epoch": 87} {"train_loss": -24.20368003845215, "global_step": 10585, "epoch": 87} {"train_loss": -21.568405151367188, "global_step": 10586, "epoch": 87} {"train_loss": -23.60226058959961, "global_step": 10587, "epoch": 87} {"train_loss": -23.66226577758789, "global_step": 10588, "epoch": 87} {"train_loss": -23.67111587524414, "global_step": 10589, "epoch": 87} {"train_loss": -23.99189567565918, "global_step": 10590, "epoch": 87} {"train_loss": -22.79210090637207, "global_step": 10591, "epoch": 87} {"train_loss": -24.605533599853516, "global_step": 10592, "epoch": 87} {"train_loss": -23.76691436767578, "global_step": 10593, "epoch": 87} {"train_loss": -24.76051902770996, "global_step": 10594, "epoch": 87} {"train_loss": -23.896499633789062, "global_step": 10595, "epoch": 87} {"train_loss": -24.79483985900879, "global_step": 10596, "epoch": 87} {"train_loss": -24.471141815185547, "global_step": 10597, "epoch": 87} {"train_loss": -24.14900016784668, "global_step": 10598, "epoch": 87} {"train_loss": -25.215147018432617, "global_step": 10599, "epoch": 87} {"train_loss": -24.718687057495117, "global_step": 10600, "epoch": 87} {"train_loss": -24.473691940307617, "global_step": 10601, "epoch": 87} {"train_loss": -24.3927059173584, "global_step": 10602, "epoch": 87} {"train_loss": -24.901229858398438, "global_step": 10603, "epoch": 87} {"train_loss": -24.527345657348633, "global_step": 10604, "epoch": 87} {"train_loss": -24.679622650146484, "global_step": 10605, "epoch": 87} {"train_loss": -24.365222930908203, "global_step": 10606, "epoch": 87} {"train_loss": -23.679670333862305, "global_step": 10607, "epoch": 87} {"train_loss": -24.007600784301758, "global_step": 10608, "epoch": 87} {"train_loss": -24.525693893432617, "global_step": 10609, "epoch": 87} {"train_loss": -23.979053497314453, "global_step": 10610, "epoch": 87} {"train_loss": -24.360876083374023, "global_step": 10611, "epoch": 87} {"train_loss": -25.37714195251465, "global_step": 10612, "epoch": 87} {"train_loss": -24.170141220092773, "global_step": 10613, "epoch": 87} {"train_loss": -24.06077003479004, "global_step": 10614, "epoch": 87} {"train_loss": -24.990415573120117, "global_step": 10615, "epoch": 87} {"train_loss": -24.235980987548828, "global_step": 10616, "epoch": 87} {"train_loss": -24.405303955078125, "global_step": 10617, "epoch": 87} {"train_loss": -24.51048469543457, "global_step": 10618, "epoch": 87} {"train_loss": -24.400964736938477, "global_step": 10619, "epoch": 87} {"train_loss": -25.376916885375977, "global_step": 10620, "epoch": 87} {"train_loss": -24.59765625, "global_step": 10621, "epoch": 87} {"train_loss": -24.973264694213867, "global_step": 10622, "epoch": 87} {"train_loss": -24.781015396118164, "global_step": 10623, "epoch": 87} {"train_loss": -25.184627532958984, "global_step": 10624, "epoch": 87} {"train_loss": -24.69947624206543, "global_step": 10625, "epoch": 87} {"train_loss": -24.976720809936523, "global_step": 10626, "epoch": 87} {"train_loss": -24.58906364440918, "global_step": 10627, "epoch": 87} {"train_loss": -25.151517868041992, "global_step": 10628, "epoch": 87} {"train_loss": -24.4106502532959, "global_step": 10629, "epoch": 87} {"train_loss": -24.789798736572266, "global_step": 10630, "epoch": 87} {"train_loss": -24.906599044799805, "global_step": 10631, "epoch": 87} {"train_loss": -24.218839645385742, "global_step": 10632, "epoch": 87} {"train_loss": -24.570585250854492, "global_step": 10633, "epoch": 87} {"train_loss": -24.14566421508789, "global_step": 10634, "epoch": 87} {"train_loss": -24.12745475769043, "global_step": 10635, "epoch": 87} {"train_loss": -24.62544059753418, "global_step": 10636, "epoch": 87} {"train_loss": -24.423818588256836, "global_step": 10637, "epoch": 87} {"train_loss": -24.51466178894043, "global_step": 10638, "epoch": 87} {"train_loss": -24.516611099243164, "global_step": 10639, "epoch": 87} {"train_loss": -24.147119522094727, "global_step": 10640, "epoch": 87} {"train_loss": -25.248306274414062, "global_step": 10641, "epoch": 87} {"train_loss": -24.793991088867188, "global_step": 10642, "epoch": 87} {"train_loss": -24.36308479309082, "global_step": 10643, "epoch": 87} {"train_loss": -23.896364212036133, "global_step": 10644, "epoch": 87} {"train_loss": -24.074064254760742, "global_step": 10645, "epoch": 87} {"train_loss": -25.002090454101562, "global_step": 10646, "epoch": 87} {"train_loss": -24.368449833767475, "global_step": 10647, "epoch": 87, "val_loss": 2885012.75} {"train_loss": -23.544069290161133, "global_step": 10648, "epoch": 88} {"train_loss": -24.15188980102539, "global_step": 10649, "epoch": 88} {"train_loss": -23.24136734008789, "global_step": 10650, "epoch": 88} {"train_loss": -24.90597152709961, "global_step": 10651, "epoch": 88} {"train_loss": -23.288862228393555, "global_step": 10652, "epoch": 88} {"train_loss": -24.796987533569336, "global_step": 10653, "epoch": 88} {"train_loss": -24.351917266845703, "global_step": 10654, "epoch": 88} {"train_loss": -24.9025936126709, "global_step": 10655, "epoch": 88} {"train_loss": -24.506412506103516, "global_step": 10656, "epoch": 88} {"train_loss": -24.068492889404297, "global_step": 10657, "epoch": 88} {"train_loss": -24.550552368164062, "global_step": 10658, "epoch": 88} {"train_loss": -24.286108016967773, "global_step": 10659, "epoch": 88} {"train_loss": -24.703153610229492, "global_step": 10660, "epoch": 88} {"train_loss": -24.35093116760254, "global_step": 10661, "epoch": 88} {"train_loss": -24.962278366088867, "global_step": 10662, "epoch": 88} {"train_loss": -24.7889461517334, "global_step": 10663, "epoch": 88} {"train_loss": -24.875215530395508, "global_step": 10664, "epoch": 88} {"train_loss": -24.707950592041016, "global_step": 10665, "epoch": 88} {"train_loss": -24.894607543945312, "global_step": 10666, "epoch": 88} {"train_loss": -24.887598037719727, "global_step": 10667, "epoch": 88} {"train_loss": -24.352554321289062, "global_step": 10668, "epoch": 88} {"train_loss": -24.909128189086914, "global_step": 10669, "epoch": 88} {"train_loss": -24.136316299438477, "global_step": 10670, "epoch": 88} {"train_loss": -24.437297821044922, "global_step": 10671, "epoch": 88} {"train_loss": -24.9899845123291, "global_step": 10672, "epoch": 88} {"train_loss": -24.788991928100586, "global_step": 10673, "epoch": 88} {"train_loss": -24.731184005737305, "global_step": 10674, "epoch": 88} {"train_loss": -24.680252075195312, "global_step": 10675, "epoch": 88} {"train_loss": -25.38711929321289, "global_step": 10676, "epoch": 88} {"train_loss": -25.26472282409668, "global_step": 10677, "epoch": 88} {"train_loss": -24.24031639099121, "global_step": 10678, "epoch": 88} {"train_loss": -25.072742462158203, "global_step": 10679, "epoch": 88} {"train_loss": -24.636978149414062, "global_step": 10680, "epoch": 88} {"train_loss": -25.1887149810791, "global_step": 10681, "epoch": 88} {"train_loss": -25.14344596862793, "global_step": 10682, "epoch": 88} {"train_loss": -24.80417251586914, "global_step": 10683, "epoch": 88} {"train_loss": -25.349777221679688, "global_step": 10684, "epoch": 88} {"train_loss": -25.464269638061523, "global_step": 10685, "epoch": 88} {"train_loss": -24.893651962280273, "global_step": 10686, "epoch": 88} {"train_loss": -23.617979049682617, "global_step": 10687, "epoch": 88} {"train_loss": -22.93609619140625, "global_step": 10688, "epoch": 88} {"train_loss": -23.505369186401367, "global_step": 10689, "epoch": 88} {"train_loss": -21.773801803588867, "global_step": 10690, "epoch": 88} {"train_loss": -23.14792251586914, "global_step": 10691, "epoch": 88} {"train_loss": -23.9175968170166, "global_step": 10692, "epoch": 88} {"train_loss": -22.343915939331055, "global_step": 10693, "epoch": 88} {"train_loss": -24.11269187927246, "global_step": 10694, "epoch": 88} {"train_loss": -23.235315322875977, "global_step": 10695, "epoch": 88} {"train_loss": -23.658573150634766, "global_step": 10696, "epoch": 88} {"train_loss": -22.48457145690918, "global_step": 10697, "epoch": 88} {"train_loss": -21.622243881225586, "global_step": 10698, "epoch": 88} {"train_loss": -22.2070369720459, "global_step": 10699, "epoch": 88} {"train_loss": -24.391218185424805, "global_step": 10700, "epoch": 88} {"train_loss": -22.94462013244629, "global_step": 10701, "epoch": 88} {"train_loss": -22.507164001464844, "global_step": 10702, "epoch": 88} {"train_loss": -23.940420150756836, "global_step": 10703, "epoch": 88} {"train_loss": -23.7493953704834, "global_step": 10704, "epoch": 88} {"train_loss": -23.812225341796875, "global_step": 10705, "epoch": 88} {"train_loss": -23.90523338317871, "global_step": 10706, "epoch": 88} {"train_loss": -23.7501220703125, "global_step": 10707, "epoch": 88} {"train_loss": -24.690996170043945, "global_step": 10708, "epoch": 88} {"train_loss": -24.3460693359375, "global_step": 10709, "epoch": 88} {"train_loss": -24.137399673461914, "global_step": 10710, "epoch": 88} {"train_loss": -24.24570083618164, "global_step": 10711, "epoch": 88} {"train_loss": -24.68953514099121, "global_step": 10712, "epoch": 88} {"train_loss": -24.251874923706055, "global_step": 10713, "epoch": 88} {"train_loss": -24.47314453125, "global_step": 10714, "epoch": 88} {"train_loss": -24.385868072509766, "global_step": 10715, "epoch": 88} {"train_loss": -24.150968551635742, "global_step": 10716, "epoch": 88} {"train_loss": -24.590051651000977, "global_step": 10717, "epoch": 88} {"train_loss": -24.505165100097656, "global_step": 10718, "epoch": 88} {"train_loss": -24.5452938079834, "global_step": 10719, "epoch": 88} {"train_loss": -24.452396392822266, "global_step": 10720, "epoch": 88} {"train_loss": -24.76955223083496, "global_step": 10721, "epoch": 88} {"train_loss": -24.884519577026367, "global_step": 10722, "epoch": 88} {"train_loss": -24.782094955444336, "global_step": 10723, "epoch": 88} {"train_loss": -24.65765380859375, "global_step": 10724, "epoch": 88} {"train_loss": -24.77283477783203, "global_step": 10725, "epoch": 88} {"train_loss": -24.84613609313965, "global_step": 10726, "epoch": 88} {"train_loss": -25.10896110534668, "global_step": 10727, "epoch": 88} {"train_loss": -25.05240821838379, "global_step": 10728, "epoch": 88} {"train_loss": -25.272916793823242, "global_step": 10729, "epoch": 88} {"train_loss": -25.079832077026367, "global_step": 10730, "epoch": 88} {"train_loss": -25.258935928344727, "global_step": 10731, "epoch": 88} {"train_loss": -25.440170288085938, "global_step": 10732, "epoch": 88} {"train_loss": -25.494916915893555, "global_step": 10733, "epoch": 88} {"train_loss": -24.978174209594727, "global_step": 10734, "epoch": 88} {"train_loss": -25.119827270507812, "global_step": 10735, "epoch": 88} {"train_loss": -25.0129337310791, "global_step": 10736, "epoch": 88} {"train_loss": -24.684810638427734, "global_step": 10737, "epoch": 88} {"train_loss": -24.283267974853516, "global_step": 10738, "epoch": 88} {"train_loss": -24.356672286987305, "global_step": 10739, "epoch": 88} {"train_loss": -24.57964324951172, "global_step": 10740, "epoch": 88} {"train_loss": -23.838064193725586, "global_step": 10741, "epoch": 88} {"train_loss": -23.835603713989258, "global_step": 10742, "epoch": 88} {"train_loss": -23.99420738220215, "global_step": 10743, "epoch": 88} {"train_loss": -24.8919734954834, "global_step": 10744, "epoch": 88} {"train_loss": -23.71868324279785, "global_step": 10745, "epoch": 88} {"train_loss": -23.131547927856445, "global_step": 10746, "epoch": 88} {"train_loss": -25.182153701782227, "global_step": 10747, "epoch": 88} {"train_loss": -24.479066848754883, "global_step": 10748, "epoch": 88} {"train_loss": -22.369144439697266, "global_step": 10749, "epoch": 88} {"train_loss": -24.598405838012695, "global_step": 10750, "epoch": 88} {"train_loss": -24.904830932617188, "global_step": 10751, "epoch": 88} {"train_loss": -24.264976501464844, "global_step": 10752, "epoch": 88} {"train_loss": -24.961759567260742, "global_step": 10753, "epoch": 88} {"train_loss": -24.407562255859375, "global_step": 10754, "epoch": 88} {"train_loss": -25.095745086669922, "global_step": 10755, "epoch": 88} {"train_loss": -24.31740379333496, "global_step": 10756, "epoch": 88} {"train_loss": -25.02823257446289, "global_step": 10757, "epoch": 88} {"train_loss": -24.312585830688477, "global_step": 10758, "epoch": 88} {"train_loss": -25.004663467407227, "global_step": 10759, "epoch": 88} {"train_loss": -24.594411849975586, "global_step": 10760, "epoch": 88} {"train_loss": -25.08794593811035, "global_step": 10761, "epoch": 88} {"train_loss": -24.080636978149414, "global_step": 10762, "epoch": 88} {"train_loss": -24.571523666381836, "global_step": 10763, "epoch": 88} {"train_loss": -24.798175811767578, "global_step": 10764, "epoch": 88} {"train_loss": -24.285871505737305, "global_step": 10765, "epoch": 88} {"train_loss": -25.34981346130371, "global_step": 10766, "epoch": 88} {"train_loss": -24.7397518157959, "global_step": 10767, "epoch": 88} {"train_loss": -24.36295785194586, "global_step": 10768, "epoch": 88, "val_loss": 2583582.0} {"train_loss": -22.975317001342773, "global_step": 10769, "epoch": 89} {"train_loss": -22.03737449645996, "global_step": 10770, "epoch": 89} {"train_loss": -20.834121704101562, "global_step": 10771, "epoch": 89} {"train_loss": -21.505859375, "global_step": 10772, "epoch": 89} {"train_loss": -23.109256744384766, "global_step": 10773, "epoch": 89} {"train_loss": -23.136335372924805, "global_step": 10774, "epoch": 89} {"train_loss": -23.41607093811035, "global_step": 10775, "epoch": 89} {"train_loss": -23.350828170776367, "global_step": 10776, "epoch": 89} {"train_loss": -23.18766212463379, "global_step": 10777, "epoch": 89} {"train_loss": -23.299259185791016, "global_step": 10778, "epoch": 89} {"train_loss": -24.506710052490234, "global_step": 10779, "epoch": 89} {"train_loss": -23.689077377319336, "global_step": 10780, "epoch": 89} {"train_loss": -23.515060424804688, "global_step": 10781, "epoch": 89} {"train_loss": -24.170011520385742, "global_step": 10782, "epoch": 89} {"train_loss": -23.382986068725586, "global_step": 10783, "epoch": 89} {"train_loss": -23.55962562561035, "global_step": 10784, "epoch": 89} {"train_loss": -24.226228713989258, "global_step": 10785, "epoch": 89} {"train_loss": -23.9130916595459, "global_step": 10786, "epoch": 89} {"train_loss": -24.40597915649414, "global_step": 10787, "epoch": 89} {"train_loss": -23.827993392944336, "global_step": 10788, "epoch": 89} {"train_loss": -24.440561294555664, "global_step": 10789, "epoch": 89} {"train_loss": -24.342187881469727, "global_step": 10790, "epoch": 89} {"train_loss": -24.5540714263916, "global_step": 10791, "epoch": 89} {"train_loss": -24.712736129760742, "global_step": 10792, "epoch": 89} {"train_loss": -24.454076766967773, "global_step": 10793, "epoch": 89} {"train_loss": -24.246801376342773, "global_step": 10794, "epoch": 89} {"train_loss": -24.649810791015625, "global_step": 10795, "epoch": 89} {"train_loss": -24.423215866088867, "global_step": 10796, "epoch": 89} {"train_loss": -24.436437606811523, "global_step": 10797, "epoch": 89} {"train_loss": -24.699935913085938, "global_step": 10798, "epoch": 89} {"train_loss": -24.40738296508789, "global_step": 10799, "epoch": 89} {"train_loss": -24.696552276611328, "global_step": 10800, "epoch": 89} {"train_loss": -24.83234214782715, "global_step": 10801, "epoch": 89} {"train_loss": -24.54978370666504, "global_step": 10802, "epoch": 89} {"train_loss": -24.616918563842773, "global_step": 10803, "epoch": 89} {"train_loss": -24.94333267211914, "global_step": 10804, "epoch": 89} {"train_loss": -24.614606857299805, "global_step": 10805, "epoch": 89} {"train_loss": -24.956287384033203, "global_step": 10806, "epoch": 89} {"train_loss": -25.01012420654297, "global_step": 10807, "epoch": 89} {"train_loss": -24.602108001708984, "global_step": 10808, "epoch": 89} {"train_loss": -24.397924423217773, "global_step": 10809, "epoch": 89} {"train_loss": -24.993850708007812, "global_step": 10810, "epoch": 89} {"train_loss": -25.00371742248535, "global_step": 10811, "epoch": 89} {"train_loss": -24.78891372680664, "global_step": 10812, "epoch": 89} {"train_loss": -25.149585723876953, "global_step": 10813, "epoch": 89} {"train_loss": -24.89120864868164, "global_step": 10814, "epoch": 89} {"train_loss": -25.171363830566406, "global_step": 10815, "epoch": 89} {"train_loss": -24.984445571899414, "global_step": 10816, "epoch": 89} {"train_loss": -25.240915298461914, "global_step": 10817, "epoch": 89} {"train_loss": -24.786340713500977, "global_step": 10818, "epoch": 89} {"train_loss": -24.848907470703125, "global_step": 10819, "epoch": 89} {"train_loss": -25.121137619018555, "global_step": 10820, "epoch": 89} {"train_loss": -24.984331130981445, "global_step": 10821, "epoch": 89} {"train_loss": -25.356111526489258, "global_step": 10822, "epoch": 89} {"train_loss": -25.037250518798828, "global_step": 10823, "epoch": 89} {"train_loss": -24.71230125427246, "global_step": 10824, "epoch": 89} {"train_loss": -24.937381744384766, "global_step": 10825, "epoch": 89} {"train_loss": -25.15709686279297, "global_step": 10826, "epoch": 89} {"train_loss": -24.858118057250977, "global_step": 10827, "epoch": 89} {"train_loss": -25.49241065979004, "global_step": 10828, "epoch": 89} {"train_loss": -24.692996978759766, "global_step": 10829, "epoch": 89} {"train_loss": -25.15827751159668, "global_step": 10830, "epoch": 89} {"train_loss": -25.202009201049805, "global_step": 10831, "epoch": 89} {"train_loss": -24.716861724853516, "global_step": 10832, "epoch": 89} {"train_loss": -24.542909622192383, "global_step": 10833, "epoch": 89} {"train_loss": -25.8386173248291, "global_step": 10834, "epoch": 89} {"train_loss": -25.209388732910156, "global_step": 10835, "epoch": 89} {"train_loss": -25.16839599609375, "global_step": 10836, "epoch": 89} {"train_loss": -24.88850975036621, "global_step": 10837, "epoch": 89} {"train_loss": -25.06702995300293, "global_step": 10838, "epoch": 89} {"train_loss": -25.25370979309082, "global_step": 10839, "epoch": 89} {"train_loss": -24.967554092407227, "global_step": 10840, "epoch": 89} {"train_loss": -24.7064266204834, "global_step": 10841, "epoch": 89} {"train_loss": -24.726726531982422, "global_step": 10842, "epoch": 89} {"train_loss": -24.6926212310791, "global_step": 10843, "epoch": 89} {"train_loss": -24.070003509521484, "global_step": 10844, "epoch": 89} {"train_loss": -23.800621032714844, "global_step": 10845, "epoch": 89} {"train_loss": -25.282794952392578, "global_step": 10846, "epoch": 89} {"train_loss": -23.967260360717773, "global_step": 10847, "epoch": 89} {"train_loss": -22.625436782836914, "global_step": 10848, "epoch": 89} {"train_loss": -20.86659049987793, "global_step": 10849, "epoch": 89} {"train_loss": -24.537368774414062, "global_step": 10850, "epoch": 89} {"train_loss": -24.305761337280273, "global_step": 10851, "epoch": 89} {"train_loss": -21.055404663085938, "global_step": 10852, "epoch": 89} {"train_loss": -23.654857635498047, "global_step": 10853, "epoch": 89} {"train_loss": -23.588653564453125, "global_step": 10854, "epoch": 89} {"train_loss": -24.4439754486084, "global_step": 10855, "epoch": 89} {"train_loss": -24.35797691345215, "global_step": 10856, "epoch": 89} {"train_loss": -25.026565551757812, "global_step": 10857, "epoch": 89} {"train_loss": -24.084558486938477, "global_step": 10858, "epoch": 89} {"train_loss": -24.631122589111328, "global_step": 10859, "epoch": 89} {"train_loss": -24.246353149414062, "global_step": 10860, "epoch": 89} {"train_loss": -24.705341339111328, "global_step": 10861, "epoch": 89} {"train_loss": -23.671772003173828, "global_step": 10862, "epoch": 89} {"train_loss": -23.487661361694336, "global_step": 10863, "epoch": 89} {"train_loss": -22.5067081451416, "global_step": 10864, "epoch": 89} {"train_loss": -21.489755630493164, "global_step": 10865, "epoch": 89} {"train_loss": -22.0883731842041, "global_step": 10866, "epoch": 89} {"train_loss": -23.7287654876709, "global_step": 10867, "epoch": 89} {"train_loss": -23.603487014770508, "global_step": 10868, "epoch": 89} {"train_loss": -22.96731948852539, "global_step": 10869, "epoch": 89} {"train_loss": -24.86789894104004, "global_step": 10870, "epoch": 89} {"train_loss": -23.048053741455078, "global_step": 10871, "epoch": 89} {"train_loss": -24.60750389099121, "global_step": 10872, "epoch": 89} {"train_loss": -23.68345832824707, "global_step": 10873, "epoch": 89} {"train_loss": -24.09897232055664, "global_step": 10874, "epoch": 89} {"train_loss": -23.818323135375977, "global_step": 10875, "epoch": 89} {"train_loss": -24.61952781677246, "global_step": 10876, "epoch": 89} {"train_loss": -24.56016731262207, "global_step": 10877, "epoch": 89} {"train_loss": -24.43619155883789, "global_step": 10878, "epoch": 89} {"train_loss": -24.444034576416016, "global_step": 10879, "epoch": 89} {"train_loss": -24.545949935913086, "global_step": 10880, "epoch": 89} {"train_loss": -24.696212768554688, "global_step": 10881, "epoch": 89} {"train_loss": -24.65348243713379, "global_step": 10882, "epoch": 89} {"train_loss": -24.833486557006836, "global_step": 10883, "epoch": 89} {"train_loss": -24.713468551635742, "global_step": 10884, "epoch": 89} {"train_loss": -24.64301300048828, "global_step": 10885, "epoch": 89} {"train_loss": -24.9698429107666, "global_step": 10886, "epoch": 89} {"train_loss": -24.736160278320312, "global_step": 10887, "epoch": 89} {"train_loss": -24.860151290893555, "global_step": 10888, "epoch": 89} {"train_loss": -24.259379741574122, "global_step": 10889, "epoch": 89, "val_loss": 2495233.0} {"train_loss": -24.879104614257812, "global_step": 10890, "epoch": 90} {"train_loss": -25.096105575561523, "global_step": 10891, "epoch": 90} {"train_loss": -24.803302764892578, "global_step": 10892, "epoch": 90} {"train_loss": -25.3218994140625, "global_step": 10893, "epoch": 90} {"train_loss": -24.763553619384766, "global_step": 10894, "epoch": 90} {"train_loss": -25.555171966552734, "global_step": 10895, "epoch": 90} {"train_loss": -25.10404396057129, "global_step": 10896, "epoch": 90} {"train_loss": -25.159067153930664, "global_step": 10897, "epoch": 90} {"train_loss": -25.03822135925293, "global_step": 10898, "epoch": 90} {"train_loss": -25.341230392456055, "global_step": 10899, "epoch": 90} {"train_loss": -25.217580795288086, "global_step": 10900, "epoch": 90} {"train_loss": -25.17873191833496, "global_step": 10901, "epoch": 90} {"train_loss": -24.8577880859375, "global_step": 10902, "epoch": 90} {"train_loss": -24.711645126342773, "global_step": 10903, "epoch": 90} {"train_loss": -24.82564926147461, "global_step": 10904, "epoch": 90} {"train_loss": -25.0957088470459, "global_step": 10905, "epoch": 90} {"train_loss": -25.412015914916992, "global_step": 10906, "epoch": 90} {"train_loss": -25.099557876586914, "global_step": 10907, "epoch": 90} {"train_loss": -24.889768600463867, "global_step": 10908, "epoch": 90} {"train_loss": -25.17300033569336, "global_step": 10909, "epoch": 90} {"train_loss": -25.662464141845703, "global_step": 10910, "epoch": 90} {"train_loss": -25.407419204711914, "global_step": 10911, "epoch": 90} {"train_loss": -25.4417781829834, "global_step": 10912, "epoch": 90} {"train_loss": -25.06540870666504, "global_step": 10913, "epoch": 90} {"train_loss": -25.459089279174805, "global_step": 10914, "epoch": 90} {"train_loss": -24.710105895996094, "global_step": 10915, "epoch": 90} {"train_loss": -25.267427444458008, "global_step": 10916, "epoch": 90} {"train_loss": -25.332639694213867, "global_step": 10917, "epoch": 90} {"train_loss": -25.19913101196289, "global_step": 10918, "epoch": 90} {"train_loss": -25.422119140625, "global_step": 10919, "epoch": 90} {"train_loss": -25.251590728759766, "global_step": 10920, "epoch": 90} {"train_loss": -24.633438110351562, "global_step": 10921, "epoch": 90} {"train_loss": -24.87007713317871, "global_step": 10922, "epoch": 90} {"train_loss": -23.56488037109375, "global_step": 10923, "epoch": 90} {"train_loss": -24.741064071655273, "global_step": 10924, "epoch": 90} {"train_loss": -25.08782958984375, "global_step": 10925, "epoch": 90} {"train_loss": -25.53010368347168, "global_step": 10926, "epoch": 90} {"train_loss": -24.76123046875, "global_step": 10927, "epoch": 90} {"train_loss": -24.995573043823242, "global_step": 10928, "epoch": 90} {"train_loss": -24.431936264038086, "global_step": 10929, "epoch": 90} {"train_loss": -24.82322120666504, "global_step": 10930, "epoch": 90} {"train_loss": -23.5843563079834, "global_step": 10931, "epoch": 90} {"train_loss": -25.204269409179688, "global_step": 10932, "epoch": 90} {"train_loss": -23.86762046813965, "global_step": 10933, "epoch": 90} {"train_loss": -23.875478744506836, "global_step": 10934, "epoch": 90} {"train_loss": -23.5789794921875, "global_step": 10935, "epoch": 90} {"train_loss": -23.647192001342773, "global_step": 10936, "epoch": 90} {"train_loss": -22.924991607666016, "global_step": 10937, "epoch": 90} {"train_loss": -24.43020248413086, "global_step": 10938, "epoch": 90} {"train_loss": -23.721479415893555, "global_step": 10939, "epoch": 90} {"train_loss": -23.551908493041992, "global_step": 10940, "epoch": 90} {"train_loss": -24.481138229370117, "global_step": 10941, "epoch": 90} {"train_loss": -24.596240997314453, "global_step": 10942, "epoch": 90} {"train_loss": -23.21534538269043, "global_step": 10943, "epoch": 90} {"train_loss": -23.63373374938965, "global_step": 10944, "epoch": 90} {"train_loss": -24.690982818603516, "global_step": 10945, "epoch": 90} {"train_loss": -24.51467514038086, "global_step": 10946, "epoch": 90} {"train_loss": -22.72720718383789, "global_step": 10947, "epoch": 90} {"train_loss": -24.52435302734375, "global_step": 10948, "epoch": 90} {"train_loss": -24.07219886779785, "global_step": 10949, "epoch": 90} {"train_loss": -24.006332397460938, "global_step": 10950, "epoch": 90} {"train_loss": -24.56157684326172, "global_step": 10951, "epoch": 90} {"train_loss": -24.546003341674805, "global_step": 10952, "epoch": 90} {"train_loss": -24.28157615661621, "global_step": 10953, "epoch": 90} {"train_loss": -24.430789947509766, "global_step": 10954, "epoch": 90} {"train_loss": -24.495237350463867, "global_step": 10955, "epoch": 90} {"train_loss": -24.718048095703125, "global_step": 10956, "epoch": 90} {"train_loss": -24.564882278442383, "global_step": 10957, "epoch": 90} {"train_loss": -24.735960006713867, "global_step": 10958, "epoch": 90} {"train_loss": -24.264816284179688, "global_step": 10959, "epoch": 90} {"train_loss": -24.949628829956055, "global_step": 10960, "epoch": 90} {"train_loss": -24.297605514526367, "global_step": 10961, "epoch": 90} {"train_loss": -24.85369300842285, "global_step": 10962, "epoch": 90} {"train_loss": -24.317543029785156, "global_step": 10963, "epoch": 90} {"train_loss": -24.896507263183594, "global_step": 10964, "epoch": 90} {"train_loss": -24.282236099243164, "global_step": 10965, "epoch": 90} {"train_loss": -24.18733024597168, "global_step": 10966, "epoch": 90} {"train_loss": -24.637075424194336, "global_step": 10967, "epoch": 90} {"train_loss": -24.921466827392578, "global_step": 10968, "epoch": 90} {"train_loss": -24.93935203552246, "global_step": 10969, "epoch": 90} {"train_loss": -24.722219467163086, "global_step": 10970, "epoch": 90} {"train_loss": -24.96390724182129, "global_step": 10971, "epoch": 90} {"train_loss": -24.356897354125977, "global_step": 10972, "epoch": 90} {"train_loss": -23.552200317382812, "global_step": 10973, "epoch": 90} {"train_loss": -24.844318389892578, "global_step": 10974, "epoch": 90} {"train_loss": -24.204254150390625, "global_step": 10975, "epoch": 90} {"train_loss": -24.449739456176758, "global_step": 10976, "epoch": 90} {"train_loss": -24.815473556518555, "global_step": 10977, "epoch": 90} {"train_loss": -23.970218658447266, "global_step": 10978, "epoch": 90} {"train_loss": -24.660322189331055, "global_step": 10979, "epoch": 90} {"train_loss": -24.118013381958008, "global_step": 10980, "epoch": 90} {"train_loss": -24.77541160583496, "global_step": 10981, "epoch": 90} {"train_loss": -25.166391372680664, "global_step": 10982, "epoch": 90} {"train_loss": -25.060678482055664, "global_step": 10983, "epoch": 90} {"train_loss": -25.11861228942871, "global_step": 10984, "epoch": 90} {"train_loss": -25.188684463500977, "global_step": 10985, "epoch": 90} {"train_loss": -25.283384323120117, "global_step": 10986, "epoch": 90} {"train_loss": -25.19844627380371, "global_step": 10987, "epoch": 90} {"train_loss": -24.52374839782715, "global_step": 10988, "epoch": 90} {"train_loss": -24.128337860107422, "global_step": 10989, "epoch": 90} {"train_loss": -24.542755126953125, "global_step": 10990, "epoch": 90} {"train_loss": -22.947744369506836, "global_step": 10991, "epoch": 90} {"train_loss": -25.314762115478516, "global_step": 10992, "epoch": 90} {"train_loss": -22.6267147064209, "global_step": 10993, "epoch": 90} {"train_loss": -24.305818557739258, "global_step": 10994, "epoch": 90} {"train_loss": -23.799442291259766, "global_step": 10995, "epoch": 90} {"train_loss": -24.607175827026367, "global_step": 10996, "epoch": 90} {"train_loss": -24.40007972717285, "global_step": 10997, "epoch": 90} {"train_loss": -23.796672821044922, "global_step": 10998, "epoch": 90} {"train_loss": -23.9436092376709, "global_step": 10999, "epoch": 90} {"train_loss": -25.07925796508789, "global_step": 11000, "epoch": 90} {"train_loss": -24.654129028320312, "global_step": 11001, "epoch": 90} {"train_loss": -24.9343318939209, "global_step": 11002, "epoch": 90} {"train_loss": -25.11048698425293, "global_step": 11003, "epoch": 90} {"train_loss": -24.94829559326172, "global_step": 11004, "epoch": 90} {"train_loss": -24.96330451965332, "global_step": 11005, "epoch": 90} {"train_loss": -24.9821720123291, "global_step": 11006, "epoch": 90} {"train_loss": -25.223133087158203, "global_step": 11007, "epoch": 90} {"train_loss": -24.91220474243164, "global_step": 11008, "epoch": 90} {"train_loss": -24.626089096069336, "global_step": 11009, "epoch": 90} {"train_loss": -24.63547630940587, "global_step": 11010, "epoch": 90, "val_loss": 2562774.0} {"train_loss": -25.29709815979004, "global_step": 11011, "epoch": 91} {"train_loss": -25.210681915283203, "global_step": 11012, "epoch": 91} {"train_loss": -25.481204986572266, "global_step": 11013, "epoch": 91} {"train_loss": -25.237438201904297, "global_step": 11014, "epoch": 91} {"train_loss": -24.828786849975586, "global_step": 11015, "epoch": 91} {"train_loss": -24.436676025390625, "global_step": 11016, "epoch": 91} {"train_loss": -25.105615615844727, "global_step": 11017, "epoch": 91} {"train_loss": -24.862619400024414, "global_step": 11018, "epoch": 91} {"train_loss": -25.138803482055664, "global_step": 11019, "epoch": 91} {"train_loss": -24.954627990722656, "global_step": 11020, "epoch": 91} {"train_loss": -24.981067657470703, "global_step": 11021, "epoch": 91} {"train_loss": -25.238773345947266, "global_step": 11022, "epoch": 91} {"train_loss": -25.10580825805664, "global_step": 11023, "epoch": 91} {"train_loss": -24.744688034057617, "global_step": 11024, "epoch": 91} {"train_loss": -25.581785202026367, "global_step": 11025, "epoch": 91} {"train_loss": -25.520706176757812, "global_step": 11026, "epoch": 91} {"train_loss": -25.890594482421875, "global_step": 11027, "epoch": 91} {"train_loss": -25.28143310546875, "global_step": 11028, "epoch": 91} {"train_loss": -24.913570404052734, "global_step": 11029, "epoch": 91} {"train_loss": -25.353944778442383, "global_step": 11030, "epoch": 91} {"train_loss": -25.036853790283203, "global_step": 11031, "epoch": 91} {"train_loss": -25.215696334838867, "global_step": 11032, "epoch": 91} {"train_loss": -25.621362686157227, "global_step": 11033, "epoch": 91} {"train_loss": -25.26393699645996, "global_step": 11034, "epoch": 91} {"train_loss": -24.17129898071289, "global_step": 11035, "epoch": 91} {"train_loss": -23.209089279174805, "global_step": 11036, "epoch": 91} {"train_loss": -23.100692749023438, "global_step": 11037, "epoch": 91} {"train_loss": -23.622255325317383, "global_step": 11038, "epoch": 91} {"train_loss": -24.49846649169922, "global_step": 11039, "epoch": 91} {"train_loss": -24.42365074157715, "global_step": 11040, "epoch": 91} {"train_loss": -25.250261306762695, "global_step": 11041, "epoch": 91} {"train_loss": -24.804719924926758, "global_step": 11042, "epoch": 91} {"train_loss": -24.116107940673828, "global_step": 11043, "epoch": 91} {"train_loss": -25.33479881286621, "global_step": 11044, "epoch": 91} {"train_loss": -24.10944175720215, "global_step": 11045, "epoch": 91} {"train_loss": -22.76169204711914, "global_step": 11046, "epoch": 91} {"train_loss": -24.303754806518555, "global_step": 11047, "epoch": 91} {"train_loss": -23.350744247436523, "global_step": 11048, "epoch": 91} {"train_loss": -23.114572525024414, "global_step": 11049, "epoch": 91} {"train_loss": -23.96255874633789, "global_step": 11050, "epoch": 91} {"train_loss": -23.70578956604004, "global_step": 11051, "epoch": 91} {"train_loss": -24.056543350219727, "global_step": 11052, "epoch": 91} {"train_loss": -24.584314346313477, "global_step": 11053, "epoch": 91} {"train_loss": -24.118223190307617, "global_step": 11054, "epoch": 91} {"train_loss": -24.298913955688477, "global_step": 11055, "epoch": 91} {"train_loss": -24.5032901763916, "global_step": 11056, "epoch": 91} {"train_loss": -24.259418487548828, "global_step": 11057, "epoch": 91} {"train_loss": -24.66707420349121, "global_step": 11058, "epoch": 91} {"train_loss": -23.480966567993164, "global_step": 11059, "epoch": 91} {"train_loss": -25.039278030395508, "global_step": 11060, "epoch": 91} {"train_loss": -24.70834732055664, "global_step": 11061, "epoch": 91} {"train_loss": -25.072799682617188, "global_step": 11062, "epoch": 91} {"train_loss": -24.76392936706543, "global_step": 11063, "epoch": 91} {"train_loss": -24.72599220275879, "global_step": 11064, "epoch": 91} {"train_loss": -24.369543075561523, "global_step": 11065, "epoch": 91} {"train_loss": -25.197484970092773, "global_step": 11066, "epoch": 91} {"train_loss": -24.65521812438965, "global_step": 11067, "epoch": 91} {"train_loss": -25.40171241760254, "global_step": 11068, "epoch": 91} {"train_loss": -25.017789840698242, "global_step": 11069, "epoch": 91} {"train_loss": -25.061994552612305, "global_step": 11070, "epoch": 91} {"train_loss": -25.04957389831543, "global_step": 11071, "epoch": 91} {"train_loss": -25.1010799407959, "global_step": 11072, "epoch": 91} {"train_loss": -25.11060905456543, "global_step": 11073, "epoch": 91} {"train_loss": -24.782150268554688, "global_step": 11074, "epoch": 91} {"train_loss": -25.189037322998047, "global_step": 11075, "epoch": 91} {"train_loss": -23.854190826416016, "global_step": 11076, "epoch": 91} {"train_loss": -21.570255279541016, "global_step": 11077, "epoch": 91} {"train_loss": -18.054914474487305, "global_step": 11078, "epoch": 91} {"train_loss": -17.5992374420166, "global_step": 11079, "epoch": 91} {"train_loss": -25.06050682067871, "global_step": 11080, "epoch": 91} {"train_loss": -20.33756446838379, "global_step": 11081, "epoch": 91} {"train_loss": -22.860740661621094, "global_step": 11082, "epoch": 91} {"train_loss": -22.414962768554688, "global_step": 11083, "epoch": 91} {"train_loss": -24.349042892456055, "global_step": 11084, "epoch": 91} {"train_loss": -22.511621475219727, "global_step": 11085, "epoch": 91} {"train_loss": -24.2659912109375, "global_step": 11086, "epoch": 91} {"train_loss": -24.465139389038086, "global_step": 11087, "epoch": 91} {"train_loss": -23.962690353393555, "global_step": 11088, "epoch": 91} {"train_loss": -23.55550765991211, "global_step": 11089, "epoch": 91} {"train_loss": -24.308332443237305, "global_step": 11090, "epoch": 91} {"train_loss": -24.583885192871094, "global_step": 11091, "epoch": 91} {"train_loss": -23.9534854888916, "global_step": 11092, "epoch": 91} {"train_loss": -24.024829864501953, "global_step": 11093, "epoch": 91} {"train_loss": -24.264814376831055, "global_step": 11094, "epoch": 91} {"train_loss": -24.4404239654541, "global_step": 11095, "epoch": 91} {"train_loss": -24.52466583251953, "global_step": 11096, "epoch": 91} {"train_loss": -24.6785888671875, "global_step": 11097, "epoch": 91} {"train_loss": -24.308942794799805, "global_step": 11098, "epoch": 91} {"train_loss": -24.172826766967773, "global_step": 11099, "epoch": 91} {"train_loss": -24.521514892578125, "global_step": 11100, "epoch": 91} {"train_loss": -24.502368927001953, "global_step": 11101, "epoch": 91} {"train_loss": -24.757915496826172, "global_step": 11102, "epoch": 91} {"train_loss": -24.587631225585938, "global_step": 11103, "epoch": 91} {"train_loss": -24.41621971130371, "global_step": 11104, "epoch": 91} {"train_loss": -24.40182876586914, "global_step": 11105, "epoch": 91} {"train_loss": -24.75473403930664, "global_step": 11106, "epoch": 91} {"train_loss": -24.322385787963867, "global_step": 11107, "epoch": 91} {"train_loss": -24.169633865356445, "global_step": 11108, "epoch": 91} {"train_loss": -24.575056076049805, "global_step": 11109, "epoch": 91} {"train_loss": -24.82007598876953, "global_step": 11110, "epoch": 91} {"train_loss": -24.509397506713867, "global_step": 11111, "epoch": 91} {"train_loss": -23.992719650268555, "global_step": 11112, "epoch": 91} {"train_loss": -23.87909507751465, "global_step": 11113, "epoch": 91} {"train_loss": -23.89765739440918, "global_step": 11114, "epoch": 91} {"train_loss": -24.34870719909668, "global_step": 11115, "epoch": 91} {"train_loss": -24.587934494018555, "global_step": 11116, "epoch": 91} {"train_loss": -24.328439712524414, "global_step": 11117, "epoch": 91} {"train_loss": -24.79975700378418, "global_step": 11118, "epoch": 91} {"train_loss": -24.564964294433594, "global_step": 11119, "epoch": 91} {"train_loss": -23.298673629760742, "global_step": 11120, "epoch": 91} {"train_loss": -23.030696868896484, "global_step": 11121, "epoch": 91} {"train_loss": -24.299610137939453, "global_step": 11122, "epoch": 91} {"train_loss": -24.673065185546875, "global_step": 11123, "epoch": 91} {"train_loss": -23.729658126831055, "global_step": 11124, "epoch": 91} {"train_loss": -21.74240493774414, "global_step": 11125, "epoch": 91} {"train_loss": -19.781911849975586, "global_step": 11126, "epoch": 91} {"train_loss": -23.086515426635742, "global_step": 11127, "epoch": 91} {"train_loss": -24.702667236328125, "global_step": 11128, "epoch": 91} {"train_loss": -22.986955642700195, "global_step": 11129, "epoch": 91} {"train_loss": -23.654518127441406, "global_step": 11130, "epoch": 91} {"train_loss": -24.224729411858174, "global_step": 11131, "epoch": 91, "val_loss": 2696314.75} {"train_loss": -24.293920516967773, "global_step": 11132, "epoch": 92} {"train_loss": -24.211761474609375, "global_step": 11133, "epoch": 92} {"train_loss": -24.242483139038086, "global_step": 11134, "epoch": 92} {"train_loss": -24.255239486694336, "global_step": 11135, "epoch": 92} {"train_loss": -24.79791259765625, "global_step": 11136, "epoch": 92} {"train_loss": -23.790813446044922, "global_step": 11137, "epoch": 92} {"train_loss": -24.689374923706055, "global_step": 11138, "epoch": 92} {"train_loss": -24.442703247070312, "global_step": 11139, "epoch": 92} {"train_loss": -24.38858413696289, "global_step": 11140, "epoch": 92} {"train_loss": -24.8403377532959, "global_step": 11141, "epoch": 92} {"train_loss": -24.068023681640625, "global_step": 11142, "epoch": 92} {"train_loss": -25.081321716308594, "global_step": 11143, "epoch": 92} {"train_loss": -24.391523361206055, "global_step": 11144, "epoch": 92} {"train_loss": -24.445375442504883, "global_step": 11145, "epoch": 92} {"train_loss": -24.544879913330078, "global_step": 11146, "epoch": 92} {"train_loss": -24.541311264038086, "global_step": 11147, "epoch": 92} {"train_loss": -24.51549530029297, "global_step": 11148, "epoch": 92} {"train_loss": -24.75974464416504, "global_step": 11149, "epoch": 92} {"train_loss": -24.889942169189453, "global_step": 11150, "epoch": 92} {"train_loss": -24.72759437561035, "global_step": 11151, "epoch": 92} {"train_loss": -24.88237190246582, "global_step": 11152, "epoch": 92} {"train_loss": -24.43228530883789, "global_step": 11153, "epoch": 92} {"train_loss": -25.200546264648438, "global_step": 11154, "epoch": 92} {"train_loss": -25.030136108398438, "global_step": 11155, "epoch": 92} {"train_loss": -25.1448974609375, "global_step": 11156, "epoch": 92} {"train_loss": -25.05042839050293, "global_step": 11157, "epoch": 92} {"train_loss": -24.912717819213867, "global_step": 11158, "epoch": 92} {"train_loss": -25.191986083984375, "global_step": 11159, "epoch": 92} {"train_loss": -25.450117111206055, "global_step": 11160, "epoch": 92} {"train_loss": -24.84563446044922, "global_step": 11161, "epoch": 92} {"train_loss": -25.263883590698242, "global_step": 11162, "epoch": 92} {"train_loss": -25.110143661499023, "global_step": 11163, "epoch": 92} {"train_loss": -25.27486801147461, "global_step": 11164, "epoch": 92} {"train_loss": -25.396875381469727, "global_step": 11165, "epoch": 92} {"train_loss": -24.719141006469727, "global_step": 11166, "epoch": 92} {"train_loss": -25.505470275878906, "global_step": 11167, "epoch": 92} {"train_loss": -25.327844619750977, "global_step": 11168, "epoch": 92} {"train_loss": -25.097496032714844, "global_step": 11169, "epoch": 92} {"train_loss": -25.00235366821289, "global_step": 11170, "epoch": 92} {"train_loss": -24.800756454467773, "global_step": 11171, "epoch": 92} {"train_loss": -25.188404083251953, "global_step": 11172, "epoch": 92} {"train_loss": -25.319019317626953, "global_step": 11173, "epoch": 92} {"train_loss": -25.033716201782227, "global_step": 11174, "epoch": 92} {"train_loss": -24.840391159057617, "global_step": 11175, "epoch": 92} {"train_loss": -24.206714630126953, "global_step": 11176, "epoch": 92} {"train_loss": -23.96185302734375, "global_step": 11177, "epoch": 92} {"train_loss": -23.753496170043945, "global_step": 11178, "epoch": 92} {"train_loss": -23.23381233215332, "global_step": 11179, "epoch": 92} {"train_loss": -22.189044952392578, "global_step": 11180, "epoch": 92} {"train_loss": -24.47547721862793, "global_step": 11181, "epoch": 92} {"train_loss": -24.129472732543945, "global_step": 11182, "epoch": 92} {"train_loss": -23.945261001586914, "global_step": 11183, "epoch": 92} {"train_loss": -25.027881622314453, "global_step": 11184, "epoch": 92} {"train_loss": -25.187963485717773, "global_step": 11185, "epoch": 92} {"train_loss": -24.714618682861328, "global_step": 11186, "epoch": 92} {"train_loss": -24.5139217376709, "global_step": 11187, "epoch": 92} {"train_loss": -24.533740997314453, "global_step": 11188, "epoch": 92} {"train_loss": -25.303871154785156, "global_step": 11189, "epoch": 92} {"train_loss": -24.790573120117188, "global_step": 11190, "epoch": 92} {"train_loss": -25.057531356811523, "global_step": 11191, "epoch": 92} {"train_loss": -25.146291732788086, "global_step": 11192, "epoch": 92} {"train_loss": -24.74479103088379, "global_step": 11193, "epoch": 92} {"train_loss": -24.905975341796875, "global_step": 11194, "epoch": 92} {"train_loss": -25.315465927124023, "global_step": 11195, "epoch": 92} {"train_loss": -24.999366760253906, "global_step": 11196, "epoch": 92} {"train_loss": -25.19561767578125, "global_step": 11197, "epoch": 92} {"train_loss": -25.32389259338379, "global_step": 11198, "epoch": 92} {"train_loss": -25.247100830078125, "global_step": 11199, "epoch": 92} {"train_loss": -24.773496627807617, "global_step": 11200, "epoch": 92} {"train_loss": -25.217838287353516, "global_step": 11201, "epoch": 92} {"train_loss": -25.041793823242188, "global_step": 11202, "epoch": 92} {"train_loss": -24.85627555847168, "global_step": 11203, "epoch": 92} {"train_loss": -24.971176147460938, "global_step": 11204, "epoch": 92} {"train_loss": -24.119449615478516, "global_step": 11205, "epoch": 92} {"train_loss": -25.430328369140625, "global_step": 11206, "epoch": 92} {"train_loss": -24.645761489868164, "global_step": 11207, "epoch": 92} {"train_loss": -24.618669509887695, "global_step": 11208, "epoch": 92} {"train_loss": -25.36244010925293, "global_step": 11209, "epoch": 92} {"train_loss": -24.743581771850586, "global_step": 11210, "epoch": 92} {"train_loss": -25.013626098632812, "global_step": 11211, "epoch": 92} {"train_loss": -24.82307243347168, "global_step": 11212, "epoch": 92} {"train_loss": -25.331546783447266, "global_step": 11213, "epoch": 92} {"train_loss": -24.817575454711914, "global_step": 11214, "epoch": 92} {"train_loss": -25.226903915405273, "global_step": 11215, "epoch": 92} {"train_loss": -24.687562942504883, "global_step": 11216, "epoch": 92} {"train_loss": -24.015125274658203, "global_step": 11217, "epoch": 92} {"train_loss": -22.423675537109375, "global_step": 11218, "epoch": 92} {"train_loss": -18.57301139831543, "global_step": 11219, "epoch": 92} {"train_loss": -17.991470336914062, "global_step": 11220, "epoch": 92} {"train_loss": -25.072784423828125, "global_step": 11221, "epoch": 92} {"train_loss": -21.993467330932617, "global_step": 11222, "epoch": 92} {"train_loss": -24.597707748413086, "global_step": 11223, "epoch": 92} {"train_loss": -23.323545455932617, "global_step": 11224, "epoch": 92} {"train_loss": -24.952239990234375, "global_step": 11225, "epoch": 92} {"train_loss": -23.27042007446289, "global_step": 11226, "epoch": 92} {"train_loss": -24.55061912536621, "global_step": 11227, "epoch": 92} {"train_loss": -25.006139755249023, "global_step": 11228, "epoch": 92} {"train_loss": -24.050275802612305, "global_step": 11229, "epoch": 92} {"train_loss": -24.855911254882812, "global_step": 11230, "epoch": 92} {"train_loss": -24.88909912109375, "global_step": 11231, "epoch": 92} {"train_loss": -24.915912628173828, "global_step": 11232, "epoch": 92} {"train_loss": -24.81882667541504, "global_step": 11233, "epoch": 92} {"train_loss": -24.659635543823242, "global_step": 11234, "epoch": 92} {"train_loss": -24.611021041870117, "global_step": 11235, "epoch": 92} {"train_loss": -24.353927612304688, "global_step": 11236, "epoch": 92} {"train_loss": -24.67630386352539, "global_step": 11237, "epoch": 92} {"train_loss": -24.211841583251953, "global_step": 11238, "epoch": 92} {"train_loss": -24.176931381225586, "global_step": 11239, "epoch": 92} {"train_loss": -24.397525787353516, "global_step": 11240, "epoch": 92} {"train_loss": -24.6285343170166, "global_step": 11241, "epoch": 92} {"train_loss": -24.824935913085938, "global_step": 11242, "epoch": 92} {"train_loss": -24.991580963134766, "global_step": 11243, "epoch": 92} {"train_loss": -24.20619773864746, "global_step": 11244, "epoch": 92} {"train_loss": -24.514549255371094, "global_step": 11245, "epoch": 92} {"train_loss": -24.98240089416504, "global_step": 11246, "epoch": 92} {"train_loss": -24.993619918823242, "global_step": 11247, "epoch": 92} {"train_loss": -24.80299186706543, "global_step": 11248, "epoch": 92} {"train_loss": -25.309812545776367, "global_step": 11249, "epoch": 92} {"train_loss": -24.683889389038086, "global_step": 11250, "epoch": 92} {"train_loss": -23.10689353942871, "global_step": 11251, "epoch": 92} {"train_loss": -24.511131207805036, "global_step": 11252, "epoch": 92, "val_loss": 3104196.0} {"train_loss": -16.07193374633789, "global_step": 11253, "epoch": 93} {"train_loss": -21.549787521362305, "global_step": 11254, "epoch": 93} {"train_loss": -22.622087478637695, "global_step": 11255, "epoch": 93} {"train_loss": -24.338048934936523, "global_step": 11256, "epoch": 93} {"train_loss": -22.178775787353516, "global_step": 11257, "epoch": 93} {"train_loss": -23.999298095703125, "global_step": 11258, "epoch": 93} {"train_loss": -23.02713966369629, "global_step": 11259, "epoch": 93} {"train_loss": -23.78964614868164, "global_step": 11260, "epoch": 93} {"train_loss": -24.00131607055664, "global_step": 11261, "epoch": 93} {"train_loss": -23.484344482421875, "global_step": 11262, "epoch": 93} {"train_loss": -24.071277618408203, "global_step": 11263, "epoch": 93} {"train_loss": -24.258344650268555, "global_step": 11264, "epoch": 93} {"train_loss": -23.944965362548828, "global_step": 11265, "epoch": 93} {"train_loss": -24.294008255004883, "global_step": 11266, "epoch": 93} {"train_loss": -24.3625431060791, "global_step": 11267, "epoch": 93} {"train_loss": -24.039112091064453, "global_step": 11268, "epoch": 93} {"train_loss": -24.170209884643555, "global_step": 11269, "epoch": 93} {"train_loss": -24.193212509155273, "global_step": 11270, "epoch": 93} {"train_loss": -23.938932418823242, "global_step": 11271, "epoch": 93} {"train_loss": -24.378225326538086, "global_step": 11272, "epoch": 93} {"train_loss": -24.431564331054688, "global_step": 11273, "epoch": 93} {"train_loss": -24.178085327148438, "global_step": 11274, "epoch": 93} {"train_loss": -24.266904830932617, "global_step": 11275, "epoch": 93} {"train_loss": -24.266416549682617, "global_step": 11276, "epoch": 93} {"train_loss": -24.585834503173828, "global_step": 11277, "epoch": 93} {"train_loss": -23.835548400878906, "global_step": 11278, "epoch": 93} {"train_loss": -24.37233543395996, "global_step": 11279, "epoch": 93} {"train_loss": -23.909940719604492, "global_step": 11280, "epoch": 93} {"train_loss": -24.815380096435547, "global_step": 11281, "epoch": 93} {"train_loss": -24.550260543823242, "global_step": 11282, "epoch": 93} {"train_loss": -24.70065689086914, "global_step": 11283, "epoch": 93} {"train_loss": -24.865520477294922, "global_step": 11284, "epoch": 93} {"train_loss": -24.669300079345703, "global_step": 11285, "epoch": 93} {"train_loss": -24.433460235595703, "global_step": 11286, "epoch": 93} {"train_loss": -24.83595085144043, "global_step": 11287, "epoch": 93} {"train_loss": -24.709253311157227, "global_step": 11288, "epoch": 93} {"train_loss": -24.614137649536133, "global_step": 11289, "epoch": 93} {"train_loss": -24.48622703552246, "global_step": 11290, "epoch": 93} {"train_loss": -24.186986923217773, "global_step": 11291, "epoch": 93} {"train_loss": -23.863861083984375, "global_step": 11292, "epoch": 93} {"train_loss": -23.50501251220703, "global_step": 11293, "epoch": 93} {"train_loss": -22.581026077270508, "global_step": 11294, "epoch": 93} {"train_loss": -19.754758834838867, "global_step": 11295, "epoch": 93} {"train_loss": -19.32960319519043, "global_step": 11296, "epoch": 93} {"train_loss": -23.734907150268555, "global_step": 11297, "epoch": 93} {"train_loss": -24.479602813720703, "global_step": 11298, "epoch": 93} {"train_loss": -23.617313385009766, "global_step": 11299, "epoch": 93} {"train_loss": -24.4962158203125, "global_step": 11300, "epoch": 93} {"train_loss": -23.86000633239746, "global_step": 11301, "epoch": 93} {"train_loss": -24.323429107666016, "global_step": 11302, "epoch": 93} {"train_loss": -24.405506134033203, "global_step": 11303, "epoch": 93} {"train_loss": -24.107507705688477, "global_step": 11304, "epoch": 93} {"train_loss": -24.826393127441406, "global_step": 11305, "epoch": 93} {"train_loss": -24.01922035217285, "global_step": 11306, "epoch": 93} {"train_loss": -24.072168350219727, "global_step": 11307, "epoch": 93} {"train_loss": -24.726343154907227, "global_step": 11308, "epoch": 93} {"train_loss": -24.024166107177734, "global_step": 11309, "epoch": 93} {"train_loss": -24.33296012878418, "global_step": 11310, "epoch": 93} {"train_loss": -24.96424102783203, "global_step": 11311, "epoch": 93} {"train_loss": -24.829349517822266, "global_step": 11312, "epoch": 93} {"train_loss": -24.693830490112305, "global_step": 11313, "epoch": 93} {"train_loss": -24.708084106445312, "global_step": 11314, "epoch": 93} {"train_loss": -24.68017578125, "global_step": 11315, "epoch": 93} {"train_loss": -24.84852409362793, "global_step": 11316, "epoch": 93} {"train_loss": -24.458017349243164, "global_step": 11317, "epoch": 93} {"train_loss": -25.222919464111328, "global_step": 11318, "epoch": 93} {"train_loss": -25.08138656616211, "global_step": 11319, "epoch": 93} {"train_loss": -24.687219619750977, "global_step": 11320, "epoch": 93} {"train_loss": -25.063905715942383, "global_step": 11321, "epoch": 93} {"train_loss": -24.236804962158203, "global_step": 11322, "epoch": 93} {"train_loss": -24.810489654541016, "global_step": 11323, "epoch": 93} {"train_loss": -24.555755615234375, "global_step": 11324, "epoch": 93} {"train_loss": -25.460893630981445, "global_step": 11325, "epoch": 93} {"train_loss": -25.057161331176758, "global_step": 11326, "epoch": 93} {"train_loss": -25.1364803314209, "global_step": 11327, "epoch": 93} {"train_loss": -25.205106735229492, "global_step": 11328, "epoch": 93} {"train_loss": -25.226215362548828, "global_step": 11329, "epoch": 93} {"train_loss": -25.43323516845703, "global_step": 11330, "epoch": 93} {"train_loss": -25.48761558532715, "global_step": 11331, "epoch": 93} {"train_loss": -25.285587310791016, "global_step": 11332, "epoch": 93} {"train_loss": -25.36101722717285, "global_step": 11333, "epoch": 93} {"train_loss": -25.580663681030273, "global_step": 11334, "epoch": 93} {"train_loss": -25.3713321685791, "global_step": 11335, "epoch": 93} {"train_loss": -25.366281509399414, "global_step": 11336, "epoch": 93} {"train_loss": -25.19927406311035, "global_step": 11337, "epoch": 93} {"train_loss": -25.114887237548828, "global_step": 11338, "epoch": 93} {"train_loss": -25.629308700561523, "global_step": 11339, "epoch": 93} {"train_loss": -25.30962562561035, "global_step": 11340, "epoch": 93} {"train_loss": -25.328187942504883, "global_step": 11341, "epoch": 93} {"train_loss": -25.299589157104492, "global_step": 11342, "epoch": 93} {"train_loss": -25.508209228515625, "global_step": 11343, "epoch": 93} {"train_loss": -25.41922378540039, "global_step": 11344, "epoch": 93} {"train_loss": -25.28584098815918, "global_step": 11345, "epoch": 93} {"train_loss": -24.411354064941406, "global_step": 11346, "epoch": 93} {"train_loss": -22.90993309020996, "global_step": 11347, "epoch": 93} {"train_loss": -21.71329116821289, "global_step": 11348, "epoch": 93} {"train_loss": -18.79420280456543, "global_step": 11349, "epoch": 93} {"train_loss": -19.31178092956543, "global_step": 11350, "epoch": 93} {"train_loss": -23.98702049255371, "global_step": 11351, "epoch": 93} {"train_loss": -23.150495529174805, "global_step": 11352, "epoch": 93} {"train_loss": -23.341476440429688, "global_step": 11353, "epoch": 93} {"train_loss": -23.729591369628906, "global_step": 11354, "epoch": 93} {"train_loss": -24.633590698242188, "global_step": 11355, "epoch": 93} {"train_loss": -24.02387809753418, "global_step": 11356, "epoch": 93} {"train_loss": -25.01783561706543, "global_step": 11357, "epoch": 93} {"train_loss": -24.31174087524414, "global_step": 11358, "epoch": 93} {"train_loss": -24.49129295349121, "global_step": 11359, "epoch": 93} {"train_loss": -24.713348388671875, "global_step": 11360, "epoch": 93} {"train_loss": -24.035776138305664, "global_step": 11361, "epoch": 93} {"train_loss": -24.284393310546875, "global_step": 11362, "epoch": 93} {"train_loss": -24.832674026489258, "global_step": 11363, "epoch": 93} {"train_loss": -24.633865356445312, "global_step": 11364, "epoch": 93} {"train_loss": -24.355222702026367, "global_step": 11365, "epoch": 93} {"train_loss": -24.792604446411133, "global_step": 11366, "epoch": 93} {"train_loss": -25.14218521118164, "global_step": 11367, "epoch": 93} {"train_loss": -24.912527084350586, "global_step": 11368, "epoch": 93} {"train_loss": -24.930870056152344, "global_step": 11369, "epoch": 93} {"train_loss": -24.767520904541016, "global_step": 11370, "epoch": 93} {"train_loss": -24.61806869506836, "global_step": 11371, "epoch": 93} {"train_loss": -25.068378448486328, "global_step": 11372, "epoch": 93} {"train_loss": -24.195822156165256, "global_step": 11373, "epoch": 93, "val_loss": 2523526.0} {"train_loss": -24.637210845947266, "global_step": 11374, "epoch": 94} {"train_loss": -25.108976364135742, "global_step": 11375, "epoch": 94} {"train_loss": -24.910486221313477, "global_step": 11376, "epoch": 94} {"train_loss": -25.17629051208496, "global_step": 11377, "epoch": 94} {"train_loss": -25.279088973999023, "global_step": 11378, "epoch": 94} {"train_loss": -24.624710083007812, "global_step": 11379, "epoch": 94} {"train_loss": -24.8764591217041, "global_step": 11380, "epoch": 94} {"train_loss": -25.339323043823242, "global_step": 11381, "epoch": 94} {"train_loss": -25.164533615112305, "global_step": 11382, "epoch": 94} {"train_loss": -25.103839874267578, "global_step": 11383, "epoch": 94} {"train_loss": -25.090473175048828, "global_step": 11384, "epoch": 94} {"train_loss": -25.27303123474121, "global_step": 11385, "epoch": 94} {"train_loss": -25.119861602783203, "global_step": 11386, "epoch": 94} {"train_loss": -25.092601776123047, "global_step": 11387, "epoch": 94} {"train_loss": -25.054187774658203, "global_step": 11388, "epoch": 94} {"train_loss": -25.399620056152344, "global_step": 11389, "epoch": 94} {"train_loss": -25.23171043395996, "global_step": 11390, "epoch": 94} {"train_loss": -25.487878799438477, "global_step": 11391, "epoch": 94} {"train_loss": -25.253835678100586, "global_step": 11392, "epoch": 94} {"train_loss": -25.101226806640625, "global_step": 11393, "epoch": 94} {"train_loss": -25.588058471679688, "global_step": 11394, "epoch": 94} {"train_loss": -24.709409713745117, "global_step": 11395, "epoch": 94} {"train_loss": -23.630462646484375, "global_step": 11396, "epoch": 94} {"train_loss": -24.64479637145996, "global_step": 11397, "epoch": 94} {"train_loss": -23.952167510986328, "global_step": 11398, "epoch": 94} {"train_loss": -24.57916831970215, "global_step": 11399, "epoch": 94} {"train_loss": -23.59891128540039, "global_step": 11400, "epoch": 94} {"train_loss": -24.95888328552246, "global_step": 11401, "epoch": 94} {"train_loss": -24.82026481628418, "global_step": 11402, "epoch": 94} {"train_loss": -23.868871688842773, "global_step": 11403, "epoch": 94} {"train_loss": -25.310388565063477, "global_step": 11404, "epoch": 94} {"train_loss": -23.6893367767334, "global_step": 11405, "epoch": 94} {"train_loss": -23.380876541137695, "global_step": 11406, "epoch": 94} {"train_loss": -22.4122314453125, "global_step": 11407, "epoch": 94} {"train_loss": -21.216922760009766, "global_step": 11408, "epoch": 94} {"train_loss": -22.256244659423828, "global_step": 11409, "epoch": 94} {"train_loss": -24.621082305908203, "global_step": 11410, "epoch": 94} {"train_loss": -23.810232162475586, "global_step": 11411, "epoch": 94} {"train_loss": -23.315937042236328, "global_step": 11412, "epoch": 94} {"train_loss": -24.508808135986328, "global_step": 11413, "epoch": 94} {"train_loss": -23.083829879760742, "global_step": 11414, "epoch": 94} {"train_loss": -24.932077407836914, "global_step": 11415, "epoch": 94} {"train_loss": -23.942222595214844, "global_step": 11416, "epoch": 94} {"train_loss": -24.711441040039062, "global_step": 11417, "epoch": 94} {"train_loss": -23.85835075378418, "global_step": 11418, "epoch": 94} {"train_loss": -24.26862907409668, "global_step": 11419, "epoch": 94} {"train_loss": -23.980920791625977, "global_step": 11420, "epoch": 94} {"train_loss": -24.54791259765625, "global_step": 11421, "epoch": 94} {"train_loss": -24.66013526916504, "global_step": 11422, "epoch": 94} {"train_loss": -24.433082580566406, "global_step": 11423, "epoch": 94} {"train_loss": -23.904193878173828, "global_step": 11424, "epoch": 94} {"train_loss": -24.772724151611328, "global_step": 11425, "epoch": 94} {"train_loss": -23.947256088256836, "global_step": 11426, "epoch": 94} {"train_loss": -24.53706169128418, "global_step": 11427, "epoch": 94} {"train_loss": -24.980924606323242, "global_step": 11428, "epoch": 94} {"train_loss": -24.906614303588867, "global_step": 11429, "epoch": 94} {"train_loss": -24.750898361206055, "global_step": 11430, "epoch": 94} {"train_loss": -24.0009708404541, "global_step": 11431, "epoch": 94} {"train_loss": -24.908170700073242, "global_step": 11432, "epoch": 94} {"train_loss": -24.45066261291504, "global_step": 11433, "epoch": 94} {"train_loss": -25.28928565979004, "global_step": 11434, "epoch": 94} {"train_loss": -24.73185920715332, "global_step": 11435, "epoch": 94} {"train_loss": -25.16419792175293, "global_step": 11436, "epoch": 94} {"train_loss": -24.806745529174805, "global_step": 11437, "epoch": 94} {"train_loss": -25.303491592407227, "global_step": 11438, "epoch": 94} {"train_loss": -24.937631607055664, "global_step": 11439, "epoch": 94} {"train_loss": -25.378982543945312, "global_step": 11440, "epoch": 94} {"train_loss": -25.296377182006836, "global_step": 11441, "epoch": 94} {"train_loss": -25.49937629699707, "global_step": 11442, "epoch": 94} {"train_loss": -24.94991111755371, "global_step": 11443, "epoch": 94} {"train_loss": -25.087814331054688, "global_step": 11444, "epoch": 94} {"train_loss": -25.414031982421875, "global_step": 11445, "epoch": 94} {"train_loss": -25.336647033691406, "global_step": 11446, "epoch": 94} {"train_loss": -24.52897071838379, "global_step": 11447, "epoch": 94} {"train_loss": -25.329870223999023, "global_step": 11448, "epoch": 94} {"train_loss": -25.635412216186523, "global_step": 11449, "epoch": 94} {"train_loss": -25.44179344177246, "global_step": 11450, "epoch": 94} {"train_loss": -25.46554946899414, "global_step": 11451, "epoch": 94} {"train_loss": -25.09938621520996, "global_step": 11452, "epoch": 94} {"train_loss": -25.344711303710938, "global_step": 11453, "epoch": 94} {"train_loss": -25.536231994628906, "global_step": 11454, "epoch": 94} {"train_loss": -25.309797286987305, "global_step": 11455, "epoch": 94} {"train_loss": -25.606725692749023, "global_step": 11456, "epoch": 94} {"train_loss": -25.647550582885742, "global_step": 11457, "epoch": 94} {"train_loss": -25.879257202148438, "global_step": 11458, "epoch": 94} {"train_loss": -25.483739852905273, "global_step": 11459, "epoch": 94} {"train_loss": -25.62261962890625, "global_step": 11460, "epoch": 94} {"train_loss": -25.599409103393555, "global_step": 11461, "epoch": 94} {"train_loss": -25.75775146484375, "global_step": 11462, "epoch": 94} {"train_loss": -25.914276123046875, "global_step": 11463, "epoch": 94} {"train_loss": -25.837512969970703, "global_step": 11464, "epoch": 94} {"train_loss": -25.608427047729492, "global_step": 11465, "epoch": 94} {"train_loss": -25.591230392456055, "global_step": 11466, "epoch": 94} {"train_loss": -25.159454345703125, "global_step": 11467, "epoch": 94} {"train_loss": -24.99285316467285, "global_step": 11468, "epoch": 94} {"train_loss": -23.77751350402832, "global_step": 11469, "epoch": 94} {"train_loss": -24.15127944946289, "global_step": 11470, "epoch": 94} {"train_loss": -23.582239151000977, "global_step": 11471, "epoch": 94} {"train_loss": -24.982418060302734, "global_step": 11472, "epoch": 94} {"train_loss": -25.84760093688965, "global_step": 11473, "epoch": 94} {"train_loss": -25.01227378845215, "global_step": 11474, "epoch": 94} {"train_loss": -23.5269775390625, "global_step": 11475, "epoch": 94} {"train_loss": -24.155181884765625, "global_step": 11476, "epoch": 94} {"train_loss": -25.4171199798584, "global_step": 11477, "epoch": 94} {"train_loss": -24.600358963012695, "global_step": 11478, "epoch": 94} {"train_loss": -25.3184757232666, "global_step": 11479, "epoch": 94} {"train_loss": -25.30451011657715, "global_step": 11480, "epoch": 94} {"train_loss": -25.291589736938477, "global_step": 11481, "epoch": 94} {"train_loss": -25.43830680847168, "global_step": 11482, "epoch": 94} {"train_loss": -25.96272087097168, "global_step": 11483, "epoch": 94} {"train_loss": -25.20737648010254, "global_step": 11484, "epoch": 94} {"train_loss": -25.06654930114746, "global_step": 11485, "epoch": 94} {"train_loss": -25.8209228515625, "global_step": 11486, "epoch": 94} {"train_loss": -26.0892333984375, "global_step": 11487, "epoch": 94} {"train_loss": -25.277877807617188, "global_step": 11488, "epoch": 94} {"train_loss": -25.4141845703125, "global_step": 11489, "epoch": 94} {"train_loss": -25.17865753173828, "global_step": 11490, "epoch": 94} {"train_loss": -25.275907516479492, "global_step": 11491, "epoch": 94} {"train_loss": -25.35790252685547, "global_step": 11492, "epoch": 94} {"train_loss": -25.671789169311523, "global_step": 11493, "epoch": 94} {"train_loss": -24.858298971633282, "global_step": 11494, "epoch": 94, "val_loss": 2593718.25} {"train_loss": -24.569778442382812, "global_step": 11495, "epoch": 95} {"train_loss": -25.514631271362305, "global_step": 11496, "epoch": 95} {"train_loss": -25.240768432617188, "global_step": 11497, "epoch": 95} {"train_loss": -23.27875328063965, "global_step": 11498, "epoch": 95} {"train_loss": -24.265966415405273, "global_step": 11499, "epoch": 95} {"train_loss": -25.17078971862793, "global_step": 11500, "epoch": 95} {"train_loss": -23.084611892700195, "global_step": 11501, "epoch": 95} {"train_loss": -21.421466827392578, "global_step": 11502, "epoch": 95} {"train_loss": -23.5650634765625, "global_step": 11503, "epoch": 95} {"train_loss": -22.557682037353516, "global_step": 11504, "epoch": 95} {"train_loss": -24.063993453979492, "global_step": 11505, "epoch": 95} {"train_loss": -25.008594512939453, "global_step": 11506, "epoch": 95} {"train_loss": -24.720090866088867, "global_step": 11507, "epoch": 95} {"train_loss": -24.7419376373291, "global_step": 11508, "epoch": 95} {"train_loss": -24.571828842163086, "global_step": 11509, "epoch": 95} {"train_loss": -24.730688095092773, "global_step": 11510, "epoch": 95} {"train_loss": -24.9237117767334, "global_step": 11511, "epoch": 95} {"train_loss": -24.491535186767578, "global_step": 11512, "epoch": 95} {"train_loss": -24.85171127319336, "global_step": 11513, "epoch": 95} {"train_loss": -25.44603157043457, "global_step": 11514, "epoch": 95} {"train_loss": -24.971302032470703, "global_step": 11515, "epoch": 95} {"train_loss": -25.153247833251953, "global_step": 11516, "epoch": 95} {"train_loss": -24.850866317749023, "global_step": 11517, "epoch": 95} {"train_loss": -25.180654525756836, "global_step": 11518, "epoch": 95} {"train_loss": -25.016098022460938, "global_step": 11519, "epoch": 95} {"train_loss": -24.90181541442871, "global_step": 11520, "epoch": 95} {"train_loss": -25.55671501159668, "global_step": 11521, "epoch": 95} {"train_loss": -25.377492904663086, "global_step": 11522, "epoch": 95} {"train_loss": -25.24432373046875, "global_step": 11523, "epoch": 95} {"train_loss": -25.502628326416016, "global_step": 11524, "epoch": 95} {"train_loss": -25.236989974975586, "global_step": 11525, "epoch": 95} {"train_loss": -25.37538719177246, "global_step": 11526, "epoch": 95} {"train_loss": -25.19427490234375, "global_step": 11527, "epoch": 95} {"train_loss": -25.4785213470459, "global_step": 11528, "epoch": 95} {"train_loss": -25.51409149169922, "global_step": 11529, "epoch": 95} {"train_loss": -25.53306007385254, "global_step": 11530, "epoch": 95} {"train_loss": -25.7097110748291, "global_step": 11531, "epoch": 95} {"train_loss": -25.711475372314453, "global_step": 11532, "epoch": 95} {"train_loss": -25.262460708618164, "global_step": 11533, "epoch": 95} {"train_loss": -25.687116622924805, "global_step": 11534, "epoch": 95} {"train_loss": -26.000228881835938, "global_step": 11535, "epoch": 95} {"train_loss": -25.53141212463379, "global_step": 11536, "epoch": 95} {"train_loss": -25.538259506225586, "global_step": 11537, "epoch": 95} {"train_loss": -25.982288360595703, "global_step": 11538, "epoch": 95} {"train_loss": -25.793228149414062, "global_step": 11539, "epoch": 95} {"train_loss": -25.578874588012695, "global_step": 11540, "epoch": 95} {"train_loss": -25.87336540222168, "global_step": 11541, "epoch": 95} {"train_loss": -25.13850975036621, "global_step": 11542, "epoch": 95} {"train_loss": -25.211328506469727, "global_step": 11543, "epoch": 95} {"train_loss": -25.21224021911621, "global_step": 11544, "epoch": 95} {"train_loss": -25.518457412719727, "global_step": 11545, "epoch": 95} {"train_loss": -26.12836265563965, "global_step": 11546, "epoch": 95} {"train_loss": -25.278654098510742, "global_step": 11547, "epoch": 95} {"train_loss": -25.654783248901367, "global_step": 11548, "epoch": 95} {"train_loss": -25.199325561523438, "global_step": 11549, "epoch": 95} {"train_loss": -24.65069007873535, "global_step": 11550, "epoch": 95} {"train_loss": -24.86920928955078, "global_step": 11551, "epoch": 95} {"train_loss": -23.31428337097168, "global_step": 11552, "epoch": 95} {"train_loss": -23.870529174804688, "global_step": 11553, "epoch": 95} {"train_loss": -25.3162899017334, "global_step": 11554, "epoch": 95} {"train_loss": -25.78839111328125, "global_step": 11555, "epoch": 95} {"train_loss": -25.40340232849121, "global_step": 11556, "epoch": 95} {"train_loss": -25.05839729309082, "global_step": 11557, "epoch": 95} {"train_loss": -25.20672607421875, "global_step": 11558, "epoch": 95} {"train_loss": -25.829343795776367, "global_step": 11559, "epoch": 95} {"train_loss": -25.076900482177734, "global_step": 11560, "epoch": 95} {"train_loss": -24.45488929748535, "global_step": 11561, "epoch": 95} {"train_loss": -24.093902587890625, "global_step": 11562, "epoch": 95} {"train_loss": -20.97328758239746, "global_step": 11563, "epoch": 95} {"train_loss": -11.710029602050781, "global_step": 11564, "epoch": 95} {"train_loss": -1.8361492156982422, "global_step": 11565, "epoch": 95} {"train_loss": -20.62847900390625, "global_step": 11566, "epoch": 95} {"train_loss": -16.82067108154297, "global_step": 11567, "epoch": 95} {"train_loss": -24.718168258666992, "global_step": 11568, "epoch": 95} {"train_loss": -21.33548355102539, "global_step": 11569, "epoch": 95} {"train_loss": -20.66768455505371, "global_step": 11570, "epoch": 95} {"train_loss": -23.429031372070312, "global_step": 11571, "epoch": 95} {"train_loss": -24.115901947021484, "global_step": 11572, "epoch": 95} {"train_loss": -23.82847785949707, "global_step": 11573, "epoch": 95} {"train_loss": -22.76470375061035, "global_step": 11574, "epoch": 95} {"train_loss": -23.059049606323242, "global_step": 11575, "epoch": 95} {"train_loss": -22.865371704101562, "global_step": 11576, "epoch": 95} {"train_loss": -23.02007484436035, "global_step": 11577, "epoch": 95} {"train_loss": -23.827978134155273, "global_step": 11578, "epoch": 95} {"train_loss": -23.62101173400879, "global_step": 11579, "epoch": 95} {"train_loss": -24.176403045654297, "global_step": 11580, "epoch": 95} {"train_loss": -23.49420738220215, "global_step": 11581, "epoch": 95} {"train_loss": -23.706745147705078, "global_step": 11582, "epoch": 95} {"train_loss": -24.162504196166992, "global_step": 11583, "epoch": 95} {"train_loss": -23.499441146850586, "global_step": 11584, "epoch": 95} {"train_loss": -24.06488800048828, "global_step": 11585, "epoch": 95} {"train_loss": -23.841705322265625, "global_step": 11586, "epoch": 95} {"train_loss": -24.11549949645996, "global_step": 11587, "epoch": 95} {"train_loss": -23.52449607849121, "global_step": 11588, "epoch": 95} {"train_loss": -23.9600830078125, "global_step": 11589, "epoch": 95} {"train_loss": -24.04433250427246, "global_step": 11590, "epoch": 95} {"train_loss": -24.08649253845215, "global_step": 11591, "epoch": 95} {"train_loss": -23.896747589111328, "global_step": 11592, "epoch": 95} {"train_loss": -24.07283592224121, "global_step": 11593, "epoch": 95} {"train_loss": -22.606130599975586, "global_step": 11594, "epoch": 95} {"train_loss": -23.202077865600586, "global_step": 11595, "epoch": 95} {"train_loss": -23.65677833557129, "global_step": 11596, "epoch": 95} {"train_loss": -23.03363609313965, "global_step": 11597, "epoch": 95} {"train_loss": -24.035808563232422, "global_step": 11598, "epoch": 95} {"train_loss": -24.071142196655273, "global_step": 11599, "epoch": 95} {"train_loss": -23.640003204345703, "global_step": 11600, "epoch": 95} {"train_loss": -23.384763717651367, "global_step": 11601, "epoch": 95} {"train_loss": -24.166446685791016, "global_step": 11602, "epoch": 95} {"train_loss": -24.056787490844727, "global_step": 11603, "epoch": 95} {"train_loss": -24.2172908782959, "global_step": 11604, "epoch": 95} {"train_loss": -23.863525390625, "global_step": 11605, "epoch": 95} {"train_loss": -24.20631980895996, "global_step": 11606, "epoch": 95} {"train_loss": -24.712383270263672, "global_step": 11607, "epoch": 95} {"train_loss": -23.77809715270996, "global_step": 11608, "epoch": 95} {"train_loss": -24.478300094604492, "global_step": 11609, "epoch": 95} {"train_loss": -24.1610107421875, "global_step": 11610, "epoch": 95} {"train_loss": -23.628950119018555, "global_step": 11611, "epoch": 95} {"train_loss": -23.520130157470703, "global_step": 11612, "epoch": 95} {"train_loss": -23.8646183013916, "global_step": 11613, "epoch": 95} {"train_loss": -24.059045791625977, "global_step": 11614, "epoch": 95} {"train_loss": -24.03153523531827, "global_step": 11615, "epoch": 95, "val_loss": 2698333.0} {"train_loss": -24.151376724243164, "global_step": 11616, "epoch": 96} {"train_loss": -24.3825740814209, "global_step": 11617, "epoch": 96} {"train_loss": -24.286239624023438, "global_step": 11618, "epoch": 96} {"train_loss": -24.16099739074707, "global_step": 11619, "epoch": 96} {"train_loss": -24.552051544189453, "global_step": 11620, "epoch": 96} {"train_loss": -24.274547576904297, "global_step": 11621, "epoch": 96} {"train_loss": -24.103904724121094, "global_step": 11622, "epoch": 96} {"train_loss": -24.028827667236328, "global_step": 11623, "epoch": 96} {"train_loss": -24.9688663482666, "global_step": 11624, "epoch": 96} {"train_loss": -24.330001831054688, "global_step": 11625, "epoch": 96} {"train_loss": -24.295795440673828, "global_step": 11626, "epoch": 96} {"train_loss": -24.778167724609375, "global_step": 11627, "epoch": 96} {"train_loss": -24.222211837768555, "global_step": 11628, "epoch": 96} {"train_loss": -23.7093563079834, "global_step": 11629, "epoch": 96} {"train_loss": -24.536617279052734, "global_step": 11630, "epoch": 96} {"train_loss": -23.23154067993164, "global_step": 11631, "epoch": 96} {"train_loss": -24.265609741210938, "global_step": 11632, "epoch": 96} {"train_loss": -23.51686668395996, "global_step": 11633, "epoch": 96} {"train_loss": -23.160985946655273, "global_step": 11634, "epoch": 96} {"train_loss": -24.46296501159668, "global_step": 11635, "epoch": 96} {"train_loss": -23.669851303100586, "global_step": 11636, "epoch": 96} {"train_loss": -23.749021530151367, "global_step": 11637, "epoch": 96} {"train_loss": -24.413639068603516, "global_step": 11638, "epoch": 96} {"train_loss": -23.959924697875977, "global_step": 11639, "epoch": 96} {"train_loss": -25.001707077026367, "global_step": 11640, "epoch": 96} {"train_loss": -23.825910568237305, "global_step": 11641, "epoch": 96} {"train_loss": -24.439294815063477, "global_step": 11642, "epoch": 96} {"train_loss": -24.282852172851562, "global_step": 11643, "epoch": 96} {"train_loss": -24.428098678588867, "global_step": 11644, "epoch": 96} {"train_loss": -24.117544174194336, "global_step": 11645, "epoch": 96} {"train_loss": -24.74445343017578, "global_step": 11646, "epoch": 96} {"train_loss": -24.020627975463867, "global_step": 11647, "epoch": 96} {"train_loss": -24.776182174682617, "global_step": 11648, "epoch": 96} {"train_loss": -24.891443252563477, "global_step": 11649, "epoch": 96} {"train_loss": -24.41834259033203, "global_step": 11650, "epoch": 96} {"train_loss": -24.53582191467285, "global_step": 11651, "epoch": 96} {"train_loss": -24.605009078979492, "global_step": 11652, "epoch": 96} {"train_loss": -24.094022750854492, "global_step": 11653, "epoch": 96} {"train_loss": -23.615915298461914, "global_step": 11654, "epoch": 96} {"train_loss": -24.282487869262695, "global_step": 11655, "epoch": 96} {"train_loss": -24.948423385620117, "global_step": 11656, "epoch": 96} {"train_loss": -23.806560516357422, "global_step": 11657, "epoch": 96} {"train_loss": -24.195268630981445, "global_step": 11658, "epoch": 96} {"train_loss": -24.878387451171875, "global_step": 11659, "epoch": 96} {"train_loss": -24.31831169128418, "global_step": 11660, "epoch": 96} {"train_loss": -23.60841941833496, "global_step": 11661, "epoch": 96} {"train_loss": -24.690773010253906, "global_step": 11662, "epoch": 96} {"train_loss": -24.458066940307617, "global_step": 11663, "epoch": 96} {"train_loss": -24.894201278686523, "global_step": 11664, "epoch": 96} {"train_loss": -24.778589248657227, "global_step": 11665, "epoch": 96} {"train_loss": -24.768238067626953, "global_step": 11666, "epoch": 96} {"train_loss": -23.34857749938965, "global_step": 11667, "epoch": 96} {"train_loss": -22.627952575683594, "global_step": 11668, "epoch": 96} {"train_loss": -24.514570236206055, "global_step": 11669, "epoch": 96} {"train_loss": -22.526243209838867, "global_step": 11670, "epoch": 96} {"train_loss": -24.3541202545166, "global_step": 11671, "epoch": 96} {"train_loss": -22.83195686340332, "global_step": 11672, "epoch": 96} {"train_loss": -24.44846534729004, "global_step": 11673, "epoch": 96} {"train_loss": -24.012548446655273, "global_step": 11674, "epoch": 96} {"train_loss": -23.51297950744629, "global_step": 11675, "epoch": 96} {"train_loss": -24.27253532409668, "global_step": 11676, "epoch": 96} {"train_loss": -25.177099227905273, "global_step": 11677, "epoch": 96} {"train_loss": -24.607816696166992, "global_step": 11678, "epoch": 96} {"train_loss": -24.437185287475586, "global_step": 11679, "epoch": 96} {"train_loss": -24.169466018676758, "global_step": 11680, "epoch": 96} {"train_loss": -24.87676429748535, "global_step": 11681, "epoch": 96} {"train_loss": -24.439340591430664, "global_step": 11682, "epoch": 96} {"train_loss": -24.648656845092773, "global_step": 11683, "epoch": 96} {"train_loss": -24.805288314819336, "global_step": 11684, "epoch": 96} {"train_loss": -24.839269638061523, "global_step": 11685, "epoch": 96} {"train_loss": -24.981903076171875, "global_step": 11686, "epoch": 96} {"train_loss": -24.617338180541992, "global_step": 11687, "epoch": 96} {"train_loss": -24.58265495300293, "global_step": 11688, "epoch": 96} {"train_loss": -25.083812713623047, "global_step": 11689, "epoch": 96} {"train_loss": -25.000961303710938, "global_step": 11690, "epoch": 96} {"train_loss": -25.050418853759766, "global_step": 11691, "epoch": 96} {"train_loss": -25.007604598999023, "global_step": 11692, "epoch": 96} {"train_loss": -25.166650772094727, "global_step": 11693, "epoch": 96} {"train_loss": -24.526426315307617, "global_step": 11694, "epoch": 96} {"train_loss": -24.38020133972168, "global_step": 11695, "epoch": 96} {"train_loss": -25.182371139526367, "global_step": 11696, "epoch": 96} {"train_loss": -24.9288387298584, "global_step": 11697, "epoch": 96} {"train_loss": -25.033117294311523, "global_step": 11698, "epoch": 96} {"train_loss": -25.00257110595703, "global_step": 11699, "epoch": 96} {"train_loss": -25.129056930541992, "global_step": 11700, "epoch": 96} {"train_loss": -25.485654830932617, "global_step": 11701, "epoch": 96} {"train_loss": -25.108762741088867, "global_step": 11702, "epoch": 96} {"train_loss": -25.20994758605957, "global_step": 11703, "epoch": 96} {"train_loss": -25.207962036132812, "global_step": 11704, "epoch": 96} {"train_loss": -25.100553512573242, "global_step": 11705, "epoch": 96} {"train_loss": -25.064903259277344, "global_step": 11706, "epoch": 96} {"train_loss": -25.23682975769043, "global_step": 11707, "epoch": 96} {"train_loss": -24.834768295288086, "global_step": 11708, "epoch": 96} {"train_loss": -25.16310691833496, "global_step": 11709, "epoch": 96} {"train_loss": -24.66817855834961, "global_step": 11710, "epoch": 96} {"train_loss": -22.01823616027832, "global_step": 11711, "epoch": 96} {"train_loss": -7.915464878082275, "global_step": 11712, "epoch": 96} {"train_loss": 1.6890537738800049, "global_step": 11713, "epoch": 96} {"train_loss": -22.02313804626465, "global_step": 11714, "epoch": 96} {"train_loss": -14.064658164978027, "global_step": 11715, "epoch": 96} {"train_loss": -23.797718048095703, "global_step": 11716, "epoch": 96} {"train_loss": -18.149953842163086, "global_step": 11717, "epoch": 96} {"train_loss": -20.534940719604492, "global_step": 11718, "epoch": 96} {"train_loss": -23.481279373168945, "global_step": 11719, "epoch": 96} {"train_loss": -22.823657989501953, "global_step": 11720, "epoch": 96} {"train_loss": -21.83483123779297, "global_step": 11721, "epoch": 96} {"train_loss": -21.377164840698242, "global_step": 11722, "epoch": 96} {"train_loss": -22.792743682861328, "global_step": 11723, "epoch": 96} {"train_loss": -22.723905563354492, "global_step": 11724, "epoch": 96} {"train_loss": -23.410146713256836, "global_step": 11725, "epoch": 96} {"train_loss": -23.362546920776367, "global_step": 11726, "epoch": 96} {"train_loss": -23.06339454650879, "global_step": 11727, "epoch": 96} {"train_loss": -22.665494918823242, "global_step": 11728, "epoch": 96} {"train_loss": -23.17014503479004, "global_step": 11729, "epoch": 96} {"train_loss": -22.961824417114258, "global_step": 11730, "epoch": 96} {"train_loss": -22.870288848876953, "global_step": 11731, "epoch": 96} {"train_loss": -23.3409423828125, "global_step": 11732, "epoch": 96} {"train_loss": -23.08077621459961, "global_step": 11733, "epoch": 96} {"train_loss": -23.71819305419922, "global_step": 11734, "epoch": 96} {"train_loss": -23.857070922851562, "global_step": 11735, "epoch": 96} {"train_loss": -23.661856787263854, "global_step": 11736, "epoch": 96, "val_loss": 2690399.0} {"train_loss": -23.79876708984375, "global_step": 11737, "epoch": 97} {"train_loss": -23.6630802154541, "global_step": 11738, "epoch": 97} {"train_loss": -23.59040641784668, "global_step": 11739, "epoch": 97} {"train_loss": -23.343978881835938, "global_step": 11740, "epoch": 97} {"train_loss": -23.822101593017578, "global_step": 11741, "epoch": 97} {"train_loss": -23.669124603271484, "global_step": 11742, "epoch": 97} {"train_loss": -23.538068771362305, "global_step": 11743, "epoch": 97} {"train_loss": -24.089313507080078, "global_step": 11744, "epoch": 97} {"train_loss": -23.925010681152344, "global_step": 11745, "epoch": 97} {"train_loss": -23.67876434326172, "global_step": 11746, "epoch": 97} {"train_loss": -24.214326858520508, "global_step": 11747, "epoch": 97} {"train_loss": -23.447986602783203, "global_step": 11748, "epoch": 97} {"train_loss": -23.01811408996582, "global_step": 11749, "epoch": 97} {"train_loss": -23.282543182373047, "global_step": 11750, "epoch": 97} {"train_loss": -24.508892059326172, "global_step": 11751, "epoch": 97} {"train_loss": -24.14134979248047, "global_step": 11752, "epoch": 97} {"train_loss": -24.0606746673584, "global_step": 11753, "epoch": 97} {"train_loss": -24.08928108215332, "global_step": 11754, "epoch": 97} {"train_loss": -24.188772201538086, "global_step": 11755, "epoch": 97} {"train_loss": -24.24769401550293, "global_step": 11756, "epoch": 97} {"train_loss": -24.26700210571289, "global_step": 11757, "epoch": 97} {"train_loss": -23.754379272460938, "global_step": 11758, "epoch": 97} {"train_loss": -24.66639518737793, "global_step": 11759, "epoch": 97} {"train_loss": -24.068586349487305, "global_step": 11760, "epoch": 97} {"train_loss": -24.51357078552246, "global_step": 11761, "epoch": 97} {"train_loss": -24.178598403930664, "global_step": 11762, "epoch": 97} {"train_loss": -24.722698211669922, "global_step": 11763, "epoch": 97} {"train_loss": -24.841062545776367, "global_step": 11764, "epoch": 97} {"train_loss": -24.75037956237793, "global_step": 11765, "epoch": 97} {"train_loss": -24.450254440307617, "global_step": 11766, "epoch": 97} {"train_loss": -24.739660263061523, "global_step": 11767, "epoch": 97} {"train_loss": -24.78547477722168, "global_step": 11768, "epoch": 97} {"train_loss": -24.73700523376465, "global_step": 11769, "epoch": 97} {"train_loss": -24.546680450439453, "global_step": 11770, "epoch": 97} {"train_loss": -24.81732940673828, "global_step": 11771, "epoch": 97} {"train_loss": -24.649505615234375, "global_step": 11772, "epoch": 97} {"train_loss": -24.52351951599121, "global_step": 11773, "epoch": 97} {"train_loss": -24.229022979736328, "global_step": 11774, "epoch": 97} {"train_loss": -24.83321189880371, "global_step": 11775, "epoch": 97} {"train_loss": -24.6971492767334, "global_step": 11776, "epoch": 97} {"train_loss": -24.839038848876953, "global_step": 11777, "epoch": 97} {"train_loss": -25.035144805908203, "global_step": 11778, "epoch": 97} {"train_loss": -24.735305786132812, "global_step": 11779, "epoch": 97} {"train_loss": -25.062915802001953, "global_step": 11780, "epoch": 97} {"train_loss": -24.941518783569336, "global_step": 11781, "epoch": 97} {"train_loss": -24.1776180267334, "global_step": 11782, "epoch": 97} {"train_loss": -23.323070526123047, "global_step": 11783, "epoch": 97} {"train_loss": -23.249876022338867, "global_step": 11784, "epoch": 97} {"train_loss": -24.812185287475586, "global_step": 11785, "epoch": 97} {"train_loss": -23.509031295776367, "global_step": 11786, "epoch": 97} {"train_loss": -22.893997192382812, "global_step": 11787, "epoch": 97} {"train_loss": -25.023406982421875, "global_step": 11788, "epoch": 97} {"train_loss": -24.31036949157715, "global_step": 11789, "epoch": 97} {"train_loss": -24.209821701049805, "global_step": 11790, "epoch": 97} {"train_loss": -24.892663955688477, "global_step": 11791, "epoch": 97} {"train_loss": -23.7739200592041, "global_step": 11792, "epoch": 97} {"train_loss": -25.101293563842773, "global_step": 11793, "epoch": 97} {"train_loss": -24.49554443359375, "global_step": 11794, "epoch": 97} {"train_loss": -24.800439834594727, "global_step": 11795, "epoch": 97} {"train_loss": -24.701976776123047, "global_step": 11796, "epoch": 97} {"train_loss": -24.758317947387695, "global_step": 11797, "epoch": 97} {"train_loss": -24.821969985961914, "global_step": 11798, "epoch": 97} {"train_loss": -24.340478897094727, "global_step": 11799, "epoch": 97} {"train_loss": -24.931230545043945, "global_step": 11800, "epoch": 97} {"train_loss": -24.684782028198242, "global_step": 11801, "epoch": 97} {"train_loss": -24.689844131469727, "global_step": 11802, "epoch": 97} {"train_loss": -24.358606338500977, "global_step": 11803, "epoch": 97} {"train_loss": -24.717851638793945, "global_step": 11804, "epoch": 97} {"train_loss": -25.0922794342041, "global_step": 11805, "epoch": 97} {"train_loss": -24.293441772460938, "global_step": 11806, "epoch": 97} {"train_loss": -23.56243324279785, "global_step": 11807, "epoch": 97} {"train_loss": -23.25177574157715, "global_step": 11808, "epoch": 97} {"train_loss": -24.240938186645508, "global_step": 11809, "epoch": 97} {"train_loss": -25.07501792907715, "global_step": 11810, "epoch": 97} {"train_loss": -24.373828887939453, "global_step": 11811, "epoch": 97} {"train_loss": -24.71278190612793, "global_step": 11812, "epoch": 97} {"train_loss": -24.83727264404297, "global_step": 11813, "epoch": 97} {"train_loss": -25.2005615234375, "global_step": 11814, "epoch": 97} {"train_loss": -25.01858139038086, "global_step": 11815, "epoch": 97} {"train_loss": -24.99214744567871, "global_step": 11816, "epoch": 97} {"train_loss": -24.89919090270996, "global_step": 11817, "epoch": 97} {"train_loss": -24.808053970336914, "global_step": 11818, "epoch": 97} {"train_loss": -25.125059127807617, "global_step": 11819, "epoch": 97} {"train_loss": -24.90842056274414, "global_step": 11820, "epoch": 97} {"train_loss": -25.215625762939453, "global_step": 11821, "epoch": 97} {"train_loss": -25.04790687561035, "global_step": 11822, "epoch": 97} {"train_loss": -25.136001586914062, "global_step": 11823, "epoch": 97} {"train_loss": -24.781564712524414, "global_step": 11824, "epoch": 97} {"train_loss": -24.997304916381836, "global_step": 11825, "epoch": 97} {"train_loss": -25.080623626708984, "global_step": 11826, "epoch": 97} {"train_loss": -24.953519821166992, "global_step": 11827, "epoch": 97} {"train_loss": -23.817646026611328, "global_step": 11828, "epoch": 97} {"train_loss": -22.66358757019043, "global_step": 11829, "epoch": 97} {"train_loss": -23.330867767333984, "global_step": 11830, "epoch": 97} {"train_loss": -25.093229293823242, "global_step": 11831, "epoch": 97} {"train_loss": -24.569379806518555, "global_step": 11832, "epoch": 97} {"train_loss": -24.683561325073242, "global_step": 11833, "epoch": 97} {"train_loss": -25.20408821105957, "global_step": 11834, "epoch": 97} {"train_loss": -25.086088180541992, "global_step": 11835, "epoch": 97} {"train_loss": -24.626760482788086, "global_step": 11836, "epoch": 97} {"train_loss": -25.117389678955078, "global_step": 11837, "epoch": 97} {"train_loss": -25.05836296081543, "global_step": 11838, "epoch": 97} {"train_loss": -24.5804500579834, "global_step": 11839, "epoch": 97} {"train_loss": -25.721044540405273, "global_step": 11840, "epoch": 97} {"train_loss": -24.930456161499023, "global_step": 11841, "epoch": 97} {"train_loss": -25.16170883178711, "global_step": 11842, "epoch": 97} {"train_loss": -25.054906845092773, "global_step": 11843, "epoch": 97} {"train_loss": -24.62584114074707, "global_step": 11844, "epoch": 97} {"train_loss": -24.89939308166504, "global_step": 11845, "epoch": 97} {"train_loss": -24.710065841674805, "global_step": 11846, "epoch": 97} {"train_loss": -25.73904800415039, "global_step": 11847, "epoch": 97} {"train_loss": -24.700592041015625, "global_step": 11848, "epoch": 97} {"train_loss": -25.47286033630371, "global_step": 11849, "epoch": 97} {"train_loss": -25.065153121948242, "global_step": 11850, "epoch": 97} {"train_loss": -25.341079711914062, "global_step": 11851, "epoch": 97} {"train_loss": -25.185144424438477, "global_step": 11852, "epoch": 97} {"train_loss": -25.188547134399414, "global_step": 11853, "epoch": 97} {"train_loss": -25.54397964477539, "global_step": 11854, "epoch": 97} {"train_loss": -25.7667179107666, "global_step": 11855, "epoch": 97} {"train_loss": -24.997150421142578, "global_step": 11856, "epoch": 97} {"train_loss": -24.525741545622015, "global_step": 11857, "epoch": 97, "val_loss": 3282787.75} {"train_loss": -24.06097984313965, "global_step": 11858, "epoch": 98} {"train_loss": -24.74484634399414, "global_step": 11859, "epoch": 98} {"train_loss": -24.874799728393555, "global_step": 11860, "epoch": 98} {"train_loss": -25.400148391723633, "global_step": 11861, "epoch": 98} {"train_loss": -24.755889892578125, "global_step": 11862, "epoch": 98} {"train_loss": -25.07480812072754, "global_step": 11863, "epoch": 98} {"train_loss": -25.604965209960938, "global_step": 11864, "epoch": 98} {"train_loss": -25.029722213745117, "global_step": 11865, "epoch": 98} {"train_loss": -24.823904037475586, "global_step": 11866, "epoch": 98} {"train_loss": -25.124250411987305, "global_step": 11867, "epoch": 98} {"train_loss": -25.385007858276367, "global_step": 11868, "epoch": 98} {"train_loss": -24.868295669555664, "global_step": 11869, "epoch": 98} {"train_loss": -25.31702995300293, "global_step": 11870, "epoch": 98} {"train_loss": -25.577573776245117, "global_step": 11871, "epoch": 98} {"train_loss": -25.005382537841797, "global_step": 11872, "epoch": 98} {"train_loss": -25.019376754760742, "global_step": 11873, "epoch": 98} {"train_loss": -25.61444091796875, "global_step": 11874, "epoch": 98} {"train_loss": -25.37417984008789, "global_step": 11875, "epoch": 98} {"train_loss": -25.36396598815918, "global_step": 11876, "epoch": 98} {"train_loss": -25.419261932373047, "global_step": 11877, "epoch": 98} {"train_loss": -24.922134399414062, "global_step": 11878, "epoch": 98} {"train_loss": -25.565282821655273, "global_step": 11879, "epoch": 98} {"train_loss": -25.070768356323242, "global_step": 11880, "epoch": 98} {"train_loss": -24.81886100769043, "global_step": 11881, "epoch": 98} {"train_loss": -25.7745304107666, "global_step": 11882, "epoch": 98} {"train_loss": -25.216711044311523, "global_step": 11883, "epoch": 98} {"train_loss": -25.83404541015625, "global_step": 11884, "epoch": 98} {"train_loss": -25.116056442260742, "global_step": 11885, "epoch": 98} {"train_loss": -26.01885414123535, "global_step": 11886, "epoch": 98} {"train_loss": -24.928890228271484, "global_step": 11887, "epoch": 98} {"train_loss": -25.844507217407227, "global_step": 11888, "epoch": 98} {"train_loss": -25.028873443603516, "global_step": 11889, "epoch": 98} {"train_loss": -25.731924057006836, "global_step": 11890, "epoch": 98} {"train_loss": -25.839853286743164, "global_step": 11891, "epoch": 98} {"train_loss": -25.279935836791992, "global_step": 11892, "epoch": 98} {"train_loss": -25.484609603881836, "global_step": 11893, "epoch": 98} {"train_loss": -25.786157608032227, "global_step": 11894, "epoch": 98} {"train_loss": -25.661121368408203, "global_step": 11895, "epoch": 98} {"train_loss": -25.936120986938477, "global_step": 11896, "epoch": 98} {"train_loss": -25.088041305541992, "global_step": 11897, "epoch": 98} {"train_loss": -25.666248321533203, "global_step": 11898, "epoch": 98} {"train_loss": -25.005529403686523, "global_step": 11899, "epoch": 98} {"train_loss": -25.343570709228516, "global_step": 11900, "epoch": 98} {"train_loss": -24.790267944335938, "global_step": 11901, "epoch": 98} {"train_loss": -25.655078887939453, "global_step": 11902, "epoch": 98} {"train_loss": -25.399524688720703, "global_step": 11903, "epoch": 98} {"train_loss": -25.636457443237305, "global_step": 11904, "epoch": 98} {"train_loss": -25.82696533203125, "global_step": 11905, "epoch": 98} {"train_loss": -24.66812515258789, "global_step": 11906, "epoch": 98} {"train_loss": -24.346567153930664, "global_step": 11907, "epoch": 98} {"train_loss": -17.309431076049805, "global_step": 11908, "epoch": 98} {"train_loss": -7.362740993499756, "global_step": 11909, "epoch": 98} {"train_loss": -24.271329879760742, "global_step": 11910, "epoch": 98} {"train_loss": -20.824254989624023, "global_step": 11911, "epoch": 98} {"train_loss": -22.368682861328125, "global_step": 11912, "epoch": 98} {"train_loss": -21.90082550048828, "global_step": 11913, "epoch": 98} {"train_loss": -24.988229751586914, "global_step": 11914, "epoch": 98} {"train_loss": -24.497900009155273, "global_step": 11915, "epoch": 98} {"train_loss": -23.972370147705078, "global_step": 11916, "epoch": 98} {"train_loss": -23.641704559326172, "global_step": 11917, "epoch": 98} {"train_loss": -23.23834228515625, "global_step": 11918, "epoch": 98} {"train_loss": -23.86287498474121, "global_step": 11919, "epoch": 98} {"train_loss": -24.56272315979004, "global_step": 11920, "epoch": 98} {"train_loss": -25.22157096862793, "global_step": 11921, "epoch": 98} {"train_loss": -24.933897018432617, "global_step": 11922, "epoch": 98} {"train_loss": -24.799787521362305, "global_step": 11923, "epoch": 98} {"train_loss": -25.200876235961914, "global_step": 11924, "epoch": 98} {"train_loss": -25.092824935913086, "global_step": 11925, "epoch": 98} {"train_loss": -24.967302322387695, "global_step": 11926, "epoch": 98} {"train_loss": -25.1955623626709, "global_step": 11927, "epoch": 98} {"train_loss": -24.70513343811035, "global_step": 11928, "epoch": 98} {"train_loss": -25.28451919555664, "global_step": 11929, "epoch": 98} {"train_loss": -24.391767501831055, "global_step": 11930, "epoch": 98} {"train_loss": -24.955007553100586, "global_step": 11931, "epoch": 98} {"train_loss": -25.059057235717773, "global_step": 11932, "epoch": 98} {"train_loss": -24.77106285095215, "global_step": 11933, "epoch": 98} {"train_loss": -25.52493667602539, "global_step": 11934, "epoch": 98} {"train_loss": -24.459043502807617, "global_step": 11935, "epoch": 98} {"train_loss": -25.037946701049805, "global_step": 11936, "epoch": 98} {"train_loss": -25.233396530151367, "global_step": 11937, "epoch": 98} {"train_loss": -23.55615234375, "global_step": 11938, "epoch": 98} {"train_loss": -24.34791374206543, "global_step": 11939, "epoch": 98} {"train_loss": -24.747161865234375, "global_step": 11940, "epoch": 98} {"train_loss": -23.229597091674805, "global_step": 11941, "epoch": 98} {"train_loss": -23.248424530029297, "global_step": 11942, "epoch": 98} {"train_loss": -20.493127822875977, "global_step": 11943, "epoch": 98} {"train_loss": -14.14714241027832, "global_step": 11944, "epoch": 98} {"train_loss": -17.158615112304688, "global_step": 11945, "epoch": 98} {"train_loss": -24.25899314880371, "global_step": 11946, "epoch": 98} {"train_loss": -19.012954711914062, "global_step": 11947, "epoch": 98} {"train_loss": -23.890329360961914, "global_step": 11948, "epoch": 98} {"train_loss": -20.100204467773438, "global_step": 11949, "epoch": 98} {"train_loss": -24.573148727416992, "global_step": 11950, "epoch": 98} {"train_loss": -21.587562561035156, "global_step": 11951, "epoch": 98} {"train_loss": -23.352108001708984, "global_step": 11952, "epoch": 98} {"train_loss": -24.063535690307617, "global_step": 11953, "epoch": 98} {"train_loss": -23.40178871154785, "global_step": 11954, "epoch": 98} {"train_loss": -23.364944458007812, "global_step": 11955, "epoch": 98} {"train_loss": -23.900836944580078, "global_step": 11956, "epoch": 98} {"train_loss": -24.581247329711914, "global_step": 11957, "epoch": 98} {"train_loss": -23.867300033569336, "global_step": 11958, "epoch": 98} {"train_loss": -23.679725646972656, "global_step": 11959, "epoch": 98} {"train_loss": -23.974822998046875, "global_step": 11960, "epoch": 98} {"train_loss": -24.231821060180664, "global_step": 11961, "epoch": 98} {"train_loss": -24.258455276489258, "global_step": 11962, "epoch": 98} {"train_loss": -24.074594497680664, "global_step": 11963, "epoch": 98} {"train_loss": -24.121728897094727, "global_step": 11964, "epoch": 98} {"train_loss": -24.078649520874023, "global_step": 11965, "epoch": 98} {"train_loss": -24.35573387145996, "global_step": 11966, "epoch": 98} {"train_loss": -24.627737045288086, "global_step": 11967, "epoch": 98} {"train_loss": -24.37003517150879, "global_step": 11968, "epoch": 98} {"train_loss": -24.190580368041992, "global_step": 11969, "epoch": 98} {"train_loss": -24.571958541870117, "global_step": 11970, "epoch": 98} {"train_loss": -24.557809829711914, "global_step": 11971, "epoch": 98} {"train_loss": -24.538156509399414, "global_step": 11972, "epoch": 98} {"train_loss": -24.444345474243164, "global_step": 11973, "epoch": 98} {"train_loss": -24.670440673828125, "global_step": 11974, "epoch": 98} {"train_loss": -24.3502254486084, "global_step": 11975, "epoch": 98} {"train_loss": -24.512775421142578, "global_step": 11976, "epoch": 98} {"train_loss": -24.561132431030273, "global_step": 11977, "epoch": 98} {"train_loss": -24.206591688897, "global_step": 11978, "epoch": 98, "val_loss": 2973039.0} {"train_loss": -24.988874435424805, "global_step": 11979, "epoch": 99} {"train_loss": -24.951013565063477, "global_step": 11980, "epoch": 99} {"train_loss": -25.069042205810547, "global_step": 11981, "epoch": 99} {"train_loss": -24.940832138061523, "global_step": 11982, "epoch": 99} {"train_loss": -25.083703994750977, "global_step": 11983, "epoch": 99} {"train_loss": -24.61690330505371, "global_step": 11984, "epoch": 99} {"train_loss": -25.22933006286621, "global_step": 11985, "epoch": 99} {"train_loss": -24.576135635375977, "global_step": 11986, "epoch": 99} {"train_loss": -24.470876693725586, "global_step": 11987, "epoch": 99} {"train_loss": -25.346221923828125, "global_step": 11988, "epoch": 99} {"train_loss": -24.46468162536621, "global_step": 11989, "epoch": 99} {"train_loss": -25.13179588317871, "global_step": 11990, "epoch": 99} {"train_loss": -24.956567764282227, "global_step": 11991, "epoch": 99} {"train_loss": -24.322479248046875, "global_step": 11992, "epoch": 99} {"train_loss": -24.824172973632812, "global_step": 11993, "epoch": 99} {"train_loss": -24.36873435974121, "global_step": 11994, "epoch": 99} {"train_loss": -24.92629051208496, "global_step": 11995, "epoch": 99} {"train_loss": -25.30345916748047, "global_step": 11996, "epoch": 99} {"train_loss": -24.66505241394043, "global_step": 11997, "epoch": 99} {"train_loss": -24.568496704101562, "global_step": 11998, "epoch": 99} {"train_loss": -24.966733932495117, "global_step": 11999, "epoch": 99} {"train_loss": -24.875904083251953, "global_step": 12000, "epoch": 99} {"train_loss": -25.006986618041992, "global_step": 12001, "epoch": 99} {"train_loss": -24.36195945739746, "global_step": 12002, "epoch": 99} {"train_loss": -22.403738021850586, "global_step": 12003, "epoch": 99} {"train_loss": -18.91536521911621, "global_step": 12004, "epoch": 99} {"train_loss": -19.476181030273438, "global_step": 12005, "epoch": 99} {"train_loss": -24.095924377441406, "global_step": 12006, "epoch": 99} {"train_loss": -21.909690856933594, "global_step": 12007, "epoch": 99} {"train_loss": -23.32561683654785, "global_step": 12008, "epoch": 99} {"train_loss": -23.311309814453125, "global_step": 12009, "epoch": 99} {"train_loss": -24.17622947692871, "global_step": 12010, "epoch": 99} {"train_loss": -23.423803329467773, "global_step": 12011, "epoch": 99} {"train_loss": -23.71952247619629, "global_step": 12012, "epoch": 99} {"train_loss": -24.319002151489258, "global_step": 12013, "epoch": 99} {"train_loss": -24.138198852539062, "global_step": 12014, "epoch": 99} {"train_loss": -23.902841567993164, "global_step": 12015, "epoch": 99} {"train_loss": -24.320592880249023, "global_step": 12016, "epoch": 99} {"train_loss": -24.356386184692383, "global_step": 12017, "epoch": 99} {"train_loss": -24.400888442993164, "global_step": 12018, "epoch": 99} {"train_loss": -24.165311813354492, "global_step": 12019, "epoch": 99} {"train_loss": -24.696935653686523, "global_step": 12020, "epoch": 99} {"train_loss": -24.333145141601562, "global_step": 12021, "epoch": 99} {"train_loss": -24.757665634155273, "global_step": 12022, "epoch": 99} {"train_loss": -24.011768341064453, "global_step": 12023, "epoch": 99} {"train_loss": -24.586328506469727, "global_step": 12024, "epoch": 99} {"train_loss": -24.239704132080078, "global_step": 12025, "epoch": 99} {"train_loss": -24.818761825561523, "global_step": 12026, "epoch": 99} {"train_loss": -24.758586883544922, "global_step": 12027, "epoch": 99} {"train_loss": -24.636219024658203, "global_step": 12028, "epoch": 99} {"train_loss": -24.638572692871094, "global_step": 12029, "epoch": 99} {"train_loss": -24.18289566040039, "global_step": 12030, "epoch": 99} {"train_loss": -25.090986251831055, "global_step": 12031, "epoch": 99} {"train_loss": -24.80692481994629, "global_step": 12032, "epoch": 99} {"train_loss": -24.598596572875977, "global_step": 12033, "epoch": 99} {"train_loss": -24.582107543945312, "global_step": 12034, "epoch": 99} {"train_loss": -24.677194595336914, "global_step": 12035, "epoch": 99} {"train_loss": -24.767044067382812, "global_step": 12036, "epoch": 99} {"train_loss": -24.209436416625977, "global_step": 12037, "epoch": 99} {"train_loss": -24.424060821533203, "global_step": 12038, "epoch": 99} {"train_loss": -24.710519790649414, "global_step": 12039, "epoch": 99} {"train_loss": -24.49294090270996, "global_step": 12040, "epoch": 99} {"train_loss": -25.225492477416992, "global_step": 12041, "epoch": 99} {"train_loss": -24.84344482421875, "global_step": 12042, "epoch": 99} {"train_loss": -24.805400848388672, "global_step": 12043, "epoch": 99} {"train_loss": -24.847187042236328, "global_step": 12044, "epoch": 99} {"train_loss": -24.899141311645508, "global_step": 12045, "epoch": 99} {"train_loss": -25.044416427612305, "global_step": 12046, "epoch": 99} {"train_loss": -24.998737335205078, "global_step": 12047, "epoch": 99} {"train_loss": -25.424352645874023, "global_step": 12048, "epoch": 99} {"train_loss": -25.461963653564453, "global_step": 12049, "epoch": 99} {"train_loss": -25.164602279663086, "global_step": 12050, "epoch": 99} {"train_loss": -25.450498580932617, "global_step": 12051, "epoch": 99} {"train_loss": -25.159330368041992, "global_step": 12052, "epoch": 99} {"train_loss": -25.333606719970703, "global_step": 12053, "epoch": 99} {"train_loss": -25.42720603942871, "global_step": 12054, "epoch": 99} {"train_loss": -25.63214111328125, "global_step": 12055, "epoch": 99} {"train_loss": -25.120849609375, "global_step": 12056, "epoch": 99} {"train_loss": -25.303470611572266, "global_step": 12057, "epoch": 99} {"train_loss": -25.6608943939209, "global_step": 12058, "epoch": 99} {"train_loss": -25.169349670410156, "global_step": 12059, "epoch": 99} {"train_loss": -25.637680053710938, "global_step": 12060, "epoch": 99} {"train_loss": -25.206398010253906, "global_step": 12061, "epoch": 99} {"train_loss": -25.449941635131836, "global_step": 12062, "epoch": 99} {"train_loss": -25.65545654296875, "global_step": 12063, "epoch": 99} {"train_loss": -25.71768569946289, "global_step": 12064, "epoch": 99} {"train_loss": -25.653156280517578, "global_step": 12065, "epoch": 99} {"train_loss": -25.44535255432129, "global_step": 12066, "epoch": 99} {"train_loss": -25.89347267150879, "global_step": 12067, "epoch": 99} {"train_loss": -25.624929428100586, "global_step": 12068, "epoch": 99} {"train_loss": -25.986494064331055, "global_step": 12069, "epoch": 99} {"train_loss": -25.58359718322754, "global_step": 12070, "epoch": 99} {"train_loss": -25.902490615844727, "global_step": 12071, "epoch": 99} {"train_loss": -25.939855575561523, "global_step": 12072, "epoch": 99} {"train_loss": -25.781147003173828, "global_step": 12073, "epoch": 99} {"train_loss": -26.130664825439453, "global_step": 12074, "epoch": 99} {"train_loss": -26.06916618347168, "global_step": 12075, "epoch": 99} {"train_loss": -26.19956398010254, "global_step": 12076, "epoch": 99} {"train_loss": -26.2134952545166, "global_step": 12077, "epoch": 99} {"train_loss": -25.694076538085938, "global_step": 12078, "epoch": 99} {"train_loss": -25.831045150756836, "global_step": 12079, "epoch": 99} {"train_loss": -25.538442611694336, "global_step": 12080, "epoch": 99} {"train_loss": -24.4576416015625, "global_step": 12081, "epoch": 99} {"train_loss": -23.819190979003906, "global_step": 12082, "epoch": 99} {"train_loss": -21.08210563659668, "global_step": 12083, "epoch": 99} {"train_loss": -16.754898071289062, "global_step": 12084, "epoch": 99} {"train_loss": -21.645776748657227, "global_step": 12085, "epoch": 99} {"train_loss": -25.528343200683594, "global_step": 12086, "epoch": 99} {"train_loss": -23.440406799316406, "global_step": 12087, "epoch": 99} {"train_loss": -25.57404899597168, "global_step": 12088, "epoch": 99} {"train_loss": -24.539297103881836, "global_step": 12089, "epoch": 99} {"train_loss": -25.045719146728516, "global_step": 12090, "epoch": 99} {"train_loss": -24.700265884399414, "global_step": 12091, "epoch": 99} {"train_loss": -25.7868595123291, "global_step": 12092, "epoch": 99} {"train_loss": -24.954618453979492, "global_step": 12093, "epoch": 99} {"train_loss": -25.303050994873047, "global_step": 12094, "epoch": 99} {"train_loss": -25.366106033325195, "global_step": 12095, "epoch": 99} {"train_loss": -24.814401626586914, "global_step": 12096, "epoch": 99} {"train_loss": -25.74256706237793, "global_step": 12097, "epoch": 99} {"train_loss": -24.9553279876709, "global_step": 12098, "epoch": 99} {"train_loss": -24.673474430052703, "global_step": 12099, "epoch": 99, "val_loss": 2482448.25} {"train_loss": -25.330427169799805, "global_step": 12100, "epoch": 100} {"train_loss": -25.21921730041504, "global_step": 12101, "epoch": 100} {"train_loss": -25.580190658569336, "global_step": 12102, "epoch": 100} {"train_loss": -25.36098289489746, "global_step": 12103, "epoch": 100} {"train_loss": -25.302995681762695, "global_step": 12104, "epoch": 100} {"train_loss": -25.19699478149414, "global_step": 12105, "epoch": 100} {"train_loss": -25.864276885986328, "global_step": 12106, "epoch": 100} {"train_loss": -25.749603271484375, "global_step": 12107, "epoch": 100} {"train_loss": -23.382246017456055, "global_step": 12108, "epoch": 100} {"train_loss": -23.838003158569336, "global_step": 12109, "epoch": 100} {"train_loss": -24.311920166015625, "global_step": 12110, "epoch": 100} {"train_loss": -25.484485626220703, "global_step": 12111, "epoch": 100} {"train_loss": -24.763845443725586, "global_step": 12112, "epoch": 100} {"train_loss": -25.11717987060547, "global_step": 12113, "epoch": 100} {"train_loss": -25.463550567626953, "global_step": 12114, "epoch": 100} {"train_loss": -25.240339279174805, "global_step": 12115, "epoch": 100} {"train_loss": -25.74603843688965, "global_step": 12116, "epoch": 100} {"train_loss": -25.1633358001709, "global_step": 12117, "epoch": 100} {"train_loss": -25.35695457458496, "global_step": 12118, "epoch": 100} {"train_loss": -25.270557403564453, "global_step": 12119, "epoch": 100} {"train_loss": -25.295873641967773, "global_step": 12120, "epoch": 100} {"train_loss": -24.69190216064453, "global_step": 12121, "epoch": 100} {"train_loss": -25.328184127807617, "global_step": 12122, "epoch": 100} {"train_loss": -25.22062110900879, "global_step": 12123, "epoch": 100} {"train_loss": -24.88856315612793, "global_step": 12124, "epoch": 100} {"train_loss": -25.351154327392578, "global_step": 12125, "epoch": 100} {"train_loss": -25.549596786499023, "global_step": 12126, "epoch": 100} {"train_loss": -25.047147750854492, "global_step": 12127, "epoch": 100} {"train_loss": -25.31504249572754, "global_step": 12128, "epoch": 100} {"train_loss": -25.598791122436523, "global_step": 12129, "epoch": 100} {"train_loss": -25.26651382446289, "global_step": 12130, "epoch": 100} {"train_loss": -24.811981201171875, "global_step": 12131, "epoch": 100} {"train_loss": -24.976037979125977, "global_step": 12132, "epoch": 100} {"train_loss": -25.322385787963867, "global_step": 12133, "epoch": 100} {"train_loss": -25.562570571899414, "global_step": 12134, "epoch": 100} {"train_loss": -25.441938400268555, "global_step": 12135, "epoch": 100} {"train_loss": -25.290451049804688, "global_step": 12136, "epoch": 100} {"train_loss": -24.8648681640625, "global_step": 12137, "epoch": 100} {"train_loss": -25.595829010009766, "global_step": 12138, "epoch": 100} {"train_loss": -25.582733154296875, "global_step": 12139, "epoch": 100} {"train_loss": -25.033172607421875, "global_step": 12140, "epoch": 100} {"train_loss": -25.41754913330078, "global_step": 12141, "epoch": 100} {"train_loss": -25.375471115112305, "global_step": 12142, "epoch": 100} {"train_loss": -24.858869552612305, "global_step": 12143, "epoch": 100} {"train_loss": -24.45366096496582, "global_step": 12144, "epoch": 100} {"train_loss": -25.640661239624023, "global_step": 12145, "epoch": 100} {"train_loss": -25.44200897216797, "global_step": 12146, "epoch": 100} {"train_loss": -25.59523582458496, "global_step": 12147, "epoch": 100} {"train_loss": -26.0406494140625, "global_step": 12148, "epoch": 100} {"train_loss": -25.599775314331055, "global_step": 12149, "epoch": 100} {"train_loss": -25.635915756225586, "global_step": 12150, "epoch": 100} {"train_loss": -25.665781021118164, "global_step": 12151, "epoch": 100} {"train_loss": -24.86888313293457, "global_step": 12152, "epoch": 100} {"train_loss": -25.902729034423828, "global_step": 12153, "epoch": 100} {"train_loss": -25.576568603515625, "global_step": 12154, "epoch": 100} {"train_loss": -25.809406280517578, "global_step": 12155, "epoch": 100} {"train_loss": -25.818252563476562, "global_step": 12156, "epoch": 100} {"train_loss": -25.37152671813965, "global_step": 12157, "epoch": 100} {"train_loss": -25.39266014099121, "global_step": 12158, "epoch": 100} {"train_loss": -26.222219467163086, "global_step": 12159, "epoch": 100} {"train_loss": -25.718000411987305, "global_step": 12160, "epoch": 100} {"train_loss": -25.841455459594727, "global_step": 12161, "epoch": 100} {"train_loss": -25.443496704101562, "global_step": 12162, "epoch": 100} {"train_loss": -25.897247314453125, "global_step": 12163, "epoch": 100} {"train_loss": -25.81048583984375, "global_step": 12164, "epoch": 100} {"train_loss": -25.856237411499023, "global_step": 12165, "epoch": 100} {"train_loss": -25.74531364440918, "global_step": 12166, "epoch": 100} {"train_loss": -25.620859146118164, "global_step": 12167, "epoch": 100} {"train_loss": -25.937549591064453, "global_step": 12168, "epoch": 100} {"train_loss": -25.975830078125, "global_step": 12169, "epoch": 100} {"train_loss": -25.636423110961914, "global_step": 12170, "epoch": 100} {"train_loss": -25.434457778930664, "global_step": 12171, "epoch": 100} {"train_loss": -26.276248931884766, "global_step": 12172, "epoch": 100} {"train_loss": -25.77744483947754, "global_step": 12173, "epoch": 100} {"train_loss": -26.043771743774414, "global_step": 12174, "epoch": 100} {"train_loss": -26.024368286132812, "global_step": 12175, "epoch": 100} {"train_loss": -25.382474899291992, "global_step": 12176, "epoch": 100} {"train_loss": -26.1406307220459, "global_step": 12177, "epoch": 100} {"train_loss": -26.122175216674805, "global_step": 12178, "epoch": 100} {"train_loss": -25.875640869140625, "global_step": 12179, "epoch": 100} {"train_loss": -26.31927490234375, "global_step": 12180, "epoch": 100} {"train_loss": -25.544233322143555, "global_step": 12181, "epoch": 100} {"train_loss": -26.356719970703125, "global_step": 12182, "epoch": 100} {"train_loss": -25.95376968383789, "global_step": 12183, "epoch": 100} {"train_loss": -25.436704635620117, "global_step": 12184, "epoch": 100} {"train_loss": -25.7838191986084, "global_step": 12185, "epoch": 100} {"train_loss": -25.324466705322266, "global_step": 12186, "epoch": 100} {"train_loss": -26.174665451049805, "global_step": 12187, "epoch": 100} {"train_loss": -25.52895164489746, "global_step": 12188, "epoch": 100} {"train_loss": -22.577682495117188, "global_step": 12189, "epoch": 100} {"train_loss": -19.054819107055664, "global_step": 12190, "epoch": 100} {"train_loss": -22.8664608001709, "global_step": 12191, "epoch": 100} {"train_loss": -23.21587371826172, "global_step": 12192, "epoch": 100} {"train_loss": -20.550321578979492, "global_step": 12193, "epoch": 100} {"train_loss": -23.981159210205078, "global_step": 12194, "epoch": 100} {"train_loss": -22.57618522644043, "global_step": 12195, "epoch": 100} {"train_loss": -23.53608512878418, "global_step": 12196, "epoch": 100} {"train_loss": -24.721364974975586, "global_step": 12197, "epoch": 100} {"train_loss": -22.879255294799805, "global_step": 12198, "epoch": 100} {"train_loss": -24.592561721801758, "global_step": 12199, "epoch": 100} {"train_loss": -24.256908416748047, "global_step": 12200, "epoch": 100} {"train_loss": -24.589643478393555, "global_step": 12201, "epoch": 100} {"train_loss": -24.03396987915039, "global_step": 12202, "epoch": 100} {"train_loss": -24.334627151489258, "global_step": 12203, "epoch": 100} {"train_loss": -24.35580825805664, "global_step": 12204, "epoch": 100} {"train_loss": -24.434947967529297, "global_step": 12205, "epoch": 100} {"train_loss": -25.232603073120117, "global_step": 12206, "epoch": 100} {"train_loss": -24.585346221923828, "global_step": 12207, "epoch": 100} {"train_loss": -25.21615982055664, "global_step": 12208, "epoch": 100} {"train_loss": -24.37073516845703, "global_step": 12209, "epoch": 100} {"train_loss": -24.421905517578125, "global_step": 12210, "epoch": 100} {"train_loss": -24.504947662353516, "global_step": 12211, "epoch": 100} {"train_loss": -24.766931533813477, "global_step": 12212, "epoch": 100} {"train_loss": -25.363529205322266, "global_step": 12213, "epoch": 100} {"train_loss": -25.37601661682129, "global_step": 12214, "epoch": 100} {"train_loss": -24.887821197509766, "global_step": 12215, "epoch": 100} {"train_loss": -24.63973045349121, "global_step": 12216, "epoch": 100} {"train_loss": -24.385799407958984, "global_step": 12217, "epoch": 100} {"train_loss": -25.1472110748291, "global_step": 12218, "epoch": 100} {"train_loss": -24.67706871032715, "global_step": 12219, "epoch": 100} {"train_loss": -25.084140131296206, "global_step": 12220, "epoch": 100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2554765.75} {"train_loss": -24.470306396484375, "global_step": 12221, "epoch": 101} {"train_loss": -25.02503776550293, "global_step": 12222, "epoch": 101} {"train_loss": -24.56817626953125, "global_step": 12223, "epoch": 101} {"train_loss": -25.306684494018555, "global_step": 12224, "epoch": 101} {"train_loss": -24.246768951416016, "global_step": 12225, "epoch": 101} {"train_loss": -25.35529327392578, "global_step": 12226, "epoch": 101} {"train_loss": -24.82582664489746, "global_step": 12227, "epoch": 101} {"train_loss": -24.8824462890625, "global_step": 12228, "epoch": 101} {"train_loss": -25.530271530151367, "global_step": 12229, "epoch": 101} {"train_loss": -24.423389434814453, "global_step": 12230, "epoch": 101} {"train_loss": -25.32241439819336, "global_step": 12231, "epoch": 101} {"train_loss": -24.691864013671875, "global_step": 12232, "epoch": 101} {"train_loss": -24.507221221923828, "global_step": 12233, "epoch": 101} {"train_loss": -25.323413848876953, "global_step": 12234, "epoch": 101} {"train_loss": -25.187637329101562, "global_step": 12235, "epoch": 101} {"train_loss": -24.43560028076172, "global_step": 12236, "epoch": 101} {"train_loss": -25.446197509765625, "global_step": 12237, "epoch": 101} {"train_loss": -25.23487663269043, "global_step": 12238, "epoch": 101} {"train_loss": -25.19768524169922, "global_step": 12239, "epoch": 101} {"train_loss": -25.537012100219727, "global_step": 12240, "epoch": 101} {"train_loss": -25.43589210510254, "global_step": 12241, "epoch": 101} {"train_loss": -25.548900604248047, "global_step": 12242, "epoch": 101} {"train_loss": -25.57371711730957, "global_step": 12243, "epoch": 101} {"train_loss": -25.789831161499023, "global_step": 12244, "epoch": 101} {"train_loss": -25.459909439086914, "global_step": 12245, "epoch": 101} {"train_loss": -25.722558975219727, "global_step": 12246, "epoch": 101} {"train_loss": -25.7484073638916, "global_step": 12247, "epoch": 101} {"train_loss": -25.85507583618164, "global_step": 12248, "epoch": 101} {"train_loss": -26.1268253326416, "global_step": 12249, "epoch": 101} {"train_loss": -25.540822982788086, "global_step": 12250, "epoch": 101} {"train_loss": -25.917083740234375, "global_step": 12251, "epoch": 101} {"train_loss": -26.10322380065918, "global_step": 12252, "epoch": 101} {"train_loss": -25.361852645874023, "global_step": 12253, "epoch": 101} {"train_loss": -26.135669708251953, "global_step": 12254, "epoch": 101} {"train_loss": -25.80632972717285, "global_step": 12255, "epoch": 101} {"train_loss": -25.895105361938477, "global_step": 12256, "epoch": 101} {"train_loss": -25.6812686920166, "global_step": 12257, "epoch": 101} {"train_loss": -25.2880859375, "global_step": 12258, "epoch": 101} {"train_loss": -24.069482803344727, "global_step": 12259, "epoch": 101} {"train_loss": -23.66848373413086, "global_step": 12260, "epoch": 101} {"train_loss": -23.860570907592773, "global_step": 12261, "epoch": 101} {"train_loss": -24.86121940612793, "global_step": 12262, "epoch": 101} {"train_loss": -26.121870040893555, "global_step": 12263, "epoch": 101} {"train_loss": -25.615034103393555, "global_step": 12264, "epoch": 101} {"train_loss": -25.504045486450195, "global_step": 12265, "epoch": 101} {"train_loss": -25.675628662109375, "global_step": 12266, "epoch": 101} {"train_loss": -25.68013572692871, "global_step": 12267, "epoch": 101} {"train_loss": -25.762149810791016, "global_step": 12268, "epoch": 101} {"train_loss": -26.09589195251465, "global_step": 12269, "epoch": 101} {"train_loss": -26.08106803894043, "global_step": 12270, "epoch": 101} {"train_loss": -25.98024559020996, "global_step": 12271, "epoch": 101} {"train_loss": -26.2756404876709, "global_step": 12272, "epoch": 101} {"train_loss": -26.25623893737793, "global_step": 12273, "epoch": 101} {"train_loss": -26.17311668395996, "global_step": 12274, "epoch": 101} {"train_loss": -25.929025650024414, "global_step": 12275, "epoch": 101} {"train_loss": -25.961973190307617, "global_step": 12276, "epoch": 101} {"train_loss": -26.064727783203125, "global_step": 12277, "epoch": 101} {"train_loss": -25.668264389038086, "global_step": 12278, "epoch": 101} {"train_loss": -25.43326759338379, "global_step": 12279, "epoch": 101} {"train_loss": -25.61347007751465, "global_step": 12280, "epoch": 101} {"train_loss": -25.681396484375, "global_step": 12281, "epoch": 101} {"train_loss": -26.06622314453125, "global_step": 12282, "epoch": 101} {"train_loss": -25.744836807250977, "global_step": 12283, "epoch": 101} {"train_loss": -26.167516708374023, "global_step": 12284, "epoch": 101} {"train_loss": -26.141204833984375, "global_step": 12285, "epoch": 101} {"train_loss": -25.849811553955078, "global_step": 12286, "epoch": 101} {"train_loss": -25.545312881469727, "global_step": 12287, "epoch": 101} {"train_loss": -25.915298461914062, "global_step": 12288, "epoch": 101} {"train_loss": -26.002368927001953, "global_step": 12289, "epoch": 101} {"train_loss": -25.29365348815918, "global_step": 12290, "epoch": 101} {"train_loss": -24.316930770874023, "global_step": 12291, "epoch": 101} {"train_loss": -26.279932022094727, "global_step": 12292, "epoch": 101} {"train_loss": -26.405004501342773, "global_step": 12293, "epoch": 101} {"train_loss": -24.078163146972656, "global_step": 12294, "epoch": 101} {"train_loss": -24.228055953979492, "global_step": 12295, "epoch": 101} {"train_loss": -23.58416748046875, "global_step": 12296, "epoch": 101} {"train_loss": -24.432987213134766, "global_step": 12297, "epoch": 101} {"train_loss": -25.625335693359375, "global_step": 12298, "epoch": 101} {"train_loss": -24.267959594726562, "global_step": 12299, "epoch": 101} {"train_loss": -25.360448837280273, "global_step": 12300, "epoch": 101} {"train_loss": -24.598041534423828, "global_step": 12301, "epoch": 101} {"train_loss": -25.688440322875977, "global_step": 12302, "epoch": 101} {"train_loss": -25.371667861938477, "global_step": 12303, "epoch": 101} {"train_loss": -24.759366989135742, "global_step": 12304, "epoch": 101} {"train_loss": -25.53902816772461, "global_step": 12305, "epoch": 101} {"train_loss": -25.351125717163086, "global_step": 12306, "epoch": 101} {"train_loss": -25.618459701538086, "global_step": 12307, "epoch": 101} {"train_loss": -25.47498893737793, "global_step": 12308, "epoch": 101} {"train_loss": -26.21323013305664, "global_step": 12309, "epoch": 101} {"train_loss": -25.758047103881836, "global_step": 12310, "epoch": 101} {"train_loss": -25.521974563598633, "global_step": 12311, "epoch": 101} {"train_loss": -25.915557861328125, "global_step": 12312, "epoch": 101} {"train_loss": -25.550691604614258, "global_step": 12313, "epoch": 101} {"train_loss": -25.56983757019043, "global_step": 12314, "epoch": 101} {"train_loss": -25.6398983001709, "global_step": 12315, "epoch": 101} {"train_loss": -26.15900993347168, "global_step": 12316, "epoch": 101} {"train_loss": -25.7544002532959, "global_step": 12317, "epoch": 101} {"train_loss": -26.05072593688965, "global_step": 12318, "epoch": 101} {"train_loss": -26.170001983642578, "global_step": 12319, "epoch": 101} {"train_loss": -26.03228759765625, "global_step": 12320, "epoch": 101} {"train_loss": -25.492719650268555, "global_step": 12321, "epoch": 101} {"train_loss": -26.01766014099121, "global_step": 12322, "epoch": 101} {"train_loss": -24.984634399414062, "global_step": 12323, "epoch": 101} {"train_loss": -24.295652389526367, "global_step": 12324, "epoch": 101} {"train_loss": -25.249231338500977, "global_step": 12325, "epoch": 101} {"train_loss": -25.9097957611084, "global_step": 12326, "epoch": 101} {"train_loss": -24.05974578857422, "global_step": 12327, "epoch": 101} {"train_loss": -22.754850387573242, "global_step": 12328, "epoch": 101} {"train_loss": -25.144378662109375, "global_step": 12329, "epoch": 101} {"train_loss": -25.27744483947754, "global_step": 12330, "epoch": 101} {"train_loss": -22.499271392822266, "global_step": 12331, "epoch": 101} {"train_loss": -25.99314308166504, "global_step": 12332, "epoch": 101} {"train_loss": -24.475400924682617, "global_step": 12333, "epoch": 101} {"train_loss": -25.73725700378418, "global_step": 12334, "epoch": 101} {"train_loss": -25.519880294799805, "global_step": 12335, "epoch": 101} {"train_loss": -26.031579971313477, "global_step": 12336, "epoch": 101} {"train_loss": -25.42475128173828, "global_step": 12337, "epoch": 101} {"train_loss": -26.01922607421875, "global_step": 12338, "epoch": 101} {"train_loss": -25.28587532043457, "global_step": 12339, "epoch": 101} {"train_loss": -25.9825439453125, "global_step": 12340, "epoch": 101} {"train_loss": -25.390234088109544, "global_step": 12341, "epoch": 101, "val_loss": 2566852.5} {"train_loss": -25.54939842224121, "global_step": 12342, "epoch": 102} {"train_loss": -25.9962158203125, "global_step": 12343, "epoch": 102} {"train_loss": -25.818897247314453, "global_step": 12344, "epoch": 102} {"train_loss": -25.342744827270508, "global_step": 12345, "epoch": 102} {"train_loss": -25.419355392456055, "global_step": 12346, "epoch": 102} {"train_loss": -25.805875778198242, "global_step": 12347, "epoch": 102} {"train_loss": -26.091474533081055, "global_step": 12348, "epoch": 102} {"train_loss": -26.142370223999023, "global_step": 12349, "epoch": 102} {"train_loss": -25.70426368713379, "global_step": 12350, "epoch": 102} {"train_loss": -26.1567325592041, "global_step": 12351, "epoch": 102} {"train_loss": -25.785680770874023, "global_step": 12352, "epoch": 102} {"train_loss": -25.890851974487305, "global_step": 12353, "epoch": 102} {"train_loss": -26.04274559020996, "global_step": 12354, "epoch": 102} {"train_loss": -25.71826171875, "global_step": 12355, "epoch": 102} {"train_loss": -26.17543601989746, "global_step": 12356, "epoch": 102} {"train_loss": -26.1365909576416, "global_step": 12357, "epoch": 102} {"train_loss": -25.78961753845215, "global_step": 12358, "epoch": 102} {"train_loss": -24.851606369018555, "global_step": 12359, "epoch": 102} {"train_loss": -25.178388595581055, "global_step": 12360, "epoch": 102} {"train_loss": -25.756317138671875, "global_step": 12361, "epoch": 102} {"train_loss": -25.29896354675293, "global_step": 12362, "epoch": 102} {"train_loss": -26.131855010986328, "global_step": 12363, "epoch": 102} {"train_loss": -26.21795654296875, "global_step": 12364, "epoch": 102} {"train_loss": -24.69723129272461, "global_step": 12365, "epoch": 102} {"train_loss": -24.237943649291992, "global_step": 12366, "epoch": 102} {"train_loss": -25.55562973022461, "global_step": 12367, "epoch": 102} {"train_loss": -26.22587013244629, "global_step": 12368, "epoch": 102} {"train_loss": -25.572420120239258, "global_step": 12369, "epoch": 102} {"train_loss": -25.647232055664062, "global_step": 12370, "epoch": 102} {"train_loss": -25.592117309570312, "global_step": 12371, "epoch": 102} {"train_loss": -26.114328384399414, "global_step": 12372, "epoch": 102} {"train_loss": -25.742116928100586, "global_step": 12373, "epoch": 102} {"train_loss": -26.186872482299805, "global_step": 12374, "epoch": 102} {"train_loss": -26.03497886657715, "global_step": 12375, "epoch": 102} {"train_loss": -25.963171005249023, "global_step": 12376, "epoch": 102} {"train_loss": -26.089269638061523, "global_step": 12377, "epoch": 102} {"train_loss": -26.169031143188477, "global_step": 12378, "epoch": 102} {"train_loss": -25.373708724975586, "global_step": 12379, "epoch": 102} {"train_loss": -26.04755973815918, "global_step": 12380, "epoch": 102} {"train_loss": -26.222660064697266, "global_step": 12381, "epoch": 102} {"train_loss": -25.577146530151367, "global_step": 12382, "epoch": 102} {"train_loss": -25.506500244140625, "global_step": 12383, "epoch": 102} {"train_loss": -26.26130485534668, "global_step": 12384, "epoch": 102} {"train_loss": -25.489686965942383, "global_step": 12385, "epoch": 102} {"train_loss": -25.53778648376465, "global_step": 12386, "epoch": 102} {"train_loss": -26.236316680908203, "global_step": 12387, "epoch": 102} {"train_loss": -25.529443740844727, "global_step": 12388, "epoch": 102} {"train_loss": -24.774423599243164, "global_step": 12389, "epoch": 102} {"train_loss": -25.748910903930664, "global_step": 12390, "epoch": 102} {"train_loss": -25.503496170043945, "global_step": 12391, "epoch": 102} {"train_loss": -26.300973892211914, "global_step": 12392, "epoch": 102} {"train_loss": -25.58436393737793, "global_step": 12393, "epoch": 102} {"train_loss": -26.67451286315918, "global_step": 12394, "epoch": 102} {"train_loss": -25.918405532836914, "global_step": 12395, "epoch": 102} {"train_loss": -26.38641929626465, "global_step": 12396, "epoch": 102} {"train_loss": -26.231311798095703, "global_step": 12397, "epoch": 102} {"train_loss": -25.952987670898438, "global_step": 12398, "epoch": 102} {"train_loss": -26.271772384643555, "global_step": 12399, "epoch": 102} {"train_loss": -26.060651779174805, "global_step": 12400, "epoch": 102} {"train_loss": -26.56070327758789, "global_step": 12401, "epoch": 102} {"train_loss": -26.088586807250977, "global_step": 12402, "epoch": 102} {"train_loss": -25.638830184936523, "global_step": 12403, "epoch": 102} {"train_loss": -25.81559181213379, "global_step": 12404, "epoch": 102} {"train_loss": -25.549612045288086, "global_step": 12405, "epoch": 102} {"train_loss": -26.701162338256836, "global_step": 12406, "epoch": 102} {"train_loss": -25.577693939208984, "global_step": 12407, "epoch": 102} {"train_loss": -26.23832130432129, "global_step": 12408, "epoch": 102} {"train_loss": -26.162946701049805, "global_step": 12409, "epoch": 102} {"train_loss": -26.01192283630371, "global_step": 12410, "epoch": 102} {"train_loss": -25.9318904876709, "global_step": 12411, "epoch": 102} {"train_loss": -25.707550048828125, "global_step": 12412, "epoch": 102} {"train_loss": -25.772125244140625, "global_step": 12413, "epoch": 102} {"train_loss": -26.03742027282715, "global_step": 12414, "epoch": 102} {"train_loss": -25.845661163330078, "global_step": 12415, "epoch": 102} {"train_loss": -25.639822006225586, "global_step": 12416, "epoch": 102} {"train_loss": -25.64606285095215, "global_step": 12417, "epoch": 102} {"train_loss": -25.324167251586914, "global_step": 12418, "epoch": 102} {"train_loss": -25.644277572631836, "global_step": 12419, "epoch": 102} {"train_loss": -22.669092178344727, "global_step": 12420, "epoch": 102} {"train_loss": -21.26959800720215, "global_step": 12421, "epoch": 102} {"train_loss": -22.316495895385742, "global_step": 12422, "epoch": 102} {"train_loss": -23.913089752197266, "global_step": 12423, "epoch": 102} {"train_loss": -21.399938583374023, "global_step": 12424, "epoch": 102} {"train_loss": -23.688989639282227, "global_step": 12425, "epoch": 102} {"train_loss": -24.923572540283203, "global_step": 12426, "epoch": 102} {"train_loss": -24.64017677307129, "global_step": 12427, "epoch": 102} {"train_loss": -25.250507354736328, "global_step": 12428, "epoch": 102} {"train_loss": -25.165103912353516, "global_step": 12429, "epoch": 102} {"train_loss": -25.463382720947266, "global_step": 12430, "epoch": 102} {"train_loss": -25.76727867126465, "global_step": 12431, "epoch": 102} {"train_loss": -25.2285099029541, "global_step": 12432, "epoch": 102} {"train_loss": -25.577070236206055, "global_step": 12433, "epoch": 102} {"train_loss": -25.489736557006836, "global_step": 12434, "epoch": 102} {"train_loss": -25.395051956176758, "global_step": 12435, "epoch": 102} {"train_loss": -25.25428581237793, "global_step": 12436, "epoch": 102} {"train_loss": -25.286701202392578, "global_step": 12437, "epoch": 102} {"train_loss": -25.383792877197266, "global_step": 12438, "epoch": 102} {"train_loss": -25.25669288635254, "global_step": 12439, "epoch": 102} {"train_loss": -25.75897216796875, "global_step": 12440, "epoch": 102} {"train_loss": -25.45699119567871, "global_step": 12441, "epoch": 102} {"train_loss": -25.70136833190918, "global_step": 12442, "epoch": 102} {"train_loss": -24.937637329101562, "global_step": 12443, "epoch": 102} {"train_loss": -25.335674285888672, "global_step": 12444, "epoch": 102} {"train_loss": -26.04365348815918, "global_step": 12445, "epoch": 102} {"train_loss": -25.809873580932617, "global_step": 12446, "epoch": 102} {"train_loss": -24.10405158996582, "global_step": 12447, "epoch": 102} {"train_loss": -23.875324249267578, "global_step": 12448, "epoch": 102} {"train_loss": -25.391456604003906, "global_step": 12449, "epoch": 102} {"train_loss": -25.350149154663086, "global_step": 12450, "epoch": 102} {"train_loss": -24.951641082763672, "global_step": 12451, "epoch": 102} {"train_loss": -25.853952407836914, "global_step": 12452, "epoch": 102} {"train_loss": -24.78830337524414, "global_step": 12453, "epoch": 102} {"train_loss": -24.83555030822754, "global_step": 12454, "epoch": 102} {"train_loss": -26.026758193969727, "global_step": 12455, "epoch": 102} {"train_loss": -25.000686645507812, "global_step": 12456, "epoch": 102} {"train_loss": -25.593015670776367, "global_step": 12457, "epoch": 102} {"train_loss": -25.78229331970215, "global_step": 12458, "epoch": 102} {"train_loss": -25.772052764892578, "global_step": 12459, "epoch": 102} {"train_loss": -26.312543869018555, "global_step": 12460, "epoch": 102} {"train_loss": -26.264036178588867, "global_step": 12461, "epoch": 102} {"train_loss": -25.519691120494496, "global_step": 12462, "epoch": 102, "val_loss": 3147449.75} {"train_loss": -26.032672882080078, "global_step": 12463, "epoch": 103} {"train_loss": -26.243188858032227, "global_step": 12464, "epoch": 103} {"train_loss": -26.239912033081055, "global_step": 12465, "epoch": 103} {"train_loss": -26.23831558227539, "global_step": 12466, "epoch": 103} {"train_loss": -26.064130783081055, "global_step": 12467, "epoch": 103} {"train_loss": -26.142114639282227, "global_step": 12468, "epoch": 103} {"train_loss": -26.036008834838867, "global_step": 12469, "epoch": 103} {"train_loss": -26.600854873657227, "global_step": 12470, "epoch": 103} {"train_loss": -26.005117416381836, "global_step": 12471, "epoch": 103} {"train_loss": -26.58221435546875, "global_step": 12472, "epoch": 103} {"train_loss": -26.3795166015625, "global_step": 12473, "epoch": 103} {"train_loss": -26.65278434753418, "global_step": 12474, "epoch": 103} {"train_loss": -26.215269088745117, "global_step": 12475, "epoch": 103} {"train_loss": -26.2038516998291, "global_step": 12476, "epoch": 103} {"train_loss": -26.36530113220215, "global_step": 12477, "epoch": 103} {"train_loss": -26.5203857421875, "global_step": 12478, "epoch": 103} {"train_loss": -26.744443893432617, "global_step": 12479, "epoch": 103} {"train_loss": -26.370336532592773, "global_step": 12480, "epoch": 103} {"train_loss": -26.2088623046875, "global_step": 12481, "epoch": 103} {"train_loss": -25.891645431518555, "global_step": 12482, "epoch": 103} {"train_loss": -24.99226188659668, "global_step": 12483, "epoch": 103} {"train_loss": -24.132225036621094, "global_step": 12484, "epoch": 103} {"train_loss": -23.916532516479492, "global_step": 12485, "epoch": 103} {"train_loss": -24.80653190612793, "global_step": 12486, "epoch": 103} {"train_loss": -25.778644561767578, "global_step": 12487, "epoch": 103} {"train_loss": -25.972768783569336, "global_step": 12488, "epoch": 103} {"train_loss": -26.034271240234375, "global_step": 12489, "epoch": 103} {"train_loss": -25.92604637145996, "global_step": 12490, "epoch": 103} {"train_loss": -25.360857009887695, "global_step": 12491, "epoch": 103} {"train_loss": -26.068872451782227, "global_step": 12492, "epoch": 103} {"train_loss": -25.59015655517578, "global_step": 12493, "epoch": 103} {"train_loss": -25.669530868530273, "global_step": 12494, "epoch": 103} {"train_loss": -26.00458335876465, "global_step": 12495, "epoch": 103} {"train_loss": -25.976102828979492, "global_step": 12496, "epoch": 103} {"train_loss": -24.885154724121094, "global_step": 12497, "epoch": 103} {"train_loss": -25.794727325439453, "global_step": 12498, "epoch": 103} {"train_loss": -25.144119262695312, "global_step": 12499, "epoch": 103} {"train_loss": -26.23238182067871, "global_step": 12500, "epoch": 103} {"train_loss": -25.64398193359375, "global_step": 12501, "epoch": 103} {"train_loss": -25.939855575561523, "global_step": 12502, "epoch": 103} {"train_loss": -25.861175537109375, "global_step": 12503, "epoch": 103} {"train_loss": -25.29444694519043, "global_step": 12504, "epoch": 103} {"train_loss": -26.322546005249023, "global_step": 12505, "epoch": 103} {"train_loss": -25.988309860229492, "global_step": 12506, "epoch": 103} {"train_loss": -26.234607696533203, "global_step": 12507, "epoch": 103} {"train_loss": -25.948766708374023, "global_step": 12508, "epoch": 103} {"train_loss": -26.081989288330078, "global_step": 12509, "epoch": 103} {"train_loss": -25.714096069335938, "global_step": 12510, "epoch": 103} {"train_loss": -26.068281173706055, "global_step": 12511, "epoch": 103} {"train_loss": -26.435993194580078, "global_step": 12512, "epoch": 103} {"train_loss": -26.15087890625, "global_step": 12513, "epoch": 103} {"train_loss": -25.996662139892578, "global_step": 12514, "epoch": 103} {"train_loss": -26.173376083374023, "global_step": 12515, "epoch": 103} {"train_loss": -26.0308837890625, "global_step": 12516, "epoch": 103} {"train_loss": -25.940296173095703, "global_step": 12517, "epoch": 103} {"train_loss": -25.06495475769043, "global_step": 12518, "epoch": 103} {"train_loss": -25.60664176940918, "global_step": 12519, "epoch": 103} {"train_loss": -26.098005294799805, "global_step": 12520, "epoch": 103} {"train_loss": -26.270986557006836, "global_step": 12521, "epoch": 103} {"train_loss": -25.302072525024414, "global_step": 12522, "epoch": 103} {"train_loss": -22.81369972229004, "global_step": 12523, "epoch": 103} {"train_loss": -13.578149795532227, "global_step": 12524, "epoch": 103} {"train_loss": 18.524389266967773, "global_step": 12525, "epoch": 103} {"train_loss": 1.3613226413726807, "global_step": 12526, "epoch": 103} {"train_loss": -19.860916137695312, "global_step": 12527, "epoch": 103} {"train_loss": -19.321664810180664, "global_step": 12528, "epoch": 103} {"train_loss": -15.812219619750977, "global_step": 12529, "epoch": 103} {"train_loss": -20.96170997619629, "global_step": 12530, "epoch": 103} {"train_loss": -22.90303611755371, "global_step": 12531, "epoch": 103} {"train_loss": -23.11329460144043, "global_step": 12532, "epoch": 103} {"train_loss": -21.940046310424805, "global_step": 12533, "epoch": 103} {"train_loss": -21.59067726135254, "global_step": 12534, "epoch": 103} {"train_loss": -21.086936950683594, "global_step": 12535, "epoch": 103} {"train_loss": -22.522226333618164, "global_step": 12536, "epoch": 103} {"train_loss": -22.8916015625, "global_step": 12537, "epoch": 103} {"train_loss": -23.612028121948242, "global_step": 12538, "epoch": 103} {"train_loss": -23.686830520629883, "global_step": 12539, "epoch": 103} {"train_loss": -23.84691619873047, "global_step": 12540, "epoch": 103} {"train_loss": -23.863914489746094, "global_step": 12541, "epoch": 103} {"train_loss": -23.837507247924805, "global_step": 12542, "epoch": 103} {"train_loss": -24.173376083374023, "global_step": 12543, "epoch": 103} {"train_loss": -23.92940330505371, "global_step": 12544, "epoch": 103} {"train_loss": -23.827117919921875, "global_step": 12545, "epoch": 103} {"train_loss": -23.977737426757812, "global_step": 12546, "epoch": 103} {"train_loss": -24.06165885925293, "global_step": 12547, "epoch": 103} {"train_loss": -23.681575775146484, "global_step": 12548, "epoch": 103} {"train_loss": -24.120468139648438, "global_step": 12549, "epoch": 103} {"train_loss": -24.469694137573242, "global_step": 12550, "epoch": 103} {"train_loss": -24.307111740112305, "global_step": 12551, "epoch": 103} {"train_loss": -24.54342269897461, "global_step": 12552, "epoch": 103} {"train_loss": -23.894010543823242, "global_step": 12553, "epoch": 103} {"train_loss": -24.608198165893555, "global_step": 12554, "epoch": 103} {"train_loss": -24.700944900512695, "global_step": 12555, "epoch": 103} {"train_loss": -24.419509887695312, "global_step": 12556, "epoch": 103} {"train_loss": -24.59321403503418, "global_step": 12557, "epoch": 103} {"train_loss": -24.638675689697266, "global_step": 12558, "epoch": 103} {"train_loss": -24.85993194580078, "global_step": 12559, "epoch": 103} {"train_loss": -24.921140670776367, "global_step": 12560, "epoch": 103} {"train_loss": -24.8087100982666, "global_step": 12561, "epoch": 103} {"train_loss": -25.42466163635254, "global_step": 12562, "epoch": 103} {"train_loss": -25.131099700927734, "global_step": 12563, "epoch": 103} {"train_loss": -24.969234466552734, "global_step": 12564, "epoch": 103} {"train_loss": -25.21319007873535, "global_step": 12565, "epoch": 103} {"train_loss": -24.81251335144043, "global_step": 12566, "epoch": 103} {"train_loss": -24.853721618652344, "global_step": 12567, "epoch": 103} {"train_loss": -25.457319259643555, "global_step": 12568, "epoch": 103} {"train_loss": -24.982120513916016, "global_step": 12569, "epoch": 103} {"train_loss": -24.788780212402344, "global_step": 12570, "epoch": 103} {"train_loss": -25.397418975830078, "global_step": 12571, "epoch": 103} {"train_loss": -25.080810546875, "global_step": 12572, "epoch": 103} {"train_loss": -24.934322357177734, "global_step": 12573, "epoch": 103} {"train_loss": -25.30291748046875, "global_step": 12574, "epoch": 103} {"train_loss": -25.000999450683594, "global_step": 12575, "epoch": 103} {"train_loss": -25.33066177368164, "global_step": 12576, "epoch": 103} {"train_loss": -25.221750259399414, "global_step": 12577, "epoch": 103} {"train_loss": -24.605009078979492, "global_step": 12578, "epoch": 103} {"train_loss": -24.437448501586914, "global_step": 12579, "epoch": 103} {"train_loss": -23.7354793548584, "global_step": 12580, "epoch": 103} {"train_loss": -23.4969539642334, "global_step": 12581, "epoch": 103} {"train_loss": -24.47933006286621, "global_step": 12582, "epoch": 103} {"train_loss": -24.230552151183453, "global_step": 12583, "epoch": 103, "val_loss": 2835914.0} {"train_loss": -24.900196075439453, "global_step": 12584, "epoch": 104} {"train_loss": -23.990276336669922, "global_step": 12585, "epoch": 104} {"train_loss": -24.05176544189453, "global_step": 12586, "epoch": 104} {"train_loss": -24.48224449157715, "global_step": 12587, "epoch": 104} {"train_loss": -25.277366638183594, "global_step": 12588, "epoch": 104} {"train_loss": -23.82337760925293, "global_step": 12589, "epoch": 104} {"train_loss": -23.801664352416992, "global_step": 12590, "epoch": 104} {"train_loss": -24.23188591003418, "global_step": 12591, "epoch": 104} {"train_loss": -24.782987594604492, "global_step": 12592, "epoch": 104} {"train_loss": -24.887853622436523, "global_step": 12593, "epoch": 104} {"train_loss": -23.77889060974121, "global_step": 12594, "epoch": 104} {"train_loss": -24.74549102783203, "global_step": 12595, "epoch": 104} {"train_loss": -25.43667984008789, "global_step": 12596, "epoch": 104} {"train_loss": -24.79509735107422, "global_step": 12597, "epoch": 104} {"train_loss": -24.439966201782227, "global_step": 12598, "epoch": 104} {"train_loss": -24.953866958618164, "global_step": 12599, "epoch": 104} {"train_loss": -25.15259552001953, "global_step": 12600, "epoch": 104} {"train_loss": -24.75503921508789, "global_step": 12601, "epoch": 104} {"train_loss": -24.77625846862793, "global_step": 12602, "epoch": 104} {"train_loss": -24.65157699584961, "global_step": 12603, "epoch": 104} {"train_loss": -25.207902908325195, "global_step": 12604, "epoch": 104} {"train_loss": -25.12452507019043, "global_step": 12605, "epoch": 104} {"train_loss": -24.98940658569336, "global_step": 12606, "epoch": 104} {"train_loss": -25.066553115844727, "global_step": 12607, "epoch": 104} {"train_loss": -24.716684341430664, "global_step": 12608, "epoch": 104} {"train_loss": -24.302703857421875, "global_step": 12609, "epoch": 104} {"train_loss": -25.427274703979492, "global_step": 12610, "epoch": 104} {"train_loss": -24.81708335876465, "global_step": 12611, "epoch": 104} {"train_loss": -23.221538543701172, "global_step": 12612, "epoch": 104} {"train_loss": -24.350961685180664, "global_step": 12613, "epoch": 104} {"train_loss": -25.434226989746094, "global_step": 12614, "epoch": 104} {"train_loss": -24.213109970092773, "global_step": 12615, "epoch": 104} {"train_loss": -24.179258346557617, "global_step": 12616, "epoch": 104} {"train_loss": -24.113609313964844, "global_step": 12617, "epoch": 104} {"train_loss": -24.080060958862305, "global_step": 12618, "epoch": 104} {"train_loss": -23.283466339111328, "global_step": 12619, "epoch": 104} {"train_loss": -24.876585006713867, "global_step": 12620, "epoch": 104} {"train_loss": -23.33228874206543, "global_step": 12621, "epoch": 104} {"train_loss": -24.804468154907227, "global_step": 12622, "epoch": 104} {"train_loss": -23.231290817260742, "global_step": 12623, "epoch": 104} {"train_loss": -24.984899520874023, "global_step": 12624, "epoch": 104} {"train_loss": -23.795841217041016, "global_step": 12625, "epoch": 104} {"train_loss": -24.58692169189453, "global_step": 12626, "epoch": 104} {"train_loss": -24.7972469329834, "global_step": 12627, "epoch": 104} {"train_loss": -24.939502716064453, "global_step": 12628, "epoch": 104} {"train_loss": -25.186384201049805, "global_step": 12629, "epoch": 104} {"train_loss": -25.153181076049805, "global_step": 12630, "epoch": 104} {"train_loss": -25.209918975830078, "global_step": 12631, "epoch": 104} {"train_loss": -24.86502456665039, "global_step": 12632, "epoch": 104} {"train_loss": -25.143665313720703, "global_step": 12633, "epoch": 104} {"train_loss": -25.079282760620117, "global_step": 12634, "epoch": 104} {"train_loss": -25.249008178710938, "global_step": 12635, "epoch": 104} {"train_loss": -25.068628311157227, "global_step": 12636, "epoch": 104} {"train_loss": -24.930646896362305, "global_step": 12637, "epoch": 104} {"train_loss": -24.82905387878418, "global_step": 12638, "epoch": 104} {"train_loss": -24.855010986328125, "global_step": 12639, "epoch": 104} {"train_loss": -24.934324264526367, "global_step": 12640, "epoch": 104} {"train_loss": -24.896438598632812, "global_step": 12641, "epoch": 104} {"train_loss": -25.39284324645996, "global_step": 12642, "epoch": 104} {"train_loss": -25.333242416381836, "global_step": 12643, "epoch": 104} {"train_loss": -24.608234405517578, "global_step": 12644, "epoch": 104} {"train_loss": -25.038543701171875, "global_step": 12645, "epoch": 104} {"train_loss": -24.774152755737305, "global_step": 12646, "epoch": 104} {"train_loss": -25.231014251708984, "global_step": 12647, "epoch": 104} {"train_loss": -25.630773544311523, "global_step": 12648, "epoch": 104} {"train_loss": -25.025299072265625, "global_step": 12649, "epoch": 104} {"train_loss": -25.44569206237793, "global_step": 12650, "epoch": 104} {"train_loss": -25.69266700744629, "global_step": 12651, "epoch": 104} {"train_loss": -25.21173095703125, "global_step": 12652, "epoch": 104} {"train_loss": -25.270465850830078, "global_step": 12653, "epoch": 104} {"train_loss": -25.450590133666992, "global_step": 12654, "epoch": 104} {"train_loss": -24.617338180541992, "global_step": 12655, "epoch": 104} {"train_loss": -25.1562557220459, "global_step": 12656, "epoch": 104} {"train_loss": -25.39145851135254, "global_step": 12657, "epoch": 104} {"train_loss": -25.588184356689453, "global_step": 12658, "epoch": 104} {"train_loss": -25.441679000854492, "global_step": 12659, "epoch": 104} {"train_loss": -25.60532569885254, "global_step": 12660, "epoch": 104} {"train_loss": -25.634973526000977, "global_step": 12661, "epoch": 104} {"train_loss": -25.473920822143555, "global_step": 12662, "epoch": 104} {"train_loss": -25.303190231323242, "global_step": 12663, "epoch": 104} {"train_loss": -25.60524559020996, "global_step": 12664, "epoch": 104} {"train_loss": -25.48097801208496, "global_step": 12665, "epoch": 104} {"train_loss": -25.26314353942871, "global_step": 12666, "epoch": 104} {"train_loss": -25.67030143737793, "global_step": 12667, "epoch": 104} {"train_loss": -25.67923355102539, "global_step": 12668, "epoch": 104} {"train_loss": -25.285707473754883, "global_step": 12669, "epoch": 104} {"train_loss": -25.291242599487305, "global_step": 12670, "epoch": 104} {"train_loss": -25.081632614135742, "global_step": 12671, "epoch": 104} {"train_loss": -25.946073532104492, "global_step": 12672, "epoch": 104} {"train_loss": -24.966949462890625, "global_step": 12673, "epoch": 104} {"train_loss": -25.279590606689453, "global_step": 12674, "epoch": 104} {"train_loss": -24.8658504486084, "global_step": 12675, "epoch": 104} {"train_loss": -25.56288719177246, "global_step": 12676, "epoch": 104} {"train_loss": -25.480850219726562, "global_step": 12677, "epoch": 104} {"train_loss": -25.589872360229492, "global_step": 12678, "epoch": 104} {"train_loss": -25.67276954650879, "global_step": 12679, "epoch": 104} {"train_loss": -25.605899810791016, "global_step": 12680, "epoch": 104} {"train_loss": -25.77631950378418, "global_step": 12681, "epoch": 104} {"train_loss": -25.773178100585938, "global_step": 12682, "epoch": 104} {"train_loss": -25.292760848999023, "global_step": 12683, "epoch": 104} {"train_loss": -25.878711700439453, "global_step": 12684, "epoch": 104} {"train_loss": -24.886783599853516, "global_step": 12685, "epoch": 104} {"train_loss": -25.99072265625, "global_step": 12686, "epoch": 104} {"train_loss": -25.468799591064453, "global_step": 12687, "epoch": 104} {"train_loss": -25.358020782470703, "global_step": 12688, "epoch": 104} {"train_loss": -25.845869064331055, "global_step": 12689, "epoch": 104} {"train_loss": -25.589704513549805, "global_step": 12690, "epoch": 104} {"train_loss": -25.650144577026367, "global_step": 12691, "epoch": 104} {"train_loss": -25.42107582092285, "global_step": 12692, "epoch": 104} {"train_loss": -25.70782470703125, "global_step": 12693, "epoch": 104} {"train_loss": -25.728025436401367, "global_step": 12694, "epoch": 104} {"train_loss": -25.380605697631836, "global_step": 12695, "epoch": 104} {"train_loss": -25.44902229309082, "global_step": 12696, "epoch": 104} {"train_loss": -26.130908966064453, "global_step": 12697, "epoch": 104} {"train_loss": -25.20235824584961, "global_step": 12698, "epoch": 104} {"train_loss": -25.379491806030273, "global_step": 12699, "epoch": 104} {"train_loss": -24.214710235595703, "global_step": 12700, "epoch": 104} {"train_loss": -23.599252700805664, "global_step": 12701, "epoch": 104} {"train_loss": -19.87940788269043, "global_step": 12702, "epoch": 104} {"train_loss": -20.361764907836914, "global_step": 12703, "epoch": 104} {"train_loss": -24.931327268111804, "global_step": 12704, "epoch": 104, "val_loss": 3410415.75} {"train_loss": -22.977205276489258, "global_step": 12705, "epoch": 105} {"train_loss": -22.779617309570312, "global_step": 12706, "epoch": 105} {"train_loss": -24.943174362182617, "global_step": 12707, "epoch": 105} {"train_loss": -22.99587059020996, "global_step": 12708, "epoch": 105} {"train_loss": -24.524864196777344, "global_step": 12709, "epoch": 105} {"train_loss": -23.949359893798828, "global_step": 12710, "epoch": 105} {"train_loss": -24.731470108032227, "global_step": 12711, "epoch": 105} {"train_loss": -24.68671226501465, "global_step": 12712, "epoch": 105} {"train_loss": -24.497594833374023, "global_step": 12713, "epoch": 105} {"train_loss": -24.993682861328125, "global_step": 12714, "epoch": 105} {"train_loss": -24.72330093383789, "global_step": 12715, "epoch": 105} {"train_loss": -24.811994552612305, "global_step": 12716, "epoch": 105} {"train_loss": -25.202743530273438, "global_step": 12717, "epoch": 105} {"train_loss": -25.1889591217041, "global_step": 12718, "epoch": 105} {"train_loss": -25.142526626586914, "global_step": 12719, "epoch": 105} {"train_loss": -25.300537109375, "global_step": 12720, "epoch": 105} {"train_loss": -24.995372772216797, "global_step": 12721, "epoch": 105} {"train_loss": -25.1889705657959, "global_step": 12722, "epoch": 105} {"train_loss": -25.017648696899414, "global_step": 12723, "epoch": 105} {"train_loss": -24.551101684570312, "global_step": 12724, "epoch": 105} {"train_loss": -25.112689971923828, "global_step": 12725, "epoch": 105} {"train_loss": -25.09391212463379, "global_step": 12726, "epoch": 105} {"train_loss": -25.446950912475586, "global_step": 12727, "epoch": 105} {"train_loss": -25.491321563720703, "global_step": 12728, "epoch": 105} {"train_loss": -25.141878128051758, "global_step": 12729, "epoch": 105} {"train_loss": -25.60774040222168, "global_step": 12730, "epoch": 105} {"train_loss": -25.71150016784668, "global_step": 12731, "epoch": 105} {"train_loss": -24.936471939086914, "global_step": 12732, "epoch": 105} {"train_loss": -24.970474243164062, "global_step": 12733, "epoch": 105} {"train_loss": -25.541006088256836, "global_step": 12734, "epoch": 105} {"train_loss": -25.072370529174805, "global_step": 12735, "epoch": 105} {"train_loss": -24.953371047973633, "global_step": 12736, "epoch": 105} {"train_loss": -25.731164932250977, "global_step": 12737, "epoch": 105} {"train_loss": -25.5401554107666, "global_step": 12738, "epoch": 105} {"train_loss": -25.491910934448242, "global_step": 12739, "epoch": 105} {"train_loss": -25.487258911132812, "global_step": 12740, "epoch": 105} {"train_loss": -25.489439010620117, "global_step": 12741, "epoch": 105} {"train_loss": -25.547855377197266, "global_step": 12742, "epoch": 105} {"train_loss": -25.46168327331543, "global_step": 12743, "epoch": 105} {"train_loss": -25.7036190032959, "global_step": 12744, "epoch": 105} {"train_loss": -25.47768211364746, "global_step": 12745, "epoch": 105} {"train_loss": -25.051069259643555, "global_step": 12746, "epoch": 105} {"train_loss": -26.070409774780273, "global_step": 12747, "epoch": 105} {"train_loss": -26.141332626342773, "global_step": 12748, "epoch": 105} {"train_loss": -25.849273681640625, "global_step": 12749, "epoch": 105} {"train_loss": -25.940277099609375, "global_step": 12750, "epoch": 105} {"train_loss": -24.974409103393555, "global_step": 12751, "epoch": 105} {"train_loss": -25.17624282836914, "global_step": 12752, "epoch": 105} {"train_loss": -25.575763702392578, "global_step": 12753, "epoch": 105} {"train_loss": -25.633182525634766, "global_step": 12754, "epoch": 105} {"train_loss": -25.91973876953125, "global_step": 12755, "epoch": 105} {"train_loss": -25.319345474243164, "global_step": 12756, "epoch": 105} {"train_loss": -25.526470184326172, "global_step": 12757, "epoch": 105} {"train_loss": -25.912595748901367, "global_step": 12758, "epoch": 105} {"train_loss": -25.56725311279297, "global_step": 12759, "epoch": 105} {"train_loss": -25.814313888549805, "global_step": 12760, "epoch": 105} {"train_loss": -25.495187759399414, "global_step": 12761, "epoch": 105} {"train_loss": -25.997793197631836, "global_step": 12762, "epoch": 105} {"train_loss": -25.82779884338379, "global_step": 12763, "epoch": 105} {"train_loss": -25.81130027770996, "global_step": 12764, "epoch": 105} {"train_loss": -26.04168701171875, "global_step": 12765, "epoch": 105} {"train_loss": -25.836566925048828, "global_step": 12766, "epoch": 105} {"train_loss": -26.517414093017578, "global_step": 12767, "epoch": 105} {"train_loss": -25.61907386779785, "global_step": 12768, "epoch": 105} {"train_loss": -26.304279327392578, "global_step": 12769, "epoch": 105} {"train_loss": -26.05866050720215, "global_step": 12770, "epoch": 105} {"train_loss": -26.02046775817871, "global_step": 12771, "epoch": 105} {"train_loss": -25.901264190673828, "global_step": 12772, "epoch": 105} {"train_loss": -26.249921798706055, "global_step": 12773, "epoch": 105} {"train_loss": -26.183069229125977, "global_step": 12774, "epoch": 105} {"train_loss": -26.229711532592773, "global_step": 12775, "epoch": 105} {"train_loss": -26.348041534423828, "global_step": 12776, "epoch": 105} {"train_loss": -26.481475830078125, "global_step": 12777, "epoch": 105} {"train_loss": -26.181913375854492, "global_step": 12778, "epoch": 105} {"train_loss": -25.883758544921875, "global_step": 12779, "epoch": 105} {"train_loss": -26.439716339111328, "global_step": 12780, "epoch": 105} {"train_loss": -26.043212890625, "global_step": 12781, "epoch": 105} {"train_loss": -26.472394943237305, "global_step": 12782, "epoch": 105} {"train_loss": -26.249792098999023, "global_step": 12783, "epoch": 105} {"train_loss": -26.693166732788086, "global_step": 12784, "epoch": 105} {"train_loss": -26.288965225219727, "global_step": 12785, "epoch": 105} {"train_loss": -26.222375869750977, "global_step": 12786, "epoch": 105} {"train_loss": -26.256412506103516, "global_step": 12787, "epoch": 105} {"train_loss": -26.100940704345703, "global_step": 12788, "epoch": 105} {"train_loss": -26.255598068237305, "global_step": 12789, "epoch": 105} {"train_loss": -26.53236198425293, "global_step": 12790, "epoch": 105} {"train_loss": -26.37879753112793, "global_step": 12791, "epoch": 105} {"train_loss": -26.247730255126953, "global_step": 12792, "epoch": 105} {"train_loss": -26.500106811523438, "global_step": 12793, "epoch": 105} {"train_loss": -26.477197647094727, "global_step": 12794, "epoch": 105} {"train_loss": -26.14333152770996, "global_step": 12795, "epoch": 105} {"train_loss": -26.782413482666016, "global_step": 12796, "epoch": 105} {"train_loss": -26.4197940826416, "global_step": 12797, "epoch": 105} {"train_loss": -26.165912628173828, "global_step": 12798, "epoch": 105} {"train_loss": -26.35697364807129, "global_step": 12799, "epoch": 105} {"train_loss": -27.16908073425293, "global_step": 12800, "epoch": 105} {"train_loss": -26.88177490234375, "global_step": 12801, "epoch": 105} {"train_loss": -25.9818058013916, "global_step": 12802, "epoch": 105} {"train_loss": -25.517961502075195, "global_step": 12803, "epoch": 105} {"train_loss": -22.36233901977539, "global_step": 12804, "epoch": 105} {"train_loss": -22.67292022705078, "global_step": 12805, "epoch": 105} {"train_loss": -25.6716251373291, "global_step": 12806, "epoch": 105} {"train_loss": -25.37860679626465, "global_step": 12807, "epoch": 105} {"train_loss": -25.346866607666016, "global_step": 12808, "epoch": 105} {"train_loss": -26.035400390625, "global_step": 12809, "epoch": 105} {"train_loss": -24.095157623291016, "global_step": 12810, "epoch": 105} {"train_loss": -24.95511245727539, "global_step": 12811, "epoch": 105} {"train_loss": -25.688562393188477, "global_step": 12812, "epoch": 105} {"train_loss": -25.25063133239746, "global_step": 12813, "epoch": 105} {"train_loss": -25.01283836364746, "global_step": 12814, "epoch": 105} {"train_loss": -24.90508460998535, "global_step": 12815, "epoch": 105} {"train_loss": -25.407007217407227, "global_step": 12816, "epoch": 105} {"train_loss": -25.552406311035156, "global_step": 12817, "epoch": 105} {"train_loss": -25.388843536376953, "global_step": 12818, "epoch": 105} {"train_loss": -24.993473052978516, "global_step": 12819, "epoch": 105} {"train_loss": -26.249685287475586, "global_step": 12820, "epoch": 105} {"train_loss": -25.805334091186523, "global_step": 12821, "epoch": 105} {"train_loss": -26.169153213500977, "global_step": 12822, "epoch": 105} {"train_loss": -25.57771110534668, "global_step": 12823, "epoch": 105} {"train_loss": -25.7967529296875, "global_step": 12824, "epoch": 105} {"train_loss": -25.543384977608675, "global_step": 12825, "epoch": 105, "val_loss": 2574008.25} {"train_loss": -26.286828994750977, "global_step": 12826, "epoch": 106} {"train_loss": -26.3365535736084, "global_step": 12827, "epoch": 106} {"train_loss": -26.48638343811035, "global_step": 12828, "epoch": 106} {"train_loss": -26.118375778198242, "global_step": 12829, "epoch": 106} {"train_loss": -26.010488510131836, "global_step": 12830, "epoch": 106} {"train_loss": -26.215112686157227, "global_step": 12831, "epoch": 106} {"train_loss": -26.0185604095459, "global_step": 12832, "epoch": 106} {"train_loss": -26.159290313720703, "global_step": 12833, "epoch": 106} {"train_loss": -26.233652114868164, "global_step": 12834, "epoch": 106} {"train_loss": -26.27900505065918, "global_step": 12835, "epoch": 106} {"train_loss": -26.589588165283203, "global_step": 12836, "epoch": 106} {"train_loss": -26.239206314086914, "global_step": 12837, "epoch": 106} {"train_loss": -26.228530883789062, "global_step": 12838, "epoch": 106} {"train_loss": -26.7386474609375, "global_step": 12839, "epoch": 106} {"train_loss": -26.610763549804688, "global_step": 12840, "epoch": 106} {"train_loss": -26.4892635345459, "global_step": 12841, "epoch": 106} {"train_loss": -26.32211685180664, "global_step": 12842, "epoch": 106} {"train_loss": -26.709516525268555, "global_step": 12843, "epoch": 106} {"train_loss": -26.373075485229492, "global_step": 12844, "epoch": 106} {"train_loss": -26.738910675048828, "global_step": 12845, "epoch": 106} {"train_loss": -26.748910903930664, "global_step": 12846, "epoch": 106} {"train_loss": -26.582691192626953, "global_step": 12847, "epoch": 106} {"train_loss": -26.793170928955078, "global_step": 12848, "epoch": 106} {"train_loss": -26.899877548217773, "global_step": 12849, "epoch": 106} {"train_loss": -26.771352767944336, "global_step": 12850, "epoch": 106} {"train_loss": -27.16985511779785, "global_step": 12851, "epoch": 106} {"train_loss": -26.558822631835938, "global_step": 12852, "epoch": 106} {"train_loss": -27.06878089904785, "global_step": 12853, "epoch": 106} {"train_loss": -26.453710556030273, "global_step": 12854, "epoch": 106} {"train_loss": -25.768030166625977, "global_step": 12855, "epoch": 106} {"train_loss": -25.19097900390625, "global_step": 12856, "epoch": 106} {"train_loss": -25.401098251342773, "global_step": 12857, "epoch": 106} {"train_loss": -26.01211929321289, "global_step": 12858, "epoch": 106} {"train_loss": -26.310346603393555, "global_step": 12859, "epoch": 106} {"train_loss": -26.62330436706543, "global_step": 12860, "epoch": 106} {"train_loss": -26.807846069335938, "global_step": 12861, "epoch": 106} {"train_loss": -25.856565475463867, "global_step": 12862, "epoch": 106} {"train_loss": -25.228015899658203, "global_step": 12863, "epoch": 106} {"train_loss": -25.206884384155273, "global_step": 12864, "epoch": 106} {"train_loss": -25.928089141845703, "global_step": 12865, "epoch": 106} {"train_loss": -26.811264038085938, "global_step": 12866, "epoch": 106} {"train_loss": -25.979970932006836, "global_step": 12867, "epoch": 106} {"train_loss": -24.65633773803711, "global_step": 12868, "epoch": 106} {"train_loss": -25.36089515686035, "global_step": 12869, "epoch": 106} {"train_loss": -26.767614364624023, "global_step": 12870, "epoch": 106} {"train_loss": -26.101104736328125, "global_step": 12871, "epoch": 106} {"train_loss": -25.941089630126953, "global_step": 12872, "epoch": 106} {"train_loss": -26.0822811126709, "global_step": 12873, "epoch": 106} {"train_loss": -26.140811920166016, "global_step": 12874, "epoch": 106} {"train_loss": -25.46492576599121, "global_step": 12875, "epoch": 106} {"train_loss": -26.1352596282959, "global_step": 12876, "epoch": 106} {"train_loss": -26.515356063842773, "global_step": 12877, "epoch": 106} {"train_loss": -25.541032791137695, "global_step": 12878, "epoch": 106} {"train_loss": -25.61496925354004, "global_step": 12879, "epoch": 106} {"train_loss": -26.341644287109375, "global_step": 12880, "epoch": 106} {"train_loss": -26.204025268554688, "global_step": 12881, "epoch": 106} {"train_loss": -26.7360897064209, "global_step": 12882, "epoch": 106} {"train_loss": -25.963109970092773, "global_step": 12883, "epoch": 106} {"train_loss": -26.763736724853516, "global_step": 12884, "epoch": 106} {"train_loss": -26.073535919189453, "global_step": 12885, "epoch": 106} {"train_loss": -26.100805282592773, "global_step": 12886, "epoch": 106} {"train_loss": -25.672819137573242, "global_step": 12887, "epoch": 106} {"train_loss": -24.845046997070312, "global_step": 12888, "epoch": 106} {"train_loss": -26.1735782623291, "global_step": 12889, "epoch": 106} {"train_loss": -25.68414306640625, "global_step": 12890, "epoch": 106} {"train_loss": -24.06296730041504, "global_step": 12891, "epoch": 106} {"train_loss": -26.053380966186523, "global_step": 12892, "epoch": 106} {"train_loss": -22.382749557495117, "global_step": 12893, "epoch": 106} {"train_loss": -26.057361602783203, "global_step": 12894, "epoch": 106} {"train_loss": -22.574905395507812, "global_step": 12895, "epoch": 106} {"train_loss": -26.256711959838867, "global_step": 12896, "epoch": 106} {"train_loss": -24.552717208862305, "global_step": 12897, "epoch": 106} {"train_loss": -25.382238388061523, "global_step": 12898, "epoch": 106} {"train_loss": -26.244672775268555, "global_step": 12899, "epoch": 106} {"train_loss": -24.685758590698242, "global_step": 12900, "epoch": 106} {"train_loss": -25.523099899291992, "global_step": 12901, "epoch": 106} {"train_loss": -26.494495391845703, "global_step": 12902, "epoch": 106} {"train_loss": -25.343236923217773, "global_step": 12903, "epoch": 106} {"train_loss": -25.458951950073242, "global_step": 12904, "epoch": 106} {"train_loss": -26.182592391967773, "global_step": 12905, "epoch": 106} {"train_loss": -26.471723556518555, "global_step": 12906, "epoch": 106} {"train_loss": -26.053190231323242, "global_step": 12907, "epoch": 106} {"train_loss": -26.38800621032715, "global_step": 12908, "epoch": 106} {"train_loss": -26.369226455688477, "global_step": 12909, "epoch": 106} {"train_loss": -25.992389678955078, "global_step": 12910, "epoch": 106} {"train_loss": -26.521869659423828, "global_step": 12911, "epoch": 106} {"train_loss": -26.351133346557617, "global_step": 12912, "epoch": 106} {"train_loss": -25.56163787841797, "global_step": 12913, "epoch": 106} {"train_loss": -26.313465118408203, "global_step": 12914, "epoch": 106} {"train_loss": -25.80859375, "global_step": 12915, "epoch": 106} {"train_loss": -25.663293838500977, "global_step": 12916, "epoch": 106} {"train_loss": -26.343114852905273, "global_step": 12917, "epoch": 106} {"train_loss": -25.132221221923828, "global_step": 12918, "epoch": 106} {"train_loss": -24.813858032226562, "global_step": 12919, "epoch": 106} {"train_loss": -26.604171752929688, "global_step": 12920, "epoch": 106} {"train_loss": -25.54855728149414, "global_step": 12921, "epoch": 106} {"train_loss": -24.20231056213379, "global_step": 12922, "epoch": 106} {"train_loss": -26.652616500854492, "global_step": 12923, "epoch": 106} {"train_loss": -25.68537712097168, "global_step": 12924, "epoch": 106} {"train_loss": -26.084192276000977, "global_step": 12925, "epoch": 106} {"train_loss": -25.678192138671875, "global_step": 12926, "epoch": 106} {"train_loss": -25.17170524597168, "global_step": 12927, "epoch": 106} {"train_loss": -26.861658096313477, "global_step": 12928, "epoch": 106} {"train_loss": -25.743085861206055, "global_step": 12929, "epoch": 106} {"train_loss": -26.187286376953125, "global_step": 12930, "epoch": 106} {"train_loss": -25.382612228393555, "global_step": 12931, "epoch": 106} {"train_loss": -26.48504638671875, "global_step": 12932, "epoch": 106} {"train_loss": -25.829492568969727, "global_step": 12933, "epoch": 106} {"train_loss": -25.952289581298828, "global_step": 12934, "epoch": 106} {"train_loss": -25.92677879333496, "global_step": 12935, "epoch": 106} {"train_loss": -25.524707794189453, "global_step": 12936, "epoch": 106} {"train_loss": -24.818204879760742, "global_step": 12937, "epoch": 106} {"train_loss": -25.856201171875, "global_step": 12938, "epoch": 106} {"train_loss": -26.17164421081543, "global_step": 12939, "epoch": 106} {"train_loss": -25.639089584350586, "global_step": 12940, "epoch": 106} {"train_loss": -26.205121994018555, "global_step": 12941, "epoch": 106} {"train_loss": -26.194610595703125, "global_step": 12942, "epoch": 106} {"train_loss": -25.920154571533203, "global_step": 12943, "epoch": 106} {"train_loss": -25.993793487548828, "global_step": 12944, "epoch": 106} {"train_loss": -25.021778106689453, "global_step": 12945, "epoch": 106} {"train_loss": -25.947671007518927, "global_step": 12946, "epoch": 106, "val_loss": 2686993.5} {"train_loss": -25.9816951751709, "global_step": 12947, "epoch": 107} {"train_loss": -26.21832847595215, "global_step": 12948, "epoch": 107} {"train_loss": -24.9110050201416, "global_step": 12949, "epoch": 107} {"train_loss": -25.742156982421875, "global_step": 12950, "epoch": 107} {"train_loss": -24.324081420898438, "global_step": 12951, "epoch": 107} {"train_loss": -25.654829025268555, "global_step": 12952, "epoch": 107} {"train_loss": -25.446632385253906, "global_step": 12953, "epoch": 107} {"train_loss": -25.761117935180664, "global_step": 12954, "epoch": 107} {"train_loss": -25.663909912109375, "global_step": 12955, "epoch": 107} {"train_loss": -26.383106231689453, "global_step": 12956, "epoch": 107} {"train_loss": -25.54522132873535, "global_step": 12957, "epoch": 107} {"train_loss": -25.30240249633789, "global_step": 12958, "epoch": 107} {"train_loss": -26.077472686767578, "global_step": 12959, "epoch": 107} {"train_loss": -25.40818977355957, "global_step": 12960, "epoch": 107} {"train_loss": -25.266286849975586, "global_step": 12961, "epoch": 107} {"train_loss": -25.811603546142578, "global_step": 12962, "epoch": 107} {"train_loss": -26.155731201171875, "global_step": 12963, "epoch": 107} {"train_loss": -25.388486862182617, "global_step": 12964, "epoch": 107} {"train_loss": -26.088336944580078, "global_step": 12965, "epoch": 107} {"train_loss": -25.69437599182129, "global_step": 12966, "epoch": 107} {"train_loss": -26.15616226196289, "global_step": 12967, "epoch": 107} {"train_loss": -25.860095977783203, "global_step": 12968, "epoch": 107} {"train_loss": -25.80250358581543, "global_step": 12969, "epoch": 107} {"train_loss": -26.049579620361328, "global_step": 12970, "epoch": 107} {"train_loss": -25.390384674072266, "global_step": 12971, "epoch": 107} {"train_loss": -26.580739974975586, "global_step": 12972, "epoch": 107} {"train_loss": -26.025720596313477, "global_step": 12973, "epoch": 107} {"train_loss": -26.170995712280273, "global_step": 12974, "epoch": 107} {"train_loss": -26.692914962768555, "global_step": 12975, "epoch": 107} {"train_loss": -26.743383407592773, "global_step": 12976, "epoch": 107} {"train_loss": -26.350126266479492, "global_step": 12977, "epoch": 107} {"train_loss": -26.689533233642578, "global_step": 12978, "epoch": 107} {"train_loss": -26.08575439453125, "global_step": 12979, "epoch": 107} {"train_loss": -26.212575912475586, "global_step": 12980, "epoch": 107} {"train_loss": -26.173648834228516, "global_step": 12981, "epoch": 107} {"train_loss": -26.43403434753418, "global_step": 12982, "epoch": 107} {"train_loss": -26.19610023498535, "global_step": 12983, "epoch": 107} {"train_loss": -26.4249324798584, "global_step": 12984, "epoch": 107} {"train_loss": -26.4665470123291, "global_step": 12985, "epoch": 107} {"train_loss": -26.748144149780273, "global_step": 12986, "epoch": 107} {"train_loss": -25.432449340820312, "global_step": 12987, "epoch": 107} {"train_loss": -26.021575927734375, "global_step": 12988, "epoch": 107} {"train_loss": -26.8039493560791, "global_step": 12989, "epoch": 107} {"train_loss": -26.096338272094727, "global_step": 12990, "epoch": 107} {"train_loss": -25.90375328063965, "global_step": 12991, "epoch": 107} {"train_loss": -26.642322540283203, "global_step": 12992, "epoch": 107} {"train_loss": -26.906005859375, "global_step": 12993, "epoch": 107} {"train_loss": -26.6546573638916, "global_step": 12994, "epoch": 107} {"train_loss": -26.038938522338867, "global_step": 12995, "epoch": 107} {"train_loss": -26.35337257385254, "global_step": 12996, "epoch": 107} {"train_loss": -26.418689727783203, "global_step": 12997, "epoch": 107} {"train_loss": -26.700580596923828, "global_step": 12998, "epoch": 107} {"train_loss": -25.8355712890625, "global_step": 12999, "epoch": 107} {"train_loss": -26.476428985595703, "global_step": 13000, "epoch": 107} {"train_loss": -26.863632202148438, "global_step": 13001, "epoch": 107} {"train_loss": -26.1914005279541, "global_step": 13002, "epoch": 107} {"train_loss": -26.352643966674805, "global_step": 13003, "epoch": 107} {"train_loss": -26.277572631835938, "global_step": 13004, "epoch": 107} {"train_loss": -26.823627471923828, "global_step": 13005, "epoch": 107} {"train_loss": -26.9614315032959, "global_step": 13006, "epoch": 107} {"train_loss": -26.17789649963379, "global_step": 13007, "epoch": 107} {"train_loss": -26.483572006225586, "global_step": 13008, "epoch": 107} {"train_loss": -26.53644371032715, "global_step": 13009, "epoch": 107} {"train_loss": -25.9859619140625, "global_step": 13010, "epoch": 107} {"train_loss": -25.8818359375, "global_step": 13011, "epoch": 107} {"train_loss": -26.036075592041016, "global_step": 13012, "epoch": 107} {"train_loss": -26.418781280517578, "global_step": 13013, "epoch": 107} {"train_loss": -26.348886489868164, "global_step": 13014, "epoch": 107} {"train_loss": -26.60064125061035, "global_step": 13015, "epoch": 107} {"train_loss": -26.870710372924805, "global_step": 13016, "epoch": 107} {"train_loss": -26.106409072875977, "global_step": 13017, "epoch": 107} {"train_loss": -25.310461044311523, "global_step": 13018, "epoch": 107} {"train_loss": -25.318275451660156, "global_step": 13019, "epoch": 107} {"train_loss": -26.54642105102539, "global_step": 13020, "epoch": 107} {"train_loss": -26.88437843322754, "global_step": 13021, "epoch": 107} {"train_loss": -25.97247886657715, "global_step": 13022, "epoch": 107} {"train_loss": -26.316675186157227, "global_step": 13023, "epoch": 107} {"train_loss": -26.621625900268555, "global_step": 13024, "epoch": 107} {"train_loss": -27.048192977905273, "global_step": 13025, "epoch": 107} {"train_loss": -26.44839859008789, "global_step": 13026, "epoch": 107} {"train_loss": -26.29730796813965, "global_step": 13027, "epoch": 107} {"train_loss": -26.569992065429688, "global_step": 13028, "epoch": 107} {"train_loss": -27.1437931060791, "global_step": 13029, "epoch": 107} {"train_loss": -26.684789657592773, "global_step": 13030, "epoch": 107} {"train_loss": -26.93570327758789, "global_step": 13031, "epoch": 107} {"train_loss": -26.47918128967285, "global_step": 13032, "epoch": 107} {"train_loss": -26.30462646484375, "global_step": 13033, "epoch": 107} {"train_loss": -27.34347915649414, "global_step": 13034, "epoch": 107} {"train_loss": -26.436582565307617, "global_step": 13035, "epoch": 107} {"train_loss": -26.375036239624023, "global_step": 13036, "epoch": 107} {"train_loss": -26.55877113342285, "global_step": 13037, "epoch": 107} {"train_loss": -26.164276123046875, "global_step": 13038, "epoch": 107} {"train_loss": -26.75249671936035, "global_step": 13039, "epoch": 107} {"train_loss": -26.524658203125, "global_step": 13040, "epoch": 107} {"train_loss": -26.72607421875, "global_step": 13041, "epoch": 107} {"train_loss": -25.616193771362305, "global_step": 13042, "epoch": 107} {"train_loss": -25.25119400024414, "global_step": 13043, "epoch": 107} {"train_loss": -25.260284423828125, "global_step": 13044, "epoch": 107} {"train_loss": -25.7316837310791, "global_step": 13045, "epoch": 107} {"train_loss": -26.335681915283203, "global_step": 13046, "epoch": 107} {"train_loss": -26.183536529541016, "global_step": 13047, "epoch": 107} {"train_loss": -27.15907096862793, "global_step": 13048, "epoch": 107} {"train_loss": -25.904211044311523, "global_step": 13049, "epoch": 107} {"train_loss": -27.050134658813477, "global_step": 13050, "epoch": 107} {"train_loss": -26.301721572875977, "global_step": 13051, "epoch": 107} {"train_loss": -26.235029220581055, "global_step": 13052, "epoch": 107} {"train_loss": -26.2874813079834, "global_step": 13053, "epoch": 107} {"train_loss": -26.421667098999023, "global_step": 13054, "epoch": 107} {"train_loss": -26.68303871154785, "global_step": 13055, "epoch": 107} {"train_loss": -25.687814712524414, "global_step": 13056, "epoch": 107} {"train_loss": -24.948057174682617, "global_step": 13057, "epoch": 107} {"train_loss": -25.539447784423828, "global_step": 13058, "epoch": 107} {"train_loss": -26.69883155822754, "global_step": 13059, "epoch": 107} {"train_loss": -26.067462921142578, "global_step": 13060, "epoch": 107} {"train_loss": -25.808490753173828, "global_step": 13061, "epoch": 107} {"train_loss": -27.11256217956543, "global_step": 13062, "epoch": 107} {"train_loss": -26.2469425201416, "global_step": 13063, "epoch": 107} {"train_loss": -26.111539840698242, "global_step": 13064, "epoch": 107} {"train_loss": -26.745834350585938, "global_step": 13065, "epoch": 107} {"train_loss": -26.58319664001465, "global_step": 13066, "epoch": 107} {"train_loss": -26.2107471434538, "global_step": 13067, "epoch": 107, "val_loss": 3229103.25} {"train_loss": -25.980981826782227, "global_step": 13068, "epoch": 108} {"train_loss": -26.748931884765625, "global_step": 13069, "epoch": 108} {"train_loss": -25.961246490478516, "global_step": 13070, "epoch": 108} {"train_loss": -24.571802139282227, "global_step": 13071, "epoch": 108} {"train_loss": -24.579975128173828, "global_step": 13072, "epoch": 108} {"train_loss": -25.358022689819336, "global_step": 13073, "epoch": 108} {"train_loss": -25.9548282623291, "global_step": 13074, "epoch": 108} {"train_loss": -26.4409236907959, "global_step": 13075, "epoch": 108} {"train_loss": -26.620920181274414, "global_step": 13076, "epoch": 108} {"train_loss": -26.169113159179688, "global_step": 13077, "epoch": 108} {"train_loss": -26.23441505432129, "global_step": 13078, "epoch": 108} {"train_loss": -27.171125411987305, "global_step": 13079, "epoch": 108} {"train_loss": -26.68696403503418, "global_step": 13080, "epoch": 108} {"train_loss": -26.654706954956055, "global_step": 13081, "epoch": 108} {"train_loss": -26.960805892944336, "global_step": 13082, "epoch": 108} {"train_loss": -26.573989868164062, "global_step": 13083, "epoch": 108} {"train_loss": -25.589441299438477, "global_step": 13084, "epoch": 108} {"train_loss": -26.1824893951416, "global_step": 13085, "epoch": 108} {"train_loss": -27.056324005126953, "global_step": 13086, "epoch": 108} {"train_loss": -26.480926513671875, "global_step": 13087, "epoch": 108} {"train_loss": -26.755035400390625, "global_step": 13088, "epoch": 108} {"train_loss": -26.4137020111084, "global_step": 13089, "epoch": 108} {"train_loss": -26.29334831237793, "global_step": 13090, "epoch": 108} {"train_loss": -26.391845703125, "global_step": 13091, "epoch": 108} {"train_loss": -26.898212432861328, "global_step": 13092, "epoch": 108} {"train_loss": -26.203414916992188, "global_step": 13093, "epoch": 108} {"train_loss": -26.91303825378418, "global_step": 13094, "epoch": 108} {"train_loss": -25.905364990234375, "global_step": 13095, "epoch": 108} {"train_loss": -26.474578857421875, "global_step": 13096, "epoch": 108} {"train_loss": -26.370046615600586, "global_step": 13097, "epoch": 108} {"train_loss": -25.728073120117188, "global_step": 13098, "epoch": 108} {"train_loss": -26.70660400390625, "global_step": 13099, "epoch": 108} {"train_loss": -25.0864315032959, "global_step": 13100, "epoch": 108} {"train_loss": -21.594633102416992, "global_step": 13101, "epoch": 108} {"train_loss": -16.910888671875, "global_step": 13102, "epoch": 108} {"train_loss": -21.278593063354492, "global_step": 13103, "epoch": 108} {"train_loss": -25.23341941833496, "global_step": 13104, "epoch": 108} {"train_loss": -23.799259185791016, "global_step": 13105, "epoch": 108} {"train_loss": -24.675094604492188, "global_step": 13106, "epoch": 108} {"train_loss": -26.066492080688477, "global_step": 13107, "epoch": 108} {"train_loss": -24.866628646850586, "global_step": 13108, "epoch": 108} {"train_loss": -25.174747467041016, "global_step": 13109, "epoch": 108} {"train_loss": -25.357572555541992, "global_step": 13110, "epoch": 108} {"train_loss": -25.55316734313965, "global_step": 13111, "epoch": 108} {"train_loss": -25.02320671081543, "global_step": 13112, "epoch": 108} {"train_loss": -24.741352081298828, "global_step": 13113, "epoch": 108} {"train_loss": -25.364973068237305, "global_step": 13114, "epoch": 108} {"train_loss": -25.50006675720215, "global_step": 13115, "epoch": 108} {"train_loss": -25.436933517456055, "global_step": 13116, "epoch": 108} {"train_loss": -25.729843139648438, "global_step": 13117, "epoch": 108} {"train_loss": -25.658246994018555, "global_step": 13118, "epoch": 108} {"train_loss": -25.563505172729492, "global_step": 13119, "epoch": 108} {"train_loss": -26.200489044189453, "global_step": 13120, "epoch": 108} {"train_loss": -25.558923721313477, "global_step": 13121, "epoch": 108} {"train_loss": -25.848663330078125, "global_step": 13122, "epoch": 108} {"train_loss": -26.07270622253418, "global_step": 13123, "epoch": 108} {"train_loss": -25.94956398010254, "global_step": 13124, "epoch": 108} {"train_loss": -25.80206298828125, "global_step": 13125, "epoch": 108} {"train_loss": -25.750722885131836, "global_step": 13126, "epoch": 108} {"train_loss": -25.707168579101562, "global_step": 13127, "epoch": 108} {"train_loss": -26.122589111328125, "global_step": 13128, "epoch": 108} {"train_loss": -25.857816696166992, "global_step": 13129, "epoch": 108} {"train_loss": -25.747777938842773, "global_step": 13130, "epoch": 108} {"train_loss": -26.11432456970215, "global_step": 13131, "epoch": 108} {"train_loss": -26.1071834564209, "global_step": 13132, "epoch": 108} {"train_loss": -26.123727798461914, "global_step": 13133, "epoch": 108} {"train_loss": -25.606592178344727, "global_step": 13134, "epoch": 108} {"train_loss": -25.996173858642578, "global_step": 13135, "epoch": 108} {"train_loss": -25.80122184753418, "global_step": 13136, "epoch": 108} {"train_loss": -25.158483505249023, "global_step": 13137, "epoch": 108} {"train_loss": -26.041309356689453, "global_step": 13138, "epoch": 108} {"train_loss": -26.20135498046875, "global_step": 13139, "epoch": 108} {"train_loss": -26.340911865234375, "global_step": 13140, "epoch": 108} {"train_loss": -25.888141632080078, "global_step": 13141, "epoch": 108} {"train_loss": -25.68958854675293, "global_step": 13142, "epoch": 108} {"train_loss": -25.264007568359375, "global_step": 13143, "epoch": 108} {"train_loss": -26.530996322631836, "global_step": 13144, "epoch": 108} {"train_loss": -25.99911880493164, "global_step": 13145, "epoch": 108} {"train_loss": -26.032556533813477, "global_step": 13146, "epoch": 108} {"train_loss": -26.05196189880371, "global_step": 13147, "epoch": 108} {"train_loss": -26.15235710144043, "global_step": 13148, "epoch": 108} {"train_loss": -26.702184677124023, "global_step": 13149, "epoch": 108} {"train_loss": -26.084970474243164, "global_step": 13150, "epoch": 108} {"train_loss": -25.758390426635742, "global_step": 13151, "epoch": 108} {"train_loss": -26.560049057006836, "global_step": 13152, "epoch": 108} {"train_loss": -26.471302032470703, "global_step": 13153, "epoch": 108} {"train_loss": -25.540708541870117, "global_step": 13154, "epoch": 108} {"train_loss": -26.13209342956543, "global_step": 13155, "epoch": 108} {"train_loss": -26.91302490234375, "global_step": 13156, "epoch": 108} {"train_loss": -26.4078311920166, "global_step": 13157, "epoch": 108} {"train_loss": -26.493743896484375, "global_step": 13158, "epoch": 108} {"train_loss": -26.185810089111328, "global_step": 13159, "epoch": 108} {"train_loss": -26.065702438354492, "global_step": 13160, "epoch": 108} {"train_loss": -25.94830322265625, "global_step": 13161, "epoch": 108} {"train_loss": -24.459903717041016, "global_step": 13162, "epoch": 108} {"train_loss": -21.942045211791992, "global_step": 13163, "epoch": 108} {"train_loss": -20.853607177734375, "global_step": 13164, "epoch": 108} {"train_loss": -26.06158447265625, "global_step": 13165, "epoch": 108} {"train_loss": -24.642108917236328, "global_step": 13166, "epoch": 108} {"train_loss": -19.201478958129883, "global_step": 13167, "epoch": 108} {"train_loss": -24.125, "global_step": 13168, "epoch": 108} {"train_loss": -25.877050399780273, "global_step": 13169, "epoch": 108} {"train_loss": -23.927406311035156, "global_step": 13170, "epoch": 108} {"train_loss": -25.765338897705078, "global_step": 13171, "epoch": 108} {"train_loss": -25.30190086364746, "global_step": 13172, "epoch": 108} {"train_loss": -25.37799644470215, "global_step": 13173, "epoch": 108} {"train_loss": -26.155988693237305, "global_step": 13174, "epoch": 108} {"train_loss": -24.987548828125, "global_step": 13175, "epoch": 108} {"train_loss": -26.404102325439453, "global_step": 13176, "epoch": 108} {"train_loss": -25.761627197265625, "global_step": 13177, "epoch": 108} {"train_loss": -26.373722076416016, "global_step": 13178, "epoch": 108} {"train_loss": -26.008167266845703, "global_step": 13179, "epoch": 108} {"train_loss": -25.97188377380371, "global_step": 13180, "epoch": 108} {"train_loss": -26.28523063659668, "global_step": 13181, "epoch": 108} {"train_loss": -26.042144775390625, "global_step": 13182, "epoch": 108} {"train_loss": -26.253448486328125, "global_step": 13183, "epoch": 108} {"train_loss": -26.427886962890625, "global_step": 13184, "epoch": 108} {"train_loss": -26.409337997436523, "global_step": 13185, "epoch": 108} {"train_loss": -26.115259170532227, "global_step": 13186, "epoch": 108} {"train_loss": -26.149106979370117, "global_step": 13187, "epoch": 108} {"train_loss": -25.633466137342218, "global_step": 13188, "epoch": 108, "val_loss": 2790211.25} {"train_loss": -26.035755157470703, "global_step": 13189, "epoch": 109} {"train_loss": -26.637914657592773, "global_step": 13190, "epoch": 109} {"train_loss": -26.215845108032227, "global_step": 13191, "epoch": 109} {"train_loss": -26.38165283203125, "global_step": 13192, "epoch": 109} {"train_loss": -26.3393611907959, "global_step": 13193, "epoch": 109} {"train_loss": -26.864978790283203, "global_step": 13194, "epoch": 109} {"train_loss": -26.259765625, "global_step": 13195, "epoch": 109} {"train_loss": -26.494352340698242, "global_step": 13196, "epoch": 109} {"train_loss": -26.799976348876953, "global_step": 13197, "epoch": 109} {"train_loss": -26.14507484436035, "global_step": 13198, "epoch": 109} {"train_loss": -27.058271408081055, "global_step": 13199, "epoch": 109} {"train_loss": -26.766803741455078, "global_step": 13200, "epoch": 109} {"train_loss": -26.577716827392578, "global_step": 13201, "epoch": 109} {"train_loss": -26.646146774291992, "global_step": 13202, "epoch": 109} {"train_loss": -26.723485946655273, "global_step": 13203, "epoch": 109} {"train_loss": -26.662805557250977, "global_step": 13204, "epoch": 109} {"train_loss": -26.651371002197266, "global_step": 13205, "epoch": 109} {"train_loss": -26.981481552124023, "global_step": 13206, "epoch": 109} {"train_loss": -26.376041412353516, "global_step": 13207, "epoch": 109} {"train_loss": -24.66849136352539, "global_step": 13208, "epoch": 109} {"train_loss": -23.63286781311035, "global_step": 13209, "epoch": 109} {"train_loss": -23.077396392822266, "global_step": 13210, "epoch": 109} {"train_loss": -25.362634658813477, "global_step": 13211, "epoch": 109} {"train_loss": -26.858755111694336, "global_step": 13212, "epoch": 109} {"train_loss": -24.807357788085938, "global_step": 13213, "epoch": 109} {"train_loss": -26.193872451782227, "global_step": 13214, "epoch": 109} {"train_loss": -26.290388107299805, "global_step": 13215, "epoch": 109} {"train_loss": -25.942703247070312, "global_step": 13216, "epoch": 109} {"train_loss": -26.747007369995117, "global_step": 13217, "epoch": 109} {"train_loss": -25.980289459228516, "global_step": 13218, "epoch": 109} {"train_loss": -26.889698028564453, "global_step": 13219, "epoch": 109} {"train_loss": -25.909475326538086, "global_step": 13220, "epoch": 109} {"train_loss": -26.164875030517578, "global_step": 13221, "epoch": 109} {"train_loss": -26.891218185424805, "global_step": 13222, "epoch": 109} {"train_loss": -25.66819190979004, "global_step": 13223, "epoch": 109} {"train_loss": -26.43465232849121, "global_step": 13224, "epoch": 109} {"train_loss": -26.5620059967041, "global_step": 13225, "epoch": 109} {"train_loss": -26.377172470092773, "global_step": 13226, "epoch": 109} {"train_loss": -26.882740020751953, "global_step": 13227, "epoch": 109} {"train_loss": -26.51630210876465, "global_step": 13228, "epoch": 109} {"train_loss": -26.122724533081055, "global_step": 13229, "epoch": 109} {"train_loss": -26.931379318237305, "global_step": 13230, "epoch": 109} {"train_loss": -26.487516403198242, "global_step": 13231, "epoch": 109} {"train_loss": -25.831220626831055, "global_step": 13232, "epoch": 109} {"train_loss": -25.89068031311035, "global_step": 13233, "epoch": 109} {"train_loss": -25.88469886779785, "global_step": 13234, "epoch": 109} {"train_loss": -26.153966903686523, "global_step": 13235, "epoch": 109} {"train_loss": -26.439300537109375, "global_step": 13236, "epoch": 109} {"train_loss": -26.518299102783203, "global_step": 13237, "epoch": 109} {"train_loss": -26.304044723510742, "global_step": 13238, "epoch": 109} {"train_loss": -26.6807861328125, "global_step": 13239, "epoch": 109} {"train_loss": -25.933988571166992, "global_step": 13240, "epoch": 109} {"train_loss": -25.4617919921875, "global_step": 13241, "epoch": 109} {"train_loss": -26.339981079101562, "global_step": 13242, "epoch": 109} {"train_loss": -26.28031349182129, "global_step": 13243, "epoch": 109} {"train_loss": -25.625782012939453, "global_step": 13244, "epoch": 109} {"train_loss": -26.981870651245117, "global_step": 13245, "epoch": 109} {"train_loss": -26.590564727783203, "global_step": 13246, "epoch": 109} {"train_loss": -26.938034057617188, "global_step": 13247, "epoch": 109} {"train_loss": -26.558576583862305, "global_step": 13248, "epoch": 109} {"train_loss": -26.59377098083496, "global_step": 13249, "epoch": 109} {"train_loss": -26.591907501220703, "global_step": 13250, "epoch": 109} {"train_loss": -26.769758224487305, "global_step": 13251, "epoch": 109} {"train_loss": -26.25819206237793, "global_step": 13252, "epoch": 109} {"train_loss": -26.479736328125, "global_step": 13253, "epoch": 109} {"train_loss": -26.83918571472168, "global_step": 13254, "epoch": 109} {"train_loss": -26.34916114807129, "global_step": 13255, "epoch": 109} {"train_loss": -26.794498443603516, "global_step": 13256, "epoch": 109} {"train_loss": -26.891706466674805, "global_step": 13257, "epoch": 109} {"train_loss": -26.921066284179688, "global_step": 13258, "epoch": 109} {"train_loss": -26.86016273498535, "global_step": 13259, "epoch": 109} {"train_loss": -26.693201065063477, "global_step": 13260, "epoch": 109} {"train_loss": -27.19943618774414, "global_step": 13261, "epoch": 109} {"train_loss": -26.227487564086914, "global_step": 13262, "epoch": 109} {"train_loss": -26.663366317749023, "global_step": 13263, "epoch": 109} {"train_loss": -26.71022605895996, "global_step": 13264, "epoch": 109} {"train_loss": -26.595367431640625, "global_step": 13265, "epoch": 109} {"train_loss": -27.002689361572266, "global_step": 13266, "epoch": 109} {"train_loss": -26.8035945892334, "global_step": 13267, "epoch": 109} {"train_loss": -27.188425064086914, "global_step": 13268, "epoch": 109} {"train_loss": -26.910367965698242, "global_step": 13269, "epoch": 109} {"train_loss": -27.29852867126465, "global_step": 13270, "epoch": 109} {"train_loss": -26.805896759033203, "global_step": 13271, "epoch": 109} {"train_loss": -27.394498825073242, "global_step": 13272, "epoch": 109} {"train_loss": -27.0251522064209, "global_step": 13273, "epoch": 109} {"train_loss": -26.858844757080078, "global_step": 13274, "epoch": 109} {"train_loss": -26.901763916015625, "global_step": 13275, "epoch": 109} {"train_loss": -26.871328353881836, "global_step": 13276, "epoch": 109} {"train_loss": -26.959447860717773, "global_step": 13277, "epoch": 109} {"train_loss": -27.138830184936523, "global_step": 13278, "epoch": 109} {"train_loss": -26.9848575592041, "global_step": 13279, "epoch": 109} {"train_loss": -27.12628173828125, "global_step": 13280, "epoch": 109} {"train_loss": -27.060489654541016, "global_step": 13281, "epoch": 109} {"train_loss": -27.308135986328125, "global_step": 13282, "epoch": 109} {"train_loss": -27.095396041870117, "global_step": 13283, "epoch": 109} {"train_loss": -26.451435089111328, "global_step": 13284, "epoch": 109} {"train_loss": -25.584394454956055, "global_step": 13285, "epoch": 109} {"train_loss": -27.57554054260254, "global_step": 13286, "epoch": 109} {"train_loss": -26.39528465270996, "global_step": 13287, "epoch": 109} {"train_loss": -26.679269790649414, "global_step": 13288, "epoch": 109} {"train_loss": -27.0459041595459, "global_step": 13289, "epoch": 109} {"train_loss": -27.335830688476562, "global_step": 13290, "epoch": 109} {"train_loss": -26.509906768798828, "global_step": 13291, "epoch": 109} {"train_loss": -27.244964599609375, "global_step": 13292, "epoch": 109} {"train_loss": -27.024930953979492, "global_step": 13293, "epoch": 109} {"train_loss": -27.21575927734375, "global_step": 13294, "epoch": 109} {"train_loss": -26.554962158203125, "global_step": 13295, "epoch": 109} {"train_loss": -23.6186580657959, "global_step": 13296, "epoch": 109} {"train_loss": -20.219411849975586, "global_step": 13297, "epoch": 109} {"train_loss": -18.8892822265625, "global_step": 13298, "epoch": 109} {"train_loss": -22.554460525512695, "global_step": 13299, "epoch": 109} {"train_loss": -26.171142578125, "global_step": 13300, "epoch": 109} {"train_loss": -22.948673248291016, "global_step": 13301, "epoch": 109} {"train_loss": -25.437177658081055, "global_step": 13302, "epoch": 109} {"train_loss": -25.445531845092773, "global_step": 13303, "epoch": 109} {"train_loss": -25.840478897094727, "global_step": 13304, "epoch": 109} {"train_loss": -24.78883934020996, "global_step": 13305, "epoch": 109} {"train_loss": -25.647470474243164, "global_step": 13306, "epoch": 109} {"train_loss": -24.76192283630371, "global_step": 13307, "epoch": 109} {"train_loss": -23.017166137695312, "global_step": 13308, "epoch": 109} {"train_loss": -26.20551221232769, "global_step": 13309, "epoch": 109, "val_loss": 2710346.0} {"train_loss": -25.7962703704834, "global_step": 13310, "epoch": 110} {"train_loss": -24.70375633239746, "global_step": 13311, "epoch": 110} {"train_loss": -25.769956588745117, "global_step": 13312, "epoch": 110} {"train_loss": -25.518659591674805, "global_step": 13313, "epoch": 110} {"train_loss": -26.082590103149414, "global_step": 13314, "epoch": 110} {"train_loss": -25.579938888549805, "global_step": 13315, "epoch": 110} {"train_loss": -25.542133331298828, "global_step": 13316, "epoch": 110} {"train_loss": -25.748559951782227, "global_step": 13317, "epoch": 110} {"train_loss": -25.73563575744629, "global_step": 13318, "epoch": 110} {"train_loss": -25.570419311523438, "global_step": 13319, "epoch": 110} {"train_loss": -25.687026977539062, "global_step": 13320, "epoch": 110} {"train_loss": -25.91470718383789, "global_step": 13321, "epoch": 110} {"train_loss": -26.201141357421875, "global_step": 13322, "epoch": 110} {"train_loss": -25.71149253845215, "global_step": 13323, "epoch": 110} {"train_loss": -26.02066421508789, "global_step": 13324, "epoch": 110} {"train_loss": -25.779499053955078, "global_step": 13325, "epoch": 110} {"train_loss": -25.961929321289062, "global_step": 13326, "epoch": 110} {"train_loss": -26.489486694335938, "global_step": 13327, "epoch": 110} {"train_loss": -26.108591079711914, "global_step": 13328, "epoch": 110} {"train_loss": -26.353906631469727, "global_step": 13329, "epoch": 110} {"train_loss": -26.5933895111084, "global_step": 13330, "epoch": 110} {"train_loss": -26.767765045166016, "global_step": 13331, "epoch": 110} {"train_loss": -26.706823348999023, "global_step": 13332, "epoch": 110} {"train_loss": -26.503324508666992, "global_step": 13333, "epoch": 110} {"train_loss": -26.831769943237305, "global_step": 13334, "epoch": 110} {"train_loss": -26.437530517578125, "global_step": 13335, "epoch": 110} {"train_loss": -26.711286544799805, "global_step": 13336, "epoch": 110} {"train_loss": -26.420263290405273, "global_step": 13337, "epoch": 110} {"train_loss": -26.73968505859375, "global_step": 13338, "epoch": 110} {"train_loss": -26.660049438476562, "global_step": 13339, "epoch": 110} {"train_loss": -27.010156631469727, "global_step": 13340, "epoch": 110} {"train_loss": -26.569360733032227, "global_step": 13341, "epoch": 110} {"train_loss": -26.718244552612305, "global_step": 13342, "epoch": 110} {"train_loss": -26.797494888305664, "global_step": 13343, "epoch": 110} {"train_loss": -26.84762954711914, "global_step": 13344, "epoch": 110} {"train_loss": -26.880390167236328, "global_step": 13345, "epoch": 110} {"train_loss": -27.002851486206055, "global_step": 13346, "epoch": 110} {"train_loss": -26.69304847717285, "global_step": 13347, "epoch": 110} {"train_loss": -27.0330753326416, "global_step": 13348, "epoch": 110} {"train_loss": -27.03059196472168, "global_step": 13349, "epoch": 110} {"train_loss": -27.1269474029541, "global_step": 13350, "epoch": 110} {"train_loss": -27.334680557250977, "global_step": 13351, "epoch": 110} {"train_loss": -26.836355209350586, "global_step": 13352, "epoch": 110} {"train_loss": -27.239471435546875, "global_step": 13353, "epoch": 110} {"train_loss": -27.185155868530273, "global_step": 13354, "epoch": 110} {"train_loss": -26.353851318359375, "global_step": 13355, "epoch": 110} {"train_loss": -26.59806251525879, "global_step": 13356, "epoch": 110} {"train_loss": -26.631460189819336, "global_step": 13357, "epoch": 110} {"train_loss": -26.811370849609375, "global_step": 13358, "epoch": 110} {"train_loss": -27.182058334350586, "global_step": 13359, "epoch": 110} {"train_loss": -26.962858200073242, "global_step": 13360, "epoch": 110} {"train_loss": -26.665363311767578, "global_step": 13361, "epoch": 110} {"train_loss": -25.943378448486328, "global_step": 13362, "epoch": 110} {"train_loss": -24.218252182006836, "global_step": 13363, "epoch": 110} {"train_loss": -25.274606704711914, "global_step": 13364, "epoch": 110} {"train_loss": -25.321264266967773, "global_step": 13365, "epoch": 110} {"train_loss": -25.220355987548828, "global_step": 13366, "epoch": 110} {"train_loss": -26.29279136657715, "global_step": 13367, "epoch": 110} {"train_loss": -25.57282829284668, "global_step": 13368, "epoch": 110} {"train_loss": -25.373870849609375, "global_step": 13369, "epoch": 110} {"train_loss": -25.638330459594727, "global_step": 13370, "epoch": 110} {"train_loss": -24.58016014099121, "global_step": 13371, "epoch": 110} {"train_loss": -24.064605712890625, "global_step": 13372, "epoch": 110} {"train_loss": -25.794647216796875, "global_step": 13373, "epoch": 110} {"train_loss": -25.258874893188477, "global_step": 13374, "epoch": 110} {"train_loss": -24.68768882751465, "global_step": 13375, "epoch": 110} {"train_loss": -25.9871768951416, "global_step": 13376, "epoch": 110} {"train_loss": -26.028390884399414, "global_step": 13377, "epoch": 110} {"train_loss": -25.253950119018555, "global_step": 13378, "epoch": 110} {"train_loss": -26.60378074645996, "global_step": 13379, "epoch": 110} {"train_loss": -26.0319881439209, "global_step": 13380, "epoch": 110} {"train_loss": -26.17898941040039, "global_step": 13381, "epoch": 110} {"train_loss": -26.353302001953125, "global_step": 13382, "epoch": 110} {"train_loss": -25.844192504882812, "global_step": 13383, "epoch": 110} {"train_loss": -25.97627067565918, "global_step": 13384, "epoch": 110} {"train_loss": -26.24396324157715, "global_step": 13385, "epoch": 110} {"train_loss": -26.328901290893555, "global_step": 13386, "epoch": 110} {"train_loss": -26.431472778320312, "global_step": 13387, "epoch": 110} {"train_loss": -26.65449333190918, "global_step": 13388, "epoch": 110} {"train_loss": -26.454450607299805, "global_step": 13389, "epoch": 110} {"train_loss": -26.397104263305664, "global_step": 13390, "epoch": 110} {"train_loss": -26.278600692749023, "global_step": 13391, "epoch": 110} {"train_loss": -26.490629196166992, "global_step": 13392, "epoch": 110} {"train_loss": -26.50629997253418, "global_step": 13393, "epoch": 110} {"train_loss": -26.3092041015625, "global_step": 13394, "epoch": 110} {"train_loss": -26.940872192382812, "global_step": 13395, "epoch": 110} {"train_loss": -26.14948081970215, "global_step": 13396, "epoch": 110} {"train_loss": -27.088422775268555, "global_step": 13397, "epoch": 110} {"train_loss": -26.599294662475586, "global_step": 13398, "epoch": 110} {"train_loss": -26.165637969970703, "global_step": 13399, "epoch": 110} {"train_loss": -26.0196533203125, "global_step": 13400, "epoch": 110} {"train_loss": -26.7369327545166, "global_step": 13401, "epoch": 110} {"train_loss": -26.8381290435791, "global_step": 13402, "epoch": 110} {"train_loss": -26.3716983795166, "global_step": 13403, "epoch": 110} {"train_loss": -25.53536033630371, "global_step": 13404, "epoch": 110} {"train_loss": -26.60957908630371, "global_step": 13405, "epoch": 110} {"train_loss": -26.13521385192871, "global_step": 13406, "epoch": 110} {"train_loss": -26.301664352416992, "global_step": 13407, "epoch": 110} {"train_loss": -26.460113525390625, "global_step": 13408, "epoch": 110} {"train_loss": -26.21177101135254, "global_step": 13409, "epoch": 110} {"train_loss": -26.4793701171875, "global_step": 13410, "epoch": 110} {"train_loss": -26.17665672302246, "global_step": 13411, "epoch": 110} {"train_loss": -26.7678279876709, "global_step": 13412, "epoch": 110} {"train_loss": -26.959253311157227, "global_step": 13413, "epoch": 110} {"train_loss": -26.571516036987305, "global_step": 13414, "epoch": 110} {"train_loss": -26.5367374420166, "global_step": 13415, "epoch": 110} {"train_loss": -26.370914459228516, "global_step": 13416, "epoch": 110} {"train_loss": -26.389150619506836, "global_step": 13417, "epoch": 110} {"train_loss": -26.82583999633789, "global_step": 13418, "epoch": 110} {"train_loss": -25.956262588500977, "global_step": 13419, "epoch": 110} {"train_loss": -26.31460952758789, "global_step": 13420, "epoch": 110} {"train_loss": -25.04861068725586, "global_step": 13421, "epoch": 110} {"train_loss": -25.825286865234375, "global_step": 13422, "epoch": 110} {"train_loss": -26.43048667907715, "global_step": 13423, "epoch": 110} {"train_loss": -26.241485595703125, "global_step": 13424, "epoch": 110} {"train_loss": -26.999881744384766, "global_step": 13425, "epoch": 110} {"train_loss": -26.48463249206543, "global_step": 13426, "epoch": 110} {"train_loss": -27.151029586791992, "global_step": 13427, "epoch": 110} {"train_loss": -26.604665756225586, "global_step": 13428, "epoch": 110} {"train_loss": -26.709333419799805, "global_step": 13429, "epoch": 110} {"train_loss": -26.262933526157347, "global_step": 13430, "epoch": 110, "val_loss": 3030110.75} {"train_loss": -26.383880615234375, "global_step": 13431, "epoch": 111} {"train_loss": -26.241342544555664, "global_step": 13432, "epoch": 111} {"train_loss": -26.749731063842773, "global_step": 13433, "epoch": 111} {"train_loss": -27.175933837890625, "global_step": 13434, "epoch": 111} {"train_loss": -27.283552169799805, "global_step": 13435, "epoch": 111} {"train_loss": -27.14271354675293, "global_step": 13436, "epoch": 111} {"train_loss": -26.36325454711914, "global_step": 13437, "epoch": 111} {"train_loss": -27.56182289123535, "global_step": 13438, "epoch": 111} {"train_loss": -27.353052139282227, "global_step": 13439, "epoch": 111} {"train_loss": -26.688390731811523, "global_step": 13440, "epoch": 111} {"train_loss": -27.30925941467285, "global_step": 13441, "epoch": 111} {"train_loss": -26.776168823242188, "global_step": 13442, "epoch": 111} {"train_loss": -26.3898983001709, "global_step": 13443, "epoch": 111} {"train_loss": -25.20291519165039, "global_step": 13444, "epoch": 111} {"train_loss": -26.504743576049805, "global_step": 13445, "epoch": 111} {"train_loss": -26.32666015625, "global_step": 13446, "epoch": 111} {"train_loss": -26.85597038269043, "global_step": 13447, "epoch": 111} {"train_loss": -26.71514320373535, "global_step": 13448, "epoch": 111} {"train_loss": -26.596662521362305, "global_step": 13449, "epoch": 111} {"train_loss": -27.17506980895996, "global_step": 13450, "epoch": 111} {"train_loss": -26.606809616088867, "global_step": 13451, "epoch": 111} {"train_loss": -27.39896011352539, "global_step": 13452, "epoch": 111} {"train_loss": -26.930622100830078, "global_step": 13453, "epoch": 111} {"train_loss": -25.282453536987305, "global_step": 13454, "epoch": 111} {"train_loss": -24.709814071655273, "global_step": 13455, "epoch": 111} {"train_loss": -22.893329620361328, "global_step": 13456, "epoch": 111} {"train_loss": -25.71773338317871, "global_step": 13457, "epoch": 111} {"train_loss": -26.021848678588867, "global_step": 13458, "epoch": 111} {"train_loss": -25.279220581054688, "global_step": 13459, "epoch": 111} {"train_loss": -26.002532958984375, "global_step": 13460, "epoch": 111} {"train_loss": -25.63446044921875, "global_step": 13461, "epoch": 111} {"train_loss": -25.972137451171875, "global_step": 13462, "epoch": 111} {"train_loss": -26.426605224609375, "global_step": 13463, "epoch": 111} {"train_loss": -26.381479263305664, "global_step": 13464, "epoch": 111} {"train_loss": -26.45319938659668, "global_step": 13465, "epoch": 111} {"train_loss": -26.767444610595703, "global_step": 13466, "epoch": 111} {"train_loss": -27.100387573242188, "global_step": 13467, "epoch": 111} {"train_loss": -26.29511070251465, "global_step": 13468, "epoch": 111} {"train_loss": -26.18589210510254, "global_step": 13469, "epoch": 111} {"train_loss": -26.059167861938477, "global_step": 13470, "epoch": 111} {"train_loss": -26.754932403564453, "global_step": 13471, "epoch": 111} {"train_loss": -26.853696823120117, "global_step": 13472, "epoch": 111} {"train_loss": -26.81552505493164, "global_step": 13473, "epoch": 111} {"train_loss": -27.117578506469727, "global_step": 13474, "epoch": 111} {"train_loss": -26.827661514282227, "global_step": 13475, "epoch": 111} {"train_loss": -27.0759220123291, "global_step": 13476, "epoch": 111} {"train_loss": -26.81271743774414, "global_step": 13477, "epoch": 111} {"train_loss": -26.75971794128418, "global_step": 13478, "epoch": 111} {"train_loss": -26.508848190307617, "global_step": 13479, "epoch": 111} {"train_loss": -27.065420150756836, "global_step": 13480, "epoch": 111} {"train_loss": -27.094587326049805, "global_step": 13481, "epoch": 111} {"train_loss": -27.34598159790039, "global_step": 13482, "epoch": 111} {"train_loss": -27.48984146118164, "global_step": 13483, "epoch": 111} {"train_loss": -27.361785888671875, "global_step": 13484, "epoch": 111} {"train_loss": -27.5267276763916, "global_step": 13485, "epoch": 111} {"train_loss": -27.406835556030273, "global_step": 13486, "epoch": 111} {"train_loss": -27.19532585144043, "global_step": 13487, "epoch": 111} {"train_loss": -27.262725830078125, "global_step": 13488, "epoch": 111} {"train_loss": -26.995773315429688, "global_step": 13489, "epoch": 111} {"train_loss": -27.20161247253418, "global_step": 13490, "epoch": 111} {"train_loss": -26.186582565307617, "global_step": 13491, "epoch": 111} {"train_loss": -24.13701057434082, "global_step": 13492, "epoch": 111} {"train_loss": -18.269542694091797, "global_step": 13493, "epoch": 111} {"train_loss": -11.436979293823242, "global_step": 13494, "epoch": 111} {"train_loss": -17.57358169555664, "global_step": 13495, "epoch": 111} {"train_loss": -24.82944107055664, "global_step": 13496, "epoch": 111} {"train_loss": -20.994848251342773, "global_step": 13497, "epoch": 111} {"train_loss": -24.911033630371094, "global_step": 13498, "epoch": 111} {"train_loss": -26.024372100830078, "global_step": 13499, "epoch": 111} {"train_loss": -23.92207145690918, "global_step": 13500, "epoch": 111} {"train_loss": -25.19950294494629, "global_step": 13501, "epoch": 111} {"train_loss": -25.727252960205078, "global_step": 13502, "epoch": 111} {"train_loss": -25.776565551757812, "global_step": 13503, "epoch": 111} {"train_loss": -24.269216537475586, "global_step": 13504, "epoch": 111} {"train_loss": -25.089601516723633, "global_step": 13505, "epoch": 111} {"train_loss": -25.245054244995117, "global_step": 13506, "epoch": 111} {"train_loss": -26.249841690063477, "global_step": 13507, "epoch": 111} {"train_loss": -26.119312286376953, "global_step": 13508, "epoch": 111} {"train_loss": -25.996124267578125, "global_step": 13509, "epoch": 111} {"train_loss": -25.68434715270996, "global_step": 13510, "epoch": 111} {"train_loss": -25.79313087463379, "global_step": 13511, "epoch": 111} {"train_loss": -25.056310653686523, "global_step": 13512, "epoch": 111} {"train_loss": -25.913068771362305, "global_step": 13513, "epoch": 111} {"train_loss": -26.2194766998291, "global_step": 13514, "epoch": 111} {"train_loss": -26.166259765625, "global_step": 13515, "epoch": 111} {"train_loss": -26.138086318969727, "global_step": 13516, "epoch": 111} {"train_loss": -25.470643997192383, "global_step": 13517, "epoch": 111} {"train_loss": -26.32356071472168, "global_step": 13518, "epoch": 111} {"train_loss": -25.614227294921875, "global_step": 13519, "epoch": 111} {"train_loss": -26.0550537109375, "global_step": 13520, "epoch": 111} {"train_loss": -26.164045333862305, "global_step": 13521, "epoch": 111} {"train_loss": -26.025772094726562, "global_step": 13522, "epoch": 111} {"train_loss": -25.799436569213867, "global_step": 13523, "epoch": 111} {"train_loss": -25.79709243774414, "global_step": 13524, "epoch": 111} {"train_loss": -26.230010986328125, "global_step": 13525, "epoch": 111} {"train_loss": -25.981237411499023, "global_step": 13526, "epoch": 111} {"train_loss": -26.361557006835938, "global_step": 13527, "epoch": 111} {"train_loss": -26.134601593017578, "global_step": 13528, "epoch": 111} {"train_loss": -26.093061447143555, "global_step": 13529, "epoch": 111} {"train_loss": -26.3528995513916, "global_step": 13530, "epoch": 111} {"train_loss": -25.292160034179688, "global_step": 13531, "epoch": 111} {"train_loss": -25.81133460998535, "global_step": 13532, "epoch": 111} {"train_loss": -25.8384952545166, "global_step": 13533, "epoch": 111} {"train_loss": -25.79410743713379, "global_step": 13534, "epoch": 111} {"train_loss": -25.585309982299805, "global_step": 13535, "epoch": 111} {"train_loss": -25.87318229675293, "global_step": 13536, "epoch": 111} {"train_loss": -26.317996978759766, "global_step": 13537, "epoch": 111} {"train_loss": -25.404666900634766, "global_step": 13538, "epoch": 111} {"train_loss": -25.579442977905273, "global_step": 13539, "epoch": 111} {"train_loss": -26.3773136138916, "global_step": 13540, "epoch": 111} {"train_loss": -25.683414459228516, "global_step": 13541, "epoch": 111} {"train_loss": -25.765243530273438, "global_step": 13542, "epoch": 111} {"train_loss": -24.65787124633789, "global_step": 13543, "epoch": 111} {"train_loss": -26.072561264038086, "global_step": 13544, "epoch": 111} {"train_loss": -25.289859771728516, "global_step": 13545, "epoch": 111} {"train_loss": -25.778751373291016, "global_step": 13546, "epoch": 111} {"train_loss": -26.231786727905273, "global_step": 13547, "epoch": 111} {"train_loss": -25.819787979125977, "global_step": 13548, "epoch": 111} {"train_loss": -25.20353126525879, "global_step": 13549, "epoch": 111} {"train_loss": -26.102872848510742, "global_step": 13550, "epoch": 111} {"train_loss": -25.866730335330175, "global_step": 13551, "epoch": 111, "val_loss": 2758137.75} {"train_loss": -26.207111358642578, "global_step": 13552, "epoch": 112} {"train_loss": -25.806884765625, "global_step": 13553, "epoch": 112} {"train_loss": -26.197717666625977, "global_step": 13554, "epoch": 112} {"train_loss": -25.855239868164062, "global_step": 13555, "epoch": 112} {"train_loss": -24.922855377197266, "global_step": 13556, "epoch": 112} {"train_loss": -25.391374588012695, "global_step": 13557, "epoch": 112} {"train_loss": -25.728445053100586, "global_step": 13558, "epoch": 112} {"train_loss": -26.181379318237305, "global_step": 13559, "epoch": 112} {"train_loss": -26.15694236755371, "global_step": 13560, "epoch": 112} {"train_loss": -25.91826820373535, "global_step": 13561, "epoch": 112} {"train_loss": -26.721765518188477, "global_step": 13562, "epoch": 112} {"train_loss": -25.762128829956055, "global_step": 13563, "epoch": 112} {"train_loss": -26.525775909423828, "global_step": 13564, "epoch": 112} {"train_loss": -25.777725219726562, "global_step": 13565, "epoch": 112} {"train_loss": -26.342060089111328, "global_step": 13566, "epoch": 112} {"train_loss": -26.389251708984375, "global_step": 13567, "epoch": 112} {"train_loss": -25.981733322143555, "global_step": 13568, "epoch": 112} {"train_loss": -26.092639923095703, "global_step": 13569, "epoch": 112} {"train_loss": -25.418054580688477, "global_step": 13570, "epoch": 112} {"train_loss": -25.58795166015625, "global_step": 13571, "epoch": 112} {"train_loss": -26.285511016845703, "global_step": 13572, "epoch": 112} {"train_loss": -25.863706588745117, "global_step": 13573, "epoch": 112} {"train_loss": -26.723363876342773, "global_step": 13574, "epoch": 112} {"train_loss": -26.102447509765625, "global_step": 13575, "epoch": 112} {"train_loss": -26.464345932006836, "global_step": 13576, "epoch": 112} {"train_loss": -26.21994972229004, "global_step": 13577, "epoch": 112} {"train_loss": -26.8189640045166, "global_step": 13578, "epoch": 112} {"train_loss": -26.46836280822754, "global_step": 13579, "epoch": 112} {"train_loss": -26.62021827697754, "global_step": 13580, "epoch": 112} {"train_loss": -26.764257431030273, "global_step": 13581, "epoch": 112} {"train_loss": -26.587615966796875, "global_step": 13582, "epoch": 112} {"train_loss": -26.7807559967041, "global_step": 13583, "epoch": 112} {"train_loss": -26.885852813720703, "global_step": 13584, "epoch": 112} {"train_loss": -26.92325782775879, "global_step": 13585, "epoch": 112} {"train_loss": -26.925222396850586, "global_step": 13586, "epoch": 112} {"train_loss": -27.00327491760254, "global_step": 13587, "epoch": 112} {"train_loss": -26.77741050720215, "global_step": 13588, "epoch": 112} {"train_loss": -26.93592643737793, "global_step": 13589, "epoch": 112} {"train_loss": -26.60715103149414, "global_step": 13590, "epoch": 112} {"train_loss": -26.240997314453125, "global_step": 13591, "epoch": 112} {"train_loss": -26.528472900390625, "global_step": 13592, "epoch": 112} {"train_loss": -27.07574462890625, "global_step": 13593, "epoch": 112} {"train_loss": -27.052175521850586, "global_step": 13594, "epoch": 112} {"train_loss": -26.64687156677246, "global_step": 13595, "epoch": 112} {"train_loss": -26.637109756469727, "global_step": 13596, "epoch": 112} {"train_loss": -26.8728084564209, "global_step": 13597, "epoch": 112} {"train_loss": -26.352359771728516, "global_step": 13598, "epoch": 112} {"train_loss": -27.110910415649414, "global_step": 13599, "epoch": 112} {"train_loss": -27.337759017944336, "global_step": 13600, "epoch": 112} {"train_loss": -26.854724884033203, "global_step": 13601, "epoch": 112} {"train_loss": -27.20734977722168, "global_step": 13602, "epoch": 112} {"train_loss": -27.058725357055664, "global_step": 13603, "epoch": 112} {"train_loss": -26.6914005279541, "global_step": 13604, "epoch": 112} {"train_loss": -26.538564682006836, "global_step": 13605, "epoch": 112} {"train_loss": -26.71040153503418, "global_step": 13606, "epoch": 112} {"train_loss": -26.807422637939453, "global_step": 13607, "epoch": 112} {"train_loss": -27.256118774414062, "global_step": 13608, "epoch": 112} {"train_loss": -26.22124671936035, "global_step": 13609, "epoch": 112} {"train_loss": -26.501005172729492, "global_step": 13610, "epoch": 112} {"train_loss": -25.941741943359375, "global_step": 13611, "epoch": 112} {"train_loss": -26.726062774658203, "global_step": 13612, "epoch": 112} {"train_loss": -26.456867218017578, "global_step": 13613, "epoch": 112} {"train_loss": -26.32619285583496, "global_step": 13614, "epoch": 112} {"train_loss": -26.310272216796875, "global_step": 13615, "epoch": 112} {"train_loss": -26.37839698791504, "global_step": 13616, "epoch": 112} {"train_loss": -26.2691593170166, "global_step": 13617, "epoch": 112} {"train_loss": -25.574966430664062, "global_step": 13618, "epoch": 112} {"train_loss": -26.204511642456055, "global_step": 13619, "epoch": 112} {"train_loss": -26.439191818237305, "global_step": 13620, "epoch": 112} {"train_loss": -27.180938720703125, "global_step": 13621, "epoch": 112} {"train_loss": -26.28342056274414, "global_step": 13622, "epoch": 112} {"train_loss": -26.743200302124023, "global_step": 13623, "epoch": 112} {"train_loss": -26.381498336791992, "global_step": 13624, "epoch": 112} {"train_loss": -26.36935806274414, "global_step": 13625, "epoch": 112} {"train_loss": -26.502197265625, "global_step": 13626, "epoch": 112} {"train_loss": -26.66963005065918, "global_step": 13627, "epoch": 112} {"train_loss": -26.83064079284668, "global_step": 13628, "epoch": 112} {"train_loss": -26.008901596069336, "global_step": 13629, "epoch": 112} {"train_loss": -26.955347061157227, "global_step": 13630, "epoch": 112} {"train_loss": -26.92054557800293, "global_step": 13631, "epoch": 112} {"train_loss": -26.758752822875977, "global_step": 13632, "epoch": 112} {"train_loss": -26.391162872314453, "global_step": 13633, "epoch": 112} {"train_loss": -26.013763427734375, "global_step": 13634, "epoch": 112} {"train_loss": -26.180112838745117, "global_step": 13635, "epoch": 112} {"train_loss": -26.517932891845703, "global_step": 13636, "epoch": 112} {"train_loss": -26.258832931518555, "global_step": 13637, "epoch": 112} {"train_loss": -25.81585121154785, "global_step": 13638, "epoch": 112} {"train_loss": -26.260746002197266, "global_step": 13639, "epoch": 112} {"train_loss": -26.63690757751465, "global_step": 13640, "epoch": 112} {"train_loss": -26.437341690063477, "global_step": 13641, "epoch": 112} {"train_loss": -26.190052032470703, "global_step": 13642, "epoch": 112} {"train_loss": -26.31146240234375, "global_step": 13643, "epoch": 112} {"train_loss": -26.84799575805664, "global_step": 13644, "epoch": 112} {"train_loss": -25.666196823120117, "global_step": 13645, "epoch": 112} {"train_loss": -23.341550827026367, "global_step": 13646, "epoch": 112} {"train_loss": -24.66073989868164, "global_step": 13647, "epoch": 112} {"train_loss": -26.396636962890625, "global_step": 13648, "epoch": 112} {"train_loss": -25.203189849853516, "global_step": 13649, "epoch": 112} {"train_loss": -25.073501586914062, "global_step": 13650, "epoch": 112} {"train_loss": -26.253808975219727, "global_step": 13651, "epoch": 112} {"train_loss": -25.86182975769043, "global_step": 13652, "epoch": 112} {"train_loss": -26.13327980041504, "global_step": 13653, "epoch": 112} {"train_loss": -26.0888614654541, "global_step": 13654, "epoch": 112} {"train_loss": -26.211334228515625, "global_step": 13655, "epoch": 112} {"train_loss": -26.7426700592041, "global_step": 13656, "epoch": 112} {"train_loss": -26.586746215820312, "global_step": 13657, "epoch": 112} {"train_loss": -26.692779541015625, "global_step": 13658, "epoch": 112} {"train_loss": -26.50139808654785, "global_step": 13659, "epoch": 112} {"train_loss": -26.675079345703125, "global_step": 13660, "epoch": 112} {"train_loss": -26.538843154907227, "global_step": 13661, "epoch": 112} {"train_loss": -27.028411865234375, "global_step": 13662, "epoch": 112} {"train_loss": -26.781171798706055, "global_step": 13663, "epoch": 112} {"train_loss": -26.65045166015625, "global_step": 13664, "epoch": 112} {"train_loss": -27.058435440063477, "global_step": 13665, "epoch": 112} {"train_loss": -27.21296501159668, "global_step": 13666, "epoch": 112} {"train_loss": -27.0134220123291, "global_step": 13667, "epoch": 112} {"train_loss": -27.006977081298828, "global_step": 13668, "epoch": 112} {"train_loss": -27.591150283813477, "global_step": 13669, "epoch": 112} {"train_loss": -26.769195556640625, "global_step": 13670, "epoch": 112} {"train_loss": -27.236438751220703, "global_step": 13671, "epoch": 112} {"train_loss": -26.419319925229413, "global_step": 13672, "epoch": 112, "val_loss": 2690631.0} {"train_loss": -27.13264274597168, "global_step": 13673, "epoch": 113} {"train_loss": -27.454853057861328, "global_step": 13674, "epoch": 113} {"train_loss": -27.322309494018555, "global_step": 13675, "epoch": 113} {"train_loss": -27.42693519592285, "global_step": 13676, "epoch": 113} {"train_loss": -27.224185943603516, "global_step": 13677, "epoch": 113} {"train_loss": -27.53925132751465, "global_step": 13678, "epoch": 113} {"train_loss": -27.277795791625977, "global_step": 13679, "epoch": 113} {"train_loss": -26.778425216674805, "global_step": 13680, "epoch": 113} {"train_loss": -27.050012588500977, "global_step": 13681, "epoch": 113} {"train_loss": -27.836286544799805, "global_step": 13682, "epoch": 113} {"train_loss": -27.6359806060791, "global_step": 13683, "epoch": 113} {"train_loss": -27.749042510986328, "global_step": 13684, "epoch": 113} {"train_loss": -27.337366104125977, "global_step": 13685, "epoch": 113} {"train_loss": -26.980850219726562, "global_step": 13686, "epoch": 113} {"train_loss": -27.585779190063477, "global_step": 13687, "epoch": 113} {"train_loss": -27.35455894470215, "global_step": 13688, "epoch": 113} {"train_loss": -27.230945587158203, "global_step": 13689, "epoch": 113} {"train_loss": -27.270151138305664, "global_step": 13690, "epoch": 113} {"train_loss": -27.13080406188965, "global_step": 13691, "epoch": 113} {"train_loss": -27.17750358581543, "global_step": 13692, "epoch": 113} {"train_loss": -27.197675704956055, "global_step": 13693, "epoch": 113} {"train_loss": -27.571094512939453, "global_step": 13694, "epoch": 113} {"train_loss": -27.3326358795166, "global_step": 13695, "epoch": 113} {"train_loss": -26.81980323791504, "global_step": 13696, "epoch": 113} {"train_loss": -25.389081954956055, "global_step": 13697, "epoch": 113} {"train_loss": -22.70185661315918, "global_step": 13698, "epoch": 113} {"train_loss": -24.191022872924805, "global_step": 13699, "epoch": 113} {"train_loss": -27.0565242767334, "global_step": 13700, "epoch": 113} {"train_loss": -26.31024742126465, "global_step": 13701, "epoch": 113} {"train_loss": -25.595983505249023, "global_step": 13702, "epoch": 113} {"train_loss": -26.503828048706055, "global_step": 13703, "epoch": 113} {"train_loss": -26.845932006835938, "global_step": 13704, "epoch": 113} {"train_loss": -27.106414794921875, "global_step": 13705, "epoch": 113} {"train_loss": -27.011220932006836, "global_step": 13706, "epoch": 113} {"train_loss": -26.464689254760742, "global_step": 13707, "epoch": 113} {"train_loss": -26.33099937438965, "global_step": 13708, "epoch": 113} {"train_loss": -25.209156036376953, "global_step": 13709, "epoch": 113} {"train_loss": -26.003894805908203, "global_step": 13710, "epoch": 113} {"train_loss": -26.684497833251953, "global_step": 13711, "epoch": 113} {"train_loss": -27.061817169189453, "global_step": 13712, "epoch": 113} {"train_loss": -25.598432540893555, "global_step": 13713, "epoch": 113} {"train_loss": -25.649982452392578, "global_step": 13714, "epoch": 113} {"train_loss": -26.535369873046875, "global_step": 13715, "epoch": 113} {"train_loss": -26.3697509765625, "global_step": 13716, "epoch": 113} {"train_loss": -26.48147964477539, "global_step": 13717, "epoch": 113} {"train_loss": -26.6035099029541, "global_step": 13718, "epoch": 113} {"train_loss": -26.77693748474121, "global_step": 13719, "epoch": 113} {"train_loss": -26.14422607421875, "global_step": 13720, "epoch": 113} {"train_loss": -25.879566192626953, "global_step": 13721, "epoch": 113} {"train_loss": -26.75225830078125, "global_step": 13722, "epoch": 113} {"train_loss": -26.359342575073242, "global_step": 13723, "epoch": 113} {"train_loss": -26.974878311157227, "global_step": 13724, "epoch": 113} {"train_loss": -27.080280303955078, "global_step": 13725, "epoch": 113} {"train_loss": -26.567779541015625, "global_step": 13726, "epoch": 113} {"train_loss": -26.47376823425293, "global_step": 13727, "epoch": 113} {"train_loss": -26.2545108795166, "global_step": 13728, "epoch": 113} {"train_loss": -27.078367233276367, "global_step": 13729, "epoch": 113} {"train_loss": -26.622894287109375, "global_step": 13730, "epoch": 113} {"train_loss": -26.59437370300293, "global_step": 13731, "epoch": 113} {"train_loss": -26.167829513549805, "global_step": 13732, "epoch": 113} {"train_loss": -26.816404342651367, "global_step": 13733, "epoch": 113} {"train_loss": -26.60595703125, "global_step": 13734, "epoch": 113} {"train_loss": -26.76266860961914, "global_step": 13735, "epoch": 113} {"train_loss": -27.338775634765625, "global_step": 13736, "epoch": 113} {"train_loss": -26.989286422729492, "global_step": 13737, "epoch": 113} {"train_loss": -27.191009521484375, "global_step": 13738, "epoch": 113} {"train_loss": -26.785797119140625, "global_step": 13739, "epoch": 113} {"train_loss": -27.380828857421875, "global_step": 13740, "epoch": 113} {"train_loss": -27.061450958251953, "global_step": 13741, "epoch": 113} {"train_loss": -27.3588924407959, "global_step": 13742, "epoch": 113} {"train_loss": -27.255781173706055, "global_step": 13743, "epoch": 113} {"train_loss": -27.084264755249023, "global_step": 13744, "epoch": 113} {"train_loss": -26.873626708984375, "global_step": 13745, "epoch": 113} {"train_loss": -26.067031860351562, "global_step": 13746, "epoch": 113} {"train_loss": -25.188840866088867, "global_step": 13747, "epoch": 113} {"train_loss": -26.3356990814209, "global_step": 13748, "epoch": 113} {"train_loss": -26.874670028686523, "global_step": 13749, "epoch": 113} {"train_loss": -27.0490779876709, "global_step": 13750, "epoch": 113} {"train_loss": -26.310306549072266, "global_step": 13751, "epoch": 113} {"train_loss": -26.288076400756836, "global_step": 13752, "epoch": 113} {"train_loss": -27.423444747924805, "global_step": 13753, "epoch": 113} {"train_loss": -26.397998809814453, "global_step": 13754, "epoch": 113} {"train_loss": -24.434707641601562, "global_step": 13755, "epoch": 113} {"train_loss": -24.702693939208984, "global_step": 13756, "epoch": 113} {"train_loss": -26.0161075592041, "global_step": 13757, "epoch": 113} {"train_loss": -26.773696899414062, "global_step": 13758, "epoch": 113} {"train_loss": -26.64274024963379, "global_step": 13759, "epoch": 113} {"train_loss": -26.196142196655273, "global_step": 13760, "epoch": 113} {"train_loss": -27.139562606811523, "global_step": 13761, "epoch": 113} {"train_loss": -26.58369255065918, "global_step": 13762, "epoch": 113} {"train_loss": -27.15899085998535, "global_step": 13763, "epoch": 113} {"train_loss": -26.79134178161621, "global_step": 13764, "epoch": 113} {"train_loss": -26.409570693969727, "global_step": 13765, "epoch": 113} {"train_loss": -26.735248565673828, "global_step": 13766, "epoch": 113} {"train_loss": -27.001813888549805, "global_step": 13767, "epoch": 113} {"train_loss": -26.909961700439453, "global_step": 13768, "epoch": 113} {"train_loss": -27.104053497314453, "global_step": 13769, "epoch": 113} {"train_loss": -26.936298370361328, "global_step": 13770, "epoch": 113} {"train_loss": -26.938901901245117, "global_step": 13771, "epoch": 113} {"train_loss": -26.862430572509766, "global_step": 13772, "epoch": 113} {"train_loss": -27.29560661315918, "global_step": 13773, "epoch": 113} {"train_loss": -27.0548152923584, "global_step": 13774, "epoch": 113} {"train_loss": -27.662582397460938, "global_step": 13775, "epoch": 113} {"train_loss": -27.24295425415039, "global_step": 13776, "epoch": 113} {"train_loss": -27.257925033569336, "global_step": 13777, "epoch": 113} {"train_loss": -27.380002975463867, "global_step": 13778, "epoch": 113} {"train_loss": -27.061756134033203, "global_step": 13779, "epoch": 113} {"train_loss": -27.18558692932129, "global_step": 13780, "epoch": 113} {"train_loss": -27.08154296875, "global_step": 13781, "epoch": 113} {"train_loss": -26.695844650268555, "global_step": 13782, "epoch": 113} {"train_loss": -26.754093170166016, "global_step": 13783, "epoch": 113} {"train_loss": -26.198705673217773, "global_step": 13784, "epoch": 113} {"train_loss": -24.922048568725586, "global_step": 13785, "epoch": 113} {"train_loss": -24.896499633789062, "global_step": 13786, "epoch": 113} {"train_loss": -26.76901626586914, "global_step": 13787, "epoch": 113} {"train_loss": -26.717853546142578, "global_step": 13788, "epoch": 113} {"train_loss": -25.2678279876709, "global_step": 13789, "epoch": 113} {"train_loss": -27.03053092956543, "global_step": 13790, "epoch": 113} {"train_loss": -26.07759666442871, "global_step": 13791, "epoch": 113} {"train_loss": -24.50819969177246, "global_step": 13792, "epoch": 113} {"train_loss": -26.652287475333726, "global_step": 13793, "epoch": 113, "val_loss": 2735736.25} {"train_loss": -26.44191551208496, "global_step": 13794, "epoch": 114} {"train_loss": -26.35658836364746, "global_step": 13795, "epoch": 114} {"train_loss": -27.262042999267578, "global_step": 13796, "epoch": 114} {"train_loss": -26.517126083374023, "global_step": 13797, "epoch": 114} {"train_loss": -26.481658935546875, "global_step": 13798, "epoch": 114} {"train_loss": -27.375097274780273, "global_step": 13799, "epoch": 114} {"train_loss": -26.702219009399414, "global_step": 13800, "epoch": 114} {"train_loss": -26.834543228149414, "global_step": 13801, "epoch": 114} {"train_loss": -27.323240280151367, "global_step": 13802, "epoch": 114} {"train_loss": -27.114362716674805, "global_step": 13803, "epoch": 114} {"train_loss": -26.771224975585938, "global_step": 13804, "epoch": 114} {"train_loss": -27.1430606842041, "global_step": 13805, "epoch": 114} {"train_loss": -27.341251373291016, "global_step": 13806, "epoch": 114} {"train_loss": -26.906280517578125, "global_step": 13807, "epoch": 114} {"train_loss": -27.66106605529785, "global_step": 13808, "epoch": 114} {"train_loss": -27.275772094726562, "global_step": 13809, "epoch": 114} {"train_loss": -27.474929809570312, "global_step": 13810, "epoch": 114} {"train_loss": -27.331165313720703, "global_step": 13811, "epoch": 114} {"train_loss": -27.199857711791992, "global_step": 13812, "epoch": 114} {"train_loss": -27.379199981689453, "global_step": 13813, "epoch": 114} {"train_loss": -27.34540367126465, "global_step": 13814, "epoch": 114} {"train_loss": -27.513803482055664, "global_step": 13815, "epoch": 114} {"train_loss": -27.4588680267334, "global_step": 13816, "epoch": 114} {"train_loss": -28.08001136779785, "global_step": 13817, "epoch": 114} {"train_loss": -27.691370010375977, "global_step": 13818, "epoch": 114} {"train_loss": -27.420440673828125, "global_step": 13819, "epoch": 114} {"train_loss": -27.505096435546875, "global_step": 13820, "epoch": 114} {"train_loss": -27.374658584594727, "global_step": 13821, "epoch": 114} {"train_loss": -27.660898208618164, "global_step": 13822, "epoch": 114} {"train_loss": -27.610010147094727, "global_step": 13823, "epoch": 114} {"train_loss": -26.843698501586914, "global_step": 13824, "epoch": 114} {"train_loss": -26.937591552734375, "global_step": 13825, "epoch": 114} {"train_loss": -27.049697875976562, "global_step": 13826, "epoch": 114} {"train_loss": -27.223575592041016, "global_step": 13827, "epoch": 114} {"train_loss": -27.0122013092041, "global_step": 13828, "epoch": 114} {"train_loss": -25.968061447143555, "global_step": 13829, "epoch": 114} {"train_loss": -27.74250602722168, "global_step": 13830, "epoch": 114} {"train_loss": -26.84575843811035, "global_step": 13831, "epoch": 114} {"train_loss": -27.316787719726562, "global_step": 13832, "epoch": 114} {"train_loss": -26.770034790039062, "global_step": 13833, "epoch": 114} {"train_loss": -27.469335556030273, "global_step": 13834, "epoch": 114} {"train_loss": -27.294086456298828, "global_step": 13835, "epoch": 114} {"train_loss": -27.5643310546875, "global_step": 13836, "epoch": 114} {"train_loss": -27.868717193603516, "global_step": 13837, "epoch": 114} {"train_loss": -27.80756950378418, "global_step": 13838, "epoch": 114} {"train_loss": -26.658252716064453, "global_step": 13839, "epoch": 114} {"train_loss": -25.239133834838867, "global_step": 13840, "epoch": 114} {"train_loss": -22.55392074584961, "global_step": 13841, "epoch": 114} {"train_loss": -20.663352966308594, "global_step": 13842, "epoch": 114} {"train_loss": -18.322494506835938, "global_step": 13843, "epoch": 114} {"train_loss": -19.715391159057617, "global_step": 13844, "epoch": 114} {"train_loss": -26.87442970275879, "global_step": 13845, "epoch": 114} {"train_loss": -25.053434371948242, "global_step": 13846, "epoch": 114} {"train_loss": -27.016937255859375, "global_step": 13847, "epoch": 114} {"train_loss": -25.174867630004883, "global_step": 13848, "epoch": 114} {"train_loss": -26.015838623046875, "global_step": 13849, "epoch": 114} {"train_loss": -24.567541122436523, "global_step": 13850, "epoch": 114} {"train_loss": -25.83396339416504, "global_step": 13851, "epoch": 114} {"train_loss": -26.59872817993164, "global_step": 13852, "epoch": 114} {"train_loss": -25.811328887939453, "global_step": 13853, "epoch": 114} {"train_loss": -26.552419662475586, "global_step": 13854, "epoch": 114} {"train_loss": -25.5158634185791, "global_step": 13855, "epoch": 114} {"train_loss": -25.866153717041016, "global_step": 13856, "epoch": 114} {"train_loss": -26.39276123046875, "global_step": 13857, "epoch": 114} {"train_loss": -26.154455184936523, "global_step": 13858, "epoch": 114} {"train_loss": -26.485029220581055, "global_step": 13859, "epoch": 114} {"train_loss": -26.176767349243164, "global_step": 13860, "epoch": 114} {"train_loss": -25.759618759155273, "global_step": 13861, "epoch": 114} {"train_loss": -27.008222579956055, "global_step": 13862, "epoch": 114} {"train_loss": -26.389404296875, "global_step": 13863, "epoch": 114} {"train_loss": -26.152008056640625, "global_step": 13864, "epoch": 114} {"train_loss": -26.874765396118164, "global_step": 13865, "epoch": 114} {"train_loss": -26.859716415405273, "global_step": 13866, "epoch": 114} {"train_loss": -26.797330856323242, "global_step": 13867, "epoch": 114} {"train_loss": -26.776565551757812, "global_step": 13868, "epoch": 114} {"train_loss": -26.768009185791016, "global_step": 13869, "epoch": 114} {"train_loss": -27.347991943359375, "global_step": 13870, "epoch": 114} {"train_loss": -26.7893123626709, "global_step": 13871, "epoch": 114} {"train_loss": -27.085657119750977, "global_step": 13872, "epoch": 114} {"train_loss": -26.6275691986084, "global_step": 13873, "epoch": 114} {"train_loss": -26.912023544311523, "global_step": 13874, "epoch": 114} {"train_loss": -26.624921798706055, "global_step": 13875, "epoch": 114} {"train_loss": -26.670312881469727, "global_step": 13876, "epoch": 114} {"train_loss": -26.97955894470215, "global_step": 13877, "epoch": 114} {"train_loss": -26.58979606628418, "global_step": 13878, "epoch": 114} {"train_loss": -26.5887393951416, "global_step": 13879, "epoch": 114} {"train_loss": -26.747411727905273, "global_step": 13880, "epoch": 114} {"train_loss": -25.524555206298828, "global_step": 13881, "epoch": 114} {"train_loss": -22.23299217224121, "global_step": 13882, "epoch": 114} {"train_loss": -20.192895889282227, "global_step": 13883, "epoch": 114} {"train_loss": -24.844425201416016, "global_step": 13884, "epoch": 114} {"train_loss": -27.00245475769043, "global_step": 13885, "epoch": 114} {"train_loss": -24.039464950561523, "global_step": 13886, "epoch": 114} {"train_loss": -25.985305786132812, "global_step": 13887, "epoch": 114} {"train_loss": -24.424720764160156, "global_step": 13888, "epoch": 114} {"train_loss": -24.798086166381836, "global_step": 13889, "epoch": 114} {"train_loss": -24.261014938354492, "global_step": 13890, "epoch": 114} {"train_loss": -25.48917579650879, "global_step": 13891, "epoch": 114} {"train_loss": -23.69359588623047, "global_step": 13892, "epoch": 114} {"train_loss": -26.303558349609375, "global_step": 13893, "epoch": 114} {"train_loss": -24.630966186523438, "global_step": 13894, "epoch": 114} {"train_loss": -25.404598236083984, "global_step": 13895, "epoch": 114} {"train_loss": -26.4006404876709, "global_step": 13896, "epoch": 114} {"train_loss": -25.210163116455078, "global_step": 13897, "epoch": 114} {"train_loss": -26.886056900024414, "global_step": 13898, "epoch": 114} {"train_loss": -26.17463493347168, "global_step": 13899, "epoch": 114} {"train_loss": -26.16507911682129, "global_step": 13900, "epoch": 114} {"train_loss": -26.040363311767578, "global_step": 13901, "epoch": 114} {"train_loss": -26.098779678344727, "global_step": 13902, "epoch": 114} {"train_loss": -25.981115341186523, "global_step": 13903, "epoch": 114} {"train_loss": -26.412199020385742, "global_step": 13904, "epoch": 114} {"train_loss": -26.166213989257812, "global_step": 13905, "epoch": 114} {"train_loss": -26.400800704956055, "global_step": 13906, "epoch": 114} {"train_loss": -26.211957931518555, "global_step": 13907, "epoch": 114} {"train_loss": -27.001102447509766, "global_step": 13908, "epoch": 114} {"train_loss": -26.43478775024414, "global_step": 13909, "epoch": 114} {"train_loss": -26.64322853088379, "global_step": 13910, "epoch": 114} {"train_loss": -26.497644424438477, "global_step": 13911, "epoch": 114} {"train_loss": -25.860376358032227, "global_step": 13912, "epoch": 114} {"train_loss": -26.574262619018555, "global_step": 13913, "epoch": 114} {"train_loss": -26.252295438908348, "global_step": 13914, "epoch": 114, "val_loss": 3046440.75} {"train_loss": -24.144134521484375, "global_step": 13915, "epoch": 115} {"train_loss": -21.91373062133789, "global_step": 13916, "epoch": 115} {"train_loss": -25.243141174316406, "global_step": 13917, "epoch": 115} {"train_loss": -26.0103702545166, "global_step": 13918, "epoch": 115} {"train_loss": -24.283458709716797, "global_step": 13919, "epoch": 115} {"train_loss": -26.384206771850586, "global_step": 13920, "epoch": 115} {"train_loss": -25.0911808013916, "global_step": 13921, "epoch": 115} {"train_loss": -26.11555290222168, "global_step": 13922, "epoch": 115} {"train_loss": -26.177276611328125, "global_step": 13923, "epoch": 115} {"train_loss": -26.430673599243164, "global_step": 13924, "epoch": 115} {"train_loss": -26.47602653503418, "global_step": 13925, "epoch": 115} {"train_loss": -25.87369155883789, "global_step": 13926, "epoch": 115} {"train_loss": -26.72900390625, "global_step": 13927, "epoch": 115} {"train_loss": -26.422571182250977, "global_step": 13928, "epoch": 115} {"train_loss": -26.620960235595703, "global_step": 13929, "epoch": 115} {"train_loss": -26.6267147064209, "global_step": 13930, "epoch": 115} {"train_loss": -26.718124389648438, "global_step": 13931, "epoch": 115} {"train_loss": -26.73687171936035, "global_step": 13932, "epoch": 115} {"train_loss": -26.8033447265625, "global_step": 13933, "epoch": 115} {"train_loss": -26.6787109375, "global_step": 13934, "epoch": 115} {"train_loss": -26.974533081054688, "global_step": 13935, "epoch": 115} {"train_loss": -26.720661163330078, "global_step": 13936, "epoch": 115} {"train_loss": -26.654987335205078, "global_step": 13937, "epoch": 115} {"train_loss": -26.8295841217041, "global_step": 13938, "epoch": 115} {"train_loss": -26.909137725830078, "global_step": 13939, "epoch": 115} {"train_loss": -27.094465255737305, "global_step": 13940, "epoch": 115} {"train_loss": -27.058155059814453, "global_step": 13941, "epoch": 115} {"train_loss": -27.231313705444336, "global_step": 13942, "epoch": 115} {"train_loss": -27.164457321166992, "global_step": 13943, "epoch": 115} {"train_loss": -26.47210121154785, "global_step": 13944, "epoch": 115} {"train_loss": -27.280054092407227, "global_step": 13945, "epoch": 115} {"train_loss": -26.900360107421875, "global_step": 13946, "epoch": 115} {"train_loss": -27.179168701171875, "global_step": 13947, "epoch": 115} {"train_loss": -27.196029663085938, "global_step": 13948, "epoch": 115} {"train_loss": -27.23333740234375, "global_step": 13949, "epoch": 115} {"train_loss": -26.951398849487305, "global_step": 13950, "epoch": 115} {"train_loss": -26.85442543029785, "global_step": 13951, "epoch": 115} {"train_loss": -27.371809005737305, "global_step": 13952, "epoch": 115} {"train_loss": -27.27876091003418, "global_step": 13953, "epoch": 115} {"train_loss": -27.460205078125, "global_step": 13954, "epoch": 115} {"train_loss": -27.125608444213867, "global_step": 13955, "epoch": 115} {"train_loss": -27.4344425201416, "global_step": 13956, "epoch": 115} {"train_loss": -27.35773277282715, "global_step": 13957, "epoch": 115} {"train_loss": -27.4631404876709, "global_step": 13958, "epoch": 115} {"train_loss": -27.494232177734375, "global_step": 13959, "epoch": 115} {"train_loss": -27.27679443359375, "global_step": 13960, "epoch": 115} {"train_loss": -26.427160263061523, "global_step": 13961, "epoch": 115} {"train_loss": -27.62860107421875, "global_step": 13962, "epoch": 115} {"train_loss": -27.321929931640625, "global_step": 13963, "epoch": 115} {"train_loss": -27.387012481689453, "global_step": 13964, "epoch": 115} {"train_loss": -27.570449829101562, "global_step": 13965, "epoch": 115} {"train_loss": -27.75017738342285, "global_step": 13966, "epoch": 115} {"train_loss": -27.51313591003418, "global_step": 13967, "epoch": 115} {"train_loss": -27.153852462768555, "global_step": 13968, "epoch": 115} {"train_loss": -28.040313720703125, "global_step": 13969, "epoch": 115} {"train_loss": -27.85017204284668, "global_step": 13970, "epoch": 115} {"train_loss": -27.322362899780273, "global_step": 13971, "epoch": 115} {"train_loss": -27.908742904663086, "global_step": 13972, "epoch": 115} {"train_loss": -27.369129180908203, "global_step": 13973, "epoch": 115} {"train_loss": -27.71381187438965, "global_step": 13974, "epoch": 115} {"train_loss": -27.810644149780273, "global_step": 13975, "epoch": 115} {"train_loss": -27.5755672454834, "global_step": 13976, "epoch": 115} {"train_loss": -27.325626373291016, "global_step": 13977, "epoch": 115} {"train_loss": -27.58523941040039, "global_step": 13978, "epoch": 115} {"train_loss": -27.316492080688477, "global_step": 13979, "epoch": 115} {"train_loss": -27.564035415649414, "global_step": 13980, "epoch": 115} {"train_loss": -27.612430572509766, "global_step": 13981, "epoch": 115} {"train_loss": -27.666833877563477, "global_step": 13982, "epoch": 115} {"train_loss": -28.04532241821289, "global_step": 13983, "epoch": 115} {"train_loss": -28.05605125427246, "global_step": 13984, "epoch": 115} {"train_loss": -27.59156608581543, "global_step": 13985, "epoch": 115} {"train_loss": -27.51691246032715, "global_step": 13986, "epoch": 115} {"train_loss": -27.72177505493164, "global_step": 13987, "epoch": 115} {"train_loss": -27.84228515625, "global_step": 13988, "epoch": 115} {"train_loss": -27.2227725982666, "global_step": 13989, "epoch": 115} {"train_loss": -26.16887855529785, "global_step": 13990, "epoch": 115} {"train_loss": -22.953197479248047, "global_step": 13991, "epoch": 115} {"train_loss": -17.470869064331055, "global_step": 13992, "epoch": 115} {"train_loss": -9.459699630737305, "global_step": 13993, "epoch": 115} {"train_loss": -19.184429168701172, "global_step": 13994, "epoch": 115} {"train_loss": -23.9182186126709, "global_step": 13995, "epoch": 115} {"train_loss": -23.167137145996094, "global_step": 13996, "epoch": 115} {"train_loss": -23.245880126953125, "global_step": 13997, "epoch": 115} {"train_loss": -25.27436637878418, "global_step": 13998, "epoch": 115} {"train_loss": -24.858890533447266, "global_step": 13999, "epoch": 115} {"train_loss": -24.98310089111328, "global_step": 14000, "epoch": 115} {"train_loss": -24.561141967773438, "global_step": 14001, "epoch": 115} {"train_loss": -25.508750915527344, "global_step": 14002, "epoch": 115} {"train_loss": -26.246524810791016, "global_step": 14003, "epoch": 115} {"train_loss": -24.948293685913086, "global_step": 14004, "epoch": 115} {"train_loss": -25.613630294799805, "global_step": 14005, "epoch": 115} {"train_loss": -26.2545166015625, "global_step": 14006, "epoch": 115} {"train_loss": -25.876514434814453, "global_step": 14007, "epoch": 115} {"train_loss": -25.876081466674805, "global_step": 14008, "epoch": 115} {"train_loss": -25.675708770751953, "global_step": 14009, "epoch": 115} {"train_loss": -25.54929542541504, "global_step": 14010, "epoch": 115} {"train_loss": -25.39487075805664, "global_step": 14011, "epoch": 115} {"train_loss": -25.018081665039062, "global_step": 14012, "epoch": 115} {"train_loss": -25.57102394104004, "global_step": 14013, "epoch": 115} {"train_loss": -25.444631576538086, "global_step": 14014, "epoch": 115} {"train_loss": -26.674543380737305, "global_step": 14015, "epoch": 115} {"train_loss": -26.004398345947266, "global_step": 14016, "epoch": 115} {"train_loss": -25.625593185424805, "global_step": 14017, "epoch": 115} {"train_loss": -26.2148494720459, "global_step": 14018, "epoch": 115} {"train_loss": -25.52370262145996, "global_step": 14019, "epoch": 115} {"train_loss": -26.453479766845703, "global_step": 14020, "epoch": 115} {"train_loss": -26.91985511779785, "global_step": 14021, "epoch": 115} {"train_loss": -25.409482955932617, "global_step": 14022, "epoch": 115} {"train_loss": -26.0036563873291, "global_step": 14023, "epoch": 115} {"train_loss": -26.177831649780273, "global_step": 14024, "epoch": 115} {"train_loss": -25.832555770874023, "global_step": 14025, "epoch": 115} {"train_loss": -26.31363868713379, "global_step": 14026, "epoch": 115} {"train_loss": -26.290912628173828, "global_step": 14027, "epoch": 115} {"train_loss": -26.206968307495117, "global_step": 14028, "epoch": 115} {"train_loss": -25.032041549682617, "global_step": 14029, "epoch": 115} {"train_loss": -25.14635467529297, "global_step": 14030, "epoch": 115} {"train_loss": -25.916950225830078, "global_step": 14031, "epoch": 115} {"train_loss": -26.00721549987793, "global_step": 14032, "epoch": 115} {"train_loss": -26.46352195739746, "global_step": 14033, "epoch": 115} {"train_loss": -25.52585220336914, "global_step": 14034, "epoch": 115} {"train_loss": -26.16537207611336, "global_step": 14035, "epoch": 115, "val_loss": 2716837.75} {"train_loss": -26.114398956298828, "global_step": 14036, "epoch": 116} {"train_loss": -26.46881103515625, "global_step": 14037, "epoch": 116} {"train_loss": -26.320697784423828, "global_step": 14038, "epoch": 116} {"train_loss": -26.111013412475586, "global_step": 14039, "epoch": 116} {"train_loss": -26.2976131439209, "global_step": 14040, "epoch": 116} {"train_loss": -26.793561935424805, "global_step": 14041, "epoch": 116} {"train_loss": -26.191802978515625, "global_step": 14042, "epoch": 116} {"train_loss": -26.541839599609375, "global_step": 14043, "epoch": 116} {"train_loss": -26.435659408569336, "global_step": 14044, "epoch": 116} {"train_loss": -26.609054565429688, "global_step": 14045, "epoch": 116} {"train_loss": -26.6802978515625, "global_step": 14046, "epoch": 116} {"train_loss": -26.175024032592773, "global_step": 14047, "epoch": 116} {"train_loss": -26.264429092407227, "global_step": 14048, "epoch": 116} {"train_loss": -26.60471534729004, "global_step": 14049, "epoch": 116} {"train_loss": -26.370309829711914, "global_step": 14050, "epoch": 116} {"train_loss": -25.97197914123535, "global_step": 14051, "epoch": 116} {"train_loss": -26.789398193359375, "global_step": 14052, "epoch": 116} {"train_loss": -26.471677780151367, "global_step": 14053, "epoch": 116} {"train_loss": -25.901615142822266, "global_step": 14054, "epoch": 116} {"train_loss": -25.91943359375, "global_step": 14055, "epoch": 116} {"train_loss": -26.17298698425293, "global_step": 14056, "epoch": 116} {"train_loss": -27.079853057861328, "global_step": 14057, "epoch": 116} {"train_loss": -26.668445587158203, "global_step": 14058, "epoch": 116} {"train_loss": -26.14527702331543, "global_step": 14059, "epoch": 116} {"train_loss": -27.038156509399414, "global_step": 14060, "epoch": 116} {"train_loss": -26.908533096313477, "global_step": 14061, "epoch": 116} {"train_loss": -26.317920684814453, "global_step": 14062, "epoch": 116} {"train_loss": -26.842926025390625, "global_step": 14063, "epoch": 116} {"train_loss": -26.282785415649414, "global_step": 14064, "epoch": 116} {"train_loss": -26.67978858947754, "global_step": 14065, "epoch": 116} {"train_loss": -26.003889083862305, "global_step": 14066, "epoch": 116} {"train_loss": -26.602863311767578, "global_step": 14067, "epoch": 116} {"train_loss": -26.69685173034668, "global_step": 14068, "epoch": 116} {"train_loss": -26.766571044921875, "global_step": 14069, "epoch": 116} {"train_loss": -26.447986602783203, "global_step": 14070, "epoch": 116} {"train_loss": -26.75568199157715, "global_step": 14071, "epoch": 116} {"train_loss": -27.01649284362793, "global_step": 14072, "epoch": 116} {"train_loss": -27.018651962280273, "global_step": 14073, "epoch": 116} {"train_loss": -26.923181533813477, "global_step": 14074, "epoch": 116} {"train_loss": -27.027252197265625, "global_step": 14075, "epoch": 116} {"train_loss": -27.452682495117188, "global_step": 14076, "epoch": 116} {"train_loss": -26.845361709594727, "global_step": 14077, "epoch": 116} {"train_loss": -27.250751495361328, "global_step": 14078, "epoch": 116} {"train_loss": -26.404443740844727, "global_step": 14079, "epoch": 116} {"train_loss": -27.266305923461914, "global_step": 14080, "epoch": 116} {"train_loss": -26.52829933166504, "global_step": 14081, "epoch": 116} {"train_loss": -27.038089752197266, "global_step": 14082, "epoch": 116} {"train_loss": -26.43958854675293, "global_step": 14083, "epoch": 116} {"train_loss": -26.810285568237305, "global_step": 14084, "epoch": 116} {"train_loss": -26.721343994140625, "global_step": 14085, "epoch": 116} {"train_loss": -26.893890380859375, "global_step": 14086, "epoch": 116} {"train_loss": -26.42180824279785, "global_step": 14087, "epoch": 116} {"train_loss": -25.537778854370117, "global_step": 14088, "epoch": 116} {"train_loss": -25.108367919921875, "global_step": 14089, "epoch": 116} {"train_loss": -25.635074615478516, "global_step": 14090, "epoch": 116} {"train_loss": -26.489221572875977, "global_step": 14091, "epoch": 116} {"train_loss": -27.23847770690918, "global_step": 14092, "epoch": 116} {"train_loss": -24.665006637573242, "global_step": 14093, "epoch": 116} {"train_loss": -24.998306274414062, "global_step": 14094, "epoch": 116} {"train_loss": -26.11480140686035, "global_step": 14095, "epoch": 116} {"train_loss": -26.027454376220703, "global_step": 14096, "epoch": 116} {"train_loss": -26.435590744018555, "global_step": 14097, "epoch": 116} {"train_loss": -26.872644424438477, "global_step": 14098, "epoch": 116} {"train_loss": -25.42176628112793, "global_step": 14099, "epoch": 116} {"train_loss": -26.717493057250977, "global_step": 14100, "epoch": 116} {"train_loss": -26.20953941345215, "global_step": 14101, "epoch": 116} {"train_loss": -26.281646728515625, "global_step": 14102, "epoch": 116} {"train_loss": -26.499725341796875, "global_step": 14103, "epoch": 116} {"train_loss": -26.60255241394043, "global_step": 14104, "epoch": 116} {"train_loss": -27.442108154296875, "global_step": 14105, "epoch": 116} {"train_loss": -26.33729362487793, "global_step": 14106, "epoch": 116} {"train_loss": -26.295257568359375, "global_step": 14107, "epoch": 116} {"train_loss": -26.243139266967773, "global_step": 14108, "epoch": 116} {"train_loss": -26.981618881225586, "global_step": 14109, "epoch": 116} {"train_loss": -26.72857666015625, "global_step": 14110, "epoch": 116} {"train_loss": -26.538354873657227, "global_step": 14111, "epoch": 116} {"train_loss": -26.864059448242188, "global_step": 14112, "epoch": 116} {"train_loss": -26.87701988220215, "global_step": 14113, "epoch": 116} {"train_loss": -27.07710075378418, "global_step": 14114, "epoch": 116} {"train_loss": -26.57551383972168, "global_step": 14115, "epoch": 116} {"train_loss": -27.0056095123291, "global_step": 14116, "epoch": 116} {"train_loss": -26.9400634765625, "global_step": 14117, "epoch": 116} {"train_loss": -26.987781524658203, "global_step": 14118, "epoch": 116} {"train_loss": -27.184951782226562, "global_step": 14119, "epoch": 116} {"train_loss": -27.07792091369629, "global_step": 14120, "epoch": 116} {"train_loss": -27.117399215698242, "global_step": 14121, "epoch": 116} {"train_loss": -27.587966918945312, "global_step": 14122, "epoch": 116} {"train_loss": -26.65409278869629, "global_step": 14123, "epoch": 116} {"train_loss": -27.357776641845703, "global_step": 14124, "epoch": 116} {"train_loss": -27.051294326782227, "global_step": 14125, "epoch": 116} {"train_loss": -27.086963653564453, "global_step": 14126, "epoch": 116} {"train_loss": -27.199487686157227, "global_step": 14127, "epoch": 116} {"train_loss": -27.1909236907959, "global_step": 14128, "epoch": 116} {"train_loss": -26.8674259185791, "global_step": 14129, "epoch": 116} {"train_loss": -26.672285079956055, "global_step": 14130, "epoch": 116} {"train_loss": -25.96902847290039, "global_step": 14131, "epoch": 116} {"train_loss": -26.279190063476562, "global_step": 14132, "epoch": 116} {"train_loss": -25.54249382019043, "global_step": 14133, "epoch": 116} {"train_loss": -25.511423110961914, "global_step": 14134, "epoch": 116} {"train_loss": -25.858489990234375, "global_step": 14135, "epoch": 116} {"train_loss": -26.21026039123535, "global_step": 14136, "epoch": 116} {"train_loss": -25.939870834350586, "global_step": 14137, "epoch": 116} {"train_loss": -26.471094131469727, "global_step": 14138, "epoch": 116} {"train_loss": -25.887205123901367, "global_step": 14139, "epoch": 116} {"train_loss": -26.517425537109375, "global_step": 14140, "epoch": 116} {"train_loss": -25.82192039489746, "global_step": 14141, "epoch": 116} {"train_loss": -27.083393096923828, "global_step": 14142, "epoch": 116} {"train_loss": -26.053869247436523, "global_step": 14143, "epoch": 116} {"train_loss": -26.84421730041504, "global_step": 14144, "epoch": 116} {"train_loss": -26.3583927154541, "global_step": 14145, "epoch": 116} {"train_loss": -27.172449111938477, "global_step": 14146, "epoch": 116} {"train_loss": -26.571640014648438, "global_step": 14147, "epoch": 116} {"train_loss": -26.70884132385254, "global_step": 14148, "epoch": 116} {"train_loss": -26.507858276367188, "global_step": 14149, "epoch": 116} {"train_loss": -26.716999053955078, "global_step": 14150, "epoch": 116} {"train_loss": -27.570404052734375, "global_step": 14151, "epoch": 116} {"train_loss": -26.574726104736328, "global_step": 14152, "epoch": 116} {"train_loss": -26.784076690673828, "global_step": 14153, "epoch": 116} {"train_loss": -27.363330841064453, "global_step": 14154, "epoch": 116} {"train_loss": -27.125944137573242, "global_step": 14155, "epoch": 116} {"train_loss": -26.560848661690706, "global_step": 14156, "epoch": 116, "val_loss": 2901126.25} {"train_loss": -27.025714874267578, "global_step": 14157, "epoch": 117} {"train_loss": -27.001245498657227, "global_step": 14158, "epoch": 117} {"train_loss": -26.540435791015625, "global_step": 14159, "epoch": 117} {"train_loss": -26.539417266845703, "global_step": 14160, "epoch": 117} {"train_loss": -27.082117080688477, "global_step": 14161, "epoch": 117} {"train_loss": -27.568571090698242, "global_step": 14162, "epoch": 117} {"train_loss": -26.869375228881836, "global_step": 14163, "epoch": 117} {"train_loss": -26.612287521362305, "global_step": 14164, "epoch": 117} {"train_loss": -26.291065216064453, "global_step": 14165, "epoch": 117} {"train_loss": -26.4362735748291, "global_step": 14166, "epoch": 117} {"train_loss": -27.915546417236328, "global_step": 14167, "epoch": 117} {"train_loss": -27.356428146362305, "global_step": 14168, "epoch": 117} {"train_loss": -27.439071655273438, "global_step": 14169, "epoch": 117} {"train_loss": -27.4426326751709, "global_step": 14170, "epoch": 117} {"train_loss": -27.693754196166992, "global_step": 14171, "epoch": 117} {"train_loss": -27.4019832611084, "global_step": 14172, "epoch": 117} {"train_loss": -27.838031768798828, "global_step": 14173, "epoch": 117} {"train_loss": -27.833404541015625, "global_step": 14174, "epoch": 117} {"train_loss": -26.950414657592773, "global_step": 14175, "epoch": 117} {"train_loss": -25.028438568115234, "global_step": 14176, "epoch": 117} {"train_loss": -27.6528263092041, "global_step": 14177, "epoch": 117} {"train_loss": -26.238920211791992, "global_step": 14178, "epoch": 117} {"train_loss": -26.70263671875, "global_step": 14179, "epoch": 117} {"train_loss": -26.317764282226562, "global_step": 14180, "epoch": 117} {"train_loss": -27.369632720947266, "global_step": 14181, "epoch": 117} {"train_loss": -26.146387100219727, "global_step": 14182, "epoch": 117} {"train_loss": -26.723806381225586, "global_step": 14183, "epoch": 117} {"train_loss": -27.381927490234375, "global_step": 14184, "epoch": 117} {"train_loss": -26.7325439453125, "global_step": 14185, "epoch": 117} {"train_loss": -27.12677574157715, "global_step": 14186, "epoch": 117} {"train_loss": -27.574140548706055, "global_step": 14187, "epoch": 117} {"train_loss": -27.190214157104492, "global_step": 14188, "epoch": 117} {"train_loss": -27.595502853393555, "global_step": 14189, "epoch": 117} {"train_loss": -27.25412940979004, "global_step": 14190, "epoch": 117} {"train_loss": -27.631052017211914, "global_step": 14191, "epoch": 117} {"train_loss": -27.170896530151367, "global_step": 14192, "epoch": 117} {"train_loss": -27.41840934753418, "global_step": 14193, "epoch": 117} {"train_loss": -27.6456241607666, "global_step": 14194, "epoch": 117} {"train_loss": -27.245624542236328, "global_step": 14195, "epoch": 117} {"train_loss": -27.532501220703125, "global_step": 14196, "epoch": 117} {"train_loss": -27.97059440612793, "global_step": 14197, "epoch": 117} {"train_loss": -27.69986343383789, "global_step": 14198, "epoch": 117} {"train_loss": -27.50215721130371, "global_step": 14199, "epoch": 117} {"train_loss": -27.30544090270996, "global_step": 14200, "epoch": 117} {"train_loss": -27.472095489501953, "global_step": 14201, "epoch": 117} {"train_loss": -27.159591674804688, "global_step": 14202, "epoch": 117} {"train_loss": -27.663846969604492, "global_step": 14203, "epoch": 117} {"train_loss": -27.56776237487793, "global_step": 14204, "epoch": 117} {"train_loss": -27.789453506469727, "global_step": 14205, "epoch": 117} {"train_loss": -27.509763717651367, "global_step": 14206, "epoch": 117} {"train_loss": -27.379718780517578, "global_step": 14207, "epoch": 117} {"train_loss": -27.280195236206055, "global_step": 14208, "epoch": 117} {"train_loss": -27.460397720336914, "global_step": 14209, "epoch": 117} {"train_loss": -27.64759635925293, "global_step": 14210, "epoch": 117} {"train_loss": -27.064374923706055, "global_step": 14211, "epoch": 117} {"train_loss": -26.33854103088379, "global_step": 14212, "epoch": 117} {"train_loss": -26.09944725036621, "global_step": 14213, "epoch": 117} {"train_loss": -26.68997573852539, "global_step": 14214, "epoch": 117} {"train_loss": -26.441608428955078, "global_step": 14215, "epoch": 117} {"train_loss": -24.626623153686523, "global_step": 14216, "epoch": 117} {"train_loss": -23.94143295288086, "global_step": 14217, "epoch": 117} {"train_loss": -26.18115234375, "global_step": 14218, "epoch": 117} {"train_loss": -23.399559020996094, "global_step": 14219, "epoch": 117} {"train_loss": -24.138370513916016, "global_step": 14220, "epoch": 117} {"train_loss": -27.046966552734375, "global_step": 14221, "epoch": 117} {"train_loss": -23.825830459594727, "global_step": 14222, "epoch": 117} {"train_loss": -24.301000595092773, "global_step": 14223, "epoch": 117} {"train_loss": -24.589603424072266, "global_step": 14224, "epoch": 117} {"train_loss": -25.555383682250977, "global_step": 14225, "epoch": 117} {"train_loss": -24.878217697143555, "global_step": 14226, "epoch": 117} {"train_loss": -26.3306827545166, "global_step": 14227, "epoch": 117} {"train_loss": -25.181928634643555, "global_step": 14228, "epoch": 117} {"train_loss": -25.660003662109375, "global_step": 14229, "epoch": 117} {"train_loss": -25.522703170776367, "global_step": 14230, "epoch": 117} {"train_loss": -25.86384391784668, "global_step": 14231, "epoch": 117} {"train_loss": -26.650562286376953, "global_step": 14232, "epoch": 117} {"train_loss": -25.617069244384766, "global_step": 14233, "epoch": 117} {"train_loss": -25.62384033203125, "global_step": 14234, "epoch": 117} {"train_loss": -26.30875015258789, "global_step": 14235, "epoch": 117} {"train_loss": -25.671314239501953, "global_step": 14236, "epoch": 117} {"train_loss": -26.3365535736084, "global_step": 14237, "epoch": 117} {"train_loss": -25.692895889282227, "global_step": 14238, "epoch": 117} {"train_loss": -26.34077262878418, "global_step": 14239, "epoch": 117} {"train_loss": -25.481632232666016, "global_step": 14240, "epoch": 117} {"train_loss": -26.571460723876953, "global_step": 14241, "epoch": 117} {"train_loss": -26.633411407470703, "global_step": 14242, "epoch": 117} {"train_loss": -26.18269157409668, "global_step": 14243, "epoch": 117} {"train_loss": -26.455732345581055, "global_step": 14244, "epoch": 117} {"train_loss": -26.70464515686035, "global_step": 14245, "epoch": 117} {"train_loss": -26.523828506469727, "global_step": 14246, "epoch": 117} {"train_loss": -26.792621612548828, "global_step": 14247, "epoch": 117} {"train_loss": -26.310094833374023, "global_step": 14248, "epoch": 117} {"train_loss": -26.572484970092773, "global_step": 14249, "epoch": 117} {"train_loss": -26.856678009033203, "global_step": 14250, "epoch": 117} {"train_loss": -26.519367218017578, "global_step": 14251, "epoch": 117} {"train_loss": -26.954267501831055, "global_step": 14252, "epoch": 117} {"train_loss": -27.151580810546875, "global_step": 14253, "epoch": 117} {"train_loss": -26.631872177124023, "global_step": 14254, "epoch": 117} {"train_loss": -27.268844604492188, "global_step": 14255, "epoch": 117} {"train_loss": -26.57252311706543, "global_step": 14256, "epoch": 117} {"train_loss": -27.031085968017578, "global_step": 14257, "epoch": 117} {"train_loss": -27.197729110717773, "global_step": 14258, "epoch": 117} {"train_loss": -27.383121490478516, "global_step": 14259, "epoch": 117} {"train_loss": -26.815357208251953, "global_step": 14260, "epoch": 117} {"train_loss": -27.34735679626465, "global_step": 14261, "epoch": 117} {"train_loss": -27.474409103393555, "global_step": 14262, "epoch": 117} {"train_loss": -27.220932006835938, "global_step": 14263, "epoch": 117} {"train_loss": -26.769880294799805, "global_step": 14264, "epoch": 117} {"train_loss": -26.859638214111328, "global_step": 14265, "epoch": 117} {"train_loss": -26.083541870117188, "global_step": 14266, "epoch": 117} {"train_loss": -25.284765243530273, "global_step": 14267, "epoch": 117} {"train_loss": -23.3574161529541, "global_step": 14268, "epoch": 117} {"train_loss": -22.63440704345703, "global_step": 14269, "epoch": 117} {"train_loss": -22.978111267089844, "global_step": 14270, "epoch": 117} {"train_loss": -24.794300079345703, "global_step": 14271, "epoch": 117} {"train_loss": -26.977344512939453, "global_step": 14272, "epoch": 117} {"train_loss": -26.159509658813477, "global_step": 14273, "epoch": 117} {"train_loss": -27.06388282775879, "global_step": 14274, "epoch": 117} {"train_loss": -26.30042839050293, "global_step": 14275, "epoch": 117} {"train_loss": -27.051284790039062, "global_step": 14276, "epoch": 117} {"train_loss": -26.546321459052976, "global_step": 14277, "epoch": 117, "val_loss": 2595556.0} {"train_loss": -27.2653865814209, "global_step": 14278, "epoch": 118} {"train_loss": -26.428125381469727, "global_step": 14279, "epoch": 118} {"train_loss": -26.827117919921875, "global_step": 14280, "epoch": 118} {"train_loss": -26.558307647705078, "global_step": 14281, "epoch": 118} {"train_loss": -27.29193687438965, "global_step": 14282, "epoch": 118} {"train_loss": -27.105756759643555, "global_step": 14283, "epoch": 118} {"train_loss": -26.751205444335938, "global_step": 14284, "epoch": 118} {"train_loss": -27.151403427124023, "global_step": 14285, "epoch": 118} {"train_loss": -27.04949951171875, "global_step": 14286, "epoch": 118} {"train_loss": -27.17490577697754, "global_step": 14287, "epoch": 118} {"train_loss": -27.274612426757812, "global_step": 14288, "epoch": 118} {"train_loss": -27.011600494384766, "global_step": 14289, "epoch": 118} {"train_loss": -27.222309112548828, "global_step": 14290, "epoch": 118} {"train_loss": -27.149932861328125, "global_step": 14291, "epoch": 118} {"train_loss": -27.20370864868164, "global_step": 14292, "epoch": 118} {"train_loss": -26.76020622253418, "global_step": 14293, "epoch": 118} {"train_loss": -27.8319149017334, "global_step": 14294, "epoch": 118} {"train_loss": -27.0980281829834, "global_step": 14295, "epoch": 118} {"train_loss": -27.21771812438965, "global_step": 14296, "epoch": 118} {"train_loss": -27.40755271911621, "global_step": 14297, "epoch": 118} {"train_loss": -26.788869857788086, "global_step": 14298, "epoch": 118} {"train_loss": -27.3509464263916, "global_step": 14299, "epoch": 118} {"train_loss": -26.865049362182617, "global_step": 14300, "epoch": 118} {"train_loss": -27.029163360595703, "global_step": 14301, "epoch": 118} {"train_loss": -27.74519157409668, "global_step": 14302, "epoch": 118} {"train_loss": -27.476537704467773, "global_step": 14303, "epoch": 118} {"train_loss": -27.6278133392334, "global_step": 14304, "epoch": 118} {"train_loss": -27.78583335876465, "global_step": 14305, "epoch": 118} {"train_loss": -27.399091720581055, "global_step": 14306, "epoch": 118} {"train_loss": -26.95303726196289, "global_step": 14307, "epoch": 118} {"train_loss": -27.901296615600586, "global_step": 14308, "epoch": 118} {"train_loss": -27.141626358032227, "global_step": 14309, "epoch": 118} {"train_loss": -26.284133911132812, "global_step": 14310, "epoch": 118} {"train_loss": -26.234375, "global_step": 14311, "epoch": 118} {"train_loss": -27.25834083557129, "global_step": 14312, "epoch": 118} {"train_loss": -26.76604652404785, "global_step": 14313, "epoch": 118} {"train_loss": -26.737531661987305, "global_step": 14314, "epoch": 118} {"train_loss": -27.50845718383789, "global_step": 14315, "epoch": 118} {"train_loss": -27.08084487915039, "global_step": 14316, "epoch": 118} {"train_loss": -27.577320098876953, "global_step": 14317, "epoch": 118} {"train_loss": -26.97393226623535, "global_step": 14318, "epoch": 118} {"train_loss": -26.912494659423828, "global_step": 14319, "epoch": 118} {"train_loss": -26.792688369750977, "global_step": 14320, "epoch": 118} {"train_loss": -26.886350631713867, "global_step": 14321, "epoch": 118} {"train_loss": -27.518224716186523, "global_step": 14322, "epoch": 118} {"train_loss": -26.372772216796875, "global_step": 14323, "epoch": 118} {"train_loss": -25.795612335205078, "global_step": 14324, "epoch": 118} {"train_loss": -24.538116455078125, "global_step": 14325, "epoch": 118} {"train_loss": -23.2036190032959, "global_step": 14326, "epoch": 118} {"train_loss": -25.34030532836914, "global_step": 14327, "epoch": 118} {"train_loss": -26.858844757080078, "global_step": 14328, "epoch": 118} {"train_loss": -26.580448150634766, "global_step": 14329, "epoch": 118} {"train_loss": -26.339590072631836, "global_step": 14330, "epoch": 118} {"train_loss": -27.402753829956055, "global_step": 14331, "epoch": 118} {"train_loss": -26.837980270385742, "global_step": 14332, "epoch": 118} {"train_loss": -27.11799430847168, "global_step": 14333, "epoch": 118} {"train_loss": -27.169971466064453, "global_step": 14334, "epoch": 118} {"train_loss": -26.633161544799805, "global_step": 14335, "epoch": 118} {"train_loss": -27.404926300048828, "global_step": 14336, "epoch": 118} {"train_loss": -27.187152862548828, "global_step": 14337, "epoch": 118} {"train_loss": -27.537464141845703, "global_step": 14338, "epoch": 118} {"train_loss": -27.43934440612793, "global_step": 14339, "epoch": 118} {"train_loss": -27.63160514831543, "global_step": 14340, "epoch": 118} {"train_loss": -27.4261474609375, "global_step": 14341, "epoch": 118} {"train_loss": -27.596750259399414, "global_step": 14342, "epoch": 118} {"train_loss": -27.442432403564453, "global_step": 14343, "epoch": 118} {"train_loss": -27.475513458251953, "global_step": 14344, "epoch": 118} {"train_loss": -27.60759925842285, "global_step": 14345, "epoch": 118} {"train_loss": -27.31005859375, "global_step": 14346, "epoch": 118} {"train_loss": -27.569364547729492, "global_step": 14347, "epoch": 118} {"train_loss": -27.67506980895996, "global_step": 14348, "epoch": 118} {"train_loss": -27.441137313842773, "global_step": 14349, "epoch": 118} {"train_loss": -27.083593368530273, "global_step": 14350, "epoch": 118} {"train_loss": -27.49024772644043, "global_step": 14351, "epoch": 118} {"train_loss": -27.369665145874023, "global_step": 14352, "epoch": 118} {"train_loss": -26.983306884765625, "global_step": 14353, "epoch": 118} {"train_loss": -27.594818115234375, "global_step": 14354, "epoch": 118} {"train_loss": -28.08172607421875, "global_step": 14355, "epoch": 118} {"train_loss": -27.555133819580078, "global_step": 14356, "epoch": 118} {"train_loss": -27.551679611206055, "global_step": 14357, "epoch": 118} {"train_loss": -27.794025421142578, "global_step": 14358, "epoch": 118} {"train_loss": -27.840137481689453, "global_step": 14359, "epoch": 118} {"train_loss": -27.84454917907715, "global_step": 14360, "epoch": 118} {"train_loss": -27.4414005279541, "global_step": 14361, "epoch": 118} {"train_loss": -27.587812423706055, "global_step": 14362, "epoch": 118} {"train_loss": -27.69874382019043, "global_step": 14363, "epoch": 118} {"train_loss": -27.30561637878418, "global_step": 14364, "epoch": 118} {"train_loss": -28.09504508972168, "global_step": 14365, "epoch": 118} {"train_loss": -27.5751953125, "global_step": 14366, "epoch": 118} {"train_loss": -27.648273468017578, "global_step": 14367, "epoch": 118} {"train_loss": -27.902027130126953, "global_step": 14368, "epoch": 118} {"train_loss": -28.018701553344727, "global_step": 14369, "epoch": 118} {"train_loss": -27.527368545532227, "global_step": 14370, "epoch": 118} {"train_loss": -27.561063766479492, "global_step": 14371, "epoch": 118} {"train_loss": -26.696308135986328, "global_step": 14372, "epoch": 118} {"train_loss": -27.396215438842773, "global_step": 14373, "epoch": 118} {"train_loss": -27.808002471923828, "global_step": 14374, "epoch": 118} {"train_loss": -27.46512222290039, "global_step": 14375, "epoch": 118} {"train_loss": -27.436676025390625, "global_step": 14376, "epoch": 118} {"train_loss": -27.493457794189453, "global_step": 14377, "epoch": 118} {"train_loss": -27.274473190307617, "global_step": 14378, "epoch": 118} {"train_loss": -27.03705406188965, "global_step": 14379, "epoch": 118} {"train_loss": -27.21639060974121, "global_step": 14380, "epoch": 118} {"train_loss": -28.03216552734375, "global_step": 14381, "epoch": 118} {"train_loss": -26.703433990478516, "global_step": 14382, "epoch": 118} {"train_loss": -27.15863037109375, "global_step": 14383, "epoch": 118} {"train_loss": -27.10565757751465, "global_step": 14384, "epoch": 118} {"train_loss": -27.622394561767578, "global_step": 14385, "epoch": 118} {"train_loss": -27.42647361755371, "global_step": 14386, "epoch": 118} {"train_loss": -27.677953720092773, "global_step": 14387, "epoch": 118} {"train_loss": -27.081878662109375, "global_step": 14388, "epoch": 118} {"train_loss": -27.591266632080078, "global_step": 14389, "epoch": 118} {"train_loss": -27.550418853759766, "global_step": 14390, "epoch": 118} {"train_loss": -27.336599349975586, "global_step": 14391, "epoch": 118} {"train_loss": -27.90540885925293, "global_step": 14392, "epoch": 118} {"train_loss": -27.7938232421875, "global_step": 14393, "epoch": 118} {"train_loss": -27.418081283569336, "global_step": 14394, "epoch": 118} {"train_loss": -27.582910537719727, "global_step": 14395, "epoch": 118} {"train_loss": -27.545307159423828, "global_step": 14396, "epoch": 118} {"train_loss": -27.962329864501953, "global_step": 14397, "epoch": 118} {"train_loss": -27.223358280402568, "global_step": 14398, "epoch": 118, "val_loss": 2636979.5} {"train_loss": -26.740476608276367, "global_step": 14399, "epoch": 119} {"train_loss": -27.711109161376953, "global_step": 14400, "epoch": 119} {"train_loss": -27.667264938354492, "global_step": 14401, "epoch": 119} {"train_loss": -26.30885887145996, "global_step": 14402, "epoch": 119} {"train_loss": -22.939977645874023, "global_step": 14403, "epoch": 119} {"train_loss": -18.297107696533203, "global_step": 14404, "epoch": 119} {"train_loss": -19.06760025024414, "global_step": 14405, "epoch": 119} {"train_loss": -27.50221061706543, "global_step": 14406, "epoch": 119} {"train_loss": -24.58236312866211, "global_step": 14407, "epoch": 119} {"train_loss": -26.490039825439453, "global_step": 14408, "epoch": 119} {"train_loss": -26.6312255859375, "global_step": 14409, "epoch": 119} {"train_loss": -27.265125274658203, "global_step": 14410, "epoch": 119} {"train_loss": -26.167829513549805, "global_step": 14411, "epoch": 119} {"train_loss": -26.52153968811035, "global_step": 14412, "epoch": 119} {"train_loss": -26.989181518554688, "global_step": 14413, "epoch": 119} {"train_loss": -27.338977813720703, "global_step": 14414, "epoch": 119} {"train_loss": -27.042261123657227, "global_step": 14415, "epoch": 119} {"train_loss": -26.903736114501953, "global_step": 14416, "epoch": 119} {"train_loss": -26.95790672302246, "global_step": 14417, "epoch": 119} {"train_loss": -27.0237979888916, "global_step": 14418, "epoch": 119} {"train_loss": -25.94251823425293, "global_step": 14419, "epoch": 119} {"train_loss": -25.178205490112305, "global_step": 14420, "epoch": 119} {"train_loss": -23.886823654174805, "global_step": 14421, "epoch": 119} {"train_loss": -22.18045425415039, "global_step": 14422, "epoch": 119} {"train_loss": -23.55765151977539, "global_step": 14423, "epoch": 119} {"train_loss": -27.403564453125, "global_step": 14424, "epoch": 119} {"train_loss": -25.25548553466797, "global_step": 14425, "epoch": 119} {"train_loss": -24.44977378845215, "global_step": 14426, "epoch": 119} {"train_loss": -27.061630249023438, "global_step": 14427, "epoch": 119} {"train_loss": -25.195022583007812, "global_step": 14428, "epoch": 119} {"train_loss": -27.163869857788086, "global_step": 14429, "epoch": 119} {"train_loss": -25.485055923461914, "global_step": 14430, "epoch": 119} {"train_loss": -26.635583877563477, "global_step": 14431, "epoch": 119} {"train_loss": -26.06134605407715, "global_step": 14432, "epoch": 119} {"train_loss": -26.808807373046875, "global_step": 14433, "epoch": 119} {"train_loss": -26.525548934936523, "global_step": 14434, "epoch": 119} {"train_loss": -26.558670043945312, "global_step": 14435, "epoch": 119} {"train_loss": -26.63884925842285, "global_step": 14436, "epoch": 119} {"train_loss": -26.411773681640625, "global_step": 14437, "epoch": 119} {"train_loss": -25.921030044555664, "global_step": 14438, "epoch": 119} {"train_loss": -25.907276153564453, "global_step": 14439, "epoch": 119} {"train_loss": -26.458829879760742, "global_step": 14440, "epoch": 119} {"train_loss": -26.991744995117188, "global_step": 14441, "epoch": 119} {"train_loss": -27.228179931640625, "global_step": 14442, "epoch": 119} {"train_loss": -26.720407485961914, "global_step": 14443, "epoch": 119} {"train_loss": -27.1722354888916, "global_step": 14444, "epoch": 119} {"train_loss": -26.51618766784668, "global_step": 14445, "epoch": 119} {"train_loss": -25.62430763244629, "global_step": 14446, "epoch": 119} {"train_loss": -25.100252151489258, "global_step": 14447, "epoch": 119} {"train_loss": -26.439496994018555, "global_step": 14448, "epoch": 119} {"train_loss": -25.5257511138916, "global_step": 14449, "epoch": 119} {"train_loss": -25.395435333251953, "global_step": 14450, "epoch": 119} {"train_loss": -26.849714279174805, "global_step": 14451, "epoch": 119} {"train_loss": -26.31096839904785, "global_step": 14452, "epoch": 119} {"train_loss": -26.780805587768555, "global_step": 14453, "epoch": 119} {"train_loss": -26.455810546875, "global_step": 14454, "epoch": 119} {"train_loss": -27.426111221313477, "global_step": 14455, "epoch": 119} {"train_loss": -26.618850708007812, "global_step": 14456, "epoch": 119} {"train_loss": -26.7006893157959, "global_step": 14457, "epoch": 119} {"train_loss": -27.306562423706055, "global_step": 14458, "epoch": 119} {"train_loss": -26.876020431518555, "global_step": 14459, "epoch": 119} {"train_loss": -26.964879989624023, "global_step": 14460, "epoch": 119} {"train_loss": -26.95307731628418, "global_step": 14461, "epoch": 119} {"train_loss": -27.198699951171875, "global_step": 14462, "epoch": 119} {"train_loss": -26.91949462890625, "global_step": 14463, "epoch": 119} {"train_loss": -27.012475967407227, "global_step": 14464, "epoch": 119} {"train_loss": -26.846546173095703, "global_step": 14465, "epoch": 119} {"train_loss": -27.38165283203125, "global_step": 14466, "epoch": 119} {"train_loss": -27.419891357421875, "global_step": 14467, "epoch": 119} {"train_loss": -27.435932159423828, "global_step": 14468, "epoch": 119} {"train_loss": -27.24126625061035, "global_step": 14469, "epoch": 119} {"train_loss": -27.385465621948242, "global_step": 14470, "epoch": 119} {"train_loss": -27.43702507019043, "global_step": 14471, "epoch": 119} {"train_loss": -27.33524513244629, "global_step": 14472, "epoch": 119} {"train_loss": -26.741809844970703, "global_step": 14473, "epoch": 119} {"train_loss": -27.009485244750977, "global_step": 14474, "epoch": 119} {"train_loss": -26.92255973815918, "global_step": 14475, "epoch": 119} {"train_loss": -27.676084518432617, "global_step": 14476, "epoch": 119} {"train_loss": -26.44586753845215, "global_step": 14477, "epoch": 119} {"train_loss": -25.578353881835938, "global_step": 14478, "epoch": 119} {"train_loss": -26.760089874267578, "global_step": 14479, "epoch": 119} {"train_loss": -27.370718002319336, "global_step": 14480, "epoch": 119} {"train_loss": -26.534809112548828, "global_step": 14481, "epoch": 119} {"train_loss": -26.842920303344727, "global_step": 14482, "epoch": 119} {"train_loss": -27.44781494140625, "global_step": 14483, "epoch": 119} {"train_loss": -27.082189559936523, "global_step": 14484, "epoch": 119} {"train_loss": -27.1062068939209, "global_step": 14485, "epoch": 119} {"train_loss": -27.150136947631836, "global_step": 14486, "epoch": 119} {"train_loss": -27.11921501159668, "global_step": 14487, "epoch": 119} {"train_loss": -27.31982421875, "global_step": 14488, "epoch": 119} {"train_loss": -27.367706298828125, "global_step": 14489, "epoch": 119} {"train_loss": -27.593963623046875, "global_step": 14490, "epoch": 119} {"train_loss": -27.401016235351562, "global_step": 14491, "epoch": 119} {"train_loss": -27.211130142211914, "global_step": 14492, "epoch": 119} {"train_loss": -26.187253952026367, "global_step": 14493, "epoch": 119} {"train_loss": -27.540037155151367, "global_step": 14494, "epoch": 119} {"train_loss": -27.684112548828125, "global_step": 14495, "epoch": 119} {"train_loss": -27.179956436157227, "global_step": 14496, "epoch": 119} {"train_loss": -27.462549209594727, "global_step": 14497, "epoch": 119} {"train_loss": -27.440628051757812, "global_step": 14498, "epoch": 119} {"train_loss": -27.43482780456543, "global_step": 14499, "epoch": 119} {"train_loss": -27.440088272094727, "global_step": 14500, "epoch": 119} {"train_loss": -28.1118221282959, "global_step": 14501, "epoch": 119} {"train_loss": -27.485464096069336, "global_step": 14502, "epoch": 119} {"train_loss": -27.829648971557617, "global_step": 14503, "epoch": 119} {"train_loss": -27.311735153198242, "global_step": 14504, "epoch": 119} {"train_loss": -27.693830490112305, "global_step": 14505, "epoch": 119} {"train_loss": -27.782882690429688, "global_step": 14506, "epoch": 119} {"train_loss": -27.651899337768555, "global_step": 14507, "epoch": 119} {"train_loss": -27.62750244140625, "global_step": 14508, "epoch": 119} {"train_loss": -27.42787742614746, "global_step": 14509, "epoch": 119} {"train_loss": -27.394311904907227, "global_step": 14510, "epoch": 119} {"train_loss": -27.85441017150879, "global_step": 14511, "epoch": 119} {"train_loss": -27.908559799194336, "global_step": 14512, "epoch": 119} {"train_loss": -27.550886154174805, "global_step": 14513, "epoch": 119} {"train_loss": -27.570215225219727, "global_step": 14514, "epoch": 119} {"train_loss": -27.73480796813965, "global_step": 14515, "epoch": 119} {"train_loss": -28.058950424194336, "global_step": 14516, "epoch": 119} {"train_loss": -27.396198272705078, "global_step": 14517, "epoch": 119} {"train_loss": -27.616003036499023, "global_step": 14518, "epoch": 119} {"train_loss": -26.654141181756643, "global_step": 14519, "epoch": 119, "val_loss": 2654384.75} {"train_loss": -27.49444007873535, "global_step": 14520, "epoch": 120} {"train_loss": -27.68735694885254, "global_step": 14521, "epoch": 120} {"train_loss": -27.627735137939453, "global_step": 14522, "epoch": 120} {"train_loss": -27.421356201171875, "global_step": 14523, "epoch": 120} {"train_loss": -26.851587295532227, "global_step": 14524, "epoch": 120} {"train_loss": -27.69891929626465, "global_step": 14525, "epoch": 120} {"train_loss": -27.289947509765625, "global_step": 14526, "epoch": 120} {"train_loss": -28.028539657592773, "global_step": 14527, "epoch": 120} {"train_loss": -27.622297286987305, "global_step": 14528, "epoch": 120} {"train_loss": -27.553577423095703, "global_step": 14529, "epoch": 120} {"train_loss": -27.422788619995117, "global_step": 14530, "epoch": 120} {"train_loss": -28.172712326049805, "global_step": 14531, "epoch": 120} {"train_loss": -27.696765899658203, "global_step": 14532, "epoch": 120} {"train_loss": -27.451833724975586, "global_step": 14533, "epoch": 120} {"train_loss": -27.15390968322754, "global_step": 14534, "epoch": 120} {"train_loss": -25.644460678100586, "global_step": 14535, "epoch": 120} {"train_loss": -24.11945343017578, "global_step": 14536, "epoch": 120} {"train_loss": -24.00966453552246, "global_step": 14537, "epoch": 120} {"train_loss": -27.256494522094727, "global_step": 14538, "epoch": 120} {"train_loss": -26.757232666015625, "global_step": 14539, "epoch": 120} {"train_loss": -25.97186851501465, "global_step": 14540, "epoch": 120} {"train_loss": -25.74861717224121, "global_step": 14541, "epoch": 120} {"train_loss": -23.959253311157227, "global_step": 14542, "epoch": 120} {"train_loss": -25.274229049682617, "global_step": 14543, "epoch": 120} {"train_loss": -26.43397331237793, "global_step": 14544, "epoch": 120} {"train_loss": -25.793323516845703, "global_step": 14545, "epoch": 120} {"train_loss": -24.56854820251465, "global_step": 14546, "epoch": 120} {"train_loss": -25.172727584838867, "global_step": 14547, "epoch": 120} {"train_loss": -27.174713134765625, "global_step": 14548, "epoch": 120} {"train_loss": -26.5648193359375, "global_step": 14549, "epoch": 120} {"train_loss": -25.73569107055664, "global_step": 14550, "epoch": 120} {"train_loss": -27.487045288085938, "global_step": 14551, "epoch": 120} {"train_loss": -26.684980392456055, "global_step": 14552, "epoch": 120} {"train_loss": -27.07520866394043, "global_step": 14553, "epoch": 120} {"train_loss": -26.250656127929688, "global_step": 14554, "epoch": 120} {"train_loss": -27.14932632446289, "global_step": 14555, "epoch": 120} {"train_loss": -27.18497657775879, "global_step": 14556, "epoch": 120} {"train_loss": -26.86905288696289, "global_step": 14557, "epoch": 120} {"train_loss": -26.647375106811523, "global_step": 14558, "epoch": 120} {"train_loss": -27.117212295532227, "global_step": 14559, "epoch": 120} {"train_loss": -26.5804386138916, "global_step": 14560, "epoch": 120} {"train_loss": -27.2990665435791, "global_step": 14561, "epoch": 120} {"train_loss": -26.82254981994629, "global_step": 14562, "epoch": 120} {"train_loss": -26.987030029296875, "global_step": 14563, "epoch": 120} {"train_loss": -26.80161476135254, "global_step": 14564, "epoch": 120} {"train_loss": -26.938434600830078, "global_step": 14565, "epoch": 120} {"train_loss": -27.032947540283203, "global_step": 14566, "epoch": 120} {"train_loss": -27.208337783813477, "global_step": 14567, "epoch": 120} {"train_loss": -26.683822631835938, "global_step": 14568, "epoch": 120} {"train_loss": -27.49576759338379, "global_step": 14569, "epoch": 120} {"train_loss": -27.110441207885742, "global_step": 14570, "epoch": 120} {"train_loss": -27.224050521850586, "global_step": 14571, "epoch": 120} {"train_loss": -27.077905654907227, "global_step": 14572, "epoch": 120} {"train_loss": -27.49672508239746, "global_step": 14573, "epoch": 120} {"train_loss": -27.48994255065918, "global_step": 14574, "epoch": 120} {"train_loss": -27.559528350830078, "global_step": 14575, "epoch": 120} {"train_loss": -27.798847198486328, "global_step": 14576, "epoch": 120} {"train_loss": -27.621631622314453, "global_step": 14577, "epoch": 120} {"train_loss": -27.88176918029785, "global_step": 14578, "epoch": 120} {"train_loss": -27.77003288269043, "global_step": 14579, "epoch": 120} {"train_loss": -27.40647315979004, "global_step": 14580, "epoch": 120} {"train_loss": -26.910846710205078, "global_step": 14581, "epoch": 120} {"train_loss": -25.920825958251953, "global_step": 14582, "epoch": 120} {"train_loss": -26.545913696289062, "global_step": 14583, "epoch": 120} {"train_loss": -27.842578887939453, "global_step": 14584, "epoch": 120} {"train_loss": -27.378326416015625, "global_step": 14585, "epoch": 120} {"train_loss": -27.154773712158203, "global_step": 14586, "epoch": 120} {"train_loss": -27.562772750854492, "global_step": 14587, "epoch": 120} {"train_loss": -27.24281120300293, "global_step": 14588, "epoch": 120} {"train_loss": -26.805007934570312, "global_step": 14589, "epoch": 120} {"train_loss": -26.72787857055664, "global_step": 14590, "epoch": 120} {"train_loss": -26.3448543548584, "global_step": 14591, "epoch": 120} {"train_loss": -26.61273765563965, "global_step": 14592, "epoch": 120} {"train_loss": -26.992923736572266, "global_step": 14593, "epoch": 120} {"train_loss": -27.679767608642578, "global_step": 14594, "epoch": 120} {"train_loss": -27.461606979370117, "global_step": 14595, "epoch": 120} {"train_loss": -27.437515258789062, "global_step": 14596, "epoch": 120} {"train_loss": -27.389623641967773, "global_step": 14597, "epoch": 120} {"train_loss": -27.005966186523438, "global_step": 14598, "epoch": 120} {"train_loss": -27.663908004760742, "global_step": 14599, "epoch": 120} {"train_loss": -27.154150009155273, "global_step": 14600, "epoch": 120} {"train_loss": -27.191699981689453, "global_step": 14601, "epoch": 120} {"train_loss": -27.134057998657227, "global_step": 14602, "epoch": 120} {"train_loss": -27.720224380493164, "global_step": 14603, "epoch": 120} {"train_loss": -26.87371253967285, "global_step": 14604, "epoch": 120} {"train_loss": -26.563825607299805, "global_step": 14605, "epoch": 120} {"train_loss": -27.140378952026367, "global_step": 14606, "epoch": 120} {"train_loss": -27.665250778198242, "global_step": 14607, "epoch": 120} {"train_loss": -26.7575740814209, "global_step": 14608, "epoch": 120} {"train_loss": -26.562686920166016, "global_step": 14609, "epoch": 120} {"train_loss": -26.726526260375977, "global_step": 14610, "epoch": 120} {"train_loss": -26.660877227783203, "global_step": 14611, "epoch": 120} {"train_loss": -27.633264541625977, "global_step": 14612, "epoch": 120} {"train_loss": -26.11261558532715, "global_step": 14613, "epoch": 120} {"train_loss": -26.096460342407227, "global_step": 14614, "epoch": 120} {"train_loss": -27.610095977783203, "global_step": 14615, "epoch": 120} {"train_loss": -27.1268253326416, "global_step": 14616, "epoch": 120} {"train_loss": -27.159198760986328, "global_step": 14617, "epoch": 120} {"train_loss": -27.908349990844727, "global_step": 14618, "epoch": 120} {"train_loss": -26.578474044799805, "global_step": 14619, "epoch": 120} {"train_loss": -27.597137451171875, "global_step": 14620, "epoch": 120} {"train_loss": -27.744428634643555, "global_step": 14621, "epoch": 120} {"train_loss": -27.787256240844727, "global_step": 14622, "epoch": 120} {"train_loss": -27.7983341217041, "global_step": 14623, "epoch": 120} {"train_loss": -27.46485710144043, "global_step": 14624, "epoch": 120} {"train_loss": -27.71961784362793, "global_step": 14625, "epoch": 120} {"train_loss": -27.6798038482666, "global_step": 14626, "epoch": 120} {"train_loss": -28.175710678100586, "global_step": 14627, "epoch": 120} {"train_loss": -27.612049102783203, "global_step": 14628, "epoch": 120} {"train_loss": -27.838897705078125, "global_step": 14629, "epoch": 120} {"train_loss": -27.8719539642334, "global_step": 14630, "epoch": 120} {"train_loss": -27.590351104736328, "global_step": 14631, "epoch": 120} {"train_loss": -28.126239776611328, "global_step": 14632, "epoch": 120} {"train_loss": -28.065673828125, "global_step": 14633, "epoch": 120} {"train_loss": -28.41448402404785, "global_step": 14634, "epoch": 120} {"train_loss": -27.52143669128418, "global_step": 14635, "epoch": 120} {"train_loss": -28.540973663330078, "global_step": 14636, "epoch": 120} {"train_loss": -27.36310386657715, "global_step": 14637, "epoch": 120} {"train_loss": -26.731189727783203, "global_step": 14638, "epoch": 120} {"train_loss": -26.081897735595703, "global_step": 14639, "epoch": 120} {"train_loss": -27.039048171240434, "global_step": 14640, "epoch": 120, "val_loss": 2763989.75} {"train_loss": -25.31995964050293, "global_step": 14641, "epoch": 121} {"train_loss": -26.321517944335938, "global_step": 14642, "epoch": 121} {"train_loss": -27.65359878540039, "global_step": 14643, "epoch": 121} {"train_loss": -26.4652156829834, "global_step": 14644, "epoch": 121} {"train_loss": -25.55439567565918, "global_step": 14645, "epoch": 121} {"train_loss": -27.05474853515625, "global_step": 14646, "epoch": 121} {"train_loss": -27.220556259155273, "global_step": 14647, "epoch": 121} {"train_loss": -26.888269424438477, "global_step": 14648, "epoch": 121} {"train_loss": -27.661069869995117, "global_step": 14649, "epoch": 121} {"train_loss": -27.1251220703125, "global_step": 14650, "epoch": 121} {"train_loss": -28.111738204956055, "global_step": 14651, "epoch": 121} {"train_loss": -26.8715763092041, "global_step": 14652, "epoch": 121} {"train_loss": -27.517797470092773, "global_step": 14653, "epoch": 121} {"train_loss": -27.357816696166992, "global_step": 14654, "epoch": 121} {"train_loss": -28.2797794342041, "global_step": 14655, "epoch": 121} {"train_loss": -26.947864532470703, "global_step": 14656, "epoch": 121} {"train_loss": -27.591596603393555, "global_step": 14657, "epoch": 121} {"train_loss": -27.185749053955078, "global_step": 14658, "epoch": 121} {"train_loss": -27.161237716674805, "global_step": 14659, "epoch": 121} {"train_loss": -28.133472442626953, "global_step": 14660, "epoch": 121} {"train_loss": -27.287912368774414, "global_step": 14661, "epoch": 121} {"train_loss": -27.74287986755371, "global_step": 14662, "epoch": 121} {"train_loss": -27.457599639892578, "global_step": 14663, "epoch": 121} {"train_loss": -27.871463775634766, "global_step": 14664, "epoch": 121} {"train_loss": -27.4931583404541, "global_step": 14665, "epoch": 121} {"train_loss": -26.75221824645996, "global_step": 14666, "epoch": 121} {"train_loss": -26.771320343017578, "global_step": 14667, "epoch": 121} {"train_loss": -27.447370529174805, "global_step": 14668, "epoch": 121} {"train_loss": -27.739246368408203, "global_step": 14669, "epoch": 121} {"train_loss": -27.967838287353516, "global_step": 14670, "epoch": 121} {"train_loss": -27.932254791259766, "global_step": 14671, "epoch": 121} {"train_loss": -27.947830200195312, "global_step": 14672, "epoch": 121} {"train_loss": -27.854719161987305, "global_step": 14673, "epoch": 121} {"train_loss": -27.307687759399414, "global_step": 14674, "epoch": 121} {"train_loss": -27.356372833251953, "global_step": 14675, "epoch": 121} {"train_loss": -27.54718589782715, "global_step": 14676, "epoch": 121} {"train_loss": -27.5731258392334, "global_step": 14677, "epoch": 121} {"train_loss": -27.665510177612305, "global_step": 14678, "epoch": 121} {"train_loss": -28.100147247314453, "global_step": 14679, "epoch": 121} {"train_loss": -27.329193115234375, "global_step": 14680, "epoch": 121} {"train_loss": -27.7042179107666, "global_step": 14681, "epoch": 121} {"train_loss": -27.2451114654541, "global_step": 14682, "epoch": 121} {"train_loss": -27.830305099487305, "global_step": 14683, "epoch": 121} {"train_loss": -27.652847290039062, "global_step": 14684, "epoch": 121} {"train_loss": -26.6926326751709, "global_step": 14685, "epoch": 121} {"train_loss": -27.4129695892334, "global_step": 14686, "epoch": 121} {"train_loss": -26.8990478515625, "global_step": 14687, "epoch": 121} {"train_loss": -26.145334243774414, "global_step": 14688, "epoch": 121} {"train_loss": -26.59492301940918, "global_step": 14689, "epoch": 121} {"train_loss": -27.455068588256836, "global_step": 14690, "epoch": 121} {"train_loss": -27.580032348632812, "global_step": 14691, "epoch": 121} {"train_loss": -27.643285751342773, "global_step": 14692, "epoch": 121} {"train_loss": -27.269580841064453, "global_step": 14693, "epoch": 121} {"train_loss": -26.780603408813477, "global_step": 14694, "epoch": 121} {"train_loss": -27.47285270690918, "global_step": 14695, "epoch": 121} {"train_loss": -27.405078887939453, "global_step": 14696, "epoch": 121} {"train_loss": -27.6469783782959, "global_step": 14697, "epoch": 121} {"train_loss": -27.309707641601562, "global_step": 14698, "epoch": 121} {"train_loss": -27.0869140625, "global_step": 14699, "epoch": 121} {"train_loss": -26.738534927368164, "global_step": 14700, "epoch": 121} {"train_loss": -27.2176570892334, "global_step": 14701, "epoch": 121} {"train_loss": -27.935449600219727, "global_step": 14702, "epoch": 121} {"train_loss": -26.92328453063965, "global_step": 14703, "epoch": 121} {"train_loss": -27.236454010009766, "global_step": 14704, "epoch": 121} {"train_loss": -27.915876388549805, "global_step": 14705, "epoch": 121} {"train_loss": -26.9500675201416, "global_step": 14706, "epoch": 121} {"train_loss": -27.49295425415039, "global_step": 14707, "epoch": 121} {"train_loss": -27.122634887695312, "global_step": 14708, "epoch": 121} {"train_loss": -27.380659103393555, "global_step": 14709, "epoch": 121} {"train_loss": -26.828460693359375, "global_step": 14710, "epoch": 121} {"train_loss": -26.693958282470703, "global_step": 14711, "epoch": 121} {"train_loss": -28.1737060546875, "global_step": 14712, "epoch": 121} {"train_loss": -27.5671329498291, "global_step": 14713, "epoch": 121} {"train_loss": -26.555103302001953, "global_step": 14714, "epoch": 121} {"train_loss": -27.896350860595703, "global_step": 14715, "epoch": 121} {"train_loss": -27.245519638061523, "global_step": 14716, "epoch": 121} {"train_loss": -26.935453414916992, "global_step": 14717, "epoch": 121} {"train_loss": -27.963972091674805, "global_step": 14718, "epoch": 121} {"train_loss": -27.5908260345459, "global_step": 14719, "epoch": 121} {"train_loss": -27.256763458251953, "global_step": 14720, "epoch": 121} {"train_loss": -27.7894229888916, "global_step": 14721, "epoch": 121} {"train_loss": -27.64106559753418, "global_step": 14722, "epoch": 121} {"train_loss": -27.913095474243164, "global_step": 14723, "epoch": 121} {"train_loss": -27.985952377319336, "global_step": 14724, "epoch": 121} {"train_loss": -27.86762046813965, "global_step": 14725, "epoch": 121} {"train_loss": -28.214771270751953, "global_step": 14726, "epoch": 121} {"train_loss": -27.55118179321289, "global_step": 14727, "epoch": 121} {"train_loss": -28.163610458374023, "global_step": 14728, "epoch": 121} {"train_loss": -27.95209312438965, "global_step": 14729, "epoch": 121} {"train_loss": -28.133848190307617, "global_step": 14730, "epoch": 121} {"train_loss": -28.07149314880371, "global_step": 14731, "epoch": 121} {"train_loss": -27.95526123046875, "global_step": 14732, "epoch": 121} {"train_loss": -25.725168228149414, "global_step": 14733, "epoch": 121} {"train_loss": -21.7333984375, "global_step": 14734, "epoch": 121} {"train_loss": -12.057686805725098, "global_step": 14735, "epoch": 121} {"train_loss": -14.126083374023438, "global_step": 14736, "epoch": 121} {"train_loss": -26.430103302001953, "global_step": 14737, "epoch": 121} {"train_loss": -20.88966178894043, "global_step": 14738, "epoch": 121} {"train_loss": -22.737058639526367, "global_step": 14739, "epoch": 121} {"train_loss": -24.818437576293945, "global_step": 14740, "epoch": 121} {"train_loss": -25.3465633392334, "global_step": 14741, "epoch": 121} {"train_loss": -24.83538246154785, "global_step": 14742, "epoch": 121} {"train_loss": -25.275888442993164, "global_step": 14743, "epoch": 121} {"train_loss": -26.25214195251465, "global_step": 14744, "epoch": 121} {"train_loss": -25.937118530273438, "global_step": 14745, "epoch": 121} {"train_loss": -25.34980583190918, "global_step": 14746, "epoch": 121} {"train_loss": -26.101423263549805, "global_step": 14747, "epoch": 121} {"train_loss": -25.619733810424805, "global_step": 14748, "epoch": 121} {"train_loss": -26.173370361328125, "global_step": 14749, "epoch": 121} {"train_loss": -25.957361221313477, "global_step": 14750, "epoch": 121} {"train_loss": -26.485441207885742, "global_step": 14751, "epoch": 121} {"train_loss": -25.927404403686523, "global_step": 14752, "epoch": 121} {"train_loss": -26.562658309936523, "global_step": 14753, "epoch": 121} {"train_loss": -25.986907958984375, "global_step": 14754, "epoch": 121} {"train_loss": -26.447738647460938, "global_step": 14755, "epoch": 121} {"train_loss": -26.054779052734375, "global_step": 14756, "epoch": 121} {"train_loss": -26.752233505249023, "global_step": 14757, "epoch": 121} {"train_loss": -26.411865234375, "global_step": 14758, "epoch": 121} {"train_loss": -25.63185691833496, "global_step": 14759, "epoch": 121} {"train_loss": -26.617292404174805, "global_step": 14760, "epoch": 121} {"train_loss": -26.73732953820347, "global_step": 14761, "epoch": 121, "val_loss": 2685055.25} {"train_loss": -27.109533309936523, "global_step": 14762, "epoch": 122} {"train_loss": -26.59393310546875, "global_step": 14763, "epoch": 122} {"train_loss": -26.849353790283203, "global_step": 14764, "epoch": 122} {"train_loss": -26.494714736938477, "global_step": 14765, "epoch": 122} {"train_loss": -26.68128776550293, "global_step": 14766, "epoch": 122} {"train_loss": -26.455286026000977, "global_step": 14767, "epoch": 122} {"train_loss": -26.676559448242188, "global_step": 14768, "epoch": 122} {"train_loss": -26.421234130859375, "global_step": 14769, "epoch": 122} {"train_loss": -26.429630279541016, "global_step": 14770, "epoch": 122} {"train_loss": -26.44063377380371, "global_step": 14771, "epoch": 122} {"train_loss": -27.05946922302246, "global_step": 14772, "epoch": 122} {"train_loss": -26.294631958007812, "global_step": 14773, "epoch": 122} {"train_loss": -26.909353256225586, "global_step": 14774, "epoch": 122} {"train_loss": -26.593786239624023, "global_step": 14775, "epoch": 122} {"train_loss": -26.488950729370117, "global_step": 14776, "epoch": 122} {"train_loss": -26.57081413269043, "global_step": 14777, "epoch": 122} {"train_loss": -26.761707305908203, "global_step": 14778, "epoch": 122} {"train_loss": -26.18268394470215, "global_step": 14779, "epoch": 122} {"train_loss": -26.5090274810791, "global_step": 14780, "epoch": 122} {"train_loss": -26.686264038085938, "global_step": 14781, "epoch": 122} {"train_loss": -26.49349021911621, "global_step": 14782, "epoch": 122} {"train_loss": -27.41839599609375, "global_step": 14783, "epoch": 122} {"train_loss": -26.879621505737305, "global_step": 14784, "epoch": 122} {"train_loss": -26.51063346862793, "global_step": 14785, "epoch": 122} {"train_loss": -25.63623046875, "global_step": 14786, "epoch": 122} {"train_loss": -24.300373077392578, "global_step": 14787, "epoch": 122} {"train_loss": -23.754486083984375, "global_step": 14788, "epoch": 122} {"train_loss": -24.818103790283203, "global_step": 14789, "epoch": 122} {"train_loss": -25.919437408447266, "global_step": 14790, "epoch": 122} {"train_loss": -26.158370971679688, "global_step": 14791, "epoch": 122} {"train_loss": -25.751953125, "global_step": 14792, "epoch": 122} {"train_loss": -26.822004318237305, "global_step": 14793, "epoch": 122} {"train_loss": -26.380512237548828, "global_step": 14794, "epoch": 122} {"train_loss": -26.955121994018555, "global_step": 14795, "epoch": 122} {"train_loss": -26.637205123901367, "global_step": 14796, "epoch": 122} {"train_loss": -27.27054786682129, "global_step": 14797, "epoch": 122} {"train_loss": -26.679533004760742, "global_step": 14798, "epoch": 122} {"train_loss": -26.943042755126953, "global_step": 14799, "epoch": 122} {"train_loss": -26.904993057250977, "global_step": 14800, "epoch": 122} {"train_loss": -27.22393798828125, "global_step": 14801, "epoch": 122} {"train_loss": -27.342365264892578, "global_step": 14802, "epoch": 122} {"train_loss": -26.999969482421875, "global_step": 14803, "epoch": 122} {"train_loss": -26.91840171813965, "global_step": 14804, "epoch": 122} {"train_loss": -26.908578872680664, "global_step": 14805, "epoch": 122} {"train_loss": -27.188901901245117, "global_step": 14806, "epoch": 122} {"train_loss": -27.172590255737305, "global_step": 14807, "epoch": 122} {"train_loss": -27.058725357055664, "global_step": 14808, "epoch": 122} {"train_loss": -27.028905868530273, "global_step": 14809, "epoch": 122} {"train_loss": -26.441980361938477, "global_step": 14810, "epoch": 122} {"train_loss": -27.12201499938965, "global_step": 14811, "epoch": 122} {"train_loss": -27.25301170349121, "global_step": 14812, "epoch": 122} {"train_loss": -27.560016632080078, "global_step": 14813, "epoch": 122} {"train_loss": -27.269367218017578, "global_step": 14814, "epoch": 122} {"train_loss": -27.366073608398438, "global_step": 14815, "epoch": 122} {"train_loss": -27.88654136657715, "global_step": 14816, "epoch": 122} {"train_loss": -27.244653701782227, "global_step": 14817, "epoch": 122} {"train_loss": -26.309234619140625, "global_step": 14818, "epoch": 122} {"train_loss": -26.55789566040039, "global_step": 14819, "epoch": 122} {"train_loss": -26.90043067932129, "global_step": 14820, "epoch": 122} {"train_loss": -27.117324829101562, "global_step": 14821, "epoch": 122} {"train_loss": -25.329666137695312, "global_step": 14822, "epoch": 122} {"train_loss": -26.523862838745117, "global_step": 14823, "epoch": 122} {"train_loss": -27.520719528198242, "global_step": 14824, "epoch": 122} {"train_loss": -25.99275016784668, "global_step": 14825, "epoch": 122} {"train_loss": -26.930805206298828, "global_step": 14826, "epoch": 122} {"train_loss": -27.490644454956055, "global_step": 14827, "epoch": 122} {"train_loss": -27.192346572875977, "global_step": 14828, "epoch": 122} {"train_loss": -27.41965103149414, "global_step": 14829, "epoch": 122} {"train_loss": -26.674591064453125, "global_step": 14830, "epoch": 122} {"train_loss": -24.831418991088867, "global_step": 14831, "epoch": 122} {"train_loss": -23.644983291625977, "global_step": 14832, "epoch": 122} {"train_loss": -25.792266845703125, "global_step": 14833, "epoch": 122} {"train_loss": -26.922473907470703, "global_step": 14834, "epoch": 122} {"train_loss": -26.66729164123535, "global_step": 14835, "epoch": 122} {"train_loss": -26.5466365814209, "global_step": 14836, "epoch": 122} {"train_loss": -26.70696449279785, "global_step": 14837, "epoch": 122} {"train_loss": -26.848926544189453, "global_step": 14838, "epoch": 122} {"train_loss": -27.503158569335938, "global_step": 14839, "epoch": 122} {"train_loss": -26.980749130249023, "global_step": 14840, "epoch": 122} {"train_loss": -27.435626983642578, "global_step": 14841, "epoch": 122} {"train_loss": -27.30867576599121, "global_step": 14842, "epoch": 122} {"train_loss": -27.27455711364746, "global_step": 14843, "epoch": 122} {"train_loss": -27.41718101501465, "global_step": 14844, "epoch": 122} {"train_loss": -27.311792373657227, "global_step": 14845, "epoch": 122} {"train_loss": -27.28192710876465, "global_step": 14846, "epoch": 122} {"train_loss": -27.008316040039062, "global_step": 14847, "epoch": 122} {"train_loss": -27.839828491210938, "global_step": 14848, "epoch": 122} {"train_loss": -26.998544692993164, "global_step": 14849, "epoch": 122} {"train_loss": -27.125879287719727, "global_step": 14850, "epoch": 122} {"train_loss": -27.535486221313477, "global_step": 14851, "epoch": 122} {"train_loss": -27.34976577758789, "global_step": 14852, "epoch": 122} {"train_loss": -26.69068717956543, "global_step": 14853, "epoch": 122} {"train_loss": -27.417139053344727, "global_step": 14854, "epoch": 122} {"train_loss": -27.106943130493164, "global_step": 14855, "epoch": 122} {"train_loss": -26.40150260925293, "global_step": 14856, "epoch": 122} {"train_loss": -27.32761001586914, "global_step": 14857, "epoch": 122} {"train_loss": -26.18269920349121, "global_step": 14858, "epoch": 122} {"train_loss": -24.091814041137695, "global_step": 14859, "epoch": 122} {"train_loss": -25.60483169555664, "global_step": 14860, "epoch": 122} {"train_loss": -27.414731979370117, "global_step": 14861, "epoch": 122} {"train_loss": -26.52008056640625, "global_step": 14862, "epoch": 122} {"train_loss": -27.353656768798828, "global_step": 14863, "epoch": 122} {"train_loss": -27.834508895874023, "global_step": 14864, "epoch": 122} {"train_loss": -27.42789649963379, "global_step": 14865, "epoch": 122} {"train_loss": -27.277761459350586, "global_step": 14866, "epoch": 122} {"train_loss": -27.881763458251953, "global_step": 14867, "epoch": 122} {"train_loss": -27.710744857788086, "global_step": 14868, "epoch": 122} {"train_loss": -27.685285568237305, "global_step": 14869, "epoch": 122} {"train_loss": -27.662368774414062, "global_step": 14870, "epoch": 122} {"train_loss": -27.786212921142578, "global_step": 14871, "epoch": 122} {"train_loss": -27.833139419555664, "global_step": 14872, "epoch": 122} {"train_loss": -27.7758731842041, "global_step": 14873, "epoch": 122} {"train_loss": -27.885656356811523, "global_step": 14874, "epoch": 122} {"train_loss": -27.984699249267578, "global_step": 14875, "epoch": 122} {"train_loss": -27.45880699157715, "global_step": 14876, "epoch": 122} {"train_loss": -27.942340850830078, "global_step": 14877, "epoch": 122} {"train_loss": -27.804059982299805, "global_step": 14878, "epoch": 122} {"train_loss": -27.60626220703125, "global_step": 14879, "epoch": 122} {"train_loss": -28.119205474853516, "global_step": 14880, "epoch": 122} {"train_loss": -27.585493087768555, "global_step": 14881, "epoch": 122} {"train_loss": -26.85977407723419, "global_step": 14882, "epoch": 122, "val_loss": 2792329.5} {"train_loss": -28.11687660217285, "global_step": 14883, "epoch": 123} {"train_loss": -27.86236572265625, "global_step": 14884, "epoch": 123} {"train_loss": -28.170377731323242, "global_step": 14885, "epoch": 123} {"train_loss": -27.756988525390625, "global_step": 14886, "epoch": 123} {"train_loss": -27.66961669921875, "global_step": 14887, "epoch": 123} {"train_loss": -27.710229873657227, "global_step": 14888, "epoch": 123} {"train_loss": -27.53729248046875, "global_step": 14889, "epoch": 123} {"train_loss": -26.68143081665039, "global_step": 14890, "epoch": 123} {"train_loss": -25.07628059387207, "global_step": 14891, "epoch": 123} {"train_loss": -23.05360984802246, "global_step": 14892, "epoch": 123} {"train_loss": -18.671398162841797, "global_step": 14893, "epoch": 123} {"train_loss": -19.161510467529297, "global_step": 14894, "epoch": 123} {"train_loss": -26.637908935546875, "global_step": 14895, "epoch": 123} {"train_loss": -24.026575088500977, "global_step": 14896, "epoch": 123} {"train_loss": -26.34238624572754, "global_step": 14897, "epoch": 123} {"train_loss": -24.731000900268555, "global_step": 14898, "epoch": 123} {"train_loss": -26.284696578979492, "global_step": 14899, "epoch": 123} {"train_loss": -25.380170822143555, "global_step": 14900, "epoch": 123} {"train_loss": -26.462472915649414, "global_step": 14901, "epoch": 123} {"train_loss": -26.83867835998535, "global_step": 14902, "epoch": 123} {"train_loss": -26.863245010375977, "global_step": 14903, "epoch": 123} {"train_loss": -26.513671875, "global_step": 14904, "epoch": 123} {"train_loss": -26.840551376342773, "global_step": 14905, "epoch": 123} {"train_loss": -26.73176383972168, "global_step": 14906, "epoch": 123} {"train_loss": -26.894514083862305, "global_step": 14907, "epoch": 123} {"train_loss": -26.35346794128418, "global_step": 14908, "epoch": 123} {"train_loss": -27.026046752929688, "global_step": 14909, "epoch": 123} {"train_loss": -26.7481689453125, "global_step": 14910, "epoch": 123} {"train_loss": -26.57056999206543, "global_step": 14911, "epoch": 123} {"train_loss": -27.075763702392578, "global_step": 14912, "epoch": 123} {"train_loss": -26.417373657226562, "global_step": 14913, "epoch": 123} {"train_loss": -27.04583740234375, "global_step": 14914, "epoch": 123} {"train_loss": -27.323383331298828, "global_step": 14915, "epoch": 123} {"train_loss": -27.6022891998291, "global_step": 14916, "epoch": 123} {"train_loss": -27.21002197265625, "global_step": 14917, "epoch": 123} {"train_loss": -27.269500732421875, "global_step": 14918, "epoch": 123} {"train_loss": -27.154560089111328, "global_step": 14919, "epoch": 123} {"train_loss": -27.207111358642578, "global_step": 14920, "epoch": 123} {"train_loss": -27.4735107421875, "global_step": 14921, "epoch": 123} {"train_loss": -27.47503089904785, "global_step": 14922, "epoch": 123} {"train_loss": -27.3057918548584, "global_step": 14923, "epoch": 123} {"train_loss": -27.40907096862793, "global_step": 14924, "epoch": 123} {"train_loss": -27.028928756713867, "global_step": 14925, "epoch": 123} {"train_loss": -27.34714698791504, "global_step": 14926, "epoch": 123} {"train_loss": -26.719696044921875, "global_step": 14927, "epoch": 123} {"train_loss": -26.514942169189453, "global_step": 14928, "epoch": 123} {"train_loss": -25.831396102905273, "global_step": 14929, "epoch": 123} {"train_loss": -24.90753746032715, "global_step": 14930, "epoch": 123} {"train_loss": -20.37699317932129, "global_step": 14931, "epoch": 123} {"train_loss": -18.392038345336914, "global_step": 14932, "epoch": 123} {"train_loss": -23.98658561706543, "global_step": 14933, "epoch": 123} {"train_loss": -26.704328536987305, "global_step": 14934, "epoch": 123} {"train_loss": -23.651968002319336, "global_step": 14935, "epoch": 123} {"train_loss": -26.851367950439453, "global_step": 14936, "epoch": 123} {"train_loss": -25.55600929260254, "global_step": 14937, "epoch": 123} {"train_loss": -26.854877471923828, "global_step": 14938, "epoch": 123} {"train_loss": -26.281131744384766, "global_step": 14939, "epoch": 123} {"train_loss": -26.43192481994629, "global_step": 14940, "epoch": 123} {"train_loss": -27.106420516967773, "global_step": 14941, "epoch": 123} {"train_loss": -26.540435791015625, "global_step": 14942, "epoch": 123} {"train_loss": -25.7242374420166, "global_step": 14943, "epoch": 123} {"train_loss": -26.929086685180664, "global_step": 14944, "epoch": 123} {"train_loss": -26.975391387939453, "global_step": 14945, "epoch": 123} {"train_loss": -26.766265869140625, "global_step": 14946, "epoch": 123} {"train_loss": -26.884174346923828, "global_step": 14947, "epoch": 123} {"train_loss": -26.261320114135742, "global_step": 14948, "epoch": 123} {"train_loss": -26.336170196533203, "global_step": 14949, "epoch": 123} {"train_loss": -27.253110885620117, "global_step": 14950, "epoch": 123} {"train_loss": -27.04218101501465, "global_step": 14951, "epoch": 123} {"train_loss": -27.103479385375977, "global_step": 14952, "epoch": 123} {"train_loss": -26.871225357055664, "global_step": 14953, "epoch": 123} {"train_loss": -26.768972396850586, "global_step": 14954, "epoch": 123} {"train_loss": -27.15227699279785, "global_step": 14955, "epoch": 123} {"train_loss": -27.299060821533203, "global_step": 14956, "epoch": 123} {"train_loss": -27.191556930541992, "global_step": 14957, "epoch": 123} {"train_loss": -27.0059871673584, "global_step": 14958, "epoch": 123} {"train_loss": -27.071496963500977, "global_step": 14959, "epoch": 123} {"train_loss": -27.294885635375977, "global_step": 14960, "epoch": 123} {"train_loss": -27.43003273010254, "global_step": 14961, "epoch": 123} {"train_loss": -27.398950576782227, "global_step": 14962, "epoch": 123} {"train_loss": -27.287710189819336, "global_step": 14963, "epoch": 123} {"train_loss": -26.9527530670166, "global_step": 14964, "epoch": 123} {"train_loss": -26.040868759155273, "global_step": 14965, "epoch": 123} {"train_loss": -26.820911407470703, "global_step": 14966, "epoch": 123} {"train_loss": -27.384490966796875, "global_step": 14967, "epoch": 123} {"train_loss": -27.23516273498535, "global_step": 14968, "epoch": 123} {"train_loss": -27.292871475219727, "global_step": 14969, "epoch": 123} {"train_loss": -27.67062759399414, "global_step": 14970, "epoch": 123} {"train_loss": -26.68137550354004, "global_step": 14971, "epoch": 123} {"train_loss": -27.460315704345703, "global_step": 14972, "epoch": 123} {"train_loss": -27.866043090820312, "global_step": 14973, "epoch": 123} {"train_loss": -26.542682647705078, "global_step": 14974, "epoch": 123} {"train_loss": -26.959522247314453, "global_step": 14975, "epoch": 123} {"train_loss": -27.083044052124023, "global_step": 14976, "epoch": 123} {"train_loss": -27.371936798095703, "global_step": 14977, "epoch": 123} {"train_loss": -27.36702537536621, "global_step": 14978, "epoch": 123} {"train_loss": -27.413299560546875, "global_step": 14979, "epoch": 123} {"train_loss": -27.98493766784668, "global_step": 14980, "epoch": 123} {"train_loss": -27.689441680908203, "global_step": 14981, "epoch": 123} {"train_loss": -27.484155654907227, "global_step": 14982, "epoch": 123} {"train_loss": -26.923532485961914, "global_step": 14983, "epoch": 123} {"train_loss": -27.383331298828125, "global_step": 14984, "epoch": 123} {"train_loss": -27.41126823425293, "global_step": 14985, "epoch": 123} {"train_loss": -27.513715744018555, "global_step": 14986, "epoch": 123} {"train_loss": -27.434234619140625, "global_step": 14987, "epoch": 123} {"train_loss": -27.786970138549805, "global_step": 14988, "epoch": 123} {"train_loss": -27.802631378173828, "global_step": 14989, "epoch": 123} {"train_loss": -27.95648193359375, "global_step": 14990, "epoch": 123} {"train_loss": -28.089323043823242, "global_step": 14991, "epoch": 123} {"train_loss": -27.465717315673828, "global_step": 14992, "epoch": 123} {"train_loss": -27.586078643798828, "global_step": 14993, "epoch": 123} {"train_loss": -27.2382869720459, "global_step": 14994, "epoch": 123} {"train_loss": -26.465564727783203, "global_step": 14995, "epoch": 123} {"train_loss": -27.486682891845703, "global_step": 14996, "epoch": 123} {"train_loss": -26.866201400756836, "global_step": 14997, "epoch": 123} {"train_loss": -27.55378532409668, "global_step": 14998, "epoch": 123} {"train_loss": -27.597675323486328, "global_step": 14999, "epoch": 123} {"train_loss": -26.78169822692871, "global_step": 15000, "epoch": 123} {"train_loss": -27.782032012939453, "global_step": 15001, "epoch": 123} {"train_loss": -27.710464477539062, "global_step": 15002, "epoch": 123} {"train_loss": -26.65723803811822, "global_step": 15003, "epoch": 123, "val_loss": 2480025.75} {"train_loss": -27.39215660095215, "global_step": 15004, "epoch": 124} {"train_loss": -27.38811683654785, "global_step": 15005, "epoch": 124} {"train_loss": -27.6156005859375, "global_step": 15006, "epoch": 124} {"train_loss": -27.384384155273438, "global_step": 15007, "epoch": 124} {"train_loss": -27.75567626953125, "global_step": 15008, "epoch": 124} {"train_loss": -27.980310440063477, "global_step": 15009, "epoch": 124} {"train_loss": -27.784454345703125, "global_step": 15010, "epoch": 124} {"train_loss": -27.721160888671875, "global_step": 15011, "epoch": 124} {"train_loss": -28.05636978149414, "global_step": 15012, "epoch": 124} {"train_loss": -27.8723087310791, "global_step": 15013, "epoch": 124} {"train_loss": -26.62595558166504, "global_step": 15014, "epoch": 124} {"train_loss": -28.208154678344727, "global_step": 15015, "epoch": 124} {"train_loss": -28.042768478393555, "global_step": 15016, "epoch": 124} {"train_loss": -27.913602828979492, "global_step": 15017, "epoch": 124} {"train_loss": -28.44756507873535, "global_step": 15018, "epoch": 124} {"train_loss": -27.81110191345215, "global_step": 15019, "epoch": 124} {"train_loss": -27.908248901367188, "global_step": 15020, "epoch": 124} {"train_loss": -27.56644630432129, "global_step": 15021, "epoch": 124} {"train_loss": -27.25452995300293, "global_step": 15022, "epoch": 124} {"train_loss": -27.269617080688477, "global_step": 15023, "epoch": 124} {"train_loss": -26.67998695373535, "global_step": 15024, "epoch": 124} {"train_loss": -24.238115310668945, "global_step": 15025, "epoch": 124} {"train_loss": -28.35275650024414, "global_step": 15026, "epoch": 124} {"train_loss": -26.6070613861084, "global_step": 15027, "epoch": 124} {"train_loss": -27.78358268737793, "global_step": 15028, "epoch": 124} {"train_loss": -27.323379516601562, "global_step": 15029, "epoch": 124} {"train_loss": -27.994718551635742, "global_step": 15030, "epoch": 124} {"train_loss": -27.264312744140625, "global_step": 15031, "epoch": 124} {"train_loss": -28.01594352722168, "global_step": 15032, "epoch": 124} {"train_loss": -28.44843864440918, "global_step": 15033, "epoch": 124} {"train_loss": -28.297000885009766, "global_step": 15034, "epoch": 124} {"train_loss": -27.953693389892578, "global_step": 15035, "epoch": 124} {"train_loss": -28.32830810546875, "global_step": 15036, "epoch": 124} {"train_loss": -28.5521183013916, "global_step": 15037, "epoch": 124} {"train_loss": -27.68521499633789, "global_step": 15038, "epoch": 124} {"train_loss": -27.625293731689453, "global_step": 15039, "epoch": 124} {"train_loss": -28.024951934814453, "global_step": 15040, "epoch": 124} {"train_loss": -28.006607055664062, "global_step": 15041, "epoch": 124} {"train_loss": -27.639204025268555, "global_step": 15042, "epoch": 124} {"train_loss": -27.423404693603516, "global_step": 15043, "epoch": 124} {"train_loss": -26.871356964111328, "global_step": 15044, "epoch": 124} {"train_loss": -26.5458927154541, "global_step": 15045, "epoch": 124} {"train_loss": -25.677438735961914, "global_step": 15046, "epoch": 124} {"train_loss": -25.385683059692383, "global_step": 15047, "epoch": 124} {"train_loss": -27.261993408203125, "global_step": 15048, "epoch": 124} {"train_loss": -27.585962295532227, "global_step": 15049, "epoch": 124} {"train_loss": -27.322118759155273, "global_step": 15050, "epoch": 124} {"train_loss": -27.11484146118164, "global_step": 15051, "epoch": 124} {"train_loss": -26.5999698638916, "global_step": 15052, "epoch": 124} {"train_loss": -27.112445831298828, "global_step": 15053, "epoch": 124} {"train_loss": -27.904096603393555, "global_step": 15054, "epoch": 124} {"train_loss": -27.2640323638916, "global_step": 15055, "epoch": 124} {"train_loss": -27.268741607666016, "global_step": 15056, "epoch": 124} {"train_loss": -27.875396728515625, "global_step": 15057, "epoch": 124} {"train_loss": -27.580224990844727, "global_step": 15058, "epoch": 124} {"train_loss": -27.0607967376709, "global_step": 15059, "epoch": 124} {"train_loss": -26.94590187072754, "global_step": 15060, "epoch": 124} {"train_loss": -27.380014419555664, "global_step": 15061, "epoch": 124} {"train_loss": -27.1158447265625, "global_step": 15062, "epoch": 124} {"train_loss": -27.73004722595215, "global_step": 15063, "epoch": 124} {"train_loss": -27.726755142211914, "global_step": 15064, "epoch": 124} {"train_loss": -27.16015625, "global_step": 15065, "epoch": 124} {"train_loss": -27.471817016601562, "global_step": 15066, "epoch": 124} {"train_loss": -27.831083297729492, "global_step": 15067, "epoch": 124} {"train_loss": -27.926712036132812, "global_step": 15068, "epoch": 124} {"train_loss": -27.737009048461914, "global_step": 15069, "epoch": 124} {"train_loss": -27.970569610595703, "global_step": 15070, "epoch": 124} {"train_loss": -27.544225692749023, "global_step": 15071, "epoch": 124} {"train_loss": -27.468536376953125, "global_step": 15072, "epoch": 124} {"train_loss": -27.653823852539062, "global_step": 15073, "epoch": 124} {"train_loss": -27.702245712280273, "global_step": 15074, "epoch": 124} {"train_loss": -27.635894775390625, "global_step": 15075, "epoch": 124} {"train_loss": -27.731597900390625, "global_step": 15076, "epoch": 124} {"train_loss": -28.197172164916992, "global_step": 15077, "epoch": 124} {"train_loss": -28.175586700439453, "global_step": 15078, "epoch": 124} {"train_loss": -28.060699462890625, "global_step": 15079, "epoch": 124} {"train_loss": -28.27216148376465, "global_step": 15080, "epoch": 124} {"train_loss": -28.18115234375, "global_step": 15081, "epoch": 124} {"train_loss": -27.754470825195312, "global_step": 15082, "epoch": 124} {"train_loss": -27.07733154296875, "global_step": 15083, "epoch": 124} {"train_loss": -27.53827476501465, "global_step": 15084, "epoch": 124} {"train_loss": -27.409162521362305, "global_step": 15085, "epoch": 124} {"train_loss": -26.572193145751953, "global_step": 15086, "epoch": 124} {"train_loss": -27.959497451782227, "global_step": 15087, "epoch": 124} {"train_loss": -28.1662654876709, "global_step": 15088, "epoch": 124} {"train_loss": -26.98089027404785, "global_step": 15089, "epoch": 124} {"train_loss": -27.898212432861328, "global_step": 15090, "epoch": 124} {"train_loss": -27.86746597290039, "global_step": 15091, "epoch": 124} {"train_loss": -27.132253646850586, "global_step": 15092, "epoch": 124} {"train_loss": -28.141632080078125, "global_step": 15093, "epoch": 124} {"train_loss": -28.234378814697266, "global_step": 15094, "epoch": 124} {"train_loss": -27.713977813720703, "global_step": 15095, "epoch": 124} {"train_loss": -28.21503257751465, "global_step": 15096, "epoch": 124} {"train_loss": -28.172256469726562, "global_step": 15097, "epoch": 124} {"train_loss": -27.771329879760742, "global_step": 15098, "epoch": 124} {"train_loss": -28.029022216796875, "global_step": 15099, "epoch": 124} {"train_loss": -28.005163192749023, "global_step": 15100, "epoch": 124} {"train_loss": -28.360309600830078, "global_step": 15101, "epoch": 124} {"train_loss": -28.557342529296875, "global_step": 15102, "epoch": 124} {"train_loss": -28.57246208190918, "global_step": 15103, "epoch": 124} {"train_loss": -28.429372787475586, "global_step": 15104, "epoch": 124} {"train_loss": -28.141809463500977, "global_step": 15105, "epoch": 124} {"train_loss": -27.74818229675293, "global_step": 15106, "epoch": 124} {"train_loss": -26.926786422729492, "global_step": 15107, "epoch": 124} {"train_loss": -22.849132537841797, "global_step": 15108, "epoch": 124} {"train_loss": -17.52739906311035, "global_step": 15109, "epoch": 124} {"train_loss": -10.903021812438965, "global_step": 15110, "epoch": 124} {"train_loss": -19.613737106323242, "global_step": 15111, "epoch": 124} {"train_loss": -26.4269962310791, "global_step": 15112, "epoch": 124} {"train_loss": -24.000442504882812, "global_step": 15113, "epoch": 124} {"train_loss": -24.500442504882812, "global_step": 15114, "epoch": 124} {"train_loss": -27.081586837768555, "global_step": 15115, "epoch": 124} {"train_loss": -24.762985229492188, "global_step": 15116, "epoch": 124} {"train_loss": -25.234800338745117, "global_step": 15117, "epoch": 124} {"train_loss": -27.12078857421875, "global_step": 15118, "epoch": 124} {"train_loss": -26.444074630737305, "global_step": 15119, "epoch": 124} {"train_loss": -26.051715850830078, "global_step": 15120, "epoch": 124} {"train_loss": -26.488616943359375, "global_step": 15121, "epoch": 124} {"train_loss": -26.62208366394043, "global_step": 15122, "epoch": 124} {"train_loss": -26.568069458007812, "global_step": 15123, "epoch": 124} {"train_loss": -27.113525824113324, "global_step": 15124, "epoch": 124, "val_loss": 2758009.0} {"train_loss": -26.85809326171875, "global_step": 15125, "epoch": 125} {"train_loss": -26.752710342407227, "global_step": 15126, "epoch": 125} {"train_loss": -26.695348739624023, "global_step": 15127, "epoch": 125} {"train_loss": -26.79288101196289, "global_step": 15128, "epoch": 125} {"train_loss": -27.321699142456055, "global_step": 15129, "epoch": 125} {"train_loss": -26.648101806640625, "global_step": 15130, "epoch": 125} {"train_loss": -26.827123641967773, "global_step": 15131, "epoch": 125} {"train_loss": -26.495824813842773, "global_step": 15132, "epoch": 125} {"train_loss": -26.01432228088379, "global_step": 15133, "epoch": 125} {"train_loss": -26.238515853881836, "global_step": 15134, "epoch": 125} {"train_loss": -27.05828857421875, "global_step": 15135, "epoch": 125} {"train_loss": -27.185556411743164, "global_step": 15136, "epoch": 125} {"train_loss": -26.84686279296875, "global_step": 15137, "epoch": 125} {"train_loss": -26.47265625, "global_step": 15138, "epoch": 125} {"train_loss": -27.058923721313477, "global_step": 15139, "epoch": 125} {"train_loss": -27.2259464263916, "global_step": 15140, "epoch": 125} {"train_loss": -26.525833129882812, "global_step": 15141, "epoch": 125} {"train_loss": -26.100324630737305, "global_step": 15142, "epoch": 125} {"train_loss": -26.163610458374023, "global_step": 15143, "epoch": 125} {"train_loss": -26.8819522857666, "global_step": 15144, "epoch": 125} {"train_loss": -27.652729034423828, "global_step": 15145, "epoch": 125} {"train_loss": -26.6833553314209, "global_step": 15146, "epoch": 125} {"train_loss": -27.232196807861328, "global_step": 15147, "epoch": 125} {"train_loss": -27.931537628173828, "global_step": 15148, "epoch": 125} {"train_loss": -27.368146896362305, "global_step": 15149, "epoch": 125} {"train_loss": -26.898313522338867, "global_step": 15150, "epoch": 125} {"train_loss": -27.599384307861328, "global_step": 15151, "epoch": 125} {"train_loss": -27.106781005859375, "global_step": 15152, "epoch": 125} {"train_loss": -27.491403579711914, "global_step": 15153, "epoch": 125} {"train_loss": -26.702457427978516, "global_step": 15154, "epoch": 125} {"train_loss": -26.503965377807617, "global_step": 15155, "epoch": 125} {"train_loss": -25.954843521118164, "global_step": 15156, "epoch": 125} {"train_loss": -27.014570236206055, "global_step": 15157, "epoch": 125} {"train_loss": -26.954004287719727, "global_step": 15158, "epoch": 125} {"train_loss": -26.779638290405273, "global_step": 15159, "epoch": 125} {"train_loss": -26.795063018798828, "global_step": 15160, "epoch": 125} {"train_loss": -26.0684871673584, "global_step": 15161, "epoch": 125} {"train_loss": -27.844385147094727, "global_step": 15162, "epoch": 125} {"train_loss": -26.006683349609375, "global_step": 15163, "epoch": 125} {"train_loss": -26.192337036132812, "global_step": 15164, "epoch": 125} {"train_loss": -27.650089263916016, "global_step": 15165, "epoch": 125} {"train_loss": -26.815805435180664, "global_step": 15166, "epoch": 125} {"train_loss": -27.468847274780273, "global_step": 15167, "epoch": 125} {"train_loss": -27.5728759765625, "global_step": 15168, "epoch": 125} {"train_loss": -27.268476486206055, "global_step": 15169, "epoch": 125} {"train_loss": -27.556562423706055, "global_step": 15170, "epoch": 125} {"train_loss": -27.441068649291992, "global_step": 15171, "epoch": 125} {"train_loss": -26.944089889526367, "global_step": 15172, "epoch": 125} {"train_loss": -25.95538330078125, "global_step": 15173, "epoch": 125} {"train_loss": -27.41373062133789, "global_step": 15174, "epoch": 125} {"train_loss": -26.99909782409668, "global_step": 15175, "epoch": 125} {"train_loss": -27.447742462158203, "global_step": 15176, "epoch": 125} {"train_loss": -26.91645622253418, "global_step": 15177, "epoch": 125} {"train_loss": -26.950483322143555, "global_step": 15178, "epoch": 125} {"train_loss": -27.488895416259766, "global_step": 15179, "epoch": 125} {"train_loss": -27.44038963317871, "global_step": 15180, "epoch": 125} {"train_loss": -27.150049209594727, "global_step": 15181, "epoch": 125} {"train_loss": -27.03571891784668, "global_step": 15182, "epoch": 125} {"train_loss": -27.4764347076416, "global_step": 15183, "epoch": 125} {"train_loss": -27.430517196655273, "global_step": 15184, "epoch": 125} {"train_loss": -27.2861270904541, "global_step": 15185, "epoch": 125} {"train_loss": -27.581113815307617, "global_step": 15186, "epoch": 125} {"train_loss": -26.82850456237793, "global_step": 15187, "epoch": 125} {"train_loss": -27.572885513305664, "global_step": 15188, "epoch": 125} {"train_loss": -27.809797286987305, "global_step": 15189, "epoch": 125} {"train_loss": -27.3704891204834, "global_step": 15190, "epoch": 125} {"train_loss": -27.792200088500977, "global_step": 15191, "epoch": 125} {"train_loss": -27.70953941345215, "global_step": 15192, "epoch": 125} {"train_loss": -28.139875411987305, "global_step": 15193, "epoch": 125} {"train_loss": -28.0738525390625, "global_step": 15194, "epoch": 125} {"train_loss": -27.840063095092773, "global_step": 15195, "epoch": 125} {"train_loss": -27.582334518432617, "global_step": 15196, "epoch": 125} {"train_loss": -27.906518936157227, "global_step": 15197, "epoch": 125} {"train_loss": -27.522214889526367, "global_step": 15198, "epoch": 125} {"train_loss": -27.73587989807129, "global_step": 15199, "epoch": 125} {"train_loss": -27.928735733032227, "global_step": 15200, "epoch": 125} {"train_loss": -27.957046508789062, "global_step": 15201, "epoch": 125} {"train_loss": -27.6818904876709, "global_step": 15202, "epoch": 125} {"train_loss": -27.5767765045166, "global_step": 15203, "epoch": 125} {"train_loss": -27.811548233032227, "global_step": 15204, "epoch": 125} {"train_loss": -28.03554344177246, "global_step": 15205, "epoch": 125} {"train_loss": -27.540790557861328, "global_step": 15206, "epoch": 125} {"train_loss": -28.019001007080078, "global_step": 15207, "epoch": 125} {"train_loss": -27.946874618530273, "global_step": 15208, "epoch": 125} {"train_loss": -28.1539363861084, "global_step": 15209, "epoch": 125} {"train_loss": -27.915969848632812, "global_step": 15210, "epoch": 125} {"train_loss": -27.459426879882812, "global_step": 15211, "epoch": 125} {"train_loss": -26.834564208984375, "global_step": 15212, "epoch": 125} {"train_loss": -23.082685470581055, "global_step": 15213, "epoch": 125} {"train_loss": -15.1856050491333, "global_step": 15214, "epoch": 125} {"train_loss": -7.447761058807373, "global_step": 15215, "epoch": 125} {"train_loss": -19.48280143737793, "global_step": 15216, "epoch": 125} {"train_loss": -23.1969051361084, "global_step": 15217, "epoch": 125} {"train_loss": -24.41193962097168, "global_step": 15218, "epoch": 125} {"train_loss": -21.080713272094727, "global_step": 15219, "epoch": 125} {"train_loss": -23.753692626953125, "global_step": 15220, "epoch": 125} {"train_loss": -23.582250595092773, "global_step": 15221, "epoch": 125} {"train_loss": -23.845046997070312, "global_step": 15222, "epoch": 125} {"train_loss": -22.045623779296875, "global_step": 15223, "epoch": 125} {"train_loss": -26.292585372924805, "global_step": 15224, "epoch": 125} {"train_loss": -25.067811965942383, "global_step": 15225, "epoch": 125} {"train_loss": -25.33053970336914, "global_step": 15226, "epoch": 125} {"train_loss": -24.63194465637207, "global_step": 15227, "epoch": 125} {"train_loss": -25.277070999145508, "global_step": 15228, "epoch": 125} {"train_loss": -24.790878295898438, "global_step": 15229, "epoch": 125} {"train_loss": -26.129043579101562, "global_step": 15230, "epoch": 125} {"train_loss": -25.8579158782959, "global_step": 15231, "epoch": 125} {"train_loss": -26.149982452392578, "global_step": 15232, "epoch": 125} {"train_loss": -26.188451766967773, "global_step": 15233, "epoch": 125} {"train_loss": -25.458465576171875, "global_step": 15234, "epoch": 125} {"train_loss": -26.038522720336914, "global_step": 15235, "epoch": 125} {"train_loss": -26.570236206054688, "global_step": 15236, "epoch": 125} {"train_loss": -25.70340919494629, "global_step": 15237, "epoch": 125} {"train_loss": -26.161090850830078, "global_step": 15238, "epoch": 125} {"train_loss": -26.049118041992188, "global_step": 15239, "epoch": 125} {"train_loss": -25.99764060974121, "global_step": 15240, "epoch": 125} {"train_loss": -26.669931411743164, "global_step": 15241, "epoch": 125} {"train_loss": -26.391326904296875, "global_step": 15242, "epoch": 125} {"train_loss": -26.098743438720703, "global_step": 15243, "epoch": 125} {"train_loss": -26.687240600585938, "global_step": 15244, "epoch": 125} {"train_loss": -26.3656281439726, "global_step": 15245, "epoch": 125, "val_loss": 2682847.25} {"train_loss": -26.733779907226562, "global_step": 15246, "epoch": 126} {"train_loss": -26.320541381835938, "global_step": 15247, "epoch": 126} {"train_loss": -26.508167266845703, "global_step": 15248, "epoch": 126} {"train_loss": -26.897958755493164, "global_step": 15249, "epoch": 126} {"train_loss": -26.695636749267578, "global_step": 15250, "epoch": 126} {"train_loss": -26.655893325805664, "global_step": 15251, "epoch": 126} {"train_loss": -27.0369873046875, "global_step": 15252, "epoch": 126} {"train_loss": -26.570148468017578, "global_step": 15253, "epoch": 126} {"train_loss": -26.99067497253418, "global_step": 15254, "epoch": 126} {"train_loss": -26.7617244720459, "global_step": 15255, "epoch": 126} {"train_loss": -27.12482261657715, "global_step": 15256, "epoch": 126} {"train_loss": -27.038923263549805, "global_step": 15257, "epoch": 126} {"train_loss": -27.156543731689453, "global_step": 15258, "epoch": 126} {"train_loss": -27.24944496154785, "global_step": 15259, "epoch": 126} {"train_loss": -26.828474044799805, "global_step": 15260, "epoch": 126} {"train_loss": -26.968908309936523, "global_step": 15261, "epoch": 126} {"train_loss": -26.885976791381836, "global_step": 15262, "epoch": 126} {"train_loss": -26.7315616607666, "global_step": 15263, "epoch": 126} {"train_loss": -27.55133056640625, "global_step": 15264, "epoch": 126} {"train_loss": -27.25661277770996, "global_step": 15265, "epoch": 126} {"train_loss": -27.2801456451416, "global_step": 15266, "epoch": 126} {"train_loss": -27.31024742126465, "global_step": 15267, "epoch": 126} {"train_loss": -26.97406578063965, "global_step": 15268, "epoch": 126} {"train_loss": -27.523752212524414, "global_step": 15269, "epoch": 126} {"train_loss": -27.429468154907227, "global_step": 15270, "epoch": 126} {"train_loss": -27.236663818359375, "global_step": 15271, "epoch": 126} {"train_loss": -26.9250545501709, "global_step": 15272, "epoch": 126} {"train_loss": -27.38189125061035, "global_step": 15273, "epoch": 126} {"train_loss": -27.04194450378418, "global_step": 15274, "epoch": 126} {"train_loss": -26.701141357421875, "global_step": 15275, "epoch": 126} {"train_loss": -27.211450576782227, "global_step": 15276, "epoch": 126} {"train_loss": -27.2451171875, "global_step": 15277, "epoch": 126} {"train_loss": -27.163604736328125, "global_step": 15278, "epoch": 126} {"train_loss": -27.498334884643555, "global_step": 15279, "epoch": 126} {"train_loss": -27.014480590820312, "global_step": 15280, "epoch": 126} {"train_loss": -26.9437313079834, "global_step": 15281, "epoch": 126} {"train_loss": -24.97163963317871, "global_step": 15282, "epoch": 126} {"train_loss": -27.271930694580078, "global_step": 15283, "epoch": 126} {"train_loss": -25.13511085510254, "global_step": 15284, "epoch": 126} {"train_loss": -26.718036651611328, "global_step": 15285, "epoch": 126} {"train_loss": -25.91200065612793, "global_step": 15286, "epoch": 126} {"train_loss": -25.110082626342773, "global_step": 15287, "epoch": 126} {"train_loss": -26.497922897338867, "global_step": 15288, "epoch": 126} {"train_loss": -26.6005859375, "global_step": 15289, "epoch": 126} {"train_loss": -26.1103515625, "global_step": 15290, "epoch": 126} {"train_loss": -27.420272827148438, "global_step": 15291, "epoch": 126} {"train_loss": -26.75079345703125, "global_step": 15292, "epoch": 126} {"train_loss": -26.920331954956055, "global_step": 15293, "epoch": 126} {"train_loss": -26.96442985534668, "global_step": 15294, "epoch": 126} {"train_loss": -27.120080947875977, "global_step": 15295, "epoch": 126} {"train_loss": -27.546701431274414, "global_step": 15296, "epoch": 126} {"train_loss": -27.321924209594727, "global_step": 15297, "epoch": 126} {"train_loss": -27.39253044128418, "global_step": 15298, "epoch": 126} {"train_loss": -27.431350708007812, "global_step": 15299, "epoch": 126} {"train_loss": -27.838720321655273, "global_step": 15300, "epoch": 126} {"train_loss": -27.31703758239746, "global_step": 15301, "epoch": 126} {"train_loss": -27.423696517944336, "global_step": 15302, "epoch": 126} {"train_loss": -27.573537826538086, "global_step": 15303, "epoch": 126} {"train_loss": -28.054718017578125, "global_step": 15304, "epoch": 126} {"train_loss": -27.864999771118164, "global_step": 15305, "epoch": 126} {"train_loss": -27.562088012695312, "global_step": 15306, "epoch": 126} {"train_loss": -27.327789306640625, "global_step": 15307, "epoch": 126} {"train_loss": -27.677839279174805, "global_step": 15308, "epoch": 126} {"train_loss": -27.054731369018555, "global_step": 15309, "epoch": 126} {"train_loss": -27.300016403198242, "global_step": 15310, "epoch": 126} {"train_loss": -27.84234046936035, "global_step": 15311, "epoch": 126} {"train_loss": -27.883987426757812, "global_step": 15312, "epoch": 126} {"train_loss": -27.648359298706055, "global_step": 15313, "epoch": 126} {"train_loss": -27.232736587524414, "global_step": 15314, "epoch": 126} {"train_loss": -27.060632705688477, "global_step": 15315, "epoch": 126} {"train_loss": -27.54741859436035, "global_step": 15316, "epoch": 126} {"train_loss": -27.6520938873291, "global_step": 15317, "epoch": 126} {"train_loss": -27.348485946655273, "global_step": 15318, "epoch": 126} {"train_loss": -26.47100257873535, "global_step": 15319, "epoch": 126} {"train_loss": -27.58984375, "global_step": 15320, "epoch": 126} {"train_loss": -27.026464462280273, "global_step": 15321, "epoch": 126} {"train_loss": -27.135740280151367, "global_step": 15322, "epoch": 126} {"train_loss": -25.467187881469727, "global_step": 15323, "epoch": 126} {"train_loss": -22.514442443847656, "global_step": 15324, "epoch": 126} {"train_loss": -18.039592742919922, "global_step": 15325, "epoch": 126} {"train_loss": -14.741836547851562, "global_step": 15326, "epoch": 126} {"train_loss": -26.375259399414062, "global_step": 15327, "epoch": 126} {"train_loss": -22.26171112060547, "global_step": 15328, "epoch": 126} {"train_loss": -26.658405303955078, "global_step": 15329, "epoch": 126} {"train_loss": -23.528467178344727, "global_step": 15330, "epoch": 126} {"train_loss": -24.01576042175293, "global_step": 15331, "epoch": 126} {"train_loss": -26.3281307220459, "global_step": 15332, "epoch": 126} {"train_loss": -24.709434509277344, "global_step": 15333, "epoch": 126} {"train_loss": -24.953937530517578, "global_step": 15334, "epoch": 126} {"train_loss": -25.623044967651367, "global_step": 15335, "epoch": 126} {"train_loss": -25.67243766784668, "global_step": 15336, "epoch": 126} {"train_loss": -25.637243270874023, "global_step": 15337, "epoch": 126} {"train_loss": -26.333450317382812, "global_step": 15338, "epoch": 126} {"train_loss": -26.6229190826416, "global_step": 15339, "epoch": 126} {"train_loss": -26.245344161987305, "global_step": 15340, "epoch": 126} {"train_loss": -26.122089385986328, "global_step": 15341, "epoch": 126} {"train_loss": -26.2518253326416, "global_step": 15342, "epoch": 126} {"train_loss": -26.316883087158203, "global_step": 15343, "epoch": 126} {"train_loss": -26.688098907470703, "global_step": 15344, "epoch": 126} {"train_loss": -26.273773193359375, "global_step": 15345, "epoch": 126} {"train_loss": -26.41534996032715, "global_step": 15346, "epoch": 126} {"train_loss": -26.9277400970459, "global_step": 15347, "epoch": 126} {"train_loss": -25.940290451049805, "global_step": 15348, "epoch": 126} {"train_loss": -26.205188751220703, "global_step": 15349, "epoch": 126} {"train_loss": -26.05732536315918, "global_step": 15350, "epoch": 126} {"train_loss": -26.081750869750977, "global_step": 15351, "epoch": 126} {"train_loss": -25.872913360595703, "global_step": 15352, "epoch": 126} {"train_loss": -26.297513961791992, "global_step": 15353, "epoch": 126} {"train_loss": -26.806238174438477, "global_step": 15354, "epoch": 126} {"train_loss": -26.463911056518555, "global_step": 15355, "epoch": 126} {"train_loss": -26.794544219970703, "global_step": 15356, "epoch": 126} {"train_loss": -26.71742057800293, "global_step": 15357, "epoch": 126} {"train_loss": -26.414636611938477, "global_step": 15358, "epoch": 126} {"train_loss": -26.844207763671875, "global_step": 15359, "epoch": 126} {"train_loss": -26.462926864624023, "global_step": 15360, "epoch": 126} {"train_loss": -27.138731002807617, "global_step": 15361, "epoch": 126} {"train_loss": -26.70564079284668, "global_step": 15362, "epoch": 126} {"train_loss": -25.750864028930664, "global_step": 15363, "epoch": 126} {"train_loss": -26.745746612548828, "global_step": 15364, "epoch": 126} {"train_loss": -27.29316520690918, "global_step": 15365, "epoch": 126} {"train_loss": -26.506526158860893, "global_step": 15366, "epoch": 126, "val_loss": 2836552.0} {"train_loss": -26.727766036987305, "global_step": 15367, "epoch": 127} {"train_loss": -27.069238662719727, "global_step": 15368, "epoch": 127} {"train_loss": -26.93039894104004, "global_step": 15369, "epoch": 127} {"train_loss": -26.810367584228516, "global_step": 15370, "epoch": 127} {"train_loss": -27.106796264648438, "global_step": 15371, "epoch": 127} {"train_loss": -27.209915161132812, "global_step": 15372, "epoch": 127} {"train_loss": -26.88392448425293, "global_step": 15373, "epoch": 127} {"train_loss": -26.9721736907959, "global_step": 15374, "epoch": 127} {"train_loss": -26.94219970703125, "global_step": 15375, "epoch": 127} {"train_loss": -27.048017501831055, "global_step": 15376, "epoch": 127} {"train_loss": -27.302717208862305, "global_step": 15377, "epoch": 127} {"train_loss": -27.4094181060791, "global_step": 15378, "epoch": 127} {"train_loss": -27.194433212280273, "global_step": 15379, "epoch": 127} {"train_loss": -27.405744552612305, "global_step": 15380, "epoch": 127} {"train_loss": -27.62405776977539, "global_step": 15381, "epoch": 127} {"train_loss": -27.118207931518555, "global_step": 15382, "epoch": 127} {"train_loss": -27.35000991821289, "global_step": 15383, "epoch": 127} {"train_loss": -27.474456787109375, "global_step": 15384, "epoch": 127} {"train_loss": -26.9074649810791, "global_step": 15385, "epoch": 127} {"train_loss": -26.98248863220215, "global_step": 15386, "epoch": 127} {"train_loss": -26.97235679626465, "global_step": 15387, "epoch": 127} {"train_loss": -26.6275577545166, "global_step": 15388, "epoch": 127} {"train_loss": -26.936071395874023, "global_step": 15389, "epoch": 127} {"train_loss": -27.096792221069336, "global_step": 15390, "epoch": 127} {"train_loss": -27.37946128845215, "global_step": 15391, "epoch": 127} {"train_loss": -27.8945255279541, "global_step": 15392, "epoch": 127} {"train_loss": -27.104211807250977, "global_step": 15393, "epoch": 127} {"train_loss": -27.426137924194336, "global_step": 15394, "epoch": 127} {"train_loss": -27.822071075439453, "global_step": 15395, "epoch": 127} {"train_loss": -27.800628662109375, "global_step": 15396, "epoch": 127} {"train_loss": -27.570356369018555, "global_step": 15397, "epoch": 127} {"train_loss": -27.434707641601562, "global_step": 15398, "epoch": 127} {"train_loss": -27.611419677734375, "global_step": 15399, "epoch": 127} {"train_loss": -28.003437042236328, "global_step": 15400, "epoch": 127} {"train_loss": -27.461261749267578, "global_step": 15401, "epoch": 127} {"train_loss": -27.975696563720703, "global_step": 15402, "epoch": 127} {"train_loss": -27.889684677124023, "global_step": 15403, "epoch": 127} {"train_loss": -28.171661376953125, "global_step": 15404, "epoch": 127} {"train_loss": -27.530200958251953, "global_step": 15405, "epoch": 127} {"train_loss": -28.260135650634766, "global_step": 15406, "epoch": 127} {"train_loss": -27.869583129882812, "global_step": 15407, "epoch": 127} {"train_loss": -28.10489845275879, "global_step": 15408, "epoch": 127} {"train_loss": -27.7549991607666, "global_step": 15409, "epoch": 127} {"train_loss": -27.46742057800293, "global_step": 15410, "epoch": 127} {"train_loss": -27.94939613342285, "global_step": 15411, "epoch": 127} {"train_loss": -27.761877059936523, "global_step": 15412, "epoch": 127} {"train_loss": -27.507726669311523, "global_step": 15413, "epoch": 127} {"train_loss": -27.632429122924805, "global_step": 15414, "epoch": 127} {"train_loss": -27.984785079956055, "global_step": 15415, "epoch": 127} {"train_loss": -27.907672882080078, "global_step": 15416, "epoch": 127} {"train_loss": -28.3075008392334, "global_step": 15417, "epoch": 127} {"train_loss": -27.262067794799805, "global_step": 15418, "epoch": 127} {"train_loss": -27.90349769592285, "global_step": 15419, "epoch": 127} {"train_loss": -27.759775161743164, "global_step": 15420, "epoch": 127} {"train_loss": -27.77186393737793, "global_step": 15421, "epoch": 127} {"train_loss": -27.816547393798828, "global_step": 15422, "epoch": 127} {"train_loss": -28.280908584594727, "global_step": 15423, "epoch": 127} {"train_loss": -27.46966552734375, "global_step": 15424, "epoch": 127} {"train_loss": -26.936847686767578, "global_step": 15425, "epoch": 127} {"train_loss": -28.538660049438477, "global_step": 15426, "epoch": 127} {"train_loss": -27.970056533813477, "global_step": 15427, "epoch": 127} {"train_loss": -28.0157470703125, "global_step": 15428, "epoch": 127} {"train_loss": -27.47562599182129, "global_step": 15429, "epoch": 127} {"train_loss": -28.138568878173828, "global_step": 15430, "epoch": 127} {"train_loss": -28.380130767822266, "global_step": 15431, "epoch": 127} {"train_loss": -28.011564254760742, "global_step": 15432, "epoch": 127} {"train_loss": -28.288747787475586, "global_step": 15433, "epoch": 127} {"train_loss": -28.542295455932617, "global_step": 15434, "epoch": 127} {"train_loss": -28.495054244995117, "global_step": 15435, "epoch": 127} {"train_loss": -27.91570472717285, "global_step": 15436, "epoch": 127} {"train_loss": -28.374780654907227, "global_step": 15437, "epoch": 127} {"train_loss": -28.734655380249023, "global_step": 15438, "epoch": 127} {"train_loss": -28.379535675048828, "global_step": 15439, "epoch": 127} {"train_loss": -28.461332321166992, "global_step": 15440, "epoch": 127} {"train_loss": -28.658361434936523, "global_step": 15441, "epoch": 127} {"train_loss": -28.589147567749023, "global_step": 15442, "epoch": 127} {"train_loss": -28.474029541015625, "global_step": 15443, "epoch": 127} {"train_loss": -28.860822677612305, "global_step": 15444, "epoch": 127} {"train_loss": -28.61141014099121, "global_step": 15445, "epoch": 127} {"train_loss": -28.51386070251465, "global_step": 15446, "epoch": 127} {"train_loss": -28.671667098999023, "global_step": 15447, "epoch": 127} {"train_loss": -28.555816650390625, "global_step": 15448, "epoch": 127} {"train_loss": -28.97821617126465, "global_step": 15449, "epoch": 127} {"train_loss": -28.997838973999023, "global_step": 15450, "epoch": 127} {"train_loss": -28.80938720703125, "global_step": 15451, "epoch": 127} {"train_loss": -28.93646240234375, "global_step": 15452, "epoch": 127} {"train_loss": -28.200056076049805, "global_step": 15453, "epoch": 127} {"train_loss": -25.95355796813965, "global_step": 15454, "epoch": 127} {"train_loss": -23.053985595703125, "global_step": 15455, "epoch": 127} {"train_loss": -19.018192291259766, "global_step": 15456, "epoch": 127} {"train_loss": -16.464120864868164, "global_step": 15457, "epoch": 127} {"train_loss": -20.330846786499023, "global_step": 15458, "epoch": 127} {"train_loss": -22.70783042907715, "global_step": 15459, "epoch": 127} {"train_loss": -23.691267013549805, "global_step": 15460, "epoch": 127} {"train_loss": -26.607746124267578, "global_step": 15461, "epoch": 127} {"train_loss": -24.43862533569336, "global_step": 15462, "epoch": 127} {"train_loss": -26.458541870117188, "global_step": 15463, "epoch": 127} {"train_loss": -26.346723556518555, "global_step": 15464, "epoch": 127} {"train_loss": -26.18098258972168, "global_step": 15465, "epoch": 127} {"train_loss": -26.737293243408203, "global_step": 15466, "epoch": 127} {"train_loss": -26.53203773498535, "global_step": 15467, "epoch": 127} {"train_loss": -26.340978622436523, "global_step": 15468, "epoch": 127} {"train_loss": -27.131576538085938, "global_step": 15469, "epoch": 127} {"train_loss": -26.775846481323242, "global_step": 15470, "epoch": 127} {"train_loss": -26.989648818969727, "global_step": 15471, "epoch": 127} {"train_loss": -27.351789474487305, "global_step": 15472, "epoch": 127} {"train_loss": -27.353357315063477, "global_step": 15473, "epoch": 127} {"train_loss": -27.427555084228516, "global_step": 15474, "epoch": 127} {"train_loss": -27.02668571472168, "global_step": 15475, "epoch": 127} {"train_loss": -27.23333168029785, "global_step": 15476, "epoch": 127} {"train_loss": -27.434743881225586, "global_step": 15477, "epoch": 127} {"train_loss": -27.48870277404785, "global_step": 15478, "epoch": 127} {"train_loss": -26.851057052612305, "global_step": 15479, "epoch": 127} {"train_loss": -27.514850616455078, "global_step": 15480, "epoch": 127} {"train_loss": -27.7063045501709, "global_step": 15481, "epoch": 127} {"train_loss": -27.222448348999023, "global_step": 15482, "epoch": 127} {"train_loss": -27.786762237548828, "global_step": 15483, "epoch": 127} {"train_loss": -27.5568790435791, "global_step": 15484, "epoch": 127} {"train_loss": -27.724750518798828, "global_step": 15485, "epoch": 127} {"train_loss": -27.81214714050293, "global_step": 15486, "epoch": 127} {"train_loss": -27.259148038123264, "global_step": 15487, "epoch": 127, "val_loss": 2713290.0} {"train_loss": -27.704608917236328, "global_step": 15488, "epoch": 128} {"train_loss": -27.611093521118164, "global_step": 15489, "epoch": 128} {"train_loss": -27.694379806518555, "global_step": 15490, "epoch": 128} {"train_loss": -27.75592041015625, "global_step": 15491, "epoch": 128} {"train_loss": -27.654621124267578, "global_step": 15492, "epoch": 128} {"train_loss": -27.921239852905273, "global_step": 15493, "epoch": 128} {"train_loss": -27.936140060424805, "global_step": 15494, "epoch": 128} {"train_loss": -27.405675888061523, "global_step": 15495, "epoch": 128} {"train_loss": -28.024036407470703, "global_step": 15496, "epoch": 128} {"train_loss": -28.004430770874023, "global_step": 15497, "epoch": 128} {"train_loss": -27.304916381835938, "global_step": 15498, "epoch": 128} {"train_loss": -27.83926773071289, "global_step": 15499, "epoch": 128} {"train_loss": -27.77606201171875, "global_step": 15500, "epoch": 128} {"train_loss": -27.790557861328125, "global_step": 15501, "epoch": 128} {"train_loss": -28.004302978515625, "global_step": 15502, "epoch": 128} {"train_loss": -28.028522491455078, "global_step": 15503, "epoch": 128} {"train_loss": -27.443359375, "global_step": 15504, "epoch": 128} {"train_loss": -27.781278610229492, "global_step": 15505, "epoch": 128} {"train_loss": -27.913898468017578, "global_step": 15506, "epoch": 128} {"train_loss": -27.70842933654785, "global_step": 15507, "epoch": 128} {"train_loss": -28.019866943359375, "global_step": 15508, "epoch": 128} {"train_loss": -27.98196792602539, "global_step": 15509, "epoch": 128} {"train_loss": -27.284143447875977, "global_step": 15510, "epoch": 128} {"train_loss": -27.374414443969727, "global_step": 15511, "epoch": 128} {"train_loss": -26.951129913330078, "global_step": 15512, "epoch": 128} {"train_loss": -27.400592803955078, "global_step": 15513, "epoch": 128} {"train_loss": -26.209142684936523, "global_step": 15514, "epoch": 128} {"train_loss": -27.22902488708496, "global_step": 15515, "epoch": 128} {"train_loss": -26.614166259765625, "global_step": 15516, "epoch": 128} {"train_loss": -27.687986373901367, "global_step": 15517, "epoch": 128} {"train_loss": -27.426740646362305, "global_step": 15518, "epoch": 128} {"train_loss": -27.360260009765625, "global_step": 15519, "epoch": 128} {"train_loss": -27.63892936706543, "global_step": 15520, "epoch": 128} {"train_loss": -27.675460815429688, "global_step": 15521, "epoch": 128} {"train_loss": -27.51658058166504, "global_step": 15522, "epoch": 128} {"train_loss": -27.7847900390625, "global_step": 15523, "epoch": 128} {"train_loss": -28.26069450378418, "global_step": 15524, "epoch": 128} {"train_loss": -27.93330955505371, "global_step": 15525, "epoch": 128} {"train_loss": -27.791259765625, "global_step": 15526, "epoch": 128} {"train_loss": -27.36527442932129, "global_step": 15527, "epoch": 128} {"train_loss": -28.191953659057617, "global_step": 15528, "epoch": 128} {"train_loss": -28.364978790283203, "global_step": 15529, "epoch": 128} {"train_loss": -27.765729904174805, "global_step": 15530, "epoch": 128} {"train_loss": -27.944202423095703, "global_step": 15531, "epoch": 128} {"train_loss": -28.346704483032227, "global_step": 15532, "epoch": 128} {"train_loss": -28.28386878967285, "global_step": 15533, "epoch": 128} {"train_loss": -27.995824813842773, "global_step": 15534, "epoch": 128} {"train_loss": -28.312997817993164, "global_step": 15535, "epoch": 128} {"train_loss": -27.948102951049805, "global_step": 15536, "epoch": 128} {"train_loss": -28.204370498657227, "global_step": 15537, "epoch": 128} {"train_loss": -28.23369789123535, "global_step": 15538, "epoch": 128} {"train_loss": -28.7337703704834, "global_step": 15539, "epoch": 128} {"train_loss": -28.2432804107666, "global_step": 15540, "epoch": 128} {"train_loss": -28.262052536010742, "global_step": 15541, "epoch": 128} {"train_loss": -28.197492599487305, "global_step": 15542, "epoch": 128} {"train_loss": -27.626874923706055, "global_step": 15543, "epoch": 128} {"train_loss": -27.88557243347168, "global_step": 15544, "epoch": 128} {"train_loss": -28.255033493041992, "global_step": 15545, "epoch": 128} {"train_loss": -27.136381149291992, "global_step": 15546, "epoch": 128} {"train_loss": -26.89971923828125, "global_step": 15547, "epoch": 128} {"train_loss": -27.726896286010742, "global_step": 15548, "epoch": 128} {"train_loss": -27.798803329467773, "global_step": 15549, "epoch": 128} {"train_loss": -27.3961124420166, "global_step": 15550, "epoch": 128} {"train_loss": -27.9420108795166, "global_step": 15551, "epoch": 128} {"train_loss": -27.785175323486328, "global_step": 15552, "epoch": 128} {"train_loss": -27.743738174438477, "global_step": 15553, "epoch": 128} {"train_loss": -27.56879234313965, "global_step": 15554, "epoch": 128} {"train_loss": -27.754133224487305, "global_step": 15555, "epoch": 128} {"train_loss": -27.9575252532959, "global_step": 15556, "epoch": 128} {"train_loss": -27.96161460876465, "global_step": 15557, "epoch": 128} {"train_loss": -28.247140884399414, "global_step": 15558, "epoch": 128} {"train_loss": -28.191640853881836, "global_step": 15559, "epoch": 128} {"train_loss": -27.801254272460938, "global_step": 15560, "epoch": 128} {"train_loss": -27.76068687438965, "global_step": 15561, "epoch": 128} {"train_loss": -28.379724502563477, "global_step": 15562, "epoch": 128} {"train_loss": -28.039167404174805, "global_step": 15563, "epoch": 128} {"train_loss": -27.862064361572266, "global_step": 15564, "epoch": 128} {"train_loss": -28.159337997436523, "global_step": 15565, "epoch": 128} {"train_loss": -27.822797775268555, "global_step": 15566, "epoch": 128} {"train_loss": -28.512475967407227, "global_step": 15567, "epoch": 128} {"train_loss": -28.002410888671875, "global_step": 15568, "epoch": 128} {"train_loss": -28.07575798034668, "global_step": 15569, "epoch": 128} {"train_loss": -28.031171798706055, "global_step": 15570, "epoch": 128} {"train_loss": -28.514820098876953, "global_step": 15571, "epoch": 128} {"train_loss": -28.45379066467285, "global_step": 15572, "epoch": 128} {"train_loss": -28.124502182006836, "global_step": 15573, "epoch": 128} {"train_loss": -28.611804962158203, "global_step": 15574, "epoch": 128} {"train_loss": -28.567626953125, "global_step": 15575, "epoch": 128} {"train_loss": -27.99458122253418, "global_step": 15576, "epoch": 128} {"train_loss": -28.802631378173828, "global_step": 15577, "epoch": 128} {"train_loss": -28.499799728393555, "global_step": 15578, "epoch": 128} {"train_loss": -28.544767379760742, "global_step": 15579, "epoch": 128} {"train_loss": -28.48335075378418, "global_step": 15580, "epoch": 128} {"train_loss": -28.20020866394043, "global_step": 15581, "epoch": 128} {"train_loss": -28.486251831054688, "global_step": 15582, "epoch": 128} {"train_loss": -28.12521743774414, "global_step": 15583, "epoch": 128} {"train_loss": -26.58112144470215, "global_step": 15584, "epoch": 128} {"train_loss": -26.232574462890625, "global_step": 15585, "epoch": 128} {"train_loss": -24.25300407409668, "global_step": 15586, "epoch": 128} {"train_loss": -22.104618072509766, "global_step": 15587, "epoch": 128} {"train_loss": -19.53887176513672, "global_step": 15588, "epoch": 128} {"train_loss": -25.514507293701172, "global_step": 15589, "epoch": 128} {"train_loss": -25.59545135498047, "global_step": 15590, "epoch": 128} {"train_loss": -24.850378036499023, "global_step": 15591, "epoch": 128} {"train_loss": -25.524150848388672, "global_step": 15592, "epoch": 128} {"train_loss": -26.09159278869629, "global_step": 15593, "epoch": 128} {"train_loss": -26.972131729125977, "global_step": 15594, "epoch": 128} {"train_loss": -26.949399948120117, "global_step": 15595, "epoch": 128} {"train_loss": -26.2056884765625, "global_step": 15596, "epoch": 128} {"train_loss": -27.967269897460938, "global_step": 15597, "epoch": 128} {"train_loss": -26.540082931518555, "global_step": 15598, "epoch": 128} {"train_loss": -27.143787384033203, "global_step": 15599, "epoch": 128} {"train_loss": -27.55742835998535, "global_step": 15600, "epoch": 128} {"train_loss": -26.90690040588379, "global_step": 15601, "epoch": 128} {"train_loss": -27.478214263916016, "global_step": 15602, "epoch": 128} {"train_loss": -27.466312408447266, "global_step": 15603, "epoch": 128} {"train_loss": -27.700611114501953, "global_step": 15604, "epoch": 128} {"train_loss": -27.397138595581055, "global_step": 15605, "epoch": 128} {"train_loss": -27.627090454101562, "global_step": 15606, "epoch": 128} {"train_loss": -27.969913482666016, "global_step": 15607, "epoch": 128} {"train_loss": -27.5488341150205, "global_step": 15608, "epoch": 128, "val_loss": 2575113.75} {"train_loss": -27.699365615844727, "global_step": 15609, "epoch": 129} {"train_loss": -27.9497127532959, "global_step": 15610, "epoch": 129} {"train_loss": -27.755401611328125, "global_step": 15611, "epoch": 129} {"train_loss": -28.2121524810791, "global_step": 15612, "epoch": 129} {"train_loss": -27.841577529907227, "global_step": 15613, "epoch": 129} {"train_loss": -27.91718101501465, "global_step": 15614, "epoch": 129} {"train_loss": -28.3736572265625, "global_step": 15615, "epoch": 129} {"train_loss": -28.10352897644043, "global_step": 15616, "epoch": 129} {"train_loss": -28.3807373046875, "global_step": 15617, "epoch": 129} {"train_loss": -28.415237426757812, "global_step": 15618, "epoch": 129} {"train_loss": -28.032934188842773, "global_step": 15619, "epoch": 129} {"train_loss": -28.11919593811035, "global_step": 15620, "epoch": 129} {"train_loss": -27.975656509399414, "global_step": 15621, "epoch": 129} {"train_loss": -27.14862632751465, "global_step": 15622, "epoch": 129} {"train_loss": -27.788583755493164, "global_step": 15623, "epoch": 129} {"train_loss": -23.036497116088867, "global_step": 15624, "epoch": 129} {"train_loss": 0.2560291290283203, "global_step": 15625, "epoch": 129} {"train_loss": 1.038661241531372, "global_step": 15626, "epoch": 129} {"train_loss": -21.6093692779541, "global_step": 15627, "epoch": 129} {"train_loss": -23.570127487182617, "global_step": 15628, "epoch": 129} {"train_loss": -21.71211051940918, "global_step": 15629, "epoch": 129} {"train_loss": -18.707012176513672, "global_step": 15630, "epoch": 129} {"train_loss": -25.719135284423828, "global_step": 15631, "epoch": 129} {"train_loss": -25.48101806640625, "global_step": 15632, "epoch": 129} {"train_loss": -26.010557174682617, "global_step": 15633, "epoch": 129} {"train_loss": -24.11082649230957, "global_step": 15634, "epoch": 129} {"train_loss": -25.576068878173828, "global_step": 15635, "epoch": 129} {"train_loss": -24.037878036499023, "global_step": 15636, "epoch": 129} {"train_loss": -25.010902404785156, "global_step": 15637, "epoch": 129} {"train_loss": -25.513172149658203, "global_step": 15638, "epoch": 129} {"train_loss": -26.368261337280273, "global_step": 15639, "epoch": 129} {"train_loss": -25.832937240600586, "global_step": 15640, "epoch": 129} {"train_loss": -26.569345474243164, "global_step": 15641, "epoch": 129} {"train_loss": -26.171955108642578, "global_step": 15642, "epoch": 129} {"train_loss": -26.341796875, "global_step": 15643, "epoch": 129} {"train_loss": -26.77857780456543, "global_step": 15644, "epoch": 129} {"train_loss": -26.06987953186035, "global_step": 15645, "epoch": 129} {"train_loss": -26.848163604736328, "global_step": 15646, "epoch": 129} {"train_loss": -26.8381404876709, "global_step": 15647, "epoch": 129} {"train_loss": -26.85853385925293, "global_step": 15648, "epoch": 129} {"train_loss": -26.4376163482666, "global_step": 15649, "epoch": 129} {"train_loss": -26.483022689819336, "global_step": 15650, "epoch": 129} {"train_loss": -26.900842666625977, "global_step": 15651, "epoch": 129} {"train_loss": -26.62912940979004, "global_step": 15652, "epoch": 129} {"train_loss": -26.615802764892578, "global_step": 15653, "epoch": 129} {"train_loss": -26.849477767944336, "global_step": 15654, "epoch": 129} {"train_loss": -26.970163345336914, "global_step": 15655, "epoch": 129} {"train_loss": -27.36471939086914, "global_step": 15656, "epoch": 129} {"train_loss": -27.20416831970215, "global_step": 15657, "epoch": 129} {"train_loss": -27.187856674194336, "global_step": 15658, "epoch": 129} {"train_loss": -27.40280532836914, "global_step": 15659, "epoch": 129} {"train_loss": -27.23008155822754, "global_step": 15660, "epoch": 129} {"train_loss": -27.37738609313965, "global_step": 15661, "epoch": 129} {"train_loss": -27.524885177612305, "global_step": 15662, "epoch": 129} {"train_loss": -27.594533920288086, "global_step": 15663, "epoch": 129} {"train_loss": -27.576642990112305, "global_step": 15664, "epoch": 129} {"train_loss": -28.068740844726562, "global_step": 15665, "epoch": 129} {"train_loss": -27.656665802001953, "global_step": 15666, "epoch": 129} {"train_loss": -27.44548988342285, "global_step": 15667, "epoch": 129} {"train_loss": -28.184101104736328, "global_step": 15668, "epoch": 129} {"train_loss": -27.342670440673828, "global_step": 15669, "epoch": 129} {"train_loss": -28.007837295532227, "global_step": 15670, "epoch": 129} {"train_loss": -28.172300338745117, "global_step": 15671, "epoch": 129} {"train_loss": -27.78925132751465, "global_step": 15672, "epoch": 129} {"train_loss": -28.407629013061523, "global_step": 15673, "epoch": 129} {"train_loss": -27.913793563842773, "global_step": 15674, "epoch": 129} {"train_loss": -28.3109073638916, "global_step": 15675, "epoch": 129} {"train_loss": -28.082218170166016, "global_step": 15676, "epoch": 129} {"train_loss": -28.508108139038086, "global_step": 15677, "epoch": 129} {"train_loss": -27.71889305114746, "global_step": 15678, "epoch": 129} {"train_loss": -28.06587791442871, "global_step": 15679, "epoch": 129} {"train_loss": -27.283100128173828, "global_step": 15680, "epoch": 129} {"train_loss": -27.5970401763916, "global_step": 15681, "epoch": 129} {"train_loss": -27.93922233581543, "global_step": 15682, "epoch": 129} {"train_loss": -28.254657745361328, "global_step": 15683, "epoch": 129} {"train_loss": -27.75848388671875, "global_step": 15684, "epoch": 129} {"train_loss": -27.981861114501953, "global_step": 15685, "epoch": 129} {"train_loss": -28.112085342407227, "global_step": 15686, "epoch": 129} {"train_loss": -27.9390926361084, "global_step": 15687, "epoch": 129} {"train_loss": -27.787790298461914, "global_step": 15688, "epoch": 129} {"train_loss": -27.90771484375, "global_step": 15689, "epoch": 129} {"train_loss": -27.664947509765625, "global_step": 15690, "epoch": 129} {"train_loss": -27.606313705444336, "global_step": 15691, "epoch": 129} {"train_loss": -27.61042594909668, "global_step": 15692, "epoch": 129} {"train_loss": -27.9769344329834, "global_step": 15693, "epoch": 129} {"train_loss": -27.742368698120117, "global_step": 15694, "epoch": 129} {"train_loss": -28.1337833404541, "global_step": 15695, "epoch": 129} {"train_loss": -28.013355255126953, "global_step": 15696, "epoch": 129} {"train_loss": -27.753149032592773, "global_step": 15697, "epoch": 129} {"train_loss": -28.642303466796875, "global_step": 15698, "epoch": 129} {"train_loss": -27.972553253173828, "global_step": 15699, "epoch": 129} {"train_loss": -28.07533073425293, "global_step": 15700, "epoch": 129} {"train_loss": -27.94951820373535, "global_step": 15701, "epoch": 129} {"train_loss": -28.09382438659668, "global_step": 15702, "epoch": 129} {"train_loss": -27.972702026367188, "global_step": 15703, "epoch": 129} {"train_loss": -28.3848819732666, "global_step": 15704, "epoch": 129} {"train_loss": -27.94305992126465, "global_step": 15705, "epoch": 129} {"train_loss": -28.07560157775879, "global_step": 15706, "epoch": 129} {"train_loss": -27.744592666625977, "global_step": 15707, "epoch": 129} {"train_loss": -28.03668785095215, "global_step": 15708, "epoch": 129} {"train_loss": -26.80231285095215, "global_step": 15709, "epoch": 129} {"train_loss": -22.9473934173584, "global_step": 15710, "epoch": 129} {"train_loss": -13.942886352539062, "global_step": 15711, "epoch": 129} {"train_loss": -15.306792259216309, "global_step": 15712, "epoch": 129} {"train_loss": -26.287033081054688, "global_step": 15713, "epoch": 129} {"train_loss": -20.314916610717773, "global_step": 15714, "epoch": 129} {"train_loss": -26.314773559570312, "global_step": 15715, "epoch": 129} {"train_loss": -24.502012252807617, "global_step": 15716, "epoch": 129} {"train_loss": -25.084768295288086, "global_step": 15717, "epoch": 129} {"train_loss": -26.64300537109375, "global_step": 15718, "epoch": 129} {"train_loss": -26.261463165283203, "global_step": 15719, "epoch": 129} {"train_loss": -25.528940200805664, "global_step": 15720, "epoch": 129} {"train_loss": -26.832639694213867, "global_step": 15721, "epoch": 129} {"train_loss": -26.9107608795166, "global_step": 15722, "epoch": 129} {"train_loss": -26.8259334564209, "global_step": 15723, "epoch": 129} {"train_loss": -26.53580093383789, "global_step": 15724, "epoch": 129} {"train_loss": -26.79680824279785, "global_step": 15725, "epoch": 129} {"train_loss": -26.164337158203125, "global_step": 15726, "epoch": 129} {"train_loss": -27.168546676635742, "global_step": 15727, "epoch": 129} {"train_loss": -26.6466007232666, "global_step": 15728, "epoch": 129} {"train_loss": -26.254847422119013, "global_step": 15729, "epoch": 129, "val_loss": 2685873.0} {"train_loss": -26.62737464904785, "global_step": 15730, "epoch": 130} {"train_loss": -27.050994873046875, "global_step": 15731, "epoch": 130} {"train_loss": -26.360126495361328, "global_step": 15732, "epoch": 130} {"train_loss": -26.49176025390625, "global_step": 15733, "epoch": 130} {"train_loss": -25.972082138061523, "global_step": 15734, "epoch": 130} {"train_loss": -25.493070602416992, "global_step": 15735, "epoch": 130} {"train_loss": -27.09326171875, "global_step": 15736, "epoch": 130} {"train_loss": -25.349227905273438, "global_step": 15737, "epoch": 130} {"train_loss": -26.90445899963379, "global_step": 15738, "epoch": 130} {"train_loss": -25.36629295349121, "global_step": 15739, "epoch": 130} {"train_loss": -26.866125106811523, "global_step": 15740, "epoch": 130} {"train_loss": -25.834043502807617, "global_step": 15741, "epoch": 130} {"train_loss": -26.8348331451416, "global_step": 15742, "epoch": 130} {"train_loss": -27.14154624938965, "global_step": 15743, "epoch": 130} {"train_loss": -26.178024291992188, "global_step": 15744, "epoch": 130} {"train_loss": -27.38018798828125, "global_step": 15745, "epoch": 130} {"train_loss": -27.156036376953125, "global_step": 15746, "epoch": 130} {"train_loss": -27.047595977783203, "global_step": 15747, "epoch": 130} {"train_loss": -27.083267211914062, "global_step": 15748, "epoch": 130} {"train_loss": -27.000890731811523, "global_step": 15749, "epoch": 130} {"train_loss": -27.035511016845703, "global_step": 15750, "epoch": 130} {"train_loss": -27.241674423217773, "global_step": 15751, "epoch": 130} {"train_loss": -26.9493465423584, "global_step": 15752, "epoch": 130} {"train_loss": -27.440784454345703, "global_step": 15753, "epoch": 130} {"train_loss": -27.08428382873535, "global_step": 15754, "epoch": 130} {"train_loss": -26.94447898864746, "global_step": 15755, "epoch": 130} {"train_loss": -27.35346031188965, "global_step": 15756, "epoch": 130} {"train_loss": -27.012903213500977, "global_step": 15757, "epoch": 130} {"train_loss": -26.96478843688965, "global_step": 15758, "epoch": 130} {"train_loss": -26.175628662109375, "global_step": 15759, "epoch": 130} {"train_loss": -25.491851806640625, "global_step": 15760, "epoch": 130} {"train_loss": -25.872358322143555, "global_step": 15761, "epoch": 130} {"train_loss": -26.84954261779785, "global_step": 15762, "epoch": 130} {"train_loss": -27.407934188842773, "global_step": 15763, "epoch": 130} {"train_loss": -26.82074546813965, "global_step": 15764, "epoch": 130} {"train_loss": -27.2706241607666, "global_step": 15765, "epoch": 130} {"train_loss": -27.58906364440918, "global_step": 15766, "epoch": 130} {"train_loss": -26.206933975219727, "global_step": 15767, "epoch": 130} {"train_loss": -27.37898063659668, "global_step": 15768, "epoch": 130} {"train_loss": -27.08045768737793, "global_step": 15769, "epoch": 130} {"train_loss": -27.334808349609375, "global_step": 15770, "epoch": 130} {"train_loss": -27.154748916625977, "global_step": 15771, "epoch": 130} {"train_loss": -27.892520904541016, "global_step": 15772, "epoch": 130} {"train_loss": -27.3321475982666, "global_step": 15773, "epoch": 130} {"train_loss": -27.740249633789062, "global_step": 15774, "epoch": 130} {"train_loss": -27.508420944213867, "global_step": 15775, "epoch": 130} {"train_loss": -27.309690475463867, "global_step": 15776, "epoch": 130} {"train_loss": -27.222171783447266, "global_step": 15777, "epoch": 130} {"train_loss": -27.329151153564453, "global_step": 15778, "epoch": 130} {"train_loss": -27.259931564331055, "global_step": 15779, "epoch": 130} {"train_loss": -26.22197914123535, "global_step": 15780, "epoch": 130} {"train_loss": -25.8989200592041, "global_step": 15781, "epoch": 130} {"train_loss": -26.369348526000977, "global_step": 15782, "epoch": 130} {"train_loss": -26.980566024780273, "global_step": 15783, "epoch": 130} {"train_loss": -27.844099044799805, "global_step": 15784, "epoch": 130} {"train_loss": -27.25050163269043, "global_step": 15785, "epoch": 130} {"train_loss": -26.066328048706055, "global_step": 15786, "epoch": 130} {"train_loss": -25.959135055541992, "global_step": 15787, "epoch": 130} {"train_loss": -27.44658851623535, "global_step": 15788, "epoch": 130} {"train_loss": -27.444076538085938, "global_step": 15789, "epoch": 130} {"train_loss": -25.012062072753906, "global_step": 15790, "epoch": 130} {"train_loss": -25.539974212646484, "global_step": 15791, "epoch": 130} {"train_loss": -27.54082679748535, "global_step": 15792, "epoch": 130} {"train_loss": -26.534915924072266, "global_step": 15793, "epoch": 130} {"train_loss": -27.290008544921875, "global_step": 15794, "epoch": 130} {"train_loss": -26.454904556274414, "global_step": 15795, "epoch": 130} {"train_loss": -26.57674217224121, "global_step": 15796, "epoch": 130} {"train_loss": -27.321048736572266, "global_step": 15797, "epoch": 130} {"train_loss": -26.987579345703125, "global_step": 15798, "epoch": 130} {"train_loss": -27.120624542236328, "global_step": 15799, "epoch": 130} {"train_loss": -27.377920150756836, "global_step": 15800, "epoch": 130} {"train_loss": -27.728479385375977, "global_step": 15801, "epoch": 130} {"train_loss": -27.290882110595703, "global_step": 15802, "epoch": 130} {"train_loss": -27.492528915405273, "global_step": 15803, "epoch": 130} {"train_loss": -27.05025291442871, "global_step": 15804, "epoch": 130} {"train_loss": -27.781946182250977, "global_step": 15805, "epoch": 130} {"train_loss": -27.481725692749023, "global_step": 15806, "epoch": 130} {"train_loss": -27.557769775390625, "global_step": 15807, "epoch": 130} {"train_loss": -27.836252212524414, "global_step": 15808, "epoch": 130} {"train_loss": -27.614347457885742, "global_step": 15809, "epoch": 130} {"train_loss": -27.747943878173828, "global_step": 15810, "epoch": 130} {"train_loss": -27.989959716796875, "global_step": 15811, "epoch": 130} {"train_loss": -27.864398956298828, "global_step": 15812, "epoch": 130} {"train_loss": -28.066608428955078, "global_step": 15813, "epoch": 130} {"train_loss": -27.71259117126465, "global_step": 15814, "epoch": 130} {"train_loss": -28.0096492767334, "global_step": 15815, "epoch": 130} {"train_loss": -27.1779842376709, "global_step": 15816, "epoch": 130} {"train_loss": -27.8687744140625, "global_step": 15817, "epoch": 130} {"train_loss": -27.982507705688477, "global_step": 15818, "epoch": 130} {"train_loss": -28.17620849609375, "global_step": 15819, "epoch": 130} {"train_loss": -28.39019203186035, "global_step": 15820, "epoch": 130} {"train_loss": -28.055408477783203, "global_step": 15821, "epoch": 130} {"train_loss": -28.03983497619629, "global_step": 15822, "epoch": 130} {"train_loss": -28.154157638549805, "global_step": 15823, "epoch": 130} {"train_loss": -28.263830184936523, "global_step": 15824, "epoch": 130} {"train_loss": -28.172025680541992, "global_step": 15825, "epoch": 130} {"train_loss": -27.7857723236084, "global_step": 15826, "epoch": 130} {"train_loss": -26.791784286499023, "global_step": 15827, "epoch": 130} {"train_loss": -26.293378829956055, "global_step": 15828, "epoch": 130} {"train_loss": -24.769529342651367, "global_step": 15829, "epoch": 130} {"train_loss": -21.590286254882812, "global_step": 15830, "epoch": 130} {"train_loss": -22.438608169555664, "global_step": 15831, "epoch": 130} {"train_loss": -27.386083602905273, "global_step": 15832, "epoch": 130} {"train_loss": -26.31348991394043, "global_step": 15833, "epoch": 130} {"train_loss": -25.428930282592773, "global_step": 15834, "epoch": 130} {"train_loss": -28.130664825439453, "global_step": 15835, "epoch": 130} {"train_loss": -26.532392501831055, "global_step": 15836, "epoch": 130} {"train_loss": -27.40513038635254, "global_step": 15837, "epoch": 130} {"train_loss": -27.363788604736328, "global_step": 15838, "epoch": 130} {"train_loss": -27.694257736206055, "global_step": 15839, "epoch": 130} {"train_loss": -27.65667152404785, "global_step": 15840, "epoch": 130} {"train_loss": -26.778202056884766, "global_step": 15841, "epoch": 130} {"train_loss": -27.950414657592773, "global_step": 15842, "epoch": 130} {"train_loss": -26.960779190063477, "global_step": 15843, "epoch": 130} {"train_loss": -27.154621124267578, "global_step": 15844, "epoch": 130} {"train_loss": -27.71759033203125, "global_step": 15845, "epoch": 130} {"train_loss": -27.90968132019043, "global_step": 15846, "epoch": 130} {"train_loss": -26.99603271484375, "global_step": 15847, "epoch": 130} {"train_loss": -27.387365341186523, "global_step": 15848, "epoch": 130} {"train_loss": -28.045454025268555, "global_step": 15849, "epoch": 130} {"train_loss": -27.002727303623168, "global_step": 15850, "epoch": 130, "val_loss": 2681113.0} {"train_loss": -27.447265625, "global_step": 15851, "epoch": 131} {"train_loss": -27.951208114624023, "global_step": 15852, "epoch": 131} {"train_loss": -27.233154296875, "global_step": 15853, "epoch": 131} {"train_loss": -27.297473907470703, "global_step": 15854, "epoch": 131} {"train_loss": -27.68210220336914, "global_step": 15855, "epoch": 131} {"train_loss": -28.11814308166504, "global_step": 15856, "epoch": 131} {"train_loss": -27.608251571655273, "global_step": 15857, "epoch": 131} {"train_loss": -28.1204891204834, "global_step": 15858, "epoch": 131} {"train_loss": -28.106159210205078, "global_step": 15859, "epoch": 131} {"train_loss": -28.103607177734375, "global_step": 15860, "epoch": 131} {"train_loss": -27.8612060546875, "global_step": 15861, "epoch": 131} {"train_loss": -28.295654296875, "global_step": 15862, "epoch": 131} {"train_loss": -28.16670036315918, "global_step": 15863, "epoch": 131} {"train_loss": -27.979124069213867, "global_step": 15864, "epoch": 131} {"train_loss": -28.5052547454834, "global_step": 15865, "epoch": 131} {"train_loss": -27.678876876831055, "global_step": 15866, "epoch": 131} {"train_loss": -27.849584579467773, "global_step": 15867, "epoch": 131} {"train_loss": -27.645450592041016, "global_step": 15868, "epoch": 131} {"train_loss": -27.966999053955078, "global_step": 15869, "epoch": 131} {"train_loss": -28.01336097717285, "global_step": 15870, "epoch": 131} {"train_loss": -28.149982452392578, "global_step": 15871, "epoch": 131} {"train_loss": -27.803388595581055, "global_step": 15872, "epoch": 131} {"train_loss": -28.28521156311035, "global_step": 15873, "epoch": 131} {"train_loss": -28.41766929626465, "global_step": 15874, "epoch": 131} {"train_loss": -27.936878204345703, "global_step": 15875, "epoch": 131} {"train_loss": -28.039335250854492, "global_step": 15876, "epoch": 131} {"train_loss": -28.300983428955078, "global_step": 15877, "epoch": 131} {"train_loss": -28.311254501342773, "global_step": 15878, "epoch": 131} {"train_loss": -27.987476348876953, "global_step": 15879, "epoch": 131} {"train_loss": -28.156766891479492, "global_step": 15880, "epoch": 131} {"train_loss": -28.1987361907959, "global_step": 15881, "epoch": 131} {"train_loss": -28.212987899780273, "global_step": 15882, "epoch": 131} {"train_loss": -27.850177764892578, "global_step": 15883, "epoch": 131} {"train_loss": -27.89973258972168, "global_step": 15884, "epoch": 131} {"train_loss": -28.2198543548584, "global_step": 15885, "epoch": 131} {"train_loss": -27.15730857849121, "global_step": 15886, "epoch": 131} {"train_loss": -28.258825302124023, "global_step": 15887, "epoch": 131} {"train_loss": -27.312158584594727, "global_step": 15888, "epoch": 131} {"train_loss": -25.5722713470459, "global_step": 15889, "epoch": 131} {"train_loss": -28.424230575561523, "global_step": 15890, "epoch": 131} {"train_loss": -26.434650421142578, "global_step": 15891, "epoch": 131} {"train_loss": -27.792327880859375, "global_step": 15892, "epoch": 131} {"train_loss": -25.837249755859375, "global_step": 15893, "epoch": 131} {"train_loss": -27.20379066467285, "global_step": 15894, "epoch": 131} {"train_loss": -27.927154541015625, "global_step": 15895, "epoch": 131} {"train_loss": -25.707015991210938, "global_step": 15896, "epoch": 131} {"train_loss": -27.149030685424805, "global_step": 15897, "epoch": 131} {"train_loss": -27.500980377197266, "global_step": 15898, "epoch": 131} {"train_loss": -26.371061325073242, "global_step": 15899, "epoch": 131} {"train_loss": -24.98675537109375, "global_step": 15900, "epoch": 131} {"train_loss": -26.302000045776367, "global_step": 15901, "epoch": 131} {"train_loss": -27.510940551757812, "global_step": 15902, "epoch": 131} {"train_loss": -27.4461612701416, "global_step": 15903, "epoch": 131} {"train_loss": -26.953704833984375, "global_step": 15904, "epoch": 131} {"train_loss": -27.514368057250977, "global_step": 15905, "epoch": 131} {"train_loss": -27.721240997314453, "global_step": 15906, "epoch": 131} {"train_loss": -27.236860275268555, "global_step": 15907, "epoch": 131} {"train_loss": -27.971677780151367, "global_step": 15908, "epoch": 131} {"train_loss": -28.185434341430664, "global_step": 15909, "epoch": 131} {"train_loss": -27.983753204345703, "global_step": 15910, "epoch": 131} {"train_loss": -26.979907989501953, "global_step": 15911, "epoch": 131} {"train_loss": -27.47309684753418, "global_step": 15912, "epoch": 131} {"train_loss": -27.731128692626953, "global_step": 15913, "epoch": 131} {"train_loss": -26.399667739868164, "global_step": 15914, "epoch": 131} {"train_loss": -26.37946128845215, "global_step": 15915, "epoch": 131} {"train_loss": -27.90276527404785, "global_step": 15916, "epoch": 131} {"train_loss": -27.476118087768555, "global_step": 15917, "epoch": 131} {"train_loss": -27.309219360351562, "global_step": 15918, "epoch": 131} {"train_loss": -28.137685775756836, "global_step": 15919, "epoch": 131} {"train_loss": -28.24812126159668, "global_step": 15920, "epoch": 131} {"train_loss": -27.93581199645996, "global_step": 15921, "epoch": 131} {"train_loss": -27.743844985961914, "global_step": 15922, "epoch": 131} {"train_loss": -27.8719539642334, "global_step": 15923, "epoch": 131} {"train_loss": -27.67689323425293, "global_step": 15924, "epoch": 131} {"train_loss": -27.559484481811523, "global_step": 15925, "epoch": 131} {"train_loss": -26.503026962280273, "global_step": 15926, "epoch": 131} {"train_loss": -27.852380752563477, "global_step": 15927, "epoch": 131} {"train_loss": -26.558746337890625, "global_step": 15928, "epoch": 131} {"train_loss": -26.599355697631836, "global_step": 15929, "epoch": 131} {"train_loss": -27.687467575073242, "global_step": 15930, "epoch": 131} {"train_loss": -25.0537052154541, "global_step": 15931, "epoch": 131} {"train_loss": -27.429372787475586, "global_step": 15932, "epoch": 131} {"train_loss": -25.97494888305664, "global_step": 15933, "epoch": 131} {"train_loss": -26.9676570892334, "global_step": 15934, "epoch": 131} {"train_loss": -26.085342407226562, "global_step": 15935, "epoch": 131} {"train_loss": -26.613311767578125, "global_step": 15936, "epoch": 131} {"train_loss": -27.203842163085938, "global_step": 15937, "epoch": 131} {"train_loss": -27.902393341064453, "global_step": 15938, "epoch": 131} {"train_loss": -26.854801177978516, "global_step": 15939, "epoch": 131} {"train_loss": -27.79304313659668, "global_step": 15940, "epoch": 131} {"train_loss": -27.1512451171875, "global_step": 15941, "epoch": 131} {"train_loss": -27.474634170532227, "global_step": 15942, "epoch": 131} {"train_loss": -26.8568115234375, "global_step": 15943, "epoch": 131} {"train_loss": -27.621740341186523, "global_step": 15944, "epoch": 131} {"train_loss": -27.733810424804688, "global_step": 15945, "epoch": 131} {"train_loss": -27.42574119567871, "global_step": 15946, "epoch": 131} {"train_loss": -27.24042320251465, "global_step": 15947, "epoch": 131} {"train_loss": -27.00507164001465, "global_step": 15948, "epoch": 131} {"train_loss": -27.534704208374023, "global_step": 15949, "epoch": 131} {"train_loss": -28.198545455932617, "global_step": 15950, "epoch": 131} {"train_loss": -27.848556518554688, "global_step": 15951, "epoch": 131} {"train_loss": -27.88966941833496, "global_step": 15952, "epoch": 131} {"train_loss": -27.37408447265625, "global_step": 15953, "epoch": 131} {"train_loss": -27.865461349487305, "global_step": 15954, "epoch": 131} {"train_loss": -28.048908233642578, "global_step": 15955, "epoch": 131} {"train_loss": -27.9801025390625, "global_step": 15956, "epoch": 131} {"train_loss": -28.492080688476562, "global_step": 15957, "epoch": 131} {"train_loss": -28.478391647338867, "global_step": 15958, "epoch": 131} {"train_loss": -28.132699966430664, "global_step": 15959, "epoch": 131} {"train_loss": -28.275156021118164, "global_step": 15960, "epoch": 131} {"train_loss": -28.32065773010254, "global_step": 15961, "epoch": 131} {"train_loss": -27.999317169189453, "global_step": 15962, "epoch": 131} {"train_loss": -28.428770065307617, "global_step": 15963, "epoch": 131} {"train_loss": -27.801488876342773, "global_step": 15964, "epoch": 131} {"train_loss": -28.418685913085938, "global_step": 15965, "epoch": 131} {"train_loss": -28.4702205657959, "global_step": 15966, "epoch": 131} {"train_loss": -28.483091354370117, "global_step": 15967, "epoch": 131} {"train_loss": -27.901697158813477, "global_step": 15968, "epoch": 131} {"train_loss": -28.220422744750977, "global_step": 15969, "epoch": 131} {"train_loss": -28.73457145690918, "global_step": 15970, "epoch": 131} {"train_loss": -27.602103446140763, "global_step": 15971, "epoch": 131, "val_loss": 2704273.0} {"train_loss": -27.726093292236328, "global_step": 15972, "epoch": 132} {"train_loss": -28.18220329284668, "global_step": 15973, "epoch": 132} {"train_loss": -28.195093154907227, "global_step": 15974, "epoch": 132} {"train_loss": -27.9623966217041, "global_step": 15975, "epoch": 132} {"train_loss": -28.248809814453125, "global_step": 15976, "epoch": 132} {"train_loss": -27.368072509765625, "global_step": 15977, "epoch": 132} {"train_loss": -27.938323974609375, "global_step": 15978, "epoch": 132} {"train_loss": -27.60934829711914, "global_step": 15979, "epoch": 132} {"train_loss": -27.59674644470215, "global_step": 15980, "epoch": 132} {"train_loss": -28.104755401611328, "global_step": 15981, "epoch": 132} {"train_loss": -28.081872940063477, "global_step": 15982, "epoch": 132} {"train_loss": -28.242429733276367, "global_step": 15983, "epoch": 132} {"train_loss": -27.3946590423584, "global_step": 15984, "epoch": 132} {"train_loss": -27.702438354492188, "global_step": 15985, "epoch": 132} {"train_loss": -25.71856117248535, "global_step": 15986, "epoch": 132} {"train_loss": -22.64255142211914, "global_step": 15987, "epoch": 132} {"train_loss": -22.034029006958008, "global_step": 15988, "epoch": 132} {"train_loss": -25.900739669799805, "global_step": 15989, "epoch": 132} {"train_loss": -28.48235511779785, "global_step": 15990, "epoch": 132} {"train_loss": -26.8028564453125, "global_step": 15991, "epoch": 132} {"train_loss": -28.06036376953125, "global_step": 15992, "epoch": 132} {"train_loss": -27.4449462890625, "global_step": 15993, "epoch": 132} {"train_loss": -27.955129623413086, "global_step": 15994, "epoch": 132} {"train_loss": -27.8150634765625, "global_step": 15995, "epoch": 132} {"train_loss": -27.78370475769043, "global_step": 15996, "epoch": 132} {"train_loss": -27.780487060546875, "global_step": 15997, "epoch": 132} {"train_loss": -28.0921573638916, "global_step": 15998, "epoch": 132} {"train_loss": -28.210479736328125, "global_step": 15999, "epoch": 132} {"train_loss": -28.057889938354492, "global_step": 16000, "epoch": 132} {"train_loss": -28.02920913696289, "global_step": 16001, "epoch": 132} {"train_loss": -28.008941650390625, "global_step": 16002, "epoch": 132} {"train_loss": -28.0413875579834, "global_step": 16003, "epoch": 132} {"train_loss": -27.718412399291992, "global_step": 16004, "epoch": 132} {"train_loss": -28.44229507446289, "global_step": 16005, "epoch": 132} {"train_loss": -28.1104736328125, "global_step": 16006, "epoch": 132} {"train_loss": -28.35638427734375, "global_step": 16007, "epoch": 132} {"train_loss": -28.152074813842773, "global_step": 16008, "epoch": 132} {"train_loss": -28.409088134765625, "global_step": 16009, "epoch": 132} {"train_loss": -28.139036178588867, "global_step": 16010, "epoch": 132} {"train_loss": -27.75594139099121, "global_step": 16011, "epoch": 132} {"train_loss": -28.151016235351562, "global_step": 16012, "epoch": 132} {"train_loss": -28.45772361755371, "global_step": 16013, "epoch": 132} {"train_loss": -28.575918197631836, "global_step": 16014, "epoch": 132} {"train_loss": -28.22108268737793, "global_step": 16015, "epoch": 132} {"train_loss": -28.396570205688477, "global_step": 16016, "epoch": 132} {"train_loss": -28.251205444335938, "global_step": 16017, "epoch": 132} {"train_loss": -27.4749698638916, "global_step": 16018, "epoch": 132} {"train_loss": -27.838476181030273, "global_step": 16019, "epoch": 132} {"train_loss": -27.687103271484375, "global_step": 16020, "epoch": 132} {"train_loss": -28.442670822143555, "global_step": 16021, "epoch": 132} {"train_loss": -28.248493194580078, "global_step": 16022, "epoch": 132} {"train_loss": -28.03030776977539, "global_step": 16023, "epoch": 132} {"train_loss": -28.153650283813477, "global_step": 16024, "epoch": 132} {"train_loss": -28.12652015686035, "global_step": 16025, "epoch": 132} {"train_loss": -27.895666122436523, "global_step": 16026, "epoch": 132} {"train_loss": -27.95475196838379, "global_step": 16027, "epoch": 132} {"train_loss": -28.818622589111328, "global_step": 16028, "epoch": 132} {"train_loss": -27.84417152404785, "global_step": 16029, "epoch": 132} {"train_loss": -28.858747482299805, "global_step": 16030, "epoch": 132} {"train_loss": -28.526229858398438, "global_step": 16031, "epoch": 132} {"train_loss": -28.510095596313477, "global_step": 16032, "epoch": 132} {"train_loss": -28.68235206604004, "global_step": 16033, "epoch": 132} {"train_loss": -27.9447078704834, "global_step": 16034, "epoch": 132} {"train_loss": -28.28472900390625, "global_step": 16035, "epoch": 132} {"train_loss": -28.6225528717041, "global_step": 16036, "epoch": 132} {"train_loss": -28.297189712524414, "global_step": 16037, "epoch": 132} {"train_loss": -27.994922637939453, "global_step": 16038, "epoch": 132} {"train_loss": -28.542739868164062, "global_step": 16039, "epoch": 132} {"train_loss": -27.67453956604004, "global_step": 16040, "epoch": 132} {"train_loss": -27.270986557006836, "global_step": 16041, "epoch": 132} {"train_loss": -27.818429946899414, "global_step": 16042, "epoch": 132} {"train_loss": -27.841175079345703, "global_step": 16043, "epoch": 132} {"train_loss": -26.902063369750977, "global_step": 16044, "epoch": 132} {"train_loss": -28.343769073486328, "global_step": 16045, "epoch": 132} {"train_loss": -26.439599990844727, "global_step": 16046, "epoch": 132} {"train_loss": -26.77571678161621, "global_step": 16047, "epoch": 132} {"train_loss": -28.185348510742188, "global_step": 16048, "epoch": 132} {"train_loss": -26.294483184814453, "global_step": 16049, "epoch": 132} {"train_loss": -28.455968856811523, "global_step": 16050, "epoch": 132} {"train_loss": -27.30417251586914, "global_step": 16051, "epoch": 132} {"train_loss": -27.699005126953125, "global_step": 16052, "epoch": 132} {"train_loss": -26.487476348876953, "global_step": 16053, "epoch": 132} {"train_loss": -25.92291831970215, "global_step": 16054, "epoch": 132} {"train_loss": -26.405200958251953, "global_step": 16055, "epoch": 132} {"train_loss": -26.81306266784668, "global_step": 16056, "epoch": 132} {"train_loss": -26.59326171875, "global_step": 16057, "epoch": 132} {"train_loss": -27.032331466674805, "global_step": 16058, "epoch": 132} {"train_loss": -26.961212158203125, "global_step": 16059, "epoch": 132} {"train_loss": -26.82942008972168, "global_step": 16060, "epoch": 132} {"train_loss": -27.265832901000977, "global_step": 16061, "epoch": 132} {"train_loss": -27.78619956970215, "global_step": 16062, "epoch": 132} {"train_loss": -27.613367080688477, "global_step": 16063, "epoch": 132} {"train_loss": -27.636566162109375, "global_step": 16064, "epoch": 132} {"train_loss": -27.971973419189453, "global_step": 16065, "epoch": 132} {"train_loss": -27.288793563842773, "global_step": 16066, "epoch": 132} {"train_loss": -27.81458854675293, "global_step": 16067, "epoch": 132} {"train_loss": -28.00087547302246, "global_step": 16068, "epoch": 132} {"train_loss": -27.674169540405273, "global_step": 16069, "epoch": 132} {"train_loss": -27.856042861938477, "global_step": 16070, "epoch": 132} {"train_loss": -27.582624435424805, "global_step": 16071, "epoch": 132} {"train_loss": -27.367956161499023, "global_step": 16072, "epoch": 132} {"train_loss": -27.805709838867188, "global_step": 16073, "epoch": 132} {"train_loss": -27.853864669799805, "global_step": 16074, "epoch": 132} {"train_loss": -28.045270919799805, "global_step": 16075, "epoch": 132} {"train_loss": -28.1866512298584, "global_step": 16076, "epoch": 132} {"train_loss": -28.022216796875, "global_step": 16077, "epoch": 132} {"train_loss": -28.23904800415039, "global_step": 16078, "epoch": 132} {"train_loss": -27.983606338500977, "global_step": 16079, "epoch": 132} {"train_loss": -26.6705379486084, "global_step": 16080, "epoch": 132} {"train_loss": -23.818208694458008, "global_step": 16081, "epoch": 132} {"train_loss": -19.53923988342285, "global_step": 16082, "epoch": 132} {"train_loss": -21.765583038330078, "global_step": 16083, "epoch": 132} {"train_loss": -27.352888107299805, "global_step": 16084, "epoch": 132} {"train_loss": -26.03565788269043, "global_step": 16085, "epoch": 132} {"train_loss": -27.35051918029785, "global_step": 16086, "epoch": 132} {"train_loss": -26.486083984375, "global_step": 16087, "epoch": 132} {"train_loss": -27.94927978515625, "global_step": 16088, "epoch": 132} {"train_loss": -26.815052032470703, "global_step": 16089, "epoch": 132} {"train_loss": -27.933563232421875, "global_step": 16090, "epoch": 132} {"train_loss": -27.200830459594727, "global_step": 16091, "epoch": 132} {"train_loss": -27.498912685173604, "global_step": 16092, "epoch": 132, "val_loss": 2470582.25} {"train_loss": -28.044189453125, "global_step": 16093, "epoch": 133} {"train_loss": -27.773767471313477, "global_step": 16094, "epoch": 133} {"train_loss": -27.316104888916016, "global_step": 16095, "epoch": 133} {"train_loss": -27.78623390197754, "global_step": 16096, "epoch": 133} {"train_loss": -27.598529815673828, "global_step": 16097, "epoch": 133} {"train_loss": -27.495849609375, "global_step": 16098, "epoch": 133} {"train_loss": -27.784772872924805, "global_step": 16099, "epoch": 133} {"train_loss": -28.120309829711914, "global_step": 16100, "epoch": 133} {"train_loss": -27.5788516998291, "global_step": 16101, "epoch": 133} {"train_loss": -27.715911865234375, "global_step": 16102, "epoch": 133} {"train_loss": -27.154754638671875, "global_step": 16103, "epoch": 133} {"train_loss": -26.977527618408203, "global_step": 16104, "epoch": 133} {"train_loss": -25.467758178710938, "global_step": 16105, "epoch": 133} {"train_loss": -24.076171875, "global_step": 16106, "epoch": 133} {"train_loss": -24.686683654785156, "global_step": 16107, "epoch": 133} {"train_loss": -25.696319580078125, "global_step": 16108, "epoch": 133} {"train_loss": -27.9106388092041, "global_step": 16109, "epoch": 133} {"train_loss": -26.505584716796875, "global_step": 16110, "epoch": 133} {"train_loss": -26.497098922729492, "global_step": 16111, "epoch": 133} {"train_loss": -27.682809829711914, "global_step": 16112, "epoch": 133} {"train_loss": -27.150821685791016, "global_step": 16113, "epoch": 133} {"train_loss": -27.750349044799805, "global_step": 16114, "epoch": 133} {"train_loss": -27.57317543029785, "global_step": 16115, "epoch": 133} {"train_loss": -27.869739532470703, "global_step": 16116, "epoch": 133} {"train_loss": -28.085620880126953, "global_step": 16117, "epoch": 133} {"train_loss": -28.1153621673584, "global_step": 16118, "epoch": 133} {"train_loss": -27.640857696533203, "global_step": 16119, "epoch": 133} {"train_loss": -27.73769187927246, "global_step": 16120, "epoch": 133} {"train_loss": -28.122594833374023, "global_step": 16121, "epoch": 133} {"train_loss": -28.120468139648438, "global_step": 16122, "epoch": 133} {"train_loss": -28.32529640197754, "global_step": 16123, "epoch": 133} {"train_loss": -27.980438232421875, "global_step": 16124, "epoch": 133} {"train_loss": -28.29927635192871, "global_step": 16125, "epoch": 133} {"train_loss": -27.97962760925293, "global_step": 16126, "epoch": 133} {"train_loss": -28.053220748901367, "global_step": 16127, "epoch": 133} {"train_loss": -28.01740837097168, "global_step": 16128, "epoch": 133} {"train_loss": -28.44817543029785, "global_step": 16129, "epoch": 133} {"train_loss": -27.897974014282227, "global_step": 16130, "epoch": 133} {"train_loss": -28.323617935180664, "global_step": 16131, "epoch": 133} {"train_loss": -28.313573837280273, "global_step": 16132, "epoch": 133} {"train_loss": -28.514936447143555, "global_step": 16133, "epoch": 133} {"train_loss": -28.40299415588379, "global_step": 16134, "epoch": 133} {"train_loss": -28.293598175048828, "global_step": 16135, "epoch": 133} {"train_loss": -28.4998779296875, "global_step": 16136, "epoch": 133} {"train_loss": -28.52191162109375, "global_step": 16137, "epoch": 133} {"train_loss": -28.166040420532227, "global_step": 16138, "epoch": 133} {"train_loss": -28.674945831298828, "global_step": 16139, "epoch": 133} {"train_loss": -28.804914474487305, "global_step": 16140, "epoch": 133} {"train_loss": -28.2514705657959, "global_step": 16141, "epoch": 133} {"train_loss": -28.6611328125, "global_step": 16142, "epoch": 133} {"train_loss": -28.6445369720459, "global_step": 16143, "epoch": 133} {"train_loss": -28.59916114807129, "global_step": 16144, "epoch": 133} {"train_loss": -28.514230728149414, "global_step": 16145, "epoch": 133} {"train_loss": -28.58695411682129, "global_step": 16146, "epoch": 133} {"train_loss": -28.621877670288086, "global_step": 16147, "epoch": 133} {"train_loss": -28.510339736938477, "global_step": 16148, "epoch": 133} {"train_loss": -28.70256996154785, "global_step": 16149, "epoch": 133} {"train_loss": -28.714035034179688, "global_step": 16150, "epoch": 133} {"train_loss": -29.2002010345459, "global_step": 16151, "epoch": 133} {"train_loss": -28.5549373626709, "global_step": 16152, "epoch": 133} {"train_loss": -28.93037223815918, "global_step": 16153, "epoch": 133} {"train_loss": -28.506921768188477, "global_step": 16154, "epoch": 133} {"train_loss": -28.407135009765625, "global_step": 16155, "epoch": 133} {"train_loss": -28.1286563873291, "global_step": 16156, "epoch": 133} {"train_loss": -27.66057777404785, "global_step": 16157, "epoch": 133} {"train_loss": -26.88047218322754, "global_step": 16158, "epoch": 133} {"train_loss": -26.222763061523438, "global_step": 16159, "epoch": 133} {"train_loss": -25.459548950195312, "global_step": 16160, "epoch": 133} {"train_loss": -28.683475494384766, "global_step": 16161, "epoch": 133} {"train_loss": -25.853376388549805, "global_step": 16162, "epoch": 133} {"train_loss": -23.72126579284668, "global_step": 16163, "epoch": 133} {"train_loss": -27.050281524658203, "global_step": 16164, "epoch": 133} {"train_loss": -27.687183380126953, "global_step": 16165, "epoch": 133} {"train_loss": -25.419166564941406, "global_step": 16166, "epoch": 133} {"train_loss": -26.03797721862793, "global_step": 16167, "epoch": 133} {"train_loss": -26.639881134033203, "global_step": 16168, "epoch": 133} {"train_loss": -26.02288246154785, "global_step": 16169, "epoch": 133} {"train_loss": -26.2882022857666, "global_step": 16170, "epoch": 133} {"train_loss": -22.520620346069336, "global_step": 16171, "epoch": 133} {"train_loss": -27.618566513061523, "global_step": 16172, "epoch": 133} {"train_loss": -26.969797134399414, "global_step": 16173, "epoch": 133} {"train_loss": -25.375499725341797, "global_step": 16174, "epoch": 133} {"train_loss": -27.330432891845703, "global_step": 16175, "epoch": 133} {"train_loss": -27.261234283447266, "global_step": 16176, "epoch": 133} {"train_loss": -27.212961196899414, "global_step": 16177, "epoch": 133} {"train_loss": -27.5615177154541, "global_step": 16178, "epoch": 133} {"train_loss": -27.011051177978516, "global_step": 16179, "epoch": 133} {"train_loss": -27.605859756469727, "global_step": 16180, "epoch": 133} {"train_loss": -27.82676124572754, "global_step": 16181, "epoch": 133} {"train_loss": -27.83467674255371, "global_step": 16182, "epoch": 133} {"train_loss": -27.780399322509766, "global_step": 16183, "epoch": 133} {"train_loss": -27.89351463317871, "global_step": 16184, "epoch": 133} {"train_loss": -27.692346572875977, "global_step": 16185, "epoch": 133} {"train_loss": -27.65826988220215, "global_step": 16186, "epoch": 133} {"train_loss": -27.910842895507812, "global_step": 16187, "epoch": 133} {"train_loss": -28.141616821289062, "global_step": 16188, "epoch": 133} {"train_loss": -27.769887924194336, "global_step": 16189, "epoch": 133} {"train_loss": -27.847553253173828, "global_step": 16190, "epoch": 133} {"train_loss": -28.240549087524414, "global_step": 16191, "epoch": 133} {"train_loss": -28.047021865844727, "global_step": 16192, "epoch": 133} {"train_loss": -28.276025772094727, "global_step": 16193, "epoch": 133} {"train_loss": -28.585214614868164, "global_step": 16194, "epoch": 133} {"train_loss": -28.453100204467773, "global_step": 16195, "epoch": 133} {"train_loss": -28.28700065612793, "global_step": 16196, "epoch": 133} {"train_loss": -28.116348266601562, "global_step": 16197, "epoch": 133} {"train_loss": -28.149017333984375, "global_step": 16198, "epoch": 133} {"train_loss": -27.577245712280273, "global_step": 16199, "epoch": 133} {"train_loss": -26.277484893798828, "global_step": 16200, "epoch": 133} {"train_loss": -15.9458589553833, "global_step": 16201, "epoch": 133} {"train_loss": 31.0627498626709, "global_step": 16202, "epoch": 133} {"train_loss": 66.64949035644531, "global_step": 16203, "epoch": 133} {"train_loss": -18.815189361572266, "global_step": 16204, "epoch": 133} {"train_loss": -0.1183754950761795, "global_step": 16205, "epoch": 133} {"train_loss": 1.406226634979248, "global_step": 16206, "epoch": 133} {"train_loss": -17.571950912475586, "global_step": 16207, "epoch": 133} {"train_loss": -24.56819725036621, "global_step": 16208, "epoch": 133} {"train_loss": -20.782121658325195, "global_step": 16209, "epoch": 133} {"train_loss": -17.33577537536621, "global_step": 16210, "epoch": 133} {"train_loss": -16.70358657836914, "global_step": 16211, "epoch": 133} {"train_loss": -17.741077423095703, "global_step": 16212, "epoch": 133} {"train_loss": -25.209436757135983, "global_step": 16213, "epoch": 133, "val_loss": 2901235.75} {"train_loss": -21.180538177490234, "global_step": 16214, "epoch": 134} {"train_loss": -21.953115463256836, "global_step": 16215, "epoch": 134} {"train_loss": -22.65757179260254, "global_step": 16216, "epoch": 134} {"train_loss": -23.451847076416016, "global_step": 16217, "epoch": 134} {"train_loss": -23.351621627807617, "global_step": 16218, "epoch": 134} {"train_loss": -23.563800811767578, "global_step": 16219, "epoch": 134} {"train_loss": -23.350994110107422, "global_step": 16220, "epoch": 134} {"train_loss": -23.47144889831543, "global_step": 16221, "epoch": 134} {"train_loss": -23.080419540405273, "global_step": 16222, "epoch": 134} {"train_loss": -23.622915267944336, "global_step": 16223, "epoch": 134} {"train_loss": -23.772634506225586, "global_step": 16224, "epoch": 134} {"train_loss": -24.227216720581055, "global_step": 16225, "epoch": 134} {"train_loss": -23.883459091186523, "global_step": 16226, "epoch": 134} {"train_loss": -24.479413986206055, "global_step": 16227, "epoch": 134} {"train_loss": -24.143863677978516, "global_step": 16228, "epoch": 134} {"train_loss": -23.985031127929688, "global_step": 16229, "epoch": 134} {"train_loss": -24.30536651611328, "global_step": 16230, "epoch": 134} {"train_loss": -24.537002563476562, "global_step": 16231, "epoch": 134} {"train_loss": -24.486892700195312, "global_step": 16232, "epoch": 134} {"train_loss": -24.212718963623047, "global_step": 16233, "epoch": 134} {"train_loss": -24.651811599731445, "global_step": 16234, "epoch": 134} {"train_loss": -25.031625747680664, "global_step": 16235, "epoch": 134} {"train_loss": -24.81862449645996, "global_step": 16236, "epoch": 134} {"train_loss": -25.1916446685791, "global_step": 16237, "epoch": 134} {"train_loss": -24.987567901611328, "global_step": 16238, "epoch": 134} {"train_loss": -25.332847595214844, "global_step": 16239, "epoch": 134} {"train_loss": -25.62299919128418, "global_step": 16240, "epoch": 134} {"train_loss": -25.531606674194336, "global_step": 16241, "epoch": 134} {"train_loss": -25.562768936157227, "global_step": 16242, "epoch": 134} {"train_loss": -25.919174194335938, "global_step": 16243, "epoch": 134} {"train_loss": -25.7406005859375, "global_step": 16244, "epoch": 134} {"train_loss": -25.900421142578125, "global_step": 16245, "epoch": 134} {"train_loss": -25.95468521118164, "global_step": 16246, "epoch": 134} {"train_loss": -26.124011993408203, "global_step": 16247, "epoch": 134} {"train_loss": -26.347766876220703, "global_step": 16248, "epoch": 134} {"train_loss": -26.27899169921875, "global_step": 16249, "epoch": 134} {"train_loss": -26.420873641967773, "global_step": 16250, "epoch": 134} {"train_loss": -26.062946319580078, "global_step": 16251, "epoch": 134} {"train_loss": -26.45625114440918, "global_step": 16252, "epoch": 134} {"train_loss": -26.43610191345215, "global_step": 16253, "epoch": 134} {"train_loss": -26.414505004882812, "global_step": 16254, "epoch": 134} {"train_loss": -26.383543014526367, "global_step": 16255, "epoch": 134} {"train_loss": -26.29863929748535, "global_step": 16256, "epoch": 134} {"train_loss": -26.628021240234375, "global_step": 16257, "epoch": 134} {"train_loss": -26.6408748626709, "global_step": 16258, "epoch": 134} {"train_loss": -25.48786735534668, "global_step": 16259, "epoch": 134} {"train_loss": -26.506641387939453, "global_step": 16260, "epoch": 134} {"train_loss": -26.784870147705078, "global_step": 16261, "epoch": 134} {"train_loss": -26.289548873901367, "global_step": 16262, "epoch": 134} {"train_loss": -26.678003311157227, "global_step": 16263, "epoch": 134} {"train_loss": -26.475830078125, "global_step": 16264, "epoch": 134} {"train_loss": -26.717565536499023, "global_step": 16265, "epoch": 134} {"train_loss": -26.8098201751709, "global_step": 16266, "epoch": 134} {"train_loss": -26.262182235717773, "global_step": 16267, "epoch": 134} {"train_loss": -26.512094497680664, "global_step": 16268, "epoch": 134} {"train_loss": -26.3763370513916, "global_step": 16269, "epoch": 134} {"train_loss": -26.473840713500977, "global_step": 16270, "epoch": 134} {"train_loss": -26.59360694885254, "global_step": 16271, "epoch": 134} {"train_loss": -26.50113296508789, "global_step": 16272, "epoch": 134} {"train_loss": -26.731393814086914, "global_step": 16273, "epoch": 134} {"train_loss": -26.615976333618164, "global_step": 16274, "epoch": 134} {"train_loss": -26.727035522460938, "global_step": 16275, "epoch": 134} {"train_loss": -26.65213966369629, "global_step": 16276, "epoch": 134} {"train_loss": -26.81402015686035, "global_step": 16277, "epoch": 134} {"train_loss": -26.853927612304688, "global_step": 16278, "epoch": 134} {"train_loss": -26.78016471862793, "global_step": 16279, "epoch": 134} {"train_loss": -26.509870529174805, "global_step": 16280, "epoch": 134} {"train_loss": -26.5352725982666, "global_step": 16281, "epoch": 134} {"train_loss": -26.643308639526367, "global_step": 16282, "epoch": 134} {"train_loss": -26.575653076171875, "global_step": 16283, "epoch": 134} {"train_loss": -26.835590362548828, "global_step": 16284, "epoch": 134} {"train_loss": -27.094924926757812, "global_step": 16285, "epoch": 134} {"train_loss": -25.8617000579834, "global_step": 16286, "epoch": 134} {"train_loss": -26.893604278564453, "global_step": 16287, "epoch": 134} {"train_loss": -26.438074111938477, "global_step": 16288, "epoch": 134} {"train_loss": -26.9359073638916, "global_step": 16289, "epoch": 134} {"train_loss": -26.490808486938477, "global_step": 16290, "epoch": 134} {"train_loss": -26.747562408447266, "global_step": 16291, "epoch": 134} {"train_loss": -26.41840171813965, "global_step": 16292, "epoch": 134} {"train_loss": -27.018661499023438, "global_step": 16293, "epoch": 134} {"train_loss": -26.360403060913086, "global_step": 16294, "epoch": 134} {"train_loss": -26.603515625, "global_step": 16295, "epoch": 134} {"train_loss": -26.496124267578125, "global_step": 16296, "epoch": 134} {"train_loss": -26.554624557495117, "global_step": 16297, "epoch": 134} {"train_loss": -26.801549911499023, "global_step": 16298, "epoch": 134} {"train_loss": -26.291723251342773, "global_step": 16299, "epoch": 134} {"train_loss": -26.637542724609375, "global_step": 16300, "epoch": 134} {"train_loss": -26.20931053161621, "global_step": 16301, "epoch": 134} {"train_loss": -26.314239501953125, "global_step": 16302, "epoch": 134} {"train_loss": -26.599822998046875, "global_step": 16303, "epoch": 134} {"train_loss": -27.032629013061523, "global_step": 16304, "epoch": 134} {"train_loss": -26.323535919189453, "global_step": 16305, "epoch": 134} {"train_loss": -25.05890464782715, "global_step": 16306, "epoch": 134} {"train_loss": -25.10910987854004, "global_step": 16307, "epoch": 134} {"train_loss": -26.480642318725586, "global_step": 16308, "epoch": 134} {"train_loss": -26.5805606842041, "global_step": 16309, "epoch": 134} {"train_loss": -26.08222770690918, "global_step": 16310, "epoch": 134} {"train_loss": -26.739959716796875, "global_step": 16311, "epoch": 134} {"train_loss": -27.230762481689453, "global_step": 16312, "epoch": 134} {"train_loss": -26.498046875, "global_step": 16313, "epoch": 134} {"train_loss": -26.695276260375977, "global_step": 16314, "epoch": 134} {"train_loss": -27.334875106811523, "global_step": 16315, "epoch": 134} {"train_loss": -26.302291870117188, "global_step": 16316, "epoch": 134} {"train_loss": -26.745641708374023, "global_step": 16317, "epoch": 134} {"train_loss": -27.547773361206055, "global_step": 16318, "epoch": 134} {"train_loss": -26.556257247924805, "global_step": 16319, "epoch": 134} {"train_loss": -27.346393585205078, "global_step": 16320, "epoch": 134} {"train_loss": -26.13575553894043, "global_step": 16321, "epoch": 134} {"train_loss": -26.102262496948242, "global_step": 16322, "epoch": 134} {"train_loss": -26.870487213134766, "global_step": 16323, "epoch": 134} {"train_loss": -27.13797950744629, "global_step": 16324, "epoch": 134} {"train_loss": -26.526819229125977, "global_step": 16325, "epoch": 134} {"train_loss": -26.753070831298828, "global_step": 16326, "epoch": 134} {"train_loss": -27.154417037963867, "global_step": 16327, "epoch": 134} {"train_loss": -27.154434204101562, "global_step": 16328, "epoch": 134} {"train_loss": -26.965810775756836, "global_step": 16329, "epoch": 134} {"train_loss": -27.148115158081055, "global_step": 16330, "epoch": 134} {"train_loss": -27.220386505126953, "global_step": 16331, "epoch": 134} {"train_loss": -27.13539695739746, "global_step": 16332, "epoch": 134} {"train_loss": -27.453332901000977, "global_step": 16333, "epoch": 134} {"train_loss": -25.96799651847398, "global_step": 16334, "epoch": 134, "val_loss": 2676364.5} {"train_loss": -26.61675453186035, "global_step": 16335, "epoch": 135} {"train_loss": -27.422657012939453, "global_step": 16336, "epoch": 135} {"train_loss": -26.481155395507812, "global_step": 16337, "epoch": 135} {"train_loss": -26.828174591064453, "global_step": 16338, "epoch": 135} {"train_loss": -27.086694717407227, "global_step": 16339, "epoch": 135} {"train_loss": -27.13528823852539, "global_step": 16340, "epoch": 135} {"train_loss": -26.928632736206055, "global_step": 16341, "epoch": 135} {"train_loss": -26.6367130279541, "global_step": 16342, "epoch": 135} {"train_loss": -27.107358932495117, "global_step": 16343, "epoch": 135} {"train_loss": -27.4608154296875, "global_step": 16344, "epoch": 135} {"train_loss": -27.256591796875, "global_step": 16345, "epoch": 135} {"train_loss": -27.306421279907227, "global_step": 16346, "epoch": 135} {"train_loss": -27.176746368408203, "global_step": 16347, "epoch": 135} {"train_loss": -27.33082389831543, "global_step": 16348, "epoch": 135} {"train_loss": -27.480621337890625, "global_step": 16349, "epoch": 135} {"train_loss": -27.35841178894043, "global_step": 16350, "epoch": 135} {"train_loss": -27.4966983795166, "global_step": 16351, "epoch": 135} {"train_loss": -27.039810180664062, "global_step": 16352, "epoch": 135} {"train_loss": -26.93047523498535, "global_step": 16353, "epoch": 135} {"train_loss": -26.90976905822754, "global_step": 16354, "epoch": 135} {"train_loss": -26.581632614135742, "global_step": 16355, "epoch": 135} {"train_loss": -27.447620391845703, "global_step": 16356, "epoch": 135} {"train_loss": -27.27823257446289, "global_step": 16357, "epoch": 135} {"train_loss": -27.029956817626953, "global_step": 16358, "epoch": 135} {"train_loss": -26.620834350585938, "global_step": 16359, "epoch": 135} {"train_loss": -26.859485626220703, "global_step": 16360, "epoch": 135} {"train_loss": -26.941213607788086, "global_step": 16361, "epoch": 135} {"train_loss": -26.832544326782227, "global_step": 16362, "epoch": 135} {"train_loss": -26.536596298217773, "global_step": 16363, "epoch": 135} {"train_loss": -26.02901268005371, "global_step": 16364, "epoch": 135} {"train_loss": -26.520050048828125, "global_step": 16365, "epoch": 135} {"train_loss": -27.383344650268555, "global_step": 16366, "epoch": 135} {"train_loss": -26.96189308166504, "global_step": 16367, "epoch": 135} {"train_loss": -27.167158126831055, "global_step": 16368, "epoch": 135} {"train_loss": -27.16948890686035, "global_step": 16369, "epoch": 135} {"train_loss": -26.99934959411621, "global_step": 16370, "epoch": 135} {"train_loss": -27.519662857055664, "global_step": 16371, "epoch": 135} {"train_loss": -26.40082359313965, "global_step": 16372, "epoch": 135} {"train_loss": -26.919296264648438, "global_step": 16373, "epoch": 135} {"train_loss": -27.1741943359375, "global_step": 16374, "epoch": 135} {"train_loss": -26.591266632080078, "global_step": 16375, "epoch": 135} {"train_loss": -26.627912521362305, "global_step": 16376, "epoch": 135} {"train_loss": -26.873859405517578, "global_step": 16377, "epoch": 135} {"train_loss": -26.249372482299805, "global_step": 16378, "epoch": 135} {"train_loss": -26.977649688720703, "global_step": 16379, "epoch": 135} {"train_loss": -26.503568649291992, "global_step": 16380, "epoch": 135} {"train_loss": -26.50176429748535, "global_step": 16381, "epoch": 135} {"train_loss": -26.89906883239746, "global_step": 16382, "epoch": 135} {"train_loss": -26.650426864624023, "global_step": 16383, "epoch": 135} {"train_loss": -27.227575302124023, "global_step": 16384, "epoch": 135} {"train_loss": -26.796741485595703, "global_step": 16385, "epoch": 135} {"train_loss": -27.287641525268555, "global_step": 16386, "epoch": 135} {"train_loss": -26.515287399291992, "global_step": 16387, "epoch": 135} {"train_loss": -26.4483585357666, "global_step": 16388, "epoch": 135} {"train_loss": -26.432559967041016, "global_step": 16389, "epoch": 135} {"train_loss": -27.177976608276367, "global_step": 16390, "epoch": 135} {"train_loss": -26.30132484436035, "global_step": 16391, "epoch": 135} {"train_loss": -25.738256454467773, "global_step": 16392, "epoch": 135} {"train_loss": -25.512985229492188, "global_step": 16393, "epoch": 135} {"train_loss": -27.09071922302246, "global_step": 16394, "epoch": 135} {"train_loss": -26.75164222717285, "global_step": 16395, "epoch": 135} {"train_loss": -26.0419979095459, "global_step": 16396, "epoch": 135} {"train_loss": -26.280141830444336, "global_step": 16397, "epoch": 135} {"train_loss": -27.433935165405273, "global_step": 16398, "epoch": 135} {"train_loss": -26.952655792236328, "global_step": 16399, "epoch": 135} {"train_loss": -27.31316566467285, "global_step": 16400, "epoch": 135} {"train_loss": -27.1014461517334, "global_step": 16401, "epoch": 135} {"train_loss": -26.977182388305664, "global_step": 16402, "epoch": 135} {"train_loss": -26.716272354125977, "global_step": 16403, "epoch": 135} {"train_loss": -27.27577018737793, "global_step": 16404, "epoch": 135} {"train_loss": -27.11972999572754, "global_step": 16405, "epoch": 135} {"train_loss": -27.528263092041016, "global_step": 16406, "epoch": 135} {"train_loss": -27.02850341796875, "global_step": 16407, "epoch": 135} {"train_loss": -27.551925659179688, "global_step": 16408, "epoch": 135} {"train_loss": -27.038543701171875, "global_step": 16409, "epoch": 135} {"train_loss": -27.414020538330078, "global_step": 16410, "epoch": 135} {"train_loss": -27.4221248626709, "global_step": 16411, "epoch": 135} {"train_loss": -27.259069442749023, "global_step": 16412, "epoch": 135} {"train_loss": -27.01411247253418, "global_step": 16413, "epoch": 135} {"train_loss": -27.747419357299805, "global_step": 16414, "epoch": 135} {"train_loss": -27.241708755493164, "global_step": 16415, "epoch": 135} {"train_loss": -27.042036056518555, "global_step": 16416, "epoch": 135} {"train_loss": -27.3414363861084, "global_step": 16417, "epoch": 135} {"train_loss": -26.418806076049805, "global_step": 16418, "epoch": 135} {"train_loss": -27.06943702697754, "global_step": 16419, "epoch": 135} {"train_loss": -26.866239547729492, "global_step": 16420, "epoch": 135} {"train_loss": -26.787134170532227, "global_step": 16421, "epoch": 135} {"train_loss": -27.518936157226562, "global_step": 16422, "epoch": 135} {"train_loss": -27.132877349853516, "global_step": 16423, "epoch": 135} {"train_loss": -27.16729736328125, "global_step": 16424, "epoch": 135} {"train_loss": -26.8800048828125, "global_step": 16425, "epoch": 135} {"train_loss": -27.033512115478516, "global_step": 16426, "epoch": 135} {"train_loss": -27.411609649658203, "global_step": 16427, "epoch": 135} {"train_loss": -27.08017921447754, "global_step": 16428, "epoch": 135} {"train_loss": -27.682783126831055, "global_step": 16429, "epoch": 135} {"train_loss": -26.889265060424805, "global_step": 16430, "epoch": 135} {"train_loss": -27.42864418029785, "global_step": 16431, "epoch": 135} {"train_loss": -27.28679847717285, "global_step": 16432, "epoch": 135} {"train_loss": -27.72942543029785, "global_step": 16433, "epoch": 135} {"train_loss": -27.64906120300293, "global_step": 16434, "epoch": 135} {"train_loss": -26.782026290893555, "global_step": 16435, "epoch": 135} {"train_loss": -27.332366943359375, "global_step": 16436, "epoch": 135} {"train_loss": -27.528961181640625, "global_step": 16437, "epoch": 135} {"train_loss": -27.61659049987793, "global_step": 16438, "epoch": 135} {"train_loss": -27.41330909729004, "global_step": 16439, "epoch": 135} {"train_loss": -26.968708038330078, "global_step": 16440, "epoch": 135} {"train_loss": -27.857473373413086, "global_step": 16441, "epoch": 135} {"train_loss": -27.50971031188965, "global_step": 16442, "epoch": 135} {"train_loss": -27.582080841064453, "global_step": 16443, "epoch": 135} {"train_loss": -27.80940055847168, "global_step": 16444, "epoch": 135} {"train_loss": -27.608739852905273, "global_step": 16445, "epoch": 135} {"train_loss": -27.44097900390625, "global_step": 16446, "epoch": 135} {"train_loss": -27.459070205688477, "global_step": 16447, "epoch": 135} {"train_loss": -27.11928367614746, "global_step": 16448, "epoch": 135} {"train_loss": -27.3193359375, "global_step": 16449, "epoch": 135} {"train_loss": -27.345808029174805, "global_step": 16450, "epoch": 135} {"train_loss": -27.720382690429688, "global_step": 16451, "epoch": 135} {"train_loss": -27.764209747314453, "global_step": 16452, "epoch": 135} {"train_loss": -27.42793846130371, "global_step": 16453, "epoch": 135} {"train_loss": -26.193334579467773, "global_step": 16454, "epoch": 135} {"train_loss": -27.02414148504084, "global_step": 16455, "epoch": 135, "val_loss": 2670580.75} {"train_loss": -18.81820297241211, "global_step": 16456, "epoch": 136} {"train_loss": -20.013086318969727, "global_step": 16457, "epoch": 136} {"train_loss": -27.152637481689453, "global_step": 16458, "epoch": 136} {"train_loss": -23.70716667175293, "global_step": 16459, "epoch": 136} {"train_loss": -25.883642196655273, "global_step": 16460, "epoch": 136} {"train_loss": -24.251556396484375, "global_step": 16461, "epoch": 136} {"train_loss": -27.281248092651367, "global_step": 16462, "epoch": 136} {"train_loss": -25.43341636657715, "global_step": 16463, "epoch": 136} {"train_loss": -26.435819625854492, "global_step": 16464, "epoch": 136} {"train_loss": -26.87586784362793, "global_step": 16465, "epoch": 136} {"train_loss": -25.2540283203125, "global_step": 16466, "epoch": 136} {"train_loss": -26.50486183166504, "global_step": 16467, "epoch": 136} {"train_loss": -27.372045516967773, "global_step": 16468, "epoch": 136} {"train_loss": -26.495426177978516, "global_step": 16469, "epoch": 136} {"train_loss": -26.516454696655273, "global_step": 16470, "epoch": 136} {"train_loss": -26.799192428588867, "global_step": 16471, "epoch": 136} {"train_loss": -26.83290672302246, "global_step": 16472, "epoch": 136} {"train_loss": -27.254196166992188, "global_step": 16473, "epoch": 136} {"train_loss": -25.67487907409668, "global_step": 16474, "epoch": 136} {"train_loss": -25.806976318359375, "global_step": 16475, "epoch": 136} {"train_loss": -26.8106746673584, "global_step": 16476, "epoch": 136} {"train_loss": -26.91389274597168, "global_step": 16477, "epoch": 136} {"train_loss": -26.123458862304688, "global_step": 16478, "epoch": 136} {"train_loss": -26.684131622314453, "global_step": 16479, "epoch": 136} {"train_loss": -26.842365264892578, "global_step": 16480, "epoch": 136} {"train_loss": -27.249547958374023, "global_step": 16481, "epoch": 136} {"train_loss": -26.868946075439453, "global_step": 16482, "epoch": 136} {"train_loss": -26.870954513549805, "global_step": 16483, "epoch": 136} {"train_loss": -27.262495040893555, "global_step": 16484, "epoch": 136} {"train_loss": -27.192182540893555, "global_step": 16485, "epoch": 136} {"train_loss": -26.9803409576416, "global_step": 16486, "epoch": 136} {"train_loss": -27.47308349609375, "global_step": 16487, "epoch": 136} {"train_loss": -26.70918083190918, "global_step": 16488, "epoch": 136} {"train_loss": -27.094425201416016, "global_step": 16489, "epoch": 136} {"train_loss": -27.47235107421875, "global_step": 16490, "epoch": 136} {"train_loss": -27.113422393798828, "global_step": 16491, "epoch": 136} {"train_loss": -27.33684730529785, "global_step": 16492, "epoch": 136} {"train_loss": -27.71231460571289, "global_step": 16493, "epoch": 136} {"train_loss": -27.071374893188477, "global_step": 16494, "epoch": 136} {"train_loss": -27.179691314697266, "global_step": 16495, "epoch": 136} {"train_loss": -27.1027774810791, "global_step": 16496, "epoch": 136} {"train_loss": -26.8963623046875, "global_step": 16497, "epoch": 136} {"train_loss": -27.15143394470215, "global_step": 16498, "epoch": 136} {"train_loss": -27.08588981628418, "global_step": 16499, "epoch": 136} {"train_loss": -27.38628578186035, "global_step": 16500, "epoch": 136} {"train_loss": -27.348840713500977, "global_step": 16501, "epoch": 136} {"train_loss": -27.507675170898438, "global_step": 16502, "epoch": 136} {"train_loss": -27.001195907592773, "global_step": 16503, "epoch": 136} {"train_loss": -27.29805564880371, "global_step": 16504, "epoch": 136} {"train_loss": -27.5155029296875, "global_step": 16505, "epoch": 136} {"train_loss": -27.805837631225586, "global_step": 16506, "epoch": 136} {"train_loss": -27.657459259033203, "global_step": 16507, "epoch": 136} {"train_loss": -27.88372802734375, "global_step": 16508, "epoch": 136} {"train_loss": -27.773895263671875, "global_step": 16509, "epoch": 136} {"train_loss": -27.435285568237305, "global_step": 16510, "epoch": 136} {"train_loss": -27.162588119506836, "global_step": 16511, "epoch": 136} {"train_loss": -27.526525497436523, "global_step": 16512, "epoch": 136} {"train_loss": -27.737646102905273, "global_step": 16513, "epoch": 136} {"train_loss": -27.996139526367188, "global_step": 16514, "epoch": 136} {"train_loss": -27.548980712890625, "global_step": 16515, "epoch": 136} {"train_loss": -27.515424728393555, "global_step": 16516, "epoch": 136} {"train_loss": -27.81812858581543, "global_step": 16517, "epoch": 136} {"train_loss": -27.22315788269043, "global_step": 16518, "epoch": 136} {"train_loss": -27.20892906188965, "global_step": 16519, "epoch": 136} {"train_loss": -27.509733200073242, "global_step": 16520, "epoch": 136} {"train_loss": -27.94330406188965, "global_step": 16521, "epoch": 136} {"train_loss": -27.050397872924805, "global_step": 16522, "epoch": 136} {"train_loss": -27.582326889038086, "global_step": 16523, "epoch": 136} {"train_loss": -27.2979679107666, "global_step": 16524, "epoch": 136} {"train_loss": -27.110198974609375, "global_step": 16525, "epoch": 136} {"train_loss": -27.065048217773438, "global_step": 16526, "epoch": 136} {"train_loss": -26.565784454345703, "global_step": 16527, "epoch": 136} {"train_loss": -26.836933135986328, "global_step": 16528, "epoch": 136} {"train_loss": -26.31037712097168, "global_step": 16529, "epoch": 136} {"train_loss": -26.164831161499023, "global_step": 16530, "epoch": 136} {"train_loss": -26.8216495513916, "global_step": 16531, "epoch": 136} {"train_loss": -27.227497100830078, "global_step": 16532, "epoch": 136} {"train_loss": -26.13140869140625, "global_step": 16533, "epoch": 136} {"train_loss": -27.625152587890625, "global_step": 16534, "epoch": 136} {"train_loss": -26.7464656829834, "global_step": 16535, "epoch": 136} {"train_loss": -27.324827194213867, "global_step": 16536, "epoch": 136} {"train_loss": -27.175642013549805, "global_step": 16537, "epoch": 136} {"train_loss": -27.17291831970215, "global_step": 16538, "epoch": 136} {"train_loss": -26.139184951782227, "global_step": 16539, "epoch": 136} {"train_loss": -27.018217086791992, "global_step": 16540, "epoch": 136} {"train_loss": -27.340667724609375, "global_step": 16541, "epoch": 136} {"train_loss": -26.85761070251465, "global_step": 16542, "epoch": 136} {"train_loss": -26.9267578125, "global_step": 16543, "epoch": 136} {"train_loss": -27.532867431640625, "global_step": 16544, "epoch": 136} {"train_loss": -27.19927406311035, "global_step": 16545, "epoch": 136} {"train_loss": -27.2828369140625, "global_step": 16546, "epoch": 136} {"train_loss": -27.574148178100586, "global_step": 16547, "epoch": 136} {"train_loss": -27.27168846130371, "global_step": 16548, "epoch": 136} {"train_loss": -27.704065322875977, "global_step": 16549, "epoch": 136} {"train_loss": -27.316221237182617, "global_step": 16550, "epoch": 136} {"train_loss": -27.5937557220459, "global_step": 16551, "epoch": 136} {"train_loss": -27.74903678894043, "global_step": 16552, "epoch": 136} {"train_loss": -27.420883178710938, "global_step": 16553, "epoch": 136} {"train_loss": -27.90813636779785, "global_step": 16554, "epoch": 136} {"train_loss": -27.71285057067871, "global_step": 16555, "epoch": 136} {"train_loss": -27.447452545166016, "global_step": 16556, "epoch": 136} {"train_loss": -27.74517250061035, "global_step": 16557, "epoch": 136} {"train_loss": -27.71331214904785, "global_step": 16558, "epoch": 136} {"train_loss": -26.774072647094727, "global_step": 16559, "epoch": 136} {"train_loss": -26.34539222717285, "global_step": 16560, "epoch": 136} {"train_loss": -27.17500114440918, "global_step": 16561, "epoch": 136} {"train_loss": -27.8212890625, "global_step": 16562, "epoch": 136} {"train_loss": -26.427459716796875, "global_step": 16563, "epoch": 136} {"train_loss": -27.091556549072266, "global_step": 16564, "epoch": 136} {"train_loss": -27.07643699645996, "global_step": 16565, "epoch": 136} {"train_loss": -27.506155014038086, "global_step": 16566, "epoch": 136} {"train_loss": -26.64142417907715, "global_step": 16567, "epoch": 136} {"train_loss": -27.118793487548828, "global_step": 16568, "epoch": 136} {"train_loss": -26.856409072875977, "global_step": 16569, "epoch": 136} {"train_loss": -26.8980770111084, "global_step": 16570, "epoch": 136} {"train_loss": -27.42813491821289, "global_step": 16571, "epoch": 136} {"train_loss": -27.296539306640625, "global_step": 16572, "epoch": 136} {"train_loss": -27.6312255859375, "global_step": 16573, "epoch": 136} {"train_loss": -27.43922233581543, "global_step": 16574, "epoch": 136} {"train_loss": -27.694656372070312, "global_step": 16575, "epoch": 136} {"train_loss": -26.938653378447224, "global_step": 16576, "epoch": 136, "val_loss": 2679005.25} {"train_loss": -27.366596221923828, "global_step": 16577, "epoch": 137} {"train_loss": -27.631519317626953, "global_step": 16578, "epoch": 137} {"train_loss": -27.895750045776367, "global_step": 16579, "epoch": 137} {"train_loss": -27.625980377197266, "global_step": 16580, "epoch": 137} {"train_loss": -27.49981689453125, "global_step": 16581, "epoch": 137} {"train_loss": -28.01300621032715, "global_step": 16582, "epoch": 137} {"train_loss": -26.631113052368164, "global_step": 16583, "epoch": 137} {"train_loss": -27.274219512939453, "global_step": 16584, "epoch": 137} {"train_loss": -27.009668350219727, "global_step": 16585, "epoch": 137} {"train_loss": -27.079132080078125, "global_step": 16586, "epoch": 137} {"train_loss": -27.015869140625, "global_step": 16587, "epoch": 137} {"train_loss": -27.140623092651367, "global_step": 16588, "epoch": 137} {"train_loss": -27.411060333251953, "global_step": 16589, "epoch": 137} {"train_loss": -28.042097091674805, "global_step": 16590, "epoch": 137} {"train_loss": -27.18680191040039, "global_step": 16591, "epoch": 137} {"train_loss": -27.44561195373535, "global_step": 16592, "epoch": 137} {"train_loss": -27.719257354736328, "global_step": 16593, "epoch": 137} {"train_loss": -27.88868522644043, "global_step": 16594, "epoch": 137} {"train_loss": -28.05771255493164, "global_step": 16595, "epoch": 137} {"train_loss": -28.152124404907227, "global_step": 16596, "epoch": 137} {"train_loss": -27.70149803161621, "global_step": 16597, "epoch": 137} {"train_loss": -28.295873641967773, "global_step": 16598, "epoch": 137} {"train_loss": -27.711206436157227, "global_step": 16599, "epoch": 137} {"train_loss": -27.994922637939453, "global_step": 16600, "epoch": 137} {"train_loss": -27.93096351623535, "global_step": 16601, "epoch": 137} {"train_loss": -27.565820693969727, "global_step": 16602, "epoch": 137} {"train_loss": -27.6809024810791, "global_step": 16603, "epoch": 137} {"train_loss": -28.13984489440918, "global_step": 16604, "epoch": 137} {"train_loss": -28.040771484375, "global_step": 16605, "epoch": 137} {"train_loss": -27.760366439819336, "global_step": 16606, "epoch": 137} {"train_loss": -27.820932388305664, "global_step": 16607, "epoch": 137} {"train_loss": -27.746694564819336, "global_step": 16608, "epoch": 137} {"train_loss": -27.61417579650879, "global_step": 16609, "epoch": 137} {"train_loss": -28.203489303588867, "global_step": 16610, "epoch": 137} {"train_loss": -27.87285804748535, "global_step": 16611, "epoch": 137} {"train_loss": -27.6949405670166, "global_step": 16612, "epoch": 137} {"train_loss": -28.168766021728516, "global_step": 16613, "epoch": 137} {"train_loss": -28.400318145751953, "global_step": 16614, "epoch": 137} {"train_loss": -28.2630558013916, "global_step": 16615, "epoch": 137} {"train_loss": -27.645557403564453, "global_step": 16616, "epoch": 137} {"train_loss": -27.43817138671875, "global_step": 16617, "epoch": 137} {"train_loss": -28.142974853515625, "global_step": 16618, "epoch": 137} {"train_loss": -27.772764205932617, "global_step": 16619, "epoch": 137} {"train_loss": -27.2673282623291, "global_step": 16620, "epoch": 137} {"train_loss": -27.7578125, "global_step": 16621, "epoch": 137} {"train_loss": -28.549341201782227, "global_step": 16622, "epoch": 137} {"train_loss": -27.130918502807617, "global_step": 16623, "epoch": 137} {"train_loss": -26.5888729095459, "global_step": 16624, "epoch": 137} {"train_loss": -27.66470718383789, "global_step": 16625, "epoch": 137} {"train_loss": -27.962549209594727, "global_step": 16626, "epoch": 137} {"train_loss": -27.3902645111084, "global_step": 16627, "epoch": 137} {"train_loss": -27.91273307800293, "global_step": 16628, "epoch": 137} {"train_loss": -27.906482696533203, "global_step": 16629, "epoch": 137} {"train_loss": -27.185546875, "global_step": 16630, "epoch": 137} {"train_loss": -28.12593650817871, "global_step": 16631, "epoch": 137} {"train_loss": -27.72974967956543, "global_step": 16632, "epoch": 137} {"train_loss": -27.7657470703125, "global_step": 16633, "epoch": 137} {"train_loss": -28.15342140197754, "global_step": 16634, "epoch": 137} {"train_loss": -27.20065689086914, "global_step": 16635, "epoch": 137} {"train_loss": -28.310632705688477, "global_step": 16636, "epoch": 137} {"train_loss": -27.783044815063477, "global_step": 16637, "epoch": 137} {"train_loss": -28.4991512298584, "global_step": 16638, "epoch": 137} {"train_loss": -27.8900203704834, "global_step": 16639, "epoch": 137} {"train_loss": -28.14056396484375, "global_step": 16640, "epoch": 137} {"train_loss": -27.70826530456543, "global_step": 16641, "epoch": 137} {"train_loss": -27.9936580657959, "global_step": 16642, "epoch": 137} {"train_loss": -28.160598754882812, "global_step": 16643, "epoch": 137} {"train_loss": -28.09211540222168, "global_step": 16644, "epoch": 137} {"train_loss": -28.449567794799805, "global_step": 16645, "epoch": 137} {"train_loss": -28.06153678894043, "global_step": 16646, "epoch": 137} {"train_loss": -28.315433502197266, "global_step": 16647, "epoch": 137} {"train_loss": -27.898160934448242, "global_step": 16648, "epoch": 137} {"train_loss": -28.024927139282227, "global_step": 16649, "epoch": 137} {"train_loss": -27.871408462524414, "global_step": 16650, "epoch": 137} {"train_loss": -28.3121395111084, "global_step": 16651, "epoch": 137} {"train_loss": -27.239309310913086, "global_step": 16652, "epoch": 137} {"train_loss": -27.303747177124023, "global_step": 16653, "epoch": 137} {"train_loss": -27.15749168395996, "global_step": 16654, "epoch": 137} {"train_loss": -28.144338607788086, "global_step": 16655, "epoch": 137} {"train_loss": -27.940881729125977, "global_step": 16656, "epoch": 137} {"train_loss": -28.243146896362305, "global_step": 16657, "epoch": 137} {"train_loss": -27.093835830688477, "global_step": 16658, "epoch": 137} {"train_loss": -27.783594131469727, "global_step": 16659, "epoch": 137} {"train_loss": -27.278064727783203, "global_step": 16660, "epoch": 137} {"train_loss": -27.692108154296875, "global_step": 16661, "epoch": 137} {"train_loss": -27.961151123046875, "global_step": 16662, "epoch": 137} {"train_loss": -28.355161666870117, "global_step": 16663, "epoch": 137} {"train_loss": -28.11875343322754, "global_step": 16664, "epoch": 137} {"train_loss": -27.63856315612793, "global_step": 16665, "epoch": 137} {"train_loss": -27.761449813842773, "global_step": 16666, "epoch": 137} {"train_loss": -28.173553466796875, "global_step": 16667, "epoch": 137} {"train_loss": -28.269453048706055, "global_step": 16668, "epoch": 137} {"train_loss": -28.316192626953125, "global_step": 16669, "epoch": 137} {"train_loss": -28.224170684814453, "global_step": 16670, "epoch": 137} {"train_loss": -28.102331161499023, "global_step": 16671, "epoch": 137} {"train_loss": -28.421066284179688, "global_step": 16672, "epoch": 137} {"train_loss": -27.573938369750977, "global_step": 16673, "epoch": 137} {"train_loss": -28.193235397338867, "global_step": 16674, "epoch": 137} {"train_loss": -27.74494743347168, "global_step": 16675, "epoch": 137} {"train_loss": -28.154455184936523, "global_step": 16676, "epoch": 137} {"train_loss": -28.12860107421875, "global_step": 16677, "epoch": 137} {"train_loss": -27.448043823242188, "global_step": 16678, "epoch": 137} {"train_loss": -27.491016387939453, "global_step": 16679, "epoch": 137} {"train_loss": -28.3537654876709, "global_step": 16680, "epoch": 137} {"train_loss": -27.14930534362793, "global_step": 16681, "epoch": 137} {"train_loss": -27.97968864440918, "global_step": 16682, "epoch": 137} {"train_loss": -28.004220962524414, "global_step": 16683, "epoch": 137} {"train_loss": -28.26302146911621, "global_step": 16684, "epoch": 137} {"train_loss": -28.08672523498535, "global_step": 16685, "epoch": 137} {"train_loss": -28.618154525756836, "global_step": 16686, "epoch": 137} {"train_loss": -27.401885986328125, "global_step": 16687, "epoch": 137} {"train_loss": -27.94452476501465, "global_step": 16688, "epoch": 137} {"train_loss": -28.465866088867188, "global_step": 16689, "epoch": 137} {"train_loss": -28.29266929626465, "global_step": 16690, "epoch": 137} {"train_loss": -27.957290649414062, "global_step": 16691, "epoch": 137} {"train_loss": -28.224292755126953, "global_step": 16692, "epoch": 137} {"train_loss": -28.1694393157959, "global_step": 16693, "epoch": 137} {"train_loss": -28.144453048706055, "global_step": 16694, "epoch": 137} {"train_loss": -28.028669357299805, "global_step": 16695, "epoch": 137} {"train_loss": -28.306354522705078, "global_step": 16696, "epoch": 137} {"train_loss": -27.83911236849698, "global_step": 16697, "epoch": 137, "val_loss": 2787201.5} {"train_loss": -27.1085205078125, "global_step": 16698, "epoch": 138} {"train_loss": -28.14168357849121, "global_step": 16699, "epoch": 138} {"train_loss": -27.309553146362305, "global_step": 16700, "epoch": 138} {"train_loss": -27.750507354736328, "global_step": 16701, "epoch": 138} {"train_loss": -28.412153244018555, "global_step": 16702, "epoch": 138} {"train_loss": -26.465723037719727, "global_step": 16703, "epoch": 138} {"train_loss": -24.580095291137695, "global_step": 16704, "epoch": 138} {"train_loss": -24.376319885253906, "global_step": 16705, "epoch": 138} {"train_loss": -26.84002685546875, "global_step": 16706, "epoch": 138} {"train_loss": -28.2022705078125, "global_step": 16707, "epoch": 138} {"train_loss": -26.82269287109375, "global_step": 16708, "epoch": 138} {"train_loss": -27.196002960205078, "global_step": 16709, "epoch": 138} {"train_loss": -26.314163208007812, "global_step": 16710, "epoch": 138} {"train_loss": -28.02132225036621, "global_step": 16711, "epoch": 138} {"train_loss": -26.491058349609375, "global_step": 16712, "epoch": 138} {"train_loss": -27.79620933532715, "global_step": 16713, "epoch": 138} {"train_loss": -27.73898696899414, "global_step": 16714, "epoch": 138} {"train_loss": -27.277423858642578, "global_step": 16715, "epoch": 138} {"train_loss": -27.1147403717041, "global_step": 16716, "epoch": 138} {"train_loss": -28.11223793029785, "global_step": 16717, "epoch": 138} {"train_loss": -27.976526260375977, "global_step": 16718, "epoch": 138} {"train_loss": -28.271337509155273, "global_step": 16719, "epoch": 138} {"train_loss": -27.56109046936035, "global_step": 16720, "epoch": 138} {"train_loss": -27.5206241607666, "global_step": 16721, "epoch": 138} {"train_loss": -28.042499542236328, "global_step": 16722, "epoch": 138} {"train_loss": -27.490896224975586, "global_step": 16723, "epoch": 138} {"train_loss": -27.966882705688477, "global_step": 16724, "epoch": 138} {"train_loss": -28.000873565673828, "global_step": 16725, "epoch": 138} {"train_loss": -28.273208618164062, "global_step": 16726, "epoch": 138} {"train_loss": -27.905384063720703, "global_step": 16727, "epoch": 138} {"train_loss": -27.600873947143555, "global_step": 16728, "epoch": 138} {"train_loss": -27.995954513549805, "global_step": 16729, "epoch": 138} {"train_loss": -27.6225528717041, "global_step": 16730, "epoch": 138} {"train_loss": -27.829193115234375, "global_step": 16731, "epoch": 138} {"train_loss": -28.07763671875, "global_step": 16732, "epoch": 138} {"train_loss": -27.899154663085938, "global_step": 16733, "epoch": 138} {"train_loss": -28.059589385986328, "global_step": 16734, "epoch": 138} {"train_loss": -27.763864517211914, "global_step": 16735, "epoch": 138} {"train_loss": -28.167688369750977, "global_step": 16736, "epoch": 138} {"train_loss": -28.225122451782227, "global_step": 16737, "epoch": 138} {"train_loss": -27.1544132232666, "global_step": 16738, "epoch": 138} {"train_loss": -28.64794921875, "global_step": 16739, "epoch": 138} {"train_loss": -26.259811401367188, "global_step": 16740, "epoch": 138} {"train_loss": -28.0369815826416, "global_step": 16741, "epoch": 138} {"train_loss": -27.550573348999023, "global_step": 16742, "epoch": 138} {"train_loss": -28.361852645874023, "global_step": 16743, "epoch": 138} {"train_loss": -28.196279525756836, "global_step": 16744, "epoch": 138} {"train_loss": -28.673175811767578, "global_step": 16745, "epoch": 138} {"train_loss": -28.07844352722168, "global_step": 16746, "epoch": 138} {"train_loss": -28.480268478393555, "global_step": 16747, "epoch": 138} {"train_loss": -28.381561279296875, "global_step": 16748, "epoch": 138} {"train_loss": -28.4348201751709, "global_step": 16749, "epoch": 138} {"train_loss": -28.57090187072754, "global_step": 16750, "epoch": 138} {"train_loss": -28.842853546142578, "global_step": 16751, "epoch": 138} {"train_loss": -28.645009994506836, "global_step": 16752, "epoch": 138} {"train_loss": -28.511823654174805, "global_step": 16753, "epoch": 138} {"train_loss": -28.611953735351562, "global_step": 16754, "epoch": 138} {"train_loss": -28.149738311767578, "global_step": 16755, "epoch": 138} {"train_loss": -28.693090438842773, "global_step": 16756, "epoch": 138} {"train_loss": -28.4000186920166, "global_step": 16757, "epoch": 138} {"train_loss": -28.6589298248291, "global_step": 16758, "epoch": 138} {"train_loss": -29.018918991088867, "global_step": 16759, "epoch": 138} {"train_loss": -28.912412643432617, "global_step": 16760, "epoch": 138} {"train_loss": -28.263715744018555, "global_step": 16761, "epoch": 138} {"train_loss": -28.694555282592773, "global_step": 16762, "epoch": 138} {"train_loss": -28.43926429748535, "global_step": 16763, "epoch": 138} {"train_loss": -28.433414459228516, "global_step": 16764, "epoch": 138} {"train_loss": -28.406179428100586, "global_step": 16765, "epoch": 138} {"train_loss": -28.577550888061523, "global_step": 16766, "epoch": 138} {"train_loss": -28.33806800842285, "global_step": 16767, "epoch": 138} {"train_loss": -28.45086669921875, "global_step": 16768, "epoch": 138} {"train_loss": -28.792510986328125, "global_step": 16769, "epoch": 138} {"train_loss": -28.57073402404785, "global_step": 16770, "epoch": 138} {"train_loss": -28.46917152404785, "global_step": 16771, "epoch": 138} {"train_loss": -28.198583602905273, "global_step": 16772, "epoch": 138} {"train_loss": -28.737457275390625, "global_step": 16773, "epoch": 138} {"train_loss": -28.748876571655273, "global_step": 16774, "epoch": 138} {"train_loss": -28.832677841186523, "global_step": 16775, "epoch": 138} {"train_loss": -28.654626846313477, "global_step": 16776, "epoch": 138} {"train_loss": -28.449060440063477, "global_step": 16777, "epoch": 138} {"train_loss": -28.79853630065918, "global_step": 16778, "epoch": 138} {"train_loss": -28.983585357666016, "global_step": 16779, "epoch": 138} {"train_loss": -28.310667037963867, "global_step": 16780, "epoch": 138} {"train_loss": -28.726428985595703, "global_step": 16781, "epoch": 138} {"train_loss": -28.899667739868164, "global_step": 16782, "epoch": 138} {"train_loss": -28.548934936523438, "global_step": 16783, "epoch": 138} {"train_loss": -29.244983673095703, "global_step": 16784, "epoch": 138} {"train_loss": -28.53777503967285, "global_step": 16785, "epoch": 138} {"train_loss": -29.0538272857666, "global_step": 16786, "epoch": 138} {"train_loss": -29.30316734313965, "global_step": 16787, "epoch": 138} {"train_loss": -28.74989891052246, "global_step": 16788, "epoch": 138} {"train_loss": -28.19862174987793, "global_step": 16789, "epoch": 138} {"train_loss": -27.5257568359375, "global_step": 16790, "epoch": 138} {"train_loss": -22.361608505249023, "global_step": 16791, "epoch": 138} {"train_loss": -12.294367790222168, "global_step": 16792, "epoch": 138} {"train_loss": -10.256571769714355, "global_step": 16793, "epoch": 138} {"train_loss": -12.127565383911133, "global_step": 16794, "epoch": 138} {"train_loss": -11.762150764465332, "global_step": 16795, "epoch": 138} {"train_loss": -14.089886665344238, "global_step": 16796, "epoch": 138} {"train_loss": -12.871962547302246, "global_step": 16797, "epoch": 138} {"train_loss": -15.117212295532227, "global_step": 16798, "epoch": 138} {"train_loss": -14.436042785644531, "global_step": 16799, "epoch": 138} {"train_loss": -13.1947603225708, "global_step": 16800, "epoch": 138} {"train_loss": -14.931170463562012, "global_step": 16801, "epoch": 138} {"train_loss": -15.629236221313477, "global_step": 16802, "epoch": 138} {"train_loss": -15.579012870788574, "global_step": 16803, "epoch": 138} {"train_loss": -17.778573989868164, "global_step": 16804, "epoch": 138} {"train_loss": -18.365550994873047, "global_step": 16805, "epoch": 138} {"train_loss": -16.152935028076172, "global_step": 16806, "epoch": 138} {"train_loss": -18.6507568359375, "global_step": 16807, "epoch": 138} {"train_loss": -18.04722785949707, "global_step": 16808, "epoch": 138} {"train_loss": -18.248111724853516, "global_step": 16809, "epoch": 138} {"train_loss": -19.6563663482666, "global_step": 16810, "epoch": 138} {"train_loss": -18.92769432067871, "global_step": 16811, "epoch": 138} {"train_loss": -19.059301376342773, "global_step": 16812, "epoch": 138} {"train_loss": -19.81270980834961, "global_step": 16813, "epoch": 138} {"train_loss": -21.154356002807617, "global_step": 16814, "epoch": 138} {"train_loss": -20.472394943237305, "global_step": 16815, "epoch": 138} {"train_loss": -21.365604400634766, "global_step": 16816, "epoch": 138} {"train_loss": -21.68779754638672, "global_step": 16817, "epoch": 138} {"train_loss": -25.502386392640673, "global_step": 16818, "epoch": 138, "val_loss": 2597991.0} {"train_loss": -22.195350646972656, "global_step": 16819, "epoch": 139} {"train_loss": -22.4945125579834, "global_step": 16820, "epoch": 139} {"train_loss": -22.358734130859375, "global_step": 16821, "epoch": 139} {"train_loss": -22.686010360717773, "global_step": 16822, "epoch": 139} {"train_loss": -23.465700149536133, "global_step": 16823, "epoch": 139} {"train_loss": -23.330482482910156, "global_step": 16824, "epoch": 139} {"train_loss": -23.936704635620117, "global_step": 16825, "epoch": 139} {"train_loss": -23.69672203063965, "global_step": 16826, "epoch": 139} {"train_loss": -20.366788864135742, "global_step": 16827, "epoch": 139} {"train_loss": -18.016408920288086, "global_step": 16828, "epoch": 139} {"train_loss": -22.028823852539062, "global_step": 16829, "epoch": 139} {"train_loss": -8.8765869140625, "global_step": 16830, "epoch": 139} {"train_loss": -23.78463363647461, "global_step": 16831, "epoch": 139} {"train_loss": -16.367910385131836, "global_step": 16832, "epoch": 139} {"train_loss": -22.437015533447266, "global_step": 16833, "epoch": 139} {"train_loss": -23.63665199279785, "global_step": 16834, "epoch": 139} {"train_loss": -21.64946937561035, "global_step": 16835, "epoch": 139} {"train_loss": -22.46006202697754, "global_step": 16836, "epoch": 139} {"train_loss": -23.019668579101562, "global_step": 16837, "epoch": 139} {"train_loss": -23.25675392150879, "global_step": 16838, "epoch": 139} {"train_loss": -23.778146743774414, "global_step": 16839, "epoch": 139} {"train_loss": -23.643959045410156, "global_step": 16840, "epoch": 139} {"train_loss": -22.4031982421875, "global_step": 16841, "epoch": 139} {"train_loss": -23.186065673828125, "global_step": 16842, "epoch": 139} {"train_loss": -23.487186431884766, "global_step": 16843, "epoch": 139} {"train_loss": -22.308713912963867, "global_step": 16844, "epoch": 139} {"train_loss": -23.637603759765625, "global_step": 16845, "epoch": 139} {"train_loss": -23.59697151184082, "global_step": 16846, "epoch": 139} {"train_loss": -24.30241584777832, "global_step": 16847, "epoch": 139} {"train_loss": -24.225149154663086, "global_step": 16848, "epoch": 139} {"train_loss": -24.379741668701172, "global_step": 16849, "epoch": 139} {"train_loss": -24.24592399597168, "global_step": 16850, "epoch": 139} {"train_loss": -24.563589096069336, "global_step": 16851, "epoch": 139} {"train_loss": -23.77199363708496, "global_step": 16852, "epoch": 139} {"train_loss": -24.788766860961914, "global_step": 16853, "epoch": 139} {"train_loss": -24.45524024963379, "global_step": 16854, "epoch": 139} {"train_loss": -24.236709594726562, "global_step": 16855, "epoch": 139} {"train_loss": -24.04113006591797, "global_step": 16856, "epoch": 139} {"train_loss": -22.161405563354492, "global_step": 16857, "epoch": 139} {"train_loss": -22.87799072265625, "global_step": 16858, "epoch": 139} {"train_loss": -24.401721954345703, "global_step": 16859, "epoch": 139} {"train_loss": -22.677583694458008, "global_step": 16860, "epoch": 139} {"train_loss": -23.849523544311523, "global_step": 16861, "epoch": 139} {"train_loss": -24.13155174255371, "global_step": 16862, "epoch": 139} {"train_loss": -24.62527847290039, "global_step": 16863, "epoch": 139} {"train_loss": -23.826908111572266, "global_step": 16864, "epoch": 139} {"train_loss": -24.62613296508789, "global_step": 16865, "epoch": 139} {"train_loss": -24.397390365600586, "global_step": 16866, "epoch": 139} {"train_loss": -24.30017852783203, "global_step": 16867, "epoch": 139} {"train_loss": -24.281553268432617, "global_step": 16868, "epoch": 139} {"train_loss": -24.533857345581055, "global_step": 16869, "epoch": 139} {"train_loss": -24.79087257385254, "global_step": 16870, "epoch": 139} {"train_loss": -24.719167709350586, "global_step": 16871, "epoch": 139} {"train_loss": -24.802528381347656, "global_step": 16872, "epoch": 139} {"train_loss": -24.232160568237305, "global_step": 16873, "epoch": 139} {"train_loss": -22.14579200744629, "global_step": 16874, "epoch": 139} {"train_loss": -12.932931900024414, "global_step": 16875, "epoch": 139} {"train_loss": -22.593631744384766, "global_step": 16876, "epoch": 139} {"train_loss": -18.793195724487305, "global_step": 16877, "epoch": 139} {"train_loss": -25.361600875854492, "global_step": 16878, "epoch": 139} {"train_loss": -22.463809967041016, "global_step": 16879, "epoch": 139} {"train_loss": -21.531051635742188, "global_step": 16880, "epoch": 139} {"train_loss": -24.594980239868164, "global_step": 16881, "epoch": 139} {"train_loss": -25.251680374145508, "global_step": 16882, "epoch": 139} {"train_loss": -24.01177406311035, "global_step": 16883, "epoch": 139} {"train_loss": -23.817977905273438, "global_step": 16884, "epoch": 139} {"train_loss": -23.021284103393555, "global_step": 16885, "epoch": 139} {"train_loss": -24.199695587158203, "global_step": 16886, "epoch": 139} {"train_loss": -24.803937911987305, "global_step": 16887, "epoch": 139} {"train_loss": -25.070816040039062, "global_step": 16888, "epoch": 139} {"train_loss": -25.369239807128906, "global_step": 16889, "epoch": 139} {"train_loss": -25.311861038208008, "global_step": 16890, "epoch": 139} {"train_loss": -25.115461349487305, "global_step": 16891, "epoch": 139} {"train_loss": -25.1176815032959, "global_step": 16892, "epoch": 139} {"train_loss": -24.934589385986328, "global_step": 16893, "epoch": 139} {"train_loss": -25.375417709350586, "global_step": 16894, "epoch": 139} {"train_loss": -25.36931037902832, "global_step": 16895, "epoch": 139} {"train_loss": -24.919267654418945, "global_step": 16896, "epoch": 139} {"train_loss": -25.423240661621094, "global_step": 16897, "epoch": 139} {"train_loss": -25.59223747253418, "global_step": 16898, "epoch": 139} {"train_loss": -25.49561882019043, "global_step": 16899, "epoch": 139} {"train_loss": -25.369565963745117, "global_step": 16900, "epoch": 139} {"train_loss": -26.25398063659668, "global_step": 16901, "epoch": 139} {"train_loss": -24.938581466674805, "global_step": 16902, "epoch": 139} {"train_loss": -25.464262008666992, "global_step": 16903, "epoch": 139} {"train_loss": -24.929595947265625, "global_step": 16904, "epoch": 139} {"train_loss": -24.116025924682617, "global_step": 16905, "epoch": 139} {"train_loss": -22.48965835571289, "global_step": 16906, "epoch": 139} {"train_loss": -23.838499069213867, "global_step": 16907, "epoch": 139} {"train_loss": -25.326122283935547, "global_step": 16908, "epoch": 139} {"train_loss": -23.8946475982666, "global_step": 16909, "epoch": 139} {"train_loss": -24.925474166870117, "global_step": 16910, "epoch": 139} {"train_loss": -23.914419174194336, "global_step": 16911, "epoch": 139} {"train_loss": -22.255722045898438, "global_step": 16912, "epoch": 139} {"train_loss": -19.72219467163086, "global_step": 16913, "epoch": 139} {"train_loss": -22.46292495727539, "global_step": 16914, "epoch": 139} {"train_loss": -24.487945556640625, "global_step": 16915, "epoch": 139} {"train_loss": -22.47186279296875, "global_step": 16916, "epoch": 139} {"train_loss": -24.580976486206055, "global_step": 16917, "epoch": 139} {"train_loss": -24.259002685546875, "global_step": 16918, "epoch": 139} {"train_loss": -24.293668746948242, "global_step": 16919, "epoch": 139} {"train_loss": -24.835254669189453, "global_step": 16920, "epoch": 139} {"train_loss": -24.425926208496094, "global_step": 16921, "epoch": 139} {"train_loss": -24.714086532592773, "global_step": 16922, "epoch": 139} {"train_loss": -24.38287353515625, "global_step": 16923, "epoch": 139} {"train_loss": -25.03541374206543, "global_step": 16924, "epoch": 139} {"train_loss": -25.024444580078125, "global_step": 16925, "epoch": 139} {"train_loss": -24.8738956451416, "global_step": 16926, "epoch": 139} {"train_loss": -24.744070053100586, "global_step": 16927, "epoch": 139} {"train_loss": -25.23259925842285, "global_step": 16928, "epoch": 139} {"train_loss": -25.234115600585938, "global_step": 16929, "epoch": 139} {"train_loss": -25.750507354736328, "global_step": 16930, "epoch": 139} {"train_loss": -24.99395751953125, "global_step": 16931, "epoch": 139} {"train_loss": -25.1481990814209, "global_step": 16932, "epoch": 139} {"train_loss": -25.14755630493164, "global_step": 16933, "epoch": 139} {"train_loss": -25.018171310424805, "global_step": 16934, "epoch": 139} {"train_loss": -25.802215576171875, "global_step": 16935, "epoch": 139} {"train_loss": -25.8809757232666, "global_step": 16936, "epoch": 139} {"train_loss": -26.007909774780273, "global_step": 16937, "epoch": 139} {"train_loss": -25.480804443359375, "global_step": 16938, "epoch": 139} {"train_loss": -23.726483021885894, "global_step": 16939, "epoch": 139, "val_loss": 2713490.5} {"train_loss": -25.67328453063965, "global_step": 16940, "epoch": 140} {"train_loss": -25.72114372253418, "global_step": 16941, "epoch": 140} {"train_loss": -25.62428092956543, "global_step": 16942, "epoch": 140} {"train_loss": -26.00197410583496, "global_step": 16943, "epoch": 140} {"train_loss": -26.66845703125, "global_step": 16944, "epoch": 140} {"train_loss": -26.3616943359375, "global_step": 16945, "epoch": 140} {"train_loss": -25.90032386779785, "global_step": 16946, "epoch": 140} {"train_loss": -26.0145320892334, "global_step": 16947, "epoch": 140} {"train_loss": -26.306476593017578, "global_step": 16948, "epoch": 140} {"train_loss": -26.16193962097168, "global_step": 16949, "epoch": 140} {"train_loss": -26.353803634643555, "global_step": 16950, "epoch": 140} {"train_loss": -26.64630126953125, "global_step": 16951, "epoch": 140} {"train_loss": -25.806859970092773, "global_step": 16952, "epoch": 140} {"train_loss": -26.56793212890625, "global_step": 16953, "epoch": 140} {"train_loss": -26.882001876831055, "global_step": 16954, "epoch": 140} {"train_loss": -26.69057273864746, "global_step": 16955, "epoch": 140} {"train_loss": -26.734521865844727, "global_step": 16956, "epoch": 140} {"train_loss": -26.89943504333496, "global_step": 16957, "epoch": 140} {"train_loss": -27.09095573425293, "global_step": 16958, "epoch": 140} {"train_loss": -26.87129020690918, "global_step": 16959, "epoch": 140} {"train_loss": -27.1656551361084, "global_step": 16960, "epoch": 140} {"train_loss": -27.355777740478516, "global_step": 16961, "epoch": 140} {"train_loss": -27.178518295288086, "global_step": 16962, "epoch": 140} {"train_loss": -27.226736068725586, "global_step": 16963, "epoch": 140} {"train_loss": -27.560867309570312, "global_step": 16964, "epoch": 140} {"train_loss": -27.683277130126953, "global_step": 16965, "epoch": 140} {"train_loss": -27.478925704956055, "global_step": 16966, "epoch": 140} {"train_loss": -27.715087890625, "global_step": 16967, "epoch": 140} {"train_loss": -27.627410888671875, "global_step": 16968, "epoch": 140} {"train_loss": -28.050128936767578, "global_step": 16969, "epoch": 140} {"train_loss": -27.090932846069336, "global_step": 16970, "epoch": 140} {"train_loss": -27.63557243347168, "global_step": 16971, "epoch": 140} {"train_loss": -27.15180015563965, "global_step": 16972, "epoch": 140} {"train_loss": -27.164159774780273, "global_step": 16973, "epoch": 140} {"train_loss": -27.424589157104492, "global_step": 16974, "epoch": 140} {"train_loss": -26.849252700805664, "global_step": 16975, "epoch": 140} {"train_loss": -27.543649673461914, "global_step": 16976, "epoch": 140} {"train_loss": -27.373340606689453, "global_step": 16977, "epoch": 140} {"train_loss": -27.12859535217285, "global_step": 16978, "epoch": 140} {"train_loss": -27.470916748046875, "global_step": 16979, "epoch": 140} {"train_loss": -27.05594825744629, "global_step": 16980, "epoch": 140} {"train_loss": -26.779077529907227, "global_step": 16981, "epoch": 140} {"train_loss": -26.91957664489746, "global_step": 16982, "epoch": 140} {"train_loss": -27.4143123626709, "global_step": 16983, "epoch": 140} {"train_loss": -27.156391143798828, "global_step": 16984, "epoch": 140} {"train_loss": -26.313232421875, "global_step": 16985, "epoch": 140} {"train_loss": -25.370412826538086, "global_step": 16986, "epoch": 140} {"train_loss": -22.553272247314453, "global_step": 16987, "epoch": 140} {"train_loss": -24.123947143554688, "global_step": 16988, "epoch": 140} {"train_loss": -27.394269943237305, "global_step": 16989, "epoch": 140} {"train_loss": -25.70588493347168, "global_step": 16990, "epoch": 140} {"train_loss": -27.158613204956055, "global_step": 16991, "epoch": 140} {"train_loss": -26.302356719970703, "global_step": 16992, "epoch": 140} {"train_loss": -28.023717880249023, "global_step": 16993, "epoch": 140} {"train_loss": -26.533960342407227, "global_step": 16994, "epoch": 140} {"train_loss": -26.789932250976562, "global_step": 16995, "epoch": 140} {"train_loss": -27.589460372924805, "global_step": 16996, "epoch": 140} {"train_loss": -26.637109756469727, "global_step": 16997, "epoch": 140} {"train_loss": -27.182376861572266, "global_step": 16998, "epoch": 140} {"train_loss": -27.652973175048828, "global_step": 16999, "epoch": 140} {"train_loss": -27.36432456970215, "global_step": 17000, "epoch": 140} {"train_loss": -27.553503036499023, "global_step": 17001, "epoch": 140} {"train_loss": -27.28521728515625, "global_step": 17002, "epoch": 140} {"train_loss": -27.784666061401367, "global_step": 17003, "epoch": 140} {"train_loss": -27.108327865600586, "global_step": 17004, "epoch": 140} {"train_loss": -27.894983291625977, "global_step": 17005, "epoch": 140} {"train_loss": -27.1085147857666, "global_step": 17006, "epoch": 140} {"train_loss": -27.817646026611328, "global_step": 17007, "epoch": 140} {"train_loss": -27.337814331054688, "global_step": 17008, "epoch": 140} {"train_loss": -26.967472076416016, "global_step": 17009, "epoch": 140} {"train_loss": -26.40756607055664, "global_step": 17010, "epoch": 140} {"train_loss": -25.79254722595215, "global_step": 17011, "epoch": 140} {"train_loss": -26.18561363220215, "global_step": 17012, "epoch": 140} {"train_loss": -27.057931900024414, "global_step": 17013, "epoch": 140} {"train_loss": -27.690479278564453, "global_step": 17014, "epoch": 140} {"train_loss": -27.42236328125, "global_step": 17015, "epoch": 140} {"train_loss": -26.437850952148438, "global_step": 17016, "epoch": 140} {"train_loss": -25.0430908203125, "global_step": 17017, "epoch": 140} {"train_loss": -22.992368698120117, "global_step": 17018, "epoch": 140} {"train_loss": -22.2895565032959, "global_step": 17019, "epoch": 140} {"train_loss": -27.680816650390625, "global_step": 17020, "epoch": 140} {"train_loss": -25.64400291442871, "global_step": 17021, "epoch": 140} {"train_loss": -26.80169105529785, "global_step": 17022, "epoch": 140} {"train_loss": -26.017393112182617, "global_step": 17023, "epoch": 140} {"train_loss": -27.292505264282227, "global_step": 17024, "epoch": 140} {"train_loss": -26.14752769470215, "global_step": 17025, "epoch": 140} {"train_loss": -27.178991317749023, "global_step": 17026, "epoch": 140} {"train_loss": -27.08271598815918, "global_step": 17027, "epoch": 140} {"train_loss": -26.370798110961914, "global_step": 17028, "epoch": 140} {"train_loss": -27.499988555908203, "global_step": 17029, "epoch": 140} {"train_loss": -26.677648544311523, "global_step": 17030, "epoch": 140} {"train_loss": -26.57465934753418, "global_step": 17031, "epoch": 140} {"train_loss": -26.881399154663086, "global_step": 17032, "epoch": 140} {"train_loss": -26.860258102416992, "global_step": 17033, "epoch": 140} {"train_loss": -26.7893123626709, "global_step": 17034, "epoch": 140} {"train_loss": -27.138864517211914, "global_step": 17035, "epoch": 140} {"train_loss": -27.465940475463867, "global_step": 17036, "epoch": 140} {"train_loss": -27.076969146728516, "global_step": 17037, "epoch": 140} {"train_loss": -27.4013614654541, "global_step": 17038, "epoch": 140} {"train_loss": -27.28553581237793, "global_step": 17039, "epoch": 140} {"train_loss": -27.11447525024414, "global_step": 17040, "epoch": 140} {"train_loss": -27.670013427734375, "global_step": 17041, "epoch": 140} {"train_loss": -26.596118927001953, "global_step": 17042, "epoch": 140} {"train_loss": -26.81377601623535, "global_step": 17043, "epoch": 140} {"train_loss": -27.223041534423828, "global_step": 17044, "epoch": 140} {"train_loss": -25.38477897644043, "global_step": 17045, "epoch": 140} {"train_loss": -26.857715606689453, "global_step": 17046, "epoch": 140} {"train_loss": -26.806615829467773, "global_step": 17047, "epoch": 140} {"train_loss": -27.068439483642578, "global_step": 17048, "epoch": 140} {"train_loss": -27.379358291625977, "global_step": 17049, "epoch": 140} {"train_loss": -27.1590518951416, "global_step": 17050, "epoch": 140} {"train_loss": -26.720380783081055, "global_step": 17051, "epoch": 140} {"train_loss": -25.616262435913086, "global_step": 17052, "epoch": 140} {"train_loss": -21.93021583557129, "global_step": 17053, "epoch": 140} {"train_loss": -15.471722602844238, "global_step": 17054, "epoch": 140} {"train_loss": -24.26883888244629, "global_step": 17055, "epoch": 140} {"train_loss": -24.403263092041016, "global_step": 17056, "epoch": 140} {"train_loss": -25.575218200683594, "global_step": 17057, "epoch": 140} {"train_loss": -24.418596267700195, "global_step": 17058, "epoch": 140} {"train_loss": -27.278854370117188, "global_step": 17059, "epoch": 140} {"train_loss": -26.550129196860574, "global_step": 17060, "epoch": 140, "val_loss": 2738603.75} {"train_loss": -25.437244415283203, "global_step": 17061, "epoch": 141} {"train_loss": -27.01087760925293, "global_step": 17062, "epoch": 141} {"train_loss": -26.76150894165039, "global_step": 17063, "epoch": 141} {"train_loss": -26.480356216430664, "global_step": 17064, "epoch": 141} {"train_loss": -26.53059196472168, "global_step": 17065, "epoch": 141} {"train_loss": -26.4984130859375, "global_step": 17066, "epoch": 141} {"train_loss": -27.27638053894043, "global_step": 17067, "epoch": 141} {"train_loss": -27.330488204956055, "global_step": 17068, "epoch": 141} {"train_loss": -26.805500030517578, "global_step": 17069, "epoch": 141} {"train_loss": -26.567102432250977, "global_step": 17070, "epoch": 141} {"train_loss": -26.195087432861328, "global_step": 17071, "epoch": 141} {"train_loss": -25.67099380493164, "global_step": 17072, "epoch": 141} {"train_loss": -24.969696044921875, "global_step": 17073, "epoch": 141} {"train_loss": -26.03497314453125, "global_step": 17074, "epoch": 141} {"train_loss": -27.122406005859375, "global_step": 17075, "epoch": 141} {"train_loss": -26.5980167388916, "global_step": 17076, "epoch": 141} {"train_loss": -26.560880661010742, "global_step": 17077, "epoch": 141} {"train_loss": -27.22199821472168, "global_step": 17078, "epoch": 141} {"train_loss": -27.171463012695312, "global_step": 17079, "epoch": 141} {"train_loss": -27.683456420898438, "global_step": 17080, "epoch": 141} {"train_loss": -27.521215438842773, "global_step": 17081, "epoch": 141} {"train_loss": -27.124486923217773, "global_step": 17082, "epoch": 141} {"train_loss": -27.662710189819336, "global_step": 17083, "epoch": 141} {"train_loss": -26.686676025390625, "global_step": 17084, "epoch": 141} {"train_loss": -27.157211303710938, "global_step": 17085, "epoch": 141} {"train_loss": -27.76834487915039, "global_step": 17086, "epoch": 141} {"train_loss": -27.41377067565918, "global_step": 17087, "epoch": 141} {"train_loss": -27.377195358276367, "global_step": 17088, "epoch": 141} {"train_loss": -27.83917236328125, "global_step": 17089, "epoch": 141} {"train_loss": -27.60162925720215, "global_step": 17090, "epoch": 141} {"train_loss": -27.5981502532959, "global_step": 17091, "epoch": 141} {"train_loss": -27.6336612701416, "global_step": 17092, "epoch": 141} {"train_loss": -27.608688354492188, "global_step": 17093, "epoch": 141} {"train_loss": -27.471899032592773, "global_step": 17094, "epoch": 141} {"train_loss": -27.22052574157715, "global_step": 17095, "epoch": 141} {"train_loss": -27.746702194213867, "global_step": 17096, "epoch": 141} {"train_loss": -27.2546329498291, "global_step": 17097, "epoch": 141} {"train_loss": -27.56536865234375, "global_step": 17098, "epoch": 141} {"train_loss": -26.813520431518555, "global_step": 17099, "epoch": 141} {"train_loss": -27.441137313842773, "global_step": 17100, "epoch": 141} {"train_loss": -27.505701065063477, "global_step": 17101, "epoch": 141} {"train_loss": -27.69952392578125, "global_step": 17102, "epoch": 141} {"train_loss": -28.106632232666016, "global_step": 17103, "epoch": 141} {"train_loss": -27.923904418945312, "global_step": 17104, "epoch": 141} {"train_loss": -28.177534103393555, "global_step": 17105, "epoch": 141} {"train_loss": -27.777353286743164, "global_step": 17106, "epoch": 141} {"train_loss": -27.910507202148438, "global_step": 17107, "epoch": 141} {"train_loss": -27.275686264038086, "global_step": 17108, "epoch": 141} {"train_loss": -27.49225425720215, "global_step": 17109, "epoch": 141} {"train_loss": -27.635618209838867, "global_step": 17110, "epoch": 141} {"train_loss": -26.8445987701416, "global_step": 17111, "epoch": 141} {"train_loss": -25.814929962158203, "global_step": 17112, "epoch": 141} {"train_loss": -20.457748413085938, "global_step": 17113, "epoch": 141} {"train_loss": -16.62355613708496, "global_step": 17114, "epoch": 141} {"train_loss": -26.413572311401367, "global_step": 17115, "epoch": 141} {"train_loss": -23.14609718322754, "global_step": 17116, "epoch": 141} {"train_loss": -26.19549560546875, "global_step": 17117, "epoch": 141} {"train_loss": -22.84869956970215, "global_step": 17118, "epoch": 141} {"train_loss": -25.20693016052246, "global_step": 17119, "epoch": 141} {"train_loss": -24.096418380737305, "global_step": 17120, "epoch": 141} {"train_loss": -21.25581169128418, "global_step": 17121, "epoch": 141} {"train_loss": -23.378427505493164, "global_step": 17122, "epoch": 141} {"train_loss": -26.2996826171875, "global_step": 17123, "epoch": 141} {"train_loss": -25.722782135009766, "global_step": 17124, "epoch": 141} {"train_loss": -25.206647872924805, "global_step": 17125, "epoch": 141} {"train_loss": -25.256153106689453, "global_step": 17126, "epoch": 141} {"train_loss": -25.870397567749023, "global_step": 17127, "epoch": 141} {"train_loss": -25.53987693786621, "global_step": 17128, "epoch": 141} {"train_loss": -26.463438034057617, "global_step": 17129, "epoch": 141} {"train_loss": -25.427921295166016, "global_step": 17130, "epoch": 141} {"train_loss": -26.255859375, "global_step": 17131, "epoch": 141} {"train_loss": -25.986188888549805, "global_step": 17132, "epoch": 141} {"train_loss": -25.696664810180664, "global_step": 17133, "epoch": 141} {"train_loss": -26.443683624267578, "global_step": 17134, "epoch": 141} {"train_loss": -26.32398796081543, "global_step": 17135, "epoch": 141} {"train_loss": -26.5377197265625, "global_step": 17136, "epoch": 141} {"train_loss": -26.42365074157715, "global_step": 17137, "epoch": 141} {"train_loss": -26.84295654296875, "global_step": 17138, "epoch": 141} {"train_loss": -26.109067916870117, "global_step": 17139, "epoch": 141} {"train_loss": -26.138458251953125, "global_step": 17140, "epoch": 141} {"train_loss": -26.42144203186035, "global_step": 17141, "epoch": 141} {"train_loss": -26.793472290039062, "global_step": 17142, "epoch": 141} {"train_loss": -26.028669357299805, "global_step": 17143, "epoch": 141} {"train_loss": -26.393680572509766, "global_step": 17144, "epoch": 141} {"train_loss": -26.77622413635254, "global_step": 17145, "epoch": 141} {"train_loss": -26.244613647460938, "global_step": 17146, "epoch": 141} {"train_loss": -26.945104598999023, "global_step": 17147, "epoch": 141} {"train_loss": -26.71491813659668, "global_step": 17148, "epoch": 141} {"train_loss": -27.08469581604004, "global_step": 17149, "epoch": 141} {"train_loss": -26.656614303588867, "global_step": 17150, "epoch": 141} {"train_loss": -26.827356338500977, "global_step": 17151, "epoch": 141} {"train_loss": -27.15110206604004, "global_step": 17152, "epoch": 141} {"train_loss": -26.7878475189209, "global_step": 17153, "epoch": 141} {"train_loss": -27.524036407470703, "global_step": 17154, "epoch": 141} {"train_loss": -27.280017852783203, "global_step": 17155, "epoch": 141} {"train_loss": -26.96784782409668, "global_step": 17156, "epoch": 141} {"train_loss": -27.090551376342773, "global_step": 17157, "epoch": 141} {"train_loss": -27.212860107421875, "global_step": 17158, "epoch": 141} {"train_loss": -27.364133834838867, "global_step": 17159, "epoch": 141} {"train_loss": -27.403715133666992, "global_step": 17160, "epoch": 141} {"train_loss": -27.22482681274414, "global_step": 17161, "epoch": 141} {"train_loss": -27.553604125976562, "global_step": 17162, "epoch": 141} {"train_loss": -27.473730087280273, "global_step": 17163, "epoch": 141} {"train_loss": -27.24225425720215, "global_step": 17164, "epoch": 141} {"train_loss": -27.526453018188477, "global_step": 17165, "epoch": 141} {"train_loss": -27.640958786010742, "global_step": 17166, "epoch": 141} {"train_loss": -27.304859161376953, "global_step": 17167, "epoch": 141} {"train_loss": -27.499988555908203, "global_step": 17168, "epoch": 141} {"train_loss": -27.64438247680664, "global_step": 17169, "epoch": 141} {"train_loss": -27.69495964050293, "global_step": 17170, "epoch": 141} {"train_loss": -26.92431640625, "global_step": 17171, "epoch": 141} {"train_loss": -27.871509552001953, "global_step": 17172, "epoch": 141} {"train_loss": -27.314111709594727, "global_step": 17173, "epoch": 141} {"train_loss": -27.821741104125977, "global_step": 17174, "epoch": 141} {"train_loss": -27.581716537475586, "global_step": 17175, "epoch": 141} {"train_loss": -27.568130493164062, "global_step": 17176, "epoch": 141} {"train_loss": -27.682031631469727, "global_step": 17177, "epoch": 141} {"train_loss": -27.522119522094727, "global_step": 17178, "epoch": 141} {"train_loss": -27.46332359313965, "global_step": 17179, "epoch": 141} {"train_loss": -27.470483779907227, "global_step": 17180, "epoch": 141} {"train_loss": -26.6494649146214, "global_step": 17181, "epoch": 141, "val_loss": 2675512.0} {"train_loss": -28.07572364807129, "global_step": 17182, "epoch": 142} {"train_loss": -27.766443252563477, "global_step": 17183, "epoch": 142} {"train_loss": -28.05544090270996, "global_step": 17184, "epoch": 142} {"train_loss": -27.895124435424805, "global_step": 17185, "epoch": 142} {"train_loss": -27.98377799987793, "global_step": 17186, "epoch": 142} {"train_loss": -27.668487548828125, "global_step": 17187, "epoch": 142} {"train_loss": -26.569738388061523, "global_step": 17188, "epoch": 142} {"train_loss": -25.414352416992188, "global_step": 17189, "epoch": 142} {"train_loss": -23.651784896850586, "global_step": 17190, "epoch": 142} {"train_loss": -25.62643814086914, "global_step": 17191, "epoch": 142} {"train_loss": -26.354782104492188, "global_step": 17192, "epoch": 142} {"train_loss": -24.142568588256836, "global_step": 17193, "epoch": 142} {"train_loss": -25.898603439331055, "global_step": 17194, "epoch": 142} {"train_loss": -27.106632232666016, "global_step": 17195, "epoch": 142} {"train_loss": -25.256488800048828, "global_step": 17196, "epoch": 142} {"train_loss": -25.412755966186523, "global_step": 17197, "epoch": 142} {"train_loss": -26.830413818359375, "global_step": 17198, "epoch": 142} {"train_loss": -26.303266525268555, "global_step": 17199, "epoch": 142} {"train_loss": -26.509668350219727, "global_step": 17200, "epoch": 142} {"train_loss": -25.782669067382812, "global_step": 17201, "epoch": 142} {"train_loss": -26.140310287475586, "global_step": 17202, "epoch": 142} {"train_loss": -26.635534286499023, "global_step": 17203, "epoch": 142} {"train_loss": -26.707733154296875, "global_step": 17204, "epoch": 142} {"train_loss": -26.47210693359375, "global_step": 17205, "epoch": 142} {"train_loss": -27.290973663330078, "global_step": 17206, "epoch": 142} {"train_loss": -27.0709171295166, "global_step": 17207, "epoch": 142} {"train_loss": -26.69091796875, "global_step": 17208, "epoch": 142} {"train_loss": -27.480884552001953, "global_step": 17209, "epoch": 142} {"train_loss": -26.79237174987793, "global_step": 17210, "epoch": 142} {"train_loss": -27.759618759155273, "global_step": 17211, "epoch": 142} {"train_loss": -27.473602294921875, "global_step": 17212, "epoch": 142} {"train_loss": -27.767658233642578, "global_step": 17213, "epoch": 142} {"train_loss": -27.918411254882812, "global_step": 17214, "epoch": 142} {"train_loss": -27.890167236328125, "global_step": 17215, "epoch": 142} {"train_loss": -28.21221923828125, "global_step": 17216, "epoch": 142} {"train_loss": -27.928007125854492, "global_step": 17217, "epoch": 142} {"train_loss": -27.61536979675293, "global_step": 17218, "epoch": 142} {"train_loss": -27.560474395751953, "global_step": 17219, "epoch": 142} {"train_loss": -27.59280776977539, "global_step": 17220, "epoch": 142} {"train_loss": -27.846588134765625, "global_step": 17221, "epoch": 142} {"train_loss": -28.1314697265625, "global_step": 17222, "epoch": 142} {"train_loss": -27.933691024780273, "global_step": 17223, "epoch": 142} {"train_loss": -28.13742446899414, "global_step": 17224, "epoch": 142} {"train_loss": -28.048410415649414, "global_step": 17225, "epoch": 142} {"train_loss": -28.03059196472168, "global_step": 17226, "epoch": 142} {"train_loss": -27.9706974029541, "global_step": 17227, "epoch": 142} {"train_loss": -28.017669677734375, "global_step": 17228, "epoch": 142} {"train_loss": -28.376026153564453, "global_step": 17229, "epoch": 142} {"train_loss": -27.828510284423828, "global_step": 17230, "epoch": 142} {"train_loss": -28.312650680541992, "global_step": 17231, "epoch": 142} {"train_loss": -28.34535026550293, "global_step": 17232, "epoch": 142} {"train_loss": -28.3363094329834, "global_step": 17233, "epoch": 142} {"train_loss": -28.53461265563965, "global_step": 17234, "epoch": 142} {"train_loss": -28.57355308532715, "global_step": 17235, "epoch": 142} {"train_loss": -27.981855392456055, "global_step": 17236, "epoch": 142} {"train_loss": -28.160877227783203, "global_step": 17237, "epoch": 142} {"train_loss": -28.043806076049805, "global_step": 17238, "epoch": 142} {"train_loss": -28.47010612487793, "global_step": 17239, "epoch": 142} {"train_loss": -28.030261993408203, "global_step": 17240, "epoch": 142} {"train_loss": -28.343168258666992, "global_step": 17241, "epoch": 142} {"train_loss": -28.154300689697266, "global_step": 17242, "epoch": 142} {"train_loss": -28.278919219970703, "global_step": 17243, "epoch": 142} {"train_loss": -28.681982040405273, "global_step": 17244, "epoch": 142} {"train_loss": -28.314809799194336, "global_step": 17245, "epoch": 142} {"train_loss": -28.54164695739746, "global_step": 17246, "epoch": 142} {"train_loss": -28.380762100219727, "global_step": 17247, "epoch": 142} {"train_loss": -28.40618896484375, "global_step": 17248, "epoch": 142} {"train_loss": -28.501800537109375, "global_step": 17249, "epoch": 142} {"train_loss": -28.396686553955078, "global_step": 17250, "epoch": 142} {"train_loss": -28.71821403503418, "global_step": 17251, "epoch": 142} {"train_loss": -28.553808212280273, "global_step": 17252, "epoch": 142} {"train_loss": -28.312780380249023, "global_step": 17253, "epoch": 142} {"train_loss": -28.613248825073242, "global_step": 17254, "epoch": 142} {"train_loss": -28.28541374206543, "global_step": 17255, "epoch": 142} {"train_loss": -28.751916885375977, "global_step": 17256, "epoch": 142} {"train_loss": -28.3812255859375, "global_step": 17257, "epoch": 142} {"train_loss": -29.01513671875, "global_step": 17258, "epoch": 142} {"train_loss": -28.560699462890625, "global_step": 17259, "epoch": 142} {"train_loss": -28.308399200439453, "global_step": 17260, "epoch": 142} {"train_loss": -28.167987823486328, "global_step": 17261, "epoch": 142} {"train_loss": -27.706769943237305, "global_step": 17262, "epoch": 142} {"train_loss": -24.848318099975586, "global_step": 17263, "epoch": 142} {"train_loss": -17.200912475585938, "global_step": 17264, "epoch": 142} {"train_loss": -10.981233596801758, "global_step": 17265, "epoch": 142} {"train_loss": -25.808135986328125, "global_step": 17266, "epoch": 142} {"train_loss": -17.52310562133789, "global_step": 17267, "epoch": 142} {"train_loss": -27.12150001525879, "global_step": 17268, "epoch": 142} {"train_loss": -22.47672462463379, "global_step": 17269, "epoch": 142} {"train_loss": -24.761295318603516, "global_step": 17270, "epoch": 142} {"train_loss": -27.95157241821289, "global_step": 17271, "epoch": 142} {"train_loss": -26.832965850830078, "global_step": 17272, "epoch": 142} {"train_loss": -25.78713035583496, "global_step": 17273, "epoch": 142} {"train_loss": -25.859619140625, "global_step": 17274, "epoch": 142} {"train_loss": -26.866342544555664, "global_step": 17275, "epoch": 142} {"train_loss": -27.595327377319336, "global_step": 17276, "epoch": 142} {"train_loss": -27.206045150756836, "global_step": 17277, "epoch": 142} {"train_loss": -26.758136749267578, "global_step": 17278, "epoch": 142} {"train_loss": -26.297529220581055, "global_step": 17279, "epoch": 142} {"train_loss": -26.668989181518555, "global_step": 17280, "epoch": 142} {"train_loss": -27.061370849609375, "global_step": 17281, "epoch": 142} {"train_loss": -26.871387481689453, "global_step": 17282, "epoch": 142} {"train_loss": -27.54475212097168, "global_step": 17283, "epoch": 142} {"train_loss": -27.171405792236328, "global_step": 17284, "epoch": 142} {"train_loss": -26.648517608642578, "global_step": 17285, "epoch": 142} {"train_loss": -27.626785278320312, "global_step": 17286, "epoch": 142} {"train_loss": -27.570188522338867, "global_step": 17287, "epoch": 142} {"train_loss": -27.40829849243164, "global_step": 17288, "epoch": 142} {"train_loss": -27.1114444732666, "global_step": 17289, "epoch": 142} {"train_loss": -25.976337432861328, "global_step": 17290, "epoch": 142} {"train_loss": -27.049335479736328, "global_step": 17291, "epoch": 142} {"train_loss": -26.88404655456543, "global_step": 17292, "epoch": 142} {"train_loss": -26.103561401367188, "global_step": 17293, "epoch": 142} {"train_loss": -27.73687171936035, "global_step": 17294, "epoch": 142} {"train_loss": -26.540128707885742, "global_step": 17295, "epoch": 142} {"train_loss": -27.893274307250977, "global_step": 17296, "epoch": 142} {"train_loss": -27.175674438476562, "global_step": 17297, "epoch": 142} {"train_loss": -27.592695236206055, "global_step": 17298, "epoch": 142} {"train_loss": -27.678159713745117, "global_step": 17299, "epoch": 142} {"train_loss": -27.583637237548828, "global_step": 17300, "epoch": 142} {"train_loss": -27.827390670776367, "global_step": 17301, "epoch": 142} {"train_loss": -27.048069268218743, "global_step": 17302, "epoch": 142, "val_loss": 2534326.75} {"train_loss": -27.989410400390625, "global_step": 17303, "epoch": 143} {"train_loss": -27.833663940429688, "global_step": 17304, "epoch": 143} {"train_loss": -27.509902954101562, "global_step": 17305, "epoch": 143} {"train_loss": -27.4186954498291, "global_step": 17306, "epoch": 143} {"train_loss": -27.465930938720703, "global_step": 17307, "epoch": 143} {"train_loss": -27.387939453125, "global_step": 17308, "epoch": 143} {"train_loss": -27.135400772094727, "global_step": 17309, "epoch": 143} {"train_loss": -26.792835235595703, "global_step": 17310, "epoch": 143} {"train_loss": -27.749929428100586, "global_step": 17311, "epoch": 143} {"train_loss": -26.51466178894043, "global_step": 17312, "epoch": 143} {"train_loss": -27.008991241455078, "global_step": 17313, "epoch": 143} {"train_loss": -27.262128829956055, "global_step": 17314, "epoch": 143} {"train_loss": -27.322412490844727, "global_step": 17315, "epoch": 143} {"train_loss": -24.907020568847656, "global_step": 17316, "epoch": 143} {"train_loss": -15.074701309204102, "global_step": 17317, "epoch": 143} {"train_loss": 26.133682250976562, "global_step": 17318, "epoch": 143} {"train_loss": 14.636542320251465, "global_step": 17319, "epoch": 143} {"train_loss": -20.562772750854492, "global_step": 17320, "epoch": 143} {"train_loss": -20.001480102539062, "global_step": 17321, "epoch": 143} {"train_loss": -11.377532005310059, "global_step": 17322, "epoch": 143} {"train_loss": -22.099090576171875, "global_step": 17323, "epoch": 143} {"train_loss": -25.151138305664062, "global_step": 17324, "epoch": 143} {"train_loss": -23.710220336914062, "global_step": 17325, "epoch": 143} {"train_loss": -21.739038467407227, "global_step": 17326, "epoch": 143} {"train_loss": -21.9013614654541, "global_step": 17327, "epoch": 143} {"train_loss": -22.963367462158203, "global_step": 17328, "epoch": 143} {"train_loss": -23.646728515625, "global_step": 17329, "epoch": 143} {"train_loss": -24.82682228088379, "global_step": 17330, "epoch": 143} {"train_loss": -25.385419845581055, "global_step": 17331, "epoch": 143} {"train_loss": -25.359718322753906, "global_step": 17332, "epoch": 143} {"train_loss": -25.857574462890625, "global_step": 17333, "epoch": 143} {"train_loss": -24.737668991088867, "global_step": 17334, "epoch": 143} {"train_loss": -24.79939842224121, "global_step": 17335, "epoch": 143} {"train_loss": -24.857343673706055, "global_step": 17336, "epoch": 143} {"train_loss": -24.871877670288086, "global_step": 17337, "epoch": 143} {"train_loss": -25.317087173461914, "global_step": 17338, "epoch": 143} {"train_loss": -25.044160842895508, "global_step": 17339, "epoch": 143} {"train_loss": -25.16023826599121, "global_step": 17340, "epoch": 143} {"train_loss": -25.046390533447266, "global_step": 17341, "epoch": 143} {"train_loss": -25.138748168945312, "global_step": 17342, "epoch": 143} {"train_loss": -25.45380973815918, "global_step": 17343, "epoch": 143} {"train_loss": -25.242406845092773, "global_step": 17344, "epoch": 143} {"train_loss": -25.221311569213867, "global_step": 17345, "epoch": 143} {"train_loss": -25.937393188476562, "global_step": 17346, "epoch": 143} {"train_loss": -25.725509643554688, "global_step": 17347, "epoch": 143} {"train_loss": -26.007471084594727, "global_step": 17348, "epoch": 143} {"train_loss": -26.565093994140625, "global_step": 17349, "epoch": 143} {"train_loss": -26.19656753540039, "global_step": 17350, "epoch": 143} {"train_loss": -26.361371994018555, "global_step": 17351, "epoch": 143} {"train_loss": -26.580554962158203, "global_step": 17352, "epoch": 143} {"train_loss": -26.434925079345703, "global_step": 17353, "epoch": 143} {"train_loss": -26.051313400268555, "global_step": 17354, "epoch": 143} {"train_loss": -26.613645553588867, "global_step": 17355, "epoch": 143} {"train_loss": -26.2453556060791, "global_step": 17356, "epoch": 143} {"train_loss": -26.723819732666016, "global_step": 17357, "epoch": 143} {"train_loss": -26.7502498626709, "global_step": 17358, "epoch": 143} {"train_loss": -26.807050704956055, "global_step": 17359, "epoch": 143} {"train_loss": -26.57905387878418, "global_step": 17360, "epoch": 143} {"train_loss": -26.423852920532227, "global_step": 17361, "epoch": 143} {"train_loss": -26.674779891967773, "global_step": 17362, "epoch": 143} {"train_loss": -26.62872314453125, "global_step": 17363, "epoch": 143} {"train_loss": -26.854827880859375, "global_step": 17364, "epoch": 143} {"train_loss": -26.856332778930664, "global_step": 17365, "epoch": 143} {"train_loss": -27.008075714111328, "global_step": 17366, "epoch": 143} {"train_loss": -26.42078971862793, "global_step": 17367, "epoch": 143} {"train_loss": -26.889760971069336, "global_step": 17368, "epoch": 143} {"train_loss": -26.70354652404785, "global_step": 17369, "epoch": 143} {"train_loss": -26.057891845703125, "global_step": 17370, "epoch": 143} {"train_loss": -25.09381103515625, "global_step": 17371, "epoch": 143} {"train_loss": -26.3990421295166, "global_step": 17372, "epoch": 143} {"train_loss": -26.19523048400879, "global_step": 17373, "epoch": 143} {"train_loss": -26.497467041015625, "global_step": 17374, "epoch": 143} {"train_loss": -26.630319595336914, "global_step": 17375, "epoch": 143} {"train_loss": -26.17535400390625, "global_step": 17376, "epoch": 143} {"train_loss": -25.830371856689453, "global_step": 17377, "epoch": 143} {"train_loss": -25.774307250976562, "global_step": 17378, "epoch": 143} {"train_loss": -26.16412353515625, "global_step": 17379, "epoch": 143} {"train_loss": -26.252552032470703, "global_step": 17380, "epoch": 143} {"train_loss": -26.070642471313477, "global_step": 17381, "epoch": 143} {"train_loss": -26.811267852783203, "global_step": 17382, "epoch": 143} {"train_loss": -26.103246688842773, "global_step": 17383, "epoch": 143} {"train_loss": -26.421051025390625, "global_step": 17384, "epoch": 143} {"train_loss": -26.0654354095459, "global_step": 17385, "epoch": 143} {"train_loss": -26.788461685180664, "global_step": 17386, "epoch": 143} {"train_loss": -26.289020538330078, "global_step": 17387, "epoch": 143} {"train_loss": -27.030139923095703, "global_step": 17388, "epoch": 143} {"train_loss": -26.258686065673828, "global_step": 17389, "epoch": 143} {"train_loss": -24.141094207763672, "global_step": 17390, "epoch": 143} {"train_loss": -21.77555274963379, "global_step": 17391, "epoch": 143} {"train_loss": -21.882492065429688, "global_step": 17392, "epoch": 143} {"train_loss": -26.061304092407227, "global_step": 17393, "epoch": 143} {"train_loss": -25.111682891845703, "global_step": 17394, "epoch": 143} {"train_loss": -24.68321990966797, "global_step": 17395, "epoch": 143} {"train_loss": -26.6254825592041, "global_step": 17396, "epoch": 143} {"train_loss": -25.402353286743164, "global_step": 17397, "epoch": 143} {"train_loss": -25.732715606689453, "global_step": 17398, "epoch": 143} {"train_loss": -25.98138999938965, "global_step": 17399, "epoch": 143} {"train_loss": -25.4824275970459, "global_step": 17400, "epoch": 143} {"train_loss": -25.636877059936523, "global_step": 17401, "epoch": 143} {"train_loss": -25.777042388916016, "global_step": 17402, "epoch": 143} {"train_loss": -26.552148818969727, "global_step": 17403, "epoch": 143} {"train_loss": -26.299161911010742, "global_step": 17404, "epoch": 143} {"train_loss": -25.964324951171875, "global_step": 17405, "epoch": 143} {"train_loss": -26.144147872924805, "global_step": 17406, "epoch": 143} {"train_loss": -26.383493423461914, "global_step": 17407, "epoch": 143} {"train_loss": -26.754674911499023, "global_step": 17408, "epoch": 143} {"train_loss": -26.472970962524414, "global_step": 17409, "epoch": 143} {"train_loss": -26.394943237304688, "global_step": 17410, "epoch": 143} {"train_loss": -26.2198429107666, "global_step": 17411, "epoch": 143} {"train_loss": -26.835723876953125, "global_step": 17412, "epoch": 143} {"train_loss": -25.81264305114746, "global_step": 17413, "epoch": 143} {"train_loss": -26.807538986206055, "global_step": 17414, "epoch": 143} {"train_loss": -26.32958984375, "global_step": 17415, "epoch": 143} {"train_loss": -26.95648765563965, "global_step": 17416, "epoch": 143} {"train_loss": -26.527631759643555, "global_step": 17417, "epoch": 143} {"train_loss": -26.678546905517578, "global_step": 17418, "epoch": 143} {"train_loss": -26.68267250061035, "global_step": 17419, "epoch": 143} {"train_loss": -27.044538497924805, "global_step": 17420, "epoch": 143} {"train_loss": -26.706268310546875, "global_step": 17421, "epoch": 143} {"train_loss": -26.782093048095703, "global_step": 17422, "epoch": 143} {"train_loss": -24.896902415378033, "global_step": 17423, "epoch": 143, "val_loss": 2624023.75} {"train_loss": -27.060827255249023, "global_step": 17424, "epoch": 144} {"train_loss": -27.1093692779541, "global_step": 17425, "epoch": 144} {"train_loss": -27.104724884033203, "global_step": 17426, "epoch": 144} {"train_loss": -26.710432052612305, "global_step": 17427, "epoch": 144} {"train_loss": -27.062414169311523, "global_step": 17428, "epoch": 144} {"train_loss": -27.217666625976562, "global_step": 17429, "epoch": 144} {"train_loss": -27.03864097595215, "global_step": 17430, "epoch": 144} {"train_loss": -27.154071807861328, "global_step": 17431, "epoch": 144} {"train_loss": -27.117542266845703, "global_step": 17432, "epoch": 144} {"train_loss": -26.870990753173828, "global_step": 17433, "epoch": 144} {"train_loss": -27.68619728088379, "global_step": 17434, "epoch": 144} {"train_loss": -27.114049911499023, "global_step": 17435, "epoch": 144} {"train_loss": -27.26771354675293, "global_step": 17436, "epoch": 144} {"train_loss": -27.27399253845215, "global_step": 17437, "epoch": 144} {"train_loss": -27.305341720581055, "global_step": 17438, "epoch": 144} {"train_loss": -27.013065338134766, "global_step": 17439, "epoch": 144} {"train_loss": -27.576276779174805, "global_step": 17440, "epoch": 144} {"train_loss": -27.384017944335938, "global_step": 17441, "epoch": 144} {"train_loss": -27.539281845092773, "global_step": 17442, "epoch": 144} {"train_loss": -27.404951095581055, "global_step": 17443, "epoch": 144} {"train_loss": -27.611536026000977, "global_step": 17444, "epoch": 144} {"train_loss": -26.775482177734375, "global_step": 17445, "epoch": 144} {"train_loss": -26.831602096557617, "global_step": 17446, "epoch": 144} {"train_loss": -27.270965576171875, "global_step": 17447, "epoch": 144} {"train_loss": -27.303394317626953, "global_step": 17448, "epoch": 144} {"train_loss": -27.282184600830078, "global_step": 17449, "epoch": 144} {"train_loss": -27.135757446289062, "global_step": 17450, "epoch": 144} {"train_loss": -27.540075302124023, "global_step": 17451, "epoch": 144} {"train_loss": -26.371252059936523, "global_step": 17452, "epoch": 144} {"train_loss": -27.34051513671875, "global_step": 17453, "epoch": 144} {"train_loss": -26.597930908203125, "global_step": 17454, "epoch": 144} {"train_loss": -27.390522003173828, "global_step": 17455, "epoch": 144} {"train_loss": -26.694910049438477, "global_step": 17456, "epoch": 144} {"train_loss": -27.07697105407715, "global_step": 17457, "epoch": 144} {"train_loss": -27.777606964111328, "global_step": 17458, "epoch": 144} {"train_loss": -26.517919540405273, "global_step": 17459, "epoch": 144} {"train_loss": -27.492084503173828, "global_step": 17460, "epoch": 144} {"train_loss": -27.50446128845215, "global_step": 17461, "epoch": 144} {"train_loss": -27.611474990844727, "global_step": 17462, "epoch": 144} {"train_loss": -27.70062828063965, "global_step": 17463, "epoch": 144} {"train_loss": -27.67181968688965, "global_step": 17464, "epoch": 144} {"train_loss": -27.311145782470703, "global_step": 17465, "epoch": 144} {"train_loss": -27.435546875, "global_step": 17466, "epoch": 144} {"train_loss": -27.478811264038086, "global_step": 17467, "epoch": 144} {"train_loss": -27.384357452392578, "global_step": 17468, "epoch": 144} {"train_loss": -27.056777954101562, "global_step": 17469, "epoch": 144} {"train_loss": -26.459142684936523, "global_step": 17470, "epoch": 144} {"train_loss": -27.720245361328125, "global_step": 17471, "epoch": 144} {"train_loss": -27.43610954284668, "global_step": 17472, "epoch": 144} {"train_loss": -27.174041748046875, "global_step": 17473, "epoch": 144} {"train_loss": -27.01204490661621, "global_step": 17474, "epoch": 144} {"train_loss": -27.872879028320312, "global_step": 17475, "epoch": 144} {"train_loss": -27.505111694335938, "global_step": 17476, "epoch": 144} {"train_loss": -26.477970123291016, "global_step": 17477, "epoch": 144} {"train_loss": -27.876081466674805, "global_step": 17478, "epoch": 144} {"train_loss": -27.484655380249023, "global_step": 17479, "epoch": 144} {"train_loss": -27.660125732421875, "global_step": 17480, "epoch": 144} {"train_loss": -28.08168601989746, "global_step": 17481, "epoch": 144} {"train_loss": -27.274160385131836, "global_step": 17482, "epoch": 144} {"train_loss": -28.113950729370117, "global_step": 17483, "epoch": 144} {"train_loss": -27.773141860961914, "global_step": 17484, "epoch": 144} {"train_loss": -27.62442970275879, "global_step": 17485, "epoch": 144} {"train_loss": -28.165674209594727, "global_step": 17486, "epoch": 144} {"train_loss": -27.86592674255371, "global_step": 17487, "epoch": 144} {"train_loss": -28.55927085876465, "global_step": 17488, "epoch": 144} {"train_loss": -28.138565063476562, "global_step": 17489, "epoch": 144} {"train_loss": -27.92864990234375, "global_step": 17490, "epoch": 144} {"train_loss": -27.977436065673828, "global_step": 17491, "epoch": 144} {"train_loss": -27.28403663635254, "global_step": 17492, "epoch": 144} {"train_loss": -27.478851318359375, "global_step": 17493, "epoch": 144} {"train_loss": -27.808996200561523, "global_step": 17494, "epoch": 144} {"train_loss": -28.17645835876465, "global_step": 17495, "epoch": 144} {"train_loss": -27.865407943725586, "global_step": 17496, "epoch": 144} {"train_loss": -27.991241455078125, "global_step": 17497, "epoch": 144} {"train_loss": -26.649158477783203, "global_step": 17498, "epoch": 144} {"train_loss": -24.81141471862793, "global_step": 17499, "epoch": 144} {"train_loss": -23.0931339263916, "global_step": 17500, "epoch": 144} {"train_loss": -25.55496597290039, "global_step": 17501, "epoch": 144} {"train_loss": -26.939945220947266, "global_step": 17502, "epoch": 144} {"train_loss": -26.814985275268555, "global_step": 17503, "epoch": 144} {"train_loss": -24.083162307739258, "global_step": 17504, "epoch": 144} {"train_loss": -25.581689834594727, "global_step": 17505, "epoch": 144} {"train_loss": -25.240217208862305, "global_step": 17506, "epoch": 144} {"train_loss": -26.12778663635254, "global_step": 17507, "epoch": 144} {"train_loss": -24.966033935546875, "global_step": 17508, "epoch": 144} {"train_loss": -26.62116813659668, "global_step": 17509, "epoch": 144} {"train_loss": -26.362274169921875, "global_step": 17510, "epoch": 144} {"train_loss": -26.521072387695312, "global_step": 17511, "epoch": 144} {"train_loss": -25.979694366455078, "global_step": 17512, "epoch": 144} {"train_loss": -26.33203125, "global_step": 17513, "epoch": 144} {"train_loss": -26.724817276000977, "global_step": 17514, "epoch": 144} {"train_loss": -26.950397491455078, "global_step": 17515, "epoch": 144} {"train_loss": -27.20503807067871, "global_step": 17516, "epoch": 144} {"train_loss": -27.091135025024414, "global_step": 17517, "epoch": 144} {"train_loss": -26.819284439086914, "global_step": 17518, "epoch": 144} {"train_loss": -27.16285514831543, "global_step": 17519, "epoch": 144} {"train_loss": -26.70142936706543, "global_step": 17520, "epoch": 144} {"train_loss": -26.994861602783203, "global_step": 17521, "epoch": 144} {"train_loss": -26.894102096557617, "global_step": 17522, "epoch": 144} {"train_loss": -26.559192657470703, "global_step": 17523, "epoch": 144} {"train_loss": -26.902719497680664, "global_step": 17524, "epoch": 144} {"train_loss": -27.0602970123291, "global_step": 17525, "epoch": 144} {"train_loss": -27.877826690673828, "global_step": 17526, "epoch": 144} {"train_loss": -27.621557235717773, "global_step": 17527, "epoch": 144} {"train_loss": -27.2476863861084, "global_step": 17528, "epoch": 144} {"train_loss": -27.34173011779785, "global_step": 17529, "epoch": 144} {"train_loss": -27.623952865600586, "global_step": 17530, "epoch": 144} {"train_loss": -27.48316764831543, "global_step": 17531, "epoch": 144} {"train_loss": -27.25530433654785, "global_step": 17532, "epoch": 144} {"train_loss": -27.4100341796875, "global_step": 17533, "epoch": 144} {"train_loss": -27.27882194519043, "global_step": 17534, "epoch": 144} {"train_loss": -27.25412368774414, "global_step": 17535, "epoch": 144} {"train_loss": -27.5050106048584, "global_step": 17536, "epoch": 144} {"train_loss": -26.999500274658203, "global_step": 17537, "epoch": 144} {"train_loss": -27.833784103393555, "global_step": 17538, "epoch": 144} {"train_loss": -27.379331588745117, "global_step": 17539, "epoch": 144} {"train_loss": -27.85137939453125, "global_step": 17540, "epoch": 144} {"train_loss": -27.776147842407227, "global_step": 17541, "epoch": 144} {"train_loss": -27.627079010009766, "global_step": 17542, "epoch": 144} {"train_loss": -27.97535514831543, "global_step": 17543, "epoch": 144} {"train_loss": -27.144410267349116, "global_step": 17544, "epoch": 144, "val_loss": 2431793.75} {"train_loss": -27.797595977783203, "global_step": 17545, "epoch": 145} {"train_loss": -27.68398094177246, "global_step": 17546, "epoch": 145} {"train_loss": -27.50125503540039, "global_step": 17547, "epoch": 145} {"train_loss": -28.02789306640625, "global_step": 17548, "epoch": 145} {"train_loss": -27.79642105102539, "global_step": 17549, "epoch": 145} {"train_loss": -27.914493560791016, "global_step": 17550, "epoch": 145} {"train_loss": -27.848560333251953, "global_step": 17551, "epoch": 145} {"train_loss": -27.927289962768555, "global_step": 17552, "epoch": 145} {"train_loss": -27.920515060424805, "global_step": 17553, "epoch": 145} {"train_loss": -28.017202377319336, "global_step": 17554, "epoch": 145} {"train_loss": -28.382925033569336, "global_step": 17555, "epoch": 145} {"train_loss": -28.25714683532715, "global_step": 17556, "epoch": 145} {"train_loss": -28.192651748657227, "global_step": 17557, "epoch": 145} {"train_loss": -27.816043853759766, "global_step": 17558, "epoch": 145} {"train_loss": -28.42620277404785, "global_step": 17559, "epoch": 145} {"train_loss": -28.129261016845703, "global_step": 17560, "epoch": 145} {"train_loss": -28.299335479736328, "global_step": 17561, "epoch": 145} {"train_loss": -27.96681022644043, "global_step": 17562, "epoch": 145} {"train_loss": -27.664661407470703, "global_step": 17563, "epoch": 145} {"train_loss": -27.9091796875, "global_step": 17564, "epoch": 145} {"train_loss": -27.112348556518555, "global_step": 17565, "epoch": 145} {"train_loss": -26.927579879760742, "global_step": 17566, "epoch": 145} {"train_loss": -28.37176513671875, "global_step": 17567, "epoch": 145} {"train_loss": -27.822500228881836, "global_step": 17568, "epoch": 145} {"train_loss": -27.340606689453125, "global_step": 17569, "epoch": 145} {"train_loss": -28.15402603149414, "global_step": 17570, "epoch": 145} {"train_loss": -27.368515014648438, "global_step": 17571, "epoch": 145} {"train_loss": -27.9229793548584, "global_step": 17572, "epoch": 145} {"train_loss": -28.004308700561523, "global_step": 17573, "epoch": 145} {"train_loss": -28.307905197143555, "global_step": 17574, "epoch": 145} {"train_loss": -27.25872802734375, "global_step": 17575, "epoch": 145} {"train_loss": -25.728683471679688, "global_step": 17576, "epoch": 145} {"train_loss": -27.519216537475586, "global_step": 17577, "epoch": 145} {"train_loss": -27.888153076171875, "global_step": 17578, "epoch": 145} {"train_loss": -27.740442276000977, "global_step": 17579, "epoch": 145} {"train_loss": -27.425878524780273, "global_step": 17580, "epoch": 145} {"train_loss": -27.551050186157227, "global_step": 17581, "epoch": 145} {"train_loss": -27.8575439453125, "global_step": 17582, "epoch": 145} {"train_loss": -28.209745407104492, "global_step": 17583, "epoch": 145} {"train_loss": -27.740509033203125, "global_step": 17584, "epoch": 145} {"train_loss": -26.666364669799805, "global_step": 17585, "epoch": 145} {"train_loss": -27.680395126342773, "global_step": 17586, "epoch": 145} {"train_loss": -27.858808517456055, "global_step": 17587, "epoch": 145} {"train_loss": -27.41684913635254, "global_step": 17588, "epoch": 145} {"train_loss": -27.390338897705078, "global_step": 17589, "epoch": 145} {"train_loss": -27.571369171142578, "global_step": 17590, "epoch": 145} {"train_loss": -27.077573776245117, "global_step": 17591, "epoch": 145} {"train_loss": -27.062885284423828, "global_step": 17592, "epoch": 145} {"train_loss": -28.36459732055664, "global_step": 17593, "epoch": 145} {"train_loss": -27.3757381439209, "global_step": 17594, "epoch": 145} {"train_loss": -27.734588623046875, "global_step": 17595, "epoch": 145} {"train_loss": -28.148523330688477, "global_step": 17596, "epoch": 145} {"train_loss": -27.808307647705078, "global_step": 17597, "epoch": 145} {"train_loss": -28.161396026611328, "global_step": 17598, "epoch": 145} {"train_loss": -28.115381240844727, "global_step": 17599, "epoch": 145} {"train_loss": -27.938825607299805, "global_step": 17600, "epoch": 145} {"train_loss": -28.522287368774414, "global_step": 17601, "epoch": 145} {"train_loss": -27.8609619140625, "global_step": 17602, "epoch": 145} {"train_loss": -28.289331436157227, "global_step": 17603, "epoch": 145} {"train_loss": -28.19580078125, "global_step": 17604, "epoch": 145} {"train_loss": -28.48065185546875, "global_step": 17605, "epoch": 145} {"train_loss": -28.71394157409668, "global_step": 17606, "epoch": 145} {"train_loss": -28.350555419921875, "global_step": 17607, "epoch": 145} {"train_loss": -28.596267700195312, "global_step": 17608, "epoch": 145} {"train_loss": -28.389490127563477, "global_step": 17609, "epoch": 145} {"train_loss": -28.4349308013916, "global_step": 17610, "epoch": 145} {"train_loss": -28.221466064453125, "global_step": 17611, "epoch": 145} {"train_loss": -28.133209228515625, "global_step": 17612, "epoch": 145} {"train_loss": -27.9932918548584, "global_step": 17613, "epoch": 145} {"train_loss": -26.813993453979492, "global_step": 17614, "epoch": 145} {"train_loss": -25.893712997436523, "global_step": 17615, "epoch": 145} {"train_loss": -25.123668670654297, "global_step": 17616, "epoch": 145} {"train_loss": -25.867929458618164, "global_step": 17617, "epoch": 145} {"train_loss": -28.800474166870117, "global_step": 17618, "epoch": 145} {"train_loss": -26.990222930908203, "global_step": 17619, "epoch": 145} {"train_loss": -26.666828155517578, "global_step": 17620, "epoch": 145} {"train_loss": -28.5164794921875, "global_step": 17621, "epoch": 145} {"train_loss": -27.11846351623535, "global_step": 17622, "epoch": 145} {"train_loss": -28.357776641845703, "global_step": 17623, "epoch": 145} {"train_loss": -27.79542350769043, "global_step": 17624, "epoch": 145} {"train_loss": -27.676610946655273, "global_step": 17625, "epoch": 145} {"train_loss": -27.75274658203125, "global_step": 17626, "epoch": 145} {"train_loss": -28.065961837768555, "global_step": 17627, "epoch": 145} {"train_loss": -26.599287033081055, "global_step": 17628, "epoch": 145} {"train_loss": -28.464584350585938, "global_step": 17629, "epoch": 145} {"train_loss": -27.376657485961914, "global_step": 17630, "epoch": 145} {"train_loss": -28.79227066040039, "global_step": 17631, "epoch": 145} {"train_loss": -28.127965927124023, "global_step": 17632, "epoch": 145} {"train_loss": -28.022693634033203, "global_step": 17633, "epoch": 145} {"train_loss": -28.303197860717773, "global_step": 17634, "epoch": 145} {"train_loss": -27.805282592773438, "global_step": 17635, "epoch": 145} {"train_loss": -28.468626022338867, "global_step": 17636, "epoch": 145} {"train_loss": -28.531890869140625, "global_step": 17637, "epoch": 145} {"train_loss": -28.607751846313477, "global_step": 17638, "epoch": 145} {"train_loss": -28.7362003326416, "global_step": 17639, "epoch": 145} {"train_loss": -28.404647827148438, "global_step": 17640, "epoch": 145} {"train_loss": -28.833093643188477, "global_step": 17641, "epoch": 145} {"train_loss": -28.523117065429688, "global_step": 17642, "epoch": 145} {"train_loss": -28.228973388671875, "global_step": 17643, "epoch": 145} {"train_loss": -28.028287887573242, "global_step": 17644, "epoch": 145} {"train_loss": -28.25592041015625, "global_step": 17645, "epoch": 145} {"train_loss": -28.084674835205078, "global_step": 17646, "epoch": 145} {"train_loss": -28.388935089111328, "global_step": 17647, "epoch": 145} {"train_loss": -28.385700225830078, "global_step": 17648, "epoch": 145} {"train_loss": -28.394102096557617, "global_step": 17649, "epoch": 145} {"train_loss": -27.8309383392334, "global_step": 17650, "epoch": 145} {"train_loss": -28.377126693725586, "global_step": 17651, "epoch": 145} {"train_loss": -27.939685821533203, "global_step": 17652, "epoch": 145} {"train_loss": -27.73768424987793, "global_step": 17653, "epoch": 145} {"train_loss": -27.862146377563477, "global_step": 17654, "epoch": 145} {"train_loss": -28.464624404907227, "global_step": 17655, "epoch": 145} {"train_loss": -28.581974029541016, "global_step": 17656, "epoch": 145} {"train_loss": -28.396270751953125, "global_step": 17657, "epoch": 145} {"train_loss": -28.67974853515625, "global_step": 17658, "epoch": 145} {"train_loss": -28.56684684753418, "global_step": 17659, "epoch": 145} {"train_loss": -28.38285255432129, "global_step": 17660, "epoch": 145} {"train_loss": -27.41754722595215, "global_step": 17661, "epoch": 145} {"train_loss": -26.406530380249023, "global_step": 17662, "epoch": 145} {"train_loss": -27.912933349609375, "global_step": 17663, "epoch": 145} {"train_loss": -28.176538467407227, "global_step": 17664, "epoch": 145} {"train_loss": -27.876017373455458, "global_step": 17665, "epoch": 145, "val_loss": 2767688.0} {"train_loss": -26.059539794921875, "global_step": 17666, "epoch": 146} {"train_loss": -27.193662643432617, "global_step": 17667, "epoch": 146} {"train_loss": -27.748809814453125, "global_step": 17668, "epoch": 146} {"train_loss": -25.92778968811035, "global_step": 17669, "epoch": 146} {"train_loss": -27.623682022094727, "global_step": 17670, "epoch": 146} {"train_loss": -28.54139518737793, "global_step": 17671, "epoch": 146} {"train_loss": -28.102075576782227, "global_step": 17672, "epoch": 146} {"train_loss": -28.666494369506836, "global_step": 17673, "epoch": 146} {"train_loss": -28.074060440063477, "global_step": 17674, "epoch": 146} {"train_loss": -28.962194442749023, "global_step": 17675, "epoch": 146} {"train_loss": -28.359180450439453, "global_step": 17676, "epoch": 146} {"train_loss": -28.6060733795166, "global_step": 17677, "epoch": 146} {"train_loss": -29.012908935546875, "global_step": 17678, "epoch": 146} {"train_loss": -28.580854415893555, "global_step": 17679, "epoch": 146} {"train_loss": -28.596466064453125, "global_step": 17680, "epoch": 146} {"train_loss": -28.506336212158203, "global_step": 17681, "epoch": 146} {"train_loss": -28.90314292907715, "global_step": 17682, "epoch": 146} {"train_loss": -28.4085636138916, "global_step": 17683, "epoch": 146} {"train_loss": -28.5235652923584, "global_step": 17684, "epoch": 146} {"train_loss": -28.466821670532227, "global_step": 17685, "epoch": 146} {"train_loss": -28.908811569213867, "global_step": 17686, "epoch": 146} {"train_loss": -28.369709014892578, "global_step": 17687, "epoch": 146} {"train_loss": -28.452524185180664, "global_step": 17688, "epoch": 146} {"train_loss": -28.724206924438477, "global_step": 17689, "epoch": 146} {"train_loss": -27.96502113342285, "global_step": 17690, "epoch": 146} {"train_loss": -28.09324073791504, "global_step": 17691, "epoch": 146} {"train_loss": -28.52327537536621, "global_step": 17692, "epoch": 146} {"train_loss": -28.853612899780273, "global_step": 17693, "epoch": 146} {"train_loss": -28.13397216796875, "global_step": 17694, "epoch": 146} {"train_loss": -28.794843673706055, "global_step": 17695, "epoch": 146} {"train_loss": -28.519256591796875, "global_step": 17696, "epoch": 146} {"train_loss": -28.638822555541992, "global_step": 17697, "epoch": 146} {"train_loss": -28.6649227142334, "global_step": 17698, "epoch": 146} {"train_loss": -28.455768585205078, "global_step": 17699, "epoch": 146} {"train_loss": -28.574506759643555, "global_step": 17700, "epoch": 146} {"train_loss": -28.852197647094727, "global_step": 17701, "epoch": 146} {"train_loss": -29.193347930908203, "global_step": 17702, "epoch": 146} {"train_loss": -28.721521377563477, "global_step": 17703, "epoch": 146} {"train_loss": -28.180683135986328, "global_step": 17704, "epoch": 146} {"train_loss": -28.923017501831055, "global_step": 17705, "epoch": 146} {"train_loss": -28.584081649780273, "global_step": 17706, "epoch": 146} {"train_loss": -29.118574142456055, "global_step": 17707, "epoch": 146} {"train_loss": -28.775182723999023, "global_step": 17708, "epoch": 146} {"train_loss": -28.45819091796875, "global_step": 17709, "epoch": 146} {"train_loss": -28.846363067626953, "global_step": 17710, "epoch": 146} {"train_loss": -28.432424545288086, "global_step": 17711, "epoch": 146} {"train_loss": -26.40411949157715, "global_step": 17712, "epoch": 146} {"train_loss": -24.116710662841797, "global_step": 17713, "epoch": 146} {"train_loss": -19.411558151245117, "global_step": 17714, "epoch": 146} {"train_loss": -20.321395874023438, "global_step": 17715, "epoch": 146} {"train_loss": -28.292388916015625, "global_step": 17716, "epoch": 146} {"train_loss": -24.01725959777832, "global_step": 17717, "epoch": 146} {"train_loss": -28.001449584960938, "global_step": 17718, "epoch": 146} {"train_loss": -24.918643951416016, "global_step": 17719, "epoch": 146} {"train_loss": -27.779172897338867, "global_step": 17720, "epoch": 146} {"train_loss": -26.82989501953125, "global_step": 17721, "epoch": 146} {"train_loss": -26.223011016845703, "global_step": 17722, "epoch": 146} {"train_loss": -28.002161026000977, "global_step": 17723, "epoch": 146} {"train_loss": -28.09720230102539, "global_step": 17724, "epoch": 146} {"train_loss": -26.931427001953125, "global_step": 17725, "epoch": 146} {"train_loss": -27.362592697143555, "global_step": 17726, "epoch": 146} {"train_loss": -27.68776512145996, "global_step": 17727, "epoch": 146} {"train_loss": -28.39922523498535, "global_step": 17728, "epoch": 146} {"train_loss": -27.685522079467773, "global_step": 17729, "epoch": 146} {"train_loss": -27.390613555908203, "global_step": 17730, "epoch": 146} {"train_loss": -27.65520668029785, "global_step": 17731, "epoch": 146} {"train_loss": -27.733198165893555, "global_step": 17732, "epoch": 146} {"train_loss": -27.88532066345215, "global_step": 17733, "epoch": 146} {"train_loss": -27.62183952331543, "global_step": 17734, "epoch": 146} {"train_loss": -27.987232208251953, "global_step": 17735, "epoch": 146} {"train_loss": -27.823049545288086, "global_step": 17736, "epoch": 146} {"train_loss": -27.971179962158203, "global_step": 17737, "epoch": 146} {"train_loss": -27.724750518798828, "global_step": 17738, "epoch": 146} {"train_loss": -27.039331436157227, "global_step": 17739, "epoch": 146} {"train_loss": -27.589323043823242, "global_step": 17740, "epoch": 146} {"train_loss": -28.041120529174805, "global_step": 17741, "epoch": 146} {"train_loss": -27.9758358001709, "global_step": 17742, "epoch": 146} {"train_loss": -27.740707397460938, "global_step": 17743, "epoch": 146} {"train_loss": -27.40286636352539, "global_step": 17744, "epoch": 146} {"train_loss": -26.314380645751953, "global_step": 17745, "epoch": 146} {"train_loss": -25.555028915405273, "global_step": 17746, "epoch": 146} {"train_loss": -25.355493545532227, "global_step": 17747, "epoch": 146} {"train_loss": -26.131519317626953, "global_step": 17748, "epoch": 146} {"train_loss": -28.082000732421875, "global_step": 17749, "epoch": 146} {"train_loss": -26.403461456298828, "global_step": 17750, "epoch": 146} {"train_loss": -27.454111099243164, "global_step": 17751, "epoch": 146} {"train_loss": -27.381088256835938, "global_step": 17752, "epoch": 146} {"train_loss": -27.050668716430664, "global_step": 17753, "epoch": 146} {"train_loss": -27.891071319580078, "global_step": 17754, "epoch": 146} {"train_loss": -27.633438110351562, "global_step": 17755, "epoch": 146} {"train_loss": -28.189350128173828, "global_step": 17756, "epoch": 146} {"train_loss": -27.720571517944336, "global_step": 17757, "epoch": 146} {"train_loss": -27.942874908447266, "global_step": 17758, "epoch": 146} {"train_loss": -27.7115478515625, "global_step": 17759, "epoch": 146} {"train_loss": -27.814661026000977, "global_step": 17760, "epoch": 146} {"train_loss": -27.83534049987793, "global_step": 17761, "epoch": 146} {"train_loss": -27.50796890258789, "global_step": 17762, "epoch": 146} {"train_loss": -28.34431266784668, "global_step": 17763, "epoch": 146} {"train_loss": -27.884225845336914, "global_step": 17764, "epoch": 146} {"train_loss": -28.03864097595215, "global_step": 17765, "epoch": 146} {"train_loss": -28.314701080322266, "global_step": 17766, "epoch": 146} {"train_loss": -27.848413467407227, "global_step": 17767, "epoch": 146} {"train_loss": -28.14170265197754, "global_step": 17768, "epoch": 146} {"train_loss": -28.583642959594727, "global_step": 17769, "epoch": 146} {"train_loss": -28.259801864624023, "global_step": 17770, "epoch": 146} {"train_loss": -28.10089683532715, "global_step": 17771, "epoch": 146} {"train_loss": -28.23642921447754, "global_step": 17772, "epoch": 146} {"train_loss": -28.301427841186523, "global_step": 17773, "epoch": 146} {"train_loss": -28.0916748046875, "global_step": 17774, "epoch": 146} {"train_loss": -27.957178115844727, "global_step": 17775, "epoch": 146} {"train_loss": -28.347583770751953, "global_step": 17776, "epoch": 146} {"train_loss": -27.8010311126709, "global_step": 17777, "epoch": 146} {"train_loss": -25.867223739624023, "global_step": 17778, "epoch": 146} {"train_loss": -25.82777214050293, "global_step": 17779, "epoch": 146} {"train_loss": -27.222578048706055, "global_step": 17780, "epoch": 146} {"train_loss": -27.30536460876465, "global_step": 17781, "epoch": 146} {"train_loss": -27.077009201049805, "global_step": 17782, "epoch": 146} {"train_loss": -27.61431312561035, "global_step": 17783, "epoch": 146} {"train_loss": -27.35910415649414, "global_step": 17784, "epoch": 146} {"train_loss": -27.52703285217285, "global_step": 17785, "epoch": 146} {"train_loss": -27.676455505623306, "global_step": 17786, "epoch": 146, "val_loss": 2494511.25} {"train_loss": -27.94037437438965, "global_step": 17787, "epoch": 147} {"train_loss": -27.502119064331055, "global_step": 17788, "epoch": 147} {"train_loss": -28.18744468688965, "global_step": 17789, "epoch": 147} {"train_loss": -27.281335830688477, "global_step": 17790, "epoch": 147} {"train_loss": -27.931644439697266, "global_step": 17791, "epoch": 147} {"train_loss": -28.337133407592773, "global_step": 17792, "epoch": 147} {"train_loss": -28.093114852905273, "global_step": 17793, "epoch": 147} {"train_loss": -27.75286865234375, "global_step": 17794, "epoch": 147} {"train_loss": -28.400861740112305, "global_step": 17795, "epoch": 147} {"train_loss": -28.4494571685791, "global_step": 17796, "epoch": 147} {"train_loss": -27.880634307861328, "global_step": 17797, "epoch": 147} {"train_loss": -28.08064079284668, "global_step": 17798, "epoch": 147} {"train_loss": -28.324966430664062, "global_step": 17799, "epoch": 147} {"train_loss": -28.624860763549805, "global_step": 17800, "epoch": 147} {"train_loss": -28.31170654296875, "global_step": 17801, "epoch": 147} {"train_loss": -27.838598251342773, "global_step": 17802, "epoch": 147} {"train_loss": -28.09026527404785, "global_step": 17803, "epoch": 147} {"train_loss": -27.795114517211914, "global_step": 17804, "epoch": 147} {"train_loss": -28.094709396362305, "global_step": 17805, "epoch": 147} {"train_loss": -28.750364303588867, "global_step": 17806, "epoch": 147} {"train_loss": -28.088651657104492, "global_step": 17807, "epoch": 147} {"train_loss": -28.269367218017578, "global_step": 17808, "epoch": 147} {"train_loss": -28.2771053314209, "global_step": 17809, "epoch": 147} {"train_loss": -28.528385162353516, "global_step": 17810, "epoch": 147} {"train_loss": -28.546035766601562, "global_step": 17811, "epoch": 147} {"train_loss": -28.807147979736328, "global_step": 17812, "epoch": 147} {"train_loss": -28.379690170288086, "global_step": 17813, "epoch": 147} {"train_loss": -28.34895133972168, "global_step": 17814, "epoch": 147} {"train_loss": -28.660022735595703, "global_step": 17815, "epoch": 147} {"train_loss": -28.88483238220215, "global_step": 17816, "epoch": 147} {"train_loss": -28.809051513671875, "global_step": 17817, "epoch": 147} {"train_loss": -28.81245231628418, "global_step": 17818, "epoch": 147} {"train_loss": -29.02996826171875, "global_step": 17819, "epoch": 147} {"train_loss": -28.74346923828125, "global_step": 17820, "epoch": 147} {"train_loss": -28.92386817932129, "global_step": 17821, "epoch": 147} {"train_loss": -28.78318214416504, "global_step": 17822, "epoch": 147} {"train_loss": -29.305112838745117, "global_step": 17823, "epoch": 147} {"train_loss": -28.750829696655273, "global_step": 17824, "epoch": 147} {"train_loss": -28.6685848236084, "global_step": 17825, "epoch": 147} {"train_loss": -28.86810302734375, "global_step": 17826, "epoch": 147} {"train_loss": -29.124364852905273, "global_step": 17827, "epoch": 147} {"train_loss": -28.994665145874023, "global_step": 17828, "epoch": 147} {"train_loss": -28.874853134155273, "global_step": 17829, "epoch": 147} {"train_loss": -28.95147705078125, "global_step": 17830, "epoch": 147} {"train_loss": -28.173959732055664, "global_step": 17831, "epoch": 147} {"train_loss": -28.216022491455078, "global_step": 17832, "epoch": 147} {"train_loss": -28.705646514892578, "global_step": 17833, "epoch": 147} {"train_loss": -29.03728675842285, "global_step": 17834, "epoch": 147} {"train_loss": -28.857364654541016, "global_step": 17835, "epoch": 147} {"train_loss": -28.820104598999023, "global_step": 17836, "epoch": 147} {"train_loss": -29.404748916625977, "global_step": 17837, "epoch": 147} {"train_loss": -28.44223403930664, "global_step": 17838, "epoch": 147} {"train_loss": -29.04718589782715, "global_step": 17839, "epoch": 147} {"train_loss": -28.3194580078125, "global_step": 17840, "epoch": 147} {"train_loss": -28.158044815063477, "global_step": 17841, "epoch": 147} {"train_loss": -27.584945678710938, "global_step": 17842, "epoch": 147} {"train_loss": -27.23322868347168, "global_step": 17843, "epoch": 147} {"train_loss": -26.819000244140625, "global_step": 17844, "epoch": 147} {"train_loss": -25.0892391204834, "global_step": 17845, "epoch": 147} {"train_loss": -25.9886474609375, "global_step": 17846, "epoch": 147} {"train_loss": -27.441303253173828, "global_step": 17847, "epoch": 147} {"train_loss": -27.020578384399414, "global_step": 17848, "epoch": 147} {"train_loss": -28.17657470703125, "global_step": 17849, "epoch": 147} {"train_loss": -28.60098648071289, "global_step": 17850, "epoch": 147} {"train_loss": -28.569324493408203, "global_step": 17851, "epoch": 147} {"train_loss": -28.80136489868164, "global_step": 17852, "epoch": 147} {"train_loss": -28.55463981628418, "global_step": 17853, "epoch": 147} {"train_loss": -28.43234634399414, "global_step": 17854, "epoch": 147} {"train_loss": -28.258649826049805, "global_step": 17855, "epoch": 147} {"train_loss": -28.300872802734375, "global_step": 17856, "epoch": 147} {"train_loss": -29.057357788085938, "global_step": 17857, "epoch": 147} {"train_loss": -28.888593673706055, "global_step": 17858, "epoch": 147} {"train_loss": -29.15774917602539, "global_step": 17859, "epoch": 147} {"train_loss": -28.99126625061035, "global_step": 17860, "epoch": 147} {"train_loss": -28.74798011779785, "global_step": 17861, "epoch": 147} {"train_loss": -28.495746612548828, "global_step": 17862, "epoch": 147} {"train_loss": -28.953882217407227, "global_step": 17863, "epoch": 147} {"train_loss": -28.431961059570312, "global_step": 17864, "epoch": 147} {"train_loss": -26.903339385986328, "global_step": 17865, "epoch": 147} {"train_loss": -28.558399200439453, "global_step": 17866, "epoch": 147} {"train_loss": -28.79665184020996, "global_step": 17867, "epoch": 147} {"train_loss": -28.79477310180664, "global_step": 17868, "epoch": 147} {"train_loss": -28.284635543823242, "global_step": 17869, "epoch": 147} {"train_loss": -28.623184204101562, "global_step": 17870, "epoch": 147} {"train_loss": -28.52204704284668, "global_step": 17871, "epoch": 147} {"train_loss": -27.4284725189209, "global_step": 17872, "epoch": 147} {"train_loss": -27.892072677612305, "global_step": 17873, "epoch": 147} {"train_loss": -28.690114974975586, "global_step": 17874, "epoch": 147} {"train_loss": -27.712955474853516, "global_step": 17875, "epoch": 147} {"train_loss": -27.876270294189453, "global_step": 17876, "epoch": 147} {"train_loss": -27.85259437561035, "global_step": 17877, "epoch": 147} {"train_loss": -26.6113224029541, "global_step": 17878, "epoch": 147} {"train_loss": -27.775821685791016, "global_step": 17879, "epoch": 147} {"train_loss": -26.581167221069336, "global_step": 17880, "epoch": 147} {"train_loss": -26.652265548706055, "global_step": 17881, "epoch": 147} {"train_loss": -28.014785766601562, "global_step": 17882, "epoch": 147} {"train_loss": -24.268369674682617, "global_step": 17883, "epoch": 147} {"train_loss": -27.17893409729004, "global_step": 17884, "epoch": 147} {"train_loss": -27.93055534362793, "global_step": 17885, "epoch": 147} {"train_loss": -27.13434410095215, "global_step": 17886, "epoch": 147} {"train_loss": -28.357330322265625, "global_step": 17887, "epoch": 147} {"train_loss": -26.878686904907227, "global_step": 17888, "epoch": 147} {"train_loss": -28.028491973876953, "global_step": 17889, "epoch": 147} {"train_loss": -27.5371036529541, "global_step": 17890, "epoch": 147} {"train_loss": -28.00785255432129, "global_step": 17891, "epoch": 147} {"train_loss": -28.10262107849121, "global_step": 17892, "epoch": 147} {"train_loss": -27.236215591430664, "global_step": 17893, "epoch": 147} {"train_loss": -28.33624267578125, "global_step": 17894, "epoch": 147} {"train_loss": -27.804931640625, "global_step": 17895, "epoch": 147} {"train_loss": -28.533950805664062, "global_step": 17896, "epoch": 147} {"train_loss": -27.56842041015625, "global_step": 17897, "epoch": 147} {"train_loss": -28.522418975830078, "global_step": 17898, "epoch": 147} {"train_loss": -27.806127548217773, "global_step": 17899, "epoch": 147} {"train_loss": -28.766498565673828, "global_step": 17900, "epoch": 147} {"train_loss": -28.144012451171875, "global_step": 17901, "epoch": 147} {"train_loss": -29.126728057861328, "global_step": 17902, "epoch": 147} {"train_loss": -28.63232421875, "global_step": 17903, "epoch": 147} {"train_loss": -28.895751953125, "global_step": 17904, "epoch": 147} {"train_loss": -28.787036895751953, "global_step": 17905, "epoch": 147} {"train_loss": -28.562591552734375, "global_step": 17906, "epoch": 147} {"train_loss": -28.199327137844623, "global_step": 17907, "epoch": 147, "val_loss": 2534870.75} {"train_loss": -28.767333984375, "global_step": 17908, "epoch": 148} {"train_loss": -28.824499130249023, "global_step": 17909, "epoch": 148} {"train_loss": -28.900678634643555, "global_step": 17910, "epoch": 148} {"train_loss": -28.732257843017578, "global_step": 17911, "epoch": 148} {"train_loss": -29.116912841796875, "global_step": 17912, "epoch": 148} {"train_loss": -28.651941299438477, "global_step": 17913, "epoch": 148} {"train_loss": -29.286441802978516, "global_step": 17914, "epoch": 148} {"train_loss": -28.722064971923828, "global_step": 17915, "epoch": 148} {"train_loss": -29.115314483642578, "global_step": 17916, "epoch": 148} {"train_loss": -28.620086669921875, "global_step": 17917, "epoch": 148} {"train_loss": -27.725116729736328, "global_step": 17918, "epoch": 148} {"train_loss": -28.84756851196289, "global_step": 17919, "epoch": 148} {"train_loss": -27.950164794921875, "global_step": 17920, "epoch": 148} {"train_loss": -28.9110050201416, "global_step": 17921, "epoch": 148} {"train_loss": -28.527997970581055, "global_step": 17922, "epoch": 148} {"train_loss": -28.416275024414062, "global_step": 17923, "epoch": 148} {"train_loss": -28.625051498413086, "global_step": 17924, "epoch": 148} {"train_loss": -28.8548641204834, "global_step": 17925, "epoch": 148} {"train_loss": -28.636280059814453, "global_step": 17926, "epoch": 148} {"train_loss": -28.52764320373535, "global_step": 17927, "epoch": 148} {"train_loss": -28.428308486938477, "global_step": 17928, "epoch": 148} {"train_loss": -28.40228271484375, "global_step": 17929, "epoch": 148} {"train_loss": -27.843297958374023, "global_step": 17930, "epoch": 148} {"train_loss": -28.38962173461914, "global_step": 17931, "epoch": 148} {"train_loss": -28.2181339263916, "global_step": 17932, "epoch": 148} {"train_loss": -28.643234252929688, "global_step": 17933, "epoch": 148} {"train_loss": -28.722150802612305, "global_step": 17934, "epoch": 148} {"train_loss": -28.96536636352539, "global_step": 17935, "epoch": 148} {"train_loss": -29.080366134643555, "global_step": 17936, "epoch": 148} {"train_loss": -28.946744918823242, "global_step": 17937, "epoch": 148} {"train_loss": -28.48590660095215, "global_step": 17938, "epoch": 148} {"train_loss": -28.9168758392334, "global_step": 17939, "epoch": 148} {"train_loss": -28.40199851989746, "global_step": 17940, "epoch": 148} {"train_loss": -29.338850021362305, "global_step": 17941, "epoch": 148} {"train_loss": -28.229490280151367, "global_step": 17942, "epoch": 148} {"train_loss": -26.994653701782227, "global_step": 17943, "epoch": 148} {"train_loss": -23.081968307495117, "global_step": 17944, "epoch": 148} {"train_loss": -15.9241943359375, "global_step": 17945, "epoch": 148} {"train_loss": -18.8699951171875, "global_step": 17946, "epoch": 148} {"train_loss": -28.972152709960938, "global_step": 17947, "epoch": 148} {"train_loss": -23.210264205932617, "global_step": 17948, "epoch": 148} {"train_loss": -28.49678611755371, "global_step": 17949, "epoch": 148} {"train_loss": -25.80376625061035, "global_step": 17950, "epoch": 148} {"train_loss": -26.874622344970703, "global_step": 17951, "epoch": 148} {"train_loss": -28.33331871032715, "global_step": 17952, "epoch": 148} {"train_loss": -27.343122482299805, "global_step": 17953, "epoch": 148} {"train_loss": -26.82437515258789, "global_step": 17954, "epoch": 148} {"train_loss": -27.658615112304688, "global_step": 17955, "epoch": 148} {"train_loss": -28.312274932861328, "global_step": 17956, "epoch": 148} {"train_loss": -28.035730361938477, "global_step": 17957, "epoch": 148} {"train_loss": -27.689619064331055, "global_step": 17958, "epoch": 148} {"train_loss": -28.119840621948242, "global_step": 17959, "epoch": 148} {"train_loss": -27.57529067993164, "global_step": 17960, "epoch": 148} {"train_loss": -28.150808334350586, "global_step": 17961, "epoch": 148} {"train_loss": -28.374835968017578, "global_step": 17962, "epoch": 148} {"train_loss": -27.5927734375, "global_step": 17963, "epoch": 148} {"train_loss": -28.273630142211914, "global_step": 17964, "epoch": 148} {"train_loss": -28.316843032836914, "global_step": 17965, "epoch": 148} {"train_loss": -27.9837646484375, "global_step": 17966, "epoch": 148} {"train_loss": -28.3179874420166, "global_step": 17967, "epoch": 148} {"train_loss": -28.382904052734375, "global_step": 17968, "epoch": 148} {"train_loss": -27.807722091674805, "global_step": 17969, "epoch": 148} {"train_loss": -27.73178482055664, "global_step": 17970, "epoch": 148} {"train_loss": -28.651538848876953, "global_step": 17971, "epoch": 148} {"train_loss": -27.950912475585938, "global_step": 17972, "epoch": 148} {"train_loss": -27.713104248046875, "global_step": 17973, "epoch": 148} {"train_loss": -28.165639877319336, "global_step": 17974, "epoch": 148} {"train_loss": -28.2132511138916, "global_step": 17975, "epoch": 148} {"train_loss": -27.996179580688477, "global_step": 17976, "epoch": 148} {"train_loss": -28.404804229736328, "global_step": 17977, "epoch": 148} {"train_loss": -28.42630386352539, "global_step": 17978, "epoch": 148} {"train_loss": -28.358701705932617, "global_step": 17979, "epoch": 148} {"train_loss": -28.245141983032227, "global_step": 17980, "epoch": 148} {"train_loss": -28.288602828979492, "global_step": 17981, "epoch": 148} {"train_loss": -27.983478546142578, "global_step": 17982, "epoch": 148} {"train_loss": -28.62323570251465, "global_step": 17983, "epoch": 148} {"train_loss": -28.667749404907227, "global_step": 17984, "epoch": 148} {"train_loss": -28.220075607299805, "global_step": 17985, "epoch": 148} {"train_loss": -28.98932456970215, "global_step": 17986, "epoch": 148} {"train_loss": -28.252883911132812, "global_step": 17987, "epoch": 148} {"train_loss": -27.537921905517578, "global_step": 17988, "epoch": 148} {"train_loss": -28.55498695373535, "global_step": 17989, "epoch": 148} {"train_loss": -28.692182540893555, "global_step": 17990, "epoch": 148} {"train_loss": -28.459716796875, "global_step": 17991, "epoch": 148} {"train_loss": -28.18239402770996, "global_step": 17992, "epoch": 148} {"train_loss": -27.9572696685791, "global_step": 17993, "epoch": 148} {"train_loss": -28.42645835876465, "global_step": 17994, "epoch": 148} {"train_loss": -27.593313217163086, "global_step": 17995, "epoch": 148} {"train_loss": -28.581205368041992, "global_step": 17996, "epoch": 148} {"train_loss": -28.37082290649414, "global_step": 17997, "epoch": 148} {"train_loss": -29.040069580078125, "global_step": 17998, "epoch": 148} {"train_loss": -28.6658878326416, "global_step": 17999, "epoch": 148} {"train_loss": -28.06043815612793, "global_step": 18000, "epoch": 148} {"train_loss": -28.741117477416992, "global_step": 18001, "epoch": 148} {"train_loss": -28.59602165222168, "global_step": 18002, "epoch": 148} {"train_loss": -28.35150146484375, "global_step": 18003, "epoch": 148} {"train_loss": -28.474462509155273, "global_step": 18004, "epoch": 148} {"train_loss": -28.33159828186035, "global_step": 18005, "epoch": 148} {"train_loss": -28.608091354370117, "global_step": 18006, "epoch": 148} {"train_loss": -27.400379180908203, "global_step": 18007, "epoch": 148} {"train_loss": -28.677906036376953, "global_step": 18008, "epoch": 148} {"train_loss": -28.167530059814453, "global_step": 18009, "epoch": 148} {"train_loss": -28.142484664916992, "global_step": 18010, "epoch": 148} {"train_loss": -28.573017120361328, "global_step": 18011, "epoch": 148} {"train_loss": -28.765823364257812, "global_step": 18012, "epoch": 148} {"train_loss": -28.270751953125, "global_step": 18013, "epoch": 148} {"train_loss": -28.8228702545166, "global_step": 18014, "epoch": 148} {"train_loss": -28.371625900268555, "global_step": 18015, "epoch": 148} {"train_loss": -28.006732940673828, "global_step": 18016, "epoch": 148} {"train_loss": -28.6549015045166, "global_step": 18017, "epoch": 148} {"train_loss": -28.786977767944336, "global_step": 18018, "epoch": 148} {"train_loss": -28.524946212768555, "global_step": 18019, "epoch": 148} {"train_loss": -28.30586051940918, "global_step": 18020, "epoch": 148} {"train_loss": -28.262968063354492, "global_step": 18021, "epoch": 148} {"train_loss": -27.169172286987305, "global_step": 18022, "epoch": 148} {"train_loss": -25.114423751831055, "global_step": 18023, "epoch": 148} {"train_loss": -16.181110382080078, "global_step": 18024, "epoch": 148} {"train_loss": 1.1214990615844727, "global_step": 18025, "epoch": 148} {"train_loss": -17.37042808532715, "global_step": 18026, "epoch": 148} {"train_loss": -23.869821548461914, "global_step": 18027, "epoch": 148} {"train_loss": -27.478253963565038, "global_step": 18028, "epoch": 148, "val_loss": 3064588.0} {"train_loss": -21.268030166625977, "global_step": 18029, "epoch": 149} {"train_loss": -25.731475830078125, "global_step": 18030, "epoch": 149} {"train_loss": -18.146099090576172, "global_step": 18031, "epoch": 149} {"train_loss": -25.750146865844727, "global_step": 18032, "epoch": 149} {"train_loss": -25.78458595275879, "global_step": 18033, "epoch": 149} {"train_loss": -24.156110763549805, "global_step": 18034, "epoch": 149} {"train_loss": -22.6983642578125, "global_step": 18035, "epoch": 149} {"train_loss": -26.183338165283203, "global_step": 18036, "epoch": 149} {"train_loss": -25.764169692993164, "global_step": 18037, "epoch": 149} {"train_loss": -26.648269653320312, "global_step": 18038, "epoch": 149} {"train_loss": -24.33832359313965, "global_step": 18039, "epoch": 149} {"train_loss": -26.095701217651367, "global_step": 18040, "epoch": 149} {"train_loss": -24.950000762939453, "global_step": 18041, "epoch": 149} {"train_loss": -26.9155216217041, "global_step": 18042, "epoch": 149} {"train_loss": -26.71759605407715, "global_step": 18043, "epoch": 149} {"train_loss": -26.829971313476562, "global_step": 18044, "epoch": 149} {"train_loss": -26.257007598876953, "global_step": 18045, "epoch": 149} {"train_loss": -26.152379989624023, "global_step": 18046, "epoch": 149} {"train_loss": -26.06862449645996, "global_step": 18047, "epoch": 149} {"train_loss": -27.1108455657959, "global_step": 18048, "epoch": 149} {"train_loss": -26.656558990478516, "global_step": 18049, "epoch": 149} {"train_loss": -27.130573272705078, "global_step": 18050, "epoch": 149} {"train_loss": -27.5549373626709, "global_step": 18051, "epoch": 149} {"train_loss": -26.74151039123535, "global_step": 18052, "epoch": 149} {"train_loss": -27.533899307250977, "global_step": 18053, "epoch": 149} {"train_loss": -27.246292114257812, "global_step": 18054, "epoch": 149} {"train_loss": -27.5429630279541, "global_step": 18055, "epoch": 149} {"train_loss": -27.58418083190918, "global_step": 18056, "epoch": 149} {"train_loss": -27.71638298034668, "global_step": 18057, "epoch": 149} {"train_loss": -27.614856719970703, "global_step": 18058, "epoch": 149} {"train_loss": -28.022748947143555, "global_step": 18059, "epoch": 149} {"train_loss": -27.6101131439209, "global_step": 18060, "epoch": 149} {"train_loss": -27.8210391998291, "global_step": 18061, "epoch": 149} {"train_loss": -27.95038414001465, "global_step": 18062, "epoch": 149} {"train_loss": -27.980026245117188, "global_step": 18063, "epoch": 149} {"train_loss": -27.766803741455078, "global_step": 18064, "epoch": 149} {"train_loss": -27.876630783081055, "global_step": 18065, "epoch": 149} {"train_loss": -28.040754318237305, "global_step": 18066, "epoch": 149} {"train_loss": -27.999958038330078, "global_step": 18067, "epoch": 149} {"train_loss": -27.836780548095703, "global_step": 18068, "epoch": 149} {"train_loss": -27.4393253326416, "global_step": 18069, "epoch": 149} {"train_loss": -28.34394645690918, "global_step": 18070, "epoch": 149} {"train_loss": -27.8037052154541, "global_step": 18071, "epoch": 149} {"train_loss": -27.698627471923828, "global_step": 18072, "epoch": 149} {"train_loss": -28.335824966430664, "global_step": 18073, "epoch": 149} {"train_loss": -28.082090377807617, "global_step": 18074, "epoch": 149} {"train_loss": -28.27423095703125, "global_step": 18075, "epoch": 149} {"train_loss": -27.757343292236328, "global_step": 18076, "epoch": 149} {"train_loss": -28.103940963745117, "global_step": 18077, "epoch": 149} {"train_loss": -27.904890060424805, "global_step": 18078, "epoch": 149} {"train_loss": -28.224897384643555, "global_step": 18079, "epoch": 149} {"train_loss": -28.591337203979492, "global_step": 18080, "epoch": 149} {"train_loss": -28.156681060791016, "global_step": 18081, "epoch": 149} {"train_loss": -28.154407501220703, "global_step": 18082, "epoch": 149} {"train_loss": -28.553119659423828, "global_step": 18083, "epoch": 149} {"train_loss": -28.481733322143555, "global_step": 18084, "epoch": 149} {"train_loss": -28.64080238342285, "global_step": 18085, "epoch": 149} {"train_loss": -28.222692489624023, "global_step": 18086, "epoch": 149} {"train_loss": -28.3792667388916, "global_step": 18087, "epoch": 149} {"train_loss": -28.097156524658203, "global_step": 18088, "epoch": 149} {"train_loss": -28.5494327545166, "global_step": 18089, "epoch": 149} {"train_loss": -27.447717666625977, "global_step": 18090, "epoch": 149} {"train_loss": -28.655059814453125, "global_step": 18091, "epoch": 149} {"train_loss": -27.71478271484375, "global_step": 18092, "epoch": 149} {"train_loss": -27.292043685913086, "global_step": 18093, "epoch": 149} {"train_loss": -28.342145919799805, "global_step": 18094, "epoch": 149} {"train_loss": -27.992578506469727, "global_step": 18095, "epoch": 149} {"train_loss": -28.18183708190918, "global_step": 18096, "epoch": 149} {"train_loss": -27.68027114868164, "global_step": 18097, "epoch": 149} {"train_loss": -28.31524658203125, "global_step": 18098, "epoch": 149} {"train_loss": -27.938154220581055, "global_step": 18099, "epoch": 149} {"train_loss": -28.4239559173584, "global_step": 18100, "epoch": 149} {"train_loss": -27.88506507873535, "global_step": 18101, "epoch": 149} {"train_loss": -28.626453399658203, "global_step": 18102, "epoch": 149} {"train_loss": -28.173974990844727, "global_step": 18103, "epoch": 149} {"train_loss": -28.232770919799805, "global_step": 18104, "epoch": 149} {"train_loss": -28.39954948425293, "global_step": 18105, "epoch": 149} {"train_loss": -27.922168731689453, "global_step": 18106, "epoch": 149} {"train_loss": -28.5579891204834, "global_step": 18107, "epoch": 149} {"train_loss": -28.28553581237793, "global_step": 18108, "epoch": 149} {"train_loss": -27.891813278198242, "global_step": 18109, "epoch": 149} {"train_loss": -28.821517944335938, "global_step": 18110, "epoch": 149} {"train_loss": -27.989347457885742, "global_step": 18111, "epoch": 149} {"train_loss": -27.620153427124023, "global_step": 18112, "epoch": 149} {"train_loss": -28.8815975189209, "global_step": 18113, "epoch": 149} {"train_loss": -28.836767196655273, "global_step": 18114, "epoch": 149} {"train_loss": -28.795377731323242, "global_step": 18115, "epoch": 149} {"train_loss": -28.303979873657227, "global_step": 18116, "epoch": 149} {"train_loss": -28.31695556640625, "global_step": 18117, "epoch": 149} {"train_loss": -28.043500900268555, "global_step": 18118, "epoch": 149} {"train_loss": -27.315282821655273, "global_step": 18119, "epoch": 149} {"train_loss": -28.151702880859375, "global_step": 18120, "epoch": 149} {"train_loss": -28.00115966796875, "global_step": 18121, "epoch": 149} {"train_loss": -28.07393455505371, "global_step": 18122, "epoch": 149} {"train_loss": -28.320234298706055, "global_step": 18123, "epoch": 149} {"train_loss": -28.262609481811523, "global_step": 18124, "epoch": 149} {"train_loss": -27.990497589111328, "global_step": 18125, "epoch": 149} {"train_loss": -28.156232833862305, "global_step": 18126, "epoch": 149} {"train_loss": -27.648099899291992, "global_step": 18127, "epoch": 149} {"train_loss": -26.514440536499023, "global_step": 18128, "epoch": 149} {"train_loss": -25.573257446289062, "global_step": 18129, "epoch": 149} {"train_loss": -22.902555465698242, "global_step": 18130, "epoch": 149} {"train_loss": -20.653095245361328, "global_step": 18131, "epoch": 149} {"train_loss": -26.007349014282227, "global_step": 18132, "epoch": 149} {"train_loss": -26.05118179321289, "global_step": 18133, "epoch": 149} {"train_loss": -25.067020416259766, "global_step": 18134, "epoch": 149} {"train_loss": -27.390588760375977, "global_step": 18135, "epoch": 149} {"train_loss": -26.356470108032227, "global_step": 18136, "epoch": 149} {"train_loss": -27.291730880737305, "global_step": 18137, "epoch": 149} {"train_loss": -27.46969985961914, "global_step": 18138, "epoch": 149} {"train_loss": -26.104480743408203, "global_step": 18139, "epoch": 149} {"train_loss": -27.505353927612305, "global_step": 18140, "epoch": 149} {"train_loss": -28.033355712890625, "global_step": 18141, "epoch": 149} {"train_loss": -27.2686710357666, "global_step": 18142, "epoch": 149} {"train_loss": -27.718536376953125, "global_step": 18143, "epoch": 149} {"train_loss": -28.200042724609375, "global_step": 18144, "epoch": 149} {"train_loss": -27.555185317993164, "global_step": 18145, "epoch": 149} {"train_loss": -27.566404342651367, "global_step": 18146, "epoch": 149} {"train_loss": -27.652097702026367, "global_step": 18147, "epoch": 149} {"train_loss": -28.032337188720703, "global_step": 18148, "epoch": 149} {"train_loss": -27.29050943674135, "global_step": 18149, "epoch": 149, "val_loss": 2557708.75} {"train_loss": -28.118268966674805, "global_step": 18150, "epoch": 150} {"train_loss": -27.571945190429688, "global_step": 18151, "epoch": 150} {"train_loss": -28.394866943359375, "global_step": 18152, "epoch": 150} {"train_loss": -28.2978572845459, "global_step": 18153, "epoch": 150} {"train_loss": -27.964746475219727, "global_step": 18154, "epoch": 150} {"train_loss": -27.875120162963867, "global_step": 18155, "epoch": 150} {"train_loss": -28.094058990478516, "global_step": 18156, "epoch": 150} {"train_loss": -28.393842697143555, "global_step": 18157, "epoch": 150} {"train_loss": -28.352767944335938, "global_step": 18158, "epoch": 150} {"train_loss": -28.317792892456055, "global_step": 18159, "epoch": 150} {"train_loss": -28.521337509155273, "global_step": 18160, "epoch": 150} {"train_loss": -28.425329208374023, "global_step": 18161, "epoch": 150} {"train_loss": -28.586179733276367, "global_step": 18162, "epoch": 150} {"train_loss": -28.338071823120117, "global_step": 18163, "epoch": 150} {"train_loss": -28.241718292236328, "global_step": 18164, "epoch": 150} {"train_loss": -28.174680709838867, "global_step": 18165, "epoch": 150} {"train_loss": -28.7733097076416, "global_step": 18166, "epoch": 150} {"train_loss": -28.46076011657715, "global_step": 18167, "epoch": 150} {"train_loss": -28.064472198486328, "global_step": 18168, "epoch": 150} {"train_loss": -27.86053466796875, "global_step": 18169, "epoch": 150} {"train_loss": -27.884998321533203, "global_step": 18170, "epoch": 150} {"train_loss": -26.7981014251709, "global_step": 18171, "epoch": 150} {"train_loss": -24.098228454589844, "global_step": 18172, "epoch": 150} {"train_loss": -20.83702850341797, "global_step": 18173, "epoch": 150} {"train_loss": -20.937650680541992, "global_step": 18174, "epoch": 150} {"train_loss": -26.706634521484375, "global_step": 18175, "epoch": 150} {"train_loss": -27.3745174407959, "global_step": 18176, "epoch": 150} {"train_loss": -25.969335556030273, "global_step": 18177, "epoch": 150} {"train_loss": -27.576156616210938, "global_step": 18178, "epoch": 150} {"train_loss": -27.016508102416992, "global_step": 18179, "epoch": 150} {"train_loss": -27.641132354736328, "global_step": 18180, "epoch": 150} {"train_loss": -27.831838607788086, "global_step": 18181, "epoch": 150} {"train_loss": -26.407119750976562, "global_step": 18182, "epoch": 150} {"train_loss": -27.8110408782959, "global_step": 18183, "epoch": 150} {"train_loss": -27.24069595336914, "global_step": 18184, "epoch": 150} {"train_loss": -27.336566925048828, "global_step": 18185, "epoch": 150} {"train_loss": -27.787582397460938, "global_step": 18186, "epoch": 150} {"train_loss": -27.18475914001465, "global_step": 18187, "epoch": 150} {"train_loss": -27.600812911987305, "global_step": 18188, "epoch": 150} {"train_loss": -27.45545768737793, "global_step": 18189, "epoch": 150} {"train_loss": -27.652128219604492, "global_step": 18190, "epoch": 150} {"train_loss": -27.2716121673584, "global_step": 18191, "epoch": 150} {"train_loss": -27.785009384155273, "global_step": 18192, "epoch": 150} {"train_loss": -27.713977813720703, "global_step": 18193, "epoch": 150} {"train_loss": -27.3702449798584, "global_step": 18194, "epoch": 150} {"train_loss": -27.87391471862793, "global_step": 18195, "epoch": 150} {"train_loss": -26.9210147857666, "global_step": 18196, "epoch": 150} {"train_loss": -28.02303123474121, "global_step": 18197, "epoch": 150} {"train_loss": -27.234506607055664, "global_step": 18198, "epoch": 150} {"train_loss": -27.699390411376953, "global_step": 18199, "epoch": 150} {"train_loss": -27.46148681640625, "global_step": 18200, "epoch": 150} {"train_loss": -27.589887619018555, "global_step": 18201, "epoch": 150} {"train_loss": -28.347808837890625, "global_step": 18202, "epoch": 150} {"train_loss": -28.147436141967773, "global_step": 18203, "epoch": 150} {"train_loss": -28.088117599487305, "global_step": 18204, "epoch": 150} {"train_loss": -28.56342124938965, "global_step": 18205, "epoch": 150} {"train_loss": -27.804906845092773, "global_step": 18206, "epoch": 150} {"train_loss": -28.690473556518555, "global_step": 18207, "epoch": 150} {"train_loss": -27.863800048828125, "global_step": 18208, "epoch": 150} {"train_loss": -28.60395622253418, "global_step": 18209, "epoch": 150} {"train_loss": -28.733234405517578, "global_step": 18210, "epoch": 150} {"train_loss": -28.231664657592773, "global_step": 18211, "epoch": 150} {"train_loss": -28.582321166992188, "global_step": 18212, "epoch": 150} {"train_loss": -28.476730346679688, "global_step": 18213, "epoch": 150} {"train_loss": -28.770954132080078, "global_step": 18214, "epoch": 150} {"train_loss": -28.783056259155273, "global_step": 18215, "epoch": 150} {"train_loss": -28.7790584564209, "global_step": 18216, "epoch": 150} {"train_loss": -28.488067626953125, "global_step": 18217, "epoch": 150} {"train_loss": -28.75661277770996, "global_step": 18218, "epoch": 150} {"train_loss": -28.56171226501465, "global_step": 18219, "epoch": 150} {"train_loss": -28.445547103881836, "global_step": 18220, "epoch": 150} {"train_loss": -28.883132934570312, "global_step": 18221, "epoch": 150} {"train_loss": -28.846460342407227, "global_step": 18222, "epoch": 150} {"train_loss": -29.009628295898438, "global_step": 18223, "epoch": 150} {"train_loss": -28.428735733032227, "global_step": 18224, "epoch": 150} {"train_loss": -28.790857315063477, "global_step": 18225, "epoch": 150} {"train_loss": -29.20637321472168, "global_step": 18226, "epoch": 150} {"train_loss": -28.7127628326416, "global_step": 18227, "epoch": 150} {"train_loss": -28.642057418823242, "global_step": 18228, "epoch": 150} {"train_loss": -28.773218154907227, "global_step": 18229, "epoch": 150} {"train_loss": -29.344091415405273, "global_step": 18230, "epoch": 150} {"train_loss": -29.278167724609375, "global_step": 18231, "epoch": 150} {"train_loss": -28.75752067565918, "global_step": 18232, "epoch": 150} {"train_loss": -29.18672752380371, "global_step": 18233, "epoch": 150} {"train_loss": -28.722766876220703, "global_step": 18234, "epoch": 150} {"train_loss": -28.441892623901367, "global_step": 18235, "epoch": 150} {"train_loss": -28.712417602539062, "global_step": 18236, "epoch": 150} {"train_loss": -28.671857833862305, "global_step": 18237, "epoch": 150} {"train_loss": -27.939136505126953, "global_step": 18238, "epoch": 150} {"train_loss": -28.405210494995117, "global_step": 18239, "epoch": 150} {"train_loss": -26.447235107421875, "global_step": 18240, "epoch": 150} {"train_loss": -29.25129508972168, "global_step": 18241, "epoch": 150} {"train_loss": -28.7795467376709, "global_step": 18242, "epoch": 150} {"train_loss": -27.119367599487305, "global_step": 18243, "epoch": 150} {"train_loss": -28.855697631835938, "global_step": 18244, "epoch": 150} {"train_loss": -28.385160446166992, "global_step": 18245, "epoch": 150} {"train_loss": -28.31927490234375, "global_step": 18246, "epoch": 150} {"train_loss": -28.42970085144043, "global_step": 18247, "epoch": 150} {"train_loss": -29.074207305908203, "global_step": 18248, "epoch": 150} {"train_loss": -29.077688217163086, "global_step": 18249, "epoch": 150} {"train_loss": -28.91302490234375, "global_step": 18250, "epoch": 150} {"train_loss": -27.984149932861328, "global_step": 18251, "epoch": 150} {"train_loss": -27.9398193359375, "global_step": 18252, "epoch": 150} {"train_loss": -28.872241973876953, "global_step": 18253, "epoch": 150} {"train_loss": -27.449970245361328, "global_step": 18254, "epoch": 150} {"train_loss": -27.656116485595703, "global_step": 18255, "epoch": 150} {"train_loss": -28.19207191467285, "global_step": 18256, "epoch": 150} {"train_loss": -28.591068267822266, "global_step": 18257, "epoch": 150} {"train_loss": -27.797536849975586, "global_step": 18258, "epoch": 150} {"train_loss": -27.978784561157227, "global_step": 18259, "epoch": 150} {"train_loss": -28.81304359436035, "global_step": 18260, "epoch": 150} {"train_loss": -28.577747344970703, "global_step": 18261, "epoch": 150} {"train_loss": -28.268991470336914, "global_step": 18262, "epoch": 150} {"train_loss": -28.89777183532715, "global_step": 18263, "epoch": 150} {"train_loss": -29.074399948120117, "global_step": 18264, "epoch": 150} {"train_loss": -28.64532470703125, "global_step": 18265, "epoch": 150} {"train_loss": -28.926618576049805, "global_step": 18266, "epoch": 150} {"train_loss": -28.499670028686523, "global_step": 18267, "epoch": 150} {"train_loss": -29.06839370727539, "global_step": 18268, "epoch": 150} {"train_loss": -28.080961227416992, "global_step": 18269, "epoch": 150} {"train_loss": -28.04037565436245, "global_step": 18270, "epoch": 150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2535890.0} {"train_loss": -28.545873641967773, "global_step": 18271, "epoch": 151} {"train_loss": -28.615726470947266, "global_step": 18272, "epoch": 151} {"train_loss": -28.562423706054688, "global_step": 18273, "epoch": 151} {"train_loss": -27.53253173828125, "global_step": 18274, "epoch": 151} {"train_loss": -27.94060707092285, "global_step": 18275, "epoch": 151} {"train_loss": -26.551366806030273, "global_step": 18276, "epoch": 151} {"train_loss": -26.231184005737305, "global_step": 18277, "epoch": 151} {"train_loss": -26.62513542175293, "global_step": 18278, "epoch": 151} {"train_loss": -28.123462677001953, "global_step": 18279, "epoch": 151} {"train_loss": -25.670392990112305, "global_step": 18280, "epoch": 151} {"train_loss": -26.59596824645996, "global_step": 18281, "epoch": 151} {"train_loss": -28.278364181518555, "global_step": 18282, "epoch": 151} {"train_loss": -27.26313591003418, "global_step": 18283, "epoch": 151} {"train_loss": -27.585357666015625, "global_step": 18284, "epoch": 151} {"train_loss": -26.765838623046875, "global_step": 18285, "epoch": 151} {"train_loss": -28.403064727783203, "global_step": 18286, "epoch": 151} {"train_loss": -27.618207931518555, "global_step": 18287, "epoch": 151} {"train_loss": -27.3867130279541, "global_step": 18288, "epoch": 151} {"train_loss": -27.988754272460938, "global_step": 18289, "epoch": 151} {"train_loss": -27.333032608032227, "global_step": 18290, "epoch": 151} {"train_loss": -28.00798988342285, "global_step": 18291, "epoch": 151} {"train_loss": -27.81671714782715, "global_step": 18292, "epoch": 151} {"train_loss": -27.9740047454834, "global_step": 18293, "epoch": 151} {"train_loss": -27.345539093017578, "global_step": 18294, "epoch": 151} {"train_loss": -28.479040145874023, "global_step": 18295, "epoch": 151} {"train_loss": -28.276275634765625, "global_step": 18296, "epoch": 151} {"train_loss": -28.286840438842773, "global_step": 18297, "epoch": 151} {"train_loss": -28.2607364654541, "global_step": 18298, "epoch": 151} {"train_loss": -28.355072021484375, "global_step": 18299, "epoch": 151} {"train_loss": -28.4519100189209, "global_step": 18300, "epoch": 151} {"train_loss": -28.24997329711914, "global_step": 18301, "epoch": 151} {"train_loss": -28.756244659423828, "global_step": 18302, "epoch": 151} {"train_loss": -28.96746253967285, "global_step": 18303, "epoch": 151} {"train_loss": -28.549631118774414, "global_step": 18304, "epoch": 151} {"train_loss": -28.970630645751953, "global_step": 18305, "epoch": 151} {"train_loss": -28.780920028686523, "global_step": 18306, "epoch": 151} {"train_loss": -28.594104766845703, "global_step": 18307, "epoch": 151} {"train_loss": -28.871923446655273, "global_step": 18308, "epoch": 151} {"train_loss": -28.0073184967041, "global_step": 18309, "epoch": 151} {"train_loss": -28.851520538330078, "global_step": 18310, "epoch": 151} {"train_loss": -29.098718643188477, "global_step": 18311, "epoch": 151} {"train_loss": -29.34266471862793, "global_step": 18312, "epoch": 151} {"train_loss": -28.4097957611084, "global_step": 18313, "epoch": 151} {"train_loss": -28.52302360534668, "global_step": 18314, "epoch": 151} {"train_loss": -28.619342803955078, "global_step": 18315, "epoch": 151} {"train_loss": -29.269031524658203, "global_step": 18316, "epoch": 151} {"train_loss": -28.8561954498291, "global_step": 18317, "epoch": 151} {"train_loss": -28.817825317382812, "global_step": 18318, "epoch": 151} {"train_loss": -29.398956298828125, "global_step": 18319, "epoch": 151} {"train_loss": -28.80548095703125, "global_step": 18320, "epoch": 151} {"train_loss": -29.078094482421875, "global_step": 18321, "epoch": 151} {"train_loss": -27.46030044555664, "global_step": 18322, "epoch": 151} {"train_loss": -28.53838539123535, "global_step": 18323, "epoch": 151} {"train_loss": -27.791406631469727, "global_step": 18324, "epoch": 151} {"train_loss": -28.65852165222168, "global_step": 18325, "epoch": 151} {"train_loss": -27.26776123046875, "global_step": 18326, "epoch": 151} {"train_loss": -27.926273345947266, "global_step": 18327, "epoch": 151} {"train_loss": -27.30352783203125, "global_step": 18328, "epoch": 151} {"train_loss": -28.928730010986328, "global_step": 18329, "epoch": 151} {"train_loss": -28.8997745513916, "global_step": 18330, "epoch": 151} {"train_loss": -28.548511505126953, "global_step": 18331, "epoch": 151} {"train_loss": -29.194580078125, "global_step": 18332, "epoch": 151} {"train_loss": -29.073225021362305, "global_step": 18333, "epoch": 151} {"train_loss": -28.205896377563477, "global_step": 18334, "epoch": 151} {"train_loss": -27.502044677734375, "global_step": 18335, "epoch": 151} {"train_loss": -27.03400230407715, "global_step": 18336, "epoch": 151} {"train_loss": -27.7276611328125, "global_step": 18337, "epoch": 151} {"train_loss": -29.21234703063965, "global_step": 18338, "epoch": 151} {"train_loss": -28.0269718170166, "global_step": 18339, "epoch": 151} {"train_loss": -28.124704360961914, "global_step": 18340, "epoch": 151} {"train_loss": -29.275678634643555, "global_step": 18341, "epoch": 151} {"train_loss": -28.886539459228516, "global_step": 18342, "epoch": 151} {"train_loss": -28.767419815063477, "global_step": 18343, "epoch": 151} {"train_loss": -29.39824867248535, "global_step": 18344, "epoch": 151} {"train_loss": -28.403356552124023, "global_step": 18345, "epoch": 151} {"train_loss": -29.072189331054688, "global_step": 18346, "epoch": 151} {"train_loss": -28.514013290405273, "global_step": 18347, "epoch": 151} {"train_loss": -28.581174850463867, "global_step": 18348, "epoch": 151} {"train_loss": -28.694772720336914, "global_step": 18349, "epoch": 151} {"train_loss": -28.635940551757812, "global_step": 18350, "epoch": 151} {"train_loss": -29.253021240234375, "global_step": 18351, "epoch": 151} {"train_loss": -29.0271053314209, "global_step": 18352, "epoch": 151} {"train_loss": -29.69548988342285, "global_step": 18353, "epoch": 151} {"train_loss": -28.573776245117188, "global_step": 18354, "epoch": 151} {"train_loss": -29.20842933654785, "global_step": 18355, "epoch": 151} {"train_loss": -28.696563720703125, "global_step": 18356, "epoch": 151} {"train_loss": -29.205142974853516, "global_step": 18357, "epoch": 151} {"train_loss": -29.076658248901367, "global_step": 18358, "epoch": 151} {"train_loss": -29.48478126525879, "global_step": 18359, "epoch": 151} {"train_loss": -29.138620376586914, "global_step": 18360, "epoch": 151} {"train_loss": -28.989469528198242, "global_step": 18361, "epoch": 151} {"train_loss": -29.3907527923584, "global_step": 18362, "epoch": 151} {"train_loss": -28.6662654876709, "global_step": 18363, "epoch": 151} {"train_loss": -29.228412628173828, "global_step": 18364, "epoch": 151} {"train_loss": -29.448591232299805, "global_step": 18365, "epoch": 151} {"train_loss": -29.045780181884766, "global_step": 18366, "epoch": 151} {"train_loss": -29.14727783203125, "global_step": 18367, "epoch": 151} {"train_loss": -29.26432228088379, "global_step": 18368, "epoch": 151} {"train_loss": -29.63543128967285, "global_step": 18369, "epoch": 151} {"train_loss": -29.84161949157715, "global_step": 18370, "epoch": 151} {"train_loss": -29.349912643432617, "global_step": 18371, "epoch": 151} {"train_loss": -29.65581703186035, "global_step": 18372, "epoch": 151} {"train_loss": -29.624053955078125, "global_step": 18373, "epoch": 151} {"train_loss": -29.692174911499023, "global_step": 18374, "epoch": 151} {"train_loss": -28.930652618408203, "global_step": 18375, "epoch": 151} {"train_loss": -28.95953369140625, "global_step": 18376, "epoch": 151} {"train_loss": -27.867650985717773, "global_step": 18377, "epoch": 151} {"train_loss": -25.56685447692871, "global_step": 18378, "epoch": 151} {"train_loss": -24.85213851928711, "global_step": 18379, "epoch": 151} {"train_loss": -22.970510482788086, "global_step": 18380, "epoch": 151} {"train_loss": -25.458349227905273, "global_step": 18381, "epoch": 151} {"train_loss": -28.388418197631836, "global_step": 18382, "epoch": 151} {"train_loss": -28.19683265686035, "global_step": 18383, "epoch": 151} {"train_loss": -27.417570114135742, "global_step": 18384, "epoch": 151} {"train_loss": -28.47110939025879, "global_step": 18385, "epoch": 151} {"train_loss": -28.429351806640625, "global_step": 18386, "epoch": 151} {"train_loss": -28.3405704498291, "global_step": 18387, "epoch": 151} {"train_loss": -28.20477867126465, "global_step": 18388, "epoch": 151} {"train_loss": -28.496458053588867, "global_step": 18389, "epoch": 151} {"train_loss": -28.510854721069336, "global_step": 18390, "epoch": 151} {"train_loss": -28.343625565205723, "global_step": 18391, "epoch": 151, "val_loss": 2578733.25} {"train_loss": -28.209259033203125, "global_step": 18392, "epoch": 152} {"train_loss": -29.089338302612305, "global_step": 18393, "epoch": 152} {"train_loss": -27.537113189697266, "global_step": 18394, "epoch": 152} {"train_loss": -28.006366729736328, "global_step": 18395, "epoch": 152} {"train_loss": -28.417102813720703, "global_step": 18396, "epoch": 152} {"train_loss": -27.924848556518555, "global_step": 18397, "epoch": 152} {"train_loss": -28.75815200805664, "global_step": 18398, "epoch": 152} {"train_loss": -28.2036075592041, "global_step": 18399, "epoch": 152} {"train_loss": -28.51314353942871, "global_step": 18400, "epoch": 152} {"train_loss": -28.659658432006836, "global_step": 18401, "epoch": 152} {"train_loss": -28.873334884643555, "global_step": 18402, "epoch": 152} {"train_loss": -29.018783569335938, "global_step": 18403, "epoch": 152} {"train_loss": -28.66717529296875, "global_step": 18404, "epoch": 152} {"train_loss": -29.123615264892578, "global_step": 18405, "epoch": 152} {"train_loss": -29.06305503845215, "global_step": 18406, "epoch": 152} {"train_loss": -28.920923233032227, "global_step": 18407, "epoch": 152} {"train_loss": -29.19484519958496, "global_step": 18408, "epoch": 152} {"train_loss": -29.191253662109375, "global_step": 18409, "epoch": 152} {"train_loss": -29.292667388916016, "global_step": 18410, "epoch": 152} {"train_loss": -29.122705459594727, "global_step": 18411, "epoch": 152} {"train_loss": -29.4588565826416, "global_step": 18412, "epoch": 152} {"train_loss": -29.6269474029541, "global_step": 18413, "epoch": 152} {"train_loss": -29.372663497924805, "global_step": 18414, "epoch": 152} {"train_loss": -29.61140251159668, "global_step": 18415, "epoch": 152} {"train_loss": -29.0544490814209, "global_step": 18416, "epoch": 152} {"train_loss": -29.27069664001465, "global_step": 18417, "epoch": 152} {"train_loss": -29.243627548217773, "global_step": 18418, "epoch": 152} {"train_loss": -29.06500244140625, "global_step": 18419, "epoch": 152} {"train_loss": -29.433012008666992, "global_step": 18420, "epoch": 152} {"train_loss": -29.4019832611084, "global_step": 18421, "epoch": 152} {"train_loss": -29.656925201416016, "global_step": 18422, "epoch": 152} {"train_loss": -29.386327743530273, "global_step": 18423, "epoch": 152} {"train_loss": -29.305683135986328, "global_step": 18424, "epoch": 152} {"train_loss": -29.2607421875, "global_step": 18425, "epoch": 152} {"train_loss": -29.63396644592285, "global_step": 18426, "epoch": 152} {"train_loss": -28.817663192749023, "global_step": 18427, "epoch": 152} {"train_loss": -27.43501091003418, "global_step": 18428, "epoch": 152} {"train_loss": -25.884296417236328, "global_step": 18429, "epoch": 152} {"train_loss": -21.481006622314453, "global_step": 18430, "epoch": 152} {"train_loss": -20.57233238220215, "global_step": 18431, "epoch": 152} {"train_loss": -25.28146743774414, "global_step": 18432, "epoch": 152} {"train_loss": -29.29465103149414, "global_step": 18433, "epoch": 152} {"train_loss": -26.363813400268555, "global_step": 18434, "epoch": 152} {"train_loss": -28.463815689086914, "global_step": 18435, "epoch": 152} {"train_loss": -28.00341796875, "global_step": 18436, "epoch": 152} {"train_loss": -28.48910903930664, "global_step": 18437, "epoch": 152} {"train_loss": -28.403060913085938, "global_step": 18438, "epoch": 152} {"train_loss": -27.677778244018555, "global_step": 18439, "epoch": 152} {"train_loss": -27.137592315673828, "global_step": 18440, "epoch": 152} {"train_loss": -26.599390029907227, "global_step": 18441, "epoch": 152} {"train_loss": -26.7178955078125, "global_step": 18442, "epoch": 152} {"train_loss": -27.939416885375977, "global_step": 18443, "epoch": 152} {"train_loss": -28.1363468170166, "global_step": 18444, "epoch": 152} {"train_loss": -27.383405685424805, "global_step": 18445, "epoch": 152} {"train_loss": -27.073896408081055, "global_step": 18446, "epoch": 152} {"train_loss": -27.9630184173584, "global_step": 18447, "epoch": 152} {"train_loss": -26.28025245666504, "global_step": 18448, "epoch": 152} {"train_loss": -27.6411075592041, "global_step": 18449, "epoch": 152} {"train_loss": -27.57718276977539, "global_step": 18450, "epoch": 152} {"train_loss": -27.81025505065918, "global_step": 18451, "epoch": 152} {"train_loss": -27.79572868347168, "global_step": 18452, "epoch": 152} {"train_loss": -28.3924503326416, "global_step": 18453, "epoch": 152} {"train_loss": -27.8142147064209, "global_step": 18454, "epoch": 152} {"train_loss": -28.026273727416992, "global_step": 18455, "epoch": 152} {"train_loss": -28.099878311157227, "global_step": 18456, "epoch": 152} {"train_loss": -28.251632690429688, "global_step": 18457, "epoch": 152} {"train_loss": -28.259618759155273, "global_step": 18458, "epoch": 152} {"train_loss": -28.088788986206055, "global_step": 18459, "epoch": 152} {"train_loss": -28.45086669921875, "global_step": 18460, "epoch": 152} {"train_loss": -28.23724365234375, "global_step": 18461, "epoch": 152} {"train_loss": -28.082660675048828, "global_step": 18462, "epoch": 152} {"train_loss": -28.723636627197266, "global_step": 18463, "epoch": 152} {"train_loss": -28.329931259155273, "global_step": 18464, "epoch": 152} {"train_loss": -28.653060913085938, "global_step": 18465, "epoch": 152} {"train_loss": -28.767608642578125, "global_step": 18466, "epoch": 152} {"train_loss": -28.23737144470215, "global_step": 18467, "epoch": 152} {"train_loss": -28.71468162536621, "global_step": 18468, "epoch": 152} {"train_loss": -28.525604248046875, "global_step": 18469, "epoch": 152} {"train_loss": -28.756244659423828, "global_step": 18470, "epoch": 152} {"train_loss": -28.39094352722168, "global_step": 18471, "epoch": 152} {"train_loss": -28.4993896484375, "global_step": 18472, "epoch": 152} {"train_loss": -28.47174072265625, "global_step": 18473, "epoch": 152} {"train_loss": -28.979888916015625, "global_step": 18474, "epoch": 152} {"train_loss": -27.6646785736084, "global_step": 18475, "epoch": 152} {"train_loss": -28.67023277282715, "global_step": 18476, "epoch": 152} {"train_loss": -28.375242233276367, "global_step": 18477, "epoch": 152} {"train_loss": -28.523406982421875, "global_step": 18478, "epoch": 152} {"train_loss": -28.76984977722168, "global_step": 18479, "epoch": 152} {"train_loss": -28.554000854492188, "global_step": 18480, "epoch": 152} {"train_loss": -28.66343116760254, "global_step": 18481, "epoch": 152} {"train_loss": -28.747251510620117, "global_step": 18482, "epoch": 152} {"train_loss": -28.83648681640625, "global_step": 18483, "epoch": 152} {"train_loss": -28.8828125, "global_step": 18484, "epoch": 152} {"train_loss": -28.43255043029785, "global_step": 18485, "epoch": 152} {"train_loss": -28.957138061523438, "global_step": 18486, "epoch": 152} {"train_loss": -28.797128677368164, "global_step": 18487, "epoch": 152} {"train_loss": -29.148681640625, "global_step": 18488, "epoch": 152} {"train_loss": -28.992538452148438, "global_step": 18489, "epoch": 152} {"train_loss": -29.0093994140625, "global_step": 18490, "epoch": 152} {"train_loss": -28.913131713867188, "global_step": 18491, "epoch": 152} {"train_loss": -29.20551872253418, "global_step": 18492, "epoch": 152} {"train_loss": -28.3967342376709, "global_step": 18493, "epoch": 152} {"train_loss": -29.50860023498535, "global_step": 18494, "epoch": 152} {"train_loss": -28.996505737304688, "global_step": 18495, "epoch": 152} {"train_loss": -29.489606857299805, "global_step": 18496, "epoch": 152} {"train_loss": -29.16781997680664, "global_step": 18497, "epoch": 152} {"train_loss": -29.21758460998535, "global_step": 18498, "epoch": 152} {"train_loss": -29.632553100585938, "global_step": 18499, "epoch": 152} {"train_loss": -29.368371963500977, "global_step": 18500, "epoch": 152} {"train_loss": -29.469833374023438, "global_step": 18501, "epoch": 152} {"train_loss": -29.46270751953125, "global_step": 18502, "epoch": 152} {"train_loss": -29.584009170532227, "global_step": 18503, "epoch": 152} {"train_loss": -29.530593872070312, "global_step": 18504, "epoch": 152} {"train_loss": -29.707977294921875, "global_step": 18505, "epoch": 152} {"train_loss": -29.57421875, "global_step": 18506, "epoch": 152} {"train_loss": -29.734601974487305, "global_step": 18507, "epoch": 152} {"train_loss": -29.529407501220703, "global_step": 18508, "epoch": 152} {"train_loss": -29.746286392211914, "global_step": 18509, "epoch": 152} {"train_loss": -29.870014190673828, "global_step": 18510, "epoch": 152} {"train_loss": -29.534223556518555, "global_step": 18511, "epoch": 152} {"train_loss": -28.489256630259113, "global_step": 18512, "epoch": 152, "val_loss": 2709462.25} {"train_loss": -28.59480094909668, "global_step": 18513, "epoch": 153} {"train_loss": -27.910449981689453, "global_step": 18514, "epoch": 153} {"train_loss": -27.126184463500977, "global_step": 18515, "epoch": 153} {"train_loss": -26.340118408203125, "global_step": 18516, "epoch": 153} {"train_loss": -28.465368270874023, "global_step": 18517, "epoch": 153} {"train_loss": -29.43218421936035, "global_step": 18518, "epoch": 153} {"train_loss": -26.077564239501953, "global_step": 18519, "epoch": 153} {"train_loss": -26.807159423828125, "global_step": 18520, "epoch": 153} {"train_loss": -28.60040283203125, "global_step": 18521, "epoch": 153} {"train_loss": -28.811376571655273, "global_step": 18522, "epoch": 153} {"train_loss": -27.64397621154785, "global_step": 18523, "epoch": 153} {"train_loss": -28.979053497314453, "global_step": 18524, "epoch": 153} {"train_loss": -28.525278091430664, "global_step": 18525, "epoch": 153} {"train_loss": -28.55707359313965, "global_step": 18526, "epoch": 153} {"train_loss": -28.65553092956543, "global_step": 18527, "epoch": 153} {"train_loss": -27.938446044921875, "global_step": 18528, "epoch": 153} {"train_loss": -28.1993350982666, "global_step": 18529, "epoch": 153} {"train_loss": -28.7217960357666, "global_step": 18530, "epoch": 153} {"train_loss": -28.59465980529785, "global_step": 18531, "epoch": 153} {"train_loss": -27.465137481689453, "global_step": 18532, "epoch": 153} {"train_loss": -28.21222496032715, "global_step": 18533, "epoch": 153} {"train_loss": -29.474853515625, "global_step": 18534, "epoch": 153} {"train_loss": -28.907896041870117, "global_step": 18535, "epoch": 153} {"train_loss": -28.966745376586914, "global_step": 18536, "epoch": 153} {"train_loss": -29.565399169921875, "global_step": 18537, "epoch": 153} {"train_loss": -29.43836784362793, "global_step": 18538, "epoch": 153} {"train_loss": -28.960912704467773, "global_step": 18539, "epoch": 153} {"train_loss": -29.283069610595703, "global_step": 18540, "epoch": 153} {"train_loss": -29.1062068939209, "global_step": 18541, "epoch": 153} {"train_loss": -29.28144645690918, "global_step": 18542, "epoch": 153} {"train_loss": -29.251972198486328, "global_step": 18543, "epoch": 153} {"train_loss": -29.165943145751953, "global_step": 18544, "epoch": 153} {"train_loss": -29.569442749023438, "global_step": 18545, "epoch": 153} {"train_loss": -29.39483070373535, "global_step": 18546, "epoch": 153} {"train_loss": -29.811908721923828, "global_step": 18547, "epoch": 153} {"train_loss": -29.2540225982666, "global_step": 18548, "epoch": 153} {"train_loss": -29.333393096923828, "global_step": 18549, "epoch": 153} {"train_loss": -28.93861198425293, "global_step": 18550, "epoch": 153} {"train_loss": -28.268753051757812, "global_step": 18551, "epoch": 153} {"train_loss": -29.598499298095703, "global_step": 18552, "epoch": 153} {"train_loss": -29.27937126159668, "global_step": 18553, "epoch": 153} {"train_loss": -28.426345825195312, "global_step": 18554, "epoch": 153} {"train_loss": -26.895299911499023, "global_step": 18555, "epoch": 153} {"train_loss": -25.23703956604004, "global_step": 18556, "epoch": 153} {"train_loss": -26.358905792236328, "global_step": 18557, "epoch": 153} {"train_loss": -28.713150024414062, "global_step": 18558, "epoch": 153} {"train_loss": -27.96729850769043, "global_step": 18559, "epoch": 153} {"train_loss": -27.51433753967285, "global_step": 18560, "epoch": 153} {"train_loss": -29.20881462097168, "global_step": 18561, "epoch": 153} {"train_loss": -29.055334091186523, "global_step": 18562, "epoch": 153} {"train_loss": -26.521448135375977, "global_step": 18563, "epoch": 153} {"train_loss": -29.403234481811523, "global_step": 18564, "epoch": 153} {"train_loss": -28.416879653930664, "global_step": 18565, "epoch": 153} {"train_loss": -28.21722984313965, "global_step": 18566, "epoch": 153} {"train_loss": -28.395170211791992, "global_step": 18567, "epoch": 153} {"train_loss": -27.98638343811035, "global_step": 18568, "epoch": 153} {"train_loss": -28.818185806274414, "global_step": 18569, "epoch": 153} {"train_loss": -28.670866012573242, "global_step": 18570, "epoch": 153} {"train_loss": -27.322351455688477, "global_step": 18571, "epoch": 153} {"train_loss": -26.317855834960938, "global_step": 18572, "epoch": 153} {"train_loss": -20.51551628112793, "global_step": 18573, "epoch": 153} {"train_loss": -12.132181167602539, "global_step": 18574, "epoch": 153} {"train_loss": -16.296194076538086, "global_step": 18575, "epoch": 153} {"train_loss": -27.005725860595703, "global_step": 18576, "epoch": 153} {"train_loss": -23.73194694519043, "global_step": 18577, "epoch": 153} {"train_loss": -27.574609756469727, "global_step": 18578, "epoch": 153} {"train_loss": -25.772764205932617, "global_step": 18579, "epoch": 153} {"train_loss": -26.743255615234375, "global_step": 18580, "epoch": 153} {"train_loss": -26.977630615234375, "global_step": 18581, "epoch": 153} {"train_loss": -26.484100341796875, "global_step": 18582, "epoch": 153} {"train_loss": -27.009307861328125, "global_step": 18583, "epoch": 153} {"train_loss": -27.5578670501709, "global_step": 18584, "epoch": 153} {"train_loss": -26.9416446685791, "global_step": 18585, "epoch": 153} {"train_loss": -26.981678009033203, "global_step": 18586, "epoch": 153} {"train_loss": -27.48703956604004, "global_step": 18587, "epoch": 153} {"train_loss": -27.86114501953125, "global_step": 18588, "epoch": 153} {"train_loss": -27.92817497253418, "global_step": 18589, "epoch": 153} {"train_loss": -28.015918731689453, "global_step": 18590, "epoch": 153} {"train_loss": -27.386133193969727, "global_step": 18591, "epoch": 153} {"train_loss": -27.595111846923828, "global_step": 18592, "epoch": 153} {"train_loss": -28.204849243164062, "global_step": 18593, "epoch": 153} {"train_loss": -27.756805419921875, "global_step": 18594, "epoch": 153} {"train_loss": -27.91737174987793, "global_step": 18595, "epoch": 153} {"train_loss": -28.05234146118164, "global_step": 18596, "epoch": 153} {"train_loss": -27.5615177154541, "global_step": 18597, "epoch": 153} {"train_loss": -27.105609893798828, "global_step": 18598, "epoch": 153} {"train_loss": -27.57679557800293, "global_step": 18599, "epoch": 153} {"train_loss": -28.25412940979004, "global_step": 18600, "epoch": 153} {"train_loss": -27.924428939819336, "global_step": 18601, "epoch": 153} {"train_loss": -27.874069213867188, "global_step": 18602, "epoch": 153} {"train_loss": -28.317956924438477, "global_step": 18603, "epoch": 153} {"train_loss": -27.820510864257812, "global_step": 18604, "epoch": 153} {"train_loss": -27.770910263061523, "global_step": 18605, "epoch": 153} {"train_loss": -28.409513473510742, "global_step": 18606, "epoch": 153} {"train_loss": -26.856948852539062, "global_step": 18607, "epoch": 153} {"train_loss": -27.26434326171875, "global_step": 18608, "epoch": 153} {"train_loss": -28.62005615234375, "global_step": 18609, "epoch": 153} {"train_loss": -27.297170639038086, "global_step": 18610, "epoch": 153} {"train_loss": -28.23639488220215, "global_step": 18611, "epoch": 153} {"train_loss": -28.05567741394043, "global_step": 18612, "epoch": 153} {"train_loss": -27.996814727783203, "global_step": 18613, "epoch": 153} {"train_loss": -28.300268173217773, "global_step": 18614, "epoch": 153} {"train_loss": -28.027973175048828, "global_step": 18615, "epoch": 153} {"train_loss": -28.514877319335938, "global_step": 18616, "epoch": 153} {"train_loss": -28.363433837890625, "global_step": 18617, "epoch": 153} {"train_loss": -28.587665557861328, "global_step": 18618, "epoch": 153} {"train_loss": -28.41000747680664, "global_step": 18619, "epoch": 153} {"train_loss": -28.575483322143555, "global_step": 18620, "epoch": 153} {"train_loss": -27.81122398376465, "global_step": 18621, "epoch": 153} {"train_loss": -28.59735679626465, "global_step": 18622, "epoch": 153} {"train_loss": -28.706527709960938, "global_step": 18623, "epoch": 153} {"train_loss": -28.31260108947754, "global_step": 18624, "epoch": 153} {"train_loss": -28.832910537719727, "global_step": 18625, "epoch": 153} {"train_loss": -28.464502334594727, "global_step": 18626, "epoch": 153} {"train_loss": -28.90570640563965, "global_step": 18627, "epoch": 153} {"train_loss": -28.767934799194336, "global_step": 18628, "epoch": 153} {"train_loss": -28.689138412475586, "global_step": 18629, "epoch": 153} {"train_loss": -28.4176082611084, "global_step": 18630, "epoch": 153} {"train_loss": -28.67803955078125, "global_step": 18631, "epoch": 153} {"train_loss": -28.33199119567871, "global_step": 18632, "epoch": 153} {"train_loss": -27.82511346990412, "global_step": 18633, "epoch": 153, "val_loss": 2580354.25} {"train_loss": -28.625080108642578, "global_step": 18634, "epoch": 154} {"train_loss": -28.977514266967773, "global_step": 18635, "epoch": 154} {"train_loss": -28.61964225769043, "global_step": 18636, "epoch": 154} {"train_loss": -28.984338760375977, "global_step": 18637, "epoch": 154} {"train_loss": -29.1434268951416, "global_step": 18638, "epoch": 154} {"train_loss": -28.251937866210938, "global_step": 18639, "epoch": 154} {"train_loss": -28.77687644958496, "global_step": 18640, "epoch": 154} {"train_loss": -28.757190704345703, "global_step": 18641, "epoch": 154} {"train_loss": -28.143756866455078, "global_step": 18642, "epoch": 154} {"train_loss": -28.533344268798828, "global_step": 18643, "epoch": 154} {"train_loss": -28.490787506103516, "global_step": 18644, "epoch": 154} {"train_loss": -29.301305770874023, "global_step": 18645, "epoch": 154} {"train_loss": -28.922693252563477, "global_step": 18646, "epoch": 154} {"train_loss": -28.583087921142578, "global_step": 18647, "epoch": 154} {"train_loss": -28.1436767578125, "global_step": 18648, "epoch": 154} {"train_loss": -27.325122833251953, "global_step": 18649, "epoch": 154} {"train_loss": -26.6638126373291, "global_step": 18650, "epoch": 154} {"train_loss": -25.706098556518555, "global_step": 18651, "epoch": 154} {"train_loss": -23.949445724487305, "global_step": 18652, "epoch": 154} {"train_loss": -27.031463623046875, "global_step": 18653, "epoch": 154} {"train_loss": -28.726032257080078, "global_step": 18654, "epoch": 154} {"train_loss": -27.638568878173828, "global_step": 18655, "epoch": 154} {"train_loss": -27.3831729888916, "global_step": 18656, "epoch": 154} {"train_loss": -29.031097412109375, "global_step": 18657, "epoch": 154} {"train_loss": -28.71316909790039, "global_step": 18658, "epoch": 154} {"train_loss": -28.045490264892578, "global_step": 18659, "epoch": 154} {"train_loss": -28.737714767456055, "global_step": 18660, "epoch": 154} {"train_loss": -28.223424911499023, "global_step": 18661, "epoch": 154} {"train_loss": -28.110660552978516, "global_step": 18662, "epoch": 154} {"train_loss": -28.847684860229492, "global_step": 18663, "epoch": 154} {"train_loss": -28.450916290283203, "global_step": 18664, "epoch": 154} {"train_loss": -28.649280548095703, "global_step": 18665, "epoch": 154} {"train_loss": -28.50201988220215, "global_step": 18666, "epoch": 154} {"train_loss": -28.95355796813965, "global_step": 18667, "epoch": 154} {"train_loss": -29.130918502807617, "global_step": 18668, "epoch": 154} {"train_loss": -28.6041202545166, "global_step": 18669, "epoch": 154} {"train_loss": -29.226821899414062, "global_step": 18670, "epoch": 154} {"train_loss": -29.022809982299805, "global_step": 18671, "epoch": 154} {"train_loss": -28.837146759033203, "global_step": 18672, "epoch": 154} {"train_loss": -28.75758171081543, "global_step": 18673, "epoch": 154} {"train_loss": -28.88985252380371, "global_step": 18674, "epoch": 154} {"train_loss": -28.377029418945312, "global_step": 18675, "epoch": 154} {"train_loss": -28.670438766479492, "global_step": 18676, "epoch": 154} {"train_loss": -28.889057159423828, "global_step": 18677, "epoch": 154} {"train_loss": -29.242542266845703, "global_step": 18678, "epoch": 154} {"train_loss": -29.015798568725586, "global_step": 18679, "epoch": 154} {"train_loss": -29.52716636657715, "global_step": 18680, "epoch": 154} {"train_loss": -28.154333114624023, "global_step": 18681, "epoch": 154} {"train_loss": -27.123777389526367, "global_step": 18682, "epoch": 154} {"train_loss": -27.615060806274414, "global_step": 18683, "epoch": 154} {"train_loss": -28.954294204711914, "global_step": 18684, "epoch": 154} {"train_loss": -28.480005264282227, "global_step": 18685, "epoch": 154} {"train_loss": -28.463953018188477, "global_step": 18686, "epoch": 154} {"train_loss": -28.968826293945312, "global_step": 18687, "epoch": 154} {"train_loss": -28.804340362548828, "global_step": 18688, "epoch": 154} {"train_loss": -28.54547119140625, "global_step": 18689, "epoch": 154} {"train_loss": -28.79802894592285, "global_step": 18690, "epoch": 154} {"train_loss": -28.58245849609375, "global_step": 18691, "epoch": 154} {"train_loss": -28.9157657623291, "global_step": 18692, "epoch": 154} {"train_loss": -28.936847686767578, "global_step": 18693, "epoch": 154} {"train_loss": -28.718215942382812, "global_step": 18694, "epoch": 154} {"train_loss": -28.888385772705078, "global_step": 18695, "epoch": 154} {"train_loss": -28.5897216796875, "global_step": 18696, "epoch": 154} {"train_loss": -28.695098876953125, "global_step": 18697, "epoch": 154} {"train_loss": -28.92172622680664, "global_step": 18698, "epoch": 154} {"train_loss": -29.3863525390625, "global_step": 18699, "epoch": 154} {"train_loss": -29.182281494140625, "global_step": 18700, "epoch": 154} {"train_loss": -29.069278717041016, "global_step": 18701, "epoch": 154} {"train_loss": -29.157358169555664, "global_step": 18702, "epoch": 154} {"train_loss": -29.08631706237793, "global_step": 18703, "epoch": 154} {"train_loss": -29.346994400024414, "global_step": 18704, "epoch": 154} {"train_loss": -29.515302658081055, "global_step": 18705, "epoch": 154} {"train_loss": -29.116514205932617, "global_step": 18706, "epoch": 154} {"train_loss": -28.79986000061035, "global_step": 18707, "epoch": 154} {"train_loss": -29.37506103515625, "global_step": 18708, "epoch": 154} {"train_loss": -29.1837158203125, "global_step": 18709, "epoch": 154} {"train_loss": -29.107624053955078, "global_step": 18710, "epoch": 154} {"train_loss": -29.572126388549805, "global_step": 18711, "epoch": 154} {"train_loss": -29.2501163482666, "global_step": 18712, "epoch": 154} {"train_loss": -29.3607234954834, "global_step": 18713, "epoch": 154} {"train_loss": -29.2916316986084, "global_step": 18714, "epoch": 154} {"train_loss": -29.046295166015625, "global_step": 18715, "epoch": 154} {"train_loss": -29.541946411132812, "global_step": 18716, "epoch": 154} {"train_loss": -29.27304458618164, "global_step": 18717, "epoch": 154} {"train_loss": -29.131467819213867, "global_step": 18718, "epoch": 154} {"train_loss": -29.64484214782715, "global_step": 18719, "epoch": 154} {"train_loss": -29.42281150817871, "global_step": 18720, "epoch": 154} {"train_loss": -29.53321647644043, "global_step": 18721, "epoch": 154} {"train_loss": -29.206518173217773, "global_step": 18722, "epoch": 154} {"train_loss": -28.8912296295166, "global_step": 18723, "epoch": 154} {"train_loss": -29.25506591796875, "global_step": 18724, "epoch": 154} {"train_loss": -29.76093101501465, "global_step": 18725, "epoch": 154} {"train_loss": -29.386276245117188, "global_step": 18726, "epoch": 154} {"train_loss": -30.01824951171875, "global_step": 18727, "epoch": 154} {"train_loss": -29.570249557495117, "global_step": 18728, "epoch": 154} {"train_loss": -29.86703872680664, "global_step": 18729, "epoch": 154} {"train_loss": -29.40033531188965, "global_step": 18730, "epoch": 154} {"train_loss": -28.98296546936035, "global_step": 18731, "epoch": 154} {"train_loss": -29.786733627319336, "global_step": 18732, "epoch": 154} {"train_loss": -29.319913864135742, "global_step": 18733, "epoch": 154} {"train_loss": -29.332721710205078, "global_step": 18734, "epoch": 154} {"train_loss": -29.510303497314453, "global_step": 18735, "epoch": 154} {"train_loss": -29.256458282470703, "global_step": 18736, "epoch": 154} {"train_loss": -29.500497817993164, "global_step": 18737, "epoch": 154} {"train_loss": -29.26711082458496, "global_step": 18738, "epoch": 154} {"train_loss": -29.610071182250977, "global_step": 18739, "epoch": 154} {"train_loss": -29.121082305908203, "global_step": 18740, "epoch": 154} {"train_loss": -29.46221351623535, "global_step": 18741, "epoch": 154} {"train_loss": -29.80584144592285, "global_step": 18742, "epoch": 154} {"train_loss": -29.90079689025879, "global_step": 18743, "epoch": 154} {"train_loss": -29.78289222717285, "global_step": 18744, "epoch": 154} {"train_loss": -29.227603912353516, "global_step": 18745, "epoch": 154} {"train_loss": -29.72265625, "global_step": 18746, "epoch": 154} {"train_loss": -29.582502365112305, "global_step": 18747, "epoch": 154} {"train_loss": -28.713186264038086, "global_step": 18748, "epoch": 154} {"train_loss": -29.040128707885742, "global_step": 18749, "epoch": 154} {"train_loss": -28.674610137939453, "global_step": 18750, "epoch": 154} {"train_loss": -28.83302116394043, "global_step": 18751, "epoch": 154} {"train_loss": -28.331457138061523, "global_step": 18752, "epoch": 154} {"train_loss": -29.1889705657959, "global_step": 18753, "epoch": 154} {"train_loss": -28.857267742314615, "global_step": 18754, "epoch": 154, "val_loss": 2681224.25} {"train_loss": -29.45068359375, "global_step": 18755, "epoch": 155} {"train_loss": -29.715238571166992, "global_step": 18756, "epoch": 155} {"train_loss": -28.536914825439453, "global_step": 18757, "epoch": 155} {"train_loss": -28.54462242126465, "global_step": 18758, "epoch": 155} {"train_loss": -27.651260375976562, "global_step": 18759, "epoch": 155} {"train_loss": -28.226028442382812, "global_step": 18760, "epoch": 155} {"train_loss": -28.53228759765625, "global_step": 18761, "epoch": 155} {"train_loss": -29.67364501953125, "global_step": 18762, "epoch": 155} {"train_loss": -29.51386833190918, "global_step": 18763, "epoch": 155} {"train_loss": -28.71490478515625, "global_step": 18764, "epoch": 155} {"train_loss": -28.88848304748535, "global_step": 18765, "epoch": 155} {"train_loss": -28.8738956451416, "global_step": 18766, "epoch": 155} {"train_loss": -29.51666259765625, "global_step": 18767, "epoch": 155} {"train_loss": -29.209440231323242, "global_step": 18768, "epoch": 155} {"train_loss": -29.14606285095215, "global_step": 18769, "epoch": 155} {"train_loss": -28.73294448852539, "global_step": 18770, "epoch": 155} {"train_loss": -29.330854415893555, "global_step": 18771, "epoch": 155} {"train_loss": -28.81912612915039, "global_step": 18772, "epoch": 155} {"train_loss": -29.284032821655273, "global_step": 18773, "epoch": 155} {"train_loss": -29.70269203186035, "global_step": 18774, "epoch": 155} {"train_loss": -29.325544357299805, "global_step": 18775, "epoch": 155} {"train_loss": -29.17850112915039, "global_step": 18776, "epoch": 155} {"train_loss": -29.466907501220703, "global_step": 18777, "epoch": 155} {"train_loss": -30.10605239868164, "global_step": 18778, "epoch": 155} {"train_loss": -29.985336303710938, "global_step": 18779, "epoch": 155} {"train_loss": -29.257511138916016, "global_step": 18780, "epoch": 155} {"train_loss": -28.889545440673828, "global_step": 18781, "epoch": 155} {"train_loss": -29.825429916381836, "global_step": 18782, "epoch": 155} {"train_loss": -29.643447875976562, "global_step": 18783, "epoch": 155} {"train_loss": -29.426513671875, "global_step": 18784, "epoch": 155} {"train_loss": -28.77927589416504, "global_step": 18785, "epoch": 155} {"train_loss": -29.599689483642578, "global_step": 18786, "epoch": 155} {"train_loss": -29.6666259765625, "global_step": 18787, "epoch": 155} {"train_loss": -29.562421798706055, "global_step": 18788, "epoch": 155} {"train_loss": -27.89934730529785, "global_step": 18789, "epoch": 155} {"train_loss": -29.006601333618164, "global_step": 18790, "epoch": 155} {"train_loss": -29.45503044128418, "global_step": 18791, "epoch": 155} {"train_loss": -29.00613784790039, "global_step": 18792, "epoch": 155} {"train_loss": -29.36704444885254, "global_step": 18793, "epoch": 155} {"train_loss": -29.133832931518555, "global_step": 18794, "epoch": 155} {"train_loss": -29.4378719329834, "global_step": 18795, "epoch": 155} {"train_loss": -29.22132682800293, "global_step": 18796, "epoch": 155} {"train_loss": -28.908105850219727, "global_step": 18797, "epoch": 155} {"train_loss": -28.32356071472168, "global_step": 18798, "epoch": 155} {"train_loss": -29.419836044311523, "global_step": 18799, "epoch": 155} {"train_loss": -29.59360122680664, "global_step": 18800, "epoch": 155} {"train_loss": -28.730573654174805, "global_step": 18801, "epoch": 155} {"train_loss": -29.408605575561523, "global_step": 18802, "epoch": 155} {"train_loss": -29.861902236938477, "global_step": 18803, "epoch": 155} {"train_loss": -29.04518699645996, "global_step": 18804, "epoch": 155} {"train_loss": -28.677160263061523, "global_step": 18805, "epoch": 155} {"train_loss": -28.93828773498535, "global_step": 18806, "epoch": 155} {"train_loss": -27.86414909362793, "global_step": 18807, "epoch": 155} {"train_loss": -28.73581886291504, "global_step": 18808, "epoch": 155} {"train_loss": -29.615192413330078, "global_step": 18809, "epoch": 155} {"train_loss": -28.29502296447754, "global_step": 18810, "epoch": 155} {"train_loss": -27.4743595123291, "global_step": 18811, "epoch": 155} {"train_loss": -28.88739013671875, "global_step": 18812, "epoch": 155} {"train_loss": -29.0273380279541, "global_step": 18813, "epoch": 155} {"train_loss": -28.225305557250977, "global_step": 18814, "epoch": 155} {"train_loss": -29.709035873413086, "global_step": 18815, "epoch": 155} {"train_loss": -28.950796127319336, "global_step": 18816, "epoch": 155} {"train_loss": -28.487457275390625, "global_step": 18817, "epoch": 155} {"train_loss": -29.102643966674805, "global_step": 18818, "epoch": 155} {"train_loss": -29.149433135986328, "global_step": 18819, "epoch": 155} {"train_loss": -28.839527130126953, "global_step": 18820, "epoch": 155} {"train_loss": -29.050485610961914, "global_step": 18821, "epoch": 155} {"train_loss": -29.17719078063965, "global_step": 18822, "epoch": 155} {"train_loss": -28.810632705688477, "global_step": 18823, "epoch": 155} {"train_loss": -28.188262939453125, "global_step": 18824, "epoch": 155} {"train_loss": -29.099872589111328, "global_step": 18825, "epoch": 155} {"train_loss": -29.164325714111328, "global_step": 18826, "epoch": 155} {"train_loss": -29.353586196899414, "global_step": 18827, "epoch": 155} {"train_loss": -29.352136611938477, "global_step": 18828, "epoch": 155} {"train_loss": -28.7133731842041, "global_step": 18829, "epoch": 155} {"train_loss": -27.3861026763916, "global_step": 18830, "epoch": 155} {"train_loss": -26.5395565032959, "global_step": 18831, "epoch": 155} {"train_loss": -26.404775619506836, "global_step": 18832, "epoch": 155} {"train_loss": -28.558597564697266, "global_step": 18833, "epoch": 155} {"train_loss": -29.036670684814453, "global_step": 18834, "epoch": 155} {"train_loss": -26.731403350830078, "global_step": 18835, "epoch": 155} {"train_loss": -28.467615127563477, "global_step": 18836, "epoch": 155} {"train_loss": -28.834228515625, "global_step": 18837, "epoch": 155} {"train_loss": -28.359760284423828, "global_step": 18838, "epoch": 155} {"train_loss": -29.001352310180664, "global_step": 18839, "epoch": 155} {"train_loss": -28.453704833984375, "global_step": 18840, "epoch": 155} {"train_loss": -28.198057174682617, "global_step": 18841, "epoch": 155} {"train_loss": -27.459569931030273, "global_step": 18842, "epoch": 155} {"train_loss": -26.0457763671875, "global_step": 18843, "epoch": 155} {"train_loss": -28.839385986328125, "global_step": 18844, "epoch": 155} {"train_loss": -27.998754501342773, "global_step": 18845, "epoch": 155} {"train_loss": -27.81300163269043, "global_step": 18846, "epoch": 155} {"train_loss": -29.0656681060791, "global_step": 18847, "epoch": 155} {"train_loss": -27.99604606628418, "global_step": 18848, "epoch": 155} {"train_loss": -29.002197265625, "global_step": 18849, "epoch": 155} {"train_loss": -29.262924194335938, "global_step": 18850, "epoch": 155} {"train_loss": -28.453784942626953, "global_step": 18851, "epoch": 155} {"train_loss": -28.99485206604004, "global_step": 18852, "epoch": 155} {"train_loss": -29.255823135375977, "global_step": 18853, "epoch": 155} {"train_loss": -29.039663314819336, "global_step": 18854, "epoch": 155} {"train_loss": -29.31430435180664, "global_step": 18855, "epoch": 155} {"train_loss": -29.497159957885742, "global_step": 18856, "epoch": 155} {"train_loss": -29.19546890258789, "global_step": 18857, "epoch": 155} {"train_loss": -29.266010284423828, "global_step": 18858, "epoch": 155} {"train_loss": -29.451309204101562, "global_step": 18859, "epoch": 155} {"train_loss": -28.7043514251709, "global_step": 18860, "epoch": 155} {"train_loss": -29.444089889526367, "global_step": 18861, "epoch": 155} {"train_loss": -29.2573299407959, "global_step": 18862, "epoch": 155} {"train_loss": -29.464801788330078, "global_step": 18863, "epoch": 155} {"train_loss": -29.30914306640625, "global_step": 18864, "epoch": 155} {"train_loss": -29.699249267578125, "global_step": 18865, "epoch": 155} {"train_loss": -29.10268211364746, "global_step": 18866, "epoch": 155} {"train_loss": -28.67865562438965, "global_step": 18867, "epoch": 155} {"train_loss": -28.95356559753418, "global_step": 18868, "epoch": 155} {"train_loss": -29.008136749267578, "global_step": 18869, "epoch": 155} {"train_loss": -29.47920036315918, "global_step": 18870, "epoch": 155} {"train_loss": -28.611469268798828, "global_step": 18871, "epoch": 155} {"train_loss": -27.96575927734375, "global_step": 18872, "epoch": 155} {"train_loss": -27.443283081054688, "global_step": 18873, "epoch": 155} {"train_loss": -27.624521255493164, "global_step": 18874, "epoch": 155} {"train_loss": -28.856042483621394, "global_step": 18875, "epoch": 155, "val_loss": 2689497.75} {"train_loss": -27.700586318969727, "global_step": 18876, "epoch": 156} {"train_loss": -28.242298126220703, "global_step": 18877, "epoch": 156} {"train_loss": -28.398691177368164, "global_step": 18878, "epoch": 156} {"train_loss": -28.37577247619629, "global_step": 18879, "epoch": 156} {"train_loss": -29.12519645690918, "global_step": 18880, "epoch": 156} {"train_loss": -28.73537254333496, "global_step": 18881, "epoch": 156} {"train_loss": -28.26803970336914, "global_step": 18882, "epoch": 156} {"train_loss": -28.009366989135742, "global_step": 18883, "epoch": 156} {"train_loss": -28.764554977416992, "global_step": 18884, "epoch": 156} {"train_loss": -28.612112045288086, "global_step": 18885, "epoch": 156} {"train_loss": -29.663068771362305, "global_step": 18886, "epoch": 156} {"train_loss": -28.851882934570312, "global_step": 18887, "epoch": 156} {"train_loss": -27.9239559173584, "global_step": 18888, "epoch": 156} {"train_loss": -29.10348892211914, "global_step": 18889, "epoch": 156} {"train_loss": -29.16365623474121, "global_step": 18890, "epoch": 156} {"train_loss": -27.618886947631836, "global_step": 18891, "epoch": 156} {"train_loss": -28.42498207092285, "global_step": 18892, "epoch": 156} {"train_loss": -29.65618324279785, "global_step": 18893, "epoch": 156} {"train_loss": -27.648117065429688, "global_step": 18894, "epoch": 156} {"train_loss": -28.03682518005371, "global_step": 18895, "epoch": 156} {"train_loss": -29.324914932250977, "global_step": 18896, "epoch": 156} {"train_loss": -27.879505157470703, "global_step": 18897, "epoch": 156} {"train_loss": -29.437475204467773, "global_step": 18898, "epoch": 156} {"train_loss": -29.138620376586914, "global_step": 18899, "epoch": 156} {"train_loss": -28.40423583984375, "global_step": 18900, "epoch": 156} {"train_loss": -29.779539108276367, "global_step": 18901, "epoch": 156} {"train_loss": -29.339197158813477, "global_step": 18902, "epoch": 156} {"train_loss": -29.621667861938477, "global_step": 18903, "epoch": 156} {"train_loss": -29.07073974609375, "global_step": 18904, "epoch": 156} {"train_loss": -29.04489517211914, "global_step": 18905, "epoch": 156} {"train_loss": -29.22539710998535, "global_step": 18906, "epoch": 156} {"train_loss": -28.869474411010742, "global_step": 18907, "epoch": 156} {"train_loss": -29.402099609375, "global_step": 18908, "epoch": 156} {"train_loss": -29.376523971557617, "global_step": 18909, "epoch": 156} {"train_loss": -28.862150192260742, "global_step": 18910, "epoch": 156} {"train_loss": -29.443756103515625, "global_step": 18911, "epoch": 156} {"train_loss": -29.44993019104004, "global_step": 18912, "epoch": 156} {"train_loss": -28.661161422729492, "global_step": 18913, "epoch": 156} {"train_loss": -29.514820098876953, "global_step": 18914, "epoch": 156} {"train_loss": -29.603540420532227, "global_step": 18915, "epoch": 156} {"train_loss": -29.337696075439453, "global_step": 18916, "epoch": 156} {"train_loss": -29.310941696166992, "global_step": 18917, "epoch": 156} {"train_loss": -29.15460205078125, "global_step": 18918, "epoch": 156} {"train_loss": -29.846323013305664, "global_step": 18919, "epoch": 156} {"train_loss": -29.513029098510742, "global_step": 18920, "epoch": 156} {"train_loss": -29.267932891845703, "global_step": 18921, "epoch": 156} {"train_loss": -29.622526168823242, "global_step": 18922, "epoch": 156} {"train_loss": -29.798542022705078, "global_step": 18923, "epoch": 156} {"train_loss": -28.623456954956055, "global_step": 18924, "epoch": 156} {"train_loss": -28.455978393554688, "global_step": 18925, "epoch": 156} {"train_loss": -27.690113067626953, "global_step": 18926, "epoch": 156} {"train_loss": -29.129491806030273, "global_step": 18927, "epoch": 156} {"train_loss": -29.65325355529785, "global_step": 18928, "epoch": 156} {"train_loss": -29.22187614440918, "global_step": 18929, "epoch": 156} {"train_loss": -28.601892471313477, "global_step": 18930, "epoch": 156} {"train_loss": -29.376270294189453, "global_step": 18931, "epoch": 156} {"train_loss": -29.157001495361328, "global_step": 18932, "epoch": 156} {"train_loss": -29.042510986328125, "global_step": 18933, "epoch": 156} {"train_loss": -29.327985763549805, "global_step": 18934, "epoch": 156} {"train_loss": -29.462549209594727, "global_step": 18935, "epoch": 156} {"train_loss": -29.26127052307129, "global_step": 18936, "epoch": 156} {"train_loss": -29.50147819519043, "global_step": 18937, "epoch": 156} {"train_loss": -29.373865127563477, "global_step": 18938, "epoch": 156} {"train_loss": -29.42941665649414, "global_step": 18939, "epoch": 156} {"train_loss": -29.424972534179688, "global_step": 18940, "epoch": 156} {"train_loss": -28.739194869995117, "global_step": 18941, "epoch": 156} {"train_loss": -28.975418090820312, "global_step": 18942, "epoch": 156} {"train_loss": -28.133249282836914, "global_step": 18943, "epoch": 156} {"train_loss": -29.57087516784668, "global_step": 18944, "epoch": 156} {"train_loss": -28.843387603759766, "global_step": 18945, "epoch": 156} {"train_loss": -30.104333877563477, "global_step": 18946, "epoch": 156} {"train_loss": -28.766265869140625, "global_step": 18947, "epoch": 156} {"train_loss": -29.595947265625, "global_step": 18948, "epoch": 156} {"train_loss": -29.869958877563477, "global_step": 18949, "epoch": 156} {"train_loss": -29.34235191345215, "global_step": 18950, "epoch": 156} {"train_loss": -29.718149185180664, "global_step": 18951, "epoch": 156} {"train_loss": -29.74728775024414, "global_step": 18952, "epoch": 156} {"train_loss": -29.65250587463379, "global_step": 18953, "epoch": 156} {"train_loss": -29.8350772857666, "global_step": 18954, "epoch": 156} {"train_loss": -29.101858139038086, "global_step": 18955, "epoch": 156} {"train_loss": -28.129064559936523, "global_step": 18956, "epoch": 156} {"train_loss": -28.3739013671875, "global_step": 18957, "epoch": 156} {"train_loss": -28.855249404907227, "global_step": 18958, "epoch": 156} {"train_loss": -29.594324111938477, "global_step": 18959, "epoch": 156} {"train_loss": -29.322416305541992, "global_step": 18960, "epoch": 156} {"train_loss": -28.558263778686523, "global_step": 18961, "epoch": 156} {"train_loss": -29.065587997436523, "global_step": 18962, "epoch": 156} {"train_loss": -29.262388229370117, "global_step": 18963, "epoch": 156} {"train_loss": -28.375030517578125, "global_step": 18964, "epoch": 156} {"train_loss": -26.9113712310791, "global_step": 18965, "epoch": 156} {"train_loss": -29.043472290039062, "global_step": 18966, "epoch": 156} {"train_loss": -29.20222282409668, "global_step": 18967, "epoch": 156} {"train_loss": -28.110279083251953, "global_step": 18968, "epoch": 156} {"train_loss": -29.25640296936035, "global_step": 18969, "epoch": 156} {"train_loss": -28.827436447143555, "global_step": 18970, "epoch": 156} {"train_loss": -29.271268844604492, "global_step": 18971, "epoch": 156} {"train_loss": -29.420654296875, "global_step": 18972, "epoch": 156} {"train_loss": -28.641468048095703, "global_step": 18973, "epoch": 156} {"train_loss": -29.443023681640625, "global_step": 18974, "epoch": 156} {"train_loss": -29.564191818237305, "global_step": 18975, "epoch": 156} {"train_loss": -29.328235626220703, "global_step": 18976, "epoch": 156} {"train_loss": -29.709644317626953, "global_step": 18977, "epoch": 156} {"train_loss": -29.900915145874023, "global_step": 18978, "epoch": 156} {"train_loss": -29.39930534362793, "global_step": 18979, "epoch": 156} {"train_loss": -29.007177352905273, "global_step": 18980, "epoch": 156} {"train_loss": -29.724035263061523, "global_step": 18981, "epoch": 156} {"train_loss": -29.29437255859375, "global_step": 18982, "epoch": 156} {"train_loss": -29.372400283813477, "global_step": 18983, "epoch": 156} {"train_loss": -29.593774795532227, "global_step": 18984, "epoch": 156} {"train_loss": -29.52495765686035, "global_step": 18985, "epoch": 156} {"train_loss": -29.09488296508789, "global_step": 18986, "epoch": 156} {"train_loss": -29.08722496032715, "global_step": 18987, "epoch": 156} {"train_loss": -28.432373046875, "global_step": 18988, "epoch": 156} {"train_loss": -27.695880889892578, "global_step": 18989, "epoch": 156} {"train_loss": -28.43910026550293, "global_step": 18990, "epoch": 156} {"train_loss": -28.4268741607666, "global_step": 18991, "epoch": 156} {"train_loss": -29.687971115112305, "global_step": 18992, "epoch": 156} {"train_loss": -29.403106689453125, "global_step": 18993, "epoch": 156} {"train_loss": -27.824604034423828, "global_step": 18994, "epoch": 156} {"train_loss": -26.35755729675293, "global_step": 18995, "epoch": 156} {"train_loss": -28.995080522269255, "global_step": 18996, "epoch": 156, "val_loss": 2736075.25} {"train_loss": -29.438756942749023, "global_step": 18997, "epoch": 157} {"train_loss": -28.905431747436523, "global_step": 18998, "epoch": 157} {"train_loss": -28.72633171081543, "global_step": 18999, "epoch": 157} {"train_loss": -28.876453399658203, "global_step": 19000, "epoch": 157} {"train_loss": -29.003259658813477, "global_step": 19001, "epoch": 157} {"train_loss": -29.35639762878418, "global_step": 19002, "epoch": 157} {"train_loss": -29.462234497070312, "global_step": 19003, "epoch": 157} {"train_loss": -28.867267608642578, "global_step": 19004, "epoch": 157} {"train_loss": -29.2009334564209, "global_step": 19005, "epoch": 157} {"train_loss": -29.086170196533203, "global_step": 19006, "epoch": 157} {"train_loss": -29.257299423217773, "global_step": 19007, "epoch": 157} {"train_loss": -29.55535316467285, "global_step": 19008, "epoch": 157} {"train_loss": -29.071008682250977, "global_step": 19009, "epoch": 157} {"train_loss": -28.897733688354492, "global_step": 19010, "epoch": 157} {"train_loss": -28.983137130737305, "global_step": 19011, "epoch": 157} {"train_loss": -29.18362808227539, "global_step": 19012, "epoch": 157} {"train_loss": -27.331375122070312, "global_step": 19013, "epoch": 157} {"train_loss": -26.448486328125, "global_step": 19014, "epoch": 157} {"train_loss": -25.908658981323242, "global_step": 19015, "epoch": 157} {"train_loss": -27.446374893188477, "global_step": 19016, "epoch": 157} {"train_loss": -28.706409454345703, "global_step": 19017, "epoch": 157} {"train_loss": -29.069766998291016, "global_step": 19018, "epoch": 157} {"train_loss": -28.80060386657715, "global_step": 19019, "epoch": 157} {"train_loss": -28.463642120361328, "global_step": 19020, "epoch": 157} {"train_loss": -28.70965576171875, "global_step": 19021, "epoch": 157} {"train_loss": -28.33704948425293, "global_step": 19022, "epoch": 157} {"train_loss": -27.20963478088379, "global_step": 19023, "epoch": 157} {"train_loss": -28.985883712768555, "global_step": 19024, "epoch": 157} {"train_loss": -28.84762954711914, "global_step": 19025, "epoch": 157} {"train_loss": -28.546247482299805, "global_step": 19026, "epoch": 157} {"train_loss": -29.473281860351562, "global_step": 19027, "epoch": 157} {"train_loss": -28.400983810424805, "global_step": 19028, "epoch": 157} {"train_loss": -29.521167755126953, "global_step": 19029, "epoch": 157} {"train_loss": -29.071643829345703, "global_step": 19030, "epoch": 157} {"train_loss": -29.076765060424805, "global_step": 19031, "epoch": 157} {"train_loss": -28.826248168945312, "global_step": 19032, "epoch": 157} {"train_loss": -29.35955810546875, "global_step": 19033, "epoch": 157} {"train_loss": -28.663471221923828, "global_step": 19034, "epoch": 157} {"train_loss": -28.687042236328125, "global_step": 19035, "epoch": 157} {"train_loss": -29.305078506469727, "global_step": 19036, "epoch": 157} {"train_loss": -29.149738311767578, "global_step": 19037, "epoch": 157} {"train_loss": -28.80755615234375, "global_step": 19038, "epoch": 157} {"train_loss": -29.5195369720459, "global_step": 19039, "epoch": 157} {"train_loss": -28.87140464782715, "global_step": 19040, "epoch": 157} {"train_loss": -29.154794692993164, "global_step": 19041, "epoch": 157} {"train_loss": -28.87103843688965, "global_step": 19042, "epoch": 157} {"train_loss": -29.144433975219727, "global_step": 19043, "epoch": 157} {"train_loss": -28.754297256469727, "global_step": 19044, "epoch": 157} {"train_loss": -28.68568229675293, "global_step": 19045, "epoch": 157} {"train_loss": -29.5808048248291, "global_step": 19046, "epoch": 157} {"train_loss": -29.540678024291992, "global_step": 19047, "epoch": 157} {"train_loss": -29.073347091674805, "global_step": 19048, "epoch": 157} {"train_loss": -29.054712295532227, "global_step": 19049, "epoch": 157} {"train_loss": -29.01258659362793, "global_step": 19050, "epoch": 157} {"train_loss": -29.342878341674805, "global_step": 19051, "epoch": 157} {"train_loss": -29.3726863861084, "global_step": 19052, "epoch": 157} {"train_loss": -29.40482521057129, "global_step": 19053, "epoch": 157} {"train_loss": -29.283756256103516, "global_step": 19054, "epoch": 157} {"train_loss": -29.43153190612793, "global_step": 19055, "epoch": 157} {"train_loss": -29.758581161499023, "global_step": 19056, "epoch": 157} {"train_loss": -29.472766876220703, "global_step": 19057, "epoch": 157} {"train_loss": -28.925708770751953, "global_step": 19058, "epoch": 157} {"train_loss": -29.28596305847168, "global_step": 19059, "epoch": 157} {"train_loss": -29.541791915893555, "global_step": 19060, "epoch": 157} {"train_loss": -29.52377700805664, "global_step": 19061, "epoch": 157} {"train_loss": -29.1160831451416, "global_step": 19062, "epoch": 157} {"train_loss": -29.718366622924805, "global_step": 19063, "epoch": 157} {"train_loss": -29.99814224243164, "global_step": 19064, "epoch": 157} {"train_loss": -29.76822280883789, "global_step": 19065, "epoch": 157} {"train_loss": -29.495365142822266, "global_step": 19066, "epoch": 157} {"train_loss": -29.183944702148438, "global_step": 19067, "epoch": 157} {"train_loss": -29.366180419921875, "global_step": 19068, "epoch": 157} {"train_loss": -29.840723037719727, "global_step": 19069, "epoch": 157} {"train_loss": -29.646814346313477, "global_step": 19070, "epoch": 157} {"train_loss": -29.709091186523438, "global_step": 19071, "epoch": 157} {"train_loss": -30.03692054748535, "global_step": 19072, "epoch": 157} {"train_loss": -29.10052490234375, "global_step": 19073, "epoch": 157} {"train_loss": -29.69703483581543, "global_step": 19074, "epoch": 157} {"train_loss": -29.183837890625, "global_step": 19075, "epoch": 157} {"train_loss": -29.7982120513916, "global_step": 19076, "epoch": 157} {"train_loss": -29.99286460876465, "global_step": 19077, "epoch": 157} {"train_loss": -29.52959632873535, "global_step": 19078, "epoch": 157} {"train_loss": -29.19219398498535, "global_step": 19079, "epoch": 157} {"train_loss": -29.077421188354492, "global_step": 19080, "epoch": 157} {"train_loss": -28.564483642578125, "global_step": 19081, "epoch": 157} {"train_loss": -28.582351684570312, "global_step": 19082, "epoch": 157} {"train_loss": -28.798437118530273, "global_step": 19083, "epoch": 157} {"train_loss": -29.640161514282227, "global_step": 19084, "epoch": 157} {"train_loss": -29.781736373901367, "global_step": 19085, "epoch": 157} {"train_loss": -28.7457332611084, "global_step": 19086, "epoch": 157} {"train_loss": -28.22891616821289, "global_step": 19087, "epoch": 157} {"train_loss": -25.22176170349121, "global_step": 19088, "epoch": 157} {"train_loss": -25.796045303344727, "global_step": 19089, "epoch": 157} {"train_loss": -29.471149444580078, "global_step": 19090, "epoch": 157} {"train_loss": -27.593433380126953, "global_step": 19091, "epoch": 157} {"train_loss": -25.236927032470703, "global_step": 19092, "epoch": 157} {"train_loss": -28.5393009185791, "global_step": 19093, "epoch": 157} {"train_loss": -28.8978214263916, "global_step": 19094, "epoch": 157} {"train_loss": -27.04781150817871, "global_step": 19095, "epoch": 157} {"train_loss": -29.764062881469727, "global_step": 19096, "epoch": 157} {"train_loss": -27.806121826171875, "global_step": 19097, "epoch": 157} {"train_loss": -28.8088321685791, "global_step": 19098, "epoch": 157} {"train_loss": -28.58953857421875, "global_step": 19099, "epoch": 157} {"train_loss": -29.015100479125977, "global_step": 19100, "epoch": 157} {"train_loss": -28.599409103393555, "global_step": 19101, "epoch": 157} {"train_loss": -29.30240249633789, "global_step": 19102, "epoch": 157} {"train_loss": -28.89320182800293, "global_step": 19103, "epoch": 157} {"train_loss": -29.203632354736328, "global_step": 19104, "epoch": 157} {"train_loss": -29.58786964416504, "global_step": 19105, "epoch": 157} {"train_loss": -29.1063175201416, "global_step": 19106, "epoch": 157} {"train_loss": -29.815841674804688, "global_step": 19107, "epoch": 157} {"train_loss": -29.24273109436035, "global_step": 19108, "epoch": 157} {"train_loss": -29.36394691467285, "global_step": 19109, "epoch": 157} {"train_loss": -29.49518394470215, "global_step": 19110, "epoch": 157} {"train_loss": -29.31744384765625, "global_step": 19111, "epoch": 157} {"train_loss": -29.3839054107666, "global_step": 19112, "epoch": 157} {"train_loss": -29.629552841186523, "global_step": 19113, "epoch": 157} {"train_loss": -29.637969970703125, "global_step": 19114, "epoch": 157} {"train_loss": -29.76685905456543, "global_step": 19115, "epoch": 157} {"train_loss": -29.31402587890625, "global_step": 19116, "epoch": 157} {"train_loss": -28.957682459807593, "global_step": 19117, "epoch": 157, "val_loss": 2623117.75} {"train_loss": -28.94345474243164, "global_step": 19118, "epoch": 158} {"train_loss": -28.748106002807617, "global_step": 19119, "epoch": 158} {"train_loss": -28.707427978515625, "global_step": 19120, "epoch": 158} {"train_loss": -28.222869873046875, "global_step": 19121, "epoch": 158} {"train_loss": -29.328577041625977, "global_step": 19122, "epoch": 158} {"train_loss": -28.446752548217773, "global_step": 19123, "epoch": 158} {"train_loss": -29.051441192626953, "global_step": 19124, "epoch": 158} {"train_loss": -29.230077743530273, "global_step": 19125, "epoch": 158} {"train_loss": -29.521032333374023, "global_step": 19126, "epoch": 158} {"train_loss": -29.100873947143555, "global_step": 19127, "epoch": 158} {"train_loss": -28.676410675048828, "global_step": 19128, "epoch": 158} {"train_loss": -29.6140193939209, "global_step": 19129, "epoch": 158} {"train_loss": -28.397369384765625, "global_step": 19130, "epoch": 158} {"train_loss": -29.9295711517334, "global_step": 19131, "epoch": 158} {"train_loss": -28.519412994384766, "global_step": 19132, "epoch": 158} {"train_loss": -29.07232093811035, "global_step": 19133, "epoch": 158} {"train_loss": -29.45020866394043, "global_step": 19134, "epoch": 158} {"train_loss": -29.408588409423828, "global_step": 19135, "epoch": 158} {"train_loss": -29.630908966064453, "global_step": 19136, "epoch": 158} {"train_loss": -28.996753692626953, "global_step": 19137, "epoch": 158} {"train_loss": -28.669031143188477, "global_step": 19138, "epoch": 158} {"train_loss": -27.853652954101562, "global_step": 19139, "epoch": 158} {"train_loss": -28.767913818359375, "global_step": 19140, "epoch": 158} {"train_loss": -27.995685577392578, "global_step": 19141, "epoch": 158} {"train_loss": -28.6414794921875, "global_step": 19142, "epoch": 158} {"train_loss": -29.571439743041992, "global_step": 19143, "epoch": 158} {"train_loss": -28.362823486328125, "global_step": 19144, "epoch": 158} {"train_loss": -28.169574737548828, "global_step": 19145, "epoch": 158} {"train_loss": -29.90360450744629, "global_step": 19146, "epoch": 158} {"train_loss": -28.863739013671875, "global_step": 19147, "epoch": 158} {"train_loss": -28.237934112548828, "global_step": 19148, "epoch": 158} {"train_loss": -29.3011531829834, "global_step": 19149, "epoch": 158} {"train_loss": -28.385272979736328, "global_step": 19150, "epoch": 158} {"train_loss": -29.16777992248535, "global_step": 19151, "epoch": 158} {"train_loss": -27.931501388549805, "global_step": 19152, "epoch": 158} {"train_loss": -28.59760856628418, "global_step": 19153, "epoch": 158} {"train_loss": -26.46876335144043, "global_step": 19154, "epoch": 158} {"train_loss": -25.729928970336914, "global_step": 19155, "epoch": 158} {"train_loss": -28.10920524597168, "global_step": 19156, "epoch": 158} {"train_loss": -28.198516845703125, "global_step": 19157, "epoch": 158} {"train_loss": -28.007587432861328, "global_step": 19158, "epoch": 158} {"train_loss": -27.952524185180664, "global_step": 19159, "epoch": 158} {"train_loss": -28.619876861572266, "global_step": 19160, "epoch": 158} {"train_loss": -27.97381591796875, "global_step": 19161, "epoch": 158} {"train_loss": -27.707849502563477, "global_step": 19162, "epoch": 158} {"train_loss": -28.56572914123535, "global_step": 19163, "epoch": 158} {"train_loss": -28.930267333984375, "global_step": 19164, "epoch": 158} {"train_loss": -28.796762466430664, "global_step": 19165, "epoch": 158} {"train_loss": -27.756113052368164, "global_step": 19166, "epoch": 158} {"train_loss": -28.356367111206055, "global_step": 19167, "epoch": 158} {"train_loss": -28.7083797454834, "global_step": 19168, "epoch": 158} {"train_loss": -29.24604606628418, "global_step": 19169, "epoch": 158} {"train_loss": -28.720197677612305, "global_step": 19170, "epoch": 158} {"train_loss": -28.905303955078125, "global_step": 19171, "epoch": 158} {"train_loss": -28.868900299072266, "global_step": 19172, "epoch": 158} {"train_loss": -29.056116104125977, "global_step": 19173, "epoch": 158} {"train_loss": -29.15669059753418, "global_step": 19174, "epoch": 158} {"train_loss": -29.5053653717041, "global_step": 19175, "epoch": 158} {"train_loss": -28.585926055908203, "global_step": 19176, "epoch": 158} {"train_loss": -29.077245712280273, "global_step": 19177, "epoch": 158} {"train_loss": -29.080245971679688, "global_step": 19178, "epoch": 158} {"train_loss": -28.551794052124023, "global_step": 19179, "epoch": 158} {"train_loss": -28.86220359802246, "global_step": 19180, "epoch": 158} {"train_loss": -29.24480628967285, "global_step": 19181, "epoch": 158} {"train_loss": -28.92954444885254, "global_step": 19182, "epoch": 158} {"train_loss": -28.75872230529785, "global_step": 19183, "epoch": 158} {"train_loss": -29.51014518737793, "global_step": 19184, "epoch": 158} {"train_loss": -29.639347076416016, "global_step": 19185, "epoch": 158} {"train_loss": -28.801843643188477, "global_step": 19186, "epoch": 158} {"train_loss": -29.375564575195312, "global_step": 19187, "epoch": 158} {"train_loss": -29.583942413330078, "global_step": 19188, "epoch": 158} {"train_loss": -29.35397720336914, "global_step": 19189, "epoch": 158} {"train_loss": -29.295324325561523, "global_step": 19190, "epoch": 158} {"train_loss": -29.369855880737305, "global_step": 19191, "epoch": 158} {"train_loss": -29.7017822265625, "global_step": 19192, "epoch": 158} {"train_loss": -29.7940673828125, "global_step": 19193, "epoch": 158} {"train_loss": -29.401464462280273, "global_step": 19194, "epoch": 158} {"train_loss": -29.695281982421875, "global_step": 19195, "epoch": 158} {"train_loss": -29.84479331970215, "global_step": 19196, "epoch": 158} {"train_loss": -29.112096786499023, "global_step": 19197, "epoch": 158} {"train_loss": -29.291473388671875, "global_step": 19198, "epoch": 158} {"train_loss": -29.971363067626953, "global_step": 19199, "epoch": 158} {"train_loss": -29.333707809448242, "global_step": 19200, "epoch": 158} {"train_loss": -29.475738525390625, "global_step": 19201, "epoch": 158} {"train_loss": -29.82343101501465, "global_step": 19202, "epoch": 158} {"train_loss": -29.74372673034668, "global_step": 19203, "epoch": 158} {"train_loss": -29.301000595092773, "global_step": 19204, "epoch": 158} {"train_loss": -29.859115600585938, "global_step": 19205, "epoch": 158} {"train_loss": -29.794147491455078, "global_step": 19206, "epoch": 158} {"train_loss": -29.18389892578125, "global_step": 19207, "epoch": 158} {"train_loss": -28.872766494750977, "global_step": 19208, "epoch": 158} {"train_loss": -29.930334091186523, "global_step": 19209, "epoch": 158} {"train_loss": -29.6885929107666, "global_step": 19210, "epoch": 158} {"train_loss": -29.500776290893555, "global_step": 19211, "epoch": 158} {"train_loss": -29.629413604736328, "global_step": 19212, "epoch": 158} {"train_loss": -29.392627716064453, "global_step": 19213, "epoch": 158} {"train_loss": -29.431562423706055, "global_step": 19214, "epoch": 158} {"train_loss": -28.738571166992188, "global_step": 19215, "epoch": 158} {"train_loss": -29.586755752563477, "global_step": 19216, "epoch": 158} {"train_loss": -29.553192138671875, "global_step": 19217, "epoch": 158} {"train_loss": -29.552194595336914, "global_step": 19218, "epoch": 158} {"train_loss": -30.05242919921875, "global_step": 19219, "epoch": 158} {"train_loss": -29.745441436767578, "global_step": 19220, "epoch": 158} {"train_loss": -29.905364990234375, "global_step": 19221, "epoch": 158} {"train_loss": -29.914813995361328, "global_step": 19222, "epoch": 158} {"train_loss": -30.1301212310791, "global_step": 19223, "epoch": 158} {"train_loss": -29.982486724853516, "global_step": 19224, "epoch": 158} {"train_loss": -29.313446044921875, "global_step": 19225, "epoch": 158} {"train_loss": -30.074934005737305, "global_step": 19226, "epoch": 158} {"train_loss": -29.864789962768555, "global_step": 19227, "epoch": 158} {"train_loss": -30.037372589111328, "global_step": 19228, "epoch": 158} {"train_loss": -29.925031661987305, "global_step": 19229, "epoch": 158} {"train_loss": -28.653013229370117, "global_step": 19230, "epoch": 158} {"train_loss": -27.394636154174805, "global_step": 19231, "epoch": 158} {"train_loss": -29.25846290588379, "global_step": 19232, "epoch": 158} {"train_loss": -29.0218448638916, "global_step": 19233, "epoch": 158} {"train_loss": -26.0224552154541, "global_step": 19234, "epoch": 158} {"train_loss": -26.632917404174805, "global_step": 19235, "epoch": 158} {"train_loss": -25.61355972290039, "global_step": 19236, "epoch": 158} {"train_loss": -24.75969123840332, "global_step": 19237, "epoch": 158} {"train_loss": -28.921139535825116, "global_step": 19238, "epoch": 158, "val_loss": 2750644.75} {"train_loss": -27.606342315673828, "global_step": 19239, "epoch": 159} {"train_loss": -25.57542610168457, "global_step": 19240, "epoch": 159} {"train_loss": -28.038000106811523, "global_step": 19241, "epoch": 159} {"train_loss": -26.58599281311035, "global_step": 19242, "epoch": 159} {"train_loss": -29.15179443359375, "global_step": 19243, "epoch": 159} {"train_loss": -27.673505783081055, "global_step": 19244, "epoch": 159} {"train_loss": -28.073911666870117, "global_step": 19245, "epoch": 159} {"train_loss": -28.95904541015625, "global_step": 19246, "epoch": 159} {"train_loss": -28.168664932250977, "global_step": 19247, "epoch": 159} {"train_loss": -28.454345703125, "global_step": 19248, "epoch": 159} {"train_loss": -28.916467666625977, "global_step": 19249, "epoch": 159} {"train_loss": -27.742578506469727, "global_step": 19250, "epoch": 159} {"train_loss": -28.321985244750977, "global_step": 19251, "epoch": 159} {"train_loss": -28.6602783203125, "global_step": 19252, "epoch": 159} {"train_loss": -28.438800811767578, "global_step": 19253, "epoch": 159} {"train_loss": -29.554059982299805, "global_step": 19254, "epoch": 159} {"train_loss": -28.903249740600586, "global_step": 19255, "epoch": 159} {"train_loss": -29.066761016845703, "global_step": 19256, "epoch": 159} {"train_loss": -28.787561416625977, "global_step": 19257, "epoch": 159} {"train_loss": -29.102529525756836, "global_step": 19258, "epoch": 159} {"train_loss": -29.08015251159668, "global_step": 19259, "epoch": 159} {"train_loss": -29.310882568359375, "global_step": 19260, "epoch": 159} {"train_loss": -29.196258544921875, "global_step": 19261, "epoch": 159} {"train_loss": -28.940723419189453, "global_step": 19262, "epoch": 159} {"train_loss": -29.243000030517578, "global_step": 19263, "epoch": 159} {"train_loss": -29.269025802612305, "global_step": 19264, "epoch": 159} {"train_loss": -29.6333065032959, "global_step": 19265, "epoch": 159} {"train_loss": -28.086109161376953, "global_step": 19266, "epoch": 159} {"train_loss": -29.310449600219727, "global_step": 19267, "epoch": 159} {"train_loss": -28.50895118713379, "global_step": 19268, "epoch": 159} {"train_loss": -28.40520668029785, "global_step": 19269, "epoch": 159} {"train_loss": -28.555023193359375, "global_step": 19270, "epoch": 159} {"train_loss": -28.65337562561035, "global_step": 19271, "epoch": 159} {"train_loss": -28.713834762573242, "global_step": 19272, "epoch": 159} {"train_loss": -29.120471954345703, "global_step": 19273, "epoch": 159} {"train_loss": -28.497913360595703, "global_step": 19274, "epoch": 159} {"train_loss": -29.722797393798828, "global_step": 19275, "epoch": 159} {"train_loss": -29.33233642578125, "global_step": 19276, "epoch": 159} {"train_loss": -29.534759521484375, "global_step": 19277, "epoch": 159} {"train_loss": -29.57503318786621, "global_step": 19278, "epoch": 159} {"train_loss": -29.079715728759766, "global_step": 19279, "epoch": 159} {"train_loss": -29.341461181640625, "global_step": 19280, "epoch": 159} {"train_loss": -29.4371280670166, "global_step": 19281, "epoch": 159} {"train_loss": -28.623746871948242, "global_step": 19282, "epoch": 159} {"train_loss": -29.7249698638916, "global_step": 19283, "epoch": 159} {"train_loss": -28.69053077697754, "global_step": 19284, "epoch": 159} {"train_loss": -28.267847061157227, "global_step": 19285, "epoch": 159} {"train_loss": -28.089340209960938, "global_step": 19286, "epoch": 159} {"train_loss": -29.35978126525879, "global_step": 19287, "epoch": 159} {"train_loss": -29.18798828125, "global_step": 19288, "epoch": 159} {"train_loss": -29.232580184936523, "global_step": 19289, "epoch": 159} {"train_loss": -29.527021408081055, "global_step": 19290, "epoch": 159} {"train_loss": -29.78521728515625, "global_step": 19291, "epoch": 159} {"train_loss": -29.049962997436523, "global_step": 19292, "epoch": 159} {"train_loss": -28.789794921875, "global_step": 19293, "epoch": 159} {"train_loss": -29.10222816467285, "global_step": 19294, "epoch": 159} {"train_loss": -29.80962562561035, "global_step": 19295, "epoch": 159} {"train_loss": -29.534677505493164, "global_step": 19296, "epoch": 159} {"train_loss": -29.674640655517578, "global_step": 19297, "epoch": 159} {"train_loss": -29.366626739501953, "global_step": 19298, "epoch": 159} {"train_loss": -29.85462760925293, "global_step": 19299, "epoch": 159} {"train_loss": -29.9350643157959, "global_step": 19300, "epoch": 159} {"train_loss": -29.34844970703125, "global_step": 19301, "epoch": 159} {"train_loss": -29.550622940063477, "global_step": 19302, "epoch": 159} {"train_loss": -29.74906349182129, "global_step": 19303, "epoch": 159} {"train_loss": -29.800601959228516, "global_step": 19304, "epoch": 159} {"train_loss": -30.11810302734375, "global_step": 19305, "epoch": 159} {"train_loss": -29.652057647705078, "global_step": 19306, "epoch": 159} {"train_loss": -29.569061279296875, "global_step": 19307, "epoch": 159} {"train_loss": -29.539966583251953, "global_step": 19308, "epoch": 159} {"train_loss": -28.765653610229492, "global_step": 19309, "epoch": 159} {"train_loss": -29.659940719604492, "global_step": 19310, "epoch": 159} {"train_loss": -29.17645263671875, "global_step": 19311, "epoch": 159} {"train_loss": -29.25823974609375, "global_step": 19312, "epoch": 159} {"train_loss": -29.582611083984375, "global_step": 19313, "epoch": 159} {"train_loss": -29.234663009643555, "global_step": 19314, "epoch": 159} {"train_loss": -29.671218872070312, "global_step": 19315, "epoch": 159} {"train_loss": -29.962665557861328, "global_step": 19316, "epoch": 159} {"train_loss": -29.657424926757812, "global_step": 19317, "epoch": 159} {"train_loss": -27.92811393737793, "global_step": 19318, "epoch": 159} {"train_loss": -26.014163970947266, "global_step": 19319, "epoch": 159} {"train_loss": -16.8327693939209, "global_step": 19320, "epoch": 159} {"train_loss": -6.365520000457764, "global_step": 19321, "epoch": 159} {"train_loss": -23.654809951782227, "global_step": 19322, "epoch": 159} {"train_loss": -22.012908935546875, "global_step": 19323, "epoch": 159} {"train_loss": -22.33785057067871, "global_step": 19324, "epoch": 159} {"train_loss": -23.041637420654297, "global_step": 19325, "epoch": 159} {"train_loss": -28.261388778686523, "global_step": 19326, "epoch": 159} {"train_loss": -22.816640853881836, "global_step": 19327, "epoch": 159} {"train_loss": -28.23432731628418, "global_step": 19328, "epoch": 159} {"train_loss": -25.5352783203125, "global_step": 19329, "epoch": 159} {"train_loss": -27.183435440063477, "global_step": 19330, "epoch": 159} {"train_loss": -26.219640731811523, "global_step": 19331, "epoch": 159} {"train_loss": -28.016164779663086, "global_step": 19332, "epoch": 159} {"train_loss": -27.015735626220703, "global_step": 19333, "epoch": 159} {"train_loss": -27.364912033081055, "global_step": 19334, "epoch": 159} {"train_loss": -27.69734764099121, "global_step": 19335, "epoch": 159} {"train_loss": -27.318716049194336, "global_step": 19336, "epoch": 159} {"train_loss": -28.229536056518555, "global_step": 19337, "epoch": 159} {"train_loss": -28.890928268432617, "global_step": 19338, "epoch": 159} {"train_loss": -28.095855712890625, "global_step": 19339, "epoch": 159} {"train_loss": -28.0546817779541, "global_step": 19340, "epoch": 159} {"train_loss": -28.611730575561523, "global_step": 19341, "epoch": 159} {"train_loss": -28.10772705078125, "global_step": 19342, "epoch": 159} {"train_loss": -28.146915435791016, "global_step": 19343, "epoch": 159} {"train_loss": -28.701648712158203, "global_step": 19344, "epoch": 159} {"train_loss": -28.593915939331055, "global_step": 19345, "epoch": 159} {"train_loss": -28.013031005859375, "global_step": 19346, "epoch": 159} {"train_loss": -28.545185089111328, "global_step": 19347, "epoch": 159} {"train_loss": -28.745258331298828, "global_step": 19348, "epoch": 159} {"train_loss": -28.83619499206543, "global_step": 19349, "epoch": 159} {"train_loss": -28.628427505493164, "global_step": 19350, "epoch": 159} {"train_loss": -28.73158073425293, "global_step": 19351, "epoch": 159} {"train_loss": -28.649084091186523, "global_step": 19352, "epoch": 159} {"train_loss": -28.993574142456055, "global_step": 19353, "epoch": 159} {"train_loss": -29.093433380126953, "global_step": 19354, "epoch": 159} {"train_loss": -28.7906494140625, "global_step": 19355, "epoch": 159} {"train_loss": -29.0290470123291, "global_step": 19356, "epoch": 159} {"train_loss": -28.901548385620117, "global_step": 19357, "epoch": 159} {"train_loss": -29.008529663085938, "global_step": 19358, "epoch": 159} {"train_loss": -28.21685929337809, "global_step": 19359, "epoch": 159, "val_loss": 2755113.25} {"train_loss": -29.25345230102539, "global_step": 19360, "epoch": 160} {"train_loss": -29.22625732421875, "global_step": 19361, "epoch": 160} {"train_loss": -28.924041748046875, "global_step": 19362, "epoch": 160} {"train_loss": -29.49456214904785, "global_step": 19363, "epoch": 160} {"train_loss": -29.007232666015625, "global_step": 19364, "epoch": 160} {"train_loss": -29.03179931640625, "global_step": 19365, "epoch": 160} {"train_loss": -29.160755157470703, "global_step": 19366, "epoch": 160} {"train_loss": -28.98553466796875, "global_step": 19367, "epoch": 160} {"train_loss": -28.661548614501953, "global_step": 19368, "epoch": 160} {"train_loss": -28.99177360534668, "global_step": 19369, "epoch": 160} {"train_loss": -28.5233211517334, "global_step": 19370, "epoch": 160} {"train_loss": -27.97218132019043, "global_step": 19371, "epoch": 160} {"train_loss": -28.16554069519043, "global_step": 19372, "epoch": 160} {"train_loss": -27.751678466796875, "global_step": 19373, "epoch": 160} {"train_loss": -27.029769897460938, "global_step": 19374, "epoch": 160} {"train_loss": -26.289426803588867, "global_step": 19375, "epoch": 160} {"train_loss": -23.566190719604492, "global_step": 19376, "epoch": 160} {"train_loss": -21.64839744567871, "global_step": 19377, "epoch": 160} {"train_loss": -28.31400489807129, "global_step": 19378, "epoch": 160} {"train_loss": -24.422863006591797, "global_step": 19379, "epoch": 160} {"train_loss": -27.021459579467773, "global_step": 19380, "epoch": 160} {"train_loss": -27.70701026916504, "global_step": 19381, "epoch": 160} {"train_loss": -27.01930046081543, "global_step": 19382, "epoch": 160} {"train_loss": -26.7644100189209, "global_step": 19383, "epoch": 160} {"train_loss": -27.60935401916504, "global_step": 19384, "epoch": 160} {"train_loss": -27.534116744995117, "global_step": 19385, "epoch": 160} {"train_loss": -28.368383407592773, "global_step": 19386, "epoch": 160} {"train_loss": -27.497770309448242, "global_step": 19387, "epoch": 160} {"train_loss": -28.037710189819336, "global_step": 19388, "epoch": 160} {"train_loss": -27.84522819519043, "global_step": 19389, "epoch": 160} {"train_loss": -28.253921508789062, "global_step": 19390, "epoch": 160} {"train_loss": -28.45148277282715, "global_step": 19391, "epoch": 160} {"train_loss": -28.050241470336914, "global_step": 19392, "epoch": 160} {"train_loss": -28.058216094970703, "global_step": 19393, "epoch": 160} {"train_loss": -28.5310115814209, "global_step": 19394, "epoch": 160} {"train_loss": -28.4840030670166, "global_step": 19395, "epoch": 160} {"train_loss": -28.30133056640625, "global_step": 19396, "epoch": 160} {"train_loss": -28.58111572265625, "global_step": 19397, "epoch": 160} {"train_loss": -28.520008087158203, "global_step": 19398, "epoch": 160} {"train_loss": -28.32525062561035, "global_step": 19399, "epoch": 160} {"train_loss": -28.279809951782227, "global_step": 19400, "epoch": 160} {"train_loss": -28.57693862915039, "global_step": 19401, "epoch": 160} {"train_loss": -28.352445602416992, "global_step": 19402, "epoch": 160} {"train_loss": -28.2418270111084, "global_step": 19403, "epoch": 160} {"train_loss": -28.473968505859375, "global_step": 19404, "epoch": 160} {"train_loss": -28.476520538330078, "global_step": 19405, "epoch": 160} {"train_loss": -28.741907119750977, "global_step": 19406, "epoch": 160} {"train_loss": -29.025644302368164, "global_step": 19407, "epoch": 160} {"train_loss": -28.853124618530273, "global_step": 19408, "epoch": 160} {"train_loss": -28.758106231689453, "global_step": 19409, "epoch": 160} {"train_loss": -28.697254180908203, "global_step": 19410, "epoch": 160} {"train_loss": -28.734731674194336, "global_step": 19411, "epoch": 160} {"train_loss": -28.806610107421875, "global_step": 19412, "epoch": 160} {"train_loss": -28.980356216430664, "global_step": 19413, "epoch": 160} {"train_loss": -29.184194564819336, "global_step": 19414, "epoch": 160} {"train_loss": -29.16792106628418, "global_step": 19415, "epoch": 160} {"train_loss": -29.14546012878418, "global_step": 19416, "epoch": 160} {"train_loss": -29.352807998657227, "global_step": 19417, "epoch": 160} {"train_loss": -29.283599853515625, "global_step": 19418, "epoch": 160} {"train_loss": -29.427703857421875, "global_step": 19419, "epoch": 160} {"train_loss": -29.39591407775879, "global_step": 19420, "epoch": 160} {"train_loss": -29.293354034423828, "global_step": 19421, "epoch": 160} {"train_loss": -29.34527015686035, "global_step": 19422, "epoch": 160} {"train_loss": -28.933246612548828, "global_step": 19423, "epoch": 160} {"train_loss": -29.36997413635254, "global_step": 19424, "epoch": 160} {"train_loss": -29.33905601501465, "global_step": 19425, "epoch": 160} {"train_loss": -29.43635368347168, "global_step": 19426, "epoch": 160} {"train_loss": -29.569568634033203, "global_step": 19427, "epoch": 160} {"train_loss": -29.395370483398438, "global_step": 19428, "epoch": 160} {"train_loss": -29.632837295532227, "global_step": 19429, "epoch": 160} {"train_loss": -29.10737419128418, "global_step": 19430, "epoch": 160} {"train_loss": -29.445667266845703, "global_step": 19431, "epoch": 160} {"train_loss": -28.88591957092285, "global_step": 19432, "epoch": 160} {"train_loss": -28.736530303955078, "global_step": 19433, "epoch": 160} {"train_loss": -29.372278213500977, "global_step": 19434, "epoch": 160} {"train_loss": -29.700403213500977, "global_step": 19435, "epoch": 160} {"train_loss": -28.97028160095215, "global_step": 19436, "epoch": 160} {"train_loss": -29.58040428161621, "global_step": 19437, "epoch": 160} {"train_loss": -29.741254806518555, "global_step": 19438, "epoch": 160} {"train_loss": -28.86972427368164, "global_step": 19439, "epoch": 160} {"train_loss": -29.707706451416016, "global_step": 19440, "epoch": 160} {"train_loss": -29.472387313842773, "global_step": 19441, "epoch": 160} {"train_loss": -29.552356719970703, "global_step": 19442, "epoch": 160} {"train_loss": -29.154882431030273, "global_step": 19443, "epoch": 160} {"train_loss": -28.875, "global_step": 19444, "epoch": 160} {"train_loss": -29.512958526611328, "global_step": 19445, "epoch": 160} {"train_loss": -29.71510887145996, "global_step": 19446, "epoch": 160} {"train_loss": -29.557025909423828, "global_step": 19447, "epoch": 160} {"train_loss": -29.58664321899414, "global_step": 19448, "epoch": 160} {"train_loss": -28.857885360717773, "global_step": 19449, "epoch": 160} {"train_loss": -28.49772071838379, "global_step": 19450, "epoch": 160} {"train_loss": -29.382299423217773, "global_step": 19451, "epoch": 160} {"train_loss": -29.323511123657227, "global_step": 19452, "epoch": 160} {"train_loss": -28.18108558654785, "global_step": 19453, "epoch": 160} {"train_loss": -28.0487003326416, "global_step": 19454, "epoch": 160} {"train_loss": -28.119428634643555, "global_step": 19455, "epoch": 160} {"train_loss": -28.55536460876465, "global_step": 19456, "epoch": 160} {"train_loss": -28.0494384765625, "global_step": 19457, "epoch": 160} {"train_loss": -27.775625228881836, "global_step": 19458, "epoch": 160} {"train_loss": -28.26836585998535, "global_step": 19459, "epoch": 160} {"train_loss": -28.238250732421875, "global_step": 19460, "epoch": 160} {"train_loss": -29.11588478088379, "global_step": 19461, "epoch": 160} {"train_loss": -28.175262451171875, "global_step": 19462, "epoch": 160} {"train_loss": -29.564050674438477, "global_step": 19463, "epoch": 160} {"train_loss": -27.13092613220215, "global_step": 19464, "epoch": 160} {"train_loss": -28.49161148071289, "global_step": 19465, "epoch": 160} {"train_loss": -28.719989776611328, "global_step": 19466, "epoch": 160} {"train_loss": -28.68006706237793, "global_step": 19467, "epoch": 160} {"train_loss": -29.074146270751953, "global_step": 19468, "epoch": 160} {"train_loss": -28.837202072143555, "global_step": 19469, "epoch": 160} {"train_loss": -29.418798446655273, "global_step": 19470, "epoch": 160} {"train_loss": -28.858356475830078, "global_step": 19471, "epoch": 160} {"train_loss": -29.0700740814209, "global_step": 19472, "epoch": 160} {"train_loss": -29.62883949279785, "global_step": 19473, "epoch": 160} {"train_loss": -29.08782958984375, "global_step": 19474, "epoch": 160} {"train_loss": -29.35052490234375, "global_step": 19475, "epoch": 160} {"train_loss": -29.845184326171875, "global_step": 19476, "epoch": 160} {"train_loss": -29.22669792175293, "global_step": 19477, "epoch": 160} {"train_loss": -29.55281639099121, "global_step": 19478, "epoch": 160} {"train_loss": -29.576169967651367, "global_step": 19479, "epoch": 160} {"train_loss": -28.62400384382768, "global_step": 19480, "epoch": 160, "val_loss": 2611668.0} {"train_loss": -29.39031410217285, "global_step": 19481, "epoch": 161} {"train_loss": -29.676748275756836, "global_step": 19482, "epoch": 161} {"train_loss": -29.498376846313477, "global_step": 19483, "epoch": 161} {"train_loss": -29.89363670349121, "global_step": 19484, "epoch": 161} {"train_loss": -29.011322021484375, "global_step": 19485, "epoch": 161} {"train_loss": -29.561025619506836, "global_step": 19486, "epoch": 161} {"train_loss": -29.744916915893555, "global_step": 19487, "epoch": 161} {"train_loss": -29.6141357421875, "global_step": 19488, "epoch": 161} {"train_loss": -29.519704818725586, "global_step": 19489, "epoch": 161} {"train_loss": -29.72623062133789, "global_step": 19490, "epoch": 161} {"train_loss": -29.5943603515625, "global_step": 19491, "epoch": 161} {"train_loss": -29.82704734802246, "global_step": 19492, "epoch": 161} {"train_loss": -30.00673484802246, "global_step": 19493, "epoch": 161} {"train_loss": -29.681842803955078, "global_step": 19494, "epoch": 161} {"train_loss": -29.580358505249023, "global_step": 19495, "epoch": 161} {"train_loss": -29.074451446533203, "global_step": 19496, "epoch": 161} {"train_loss": -29.630102157592773, "global_step": 19497, "epoch": 161} {"train_loss": -29.61321449279785, "global_step": 19498, "epoch": 161} {"train_loss": -28.8078670501709, "global_step": 19499, "epoch": 161} {"train_loss": -30.001596450805664, "global_step": 19500, "epoch": 161} {"train_loss": -29.506641387939453, "global_step": 19501, "epoch": 161} {"train_loss": -28.915771484375, "global_step": 19502, "epoch": 161} {"train_loss": -29.717004776000977, "global_step": 19503, "epoch": 161} {"train_loss": -29.319721221923828, "global_step": 19504, "epoch": 161} {"train_loss": -29.781269073486328, "global_step": 19505, "epoch": 161} {"train_loss": -29.631452560424805, "global_step": 19506, "epoch": 161} {"train_loss": -29.5750675201416, "global_step": 19507, "epoch": 161} {"train_loss": -29.062726974487305, "global_step": 19508, "epoch": 161} {"train_loss": -28.60493278503418, "global_step": 19509, "epoch": 161} {"train_loss": -30.038623809814453, "global_step": 19510, "epoch": 161} {"train_loss": -29.242822647094727, "global_step": 19511, "epoch": 161} {"train_loss": -29.539392471313477, "global_step": 19512, "epoch": 161} {"train_loss": -29.245283126831055, "global_step": 19513, "epoch": 161} {"train_loss": -28.575300216674805, "global_step": 19514, "epoch": 161} {"train_loss": -26.61380386352539, "global_step": 19515, "epoch": 161} {"train_loss": -22.409255981445312, "global_step": 19516, "epoch": 161} {"train_loss": -22.1221866607666, "global_step": 19517, "epoch": 161} {"train_loss": -25.27982521057129, "global_step": 19518, "epoch": 161} {"train_loss": -28.95758056640625, "global_step": 19519, "epoch": 161} {"train_loss": -26.636621475219727, "global_step": 19520, "epoch": 161} {"train_loss": -28.855688095092773, "global_step": 19521, "epoch": 161} {"train_loss": -28.593488693237305, "global_step": 19522, "epoch": 161} {"train_loss": -27.71492576599121, "global_step": 19523, "epoch": 161} {"train_loss": -29.335712432861328, "global_step": 19524, "epoch": 161} {"train_loss": -28.31318473815918, "global_step": 19525, "epoch": 161} {"train_loss": -28.386966705322266, "global_step": 19526, "epoch": 161} {"train_loss": -28.709863662719727, "global_step": 19527, "epoch": 161} {"train_loss": -29.25678062438965, "global_step": 19528, "epoch": 161} {"train_loss": -28.68841552734375, "global_step": 19529, "epoch": 161} {"train_loss": -28.558874130249023, "global_step": 19530, "epoch": 161} {"train_loss": -29.248458862304688, "global_step": 19531, "epoch": 161} {"train_loss": -29.564136505126953, "global_step": 19532, "epoch": 161} {"train_loss": -29.251188278198242, "global_step": 19533, "epoch": 161} {"train_loss": -28.753992080688477, "global_step": 19534, "epoch": 161} {"train_loss": -29.416791915893555, "global_step": 19535, "epoch": 161} {"train_loss": -29.452301025390625, "global_step": 19536, "epoch": 161} {"train_loss": -29.434778213500977, "global_step": 19537, "epoch": 161} {"train_loss": -29.587026596069336, "global_step": 19538, "epoch": 161} {"train_loss": -29.600967407226562, "global_step": 19539, "epoch": 161} {"train_loss": -29.403751373291016, "global_step": 19540, "epoch": 161} {"train_loss": -29.59039306640625, "global_step": 19541, "epoch": 161} {"train_loss": -29.306180953979492, "global_step": 19542, "epoch": 161} {"train_loss": -29.539154052734375, "global_step": 19543, "epoch": 161} {"train_loss": -29.582666397094727, "global_step": 19544, "epoch": 161} {"train_loss": -29.79104995727539, "global_step": 19545, "epoch": 161} {"train_loss": -29.341882705688477, "global_step": 19546, "epoch": 161} {"train_loss": -29.809619903564453, "global_step": 19547, "epoch": 161} {"train_loss": -29.525785446166992, "global_step": 19548, "epoch": 161} {"train_loss": -29.84662437438965, "global_step": 19549, "epoch": 161} {"train_loss": -29.054357528686523, "global_step": 19550, "epoch": 161} {"train_loss": -28.4031925201416, "global_step": 19551, "epoch": 161} {"train_loss": -26.394046783447266, "global_step": 19552, "epoch": 161} {"train_loss": -24.200214385986328, "global_step": 19553, "epoch": 161} {"train_loss": -25.36073875427246, "global_step": 19554, "epoch": 161} {"train_loss": -27.516077041625977, "global_step": 19555, "epoch": 161} {"train_loss": -29.226465225219727, "global_step": 19556, "epoch": 161} {"train_loss": -28.620380401611328, "global_step": 19557, "epoch": 161} {"train_loss": -28.213083267211914, "global_step": 19558, "epoch": 161} {"train_loss": -29.50496482849121, "global_step": 19559, "epoch": 161} {"train_loss": -28.999103546142578, "global_step": 19560, "epoch": 161} {"train_loss": -29.98858070373535, "global_step": 19561, "epoch": 161} {"train_loss": -28.83369255065918, "global_step": 19562, "epoch": 161} {"train_loss": -29.566120147705078, "global_step": 19563, "epoch": 161} {"train_loss": -28.90321922302246, "global_step": 19564, "epoch": 161} {"train_loss": -28.950788497924805, "global_step": 19565, "epoch": 161} {"train_loss": -29.0396671295166, "global_step": 19566, "epoch": 161} {"train_loss": -29.619129180908203, "global_step": 19567, "epoch": 161} {"train_loss": -28.926523208618164, "global_step": 19568, "epoch": 161} {"train_loss": -29.251977920532227, "global_step": 19569, "epoch": 161} {"train_loss": -29.34199333190918, "global_step": 19570, "epoch": 161} {"train_loss": -29.602542877197266, "global_step": 19571, "epoch": 161} {"train_loss": -29.213239669799805, "global_step": 19572, "epoch": 161} {"train_loss": -28.970123291015625, "global_step": 19573, "epoch": 161} {"train_loss": -28.972900390625, "global_step": 19574, "epoch": 161} {"train_loss": -29.101932525634766, "global_step": 19575, "epoch": 161} {"train_loss": -29.006567001342773, "global_step": 19576, "epoch": 161} {"train_loss": -28.684528350830078, "global_step": 19577, "epoch": 161} {"train_loss": -29.550521850585938, "global_step": 19578, "epoch": 161} {"train_loss": -29.295995712280273, "global_step": 19579, "epoch": 161} {"train_loss": -29.260761260986328, "global_step": 19580, "epoch": 161} {"train_loss": -29.053730010986328, "global_step": 19581, "epoch": 161} {"train_loss": -29.040225982666016, "global_step": 19582, "epoch": 161} {"train_loss": -28.747465133666992, "global_step": 19583, "epoch": 161} {"train_loss": -28.398761749267578, "global_step": 19584, "epoch": 161} {"train_loss": -26.682554244995117, "global_step": 19585, "epoch": 161} {"train_loss": -23.524259567260742, "global_step": 19586, "epoch": 161} {"train_loss": -23.926025390625, "global_step": 19587, "epoch": 161} {"train_loss": -28.704259872436523, "global_step": 19588, "epoch": 161} {"train_loss": -28.711135864257812, "global_step": 19589, "epoch": 161} {"train_loss": -26.562225341796875, "global_step": 19590, "epoch": 161} {"train_loss": -28.7777156829834, "global_step": 19591, "epoch": 161} {"train_loss": -27.67694091796875, "global_step": 19592, "epoch": 161} {"train_loss": -28.773426055908203, "global_step": 19593, "epoch": 161} {"train_loss": -27.9747314453125, "global_step": 19594, "epoch": 161} {"train_loss": -29.28936195373535, "global_step": 19595, "epoch": 161} {"train_loss": -28.463672637939453, "global_step": 19596, "epoch": 161} {"train_loss": -29.087244033813477, "global_step": 19597, "epoch": 161} {"train_loss": -29.256101608276367, "global_step": 19598, "epoch": 161} {"train_loss": -29.59465980529785, "global_step": 19599, "epoch": 161} {"train_loss": -29.188339233398438, "global_step": 19600, "epoch": 161} {"train_loss": -28.769706599968526, "global_step": 19601, "epoch": 161, "val_loss": 2562663.0} {"train_loss": -28.576736450195312, "global_step": 19602, "epoch": 162} {"train_loss": -28.92885398864746, "global_step": 19603, "epoch": 162} {"train_loss": -29.083160400390625, "global_step": 19604, "epoch": 162} {"train_loss": -29.297094345092773, "global_step": 19605, "epoch": 162} {"train_loss": -28.870878219604492, "global_step": 19606, "epoch": 162} {"train_loss": -29.148046493530273, "global_step": 19607, "epoch": 162} {"train_loss": -29.28656578063965, "global_step": 19608, "epoch": 162} {"train_loss": -28.789342880249023, "global_step": 19609, "epoch": 162} {"train_loss": -29.62647819519043, "global_step": 19610, "epoch": 162} {"train_loss": -29.182098388671875, "global_step": 19611, "epoch": 162} {"train_loss": -29.49262046813965, "global_step": 19612, "epoch": 162} {"train_loss": -29.57952308654785, "global_step": 19613, "epoch": 162} {"train_loss": -28.659406661987305, "global_step": 19614, "epoch": 162} {"train_loss": -29.1889705657959, "global_step": 19615, "epoch": 162} {"train_loss": -29.501745223999023, "global_step": 19616, "epoch": 162} {"train_loss": -29.28948402404785, "global_step": 19617, "epoch": 162} {"train_loss": -29.556915283203125, "global_step": 19618, "epoch": 162} {"train_loss": -29.401596069335938, "global_step": 19619, "epoch": 162} {"train_loss": -29.65641212463379, "global_step": 19620, "epoch": 162} {"train_loss": -29.883344650268555, "global_step": 19621, "epoch": 162} {"train_loss": -29.465036392211914, "global_step": 19622, "epoch": 162} {"train_loss": -29.982404708862305, "global_step": 19623, "epoch": 162} {"train_loss": -29.79315757751465, "global_step": 19624, "epoch": 162} {"train_loss": -29.59772300720215, "global_step": 19625, "epoch": 162} {"train_loss": -29.90032386779785, "global_step": 19626, "epoch": 162} {"train_loss": -29.671173095703125, "global_step": 19627, "epoch": 162} {"train_loss": -30.138315200805664, "global_step": 19628, "epoch": 162} {"train_loss": -29.4968318939209, "global_step": 19629, "epoch": 162} {"train_loss": -30.496259689331055, "global_step": 19630, "epoch": 162} {"train_loss": -30.079742431640625, "global_step": 19631, "epoch": 162} {"train_loss": -30.402799606323242, "global_step": 19632, "epoch": 162} {"train_loss": -29.898706436157227, "global_step": 19633, "epoch": 162} {"train_loss": -30.1611270904541, "global_step": 19634, "epoch": 162} {"train_loss": -29.893102645874023, "global_step": 19635, "epoch": 162} {"train_loss": -29.791229248046875, "global_step": 19636, "epoch": 162} {"train_loss": -29.741540908813477, "global_step": 19637, "epoch": 162} {"train_loss": -29.709487915039062, "global_step": 19638, "epoch": 162} {"train_loss": -29.4310302734375, "global_step": 19639, "epoch": 162} {"train_loss": -29.076751708984375, "global_step": 19640, "epoch": 162} {"train_loss": -28.44834327697754, "global_step": 19641, "epoch": 162} {"train_loss": -27.47258949279785, "global_step": 19642, "epoch": 162} {"train_loss": -27.4378604888916, "global_step": 19643, "epoch": 162} {"train_loss": -25.418542861938477, "global_step": 19644, "epoch": 162} {"train_loss": -25.8338623046875, "global_step": 19645, "epoch": 162} {"train_loss": -28.497867584228516, "global_step": 19646, "epoch": 162} {"train_loss": -28.86543846130371, "global_step": 19647, "epoch": 162} {"train_loss": -29.3022518157959, "global_step": 19648, "epoch": 162} {"train_loss": -28.710798263549805, "global_step": 19649, "epoch": 162} {"train_loss": -29.14542007446289, "global_step": 19650, "epoch": 162} {"train_loss": -29.480661392211914, "global_step": 19651, "epoch": 162} {"train_loss": -28.28778076171875, "global_step": 19652, "epoch": 162} {"train_loss": -29.491506576538086, "global_step": 19653, "epoch": 162} {"train_loss": -28.645217895507812, "global_step": 19654, "epoch": 162} {"train_loss": -29.4039249420166, "global_step": 19655, "epoch": 162} {"train_loss": -29.443891525268555, "global_step": 19656, "epoch": 162} {"train_loss": -29.160924911499023, "global_step": 19657, "epoch": 162} {"train_loss": -29.212085723876953, "global_step": 19658, "epoch": 162} {"train_loss": -29.463947296142578, "global_step": 19659, "epoch": 162} {"train_loss": -29.433359146118164, "global_step": 19660, "epoch": 162} {"train_loss": -29.37298011779785, "global_step": 19661, "epoch": 162} {"train_loss": -29.520898818969727, "global_step": 19662, "epoch": 162} {"train_loss": -29.312469482421875, "global_step": 19663, "epoch": 162} {"train_loss": -29.271753311157227, "global_step": 19664, "epoch": 162} {"train_loss": -29.872114181518555, "global_step": 19665, "epoch": 162} {"train_loss": -29.410898208618164, "global_step": 19666, "epoch": 162} {"train_loss": -29.67853355407715, "global_step": 19667, "epoch": 162} {"train_loss": -29.537586212158203, "global_step": 19668, "epoch": 162} {"train_loss": -29.99054527282715, "global_step": 19669, "epoch": 162} {"train_loss": -29.799665451049805, "global_step": 19670, "epoch": 162} {"train_loss": -29.446008682250977, "global_step": 19671, "epoch": 162} {"train_loss": -29.504291534423828, "global_step": 19672, "epoch": 162} {"train_loss": -28.638477325439453, "global_step": 19673, "epoch": 162} {"train_loss": -30.052465438842773, "global_step": 19674, "epoch": 162} {"train_loss": -28.882892608642578, "global_step": 19675, "epoch": 162} {"train_loss": -29.79339027404785, "global_step": 19676, "epoch": 162} {"train_loss": -29.551513671875, "global_step": 19677, "epoch": 162} {"train_loss": -29.560379028320312, "global_step": 19678, "epoch": 162} {"train_loss": -29.819217681884766, "global_step": 19679, "epoch": 162} {"train_loss": -29.815250396728516, "global_step": 19680, "epoch": 162} {"train_loss": -30.250320434570312, "global_step": 19681, "epoch": 162} {"train_loss": -30.134963989257812, "global_step": 19682, "epoch": 162} {"train_loss": -30.021759033203125, "global_step": 19683, "epoch": 162} {"train_loss": -29.96375846862793, "global_step": 19684, "epoch": 162} {"train_loss": -29.684045791625977, "global_step": 19685, "epoch": 162} {"train_loss": -29.813461303710938, "global_step": 19686, "epoch": 162} {"train_loss": -29.844022750854492, "global_step": 19687, "epoch": 162} {"train_loss": -29.951160430908203, "global_step": 19688, "epoch": 162} {"train_loss": -30.07927894592285, "global_step": 19689, "epoch": 162} {"train_loss": -30.255685806274414, "global_step": 19690, "epoch": 162} {"train_loss": -29.49590492248535, "global_step": 19691, "epoch": 162} {"train_loss": -30.381738662719727, "global_step": 19692, "epoch": 162} {"train_loss": -29.28315544128418, "global_step": 19693, "epoch": 162} {"train_loss": -29.6359806060791, "global_step": 19694, "epoch": 162} {"train_loss": -29.069671630859375, "global_step": 19695, "epoch": 162} {"train_loss": -29.327993392944336, "global_step": 19696, "epoch": 162} {"train_loss": -29.486974716186523, "global_step": 19697, "epoch": 162} {"train_loss": -29.003005981445312, "global_step": 19698, "epoch": 162} {"train_loss": -28.455291748046875, "global_step": 19699, "epoch": 162} {"train_loss": -26.848093032836914, "global_step": 19700, "epoch": 162} {"train_loss": -28.848737716674805, "global_step": 19701, "epoch": 162} {"train_loss": -22.29216766357422, "global_step": 19702, "epoch": 162} {"train_loss": -28.248321533203125, "global_step": 19703, "epoch": 162} {"train_loss": -24.16028594970703, "global_step": 19704, "epoch": 162} {"train_loss": -26.9754638671875, "global_step": 19705, "epoch": 162} {"train_loss": -28.289447784423828, "global_step": 19706, "epoch": 162} {"train_loss": -28.0975284576416, "global_step": 19707, "epoch": 162} {"train_loss": -27.7955322265625, "global_step": 19708, "epoch": 162} {"train_loss": -29.68548011779785, "global_step": 19709, "epoch": 162} {"train_loss": -28.821380615234375, "global_step": 19710, "epoch": 162} {"train_loss": -28.450408935546875, "global_step": 19711, "epoch": 162} {"train_loss": -28.83526039123535, "global_step": 19712, "epoch": 162} {"train_loss": -29.789392471313477, "global_step": 19713, "epoch": 162} {"train_loss": -29.2198543548584, "global_step": 19714, "epoch": 162} {"train_loss": -29.102991104125977, "global_step": 19715, "epoch": 162} {"train_loss": -29.509801864624023, "global_step": 19716, "epoch": 162} {"train_loss": -29.163726806640625, "global_step": 19717, "epoch": 162} {"train_loss": -29.79204750061035, "global_step": 19718, "epoch": 162} {"train_loss": -29.28542137145996, "global_step": 19719, "epoch": 162} {"train_loss": -29.994338989257812, "global_step": 19720, "epoch": 162} {"train_loss": -29.269092559814453, "global_step": 19721, "epoch": 162} {"train_loss": -29.17199666046899, "global_step": 19722, "epoch": 162, "val_loss": 2629335.75} {"train_loss": -29.473508834838867, "global_step": 19723, "epoch": 163} {"train_loss": -29.221435546875, "global_step": 19724, "epoch": 163} {"train_loss": -29.683094024658203, "global_step": 19725, "epoch": 163} {"train_loss": -29.11280632019043, "global_step": 19726, "epoch": 163} {"train_loss": -29.830738067626953, "global_step": 19727, "epoch": 163} {"train_loss": -29.7282657623291, "global_step": 19728, "epoch": 163} {"train_loss": -29.390811920166016, "global_step": 19729, "epoch": 163} {"train_loss": -29.92976188659668, "global_step": 19730, "epoch": 163} {"train_loss": -29.3529109954834, "global_step": 19731, "epoch": 163} {"train_loss": -29.4393310546875, "global_step": 19732, "epoch": 163} {"train_loss": -29.434858322143555, "global_step": 19733, "epoch": 163} {"train_loss": -29.41314697265625, "global_step": 19734, "epoch": 163} {"train_loss": -29.708942413330078, "global_step": 19735, "epoch": 163} {"train_loss": -29.14971351623535, "global_step": 19736, "epoch": 163} {"train_loss": -29.095245361328125, "global_step": 19737, "epoch": 163} {"train_loss": -29.676132202148438, "global_step": 19738, "epoch": 163} {"train_loss": -29.2374267578125, "global_step": 19739, "epoch": 163} {"train_loss": -28.9965763092041, "global_step": 19740, "epoch": 163} {"train_loss": -29.72466468811035, "global_step": 19741, "epoch": 163} {"train_loss": -29.491958618164062, "global_step": 19742, "epoch": 163} {"train_loss": -28.31387710571289, "global_step": 19743, "epoch": 163} {"train_loss": -27.81049919128418, "global_step": 19744, "epoch": 163} {"train_loss": -29.453094482421875, "global_step": 19745, "epoch": 163} {"train_loss": -29.1248779296875, "global_step": 19746, "epoch": 163} {"train_loss": -28.317291259765625, "global_step": 19747, "epoch": 163} {"train_loss": -28.862943649291992, "global_step": 19748, "epoch": 163} {"train_loss": -28.945444107055664, "global_step": 19749, "epoch": 163} {"train_loss": -29.16236686706543, "global_step": 19750, "epoch": 163} {"train_loss": -28.714391708374023, "global_step": 19751, "epoch": 163} {"train_loss": -28.574787139892578, "global_step": 19752, "epoch": 163} {"train_loss": -28.35724449157715, "global_step": 19753, "epoch": 163} {"train_loss": -27.713153839111328, "global_step": 19754, "epoch": 163} {"train_loss": -28.065946578979492, "global_step": 19755, "epoch": 163} {"train_loss": -27.0786075592041, "global_step": 19756, "epoch": 163} {"train_loss": -28.362274169921875, "global_step": 19757, "epoch": 163} {"train_loss": -29.219472885131836, "global_step": 19758, "epoch": 163} {"train_loss": -28.882232666015625, "global_step": 19759, "epoch": 163} {"train_loss": -29.863122940063477, "global_step": 19760, "epoch": 163} {"train_loss": -29.164915084838867, "global_step": 19761, "epoch": 163} {"train_loss": -29.321063995361328, "global_step": 19762, "epoch": 163} {"train_loss": -29.27280616760254, "global_step": 19763, "epoch": 163} {"train_loss": -29.032636642456055, "global_step": 19764, "epoch": 163} {"train_loss": -29.21451759338379, "global_step": 19765, "epoch": 163} {"train_loss": -29.511367797851562, "global_step": 19766, "epoch": 163} {"train_loss": -29.003305435180664, "global_step": 19767, "epoch": 163} {"train_loss": -29.456701278686523, "global_step": 19768, "epoch": 163} {"train_loss": -28.97574806213379, "global_step": 19769, "epoch": 163} {"train_loss": -29.76741600036621, "global_step": 19770, "epoch": 163} {"train_loss": -29.04102897644043, "global_step": 19771, "epoch": 163} {"train_loss": -29.1484432220459, "global_step": 19772, "epoch": 163} {"train_loss": -29.170989990234375, "global_step": 19773, "epoch": 163} {"train_loss": -29.25909996032715, "global_step": 19774, "epoch": 163} {"train_loss": -29.687047958374023, "global_step": 19775, "epoch": 163} {"train_loss": -29.76938819885254, "global_step": 19776, "epoch": 163} {"train_loss": -29.725683212280273, "global_step": 19777, "epoch": 163} {"train_loss": -29.79390525817871, "global_step": 19778, "epoch": 163} {"train_loss": -29.624067306518555, "global_step": 19779, "epoch": 163} {"train_loss": -29.713891983032227, "global_step": 19780, "epoch": 163} {"train_loss": -29.51087760925293, "global_step": 19781, "epoch": 163} {"train_loss": -29.747045516967773, "global_step": 19782, "epoch": 163} {"train_loss": -29.80487060546875, "global_step": 19783, "epoch": 163} {"train_loss": -30.321638107299805, "global_step": 19784, "epoch": 163} {"train_loss": -29.66511344909668, "global_step": 19785, "epoch": 163} {"train_loss": -29.452844619750977, "global_step": 19786, "epoch": 163} {"train_loss": -29.052160263061523, "global_step": 19787, "epoch": 163} {"train_loss": -29.069059371948242, "global_step": 19788, "epoch": 163} {"train_loss": -28.618268966674805, "global_step": 19789, "epoch": 163} {"train_loss": -27.934162139892578, "global_step": 19790, "epoch": 163} {"train_loss": -29.179672241210938, "global_step": 19791, "epoch": 163} {"train_loss": -29.641286849975586, "global_step": 19792, "epoch": 163} {"train_loss": -28.524005889892578, "global_step": 19793, "epoch": 163} {"train_loss": -28.668561935424805, "global_step": 19794, "epoch": 163} {"train_loss": -28.58089256286621, "global_step": 19795, "epoch": 163} {"train_loss": -26.05426597595215, "global_step": 19796, "epoch": 163} {"train_loss": -29.243988037109375, "global_step": 19797, "epoch": 163} {"train_loss": -29.4581241607666, "global_step": 19798, "epoch": 163} {"train_loss": -28.090808868408203, "global_step": 19799, "epoch": 163} {"train_loss": -28.352008819580078, "global_step": 19800, "epoch": 163} {"train_loss": -29.723230361938477, "global_step": 19801, "epoch": 163} {"train_loss": -28.65533447265625, "global_step": 19802, "epoch": 163} {"train_loss": -27.892841339111328, "global_step": 19803, "epoch": 163} {"train_loss": -29.431243896484375, "global_step": 19804, "epoch": 163} {"train_loss": -28.89426040649414, "global_step": 19805, "epoch": 163} {"train_loss": -28.011707305908203, "global_step": 19806, "epoch": 163} {"train_loss": -29.87286376953125, "global_step": 19807, "epoch": 163} {"train_loss": -29.044214248657227, "global_step": 19808, "epoch": 163} {"train_loss": -29.61470603942871, "global_step": 19809, "epoch": 163} {"train_loss": -29.302921295166016, "global_step": 19810, "epoch": 163} {"train_loss": -29.214279174804688, "global_step": 19811, "epoch": 163} {"train_loss": -29.87772560119629, "global_step": 19812, "epoch": 163} {"train_loss": -28.990270614624023, "global_step": 19813, "epoch": 163} {"train_loss": -29.643707275390625, "global_step": 19814, "epoch": 163} {"train_loss": -28.04680824279785, "global_step": 19815, "epoch": 163} {"train_loss": -25.227874755859375, "global_step": 19816, "epoch": 163} {"train_loss": -20.7414493560791, "global_step": 19817, "epoch": 163} {"train_loss": -24.109844207763672, "global_step": 19818, "epoch": 163} {"train_loss": -29.157730102539062, "global_step": 19819, "epoch": 163} {"train_loss": -27.701278686523438, "global_step": 19820, "epoch": 163} {"train_loss": -28.606536865234375, "global_step": 19821, "epoch": 163} {"train_loss": -28.3436222076416, "global_step": 19822, "epoch": 163} {"train_loss": -29.190839767456055, "global_step": 19823, "epoch": 163} {"train_loss": -28.437530517578125, "global_step": 19824, "epoch": 163} {"train_loss": -29.082258224487305, "global_step": 19825, "epoch": 163} {"train_loss": -29.190160751342773, "global_step": 19826, "epoch": 163} {"train_loss": -28.803924560546875, "global_step": 19827, "epoch": 163} {"train_loss": -28.808069229125977, "global_step": 19828, "epoch": 163} {"train_loss": -28.947345733642578, "global_step": 19829, "epoch": 163} {"train_loss": -29.2025089263916, "global_step": 19830, "epoch": 163} {"train_loss": -29.326452255249023, "global_step": 19831, "epoch": 163} {"train_loss": -29.169836044311523, "global_step": 19832, "epoch": 163} {"train_loss": -29.796873092651367, "global_step": 19833, "epoch": 163} {"train_loss": -28.89630126953125, "global_step": 19834, "epoch": 163} {"train_loss": -28.343542098999023, "global_step": 19835, "epoch": 163} {"train_loss": -28.632883071899414, "global_step": 19836, "epoch": 163} {"train_loss": -29.047454833984375, "global_step": 19837, "epoch": 163} {"train_loss": -29.384418487548828, "global_step": 19838, "epoch": 163} {"train_loss": -29.24627113342285, "global_step": 19839, "epoch": 163} {"train_loss": -28.721664428710938, "global_step": 19840, "epoch": 163} {"train_loss": -28.656774520874023, "global_step": 19841, "epoch": 163} {"train_loss": -28.620746612548828, "global_step": 19842, "epoch": 163} {"train_loss": -28.92095485403518, "global_step": 19843, "epoch": 163, "val_loss": 2561980.0} {"train_loss": -29.558887481689453, "global_step": 19844, "epoch": 164} {"train_loss": -29.544431686401367, "global_step": 19845, "epoch": 164} {"train_loss": -29.816492080688477, "global_step": 19846, "epoch": 164} {"train_loss": -29.345701217651367, "global_step": 19847, "epoch": 164} {"train_loss": -29.542892456054688, "global_step": 19848, "epoch": 164} {"train_loss": -29.345014572143555, "global_step": 19849, "epoch": 164} {"train_loss": -29.98628807067871, "global_step": 19850, "epoch": 164} {"train_loss": -29.151525497436523, "global_step": 19851, "epoch": 164} {"train_loss": -29.155933380126953, "global_step": 19852, "epoch": 164} {"train_loss": -28.94980812072754, "global_step": 19853, "epoch": 164} {"train_loss": -29.68096923828125, "global_step": 19854, "epoch": 164} {"train_loss": -29.768171310424805, "global_step": 19855, "epoch": 164} {"train_loss": -29.982181549072266, "global_step": 19856, "epoch": 164} {"train_loss": -29.69270133972168, "global_step": 19857, "epoch": 164} {"train_loss": -29.916828155517578, "global_step": 19858, "epoch": 164} {"train_loss": -29.791608810424805, "global_step": 19859, "epoch": 164} {"train_loss": -29.655689239501953, "global_step": 19860, "epoch": 164} {"train_loss": -29.522085189819336, "global_step": 19861, "epoch": 164} {"train_loss": -29.81183433532715, "global_step": 19862, "epoch": 164} {"train_loss": -29.494359970092773, "global_step": 19863, "epoch": 164} {"train_loss": -29.820514678955078, "global_step": 19864, "epoch": 164} {"train_loss": -29.289640426635742, "global_step": 19865, "epoch": 164} {"train_loss": -29.40707778930664, "global_step": 19866, "epoch": 164} {"train_loss": -29.03608512878418, "global_step": 19867, "epoch": 164} {"train_loss": -29.338672637939453, "global_step": 19868, "epoch": 164} {"train_loss": -29.845630645751953, "global_step": 19869, "epoch": 164} {"train_loss": -29.923505783081055, "global_step": 19870, "epoch": 164} {"train_loss": -29.74370765686035, "global_step": 19871, "epoch": 164} {"train_loss": -30.052017211914062, "global_step": 19872, "epoch": 164} {"train_loss": -30.047643661499023, "global_step": 19873, "epoch": 164} {"train_loss": -29.93397331237793, "global_step": 19874, "epoch": 164} {"train_loss": -30.271366119384766, "global_step": 19875, "epoch": 164} {"train_loss": -29.646860122680664, "global_step": 19876, "epoch": 164} {"train_loss": -29.634164810180664, "global_step": 19877, "epoch": 164} {"train_loss": -29.8964786529541, "global_step": 19878, "epoch": 164} {"train_loss": -29.278928756713867, "global_step": 19879, "epoch": 164} {"train_loss": -29.614593505859375, "global_step": 19880, "epoch": 164} {"train_loss": -29.96357536315918, "global_step": 19881, "epoch": 164} {"train_loss": -30.182031631469727, "global_step": 19882, "epoch": 164} {"train_loss": -29.326459884643555, "global_step": 19883, "epoch": 164} {"train_loss": -30.0882511138916, "global_step": 19884, "epoch": 164} {"train_loss": -30.1763916015625, "global_step": 19885, "epoch": 164} {"train_loss": -28.710351943969727, "global_step": 19886, "epoch": 164} {"train_loss": -28.997350692749023, "global_step": 19887, "epoch": 164} {"train_loss": -29.429807662963867, "global_step": 19888, "epoch": 164} {"train_loss": -29.585813522338867, "global_step": 19889, "epoch": 164} {"train_loss": -29.030378341674805, "global_step": 19890, "epoch": 164} {"train_loss": -29.73529624938965, "global_step": 19891, "epoch": 164} {"train_loss": -30.01220703125, "global_step": 19892, "epoch": 164} {"train_loss": -28.785968780517578, "global_step": 19893, "epoch": 164} {"train_loss": -29.93777847290039, "global_step": 19894, "epoch": 164} {"train_loss": -28.90247917175293, "global_step": 19895, "epoch": 164} {"train_loss": -29.2358455657959, "global_step": 19896, "epoch": 164} {"train_loss": -29.103031158447266, "global_step": 19897, "epoch": 164} {"train_loss": -29.50977897644043, "global_step": 19898, "epoch": 164} {"train_loss": -29.032968521118164, "global_step": 19899, "epoch": 164} {"train_loss": -27.218921661376953, "global_step": 19900, "epoch": 164} {"train_loss": -25.74118995666504, "global_step": 19901, "epoch": 164} {"train_loss": -24.932025909423828, "global_step": 19902, "epoch": 164} {"train_loss": -27.2955265045166, "global_step": 19903, "epoch": 164} {"train_loss": -29.533523559570312, "global_step": 19904, "epoch": 164} {"train_loss": -28.549259185791016, "global_step": 19905, "epoch": 164} {"train_loss": -28.9329776763916, "global_step": 19906, "epoch": 164} {"train_loss": -30.20652198791504, "global_step": 19907, "epoch": 164} {"train_loss": -28.882368087768555, "global_step": 19908, "epoch": 164} {"train_loss": -29.374052047729492, "global_step": 19909, "epoch": 164} {"train_loss": -28.992874145507812, "global_step": 19910, "epoch": 164} {"train_loss": -29.240615844726562, "global_step": 19911, "epoch": 164} {"train_loss": -28.699731826782227, "global_step": 19912, "epoch": 164} {"train_loss": -29.48345375061035, "global_step": 19913, "epoch": 164} {"train_loss": -28.970661163330078, "global_step": 19914, "epoch": 164} {"train_loss": -29.297903060913086, "global_step": 19915, "epoch": 164} {"train_loss": -28.99897575378418, "global_step": 19916, "epoch": 164} {"train_loss": -29.221521377563477, "global_step": 19917, "epoch": 164} {"train_loss": -29.37481689453125, "global_step": 19918, "epoch": 164} {"train_loss": -29.656904220581055, "global_step": 19919, "epoch": 164} {"train_loss": -29.432926177978516, "global_step": 19920, "epoch": 164} {"train_loss": -29.640411376953125, "global_step": 19921, "epoch": 164} {"train_loss": -30.03839683532715, "global_step": 19922, "epoch": 164} {"train_loss": -29.17841911315918, "global_step": 19923, "epoch": 164} {"train_loss": -29.283727645874023, "global_step": 19924, "epoch": 164} {"train_loss": -29.2623348236084, "global_step": 19925, "epoch": 164} {"train_loss": -29.802343368530273, "global_step": 19926, "epoch": 164} {"train_loss": -28.99247169494629, "global_step": 19927, "epoch": 164} {"train_loss": -29.446338653564453, "global_step": 19928, "epoch": 164} {"train_loss": -30.01943016052246, "global_step": 19929, "epoch": 164} {"train_loss": -29.457569122314453, "global_step": 19930, "epoch": 164} {"train_loss": -29.7150936126709, "global_step": 19931, "epoch": 164} {"train_loss": -29.901046752929688, "global_step": 19932, "epoch": 164} {"train_loss": -29.742990493774414, "global_step": 19933, "epoch": 164} {"train_loss": -29.844106674194336, "global_step": 19934, "epoch": 164} {"train_loss": -29.7626895904541, "global_step": 19935, "epoch": 164} {"train_loss": -29.712366104125977, "global_step": 19936, "epoch": 164} {"train_loss": -29.098310470581055, "global_step": 19937, "epoch": 164} {"train_loss": -28.8664608001709, "global_step": 19938, "epoch": 164} {"train_loss": -29.703617095947266, "global_step": 19939, "epoch": 164} {"train_loss": -30.006677627563477, "global_step": 19940, "epoch": 164} {"train_loss": -30.381872177124023, "global_step": 19941, "epoch": 164} {"train_loss": -29.735288619995117, "global_step": 19942, "epoch": 164} {"train_loss": -29.58978271484375, "global_step": 19943, "epoch": 164} {"train_loss": -28.638809204101562, "global_step": 19944, "epoch": 164} {"train_loss": -27.823474884033203, "global_step": 19945, "epoch": 164} {"train_loss": -25.925201416015625, "global_step": 19946, "epoch": 164} {"train_loss": -23.562002182006836, "global_step": 19947, "epoch": 164} {"train_loss": -24.865217208862305, "global_step": 19948, "epoch": 164} {"train_loss": -28.10079002380371, "global_step": 19949, "epoch": 164} {"train_loss": -28.96908950805664, "global_step": 19950, "epoch": 164} {"train_loss": -27.814184188842773, "global_step": 19951, "epoch": 164} {"train_loss": -29.484350204467773, "global_step": 19952, "epoch": 164} {"train_loss": -28.366010665893555, "global_step": 19953, "epoch": 164} {"train_loss": -29.876575469970703, "global_step": 19954, "epoch": 164} {"train_loss": -29.2861270904541, "global_step": 19955, "epoch": 164} {"train_loss": -28.367956161499023, "global_step": 19956, "epoch": 164} {"train_loss": -29.917795181274414, "global_step": 19957, "epoch": 164} {"train_loss": -29.5864315032959, "global_step": 19958, "epoch": 164} {"train_loss": -29.42463493347168, "global_step": 19959, "epoch": 164} {"train_loss": -29.004613876342773, "global_step": 19960, "epoch": 164} {"train_loss": -29.29537010192871, "global_step": 19961, "epoch": 164} {"train_loss": -29.393264770507812, "global_step": 19962, "epoch": 164} {"train_loss": -29.627729415893555, "global_step": 19963, "epoch": 164} {"train_loss": -29.226977135524276, "global_step": 19964, "epoch": 164, "val_loss": 2736780.25} {"train_loss": -29.372465133666992, "global_step": 19965, "epoch": 165} {"train_loss": -29.998010635375977, "global_step": 19966, "epoch": 165} {"train_loss": -29.4278621673584, "global_step": 19967, "epoch": 165} {"train_loss": -29.51484489440918, "global_step": 19968, "epoch": 165} {"train_loss": -29.357030868530273, "global_step": 19969, "epoch": 165} {"train_loss": -29.710432052612305, "global_step": 19970, "epoch": 165} {"train_loss": -29.640317916870117, "global_step": 19971, "epoch": 165} {"train_loss": -29.8410701751709, "global_step": 19972, "epoch": 165} {"train_loss": -29.21942710876465, "global_step": 19973, "epoch": 165} {"train_loss": -29.88844108581543, "global_step": 19974, "epoch": 165} {"train_loss": -29.669668197631836, "global_step": 19975, "epoch": 165} {"train_loss": -29.568958282470703, "global_step": 19976, "epoch": 165} {"train_loss": -29.585920333862305, "global_step": 19977, "epoch": 165} {"train_loss": -29.791584014892578, "global_step": 19978, "epoch": 165} {"train_loss": -29.515277862548828, "global_step": 19979, "epoch": 165} {"train_loss": -29.587451934814453, "global_step": 19980, "epoch": 165} {"train_loss": -28.854761123657227, "global_step": 19981, "epoch": 165} {"train_loss": -28.8616886138916, "global_step": 19982, "epoch": 165} {"train_loss": -29.159208297729492, "global_step": 19983, "epoch": 165} {"train_loss": -29.08552360534668, "global_step": 19984, "epoch": 165} {"train_loss": -28.58643913269043, "global_step": 19985, "epoch": 165} {"train_loss": -29.1242733001709, "global_step": 19986, "epoch": 165} {"train_loss": -28.130878448486328, "global_step": 19987, "epoch": 165} {"train_loss": -28.830713272094727, "global_step": 19988, "epoch": 165} {"train_loss": -29.505136489868164, "global_step": 19989, "epoch": 165} {"train_loss": -30.053075790405273, "global_step": 19990, "epoch": 165} {"train_loss": -29.16925048828125, "global_step": 19991, "epoch": 165} {"train_loss": -28.440704345703125, "global_step": 19992, "epoch": 165} {"train_loss": -29.150527954101562, "global_step": 19993, "epoch": 165} {"train_loss": -30.165546417236328, "global_step": 19994, "epoch": 165} {"train_loss": -29.6666259765625, "global_step": 19995, "epoch": 165} {"train_loss": -29.38490104675293, "global_step": 19996, "epoch": 165} {"train_loss": -29.5190486907959, "global_step": 19997, "epoch": 165} {"train_loss": -28.75531005859375, "global_step": 19998, "epoch": 165} {"train_loss": -29.631128311157227, "global_step": 19999, "epoch": 165} {"train_loss": -29.731128692626953, "global_step": 20000, "epoch": 165} {"train_loss": -29.469512939453125, "global_step": 20001, "epoch": 165} {"train_loss": -30.02003288269043, "global_step": 20002, "epoch": 165} {"train_loss": -29.88837242126465, "global_step": 20003, "epoch": 165} {"train_loss": -29.700082778930664, "global_step": 20004, "epoch": 165} {"train_loss": -29.863784790039062, "global_step": 20005, "epoch": 165} {"train_loss": -29.847095489501953, "global_step": 20006, "epoch": 165} {"train_loss": -29.9692325592041, "global_step": 20007, "epoch": 165} {"train_loss": -29.925235748291016, "global_step": 20008, "epoch": 165} {"train_loss": -29.661487579345703, "global_step": 20009, "epoch": 165} {"train_loss": -29.94097900390625, "global_step": 20010, "epoch": 165} {"train_loss": -29.641464233398438, "global_step": 20011, "epoch": 165} {"train_loss": -29.842870712280273, "global_step": 20012, "epoch": 165} {"train_loss": -30.265165328979492, "global_step": 20013, "epoch": 165} {"train_loss": -29.11151695251465, "global_step": 20014, "epoch": 165} {"train_loss": -30.18731117248535, "global_step": 20015, "epoch": 165} {"train_loss": -30.220041275024414, "global_step": 20016, "epoch": 165} {"train_loss": -29.77313804626465, "global_step": 20017, "epoch": 165} {"train_loss": -30.155715942382812, "global_step": 20018, "epoch": 165} {"train_loss": -29.800983428955078, "global_step": 20019, "epoch": 165} {"train_loss": -30.306013107299805, "global_step": 20020, "epoch": 165} {"train_loss": -30.17717933654785, "global_step": 20021, "epoch": 165} {"train_loss": -30.089202880859375, "global_step": 20022, "epoch": 165} {"train_loss": -29.274938583374023, "global_step": 20023, "epoch": 165} {"train_loss": -29.186750411987305, "global_step": 20024, "epoch": 165} {"train_loss": -27.7632999420166, "global_step": 20025, "epoch": 165} {"train_loss": -26.12660026550293, "global_step": 20026, "epoch": 165} {"train_loss": -24.230260848999023, "global_step": 20027, "epoch": 165} {"train_loss": -20.399503707885742, "global_step": 20028, "epoch": 165} {"train_loss": -19.77540397644043, "global_step": 20029, "epoch": 165} {"train_loss": -27.785730361938477, "global_step": 20030, "epoch": 165} {"train_loss": -26.980060577392578, "global_step": 20031, "epoch": 165} {"train_loss": -27.795042037963867, "global_step": 20032, "epoch": 165} {"train_loss": -26.633508682250977, "global_step": 20033, "epoch": 165} {"train_loss": -28.929975509643555, "global_step": 20034, "epoch": 165} {"train_loss": -26.95871925354004, "global_step": 20035, "epoch": 165} {"train_loss": -29.175100326538086, "global_step": 20036, "epoch": 165} {"train_loss": -28.799463272094727, "global_step": 20037, "epoch": 165} {"train_loss": -27.831212997436523, "global_step": 20038, "epoch": 165} {"train_loss": -29.031116485595703, "global_step": 20039, "epoch": 165} {"train_loss": -28.78993034362793, "global_step": 20040, "epoch": 165} {"train_loss": -28.285795211791992, "global_step": 20041, "epoch": 165} {"train_loss": -27.995359420776367, "global_step": 20042, "epoch": 165} {"train_loss": -29.38296890258789, "global_step": 20043, "epoch": 165} {"train_loss": -29.223180770874023, "global_step": 20044, "epoch": 165} {"train_loss": -29.211889266967773, "global_step": 20045, "epoch": 165} {"train_loss": -28.5620174407959, "global_step": 20046, "epoch": 165} {"train_loss": -29.427350997924805, "global_step": 20047, "epoch": 165} {"train_loss": -29.79619789123535, "global_step": 20048, "epoch": 165} {"train_loss": -29.613082885742188, "global_step": 20049, "epoch": 165} {"train_loss": -29.053735733032227, "global_step": 20050, "epoch": 165} {"train_loss": -29.662744522094727, "global_step": 20051, "epoch": 165} {"train_loss": -29.322233200073242, "global_step": 20052, "epoch": 165} {"train_loss": -29.949451446533203, "global_step": 20053, "epoch": 165} {"train_loss": -29.894189834594727, "global_step": 20054, "epoch": 165} {"train_loss": -29.4265079498291, "global_step": 20055, "epoch": 165} {"train_loss": -29.700525283813477, "global_step": 20056, "epoch": 165} {"train_loss": -29.560516357421875, "global_step": 20057, "epoch": 165} {"train_loss": -29.96229362487793, "global_step": 20058, "epoch": 165} {"train_loss": -30.15289306640625, "global_step": 20059, "epoch": 165} {"train_loss": -29.621280670166016, "global_step": 20060, "epoch": 165} {"train_loss": -29.114355087280273, "global_step": 20061, "epoch": 165} {"train_loss": -29.4644832611084, "global_step": 20062, "epoch": 165} {"train_loss": -29.691192626953125, "global_step": 20063, "epoch": 165} {"train_loss": -29.492816925048828, "global_step": 20064, "epoch": 165} {"train_loss": -29.720748901367188, "global_step": 20065, "epoch": 165} {"train_loss": -29.666217803955078, "global_step": 20066, "epoch": 165} {"train_loss": -29.62158203125, "global_step": 20067, "epoch": 165} {"train_loss": -28.941633224487305, "global_step": 20068, "epoch": 165} {"train_loss": -24.369779586791992, "global_step": 20069, "epoch": 165} {"train_loss": -13.393950462341309, "global_step": 20070, "epoch": 165} {"train_loss": 8.294074058532715, "global_step": 20071, "epoch": 165} {"train_loss": -0.10507746040821075, "global_step": 20072, "epoch": 165} {"train_loss": -28.210113525390625, "global_step": 20073, "epoch": 165} {"train_loss": -16.071868896484375, "global_step": 20074, "epoch": 165} {"train_loss": -26.28249168395996, "global_step": 20075, "epoch": 165} {"train_loss": -26.521631240844727, "global_step": 20076, "epoch": 165} {"train_loss": -23.02694320678711, "global_step": 20077, "epoch": 165} {"train_loss": -25.15437889099121, "global_step": 20078, "epoch": 165} {"train_loss": -27.71329116821289, "global_step": 20079, "epoch": 165} {"train_loss": -27.904296875, "global_step": 20080, "epoch": 165} {"train_loss": -26.85382652282715, "global_step": 20081, "epoch": 165} {"train_loss": -26.59162712097168, "global_step": 20082, "epoch": 165} {"train_loss": -27.040496826171875, "global_step": 20083, "epoch": 165} {"train_loss": -27.033618927001953, "global_step": 20084, "epoch": 165} {"train_loss": -28.010414467985964, "global_step": 20085, "epoch": 165, "val_loss": 2599045.0} {"train_loss": -27.9551944732666, "global_step": 20086, "epoch": 166} {"train_loss": -27.413293838500977, "global_step": 20087, "epoch": 166} {"train_loss": -28.136884689331055, "global_step": 20088, "epoch": 166} {"train_loss": -27.959228515625, "global_step": 20089, "epoch": 166} {"train_loss": -27.652570724487305, "global_step": 20090, "epoch": 166} {"train_loss": -28.076831817626953, "global_step": 20091, "epoch": 166} {"train_loss": -27.617528915405273, "global_step": 20092, "epoch": 166} {"train_loss": -28.303491592407227, "global_step": 20093, "epoch": 166} {"train_loss": -28.024805068969727, "global_step": 20094, "epoch": 166} {"train_loss": -28.28839683532715, "global_step": 20095, "epoch": 166} {"train_loss": -28.510089874267578, "global_step": 20096, "epoch": 166} {"train_loss": -28.666528701782227, "global_step": 20097, "epoch": 166} {"train_loss": -28.217166900634766, "global_step": 20098, "epoch": 166} {"train_loss": -28.67169761657715, "global_step": 20099, "epoch": 166} {"train_loss": -28.54619789123535, "global_step": 20100, "epoch": 166} {"train_loss": -28.28335952758789, "global_step": 20101, "epoch": 166} {"train_loss": -28.821792602539062, "global_step": 20102, "epoch": 166} {"train_loss": -28.82075309753418, "global_step": 20103, "epoch": 166} {"train_loss": -28.67071533203125, "global_step": 20104, "epoch": 166} {"train_loss": -28.4664306640625, "global_step": 20105, "epoch": 166} {"train_loss": -28.722400665283203, "global_step": 20106, "epoch": 166} {"train_loss": -29.122915267944336, "global_step": 20107, "epoch": 166} {"train_loss": -29.00092124938965, "global_step": 20108, "epoch": 166} {"train_loss": -29.141345977783203, "global_step": 20109, "epoch": 166} {"train_loss": -29.289905548095703, "global_step": 20110, "epoch": 166} {"train_loss": -28.61443519592285, "global_step": 20111, "epoch": 166} {"train_loss": -28.179428100585938, "global_step": 20112, "epoch": 166} {"train_loss": -28.999893188476562, "global_step": 20113, "epoch": 166} {"train_loss": -28.610000610351562, "global_step": 20114, "epoch": 166} {"train_loss": -29.12060546875, "global_step": 20115, "epoch": 166} {"train_loss": -28.706573486328125, "global_step": 20116, "epoch": 166} {"train_loss": -28.774641036987305, "global_step": 20117, "epoch": 166} {"train_loss": -28.36030387878418, "global_step": 20118, "epoch": 166} {"train_loss": -28.566930770874023, "global_step": 20119, "epoch": 166} {"train_loss": -28.16497230529785, "global_step": 20120, "epoch": 166} {"train_loss": -27.78704261779785, "global_step": 20121, "epoch": 166} {"train_loss": -27.64381980895996, "global_step": 20122, "epoch": 166} {"train_loss": -29.2709903717041, "global_step": 20123, "epoch": 166} {"train_loss": -28.246923446655273, "global_step": 20124, "epoch": 166} {"train_loss": -27.779569625854492, "global_step": 20125, "epoch": 166} {"train_loss": -26.11494255065918, "global_step": 20126, "epoch": 166} {"train_loss": -24.91374397277832, "global_step": 20127, "epoch": 166} {"train_loss": -25.81485939025879, "global_step": 20128, "epoch": 166} {"train_loss": -26.681015014648438, "global_step": 20129, "epoch": 166} {"train_loss": -27.331695556640625, "global_step": 20130, "epoch": 166} {"train_loss": -26.5946044921875, "global_step": 20131, "epoch": 166} {"train_loss": -28.622854232788086, "global_step": 20132, "epoch": 166} {"train_loss": -27.427515029907227, "global_step": 20133, "epoch": 166} {"train_loss": -28.49433708190918, "global_step": 20134, "epoch": 166} {"train_loss": -27.68710708618164, "global_step": 20135, "epoch": 166} {"train_loss": -28.472440719604492, "global_step": 20136, "epoch": 166} {"train_loss": -27.965057373046875, "global_step": 20137, "epoch": 166} {"train_loss": -28.474811553955078, "global_step": 20138, "epoch": 166} {"train_loss": -28.305051803588867, "global_step": 20139, "epoch": 166} {"train_loss": -27.95361328125, "global_step": 20140, "epoch": 166} {"train_loss": -28.435888290405273, "global_step": 20141, "epoch": 166} {"train_loss": -28.231237411499023, "global_step": 20142, "epoch": 166} {"train_loss": -28.5151309967041, "global_step": 20143, "epoch": 166} {"train_loss": -28.458881378173828, "global_step": 20144, "epoch": 166} {"train_loss": -28.520904541015625, "global_step": 20145, "epoch": 166} {"train_loss": -28.501306533813477, "global_step": 20146, "epoch": 166} {"train_loss": -28.186767578125, "global_step": 20147, "epoch": 166} {"train_loss": -28.60843849182129, "global_step": 20148, "epoch": 166} {"train_loss": -28.144733428955078, "global_step": 20149, "epoch": 166} {"train_loss": -28.85025978088379, "global_step": 20150, "epoch": 166} {"train_loss": -28.95358657836914, "global_step": 20151, "epoch": 166} {"train_loss": -28.96893310546875, "global_step": 20152, "epoch": 166} {"train_loss": -28.528295516967773, "global_step": 20153, "epoch": 166} {"train_loss": -28.4576416015625, "global_step": 20154, "epoch": 166} {"train_loss": -29.0408992767334, "global_step": 20155, "epoch": 166} {"train_loss": -29.54351234436035, "global_step": 20156, "epoch": 166} {"train_loss": -29.074426651000977, "global_step": 20157, "epoch": 166} {"train_loss": -28.93424415588379, "global_step": 20158, "epoch": 166} {"train_loss": -28.715734481811523, "global_step": 20159, "epoch": 166} {"train_loss": -29.163679122924805, "global_step": 20160, "epoch": 166} {"train_loss": -28.96489906311035, "global_step": 20161, "epoch": 166} {"train_loss": -29.40004539489746, "global_step": 20162, "epoch": 166} {"train_loss": -29.2040958404541, "global_step": 20163, "epoch": 166} {"train_loss": -29.153797149658203, "global_step": 20164, "epoch": 166} {"train_loss": -28.896764755249023, "global_step": 20165, "epoch": 166} {"train_loss": -28.8414363861084, "global_step": 20166, "epoch": 166} {"train_loss": -29.413330078125, "global_step": 20167, "epoch": 166} {"train_loss": -29.198965072631836, "global_step": 20168, "epoch": 166} {"train_loss": -28.855390548706055, "global_step": 20169, "epoch": 166} {"train_loss": -29.201419830322266, "global_step": 20170, "epoch": 166} {"train_loss": -29.314163208007812, "global_step": 20171, "epoch": 166} {"train_loss": -29.3713321685791, "global_step": 20172, "epoch": 166} {"train_loss": -28.776813507080078, "global_step": 20173, "epoch": 166} {"train_loss": -29.07460594177246, "global_step": 20174, "epoch": 166} {"train_loss": -29.015966415405273, "global_step": 20175, "epoch": 166} {"train_loss": -29.53853416442871, "global_step": 20176, "epoch": 166} {"train_loss": -29.084753036499023, "global_step": 20177, "epoch": 166} {"train_loss": -28.897916793823242, "global_step": 20178, "epoch": 166} {"train_loss": -29.368093490600586, "global_step": 20179, "epoch": 166} {"train_loss": -29.40388298034668, "global_step": 20180, "epoch": 166} {"train_loss": -29.204870223999023, "global_step": 20181, "epoch": 166} {"train_loss": -29.13642692565918, "global_step": 20182, "epoch": 166} {"train_loss": -28.581823348999023, "global_step": 20183, "epoch": 166} {"train_loss": -28.925735473632812, "global_step": 20184, "epoch": 166} {"train_loss": -28.31337547302246, "global_step": 20185, "epoch": 166} {"train_loss": -27.810876846313477, "global_step": 20186, "epoch": 166} {"train_loss": -29.0718994140625, "global_step": 20187, "epoch": 166} {"train_loss": -28.26251792907715, "global_step": 20188, "epoch": 166} {"train_loss": -28.94394874572754, "global_step": 20189, "epoch": 166} {"train_loss": -28.6586971282959, "global_step": 20190, "epoch": 166} {"train_loss": -28.451826095581055, "global_step": 20191, "epoch": 166} {"train_loss": -28.67978858947754, "global_step": 20192, "epoch": 166} {"train_loss": -28.442304611206055, "global_step": 20193, "epoch": 166} {"train_loss": -29.264434814453125, "global_step": 20194, "epoch": 166} {"train_loss": -28.571918487548828, "global_step": 20195, "epoch": 166} {"train_loss": -28.910511016845703, "global_step": 20196, "epoch": 166} {"train_loss": -29.471527099609375, "global_step": 20197, "epoch": 166} {"train_loss": -29.19437599182129, "global_step": 20198, "epoch": 166} {"train_loss": -29.343332290649414, "global_step": 20199, "epoch": 166} {"train_loss": -29.095932006835938, "global_step": 20200, "epoch": 166} {"train_loss": -29.51372718811035, "global_step": 20201, "epoch": 166} {"train_loss": -29.60138511657715, "global_step": 20202, "epoch": 166} {"train_loss": -29.35283851623535, "global_step": 20203, "epoch": 166} {"train_loss": -29.364551544189453, "global_step": 20204, "epoch": 166} {"train_loss": -28.780893325805664, "global_step": 20205, "epoch": 166} {"train_loss": -28.570047930252453, "global_step": 20206, "epoch": 166, "val_loss": 2683974.0} {"train_loss": -29.965076446533203, "global_step": 20207, "epoch": 167} {"train_loss": -29.59588050842285, "global_step": 20208, "epoch": 167} {"train_loss": -29.168354034423828, "global_step": 20209, "epoch": 167} {"train_loss": -29.073835372924805, "global_step": 20210, "epoch": 167} {"train_loss": -29.17721939086914, "global_step": 20211, "epoch": 167} {"train_loss": -28.2482852935791, "global_step": 20212, "epoch": 167} {"train_loss": -27.285383224487305, "global_step": 20213, "epoch": 167} {"train_loss": -29.2658748626709, "global_step": 20214, "epoch": 167} {"train_loss": -28.904132843017578, "global_step": 20215, "epoch": 167} {"train_loss": -29.325687408447266, "global_step": 20216, "epoch": 167} {"train_loss": -29.413549423217773, "global_step": 20217, "epoch": 167} {"train_loss": -29.213891983032227, "global_step": 20218, "epoch": 167} {"train_loss": -28.767166137695312, "global_step": 20219, "epoch": 167} {"train_loss": -29.337757110595703, "global_step": 20220, "epoch": 167} {"train_loss": -29.650068283081055, "global_step": 20221, "epoch": 167} {"train_loss": -29.049909591674805, "global_step": 20222, "epoch": 167} {"train_loss": -29.749181747436523, "global_step": 20223, "epoch": 167} {"train_loss": -28.973169326782227, "global_step": 20224, "epoch": 167} {"train_loss": -29.603336334228516, "global_step": 20225, "epoch": 167} {"train_loss": -29.470611572265625, "global_step": 20226, "epoch": 167} {"train_loss": -29.270654678344727, "global_step": 20227, "epoch": 167} {"train_loss": -29.647552490234375, "global_step": 20228, "epoch": 167} {"train_loss": -29.478900909423828, "global_step": 20229, "epoch": 167} {"train_loss": -29.69196891784668, "global_step": 20230, "epoch": 167} {"train_loss": -29.30908203125, "global_step": 20231, "epoch": 167} {"train_loss": -29.614593505859375, "global_step": 20232, "epoch": 167} {"train_loss": -29.34588050842285, "global_step": 20233, "epoch": 167} {"train_loss": -29.4095516204834, "global_step": 20234, "epoch": 167} {"train_loss": -29.2093563079834, "global_step": 20235, "epoch": 167} {"train_loss": -30.274072647094727, "global_step": 20236, "epoch": 167} {"train_loss": -30.0849609375, "global_step": 20237, "epoch": 167} {"train_loss": -27.86834716796875, "global_step": 20238, "epoch": 167} {"train_loss": -25.204639434814453, "global_step": 20239, "epoch": 167} {"train_loss": -21.6087589263916, "global_step": 20240, "epoch": 167} {"train_loss": -22.22157096862793, "global_step": 20241, "epoch": 167} {"train_loss": -26.4073486328125, "global_step": 20242, "epoch": 167} {"train_loss": -23.815570831298828, "global_step": 20243, "epoch": 167} {"train_loss": -26.6384220123291, "global_step": 20244, "epoch": 167} {"train_loss": -27.563480377197266, "global_step": 20245, "epoch": 167} {"train_loss": -26.860036849975586, "global_step": 20246, "epoch": 167} {"train_loss": -26.786396026611328, "global_step": 20247, "epoch": 167} {"train_loss": -28.8261661529541, "global_step": 20248, "epoch": 167} {"train_loss": -28.405054092407227, "global_step": 20249, "epoch": 167} {"train_loss": -28.1811580657959, "global_step": 20250, "epoch": 167} {"train_loss": -28.17380142211914, "global_step": 20251, "epoch": 167} {"train_loss": -28.91840171813965, "global_step": 20252, "epoch": 167} {"train_loss": -28.029510498046875, "global_step": 20253, "epoch": 167} {"train_loss": -29.065353393554688, "global_step": 20254, "epoch": 167} {"train_loss": -28.73784828186035, "global_step": 20255, "epoch": 167} {"train_loss": -28.871931076049805, "global_step": 20256, "epoch": 167} {"train_loss": -29.054418563842773, "global_step": 20257, "epoch": 167} {"train_loss": -28.64170265197754, "global_step": 20258, "epoch": 167} {"train_loss": -28.981595993041992, "global_step": 20259, "epoch": 167} {"train_loss": -28.974164962768555, "global_step": 20260, "epoch": 167} {"train_loss": -29.085742950439453, "global_step": 20261, "epoch": 167} {"train_loss": -28.99383544921875, "global_step": 20262, "epoch": 167} {"train_loss": -29.127399444580078, "global_step": 20263, "epoch": 167} {"train_loss": -29.237707138061523, "global_step": 20264, "epoch": 167} {"train_loss": -29.04878044128418, "global_step": 20265, "epoch": 167} {"train_loss": -28.899152755737305, "global_step": 20266, "epoch": 167} {"train_loss": -28.85605239868164, "global_step": 20267, "epoch": 167} {"train_loss": -29.019287109375, "global_step": 20268, "epoch": 167} {"train_loss": -28.501708984375, "global_step": 20269, "epoch": 167} {"train_loss": -28.660364151000977, "global_step": 20270, "epoch": 167} {"train_loss": -28.323440551757812, "global_step": 20271, "epoch": 167} {"train_loss": -29.5413875579834, "global_step": 20272, "epoch": 167} {"train_loss": -28.4757022857666, "global_step": 20273, "epoch": 167} {"train_loss": -29.47310447692871, "global_step": 20274, "epoch": 167} {"train_loss": -28.64723777770996, "global_step": 20275, "epoch": 167} {"train_loss": -28.699682235717773, "global_step": 20276, "epoch": 167} {"train_loss": -29.397907257080078, "global_step": 20277, "epoch": 167} {"train_loss": -29.29817008972168, "global_step": 20278, "epoch": 167} {"train_loss": -29.718515396118164, "global_step": 20279, "epoch": 167} {"train_loss": -29.432132720947266, "global_step": 20280, "epoch": 167} {"train_loss": -29.489511489868164, "global_step": 20281, "epoch": 167} {"train_loss": -29.36130142211914, "global_step": 20282, "epoch": 167} {"train_loss": -29.051889419555664, "global_step": 20283, "epoch": 167} {"train_loss": -29.431991577148438, "global_step": 20284, "epoch": 167} {"train_loss": -29.411102294921875, "global_step": 20285, "epoch": 167} {"train_loss": -29.2459774017334, "global_step": 20286, "epoch": 167} {"train_loss": -29.718732833862305, "global_step": 20287, "epoch": 167} {"train_loss": -29.64284324645996, "global_step": 20288, "epoch": 167} {"train_loss": -29.56989097595215, "global_step": 20289, "epoch": 167} {"train_loss": -29.0926456451416, "global_step": 20290, "epoch": 167} {"train_loss": -29.897491455078125, "global_step": 20291, "epoch": 167} {"train_loss": -29.271474838256836, "global_step": 20292, "epoch": 167} {"train_loss": -29.35528564453125, "global_step": 20293, "epoch": 167} {"train_loss": -29.513463973999023, "global_step": 20294, "epoch": 167} {"train_loss": -29.548038482666016, "global_step": 20295, "epoch": 167} {"train_loss": -29.32217788696289, "global_step": 20296, "epoch": 167} {"train_loss": -29.397058486938477, "global_step": 20297, "epoch": 167} {"train_loss": -29.771825790405273, "global_step": 20298, "epoch": 167} {"train_loss": -29.437231063842773, "global_step": 20299, "epoch": 167} {"train_loss": -29.234272003173828, "global_step": 20300, "epoch": 167} {"train_loss": -29.896015167236328, "global_step": 20301, "epoch": 167} {"train_loss": -29.79144287109375, "global_step": 20302, "epoch": 167} {"train_loss": -29.5999698638916, "global_step": 20303, "epoch": 167} {"train_loss": -29.954633712768555, "global_step": 20304, "epoch": 167} {"train_loss": -29.810110092163086, "global_step": 20305, "epoch": 167} {"train_loss": -29.651397705078125, "global_step": 20306, "epoch": 167} {"train_loss": -29.876239776611328, "global_step": 20307, "epoch": 167} {"train_loss": -30.063974380493164, "global_step": 20308, "epoch": 167} {"train_loss": -30.012807846069336, "global_step": 20309, "epoch": 167} {"train_loss": -29.819726943969727, "global_step": 20310, "epoch": 167} {"train_loss": -29.939453125, "global_step": 20311, "epoch": 167} {"train_loss": -30.249042510986328, "global_step": 20312, "epoch": 167} {"train_loss": -30.06100845336914, "global_step": 20313, "epoch": 167} {"train_loss": -30.131610870361328, "global_step": 20314, "epoch": 167} {"train_loss": -30.514892578125, "global_step": 20315, "epoch": 167} {"train_loss": -30.220672607421875, "global_step": 20316, "epoch": 167} {"train_loss": -30.12440299987793, "global_step": 20317, "epoch": 167} {"train_loss": -30.113351821899414, "global_step": 20318, "epoch": 167} {"train_loss": -30.37013816833496, "global_step": 20319, "epoch": 167} {"train_loss": -30.23699951171875, "global_step": 20320, "epoch": 167} {"train_loss": -29.9190673828125, "global_step": 20321, "epoch": 167} {"train_loss": -30.0678653717041, "global_step": 20322, "epoch": 167} {"train_loss": -29.906518936157227, "global_step": 20323, "epoch": 167} {"train_loss": -29.059385299682617, "global_step": 20324, "epoch": 167} {"train_loss": -28.70069694519043, "global_step": 20325, "epoch": 167} {"train_loss": -30.253355026245117, "global_step": 20326, "epoch": 167} {"train_loss": -29.033880706661005, "global_step": 20327, "epoch": 167, "val_loss": 2586501.0} {"train_loss": -29.298065185546875, "global_step": 20328, "epoch": 168} {"train_loss": -28.40201187133789, "global_step": 20329, "epoch": 168} {"train_loss": -29.634052276611328, "global_step": 20330, "epoch": 168} {"train_loss": -29.73206901550293, "global_step": 20331, "epoch": 168} {"train_loss": -28.928049087524414, "global_step": 20332, "epoch": 168} {"train_loss": -28.9663028717041, "global_step": 20333, "epoch": 168} {"train_loss": -29.16126823425293, "global_step": 20334, "epoch": 168} {"train_loss": -28.817752838134766, "global_step": 20335, "epoch": 168} {"train_loss": -29.633962631225586, "global_step": 20336, "epoch": 168} {"train_loss": -29.7095890045166, "global_step": 20337, "epoch": 168} {"train_loss": -28.14055824279785, "global_step": 20338, "epoch": 168} {"train_loss": -28.583532333374023, "global_step": 20339, "epoch": 168} {"train_loss": -29.936288833618164, "global_step": 20340, "epoch": 168} {"train_loss": -29.406219482421875, "global_step": 20341, "epoch": 168} {"train_loss": -29.362878799438477, "global_step": 20342, "epoch": 168} {"train_loss": -29.967761993408203, "global_step": 20343, "epoch": 168} {"train_loss": -29.20450782775879, "global_step": 20344, "epoch": 168} {"train_loss": -29.483484268188477, "global_step": 20345, "epoch": 168} {"train_loss": -29.9322509765625, "global_step": 20346, "epoch": 168} {"train_loss": -29.496702194213867, "global_step": 20347, "epoch": 168} {"train_loss": -28.96158218383789, "global_step": 20348, "epoch": 168} {"train_loss": -29.58320426940918, "global_step": 20349, "epoch": 168} {"train_loss": -29.966825485229492, "global_step": 20350, "epoch": 168} {"train_loss": -30.146509170532227, "global_step": 20351, "epoch": 168} {"train_loss": -30.13218116760254, "global_step": 20352, "epoch": 168} {"train_loss": -29.398061752319336, "global_step": 20353, "epoch": 168} {"train_loss": -29.7872257232666, "global_step": 20354, "epoch": 168} {"train_loss": -30.318592071533203, "global_step": 20355, "epoch": 168} {"train_loss": -30.149051666259766, "global_step": 20356, "epoch": 168} {"train_loss": -30.4188175201416, "global_step": 20357, "epoch": 168} {"train_loss": -30.37188720703125, "global_step": 20358, "epoch": 168} {"train_loss": -30.320083618164062, "global_step": 20359, "epoch": 168} {"train_loss": -30.361597061157227, "global_step": 20360, "epoch": 168} {"train_loss": -30.348133087158203, "global_step": 20361, "epoch": 168} {"train_loss": -30.07233238220215, "global_step": 20362, "epoch": 168} {"train_loss": -29.9309139251709, "global_step": 20363, "epoch": 168} {"train_loss": -29.540918350219727, "global_step": 20364, "epoch": 168} {"train_loss": -29.94001579284668, "global_step": 20365, "epoch": 168} {"train_loss": -30.549640655517578, "global_step": 20366, "epoch": 168} {"train_loss": -30.159650802612305, "global_step": 20367, "epoch": 168} {"train_loss": -29.650434494018555, "global_step": 20368, "epoch": 168} {"train_loss": -29.508636474609375, "global_step": 20369, "epoch": 168} {"train_loss": -28.862884521484375, "global_step": 20370, "epoch": 168} {"train_loss": -28.773975372314453, "global_step": 20371, "epoch": 168} {"train_loss": -28.65656852722168, "global_step": 20372, "epoch": 168} {"train_loss": -29.32874870300293, "global_step": 20373, "epoch": 168} {"train_loss": -29.183837890625, "global_step": 20374, "epoch": 168} {"train_loss": -29.564701080322266, "global_step": 20375, "epoch": 168} {"train_loss": -30.218732833862305, "global_step": 20376, "epoch": 168} {"train_loss": -30.090299606323242, "global_step": 20377, "epoch": 168} {"train_loss": -30.45684814453125, "global_step": 20378, "epoch": 168} {"train_loss": -29.916996002197266, "global_step": 20379, "epoch": 168} {"train_loss": -30.172637939453125, "global_step": 20380, "epoch": 168} {"train_loss": -29.880374908447266, "global_step": 20381, "epoch": 168} {"train_loss": -29.78203773498535, "global_step": 20382, "epoch": 168} {"train_loss": -29.782468795776367, "global_step": 20383, "epoch": 168} {"train_loss": -29.49982261657715, "global_step": 20384, "epoch": 168} {"train_loss": -30.008901596069336, "global_step": 20385, "epoch": 168} {"train_loss": -29.555572509765625, "global_step": 20386, "epoch": 168} {"train_loss": -29.816816329956055, "global_step": 20387, "epoch": 168} {"train_loss": -30.249059677124023, "global_step": 20388, "epoch": 168} {"train_loss": -30.17597770690918, "global_step": 20389, "epoch": 168} {"train_loss": -30.233118057250977, "global_step": 20390, "epoch": 168} {"train_loss": -29.83538818359375, "global_step": 20391, "epoch": 168} {"train_loss": -30.05449867248535, "global_step": 20392, "epoch": 168} {"train_loss": -30.29953384399414, "global_step": 20393, "epoch": 168} {"train_loss": -30.54896354675293, "global_step": 20394, "epoch": 168} {"train_loss": -29.871137619018555, "global_step": 20395, "epoch": 168} {"train_loss": -30.25048828125, "global_step": 20396, "epoch": 168} {"train_loss": -30.37400245666504, "global_step": 20397, "epoch": 168} {"train_loss": -30.618011474609375, "global_step": 20398, "epoch": 168} {"train_loss": -30.21052360534668, "global_step": 20399, "epoch": 168} {"train_loss": -30.584394454956055, "global_step": 20400, "epoch": 168} {"train_loss": -30.056049346923828, "global_step": 20401, "epoch": 168} {"train_loss": -30.513376235961914, "global_step": 20402, "epoch": 168} {"train_loss": -29.701181411743164, "global_step": 20403, "epoch": 168} {"train_loss": -27.76896095275879, "global_step": 20404, "epoch": 168} {"train_loss": -20.616689682006836, "global_step": 20405, "epoch": 168} {"train_loss": -2.585925579071045, "global_step": 20406, "epoch": 168} {"train_loss": -3.600879430770874, "global_step": 20407, "epoch": 168} {"train_loss": -28.73276710510254, "global_step": 20408, "epoch": 168} {"train_loss": -19.971155166625977, "global_step": 20409, "epoch": 168} {"train_loss": -28.576501846313477, "global_step": 20410, "epoch": 168} {"train_loss": -25.540590286254883, "global_step": 20411, "epoch": 168} {"train_loss": -25.169614791870117, "global_step": 20412, "epoch": 168} {"train_loss": -28.162240982055664, "global_step": 20413, "epoch": 168} {"train_loss": -28.458276748657227, "global_step": 20414, "epoch": 168} {"train_loss": -27.504785537719727, "global_step": 20415, "epoch": 168} {"train_loss": -27.0474796295166, "global_step": 20416, "epoch": 168} {"train_loss": -28.0816650390625, "global_step": 20417, "epoch": 168} {"train_loss": -28.916105270385742, "global_step": 20418, "epoch": 168} {"train_loss": -28.54262351989746, "global_step": 20419, "epoch": 168} {"train_loss": -28.231678009033203, "global_step": 20420, "epoch": 168} {"train_loss": -28.237329483032227, "global_step": 20421, "epoch": 168} {"train_loss": -28.561115264892578, "global_step": 20422, "epoch": 168} {"train_loss": -28.8942928314209, "global_step": 20423, "epoch": 168} {"train_loss": -28.531509399414062, "global_step": 20424, "epoch": 168} {"train_loss": -29.011341094970703, "global_step": 20425, "epoch": 168} {"train_loss": -28.3737735748291, "global_step": 20426, "epoch": 168} {"train_loss": -28.696136474609375, "global_step": 20427, "epoch": 168} {"train_loss": -29.175968170166016, "global_step": 20428, "epoch": 168} {"train_loss": -28.744260787963867, "global_step": 20429, "epoch": 168} {"train_loss": -28.58217430114746, "global_step": 20430, "epoch": 168} {"train_loss": -29.110437393188477, "global_step": 20431, "epoch": 168} {"train_loss": -29.011859893798828, "global_step": 20432, "epoch": 168} {"train_loss": -29.696435928344727, "global_step": 20433, "epoch": 168} {"train_loss": -29.085256576538086, "global_step": 20434, "epoch": 168} {"train_loss": -29.619800567626953, "global_step": 20435, "epoch": 168} {"train_loss": -29.235498428344727, "global_step": 20436, "epoch": 168} {"train_loss": -29.68573570251465, "global_step": 20437, "epoch": 168} {"train_loss": -29.132843017578125, "global_step": 20438, "epoch": 168} {"train_loss": -29.51066017150879, "global_step": 20439, "epoch": 168} {"train_loss": -29.2471866607666, "global_step": 20440, "epoch": 168} {"train_loss": -29.92959976196289, "global_step": 20441, "epoch": 168} {"train_loss": -29.216779708862305, "global_step": 20442, "epoch": 168} {"train_loss": -29.750564575195312, "global_step": 20443, "epoch": 168} {"train_loss": -29.616291046142578, "global_step": 20444, "epoch": 168} {"train_loss": -29.786550521850586, "global_step": 20445, "epoch": 168} {"train_loss": -29.133031845092773, "global_step": 20446, "epoch": 168} {"train_loss": -29.61979103088379, "global_step": 20447, "epoch": 168} {"train_loss": -28.806222389552218, "global_step": 20448, "epoch": 168, "val_loss": 2645013.75} {"train_loss": -27.690942764282227, "global_step": 20449, "epoch": 169} {"train_loss": -25.60968017578125, "global_step": 20450, "epoch": 169} {"train_loss": -26.6527042388916, "global_step": 20451, "epoch": 169} {"train_loss": -29.141845703125, "global_step": 20452, "epoch": 169} {"train_loss": -28.17585563659668, "global_step": 20453, "epoch": 169} {"train_loss": -27.707242965698242, "global_step": 20454, "epoch": 169} {"train_loss": -29.253467559814453, "global_step": 20455, "epoch": 169} {"train_loss": -28.319494247436523, "global_step": 20456, "epoch": 169} {"train_loss": -29.06023597717285, "global_step": 20457, "epoch": 169} {"train_loss": -29.15986442565918, "global_step": 20458, "epoch": 169} {"train_loss": -28.87738037109375, "global_step": 20459, "epoch": 169} {"train_loss": -28.521574020385742, "global_step": 20460, "epoch": 169} {"train_loss": -29.1645450592041, "global_step": 20461, "epoch": 169} {"train_loss": -28.434247970581055, "global_step": 20462, "epoch": 169} {"train_loss": -28.52469825744629, "global_step": 20463, "epoch": 169} {"train_loss": -28.3344669342041, "global_step": 20464, "epoch": 169} {"train_loss": -29.79813003540039, "global_step": 20465, "epoch": 169} {"train_loss": -28.355117797851562, "global_step": 20466, "epoch": 169} {"train_loss": -29.548181533813477, "global_step": 20467, "epoch": 169} {"train_loss": -29.35986328125, "global_step": 20468, "epoch": 169} {"train_loss": -28.910017013549805, "global_step": 20469, "epoch": 169} {"train_loss": -28.764484405517578, "global_step": 20470, "epoch": 169} {"train_loss": -29.62615966796875, "global_step": 20471, "epoch": 169} {"train_loss": -29.1395320892334, "global_step": 20472, "epoch": 169} {"train_loss": -29.5185604095459, "global_step": 20473, "epoch": 169} {"train_loss": -29.648923873901367, "global_step": 20474, "epoch": 169} {"train_loss": -29.734716415405273, "global_step": 20475, "epoch": 169} {"train_loss": -29.931257247924805, "global_step": 20476, "epoch": 169} {"train_loss": -29.311080932617188, "global_step": 20477, "epoch": 169} {"train_loss": -29.47873306274414, "global_step": 20478, "epoch": 169} {"train_loss": -29.636035919189453, "global_step": 20479, "epoch": 169} {"train_loss": -29.54168701171875, "global_step": 20480, "epoch": 169} {"train_loss": -29.72820472717285, "global_step": 20481, "epoch": 169} {"train_loss": -30.111364364624023, "global_step": 20482, "epoch": 169} {"train_loss": -29.282806396484375, "global_step": 20483, "epoch": 169} {"train_loss": -28.777679443359375, "global_step": 20484, "epoch": 169} {"train_loss": -28.549833297729492, "global_step": 20485, "epoch": 169} {"train_loss": -29.728290557861328, "global_step": 20486, "epoch": 169} {"train_loss": -30.22297477722168, "global_step": 20487, "epoch": 169} {"train_loss": -29.295303344726562, "global_step": 20488, "epoch": 169} {"train_loss": -29.310461044311523, "global_step": 20489, "epoch": 169} {"train_loss": -29.343626022338867, "global_step": 20490, "epoch": 169} {"train_loss": -29.72321891784668, "global_step": 20491, "epoch": 169} {"train_loss": -29.653766632080078, "global_step": 20492, "epoch": 169} {"train_loss": -29.352283477783203, "global_step": 20493, "epoch": 169} {"train_loss": -28.70684814453125, "global_step": 20494, "epoch": 169} {"train_loss": -29.961206436157227, "global_step": 20495, "epoch": 169} {"train_loss": -30.00068473815918, "global_step": 20496, "epoch": 169} {"train_loss": -30.3779296875, "global_step": 20497, "epoch": 169} {"train_loss": -29.343414306640625, "global_step": 20498, "epoch": 169} {"train_loss": -29.139535903930664, "global_step": 20499, "epoch": 169} {"train_loss": -29.88563346862793, "global_step": 20500, "epoch": 169} {"train_loss": -29.466205596923828, "global_step": 20501, "epoch": 169} {"train_loss": -29.46319580078125, "global_step": 20502, "epoch": 169} {"train_loss": -29.354816436767578, "global_step": 20503, "epoch": 169} {"train_loss": -29.88185691833496, "global_step": 20504, "epoch": 169} {"train_loss": -29.399169921875, "global_step": 20505, "epoch": 169} {"train_loss": -29.915618896484375, "global_step": 20506, "epoch": 169} {"train_loss": -29.25037956237793, "global_step": 20507, "epoch": 169} {"train_loss": -29.35688591003418, "global_step": 20508, "epoch": 169} {"train_loss": -29.385602951049805, "global_step": 20509, "epoch": 169} {"train_loss": -29.116230010986328, "global_step": 20510, "epoch": 169} {"train_loss": -29.67237663269043, "global_step": 20511, "epoch": 169} {"train_loss": -28.189868927001953, "global_step": 20512, "epoch": 169} {"train_loss": -27.611875534057617, "global_step": 20513, "epoch": 169} {"train_loss": -28.94287109375, "global_step": 20514, "epoch": 169} {"train_loss": -28.118066787719727, "global_step": 20515, "epoch": 169} {"train_loss": -29.546920776367188, "global_step": 20516, "epoch": 169} {"train_loss": -28.3275089263916, "global_step": 20517, "epoch": 169} {"train_loss": -28.762121200561523, "global_step": 20518, "epoch": 169} {"train_loss": -28.6387939453125, "global_step": 20519, "epoch": 169} {"train_loss": -29.278135299682617, "global_step": 20520, "epoch": 169} {"train_loss": -29.787982940673828, "global_step": 20521, "epoch": 169} {"train_loss": -29.39703369140625, "global_step": 20522, "epoch": 169} {"train_loss": -29.147192001342773, "global_step": 20523, "epoch": 169} {"train_loss": -29.49432373046875, "global_step": 20524, "epoch": 169} {"train_loss": -29.266921997070312, "global_step": 20525, "epoch": 169} {"train_loss": -29.294492721557617, "global_step": 20526, "epoch": 169} {"train_loss": -29.167097091674805, "global_step": 20527, "epoch": 169} {"train_loss": -28.471790313720703, "global_step": 20528, "epoch": 169} {"train_loss": -29.41619300842285, "global_step": 20529, "epoch": 169} {"train_loss": -29.0147647857666, "global_step": 20530, "epoch": 169} {"train_loss": -29.79229736328125, "global_step": 20531, "epoch": 169} {"train_loss": -29.60235023498535, "global_step": 20532, "epoch": 169} {"train_loss": -29.361480712890625, "global_step": 20533, "epoch": 169} {"train_loss": -29.44605827331543, "global_step": 20534, "epoch": 169} {"train_loss": -29.548023223876953, "global_step": 20535, "epoch": 169} {"train_loss": -30.025558471679688, "global_step": 20536, "epoch": 169} {"train_loss": -29.856739044189453, "global_step": 20537, "epoch": 169} {"train_loss": -29.99981689453125, "global_step": 20538, "epoch": 169} {"train_loss": -29.516626358032227, "global_step": 20539, "epoch": 169} {"train_loss": -30.110218048095703, "global_step": 20540, "epoch": 169} {"train_loss": -29.74399185180664, "global_step": 20541, "epoch": 169} {"train_loss": -28.935958862304688, "global_step": 20542, "epoch": 169} {"train_loss": -29.639678955078125, "global_step": 20543, "epoch": 169} {"train_loss": -29.891849517822266, "global_step": 20544, "epoch": 169} {"train_loss": -29.7270565032959, "global_step": 20545, "epoch": 169} {"train_loss": -29.59299659729004, "global_step": 20546, "epoch": 169} {"train_loss": -29.578262329101562, "global_step": 20547, "epoch": 169} {"train_loss": -29.798444747924805, "global_step": 20548, "epoch": 169} {"train_loss": -28.870222091674805, "global_step": 20549, "epoch": 169} {"train_loss": -29.303577423095703, "global_step": 20550, "epoch": 169} {"train_loss": -29.305322647094727, "global_step": 20551, "epoch": 169} {"train_loss": -29.35053825378418, "global_step": 20552, "epoch": 169} {"train_loss": -28.39630699157715, "global_step": 20553, "epoch": 169} {"train_loss": -26.038694381713867, "global_step": 20554, "epoch": 169} {"train_loss": -26.063907623291016, "global_step": 20555, "epoch": 169} {"train_loss": -27.303909301757812, "global_step": 20556, "epoch": 169} {"train_loss": -29.43564796447754, "global_step": 20557, "epoch": 169} {"train_loss": -29.168792724609375, "global_step": 20558, "epoch": 169} {"train_loss": -28.27803611755371, "global_step": 20559, "epoch": 169} {"train_loss": -28.871179580688477, "global_step": 20560, "epoch": 169} {"train_loss": -29.75469970703125, "global_step": 20561, "epoch": 169} {"train_loss": -28.229135513305664, "global_step": 20562, "epoch": 169} {"train_loss": -29.01410484313965, "global_step": 20563, "epoch": 169} {"train_loss": -29.804290771484375, "global_step": 20564, "epoch": 169} {"train_loss": -29.509740829467773, "global_step": 20565, "epoch": 169} {"train_loss": -29.759815216064453, "global_step": 20566, "epoch": 169} {"train_loss": -29.40176773071289, "global_step": 20567, "epoch": 169} {"train_loss": -29.54566764831543, "global_step": 20568, "epoch": 169} {"train_loss": -29.13659822448226, "global_step": 20569, "epoch": 169, "val_loss": 2455672.75} {"train_loss": -30.013532638549805, "global_step": 20570, "epoch": 170} {"train_loss": -28.47747802734375, "global_step": 20571, "epoch": 170} {"train_loss": -29.363027572631836, "global_step": 20572, "epoch": 170} {"train_loss": -29.662296295166016, "global_step": 20573, "epoch": 170} {"train_loss": -29.11264419555664, "global_step": 20574, "epoch": 170} {"train_loss": -29.18305015563965, "global_step": 20575, "epoch": 170} {"train_loss": -29.828144073486328, "global_step": 20576, "epoch": 170} {"train_loss": -29.162525177001953, "global_step": 20577, "epoch": 170} {"train_loss": -30.004993438720703, "global_step": 20578, "epoch": 170} {"train_loss": -30.070892333984375, "global_step": 20579, "epoch": 170} {"train_loss": -29.684762954711914, "global_step": 20580, "epoch": 170} {"train_loss": -29.815954208374023, "global_step": 20581, "epoch": 170} {"train_loss": -29.7186336517334, "global_step": 20582, "epoch": 170} {"train_loss": -29.960147857666016, "global_step": 20583, "epoch": 170} {"train_loss": -29.662450790405273, "global_step": 20584, "epoch": 170} {"train_loss": -29.785444259643555, "global_step": 20585, "epoch": 170} {"train_loss": -29.660825729370117, "global_step": 20586, "epoch": 170} {"train_loss": -29.96319580078125, "global_step": 20587, "epoch": 170} {"train_loss": -29.329004287719727, "global_step": 20588, "epoch": 170} {"train_loss": -29.714447021484375, "global_step": 20589, "epoch": 170} {"train_loss": -30.402374267578125, "global_step": 20590, "epoch": 170} {"train_loss": -30.2033748626709, "global_step": 20591, "epoch": 170} {"train_loss": -30.179676055908203, "global_step": 20592, "epoch": 170} {"train_loss": -30.266706466674805, "global_step": 20593, "epoch": 170} {"train_loss": -30.17597007751465, "global_step": 20594, "epoch": 170} {"train_loss": -29.80255126953125, "global_step": 20595, "epoch": 170} {"train_loss": -29.652774810791016, "global_step": 20596, "epoch": 170} {"train_loss": -29.252197265625, "global_step": 20597, "epoch": 170} {"train_loss": -30.4136962890625, "global_step": 20598, "epoch": 170} {"train_loss": -30.152942657470703, "global_step": 20599, "epoch": 170} {"train_loss": -30.079364776611328, "global_step": 20600, "epoch": 170} {"train_loss": -30.525365829467773, "global_step": 20601, "epoch": 170} {"train_loss": -30.18023681640625, "global_step": 20602, "epoch": 170} {"train_loss": -29.997486114501953, "global_step": 20603, "epoch": 170} {"train_loss": -29.425756454467773, "global_step": 20604, "epoch": 170} {"train_loss": -29.825550079345703, "global_step": 20605, "epoch": 170} {"train_loss": -29.855854034423828, "global_step": 20606, "epoch": 170} {"train_loss": -30.070892333984375, "global_step": 20607, "epoch": 170} {"train_loss": -29.597620010375977, "global_step": 20608, "epoch": 170} {"train_loss": -28.904809951782227, "global_step": 20609, "epoch": 170} {"train_loss": -30.021503448486328, "global_step": 20610, "epoch": 170} {"train_loss": -29.19059181213379, "global_step": 20611, "epoch": 170} {"train_loss": -29.711307525634766, "global_step": 20612, "epoch": 170} {"train_loss": -29.76163673400879, "global_step": 20613, "epoch": 170} {"train_loss": -29.49579429626465, "global_step": 20614, "epoch": 170} {"train_loss": -29.792917251586914, "global_step": 20615, "epoch": 170} {"train_loss": -29.996835708618164, "global_step": 20616, "epoch": 170} {"train_loss": -29.43409538269043, "global_step": 20617, "epoch": 170} {"train_loss": -29.9354305267334, "global_step": 20618, "epoch": 170} {"train_loss": -30.02644920349121, "global_step": 20619, "epoch": 170} {"train_loss": -30.024524688720703, "global_step": 20620, "epoch": 170} {"train_loss": -29.880773544311523, "global_step": 20621, "epoch": 170} {"train_loss": -29.667484283447266, "global_step": 20622, "epoch": 170} {"train_loss": -29.990835189819336, "global_step": 20623, "epoch": 170} {"train_loss": -29.9326229095459, "global_step": 20624, "epoch": 170} {"train_loss": -28.818744659423828, "global_step": 20625, "epoch": 170} {"train_loss": -29.52158546447754, "global_step": 20626, "epoch": 170} {"train_loss": -29.514734268188477, "global_step": 20627, "epoch": 170} {"train_loss": -29.73809814453125, "global_step": 20628, "epoch": 170} {"train_loss": -29.564971923828125, "global_step": 20629, "epoch": 170} {"train_loss": -29.406091690063477, "global_step": 20630, "epoch": 170} {"train_loss": -29.725873947143555, "global_step": 20631, "epoch": 170} {"train_loss": -30.076099395751953, "global_step": 20632, "epoch": 170} {"train_loss": -29.6695556640625, "global_step": 20633, "epoch": 170} {"train_loss": -28.98383903503418, "global_step": 20634, "epoch": 170} {"train_loss": -30.14887046813965, "global_step": 20635, "epoch": 170} {"train_loss": -28.966901779174805, "global_step": 20636, "epoch": 170} {"train_loss": -28.245574951171875, "global_step": 20637, "epoch": 170} {"train_loss": -29.6527156829834, "global_step": 20638, "epoch": 170} {"train_loss": -29.728246688842773, "global_step": 20639, "epoch": 170} {"train_loss": -29.217615127563477, "global_step": 20640, "epoch": 170} {"train_loss": -30.505109786987305, "global_step": 20641, "epoch": 170} {"train_loss": -29.226398468017578, "global_step": 20642, "epoch": 170} {"train_loss": -29.902570724487305, "global_step": 20643, "epoch": 170} {"train_loss": -29.83915138244629, "global_step": 20644, "epoch": 170} {"train_loss": -30.311689376831055, "global_step": 20645, "epoch": 170} {"train_loss": -29.826704025268555, "global_step": 20646, "epoch": 170} {"train_loss": -29.892017364501953, "global_step": 20647, "epoch": 170} {"train_loss": -30.068323135375977, "global_step": 20648, "epoch": 170} {"train_loss": -29.646650314331055, "global_step": 20649, "epoch": 170} {"train_loss": -29.49077796936035, "global_step": 20650, "epoch": 170} {"train_loss": -28.215042114257812, "global_step": 20651, "epoch": 170} {"train_loss": -28.125595092773438, "global_step": 20652, "epoch": 170} {"train_loss": -26.27740478515625, "global_step": 20653, "epoch": 170} {"train_loss": -26.99004554748535, "global_step": 20654, "epoch": 170} {"train_loss": -28.10456657409668, "global_step": 20655, "epoch": 170} {"train_loss": -28.856740951538086, "global_step": 20656, "epoch": 170} {"train_loss": -29.949371337890625, "global_step": 20657, "epoch": 170} {"train_loss": -28.870065689086914, "global_step": 20658, "epoch": 170} {"train_loss": -29.24810791015625, "global_step": 20659, "epoch": 170} {"train_loss": -29.56922721862793, "global_step": 20660, "epoch": 170} {"train_loss": -29.34803581237793, "global_step": 20661, "epoch": 170} {"train_loss": -29.190631866455078, "global_step": 20662, "epoch": 170} {"train_loss": -29.793981552124023, "global_step": 20663, "epoch": 170} {"train_loss": -29.755508422851562, "global_step": 20664, "epoch": 170} {"train_loss": -29.244070053100586, "global_step": 20665, "epoch": 170} {"train_loss": -29.44717788696289, "global_step": 20666, "epoch": 170} {"train_loss": -29.7208309173584, "global_step": 20667, "epoch": 170} {"train_loss": -29.6182861328125, "global_step": 20668, "epoch": 170} {"train_loss": -29.79652214050293, "global_step": 20669, "epoch": 170} {"train_loss": -29.1175479888916, "global_step": 20670, "epoch": 170} {"train_loss": -29.681745529174805, "global_step": 20671, "epoch": 170} {"train_loss": -28.68560791015625, "global_step": 20672, "epoch": 170} {"train_loss": -29.971094131469727, "global_step": 20673, "epoch": 170} {"train_loss": -29.315027236938477, "global_step": 20674, "epoch": 170} {"train_loss": -29.02119255065918, "global_step": 20675, "epoch": 170} {"train_loss": -29.755054473876953, "global_step": 20676, "epoch": 170} {"train_loss": -29.24151611328125, "global_step": 20677, "epoch": 170} {"train_loss": -29.150482177734375, "global_step": 20678, "epoch": 170} {"train_loss": -30.0935115814209, "global_step": 20679, "epoch": 170} {"train_loss": -28.638845443725586, "global_step": 20680, "epoch": 170} {"train_loss": -29.67670249938965, "global_step": 20681, "epoch": 170} {"train_loss": -29.308109283447266, "global_step": 20682, "epoch": 170} {"train_loss": -29.31764030456543, "global_step": 20683, "epoch": 170} {"train_loss": -30.355148315429688, "global_step": 20684, "epoch": 170} {"train_loss": -30.0301570892334, "global_step": 20685, "epoch": 170} {"train_loss": -30.09990882873535, "global_step": 20686, "epoch": 170} {"train_loss": -29.9447078704834, "global_step": 20687, "epoch": 170} {"train_loss": -29.2452449798584, "global_step": 20688, "epoch": 170} {"train_loss": -29.27910804748535, "global_step": 20689, "epoch": 170} {"train_loss": -29.56809151074118, "global_step": 20690, "epoch": 170, "val_loss": 2481936.75} {"train_loss": -30.494251251220703, "global_step": 20691, "epoch": 171} {"train_loss": -29.81314468383789, "global_step": 20692, "epoch": 171} {"train_loss": -30.049840927124023, "global_step": 20693, "epoch": 171} {"train_loss": -29.631662368774414, "global_step": 20694, "epoch": 171} {"train_loss": -30.443918228149414, "global_step": 20695, "epoch": 171} {"train_loss": -30.34858512878418, "global_step": 20696, "epoch": 171} {"train_loss": -30.339859008789062, "global_step": 20697, "epoch": 171} {"train_loss": -29.729650497436523, "global_step": 20698, "epoch": 171} {"train_loss": -29.83233642578125, "global_step": 20699, "epoch": 171} {"train_loss": -30.07233238220215, "global_step": 20700, "epoch": 171} {"train_loss": -30.597944259643555, "global_step": 20701, "epoch": 171} {"train_loss": -30.68073081970215, "global_step": 20702, "epoch": 171} {"train_loss": -30.14743995666504, "global_step": 20703, "epoch": 171} {"train_loss": -30.562082290649414, "global_step": 20704, "epoch": 171} {"train_loss": -30.58771324157715, "global_step": 20705, "epoch": 171} {"train_loss": -30.814666748046875, "global_step": 20706, "epoch": 171} {"train_loss": -30.68281364440918, "global_step": 20707, "epoch": 171} {"train_loss": -30.712987899780273, "global_step": 20708, "epoch": 171} {"train_loss": -30.5764217376709, "global_step": 20709, "epoch": 171} {"train_loss": -30.46546745300293, "global_step": 20710, "epoch": 171} {"train_loss": -30.862842559814453, "global_step": 20711, "epoch": 171} {"train_loss": -30.251081466674805, "global_step": 20712, "epoch": 171} {"train_loss": -30.759923934936523, "global_step": 20713, "epoch": 171} {"train_loss": -30.435300827026367, "global_step": 20714, "epoch": 171} {"train_loss": -30.4384708404541, "global_step": 20715, "epoch": 171} {"train_loss": -30.33283805847168, "global_step": 20716, "epoch": 171} {"train_loss": -30.61628532409668, "global_step": 20717, "epoch": 171} {"train_loss": -30.759521484375, "global_step": 20718, "epoch": 171} {"train_loss": -30.35975456237793, "global_step": 20719, "epoch": 171} {"train_loss": -30.591907501220703, "global_step": 20720, "epoch": 171} {"train_loss": -30.380767822265625, "global_step": 20721, "epoch": 171} {"train_loss": -30.684528350830078, "global_step": 20722, "epoch": 171} {"train_loss": -29.975671768188477, "global_step": 20723, "epoch": 171} {"train_loss": -29.361547470092773, "global_step": 20724, "epoch": 171} {"train_loss": -27.737268447875977, "global_step": 20725, "epoch": 171} {"train_loss": -24.787084579467773, "global_step": 20726, "epoch": 171} {"train_loss": -24.60243797302246, "global_step": 20727, "epoch": 171} {"train_loss": -28.621906280517578, "global_step": 20728, "epoch": 171} {"train_loss": -28.690109252929688, "global_step": 20729, "epoch": 171} {"train_loss": -25.476911544799805, "global_step": 20730, "epoch": 171} {"train_loss": -29.219541549682617, "global_step": 20731, "epoch": 171} {"train_loss": -27.97967529296875, "global_step": 20732, "epoch": 171} {"train_loss": -28.514450073242188, "global_step": 20733, "epoch": 171} {"train_loss": -28.188568115234375, "global_step": 20734, "epoch": 171} {"train_loss": -28.60515785217285, "global_step": 20735, "epoch": 171} {"train_loss": -29.266021728515625, "global_step": 20736, "epoch": 171} {"train_loss": -29.52656364440918, "global_step": 20737, "epoch": 171} {"train_loss": -28.435749053955078, "global_step": 20738, "epoch": 171} {"train_loss": -28.8445987701416, "global_step": 20739, "epoch": 171} {"train_loss": -29.68890953063965, "global_step": 20740, "epoch": 171} {"train_loss": -28.984516143798828, "global_step": 20741, "epoch": 171} {"train_loss": -29.035266876220703, "global_step": 20742, "epoch": 171} {"train_loss": -29.629348754882812, "global_step": 20743, "epoch": 171} {"train_loss": -29.735631942749023, "global_step": 20744, "epoch": 171} {"train_loss": -29.6148681640625, "global_step": 20745, "epoch": 171} {"train_loss": -28.708459854125977, "global_step": 20746, "epoch": 171} {"train_loss": -29.218402862548828, "global_step": 20747, "epoch": 171} {"train_loss": -29.31277847290039, "global_step": 20748, "epoch": 171} {"train_loss": -29.44614601135254, "global_step": 20749, "epoch": 171} {"train_loss": -28.80133628845215, "global_step": 20750, "epoch": 171} {"train_loss": -27.79144859313965, "global_step": 20751, "epoch": 171} {"train_loss": -26.684803009033203, "global_step": 20752, "epoch": 171} {"train_loss": -26.078327178955078, "global_step": 20753, "epoch": 171} {"train_loss": -28.1029052734375, "global_step": 20754, "epoch": 171} {"train_loss": -28.487503051757812, "global_step": 20755, "epoch": 171} {"train_loss": -29.045551300048828, "global_step": 20756, "epoch": 171} {"train_loss": -28.436399459838867, "global_step": 20757, "epoch": 171} {"train_loss": -29.24395179748535, "global_step": 20758, "epoch": 171} {"train_loss": -29.51969337463379, "global_step": 20759, "epoch": 171} {"train_loss": -29.483274459838867, "global_step": 20760, "epoch": 171} {"train_loss": -29.307632446289062, "global_step": 20761, "epoch": 171} {"train_loss": -29.90174674987793, "global_step": 20762, "epoch": 171} {"train_loss": -29.720813751220703, "global_step": 20763, "epoch": 171} {"train_loss": -29.76483154296875, "global_step": 20764, "epoch": 171} {"train_loss": -29.7122802734375, "global_step": 20765, "epoch": 171} {"train_loss": -29.423002243041992, "global_step": 20766, "epoch": 171} {"train_loss": -29.38276481628418, "global_step": 20767, "epoch": 171} {"train_loss": -29.971357345581055, "global_step": 20768, "epoch": 171} {"train_loss": -29.914886474609375, "global_step": 20769, "epoch": 171} {"train_loss": -29.70636558532715, "global_step": 20770, "epoch": 171} {"train_loss": -29.971607208251953, "global_step": 20771, "epoch": 171} {"train_loss": -30.1082763671875, "global_step": 20772, "epoch": 171} {"train_loss": -30.091373443603516, "global_step": 20773, "epoch": 171} {"train_loss": -29.746259689331055, "global_step": 20774, "epoch": 171} {"train_loss": -30.0053653717041, "global_step": 20775, "epoch": 171} {"train_loss": -29.691625595092773, "global_step": 20776, "epoch": 171} {"train_loss": -30.3516902923584, "global_step": 20777, "epoch": 171} {"train_loss": -30.295358657836914, "global_step": 20778, "epoch": 171} {"train_loss": -30.092161178588867, "global_step": 20779, "epoch": 171} {"train_loss": -30.11090087890625, "global_step": 20780, "epoch": 171} {"train_loss": -29.961566925048828, "global_step": 20781, "epoch": 171} {"train_loss": -30.39435386657715, "global_step": 20782, "epoch": 171} {"train_loss": -29.781036376953125, "global_step": 20783, "epoch": 171} {"train_loss": -29.130990982055664, "global_step": 20784, "epoch": 171} {"train_loss": -29.796417236328125, "global_step": 20785, "epoch": 171} {"train_loss": -30.08323097229004, "global_step": 20786, "epoch": 171} {"train_loss": -29.60393714904785, "global_step": 20787, "epoch": 171} {"train_loss": -29.949939727783203, "global_step": 20788, "epoch": 171} {"train_loss": -30.1660099029541, "global_step": 20789, "epoch": 171} {"train_loss": -30.023029327392578, "global_step": 20790, "epoch": 171} {"train_loss": -30.22951316833496, "global_step": 20791, "epoch": 171} {"train_loss": -30.178632736206055, "global_step": 20792, "epoch": 171} {"train_loss": -30.23895835876465, "global_step": 20793, "epoch": 171} {"train_loss": -30.308490753173828, "global_step": 20794, "epoch": 171} {"train_loss": -29.877887725830078, "global_step": 20795, "epoch": 171} {"train_loss": -30.3842830657959, "global_step": 20796, "epoch": 171} {"train_loss": -30.371252059936523, "global_step": 20797, "epoch": 171} {"train_loss": -30.198652267456055, "global_step": 20798, "epoch": 171} {"train_loss": -29.450971603393555, "global_step": 20799, "epoch": 171} {"train_loss": -28.890369415283203, "global_step": 20800, "epoch": 171} {"train_loss": -30.20182228088379, "global_step": 20801, "epoch": 171} {"train_loss": -29.68191909790039, "global_step": 20802, "epoch": 171} {"train_loss": -30.303709030151367, "global_step": 20803, "epoch": 171} {"train_loss": -30.3704891204834, "global_step": 20804, "epoch": 171} {"train_loss": -30.55084800720215, "global_step": 20805, "epoch": 171} {"train_loss": -30.065582275390625, "global_step": 20806, "epoch": 171} {"train_loss": -30.687204360961914, "global_step": 20807, "epoch": 171} {"train_loss": -30.5191650390625, "global_step": 20808, "epoch": 171} {"train_loss": -30.44968605041504, "global_step": 20809, "epoch": 171} {"train_loss": -30.651288986206055, "global_step": 20810, "epoch": 171} {"train_loss": -29.6329669164232, "global_step": 20811, "epoch": 171, "val_loss": 2494272.25} {"train_loss": -29.4197998046875, "global_step": 20812, "epoch": 172} {"train_loss": -29.621442794799805, "global_step": 20813, "epoch": 172} {"train_loss": -29.659971237182617, "global_step": 20814, "epoch": 172} {"train_loss": -29.368330001831055, "global_step": 20815, "epoch": 172} {"train_loss": -29.357812881469727, "global_step": 20816, "epoch": 172} {"train_loss": -30.12908935546875, "global_step": 20817, "epoch": 172} {"train_loss": -29.92136001586914, "global_step": 20818, "epoch": 172} {"train_loss": -30.032514572143555, "global_step": 20819, "epoch": 172} {"train_loss": -28.190876007080078, "global_step": 20820, "epoch": 172} {"train_loss": -27.370908737182617, "global_step": 20821, "epoch": 172} {"train_loss": -27.149438858032227, "global_step": 20822, "epoch": 172} {"train_loss": -28.6337890625, "global_step": 20823, "epoch": 172} {"train_loss": -30.014301300048828, "global_step": 20824, "epoch": 172} {"train_loss": -29.505823135375977, "global_step": 20825, "epoch": 172} {"train_loss": -27.935022354125977, "global_step": 20826, "epoch": 172} {"train_loss": -27.682239532470703, "global_step": 20827, "epoch": 172} {"train_loss": -29.243078231811523, "global_step": 20828, "epoch": 172} {"train_loss": -30.168750762939453, "global_step": 20829, "epoch": 172} {"train_loss": -27.9782772064209, "global_step": 20830, "epoch": 172} {"train_loss": -28.45538902282715, "global_step": 20831, "epoch": 172} {"train_loss": -30.66460609436035, "global_step": 20832, "epoch": 172} {"train_loss": -28.64556312561035, "global_step": 20833, "epoch": 172} {"train_loss": -29.058395385742188, "global_step": 20834, "epoch": 172} {"train_loss": -30.317907333374023, "global_step": 20835, "epoch": 172} {"train_loss": -29.129318237304688, "global_step": 20836, "epoch": 172} {"train_loss": -30.61417007446289, "global_step": 20837, "epoch": 172} {"train_loss": -28.66572380065918, "global_step": 20838, "epoch": 172} {"train_loss": -29.815160751342773, "global_step": 20839, "epoch": 172} {"train_loss": -30.44761085510254, "global_step": 20840, "epoch": 172} {"train_loss": -29.31074333190918, "global_step": 20841, "epoch": 172} {"train_loss": -30.369720458984375, "global_step": 20842, "epoch": 172} {"train_loss": -29.766305923461914, "global_step": 20843, "epoch": 172} {"train_loss": -30.188297271728516, "global_step": 20844, "epoch": 172} {"train_loss": -30.112470626831055, "global_step": 20845, "epoch": 172} {"train_loss": -30.4191837310791, "global_step": 20846, "epoch": 172} {"train_loss": -30.194875717163086, "global_step": 20847, "epoch": 172} {"train_loss": -30.594711303710938, "global_step": 20848, "epoch": 172} {"train_loss": -30.04066276550293, "global_step": 20849, "epoch": 172} {"train_loss": -30.73042106628418, "global_step": 20850, "epoch": 172} {"train_loss": -30.429285049438477, "global_step": 20851, "epoch": 172} {"train_loss": -29.906789779663086, "global_step": 20852, "epoch": 172} {"train_loss": -30.374235153198242, "global_step": 20853, "epoch": 172} {"train_loss": -30.852384567260742, "global_step": 20854, "epoch": 172} {"train_loss": -29.468366622924805, "global_step": 20855, "epoch": 172} {"train_loss": -30.2570858001709, "global_step": 20856, "epoch": 172} {"train_loss": -29.26679039001465, "global_step": 20857, "epoch": 172} {"train_loss": -27.86456298828125, "global_step": 20858, "epoch": 172} {"train_loss": -26.804676055908203, "global_step": 20859, "epoch": 172} {"train_loss": -30.110010147094727, "global_step": 20860, "epoch": 172} {"train_loss": -28.572996139526367, "global_step": 20861, "epoch": 172} {"train_loss": -28.41242790222168, "global_step": 20862, "epoch": 172} {"train_loss": -24.568105697631836, "global_step": 20863, "epoch": 172} {"train_loss": -26.78040885925293, "global_step": 20864, "epoch": 172} {"train_loss": -28.6126651763916, "global_step": 20865, "epoch": 172} {"train_loss": -29.279523849487305, "global_step": 20866, "epoch": 172} {"train_loss": -27.661121368408203, "global_step": 20867, "epoch": 172} {"train_loss": -27.647306442260742, "global_step": 20868, "epoch": 172} {"train_loss": -29.645299911499023, "global_step": 20869, "epoch": 172} {"train_loss": -28.867279052734375, "global_step": 20870, "epoch": 172} {"train_loss": -30.07183265686035, "global_step": 20871, "epoch": 172} {"train_loss": -29.0000057220459, "global_step": 20872, "epoch": 172} {"train_loss": -30.18902587890625, "global_step": 20873, "epoch": 172} {"train_loss": -29.57521629333496, "global_step": 20874, "epoch": 172} {"train_loss": -30.1812686920166, "global_step": 20875, "epoch": 172} {"train_loss": -29.622589111328125, "global_step": 20876, "epoch": 172} {"train_loss": -29.7158203125, "global_step": 20877, "epoch": 172} {"train_loss": -30.060779571533203, "global_step": 20878, "epoch": 172} {"train_loss": -29.35230827331543, "global_step": 20879, "epoch": 172} {"train_loss": -29.998462677001953, "global_step": 20880, "epoch": 172} {"train_loss": -29.451984405517578, "global_step": 20881, "epoch": 172} {"train_loss": -30.05475425720215, "global_step": 20882, "epoch": 172} {"train_loss": -29.733829498291016, "global_step": 20883, "epoch": 172} {"train_loss": -29.31637954711914, "global_step": 20884, "epoch": 172} {"train_loss": -29.517353057861328, "global_step": 20885, "epoch": 172} {"train_loss": -29.921247482299805, "global_step": 20886, "epoch": 172} {"train_loss": -29.4005184173584, "global_step": 20887, "epoch": 172} {"train_loss": -30.308368682861328, "global_step": 20888, "epoch": 172} {"train_loss": -29.825483322143555, "global_step": 20889, "epoch": 172} {"train_loss": -30.180387496948242, "global_step": 20890, "epoch": 172} {"train_loss": -29.499120712280273, "global_step": 20891, "epoch": 172} {"train_loss": -30.100666046142578, "global_step": 20892, "epoch": 172} {"train_loss": -30.029956817626953, "global_step": 20893, "epoch": 172} {"train_loss": -29.992294311523438, "global_step": 20894, "epoch": 172} {"train_loss": -30.0867862701416, "global_step": 20895, "epoch": 172} {"train_loss": -30.294940948486328, "global_step": 20896, "epoch": 172} {"train_loss": -29.98406410217285, "global_step": 20897, "epoch": 172} {"train_loss": -29.491865158081055, "global_step": 20898, "epoch": 172} {"train_loss": -28.5454044342041, "global_step": 20899, "epoch": 172} {"train_loss": -27.32317543029785, "global_step": 20900, "epoch": 172} {"train_loss": -26.954059600830078, "global_step": 20901, "epoch": 172} {"train_loss": -29.284460067749023, "global_step": 20902, "epoch": 172} {"train_loss": -29.913410186767578, "global_step": 20903, "epoch": 172} {"train_loss": -27.269580841064453, "global_step": 20904, "epoch": 172} {"train_loss": -28.795093536376953, "global_step": 20905, "epoch": 172} {"train_loss": -30.131214141845703, "global_step": 20906, "epoch": 172} {"train_loss": -27.951765060424805, "global_step": 20907, "epoch": 172} {"train_loss": -30.13970947265625, "global_step": 20908, "epoch": 172} {"train_loss": -29.437458038330078, "global_step": 20909, "epoch": 172} {"train_loss": -29.00275993347168, "global_step": 20910, "epoch": 172} {"train_loss": -30.0072078704834, "global_step": 20911, "epoch": 172} {"train_loss": -29.488752365112305, "global_step": 20912, "epoch": 172} {"train_loss": -30.14468765258789, "global_step": 20913, "epoch": 172} {"train_loss": -30.020751953125, "global_step": 20914, "epoch": 172} {"train_loss": -30.02186393737793, "global_step": 20915, "epoch": 172} {"train_loss": -30.12151527404785, "global_step": 20916, "epoch": 172} {"train_loss": -30.173017501831055, "global_step": 20917, "epoch": 172} {"train_loss": -30.153615951538086, "global_step": 20918, "epoch": 172} {"train_loss": -30.073530197143555, "global_step": 20919, "epoch": 172} {"train_loss": -30.284412384033203, "global_step": 20920, "epoch": 172} {"train_loss": -30.32404136657715, "global_step": 20921, "epoch": 172} {"train_loss": -30.665180206298828, "global_step": 20922, "epoch": 172} {"train_loss": -30.299102783203125, "global_step": 20923, "epoch": 172} {"train_loss": -29.980487823486328, "global_step": 20924, "epoch": 172} {"train_loss": -30.77349281311035, "global_step": 20925, "epoch": 172} {"train_loss": -30.02894401550293, "global_step": 20926, "epoch": 172} {"train_loss": -30.27667808532715, "global_step": 20927, "epoch": 172} {"train_loss": -30.027135848999023, "global_step": 20928, "epoch": 172} {"train_loss": -30.56276512145996, "global_step": 20929, "epoch": 172} {"train_loss": -29.94648551940918, "global_step": 20930, "epoch": 172} {"train_loss": -29.825153350830078, "global_step": 20931, "epoch": 172} {"train_loss": -29.478343333094575, "global_step": 20932, "epoch": 172, "val_loss": 2527705.25} {"train_loss": -30.049976348876953, "global_step": 20933, "epoch": 173} {"train_loss": -29.46051025390625, "global_step": 20934, "epoch": 173} {"train_loss": -29.849821090698242, "global_step": 20935, "epoch": 173} {"train_loss": -30.62578773498535, "global_step": 20936, "epoch": 173} {"train_loss": -29.67945671081543, "global_step": 20937, "epoch": 173} {"train_loss": -28.222091674804688, "global_step": 20938, "epoch": 173} {"train_loss": -28.97639274597168, "global_step": 20939, "epoch": 173} {"train_loss": -29.609975814819336, "global_step": 20940, "epoch": 173} {"train_loss": -30.444656372070312, "global_step": 20941, "epoch": 173} {"train_loss": -30.16451072692871, "global_step": 20942, "epoch": 173} {"train_loss": -29.591238021850586, "global_step": 20943, "epoch": 173} {"train_loss": -29.966123580932617, "global_step": 20944, "epoch": 173} {"train_loss": -29.617233276367188, "global_step": 20945, "epoch": 173} {"train_loss": -29.7308349609375, "global_step": 20946, "epoch": 173} {"train_loss": -29.22443962097168, "global_step": 20947, "epoch": 173} {"train_loss": -30.09490394592285, "global_step": 20948, "epoch": 173} {"train_loss": -30.207983016967773, "global_step": 20949, "epoch": 173} {"train_loss": -29.626672744750977, "global_step": 20950, "epoch": 173} {"train_loss": -29.898035049438477, "global_step": 20951, "epoch": 173} {"train_loss": -29.960235595703125, "global_step": 20952, "epoch": 173} {"train_loss": -29.996923446655273, "global_step": 20953, "epoch": 173} {"train_loss": -29.771055221557617, "global_step": 20954, "epoch": 173} {"train_loss": -30.044635772705078, "global_step": 20955, "epoch": 173} {"train_loss": -29.469024658203125, "global_step": 20956, "epoch": 173} {"train_loss": -29.89371681213379, "global_step": 20957, "epoch": 173} {"train_loss": -30.025190353393555, "global_step": 20958, "epoch": 173} {"train_loss": -29.426456451416016, "global_step": 20959, "epoch": 173} {"train_loss": -30.343326568603516, "global_step": 20960, "epoch": 173} {"train_loss": -29.796918869018555, "global_step": 20961, "epoch": 173} {"train_loss": -28.790136337280273, "global_step": 20962, "epoch": 173} {"train_loss": -27.715290069580078, "global_step": 20963, "epoch": 173} {"train_loss": -19.857534408569336, "global_step": 20964, "epoch": 173} {"train_loss": -9.487226486206055, "global_step": 20965, "epoch": 173} {"train_loss": -11.753060340881348, "global_step": 20966, "epoch": 173} {"train_loss": -28.496118545532227, "global_step": 20967, "epoch": 173} {"train_loss": -20.954124450683594, "global_step": 20968, "epoch": 173} {"train_loss": -25.900793075561523, "global_step": 20969, "epoch": 173} {"train_loss": -28.428430557250977, "global_step": 20970, "epoch": 173} {"train_loss": -24.94394302368164, "global_step": 20971, "epoch": 173} {"train_loss": -26.25736427307129, "global_step": 20972, "epoch": 173} {"train_loss": -28.831562042236328, "global_step": 20973, "epoch": 173} {"train_loss": -28.533496856689453, "global_step": 20974, "epoch": 173} {"train_loss": -28.05356216430664, "global_step": 20975, "epoch": 173} {"train_loss": -27.27518081665039, "global_step": 20976, "epoch": 173} {"train_loss": -27.97027015686035, "global_step": 20977, "epoch": 173} {"train_loss": -28.111942291259766, "global_step": 20978, "epoch": 173} {"train_loss": -29.041168212890625, "global_step": 20979, "epoch": 173} {"train_loss": -28.092208862304688, "global_step": 20980, "epoch": 173} {"train_loss": -28.9143123626709, "global_step": 20981, "epoch": 173} {"train_loss": -29.01761245727539, "global_step": 20982, "epoch": 173} {"train_loss": -28.81648063659668, "global_step": 20983, "epoch": 173} {"train_loss": -28.2779483795166, "global_step": 20984, "epoch": 173} {"train_loss": -28.813928604125977, "global_step": 20985, "epoch": 173} {"train_loss": -28.454517364501953, "global_step": 20986, "epoch": 173} {"train_loss": -29.279172897338867, "global_step": 20987, "epoch": 173} {"train_loss": -28.73798179626465, "global_step": 20988, "epoch": 173} {"train_loss": -29.01491355895996, "global_step": 20989, "epoch": 173} {"train_loss": -28.989492416381836, "global_step": 20990, "epoch": 173} {"train_loss": -29.74319839477539, "global_step": 20991, "epoch": 173} {"train_loss": -28.89544677734375, "global_step": 20992, "epoch": 173} {"train_loss": -29.319860458374023, "global_step": 20993, "epoch": 173} {"train_loss": -28.84303092956543, "global_step": 20994, "epoch": 173} {"train_loss": -29.231069564819336, "global_step": 20995, "epoch": 173} {"train_loss": -28.93398094177246, "global_step": 20996, "epoch": 173} {"train_loss": -29.09319496154785, "global_step": 20997, "epoch": 173} {"train_loss": -29.355976104736328, "global_step": 20998, "epoch": 173} {"train_loss": -29.61500358581543, "global_step": 20999, "epoch": 173} {"train_loss": -29.40616798400879, "global_step": 21000, "epoch": 173} {"train_loss": -29.466474533081055, "global_step": 21001, "epoch": 173} {"train_loss": -29.58283042907715, "global_step": 21002, "epoch": 173} {"train_loss": -29.531341552734375, "global_step": 21003, "epoch": 173} {"train_loss": -29.251605987548828, "global_step": 21004, "epoch": 173} {"train_loss": -30.136890411376953, "global_step": 21005, "epoch": 173} {"train_loss": -29.90850830078125, "global_step": 21006, "epoch": 173} {"train_loss": -29.863327026367188, "global_step": 21007, "epoch": 173} {"train_loss": -29.668333053588867, "global_step": 21008, "epoch": 173} {"train_loss": -29.205942153930664, "global_step": 21009, "epoch": 173} {"train_loss": -30.016183853149414, "global_step": 21010, "epoch": 173} {"train_loss": -29.91177749633789, "global_step": 21011, "epoch": 173} {"train_loss": -30.029926300048828, "global_step": 21012, "epoch": 173} {"train_loss": -28.914243698120117, "global_step": 21013, "epoch": 173} {"train_loss": -29.083555221557617, "global_step": 21014, "epoch": 173} {"train_loss": -30.04876136779785, "global_step": 21015, "epoch": 173} {"train_loss": -30.05279541015625, "global_step": 21016, "epoch": 173} {"train_loss": -29.939184188842773, "global_step": 21017, "epoch": 173} {"train_loss": -29.88483238220215, "global_step": 21018, "epoch": 173} {"train_loss": -30.1987247467041, "global_step": 21019, "epoch": 173} {"train_loss": -29.718799591064453, "global_step": 21020, "epoch": 173} {"train_loss": -29.99424171447754, "global_step": 21021, "epoch": 173} {"train_loss": -29.642114639282227, "global_step": 21022, "epoch": 173} {"train_loss": -30.16202163696289, "global_step": 21023, "epoch": 173} {"train_loss": -29.31186294555664, "global_step": 21024, "epoch": 173} {"train_loss": -29.330488204956055, "global_step": 21025, "epoch": 173} {"train_loss": -29.503210067749023, "global_step": 21026, "epoch": 173} {"train_loss": -29.802820205688477, "global_step": 21027, "epoch": 173} {"train_loss": -29.815139770507812, "global_step": 21028, "epoch": 173} {"train_loss": -29.963117599487305, "global_step": 21029, "epoch": 173} {"train_loss": -28.660751342773438, "global_step": 21030, "epoch": 173} {"train_loss": -28.66037940979004, "global_step": 21031, "epoch": 173} {"train_loss": -29.43760108947754, "global_step": 21032, "epoch": 173} {"train_loss": -29.418020248413086, "global_step": 21033, "epoch": 173} {"train_loss": -29.957754135131836, "global_step": 21034, "epoch": 173} {"train_loss": -29.459619522094727, "global_step": 21035, "epoch": 173} {"train_loss": -28.967361450195312, "global_step": 21036, "epoch": 173} {"train_loss": -28.48084831237793, "global_step": 21037, "epoch": 173} {"train_loss": -29.076892852783203, "global_step": 21038, "epoch": 173} {"train_loss": -29.78498649597168, "global_step": 21039, "epoch": 173} {"train_loss": -29.112409591674805, "global_step": 21040, "epoch": 173} {"train_loss": -28.731958389282227, "global_step": 21041, "epoch": 173} {"train_loss": -27.869831085205078, "global_step": 21042, "epoch": 173} {"train_loss": -27.209909439086914, "global_step": 21043, "epoch": 173} {"train_loss": -25.826581954956055, "global_step": 21044, "epoch": 173} {"train_loss": -26.669164657592773, "global_step": 21045, "epoch": 173} {"train_loss": -27.90167236328125, "global_step": 21046, "epoch": 173} {"train_loss": -28.623640060424805, "global_step": 21047, "epoch": 173} {"train_loss": -28.43747329711914, "global_step": 21048, "epoch": 173} {"train_loss": -29.05051040649414, "global_step": 21049, "epoch": 173} {"train_loss": -29.482650756835938, "global_step": 21050, "epoch": 173} {"train_loss": -29.25510597229004, "global_step": 21051, "epoch": 173} {"train_loss": -29.065603256225586, "global_step": 21052, "epoch": 173} {"train_loss": -28.70342781918108, "global_step": 21053, "epoch": 173, "val_loss": 2821841.25} {"train_loss": -29.737659454345703, "global_step": 21054, "epoch": 174} {"train_loss": -29.212345123291016, "global_step": 21055, "epoch": 174} {"train_loss": -28.978845596313477, "global_step": 21056, "epoch": 174} {"train_loss": -29.20644187927246, "global_step": 21057, "epoch": 174} {"train_loss": -29.832229614257812, "global_step": 21058, "epoch": 174} {"train_loss": -28.46992301940918, "global_step": 21059, "epoch": 174} {"train_loss": -30.021947860717773, "global_step": 21060, "epoch": 174} {"train_loss": -29.06580924987793, "global_step": 21061, "epoch": 174} {"train_loss": -29.180089950561523, "global_step": 21062, "epoch": 174} {"train_loss": -29.939258575439453, "global_step": 21063, "epoch": 174} {"train_loss": -28.977216720581055, "global_step": 21064, "epoch": 174} {"train_loss": -30.064374923706055, "global_step": 21065, "epoch": 174} {"train_loss": -29.409772872924805, "global_step": 21066, "epoch": 174} {"train_loss": -29.334360122680664, "global_step": 21067, "epoch": 174} {"train_loss": -29.924407958984375, "global_step": 21068, "epoch": 174} {"train_loss": -29.383752822875977, "global_step": 21069, "epoch": 174} {"train_loss": -29.162189483642578, "global_step": 21070, "epoch": 174} {"train_loss": -29.010028839111328, "global_step": 21071, "epoch": 174} {"train_loss": -29.6439208984375, "global_step": 21072, "epoch": 174} {"train_loss": -28.804677963256836, "global_step": 21073, "epoch": 174} {"train_loss": -29.626386642456055, "global_step": 21074, "epoch": 174} {"train_loss": -29.371601104736328, "global_step": 21075, "epoch": 174} {"train_loss": -29.605453491210938, "global_step": 21076, "epoch": 174} {"train_loss": -29.899402618408203, "global_step": 21077, "epoch": 174} {"train_loss": -29.667236328125, "global_step": 21078, "epoch": 174} {"train_loss": -29.509199142456055, "global_step": 21079, "epoch": 174} {"train_loss": -30.199926376342773, "global_step": 21080, "epoch": 174} {"train_loss": -29.876483917236328, "global_step": 21081, "epoch": 174} {"train_loss": -29.784509658813477, "global_step": 21082, "epoch": 174} {"train_loss": -29.350244522094727, "global_step": 21083, "epoch": 174} {"train_loss": -29.66385269165039, "global_step": 21084, "epoch": 174} {"train_loss": -30.107519149780273, "global_step": 21085, "epoch": 174} {"train_loss": -29.838464736938477, "global_step": 21086, "epoch": 174} {"train_loss": -29.98207664489746, "global_step": 21087, "epoch": 174} {"train_loss": -30.008474349975586, "global_step": 21088, "epoch": 174} {"train_loss": -30.105518341064453, "global_step": 21089, "epoch": 174} {"train_loss": -30.045642852783203, "global_step": 21090, "epoch": 174} {"train_loss": -30.13983154296875, "global_step": 21091, "epoch": 174} {"train_loss": -30.1014461517334, "global_step": 21092, "epoch": 174} {"train_loss": -30.016265869140625, "global_step": 21093, "epoch": 174} {"train_loss": -30.14557456970215, "global_step": 21094, "epoch": 174} {"train_loss": -29.87824058532715, "global_step": 21095, "epoch": 174} {"train_loss": -30.032529830932617, "global_step": 21096, "epoch": 174} {"train_loss": -30.146121978759766, "global_step": 21097, "epoch": 174} {"train_loss": -30.231977462768555, "global_step": 21098, "epoch": 174} {"train_loss": -30.327543258666992, "global_step": 21099, "epoch": 174} {"train_loss": -30.059967041015625, "global_step": 21100, "epoch": 174} {"train_loss": -29.890735626220703, "global_step": 21101, "epoch": 174} {"train_loss": -30.239063262939453, "global_step": 21102, "epoch": 174} {"train_loss": -29.651599884033203, "global_step": 21103, "epoch": 174} {"train_loss": -29.632221221923828, "global_step": 21104, "epoch": 174} {"train_loss": -29.735122680664062, "global_step": 21105, "epoch": 174} {"train_loss": -30.128461837768555, "global_step": 21106, "epoch": 174} {"train_loss": -29.937875747680664, "global_step": 21107, "epoch": 174} {"train_loss": -30.431982040405273, "global_step": 21108, "epoch": 174} {"train_loss": -29.920352935791016, "global_step": 21109, "epoch": 174} {"train_loss": -29.929853439331055, "global_step": 21110, "epoch": 174} {"train_loss": -29.260602951049805, "global_step": 21111, "epoch": 174} {"train_loss": -29.671100616455078, "global_step": 21112, "epoch": 174} {"train_loss": -29.47881507873535, "global_step": 21113, "epoch": 174} {"train_loss": -29.18732261657715, "global_step": 21114, "epoch": 174} {"train_loss": -28.76666831970215, "global_step": 21115, "epoch": 174} {"train_loss": -28.178638458251953, "global_step": 21116, "epoch": 174} {"train_loss": -29.28167152404785, "global_step": 21117, "epoch": 174} {"train_loss": -29.7708683013916, "global_step": 21118, "epoch": 174} {"train_loss": -28.766035079956055, "global_step": 21119, "epoch": 174} {"train_loss": -28.551977157592773, "global_step": 21120, "epoch": 174} {"train_loss": -28.81979751586914, "global_step": 21121, "epoch": 174} {"train_loss": -29.6400146484375, "global_step": 21122, "epoch": 174} {"train_loss": -29.991674423217773, "global_step": 21123, "epoch": 174} {"train_loss": -29.552392959594727, "global_step": 21124, "epoch": 174} {"train_loss": -29.57806968688965, "global_step": 21125, "epoch": 174} {"train_loss": -29.6608943939209, "global_step": 21126, "epoch": 174} {"train_loss": -29.742572784423828, "global_step": 21127, "epoch": 174} {"train_loss": -28.637182235717773, "global_step": 21128, "epoch": 174} {"train_loss": -30.0782470703125, "global_step": 21129, "epoch": 174} {"train_loss": -30.433805465698242, "global_step": 21130, "epoch": 174} {"train_loss": -29.369903564453125, "global_step": 21131, "epoch": 174} {"train_loss": -27.518728256225586, "global_step": 21132, "epoch": 174} {"train_loss": -27.780813217163086, "global_step": 21133, "epoch": 174} {"train_loss": -29.7113037109375, "global_step": 21134, "epoch": 174} {"train_loss": -29.74122428894043, "global_step": 21135, "epoch": 174} {"train_loss": -29.176366806030273, "global_step": 21136, "epoch": 174} {"train_loss": -29.729358673095703, "global_step": 21137, "epoch": 174} {"train_loss": -29.081424713134766, "global_step": 21138, "epoch": 174} {"train_loss": -28.79365348815918, "global_step": 21139, "epoch": 174} {"train_loss": -29.4996337890625, "global_step": 21140, "epoch": 174} {"train_loss": -29.769437789916992, "global_step": 21141, "epoch": 174} {"train_loss": -29.692235946655273, "global_step": 21142, "epoch": 174} {"train_loss": -30.014379501342773, "global_step": 21143, "epoch": 174} {"train_loss": -30.313196182250977, "global_step": 21144, "epoch": 174} {"train_loss": -30.6044864654541, "global_step": 21145, "epoch": 174} {"train_loss": -30.0783748626709, "global_step": 21146, "epoch": 174} {"train_loss": -30.161853790283203, "global_step": 21147, "epoch": 174} {"train_loss": -30.283117294311523, "global_step": 21148, "epoch": 174} {"train_loss": -30.319482803344727, "global_step": 21149, "epoch": 174} {"train_loss": -30.39571189880371, "global_step": 21150, "epoch": 174} {"train_loss": -30.073514938354492, "global_step": 21151, "epoch": 174} {"train_loss": -30.151885986328125, "global_step": 21152, "epoch": 174} {"train_loss": -30.2701473236084, "global_step": 21153, "epoch": 174} {"train_loss": -30.473663330078125, "global_step": 21154, "epoch": 174} {"train_loss": -30.373239517211914, "global_step": 21155, "epoch": 174} {"train_loss": -30.273193359375, "global_step": 21156, "epoch": 174} {"train_loss": -30.517948150634766, "global_step": 21157, "epoch": 174} {"train_loss": -30.678152084350586, "global_step": 21158, "epoch": 174} {"train_loss": -30.908414840698242, "global_step": 21159, "epoch": 174} {"train_loss": -30.367109298706055, "global_step": 21160, "epoch": 174} {"train_loss": -30.7652530670166, "global_step": 21161, "epoch": 174} {"train_loss": -30.531179428100586, "global_step": 21162, "epoch": 174} {"train_loss": -30.225955963134766, "global_step": 21163, "epoch": 174} {"train_loss": -30.485248565673828, "global_step": 21164, "epoch": 174} {"train_loss": -30.269134521484375, "global_step": 21165, "epoch": 174} {"train_loss": -30.506580352783203, "global_step": 21166, "epoch": 174} {"train_loss": -30.680877685546875, "global_step": 21167, "epoch": 174} {"train_loss": -30.6496639251709, "global_step": 21168, "epoch": 174} {"train_loss": -30.75834083557129, "global_step": 21169, "epoch": 174} {"train_loss": -30.501123428344727, "global_step": 21170, "epoch": 174} {"train_loss": -30.890518188476562, "global_step": 21171, "epoch": 174} {"train_loss": -30.690509796142578, "global_step": 21172, "epoch": 174} {"train_loss": -31.14794921875, "global_step": 21173, "epoch": 174} {"train_loss": -29.80524479259144, "global_step": 21174, "epoch": 174, "val_loss": 2623088.0} {"train_loss": -30.544940948486328, "global_step": 21175, "epoch": 175} {"train_loss": -30.125402450561523, "global_step": 21176, "epoch": 175} {"train_loss": -30.389938354492188, "global_step": 21177, "epoch": 175} {"train_loss": -29.270254135131836, "global_step": 21178, "epoch": 175} {"train_loss": -30.20765495300293, "global_step": 21179, "epoch": 175} {"train_loss": -30.3806095123291, "global_step": 21180, "epoch": 175} {"train_loss": -29.803974151611328, "global_step": 21181, "epoch": 175} {"train_loss": -29.780500411987305, "global_step": 21182, "epoch": 175} {"train_loss": -28.66666030883789, "global_step": 21183, "epoch": 175} {"train_loss": -28.095813751220703, "global_step": 21184, "epoch": 175} {"train_loss": -23.96614646911621, "global_step": 21185, "epoch": 175} {"train_loss": -19.89803123474121, "global_step": 21186, "epoch": 175} {"train_loss": -21.931222915649414, "global_step": 21187, "epoch": 175} {"train_loss": -29.932891845703125, "global_step": 21188, "epoch": 175} {"train_loss": -23.78498649597168, "global_step": 21189, "epoch": 175} {"train_loss": -29.340940475463867, "global_step": 21190, "epoch": 175} {"train_loss": -27.0800838470459, "global_step": 21191, "epoch": 175} {"train_loss": -29.669544219970703, "global_step": 21192, "epoch": 175} {"train_loss": -27.758832931518555, "global_step": 21193, "epoch": 175} {"train_loss": -29.367307662963867, "global_step": 21194, "epoch": 175} {"train_loss": -28.84986686706543, "global_step": 21195, "epoch": 175} {"train_loss": -29.021284103393555, "global_step": 21196, "epoch": 175} {"train_loss": -29.124120712280273, "global_step": 21197, "epoch": 175} {"train_loss": -29.50676918029785, "global_step": 21198, "epoch": 175} {"train_loss": -29.532642364501953, "global_step": 21199, "epoch": 175} {"train_loss": -30.041095733642578, "global_step": 21200, "epoch": 175} {"train_loss": -29.80213737487793, "global_step": 21201, "epoch": 175} {"train_loss": -29.461511611938477, "global_step": 21202, "epoch": 175} {"train_loss": -29.724124908447266, "global_step": 21203, "epoch": 175} {"train_loss": -29.704710006713867, "global_step": 21204, "epoch": 175} {"train_loss": -29.62306022644043, "global_step": 21205, "epoch": 175} {"train_loss": -29.799081802368164, "global_step": 21206, "epoch": 175} {"train_loss": -30.196380615234375, "global_step": 21207, "epoch": 175} {"train_loss": -29.911102294921875, "global_step": 21208, "epoch": 175} {"train_loss": -30.27317237854004, "global_step": 21209, "epoch": 175} {"train_loss": -29.977521896362305, "global_step": 21210, "epoch": 175} {"train_loss": -30.4821720123291, "global_step": 21211, "epoch": 175} {"train_loss": -30.146991729736328, "global_step": 21212, "epoch": 175} {"train_loss": -30.208372116088867, "global_step": 21213, "epoch": 175} {"train_loss": -29.894611358642578, "global_step": 21214, "epoch": 175} {"train_loss": -30.03078269958496, "global_step": 21215, "epoch": 175} {"train_loss": -30.453479766845703, "global_step": 21216, "epoch": 175} {"train_loss": -30.02642822265625, "global_step": 21217, "epoch": 175} {"train_loss": -30.081762313842773, "global_step": 21218, "epoch": 175} {"train_loss": -30.191650390625, "global_step": 21219, "epoch": 175} {"train_loss": -30.003742218017578, "global_step": 21220, "epoch": 175} {"train_loss": -30.004596710205078, "global_step": 21221, "epoch": 175} {"train_loss": -29.880956649780273, "global_step": 21222, "epoch": 175} {"train_loss": -30.050329208374023, "global_step": 21223, "epoch": 175} {"train_loss": -30.51679039001465, "global_step": 21224, "epoch": 175} {"train_loss": -30.0571231842041, "global_step": 21225, "epoch": 175} {"train_loss": -30.10068130493164, "global_step": 21226, "epoch": 175} {"train_loss": -30.220884323120117, "global_step": 21227, "epoch": 175} {"train_loss": -30.369775772094727, "global_step": 21228, "epoch": 175} {"train_loss": -30.617643356323242, "global_step": 21229, "epoch": 175} {"train_loss": -30.18267250061035, "global_step": 21230, "epoch": 175} {"train_loss": -30.583179473876953, "global_step": 21231, "epoch": 175} {"train_loss": -29.964618682861328, "global_step": 21232, "epoch": 175} {"train_loss": -30.212299346923828, "global_step": 21233, "epoch": 175} {"train_loss": -30.347930908203125, "global_step": 21234, "epoch": 175} {"train_loss": -29.8879451751709, "global_step": 21235, "epoch": 175} {"train_loss": -29.654150009155273, "global_step": 21236, "epoch": 175} {"train_loss": -30.201135635375977, "global_step": 21237, "epoch": 175} {"train_loss": -28.890745162963867, "global_step": 21238, "epoch": 175} {"train_loss": -29.560033798217773, "global_step": 21239, "epoch": 175} {"train_loss": -28.564300537109375, "global_step": 21240, "epoch": 175} {"train_loss": -26.841840744018555, "global_step": 21241, "epoch": 175} {"train_loss": -19.93806266784668, "global_step": 21242, "epoch": 175} {"train_loss": -6.096951961517334, "global_step": 21243, "epoch": 175} {"train_loss": -3.718780279159546, "global_step": 21244, "epoch": 175} {"train_loss": -29.387344360351562, "global_step": 21245, "epoch": 175} {"train_loss": -17.139883041381836, "global_step": 21246, "epoch": 175} {"train_loss": -29.53838539123535, "global_step": 21247, "epoch": 175} {"train_loss": -22.88949966430664, "global_step": 21248, "epoch": 175} {"train_loss": -25.706897735595703, "global_step": 21249, "epoch": 175} {"train_loss": -28.904340744018555, "global_step": 21250, "epoch": 175} {"train_loss": -27.37643814086914, "global_step": 21251, "epoch": 175} {"train_loss": -25.871625900268555, "global_step": 21252, "epoch": 175} {"train_loss": -28.52783203125, "global_step": 21253, "epoch": 175} {"train_loss": -29.179279327392578, "global_step": 21254, "epoch": 175} {"train_loss": -28.425769805908203, "global_step": 21255, "epoch": 175} {"train_loss": -27.903852462768555, "global_step": 21256, "epoch": 175} {"train_loss": -28.160449981689453, "global_step": 21257, "epoch": 175} {"train_loss": -28.558338165283203, "global_step": 21258, "epoch": 175} {"train_loss": -28.93121910095215, "global_step": 21259, "epoch": 175} {"train_loss": -29.19793128967285, "global_step": 21260, "epoch": 175} {"train_loss": -29.20857048034668, "global_step": 21261, "epoch": 175} {"train_loss": -29.321460723876953, "global_step": 21262, "epoch": 175} {"train_loss": -29.196369171142578, "global_step": 21263, "epoch": 175} {"train_loss": -29.155752182006836, "global_step": 21264, "epoch": 175} {"train_loss": -28.908740997314453, "global_step": 21265, "epoch": 175} {"train_loss": -28.834075927734375, "global_step": 21266, "epoch": 175} {"train_loss": -29.123998641967773, "global_step": 21267, "epoch": 175} {"train_loss": -29.419034957885742, "global_step": 21268, "epoch": 175} {"train_loss": -29.687274932861328, "global_step": 21269, "epoch": 175} {"train_loss": -29.69325065612793, "global_step": 21270, "epoch": 175} {"train_loss": -29.716108322143555, "global_step": 21271, "epoch": 175} {"train_loss": -29.195356369018555, "global_step": 21272, "epoch": 175} {"train_loss": -29.387914657592773, "global_step": 21273, "epoch": 175} {"train_loss": -29.85419273376465, "global_step": 21274, "epoch": 175} {"train_loss": -29.64255142211914, "global_step": 21275, "epoch": 175} {"train_loss": -29.454221725463867, "global_step": 21276, "epoch": 175} {"train_loss": -29.593236923217773, "global_step": 21277, "epoch": 175} {"train_loss": -29.71526527404785, "global_step": 21278, "epoch": 175} {"train_loss": -30.172271728515625, "global_step": 21279, "epoch": 175} {"train_loss": -29.241291046142578, "global_step": 21280, "epoch": 175} {"train_loss": -30.17848014831543, "global_step": 21281, "epoch": 175} {"train_loss": -29.221179962158203, "global_step": 21282, "epoch": 175} {"train_loss": -29.77487564086914, "global_step": 21283, "epoch": 175} {"train_loss": -29.50482177734375, "global_step": 21284, "epoch": 175} {"train_loss": -29.673276901245117, "global_step": 21285, "epoch": 175} {"train_loss": -29.42647361755371, "global_step": 21286, "epoch": 175} {"train_loss": -29.74118995666504, "global_step": 21287, "epoch": 175} {"train_loss": -29.519636154174805, "global_step": 21288, "epoch": 175} {"train_loss": -29.37812614440918, "global_step": 21289, "epoch": 175} {"train_loss": -30.07122802734375, "global_step": 21290, "epoch": 175} {"train_loss": -29.54291343688965, "global_step": 21291, "epoch": 175} {"train_loss": -29.74970817565918, "global_step": 21292, "epoch": 175} {"train_loss": -29.591169357299805, "global_step": 21293, "epoch": 175} {"train_loss": -29.722259521484375, "global_step": 21294, "epoch": 175} {"train_loss": -28.605903272786417, "global_step": 21295, "epoch": 175, "val_loss": 2546499.75} {"train_loss": -29.90801429748535, "global_step": 21296, "epoch": 176} {"train_loss": -29.75786781311035, "global_step": 21297, "epoch": 176} {"train_loss": -29.83222007751465, "global_step": 21298, "epoch": 176} {"train_loss": -29.492040634155273, "global_step": 21299, "epoch": 176} {"train_loss": -29.189285278320312, "global_step": 21300, "epoch": 176} {"train_loss": -29.05877685546875, "global_step": 21301, "epoch": 176} {"train_loss": -28.771345138549805, "global_step": 21302, "epoch": 176} {"train_loss": -28.490814208984375, "global_step": 21303, "epoch": 176} {"train_loss": -28.3320255279541, "global_step": 21304, "epoch": 176} {"train_loss": -29.416162490844727, "global_step": 21305, "epoch": 176} {"train_loss": -28.28533363342285, "global_step": 21306, "epoch": 176} {"train_loss": -27.178991317749023, "global_step": 21307, "epoch": 176} {"train_loss": -27.42511558532715, "global_step": 21308, "epoch": 176} {"train_loss": -28.137250900268555, "global_step": 21309, "epoch": 176} {"train_loss": -29.781147003173828, "global_step": 21310, "epoch": 176} {"train_loss": -28.84354591369629, "global_step": 21311, "epoch": 176} {"train_loss": -29.459054946899414, "global_step": 21312, "epoch": 176} {"train_loss": -29.516698837280273, "global_step": 21313, "epoch": 176} {"train_loss": -28.878498077392578, "global_step": 21314, "epoch": 176} {"train_loss": -29.24216079711914, "global_step": 21315, "epoch": 176} {"train_loss": -28.701292037963867, "global_step": 21316, "epoch": 176} {"train_loss": -29.384952545166016, "global_step": 21317, "epoch": 176} {"train_loss": -29.185150146484375, "global_step": 21318, "epoch": 176} {"train_loss": -28.61993980407715, "global_step": 21319, "epoch": 176} {"train_loss": -29.619619369506836, "global_step": 21320, "epoch": 176} {"train_loss": -28.215717315673828, "global_step": 21321, "epoch": 176} {"train_loss": -29.27447509765625, "global_step": 21322, "epoch": 176} {"train_loss": -28.03889274597168, "global_step": 21323, "epoch": 176} {"train_loss": -29.074594497680664, "global_step": 21324, "epoch": 176} {"train_loss": -28.737516403198242, "global_step": 21325, "epoch": 176} {"train_loss": -29.524799346923828, "global_step": 21326, "epoch": 176} {"train_loss": -29.19516372680664, "global_step": 21327, "epoch": 176} {"train_loss": -28.689844131469727, "global_step": 21328, "epoch": 176} {"train_loss": -28.842992782592773, "global_step": 21329, "epoch": 176} {"train_loss": -28.757556915283203, "global_step": 21330, "epoch": 176} {"train_loss": -28.44182777404785, "global_step": 21331, "epoch": 176} {"train_loss": -29.343353271484375, "global_step": 21332, "epoch": 176} {"train_loss": -28.54343605041504, "global_step": 21333, "epoch": 176} {"train_loss": -29.372282028198242, "global_step": 21334, "epoch": 176} {"train_loss": -28.80112648010254, "global_step": 21335, "epoch": 176} {"train_loss": -29.30084228515625, "global_step": 21336, "epoch": 176} {"train_loss": -29.048551559448242, "global_step": 21337, "epoch": 176} {"train_loss": -29.419050216674805, "global_step": 21338, "epoch": 176} {"train_loss": -29.73663330078125, "global_step": 21339, "epoch": 176} {"train_loss": -29.306015014648438, "global_step": 21340, "epoch": 176} {"train_loss": -29.580520629882812, "global_step": 21341, "epoch": 176} {"train_loss": -29.45352554321289, "global_step": 21342, "epoch": 176} {"train_loss": -30.0939884185791, "global_step": 21343, "epoch": 176} {"train_loss": -29.588470458984375, "global_step": 21344, "epoch": 176} {"train_loss": -29.66721534729004, "global_step": 21345, "epoch": 176} {"train_loss": -29.912580490112305, "global_step": 21346, "epoch": 176} {"train_loss": -29.479339599609375, "global_step": 21347, "epoch": 176} {"train_loss": -29.795618057250977, "global_step": 21348, "epoch": 176} {"train_loss": -29.8425235748291, "global_step": 21349, "epoch": 176} {"train_loss": -29.529205322265625, "global_step": 21350, "epoch": 176} {"train_loss": -30.18485450744629, "global_step": 21351, "epoch": 176} {"train_loss": -29.911468505859375, "global_step": 21352, "epoch": 176} {"train_loss": -29.858963012695312, "global_step": 21353, "epoch": 176} {"train_loss": -29.593536376953125, "global_step": 21354, "epoch": 176} {"train_loss": -29.979612350463867, "global_step": 21355, "epoch": 176} {"train_loss": -29.591459274291992, "global_step": 21356, "epoch": 176} {"train_loss": -29.829320907592773, "global_step": 21357, "epoch": 176} {"train_loss": -30.213891983032227, "global_step": 21358, "epoch": 176} {"train_loss": -30.295507431030273, "global_step": 21359, "epoch": 176} {"train_loss": -30.00030517578125, "global_step": 21360, "epoch": 176} {"train_loss": -30.123809814453125, "global_step": 21361, "epoch": 176} {"train_loss": -30.1052303314209, "global_step": 21362, "epoch": 176} {"train_loss": -30.385297775268555, "global_step": 21363, "epoch": 176} {"train_loss": -30.0202579498291, "global_step": 21364, "epoch": 176} {"train_loss": -30.242273330688477, "global_step": 21365, "epoch": 176} {"train_loss": -30.421899795532227, "global_step": 21366, "epoch": 176} {"train_loss": -30.378881454467773, "global_step": 21367, "epoch": 176} {"train_loss": -30.1783447265625, "global_step": 21368, "epoch": 176} {"train_loss": -29.7742977142334, "global_step": 21369, "epoch": 176} {"train_loss": -29.926361083984375, "global_step": 21370, "epoch": 176} {"train_loss": -29.6666202545166, "global_step": 21371, "epoch": 176} {"train_loss": -30.062788009643555, "global_step": 21372, "epoch": 176} {"train_loss": -30.370691299438477, "global_step": 21373, "epoch": 176} {"train_loss": -30.119491577148438, "global_step": 21374, "epoch": 176} {"train_loss": -29.6412296295166, "global_step": 21375, "epoch": 176} {"train_loss": -29.081298828125, "global_step": 21376, "epoch": 176} {"train_loss": -27.360931396484375, "global_step": 21377, "epoch": 176} {"train_loss": -27.053632736206055, "global_step": 21378, "epoch": 176} {"train_loss": -28.655776977539062, "global_step": 21379, "epoch": 176} {"train_loss": -30.23844337463379, "global_step": 21380, "epoch": 176} {"train_loss": -29.66328239440918, "global_step": 21381, "epoch": 176} {"train_loss": -29.216161727905273, "global_step": 21382, "epoch": 176} {"train_loss": -29.498504638671875, "global_step": 21383, "epoch": 176} {"train_loss": -30.0636043548584, "global_step": 21384, "epoch": 176} {"train_loss": -30.5761661529541, "global_step": 21385, "epoch": 176} {"train_loss": -30.268085479736328, "global_step": 21386, "epoch": 176} {"train_loss": -30.36628532409668, "global_step": 21387, "epoch": 176} {"train_loss": -30.214069366455078, "global_step": 21388, "epoch": 176} {"train_loss": -29.927148818969727, "global_step": 21389, "epoch": 176} {"train_loss": -30.250883102416992, "global_step": 21390, "epoch": 176} {"train_loss": -30.681196212768555, "global_step": 21391, "epoch": 176} {"train_loss": -30.543745040893555, "global_step": 21392, "epoch": 176} {"train_loss": -30.741439819335938, "global_step": 21393, "epoch": 176} {"train_loss": -30.670331954956055, "global_step": 21394, "epoch": 176} {"train_loss": -30.446741104125977, "global_step": 21395, "epoch": 176} {"train_loss": -30.455854415893555, "global_step": 21396, "epoch": 176} {"train_loss": -30.4150390625, "global_step": 21397, "epoch": 176} {"train_loss": -30.444360733032227, "global_step": 21398, "epoch": 176} {"train_loss": -30.576894760131836, "global_step": 21399, "epoch": 176} {"train_loss": -29.944955825805664, "global_step": 21400, "epoch": 176} {"train_loss": -30.420669555664062, "global_step": 21401, "epoch": 176} {"train_loss": -30.248416900634766, "global_step": 21402, "epoch": 176} {"train_loss": -30.612869262695312, "global_step": 21403, "epoch": 176} {"train_loss": -30.8118896484375, "global_step": 21404, "epoch": 176} {"train_loss": -30.510541915893555, "global_step": 21405, "epoch": 176} {"train_loss": -30.590246200561523, "global_step": 21406, "epoch": 176} {"train_loss": -30.66943359375, "global_step": 21407, "epoch": 176} {"train_loss": -30.24085807800293, "global_step": 21408, "epoch": 176} {"train_loss": -29.4562931060791, "global_step": 21409, "epoch": 176} {"train_loss": -30.37123680114746, "global_step": 21410, "epoch": 176} {"train_loss": -30.173376083374023, "global_step": 21411, "epoch": 176} {"train_loss": -30.080530166625977, "global_step": 21412, "epoch": 176} {"train_loss": -29.867938995361328, "global_step": 21413, "epoch": 176} {"train_loss": -29.34492301940918, "global_step": 21414, "epoch": 176} {"train_loss": -28.46702003479004, "global_step": 21415, "epoch": 176} {"train_loss": -29.59129385514693, "global_step": 21416, "epoch": 176, "val_loss": 2551484.0} {"train_loss": -30.11818504333496, "global_step": 21417, "epoch": 177} {"train_loss": -29.154287338256836, "global_step": 21418, "epoch": 177} {"train_loss": -30.300048828125, "global_step": 21419, "epoch": 177} {"train_loss": -29.674909591674805, "global_step": 21420, "epoch": 177} {"train_loss": -30.402292251586914, "global_step": 21421, "epoch": 177} {"train_loss": -29.5583438873291, "global_step": 21422, "epoch": 177} {"train_loss": -30.3192138671875, "global_step": 21423, "epoch": 177} {"train_loss": -29.9892520904541, "global_step": 21424, "epoch": 177} {"train_loss": -30.00247573852539, "global_step": 21425, "epoch": 177} {"train_loss": -28.493860244750977, "global_step": 21426, "epoch": 177} {"train_loss": -28.827991485595703, "global_step": 21427, "epoch": 177} {"train_loss": -28.592166900634766, "global_step": 21428, "epoch": 177} {"train_loss": -24.440176010131836, "global_step": 21429, "epoch": 177} {"train_loss": -30.03993797302246, "global_step": 21430, "epoch": 177} {"train_loss": -27.01824378967285, "global_step": 21431, "epoch": 177} {"train_loss": -28.32929039001465, "global_step": 21432, "epoch": 177} {"train_loss": -29.435577392578125, "global_step": 21433, "epoch": 177} {"train_loss": -27.49592399597168, "global_step": 21434, "epoch": 177} {"train_loss": -28.26824378967285, "global_step": 21435, "epoch": 177} {"train_loss": -30.2418212890625, "global_step": 21436, "epoch": 177} {"train_loss": -29.416284561157227, "global_step": 21437, "epoch": 177} {"train_loss": -29.040082931518555, "global_step": 21438, "epoch": 177} {"train_loss": -28.517812728881836, "global_step": 21439, "epoch": 177} {"train_loss": -29.619659423828125, "global_step": 21440, "epoch": 177} {"train_loss": -30.375640869140625, "global_step": 21441, "epoch": 177} {"train_loss": -30.008939743041992, "global_step": 21442, "epoch": 177} {"train_loss": -29.9813289642334, "global_step": 21443, "epoch": 177} {"train_loss": -29.814929962158203, "global_step": 21444, "epoch": 177} {"train_loss": -30.107206344604492, "global_step": 21445, "epoch": 177} {"train_loss": -29.343799591064453, "global_step": 21446, "epoch": 177} {"train_loss": -29.824670791625977, "global_step": 21447, "epoch": 177} {"train_loss": -29.887149810791016, "global_step": 21448, "epoch": 177} {"train_loss": -30.250280380249023, "global_step": 21449, "epoch": 177} {"train_loss": -30.257482528686523, "global_step": 21450, "epoch": 177} {"train_loss": -30.262144088745117, "global_step": 21451, "epoch": 177} {"train_loss": -29.81182861328125, "global_step": 21452, "epoch": 177} {"train_loss": -29.262475967407227, "global_step": 21453, "epoch": 177} {"train_loss": -29.88797378540039, "global_step": 21454, "epoch": 177} {"train_loss": -29.939367294311523, "global_step": 21455, "epoch": 177} {"train_loss": -29.961606979370117, "global_step": 21456, "epoch": 177} {"train_loss": -29.682891845703125, "global_step": 21457, "epoch": 177} {"train_loss": -29.1916561126709, "global_step": 21458, "epoch": 177} {"train_loss": -29.944625854492188, "global_step": 21459, "epoch": 177} {"train_loss": -29.918664932250977, "global_step": 21460, "epoch": 177} {"train_loss": -29.64088249206543, "global_step": 21461, "epoch": 177} {"train_loss": -29.47659683227539, "global_step": 21462, "epoch": 177} {"train_loss": -30.1351375579834, "global_step": 21463, "epoch": 177} {"train_loss": -29.632144927978516, "global_step": 21464, "epoch": 177} {"train_loss": -29.351408004760742, "global_step": 21465, "epoch": 177} {"train_loss": -29.306411743164062, "global_step": 21466, "epoch": 177} {"train_loss": -27.698383331298828, "global_step": 21467, "epoch": 177} {"train_loss": -25.809656143188477, "global_step": 21468, "epoch": 177} {"train_loss": -26.41109275817871, "global_step": 21469, "epoch": 177} {"train_loss": -24.591915130615234, "global_step": 21470, "epoch": 177} {"train_loss": -27.752710342407227, "global_step": 21471, "epoch": 177} {"train_loss": -27.403583526611328, "global_step": 21472, "epoch": 177} {"train_loss": -26.101449966430664, "global_step": 21473, "epoch": 177} {"train_loss": -28.672622680664062, "global_step": 21474, "epoch": 177} {"train_loss": -27.647266387939453, "global_step": 21475, "epoch": 177} {"train_loss": -28.26068687438965, "global_step": 21476, "epoch": 177} {"train_loss": -27.357690811157227, "global_step": 21477, "epoch": 177} {"train_loss": -28.90496826171875, "global_step": 21478, "epoch": 177} {"train_loss": -27.648359298706055, "global_step": 21479, "epoch": 177} {"train_loss": -28.324186325073242, "global_step": 21480, "epoch": 177} {"train_loss": -27.640607833862305, "global_step": 21481, "epoch": 177} {"train_loss": -29.56633949279785, "global_step": 21482, "epoch": 177} {"train_loss": -28.17166519165039, "global_step": 21483, "epoch": 177} {"train_loss": -29.18421745300293, "global_step": 21484, "epoch": 177} {"train_loss": -28.7947940826416, "global_step": 21485, "epoch": 177} {"train_loss": -29.162906646728516, "global_step": 21486, "epoch": 177} {"train_loss": -29.176746368408203, "global_step": 21487, "epoch": 177} {"train_loss": -28.755247116088867, "global_step": 21488, "epoch": 177} {"train_loss": -28.92958641052246, "global_step": 21489, "epoch": 177} {"train_loss": -29.836822509765625, "global_step": 21490, "epoch": 177} {"train_loss": -29.191619873046875, "global_step": 21491, "epoch": 177} {"train_loss": -29.128009796142578, "global_step": 21492, "epoch": 177} {"train_loss": -29.69254493713379, "global_step": 21493, "epoch": 177} {"train_loss": -29.720478057861328, "global_step": 21494, "epoch": 177} {"train_loss": -29.709333419799805, "global_step": 21495, "epoch": 177} {"train_loss": -29.76297378540039, "global_step": 21496, "epoch": 177} {"train_loss": -29.910703659057617, "global_step": 21497, "epoch": 177} {"train_loss": -29.557226181030273, "global_step": 21498, "epoch": 177} {"train_loss": -29.844526290893555, "global_step": 21499, "epoch": 177} {"train_loss": -29.81647300720215, "global_step": 21500, "epoch": 177} {"train_loss": -30.0662899017334, "global_step": 21501, "epoch": 177} {"train_loss": -29.87662696838379, "global_step": 21502, "epoch": 177} {"train_loss": -30.126541137695312, "global_step": 21503, "epoch": 177} {"train_loss": -29.985132217407227, "global_step": 21504, "epoch": 177} {"train_loss": -30.15876579284668, "global_step": 21505, "epoch": 177} {"train_loss": -30.428577423095703, "global_step": 21506, "epoch": 177} {"train_loss": -30.275243759155273, "global_step": 21507, "epoch": 177} {"train_loss": -29.99249839782715, "global_step": 21508, "epoch": 177} {"train_loss": -29.975040435791016, "global_step": 21509, "epoch": 177} {"train_loss": -29.957965850830078, "global_step": 21510, "epoch": 177} {"train_loss": -30.314254760742188, "global_step": 21511, "epoch": 177} {"train_loss": -30.47602653503418, "global_step": 21512, "epoch": 177} {"train_loss": -30.29241943359375, "global_step": 21513, "epoch": 177} {"train_loss": -30.26116943359375, "global_step": 21514, "epoch": 177} {"train_loss": -30.06436538696289, "global_step": 21515, "epoch": 177} {"train_loss": -30.351276397705078, "global_step": 21516, "epoch": 177} {"train_loss": -30.496002197265625, "global_step": 21517, "epoch": 177} {"train_loss": -30.285614013671875, "global_step": 21518, "epoch": 177} {"train_loss": -30.10767936706543, "global_step": 21519, "epoch": 177} {"train_loss": -30.4593448638916, "global_step": 21520, "epoch": 177} {"train_loss": -30.313623428344727, "global_step": 21521, "epoch": 177} {"train_loss": -30.756006240844727, "global_step": 21522, "epoch": 177} {"train_loss": -30.171438217163086, "global_step": 21523, "epoch": 177} {"train_loss": -30.537710189819336, "global_step": 21524, "epoch": 177} {"train_loss": -29.950458526611328, "global_step": 21525, "epoch": 177} {"train_loss": -30.55974769592285, "global_step": 21526, "epoch": 177} {"train_loss": -30.605859756469727, "global_step": 21527, "epoch": 177} {"train_loss": -30.602737426757812, "global_step": 21528, "epoch": 177} {"train_loss": -30.658344268798828, "global_step": 21529, "epoch": 177} {"train_loss": -30.52667236328125, "global_step": 21530, "epoch": 177} {"train_loss": -30.29203224182129, "global_step": 21531, "epoch": 177} {"train_loss": -29.37887954711914, "global_step": 21532, "epoch": 177} {"train_loss": -28.648929595947266, "global_step": 21533, "epoch": 177} {"train_loss": -27.353864669799805, "global_step": 21534, "epoch": 177} {"train_loss": -26.29410171508789, "global_step": 21535, "epoch": 177} {"train_loss": -27.811126708984375, "global_step": 21536, "epoch": 177} {"train_loss": -29.331481917830537, "global_step": 21537, "epoch": 177, "val_loss": 2705175.75} {"train_loss": -29.884374618530273, "global_step": 21538, "epoch": 178} {"train_loss": -29.245105743408203, "global_step": 21539, "epoch": 178} {"train_loss": -29.9498233795166, "global_step": 21540, "epoch": 178} {"train_loss": -30.167774200439453, "global_step": 21541, "epoch": 178} {"train_loss": -29.40386962890625, "global_step": 21542, "epoch": 178} {"train_loss": -30.068307876586914, "global_step": 21543, "epoch": 178} {"train_loss": -29.824066162109375, "global_step": 21544, "epoch": 178} {"train_loss": -29.876317977905273, "global_step": 21545, "epoch": 178} {"train_loss": -30.173389434814453, "global_step": 21546, "epoch": 178} {"train_loss": -29.9873046875, "global_step": 21547, "epoch": 178} {"train_loss": -30.094207763671875, "global_step": 21548, "epoch": 178} {"train_loss": -30.32923698425293, "global_step": 21549, "epoch": 178} {"train_loss": -30.055627822875977, "global_step": 21550, "epoch": 178} {"train_loss": -30.137287139892578, "global_step": 21551, "epoch": 178} {"train_loss": -30.167804718017578, "global_step": 21552, "epoch": 178} {"train_loss": -30.227231979370117, "global_step": 21553, "epoch": 178} {"train_loss": -29.793737411499023, "global_step": 21554, "epoch": 178} {"train_loss": -30.127676010131836, "global_step": 21555, "epoch": 178} {"train_loss": -29.90872573852539, "global_step": 21556, "epoch": 178} {"train_loss": -30.162824630737305, "global_step": 21557, "epoch": 178} {"train_loss": -30.2396297454834, "global_step": 21558, "epoch": 178} {"train_loss": -30.075443267822266, "global_step": 21559, "epoch": 178} {"train_loss": -30.257333755493164, "global_step": 21560, "epoch": 178} {"train_loss": -30.045339584350586, "global_step": 21561, "epoch": 178} {"train_loss": -30.058441162109375, "global_step": 21562, "epoch": 178} {"train_loss": -30.003620147705078, "global_step": 21563, "epoch": 178} {"train_loss": -30.17880630493164, "global_step": 21564, "epoch": 178} {"train_loss": -30.39678382873535, "global_step": 21565, "epoch": 178} {"train_loss": -30.028345108032227, "global_step": 21566, "epoch": 178} {"train_loss": -30.31247901916504, "global_step": 21567, "epoch": 178} {"train_loss": -29.890766143798828, "global_step": 21568, "epoch": 178} {"train_loss": -30.101160049438477, "global_step": 21569, "epoch": 178} {"train_loss": -30.029006958007812, "global_step": 21570, "epoch": 178} {"train_loss": -30.58966064453125, "global_step": 21571, "epoch": 178} {"train_loss": -29.95331382751465, "global_step": 21572, "epoch": 178} {"train_loss": -30.408872604370117, "global_step": 21573, "epoch": 178} {"train_loss": -30.513416290283203, "global_step": 21574, "epoch": 178} {"train_loss": -30.678857803344727, "global_step": 21575, "epoch": 178} {"train_loss": -30.425642013549805, "global_step": 21576, "epoch": 178} {"train_loss": -30.722614288330078, "global_step": 21577, "epoch": 178} {"train_loss": -30.6751651763916, "global_step": 21578, "epoch": 178} {"train_loss": -30.46734046936035, "global_step": 21579, "epoch": 178} {"train_loss": -30.195789337158203, "global_step": 21580, "epoch": 178} {"train_loss": -29.907154083251953, "global_step": 21581, "epoch": 178} {"train_loss": -30.692968368530273, "global_step": 21582, "epoch": 178} {"train_loss": -30.036758422851562, "global_step": 21583, "epoch": 178} {"train_loss": -30.599536895751953, "global_step": 21584, "epoch": 178} {"train_loss": -30.718414306640625, "global_step": 21585, "epoch": 178} {"train_loss": -29.94672203063965, "global_step": 21586, "epoch": 178} {"train_loss": -30.568204879760742, "global_step": 21587, "epoch": 178} {"train_loss": -30.776031494140625, "global_step": 21588, "epoch": 178} {"train_loss": -30.806943893432617, "global_step": 21589, "epoch": 178} {"train_loss": -30.81060218811035, "global_step": 21590, "epoch": 178} {"train_loss": -30.973310470581055, "global_step": 21591, "epoch": 178} {"train_loss": -30.937299728393555, "global_step": 21592, "epoch": 178} {"train_loss": -30.596887588500977, "global_step": 21593, "epoch": 178} {"train_loss": -30.486846923828125, "global_step": 21594, "epoch": 178} {"train_loss": -31.130170822143555, "global_step": 21595, "epoch": 178} {"train_loss": -29.933618545532227, "global_step": 21596, "epoch": 178} {"train_loss": -30.197803497314453, "global_step": 21597, "epoch": 178} {"train_loss": -30.309316635131836, "global_step": 21598, "epoch": 178} {"train_loss": -29.69122886657715, "global_step": 21599, "epoch": 178} {"train_loss": -28.4417724609375, "global_step": 21600, "epoch": 178} {"train_loss": -27.123640060424805, "global_step": 21601, "epoch": 178} {"train_loss": -25.90109634399414, "global_step": 21602, "epoch": 178} {"train_loss": -27.266820907592773, "global_step": 21603, "epoch": 178} {"train_loss": -27.906970977783203, "global_step": 21604, "epoch": 178} {"train_loss": -28.914892196655273, "global_step": 21605, "epoch": 178} {"train_loss": -30.577350616455078, "global_step": 21606, "epoch": 178} {"train_loss": -29.829177856445312, "global_step": 21607, "epoch": 178} {"train_loss": -28.332090377807617, "global_step": 21608, "epoch": 178} {"train_loss": -30.24820327758789, "global_step": 21609, "epoch": 178} {"train_loss": -29.693017959594727, "global_step": 21610, "epoch": 178} {"train_loss": -30.0960693359375, "global_step": 21611, "epoch": 178} {"train_loss": -30.464984893798828, "global_step": 21612, "epoch": 178} {"train_loss": -30.194982528686523, "global_step": 21613, "epoch": 178} {"train_loss": -30.18739128112793, "global_step": 21614, "epoch": 178} {"train_loss": -30.4426326751709, "global_step": 21615, "epoch": 178} {"train_loss": -30.504892349243164, "global_step": 21616, "epoch": 178} {"train_loss": -31.030567169189453, "global_step": 21617, "epoch": 178} {"train_loss": -30.549575805664062, "global_step": 21618, "epoch": 178} {"train_loss": -30.6195125579834, "global_step": 21619, "epoch": 178} {"train_loss": -30.683012008666992, "global_step": 21620, "epoch": 178} {"train_loss": -30.66786003112793, "global_step": 21621, "epoch": 178} {"train_loss": -30.272886276245117, "global_step": 21622, "epoch": 178} {"train_loss": -30.54851722717285, "global_step": 21623, "epoch": 178} {"train_loss": -30.741928100585938, "global_step": 21624, "epoch": 178} {"train_loss": -30.867883682250977, "global_step": 21625, "epoch": 178} {"train_loss": -31.088117599487305, "global_step": 21626, "epoch": 178} {"train_loss": -30.422164916992188, "global_step": 21627, "epoch": 178} {"train_loss": -29.263513565063477, "global_step": 21628, "epoch": 178} {"train_loss": -24.8629093170166, "global_step": 21629, "epoch": 178} {"train_loss": -14.34131145477295, "global_step": 21630, "epoch": 178} {"train_loss": -20.853883743286133, "global_step": 21631, "epoch": 178} {"train_loss": -29.339330673217773, "global_step": 21632, "epoch": 178} {"train_loss": -17.417587280273438, "global_step": 21633, "epoch": 178} {"train_loss": -30.026071548461914, "global_step": 21634, "epoch": 178} {"train_loss": -23.39130210876465, "global_step": 21635, "epoch": 178} {"train_loss": -29.086755752563477, "global_step": 21636, "epoch": 178} {"train_loss": -26.769287109375, "global_step": 21637, "epoch": 178} {"train_loss": -26.871856689453125, "global_step": 21638, "epoch": 178} {"train_loss": -29.636444091796875, "global_step": 21639, "epoch": 178} {"train_loss": -28.949682235717773, "global_step": 21640, "epoch": 178} {"train_loss": -27.9022159576416, "global_step": 21641, "epoch": 178} {"train_loss": -28.45719337463379, "global_step": 21642, "epoch": 178} {"train_loss": -29.872760772705078, "global_step": 21643, "epoch": 178} {"train_loss": -29.215240478515625, "global_step": 21644, "epoch": 178} {"train_loss": -29.22939109802246, "global_step": 21645, "epoch": 178} {"train_loss": -29.07120132446289, "global_step": 21646, "epoch": 178} {"train_loss": -28.6567440032959, "global_step": 21647, "epoch": 178} {"train_loss": -28.19195556640625, "global_step": 21648, "epoch": 178} {"train_loss": -29.053369522094727, "global_step": 21649, "epoch": 178} {"train_loss": -29.761072158813477, "global_step": 21650, "epoch": 178} {"train_loss": -28.611108779907227, "global_step": 21651, "epoch": 178} {"train_loss": -29.109445571899414, "global_step": 21652, "epoch": 178} {"train_loss": -29.676849365234375, "global_step": 21653, "epoch": 178} {"train_loss": -29.424701690673828, "global_step": 21654, "epoch": 178} {"train_loss": -29.786319732666016, "global_step": 21655, "epoch": 178} {"train_loss": -29.805532455444336, "global_step": 21656, "epoch": 178} {"train_loss": -29.804534912109375, "global_step": 21657, "epoch": 178} {"train_loss": -29.46142009861213, "global_step": 21658, "epoch": 178, "val_loss": 2494294.0} {"train_loss": -29.609771728515625, "global_step": 21659, "epoch": 179} {"train_loss": -29.722644805908203, "global_step": 21660, "epoch": 179} {"train_loss": -29.89411735534668, "global_step": 21661, "epoch": 179} {"train_loss": -30.305744171142578, "global_step": 21662, "epoch": 179} {"train_loss": -29.88022232055664, "global_step": 21663, "epoch": 179} {"train_loss": -30.22796058654785, "global_step": 21664, "epoch": 179} {"train_loss": -29.821516036987305, "global_step": 21665, "epoch": 179} {"train_loss": -29.894489288330078, "global_step": 21666, "epoch": 179} {"train_loss": -29.866199493408203, "global_step": 21667, "epoch": 179} {"train_loss": -30.351415634155273, "global_step": 21668, "epoch": 179} {"train_loss": -29.276899337768555, "global_step": 21669, "epoch": 179} {"train_loss": -29.053924560546875, "global_step": 21670, "epoch": 179} {"train_loss": -29.92461585998535, "global_step": 21671, "epoch": 179} {"train_loss": -29.514678955078125, "global_step": 21672, "epoch": 179} {"train_loss": -29.791067123413086, "global_step": 21673, "epoch": 179} {"train_loss": -30.221954345703125, "global_step": 21674, "epoch": 179} {"train_loss": -29.788938522338867, "global_step": 21675, "epoch": 179} {"train_loss": -30.345367431640625, "global_step": 21676, "epoch": 179} {"train_loss": -30.04648780822754, "global_step": 21677, "epoch": 179} {"train_loss": -30.009458541870117, "global_step": 21678, "epoch": 179} {"train_loss": -29.982391357421875, "global_step": 21679, "epoch": 179} {"train_loss": -29.706756591796875, "global_step": 21680, "epoch": 179} {"train_loss": -30.218612670898438, "global_step": 21681, "epoch": 179} {"train_loss": -30.70503044128418, "global_step": 21682, "epoch": 179} {"train_loss": -30.435312271118164, "global_step": 21683, "epoch": 179} {"train_loss": -30.01312828063965, "global_step": 21684, "epoch": 179} {"train_loss": -29.71156883239746, "global_step": 21685, "epoch": 179} {"train_loss": -29.971759796142578, "global_step": 21686, "epoch": 179} {"train_loss": -30.428983688354492, "global_step": 21687, "epoch": 179} {"train_loss": -29.933212280273438, "global_step": 21688, "epoch": 179} {"train_loss": -29.931549072265625, "global_step": 21689, "epoch": 179} {"train_loss": -30.144582748413086, "global_step": 21690, "epoch": 179} {"train_loss": -30.255218505859375, "global_step": 21691, "epoch": 179} {"train_loss": -29.938312530517578, "global_step": 21692, "epoch": 179} {"train_loss": -30.67068862915039, "global_step": 21693, "epoch": 179} {"train_loss": -30.187671661376953, "global_step": 21694, "epoch": 179} {"train_loss": -30.038684844970703, "global_step": 21695, "epoch": 179} {"train_loss": -29.683761596679688, "global_step": 21696, "epoch": 179} {"train_loss": -29.70528221130371, "global_step": 21697, "epoch": 179} {"train_loss": -30.29387855529785, "global_step": 21698, "epoch": 179} {"train_loss": -29.875146865844727, "global_step": 21699, "epoch": 179} {"train_loss": -29.342208862304688, "global_step": 21700, "epoch": 179} {"train_loss": -30.595884323120117, "global_step": 21701, "epoch": 179} {"train_loss": -29.712549209594727, "global_step": 21702, "epoch": 179} {"train_loss": -29.4433650970459, "global_step": 21703, "epoch": 179} {"train_loss": -29.67557144165039, "global_step": 21704, "epoch": 179} {"train_loss": -30.425994873046875, "global_step": 21705, "epoch": 179} {"train_loss": -30.0939884185791, "global_step": 21706, "epoch": 179} {"train_loss": -29.819669723510742, "global_step": 21707, "epoch": 179} {"train_loss": -30.34307861328125, "global_step": 21708, "epoch": 179} {"train_loss": -30.01372718811035, "global_step": 21709, "epoch": 179} {"train_loss": -30.3070125579834, "global_step": 21710, "epoch": 179} {"train_loss": -30.310338973999023, "global_step": 21711, "epoch": 179} {"train_loss": -30.132654190063477, "global_step": 21712, "epoch": 179} {"train_loss": -29.784870147705078, "global_step": 21713, "epoch": 179} {"train_loss": -29.44269371032715, "global_step": 21714, "epoch": 179} {"train_loss": -29.5191650390625, "global_step": 21715, "epoch": 179} {"train_loss": -28.845508575439453, "global_step": 21716, "epoch": 179} {"train_loss": -28.41362953186035, "global_step": 21717, "epoch": 179} {"train_loss": -26.237226486206055, "global_step": 21718, "epoch": 179} {"train_loss": -27.3492488861084, "global_step": 21719, "epoch": 179} {"train_loss": -28.909025192260742, "global_step": 21720, "epoch": 179} {"train_loss": -29.53468132019043, "global_step": 21721, "epoch": 179} {"train_loss": -28.09634780883789, "global_step": 21722, "epoch": 179} {"train_loss": -29.990102767944336, "global_step": 21723, "epoch": 179} {"train_loss": -29.339330673217773, "global_step": 21724, "epoch": 179} {"train_loss": -29.34327507019043, "global_step": 21725, "epoch": 179} {"train_loss": -29.7838191986084, "global_step": 21726, "epoch": 179} {"train_loss": -29.69209098815918, "global_step": 21727, "epoch": 179} {"train_loss": -28.738937377929688, "global_step": 21728, "epoch": 179} {"train_loss": -29.487018585205078, "global_step": 21729, "epoch": 179} {"train_loss": -27.50677490234375, "global_step": 21730, "epoch": 179} {"train_loss": -29.598108291625977, "global_step": 21731, "epoch": 179} {"train_loss": -28.09686851501465, "global_step": 21732, "epoch": 179} {"train_loss": -28.586227416992188, "global_step": 21733, "epoch": 179} {"train_loss": -28.955793380737305, "global_step": 21734, "epoch": 179} {"train_loss": -28.3978328704834, "global_step": 21735, "epoch": 179} {"train_loss": -28.561737060546875, "global_step": 21736, "epoch": 179} {"train_loss": -29.00687599182129, "global_step": 21737, "epoch": 179} {"train_loss": -29.183673858642578, "global_step": 21738, "epoch": 179} {"train_loss": -28.31768798828125, "global_step": 21739, "epoch": 179} {"train_loss": -29.18672752380371, "global_step": 21740, "epoch": 179} {"train_loss": -29.279266357421875, "global_step": 21741, "epoch": 179} {"train_loss": -29.0196533203125, "global_step": 21742, "epoch": 179} {"train_loss": -29.29905128479004, "global_step": 21743, "epoch": 179} {"train_loss": -29.580942153930664, "global_step": 21744, "epoch": 179} {"train_loss": -29.67791175842285, "global_step": 21745, "epoch": 179} {"train_loss": -29.850357055664062, "global_step": 21746, "epoch": 179} {"train_loss": -29.739837646484375, "global_step": 21747, "epoch": 179} {"train_loss": -29.98335075378418, "global_step": 21748, "epoch": 179} {"train_loss": -29.904966354370117, "global_step": 21749, "epoch": 179} {"train_loss": -30.044483184814453, "global_step": 21750, "epoch": 179} {"train_loss": -29.71546745300293, "global_step": 21751, "epoch": 179} {"train_loss": -29.41253089904785, "global_step": 21752, "epoch": 179} {"train_loss": -29.808095932006836, "global_step": 21753, "epoch": 179} {"train_loss": -30.1749324798584, "global_step": 21754, "epoch": 179} {"train_loss": -29.8240909576416, "global_step": 21755, "epoch": 179} {"train_loss": -30.20168113708496, "global_step": 21756, "epoch": 179} {"train_loss": -30.28559684753418, "global_step": 21757, "epoch": 179} {"train_loss": -29.85377311706543, "global_step": 21758, "epoch": 179} {"train_loss": -30.5080623626709, "global_step": 21759, "epoch": 179} {"train_loss": -30.35890769958496, "global_step": 21760, "epoch": 179} {"train_loss": -29.937280654907227, "global_step": 21761, "epoch": 179} {"train_loss": -30.463123321533203, "global_step": 21762, "epoch": 179} {"train_loss": -30.02422523498535, "global_step": 21763, "epoch": 179} {"train_loss": -29.8199462890625, "global_step": 21764, "epoch": 179} {"train_loss": -30.789899826049805, "global_step": 21765, "epoch": 179} {"train_loss": -30.46613121032715, "global_step": 21766, "epoch": 179} {"train_loss": -30.313812255859375, "global_step": 21767, "epoch": 179} {"train_loss": -30.389036178588867, "global_step": 21768, "epoch": 179} {"train_loss": -29.781824111938477, "global_step": 21769, "epoch": 179} {"train_loss": -30.25611686706543, "global_step": 21770, "epoch": 179} {"train_loss": -30.56939125061035, "global_step": 21771, "epoch": 179} {"train_loss": -30.301267623901367, "global_step": 21772, "epoch": 179} {"train_loss": -30.70489501953125, "global_step": 21773, "epoch": 179} {"train_loss": -30.398269653320312, "global_step": 21774, "epoch": 179} {"train_loss": -29.927038192749023, "global_step": 21775, "epoch": 179} {"train_loss": -29.88313865661621, "global_step": 21776, "epoch": 179} {"train_loss": -28.719135284423828, "global_step": 21777, "epoch": 179} {"train_loss": -28.503437042236328, "global_step": 21778, "epoch": 179} {"train_loss": -29.70480983513446, "global_step": 21779, "epoch": 179, "val_loss": 2688915.75} {"train_loss": -29.560123443603516, "global_step": 21780, "epoch": 180} {"train_loss": -30.768484115600586, "global_step": 21781, "epoch": 180} {"train_loss": -30.263463973999023, "global_step": 21782, "epoch": 180} {"train_loss": -29.853973388671875, "global_step": 21783, "epoch": 180} {"train_loss": -29.49386978149414, "global_step": 21784, "epoch": 180} {"train_loss": -30.52265739440918, "global_step": 21785, "epoch": 180} {"train_loss": -30.459470748901367, "global_step": 21786, "epoch": 180} {"train_loss": -30.23524284362793, "global_step": 21787, "epoch": 180} {"train_loss": -30.19109535217285, "global_step": 21788, "epoch": 180} {"train_loss": -30.90302085876465, "global_step": 21789, "epoch": 180} {"train_loss": -30.537878036499023, "global_step": 21790, "epoch": 180} {"train_loss": -30.57040786743164, "global_step": 21791, "epoch": 180} {"train_loss": -30.614145278930664, "global_step": 21792, "epoch": 180} {"train_loss": -30.487329483032227, "global_step": 21793, "epoch": 180} {"train_loss": -30.551321029663086, "global_step": 21794, "epoch": 180} {"train_loss": -30.207656860351562, "global_step": 21795, "epoch": 180} {"train_loss": -30.32901382446289, "global_step": 21796, "epoch": 180} {"train_loss": -30.863622665405273, "global_step": 21797, "epoch": 180} {"train_loss": -30.6202449798584, "global_step": 21798, "epoch": 180} {"train_loss": -30.70623779296875, "global_step": 21799, "epoch": 180} {"train_loss": -30.152868270874023, "global_step": 21800, "epoch": 180} {"train_loss": -30.14057731628418, "global_step": 21801, "epoch": 180} {"train_loss": -30.05617332458496, "global_step": 21802, "epoch": 180} {"train_loss": -30.31766700744629, "global_step": 21803, "epoch": 180} {"train_loss": -30.647130966186523, "global_step": 21804, "epoch": 180} {"train_loss": -30.044086456298828, "global_step": 21805, "epoch": 180} {"train_loss": -30.48974609375, "global_step": 21806, "epoch": 180} {"train_loss": -30.105377197265625, "global_step": 21807, "epoch": 180} {"train_loss": -30.54143714904785, "global_step": 21808, "epoch": 180} {"train_loss": -31.01002311706543, "global_step": 21809, "epoch": 180} {"train_loss": -30.229894638061523, "global_step": 21810, "epoch": 180} {"train_loss": -30.6835880279541, "global_step": 21811, "epoch": 180} {"train_loss": -30.52351188659668, "global_step": 21812, "epoch": 180} {"train_loss": -30.443143844604492, "global_step": 21813, "epoch": 180} {"train_loss": -30.434402465820312, "global_step": 21814, "epoch": 180} {"train_loss": -30.13392448425293, "global_step": 21815, "epoch": 180} {"train_loss": -30.02777671813965, "global_step": 21816, "epoch": 180} {"train_loss": -30.721960067749023, "global_step": 21817, "epoch": 180} {"train_loss": -30.464263916015625, "global_step": 21818, "epoch": 180} {"train_loss": -29.440948486328125, "global_step": 21819, "epoch": 180} {"train_loss": -29.8509464263916, "global_step": 21820, "epoch": 180} {"train_loss": -30.38348960876465, "global_step": 21821, "epoch": 180} {"train_loss": -30.918317794799805, "global_step": 21822, "epoch": 180} {"train_loss": -30.71551513671875, "global_step": 21823, "epoch": 180} {"train_loss": -30.7146053314209, "global_step": 21824, "epoch": 180} {"train_loss": -30.173873901367188, "global_step": 21825, "epoch": 180} {"train_loss": -30.865949630737305, "global_step": 21826, "epoch": 180} {"train_loss": -30.752201080322266, "global_step": 21827, "epoch": 180} {"train_loss": -30.244693756103516, "global_step": 21828, "epoch": 180} {"train_loss": -30.66058349609375, "global_step": 21829, "epoch": 180} {"train_loss": -30.668109893798828, "global_step": 21830, "epoch": 180} {"train_loss": -30.985336303710938, "global_step": 21831, "epoch": 180} {"train_loss": -31.153589248657227, "global_step": 21832, "epoch": 180} {"train_loss": -31.0601806640625, "global_step": 21833, "epoch": 180} {"train_loss": -30.895313262939453, "global_step": 21834, "epoch": 180} {"train_loss": -30.95778465270996, "global_step": 21835, "epoch": 180} {"train_loss": -30.696155548095703, "global_step": 21836, "epoch": 180} {"train_loss": -30.7663631439209, "global_step": 21837, "epoch": 180} {"train_loss": -30.29367446899414, "global_step": 21838, "epoch": 180} {"train_loss": -30.96246910095215, "global_step": 21839, "epoch": 180} {"train_loss": -30.86383056640625, "global_step": 21840, "epoch": 180} {"train_loss": -31.120290756225586, "global_step": 21841, "epoch": 180} {"train_loss": -30.9520320892334, "global_step": 21842, "epoch": 180} {"train_loss": -30.525571823120117, "global_step": 21843, "epoch": 180} {"train_loss": -30.047739028930664, "global_step": 21844, "epoch": 180} {"train_loss": -27.176366806030273, "global_step": 21845, "epoch": 180} {"train_loss": -24.64692497253418, "global_step": 21846, "epoch": 180} {"train_loss": -27.289194107055664, "global_step": 21847, "epoch": 180} {"train_loss": -27.84830093383789, "global_step": 21848, "epoch": 180} {"train_loss": -21.167896270751953, "global_step": 21849, "epoch": 180} {"train_loss": -27.55316734313965, "global_step": 21850, "epoch": 180} {"train_loss": -27.312793731689453, "global_step": 21851, "epoch": 180} {"train_loss": -28.92236328125, "global_step": 21852, "epoch": 180} {"train_loss": -27.844572067260742, "global_step": 21853, "epoch": 180} {"train_loss": -29.651403427124023, "global_step": 21854, "epoch": 180} {"train_loss": -29.238494873046875, "global_step": 21855, "epoch": 180} {"train_loss": -28.501724243164062, "global_step": 21856, "epoch": 180} {"train_loss": -28.453977584838867, "global_step": 21857, "epoch": 180} {"train_loss": -30.117780685424805, "global_step": 21858, "epoch": 180} {"train_loss": -29.484241485595703, "global_step": 21859, "epoch": 180} {"train_loss": -29.170536041259766, "global_step": 21860, "epoch": 180} {"train_loss": -29.75653076171875, "global_step": 21861, "epoch": 180} {"train_loss": -29.83155632019043, "global_step": 21862, "epoch": 180} {"train_loss": -28.889387130737305, "global_step": 21863, "epoch": 180} {"train_loss": -27.504566192626953, "global_step": 21864, "epoch": 180} {"train_loss": -28.2182674407959, "global_step": 21865, "epoch": 180} {"train_loss": -29.690387725830078, "global_step": 21866, "epoch": 180} {"train_loss": -30.36710548400879, "global_step": 21867, "epoch": 180} {"train_loss": -29.444507598876953, "global_step": 21868, "epoch": 180} {"train_loss": -29.159143447875977, "global_step": 21869, "epoch": 180} {"train_loss": -30.103185653686523, "global_step": 21870, "epoch": 180} {"train_loss": -30.08977699279785, "global_step": 21871, "epoch": 180} {"train_loss": -30.028018951416016, "global_step": 21872, "epoch": 180} {"train_loss": -29.683652877807617, "global_step": 21873, "epoch": 180} {"train_loss": -30.104400634765625, "global_step": 21874, "epoch": 180} {"train_loss": -30.155868530273438, "global_step": 21875, "epoch": 180} {"train_loss": -29.83851432800293, "global_step": 21876, "epoch": 180} {"train_loss": -30.21465492248535, "global_step": 21877, "epoch": 180} {"train_loss": -29.64408302307129, "global_step": 21878, "epoch": 180} {"train_loss": -30.208932876586914, "global_step": 21879, "epoch": 180} {"train_loss": -30.289417266845703, "global_step": 21880, "epoch": 180} {"train_loss": -30.456485748291016, "global_step": 21881, "epoch": 180} {"train_loss": -29.980133056640625, "global_step": 21882, "epoch": 180} {"train_loss": -29.9218692779541, "global_step": 21883, "epoch": 180} {"train_loss": -30.3245906829834, "global_step": 21884, "epoch": 180} {"train_loss": -30.132781982421875, "global_step": 21885, "epoch": 180} {"train_loss": -30.041162490844727, "global_step": 21886, "epoch": 180} {"train_loss": -30.335668563842773, "global_step": 21887, "epoch": 180} {"train_loss": -30.24567222595215, "global_step": 21888, "epoch": 180} {"train_loss": -30.518497467041016, "global_step": 21889, "epoch": 180} {"train_loss": -30.531641006469727, "global_step": 21890, "epoch": 180} {"train_loss": -30.451017379760742, "global_step": 21891, "epoch": 180} {"train_loss": -29.659046173095703, "global_step": 21892, "epoch": 180} {"train_loss": -30.300878524780273, "global_step": 21893, "epoch": 180} {"train_loss": -30.55411148071289, "global_step": 21894, "epoch": 180} {"train_loss": -29.114837646484375, "global_step": 21895, "epoch": 180} {"train_loss": -30.50909996032715, "global_step": 21896, "epoch": 180} {"train_loss": -29.5655574798584, "global_step": 21897, "epoch": 180} {"train_loss": -30.295907974243164, "global_step": 21898, "epoch": 180} {"train_loss": -30.334625244140625, "global_step": 21899, "epoch": 180} {"train_loss": -29.944925875703166, "global_step": 21900, "epoch": 180, "val_loss": 2517967.0} {"train_loss": -29.531829833984375, "global_step": 21901, "epoch": 181} {"train_loss": -30.099029541015625, "global_step": 21902, "epoch": 181} {"train_loss": -29.810745239257812, "global_step": 21903, "epoch": 181} {"train_loss": -29.970142364501953, "global_step": 21904, "epoch": 181} {"train_loss": -30.481246948242188, "global_step": 21905, "epoch": 181} {"train_loss": -30.476499557495117, "global_step": 21906, "epoch": 181} {"train_loss": -29.879642486572266, "global_step": 21907, "epoch": 181} {"train_loss": -30.985143661499023, "global_step": 21908, "epoch": 181} {"train_loss": -30.61707878112793, "global_step": 21909, "epoch": 181} {"train_loss": -30.32354736328125, "global_step": 21910, "epoch": 181} {"train_loss": -30.433216094970703, "global_step": 21911, "epoch": 181} {"train_loss": -29.905149459838867, "global_step": 21912, "epoch": 181} {"train_loss": -29.1002197265625, "global_step": 21913, "epoch": 181} {"train_loss": -27.5058650970459, "global_step": 21914, "epoch": 181} {"train_loss": -23.878496170043945, "global_step": 21915, "epoch": 181} {"train_loss": -21.921354293823242, "global_step": 21916, "epoch": 181} {"train_loss": -23.902191162109375, "global_step": 21917, "epoch": 181} {"train_loss": -29.998767852783203, "global_step": 21918, "epoch": 181} {"train_loss": -24.52743911743164, "global_step": 21919, "epoch": 181} {"train_loss": -29.022260665893555, "global_step": 21920, "epoch": 181} {"train_loss": -27.052961349487305, "global_step": 21921, "epoch": 181} {"train_loss": -28.089414596557617, "global_step": 21922, "epoch": 181} {"train_loss": -28.874755859375, "global_step": 21923, "epoch": 181} {"train_loss": -29.587732315063477, "global_step": 21924, "epoch": 181} {"train_loss": -28.607486724853516, "global_step": 21925, "epoch": 181} {"train_loss": -29.552499771118164, "global_step": 21926, "epoch": 181} {"train_loss": -29.24724769592285, "global_step": 21927, "epoch": 181} {"train_loss": -29.722808837890625, "global_step": 21928, "epoch": 181} {"train_loss": -30.043975830078125, "global_step": 21929, "epoch": 181} {"train_loss": -30.004840850830078, "global_step": 21930, "epoch": 181} {"train_loss": -29.434833526611328, "global_step": 21931, "epoch": 181} {"train_loss": -29.804731369018555, "global_step": 21932, "epoch": 181} {"train_loss": -30.349740982055664, "global_step": 21933, "epoch": 181} {"train_loss": -30.206104278564453, "global_step": 21934, "epoch": 181} {"train_loss": -30.075971603393555, "global_step": 21935, "epoch": 181} {"train_loss": -30.173751831054688, "global_step": 21936, "epoch": 181} {"train_loss": -30.0030517578125, "global_step": 21937, "epoch": 181} {"train_loss": -30.395111083984375, "global_step": 21938, "epoch": 181} {"train_loss": -30.42579460144043, "global_step": 21939, "epoch": 181} {"train_loss": -29.6386775970459, "global_step": 21940, "epoch": 181} {"train_loss": -29.93082618713379, "global_step": 21941, "epoch": 181} {"train_loss": -29.751880645751953, "global_step": 21942, "epoch": 181} {"train_loss": -30.206418991088867, "global_step": 21943, "epoch": 181} {"train_loss": -30.554174423217773, "global_step": 21944, "epoch": 181} {"train_loss": -29.98794937133789, "global_step": 21945, "epoch": 181} {"train_loss": -29.85725212097168, "global_step": 21946, "epoch": 181} {"train_loss": -30.11854362487793, "global_step": 21947, "epoch": 181} {"train_loss": -29.973901748657227, "global_step": 21948, "epoch": 181} {"train_loss": -29.886749267578125, "global_step": 21949, "epoch": 181} {"train_loss": -30.08147621154785, "global_step": 21950, "epoch": 181} {"train_loss": -29.9283447265625, "global_step": 21951, "epoch": 181} {"train_loss": -29.463911056518555, "global_step": 21952, "epoch": 181} {"train_loss": -28.802392959594727, "global_step": 21953, "epoch": 181} {"train_loss": -28.250150680541992, "global_step": 21954, "epoch": 181} {"train_loss": -27.970386505126953, "global_step": 21955, "epoch": 181} {"train_loss": -26.681928634643555, "global_step": 21956, "epoch": 181} {"train_loss": -25.081562042236328, "global_step": 21957, "epoch": 181} {"train_loss": -28.398950576782227, "global_step": 21958, "epoch": 181} {"train_loss": -30.12101173400879, "global_step": 21959, "epoch": 181} {"train_loss": -27.664886474609375, "global_step": 21960, "epoch": 181} {"train_loss": -27.497577667236328, "global_step": 21961, "epoch": 181} {"train_loss": -29.842599868774414, "global_step": 21962, "epoch": 181} {"train_loss": -26.491657257080078, "global_step": 21963, "epoch": 181} {"train_loss": -29.4959659576416, "global_step": 21964, "epoch": 181} {"train_loss": -27.957767486572266, "global_step": 21965, "epoch": 181} {"train_loss": -29.651037216186523, "global_step": 21966, "epoch": 181} {"train_loss": -28.49273681640625, "global_step": 21967, "epoch": 181} {"train_loss": -29.89532470703125, "global_step": 21968, "epoch": 181} {"train_loss": -28.621768951416016, "global_step": 21969, "epoch": 181} {"train_loss": -29.71282386779785, "global_step": 21970, "epoch": 181} {"train_loss": -29.49163818359375, "global_step": 21971, "epoch": 181} {"train_loss": -29.54913902282715, "global_step": 21972, "epoch": 181} {"train_loss": -29.41852378845215, "global_step": 21973, "epoch": 181} {"train_loss": -29.6904239654541, "global_step": 21974, "epoch": 181} {"train_loss": -30.218908309936523, "global_step": 21975, "epoch": 181} {"train_loss": -29.818632125854492, "global_step": 21976, "epoch": 181} {"train_loss": -29.76321792602539, "global_step": 21977, "epoch": 181} {"train_loss": -30.071985244750977, "global_step": 21978, "epoch": 181} {"train_loss": -29.69476318359375, "global_step": 21979, "epoch": 181} {"train_loss": -30.003992080688477, "global_step": 21980, "epoch": 181} {"train_loss": -29.81589126586914, "global_step": 21981, "epoch": 181} {"train_loss": -29.76979637145996, "global_step": 21982, "epoch": 181} {"train_loss": -30.0578556060791, "global_step": 21983, "epoch": 181} {"train_loss": -30.57203483581543, "global_step": 21984, "epoch": 181} {"train_loss": -29.919921875, "global_step": 21985, "epoch": 181} {"train_loss": -30.215057373046875, "global_step": 21986, "epoch": 181} {"train_loss": -30.139379501342773, "global_step": 21987, "epoch": 181} {"train_loss": -29.932113647460938, "global_step": 21988, "epoch": 181} {"train_loss": -29.8258113861084, "global_step": 21989, "epoch": 181} {"train_loss": -29.158737182617188, "global_step": 21990, "epoch": 181} {"train_loss": -30.05387306213379, "global_step": 21991, "epoch": 181} {"train_loss": -30.509878158569336, "global_step": 21992, "epoch": 181} {"train_loss": -29.944318771362305, "global_step": 21993, "epoch": 181} {"train_loss": -29.546619415283203, "global_step": 21994, "epoch": 181} {"train_loss": -30.48943519592285, "global_step": 21995, "epoch": 181} {"train_loss": -29.39017677307129, "global_step": 21996, "epoch": 181} {"train_loss": -29.764307022094727, "global_step": 21997, "epoch": 181} {"train_loss": -30.128814697265625, "global_step": 21998, "epoch": 181} {"train_loss": -29.79520034790039, "global_step": 21999, "epoch": 181} {"train_loss": -29.683746337890625, "global_step": 22000, "epoch": 181} {"train_loss": -30.405393600463867, "global_step": 22001, "epoch": 181} {"train_loss": -30.375503540039062, "global_step": 22002, "epoch": 181} {"train_loss": -29.4337100982666, "global_step": 22003, "epoch": 181} {"train_loss": -30.375959396362305, "global_step": 22004, "epoch": 181} {"train_loss": -30.31231689453125, "global_step": 22005, "epoch": 181} {"train_loss": -30.171594619750977, "global_step": 22006, "epoch": 181} {"train_loss": -30.55628776550293, "global_step": 22007, "epoch": 181} {"train_loss": -30.386707305908203, "global_step": 22008, "epoch": 181} {"train_loss": -30.553537368774414, "global_step": 22009, "epoch": 181} {"train_loss": -30.30630874633789, "global_step": 22010, "epoch": 181} {"train_loss": -30.744159698486328, "global_step": 22011, "epoch": 181} {"train_loss": -30.338605880737305, "global_step": 22012, "epoch": 181} {"train_loss": -30.578266143798828, "global_step": 22013, "epoch": 181} {"train_loss": -30.19114112854004, "global_step": 22014, "epoch": 181} {"train_loss": -30.918909072875977, "global_step": 22015, "epoch": 181} {"train_loss": -30.487308502197266, "global_step": 22016, "epoch": 181} {"train_loss": -30.97149085998535, "global_step": 22017, "epoch": 181} {"train_loss": -30.066852569580078, "global_step": 22018, "epoch": 181} {"train_loss": -30.778478622436523, "global_step": 22019, "epoch": 181} {"train_loss": -30.314563751220703, "global_step": 22020, "epoch": 181} {"train_loss": -29.496913878385687, "global_step": 22021, "epoch": 181, "val_loss": 2635080.5} {"train_loss": -29.456439971923828, "global_step": 22022, "epoch": 182} {"train_loss": -30.11810302734375, "global_step": 22023, "epoch": 182} {"train_loss": -29.985107421875, "global_step": 22024, "epoch": 182} {"train_loss": -29.730335235595703, "global_step": 22025, "epoch": 182} {"train_loss": -30.32977294921875, "global_step": 22026, "epoch": 182} {"train_loss": -30.4288272857666, "global_step": 22027, "epoch": 182} {"train_loss": -30.59125328063965, "global_step": 22028, "epoch": 182} {"train_loss": -30.313383102416992, "global_step": 22029, "epoch": 182} {"train_loss": -30.509531021118164, "global_step": 22030, "epoch": 182} {"train_loss": -30.581342697143555, "global_step": 22031, "epoch": 182} {"train_loss": -30.537748336791992, "global_step": 22032, "epoch": 182} {"train_loss": -30.346677780151367, "global_step": 22033, "epoch": 182} {"train_loss": -30.557083129882812, "global_step": 22034, "epoch": 182} {"train_loss": -30.157596588134766, "global_step": 22035, "epoch": 182} {"train_loss": -31.041645050048828, "global_step": 22036, "epoch": 182} {"train_loss": -30.27625846862793, "global_step": 22037, "epoch": 182} {"train_loss": -30.424224853515625, "global_step": 22038, "epoch": 182} {"train_loss": -30.289709091186523, "global_step": 22039, "epoch": 182} {"train_loss": -30.06766128540039, "global_step": 22040, "epoch": 182} {"train_loss": -30.492950439453125, "global_step": 22041, "epoch": 182} {"train_loss": -30.40447998046875, "global_step": 22042, "epoch": 182} {"train_loss": -30.323766708374023, "global_step": 22043, "epoch": 182} {"train_loss": -31.0742130279541, "global_step": 22044, "epoch": 182} {"train_loss": -30.14653968811035, "global_step": 22045, "epoch": 182} {"train_loss": -30.003583908081055, "global_step": 22046, "epoch": 182} {"train_loss": -30.645559310913086, "global_step": 22047, "epoch": 182} {"train_loss": -30.4360294342041, "global_step": 22048, "epoch": 182} {"train_loss": -30.455175399780273, "global_step": 22049, "epoch": 182} {"train_loss": -30.46615982055664, "global_step": 22050, "epoch": 182} {"train_loss": -30.653654098510742, "global_step": 22051, "epoch": 182} {"train_loss": -30.495695114135742, "global_step": 22052, "epoch": 182} {"train_loss": -30.5927734375, "global_step": 22053, "epoch": 182} {"train_loss": -30.6461124420166, "global_step": 22054, "epoch": 182} {"train_loss": -30.791650772094727, "global_step": 22055, "epoch": 182} {"train_loss": -31.0418758392334, "global_step": 22056, "epoch": 182} {"train_loss": -30.989858627319336, "global_step": 22057, "epoch": 182} {"train_loss": -30.8265323638916, "global_step": 22058, "epoch": 182} {"train_loss": -30.8177433013916, "global_step": 22059, "epoch": 182} {"train_loss": -31.186254501342773, "global_step": 22060, "epoch": 182} {"train_loss": -31.26395606994629, "global_step": 22061, "epoch": 182} {"train_loss": -31.161901473999023, "global_step": 22062, "epoch": 182} {"train_loss": -30.995946884155273, "global_step": 22063, "epoch": 182} {"train_loss": -31.311126708984375, "global_step": 22064, "epoch": 182} {"train_loss": -30.915531158447266, "global_step": 22065, "epoch": 182} {"train_loss": -31.159870147705078, "global_step": 22066, "epoch": 182} {"train_loss": -31.4384822845459, "global_step": 22067, "epoch": 182} {"train_loss": -31.11292839050293, "global_step": 22068, "epoch": 182} {"train_loss": -31.020933151245117, "global_step": 22069, "epoch": 182} {"train_loss": -31.146289825439453, "global_step": 22070, "epoch": 182} {"train_loss": -30.623722076416016, "global_step": 22071, "epoch": 182} {"train_loss": -31.653539657592773, "global_step": 22072, "epoch": 182} {"train_loss": -30.847593307495117, "global_step": 22073, "epoch": 182} {"train_loss": -31.237701416015625, "global_step": 22074, "epoch": 182} {"train_loss": -31.009063720703125, "global_step": 22075, "epoch": 182} {"train_loss": -31.232900619506836, "global_step": 22076, "epoch": 182} {"train_loss": -30.68585777282715, "global_step": 22077, "epoch": 182} {"train_loss": -30.36517333984375, "global_step": 22078, "epoch": 182} {"train_loss": -31.073083877563477, "global_step": 22079, "epoch": 182} {"train_loss": -30.713769912719727, "global_step": 22080, "epoch": 182} {"train_loss": -30.86907386779785, "global_step": 22081, "epoch": 182} {"train_loss": -30.528791427612305, "global_step": 22082, "epoch": 182} {"train_loss": -30.3400936126709, "global_step": 22083, "epoch": 182} {"train_loss": -30.812946319580078, "global_step": 22084, "epoch": 182} {"train_loss": -30.756738662719727, "global_step": 22085, "epoch": 182} {"train_loss": -30.390958786010742, "global_step": 22086, "epoch": 182} {"train_loss": -30.677841186523438, "global_step": 22087, "epoch": 182} {"train_loss": -29.748937606811523, "global_step": 22088, "epoch": 182} {"train_loss": -29.101160049438477, "global_step": 22089, "epoch": 182} {"train_loss": -29.2503662109375, "global_step": 22090, "epoch": 182} {"train_loss": -28.769424438476562, "global_step": 22091, "epoch": 182} {"train_loss": -28.671838760375977, "global_step": 22092, "epoch": 182} {"train_loss": -29.714529037475586, "global_step": 22093, "epoch": 182} {"train_loss": -30.313812255859375, "global_step": 22094, "epoch": 182} {"train_loss": -29.801807403564453, "global_step": 22095, "epoch": 182} {"train_loss": -27.633604049682617, "global_step": 22096, "epoch": 182} {"train_loss": -29.085134506225586, "global_step": 22097, "epoch": 182} {"train_loss": -30.767730712890625, "global_step": 22098, "epoch": 182} {"train_loss": -29.024627685546875, "global_step": 22099, "epoch": 182} {"train_loss": -29.16400718688965, "global_step": 22100, "epoch": 182} {"train_loss": -28.42030143737793, "global_step": 22101, "epoch": 182} {"train_loss": -30.04631996154785, "global_step": 22102, "epoch": 182} {"train_loss": -29.80611228942871, "global_step": 22103, "epoch": 182} {"train_loss": -29.57830810546875, "global_step": 22104, "epoch": 182} {"train_loss": -30.434797286987305, "global_step": 22105, "epoch": 182} {"train_loss": -29.352066040039062, "global_step": 22106, "epoch": 182} {"train_loss": -30.549177169799805, "global_step": 22107, "epoch": 182} {"train_loss": -30.359365463256836, "global_step": 22108, "epoch": 182} {"train_loss": -30.110197067260742, "global_step": 22109, "epoch": 182} {"train_loss": -30.958044052124023, "global_step": 22110, "epoch": 182} {"train_loss": -29.997528076171875, "global_step": 22111, "epoch": 182} {"train_loss": -30.095884323120117, "global_step": 22112, "epoch": 182} {"train_loss": -30.429092407226562, "global_step": 22113, "epoch": 182} {"train_loss": -29.541202545166016, "global_step": 22114, "epoch": 182} {"train_loss": -30.71455192565918, "global_step": 22115, "epoch": 182} {"train_loss": -30.510223388671875, "global_step": 22116, "epoch": 182} {"train_loss": -29.699411392211914, "global_step": 22117, "epoch": 182} {"train_loss": -30.716779708862305, "global_step": 22118, "epoch": 182} {"train_loss": -29.8324031829834, "global_step": 22119, "epoch": 182} {"train_loss": -30.025348663330078, "global_step": 22120, "epoch": 182} {"train_loss": -29.7039737701416, "global_step": 22121, "epoch": 182} {"train_loss": -29.30988121032715, "global_step": 22122, "epoch": 182} {"train_loss": -29.730865478515625, "global_step": 22123, "epoch": 182} {"train_loss": -27.55525016784668, "global_step": 22124, "epoch": 182} {"train_loss": -29.021665573120117, "global_step": 22125, "epoch": 182} {"train_loss": -29.54070472717285, "global_step": 22126, "epoch": 182} {"train_loss": -30.23308753967285, "global_step": 22127, "epoch": 182} {"train_loss": -27.9508113861084, "global_step": 22128, "epoch": 182} {"train_loss": -28.828216552734375, "global_step": 22129, "epoch": 182} {"train_loss": -30.32645034790039, "global_step": 22130, "epoch": 182} {"train_loss": -30.121789932250977, "global_step": 22131, "epoch": 182} {"train_loss": -29.401840209960938, "global_step": 22132, "epoch": 182} {"train_loss": -29.900304794311523, "global_step": 22133, "epoch": 182} {"train_loss": -30.1657657623291, "global_step": 22134, "epoch": 182} {"train_loss": -29.965925216674805, "global_step": 22135, "epoch": 182} {"train_loss": -29.900333404541016, "global_step": 22136, "epoch": 182} {"train_loss": -30.36641502380371, "global_step": 22137, "epoch": 182} {"train_loss": -30.14554214477539, "global_step": 22138, "epoch": 182} {"train_loss": -30.425342559814453, "global_step": 22139, "epoch": 182} {"train_loss": -29.83148193359375, "global_step": 22140, "epoch": 182} {"train_loss": -30.667810440063477, "global_step": 22141, "epoch": 182} {"train_loss": -30.241594645602643, "global_step": 22142, "epoch": 182, "val_loss": 2746703.25} {"train_loss": -30.798664093017578, "global_step": 22143, "epoch": 183} {"train_loss": -30.0853271484375, "global_step": 22144, "epoch": 183} {"train_loss": -30.461511611938477, "global_step": 22145, "epoch": 183} {"train_loss": -31.02090835571289, "global_step": 22146, "epoch": 183} {"train_loss": -30.63677978515625, "global_step": 22147, "epoch": 183} {"train_loss": -30.572919845581055, "global_step": 22148, "epoch": 183} {"train_loss": -30.427204132080078, "global_step": 22149, "epoch": 183} {"train_loss": -31.041584014892578, "global_step": 22150, "epoch": 183} {"train_loss": -30.436460494995117, "global_step": 22151, "epoch": 183} {"train_loss": -30.493162155151367, "global_step": 22152, "epoch": 183} {"train_loss": -30.277603149414062, "global_step": 22153, "epoch": 183} {"train_loss": -30.927011489868164, "global_step": 22154, "epoch": 183} {"train_loss": -30.58905601501465, "global_step": 22155, "epoch": 183} {"train_loss": -30.505640029907227, "global_step": 22156, "epoch": 183} {"train_loss": -30.709836959838867, "global_step": 22157, "epoch": 183} {"train_loss": -30.608407974243164, "global_step": 22158, "epoch": 183} {"train_loss": -31.103515625, "global_step": 22159, "epoch": 183} {"train_loss": -31.041837692260742, "global_step": 22160, "epoch": 183} {"train_loss": -30.85491371154785, "global_step": 22161, "epoch": 183} {"train_loss": -31.15937614440918, "global_step": 22162, "epoch": 183} {"train_loss": -31.402063369750977, "global_step": 22163, "epoch": 183} {"train_loss": -31.127338409423828, "global_step": 22164, "epoch": 183} {"train_loss": -31.104894638061523, "global_step": 22165, "epoch": 183} {"train_loss": -31.427143096923828, "global_step": 22166, "epoch": 183} {"train_loss": -31.270498275756836, "global_step": 22167, "epoch": 183} {"train_loss": -31.495532989501953, "global_step": 22168, "epoch": 183} {"train_loss": -31.205881118774414, "global_step": 22169, "epoch": 183} {"train_loss": -30.804553985595703, "global_step": 22170, "epoch": 183} {"train_loss": -31.409210205078125, "global_step": 22171, "epoch": 183} {"train_loss": -30.40492057800293, "global_step": 22172, "epoch": 183} {"train_loss": -30.899749755859375, "global_step": 22173, "epoch": 183} {"train_loss": -31.23213768005371, "global_step": 22174, "epoch": 183} {"train_loss": -30.683706283569336, "global_step": 22175, "epoch": 183} {"train_loss": -30.913366317749023, "global_step": 22176, "epoch": 183} {"train_loss": -31.153060913085938, "global_step": 22177, "epoch": 183} {"train_loss": -30.145559310913086, "global_step": 22178, "epoch": 183} {"train_loss": -30.66812515258789, "global_step": 22179, "epoch": 183} {"train_loss": -29.5924015045166, "global_step": 22180, "epoch": 183} {"train_loss": -30.183435440063477, "global_step": 22181, "epoch": 183} {"train_loss": -29.931476593017578, "global_step": 22182, "epoch": 183} {"train_loss": -27.034942626953125, "global_step": 22183, "epoch": 183} {"train_loss": -27.626266479492188, "global_step": 22184, "epoch": 183} {"train_loss": -30.434589385986328, "global_step": 22185, "epoch": 183} {"train_loss": -29.147964477539062, "global_step": 22186, "epoch": 183} {"train_loss": -28.531940460205078, "global_step": 22187, "epoch": 183} {"train_loss": -27.483245849609375, "global_step": 22188, "epoch": 183} {"train_loss": -27.281681060791016, "global_step": 22189, "epoch": 183} {"train_loss": -30.38088035583496, "global_step": 22190, "epoch": 183} {"train_loss": -28.808622360229492, "global_step": 22191, "epoch": 183} {"train_loss": -28.597370147705078, "global_step": 22192, "epoch": 183} {"train_loss": -30.184125900268555, "global_step": 22193, "epoch": 183} {"train_loss": -29.968698501586914, "global_step": 22194, "epoch": 183} {"train_loss": -29.906967163085938, "global_step": 22195, "epoch": 183} {"train_loss": -29.78384780883789, "global_step": 22196, "epoch": 183} {"train_loss": -30.045013427734375, "global_step": 22197, "epoch": 183} {"train_loss": -30.411474227905273, "global_step": 22198, "epoch": 183} {"train_loss": -30.255109786987305, "global_step": 22199, "epoch": 183} {"train_loss": -30.1483154296875, "global_step": 22200, "epoch": 183} {"train_loss": -30.71172523498535, "global_step": 22201, "epoch": 183} {"train_loss": -30.01971435546875, "global_step": 22202, "epoch": 183} {"train_loss": -30.50567626953125, "global_step": 22203, "epoch": 183} {"train_loss": -30.29473876953125, "global_step": 22204, "epoch": 183} {"train_loss": -30.8140926361084, "global_step": 22205, "epoch": 183} {"train_loss": -30.602462768554688, "global_step": 22206, "epoch": 183} {"train_loss": -30.040180206298828, "global_step": 22207, "epoch": 183} {"train_loss": -29.957971572875977, "global_step": 22208, "epoch": 183} {"train_loss": -29.50996208190918, "global_step": 22209, "epoch": 183} {"train_loss": -30.919095993041992, "global_step": 22210, "epoch": 183} {"train_loss": -30.842411041259766, "global_step": 22211, "epoch": 183} {"train_loss": -31.0181827545166, "global_step": 22212, "epoch": 183} {"train_loss": -30.468433380126953, "global_step": 22213, "epoch": 183} {"train_loss": -30.243982315063477, "global_step": 22214, "epoch": 183} {"train_loss": -29.956289291381836, "global_step": 22215, "epoch": 183} {"train_loss": -30.76765251159668, "global_step": 22216, "epoch": 183} {"train_loss": -30.762990951538086, "global_step": 22217, "epoch": 183} {"train_loss": -30.409711837768555, "global_step": 22218, "epoch": 183} {"train_loss": -30.941898345947266, "global_step": 22219, "epoch": 183} {"train_loss": -30.823627471923828, "global_step": 22220, "epoch": 183} {"train_loss": -30.8460693359375, "global_step": 22221, "epoch": 183} {"train_loss": -30.76303482055664, "global_step": 22222, "epoch": 183} {"train_loss": -30.881208419799805, "global_step": 22223, "epoch": 183} {"train_loss": -30.686059951782227, "global_step": 22224, "epoch": 183} {"train_loss": -30.578840255737305, "global_step": 22225, "epoch": 183} {"train_loss": -29.217914581298828, "global_step": 22226, "epoch": 183} {"train_loss": -29.141218185424805, "global_step": 22227, "epoch": 183} {"train_loss": -28.171253204345703, "global_step": 22228, "epoch": 183} {"train_loss": -29.588302612304688, "global_step": 22229, "epoch": 183} {"train_loss": -30.303577423095703, "global_step": 22230, "epoch": 183} {"train_loss": -30.5765438079834, "global_step": 22231, "epoch": 183} {"train_loss": -30.331531524658203, "global_step": 22232, "epoch": 183} {"train_loss": -29.493427276611328, "global_step": 22233, "epoch": 183} {"train_loss": -30.072463989257812, "global_step": 22234, "epoch": 183} {"train_loss": -28.311710357666016, "global_step": 22235, "epoch": 183} {"train_loss": -28.238134384155273, "global_step": 22236, "epoch": 183} {"train_loss": -29.962726593017578, "global_step": 22237, "epoch": 183} {"train_loss": -30.22810173034668, "global_step": 22238, "epoch": 183} {"train_loss": -28.82541275024414, "global_step": 22239, "epoch": 183} {"train_loss": -29.0323543548584, "global_step": 22240, "epoch": 183} {"train_loss": -28.328052520751953, "global_step": 22241, "epoch": 183} {"train_loss": -28.598737716674805, "global_step": 22242, "epoch": 183} {"train_loss": -29.984973907470703, "global_step": 22243, "epoch": 183} {"train_loss": -29.145898818969727, "global_step": 22244, "epoch": 183} {"train_loss": -30.30396842956543, "global_step": 22245, "epoch": 183} {"train_loss": -30.078393936157227, "global_step": 22246, "epoch": 183} {"train_loss": -29.85993003845215, "global_step": 22247, "epoch": 183} {"train_loss": -29.3835506439209, "global_step": 22248, "epoch": 183} {"train_loss": -29.669931411743164, "global_step": 22249, "epoch": 183} {"train_loss": -30.7115421295166, "global_step": 22250, "epoch": 183} {"train_loss": -29.203845977783203, "global_step": 22251, "epoch": 183} {"train_loss": -29.137699127197266, "global_step": 22252, "epoch": 183} {"train_loss": -29.642072677612305, "global_step": 22253, "epoch": 183} {"train_loss": -30.75555992126465, "global_step": 22254, "epoch": 183} {"train_loss": -29.85171890258789, "global_step": 22255, "epoch": 183} {"train_loss": -30.462560653686523, "global_step": 22256, "epoch": 183} {"train_loss": -30.118879318237305, "global_step": 22257, "epoch": 183} {"train_loss": -30.725622177124023, "global_step": 22258, "epoch": 183} {"train_loss": -30.650146484375, "global_step": 22259, "epoch": 183} {"train_loss": -30.437543869018555, "global_step": 22260, "epoch": 183} {"train_loss": -30.82674217224121, "global_step": 22261, "epoch": 183} {"train_loss": -30.7423038482666, "global_step": 22262, "epoch": 183} {"train_loss": -30.175105969767927, "global_step": 22263, "epoch": 183, "val_loss": 2471122.0} {"train_loss": -31.0531063079834, "global_step": 22264, "epoch": 184} {"train_loss": -30.368680953979492, "global_step": 22265, "epoch": 184} {"train_loss": -30.83466148376465, "global_step": 22266, "epoch": 184} {"train_loss": -30.889602661132812, "global_step": 22267, "epoch": 184} {"train_loss": -31.0154972076416, "global_step": 22268, "epoch": 184} {"train_loss": -31.138996124267578, "global_step": 22269, "epoch": 184} {"train_loss": -29.828201293945312, "global_step": 22270, "epoch": 184} {"train_loss": -31.132293701171875, "global_step": 22271, "epoch": 184} {"train_loss": -29.552610397338867, "global_step": 22272, "epoch": 184} {"train_loss": -30.661069869995117, "global_step": 22273, "epoch": 184} {"train_loss": -31.025543212890625, "global_step": 22274, "epoch": 184} {"train_loss": -30.46365737915039, "global_step": 22275, "epoch": 184} {"train_loss": -29.73996925354004, "global_step": 22276, "epoch": 184} {"train_loss": -29.03875160217285, "global_step": 22277, "epoch": 184} {"train_loss": -27.8698787689209, "global_step": 22278, "epoch": 184} {"train_loss": -26.724634170532227, "global_step": 22279, "epoch": 184} {"train_loss": -26.78034019470215, "global_step": 22280, "epoch": 184} {"train_loss": -30.6339054107666, "global_step": 22281, "epoch": 184} {"train_loss": -29.2935848236084, "global_step": 22282, "epoch": 184} {"train_loss": -27.580114364624023, "global_step": 22283, "epoch": 184} {"train_loss": -30.515609741210938, "global_step": 22284, "epoch": 184} {"train_loss": -28.940031051635742, "global_step": 22285, "epoch": 184} {"train_loss": -29.11709976196289, "global_step": 22286, "epoch": 184} {"train_loss": -29.761646270751953, "global_step": 22287, "epoch": 184} {"train_loss": -28.69196891784668, "global_step": 22288, "epoch": 184} {"train_loss": -30.099567413330078, "global_step": 22289, "epoch": 184} {"train_loss": -29.046918869018555, "global_step": 22290, "epoch": 184} {"train_loss": -30.62636375427246, "global_step": 22291, "epoch": 184} {"train_loss": -29.606739044189453, "global_step": 22292, "epoch": 184} {"train_loss": -29.98434829711914, "global_step": 22293, "epoch": 184} {"train_loss": -30.37214469909668, "global_step": 22294, "epoch": 184} {"train_loss": -29.693262100219727, "global_step": 22295, "epoch": 184} {"train_loss": -30.716297149658203, "global_step": 22296, "epoch": 184} {"train_loss": -29.785587310791016, "global_step": 22297, "epoch": 184} {"train_loss": -30.291242599487305, "global_step": 22298, "epoch": 184} {"train_loss": -30.41680335998535, "global_step": 22299, "epoch": 184} {"train_loss": -29.063461303710938, "global_step": 22300, "epoch": 184} {"train_loss": -28.912769317626953, "global_step": 22301, "epoch": 184} {"train_loss": -30.202295303344727, "global_step": 22302, "epoch": 184} {"train_loss": -29.8447265625, "global_step": 22303, "epoch": 184} {"train_loss": -27.48981285095215, "global_step": 22304, "epoch": 184} {"train_loss": -26.961511611938477, "global_step": 22305, "epoch": 184} {"train_loss": -30.1378173828125, "global_step": 22306, "epoch": 184} {"train_loss": -28.094385147094727, "global_step": 22307, "epoch": 184} {"train_loss": -28.399524688720703, "global_step": 22308, "epoch": 184} {"train_loss": -28.31182289123535, "global_step": 22309, "epoch": 184} {"train_loss": -27.21506690979004, "global_step": 22310, "epoch": 184} {"train_loss": -28.248249053955078, "global_step": 22311, "epoch": 184} {"train_loss": -29.318817138671875, "global_step": 22312, "epoch": 184} {"train_loss": -30.16668701171875, "global_step": 22313, "epoch": 184} {"train_loss": -28.77459716796875, "global_step": 22314, "epoch": 184} {"train_loss": -30.008502960205078, "global_step": 22315, "epoch": 184} {"train_loss": -29.5048770904541, "global_step": 22316, "epoch": 184} {"train_loss": -30.163436889648438, "global_step": 22317, "epoch": 184} {"train_loss": -30.523548126220703, "global_step": 22318, "epoch": 184} {"train_loss": -29.489233016967773, "global_step": 22319, "epoch": 184} {"train_loss": -30.291534423828125, "global_step": 22320, "epoch": 184} {"train_loss": -29.957029342651367, "global_step": 22321, "epoch": 184} {"train_loss": -30.091999053955078, "global_step": 22322, "epoch": 184} {"train_loss": -29.975854873657227, "global_step": 22323, "epoch": 184} {"train_loss": -30.29034996032715, "global_step": 22324, "epoch": 184} {"train_loss": -30.248525619506836, "global_step": 22325, "epoch": 184} {"train_loss": -30.375274658203125, "global_step": 22326, "epoch": 184} {"train_loss": -30.635019302368164, "global_step": 22327, "epoch": 184} {"train_loss": -30.526514053344727, "global_step": 22328, "epoch": 184} {"train_loss": -30.585046768188477, "global_step": 22329, "epoch": 184} {"train_loss": -30.486310958862305, "global_step": 22330, "epoch": 184} {"train_loss": -30.593408584594727, "global_step": 22331, "epoch": 184} {"train_loss": -30.741535186767578, "global_step": 22332, "epoch": 184} {"train_loss": -30.153715133666992, "global_step": 22333, "epoch": 184} {"train_loss": -30.743757247924805, "global_step": 22334, "epoch": 184} {"train_loss": -30.738025665283203, "global_step": 22335, "epoch": 184} {"train_loss": -30.50699806213379, "global_step": 22336, "epoch": 184} {"train_loss": -30.658767700195312, "global_step": 22337, "epoch": 184} {"train_loss": -30.958051681518555, "global_step": 22338, "epoch": 184} {"train_loss": -30.786279678344727, "global_step": 22339, "epoch": 184} {"train_loss": -30.42827796936035, "global_step": 22340, "epoch": 184} {"train_loss": -30.63421058654785, "global_step": 22341, "epoch": 184} {"train_loss": -30.52627944946289, "global_step": 22342, "epoch": 184} {"train_loss": -30.857162475585938, "global_step": 22343, "epoch": 184} {"train_loss": -30.699880599975586, "global_step": 22344, "epoch": 184} {"train_loss": -30.405553817749023, "global_step": 22345, "epoch": 184} {"train_loss": -30.788330078125, "global_step": 22346, "epoch": 184} {"train_loss": -30.764387130737305, "global_step": 22347, "epoch": 184} {"train_loss": -31.390714645385742, "global_step": 22348, "epoch": 184} {"train_loss": -30.586807250976562, "global_step": 22349, "epoch": 184} {"train_loss": -31.050464630126953, "global_step": 22350, "epoch": 184} {"train_loss": -30.79050064086914, "global_step": 22351, "epoch": 184} {"train_loss": -31.17364501953125, "global_step": 22352, "epoch": 184} {"train_loss": -30.907541275024414, "global_step": 22353, "epoch": 184} {"train_loss": -30.90537452697754, "global_step": 22354, "epoch": 184} {"train_loss": -30.891836166381836, "global_step": 22355, "epoch": 184} {"train_loss": -30.830862045288086, "global_step": 22356, "epoch": 184} {"train_loss": -31.097192764282227, "global_step": 22357, "epoch": 184} {"train_loss": -30.98870277404785, "global_step": 22358, "epoch": 184} {"train_loss": -31.189899444580078, "global_step": 22359, "epoch": 184} {"train_loss": -30.87940788269043, "global_step": 22360, "epoch": 184} {"train_loss": -31.09857749938965, "global_step": 22361, "epoch": 184} {"train_loss": -31.193754196166992, "global_step": 22362, "epoch": 184} {"train_loss": -30.87727165222168, "global_step": 22363, "epoch": 184} {"train_loss": -31.522851943969727, "global_step": 22364, "epoch": 184} {"train_loss": -31.154882431030273, "global_step": 22365, "epoch": 184} {"train_loss": -30.128305435180664, "global_step": 22366, "epoch": 184} {"train_loss": -30.679157257080078, "global_step": 22367, "epoch": 184} {"train_loss": -31.37577247619629, "global_step": 22368, "epoch": 184} {"train_loss": -31.384916305541992, "global_step": 22369, "epoch": 184} {"train_loss": -31.53641700744629, "global_step": 22370, "epoch": 184} {"train_loss": -30.697357177734375, "global_step": 22371, "epoch": 184} {"train_loss": -31.185510635375977, "global_step": 22372, "epoch": 184} {"train_loss": -30.368423461914062, "global_step": 22373, "epoch": 184} {"train_loss": -30.728315353393555, "global_step": 22374, "epoch": 184} {"train_loss": -31.147375106811523, "global_step": 22375, "epoch": 184} {"train_loss": -30.415302276611328, "global_step": 22376, "epoch": 184} {"train_loss": -29.113061904907227, "global_step": 22377, "epoch": 184} {"train_loss": -27.112333297729492, "global_step": 22378, "epoch": 184} {"train_loss": -24.84929847717285, "global_step": 22379, "epoch": 184} {"train_loss": -13.539949417114258, "global_step": 22380, "epoch": 184} {"train_loss": -13.542922973632812, "global_step": 22381, "epoch": 184} {"train_loss": -30.6167049407959, "global_step": 22382, "epoch": 184} {"train_loss": -21.516206741333008, "global_step": 22383, "epoch": 184} {"train_loss": -29.73186470851425, "global_step": 22384, "epoch": 184, "val_loss": 2616122.25} {"train_loss": -25.85100746154785, "global_step": 22385, "epoch": 185} {"train_loss": -29.802143096923828, "global_step": 22386, "epoch": 185} {"train_loss": -29.475324630737305, "global_step": 22387, "epoch": 185} {"train_loss": -28.09033203125, "global_step": 22388, "epoch": 185} {"train_loss": -29.745630264282227, "global_step": 22389, "epoch": 185} {"train_loss": -29.36004066467285, "global_step": 22390, "epoch": 185} {"train_loss": -29.368656158447266, "global_step": 22391, "epoch": 185} {"train_loss": -28.720905303955078, "global_step": 22392, "epoch": 185} {"train_loss": -29.85346031188965, "global_step": 22393, "epoch": 185} {"train_loss": -30.173725128173828, "global_step": 22394, "epoch": 185} {"train_loss": -29.79388999938965, "global_step": 22395, "epoch": 185} {"train_loss": -29.669843673706055, "global_step": 22396, "epoch": 185} {"train_loss": -29.46137809753418, "global_step": 22397, "epoch": 185} {"train_loss": -29.73493003845215, "global_step": 22398, "epoch": 185} {"train_loss": -29.96503257751465, "global_step": 22399, "epoch": 185} {"train_loss": -30.064111709594727, "global_step": 22400, "epoch": 185} {"train_loss": -30.134119033813477, "global_step": 22401, "epoch": 185} {"train_loss": -30.010419845581055, "global_step": 22402, "epoch": 185} {"train_loss": -30.3065185546875, "global_step": 22403, "epoch": 185} {"train_loss": -30.036489486694336, "global_step": 22404, "epoch": 185} {"train_loss": -30.53081703186035, "global_step": 22405, "epoch": 185} {"train_loss": -30.128799438476562, "global_step": 22406, "epoch": 185} {"train_loss": -30.571069717407227, "global_step": 22407, "epoch": 185} {"train_loss": -30.24188232421875, "global_step": 22408, "epoch": 185} {"train_loss": -30.164091110229492, "global_step": 22409, "epoch": 185} {"train_loss": -29.961088180541992, "global_step": 22410, "epoch": 185} {"train_loss": -30.4628849029541, "global_step": 22411, "epoch": 185} {"train_loss": -29.979297637939453, "global_step": 22412, "epoch": 185} {"train_loss": -30.5021915435791, "global_step": 22413, "epoch": 185} {"train_loss": -30.535419464111328, "global_step": 22414, "epoch": 185} {"train_loss": -30.35141944885254, "global_step": 22415, "epoch": 185} {"train_loss": -30.48895263671875, "global_step": 22416, "epoch": 185} {"train_loss": -30.53119468688965, "global_step": 22417, "epoch": 185} {"train_loss": -29.9162540435791, "global_step": 22418, "epoch": 185} {"train_loss": -30.023181915283203, "global_step": 22419, "epoch": 185} {"train_loss": -29.760221481323242, "global_step": 22420, "epoch": 185} {"train_loss": -30.292699813842773, "global_step": 22421, "epoch": 185} {"train_loss": -30.46539306640625, "global_step": 22422, "epoch": 185} {"train_loss": -29.148162841796875, "global_step": 22423, "epoch": 185} {"train_loss": -30.534656524658203, "global_step": 22424, "epoch": 185} {"train_loss": -29.53265953063965, "global_step": 22425, "epoch": 185} {"train_loss": -29.154111862182617, "global_step": 22426, "epoch": 185} {"train_loss": -27.611989974975586, "global_step": 22427, "epoch": 185} {"train_loss": -27.8604736328125, "global_step": 22428, "epoch": 185} {"train_loss": -26.958988189697266, "global_step": 22429, "epoch": 185} {"train_loss": -24.343551635742188, "global_step": 22430, "epoch": 185} {"train_loss": -19.490259170532227, "global_step": 22431, "epoch": 185} {"train_loss": -24.93072509765625, "global_step": 22432, "epoch": 185} {"train_loss": -27.824100494384766, "global_step": 22433, "epoch": 185} {"train_loss": -24.62712287902832, "global_step": 22434, "epoch": 185} {"train_loss": -29.242572784423828, "global_step": 22435, "epoch": 185} {"train_loss": -25.849292755126953, "global_step": 22436, "epoch": 185} {"train_loss": -28.900060653686523, "global_step": 22437, "epoch": 185} {"train_loss": -27.345285415649414, "global_step": 22438, "epoch": 185} {"train_loss": -27.884626388549805, "global_step": 22439, "epoch": 185} {"train_loss": -29.390533447265625, "global_step": 22440, "epoch": 185} {"train_loss": -27.758214950561523, "global_step": 22441, "epoch": 185} {"train_loss": -29.36488914489746, "global_step": 22442, "epoch": 185} {"train_loss": -27.67060661315918, "global_step": 22443, "epoch": 185} {"train_loss": -29.332595825195312, "global_step": 22444, "epoch": 185} {"train_loss": -28.319538116455078, "global_step": 22445, "epoch": 185} {"train_loss": -29.47223472595215, "global_step": 22446, "epoch": 185} {"train_loss": -28.796018600463867, "global_step": 22447, "epoch": 185} {"train_loss": -29.504989624023438, "global_step": 22448, "epoch": 185} {"train_loss": -28.80555534362793, "global_step": 22449, "epoch": 185} {"train_loss": -29.287158966064453, "global_step": 22450, "epoch": 185} {"train_loss": -28.979150772094727, "global_step": 22451, "epoch": 185} {"train_loss": -29.2542724609375, "global_step": 22452, "epoch": 185} {"train_loss": -29.6953182220459, "global_step": 22453, "epoch": 185} {"train_loss": -29.556699752807617, "global_step": 22454, "epoch": 185} {"train_loss": -29.576309204101562, "global_step": 22455, "epoch": 185} {"train_loss": -30.027029037475586, "global_step": 22456, "epoch": 185} {"train_loss": -29.442733764648438, "global_step": 22457, "epoch": 185} {"train_loss": -30.169666290283203, "global_step": 22458, "epoch": 185} {"train_loss": -29.697874069213867, "global_step": 22459, "epoch": 185} {"train_loss": -29.797658920288086, "global_step": 22460, "epoch": 185} {"train_loss": -29.65287208557129, "global_step": 22461, "epoch": 185} {"train_loss": -30.413122177124023, "global_step": 22462, "epoch": 185} {"train_loss": -29.96347427368164, "global_step": 22463, "epoch": 185} {"train_loss": -29.57979393005371, "global_step": 22464, "epoch": 185} {"train_loss": -29.649545669555664, "global_step": 22465, "epoch": 185} {"train_loss": -29.7894229888916, "global_step": 22466, "epoch": 185} {"train_loss": -30.472370147705078, "global_step": 22467, "epoch": 185} {"train_loss": -30.048786163330078, "global_step": 22468, "epoch": 185} {"train_loss": -30.033939361572266, "global_step": 22469, "epoch": 185} {"train_loss": -29.563634872436523, "global_step": 22470, "epoch": 185} {"train_loss": -29.943374633789062, "global_step": 22471, "epoch": 185} {"train_loss": -30.13734245300293, "global_step": 22472, "epoch": 185} {"train_loss": -29.697956085205078, "global_step": 22473, "epoch": 185} {"train_loss": -30.527063369750977, "global_step": 22474, "epoch": 185} {"train_loss": -29.68865966796875, "global_step": 22475, "epoch": 185} {"train_loss": -29.745248794555664, "global_step": 22476, "epoch": 185} {"train_loss": -30.349973678588867, "global_step": 22477, "epoch": 185} {"train_loss": -30.232152938842773, "global_step": 22478, "epoch": 185} {"train_loss": -29.943750381469727, "global_step": 22479, "epoch": 185} {"train_loss": -30.25882911682129, "global_step": 22480, "epoch": 185} {"train_loss": -29.94168472290039, "global_step": 22481, "epoch": 185} {"train_loss": -30.041425704956055, "global_step": 22482, "epoch": 185} {"train_loss": -30.21710205078125, "global_step": 22483, "epoch": 185} {"train_loss": -30.068944931030273, "global_step": 22484, "epoch": 185} {"train_loss": -29.872406005859375, "global_step": 22485, "epoch": 185} {"train_loss": -29.933568954467773, "global_step": 22486, "epoch": 185} {"train_loss": -30.1813907623291, "global_step": 22487, "epoch": 185} {"train_loss": -30.16391372680664, "global_step": 22488, "epoch": 185} {"train_loss": -30.168638229370117, "global_step": 22489, "epoch": 185} {"train_loss": -29.949325561523438, "global_step": 22490, "epoch": 185} {"train_loss": -29.6156005859375, "global_step": 22491, "epoch": 185} {"train_loss": -30.031997680664062, "global_step": 22492, "epoch": 185} {"train_loss": -29.634662628173828, "global_step": 22493, "epoch": 185} {"train_loss": -30.16115379333496, "global_step": 22494, "epoch": 185} {"train_loss": -29.95599937438965, "global_step": 22495, "epoch": 185} {"train_loss": -30.084400177001953, "global_step": 22496, "epoch": 185} {"train_loss": -30.243839263916016, "global_step": 22497, "epoch": 185} {"train_loss": -30.49859619140625, "global_step": 22498, "epoch": 185} {"train_loss": -30.470733642578125, "global_step": 22499, "epoch": 185} {"train_loss": -30.11878776550293, "global_step": 22500, "epoch": 185} {"train_loss": -30.62810707092285, "global_step": 22501, "epoch": 185} {"train_loss": -30.50189208984375, "global_step": 22502, "epoch": 185} {"train_loss": -30.414199829101562, "global_step": 22503, "epoch": 185} {"train_loss": -30.0784854888916, "global_step": 22504, "epoch": 185} {"train_loss": -29.443999140715796, "global_step": 22505, "epoch": 185, "val_loss": 2707297.0} {"train_loss": -30.8983211517334, "global_step": 22506, "epoch": 186} {"train_loss": -30.655349731445312, "global_step": 22507, "epoch": 186} {"train_loss": -30.625478744506836, "global_step": 22508, "epoch": 186} {"train_loss": -30.387067794799805, "global_step": 22509, "epoch": 186} {"train_loss": -30.19759178161621, "global_step": 22510, "epoch": 186} {"train_loss": -30.435144424438477, "global_step": 22511, "epoch": 186} {"train_loss": -30.723928451538086, "global_step": 22512, "epoch": 186} {"train_loss": -30.659866333007812, "global_step": 22513, "epoch": 186} {"train_loss": -30.063581466674805, "global_step": 22514, "epoch": 186} {"train_loss": -29.822790145874023, "global_step": 22515, "epoch": 186} {"train_loss": -29.98966407775879, "global_step": 22516, "epoch": 186} {"train_loss": -30.576101303100586, "global_step": 22517, "epoch": 186} {"train_loss": -30.759857177734375, "global_step": 22518, "epoch": 186} {"train_loss": -30.698705673217773, "global_step": 22519, "epoch": 186} {"train_loss": -30.791950225830078, "global_step": 22520, "epoch": 186} {"train_loss": -30.86726951599121, "global_step": 22521, "epoch": 186} {"train_loss": -30.795907974243164, "global_step": 22522, "epoch": 186} {"train_loss": -30.736669540405273, "global_step": 22523, "epoch": 186} {"train_loss": -30.5811710357666, "global_step": 22524, "epoch": 186} {"train_loss": -30.83900260925293, "global_step": 22525, "epoch": 186} {"train_loss": -30.794824600219727, "global_step": 22526, "epoch": 186} {"train_loss": -30.338790893554688, "global_step": 22527, "epoch": 186} {"train_loss": -30.744497299194336, "global_step": 22528, "epoch": 186} {"train_loss": -30.192840576171875, "global_step": 22529, "epoch": 186} {"train_loss": -30.307209014892578, "global_step": 22530, "epoch": 186} {"train_loss": -30.542285919189453, "global_step": 22531, "epoch": 186} {"train_loss": -30.558637619018555, "global_step": 22532, "epoch": 186} {"train_loss": -30.84596061706543, "global_step": 22533, "epoch": 186} {"train_loss": -30.27309226989746, "global_step": 22534, "epoch": 186} {"train_loss": -30.325153350830078, "global_step": 22535, "epoch": 186} {"train_loss": -30.971878051757812, "global_step": 22536, "epoch": 186} {"train_loss": -30.562036514282227, "global_step": 22537, "epoch": 186} {"train_loss": -31.274673461914062, "global_step": 22538, "epoch": 186} {"train_loss": -30.6970157623291, "global_step": 22539, "epoch": 186} {"train_loss": -31.09589958190918, "global_step": 22540, "epoch": 186} {"train_loss": -30.433368682861328, "global_step": 22541, "epoch": 186} {"train_loss": -30.764347076416016, "global_step": 22542, "epoch": 186} {"train_loss": -30.8762264251709, "global_step": 22543, "epoch": 186} {"train_loss": -30.582258224487305, "global_step": 22544, "epoch": 186} {"train_loss": -30.547819137573242, "global_step": 22545, "epoch": 186} {"train_loss": -30.68271827697754, "global_step": 22546, "epoch": 186} {"train_loss": -30.46286964416504, "global_step": 22547, "epoch": 186} {"train_loss": -30.812931060791016, "global_step": 22548, "epoch": 186} {"train_loss": -30.869232177734375, "global_step": 22549, "epoch": 186} {"train_loss": -31.26348304748535, "global_step": 22550, "epoch": 186} {"train_loss": -31.03635025024414, "global_step": 22551, "epoch": 186} {"train_loss": -31.03065299987793, "global_step": 22552, "epoch": 186} {"train_loss": -31.019535064697266, "global_step": 22553, "epoch": 186} {"train_loss": -31.31263542175293, "global_step": 22554, "epoch": 186} {"train_loss": -31.204421997070312, "global_step": 22555, "epoch": 186} {"train_loss": -31.184066772460938, "global_step": 22556, "epoch": 186} {"train_loss": -30.68290138244629, "global_step": 22557, "epoch": 186} {"train_loss": -31.090255737304688, "global_step": 22558, "epoch": 186} {"train_loss": -31.364673614501953, "global_step": 22559, "epoch": 186} {"train_loss": -31.141748428344727, "global_step": 22560, "epoch": 186} {"train_loss": -31.447919845581055, "global_step": 22561, "epoch": 186} {"train_loss": -31.40252685546875, "global_step": 22562, "epoch": 186} {"train_loss": -31.31782341003418, "global_step": 22563, "epoch": 186} {"train_loss": -30.999114990234375, "global_step": 22564, "epoch": 186} {"train_loss": -31.40288734436035, "global_step": 22565, "epoch": 186} {"train_loss": -30.889379501342773, "global_step": 22566, "epoch": 186} {"train_loss": -30.998987197875977, "global_step": 22567, "epoch": 186} {"train_loss": -30.880603790283203, "global_step": 22568, "epoch": 186} {"train_loss": -30.899219512939453, "global_step": 22569, "epoch": 186} {"train_loss": -30.723758697509766, "global_step": 22570, "epoch": 186} {"train_loss": -31.090436935424805, "global_step": 22571, "epoch": 186} {"train_loss": -30.3360652923584, "global_step": 22572, "epoch": 186} {"train_loss": -30.813199996948242, "global_step": 22573, "epoch": 186} {"train_loss": -30.736555099487305, "global_step": 22574, "epoch": 186} {"train_loss": -30.202722549438477, "global_step": 22575, "epoch": 186} {"train_loss": -29.182554244995117, "global_step": 22576, "epoch": 186} {"train_loss": -28.09231948852539, "global_step": 22577, "epoch": 186} {"train_loss": -23.605405807495117, "global_step": 22578, "epoch": 186} {"train_loss": -25.325336456298828, "global_step": 22579, "epoch": 186} {"train_loss": -30.4747314453125, "global_step": 22580, "epoch": 186} {"train_loss": -28.251890182495117, "global_step": 22581, "epoch": 186} {"train_loss": -29.497440338134766, "global_step": 22582, "epoch": 186} {"train_loss": -29.04142189025879, "global_step": 22583, "epoch": 186} {"train_loss": -29.079275131225586, "global_step": 22584, "epoch": 186} {"train_loss": -29.56182289123535, "global_step": 22585, "epoch": 186} {"train_loss": -29.796995162963867, "global_step": 22586, "epoch": 186} {"train_loss": -28.562728881835938, "global_step": 22587, "epoch": 186} {"train_loss": -30.523914337158203, "global_step": 22588, "epoch": 186} {"train_loss": -29.12537956237793, "global_step": 22589, "epoch": 186} {"train_loss": -30.235578536987305, "global_step": 22590, "epoch": 186} {"train_loss": -30.052383422851562, "global_step": 22591, "epoch": 186} {"train_loss": -29.999893188476562, "global_step": 22592, "epoch": 186} {"train_loss": -30.294361114501953, "global_step": 22593, "epoch": 186} {"train_loss": -30.254281997680664, "global_step": 22594, "epoch": 186} {"train_loss": -29.794050216674805, "global_step": 22595, "epoch": 186} {"train_loss": -31.070383071899414, "global_step": 22596, "epoch": 186} {"train_loss": -30.596708297729492, "global_step": 22597, "epoch": 186} {"train_loss": -30.776782989501953, "global_step": 22598, "epoch": 186} {"train_loss": -31.120527267456055, "global_step": 22599, "epoch": 186} {"train_loss": -30.453353881835938, "global_step": 22600, "epoch": 186} {"train_loss": -30.500471115112305, "global_step": 22601, "epoch": 186} {"train_loss": -30.47123146057129, "global_step": 22602, "epoch": 186} {"train_loss": -30.277313232421875, "global_step": 22603, "epoch": 186} {"train_loss": -29.959741592407227, "global_step": 22604, "epoch": 186} {"train_loss": -29.435068130493164, "global_step": 22605, "epoch": 186} {"train_loss": -29.175485610961914, "global_step": 22606, "epoch": 186} {"train_loss": -28.92864418029785, "global_step": 22607, "epoch": 186} {"train_loss": -28.886045455932617, "global_step": 22608, "epoch": 186} {"train_loss": -29.395444869995117, "global_step": 22609, "epoch": 186} {"train_loss": -30.56330680847168, "global_step": 22610, "epoch": 186} {"train_loss": -30.701520919799805, "global_step": 22611, "epoch": 186} {"train_loss": -29.492450714111328, "global_step": 22612, "epoch": 186} {"train_loss": -31.26079750061035, "global_step": 22613, "epoch": 186} {"train_loss": -30.699060440063477, "global_step": 22614, "epoch": 186} {"train_loss": -30.31366539001465, "global_step": 22615, "epoch": 186} {"train_loss": -30.379179000854492, "global_step": 22616, "epoch": 186} {"train_loss": -30.768207550048828, "global_step": 22617, "epoch": 186} {"train_loss": -30.88443374633789, "global_step": 22618, "epoch": 186} {"train_loss": -30.330915451049805, "global_step": 22619, "epoch": 186} {"train_loss": -30.390338897705078, "global_step": 22620, "epoch": 186} {"train_loss": -30.083099365234375, "global_step": 22621, "epoch": 186} {"train_loss": -29.752023696899414, "global_step": 22622, "epoch": 186} {"train_loss": -30.507190704345703, "global_step": 22623, "epoch": 186} {"train_loss": -30.420734405517578, "global_step": 22624, "epoch": 186} {"train_loss": -30.149076461791992, "global_step": 22625, "epoch": 186} {"train_loss": -30.343504614081265, "global_step": 22626, "epoch": 186, "val_loss": 2474077.25} {"train_loss": -30.686370849609375, "global_step": 22627, "epoch": 187} {"train_loss": -30.676136016845703, "global_step": 22628, "epoch": 187} {"train_loss": -30.56316566467285, "global_step": 22629, "epoch": 187} {"train_loss": -30.96778678894043, "global_step": 22630, "epoch": 187} {"train_loss": -30.67856216430664, "global_step": 22631, "epoch": 187} {"train_loss": -30.88849449157715, "global_step": 22632, "epoch": 187} {"train_loss": -30.632741928100586, "global_step": 22633, "epoch": 187} {"train_loss": -30.527414321899414, "global_step": 22634, "epoch": 187} {"train_loss": -30.60381507873535, "global_step": 22635, "epoch": 187} {"train_loss": -30.87091064453125, "global_step": 22636, "epoch": 187} {"train_loss": -31.03794288635254, "global_step": 22637, "epoch": 187} {"train_loss": -31.255521774291992, "global_step": 22638, "epoch": 187} {"train_loss": -31.252370834350586, "global_step": 22639, "epoch": 187} {"train_loss": -30.92694091796875, "global_step": 22640, "epoch": 187} {"train_loss": -31.10640525817871, "global_step": 22641, "epoch": 187} {"train_loss": -30.710620880126953, "global_step": 22642, "epoch": 187} {"train_loss": -30.274091720581055, "global_step": 22643, "epoch": 187} {"train_loss": -30.266788482666016, "global_step": 22644, "epoch": 187} {"train_loss": -29.40691566467285, "global_step": 22645, "epoch": 187} {"train_loss": -24.11359977722168, "global_step": 22646, "epoch": 187} {"train_loss": -10.788561820983887, "global_step": 22647, "epoch": 187} {"train_loss": -15.73492431640625, "global_step": 22648, "epoch": 187} {"train_loss": -30.00821876525879, "global_step": 22649, "epoch": 187} {"train_loss": -22.046844482421875, "global_step": 22650, "epoch": 187} {"train_loss": -25.872400283813477, "global_step": 22651, "epoch": 187} {"train_loss": -27.088560104370117, "global_step": 22652, "epoch": 187} {"train_loss": -29.321523666381836, "global_step": 22653, "epoch": 187} {"train_loss": -27.47629165649414, "global_step": 22654, "epoch": 187} {"train_loss": -29.49320411682129, "global_step": 22655, "epoch": 187} {"train_loss": -29.475421905517578, "global_step": 22656, "epoch": 187} {"train_loss": -28.790002822875977, "global_step": 22657, "epoch": 187} {"train_loss": -28.951862335205078, "global_step": 22658, "epoch": 187} {"train_loss": -30.322614669799805, "global_step": 22659, "epoch": 187} {"train_loss": -29.789682388305664, "global_step": 22660, "epoch": 187} {"train_loss": -29.364166259765625, "global_step": 22661, "epoch": 187} {"train_loss": -29.814054489135742, "global_step": 22662, "epoch": 187} {"train_loss": -30.15694236755371, "global_step": 22663, "epoch": 187} {"train_loss": -30.361663818359375, "global_step": 22664, "epoch": 187} {"train_loss": -29.77744483947754, "global_step": 22665, "epoch": 187} {"train_loss": -29.85211753845215, "global_step": 22666, "epoch": 187} {"train_loss": -29.973424911499023, "global_step": 22667, "epoch": 187} {"train_loss": -30.363101959228516, "global_step": 22668, "epoch": 187} {"train_loss": -30.03732681274414, "global_step": 22669, "epoch": 187} {"train_loss": -29.896259307861328, "global_step": 22670, "epoch": 187} {"train_loss": -30.235462188720703, "global_step": 22671, "epoch": 187} {"train_loss": -30.51031494140625, "global_step": 22672, "epoch": 187} {"train_loss": -30.322345733642578, "global_step": 22673, "epoch": 187} {"train_loss": -30.21640396118164, "global_step": 22674, "epoch": 187} {"train_loss": -30.230112075805664, "global_step": 22675, "epoch": 187} {"train_loss": -30.507923126220703, "global_step": 22676, "epoch": 187} {"train_loss": -30.37196159362793, "global_step": 22677, "epoch": 187} {"train_loss": -30.407196044921875, "global_step": 22678, "epoch": 187} {"train_loss": -30.456357955932617, "global_step": 22679, "epoch": 187} {"train_loss": -30.672592163085938, "global_step": 22680, "epoch": 187} {"train_loss": -30.892969131469727, "global_step": 22681, "epoch": 187} {"train_loss": -30.802900314331055, "global_step": 22682, "epoch": 187} {"train_loss": -30.867755889892578, "global_step": 22683, "epoch": 187} {"train_loss": -30.247228622436523, "global_step": 22684, "epoch": 187} {"train_loss": -29.07958984375, "global_step": 22685, "epoch": 187} {"train_loss": -27.587675094604492, "global_step": 22686, "epoch": 187} {"train_loss": -23.500484466552734, "global_step": 22687, "epoch": 187} {"train_loss": -28.3808650970459, "global_step": 22688, "epoch": 187} {"train_loss": -26.921777725219727, "global_step": 22689, "epoch": 187} {"train_loss": -29.45380210876465, "global_step": 22690, "epoch": 187} {"train_loss": -24.69707679748535, "global_step": 22691, "epoch": 187} {"train_loss": -30.303796768188477, "global_step": 22692, "epoch": 187} {"train_loss": -29.16558265686035, "global_step": 22693, "epoch": 187} {"train_loss": -27.826557159423828, "global_step": 22694, "epoch": 187} {"train_loss": -28.108295440673828, "global_step": 22695, "epoch": 187} {"train_loss": -28.249942779541016, "global_step": 22696, "epoch": 187} {"train_loss": -28.179574966430664, "global_step": 22697, "epoch": 187} {"train_loss": -25.66455078125, "global_step": 22698, "epoch": 187} {"train_loss": -24.500158309936523, "global_step": 22699, "epoch": 187} {"train_loss": -26.52681541442871, "global_step": 22700, "epoch": 187} {"train_loss": -28.5858097076416, "global_step": 22701, "epoch": 187} {"train_loss": -29.40205955505371, "global_step": 22702, "epoch": 187} {"train_loss": -28.76239013671875, "global_step": 22703, "epoch": 187} {"train_loss": -29.4115047454834, "global_step": 22704, "epoch": 187} {"train_loss": -29.852087020874023, "global_step": 22705, "epoch": 187} {"train_loss": -29.803464889526367, "global_step": 22706, "epoch": 187} {"train_loss": -29.62641716003418, "global_step": 22707, "epoch": 187} {"train_loss": -29.62002944946289, "global_step": 22708, "epoch": 187} {"train_loss": -29.65728187561035, "global_step": 22709, "epoch": 187} {"train_loss": -29.7818603515625, "global_step": 22710, "epoch": 187} {"train_loss": -29.8060359954834, "global_step": 22711, "epoch": 187} {"train_loss": -29.538135528564453, "global_step": 22712, "epoch": 187} {"train_loss": -29.826765060424805, "global_step": 22713, "epoch": 187} {"train_loss": -29.508451461791992, "global_step": 22714, "epoch": 187} {"train_loss": -30.12603187561035, "global_step": 22715, "epoch": 187} {"train_loss": -29.82879066467285, "global_step": 22716, "epoch": 187} {"train_loss": -29.719165802001953, "global_step": 22717, "epoch": 187} {"train_loss": -29.92302894592285, "global_step": 22718, "epoch": 187} {"train_loss": -30.232131958007812, "global_step": 22719, "epoch": 187} {"train_loss": -30.099273681640625, "global_step": 22720, "epoch": 187} {"train_loss": -29.979516983032227, "global_step": 22721, "epoch": 187} {"train_loss": -30.252832412719727, "global_step": 22722, "epoch": 187} {"train_loss": -30.519351959228516, "global_step": 22723, "epoch": 187} {"train_loss": -30.108564376831055, "global_step": 22724, "epoch": 187} {"train_loss": -30.36602210998535, "global_step": 22725, "epoch": 187} {"train_loss": -30.144697189331055, "global_step": 22726, "epoch": 187} {"train_loss": -30.000207901000977, "global_step": 22727, "epoch": 187} {"train_loss": -30.015655517578125, "global_step": 22728, "epoch": 187} {"train_loss": -30.085468292236328, "global_step": 22729, "epoch": 187} {"train_loss": -30.3018798828125, "global_step": 22730, "epoch": 187} {"train_loss": -30.707799911499023, "global_step": 22731, "epoch": 187} {"train_loss": -30.42755126953125, "global_step": 22732, "epoch": 187} {"train_loss": -29.856494903564453, "global_step": 22733, "epoch": 187} {"train_loss": -30.085525512695312, "global_step": 22734, "epoch": 187} {"train_loss": -30.037641525268555, "global_step": 22735, "epoch": 187} {"train_loss": -30.45708656311035, "global_step": 22736, "epoch": 187} {"train_loss": -30.366621017456055, "global_step": 22737, "epoch": 187} {"train_loss": -30.042631149291992, "global_step": 22738, "epoch": 187} {"train_loss": -30.141372680664062, "global_step": 22739, "epoch": 187} {"train_loss": -30.381092071533203, "global_step": 22740, "epoch": 187} {"train_loss": -29.70221519470215, "global_step": 22741, "epoch": 187} {"train_loss": -28.600696563720703, "global_step": 22742, "epoch": 187} {"train_loss": -26.10529136657715, "global_step": 22743, "epoch": 187} {"train_loss": -23.705549240112305, "global_step": 22744, "epoch": 187} {"train_loss": -25.670257568359375, "global_step": 22745, "epoch": 187} {"train_loss": -28.891386032104492, "global_step": 22746, "epoch": 187} {"train_loss": -29.142781825105022, "global_step": 22747, "epoch": 187, "val_loss": 2766018.75} {"train_loss": -27.694644927978516, "global_step": 22748, "epoch": 188} {"train_loss": -30.05804443359375, "global_step": 22749, "epoch": 188} {"train_loss": -28.596054077148438, "global_step": 22750, "epoch": 188} {"train_loss": -29.427814483642578, "global_step": 22751, "epoch": 188} {"train_loss": -28.66474723815918, "global_step": 22752, "epoch": 188} {"train_loss": -29.810169219970703, "global_step": 22753, "epoch": 188} {"train_loss": -29.422077178955078, "global_step": 22754, "epoch": 188} {"train_loss": -28.58621597290039, "global_step": 22755, "epoch": 188} {"train_loss": -29.018781661987305, "global_step": 22756, "epoch": 188} {"train_loss": -29.584463119506836, "global_step": 22757, "epoch": 188} {"train_loss": -29.363245010375977, "global_step": 22758, "epoch": 188} {"train_loss": -30.012073516845703, "global_step": 22759, "epoch": 188} {"train_loss": -29.363882064819336, "global_step": 22760, "epoch": 188} {"train_loss": -29.66172218322754, "global_step": 22761, "epoch": 188} {"train_loss": -29.8872013092041, "global_step": 22762, "epoch": 188} {"train_loss": -29.791900634765625, "global_step": 22763, "epoch": 188} {"train_loss": -29.6135311126709, "global_step": 22764, "epoch": 188} {"train_loss": -29.698623657226562, "global_step": 22765, "epoch": 188} {"train_loss": -29.763879776000977, "global_step": 22766, "epoch": 188} {"train_loss": -29.667938232421875, "global_step": 22767, "epoch": 188} {"train_loss": -29.581872940063477, "global_step": 22768, "epoch": 188} {"train_loss": -29.881567001342773, "global_step": 22769, "epoch": 188} {"train_loss": -29.920135498046875, "global_step": 22770, "epoch": 188} {"train_loss": -29.512744903564453, "global_step": 22771, "epoch": 188} {"train_loss": -30.054656982421875, "global_step": 22772, "epoch": 188} {"train_loss": -30.232107162475586, "global_step": 22773, "epoch": 188} {"train_loss": -29.853168487548828, "global_step": 22774, "epoch": 188} {"train_loss": -29.654541015625, "global_step": 22775, "epoch": 188} {"train_loss": -30.180356979370117, "global_step": 22776, "epoch": 188} {"train_loss": -29.34380531311035, "global_step": 22777, "epoch": 188} {"train_loss": -30.009607315063477, "global_step": 22778, "epoch": 188} {"train_loss": -30.093524932861328, "global_step": 22779, "epoch": 188} {"train_loss": -28.397003173828125, "global_step": 22780, "epoch": 188} {"train_loss": -29.822351455688477, "global_step": 22781, "epoch": 188} {"train_loss": -29.5122127532959, "global_step": 22782, "epoch": 188} {"train_loss": -29.591552734375, "global_step": 22783, "epoch": 188} {"train_loss": -29.955921173095703, "global_step": 22784, "epoch": 188} {"train_loss": -29.585683822631836, "global_step": 22785, "epoch": 188} {"train_loss": -29.121103286743164, "global_step": 22786, "epoch": 188} {"train_loss": -30.09254264831543, "global_step": 22787, "epoch": 188} {"train_loss": -30.402847290039062, "global_step": 22788, "epoch": 188} {"train_loss": -30.43524742126465, "global_step": 22789, "epoch": 188} {"train_loss": -29.80263328552246, "global_step": 22790, "epoch": 188} {"train_loss": -30.061864852905273, "global_step": 22791, "epoch": 188} {"train_loss": -30.374713897705078, "global_step": 22792, "epoch": 188} {"train_loss": -30.862409591674805, "global_step": 22793, "epoch": 188} {"train_loss": -30.300201416015625, "global_step": 22794, "epoch": 188} {"train_loss": -30.575529098510742, "global_step": 22795, "epoch": 188} {"train_loss": -30.36272621154785, "global_step": 22796, "epoch": 188} {"train_loss": -30.401386260986328, "global_step": 22797, "epoch": 188} {"train_loss": -30.407424926757812, "global_step": 22798, "epoch": 188} {"train_loss": -29.982513427734375, "global_step": 22799, "epoch": 188} {"train_loss": -30.16817283630371, "global_step": 22800, "epoch": 188} {"train_loss": -30.347936630249023, "global_step": 22801, "epoch": 188} {"train_loss": -30.276721954345703, "global_step": 22802, "epoch": 188} {"train_loss": -30.803449630737305, "global_step": 22803, "epoch": 188} {"train_loss": -29.130285263061523, "global_step": 22804, "epoch": 188} {"train_loss": -29.487060546875, "global_step": 22805, "epoch": 188} {"train_loss": -30.06721305847168, "global_step": 22806, "epoch": 188} {"train_loss": -30.914030075073242, "global_step": 22807, "epoch": 188} {"train_loss": -30.358081817626953, "global_step": 22808, "epoch": 188} {"train_loss": -30.69753074645996, "global_step": 22809, "epoch": 188} {"train_loss": -30.4261531829834, "global_step": 22810, "epoch": 188} {"train_loss": -30.516204833984375, "global_step": 22811, "epoch": 188} {"train_loss": -30.70810317993164, "global_step": 22812, "epoch": 188} {"train_loss": -30.608251571655273, "global_step": 22813, "epoch": 188} {"train_loss": -30.267446517944336, "global_step": 22814, "epoch": 188} {"train_loss": -31.04292106628418, "global_step": 22815, "epoch": 188} {"train_loss": -30.46576499938965, "global_step": 22816, "epoch": 188} {"train_loss": -30.632110595703125, "global_step": 22817, "epoch": 188} {"train_loss": -30.445730209350586, "global_step": 22818, "epoch": 188} {"train_loss": -30.7157039642334, "global_step": 22819, "epoch": 188} {"train_loss": -30.48785972595215, "global_step": 22820, "epoch": 188} {"train_loss": -30.684064865112305, "global_step": 22821, "epoch": 188} {"train_loss": -30.413928985595703, "global_step": 22822, "epoch": 188} {"train_loss": -29.30225944519043, "global_step": 22823, "epoch": 188} {"train_loss": -30.24309730529785, "global_step": 22824, "epoch": 188} {"train_loss": -30.342941284179688, "global_step": 22825, "epoch": 188} {"train_loss": -30.558942794799805, "global_step": 22826, "epoch": 188} {"train_loss": -30.992328643798828, "global_step": 22827, "epoch": 188} {"train_loss": -30.882404327392578, "global_step": 22828, "epoch": 188} {"train_loss": -30.64287757873535, "global_step": 22829, "epoch": 188} {"train_loss": -30.353336334228516, "global_step": 22830, "epoch": 188} {"train_loss": -30.595794677734375, "global_step": 22831, "epoch": 188} {"train_loss": -30.638580322265625, "global_step": 22832, "epoch": 188} {"train_loss": -30.76349449157715, "global_step": 22833, "epoch": 188} {"train_loss": -30.399457931518555, "global_step": 22834, "epoch": 188} {"train_loss": -30.83969497680664, "global_step": 22835, "epoch": 188} {"train_loss": -30.41763687133789, "global_step": 22836, "epoch": 188} {"train_loss": -30.3967227935791, "global_step": 22837, "epoch": 188} {"train_loss": -30.5394229888916, "global_step": 22838, "epoch": 188} {"train_loss": -29.86695671081543, "global_step": 22839, "epoch": 188} {"train_loss": -29.877634048461914, "global_step": 22840, "epoch": 188} {"train_loss": -29.15046501159668, "global_step": 22841, "epoch": 188} {"train_loss": -30.657712936401367, "global_step": 22842, "epoch": 188} {"train_loss": -30.464746475219727, "global_step": 22843, "epoch": 188} {"train_loss": -30.40775489807129, "global_step": 22844, "epoch": 188} {"train_loss": -28.560443878173828, "global_step": 22845, "epoch": 188} {"train_loss": -29.568878173828125, "global_step": 22846, "epoch": 188} {"train_loss": -30.7431583404541, "global_step": 22847, "epoch": 188} {"train_loss": -30.561431884765625, "global_step": 22848, "epoch": 188} {"train_loss": -29.975732803344727, "global_step": 22849, "epoch": 188} {"train_loss": -30.978424072265625, "global_step": 22850, "epoch": 188} {"train_loss": -30.60466957092285, "global_step": 22851, "epoch": 188} {"train_loss": -30.2656307220459, "global_step": 22852, "epoch": 188} {"train_loss": -30.52132225036621, "global_step": 22853, "epoch": 188} {"train_loss": -30.7460880279541, "global_step": 22854, "epoch": 188} {"train_loss": -30.17020606994629, "global_step": 22855, "epoch": 188} {"train_loss": -30.612516403198242, "global_step": 22856, "epoch": 188} {"train_loss": -30.9936466217041, "global_step": 22857, "epoch": 188} {"train_loss": -30.67582130432129, "global_step": 22858, "epoch": 188} {"train_loss": -30.666013717651367, "global_step": 22859, "epoch": 188} {"train_loss": -31.304468154907227, "global_step": 22860, "epoch": 188} {"train_loss": -30.8551082611084, "global_step": 22861, "epoch": 188} {"train_loss": -31.11990737915039, "global_step": 22862, "epoch": 188} {"train_loss": -31.173948287963867, "global_step": 22863, "epoch": 188} {"train_loss": -31.076080322265625, "global_step": 22864, "epoch": 188} {"train_loss": -30.634992599487305, "global_step": 22865, "epoch": 188} {"train_loss": -29.57181167602539, "global_step": 22866, "epoch": 188} {"train_loss": -30.457355499267578, "global_step": 22867, "epoch": 188} {"train_loss": -30.134391595509427, "global_step": 22868, "epoch": 188, "val_loss": 2560725.0} {"train_loss": -30.522632598876953, "global_step": 22869, "epoch": 189} {"train_loss": -30.0397891998291, "global_step": 22870, "epoch": 189} {"train_loss": -30.632389068603516, "global_step": 22871, "epoch": 189} {"train_loss": -30.478967666625977, "global_step": 22872, "epoch": 189} {"train_loss": -31.330591201782227, "global_step": 22873, "epoch": 189} {"train_loss": -30.985315322875977, "global_step": 22874, "epoch": 189} {"train_loss": -30.004369735717773, "global_step": 22875, "epoch": 189} {"train_loss": -30.6569766998291, "global_step": 22876, "epoch": 189} {"train_loss": -31.47308921813965, "global_step": 22877, "epoch": 189} {"train_loss": -31.14483642578125, "global_step": 22878, "epoch": 189} {"train_loss": -30.66338539123535, "global_step": 22879, "epoch": 189} {"train_loss": -30.98097038269043, "global_step": 22880, "epoch": 189} {"train_loss": -31.178741455078125, "global_step": 22881, "epoch": 189} {"train_loss": -29.634626388549805, "global_step": 22882, "epoch": 189} {"train_loss": -30.716440200805664, "global_step": 22883, "epoch": 189} {"train_loss": -30.526691436767578, "global_step": 22884, "epoch": 189} {"train_loss": -29.291234970092773, "global_step": 22885, "epoch": 189} {"train_loss": -30.91693115234375, "global_step": 22886, "epoch": 189} {"train_loss": -30.182809829711914, "global_step": 22887, "epoch": 189} {"train_loss": -31.21661376953125, "global_step": 22888, "epoch": 189} {"train_loss": -30.089609146118164, "global_step": 22889, "epoch": 189} {"train_loss": -30.261388778686523, "global_step": 22890, "epoch": 189} {"train_loss": -30.528257369995117, "global_step": 22891, "epoch": 189} {"train_loss": -30.3232421875, "global_step": 22892, "epoch": 189} {"train_loss": -30.599035263061523, "global_step": 22893, "epoch": 189} {"train_loss": -30.38193702697754, "global_step": 22894, "epoch": 189} {"train_loss": -31.111083984375, "global_step": 22895, "epoch": 189} {"train_loss": -30.19953727722168, "global_step": 22896, "epoch": 189} {"train_loss": -30.90594482421875, "global_step": 22897, "epoch": 189} {"train_loss": -30.328519821166992, "global_step": 22898, "epoch": 189} {"train_loss": -30.948598861694336, "global_step": 22899, "epoch": 189} {"train_loss": -30.341135025024414, "global_step": 22900, "epoch": 189} {"train_loss": -30.71608543395996, "global_step": 22901, "epoch": 189} {"train_loss": -31.056537628173828, "global_step": 22902, "epoch": 189} {"train_loss": -31.110157012939453, "global_step": 22903, "epoch": 189} {"train_loss": -30.470701217651367, "global_step": 22904, "epoch": 189} {"train_loss": -30.794153213500977, "global_step": 22905, "epoch": 189} {"train_loss": -30.315631866455078, "global_step": 22906, "epoch": 189} {"train_loss": -30.20255470275879, "global_step": 22907, "epoch": 189} {"train_loss": -28.938879013061523, "global_step": 22908, "epoch": 189} {"train_loss": -27.42354393005371, "global_step": 22909, "epoch": 189} {"train_loss": -23.1597900390625, "global_step": 22910, "epoch": 189} {"train_loss": -24.48766326904297, "global_step": 22911, "epoch": 189} {"train_loss": -28.23406982421875, "global_step": 22912, "epoch": 189} {"train_loss": -30.55387306213379, "global_step": 22913, "epoch": 189} {"train_loss": -28.268415451049805, "global_step": 22914, "epoch": 189} {"train_loss": -30.004953384399414, "global_step": 22915, "epoch": 189} {"train_loss": -29.317243576049805, "global_step": 22916, "epoch": 189} {"train_loss": -29.892927169799805, "global_step": 22917, "epoch": 189} {"train_loss": -29.231916427612305, "global_step": 22918, "epoch": 189} {"train_loss": -30.49517822265625, "global_step": 22919, "epoch": 189} {"train_loss": -29.503875732421875, "global_step": 22920, "epoch": 189} {"train_loss": -30.466100692749023, "global_step": 22921, "epoch": 189} {"train_loss": -30.157257080078125, "global_step": 22922, "epoch": 189} {"train_loss": -29.44076919555664, "global_step": 22923, "epoch": 189} {"train_loss": -30.410367965698242, "global_step": 22924, "epoch": 189} {"train_loss": -30.355072021484375, "global_step": 22925, "epoch": 189} {"train_loss": -30.626550674438477, "global_step": 22926, "epoch": 189} {"train_loss": -30.523569107055664, "global_step": 22927, "epoch": 189} {"train_loss": -30.767541885375977, "global_step": 22928, "epoch": 189} {"train_loss": -30.229955673217773, "global_step": 22929, "epoch": 189} {"train_loss": -31.129663467407227, "global_step": 22930, "epoch": 189} {"train_loss": -30.37017822265625, "global_step": 22931, "epoch": 189} {"train_loss": -30.2386474609375, "global_step": 22932, "epoch": 189} {"train_loss": -29.951400756835938, "global_step": 22933, "epoch": 189} {"train_loss": -30.174457550048828, "global_step": 22934, "epoch": 189} {"train_loss": -30.634069442749023, "global_step": 22935, "epoch": 189} {"train_loss": -30.904123306274414, "global_step": 22936, "epoch": 189} {"train_loss": -30.86765480041504, "global_step": 22937, "epoch": 189} {"train_loss": -30.79471206665039, "global_step": 22938, "epoch": 189} {"train_loss": -30.98676109313965, "global_step": 22939, "epoch": 189} {"train_loss": -31.09490966796875, "global_step": 22940, "epoch": 189} {"train_loss": -31.2442569732666, "global_step": 22941, "epoch": 189} {"train_loss": -31.032550811767578, "global_step": 22942, "epoch": 189} {"train_loss": -31.077417373657227, "global_step": 22943, "epoch": 189} {"train_loss": -31.05252456665039, "global_step": 22944, "epoch": 189} {"train_loss": -30.83977699279785, "global_step": 22945, "epoch": 189} {"train_loss": -31.379621505737305, "global_step": 22946, "epoch": 189} {"train_loss": -30.775390625, "global_step": 22947, "epoch": 189} {"train_loss": -30.9836483001709, "global_step": 22948, "epoch": 189} {"train_loss": -30.748075485229492, "global_step": 22949, "epoch": 189} {"train_loss": -30.423145294189453, "global_step": 22950, "epoch": 189} {"train_loss": -29.829221725463867, "global_step": 22951, "epoch": 189} {"train_loss": -29.27943992614746, "global_step": 22952, "epoch": 189} {"train_loss": -29.592126846313477, "global_step": 22953, "epoch": 189} {"train_loss": -29.741113662719727, "global_step": 22954, "epoch": 189} {"train_loss": -30.486215591430664, "global_step": 22955, "epoch": 189} {"train_loss": -30.557775497436523, "global_step": 22956, "epoch": 189} {"train_loss": -31.07761001586914, "global_step": 22957, "epoch": 189} {"train_loss": -30.50126075744629, "global_step": 22958, "epoch": 189} {"train_loss": -30.607873916625977, "global_step": 22959, "epoch": 189} {"train_loss": -29.9910945892334, "global_step": 22960, "epoch": 189} {"train_loss": -30.93025779724121, "global_step": 22961, "epoch": 189} {"train_loss": -30.668577194213867, "global_step": 22962, "epoch": 189} {"train_loss": -30.166828155517578, "global_step": 22963, "epoch": 189} {"train_loss": -29.852842330932617, "global_step": 22964, "epoch": 189} {"train_loss": -30.562185287475586, "global_step": 22965, "epoch": 189} {"train_loss": -30.46182632446289, "global_step": 22966, "epoch": 189} {"train_loss": -29.88934898376465, "global_step": 22967, "epoch": 189} {"train_loss": -28.496320724487305, "global_step": 22968, "epoch": 189} {"train_loss": -28.930456161499023, "global_step": 22969, "epoch": 189} {"train_loss": -29.077991485595703, "global_step": 22970, "epoch": 189} {"train_loss": -29.87481117248535, "global_step": 22971, "epoch": 189} {"train_loss": -30.9427547454834, "global_step": 22972, "epoch": 189} {"train_loss": -29.7127628326416, "global_step": 22973, "epoch": 189} {"train_loss": -30.26311683654785, "global_step": 22974, "epoch": 189} {"train_loss": -29.90803337097168, "global_step": 22975, "epoch": 189} {"train_loss": -30.64954948425293, "global_step": 22976, "epoch": 189} {"train_loss": -30.156042098999023, "global_step": 22977, "epoch": 189} {"train_loss": -30.734350204467773, "global_step": 22978, "epoch": 189} {"train_loss": -30.375822067260742, "global_step": 22979, "epoch": 189} {"train_loss": -30.670440673828125, "global_step": 22980, "epoch": 189} {"train_loss": -30.604028701782227, "global_step": 22981, "epoch": 189} {"train_loss": -31.136646270751953, "global_step": 22982, "epoch": 189} {"train_loss": -30.955554962158203, "global_step": 22983, "epoch": 189} {"train_loss": -30.656829833984375, "global_step": 22984, "epoch": 189} {"train_loss": -31.284011840820312, "global_step": 22985, "epoch": 189} {"train_loss": -30.62790870666504, "global_step": 22986, "epoch": 189} {"train_loss": -30.90557289123535, "global_step": 22987, "epoch": 189} {"train_loss": -29.98367691040039, "global_step": 22988, "epoch": 189} {"train_loss": -30.26883520961793, "global_step": 22989, "epoch": 189, "val_loss": 2666819.0} {"train_loss": -30.67412757873535, "global_step": 22990, "epoch": 190} {"train_loss": -30.58062744140625, "global_step": 22991, "epoch": 190} {"train_loss": -30.446557998657227, "global_step": 22992, "epoch": 190} {"train_loss": -29.409048080444336, "global_step": 22993, "epoch": 190} {"train_loss": -29.899219512939453, "global_step": 22994, "epoch": 190} {"train_loss": -30.5855655670166, "global_step": 22995, "epoch": 190} {"train_loss": -30.52715492248535, "global_step": 22996, "epoch": 190} {"train_loss": -29.49909782409668, "global_step": 22997, "epoch": 190} {"train_loss": -30.5006160736084, "global_step": 22998, "epoch": 190} {"train_loss": -30.664871215820312, "global_step": 22999, "epoch": 190} {"train_loss": -30.28515625, "global_step": 23000, "epoch": 190} {"train_loss": -30.233997344970703, "global_step": 23001, "epoch": 190} {"train_loss": -30.078510284423828, "global_step": 23002, "epoch": 190} {"train_loss": -30.427114486694336, "global_step": 23003, "epoch": 190} {"train_loss": -30.431842803955078, "global_step": 23004, "epoch": 190} {"train_loss": -30.735570907592773, "global_step": 23005, "epoch": 190} {"train_loss": -29.56023597717285, "global_step": 23006, "epoch": 190} {"train_loss": -29.831708908081055, "global_step": 23007, "epoch": 190} {"train_loss": -29.822803497314453, "global_step": 23008, "epoch": 190} {"train_loss": -30.63852310180664, "global_step": 23009, "epoch": 190} {"train_loss": -30.378461837768555, "global_step": 23010, "epoch": 190} {"train_loss": -30.7841854095459, "global_step": 23011, "epoch": 190} {"train_loss": -30.469924926757812, "global_step": 23012, "epoch": 190} {"train_loss": -30.76947593688965, "global_step": 23013, "epoch": 190} {"train_loss": -30.64267349243164, "global_step": 23014, "epoch": 190} {"train_loss": -31.000402450561523, "global_step": 23015, "epoch": 190} {"train_loss": -31.223133087158203, "global_step": 23016, "epoch": 190} {"train_loss": -31.119665145874023, "global_step": 23017, "epoch": 190} {"train_loss": -31.324756622314453, "global_step": 23018, "epoch": 190} {"train_loss": -31.145715713500977, "global_step": 23019, "epoch": 190} {"train_loss": -31.228961944580078, "global_step": 23020, "epoch": 190} {"train_loss": -31.13832664489746, "global_step": 23021, "epoch": 190} {"train_loss": -31.44944190979004, "global_step": 23022, "epoch": 190} {"train_loss": -30.631113052368164, "global_step": 23023, "epoch": 190} {"train_loss": -29.655736923217773, "global_step": 23024, "epoch": 190} {"train_loss": -28.244333267211914, "global_step": 23025, "epoch": 190} {"train_loss": -28.574146270751953, "global_step": 23026, "epoch": 190} {"train_loss": -30.886783599853516, "global_step": 23027, "epoch": 190} {"train_loss": -31.228361129760742, "global_step": 23028, "epoch": 190} {"train_loss": -30.110065460205078, "global_step": 23029, "epoch": 190} {"train_loss": -29.729612350463867, "global_step": 23030, "epoch": 190} {"train_loss": -31.20647621154785, "global_step": 23031, "epoch": 190} {"train_loss": -31.426847457885742, "global_step": 23032, "epoch": 190} {"train_loss": -30.841527938842773, "global_step": 23033, "epoch": 190} {"train_loss": -31.46453285217285, "global_step": 23034, "epoch": 190} {"train_loss": -31.35251808166504, "global_step": 23035, "epoch": 190} {"train_loss": -30.824201583862305, "global_step": 23036, "epoch": 190} {"train_loss": -31.60304069519043, "global_step": 23037, "epoch": 190} {"train_loss": -31.543628692626953, "global_step": 23038, "epoch": 190} {"train_loss": -31.531875610351562, "global_step": 23039, "epoch": 190} {"train_loss": -31.6993350982666, "global_step": 23040, "epoch": 190} {"train_loss": -31.4881591796875, "global_step": 23041, "epoch": 190} {"train_loss": -31.4796142578125, "global_step": 23042, "epoch": 190} {"train_loss": -31.492462158203125, "global_step": 23043, "epoch": 190} {"train_loss": -31.70403480529785, "global_step": 23044, "epoch": 190} {"train_loss": -31.47181510925293, "global_step": 23045, "epoch": 190} {"train_loss": -31.683263778686523, "global_step": 23046, "epoch": 190} {"train_loss": -31.286962509155273, "global_step": 23047, "epoch": 190} {"train_loss": -31.624181747436523, "global_step": 23048, "epoch": 190} {"train_loss": -31.126907348632812, "global_step": 23049, "epoch": 190} {"train_loss": -30.900060653686523, "global_step": 23050, "epoch": 190} {"train_loss": -29.11878776550293, "global_step": 23051, "epoch": 190} {"train_loss": -27.235504150390625, "global_step": 23052, "epoch": 190} {"train_loss": -24.709095001220703, "global_step": 23053, "epoch": 190} {"train_loss": -20.732946395874023, "global_step": 23054, "epoch": 190} {"train_loss": -23.681516647338867, "global_step": 23055, "epoch": 190} {"train_loss": -31.12592124938965, "global_step": 23056, "epoch": 190} {"train_loss": -27.41204261779785, "global_step": 23057, "epoch": 190} {"train_loss": -31.020517349243164, "global_step": 23058, "epoch": 190} {"train_loss": -28.75933837890625, "global_step": 23059, "epoch": 190} {"train_loss": -30.185577392578125, "global_step": 23060, "epoch": 190} {"train_loss": -30.310094833374023, "global_step": 23061, "epoch": 190} {"train_loss": -29.726659774780273, "global_step": 23062, "epoch": 190} {"train_loss": -29.892749786376953, "global_step": 23063, "epoch": 190} {"train_loss": -30.493871688842773, "global_step": 23064, "epoch": 190} {"train_loss": -29.999494552612305, "global_step": 23065, "epoch": 190} {"train_loss": -30.411518096923828, "global_step": 23066, "epoch": 190} {"train_loss": -30.30206298828125, "global_step": 23067, "epoch": 190} {"train_loss": -29.56842041015625, "global_step": 23068, "epoch": 190} {"train_loss": -30.83448600769043, "global_step": 23069, "epoch": 190} {"train_loss": -30.040674209594727, "global_step": 23070, "epoch": 190} {"train_loss": -30.31155776977539, "global_step": 23071, "epoch": 190} {"train_loss": -30.258636474609375, "global_step": 23072, "epoch": 190} {"train_loss": -30.53196144104004, "global_step": 23073, "epoch": 190} {"train_loss": -30.19379234313965, "global_step": 23074, "epoch": 190} {"train_loss": -29.582548141479492, "global_step": 23075, "epoch": 190} {"train_loss": -29.922910690307617, "global_step": 23076, "epoch": 190} {"train_loss": -30.132719039916992, "global_step": 23077, "epoch": 190} {"train_loss": -30.500410079956055, "global_step": 23078, "epoch": 190} {"train_loss": -29.995365142822266, "global_step": 23079, "epoch": 190} {"train_loss": -29.736133575439453, "global_step": 23080, "epoch": 190} {"train_loss": -30.28693962097168, "global_step": 23081, "epoch": 190} {"train_loss": -30.526010513305664, "global_step": 23082, "epoch": 190} {"train_loss": -30.65864372253418, "global_step": 23083, "epoch": 190} {"train_loss": -30.679540634155273, "global_step": 23084, "epoch": 190} {"train_loss": -30.457677841186523, "global_step": 23085, "epoch": 190} {"train_loss": -30.86591148376465, "global_step": 23086, "epoch": 190} {"train_loss": -30.790348052978516, "global_step": 23087, "epoch": 190} {"train_loss": -31.164396286010742, "global_step": 23088, "epoch": 190} {"train_loss": -30.85793113708496, "global_step": 23089, "epoch": 190} {"train_loss": -30.941272735595703, "global_step": 23090, "epoch": 190} {"train_loss": -31.21527099609375, "global_step": 23091, "epoch": 190} {"train_loss": -30.234983444213867, "global_step": 23092, "epoch": 190} {"train_loss": -30.775909423828125, "global_step": 23093, "epoch": 190} {"train_loss": -31.38482093811035, "global_step": 23094, "epoch": 190} {"train_loss": -30.8673095703125, "global_step": 23095, "epoch": 190} {"train_loss": -31.24566650390625, "global_step": 23096, "epoch": 190} {"train_loss": -31.095067977905273, "global_step": 23097, "epoch": 190} {"train_loss": -30.39910316467285, "global_step": 23098, "epoch": 190} {"train_loss": -30.485803604125977, "global_step": 23099, "epoch": 190} {"train_loss": -30.917463302612305, "global_step": 23100, "epoch": 190} {"train_loss": -31.333642959594727, "global_step": 23101, "epoch": 190} {"train_loss": -30.360137939453125, "global_step": 23102, "epoch": 190} {"train_loss": -31.08880043029785, "global_step": 23103, "epoch": 190} {"train_loss": -30.42844581604004, "global_step": 23104, "epoch": 190} {"train_loss": -30.1258602142334, "global_step": 23105, "epoch": 190} {"train_loss": -29.722614288330078, "global_step": 23106, "epoch": 190} {"train_loss": -29.967700958251953, "global_step": 23107, "epoch": 190} {"train_loss": -30.385786056518555, "global_step": 23108, "epoch": 190} {"train_loss": -29.0769100189209, "global_step": 23109, "epoch": 190} {"train_loss": -30.318637264661554, "global_step": 23110, "epoch": 190, "val_loss": 2484884.75} {"train_loss": -28.570783615112305, "global_step": 23111, "epoch": 191} {"train_loss": -28.46329116821289, "global_step": 23112, "epoch": 191} {"train_loss": -29.733198165893555, "global_step": 23113, "epoch": 191} {"train_loss": -27.883649826049805, "global_step": 23114, "epoch": 191} {"train_loss": -29.699316024780273, "global_step": 23115, "epoch": 191} {"train_loss": -29.554784774780273, "global_step": 23116, "epoch": 191} {"train_loss": -29.679834365844727, "global_step": 23117, "epoch": 191} {"train_loss": -29.3255558013916, "global_step": 23118, "epoch": 191} {"train_loss": -30.50494384765625, "global_step": 23119, "epoch": 191} {"train_loss": -28.707128524780273, "global_step": 23120, "epoch": 191} {"train_loss": -29.395191192626953, "global_step": 23121, "epoch": 191} {"train_loss": -29.054494857788086, "global_step": 23122, "epoch": 191} {"train_loss": -25.486631393432617, "global_step": 23123, "epoch": 191} {"train_loss": -12.386504173278809, "global_step": 23124, "epoch": 191} {"train_loss": -9.746901512145996, "global_step": 23125, "epoch": 191} {"train_loss": -27.059797286987305, "global_step": 23126, "epoch": 191} {"train_loss": -27.40230369567871, "global_step": 23127, "epoch": 191} {"train_loss": -26.42740249633789, "global_step": 23128, "epoch": 191} {"train_loss": -28.365697860717773, "global_step": 23129, "epoch": 191} {"train_loss": -28.835895538330078, "global_step": 23130, "epoch": 191} {"train_loss": -27.029937744140625, "global_step": 23131, "epoch": 191} {"train_loss": -29.2125186920166, "global_step": 23132, "epoch": 191} {"train_loss": -28.02886390686035, "global_step": 23133, "epoch": 191} {"train_loss": -28.3194637298584, "global_step": 23134, "epoch": 191} {"train_loss": -29.865081787109375, "global_step": 23135, "epoch": 191} {"train_loss": -29.079803466796875, "global_step": 23136, "epoch": 191} {"train_loss": -28.652118682861328, "global_step": 23137, "epoch": 191} {"train_loss": -29.42848014831543, "global_step": 23138, "epoch": 191} {"train_loss": -29.571075439453125, "global_step": 23139, "epoch": 191} {"train_loss": -29.441944122314453, "global_step": 23140, "epoch": 191} {"train_loss": -28.937702178955078, "global_step": 23141, "epoch": 191} {"train_loss": -29.302099227905273, "global_step": 23142, "epoch": 191} {"train_loss": -29.87664794921875, "global_step": 23143, "epoch": 191} {"train_loss": -30.13661003112793, "global_step": 23144, "epoch": 191} {"train_loss": -29.530378341674805, "global_step": 23145, "epoch": 191} {"train_loss": -29.749500274658203, "global_step": 23146, "epoch": 191} {"train_loss": -29.95808219909668, "global_step": 23147, "epoch": 191} {"train_loss": -30.268964767456055, "global_step": 23148, "epoch": 191} {"train_loss": -30.348316192626953, "global_step": 23149, "epoch": 191} {"train_loss": -30.333730697631836, "global_step": 23150, "epoch": 191} {"train_loss": -30.17618751525879, "global_step": 23151, "epoch": 191} {"train_loss": -30.355619430541992, "global_step": 23152, "epoch": 191} {"train_loss": -30.373777389526367, "global_step": 23153, "epoch": 191} {"train_loss": -29.63007164001465, "global_step": 23154, "epoch": 191} {"train_loss": -30.470977783203125, "global_step": 23155, "epoch": 191} {"train_loss": -30.280597686767578, "global_step": 23156, "epoch": 191} {"train_loss": -29.96868324279785, "global_step": 23157, "epoch": 191} {"train_loss": -31.041534423828125, "global_step": 23158, "epoch": 191} {"train_loss": -30.42335319519043, "global_step": 23159, "epoch": 191} {"train_loss": -30.527868270874023, "global_step": 23160, "epoch": 191} {"train_loss": -30.668420791625977, "global_step": 23161, "epoch": 191} {"train_loss": -30.689435958862305, "global_step": 23162, "epoch": 191} {"train_loss": -30.476577758789062, "global_step": 23163, "epoch": 191} {"train_loss": -30.487060546875, "global_step": 23164, "epoch": 191} {"train_loss": -30.63250732421875, "global_step": 23165, "epoch": 191} {"train_loss": -30.1581974029541, "global_step": 23166, "epoch": 191} {"train_loss": -30.60761833190918, "global_step": 23167, "epoch": 191} {"train_loss": -30.727142333984375, "global_step": 23168, "epoch": 191} {"train_loss": -30.493406295776367, "global_step": 23169, "epoch": 191} {"train_loss": -30.365034103393555, "global_step": 23170, "epoch": 191} {"train_loss": -30.967941284179688, "global_step": 23171, "epoch": 191} {"train_loss": -30.899389266967773, "global_step": 23172, "epoch": 191} {"train_loss": -30.797882080078125, "global_step": 23173, "epoch": 191} {"train_loss": -30.955419540405273, "global_step": 23174, "epoch": 191} {"train_loss": -30.48599624633789, "global_step": 23175, "epoch": 191} {"train_loss": -30.326940536499023, "global_step": 23176, "epoch": 191} {"train_loss": -30.2619686126709, "global_step": 23177, "epoch": 191} {"train_loss": -31.163074493408203, "global_step": 23178, "epoch": 191} {"train_loss": -30.463464736938477, "global_step": 23179, "epoch": 191} {"train_loss": -30.67783546447754, "global_step": 23180, "epoch": 191} {"train_loss": -30.457189559936523, "global_step": 23181, "epoch": 191} {"train_loss": -30.63179588317871, "global_step": 23182, "epoch": 191} {"train_loss": -29.62106704711914, "global_step": 23183, "epoch": 191} {"train_loss": -27.519977569580078, "global_step": 23184, "epoch": 191} {"train_loss": -23.209714889526367, "global_step": 23185, "epoch": 191} {"train_loss": -16.983240127563477, "global_step": 23186, "epoch": 191} {"train_loss": -24.81410789489746, "global_step": 23187, "epoch": 191} {"train_loss": -29.934362411499023, "global_step": 23188, "epoch": 191} {"train_loss": -25.834354400634766, "global_step": 23189, "epoch": 191} {"train_loss": -30.2370662689209, "global_step": 23190, "epoch": 191} {"train_loss": -27.98836326599121, "global_step": 23191, "epoch": 191} {"train_loss": -29.609418869018555, "global_step": 23192, "epoch": 191} {"train_loss": -29.544269561767578, "global_step": 23193, "epoch": 191} {"train_loss": -29.4428768157959, "global_step": 23194, "epoch": 191} {"train_loss": -29.96502113342285, "global_step": 23195, "epoch": 191} {"train_loss": -29.38679313659668, "global_step": 23196, "epoch": 191} {"train_loss": -29.6575870513916, "global_step": 23197, "epoch": 191} {"train_loss": -29.76080894470215, "global_step": 23198, "epoch": 191} {"train_loss": -29.968597412109375, "global_step": 23199, "epoch": 191} {"train_loss": -29.89129638671875, "global_step": 23200, "epoch": 191} {"train_loss": -29.811248779296875, "global_step": 23201, "epoch": 191} {"train_loss": -29.560632705688477, "global_step": 23202, "epoch": 191} {"train_loss": -29.85371208190918, "global_step": 23203, "epoch": 191} {"train_loss": -29.501428604125977, "global_step": 23204, "epoch": 191} {"train_loss": -30.030515670776367, "global_step": 23205, "epoch": 191} {"train_loss": -29.9809513092041, "global_step": 23206, "epoch": 191} {"train_loss": -29.866500854492188, "global_step": 23207, "epoch": 191} {"train_loss": -29.856046676635742, "global_step": 23208, "epoch": 191} {"train_loss": -30.022497177124023, "global_step": 23209, "epoch": 191} {"train_loss": -29.70882225036621, "global_step": 23210, "epoch": 191} {"train_loss": -30.1187744140625, "global_step": 23211, "epoch": 191} {"train_loss": -29.784250259399414, "global_step": 23212, "epoch": 191} {"train_loss": -30.00006103515625, "global_step": 23213, "epoch": 191} {"train_loss": -30.246252059936523, "global_step": 23214, "epoch": 191} {"train_loss": -29.68735694885254, "global_step": 23215, "epoch": 191} {"train_loss": -29.782712936401367, "global_step": 23216, "epoch": 191} {"train_loss": -30.175006866455078, "global_step": 23217, "epoch": 191} {"train_loss": -29.97626304626465, "global_step": 23218, "epoch": 191} {"train_loss": -30.043424606323242, "global_step": 23219, "epoch": 191} {"train_loss": -30.12699317932129, "global_step": 23220, "epoch": 191} {"train_loss": -30.249624252319336, "global_step": 23221, "epoch": 191} {"train_loss": -30.444793701171875, "global_step": 23222, "epoch": 191} {"train_loss": -30.485309600830078, "global_step": 23223, "epoch": 191} {"train_loss": -30.07139015197754, "global_step": 23224, "epoch": 191} {"train_loss": -30.01349449157715, "global_step": 23225, "epoch": 191} {"train_loss": -30.684070587158203, "global_step": 23226, "epoch": 191} {"train_loss": -30.4733829498291, "global_step": 23227, "epoch": 191} {"train_loss": -30.5918025970459, "global_step": 23228, "epoch": 191} {"train_loss": -30.90594482421875, "global_step": 23229, "epoch": 191} {"train_loss": -30.17913246154785, "global_step": 23230, "epoch": 191} {"train_loss": -29.22338208285245, "global_step": 23231, "epoch": 191, "val_loss": 2523705.75} {"train_loss": -30.69776725769043, "global_step": 23232, "epoch": 192} {"train_loss": -30.9665584564209, "global_step": 23233, "epoch": 192} {"train_loss": -30.781070709228516, "global_step": 23234, "epoch": 192} {"train_loss": -30.717676162719727, "global_step": 23235, "epoch": 192} {"train_loss": -30.921838760375977, "global_step": 23236, "epoch": 192} {"train_loss": -30.845273971557617, "global_step": 23237, "epoch": 192} {"train_loss": -30.527856826782227, "global_step": 23238, "epoch": 192} {"train_loss": -29.7209415435791, "global_step": 23239, "epoch": 192} {"train_loss": -29.52752685546875, "global_step": 23240, "epoch": 192} {"train_loss": -30.28333854675293, "global_step": 23241, "epoch": 192} {"train_loss": -30.4940185546875, "global_step": 23242, "epoch": 192} {"train_loss": -29.92584800720215, "global_step": 23243, "epoch": 192} {"train_loss": -28.454771041870117, "global_step": 23244, "epoch": 192} {"train_loss": -27.569660186767578, "global_step": 23245, "epoch": 192} {"train_loss": -28.24124526977539, "global_step": 23246, "epoch": 192} {"train_loss": -30.80537223815918, "global_step": 23247, "epoch": 192} {"train_loss": -30.32283592224121, "global_step": 23248, "epoch": 192} {"train_loss": -28.647985458374023, "global_step": 23249, "epoch": 192} {"train_loss": -29.548816680908203, "global_step": 23250, "epoch": 192} {"train_loss": -30.154499053955078, "global_step": 23251, "epoch": 192} {"train_loss": -29.4084415435791, "global_step": 23252, "epoch": 192} {"train_loss": -30.382429122924805, "global_step": 23253, "epoch": 192} {"train_loss": -29.589513778686523, "global_step": 23254, "epoch": 192} {"train_loss": -29.54829216003418, "global_step": 23255, "epoch": 192} {"train_loss": -29.56036376953125, "global_step": 23256, "epoch": 192} {"train_loss": -28.413105010986328, "global_step": 23257, "epoch": 192} {"train_loss": -30.25052833557129, "global_step": 23258, "epoch": 192} {"train_loss": -29.59565544128418, "global_step": 23259, "epoch": 192} {"train_loss": -30.097013473510742, "global_step": 23260, "epoch": 192} {"train_loss": -29.7981014251709, "global_step": 23261, "epoch": 192} {"train_loss": -30.4512882232666, "global_step": 23262, "epoch": 192} {"train_loss": -30.47930908203125, "global_step": 23263, "epoch": 192} {"train_loss": -29.731164932250977, "global_step": 23264, "epoch": 192} {"train_loss": -30.42132568359375, "global_step": 23265, "epoch": 192} {"train_loss": -30.60150146484375, "global_step": 23266, "epoch": 192} {"train_loss": -30.572107315063477, "global_step": 23267, "epoch": 192} {"train_loss": -30.528547286987305, "global_step": 23268, "epoch": 192} {"train_loss": -30.5914249420166, "global_step": 23269, "epoch": 192} {"train_loss": -30.56064224243164, "global_step": 23270, "epoch": 192} {"train_loss": -31.165555953979492, "global_step": 23271, "epoch": 192} {"train_loss": -30.458887100219727, "global_step": 23272, "epoch": 192} {"train_loss": -30.78242301940918, "global_step": 23273, "epoch": 192} {"train_loss": -30.796106338500977, "global_step": 23274, "epoch": 192} {"train_loss": -31.013540267944336, "global_step": 23275, "epoch": 192} {"train_loss": -30.838134765625, "global_step": 23276, "epoch": 192} {"train_loss": -31.1732120513916, "global_step": 23277, "epoch": 192} {"train_loss": -31.237262725830078, "global_step": 23278, "epoch": 192} {"train_loss": -30.936279296875, "global_step": 23279, "epoch": 192} {"train_loss": -31.316974639892578, "global_step": 23280, "epoch": 192} {"train_loss": -31.30927848815918, "global_step": 23281, "epoch": 192} {"train_loss": -31.305389404296875, "global_step": 23282, "epoch": 192} {"train_loss": -31.237140655517578, "global_step": 23283, "epoch": 192} {"train_loss": -30.84168815612793, "global_step": 23284, "epoch": 192} {"train_loss": -30.632099151611328, "global_step": 23285, "epoch": 192} {"train_loss": -31.551416397094727, "global_step": 23286, "epoch": 192} {"train_loss": -31.04469108581543, "global_step": 23287, "epoch": 192} {"train_loss": -30.580976486206055, "global_step": 23288, "epoch": 192} {"train_loss": -31.072834014892578, "global_step": 23289, "epoch": 192} {"train_loss": -30.545835494995117, "global_step": 23290, "epoch": 192} {"train_loss": -30.86689567565918, "global_step": 23291, "epoch": 192} {"train_loss": -31.499582290649414, "global_step": 23292, "epoch": 192} {"train_loss": -30.298303604125977, "global_step": 23293, "epoch": 192} {"train_loss": -30.449737548828125, "global_step": 23294, "epoch": 192} {"train_loss": -30.832965850830078, "global_step": 23295, "epoch": 192} {"train_loss": -31.356216430664062, "global_step": 23296, "epoch": 192} {"train_loss": -30.367536544799805, "global_step": 23297, "epoch": 192} {"train_loss": -31.100818634033203, "global_step": 23298, "epoch": 192} {"train_loss": -31.39766502380371, "global_step": 23299, "epoch": 192} {"train_loss": -31.238935470581055, "global_step": 23300, "epoch": 192} {"train_loss": -31.21576499938965, "global_step": 23301, "epoch": 192} {"train_loss": -31.19428062438965, "global_step": 23302, "epoch": 192} {"train_loss": -31.48736572265625, "global_step": 23303, "epoch": 192} {"train_loss": -30.401479721069336, "global_step": 23304, "epoch": 192} {"train_loss": -31.567285537719727, "global_step": 23305, "epoch": 192} {"train_loss": -31.123870849609375, "global_step": 23306, "epoch": 192} {"train_loss": -31.169330596923828, "global_step": 23307, "epoch": 192} {"train_loss": -31.205768585205078, "global_step": 23308, "epoch": 192} {"train_loss": -31.467376708984375, "global_step": 23309, "epoch": 192} {"train_loss": -30.7181396484375, "global_step": 23310, "epoch": 192} {"train_loss": -30.85051918029785, "global_step": 23311, "epoch": 192} {"train_loss": -31.14637565612793, "global_step": 23312, "epoch": 192} {"train_loss": -31.143762588500977, "global_step": 23313, "epoch": 192} {"train_loss": -31.545654296875, "global_step": 23314, "epoch": 192} {"train_loss": -30.850671768188477, "global_step": 23315, "epoch": 192} {"train_loss": -31.44441795349121, "global_step": 23316, "epoch": 192} {"train_loss": -31.65154457092285, "global_step": 23317, "epoch": 192} {"train_loss": -31.280548095703125, "global_step": 23318, "epoch": 192} {"train_loss": -31.896621704101562, "global_step": 23319, "epoch": 192} {"train_loss": -31.61115837097168, "global_step": 23320, "epoch": 192} {"train_loss": -31.77436637878418, "global_step": 23321, "epoch": 192} {"train_loss": -31.358976364135742, "global_step": 23322, "epoch": 192} {"train_loss": -31.10943603515625, "global_step": 23323, "epoch": 192} {"train_loss": -31.99676513671875, "global_step": 23324, "epoch": 192} {"train_loss": -30.885990142822266, "global_step": 23325, "epoch": 192} {"train_loss": -31.48383903503418, "global_step": 23326, "epoch": 192} {"train_loss": -31.966535568237305, "global_step": 23327, "epoch": 192} {"train_loss": -31.3497257232666, "global_step": 23328, "epoch": 192} {"train_loss": -30.992767333984375, "global_step": 23329, "epoch": 192} {"train_loss": -31.53460693359375, "global_step": 23330, "epoch": 192} {"train_loss": -31.8182373046875, "global_step": 23331, "epoch": 192} {"train_loss": -31.240476608276367, "global_step": 23332, "epoch": 192} {"train_loss": -31.663915634155273, "global_step": 23333, "epoch": 192} {"train_loss": -30.778486251831055, "global_step": 23334, "epoch": 192} {"train_loss": -28.456098556518555, "global_step": 23335, "epoch": 192} {"train_loss": -25.4915828704834, "global_step": 23336, "epoch": 192} {"train_loss": -25.78887367248535, "global_step": 23337, "epoch": 192} {"train_loss": -27.80718421936035, "global_step": 23338, "epoch": 192} {"train_loss": -29.91461753845215, "global_step": 23339, "epoch": 192} {"train_loss": -27.642271041870117, "global_step": 23340, "epoch": 192} {"train_loss": -29.141340255737305, "global_step": 23341, "epoch": 192} {"train_loss": -29.7116641998291, "global_step": 23342, "epoch": 192} {"train_loss": -27.797971725463867, "global_step": 23343, "epoch": 192} {"train_loss": -28.317411422729492, "global_step": 23344, "epoch": 192} {"train_loss": -29.07520866394043, "global_step": 23345, "epoch": 192} {"train_loss": -27.974990844726562, "global_step": 23346, "epoch": 192} {"train_loss": -27.754667282104492, "global_step": 23347, "epoch": 192} {"train_loss": -28.554019927978516, "global_step": 23348, "epoch": 192} {"train_loss": -27.0855655670166, "global_step": 23349, "epoch": 192} {"train_loss": -28.330427169799805, "global_step": 23350, "epoch": 192} {"train_loss": -28.892744064331055, "global_step": 23351, "epoch": 192} {"train_loss": -30.333879691510163, "global_step": 23352, "epoch": 192, "val_loss": 2698064.75} {"train_loss": -28.882266998291016, "global_step": 23353, "epoch": 193} {"train_loss": -29.66015625, "global_step": 23354, "epoch": 193} {"train_loss": -29.4782772064209, "global_step": 23355, "epoch": 193} {"train_loss": -29.7802791595459, "global_step": 23356, "epoch": 193} {"train_loss": -29.585676193237305, "global_step": 23357, "epoch": 193} {"train_loss": -29.73402214050293, "global_step": 23358, "epoch": 193} {"train_loss": -29.964109420776367, "global_step": 23359, "epoch": 193} {"train_loss": -29.740110397338867, "global_step": 23360, "epoch": 193} {"train_loss": -29.9606876373291, "global_step": 23361, "epoch": 193} {"train_loss": -30.22627830505371, "global_step": 23362, "epoch": 193} {"train_loss": -30.12726402282715, "global_step": 23363, "epoch": 193} {"train_loss": -30.060956954956055, "global_step": 23364, "epoch": 193} {"train_loss": -30.325851440429688, "global_step": 23365, "epoch": 193} {"train_loss": -29.77886962890625, "global_step": 23366, "epoch": 193} {"train_loss": -30.419443130493164, "global_step": 23367, "epoch": 193} {"train_loss": -31.02186393737793, "global_step": 23368, "epoch": 193} {"train_loss": -30.3062686920166, "global_step": 23369, "epoch": 193} {"train_loss": -30.277441024780273, "global_step": 23370, "epoch": 193} {"train_loss": -31.002334594726562, "global_step": 23371, "epoch": 193} {"train_loss": -30.344074249267578, "global_step": 23372, "epoch": 193} {"train_loss": -29.495758056640625, "global_step": 23373, "epoch": 193} {"train_loss": -30.428129196166992, "global_step": 23374, "epoch": 193} {"train_loss": -30.381269454956055, "global_step": 23375, "epoch": 193} {"train_loss": -30.519031524658203, "global_step": 23376, "epoch": 193} {"train_loss": -30.4873046875, "global_step": 23377, "epoch": 193} {"train_loss": -30.8978328704834, "global_step": 23378, "epoch": 193} {"train_loss": -30.224557876586914, "global_step": 23379, "epoch": 193} {"train_loss": -30.56099510192871, "global_step": 23380, "epoch": 193} {"train_loss": -30.709598541259766, "global_step": 23381, "epoch": 193} {"train_loss": -30.441415786743164, "global_step": 23382, "epoch": 193} {"train_loss": -30.542022705078125, "global_step": 23383, "epoch": 193} {"train_loss": -30.710065841674805, "global_step": 23384, "epoch": 193} {"train_loss": -30.574338912963867, "global_step": 23385, "epoch": 193} {"train_loss": -30.3446102142334, "global_step": 23386, "epoch": 193} {"train_loss": -30.40638542175293, "global_step": 23387, "epoch": 193} {"train_loss": -30.49419593811035, "global_step": 23388, "epoch": 193} {"train_loss": -31.195371627807617, "global_step": 23389, "epoch": 193} {"train_loss": -30.679859161376953, "global_step": 23390, "epoch": 193} {"train_loss": -30.907480239868164, "global_step": 23391, "epoch": 193} {"train_loss": -30.5411319732666, "global_step": 23392, "epoch": 193} {"train_loss": -30.46253776550293, "global_step": 23393, "epoch": 193} {"train_loss": -30.88230323791504, "global_step": 23394, "epoch": 193} {"train_loss": -30.955352783203125, "global_step": 23395, "epoch": 193} {"train_loss": -31.334522247314453, "global_step": 23396, "epoch": 193} {"train_loss": -30.9042911529541, "global_step": 23397, "epoch": 193} {"train_loss": -30.244531631469727, "global_step": 23398, "epoch": 193} {"train_loss": -30.089818954467773, "global_step": 23399, "epoch": 193} {"train_loss": -29.73105239868164, "global_step": 23400, "epoch": 193} {"train_loss": -30.052228927612305, "global_step": 23401, "epoch": 193} {"train_loss": -30.71014976501465, "global_step": 23402, "epoch": 193} {"train_loss": -30.8322696685791, "global_step": 23403, "epoch": 193} {"train_loss": -31.099924087524414, "global_step": 23404, "epoch": 193} {"train_loss": -29.997690200805664, "global_step": 23405, "epoch": 193} {"train_loss": -31.118818283081055, "global_step": 23406, "epoch": 193} {"train_loss": -30.843555450439453, "global_step": 23407, "epoch": 193} {"train_loss": -30.826374053955078, "global_step": 23408, "epoch": 193} {"train_loss": -30.2736873626709, "global_step": 23409, "epoch": 193} {"train_loss": -30.90036964416504, "global_step": 23410, "epoch": 193} {"train_loss": -30.86138916015625, "global_step": 23411, "epoch": 193} {"train_loss": -31.042463302612305, "global_step": 23412, "epoch": 193} {"train_loss": -31.33612632751465, "global_step": 23413, "epoch": 193} {"train_loss": -30.570819854736328, "global_step": 23414, "epoch": 193} {"train_loss": -30.401721954345703, "global_step": 23415, "epoch": 193} {"train_loss": -30.45231056213379, "global_step": 23416, "epoch": 193} {"train_loss": -30.815521240234375, "global_step": 23417, "epoch": 193} {"train_loss": -31.48408317565918, "global_step": 23418, "epoch": 193} {"train_loss": -31.212997436523438, "global_step": 23419, "epoch": 193} {"train_loss": -30.341150283813477, "global_step": 23420, "epoch": 193} {"train_loss": -29.799787521362305, "global_step": 23421, "epoch": 193} {"train_loss": -30.688953399658203, "global_step": 23422, "epoch": 193} {"train_loss": -31.130483627319336, "global_step": 23423, "epoch": 193} {"train_loss": -31.67046546936035, "global_step": 23424, "epoch": 193} {"train_loss": -31.239715576171875, "global_step": 23425, "epoch": 193} {"train_loss": -30.826826095581055, "global_step": 23426, "epoch": 193} {"train_loss": -30.725370407104492, "global_step": 23427, "epoch": 193} {"train_loss": -31.056522369384766, "global_step": 23428, "epoch": 193} {"train_loss": -31.037067413330078, "global_step": 23429, "epoch": 193} {"train_loss": -30.817523956298828, "global_step": 23430, "epoch": 193} {"train_loss": -30.799779891967773, "global_step": 23431, "epoch": 193} {"train_loss": -31.284250259399414, "global_step": 23432, "epoch": 193} {"train_loss": -31.54218864440918, "global_step": 23433, "epoch": 193} {"train_loss": -31.307357788085938, "global_step": 23434, "epoch": 193} {"train_loss": -31.266433715820312, "global_step": 23435, "epoch": 193} {"train_loss": -30.4298038482666, "global_step": 23436, "epoch": 193} {"train_loss": -31.63532066345215, "global_step": 23437, "epoch": 193} {"train_loss": -30.875104904174805, "global_step": 23438, "epoch": 193} {"train_loss": -31.393692016601562, "global_step": 23439, "epoch": 193} {"train_loss": -30.88335609436035, "global_step": 23440, "epoch": 193} {"train_loss": -30.759235382080078, "global_step": 23441, "epoch": 193} {"train_loss": -31.096418380737305, "global_step": 23442, "epoch": 193} {"train_loss": -31.1535701751709, "global_step": 23443, "epoch": 193} {"train_loss": -29.942514419555664, "global_step": 23444, "epoch": 193} {"train_loss": -31.155439376831055, "global_step": 23445, "epoch": 193} {"train_loss": -30.00074577331543, "global_step": 23446, "epoch": 193} {"train_loss": -30.55482292175293, "global_step": 23447, "epoch": 193} {"train_loss": -30.580398559570312, "global_step": 23448, "epoch": 193} {"train_loss": -30.363922119140625, "global_step": 23449, "epoch": 193} {"train_loss": -29.427701950073242, "global_step": 23450, "epoch": 193} {"train_loss": -28.538843154907227, "global_step": 23451, "epoch": 193} {"train_loss": -29.623016357421875, "global_step": 23452, "epoch": 193} {"train_loss": -31.107715606689453, "global_step": 23453, "epoch": 193} {"train_loss": -30.386783599853516, "global_step": 23454, "epoch": 193} {"train_loss": -29.906436920166016, "global_step": 23455, "epoch": 193} {"train_loss": -30.315671920776367, "global_step": 23456, "epoch": 193} {"train_loss": -30.4760684967041, "global_step": 23457, "epoch": 193} {"train_loss": -29.33406639099121, "global_step": 23458, "epoch": 193} {"train_loss": -30.33296012878418, "global_step": 23459, "epoch": 193} {"train_loss": -30.649642944335938, "global_step": 23460, "epoch": 193} {"train_loss": -29.66436767578125, "global_step": 23461, "epoch": 193} {"train_loss": -30.720853805541992, "global_step": 23462, "epoch": 193} {"train_loss": -30.95490837097168, "global_step": 23463, "epoch": 193} {"train_loss": -30.370298385620117, "global_step": 23464, "epoch": 193} {"train_loss": -30.498395919799805, "global_step": 23465, "epoch": 193} {"train_loss": -31.0566349029541, "global_step": 23466, "epoch": 193} {"train_loss": -31.0369815826416, "global_step": 23467, "epoch": 193} {"train_loss": -30.343408584594727, "global_step": 23468, "epoch": 193} {"train_loss": -31.225494384765625, "global_step": 23469, "epoch": 193} {"train_loss": -30.75075340270996, "global_step": 23470, "epoch": 193} {"train_loss": -30.2952880859375, "global_step": 23471, "epoch": 193} {"train_loss": -31.229450225830078, "global_step": 23472, "epoch": 193} {"train_loss": -30.550940080122515, "global_step": 23473, "epoch": 193, "val_loss": 2719876.0} {"train_loss": -30.950510025024414, "global_step": 23474, "epoch": 194} {"train_loss": -31.08245849609375, "global_step": 23475, "epoch": 194} {"train_loss": -29.914005279541016, "global_step": 23476, "epoch": 194} {"train_loss": -29.136566162109375, "global_step": 23477, "epoch": 194} {"train_loss": -28.603017807006836, "global_step": 23478, "epoch": 194} {"train_loss": -29.364715576171875, "global_step": 23479, "epoch": 194} {"train_loss": -30.606672286987305, "global_step": 23480, "epoch": 194} {"train_loss": -31.1215763092041, "global_step": 23481, "epoch": 194} {"train_loss": -31.099714279174805, "global_step": 23482, "epoch": 194} {"train_loss": -31.05181884765625, "global_step": 23483, "epoch": 194} {"train_loss": -31.42609977722168, "global_step": 23484, "epoch": 194} {"train_loss": -31.618228912353516, "global_step": 23485, "epoch": 194} {"train_loss": -31.217166900634766, "global_step": 23486, "epoch": 194} {"train_loss": -31.001806259155273, "global_step": 23487, "epoch": 194} {"train_loss": -31.766925811767578, "global_step": 23488, "epoch": 194} {"train_loss": -31.031402587890625, "global_step": 23489, "epoch": 194} {"train_loss": -31.034061431884766, "global_step": 23490, "epoch": 194} {"train_loss": -30.066059112548828, "global_step": 23491, "epoch": 194} {"train_loss": -30.560123443603516, "global_step": 23492, "epoch": 194} {"train_loss": -31.3123722076416, "global_step": 23493, "epoch": 194} {"train_loss": -30.782367706298828, "global_step": 23494, "epoch": 194} {"train_loss": -31.665313720703125, "global_step": 23495, "epoch": 194} {"train_loss": -31.193994522094727, "global_step": 23496, "epoch": 194} {"train_loss": -30.47889518737793, "global_step": 23497, "epoch": 194} {"train_loss": -30.725080490112305, "global_step": 23498, "epoch": 194} {"train_loss": -30.758779525756836, "global_step": 23499, "epoch": 194} {"train_loss": -30.954587936401367, "global_step": 23500, "epoch": 194} {"train_loss": -30.905811309814453, "global_step": 23501, "epoch": 194} {"train_loss": -29.617538452148438, "global_step": 23502, "epoch": 194} {"train_loss": -31.102054595947266, "global_step": 23503, "epoch": 194} {"train_loss": -29.87367057800293, "global_step": 23504, "epoch": 194} {"train_loss": -29.807880401611328, "global_step": 23505, "epoch": 194} {"train_loss": -31.471603393554688, "global_step": 23506, "epoch": 194} {"train_loss": -30.232446670532227, "global_step": 23507, "epoch": 194} {"train_loss": -31.4150447845459, "global_step": 23508, "epoch": 194} {"train_loss": -31.451053619384766, "global_step": 23509, "epoch": 194} {"train_loss": -31.525068283081055, "global_step": 23510, "epoch": 194} {"train_loss": -31.508283615112305, "global_step": 23511, "epoch": 194} {"train_loss": -31.097387313842773, "global_step": 23512, "epoch": 194} {"train_loss": -31.526636123657227, "global_step": 23513, "epoch": 194} {"train_loss": -31.691146850585938, "global_step": 23514, "epoch": 194} {"train_loss": -31.998315811157227, "global_step": 23515, "epoch": 194} {"train_loss": -31.689634323120117, "global_step": 23516, "epoch": 194} {"train_loss": -31.73613929748535, "global_step": 23517, "epoch": 194} {"train_loss": -32.179351806640625, "global_step": 23518, "epoch": 194} {"train_loss": -31.82755470275879, "global_step": 23519, "epoch": 194} {"train_loss": -31.53663444519043, "global_step": 23520, "epoch": 194} {"train_loss": -31.89451026916504, "global_step": 23521, "epoch": 194} {"train_loss": -31.904150009155273, "global_step": 23522, "epoch": 194} {"train_loss": -31.906543731689453, "global_step": 23523, "epoch": 194} {"train_loss": -31.164581298828125, "global_step": 23524, "epoch": 194} {"train_loss": -31.631855010986328, "global_step": 23525, "epoch": 194} {"train_loss": -31.71600914001465, "global_step": 23526, "epoch": 194} {"train_loss": -31.814376831054688, "global_step": 23527, "epoch": 194} {"train_loss": -31.319538116455078, "global_step": 23528, "epoch": 194} {"train_loss": -29.99411964416504, "global_step": 23529, "epoch": 194} {"train_loss": -26.56648063659668, "global_step": 23530, "epoch": 194} {"train_loss": -20.094419479370117, "global_step": 23531, "epoch": 194} {"train_loss": -13.085283279418945, "global_step": 23532, "epoch": 194} {"train_loss": -18.386747360229492, "global_step": 23533, "epoch": 194} {"train_loss": -30.649839401245117, "global_step": 23534, "epoch": 194} {"train_loss": -24.747854232788086, "global_step": 23535, "epoch": 194} {"train_loss": -31.332014083862305, "global_step": 23536, "epoch": 194} {"train_loss": -26.209203720092773, "global_step": 23537, "epoch": 194} {"train_loss": -30.04571533203125, "global_step": 23538, "epoch": 194} {"train_loss": -28.98383140563965, "global_step": 23539, "epoch": 194} {"train_loss": -28.94978904724121, "global_step": 23540, "epoch": 194} {"train_loss": -30.379674911499023, "global_step": 23541, "epoch": 194} {"train_loss": -29.437942504882812, "global_step": 23542, "epoch": 194} {"train_loss": -29.2479248046875, "global_step": 23543, "epoch": 194} {"train_loss": -29.309431076049805, "global_step": 23544, "epoch": 194} {"train_loss": -30.738630294799805, "global_step": 23545, "epoch": 194} {"train_loss": -29.341596603393555, "global_step": 23546, "epoch": 194} {"train_loss": -29.6215763092041, "global_step": 23547, "epoch": 194} {"train_loss": -30.292768478393555, "global_step": 23548, "epoch": 194} {"train_loss": -30.090930938720703, "global_step": 23549, "epoch": 194} {"train_loss": -30.35108757019043, "global_step": 23550, "epoch": 194} {"train_loss": -30.36053466796875, "global_step": 23551, "epoch": 194} {"train_loss": -29.779804229736328, "global_step": 23552, "epoch": 194} {"train_loss": -30.57843017578125, "global_step": 23553, "epoch": 194} {"train_loss": -30.562747955322266, "global_step": 23554, "epoch": 194} {"train_loss": -30.386152267456055, "global_step": 23555, "epoch": 194} {"train_loss": -30.263193130493164, "global_step": 23556, "epoch": 194} {"train_loss": -30.146930694580078, "global_step": 23557, "epoch": 194} {"train_loss": -30.17854881286621, "global_step": 23558, "epoch": 194} {"train_loss": -30.71854019165039, "global_step": 23559, "epoch": 194} {"train_loss": -29.36115837097168, "global_step": 23560, "epoch": 194} {"train_loss": -28.062286376953125, "global_step": 23561, "epoch": 194} {"train_loss": -29.25615882873535, "global_step": 23562, "epoch": 194} {"train_loss": -29.93912696838379, "global_step": 23563, "epoch": 194} {"train_loss": -30.644412994384766, "global_step": 23564, "epoch": 194} {"train_loss": -29.236343383789062, "global_step": 23565, "epoch": 194} {"train_loss": -28.328954696655273, "global_step": 23566, "epoch": 194} {"train_loss": -29.361831665039062, "global_step": 23567, "epoch": 194} {"train_loss": -30.469186782836914, "global_step": 23568, "epoch": 194} {"train_loss": -28.92708396911621, "global_step": 23569, "epoch": 194} {"train_loss": -30.218786239624023, "global_step": 23570, "epoch": 194} {"train_loss": -29.421497344970703, "global_step": 23571, "epoch": 194} {"train_loss": -29.054819107055664, "global_step": 23572, "epoch": 194} {"train_loss": -31.382572174072266, "global_step": 23573, "epoch": 194} {"train_loss": -29.39161491394043, "global_step": 23574, "epoch": 194} {"train_loss": -30.642404556274414, "global_step": 23575, "epoch": 194} {"train_loss": -29.4093017578125, "global_step": 23576, "epoch": 194} {"train_loss": -30.467893600463867, "global_step": 23577, "epoch": 194} {"train_loss": -30.61215591430664, "global_step": 23578, "epoch": 194} {"train_loss": -30.478118896484375, "global_step": 23579, "epoch": 194} {"train_loss": -30.943134307861328, "global_step": 23580, "epoch": 194} {"train_loss": -30.5477237701416, "global_step": 23581, "epoch": 194} {"train_loss": -30.480859756469727, "global_step": 23582, "epoch": 194} {"train_loss": -30.32037353515625, "global_step": 23583, "epoch": 194} {"train_loss": -30.514881134033203, "global_step": 23584, "epoch": 194} {"train_loss": -30.762006759643555, "global_step": 23585, "epoch": 194} {"train_loss": -30.648725509643555, "global_step": 23586, "epoch": 194} {"train_loss": -30.69569206237793, "global_step": 23587, "epoch": 194} {"train_loss": -30.88325309753418, "global_step": 23588, "epoch": 194} {"train_loss": -30.370004653930664, "global_step": 23589, "epoch": 194} {"train_loss": -30.854761123657227, "global_step": 23590, "epoch": 194} {"train_loss": -30.760831832885742, "global_step": 23591, "epoch": 194} {"train_loss": -31.225818634033203, "global_step": 23592, "epoch": 194} {"train_loss": -30.634357452392578, "global_step": 23593, "epoch": 194} {"train_loss": -30.117727689506594, "global_step": 23594, "epoch": 194, "val_loss": 2542161.75} {"train_loss": -30.81780433654785, "global_step": 23595, "epoch": 195} {"train_loss": -30.918533325195312, "global_step": 23596, "epoch": 195} {"train_loss": -30.827070236206055, "global_step": 23597, "epoch": 195} {"train_loss": -30.6829776763916, "global_step": 23598, "epoch": 195} {"train_loss": -31.106597900390625, "global_step": 23599, "epoch": 195} {"train_loss": -29.976947784423828, "global_step": 23600, "epoch": 195} {"train_loss": -30.246875762939453, "global_step": 23601, "epoch": 195} {"train_loss": -30.622711181640625, "global_step": 23602, "epoch": 195} {"train_loss": -30.288808822631836, "global_step": 23603, "epoch": 195} {"train_loss": -28.74884033203125, "global_step": 23604, "epoch": 195} {"train_loss": -30.906238555908203, "global_step": 23605, "epoch": 195} {"train_loss": -29.386260986328125, "global_step": 23606, "epoch": 195} {"train_loss": -30.652597427368164, "global_step": 23607, "epoch": 195} {"train_loss": -29.857192993164062, "global_step": 23608, "epoch": 195} {"train_loss": -30.795751571655273, "global_step": 23609, "epoch": 195} {"train_loss": -30.217130661010742, "global_step": 23610, "epoch": 195} {"train_loss": -30.542341232299805, "global_step": 23611, "epoch": 195} {"train_loss": -28.17486000061035, "global_step": 23612, "epoch": 195} {"train_loss": -28.835500717163086, "global_step": 23613, "epoch": 195} {"train_loss": -30.1724910736084, "global_step": 23614, "epoch": 195} {"train_loss": -30.076013565063477, "global_step": 23615, "epoch": 195} {"train_loss": -30.531204223632812, "global_step": 23616, "epoch": 195} {"train_loss": -30.767826080322266, "global_step": 23617, "epoch": 195} {"train_loss": -30.328144073486328, "global_step": 23618, "epoch": 195} {"train_loss": -30.92032814025879, "global_step": 23619, "epoch": 195} {"train_loss": -30.15925407409668, "global_step": 23620, "epoch": 195} {"train_loss": -30.04225730895996, "global_step": 23621, "epoch": 195} {"train_loss": -30.22710609436035, "global_step": 23622, "epoch": 195} {"train_loss": -30.528125762939453, "global_step": 23623, "epoch": 195} {"train_loss": -30.171361923217773, "global_step": 23624, "epoch": 195} {"train_loss": -31.302297592163086, "global_step": 23625, "epoch": 195} {"train_loss": -30.184528350830078, "global_step": 23626, "epoch": 195} {"train_loss": -30.998245239257812, "global_step": 23627, "epoch": 195} {"train_loss": -30.197431564331055, "global_step": 23628, "epoch": 195} {"train_loss": -31.052902221679688, "global_step": 23629, "epoch": 195} {"train_loss": -30.793676376342773, "global_step": 23630, "epoch": 195} {"train_loss": -31.09199333190918, "global_step": 23631, "epoch": 195} {"train_loss": -30.970731735229492, "global_step": 23632, "epoch": 195} {"train_loss": -30.960702896118164, "global_step": 23633, "epoch": 195} {"train_loss": -30.967761993408203, "global_step": 23634, "epoch": 195} {"train_loss": -31.216842651367188, "global_step": 23635, "epoch": 195} {"train_loss": -30.911239624023438, "global_step": 23636, "epoch": 195} {"train_loss": -31.358718872070312, "global_step": 23637, "epoch": 195} {"train_loss": -30.971954345703125, "global_step": 23638, "epoch": 195} {"train_loss": -31.443159103393555, "global_step": 23639, "epoch": 195} {"train_loss": -30.69794273376465, "global_step": 23640, "epoch": 195} {"train_loss": -31.10772705078125, "global_step": 23641, "epoch": 195} {"train_loss": -30.664854049682617, "global_step": 23642, "epoch": 195} {"train_loss": -31.17754554748535, "global_step": 23643, "epoch": 195} {"train_loss": -30.62906837463379, "global_step": 23644, "epoch": 195} {"train_loss": -31.15387535095215, "global_step": 23645, "epoch": 195} {"train_loss": -30.829923629760742, "global_step": 23646, "epoch": 195} {"train_loss": -30.53977394104004, "global_step": 23647, "epoch": 195} {"train_loss": -31.051435470581055, "global_step": 23648, "epoch": 195} {"train_loss": -29.328643798828125, "global_step": 23649, "epoch": 195} {"train_loss": -25.998764038085938, "global_step": 23650, "epoch": 195} {"train_loss": -25.172983169555664, "global_step": 23651, "epoch": 195} {"train_loss": -28.299009323120117, "global_step": 23652, "epoch": 195} {"train_loss": -29.088653564453125, "global_step": 23653, "epoch": 195} {"train_loss": -29.691547393798828, "global_step": 23654, "epoch": 195} {"train_loss": -29.84260368347168, "global_step": 23655, "epoch": 195} {"train_loss": -31.173688888549805, "global_step": 23656, "epoch": 195} {"train_loss": -29.426294326782227, "global_step": 23657, "epoch": 195} {"train_loss": -29.03427505493164, "global_step": 23658, "epoch": 195} {"train_loss": -30.442108154296875, "global_step": 23659, "epoch": 195} {"train_loss": -30.49891471862793, "global_step": 23660, "epoch": 195} {"train_loss": -29.70167350769043, "global_step": 23661, "epoch": 195} {"train_loss": -30.452056884765625, "global_step": 23662, "epoch": 195} {"train_loss": -30.348310470581055, "global_step": 23663, "epoch": 195} {"train_loss": -29.915292739868164, "global_step": 23664, "epoch": 195} {"train_loss": -30.78444480895996, "global_step": 23665, "epoch": 195} {"train_loss": -30.303497314453125, "global_step": 23666, "epoch": 195} {"train_loss": -30.650480270385742, "global_step": 23667, "epoch": 195} {"train_loss": -30.558271408081055, "global_step": 23668, "epoch": 195} {"train_loss": -30.928573608398438, "global_step": 23669, "epoch": 195} {"train_loss": -30.867284774780273, "global_step": 23670, "epoch": 195} {"train_loss": -31.113157272338867, "global_step": 23671, "epoch": 195} {"train_loss": -30.918292999267578, "global_step": 23672, "epoch": 195} {"train_loss": -31.054792404174805, "global_step": 23673, "epoch": 195} {"train_loss": -30.608118057250977, "global_step": 23674, "epoch": 195} {"train_loss": -31.3134708404541, "global_step": 23675, "epoch": 195} {"train_loss": -30.84440040588379, "global_step": 23676, "epoch": 195} {"train_loss": -31.16034507751465, "global_step": 23677, "epoch": 195} {"train_loss": -30.914636611938477, "global_step": 23678, "epoch": 195} {"train_loss": -31.267902374267578, "global_step": 23679, "epoch": 195} {"train_loss": -30.941015243530273, "global_step": 23680, "epoch": 195} {"train_loss": -31.48406982421875, "global_step": 23681, "epoch": 195} {"train_loss": -30.658435821533203, "global_step": 23682, "epoch": 195} {"train_loss": -31.10896110534668, "global_step": 23683, "epoch": 195} {"train_loss": -31.328290939331055, "global_step": 23684, "epoch": 195} {"train_loss": -30.9980525970459, "global_step": 23685, "epoch": 195} {"train_loss": -30.930267333984375, "global_step": 23686, "epoch": 195} {"train_loss": -31.771381378173828, "global_step": 23687, "epoch": 195} {"train_loss": -31.1664981842041, "global_step": 23688, "epoch": 195} {"train_loss": -31.10452651977539, "global_step": 23689, "epoch": 195} {"train_loss": -30.91718101501465, "global_step": 23690, "epoch": 195} {"train_loss": -31.188329696655273, "global_step": 23691, "epoch": 195} {"train_loss": -31.608749389648438, "global_step": 23692, "epoch": 195} {"train_loss": -30.80488395690918, "global_step": 23693, "epoch": 195} {"train_loss": -30.9534912109375, "global_step": 23694, "epoch": 195} {"train_loss": -30.82710838317871, "global_step": 23695, "epoch": 195} {"train_loss": -31.07576560974121, "global_step": 23696, "epoch": 195} {"train_loss": -31.308820724487305, "global_step": 23697, "epoch": 195} {"train_loss": -30.900415420532227, "global_step": 23698, "epoch": 195} {"train_loss": -31.06283950805664, "global_step": 23699, "epoch": 195} {"train_loss": -31.152746200561523, "global_step": 23700, "epoch": 195} {"train_loss": -31.5623836517334, "global_step": 23701, "epoch": 195} {"train_loss": -31.020843505859375, "global_step": 23702, "epoch": 195} {"train_loss": -31.42283058166504, "global_step": 23703, "epoch": 195} {"train_loss": -31.310977935791016, "global_step": 23704, "epoch": 195} {"train_loss": -31.281835556030273, "global_step": 23705, "epoch": 195} {"train_loss": -30.96820068359375, "global_step": 23706, "epoch": 195} {"train_loss": -31.13325309753418, "global_step": 23707, "epoch": 195} {"train_loss": -31.628204345703125, "global_step": 23708, "epoch": 195} {"train_loss": -31.54107666015625, "global_step": 23709, "epoch": 195} {"train_loss": -31.440414428710938, "global_step": 23710, "epoch": 195} {"train_loss": -31.024921417236328, "global_step": 23711, "epoch": 195} {"train_loss": -31.474822998046875, "global_step": 23712, "epoch": 195} {"train_loss": -31.463428497314453, "global_step": 23713, "epoch": 195} {"train_loss": -31.340295791625977, "global_step": 23714, "epoch": 195} {"train_loss": -30.615334045788472, "global_step": 23715, "epoch": 195, "val_loss": 2631779.75} {"train_loss": -31.482086181640625, "global_step": 23716, "epoch": 196} {"train_loss": -31.538726806640625, "global_step": 23717, "epoch": 196} {"train_loss": -31.459577560424805, "global_step": 23718, "epoch": 196} {"train_loss": -31.960004806518555, "global_step": 23719, "epoch": 196} {"train_loss": -31.50908851623535, "global_step": 23720, "epoch": 196} {"train_loss": -31.229822158813477, "global_step": 23721, "epoch": 196} {"train_loss": -30.6444091796875, "global_step": 23722, "epoch": 196} {"train_loss": -30.56817054748535, "global_step": 23723, "epoch": 196} {"train_loss": -29.456165313720703, "global_step": 23724, "epoch": 196} {"train_loss": -29.227502822875977, "global_step": 23725, "epoch": 196} {"train_loss": -31.248859405517578, "global_step": 23726, "epoch": 196} {"train_loss": -31.258386611938477, "global_step": 23727, "epoch": 196} {"train_loss": -29.542388916015625, "global_step": 23728, "epoch": 196} {"train_loss": -30.476835250854492, "global_step": 23729, "epoch": 196} {"train_loss": -30.118122100830078, "global_step": 23730, "epoch": 196} {"train_loss": -30.078140258789062, "global_step": 23731, "epoch": 196} {"train_loss": -30.701034545898438, "global_step": 23732, "epoch": 196} {"train_loss": -31.18416404724121, "global_step": 23733, "epoch": 196} {"train_loss": -29.664276123046875, "global_step": 23734, "epoch": 196} {"train_loss": -28.75311851501465, "global_step": 23735, "epoch": 196} {"train_loss": -24.214181900024414, "global_step": 23736, "epoch": 196} {"train_loss": -19.242971420288086, "global_step": 23737, "epoch": 196} {"train_loss": -26.31550407409668, "global_step": 23738, "epoch": 196} {"train_loss": -26.598535537719727, "global_step": 23739, "epoch": 196} {"train_loss": -29.57081413269043, "global_step": 23740, "epoch": 196} {"train_loss": -28.0401668548584, "global_step": 23741, "epoch": 196} {"train_loss": -29.53521156311035, "global_step": 23742, "epoch": 196} {"train_loss": -30.243635177612305, "global_step": 23743, "epoch": 196} {"train_loss": -30.233722686767578, "global_step": 23744, "epoch": 196} {"train_loss": -29.941680908203125, "global_step": 23745, "epoch": 196} {"train_loss": -30.204679489135742, "global_step": 23746, "epoch": 196} {"train_loss": -30.56793212890625, "global_step": 23747, "epoch": 196} {"train_loss": -30.777912139892578, "global_step": 23748, "epoch": 196} {"train_loss": -30.870115280151367, "global_step": 23749, "epoch": 196} {"train_loss": -30.616592407226562, "global_step": 23750, "epoch": 196} {"train_loss": -30.874670028686523, "global_step": 23751, "epoch": 196} {"train_loss": -30.819971084594727, "global_step": 23752, "epoch": 196} {"train_loss": -30.356674194335938, "global_step": 23753, "epoch": 196} {"train_loss": -30.228113174438477, "global_step": 23754, "epoch": 196} {"train_loss": -30.138341903686523, "global_step": 23755, "epoch": 196} {"train_loss": -31.272846221923828, "global_step": 23756, "epoch": 196} {"train_loss": -30.594491958618164, "global_step": 23757, "epoch": 196} {"train_loss": -30.819562911987305, "global_step": 23758, "epoch": 196} {"train_loss": -31.025915145874023, "global_step": 23759, "epoch": 196} {"train_loss": -31.169178009033203, "global_step": 23760, "epoch": 196} {"train_loss": -30.88018226623535, "global_step": 23761, "epoch": 196} {"train_loss": -30.784086227416992, "global_step": 23762, "epoch": 196} {"train_loss": -30.928730010986328, "global_step": 23763, "epoch": 196} {"train_loss": -30.409666061401367, "global_step": 23764, "epoch": 196} {"train_loss": -30.820226669311523, "global_step": 23765, "epoch": 196} {"train_loss": -30.527875900268555, "global_step": 23766, "epoch": 196} {"train_loss": -31.204212188720703, "global_step": 23767, "epoch": 196} {"train_loss": -30.7392635345459, "global_step": 23768, "epoch": 196} {"train_loss": -30.316913604736328, "global_step": 23769, "epoch": 196} {"train_loss": -30.687345504760742, "global_step": 23770, "epoch": 196} {"train_loss": -30.268590927124023, "global_step": 23771, "epoch": 196} {"train_loss": -31.589834213256836, "global_step": 23772, "epoch": 196} {"train_loss": -30.604785919189453, "global_step": 23773, "epoch": 196} {"train_loss": -30.23554039001465, "global_step": 23774, "epoch": 196} {"train_loss": -30.293424606323242, "global_step": 23775, "epoch": 196} {"train_loss": -30.885974884033203, "global_step": 23776, "epoch": 196} {"train_loss": -30.22881507873535, "global_step": 23777, "epoch": 196} {"train_loss": -29.100019454956055, "global_step": 23778, "epoch": 196} {"train_loss": -30.427831649780273, "global_step": 23779, "epoch": 196} {"train_loss": -30.854883193969727, "global_step": 23780, "epoch": 196} {"train_loss": -29.790185928344727, "global_step": 23781, "epoch": 196} {"train_loss": -29.8775634765625, "global_step": 23782, "epoch": 196} {"train_loss": -29.925418853759766, "global_step": 23783, "epoch": 196} {"train_loss": -29.530319213867188, "global_step": 23784, "epoch": 196} {"train_loss": -31.07124900817871, "global_step": 23785, "epoch": 196} {"train_loss": -29.79041862487793, "global_step": 23786, "epoch": 196} {"train_loss": -29.06772232055664, "global_step": 23787, "epoch": 196} {"train_loss": -29.8248348236084, "global_step": 23788, "epoch": 196} {"train_loss": -28.924060821533203, "global_step": 23789, "epoch": 196} {"train_loss": -30.370227813720703, "global_step": 23790, "epoch": 196} {"train_loss": -30.315399169921875, "global_step": 23791, "epoch": 196} {"train_loss": -31.439111709594727, "global_step": 23792, "epoch": 196} {"train_loss": -30.33699607849121, "global_step": 23793, "epoch": 196} {"train_loss": -30.5609188079834, "global_step": 23794, "epoch": 196} {"train_loss": -30.592819213867188, "global_step": 23795, "epoch": 196} {"train_loss": -31.25856590270996, "global_step": 23796, "epoch": 196} {"train_loss": -30.5258846282959, "global_step": 23797, "epoch": 196} {"train_loss": -30.66619300842285, "global_step": 23798, "epoch": 196} {"train_loss": -30.223236083984375, "global_step": 23799, "epoch": 196} {"train_loss": -30.520954132080078, "global_step": 23800, "epoch": 196} {"train_loss": -30.295461654663086, "global_step": 23801, "epoch": 196} {"train_loss": -30.73406410217285, "global_step": 23802, "epoch": 196} {"train_loss": -30.54648208618164, "global_step": 23803, "epoch": 196} {"train_loss": -29.806325912475586, "global_step": 23804, "epoch": 196} {"train_loss": -30.445642471313477, "global_step": 23805, "epoch": 196} {"train_loss": -30.743066787719727, "global_step": 23806, "epoch": 196} {"train_loss": -30.329639434814453, "global_step": 23807, "epoch": 196} {"train_loss": -30.709680557250977, "global_step": 23808, "epoch": 196} {"train_loss": -30.72393226623535, "global_step": 23809, "epoch": 196} {"train_loss": -30.47677993774414, "global_step": 23810, "epoch": 196} {"train_loss": -31.091318130493164, "global_step": 23811, "epoch": 196} {"train_loss": -30.425573348999023, "global_step": 23812, "epoch": 196} {"train_loss": -30.366140365600586, "global_step": 23813, "epoch": 196} {"train_loss": -30.751758575439453, "global_step": 23814, "epoch": 196} {"train_loss": -30.77613639831543, "global_step": 23815, "epoch": 196} {"train_loss": -30.41641616821289, "global_step": 23816, "epoch": 196} {"train_loss": -31.23060417175293, "global_step": 23817, "epoch": 196} {"train_loss": -30.777179718017578, "global_step": 23818, "epoch": 196} {"train_loss": -31.179996490478516, "global_step": 23819, "epoch": 196} {"train_loss": -30.7678165435791, "global_step": 23820, "epoch": 196} {"train_loss": -31.228796005249023, "global_step": 23821, "epoch": 196} {"train_loss": -31.260705947875977, "global_step": 23822, "epoch": 196} {"train_loss": -31.319684982299805, "global_step": 23823, "epoch": 196} {"train_loss": -31.427011489868164, "global_step": 23824, "epoch": 196} {"train_loss": -31.170913696289062, "global_step": 23825, "epoch": 196} {"train_loss": -31.759313583374023, "global_step": 23826, "epoch": 196} {"train_loss": -31.424840927124023, "global_step": 23827, "epoch": 196} {"train_loss": -30.89784049987793, "global_step": 23828, "epoch": 196} {"train_loss": -31.31452751159668, "global_step": 23829, "epoch": 196} {"train_loss": -31.194061279296875, "global_step": 23830, "epoch": 196} {"train_loss": -31.158100128173828, "global_step": 23831, "epoch": 196} {"train_loss": -31.504491806030273, "global_step": 23832, "epoch": 196} {"train_loss": -31.313812255859375, "global_step": 23833, "epoch": 196} {"train_loss": -31.450963973999023, "global_step": 23834, "epoch": 196} {"train_loss": -31.890522003173828, "global_step": 23835, "epoch": 196} {"train_loss": -30.38493930406807, "global_step": 23836, "epoch": 196, "val_loss": 2770350.75} {"train_loss": -31.044708251953125, "global_step": 23837, "epoch": 197} {"train_loss": -30.975006103515625, "global_step": 23838, "epoch": 197} {"train_loss": -31.244176864624023, "global_step": 23839, "epoch": 197} {"train_loss": -30.872100830078125, "global_step": 23840, "epoch": 197} {"train_loss": -31.0338134765625, "global_step": 23841, "epoch": 197} {"train_loss": -28.94550132751465, "global_step": 23842, "epoch": 197} {"train_loss": -30.449329376220703, "global_step": 23843, "epoch": 197} {"train_loss": -29.049102783203125, "global_step": 23844, "epoch": 197} {"train_loss": -29.857019424438477, "global_step": 23845, "epoch": 197} {"train_loss": -28.77596092224121, "global_step": 23846, "epoch": 197} {"train_loss": -27.619495391845703, "global_step": 23847, "epoch": 197} {"train_loss": -28.556854248046875, "global_step": 23848, "epoch": 197} {"train_loss": -28.89692497253418, "global_step": 23849, "epoch": 197} {"train_loss": -30.62544059753418, "global_step": 23850, "epoch": 197} {"train_loss": -28.14788246154785, "global_step": 23851, "epoch": 197} {"train_loss": -29.189050674438477, "global_step": 23852, "epoch": 197} {"train_loss": -30.75791358947754, "global_step": 23853, "epoch": 197} {"train_loss": -29.11783790588379, "global_step": 23854, "epoch": 197} {"train_loss": -30.4050235748291, "global_step": 23855, "epoch": 197} {"train_loss": -30.56684684753418, "global_step": 23856, "epoch": 197} {"train_loss": -29.1458740234375, "global_step": 23857, "epoch": 197} {"train_loss": -30.195138931274414, "global_step": 23858, "epoch": 197} {"train_loss": -30.035058975219727, "global_step": 23859, "epoch": 197} {"train_loss": -30.13872718811035, "global_step": 23860, "epoch": 197} {"train_loss": -29.238203048706055, "global_step": 23861, "epoch": 197} {"train_loss": -29.343271255493164, "global_step": 23862, "epoch": 197} {"train_loss": -30.01197624206543, "global_step": 23863, "epoch": 197} {"train_loss": -30.35431480407715, "global_step": 23864, "epoch": 197} {"train_loss": -30.05755043029785, "global_step": 23865, "epoch": 197} {"train_loss": -30.508975982666016, "global_step": 23866, "epoch": 197} {"train_loss": -30.226154327392578, "global_step": 23867, "epoch": 197} {"train_loss": -30.184247970581055, "global_step": 23868, "epoch": 197} {"train_loss": -30.617002487182617, "global_step": 23869, "epoch": 197} {"train_loss": -30.942493438720703, "global_step": 23870, "epoch": 197} {"train_loss": -30.168439865112305, "global_step": 23871, "epoch": 197} {"train_loss": -31.038496017456055, "global_step": 23872, "epoch": 197} {"train_loss": -30.45542335510254, "global_step": 23873, "epoch": 197} {"train_loss": -30.39204216003418, "global_step": 23874, "epoch": 197} {"train_loss": -30.88905143737793, "global_step": 23875, "epoch": 197} {"train_loss": -30.482330322265625, "global_step": 23876, "epoch": 197} {"train_loss": -30.95478630065918, "global_step": 23877, "epoch": 197} {"train_loss": -30.838993072509766, "global_step": 23878, "epoch": 197} {"train_loss": -31.458755493164062, "global_step": 23879, "epoch": 197} {"train_loss": -30.29412269592285, "global_step": 23880, "epoch": 197} {"train_loss": -30.778181076049805, "global_step": 23881, "epoch": 197} {"train_loss": -31.155405044555664, "global_step": 23882, "epoch": 197} {"train_loss": -30.7210693359375, "global_step": 23883, "epoch": 197} {"train_loss": -30.718915939331055, "global_step": 23884, "epoch": 197} {"train_loss": -31.264591217041016, "global_step": 23885, "epoch": 197} {"train_loss": -31.045673370361328, "global_step": 23886, "epoch": 197} {"train_loss": -31.009511947631836, "global_step": 23887, "epoch": 197} {"train_loss": -31.208765029907227, "global_step": 23888, "epoch": 197} {"train_loss": -30.977481842041016, "global_step": 23889, "epoch": 197} {"train_loss": -31.151269912719727, "global_step": 23890, "epoch": 197} {"train_loss": -30.948896408081055, "global_step": 23891, "epoch": 197} {"train_loss": -30.58426284790039, "global_step": 23892, "epoch": 197} {"train_loss": -31.236433029174805, "global_step": 23893, "epoch": 197} {"train_loss": -31.255615234375, "global_step": 23894, "epoch": 197} {"train_loss": -30.155256271362305, "global_step": 23895, "epoch": 197} {"train_loss": -30.33692741394043, "global_step": 23896, "epoch": 197} {"train_loss": -30.714893341064453, "global_step": 23897, "epoch": 197} {"train_loss": -31.1668701171875, "global_step": 23898, "epoch": 197} {"train_loss": -30.691755294799805, "global_step": 23899, "epoch": 197} {"train_loss": -30.539657592773438, "global_step": 23900, "epoch": 197} {"train_loss": -30.687835693359375, "global_step": 23901, "epoch": 197} {"train_loss": -31.551366806030273, "global_step": 23902, "epoch": 197} {"train_loss": -30.449060440063477, "global_step": 23903, "epoch": 197} {"train_loss": -31.208459854125977, "global_step": 23904, "epoch": 197} {"train_loss": -31.28260612487793, "global_step": 23905, "epoch": 197} {"train_loss": -31.263235092163086, "global_step": 23906, "epoch": 197} {"train_loss": -30.88027000427246, "global_step": 23907, "epoch": 197} {"train_loss": -30.96088981628418, "global_step": 23908, "epoch": 197} {"train_loss": -31.24026870727539, "global_step": 23909, "epoch": 197} {"train_loss": -30.48699378967285, "global_step": 23910, "epoch": 197} {"train_loss": -30.849761962890625, "global_step": 23911, "epoch": 197} {"train_loss": -30.80909538269043, "global_step": 23912, "epoch": 197} {"train_loss": -31.243000030517578, "global_step": 23913, "epoch": 197} {"train_loss": -30.850217819213867, "global_step": 23914, "epoch": 197} {"train_loss": -31.37867546081543, "global_step": 23915, "epoch": 197} {"train_loss": -31.0439510345459, "global_step": 23916, "epoch": 197} {"train_loss": -31.65899658203125, "global_step": 23917, "epoch": 197} {"train_loss": -31.185346603393555, "global_step": 23918, "epoch": 197} {"train_loss": -32.033447265625, "global_step": 23919, "epoch": 197} {"train_loss": -31.495269775390625, "global_step": 23920, "epoch": 197} {"train_loss": -31.940414428710938, "global_step": 23921, "epoch": 197} {"train_loss": -31.769861221313477, "global_step": 23922, "epoch": 197} {"train_loss": -31.5100040435791, "global_step": 23923, "epoch": 197} {"train_loss": -31.666479110717773, "global_step": 23924, "epoch": 197} {"train_loss": -31.24653434753418, "global_step": 23925, "epoch": 197} {"train_loss": -31.251285552978516, "global_step": 23926, "epoch": 197} {"train_loss": -31.0969295501709, "global_step": 23927, "epoch": 197} {"train_loss": -31.0062255859375, "global_step": 23928, "epoch": 197} {"train_loss": -30.071340560913086, "global_step": 23929, "epoch": 197} {"train_loss": -28.746326446533203, "global_step": 23930, "epoch": 197} {"train_loss": -29.82084083557129, "global_step": 23931, "epoch": 197} {"train_loss": -30.337080001831055, "global_step": 23932, "epoch": 197} {"train_loss": -30.131885528564453, "global_step": 23933, "epoch": 197} {"train_loss": -31.482275009155273, "global_step": 23934, "epoch": 197} {"train_loss": -30.778547286987305, "global_step": 23935, "epoch": 197} {"train_loss": -31.61150550842285, "global_step": 23936, "epoch": 197} {"train_loss": -31.689010620117188, "global_step": 23937, "epoch": 197} {"train_loss": -30.51845359802246, "global_step": 23938, "epoch": 197} {"train_loss": -30.454212188720703, "global_step": 23939, "epoch": 197} {"train_loss": -28.869232177734375, "global_step": 23940, "epoch": 197} {"train_loss": -27.75886344909668, "global_step": 23941, "epoch": 197} {"train_loss": -25.96087646484375, "global_step": 23942, "epoch": 197} {"train_loss": -27.071949005126953, "global_step": 23943, "epoch": 197} {"train_loss": -30.977136611938477, "global_step": 23944, "epoch": 197} {"train_loss": -28.948822021484375, "global_step": 23945, "epoch": 197} {"train_loss": -29.346332550048828, "global_step": 23946, "epoch": 197} {"train_loss": -30.394819259643555, "global_step": 23947, "epoch": 197} {"train_loss": -29.704666137695312, "global_step": 23948, "epoch": 197} {"train_loss": -31.086612701416016, "global_step": 23949, "epoch": 197} {"train_loss": -30.460962295532227, "global_step": 23950, "epoch": 197} {"train_loss": -31.18955421447754, "global_step": 23951, "epoch": 197} {"train_loss": -31.01350212097168, "global_step": 23952, "epoch": 197} {"train_loss": -30.60737419128418, "global_step": 23953, "epoch": 197} {"train_loss": -31.107192993164062, "global_step": 23954, "epoch": 197} {"train_loss": -30.87265396118164, "global_step": 23955, "epoch": 197} {"train_loss": -31.204504013061523, "global_step": 23956, "epoch": 197} {"train_loss": -30.48827551219089, "global_step": 23957, "epoch": 197, "val_loss": 2589342.0} {"train_loss": -30.95387077331543, "global_step": 23958, "epoch": 198} {"train_loss": -31.263446807861328, "global_step": 23959, "epoch": 198} {"train_loss": -31.3952693939209, "global_step": 23960, "epoch": 198} {"train_loss": -31.037689208984375, "global_step": 23961, "epoch": 198} {"train_loss": -30.441715240478516, "global_step": 23962, "epoch": 198} {"train_loss": -29.556339263916016, "global_step": 23963, "epoch": 198} {"train_loss": -29.87759780883789, "global_step": 23964, "epoch": 198} {"train_loss": -28.921178817749023, "global_step": 23965, "epoch": 198} {"train_loss": -29.861408233642578, "global_step": 23966, "epoch": 198} {"train_loss": -29.444616317749023, "global_step": 23967, "epoch": 198} {"train_loss": -30.619037628173828, "global_step": 23968, "epoch": 198} {"train_loss": -31.007543563842773, "global_step": 23969, "epoch": 198} {"train_loss": -30.43120765686035, "global_step": 23970, "epoch": 198} {"train_loss": -29.821638107299805, "global_step": 23971, "epoch": 198} {"train_loss": -30.345449447631836, "global_step": 23972, "epoch": 198} {"train_loss": -29.89739418029785, "global_step": 23973, "epoch": 198} {"train_loss": -30.377593994140625, "global_step": 23974, "epoch": 198} {"train_loss": -30.22052001953125, "global_step": 23975, "epoch": 198} {"train_loss": -30.011159896850586, "global_step": 23976, "epoch": 198} {"train_loss": -30.0889835357666, "global_step": 23977, "epoch": 198} {"train_loss": -29.46563720703125, "global_step": 23978, "epoch": 198} {"train_loss": -30.26032066345215, "global_step": 23979, "epoch": 198} {"train_loss": -30.39739418029785, "global_step": 23980, "epoch": 198} {"train_loss": -30.194379806518555, "global_step": 23981, "epoch": 198} {"train_loss": -29.271528244018555, "global_step": 23982, "epoch": 198} {"train_loss": -30.53973388671875, "global_step": 23983, "epoch": 198} {"train_loss": -30.566022872924805, "global_step": 23984, "epoch": 198} {"train_loss": -30.05341148376465, "global_step": 23985, "epoch": 198} {"train_loss": -29.819921493530273, "global_step": 23986, "epoch": 198} {"train_loss": -30.79026222229004, "global_step": 23987, "epoch": 198} {"train_loss": -30.21192741394043, "global_step": 23988, "epoch": 198} {"train_loss": -29.986783981323242, "global_step": 23989, "epoch": 198} {"train_loss": -30.438098907470703, "global_step": 23990, "epoch": 198} {"train_loss": -29.618677139282227, "global_step": 23991, "epoch": 198} {"train_loss": -30.70387840270996, "global_step": 23992, "epoch": 198} {"train_loss": -30.55792808532715, "global_step": 23993, "epoch": 198} {"train_loss": -29.302743911743164, "global_step": 23994, "epoch": 198} {"train_loss": -30.83222007751465, "global_step": 23995, "epoch": 198} {"train_loss": -30.699201583862305, "global_step": 23996, "epoch": 198} {"train_loss": -30.85735511779785, "global_step": 23997, "epoch": 198} {"train_loss": -30.472288131713867, "global_step": 23998, "epoch": 198} {"train_loss": -31.463947296142578, "global_step": 23999, "epoch": 198} {"train_loss": -30.800186157226562, "global_step": 24000, "epoch": 198} {"train_loss": -30.002593994140625, "global_step": 24001, "epoch": 198} {"train_loss": -30.389867782592773, "global_step": 24002, "epoch": 198} {"train_loss": -31.213727951049805, "global_step": 24003, "epoch": 198} {"train_loss": -31.424917221069336, "global_step": 24004, "epoch": 198} {"train_loss": -30.117874145507812, "global_step": 24005, "epoch": 198} {"train_loss": -30.892242431640625, "global_step": 24006, "epoch": 198} {"train_loss": -31.285390853881836, "global_step": 24007, "epoch": 198} {"train_loss": -29.585676193237305, "global_step": 24008, "epoch": 198} {"train_loss": -30.75188636779785, "global_step": 24009, "epoch": 198} {"train_loss": -31.379858016967773, "global_step": 24010, "epoch": 198} {"train_loss": -30.60162353515625, "global_step": 24011, "epoch": 198} {"train_loss": -30.578571319580078, "global_step": 24012, "epoch": 198} {"train_loss": -31.220733642578125, "global_step": 24013, "epoch": 198} {"train_loss": -30.479040145874023, "global_step": 24014, "epoch": 198} {"train_loss": -31.916868209838867, "global_step": 24015, "epoch": 198} {"train_loss": -31.155912399291992, "global_step": 24016, "epoch": 198} {"train_loss": -31.133697509765625, "global_step": 24017, "epoch": 198} {"train_loss": -31.526762008666992, "global_step": 24018, "epoch": 198} {"train_loss": -31.323352813720703, "global_step": 24019, "epoch": 198} {"train_loss": -31.93552017211914, "global_step": 24020, "epoch": 198} {"train_loss": -31.597715377807617, "global_step": 24021, "epoch": 198} {"train_loss": -31.376178741455078, "global_step": 24022, "epoch": 198} {"train_loss": -31.69586181640625, "global_step": 24023, "epoch": 198} {"train_loss": -31.308643341064453, "global_step": 24024, "epoch": 198} {"train_loss": -31.70979881286621, "global_step": 24025, "epoch": 198} {"train_loss": -31.97181510925293, "global_step": 24026, "epoch": 198} {"train_loss": -31.561559677124023, "global_step": 24027, "epoch": 198} {"train_loss": -31.59247398376465, "global_step": 24028, "epoch": 198} {"train_loss": -31.567340850830078, "global_step": 24029, "epoch": 198} {"train_loss": -31.4017333984375, "global_step": 24030, "epoch": 198} {"train_loss": -31.39227294921875, "global_step": 24031, "epoch": 198} {"train_loss": -31.367267608642578, "global_step": 24032, "epoch": 198} {"train_loss": -32.239173889160156, "global_step": 24033, "epoch": 198} {"train_loss": -31.680021286010742, "global_step": 24034, "epoch": 198} {"train_loss": -31.814184188842773, "global_step": 24035, "epoch": 198} {"train_loss": -31.74102783203125, "global_step": 24036, "epoch": 198} {"train_loss": -31.96927261352539, "global_step": 24037, "epoch": 198} {"train_loss": -31.654226303100586, "global_step": 24038, "epoch": 198} {"train_loss": -31.464441299438477, "global_step": 24039, "epoch": 198} {"train_loss": -31.43006706237793, "global_step": 24040, "epoch": 198} {"train_loss": -31.703123092651367, "global_step": 24041, "epoch": 198} {"train_loss": -31.907073974609375, "global_step": 24042, "epoch": 198} {"train_loss": -31.85312843322754, "global_step": 24043, "epoch": 198} {"train_loss": -31.8487606048584, "global_step": 24044, "epoch": 198} {"train_loss": -31.717639923095703, "global_step": 24045, "epoch": 198} {"train_loss": -32.0148811340332, "global_step": 24046, "epoch": 198} {"train_loss": -31.969940185546875, "global_step": 24047, "epoch": 198} {"train_loss": -31.91228675842285, "global_step": 24048, "epoch": 198} {"train_loss": -31.866806030273438, "global_step": 24049, "epoch": 198} {"train_loss": -31.133886337280273, "global_step": 24050, "epoch": 198} {"train_loss": -31.194135665893555, "global_step": 24051, "epoch": 198} {"train_loss": -30.896772384643555, "global_step": 24052, "epoch": 198} {"train_loss": -31.24395751953125, "global_step": 24053, "epoch": 198} {"train_loss": -30.868331909179688, "global_step": 24054, "epoch": 198} {"train_loss": -31.734272003173828, "global_step": 24055, "epoch": 198} {"train_loss": -31.986494064331055, "global_step": 24056, "epoch": 198} {"train_loss": -31.29157066345215, "global_step": 24057, "epoch": 198} {"train_loss": -29.26276206970215, "global_step": 24058, "epoch": 198} {"train_loss": -26.5804443359375, "global_step": 24059, "epoch": 198} {"train_loss": -20.5190486907959, "global_step": 24060, "epoch": 198} {"train_loss": -7.381014347076416, "global_step": 24061, "epoch": 198} {"train_loss": -5.770808696746826, "global_step": 24062, "epoch": 198} {"train_loss": -28.7362060546875, "global_step": 24063, "epoch": 198} {"train_loss": -20.585779190063477, "global_step": 24064, "epoch": 198} {"train_loss": -28.54096794128418, "global_step": 24065, "epoch": 198} {"train_loss": -25.862049102783203, "global_step": 24066, "epoch": 198} {"train_loss": -25.793914794921875, "global_step": 24067, "epoch": 198} {"train_loss": -29.04379653930664, "global_step": 24068, "epoch": 198} {"train_loss": -27.66947364807129, "global_step": 24069, "epoch": 198} {"train_loss": -25.187694549560547, "global_step": 24070, "epoch": 198} {"train_loss": -27.9613037109375, "global_step": 24071, "epoch": 198} {"train_loss": -28.848041534423828, "global_step": 24072, "epoch": 198} {"train_loss": -26.904052734375, "global_step": 24073, "epoch": 198} {"train_loss": -29.667810440063477, "global_step": 24074, "epoch": 198} {"train_loss": -27.874738693237305, "global_step": 24075, "epoch": 198} {"train_loss": -28.47382164001465, "global_step": 24076, "epoch": 198} {"train_loss": -27.707233428955078, "global_step": 24077, "epoch": 198} {"train_loss": -29.9135487926893, "global_step": 24078, "epoch": 198, "val_loss": 2708507.0} {"train_loss": -29.0955810546875, "global_step": 24079, "epoch": 199} {"train_loss": -30.0677433013916, "global_step": 24080, "epoch": 199} {"train_loss": -29.207788467407227, "global_step": 24081, "epoch": 199} {"train_loss": -29.196826934814453, "global_step": 24082, "epoch": 199} {"train_loss": -29.35309410095215, "global_step": 24083, "epoch": 199} {"train_loss": -29.35064697265625, "global_step": 24084, "epoch": 199} {"train_loss": -29.71892738342285, "global_step": 24085, "epoch": 199} {"train_loss": -29.778486251831055, "global_step": 24086, "epoch": 199} {"train_loss": -30.005126953125, "global_step": 24087, "epoch": 199} {"train_loss": -30.096418380737305, "global_step": 24088, "epoch": 199} {"train_loss": -30.121234893798828, "global_step": 24089, "epoch": 199} {"train_loss": -30.070175170898438, "global_step": 24090, "epoch": 199} {"train_loss": -30.20298194885254, "global_step": 24091, "epoch": 199} {"train_loss": -30.088092803955078, "global_step": 24092, "epoch": 199} {"train_loss": -29.83587074279785, "global_step": 24093, "epoch": 199} {"train_loss": -29.79721450805664, "global_step": 24094, "epoch": 199} {"train_loss": -30.10328483581543, "global_step": 24095, "epoch": 199} {"train_loss": -30.198514938354492, "global_step": 24096, "epoch": 199} {"train_loss": -30.07648277282715, "global_step": 24097, "epoch": 199} {"train_loss": -29.99957275390625, "global_step": 24098, "epoch": 199} {"train_loss": -29.81426429748535, "global_step": 24099, "epoch": 199} {"train_loss": -30.40272331237793, "global_step": 24100, "epoch": 199} {"train_loss": -29.967105865478516, "global_step": 24101, "epoch": 199} {"train_loss": -29.9920654296875, "global_step": 24102, "epoch": 199} {"train_loss": -30.529132843017578, "global_step": 24103, "epoch": 199} {"train_loss": -30.459630966186523, "global_step": 24104, "epoch": 199} {"train_loss": -30.12177848815918, "global_step": 24105, "epoch": 199} {"train_loss": -30.566686630249023, "global_step": 24106, "epoch": 199} {"train_loss": -30.650388717651367, "global_step": 24107, "epoch": 199} {"train_loss": -30.680500030517578, "global_step": 24108, "epoch": 199} {"train_loss": -30.36958122253418, "global_step": 24109, "epoch": 199} {"train_loss": -30.396961212158203, "global_step": 24110, "epoch": 199} {"train_loss": -29.894363403320312, "global_step": 24111, "epoch": 199} {"train_loss": -30.305530548095703, "global_step": 24112, "epoch": 199} {"train_loss": -30.400304794311523, "global_step": 24113, "epoch": 199} {"train_loss": -30.163223266601562, "global_step": 24114, "epoch": 199} {"train_loss": -29.80032730102539, "global_step": 24115, "epoch": 199} {"train_loss": -29.236181259155273, "global_step": 24116, "epoch": 199} {"train_loss": -28.210275650024414, "global_step": 24117, "epoch": 199} {"train_loss": -28.683820724487305, "global_step": 24118, "epoch": 199} {"train_loss": -30.40070152282715, "global_step": 24119, "epoch": 199} {"train_loss": -30.469470977783203, "global_step": 24120, "epoch": 199} {"train_loss": -30.478137969970703, "global_step": 24121, "epoch": 199} {"train_loss": -30.369049072265625, "global_step": 24122, "epoch": 199} {"train_loss": -30.707799911499023, "global_step": 24123, "epoch": 199} {"train_loss": -30.2973690032959, "global_step": 24124, "epoch": 199} {"train_loss": -30.05586051940918, "global_step": 24125, "epoch": 199} {"train_loss": -30.81641960144043, "global_step": 24126, "epoch": 199} {"train_loss": -30.412250518798828, "global_step": 24127, "epoch": 199} {"train_loss": -30.919912338256836, "global_step": 24128, "epoch": 199} {"train_loss": -30.372949600219727, "global_step": 24129, "epoch": 199} {"train_loss": -30.57425880432129, "global_step": 24130, "epoch": 199} {"train_loss": -30.286148071289062, "global_step": 24131, "epoch": 199} {"train_loss": -30.01494789123535, "global_step": 24132, "epoch": 199} {"train_loss": -30.5017032623291, "global_step": 24133, "epoch": 199} {"train_loss": -29.697463989257812, "global_step": 24134, "epoch": 199} {"train_loss": -30.22532081604004, "global_step": 24135, "epoch": 199} {"train_loss": -30.187788009643555, "global_step": 24136, "epoch": 199} {"train_loss": -30.149398803710938, "global_step": 24137, "epoch": 199} {"train_loss": -29.12387466430664, "global_step": 24138, "epoch": 199} {"train_loss": -23.180341720581055, "global_step": 24139, "epoch": 199} {"train_loss": -5.827807903289795, "global_step": 24140, "epoch": 199} {"train_loss": -7.203355312347412, "global_step": 24141, "epoch": 199} {"train_loss": -29.168292999267578, "global_step": 24142, "epoch": 199} {"train_loss": -12.226805686950684, "global_step": 24143, "epoch": 199} {"train_loss": -28.664194107055664, "global_step": 24144, "epoch": 199} {"train_loss": -24.3482723236084, "global_step": 24145, "epoch": 199} {"train_loss": -22.607486724853516, "global_step": 24146, "epoch": 199} {"train_loss": -29.05854606628418, "global_step": 24147, "epoch": 199} {"train_loss": -28.506210327148438, "global_step": 24148, "epoch": 199} {"train_loss": -26.952484130859375, "global_step": 24149, "epoch": 199} {"train_loss": -27.092809677124023, "global_step": 24150, "epoch": 199} {"train_loss": -28.130237579345703, "global_step": 24151, "epoch": 199} {"train_loss": -28.35487937927246, "global_step": 24152, "epoch": 199} {"train_loss": -28.773569107055664, "global_step": 24153, "epoch": 199} {"train_loss": -28.931970596313477, "global_step": 24154, "epoch": 199} {"train_loss": -28.387189865112305, "global_step": 24155, "epoch": 199} {"train_loss": -28.317569732666016, "global_step": 24156, "epoch": 199} {"train_loss": -28.153217315673828, "global_step": 24157, "epoch": 199} {"train_loss": -28.525060653686523, "global_step": 24158, "epoch": 199} {"train_loss": -28.960845947265625, "global_step": 24159, "epoch": 199} {"train_loss": -29.048267364501953, "global_step": 24160, "epoch": 199} {"train_loss": -29.25872802734375, "global_step": 24161, "epoch": 199} {"train_loss": -29.483551025390625, "global_step": 24162, "epoch": 199} {"train_loss": -28.9737606048584, "global_step": 24163, "epoch": 199} {"train_loss": -29.356367111206055, "global_step": 24164, "epoch": 199} {"train_loss": -29.29513931274414, "global_step": 24165, "epoch": 199} {"train_loss": -29.383438110351562, "global_step": 24166, "epoch": 199} {"train_loss": -29.488611221313477, "global_step": 24167, "epoch": 199} {"train_loss": -29.4138240814209, "global_step": 24168, "epoch": 199} {"train_loss": -29.3984432220459, "global_step": 24169, "epoch": 199} {"train_loss": -29.253040313720703, "global_step": 24170, "epoch": 199} {"train_loss": -29.928043365478516, "global_step": 24171, "epoch": 199} {"train_loss": -29.7343692779541, "global_step": 24172, "epoch": 199} {"train_loss": -29.4505615234375, "global_step": 24173, "epoch": 199} {"train_loss": -29.81922721862793, "global_step": 24174, "epoch": 199} {"train_loss": -29.95977783203125, "global_step": 24175, "epoch": 199} {"train_loss": -29.731393814086914, "global_step": 24176, "epoch": 199} {"train_loss": -29.582263946533203, "global_step": 24177, "epoch": 199} {"train_loss": -29.89051628112793, "global_step": 24178, "epoch": 199} {"train_loss": -29.994836807250977, "global_step": 24179, "epoch": 199} {"train_loss": -30.136890411376953, "global_step": 24180, "epoch": 199} {"train_loss": -29.683643341064453, "global_step": 24181, "epoch": 199} {"train_loss": -29.81464195251465, "global_step": 24182, "epoch": 199} {"train_loss": -30.3106746673584, "global_step": 24183, "epoch": 199} {"train_loss": -30.28610610961914, "global_step": 24184, "epoch": 199} {"train_loss": -30.349206924438477, "global_step": 24185, "epoch": 199} {"train_loss": -30.04620933532715, "global_step": 24186, "epoch": 199} {"train_loss": -30.015399932861328, "global_step": 24187, "epoch": 199} {"train_loss": -30.222204208374023, "global_step": 24188, "epoch": 199} {"train_loss": -30.534696578979492, "global_step": 24189, "epoch": 199} {"train_loss": -30.066104888916016, "global_step": 24190, "epoch": 199} {"train_loss": -30.42056655883789, "global_step": 24191, "epoch": 199} {"train_loss": -30.317157745361328, "global_step": 24192, "epoch": 199} {"train_loss": -30.155139923095703, "global_step": 24193, "epoch": 199} {"train_loss": -30.590167999267578, "global_step": 24194, "epoch": 199} {"train_loss": -30.019607543945312, "global_step": 24195, "epoch": 199} {"train_loss": -30.171024322509766, "global_step": 24196, "epoch": 199} {"train_loss": -30.52667236328125, "global_step": 24197, "epoch": 199} {"train_loss": -30.0943603515625, "global_step": 24198, "epoch": 199} {"train_loss": -29.079782296803373, "global_step": 24199, "epoch": 199, "val_loss": 2498462.25} {"train_loss": -29.626605987548828, "global_step": 24200, "epoch": 200} {"train_loss": -30.168798446655273, "global_step": 24201, "epoch": 200} {"train_loss": -30.360380172729492, "global_step": 24202, "epoch": 200} {"train_loss": -29.976306915283203, "global_step": 24203, "epoch": 200} {"train_loss": -30.209619522094727, "global_step": 24204, "epoch": 200} {"train_loss": -29.727262496948242, "global_step": 24205, "epoch": 200} {"train_loss": -30.4586238861084, "global_step": 24206, "epoch": 200} {"train_loss": -29.902074813842773, "global_step": 24207, "epoch": 200} {"train_loss": -30.362430572509766, "global_step": 24208, "epoch": 200} {"train_loss": -30.116674423217773, "global_step": 24209, "epoch": 200} {"train_loss": -29.799015045166016, "global_step": 24210, "epoch": 200} {"train_loss": -30.461902618408203, "global_step": 24211, "epoch": 200} {"train_loss": -30.013427734375, "global_step": 24212, "epoch": 200} {"train_loss": -30.45267677307129, "global_step": 24213, "epoch": 200} {"train_loss": -30.597070693969727, "global_step": 24214, "epoch": 200} {"train_loss": -29.993087768554688, "global_step": 24215, "epoch": 200} {"train_loss": -30.66242027282715, "global_step": 24216, "epoch": 200} {"train_loss": -30.298065185546875, "global_step": 24217, "epoch": 200} {"train_loss": -30.597885131835938, "global_step": 24218, "epoch": 200} {"train_loss": -30.8457088470459, "global_step": 24219, "epoch": 200} {"train_loss": -30.621063232421875, "global_step": 24220, "epoch": 200} {"train_loss": -30.641651153564453, "global_step": 24221, "epoch": 200} {"train_loss": -30.085651397705078, "global_step": 24222, "epoch": 200} {"train_loss": -28.456933975219727, "global_step": 24223, "epoch": 200} {"train_loss": -22.47871208190918, "global_step": 24224, "epoch": 200} {"train_loss": -7.9016008377075195, "global_step": 24225, "epoch": 200} {"train_loss": 11.43435287475586, "global_step": 24226, "epoch": 200} {"train_loss": -10.932281494140625, "global_step": 24227, "epoch": 200} {"train_loss": -21.147993087768555, "global_step": 24228, "epoch": 200} {"train_loss": -23.367528915405273, "global_step": 24229, "epoch": 200} {"train_loss": -17.592138290405273, "global_step": 24230, "epoch": 200} {"train_loss": -28.13092613220215, "global_step": 24231, "epoch": 200} {"train_loss": -26.962182998657227, "global_step": 24232, "epoch": 200} {"train_loss": -23.159982681274414, "global_step": 24233, "epoch": 200} {"train_loss": -25.39642906188965, "global_step": 24234, "epoch": 200} {"train_loss": -28.84942054748535, "global_step": 24235, "epoch": 200} {"train_loss": -28.715768814086914, "global_step": 24236, "epoch": 200} {"train_loss": -28.049345016479492, "global_step": 24237, "epoch": 200} {"train_loss": -27.733081817626953, "global_step": 24238, "epoch": 200} {"train_loss": -27.424585342407227, "global_step": 24239, "epoch": 200} {"train_loss": -28.305200576782227, "global_step": 24240, "epoch": 200} {"train_loss": -27.815872192382812, "global_step": 24241, "epoch": 200} {"train_loss": -28.22199821472168, "global_step": 24242, "epoch": 200} {"train_loss": -28.590723037719727, "global_step": 24243, "epoch": 200} {"train_loss": -28.825345993041992, "global_step": 24244, "epoch": 200} {"train_loss": -28.2078914642334, "global_step": 24245, "epoch": 200} {"train_loss": -28.73832130432129, "global_step": 24246, "epoch": 200} {"train_loss": -28.698719024658203, "global_step": 24247, "epoch": 200} {"train_loss": -28.790292739868164, "global_step": 24248, "epoch": 200} {"train_loss": -28.805561065673828, "global_step": 24249, "epoch": 200} {"train_loss": -29.1098575592041, "global_step": 24250, "epoch": 200} {"train_loss": -29.240116119384766, "global_step": 24251, "epoch": 200} {"train_loss": -29.28733253479004, "global_step": 24252, "epoch": 200} {"train_loss": -29.401325225830078, "global_step": 24253, "epoch": 200} {"train_loss": -29.30523109436035, "global_step": 24254, "epoch": 200} {"train_loss": -29.258771896362305, "global_step": 24255, "epoch": 200} {"train_loss": -29.520980834960938, "global_step": 24256, "epoch": 200} {"train_loss": -29.428821563720703, "global_step": 24257, "epoch": 200} {"train_loss": -29.5694580078125, "global_step": 24258, "epoch": 200} {"train_loss": -29.3630313873291, "global_step": 24259, "epoch": 200} {"train_loss": -29.777496337890625, "global_step": 24260, "epoch": 200} {"train_loss": -29.134296417236328, "global_step": 24261, "epoch": 200} {"train_loss": -29.96465492248535, "global_step": 24262, "epoch": 200} {"train_loss": -29.211530685424805, "global_step": 24263, "epoch": 200} {"train_loss": -29.735807418823242, "global_step": 24264, "epoch": 200} {"train_loss": -29.713916778564453, "global_step": 24265, "epoch": 200} {"train_loss": -29.66827392578125, "global_step": 24266, "epoch": 200} {"train_loss": -29.92245864868164, "global_step": 24267, "epoch": 200} {"train_loss": -29.244720458984375, "global_step": 24268, "epoch": 200} {"train_loss": -29.985198974609375, "global_step": 24269, "epoch": 200} {"train_loss": -29.37569236755371, "global_step": 24270, "epoch": 200} {"train_loss": -29.739614486694336, "global_step": 24271, "epoch": 200} {"train_loss": -29.470853805541992, "global_step": 24272, "epoch": 200} {"train_loss": -29.76287841796875, "global_step": 24273, "epoch": 200} {"train_loss": -29.347070693969727, "global_step": 24274, "epoch": 200} {"train_loss": -29.52433204650879, "global_step": 24275, "epoch": 200} {"train_loss": -30.114267349243164, "global_step": 24276, "epoch": 200} {"train_loss": -29.456220626831055, "global_step": 24277, "epoch": 200} {"train_loss": -29.706928253173828, "global_step": 24278, "epoch": 200} {"train_loss": -29.47314453125, "global_step": 24279, "epoch": 200} {"train_loss": -29.20659828186035, "global_step": 24280, "epoch": 200} {"train_loss": -29.427474975585938, "global_step": 24281, "epoch": 200} {"train_loss": -29.977060317993164, "global_step": 24282, "epoch": 200} {"train_loss": -29.23695182800293, "global_step": 24283, "epoch": 200} {"train_loss": -29.2850341796875, "global_step": 24284, "epoch": 200} {"train_loss": -29.35564613342285, "global_step": 24285, "epoch": 200} {"train_loss": -29.839624404907227, "global_step": 24286, "epoch": 200} {"train_loss": -29.41925048828125, "global_step": 24287, "epoch": 200} {"train_loss": -29.639368057250977, "global_step": 24288, "epoch": 200} {"train_loss": -28.925363540649414, "global_step": 24289, "epoch": 200} {"train_loss": -29.3642520904541, "global_step": 24290, "epoch": 200} {"train_loss": -29.491575241088867, "global_step": 24291, "epoch": 200} {"train_loss": -28.9454402923584, "global_step": 24292, "epoch": 200} {"train_loss": -29.102148056030273, "global_step": 24293, "epoch": 200} {"train_loss": -29.75701904296875, "global_step": 24294, "epoch": 200} {"train_loss": -27.9766902923584, "global_step": 24295, "epoch": 200} {"train_loss": -28.622695922851562, "global_step": 24296, "epoch": 200} {"train_loss": -29.542993545532227, "global_step": 24297, "epoch": 200} {"train_loss": -28.490049362182617, "global_step": 24298, "epoch": 200} {"train_loss": -29.500524520874023, "global_step": 24299, "epoch": 200} {"train_loss": -28.6801815032959, "global_step": 24300, "epoch": 200} {"train_loss": -29.074750900268555, "global_step": 24301, "epoch": 200} {"train_loss": -28.482532501220703, "global_step": 24302, "epoch": 200} {"train_loss": -28.922765731811523, "global_step": 24303, "epoch": 200} {"train_loss": -29.19911003112793, "global_step": 24304, "epoch": 200} {"train_loss": -28.4161376953125, "global_step": 24305, "epoch": 200} {"train_loss": -29.722517013549805, "global_step": 24306, "epoch": 200} {"train_loss": -29.174819946289062, "global_step": 24307, "epoch": 200} {"train_loss": -28.890844345092773, "global_step": 24308, "epoch": 200} {"train_loss": -29.709735870361328, "global_step": 24309, "epoch": 200} {"train_loss": -29.538244247436523, "global_step": 24310, "epoch": 200} {"train_loss": -29.393537521362305, "global_step": 24311, "epoch": 200} {"train_loss": -30.0391788482666, "global_step": 24312, "epoch": 200} {"train_loss": -29.907623291015625, "global_step": 24313, "epoch": 200} {"train_loss": -29.321760177612305, "global_step": 24314, "epoch": 200} {"train_loss": -29.68061637878418, "global_step": 24315, "epoch": 200} {"train_loss": -30.02023696899414, "global_step": 24316, "epoch": 200} {"train_loss": -30.036569595336914, "global_step": 24317, "epoch": 200} {"train_loss": -30.322742462158203, "global_step": 24318, "epoch": 200} {"train_loss": -29.95621109008789, "global_step": 24319, "epoch": 200} {"train_loss": -28.38820351056816, "global_step": 24320, "epoch": 200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2502337.75} {"train_loss": -30.474853515625, "global_step": 24321, "epoch": 201} {"train_loss": -30.37189292907715, "global_step": 24322, "epoch": 201} {"train_loss": -29.283178329467773, "global_step": 24323, "epoch": 201} {"train_loss": -30.310415267944336, "global_step": 24324, "epoch": 201} {"train_loss": -30.20574951171875, "global_step": 24325, "epoch": 201} {"train_loss": -29.70232582092285, "global_step": 24326, "epoch": 201} {"train_loss": -30.3323974609375, "global_step": 24327, "epoch": 201} {"train_loss": -30.19044303894043, "global_step": 24328, "epoch": 201} {"train_loss": -30.164270401000977, "global_step": 24329, "epoch": 201} {"train_loss": -30.498151779174805, "global_step": 24330, "epoch": 201} {"train_loss": -30.247217178344727, "global_step": 24331, "epoch": 201} {"train_loss": -30.144275665283203, "global_step": 24332, "epoch": 201} {"train_loss": -30.502063751220703, "global_step": 24333, "epoch": 201} {"train_loss": -30.36102294921875, "global_step": 24334, "epoch": 201} {"train_loss": -30.489608764648438, "global_step": 24335, "epoch": 201} {"train_loss": -29.837560653686523, "global_step": 24336, "epoch": 201} {"train_loss": -29.864484786987305, "global_step": 24337, "epoch": 201} {"train_loss": -30.079914093017578, "global_step": 24338, "epoch": 201} {"train_loss": -30.005207061767578, "global_step": 24339, "epoch": 201} {"train_loss": -30.102832794189453, "global_step": 24340, "epoch": 201} {"train_loss": -29.643091201782227, "global_step": 24341, "epoch": 201} {"train_loss": -30.244842529296875, "global_step": 24342, "epoch": 201} {"train_loss": -30.197986602783203, "global_step": 24343, "epoch": 201} {"train_loss": -28.55084800720215, "global_step": 24344, "epoch": 201} {"train_loss": -30.048572540283203, "global_step": 24345, "epoch": 201} {"train_loss": -30.128326416015625, "global_step": 24346, "epoch": 201} {"train_loss": -30.3001708984375, "global_step": 24347, "epoch": 201} {"train_loss": -30.090131759643555, "global_step": 24348, "epoch": 201} {"train_loss": -30.681482315063477, "global_step": 24349, "epoch": 201} {"train_loss": -30.178359985351562, "global_step": 24350, "epoch": 201} {"train_loss": -30.41425895690918, "global_step": 24351, "epoch": 201} {"train_loss": -30.831396102905273, "global_step": 24352, "epoch": 201} {"train_loss": -30.522321701049805, "global_step": 24353, "epoch": 201} {"train_loss": -30.26682472229004, "global_step": 24354, "epoch": 201} {"train_loss": -30.717676162719727, "global_step": 24355, "epoch": 201} {"train_loss": -31.003915786743164, "global_step": 24356, "epoch": 201} {"train_loss": -30.621322631835938, "global_step": 24357, "epoch": 201} {"train_loss": -30.504308700561523, "global_step": 24358, "epoch": 201} {"train_loss": -30.66987419128418, "global_step": 24359, "epoch": 201} {"train_loss": -30.48805046081543, "global_step": 24360, "epoch": 201} {"train_loss": -30.713659286499023, "global_step": 24361, "epoch": 201} {"train_loss": -30.62249183654785, "global_step": 24362, "epoch": 201} {"train_loss": -30.79352378845215, "global_step": 24363, "epoch": 201} {"train_loss": -30.94501304626465, "global_step": 24364, "epoch": 201} {"train_loss": -30.25800132751465, "global_step": 24365, "epoch": 201} {"train_loss": -30.415802001953125, "global_step": 24366, "epoch": 201} {"train_loss": -30.700408935546875, "global_step": 24367, "epoch": 201} {"train_loss": -30.592432022094727, "global_step": 24368, "epoch": 201} {"train_loss": -31.323352813720703, "global_step": 24369, "epoch": 201} {"train_loss": -30.764057159423828, "global_step": 24370, "epoch": 201} {"train_loss": -30.803638458251953, "global_step": 24371, "epoch": 201} {"train_loss": -30.8728084564209, "global_step": 24372, "epoch": 201} {"train_loss": -30.679059982299805, "global_step": 24373, "epoch": 201} {"train_loss": -31.3382568359375, "global_step": 24374, "epoch": 201} {"train_loss": -30.45942497253418, "global_step": 24375, "epoch": 201} {"train_loss": -30.7150821685791, "global_step": 24376, "epoch": 201} {"train_loss": -30.96917152404785, "global_step": 24377, "epoch": 201} {"train_loss": -30.515966415405273, "global_step": 24378, "epoch": 201} {"train_loss": -31.175207138061523, "global_step": 24379, "epoch": 201} {"train_loss": -30.510244369506836, "global_step": 24380, "epoch": 201} {"train_loss": -31.00850486755371, "global_step": 24381, "epoch": 201} {"train_loss": -31.268972396850586, "global_step": 24382, "epoch": 201} {"train_loss": -30.811426162719727, "global_step": 24383, "epoch": 201} {"train_loss": -30.681791305541992, "global_step": 24384, "epoch": 201} {"train_loss": -30.39936637878418, "global_step": 24385, "epoch": 201} {"train_loss": -30.604084014892578, "global_step": 24386, "epoch": 201} {"train_loss": -30.986486434936523, "global_step": 24387, "epoch": 201} {"train_loss": -30.647003173828125, "global_step": 24388, "epoch": 201} {"train_loss": -30.847888946533203, "global_step": 24389, "epoch": 201} {"train_loss": -30.647144317626953, "global_step": 24390, "epoch": 201} {"train_loss": -30.590579986572266, "global_step": 24391, "epoch": 201} {"train_loss": -30.30729103088379, "global_step": 24392, "epoch": 201} {"train_loss": -30.308256149291992, "global_step": 24393, "epoch": 201} {"train_loss": -30.70949363708496, "global_step": 24394, "epoch": 201} {"train_loss": -30.964618682861328, "global_step": 24395, "epoch": 201} {"train_loss": -30.41752052307129, "global_step": 24396, "epoch": 201} {"train_loss": -29.623029708862305, "global_step": 24397, "epoch": 201} {"train_loss": -29.12176513671875, "global_step": 24398, "epoch": 201} {"train_loss": -29.798980712890625, "global_step": 24399, "epoch": 201} {"train_loss": -31.05525016784668, "global_step": 24400, "epoch": 201} {"train_loss": -30.322729110717773, "global_step": 24401, "epoch": 201} {"train_loss": -28.971755981445312, "global_step": 24402, "epoch": 201} {"train_loss": -30.51226234436035, "global_step": 24403, "epoch": 201} {"train_loss": -30.804534912109375, "global_step": 24404, "epoch": 201} {"train_loss": -28.9593448638916, "global_step": 24405, "epoch": 201} {"train_loss": -29.866058349609375, "global_step": 24406, "epoch": 201} {"train_loss": -30.5933780670166, "global_step": 24407, "epoch": 201} {"train_loss": -28.98304557800293, "global_step": 24408, "epoch": 201} {"train_loss": -30.398822784423828, "global_step": 24409, "epoch": 201} {"train_loss": -30.503705978393555, "global_step": 24410, "epoch": 201} {"train_loss": -30.227758407592773, "global_step": 24411, "epoch": 201} {"train_loss": -30.74462890625, "global_step": 24412, "epoch": 201} {"train_loss": -29.843830108642578, "global_step": 24413, "epoch": 201} {"train_loss": -31.034162521362305, "global_step": 24414, "epoch": 201} {"train_loss": -29.40376853942871, "global_step": 24415, "epoch": 201} {"train_loss": -30.6494197845459, "global_step": 24416, "epoch": 201} {"train_loss": -30.40584373474121, "global_step": 24417, "epoch": 201} {"train_loss": -31.02890396118164, "global_step": 24418, "epoch": 201} {"train_loss": -30.385059356689453, "global_step": 24419, "epoch": 201} {"train_loss": -30.42671012878418, "global_step": 24420, "epoch": 201} {"train_loss": -30.766910552978516, "global_step": 24421, "epoch": 201} {"train_loss": -30.481260299682617, "global_step": 24422, "epoch": 201} {"train_loss": -30.806293487548828, "global_step": 24423, "epoch": 201} {"train_loss": -30.797082901000977, "global_step": 24424, "epoch": 201} {"train_loss": -30.439453125, "global_step": 24425, "epoch": 201} {"train_loss": -30.543176651000977, "global_step": 24426, "epoch": 201} {"train_loss": -31.001388549804688, "global_step": 24427, "epoch": 201} {"train_loss": -30.455413818359375, "global_step": 24428, "epoch": 201} {"train_loss": -30.989572525024414, "global_step": 24429, "epoch": 201} {"train_loss": -30.791433334350586, "global_step": 24430, "epoch": 201} {"train_loss": -30.77515983581543, "global_step": 24431, "epoch": 201} {"train_loss": -30.879247665405273, "global_step": 24432, "epoch": 201} {"train_loss": -30.206817626953125, "global_step": 24433, "epoch": 201} {"train_loss": -30.688873291015625, "global_step": 24434, "epoch": 201} {"train_loss": -30.8906307220459, "global_step": 24435, "epoch": 201} {"train_loss": -30.4306697845459, "global_step": 24436, "epoch": 201} {"train_loss": -30.987533569335938, "global_step": 24437, "epoch": 201} {"train_loss": -30.728225708007812, "global_step": 24438, "epoch": 201} {"train_loss": -30.498798370361328, "global_step": 24439, "epoch": 201} {"train_loss": -30.247760772705078, "global_step": 24440, "epoch": 201} {"train_loss": -30.447121155163472, "global_step": 24441, "epoch": 201, "val_loss": 2407819.5} {"train_loss": -31.007781982421875, "global_step": 24442, "epoch": 202} {"train_loss": -31.327539443969727, "global_step": 24443, "epoch": 202} {"train_loss": -31.021360397338867, "global_step": 24444, "epoch": 202} {"train_loss": -30.956586837768555, "global_step": 24445, "epoch": 202} {"train_loss": -31.301593780517578, "global_step": 24446, "epoch": 202} {"train_loss": -31.2783145904541, "global_step": 24447, "epoch": 202} {"train_loss": -31.67536735534668, "global_step": 24448, "epoch": 202} {"train_loss": -31.221906661987305, "global_step": 24449, "epoch": 202} {"train_loss": -31.302738189697266, "global_step": 24450, "epoch": 202} {"train_loss": -31.554197311401367, "global_step": 24451, "epoch": 202} {"train_loss": -31.499267578125, "global_step": 24452, "epoch": 202} {"train_loss": -31.894290924072266, "global_step": 24453, "epoch": 202} {"train_loss": -31.351184844970703, "global_step": 24454, "epoch": 202} {"train_loss": -31.367084503173828, "global_step": 24455, "epoch": 202} {"train_loss": -30.821063995361328, "global_step": 24456, "epoch": 202} {"train_loss": -31.702627182006836, "global_step": 24457, "epoch": 202} {"train_loss": -30.830121994018555, "global_step": 24458, "epoch": 202} {"train_loss": -31.161481857299805, "global_step": 24459, "epoch": 202} {"train_loss": -31.37147331237793, "global_step": 24460, "epoch": 202} {"train_loss": -31.438146591186523, "global_step": 24461, "epoch": 202} {"train_loss": -30.628570556640625, "global_step": 24462, "epoch": 202} {"train_loss": -31.278409957885742, "global_step": 24463, "epoch": 202} {"train_loss": -31.212839126586914, "global_step": 24464, "epoch": 202} {"train_loss": -30.998319625854492, "global_step": 24465, "epoch": 202} {"train_loss": -31.38685417175293, "global_step": 24466, "epoch": 202} {"train_loss": -30.914758682250977, "global_step": 24467, "epoch": 202} {"train_loss": -31.507429122924805, "global_step": 24468, "epoch": 202} {"train_loss": -31.678577423095703, "global_step": 24469, "epoch": 202} {"train_loss": -31.037189483642578, "global_step": 24470, "epoch": 202} {"train_loss": -31.50508689880371, "global_step": 24471, "epoch": 202} {"train_loss": -31.611190795898438, "global_step": 24472, "epoch": 202} {"train_loss": -30.679319381713867, "global_step": 24473, "epoch": 202} {"train_loss": -31.226713180541992, "global_step": 24474, "epoch": 202} {"train_loss": -31.619237899780273, "global_step": 24475, "epoch": 202} {"train_loss": -31.269683837890625, "global_step": 24476, "epoch": 202} {"train_loss": -31.009159088134766, "global_step": 24477, "epoch": 202} {"train_loss": -31.411029815673828, "global_step": 24478, "epoch": 202} {"train_loss": -31.578327178955078, "global_step": 24479, "epoch": 202} {"train_loss": -30.729129791259766, "global_step": 24480, "epoch": 202} {"train_loss": -31.415374755859375, "global_step": 24481, "epoch": 202} {"train_loss": -31.544677734375, "global_step": 24482, "epoch": 202} {"train_loss": -31.109182357788086, "global_step": 24483, "epoch": 202} {"train_loss": -29.908735275268555, "global_step": 24484, "epoch": 202} {"train_loss": -29.566272735595703, "global_step": 24485, "epoch": 202} {"train_loss": -25.09138298034668, "global_step": 24486, "epoch": 202} {"train_loss": -14.522233963012695, "global_step": 24487, "epoch": 202} {"train_loss": -11.387877464294434, "global_step": 24488, "epoch": 202} {"train_loss": -27.56801414489746, "global_step": 24489, "epoch": 202} {"train_loss": -25.93828773498535, "global_step": 24490, "epoch": 202} {"train_loss": -27.349628448486328, "global_step": 24491, "epoch": 202} {"train_loss": -25.060874938964844, "global_step": 24492, "epoch": 202} {"train_loss": -29.536584854125977, "global_step": 24493, "epoch": 202} {"train_loss": -25.762908935546875, "global_step": 24494, "epoch": 202} {"train_loss": -28.818784713745117, "global_step": 24495, "epoch": 202} {"train_loss": -28.482275009155273, "global_step": 24496, "epoch": 202} {"train_loss": -28.40254783630371, "global_step": 24497, "epoch": 202} {"train_loss": -28.040191650390625, "global_step": 24498, "epoch": 202} {"train_loss": -29.221960067749023, "global_step": 24499, "epoch": 202} {"train_loss": -28.27802085876465, "global_step": 24500, "epoch": 202} {"train_loss": -28.35479164123535, "global_step": 24501, "epoch": 202} {"train_loss": -29.478775024414062, "global_step": 24502, "epoch": 202} {"train_loss": -28.566364288330078, "global_step": 24503, "epoch": 202} {"train_loss": -30.489883422851562, "global_step": 24504, "epoch": 202} {"train_loss": -29.30366325378418, "global_step": 24505, "epoch": 202} {"train_loss": -28.543359756469727, "global_step": 24506, "epoch": 202} {"train_loss": -29.394012451171875, "global_step": 24507, "epoch": 202} {"train_loss": -28.44342613220215, "global_step": 24508, "epoch": 202} {"train_loss": -29.31928062438965, "global_step": 24509, "epoch": 202} {"train_loss": -29.748336791992188, "global_step": 24510, "epoch": 202} {"train_loss": -29.83526611328125, "global_step": 24511, "epoch": 202} {"train_loss": -29.91424560546875, "global_step": 24512, "epoch": 202} {"train_loss": -29.7718563079834, "global_step": 24513, "epoch": 202} {"train_loss": -29.710113525390625, "global_step": 24514, "epoch": 202} {"train_loss": -29.6879940032959, "global_step": 24515, "epoch": 202} {"train_loss": -30.364471435546875, "global_step": 24516, "epoch": 202} {"train_loss": -30.33094596862793, "global_step": 24517, "epoch": 202} {"train_loss": -29.953393936157227, "global_step": 24518, "epoch": 202} {"train_loss": -29.909048080444336, "global_step": 24519, "epoch": 202} {"train_loss": -30.036603927612305, "global_step": 24520, "epoch": 202} {"train_loss": -30.21381187438965, "global_step": 24521, "epoch": 202} {"train_loss": -30.172164916992188, "global_step": 24522, "epoch": 202} {"train_loss": -30.357141494750977, "global_step": 24523, "epoch": 202} {"train_loss": -29.78131675720215, "global_step": 24524, "epoch": 202} {"train_loss": -30.476659774780273, "global_step": 24525, "epoch": 202} {"train_loss": -30.68583106994629, "global_step": 24526, "epoch": 202} {"train_loss": -30.1451416015625, "global_step": 24527, "epoch": 202} {"train_loss": -30.893430709838867, "global_step": 24528, "epoch": 202} {"train_loss": -30.726276397705078, "global_step": 24529, "epoch": 202} {"train_loss": -30.052038192749023, "global_step": 24530, "epoch": 202} {"train_loss": -30.629270553588867, "global_step": 24531, "epoch": 202} {"train_loss": -30.49212646484375, "global_step": 24532, "epoch": 202} {"train_loss": -30.32728385925293, "global_step": 24533, "epoch": 202} {"train_loss": -30.576553344726562, "global_step": 24534, "epoch": 202} {"train_loss": -29.544645309448242, "global_step": 24535, "epoch": 202} {"train_loss": -29.80655288696289, "global_step": 24536, "epoch": 202} {"train_loss": -30.603796005249023, "global_step": 24537, "epoch": 202} {"train_loss": -30.10982322692871, "global_step": 24538, "epoch": 202} {"train_loss": -29.422327041625977, "global_step": 24539, "epoch": 202} {"train_loss": -30.57670021057129, "global_step": 24540, "epoch": 202} {"train_loss": -29.39536476135254, "global_step": 24541, "epoch": 202} {"train_loss": -29.037811279296875, "global_step": 24542, "epoch": 202} {"train_loss": -26.517526626586914, "global_step": 24543, "epoch": 202} {"train_loss": -18.335752487182617, "global_step": 24544, "epoch": 202} {"train_loss": -11.86108684539795, "global_step": 24545, "epoch": 202} {"train_loss": -15.29548168182373, "global_step": 24546, "epoch": 202} {"train_loss": -29.435028076171875, "global_step": 24547, "epoch": 202} {"train_loss": -21.1823787689209, "global_step": 24548, "epoch": 202} {"train_loss": -28.768783569335938, "global_step": 24549, "epoch": 202} {"train_loss": -25.191001892089844, "global_step": 24550, "epoch": 202} {"train_loss": -28.793310165405273, "global_step": 24551, "epoch": 202} {"train_loss": -27.004663467407227, "global_step": 24552, "epoch": 202} {"train_loss": -27.613149642944336, "global_step": 24553, "epoch": 202} {"train_loss": -29.015155792236328, "global_step": 24554, "epoch": 202} {"train_loss": -28.681440353393555, "global_step": 24555, "epoch": 202} {"train_loss": -27.53656005859375, "global_step": 24556, "epoch": 202} {"train_loss": -28.547119140625, "global_step": 24557, "epoch": 202} {"train_loss": -28.960241317749023, "global_step": 24558, "epoch": 202} {"train_loss": -28.902082443237305, "global_step": 24559, "epoch": 202} {"train_loss": -28.85662269592285, "global_step": 24560, "epoch": 202} {"train_loss": -28.994779586791992, "global_step": 24561, "epoch": 202} {"train_loss": -29.175840653663826, "global_step": 24562, "epoch": 202, "val_loss": 2539827.0} {"train_loss": -29.40984535217285, "global_step": 24563, "epoch": 203} {"train_loss": -29.49956703186035, "global_step": 24564, "epoch": 203} {"train_loss": -29.12575340270996, "global_step": 24565, "epoch": 203} {"train_loss": -29.243183135986328, "global_step": 24566, "epoch": 203} {"train_loss": -29.676511764526367, "global_step": 24567, "epoch": 203} {"train_loss": -29.82181167602539, "global_step": 24568, "epoch": 203} {"train_loss": -29.390838623046875, "global_step": 24569, "epoch": 203} {"train_loss": -29.76483726501465, "global_step": 24570, "epoch": 203} {"train_loss": -29.5492000579834, "global_step": 24571, "epoch": 203} {"train_loss": -29.5634765625, "global_step": 24572, "epoch": 203} {"train_loss": -29.815942764282227, "global_step": 24573, "epoch": 203} {"train_loss": -30.000822067260742, "global_step": 24574, "epoch": 203} {"train_loss": -30.375030517578125, "global_step": 24575, "epoch": 203} {"train_loss": -30.192401885986328, "global_step": 24576, "epoch": 203} {"train_loss": -30.23520851135254, "global_step": 24577, "epoch": 203} {"train_loss": -29.9512939453125, "global_step": 24578, "epoch": 203} {"train_loss": -30.5349063873291, "global_step": 24579, "epoch": 203} {"train_loss": -30.011892318725586, "global_step": 24580, "epoch": 203} {"train_loss": -29.926923751831055, "global_step": 24581, "epoch": 203} {"train_loss": -30.02667236328125, "global_step": 24582, "epoch": 203} {"train_loss": -30.434619903564453, "global_step": 24583, "epoch": 203} {"train_loss": -29.88407325744629, "global_step": 24584, "epoch": 203} {"train_loss": -30.833852767944336, "global_step": 24585, "epoch": 203} {"train_loss": -30.479633331298828, "global_step": 24586, "epoch": 203} {"train_loss": -30.245641708374023, "global_step": 24587, "epoch": 203} {"train_loss": -30.231367111206055, "global_step": 24588, "epoch": 203} {"train_loss": -30.435415267944336, "global_step": 24589, "epoch": 203} {"train_loss": -30.6881103515625, "global_step": 24590, "epoch": 203} {"train_loss": -30.441904067993164, "global_step": 24591, "epoch": 203} {"train_loss": -30.3710880279541, "global_step": 24592, "epoch": 203} {"train_loss": -30.620059967041016, "global_step": 24593, "epoch": 203} {"train_loss": -30.81146812438965, "global_step": 24594, "epoch": 203} {"train_loss": -29.580520629882812, "global_step": 24595, "epoch": 203} {"train_loss": -30.88911247253418, "global_step": 24596, "epoch": 203} {"train_loss": -30.452747344970703, "global_step": 24597, "epoch": 203} {"train_loss": -30.720239639282227, "global_step": 24598, "epoch": 203} {"train_loss": -29.92597770690918, "global_step": 24599, "epoch": 203} {"train_loss": -30.19488525390625, "global_step": 24600, "epoch": 203} {"train_loss": -30.240827560424805, "global_step": 24601, "epoch": 203} {"train_loss": -30.709131240844727, "global_step": 24602, "epoch": 203} {"train_loss": -30.5758113861084, "global_step": 24603, "epoch": 203} {"train_loss": -30.65020751953125, "global_step": 24604, "epoch": 203} {"train_loss": -30.452930450439453, "global_step": 24605, "epoch": 203} {"train_loss": -30.451461791992188, "global_step": 24606, "epoch": 203} {"train_loss": -30.74379539489746, "global_step": 24607, "epoch": 203} {"train_loss": -30.580183029174805, "global_step": 24608, "epoch": 203} {"train_loss": -30.78853416442871, "global_step": 24609, "epoch": 203} {"train_loss": -30.655948638916016, "global_step": 24610, "epoch": 203} {"train_loss": -30.7247314453125, "global_step": 24611, "epoch": 203} {"train_loss": -30.7335147857666, "global_step": 24612, "epoch": 203} {"train_loss": -30.79913902282715, "global_step": 24613, "epoch": 203} {"train_loss": -31.028905868530273, "global_step": 24614, "epoch": 203} {"train_loss": -30.247756958007812, "global_step": 24615, "epoch": 203} {"train_loss": -30.57120704650879, "global_step": 24616, "epoch": 203} {"train_loss": -30.76336669921875, "global_step": 24617, "epoch": 203} {"train_loss": -31.02559471130371, "global_step": 24618, "epoch": 203} {"train_loss": -31.200347900390625, "global_step": 24619, "epoch": 203} {"train_loss": -30.8846435546875, "global_step": 24620, "epoch": 203} {"train_loss": -31.105520248413086, "global_step": 24621, "epoch": 203} {"train_loss": -31.1822452545166, "global_step": 24622, "epoch": 203} {"train_loss": -31.127904891967773, "global_step": 24623, "epoch": 203} {"train_loss": -30.78168296813965, "global_step": 24624, "epoch": 203} {"train_loss": -30.738357543945312, "global_step": 24625, "epoch": 203} {"train_loss": -31.157392501831055, "global_step": 24626, "epoch": 203} {"train_loss": -31.14397621154785, "global_step": 24627, "epoch": 203} {"train_loss": -31.43827247619629, "global_step": 24628, "epoch": 203} {"train_loss": -31.412290573120117, "global_step": 24629, "epoch": 203} {"train_loss": -31.55405616760254, "global_step": 24630, "epoch": 203} {"train_loss": -30.784448623657227, "global_step": 24631, "epoch": 203} {"train_loss": -31.467687606811523, "global_step": 24632, "epoch": 203} {"train_loss": -31.072301864624023, "global_step": 24633, "epoch": 203} {"train_loss": -31.480932235717773, "global_step": 24634, "epoch": 203} {"train_loss": -31.46820640563965, "global_step": 24635, "epoch": 203} {"train_loss": -31.29280662536621, "global_step": 24636, "epoch": 203} {"train_loss": -30.871580123901367, "global_step": 24637, "epoch": 203} {"train_loss": -31.148273468017578, "global_step": 24638, "epoch": 203} {"train_loss": -31.070749282836914, "global_step": 24639, "epoch": 203} {"train_loss": -30.83115005493164, "global_step": 24640, "epoch": 203} {"train_loss": -31.533893585205078, "global_step": 24641, "epoch": 203} {"train_loss": -31.26932144165039, "global_step": 24642, "epoch": 203} {"train_loss": -31.423757553100586, "global_step": 24643, "epoch": 203} {"train_loss": -31.216970443725586, "global_step": 24644, "epoch": 203} {"train_loss": -30.037519454956055, "global_step": 24645, "epoch": 203} {"train_loss": -30.966405868530273, "global_step": 24646, "epoch": 203} {"train_loss": -31.11065101623535, "global_step": 24647, "epoch": 203} {"train_loss": -31.09153175354004, "global_step": 24648, "epoch": 203} {"train_loss": -30.860483169555664, "global_step": 24649, "epoch": 203} {"train_loss": -30.656925201416016, "global_step": 24650, "epoch": 203} {"train_loss": -31.244842529296875, "global_step": 24651, "epoch": 203} {"train_loss": -31.112476348876953, "global_step": 24652, "epoch": 203} {"train_loss": -30.72700309753418, "global_step": 24653, "epoch": 203} {"train_loss": -30.7629337310791, "global_step": 24654, "epoch": 203} {"train_loss": -31.54060173034668, "global_step": 24655, "epoch": 203} {"train_loss": -31.336400985717773, "global_step": 24656, "epoch": 203} {"train_loss": -30.973676681518555, "global_step": 24657, "epoch": 203} {"train_loss": -31.414194107055664, "global_step": 24658, "epoch": 203} {"train_loss": -31.036787033081055, "global_step": 24659, "epoch": 203} {"train_loss": -30.145544052124023, "global_step": 24660, "epoch": 203} {"train_loss": -30.732196807861328, "global_step": 24661, "epoch": 203} {"train_loss": -31.49627685546875, "global_step": 24662, "epoch": 203} {"train_loss": -31.101348876953125, "global_step": 24663, "epoch": 203} {"train_loss": -30.989124298095703, "global_step": 24664, "epoch": 203} {"train_loss": -31.52101707458496, "global_step": 24665, "epoch": 203} {"train_loss": -30.06005859375, "global_step": 24666, "epoch": 203} {"train_loss": -31.298959732055664, "global_step": 24667, "epoch": 203} {"train_loss": -30.26302146911621, "global_step": 24668, "epoch": 203} {"train_loss": -31.52752685546875, "global_step": 24669, "epoch": 203} {"train_loss": -30.608240127563477, "global_step": 24670, "epoch": 203} {"train_loss": -30.97883415222168, "global_step": 24671, "epoch": 203} {"train_loss": -30.78999137878418, "global_step": 24672, "epoch": 203} {"train_loss": -30.635229110717773, "global_step": 24673, "epoch": 203} {"train_loss": -31.100101470947266, "global_step": 24674, "epoch": 203} {"train_loss": -31.70722770690918, "global_step": 24675, "epoch": 203} {"train_loss": -30.9370174407959, "global_step": 24676, "epoch": 203} {"train_loss": -31.12076759338379, "global_step": 24677, "epoch": 203} {"train_loss": -31.184560775756836, "global_step": 24678, "epoch": 203} {"train_loss": -31.5848388671875, "global_step": 24679, "epoch": 203} {"train_loss": -30.83135414123535, "global_step": 24680, "epoch": 203} {"train_loss": -31.243467330932617, "global_step": 24681, "epoch": 203} {"train_loss": -31.338876724243164, "global_step": 24682, "epoch": 203} {"train_loss": -30.705347108446862, "global_step": 24683, "epoch": 203, "val_loss": 2590178.75} {"train_loss": -31.376108169555664, "global_step": 24684, "epoch": 204} {"train_loss": -31.365453720092773, "global_step": 24685, "epoch": 204} {"train_loss": -31.267614364624023, "global_step": 24686, "epoch": 204} {"train_loss": -31.7181396484375, "global_step": 24687, "epoch": 204} {"train_loss": -31.593597412109375, "global_step": 24688, "epoch": 204} {"train_loss": -31.36271095275879, "global_step": 24689, "epoch": 204} {"train_loss": -31.36834144592285, "global_step": 24690, "epoch": 204} {"train_loss": -31.762348175048828, "global_step": 24691, "epoch": 204} {"train_loss": -31.688810348510742, "global_step": 24692, "epoch": 204} {"train_loss": -31.242572784423828, "global_step": 24693, "epoch": 204} {"train_loss": -30.96243667602539, "global_step": 24694, "epoch": 204} {"train_loss": -29.19548988342285, "global_step": 24695, "epoch": 204} {"train_loss": -25.76909828186035, "global_step": 24696, "epoch": 204} {"train_loss": -21.053266525268555, "global_step": 24697, "epoch": 204} {"train_loss": -18.90224266052246, "global_step": 24698, "epoch": 204} {"train_loss": -24.464284896850586, "global_step": 24699, "epoch": 204} {"train_loss": -30.35553550720215, "global_step": 24700, "epoch": 204} {"train_loss": -23.468427658081055, "global_step": 24701, "epoch": 204} {"train_loss": -30.291181564331055, "global_step": 24702, "epoch": 204} {"train_loss": -27.88678550720215, "global_step": 24703, "epoch": 204} {"train_loss": -29.874847412109375, "global_step": 24704, "epoch": 204} {"train_loss": -29.955591201782227, "global_step": 24705, "epoch": 204} {"train_loss": -31.084232330322266, "global_step": 24706, "epoch": 204} {"train_loss": -29.981739044189453, "global_step": 24707, "epoch": 204} {"train_loss": -30.525192260742188, "global_step": 24708, "epoch": 204} {"train_loss": -30.948068618774414, "global_step": 24709, "epoch": 204} {"train_loss": -29.701831817626953, "global_step": 24710, "epoch": 204} {"train_loss": -30.837202072143555, "global_step": 24711, "epoch": 204} {"train_loss": -30.59687614440918, "global_step": 24712, "epoch": 204} {"train_loss": -30.404266357421875, "global_step": 24713, "epoch": 204} {"train_loss": -31.094263076782227, "global_step": 24714, "epoch": 204} {"train_loss": -31.218915939331055, "global_step": 24715, "epoch": 204} {"train_loss": -31.071378707885742, "global_step": 24716, "epoch": 204} {"train_loss": -30.811660766601562, "global_step": 24717, "epoch": 204} {"train_loss": -31.087194442749023, "global_step": 24718, "epoch": 204} {"train_loss": -31.38254165649414, "global_step": 24719, "epoch": 204} {"train_loss": -31.023365020751953, "global_step": 24720, "epoch": 204} {"train_loss": -30.907379150390625, "global_step": 24721, "epoch": 204} {"train_loss": -31.494781494140625, "global_step": 24722, "epoch": 204} {"train_loss": -31.267105102539062, "global_step": 24723, "epoch": 204} {"train_loss": -31.473773956298828, "global_step": 24724, "epoch": 204} {"train_loss": -31.452356338500977, "global_step": 24725, "epoch": 204} {"train_loss": -31.14637565612793, "global_step": 24726, "epoch": 204} {"train_loss": -31.799646377563477, "global_step": 24727, "epoch": 204} {"train_loss": -31.478412628173828, "global_step": 24728, "epoch": 204} {"train_loss": -31.64447593688965, "global_step": 24729, "epoch": 204} {"train_loss": -31.655719757080078, "global_step": 24730, "epoch": 204} {"train_loss": -31.49759292602539, "global_step": 24731, "epoch": 204} {"train_loss": -31.219812393188477, "global_step": 24732, "epoch": 204} {"train_loss": -31.491125106811523, "global_step": 24733, "epoch": 204} {"train_loss": -31.640216827392578, "global_step": 24734, "epoch": 204} {"train_loss": -30.329669952392578, "global_step": 24735, "epoch": 204} {"train_loss": -31.508886337280273, "global_step": 24736, "epoch": 204} {"train_loss": -30.601957321166992, "global_step": 24737, "epoch": 204} {"train_loss": -31.61378288269043, "global_step": 24738, "epoch": 204} {"train_loss": -30.75048828125, "global_step": 24739, "epoch": 204} {"train_loss": -31.0903263092041, "global_step": 24740, "epoch": 204} {"train_loss": -30.934247970581055, "global_step": 24741, "epoch": 204} {"train_loss": -31.088647842407227, "global_step": 24742, "epoch": 204} {"train_loss": -31.08013343811035, "global_step": 24743, "epoch": 204} {"train_loss": -30.7695369720459, "global_step": 24744, "epoch": 204} {"train_loss": -30.78973388671875, "global_step": 24745, "epoch": 204} {"train_loss": -30.29572105407715, "global_step": 24746, "epoch": 204} {"train_loss": -31.218652725219727, "global_step": 24747, "epoch": 204} {"train_loss": -31.170303344726562, "global_step": 24748, "epoch": 204} {"train_loss": -30.566457748413086, "global_step": 24749, "epoch": 204} {"train_loss": -31.397979736328125, "global_step": 24750, "epoch": 204} {"train_loss": -31.233060836791992, "global_step": 24751, "epoch": 204} {"train_loss": -31.400320053100586, "global_step": 24752, "epoch": 204} {"train_loss": -31.55475425720215, "global_step": 24753, "epoch": 204} {"train_loss": -31.178680419921875, "global_step": 24754, "epoch": 204} {"train_loss": -31.160511016845703, "global_step": 24755, "epoch": 204} {"train_loss": -30.50606346130371, "global_step": 24756, "epoch": 204} {"train_loss": -31.23003578186035, "global_step": 24757, "epoch": 204} {"train_loss": -31.70533561706543, "global_step": 24758, "epoch": 204} {"train_loss": -31.243818283081055, "global_step": 24759, "epoch": 204} {"train_loss": -30.643707275390625, "global_step": 24760, "epoch": 204} {"train_loss": -31.685504913330078, "global_step": 24761, "epoch": 204} {"train_loss": -31.217966079711914, "global_step": 24762, "epoch": 204} {"train_loss": -31.281707763671875, "global_step": 24763, "epoch": 204} {"train_loss": -31.2910099029541, "global_step": 24764, "epoch": 204} {"train_loss": -31.21363639831543, "global_step": 24765, "epoch": 204} {"train_loss": -30.546594619750977, "global_step": 24766, "epoch": 204} {"train_loss": -31.569854736328125, "global_step": 24767, "epoch": 204} {"train_loss": -31.199045181274414, "global_step": 24768, "epoch": 204} {"train_loss": -31.61773109436035, "global_step": 24769, "epoch": 204} {"train_loss": -31.014875411987305, "global_step": 24770, "epoch": 204} {"train_loss": -31.651594161987305, "global_step": 24771, "epoch": 204} {"train_loss": -30.750349044799805, "global_step": 24772, "epoch": 204} {"train_loss": -30.06036376953125, "global_step": 24773, "epoch": 204} {"train_loss": -31.51495361328125, "global_step": 24774, "epoch": 204} {"train_loss": -30.15032386779785, "global_step": 24775, "epoch": 204} {"train_loss": -31.34381103515625, "global_step": 24776, "epoch": 204} {"train_loss": -30.782123565673828, "global_step": 24777, "epoch": 204} {"train_loss": -31.534988403320312, "global_step": 24778, "epoch": 204} {"train_loss": -31.433446884155273, "global_step": 24779, "epoch": 204} {"train_loss": -31.311872482299805, "global_step": 24780, "epoch": 204} {"train_loss": -31.608184814453125, "global_step": 24781, "epoch": 204} {"train_loss": -31.41666030883789, "global_step": 24782, "epoch": 204} {"train_loss": -31.4797306060791, "global_step": 24783, "epoch": 204} {"train_loss": -30.38201332092285, "global_step": 24784, "epoch": 204} {"train_loss": -31.366025924682617, "global_step": 24785, "epoch": 204} {"train_loss": -31.193632125854492, "global_step": 24786, "epoch": 204} {"train_loss": -30.53680419921875, "global_step": 24787, "epoch": 204} {"train_loss": -29.85066032409668, "global_step": 24788, "epoch": 204} {"train_loss": -28.784290313720703, "global_step": 24789, "epoch": 204} {"train_loss": -29.551130294799805, "global_step": 24790, "epoch": 204} {"train_loss": -30.54084587097168, "global_step": 24791, "epoch": 204} {"train_loss": -29.65728187561035, "global_step": 24792, "epoch": 204} {"train_loss": -29.182035446166992, "global_step": 24793, "epoch": 204} {"train_loss": -30.73929786682129, "global_step": 24794, "epoch": 204} {"train_loss": -30.5053768157959, "global_step": 24795, "epoch": 204} {"train_loss": -30.48249626159668, "global_step": 24796, "epoch": 204} {"train_loss": -30.83723258972168, "global_step": 24797, "epoch": 204} {"train_loss": -30.544702529907227, "global_step": 24798, "epoch": 204} {"train_loss": -30.520673751831055, "global_step": 24799, "epoch": 204} {"train_loss": -31.7308406829834, "global_step": 24800, "epoch": 204} {"train_loss": -30.553831100463867, "global_step": 24801, "epoch": 204} {"train_loss": -29.639453887939453, "global_step": 24802, "epoch": 204} {"train_loss": -29.6497859954834, "global_step": 24803, "epoch": 204} {"train_loss": -30.582649120614548, "global_step": 24804, "epoch": 204, "val_loss": 2643188.75} {"train_loss": -29.926528930664062, "global_step": 24805, "epoch": 205} {"train_loss": -30.737218856811523, "global_step": 24806, "epoch": 205} {"train_loss": -29.403173446655273, "global_step": 24807, "epoch": 205} {"train_loss": -28.50811767578125, "global_step": 24808, "epoch": 205} {"train_loss": -30.696874618530273, "global_step": 24809, "epoch": 205} {"train_loss": -30.854389190673828, "global_step": 24810, "epoch": 205} {"train_loss": -28.89861488342285, "global_step": 24811, "epoch": 205} {"train_loss": -30.99238395690918, "global_step": 24812, "epoch": 205} {"train_loss": -30.629322052001953, "global_step": 24813, "epoch": 205} {"train_loss": -30.9326229095459, "global_step": 24814, "epoch": 205} {"train_loss": -30.27850914001465, "global_step": 24815, "epoch": 205} {"train_loss": -30.580493927001953, "global_step": 24816, "epoch": 205} {"train_loss": -30.731021881103516, "global_step": 24817, "epoch": 205} {"train_loss": -31.1856746673584, "global_step": 24818, "epoch": 205} {"train_loss": -31.305957794189453, "global_step": 24819, "epoch": 205} {"train_loss": -31.235370635986328, "global_step": 24820, "epoch": 205} {"train_loss": -31.269622802734375, "global_step": 24821, "epoch": 205} {"train_loss": -30.81494140625, "global_step": 24822, "epoch": 205} {"train_loss": -31.48193359375, "global_step": 24823, "epoch": 205} {"train_loss": -31.237768173217773, "global_step": 24824, "epoch": 205} {"train_loss": -31.110197067260742, "global_step": 24825, "epoch": 205} {"train_loss": -31.40180778503418, "global_step": 24826, "epoch": 205} {"train_loss": -31.44649314880371, "global_step": 24827, "epoch": 205} {"train_loss": -31.416595458984375, "global_step": 24828, "epoch": 205} {"train_loss": -31.467395782470703, "global_step": 24829, "epoch": 205} {"train_loss": -31.7073974609375, "global_step": 24830, "epoch": 205} {"train_loss": -30.98825454711914, "global_step": 24831, "epoch": 205} {"train_loss": -31.56867027282715, "global_step": 24832, "epoch": 205} {"train_loss": -31.383747100830078, "global_step": 24833, "epoch": 205} {"train_loss": -31.666208267211914, "global_step": 24834, "epoch": 205} {"train_loss": -31.977407455444336, "global_step": 24835, "epoch": 205} {"train_loss": -31.368650436401367, "global_step": 24836, "epoch": 205} {"train_loss": -31.72454833984375, "global_step": 24837, "epoch": 205} {"train_loss": -31.065296173095703, "global_step": 24838, "epoch": 205} {"train_loss": -32.05363082885742, "global_step": 24839, "epoch": 205} {"train_loss": -31.9997615814209, "global_step": 24840, "epoch": 205} {"train_loss": -31.508838653564453, "global_step": 24841, "epoch": 205} {"train_loss": -31.74677848815918, "global_step": 24842, "epoch": 205} {"train_loss": -31.218671798706055, "global_step": 24843, "epoch": 205} {"train_loss": -31.937055587768555, "global_step": 24844, "epoch": 205} {"train_loss": -31.931989669799805, "global_step": 24845, "epoch": 205} {"train_loss": -31.75190544128418, "global_step": 24846, "epoch": 205} {"train_loss": -31.650053024291992, "global_step": 24847, "epoch": 205} {"train_loss": -32.267330169677734, "global_step": 24848, "epoch": 205} {"train_loss": -31.85321617126465, "global_step": 24849, "epoch": 205} {"train_loss": -31.582971572875977, "global_step": 24850, "epoch": 205} {"train_loss": -32.14820098876953, "global_step": 24851, "epoch": 205} {"train_loss": -32.24724197387695, "global_step": 24852, "epoch": 205} {"train_loss": -31.98388671875, "global_step": 24853, "epoch": 205} {"train_loss": -31.298322677612305, "global_step": 24854, "epoch": 205} {"train_loss": -32.04193115234375, "global_step": 24855, "epoch": 205} {"train_loss": -32.11248016357422, "global_step": 24856, "epoch": 205} {"train_loss": -31.49627113342285, "global_step": 24857, "epoch": 205} {"train_loss": -31.802587509155273, "global_step": 24858, "epoch": 205} {"train_loss": -31.703845977783203, "global_step": 24859, "epoch": 205} {"train_loss": -31.9222354888916, "global_step": 24860, "epoch": 205} {"train_loss": -32.193817138671875, "global_step": 24861, "epoch": 205} {"train_loss": -31.503942489624023, "global_step": 24862, "epoch": 205} {"train_loss": -31.920608520507812, "global_step": 24863, "epoch": 205} {"train_loss": -31.594884872436523, "global_step": 24864, "epoch": 205} {"train_loss": -31.38312339782715, "global_step": 24865, "epoch": 205} {"train_loss": -32.36115646362305, "global_step": 24866, "epoch": 205} {"train_loss": -30.848377227783203, "global_step": 24867, "epoch": 205} {"train_loss": -31.120695114135742, "global_step": 24868, "epoch": 205} {"train_loss": -30.705474853515625, "global_step": 24869, "epoch": 205} {"train_loss": -30.476667404174805, "global_step": 24870, "epoch": 205} {"train_loss": -31.44476890563965, "global_step": 24871, "epoch": 205} {"train_loss": -30.023895263671875, "global_step": 24872, "epoch": 205} {"train_loss": -29.69422721862793, "global_step": 24873, "epoch": 205} {"train_loss": -30.51513671875, "global_step": 24874, "epoch": 205} {"train_loss": -28.617334365844727, "global_step": 24875, "epoch": 205} {"train_loss": -29.406888961791992, "global_step": 24876, "epoch": 205} {"train_loss": -29.70330238342285, "global_step": 24877, "epoch": 205} {"train_loss": -30.96384620666504, "global_step": 24878, "epoch": 205} {"train_loss": -31.248565673828125, "global_step": 24879, "epoch": 205} {"train_loss": -29.690725326538086, "global_step": 24880, "epoch": 205} {"train_loss": -29.716333389282227, "global_step": 24881, "epoch": 205} {"train_loss": -31.416894912719727, "global_step": 24882, "epoch": 205} {"train_loss": -30.756067276000977, "global_step": 24883, "epoch": 205} {"train_loss": -30.607526779174805, "global_step": 24884, "epoch": 205} {"train_loss": -31.171375274658203, "global_step": 24885, "epoch": 205} {"train_loss": -30.09514808654785, "global_step": 24886, "epoch": 205} {"train_loss": -30.573705673217773, "global_step": 24887, "epoch": 205} {"train_loss": -31.440750122070312, "global_step": 24888, "epoch": 205} {"train_loss": -30.857654571533203, "global_step": 24889, "epoch": 205} {"train_loss": -30.99493408203125, "global_step": 24890, "epoch": 205} {"train_loss": -30.628507614135742, "global_step": 24891, "epoch": 205} {"train_loss": -31.33928871154785, "global_step": 24892, "epoch": 205} {"train_loss": -30.935876846313477, "global_step": 24893, "epoch": 205} {"train_loss": -30.307159423828125, "global_step": 24894, "epoch": 205} {"train_loss": -31.659637451171875, "global_step": 24895, "epoch": 205} {"train_loss": -30.360340118408203, "global_step": 24896, "epoch": 205} {"train_loss": -30.562274932861328, "global_step": 24897, "epoch": 205} {"train_loss": -30.6424617767334, "global_step": 24898, "epoch": 205} {"train_loss": -31.271249771118164, "global_step": 24899, "epoch": 205} {"train_loss": -30.873401641845703, "global_step": 24900, "epoch": 205} {"train_loss": -30.48023796081543, "global_step": 24901, "epoch": 205} {"train_loss": -30.90463638305664, "global_step": 24902, "epoch": 205} {"train_loss": -31.149572372436523, "global_step": 24903, "epoch": 205} {"train_loss": -31.11236000061035, "global_step": 24904, "epoch": 205} {"train_loss": -30.85761833190918, "global_step": 24905, "epoch": 205} {"train_loss": -31.286468505859375, "global_step": 24906, "epoch": 205} {"train_loss": -30.657318115234375, "global_step": 24907, "epoch": 205} {"train_loss": -31.71172523498535, "global_step": 24908, "epoch": 205} {"train_loss": -31.110675811767578, "global_step": 24909, "epoch": 205} {"train_loss": -30.71392250061035, "global_step": 24910, "epoch": 205} {"train_loss": -31.2231502532959, "global_step": 24911, "epoch": 205} {"train_loss": -31.371856689453125, "global_step": 24912, "epoch": 205} {"train_loss": -31.163373947143555, "global_step": 24913, "epoch": 205} {"train_loss": -31.65500831604004, "global_step": 24914, "epoch": 205} {"train_loss": -31.546833038330078, "global_step": 24915, "epoch": 205} {"train_loss": -31.619543075561523, "global_step": 24916, "epoch": 205} {"train_loss": -31.50124168395996, "global_step": 24917, "epoch": 205} {"train_loss": -31.504247665405273, "global_step": 24918, "epoch": 205} {"train_loss": -31.17172622680664, "global_step": 24919, "epoch": 205} {"train_loss": -30.357406616210938, "global_step": 24920, "epoch": 205} {"train_loss": -30.96002769470215, "global_step": 24921, "epoch": 205} {"train_loss": -31.13138198852539, "global_step": 24922, "epoch": 205} {"train_loss": -31.67340087890625, "global_step": 24923, "epoch": 205} {"train_loss": -30.898059844970703, "global_step": 24924, "epoch": 205} {"train_loss": -31.094150164895808, "global_step": 24925, "epoch": 205, "val_loss": 2544558.25} {"train_loss": -31.63067054748535, "global_step": 24926, "epoch": 206} {"train_loss": -31.924823760986328, "global_step": 24927, "epoch": 206} {"train_loss": -31.7641544342041, "global_step": 24928, "epoch": 206} {"train_loss": -31.47222900390625, "global_step": 24929, "epoch": 206} {"train_loss": -31.741485595703125, "global_step": 24930, "epoch": 206} {"train_loss": -31.775711059570312, "global_step": 24931, "epoch": 206} {"train_loss": -31.8548641204834, "global_step": 24932, "epoch": 206} {"train_loss": -31.12810707092285, "global_step": 24933, "epoch": 206} {"train_loss": -30.68414878845215, "global_step": 24934, "epoch": 206} {"train_loss": -30.465015411376953, "global_step": 24935, "epoch": 206} {"train_loss": -31.8897705078125, "global_step": 24936, "epoch": 206} {"train_loss": -31.246597290039062, "global_step": 24937, "epoch": 206} {"train_loss": -30.08955192565918, "global_step": 24938, "epoch": 206} {"train_loss": -29.62723159790039, "global_step": 24939, "epoch": 206} {"train_loss": -32.08379364013672, "global_step": 24940, "epoch": 206} {"train_loss": -31.02215003967285, "global_step": 24941, "epoch": 206} {"train_loss": -30.927169799804688, "global_step": 24942, "epoch": 206} {"train_loss": -30.758527755737305, "global_step": 24943, "epoch": 206} {"train_loss": -31.2092342376709, "global_step": 24944, "epoch": 206} {"train_loss": -31.3325138092041, "global_step": 24945, "epoch": 206} {"train_loss": -31.873838424682617, "global_step": 24946, "epoch": 206} {"train_loss": -31.197647094726562, "global_step": 24947, "epoch": 206} {"train_loss": -31.6041316986084, "global_step": 24948, "epoch": 206} {"train_loss": -31.826765060424805, "global_step": 24949, "epoch": 206} {"train_loss": -31.321767807006836, "global_step": 24950, "epoch": 206} {"train_loss": -31.79888916015625, "global_step": 24951, "epoch": 206} {"train_loss": -31.822925567626953, "global_step": 24952, "epoch": 206} {"train_loss": -31.679086685180664, "global_step": 24953, "epoch": 206} {"train_loss": -31.38606834411621, "global_step": 24954, "epoch": 206} {"train_loss": -31.68385124206543, "global_step": 24955, "epoch": 206} {"train_loss": -32.106075286865234, "global_step": 24956, "epoch": 206} {"train_loss": -31.429040908813477, "global_step": 24957, "epoch": 206} {"train_loss": -31.86415672302246, "global_step": 24958, "epoch": 206} {"train_loss": -31.489337921142578, "global_step": 24959, "epoch": 206} {"train_loss": -31.958087921142578, "global_step": 24960, "epoch": 206} {"train_loss": -31.319761276245117, "global_step": 24961, "epoch": 206} {"train_loss": -31.999155044555664, "global_step": 24962, "epoch": 206} {"train_loss": -31.655166625976562, "global_step": 24963, "epoch": 206} {"train_loss": -32.220489501953125, "global_step": 24964, "epoch": 206} {"train_loss": -31.406696319580078, "global_step": 24965, "epoch": 206} {"train_loss": -31.56239128112793, "global_step": 24966, "epoch": 206} {"train_loss": -32.33728790283203, "global_step": 24967, "epoch": 206} {"train_loss": -31.704282760620117, "global_step": 24968, "epoch": 206} {"train_loss": -31.14312171936035, "global_step": 24969, "epoch": 206} {"train_loss": -32.21506881713867, "global_step": 24970, "epoch": 206} {"train_loss": -31.957874298095703, "global_step": 24971, "epoch": 206} {"train_loss": -31.693866729736328, "global_step": 24972, "epoch": 206} {"train_loss": -31.743988037109375, "global_step": 24973, "epoch": 206} {"train_loss": -32.13318634033203, "global_step": 24974, "epoch": 206} {"train_loss": -31.811614990234375, "global_step": 24975, "epoch": 206} {"train_loss": -32.19294357299805, "global_step": 24976, "epoch": 206} {"train_loss": -32.122352600097656, "global_step": 24977, "epoch": 206} {"train_loss": -30.226654052734375, "global_step": 24978, "epoch": 206} {"train_loss": -29.73722267150879, "global_step": 24979, "epoch": 206} {"train_loss": -31.766143798828125, "global_step": 24980, "epoch": 206} {"train_loss": -30.211912155151367, "global_step": 24981, "epoch": 206} {"train_loss": -30.938623428344727, "global_step": 24982, "epoch": 206} {"train_loss": -31.11638832092285, "global_step": 24983, "epoch": 206} {"train_loss": -28.631412506103516, "global_step": 24984, "epoch": 206} {"train_loss": -31.5233154296875, "global_step": 24985, "epoch": 206} {"train_loss": -30.441770553588867, "global_step": 24986, "epoch": 206} {"train_loss": -30.44366455078125, "global_step": 24987, "epoch": 206} {"train_loss": -30.7762508392334, "global_step": 24988, "epoch": 206} {"train_loss": -29.814533233642578, "global_step": 24989, "epoch": 206} {"train_loss": -28.688520431518555, "global_step": 24990, "epoch": 206} {"train_loss": -28.29787254333496, "global_step": 24991, "epoch": 206} {"train_loss": -29.294864654541016, "global_step": 24992, "epoch": 206} {"train_loss": -30.56525993347168, "global_step": 24993, "epoch": 206} {"train_loss": -30.341089248657227, "global_step": 24994, "epoch": 206} {"train_loss": -31.24269676208496, "global_step": 24995, "epoch": 206} {"train_loss": -28.958005905151367, "global_step": 24996, "epoch": 206} {"train_loss": -30.69197654724121, "global_step": 24997, "epoch": 206} {"train_loss": -31.39300537109375, "global_step": 24998, "epoch": 206} {"train_loss": -30.3409481048584, "global_step": 24999, "epoch": 206} {"train_loss": -30.850217819213867, "global_step": 25000, "epoch": 206} {"train_loss": -31.32098388671875, "global_step": 25001, "epoch": 206} {"train_loss": -31.388742446899414, "global_step": 25002, "epoch": 206} {"train_loss": -31.792394638061523, "global_step": 25003, "epoch": 206} {"train_loss": -31.362934112548828, "global_step": 25004, "epoch": 206} {"train_loss": -31.14935874938965, "global_step": 25005, "epoch": 206} {"train_loss": -31.47993278503418, "global_step": 25006, "epoch": 206} {"train_loss": -31.3116512298584, "global_step": 25007, "epoch": 206} {"train_loss": -31.502506256103516, "global_step": 25008, "epoch": 206} {"train_loss": -31.022464752197266, "global_step": 25009, "epoch": 206} {"train_loss": -30.474414825439453, "global_step": 25010, "epoch": 206} {"train_loss": -30.8598575592041, "global_step": 25011, "epoch": 206} {"train_loss": -29.9971923828125, "global_step": 25012, "epoch": 206} {"train_loss": -30.60951042175293, "global_step": 25013, "epoch": 206} {"train_loss": -30.519453048706055, "global_step": 25014, "epoch": 206} {"train_loss": -31.317779541015625, "global_step": 25015, "epoch": 206} {"train_loss": -31.19292640686035, "global_step": 25016, "epoch": 206} {"train_loss": -30.95429801940918, "global_step": 25017, "epoch": 206} {"train_loss": -31.075597763061523, "global_step": 25018, "epoch": 206} {"train_loss": -29.265676498413086, "global_step": 25019, "epoch": 206} {"train_loss": -31.718175888061523, "global_step": 25020, "epoch": 206} {"train_loss": -30.622159957885742, "global_step": 25021, "epoch": 206} {"train_loss": -29.896081924438477, "global_step": 25022, "epoch": 206} {"train_loss": -29.555389404296875, "global_step": 25023, "epoch": 206} {"train_loss": -30.622547149658203, "global_step": 25024, "epoch": 206} {"train_loss": -30.39493179321289, "global_step": 25025, "epoch": 206} {"train_loss": -29.78177261352539, "global_step": 25026, "epoch": 206} {"train_loss": -30.742761611938477, "global_step": 25027, "epoch": 206} {"train_loss": -30.71872329711914, "global_step": 25028, "epoch": 206} {"train_loss": -29.7979736328125, "global_step": 25029, "epoch": 206} {"train_loss": -31.157794952392578, "global_step": 25030, "epoch": 206} {"train_loss": -30.327106475830078, "global_step": 25031, "epoch": 206} {"train_loss": -29.55689811706543, "global_step": 25032, "epoch": 206} {"train_loss": -30.76348876953125, "global_step": 25033, "epoch": 206} {"train_loss": -30.559146881103516, "global_step": 25034, "epoch": 206} {"train_loss": -30.44752311706543, "global_step": 25035, "epoch": 206} {"train_loss": -31.37030029296875, "global_step": 25036, "epoch": 206} {"train_loss": -30.447057723999023, "global_step": 25037, "epoch": 206} {"train_loss": -31.64469337463379, "global_step": 25038, "epoch": 206} {"train_loss": -31.225797653198242, "global_step": 25039, "epoch": 206} {"train_loss": -29.738616943359375, "global_step": 25040, "epoch": 206} {"train_loss": -29.289264678955078, "global_step": 25041, "epoch": 206} {"train_loss": -28.704931259155273, "global_step": 25042, "epoch": 206} {"train_loss": -29.854719161987305, "global_step": 25043, "epoch": 206} {"train_loss": -30.59381675720215, "global_step": 25044, "epoch": 206} {"train_loss": -31.16143226623535, "global_step": 25045, "epoch": 206} {"train_loss": -30.976751800411005, "global_step": 25046, "epoch": 206, "val_loss": 2530445.25} {"train_loss": -31.06760597229004, "global_step": 25047, "epoch": 207} {"train_loss": -31.738067626953125, "global_step": 25048, "epoch": 207} {"train_loss": -31.27210807800293, "global_step": 25049, "epoch": 207} {"train_loss": -31.355045318603516, "global_step": 25050, "epoch": 207} {"train_loss": -31.1928768157959, "global_step": 25051, "epoch": 207} {"train_loss": -31.24358558654785, "global_step": 25052, "epoch": 207} {"train_loss": -31.779748916625977, "global_step": 25053, "epoch": 207} {"train_loss": -30.993127822875977, "global_step": 25054, "epoch": 207} {"train_loss": -31.9672794342041, "global_step": 25055, "epoch": 207} {"train_loss": -31.201196670532227, "global_step": 25056, "epoch": 207} {"train_loss": -31.594959259033203, "global_step": 25057, "epoch": 207} {"train_loss": -31.43212890625, "global_step": 25058, "epoch": 207} {"train_loss": -31.23541259765625, "global_step": 25059, "epoch": 207} {"train_loss": -31.71463394165039, "global_step": 25060, "epoch": 207} {"train_loss": -31.0593318939209, "global_step": 25061, "epoch": 207} {"train_loss": -32.21868133544922, "global_step": 25062, "epoch": 207} {"train_loss": -31.30716896057129, "global_step": 25063, "epoch": 207} {"train_loss": -31.20033073425293, "global_step": 25064, "epoch": 207} {"train_loss": -31.985624313354492, "global_step": 25065, "epoch": 207} {"train_loss": -30.662328720092773, "global_step": 25066, "epoch": 207} {"train_loss": -31.80426025390625, "global_step": 25067, "epoch": 207} {"train_loss": -30.5706844329834, "global_step": 25068, "epoch": 207} {"train_loss": -32.0289192199707, "global_step": 25069, "epoch": 207} {"train_loss": -31.193262100219727, "global_step": 25070, "epoch": 207} {"train_loss": -31.078588485717773, "global_step": 25071, "epoch": 207} {"train_loss": -31.817712783813477, "global_step": 25072, "epoch": 207} {"train_loss": -31.208417892456055, "global_step": 25073, "epoch": 207} {"train_loss": -32.111690521240234, "global_step": 25074, "epoch": 207} {"train_loss": -31.24720573425293, "global_step": 25075, "epoch": 207} {"train_loss": -31.7153377532959, "global_step": 25076, "epoch": 207} {"train_loss": -31.632293701171875, "global_step": 25077, "epoch": 207} {"train_loss": -32.047035217285156, "global_step": 25078, "epoch": 207} {"train_loss": -31.60959815979004, "global_step": 25079, "epoch": 207} {"train_loss": -30.83230972290039, "global_step": 25080, "epoch": 207} {"train_loss": -30.617767333984375, "global_step": 25081, "epoch": 207} {"train_loss": -31.198688507080078, "global_step": 25082, "epoch": 207} {"train_loss": -30.93259048461914, "global_step": 25083, "epoch": 207} {"train_loss": -31.47261619567871, "global_step": 25084, "epoch": 207} {"train_loss": -31.799047470092773, "global_step": 25085, "epoch": 207} {"train_loss": -31.6800537109375, "global_step": 25086, "epoch": 207} {"train_loss": -31.35196876525879, "global_step": 25087, "epoch": 207} {"train_loss": -31.759632110595703, "global_step": 25088, "epoch": 207} {"train_loss": -31.186880111694336, "global_step": 25089, "epoch": 207} {"train_loss": -29.848743438720703, "global_step": 25090, "epoch": 207} {"train_loss": -30.75943946838379, "global_step": 25091, "epoch": 207} {"train_loss": -31.662811279296875, "global_step": 25092, "epoch": 207} {"train_loss": -31.6468505859375, "global_step": 25093, "epoch": 207} {"train_loss": -29.867481231689453, "global_step": 25094, "epoch": 207} {"train_loss": -29.875593185424805, "global_step": 25095, "epoch": 207} {"train_loss": -31.751279830932617, "global_step": 25096, "epoch": 207} {"train_loss": -30.650854110717773, "global_step": 25097, "epoch": 207} {"train_loss": -28.123077392578125, "global_step": 25098, "epoch": 207} {"train_loss": -30.468839645385742, "global_step": 25099, "epoch": 207} {"train_loss": -31.79969596862793, "global_step": 25100, "epoch": 207} {"train_loss": -30.542932510375977, "global_step": 25101, "epoch": 207} {"train_loss": -29.653060913085938, "global_step": 25102, "epoch": 207} {"train_loss": -28.877416610717773, "global_step": 25103, "epoch": 207} {"train_loss": -31.24973487854004, "global_step": 25104, "epoch": 207} {"train_loss": -30.701074600219727, "global_step": 25105, "epoch": 207} {"train_loss": -31.125579833984375, "global_step": 25106, "epoch": 207} {"train_loss": -31.368976593017578, "global_step": 25107, "epoch": 207} {"train_loss": -31.53517723083496, "global_step": 25108, "epoch": 207} {"train_loss": -31.614728927612305, "global_step": 25109, "epoch": 207} {"train_loss": -31.39275550842285, "global_step": 25110, "epoch": 207} {"train_loss": -30.697906494140625, "global_step": 25111, "epoch": 207} {"train_loss": -31.031164169311523, "global_step": 25112, "epoch": 207} {"train_loss": -31.020923614501953, "global_step": 25113, "epoch": 207} {"train_loss": -30.945043563842773, "global_step": 25114, "epoch": 207} {"train_loss": -31.41493034362793, "global_step": 25115, "epoch": 207} {"train_loss": -30.750173568725586, "global_step": 25116, "epoch": 207} {"train_loss": -30.555301666259766, "global_step": 25117, "epoch": 207} {"train_loss": -30.936853408813477, "global_step": 25118, "epoch": 207} {"train_loss": -30.913190841674805, "global_step": 25119, "epoch": 207} {"train_loss": -31.44951820373535, "global_step": 25120, "epoch": 207} {"train_loss": -31.044591903686523, "global_step": 25121, "epoch": 207} {"train_loss": -31.681201934814453, "global_step": 25122, "epoch": 207} {"train_loss": -31.179365158081055, "global_step": 25123, "epoch": 207} {"train_loss": -30.791412353515625, "global_step": 25124, "epoch": 207} {"train_loss": -31.85135269165039, "global_step": 25125, "epoch": 207} {"train_loss": -31.230337142944336, "global_step": 25126, "epoch": 207} {"train_loss": -31.388906478881836, "global_step": 25127, "epoch": 207} {"train_loss": -31.85146141052246, "global_step": 25128, "epoch": 207} {"train_loss": -31.505247116088867, "global_step": 25129, "epoch": 207} {"train_loss": -31.593061447143555, "global_step": 25130, "epoch": 207} {"train_loss": -31.476898193359375, "global_step": 25131, "epoch": 207} {"train_loss": -31.70308494567871, "global_step": 25132, "epoch": 207} {"train_loss": -31.531192779541016, "global_step": 25133, "epoch": 207} {"train_loss": -31.723108291625977, "global_step": 25134, "epoch": 207} {"train_loss": -31.588308334350586, "global_step": 25135, "epoch": 207} {"train_loss": -31.74408531188965, "global_step": 25136, "epoch": 207} {"train_loss": -31.34743309020996, "global_step": 25137, "epoch": 207} {"train_loss": -31.7916316986084, "global_step": 25138, "epoch": 207} {"train_loss": -31.42669677734375, "global_step": 25139, "epoch": 207} {"train_loss": -31.37739372253418, "global_step": 25140, "epoch": 207} {"train_loss": -31.831113815307617, "global_step": 25141, "epoch": 207} {"train_loss": -31.394485473632812, "global_step": 25142, "epoch": 207} {"train_loss": -32.17718505859375, "global_step": 25143, "epoch": 207} {"train_loss": -31.802228927612305, "global_step": 25144, "epoch": 207} {"train_loss": -31.898834228515625, "global_step": 25145, "epoch": 207} {"train_loss": -32.01428985595703, "global_step": 25146, "epoch": 207} {"train_loss": -32.065731048583984, "global_step": 25147, "epoch": 207} {"train_loss": -32.030094146728516, "global_step": 25148, "epoch": 207} {"train_loss": -31.833423614501953, "global_step": 25149, "epoch": 207} {"train_loss": -31.834936141967773, "global_step": 25150, "epoch": 207} {"train_loss": -32.18244171142578, "global_step": 25151, "epoch": 207} {"train_loss": -32.650848388671875, "global_step": 25152, "epoch": 207} {"train_loss": -31.949935913085938, "global_step": 25153, "epoch": 207} {"train_loss": -32.464622497558594, "global_step": 25154, "epoch": 207} {"train_loss": -32.49361038208008, "global_step": 25155, "epoch": 207} {"train_loss": -32.14193344116211, "global_step": 25156, "epoch": 207} {"train_loss": -31.871931076049805, "global_step": 25157, "epoch": 207} {"train_loss": -31.43120765686035, "global_step": 25158, "epoch": 207} {"train_loss": -31.61810874938965, "global_step": 25159, "epoch": 207} {"train_loss": -32.20676803588867, "global_step": 25160, "epoch": 207} {"train_loss": -32.159854888916016, "global_step": 25161, "epoch": 207} {"train_loss": -31.70020866394043, "global_step": 25162, "epoch": 207} {"train_loss": -32.06011962890625, "global_step": 25163, "epoch": 207} {"train_loss": -31.498899459838867, "global_step": 25164, "epoch": 207} {"train_loss": -30.253082275390625, "global_step": 25165, "epoch": 207} {"train_loss": -31.110448837280273, "global_step": 25166, "epoch": 207} {"train_loss": -31.37065463420773, "global_step": 25167, "epoch": 207, "val_loss": 2532486.5} {"train_loss": -31.324817657470703, "global_step": 25168, "epoch": 208} {"train_loss": -32.31422424316406, "global_step": 25169, "epoch": 208} {"train_loss": -31.985349655151367, "global_step": 25170, "epoch": 208} {"train_loss": -32.4923095703125, "global_step": 25171, "epoch": 208} {"train_loss": -31.824247360229492, "global_step": 25172, "epoch": 208} {"train_loss": -31.548486709594727, "global_step": 25173, "epoch": 208} {"train_loss": -31.272668838500977, "global_step": 25174, "epoch": 208} {"train_loss": -31.156293869018555, "global_step": 25175, "epoch": 208} {"train_loss": -28.373777389526367, "global_step": 25176, "epoch": 208} {"train_loss": -18.22286033630371, "global_step": 25177, "epoch": 208} {"train_loss": -10.682818412780762, "global_step": 25178, "epoch": 208} {"train_loss": -24.015186309814453, "global_step": 25179, "epoch": 208} {"train_loss": -29.431562423706055, "global_step": 25180, "epoch": 208} {"train_loss": -18.698848724365234, "global_step": 25181, "epoch": 208} {"train_loss": -25.19118881225586, "global_step": 25182, "epoch": 208} {"train_loss": -23.542139053344727, "global_step": 25183, "epoch": 208} {"train_loss": -30.956134796142578, "global_step": 25184, "epoch": 208} {"train_loss": -27.56159019470215, "global_step": 25185, "epoch": 208} {"train_loss": -29.291242599487305, "global_step": 25186, "epoch": 208} {"train_loss": -29.846240997314453, "global_step": 25187, "epoch": 208} {"train_loss": -28.481061935424805, "global_step": 25188, "epoch": 208} {"train_loss": -30.120380401611328, "global_step": 25189, "epoch": 208} {"train_loss": -30.5389461517334, "global_step": 25190, "epoch": 208} {"train_loss": -29.262897491455078, "global_step": 25191, "epoch": 208} {"train_loss": -30.40143394470215, "global_step": 25192, "epoch": 208} {"train_loss": -30.360097885131836, "global_step": 25193, "epoch": 208} {"train_loss": -30.67884635925293, "global_step": 25194, "epoch": 208} {"train_loss": -29.70423698425293, "global_step": 25195, "epoch": 208} {"train_loss": -30.431182861328125, "global_step": 25196, "epoch": 208} {"train_loss": -30.33672523498535, "global_step": 25197, "epoch": 208} {"train_loss": -30.783361434936523, "global_step": 25198, "epoch": 208} {"train_loss": -30.39088249206543, "global_step": 25199, "epoch": 208} {"train_loss": -30.831008911132812, "global_step": 25200, "epoch": 208} {"train_loss": -30.94276237487793, "global_step": 25201, "epoch": 208} {"train_loss": -31.024707794189453, "global_step": 25202, "epoch": 208} {"train_loss": -30.369836807250977, "global_step": 25203, "epoch": 208} {"train_loss": -31.0667781829834, "global_step": 25204, "epoch": 208} {"train_loss": -30.58756446838379, "global_step": 25205, "epoch": 208} {"train_loss": -31.339801788330078, "global_step": 25206, "epoch": 208} {"train_loss": -30.954898834228516, "global_step": 25207, "epoch": 208} {"train_loss": -31.342615127563477, "global_step": 25208, "epoch": 208} {"train_loss": -30.742034912109375, "global_step": 25209, "epoch": 208} {"train_loss": -31.145517349243164, "global_step": 25210, "epoch": 208} {"train_loss": -30.9699649810791, "global_step": 25211, "epoch": 208} {"train_loss": -31.284347534179688, "global_step": 25212, "epoch": 208} {"train_loss": -31.3382625579834, "global_step": 25213, "epoch": 208} {"train_loss": -31.688268661499023, "global_step": 25214, "epoch": 208} {"train_loss": -30.98642921447754, "global_step": 25215, "epoch": 208} {"train_loss": -31.37312126159668, "global_step": 25216, "epoch": 208} {"train_loss": -30.79256248474121, "global_step": 25217, "epoch": 208} {"train_loss": -31.07172203063965, "global_step": 25218, "epoch": 208} {"train_loss": -31.102298736572266, "global_step": 25219, "epoch": 208} {"train_loss": -31.78434181213379, "global_step": 25220, "epoch": 208} {"train_loss": -31.33986473083496, "global_step": 25221, "epoch": 208} {"train_loss": -31.02259635925293, "global_step": 25222, "epoch": 208} {"train_loss": -31.48932456970215, "global_step": 25223, "epoch": 208} {"train_loss": -31.264612197875977, "global_step": 25224, "epoch": 208} {"train_loss": -31.013574600219727, "global_step": 25225, "epoch": 208} {"train_loss": -31.127979278564453, "global_step": 25226, "epoch": 208} {"train_loss": -31.243253707885742, "global_step": 25227, "epoch": 208} {"train_loss": -31.449798583984375, "global_step": 25228, "epoch": 208} {"train_loss": -31.131010055541992, "global_step": 25229, "epoch": 208} {"train_loss": -31.26473045349121, "global_step": 25230, "epoch": 208} {"train_loss": -31.108121871948242, "global_step": 25231, "epoch": 208} {"train_loss": -30.748554229736328, "global_step": 25232, "epoch": 208} {"train_loss": -31.734853744506836, "global_step": 25233, "epoch": 208} {"train_loss": -30.8385009765625, "global_step": 25234, "epoch": 208} {"train_loss": -31.12744140625, "global_step": 25235, "epoch": 208} {"train_loss": -31.695337295532227, "global_step": 25236, "epoch": 208} {"train_loss": -31.615554809570312, "global_step": 25237, "epoch": 208} {"train_loss": -31.586139678955078, "global_step": 25238, "epoch": 208} {"train_loss": -31.583343505859375, "global_step": 25239, "epoch": 208} {"train_loss": -31.72705078125, "global_step": 25240, "epoch": 208} {"train_loss": -31.222620010375977, "global_step": 25241, "epoch": 208} {"train_loss": -31.614099502563477, "global_step": 25242, "epoch": 208} {"train_loss": -31.82843589782715, "global_step": 25243, "epoch": 208} {"train_loss": -31.846799850463867, "global_step": 25244, "epoch": 208} {"train_loss": -31.477441787719727, "global_step": 25245, "epoch": 208} {"train_loss": -31.2036190032959, "global_step": 25246, "epoch": 208} {"train_loss": -31.085784912109375, "global_step": 25247, "epoch": 208} {"train_loss": -31.65799903869629, "global_step": 25248, "epoch": 208} {"train_loss": -31.3094539642334, "global_step": 25249, "epoch": 208} {"train_loss": -31.565998077392578, "global_step": 25250, "epoch": 208} {"train_loss": -31.295013427734375, "global_step": 25251, "epoch": 208} {"train_loss": -30.865209579467773, "global_step": 25252, "epoch": 208} {"train_loss": -30.094953536987305, "global_step": 25253, "epoch": 208} {"train_loss": -27.967077255249023, "global_step": 25254, "epoch": 208} {"train_loss": -23.946842193603516, "global_step": 25255, "epoch": 208} {"train_loss": -21.50895881652832, "global_step": 25256, "epoch": 208} {"train_loss": -25.475311279296875, "global_step": 25257, "epoch": 208} {"train_loss": -31.48390007019043, "global_step": 25258, "epoch": 208} {"train_loss": -29.125097274780273, "global_step": 25259, "epoch": 208} {"train_loss": -28.628992080688477, "global_step": 25260, "epoch": 208} {"train_loss": -30.90033531188965, "global_step": 25261, "epoch": 208} {"train_loss": -28.952838897705078, "global_step": 25262, "epoch": 208} {"train_loss": -31.2042236328125, "global_step": 25263, "epoch": 208} {"train_loss": -30.4912052154541, "global_step": 25264, "epoch": 208} {"train_loss": -30.383270263671875, "global_step": 25265, "epoch": 208} {"train_loss": -31.1237735748291, "global_step": 25266, "epoch": 208} {"train_loss": -29.904144287109375, "global_step": 25267, "epoch": 208} {"train_loss": -31.123401641845703, "global_step": 25268, "epoch": 208} {"train_loss": -30.754169464111328, "global_step": 25269, "epoch": 208} {"train_loss": -30.35352897644043, "global_step": 25270, "epoch": 208} {"train_loss": -30.89227867126465, "global_step": 25271, "epoch": 208} {"train_loss": -30.48125648498535, "global_step": 25272, "epoch": 208} {"train_loss": -30.83180809020996, "global_step": 25273, "epoch": 208} {"train_loss": -30.697174072265625, "global_step": 25274, "epoch": 208} {"train_loss": -31.18377685546875, "global_step": 25275, "epoch": 208} {"train_loss": -30.7150936126709, "global_step": 25276, "epoch": 208} {"train_loss": -30.449539184570312, "global_step": 25277, "epoch": 208} {"train_loss": -31.092594146728516, "global_step": 25278, "epoch": 208} {"train_loss": -31.025815963745117, "global_step": 25279, "epoch": 208} {"train_loss": -30.946517944335938, "global_step": 25280, "epoch": 208} {"train_loss": -31.714508056640625, "global_step": 25281, "epoch": 208} {"train_loss": -31.424365997314453, "global_step": 25282, "epoch": 208} {"train_loss": -31.190216064453125, "global_step": 25283, "epoch": 208} {"train_loss": -31.38277244567871, "global_step": 25284, "epoch": 208} {"train_loss": -31.578943252563477, "global_step": 25285, "epoch": 208} {"train_loss": -31.2820987701416, "global_step": 25286, "epoch": 208} {"train_loss": -31.497297286987305, "global_step": 25287, "epoch": 208} {"train_loss": -30.165332880887117, "global_step": 25288, "epoch": 208, "val_loss": 2699029.0} {"train_loss": -30.36809730529785, "global_step": 25289, "epoch": 209} {"train_loss": -31.422592163085938, "global_step": 25290, "epoch": 209} {"train_loss": -29.801252365112305, "global_step": 25291, "epoch": 209} {"train_loss": -29.273426055908203, "global_step": 25292, "epoch": 209} {"train_loss": -30.85868263244629, "global_step": 25293, "epoch": 209} {"train_loss": -30.6495361328125, "global_step": 25294, "epoch": 209} {"train_loss": -31.4466609954834, "global_step": 25295, "epoch": 209} {"train_loss": -31.027124404907227, "global_step": 25296, "epoch": 209} {"train_loss": -31.020017623901367, "global_step": 25297, "epoch": 209} {"train_loss": -31.165014266967773, "global_step": 25298, "epoch": 209} {"train_loss": -30.76087760925293, "global_step": 25299, "epoch": 209} {"train_loss": -31.299854278564453, "global_step": 25300, "epoch": 209} {"train_loss": -31.176361083984375, "global_step": 25301, "epoch": 209} {"train_loss": -31.137990951538086, "global_step": 25302, "epoch": 209} {"train_loss": -31.612268447875977, "global_step": 25303, "epoch": 209} {"train_loss": -31.904376983642578, "global_step": 25304, "epoch": 209} {"train_loss": -31.67424964904785, "global_step": 25305, "epoch": 209} {"train_loss": -30.833139419555664, "global_step": 25306, "epoch": 209} {"train_loss": -31.6647891998291, "global_step": 25307, "epoch": 209} {"train_loss": -31.971540451049805, "global_step": 25308, "epoch": 209} {"train_loss": -31.486669540405273, "global_step": 25309, "epoch": 209} {"train_loss": -31.21746826171875, "global_step": 25310, "epoch": 209} {"train_loss": -31.349853515625, "global_step": 25311, "epoch": 209} {"train_loss": -31.504901885986328, "global_step": 25312, "epoch": 209} {"train_loss": -31.30191421508789, "global_step": 25313, "epoch": 209} {"train_loss": -31.861072540283203, "global_step": 25314, "epoch": 209} {"train_loss": -31.245710372924805, "global_step": 25315, "epoch": 209} {"train_loss": -31.237991333007812, "global_step": 25316, "epoch": 209} {"train_loss": -31.4982852935791, "global_step": 25317, "epoch": 209} {"train_loss": -31.540851593017578, "global_step": 25318, "epoch": 209} {"train_loss": -31.692981719970703, "global_step": 25319, "epoch": 209} {"train_loss": -31.571256637573242, "global_step": 25320, "epoch": 209} {"train_loss": -31.144636154174805, "global_step": 25321, "epoch": 209} {"train_loss": -30.9963436126709, "global_step": 25322, "epoch": 209} {"train_loss": -31.545745849609375, "global_step": 25323, "epoch": 209} {"train_loss": -31.161222457885742, "global_step": 25324, "epoch": 209} {"train_loss": -31.07777214050293, "global_step": 25325, "epoch": 209} {"train_loss": -29.888837814331055, "global_step": 25326, "epoch": 209} {"train_loss": -30.33465576171875, "global_step": 25327, "epoch": 209} {"train_loss": -31.58669090270996, "global_step": 25328, "epoch": 209} {"train_loss": -31.635282516479492, "global_step": 25329, "epoch": 209} {"train_loss": -30.7155704498291, "global_step": 25330, "epoch": 209} {"train_loss": -31.408658981323242, "global_step": 25331, "epoch": 209} {"train_loss": -31.7734432220459, "global_step": 25332, "epoch": 209} {"train_loss": -30.705768585205078, "global_step": 25333, "epoch": 209} {"train_loss": -28.577070236206055, "global_step": 25334, "epoch": 209} {"train_loss": -30.232315063476562, "global_step": 25335, "epoch": 209} {"train_loss": -31.37088966369629, "global_step": 25336, "epoch": 209} {"train_loss": -31.3217716217041, "global_step": 25337, "epoch": 209} {"train_loss": -31.34122657775879, "global_step": 25338, "epoch": 209} {"train_loss": -31.005023956298828, "global_step": 25339, "epoch": 209} {"train_loss": -31.500497817993164, "global_step": 25340, "epoch": 209} {"train_loss": -31.224836349487305, "global_step": 25341, "epoch": 209} {"train_loss": -31.595640182495117, "global_step": 25342, "epoch": 209} {"train_loss": -31.330310821533203, "global_step": 25343, "epoch": 209} {"train_loss": -31.497175216674805, "global_step": 25344, "epoch": 209} {"train_loss": -31.649566650390625, "global_step": 25345, "epoch": 209} {"train_loss": -31.761768341064453, "global_step": 25346, "epoch": 209} {"train_loss": -31.078369140625, "global_step": 25347, "epoch": 209} {"train_loss": -31.572858810424805, "global_step": 25348, "epoch": 209} {"train_loss": -31.35516929626465, "global_step": 25349, "epoch": 209} {"train_loss": -31.680744171142578, "global_step": 25350, "epoch": 209} {"train_loss": -31.64817237854004, "global_step": 25351, "epoch": 209} {"train_loss": -31.16506004333496, "global_step": 25352, "epoch": 209} {"train_loss": -31.657461166381836, "global_step": 25353, "epoch": 209} {"train_loss": -31.57307243347168, "global_step": 25354, "epoch": 209} {"train_loss": -31.279550552368164, "global_step": 25355, "epoch": 209} {"train_loss": -31.774709701538086, "global_step": 25356, "epoch": 209} {"train_loss": -31.37994956970215, "global_step": 25357, "epoch": 209} {"train_loss": -31.47043800354004, "global_step": 25358, "epoch": 209} {"train_loss": -30.113754272460938, "global_step": 25359, "epoch": 209} {"train_loss": -31.776691436767578, "global_step": 25360, "epoch": 209} {"train_loss": -30.83969497680664, "global_step": 25361, "epoch": 209} {"train_loss": -31.291975021362305, "global_step": 25362, "epoch": 209} {"train_loss": -31.528467178344727, "global_step": 25363, "epoch": 209} {"train_loss": -31.566864013671875, "global_step": 25364, "epoch": 209} {"train_loss": -31.002735137939453, "global_step": 25365, "epoch": 209} {"train_loss": -31.31500244140625, "global_step": 25366, "epoch": 209} {"train_loss": -30.774316787719727, "global_step": 25367, "epoch": 209} {"train_loss": -30.945337295532227, "global_step": 25368, "epoch": 209} {"train_loss": -30.23646354675293, "global_step": 25369, "epoch": 209} {"train_loss": -28.623640060424805, "global_step": 25370, "epoch": 209} {"train_loss": -30.05828857421875, "global_step": 25371, "epoch": 209} {"train_loss": -30.573596954345703, "global_step": 25372, "epoch": 209} {"train_loss": -29.51885414123535, "global_step": 25373, "epoch": 209} {"train_loss": -31.270904541015625, "global_step": 25374, "epoch": 209} {"train_loss": -28.688016891479492, "global_step": 25375, "epoch": 209} {"train_loss": -31.321949005126953, "global_step": 25376, "epoch": 209} {"train_loss": -30.70416831970215, "global_step": 25377, "epoch": 209} {"train_loss": -29.10213279724121, "global_step": 25378, "epoch": 209} {"train_loss": -30.908716201782227, "global_step": 25379, "epoch": 209} {"train_loss": -30.579465866088867, "global_step": 25380, "epoch": 209} {"train_loss": -30.084074020385742, "global_step": 25381, "epoch": 209} {"train_loss": -30.910125732421875, "global_step": 25382, "epoch": 209} {"train_loss": -30.55405044555664, "global_step": 25383, "epoch": 209} {"train_loss": -30.77273941040039, "global_step": 25384, "epoch": 209} {"train_loss": -31.164260864257812, "global_step": 25385, "epoch": 209} {"train_loss": -31.36570167541504, "global_step": 25386, "epoch": 209} {"train_loss": -30.75360679626465, "global_step": 25387, "epoch": 209} {"train_loss": -31.690597534179688, "global_step": 25388, "epoch": 209} {"train_loss": -30.912796020507812, "global_step": 25389, "epoch": 209} {"train_loss": -30.646320343017578, "global_step": 25390, "epoch": 209} {"train_loss": -31.54352378845215, "global_step": 25391, "epoch": 209} {"train_loss": -31.106470108032227, "global_step": 25392, "epoch": 209} {"train_loss": -30.98602867126465, "global_step": 25393, "epoch": 209} {"train_loss": -30.996984481811523, "global_step": 25394, "epoch": 209} {"train_loss": -31.3997745513916, "global_step": 25395, "epoch": 209} {"train_loss": -31.12122917175293, "global_step": 25396, "epoch": 209} {"train_loss": -31.461029052734375, "global_step": 25397, "epoch": 209} {"train_loss": -30.82988929748535, "global_step": 25398, "epoch": 209} {"train_loss": -30.921573638916016, "global_step": 25399, "epoch": 209} {"train_loss": -31.088531494140625, "global_step": 25400, "epoch": 209} {"train_loss": -31.401330947875977, "global_step": 25401, "epoch": 209} {"train_loss": -30.570646286010742, "global_step": 25402, "epoch": 209} {"train_loss": -29.44158935546875, "global_step": 25403, "epoch": 209} {"train_loss": -29.177993774414062, "global_step": 25404, "epoch": 209} {"train_loss": -31.430744171142578, "global_step": 25405, "epoch": 209} {"train_loss": -31.584753036499023, "global_step": 25406, "epoch": 209} {"train_loss": -31.17194175720215, "global_step": 25407, "epoch": 209} {"train_loss": -31.151782989501953, "global_step": 25408, "epoch": 209} {"train_loss": -31.037080559848754, "global_step": 25409, "epoch": 209, "val_loss": 2530667.0} {"train_loss": -31.409543991088867, "global_step": 25410, "epoch": 210} {"train_loss": -30.99350357055664, "global_step": 25411, "epoch": 210} {"train_loss": -31.81275749206543, "global_step": 25412, "epoch": 210} {"train_loss": -31.36419677734375, "global_step": 25413, "epoch": 210} {"train_loss": -31.05634117126465, "global_step": 25414, "epoch": 210} {"train_loss": -31.925634384155273, "global_step": 25415, "epoch": 210} {"train_loss": -31.441024780273438, "global_step": 25416, "epoch": 210} {"train_loss": -31.357471466064453, "global_step": 25417, "epoch": 210} {"train_loss": -31.39105224609375, "global_step": 25418, "epoch": 210} {"train_loss": -31.949054718017578, "global_step": 25419, "epoch": 210} {"train_loss": -31.852100372314453, "global_step": 25420, "epoch": 210} {"train_loss": -31.483051300048828, "global_step": 25421, "epoch": 210} {"train_loss": -32.03812026977539, "global_step": 25422, "epoch": 210} {"train_loss": -32.03413009643555, "global_step": 25423, "epoch": 210} {"train_loss": -31.689802169799805, "global_step": 25424, "epoch": 210} {"train_loss": -31.231840133666992, "global_step": 25425, "epoch": 210} {"train_loss": -30.8232421875, "global_step": 25426, "epoch": 210} {"train_loss": -29.978174209594727, "global_step": 25427, "epoch": 210} {"train_loss": -31.483734130859375, "global_step": 25428, "epoch": 210} {"train_loss": -32.34130859375, "global_step": 25429, "epoch": 210} {"train_loss": -31.0650691986084, "global_step": 25430, "epoch": 210} {"train_loss": -30.6951904296875, "global_step": 25431, "epoch": 210} {"train_loss": -31.3210391998291, "global_step": 25432, "epoch": 210} {"train_loss": -31.616662979125977, "global_step": 25433, "epoch": 210} {"train_loss": -30.772008895874023, "global_step": 25434, "epoch": 210} {"train_loss": -30.81941032409668, "global_step": 25435, "epoch": 210} {"train_loss": -31.43427085876465, "global_step": 25436, "epoch": 210} {"train_loss": -30.415210723876953, "global_step": 25437, "epoch": 210} {"train_loss": -30.966659545898438, "global_step": 25438, "epoch": 210} {"train_loss": -31.198339462280273, "global_step": 25439, "epoch": 210} {"train_loss": -30.250919342041016, "global_step": 25440, "epoch": 210} {"train_loss": -30.8814754486084, "global_step": 25441, "epoch": 210} {"train_loss": -31.082763671875, "global_step": 25442, "epoch": 210} {"train_loss": -31.069910049438477, "global_step": 25443, "epoch": 210} {"train_loss": -31.15376853942871, "global_step": 25444, "epoch": 210} {"train_loss": -30.026697158813477, "global_step": 25445, "epoch": 210} {"train_loss": -30.614023208618164, "global_step": 25446, "epoch": 210} {"train_loss": -30.30362892150879, "global_step": 25447, "epoch": 210} {"train_loss": -29.9168701171875, "global_step": 25448, "epoch": 210} {"train_loss": -29.06106948852539, "global_step": 25449, "epoch": 210} {"train_loss": -27.7211971282959, "global_step": 25450, "epoch": 210} {"train_loss": -28.713220596313477, "global_step": 25451, "epoch": 210} {"train_loss": -29.7121639251709, "global_step": 25452, "epoch": 210} {"train_loss": -30.907827377319336, "global_step": 25453, "epoch": 210} {"train_loss": -31.249521255493164, "global_step": 25454, "epoch": 210} {"train_loss": -29.724191665649414, "global_step": 25455, "epoch": 210} {"train_loss": -29.509918212890625, "global_step": 25456, "epoch": 210} {"train_loss": -30.604169845581055, "global_step": 25457, "epoch": 210} {"train_loss": -31.085973739624023, "global_step": 25458, "epoch": 210} {"train_loss": -30.634763717651367, "global_step": 25459, "epoch": 210} {"train_loss": -31.28898048400879, "global_step": 25460, "epoch": 210} {"train_loss": -31.24513816833496, "global_step": 25461, "epoch": 210} {"train_loss": -31.23577308654785, "global_step": 25462, "epoch": 210} {"train_loss": -31.020294189453125, "global_step": 25463, "epoch": 210} {"train_loss": -31.671295166015625, "global_step": 25464, "epoch": 210} {"train_loss": -31.297332763671875, "global_step": 25465, "epoch": 210} {"train_loss": -31.600341796875, "global_step": 25466, "epoch": 210} {"train_loss": -30.931692123413086, "global_step": 25467, "epoch": 210} {"train_loss": -31.784961700439453, "global_step": 25468, "epoch": 210} {"train_loss": -30.86957359313965, "global_step": 25469, "epoch": 210} {"train_loss": -31.758438110351562, "global_step": 25470, "epoch": 210} {"train_loss": -31.891515731811523, "global_step": 25471, "epoch": 210} {"train_loss": -31.911945343017578, "global_step": 25472, "epoch": 210} {"train_loss": -31.9918212890625, "global_step": 25473, "epoch": 210} {"train_loss": -31.6743221282959, "global_step": 25474, "epoch": 210} {"train_loss": -32.269874572753906, "global_step": 25475, "epoch": 210} {"train_loss": -31.866968154907227, "global_step": 25476, "epoch": 210} {"train_loss": -31.962804794311523, "global_step": 25477, "epoch": 210} {"train_loss": -31.58405876159668, "global_step": 25478, "epoch": 210} {"train_loss": -31.73349380493164, "global_step": 25479, "epoch": 210} {"train_loss": -31.6842098236084, "global_step": 25480, "epoch": 210} {"train_loss": -31.974090576171875, "global_step": 25481, "epoch": 210} {"train_loss": -31.729877471923828, "global_step": 25482, "epoch": 210} {"train_loss": -31.509336471557617, "global_step": 25483, "epoch": 210} {"train_loss": -31.792865753173828, "global_step": 25484, "epoch": 210} {"train_loss": -31.89756202697754, "global_step": 25485, "epoch": 210} {"train_loss": -31.987060546875, "global_step": 25486, "epoch": 210} {"train_loss": -31.82329750061035, "global_step": 25487, "epoch": 210} {"train_loss": -31.470809936523438, "global_step": 25488, "epoch": 210} {"train_loss": -30.733280181884766, "global_step": 25489, "epoch": 210} {"train_loss": -31.096471786499023, "global_step": 25490, "epoch": 210} {"train_loss": -30.7064151763916, "global_step": 25491, "epoch": 210} {"train_loss": -30.607526779174805, "global_step": 25492, "epoch": 210} {"train_loss": -30.77327537536621, "global_step": 25493, "epoch": 210} {"train_loss": -31.094518661499023, "global_step": 25494, "epoch": 210} {"train_loss": -31.2078857421875, "global_step": 25495, "epoch": 210} {"train_loss": -31.65472984313965, "global_step": 25496, "epoch": 210} {"train_loss": -30.956586837768555, "global_step": 25497, "epoch": 210} {"train_loss": -30.2877254486084, "global_step": 25498, "epoch": 210} {"train_loss": -30.243091583251953, "global_step": 25499, "epoch": 210} {"train_loss": -31.184423446655273, "global_step": 25500, "epoch": 210} {"train_loss": -31.37116050720215, "global_step": 25501, "epoch": 210} {"train_loss": -30.63165855407715, "global_step": 25502, "epoch": 210} {"train_loss": -31.140165328979492, "global_step": 25503, "epoch": 210} {"train_loss": -31.466449737548828, "global_step": 25504, "epoch": 210} {"train_loss": -31.29143714904785, "global_step": 25505, "epoch": 210} {"train_loss": -31.67233657836914, "global_step": 25506, "epoch": 210} {"train_loss": -31.460412979125977, "global_step": 25507, "epoch": 210} {"train_loss": -31.61395263671875, "global_step": 25508, "epoch": 210} {"train_loss": -31.864410400390625, "global_step": 25509, "epoch": 210} {"train_loss": -31.66529655456543, "global_step": 25510, "epoch": 210} {"train_loss": -32.128631591796875, "global_step": 25511, "epoch": 210} {"train_loss": -31.5716609954834, "global_step": 25512, "epoch": 210} {"train_loss": -31.80353355407715, "global_step": 25513, "epoch": 210} {"train_loss": -32.2512092590332, "global_step": 25514, "epoch": 210} {"train_loss": -31.376855850219727, "global_step": 25515, "epoch": 210} {"train_loss": -31.852136611938477, "global_step": 25516, "epoch": 210} {"train_loss": -32.604393005371094, "global_step": 25517, "epoch": 210} {"train_loss": -31.874357223510742, "global_step": 25518, "epoch": 210} {"train_loss": -31.946714401245117, "global_step": 25519, "epoch": 210} {"train_loss": -31.833234786987305, "global_step": 25520, "epoch": 210} {"train_loss": -31.994873046875, "global_step": 25521, "epoch": 210} {"train_loss": -32.22624588012695, "global_step": 25522, "epoch": 210} {"train_loss": -32.015682220458984, "global_step": 25523, "epoch": 210} {"train_loss": -31.833587646484375, "global_step": 25524, "epoch": 210} {"train_loss": -31.979999542236328, "global_step": 25525, "epoch": 210} {"train_loss": -32.144229888916016, "global_step": 25526, "epoch": 210} {"train_loss": -32.22736740112305, "global_step": 25527, "epoch": 210} {"train_loss": -31.030004501342773, "global_step": 25528, "epoch": 210} {"train_loss": -31.859106063842773, "global_step": 25529, "epoch": 210} {"train_loss": -31.28106732013797, "global_step": 25530, "epoch": 210, "val_loss": 2562171.75} {"train_loss": -31.44980812072754, "global_step": 25531, "epoch": 211} {"train_loss": -31.591922760009766, "global_step": 25532, "epoch": 211} {"train_loss": -31.770517349243164, "global_step": 25533, "epoch": 211} {"train_loss": -31.768463134765625, "global_step": 25534, "epoch": 211} {"train_loss": -31.477237701416016, "global_step": 25535, "epoch": 211} {"train_loss": -31.54833984375, "global_step": 25536, "epoch": 211} {"train_loss": -31.407363891601562, "global_step": 25537, "epoch": 211} {"train_loss": -31.264997482299805, "global_step": 25538, "epoch": 211} {"train_loss": -30.52583885192871, "global_step": 25539, "epoch": 211} {"train_loss": -31.279266357421875, "global_step": 25540, "epoch": 211} {"train_loss": -30.849811553955078, "global_step": 25541, "epoch": 211} {"train_loss": -31.420608520507812, "global_step": 25542, "epoch": 211} {"train_loss": -31.50636863708496, "global_step": 25543, "epoch": 211} {"train_loss": -30.689544677734375, "global_step": 25544, "epoch": 211} {"train_loss": -31.89068031311035, "global_step": 25545, "epoch": 211} {"train_loss": -31.259876251220703, "global_step": 25546, "epoch": 211} {"train_loss": -31.79499626159668, "global_step": 25547, "epoch": 211} {"train_loss": -31.798627853393555, "global_step": 25548, "epoch": 211} {"train_loss": -31.6805419921875, "global_step": 25549, "epoch": 211} {"train_loss": -31.720722198486328, "global_step": 25550, "epoch": 211} {"train_loss": -31.794391632080078, "global_step": 25551, "epoch": 211} {"train_loss": -31.437671661376953, "global_step": 25552, "epoch": 211} {"train_loss": -31.452890396118164, "global_step": 25553, "epoch": 211} {"train_loss": -31.956613540649414, "global_step": 25554, "epoch": 211} {"train_loss": -32.20573043823242, "global_step": 25555, "epoch": 211} {"train_loss": -31.48526954650879, "global_step": 25556, "epoch": 211} {"train_loss": -32.099910736083984, "global_step": 25557, "epoch": 211} {"train_loss": -31.18427085876465, "global_step": 25558, "epoch": 211} {"train_loss": -30.593612670898438, "global_step": 25559, "epoch": 211} {"train_loss": -30.7868709564209, "global_step": 25560, "epoch": 211} {"train_loss": -30.240741729736328, "global_step": 25561, "epoch": 211} {"train_loss": -29.168710708618164, "global_step": 25562, "epoch": 211} {"train_loss": -30.65437126159668, "global_step": 25563, "epoch": 211} {"train_loss": -31.53133201599121, "global_step": 25564, "epoch": 211} {"train_loss": -32.136566162109375, "global_step": 25565, "epoch": 211} {"train_loss": -30.8061580657959, "global_step": 25566, "epoch": 211} {"train_loss": -30.20012855529785, "global_step": 25567, "epoch": 211} {"train_loss": -31.217681884765625, "global_step": 25568, "epoch": 211} {"train_loss": -31.610980987548828, "global_step": 25569, "epoch": 211} {"train_loss": -31.505563735961914, "global_step": 25570, "epoch": 211} {"train_loss": -31.59758949279785, "global_step": 25571, "epoch": 211} {"train_loss": -29.470075607299805, "global_step": 25572, "epoch": 211} {"train_loss": -29.035812377929688, "global_step": 25573, "epoch": 211} {"train_loss": -31.351181030273438, "global_step": 25574, "epoch": 211} {"train_loss": -31.40250015258789, "global_step": 25575, "epoch": 211} {"train_loss": -30.25531578063965, "global_step": 25576, "epoch": 211} {"train_loss": -30.129724502563477, "global_step": 25577, "epoch": 211} {"train_loss": -31.808181762695312, "global_step": 25578, "epoch": 211} {"train_loss": -31.675434112548828, "global_step": 25579, "epoch": 211} {"train_loss": -31.169904708862305, "global_step": 25580, "epoch": 211} {"train_loss": -31.7145938873291, "global_step": 25581, "epoch": 211} {"train_loss": -31.45718765258789, "global_step": 25582, "epoch": 211} {"train_loss": -31.3470401763916, "global_step": 25583, "epoch": 211} {"train_loss": -31.406522750854492, "global_step": 25584, "epoch": 211} {"train_loss": -31.603958129882812, "global_step": 25585, "epoch": 211} {"train_loss": -31.529605865478516, "global_step": 25586, "epoch": 211} {"train_loss": -31.94196891784668, "global_step": 25587, "epoch": 211} {"train_loss": -31.317752838134766, "global_step": 25588, "epoch": 211} {"train_loss": -31.60733985900879, "global_step": 25589, "epoch": 211} {"train_loss": -31.078083038330078, "global_step": 25590, "epoch": 211} {"train_loss": -31.60971450805664, "global_step": 25591, "epoch": 211} {"train_loss": -32.0839729309082, "global_step": 25592, "epoch": 211} {"train_loss": -31.304685592651367, "global_step": 25593, "epoch": 211} {"train_loss": -31.408050537109375, "global_step": 25594, "epoch": 211} {"train_loss": -32.036685943603516, "global_step": 25595, "epoch": 211} {"train_loss": -31.766117095947266, "global_step": 25596, "epoch": 211} {"train_loss": -31.843048095703125, "global_step": 25597, "epoch": 211} {"train_loss": -31.800451278686523, "global_step": 25598, "epoch": 211} {"train_loss": -31.96552085876465, "global_step": 25599, "epoch": 211} {"train_loss": -32.496803283691406, "global_step": 25600, "epoch": 211} {"train_loss": -31.5255126953125, "global_step": 25601, "epoch": 211} {"train_loss": -31.80242919921875, "global_step": 25602, "epoch": 211} {"train_loss": -32.29905319213867, "global_step": 25603, "epoch": 211} {"train_loss": -32.22653579711914, "global_step": 25604, "epoch": 211} {"train_loss": -32.547054290771484, "global_step": 25605, "epoch": 211} {"train_loss": -32.1276969909668, "global_step": 25606, "epoch": 211} {"train_loss": -32.319610595703125, "global_step": 25607, "epoch": 211} {"train_loss": -32.13812255859375, "global_step": 25608, "epoch": 211} {"train_loss": -31.35527992248535, "global_step": 25609, "epoch": 211} {"train_loss": -29.976903915405273, "global_step": 25610, "epoch": 211} {"train_loss": -31.17677116394043, "global_step": 25611, "epoch": 211} {"train_loss": -30.997678756713867, "global_step": 25612, "epoch": 211} {"train_loss": -31.735517501831055, "global_step": 25613, "epoch": 211} {"train_loss": -32.56349182128906, "global_step": 25614, "epoch": 211} {"train_loss": -31.81146240234375, "global_step": 25615, "epoch": 211} {"train_loss": -31.145421981811523, "global_step": 25616, "epoch": 211} {"train_loss": -32.55056381225586, "global_step": 25617, "epoch": 211} {"train_loss": -32.23523712158203, "global_step": 25618, "epoch": 211} {"train_loss": -31.614933013916016, "global_step": 25619, "epoch": 211} {"train_loss": -30.869123458862305, "global_step": 25620, "epoch": 211} {"train_loss": -31.972822189331055, "global_step": 25621, "epoch": 211} {"train_loss": -32.18134307861328, "global_step": 25622, "epoch": 211} {"train_loss": -31.38282585144043, "global_step": 25623, "epoch": 211} {"train_loss": -32.00643539428711, "global_step": 25624, "epoch": 211} {"train_loss": -32.017982482910156, "global_step": 25625, "epoch": 211} {"train_loss": -31.17371940612793, "global_step": 25626, "epoch": 211} {"train_loss": -31.913293838500977, "global_step": 25627, "epoch": 211} {"train_loss": -31.676740646362305, "global_step": 25628, "epoch": 211} {"train_loss": -31.716516494750977, "global_step": 25629, "epoch": 211} {"train_loss": -31.429174423217773, "global_step": 25630, "epoch": 211} {"train_loss": -30.742252349853516, "global_step": 25631, "epoch": 211} {"train_loss": -31.821706771850586, "global_step": 25632, "epoch": 211} {"train_loss": -31.584552764892578, "global_step": 25633, "epoch": 211} {"train_loss": -31.76006507873535, "global_step": 25634, "epoch": 211} {"train_loss": -31.9691104888916, "global_step": 25635, "epoch": 211} {"train_loss": -30.218585968017578, "global_step": 25636, "epoch": 211} {"train_loss": -28.460721969604492, "global_step": 25637, "epoch": 211} {"train_loss": -26.182621002197266, "global_step": 25638, "epoch": 211} {"train_loss": -27.244474411010742, "global_step": 25639, "epoch": 211} {"train_loss": -31.293542861938477, "global_step": 25640, "epoch": 211} {"train_loss": -29.192523956298828, "global_step": 25641, "epoch": 211} {"train_loss": -29.42323112487793, "global_step": 25642, "epoch": 211} {"train_loss": -30.548852920532227, "global_step": 25643, "epoch": 211} {"train_loss": -30.59404945373535, "global_step": 25644, "epoch": 211} {"train_loss": -31.274534225463867, "global_step": 25645, "epoch": 211} {"train_loss": -30.568220138549805, "global_step": 25646, "epoch": 211} {"train_loss": -30.379846572875977, "global_step": 25647, "epoch": 211} {"train_loss": -30.708148956298828, "global_step": 25648, "epoch": 211} {"train_loss": -31.3125, "global_step": 25649, "epoch": 211} {"train_loss": -30.622573852539062, "global_step": 25650, "epoch": 211} {"train_loss": -31.26966145412981, "global_step": 25651, "epoch": 211, "val_loss": 2570562.5} {"train_loss": -31.363967895507812, "global_step": 25652, "epoch": 212} {"train_loss": -30.547565460205078, "global_step": 25653, "epoch": 212} {"train_loss": -30.95942497253418, "global_step": 25654, "epoch": 212} {"train_loss": -31.589527130126953, "global_step": 25655, "epoch": 212} {"train_loss": -31.3293399810791, "global_step": 25656, "epoch": 212} {"train_loss": -30.448755264282227, "global_step": 25657, "epoch": 212} {"train_loss": -31.096826553344727, "global_step": 25658, "epoch": 212} {"train_loss": -30.990827560424805, "global_step": 25659, "epoch": 212} {"train_loss": -30.713891983032227, "global_step": 25660, "epoch": 212} {"train_loss": -30.50042152404785, "global_step": 25661, "epoch": 212} {"train_loss": -31.18397331237793, "global_step": 25662, "epoch": 212} {"train_loss": -31.857847213745117, "global_step": 25663, "epoch": 212} {"train_loss": -30.85123634338379, "global_step": 25664, "epoch": 212} {"train_loss": -30.73554801940918, "global_step": 25665, "epoch": 212} {"train_loss": -31.046899795532227, "global_step": 25666, "epoch": 212} {"train_loss": -30.000741958618164, "global_step": 25667, "epoch": 212} {"train_loss": -31.494230270385742, "global_step": 25668, "epoch": 212} {"train_loss": -30.386798858642578, "global_step": 25669, "epoch": 212} {"train_loss": -31.386432647705078, "global_step": 25670, "epoch": 212} {"train_loss": -29.54481315612793, "global_step": 25671, "epoch": 212} {"train_loss": -30.323505401611328, "global_step": 25672, "epoch": 212} {"train_loss": -30.663009643554688, "global_step": 25673, "epoch": 212} {"train_loss": -30.123884201049805, "global_step": 25674, "epoch": 212} {"train_loss": -31.38386344909668, "global_step": 25675, "epoch": 212} {"train_loss": -31.21295738220215, "global_step": 25676, "epoch": 212} {"train_loss": -31.126678466796875, "global_step": 25677, "epoch": 212} {"train_loss": -31.4019775390625, "global_step": 25678, "epoch": 212} {"train_loss": -31.46624183654785, "global_step": 25679, "epoch": 212} {"train_loss": -31.848119735717773, "global_step": 25680, "epoch": 212} {"train_loss": -31.33807373046875, "global_step": 25681, "epoch": 212} {"train_loss": -31.765625, "global_step": 25682, "epoch": 212} {"train_loss": -31.156137466430664, "global_step": 25683, "epoch": 212} {"train_loss": -31.96894645690918, "global_step": 25684, "epoch": 212} {"train_loss": -31.72247886657715, "global_step": 25685, "epoch": 212} {"train_loss": -31.1143741607666, "global_step": 25686, "epoch": 212} {"train_loss": -31.498701095581055, "global_step": 25687, "epoch": 212} {"train_loss": -31.801544189453125, "global_step": 25688, "epoch": 212} {"train_loss": -31.642065048217773, "global_step": 25689, "epoch": 212} {"train_loss": -32.17361068725586, "global_step": 25690, "epoch": 212} {"train_loss": -31.631574630737305, "global_step": 25691, "epoch": 212} {"train_loss": -31.18096923828125, "global_step": 25692, "epoch": 212} {"train_loss": -31.616369247436523, "global_step": 25693, "epoch": 212} {"train_loss": -31.446521759033203, "global_step": 25694, "epoch": 212} {"train_loss": -31.6816349029541, "global_step": 25695, "epoch": 212} {"train_loss": -31.564313888549805, "global_step": 25696, "epoch": 212} {"train_loss": -31.929763793945312, "global_step": 25697, "epoch": 212} {"train_loss": -31.979328155517578, "global_step": 25698, "epoch": 212} {"train_loss": -31.91448974609375, "global_step": 25699, "epoch": 212} {"train_loss": -31.52728843688965, "global_step": 25700, "epoch": 212} {"train_loss": -31.0580997467041, "global_step": 25701, "epoch": 212} {"train_loss": -30.090045928955078, "global_step": 25702, "epoch": 212} {"train_loss": -31.014047622680664, "global_step": 25703, "epoch": 212} {"train_loss": -31.2353515625, "global_step": 25704, "epoch": 212} {"train_loss": -31.50266456604004, "global_step": 25705, "epoch": 212} {"train_loss": -31.063684463500977, "global_step": 25706, "epoch": 212} {"train_loss": -30.8557186126709, "global_step": 25707, "epoch": 212} {"train_loss": -31.39695167541504, "global_step": 25708, "epoch": 212} {"train_loss": -32.06474685668945, "global_step": 25709, "epoch": 212} {"train_loss": -31.00394058227539, "global_step": 25710, "epoch": 212} {"train_loss": -31.02887535095215, "global_step": 25711, "epoch": 212} {"train_loss": -32.13304138183594, "global_step": 25712, "epoch": 212} {"train_loss": -31.319726943969727, "global_step": 25713, "epoch": 212} {"train_loss": -31.01844596862793, "global_step": 25714, "epoch": 212} {"train_loss": -31.47574234008789, "global_step": 25715, "epoch": 212} {"train_loss": -31.869714736938477, "global_step": 25716, "epoch": 212} {"train_loss": -31.8555965423584, "global_step": 25717, "epoch": 212} {"train_loss": -30.91511344909668, "global_step": 25718, "epoch": 212} {"train_loss": -31.539794921875, "global_step": 25719, "epoch": 212} {"train_loss": -31.5224552154541, "global_step": 25720, "epoch": 212} {"train_loss": -32.00334167480469, "global_step": 25721, "epoch": 212} {"train_loss": -31.2425537109375, "global_step": 25722, "epoch": 212} {"train_loss": -31.043781280517578, "global_step": 25723, "epoch": 212} {"train_loss": -31.92243003845215, "global_step": 25724, "epoch": 212} {"train_loss": -31.994306564331055, "global_step": 25725, "epoch": 212} {"train_loss": -31.538339614868164, "global_step": 25726, "epoch": 212} {"train_loss": -31.76495361328125, "global_step": 25727, "epoch": 212} {"train_loss": -32.19961929321289, "global_step": 25728, "epoch": 212} {"train_loss": -31.680219650268555, "global_step": 25729, "epoch": 212} {"train_loss": -31.48663902282715, "global_step": 25730, "epoch": 212} {"train_loss": -32.00590515136719, "global_step": 25731, "epoch": 212} {"train_loss": -31.734027862548828, "global_step": 25732, "epoch": 212} {"train_loss": -32.09507369995117, "global_step": 25733, "epoch": 212} {"train_loss": -31.109220504760742, "global_step": 25734, "epoch": 212} {"train_loss": -30.784591674804688, "global_step": 25735, "epoch": 212} {"train_loss": -28.89478874206543, "global_step": 25736, "epoch": 212} {"train_loss": -26.58588981628418, "global_step": 25737, "epoch": 212} {"train_loss": -20.906911849975586, "global_step": 25738, "epoch": 212} {"train_loss": -15.3927001953125, "global_step": 25739, "epoch": 212} {"train_loss": -20.750967025756836, "global_step": 25740, "epoch": 212} {"train_loss": -30.21941566467285, "global_step": 25741, "epoch": 212} {"train_loss": -21.674293518066406, "global_step": 25742, "epoch": 212} {"train_loss": -29.710668563842773, "global_step": 25743, "epoch": 212} {"train_loss": -27.29082679748535, "global_step": 25744, "epoch": 212} {"train_loss": -27.82795524597168, "global_step": 25745, "epoch": 212} {"train_loss": -29.467878341674805, "global_step": 25746, "epoch": 212} {"train_loss": -27.811676025390625, "global_step": 25747, "epoch": 212} {"train_loss": -28.818180084228516, "global_step": 25748, "epoch": 212} {"train_loss": -30.939477920532227, "global_step": 25749, "epoch": 212} {"train_loss": -29.7901611328125, "global_step": 25750, "epoch": 212} {"train_loss": -29.032800674438477, "global_step": 25751, "epoch": 212} {"train_loss": -28.841772079467773, "global_step": 25752, "epoch": 212} {"train_loss": -30.989858627319336, "global_step": 25753, "epoch": 212} {"train_loss": -29.973480224609375, "global_step": 25754, "epoch": 212} {"train_loss": -30.23109245300293, "global_step": 25755, "epoch": 212} {"train_loss": -29.981098175048828, "global_step": 25756, "epoch": 212} {"train_loss": -30.252044677734375, "global_step": 25757, "epoch": 212} {"train_loss": -30.788434982299805, "global_step": 25758, "epoch": 212} {"train_loss": -30.47757911682129, "global_step": 25759, "epoch": 212} {"train_loss": -31.018049240112305, "global_step": 25760, "epoch": 212} {"train_loss": -30.3541259765625, "global_step": 25761, "epoch": 212} {"train_loss": -30.78473472595215, "global_step": 25762, "epoch": 212} {"train_loss": -30.590768814086914, "global_step": 25763, "epoch": 212} {"train_loss": -31.041486740112305, "global_step": 25764, "epoch": 212} {"train_loss": -31.230005264282227, "global_step": 25765, "epoch": 212} {"train_loss": -31.2276668548584, "global_step": 25766, "epoch": 212} {"train_loss": -30.923583984375, "global_step": 25767, "epoch": 212} {"train_loss": -31.133100509643555, "global_step": 25768, "epoch": 212} {"train_loss": -31.0939998626709, "global_step": 25769, "epoch": 212} {"train_loss": -30.97041130065918, "global_step": 25770, "epoch": 212} {"train_loss": -30.570785522460938, "global_step": 25771, "epoch": 212} {"train_loss": -30.57176560015718, "global_step": 25772, "epoch": 212, "val_loss": 2606019.75} {"train_loss": -31.612985610961914, "global_step": 25773, "epoch": 213} {"train_loss": -31.344970703125, "global_step": 25774, "epoch": 213} {"train_loss": -31.11695671081543, "global_step": 25775, "epoch": 213} {"train_loss": -30.9973087310791, "global_step": 25776, "epoch": 213} {"train_loss": -31.264022827148438, "global_step": 25777, "epoch": 213} {"train_loss": -31.23199462890625, "global_step": 25778, "epoch": 213} {"train_loss": -31.29998207092285, "global_step": 25779, "epoch": 213} {"train_loss": -31.05877113342285, "global_step": 25780, "epoch": 213} {"train_loss": -31.267019271850586, "global_step": 25781, "epoch": 213} {"train_loss": -30.730005264282227, "global_step": 25782, "epoch": 213} {"train_loss": -30.302967071533203, "global_step": 25783, "epoch": 213} {"train_loss": -30.778614044189453, "global_step": 25784, "epoch": 213} {"train_loss": -31.59675407409668, "global_step": 25785, "epoch": 213} {"train_loss": -31.619531631469727, "global_step": 25786, "epoch": 213} {"train_loss": -31.396106719970703, "global_step": 25787, "epoch": 213} {"train_loss": -30.1644287109375, "global_step": 25788, "epoch": 213} {"train_loss": -29.602447509765625, "global_step": 25789, "epoch": 213} {"train_loss": -31.552494049072266, "global_step": 25790, "epoch": 213} {"train_loss": -31.218290328979492, "global_step": 25791, "epoch": 213} {"train_loss": -31.26722526550293, "global_step": 25792, "epoch": 213} {"train_loss": -31.073348999023438, "global_step": 25793, "epoch": 213} {"train_loss": -30.132917404174805, "global_step": 25794, "epoch": 213} {"train_loss": -31.14322853088379, "global_step": 25795, "epoch": 213} {"train_loss": -30.688024520874023, "global_step": 25796, "epoch": 213} {"train_loss": -30.900678634643555, "global_step": 25797, "epoch": 213} {"train_loss": -31.24240493774414, "global_step": 25798, "epoch": 213} {"train_loss": -30.9886474609375, "global_step": 25799, "epoch": 213} {"train_loss": -31.0887393951416, "global_step": 25800, "epoch": 213} {"train_loss": -30.38663673400879, "global_step": 25801, "epoch": 213} {"train_loss": -30.16011619567871, "global_step": 25802, "epoch": 213} {"train_loss": -30.8358097076416, "global_step": 25803, "epoch": 213} {"train_loss": -30.440185546875, "global_step": 25804, "epoch": 213} {"train_loss": -29.566137313842773, "global_step": 25805, "epoch": 213} {"train_loss": -26.812673568725586, "global_step": 25806, "epoch": 213} {"train_loss": -28.97458839416504, "global_step": 25807, "epoch": 213} {"train_loss": -30.497028350830078, "global_step": 25808, "epoch": 213} {"train_loss": -30.697412490844727, "global_step": 25809, "epoch": 213} {"train_loss": -30.289846420288086, "global_step": 25810, "epoch": 213} {"train_loss": -31.104339599609375, "global_step": 25811, "epoch": 213} {"train_loss": -30.588842391967773, "global_step": 25812, "epoch": 213} {"train_loss": -30.976367950439453, "global_step": 25813, "epoch": 213} {"train_loss": -31.001453399658203, "global_step": 25814, "epoch": 213} {"train_loss": -30.942829132080078, "global_step": 25815, "epoch": 213} {"train_loss": -30.9124813079834, "global_step": 25816, "epoch": 213} {"train_loss": -30.831846237182617, "global_step": 25817, "epoch": 213} {"train_loss": -31.312231063842773, "global_step": 25818, "epoch": 213} {"train_loss": -30.879392623901367, "global_step": 25819, "epoch": 213} {"train_loss": -31.25599479675293, "global_step": 25820, "epoch": 213} {"train_loss": -31.174901962280273, "global_step": 25821, "epoch": 213} {"train_loss": -30.72236442565918, "global_step": 25822, "epoch": 213} {"train_loss": -31.16517448425293, "global_step": 25823, "epoch": 213} {"train_loss": -31.410541534423828, "global_step": 25824, "epoch": 213} {"train_loss": -31.102588653564453, "global_step": 25825, "epoch": 213} {"train_loss": -31.33942985534668, "global_step": 25826, "epoch": 213} {"train_loss": -31.720458984375, "global_step": 25827, "epoch": 213} {"train_loss": -31.28326988220215, "global_step": 25828, "epoch": 213} {"train_loss": -31.280614852905273, "global_step": 25829, "epoch": 213} {"train_loss": -31.325897216796875, "global_step": 25830, "epoch": 213} {"train_loss": -31.654584884643555, "global_step": 25831, "epoch": 213} {"train_loss": -31.7094783782959, "global_step": 25832, "epoch": 213} {"train_loss": -31.51264762878418, "global_step": 25833, "epoch": 213} {"train_loss": -31.420530319213867, "global_step": 25834, "epoch": 213} {"train_loss": -31.665990829467773, "global_step": 25835, "epoch": 213} {"train_loss": -31.71473503112793, "global_step": 25836, "epoch": 213} {"train_loss": -31.434814453125, "global_step": 25837, "epoch": 213} {"train_loss": -31.881942749023438, "global_step": 25838, "epoch": 213} {"train_loss": -31.36289405822754, "global_step": 25839, "epoch": 213} {"train_loss": -31.657779693603516, "global_step": 25840, "epoch": 213} {"train_loss": -31.529144287109375, "global_step": 25841, "epoch": 213} {"train_loss": -31.14369010925293, "global_step": 25842, "epoch": 213} {"train_loss": -31.38453483581543, "global_step": 25843, "epoch": 213} {"train_loss": -31.704181671142578, "global_step": 25844, "epoch": 213} {"train_loss": -31.7414608001709, "global_step": 25845, "epoch": 213} {"train_loss": -31.59793472290039, "global_step": 25846, "epoch": 213} {"train_loss": -31.384984970092773, "global_step": 25847, "epoch": 213} {"train_loss": -31.606735229492188, "global_step": 25848, "epoch": 213} {"train_loss": -31.827795028686523, "global_step": 25849, "epoch": 213} {"train_loss": -31.46588134765625, "global_step": 25850, "epoch": 213} {"train_loss": -31.981830596923828, "global_step": 25851, "epoch": 213} {"train_loss": -31.54743003845215, "global_step": 25852, "epoch": 213} {"train_loss": -30.969470977783203, "global_step": 25853, "epoch": 213} {"train_loss": -30.883142471313477, "global_step": 25854, "epoch": 213} {"train_loss": -31.276464462280273, "global_step": 25855, "epoch": 213} {"train_loss": -31.9686336517334, "global_step": 25856, "epoch": 213} {"train_loss": -31.65755271911621, "global_step": 25857, "epoch": 213} {"train_loss": -31.55002784729004, "global_step": 25858, "epoch": 213} {"train_loss": -30.993886947631836, "global_step": 25859, "epoch": 213} {"train_loss": -29.831140518188477, "global_step": 25860, "epoch": 213} {"train_loss": -30.00605583190918, "global_step": 25861, "epoch": 213} {"train_loss": -31.040771484375, "global_step": 25862, "epoch": 213} {"train_loss": -32.08269119262695, "global_step": 25863, "epoch": 213} {"train_loss": -30.400487899780273, "global_step": 25864, "epoch": 213} {"train_loss": -30.81743812561035, "global_step": 25865, "epoch": 213} {"train_loss": -31.406461715698242, "global_step": 25866, "epoch": 213} {"train_loss": -31.426654815673828, "global_step": 25867, "epoch": 213} {"train_loss": -30.95713233947754, "global_step": 25868, "epoch": 213} {"train_loss": -31.6586856842041, "global_step": 25869, "epoch": 213} {"train_loss": -31.0828857421875, "global_step": 25870, "epoch": 213} {"train_loss": -30.815509796142578, "global_step": 25871, "epoch": 213} {"train_loss": -31.414045333862305, "global_step": 25872, "epoch": 213} {"train_loss": -31.60572624206543, "global_step": 25873, "epoch": 213} {"train_loss": -31.0827693939209, "global_step": 25874, "epoch": 213} {"train_loss": -31.474567413330078, "global_step": 25875, "epoch": 213} {"train_loss": -31.62491798400879, "global_step": 25876, "epoch": 213} {"train_loss": -31.106481552124023, "global_step": 25877, "epoch": 213} {"train_loss": -31.41437339782715, "global_step": 25878, "epoch": 213} {"train_loss": -31.63332176208496, "global_step": 25879, "epoch": 213} {"train_loss": -31.861663818359375, "global_step": 25880, "epoch": 213} {"train_loss": -31.72230339050293, "global_step": 25881, "epoch": 213} {"train_loss": -31.89084243774414, "global_step": 25882, "epoch": 213} {"train_loss": -31.29047203063965, "global_step": 25883, "epoch": 213} {"train_loss": -31.3193302154541, "global_step": 25884, "epoch": 213} {"train_loss": -31.703155517578125, "global_step": 25885, "epoch": 213} {"train_loss": -31.049484252929688, "global_step": 25886, "epoch": 213} {"train_loss": -31.218412399291992, "global_step": 25887, "epoch": 213} {"train_loss": -30.974302291870117, "global_step": 25888, "epoch": 213} {"train_loss": -31.439289093017578, "global_step": 25889, "epoch": 213} {"train_loss": -30.7995548248291, "global_step": 25890, "epoch": 213} {"train_loss": -30.623620986938477, "global_step": 25891, "epoch": 213} {"train_loss": -31.396869659423828, "global_step": 25892, "epoch": 213} {"train_loss": -31.117217166364686, "global_step": 25893, "epoch": 213, "val_loss": 2555313.25} {"train_loss": -31.077253341674805, "global_step": 25894, "epoch": 214} {"train_loss": -31.800800323486328, "global_step": 25895, "epoch": 214} {"train_loss": -31.016998291015625, "global_step": 25896, "epoch": 214} {"train_loss": -31.654966354370117, "global_step": 25897, "epoch": 214} {"train_loss": -31.27985954284668, "global_step": 25898, "epoch": 214} {"train_loss": -31.773086547851562, "global_step": 25899, "epoch": 214} {"train_loss": -31.77288246154785, "global_step": 25900, "epoch": 214} {"train_loss": -31.756519317626953, "global_step": 25901, "epoch": 214} {"train_loss": -32.00678634643555, "global_step": 25902, "epoch": 214} {"train_loss": -31.654972076416016, "global_step": 25903, "epoch": 214} {"train_loss": -31.294092178344727, "global_step": 25904, "epoch": 214} {"train_loss": -31.92279624938965, "global_step": 25905, "epoch": 214} {"train_loss": -31.540327072143555, "global_step": 25906, "epoch": 214} {"train_loss": -32.27248764038086, "global_step": 25907, "epoch": 214} {"train_loss": -32.02132034301758, "global_step": 25908, "epoch": 214} {"train_loss": -32.2175178527832, "global_step": 25909, "epoch": 214} {"train_loss": -32.08115768432617, "global_step": 25910, "epoch": 214} {"train_loss": -32.26118087768555, "global_step": 25911, "epoch": 214} {"train_loss": -31.830493927001953, "global_step": 25912, "epoch": 214} {"train_loss": -31.57770347595215, "global_step": 25913, "epoch": 214} {"train_loss": -31.238800048828125, "global_step": 25914, "epoch": 214} {"train_loss": -31.42255210876465, "global_step": 25915, "epoch": 214} {"train_loss": -31.49152946472168, "global_step": 25916, "epoch": 214} {"train_loss": -32.10833740234375, "global_step": 25917, "epoch": 214} {"train_loss": -32.4674186706543, "global_step": 25918, "epoch": 214} {"train_loss": -32.44254684448242, "global_step": 25919, "epoch": 214} {"train_loss": -32.64071273803711, "global_step": 25920, "epoch": 214} {"train_loss": -31.58741569519043, "global_step": 25921, "epoch": 214} {"train_loss": -29.265295028686523, "global_step": 25922, "epoch": 214} {"train_loss": -32.54964828491211, "global_step": 25923, "epoch": 214} {"train_loss": -30.804752349853516, "global_step": 25924, "epoch": 214} {"train_loss": -32.278743743896484, "global_step": 25925, "epoch": 214} {"train_loss": -31.73552894592285, "global_step": 25926, "epoch": 214} {"train_loss": -32.58051681518555, "global_step": 25927, "epoch": 214} {"train_loss": -31.65447998046875, "global_step": 25928, "epoch": 214} {"train_loss": -32.225887298583984, "global_step": 25929, "epoch": 214} {"train_loss": -31.7326717376709, "global_step": 25930, "epoch": 214} {"train_loss": -31.85291862487793, "global_step": 25931, "epoch": 214} {"train_loss": -30.856428146362305, "global_step": 25932, "epoch": 214} {"train_loss": -30.62836265563965, "global_step": 25933, "epoch": 214} {"train_loss": -32.14983367919922, "global_step": 25934, "epoch": 214} {"train_loss": -32.293731689453125, "global_step": 25935, "epoch": 214} {"train_loss": -31.739316940307617, "global_step": 25936, "epoch": 214} {"train_loss": -30.876874923706055, "global_step": 25937, "epoch": 214} {"train_loss": -31.0102596282959, "global_step": 25938, "epoch": 214} {"train_loss": -31.6711368560791, "global_step": 25939, "epoch": 214} {"train_loss": -32.28211975097656, "global_step": 25940, "epoch": 214} {"train_loss": -32.3082160949707, "global_step": 25941, "epoch": 214} {"train_loss": -31.495954513549805, "global_step": 25942, "epoch": 214} {"train_loss": -30.963226318359375, "global_step": 25943, "epoch": 214} {"train_loss": -30.10857582092285, "global_step": 25944, "epoch": 214} {"train_loss": -29.415624618530273, "global_step": 25945, "epoch": 214} {"train_loss": -29.814807891845703, "global_step": 25946, "epoch": 214} {"train_loss": -30.255094528198242, "global_step": 25947, "epoch": 214} {"train_loss": -31.630422592163086, "global_step": 25948, "epoch": 214} {"train_loss": -31.880817413330078, "global_step": 25949, "epoch": 214} {"train_loss": -30.7636661529541, "global_step": 25950, "epoch": 214} {"train_loss": -31.26954460144043, "global_step": 25951, "epoch": 214} {"train_loss": -31.9366397857666, "global_step": 25952, "epoch": 214} {"train_loss": -31.182758331298828, "global_step": 25953, "epoch": 214} {"train_loss": -30.3020076751709, "global_step": 25954, "epoch": 214} {"train_loss": -32.17691421508789, "global_step": 25955, "epoch": 214} {"train_loss": -31.55059814453125, "global_step": 25956, "epoch": 214} {"train_loss": -32.175682067871094, "global_step": 25957, "epoch": 214} {"train_loss": -32.109214782714844, "global_step": 25958, "epoch": 214} {"train_loss": -31.28790855407715, "global_step": 25959, "epoch": 214} {"train_loss": -31.971500396728516, "global_step": 25960, "epoch": 214} {"train_loss": -31.191991806030273, "global_step": 25961, "epoch": 214} {"train_loss": -31.335983276367188, "global_step": 25962, "epoch": 214} {"train_loss": -31.85894203186035, "global_step": 25963, "epoch": 214} {"train_loss": -31.289587020874023, "global_step": 25964, "epoch": 214} {"train_loss": -31.656835556030273, "global_step": 25965, "epoch": 214} {"train_loss": -31.68877601623535, "global_step": 25966, "epoch": 214} {"train_loss": -31.824188232421875, "global_step": 25967, "epoch": 214} {"train_loss": -31.827741622924805, "global_step": 25968, "epoch": 214} {"train_loss": -30.9145565032959, "global_step": 25969, "epoch": 214} {"train_loss": -31.74142837524414, "global_step": 25970, "epoch": 214} {"train_loss": -28.7508487701416, "global_step": 25971, "epoch": 214} {"train_loss": -31.137237548828125, "global_step": 25972, "epoch": 214} {"train_loss": -30.0703182220459, "global_step": 25973, "epoch": 214} {"train_loss": -31.578418731689453, "global_step": 25974, "epoch": 214} {"train_loss": -29.620391845703125, "global_step": 25975, "epoch": 214} {"train_loss": -32.00370407104492, "global_step": 25976, "epoch": 214} {"train_loss": -31.09882926940918, "global_step": 25977, "epoch": 214} {"train_loss": -31.687992095947266, "global_step": 25978, "epoch": 214} {"train_loss": -32.04116439819336, "global_step": 25979, "epoch": 214} {"train_loss": -31.97247314453125, "global_step": 25980, "epoch": 214} {"train_loss": -31.83881950378418, "global_step": 25981, "epoch": 214} {"train_loss": -31.837451934814453, "global_step": 25982, "epoch": 214} {"train_loss": -31.703031539916992, "global_step": 25983, "epoch": 214} {"train_loss": -31.838653564453125, "global_step": 25984, "epoch": 214} {"train_loss": -31.79833984375, "global_step": 25985, "epoch": 214} {"train_loss": -32.00870895385742, "global_step": 25986, "epoch": 214} {"train_loss": -32.15130615234375, "global_step": 25987, "epoch": 214} {"train_loss": -31.76719093322754, "global_step": 25988, "epoch": 214} {"train_loss": -31.178815841674805, "global_step": 25989, "epoch": 214} {"train_loss": -31.208789825439453, "global_step": 25990, "epoch": 214} {"train_loss": -31.615188598632812, "global_step": 25991, "epoch": 214} {"train_loss": -31.513843536376953, "global_step": 25992, "epoch": 214} {"train_loss": -30.560134887695312, "global_step": 25993, "epoch": 214} {"train_loss": -28.221088409423828, "global_step": 25994, "epoch": 214} {"train_loss": -24.730642318725586, "global_step": 25995, "epoch": 214} {"train_loss": -20.49442481994629, "global_step": 25996, "epoch": 214} {"train_loss": -26.13958740234375, "global_step": 25997, "epoch": 214} {"train_loss": -29.669248580932617, "global_step": 25998, "epoch": 214} {"train_loss": -22.685468673706055, "global_step": 25999, "epoch": 214} {"train_loss": -30.228940963745117, "global_step": 26000, "epoch": 214} {"train_loss": -26.784467697143555, "global_step": 26001, "epoch": 214} {"train_loss": -30.626712799072266, "global_step": 26002, "epoch": 214} {"train_loss": -28.45509147644043, "global_step": 26003, "epoch": 214} {"train_loss": -30.052038192749023, "global_step": 26004, "epoch": 214} {"train_loss": -29.05765151977539, "global_step": 26005, "epoch": 214} {"train_loss": -29.82354736328125, "global_step": 26006, "epoch": 214} {"train_loss": -30.702802658081055, "global_step": 26007, "epoch": 214} {"train_loss": -29.79962158203125, "global_step": 26008, "epoch": 214} {"train_loss": -30.511411666870117, "global_step": 26009, "epoch": 214} {"train_loss": -30.646657943725586, "global_step": 26010, "epoch": 214} {"train_loss": -30.693775177001953, "global_step": 26011, "epoch": 214} {"train_loss": -30.059295654296875, "global_step": 26012, "epoch": 214} {"train_loss": -30.3652286529541, "global_step": 26013, "epoch": 214} {"train_loss": -31.007239854040225, "global_step": 26014, "epoch": 214, "val_loss": 2656664.75} {"train_loss": -30.800146102905273, "global_step": 26015, "epoch": 215} {"train_loss": -30.515750885009766, "global_step": 26016, "epoch": 215} {"train_loss": -30.921472549438477, "global_step": 26017, "epoch": 215} {"train_loss": -31.43505859375, "global_step": 26018, "epoch": 215} {"train_loss": -31.077533721923828, "global_step": 26019, "epoch": 215} {"train_loss": -31.312637329101562, "global_step": 26020, "epoch": 215} {"train_loss": -31.14116859436035, "global_step": 26021, "epoch": 215} {"train_loss": -31.68210220336914, "global_step": 26022, "epoch": 215} {"train_loss": -31.518247604370117, "global_step": 26023, "epoch": 215} {"train_loss": -31.287799835205078, "global_step": 26024, "epoch": 215} {"train_loss": -31.65468406677246, "global_step": 26025, "epoch": 215} {"train_loss": -31.49239158630371, "global_step": 26026, "epoch": 215} {"train_loss": -31.787206649780273, "global_step": 26027, "epoch": 215} {"train_loss": -31.569738388061523, "global_step": 26028, "epoch": 215} {"train_loss": -31.67872428894043, "global_step": 26029, "epoch": 215} {"train_loss": -31.914630889892578, "global_step": 26030, "epoch": 215} {"train_loss": -31.94125747680664, "global_step": 26031, "epoch": 215} {"train_loss": -31.6130313873291, "global_step": 26032, "epoch": 215} {"train_loss": -31.09283447265625, "global_step": 26033, "epoch": 215} {"train_loss": -31.59659767150879, "global_step": 26034, "epoch": 215} {"train_loss": -31.024494171142578, "global_step": 26035, "epoch": 215} {"train_loss": -32.28710174560547, "global_step": 26036, "epoch": 215} {"train_loss": -31.543851852416992, "global_step": 26037, "epoch": 215} {"train_loss": -31.5123348236084, "global_step": 26038, "epoch": 215} {"train_loss": -30.615497589111328, "global_step": 26039, "epoch": 215} {"train_loss": -29.88197135925293, "global_step": 26040, "epoch": 215} {"train_loss": -29.70566749572754, "global_step": 26041, "epoch": 215} {"train_loss": -31.242292404174805, "global_step": 26042, "epoch": 215} {"train_loss": -31.6990909576416, "global_step": 26043, "epoch": 215} {"train_loss": -31.681833267211914, "global_step": 26044, "epoch": 215} {"train_loss": -30.248565673828125, "global_step": 26045, "epoch": 215} {"train_loss": -31.96078872680664, "global_step": 26046, "epoch": 215} {"train_loss": -31.443328857421875, "global_step": 26047, "epoch": 215} {"train_loss": -31.695968627929688, "global_step": 26048, "epoch": 215} {"train_loss": -31.540313720703125, "global_step": 26049, "epoch": 215} {"train_loss": -31.88270378112793, "global_step": 26050, "epoch": 215} {"train_loss": -30.74371910095215, "global_step": 26051, "epoch": 215} {"train_loss": -29.94061851501465, "global_step": 26052, "epoch": 215} {"train_loss": -27.654592514038086, "global_step": 26053, "epoch": 215} {"train_loss": -22.324176788330078, "global_step": 26054, "epoch": 215} {"train_loss": -15.897111892700195, "global_step": 26055, "epoch": 215} {"train_loss": -21.29234504699707, "global_step": 26056, "epoch": 215} {"train_loss": -31.06524658203125, "global_step": 26057, "epoch": 215} {"train_loss": -25.699609756469727, "global_step": 26058, "epoch": 215} {"train_loss": -30.08176612854004, "global_step": 26059, "epoch": 215} {"train_loss": -29.2402286529541, "global_step": 26060, "epoch": 215} {"train_loss": -28.513273239135742, "global_step": 26061, "epoch": 215} {"train_loss": -30.817724227905273, "global_step": 26062, "epoch": 215} {"train_loss": -30.443113327026367, "global_step": 26063, "epoch": 215} {"train_loss": -29.13899040222168, "global_step": 26064, "epoch": 215} {"train_loss": -30.251455307006836, "global_step": 26065, "epoch": 215} {"train_loss": -30.836002349853516, "global_step": 26066, "epoch": 215} {"train_loss": -30.532379150390625, "global_step": 26067, "epoch": 215} {"train_loss": -30.737539291381836, "global_step": 26068, "epoch": 215} {"train_loss": -30.44235610961914, "global_step": 26069, "epoch": 215} {"train_loss": -30.557218551635742, "global_step": 26070, "epoch": 215} {"train_loss": -30.781402587890625, "global_step": 26071, "epoch": 215} {"train_loss": -31.14599609375, "global_step": 26072, "epoch": 215} {"train_loss": -31.053607940673828, "global_step": 26073, "epoch": 215} {"train_loss": -30.860477447509766, "global_step": 26074, "epoch": 215} {"train_loss": -30.920080184936523, "global_step": 26075, "epoch": 215} {"train_loss": -31.224645614624023, "global_step": 26076, "epoch": 215} {"train_loss": -31.515771865844727, "global_step": 26077, "epoch": 215} {"train_loss": -30.984785079956055, "global_step": 26078, "epoch": 215} {"train_loss": -31.009464263916016, "global_step": 26079, "epoch": 215} {"train_loss": -31.0831298828125, "global_step": 26080, "epoch": 215} {"train_loss": -31.13400650024414, "global_step": 26081, "epoch": 215} {"train_loss": -30.96345329284668, "global_step": 26082, "epoch": 215} {"train_loss": -31.298437118530273, "global_step": 26083, "epoch": 215} {"train_loss": -31.063703536987305, "global_step": 26084, "epoch": 215} {"train_loss": -31.693683624267578, "global_step": 26085, "epoch": 215} {"train_loss": -31.086267471313477, "global_step": 26086, "epoch": 215} {"train_loss": -31.030725479125977, "global_step": 26087, "epoch": 215} {"train_loss": -31.264307022094727, "global_step": 26088, "epoch": 215} {"train_loss": -31.467472076416016, "global_step": 26089, "epoch": 215} {"train_loss": -30.518686294555664, "global_step": 26090, "epoch": 215} {"train_loss": -30.975997924804688, "global_step": 26091, "epoch": 215} {"train_loss": -31.285846710205078, "global_step": 26092, "epoch": 215} {"train_loss": -31.390371322631836, "global_step": 26093, "epoch": 215} {"train_loss": -31.017663955688477, "global_step": 26094, "epoch": 215} {"train_loss": -30.848331451416016, "global_step": 26095, "epoch": 215} {"train_loss": -30.728073120117188, "global_step": 26096, "epoch": 215} {"train_loss": -31.130285263061523, "global_step": 26097, "epoch": 215} {"train_loss": -31.1995849609375, "global_step": 26098, "epoch": 215} {"train_loss": -31.199359893798828, "global_step": 26099, "epoch": 215} {"train_loss": -30.297895431518555, "global_step": 26100, "epoch": 215} {"train_loss": -30.723371505737305, "global_step": 26101, "epoch": 215} {"train_loss": -30.999835968017578, "global_step": 26102, "epoch": 215} {"train_loss": -31.326074600219727, "global_step": 26103, "epoch": 215} {"train_loss": -30.8808536529541, "global_step": 26104, "epoch": 215} {"train_loss": -31.148178100585938, "global_step": 26105, "epoch": 215} {"train_loss": -30.873090744018555, "global_step": 26106, "epoch": 215} {"train_loss": -31.039945602416992, "global_step": 26107, "epoch": 215} {"train_loss": -30.92255973815918, "global_step": 26108, "epoch": 215} {"train_loss": -31.208402633666992, "global_step": 26109, "epoch": 215} {"train_loss": -31.696765899658203, "global_step": 26110, "epoch": 215} {"train_loss": -30.583505630493164, "global_step": 26111, "epoch": 215} {"train_loss": -31.10150146484375, "global_step": 26112, "epoch": 215} {"train_loss": -30.246423721313477, "global_step": 26113, "epoch": 215} {"train_loss": -31.157291412353516, "global_step": 26114, "epoch": 215} {"train_loss": -31.383535385131836, "global_step": 26115, "epoch": 215} {"train_loss": -31.065658569335938, "global_step": 26116, "epoch": 215} {"train_loss": -31.521093368530273, "global_step": 26117, "epoch": 215} {"train_loss": -31.054218292236328, "global_step": 26118, "epoch": 215} {"train_loss": -30.565229415893555, "global_step": 26119, "epoch": 215} {"train_loss": -31.6014347076416, "global_step": 26120, "epoch": 215} {"train_loss": -31.573774337768555, "global_step": 26121, "epoch": 215} {"train_loss": -31.510726928710938, "global_step": 26122, "epoch": 215} {"train_loss": -31.4525089263916, "global_step": 26123, "epoch": 215} {"train_loss": -31.473779678344727, "global_step": 26124, "epoch": 215} {"train_loss": -31.446491241455078, "global_step": 26125, "epoch": 215} {"train_loss": -31.339506149291992, "global_step": 26126, "epoch": 215} {"train_loss": -31.878576278686523, "global_step": 26127, "epoch": 215} {"train_loss": -32.086605072021484, "global_step": 26128, "epoch": 215} {"train_loss": -31.28260612487793, "global_step": 26129, "epoch": 215} {"train_loss": -30.985279083251953, "global_step": 26130, "epoch": 215} {"train_loss": -31.825519561767578, "global_step": 26131, "epoch": 215} {"train_loss": -31.848127365112305, "global_step": 26132, "epoch": 215} {"train_loss": -31.375080108642578, "global_step": 26133, "epoch": 215} {"train_loss": -31.152847290039062, "global_step": 26134, "epoch": 215} {"train_loss": -30.74684537146702, "global_step": 26135, "epoch": 215, "val_loss": 2539754.75} {"train_loss": -32.17991638183594, "global_step": 26136, "epoch": 216} {"train_loss": -31.719257354736328, "global_step": 26137, "epoch": 216} {"train_loss": -31.667240142822266, "global_step": 26138, "epoch": 216} {"train_loss": -31.817642211914062, "global_step": 26139, "epoch": 216} {"train_loss": -31.78809928894043, "global_step": 26140, "epoch": 216} {"train_loss": -31.838857650756836, "global_step": 26141, "epoch": 216} {"train_loss": -31.217920303344727, "global_step": 26142, "epoch": 216} {"train_loss": -32.23655319213867, "global_step": 26143, "epoch": 216} {"train_loss": -32.0384635925293, "global_step": 26144, "epoch": 216} {"train_loss": -31.5788516998291, "global_step": 26145, "epoch": 216} {"train_loss": -31.641000747680664, "global_step": 26146, "epoch": 216} {"train_loss": -31.535755157470703, "global_step": 26147, "epoch": 216} {"train_loss": -32.456180572509766, "global_step": 26148, "epoch": 216} {"train_loss": -31.787158966064453, "global_step": 26149, "epoch": 216} {"train_loss": -32.14263916015625, "global_step": 26150, "epoch": 216} {"train_loss": -31.932804107666016, "global_step": 26151, "epoch": 216} {"train_loss": -31.89208984375, "global_step": 26152, "epoch": 216} {"train_loss": -32.27113342285156, "global_step": 26153, "epoch": 216} {"train_loss": -32.0472297668457, "global_step": 26154, "epoch": 216} {"train_loss": -32.15555953979492, "global_step": 26155, "epoch": 216} {"train_loss": -32.0123291015625, "global_step": 26156, "epoch": 216} {"train_loss": -31.364973068237305, "global_step": 26157, "epoch": 216} {"train_loss": -31.33342933654785, "global_step": 26158, "epoch": 216} {"train_loss": -31.474109649658203, "global_step": 26159, "epoch": 216} {"train_loss": -31.87322425842285, "global_step": 26160, "epoch": 216} {"train_loss": -31.47886085510254, "global_step": 26161, "epoch": 216} {"train_loss": -31.491687774658203, "global_step": 26162, "epoch": 216} {"train_loss": -32.21446228027344, "global_step": 26163, "epoch": 216} {"train_loss": -31.88776206970215, "global_step": 26164, "epoch": 216} {"train_loss": -31.61225700378418, "global_step": 26165, "epoch": 216} {"train_loss": -31.060434341430664, "global_step": 26166, "epoch": 216} {"train_loss": -30.862689971923828, "global_step": 26167, "epoch": 216} {"train_loss": -30.523855209350586, "global_step": 26168, "epoch": 216} {"train_loss": -29.16983413696289, "global_step": 26169, "epoch": 216} {"train_loss": -25.689777374267578, "global_step": 26170, "epoch": 216} {"train_loss": -18.751279830932617, "global_step": 26171, "epoch": 216} {"train_loss": -13.853815078735352, "global_step": 26172, "epoch": 216} {"train_loss": -28.233495712280273, "global_step": 26173, "epoch": 216} {"train_loss": -29.12653160095215, "global_step": 26174, "epoch": 216} {"train_loss": -28.42066764831543, "global_step": 26175, "epoch": 216} {"train_loss": -30.84356117248535, "global_step": 26176, "epoch": 216} {"train_loss": -29.53860855102539, "global_step": 26177, "epoch": 216} {"train_loss": -30.111892700195312, "global_step": 26178, "epoch": 216} {"train_loss": -30.91144371032715, "global_step": 26179, "epoch": 216} {"train_loss": -29.716541290283203, "global_step": 26180, "epoch": 216} {"train_loss": -30.785322189331055, "global_step": 26181, "epoch": 216} {"train_loss": -30.56220054626465, "global_step": 26182, "epoch": 216} {"train_loss": -27.529388427734375, "global_step": 26183, "epoch": 216} {"train_loss": -29.740209579467773, "global_step": 26184, "epoch": 216} {"train_loss": -29.752521514892578, "global_step": 26185, "epoch": 216} {"train_loss": -28.195480346679688, "global_step": 26186, "epoch": 216} {"train_loss": -29.53389549255371, "global_step": 26187, "epoch": 216} {"train_loss": -28.929962158203125, "global_step": 26188, "epoch": 216} {"train_loss": -30.955307006835938, "global_step": 26189, "epoch": 216} {"train_loss": -30.008779525756836, "global_step": 26190, "epoch": 216} {"train_loss": -30.347888946533203, "global_step": 26191, "epoch": 216} {"train_loss": -30.499774932861328, "global_step": 26192, "epoch": 216} {"train_loss": -29.89320182800293, "global_step": 26193, "epoch": 216} {"train_loss": -31.243616104125977, "global_step": 26194, "epoch": 216} {"train_loss": -30.35297966003418, "global_step": 26195, "epoch": 216} {"train_loss": -30.181716918945312, "global_step": 26196, "epoch": 216} {"train_loss": -30.888952255249023, "global_step": 26197, "epoch": 216} {"train_loss": -31.04071617126465, "global_step": 26198, "epoch": 216} {"train_loss": -30.820173263549805, "global_step": 26199, "epoch": 216} {"train_loss": -31.078954696655273, "global_step": 26200, "epoch": 216} {"train_loss": -31.151397705078125, "global_step": 26201, "epoch": 216} {"train_loss": -31.126535415649414, "global_step": 26202, "epoch": 216} {"train_loss": -31.179288864135742, "global_step": 26203, "epoch": 216} {"train_loss": -31.146316528320312, "global_step": 26204, "epoch": 216} {"train_loss": -31.3859806060791, "global_step": 26205, "epoch": 216} {"train_loss": -31.395217895507812, "global_step": 26206, "epoch": 216} {"train_loss": -31.209613800048828, "global_step": 26207, "epoch": 216} {"train_loss": -31.566940307617188, "global_step": 26208, "epoch": 216} {"train_loss": -31.081989288330078, "global_step": 26209, "epoch": 216} {"train_loss": -31.754682540893555, "global_step": 26210, "epoch": 216} {"train_loss": -30.990015029907227, "global_step": 26211, "epoch": 216} {"train_loss": -31.804941177368164, "global_step": 26212, "epoch": 216} {"train_loss": -31.60015869140625, "global_step": 26213, "epoch": 216} {"train_loss": -31.369482040405273, "global_step": 26214, "epoch": 216} {"train_loss": -31.869977951049805, "global_step": 26215, "epoch": 216} {"train_loss": -31.499448776245117, "global_step": 26216, "epoch": 216} {"train_loss": -31.490264892578125, "global_step": 26217, "epoch": 216} {"train_loss": -32.00704574584961, "global_step": 26218, "epoch": 216} {"train_loss": -31.53480339050293, "global_step": 26219, "epoch": 216} {"train_loss": -31.816669464111328, "global_step": 26220, "epoch": 216} {"train_loss": -31.944257736206055, "global_step": 26221, "epoch": 216} {"train_loss": -31.800537109375, "global_step": 26222, "epoch": 216} {"train_loss": -31.9249324798584, "global_step": 26223, "epoch": 216} {"train_loss": -32.002655029296875, "global_step": 26224, "epoch": 216} {"train_loss": -31.806446075439453, "global_step": 26225, "epoch": 216} {"train_loss": -31.81867027282715, "global_step": 26226, "epoch": 216} {"train_loss": -31.81537437438965, "global_step": 26227, "epoch": 216} {"train_loss": -32.15664291381836, "global_step": 26228, "epoch": 216} {"train_loss": -31.98748779296875, "global_step": 26229, "epoch": 216} {"train_loss": -31.377521514892578, "global_step": 26230, "epoch": 216} {"train_loss": -31.667516708374023, "global_step": 26231, "epoch": 216} {"train_loss": -31.182586669921875, "global_step": 26232, "epoch": 216} {"train_loss": -31.325733184814453, "global_step": 26233, "epoch": 216} {"train_loss": -31.89239501953125, "global_step": 26234, "epoch": 216} {"train_loss": -31.942615509033203, "global_step": 26235, "epoch": 216} {"train_loss": -31.238697052001953, "global_step": 26236, "epoch": 216} {"train_loss": -30.246381759643555, "global_step": 26237, "epoch": 216} {"train_loss": -30.19843864440918, "global_step": 26238, "epoch": 216} {"train_loss": -29.366132736206055, "global_step": 26239, "epoch": 216} {"train_loss": -30.9022274017334, "global_step": 26240, "epoch": 216} {"train_loss": -31.516218185424805, "global_step": 26241, "epoch": 216} {"train_loss": -29.402191162109375, "global_step": 26242, "epoch": 216} {"train_loss": -27.17249870300293, "global_step": 26243, "epoch": 216} {"train_loss": -31.437726974487305, "global_step": 26244, "epoch": 216} {"train_loss": -30.42120361328125, "global_step": 26245, "epoch": 216} {"train_loss": -30.169591903686523, "global_step": 26246, "epoch": 216} {"train_loss": -31.5771541595459, "global_step": 26247, "epoch": 216} {"train_loss": -29.5102481842041, "global_step": 26248, "epoch": 216} {"train_loss": -30.98150634765625, "global_step": 26249, "epoch": 216} {"train_loss": -30.748294830322266, "global_step": 26250, "epoch": 216} {"train_loss": -29.726593017578125, "global_step": 26251, "epoch": 216} {"train_loss": -30.794879913330078, "global_step": 26252, "epoch": 216} {"train_loss": -31.061819076538086, "global_step": 26253, "epoch": 216} {"train_loss": -31.089136123657227, "global_step": 26254, "epoch": 216} {"train_loss": -31.023883819580078, "global_step": 26255, "epoch": 216} {"train_loss": -30.740248183573573, "global_step": 26256, "epoch": 216, "val_loss": 2608215.25} {"train_loss": -30.51935386657715, "global_step": 26257, "epoch": 217} {"train_loss": -31.2390079498291, "global_step": 26258, "epoch": 217} {"train_loss": -31.246490478515625, "global_step": 26259, "epoch": 217} {"train_loss": -29.056692123413086, "global_step": 26260, "epoch": 217} {"train_loss": -31.38205337524414, "global_step": 26261, "epoch": 217} {"train_loss": -29.125890731811523, "global_step": 26262, "epoch": 217} {"train_loss": -31.563779830932617, "global_step": 26263, "epoch": 217} {"train_loss": -29.5421142578125, "global_step": 26264, "epoch": 217} {"train_loss": -31.380762100219727, "global_step": 26265, "epoch": 217} {"train_loss": -30.52947998046875, "global_step": 26266, "epoch": 217} {"train_loss": -31.347753524780273, "global_step": 26267, "epoch": 217} {"train_loss": -30.139257431030273, "global_step": 26268, "epoch": 217} {"train_loss": -31.213605880737305, "global_step": 26269, "epoch": 217} {"train_loss": -31.03668212890625, "global_step": 26270, "epoch": 217} {"train_loss": -31.328887939453125, "global_step": 26271, "epoch": 217} {"train_loss": -31.39967155456543, "global_step": 26272, "epoch": 217} {"train_loss": -31.320377349853516, "global_step": 26273, "epoch": 217} {"train_loss": -31.066537857055664, "global_step": 26274, "epoch": 217} {"train_loss": -31.13809585571289, "global_step": 26275, "epoch": 217} {"train_loss": -31.263809204101562, "global_step": 26276, "epoch": 217} {"train_loss": -31.52273941040039, "global_step": 26277, "epoch": 217} {"train_loss": -31.876300811767578, "global_step": 26278, "epoch": 217} {"train_loss": -31.628503799438477, "global_step": 26279, "epoch": 217} {"train_loss": -31.422531127929688, "global_step": 26280, "epoch": 217} {"train_loss": -31.50919532775879, "global_step": 26281, "epoch": 217} {"train_loss": -32.053260803222656, "global_step": 26282, "epoch": 217} {"train_loss": -31.75811767578125, "global_step": 26283, "epoch": 217} {"train_loss": -31.62275505065918, "global_step": 26284, "epoch": 217} {"train_loss": -31.117462158203125, "global_step": 26285, "epoch": 217} {"train_loss": -31.551313400268555, "global_step": 26286, "epoch": 217} {"train_loss": -31.808176040649414, "global_step": 26287, "epoch": 217} {"train_loss": -32.22764587402344, "global_step": 26288, "epoch": 217} {"train_loss": -32.35555648803711, "global_step": 26289, "epoch": 217} {"train_loss": -31.66681480407715, "global_step": 26290, "epoch": 217} {"train_loss": -31.926517486572266, "global_step": 26291, "epoch": 217} {"train_loss": -32.24036407470703, "global_step": 26292, "epoch": 217} {"train_loss": -31.41400718688965, "global_step": 26293, "epoch": 217} {"train_loss": -30.841337203979492, "global_step": 26294, "epoch": 217} {"train_loss": -31.730260848999023, "global_step": 26295, "epoch": 217} {"train_loss": -32.005462646484375, "global_step": 26296, "epoch": 217} {"train_loss": -30.49911880493164, "global_step": 26297, "epoch": 217} {"train_loss": -30.3780517578125, "global_step": 26298, "epoch": 217} {"train_loss": -32.22550964355469, "global_step": 26299, "epoch": 217} {"train_loss": -29.864770889282227, "global_step": 26300, "epoch": 217} {"train_loss": -30.210678100585938, "global_step": 26301, "epoch": 217} {"train_loss": -31.24676513671875, "global_step": 26302, "epoch": 217} {"train_loss": -31.1864070892334, "global_step": 26303, "epoch": 217} {"train_loss": -31.064428329467773, "global_step": 26304, "epoch": 217} {"train_loss": -31.553625106811523, "global_step": 26305, "epoch": 217} {"train_loss": -31.375019073486328, "global_step": 26306, "epoch": 217} {"train_loss": -31.654861450195312, "global_step": 26307, "epoch": 217} {"train_loss": -31.69489860534668, "global_step": 26308, "epoch": 217} {"train_loss": -31.489683151245117, "global_step": 26309, "epoch": 217} {"train_loss": -31.614593505859375, "global_step": 26310, "epoch": 217} {"train_loss": -31.565885543823242, "global_step": 26311, "epoch": 217} {"train_loss": -31.420263290405273, "global_step": 26312, "epoch": 217} {"train_loss": -31.85517692565918, "global_step": 26313, "epoch": 217} {"train_loss": -31.439252853393555, "global_step": 26314, "epoch": 217} {"train_loss": -30.965713500976562, "global_step": 26315, "epoch": 217} {"train_loss": -30.9851131439209, "global_step": 26316, "epoch": 217} {"train_loss": -31.33420753479004, "global_step": 26317, "epoch": 217} {"train_loss": -31.886066436767578, "global_step": 26318, "epoch": 217} {"train_loss": -30.648054122924805, "global_step": 26319, "epoch": 217} {"train_loss": -31.383493423461914, "global_step": 26320, "epoch": 217} {"train_loss": -32.01301574707031, "global_step": 26321, "epoch": 217} {"train_loss": -31.283191680908203, "global_step": 26322, "epoch": 217} {"train_loss": -30.405364990234375, "global_step": 26323, "epoch": 217} {"train_loss": -31.983991622924805, "global_step": 26324, "epoch": 217} {"train_loss": -31.184293746948242, "global_step": 26325, "epoch": 217} {"train_loss": -31.8569393157959, "global_step": 26326, "epoch": 217} {"train_loss": -31.79109001159668, "global_step": 26327, "epoch": 217} {"train_loss": -31.846174240112305, "global_step": 26328, "epoch": 217} {"train_loss": -31.9141845703125, "global_step": 26329, "epoch": 217} {"train_loss": -31.685815811157227, "global_step": 26330, "epoch": 217} {"train_loss": -31.605573654174805, "global_step": 26331, "epoch": 217} {"train_loss": -30.817718505859375, "global_step": 26332, "epoch": 217} {"train_loss": -31.79020118713379, "global_step": 26333, "epoch": 217} {"train_loss": -31.813125610351562, "global_step": 26334, "epoch": 217} {"train_loss": -31.94105339050293, "global_step": 26335, "epoch": 217} {"train_loss": -31.872055053710938, "global_step": 26336, "epoch": 217} {"train_loss": -32.20103073120117, "global_step": 26337, "epoch": 217} {"train_loss": -32.232337951660156, "global_step": 26338, "epoch": 217} {"train_loss": -31.48649024963379, "global_step": 26339, "epoch": 217} {"train_loss": -31.896650314331055, "global_step": 26340, "epoch": 217} {"train_loss": -32.244808197021484, "global_step": 26341, "epoch": 217} {"train_loss": -32.180152893066406, "global_step": 26342, "epoch": 217} {"train_loss": -31.897480010986328, "global_step": 26343, "epoch": 217} {"train_loss": -31.71120262145996, "global_step": 26344, "epoch": 217} {"train_loss": -31.822187423706055, "global_step": 26345, "epoch": 217} {"train_loss": -32.18476486206055, "global_step": 26346, "epoch": 217} {"train_loss": -31.67026138305664, "global_step": 26347, "epoch": 217} {"train_loss": -32.250823974609375, "global_step": 26348, "epoch": 217} {"train_loss": -32.32725143432617, "global_step": 26349, "epoch": 217} {"train_loss": -32.00672912597656, "global_step": 26350, "epoch": 217} {"train_loss": -32.179771423339844, "global_step": 26351, "epoch": 217} {"train_loss": -31.938013076782227, "global_step": 26352, "epoch": 217} {"train_loss": -32.57615280151367, "global_step": 26353, "epoch": 217} {"train_loss": -32.353267669677734, "global_step": 26354, "epoch": 217} {"train_loss": -32.32513427734375, "global_step": 26355, "epoch": 217} {"train_loss": -30.83530616760254, "global_step": 26356, "epoch": 217} {"train_loss": -31.67637062072754, "global_step": 26357, "epoch": 217} {"train_loss": -31.356042861938477, "global_step": 26358, "epoch": 217} {"train_loss": -31.85662269592285, "global_step": 26359, "epoch": 217} {"train_loss": -32.570220947265625, "global_step": 26360, "epoch": 217} {"train_loss": -32.472991943359375, "global_step": 26361, "epoch": 217} {"train_loss": -31.79082679748535, "global_step": 26362, "epoch": 217} {"train_loss": -31.1675968170166, "global_step": 26363, "epoch": 217} {"train_loss": -32.225101470947266, "global_step": 26364, "epoch": 217} {"train_loss": -32.06838607788086, "global_step": 26365, "epoch": 217} {"train_loss": -31.700305938720703, "global_step": 26366, "epoch": 217} {"train_loss": -31.556745529174805, "global_step": 26367, "epoch": 217} {"train_loss": -30.495954513549805, "global_step": 26368, "epoch": 217} {"train_loss": -31.369583129882812, "global_step": 26369, "epoch": 217} {"train_loss": -31.381610870361328, "global_step": 26370, "epoch": 217} {"train_loss": -32.06547164916992, "global_step": 26371, "epoch": 217} {"train_loss": -31.424402236938477, "global_step": 26372, "epoch": 217} {"train_loss": -32.474246978759766, "global_step": 26373, "epoch": 217} {"train_loss": -31.49029541015625, "global_step": 26374, "epoch": 217} {"train_loss": -32.31764602661133, "global_step": 26375, "epoch": 217} {"train_loss": -32.21144485473633, "global_step": 26376, "epoch": 217} {"train_loss": -31.522566866283576, "global_step": 26377, "epoch": 217, "val_loss": 2464308.75} {"train_loss": -31.79737663269043, "global_step": 26378, "epoch": 218} {"train_loss": -31.58094596862793, "global_step": 26379, "epoch": 218} {"train_loss": -31.6571044921875, "global_step": 26380, "epoch": 218} {"train_loss": -32.00099182128906, "global_step": 26381, "epoch": 218} {"train_loss": -31.890167236328125, "global_step": 26382, "epoch": 218} {"train_loss": -32.367008209228516, "global_step": 26383, "epoch": 218} {"train_loss": -32.1942024230957, "global_step": 26384, "epoch": 218} {"train_loss": -32.196529388427734, "global_step": 26385, "epoch": 218} {"train_loss": -31.53877067565918, "global_step": 26386, "epoch": 218} {"train_loss": -31.46661376953125, "global_step": 26387, "epoch": 218} {"train_loss": -32.19723129272461, "global_step": 26388, "epoch": 218} {"train_loss": -32.318416595458984, "global_step": 26389, "epoch": 218} {"train_loss": -31.93732261657715, "global_step": 26390, "epoch": 218} {"train_loss": -30.935443878173828, "global_step": 26391, "epoch": 218} {"train_loss": -30.232385635375977, "global_step": 26392, "epoch": 218} {"train_loss": -31.580860137939453, "global_step": 26393, "epoch": 218} {"train_loss": -32.003719329833984, "global_step": 26394, "epoch": 218} {"train_loss": -31.26382827758789, "global_step": 26395, "epoch": 218} {"train_loss": -30.112369537353516, "global_step": 26396, "epoch": 218} {"train_loss": -30.172094345092773, "global_step": 26397, "epoch": 218} {"train_loss": -31.809316635131836, "global_step": 26398, "epoch": 218} {"train_loss": -31.908395767211914, "global_step": 26399, "epoch": 218} {"train_loss": -29.49936294555664, "global_step": 26400, "epoch": 218} {"train_loss": -26.822370529174805, "global_step": 26401, "epoch": 218} {"train_loss": -30.1978702545166, "global_step": 26402, "epoch": 218} {"train_loss": -29.978912353515625, "global_step": 26403, "epoch": 218} {"train_loss": -27.469547271728516, "global_step": 26404, "epoch": 218} {"train_loss": -29.79448890686035, "global_step": 26405, "epoch": 218} {"train_loss": -29.84906005859375, "global_step": 26406, "epoch": 218} {"train_loss": -28.58841896057129, "global_step": 26407, "epoch": 218} {"train_loss": -30.502552032470703, "global_step": 26408, "epoch": 218} {"train_loss": -28.869171142578125, "global_step": 26409, "epoch": 218} {"train_loss": -30.715124130249023, "global_step": 26410, "epoch": 218} {"train_loss": -30.4992618560791, "global_step": 26411, "epoch": 218} {"train_loss": -32.06852340698242, "global_step": 26412, "epoch": 218} {"train_loss": -30.655963897705078, "global_step": 26413, "epoch": 218} {"train_loss": -31.13116455078125, "global_step": 26414, "epoch": 218} {"train_loss": -31.360538482666016, "global_step": 26415, "epoch": 218} {"train_loss": -31.363428115844727, "global_step": 26416, "epoch": 218} {"train_loss": -30.539081573486328, "global_step": 26417, "epoch": 218} {"train_loss": -31.901517868041992, "global_step": 26418, "epoch": 218} {"train_loss": -30.657135009765625, "global_step": 26419, "epoch": 218} {"train_loss": -31.808349609375, "global_step": 26420, "epoch": 218} {"train_loss": -31.539026260375977, "global_step": 26421, "epoch": 218} {"train_loss": -31.8798770904541, "global_step": 26422, "epoch": 218} {"train_loss": -31.33112907409668, "global_step": 26423, "epoch": 218} {"train_loss": -31.81330680847168, "global_step": 26424, "epoch": 218} {"train_loss": -31.722227096557617, "global_step": 26425, "epoch": 218} {"train_loss": -31.860136032104492, "global_step": 26426, "epoch": 218} {"train_loss": -31.486785888671875, "global_step": 26427, "epoch": 218} {"train_loss": -32.11785125732422, "global_step": 26428, "epoch": 218} {"train_loss": -31.829336166381836, "global_step": 26429, "epoch": 218} {"train_loss": -32.05241775512695, "global_step": 26430, "epoch": 218} {"train_loss": -31.91156005859375, "global_step": 26431, "epoch": 218} {"train_loss": -31.849233627319336, "global_step": 26432, "epoch": 218} {"train_loss": -32.11385726928711, "global_step": 26433, "epoch": 218} {"train_loss": -32.38545608520508, "global_step": 26434, "epoch": 218} {"train_loss": -32.20377731323242, "global_step": 26435, "epoch": 218} {"train_loss": -32.09779739379883, "global_step": 26436, "epoch": 218} {"train_loss": -32.2509880065918, "global_step": 26437, "epoch": 218} {"train_loss": -32.17448425292969, "global_step": 26438, "epoch": 218} {"train_loss": -32.30641174316406, "global_step": 26439, "epoch": 218} {"train_loss": -32.13224411010742, "global_step": 26440, "epoch": 218} {"train_loss": -32.67169189453125, "global_step": 26441, "epoch": 218} {"train_loss": -32.33343505859375, "global_step": 26442, "epoch": 218} {"train_loss": -32.2235221862793, "global_step": 26443, "epoch": 218} {"train_loss": -32.20632553100586, "global_step": 26444, "epoch": 218} {"train_loss": -32.10737609863281, "global_step": 26445, "epoch": 218} {"train_loss": -32.19746017456055, "global_step": 26446, "epoch": 218} {"train_loss": -32.26350021362305, "global_step": 26447, "epoch": 218} {"train_loss": -32.05035400390625, "global_step": 26448, "epoch": 218} {"train_loss": -31.912195205688477, "global_step": 26449, "epoch": 218} {"train_loss": -32.55516052246094, "global_step": 26450, "epoch": 218} {"train_loss": -31.5846004486084, "global_step": 26451, "epoch": 218} {"train_loss": -32.00400924682617, "global_step": 26452, "epoch": 218} {"train_loss": -32.447486877441406, "global_step": 26453, "epoch": 218} {"train_loss": -32.036476135253906, "global_step": 26454, "epoch": 218} {"train_loss": -32.14763259887695, "global_step": 26455, "epoch": 218} {"train_loss": -32.25291061401367, "global_step": 26456, "epoch": 218} {"train_loss": -32.00447463989258, "global_step": 26457, "epoch": 218} {"train_loss": -31.826923370361328, "global_step": 26458, "epoch": 218} {"train_loss": -31.854084014892578, "global_step": 26459, "epoch": 218} {"train_loss": -32.25163650512695, "global_step": 26460, "epoch": 218} {"train_loss": -31.63981056213379, "global_step": 26461, "epoch": 218} {"train_loss": -31.07671546936035, "global_step": 26462, "epoch": 218} {"train_loss": -31.22028160095215, "global_step": 26463, "epoch": 218} {"train_loss": -31.161230087280273, "global_step": 26464, "epoch": 218} {"train_loss": -32.45756149291992, "global_step": 26465, "epoch": 218} {"train_loss": -31.4432430267334, "global_step": 26466, "epoch": 218} {"train_loss": -32.072505950927734, "global_step": 26467, "epoch": 218} {"train_loss": -31.86688804626465, "global_step": 26468, "epoch": 218} {"train_loss": -30.565885543823242, "global_step": 26469, "epoch": 218} {"train_loss": -30.238922119140625, "global_step": 26470, "epoch": 218} {"train_loss": -30.40607261657715, "global_step": 26471, "epoch": 218} {"train_loss": -31.483722686767578, "global_step": 26472, "epoch": 218} {"train_loss": -32.00233840942383, "global_step": 26473, "epoch": 218} {"train_loss": -30.893909454345703, "global_step": 26474, "epoch": 218} {"train_loss": -30.549665451049805, "global_step": 26475, "epoch": 218} {"train_loss": -30.136728286743164, "global_step": 26476, "epoch": 218} {"train_loss": -32.1817512512207, "global_step": 26477, "epoch": 218} {"train_loss": -32.01746368408203, "global_step": 26478, "epoch": 218} {"train_loss": -30.6301326751709, "global_step": 26479, "epoch": 218} {"train_loss": -32.62778854370117, "global_step": 26480, "epoch": 218} {"train_loss": -31.153493881225586, "global_step": 26481, "epoch": 218} {"train_loss": -30.000415802001953, "global_step": 26482, "epoch": 218} {"train_loss": -32.41978073120117, "global_step": 26483, "epoch": 218} {"train_loss": -30.4654598236084, "global_step": 26484, "epoch": 218} {"train_loss": -32.33856201171875, "global_step": 26485, "epoch": 218} {"train_loss": -31.272174835205078, "global_step": 26486, "epoch": 218} {"train_loss": -30.407928466796875, "global_step": 26487, "epoch": 218} {"train_loss": -31.454608917236328, "global_step": 26488, "epoch": 218} {"train_loss": -30.333066940307617, "global_step": 26489, "epoch": 218} {"train_loss": -31.907550811767578, "global_step": 26490, "epoch": 218} {"train_loss": -30.606611251831055, "global_step": 26491, "epoch": 218} {"train_loss": -31.45524024963379, "global_step": 26492, "epoch": 218} {"train_loss": -31.413837432861328, "global_step": 26493, "epoch": 218} {"train_loss": -31.691267013549805, "global_step": 26494, "epoch": 218} {"train_loss": -31.568307876586914, "global_step": 26495, "epoch": 218} {"train_loss": -31.494619369506836, "global_step": 26496, "epoch": 218} {"train_loss": -31.8064022064209, "global_step": 26497, "epoch": 218} {"train_loss": -31.419133005063397, "global_step": 26498, "epoch": 218, "val_loss": 2412970.25} {"train_loss": -31.25691795349121, "global_step": 26499, "epoch": 219} {"train_loss": -31.30109977722168, "global_step": 26500, "epoch": 219} {"train_loss": -31.01124382019043, "global_step": 26501, "epoch": 219} {"train_loss": -31.20026206970215, "global_step": 26502, "epoch": 219} {"train_loss": -30.71807861328125, "global_step": 26503, "epoch": 219} {"train_loss": -30.726293563842773, "global_step": 26504, "epoch": 219} {"train_loss": -30.653772354125977, "global_step": 26505, "epoch": 219} {"train_loss": -30.092126846313477, "global_step": 26506, "epoch": 219} {"train_loss": -30.777027130126953, "global_step": 26507, "epoch": 219} {"train_loss": -30.751630783081055, "global_step": 26508, "epoch": 219} {"train_loss": -30.185407638549805, "global_step": 26509, "epoch": 219} {"train_loss": -29.103473663330078, "global_step": 26510, "epoch": 219} {"train_loss": -30.005334854125977, "global_step": 26511, "epoch": 219} {"train_loss": -31.595884323120117, "global_step": 26512, "epoch": 219} {"train_loss": -30.5808162689209, "global_step": 26513, "epoch": 219} {"train_loss": -28.275054931640625, "global_step": 26514, "epoch": 219} {"train_loss": -29.927343368530273, "global_step": 26515, "epoch": 219} {"train_loss": -31.772113800048828, "global_step": 26516, "epoch": 219} {"train_loss": -30.324384689331055, "global_step": 26517, "epoch": 219} {"train_loss": -28.361631393432617, "global_step": 26518, "epoch": 219} {"train_loss": -30.57439613342285, "global_step": 26519, "epoch": 219} {"train_loss": -28.712560653686523, "global_step": 26520, "epoch": 219} {"train_loss": -29.639759063720703, "global_step": 26521, "epoch": 219} {"train_loss": -31.640247344970703, "global_step": 26522, "epoch": 219} {"train_loss": -30.118803024291992, "global_step": 26523, "epoch": 219} {"train_loss": -31.574356079101562, "global_step": 26524, "epoch": 219} {"train_loss": -30.59734535217285, "global_step": 26525, "epoch": 219} {"train_loss": -31.75067710876465, "global_step": 26526, "epoch": 219} {"train_loss": -30.79422378540039, "global_step": 26527, "epoch": 219} {"train_loss": -31.124908447265625, "global_step": 26528, "epoch": 219} {"train_loss": -31.4080867767334, "global_step": 26529, "epoch": 219} {"train_loss": -31.15867042541504, "global_step": 26530, "epoch": 219} {"train_loss": -32.1705207824707, "global_step": 26531, "epoch": 219} {"train_loss": -31.16375160217285, "global_step": 26532, "epoch": 219} {"train_loss": -31.887836456298828, "global_step": 26533, "epoch": 219} {"train_loss": -31.688901901245117, "global_step": 26534, "epoch": 219} {"train_loss": -31.680322647094727, "global_step": 26535, "epoch": 219} {"train_loss": -32.0866813659668, "global_step": 26536, "epoch": 219} {"train_loss": -31.129907608032227, "global_step": 26537, "epoch": 219} {"train_loss": -31.414031982421875, "global_step": 26538, "epoch": 219} {"train_loss": -31.96713638305664, "global_step": 26539, "epoch": 219} {"train_loss": -31.5999813079834, "global_step": 26540, "epoch": 219} {"train_loss": -31.8138484954834, "global_step": 26541, "epoch": 219} {"train_loss": -32.38056182861328, "global_step": 26542, "epoch": 219} {"train_loss": -31.78704833984375, "global_step": 26543, "epoch": 219} {"train_loss": -32.11780548095703, "global_step": 26544, "epoch": 219} {"train_loss": -32.175907135009766, "global_step": 26545, "epoch": 219} {"train_loss": -32.05697250366211, "global_step": 26546, "epoch": 219} {"train_loss": -32.14543914794922, "global_step": 26547, "epoch": 219} {"train_loss": -32.1594352722168, "global_step": 26548, "epoch": 219} {"train_loss": -32.096885681152344, "global_step": 26549, "epoch": 219} {"train_loss": -32.48063278198242, "global_step": 26550, "epoch": 219} {"train_loss": -32.118019104003906, "global_step": 26551, "epoch": 219} {"train_loss": -31.754657745361328, "global_step": 26552, "epoch": 219} {"train_loss": -32.21312713623047, "global_step": 26553, "epoch": 219} {"train_loss": -32.27006912231445, "global_step": 26554, "epoch": 219} {"train_loss": -31.861913681030273, "global_step": 26555, "epoch": 219} {"train_loss": -31.307416915893555, "global_step": 26556, "epoch": 219} {"train_loss": -31.8612117767334, "global_step": 26557, "epoch": 219} {"train_loss": -31.33172035217285, "global_step": 26558, "epoch": 219} {"train_loss": -32.28994369506836, "global_step": 26559, "epoch": 219} {"train_loss": -30.640722274780273, "global_step": 26560, "epoch": 219} {"train_loss": -32.15139389038086, "global_step": 26561, "epoch": 219} {"train_loss": -31.62809181213379, "global_step": 26562, "epoch": 219} {"train_loss": -31.588272094726562, "global_step": 26563, "epoch": 219} {"train_loss": -32.35244369506836, "global_step": 26564, "epoch": 219} {"train_loss": -31.575164794921875, "global_step": 26565, "epoch": 219} {"train_loss": -32.04909896850586, "global_step": 26566, "epoch": 219} {"train_loss": -31.92144775390625, "global_step": 26567, "epoch": 219} {"train_loss": -32.41520309448242, "global_step": 26568, "epoch": 219} {"train_loss": -32.08130645751953, "global_step": 26569, "epoch": 219} {"train_loss": -32.076969146728516, "global_step": 26570, "epoch": 219} {"train_loss": -31.683202743530273, "global_step": 26571, "epoch": 219} {"train_loss": -32.5315055847168, "global_step": 26572, "epoch": 219} {"train_loss": -32.27273941040039, "global_step": 26573, "epoch": 219} {"train_loss": -32.196346282958984, "global_step": 26574, "epoch": 219} {"train_loss": -32.33826446533203, "global_step": 26575, "epoch": 219} {"train_loss": -32.577308654785156, "global_step": 26576, "epoch": 219} {"train_loss": -32.497615814208984, "global_step": 26577, "epoch": 219} {"train_loss": -32.573726654052734, "global_step": 26578, "epoch": 219} {"train_loss": -32.4579963684082, "global_step": 26579, "epoch": 219} {"train_loss": -32.025264739990234, "global_step": 26580, "epoch": 219} {"train_loss": -31.6691837310791, "global_step": 26581, "epoch": 219} {"train_loss": -28.789554595947266, "global_step": 26582, "epoch": 219} {"train_loss": -21.984342575073242, "global_step": 26583, "epoch": 219} {"train_loss": -31.69904899597168, "global_step": 26584, "epoch": 219} {"train_loss": -24.984060287475586, "global_step": 26585, "epoch": 219} {"train_loss": -22.916534423828125, "global_step": 26586, "epoch": 219} {"train_loss": -25.10154914855957, "global_step": 26587, "epoch": 219} {"train_loss": -21.0595703125, "global_step": 26588, "epoch": 219} {"train_loss": -20.026647567749023, "global_step": 26589, "epoch": 219} {"train_loss": -25.076169967651367, "global_step": 26590, "epoch": 219} {"train_loss": -20.802453994750977, "global_step": 26591, "epoch": 219} {"train_loss": -25.905441284179688, "global_step": 26592, "epoch": 219} {"train_loss": -23.02198028564453, "global_step": 26593, "epoch": 219} {"train_loss": -28.572046279907227, "global_step": 26594, "epoch": 219} {"train_loss": -28.952850341796875, "global_step": 26595, "epoch": 219} {"train_loss": -24.22052574157715, "global_step": 26596, "epoch": 219} {"train_loss": -29.121732711791992, "global_step": 26597, "epoch": 219} {"train_loss": -30.137495040893555, "global_step": 26598, "epoch": 219} {"train_loss": -29.319650650024414, "global_step": 26599, "epoch": 219} {"train_loss": -29.67626953125, "global_step": 26600, "epoch": 219} {"train_loss": -28.113187789916992, "global_step": 26601, "epoch": 219} {"train_loss": -30.268890380859375, "global_step": 26602, "epoch": 219} {"train_loss": -29.75811195373535, "global_step": 26603, "epoch": 219} {"train_loss": -31.04150390625, "global_step": 26604, "epoch": 219} {"train_loss": -29.706928253173828, "global_step": 26605, "epoch": 219} {"train_loss": -30.3751277923584, "global_step": 26606, "epoch": 219} {"train_loss": -30.33180046081543, "global_step": 26607, "epoch": 219} {"train_loss": -30.771717071533203, "global_step": 26608, "epoch": 219} {"train_loss": -30.82753562927246, "global_step": 26609, "epoch": 219} {"train_loss": -30.787918090820312, "global_step": 26610, "epoch": 219} {"train_loss": -30.694534301757812, "global_step": 26611, "epoch": 219} {"train_loss": -30.45005226135254, "global_step": 26612, "epoch": 219} {"train_loss": -30.94293785095215, "global_step": 26613, "epoch": 219} {"train_loss": -31.032215118408203, "global_step": 26614, "epoch": 219} {"train_loss": -31.00770378112793, "global_step": 26615, "epoch": 219} {"train_loss": -30.70345115661621, "global_step": 26616, "epoch": 219} {"train_loss": -30.824146270751953, "global_step": 26617, "epoch": 219} {"train_loss": -31.0938663482666, "global_step": 26618, "epoch": 219} {"train_loss": -30.403355259540653, "global_step": 26619, "epoch": 219, "val_loss": 2479977.75} {"train_loss": -30.685766220092773, "global_step": 26620, "epoch": 220} {"train_loss": -31.073230743408203, "global_step": 26621, "epoch": 220} {"train_loss": -31.367971420288086, "global_step": 26622, "epoch": 220} {"train_loss": -31.106021881103516, "global_step": 26623, "epoch": 220} {"train_loss": -30.958154678344727, "global_step": 26624, "epoch": 220} {"train_loss": -31.336713790893555, "global_step": 26625, "epoch": 220} {"train_loss": -31.019922256469727, "global_step": 26626, "epoch": 220} {"train_loss": -31.258258819580078, "global_step": 26627, "epoch": 220} {"train_loss": -30.967151641845703, "global_step": 26628, "epoch": 220} {"train_loss": -31.61988639831543, "global_step": 26629, "epoch": 220} {"train_loss": -31.53607177734375, "global_step": 26630, "epoch": 220} {"train_loss": -31.4352970123291, "global_step": 26631, "epoch": 220} {"train_loss": -31.69683265686035, "global_step": 26632, "epoch": 220} {"train_loss": -31.736867904663086, "global_step": 26633, "epoch": 220} {"train_loss": -31.548208236694336, "global_step": 26634, "epoch": 220} {"train_loss": -31.404478073120117, "global_step": 26635, "epoch": 220} {"train_loss": -31.5281982421875, "global_step": 26636, "epoch": 220} {"train_loss": -31.691198348999023, "global_step": 26637, "epoch": 220} {"train_loss": -31.708698272705078, "global_step": 26638, "epoch": 220} {"train_loss": -31.317331314086914, "global_step": 26639, "epoch": 220} {"train_loss": -31.363271713256836, "global_step": 26640, "epoch": 220} {"train_loss": -30.985754013061523, "global_step": 26641, "epoch": 220} {"train_loss": -31.672210693359375, "global_step": 26642, "epoch": 220} {"train_loss": -31.97955322265625, "global_step": 26643, "epoch": 220} {"train_loss": -31.645679473876953, "global_step": 26644, "epoch": 220} {"train_loss": -31.298236846923828, "global_step": 26645, "epoch": 220} {"train_loss": -31.912240982055664, "global_step": 26646, "epoch": 220} {"train_loss": -31.305448532104492, "global_step": 26647, "epoch": 220} {"train_loss": -31.545190811157227, "global_step": 26648, "epoch": 220} {"train_loss": -31.6257381439209, "global_step": 26649, "epoch": 220} {"train_loss": -31.51930046081543, "global_step": 26650, "epoch": 220} {"train_loss": -31.24253273010254, "global_step": 26651, "epoch": 220} {"train_loss": -30.955062866210938, "global_step": 26652, "epoch": 220} {"train_loss": -30.063390731811523, "global_step": 26653, "epoch": 220} {"train_loss": -28.936193466186523, "global_step": 26654, "epoch": 220} {"train_loss": -27.026779174804688, "global_step": 26655, "epoch": 220} {"train_loss": -24.48017692565918, "global_step": 26656, "epoch": 220} {"train_loss": -21.784692764282227, "global_step": 26657, "epoch": 220} {"train_loss": -26.361547470092773, "global_step": 26658, "epoch": 220} {"train_loss": -25.83284568786621, "global_step": 26659, "epoch": 220} {"train_loss": -26.863910675048828, "global_step": 26660, "epoch": 220} {"train_loss": -29.041675567626953, "global_step": 26661, "epoch": 220} {"train_loss": -27.626379013061523, "global_step": 26662, "epoch": 220} {"train_loss": -29.575641632080078, "global_step": 26663, "epoch": 220} {"train_loss": -26.911396026611328, "global_step": 26664, "epoch": 220} {"train_loss": -30.780675888061523, "global_step": 26665, "epoch": 220} {"train_loss": -29.461523056030273, "global_step": 26666, "epoch": 220} {"train_loss": -28.087982177734375, "global_step": 26667, "epoch": 220} {"train_loss": -30.8670654296875, "global_step": 26668, "epoch": 220} {"train_loss": -30.512121200561523, "global_step": 26669, "epoch": 220} {"train_loss": -30.611663818359375, "global_step": 26670, "epoch": 220} {"train_loss": -29.876739501953125, "global_step": 26671, "epoch": 220} {"train_loss": -29.952280044555664, "global_step": 26672, "epoch": 220} {"train_loss": -30.15540885925293, "global_step": 26673, "epoch": 220} {"train_loss": -31.10869789123535, "global_step": 26674, "epoch": 220} {"train_loss": -31.22003746032715, "global_step": 26675, "epoch": 220} {"train_loss": -30.964643478393555, "global_step": 26676, "epoch": 220} {"train_loss": -31.021240234375, "global_step": 26677, "epoch": 220} {"train_loss": -30.389251708984375, "global_step": 26678, "epoch": 220} {"train_loss": -30.543344497680664, "global_step": 26679, "epoch": 220} {"train_loss": -30.726688385009766, "global_step": 26680, "epoch": 220} {"train_loss": -30.644245147705078, "global_step": 26681, "epoch": 220} {"train_loss": -30.837589263916016, "global_step": 26682, "epoch": 220} {"train_loss": -31.118183135986328, "global_step": 26683, "epoch": 220} {"train_loss": -30.9685001373291, "global_step": 26684, "epoch": 220} {"train_loss": -31.40497398376465, "global_step": 26685, "epoch": 220} {"train_loss": -30.6787166595459, "global_step": 26686, "epoch": 220} {"train_loss": -30.617725372314453, "global_step": 26687, "epoch": 220} {"train_loss": -30.970182418823242, "global_step": 26688, "epoch": 220} {"train_loss": -29.60662841796875, "global_step": 26689, "epoch": 220} {"train_loss": -31.282148361206055, "global_step": 26690, "epoch": 220} {"train_loss": -28.771041870117188, "global_step": 26691, "epoch": 220} {"train_loss": -31.330276489257812, "global_step": 26692, "epoch": 220} {"train_loss": -29.940046310424805, "global_step": 26693, "epoch": 220} {"train_loss": -31.577743530273438, "global_step": 26694, "epoch": 220} {"train_loss": -29.711862564086914, "global_step": 26695, "epoch": 220} {"train_loss": -31.258670806884766, "global_step": 26696, "epoch": 220} {"train_loss": -30.548389434814453, "global_step": 26697, "epoch": 220} {"train_loss": -30.929956436157227, "global_step": 26698, "epoch": 220} {"train_loss": -31.215473175048828, "global_step": 26699, "epoch": 220} {"train_loss": -30.820281982421875, "global_step": 26700, "epoch": 220} {"train_loss": -31.292688369750977, "global_step": 26701, "epoch": 220} {"train_loss": -31.00702476501465, "global_step": 26702, "epoch": 220} {"train_loss": -31.622699737548828, "global_step": 26703, "epoch": 220} {"train_loss": -31.249494552612305, "global_step": 26704, "epoch": 220} {"train_loss": -30.734689712524414, "global_step": 26705, "epoch": 220} {"train_loss": -31.0114803314209, "global_step": 26706, "epoch": 220} {"train_loss": -31.502826690673828, "global_step": 26707, "epoch": 220} {"train_loss": -30.856794357299805, "global_step": 26708, "epoch": 220} {"train_loss": -31.464746475219727, "global_step": 26709, "epoch": 220} {"train_loss": -31.845060348510742, "global_step": 26710, "epoch": 220} {"train_loss": -31.1502685546875, "global_step": 26711, "epoch": 220} {"train_loss": -31.232519149780273, "global_step": 26712, "epoch": 220} {"train_loss": -31.36859703063965, "global_step": 26713, "epoch": 220} {"train_loss": -31.852365493774414, "global_step": 26714, "epoch": 220} {"train_loss": -31.792774200439453, "global_step": 26715, "epoch": 220} {"train_loss": -31.184158325195312, "global_step": 26716, "epoch": 220} {"train_loss": -31.442792892456055, "global_step": 26717, "epoch": 220} {"train_loss": -30.30796241760254, "global_step": 26718, "epoch": 220} {"train_loss": -30.685964584350586, "global_step": 26719, "epoch": 220} {"train_loss": -30.732336044311523, "global_step": 26720, "epoch": 220} {"train_loss": -31.280303955078125, "global_step": 26721, "epoch": 220} {"train_loss": -31.794279098510742, "global_step": 26722, "epoch": 220} {"train_loss": -31.64277458190918, "global_step": 26723, "epoch": 220} {"train_loss": -31.585973739624023, "global_step": 26724, "epoch": 220} {"train_loss": -31.91790199279785, "global_step": 26725, "epoch": 220} {"train_loss": -31.448144912719727, "global_step": 26726, "epoch": 220} {"train_loss": -31.682178497314453, "global_step": 26727, "epoch": 220} {"train_loss": -30.934757232666016, "global_step": 26728, "epoch": 220} {"train_loss": -31.395273208618164, "global_step": 26729, "epoch": 220} {"train_loss": -31.740259170532227, "global_step": 26730, "epoch": 220} {"train_loss": -29.532297134399414, "global_step": 26731, "epoch": 220} {"train_loss": -27.59100341796875, "global_step": 26732, "epoch": 220} {"train_loss": -25.681360244750977, "global_step": 26733, "epoch": 220} {"train_loss": -28.16526222229004, "global_step": 26734, "epoch": 220} {"train_loss": -31.11516761779785, "global_step": 26735, "epoch": 220} {"train_loss": -31.16945457458496, "global_step": 26736, "epoch": 220} {"train_loss": -30.60694694519043, "global_step": 26737, "epoch": 220} {"train_loss": -31.72230339050293, "global_step": 26738, "epoch": 220} {"train_loss": -31.54851722717285, "global_step": 26739, "epoch": 220} {"train_loss": -30.57374938460421, "global_step": 26740, "epoch": 220, "val_loss": 2549117.75} {"train_loss": -31.069751739501953, "global_step": 26741, "epoch": 221} {"train_loss": -31.16822624206543, "global_step": 26742, "epoch": 221} {"train_loss": -31.487567901611328, "global_step": 26743, "epoch": 221} {"train_loss": -31.818042755126953, "global_step": 26744, "epoch": 221} {"train_loss": -31.41326332092285, "global_step": 26745, "epoch": 221} {"train_loss": -31.52471351623535, "global_step": 26746, "epoch": 221} {"train_loss": -31.651700973510742, "global_step": 26747, "epoch": 221} {"train_loss": -31.665815353393555, "global_step": 26748, "epoch": 221} {"train_loss": -31.771224975585938, "global_step": 26749, "epoch": 221} {"train_loss": -31.9544734954834, "global_step": 26750, "epoch": 221} {"train_loss": -31.773900985717773, "global_step": 26751, "epoch": 221} {"train_loss": -31.925556182861328, "global_step": 26752, "epoch": 221} {"train_loss": -31.603607177734375, "global_step": 26753, "epoch": 221} {"train_loss": -32.00492477416992, "global_step": 26754, "epoch": 221} {"train_loss": -31.9355411529541, "global_step": 26755, "epoch": 221} {"train_loss": -32.125911712646484, "global_step": 26756, "epoch": 221} {"train_loss": -31.94312858581543, "global_step": 26757, "epoch": 221} {"train_loss": -32.05341720581055, "global_step": 26758, "epoch": 221} {"train_loss": -31.8763427734375, "global_step": 26759, "epoch": 221} {"train_loss": -32.057247161865234, "global_step": 26760, "epoch": 221} {"train_loss": -32.34796905517578, "global_step": 26761, "epoch": 221} {"train_loss": -31.92789077758789, "global_step": 26762, "epoch": 221} {"train_loss": -32.291259765625, "global_step": 26763, "epoch": 221} {"train_loss": -32.09638214111328, "global_step": 26764, "epoch": 221} {"train_loss": -32.440921783447266, "global_step": 26765, "epoch": 221} {"train_loss": -32.56217575073242, "global_step": 26766, "epoch": 221} {"train_loss": -32.18185043334961, "global_step": 26767, "epoch": 221} {"train_loss": -32.47834396362305, "global_step": 26768, "epoch": 221} {"train_loss": -32.55474853515625, "global_step": 26769, "epoch": 221} {"train_loss": -32.72843551635742, "global_step": 26770, "epoch": 221} {"train_loss": -32.22550582885742, "global_step": 26771, "epoch": 221} {"train_loss": -32.720947265625, "global_step": 26772, "epoch": 221} {"train_loss": -32.44558334350586, "global_step": 26773, "epoch": 221} {"train_loss": -32.30826950073242, "global_step": 26774, "epoch": 221} {"train_loss": -32.46482849121094, "global_step": 26775, "epoch": 221} {"train_loss": -32.20127487182617, "global_step": 26776, "epoch": 221} {"train_loss": -32.07745361328125, "global_step": 26777, "epoch": 221} {"train_loss": -32.74262619018555, "global_step": 26778, "epoch": 221} {"train_loss": -32.518707275390625, "global_step": 26779, "epoch": 221} {"train_loss": -32.12490463256836, "global_step": 26780, "epoch": 221} {"train_loss": -32.49137878417969, "global_step": 26781, "epoch": 221} {"train_loss": -32.632877349853516, "global_step": 26782, "epoch": 221} {"train_loss": -32.344139099121094, "global_step": 26783, "epoch": 221} {"train_loss": -32.35649108886719, "global_step": 26784, "epoch": 221} {"train_loss": -31.975055694580078, "global_step": 26785, "epoch": 221} {"train_loss": -32.1099967956543, "global_step": 26786, "epoch": 221} {"train_loss": -32.39675521850586, "global_step": 26787, "epoch": 221} {"train_loss": -32.364498138427734, "global_step": 26788, "epoch": 221} {"train_loss": -32.51777267456055, "global_step": 26789, "epoch": 221} {"train_loss": -32.38047409057617, "global_step": 26790, "epoch": 221} {"train_loss": -31.916492462158203, "global_step": 26791, "epoch": 221} {"train_loss": -31.680313110351562, "global_step": 26792, "epoch": 221} {"train_loss": -30.91472816467285, "global_step": 26793, "epoch": 221} {"train_loss": -29.785709381103516, "global_step": 26794, "epoch": 221} {"train_loss": -27.610034942626953, "global_step": 26795, "epoch": 221} {"train_loss": -19.852659225463867, "global_step": 26796, "epoch": 221} {"train_loss": -31.832202911376953, "global_step": 26797, "epoch": 221} {"train_loss": -27.863555908203125, "global_step": 26798, "epoch": 221} {"train_loss": -25.18599510192871, "global_step": 26799, "epoch": 221} {"train_loss": -32.07417297363281, "global_step": 26800, "epoch": 221} {"train_loss": -28.64080810546875, "global_step": 26801, "epoch": 221} {"train_loss": -31.23029136657715, "global_step": 26802, "epoch": 221} {"train_loss": -29.624753952026367, "global_step": 26803, "epoch": 221} {"train_loss": -32.019630432128906, "global_step": 26804, "epoch": 221} {"train_loss": -29.78028678894043, "global_step": 26805, "epoch": 221} {"train_loss": -31.777196884155273, "global_step": 26806, "epoch": 221} {"train_loss": -31.095508575439453, "global_step": 26807, "epoch": 221} {"train_loss": -31.27821922302246, "global_step": 26808, "epoch": 221} {"train_loss": -32.06402587890625, "global_step": 26809, "epoch": 221} {"train_loss": -31.381540298461914, "global_step": 26810, "epoch": 221} {"train_loss": -31.39865493774414, "global_step": 26811, "epoch": 221} {"train_loss": -32.3061408996582, "global_step": 26812, "epoch": 221} {"train_loss": -31.79426383972168, "global_step": 26813, "epoch": 221} {"train_loss": -31.56023597717285, "global_step": 26814, "epoch": 221} {"train_loss": -32.01017379760742, "global_step": 26815, "epoch": 221} {"train_loss": -31.60222816467285, "global_step": 26816, "epoch": 221} {"train_loss": -32.1049690246582, "global_step": 26817, "epoch": 221} {"train_loss": -32.25681686401367, "global_step": 26818, "epoch": 221} {"train_loss": -32.23264694213867, "global_step": 26819, "epoch": 221} {"train_loss": -32.249019622802734, "global_step": 26820, "epoch": 221} {"train_loss": -32.0973014831543, "global_step": 26821, "epoch": 221} {"train_loss": -32.06284713745117, "global_step": 26822, "epoch": 221} {"train_loss": -32.16145706176758, "global_step": 26823, "epoch": 221} {"train_loss": -32.277183532714844, "global_step": 26824, "epoch": 221} {"train_loss": -32.54326629638672, "global_step": 26825, "epoch": 221} {"train_loss": -32.548614501953125, "global_step": 26826, "epoch": 221} {"train_loss": -30.90753746032715, "global_step": 26827, "epoch": 221} {"train_loss": -26.848520278930664, "global_step": 26828, "epoch": 221} {"train_loss": -20.09141731262207, "global_step": 26829, "epoch": 221} {"train_loss": -11.827548027038574, "global_step": 26830, "epoch": 221} {"train_loss": -29.257404327392578, "global_step": 26831, "epoch": 221} {"train_loss": -9.340102195739746, "global_step": 26832, "epoch": 221} {"train_loss": -26.25592613220215, "global_step": 26833, "epoch": 221} {"train_loss": -19.8262996673584, "global_step": 26834, "epoch": 221} {"train_loss": -28.341205596923828, "global_step": 26835, "epoch": 221} {"train_loss": -24.00583839416504, "global_step": 26836, "epoch": 221} {"train_loss": -27.337202072143555, "global_step": 26837, "epoch": 221} {"train_loss": -28.032140731811523, "global_step": 26838, "epoch": 221} {"train_loss": -25.950117111206055, "global_step": 26839, "epoch": 221} {"train_loss": -28.94098472595215, "global_step": 26840, "epoch": 221} {"train_loss": -29.551532745361328, "global_step": 26841, "epoch": 221} {"train_loss": -27.990650177001953, "global_step": 26842, "epoch": 221} {"train_loss": -28.711883544921875, "global_step": 26843, "epoch": 221} {"train_loss": -29.476232528686523, "global_step": 26844, "epoch": 221} {"train_loss": -29.7161922454834, "global_step": 26845, "epoch": 221} {"train_loss": -29.691211700439453, "global_step": 26846, "epoch": 221} {"train_loss": -28.85369300842285, "global_step": 26847, "epoch": 221} {"train_loss": -29.329742431640625, "global_step": 26848, "epoch": 221} {"train_loss": -30.084705352783203, "global_step": 26849, "epoch": 221} {"train_loss": -30.10468101501465, "global_step": 26850, "epoch": 221} {"train_loss": -30.016162872314453, "global_step": 26851, "epoch": 221} {"train_loss": -29.877368927001953, "global_step": 26852, "epoch": 221} {"train_loss": -29.734420776367188, "global_step": 26853, "epoch": 221} {"train_loss": -29.876798629760742, "global_step": 26854, "epoch": 221} {"train_loss": -30.12947654724121, "global_step": 26855, "epoch": 221} {"train_loss": -30.227313995361328, "global_step": 26856, "epoch": 221} {"train_loss": -30.255451202392578, "global_step": 26857, "epoch": 221} {"train_loss": -30.131994247436523, "global_step": 26858, "epoch": 221} {"train_loss": -30.582263946533203, "global_step": 26859, "epoch": 221} {"train_loss": -30.139453887939453, "global_step": 26860, "epoch": 221} {"train_loss": -30.401281908523938, "global_step": 26861, "epoch": 221, "val_loss": 2725318.25} {"train_loss": -30.595539093017578, "global_step": 26862, "epoch": 222} {"train_loss": -30.99213218688965, "global_step": 26863, "epoch": 222} {"train_loss": -30.947534561157227, "global_step": 26864, "epoch": 222} {"train_loss": -31.09149169921875, "global_step": 26865, "epoch": 222} {"train_loss": -30.97022819519043, "global_step": 26866, "epoch": 222} {"train_loss": -30.993667602539062, "global_step": 26867, "epoch": 222} {"train_loss": -30.73369789123535, "global_step": 26868, "epoch": 222} {"train_loss": -30.667633056640625, "global_step": 26869, "epoch": 222} {"train_loss": -30.693893432617188, "global_step": 26870, "epoch": 222} {"train_loss": -30.20273208618164, "global_step": 26871, "epoch": 222} {"train_loss": -28.475711822509766, "global_step": 26872, "epoch": 222} {"train_loss": -21.422561645507812, "global_step": 26873, "epoch": 222} {"train_loss": -0.6512851715087891, "global_step": 26874, "epoch": 222} {"train_loss": 7.398863315582275, "global_step": 26875, "epoch": 222} {"train_loss": -30.553308486938477, "global_step": 26876, "epoch": 222} {"train_loss": -9.383838653564453, "global_step": 26877, "epoch": 222} {"train_loss": -22.107175827026367, "global_step": 26878, "epoch": 222} {"train_loss": -26.5327091217041, "global_step": 26879, "epoch": 222} {"train_loss": -17.313459396362305, "global_step": 26880, "epoch": 222} {"train_loss": -25.35777473449707, "global_step": 26881, "epoch": 222} {"train_loss": -29.64679527282715, "global_step": 26882, "epoch": 222} {"train_loss": -27.00837516784668, "global_step": 26883, "epoch": 222} {"train_loss": -24.897357940673828, "global_step": 26884, "epoch": 222} {"train_loss": -26.61468505859375, "global_step": 26885, "epoch": 222} {"train_loss": -28.958688735961914, "global_step": 26886, "epoch": 222} {"train_loss": -29.735822677612305, "global_step": 26887, "epoch": 222} {"train_loss": -29.980459213256836, "global_step": 26888, "epoch": 222} {"train_loss": -29.05678367614746, "global_step": 26889, "epoch": 222} {"train_loss": -28.714588165283203, "global_step": 26890, "epoch": 222} {"train_loss": -28.758726119995117, "global_step": 26891, "epoch": 222} {"train_loss": -29.39385986328125, "global_step": 26892, "epoch": 222} {"train_loss": -30.233732223510742, "global_step": 26893, "epoch": 222} {"train_loss": -30.03925895690918, "global_step": 26894, "epoch": 222} {"train_loss": -29.758804321289062, "global_step": 26895, "epoch": 222} {"train_loss": -30.0154972076416, "global_step": 26896, "epoch": 222} {"train_loss": -29.872709274291992, "global_step": 26897, "epoch": 222} {"train_loss": -29.498188018798828, "global_step": 26898, "epoch": 222} {"train_loss": -29.774124145507812, "global_step": 26899, "epoch": 222} {"train_loss": -29.784543991088867, "global_step": 26900, "epoch": 222} {"train_loss": -29.643766403198242, "global_step": 26901, "epoch": 222} {"train_loss": -29.147369384765625, "global_step": 26902, "epoch": 222} {"train_loss": -29.783864974975586, "global_step": 26903, "epoch": 222} {"train_loss": -29.633153915405273, "global_step": 26904, "epoch": 222} {"train_loss": -30.445837020874023, "global_step": 26905, "epoch": 222} {"train_loss": -30.331701278686523, "global_step": 26906, "epoch": 222} {"train_loss": -30.134870529174805, "global_step": 26907, "epoch": 222} {"train_loss": -30.488346099853516, "global_step": 26908, "epoch": 222} {"train_loss": -30.449527740478516, "global_step": 26909, "epoch": 222} {"train_loss": -30.3623046875, "global_step": 26910, "epoch": 222} {"train_loss": -30.4361572265625, "global_step": 26911, "epoch": 222} {"train_loss": -30.2452335357666, "global_step": 26912, "epoch": 222} {"train_loss": -30.27215003967285, "global_step": 26913, "epoch": 222} {"train_loss": -30.328168869018555, "global_step": 26914, "epoch": 222} {"train_loss": -30.33711051940918, "global_step": 26915, "epoch": 222} {"train_loss": -30.558902740478516, "global_step": 26916, "epoch": 222} {"train_loss": -30.6343936920166, "global_step": 26917, "epoch": 222} {"train_loss": -29.77882957458496, "global_step": 26918, "epoch": 222} {"train_loss": -30.881437301635742, "global_step": 26919, "epoch": 222} {"train_loss": -30.86396598815918, "global_step": 26920, "epoch": 222} {"train_loss": -30.81831169128418, "global_step": 26921, "epoch": 222} {"train_loss": -30.621143341064453, "global_step": 26922, "epoch": 222} {"train_loss": -30.49812889099121, "global_step": 26923, "epoch": 222} {"train_loss": -30.671106338500977, "global_step": 26924, "epoch": 222} {"train_loss": -30.960187911987305, "global_step": 26925, "epoch": 222} {"train_loss": -30.5750675201416, "global_step": 26926, "epoch": 222} {"train_loss": -30.824827194213867, "global_step": 26927, "epoch": 222} {"train_loss": -30.37676429748535, "global_step": 26928, "epoch": 222} {"train_loss": -30.80474281311035, "global_step": 26929, "epoch": 222} {"train_loss": -30.82703971862793, "global_step": 26930, "epoch": 222} {"train_loss": -30.326770782470703, "global_step": 26931, "epoch": 222} {"train_loss": -30.34981346130371, "global_step": 26932, "epoch": 222} {"train_loss": -31.012344360351562, "global_step": 26933, "epoch": 222} {"train_loss": -31.09038734436035, "global_step": 26934, "epoch": 222} {"train_loss": -30.184232711791992, "global_step": 26935, "epoch": 222} {"train_loss": -30.550018310546875, "global_step": 26936, "epoch": 222} {"train_loss": -31.22736930847168, "global_step": 26937, "epoch": 222} {"train_loss": -30.393218994140625, "global_step": 26938, "epoch": 222} {"train_loss": -30.447498321533203, "global_step": 26939, "epoch": 222} {"train_loss": -31.01407814025879, "global_step": 26940, "epoch": 222} {"train_loss": -30.367359161376953, "global_step": 26941, "epoch": 222} {"train_loss": -30.758502960205078, "global_step": 26942, "epoch": 222} {"train_loss": -30.526578903198242, "global_step": 26943, "epoch": 222} {"train_loss": -30.826831817626953, "global_step": 26944, "epoch": 222} {"train_loss": -30.6760196685791, "global_step": 26945, "epoch": 222} {"train_loss": -30.95075798034668, "global_step": 26946, "epoch": 222} {"train_loss": -31.115400314331055, "global_step": 26947, "epoch": 222} {"train_loss": -30.857770919799805, "global_step": 26948, "epoch": 222} {"train_loss": -30.8055477142334, "global_step": 26949, "epoch": 222} {"train_loss": -30.8841609954834, "global_step": 26950, "epoch": 222} {"train_loss": -31.250085830688477, "global_step": 26951, "epoch": 222} {"train_loss": -30.69317626953125, "global_step": 26952, "epoch": 222} {"train_loss": -30.890090942382812, "global_step": 26953, "epoch": 222} {"train_loss": -31.41350746154785, "global_step": 26954, "epoch": 222} {"train_loss": -30.912750244140625, "global_step": 26955, "epoch": 222} {"train_loss": -31.200576782226562, "global_step": 26956, "epoch": 222} {"train_loss": -31.094858169555664, "global_step": 26957, "epoch": 222} {"train_loss": -30.976755142211914, "global_step": 26958, "epoch": 222} {"train_loss": -31.025876998901367, "global_step": 26959, "epoch": 222} {"train_loss": -31.188512802124023, "global_step": 26960, "epoch": 222} {"train_loss": -31.21589469909668, "global_step": 26961, "epoch": 222} {"train_loss": -30.53609275817871, "global_step": 26962, "epoch": 222} {"train_loss": -30.619537353515625, "global_step": 26963, "epoch": 222} {"train_loss": -31.286191940307617, "global_step": 26964, "epoch": 222} {"train_loss": -30.706241607666016, "global_step": 26965, "epoch": 222} {"train_loss": -31.073511123657227, "global_step": 26966, "epoch": 222} {"train_loss": -30.536670684814453, "global_step": 26967, "epoch": 222} {"train_loss": -30.521337509155273, "global_step": 26968, "epoch": 222} {"train_loss": -30.7984619140625, "global_step": 26969, "epoch": 222} {"train_loss": -31.064041137695312, "global_step": 26970, "epoch": 222} {"train_loss": -30.963850021362305, "global_step": 26971, "epoch": 222} {"train_loss": -30.693500518798828, "global_step": 26972, "epoch": 222} {"train_loss": -30.279712677001953, "global_step": 26973, "epoch": 222} {"train_loss": -30.200239181518555, "global_step": 26974, "epoch": 222} {"train_loss": -30.668964385986328, "global_step": 26975, "epoch": 222} {"train_loss": -30.849781036376953, "global_step": 26976, "epoch": 222} {"train_loss": -31.07282829284668, "global_step": 26977, "epoch": 222} {"train_loss": -30.59052085876465, "global_step": 26978, "epoch": 222} {"train_loss": -29.587316513061523, "global_step": 26979, "epoch": 222} {"train_loss": -30.710126876831055, "global_step": 26980, "epoch": 222} {"train_loss": -30.874866485595703, "global_step": 26981, "epoch": 222} {"train_loss": -29.297991157563263, "global_step": 26982, "epoch": 222, "val_loss": 2576317.75} {"train_loss": -30.909133911132812, "global_step": 26983, "epoch": 223} {"train_loss": -28.50140953063965, "global_step": 26984, "epoch": 223} {"train_loss": -28.248899459838867, "global_step": 26985, "epoch": 223} {"train_loss": -30.433929443359375, "global_step": 26986, "epoch": 223} {"train_loss": -27.956628799438477, "global_step": 26987, "epoch": 223} {"train_loss": -29.487634658813477, "global_step": 26988, "epoch": 223} {"train_loss": -28.426727294921875, "global_step": 26989, "epoch": 223} {"train_loss": -26.853363037109375, "global_step": 26990, "epoch": 223} {"train_loss": -26.762975692749023, "global_step": 26991, "epoch": 223} {"train_loss": -27.288848876953125, "global_step": 26992, "epoch": 223} {"train_loss": -30.8140926361084, "global_step": 26993, "epoch": 223} {"train_loss": -29.251142501831055, "global_step": 26994, "epoch": 223} {"train_loss": -28.148365020751953, "global_step": 26995, "epoch": 223} {"train_loss": -31.156021118164062, "global_step": 26996, "epoch": 223} {"train_loss": -28.47406578063965, "global_step": 26997, "epoch": 223} {"train_loss": -29.25732421875, "global_step": 26998, "epoch": 223} {"train_loss": -30.138660430908203, "global_step": 26999, "epoch": 223} {"train_loss": -29.951068878173828, "global_step": 27000, "epoch": 223} {"train_loss": -30.401769638061523, "global_step": 27001, "epoch": 223} {"train_loss": -29.61810302734375, "global_step": 27002, "epoch": 223} {"train_loss": -30.194543838500977, "global_step": 27003, "epoch": 223} {"train_loss": -30.306324005126953, "global_step": 27004, "epoch": 223} {"train_loss": -31.090259552001953, "global_step": 27005, "epoch": 223} {"train_loss": -30.645902633666992, "global_step": 27006, "epoch": 223} {"train_loss": -31.05877685546875, "global_step": 27007, "epoch": 223} {"train_loss": -30.861948013305664, "global_step": 27008, "epoch": 223} {"train_loss": -30.990385055541992, "global_step": 27009, "epoch": 223} {"train_loss": -31.301965713500977, "global_step": 27010, "epoch": 223} {"train_loss": -31.074787139892578, "global_step": 27011, "epoch": 223} {"train_loss": -31.02613639831543, "global_step": 27012, "epoch": 223} {"train_loss": -31.040143966674805, "global_step": 27013, "epoch": 223} {"train_loss": -30.534521102905273, "global_step": 27014, "epoch": 223} {"train_loss": -31.21462059020996, "global_step": 27015, "epoch": 223} {"train_loss": -30.754053115844727, "global_step": 27016, "epoch": 223} {"train_loss": -31.131933212280273, "global_step": 27017, "epoch": 223} {"train_loss": -30.792118072509766, "global_step": 27018, "epoch": 223} {"train_loss": -30.81797218322754, "global_step": 27019, "epoch": 223} {"train_loss": -30.955982208251953, "global_step": 27020, "epoch": 223} {"train_loss": -30.993505477905273, "global_step": 27021, "epoch": 223} {"train_loss": -31.355886459350586, "global_step": 27022, "epoch": 223} {"train_loss": -31.5515193939209, "global_step": 27023, "epoch": 223} {"train_loss": -31.11464500427246, "global_step": 27024, "epoch": 223} {"train_loss": -30.966211318969727, "global_step": 27025, "epoch": 223} {"train_loss": -30.66144371032715, "global_step": 27026, "epoch": 223} {"train_loss": -30.938806533813477, "global_step": 27027, "epoch": 223} {"train_loss": -31.115528106689453, "global_step": 27028, "epoch": 223} {"train_loss": -31.424121856689453, "global_step": 27029, "epoch": 223} {"train_loss": -31.45937156677246, "global_step": 27030, "epoch": 223} {"train_loss": -31.068628311157227, "global_step": 27031, "epoch": 223} {"train_loss": -31.31888771057129, "global_step": 27032, "epoch": 223} {"train_loss": -31.045795440673828, "global_step": 27033, "epoch": 223} {"train_loss": -30.965103149414062, "global_step": 27034, "epoch": 223} {"train_loss": -31.299161911010742, "global_step": 27035, "epoch": 223} {"train_loss": -31.557147979736328, "global_step": 27036, "epoch": 223} {"train_loss": -31.41163444519043, "global_step": 27037, "epoch": 223} {"train_loss": -31.20305824279785, "global_step": 27038, "epoch": 223} {"train_loss": -31.405221939086914, "global_step": 27039, "epoch": 223} {"train_loss": -31.507556915283203, "global_step": 27040, "epoch": 223} {"train_loss": -31.5201416015625, "global_step": 27041, "epoch": 223} {"train_loss": -31.522443771362305, "global_step": 27042, "epoch": 223} {"train_loss": -31.783588409423828, "global_step": 27043, "epoch": 223} {"train_loss": -31.61636734008789, "global_step": 27044, "epoch": 223} {"train_loss": -31.987518310546875, "global_step": 27045, "epoch": 223} {"train_loss": -31.815641403198242, "global_step": 27046, "epoch": 223} {"train_loss": -31.938953399658203, "global_step": 27047, "epoch": 223} {"train_loss": -31.91704750061035, "global_step": 27048, "epoch": 223} {"train_loss": -31.66805076599121, "global_step": 27049, "epoch": 223} {"train_loss": -31.6234130859375, "global_step": 27050, "epoch": 223} {"train_loss": -31.778406143188477, "global_step": 27051, "epoch": 223} {"train_loss": -30.65350914001465, "global_step": 27052, "epoch": 223} {"train_loss": -30.840253829956055, "global_step": 27053, "epoch": 223} {"train_loss": -31.578826904296875, "global_step": 27054, "epoch": 223} {"train_loss": -29.13779067993164, "global_step": 27055, "epoch": 223} {"train_loss": -30.413991928100586, "global_step": 27056, "epoch": 223} {"train_loss": -27.357229232788086, "global_step": 27057, "epoch": 223} {"train_loss": -30.2799129486084, "global_step": 27058, "epoch": 223} {"train_loss": -29.260663986206055, "global_step": 27059, "epoch": 223} {"train_loss": -28.000259399414062, "global_step": 27060, "epoch": 223} {"train_loss": -29.614500045776367, "global_step": 27061, "epoch": 223} {"train_loss": -30.328998565673828, "global_step": 27062, "epoch": 223} {"train_loss": -31.536481857299805, "global_step": 27063, "epoch": 223} {"train_loss": -31.068790435791016, "global_step": 27064, "epoch": 223} {"train_loss": -31.42878532409668, "global_step": 27065, "epoch": 223} {"train_loss": -31.291580200195312, "global_step": 27066, "epoch": 223} {"train_loss": -30.67706298828125, "global_step": 27067, "epoch": 223} {"train_loss": -31.19175148010254, "global_step": 27068, "epoch": 223} {"train_loss": -31.524023056030273, "global_step": 27069, "epoch": 223} {"train_loss": -31.068891525268555, "global_step": 27070, "epoch": 223} {"train_loss": -31.200698852539062, "global_step": 27071, "epoch": 223} {"train_loss": -31.287506103515625, "global_step": 27072, "epoch": 223} {"train_loss": -31.634069442749023, "global_step": 27073, "epoch": 223} {"train_loss": -31.443334579467773, "global_step": 27074, "epoch": 223} {"train_loss": -31.309812545776367, "global_step": 27075, "epoch": 223} {"train_loss": -31.209421157836914, "global_step": 27076, "epoch": 223} {"train_loss": -31.46514320373535, "global_step": 27077, "epoch": 223} {"train_loss": -31.720966339111328, "global_step": 27078, "epoch": 223} {"train_loss": -31.683130264282227, "global_step": 27079, "epoch": 223} {"train_loss": -31.996662139892578, "global_step": 27080, "epoch": 223} {"train_loss": -31.872262954711914, "global_step": 27081, "epoch": 223} {"train_loss": -31.689697265625, "global_step": 27082, "epoch": 223} {"train_loss": -31.884668350219727, "global_step": 27083, "epoch": 223} {"train_loss": -31.463592529296875, "global_step": 27084, "epoch": 223} {"train_loss": -32.28242111206055, "global_step": 27085, "epoch": 223} {"train_loss": -31.588300704956055, "global_step": 27086, "epoch": 223} {"train_loss": -31.474210739135742, "global_step": 27087, "epoch": 223} {"train_loss": -31.74187660217285, "global_step": 27088, "epoch": 223} {"train_loss": -31.6075439453125, "global_step": 27089, "epoch": 223} {"train_loss": -32.00916290283203, "global_step": 27090, "epoch": 223} {"train_loss": -31.798887252807617, "global_step": 27091, "epoch": 223} {"train_loss": -31.909046173095703, "global_step": 27092, "epoch": 223} {"train_loss": -31.752338409423828, "global_step": 27093, "epoch": 223} {"train_loss": -32.05134582519531, "global_step": 27094, "epoch": 223} {"train_loss": -31.595081329345703, "global_step": 27095, "epoch": 223} {"train_loss": -31.439899444580078, "global_step": 27096, "epoch": 223} {"train_loss": -30.781158447265625, "global_step": 27097, "epoch": 223} {"train_loss": -29.713027954101562, "global_step": 27098, "epoch": 223} {"train_loss": -31.425174713134766, "global_step": 27099, "epoch": 223} {"train_loss": -30.333911895751953, "global_step": 27100, "epoch": 223} {"train_loss": -30.397186279296875, "global_step": 27101, "epoch": 223} {"train_loss": -30.324451446533203, "global_step": 27102, "epoch": 223} {"train_loss": -30.796163511670326, "global_step": 27103, "epoch": 223, "val_loss": 2708091.0} {"train_loss": -30.5045108795166, "global_step": 27104, "epoch": 224} {"train_loss": -26.6368465423584, "global_step": 27105, "epoch": 224} {"train_loss": -29.22376823425293, "global_step": 27106, "epoch": 224} {"train_loss": -31.243438720703125, "global_step": 27107, "epoch": 224} {"train_loss": -29.815778732299805, "global_step": 27108, "epoch": 224} {"train_loss": -30.047805786132812, "global_step": 27109, "epoch": 224} {"train_loss": -31.0006103515625, "global_step": 27110, "epoch": 224} {"train_loss": -31.06805992126465, "global_step": 27111, "epoch": 224} {"train_loss": -30.9500789642334, "global_step": 27112, "epoch": 224} {"train_loss": -30.63824462890625, "global_step": 27113, "epoch": 224} {"train_loss": -31.048999786376953, "global_step": 27114, "epoch": 224} {"train_loss": -31.180952072143555, "global_step": 27115, "epoch": 224} {"train_loss": -31.091506958007812, "global_step": 27116, "epoch": 224} {"train_loss": -31.407154083251953, "global_step": 27117, "epoch": 224} {"train_loss": -31.38983726501465, "global_step": 27118, "epoch": 224} {"train_loss": -31.06764030456543, "global_step": 27119, "epoch": 224} {"train_loss": -31.59388542175293, "global_step": 27120, "epoch": 224} {"train_loss": -30.952543258666992, "global_step": 27121, "epoch": 224} {"train_loss": -31.39178466796875, "global_step": 27122, "epoch": 224} {"train_loss": -31.239973068237305, "global_step": 27123, "epoch": 224} {"train_loss": -31.3587703704834, "global_step": 27124, "epoch": 224} {"train_loss": -31.384931564331055, "global_step": 27125, "epoch": 224} {"train_loss": -31.37090492248535, "global_step": 27126, "epoch": 224} {"train_loss": -31.42691421508789, "global_step": 27127, "epoch": 224} {"train_loss": -31.478504180908203, "global_step": 27128, "epoch": 224} {"train_loss": -31.1423397064209, "global_step": 27129, "epoch": 224} {"train_loss": -31.341480255126953, "global_step": 27130, "epoch": 224} {"train_loss": -31.527753829956055, "global_step": 27131, "epoch": 224} {"train_loss": -31.586816787719727, "global_step": 27132, "epoch": 224} {"train_loss": -31.857213973999023, "global_step": 27133, "epoch": 224} {"train_loss": -31.962665557861328, "global_step": 27134, "epoch": 224} {"train_loss": -31.917648315429688, "global_step": 27135, "epoch": 224} {"train_loss": -32.28810501098633, "global_step": 27136, "epoch": 224} {"train_loss": -31.901721954345703, "global_step": 27137, "epoch": 224} {"train_loss": -32.34658432006836, "global_step": 27138, "epoch": 224} {"train_loss": -31.81792640686035, "global_step": 27139, "epoch": 224} {"train_loss": -31.77166748046875, "global_step": 27140, "epoch": 224} {"train_loss": -31.96058464050293, "global_step": 27141, "epoch": 224} {"train_loss": -32.33091354370117, "global_step": 27142, "epoch": 224} {"train_loss": -32.13665008544922, "global_step": 27143, "epoch": 224} {"train_loss": -32.19770431518555, "global_step": 27144, "epoch": 224} {"train_loss": -32.491329193115234, "global_step": 27145, "epoch": 224} {"train_loss": -32.29692459106445, "global_step": 27146, "epoch": 224} {"train_loss": -32.066993713378906, "global_step": 27147, "epoch": 224} {"train_loss": -32.856361389160156, "global_step": 27148, "epoch": 224} {"train_loss": -32.72500991821289, "global_step": 27149, "epoch": 224} {"train_loss": -32.48678970336914, "global_step": 27150, "epoch": 224} {"train_loss": -32.458099365234375, "global_step": 27151, "epoch": 224} {"train_loss": -32.10174560546875, "global_step": 27152, "epoch": 224} {"train_loss": -32.29710006713867, "global_step": 27153, "epoch": 224} {"train_loss": -32.82402420043945, "global_step": 27154, "epoch": 224} {"train_loss": -32.047454833984375, "global_step": 27155, "epoch": 224} {"train_loss": -31.96150016784668, "global_step": 27156, "epoch": 224} {"train_loss": -32.61399841308594, "global_step": 27157, "epoch": 224} {"train_loss": -32.075382232666016, "global_step": 27158, "epoch": 224} {"train_loss": -30.707015991210938, "global_step": 27159, "epoch": 224} {"train_loss": -31.177160263061523, "global_step": 27160, "epoch": 224} {"train_loss": -31.666107177734375, "global_step": 27161, "epoch": 224} {"train_loss": -32.38313674926758, "global_step": 27162, "epoch": 224} {"train_loss": -31.749420166015625, "global_step": 27163, "epoch": 224} {"train_loss": -32.44648361206055, "global_step": 27164, "epoch": 224} {"train_loss": -32.12137222290039, "global_step": 27165, "epoch": 224} {"train_loss": -32.50486755371094, "global_step": 27166, "epoch": 224} {"train_loss": -31.53046989440918, "global_step": 27167, "epoch": 224} {"train_loss": -32.075740814208984, "global_step": 27168, "epoch": 224} {"train_loss": -32.3165397644043, "global_step": 27169, "epoch": 224} {"train_loss": -31.653833389282227, "global_step": 27170, "epoch": 224} {"train_loss": -31.670663833618164, "global_step": 27171, "epoch": 224} {"train_loss": -30.897886276245117, "global_step": 27172, "epoch": 224} {"train_loss": -30.78828239440918, "global_step": 27173, "epoch": 224} {"train_loss": -30.1298770904541, "global_step": 27174, "epoch": 224} {"train_loss": -29.520343780517578, "global_step": 27175, "epoch": 224} {"train_loss": -29.154224395751953, "global_step": 27176, "epoch": 224} {"train_loss": -30.838672637939453, "global_step": 27177, "epoch": 224} {"train_loss": -29.065027236938477, "global_step": 27178, "epoch": 224} {"train_loss": -25.90972328186035, "global_step": 27179, "epoch": 224} {"train_loss": -27.6474666595459, "global_step": 27180, "epoch": 224} {"train_loss": -28.932706832885742, "global_step": 27181, "epoch": 224} {"train_loss": -30.354984283447266, "global_step": 27182, "epoch": 224} {"train_loss": -31.2990779876709, "global_step": 27183, "epoch": 224} {"train_loss": -27.297916412353516, "global_step": 27184, "epoch": 224} {"train_loss": -31.53120231628418, "global_step": 27185, "epoch": 224} {"train_loss": -30.805456161499023, "global_step": 27186, "epoch": 224} {"train_loss": -31.09113121032715, "global_step": 27187, "epoch": 224} {"train_loss": -31.219009399414062, "global_step": 27188, "epoch": 224} {"train_loss": -31.328460693359375, "global_step": 27189, "epoch": 224} {"train_loss": -30.79603385925293, "global_step": 27190, "epoch": 224} {"train_loss": -30.437658309936523, "global_step": 27191, "epoch": 224} {"train_loss": -31.216571807861328, "global_step": 27192, "epoch": 224} {"train_loss": -31.099884033203125, "global_step": 27193, "epoch": 224} {"train_loss": -30.572721481323242, "global_step": 27194, "epoch": 224} {"train_loss": -31.477460861206055, "global_step": 27195, "epoch": 224} {"train_loss": -30.68031120300293, "global_step": 27196, "epoch": 224} {"train_loss": -30.830860137939453, "global_step": 27197, "epoch": 224} {"train_loss": -30.755964279174805, "global_step": 27198, "epoch": 224} {"train_loss": -31.14497947692871, "global_step": 27199, "epoch": 224} {"train_loss": -31.15399169921875, "global_step": 27200, "epoch": 224} {"train_loss": -31.663135528564453, "global_step": 27201, "epoch": 224} {"train_loss": -31.173437118530273, "global_step": 27202, "epoch": 224} {"train_loss": -31.602649688720703, "global_step": 27203, "epoch": 224} {"train_loss": -31.326980590820312, "global_step": 27204, "epoch": 224} {"train_loss": -31.43961524963379, "global_step": 27205, "epoch": 224} {"train_loss": -31.559492111206055, "global_step": 27206, "epoch": 224} {"train_loss": -31.656660079956055, "global_step": 27207, "epoch": 224} {"train_loss": -31.793699264526367, "global_step": 27208, "epoch": 224} {"train_loss": -31.713903427124023, "global_step": 27209, "epoch": 224} {"train_loss": -31.7161922454834, "global_step": 27210, "epoch": 224} {"train_loss": -31.528120040893555, "global_step": 27211, "epoch": 224} {"train_loss": -31.463531494140625, "global_step": 27212, "epoch": 224} {"train_loss": -31.934326171875, "global_step": 27213, "epoch": 224} {"train_loss": -31.388715744018555, "global_step": 27214, "epoch": 224} {"train_loss": -32.06208038330078, "global_step": 27215, "epoch": 224} {"train_loss": -32.117427825927734, "global_step": 27216, "epoch": 224} {"train_loss": -31.72909927368164, "global_step": 27217, "epoch": 224} {"train_loss": -31.955570220947266, "global_step": 27218, "epoch": 224} {"train_loss": -32.33079528808594, "global_step": 27219, "epoch": 224} {"train_loss": -31.465473175048828, "global_step": 27220, "epoch": 224} {"train_loss": -31.998336791992188, "global_step": 27221, "epoch": 224} {"train_loss": -31.892887115478516, "global_step": 27222, "epoch": 224} {"train_loss": -31.967334747314453, "global_step": 27223, "epoch": 224} {"train_loss": -31.302611122446613, "global_step": 27224, "epoch": 224, "val_loss": 2530741.25} {"train_loss": -31.745559692382812, "global_step": 27225, "epoch": 225} {"train_loss": -32.49540328979492, "global_step": 27226, "epoch": 225} {"train_loss": -32.41688919067383, "global_step": 27227, "epoch": 225} {"train_loss": -32.27386474609375, "global_step": 27228, "epoch": 225} {"train_loss": -32.6041259765625, "global_step": 27229, "epoch": 225} {"train_loss": -32.4166374206543, "global_step": 27230, "epoch": 225} {"train_loss": -32.65325927734375, "global_step": 27231, "epoch": 225} {"train_loss": -32.276123046875, "global_step": 27232, "epoch": 225} {"train_loss": -32.51618576049805, "global_step": 27233, "epoch": 225} {"train_loss": -32.3127326965332, "global_step": 27234, "epoch": 225} {"train_loss": -32.32293701171875, "global_step": 27235, "epoch": 225} {"train_loss": -32.530433654785156, "global_step": 27236, "epoch": 225} {"train_loss": -32.18671798706055, "global_step": 27237, "epoch": 225} {"train_loss": -32.54366683959961, "global_step": 27238, "epoch": 225} {"train_loss": -32.21110534667969, "global_step": 27239, "epoch": 225} {"train_loss": -32.22364044189453, "global_step": 27240, "epoch": 225} {"train_loss": -32.324459075927734, "global_step": 27241, "epoch": 225} {"train_loss": -32.519874572753906, "global_step": 27242, "epoch": 225} {"train_loss": -32.489253997802734, "global_step": 27243, "epoch": 225} {"train_loss": -32.14302444458008, "global_step": 27244, "epoch": 225} {"train_loss": -32.480567932128906, "global_step": 27245, "epoch": 225} {"train_loss": -32.000152587890625, "global_step": 27246, "epoch": 225} {"train_loss": -32.319618225097656, "global_step": 27247, "epoch": 225} {"train_loss": -32.07659912109375, "global_step": 27248, "epoch": 225} {"train_loss": -32.46675491333008, "global_step": 27249, "epoch": 225} {"train_loss": -32.048744201660156, "global_step": 27250, "epoch": 225} {"train_loss": -31.911069869995117, "global_step": 27251, "epoch": 225} {"train_loss": -32.68423080444336, "global_step": 27252, "epoch": 225} {"train_loss": -32.38319778442383, "global_step": 27253, "epoch": 225} {"train_loss": -32.32029724121094, "global_step": 27254, "epoch": 225} {"train_loss": -32.66791534423828, "global_step": 27255, "epoch": 225} {"train_loss": -32.3507194519043, "global_step": 27256, "epoch": 225} {"train_loss": -32.711002349853516, "global_step": 27257, "epoch": 225} {"train_loss": -32.60652542114258, "global_step": 27258, "epoch": 225} {"train_loss": -32.19976806640625, "global_step": 27259, "epoch": 225} {"train_loss": -31.99542236328125, "global_step": 27260, "epoch": 225} {"train_loss": -30.46170425415039, "global_step": 27261, "epoch": 225} {"train_loss": -31.4874210357666, "global_step": 27262, "epoch": 225} {"train_loss": -31.888519287109375, "global_step": 27263, "epoch": 225} {"train_loss": -32.06494903564453, "global_step": 27264, "epoch": 225} {"train_loss": -31.2928466796875, "global_step": 27265, "epoch": 225} {"train_loss": -30.80034828186035, "global_step": 27266, "epoch": 225} {"train_loss": -30.26873779296875, "global_step": 27267, "epoch": 225} {"train_loss": -32.28078842163086, "global_step": 27268, "epoch": 225} {"train_loss": -30.566553115844727, "global_step": 27269, "epoch": 225} {"train_loss": -28.475284576416016, "global_step": 27270, "epoch": 225} {"train_loss": -30.09627342224121, "global_step": 27271, "epoch": 225} {"train_loss": -29.927602767944336, "global_step": 27272, "epoch": 225} {"train_loss": -29.332082748413086, "global_step": 27273, "epoch": 225} {"train_loss": -32.06719970703125, "global_step": 27274, "epoch": 225} {"train_loss": -31.765844345092773, "global_step": 27275, "epoch": 225} {"train_loss": -31.27438735961914, "global_step": 27276, "epoch": 225} {"train_loss": -31.794910430908203, "global_step": 27277, "epoch": 225} {"train_loss": -30.981122970581055, "global_step": 27278, "epoch": 225} {"train_loss": -31.90450096130371, "global_step": 27279, "epoch": 225} {"train_loss": -31.670562744140625, "global_step": 27280, "epoch": 225} {"train_loss": -31.8527889251709, "global_step": 27281, "epoch": 225} {"train_loss": -32.04911422729492, "global_step": 27282, "epoch": 225} {"train_loss": -31.976831436157227, "global_step": 27283, "epoch": 225} {"train_loss": -31.289661407470703, "global_step": 27284, "epoch": 225} {"train_loss": -32.17717361450195, "global_step": 27285, "epoch": 225} {"train_loss": -31.7613582611084, "global_step": 27286, "epoch": 225} {"train_loss": -31.897436141967773, "global_step": 27287, "epoch": 225} {"train_loss": -31.86468505859375, "global_step": 27288, "epoch": 225} {"train_loss": -32.32411575317383, "global_step": 27289, "epoch": 225} {"train_loss": -32.24201583862305, "global_step": 27290, "epoch": 225} {"train_loss": -31.925369262695312, "global_step": 27291, "epoch": 225} {"train_loss": -31.31428337097168, "global_step": 27292, "epoch": 225} {"train_loss": -32.63890838623047, "global_step": 27293, "epoch": 225} {"train_loss": -32.048072814941406, "global_step": 27294, "epoch": 225} {"train_loss": -32.14484786987305, "global_step": 27295, "epoch": 225} {"train_loss": -32.061729431152344, "global_step": 27296, "epoch": 225} {"train_loss": -32.10456466674805, "global_step": 27297, "epoch": 225} {"train_loss": -31.807432174682617, "global_step": 27298, "epoch": 225} {"train_loss": -32.27909469604492, "global_step": 27299, "epoch": 225} {"train_loss": -32.5989875793457, "global_step": 27300, "epoch": 225} {"train_loss": -32.14950180053711, "global_step": 27301, "epoch": 225} {"train_loss": -32.26396560668945, "global_step": 27302, "epoch": 225} {"train_loss": -32.23173141479492, "global_step": 27303, "epoch": 225} {"train_loss": -32.31180953979492, "global_step": 27304, "epoch": 225} {"train_loss": -32.409969329833984, "global_step": 27305, "epoch": 225} {"train_loss": -32.664100646972656, "global_step": 27306, "epoch": 225} {"train_loss": -32.5689811706543, "global_step": 27307, "epoch": 225} {"train_loss": -32.52863311767578, "global_step": 27308, "epoch": 225} {"train_loss": -32.47682571411133, "global_step": 27309, "epoch": 225} {"train_loss": -31.78621482849121, "global_step": 27310, "epoch": 225} {"train_loss": -32.672847747802734, "global_step": 27311, "epoch": 225} {"train_loss": -32.463470458984375, "global_step": 27312, "epoch": 225} {"train_loss": -32.20412826538086, "global_step": 27313, "epoch": 225} {"train_loss": -32.169559478759766, "global_step": 27314, "epoch": 225} {"train_loss": -32.47208786010742, "global_step": 27315, "epoch": 225} {"train_loss": -32.388763427734375, "global_step": 27316, "epoch": 225} {"train_loss": -32.4676628112793, "global_step": 27317, "epoch": 225} {"train_loss": -32.50434494018555, "global_step": 27318, "epoch": 225} {"train_loss": -32.9887809753418, "global_step": 27319, "epoch": 225} {"train_loss": -32.371395111083984, "global_step": 27320, "epoch": 225} {"train_loss": -32.42098617553711, "global_step": 27321, "epoch": 225} {"train_loss": -32.63564682006836, "global_step": 27322, "epoch": 225} {"train_loss": -32.6695671081543, "global_step": 27323, "epoch": 225} {"train_loss": -31.813129425048828, "global_step": 27324, "epoch": 225} {"train_loss": -29.7979679107666, "global_step": 27325, "epoch": 225} {"train_loss": -26.761005401611328, "global_step": 27326, "epoch": 225} {"train_loss": -30.958057403564453, "global_step": 27327, "epoch": 225} {"train_loss": -29.919330596923828, "global_step": 27328, "epoch": 225} {"train_loss": -31.83271598815918, "global_step": 27329, "epoch": 225} {"train_loss": -30.179157257080078, "global_step": 27330, "epoch": 225} {"train_loss": -29.72185707092285, "global_step": 27331, "epoch": 225} {"train_loss": -28.890369415283203, "global_step": 27332, "epoch": 225} {"train_loss": -27.2529296875, "global_step": 27333, "epoch": 225} {"train_loss": -23.91370964050293, "global_step": 27334, "epoch": 225} {"train_loss": -18.974506378173828, "global_step": 27335, "epoch": 225} {"train_loss": -18.678695678710938, "global_step": 27336, "epoch": 225} {"train_loss": -31.521291732788086, "global_step": 27337, "epoch": 225} {"train_loss": -19.342330932617188, "global_step": 27338, "epoch": 225} {"train_loss": -26.432025909423828, "global_step": 27339, "epoch": 225} {"train_loss": -29.370080947875977, "global_step": 27340, "epoch": 225} {"train_loss": -23.762531280517578, "global_step": 27341, "epoch": 225} {"train_loss": -29.10857582092285, "global_step": 27342, "epoch": 225} {"train_loss": -27.585010528564453, "global_step": 27343, "epoch": 225} {"train_loss": -28.571821212768555, "global_step": 27344, "epoch": 225} {"train_loss": -31.20402287254649, "global_step": 27345, "epoch": 225, "val_loss": 2441866.25} {"train_loss": -27.58210563659668, "global_step": 27346, "epoch": 226} {"train_loss": -31.353376388549805, "global_step": 27347, "epoch": 226} {"train_loss": -29.605392456054688, "global_step": 27348, "epoch": 226} {"train_loss": -28.864797592163086, "global_step": 27349, "epoch": 226} {"train_loss": -30.945425033569336, "global_step": 27350, "epoch": 226} {"train_loss": -29.9364070892334, "global_step": 27351, "epoch": 226} {"train_loss": -29.677764892578125, "global_step": 27352, "epoch": 226} {"train_loss": -31.0809326171875, "global_step": 27353, "epoch": 226} {"train_loss": -30.954252243041992, "global_step": 27354, "epoch": 226} {"train_loss": -29.891876220703125, "global_step": 27355, "epoch": 226} {"train_loss": -31.05243492126465, "global_step": 27356, "epoch": 226} {"train_loss": -31.055999755859375, "global_step": 27357, "epoch": 226} {"train_loss": -31.028961181640625, "global_step": 27358, "epoch": 226} {"train_loss": -30.712881088256836, "global_step": 27359, "epoch": 226} {"train_loss": -31.43230628967285, "global_step": 27360, "epoch": 226} {"train_loss": -30.84859275817871, "global_step": 27361, "epoch": 226} {"train_loss": -30.921659469604492, "global_step": 27362, "epoch": 226} {"train_loss": -30.642675399780273, "global_step": 27363, "epoch": 226} {"train_loss": -31.247467041015625, "global_step": 27364, "epoch": 226} {"train_loss": -31.446130752563477, "global_step": 27365, "epoch": 226} {"train_loss": -31.46177101135254, "global_step": 27366, "epoch": 226} {"train_loss": -30.98318862915039, "global_step": 27367, "epoch": 226} {"train_loss": -31.305908203125, "global_step": 27368, "epoch": 226} {"train_loss": -31.5924072265625, "global_step": 27369, "epoch": 226} {"train_loss": -31.483840942382812, "global_step": 27370, "epoch": 226} {"train_loss": -31.606611251831055, "global_step": 27371, "epoch": 226} {"train_loss": -31.2705020904541, "global_step": 27372, "epoch": 226} {"train_loss": -31.82818031311035, "global_step": 27373, "epoch": 226} {"train_loss": -31.786624908447266, "global_step": 27374, "epoch": 226} {"train_loss": -31.740705490112305, "global_step": 27375, "epoch": 226} {"train_loss": -31.888818740844727, "global_step": 27376, "epoch": 226} {"train_loss": -32.20075225830078, "global_step": 27377, "epoch": 226} {"train_loss": -31.99061393737793, "global_step": 27378, "epoch": 226} {"train_loss": -31.920759201049805, "global_step": 27379, "epoch": 226} {"train_loss": -32.32589340209961, "global_step": 27380, "epoch": 226} {"train_loss": -31.666767120361328, "global_step": 27381, "epoch": 226} {"train_loss": -32.20821762084961, "global_step": 27382, "epoch": 226} {"train_loss": -32.08685302734375, "global_step": 27383, "epoch": 226} {"train_loss": -31.88448143005371, "global_step": 27384, "epoch": 226} {"train_loss": -32.29179000854492, "global_step": 27385, "epoch": 226} {"train_loss": -31.8839168548584, "global_step": 27386, "epoch": 226} {"train_loss": -31.578933715820312, "global_step": 27387, "epoch": 226} {"train_loss": -30.733596801757812, "global_step": 27388, "epoch": 226} {"train_loss": -30.231054306030273, "global_step": 27389, "epoch": 226} {"train_loss": -29.107669830322266, "global_step": 27390, "epoch": 226} {"train_loss": -28.049230575561523, "global_step": 27391, "epoch": 226} {"train_loss": -29.020145416259766, "global_step": 27392, "epoch": 226} {"train_loss": -30.187341690063477, "global_step": 27393, "epoch": 226} {"train_loss": -31.803546905517578, "global_step": 27394, "epoch": 226} {"train_loss": -29.84564208984375, "global_step": 27395, "epoch": 226} {"train_loss": -28.277206420898438, "global_step": 27396, "epoch": 226} {"train_loss": -31.064847946166992, "global_step": 27397, "epoch": 226} {"train_loss": -31.154333114624023, "global_step": 27398, "epoch": 226} {"train_loss": -31.146316528320312, "global_step": 27399, "epoch": 226} {"train_loss": -29.069854736328125, "global_step": 27400, "epoch": 226} {"train_loss": -29.496877670288086, "global_step": 27401, "epoch": 226} {"train_loss": -30.66761589050293, "global_step": 27402, "epoch": 226} {"train_loss": -29.0941104888916, "global_step": 27403, "epoch": 226} {"train_loss": -30.878467559814453, "global_step": 27404, "epoch": 226} {"train_loss": -29.200687408447266, "global_step": 27405, "epoch": 226} {"train_loss": -30.88232421875, "global_step": 27406, "epoch": 226} {"train_loss": -30.407148361206055, "global_step": 27407, "epoch": 226} {"train_loss": -30.377172470092773, "global_step": 27408, "epoch": 226} {"train_loss": -30.65012550354004, "global_step": 27409, "epoch": 226} {"train_loss": -31.208072662353516, "global_step": 27410, "epoch": 226} {"train_loss": -30.941314697265625, "global_step": 27411, "epoch": 226} {"train_loss": -31.118988037109375, "global_step": 27412, "epoch": 226} {"train_loss": -31.23029136657715, "global_step": 27413, "epoch": 226} {"train_loss": -31.217763900756836, "global_step": 27414, "epoch": 226} {"train_loss": -31.356801986694336, "global_step": 27415, "epoch": 226} {"train_loss": -30.870059967041016, "global_step": 27416, "epoch": 226} {"train_loss": -31.287240982055664, "global_step": 27417, "epoch": 226} {"train_loss": -31.604339599609375, "global_step": 27418, "epoch": 226} {"train_loss": -31.583127975463867, "global_step": 27419, "epoch": 226} {"train_loss": -31.5226993560791, "global_step": 27420, "epoch": 226} {"train_loss": -31.771875381469727, "global_step": 27421, "epoch": 226} {"train_loss": -31.61614418029785, "global_step": 27422, "epoch": 226} {"train_loss": -31.761701583862305, "global_step": 27423, "epoch": 226} {"train_loss": -31.837121963500977, "global_step": 27424, "epoch": 226} {"train_loss": -31.826736450195312, "global_step": 27425, "epoch": 226} {"train_loss": -31.900897979736328, "global_step": 27426, "epoch": 226} {"train_loss": -31.988067626953125, "global_step": 27427, "epoch": 226} {"train_loss": -32.12832260131836, "global_step": 27428, "epoch": 226} {"train_loss": -31.985929489135742, "global_step": 27429, "epoch": 226} {"train_loss": -32.32547378540039, "global_step": 27430, "epoch": 226} {"train_loss": -32.09590148925781, "global_step": 27431, "epoch": 226} {"train_loss": -32.26375198364258, "global_step": 27432, "epoch": 226} {"train_loss": -31.98148536682129, "global_step": 27433, "epoch": 226} {"train_loss": -32.15170669555664, "global_step": 27434, "epoch": 226} {"train_loss": -32.28804016113281, "global_step": 27435, "epoch": 226} {"train_loss": -32.663448333740234, "global_step": 27436, "epoch": 226} {"train_loss": -32.23783493041992, "global_step": 27437, "epoch": 226} {"train_loss": -32.35924530029297, "global_step": 27438, "epoch": 226} {"train_loss": -32.42184066772461, "global_step": 27439, "epoch": 226} {"train_loss": -32.038047790527344, "global_step": 27440, "epoch": 226} {"train_loss": -32.82645797729492, "global_step": 27441, "epoch": 226} {"train_loss": -32.84041213989258, "global_step": 27442, "epoch": 226} {"train_loss": -32.680233001708984, "global_step": 27443, "epoch": 226} {"train_loss": -32.56214141845703, "global_step": 27444, "epoch": 226} {"train_loss": -32.386592864990234, "global_step": 27445, "epoch": 226} {"train_loss": -32.56141662597656, "global_step": 27446, "epoch": 226} {"train_loss": -32.61140060424805, "global_step": 27447, "epoch": 226} {"train_loss": -32.14241027832031, "global_step": 27448, "epoch": 226} {"train_loss": -32.889671325683594, "global_step": 27449, "epoch": 226} {"train_loss": -32.984405517578125, "global_step": 27450, "epoch": 226} {"train_loss": -32.44392013549805, "global_step": 27451, "epoch": 226} {"train_loss": -32.905120849609375, "global_step": 27452, "epoch": 226} {"train_loss": -32.5779914855957, "global_step": 27453, "epoch": 226} {"train_loss": -32.930145263671875, "global_step": 27454, "epoch": 226} {"train_loss": -33.131465911865234, "global_step": 27455, "epoch": 226} {"train_loss": -32.59769821166992, "global_step": 27456, "epoch": 226} {"train_loss": -33.055152893066406, "global_step": 27457, "epoch": 226} {"train_loss": -32.424964904785156, "global_step": 27458, "epoch": 226} {"train_loss": -32.90252685546875, "global_step": 27459, "epoch": 226} {"train_loss": -32.4619026184082, "global_step": 27460, "epoch": 226} {"train_loss": -32.417144775390625, "global_step": 27461, "epoch": 226} {"train_loss": -32.3433723449707, "global_step": 27462, "epoch": 226} {"train_loss": -32.21841049194336, "global_step": 27463, "epoch": 226} {"train_loss": -32.44942855834961, "global_step": 27464, "epoch": 226} {"train_loss": -32.52975082397461, "global_step": 27465, "epoch": 226} {"train_loss": -31.44241793293598, "global_step": 27466, "epoch": 226, "val_loss": 2394479.25} {"train_loss": -32.33466339111328, "global_step": 27467, "epoch": 227} {"train_loss": -32.6151237487793, "global_step": 27468, "epoch": 227} {"train_loss": -31.8096866607666, "global_step": 27469, "epoch": 227} {"train_loss": -31.942157745361328, "global_step": 27470, "epoch": 227} {"train_loss": -31.436548233032227, "global_step": 27471, "epoch": 227} {"train_loss": -32.06966781616211, "global_step": 27472, "epoch": 227} {"train_loss": -32.400142669677734, "global_step": 27473, "epoch": 227} {"train_loss": -32.398704528808594, "global_step": 27474, "epoch": 227} {"train_loss": -32.3782958984375, "global_step": 27475, "epoch": 227} {"train_loss": -31.818470001220703, "global_step": 27476, "epoch": 227} {"train_loss": -31.632116317749023, "global_step": 27477, "epoch": 227} {"train_loss": -31.070138931274414, "global_step": 27478, "epoch": 227} {"train_loss": -30.156299591064453, "global_step": 27479, "epoch": 227} {"train_loss": -29.56821060180664, "global_step": 27480, "epoch": 227} {"train_loss": -28.921875, "global_step": 27481, "epoch": 227} {"train_loss": -24.707792282104492, "global_step": 27482, "epoch": 227} {"train_loss": -23.170743942260742, "global_step": 27483, "epoch": 227} {"train_loss": -31.190099716186523, "global_step": 27484, "epoch": 227} {"train_loss": -30.036529541015625, "global_step": 27485, "epoch": 227} {"train_loss": -29.28816032409668, "global_step": 27486, "epoch": 227} {"train_loss": -31.706897735595703, "global_step": 27487, "epoch": 227} {"train_loss": -30.106876373291016, "global_step": 27488, "epoch": 227} {"train_loss": -31.459592819213867, "global_step": 27489, "epoch": 227} {"train_loss": -30.917163848876953, "global_step": 27490, "epoch": 227} {"train_loss": -31.459487915039062, "global_step": 27491, "epoch": 227} {"train_loss": -31.718250274658203, "global_step": 27492, "epoch": 227} {"train_loss": -31.039844512939453, "global_step": 27493, "epoch": 227} {"train_loss": -32.04052734375, "global_step": 27494, "epoch": 227} {"train_loss": -31.522199630737305, "global_step": 27495, "epoch": 227} {"train_loss": -31.633691787719727, "global_step": 27496, "epoch": 227} {"train_loss": -31.65437126159668, "global_step": 27497, "epoch": 227} {"train_loss": -32.24685287475586, "global_step": 27498, "epoch": 227} {"train_loss": -31.78961753845215, "global_step": 27499, "epoch": 227} {"train_loss": -32.09444046020508, "global_step": 27500, "epoch": 227} {"train_loss": -31.75644302368164, "global_step": 27501, "epoch": 227} {"train_loss": -31.92254066467285, "global_step": 27502, "epoch": 227} {"train_loss": -31.077075958251953, "global_step": 27503, "epoch": 227} {"train_loss": -29.498798370361328, "global_step": 27504, "epoch": 227} {"train_loss": -27.015731811523438, "global_step": 27505, "epoch": 227} {"train_loss": -28.4857234954834, "global_step": 27506, "epoch": 227} {"train_loss": -31.369726181030273, "global_step": 27507, "epoch": 227} {"train_loss": -31.515634536743164, "global_step": 27508, "epoch": 227} {"train_loss": -30.020217895507812, "global_step": 27509, "epoch": 227} {"train_loss": -31.443998336791992, "global_step": 27510, "epoch": 227} {"train_loss": -31.59830665588379, "global_step": 27511, "epoch": 227} {"train_loss": -30.84528160095215, "global_step": 27512, "epoch": 227} {"train_loss": -31.872655868530273, "global_step": 27513, "epoch": 227} {"train_loss": -32.16294479370117, "global_step": 27514, "epoch": 227} {"train_loss": -31.83709144592285, "global_step": 27515, "epoch": 227} {"train_loss": -31.902801513671875, "global_step": 27516, "epoch": 227} {"train_loss": -32.04041290283203, "global_step": 27517, "epoch": 227} {"train_loss": -32.22309112548828, "global_step": 27518, "epoch": 227} {"train_loss": -32.280582427978516, "global_step": 27519, "epoch": 227} {"train_loss": -31.503528594970703, "global_step": 27520, "epoch": 227} {"train_loss": -32.121150970458984, "global_step": 27521, "epoch": 227} {"train_loss": -32.172428131103516, "global_step": 27522, "epoch": 227} {"train_loss": -32.16071701049805, "global_step": 27523, "epoch": 227} {"train_loss": -31.691181182861328, "global_step": 27524, "epoch": 227} {"train_loss": -31.827619552612305, "global_step": 27525, "epoch": 227} {"train_loss": -31.980117797851562, "global_step": 27526, "epoch": 227} {"train_loss": -32.202571868896484, "global_step": 27527, "epoch": 227} {"train_loss": -32.25527572631836, "global_step": 27528, "epoch": 227} {"train_loss": -32.477928161621094, "global_step": 27529, "epoch": 227} {"train_loss": -31.921253204345703, "global_step": 27530, "epoch": 227} {"train_loss": -32.40047836303711, "global_step": 27531, "epoch": 227} {"train_loss": -32.458892822265625, "global_step": 27532, "epoch": 227} {"train_loss": -32.23969268798828, "global_step": 27533, "epoch": 227} {"train_loss": -32.30229568481445, "global_step": 27534, "epoch": 227} {"train_loss": -32.32094955444336, "global_step": 27535, "epoch": 227} {"train_loss": -32.39190673828125, "global_step": 27536, "epoch": 227} {"train_loss": -32.34397888183594, "global_step": 27537, "epoch": 227} {"train_loss": -32.573036193847656, "global_step": 27538, "epoch": 227} {"train_loss": -32.56604766845703, "global_step": 27539, "epoch": 227} {"train_loss": -32.25603485107422, "global_step": 27540, "epoch": 227} {"train_loss": -32.19645309448242, "global_step": 27541, "epoch": 227} {"train_loss": -31.99493408203125, "global_step": 27542, "epoch": 227} {"train_loss": -32.295650482177734, "global_step": 27543, "epoch": 227} {"train_loss": -32.748836517333984, "global_step": 27544, "epoch": 227} {"train_loss": -32.04914093017578, "global_step": 27545, "epoch": 227} {"train_loss": -32.365264892578125, "global_step": 27546, "epoch": 227} {"train_loss": -31.592121124267578, "global_step": 27547, "epoch": 227} {"train_loss": -32.044166564941406, "global_step": 27548, "epoch": 227} {"train_loss": -32.407474517822266, "global_step": 27549, "epoch": 227} {"train_loss": -31.762622833251953, "global_step": 27550, "epoch": 227} {"train_loss": -31.967575073242188, "global_step": 27551, "epoch": 227} {"train_loss": -31.965667724609375, "global_step": 27552, "epoch": 227} {"train_loss": -31.303083419799805, "global_step": 27553, "epoch": 227} {"train_loss": -31.733295440673828, "global_step": 27554, "epoch": 227} {"train_loss": -32.451988220214844, "global_step": 27555, "epoch": 227} {"train_loss": -32.10185623168945, "global_step": 27556, "epoch": 227} {"train_loss": -31.315418243408203, "global_step": 27557, "epoch": 227} {"train_loss": -31.490955352783203, "global_step": 27558, "epoch": 227} {"train_loss": -31.26553726196289, "global_step": 27559, "epoch": 227} {"train_loss": -30.725616455078125, "global_step": 27560, "epoch": 227} {"train_loss": -31.371362686157227, "global_step": 27561, "epoch": 227} {"train_loss": -31.156538009643555, "global_step": 27562, "epoch": 227} {"train_loss": -31.53163719177246, "global_step": 27563, "epoch": 227} {"train_loss": -31.868192672729492, "global_step": 27564, "epoch": 227} {"train_loss": -31.893280029296875, "global_step": 27565, "epoch": 227} {"train_loss": -31.571744918823242, "global_step": 27566, "epoch": 227} {"train_loss": -30.25730323791504, "global_step": 27567, "epoch": 227} {"train_loss": -32.09760665893555, "global_step": 27568, "epoch": 227} {"train_loss": -31.050357818603516, "global_step": 27569, "epoch": 227} {"train_loss": -31.35120964050293, "global_step": 27570, "epoch": 227} {"train_loss": -31.490802764892578, "global_step": 27571, "epoch": 227} {"train_loss": -32.2492561340332, "global_step": 27572, "epoch": 227} {"train_loss": -31.863889694213867, "global_step": 27573, "epoch": 227} {"train_loss": -31.709665298461914, "global_step": 27574, "epoch": 227} {"train_loss": -31.791433334350586, "global_step": 27575, "epoch": 227} {"train_loss": -31.514984130859375, "global_step": 27576, "epoch": 227} {"train_loss": -31.95492935180664, "global_step": 27577, "epoch": 227} {"train_loss": -31.88538932800293, "global_step": 27578, "epoch": 227} {"train_loss": -31.38184928894043, "global_step": 27579, "epoch": 227} {"train_loss": -31.78678321838379, "global_step": 27580, "epoch": 227} {"train_loss": -32.2878532409668, "global_step": 27581, "epoch": 227} {"train_loss": -31.62091636657715, "global_step": 27582, "epoch": 227} {"train_loss": -31.23002052307129, "global_step": 27583, "epoch": 227} {"train_loss": -31.45928955078125, "global_step": 27584, "epoch": 227} {"train_loss": -30.986242294311523, "global_step": 27585, "epoch": 227} {"train_loss": -32.55423355102539, "global_step": 27586, "epoch": 227} {"train_loss": -31.50057601928711, "global_step": 27587, "epoch": 227, "val_loss": 2397650.25} {"train_loss": -32.60306930541992, "global_step": 27588, "epoch": 228} {"train_loss": -31.58392906188965, "global_step": 27589, "epoch": 228} {"train_loss": -31.443628311157227, "global_step": 27590, "epoch": 228} {"train_loss": -31.737869262695312, "global_step": 27591, "epoch": 228} {"train_loss": -32.274444580078125, "global_step": 27592, "epoch": 228} {"train_loss": -32.656288146972656, "global_step": 27593, "epoch": 228} {"train_loss": -32.295501708984375, "global_step": 27594, "epoch": 228} {"train_loss": -31.797876358032227, "global_step": 27595, "epoch": 228} {"train_loss": -31.525455474853516, "global_step": 27596, "epoch": 228} {"train_loss": -31.161224365234375, "global_step": 27597, "epoch": 228} {"train_loss": -32.23210906982422, "global_step": 27598, "epoch": 228} {"train_loss": -32.287513732910156, "global_step": 27599, "epoch": 228} {"train_loss": -32.444393157958984, "global_step": 27600, "epoch": 228} {"train_loss": -32.51764678955078, "global_step": 27601, "epoch": 228} {"train_loss": -32.34830856323242, "global_step": 27602, "epoch": 228} {"train_loss": -32.25675964355469, "global_step": 27603, "epoch": 228} {"train_loss": -31.892980575561523, "global_step": 27604, "epoch": 228} {"train_loss": -32.79246520996094, "global_step": 27605, "epoch": 228} {"train_loss": -32.29231643676758, "global_step": 27606, "epoch": 228} {"train_loss": -32.7918701171875, "global_step": 27607, "epoch": 228} {"train_loss": -32.16846466064453, "global_step": 27608, "epoch": 228} {"train_loss": -32.950469970703125, "global_step": 27609, "epoch": 228} {"train_loss": -32.9705924987793, "global_step": 27610, "epoch": 228} {"train_loss": -32.9074821472168, "global_step": 27611, "epoch": 228} {"train_loss": -32.93830490112305, "global_step": 27612, "epoch": 228} {"train_loss": -32.83927536010742, "global_step": 27613, "epoch": 228} {"train_loss": -32.57343673706055, "global_step": 27614, "epoch": 228} {"train_loss": -32.345298767089844, "global_step": 27615, "epoch": 228} {"train_loss": -32.310794830322266, "global_step": 27616, "epoch": 228} {"train_loss": -33.29197692871094, "global_step": 27617, "epoch": 228} {"train_loss": -32.7423210144043, "global_step": 27618, "epoch": 228} {"train_loss": -32.06594467163086, "global_step": 27619, "epoch": 228} {"train_loss": -31.780790328979492, "global_step": 27620, "epoch": 228} {"train_loss": -31.240711212158203, "global_step": 27621, "epoch": 228} {"train_loss": -28.325597763061523, "global_step": 27622, "epoch": 228} {"train_loss": -24.838729858398438, "global_step": 27623, "epoch": 228} {"train_loss": -30.29437255859375, "global_step": 27624, "epoch": 228} {"train_loss": -31.582366943359375, "global_step": 27625, "epoch": 228} {"train_loss": -29.097412109375, "global_step": 27626, "epoch": 228} {"train_loss": -26.976978302001953, "global_step": 27627, "epoch": 228} {"train_loss": -23.4717960357666, "global_step": 27628, "epoch": 228} {"train_loss": -21.280704498291016, "global_step": 27629, "epoch": 228} {"train_loss": -29.73068618774414, "global_step": 27630, "epoch": 228} {"train_loss": -22.944381713867188, "global_step": 27631, "epoch": 228} {"train_loss": -28.810535430908203, "global_step": 27632, "epoch": 228} {"train_loss": -23.571496963500977, "global_step": 27633, "epoch": 228} {"train_loss": -27.4438533782959, "global_step": 27634, "epoch": 228} {"train_loss": -27.35038185119629, "global_step": 27635, "epoch": 228} {"train_loss": -25.525781631469727, "global_step": 27636, "epoch": 228} {"train_loss": -29.484785079956055, "global_step": 27637, "epoch": 228} {"train_loss": -28.967920303344727, "global_step": 27638, "epoch": 228} {"train_loss": -27.69623374938965, "global_step": 27639, "epoch": 228} {"train_loss": -30.08222007751465, "global_step": 27640, "epoch": 228} {"train_loss": -30.382709503173828, "global_step": 27641, "epoch": 228} {"train_loss": -29.4335880279541, "global_step": 27642, "epoch": 228} {"train_loss": -29.47747802734375, "global_step": 27643, "epoch": 228} {"train_loss": -30.1533145904541, "global_step": 27644, "epoch": 228} {"train_loss": -30.763471603393555, "global_step": 27645, "epoch": 228} {"train_loss": -29.62322998046875, "global_step": 27646, "epoch": 228} {"train_loss": -30.46976089477539, "global_step": 27647, "epoch": 228} {"train_loss": -30.001367568969727, "global_step": 27648, "epoch": 228} {"train_loss": -31.090534210205078, "global_step": 27649, "epoch": 228} {"train_loss": -30.943389892578125, "global_step": 27650, "epoch": 228} {"train_loss": -30.324487686157227, "global_step": 27651, "epoch": 228} {"train_loss": -31.031030654907227, "global_step": 27652, "epoch": 228} {"train_loss": -30.6716365814209, "global_step": 27653, "epoch": 228} {"train_loss": -30.76873779296875, "global_step": 27654, "epoch": 228} {"train_loss": -31.28890037536621, "global_step": 27655, "epoch": 228} {"train_loss": -31.093286514282227, "global_step": 27656, "epoch": 228} {"train_loss": -31.262052536010742, "global_step": 27657, "epoch": 228} {"train_loss": -31.498031616210938, "global_step": 27658, "epoch": 228} {"train_loss": -30.854970932006836, "global_step": 27659, "epoch": 228} {"train_loss": -31.75703239440918, "global_step": 27660, "epoch": 228} {"train_loss": -31.55073356628418, "global_step": 27661, "epoch": 228} {"train_loss": -31.277973175048828, "global_step": 27662, "epoch": 228} {"train_loss": -31.4664249420166, "global_step": 27663, "epoch": 228} {"train_loss": -31.447132110595703, "global_step": 27664, "epoch": 228} {"train_loss": -31.842350006103516, "global_step": 27665, "epoch": 228} {"train_loss": -31.58357048034668, "global_step": 27666, "epoch": 228} {"train_loss": -31.83331871032715, "global_step": 27667, "epoch": 228} {"train_loss": -31.92947769165039, "global_step": 27668, "epoch": 228} {"train_loss": -31.915618896484375, "global_step": 27669, "epoch": 228} {"train_loss": -31.724401473999023, "global_step": 27670, "epoch": 228} {"train_loss": -32.09010314941406, "global_step": 27671, "epoch": 228} {"train_loss": -32.201271057128906, "global_step": 27672, "epoch": 228} {"train_loss": -32.0861701965332, "global_step": 27673, "epoch": 228} {"train_loss": -32.12459182739258, "global_step": 27674, "epoch": 228} {"train_loss": -32.28911209106445, "global_step": 27675, "epoch": 228} {"train_loss": -32.0970573425293, "global_step": 27676, "epoch": 228} {"train_loss": -31.825590133666992, "global_step": 27677, "epoch": 228} {"train_loss": -32.02877426147461, "global_step": 27678, "epoch": 228} {"train_loss": -31.890396118164062, "global_step": 27679, "epoch": 228} {"train_loss": -31.47767448425293, "global_step": 27680, "epoch": 228} {"train_loss": -32.054115295410156, "global_step": 27681, "epoch": 228} {"train_loss": -31.455963134765625, "global_step": 27682, "epoch": 228} {"train_loss": -31.568384170532227, "global_step": 27683, "epoch": 228} {"train_loss": -31.241270065307617, "global_step": 27684, "epoch": 228} {"train_loss": -30.84914207458496, "global_step": 27685, "epoch": 228} {"train_loss": -32.018707275390625, "global_step": 27686, "epoch": 228} {"train_loss": -30.69132423400879, "global_step": 27687, "epoch": 228} {"train_loss": -31.50287437438965, "global_step": 27688, "epoch": 228} {"train_loss": -31.707855224609375, "global_step": 27689, "epoch": 228} {"train_loss": -31.253660202026367, "global_step": 27690, "epoch": 228} {"train_loss": -30.603347778320312, "global_step": 27691, "epoch": 228} {"train_loss": -30.545557022094727, "global_step": 27692, "epoch": 228} {"train_loss": -31.773908615112305, "global_step": 27693, "epoch": 228} {"train_loss": -31.161474227905273, "global_step": 27694, "epoch": 228} {"train_loss": -31.286365509033203, "global_step": 27695, "epoch": 228} {"train_loss": -31.509525299072266, "global_step": 27696, "epoch": 228} {"train_loss": -31.734521865844727, "global_step": 27697, "epoch": 228} {"train_loss": -31.75031089782715, "global_step": 27698, "epoch": 228} {"train_loss": -31.343048095703125, "global_step": 27699, "epoch": 228} {"train_loss": -32.0307731628418, "global_step": 27700, "epoch": 228} {"train_loss": -31.562292098999023, "global_step": 27701, "epoch": 228} {"train_loss": -31.55531120300293, "global_step": 27702, "epoch": 228} {"train_loss": -31.15372657775879, "global_step": 27703, "epoch": 228} {"train_loss": -31.43463134765625, "global_step": 27704, "epoch": 228} {"train_loss": -31.18617057800293, "global_step": 27705, "epoch": 228} {"train_loss": -31.70380973815918, "global_step": 27706, "epoch": 228} {"train_loss": -31.559736251831055, "global_step": 27707, "epoch": 228} {"train_loss": -30.950491124933418, "global_step": 27708, "epoch": 228, "val_loss": 2572442.0} {"train_loss": -31.4986515045166, "global_step": 27709, "epoch": 229} {"train_loss": -31.80695152282715, "global_step": 27710, "epoch": 229} {"train_loss": -30.954120635986328, "global_step": 27711, "epoch": 229} {"train_loss": -30.652179718017578, "global_step": 27712, "epoch": 229} {"train_loss": -30.453458786010742, "global_step": 27713, "epoch": 229} {"train_loss": -28.701419830322266, "global_step": 27714, "epoch": 229} {"train_loss": -27.181507110595703, "global_step": 27715, "epoch": 229} {"train_loss": -26.170324325561523, "global_step": 27716, "epoch": 229} {"train_loss": -24.75446128845215, "global_step": 27717, "epoch": 229} {"train_loss": -29.9910831451416, "global_step": 27718, "epoch": 229} {"train_loss": -31.643430709838867, "global_step": 27719, "epoch": 229} {"train_loss": -29.39227867126465, "global_step": 27720, "epoch": 229} {"train_loss": -30.4904842376709, "global_step": 27721, "epoch": 229} {"train_loss": -31.76932144165039, "global_step": 27722, "epoch": 229} {"train_loss": -30.35342788696289, "global_step": 27723, "epoch": 229} {"train_loss": -32.050697326660156, "global_step": 27724, "epoch": 229} {"train_loss": -31.531177520751953, "global_step": 27725, "epoch": 229} {"train_loss": -31.867578506469727, "global_step": 27726, "epoch": 229} {"train_loss": -31.176420211791992, "global_step": 27727, "epoch": 229} {"train_loss": -31.9538516998291, "global_step": 27728, "epoch": 229} {"train_loss": -31.90778160095215, "global_step": 27729, "epoch": 229} {"train_loss": -31.61720085144043, "global_step": 27730, "epoch": 229} {"train_loss": -31.060443878173828, "global_step": 27731, "epoch": 229} {"train_loss": -32.3310432434082, "global_step": 27732, "epoch": 229} {"train_loss": -32.21320724487305, "global_step": 27733, "epoch": 229} {"train_loss": -31.79047966003418, "global_step": 27734, "epoch": 229} {"train_loss": -31.937057495117188, "global_step": 27735, "epoch": 229} {"train_loss": -32.02218246459961, "global_step": 27736, "epoch": 229} {"train_loss": -31.82032585144043, "global_step": 27737, "epoch": 229} {"train_loss": -32.04119873046875, "global_step": 27738, "epoch": 229} {"train_loss": -32.10006332397461, "global_step": 27739, "epoch": 229} {"train_loss": -32.1282844543457, "global_step": 27740, "epoch": 229} {"train_loss": -31.935504913330078, "global_step": 27741, "epoch": 229} {"train_loss": -32.122554779052734, "global_step": 27742, "epoch": 229} {"train_loss": -32.57044982910156, "global_step": 27743, "epoch": 229} {"train_loss": -31.1436824798584, "global_step": 27744, "epoch": 229} {"train_loss": -31.532318115234375, "global_step": 27745, "epoch": 229} {"train_loss": -32.5224609375, "global_step": 27746, "epoch": 229} {"train_loss": -31.601364135742188, "global_step": 27747, "epoch": 229} {"train_loss": -32.00055694580078, "global_step": 27748, "epoch": 229} {"train_loss": -31.59158706665039, "global_step": 27749, "epoch": 229} {"train_loss": -31.876989364624023, "global_step": 27750, "epoch": 229} {"train_loss": -31.908649444580078, "global_step": 27751, "epoch": 229} {"train_loss": -31.366422653198242, "global_step": 27752, "epoch": 229} {"train_loss": -29.8461856842041, "global_step": 27753, "epoch": 229} {"train_loss": -31.2985897064209, "global_step": 27754, "epoch": 229} {"train_loss": -29.626728057861328, "global_step": 27755, "epoch": 229} {"train_loss": -28.91641616821289, "global_step": 27756, "epoch": 229} {"train_loss": -29.04483413696289, "global_step": 27757, "epoch": 229} {"train_loss": -28.41266441345215, "global_step": 27758, "epoch": 229} {"train_loss": -27.4830265045166, "global_step": 27759, "epoch": 229} {"train_loss": -31.162967681884766, "global_step": 27760, "epoch": 229} {"train_loss": -28.827123641967773, "global_step": 27761, "epoch": 229} {"train_loss": -28.283985137939453, "global_step": 27762, "epoch": 229} {"train_loss": -30.977970123291016, "global_step": 27763, "epoch": 229} {"train_loss": -30.97665786743164, "global_step": 27764, "epoch": 229} {"train_loss": -31.241622924804688, "global_step": 27765, "epoch": 229} {"train_loss": -30.631561279296875, "global_step": 27766, "epoch": 229} {"train_loss": -31.087299346923828, "global_step": 27767, "epoch": 229} {"train_loss": -31.67732048034668, "global_step": 27768, "epoch": 229} {"train_loss": -31.06818962097168, "global_step": 27769, "epoch": 229} {"train_loss": -30.89542579650879, "global_step": 27770, "epoch": 229} {"train_loss": -32.113887786865234, "global_step": 27771, "epoch": 229} {"train_loss": -31.437952041625977, "global_step": 27772, "epoch": 229} {"train_loss": -32.06571960449219, "global_step": 27773, "epoch": 229} {"train_loss": -31.52033042907715, "global_step": 27774, "epoch": 229} {"train_loss": -31.87916374206543, "global_step": 27775, "epoch": 229} {"train_loss": -31.3924617767334, "global_step": 27776, "epoch": 229} {"train_loss": -31.5266170501709, "global_step": 27777, "epoch": 229} {"train_loss": -32.035152435302734, "global_step": 27778, "epoch": 229} {"train_loss": -31.950977325439453, "global_step": 27779, "epoch": 229} {"train_loss": -31.614395141601562, "global_step": 27780, "epoch": 229} {"train_loss": -32.202613830566406, "global_step": 27781, "epoch": 229} {"train_loss": -32.007110595703125, "global_step": 27782, "epoch": 229} {"train_loss": -31.804718017578125, "global_step": 27783, "epoch": 229} {"train_loss": -32.22608184814453, "global_step": 27784, "epoch": 229} {"train_loss": -31.688373565673828, "global_step": 27785, "epoch": 229} {"train_loss": -32.17426681518555, "global_step": 27786, "epoch": 229} {"train_loss": -32.06571578979492, "global_step": 27787, "epoch": 229} {"train_loss": -32.27033233642578, "global_step": 27788, "epoch": 229} {"train_loss": -32.187767028808594, "global_step": 27789, "epoch": 229} {"train_loss": -32.236541748046875, "global_step": 27790, "epoch": 229} {"train_loss": -32.344871520996094, "global_step": 27791, "epoch": 229} {"train_loss": -32.31081771850586, "global_step": 27792, "epoch": 229} {"train_loss": -32.124656677246094, "global_step": 27793, "epoch": 229} {"train_loss": -30.513782501220703, "global_step": 27794, "epoch": 229} {"train_loss": -29.072830200195312, "global_step": 27795, "epoch": 229} {"train_loss": -26.623594284057617, "global_step": 27796, "epoch": 229} {"train_loss": -21.35896110534668, "global_step": 27797, "epoch": 229} {"train_loss": -31.440479278564453, "global_step": 27798, "epoch": 229} {"train_loss": -25.991613388061523, "global_step": 27799, "epoch": 229} {"train_loss": -30.99732780456543, "global_step": 27800, "epoch": 229} {"train_loss": -28.77540397644043, "global_step": 27801, "epoch": 229} {"train_loss": -30.222248077392578, "global_step": 27802, "epoch": 229} {"train_loss": -29.69775390625, "global_step": 27803, "epoch": 229} {"train_loss": -30.78716468811035, "global_step": 27804, "epoch": 229} {"train_loss": -29.563892364501953, "global_step": 27805, "epoch": 229} {"train_loss": -30.873144149780273, "global_step": 27806, "epoch": 229} {"train_loss": -30.272947311401367, "global_step": 27807, "epoch": 229} {"train_loss": -30.247314453125, "global_step": 27808, "epoch": 229} {"train_loss": -30.99354362487793, "global_step": 27809, "epoch": 229} {"train_loss": -30.663206100463867, "global_step": 27810, "epoch": 229} {"train_loss": -29.78948402404785, "global_step": 27811, "epoch": 229} {"train_loss": -31.405332565307617, "global_step": 27812, "epoch": 229} {"train_loss": -30.40192222595215, "global_step": 27813, "epoch": 229} {"train_loss": -29.800817489624023, "global_step": 27814, "epoch": 229} {"train_loss": -31.522613525390625, "global_step": 27815, "epoch": 229} {"train_loss": -30.70283317565918, "global_step": 27816, "epoch": 229} {"train_loss": -30.325708389282227, "global_step": 27817, "epoch": 229} {"train_loss": -30.52753257751465, "global_step": 27818, "epoch": 229} {"train_loss": -31.387372970581055, "global_step": 27819, "epoch": 229} {"train_loss": -30.802488327026367, "global_step": 27820, "epoch": 229} {"train_loss": -31.12345314025879, "global_step": 27821, "epoch": 229} {"train_loss": -30.812488555908203, "global_step": 27822, "epoch": 229} {"train_loss": -31.8155517578125, "global_step": 27823, "epoch": 229} {"train_loss": -31.147459030151367, "global_step": 27824, "epoch": 229} {"train_loss": -31.41949462890625, "global_step": 27825, "epoch": 229} {"train_loss": -31.468536376953125, "global_step": 27826, "epoch": 229} {"train_loss": -31.4838809967041, "global_step": 27827, "epoch": 229} {"train_loss": -31.5233154296875, "global_step": 27828, "epoch": 229} {"train_loss": -30.85187100181895, "global_step": 27829, "epoch": 229, "val_loss": 2369192.25} {"train_loss": -31.6014404296875, "global_step": 27830, "epoch": 230} {"train_loss": -31.481287002563477, "global_step": 27831, "epoch": 230} {"train_loss": -31.78765869140625, "global_step": 27832, "epoch": 230} {"train_loss": -31.69498062133789, "global_step": 27833, "epoch": 230} {"train_loss": -31.9875545501709, "global_step": 27834, "epoch": 230} {"train_loss": -31.887475967407227, "global_step": 27835, "epoch": 230} {"train_loss": -31.693822860717773, "global_step": 27836, "epoch": 230} {"train_loss": -32.09212875366211, "global_step": 27837, "epoch": 230} {"train_loss": -31.8072566986084, "global_step": 27838, "epoch": 230} {"train_loss": -31.727941513061523, "global_step": 27839, "epoch": 230} {"train_loss": -30.173187255859375, "global_step": 27840, "epoch": 230} {"train_loss": -31.43477439880371, "global_step": 27841, "epoch": 230} {"train_loss": -32.57596969604492, "global_step": 27842, "epoch": 230} {"train_loss": -31.385635375976562, "global_step": 27843, "epoch": 230} {"train_loss": -31.513425827026367, "global_step": 27844, "epoch": 230} {"train_loss": -31.7283992767334, "global_step": 27845, "epoch": 230} {"train_loss": -32.3167839050293, "global_step": 27846, "epoch": 230} {"train_loss": -31.01019287109375, "global_step": 27847, "epoch": 230} {"train_loss": -31.207550048828125, "global_step": 27848, "epoch": 230} {"train_loss": -30.249658584594727, "global_step": 27849, "epoch": 230} {"train_loss": -31.29905128479004, "global_step": 27850, "epoch": 230} {"train_loss": -31.00581169128418, "global_step": 27851, "epoch": 230} {"train_loss": -31.822072982788086, "global_step": 27852, "epoch": 230} {"train_loss": -31.251087188720703, "global_step": 27853, "epoch": 230} {"train_loss": -30.41053581237793, "global_step": 27854, "epoch": 230} {"train_loss": -30.74567985534668, "global_step": 27855, "epoch": 230} {"train_loss": -30.37664794921875, "global_step": 27856, "epoch": 230} {"train_loss": -29.117963790893555, "global_step": 27857, "epoch": 230} {"train_loss": -30.566349029541016, "global_step": 27858, "epoch": 230} {"train_loss": -29.800832748413086, "global_step": 27859, "epoch": 230} {"train_loss": -28.860721588134766, "global_step": 27860, "epoch": 230} {"train_loss": -27.631391525268555, "global_step": 27861, "epoch": 230} {"train_loss": -26.614212036132812, "global_step": 27862, "epoch": 230} {"train_loss": -29.072858810424805, "global_step": 27863, "epoch": 230} {"train_loss": -31.05120277404785, "global_step": 27864, "epoch": 230} {"train_loss": -30.555383682250977, "global_step": 27865, "epoch": 230} {"train_loss": -29.324405670166016, "global_step": 27866, "epoch": 230} {"train_loss": -30.847843170166016, "global_step": 27867, "epoch": 230} {"train_loss": -31.302701950073242, "global_step": 27868, "epoch": 230} {"train_loss": -30.41765785217285, "global_step": 27869, "epoch": 230} {"train_loss": -31.790266036987305, "global_step": 27870, "epoch": 230} {"train_loss": -31.62238121032715, "global_step": 27871, "epoch": 230} {"train_loss": -30.781217575073242, "global_step": 27872, "epoch": 230} {"train_loss": -32.24733352661133, "global_step": 27873, "epoch": 230} {"train_loss": -30.14545249938965, "global_step": 27874, "epoch": 230} {"train_loss": -31.679431915283203, "global_step": 27875, "epoch": 230} {"train_loss": -31.031909942626953, "global_step": 27876, "epoch": 230} {"train_loss": -31.536590576171875, "global_step": 27877, "epoch": 230} {"train_loss": -31.002307891845703, "global_step": 27878, "epoch": 230} {"train_loss": -31.31671714782715, "global_step": 27879, "epoch": 230} {"train_loss": -30.99903678894043, "global_step": 27880, "epoch": 230} {"train_loss": -31.3375301361084, "global_step": 27881, "epoch": 230} {"train_loss": -31.040130615234375, "global_step": 27882, "epoch": 230} {"train_loss": -31.3798828125, "global_step": 27883, "epoch": 230} {"train_loss": -31.344518661499023, "global_step": 27884, "epoch": 230} {"train_loss": -31.790164947509766, "global_step": 27885, "epoch": 230} {"train_loss": -31.53248405456543, "global_step": 27886, "epoch": 230} {"train_loss": -31.427387237548828, "global_step": 27887, "epoch": 230} {"train_loss": -31.928836822509766, "global_step": 27888, "epoch": 230} {"train_loss": -31.986621856689453, "global_step": 27889, "epoch": 230} {"train_loss": -31.564727783203125, "global_step": 27890, "epoch": 230} {"train_loss": -32.106815338134766, "global_step": 27891, "epoch": 230} {"train_loss": -31.94144058227539, "global_step": 27892, "epoch": 230} {"train_loss": -31.686050415039062, "global_step": 27893, "epoch": 230} {"train_loss": -31.977863311767578, "global_step": 27894, "epoch": 230} {"train_loss": -31.420392990112305, "global_step": 27895, "epoch": 230} {"train_loss": -31.61299705505371, "global_step": 27896, "epoch": 230} {"train_loss": -31.518177032470703, "global_step": 27897, "epoch": 230} {"train_loss": -31.918954849243164, "global_step": 27898, "epoch": 230} {"train_loss": -32.18858337402344, "global_step": 27899, "epoch": 230} {"train_loss": -31.553442001342773, "global_step": 27900, "epoch": 230} {"train_loss": -31.610639572143555, "global_step": 27901, "epoch": 230} {"train_loss": -31.686975479125977, "global_step": 27902, "epoch": 230} {"train_loss": -32.154911041259766, "global_step": 27903, "epoch": 230} {"train_loss": -32.153778076171875, "global_step": 27904, "epoch": 230} {"train_loss": -32.04301834106445, "global_step": 27905, "epoch": 230} {"train_loss": -32.14232635498047, "global_step": 27906, "epoch": 230} {"train_loss": -32.200016021728516, "global_step": 27907, "epoch": 230} {"train_loss": -32.46786117553711, "global_step": 27908, "epoch": 230} {"train_loss": -32.00319290161133, "global_step": 27909, "epoch": 230} {"train_loss": -32.46833038330078, "global_step": 27910, "epoch": 230} {"train_loss": -32.288307189941406, "global_step": 27911, "epoch": 230} {"train_loss": -32.620906829833984, "global_step": 27912, "epoch": 230} {"train_loss": -31.54143714904785, "global_step": 27913, "epoch": 230} {"train_loss": -32.136146545410156, "global_step": 27914, "epoch": 230} {"train_loss": -32.04759216308594, "global_step": 27915, "epoch": 230} {"train_loss": -32.2252082824707, "global_step": 27916, "epoch": 230} {"train_loss": -32.02126693725586, "global_step": 27917, "epoch": 230} {"train_loss": -32.20051574707031, "global_step": 27918, "epoch": 230} {"train_loss": -32.084712982177734, "global_step": 27919, "epoch": 230} {"train_loss": -32.634124755859375, "global_step": 27920, "epoch": 230} {"train_loss": -31.995187759399414, "global_step": 27921, "epoch": 230} {"train_loss": -32.35451126098633, "global_step": 27922, "epoch": 230} {"train_loss": -32.095802307128906, "global_step": 27923, "epoch": 230} {"train_loss": -32.720375061035156, "global_step": 27924, "epoch": 230} {"train_loss": -32.79254913330078, "global_step": 27925, "epoch": 230} {"train_loss": -32.330806732177734, "global_step": 27926, "epoch": 230} {"train_loss": -32.61982727050781, "global_step": 27927, "epoch": 230} {"train_loss": -32.52680206298828, "global_step": 27928, "epoch": 230} {"train_loss": -32.778472900390625, "global_step": 27929, "epoch": 230} {"train_loss": -32.665157318115234, "global_step": 27930, "epoch": 230} {"train_loss": -32.2369384765625, "global_step": 27931, "epoch": 230} {"train_loss": -32.6643180847168, "global_step": 27932, "epoch": 230} {"train_loss": -32.9364128112793, "global_step": 27933, "epoch": 230} {"train_loss": -32.710628509521484, "global_step": 27934, "epoch": 230} {"train_loss": -32.59290313720703, "global_step": 27935, "epoch": 230} {"train_loss": -32.62446212768555, "global_step": 27936, "epoch": 230} {"train_loss": -32.65076446533203, "global_step": 27937, "epoch": 230} {"train_loss": -33.24201965332031, "global_step": 27938, "epoch": 230} {"train_loss": -32.6106071472168, "global_step": 27939, "epoch": 230} {"train_loss": -32.699764251708984, "global_step": 27940, "epoch": 230} {"train_loss": -32.325775146484375, "global_step": 27941, "epoch": 230} {"train_loss": -31.530948638916016, "global_step": 27942, "epoch": 230} {"train_loss": -32.36073303222656, "global_step": 27943, "epoch": 230} {"train_loss": -32.17403793334961, "global_step": 27944, "epoch": 230} {"train_loss": -32.28180694580078, "global_step": 27945, "epoch": 230} {"train_loss": -32.191070556640625, "global_step": 27946, "epoch": 230} {"train_loss": -32.227394104003906, "global_step": 27947, "epoch": 230} {"train_loss": -32.894020080566406, "global_step": 27948, "epoch": 230} {"train_loss": -32.73060989379883, "global_step": 27949, "epoch": 230} {"train_loss": -31.637274860350555, "global_step": 27950, "epoch": 230, "val_loss": 2506531.75} {"train_loss": -31.802265167236328, "global_step": 27951, "epoch": 231} {"train_loss": -31.613122940063477, "global_step": 27952, "epoch": 231} {"train_loss": -31.76656150817871, "global_step": 27953, "epoch": 231} {"train_loss": -30.53653335571289, "global_step": 27954, "epoch": 231} {"train_loss": -30.891590118408203, "global_step": 27955, "epoch": 231} {"train_loss": -32.26327133178711, "global_step": 27956, "epoch": 231} {"train_loss": -32.2399787902832, "global_step": 27957, "epoch": 231} {"train_loss": -31.1940975189209, "global_step": 27958, "epoch": 231} {"train_loss": -30.96278190612793, "global_step": 27959, "epoch": 231} {"train_loss": -32.68506622314453, "global_step": 27960, "epoch": 231} {"train_loss": -31.930891036987305, "global_step": 27961, "epoch": 231} {"train_loss": -30.985504150390625, "global_step": 27962, "epoch": 231} {"train_loss": -31.602069854736328, "global_step": 27963, "epoch": 231} {"train_loss": -31.955066680908203, "global_step": 27964, "epoch": 231} {"train_loss": -29.7554874420166, "global_step": 27965, "epoch": 231} {"train_loss": -27.77178382873535, "global_step": 27966, "epoch": 231} {"train_loss": -22.70993995666504, "global_step": 27967, "epoch": 231} {"train_loss": -31.69007682800293, "global_step": 27968, "epoch": 231} {"train_loss": -26.471548080444336, "global_step": 27969, "epoch": 231} {"train_loss": -23.188156127929688, "global_step": 27970, "epoch": 231} {"train_loss": -26.559118270874023, "global_step": 27971, "epoch": 231} {"train_loss": -22.207351684570312, "global_step": 27972, "epoch": 231} {"train_loss": -20.21640968322754, "global_step": 27973, "epoch": 231} {"train_loss": -20.164438247680664, "global_step": 27974, "epoch": 231} {"train_loss": -21.181049346923828, "global_step": 27975, "epoch": 231} {"train_loss": -27.53562355041504, "global_step": 27976, "epoch": 231} {"train_loss": -24.357961654663086, "global_step": 27977, "epoch": 231} {"train_loss": -22.644147872924805, "global_step": 27978, "epoch": 231} {"train_loss": -23.956933975219727, "global_step": 27979, "epoch": 231} {"train_loss": -22.319005966186523, "global_step": 27980, "epoch": 231} {"train_loss": -26.54518699645996, "global_step": 27981, "epoch": 231} {"train_loss": -28.476415634155273, "global_step": 27982, "epoch": 231} {"train_loss": -27.23200798034668, "global_step": 27983, "epoch": 231} {"train_loss": -25.378812789916992, "global_step": 27984, "epoch": 231} {"train_loss": -25.25261878967285, "global_step": 27985, "epoch": 231} {"train_loss": -27.778518676757812, "global_step": 27986, "epoch": 231} {"train_loss": -29.1937198638916, "global_step": 27987, "epoch": 231} {"train_loss": -30.044769287109375, "global_step": 27988, "epoch": 231} {"train_loss": -29.220417022705078, "global_step": 27989, "epoch": 231} {"train_loss": -28.5782413482666, "global_step": 27990, "epoch": 231} {"train_loss": -29.65860366821289, "global_step": 27991, "epoch": 231} {"train_loss": -30.568710327148438, "global_step": 27992, "epoch": 231} {"train_loss": -30.73261070251465, "global_step": 27993, "epoch": 231} {"train_loss": -30.770349502563477, "global_step": 27994, "epoch": 231} {"train_loss": -30.6029052734375, "global_step": 27995, "epoch": 231} {"train_loss": -30.546354293823242, "global_step": 27996, "epoch": 231} {"train_loss": -30.635480880737305, "global_step": 27997, "epoch": 231} {"train_loss": -30.991247177124023, "global_step": 27998, "epoch": 231} {"train_loss": -30.990942001342773, "global_step": 27999, "epoch": 231} {"train_loss": -31.139297485351562, "global_step": 28000, "epoch": 231} {"train_loss": -31.710290908813477, "global_step": 28001, "epoch": 231} {"train_loss": -31.052091598510742, "global_step": 28002, "epoch": 231} {"train_loss": -31.57722282409668, "global_step": 28003, "epoch": 231} {"train_loss": -31.184335708618164, "global_step": 28004, "epoch": 231} {"train_loss": -31.513620376586914, "global_step": 28005, "epoch": 231} {"train_loss": -31.485204696655273, "global_step": 28006, "epoch": 231} {"train_loss": -31.251224517822266, "global_step": 28007, "epoch": 231} {"train_loss": -31.626134872436523, "global_step": 28008, "epoch": 231} {"train_loss": -31.48761558532715, "global_step": 28009, "epoch": 231} {"train_loss": -31.836963653564453, "global_step": 28010, "epoch": 231} {"train_loss": -31.983434677124023, "global_step": 28011, "epoch": 231} {"train_loss": -31.913251876831055, "global_step": 28012, "epoch": 231} {"train_loss": -31.885847091674805, "global_step": 28013, "epoch": 231} {"train_loss": -31.442548751831055, "global_step": 28014, "epoch": 231} {"train_loss": -31.907379150390625, "global_step": 28015, "epoch": 231} {"train_loss": -31.440967559814453, "global_step": 28016, "epoch": 231} {"train_loss": -31.805707931518555, "global_step": 28017, "epoch": 231} {"train_loss": -31.859180450439453, "global_step": 28018, "epoch": 231} {"train_loss": -31.90354347229004, "global_step": 28019, "epoch": 231} {"train_loss": -31.86628532409668, "global_step": 28020, "epoch": 231} {"train_loss": -32.23938751220703, "global_step": 28021, "epoch": 231} {"train_loss": -32.41264724731445, "global_step": 28022, "epoch": 231} {"train_loss": -31.819578170776367, "global_step": 28023, "epoch": 231} {"train_loss": -32.019527435302734, "global_step": 28024, "epoch": 231} {"train_loss": -31.520742416381836, "global_step": 28025, "epoch": 231} {"train_loss": -31.513721466064453, "global_step": 28026, "epoch": 231} {"train_loss": -30.780176162719727, "global_step": 28027, "epoch": 231} {"train_loss": -29.873022079467773, "global_step": 28028, "epoch": 231} {"train_loss": -28.846662521362305, "global_step": 28029, "epoch": 231} {"train_loss": -26.7407283782959, "global_step": 28030, "epoch": 231} {"train_loss": -24.301284790039062, "global_step": 28031, "epoch": 231} {"train_loss": -22.653173446655273, "global_step": 28032, "epoch": 231} {"train_loss": -29.91328239440918, "global_step": 28033, "epoch": 231} {"train_loss": -24.006601333618164, "global_step": 28034, "epoch": 231} {"train_loss": -20.950958251953125, "global_step": 28035, "epoch": 231} {"train_loss": -30.400165557861328, "global_step": 28036, "epoch": 231} {"train_loss": -26.5534610748291, "global_step": 28037, "epoch": 231} {"train_loss": -28.391706466674805, "global_step": 28038, "epoch": 231} {"train_loss": -28.58930778503418, "global_step": 28039, "epoch": 231} {"train_loss": -26.79014015197754, "global_step": 28040, "epoch": 231} {"train_loss": -30.3719482421875, "global_step": 28041, "epoch": 231} {"train_loss": -28.2673282623291, "global_step": 28042, "epoch": 231} {"train_loss": -29.469690322875977, "global_step": 28043, "epoch": 231} {"train_loss": -30.6600341796875, "global_step": 28044, "epoch": 231} {"train_loss": -28.859527587890625, "global_step": 28045, "epoch": 231} {"train_loss": -29.97124671936035, "global_step": 28046, "epoch": 231} {"train_loss": -31.232690811157227, "global_step": 28047, "epoch": 231} {"train_loss": -30.220136642456055, "global_step": 28048, "epoch": 231} {"train_loss": -29.178247451782227, "global_step": 28049, "epoch": 231} {"train_loss": -30.510107040405273, "global_step": 28050, "epoch": 231} {"train_loss": -30.89528465270996, "global_step": 28051, "epoch": 231} {"train_loss": -30.8949031829834, "global_step": 28052, "epoch": 231} {"train_loss": -30.516050338745117, "global_step": 28053, "epoch": 231} {"train_loss": -30.618682861328125, "global_step": 28054, "epoch": 231} {"train_loss": -30.801549911499023, "global_step": 28055, "epoch": 231} {"train_loss": -31.25745964050293, "global_step": 28056, "epoch": 231} {"train_loss": -30.927030563354492, "global_step": 28057, "epoch": 231} {"train_loss": -31.088953018188477, "global_step": 28058, "epoch": 231} {"train_loss": -30.827533721923828, "global_step": 28059, "epoch": 231} {"train_loss": -31.138635635375977, "global_step": 28060, "epoch": 231} {"train_loss": -31.598316192626953, "global_step": 28061, "epoch": 231} {"train_loss": -31.124420166015625, "global_step": 28062, "epoch": 231} {"train_loss": -31.014257431030273, "global_step": 28063, "epoch": 231} {"train_loss": -31.363073348999023, "global_step": 28064, "epoch": 231} {"train_loss": -31.34061050415039, "global_step": 28065, "epoch": 231} {"train_loss": -31.180866241455078, "global_step": 28066, "epoch": 231} {"train_loss": -30.906818389892578, "global_step": 28067, "epoch": 231} {"train_loss": -31.56671714782715, "global_step": 28068, "epoch": 231} {"train_loss": -31.74310874938965, "global_step": 28069, "epoch": 231} {"train_loss": -31.580053329467773, "global_step": 28070, "epoch": 231} {"train_loss": -29.544806346420415, "global_step": 28071, "epoch": 231, "val_loss": 2476722.25} {"train_loss": -31.790830612182617, "global_step": 28072, "epoch": 232} {"train_loss": -31.6116886138916, "global_step": 28073, "epoch": 232} {"train_loss": -31.716583251953125, "global_step": 28074, "epoch": 232} {"train_loss": -31.583194732666016, "global_step": 28075, "epoch": 232} {"train_loss": -32.092918395996094, "global_step": 28076, "epoch": 232} {"train_loss": -32.07504653930664, "global_step": 28077, "epoch": 232} {"train_loss": -32.04289627075195, "global_step": 28078, "epoch": 232} {"train_loss": -31.396316528320312, "global_step": 28079, "epoch": 232} {"train_loss": -31.225622177124023, "global_step": 28080, "epoch": 232} {"train_loss": -29.976789474487305, "global_step": 28081, "epoch": 232} {"train_loss": -26.590076446533203, "global_step": 28082, "epoch": 232} {"train_loss": -17.969648361206055, "global_step": 28083, "epoch": 232} {"train_loss": -13.71994686126709, "global_step": 28084, "epoch": 232} {"train_loss": -31.060745239257812, "global_step": 28085, "epoch": 232} {"train_loss": -19.309865951538086, "global_step": 28086, "epoch": 232} {"train_loss": -21.873098373413086, "global_step": 28087, "epoch": 232} {"train_loss": -23.750526428222656, "global_step": 28088, "epoch": 232} {"train_loss": -22.281829833984375, "global_step": 28089, "epoch": 232} {"train_loss": -30.656896591186523, "global_step": 28090, "epoch": 232} {"train_loss": -24.71027946472168, "global_step": 28091, "epoch": 232} {"train_loss": -26.77557373046875, "global_step": 28092, "epoch": 232} {"train_loss": -30.324079513549805, "global_step": 28093, "epoch": 232} {"train_loss": -29.690637588500977, "global_step": 28094, "epoch": 232} {"train_loss": -28.101343154907227, "global_step": 28095, "epoch": 232} {"train_loss": -28.6204833984375, "global_step": 28096, "epoch": 232} {"train_loss": -29.93988037109375, "global_step": 28097, "epoch": 232} {"train_loss": -30.443424224853516, "global_step": 28098, "epoch": 232} {"train_loss": -30.037134170532227, "global_step": 28099, "epoch": 232} {"train_loss": -29.724002838134766, "global_step": 28100, "epoch": 232} {"train_loss": -29.6069393157959, "global_step": 28101, "epoch": 232} {"train_loss": -29.6092586517334, "global_step": 28102, "epoch": 232} {"train_loss": -30.193052291870117, "global_step": 28103, "epoch": 232} {"train_loss": -30.40751075744629, "global_step": 28104, "epoch": 232} {"train_loss": -30.796072006225586, "global_step": 28105, "epoch": 232} {"train_loss": -30.469995498657227, "global_step": 28106, "epoch": 232} {"train_loss": -29.954320907592773, "global_step": 28107, "epoch": 232} {"train_loss": -29.982059478759766, "global_step": 28108, "epoch": 232} {"train_loss": -30.654010772705078, "global_step": 28109, "epoch": 232} {"train_loss": -30.730178833007812, "global_step": 28110, "epoch": 232} {"train_loss": -29.960363388061523, "global_step": 28111, "epoch": 232} {"train_loss": -30.72833251953125, "global_step": 28112, "epoch": 232} {"train_loss": -30.878040313720703, "global_step": 28113, "epoch": 232} {"train_loss": -31.027027130126953, "global_step": 28114, "epoch": 232} {"train_loss": -30.913782119750977, "global_step": 28115, "epoch": 232} {"train_loss": -30.59681510925293, "global_step": 28116, "epoch": 232} {"train_loss": -30.9819278717041, "global_step": 28117, "epoch": 232} {"train_loss": -30.299222946166992, "global_step": 28118, "epoch": 232} {"train_loss": -30.54751968383789, "global_step": 28119, "epoch": 232} {"train_loss": -30.0223445892334, "global_step": 28120, "epoch": 232} {"train_loss": -30.00806999206543, "global_step": 28121, "epoch": 232} {"train_loss": -31.045413970947266, "global_step": 28122, "epoch": 232} {"train_loss": -30.287506103515625, "global_step": 28123, "epoch": 232} {"train_loss": -30.898590087890625, "global_step": 28124, "epoch": 232} {"train_loss": -30.85024070739746, "global_step": 28125, "epoch": 232} {"train_loss": -30.623884201049805, "global_step": 28126, "epoch": 232} {"train_loss": -31.232999801635742, "global_step": 28127, "epoch": 232} {"train_loss": -31.169330596923828, "global_step": 28128, "epoch": 232} {"train_loss": -31.38238525390625, "global_step": 28129, "epoch": 232} {"train_loss": -31.352859497070312, "global_step": 28130, "epoch": 232} {"train_loss": -31.015247344970703, "global_step": 28131, "epoch": 232} {"train_loss": -31.191375732421875, "global_step": 28132, "epoch": 232} {"train_loss": -31.222381591796875, "global_step": 28133, "epoch": 232} {"train_loss": -31.278776168823242, "global_step": 28134, "epoch": 232} {"train_loss": -30.6535587310791, "global_step": 28135, "epoch": 232} {"train_loss": -31.766162872314453, "global_step": 28136, "epoch": 232} {"train_loss": -31.322635650634766, "global_step": 28137, "epoch": 232} {"train_loss": -30.744098663330078, "global_step": 28138, "epoch": 232} {"train_loss": -31.621551513671875, "global_step": 28139, "epoch": 232} {"train_loss": -31.23459243774414, "global_step": 28140, "epoch": 232} {"train_loss": -31.360204696655273, "global_step": 28141, "epoch": 232} {"train_loss": -31.2944278717041, "global_step": 28142, "epoch": 232} {"train_loss": -31.152851104736328, "global_step": 28143, "epoch": 232} {"train_loss": -31.615081787109375, "global_step": 28144, "epoch": 232} {"train_loss": -31.70026206970215, "global_step": 28145, "epoch": 232} {"train_loss": -31.23255729675293, "global_step": 28146, "epoch": 232} {"train_loss": -31.717437744140625, "global_step": 28147, "epoch": 232} {"train_loss": -31.56754493713379, "global_step": 28148, "epoch": 232} {"train_loss": -31.112905502319336, "global_step": 28149, "epoch": 232} {"train_loss": -31.91670799255371, "global_step": 28150, "epoch": 232} {"train_loss": -30.65960693359375, "global_step": 28151, "epoch": 232} {"train_loss": -31.309741973876953, "global_step": 28152, "epoch": 232} {"train_loss": -31.476577758789062, "global_step": 28153, "epoch": 232} {"train_loss": -30.31107521057129, "global_step": 28154, "epoch": 232} {"train_loss": -31.018524169921875, "global_step": 28155, "epoch": 232} {"train_loss": -31.088621139526367, "global_step": 28156, "epoch": 232} {"train_loss": -29.5372314453125, "global_step": 28157, "epoch": 232} {"train_loss": -30.003345489501953, "global_step": 28158, "epoch": 232} {"train_loss": -31.261066436767578, "global_step": 28159, "epoch": 232} {"train_loss": -30.3013858795166, "global_step": 28160, "epoch": 232} {"train_loss": -30.794965744018555, "global_step": 28161, "epoch": 232} {"train_loss": -31.455686569213867, "global_step": 28162, "epoch": 232} {"train_loss": -31.232608795166016, "global_step": 28163, "epoch": 232} {"train_loss": -31.47846794128418, "global_step": 28164, "epoch": 232} {"train_loss": -31.099817276000977, "global_step": 28165, "epoch": 232} {"train_loss": -31.45513916015625, "global_step": 28166, "epoch": 232} {"train_loss": -31.074066162109375, "global_step": 28167, "epoch": 232} {"train_loss": -31.08174705505371, "global_step": 28168, "epoch": 232} {"train_loss": -31.555883407592773, "global_step": 28169, "epoch": 232} {"train_loss": -31.642438888549805, "global_step": 28170, "epoch": 232} {"train_loss": -31.5003604888916, "global_step": 28171, "epoch": 232} {"train_loss": -31.49189567565918, "global_step": 28172, "epoch": 232} {"train_loss": -31.608579635620117, "global_step": 28173, "epoch": 232} {"train_loss": -31.575986862182617, "global_step": 28174, "epoch": 232} {"train_loss": -31.388538360595703, "global_step": 28175, "epoch": 232} {"train_loss": -31.431238174438477, "global_step": 28176, "epoch": 232} {"train_loss": -31.939910888671875, "global_step": 28177, "epoch": 232} {"train_loss": -32.08170700073242, "global_step": 28178, "epoch": 232} {"train_loss": -31.974878311157227, "global_step": 28179, "epoch": 232} {"train_loss": -31.680158615112305, "global_step": 28180, "epoch": 232} {"train_loss": -31.564878463745117, "global_step": 28181, "epoch": 232} {"train_loss": -31.806371688842773, "global_step": 28182, "epoch": 232} {"train_loss": -32.292510986328125, "global_step": 28183, "epoch": 232} {"train_loss": -32.30934524536133, "global_step": 28184, "epoch": 232} {"train_loss": -31.8969669342041, "global_step": 28185, "epoch": 232} {"train_loss": -32.26033401489258, "global_step": 28186, "epoch": 232} {"train_loss": -31.762226104736328, "global_step": 28187, "epoch": 232} {"train_loss": -31.966779708862305, "global_step": 28188, "epoch": 232} {"train_loss": -31.901762008666992, "global_step": 28189, "epoch": 232} {"train_loss": -31.68867301940918, "global_step": 28190, "epoch": 232} {"train_loss": -31.953596115112305, "global_step": 28191, "epoch": 232} {"train_loss": -30.36884551402951, "global_step": 28192, "epoch": 232, "val_loss": 2721581.25} {"train_loss": -31.928647994995117, "global_step": 28193, "epoch": 233} {"train_loss": -31.7960147857666, "global_step": 28194, "epoch": 233} {"train_loss": -32.03042221069336, "global_step": 28195, "epoch": 233} {"train_loss": -31.892210006713867, "global_step": 28196, "epoch": 233} {"train_loss": -31.502960205078125, "global_step": 28197, "epoch": 233} {"train_loss": -31.760360717773438, "global_step": 28198, "epoch": 233} {"train_loss": -31.984912872314453, "global_step": 28199, "epoch": 233} {"train_loss": -31.974069595336914, "global_step": 28200, "epoch": 233} {"train_loss": -31.301095962524414, "global_step": 28201, "epoch": 233} {"train_loss": -30.407926559448242, "global_step": 28202, "epoch": 233} {"train_loss": -31.89068603515625, "global_step": 28203, "epoch": 233} {"train_loss": -31.599477767944336, "global_step": 28204, "epoch": 233} {"train_loss": -31.549203872680664, "global_step": 28205, "epoch": 233} {"train_loss": -32.44417953491211, "global_step": 28206, "epoch": 233} {"train_loss": -31.309675216674805, "global_step": 28207, "epoch": 233} {"train_loss": -31.989120483398438, "global_step": 28208, "epoch": 233} {"train_loss": -31.562536239624023, "global_step": 28209, "epoch": 233} {"train_loss": -31.515233993530273, "global_step": 28210, "epoch": 233} {"train_loss": -32.145320892333984, "global_step": 28211, "epoch": 233} {"train_loss": -32.0838508605957, "global_step": 28212, "epoch": 233} {"train_loss": -31.9393253326416, "global_step": 28213, "epoch": 233} {"train_loss": -31.764434814453125, "global_step": 28214, "epoch": 233} {"train_loss": -32.760948181152344, "global_step": 28215, "epoch": 233} {"train_loss": -32.361873626708984, "global_step": 28216, "epoch": 233} {"train_loss": -32.02394104003906, "global_step": 28217, "epoch": 233} {"train_loss": -32.867366790771484, "global_step": 28218, "epoch": 233} {"train_loss": -31.884855270385742, "global_step": 28219, "epoch": 233} {"train_loss": -32.24478530883789, "global_step": 28220, "epoch": 233} {"train_loss": -31.765329360961914, "global_step": 28221, "epoch": 233} {"train_loss": -32.37710189819336, "global_step": 28222, "epoch": 233} {"train_loss": -31.949316024780273, "global_step": 28223, "epoch": 233} {"train_loss": -32.309635162353516, "global_step": 28224, "epoch": 233} {"train_loss": -32.23326110839844, "global_step": 28225, "epoch": 233} {"train_loss": -32.35353469848633, "global_step": 28226, "epoch": 233} {"train_loss": -32.374019622802734, "global_step": 28227, "epoch": 233} {"train_loss": -32.44746017456055, "global_step": 28228, "epoch": 233} {"train_loss": -31.968053817749023, "global_step": 28229, "epoch": 233} {"train_loss": -32.548431396484375, "global_step": 28230, "epoch": 233} {"train_loss": -31.78656005859375, "global_step": 28231, "epoch": 233} {"train_loss": -32.42734146118164, "global_step": 28232, "epoch": 233} {"train_loss": -32.634666442871094, "global_step": 28233, "epoch": 233} {"train_loss": -32.330135345458984, "global_step": 28234, "epoch": 233} {"train_loss": -32.35946273803711, "global_step": 28235, "epoch": 233} {"train_loss": -32.61016845703125, "global_step": 28236, "epoch": 233} {"train_loss": -32.57619857788086, "global_step": 28237, "epoch": 233} {"train_loss": -32.148841857910156, "global_step": 28238, "epoch": 233} {"train_loss": -32.33506393432617, "global_step": 28239, "epoch": 233} {"train_loss": -31.31781005859375, "global_step": 28240, "epoch": 233} {"train_loss": -30.00272560119629, "global_step": 28241, "epoch": 233} {"train_loss": -23.095367431640625, "global_step": 28242, "epoch": 233} {"train_loss": -18.800872802734375, "global_step": 28243, "epoch": 233} {"train_loss": -20.301738739013672, "global_step": 28244, "epoch": 233} {"train_loss": -17.862619400024414, "global_step": 28245, "epoch": 233} {"train_loss": -20.188377380371094, "global_step": 28246, "epoch": 233} {"train_loss": -19.55373191833496, "global_step": 28247, "epoch": 233} {"train_loss": -18.666257858276367, "global_step": 28248, "epoch": 233} {"train_loss": -20.95832633972168, "global_step": 28249, "epoch": 233} {"train_loss": -20.089101791381836, "global_step": 28250, "epoch": 233} {"train_loss": -20.877700805664062, "global_step": 28251, "epoch": 233} {"train_loss": -21.063369750976562, "global_step": 28252, "epoch": 233} {"train_loss": -21.789653778076172, "global_step": 28253, "epoch": 233} {"train_loss": -21.999162673950195, "global_step": 28254, "epoch": 233} {"train_loss": -22.11305809020996, "global_step": 28255, "epoch": 233} {"train_loss": -23.221435546875, "global_step": 28256, "epoch": 233} {"train_loss": -23.864511489868164, "global_step": 28257, "epoch": 233} {"train_loss": -23.03602409362793, "global_step": 28258, "epoch": 233} {"train_loss": -23.556310653686523, "global_step": 28259, "epoch": 233} {"train_loss": -24.368200302124023, "global_step": 28260, "epoch": 233} {"train_loss": -25.055587768554688, "global_step": 28261, "epoch": 233} {"train_loss": -25.685110092163086, "global_step": 28262, "epoch": 233} {"train_loss": -26.015295028686523, "global_step": 28263, "epoch": 233} {"train_loss": -26.586318969726562, "global_step": 28264, "epoch": 233} {"train_loss": -25.75709342956543, "global_step": 28265, "epoch": 233} {"train_loss": -22.01552391052246, "global_step": 28266, "epoch": 233} {"train_loss": -17.635665893554688, "global_step": 28267, "epoch": 233} {"train_loss": -26.194372177124023, "global_step": 28268, "epoch": 233} {"train_loss": -24.149106979370117, "global_step": 28269, "epoch": 233} {"train_loss": -24.881717681884766, "global_step": 28270, "epoch": 233} {"train_loss": -26.40030860900879, "global_step": 28271, "epoch": 233} {"train_loss": -26.600738525390625, "global_step": 28272, "epoch": 233} {"train_loss": -24.07379150390625, "global_step": 28273, "epoch": 233} {"train_loss": -23.72271156311035, "global_step": 28274, "epoch": 233} {"train_loss": -26.501270294189453, "global_step": 28275, "epoch": 233} {"train_loss": -27.219125747680664, "global_step": 28276, "epoch": 233} {"train_loss": -26.66851234436035, "global_step": 28277, "epoch": 233} {"train_loss": -26.210102081298828, "global_step": 28278, "epoch": 233} {"train_loss": -27.260705947875977, "global_step": 28279, "epoch": 233} {"train_loss": -27.56428337097168, "global_step": 28280, "epoch": 233} {"train_loss": -28.00861167907715, "global_step": 28281, "epoch": 233} {"train_loss": -26.600255966186523, "global_step": 28282, "epoch": 233} {"train_loss": -27.34138298034668, "global_step": 28283, "epoch": 233} {"train_loss": -26.7109432220459, "global_step": 28284, "epoch": 233} {"train_loss": -27.80030632019043, "global_step": 28285, "epoch": 233} {"train_loss": -26.363935470581055, "global_step": 28286, "epoch": 233} {"train_loss": -26.001148223876953, "global_step": 28287, "epoch": 233} {"train_loss": -27.961584091186523, "global_step": 28288, "epoch": 233} {"train_loss": -27.094457626342773, "global_step": 28289, "epoch": 233} {"train_loss": -27.52583885192871, "global_step": 28290, "epoch": 233} {"train_loss": -28.748682022094727, "global_step": 28291, "epoch": 233} {"train_loss": -27.979766845703125, "global_step": 28292, "epoch": 233} {"train_loss": -28.175262451171875, "global_step": 28293, "epoch": 233} {"train_loss": -27.642807006835938, "global_step": 28294, "epoch": 233} {"train_loss": -28.571115493774414, "global_step": 28295, "epoch": 233} {"train_loss": -28.371606826782227, "global_step": 28296, "epoch": 233} {"train_loss": -28.067548751831055, "global_step": 28297, "epoch": 233} {"train_loss": -27.130142211914062, "global_step": 28298, "epoch": 233} {"train_loss": -27.91493034362793, "global_step": 28299, "epoch": 233} {"train_loss": -28.4486141204834, "global_step": 28300, "epoch": 233} {"train_loss": -28.968143463134766, "global_step": 28301, "epoch": 233} {"train_loss": -29.446523666381836, "global_step": 28302, "epoch": 233} {"train_loss": -29.371450424194336, "global_step": 28303, "epoch": 233} {"train_loss": -29.162023544311523, "global_step": 28304, "epoch": 233} {"train_loss": -29.450876235961914, "global_step": 28305, "epoch": 233} {"train_loss": -29.533899307250977, "global_step": 28306, "epoch": 233} {"train_loss": -29.513708114624023, "global_step": 28307, "epoch": 233} {"train_loss": -27.8415584564209, "global_step": 28308, "epoch": 233} {"train_loss": -28.63591957092285, "global_step": 28309, "epoch": 233} {"train_loss": -28.537952423095703, "global_step": 28310, "epoch": 233} {"train_loss": -29.6910343170166, "global_step": 28311, "epoch": 233} {"train_loss": -29.125049591064453, "global_step": 28312, "epoch": 233} {"train_loss": -28.177369771910108, "global_step": 28313, "epoch": 233, "val_loss": 2572873.75} {"train_loss": -28.35638427734375, "global_step": 28314, "epoch": 234} {"train_loss": -26.610855102539062, "global_step": 28315, "epoch": 234} {"train_loss": -26.863622665405273, "global_step": 28316, "epoch": 234} {"train_loss": -23.694597244262695, "global_step": 28317, "epoch": 234} {"train_loss": -20.21433448791504, "global_step": 28318, "epoch": 234} {"train_loss": -26.99079704284668, "global_step": 28319, "epoch": 234} {"train_loss": -23.291824340820312, "global_step": 28320, "epoch": 234} {"train_loss": -19.728546142578125, "global_step": 28321, "epoch": 234} {"train_loss": -19.681787490844727, "global_step": 28322, "epoch": 234} {"train_loss": -24.23114776611328, "global_step": 28323, "epoch": 234} {"train_loss": -23.50442123413086, "global_step": 28324, "epoch": 234} {"train_loss": -22.701162338256836, "global_step": 28325, "epoch": 234} {"train_loss": -27.194564819335938, "global_step": 28326, "epoch": 234} {"train_loss": -25.354780197143555, "global_step": 28327, "epoch": 234} {"train_loss": -26.413562774658203, "global_step": 28328, "epoch": 234} {"train_loss": -26.170495986938477, "global_step": 28329, "epoch": 234} {"train_loss": -26.61440086364746, "global_step": 28330, "epoch": 234} {"train_loss": -26.787023544311523, "global_step": 28331, "epoch": 234} {"train_loss": -27.32770347595215, "global_step": 28332, "epoch": 234} {"train_loss": -27.037689208984375, "global_step": 28333, "epoch": 234} {"train_loss": -27.859670639038086, "global_step": 28334, "epoch": 234} {"train_loss": -27.088693618774414, "global_step": 28335, "epoch": 234} {"train_loss": -27.068464279174805, "global_step": 28336, "epoch": 234} {"train_loss": -27.173358917236328, "global_step": 28337, "epoch": 234} {"train_loss": -27.648962020874023, "global_step": 28338, "epoch": 234} {"train_loss": -27.996885299682617, "global_step": 28339, "epoch": 234} {"train_loss": -28.008041381835938, "global_step": 28340, "epoch": 234} {"train_loss": -27.51593017578125, "global_step": 28341, "epoch": 234} {"train_loss": -27.292617797851562, "global_step": 28342, "epoch": 234} {"train_loss": -27.573001861572266, "global_step": 28343, "epoch": 234} {"train_loss": -27.657745361328125, "global_step": 28344, "epoch": 234} {"train_loss": -28.03738784790039, "global_step": 28345, "epoch": 234} {"train_loss": -27.61667823791504, "global_step": 28346, "epoch": 234} {"train_loss": -28.590742111206055, "global_step": 28347, "epoch": 234} {"train_loss": -27.940473556518555, "global_step": 28348, "epoch": 234} {"train_loss": -28.4212646484375, "global_step": 28349, "epoch": 234} {"train_loss": -28.251300811767578, "global_step": 28350, "epoch": 234} {"train_loss": -28.716466903686523, "global_step": 28351, "epoch": 234} {"train_loss": -28.725976943969727, "global_step": 28352, "epoch": 234} {"train_loss": -28.488229751586914, "global_step": 28353, "epoch": 234} {"train_loss": -29.243005752563477, "global_step": 28354, "epoch": 234} {"train_loss": -28.415796279907227, "global_step": 28355, "epoch": 234} {"train_loss": -29.083215713500977, "global_step": 28356, "epoch": 234} {"train_loss": -29.23078727722168, "global_step": 28357, "epoch": 234} {"train_loss": -28.552270889282227, "global_step": 28358, "epoch": 234} {"train_loss": -28.802045822143555, "global_step": 28359, "epoch": 234} {"train_loss": -29.41248893737793, "global_step": 28360, "epoch": 234} {"train_loss": -29.6595401763916, "global_step": 28361, "epoch": 234} {"train_loss": -29.6605167388916, "global_step": 28362, "epoch": 234} {"train_loss": -29.76017189025879, "global_step": 28363, "epoch": 234} {"train_loss": -29.95953369140625, "global_step": 28364, "epoch": 234} {"train_loss": -29.613697052001953, "global_step": 28365, "epoch": 234} {"train_loss": -29.74261474609375, "global_step": 28366, "epoch": 234} {"train_loss": -30.17547035217285, "global_step": 28367, "epoch": 234} {"train_loss": -30.15815544128418, "global_step": 28368, "epoch": 234} {"train_loss": -30.23456382751465, "global_step": 28369, "epoch": 234} {"train_loss": -30.75294303894043, "global_step": 28370, "epoch": 234} {"train_loss": -30.339818954467773, "global_step": 28371, "epoch": 234} {"train_loss": -29.385400772094727, "global_step": 28372, "epoch": 234} {"train_loss": -28.444055557250977, "global_step": 28373, "epoch": 234} {"train_loss": -26.74905776977539, "global_step": 28374, "epoch": 234} {"train_loss": -27.490936279296875, "global_step": 28375, "epoch": 234} {"train_loss": -30.00569725036621, "global_step": 28376, "epoch": 234} {"train_loss": -28.477392196655273, "global_step": 28377, "epoch": 234} {"train_loss": -29.24212074279785, "global_step": 28378, "epoch": 234} {"train_loss": -24.421207427978516, "global_step": 28379, "epoch": 234} {"train_loss": -23.78656005859375, "global_step": 28380, "epoch": 234} {"train_loss": -29.292463302612305, "global_step": 28381, "epoch": 234} {"train_loss": -27.050491333007812, "global_step": 28382, "epoch": 234} {"train_loss": -29.91216468811035, "global_step": 28383, "epoch": 234} {"train_loss": -26.769372940063477, "global_step": 28384, "epoch": 234} {"train_loss": -29.588483810424805, "global_step": 28385, "epoch": 234} {"train_loss": -28.241363525390625, "global_step": 28386, "epoch": 234} {"train_loss": -29.1522274017334, "global_step": 28387, "epoch": 234} {"train_loss": -29.48079490661621, "global_step": 28388, "epoch": 234} {"train_loss": -28.932056427001953, "global_step": 28389, "epoch": 234} {"train_loss": -28.816333770751953, "global_step": 28390, "epoch": 234} {"train_loss": -28.876800537109375, "global_step": 28391, "epoch": 234} {"train_loss": -28.73583984375, "global_step": 28392, "epoch": 234} {"train_loss": -29.567581176757812, "global_step": 28393, "epoch": 234} {"train_loss": -28.209125518798828, "global_step": 28394, "epoch": 234} {"train_loss": -29.418243408203125, "global_step": 28395, "epoch": 234} {"train_loss": -28.49668312072754, "global_step": 28396, "epoch": 234} {"train_loss": -29.306921005249023, "global_step": 28397, "epoch": 234} {"train_loss": -30.142602920532227, "global_step": 28398, "epoch": 234} {"train_loss": -29.144926071166992, "global_step": 28399, "epoch": 234} {"train_loss": -29.98164176940918, "global_step": 28400, "epoch": 234} {"train_loss": -29.5188045501709, "global_step": 28401, "epoch": 234} {"train_loss": -29.604568481445312, "global_step": 28402, "epoch": 234} {"train_loss": -27.76551628112793, "global_step": 28403, "epoch": 234} {"train_loss": -20.103046417236328, "global_step": 28404, "epoch": 234} {"train_loss": 3.529850482940674, "global_step": 28405, "epoch": 234} {"train_loss": -22.069883346557617, "global_step": 28406, "epoch": 234} {"train_loss": -12.582087516784668, "global_step": 28407, "epoch": 234} {"train_loss": -29.604883193969727, "global_step": 28408, "epoch": 234} {"train_loss": -21.882123947143555, "global_step": 28409, "epoch": 234} {"train_loss": -21.93558692932129, "global_step": 28410, "epoch": 234} {"train_loss": -28.645727157592773, "global_step": 28411, "epoch": 234} {"train_loss": -28.658090591430664, "global_step": 28412, "epoch": 234} {"train_loss": -27.625646591186523, "global_step": 28413, "epoch": 234} {"train_loss": -27.1533260345459, "global_step": 28414, "epoch": 234} {"train_loss": -25.7728271484375, "global_step": 28415, "epoch": 234} {"train_loss": -27.7165470123291, "global_step": 28416, "epoch": 234} {"train_loss": -29.126001358032227, "global_step": 28417, "epoch": 234} {"train_loss": -29.626178741455078, "global_step": 28418, "epoch": 234} {"train_loss": -29.37624168395996, "global_step": 28419, "epoch": 234} {"train_loss": -29.018503189086914, "global_step": 28420, "epoch": 234} {"train_loss": -28.881378173828125, "global_step": 28421, "epoch": 234} {"train_loss": -29.1981201171875, "global_step": 28422, "epoch": 234} {"train_loss": -28.74360466003418, "global_step": 28423, "epoch": 234} {"train_loss": -28.49146842956543, "global_step": 28424, "epoch": 234} {"train_loss": -29.57708168029785, "global_step": 28425, "epoch": 234} {"train_loss": -29.740148544311523, "global_step": 28426, "epoch": 234} {"train_loss": -29.403656005859375, "global_step": 28427, "epoch": 234} {"train_loss": -29.870004653930664, "global_step": 28428, "epoch": 234} {"train_loss": -29.904687881469727, "global_step": 28429, "epoch": 234} {"train_loss": -29.9381046295166, "global_step": 28430, "epoch": 234} {"train_loss": -29.71126365661621, "global_step": 28431, "epoch": 234} {"train_loss": -29.711517333984375, "global_step": 28432, "epoch": 234} {"train_loss": -30.15988540649414, "global_step": 28433, "epoch": 234} {"train_loss": -27.472181749737953, "global_step": 28434, "epoch": 234, "val_loss": 2614279.25} {"train_loss": -30.385009765625, "global_step": 28435, "epoch": 235} {"train_loss": -30.3236083984375, "global_step": 28436, "epoch": 235} {"train_loss": -30.08296012878418, "global_step": 28437, "epoch": 235} {"train_loss": -30.618927001953125, "global_step": 28438, "epoch": 235} {"train_loss": -30.55632972717285, "global_step": 28439, "epoch": 235} {"train_loss": -30.130273818969727, "global_step": 28440, "epoch": 235} {"train_loss": -30.088788986206055, "global_step": 28441, "epoch": 235} {"train_loss": -29.84869956970215, "global_step": 28442, "epoch": 235} {"train_loss": -30.21990966796875, "global_step": 28443, "epoch": 235} {"train_loss": -29.743139266967773, "global_step": 28444, "epoch": 235} {"train_loss": -28.66562843322754, "global_step": 28445, "epoch": 235} {"train_loss": -28.000396728515625, "global_step": 28446, "epoch": 235} {"train_loss": -26.741626739501953, "global_step": 28447, "epoch": 235} {"train_loss": -29.352115631103516, "global_step": 28448, "epoch": 235} {"train_loss": -29.392465591430664, "global_step": 28449, "epoch": 235} {"train_loss": -26.699600219726562, "global_step": 28450, "epoch": 235} {"train_loss": -27.89885902404785, "global_step": 28451, "epoch": 235} {"train_loss": -29.739185333251953, "global_step": 28452, "epoch": 235} {"train_loss": -28.737049102783203, "global_step": 28453, "epoch": 235} {"train_loss": -28.7032527923584, "global_step": 28454, "epoch": 235} {"train_loss": -28.9556884765625, "global_step": 28455, "epoch": 235} {"train_loss": -29.543432235717773, "global_step": 28456, "epoch": 235} {"train_loss": -29.2746524810791, "global_step": 28457, "epoch": 235} {"train_loss": -29.72780418395996, "global_step": 28458, "epoch": 235} {"train_loss": -29.738767623901367, "global_step": 28459, "epoch": 235} {"train_loss": -29.669025421142578, "global_step": 28460, "epoch": 235} {"train_loss": -29.601333618164062, "global_step": 28461, "epoch": 235} {"train_loss": -29.906280517578125, "global_step": 28462, "epoch": 235} {"train_loss": -29.760822296142578, "global_step": 28463, "epoch": 235} {"train_loss": -29.33634376525879, "global_step": 28464, "epoch": 235} {"train_loss": -30.08967399597168, "global_step": 28465, "epoch": 235} {"train_loss": -29.660924911499023, "global_step": 28466, "epoch": 235} {"train_loss": -30.214069366455078, "global_step": 28467, "epoch": 235} {"train_loss": -30.0183162689209, "global_step": 28468, "epoch": 235} {"train_loss": -29.899587631225586, "global_step": 28469, "epoch": 235} {"train_loss": -30.203664779663086, "global_step": 28470, "epoch": 235} {"train_loss": -30.154098510742188, "global_step": 28471, "epoch": 235} {"train_loss": -29.593420028686523, "global_step": 28472, "epoch": 235} {"train_loss": -30.124221801757812, "global_step": 28473, "epoch": 235} {"train_loss": -30.278162002563477, "global_step": 28474, "epoch": 235} {"train_loss": -29.94489860534668, "global_step": 28475, "epoch": 235} {"train_loss": -29.997440338134766, "global_step": 28476, "epoch": 235} {"train_loss": -30.2457332611084, "global_step": 28477, "epoch": 235} {"train_loss": -30.5523681640625, "global_step": 28478, "epoch": 235} {"train_loss": -30.299945831298828, "global_step": 28479, "epoch": 235} {"train_loss": -30.156787872314453, "global_step": 28480, "epoch": 235} {"train_loss": -29.37298011779785, "global_step": 28481, "epoch": 235} {"train_loss": -23.7045841217041, "global_step": 28482, "epoch": 235} {"train_loss": -7.934164524078369, "global_step": 28483, "epoch": 235} {"train_loss": -14.448160171508789, "global_step": 28484, "epoch": 235} {"train_loss": -27.615436553955078, "global_step": 28485, "epoch": 235} {"train_loss": -23.505247116088867, "global_step": 28486, "epoch": 235} {"train_loss": -24.878217697143555, "global_step": 28487, "epoch": 235} {"train_loss": -29.953271865844727, "global_step": 28488, "epoch": 235} {"train_loss": -25.987323760986328, "global_step": 28489, "epoch": 235} {"train_loss": -26.439929962158203, "global_step": 28490, "epoch": 235} {"train_loss": -29.581823348999023, "global_step": 28491, "epoch": 235} {"train_loss": -30.04560661315918, "global_step": 28492, "epoch": 235} {"train_loss": -28.945621490478516, "global_step": 28493, "epoch": 235} {"train_loss": -28.245635986328125, "global_step": 28494, "epoch": 235} {"train_loss": -28.899953842163086, "global_step": 28495, "epoch": 235} {"train_loss": -29.3804874420166, "global_step": 28496, "epoch": 235} {"train_loss": -30.07191276550293, "global_step": 28497, "epoch": 235} {"train_loss": -29.832876205444336, "global_step": 28498, "epoch": 235} {"train_loss": -29.674182891845703, "global_step": 28499, "epoch": 235} {"train_loss": -29.682397842407227, "global_step": 28500, "epoch": 235} {"train_loss": -29.406400680541992, "global_step": 28501, "epoch": 235} {"train_loss": -29.195053100585938, "global_step": 28502, "epoch": 235} {"train_loss": -30.032241821289062, "global_step": 28503, "epoch": 235} {"train_loss": -30.11048698425293, "global_step": 28504, "epoch": 235} {"train_loss": -30.035871505737305, "global_step": 28505, "epoch": 235} {"train_loss": -29.999494552612305, "global_step": 28506, "epoch": 235} {"train_loss": -29.980152130126953, "global_step": 28507, "epoch": 235} {"train_loss": -30.16187858581543, "global_step": 28508, "epoch": 235} {"train_loss": -29.462665557861328, "global_step": 28509, "epoch": 235} {"train_loss": -29.27739906311035, "global_step": 28510, "epoch": 235} {"train_loss": -29.76673698425293, "global_step": 28511, "epoch": 235} {"train_loss": -29.86640739440918, "global_step": 28512, "epoch": 235} {"train_loss": -29.790719985961914, "global_step": 28513, "epoch": 235} {"train_loss": -30.035367965698242, "global_step": 28514, "epoch": 235} {"train_loss": -30.195026397705078, "global_step": 28515, "epoch": 235} {"train_loss": -29.469482421875, "global_step": 28516, "epoch": 235} {"train_loss": -30.811216354370117, "global_step": 28517, "epoch": 235} {"train_loss": -29.8800048828125, "global_step": 28518, "epoch": 235} {"train_loss": -29.380796432495117, "global_step": 28519, "epoch": 235} {"train_loss": -29.753515243530273, "global_step": 28520, "epoch": 235} {"train_loss": -30.151081085205078, "global_step": 28521, "epoch": 235} {"train_loss": -29.465728759765625, "global_step": 28522, "epoch": 235} {"train_loss": -29.08194923400879, "global_step": 28523, "epoch": 235} {"train_loss": -24.6113338470459, "global_step": 28524, "epoch": 235} {"train_loss": -10.62973403930664, "global_step": 28525, "epoch": 235} {"train_loss": -7.470045566558838, "global_step": 28526, "epoch": 235} {"train_loss": -29.32160758972168, "global_step": 28527, "epoch": 235} {"train_loss": -18.530134201049805, "global_step": 28528, "epoch": 235} {"train_loss": -29.292282104492188, "global_step": 28529, "epoch": 235} {"train_loss": -25.6392822265625, "global_step": 28530, "epoch": 235} {"train_loss": -25.03325843811035, "global_step": 28531, "epoch": 235} {"train_loss": -29.426502227783203, "global_step": 28532, "epoch": 235} {"train_loss": -29.651762008666992, "global_step": 28533, "epoch": 235} {"train_loss": -27.168258666992188, "global_step": 28534, "epoch": 235} {"train_loss": -26.991439819335938, "global_step": 28535, "epoch": 235} {"train_loss": -28.66924476623535, "global_step": 28536, "epoch": 235} {"train_loss": -29.050064086914062, "global_step": 28537, "epoch": 235} {"train_loss": -29.289045333862305, "global_step": 28538, "epoch": 235} {"train_loss": -27.428991317749023, "global_step": 28539, "epoch": 235} {"train_loss": -28.414234161376953, "global_step": 28540, "epoch": 235} {"train_loss": -27.76133155822754, "global_step": 28541, "epoch": 235} {"train_loss": -28.7440128326416, "global_step": 28542, "epoch": 235} {"train_loss": -28.784000396728516, "global_step": 28543, "epoch": 235} {"train_loss": -29.274301528930664, "global_step": 28544, "epoch": 235} {"train_loss": -28.988727569580078, "global_step": 28545, "epoch": 235} {"train_loss": -28.4305362701416, "global_step": 28546, "epoch": 235} {"train_loss": -27.81611442565918, "global_step": 28547, "epoch": 235} {"train_loss": -27.783935546875, "global_step": 28548, "epoch": 235} {"train_loss": -27.65606117248535, "global_step": 28549, "epoch": 235} {"train_loss": -28.506750106811523, "global_step": 28550, "epoch": 235} {"train_loss": -27.862695693969727, "global_step": 28551, "epoch": 235} {"train_loss": -29.283435821533203, "global_step": 28552, "epoch": 235} {"train_loss": -28.477954864501953, "global_step": 28553, "epoch": 235} {"train_loss": -28.905603408813477, "global_step": 28554, "epoch": 235} {"train_loss": -28.35120282291381, "global_step": 28555, "epoch": 235, "val_loss": 2471367.25} {"train_loss": -28.920719146728516, "global_step": 28556, "epoch": 236} {"train_loss": -29.388036727905273, "global_step": 28557, "epoch": 236} {"train_loss": -28.872968673706055, "global_step": 28558, "epoch": 236} {"train_loss": -29.643329620361328, "global_step": 28559, "epoch": 236} {"train_loss": -29.68951988220215, "global_step": 28560, "epoch": 236} {"train_loss": -29.3917293548584, "global_step": 28561, "epoch": 236} {"train_loss": -29.09210777282715, "global_step": 28562, "epoch": 236} {"train_loss": -29.27066993713379, "global_step": 28563, "epoch": 236} {"train_loss": -29.607160568237305, "global_step": 28564, "epoch": 236} {"train_loss": -29.415878295898438, "global_step": 28565, "epoch": 236} {"train_loss": -29.681354522705078, "global_step": 28566, "epoch": 236} {"train_loss": -29.370824813842773, "global_step": 28567, "epoch": 236} {"train_loss": -30.07394790649414, "global_step": 28568, "epoch": 236} {"train_loss": -29.61475944519043, "global_step": 28569, "epoch": 236} {"train_loss": -29.425491333007812, "global_step": 28570, "epoch": 236} {"train_loss": -29.427221298217773, "global_step": 28571, "epoch": 236} {"train_loss": -29.75531005859375, "global_step": 28572, "epoch": 236} {"train_loss": -29.652402877807617, "global_step": 28573, "epoch": 236} {"train_loss": -29.730854034423828, "global_step": 28574, "epoch": 236} {"train_loss": -30.041015625, "global_step": 28575, "epoch": 236} {"train_loss": -29.643157958984375, "global_step": 28576, "epoch": 236} {"train_loss": -29.79343032836914, "global_step": 28577, "epoch": 236} {"train_loss": -29.93218994140625, "global_step": 28578, "epoch": 236} {"train_loss": -29.78230857849121, "global_step": 28579, "epoch": 236} {"train_loss": -29.23150062561035, "global_step": 28580, "epoch": 236} {"train_loss": -29.8862247467041, "global_step": 28581, "epoch": 236} {"train_loss": -30.15839958190918, "global_step": 28582, "epoch": 236} {"train_loss": -29.951541900634766, "global_step": 28583, "epoch": 236} {"train_loss": -29.364429473876953, "global_step": 28584, "epoch": 236} {"train_loss": -28.925546646118164, "global_step": 28585, "epoch": 236} {"train_loss": -29.3851375579834, "global_step": 28586, "epoch": 236} {"train_loss": -29.214365005493164, "global_step": 28587, "epoch": 236} {"train_loss": -26.860273361206055, "global_step": 28588, "epoch": 236} {"train_loss": -26.345788955688477, "global_step": 28589, "epoch": 236} {"train_loss": -28.113779067993164, "global_step": 28590, "epoch": 236} {"train_loss": -29.201236724853516, "global_step": 28591, "epoch": 236} {"train_loss": -28.643945693969727, "global_step": 28592, "epoch": 236} {"train_loss": -28.9250545501709, "global_step": 28593, "epoch": 236} {"train_loss": -29.093765258789062, "global_step": 28594, "epoch": 236} {"train_loss": -28.803791046142578, "global_step": 28595, "epoch": 236} {"train_loss": -28.027347564697266, "global_step": 28596, "epoch": 236} {"train_loss": -29.120365142822266, "global_step": 28597, "epoch": 236} {"train_loss": -28.328332901000977, "global_step": 28598, "epoch": 236} {"train_loss": -29.065292358398438, "global_step": 28599, "epoch": 236} {"train_loss": -29.14068603515625, "global_step": 28600, "epoch": 236} {"train_loss": -28.69268226623535, "global_step": 28601, "epoch": 236} {"train_loss": -29.190412521362305, "global_step": 28602, "epoch": 236} {"train_loss": -28.98687171936035, "global_step": 28603, "epoch": 236} {"train_loss": -29.078638076782227, "global_step": 28604, "epoch": 236} {"train_loss": -28.94515037536621, "global_step": 28605, "epoch": 236} {"train_loss": -29.48187255859375, "global_step": 28606, "epoch": 236} {"train_loss": -29.02296257019043, "global_step": 28607, "epoch": 236} {"train_loss": -29.12314796447754, "global_step": 28608, "epoch": 236} {"train_loss": -29.410795211791992, "global_step": 28609, "epoch": 236} {"train_loss": -29.143674850463867, "global_step": 28610, "epoch": 236} {"train_loss": -29.2560977935791, "global_step": 28611, "epoch": 236} {"train_loss": -29.388269424438477, "global_step": 28612, "epoch": 236} {"train_loss": -29.343460083007812, "global_step": 28613, "epoch": 236} {"train_loss": -29.203046798706055, "global_step": 28614, "epoch": 236} {"train_loss": -29.30158042907715, "global_step": 28615, "epoch": 236} {"train_loss": -28.80804443359375, "global_step": 28616, "epoch": 236} {"train_loss": -29.836950302124023, "global_step": 28617, "epoch": 236} {"train_loss": -29.63559913635254, "global_step": 28618, "epoch": 236} {"train_loss": -29.307153701782227, "global_step": 28619, "epoch": 236} {"train_loss": -29.6689395904541, "global_step": 28620, "epoch": 236} {"train_loss": -29.641813278198242, "global_step": 28621, "epoch": 236} {"train_loss": -29.2347412109375, "global_step": 28622, "epoch": 236} {"train_loss": -29.713964462280273, "global_step": 28623, "epoch": 236} {"train_loss": -30.714588165283203, "global_step": 28624, "epoch": 236} {"train_loss": -29.93912124633789, "global_step": 28625, "epoch": 236} {"train_loss": -29.78436851501465, "global_step": 28626, "epoch": 236} {"train_loss": -30.16943359375, "global_step": 28627, "epoch": 236} {"train_loss": -29.89460563659668, "global_step": 28628, "epoch": 236} {"train_loss": -30.37432289123535, "global_step": 28629, "epoch": 236} {"train_loss": -30.421157836914062, "global_step": 28630, "epoch": 236} {"train_loss": -30.631574630737305, "global_step": 28631, "epoch": 236} {"train_loss": -30.622039794921875, "global_step": 28632, "epoch": 236} {"train_loss": -30.3185977935791, "global_step": 28633, "epoch": 236} {"train_loss": -30.424291610717773, "global_step": 28634, "epoch": 236} {"train_loss": -30.434253692626953, "global_step": 28635, "epoch": 236} {"train_loss": -30.515539169311523, "global_step": 28636, "epoch": 236} {"train_loss": -30.382688522338867, "global_step": 28637, "epoch": 236} {"train_loss": -30.517881393432617, "global_step": 28638, "epoch": 236} {"train_loss": -30.904815673828125, "global_step": 28639, "epoch": 236} {"train_loss": -30.7757511138916, "global_step": 28640, "epoch": 236} {"train_loss": -30.869327545166016, "global_step": 28641, "epoch": 236} {"train_loss": -30.423892974853516, "global_step": 28642, "epoch": 236} {"train_loss": -30.83099937438965, "global_step": 28643, "epoch": 236} {"train_loss": -31.25383949279785, "global_step": 28644, "epoch": 236} {"train_loss": -30.9338321685791, "global_step": 28645, "epoch": 236} {"train_loss": -30.81439781188965, "global_step": 28646, "epoch": 236} {"train_loss": -31.210693359375, "global_step": 28647, "epoch": 236} {"train_loss": -31.122838973999023, "global_step": 28648, "epoch": 236} {"train_loss": -30.839862823486328, "global_step": 28649, "epoch": 236} {"train_loss": -30.8498592376709, "global_step": 28650, "epoch": 236} {"train_loss": -31.317493438720703, "global_step": 28651, "epoch": 236} {"train_loss": -30.840301513671875, "global_step": 28652, "epoch": 236} {"train_loss": -30.6756649017334, "global_step": 28653, "epoch": 236} {"train_loss": -29.76029396057129, "global_step": 28654, "epoch": 236} {"train_loss": -30.63994789123535, "global_step": 28655, "epoch": 236} {"train_loss": -29.70734214782715, "global_step": 28656, "epoch": 236} {"train_loss": -31.160001754760742, "global_step": 28657, "epoch": 236} {"train_loss": -30.375797271728516, "global_step": 28658, "epoch": 236} {"train_loss": -30.86874771118164, "global_step": 28659, "epoch": 236} {"train_loss": -30.260168075561523, "global_step": 28660, "epoch": 236} {"train_loss": -31.084516525268555, "global_step": 28661, "epoch": 236} {"train_loss": -30.51246452331543, "global_step": 28662, "epoch": 236} {"train_loss": -30.80120849609375, "global_step": 28663, "epoch": 236} {"train_loss": -30.4393367767334, "global_step": 28664, "epoch": 236} {"train_loss": -30.54021644592285, "global_step": 28665, "epoch": 236} {"train_loss": -30.952402114868164, "global_step": 28666, "epoch": 236} {"train_loss": -30.667844772338867, "global_step": 28667, "epoch": 236} {"train_loss": -30.945755004882812, "global_step": 28668, "epoch": 236} {"train_loss": -30.720111846923828, "global_step": 28669, "epoch": 236} {"train_loss": -30.758249282836914, "global_step": 28670, "epoch": 236} {"train_loss": -31.04823875427246, "global_step": 28671, "epoch": 236} {"train_loss": -30.50177001953125, "global_step": 28672, "epoch": 236} {"train_loss": -30.50266456604004, "global_step": 28673, "epoch": 236} {"train_loss": -31.024749755859375, "global_step": 28674, "epoch": 236} {"train_loss": -30.88776206970215, "global_step": 28675, "epoch": 236} {"train_loss": -29.854194325849043, "global_step": 28676, "epoch": 236, "val_loss": 2549062.5} {"train_loss": -30.469900131225586, "global_step": 28677, "epoch": 237} {"train_loss": -30.908472061157227, "global_step": 28678, "epoch": 237} {"train_loss": -31.282011032104492, "global_step": 28679, "epoch": 237} {"train_loss": -30.710168838500977, "global_step": 28680, "epoch": 237} {"train_loss": -30.909381866455078, "global_step": 28681, "epoch": 237} {"train_loss": -30.740976333618164, "global_step": 28682, "epoch": 237} {"train_loss": -30.836669921875, "global_step": 28683, "epoch": 237} {"train_loss": -31.065229415893555, "global_step": 28684, "epoch": 237} {"train_loss": -31.045194625854492, "global_step": 28685, "epoch": 237} {"train_loss": -31.2406005859375, "global_step": 28686, "epoch": 237} {"train_loss": -31.274887084960938, "global_step": 28687, "epoch": 237} {"train_loss": -31.293262481689453, "global_step": 28688, "epoch": 237} {"train_loss": -31.398014068603516, "global_step": 28689, "epoch": 237} {"train_loss": -31.53407096862793, "global_step": 28690, "epoch": 237} {"train_loss": -31.345417022705078, "global_step": 28691, "epoch": 237} {"train_loss": -31.05299186706543, "global_step": 28692, "epoch": 237} {"train_loss": -31.437707901000977, "global_step": 28693, "epoch": 237} {"train_loss": -31.39805030822754, "global_step": 28694, "epoch": 237} {"train_loss": -31.820697784423828, "global_step": 28695, "epoch": 237} {"train_loss": -31.4787654876709, "global_step": 28696, "epoch": 237} {"train_loss": -31.127294540405273, "global_step": 28697, "epoch": 237} {"train_loss": -31.970062255859375, "global_step": 28698, "epoch": 237} {"train_loss": -31.607715606689453, "global_step": 28699, "epoch": 237} {"train_loss": -32.162628173828125, "global_step": 28700, "epoch": 237} {"train_loss": -31.5379581451416, "global_step": 28701, "epoch": 237} {"train_loss": -31.506872177124023, "global_step": 28702, "epoch": 237} {"train_loss": -31.883703231811523, "global_step": 28703, "epoch": 237} {"train_loss": -31.404510498046875, "global_step": 28704, "epoch": 237} {"train_loss": -31.52727699279785, "global_step": 28705, "epoch": 237} {"train_loss": -31.722036361694336, "global_step": 28706, "epoch": 237} {"train_loss": -32.38938522338867, "global_step": 28707, "epoch": 237} {"train_loss": -31.6800594329834, "global_step": 28708, "epoch": 237} {"train_loss": -32.22119903564453, "global_step": 28709, "epoch": 237} {"train_loss": -31.93414306640625, "global_step": 28710, "epoch": 237} {"train_loss": -31.96803855895996, "global_step": 28711, "epoch": 237} {"train_loss": -31.721912384033203, "global_step": 28712, "epoch": 237} {"train_loss": -32.272666931152344, "global_step": 28713, "epoch": 237} {"train_loss": -31.736074447631836, "global_step": 28714, "epoch": 237} {"train_loss": -32.126625061035156, "global_step": 28715, "epoch": 237} {"train_loss": -31.5189266204834, "global_step": 28716, "epoch": 237} {"train_loss": -32.367061614990234, "global_step": 28717, "epoch": 237} {"train_loss": -31.4610595703125, "global_step": 28718, "epoch": 237} {"train_loss": -32.258785247802734, "global_step": 28719, "epoch": 237} {"train_loss": -31.783191680908203, "global_step": 28720, "epoch": 237} {"train_loss": -31.96487808227539, "global_step": 28721, "epoch": 237} {"train_loss": -31.627490997314453, "global_step": 28722, "epoch": 237} {"train_loss": -31.990453720092773, "global_step": 28723, "epoch": 237} {"train_loss": -31.095123291015625, "global_step": 28724, "epoch": 237} {"train_loss": -29.391061782836914, "global_step": 28725, "epoch": 237} {"train_loss": -28.52594566345215, "global_step": 28726, "epoch": 237} {"train_loss": -30.637622833251953, "global_step": 28727, "epoch": 237} {"train_loss": -27.698362350463867, "global_step": 28728, "epoch": 237} {"train_loss": -28.673404693603516, "global_step": 28729, "epoch": 237} {"train_loss": -28.356775283813477, "global_step": 28730, "epoch": 237} {"train_loss": -31.033782958984375, "global_step": 28731, "epoch": 237} {"train_loss": -27.839765548706055, "global_step": 28732, "epoch": 237} {"train_loss": -32.073787689208984, "global_step": 28733, "epoch": 237} {"train_loss": -31.28468132019043, "global_step": 28734, "epoch": 237} {"train_loss": -30.505935668945312, "global_step": 28735, "epoch": 237} {"train_loss": -30.43130874633789, "global_step": 28736, "epoch": 237} {"train_loss": -31.715911865234375, "global_step": 28737, "epoch": 237} {"train_loss": -31.841796875, "global_step": 28738, "epoch": 237} {"train_loss": -31.675525665283203, "global_step": 28739, "epoch": 237} {"train_loss": -30.538379669189453, "global_step": 28740, "epoch": 237} {"train_loss": -30.356643676757812, "global_step": 28741, "epoch": 237} {"train_loss": -31.685306549072266, "global_step": 28742, "epoch": 237} {"train_loss": -31.088184356689453, "global_step": 28743, "epoch": 237} {"train_loss": -31.708404541015625, "global_step": 28744, "epoch": 237} {"train_loss": -31.756519317626953, "global_step": 28745, "epoch": 237} {"train_loss": -31.9525146484375, "global_step": 28746, "epoch": 237} {"train_loss": -31.917774200439453, "global_step": 28747, "epoch": 237} {"train_loss": -32.075164794921875, "global_step": 28748, "epoch": 237} {"train_loss": -31.489734649658203, "global_step": 28749, "epoch": 237} {"train_loss": -31.6505069732666, "global_step": 28750, "epoch": 237} {"train_loss": -32.01429748535156, "global_step": 28751, "epoch": 237} {"train_loss": -31.746673583984375, "global_step": 28752, "epoch": 237} {"train_loss": -32.506813049316406, "global_step": 28753, "epoch": 237} {"train_loss": -31.234119415283203, "global_step": 28754, "epoch": 237} {"train_loss": -32.70546340942383, "global_step": 28755, "epoch": 237} {"train_loss": -32.170108795166016, "global_step": 28756, "epoch": 237} {"train_loss": -31.397947311401367, "global_step": 28757, "epoch": 237} {"train_loss": -32.13236618041992, "global_step": 28758, "epoch": 237} {"train_loss": -31.750341415405273, "global_step": 28759, "epoch": 237} {"train_loss": -32.04275131225586, "global_step": 28760, "epoch": 237} {"train_loss": -31.624399185180664, "global_step": 28761, "epoch": 237} {"train_loss": -31.52887535095215, "global_step": 28762, "epoch": 237} {"train_loss": -31.12812614440918, "global_step": 28763, "epoch": 237} {"train_loss": -31.786237716674805, "global_step": 28764, "epoch": 237} {"train_loss": -32.21474838256836, "global_step": 28765, "epoch": 237} {"train_loss": -32.0442008972168, "global_step": 28766, "epoch": 237} {"train_loss": -31.366653442382812, "global_step": 28767, "epoch": 237} {"train_loss": -30.28700828552246, "global_step": 28768, "epoch": 237} {"train_loss": -30.44706153869629, "global_step": 28769, "epoch": 237} {"train_loss": -31.2844295501709, "global_step": 28770, "epoch": 237} {"train_loss": -31.17343521118164, "global_step": 28771, "epoch": 237} {"train_loss": -30.756437301635742, "global_step": 28772, "epoch": 237} {"train_loss": -30.9932918548584, "global_step": 28773, "epoch": 237} {"train_loss": -29.863784790039062, "global_step": 28774, "epoch": 237} {"train_loss": -30.354856491088867, "global_step": 28775, "epoch": 237} {"train_loss": -29.632831573486328, "global_step": 28776, "epoch": 237} {"train_loss": -29.24338722229004, "global_step": 28777, "epoch": 237} {"train_loss": -28.10706901550293, "global_step": 28778, "epoch": 237} {"train_loss": -28.857135772705078, "global_step": 28779, "epoch": 237} {"train_loss": -27.75205421447754, "global_step": 28780, "epoch": 237} {"train_loss": -25.98383903503418, "global_step": 28781, "epoch": 237} {"train_loss": -28.492956161499023, "global_step": 28782, "epoch": 237} {"train_loss": -31.025434494018555, "global_step": 28783, "epoch": 237} {"train_loss": -30.13129234313965, "global_step": 28784, "epoch": 237} {"train_loss": -30.480350494384766, "global_step": 28785, "epoch": 237} {"train_loss": -30.6483154296875, "global_step": 28786, "epoch": 237} {"train_loss": -30.755126953125, "global_step": 28787, "epoch": 237} {"train_loss": -30.935888290405273, "global_step": 28788, "epoch": 237} {"train_loss": -30.912092208862305, "global_step": 28789, "epoch": 237} {"train_loss": -30.776020050048828, "global_step": 28790, "epoch": 237} {"train_loss": -31.34771156311035, "global_step": 28791, "epoch": 237} {"train_loss": -31.4948673248291, "global_step": 28792, "epoch": 237} {"train_loss": -31.28809928894043, "global_step": 28793, "epoch": 237} {"train_loss": -31.186365127563477, "global_step": 28794, "epoch": 237} {"train_loss": -30.962783813476562, "global_step": 28795, "epoch": 237} {"train_loss": -31.39739990234375, "global_step": 28796, "epoch": 237} {"train_loss": -31.08158852443222, "global_step": 28797, "epoch": 237, "val_loss": 2695921.25} {"train_loss": -31.00699234008789, "global_step": 28798, "epoch": 238} {"train_loss": -31.70631217956543, "global_step": 28799, "epoch": 238} {"train_loss": -30.8370418548584, "global_step": 28800, "epoch": 238} {"train_loss": -31.417428970336914, "global_step": 28801, "epoch": 238} {"train_loss": -31.335721969604492, "global_step": 28802, "epoch": 238} {"train_loss": -31.03651237487793, "global_step": 28803, "epoch": 238} {"train_loss": -31.51129722595215, "global_step": 28804, "epoch": 238} {"train_loss": -31.092182159423828, "global_step": 28805, "epoch": 238} {"train_loss": -31.599475860595703, "global_step": 28806, "epoch": 238} {"train_loss": -31.49761390686035, "global_step": 28807, "epoch": 238} {"train_loss": -31.695005416870117, "global_step": 28808, "epoch": 238} {"train_loss": -31.322021484375, "global_step": 28809, "epoch": 238} {"train_loss": -31.398523330688477, "global_step": 28810, "epoch": 238} {"train_loss": -31.267332077026367, "global_step": 28811, "epoch": 238} {"train_loss": -31.428668975830078, "global_step": 28812, "epoch": 238} {"train_loss": -31.7919864654541, "global_step": 28813, "epoch": 238} {"train_loss": -31.818500518798828, "global_step": 28814, "epoch": 238} {"train_loss": -32.03840255737305, "global_step": 28815, "epoch": 238} {"train_loss": -31.768875122070312, "global_step": 28816, "epoch": 238} {"train_loss": -31.897384643554688, "global_step": 28817, "epoch": 238} {"train_loss": -31.7545166015625, "global_step": 28818, "epoch": 238} {"train_loss": -31.85663414001465, "global_step": 28819, "epoch": 238} {"train_loss": -31.797311782836914, "global_step": 28820, "epoch": 238} {"train_loss": -32.1937370300293, "global_step": 28821, "epoch": 238} {"train_loss": -32.10774230957031, "global_step": 28822, "epoch": 238} {"train_loss": -32.43429183959961, "global_step": 28823, "epoch": 238} {"train_loss": -31.835224151611328, "global_step": 28824, "epoch": 238} {"train_loss": -31.673078536987305, "global_step": 28825, "epoch": 238} {"train_loss": -32.01172637939453, "global_step": 28826, "epoch": 238} {"train_loss": -32.084228515625, "global_step": 28827, "epoch": 238} {"train_loss": -30.920995712280273, "global_step": 28828, "epoch": 238} {"train_loss": -29.6153621673584, "global_step": 28829, "epoch": 238} {"train_loss": -23.884153366088867, "global_step": 28830, "epoch": 238} {"train_loss": -26.145334243774414, "global_step": 28831, "epoch": 238} {"train_loss": -31.641794204711914, "global_step": 28832, "epoch": 238} {"train_loss": -29.133869171142578, "global_step": 28833, "epoch": 238} {"train_loss": -25.274898529052734, "global_step": 28834, "epoch": 238} {"train_loss": -30.333288192749023, "global_step": 28835, "epoch": 238} {"train_loss": -28.048192977905273, "global_step": 28836, "epoch": 238} {"train_loss": -30.886322021484375, "global_step": 28837, "epoch": 238} {"train_loss": -29.81784439086914, "global_step": 28838, "epoch": 238} {"train_loss": -31.394001007080078, "global_step": 28839, "epoch": 238} {"train_loss": -29.228546142578125, "global_step": 28840, "epoch": 238} {"train_loss": -31.328357696533203, "global_step": 28841, "epoch": 238} {"train_loss": -30.521839141845703, "global_step": 28842, "epoch": 238} {"train_loss": -30.826833724975586, "global_step": 28843, "epoch": 238} {"train_loss": -31.14432144165039, "global_step": 28844, "epoch": 238} {"train_loss": -30.956863403320312, "global_step": 28845, "epoch": 238} {"train_loss": -30.431318283081055, "global_step": 28846, "epoch": 238} {"train_loss": -31.371923446655273, "global_step": 28847, "epoch": 238} {"train_loss": -31.203210830688477, "global_step": 28848, "epoch": 238} {"train_loss": -31.15130043029785, "global_step": 28849, "epoch": 238} {"train_loss": -30.950407028198242, "global_step": 28850, "epoch": 238} {"train_loss": -31.31497573852539, "global_step": 28851, "epoch": 238} {"train_loss": -31.6533145904541, "global_step": 28852, "epoch": 238} {"train_loss": -31.770954132080078, "global_step": 28853, "epoch": 238} {"train_loss": -31.66510581970215, "global_step": 28854, "epoch": 238} {"train_loss": -31.470651626586914, "global_step": 28855, "epoch": 238} {"train_loss": -31.553253173828125, "global_step": 28856, "epoch": 238} {"train_loss": -31.693647384643555, "global_step": 28857, "epoch": 238} {"train_loss": -31.462615966796875, "global_step": 28858, "epoch": 238} {"train_loss": -31.53828239440918, "global_step": 28859, "epoch": 238} {"train_loss": -31.394811630249023, "global_step": 28860, "epoch": 238} {"train_loss": -31.57683753967285, "global_step": 28861, "epoch": 238} {"train_loss": -30.860116958618164, "global_step": 28862, "epoch": 238} {"train_loss": -31.507801055908203, "global_step": 28863, "epoch": 238} {"train_loss": -31.246301651000977, "global_step": 28864, "epoch": 238} {"train_loss": -31.913742065429688, "global_step": 28865, "epoch": 238} {"train_loss": -31.155517578125, "global_step": 28866, "epoch": 238} {"train_loss": -30.849653244018555, "global_step": 28867, "epoch": 238} {"train_loss": -29.612043380737305, "global_step": 28868, "epoch": 238} {"train_loss": -28.23963737487793, "global_step": 28869, "epoch": 238} {"train_loss": -27.494916915893555, "global_step": 28870, "epoch": 238} {"train_loss": -24.63517951965332, "global_step": 28871, "epoch": 238} {"train_loss": -26.65755271911621, "global_step": 28872, "epoch": 238} {"train_loss": -30.880414962768555, "global_step": 28873, "epoch": 238} {"train_loss": -29.585004806518555, "global_step": 28874, "epoch": 238} {"train_loss": -30.492660522460938, "global_step": 28875, "epoch": 238} {"train_loss": -29.8590145111084, "global_step": 28876, "epoch": 238} {"train_loss": -31.30986976623535, "global_step": 28877, "epoch": 238} {"train_loss": -30.664798736572266, "global_step": 28878, "epoch": 238} {"train_loss": -29.502721786499023, "global_step": 28879, "epoch": 238} {"train_loss": -30.69343376159668, "global_step": 28880, "epoch": 238} {"train_loss": -31.4316349029541, "global_step": 28881, "epoch": 238} {"train_loss": -30.791553497314453, "global_step": 28882, "epoch": 238} {"train_loss": -30.085290908813477, "global_step": 28883, "epoch": 238} {"train_loss": -31.076629638671875, "global_step": 28884, "epoch": 238} {"train_loss": -29.859466552734375, "global_step": 28885, "epoch": 238} {"train_loss": -30.846113204956055, "global_step": 28886, "epoch": 238} {"train_loss": -30.82931900024414, "global_step": 28887, "epoch": 238} {"train_loss": -30.723590850830078, "global_step": 28888, "epoch": 238} {"train_loss": -31.02042579650879, "global_step": 28889, "epoch": 238} {"train_loss": -30.676855087280273, "global_step": 28890, "epoch": 238} {"train_loss": -31.867313385009766, "global_step": 28891, "epoch": 238} {"train_loss": -30.967496871948242, "global_step": 28892, "epoch": 238} {"train_loss": -31.56085205078125, "global_step": 28893, "epoch": 238} {"train_loss": -31.1312313079834, "global_step": 28894, "epoch": 238} {"train_loss": -31.461288452148438, "global_step": 28895, "epoch": 238} {"train_loss": -31.29343605041504, "global_step": 28896, "epoch": 238} {"train_loss": -31.836517333984375, "global_step": 28897, "epoch": 238} {"train_loss": -31.152170181274414, "global_step": 28898, "epoch": 238} {"train_loss": -31.660703659057617, "global_step": 28899, "epoch": 238} {"train_loss": -31.36515235900879, "global_step": 28900, "epoch": 238} {"train_loss": -31.507587432861328, "global_step": 28901, "epoch": 238} {"train_loss": -31.43474769592285, "global_step": 28902, "epoch": 238} {"train_loss": -31.686649322509766, "global_step": 28903, "epoch": 238} {"train_loss": -31.5433292388916, "global_step": 28904, "epoch": 238} {"train_loss": -31.449182510375977, "global_step": 28905, "epoch": 238} {"train_loss": -31.560428619384766, "global_step": 28906, "epoch": 238} {"train_loss": -32.234920501708984, "global_step": 28907, "epoch": 238} {"train_loss": -31.398956298828125, "global_step": 28908, "epoch": 238} {"train_loss": -31.847314834594727, "global_step": 28909, "epoch": 238} {"train_loss": -31.507190704345703, "global_step": 28910, "epoch": 238} {"train_loss": -31.904993057250977, "global_step": 28911, "epoch": 238} {"train_loss": -31.57390785217285, "global_step": 28912, "epoch": 238} {"train_loss": -32.16095733642578, "global_step": 28913, "epoch": 238} {"train_loss": -31.91596031188965, "global_step": 28914, "epoch": 238} {"train_loss": -31.643529891967773, "global_step": 28915, "epoch": 238} {"train_loss": -32.00711441040039, "global_step": 28916, "epoch": 238} {"train_loss": -31.510587692260742, "global_step": 28917, "epoch": 238} {"train_loss": -30.929796739058062, "global_step": 28918, "epoch": 238, "val_loss": 2562724.0} {"train_loss": -31.331274032592773, "global_step": 28919, "epoch": 239} {"train_loss": -31.719690322875977, "global_step": 28920, "epoch": 239} {"train_loss": -31.434919357299805, "global_step": 28921, "epoch": 239} {"train_loss": -31.728534698486328, "global_step": 28922, "epoch": 239} {"train_loss": -32.01987838745117, "global_step": 28923, "epoch": 239} {"train_loss": -31.756031036376953, "global_step": 28924, "epoch": 239} {"train_loss": -31.50910758972168, "global_step": 28925, "epoch": 239} {"train_loss": -31.9561824798584, "global_step": 28926, "epoch": 239} {"train_loss": -31.825918197631836, "global_step": 28927, "epoch": 239} {"train_loss": -31.990936279296875, "global_step": 28928, "epoch": 239} {"train_loss": -31.78778076171875, "global_step": 28929, "epoch": 239} {"train_loss": -32.05792999267578, "global_step": 28930, "epoch": 239} {"train_loss": -31.55655860900879, "global_step": 28931, "epoch": 239} {"train_loss": -31.916259765625, "global_step": 28932, "epoch": 239} {"train_loss": -31.961545944213867, "global_step": 28933, "epoch": 239} {"train_loss": -31.674468994140625, "global_step": 28934, "epoch": 239} {"train_loss": -31.7258243560791, "global_step": 28935, "epoch": 239} {"train_loss": -31.719518661499023, "global_step": 28936, "epoch": 239} {"train_loss": -30.587255477905273, "global_step": 28937, "epoch": 239} {"train_loss": -31.97577476501465, "global_step": 28938, "epoch": 239} {"train_loss": -32.15140914916992, "global_step": 28939, "epoch": 239} {"train_loss": -31.85028648376465, "global_step": 28940, "epoch": 239} {"train_loss": -31.431257247924805, "global_step": 28941, "epoch": 239} {"train_loss": -32.28886032104492, "global_step": 28942, "epoch": 239} {"train_loss": -31.829023361206055, "global_step": 28943, "epoch": 239} {"train_loss": -31.359704971313477, "global_step": 28944, "epoch": 239} {"train_loss": -31.191492080688477, "global_step": 28945, "epoch": 239} {"train_loss": -30.360706329345703, "global_step": 28946, "epoch": 239} {"train_loss": -31.744144439697266, "global_step": 28947, "epoch": 239} {"train_loss": -31.477819442749023, "global_step": 28948, "epoch": 239} {"train_loss": -31.6337833404541, "global_step": 28949, "epoch": 239} {"train_loss": -31.69495964050293, "global_step": 28950, "epoch": 239} {"train_loss": -31.674169540405273, "global_step": 28951, "epoch": 239} {"train_loss": -32.16946029663086, "global_step": 28952, "epoch": 239} {"train_loss": -32.37945556640625, "global_step": 28953, "epoch": 239} {"train_loss": -32.594905853271484, "global_step": 28954, "epoch": 239} {"train_loss": -31.903518676757812, "global_step": 28955, "epoch": 239} {"train_loss": -32.089046478271484, "global_step": 28956, "epoch": 239} {"train_loss": -31.932565689086914, "global_step": 28957, "epoch": 239} {"train_loss": -31.756635665893555, "global_step": 28958, "epoch": 239} {"train_loss": -32.60471725463867, "global_step": 28959, "epoch": 239} {"train_loss": -32.13149642944336, "global_step": 28960, "epoch": 239} {"train_loss": -31.935956954956055, "global_step": 28961, "epoch": 239} {"train_loss": -32.168479919433594, "global_step": 28962, "epoch": 239} {"train_loss": -32.6261100769043, "global_step": 28963, "epoch": 239} {"train_loss": -32.147499084472656, "global_step": 28964, "epoch": 239} {"train_loss": -31.400487899780273, "global_step": 28965, "epoch": 239} {"train_loss": -32.23163986206055, "global_step": 28966, "epoch": 239} {"train_loss": -31.58026695251465, "global_step": 28967, "epoch": 239} {"train_loss": -31.54408073425293, "global_step": 28968, "epoch": 239} {"train_loss": -29.547494888305664, "global_step": 28969, "epoch": 239} {"train_loss": -23.672388076782227, "global_step": 28970, "epoch": 239} {"train_loss": -19.375307083129883, "global_step": 28971, "epoch": 239} {"train_loss": -26.31061363220215, "global_step": 28972, "epoch": 239} {"train_loss": -31.624975204467773, "global_step": 28973, "epoch": 239} {"train_loss": -27.745044708251953, "global_step": 28974, "epoch": 239} {"train_loss": -30.060007095336914, "global_step": 28975, "epoch": 239} {"train_loss": -29.434850692749023, "global_step": 28976, "epoch": 239} {"train_loss": -29.234949111938477, "global_step": 28977, "epoch": 239} {"train_loss": -29.820636749267578, "global_step": 28978, "epoch": 239} {"train_loss": -30.366165161132812, "global_step": 28979, "epoch": 239} {"train_loss": -30.77457046508789, "global_step": 28980, "epoch": 239} {"train_loss": -31.20271873474121, "global_step": 28981, "epoch": 239} {"train_loss": -29.880643844604492, "global_step": 28982, "epoch": 239} {"train_loss": -31.60593032836914, "global_step": 28983, "epoch": 239} {"train_loss": -31.600112915039062, "global_step": 28984, "epoch": 239} {"train_loss": -31.08935546875, "global_step": 28985, "epoch": 239} {"train_loss": -31.204269409179688, "global_step": 28986, "epoch": 239} {"train_loss": -32.11848449707031, "global_step": 28987, "epoch": 239} {"train_loss": -31.303564071655273, "global_step": 28988, "epoch": 239} {"train_loss": -31.526004791259766, "global_step": 28989, "epoch": 239} {"train_loss": -31.184362411499023, "global_step": 28990, "epoch": 239} {"train_loss": -31.33551025390625, "global_step": 28991, "epoch": 239} {"train_loss": -32.15301513671875, "global_step": 28992, "epoch": 239} {"train_loss": -31.83319664001465, "global_step": 28993, "epoch": 239} {"train_loss": -31.40534782409668, "global_step": 28994, "epoch": 239} {"train_loss": -32.02254867553711, "global_step": 28995, "epoch": 239} {"train_loss": -31.91147232055664, "global_step": 28996, "epoch": 239} {"train_loss": -31.12760353088379, "global_step": 28997, "epoch": 239} {"train_loss": -31.89265251159668, "global_step": 28998, "epoch": 239} {"train_loss": -31.985280990600586, "global_step": 28999, "epoch": 239} {"train_loss": -31.275983810424805, "global_step": 29000, "epoch": 239} {"train_loss": -31.43817710876465, "global_step": 29001, "epoch": 239} {"train_loss": -31.85272216796875, "global_step": 29002, "epoch": 239} {"train_loss": -31.93181800842285, "global_step": 29003, "epoch": 239} {"train_loss": -31.80242347717285, "global_step": 29004, "epoch": 239} {"train_loss": -32.15449905395508, "global_step": 29005, "epoch": 239} {"train_loss": -31.994550704956055, "global_step": 29006, "epoch": 239} {"train_loss": -31.97804832458496, "global_step": 29007, "epoch": 239} {"train_loss": -32.04043197631836, "global_step": 29008, "epoch": 239} {"train_loss": -31.90511131286621, "global_step": 29009, "epoch": 239} {"train_loss": -31.424484252929688, "global_step": 29010, "epoch": 239} {"train_loss": -31.7082462310791, "global_step": 29011, "epoch": 239} {"train_loss": -30.98794937133789, "global_step": 29012, "epoch": 239} {"train_loss": -28.197751998901367, "global_step": 29013, "epoch": 239} {"train_loss": -16.154088973999023, "global_step": 29014, "epoch": 239} {"train_loss": -7.804257392883301, "global_step": 29015, "epoch": 239} {"train_loss": -24.724050521850586, "global_step": 29016, "epoch": 239} {"train_loss": -26.5721378326416, "global_step": 29017, "epoch": 239} {"train_loss": -29.197345733642578, "global_step": 29018, "epoch": 239} {"train_loss": -25.55036163330078, "global_step": 29019, "epoch": 239} {"train_loss": -30.19976234436035, "global_step": 29020, "epoch": 239} {"train_loss": -27.00404167175293, "global_step": 29021, "epoch": 239} {"train_loss": -29.03826904296875, "global_step": 29022, "epoch": 239} {"train_loss": -31.061609268188477, "global_step": 29023, "epoch": 239} {"train_loss": -29.50287437438965, "global_step": 29024, "epoch": 239} {"train_loss": -28.226062774658203, "global_step": 29025, "epoch": 239} {"train_loss": -30.58729362487793, "global_step": 29026, "epoch": 239} {"train_loss": -30.356937408447266, "global_step": 29027, "epoch": 239} {"train_loss": -29.604040145874023, "global_step": 29028, "epoch": 239} {"train_loss": -29.51923942565918, "global_step": 29029, "epoch": 239} {"train_loss": -30.301420211791992, "global_step": 29030, "epoch": 239} {"train_loss": -30.36882972717285, "global_step": 29031, "epoch": 239} {"train_loss": -31.04852294921875, "global_step": 29032, "epoch": 239} {"train_loss": -30.373184204101562, "global_step": 29033, "epoch": 239} {"train_loss": -30.498926162719727, "global_step": 29034, "epoch": 239} {"train_loss": -30.20840835571289, "global_step": 29035, "epoch": 239} {"train_loss": -30.629613876342773, "global_step": 29036, "epoch": 239} {"train_loss": -30.890554428100586, "global_step": 29037, "epoch": 239} {"train_loss": -31.323108673095703, "global_step": 29038, "epoch": 239} {"train_loss": -30.569175113331188, "global_step": 29039, "epoch": 239, "val_loss": 2714481.25} {"train_loss": -30.772480010986328, "global_step": 29040, "epoch": 240} {"train_loss": -30.924320220947266, "global_step": 29041, "epoch": 240} {"train_loss": -31.2668514251709, "global_step": 29042, "epoch": 240} {"train_loss": -31.08320426940918, "global_step": 29043, "epoch": 240} {"train_loss": -31.266345977783203, "global_step": 29044, "epoch": 240} {"train_loss": -31.20745849609375, "global_step": 29045, "epoch": 240} {"train_loss": -31.28566551208496, "global_step": 29046, "epoch": 240} {"train_loss": -31.295190811157227, "global_step": 29047, "epoch": 240} {"train_loss": -31.23817253112793, "global_step": 29048, "epoch": 240} {"train_loss": -31.517414093017578, "global_step": 29049, "epoch": 240} {"train_loss": -31.344228744506836, "global_step": 29050, "epoch": 240} {"train_loss": -31.69866943359375, "global_step": 29051, "epoch": 240} {"train_loss": -31.865676879882812, "global_step": 29052, "epoch": 240} {"train_loss": -31.762500762939453, "global_step": 29053, "epoch": 240} {"train_loss": -31.822622299194336, "global_step": 29054, "epoch": 240} {"train_loss": -32.02169418334961, "global_step": 29055, "epoch": 240} {"train_loss": -31.857900619506836, "global_step": 29056, "epoch": 240} {"train_loss": -32.12934112548828, "global_step": 29057, "epoch": 240} {"train_loss": -32.023406982421875, "global_step": 29058, "epoch": 240} {"train_loss": -31.761646270751953, "global_step": 29059, "epoch": 240} {"train_loss": -32.012142181396484, "global_step": 29060, "epoch": 240} {"train_loss": -32.03895568847656, "global_step": 29061, "epoch": 240} {"train_loss": -31.780492782592773, "global_step": 29062, "epoch": 240} {"train_loss": -31.983259201049805, "global_step": 29063, "epoch": 240} {"train_loss": -32.0273323059082, "global_step": 29064, "epoch": 240} {"train_loss": -31.95155906677246, "global_step": 29065, "epoch": 240} {"train_loss": -31.503692626953125, "global_step": 29066, "epoch": 240} {"train_loss": -32.16473388671875, "global_step": 29067, "epoch": 240} {"train_loss": -32.007965087890625, "global_step": 29068, "epoch": 240} {"train_loss": -31.7537841796875, "global_step": 29069, "epoch": 240} {"train_loss": -31.96246337890625, "global_step": 29070, "epoch": 240} {"train_loss": -30.93755531311035, "global_step": 29071, "epoch": 240} {"train_loss": -27.695148468017578, "global_step": 29072, "epoch": 240} {"train_loss": -19.87001609802246, "global_step": 29073, "epoch": 240} {"train_loss": -14.951705932617188, "global_step": 29074, "epoch": 240} {"train_loss": -27.947967529296875, "global_step": 29075, "epoch": 240} {"train_loss": -26.83991813659668, "global_step": 29076, "epoch": 240} {"train_loss": -26.284839630126953, "global_step": 29077, "epoch": 240} {"train_loss": -28.722333908081055, "global_step": 29078, "epoch": 240} {"train_loss": -29.480621337890625, "global_step": 29079, "epoch": 240} {"train_loss": -28.57162857055664, "global_step": 29080, "epoch": 240} {"train_loss": -29.30246925354004, "global_step": 29081, "epoch": 240} {"train_loss": -30.211267471313477, "global_step": 29082, "epoch": 240} {"train_loss": -28.5821590423584, "global_step": 29083, "epoch": 240} {"train_loss": -29.865392684936523, "global_step": 29084, "epoch": 240} {"train_loss": -30.15582847595215, "global_step": 29085, "epoch": 240} {"train_loss": -30.13227653503418, "global_step": 29086, "epoch": 240} {"train_loss": -29.347867965698242, "global_step": 29087, "epoch": 240} {"train_loss": -29.36244010925293, "global_step": 29088, "epoch": 240} {"train_loss": -30.785663604736328, "global_step": 29089, "epoch": 240} {"train_loss": -29.207056045532227, "global_step": 29090, "epoch": 240} {"train_loss": -30.084585189819336, "global_step": 29091, "epoch": 240} {"train_loss": -29.987852096557617, "global_step": 29092, "epoch": 240} {"train_loss": -30.499170303344727, "global_step": 29093, "epoch": 240} {"train_loss": -30.017929077148438, "global_step": 29094, "epoch": 240} {"train_loss": -30.3102970123291, "global_step": 29095, "epoch": 240} {"train_loss": -30.54604148864746, "global_step": 29096, "epoch": 240} {"train_loss": -30.870819091796875, "global_step": 29097, "epoch": 240} {"train_loss": -30.231393814086914, "global_step": 29098, "epoch": 240} {"train_loss": -30.0765438079834, "global_step": 29099, "epoch": 240} {"train_loss": -30.63862419128418, "global_step": 29100, "epoch": 240} {"train_loss": -30.05365562438965, "global_step": 29101, "epoch": 240} {"train_loss": -30.4954891204834, "global_step": 29102, "epoch": 240} {"train_loss": -30.095294952392578, "global_step": 29103, "epoch": 240} {"train_loss": -31.103866577148438, "global_step": 29104, "epoch": 240} {"train_loss": -30.34339714050293, "global_step": 29105, "epoch": 240} {"train_loss": -30.679290771484375, "global_step": 29106, "epoch": 240} {"train_loss": -30.867324829101562, "global_step": 29107, "epoch": 240} {"train_loss": -30.5398006439209, "global_step": 29108, "epoch": 240} {"train_loss": -31.193571090698242, "global_step": 29109, "epoch": 240} {"train_loss": -31.16065788269043, "global_step": 29110, "epoch": 240} {"train_loss": -31.2053279876709, "global_step": 29111, "epoch": 240} {"train_loss": -31.340534210205078, "global_step": 29112, "epoch": 240} {"train_loss": -31.255125045776367, "global_step": 29113, "epoch": 240} {"train_loss": -31.71864128112793, "global_step": 29114, "epoch": 240} {"train_loss": -31.217138290405273, "global_step": 29115, "epoch": 240} {"train_loss": -31.324172973632812, "global_step": 29116, "epoch": 240} {"train_loss": -31.604572296142578, "global_step": 29117, "epoch": 240} {"train_loss": -31.616352081298828, "global_step": 29118, "epoch": 240} {"train_loss": -31.310216903686523, "global_step": 29119, "epoch": 240} {"train_loss": -31.8542537689209, "global_step": 29120, "epoch": 240} {"train_loss": -31.591230392456055, "global_step": 29121, "epoch": 240} {"train_loss": -31.495519638061523, "global_step": 29122, "epoch": 240} {"train_loss": -31.38641357421875, "global_step": 29123, "epoch": 240} {"train_loss": -31.448577880859375, "global_step": 29124, "epoch": 240} {"train_loss": -32.061946868896484, "global_step": 29125, "epoch": 240} {"train_loss": -31.78133201599121, "global_step": 29126, "epoch": 240} {"train_loss": -32.15287399291992, "global_step": 29127, "epoch": 240} {"train_loss": -31.9443302154541, "global_step": 29128, "epoch": 240} {"train_loss": -31.99261474609375, "global_step": 29129, "epoch": 240} {"train_loss": -31.92962074279785, "global_step": 29130, "epoch": 240} {"train_loss": -31.987293243408203, "global_step": 29131, "epoch": 240} {"train_loss": -31.745147705078125, "global_step": 29132, "epoch": 240} {"train_loss": -30.94968605041504, "global_step": 29133, "epoch": 240} {"train_loss": -31.411291122436523, "global_step": 29134, "epoch": 240} {"train_loss": -32.22509002685547, "global_step": 29135, "epoch": 240} {"train_loss": -31.72626304626465, "global_step": 29136, "epoch": 240} {"train_loss": -31.30426597595215, "global_step": 29137, "epoch": 240} {"train_loss": -32.23401641845703, "global_step": 29138, "epoch": 240} {"train_loss": -31.515045166015625, "global_step": 29139, "epoch": 240} {"train_loss": -32.202598571777344, "global_step": 29140, "epoch": 240} {"train_loss": -31.66213035583496, "global_step": 29141, "epoch": 240} {"train_loss": -32.1158447265625, "global_step": 29142, "epoch": 240} {"train_loss": -31.800689697265625, "global_step": 29143, "epoch": 240} {"train_loss": -31.895475387573242, "global_step": 29144, "epoch": 240} {"train_loss": -31.91097068786621, "global_step": 29145, "epoch": 240} {"train_loss": -32.0559196472168, "global_step": 29146, "epoch": 240} {"train_loss": -31.88043212890625, "global_step": 29147, "epoch": 240} {"train_loss": -31.60727882385254, "global_step": 29148, "epoch": 240} {"train_loss": -31.6669979095459, "global_step": 29149, "epoch": 240} {"train_loss": -31.298938751220703, "global_step": 29150, "epoch": 240} {"train_loss": -29.75146484375, "global_step": 29151, "epoch": 240} {"train_loss": -25.325443267822266, "global_step": 29152, "epoch": 240} {"train_loss": -13.31091594696045, "global_step": 29153, "epoch": 240} {"train_loss": 11.048474311828613, "global_step": 29154, "epoch": 240} {"train_loss": -22.83603858947754, "global_step": 29155, "epoch": 240} {"train_loss": -16.05515480041504, "global_step": 29156, "epoch": 240} {"train_loss": -25.275487899780273, "global_step": 29157, "epoch": 240} {"train_loss": -19.924274444580078, "global_step": 29158, "epoch": 240} {"train_loss": -30.426807403564453, "global_step": 29159, "epoch": 240} {"train_loss": -29.88380659119157, "global_step": 29160, "epoch": 240, "val_loss": 2543492.25} {"train_loss": -25.783544540405273, "global_step": 29161, "epoch": 241} {"train_loss": -28.449384689331055, "global_step": 29162, "epoch": 241} {"train_loss": -30.70990562438965, "global_step": 29163, "epoch": 241} {"train_loss": -29.53839111328125, "global_step": 29164, "epoch": 241} {"train_loss": -28.00636100769043, "global_step": 29165, "epoch": 241} {"train_loss": -28.4045352935791, "global_step": 29166, "epoch": 241} {"train_loss": -29.717620849609375, "global_step": 29167, "epoch": 241} {"train_loss": -29.88457679748535, "global_step": 29168, "epoch": 241} {"train_loss": -30.353668212890625, "global_step": 29169, "epoch": 241} {"train_loss": -30.002883911132812, "global_step": 29170, "epoch": 241} {"train_loss": -30.086164474487305, "global_step": 29171, "epoch": 241} {"train_loss": -28.0859432220459, "global_step": 29172, "epoch": 241} {"train_loss": -29.419113159179688, "global_step": 29173, "epoch": 241} {"train_loss": -29.71144676208496, "global_step": 29174, "epoch": 241} {"train_loss": -29.59852409362793, "global_step": 29175, "epoch": 241} {"train_loss": -29.38490104675293, "global_step": 29176, "epoch": 241} {"train_loss": -29.018808364868164, "global_step": 29177, "epoch": 241} {"train_loss": -27.0862979888916, "global_step": 29178, "epoch": 241} {"train_loss": -29.945541381835938, "global_step": 29179, "epoch": 241} {"train_loss": -27.094146728515625, "global_step": 29180, "epoch": 241} {"train_loss": -29.211200714111328, "global_step": 29181, "epoch": 241} {"train_loss": -28.3149471282959, "global_step": 29182, "epoch": 241} {"train_loss": -29.851160049438477, "global_step": 29183, "epoch": 241} {"train_loss": -28.27947425842285, "global_step": 29184, "epoch": 241} {"train_loss": -29.847003936767578, "global_step": 29185, "epoch": 241} {"train_loss": -30.21417236328125, "global_step": 29186, "epoch": 241} {"train_loss": -28.842214584350586, "global_step": 29187, "epoch": 241} {"train_loss": -29.959177017211914, "global_step": 29188, "epoch": 241} {"train_loss": -30.164281845092773, "global_step": 29189, "epoch": 241} {"train_loss": -30.012128829956055, "global_step": 29190, "epoch": 241} {"train_loss": -29.913415908813477, "global_step": 29191, "epoch": 241} {"train_loss": -29.698591232299805, "global_step": 29192, "epoch": 241} {"train_loss": -30.332685470581055, "global_step": 29193, "epoch": 241} {"train_loss": -30.20912742614746, "global_step": 29194, "epoch": 241} {"train_loss": -30.521997451782227, "global_step": 29195, "epoch": 241} {"train_loss": -30.660781860351562, "global_step": 29196, "epoch": 241} {"train_loss": -30.20240592956543, "global_step": 29197, "epoch": 241} {"train_loss": -30.339679718017578, "global_step": 29198, "epoch": 241} {"train_loss": -30.430654525756836, "global_step": 29199, "epoch": 241} {"train_loss": -30.526172637939453, "global_step": 29200, "epoch": 241} {"train_loss": -30.560287475585938, "global_step": 29201, "epoch": 241} {"train_loss": -31.03095817565918, "global_step": 29202, "epoch": 241} {"train_loss": -29.796300888061523, "global_step": 29203, "epoch": 241} {"train_loss": -31.06012535095215, "global_step": 29204, "epoch": 241} {"train_loss": -31.450153350830078, "global_step": 29205, "epoch": 241} {"train_loss": -30.65365982055664, "global_step": 29206, "epoch": 241} {"train_loss": -31.271982192993164, "global_step": 29207, "epoch": 241} {"train_loss": -31.033798217773438, "global_step": 29208, "epoch": 241} {"train_loss": -31.034616470336914, "global_step": 29209, "epoch": 241} {"train_loss": -31.216876983642578, "global_step": 29210, "epoch": 241} {"train_loss": -30.640933990478516, "global_step": 29211, "epoch": 241} {"train_loss": -31.3317928314209, "global_step": 29212, "epoch": 241} {"train_loss": -30.840612411499023, "global_step": 29213, "epoch": 241} {"train_loss": -31.266157150268555, "global_step": 29214, "epoch": 241} {"train_loss": -29.13605308532715, "global_step": 29215, "epoch": 241} {"train_loss": -30.806598663330078, "global_step": 29216, "epoch": 241} {"train_loss": -31.16304588317871, "global_step": 29217, "epoch": 241} {"train_loss": -30.584096908569336, "global_step": 29218, "epoch": 241} {"train_loss": -31.114225387573242, "global_step": 29219, "epoch": 241} {"train_loss": -30.576467514038086, "global_step": 29220, "epoch": 241} {"train_loss": -30.420156478881836, "global_step": 29221, "epoch": 241} {"train_loss": -30.354846954345703, "global_step": 29222, "epoch": 241} {"train_loss": -31.298736572265625, "global_step": 29223, "epoch": 241} {"train_loss": -31.172521591186523, "global_step": 29224, "epoch": 241} {"train_loss": -31.627145767211914, "global_step": 29225, "epoch": 241} {"train_loss": -29.480377197265625, "global_step": 29226, "epoch": 241} {"train_loss": -30.26490592956543, "global_step": 29227, "epoch": 241} {"train_loss": -29.683277130126953, "global_step": 29228, "epoch": 241} {"train_loss": -31.09156608581543, "global_step": 29229, "epoch": 241} {"train_loss": -30.859363555908203, "global_step": 29230, "epoch": 241} {"train_loss": -31.3951358795166, "global_step": 29231, "epoch": 241} {"train_loss": -30.729694366455078, "global_step": 29232, "epoch": 241} {"train_loss": -30.767822265625, "global_step": 29233, "epoch": 241} {"train_loss": -30.6716365814209, "global_step": 29234, "epoch": 241} {"train_loss": -30.932973861694336, "global_step": 29235, "epoch": 241} {"train_loss": -31.01861000061035, "global_step": 29236, "epoch": 241} {"train_loss": -31.517541885375977, "global_step": 29237, "epoch": 241} {"train_loss": -30.954015731811523, "global_step": 29238, "epoch": 241} {"train_loss": -31.22246742248535, "global_step": 29239, "epoch": 241} {"train_loss": -29.9504451751709, "global_step": 29240, "epoch": 241} {"train_loss": -31.495874404907227, "global_step": 29241, "epoch": 241} {"train_loss": -30.677703857421875, "global_step": 29242, "epoch": 241} {"train_loss": -31.554922103881836, "global_step": 29243, "epoch": 241} {"train_loss": -31.171051025390625, "global_step": 29244, "epoch": 241} {"train_loss": -31.169788360595703, "global_step": 29245, "epoch": 241} {"train_loss": -31.426013946533203, "global_step": 29246, "epoch": 241} {"train_loss": -31.24164390563965, "global_step": 29247, "epoch": 241} {"train_loss": -31.69539451599121, "global_step": 29248, "epoch": 241} {"train_loss": -31.33192253112793, "global_step": 29249, "epoch": 241} {"train_loss": -31.551294326782227, "global_step": 29250, "epoch": 241} {"train_loss": -31.37554931640625, "global_step": 29251, "epoch": 241} {"train_loss": -31.11488914489746, "global_step": 29252, "epoch": 241} {"train_loss": -31.318708419799805, "global_step": 29253, "epoch": 241} {"train_loss": -31.29224967956543, "global_step": 29254, "epoch": 241} {"train_loss": -31.437652587890625, "global_step": 29255, "epoch": 241} {"train_loss": -31.597946166992188, "global_step": 29256, "epoch": 241} {"train_loss": -31.376331329345703, "global_step": 29257, "epoch": 241} {"train_loss": -31.752517700195312, "global_step": 29258, "epoch": 241} {"train_loss": -31.782896041870117, "global_step": 29259, "epoch": 241} {"train_loss": -31.577783584594727, "global_step": 29260, "epoch": 241} {"train_loss": -32.26829528808594, "global_step": 29261, "epoch": 241} {"train_loss": -31.93462562561035, "global_step": 29262, "epoch": 241} {"train_loss": -31.5161190032959, "global_step": 29263, "epoch": 241} {"train_loss": -32.183135986328125, "global_step": 29264, "epoch": 241} {"train_loss": -32.2325325012207, "global_step": 29265, "epoch": 241} {"train_loss": -31.787750244140625, "global_step": 29266, "epoch": 241} {"train_loss": -31.952442169189453, "global_step": 29267, "epoch": 241} {"train_loss": -31.973926544189453, "global_step": 29268, "epoch": 241} {"train_loss": -32.29014205932617, "global_step": 29269, "epoch": 241} {"train_loss": -32.38644790649414, "global_step": 29270, "epoch": 241} {"train_loss": -32.138729095458984, "global_step": 29271, "epoch": 241} {"train_loss": -32.00312423706055, "global_step": 29272, "epoch": 241} {"train_loss": -31.5454158782959, "global_step": 29273, "epoch": 241} {"train_loss": -31.616010665893555, "global_step": 29274, "epoch": 241} {"train_loss": -31.742969512939453, "global_step": 29275, "epoch": 241} {"train_loss": -30.26569938659668, "global_step": 29276, "epoch": 241} {"train_loss": -25.846887588500977, "global_step": 29277, "epoch": 241} {"train_loss": -26.76191520690918, "global_step": 29278, "epoch": 241} {"train_loss": -30.255308151245117, "global_step": 29279, "epoch": 241} {"train_loss": -29.78897476196289, "global_step": 29280, "epoch": 241} {"train_loss": -30.49385488525895, "global_step": 29281, "epoch": 241, "val_loss": 2686489.25} {"train_loss": -30.828458786010742, "global_step": 29282, "epoch": 242} {"train_loss": -29.696561813354492, "global_step": 29283, "epoch": 242} {"train_loss": -29.886743545532227, "global_step": 29284, "epoch": 242} {"train_loss": -31.6798038482666, "global_step": 29285, "epoch": 242} {"train_loss": -30.6370792388916, "global_step": 29286, "epoch": 242} {"train_loss": -29.229907989501953, "global_step": 29287, "epoch": 242} {"train_loss": -30.737585067749023, "global_step": 29288, "epoch": 242} {"train_loss": -30.46489906311035, "global_step": 29289, "epoch": 242} {"train_loss": -31.334461212158203, "global_step": 29290, "epoch": 242} {"train_loss": -30.340417861938477, "global_step": 29291, "epoch": 242} {"train_loss": -30.768634796142578, "global_step": 29292, "epoch": 242} {"train_loss": -31.039514541625977, "global_step": 29293, "epoch": 242} {"train_loss": -30.770782470703125, "global_step": 29294, "epoch": 242} {"train_loss": -30.755659103393555, "global_step": 29295, "epoch": 242} {"train_loss": -32.084224700927734, "global_step": 29296, "epoch": 242} {"train_loss": -31.21685791015625, "global_step": 29297, "epoch": 242} {"train_loss": -31.346216201782227, "global_step": 29298, "epoch": 242} {"train_loss": -31.451492309570312, "global_step": 29299, "epoch": 242} {"train_loss": -31.481916427612305, "global_step": 29300, "epoch": 242} {"train_loss": -31.40162467956543, "global_step": 29301, "epoch": 242} {"train_loss": -31.279821395874023, "global_step": 29302, "epoch": 242} {"train_loss": -32.14892578125, "global_step": 29303, "epoch": 242} {"train_loss": -31.80731773376465, "global_step": 29304, "epoch": 242} {"train_loss": -31.467248916625977, "global_step": 29305, "epoch": 242} {"train_loss": -31.750171661376953, "global_step": 29306, "epoch": 242} {"train_loss": -31.526870727539062, "global_step": 29307, "epoch": 242} {"train_loss": -31.562829971313477, "global_step": 29308, "epoch": 242} {"train_loss": -31.834253311157227, "global_step": 29309, "epoch": 242} {"train_loss": -32.39836502075195, "global_step": 29310, "epoch": 242} {"train_loss": -31.808700561523438, "global_step": 29311, "epoch": 242} {"train_loss": -31.788223266601562, "global_step": 29312, "epoch": 242} {"train_loss": -32.061546325683594, "global_step": 29313, "epoch": 242} {"train_loss": -31.806232452392578, "global_step": 29314, "epoch": 242} {"train_loss": -32.09341049194336, "global_step": 29315, "epoch": 242} {"train_loss": -31.742523193359375, "global_step": 29316, "epoch": 242} {"train_loss": -31.856250762939453, "global_step": 29317, "epoch": 242} {"train_loss": -32.30579376220703, "global_step": 29318, "epoch": 242} {"train_loss": -32.30667495727539, "global_step": 29319, "epoch": 242} {"train_loss": -31.72944450378418, "global_step": 29320, "epoch": 242} {"train_loss": -32.35625076293945, "global_step": 29321, "epoch": 242} {"train_loss": -31.02436637878418, "global_step": 29322, "epoch": 242} {"train_loss": -30.786157608032227, "global_step": 29323, "epoch": 242} {"train_loss": -29.51051139831543, "global_step": 29324, "epoch": 242} {"train_loss": -30.496713638305664, "global_step": 29325, "epoch": 242} {"train_loss": -30.870670318603516, "global_step": 29326, "epoch": 242} {"train_loss": -31.727407455444336, "global_step": 29327, "epoch": 242} {"train_loss": -30.306848526000977, "global_step": 29328, "epoch": 242} {"train_loss": -29.506900787353516, "global_step": 29329, "epoch": 242} {"train_loss": -31.471704483032227, "global_step": 29330, "epoch": 242} {"train_loss": -30.61475944519043, "global_step": 29331, "epoch": 242} {"train_loss": -30.774845123291016, "global_step": 29332, "epoch": 242} {"train_loss": -29.680500030517578, "global_step": 29333, "epoch": 242} {"train_loss": -31.3796329498291, "global_step": 29334, "epoch": 242} {"train_loss": -29.842559814453125, "global_step": 29335, "epoch": 242} {"train_loss": -31.252399444580078, "global_step": 29336, "epoch": 242} {"train_loss": -30.71113395690918, "global_step": 29337, "epoch": 242} {"train_loss": -30.754230499267578, "global_step": 29338, "epoch": 242} {"train_loss": -30.32642936706543, "global_step": 29339, "epoch": 242} {"train_loss": -30.98915672302246, "global_step": 29340, "epoch": 242} {"train_loss": -31.0526180267334, "global_step": 29341, "epoch": 242} {"train_loss": -31.498029708862305, "global_step": 29342, "epoch": 242} {"train_loss": -31.8161678314209, "global_step": 29343, "epoch": 242} {"train_loss": -31.724172592163086, "global_step": 29344, "epoch": 242} {"train_loss": -31.219106674194336, "global_step": 29345, "epoch": 242} {"train_loss": -31.5814266204834, "global_step": 29346, "epoch": 242} {"train_loss": -31.426794052124023, "global_step": 29347, "epoch": 242} {"train_loss": -31.290571212768555, "global_step": 29348, "epoch": 242} {"train_loss": -31.53866958618164, "global_step": 29349, "epoch": 242} {"train_loss": -31.456212997436523, "global_step": 29350, "epoch": 242} {"train_loss": -31.70965576171875, "global_step": 29351, "epoch": 242} {"train_loss": -31.829187393188477, "global_step": 29352, "epoch": 242} {"train_loss": -31.115461349487305, "global_step": 29353, "epoch": 242} {"train_loss": -30.96748924255371, "global_step": 29354, "epoch": 242} {"train_loss": -30.897907257080078, "global_step": 29355, "epoch": 242} {"train_loss": -31.376733779907227, "global_step": 29356, "epoch": 242} {"train_loss": -31.870819091796875, "global_step": 29357, "epoch": 242} {"train_loss": -31.829442977905273, "global_step": 29358, "epoch": 242} {"train_loss": -31.405115127563477, "global_step": 29359, "epoch": 242} {"train_loss": -31.58990478515625, "global_step": 29360, "epoch": 242} {"train_loss": -31.898563385009766, "global_step": 29361, "epoch": 242} {"train_loss": -31.54729652404785, "global_step": 29362, "epoch": 242} {"train_loss": -31.990711212158203, "global_step": 29363, "epoch": 242} {"train_loss": -31.85259437561035, "global_step": 29364, "epoch": 242} {"train_loss": -31.858810424804688, "global_step": 29365, "epoch": 242} {"train_loss": -32.17028045654297, "global_step": 29366, "epoch": 242} {"train_loss": -32.22806930541992, "global_step": 29367, "epoch": 242} {"train_loss": -32.0920524597168, "global_step": 29368, "epoch": 242} {"train_loss": -31.941726684570312, "global_step": 29369, "epoch": 242} {"train_loss": -31.92579460144043, "global_step": 29370, "epoch": 242} {"train_loss": -32.264827728271484, "global_step": 29371, "epoch": 242} {"train_loss": -31.761754989624023, "global_step": 29372, "epoch": 242} {"train_loss": -32.42439270019531, "global_step": 29373, "epoch": 242} {"train_loss": -32.0506591796875, "global_step": 29374, "epoch": 242} {"train_loss": -32.17973709106445, "global_step": 29375, "epoch": 242} {"train_loss": -32.4588623046875, "global_step": 29376, "epoch": 242} {"train_loss": -32.03518295288086, "global_step": 29377, "epoch": 242} {"train_loss": -31.770389556884766, "global_step": 29378, "epoch": 242} {"train_loss": -32.33182907104492, "global_step": 29379, "epoch": 242} {"train_loss": -31.1577205657959, "global_step": 29380, "epoch": 242} {"train_loss": -30.694971084594727, "global_step": 29381, "epoch": 242} {"train_loss": -30.6258544921875, "global_step": 29382, "epoch": 242} {"train_loss": -28.213369369506836, "global_step": 29383, "epoch": 242} {"train_loss": -30.06561851501465, "global_step": 29384, "epoch": 242} {"train_loss": -30.5711612701416, "global_step": 29385, "epoch": 242} {"train_loss": -28.69288444519043, "global_step": 29386, "epoch": 242} {"train_loss": -31.64118766784668, "global_step": 29387, "epoch": 242} {"train_loss": -30.102407455444336, "global_step": 29388, "epoch": 242} {"train_loss": -30.83345603942871, "global_step": 29389, "epoch": 242} {"train_loss": -30.518796920776367, "global_step": 29390, "epoch": 242} {"train_loss": -31.054061889648438, "global_step": 29391, "epoch": 242} {"train_loss": -29.717809677124023, "global_step": 29392, "epoch": 242} {"train_loss": -26.7718563079834, "global_step": 29393, "epoch": 242} {"train_loss": -27.341949462890625, "global_step": 29394, "epoch": 242} {"train_loss": -28.39291763305664, "global_step": 29395, "epoch": 242} {"train_loss": -31.023242950439453, "global_step": 29396, "epoch": 242} {"train_loss": -30.1391544342041, "global_step": 29397, "epoch": 242} {"train_loss": -30.36052894592285, "global_step": 29398, "epoch": 242} {"train_loss": -31.450149536132812, "global_step": 29399, "epoch": 242} {"train_loss": -30.40201759338379, "global_step": 29400, "epoch": 242} {"train_loss": -30.960708618164062, "global_step": 29401, "epoch": 242} {"train_loss": -31.128831563902295, "global_step": 29402, "epoch": 242, "val_loss": 2816853.25} {"train_loss": -31.036762237548828, "global_step": 29403, "epoch": 243} {"train_loss": -31.30548667907715, "global_step": 29404, "epoch": 243} {"train_loss": -30.799665451049805, "global_step": 29405, "epoch": 243} {"train_loss": -31.79719352722168, "global_step": 29406, "epoch": 243} {"train_loss": -31.3648624420166, "global_step": 29407, "epoch": 243} {"train_loss": -31.64060401916504, "global_step": 29408, "epoch": 243} {"train_loss": -31.33441734313965, "global_step": 29409, "epoch": 243} {"train_loss": -31.63484001159668, "global_step": 29410, "epoch": 243} {"train_loss": -31.321882247924805, "global_step": 29411, "epoch": 243} {"train_loss": -31.8256893157959, "global_step": 29412, "epoch": 243} {"train_loss": -31.600818634033203, "global_step": 29413, "epoch": 243} {"train_loss": -31.045154571533203, "global_step": 29414, "epoch": 243} {"train_loss": -31.506698608398438, "global_step": 29415, "epoch": 243} {"train_loss": -31.7783145904541, "global_step": 29416, "epoch": 243} {"train_loss": -31.962385177612305, "global_step": 29417, "epoch": 243} {"train_loss": -31.27498435974121, "global_step": 29418, "epoch": 243} {"train_loss": -31.690933227539062, "global_step": 29419, "epoch": 243} {"train_loss": -30.650592803955078, "global_step": 29420, "epoch": 243} {"train_loss": -31.706430435180664, "global_step": 29421, "epoch": 243} {"train_loss": -31.92664909362793, "global_step": 29422, "epoch": 243} {"train_loss": -31.70014762878418, "global_step": 29423, "epoch": 243} {"train_loss": -31.725513458251953, "global_step": 29424, "epoch": 243} {"train_loss": -31.460006713867188, "global_step": 29425, "epoch": 243} {"train_loss": -31.68280601501465, "global_step": 29426, "epoch": 243} {"train_loss": -31.790637969970703, "global_step": 29427, "epoch": 243} {"train_loss": -31.94740104675293, "global_step": 29428, "epoch": 243} {"train_loss": -31.99908447265625, "global_step": 29429, "epoch": 243} {"train_loss": -32.16408920288086, "global_step": 29430, "epoch": 243} {"train_loss": -32.5792236328125, "global_step": 29431, "epoch": 243} {"train_loss": -32.26937484741211, "global_step": 29432, "epoch": 243} {"train_loss": -32.505088806152344, "global_step": 29433, "epoch": 243} {"train_loss": -32.5026969909668, "global_step": 29434, "epoch": 243} {"train_loss": -32.6474494934082, "global_step": 29435, "epoch": 243} {"train_loss": -32.520320892333984, "global_step": 29436, "epoch": 243} {"train_loss": -32.541255950927734, "global_step": 29437, "epoch": 243} {"train_loss": -31.99762535095215, "global_step": 29438, "epoch": 243} {"train_loss": -32.09373092651367, "global_step": 29439, "epoch": 243} {"train_loss": -31.871368408203125, "global_step": 29440, "epoch": 243} {"train_loss": -32.00287628173828, "global_step": 29441, "epoch": 243} {"train_loss": -32.68569564819336, "global_step": 29442, "epoch": 243} {"train_loss": -31.9442195892334, "global_step": 29443, "epoch": 243} {"train_loss": -32.532493591308594, "global_step": 29444, "epoch": 243} {"train_loss": -32.20589065551758, "global_step": 29445, "epoch": 243} {"train_loss": -32.483192443847656, "global_step": 29446, "epoch": 243} {"train_loss": -31.991580963134766, "global_step": 29447, "epoch": 243} {"train_loss": -31.71270751953125, "global_step": 29448, "epoch": 243} {"train_loss": -32.3637809753418, "global_step": 29449, "epoch": 243} {"train_loss": -32.38761520385742, "global_step": 29450, "epoch": 243} {"train_loss": -31.839338302612305, "global_step": 29451, "epoch": 243} {"train_loss": -31.612640380859375, "global_step": 29452, "epoch": 243} {"train_loss": -30.524816513061523, "global_step": 29453, "epoch": 243} {"train_loss": -32.08167266845703, "global_step": 29454, "epoch": 243} {"train_loss": -30.610626220703125, "global_step": 29455, "epoch": 243} {"train_loss": -28.992050170898438, "global_step": 29456, "epoch": 243} {"train_loss": -29.633834838867188, "global_step": 29457, "epoch": 243} {"train_loss": -31.93230628967285, "global_step": 29458, "epoch": 243} {"train_loss": -29.95611000061035, "global_step": 29459, "epoch": 243} {"train_loss": -27.05580711364746, "global_step": 29460, "epoch": 243} {"train_loss": -30.063581466674805, "global_step": 29461, "epoch": 243} {"train_loss": -31.805633544921875, "global_step": 29462, "epoch": 243} {"train_loss": -30.113117218017578, "global_step": 29463, "epoch": 243} {"train_loss": -31.588560104370117, "global_step": 29464, "epoch": 243} {"train_loss": -30.933435440063477, "global_step": 29465, "epoch": 243} {"train_loss": -31.905637741088867, "global_step": 29466, "epoch": 243} {"train_loss": -30.791812896728516, "global_step": 29467, "epoch": 243} {"train_loss": -31.478870391845703, "global_step": 29468, "epoch": 243} {"train_loss": -31.124372482299805, "global_step": 29469, "epoch": 243} {"train_loss": -31.98291015625, "global_step": 29470, "epoch": 243} {"train_loss": -31.49062156677246, "global_step": 29471, "epoch": 243} {"train_loss": -32.221649169921875, "global_step": 29472, "epoch": 243} {"train_loss": -31.045713424682617, "global_step": 29473, "epoch": 243} {"train_loss": -32.316463470458984, "global_step": 29474, "epoch": 243} {"train_loss": -31.614599227905273, "global_step": 29475, "epoch": 243} {"train_loss": -32.006256103515625, "global_step": 29476, "epoch": 243} {"train_loss": -31.67998695373535, "global_step": 29477, "epoch": 243} {"train_loss": -32.384456634521484, "global_step": 29478, "epoch": 243} {"train_loss": -32.24311447143555, "global_step": 29479, "epoch": 243} {"train_loss": -31.95815086364746, "global_step": 29480, "epoch": 243} {"train_loss": -31.923171997070312, "global_step": 29481, "epoch": 243} {"train_loss": -32.09950256347656, "global_step": 29482, "epoch": 243} {"train_loss": -32.04293441772461, "global_step": 29483, "epoch": 243} {"train_loss": -32.20173645019531, "global_step": 29484, "epoch": 243} {"train_loss": -32.42326736450195, "global_step": 29485, "epoch": 243} {"train_loss": -31.400922775268555, "global_step": 29486, "epoch": 243} {"train_loss": -32.214019775390625, "global_step": 29487, "epoch": 243} {"train_loss": -32.63236618041992, "global_step": 29488, "epoch": 243} {"train_loss": -32.01610565185547, "global_step": 29489, "epoch": 243} {"train_loss": -31.837238311767578, "global_step": 29490, "epoch": 243} {"train_loss": -32.30119705200195, "global_step": 29491, "epoch": 243} {"train_loss": -32.39317321777344, "global_step": 29492, "epoch": 243} {"train_loss": -31.916284561157227, "global_step": 29493, "epoch": 243} {"train_loss": -32.158477783203125, "global_step": 29494, "epoch": 243} {"train_loss": -32.46845626831055, "global_step": 29495, "epoch": 243} {"train_loss": -32.31329345703125, "global_step": 29496, "epoch": 243} {"train_loss": -32.21596908569336, "global_step": 29497, "epoch": 243} {"train_loss": -32.496246337890625, "global_step": 29498, "epoch": 243} {"train_loss": -32.84920883178711, "global_step": 29499, "epoch": 243} {"train_loss": -32.5379638671875, "global_step": 29500, "epoch": 243} {"train_loss": -32.476844787597656, "global_step": 29501, "epoch": 243} {"train_loss": -32.094703674316406, "global_step": 29502, "epoch": 243} {"train_loss": -32.81983184814453, "global_step": 29503, "epoch": 243} {"train_loss": -32.606571197509766, "global_step": 29504, "epoch": 243} {"train_loss": -32.1684455871582, "global_step": 29505, "epoch": 243} {"train_loss": -31.254907608032227, "global_step": 29506, "epoch": 243} {"train_loss": -32.39619827270508, "global_step": 29507, "epoch": 243} {"train_loss": -32.39323043823242, "global_step": 29508, "epoch": 243} {"train_loss": -32.616207122802734, "global_step": 29509, "epoch": 243} {"train_loss": -32.205928802490234, "global_step": 29510, "epoch": 243} {"train_loss": -31.814228057861328, "global_step": 29511, "epoch": 243} {"train_loss": -32.78706359863281, "global_step": 29512, "epoch": 243} {"train_loss": -32.31071090698242, "global_step": 29513, "epoch": 243} {"train_loss": -32.43197250366211, "global_step": 29514, "epoch": 243} {"train_loss": -31.403888702392578, "global_step": 29515, "epoch": 243} {"train_loss": -31.997283935546875, "global_step": 29516, "epoch": 243} {"train_loss": -31.7843017578125, "global_step": 29517, "epoch": 243} {"train_loss": -32.68524932861328, "global_step": 29518, "epoch": 243} {"train_loss": -31.123281478881836, "global_step": 29519, "epoch": 243} {"train_loss": -31.964025497436523, "global_step": 29520, "epoch": 243} {"train_loss": -32.375240325927734, "global_step": 29521, "epoch": 243} {"train_loss": -31.876676559448242, "global_step": 29522, "epoch": 243} {"train_loss": -31.800476641694377, "global_step": 29523, "epoch": 243, "val_loss": 2730513.75} {"train_loss": -32.627281188964844, "global_step": 29524, "epoch": 244} {"train_loss": -31.6593017578125, "global_step": 29525, "epoch": 244} {"train_loss": -30.728652954101562, "global_step": 29526, "epoch": 244} {"train_loss": -31.75311279296875, "global_step": 29527, "epoch": 244} {"train_loss": -32.47701644897461, "global_step": 29528, "epoch": 244} {"train_loss": -31.14470863342285, "global_step": 29529, "epoch": 244} {"train_loss": -31.573257446289062, "global_step": 29530, "epoch": 244} {"train_loss": -31.613935470581055, "global_step": 29531, "epoch": 244} {"train_loss": -32.02785110473633, "global_step": 29532, "epoch": 244} {"train_loss": -31.3967227935791, "global_step": 29533, "epoch": 244} {"train_loss": -30.56560707092285, "global_step": 29534, "epoch": 244} {"train_loss": -31.976089477539062, "global_step": 29535, "epoch": 244} {"train_loss": -31.973302841186523, "global_step": 29536, "epoch": 244} {"train_loss": -30.97793960571289, "global_step": 29537, "epoch": 244} {"train_loss": -31.61343765258789, "global_step": 29538, "epoch": 244} {"train_loss": -32.33433151245117, "global_step": 29539, "epoch": 244} {"train_loss": -31.438894271850586, "global_step": 29540, "epoch": 244} {"train_loss": -31.789676666259766, "global_step": 29541, "epoch": 244} {"train_loss": -31.720373153686523, "global_step": 29542, "epoch": 244} {"train_loss": -31.639911651611328, "global_step": 29543, "epoch": 244} {"train_loss": -32.343196868896484, "global_step": 29544, "epoch": 244} {"train_loss": -31.866180419921875, "global_step": 29545, "epoch": 244} {"train_loss": -32.183135986328125, "global_step": 29546, "epoch": 244} {"train_loss": -32.42615509033203, "global_step": 29547, "epoch": 244} {"train_loss": -31.367563247680664, "global_step": 29548, "epoch": 244} {"train_loss": -32.1971321105957, "global_step": 29549, "epoch": 244} {"train_loss": -32.062461853027344, "global_step": 29550, "epoch": 244} {"train_loss": -32.2946662902832, "global_step": 29551, "epoch": 244} {"train_loss": -32.7990608215332, "global_step": 29552, "epoch": 244} {"train_loss": -31.983707427978516, "global_step": 29553, "epoch": 244} {"train_loss": -32.44013595581055, "global_step": 29554, "epoch": 244} {"train_loss": -32.50773239135742, "global_step": 29555, "epoch": 244} {"train_loss": -32.18511962890625, "global_step": 29556, "epoch": 244} {"train_loss": -32.08828353881836, "global_step": 29557, "epoch": 244} {"train_loss": -32.166168212890625, "global_step": 29558, "epoch": 244} {"train_loss": -31.108112335205078, "global_step": 29559, "epoch": 244} {"train_loss": -30.469038009643555, "global_step": 29560, "epoch": 244} {"train_loss": -32.43095016479492, "global_step": 29561, "epoch": 244} {"train_loss": -31.28192138671875, "global_step": 29562, "epoch": 244} {"train_loss": -31.748258590698242, "global_step": 29563, "epoch": 244} {"train_loss": -32.24558639526367, "global_step": 29564, "epoch": 244} {"train_loss": -31.857770919799805, "global_step": 29565, "epoch": 244} {"train_loss": -32.93904113769531, "global_step": 29566, "epoch": 244} {"train_loss": -32.08449935913086, "global_step": 29567, "epoch": 244} {"train_loss": -31.985273361206055, "global_step": 29568, "epoch": 244} {"train_loss": -32.87907791137695, "global_step": 29569, "epoch": 244} {"train_loss": -32.38151168823242, "global_step": 29570, "epoch": 244} {"train_loss": -32.09174346923828, "global_step": 29571, "epoch": 244} {"train_loss": -32.70197296142578, "global_step": 29572, "epoch": 244} {"train_loss": -32.7168083190918, "global_step": 29573, "epoch": 244} {"train_loss": -32.7989501953125, "global_step": 29574, "epoch": 244} {"train_loss": -32.43632888793945, "global_step": 29575, "epoch": 244} {"train_loss": -32.47441864013672, "global_step": 29576, "epoch": 244} {"train_loss": -32.88961410522461, "global_step": 29577, "epoch": 244} {"train_loss": -32.72841262817383, "global_step": 29578, "epoch": 244} {"train_loss": -32.23468017578125, "global_step": 29579, "epoch": 244} {"train_loss": -29.72028923034668, "global_step": 29580, "epoch": 244} {"train_loss": -25.12434196472168, "global_step": 29581, "epoch": 244} {"train_loss": -13.378275871276855, "global_step": 29582, "epoch": 244} {"train_loss": 1.5784882307052612, "global_step": 29583, "epoch": 244} {"train_loss": -22.697011947631836, "global_step": 29584, "epoch": 244} {"train_loss": -24.141523361206055, "global_step": 29585, "epoch": 244} {"train_loss": -25.30470848083496, "global_step": 29586, "epoch": 244} {"train_loss": -23.70574378967285, "global_step": 29587, "epoch": 244} {"train_loss": -31.085315704345703, "global_step": 29588, "epoch": 244} {"train_loss": -26.26067543029785, "global_step": 29589, "epoch": 244} {"train_loss": -27.460779190063477, "global_step": 29590, "epoch": 244} {"train_loss": -30.261966705322266, "global_step": 29591, "epoch": 244} {"train_loss": -30.2581787109375, "global_step": 29592, "epoch": 244} {"train_loss": -28.67913246154785, "global_step": 29593, "epoch": 244} {"train_loss": -28.867359161376953, "global_step": 29594, "epoch": 244} {"train_loss": -30.61321449279785, "global_step": 29595, "epoch": 244} {"train_loss": -30.48578453063965, "global_step": 29596, "epoch": 244} {"train_loss": -31.2329044342041, "global_step": 29597, "epoch": 244} {"train_loss": -30.10382080078125, "global_step": 29598, "epoch": 244} {"train_loss": -30.78962516784668, "global_step": 29599, "epoch": 244} {"train_loss": -29.979522705078125, "global_step": 29600, "epoch": 244} {"train_loss": -30.781635284423828, "global_step": 29601, "epoch": 244} {"train_loss": -30.4923152923584, "global_step": 29602, "epoch": 244} {"train_loss": -31.376882553100586, "global_step": 29603, "epoch": 244} {"train_loss": -31.08281898498535, "global_step": 29604, "epoch": 244} {"train_loss": -31.102569580078125, "global_step": 29605, "epoch": 244} {"train_loss": -30.779870986938477, "global_step": 29606, "epoch": 244} {"train_loss": -31.129444122314453, "global_step": 29607, "epoch": 244} {"train_loss": -30.83900260925293, "global_step": 29608, "epoch": 244} {"train_loss": -31.24788475036621, "global_step": 29609, "epoch": 244} {"train_loss": -31.221235275268555, "global_step": 29610, "epoch": 244} {"train_loss": -31.026926040649414, "global_step": 29611, "epoch": 244} {"train_loss": -31.447134017944336, "global_step": 29612, "epoch": 244} {"train_loss": -31.610273361206055, "global_step": 29613, "epoch": 244} {"train_loss": -31.492568969726562, "global_step": 29614, "epoch": 244} {"train_loss": -31.344404220581055, "global_step": 29615, "epoch": 244} {"train_loss": -31.469318389892578, "global_step": 29616, "epoch": 244} {"train_loss": -31.513696670532227, "global_step": 29617, "epoch": 244} {"train_loss": -31.873029708862305, "global_step": 29618, "epoch": 244} {"train_loss": -31.40070152282715, "global_step": 29619, "epoch": 244} {"train_loss": -31.513351440429688, "global_step": 29620, "epoch": 244} {"train_loss": -32.15776824951172, "global_step": 29621, "epoch": 244} {"train_loss": -31.654443740844727, "global_step": 29622, "epoch": 244} {"train_loss": -31.56183433532715, "global_step": 29623, "epoch": 244} {"train_loss": -31.657703399658203, "global_step": 29624, "epoch": 244} {"train_loss": -31.82110595703125, "global_step": 29625, "epoch": 244} {"train_loss": -32.09006881713867, "global_step": 29626, "epoch": 244} {"train_loss": -31.6612606048584, "global_step": 29627, "epoch": 244} {"train_loss": -32.27530288696289, "global_step": 29628, "epoch": 244} {"train_loss": -31.726612091064453, "global_step": 29629, "epoch": 244} {"train_loss": -32.18941879272461, "global_step": 29630, "epoch": 244} {"train_loss": -31.83405113220215, "global_step": 29631, "epoch": 244} {"train_loss": -31.795949935913086, "global_step": 29632, "epoch": 244} {"train_loss": -31.9294490814209, "global_step": 29633, "epoch": 244} {"train_loss": -32.27397918701172, "global_step": 29634, "epoch": 244} {"train_loss": -31.625457763671875, "global_step": 29635, "epoch": 244} {"train_loss": -32.05747985839844, "global_step": 29636, "epoch": 244} {"train_loss": -32.37273406982422, "global_step": 29637, "epoch": 244} {"train_loss": -32.023319244384766, "global_step": 29638, "epoch": 244} {"train_loss": -31.86701774597168, "global_step": 29639, "epoch": 244} {"train_loss": -31.89544677734375, "global_step": 29640, "epoch": 244} {"train_loss": -32.45554733276367, "global_step": 29641, "epoch": 244} {"train_loss": -32.25754928588867, "global_step": 29642, "epoch": 244} {"train_loss": -31.706342697143555, "global_step": 29643, "epoch": 244} {"train_loss": -30.849192502084843, "global_step": 29644, "epoch": 244, "val_loss": 2598995.0} {"train_loss": -31.327924728393555, "global_step": 29645, "epoch": 245} {"train_loss": -31.555652618408203, "global_step": 29646, "epoch": 245} {"train_loss": -31.476287841796875, "global_step": 29647, "epoch": 245} {"train_loss": -29.86539649963379, "global_step": 29648, "epoch": 245} {"train_loss": -24.190460205078125, "global_step": 29649, "epoch": 245} {"train_loss": -12.02164363861084, "global_step": 29650, "epoch": 245} {"train_loss": -4.906352996826172, "global_step": 29651, "epoch": 245} {"train_loss": -26.89809226989746, "global_step": 29652, "epoch": 245} {"train_loss": -21.354223251342773, "global_step": 29653, "epoch": 245} {"train_loss": -26.671558380126953, "global_step": 29654, "epoch": 245} {"train_loss": -24.39917755126953, "global_step": 29655, "epoch": 245} {"train_loss": -30.052719116210938, "global_step": 29656, "epoch": 245} {"train_loss": -28.50587272644043, "global_step": 29657, "epoch": 245} {"train_loss": -26.320425033569336, "global_step": 29658, "epoch": 245} {"train_loss": -29.519474029541016, "global_step": 29659, "epoch": 245} {"train_loss": -30.153034210205078, "global_step": 29660, "epoch": 245} {"train_loss": -29.85541343688965, "global_step": 29661, "epoch": 245} {"train_loss": -28.040266036987305, "global_step": 29662, "epoch": 245} {"train_loss": -29.598730087280273, "global_step": 29663, "epoch": 245} {"train_loss": -31.004343032836914, "global_step": 29664, "epoch": 245} {"train_loss": -30.125890731811523, "global_step": 29665, "epoch": 245} {"train_loss": -30.16514015197754, "global_step": 29666, "epoch": 245} {"train_loss": -29.507795333862305, "global_step": 29667, "epoch": 245} {"train_loss": -29.83074378967285, "global_step": 29668, "epoch": 245} {"train_loss": -30.240537643432617, "global_step": 29669, "epoch": 245} {"train_loss": -30.643293380737305, "global_step": 29670, "epoch": 245} {"train_loss": -31.031452178955078, "global_step": 29671, "epoch": 245} {"train_loss": -30.215087890625, "global_step": 29672, "epoch": 245} {"train_loss": -30.50946617126465, "global_step": 29673, "epoch": 245} {"train_loss": -30.3963565826416, "global_step": 29674, "epoch": 245} {"train_loss": -30.197534561157227, "global_step": 29675, "epoch": 245} {"train_loss": -30.014074325561523, "global_step": 29676, "epoch": 245} {"train_loss": -30.542016983032227, "global_step": 29677, "epoch": 245} {"train_loss": -31.134037017822266, "global_step": 29678, "epoch": 245} {"train_loss": -30.9198055267334, "global_step": 29679, "epoch": 245} {"train_loss": -30.86459732055664, "global_step": 29680, "epoch": 245} {"train_loss": -30.850311279296875, "global_step": 29681, "epoch": 245} {"train_loss": -30.276105880737305, "global_step": 29682, "epoch": 245} {"train_loss": -30.8856201171875, "global_step": 29683, "epoch": 245} {"train_loss": -31.04206657409668, "global_step": 29684, "epoch": 245} {"train_loss": -31.013885498046875, "global_step": 29685, "epoch": 245} {"train_loss": -30.903369903564453, "global_step": 29686, "epoch": 245} {"train_loss": -30.805810928344727, "global_step": 29687, "epoch": 245} {"train_loss": -30.865097045898438, "global_step": 29688, "epoch": 245} {"train_loss": -31.19879150390625, "global_step": 29689, "epoch": 245} {"train_loss": -31.32269287109375, "global_step": 29690, "epoch": 245} {"train_loss": -31.121557235717773, "global_step": 29691, "epoch": 245} {"train_loss": -31.385595321655273, "global_step": 29692, "epoch": 245} {"train_loss": -31.455549240112305, "global_step": 29693, "epoch": 245} {"train_loss": -30.960187911987305, "global_step": 29694, "epoch": 245} {"train_loss": -31.074369430541992, "global_step": 29695, "epoch": 245} {"train_loss": -31.91744041442871, "global_step": 29696, "epoch": 245} {"train_loss": -31.643957138061523, "global_step": 29697, "epoch": 245} {"train_loss": -30.904022216796875, "global_step": 29698, "epoch": 245} {"train_loss": -31.400360107421875, "global_step": 29699, "epoch": 245} {"train_loss": -30.8576602935791, "global_step": 29700, "epoch": 245} {"train_loss": -31.607778549194336, "global_step": 29701, "epoch": 245} {"train_loss": -31.85561180114746, "global_step": 29702, "epoch": 245} {"train_loss": -31.123502731323242, "global_step": 29703, "epoch": 245} {"train_loss": -31.664987564086914, "global_step": 29704, "epoch": 245} {"train_loss": -31.52400016784668, "global_step": 29705, "epoch": 245} {"train_loss": -31.310882568359375, "global_step": 29706, "epoch": 245} {"train_loss": -32.33522033691406, "global_step": 29707, "epoch": 245} {"train_loss": -30.702716827392578, "global_step": 29708, "epoch": 245} {"train_loss": -31.205978393554688, "global_step": 29709, "epoch": 245} {"train_loss": -31.418106079101562, "global_step": 29710, "epoch": 245} {"train_loss": -30.477853775024414, "global_step": 29711, "epoch": 245} {"train_loss": -31.05205726623535, "global_step": 29712, "epoch": 245} {"train_loss": -31.551074981689453, "global_step": 29713, "epoch": 245} {"train_loss": -30.562952041625977, "global_step": 29714, "epoch": 245} {"train_loss": -31.612470626831055, "global_step": 29715, "epoch": 245} {"train_loss": -31.279043197631836, "global_step": 29716, "epoch": 245} {"train_loss": -31.6460018157959, "global_step": 29717, "epoch": 245} {"train_loss": -31.599172592163086, "global_step": 29718, "epoch": 245} {"train_loss": -31.432626724243164, "global_step": 29719, "epoch": 245} {"train_loss": -31.68145751953125, "global_step": 29720, "epoch": 245} {"train_loss": -31.171131134033203, "global_step": 29721, "epoch": 245} {"train_loss": -31.5418758392334, "global_step": 29722, "epoch": 245} {"train_loss": -31.603498458862305, "global_step": 29723, "epoch": 245} {"train_loss": -31.570951461791992, "global_step": 29724, "epoch": 245} {"train_loss": -31.631351470947266, "global_step": 29725, "epoch": 245} {"train_loss": -31.118818283081055, "global_step": 29726, "epoch": 245} {"train_loss": -30.981229782104492, "global_step": 29727, "epoch": 245} {"train_loss": -30.651987075805664, "global_step": 29728, "epoch": 245} {"train_loss": -29.686086654663086, "global_step": 29729, "epoch": 245} {"train_loss": -31.24616813659668, "global_step": 29730, "epoch": 245} {"train_loss": -31.1029109954834, "global_step": 29731, "epoch": 245} {"train_loss": -28.231359481811523, "global_step": 29732, "epoch": 245} {"train_loss": -31.144672393798828, "global_step": 29733, "epoch": 245} {"train_loss": -30.108617782592773, "global_step": 29734, "epoch": 245} {"train_loss": -31.093677520751953, "global_step": 29735, "epoch": 245} {"train_loss": -29.9799747467041, "global_step": 29736, "epoch": 245} {"train_loss": -31.519046783447266, "global_step": 29737, "epoch": 245} {"train_loss": -30.554611206054688, "global_step": 29738, "epoch": 245} {"train_loss": -31.268508911132812, "global_step": 29739, "epoch": 245} {"train_loss": -31.54612159729004, "global_step": 29740, "epoch": 245} {"train_loss": -30.92287254333496, "global_step": 29741, "epoch": 245} {"train_loss": -29.2508544921875, "global_step": 29742, "epoch": 245} {"train_loss": -29.469940185546875, "global_step": 29743, "epoch": 245} {"train_loss": -29.09616470336914, "global_step": 29744, "epoch": 245} {"train_loss": -30.348764419555664, "global_step": 29745, "epoch": 245} {"train_loss": -30.52886390686035, "global_step": 29746, "epoch": 245} {"train_loss": -29.790851593017578, "global_step": 29747, "epoch": 245} {"train_loss": -30.640625, "global_step": 29748, "epoch": 245} {"train_loss": -29.399051666259766, "global_step": 29749, "epoch": 245} {"train_loss": -31.084415435791016, "global_step": 29750, "epoch": 245} {"train_loss": -30.898284912109375, "global_step": 29751, "epoch": 245} {"train_loss": -30.642200469970703, "global_step": 29752, "epoch": 245} {"train_loss": -30.41816520690918, "global_step": 29753, "epoch": 245} {"train_loss": -31.8895206451416, "global_step": 29754, "epoch": 245} {"train_loss": -30.6025447845459, "global_step": 29755, "epoch": 245} {"train_loss": -30.65644645690918, "global_step": 29756, "epoch": 245} {"train_loss": -30.989547729492188, "global_step": 29757, "epoch": 245} {"train_loss": -31.894580841064453, "global_step": 29758, "epoch": 245} {"train_loss": -31.624164581298828, "global_step": 29759, "epoch": 245} {"train_loss": -31.637903213500977, "global_step": 29760, "epoch": 245} {"train_loss": -31.609561920166016, "global_step": 29761, "epoch": 245} {"train_loss": -31.63868522644043, "global_step": 29762, "epoch": 245} {"train_loss": -31.60027503967285, "global_step": 29763, "epoch": 245} {"train_loss": -31.74623680114746, "global_step": 29764, "epoch": 245} {"train_loss": -30.17662569313995, "global_step": 29765, "epoch": 245, "val_loss": 2531645.0} {"train_loss": -31.260339736938477, "global_step": 29766, "epoch": 246} {"train_loss": -31.48287010192871, "global_step": 29767, "epoch": 246} {"train_loss": -32.06061935424805, "global_step": 29768, "epoch": 246} {"train_loss": -31.747161865234375, "global_step": 29769, "epoch": 246} {"train_loss": -30.72749137878418, "global_step": 29770, "epoch": 246} {"train_loss": -31.475177764892578, "global_step": 29771, "epoch": 246} {"train_loss": -31.71416664123535, "global_step": 29772, "epoch": 246} {"train_loss": -31.117340087890625, "global_step": 29773, "epoch": 246} {"train_loss": -31.276945114135742, "global_step": 29774, "epoch": 246} {"train_loss": -32.05361557006836, "global_step": 29775, "epoch": 246} {"train_loss": -31.03835105895996, "global_step": 29776, "epoch": 246} {"train_loss": -32.03461837768555, "global_step": 29777, "epoch": 246} {"train_loss": -31.5675048828125, "global_step": 29778, "epoch": 246} {"train_loss": -31.017501831054688, "global_step": 29779, "epoch": 246} {"train_loss": -31.520151138305664, "global_step": 29780, "epoch": 246} {"train_loss": -31.571012496948242, "global_step": 29781, "epoch": 246} {"train_loss": -31.70619010925293, "global_step": 29782, "epoch": 246} {"train_loss": -31.84726333618164, "global_step": 29783, "epoch": 246} {"train_loss": -31.509546279907227, "global_step": 29784, "epoch": 246} {"train_loss": -31.940893173217773, "global_step": 29785, "epoch": 246} {"train_loss": -31.6408634185791, "global_step": 29786, "epoch": 246} {"train_loss": -31.590490341186523, "global_step": 29787, "epoch": 246} {"train_loss": -31.411664962768555, "global_step": 29788, "epoch": 246} {"train_loss": -31.326704025268555, "global_step": 29789, "epoch": 246} {"train_loss": -32.06800079345703, "global_step": 29790, "epoch": 246} {"train_loss": -31.154508590698242, "global_step": 29791, "epoch": 246} {"train_loss": -31.525421142578125, "global_step": 29792, "epoch": 246} {"train_loss": -30.861011505126953, "global_step": 29793, "epoch": 246} {"train_loss": -31.227869033813477, "global_step": 29794, "epoch": 246} {"train_loss": -31.726123809814453, "global_step": 29795, "epoch": 246} {"train_loss": -31.461944580078125, "global_step": 29796, "epoch": 246} {"train_loss": -30.98090934753418, "global_step": 29797, "epoch": 246} {"train_loss": -30.33094596862793, "global_step": 29798, "epoch": 246} {"train_loss": -31.543903350830078, "global_step": 29799, "epoch": 246} {"train_loss": -31.54620933532715, "global_step": 29800, "epoch": 246} {"train_loss": -31.909286499023438, "global_step": 29801, "epoch": 246} {"train_loss": -31.38801383972168, "global_step": 29802, "epoch": 246} {"train_loss": -31.481525421142578, "global_step": 29803, "epoch": 246} {"train_loss": -31.78297996520996, "global_step": 29804, "epoch": 246} {"train_loss": -31.16376304626465, "global_step": 29805, "epoch": 246} {"train_loss": -28.897933959960938, "global_step": 29806, "epoch": 246} {"train_loss": -25.627323150634766, "global_step": 29807, "epoch": 246} {"train_loss": -26.090856552124023, "global_step": 29808, "epoch": 246} {"train_loss": -29.618732452392578, "global_step": 29809, "epoch": 246} {"train_loss": -31.904462814331055, "global_step": 29810, "epoch": 246} {"train_loss": -30.970605850219727, "global_step": 29811, "epoch": 246} {"train_loss": -30.52447509765625, "global_step": 29812, "epoch": 246} {"train_loss": -31.421432495117188, "global_step": 29813, "epoch": 246} {"train_loss": -30.825708389282227, "global_step": 29814, "epoch": 246} {"train_loss": -30.676904678344727, "global_step": 29815, "epoch": 246} {"train_loss": -31.618732452392578, "global_step": 29816, "epoch": 246} {"train_loss": -30.7838191986084, "global_step": 29817, "epoch": 246} {"train_loss": -31.79706382751465, "global_step": 29818, "epoch": 246} {"train_loss": -30.754785537719727, "global_step": 29819, "epoch": 246} {"train_loss": -31.739973068237305, "global_step": 29820, "epoch": 246} {"train_loss": -31.398691177368164, "global_step": 29821, "epoch": 246} {"train_loss": -31.88606834411621, "global_step": 29822, "epoch": 246} {"train_loss": -31.070276260375977, "global_step": 29823, "epoch": 246} {"train_loss": -32.2088737487793, "global_step": 29824, "epoch": 246} {"train_loss": -31.648895263671875, "global_step": 29825, "epoch": 246} {"train_loss": -32.42393112182617, "global_step": 29826, "epoch": 246} {"train_loss": -31.829574584960938, "global_step": 29827, "epoch": 246} {"train_loss": -31.8829402923584, "global_step": 29828, "epoch": 246} {"train_loss": -31.29941749572754, "global_step": 29829, "epoch": 246} {"train_loss": -32.02408981323242, "global_step": 29830, "epoch": 246} {"train_loss": -31.903345108032227, "global_step": 29831, "epoch": 246} {"train_loss": -32.11051559448242, "global_step": 29832, "epoch": 246} {"train_loss": -32.26200485229492, "global_step": 29833, "epoch": 246} {"train_loss": -32.10374450683594, "global_step": 29834, "epoch": 246} {"train_loss": -32.07699203491211, "global_step": 29835, "epoch": 246} {"train_loss": -32.1784553527832, "global_step": 29836, "epoch": 246} {"train_loss": -32.3499755859375, "global_step": 29837, "epoch": 246} {"train_loss": -32.2121467590332, "global_step": 29838, "epoch": 246} {"train_loss": -32.434173583984375, "global_step": 29839, "epoch": 246} {"train_loss": -32.210262298583984, "global_step": 29840, "epoch": 246} {"train_loss": -32.44147491455078, "global_step": 29841, "epoch": 246} {"train_loss": -32.458396911621094, "global_step": 29842, "epoch": 246} {"train_loss": -32.611934661865234, "global_step": 29843, "epoch": 246} {"train_loss": -31.97802734375, "global_step": 29844, "epoch": 246} {"train_loss": -32.66356658935547, "global_step": 29845, "epoch": 246} {"train_loss": -32.25031661987305, "global_step": 29846, "epoch": 246} {"train_loss": -31.375104904174805, "global_step": 29847, "epoch": 246} {"train_loss": -32.42862319946289, "global_step": 29848, "epoch": 246} {"train_loss": -32.72691345214844, "global_step": 29849, "epoch": 246} {"train_loss": -31.59164810180664, "global_step": 29850, "epoch": 246} {"train_loss": -32.542842864990234, "global_step": 29851, "epoch": 246} {"train_loss": -32.47993469238281, "global_step": 29852, "epoch": 246} {"train_loss": -27.6823787689209, "global_step": 29853, "epoch": 246} {"train_loss": -32.01064682006836, "global_step": 29854, "epoch": 246} {"train_loss": -32.443511962890625, "global_step": 29855, "epoch": 246} {"train_loss": -31.82293128967285, "global_step": 29856, "epoch": 246} {"train_loss": -31.855199813842773, "global_step": 29857, "epoch": 246} {"train_loss": -30.361988067626953, "global_step": 29858, "epoch": 246} {"train_loss": -32.0943489074707, "global_step": 29859, "epoch": 246} {"train_loss": -31.594680786132812, "global_step": 29860, "epoch": 246} {"train_loss": -31.555150985717773, "global_step": 29861, "epoch": 246} {"train_loss": -31.53470230102539, "global_step": 29862, "epoch": 246} {"train_loss": -30.58790397644043, "global_step": 29863, "epoch": 246} {"train_loss": -32.065738677978516, "global_step": 29864, "epoch": 246} {"train_loss": -31.299829483032227, "global_step": 29865, "epoch": 246} {"train_loss": -30.21502113342285, "global_step": 29866, "epoch": 246} {"train_loss": -31.155029296875, "global_step": 29867, "epoch": 246} {"train_loss": -31.141569137573242, "global_step": 29868, "epoch": 246} {"train_loss": -29.8980655670166, "global_step": 29869, "epoch": 246} {"train_loss": -31.07124900817871, "global_step": 29870, "epoch": 246} {"train_loss": -30.509138107299805, "global_step": 29871, "epoch": 246} {"train_loss": -31.51454734802246, "global_step": 29872, "epoch": 246} {"train_loss": -31.7379207611084, "global_step": 29873, "epoch": 246} {"train_loss": -31.332151412963867, "global_step": 29874, "epoch": 246} {"train_loss": -31.27152442932129, "global_step": 29875, "epoch": 246} {"train_loss": -30.891218185424805, "global_step": 29876, "epoch": 246} {"train_loss": -31.189035415649414, "global_step": 29877, "epoch": 246} {"train_loss": -30.620935440063477, "global_step": 29878, "epoch": 246} {"train_loss": -31.278043746948242, "global_step": 29879, "epoch": 246} {"train_loss": -30.543378829956055, "global_step": 29880, "epoch": 246} {"train_loss": -31.364151000976562, "global_step": 29881, "epoch": 246} {"train_loss": -31.056198120117188, "global_step": 29882, "epoch": 246} {"train_loss": -30.8150577545166, "global_step": 29883, "epoch": 246} {"train_loss": -31.090173721313477, "global_step": 29884, "epoch": 246} {"train_loss": -31.111234664916992, "global_step": 29885, "epoch": 246} {"train_loss": -31.38121154091575, "global_step": 29886, "epoch": 246, "val_loss": 3391416.0} {"train_loss": -31.200681686401367, "global_step": 29887, "epoch": 247} {"train_loss": -31.63332176208496, "global_step": 29888, "epoch": 247} {"train_loss": -31.4290771484375, "global_step": 29889, "epoch": 247} {"train_loss": -31.002288818359375, "global_step": 29890, "epoch": 247} {"train_loss": -31.578857421875, "global_step": 29891, "epoch": 247} {"train_loss": -30.990997314453125, "global_step": 29892, "epoch": 247} {"train_loss": -31.489816665649414, "global_step": 29893, "epoch": 247} {"train_loss": -31.617197036743164, "global_step": 29894, "epoch": 247} {"train_loss": -31.721576690673828, "global_step": 29895, "epoch": 247} {"train_loss": -31.73701286315918, "global_step": 29896, "epoch": 247} {"train_loss": -31.529447555541992, "global_step": 29897, "epoch": 247} {"train_loss": -32.14593505859375, "global_step": 29898, "epoch": 247} {"train_loss": -31.707422256469727, "global_step": 29899, "epoch": 247} {"train_loss": -32.17520523071289, "global_step": 29900, "epoch": 247} {"train_loss": -32.158023834228516, "global_step": 29901, "epoch": 247} {"train_loss": -32.42570114135742, "global_step": 29902, "epoch": 247} {"train_loss": -32.19061279296875, "global_step": 29903, "epoch": 247} {"train_loss": -31.98394203186035, "global_step": 29904, "epoch": 247} {"train_loss": -32.473426818847656, "global_step": 29905, "epoch": 247} {"train_loss": -32.17798614501953, "global_step": 29906, "epoch": 247} {"train_loss": -32.355499267578125, "global_step": 29907, "epoch": 247} {"train_loss": -32.43436813354492, "global_step": 29908, "epoch": 247} {"train_loss": -32.14463424682617, "global_step": 29909, "epoch": 247} {"train_loss": -32.336544036865234, "global_step": 29910, "epoch": 247} {"train_loss": -32.50001525878906, "global_step": 29911, "epoch": 247} {"train_loss": -31.662525177001953, "global_step": 29912, "epoch": 247} {"train_loss": -32.98025894165039, "global_step": 29913, "epoch": 247} {"train_loss": -32.45165252685547, "global_step": 29914, "epoch": 247} {"train_loss": -32.66029357910156, "global_step": 29915, "epoch": 247} {"train_loss": -33.17431640625, "global_step": 29916, "epoch": 247} {"train_loss": -33.178768157958984, "global_step": 29917, "epoch": 247} {"train_loss": -33.001129150390625, "global_step": 29918, "epoch": 247} {"train_loss": -32.75885009765625, "global_step": 29919, "epoch": 247} {"train_loss": -32.16264724731445, "global_step": 29920, "epoch": 247} {"train_loss": -32.77372360229492, "global_step": 29921, "epoch": 247} {"train_loss": -32.80011749267578, "global_step": 29922, "epoch": 247} {"train_loss": -33.26536178588867, "global_step": 29923, "epoch": 247} {"train_loss": -32.658870697021484, "global_step": 29924, "epoch": 247} {"train_loss": -32.81695556640625, "global_step": 29925, "epoch": 247} {"train_loss": -32.66785430908203, "global_step": 29926, "epoch": 247} {"train_loss": -33.21770095825195, "global_step": 29927, "epoch": 247} {"train_loss": -32.9970588684082, "global_step": 29928, "epoch": 247} {"train_loss": -32.612953186035156, "global_step": 29929, "epoch": 247} {"train_loss": -32.85867691040039, "global_step": 29930, "epoch": 247} {"train_loss": -32.17399215698242, "global_step": 29931, "epoch": 247} {"train_loss": -32.31523895263672, "global_step": 29932, "epoch": 247} {"train_loss": -30.929941177368164, "global_step": 29933, "epoch": 247} {"train_loss": -30.64217185974121, "global_step": 29934, "epoch": 247} {"train_loss": -30.458837509155273, "global_step": 29935, "epoch": 247} {"train_loss": -29.645177841186523, "global_step": 29936, "epoch": 247} {"train_loss": -30.848031997680664, "global_step": 29937, "epoch": 247} {"train_loss": -32.48757553100586, "global_step": 29938, "epoch": 247} {"train_loss": -30.633453369140625, "global_step": 29939, "epoch": 247} {"train_loss": -31.4571533203125, "global_step": 29940, "epoch": 247} {"train_loss": -31.994359970092773, "global_step": 29941, "epoch": 247} {"train_loss": -32.25054931640625, "global_step": 29942, "epoch": 247} {"train_loss": -32.21595001220703, "global_step": 29943, "epoch": 247} {"train_loss": -31.040973663330078, "global_step": 29944, "epoch": 247} {"train_loss": -31.310855865478516, "global_step": 29945, "epoch": 247} {"train_loss": -32.19911575317383, "global_step": 29946, "epoch": 247} {"train_loss": -31.305194854736328, "global_step": 29947, "epoch": 247} {"train_loss": -30.954578399658203, "global_step": 29948, "epoch": 247} {"train_loss": -32.07378005981445, "global_step": 29949, "epoch": 247} {"train_loss": -31.448331832885742, "global_step": 29950, "epoch": 247} {"train_loss": -30.956878662109375, "global_step": 29951, "epoch": 247} {"train_loss": -32.08091354370117, "global_step": 29952, "epoch": 247} {"train_loss": -31.18025016784668, "global_step": 29953, "epoch": 247} {"train_loss": -31.441864013671875, "global_step": 29954, "epoch": 247} {"train_loss": -31.320209503173828, "global_step": 29955, "epoch": 247} {"train_loss": -31.56202507019043, "global_step": 29956, "epoch": 247} {"train_loss": -30.316059112548828, "global_step": 29957, "epoch": 247} {"train_loss": -32.221492767333984, "global_step": 29958, "epoch": 247} {"train_loss": -31.257526397705078, "global_step": 29959, "epoch": 247} {"train_loss": -31.639575958251953, "global_step": 29960, "epoch": 247} {"train_loss": -31.227645874023438, "global_step": 29961, "epoch": 247} {"train_loss": -31.610992431640625, "global_step": 29962, "epoch": 247} {"train_loss": -31.4279727935791, "global_step": 29963, "epoch": 247} {"train_loss": -31.947412490844727, "global_step": 29964, "epoch": 247} {"train_loss": -31.803258895874023, "global_step": 29965, "epoch": 247} {"train_loss": -31.676651000976562, "global_step": 29966, "epoch": 247} {"train_loss": -31.931974411010742, "global_step": 29967, "epoch": 247} {"train_loss": -31.9670352935791, "global_step": 29968, "epoch": 247} {"train_loss": -32.253658294677734, "global_step": 29969, "epoch": 247} {"train_loss": -32.247920989990234, "global_step": 29970, "epoch": 247} {"train_loss": -32.45243453979492, "global_step": 29971, "epoch": 247} {"train_loss": -31.935626983642578, "global_step": 29972, "epoch": 247} {"train_loss": -32.2495002746582, "global_step": 29973, "epoch": 247} {"train_loss": -32.12504959106445, "global_step": 29974, "epoch": 247} {"train_loss": -31.89446449279785, "global_step": 29975, "epoch": 247} {"train_loss": -32.208412170410156, "global_step": 29976, "epoch": 247} {"train_loss": -32.43666458129883, "global_step": 29977, "epoch": 247} {"train_loss": -32.2833366394043, "global_step": 29978, "epoch": 247} {"train_loss": -32.36332702636719, "global_step": 29979, "epoch": 247} {"train_loss": -32.614784240722656, "global_step": 29980, "epoch": 247} {"train_loss": -32.76634979248047, "global_step": 29981, "epoch": 247} {"train_loss": -32.363311767578125, "global_step": 29982, "epoch": 247} {"train_loss": -32.44371795654297, "global_step": 29983, "epoch": 247} {"train_loss": -32.24420928955078, "global_step": 29984, "epoch": 247} {"train_loss": -32.46048355102539, "global_step": 29985, "epoch": 247} {"train_loss": -32.42287826538086, "global_step": 29986, "epoch": 247} {"train_loss": -32.89677047729492, "global_step": 29987, "epoch": 247} {"train_loss": -32.473079681396484, "global_step": 29988, "epoch": 247} {"train_loss": -32.678504943847656, "global_step": 29989, "epoch": 247} {"train_loss": -32.338050842285156, "global_step": 29990, "epoch": 247} {"train_loss": -32.24861526489258, "global_step": 29991, "epoch": 247} {"train_loss": -32.399166107177734, "global_step": 29992, "epoch": 247} {"train_loss": -31.39434814453125, "global_step": 29993, "epoch": 247} {"train_loss": -30.694494247436523, "global_step": 29994, "epoch": 247} {"train_loss": -30.7228946685791, "global_step": 29995, "epoch": 247} {"train_loss": -30.756383895874023, "global_step": 29996, "epoch": 247} {"train_loss": -31.563013076782227, "global_step": 29997, "epoch": 247} {"train_loss": -32.69131851196289, "global_step": 29998, "epoch": 247} {"train_loss": -32.398033142089844, "global_step": 29999, "epoch": 247} {"train_loss": -32.69376754760742, "global_step": 30000, "epoch": 247} {"train_loss": -32.00105285644531, "global_step": 30001, "epoch": 247} {"train_loss": -31.6136417388916, "global_step": 30002, "epoch": 247} {"train_loss": -32.223968505859375, "global_step": 30003, "epoch": 247} {"train_loss": -31.847949981689453, "global_step": 30004, "epoch": 247} {"train_loss": -31.493146896362305, "global_step": 30005, "epoch": 247} {"train_loss": -31.955915451049805, "global_step": 30006, "epoch": 247} {"train_loss": -31.968821832956362, "global_step": 30007, "epoch": 247, "val_loss": 2481273.25} {"train_loss": -31.0023136138916, "global_step": 30008, "epoch": 248} {"train_loss": -31.793689727783203, "global_step": 30009, "epoch": 248} {"train_loss": -32.08694076538086, "global_step": 30010, "epoch": 248} {"train_loss": -31.1020450592041, "global_step": 30011, "epoch": 248} {"train_loss": -31.132001876831055, "global_step": 30012, "epoch": 248} {"train_loss": -31.008472442626953, "global_step": 30013, "epoch": 248} {"train_loss": -31.079015731811523, "global_step": 30014, "epoch": 248} {"train_loss": -32.23537826538086, "global_step": 30015, "epoch": 248} {"train_loss": -32.347625732421875, "global_step": 30016, "epoch": 248} {"train_loss": -31.461227416992188, "global_step": 30017, "epoch": 248} {"train_loss": -30.44830322265625, "global_step": 30018, "epoch": 248} {"train_loss": -32.540897369384766, "global_step": 30019, "epoch": 248} {"train_loss": -32.76338577270508, "global_step": 30020, "epoch": 248} {"train_loss": -32.58405685424805, "global_step": 30021, "epoch": 248} {"train_loss": -31.881391525268555, "global_step": 30022, "epoch": 248} {"train_loss": -32.23580551147461, "global_step": 30023, "epoch": 248} {"train_loss": -32.79257583618164, "global_step": 30024, "epoch": 248} {"train_loss": -31.535232543945312, "global_step": 30025, "epoch": 248} {"train_loss": -31.32583999633789, "global_step": 30026, "epoch": 248} {"train_loss": -32.997955322265625, "global_step": 30027, "epoch": 248} {"train_loss": -32.37052536010742, "global_step": 30028, "epoch": 248} {"train_loss": -32.27497482299805, "global_step": 30029, "epoch": 248} {"train_loss": -33.06611251831055, "global_step": 30030, "epoch": 248} {"train_loss": -32.294795989990234, "global_step": 30031, "epoch": 248} {"train_loss": -32.51604080200195, "global_step": 30032, "epoch": 248} {"train_loss": -33.26215362548828, "global_step": 30033, "epoch": 248} {"train_loss": -32.0553092956543, "global_step": 30034, "epoch": 248} {"train_loss": -32.6910514831543, "global_step": 30035, "epoch": 248} {"train_loss": -32.83871078491211, "global_step": 30036, "epoch": 248} {"train_loss": -32.12538528442383, "global_step": 30037, "epoch": 248} {"train_loss": -32.4053840637207, "global_step": 30038, "epoch": 248} {"train_loss": -32.203792572021484, "global_step": 30039, "epoch": 248} {"train_loss": -32.40015411376953, "global_step": 30040, "epoch": 248} {"train_loss": -30.937768936157227, "global_step": 30041, "epoch": 248} {"train_loss": -32.152889251708984, "global_step": 30042, "epoch": 248} {"train_loss": -31.690637588500977, "global_step": 30043, "epoch": 248} {"train_loss": -29.167560577392578, "global_step": 30044, "epoch": 248} {"train_loss": -28.686542510986328, "global_step": 30045, "epoch": 248} {"train_loss": -28.121458053588867, "global_step": 30046, "epoch": 248} {"train_loss": -26.76449966430664, "global_step": 30047, "epoch": 248} {"train_loss": -24.369657516479492, "global_step": 30048, "epoch": 248} {"train_loss": -30.786218643188477, "global_step": 30049, "epoch": 248} {"train_loss": -27.022708892822266, "global_step": 30050, "epoch": 248} {"train_loss": -29.317584991455078, "global_step": 30051, "epoch": 248} {"train_loss": -31.685779571533203, "global_step": 30052, "epoch": 248} {"train_loss": -31.7864933013916, "global_step": 30053, "epoch": 248} {"train_loss": -29.879486083984375, "global_step": 30054, "epoch": 248} {"train_loss": -30.624841690063477, "global_step": 30055, "epoch": 248} {"train_loss": -31.194433212280273, "global_step": 30056, "epoch": 248} {"train_loss": -32.38794708251953, "global_step": 30057, "epoch": 248} {"train_loss": -32.22515869140625, "global_step": 30058, "epoch": 248} {"train_loss": -32.30122756958008, "global_step": 30059, "epoch": 248} {"train_loss": -31.88905143737793, "global_step": 30060, "epoch": 248} {"train_loss": -32.1237678527832, "global_step": 30061, "epoch": 248} {"train_loss": -31.137561798095703, "global_step": 30062, "epoch": 248} {"train_loss": -31.974109649658203, "global_step": 30063, "epoch": 248} {"train_loss": -31.520002365112305, "global_step": 30064, "epoch": 248} {"train_loss": -32.089412689208984, "global_step": 30065, "epoch": 248} {"train_loss": -32.081844329833984, "global_step": 30066, "epoch": 248} {"train_loss": -31.780576705932617, "global_step": 30067, "epoch": 248} {"train_loss": -32.07323455810547, "global_step": 30068, "epoch": 248} {"train_loss": -32.63462829589844, "global_step": 30069, "epoch": 248} {"train_loss": -32.05720138549805, "global_step": 30070, "epoch": 248} {"train_loss": -31.066614151000977, "global_step": 30071, "epoch": 248} {"train_loss": -32.48701095581055, "global_step": 30072, "epoch": 248} {"train_loss": -32.11893844604492, "global_step": 30073, "epoch": 248} {"train_loss": -32.37342834472656, "global_step": 30074, "epoch": 248} {"train_loss": -31.30597496032715, "global_step": 30075, "epoch": 248} {"train_loss": -31.9414005279541, "global_step": 30076, "epoch": 248} {"train_loss": -31.771442413330078, "global_step": 30077, "epoch": 248} {"train_loss": -32.25115966796875, "global_step": 30078, "epoch": 248} {"train_loss": -31.922544479370117, "global_step": 30079, "epoch": 248} {"train_loss": -32.23958969116211, "global_step": 30080, "epoch": 248} {"train_loss": -32.41285705566406, "global_step": 30081, "epoch": 248} {"train_loss": -31.425561904907227, "global_step": 30082, "epoch": 248} {"train_loss": -31.7429141998291, "global_step": 30083, "epoch": 248} {"train_loss": -30.9268856048584, "global_step": 30084, "epoch": 248} {"train_loss": -30.766387939453125, "global_step": 30085, "epoch": 248} {"train_loss": -32.516510009765625, "global_step": 30086, "epoch": 248} {"train_loss": -31.853246688842773, "global_step": 30087, "epoch": 248} {"train_loss": -31.0307674407959, "global_step": 30088, "epoch": 248} {"train_loss": -31.517292022705078, "global_step": 30089, "epoch": 248} {"train_loss": -29.744709014892578, "global_step": 30090, "epoch": 248} {"train_loss": -31.462905883789062, "global_step": 30091, "epoch": 248} {"train_loss": -31.686920166015625, "global_step": 30092, "epoch": 248} {"train_loss": -31.499582290649414, "global_step": 30093, "epoch": 248} {"train_loss": -31.820417404174805, "global_step": 30094, "epoch": 248} {"train_loss": -31.617990493774414, "global_step": 30095, "epoch": 248} {"train_loss": -31.265684127807617, "global_step": 30096, "epoch": 248} {"train_loss": -32.14972686767578, "global_step": 30097, "epoch": 248} {"train_loss": -31.156696319580078, "global_step": 30098, "epoch": 248} {"train_loss": -31.542810440063477, "global_step": 30099, "epoch": 248} {"train_loss": -31.625974655151367, "global_step": 30100, "epoch": 248} {"train_loss": -32.05427169799805, "global_step": 30101, "epoch": 248} {"train_loss": -30.67380714416504, "global_step": 30102, "epoch": 248} {"train_loss": -31.662729263305664, "global_step": 30103, "epoch": 248} {"train_loss": -31.903858184814453, "global_step": 30104, "epoch": 248} {"train_loss": -32.38998794555664, "global_step": 30105, "epoch": 248} {"train_loss": -31.425947189331055, "global_step": 30106, "epoch": 248} {"train_loss": -32.01591110229492, "global_step": 30107, "epoch": 248} {"train_loss": -31.458791732788086, "global_step": 30108, "epoch": 248} {"train_loss": -31.917566299438477, "global_step": 30109, "epoch": 248} {"train_loss": -32.283966064453125, "global_step": 30110, "epoch": 248} {"train_loss": -32.42118453979492, "global_step": 30111, "epoch": 248} {"train_loss": -32.486053466796875, "global_step": 30112, "epoch": 248} {"train_loss": -32.12521743774414, "global_step": 30113, "epoch": 248} {"train_loss": -32.12891387939453, "global_step": 30114, "epoch": 248} {"train_loss": -32.05833053588867, "global_step": 30115, "epoch": 248} {"train_loss": -32.28083419799805, "global_step": 30116, "epoch": 248} {"train_loss": -32.22296142578125, "global_step": 30117, "epoch": 248} {"train_loss": -31.128494262695312, "global_step": 30118, "epoch": 248} {"train_loss": -29.181365966796875, "global_step": 30119, "epoch": 248} {"train_loss": -22.44105339050293, "global_step": 30120, "epoch": 248} {"train_loss": -13.855949401855469, "global_step": 30121, "epoch": 248} {"train_loss": -5.991340160369873, "global_step": 30122, "epoch": 248} {"train_loss": -18.659250259399414, "global_step": 30123, "epoch": 248} {"train_loss": -30.081323623657227, "global_step": 30124, "epoch": 248} {"train_loss": -15.84918212890625, "global_step": 30125, "epoch": 248} {"train_loss": -31.17588233947754, "global_step": 30126, "epoch": 248} {"train_loss": -23.35599708557129, "global_step": 30127, "epoch": 248} {"train_loss": -30.79079356469399, "global_step": 30128, "epoch": 248, "val_loss": 2533995.25} {"train_loss": -26.587461471557617, "global_step": 30129, "epoch": 249} {"train_loss": -28.104955673217773, "global_step": 30130, "epoch": 249} {"train_loss": -29.347394943237305, "global_step": 30131, "epoch": 249} {"train_loss": -28.240854263305664, "global_step": 30132, "epoch": 249} {"train_loss": -28.131540298461914, "global_step": 30133, "epoch": 249} {"train_loss": -29.39937400817871, "global_step": 30134, "epoch": 249} {"train_loss": -29.29892349243164, "global_step": 30135, "epoch": 249} {"train_loss": -28.99155616760254, "global_step": 30136, "epoch": 249} {"train_loss": -29.325265884399414, "global_step": 30137, "epoch": 249} {"train_loss": -29.8674259185791, "global_step": 30138, "epoch": 249} {"train_loss": -30.190343856811523, "global_step": 30139, "epoch": 249} {"train_loss": -30.101917266845703, "global_step": 30140, "epoch": 249} {"train_loss": -29.872648239135742, "global_step": 30141, "epoch": 249} {"train_loss": -30.42721939086914, "global_step": 30142, "epoch": 249} {"train_loss": -31.074323654174805, "global_step": 30143, "epoch": 249} {"train_loss": -30.204181671142578, "global_step": 30144, "epoch": 249} {"train_loss": -30.172809600830078, "global_step": 30145, "epoch": 249} {"train_loss": -29.223724365234375, "global_step": 30146, "epoch": 249} {"train_loss": -30.76832389831543, "global_step": 30147, "epoch": 249} {"train_loss": -31.001361846923828, "global_step": 30148, "epoch": 249} {"train_loss": -30.758407592773438, "global_step": 30149, "epoch": 249} {"train_loss": -30.40802001953125, "global_step": 30150, "epoch": 249} {"train_loss": -30.799367904663086, "global_step": 30151, "epoch": 249} {"train_loss": -30.886249542236328, "global_step": 30152, "epoch": 249} {"train_loss": -31.22629165649414, "global_step": 30153, "epoch": 249} {"train_loss": -30.599706649780273, "global_step": 30154, "epoch": 249} {"train_loss": -30.976898193359375, "global_step": 30155, "epoch": 249} {"train_loss": -31.003454208374023, "global_step": 30156, "epoch": 249} {"train_loss": -31.003284454345703, "global_step": 30157, "epoch": 249} {"train_loss": -30.718799591064453, "global_step": 30158, "epoch": 249} {"train_loss": -30.7334041595459, "global_step": 30159, "epoch": 249} {"train_loss": -29.359704971313477, "global_step": 30160, "epoch": 249} {"train_loss": -31.087799072265625, "global_step": 30161, "epoch": 249} {"train_loss": -30.6442813873291, "global_step": 30162, "epoch": 249} {"train_loss": -30.4897403717041, "global_step": 30163, "epoch": 249} {"train_loss": -30.669469833374023, "global_step": 30164, "epoch": 249} {"train_loss": -31.1170711517334, "global_step": 30165, "epoch": 249} {"train_loss": -30.224658966064453, "global_step": 30166, "epoch": 249} {"train_loss": -31.553861618041992, "global_step": 30167, "epoch": 249} {"train_loss": -31.251386642456055, "global_step": 30168, "epoch": 249} {"train_loss": -31.0681209564209, "global_step": 30169, "epoch": 249} {"train_loss": -31.3162841796875, "global_step": 30170, "epoch": 249} {"train_loss": -31.0048885345459, "global_step": 30171, "epoch": 249} {"train_loss": -31.52664566040039, "global_step": 30172, "epoch": 249} {"train_loss": -31.310461044311523, "global_step": 30173, "epoch": 249} {"train_loss": -31.07063865661621, "global_step": 30174, "epoch": 249} {"train_loss": -31.11945915222168, "global_step": 30175, "epoch": 249} {"train_loss": -31.261056900024414, "global_step": 30176, "epoch": 249} {"train_loss": -31.663549423217773, "global_step": 30177, "epoch": 249} {"train_loss": -31.1044921875, "global_step": 30178, "epoch": 249} {"train_loss": -31.167377471923828, "global_step": 30179, "epoch": 249} {"train_loss": -30.7623291015625, "global_step": 30180, "epoch": 249} {"train_loss": -31.78208351135254, "global_step": 30181, "epoch": 249} {"train_loss": -31.305877685546875, "global_step": 30182, "epoch": 249} {"train_loss": -31.409820556640625, "global_step": 30183, "epoch": 249} {"train_loss": -30.363265991210938, "global_step": 30184, "epoch": 249} {"train_loss": -31.66578483581543, "global_step": 30185, "epoch": 249} {"train_loss": -31.4761962890625, "global_step": 30186, "epoch": 249} {"train_loss": -30.606292724609375, "global_step": 30187, "epoch": 249} {"train_loss": -31.527673721313477, "global_step": 30188, "epoch": 249} {"train_loss": -31.3884220123291, "global_step": 30189, "epoch": 249} {"train_loss": -31.330860137939453, "global_step": 30190, "epoch": 249} {"train_loss": -31.567914962768555, "global_step": 30191, "epoch": 249} {"train_loss": -31.47104263305664, "global_step": 30192, "epoch": 249} {"train_loss": -31.631717681884766, "global_step": 30193, "epoch": 249} {"train_loss": -31.71785545349121, "global_step": 30194, "epoch": 249} {"train_loss": -31.36932373046875, "global_step": 30195, "epoch": 249} {"train_loss": -30.935575485229492, "global_step": 30196, "epoch": 249} {"train_loss": -31.685083389282227, "global_step": 30197, "epoch": 249} {"train_loss": -31.44061851501465, "global_step": 30198, "epoch": 249} {"train_loss": -31.422412872314453, "global_step": 30199, "epoch": 249} {"train_loss": -31.3155517578125, "global_step": 30200, "epoch": 249} {"train_loss": -31.820037841796875, "global_step": 30201, "epoch": 249} {"train_loss": -31.811370849609375, "global_step": 30202, "epoch": 249} {"train_loss": -30.538562774658203, "global_step": 30203, "epoch": 249} {"train_loss": -27.808141708374023, "global_step": 30204, "epoch": 249} {"train_loss": -24.926172256469727, "global_step": 30205, "epoch": 249} {"train_loss": -20.739761352539062, "global_step": 30206, "epoch": 249} {"train_loss": -29.7752685546875, "global_step": 30207, "epoch": 249} {"train_loss": -24.21805763244629, "global_step": 30208, "epoch": 249} {"train_loss": -25.497488021850586, "global_step": 30209, "epoch": 249} {"train_loss": -27.13498306274414, "global_step": 30210, "epoch": 249} {"train_loss": -30.220035552978516, "global_step": 30211, "epoch": 249} {"train_loss": -28.32874870300293, "global_step": 30212, "epoch": 249} {"train_loss": -29.310882568359375, "global_step": 30213, "epoch": 249} {"train_loss": -30.91219139099121, "global_step": 30214, "epoch": 249} {"train_loss": -30.8121337890625, "global_step": 30215, "epoch": 249} {"train_loss": -29.601171493530273, "global_step": 30216, "epoch": 249} {"train_loss": -30.24476432800293, "global_step": 30217, "epoch": 249} {"train_loss": -30.849918365478516, "global_step": 30218, "epoch": 249} {"train_loss": -30.64642333984375, "global_step": 30219, "epoch": 249} {"train_loss": -30.953744888305664, "global_step": 30220, "epoch": 249} {"train_loss": -30.789724349975586, "global_step": 30221, "epoch": 249} {"train_loss": -30.754087448120117, "global_step": 30222, "epoch": 249} {"train_loss": -30.737974166870117, "global_step": 30223, "epoch": 249} {"train_loss": -31.36410903930664, "global_step": 30224, "epoch": 249} {"train_loss": -31.592126846313477, "global_step": 30225, "epoch": 249} {"train_loss": -31.126575469970703, "global_step": 30226, "epoch": 249} {"train_loss": -31.344358444213867, "global_step": 30227, "epoch": 249} {"train_loss": -31.471527099609375, "global_step": 30228, "epoch": 249} {"train_loss": -31.49053382873535, "global_step": 30229, "epoch": 249} {"train_loss": -31.2454833984375, "global_step": 30230, "epoch": 249} {"train_loss": -31.320449829101562, "global_step": 30231, "epoch": 249} {"train_loss": -31.750019073486328, "global_step": 30232, "epoch": 249} {"train_loss": -31.396930694580078, "global_step": 30233, "epoch": 249} {"train_loss": -30.761255264282227, "global_step": 30234, "epoch": 249} {"train_loss": -29.92523765563965, "global_step": 30235, "epoch": 249} {"train_loss": -31.186521530151367, "global_step": 30236, "epoch": 249} {"train_loss": -29.443857192993164, "global_step": 30237, "epoch": 249} {"train_loss": -30.63519287109375, "global_step": 30238, "epoch": 249} {"train_loss": -30.493558883666992, "global_step": 30239, "epoch": 249} {"train_loss": -30.657379150390625, "global_step": 30240, "epoch": 249} {"train_loss": -30.858808517456055, "global_step": 30241, "epoch": 249} {"train_loss": -30.605138778686523, "global_step": 30242, "epoch": 249} {"train_loss": -31.144046783447266, "global_step": 30243, "epoch": 249} {"train_loss": -30.849756240844727, "global_step": 30244, "epoch": 249} {"train_loss": -30.570112228393555, "global_step": 30245, "epoch": 249} {"train_loss": -30.2235164642334, "global_step": 30246, "epoch": 249} {"train_loss": -29.469568252563477, "global_step": 30247, "epoch": 249} {"train_loss": -31.04132080078125, "global_step": 30248, "epoch": 249} {"train_loss": -30.398523425267747, "global_step": 30249, "epoch": 249, "val_loss": 2779675.25} {"train_loss": -30.068403244018555, "global_step": 30250, "epoch": 250} {"train_loss": -30.964338302612305, "global_step": 30251, "epoch": 250} {"train_loss": -29.777557373046875, "global_step": 30252, "epoch": 250} {"train_loss": -30.494983673095703, "global_step": 30253, "epoch": 250} {"train_loss": -30.724903106689453, "global_step": 30254, "epoch": 250} {"train_loss": -31.250940322875977, "global_step": 30255, "epoch": 250} {"train_loss": -30.73353385925293, "global_step": 30256, "epoch": 250} {"train_loss": -31.2379093170166, "global_step": 30257, "epoch": 250} {"train_loss": -31.119037628173828, "global_step": 30258, "epoch": 250} {"train_loss": -31.406646728515625, "global_step": 30259, "epoch": 250} {"train_loss": -28.889739990234375, "global_step": 30260, "epoch": 250} {"train_loss": -31.430225372314453, "global_step": 30261, "epoch": 250} {"train_loss": -30.511428833007812, "global_step": 30262, "epoch": 250} {"train_loss": -30.3786678314209, "global_step": 30263, "epoch": 250} {"train_loss": -30.802526473999023, "global_step": 30264, "epoch": 250} {"train_loss": -30.8895206451416, "global_step": 30265, "epoch": 250} {"train_loss": -30.594745635986328, "global_step": 30266, "epoch": 250} {"train_loss": -30.5872802734375, "global_step": 30267, "epoch": 250} {"train_loss": -31.04913902282715, "global_step": 30268, "epoch": 250} {"train_loss": -30.88873291015625, "global_step": 30269, "epoch": 250} {"train_loss": -31.125476837158203, "global_step": 30270, "epoch": 250} {"train_loss": -30.520978927612305, "global_step": 30271, "epoch": 250} {"train_loss": -30.62060546875, "global_step": 30272, "epoch": 250} {"train_loss": -30.901630401611328, "global_step": 30273, "epoch": 250} {"train_loss": -30.53547477722168, "global_step": 30274, "epoch": 250} {"train_loss": -31.580549240112305, "global_step": 30275, "epoch": 250} {"train_loss": -31.261259078979492, "global_step": 30276, "epoch": 250} {"train_loss": -31.625350952148438, "global_step": 30277, "epoch": 250} {"train_loss": -31.058927536010742, "global_step": 30278, "epoch": 250} {"train_loss": -31.22150230407715, "global_step": 30279, "epoch": 250} {"train_loss": -31.5245361328125, "global_step": 30280, "epoch": 250} {"train_loss": -31.0606632232666, "global_step": 30281, "epoch": 250} {"train_loss": -31.625593185424805, "global_step": 30282, "epoch": 250} {"train_loss": -30.805524826049805, "global_step": 30283, "epoch": 250} {"train_loss": -31.947906494140625, "global_step": 30284, "epoch": 250} {"train_loss": -31.707998275756836, "global_step": 30285, "epoch": 250} {"train_loss": -31.370807647705078, "global_step": 30286, "epoch": 250} {"train_loss": -32.167701721191406, "global_step": 30287, "epoch": 250} {"train_loss": -31.599355697631836, "global_step": 30288, "epoch": 250} {"train_loss": -31.893295288085938, "global_step": 30289, "epoch": 250} {"train_loss": -31.808242797851562, "global_step": 30290, "epoch": 250} {"train_loss": -31.11858558654785, "global_step": 30291, "epoch": 250} {"train_loss": -32.12177658081055, "global_step": 30292, "epoch": 250} {"train_loss": -32.3310432434082, "global_step": 30293, "epoch": 250} {"train_loss": -32.548091888427734, "global_step": 30294, "epoch": 250} {"train_loss": -31.24744987487793, "global_step": 30295, "epoch": 250} {"train_loss": -31.838348388671875, "global_step": 30296, "epoch": 250} {"train_loss": -31.72930335998535, "global_step": 30297, "epoch": 250} {"train_loss": -31.124319076538086, "global_step": 30298, "epoch": 250} {"train_loss": -31.28914451599121, "global_step": 30299, "epoch": 250} {"train_loss": -29.6373233795166, "global_step": 30300, "epoch": 250} {"train_loss": -31.202573776245117, "global_step": 30301, "epoch": 250} {"train_loss": -30.109174728393555, "global_step": 30302, "epoch": 250} {"train_loss": -30.619037628173828, "global_step": 30303, "epoch": 250} {"train_loss": -31.661542892456055, "global_step": 30304, "epoch": 250} {"train_loss": -31.525360107421875, "global_step": 30305, "epoch": 250} {"train_loss": -32.23627471923828, "global_step": 30306, "epoch": 250} {"train_loss": -31.78980827331543, "global_step": 30307, "epoch": 250} {"train_loss": -32.12118148803711, "global_step": 30308, "epoch": 250} {"train_loss": -31.663471221923828, "global_step": 30309, "epoch": 250} {"train_loss": -32.74952697753906, "global_step": 30310, "epoch": 250} {"train_loss": -31.971899032592773, "global_step": 30311, "epoch": 250} {"train_loss": -31.752878189086914, "global_step": 30312, "epoch": 250} {"train_loss": -32.43852996826172, "global_step": 30313, "epoch": 250} {"train_loss": -32.2994384765625, "global_step": 30314, "epoch": 250} {"train_loss": -32.741539001464844, "global_step": 30315, "epoch": 250} {"train_loss": -32.54280471801758, "global_step": 30316, "epoch": 250} {"train_loss": -32.254638671875, "global_step": 30317, "epoch": 250} {"train_loss": -32.325347900390625, "global_step": 30318, "epoch": 250} {"train_loss": -32.26949691772461, "global_step": 30319, "epoch": 250} {"train_loss": -32.12604522705078, "global_step": 30320, "epoch": 250} {"train_loss": -32.3036003112793, "global_step": 30321, "epoch": 250} {"train_loss": -32.519317626953125, "global_step": 30322, "epoch": 250} {"train_loss": -32.43207931518555, "global_step": 30323, "epoch": 250} {"train_loss": -32.52643966674805, "global_step": 30324, "epoch": 250} {"train_loss": -32.405250549316406, "global_step": 30325, "epoch": 250} {"train_loss": -32.04288101196289, "global_step": 30326, "epoch": 250} {"train_loss": -32.216278076171875, "global_step": 30327, "epoch": 250} {"train_loss": -32.749114990234375, "global_step": 30328, "epoch": 250} {"train_loss": -32.632991790771484, "global_step": 30329, "epoch": 250} {"train_loss": -31.8979434967041, "global_step": 30330, "epoch": 250} {"train_loss": -32.619747161865234, "global_step": 30331, "epoch": 250} {"train_loss": -32.12400436401367, "global_step": 30332, "epoch": 250} {"train_loss": -32.57387924194336, "global_step": 30333, "epoch": 250} {"train_loss": -32.73625564575195, "global_step": 30334, "epoch": 250} {"train_loss": -32.530635833740234, "global_step": 30335, "epoch": 250} {"train_loss": -31.97547721862793, "global_step": 30336, "epoch": 250} {"train_loss": -30.88401222229004, "global_step": 30337, "epoch": 250} {"train_loss": -32.27326965332031, "global_step": 30338, "epoch": 250} {"train_loss": -31.61712074279785, "global_step": 30339, "epoch": 250} {"train_loss": -31.610279083251953, "global_step": 30340, "epoch": 250} {"train_loss": -31.187957763671875, "global_step": 30341, "epoch": 250} {"train_loss": -29.969440460205078, "global_step": 30342, "epoch": 250} {"train_loss": -28.80074119567871, "global_step": 30343, "epoch": 250} {"train_loss": -26.37835693359375, "global_step": 30344, "epoch": 250} {"train_loss": -25.146833419799805, "global_step": 30345, "epoch": 250} {"train_loss": -30.21182632446289, "global_step": 30346, "epoch": 250} {"train_loss": -31.329513549804688, "global_step": 30347, "epoch": 250} {"train_loss": -28.304397583007812, "global_step": 30348, "epoch": 250} {"train_loss": -30.884984970092773, "global_step": 30349, "epoch": 250} {"train_loss": -30.30852699279785, "global_step": 30350, "epoch": 250} {"train_loss": -28.7716121673584, "global_step": 30351, "epoch": 250} {"train_loss": -31.802343368530273, "global_step": 30352, "epoch": 250} {"train_loss": -29.999755859375, "global_step": 30353, "epoch": 250} {"train_loss": -30.845380783081055, "global_step": 30354, "epoch": 250} {"train_loss": -30.48026466369629, "global_step": 30355, "epoch": 250} {"train_loss": -31.820255279541016, "global_step": 30356, "epoch": 250} {"train_loss": -30.692596435546875, "global_step": 30357, "epoch": 250} {"train_loss": -32.230342864990234, "global_step": 30358, "epoch": 250} {"train_loss": -30.877660751342773, "global_step": 30359, "epoch": 250} {"train_loss": -31.77289390563965, "global_step": 30360, "epoch": 250} {"train_loss": -31.043426513671875, "global_step": 30361, "epoch": 250} {"train_loss": -30.882720947265625, "global_step": 30362, "epoch": 250} {"train_loss": -30.911523818969727, "global_step": 30363, "epoch": 250} {"train_loss": -30.54924964904785, "global_step": 30364, "epoch": 250} {"train_loss": -30.953277587890625, "global_step": 30365, "epoch": 250} {"train_loss": -29.800994873046875, "global_step": 30366, "epoch": 250} {"train_loss": -30.907506942749023, "global_step": 30367, "epoch": 250} {"train_loss": -29.02546501159668, "global_step": 30368, "epoch": 250} {"train_loss": -30.371021270751953, "global_step": 30369, "epoch": 250} {"train_loss": -31.215558658946644, "global_step": 30370, "epoch": 250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2564594.25} {"train_loss": -30.717309951782227, "global_step": 30371, "epoch": 251} {"train_loss": -30.064245223999023, "global_step": 30372, "epoch": 251} {"train_loss": -31.113676071166992, "global_step": 30373, "epoch": 251} {"train_loss": -31.115476608276367, "global_step": 30374, "epoch": 251} {"train_loss": -31.293237686157227, "global_step": 30375, "epoch": 251} {"train_loss": -31.076614379882812, "global_step": 30376, "epoch": 251} {"train_loss": -30.869470596313477, "global_step": 30377, "epoch": 251} {"train_loss": -31.15235710144043, "global_step": 30378, "epoch": 251} {"train_loss": -31.145862579345703, "global_step": 30379, "epoch": 251} {"train_loss": -31.54275894165039, "global_step": 30380, "epoch": 251} {"train_loss": -31.665409088134766, "global_step": 30381, "epoch": 251} {"train_loss": -31.8402042388916, "global_step": 30382, "epoch": 251} {"train_loss": -31.765323638916016, "global_step": 30383, "epoch": 251} {"train_loss": -32.0589714050293, "global_step": 30384, "epoch": 251} {"train_loss": -31.71240234375, "global_step": 30385, "epoch": 251} {"train_loss": -31.718097686767578, "global_step": 30386, "epoch": 251} {"train_loss": -31.8897762298584, "global_step": 30387, "epoch": 251} {"train_loss": -31.884323120117188, "global_step": 30388, "epoch": 251} {"train_loss": -32.04531478881836, "global_step": 30389, "epoch": 251} {"train_loss": -31.749988555908203, "global_step": 30390, "epoch": 251} {"train_loss": -31.88405418395996, "global_step": 30391, "epoch": 251} {"train_loss": -32.23862838745117, "global_step": 30392, "epoch": 251} {"train_loss": -31.663007736206055, "global_step": 30393, "epoch": 251} {"train_loss": -31.81363296508789, "global_step": 30394, "epoch": 251} {"train_loss": -32.174842834472656, "global_step": 30395, "epoch": 251} {"train_loss": -31.766040802001953, "global_step": 30396, "epoch": 251} {"train_loss": -32.2204704284668, "global_step": 30397, "epoch": 251} {"train_loss": -32.22883605957031, "global_step": 30398, "epoch": 251} {"train_loss": -32.147926330566406, "global_step": 30399, "epoch": 251} {"train_loss": -32.71343994140625, "global_step": 30400, "epoch": 251} {"train_loss": -32.545379638671875, "global_step": 30401, "epoch": 251} {"train_loss": -31.489124298095703, "global_step": 30402, "epoch": 251} {"train_loss": -31.975799560546875, "global_step": 30403, "epoch": 251} {"train_loss": -32.273250579833984, "global_step": 30404, "epoch": 251} {"train_loss": -32.16915512084961, "global_step": 30405, "epoch": 251} {"train_loss": -32.15760040283203, "global_step": 30406, "epoch": 251} {"train_loss": -32.083309173583984, "global_step": 30407, "epoch": 251} {"train_loss": -32.49763107299805, "global_step": 30408, "epoch": 251} {"train_loss": -32.46171188354492, "global_step": 30409, "epoch": 251} {"train_loss": -32.198726654052734, "global_step": 30410, "epoch": 251} {"train_loss": -32.208229064941406, "global_step": 30411, "epoch": 251} {"train_loss": -32.5688362121582, "global_step": 30412, "epoch": 251} {"train_loss": -31.276880264282227, "global_step": 30413, "epoch": 251} {"train_loss": -32.15903854370117, "global_step": 30414, "epoch": 251} {"train_loss": -32.071083068847656, "global_step": 30415, "epoch": 251} {"train_loss": -32.26536178588867, "global_step": 30416, "epoch": 251} {"train_loss": -32.3774528503418, "global_step": 30417, "epoch": 251} {"train_loss": -32.08424758911133, "global_step": 30418, "epoch": 251} {"train_loss": -31.624765396118164, "global_step": 30419, "epoch": 251} {"train_loss": -32.47847366333008, "global_step": 30420, "epoch": 251} {"train_loss": -32.17967987060547, "global_step": 30421, "epoch": 251} {"train_loss": -31.59784507751465, "global_step": 30422, "epoch": 251} {"train_loss": -32.4245719909668, "global_step": 30423, "epoch": 251} {"train_loss": -32.661277770996094, "global_step": 30424, "epoch": 251} {"train_loss": -31.9007625579834, "global_step": 30425, "epoch": 251} {"train_loss": -30.931455612182617, "global_step": 30426, "epoch": 251} {"train_loss": -32.076210021972656, "global_step": 30427, "epoch": 251} {"train_loss": -32.976898193359375, "global_step": 30428, "epoch": 251} {"train_loss": -31.411352157592773, "global_step": 30429, "epoch": 251} {"train_loss": -33.10506820678711, "global_step": 30430, "epoch": 251} {"train_loss": -32.61100387573242, "global_step": 30431, "epoch": 251} {"train_loss": -32.114315032958984, "global_step": 30432, "epoch": 251} {"train_loss": -32.33961486816406, "global_step": 30433, "epoch": 251} {"train_loss": -31.306928634643555, "global_step": 30434, "epoch": 251} {"train_loss": -31.476282119750977, "global_step": 30435, "epoch": 251} {"train_loss": -32.605037689208984, "global_step": 30436, "epoch": 251} {"train_loss": -32.71515655517578, "global_step": 30437, "epoch": 251} {"train_loss": -31.821563720703125, "global_step": 30438, "epoch": 251} {"train_loss": -31.82779884338379, "global_step": 30439, "epoch": 251} {"train_loss": -32.743160247802734, "global_step": 30440, "epoch": 251} {"train_loss": -32.436824798583984, "global_step": 30441, "epoch": 251} {"train_loss": -32.55121994018555, "global_step": 30442, "epoch": 251} {"train_loss": -32.210140228271484, "global_step": 30443, "epoch": 251} {"train_loss": -31.8798828125, "global_step": 30444, "epoch": 251} {"train_loss": -32.220672607421875, "global_step": 30445, "epoch": 251} {"train_loss": -30.342273712158203, "global_step": 30446, "epoch": 251} {"train_loss": -31.50054359436035, "global_step": 30447, "epoch": 251} {"train_loss": -32.2015266418457, "global_step": 30448, "epoch": 251} {"train_loss": -32.65560531616211, "global_step": 30449, "epoch": 251} {"train_loss": -31.799087524414062, "global_step": 30450, "epoch": 251} {"train_loss": -31.688817977905273, "global_step": 30451, "epoch": 251} {"train_loss": -32.2100944519043, "global_step": 30452, "epoch": 251} {"train_loss": -32.09663391113281, "global_step": 30453, "epoch": 251} {"train_loss": -32.8609619140625, "global_step": 30454, "epoch": 251} {"train_loss": -32.17159652709961, "global_step": 30455, "epoch": 251} {"train_loss": -32.094547271728516, "global_step": 30456, "epoch": 251} {"train_loss": -32.626922607421875, "global_step": 30457, "epoch": 251} {"train_loss": -32.08306884765625, "global_step": 30458, "epoch": 251} {"train_loss": -32.01414108276367, "global_step": 30459, "epoch": 251} {"train_loss": -32.225807189941406, "global_step": 30460, "epoch": 251} {"train_loss": -32.16028594970703, "global_step": 30461, "epoch": 251} {"train_loss": -31.146020889282227, "global_step": 30462, "epoch": 251} {"train_loss": -32.226993560791016, "global_step": 30463, "epoch": 251} {"train_loss": -32.32646560668945, "global_step": 30464, "epoch": 251} {"train_loss": -32.67316818237305, "global_step": 30465, "epoch": 251} {"train_loss": -32.46511459350586, "global_step": 30466, "epoch": 251} {"train_loss": -32.40048599243164, "global_step": 30467, "epoch": 251} {"train_loss": -31.770572662353516, "global_step": 30468, "epoch": 251} {"train_loss": -32.846160888671875, "global_step": 30469, "epoch": 251} {"train_loss": -32.37993240356445, "global_step": 30470, "epoch": 251} {"train_loss": -32.8499870300293, "global_step": 30471, "epoch": 251} {"train_loss": -32.444297790527344, "global_step": 30472, "epoch": 251} {"train_loss": -32.89833068847656, "global_step": 30473, "epoch": 251} {"train_loss": -32.11214828491211, "global_step": 30474, "epoch": 251} {"train_loss": -32.69858169555664, "global_step": 30475, "epoch": 251} {"train_loss": -32.5413932800293, "global_step": 30476, "epoch": 251} {"train_loss": -32.84805679321289, "global_step": 30477, "epoch": 251} {"train_loss": -32.73641586303711, "global_step": 30478, "epoch": 251} {"train_loss": -32.63961410522461, "global_step": 30479, "epoch": 251} {"train_loss": -32.803260803222656, "global_step": 30480, "epoch": 251} {"train_loss": -33.26259231567383, "global_step": 30481, "epoch": 251} {"train_loss": -33.0885124206543, "global_step": 30482, "epoch": 251} {"train_loss": -32.6679801940918, "global_step": 30483, "epoch": 251} {"train_loss": -33.38546371459961, "global_step": 30484, "epoch": 251} {"train_loss": -32.53750228881836, "global_step": 30485, "epoch": 251} {"train_loss": -33.03468322753906, "global_step": 30486, "epoch": 251} {"train_loss": -32.80009841918945, "global_step": 30487, "epoch": 251} {"train_loss": -32.79552459716797, "global_step": 30488, "epoch": 251} {"train_loss": -33.30733871459961, "global_step": 30489, "epoch": 251} {"train_loss": -32.91548538208008, "global_step": 30490, "epoch": 251} {"train_loss": -32.133960676587314, "global_step": 30491, "epoch": 251, "val_loss": 2473799.25} {"train_loss": -33.05615997314453, "global_step": 30492, "epoch": 252} {"train_loss": -33.037899017333984, "global_step": 30493, "epoch": 252} {"train_loss": -32.5080451965332, "global_step": 30494, "epoch": 252} {"train_loss": -31.92384147644043, "global_step": 30495, "epoch": 252} {"train_loss": -31.122879028320312, "global_step": 30496, "epoch": 252} {"train_loss": -29.593536376953125, "global_step": 30497, "epoch": 252} {"train_loss": -25.96796989440918, "global_step": 30498, "epoch": 252} {"train_loss": -16.973407745361328, "global_step": 30499, "epoch": 252} {"train_loss": -10.524589538574219, "global_step": 30500, "epoch": 252} {"train_loss": -18.80841636657715, "global_step": 30501, "epoch": 252} {"train_loss": -28.23137855529785, "global_step": 30502, "epoch": 252} {"train_loss": -29.458459854125977, "global_step": 30503, "epoch": 252} {"train_loss": -28.3675479888916, "global_step": 30504, "epoch": 252} {"train_loss": -28.004281997680664, "global_step": 30505, "epoch": 252} {"train_loss": -29.109189987182617, "global_step": 30506, "epoch": 252} {"train_loss": -30.628217697143555, "global_step": 30507, "epoch": 252} {"train_loss": -29.670501708984375, "global_step": 30508, "epoch": 252} {"train_loss": -30.323896408081055, "global_step": 30509, "epoch": 252} {"train_loss": -31.32779884338379, "global_step": 30510, "epoch": 252} {"train_loss": -29.258838653564453, "global_step": 30511, "epoch": 252} {"train_loss": -30.74824333190918, "global_step": 30512, "epoch": 252} {"train_loss": -31.0709285736084, "global_step": 30513, "epoch": 252} {"train_loss": -30.33198356628418, "global_step": 30514, "epoch": 252} {"train_loss": -31.05055809020996, "global_step": 30515, "epoch": 252} {"train_loss": -31.250532150268555, "global_step": 30516, "epoch": 252} {"train_loss": -30.7154598236084, "global_step": 30517, "epoch": 252} {"train_loss": -30.678394317626953, "global_step": 30518, "epoch": 252} {"train_loss": -30.735315322875977, "global_step": 30519, "epoch": 252} {"train_loss": -31.434823989868164, "global_step": 30520, "epoch": 252} {"train_loss": -31.265554428100586, "global_step": 30521, "epoch": 252} {"train_loss": -31.634912490844727, "global_step": 30522, "epoch": 252} {"train_loss": -31.56574058532715, "global_step": 30523, "epoch": 252} {"train_loss": -31.626325607299805, "global_step": 30524, "epoch": 252} {"train_loss": -31.96504020690918, "global_step": 30525, "epoch": 252} {"train_loss": -31.7120418548584, "global_step": 30526, "epoch": 252} {"train_loss": -31.7900447845459, "global_step": 30527, "epoch": 252} {"train_loss": -31.56855583190918, "global_step": 30528, "epoch": 252} {"train_loss": -32.04830551147461, "global_step": 30529, "epoch": 252} {"train_loss": -31.997312545776367, "global_step": 30530, "epoch": 252} {"train_loss": -32.216697692871094, "global_step": 30531, "epoch": 252} {"train_loss": -31.336734771728516, "global_step": 30532, "epoch": 252} {"train_loss": -32.07380294799805, "global_step": 30533, "epoch": 252} {"train_loss": -32.467742919921875, "global_step": 30534, "epoch": 252} {"train_loss": -32.253318786621094, "global_step": 30535, "epoch": 252} {"train_loss": -32.30934143066406, "global_step": 30536, "epoch": 252} {"train_loss": -31.89794921875, "global_step": 30537, "epoch": 252} {"train_loss": -32.55707550048828, "global_step": 30538, "epoch": 252} {"train_loss": -32.43275833129883, "global_step": 30539, "epoch": 252} {"train_loss": -32.1862907409668, "global_step": 30540, "epoch": 252} {"train_loss": -32.352569580078125, "global_step": 30541, "epoch": 252} {"train_loss": -32.60245895385742, "global_step": 30542, "epoch": 252} {"train_loss": -32.465309143066406, "global_step": 30543, "epoch": 252} {"train_loss": -32.31917190551758, "global_step": 30544, "epoch": 252} {"train_loss": -32.54439926147461, "global_step": 30545, "epoch": 252} {"train_loss": -32.56119918823242, "global_step": 30546, "epoch": 252} {"train_loss": -32.60154342651367, "global_step": 30547, "epoch": 252} {"train_loss": -32.856781005859375, "global_step": 30548, "epoch": 252} {"train_loss": -32.5757942199707, "global_step": 30549, "epoch": 252} {"train_loss": -33.0278434753418, "global_step": 30550, "epoch": 252} {"train_loss": -32.576812744140625, "global_step": 30551, "epoch": 252} {"train_loss": -32.599483489990234, "global_step": 30552, "epoch": 252} {"train_loss": -32.31958770751953, "global_step": 30553, "epoch": 252} {"train_loss": -32.60749435424805, "global_step": 30554, "epoch": 252} {"train_loss": -32.39009094238281, "global_step": 30555, "epoch": 252} {"train_loss": -32.36494827270508, "global_step": 30556, "epoch": 252} {"train_loss": -31.68410301208496, "global_step": 30557, "epoch": 252} {"train_loss": -32.3105583190918, "global_step": 30558, "epoch": 252} {"train_loss": -32.11030960083008, "global_step": 30559, "epoch": 252} {"train_loss": -32.85238265991211, "global_step": 30560, "epoch": 252} {"train_loss": -31.789152145385742, "global_step": 30561, "epoch": 252} {"train_loss": -33.05705642700195, "global_step": 30562, "epoch": 252} {"train_loss": -32.3336296081543, "global_step": 30563, "epoch": 252} {"train_loss": -32.26249313354492, "global_step": 30564, "epoch": 252} {"train_loss": -32.70112609863281, "global_step": 30565, "epoch": 252} {"train_loss": -32.3670539855957, "global_step": 30566, "epoch": 252} {"train_loss": -32.56884002685547, "global_step": 30567, "epoch": 252} {"train_loss": -32.691925048828125, "global_step": 30568, "epoch": 252} {"train_loss": -31.99540138244629, "global_step": 30569, "epoch": 252} {"train_loss": -32.530391693115234, "global_step": 30570, "epoch": 252} {"train_loss": -31.423608779907227, "global_step": 30571, "epoch": 252} {"train_loss": -32.462181091308594, "global_step": 30572, "epoch": 252} {"train_loss": -31.765104293823242, "global_step": 30573, "epoch": 252} {"train_loss": -31.735197067260742, "global_step": 30574, "epoch": 252} {"train_loss": -31.31744384765625, "global_step": 30575, "epoch": 252} {"train_loss": -32.28742218017578, "global_step": 30576, "epoch": 252} {"train_loss": -31.2144775390625, "global_step": 30577, "epoch": 252} {"train_loss": -30.688312530517578, "global_step": 30578, "epoch": 252} {"train_loss": -28.66609001159668, "global_step": 30579, "epoch": 252} {"train_loss": -26.166976928710938, "global_step": 30580, "epoch": 252} {"train_loss": -25.226903915405273, "global_step": 30581, "epoch": 252} {"train_loss": -28.960119247436523, "global_step": 30582, "epoch": 252} {"train_loss": -31.540632247924805, "global_step": 30583, "epoch": 252} {"train_loss": -27.555524826049805, "global_step": 30584, "epoch": 252} {"train_loss": -30.528106689453125, "global_step": 30585, "epoch": 252} {"train_loss": -29.961898803710938, "global_step": 30586, "epoch": 252} {"train_loss": -29.67490005493164, "global_step": 30587, "epoch": 252} {"train_loss": -30.57293128967285, "global_step": 30588, "epoch": 252} {"train_loss": -30.99671745300293, "global_step": 30589, "epoch": 252} {"train_loss": -31.079456329345703, "global_step": 30590, "epoch": 252} {"train_loss": -31.735788345336914, "global_step": 30591, "epoch": 252} {"train_loss": -31.056360244750977, "global_step": 30592, "epoch": 252} {"train_loss": -31.586389541625977, "global_step": 30593, "epoch": 252} {"train_loss": -31.325794219970703, "global_step": 30594, "epoch": 252} {"train_loss": -31.331180572509766, "global_step": 30595, "epoch": 252} {"train_loss": -31.72551918029785, "global_step": 30596, "epoch": 252} {"train_loss": -31.630712509155273, "global_step": 30597, "epoch": 252} {"train_loss": -31.370925903320312, "global_step": 30598, "epoch": 252} {"train_loss": -31.826202392578125, "global_step": 30599, "epoch": 252} {"train_loss": -31.92599868774414, "global_step": 30600, "epoch": 252} {"train_loss": -32.133480072021484, "global_step": 30601, "epoch": 252} {"train_loss": -32.26752853393555, "global_step": 30602, "epoch": 252} {"train_loss": -31.799158096313477, "global_step": 30603, "epoch": 252} {"train_loss": -31.897872924804688, "global_step": 30604, "epoch": 252} {"train_loss": -32.63566207885742, "global_step": 30605, "epoch": 252} {"train_loss": -32.226253509521484, "global_step": 30606, "epoch": 252} {"train_loss": -32.374542236328125, "global_step": 30607, "epoch": 252} {"train_loss": -32.6436653137207, "global_step": 30608, "epoch": 252} {"train_loss": -32.33539962768555, "global_step": 30609, "epoch": 252} {"train_loss": -32.32396697998047, "global_step": 30610, "epoch": 252} {"train_loss": -32.468360900878906, "global_step": 30611, "epoch": 252} {"train_loss": -31.039377275577262, "global_step": 30612, "epoch": 252, "val_loss": 2756626.25} {"train_loss": -32.51860427856445, "global_step": 30613, "epoch": 253} {"train_loss": -31.789281845092773, "global_step": 30614, "epoch": 253} {"train_loss": -32.732173919677734, "global_step": 30615, "epoch": 253} {"train_loss": -32.025882720947266, "global_step": 30616, "epoch": 253} {"train_loss": -33.00642776489258, "global_step": 30617, "epoch": 253} {"train_loss": -32.8357048034668, "global_step": 30618, "epoch": 253} {"train_loss": -32.983619689941406, "global_step": 30619, "epoch": 253} {"train_loss": -32.52668380737305, "global_step": 30620, "epoch": 253} {"train_loss": -33.08864974975586, "global_step": 30621, "epoch": 253} {"train_loss": -32.72443771362305, "global_step": 30622, "epoch": 253} {"train_loss": -32.12952423095703, "global_step": 30623, "epoch": 253} {"train_loss": -31.9122314453125, "global_step": 30624, "epoch": 253} {"train_loss": -32.921749114990234, "global_step": 30625, "epoch": 253} {"train_loss": -31.91855812072754, "global_step": 30626, "epoch": 253} {"train_loss": -31.957334518432617, "global_step": 30627, "epoch": 253} {"train_loss": -31.520971298217773, "global_step": 30628, "epoch": 253} {"train_loss": -31.73478126525879, "global_step": 30629, "epoch": 253} {"train_loss": -32.3476676940918, "global_step": 30630, "epoch": 253} {"train_loss": -32.099151611328125, "global_step": 30631, "epoch": 253} {"train_loss": -32.5380973815918, "global_step": 30632, "epoch": 253} {"train_loss": -32.368404388427734, "global_step": 30633, "epoch": 253} {"train_loss": -30.947803497314453, "global_step": 30634, "epoch": 253} {"train_loss": -31.563940048217773, "global_step": 30635, "epoch": 253} {"train_loss": -30.64715576171875, "global_step": 30636, "epoch": 253} {"train_loss": -31.866193771362305, "global_step": 30637, "epoch": 253} {"train_loss": -31.442398071289062, "global_step": 30638, "epoch": 253} {"train_loss": -31.330875396728516, "global_step": 30639, "epoch": 253} {"train_loss": -32.43064880371094, "global_step": 30640, "epoch": 253} {"train_loss": -31.892160415649414, "global_step": 30641, "epoch": 253} {"train_loss": -31.184289932250977, "global_step": 30642, "epoch": 253} {"train_loss": -31.31060791015625, "global_step": 30643, "epoch": 253} {"train_loss": -31.58308219909668, "global_step": 30644, "epoch": 253} {"train_loss": -31.48052406311035, "global_step": 30645, "epoch": 253} {"train_loss": -31.78968620300293, "global_step": 30646, "epoch": 253} {"train_loss": -32.19263458251953, "global_step": 30647, "epoch": 253} {"train_loss": -32.31101608276367, "global_step": 30648, "epoch": 253} {"train_loss": -32.263545989990234, "global_step": 30649, "epoch": 253} {"train_loss": -32.30857467651367, "global_step": 30650, "epoch": 253} {"train_loss": -32.24829864501953, "global_step": 30651, "epoch": 253} {"train_loss": -31.769947052001953, "global_step": 30652, "epoch": 253} {"train_loss": -31.747909545898438, "global_step": 30653, "epoch": 253} {"train_loss": -31.9315128326416, "global_step": 30654, "epoch": 253} {"train_loss": -32.21714401245117, "global_step": 30655, "epoch": 253} {"train_loss": -32.03778076171875, "global_step": 30656, "epoch": 253} {"train_loss": -31.651147842407227, "global_step": 30657, "epoch": 253} {"train_loss": -32.5616340637207, "global_step": 30658, "epoch": 253} {"train_loss": -32.16317367553711, "global_step": 30659, "epoch": 253} {"train_loss": -32.78022384643555, "global_step": 30660, "epoch": 253} {"train_loss": -32.1630859375, "global_step": 30661, "epoch": 253} {"train_loss": -32.38076400756836, "global_step": 30662, "epoch": 253} {"train_loss": -32.5998649597168, "global_step": 30663, "epoch": 253} {"train_loss": -32.66071319580078, "global_step": 30664, "epoch": 253} {"train_loss": -32.541595458984375, "global_step": 30665, "epoch": 253} {"train_loss": -32.337928771972656, "global_step": 30666, "epoch": 253} {"train_loss": -32.740657806396484, "global_step": 30667, "epoch": 253} {"train_loss": -32.90934371948242, "global_step": 30668, "epoch": 253} {"train_loss": -32.140968322753906, "global_step": 30669, "epoch": 253} {"train_loss": -32.530120849609375, "global_step": 30670, "epoch": 253} {"train_loss": -32.77484130859375, "global_step": 30671, "epoch": 253} {"train_loss": -33.185813903808594, "global_step": 30672, "epoch": 253} {"train_loss": -33.13270568847656, "global_step": 30673, "epoch": 253} {"train_loss": -32.22970199584961, "global_step": 30674, "epoch": 253} {"train_loss": -32.23746109008789, "global_step": 30675, "epoch": 253} {"train_loss": -32.5192756652832, "global_step": 30676, "epoch": 253} {"train_loss": -32.827327728271484, "global_step": 30677, "epoch": 253} {"train_loss": -32.955745697021484, "global_step": 30678, "epoch": 253} {"train_loss": -31.84425163269043, "global_step": 30679, "epoch": 253} {"train_loss": -32.77171325683594, "global_step": 30680, "epoch": 253} {"train_loss": -32.92281723022461, "global_step": 30681, "epoch": 253} {"train_loss": -32.99990463256836, "global_step": 30682, "epoch": 253} {"train_loss": -33.29742431640625, "global_step": 30683, "epoch": 253} {"train_loss": -33.020538330078125, "global_step": 30684, "epoch": 253} {"train_loss": -32.79695129394531, "global_step": 30685, "epoch": 253} {"train_loss": -32.645538330078125, "global_step": 30686, "epoch": 253} {"train_loss": -33.00984573364258, "global_step": 30687, "epoch": 253} {"train_loss": -32.68423080444336, "global_step": 30688, "epoch": 253} {"train_loss": -33.31459045410156, "global_step": 30689, "epoch": 253} {"train_loss": -32.707603454589844, "global_step": 30690, "epoch": 253} {"train_loss": -32.55526351928711, "global_step": 30691, "epoch": 253} {"train_loss": -33.373260498046875, "global_step": 30692, "epoch": 253} {"train_loss": -33.01848602294922, "global_step": 30693, "epoch": 253} {"train_loss": -32.702754974365234, "global_step": 30694, "epoch": 253} {"train_loss": -32.8680305480957, "global_step": 30695, "epoch": 253} {"train_loss": -32.4423713684082, "global_step": 30696, "epoch": 253} {"train_loss": -32.04372024536133, "global_step": 30697, "epoch": 253} {"train_loss": -33.21421432495117, "global_step": 30698, "epoch": 253} {"train_loss": -33.19565963745117, "global_step": 30699, "epoch": 253} {"train_loss": -32.877655029296875, "global_step": 30700, "epoch": 253} {"train_loss": -33.38508987426758, "global_step": 30701, "epoch": 253} {"train_loss": -33.379119873046875, "global_step": 30702, "epoch": 253} {"train_loss": -32.93736267089844, "global_step": 30703, "epoch": 253} {"train_loss": -32.738399505615234, "global_step": 30704, "epoch": 253} {"train_loss": -32.742469787597656, "global_step": 30705, "epoch": 253} {"train_loss": -31.300466537475586, "global_step": 30706, "epoch": 253} {"train_loss": -29.822546005249023, "global_step": 30707, "epoch": 253} {"train_loss": -21.800798416137695, "global_step": 30708, "epoch": 253} {"train_loss": -7.186737060546875, "global_step": 30709, "epoch": 253} {"train_loss": -7.2515549659729, "global_step": 30710, "epoch": 253} {"train_loss": -30.563684463500977, "global_step": 30711, "epoch": 253} {"train_loss": -20.5013484954834, "global_step": 30712, "epoch": 253} {"train_loss": -30.63565444946289, "global_step": 30713, "epoch": 253} {"train_loss": -24.075307846069336, "global_step": 30714, "epoch": 253} {"train_loss": -28.115558624267578, "global_step": 30715, "epoch": 253} {"train_loss": -30.67999839782715, "global_step": 30716, "epoch": 253} {"train_loss": -27.27768898010254, "global_step": 30717, "epoch": 253} {"train_loss": -28.083127975463867, "global_step": 30718, "epoch": 253} {"train_loss": -31.0119571685791, "global_step": 30719, "epoch": 253} {"train_loss": -28.717260360717773, "global_step": 30720, "epoch": 253} {"train_loss": -29.718313217163086, "global_step": 30721, "epoch": 253} {"train_loss": -29.9117431640625, "global_step": 30722, "epoch": 253} {"train_loss": -30.48774528503418, "global_step": 30723, "epoch": 253} {"train_loss": -31.23255729675293, "global_step": 30724, "epoch": 253} {"train_loss": -30.188068389892578, "global_step": 30725, "epoch": 253} {"train_loss": -30.683135986328125, "global_step": 30726, "epoch": 253} {"train_loss": -29.847442626953125, "global_step": 30727, "epoch": 253} {"train_loss": -31.481481552124023, "global_step": 30728, "epoch": 253} {"train_loss": -30.759618759155273, "global_step": 30729, "epoch": 253} {"train_loss": -31.512609481811523, "global_step": 30730, "epoch": 253} {"train_loss": -31.187122344970703, "global_step": 30731, "epoch": 253} {"train_loss": -31.19160270690918, "global_step": 30732, "epoch": 253} {"train_loss": -31.326217718360837, "global_step": 30733, "epoch": 253, "val_loss": 2693295.75} {"train_loss": -31.0870418548584, "global_step": 30734, "epoch": 254} {"train_loss": -31.66645622253418, "global_step": 30735, "epoch": 254} {"train_loss": -31.41326904296875, "global_step": 30736, "epoch": 254} {"train_loss": -31.937097549438477, "global_step": 30737, "epoch": 254} {"train_loss": -31.962766647338867, "global_step": 30738, "epoch": 254} {"train_loss": -31.526662826538086, "global_step": 30739, "epoch": 254} {"train_loss": -31.717254638671875, "global_step": 30740, "epoch": 254} {"train_loss": -32.06906509399414, "global_step": 30741, "epoch": 254} {"train_loss": -32.0248908996582, "global_step": 30742, "epoch": 254} {"train_loss": -32.417144775390625, "global_step": 30743, "epoch": 254} {"train_loss": -32.12666320800781, "global_step": 30744, "epoch": 254} {"train_loss": -32.23903274536133, "global_step": 30745, "epoch": 254} {"train_loss": -32.2168083190918, "global_step": 30746, "epoch": 254} {"train_loss": -32.21516036987305, "global_step": 30747, "epoch": 254} {"train_loss": -32.3574333190918, "global_step": 30748, "epoch": 254} {"train_loss": -32.351200103759766, "global_step": 30749, "epoch": 254} {"train_loss": -32.337684631347656, "global_step": 30750, "epoch": 254} {"train_loss": -32.5745964050293, "global_step": 30751, "epoch": 254} {"train_loss": -32.56218338012695, "global_step": 30752, "epoch": 254} {"train_loss": -31.87806510925293, "global_step": 30753, "epoch": 254} {"train_loss": -31.374862670898438, "global_step": 30754, "epoch": 254} {"train_loss": -31.7404842376709, "global_step": 30755, "epoch": 254} {"train_loss": -32.35866928100586, "global_step": 30756, "epoch": 254} {"train_loss": -31.19473648071289, "global_step": 30757, "epoch": 254} {"train_loss": -31.423480987548828, "global_step": 30758, "epoch": 254} {"train_loss": -32.39876937866211, "global_step": 30759, "epoch": 254} {"train_loss": -31.504194259643555, "global_step": 30760, "epoch": 254} {"train_loss": -32.235633850097656, "global_step": 30761, "epoch": 254} {"train_loss": -32.34494400024414, "global_step": 30762, "epoch": 254} {"train_loss": -32.389190673828125, "global_step": 30763, "epoch": 254} {"train_loss": -32.2309455871582, "global_step": 30764, "epoch": 254} {"train_loss": -32.270511627197266, "global_step": 30765, "epoch": 254} {"train_loss": -32.479278564453125, "global_step": 30766, "epoch": 254} {"train_loss": -31.372161865234375, "global_step": 30767, "epoch": 254} {"train_loss": -31.887588500976562, "global_step": 30768, "epoch": 254} {"train_loss": -31.912656784057617, "global_step": 30769, "epoch": 254} {"train_loss": -32.55009460449219, "global_step": 30770, "epoch": 254} {"train_loss": -31.49442481994629, "global_step": 30771, "epoch": 254} {"train_loss": -32.47138214111328, "global_step": 30772, "epoch": 254} {"train_loss": -32.39413070678711, "global_step": 30773, "epoch": 254} {"train_loss": -32.63949203491211, "global_step": 30774, "epoch": 254} {"train_loss": -32.22811508178711, "global_step": 30775, "epoch": 254} {"train_loss": -31.96380043029785, "global_step": 30776, "epoch": 254} {"train_loss": -32.33028793334961, "global_step": 30777, "epoch": 254} {"train_loss": -32.72174835205078, "global_step": 30778, "epoch": 254} {"train_loss": -32.2475700378418, "global_step": 30779, "epoch": 254} {"train_loss": -32.08647537231445, "global_step": 30780, "epoch": 254} {"train_loss": -32.58305740356445, "global_step": 30781, "epoch": 254} {"train_loss": -32.49579620361328, "global_step": 30782, "epoch": 254} {"train_loss": -32.242061614990234, "global_step": 30783, "epoch": 254} {"train_loss": -31.744709014892578, "global_step": 30784, "epoch": 254} {"train_loss": -31.860172271728516, "global_step": 30785, "epoch": 254} {"train_loss": -31.301807403564453, "global_step": 30786, "epoch": 254} {"train_loss": -32.44768142700195, "global_step": 30787, "epoch": 254} {"train_loss": -31.9166259765625, "global_step": 30788, "epoch": 254} {"train_loss": -31.803613662719727, "global_step": 30789, "epoch": 254} {"train_loss": -32.03269958496094, "global_step": 30790, "epoch": 254} {"train_loss": -32.1114616394043, "global_step": 30791, "epoch": 254} {"train_loss": -32.580718994140625, "global_step": 30792, "epoch": 254} {"train_loss": -31.770191192626953, "global_step": 30793, "epoch": 254} {"train_loss": -32.16695022583008, "global_step": 30794, "epoch": 254} {"train_loss": -31.683507919311523, "global_step": 30795, "epoch": 254} {"train_loss": -32.33255386352539, "global_step": 30796, "epoch": 254} {"train_loss": -32.360145568847656, "global_step": 30797, "epoch": 254} {"train_loss": -32.20105743408203, "global_step": 30798, "epoch": 254} {"train_loss": -31.962818145751953, "global_step": 30799, "epoch": 254} {"train_loss": -32.29984664916992, "global_step": 30800, "epoch": 254} {"train_loss": -32.24227523803711, "global_step": 30801, "epoch": 254} {"train_loss": -31.79475975036621, "global_step": 30802, "epoch": 254} {"train_loss": -31.62030601501465, "global_step": 30803, "epoch": 254} {"train_loss": -32.270565032958984, "global_step": 30804, "epoch": 254} {"train_loss": -32.27589797973633, "global_step": 30805, "epoch": 254} {"train_loss": -31.423749923706055, "global_step": 30806, "epoch": 254} {"train_loss": -31.808462142944336, "global_step": 30807, "epoch": 254} {"train_loss": -30.90447998046875, "global_step": 30808, "epoch": 254} {"train_loss": -29.40955924987793, "global_step": 30809, "epoch": 254} {"train_loss": -24.00971794128418, "global_step": 30810, "epoch": 254} {"train_loss": -22.636260986328125, "global_step": 30811, "epoch": 254} {"train_loss": -28.4364070892334, "global_step": 30812, "epoch": 254} {"train_loss": -32.1141242980957, "global_step": 30813, "epoch": 254} {"train_loss": -29.691747665405273, "global_step": 30814, "epoch": 254} {"train_loss": -31.104618072509766, "global_step": 30815, "epoch": 254} {"train_loss": -32.25859451293945, "global_step": 30816, "epoch": 254} {"train_loss": -30.516916275024414, "global_step": 30817, "epoch": 254} {"train_loss": -31.694421768188477, "global_step": 30818, "epoch": 254} {"train_loss": -30.762739181518555, "global_step": 30819, "epoch": 254} {"train_loss": -30.972320556640625, "global_step": 30820, "epoch": 254} {"train_loss": -31.38360023498535, "global_step": 30821, "epoch": 254} {"train_loss": -30.094202041625977, "global_step": 30822, "epoch": 254} {"train_loss": -31.089269638061523, "global_step": 30823, "epoch": 254} {"train_loss": -30.678190231323242, "global_step": 30824, "epoch": 254} {"train_loss": -31.32181167602539, "global_step": 30825, "epoch": 254} {"train_loss": -30.480213165283203, "global_step": 30826, "epoch": 254} {"train_loss": -30.633886337280273, "global_step": 30827, "epoch": 254} {"train_loss": -31.591480255126953, "global_step": 30828, "epoch": 254} {"train_loss": -31.15777587890625, "global_step": 30829, "epoch": 254} {"train_loss": -31.809003829956055, "global_step": 30830, "epoch": 254} {"train_loss": -31.18062400817871, "global_step": 30831, "epoch": 254} {"train_loss": -31.831022262573242, "global_step": 30832, "epoch": 254} {"train_loss": -31.295881271362305, "global_step": 30833, "epoch": 254} {"train_loss": -31.56769371032715, "global_step": 30834, "epoch": 254} {"train_loss": -31.565143585205078, "global_step": 30835, "epoch": 254} {"train_loss": -31.198657989501953, "global_step": 30836, "epoch": 254} {"train_loss": -31.62154197692871, "global_step": 30837, "epoch": 254} {"train_loss": -32.08950424194336, "global_step": 30838, "epoch": 254} {"train_loss": -31.576709747314453, "global_step": 30839, "epoch": 254} {"train_loss": -31.558835983276367, "global_step": 30840, "epoch": 254} {"train_loss": -32.0081787109375, "global_step": 30841, "epoch": 254} {"train_loss": -31.8322696685791, "global_step": 30842, "epoch": 254} {"train_loss": -31.63239097595215, "global_step": 30843, "epoch": 254} {"train_loss": -32.3169059753418, "global_step": 30844, "epoch": 254} {"train_loss": -30.92840003967285, "global_step": 30845, "epoch": 254} {"train_loss": -31.922412872314453, "global_step": 30846, "epoch": 254} {"train_loss": -32.06898498535156, "global_step": 30847, "epoch": 254} {"train_loss": -31.384830474853516, "global_step": 30848, "epoch": 254} {"train_loss": -31.613525390625, "global_step": 30849, "epoch": 254} {"train_loss": -31.738330841064453, "global_step": 30850, "epoch": 254} {"train_loss": -31.52741813659668, "global_step": 30851, "epoch": 254} {"train_loss": -31.00600242614746, "global_step": 30852, "epoch": 254} {"train_loss": -32.17524337768555, "global_step": 30853, "epoch": 254} {"train_loss": -31.62065048848302, "global_step": 30854, "epoch": 254, "val_loss": 2958469.25} {"train_loss": -32.214576721191406, "global_step": 30855, "epoch": 255} {"train_loss": -31.65411949157715, "global_step": 30856, "epoch": 255} {"train_loss": -31.16619873046875, "global_step": 30857, "epoch": 255} {"train_loss": -31.05377197265625, "global_step": 30858, "epoch": 255} {"train_loss": -31.272077560424805, "global_step": 30859, "epoch": 255} {"train_loss": -32.01087951660156, "global_step": 30860, "epoch": 255} {"train_loss": -32.3157844543457, "global_step": 30861, "epoch": 255} {"train_loss": -31.37884521484375, "global_step": 30862, "epoch": 255} {"train_loss": -32.715145111083984, "global_step": 30863, "epoch": 255} {"train_loss": -32.066341400146484, "global_step": 30864, "epoch": 255} {"train_loss": -32.02043533325195, "global_step": 30865, "epoch": 255} {"train_loss": -31.49964714050293, "global_step": 30866, "epoch": 255} {"train_loss": -31.723657608032227, "global_step": 30867, "epoch": 255} {"train_loss": -31.642414093017578, "global_step": 30868, "epoch": 255} {"train_loss": -32.094425201416016, "global_step": 30869, "epoch": 255} {"train_loss": -32.28217697143555, "global_step": 30870, "epoch": 255} {"train_loss": -32.096290588378906, "global_step": 30871, "epoch": 255} {"train_loss": -32.4073486328125, "global_step": 30872, "epoch": 255} {"train_loss": -31.85688591003418, "global_step": 30873, "epoch": 255} {"train_loss": -32.33488845825195, "global_step": 30874, "epoch": 255} {"train_loss": -32.67231369018555, "global_step": 30875, "epoch": 255} {"train_loss": -32.17385482788086, "global_step": 30876, "epoch": 255} {"train_loss": -31.570999145507812, "global_step": 30877, "epoch": 255} {"train_loss": -31.969079971313477, "global_step": 30878, "epoch": 255} {"train_loss": -32.168556213378906, "global_step": 30879, "epoch": 255} {"train_loss": -32.41065216064453, "global_step": 30880, "epoch": 255} {"train_loss": -31.954334259033203, "global_step": 30881, "epoch": 255} {"train_loss": -32.37332534790039, "global_step": 30882, "epoch": 255} {"train_loss": -32.5941047668457, "global_step": 30883, "epoch": 255} {"train_loss": -32.21664047241211, "global_step": 30884, "epoch": 255} {"train_loss": -32.53070068359375, "global_step": 30885, "epoch": 255} {"train_loss": -32.85121536254883, "global_step": 30886, "epoch": 255} {"train_loss": -32.43105697631836, "global_step": 30887, "epoch": 255} {"train_loss": -32.769073486328125, "global_step": 30888, "epoch": 255} {"train_loss": -32.64509201049805, "global_step": 30889, "epoch": 255} {"train_loss": -31.8265438079834, "global_step": 30890, "epoch": 255} {"train_loss": -32.358184814453125, "global_step": 30891, "epoch": 255} {"train_loss": -32.84646224975586, "global_step": 30892, "epoch": 255} {"train_loss": -32.12778854370117, "global_step": 30893, "epoch": 255} {"train_loss": -30.91743278503418, "global_step": 30894, "epoch": 255} {"train_loss": -32.21928787231445, "global_step": 30895, "epoch": 255} {"train_loss": -32.70260238647461, "global_step": 30896, "epoch": 255} {"train_loss": -31.833465576171875, "global_step": 30897, "epoch": 255} {"train_loss": -32.81120681762695, "global_step": 30898, "epoch": 255} {"train_loss": -32.56570053100586, "global_step": 30899, "epoch": 255} {"train_loss": -32.29060745239258, "global_step": 30900, "epoch": 255} {"train_loss": -32.29276657104492, "global_step": 30901, "epoch": 255} {"train_loss": -32.30630111694336, "global_step": 30902, "epoch": 255} {"train_loss": -32.35811233520508, "global_step": 30903, "epoch": 255} {"train_loss": -33.05256652832031, "global_step": 30904, "epoch": 255} {"train_loss": -31.804651260375977, "global_step": 30905, "epoch": 255} {"train_loss": -32.27006912231445, "global_step": 30906, "epoch": 255} {"train_loss": -32.811824798583984, "global_step": 30907, "epoch": 255} {"train_loss": -31.75754737854004, "global_step": 30908, "epoch": 255} {"train_loss": -33.08330535888672, "global_step": 30909, "epoch": 255} {"train_loss": -32.34463119506836, "global_step": 30910, "epoch": 255} {"train_loss": -32.7662353515625, "global_step": 30911, "epoch": 255} {"train_loss": -32.15631103515625, "global_step": 30912, "epoch": 255} {"train_loss": -31.814966201782227, "global_step": 30913, "epoch": 255} {"train_loss": -32.45981979370117, "global_step": 30914, "epoch": 255} {"train_loss": -31.66424560546875, "global_step": 30915, "epoch": 255} {"train_loss": -32.00556564331055, "global_step": 30916, "epoch": 255} {"train_loss": -32.529972076416016, "global_step": 30917, "epoch": 255} {"train_loss": -31.98774528503418, "global_step": 30918, "epoch": 255} {"train_loss": -32.34585189819336, "global_step": 30919, "epoch": 255} {"train_loss": -32.00491714477539, "global_step": 30920, "epoch": 255} {"train_loss": -32.954811096191406, "global_step": 30921, "epoch": 255} {"train_loss": -31.882116317749023, "global_step": 30922, "epoch": 255} {"train_loss": -32.81449508666992, "global_step": 30923, "epoch": 255} {"train_loss": -32.15732955932617, "global_step": 30924, "epoch": 255} {"train_loss": -32.85895919799805, "global_step": 30925, "epoch": 255} {"train_loss": -32.47393035888672, "global_step": 30926, "epoch": 255} {"train_loss": -32.836158752441406, "global_step": 30927, "epoch": 255} {"train_loss": -32.9850959777832, "global_step": 30928, "epoch": 255} {"train_loss": -33.003578186035156, "global_step": 30929, "epoch": 255} {"train_loss": -32.61111831665039, "global_step": 30930, "epoch": 255} {"train_loss": -33.00916290283203, "global_step": 30931, "epoch": 255} {"train_loss": -32.944480895996094, "global_step": 30932, "epoch": 255} {"train_loss": -32.8740348815918, "global_step": 30933, "epoch": 255} {"train_loss": -33.16331100463867, "global_step": 30934, "epoch": 255} {"train_loss": -32.787235260009766, "global_step": 30935, "epoch": 255} {"train_loss": -32.946502685546875, "global_step": 30936, "epoch": 255} {"train_loss": -33.10136795043945, "global_step": 30937, "epoch": 255} {"train_loss": -32.13853073120117, "global_step": 30938, "epoch": 255} {"train_loss": -32.9852294921875, "global_step": 30939, "epoch": 255} {"train_loss": -31.805526733398438, "global_step": 30940, "epoch": 255} {"train_loss": -32.80236053466797, "global_step": 30941, "epoch": 255} {"train_loss": -32.23006057739258, "global_step": 30942, "epoch": 255} {"train_loss": -32.66461944580078, "global_step": 30943, "epoch": 255} {"train_loss": -33.24239730834961, "global_step": 30944, "epoch": 255} {"train_loss": -32.35169219970703, "global_step": 30945, "epoch": 255} {"train_loss": -33.008216857910156, "global_step": 30946, "epoch": 255} {"train_loss": -32.992618560791016, "global_step": 30947, "epoch": 255} {"train_loss": -33.02198791503906, "global_step": 30948, "epoch": 255} {"train_loss": -33.17731857299805, "global_step": 30949, "epoch": 255} {"train_loss": -31.732803344726562, "global_step": 30950, "epoch": 255} {"train_loss": -32.656982421875, "global_step": 30951, "epoch": 255} {"train_loss": -31.59112548828125, "global_step": 30952, "epoch": 255} {"train_loss": -31.639978408813477, "global_step": 30953, "epoch": 255} {"train_loss": -32.85966110229492, "global_step": 30954, "epoch": 255} {"train_loss": -31.616104125976562, "global_step": 30955, "epoch": 255} {"train_loss": -32.41275405883789, "global_step": 30956, "epoch": 255} {"train_loss": -32.54519271850586, "global_step": 30957, "epoch": 255} {"train_loss": -32.58497619628906, "global_step": 30958, "epoch": 255} {"train_loss": -33.161006927490234, "global_step": 30959, "epoch": 255} {"train_loss": -32.471168518066406, "global_step": 30960, "epoch": 255} {"train_loss": -32.802303314208984, "global_step": 30961, "epoch": 255} {"train_loss": -32.615501403808594, "global_step": 30962, "epoch": 255} {"train_loss": -32.25307083129883, "global_step": 30963, "epoch": 255} {"train_loss": -32.89289474487305, "global_step": 30964, "epoch": 255} {"train_loss": -32.371910095214844, "global_step": 30965, "epoch": 255} {"train_loss": -32.823211669921875, "global_step": 30966, "epoch": 255} {"train_loss": -32.613433837890625, "global_step": 30967, "epoch": 255} {"train_loss": -32.37254333496094, "global_step": 30968, "epoch": 255} {"train_loss": -33.04292678833008, "global_step": 30969, "epoch": 255} {"train_loss": -32.40351104736328, "global_step": 30970, "epoch": 255} {"train_loss": -32.67538833618164, "global_step": 30971, "epoch": 255} {"train_loss": -32.25236892700195, "global_step": 30972, "epoch": 255} {"train_loss": -31.37192153930664, "global_step": 30973, "epoch": 255} {"train_loss": -30.5284366607666, "global_step": 30974, "epoch": 255} {"train_loss": -32.341723245037485, "global_step": 30975, "epoch": 255, "val_loss": 2483297.75} {"train_loss": -32.57990646362305, "global_step": 30976, "epoch": 256} {"train_loss": -32.390071868896484, "global_step": 30977, "epoch": 256} {"train_loss": -32.03291320800781, "global_step": 30978, "epoch": 256} {"train_loss": -30.644620895385742, "global_step": 30979, "epoch": 256} {"train_loss": -30.948781967163086, "global_step": 30980, "epoch": 256} {"train_loss": -32.9843635559082, "global_step": 30981, "epoch": 256} {"train_loss": -32.15190505981445, "global_step": 30982, "epoch": 256} {"train_loss": -31.60310935974121, "global_step": 30983, "epoch": 256} {"train_loss": -31.95941162109375, "global_step": 30984, "epoch": 256} {"train_loss": -33.26033401489258, "global_step": 30985, "epoch": 256} {"train_loss": -32.096126556396484, "global_step": 30986, "epoch": 256} {"train_loss": -32.12173080444336, "global_step": 30987, "epoch": 256} {"train_loss": -32.94658279418945, "global_step": 30988, "epoch": 256} {"train_loss": -32.3220100402832, "global_step": 30989, "epoch": 256} {"train_loss": -32.90410232543945, "global_step": 30990, "epoch": 256} {"train_loss": -32.85938262939453, "global_step": 30991, "epoch": 256} {"train_loss": -32.58406448364258, "global_step": 30992, "epoch": 256} {"train_loss": -31.770511627197266, "global_step": 30993, "epoch": 256} {"train_loss": -32.858856201171875, "global_step": 30994, "epoch": 256} {"train_loss": -33.1851921081543, "global_step": 30995, "epoch": 256} {"train_loss": -33.20167541503906, "global_step": 30996, "epoch": 256} {"train_loss": -32.69150924682617, "global_step": 30997, "epoch": 256} {"train_loss": -31.860197067260742, "global_step": 30998, "epoch": 256} {"train_loss": -31.787729263305664, "global_step": 30999, "epoch": 256} {"train_loss": -33.165279388427734, "global_step": 31000, "epoch": 256} {"train_loss": -33.02250289916992, "global_step": 31001, "epoch": 256} {"train_loss": -32.22841262817383, "global_step": 31002, "epoch": 256} {"train_loss": -31.786725997924805, "global_step": 31003, "epoch": 256} {"train_loss": -31.788013458251953, "global_step": 31004, "epoch": 256} {"train_loss": -32.81950759887695, "global_step": 31005, "epoch": 256} {"train_loss": -32.64445114135742, "global_step": 31006, "epoch": 256} {"train_loss": -32.691444396972656, "global_step": 31007, "epoch": 256} {"train_loss": -32.90784454345703, "global_step": 31008, "epoch": 256} {"train_loss": -32.450927734375, "global_step": 31009, "epoch": 256} {"train_loss": -33.3520622253418, "global_step": 31010, "epoch": 256} {"train_loss": -33.22906494140625, "global_step": 31011, "epoch": 256} {"train_loss": -33.45701217651367, "global_step": 31012, "epoch": 256} {"train_loss": -32.86747741699219, "global_step": 31013, "epoch": 256} {"train_loss": -33.32486343383789, "global_step": 31014, "epoch": 256} {"train_loss": -32.291900634765625, "global_step": 31015, "epoch": 256} {"train_loss": -32.98616027832031, "global_step": 31016, "epoch": 256} {"train_loss": -32.76081466674805, "global_step": 31017, "epoch": 256} {"train_loss": -32.68474197387695, "global_step": 31018, "epoch": 256} {"train_loss": -32.83272171020508, "global_step": 31019, "epoch": 256} {"train_loss": -32.79833984375, "global_step": 31020, "epoch": 256} {"train_loss": -32.15853500366211, "global_step": 31021, "epoch": 256} {"train_loss": -32.8016471862793, "global_step": 31022, "epoch": 256} {"train_loss": -31.779922485351562, "global_step": 31023, "epoch": 256} {"train_loss": -31.915563583374023, "global_step": 31024, "epoch": 256} {"train_loss": -32.759883880615234, "global_step": 31025, "epoch": 256} {"train_loss": -32.277984619140625, "global_step": 31026, "epoch": 256} {"train_loss": -32.8492317199707, "global_step": 31027, "epoch": 256} {"train_loss": -33.14531707763672, "global_step": 31028, "epoch": 256} {"train_loss": -32.222877502441406, "global_step": 31029, "epoch": 256} {"train_loss": -32.90724182128906, "global_step": 31030, "epoch": 256} {"train_loss": -32.33272933959961, "global_step": 31031, "epoch": 256} {"train_loss": -32.31289291381836, "global_step": 31032, "epoch": 256} {"train_loss": -32.84566879272461, "global_step": 31033, "epoch": 256} {"train_loss": -32.4618034362793, "global_step": 31034, "epoch": 256} {"train_loss": -32.720516204833984, "global_step": 31035, "epoch": 256} {"train_loss": -33.03298568725586, "global_step": 31036, "epoch": 256} {"train_loss": -33.09772491455078, "global_step": 31037, "epoch": 256} {"train_loss": -32.88190841674805, "global_step": 31038, "epoch": 256} {"train_loss": -32.307491302490234, "global_step": 31039, "epoch": 256} {"train_loss": -32.5694694519043, "global_step": 31040, "epoch": 256} {"train_loss": -33.22420120239258, "global_step": 31041, "epoch": 256} {"train_loss": -33.05867004394531, "global_step": 31042, "epoch": 256} {"train_loss": -32.25502395629883, "global_step": 31043, "epoch": 256} {"train_loss": -32.907257080078125, "global_step": 31044, "epoch": 256} {"train_loss": -32.486148834228516, "global_step": 31045, "epoch": 256} {"train_loss": -33.4289665222168, "global_step": 31046, "epoch": 256} {"train_loss": -32.72135543823242, "global_step": 31047, "epoch": 256} {"train_loss": -32.87340545654297, "global_step": 31048, "epoch": 256} {"train_loss": -33.221435546875, "global_step": 31049, "epoch": 256} {"train_loss": -33.20938491821289, "global_step": 31050, "epoch": 256} {"train_loss": -33.0156364440918, "global_step": 31051, "epoch": 256} {"train_loss": -32.5054931640625, "global_step": 31052, "epoch": 256} {"train_loss": -32.36787033081055, "global_step": 31053, "epoch": 256} {"train_loss": -32.67922592163086, "global_step": 31054, "epoch": 256} {"train_loss": -33.202606201171875, "global_step": 31055, "epoch": 256} {"train_loss": -33.49345779418945, "global_step": 31056, "epoch": 256} {"train_loss": -33.30952072143555, "global_step": 31057, "epoch": 256} {"train_loss": -33.02121353149414, "global_step": 31058, "epoch": 256} {"train_loss": -33.016693115234375, "global_step": 31059, "epoch": 256} {"train_loss": -30.42591667175293, "global_step": 31060, "epoch": 256} {"train_loss": -28.162092208862305, "global_step": 31061, "epoch": 256} {"train_loss": -29.999048233032227, "global_step": 31062, "epoch": 256} {"train_loss": -32.95635986328125, "global_step": 31063, "epoch": 256} {"train_loss": -31.149261474609375, "global_step": 31064, "epoch": 256} {"train_loss": -26.63038444519043, "global_step": 31065, "epoch": 256} {"train_loss": -26.322355270385742, "global_step": 31066, "epoch": 256} {"train_loss": -32.04529571533203, "global_step": 31067, "epoch": 256} {"train_loss": -30.91652488708496, "global_step": 31068, "epoch": 256} {"train_loss": -31.003812789916992, "global_step": 31069, "epoch": 256} {"train_loss": -31.11408042907715, "global_step": 31070, "epoch": 256} {"train_loss": -29.748249053955078, "global_step": 31071, "epoch": 256} {"train_loss": -30.548583984375, "global_step": 31072, "epoch": 256} {"train_loss": -29.360187530517578, "global_step": 31073, "epoch": 256} {"train_loss": -29.515668869018555, "global_step": 31074, "epoch": 256} {"train_loss": -31.21893882751465, "global_step": 31075, "epoch": 256} {"train_loss": -30.228479385375977, "global_step": 31076, "epoch": 256} {"train_loss": -30.670507431030273, "global_step": 31077, "epoch": 256} {"train_loss": -32.42437744140625, "global_step": 31078, "epoch": 256} {"train_loss": -30.905073165893555, "global_step": 31079, "epoch": 256} {"train_loss": -30.72324562072754, "global_step": 31080, "epoch": 256} {"train_loss": -29.867334365844727, "global_step": 31081, "epoch": 256} {"train_loss": -31.082944869995117, "global_step": 31082, "epoch": 256} {"train_loss": -31.39154624938965, "global_step": 31083, "epoch": 256} {"train_loss": -30.66159439086914, "global_step": 31084, "epoch": 256} {"train_loss": -32.47828674316406, "global_step": 31085, "epoch": 256} {"train_loss": -31.117401123046875, "global_step": 31086, "epoch": 256} {"train_loss": -31.853803634643555, "global_step": 31087, "epoch": 256} {"train_loss": -32.28279495239258, "global_step": 31088, "epoch": 256} {"train_loss": -31.47296714782715, "global_step": 31089, "epoch": 256} {"train_loss": -31.9598445892334, "global_step": 31090, "epoch": 256} {"train_loss": -32.24906539916992, "global_step": 31091, "epoch": 256} {"train_loss": -31.860218048095703, "global_step": 31092, "epoch": 256} {"train_loss": -32.66797637939453, "global_step": 31093, "epoch": 256} {"train_loss": -32.13417434692383, "global_step": 31094, "epoch": 256} {"train_loss": -32.51180648803711, "global_step": 31095, "epoch": 256} {"train_loss": -32.10928759299034, "global_step": 31096, "epoch": 256, "val_loss": 2668746.75} {"train_loss": -32.57481002807617, "global_step": 31097, "epoch": 257} {"train_loss": -32.51519775390625, "global_step": 31098, "epoch": 257} {"train_loss": -32.81549835205078, "global_step": 31099, "epoch": 257} {"train_loss": -32.57088851928711, "global_step": 31100, "epoch": 257} {"train_loss": -32.509910583496094, "global_step": 31101, "epoch": 257} {"train_loss": -32.20152282714844, "global_step": 31102, "epoch": 257} {"train_loss": -32.522361755371094, "global_step": 31103, "epoch": 257} {"train_loss": -32.42948532104492, "global_step": 31104, "epoch": 257} {"train_loss": -32.03389358520508, "global_step": 31105, "epoch": 257} {"train_loss": -32.938289642333984, "global_step": 31106, "epoch": 257} {"train_loss": -31.936420440673828, "global_step": 31107, "epoch": 257} {"train_loss": -32.916500091552734, "global_step": 31108, "epoch": 257} {"train_loss": -32.53542709350586, "global_step": 31109, "epoch": 257} {"train_loss": -32.536354064941406, "global_step": 31110, "epoch": 257} {"train_loss": -32.590694427490234, "global_step": 31111, "epoch": 257} {"train_loss": -32.52455520629883, "global_step": 31112, "epoch": 257} {"train_loss": -32.332786560058594, "global_step": 31113, "epoch": 257} {"train_loss": -33.178951263427734, "global_step": 31114, "epoch": 257} {"train_loss": -32.36198425292969, "global_step": 31115, "epoch": 257} {"train_loss": -33.45111083984375, "global_step": 31116, "epoch": 257} {"train_loss": -32.45196533203125, "global_step": 31117, "epoch": 257} {"train_loss": -32.66498947143555, "global_step": 31118, "epoch": 257} {"train_loss": -33.06136703491211, "global_step": 31119, "epoch": 257} {"train_loss": -33.155879974365234, "global_step": 31120, "epoch": 257} {"train_loss": -32.95472717285156, "global_step": 31121, "epoch": 257} {"train_loss": -33.038333892822266, "global_step": 31122, "epoch": 257} {"train_loss": -32.7874641418457, "global_step": 31123, "epoch": 257} {"train_loss": -33.145362854003906, "global_step": 31124, "epoch": 257} {"train_loss": -32.7655029296875, "global_step": 31125, "epoch": 257} {"train_loss": -33.186458587646484, "global_step": 31126, "epoch": 257} {"train_loss": -33.19572067260742, "global_step": 31127, "epoch": 257} {"train_loss": -33.049835205078125, "global_step": 31128, "epoch": 257} {"train_loss": -33.03221893310547, "global_step": 31129, "epoch": 257} {"train_loss": -32.91935729980469, "global_step": 31130, "epoch": 257} {"train_loss": -33.28935623168945, "global_step": 31131, "epoch": 257} {"train_loss": -33.28078842163086, "global_step": 31132, "epoch": 257} {"train_loss": -33.0756950378418, "global_step": 31133, "epoch": 257} {"train_loss": -33.21077346801758, "global_step": 31134, "epoch": 257} {"train_loss": -33.58665084838867, "global_step": 31135, "epoch": 257} {"train_loss": -33.454872131347656, "global_step": 31136, "epoch": 257} {"train_loss": -33.286842346191406, "global_step": 31137, "epoch": 257} {"train_loss": -33.312374114990234, "global_step": 31138, "epoch": 257} {"train_loss": -32.8843994140625, "global_step": 31139, "epoch": 257} {"train_loss": -33.240211486816406, "global_step": 31140, "epoch": 257} {"train_loss": -32.914363861083984, "global_step": 31141, "epoch": 257} {"train_loss": -33.1457405090332, "global_step": 31142, "epoch": 257} {"train_loss": -32.750423431396484, "global_step": 31143, "epoch": 257} {"train_loss": -32.111019134521484, "global_step": 31144, "epoch": 257} {"train_loss": -30.960657119750977, "global_step": 31145, "epoch": 257} {"train_loss": -29.074203491210938, "global_step": 31146, "epoch": 257} {"train_loss": -25.85196876525879, "global_step": 31147, "epoch": 257} {"train_loss": -18.94436264038086, "global_step": 31148, "epoch": 257} {"train_loss": -6.868052959442139, "global_step": 31149, "epoch": 257} {"train_loss": -21.193151473999023, "global_step": 31150, "epoch": 257} {"train_loss": -27.48141860961914, "global_step": 31151, "epoch": 257} {"train_loss": -23.08024024963379, "global_step": 31152, "epoch": 257} {"train_loss": -29.85731315612793, "global_step": 31153, "epoch": 257} {"train_loss": -30.245014190673828, "global_step": 31154, "epoch": 257} {"train_loss": -26.401426315307617, "global_step": 31155, "epoch": 257} {"train_loss": -31.138731002807617, "global_step": 31156, "epoch": 257} {"train_loss": -29.8078556060791, "global_step": 31157, "epoch": 257} {"train_loss": -28.989120483398438, "global_step": 31158, "epoch": 257} {"train_loss": -31.018964767456055, "global_step": 31159, "epoch": 257} {"train_loss": -30.59539794921875, "global_step": 31160, "epoch": 257} {"train_loss": -29.45523452758789, "global_step": 31161, "epoch": 257} {"train_loss": -30.668506622314453, "global_step": 31162, "epoch": 257} {"train_loss": -30.44208335876465, "global_step": 31163, "epoch": 257} {"train_loss": -30.69134521484375, "global_step": 31164, "epoch": 257} {"train_loss": -30.01700782775879, "global_step": 31165, "epoch": 257} {"train_loss": -30.645111083984375, "global_step": 31166, "epoch": 257} {"train_loss": -31.048236846923828, "global_step": 31167, "epoch": 257} {"train_loss": -31.298328399658203, "global_step": 31168, "epoch": 257} {"train_loss": -30.508466720581055, "global_step": 31169, "epoch": 257} {"train_loss": -31.282907485961914, "global_step": 31170, "epoch": 257} {"train_loss": -31.12482261657715, "global_step": 31171, "epoch": 257} {"train_loss": -31.796646118164062, "global_step": 31172, "epoch": 257} {"train_loss": -31.52528190612793, "global_step": 31173, "epoch": 257} {"train_loss": -31.895795822143555, "global_step": 31174, "epoch": 257} {"train_loss": -31.45224380493164, "global_step": 31175, "epoch": 257} {"train_loss": -31.373926162719727, "global_step": 31176, "epoch": 257} {"train_loss": -32.21430206298828, "global_step": 31177, "epoch": 257} {"train_loss": -31.949604034423828, "global_step": 31178, "epoch": 257} {"train_loss": -32.09463119506836, "global_step": 31179, "epoch": 257} {"train_loss": -32.22695541381836, "global_step": 31180, "epoch": 257} {"train_loss": -32.15869140625, "global_step": 31181, "epoch": 257} {"train_loss": -32.185787200927734, "global_step": 31182, "epoch": 257} {"train_loss": -32.17222213745117, "global_step": 31183, "epoch": 257} {"train_loss": -32.04509353637695, "global_step": 31184, "epoch": 257} {"train_loss": -32.35811996459961, "global_step": 31185, "epoch": 257} {"train_loss": -32.4112548828125, "global_step": 31186, "epoch": 257} {"train_loss": -32.414833068847656, "global_step": 31187, "epoch": 257} {"train_loss": -32.748809814453125, "global_step": 31188, "epoch": 257} {"train_loss": -32.830013275146484, "global_step": 31189, "epoch": 257} {"train_loss": -32.712158203125, "global_step": 31190, "epoch": 257} {"train_loss": -32.6025276184082, "global_step": 31191, "epoch": 257} {"train_loss": -32.80978012084961, "global_step": 31192, "epoch": 257} {"train_loss": -32.803466796875, "global_step": 31193, "epoch": 257} {"train_loss": -32.87126541137695, "global_step": 31194, "epoch": 257} {"train_loss": -32.52423095703125, "global_step": 31195, "epoch": 257} {"train_loss": -32.89907455444336, "global_step": 31196, "epoch": 257} {"train_loss": -33.04061508178711, "global_step": 31197, "epoch": 257} {"train_loss": -32.904884338378906, "global_step": 31198, "epoch": 257} {"train_loss": -32.97711944580078, "global_step": 31199, "epoch": 257} {"train_loss": -32.65615463256836, "global_step": 31200, "epoch": 257} {"train_loss": -33.20964813232422, "global_step": 31201, "epoch": 257} {"train_loss": -32.62894821166992, "global_step": 31202, "epoch": 257} {"train_loss": -33.25535202026367, "global_step": 31203, "epoch": 257} {"train_loss": -33.09122848510742, "global_step": 31204, "epoch": 257} {"train_loss": -31.53767967224121, "global_step": 31205, "epoch": 257} {"train_loss": -32.43516159057617, "global_step": 31206, "epoch": 257} {"train_loss": -33.08455276489258, "global_step": 31207, "epoch": 257} {"train_loss": -32.097755432128906, "global_step": 31208, "epoch": 257} {"train_loss": -32.25079345703125, "global_step": 31209, "epoch": 257} {"train_loss": -33.15244674682617, "global_step": 31210, "epoch": 257} {"train_loss": -32.56555938720703, "global_step": 31211, "epoch": 257} {"train_loss": -33.05791091918945, "global_step": 31212, "epoch": 257} {"train_loss": -32.84039306640625, "global_step": 31213, "epoch": 257} {"train_loss": -32.740997314453125, "global_step": 31214, "epoch": 257} {"train_loss": -33.075660705566406, "global_step": 31215, "epoch": 257} {"train_loss": -33.12007522583008, "global_step": 31216, "epoch": 257} {"train_loss": -31.65603312579068, "global_step": 31217, "epoch": 257, "val_loss": 2643926.25} {"train_loss": -33.12824249267578, "global_step": 31218, "epoch": 258} {"train_loss": -32.78448486328125, "global_step": 31219, "epoch": 258} {"train_loss": -32.953468322753906, "global_step": 31220, "epoch": 258} {"train_loss": -32.04881286621094, "global_step": 31221, "epoch": 258} {"train_loss": -32.95991134643555, "global_step": 31222, "epoch": 258} {"train_loss": -32.76133346557617, "global_step": 31223, "epoch": 258} {"train_loss": -32.946067810058594, "global_step": 31224, "epoch": 258} {"train_loss": -33.06014633178711, "global_step": 31225, "epoch": 258} {"train_loss": -32.72055435180664, "global_step": 31226, "epoch": 258} {"train_loss": -33.24234390258789, "global_step": 31227, "epoch": 258} {"train_loss": -32.90974044799805, "global_step": 31228, "epoch": 258} {"train_loss": -32.706825256347656, "global_step": 31229, "epoch": 258} {"train_loss": -33.58466339111328, "global_step": 31230, "epoch": 258} {"train_loss": -33.21864700317383, "global_step": 31231, "epoch": 258} {"train_loss": -32.38755798339844, "global_step": 31232, "epoch": 258} {"train_loss": -32.271141052246094, "global_step": 31233, "epoch": 258} {"train_loss": -31.702878952026367, "global_step": 31234, "epoch": 258} {"train_loss": -31.032541275024414, "global_step": 31235, "epoch": 258} {"train_loss": -30.315603256225586, "global_step": 31236, "epoch": 258} {"train_loss": -30.1163330078125, "global_step": 31237, "epoch": 258} {"train_loss": -29.684619903564453, "global_step": 31238, "epoch": 258} {"train_loss": -30.044233322143555, "global_step": 31239, "epoch": 258} {"train_loss": -31.12128257751465, "global_step": 31240, "epoch": 258} {"train_loss": -31.85101318359375, "global_step": 31241, "epoch": 258} {"train_loss": -32.016357421875, "global_step": 31242, "epoch": 258} {"train_loss": -32.20844268798828, "global_step": 31243, "epoch": 258} {"train_loss": -32.764259338378906, "global_step": 31244, "epoch": 258} {"train_loss": -32.42315673828125, "global_step": 31245, "epoch": 258} {"train_loss": -32.81699752807617, "global_step": 31246, "epoch": 258} {"train_loss": -33.160884857177734, "global_step": 31247, "epoch": 258} {"train_loss": -32.67509078979492, "global_step": 31248, "epoch": 258} {"train_loss": -32.802528381347656, "global_step": 31249, "epoch": 258} {"train_loss": -32.54387664794922, "global_step": 31250, "epoch": 258} {"train_loss": -32.82477569580078, "global_step": 31251, "epoch": 258} {"train_loss": -32.01850509643555, "global_step": 31252, "epoch": 258} {"train_loss": -32.51408386230469, "global_step": 31253, "epoch": 258} {"train_loss": -32.283660888671875, "global_step": 31254, "epoch": 258} {"train_loss": -32.45681381225586, "global_step": 31255, "epoch": 258} {"train_loss": -32.85472869873047, "global_step": 31256, "epoch": 258} {"train_loss": -32.795021057128906, "global_step": 31257, "epoch": 258} {"train_loss": -32.680294036865234, "global_step": 31258, "epoch": 258} {"train_loss": -32.366943359375, "global_step": 31259, "epoch": 258} {"train_loss": -31.801599502563477, "global_step": 31260, "epoch": 258} {"train_loss": -31.298620223999023, "global_step": 31261, "epoch": 258} {"train_loss": -32.68450927734375, "global_step": 31262, "epoch": 258} {"train_loss": -32.24453353881836, "global_step": 31263, "epoch": 258} {"train_loss": -30.579748153686523, "global_step": 31264, "epoch": 258} {"train_loss": -29.700597763061523, "global_step": 31265, "epoch": 258} {"train_loss": -29.424177169799805, "global_step": 31266, "epoch": 258} {"train_loss": -31.49336051940918, "global_step": 31267, "epoch": 258} {"train_loss": -30.124170303344727, "global_step": 31268, "epoch": 258} {"train_loss": -30.761402130126953, "global_step": 31269, "epoch": 258} {"train_loss": -30.434057235717773, "global_step": 31270, "epoch": 258} {"train_loss": -31.347171783447266, "global_step": 31271, "epoch": 258} {"train_loss": -31.389867782592773, "global_step": 31272, "epoch": 258} {"train_loss": -32.33298110961914, "global_step": 31273, "epoch": 258} {"train_loss": -30.945959091186523, "global_step": 31274, "epoch": 258} {"train_loss": -32.16731643676758, "global_step": 31275, "epoch": 258} {"train_loss": -31.2777042388916, "global_step": 31276, "epoch": 258} {"train_loss": -31.645526885986328, "global_step": 31277, "epoch": 258} {"train_loss": -31.671918869018555, "global_step": 31278, "epoch": 258} {"train_loss": -32.155548095703125, "global_step": 31279, "epoch": 258} {"train_loss": -32.01750564575195, "global_step": 31280, "epoch": 258} {"train_loss": -32.11383819580078, "global_step": 31281, "epoch": 258} {"train_loss": -32.44487762451172, "global_step": 31282, "epoch": 258} {"train_loss": -32.28206253051758, "global_step": 31283, "epoch": 258} {"train_loss": -32.07985305786133, "global_step": 31284, "epoch": 258} {"train_loss": -32.637977600097656, "global_step": 31285, "epoch": 258} {"train_loss": -32.54901885986328, "global_step": 31286, "epoch": 258} {"train_loss": -32.486019134521484, "global_step": 31287, "epoch": 258} {"train_loss": -32.17320251464844, "global_step": 31288, "epoch": 258} {"train_loss": -32.471466064453125, "global_step": 31289, "epoch": 258} {"train_loss": -32.619258880615234, "global_step": 31290, "epoch": 258} {"train_loss": -32.522804260253906, "global_step": 31291, "epoch": 258} {"train_loss": -31.687864303588867, "global_step": 31292, "epoch": 258} {"train_loss": -32.63991165161133, "global_step": 31293, "epoch": 258} {"train_loss": -31.959949493408203, "global_step": 31294, "epoch": 258} {"train_loss": -32.685157775878906, "global_step": 31295, "epoch": 258} {"train_loss": -31.592212677001953, "global_step": 31296, "epoch": 258} {"train_loss": -32.68781661987305, "global_step": 31297, "epoch": 258} {"train_loss": -31.050207138061523, "global_step": 31298, "epoch": 258} {"train_loss": -33.12185287475586, "global_step": 31299, "epoch": 258} {"train_loss": -31.158233642578125, "global_step": 31300, "epoch": 258} {"train_loss": -32.07779312133789, "global_step": 31301, "epoch": 258} {"train_loss": -32.92730712890625, "global_step": 31302, "epoch": 258} {"train_loss": -31.870712280273438, "global_step": 31303, "epoch": 258} {"train_loss": -33.099327087402344, "global_step": 31304, "epoch": 258} {"train_loss": -33.28632736206055, "global_step": 31305, "epoch": 258} {"train_loss": -32.3156623840332, "global_step": 31306, "epoch": 258} {"train_loss": -33.35409164428711, "global_step": 31307, "epoch": 258} {"train_loss": -32.7708740234375, "global_step": 31308, "epoch": 258} {"train_loss": -32.762428283691406, "global_step": 31309, "epoch": 258} {"train_loss": -32.4458122253418, "global_step": 31310, "epoch": 258} {"train_loss": -33.13915252685547, "global_step": 31311, "epoch": 258} {"train_loss": -33.26143264770508, "global_step": 31312, "epoch": 258} {"train_loss": -32.762542724609375, "global_step": 31313, "epoch": 258} {"train_loss": -33.14202880859375, "global_step": 31314, "epoch": 258} {"train_loss": -33.964351654052734, "global_step": 31315, "epoch": 258} {"train_loss": -33.0887451171875, "global_step": 31316, "epoch": 258} {"train_loss": -32.96416473388672, "global_step": 31317, "epoch": 258} {"train_loss": -32.69854736328125, "global_step": 31318, "epoch": 258} {"train_loss": -32.72017288208008, "global_step": 31319, "epoch": 258} {"train_loss": -32.38822937011719, "global_step": 31320, "epoch": 258} {"train_loss": -32.30011749267578, "global_step": 31321, "epoch": 258} {"train_loss": -31.72085952758789, "global_step": 31322, "epoch": 258} {"train_loss": -32.358455657958984, "global_step": 31323, "epoch": 258} {"train_loss": -32.90639114379883, "global_step": 31324, "epoch": 258} {"train_loss": -32.7757682800293, "global_step": 31325, "epoch": 258} {"train_loss": -32.72589874267578, "global_step": 31326, "epoch": 258} {"train_loss": -32.08456039428711, "global_step": 31327, "epoch": 258} {"train_loss": -31.48878288269043, "global_step": 31328, "epoch": 258} {"train_loss": -30.556838989257812, "global_step": 31329, "epoch": 258} {"train_loss": -29.932205200195312, "global_step": 31330, "epoch": 258} {"train_loss": -30.603626251220703, "global_step": 31331, "epoch": 258} {"train_loss": -32.10892868041992, "global_step": 31332, "epoch": 258} {"train_loss": -32.44181442260742, "global_step": 31333, "epoch": 258} {"train_loss": -31.787036895751953, "global_step": 31334, "epoch": 258} {"train_loss": -31.674060821533203, "global_step": 31335, "epoch": 258} {"train_loss": -32.01680374145508, "global_step": 31336, "epoch": 258} {"train_loss": -32.647369384765625, "global_step": 31337, "epoch": 258} {"train_loss": -32.16106698532735, "global_step": 31338, "epoch": 258, "val_loss": 2619654.75} {"train_loss": -32.31403732299805, "global_step": 31339, "epoch": 259} {"train_loss": -32.59959030151367, "global_step": 31340, "epoch": 259} {"train_loss": -32.709468841552734, "global_step": 31341, "epoch": 259} {"train_loss": -32.40618896484375, "global_step": 31342, "epoch": 259} {"train_loss": -32.59895706176758, "global_step": 31343, "epoch": 259} {"train_loss": -32.54185104370117, "global_step": 31344, "epoch": 259} {"train_loss": -32.71755599975586, "global_step": 31345, "epoch": 259} {"train_loss": -32.78139877319336, "global_step": 31346, "epoch": 259} {"train_loss": -32.89591598510742, "global_step": 31347, "epoch": 259} {"train_loss": -33.06535720825195, "global_step": 31348, "epoch": 259} {"train_loss": -32.98212814331055, "global_step": 31349, "epoch": 259} {"train_loss": -32.225425720214844, "global_step": 31350, "epoch": 259} {"train_loss": -30.6688175201416, "global_step": 31351, "epoch": 259} {"train_loss": -31.2662410736084, "global_step": 31352, "epoch": 259} {"train_loss": -33.1090087890625, "global_step": 31353, "epoch": 259} {"train_loss": -31.958234786987305, "global_step": 31354, "epoch": 259} {"train_loss": -30.227460861206055, "global_step": 31355, "epoch": 259} {"train_loss": -32.321807861328125, "global_step": 31356, "epoch": 259} {"train_loss": -33.026180267333984, "global_step": 31357, "epoch": 259} {"train_loss": -32.54069137573242, "global_step": 31358, "epoch": 259} {"train_loss": -32.72825241088867, "global_step": 31359, "epoch": 259} {"train_loss": -33.09370040893555, "global_step": 31360, "epoch": 259} {"train_loss": -32.78328323364258, "global_step": 31361, "epoch": 259} {"train_loss": -32.87532043457031, "global_step": 31362, "epoch": 259} {"train_loss": -32.79814147949219, "global_step": 31363, "epoch": 259} {"train_loss": -33.1176872253418, "global_step": 31364, "epoch": 259} {"train_loss": -33.08831787109375, "global_step": 31365, "epoch": 259} {"train_loss": -33.41913986206055, "global_step": 31366, "epoch": 259} {"train_loss": -33.28839111328125, "global_step": 31367, "epoch": 259} {"train_loss": -33.336280822753906, "global_step": 31368, "epoch": 259} {"train_loss": -33.667625427246094, "global_step": 31369, "epoch": 259} {"train_loss": -33.180721282958984, "global_step": 31370, "epoch": 259} {"train_loss": -32.79362869262695, "global_step": 31371, "epoch": 259} {"train_loss": -33.321773529052734, "global_step": 31372, "epoch": 259} {"train_loss": -32.802398681640625, "global_step": 31373, "epoch": 259} {"train_loss": -33.39504623413086, "global_step": 31374, "epoch": 259} {"train_loss": -33.3060417175293, "global_step": 31375, "epoch": 259} {"train_loss": -31.604236602783203, "global_step": 31376, "epoch": 259} {"train_loss": -32.871395111083984, "global_step": 31377, "epoch": 259} {"train_loss": -33.027706146240234, "global_step": 31378, "epoch": 259} {"train_loss": -33.21308517456055, "global_step": 31379, "epoch": 259} {"train_loss": -32.66460037231445, "global_step": 31380, "epoch": 259} {"train_loss": -31.925434112548828, "global_step": 31381, "epoch": 259} {"train_loss": -33.1613655090332, "global_step": 31382, "epoch": 259} {"train_loss": -32.9210090637207, "global_step": 31383, "epoch": 259} {"train_loss": -31.506351470947266, "global_step": 31384, "epoch": 259} {"train_loss": -29.302541732788086, "global_step": 31385, "epoch": 259} {"train_loss": -27.243000030517578, "global_step": 31386, "epoch": 259} {"train_loss": -22.30792808532715, "global_step": 31387, "epoch": 259} {"train_loss": -15.276649475097656, "global_step": 31388, "epoch": 259} {"train_loss": -27.04782485961914, "global_step": 31389, "epoch": 259} {"train_loss": -30.600866317749023, "global_step": 31390, "epoch": 259} {"train_loss": -26.02039909362793, "global_step": 31391, "epoch": 259} {"train_loss": -31.68659782409668, "global_step": 31392, "epoch": 259} {"train_loss": -29.152576446533203, "global_step": 31393, "epoch": 259} {"train_loss": -31.50527000427246, "global_step": 31394, "epoch": 259} {"train_loss": -31.66941261291504, "global_step": 31395, "epoch": 259} {"train_loss": -30.393461227416992, "global_step": 31396, "epoch": 259} {"train_loss": -31.950571060180664, "global_step": 31397, "epoch": 259} {"train_loss": -32.14992141723633, "global_step": 31398, "epoch": 259} {"train_loss": -31.259906768798828, "global_step": 31399, "epoch": 259} {"train_loss": -31.9761962890625, "global_step": 31400, "epoch": 259} {"train_loss": -32.538665771484375, "global_step": 31401, "epoch": 259} {"train_loss": -31.923980712890625, "global_step": 31402, "epoch": 259} {"train_loss": -31.7308349609375, "global_step": 31403, "epoch": 259} {"train_loss": -32.281490325927734, "global_step": 31404, "epoch": 259} {"train_loss": -32.613834381103516, "global_step": 31405, "epoch": 259} {"train_loss": -32.15024948120117, "global_step": 31406, "epoch": 259} {"train_loss": -31.87152671813965, "global_step": 31407, "epoch": 259} {"train_loss": -31.8512020111084, "global_step": 31408, "epoch": 259} {"train_loss": -32.37689208984375, "global_step": 31409, "epoch": 259} {"train_loss": -31.981786727905273, "global_step": 31410, "epoch": 259} {"train_loss": -32.13849639892578, "global_step": 31411, "epoch": 259} {"train_loss": -32.088294982910156, "global_step": 31412, "epoch": 259} {"train_loss": -32.36837387084961, "global_step": 31413, "epoch": 259} {"train_loss": -32.033782958984375, "global_step": 31414, "epoch": 259} {"train_loss": -32.53347396850586, "global_step": 31415, "epoch": 259} {"train_loss": -32.73612594604492, "global_step": 31416, "epoch": 259} {"train_loss": -32.618995666503906, "global_step": 31417, "epoch": 259} {"train_loss": -32.63581466674805, "global_step": 31418, "epoch": 259} {"train_loss": -32.708126068115234, "global_step": 31419, "epoch": 259} {"train_loss": -32.308528900146484, "global_step": 31420, "epoch": 259} {"train_loss": -32.973854064941406, "global_step": 31421, "epoch": 259} {"train_loss": -32.562042236328125, "global_step": 31422, "epoch": 259} {"train_loss": -32.745479583740234, "global_step": 31423, "epoch": 259} {"train_loss": -32.95523452758789, "global_step": 31424, "epoch": 259} {"train_loss": -32.57157516479492, "global_step": 31425, "epoch": 259} {"train_loss": -32.87490463256836, "global_step": 31426, "epoch": 259} {"train_loss": -32.899330139160156, "global_step": 31427, "epoch": 259} {"train_loss": -32.90255355834961, "global_step": 31428, "epoch": 259} {"train_loss": -33.330970764160156, "global_step": 31429, "epoch": 259} {"train_loss": -32.72811508178711, "global_step": 31430, "epoch": 259} {"train_loss": -33.36997985839844, "global_step": 31431, "epoch": 259} {"train_loss": -33.0010986328125, "global_step": 31432, "epoch": 259} {"train_loss": -32.88990020751953, "global_step": 31433, "epoch": 259} {"train_loss": -32.954986572265625, "global_step": 31434, "epoch": 259} {"train_loss": -32.11378860473633, "global_step": 31435, "epoch": 259} {"train_loss": -32.42745590209961, "global_step": 31436, "epoch": 259} {"train_loss": -32.80310821533203, "global_step": 31437, "epoch": 259} {"train_loss": -32.95563888549805, "global_step": 31438, "epoch": 259} {"train_loss": -33.154449462890625, "global_step": 31439, "epoch": 259} {"train_loss": -33.42914581298828, "global_step": 31440, "epoch": 259} {"train_loss": -32.70068359375, "global_step": 31441, "epoch": 259} {"train_loss": -33.291465759277344, "global_step": 31442, "epoch": 259} {"train_loss": -32.88847732543945, "global_step": 31443, "epoch": 259} {"train_loss": -32.292877197265625, "global_step": 31444, "epoch": 259} {"train_loss": -32.9936637878418, "global_step": 31445, "epoch": 259} {"train_loss": -33.12582778930664, "global_step": 31446, "epoch": 259} {"train_loss": -33.04488754272461, "global_step": 31447, "epoch": 259} {"train_loss": -32.93693923950195, "global_step": 31448, "epoch": 259} {"train_loss": -32.20546340942383, "global_step": 31449, "epoch": 259} {"train_loss": -29.337568283081055, "global_step": 31450, "epoch": 259} {"train_loss": -28.637451171875, "global_step": 31451, "epoch": 259} {"train_loss": -30.721654891967773, "global_step": 31452, "epoch": 259} {"train_loss": -32.4122428894043, "global_step": 31453, "epoch": 259} {"train_loss": -32.24666976928711, "global_step": 31454, "epoch": 259} {"train_loss": -29.486587524414062, "global_step": 31455, "epoch": 259} {"train_loss": -30.054418563842773, "global_step": 31456, "epoch": 259} {"train_loss": -31.562503814697266, "global_step": 31457, "epoch": 259} {"train_loss": -32.00979232788086, "global_step": 31458, "epoch": 259} {"train_loss": -31.979908604267216, "global_step": 31459, "epoch": 259, "val_loss": 2559615.0} {"train_loss": -31.651586532592773, "global_step": 31460, "epoch": 260} {"train_loss": -32.21364974975586, "global_step": 31461, "epoch": 260} {"train_loss": -30.9527530670166, "global_step": 31462, "epoch": 260} {"train_loss": -31.997516632080078, "global_step": 31463, "epoch": 260} {"train_loss": -30.466657638549805, "global_step": 31464, "epoch": 260} {"train_loss": -31.593191146850586, "global_step": 31465, "epoch": 260} {"train_loss": -31.610706329345703, "global_step": 31466, "epoch": 260} {"train_loss": -30.27837562561035, "global_step": 31467, "epoch": 260} {"train_loss": -31.93768310546875, "global_step": 31468, "epoch": 260} {"train_loss": -30.630985260009766, "global_step": 31469, "epoch": 260} {"train_loss": -30.757970809936523, "global_step": 31470, "epoch": 260} {"train_loss": -31.790781021118164, "global_step": 31471, "epoch": 260} {"train_loss": -31.906652450561523, "global_step": 31472, "epoch": 260} {"train_loss": -30.530019760131836, "global_step": 31473, "epoch": 260} {"train_loss": -31.720489501953125, "global_step": 31474, "epoch": 260} {"train_loss": -31.088886260986328, "global_step": 31475, "epoch": 260} {"train_loss": -32.1589241027832, "global_step": 31476, "epoch": 260} {"train_loss": -31.9672794342041, "global_step": 31477, "epoch": 260} {"train_loss": -32.05440902709961, "global_step": 31478, "epoch": 260} {"train_loss": -32.169715881347656, "global_step": 31479, "epoch": 260} {"train_loss": -31.845550537109375, "global_step": 31480, "epoch": 260} {"train_loss": -32.64777755737305, "global_step": 31481, "epoch": 260} {"train_loss": -31.80250358581543, "global_step": 31482, "epoch": 260} {"train_loss": -32.10000991821289, "global_step": 31483, "epoch": 260} {"train_loss": -32.16592025756836, "global_step": 31484, "epoch": 260} {"train_loss": -32.586334228515625, "global_step": 31485, "epoch": 260} {"train_loss": -31.8863468170166, "global_step": 31486, "epoch": 260} {"train_loss": -30.068103790283203, "global_step": 31487, "epoch": 260} {"train_loss": -30.827686309814453, "global_step": 31488, "epoch": 260} {"train_loss": -31.25967788696289, "global_step": 31489, "epoch": 260} {"train_loss": -32.7030029296875, "global_step": 31490, "epoch": 260} {"train_loss": -32.413631439208984, "global_step": 31491, "epoch": 260} {"train_loss": -32.53921127319336, "global_step": 31492, "epoch": 260} {"train_loss": -32.36211395263672, "global_step": 31493, "epoch": 260} {"train_loss": -32.791561126708984, "global_step": 31494, "epoch": 260} {"train_loss": -32.135528564453125, "global_step": 31495, "epoch": 260} {"train_loss": -31.839630126953125, "global_step": 31496, "epoch": 260} {"train_loss": -32.64728546142578, "global_step": 31497, "epoch": 260} {"train_loss": -32.40727615356445, "global_step": 31498, "epoch": 260} {"train_loss": -32.7701530456543, "global_step": 31499, "epoch": 260} {"train_loss": -33.101112365722656, "global_step": 31500, "epoch": 260} {"train_loss": -32.6223258972168, "global_step": 31501, "epoch": 260} {"train_loss": -33.226585388183594, "global_step": 31502, "epoch": 260} {"train_loss": -32.271427154541016, "global_step": 31503, "epoch": 260} {"train_loss": -32.70338821411133, "global_step": 31504, "epoch": 260} {"train_loss": -32.060325622558594, "global_step": 31505, "epoch": 260} {"train_loss": -32.74619674682617, "global_step": 31506, "epoch": 260} {"train_loss": -32.21281814575195, "global_step": 31507, "epoch": 260} {"train_loss": -32.01338577270508, "global_step": 31508, "epoch": 260} {"train_loss": -32.34138870239258, "global_step": 31509, "epoch": 260} {"train_loss": -32.33539581298828, "global_step": 31510, "epoch": 260} {"train_loss": -31.616056442260742, "global_step": 31511, "epoch": 260} {"train_loss": -32.18791580200195, "global_step": 31512, "epoch": 260} {"train_loss": -31.920520782470703, "global_step": 31513, "epoch": 260} {"train_loss": -32.47257614135742, "global_step": 31514, "epoch": 260} {"train_loss": -32.38151931762695, "global_step": 31515, "epoch": 260} {"train_loss": -32.09492874145508, "global_step": 31516, "epoch": 260} {"train_loss": -32.28236770629883, "global_step": 31517, "epoch": 260} {"train_loss": -32.64387130737305, "global_step": 31518, "epoch": 260} {"train_loss": -32.303802490234375, "global_step": 31519, "epoch": 260} {"train_loss": -32.48078155517578, "global_step": 31520, "epoch": 260} {"train_loss": -32.63753128051758, "global_step": 31521, "epoch": 260} {"train_loss": -32.17048263549805, "global_step": 31522, "epoch": 260} {"train_loss": -33.021461486816406, "global_step": 31523, "epoch": 260} {"train_loss": -32.59733581542969, "global_step": 31524, "epoch": 260} {"train_loss": -32.29291534423828, "global_step": 31525, "epoch": 260} {"train_loss": -32.932674407958984, "global_step": 31526, "epoch": 260} {"train_loss": -33.07019805908203, "global_step": 31527, "epoch": 260} {"train_loss": -33.32258224487305, "global_step": 31528, "epoch": 260} {"train_loss": -33.27000045776367, "global_step": 31529, "epoch": 260} {"train_loss": -33.24144744873047, "global_step": 31530, "epoch": 260} {"train_loss": -32.40956115722656, "global_step": 31531, "epoch": 260} {"train_loss": -33.46906280517578, "global_step": 31532, "epoch": 260} {"train_loss": -33.11117172241211, "global_step": 31533, "epoch": 260} {"train_loss": -33.12928009033203, "global_step": 31534, "epoch": 260} {"train_loss": -33.124446868896484, "global_step": 31535, "epoch": 260} {"train_loss": -33.112510681152344, "global_step": 31536, "epoch": 260} {"train_loss": -33.12371826171875, "global_step": 31537, "epoch": 260} {"train_loss": -32.506954193115234, "global_step": 31538, "epoch": 260} {"train_loss": -32.84470748901367, "global_step": 31539, "epoch": 260} {"train_loss": -31.524316787719727, "global_step": 31540, "epoch": 260} {"train_loss": -31.145313262939453, "global_step": 31541, "epoch": 260} {"train_loss": -27.003681182861328, "global_step": 31542, "epoch": 260} {"train_loss": -20.719083786010742, "global_step": 31543, "epoch": 260} {"train_loss": -12.88450813293457, "global_step": 31544, "epoch": 260} {"train_loss": -28.0584774017334, "global_step": 31545, "epoch": 260} {"train_loss": -25.840240478515625, "global_step": 31546, "epoch": 260} {"train_loss": -26.449554443359375, "global_step": 31547, "epoch": 260} {"train_loss": -25.606122970581055, "global_step": 31548, "epoch": 260} {"train_loss": -29.866147994995117, "global_step": 31549, "epoch": 260} {"train_loss": -26.556577682495117, "global_step": 31550, "epoch": 260} {"train_loss": -31.133081436157227, "global_step": 31551, "epoch": 260} {"train_loss": -30.817672729492188, "global_step": 31552, "epoch": 260} {"train_loss": -28.47344970703125, "global_step": 31553, "epoch": 260} {"train_loss": -29.42804527282715, "global_step": 31554, "epoch": 260} {"train_loss": -31.03497314453125, "global_step": 31555, "epoch": 260} {"train_loss": -30.50249671936035, "global_step": 31556, "epoch": 260} {"train_loss": -30.224964141845703, "global_step": 31557, "epoch": 260} {"train_loss": -27.424365997314453, "global_step": 31558, "epoch": 260} {"train_loss": -31.44211196899414, "global_step": 31559, "epoch": 260} {"train_loss": -30.455087661743164, "global_step": 31560, "epoch": 260} {"train_loss": -29.9160099029541, "global_step": 31561, "epoch": 260} {"train_loss": -30.709638595581055, "global_step": 31562, "epoch": 260} {"train_loss": -30.707685470581055, "global_step": 31563, "epoch": 260} {"train_loss": -31.14054298400879, "global_step": 31564, "epoch": 260} {"train_loss": -30.666370391845703, "global_step": 31565, "epoch": 260} {"train_loss": -30.948272705078125, "global_step": 31566, "epoch": 260} {"train_loss": -31.524152755737305, "global_step": 31567, "epoch": 260} {"train_loss": -30.88762855529785, "global_step": 31568, "epoch": 260} {"train_loss": -31.064029693603516, "global_step": 31569, "epoch": 260} {"train_loss": -31.654958724975586, "global_step": 31570, "epoch": 260} {"train_loss": -31.4267520904541, "global_step": 31571, "epoch": 260} {"train_loss": -30.907453536987305, "global_step": 31572, "epoch": 260} {"train_loss": -31.531381607055664, "global_step": 31573, "epoch": 260} {"train_loss": -31.16695213317871, "global_step": 31574, "epoch": 260} {"train_loss": -31.773334503173828, "global_step": 31575, "epoch": 260} {"train_loss": -31.86066246032715, "global_step": 31576, "epoch": 260} {"train_loss": -30.898666381835938, "global_step": 31577, "epoch": 260} {"train_loss": -31.44366455078125, "global_step": 31578, "epoch": 260} {"train_loss": -31.934045791625977, "global_step": 31579, "epoch": 260} {"train_loss": -31.2968154938753, "global_step": 31580, "epoch": 260, "val_loss": 2302635.75} {"train_loss": -32.15320587158203, "global_step": 31581, "epoch": 261} {"train_loss": -32.05170822143555, "global_step": 31582, "epoch": 261} {"train_loss": -32.22449493408203, "global_step": 31583, "epoch": 261} {"train_loss": -32.13301467895508, "global_step": 31584, "epoch": 261} {"train_loss": -32.1202278137207, "global_step": 31585, "epoch": 261} {"train_loss": -32.25906753540039, "global_step": 31586, "epoch": 261} {"train_loss": -32.09334945678711, "global_step": 31587, "epoch": 261} {"train_loss": -32.39785385131836, "global_step": 31588, "epoch": 261} {"train_loss": -32.26953125, "global_step": 31589, "epoch": 261} {"train_loss": -32.565643310546875, "global_step": 31590, "epoch": 261} {"train_loss": -32.72780990600586, "global_step": 31591, "epoch": 261} {"train_loss": -32.84756088256836, "global_step": 31592, "epoch": 261} {"train_loss": -32.592891693115234, "global_step": 31593, "epoch": 261} {"train_loss": -32.413299560546875, "global_step": 31594, "epoch": 261} {"train_loss": -32.851558685302734, "global_step": 31595, "epoch": 261} {"train_loss": -32.81364822387695, "global_step": 31596, "epoch": 261} {"train_loss": -32.45589065551758, "global_step": 31597, "epoch": 261} {"train_loss": -32.633602142333984, "global_step": 31598, "epoch": 261} {"train_loss": -32.9692497253418, "global_step": 31599, "epoch": 261} {"train_loss": -32.6268424987793, "global_step": 31600, "epoch": 261} {"train_loss": -32.73991012573242, "global_step": 31601, "epoch": 261} {"train_loss": -33.05568313598633, "global_step": 31602, "epoch": 261} {"train_loss": -32.543914794921875, "global_step": 31603, "epoch": 261} {"train_loss": -32.83209991455078, "global_step": 31604, "epoch": 261} {"train_loss": -32.37241744995117, "global_step": 31605, "epoch": 261} {"train_loss": -31.016998291015625, "global_step": 31606, "epoch": 261} {"train_loss": -32.7806282043457, "global_step": 31607, "epoch": 261} {"train_loss": -30.571125030517578, "global_step": 31608, "epoch": 261} {"train_loss": -30.673816680908203, "global_step": 31609, "epoch": 261} {"train_loss": -26.403966903686523, "global_step": 31610, "epoch": 261} {"train_loss": -25.23402976989746, "global_step": 31611, "epoch": 261} {"train_loss": -23.394561767578125, "global_step": 31612, "epoch": 261} {"train_loss": -28.73274803161621, "global_step": 31613, "epoch": 261} {"train_loss": -30.5577392578125, "global_step": 31614, "epoch": 261} {"train_loss": -31.098508834838867, "global_step": 31615, "epoch": 261} {"train_loss": -30.285785675048828, "global_step": 31616, "epoch": 261} {"train_loss": -31.257080078125, "global_step": 31617, "epoch": 261} {"train_loss": -31.391876220703125, "global_step": 31618, "epoch": 261} {"train_loss": -32.314056396484375, "global_step": 31619, "epoch": 261} {"train_loss": -31.034305572509766, "global_step": 31620, "epoch": 261} {"train_loss": -31.592687606811523, "global_step": 31621, "epoch": 261} {"train_loss": -30.990386962890625, "global_step": 31622, "epoch": 261} {"train_loss": -30.435678482055664, "global_step": 31623, "epoch": 261} {"train_loss": -32.06851577758789, "global_step": 31624, "epoch": 261} {"train_loss": -31.32929801940918, "global_step": 31625, "epoch": 261} {"train_loss": -31.711095809936523, "global_step": 31626, "epoch": 261} {"train_loss": -30.66851234436035, "global_step": 31627, "epoch": 261} {"train_loss": -31.128803253173828, "global_step": 31628, "epoch": 261} {"train_loss": -31.745473861694336, "global_step": 31629, "epoch": 261} {"train_loss": -31.613544464111328, "global_step": 31630, "epoch": 261} {"train_loss": -32.22257614135742, "global_step": 31631, "epoch": 261} {"train_loss": -31.409015655517578, "global_step": 31632, "epoch": 261} {"train_loss": -32.175025939941406, "global_step": 31633, "epoch": 261} {"train_loss": -32.09688949584961, "global_step": 31634, "epoch": 261} {"train_loss": -32.3115348815918, "global_step": 31635, "epoch": 261} {"train_loss": -32.25566482543945, "global_step": 31636, "epoch": 261} {"train_loss": -31.8448486328125, "global_step": 31637, "epoch": 261} {"train_loss": -32.191314697265625, "global_step": 31638, "epoch": 261} {"train_loss": -31.90372085571289, "global_step": 31639, "epoch": 261} {"train_loss": -32.40916061401367, "global_step": 31640, "epoch": 261} {"train_loss": -32.407806396484375, "global_step": 31641, "epoch": 261} {"train_loss": -32.292171478271484, "global_step": 31642, "epoch": 261} {"train_loss": -32.602691650390625, "global_step": 31643, "epoch": 261} {"train_loss": -32.61033248901367, "global_step": 31644, "epoch": 261} {"train_loss": -32.457252502441406, "global_step": 31645, "epoch": 261} {"train_loss": -32.441917419433594, "global_step": 31646, "epoch": 261} {"train_loss": -31.26774024963379, "global_step": 31647, "epoch": 261} {"train_loss": -32.242835998535156, "global_step": 31648, "epoch": 261} {"train_loss": -31.64499855041504, "global_step": 31649, "epoch": 261} {"train_loss": -26.32256507873535, "global_step": 31650, "epoch": 261} {"train_loss": -14.111726760864258, "global_step": 31651, "epoch": 261} {"train_loss": 4.732314586639404, "global_step": 31652, "epoch": 261} {"train_loss": -12.223099708557129, "global_step": 31653, "epoch": 261} {"train_loss": -27.921558380126953, "global_step": 31654, "epoch": 261} {"train_loss": -14.656608581542969, "global_step": 31655, "epoch": 261} {"train_loss": -29.222166061401367, "global_step": 31656, "epoch": 261} {"train_loss": -27.02042007446289, "global_step": 31657, "epoch": 261} {"train_loss": -23.457834243774414, "global_step": 31658, "epoch": 261} {"train_loss": -30.451196670532227, "global_step": 31659, "epoch": 261} {"train_loss": -30.6373348236084, "global_step": 31660, "epoch": 261} {"train_loss": -27.385114669799805, "global_step": 31661, "epoch": 261} {"train_loss": -28.872882843017578, "global_step": 31662, "epoch": 261} {"train_loss": -30.6049747467041, "global_step": 31663, "epoch": 261} {"train_loss": -31.6728458404541, "global_step": 31664, "epoch": 261} {"train_loss": -31.20770835876465, "global_step": 31665, "epoch": 261} {"train_loss": -30.07846450805664, "global_step": 31666, "epoch": 261} {"train_loss": -30.227506637573242, "global_step": 31667, "epoch": 261} {"train_loss": -30.3865966796875, "global_step": 31668, "epoch": 261} {"train_loss": -30.51189613342285, "global_step": 31669, "epoch": 261} {"train_loss": -30.126483917236328, "global_step": 31670, "epoch": 261} {"train_loss": -31.3365421295166, "global_step": 31671, "epoch": 261} {"train_loss": -30.720258712768555, "global_step": 31672, "epoch": 261} {"train_loss": -31.1191349029541, "global_step": 31673, "epoch": 261} {"train_loss": -30.5039005279541, "global_step": 31674, "epoch": 261} {"train_loss": -30.861963272094727, "global_step": 31675, "epoch": 261} {"train_loss": -31.06705093383789, "global_step": 31676, "epoch": 261} {"train_loss": -31.276159286499023, "global_step": 31677, "epoch": 261} {"train_loss": -31.501813888549805, "global_step": 31678, "epoch": 261} {"train_loss": -31.36066246032715, "global_step": 31679, "epoch": 261} {"train_loss": -31.16353416442871, "global_step": 31680, "epoch": 261} {"train_loss": -31.003244400024414, "global_step": 31681, "epoch": 261} {"train_loss": -31.634153366088867, "global_step": 31682, "epoch": 261} {"train_loss": -30.507551193237305, "global_step": 31683, "epoch": 261} {"train_loss": -31.201208114624023, "global_step": 31684, "epoch": 261} {"train_loss": -31.122241973876953, "global_step": 31685, "epoch": 261} {"train_loss": -31.891340255737305, "global_step": 31686, "epoch": 261} {"train_loss": -31.81524085998535, "global_step": 31687, "epoch": 261} {"train_loss": -31.500635147094727, "global_step": 31688, "epoch": 261} {"train_loss": -31.87965202331543, "global_step": 31689, "epoch": 261} {"train_loss": -31.462995529174805, "global_step": 31690, "epoch": 261} {"train_loss": -31.893299102783203, "global_step": 31691, "epoch": 261} {"train_loss": -31.54960060119629, "global_step": 31692, "epoch": 261} {"train_loss": -32.009803771972656, "global_step": 31693, "epoch": 261} {"train_loss": -31.649494171142578, "global_step": 31694, "epoch": 261} {"train_loss": -31.631092071533203, "global_step": 31695, "epoch": 261} {"train_loss": -32.17829513549805, "global_step": 31696, "epoch": 261} {"train_loss": -31.69196891784668, "global_step": 31697, "epoch": 261} {"train_loss": -31.946928024291992, "global_step": 31698, "epoch": 261} {"train_loss": -31.641300201416016, "global_step": 31699, "epoch": 261} {"train_loss": -31.73196792602539, "global_step": 31700, "epoch": 261} {"train_loss": -30.49598119672665, "global_step": 31701, "epoch": 261, "val_loss": 2514369.75} {"train_loss": -31.68153953552246, "global_step": 31702, "epoch": 262} {"train_loss": -31.806055068969727, "global_step": 31703, "epoch": 262} {"train_loss": -31.840314865112305, "global_step": 31704, "epoch": 262} {"train_loss": -32.03447723388672, "global_step": 31705, "epoch": 262} {"train_loss": -31.773595809936523, "global_step": 31706, "epoch": 262} {"train_loss": -32.13682174682617, "global_step": 31707, "epoch": 262} {"train_loss": -31.504079818725586, "global_step": 31708, "epoch": 262} {"train_loss": -31.652481079101562, "global_step": 31709, "epoch": 262} {"train_loss": -32.27061080932617, "global_step": 31710, "epoch": 262} {"train_loss": -31.468809127807617, "global_step": 31711, "epoch": 262} {"train_loss": -32.0609016418457, "global_step": 31712, "epoch": 262} {"train_loss": -31.851465225219727, "global_step": 31713, "epoch": 262} {"train_loss": -31.42276954650879, "global_step": 31714, "epoch": 262} {"train_loss": -31.889978408813477, "global_step": 31715, "epoch": 262} {"train_loss": -32.14191436767578, "global_step": 31716, "epoch": 262} {"train_loss": -31.326879501342773, "global_step": 31717, "epoch": 262} {"train_loss": -32.036842346191406, "global_step": 31718, "epoch": 262} {"train_loss": -31.542083740234375, "global_step": 31719, "epoch": 262} {"train_loss": -31.947290420532227, "global_step": 31720, "epoch": 262} {"train_loss": -32.04641342163086, "global_step": 31721, "epoch": 262} {"train_loss": -32.50027084350586, "global_step": 31722, "epoch": 262} {"train_loss": -32.270263671875, "global_step": 31723, "epoch": 262} {"train_loss": -32.00776290893555, "global_step": 31724, "epoch": 262} {"train_loss": -31.582868576049805, "global_step": 31725, "epoch": 262} {"train_loss": -31.86309242248535, "global_step": 31726, "epoch": 262} {"train_loss": -32.40675735473633, "global_step": 31727, "epoch": 262} {"train_loss": -32.324134826660156, "global_step": 31728, "epoch": 262} {"train_loss": -32.338279724121094, "global_step": 31729, "epoch": 262} {"train_loss": -32.090667724609375, "global_step": 31730, "epoch": 262} {"train_loss": -31.669239044189453, "global_step": 31731, "epoch": 262} {"train_loss": -31.90266990661621, "global_step": 31732, "epoch": 262} {"train_loss": -31.718984603881836, "global_step": 31733, "epoch": 262} {"train_loss": -31.59650230407715, "global_step": 31734, "epoch": 262} {"train_loss": -32.122589111328125, "global_step": 31735, "epoch": 262} {"train_loss": -31.704425811767578, "global_step": 31736, "epoch": 262} {"train_loss": -32.279293060302734, "global_step": 31737, "epoch": 262} {"train_loss": -31.76958656311035, "global_step": 31738, "epoch": 262} {"train_loss": -32.45416259765625, "global_step": 31739, "epoch": 262} {"train_loss": -31.489429473876953, "global_step": 31740, "epoch": 262} {"train_loss": -30.837270736694336, "global_step": 31741, "epoch": 262} {"train_loss": -31.642139434814453, "global_step": 31742, "epoch": 262} {"train_loss": -31.524946212768555, "global_step": 31743, "epoch": 262} {"train_loss": -31.37555503845215, "global_step": 31744, "epoch": 262} {"train_loss": -31.709287643432617, "global_step": 31745, "epoch": 262} {"train_loss": -30.96461296081543, "global_step": 31746, "epoch": 262} {"train_loss": -31.191625595092773, "global_step": 31747, "epoch": 262} {"train_loss": -31.659900665283203, "global_step": 31748, "epoch": 262} {"train_loss": -28.673315048217773, "global_step": 31749, "epoch": 262} {"train_loss": -30.467016220092773, "global_step": 31750, "epoch": 262} {"train_loss": -31.352216720581055, "global_step": 31751, "epoch": 262} {"train_loss": -30.99346923828125, "global_step": 31752, "epoch": 262} {"train_loss": -30.200336456298828, "global_step": 31753, "epoch": 262} {"train_loss": -30.65144157409668, "global_step": 31754, "epoch": 262} {"train_loss": -30.093175888061523, "global_step": 31755, "epoch": 262} {"train_loss": -30.204980850219727, "global_step": 31756, "epoch": 262} {"train_loss": -31.463727951049805, "global_step": 31757, "epoch": 262} {"train_loss": -30.4561767578125, "global_step": 31758, "epoch": 262} {"train_loss": -30.868854522705078, "global_step": 31759, "epoch": 262} {"train_loss": -31.06680679321289, "global_step": 31760, "epoch": 262} {"train_loss": -30.6278018951416, "global_step": 31761, "epoch": 262} {"train_loss": -31.05853843688965, "global_step": 31762, "epoch": 262} {"train_loss": -30.897308349609375, "global_step": 31763, "epoch": 262} {"train_loss": -30.50300407409668, "global_step": 31764, "epoch": 262} {"train_loss": -31.58916664123535, "global_step": 31765, "epoch": 262} {"train_loss": -30.836698532104492, "global_step": 31766, "epoch": 262} {"train_loss": -31.122589111328125, "global_step": 31767, "epoch": 262} {"train_loss": -31.735443115234375, "global_step": 31768, "epoch": 262} {"train_loss": -30.81195068359375, "global_step": 31769, "epoch": 262} {"train_loss": -31.090106964111328, "global_step": 31770, "epoch": 262} {"train_loss": -31.529916763305664, "global_step": 31771, "epoch": 262} {"train_loss": -31.500532150268555, "global_step": 31772, "epoch": 262} {"train_loss": -27.57391357421875, "global_step": 31773, "epoch": 262} {"train_loss": -31.32562828063965, "global_step": 31774, "epoch": 262} {"train_loss": -31.702911376953125, "global_step": 31775, "epoch": 262} {"train_loss": -31.28053092956543, "global_step": 31776, "epoch": 262} {"train_loss": -31.344806671142578, "global_step": 31777, "epoch": 262} {"train_loss": -31.305761337280273, "global_step": 31778, "epoch": 262} {"train_loss": -32.12369918823242, "global_step": 31779, "epoch": 262} {"train_loss": -31.837003707885742, "global_step": 31780, "epoch": 262} {"train_loss": -32.11220932006836, "global_step": 31781, "epoch": 262} {"train_loss": -31.797866821289062, "global_step": 31782, "epoch": 262} {"train_loss": -31.842193603515625, "global_step": 31783, "epoch": 262} {"train_loss": -31.499744415283203, "global_step": 31784, "epoch": 262} {"train_loss": -31.439977645874023, "global_step": 31785, "epoch": 262} {"train_loss": -32.009090423583984, "global_step": 31786, "epoch": 262} {"train_loss": -32.06205368041992, "global_step": 31787, "epoch": 262} {"train_loss": -31.939361572265625, "global_step": 31788, "epoch": 262} {"train_loss": -31.80792808532715, "global_step": 31789, "epoch": 262} {"train_loss": -32.23845291137695, "global_step": 31790, "epoch": 262} {"train_loss": -32.20925521850586, "global_step": 31791, "epoch": 262} {"train_loss": -32.654354095458984, "global_step": 31792, "epoch": 262} {"train_loss": -32.21718215942383, "global_step": 31793, "epoch": 262} {"train_loss": -32.72579574584961, "global_step": 31794, "epoch": 262} {"train_loss": -32.21883773803711, "global_step": 31795, "epoch": 262} {"train_loss": -31.78940773010254, "global_step": 31796, "epoch": 262} {"train_loss": -32.83232498168945, "global_step": 31797, "epoch": 262} {"train_loss": -32.71893310546875, "global_step": 31798, "epoch": 262} {"train_loss": -32.514495849609375, "global_step": 31799, "epoch": 262} {"train_loss": -32.51782989501953, "global_step": 31800, "epoch": 262} {"train_loss": -32.91746139526367, "global_step": 31801, "epoch": 262} {"train_loss": -32.51780700683594, "global_step": 31802, "epoch": 262} {"train_loss": -32.763980865478516, "global_step": 31803, "epoch": 262} {"train_loss": -32.51227569580078, "global_step": 31804, "epoch": 262} {"train_loss": -32.324676513671875, "global_step": 31805, "epoch": 262} {"train_loss": -30.60914421081543, "global_step": 31806, "epoch": 262} {"train_loss": -22.713350296020508, "global_step": 31807, "epoch": 262} {"train_loss": -10.552133560180664, "global_step": 31808, "epoch": 262} {"train_loss": -7.571322917938232, "global_step": 31809, "epoch": 262} {"train_loss": -29.530858993530273, "global_step": 31810, "epoch": 262} {"train_loss": -19.993406295776367, "global_step": 31811, "epoch": 262} {"train_loss": -23.03352928161621, "global_step": 31812, "epoch": 262} {"train_loss": -26.301177978515625, "global_step": 31813, "epoch": 262} {"train_loss": -30.035932540893555, "global_step": 31814, "epoch": 262} {"train_loss": -26.359909057617188, "global_step": 31815, "epoch": 262} {"train_loss": -30.501779556274414, "global_step": 31816, "epoch": 262} {"train_loss": -30.11041831970215, "global_step": 31817, "epoch": 262} {"train_loss": -28.59580421447754, "global_step": 31818, "epoch": 262} {"train_loss": -30.06166648864746, "global_step": 31819, "epoch": 262} {"train_loss": -30.480762481689453, "global_step": 31820, "epoch": 262} {"train_loss": -30.316802978515625, "global_step": 31821, "epoch": 262} {"train_loss": -30.797762669807625, "global_step": 31822, "epoch": 262, "val_loss": 2650469.25} {"train_loss": -30.289722442626953, "global_step": 31823, "epoch": 263} {"train_loss": -30.78700828552246, "global_step": 31824, "epoch": 263} {"train_loss": -30.60898780822754, "global_step": 31825, "epoch": 263} {"train_loss": -30.714826583862305, "global_step": 31826, "epoch": 263} {"train_loss": -30.396726608276367, "global_step": 31827, "epoch": 263} {"train_loss": -31.100879669189453, "global_step": 31828, "epoch": 263} {"train_loss": -30.768218994140625, "global_step": 31829, "epoch": 263} {"train_loss": -31.251556396484375, "global_step": 31830, "epoch": 263} {"train_loss": -31.318273544311523, "global_step": 31831, "epoch": 263} {"train_loss": -31.38239097595215, "global_step": 31832, "epoch": 263} {"train_loss": -30.9054012298584, "global_step": 31833, "epoch": 263} {"train_loss": -31.495319366455078, "global_step": 31834, "epoch": 263} {"train_loss": -31.622766494750977, "global_step": 31835, "epoch": 263} {"train_loss": -31.91708755493164, "global_step": 31836, "epoch": 263} {"train_loss": -31.6613712310791, "global_step": 31837, "epoch": 263} {"train_loss": -31.437971115112305, "global_step": 31838, "epoch": 263} {"train_loss": -31.757410049438477, "global_step": 31839, "epoch": 263} {"train_loss": -31.688491821289062, "global_step": 31840, "epoch": 263} {"train_loss": -31.924686431884766, "global_step": 31841, "epoch": 263} {"train_loss": -31.88368034362793, "global_step": 31842, "epoch": 263} {"train_loss": -31.47443199157715, "global_step": 31843, "epoch": 263} {"train_loss": -32.414371490478516, "global_step": 31844, "epoch": 263} {"train_loss": -32.07896041870117, "global_step": 31845, "epoch": 263} {"train_loss": -32.166255950927734, "global_step": 31846, "epoch": 263} {"train_loss": -32.262779235839844, "global_step": 31847, "epoch": 263} {"train_loss": -32.111202239990234, "global_step": 31848, "epoch": 263} {"train_loss": -32.00907897949219, "global_step": 31849, "epoch": 263} {"train_loss": -32.409515380859375, "global_step": 31850, "epoch": 263} {"train_loss": -32.14336013793945, "global_step": 31851, "epoch": 263} {"train_loss": -32.29514694213867, "global_step": 31852, "epoch": 263} {"train_loss": -32.43418502807617, "global_step": 31853, "epoch": 263} {"train_loss": -32.119258880615234, "global_step": 31854, "epoch": 263} {"train_loss": -32.256248474121094, "global_step": 31855, "epoch": 263} {"train_loss": -32.399261474609375, "global_step": 31856, "epoch": 263} {"train_loss": -32.6238899230957, "global_step": 31857, "epoch": 263} {"train_loss": -32.42515182495117, "global_step": 31858, "epoch": 263} {"train_loss": -32.30591583251953, "global_step": 31859, "epoch": 263} {"train_loss": -32.554718017578125, "global_step": 31860, "epoch": 263} {"train_loss": -32.43100357055664, "global_step": 31861, "epoch": 263} {"train_loss": -32.62372970581055, "global_step": 31862, "epoch": 263} {"train_loss": -32.301979064941406, "global_step": 31863, "epoch": 263} {"train_loss": -32.562923431396484, "global_step": 31864, "epoch": 263} {"train_loss": -32.605743408203125, "global_step": 31865, "epoch": 263} {"train_loss": -32.20969009399414, "global_step": 31866, "epoch": 263} {"train_loss": -32.042659759521484, "global_step": 31867, "epoch": 263} {"train_loss": -32.182674407958984, "global_step": 31868, "epoch": 263} {"train_loss": -32.22207260131836, "global_step": 31869, "epoch": 263} {"train_loss": -32.77763748168945, "global_step": 31870, "epoch": 263} {"train_loss": -31.319751739501953, "global_step": 31871, "epoch": 263} {"train_loss": -29.532550811767578, "global_step": 31872, "epoch": 263} {"train_loss": -26.781421661376953, "global_step": 31873, "epoch": 263} {"train_loss": -27.1878604888916, "global_step": 31874, "epoch": 263} {"train_loss": -31.20953941345215, "global_step": 31875, "epoch": 263} {"train_loss": -31.619958877563477, "global_step": 31876, "epoch": 263} {"train_loss": -31.195343017578125, "global_step": 31877, "epoch": 263} {"train_loss": -31.672626495361328, "global_step": 31878, "epoch": 263} {"train_loss": -30.628576278686523, "global_step": 31879, "epoch": 263} {"train_loss": -30.032018661499023, "global_step": 31880, "epoch": 263} {"train_loss": -32.22285842895508, "global_step": 31881, "epoch": 263} {"train_loss": -30.708667755126953, "global_step": 31882, "epoch": 263} {"train_loss": -31.26267433166504, "global_step": 31883, "epoch": 263} {"train_loss": -30.551122665405273, "global_step": 31884, "epoch": 263} {"train_loss": -32.28935623168945, "global_step": 31885, "epoch": 263} {"train_loss": -30.7847843170166, "global_step": 31886, "epoch": 263} {"train_loss": -31.520252227783203, "global_step": 31887, "epoch": 263} {"train_loss": -31.212675094604492, "global_step": 31888, "epoch": 263} {"train_loss": -31.8546085357666, "global_step": 31889, "epoch": 263} {"train_loss": -31.6760311126709, "global_step": 31890, "epoch": 263} {"train_loss": -32.33513259887695, "global_step": 31891, "epoch": 263} {"train_loss": -31.4907169342041, "global_step": 31892, "epoch": 263} {"train_loss": -31.925430297851562, "global_step": 31893, "epoch": 263} {"train_loss": -31.453754425048828, "global_step": 31894, "epoch": 263} {"train_loss": -31.016143798828125, "global_step": 31895, "epoch": 263} {"train_loss": -31.796478271484375, "global_step": 31896, "epoch": 263} {"train_loss": -30.247955322265625, "global_step": 31897, "epoch": 263} {"train_loss": -32.056392669677734, "global_step": 31898, "epoch": 263} {"train_loss": -31.43305778503418, "global_step": 31899, "epoch": 263} {"train_loss": -31.636869430541992, "global_step": 31900, "epoch": 263} {"train_loss": -31.499853134155273, "global_step": 31901, "epoch": 263} {"train_loss": -31.417163848876953, "global_step": 31902, "epoch": 263} {"train_loss": -32.20485305786133, "global_step": 31903, "epoch": 263} {"train_loss": -31.12662696838379, "global_step": 31904, "epoch": 263} {"train_loss": -31.98211097717285, "global_step": 31905, "epoch": 263} {"train_loss": -32.20682907104492, "global_step": 31906, "epoch": 263} {"train_loss": -32.08650588989258, "global_step": 31907, "epoch": 263} {"train_loss": -31.63742446899414, "global_step": 31908, "epoch": 263} {"train_loss": -31.8360538482666, "global_step": 31909, "epoch": 263} {"train_loss": -31.653827667236328, "global_step": 31910, "epoch": 263} {"train_loss": -31.9610595703125, "global_step": 31911, "epoch": 263} {"train_loss": -32.141204833984375, "global_step": 31912, "epoch": 263} {"train_loss": -32.033363342285156, "global_step": 31913, "epoch": 263} {"train_loss": -32.02676010131836, "global_step": 31914, "epoch": 263} {"train_loss": -31.39166259765625, "global_step": 31915, "epoch": 263} {"train_loss": -32.49508285522461, "global_step": 31916, "epoch": 263} {"train_loss": -31.937469482421875, "global_step": 31917, "epoch": 263} {"train_loss": -31.93295669555664, "global_step": 31918, "epoch": 263} {"train_loss": -32.16315460205078, "global_step": 31919, "epoch": 263} {"train_loss": -31.859806060791016, "global_step": 31920, "epoch": 263} {"train_loss": -31.426349639892578, "global_step": 31921, "epoch": 263} {"train_loss": -32.34593963623047, "global_step": 31922, "epoch": 263} {"train_loss": -32.286407470703125, "global_step": 31923, "epoch": 263} {"train_loss": -32.70933151245117, "global_step": 31924, "epoch": 263} {"train_loss": -32.607608795166016, "global_step": 31925, "epoch": 263} {"train_loss": -32.550575256347656, "global_step": 31926, "epoch": 263} {"train_loss": -32.71126174926758, "global_step": 31927, "epoch": 263} {"train_loss": -32.58723068237305, "global_step": 31928, "epoch": 263} {"train_loss": -32.47095489501953, "global_step": 31929, "epoch": 263} {"train_loss": -33.10968780517578, "global_step": 31930, "epoch": 263} {"train_loss": -32.5734748840332, "global_step": 31931, "epoch": 263} {"train_loss": -32.44797897338867, "global_step": 31932, "epoch": 263} {"train_loss": -32.909912109375, "global_step": 31933, "epoch": 263} {"train_loss": -33.17759323120117, "global_step": 31934, "epoch": 263} {"train_loss": -32.9001579284668, "global_step": 31935, "epoch": 263} {"train_loss": -33.223960876464844, "global_step": 31936, "epoch": 263} {"train_loss": -33.102657318115234, "global_step": 31937, "epoch": 263} {"train_loss": -33.0233039855957, "global_step": 31938, "epoch": 263} {"train_loss": -32.98611068725586, "global_step": 31939, "epoch": 263} {"train_loss": -33.04460525512695, "global_step": 31940, "epoch": 263} {"train_loss": -32.581295013427734, "global_step": 31941, "epoch": 263} {"train_loss": -32.6322135925293, "global_step": 31942, "epoch": 263} {"train_loss": -31.808718358189605, "global_step": 31943, "epoch": 263, "val_loss": 2575217.75} {"train_loss": -31.237165451049805, "global_step": 31944, "epoch": 264} {"train_loss": -31.27772331237793, "global_step": 31945, "epoch": 264} {"train_loss": -29.44305992126465, "global_step": 31946, "epoch": 264} {"train_loss": -32.06203079223633, "global_step": 31947, "epoch": 264} {"train_loss": -30.695837020874023, "global_step": 31948, "epoch": 264} {"train_loss": -32.008724212646484, "global_step": 31949, "epoch": 264} {"train_loss": -32.09907150268555, "global_step": 31950, "epoch": 264} {"train_loss": -31.147565841674805, "global_step": 31951, "epoch": 264} {"train_loss": -31.669097900390625, "global_step": 31952, "epoch": 264} {"train_loss": -31.099069595336914, "global_step": 31953, "epoch": 264} {"train_loss": -31.7227840423584, "global_step": 31954, "epoch": 264} {"train_loss": -32.0683479309082, "global_step": 31955, "epoch": 264} {"train_loss": -32.0243034362793, "global_step": 31956, "epoch": 264} {"train_loss": -32.180660247802734, "global_step": 31957, "epoch": 264} {"train_loss": -31.84185218811035, "global_step": 31958, "epoch": 264} {"train_loss": -32.52064895629883, "global_step": 31959, "epoch": 264} {"train_loss": -32.69997787475586, "global_step": 31960, "epoch": 264} {"train_loss": -32.304054260253906, "global_step": 31961, "epoch": 264} {"train_loss": -32.36539840698242, "global_step": 31962, "epoch": 264} {"train_loss": -32.632869720458984, "global_step": 31963, "epoch": 264} {"train_loss": -32.80135726928711, "global_step": 31964, "epoch": 264} {"train_loss": -32.548622131347656, "global_step": 31965, "epoch": 264} {"train_loss": -32.397438049316406, "global_step": 31966, "epoch": 264} {"train_loss": -32.770347595214844, "global_step": 31967, "epoch": 264} {"train_loss": -32.432064056396484, "global_step": 31968, "epoch": 264} {"train_loss": -32.54507064819336, "global_step": 31969, "epoch": 264} {"train_loss": -32.65584945678711, "global_step": 31970, "epoch": 264} {"train_loss": -32.63846206665039, "global_step": 31971, "epoch": 264} {"train_loss": -32.401702880859375, "global_step": 31972, "epoch": 264} {"train_loss": -32.2531852722168, "global_step": 31973, "epoch": 264} {"train_loss": -32.105995178222656, "global_step": 31974, "epoch": 264} {"train_loss": -32.86787033081055, "global_step": 31975, "epoch": 264} {"train_loss": -32.15786361694336, "global_step": 31976, "epoch": 264} {"train_loss": -33.06749725341797, "global_step": 31977, "epoch": 264} {"train_loss": -32.573368072509766, "global_step": 31978, "epoch": 264} {"train_loss": -32.4097900390625, "global_step": 31979, "epoch": 264} {"train_loss": -32.32429122924805, "global_step": 31980, "epoch": 264} {"train_loss": -32.96657180786133, "global_step": 31981, "epoch": 264} {"train_loss": -33.29652786254883, "global_step": 31982, "epoch": 264} {"train_loss": -32.9044303894043, "global_step": 31983, "epoch": 264} {"train_loss": -33.18276596069336, "global_step": 31984, "epoch": 264} {"train_loss": -32.70158386230469, "global_step": 31985, "epoch": 264} {"train_loss": -33.46059036254883, "global_step": 31986, "epoch": 264} {"train_loss": -33.41677474975586, "global_step": 31987, "epoch": 264} {"train_loss": -32.75486373901367, "global_step": 31988, "epoch": 264} {"train_loss": -33.22194290161133, "global_step": 31989, "epoch": 264} {"train_loss": -33.21792984008789, "global_step": 31990, "epoch": 264} {"train_loss": -33.39636993408203, "global_step": 31991, "epoch": 264} {"train_loss": -33.5433235168457, "global_step": 31992, "epoch": 264} {"train_loss": -33.20347595214844, "global_step": 31993, "epoch": 264} {"train_loss": -33.32224655151367, "global_step": 31994, "epoch": 264} {"train_loss": -33.51491928100586, "global_step": 31995, "epoch": 264} {"train_loss": -33.2070198059082, "global_step": 31996, "epoch": 264} {"train_loss": -33.38643264770508, "global_step": 31997, "epoch": 264} {"train_loss": -33.33976364135742, "global_step": 31998, "epoch": 264} {"train_loss": -33.56390380859375, "global_step": 31999, "epoch": 264} {"train_loss": -33.34579086303711, "global_step": 32000, "epoch": 264} {"train_loss": -33.542667388916016, "global_step": 32001, "epoch": 264} {"train_loss": -33.283626556396484, "global_step": 32002, "epoch": 264} {"train_loss": -33.60913848876953, "global_step": 32003, "epoch": 264} {"train_loss": -32.72016525268555, "global_step": 32004, "epoch": 264} {"train_loss": -33.29107666015625, "global_step": 32005, "epoch": 264} {"train_loss": -33.180335998535156, "global_step": 32006, "epoch": 264} {"train_loss": -32.821502685546875, "global_step": 32007, "epoch": 264} {"train_loss": -32.317562103271484, "global_step": 32008, "epoch": 264} {"train_loss": -32.39811325073242, "global_step": 32009, "epoch": 264} {"train_loss": -32.735652923583984, "global_step": 32010, "epoch": 264} {"train_loss": -31.873777389526367, "global_step": 32011, "epoch": 264} {"train_loss": -32.55045700073242, "global_step": 32012, "epoch": 264} {"train_loss": -32.73564529418945, "global_step": 32013, "epoch": 264} {"train_loss": -32.91257858276367, "global_step": 32014, "epoch": 264} {"train_loss": -32.05011749267578, "global_step": 32015, "epoch": 264} {"train_loss": -32.61884689331055, "global_step": 32016, "epoch": 264} {"train_loss": -32.60585403442383, "global_step": 32017, "epoch": 264} {"train_loss": -32.96794128417969, "global_step": 32018, "epoch": 264} {"train_loss": -33.34584045410156, "global_step": 32019, "epoch": 264} {"train_loss": -32.424129486083984, "global_step": 32020, "epoch": 264} {"train_loss": -32.55540466308594, "global_step": 32021, "epoch": 264} {"train_loss": -32.2077522277832, "global_step": 32022, "epoch": 264} {"train_loss": -32.60344314575195, "global_step": 32023, "epoch": 264} {"train_loss": -32.85042190551758, "global_step": 32024, "epoch": 264} {"train_loss": -32.93478775024414, "global_step": 32025, "epoch": 264} {"train_loss": -32.44955062866211, "global_step": 32026, "epoch": 264} {"train_loss": -32.66043472290039, "global_step": 32027, "epoch": 264} {"train_loss": -32.63375473022461, "global_step": 32028, "epoch": 264} {"train_loss": -32.71077346801758, "global_step": 32029, "epoch": 264} {"train_loss": -32.46450424194336, "global_step": 32030, "epoch": 264} {"train_loss": -32.77191162109375, "global_step": 32031, "epoch": 264} {"train_loss": -32.750205993652344, "global_step": 32032, "epoch": 264} {"train_loss": -32.6178092956543, "global_step": 32033, "epoch": 264} {"train_loss": -33.588165283203125, "global_step": 32034, "epoch": 264} {"train_loss": -32.94797897338867, "global_step": 32035, "epoch": 264} {"train_loss": -33.12279510498047, "global_step": 32036, "epoch": 264} {"train_loss": -33.171470642089844, "global_step": 32037, "epoch": 264} {"train_loss": -33.40913009643555, "global_step": 32038, "epoch": 264} {"train_loss": -33.265655517578125, "global_step": 32039, "epoch": 264} {"train_loss": -33.423858642578125, "global_step": 32040, "epoch": 264} {"train_loss": -33.443172454833984, "global_step": 32041, "epoch": 264} {"train_loss": -33.575439453125, "global_step": 32042, "epoch": 264} {"train_loss": -33.026817321777344, "global_step": 32043, "epoch": 264} {"train_loss": -33.84956741333008, "global_step": 32044, "epoch": 264} {"train_loss": -32.85539627075195, "global_step": 32045, "epoch": 264} {"train_loss": -33.509300231933594, "global_step": 32046, "epoch": 264} {"train_loss": -33.39036178588867, "global_step": 32047, "epoch": 264} {"train_loss": -33.080806732177734, "global_step": 32048, "epoch": 264} {"train_loss": -33.066654205322266, "global_step": 32049, "epoch": 264} {"train_loss": -33.393096923828125, "global_step": 32050, "epoch": 264} {"train_loss": -33.79458236694336, "global_step": 32051, "epoch": 264} {"train_loss": -33.551082611083984, "global_step": 32052, "epoch": 264} {"train_loss": -33.461830139160156, "global_step": 32053, "epoch": 264} {"train_loss": -33.494903564453125, "global_step": 32054, "epoch": 264} {"train_loss": -33.24036407470703, "global_step": 32055, "epoch": 264} {"train_loss": -33.70357131958008, "global_step": 32056, "epoch": 264} {"train_loss": -33.33356475830078, "global_step": 32057, "epoch": 264} {"train_loss": -33.56689453125, "global_step": 32058, "epoch": 264} {"train_loss": -33.82686996459961, "global_step": 32059, "epoch": 264} {"train_loss": -33.801143646240234, "global_step": 32060, "epoch": 264} {"train_loss": -33.648006439208984, "global_step": 32061, "epoch": 264} {"train_loss": -33.75197219848633, "global_step": 32062, "epoch": 264} {"train_loss": -33.1391487121582, "global_step": 32063, "epoch": 264} {"train_loss": -32.80553658540584, "global_step": 32064, "epoch": 264, "val_loss": 2653222.75} {"train_loss": -33.358306884765625, "global_step": 32065, "epoch": 265} {"train_loss": -33.76839065551758, "global_step": 32066, "epoch": 265} {"train_loss": -33.360774993896484, "global_step": 32067, "epoch": 265} {"train_loss": -33.66070556640625, "global_step": 32068, "epoch": 265} {"train_loss": -33.350852966308594, "global_step": 32069, "epoch": 265} {"train_loss": -33.47115707397461, "global_step": 32070, "epoch": 265} {"train_loss": -32.78156661987305, "global_step": 32071, "epoch": 265} {"train_loss": -32.516075134277344, "global_step": 32072, "epoch": 265} {"train_loss": -32.762935638427734, "global_step": 32073, "epoch": 265} {"train_loss": -32.6787223815918, "global_step": 32074, "epoch": 265} {"train_loss": -31.85333251953125, "global_step": 32075, "epoch": 265} {"train_loss": -31.058935165405273, "global_step": 32076, "epoch": 265} {"train_loss": -30.799148559570312, "global_step": 32077, "epoch": 265} {"train_loss": -32.84970474243164, "global_step": 32078, "epoch": 265} {"train_loss": -28.130773544311523, "global_step": 32079, "epoch": 265} {"train_loss": -31.61138343811035, "global_step": 32080, "epoch": 265} {"train_loss": -31.851842880249023, "global_step": 32081, "epoch": 265} {"train_loss": -28.151891708374023, "global_step": 32082, "epoch": 265} {"train_loss": -30.315576553344727, "global_step": 32083, "epoch": 265} {"train_loss": -32.163055419921875, "global_step": 32084, "epoch": 265} {"train_loss": -30.832082748413086, "global_step": 32085, "epoch": 265} {"train_loss": -32.55408477783203, "global_step": 32086, "epoch": 265} {"train_loss": -30.517871856689453, "global_step": 32087, "epoch": 265} {"train_loss": -31.57118034362793, "global_step": 32088, "epoch": 265} {"train_loss": -30.1265869140625, "global_step": 32089, "epoch": 265} {"train_loss": -32.05121612548828, "global_step": 32090, "epoch": 265} {"train_loss": -30.79530143737793, "global_step": 32091, "epoch": 265} {"train_loss": -32.90639114379883, "global_step": 32092, "epoch": 265} {"train_loss": -31.51641273498535, "global_step": 32093, "epoch": 265} {"train_loss": -32.10012435913086, "global_step": 32094, "epoch": 265} {"train_loss": -31.5328426361084, "global_step": 32095, "epoch": 265} {"train_loss": -31.262475967407227, "global_step": 32096, "epoch": 265} {"train_loss": -32.86574935913086, "global_step": 32097, "epoch": 265} {"train_loss": -31.891393661499023, "global_step": 32098, "epoch": 265} {"train_loss": -30.6781005859375, "global_step": 32099, "epoch": 265} {"train_loss": -28.890350341796875, "global_step": 32100, "epoch": 265} {"train_loss": -31.030261993408203, "global_step": 32101, "epoch": 265} {"train_loss": -32.54320526123047, "global_step": 32102, "epoch": 265} {"train_loss": -27.773273468017578, "global_step": 32103, "epoch": 265} {"train_loss": -30.224775314331055, "global_step": 32104, "epoch": 265} {"train_loss": -32.679290771484375, "global_step": 32105, "epoch": 265} {"train_loss": -30.080297470092773, "global_step": 32106, "epoch": 265} {"train_loss": -32.62077331542969, "global_step": 32107, "epoch": 265} {"train_loss": -30.512527465820312, "global_step": 32108, "epoch": 265} {"train_loss": -31.683399200439453, "global_step": 32109, "epoch": 265} {"train_loss": -32.21099853515625, "global_step": 32110, "epoch": 265} {"train_loss": -31.918928146362305, "global_step": 32111, "epoch": 265} {"train_loss": -32.83052444458008, "global_step": 32112, "epoch": 265} {"train_loss": -32.26868438720703, "global_step": 32113, "epoch": 265} {"train_loss": -32.75594711303711, "global_step": 32114, "epoch": 265} {"train_loss": -32.14453887939453, "global_step": 32115, "epoch": 265} {"train_loss": -32.999446868896484, "global_step": 32116, "epoch": 265} {"train_loss": -32.57307434082031, "global_step": 32117, "epoch": 265} {"train_loss": -32.503944396972656, "global_step": 32118, "epoch": 265} {"train_loss": -32.768550872802734, "global_step": 32119, "epoch": 265} {"train_loss": -32.54307174682617, "global_step": 32120, "epoch": 265} {"train_loss": -32.57625198364258, "global_step": 32121, "epoch": 265} {"train_loss": -33.262054443359375, "global_step": 32122, "epoch": 265} {"train_loss": -33.32369613647461, "global_step": 32123, "epoch": 265} {"train_loss": -33.415931701660156, "global_step": 32124, "epoch": 265} {"train_loss": -33.17903518676758, "global_step": 32125, "epoch": 265} {"train_loss": -33.17959213256836, "global_step": 32126, "epoch": 265} {"train_loss": -32.78273010253906, "global_step": 32127, "epoch": 265} {"train_loss": -33.048160552978516, "global_step": 32128, "epoch": 265} {"train_loss": -33.111934661865234, "global_step": 32129, "epoch": 265} {"train_loss": -33.16111373901367, "global_step": 32130, "epoch": 265} {"train_loss": -32.675594329833984, "global_step": 32131, "epoch": 265} {"train_loss": -33.2158317565918, "global_step": 32132, "epoch": 265} {"train_loss": -33.26315689086914, "global_step": 32133, "epoch": 265} {"train_loss": -33.06765365600586, "global_step": 32134, "epoch": 265} {"train_loss": -32.8068733215332, "global_step": 32135, "epoch": 265} {"train_loss": -33.48385238647461, "global_step": 32136, "epoch": 265} {"train_loss": -33.16493225097656, "global_step": 32137, "epoch": 265} {"train_loss": -33.25820541381836, "global_step": 32138, "epoch": 265} {"train_loss": -33.65007400512695, "global_step": 32139, "epoch": 265} {"train_loss": -32.8477668762207, "global_step": 32140, "epoch": 265} {"train_loss": -33.03517150878906, "global_step": 32141, "epoch": 265} {"train_loss": -31.289270401000977, "global_step": 32142, "epoch": 265} {"train_loss": -32.80144119262695, "global_step": 32143, "epoch": 265} {"train_loss": -32.216678619384766, "global_step": 32144, "epoch": 265} {"train_loss": -32.91401290893555, "global_step": 32145, "epoch": 265} {"train_loss": -32.751461029052734, "global_step": 32146, "epoch": 265} {"train_loss": -32.98897933959961, "global_step": 32147, "epoch": 265} {"train_loss": -32.44883346557617, "global_step": 32148, "epoch": 265} {"train_loss": -32.38889694213867, "global_step": 32149, "epoch": 265} {"train_loss": -32.69432830810547, "global_step": 32150, "epoch": 265} {"train_loss": -32.592041015625, "global_step": 32151, "epoch": 265} {"train_loss": -32.567909240722656, "global_step": 32152, "epoch": 265} {"train_loss": -31.874120712280273, "global_step": 32153, "epoch": 265} {"train_loss": -33.18675994873047, "global_step": 32154, "epoch": 265} {"train_loss": -32.950904846191406, "global_step": 32155, "epoch": 265} {"train_loss": -32.69985580444336, "global_step": 32156, "epoch": 265} {"train_loss": -32.242366790771484, "global_step": 32157, "epoch": 265} {"train_loss": -32.9373664855957, "global_step": 32158, "epoch": 265} {"train_loss": -31.843103408813477, "global_step": 32159, "epoch": 265} {"train_loss": -32.798065185546875, "global_step": 32160, "epoch": 265} {"train_loss": -33.03025436401367, "global_step": 32161, "epoch": 265} {"train_loss": -32.09714126586914, "global_step": 32162, "epoch": 265} {"train_loss": -32.21116256713867, "global_step": 32163, "epoch": 265} {"train_loss": -33.34845733642578, "global_step": 32164, "epoch": 265} {"train_loss": -33.02528762817383, "global_step": 32165, "epoch": 265} {"train_loss": -32.885738372802734, "global_step": 32166, "epoch": 265} {"train_loss": -33.12717819213867, "global_step": 32167, "epoch": 265} {"train_loss": -33.01205062866211, "global_step": 32168, "epoch": 265} {"train_loss": -32.90517807006836, "global_step": 32169, "epoch": 265} {"train_loss": -32.2274284362793, "global_step": 32170, "epoch": 265} {"train_loss": -32.581275939941406, "global_step": 32171, "epoch": 265} {"train_loss": -32.94111633300781, "global_step": 32172, "epoch": 265} {"train_loss": -33.05216598510742, "global_step": 32173, "epoch": 265} {"train_loss": -32.51459884643555, "global_step": 32174, "epoch": 265} {"train_loss": -33.21803283691406, "global_step": 32175, "epoch": 265} {"train_loss": -33.21604919433594, "global_step": 32176, "epoch": 265} {"train_loss": -32.62134552001953, "global_step": 32177, "epoch": 265} {"train_loss": -32.4173583984375, "global_step": 32178, "epoch": 265} {"train_loss": -32.102359771728516, "global_step": 32179, "epoch": 265} {"train_loss": -33.23699951171875, "global_step": 32180, "epoch": 265} {"train_loss": -32.32294464111328, "global_step": 32181, "epoch": 265} {"train_loss": -32.97890853881836, "global_step": 32182, "epoch": 265} {"train_loss": -33.854183197021484, "global_step": 32183, "epoch": 265} {"train_loss": -32.4370002746582, "global_step": 32184, "epoch": 265} {"train_loss": -32.343080898946965, "global_step": 32185, "epoch": 265, "val_loss": 2724911.25} {"train_loss": -33.24419021606445, "global_step": 32186, "epoch": 266} {"train_loss": -33.65508270263672, "global_step": 32187, "epoch": 266} {"train_loss": -33.00319290161133, "global_step": 32188, "epoch": 266} {"train_loss": -33.292598724365234, "global_step": 32189, "epoch": 266} {"train_loss": -33.2724723815918, "global_step": 32190, "epoch": 266} {"train_loss": -32.70075607299805, "global_step": 32191, "epoch": 266} {"train_loss": -33.84403991699219, "global_step": 32192, "epoch": 266} {"train_loss": -33.38059997558594, "global_step": 32193, "epoch": 266} {"train_loss": -33.35976028442383, "global_step": 32194, "epoch": 266} {"train_loss": -33.43629837036133, "global_step": 32195, "epoch": 266} {"train_loss": -33.984840393066406, "global_step": 32196, "epoch": 266} {"train_loss": -33.79808044433594, "global_step": 32197, "epoch": 266} {"train_loss": -33.957618713378906, "global_step": 32198, "epoch": 266} {"train_loss": -33.963233947753906, "global_step": 32199, "epoch": 266} {"train_loss": -33.2557258605957, "global_step": 32200, "epoch": 266} {"train_loss": -33.35051345825195, "global_step": 32201, "epoch": 266} {"train_loss": -33.64838409423828, "global_step": 32202, "epoch": 266} {"train_loss": -33.84699249267578, "global_step": 32203, "epoch": 266} {"train_loss": -32.924896240234375, "global_step": 32204, "epoch": 266} {"train_loss": -32.89016342163086, "global_step": 32205, "epoch": 266} {"train_loss": -33.994117736816406, "global_step": 32206, "epoch": 266} {"train_loss": -32.35285186767578, "global_step": 32207, "epoch": 266} {"train_loss": -33.56447982788086, "global_step": 32208, "epoch": 266} {"train_loss": -31.336328506469727, "global_step": 32209, "epoch": 266} {"train_loss": -32.789833068847656, "global_step": 32210, "epoch": 266} {"train_loss": -33.46803283691406, "global_step": 32211, "epoch": 266} {"train_loss": -31.855371475219727, "global_step": 32212, "epoch": 266} {"train_loss": -32.9813346862793, "global_step": 32213, "epoch": 266} {"train_loss": -32.537899017333984, "global_step": 32214, "epoch": 266} {"train_loss": -29.1235408782959, "global_step": 32215, "epoch": 266} {"train_loss": -31.64878273010254, "global_step": 32216, "epoch": 266} {"train_loss": -29.2602481842041, "global_step": 32217, "epoch": 266} {"train_loss": -28.94036865234375, "global_step": 32218, "epoch": 266} {"train_loss": -28.779499053955078, "global_step": 32219, "epoch": 266} {"train_loss": -30.364835739135742, "global_step": 32220, "epoch": 266} {"train_loss": -28.670917510986328, "global_step": 32221, "epoch": 266} {"train_loss": -28.82854652404785, "global_step": 32222, "epoch": 266} {"train_loss": -29.174047470092773, "global_step": 32223, "epoch": 266} {"train_loss": -30.491214752197266, "global_step": 32224, "epoch": 266} {"train_loss": -28.45505142211914, "global_step": 32225, "epoch": 266} {"train_loss": -27.130598068237305, "global_step": 32226, "epoch": 266} {"train_loss": -28.813968658447266, "global_step": 32227, "epoch": 266} {"train_loss": -30.7381649017334, "global_step": 32228, "epoch": 266} {"train_loss": -28.321552276611328, "global_step": 32229, "epoch": 266} {"train_loss": -29.349170684814453, "global_step": 32230, "epoch": 266} {"train_loss": -29.08833885192871, "global_step": 32231, "epoch": 266} {"train_loss": -29.74209976196289, "global_step": 32232, "epoch": 266} {"train_loss": -29.847183227539062, "global_step": 32233, "epoch": 266} {"train_loss": -29.630859375, "global_step": 32234, "epoch": 266} {"train_loss": -29.797521591186523, "global_step": 32235, "epoch": 266} {"train_loss": -30.163043975830078, "global_step": 32236, "epoch": 266} {"train_loss": -30.31050682067871, "global_step": 32237, "epoch": 266} {"train_loss": -30.707616806030273, "global_step": 32238, "epoch": 266} {"train_loss": -29.561185836791992, "global_step": 32239, "epoch": 266} {"train_loss": -30.618030548095703, "global_step": 32240, "epoch": 266} {"train_loss": -30.421674728393555, "global_step": 32241, "epoch": 266} {"train_loss": -30.663816452026367, "global_step": 32242, "epoch": 266} {"train_loss": -30.71087646484375, "global_step": 32243, "epoch": 266} {"train_loss": -30.482309341430664, "global_step": 32244, "epoch": 266} {"train_loss": -31.34002685546875, "global_step": 32245, "epoch": 266} {"train_loss": -30.658447265625, "global_step": 32246, "epoch": 266} {"train_loss": -31.18048667907715, "global_step": 32247, "epoch": 266} {"train_loss": -31.1754150390625, "global_step": 32248, "epoch": 266} {"train_loss": -30.98007583618164, "global_step": 32249, "epoch": 266} {"train_loss": -30.9205322265625, "global_step": 32250, "epoch": 266} {"train_loss": -31.710620880126953, "global_step": 32251, "epoch": 266} {"train_loss": -30.301904678344727, "global_step": 32252, "epoch": 266} {"train_loss": -31.23726463317871, "global_step": 32253, "epoch": 266} {"train_loss": -31.159290313720703, "global_step": 32254, "epoch": 266} {"train_loss": -31.570343017578125, "global_step": 32255, "epoch": 266} {"train_loss": -31.616159439086914, "global_step": 32256, "epoch": 266} {"train_loss": -31.546186447143555, "global_step": 32257, "epoch": 266} {"train_loss": -31.960468292236328, "global_step": 32258, "epoch": 266} {"train_loss": -31.15142822265625, "global_step": 32259, "epoch": 266} {"train_loss": -31.928253173828125, "global_step": 32260, "epoch": 266} {"train_loss": -31.779052734375, "global_step": 32261, "epoch": 266} {"train_loss": -32.1097526550293, "global_step": 32262, "epoch": 266} {"train_loss": -31.775943756103516, "global_step": 32263, "epoch": 266} {"train_loss": -32.2905387878418, "global_step": 32264, "epoch": 266} {"train_loss": -32.17171859741211, "global_step": 32265, "epoch": 266} {"train_loss": -32.15177536010742, "global_step": 32266, "epoch": 266} {"train_loss": -31.472675323486328, "global_step": 32267, "epoch": 266} {"train_loss": -32.026180267333984, "global_step": 32268, "epoch": 266} {"train_loss": -32.82463836669922, "global_step": 32269, "epoch": 266} {"train_loss": -32.10492706298828, "global_step": 32270, "epoch": 266} {"train_loss": -32.08266067504883, "global_step": 32271, "epoch": 266} {"train_loss": -31.384815216064453, "global_step": 32272, "epoch": 266} {"train_loss": -31.82537269592285, "global_step": 32273, "epoch": 266} {"train_loss": -33.31056594848633, "global_step": 32274, "epoch": 266} {"train_loss": -33.01252746582031, "global_step": 32275, "epoch": 266} {"train_loss": -31.61455726623535, "global_step": 32276, "epoch": 266} {"train_loss": -31.578815460205078, "global_step": 32277, "epoch": 266} {"train_loss": -33.521026611328125, "global_step": 32278, "epoch": 266} {"train_loss": -32.56600570678711, "global_step": 32279, "epoch": 266} {"train_loss": -32.07851028442383, "global_step": 32280, "epoch": 266} {"train_loss": -33.593048095703125, "global_step": 32281, "epoch": 266} {"train_loss": -32.695777893066406, "global_step": 32282, "epoch": 266} {"train_loss": -31.725622177124023, "global_step": 32283, "epoch": 266} {"train_loss": -31.702184677124023, "global_step": 32284, "epoch": 266} {"train_loss": -33.16175079345703, "global_step": 32285, "epoch": 266} {"train_loss": -32.40635299682617, "global_step": 32286, "epoch": 266} {"train_loss": -32.73270797729492, "global_step": 32287, "epoch": 266} {"train_loss": -33.93674850463867, "global_step": 32288, "epoch": 266} {"train_loss": -32.62217712402344, "global_step": 32289, "epoch": 266} {"train_loss": -32.79928970336914, "global_step": 32290, "epoch": 266} {"train_loss": -33.67000961303711, "global_step": 32291, "epoch": 266} {"train_loss": -33.30567932128906, "global_step": 32292, "epoch": 266} {"train_loss": -33.60786819458008, "global_step": 32293, "epoch": 266} {"train_loss": -33.56709289550781, "global_step": 32294, "epoch": 266} {"train_loss": -33.17414093017578, "global_step": 32295, "epoch": 266} {"train_loss": -33.322933197021484, "global_step": 32296, "epoch": 266} {"train_loss": -33.549808502197266, "global_step": 32297, "epoch": 266} {"train_loss": -33.703704833984375, "global_step": 32298, "epoch": 266} {"train_loss": -33.100616455078125, "global_step": 32299, "epoch": 266} {"train_loss": -33.170894622802734, "global_step": 32300, "epoch": 266} {"train_loss": -33.41851806640625, "global_step": 32301, "epoch": 266} {"train_loss": -33.440704345703125, "global_step": 32302, "epoch": 266} {"train_loss": -33.31356430053711, "global_step": 32303, "epoch": 266} {"train_loss": -34.148590087890625, "global_step": 32304, "epoch": 266} {"train_loss": -33.27103805541992, "global_step": 32305, "epoch": 266} {"train_loss": -31.899916924720955, "global_step": 32306, "epoch": 266, "val_loss": 2526059.75} {"train_loss": -33.85462188720703, "global_step": 32307, "epoch": 267} {"train_loss": -32.83795166015625, "global_step": 32308, "epoch": 267} {"train_loss": -33.82429504394531, "global_step": 32309, "epoch": 267} {"train_loss": -33.21238327026367, "global_step": 32310, "epoch": 267} {"train_loss": -32.76710891723633, "global_step": 32311, "epoch": 267} {"train_loss": -32.84006118774414, "global_step": 32312, "epoch": 267} {"train_loss": -33.26917266845703, "global_step": 32313, "epoch": 267} {"train_loss": -32.29148864746094, "global_step": 32314, "epoch": 267} {"train_loss": -32.67586135864258, "global_step": 32315, "epoch": 267} {"train_loss": -33.1087646484375, "global_step": 32316, "epoch": 267} {"train_loss": -32.6783332824707, "global_step": 32317, "epoch": 267} {"train_loss": -32.49769592285156, "global_step": 32318, "epoch": 267} {"train_loss": -32.471534729003906, "global_step": 32319, "epoch": 267} {"train_loss": -32.6239128112793, "global_step": 32320, "epoch": 267} {"train_loss": -32.93037796020508, "global_step": 32321, "epoch": 267} {"train_loss": -33.17936325073242, "global_step": 32322, "epoch": 267} {"train_loss": -32.51466751098633, "global_step": 32323, "epoch": 267} {"train_loss": -32.96713638305664, "global_step": 32324, "epoch": 267} {"train_loss": -33.29734420776367, "global_step": 32325, "epoch": 267} {"train_loss": -33.36848831176758, "global_step": 32326, "epoch": 267} {"train_loss": -31.769214630126953, "global_step": 32327, "epoch": 267} {"train_loss": -32.31785202026367, "global_step": 32328, "epoch": 267} {"train_loss": -32.153717041015625, "global_step": 32329, "epoch": 267} {"train_loss": -32.417213439941406, "global_step": 32330, "epoch": 267} {"train_loss": -32.7007942199707, "global_step": 32331, "epoch": 267} {"train_loss": -32.4366340637207, "global_step": 32332, "epoch": 267} {"train_loss": -32.101070404052734, "global_step": 32333, "epoch": 267} {"train_loss": -31.711328506469727, "global_step": 32334, "epoch": 267} {"train_loss": -30.45830726623535, "global_step": 32335, "epoch": 267} {"train_loss": -30.303922653198242, "global_step": 32336, "epoch": 267} {"train_loss": -29.46368980407715, "global_step": 32337, "epoch": 267} {"train_loss": -30.35761070251465, "global_step": 32338, "epoch": 267} {"train_loss": -28.129358291625977, "global_step": 32339, "epoch": 267} {"train_loss": -24.194934844970703, "global_step": 32340, "epoch": 267} {"train_loss": -24.978271484375, "global_step": 32341, "epoch": 267} {"train_loss": -30.68499183654785, "global_step": 32342, "epoch": 267} {"train_loss": -28.515823364257812, "global_step": 32343, "epoch": 267} {"train_loss": -30.251300811767578, "global_step": 32344, "epoch": 267} {"train_loss": -30.001447677612305, "global_step": 32345, "epoch": 267} {"train_loss": -30.25540542602539, "global_step": 32346, "epoch": 267} {"train_loss": -31.0267276763916, "global_step": 32347, "epoch": 267} {"train_loss": -30.032440185546875, "global_step": 32348, "epoch": 267} {"train_loss": -31.21613121032715, "global_step": 32349, "epoch": 267} {"train_loss": -31.368112564086914, "global_step": 32350, "epoch": 267} {"train_loss": -30.321203231811523, "global_step": 32351, "epoch": 267} {"train_loss": -32.457801818847656, "global_step": 32352, "epoch": 267} {"train_loss": -30.804431915283203, "global_step": 32353, "epoch": 267} {"train_loss": -29.859304428100586, "global_step": 32354, "epoch": 267} {"train_loss": -30.84847068786621, "global_step": 32355, "epoch": 267} {"train_loss": -31.969196319580078, "global_step": 32356, "epoch": 267} {"train_loss": -31.852270126342773, "global_step": 32357, "epoch": 267} {"train_loss": -31.951440811157227, "global_step": 32358, "epoch": 267} {"train_loss": -31.631183624267578, "global_step": 32359, "epoch": 267} {"train_loss": -32.25569534301758, "global_step": 32360, "epoch": 267} {"train_loss": -32.147403717041016, "global_step": 32361, "epoch": 267} {"train_loss": -32.06513595581055, "global_step": 32362, "epoch": 267} {"train_loss": -32.40987777709961, "global_step": 32363, "epoch": 267} {"train_loss": -32.2702751159668, "global_step": 32364, "epoch": 267} {"train_loss": -32.60786819458008, "global_step": 32365, "epoch": 267} {"train_loss": -32.41019058227539, "global_step": 32366, "epoch": 267} {"train_loss": -32.30980682373047, "global_step": 32367, "epoch": 267} {"train_loss": -32.311492919921875, "global_step": 32368, "epoch": 267} {"train_loss": -32.38658905029297, "global_step": 32369, "epoch": 267} {"train_loss": -31.635028839111328, "global_step": 32370, "epoch": 267} {"train_loss": -32.48951721191406, "global_step": 32371, "epoch": 267} {"train_loss": -32.657020568847656, "global_step": 32372, "epoch": 267} {"train_loss": -32.46355056762695, "global_step": 32373, "epoch": 267} {"train_loss": -32.8512077331543, "global_step": 32374, "epoch": 267} {"train_loss": -32.362754821777344, "global_step": 32375, "epoch": 267} {"train_loss": -32.5191764831543, "global_step": 32376, "epoch": 267} {"train_loss": -33.114646911621094, "global_step": 32377, "epoch": 267} {"train_loss": -32.771053314208984, "global_step": 32378, "epoch": 267} {"train_loss": -32.89577102661133, "global_step": 32379, "epoch": 267} {"train_loss": -32.65987014770508, "global_step": 32380, "epoch": 267} {"train_loss": -33.05329132080078, "global_step": 32381, "epoch": 267} {"train_loss": -32.81824493408203, "global_step": 32382, "epoch": 267} {"train_loss": -32.890804290771484, "global_step": 32383, "epoch": 267} {"train_loss": -33.22677230834961, "global_step": 32384, "epoch": 267} {"train_loss": -33.083621978759766, "global_step": 32385, "epoch": 267} {"train_loss": -32.97227096557617, "global_step": 32386, "epoch": 267} {"train_loss": -33.28106689453125, "global_step": 32387, "epoch": 267} {"train_loss": -33.175113677978516, "global_step": 32388, "epoch": 267} {"train_loss": -33.54240036010742, "global_step": 32389, "epoch": 267} {"train_loss": -33.58201217651367, "global_step": 32390, "epoch": 267} {"train_loss": -32.765316009521484, "global_step": 32391, "epoch": 267} {"train_loss": -33.11178970336914, "global_step": 32392, "epoch": 267} {"train_loss": -33.66288375854492, "global_step": 32393, "epoch": 267} {"train_loss": -33.38784408569336, "global_step": 32394, "epoch": 267} {"train_loss": -33.13401794433594, "global_step": 32395, "epoch": 267} {"train_loss": -33.380104064941406, "global_step": 32396, "epoch": 267} {"train_loss": -32.462562561035156, "global_step": 32397, "epoch": 267} {"train_loss": -32.8651008605957, "global_step": 32398, "epoch": 267} {"train_loss": -33.408729553222656, "global_step": 32399, "epoch": 267} {"train_loss": -32.85703659057617, "global_step": 32400, "epoch": 267} {"train_loss": -33.39545822143555, "global_step": 32401, "epoch": 267} {"train_loss": -33.46390151977539, "global_step": 32402, "epoch": 267} {"train_loss": -32.54273223876953, "global_step": 32403, "epoch": 267} {"train_loss": -32.419532775878906, "global_step": 32404, "epoch": 267} {"train_loss": -33.42877960205078, "global_step": 32405, "epoch": 267} {"train_loss": -33.187225341796875, "global_step": 32406, "epoch": 267} {"train_loss": -32.823280334472656, "global_step": 32407, "epoch": 267} {"train_loss": -32.8355827331543, "global_step": 32408, "epoch": 267} {"train_loss": -33.19509506225586, "global_step": 32409, "epoch": 267} {"train_loss": -33.03898239135742, "global_step": 32410, "epoch": 267} {"train_loss": -33.79264450073242, "global_step": 32411, "epoch": 267} {"train_loss": -33.48787307739258, "global_step": 32412, "epoch": 267} {"train_loss": -33.03562545776367, "global_step": 32413, "epoch": 267} {"train_loss": -33.3324089050293, "global_step": 32414, "epoch": 267} {"train_loss": -32.99445724487305, "global_step": 32415, "epoch": 267} {"train_loss": -32.57025909423828, "global_step": 32416, "epoch": 267} {"train_loss": -33.6387825012207, "global_step": 32417, "epoch": 267} {"train_loss": -33.28169631958008, "global_step": 32418, "epoch": 267} {"train_loss": -32.74183654785156, "global_step": 32419, "epoch": 267} {"train_loss": -31.812162399291992, "global_step": 32420, "epoch": 267} {"train_loss": -31.207422256469727, "global_step": 32421, "epoch": 267} {"train_loss": -32.854732513427734, "global_step": 32422, "epoch": 267} {"train_loss": -33.169429779052734, "global_step": 32423, "epoch": 267} {"train_loss": -31.17340660095215, "global_step": 32424, "epoch": 267} {"train_loss": -30.145404815673828, "global_step": 32425, "epoch": 267} {"train_loss": -30.21528434753418, "global_step": 32426, "epoch": 267} {"train_loss": -32.19388052254669, "global_step": 32427, "epoch": 267, "val_loss": 2564094.75} {"train_loss": -32.31373977661133, "global_step": 32428, "epoch": 268} {"train_loss": -32.32966232299805, "global_step": 32429, "epoch": 268} {"train_loss": -33.05906295776367, "global_step": 32430, "epoch": 268} {"train_loss": -32.0628547668457, "global_step": 32431, "epoch": 268} {"train_loss": -32.73046875, "global_step": 32432, "epoch": 268} {"train_loss": -33.067108154296875, "global_step": 32433, "epoch": 268} {"train_loss": -32.04500198364258, "global_step": 32434, "epoch": 268} {"train_loss": -33.167518615722656, "global_step": 32435, "epoch": 268} {"train_loss": -33.11845016479492, "global_step": 32436, "epoch": 268} {"train_loss": -31.435712814331055, "global_step": 32437, "epoch": 268} {"train_loss": -32.578311920166016, "global_step": 32438, "epoch": 268} {"train_loss": -33.033329010009766, "global_step": 32439, "epoch": 268} {"train_loss": -32.109230041503906, "global_step": 32440, "epoch": 268} {"train_loss": -32.11956787109375, "global_step": 32441, "epoch": 268} {"train_loss": -32.345298767089844, "global_step": 32442, "epoch": 268} {"train_loss": -31.177915573120117, "global_step": 32443, "epoch": 268} {"train_loss": -32.769229888916016, "global_step": 32444, "epoch": 268} {"train_loss": -32.21859359741211, "global_step": 32445, "epoch": 268} {"train_loss": -31.7218074798584, "global_step": 32446, "epoch": 268} {"train_loss": -32.23698806762695, "global_step": 32447, "epoch": 268} {"train_loss": -32.435546875, "global_step": 32448, "epoch": 268} {"train_loss": -32.64522933959961, "global_step": 32449, "epoch": 268} {"train_loss": -32.726165771484375, "global_step": 32450, "epoch": 268} {"train_loss": -32.663063049316406, "global_step": 32451, "epoch": 268} {"train_loss": -33.101593017578125, "global_step": 32452, "epoch": 268} {"train_loss": -32.890785217285156, "global_step": 32453, "epoch": 268} {"train_loss": -32.93003845214844, "global_step": 32454, "epoch": 268} {"train_loss": -33.20960235595703, "global_step": 32455, "epoch": 268} {"train_loss": -33.28837203979492, "global_step": 32456, "epoch": 268} {"train_loss": -33.20437240600586, "global_step": 32457, "epoch": 268} {"train_loss": -32.67942428588867, "global_step": 32458, "epoch": 268} {"train_loss": -33.327144622802734, "global_step": 32459, "epoch": 268} {"train_loss": -33.31264877319336, "global_step": 32460, "epoch": 268} {"train_loss": -33.66701126098633, "global_step": 32461, "epoch": 268} {"train_loss": -33.688228607177734, "global_step": 32462, "epoch": 268} {"train_loss": -33.09040451049805, "global_step": 32463, "epoch": 268} {"train_loss": -33.2273063659668, "global_step": 32464, "epoch": 268} {"train_loss": -33.1643180847168, "global_step": 32465, "epoch": 268} {"train_loss": -33.067832946777344, "global_step": 32466, "epoch": 268} {"train_loss": -33.327877044677734, "global_step": 32467, "epoch": 268} {"train_loss": -33.664791107177734, "global_step": 32468, "epoch": 268} {"train_loss": -33.5329475402832, "global_step": 32469, "epoch": 268} {"train_loss": -33.048648834228516, "global_step": 32470, "epoch": 268} {"train_loss": -33.31583786010742, "global_step": 32471, "epoch": 268} {"train_loss": -33.170623779296875, "global_step": 32472, "epoch": 268} {"train_loss": -33.343231201171875, "global_step": 32473, "epoch": 268} {"train_loss": -33.2197265625, "global_step": 32474, "epoch": 268} {"train_loss": -32.54037094116211, "global_step": 32475, "epoch": 268} {"train_loss": -33.5308837890625, "global_step": 32476, "epoch": 268} {"train_loss": -33.24788284301758, "global_step": 32477, "epoch": 268} {"train_loss": -33.72909164428711, "global_step": 32478, "epoch": 268} {"train_loss": -33.373878479003906, "global_step": 32479, "epoch": 268} {"train_loss": -33.130348205566406, "global_step": 32480, "epoch": 268} {"train_loss": -33.62862777709961, "global_step": 32481, "epoch": 268} {"train_loss": -32.9466667175293, "global_step": 32482, "epoch": 268} {"train_loss": -32.89353561401367, "global_step": 32483, "epoch": 268} {"train_loss": -33.041778564453125, "global_step": 32484, "epoch": 268} {"train_loss": -33.44532775878906, "global_step": 32485, "epoch": 268} {"train_loss": -33.06241989135742, "global_step": 32486, "epoch": 268} {"train_loss": -33.41427230834961, "global_step": 32487, "epoch": 268} {"train_loss": -32.2752571105957, "global_step": 32488, "epoch": 268} {"train_loss": -33.03868103027344, "global_step": 32489, "epoch": 268} {"train_loss": -33.48084259033203, "global_step": 32490, "epoch": 268} {"train_loss": -32.43449020385742, "global_step": 32491, "epoch": 268} {"train_loss": -33.636199951171875, "global_step": 32492, "epoch": 268} {"train_loss": -33.65342330932617, "global_step": 32493, "epoch": 268} {"train_loss": -33.1602668762207, "global_step": 32494, "epoch": 268} {"train_loss": -33.17145538330078, "global_step": 32495, "epoch": 268} {"train_loss": -33.92185974121094, "global_step": 32496, "epoch": 268} {"train_loss": -32.90857696533203, "global_step": 32497, "epoch": 268} {"train_loss": -33.39884948730469, "global_step": 32498, "epoch": 268} {"train_loss": -33.09458541870117, "global_step": 32499, "epoch": 268} {"train_loss": -32.936012268066406, "global_step": 32500, "epoch": 268} {"train_loss": -33.271053314208984, "global_step": 32501, "epoch": 268} {"train_loss": -33.22825622558594, "global_step": 32502, "epoch": 268} {"train_loss": -33.985713958740234, "global_step": 32503, "epoch": 268} {"train_loss": -33.59064483642578, "global_step": 32504, "epoch": 268} {"train_loss": -33.708595275878906, "global_step": 32505, "epoch": 268} {"train_loss": -33.9108772277832, "global_step": 32506, "epoch": 268} {"train_loss": -33.31309127807617, "global_step": 32507, "epoch": 268} {"train_loss": -32.68695831298828, "global_step": 32508, "epoch": 268} {"train_loss": -31.217884063720703, "global_step": 32509, "epoch": 268} {"train_loss": -24.370384216308594, "global_step": 32510, "epoch": 268} {"train_loss": -10.246129035949707, "global_step": 32511, "epoch": 268} {"train_loss": 12.41730785369873, "global_step": 32512, "epoch": 268} {"train_loss": -17.054702758789062, "global_step": 32513, "epoch": 268} {"train_loss": -16.499204635620117, "global_step": 32514, "epoch": 268} {"train_loss": -21.327016830444336, "global_step": 32515, "epoch": 268} {"train_loss": -18.75802230834961, "global_step": 32516, "epoch": 268} {"train_loss": -28.987024307250977, "global_step": 32517, "epoch": 268} {"train_loss": -29.192102432250977, "global_step": 32518, "epoch": 268} {"train_loss": -26.170166015625, "global_step": 32519, "epoch": 268} {"train_loss": -25.829870223999023, "global_step": 32520, "epoch": 268} {"train_loss": -29.630910873413086, "global_step": 32521, "epoch": 268} {"train_loss": -30.074621200561523, "global_step": 32522, "epoch": 268} {"train_loss": -29.976369857788086, "global_step": 32523, "epoch": 268} {"train_loss": -30.6898193359375, "global_step": 32524, "epoch": 268} {"train_loss": -29.08639907836914, "global_step": 32525, "epoch": 268} {"train_loss": -30.155099868774414, "global_step": 32526, "epoch": 268} {"train_loss": -29.930952072143555, "global_step": 32527, "epoch": 268} {"train_loss": -31.101572036743164, "global_step": 32528, "epoch": 268} {"train_loss": -30.794361114501953, "global_step": 32529, "epoch": 268} {"train_loss": -31.68466567993164, "global_step": 32530, "epoch": 268} {"train_loss": -31.539113998413086, "global_step": 32531, "epoch": 268} {"train_loss": -31.284530639648438, "global_step": 32532, "epoch": 268} {"train_loss": -31.23700523376465, "global_step": 32533, "epoch": 268} {"train_loss": -31.12336540222168, "global_step": 32534, "epoch": 268} {"train_loss": -31.048221588134766, "global_step": 32535, "epoch": 268} {"train_loss": -31.320911407470703, "global_step": 32536, "epoch": 268} {"train_loss": -31.53523063659668, "global_step": 32537, "epoch": 268} {"train_loss": -31.717514038085938, "global_step": 32538, "epoch": 268} {"train_loss": -31.599760055541992, "global_step": 32539, "epoch": 268} {"train_loss": -31.764379501342773, "global_step": 32540, "epoch": 268} {"train_loss": -31.775800704956055, "global_step": 32541, "epoch": 268} {"train_loss": -32.27808380126953, "global_step": 32542, "epoch": 268} {"train_loss": -31.94781494140625, "global_step": 32543, "epoch": 268} {"train_loss": -31.956449508666992, "global_step": 32544, "epoch": 268} {"train_loss": -31.87576675415039, "global_step": 32545, "epoch": 268} {"train_loss": -32.045074462890625, "global_step": 32546, "epoch": 268} {"train_loss": -32.048213958740234, "global_step": 32547, "epoch": 268} {"train_loss": -31.27360101179643, "global_step": 32548, "epoch": 268, "val_loss": 2751674.75} {"train_loss": -32.154823303222656, "global_step": 32549, "epoch": 269} {"train_loss": -32.10246658325195, "global_step": 32550, "epoch": 269} {"train_loss": -32.42490768432617, "global_step": 32551, "epoch": 269} {"train_loss": -32.2266731262207, "global_step": 32552, "epoch": 269} {"train_loss": -32.90863800048828, "global_step": 32553, "epoch": 269} {"train_loss": -32.43561935424805, "global_step": 32554, "epoch": 269} {"train_loss": -32.74235153198242, "global_step": 32555, "epoch": 269} {"train_loss": -32.55604934692383, "global_step": 32556, "epoch": 269} {"train_loss": -32.74149703979492, "global_step": 32557, "epoch": 269} {"train_loss": -32.793312072753906, "global_step": 32558, "epoch": 269} {"train_loss": -32.716495513916016, "global_step": 32559, "epoch": 269} {"train_loss": -32.85320281982422, "global_step": 32560, "epoch": 269} {"train_loss": -32.8486442565918, "global_step": 32561, "epoch": 269} {"train_loss": -32.654144287109375, "global_step": 32562, "epoch": 269} {"train_loss": -32.56068420410156, "global_step": 32563, "epoch": 269} {"train_loss": -32.00484085083008, "global_step": 32564, "epoch": 269} {"train_loss": -31.513080596923828, "global_step": 32565, "epoch": 269} {"train_loss": -31.169879913330078, "global_step": 32566, "epoch": 269} {"train_loss": -32.370826721191406, "global_step": 32567, "epoch": 269} {"train_loss": -32.721126556396484, "global_step": 32568, "epoch": 269} {"train_loss": -33.015899658203125, "global_step": 32569, "epoch": 269} {"train_loss": -32.11605453491211, "global_step": 32570, "epoch": 269} {"train_loss": -31.614395141601562, "global_step": 32571, "epoch": 269} {"train_loss": -32.52001953125, "global_step": 32572, "epoch": 269} {"train_loss": -31.934219360351562, "global_step": 32573, "epoch": 269} {"train_loss": -30.029891967773438, "global_step": 32574, "epoch": 269} {"train_loss": -30.656478881835938, "global_step": 32575, "epoch": 269} {"train_loss": -32.60786819458008, "global_step": 32576, "epoch": 269} {"train_loss": -30.544775009155273, "global_step": 32577, "epoch": 269} {"train_loss": -32.59952926635742, "global_step": 32578, "epoch": 269} {"train_loss": -31.122241973876953, "global_step": 32579, "epoch": 269} {"train_loss": -32.300479888916016, "global_step": 32580, "epoch": 269} {"train_loss": -32.06840133666992, "global_step": 32581, "epoch": 269} {"train_loss": -30.92745018005371, "global_step": 32582, "epoch": 269} {"train_loss": -31.962066650390625, "global_step": 32583, "epoch": 269} {"train_loss": -32.044700622558594, "global_step": 32584, "epoch": 269} {"train_loss": -32.08191680908203, "global_step": 32585, "epoch": 269} {"train_loss": -31.915481567382812, "global_step": 32586, "epoch": 269} {"train_loss": -31.60469627380371, "global_step": 32587, "epoch": 269} {"train_loss": -32.04077911376953, "global_step": 32588, "epoch": 269} {"train_loss": -32.109004974365234, "global_step": 32589, "epoch": 269} {"train_loss": -32.29501724243164, "global_step": 32590, "epoch": 269} {"train_loss": -32.48318099975586, "global_step": 32591, "epoch": 269} {"train_loss": -32.61738204956055, "global_step": 32592, "epoch": 269} {"train_loss": -31.856403350830078, "global_step": 32593, "epoch": 269} {"train_loss": -32.45329666137695, "global_step": 32594, "epoch": 269} {"train_loss": -32.05184555053711, "global_step": 32595, "epoch": 269} {"train_loss": -32.04685592651367, "global_step": 32596, "epoch": 269} {"train_loss": -31.932697296142578, "global_step": 32597, "epoch": 269} {"train_loss": -32.07587814331055, "global_step": 32598, "epoch": 269} {"train_loss": -32.19520950317383, "global_step": 32599, "epoch": 269} {"train_loss": -32.48783493041992, "global_step": 32600, "epoch": 269} {"train_loss": -32.097023010253906, "global_step": 32601, "epoch": 269} {"train_loss": -31.695837020874023, "global_step": 32602, "epoch": 269} {"train_loss": -31.023456573486328, "global_step": 32603, "epoch": 269} {"train_loss": -30.649322509765625, "global_step": 32604, "epoch": 269} {"train_loss": -32.134098052978516, "global_step": 32605, "epoch": 269} {"train_loss": -32.21527862548828, "global_step": 32606, "epoch": 269} {"train_loss": -31.200794219970703, "global_step": 32607, "epoch": 269} {"train_loss": -29.88715171813965, "global_step": 32608, "epoch": 269} {"train_loss": -31.192401885986328, "global_step": 32609, "epoch": 269} {"train_loss": -32.98639678955078, "global_step": 32610, "epoch": 269} {"train_loss": -31.892200469970703, "global_step": 32611, "epoch": 269} {"train_loss": -31.582935333251953, "global_step": 32612, "epoch": 269} {"train_loss": -32.210304260253906, "global_step": 32613, "epoch": 269} {"train_loss": -32.1411247253418, "global_step": 32614, "epoch": 269} {"train_loss": -31.997373580932617, "global_step": 32615, "epoch": 269} {"train_loss": -32.2541389465332, "global_step": 32616, "epoch": 269} {"train_loss": -32.98381423950195, "global_step": 32617, "epoch": 269} {"train_loss": -32.33484649658203, "global_step": 32618, "epoch": 269} {"train_loss": -32.79951477050781, "global_step": 32619, "epoch": 269} {"train_loss": -32.74452209472656, "global_step": 32620, "epoch": 269} {"train_loss": -32.06901931762695, "global_step": 32621, "epoch": 269} {"train_loss": -31.66114616394043, "global_step": 32622, "epoch": 269} {"train_loss": -31.5205020904541, "global_step": 32623, "epoch": 269} {"train_loss": -31.36557388305664, "global_step": 32624, "epoch": 269} {"train_loss": -32.64630126953125, "global_step": 32625, "epoch": 269} {"train_loss": -32.87935256958008, "global_step": 32626, "epoch": 269} {"train_loss": -32.51713943481445, "global_step": 32627, "epoch": 269} {"train_loss": -31.7115421295166, "global_step": 32628, "epoch": 269} {"train_loss": -31.470426559448242, "global_step": 32629, "epoch": 269} {"train_loss": -32.82403564453125, "global_step": 32630, "epoch": 269} {"train_loss": -31.8241024017334, "global_step": 32631, "epoch": 269} {"train_loss": -31.601409912109375, "global_step": 32632, "epoch": 269} {"train_loss": -33.00718307495117, "global_step": 32633, "epoch": 269} {"train_loss": -32.58784866333008, "global_step": 32634, "epoch": 269} {"train_loss": -29.59378433227539, "global_step": 32635, "epoch": 269} {"train_loss": -32.49638748168945, "global_step": 32636, "epoch": 269} {"train_loss": -31.479660034179688, "global_step": 32637, "epoch": 269} {"train_loss": -31.740249633789062, "global_step": 32638, "epoch": 269} {"train_loss": -31.478479385375977, "global_step": 32639, "epoch": 269} {"train_loss": -30.45733642578125, "global_step": 32640, "epoch": 269} {"train_loss": -31.081607818603516, "global_step": 32641, "epoch": 269} {"train_loss": -31.5828857421875, "global_step": 32642, "epoch": 269} {"train_loss": -31.28754234313965, "global_step": 32643, "epoch": 269} {"train_loss": -32.209529876708984, "global_step": 32644, "epoch": 269} {"train_loss": -31.15192985534668, "global_step": 32645, "epoch": 269} {"train_loss": -32.328651428222656, "global_step": 32646, "epoch": 269} {"train_loss": -31.331594467163086, "global_step": 32647, "epoch": 269} {"train_loss": -31.609542846679688, "global_step": 32648, "epoch": 269} {"train_loss": -32.10347366333008, "global_step": 32649, "epoch": 269} {"train_loss": -32.104949951171875, "global_step": 32650, "epoch": 269} {"train_loss": -32.258705139160156, "global_step": 32651, "epoch": 269} {"train_loss": -31.834272384643555, "global_step": 32652, "epoch": 269} {"train_loss": -32.3084716796875, "global_step": 32653, "epoch": 269} {"train_loss": -32.5666618347168, "global_step": 32654, "epoch": 269} {"train_loss": -32.3486442565918, "global_step": 32655, "epoch": 269} {"train_loss": -32.59912109375, "global_step": 32656, "epoch": 269} {"train_loss": -32.78107833862305, "global_step": 32657, "epoch": 269} {"train_loss": -32.63018035888672, "global_step": 32658, "epoch": 269} {"train_loss": -32.545833587646484, "global_step": 32659, "epoch": 269} {"train_loss": -32.26631546020508, "global_step": 32660, "epoch": 269} {"train_loss": -32.079410552978516, "global_step": 32661, "epoch": 269} {"train_loss": -32.61989212036133, "global_step": 32662, "epoch": 269} {"train_loss": -32.862464904785156, "global_step": 32663, "epoch": 269} {"train_loss": -32.49050521850586, "global_step": 32664, "epoch": 269} {"train_loss": -32.86935806274414, "global_step": 32665, "epoch": 269} {"train_loss": -32.3360595703125, "global_step": 32666, "epoch": 269} {"train_loss": -32.732540130615234, "global_step": 32667, "epoch": 269} {"train_loss": -32.726924896240234, "global_step": 32668, "epoch": 269} {"train_loss": -32.06683280251243, "global_step": 32669, "epoch": 269, "val_loss": 2639338.75} {"train_loss": -32.59891891479492, "global_step": 32670, "epoch": 270} {"train_loss": -32.31289291381836, "global_step": 32671, "epoch": 270} {"train_loss": -32.53217697143555, "global_step": 32672, "epoch": 270} {"train_loss": -32.69923782348633, "global_step": 32673, "epoch": 270} {"train_loss": -32.9339714050293, "global_step": 32674, "epoch": 270} {"train_loss": -31.5395565032959, "global_step": 32675, "epoch": 270} {"train_loss": -32.005069732666016, "global_step": 32676, "epoch": 270} {"train_loss": -31.352432250976562, "global_step": 32677, "epoch": 270} {"train_loss": -31.138263702392578, "global_step": 32678, "epoch": 270} {"train_loss": -32.72184753417969, "global_step": 32679, "epoch": 270} {"train_loss": -30.73675537109375, "global_step": 32680, "epoch": 270} {"train_loss": -32.06809616088867, "global_step": 32681, "epoch": 270} {"train_loss": -31.533334732055664, "global_step": 32682, "epoch": 270} {"train_loss": -32.72486114501953, "global_step": 32683, "epoch": 270} {"train_loss": -31.8417911529541, "global_step": 32684, "epoch": 270} {"train_loss": -31.457977294921875, "global_step": 32685, "epoch": 270} {"train_loss": -31.530170440673828, "global_step": 32686, "epoch": 270} {"train_loss": -31.797231674194336, "global_step": 32687, "epoch": 270} {"train_loss": -32.246612548828125, "global_step": 32688, "epoch": 270} {"train_loss": -32.300079345703125, "global_step": 32689, "epoch": 270} {"train_loss": -32.87882614135742, "global_step": 32690, "epoch": 270} {"train_loss": -33.029823303222656, "global_step": 32691, "epoch": 270} {"train_loss": -32.908809661865234, "global_step": 32692, "epoch": 270} {"train_loss": -31.988006591796875, "global_step": 32693, "epoch": 270} {"train_loss": -32.874176025390625, "global_step": 32694, "epoch": 270} {"train_loss": -33.01174545288086, "global_step": 32695, "epoch": 270} {"train_loss": -32.66553497314453, "global_step": 32696, "epoch": 270} {"train_loss": -32.472660064697266, "global_step": 32697, "epoch": 270} {"train_loss": -32.697914123535156, "global_step": 32698, "epoch": 270} {"train_loss": -32.13429641723633, "global_step": 32699, "epoch": 270} {"train_loss": -32.59395217895508, "global_step": 32700, "epoch": 270} {"train_loss": -33.010616302490234, "global_step": 32701, "epoch": 270} {"train_loss": -32.33378219604492, "global_step": 32702, "epoch": 270} {"train_loss": -32.57660675048828, "global_step": 32703, "epoch": 270} {"train_loss": -32.78812026977539, "global_step": 32704, "epoch": 270} {"train_loss": -32.08695602416992, "global_step": 32705, "epoch": 270} {"train_loss": -32.10511016845703, "global_step": 32706, "epoch": 270} {"train_loss": -31.073495864868164, "global_step": 32707, "epoch": 270} {"train_loss": -28.828964233398438, "global_step": 32708, "epoch": 270} {"train_loss": -28.18397331237793, "global_step": 32709, "epoch": 270} {"train_loss": -31.898075103759766, "global_step": 32710, "epoch": 270} {"train_loss": -31.849273681640625, "global_step": 32711, "epoch": 270} {"train_loss": -29.020349502563477, "global_step": 32712, "epoch": 270} {"train_loss": -31.345417022705078, "global_step": 32713, "epoch": 270} {"train_loss": -31.64228630065918, "global_step": 32714, "epoch": 270} {"train_loss": -30.631561279296875, "global_step": 32715, "epoch": 270} {"train_loss": -32.285091400146484, "global_step": 32716, "epoch": 270} {"train_loss": -31.789596557617188, "global_step": 32717, "epoch": 270} {"train_loss": -30.581256866455078, "global_step": 32718, "epoch": 270} {"train_loss": -32.565521240234375, "global_step": 32719, "epoch": 270} {"train_loss": -32.12968063354492, "global_step": 32720, "epoch": 270} {"train_loss": -32.5565299987793, "global_step": 32721, "epoch": 270} {"train_loss": -31.503503799438477, "global_step": 32722, "epoch": 270} {"train_loss": -32.64750289916992, "global_step": 32723, "epoch": 270} {"train_loss": -32.91053771972656, "global_step": 32724, "epoch": 270} {"train_loss": -32.07645797729492, "global_step": 32725, "epoch": 270} {"train_loss": -33.103267669677734, "global_step": 32726, "epoch": 270} {"train_loss": -32.01670455932617, "global_step": 32727, "epoch": 270} {"train_loss": -33.03227615356445, "global_step": 32728, "epoch": 270} {"train_loss": -32.35990905761719, "global_step": 32729, "epoch": 270} {"train_loss": -32.7415657043457, "global_step": 32730, "epoch": 270} {"train_loss": -32.58899688720703, "global_step": 32731, "epoch": 270} {"train_loss": -32.1925163269043, "global_step": 32732, "epoch": 270} {"train_loss": -33.195613861083984, "global_step": 32733, "epoch": 270} {"train_loss": -32.58132553100586, "global_step": 32734, "epoch": 270} {"train_loss": -32.89589309692383, "global_step": 32735, "epoch": 270} {"train_loss": -33.228763580322266, "global_step": 32736, "epoch": 270} {"train_loss": -32.790443420410156, "global_step": 32737, "epoch": 270} {"train_loss": -33.051658630371094, "global_step": 32738, "epoch": 270} {"train_loss": -32.87295150756836, "global_step": 32739, "epoch": 270} {"train_loss": -32.46894073486328, "global_step": 32740, "epoch": 270} {"train_loss": -33.13564682006836, "global_step": 32741, "epoch": 270} {"train_loss": -32.83452224731445, "global_step": 32742, "epoch": 270} {"train_loss": -32.919952392578125, "global_step": 32743, "epoch": 270} {"train_loss": -32.60166549682617, "global_step": 32744, "epoch": 270} {"train_loss": -33.020320892333984, "global_step": 32745, "epoch": 270} {"train_loss": -32.324092864990234, "global_step": 32746, "epoch": 270} {"train_loss": -32.7857780456543, "global_step": 32747, "epoch": 270} {"train_loss": -32.72361373901367, "global_step": 32748, "epoch": 270} {"train_loss": -32.36991500854492, "global_step": 32749, "epoch": 270} {"train_loss": -33.31245803833008, "global_step": 32750, "epoch": 270} {"train_loss": -32.82334518432617, "global_step": 32751, "epoch": 270} {"train_loss": -31.30354118347168, "global_step": 32752, "epoch": 270} {"train_loss": -33.022579193115234, "global_step": 32753, "epoch": 270} {"train_loss": -33.258277893066406, "global_step": 32754, "epoch": 270} {"train_loss": -32.31414794921875, "global_step": 32755, "epoch": 270} {"train_loss": -33.35413360595703, "global_step": 32756, "epoch": 270} {"train_loss": -32.782405853271484, "global_step": 32757, "epoch": 270} {"train_loss": -32.470680236816406, "global_step": 32758, "epoch": 270} {"train_loss": -32.89089584350586, "global_step": 32759, "epoch": 270} {"train_loss": -32.324947357177734, "global_step": 32760, "epoch": 270} {"train_loss": -33.17417526245117, "global_step": 32761, "epoch": 270} {"train_loss": -32.27579879760742, "global_step": 32762, "epoch": 270} {"train_loss": -32.9130744934082, "global_step": 32763, "epoch": 270} {"train_loss": -32.33675765991211, "global_step": 32764, "epoch": 270} {"train_loss": -31.55704689025879, "global_step": 32765, "epoch": 270} {"train_loss": -31.64710807800293, "global_step": 32766, "epoch": 270} {"train_loss": -32.38444900512695, "global_step": 32767, "epoch": 270} {"train_loss": -32.65389633178711, "global_step": 32768, "epoch": 270} {"train_loss": -32.80419921875, "global_step": 32769, "epoch": 270} {"train_loss": -32.96554946899414, "global_step": 32770, "epoch": 270} {"train_loss": -33.08087158203125, "global_step": 32771, "epoch": 270} {"train_loss": -32.71602249145508, "global_step": 32772, "epoch": 270} {"train_loss": -33.037376403808594, "global_step": 32773, "epoch": 270} {"train_loss": -33.40529251098633, "global_step": 32774, "epoch": 270} {"train_loss": -33.18120193481445, "global_step": 32775, "epoch": 270} {"train_loss": -33.518470764160156, "global_step": 32776, "epoch": 270} {"train_loss": -33.19375991821289, "global_step": 32777, "epoch": 270} {"train_loss": -33.47379684448242, "global_step": 32778, "epoch": 270} {"train_loss": -33.46418380737305, "global_step": 32779, "epoch": 270} {"train_loss": -33.43056106567383, "global_step": 32780, "epoch": 270} {"train_loss": -33.32759475708008, "global_step": 32781, "epoch": 270} {"train_loss": -33.40497970581055, "global_step": 32782, "epoch": 270} {"train_loss": -33.27997589111328, "global_step": 32783, "epoch": 270} {"train_loss": -33.17666244506836, "global_step": 32784, "epoch": 270} {"train_loss": -32.75636672973633, "global_step": 32785, "epoch": 270} {"train_loss": -31.15565299987793, "global_step": 32786, "epoch": 270} {"train_loss": -28.476337432861328, "global_step": 32787, "epoch": 270} {"train_loss": -29.30950927734375, "global_step": 32788, "epoch": 270} {"train_loss": -30.887195587158203, "global_step": 32789, "epoch": 270} {"train_loss": -32.3223783792543, "global_step": 32790, "epoch": 270, "val_loss": 2509101.25} {"train_loss": -33.27992630004883, "global_step": 32791, "epoch": 271} {"train_loss": -33.17522048950195, "global_step": 32792, "epoch": 271} {"train_loss": -33.66584396362305, "global_step": 32793, "epoch": 271} {"train_loss": -32.93857192993164, "global_step": 32794, "epoch": 271} {"train_loss": -32.91520309448242, "global_step": 32795, "epoch": 271} {"train_loss": -33.22015380859375, "global_step": 32796, "epoch": 271} {"train_loss": -33.12615966796875, "global_step": 32797, "epoch": 271} {"train_loss": -32.9180908203125, "global_step": 32798, "epoch": 271} {"train_loss": -33.2299690246582, "global_step": 32799, "epoch": 271} {"train_loss": -32.370845794677734, "global_step": 32800, "epoch": 271} {"train_loss": -32.397396087646484, "global_step": 32801, "epoch": 271} {"train_loss": -32.53596115112305, "global_step": 32802, "epoch": 271} {"train_loss": -32.032527923583984, "global_step": 32803, "epoch": 271} {"train_loss": -31.8685302734375, "global_step": 32804, "epoch": 271} {"train_loss": -32.22140121459961, "global_step": 32805, "epoch": 271} {"train_loss": -32.41608428955078, "global_step": 32806, "epoch": 271} {"train_loss": -31.09610366821289, "global_step": 32807, "epoch": 271} {"train_loss": -32.69966506958008, "global_step": 32808, "epoch": 271} {"train_loss": -32.13572311401367, "global_step": 32809, "epoch": 271} {"train_loss": -32.89466094970703, "global_step": 32810, "epoch": 271} {"train_loss": -32.85471725463867, "global_step": 32811, "epoch": 271} {"train_loss": -32.708553314208984, "global_step": 32812, "epoch": 271} {"train_loss": -32.85396957397461, "global_step": 32813, "epoch": 271} {"train_loss": -32.43010330200195, "global_step": 32814, "epoch": 271} {"train_loss": -33.09397506713867, "global_step": 32815, "epoch": 271} {"train_loss": -32.742347717285156, "global_step": 32816, "epoch": 271} {"train_loss": -32.91035079956055, "global_step": 32817, "epoch": 271} {"train_loss": -32.94986343383789, "global_step": 32818, "epoch": 271} {"train_loss": -31.999181747436523, "global_step": 32819, "epoch": 271} {"train_loss": -31.891340255737305, "global_step": 32820, "epoch": 271} {"train_loss": -31.931543350219727, "global_step": 32821, "epoch": 271} {"train_loss": -32.37455368041992, "global_step": 32822, "epoch": 271} {"train_loss": -32.5455436706543, "global_step": 32823, "epoch": 271} {"train_loss": -32.37632369995117, "global_step": 32824, "epoch": 271} {"train_loss": -30.29071044921875, "global_step": 32825, "epoch": 271} {"train_loss": -30.65557289123535, "global_step": 32826, "epoch": 271} {"train_loss": -32.14133834838867, "global_step": 32827, "epoch": 271} {"train_loss": -32.8538932800293, "global_step": 32828, "epoch": 271} {"train_loss": -31.536230087280273, "global_step": 32829, "epoch": 271} {"train_loss": -32.43381118774414, "global_step": 32830, "epoch": 271} {"train_loss": -32.92752456665039, "global_step": 32831, "epoch": 271} {"train_loss": -32.605377197265625, "global_step": 32832, "epoch": 271} {"train_loss": -33.01789093017578, "global_step": 32833, "epoch": 271} {"train_loss": -33.20515441894531, "global_step": 32834, "epoch": 271} {"train_loss": -33.29561233520508, "global_step": 32835, "epoch": 271} {"train_loss": -33.22829818725586, "global_step": 32836, "epoch": 271} {"train_loss": -33.28875732421875, "global_step": 32837, "epoch": 271} {"train_loss": -32.589454650878906, "global_step": 32838, "epoch": 271} {"train_loss": -32.9438591003418, "global_step": 32839, "epoch": 271} {"train_loss": -32.342159271240234, "global_step": 32840, "epoch": 271} {"train_loss": -30.538604736328125, "global_step": 32841, "epoch": 271} {"train_loss": -33.065834045410156, "global_step": 32842, "epoch": 271} {"train_loss": -32.33821487426758, "global_step": 32843, "epoch": 271} {"train_loss": -29.67380142211914, "global_step": 32844, "epoch": 271} {"train_loss": -33.803558349609375, "global_step": 32845, "epoch": 271} {"train_loss": -30.94488525390625, "global_step": 32846, "epoch": 271} {"train_loss": -33.22532272338867, "global_step": 32847, "epoch": 271} {"train_loss": -30.95973014831543, "global_step": 32848, "epoch": 271} {"train_loss": -32.92139434814453, "global_step": 32849, "epoch": 271} {"train_loss": -33.48686599731445, "global_step": 32850, "epoch": 271} {"train_loss": -31.896976470947266, "global_step": 32851, "epoch": 271} {"train_loss": -33.11787796020508, "global_step": 32852, "epoch": 271} {"train_loss": -32.79043197631836, "global_step": 32853, "epoch": 271} {"train_loss": -32.84940719604492, "global_step": 32854, "epoch": 271} {"train_loss": -32.48335647583008, "global_step": 32855, "epoch": 271} {"train_loss": -33.239967346191406, "global_step": 32856, "epoch": 271} {"train_loss": -33.25204086303711, "global_step": 32857, "epoch": 271} {"train_loss": -33.54810333251953, "global_step": 32858, "epoch": 271} {"train_loss": -33.274871826171875, "global_step": 32859, "epoch": 271} {"train_loss": -33.520790100097656, "global_step": 32860, "epoch": 271} {"train_loss": -33.4981689453125, "global_step": 32861, "epoch": 271} {"train_loss": -33.93929672241211, "global_step": 32862, "epoch": 271} {"train_loss": -33.46389389038086, "global_step": 32863, "epoch": 271} {"train_loss": -32.710968017578125, "global_step": 32864, "epoch": 271} {"train_loss": -32.989253997802734, "global_step": 32865, "epoch": 271} {"train_loss": -33.25225830078125, "global_step": 32866, "epoch": 271} {"train_loss": -32.55141067504883, "global_step": 32867, "epoch": 271} {"train_loss": -32.11867141723633, "global_step": 32868, "epoch": 271} {"train_loss": -33.41330337524414, "global_step": 32869, "epoch": 271} {"train_loss": -33.62262725830078, "global_step": 32870, "epoch": 271} {"train_loss": -33.45237350463867, "global_step": 32871, "epoch": 271} {"train_loss": -32.5996208190918, "global_step": 32872, "epoch": 271} {"train_loss": -32.608062744140625, "global_step": 32873, "epoch": 271} {"train_loss": -33.49665451049805, "global_step": 32874, "epoch": 271} {"train_loss": -33.51545715332031, "global_step": 32875, "epoch": 271} {"train_loss": -33.371089935302734, "global_step": 32876, "epoch": 271} {"train_loss": -33.5787467956543, "global_step": 32877, "epoch": 271} {"train_loss": -34.0781364440918, "global_step": 32878, "epoch": 271} {"train_loss": -33.84501266479492, "global_step": 32879, "epoch": 271} {"train_loss": -32.91060256958008, "global_step": 32880, "epoch": 271} {"train_loss": -31.617279052734375, "global_step": 32881, "epoch": 271} {"train_loss": -30.172119140625, "global_step": 32882, "epoch": 271} {"train_loss": -26.342947006225586, "global_step": 32883, "epoch": 271} {"train_loss": -22.906461715698242, "global_step": 32884, "epoch": 271} {"train_loss": -26.176443099975586, "global_step": 32885, "epoch": 271} {"train_loss": -33.201271057128906, "global_step": 32886, "epoch": 271} {"train_loss": -30.63507080078125, "global_step": 32887, "epoch": 271} {"train_loss": -29.214200973510742, "global_step": 32888, "epoch": 271} {"train_loss": -33.1209602355957, "global_step": 32889, "epoch": 271} {"train_loss": -29.56861686706543, "global_step": 32890, "epoch": 271} {"train_loss": -32.14119338989258, "global_step": 32891, "epoch": 271} {"train_loss": -30.418664932250977, "global_step": 32892, "epoch": 271} {"train_loss": -32.87860107421875, "global_step": 32893, "epoch": 271} {"train_loss": -32.0977783203125, "global_step": 32894, "epoch": 271} {"train_loss": -32.4197998046875, "global_step": 32895, "epoch": 271} {"train_loss": -32.4362907409668, "global_step": 32896, "epoch": 271} {"train_loss": -32.18693542480469, "global_step": 32897, "epoch": 271} {"train_loss": -32.9356803894043, "global_step": 32898, "epoch": 271} {"train_loss": -32.439754486083984, "global_step": 32899, "epoch": 271} {"train_loss": -32.86860275268555, "global_step": 32900, "epoch": 271} {"train_loss": -32.62812423706055, "global_step": 32901, "epoch": 271} {"train_loss": -32.79091262817383, "global_step": 32902, "epoch": 271} {"train_loss": -32.97952651977539, "global_step": 32903, "epoch": 271} {"train_loss": -33.04143142700195, "global_step": 32904, "epoch": 271} {"train_loss": -32.52186965942383, "global_step": 32905, "epoch": 271} {"train_loss": -32.6904296875, "global_step": 32906, "epoch": 271} {"train_loss": -32.206756591796875, "global_step": 32907, "epoch": 271} {"train_loss": -32.79690933227539, "global_step": 32908, "epoch": 271} {"train_loss": -32.771575927734375, "global_step": 32909, "epoch": 271} {"train_loss": -33.10969161987305, "global_step": 32910, "epoch": 271} {"train_loss": -32.40163522515415, "global_step": 32911, "epoch": 271, "val_loss": 2410147.25} {"train_loss": -32.513946533203125, "global_step": 32912, "epoch": 272} {"train_loss": -32.841835021972656, "global_step": 32913, "epoch": 272} {"train_loss": -32.48534393310547, "global_step": 32914, "epoch": 272} {"train_loss": -32.82833480834961, "global_step": 32915, "epoch": 272} {"train_loss": -32.98482131958008, "global_step": 32916, "epoch": 272} {"train_loss": -33.14467239379883, "global_step": 32917, "epoch": 272} {"train_loss": -32.92763900756836, "global_step": 32918, "epoch": 272} {"train_loss": -33.29804229736328, "global_step": 32919, "epoch": 272} {"train_loss": -33.19539260864258, "global_step": 32920, "epoch": 272} {"train_loss": -33.732643127441406, "global_step": 32921, "epoch": 272} {"train_loss": -33.46024703979492, "global_step": 32922, "epoch": 272} {"train_loss": -33.105934143066406, "global_step": 32923, "epoch": 272} {"train_loss": -33.26163864135742, "global_step": 32924, "epoch": 272} {"train_loss": -33.130165100097656, "global_step": 32925, "epoch": 272} {"train_loss": -33.302734375, "global_step": 32926, "epoch": 272} {"train_loss": -33.492794036865234, "global_step": 32927, "epoch": 272} {"train_loss": -33.57156753540039, "global_step": 32928, "epoch": 272} {"train_loss": -33.546749114990234, "global_step": 32929, "epoch": 272} {"train_loss": -33.68549728393555, "global_step": 32930, "epoch": 272} {"train_loss": -33.472896575927734, "global_step": 32931, "epoch": 272} {"train_loss": -33.78165817260742, "global_step": 32932, "epoch": 272} {"train_loss": -33.6807861328125, "global_step": 32933, "epoch": 272} {"train_loss": -33.78915786743164, "global_step": 32934, "epoch": 272} {"train_loss": -33.66950225830078, "global_step": 32935, "epoch": 272} {"train_loss": -33.946311950683594, "global_step": 32936, "epoch": 272} {"train_loss": -34.02009201049805, "global_step": 32937, "epoch": 272} {"train_loss": -33.90395736694336, "global_step": 32938, "epoch": 272} {"train_loss": -33.601219177246094, "global_step": 32939, "epoch": 272} {"train_loss": -33.4937629699707, "global_step": 32940, "epoch": 272} {"train_loss": -33.18043899536133, "global_step": 32941, "epoch": 272} {"train_loss": -31.897491455078125, "global_step": 32942, "epoch": 272} {"train_loss": -29.99799156188965, "global_step": 32943, "epoch": 272} {"train_loss": -28.88115882873535, "global_step": 32944, "epoch": 272} {"train_loss": -29.977521896362305, "global_step": 32945, "epoch": 272} {"train_loss": -32.40359115600586, "global_step": 32946, "epoch": 272} {"train_loss": -33.486183166503906, "global_step": 32947, "epoch": 272} {"train_loss": -32.505714416503906, "global_step": 32948, "epoch": 272} {"train_loss": -32.17007827758789, "global_step": 32949, "epoch": 272} {"train_loss": -33.35337448120117, "global_step": 32950, "epoch": 272} {"train_loss": -32.60990524291992, "global_step": 32951, "epoch": 272} {"train_loss": -32.480804443359375, "global_step": 32952, "epoch": 272} {"train_loss": -33.336151123046875, "global_step": 32953, "epoch": 272} {"train_loss": -32.348575592041016, "global_step": 32954, "epoch": 272} {"train_loss": -32.57546615600586, "global_step": 32955, "epoch": 272} {"train_loss": -33.16162872314453, "global_step": 32956, "epoch": 272} {"train_loss": -32.46561050415039, "global_step": 32957, "epoch": 272} {"train_loss": -32.951229095458984, "global_step": 32958, "epoch": 272} {"train_loss": -33.12453842163086, "global_step": 32959, "epoch": 272} {"train_loss": -33.27149963378906, "global_step": 32960, "epoch": 272} {"train_loss": -33.351680755615234, "global_step": 32961, "epoch": 272} {"train_loss": -32.69923782348633, "global_step": 32962, "epoch": 272} {"train_loss": -33.5142936706543, "global_step": 32963, "epoch": 272} {"train_loss": -31.705530166625977, "global_step": 32964, "epoch": 272} {"train_loss": -33.12824630737305, "global_step": 32965, "epoch": 272} {"train_loss": -31.8537654876709, "global_step": 32966, "epoch": 272} {"train_loss": -32.62202072143555, "global_step": 32967, "epoch": 272} {"train_loss": -32.577980041503906, "global_step": 32968, "epoch": 272} {"train_loss": -32.48760986328125, "global_step": 32969, "epoch": 272} {"train_loss": -32.891639709472656, "global_step": 32970, "epoch": 272} {"train_loss": -33.1279182434082, "global_step": 32971, "epoch": 272} {"train_loss": -33.0151252746582, "global_step": 32972, "epoch": 272} {"train_loss": -32.791969299316406, "global_step": 32973, "epoch": 272} {"train_loss": -32.791358947753906, "global_step": 32974, "epoch": 272} {"train_loss": -33.051204681396484, "global_step": 32975, "epoch": 272} {"train_loss": -33.11672592163086, "global_step": 32976, "epoch": 272} {"train_loss": -33.327613830566406, "global_step": 32977, "epoch": 272} {"train_loss": -31.66183853149414, "global_step": 32978, "epoch": 272} {"train_loss": -31.715076446533203, "global_step": 32979, "epoch": 272} {"train_loss": -31.9980525970459, "global_step": 32980, "epoch": 272} {"train_loss": -33.3687858581543, "global_step": 32981, "epoch": 272} {"train_loss": -32.95156478881836, "global_step": 32982, "epoch": 272} {"train_loss": -33.40553665161133, "global_step": 32983, "epoch": 272} {"train_loss": -33.027488708496094, "global_step": 32984, "epoch": 272} {"train_loss": -33.68100357055664, "global_step": 32985, "epoch": 272} {"train_loss": -33.35715866088867, "global_step": 32986, "epoch": 272} {"train_loss": -33.58552932739258, "global_step": 32987, "epoch": 272} {"train_loss": -33.77203369140625, "global_step": 32988, "epoch": 272} {"train_loss": -33.97695541381836, "global_step": 32989, "epoch": 272} {"train_loss": -33.390846252441406, "global_step": 32990, "epoch": 272} {"train_loss": -33.91083526611328, "global_step": 32991, "epoch": 272} {"train_loss": -33.87235641479492, "global_step": 32992, "epoch": 272} {"train_loss": -33.67307662963867, "global_step": 32993, "epoch": 272} {"train_loss": -33.87147903442383, "global_step": 32994, "epoch": 272} {"train_loss": -34.11860275268555, "global_step": 32995, "epoch": 272} {"train_loss": -34.140525817871094, "global_step": 32996, "epoch": 272} {"train_loss": -33.9080810546875, "global_step": 32997, "epoch": 272} {"train_loss": -34.00366973876953, "global_step": 32998, "epoch": 272} {"train_loss": -34.14427947998047, "global_step": 32999, "epoch": 272} {"train_loss": -34.224727630615234, "global_step": 33000, "epoch": 272} {"train_loss": -34.07429122924805, "global_step": 33001, "epoch": 272} {"train_loss": -34.0738639831543, "global_step": 33002, "epoch": 272} {"train_loss": -33.95869064331055, "global_step": 33003, "epoch": 272} {"train_loss": -33.57902145385742, "global_step": 33004, "epoch": 272} {"train_loss": -33.85357666015625, "global_step": 33005, "epoch": 272} {"train_loss": -33.94911575317383, "global_step": 33006, "epoch": 272} {"train_loss": -33.7504997253418, "global_step": 33007, "epoch": 272} {"train_loss": -33.916412353515625, "global_step": 33008, "epoch": 272} {"train_loss": -33.28512191772461, "global_step": 33009, "epoch": 272} {"train_loss": -33.23337936401367, "global_step": 33010, "epoch": 272} {"train_loss": -31.725067138671875, "global_step": 33011, "epoch": 272} {"train_loss": -32.444393157958984, "global_step": 33012, "epoch": 272} {"train_loss": -33.85203552246094, "global_step": 33013, "epoch": 272} {"train_loss": -33.319854736328125, "global_step": 33014, "epoch": 272} {"train_loss": -33.652122497558594, "global_step": 33015, "epoch": 272} {"train_loss": -33.05540084838867, "global_step": 33016, "epoch": 272} {"train_loss": -33.60248947143555, "global_step": 33017, "epoch": 272} {"train_loss": -32.480316162109375, "global_step": 33018, "epoch": 272} {"train_loss": -32.90937805175781, "global_step": 33019, "epoch": 272} {"train_loss": -32.79453659057617, "global_step": 33020, "epoch": 272} {"train_loss": -32.7658576965332, "global_step": 33021, "epoch": 272} {"train_loss": -33.82587814331055, "global_step": 33022, "epoch": 272} {"train_loss": -33.40257263183594, "global_step": 33023, "epoch": 272} {"train_loss": -33.30270004272461, "global_step": 33024, "epoch": 272} {"train_loss": -33.41067123413086, "global_step": 33025, "epoch": 272} {"train_loss": -33.29676055908203, "global_step": 33026, "epoch": 272} {"train_loss": -32.982051849365234, "global_step": 33027, "epoch": 272} {"train_loss": -33.09695816040039, "global_step": 33028, "epoch": 272} {"train_loss": -33.23234558105469, "global_step": 33029, "epoch": 272} {"train_loss": -32.778438568115234, "global_step": 33030, "epoch": 272} {"train_loss": -32.72966384887695, "global_step": 33031, "epoch": 272} {"train_loss": -33.11551442422157, "global_step": 33032, "epoch": 272, "val_loss": 2520391.0} {"train_loss": -32.81635284423828, "global_step": 33033, "epoch": 273} {"train_loss": -32.65957260131836, "global_step": 33034, "epoch": 273} {"train_loss": -32.67483139038086, "global_step": 33035, "epoch": 273} {"train_loss": -32.93516540527344, "global_step": 33036, "epoch": 273} {"train_loss": -32.107112884521484, "global_step": 33037, "epoch": 273} {"train_loss": -31.540420532226562, "global_step": 33038, "epoch": 273} {"train_loss": -31.432775497436523, "global_step": 33039, "epoch": 273} {"train_loss": -31.869586944580078, "global_step": 33040, "epoch": 273} {"train_loss": -33.0406494140625, "global_step": 33041, "epoch": 273} {"train_loss": -32.879695892333984, "global_step": 33042, "epoch": 273} {"train_loss": -32.649192810058594, "global_step": 33043, "epoch": 273} {"train_loss": -32.48521041870117, "global_step": 33044, "epoch": 273} {"train_loss": -32.064453125, "global_step": 33045, "epoch": 273} {"train_loss": -32.61134719848633, "global_step": 33046, "epoch": 273} {"train_loss": -31.180692672729492, "global_step": 33047, "epoch": 273} {"train_loss": -30.254281997680664, "global_step": 33048, "epoch": 273} {"train_loss": -28.48676872253418, "global_step": 33049, "epoch": 273} {"train_loss": -29.265241622924805, "global_step": 33050, "epoch": 273} {"train_loss": -30.571985244750977, "global_step": 33051, "epoch": 273} {"train_loss": -31.992101669311523, "global_step": 33052, "epoch": 273} {"train_loss": -32.91092300415039, "global_step": 33053, "epoch": 273} {"train_loss": -32.735595703125, "global_step": 33054, "epoch": 273} {"train_loss": -32.9417724609375, "global_step": 33055, "epoch": 273} {"train_loss": -33.18777847290039, "global_step": 33056, "epoch": 273} {"train_loss": -32.67987823486328, "global_step": 33057, "epoch": 273} {"train_loss": -33.423763275146484, "global_step": 33058, "epoch": 273} {"train_loss": -33.59534454345703, "global_step": 33059, "epoch": 273} {"train_loss": -33.81691360473633, "global_step": 33060, "epoch": 273} {"train_loss": -31.64112663269043, "global_step": 33061, "epoch": 273} {"train_loss": -33.33994674682617, "global_step": 33062, "epoch": 273} {"train_loss": -33.1224250793457, "global_step": 33063, "epoch": 273} {"train_loss": -32.38142013549805, "global_step": 33064, "epoch": 273} {"train_loss": -32.6487922668457, "global_step": 33065, "epoch": 273} {"train_loss": -33.454219818115234, "global_step": 33066, "epoch": 273} {"train_loss": -33.89977264404297, "global_step": 33067, "epoch": 273} {"train_loss": -33.067562103271484, "global_step": 33068, "epoch": 273} {"train_loss": -33.46993637084961, "global_step": 33069, "epoch": 273} {"train_loss": -33.55432891845703, "global_step": 33070, "epoch": 273} {"train_loss": -33.244319915771484, "global_step": 33071, "epoch": 273} {"train_loss": -33.668861389160156, "global_step": 33072, "epoch": 273} {"train_loss": -32.700164794921875, "global_step": 33073, "epoch": 273} {"train_loss": -33.30044174194336, "global_step": 33074, "epoch": 273} {"train_loss": -32.17460250854492, "global_step": 33075, "epoch": 273} {"train_loss": -33.1929931640625, "global_step": 33076, "epoch": 273} {"train_loss": -30.94512939453125, "global_step": 33077, "epoch": 273} {"train_loss": -29.988494873046875, "global_step": 33078, "epoch": 273} {"train_loss": -32.02945327758789, "global_step": 33079, "epoch": 273} {"train_loss": -31.61335563659668, "global_step": 33080, "epoch": 273} {"train_loss": -30.396926879882812, "global_step": 33081, "epoch": 273} {"train_loss": -32.63364791870117, "global_step": 33082, "epoch": 273} {"train_loss": -32.2459716796875, "global_step": 33083, "epoch": 273} {"train_loss": -32.98517608642578, "global_step": 33084, "epoch": 273} {"train_loss": -33.0249137878418, "global_step": 33085, "epoch": 273} {"train_loss": -33.401405334472656, "global_step": 33086, "epoch": 273} {"train_loss": -32.32542419433594, "global_step": 33087, "epoch": 273} {"train_loss": -33.25053024291992, "global_step": 33088, "epoch": 273} {"train_loss": -32.61884689331055, "global_step": 33089, "epoch": 273} {"train_loss": -33.6832160949707, "global_step": 33090, "epoch": 273} {"train_loss": -32.58066940307617, "global_step": 33091, "epoch": 273} {"train_loss": -33.57341384887695, "global_step": 33092, "epoch": 273} {"train_loss": -33.17844772338867, "global_step": 33093, "epoch": 273} {"train_loss": -32.87819290161133, "global_step": 33094, "epoch": 273} {"train_loss": -33.04220199584961, "global_step": 33095, "epoch": 273} {"train_loss": -34.326168060302734, "global_step": 33096, "epoch": 273} {"train_loss": -33.47053909301758, "global_step": 33097, "epoch": 273} {"train_loss": -32.950653076171875, "global_step": 33098, "epoch": 273} {"train_loss": -31.279462814331055, "global_step": 33099, "epoch": 273} {"train_loss": -28.476205825805664, "global_step": 33100, "epoch": 273} {"train_loss": -21.99934196472168, "global_step": 33101, "epoch": 273} {"train_loss": -17.848678588867188, "global_step": 33102, "epoch": 273} {"train_loss": -32.855403900146484, "global_step": 33103, "epoch": 273} {"train_loss": -25.561870574951172, "global_step": 33104, "epoch": 273} {"train_loss": -25.955265045166016, "global_step": 33105, "epoch": 273} {"train_loss": -28.83893394470215, "global_step": 33106, "epoch": 273} {"train_loss": -29.69954490661621, "global_step": 33107, "epoch": 273} {"train_loss": -27.102277755737305, "global_step": 33108, "epoch": 273} {"train_loss": -32.60585403442383, "global_step": 33109, "epoch": 273} {"train_loss": -30.378454208374023, "global_step": 33110, "epoch": 273} {"train_loss": -29.374059677124023, "global_step": 33111, "epoch": 273} {"train_loss": -32.725250244140625, "global_step": 33112, "epoch": 273} {"train_loss": -31.546411514282227, "global_step": 33113, "epoch": 273} {"train_loss": -29.930078506469727, "global_step": 33114, "epoch": 273} {"train_loss": -31.4754695892334, "global_step": 33115, "epoch": 273} {"train_loss": -32.80817794799805, "global_step": 33116, "epoch": 273} {"train_loss": -31.989490509033203, "global_step": 33117, "epoch": 273} {"train_loss": -31.345258712768555, "global_step": 33118, "epoch": 273} {"train_loss": -31.38823890686035, "global_step": 33119, "epoch": 273} {"train_loss": -32.24288558959961, "global_step": 33120, "epoch": 273} {"train_loss": -32.553009033203125, "global_step": 33121, "epoch": 273} {"train_loss": -31.59852409362793, "global_step": 33122, "epoch": 273} {"train_loss": -31.56830406188965, "global_step": 33123, "epoch": 273} {"train_loss": -31.98443031311035, "global_step": 33124, "epoch": 273} {"train_loss": -32.240447998046875, "global_step": 33125, "epoch": 273} {"train_loss": -32.66777038574219, "global_step": 33126, "epoch": 273} {"train_loss": -32.80978012084961, "global_step": 33127, "epoch": 273} {"train_loss": -32.631099700927734, "global_step": 33128, "epoch": 273} {"train_loss": -32.31875228881836, "global_step": 33129, "epoch": 273} {"train_loss": -32.59260940551758, "global_step": 33130, "epoch": 273} {"train_loss": -33.02228927612305, "global_step": 33131, "epoch": 273} {"train_loss": -32.79970932006836, "global_step": 33132, "epoch": 273} {"train_loss": -32.77980041503906, "global_step": 33133, "epoch": 273} {"train_loss": -32.74753952026367, "global_step": 33134, "epoch": 273} {"train_loss": -32.753143310546875, "global_step": 33135, "epoch": 273} {"train_loss": -32.70173263549805, "global_step": 33136, "epoch": 273} {"train_loss": -33.23686599731445, "global_step": 33137, "epoch": 273} {"train_loss": -32.709083557128906, "global_step": 33138, "epoch": 273} {"train_loss": -31.93244743347168, "global_step": 33139, "epoch": 273} {"train_loss": -33.14078903198242, "global_step": 33140, "epoch": 273} {"train_loss": -33.020835876464844, "global_step": 33141, "epoch": 273} {"train_loss": -33.01386642456055, "global_step": 33142, "epoch": 273} {"train_loss": -32.95216369628906, "global_step": 33143, "epoch": 273} {"train_loss": -33.06284713745117, "global_step": 33144, "epoch": 273} {"train_loss": -32.6671257019043, "global_step": 33145, "epoch": 273} {"train_loss": -33.229732513427734, "global_step": 33146, "epoch": 273} {"train_loss": -33.09501266479492, "global_step": 33147, "epoch": 273} {"train_loss": -33.220821380615234, "global_step": 33148, "epoch": 273} {"train_loss": -32.958492279052734, "global_step": 33149, "epoch": 273} {"train_loss": -33.30315399169922, "global_step": 33150, "epoch": 273} {"train_loss": -33.3282356262207, "global_step": 33151, "epoch": 273} {"train_loss": -32.51286697387695, "global_step": 33152, "epoch": 273} {"train_loss": -32.01733117852329, "global_step": 33153, "epoch": 273, "val_loss": 2711754.0} {"train_loss": -33.15179443359375, "global_step": 33154, "epoch": 274} {"train_loss": -33.100826263427734, "global_step": 33155, "epoch": 274} {"train_loss": -33.131866455078125, "global_step": 33156, "epoch": 274} {"train_loss": -32.06800842285156, "global_step": 33157, "epoch": 274} {"train_loss": -33.42580032348633, "global_step": 33158, "epoch": 274} {"train_loss": -33.10419845581055, "global_step": 33159, "epoch": 274} {"train_loss": -33.25289535522461, "global_step": 33160, "epoch": 274} {"train_loss": -32.77961349487305, "global_step": 33161, "epoch": 274} {"train_loss": -33.02922439575195, "global_step": 33162, "epoch": 274} {"train_loss": -32.86057662963867, "global_step": 33163, "epoch": 274} {"train_loss": -33.270450592041016, "global_step": 33164, "epoch": 274} {"train_loss": -33.1912841796875, "global_step": 33165, "epoch": 274} {"train_loss": -33.20235824584961, "global_step": 33166, "epoch": 274} {"train_loss": -32.41984939575195, "global_step": 33167, "epoch": 274} {"train_loss": -32.36786651611328, "global_step": 33168, "epoch": 274} {"train_loss": -32.50222396850586, "global_step": 33169, "epoch": 274} {"train_loss": -31.935998916625977, "global_step": 33170, "epoch": 274} {"train_loss": -29.646686553955078, "global_step": 33171, "epoch": 274} {"train_loss": -21.65521812438965, "global_step": 33172, "epoch": 274} {"train_loss": -5.894900798797607, "global_step": 33173, "epoch": 274} {"train_loss": -5.282708644866943, "global_step": 33174, "epoch": 274} {"train_loss": -30.44732666015625, "global_step": 33175, "epoch": 274} {"train_loss": -24.307157516479492, "global_step": 33176, "epoch": 274} {"train_loss": -30.9307861328125, "global_step": 33177, "epoch": 274} {"train_loss": -23.4760799407959, "global_step": 33178, "epoch": 274} {"train_loss": -31.83091163635254, "global_step": 33179, "epoch": 274} {"train_loss": -29.015432357788086, "global_step": 33180, "epoch": 274} {"train_loss": -29.004108428955078, "global_step": 33181, "epoch": 274} {"train_loss": -32.10744094848633, "global_step": 33182, "epoch": 274} {"train_loss": -30.404743194580078, "global_step": 33183, "epoch": 274} {"train_loss": -29.583892822265625, "global_step": 33184, "epoch": 274} {"train_loss": -31.30552101135254, "global_step": 33185, "epoch": 274} {"train_loss": -31.7119140625, "global_step": 33186, "epoch": 274} {"train_loss": -30.798572540283203, "global_step": 33187, "epoch": 274} {"train_loss": -30.549646377563477, "global_step": 33188, "epoch": 274} {"train_loss": -31.258310317993164, "global_step": 33189, "epoch": 274} {"train_loss": -31.87127685546875, "global_step": 33190, "epoch": 274} {"train_loss": -32.20269775390625, "global_step": 33191, "epoch": 274} {"train_loss": -31.984548568725586, "global_step": 33192, "epoch": 274} {"train_loss": -31.24088478088379, "global_step": 33193, "epoch": 274} {"train_loss": -31.659467697143555, "global_step": 33194, "epoch": 274} {"train_loss": -31.666553497314453, "global_step": 33195, "epoch": 274} {"train_loss": -31.906522750854492, "global_step": 33196, "epoch": 274} {"train_loss": -32.52815246582031, "global_step": 33197, "epoch": 274} {"train_loss": -32.19672393798828, "global_step": 33198, "epoch": 274} {"train_loss": -32.02044677734375, "global_step": 33199, "epoch": 274} {"train_loss": -32.40517807006836, "global_step": 33200, "epoch": 274} {"train_loss": -31.945392608642578, "global_step": 33201, "epoch": 274} {"train_loss": -32.55970764160156, "global_step": 33202, "epoch": 274} {"train_loss": -32.65940856933594, "global_step": 33203, "epoch": 274} {"train_loss": -32.51879119873047, "global_step": 33204, "epoch": 274} {"train_loss": -32.73291015625, "global_step": 33205, "epoch": 274} {"train_loss": -32.9930534362793, "global_step": 33206, "epoch": 274} {"train_loss": -32.464481353759766, "global_step": 33207, "epoch": 274} {"train_loss": -32.45195770263672, "global_step": 33208, "epoch": 274} {"train_loss": -32.933074951171875, "global_step": 33209, "epoch": 274} {"train_loss": -32.44635772705078, "global_step": 33210, "epoch": 274} {"train_loss": -32.84485626220703, "global_step": 33211, "epoch": 274} {"train_loss": -32.82891845703125, "global_step": 33212, "epoch": 274} {"train_loss": -32.83829116821289, "global_step": 33213, "epoch": 274} {"train_loss": -32.81501007080078, "global_step": 33214, "epoch": 274} {"train_loss": -33.04166793823242, "global_step": 33215, "epoch": 274} {"train_loss": -33.001861572265625, "global_step": 33216, "epoch": 274} {"train_loss": -32.89516830444336, "global_step": 33217, "epoch": 274} {"train_loss": -32.898193359375, "global_step": 33218, "epoch": 274} {"train_loss": -32.1005744934082, "global_step": 33219, "epoch": 274} {"train_loss": -32.717506408691406, "global_step": 33220, "epoch": 274} {"train_loss": -33.28426742553711, "global_step": 33221, "epoch": 274} {"train_loss": -32.80366134643555, "global_step": 33222, "epoch": 274} {"train_loss": -32.82122039794922, "global_step": 33223, "epoch": 274} {"train_loss": -32.99917221069336, "global_step": 33224, "epoch": 274} {"train_loss": -32.98734664916992, "global_step": 33225, "epoch": 274} {"train_loss": -32.67937088012695, "global_step": 33226, "epoch": 274} {"train_loss": -32.61542510986328, "global_step": 33227, "epoch": 274} {"train_loss": -32.76702880859375, "global_step": 33228, "epoch": 274} {"train_loss": -31.061182022094727, "global_step": 33229, "epoch": 274} {"train_loss": -33.494361877441406, "global_step": 33230, "epoch": 274} {"train_loss": -30.5832462310791, "global_step": 33231, "epoch": 274} {"train_loss": -31.4051456451416, "global_step": 33232, "epoch": 274} {"train_loss": -31.780248641967773, "global_step": 33233, "epoch": 274} {"train_loss": -30.56467056274414, "global_step": 33234, "epoch": 274} {"train_loss": -30.81381607055664, "global_step": 33235, "epoch": 274} {"train_loss": -29.896503448486328, "global_step": 33236, "epoch": 274} {"train_loss": -27.370838165283203, "global_step": 33237, "epoch": 274} {"train_loss": -27.3041934967041, "global_step": 33238, "epoch": 274} {"train_loss": -29.28220558166504, "global_step": 33239, "epoch": 274} {"train_loss": -28.86528968811035, "global_step": 33240, "epoch": 274} {"train_loss": -29.969757080078125, "global_step": 33241, "epoch": 274} {"train_loss": -29.784351348876953, "global_step": 33242, "epoch": 274} {"train_loss": -30.568634033203125, "global_step": 33243, "epoch": 274} {"train_loss": -29.533111572265625, "global_step": 33244, "epoch": 274} {"train_loss": -31.275278091430664, "global_step": 33245, "epoch": 274} {"train_loss": -30.262149810791016, "global_step": 33246, "epoch": 274} {"train_loss": -31.410337448120117, "global_step": 33247, "epoch": 274} {"train_loss": -30.5033016204834, "global_step": 33248, "epoch": 274} {"train_loss": -31.257495880126953, "global_step": 33249, "epoch": 274} {"train_loss": -30.991968154907227, "global_step": 33250, "epoch": 274} {"train_loss": -30.811376571655273, "global_step": 33251, "epoch": 274} {"train_loss": -31.39521598815918, "global_step": 33252, "epoch": 274} {"train_loss": -30.899728775024414, "global_step": 33253, "epoch": 274} {"train_loss": -31.299840927124023, "global_step": 33254, "epoch": 274} {"train_loss": -31.584716796875, "global_step": 33255, "epoch": 274} {"train_loss": -31.89716911315918, "global_step": 33256, "epoch": 274} {"train_loss": -31.76203727722168, "global_step": 33257, "epoch": 274} {"train_loss": -31.32270622253418, "global_step": 33258, "epoch": 274} {"train_loss": -31.530012130737305, "global_step": 33259, "epoch": 274} {"train_loss": -31.15475845336914, "global_step": 33260, "epoch": 274} {"train_loss": -31.64784812927246, "global_step": 33261, "epoch": 274} {"train_loss": -31.927946090698242, "global_step": 33262, "epoch": 274} {"train_loss": -31.51557731628418, "global_step": 33263, "epoch": 274} {"train_loss": -31.59979820251465, "global_step": 33264, "epoch": 274} {"train_loss": -31.976354598999023, "global_step": 33265, "epoch": 274} {"train_loss": -31.3641414642334, "global_step": 33266, "epoch": 274} {"train_loss": -30.963470458984375, "global_step": 33267, "epoch": 274} {"train_loss": -31.64149284362793, "global_step": 33268, "epoch": 274} {"train_loss": -32.177642822265625, "global_step": 33269, "epoch": 274} {"train_loss": -32.03275680541992, "global_step": 33270, "epoch": 274} {"train_loss": -31.483612060546875, "global_step": 33271, "epoch": 274} {"train_loss": -32.01860427856445, "global_step": 33272, "epoch": 274} {"train_loss": -31.663137435913086, "global_step": 33273, "epoch": 274} {"train_loss": -31.086210999607054, "global_step": 33274, "epoch": 274, "val_loss": 2500911.75} {"train_loss": -31.5394344329834, "global_step": 33275, "epoch": 275} {"train_loss": -29.36153221130371, "global_step": 33276, "epoch": 275} {"train_loss": -27.351058959960938, "global_step": 33277, "epoch": 275} {"train_loss": -30.157094955444336, "global_step": 33278, "epoch": 275} {"train_loss": -30.889331817626953, "global_step": 33279, "epoch": 275} {"train_loss": -28.79999351501465, "global_step": 33280, "epoch": 275} {"train_loss": -28.931365966796875, "global_step": 33281, "epoch": 275} {"train_loss": -29.688642501831055, "global_step": 33282, "epoch": 275} {"train_loss": -28.566923141479492, "global_step": 33283, "epoch": 275} {"train_loss": -32.02631759643555, "global_step": 33284, "epoch": 275} {"train_loss": -30.638671875, "global_step": 33285, "epoch": 275} {"train_loss": -30.164575576782227, "global_step": 33286, "epoch": 275} {"train_loss": -31.250442504882812, "global_step": 33287, "epoch": 275} {"train_loss": -32.29725646972656, "global_step": 33288, "epoch": 275} {"train_loss": -31.575464248657227, "global_step": 33289, "epoch": 275} {"train_loss": -31.419830322265625, "global_step": 33290, "epoch": 275} {"train_loss": -30.68189811706543, "global_step": 33291, "epoch": 275} {"train_loss": -31.957921981811523, "global_step": 33292, "epoch": 275} {"train_loss": -32.42716598510742, "global_step": 33293, "epoch": 275} {"train_loss": -32.56877136230469, "global_step": 33294, "epoch": 275} {"train_loss": -32.23486328125, "global_step": 33295, "epoch": 275} {"train_loss": -32.377471923828125, "global_step": 33296, "epoch": 275} {"train_loss": -32.02859115600586, "global_step": 33297, "epoch": 275} {"train_loss": -31.50628662109375, "global_step": 33298, "epoch": 275} {"train_loss": -32.04011154174805, "global_step": 33299, "epoch": 275} {"train_loss": -31.80755615234375, "global_step": 33300, "epoch": 275} {"train_loss": -32.39299392700195, "global_step": 33301, "epoch": 275} {"train_loss": -32.566410064697266, "global_step": 33302, "epoch": 275} {"train_loss": -32.4310302734375, "global_step": 33303, "epoch": 275} {"train_loss": -32.78607177734375, "global_step": 33304, "epoch": 275} {"train_loss": -32.340084075927734, "global_step": 33305, "epoch": 275} {"train_loss": -31.941852569580078, "global_step": 33306, "epoch": 275} {"train_loss": -32.569969177246094, "global_step": 33307, "epoch": 275} {"train_loss": -32.15592575073242, "global_step": 33308, "epoch": 275} {"train_loss": -32.14408493041992, "global_step": 33309, "epoch": 275} {"train_loss": -32.455989837646484, "global_step": 33310, "epoch": 275} {"train_loss": -32.2252311706543, "global_step": 33311, "epoch": 275} {"train_loss": -31.75701904296875, "global_step": 33312, "epoch": 275} {"train_loss": -32.23582077026367, "global_step": 33313, "epoch": 275} {"train_loss": -32.18589401245117, "global_step": 33314, "epoch": 275} {"train_loss": -30.785419464111328, "global_step": 33315, "epoch": 275} {"train_loss": -31.51590919494629, "global_step": 33316, "epoch": 275} {"train_loss": -32.1149787902832, "global_step": 33317, "epoch": 275} {"train_loss": -32.67119216918945, "global_step": 33318, "epoch": 275} {"train_loss": -32.320404052734375, "global_step": 33319, "epoch": 275} {"train_loss": -32.26909255981445, "global_step": 33320, "epoch": 275} {"train_loss": -32.47404479980469, "global_step": 33321, "epoch": 275} {"train_loss": -32.277462005615234, "global_step": 33322, "epoch": 275} {"train_loss": -32.66115951538086, "global_step": 33323, "epoch": 275} {"train_loss": -32.93528747558594, "global_step": 33324, "epoch": 275} {"train_loss": -33.23029708862305, "global_step": 33325, "epoch": 275} {"train_loss": -32.41831588745117, "global_step": 33326, "epoch": 275} {"train_loss": -32.762062072753906, "global_step": 33327, "epoch": 275} {"train_loss": -32.84215545654297, "global_step": 33328, "epoch": 275} {"train_loss": -33.08339309692383, "global_step": 33329, "epoch": 275} {"train_loss": -32.91090393066406, "global_step": 33330, "epoch": 275} {"train_loss": -33.12928771972656, "global_step": 33331, "epoch": 275} {"train_loss": -33.124290466308594, "global_step": 33332, "epoch": 275} {"train_loss": -33.004005432128906, "global_step": 33333, "epoch": 275} {"train_loss": -33.458072662353516, "global_step": 33334, "epoch": 275} {"train_loss": -33.485618591308594, "global_step": 33335, "epoch": 275} {"train_loss": -33.338497161865234, "global_step": 33336, "epoch": 275} {"train_loss": -33.07289505004883, "global_step": 33337, "epoch": 275} {"train_loss": -33.1872673034668, "global_step": 33338, "epoch": 275} {"train_loss": -33.39982986450195, "global_step": 33339, "epoch": 275} {"train_loss": -33.21506881713867, "global_step": 33340, "epoch": 275} {"train_loss": -32.94150924682617, "global_step": 33341, "epoch": 275} {"train_loss": -33.163848876953125, "global_step": 33342, "epoch": 275} {"train_loss": -33.282379150390625, "global_step": 33343, "epoch": 275} {"train_loss": -33.55562210083008, "global_step": 33344, "epoch": 275} {"train_loss": -33.28243637084961, "global_step": 33345, "epoch": 275} {"train_loss": -33.12477493286133, "global_step": 33346, "epoch": 275} {"train_loss": -33.76887893676758, "global_step": 33347, "epoch": 275} {"train_loss": -33.153621673583984, "global_step": 33348, "epoch": 275} {"train_loss": -33.44231033325195, "global_step": 33349, "epoch": 275} {"train_loss": -33.336830139160156, "global_step": 33350, "epoch": 275} {"train_loss": -33.35145950317383, "global_step": 33351, "epoch": 275} {"train_loss": -33.52700424194336, "global_step": 33352, "epoch": 275} {"train_loss": -33.48989486694336, "global_step": 33353, "epoch": 275} {"train_loss": -33.63418197631836, "global_step": 33354, "epoch": 275} {"train_loss": -33.55534362792969, "global_step": 33355, "epoch": 275} {"train_loss": -33.64998245239258, "global_step": 33356, "epoch": 275} {"train_loss": -33.47737503051758, "global_step": 33357, "epoch": 275} {"train_loss": -33.431793212890625, "global_step": 33358, "epoch": 275} {"train_loss": -32.88631057739258, "global_step": 33359, "epoch": 275} {"train_loss": -32.79377746582031, "global_step": 33360, "epoch": 275} {"train_loss": -32.87273025512695, "global_step": 33361, "epoch": 275} {"train_loss": -33.07509994506836, "global_step": 33362, "epoch": 275} {"train_loss": -33.53715133666992, "global_step": 33363, "epoch": 275} {"train_loss": -33.35065841674805, "global_step": 33364, "epoch": 275} {"train_loss": -32.799835205078125, "global_step": 33365, "epoch": 275} {"train_loss": -32.80550003051758, "global_step": 33366, "epoch": 275} {"train_loss": -30.797483444213867, "global_step": 33367, "epoch": 275} {"train_loss": -28.036588668823242, "global_step": 33368, "epoch": 275} {"train_loss": -27.576894760131836, "global_step": 33369, "epoch": 275} {"train_loss": -31.77988052368164, "global_step": 33370, "epoch": 275} {"train_loss": -32.609554290771484, "global_step": 33371, "epoch": 275} {"train_loss": -30.5347900390625, "global_step": 33372, "epoch": 275} {"train_loss": -32.60523223876953, "global_step": 33373, "epoch": 275} {"train_loss": -32.55373764038086, "global_step": 33374, "epoch": 275} {"train_loss": -31.721282958984375, "global_step": 33375, "epoch": 275} {"train_loss": -33.253570556640625, "global_step": 33376, "epoch": 275} {"train_loss": -32.111690521240234, "global_step": 33377, "epoch": 275} {"train_loss": -32.479461669921875, "global_step": 33378, "epoch": 275} {"train_loss": -31.654081344604492, "global_step": 33379, "epoch": 275} {"train_loss": -33.11129379272461, "global_step": 33380, "epoch": 275} {"train_loss": -32.01201629638672, "global_step": 33381, "epoch": 275} {"train_loss": -32.25407791137695, "global_step": 33382, "epoch": 275} {"train_loss": -32.34768295288086, "global_step": 33383, "epoch": 275} {"train_loss": -33.137569427490234, "global_step": 33384, "epoch": 275} {"train_loss": -32.732879638671875, "global_step": 33385, "epoch": 275} {"train_loss": -32.64120101928711, "global_step": 33386, "epoch": 275} {"train_loss": -31.923721313476562, "global_step": 33387, "epoch": 275} {"train_loss": -32.874542236328125, "global_step": 33388, "epoch": 275} {"train_loss": -32.471046447753906, "global_step": 33389, "epoch": 275} {"train_loss": -31.7335205078125, "global_step": 33390, "epoch": 275} {"train_loss": -33.0107421875, "global_step": 33391, "epoch": 275} {"train_loss": -32.37525939941406, "global_step": 33392, "epoch": 275} {"train_loss": -33.142642974853516, "global_step": 33393, "epoch": 275} {"train_loss": -32.6927490234375, "global_step": 33394, "epoch": 275} {"train_loss": -32.250553966553746, "global_step": 33395, "epoch": 275, "val_loss": 2554882.25} {"train_loss": -32.321533203125, "global_step": 33396, "epoch": 276} {"train_loss": -32.42256164550781, "global_step": 33397, "epoch": 276} {"train_loss": -32.92560958862305, "global_step": 33398, "epoch": 276} {"train_loss": -32.4290885925293, "global_step": 33399, "epoch": 276} {"train_loss": -32.27187728881836, "global_step": 33400, "epoch": 276} {"train_loss": -33.11334991455078, "global_step": 33401, "epoch": 276} {"train_loss": -31.45380210876465, "global_step": 33402, "epoch": 276} {"train_loss": -32.89186477661133, "global_step": 33403, "epoch": 276} {"train_loss": -32.98796463012695, "global_step": 33404, "epoch": 276} {"train_loss": -32.5744743347168, "global_step": 33405, "epoch": 276} {"train_loss": -33.35295104980469, "global_step": 33406, "epoch": 276} {"train_loss": -33.21061325073242, "global_step": 33407, "epoch": 276} {"train_loss": -32.891578674316406, "global_step": 33408, "epoch": 276} {"train_loss": -32.26885986328125, "global_step": 33409, "epoch": 276} {"train_loss": -33.13355255126953, "global_step": 33410, "epoch": 276} {"train_loss": -32.586605072021484, "global_step": 33411, "epoch": 276} {"train_loss": -32.822505950927734, "global_step": 33412, "epoch": 276} {"train_loss": -32.72780990600586, "global_step": 33413, "epoch": 276} {"train_loss": -33.14178466796875, "global_step": 33414, "epoch": 276} {"train_loss": -33.06599807739258, "global_step": 33415, "epoch": 276} {"train_loss": -33.3378791809082, "global_step": 33416, "epoch": 276} {"train_loss": -33.09914016723633, "global_step": 33417, "epoch": 276} {"train_loss": -33.44553756713867, "global_step": 33418, "epoch": 276} {"train_loss": -33.105506896972656, "global_step": 33419, "epoch": 276} {"train_loss": -32.799110412597656, "global_step": 33420, "epoch": 276} {"train_loss": -33.477169036865234, "global_step": 33421, "epoch": 276} {"train_loss": -32.83481979370117, "global_step": 33422, "epoch": 276} {"train_loss": -32.85085678100586, "global_step": 33423, "epoch": 276} {"train_loss": -33.422725677490234, "global_step": 33424, "epoch": 276} {"train_loss": -32.84638214111328, "global_step": 33425, "epoch": 276} {"train_loss": -30.393600463867188, "global_step": 33426, "epoch": 276} {"train_loss": -22.86810874938965, "global_step": 33427, "epoch": 276} {"train_loss": -7.7685980796813965, "global_step": 33428, "epoch": 276} {"train_loss": -2.1920361518859863, "global_step": 33429, "epoch": 276} {"train_loss": -25.0958251953125, "global_step": 33430, "epoch": 276} {"train_loss": -28.38291358947754, "global_step": 33431, "epoch": 276} {"train_loss": -26.25971794128418, "global_step": 33432, "epoch": 276} {"train_loss": -22.26964569091797, "global_step": 33433, "epoch": 276} {"train_loss": -30.143579483032227, "global_step": 33434, "epoch": 276} {"train_loss": -26.764739990234375, "global_step": 33435, "epoch": 276} {"train_loss": -30.02460289001465, "global_step": 33436, "epoch": 276} {"train_loss": -30.45021629333496, "global_step": 33437, "epoch": 276} {"train_loss": -26.78223991394043, "global_step": 33438, "epoch": 276} {"train_loss": -29.3655948638916, "global_step": 33439, "epoch": 276} {"train_loss": -30.43147087097168, "global_step": 33440, "epoch": 276} {"train_loss": -29.92518424987793, "global_step": 33441, "epoch": 276} {"train_loss": -30.329248428344727, "global_step": 33442, "epoch": 276} {"train_loss": -30.466032028198242, "global_step": 33443, "epoch": 276} {"train_loss": -31.241043090820312, "global_step": 33444, "epoch": 276} {"train_loss": -31.711902618408203, "global_step": 33445, "epoch": 276} {"train_loss": -31.5575008392334, "global_step": 33446, "epoch": 276} {"train_loss": -30.825666427612305, "global_step": 33447, "epoch": 276} {"train_loss": -30.6527042388916, "global_step": 33448, "epoch": 276} {"train_loss": -31.577411651611328, "global_step": 33449, "epoch": 276} {"train_loss": -31.560443878173828, "global_step": 33450, "epoch": 276} {"train_loss": -31.43276023864746, "global_step": 33451, "epoch": 276} {"train_loss": -31.40130043029785, "global_step": 33452, "epoch": 276} {"train_loss": -31.752460479736328, "global_step": 33453, "epoch": 276} {"train_loss": -31.46001625061035, "global_step": 33454, "epoch": 276} {"train_loss": -31.992069244384766, "global_step": 33455, "epoch": 276} {"train_loss": -31.59711265563965, "global_step": 33456, "epoch": 276} {"train_loss": -32.09497833251953, "global_step": 33457, "epoch": 276} {"train_loss": -31.963336944580078, "global_step": 33458, "epoch": 276} {"train_loss": -31.991968154907227, "global_step": 33459, "epoch": 276} {"train_loss": -32.04665756225586, "global_step": 33460, "epoch": 276} {"train_loss": -32.413246154785156, "global_step": 33461, "epoch": 276} {"train_loss": -32.533260345458984, "global_step": 33462, "epoch": 276} {"train_loss": -32.22840881347656, "global_step": 33463, "epoch": 276} {"train_loss": -32.128841400146484, "global_step": 33464, "epoch": 276} {"train_loss": -32.224609375, "global_step": 33465, "epoch": 276} {"train_loss": -32.592430114746094, "global_step": 33466, "epoch": 276} {"train_loss": -32.21118927001953, "global_step": 33467, "epoch": 276} {"train_loss": -32.4658088684082, "global_step": 33468, "epoch": 276} {"train_loss": -32.810150146484375, "global_step": 33469, "epoch": 276} {"train_loss": -32.555599212646484, "global_step": 33470, "epoch": 276} {"train_loss": -32.602203369140625, "global_step": 33471, "epoch": 276} {"train_loss": -32.833534240722656, "global_step": 33472, "epoch": 276} {"train_loss": -32.439510345458984, "global_step": 33473, "epoch": 276} {"train_loss": -33.09865951538086, "global_step": 33474, "epoch": 276} {"train_loss": -32.81592559814453, "global_step": 33475, "epoch": 276} {"train_loss": -32.8005485534668, "global_step": 33476, "epoch": 276} {"train_loss": -32.842018127441406, "global_step": 33477, "epoch": 276} {"train_loss": -32.996490478515625, "global_step": 33478, "epoch": 276} {"train_loss": -32.767799377441406, "global_step": 33479, "epoch": 276} {"train_loss": -33.204097747802734, "global_step": 33480, "epoch": 276} {"train_loss": -32.68732833862305, "global_step": 33481, "epoch": 276} {"train_loss": -33.100006103515625, "global_step": 33482, "epoch": 276} {"train_loss": -33.10612106323242, "global_step": 33483, "epoch": 276} {"train_loss": -32.8967170715332, "global_step": 33484, "epoch": 276} {"train_loss": -33.309322357177734, "global_step": 33485, "epoch": 276} {"train_loss": -32.95595932006836, "global_step": 33486, "epoch": 276} {"train_loss": -33.11177062988281, "global_step": 33487, "epoch": 276} {"train_loss": -32.734657287597656, "global_step": 33488, "epoch": 276} {"train_loss": -33.11668014526367, "global_step": 33489, "epoch": 276} {"train_loss": -32.476070404052734, "global_step": 33490, "epoch": 276} {"train_loss": -32.877418518066406, "global_step": 33491, "epoch": 276} {"train_loss": -32.42482376098633, "global_step": 33492, "epoch": 276} {"train_loss": -32.682315826416016, "global_step": 33493, "epoch": 276} {"train_loss": -32.88472366333008, "global_step": 33494, "epoch": 276} {"train_loss": -33.36347579956055, "global_step": 33495, "epoch": 276} {"train_loss": -32.98307418823242, "global_step": 33496, "epoch": 276} {"train_loss": -32.766178131103516, "global_step": 33497, "epoch": 276} {"train_loss": -33.35909652709961, "global_step": 33498, "epoch": 276} {"train_loss": -32.86369705200195, "global_step": 33499, "epoch": 276} {"train_loss": -32.52648162841797, "global_step": 33500, "epoch": 276} {"train_loss": -32.912147521972656, "global_step": 33501, "epoch": 276} {"train_loss": -33.200592041015625, "global_step": 33502, "epoch": 276} {"train_loss": -32.496482849121094, "global_step": 33503, "epoch": 276} {"train_loss": -32.917110443115234, "global_step": 33504, "epoch": 276} {"train_loss": -32.1134033203125, "global_step": 33505, "epoch": 276} {"train_loss": -33.09707260131836, "global_step": 33506, "epoch": 276} {"train_loss": -31.96119499206543, "global_step": 33507, "epoch": 276} {"train_loss": -32.83216094970703, "global_step": 33508, "epoch": 276} {"train_loss": -33.106014251708984, "global_step": 33509, "epoch": 276} {"train_loss": -32.33236312866211, "global_step": 33510, "epoch": 276} {"train_loss": -32.7501335144043, "global_step": 33511, "epoch": 276} {"train_loss": -32.12379455566406, "global_step": 33512, "epoch": 276} {"train_loss": -32.56587600708008, "global_step": 33513, "epoch": 276} {"train_loss": -32.53031539916992, "global_step": 33514, "epoch": 276} {"train_loss": -32.090572357177734, "global_step": 33515, "epoch": 276} {"train_loss": -31.529611997367923, "global_step": 33516, "epoch": 276, "val_loss": 2423185.25} {"train_loss": -32.47571563720703, "global_step": 33517, "epoch": 277} {"train_loss": -31.813953399658203, "global_step": 33518, "epoch": 277} {"train_loss": -32.4801025390625, "global_step": 33519, "epoch": 277} {"train_loss": -32.70509719848633, "global_step": 33520, "epoch": 277} {"train_loss": -32.4042854309082, "global_step": 33521, "epoch": 277} {"train_loss": -32.82356643676758, "global_step": 33522, "epoch": 277} {"train_loss": -32.31453323364258, "global_step": 33523, "epoch": 277} {"train_loss": -32.891761779785156, "global_step": 33524, "epoch": 277} {"train_loss": -32.973026275634766, "global_step": 33525, "epoch": 277} {"train_loss": -32.87397384643555, "global_step": 33526, "epoch": 277} {"train_loss": -32.12456512451172, "global_step": 33527, "epoch": 277} {"train_loss": -32.58027267456055, "global_step": 33528, "epoch": 277} {"train_loss": -32.7365608215332, "global_step": 33529, "epoch": 277} {"train_loss": -32.952640533447266, "global_step": 33530, "epoch": 277} {"train_loss": -32.35615158081055, "global_step": 33531, "epoch": 277} {"train_loss": -32.877498626708984, "global_step": 33532, "epoch": 277} {"train_loss": -32.853458404541016, "global_step": 33533, "epoch": 277} {"train_loss": -32.90584182739258, "global_step": 33534, "epoch": 277} {"train_loss": -31.743717193603516, "global_step": 33535, "epoch": 277} {"train_loss": -32.523067474365234, "global_step": 33536, "epoch": 277} {"train_loss": -33.01997756958008, "global_step": 33537, "epoch": 277} {"train_loss": -33.01940155029297, "global_step": 33538, "epoch": 277} {"train_loss": -32.420013427734375, "global_step": 33539, "epoch": 277} {"train_loss": -31.905431747436523, "global_step": 33540, "epoch": 277} {"train_loss": -32.581939697265625, "global_step": 33541, "epoch": 277} {"train_loss": -32.78333282470703, "global_step": 33542, "epoch": 277} {"train_loss": -32.91691207885742, "global_step": 33543, "epoch": 277} {"train_loss": -32.63895034790039, "global_step": 33544, "epoch": 277} {"train_loss": -32.38087844848633, "global_step": 33545, "epoch": 277} {"train_loss": -31.956457138061523, "global_step": 33546, "epoch": 277} {"train_loss": -30.369741439819336, "global_step": 33547, "epoch": 277} {"train_loss": -25.91375732421875, "global_step": 33548, "epoch": 277} {"train_loss": -23.300628662109375, "global_step": 33549, "epoch": 277} {"train_loss": -28.0157470703125, "global_step": 33550, "epoch": 277} {"train_loss": -32.644004821777344, "global_step": 33551, "epoch": 277} {"train_loss": -32.32659912109375, "global_step": 33552, "epoch": 277} {"train_loss": -31.455350875854492, "global_step": 33553, "epoch": 277} {"train_loss": -32.89323043823242, "global_step": 33554, "epoch": 277} {"train_loss": -30.128183364868164, "global_step": 33555, "epoch": 277} {"train_loss": -32.71399688720703, "global_step": 33556, "epoch": 277} {"train_loss": -30.673791885375977, "global_step": 33557, "epoch": 277} {"train_loss": -32.29828643798828, "global_step": 33558, "epoch": 277} {"train_loss": -32.4144401550293, "global_step": 33559, "epoch": 277} {"train_loss": -33.02288818359375, "global_step": 33560, "epoch": 277} {"train_loss": -31.37061882019043, "global_step": 33561, "epoch": 277} {"train_loss": -32.51972961425781, "global_step": 33562, "epoch": 277} {"train_loss": -31.13056755065918, "global_step": 33563, "epoch": 277} {"train_loss": -33.11228561401367, "global_step": 33564, "epoch": 277} {"train_loss": -31.825153350830078, "global_step": 33565, "epoch": 277} {"train_loss": -32.48881149291992, "global_step": 33566, "epoch": 277} {"train_loss": -32.54627227783203, "global_step": 33567, "epoch": 277} {"train_loss": -31.656295776367188, "global_step": 33568, "epoch": 277} {"train_loss": -32.614376068115234, "global_step": 33569, "epoch": 277} {"train_loss": -31.533527374267578, "global_step": 33570, "epoch": 277} {"train_loss": -31.898563385009766, "global_step": 33571, "epoch": 277} {"train_loss": -32.081214904785156, "global_step": 33572, "epoch": 277} {"train_loss": -30.2641544342041, "global_step": 33573, "epoch": 277} {"train_loss": -32.85531234741211, "global_step": 33574, "epoch": 277} {"train_loss": -31.276342391967773, "global_step": 33575, "epoch": 277} {"train_loss": -32.03460693359375, "global_step": 33576, "epoch": 277} {"train_loss": -32.401424407958984, "global_step": 33577, "epoch": 277} {"train_loss": -32.2740592956543, "global_step": 33578, "epoch": 277} {"train_loss": -32.523529052734375, "global_step": 33579, "epoch": 277} {"train_loss": -32.37160110473633, "global_step": 33580, "epoch": 277} {"train_loss": -32.978736877441406, "global_step": 33581, "epoch": 277} {"train_loss": -32.60625457763672, "global_step": 33582, "epoch": 277} {"train_loss": -32.44743347167969, "global_step": 33583, "epoch": 277} {"train_loss": -33.26717758178711, "global_step": 33584, "epoch": 277} {"train_loss": -33.209495544433594, "global_step": 33585, "epoch": 277} {"train_loss": -33.38648223876953, "global_step": 33586, "epoch": 277} {"train_loss": -32.94587326049805, "global_step": 33587, "epoch": 277} {"train_loss": -32.827247619628906, "global_step": 33588, "epoch": 277} {"train_loss": -33.31245422363281, "global_step": 33589, "epoch": 277} {"train_loss": -33.07221603393555, "global_step": 33590, "epoch": 277} {"train_loss": -32.845611572265625, "global_step": 33591, "epoch": 277} {"train_loss": -33.075042724609375, "global_step": 33592, "epoch": 277} {"train_loss": -32.83283233642578, "global_step": 33593, "epoch": 277} {"train_loss": -32.82432556152344, "global_step": 33594, "epoch": 277} {"train_loss": -33.39011764526367, "global_step": 33595, "epoch": 277} {"train_loss": -32.40325164794922, "global_step": 33596, "epoch": 277} {"train_loss": -33.30329513549805, "global_step": 33597, "epoch": 277} {"train_loss": -32.87093734741211, "global_step": 33598, "epoch": 277} {"train_loss": -32.55697250366211, "global_step": 33599, "epoch": 277} {"train_loss": -33.22459030151367, "global_step": 33600, "epoch": 277} {"train_loss": -32.554073333740234, "global_step": 33601, "epoch": 277} {"train_loss": -32.55778884887695, "global_step": 33602, "epoch": 277} {"train_loss": -32.91782760620117, "global_step": 33603, "epoch": 277} {"train_loss": -33.10407257080078, "global_step": 33604, "epoch": 277} {"train_loss": -33.258758544921875, "global_step": 33605, "epoch": 277} {"train_loss": -32.77728271484375, "global_step": 33606, "epoch": 277} {"train_loss": -33.021060943603516, "global_step": 33607, "epoch": 277} {"train_loss": -32.94843673706055, "global_step": 33608, "epoch": 277} {"train_loss": -32.43247604370117, "global_step": 33609, "epoch": 277} {"train_loss": -32.637760162353516, "global_step": 33610, "epoch": 277} {"train_loss": -32.072566986083984, "global_step": 33611, "epoch": 277} {"train_loss": -32.16382598876953, "global_step": 33612, "epoch": 277} {"train_loss": -33.11878204345703, "global_step": 33613, "epoch": 277} {"train_loss": -32.78584671020508, "global_step": 33614, "epoch": 277} {"train_loss": -32.75791931152344, "global_step": 33615, "epoch": 277} {"train_loss": -32.28031539916992, "global_step": 33616, "epoch": 277} {"train_loss": -31.967975616455078, "global_step": 33617, "epoch": 277} {"train_loss": -30.764453887939453, "global_step": 33618, "epoch": 277} {"train_loss": -31.11536979675293, "global_step": 33619, "epoch": 277} {"train_loss": -33.0850944519043, "global_step": 33620, "epoch": 277} {"train_loss": -31.36896324157715, "global_step": 33621, "epoch": 277} {"train_loss": -30.847625732421875, "global_step": 33622, "epoch": 277} {"train_loss": -32.462764739990234, "global_step": 33623, "epoch": 277} {"train_loss": -31.80865478515625, "global_step": 33624, "epoch": 277} {"train_loss": -32.1682243347168, "global_step": 33625, "epoch": 277} {"train_loss": -32.685245513916016, "global_step": 33626, "epoch": 277} {"train_loss": -32.28159713745117, "global_step": 33627, "epoch": 277} {"train_loss": -32.27022171020508, "global_step": 33628, "epoch": 277} {"train_loss": -32.58150100708008, "global_step": 33629, "epoch": 277} {"train_loss": -32.317054748535156, "global_step": 33630, "epoch": 277} {"train_loss": -32.45991897583008, "global_step": 33631, "epoch": 277} {"train_loss": -32.678470611572266, "global_step": 33632, "epoch": 277} {"train_loss": -32.60879135131836, "global_step": 33633, "epoch": 277} {"train_loss": -32.32986068725586, "global_step": 33634, "epoch": 277} {"train_loss": -32.56861114501953, "global_step": 33635, "epoch": 277} {"train_loss": -32.55350875854492, "global_step": 33636, "epoch": 277} {"train_loss": -32.26868854869496, "global_step": 33637, "epoch": 277, "val_loss": 2393615.25} {"train_loss": -31.675277709960938, "global_step": 33638, "epoch": 278} {"train_loss": -32.888816833496094, "global_step": 33639, "epoch": 278} {"train_loss": -32.748207092285156, "global_step": 33640, "epoch": 278} {"train_loss": -33.33150863647461, "global_step": 33641, "epoch": 278} {"train_loss": -32.91597366333008, "global_step": 33642, "epoch": 278} {"train_loss": -32.922462463378906, "global_step": 33643, "epoch": 278} {"train_loss": -33.02907943725586, "global_step": 33644, "epoch": 278} {"train_loss": -33.017086029052734, "global_step": 33645, "epoch": 278} {"train_loss": -32.98908615112305, "global_step": 33646, "epoch": 278} {"train_loss": -33.043704986572266, "global_step": 33647, "epoch": 278} {"train_loss": -33.04215621948242, "global_step": 33648, "epoch": 278} {"train_loss": -32.46218490600586, "global_step": 33649, "epoch": 278} {"train_loss": -32.85799026489258, "global_step": 33650, "epoch": 278} {"train_loss": -33.5911865234375, "global_step": 33651, "epoch": 278} {"train_loss": -33.114681243896484, "global_step": 33652, "epoch": 278} {"train_loss": -33.07664489746094, "global_step": 33653, "epoch": 278} {"train_loss": -33.59860610961914, "global_step": 33654, "epoch": 278} {"train_loss": -32.92107009887695, "global_step": 33655, "epoch": 278} {"train_loss": -33.43008804321289, "global_step": 33656, "epoch": 278} {"train_loss": -32.791500091552734, "global_step": 33657, "epoch": 278} {"train_loss": -33.13887405395508, "global_step": 33658, "epoch": 278} {"train_loss": -33.96502685546875, "global_step": 33659, "epoch": 278} {"train_loss": -33.593231201171875, "global_step": 33660, "epoch": 278} {"train_loss": -33.067787170410156, "global_step": 33661, "epoch": 278} {"train_loss": -33.79667282104492, "global_step": 33662, "epoch": 278} {"train_loss": -33.72629928588867, "global_step": 33663, "epoch": 278} {"train_loss": -33.89740753173828, "global_step": 33664, "epoch": 278} {"train_loss": -33.608154296875, "global_step": 33665, "epoch": 278} {"train_loss": -33.61747360229492, "global_step": 33666, "epoch": 278} {"train_loss": -33.763404846191406, "global_step": 33667, "epoch": 278} {"train_loss": -33.872798919677734, "global_step": 33668, "epoch": 278} {"train_loss": -33.55580139160156, "global_step": 33669, "epoch": 278} {"train_loss": -34.24481964111328, "global_step": 33670, "epoch": 278} {"train_loss": -33.8533935546875, "global_step": 33671, "epoch": 278} {"train_loss": -33.81467819213867, "global_step": 33672, "epoch": 278} {"train_loss": -33.55335235595703, "global_step": 33673, "epoch": 278} {"train_loss": -34.38128662109375, "global_step": 33674, "epoch": 278} {"train_loss": -33.88821792602539, "global_step": 33675, "epoch": 278} {"train_loss": -33.20139694213867, "global_step": 33676, "epoch": 278} {"train_loss": -33.746944427490234, "global_step": 33677, "epoch": 278} {"train_loss": -33.647796630859375, "global_step": 33678, "epoch": 278} {"train_loss": -33.95536422729492, "global_step": 33679, "epoch": 278} {"train_loss": -33.595314025878906, "global_step": 33680, "epoch": 278} {"train_loss": -33.565608978271484, "global_step": 33681, "epoch": 278} {"train_loss": -33.33972930908203, "global_step": 33682, "epoch": 278} {"train_loss": -31.59661293029785, "global_step": 33683, "epoch": 278} {"train_loss": -33.15473556518555, "global_step": 33684, "epoch": 278} {"train_loss": -32.844268798828125, "global_step": 33685, "epoch": 278} {"train_loss": -32.89739990234375, "global_step": 33686, "epoch": 278} {"train_loss": -31.472442626953125, "global_step": 33687, "epoch": 278} {"train_loss": -33.61343002319336, "global_step": 33688, "epoch": 278} {"train_loss": -33.2901725769043, "global_step": 33689, "epoch": 278} {"train_loss": -31.274459838867188, "global_step": 33690, "epoch": 278} {"train_loss": -33.182491302490234, "global_step": 33691, "epoch": 278} {"train_loss": -31.652585983276367, "global_step": 33692, "epoch": 278} {"train_loss": -31.5018310546875, "global_step": 33693, "epoch": 278} {"train_loss": -31.935733795166016, "global_step": 33694, "epoch": 278} {"train_loss": -31.28216552734375, "global_step": 33695, "epoch": 278} {"train_loss": -31.79373550415039, "global_step": 33696, "epoch": 278} {"train_loss": -30.43951988220215, "global_step": 33697, "epoch": 278} {"train_loss": -32.64093017578125, "global_step": 33698, "epoch": 278} {"train_loss": -31.44877052307129, "global_step": 33699, "epoch": 278} {"train_loss": -32.170413970947266, "global_step": 33700, "epoch": 278} {"train_loss": -31.443525314331055, "global_step": 33701, "epoch": 278} {"train_loss": -31.202905654907227, "global_step": 33702, "epoch": 278} {"train_loss": -31.804370880126953, "global_step": 33703, "epoch": 278} {"train_loss": -32.22565460205078, "global_step": 33704, "epoch": 278} {"train_loss": -31.307973861694336, "global_step": 33705, "epoch": 278} {"train_loss": -31.30104637145996, "global_step": 33706, "epoch": 278} {"train_loss": -30.125473022460938, "global_step": 33707, "epoch": 278} {"train_loss": -32.36785888671875, "global_step": 33708, "epoch": 278} {"train_loss": -31.9774227142334, "global_step": 33709, "epoch": 278} {"train_loss": -32.1526985168457, "global_step": 33710, "epoch": 278} {"train_loss": -32.2946891784668, "global_step": 33711, "epoch": 278} {"train_loss": -31.831298828125, "global_step": 33712, "epoch": 278} {"train_loss": -31.545886993408203, "global_step": 33713, "epoch": 278} {"train_loss": -32.46062088012695, "global_step": 33714, "epoch": 278} {"train_loss": -32.01725387573242, "global_step": 33715, "epoch": 278} {"train_loss": -32.84858322143555, "global_step": 33716, "epoch": 278} {"train_loss": -32.82497787475586, "global_step": 33717, "epoch": 278} {"train_loss": -32.23714828491211, "global_step": 33718, "epoch": 278} {"train_loss": -32.24874496459961, "global_step": 33719, "epoch": 278} {"train_loss": -31.921369552612305, "global_step": 33720, "epoch": 278} {"train_loss": -32.34743881225586, "global_step": 33721, "epoch": 278} {"train_loss": -32.59180450439453, "global_step": 33722, "epoch": 278} {"train_loss": -32.26168441772461, "global_step": 33723, "epoch": 278} {"train_loss": -32.45148468017578, "global_step": 33724, "epoch": 278} {"train_loss": -32.23883056640625, "global_step": 33725, "epoch": 278} {"train_loss": -32.13232421875, "global_step": 33726, "epoch": 278} {"train_loss": -32.1824951171875, "global_step": 33727, "epoch": 278} {"train_loss": -32.857391357421875, "global_step": 33728, "epoch": 278} {"train_loss": -33.01466751098633, "global_step": 33729, "epoch": 278} {"train_loss": -33.22610855102539, "global_step": 33730, "epoch": 278} {"train_loss": -32.99979782104492, "global_step": 33731, "epoch": 278} {"train_loss": -32.957275390625, "global_step": 33732, "epoch": 278} {"train_loss": -32.728431701660156, "global_step": 33733, "epoch": 278} {"train_loss": -33.213191986083984, "global_step": 33734, "epoch": 278} {"train_loss": -33.444068908691406, "global_step": 33735, "epoch": 278} {"train_loss": -33.32863235473633, "global_step": 33736, "epoch": 278} {"train_loss": -32.4386100769043, "global_step": 33737, "epoch": 278} {"train_loss": -33.200889587402344, "global_step": 33738, "epoch": 278} {"train_loss": -33.18726348876953, "global_step": 33739, "epoch": 278} {"train_loss": -33.34260940551758, "global_step": 33740, "epoch": 278} {"train_loss": -32.647972106933594, "global_step": 33741, "epoch": 278} {"train_loss": -33.41715621948242, "global_step": 33742, "epoch": 278} {"train_loss": -32.80112838745117, "global_step": 33743, "epoch": 278} {"train_loss": -32.49333572387695, "global_step": 33744, "epoch": 278} {"train_loss": -32.29569625854492, "global_step": 33745, "epoch": 278} {"train_loss": -31.317642211914062, "global_step": 33746, "epoch": 278} {"train_loss": -31.32547950744629, "global_step": 33747, "epoch": 278} {"train_loss": -32.41128158569336, "global_step": 33748, "epoch": 278} {"train_loss": -33.792236328125, "global_step": 33749, "epoch": 278} {"train_loss": -33.197601318359375, "global_step": 33750, "epoch": 278} {"train_loss": -32.17817306518555, "global_step": 33751, "epoch": 278} {"train_loss": -33.356197357177734, "global_step": 33752, "epoch": 278} {"train_loss": -33.70332717895508, "global_step": 33753, "epoch": 278} {"train_loss": -32.766475677490234, "global_step": 33754, "epoch": 278} {"train_loss": -32.8568000793457, "global_step": 33755, "epoch": 278} {"train_loss": -33.972816467285156, "global_step": 33756, "epoch": 278} {"train_loss": -33.13149642944336, "global_step": 33757, "epoch": 278} {"train_loss": -32.76810832063028, "global_step": 33758, "epoch": 278, "val_loss": 2529416.75} {"train_loss": -33.077423095703125, "global_step": 33759, "epoch": 279} {"train_loss": -33.59578323364258, "global_step": 33760, "epoch": 279} {"train_loss": -32.96712112426758, "global_step": 33761, "epoch": 279} {"train_loss": -33.30183410644531, "global_step": 33762, "epoch": 279} {"train_loss": -33.3177604675293, "global_step": 33763, "epoch": 279} {"train_loss": -32.153564453125, "global_step": 33764, "epoch": 279} {"train_loss": -33.05839157104492, "global_step": 33765, "epoch": 279} {"train_loss": -32.303138732910156, "global_step": 33766, "epoch": 279} {"train_loss": -32.10353469848633, "global_step": 33767, "epoch": 279} {"train_loss": -31.59750747680664, "global_step": 33768, "epoch": 279} {"train_loss": -31.987600326538086, "global_step": 33769, "epoch": 279} {"train_loss": -31.534915924072266, "global_step": 33770, "epoch": 279} {"train_loss": -32.63875961303711, "global_step": 33771, "epoch": 279} {"train_loss": -32.79133224487305, "global_step": 33772, "epoch": 279} {"train_loss": -30.667713165283203, "global_step": 33773, "epoch": 279} {"train_loss": -30.560392379760742, "global_step": 33774, "epoch": 279} {"train_loss": -32.480247497558594, "global_step": 33775, "epoch": 279} {"train_loss": -32.9927864074707, "global_step": 33776, "epoch": 279} {"train_loss": -29.84071159362793, "global_step": 33777, "epoch": 279} {"train_loss": -30.98939323425293, "global_step": 33778, "epoch": 279} {"train_loss": -33.195186614990234, "global_step": 33779, "epoch": 279} {"train_loss": -31.94781494140625, "global_step": 33780, "epoch": 279} {"train_loss": -30.277450561523438, "global_step": 33781, "epoch": 279} {"train_loss": -33.18014144897461, "global_step": 33782, "epoch": 279} {"train_loss": -31.661563873291016, "global_step": 33783, "epoch": 279} {"train_loss": -32.32429504394531, "global_step": 33784, "epoch": 279} {"train_loss": -33.03642654418945, "global_step": 33785, "epoch": 279} {"train_loss": -31.797887802124023, "global_step": 33786, "epoch": 279} {"train_loss": -33.336971282958984, "global_step": 33787, "epoch": 279} {"train_loss": -32.20328903198242, "global_step": 33788, "epoch": 279} {"train_loss": -33.11469650268555, "global_step": 33789, "epoch": 279} {"train_loss": -31.91351318359375, "global_step": 33790, "epoch": 279} {"train_loss": -33.29182815551758, "global_step": 33791, "epoch": 279} {"train_loss": -32.16374969482422, "global_step": 33792, "epoch": 279} {"train_loss": -33.4224853515625, "global_step": 33793, "epoch": 279} {"train_loss": -31.512409210205078, "global_step": 33794, "epoch": 279} {"train_loss": -33.041954040527344, "global_step": 33795, "epoch": 279} {"train_loss": -32.69959259033203, "global_step": 33796, "epoch": 279} {"train_loss": -33.17409896850586, "global_step": 33797, "epoch": 279} {"train_loss": -32.700862884521484, "global_step": 33798, "epoch": 279} {"train_loss": -33.25722122192383, "global_step": 33799, "epoch": 279} {"train_loss": -33.1265869140625, "global_step": 33800, "epoch": 279} {"train_loss": -33.399940490722656, "global_step": 33801, "epoch": 279} {"train_loss": -32.64572525024414, "global_step": 33802, "epoch": 279} {"train_loss": -33.41071701049805, "global_step": 33803, "epoch": 279} {"train_loss": -33.433074951171875, "global_step": 33804, "epoch": 279} {"train_loss": -32.995826721191406, "global_step": 33805, "epoch": 279} {"train_loss": -33.986419677734375, "global_step": 33806, "epoch": 279} {"train_loss": -33.3262825012207, "global_step": 33807, "epoch": 279} {"train_loss": -33.593902587890625, "global_step": 33808, "epoch": 279} {"train_loss": -33.92631912231445, "global_step": 33809, "epoch": 279} {"train_loss": -32.95726776123047, "global_step": 33810, "epoch": 279} {"train_loss": -33.9944953918457, "global_step": 33811, "epoch": 279} {"train_loss": -33.50118637084961, "global_step": 33812, "epoch": 279} {"train_loss": -34.02765655517578, "global_step": 33813, "epoch": 279} {"train_loss": -33.68404769897461, "global_step": 33814, "epoch": 279} {"train_loss": -33.81501007080078, "global_step": 33815, "epoch": 279} {"train_loss": -33.573150634765625, "global_step": 33816, "epoch": 279} {"train_loss": -33.47199630737305, "global_step": 33817, "epoch": 279} {"train_loss": -33.97169494628906, "global_step": 33818, "epoch": 279} {"train_loss": -34.14944076538086, "global_step": 33819, "epoch": 279} {"train_loss": -34.09916687011719, "global_step": 33820, "epoch": 279} {"train_loss": -33.84531021118164, "global_step": 33821, "epoch": 279} {"train_loss": -34.0359001159668, "global_step": 33822, "epoch": 279} {"train_loss": -33.74420928955078, "global_step": 33823, "epoch": 279} {"train_loss": -33.9302864074707, "global_step": 33824, "epoch": 279} {"train_loss": -33.521907806396484, "global_step": 33825, "epoch": 279} {"train_loss": -33.04861831665039, "global_step": 33826, "epoch": 279} {"train_loss": -33.459922790527344, "global_step": 33827, "epoch": 279} {"train_loss": -33.736061096191406, "global_step": 33828, "epoch": 279} {"train_loss": -33.48126220703125, "global_step": 33829, "epoch": 279} {"train_loss": -33.217323303222656, "global_step": 33830, "epoch": 279} {"train_loss": -32.98661422729492, "global_step": 33831, "epoch": 279} {"train_loss": -32.071895599365234, "global_step": 33832, "epoch": 279} {"train_loss": -32.14653015136719, "global_step": 33833, "epoch": 279} {"train_loss": -31.960880279541016, "global_step": 33834, "epoch": 279} {"train_loss": -27.397052764892578, "global_step": 33835, "epoch": 279} {"train_loss": -27.292139053344727, "global_step": 33836, "epoch": 279} {"train_loss": -30.621124267578125, "global_step": 33837, "epoch": 279} {"train_loss": -32.51458740234375, "global_step": 33838, "epoch": 279} {"train_loss": -28.14374351501465, "global_step": 33839, "epoch": 279} {"train_loss": -30.907337188720703, "global_step": 33840, "epoch": 279} {"train_loss": -32.503231048583984, "global_step": 33841, "epoch": 279} {"train_loss": -30.147613525390625, "global_step": 33842, "epoch": 279} {"train_loss": -31.089706420898438, "global_step": 33843, "epoch": 279} {"train_loss": -31.23158073425293, "global_step": 33844, "epoch": 279} {"train_loss": -31.93841552734375, "global_step": 33845, "epoch": 279} {"train_loss": -31.657575607299805, "global_step": 33846, "epoch": 279} {"train_loss": -31.952350616455078, "global_step": 33847, "epoch": 279} {"train_loss": -32.38296127319336, "global_step": 33848, "epoch": 279} {"train_loss": -32.75147247314453, "global_step": 33849, "epoch": 279} {"train_loss": -32.353240966796875, "global_step": 33850, "epoch": 279} {"train_loss": -32.52814483642578, "global_step": 33851, "epoch": 279} {"train_loss": -32.28522491455078, "global_step": 33852, "epoch": 279} {"train_loss": -31.76949119567871, "global_step": 33853, "epoch": 279} {"train_loss": -32.40465545654297, "global_step": 33854, "epoch": 279} {"train_loss": -31.852497100830078, "global_step": 33855, "epoch": 279} {"train_loss": -32.19936752319336, "global_step": 33856, "epoch": 279} {"train_loss": -32.30427169799805, "global_step": 33857, "epoch": 279} {"train_loss": -32.66084289550781, "global_step": 33858, "epoch": 279} {"train_loss": -32.98150634765625, "global_step": 33859, "epoch": 279} {"train_loss": -32.26986312866211, "global_step": 33860, "epoch": 279} {"train_loss": -32.93059158325195, "global_step": 33861, "epoch": 279} {"train_loss": -32.98505783081055, "global_step": 33862, "epoch": 279} {"train_loss": -31.81085777282715, "global_step": 33863, "epoch": 279} {"train_loss": -32.15114212036133, "global_step": 33864, "epoch": 279} {"train_loss": -31.881528854370117, "global_step": 33865, "epoch": 279} {"train_loss": -31.97810173034668, "global_step": 33866, "epoch": 279} {"train_loss": -32.4073600769043, "global_step": 33867, "epoch": 279} {"train_loss": -33.233768463134766, "global_step": 33868, "epoch": 279} {"train_loss": -33.245174407958984, "global_step": 33869, "epoch": 279} {"train_loss": -31.84212303161621, "global_step": 33870, "epoch": 279} {"train_loss": -30.520889282226562, "global_step": 33871, "epoch": 279} {"train_loss": -28.616662979125977, "global_step": 33872, "epoch": 279} {"train_loss": -30.893951416015625, "global_step": 33873, "epoch": 279} {"train_loss": -32.61359786987305, "global_step": 33874, "epoch": 279} {"train_loss": -32.615570068359375, "global_step": 33875, "epoch": 279} {"train_loss": -31.7536563873291, "global_step": 33876, "epoch": 279} {"train_loss": -32.61531448364258, "global_step": 33877, "epoch": 279} {"train_loss": -33.277950286865234, "global_step": 33878, "epoch": 279} {"train_loss": -32.439340827878844, "global_step": 33879, "epoch": 279, "val_loss": 2499632.25} {"train_loss": -32.282196044921875, "global_step": 33880, "epoch": 280} {"train_loss": -33.682159423828125, "global_step": 33881, "epoch": 280} {"train_loss": -32.488563537597656, "global_step": 33882, "epoch": 280} {"train_loss": -33.1888542175293, "global_step": 33883, "epoch": 280} {"train_loss": -33.069637298583984, "global_step": 33884, "epoch": 280} {"train_loss": -32.2578010559082, "global_step": 33885, "epoch": 280} {"train_loss": -33.44430160522461, "global_step": 33886, "epoch": 280} {"train_loss": -32.22365188598633, "global_step": 33887, "epoch": 280} {"train_loss": -33.58852767944336, "global_step": 33888, "epoch": 280} {"train_loss": -32.59033203125, "global_step": 33889, "epoch": 280} {"train_loss": -33.625667572021484, "global_step": 33890, "epoch": 280} {"train_loss": -32.586483001708984, "global_step": 33891, "epoch": 280} {"train_loss": -32.41815185546875, "global_step": 33892, "epoch": 280} {"train_loss": -33.497901916503906, "global_step": 33893, "epoch": 280} {"train_loss": -33.29647445678711, "global_step": 33894, "epoch": 280} {"train_loss": -33.67577362060547, "global_step": 33895, "epoch": 280} {"train_loss": -33.499542236328125, "global_step": 33896, "epoch": 280} {"train_loss": -33.17387008666992, "global_step": 33897, "epoch": 280} {"train_loss": -33.617061614990234, "global_step": 33898, "epoch": 280} {"train_loss": -33.47732162475586, "global_step": 33899, "epoch": 280} {"train_loss": -33.424964904785156, "global_step": 33900, "epoch": 280} {"train_loss": -33.76774978637695, "global_step": 33901, "epoch": 280} {"train_loss": -33.31962203979492, "global_step": 33902, "epoch": 280} {"train_loss": -33.66140365600586, "global_step": 33903, "epoch": 280} {"train_loss": -33.20769500732422, "global_step": 33904, "epoch": 280} {"train_loss": -33.47356033325195, "global_step": 33905, "epoch": 280} {"train_loss": -33.9052848815918, "global_step": 33906, "epoch": 280} {"train_loss": -33.57369613647461, "global_step": 33907, "epoch": 280} {"train_loss": -33.19398880004883, "global_step": 33908, "epoch": 280} {"train_loss": -33.095115661621094, "global_step": 33909, "epoch": 280} {"train_loss": -33.610591888427734, "global_step": 33910, "epoch": 280} {"train_loss": -33.67121124267578, "global_step": 33911, "epoch": 280} {"train_loss": -33.31191635131836, "global_step": 33912, "epoch": 280} {"train_loss": -32.430511474609375, "global_step": 33913, "epoch": 280} {"train_loss": -32.6666145324707, "global_step": 33914, "epoch": 280} {"train_loss": -33.11802291870117, "global_step": 33915, "epoch": 280} {"train_loss": -33.25593185424805, "global_step": 33916, "epoch": 280} {"train_loss": -33.4453239440918, "global_step": 33917, "epoch": 280} {"train_loss": -32.82308578491211, "global_step": 33918, "epoch": 280} {"train_loss": -33.729610443115234, "global_step": 33919, "epoch": 280} {"train_loss": -33.298011779785156, "global_step": 33920, "epoch": 280} {"train_loss": -33.408817291259766, "global_step": 33921, "epoch": 280} {"train_loss": -33.1001091003418, "global_step": 33922, "epoch": 280} {"train_loss": -33.36460494995117, "global_step": 33923, "epoch": 280} {"train_loss": -33.71079635620117, "global_step": 33924, "epoch": 280} {"train_loss": -33.38947677612305, "global_step": 33925, "epoch": 280} {"train_loss": -32.8709716796875, "global_step": 33926, "epoch": 280} {"train_loss": -33.33378219604492, "global_step": 33927, "epoch": 280} {"train_loss": -32.25043487548828, "global_step": 33928, "epoch": 280} {"train_loss": -32.33854293823242, "global_step": 33929, "epoch": 280} {"train_loss": -29.78631019592285, "global_step": 33930, "epoch": 280} {"train_loss": -26.781736373901367, "global_step": 33931, "epoch": 280} {"train_loss": -31.382699966430664, "global_step": 33932, "epoch": 280} {"train_loss": -31.577777862548828, "global_step": 33933, "epoch": 280} {"train_loss": -32.31182861328125, "global_step": 33934, "epoch": 280} {"train_loss": -32.53936004638672, "global_step": 33935, "epoch": 280} {"train_loss": -32.734683990478516, "global_step": 33936, "epoch": 280} {"train_loss": -33.042171478271484, "global_step": 33937, "epoch": 280} {"train_loss": -32.54684066772461, "global_step": 33938, "epoch": 280} {"train_loss": -33.32820510864258, "global_step": 33939, "epoch": 280} {"train_loss": -33.25910949707031, "global_step": 33940, "epoch": 280} {"train_loss": -32.51465606689453, "global_step": 33941, "epoch": 280} {"train_loss": -33.248252868652344, "global_step": 33942, "epoch": 280} {"train_loss": -32.90994644165039, "global_step": 33943, "epoch": 280} {"train_loss": -32.84638214111328, "global_step": 33944, "epoch": 280} {"train_loss": -32.946441650390625, "global_step": 33945, "epoch": 280} {"train_loss": -32.270904541015625, "global_step": 33946, "epoch": 280} {"train_loss": -33.53923416137695, "global_step": 33947, "epoch": 280} {"train_loss": -33.233482360839844, "global_step": 33948, "epoch": 280} {"train_loss": -32.8796272277832, "global_step": 33949, "epoch": 280} {"train_loss": -33.18486022949219, "global_step": 33950, "epoch": 280} {"train_loss": -32.82657241821289, "global_step": 33951, "epoch": 280} {"train_loss": -32.4127311706543, "global_step": 33952, "epoch": 280} {"train_loss": -33.5777702331543, "global_step": 33953, "epoch": 280} {"train_loss": -33.262359619140625, "global_step": 33954, "epoch": 280} {"train_loss": -32.58930587768555, "global_step": 33955, "epoch": 280} {"train_loss": -33.93226623535156, "global_step": 33956, "epoch": 280} {"train_loss": -33.28257369995117, "global_step": 33957, "epoch": 280} {"train_loss": -33.92179870605469, "global_step": 33958, "epoch": 280} {"train_loss": -33.59629821777344, "global_step": 33959, "epoch": 280} {"train_loss": -31.725177764892578, "global_step": 33960, "epoch": 280} {"train_loss": -33.85408401489258, "global_step": 33961, "epoch": 280} {"train_loss": -33.40751266479492, "global_step": 33962, "epoch": 280} {"train_loss": -33.84917068481445, "global_step": 33963, "epoch": 280} {"train_loss": -33.52389907836914, "global_step": 33964, "epoch": 280} {"train_loss": -33.5118522644043, "global_step": 33965, "epoch": 280} {"train_loss": -33.63593673706055, "global_step": 33966, "epoch": 280} {"train_loss": -32.5023193359375, "global_step": 33967, "epoch": 280} {"train_loss": -33.79084396362305, "global_step": 33968, "epoch": 280} {"train_loss": -32.969844818115234, "global_step": 33969, "epoch": 280} {"train_loss": -33.362857818603516, "global_step": 33970, "epoch": 280} {"train_loss": -33.65778732299805, "global_step": 33971, "epoch": 280} {"train_loss": -33.715972900390625, "global_step": 33972, "epoch": 280} {"train_loss": -33.79820251464844, "global_step": 33973, "epoch": 280} {"train_loss": -33.90045928955078, "global_step": 33974, "epoch": 280} {"train_loss": -33.746925354003906, "global_step": 33975, "epoch": 280} {"train_loss": -33.1663818359375, "global_step": 33976, "epoch": 280} {"train_loss": -33.32065963745117, "global_step": 33977, "epoch": 280} {"train_loss": -33.71548080444336, "global_step": 33978, "epoch": 280} {"train_loss": -33.49884033203125, "global_step": 33979, "epoch": 280} {"train_loss": -33.94289779663086, "global_step": 33980, "epoch": 280} {"train_loss": -33.5155029296875, "global_step": 33981, "epoch": 280} {"train_loss": -33.95315170288086, "global_step": 33982, "epoch": 280} {"train_loss": -33.8629264831543, "global_step": 33983, "epoch": 280} {"train_loss": -33.90308380126953, "global_step": 33984, "epoch": 280} {"train_loss": -33.668678283691406, "global_step": 33985, "epoch": 280} {"train_loss": -33.62522506713867, "global_step": 33986, "epoch": 280} {"train_loss": -34.226837158203125, "global_step": 33987, "epoch": 280} {"train_loss": -34.248844146728516, "global_step": 33988, "epoch": 280} {"train_loss": -33.794921875, "global_step": 33989, "epoch": 280} {"train_loss": -34.45392990112305, "global_step": 33990, "epoch": 280} {"train_loss": -34.06499481201172, "global_step": 33991, "epoch": 280} {"train_loss": -33.76249313354492, "global_step": 33992, "epoch": 280} {"train_loss": -33.319305419921875, "global_step": 33993, "epoch": 280} {"train_loss": -32.96178436279297, "global_step": 33994, "epoch": 280} {"train_loss": -32.170257568359375, "global_step": 33995, "epoch": 280} {"train_loss": -30.5429630279541, "global_step": 33996, "epoch": 280} {"train_loss": -29.964313507080078, "global_step": 33997, "epoch": 280} {"train_loss": -31.923974990844727, "global_step": 33998, "epoch": 280} {"train_loss": -32.89407730102539, "global_step": 33999, "epoch": 280} {"train_loss": -33.0918491931001, "global_step": 34000, "epoch": 280, "val_loss": 2527946.25} {"train_loss": -32.523780822753906, "global_step": 34001, "epoch": 281} {"train_loss": -33.56612014770508, "global_step": 34002, "epoch": 281} {"train_loss": -33.721343994140625, "global_step": 34003, "epoch": 281} {"train_loss": -33.9463005065918, "global_step": 34004, "epoch": 281} {"train_loss": -34.019283294677734, "global_step": 34005, "epoch": 281} {"train_loss": -33.334957122802734, "global_step": 34006, "epoch": 281} {"train_loss": -33.55018997192383, "global_step": 34007, "epoch": 281} {"train_loss": -33.64105224609375, "global_step": 34008, "epoch": 281} {"train_loss": -34.070770263671875, "global_step": 34009, "epoch": 281} {"train_loss": -33.38508605957031, "global_step": 34010, "epoch": 281} {"train_loss": -34.01020812988281, "global_step": 34011, "epoch": 281} {"train_loss": -33.74098587036133, "global_step": 34012, "epoch": 281} {"train_loss": -32.84788131713867, "global_step": 34013, "epoch": 281} {"train_loss": -32.88302993774414, "global_step": 34014, "epoch": 281} {"train_loss": -33.2946662902832, "global_step": 34015, "epoch": 281} {"train_loss": -33.884857177734375, "global_step": 34016, "epoch": 281} {"train_loss": -32.9066276550293, "global_step": 34017, "epoch": 281} {"train_loss": -33.99019241333008, "global_step": 34018, "epoch": 281} {"train_loss": -33.33340072631836, "global_step": 34019, "epoch": 281} {"train_loss": -33.17732620239258, "global_step": 34020, "epoch": 281} {"train_loss": -33.55991744995117, "global_step": 34021, "epoch": 281} {"train_loss": -33.2352409362793, "global_step": 34022, "epoch": 281} {"train_loss": -33.23662567138672, "global_step": 34023, "epoch": 281} {"train_loss": -33.2805061340332, "global_step": 34024, "epoch": 281} {"train_loss": -33.65304183959961, "global_step": 34025, "epoch": 281} {"train_loss": -33.620174407958984, "global_step": 34026, "epoch": 281} {"train_loss": -33.81270980834961, "global_step": 34027, "epoch": 281} {"train_loss": -33.282527923583984, "global_step": 34028, "epoch": 281} {"train_loss": -32.604915618896484, "global_step": 34029, "epoch": 281} {"train_loss": -31.896820068359375, "global_step": 34030, "epoch": 281} {"train_loss": -29.57111930847168, "global_step": 34031, "epoch": 281} {"train_loss": -26.79117774963379, "global_step": 34032, "epoch": 281} {"train_loss": -27.9934139251709, "global_step": 34033, "epoch": 281} {"train_loss": -30.506103515625, "global_step": 34034, "epoch": 281} {"train_loss": -33.366329193115234, "global_step": 34035, "epoch": 281} {"train_loss": -31.92376136779785, "global_step": 34036, "epoch": 281} {"train_loss": -30.870655059814453, "global_step": 34037, "epoch": 281} {"train_loss": -32.6352653503418, "global_step": 34038, "epoch": 281} {"train_loss": -32.91980743408203, "global_step": 34039, "epoch": 281} {"train_loss": -32.41652297973633, "global_step": 34040, "epoch": 281} {"train_loss": -33.74923324584961, "global_step": 34041, "epoch": 281} {"train_loss": -32.611209869384766, "global_step": 34042, "epoch": 281} {"train_loss": -33.58524703979492, "global_step": 34043, "epoch": 281} {"train_loss": -32.76479721069336, "global_step": 34044, "epoch": 281} {"train_loss": -33.42485809326172, "global_step": 34045, "epoch": 281} {"train_loss": -33.23793029785156, "global_step": 34046, "epoch": 281} {"train_loss": -33.56663513183594, "global_step": 34047, "epoch": 281} {"train_loss": -33.153873443603516, "global_step": 34048, "epoch": 281} {"train_loss": -33.27130889892578, "global_step": 34049, "epoch": 281} {"train_loss": -33.59975051879883, "global_step": 34050, "epoch": 281} {"train_loss": -32.67399215698242, "global_step": 34051, "epoch": 281} {"train_loss": -33.04683303833008, "global_step": 34052, "epoch": 281} {"train_loss": -32.94847106933594, "global_step": 34053, "epoch": 281} {"train_loss": -33.331581115722656, "global_step": 34054, "epoch": 281} {"train_loss": -33.308021545410156, "global_step": 34055, "epoch": 281} {"train_loss": -33.505619049072266, "global_step": 34056, "epoch": 281} {"train_loss": -33.64667892456055, "global_step": 34057, "epoch": 281} {"train_loss": -33.44429397583008, "global_step": 34058, "epoch": 281} {"train_loss": -33.77022933959961, "global_step": 34059, "epoch": 281} {"train_loss": -33.492042541503906, "global_step": 34060, "epoch": 281} {"train_loss": -31.90473747253418, "global_step": 34061, "epoch": 281} {"train_loss": -34.11112594604492, "global_step": 34062, "epoch": 281} {"train_loss": -33.550960540771484, "global_step": 34063, "epoch": 281} {"train_loss": -33.647705078125, "global_step": 34064, "epoch": 281} {"train_loss": -33.74390411376953, "global_step": 34065, "epoch": 281} {"train_loss": -33.63828659057617, "global_step": 34066, "epoch": 281} {"train_loss": -33.732513427734375, "global_step": 34067, "epoch": 281} {"train_loss": -33.821929931640625, "global_step": 34068, "epoch": 281} {"train_loss": -33.60762023925781, "global_step": 34069, "epoch": 281} {"train_loss": -32.962154388427734, "global_step": 34070, "epoch": 281} {"train_loss": -32.4119987487793, "global_step": 34071, "epoch": 281} {"train_loss": -33.17538833618164, "global_step": 34072, "epoch": 281} {"train_loss": -32.1071891784668, "global_step": 34073, "epoch": 281} {"train_loss": -27.26676368713379, "global_step": 34074, "epoch": 281} {"train_loss": -23.35026741027832, "global_step": 34075, "epoch": 281} {"train_loss": -26.76411247253418, "global_step": 34076, "epoch": 281} {"train_loss": -32.246498107910156, "global_step": 34077, "epoch": 281} {"train_loss": -31.5164852142334, "global_step": 34078, "epoch": 281} {"train_loss": -27.054574966430664, "global_step": 34079, "epoch": 281} {"train_loss": -28.7663631439209, "global_step": 34080, "epoch": 281} {"train_loss": -33.58883285522461, "global_step": 34081, "epoch": 281} {"train_loss": -30.490192413330078, "global_step": 34082, "epoch": 281} {"train_loss": -32.25410079956055, "global_step": 34083, "epoch": 281} {"train_loss": -30.959915161132812, "global_step": 34084, "epoch": 281} {"train_loss": -32.14869689941406, "global_step": 34085, "epoch": 281} {"train_loss": -31.433837890625, "global_step": 34086, "epoch": 281} {"train_loss": -32.94497299194336, "global_step": 34087, "epoch": 281} {"train_loss": -31.557870864868164, "global_step": 34088, "epoch": 281} {"train_loss": -32.90269088745117, "global_step": 34089, "epoch": 281} {"train_loss": -32.25328063964844, "global_step": 34090, "epoch": 281} {"train_loss": -31.912616729736328, "global_step": 34091, "epoch": 281} {"train_loss": -33.218658447265625, "global_step": 34092, "epoch": 281} {"train_loss": -31.979700088500977, "global_step": 34093, "epoch": 281} {"train_loss": -32.09914779663086, "global_step": 34094, "epoch": 281} {"train_loss": -32.900997161865234, "global_step": 34095, "epoch": 281} {"train_loss": -33.015968322753906, "global_step": 34096, "epoch": 281} {"train_loss": -32.58761215209961, "global_step": 34097, "epoch": 281} {"train_loss": -33.5057258605957, "global_step": 34098, "epoch": 281} {"train_loss": -33.215797424316406, "global_step": 34099, "epoch": 281} {"train_loss": -33.26479721069336, "global_step": 34100, "epoch": 281} {"train_loss": -33.34666061401367, "global_step": 34101, "epoch": 281} {"train_loss": -33.272499084472656, "global_step": 34102, "epoch": 281} {"train_loss": -33.32788848876953, "global_step": 34103, "epoch": 281} {"train_loss": -33.2346076965332, "global_step": 34104, "epoch": 281} {"train_loss": -33.40546798706055, "global_step": 34105, "epoch": 281} {"train_loss": -33.10652542114258, "global_step": 34106, "epoch": 281} {"train_loss": -33.31551742553711, "global_step": 34107, "epoch": 281} {"train_loss": -33.31606674194336, "global_step": 34108, "epoch": 281} {"train_loss": -33.76784896850586, "global_step": 34109, "epoch": 281} {"train_loss": -33.70701217651367, "global_step": 34110, "epoch": 281} {"train_loss": -33.6425895690918, "global_step": 34111, "epoch": 281} {"train_loss": -33.43881607055664, "global_step": 34112, "epoch": 281} {"train_loss": -33.69477844238281, "global_step": 34113, "epoch": 281} {"train_loss": -33.940673828125, "global_step": 34114, "epoch": 281} {"train_loss": -33.93874740600586, "global_step": 34115, "epoch": 281} {"train_loss": -33.72554397583008, "global_step": 34116, "epoch": 281} {"train_loss": -33.17451858520508, "global_step": 34117, "epoch": 281} {"train_loss": -32.58279037475586, "global_step": 34118, "epoch": 281} {"train_loss": -31.368549346923828, "global_step": 34119, "epoch": 281} {"train_loss": -27.63946533203125, "global_step": 34120, "epoch": 281} {"train_loss": -32.51242544631327, "global_step": 34121, "epoch": 281, "val_loss": 2662715.25} {"train_loss": -17.005775451660156, "global_step": 34122, "epoch": 282} {"train_loss": -27.917083740234375, "global_step": 34123, "epoch": 282} {"train_loss": -28.174335479736328, "global_step": 34124, "epoch": 282} {"train_loss": -28.765399932861328, "global_step": 34125, "epoch": 282} {"train_loss": -26.356170654296875, "global_step": 34126, "epoch": 282} {"train_loss": -30.864171981811523, "global_step": 34127, "epoch": 282} {"train_loss": -26.163894653320312, "global_step": 34128, "epoch": 282} {"train_loss": -32.61330032348633, "global_step": 34129, "epoch": 282} {"train_loss": -30.150226593017578, "global_step": 34130, "epoch": 282} {"train_loss": -29.71647071838379, "global_step": 34131, "epoch": 282} {"train_loss": -31.977766036987305, "global_step": 34132, "epoch": 282} {"train_loss": -32.429832458496094, "global_step": 34133, "epoch": 282} {"train_loss": -30.51729393005371, "global_step": 34134, "epoch": 282} {"train_loss": -31.468128204345703, "global_step": 34135, "epoch": 282} {"train_loss": -32.36301803588867, "global_step": 34136, "epoch": 282} {"train_loss": -32.72162628173828, "global_step": 34137, "epoch": 282} {"train_loss": -31.55495262145996, "global_step": 34138, "epoch": 282} {"train_loss": -31.58319664001465, "global_step": 34139, "epoch": 282} {"train_loss": -32.12339401245117, "global_step": 34140, "epoch": 282} {"train_loss": -32.744140625, "global_step": 34141, "epoch": 282} {"train_loss": -32.731689453125, "global_step": 34142, "epoch": 282} {"train_loss": -32.18707275390625, "global_step": 34143, "epoch": 282} {"train_loss": -31.724008560180664, "global_step": 34144, "epoch": 282} {"train_loss": -31.973615646362305, "global_step": 34145, "epoch": 282} {"train_loss": -32.644527435302734, "global_step": 34146, "epoch": 282} {"train_loss": -31.933408737182617, "global_step": 34147, "epoch": 282} {"train_loss": -32.46644973754883, "global_step": 34148, "epoch": 282} {"train_loss": -32.59629440307617, "global_step": 34149, "epoch": 282} {"train_loss": -32.5661506652832, "global_step": 34150, "epoch": 282} {"train_loss": -31.993589401245117, "global_step": 34151, "epoch": 282} {"train_loss": -32.24108123779297, "global_step": 34152, "epoch": 282} {"train_loss": -32.60598373413086, "global_step": 34153, "epoch": 282} {"train_loss": -32.02632141113281, "global_step": 34154, "epoch": 282} {"train_loss": -32.41716003417969, "global_step": 34155, "epoch": 282} {"train_loss": -32.6203498840332, "global_step": 34156, "epoch": 282} {"train_loss": -32.67226791381836, "global_step": 34157, "epoch": 282} {"train_loss": -32.403194427490234, "global_step": 34158, "epoch": 282} {"train_loss": -32.74876403808594, "global_step": 34159, "epoch": 282} {"train_loss": -32.96212387084961, "global_step": 34160, "epoch": 282} {"train_loss": -33.15315628051758, "global_step": 34161, "epoch": 282} {"train_loss": -32.86262130737305, "global_step": 34162, "epoch": 282} {"train_loss": -32.55491256713867, "global_step": 34163, "epoch": 282} {"train_loss": -33.17560958862305, "global_step": 34164, "epoch": 282} {"train_loss": -33.098323822021484, "global_step": 34165, "epoch": 282} {"train_loss": -32.758663177490234, "global_step": 34166, "epoch": 282} {"train_loss": -33.52313995361328, "global_step": 34167, "epoch": 282} {"train_loss": -33.24895095825195, "global_step": 34168, "epoch": 282} {"train_loss": -32.9444694519043, "global_step": 34169, "epoch": 282} {"train_loss": -33.59330368041992, "global_step": 34170, "epoch": 282} {"train_loss": -32.893611907958984, "global_step": 34171, "epoch": 282} {"train_loss": -33.234737396240234, "global_step": 34172, "epoch": 282} {"train_loss": -33.019386291503906, "global_step": 34173, "epoch": 282} {"train_loss": -33.609588623046875, "global_step": 34174, "epoch": 282} {"train_loss": -33.551856994628906, "global_step": 34175, "epoch": 282} {"train_loss": -33.103267669677734, "global_step": 34176, "epoch": 282} {"train_loss": -33.0357780456543, "global_step": 34177, "epoch": 282} {"train_loss": -33.67861557006836, "global_step": 34178, "epoch": 282} {"train_loss": -32.71855545043945, "global_step": 34179, "epoch": 282} {"train_loss": -33.362510681152344, "global_step": 34180, "epoch": 282} {"train_loss": -33.0219612121582, "global_step": 34181, "epoch": 282} {"train_loss": -33.48950958251953, "global_step": 34182, "epoch": 282} {"train_loss": -33.56216049194336, "global_step": 34183, "epoch": 282} {"train_loss": -32.1762580871582, "global_step": 34184, "epoch": 282} {"train_loss": -33.84964370727539, "global_step": 34185, "epoch": 282} {"train_loss": -33.2951774597168, "global_step": 34186, "epoch": 282} {"train_loss": -33.301483154296875, "global_step": 34187, "epoch": 282} {"train_loss": -32.720855712890625, "global_step": 34188, "epoch": 282} {"train_loss": -33.098506927490234, "global_step": 34189, "epoch": 282} {"train_loss": -32.76792526245117, "global_step": 34190, "epoch": 282} {"train_loss": -33.00072479248047, "global_step": 34191, "epoch": 282} {"train_loss": -32.90424728393555, "global_step": 34192, "epoch": 282} {"train_loss": -32.679046630859375, "global_step": 34193, "epoch": 282} {"train_loss": -33.408233642578125, "global_step": 34194, "epoch": 282} {"train_loss": -32.8700065612793, "global_step": 34195, "epoch": 282} {"train_loss": -32.52543258666992, "global_step": 34196, "epoch": 282} {"train_loss": -33.388671875, "global_step": 34197, "epoch": 282} {"train_loss": -32.60696792602539, "global_step": 34198, "epoch": 282} {"train_loss": -32.52315902709961, "global_step": 34199, "epoch": 282} {"train_loss": -31.806665420532227, "global_step": 34200, "epoch": 282} {"train_loss": -32.178436279296875, "global_step": 34201, "epoch": 282} {"train_loss": -32.19939041137695, "global_step": 34202, "epoch": 282} {"train_loss": -30.763830184936523, "global_step": 34203, "epoch": 282} {"train_loss": -21.41583251953125, "global_step": 34204, "epoch": 282} {"train_loss": -12.261950492858887, "global_step": 34205, "epoch": 282} {"train_loss": -29.052997589111328, "global_step": 34206, "epoch": 282} {"train_loss": -18.322885513305664, "global_step": 34207, "epoch": 282} {"train_loss": -23.48394775390625, "global_step": 34208, "epoch": 282} {"train_loss": -18.782148361206055, "global_step": 34209, "epoch": 282} {"train_loss": -23.18244743347168, "global_step": 34210, "epoch": 282} {"train_loss": -29.592212677001953, "global_step": 34211, "epoch": 282} {"train_loss": -23.285497665405273, "global_step": 34212, "epoch": 282} {"train_loss": -29.1507511138916, "global_step": 34213, "epoch": 282} {"train_loss": -24.81341552734375, "global_step": 34214, "epoch": 282} {"train_loss": -31.381641387939453, "global_step": 34215, "epoch": 282} {"train_loss": -29.545129776000977, "global_step": 34216, "epoch": 282} {"train_loss": -29.84539222717285, "global_step": 34217, "epoch": 282} {"train_loss": -29.639997482299805, "global_step": 34218, "epoch": 282} {"train_loss": -28.596054077148438, "global_step": 34219, "epoch": 282} {"train_loss": -31.22314453125, "global_step": 34220, "epoch": 282} {"train_loss": -30.963048934936523, "global_step": 34221, "epoch": 282} {"train_loss": -30.801071166992188, "global_step": 34222, "epoch": 282} {"train_loss": -31.47950553894043, "global_step": 34223, "epoch": 282} {"train_loss": -31.814733505249023, "global_step": 34224, "epoch": 282} {"train_loss": -30.9627628326416, "global_step": 34225, "epoch": 282} {"train_loss": -30.952346801757812, "global_step": 34226, "epoch": 282} {"train_loss": -31.633222579956055, "global_step": 34227, "epoch": 282} {"train_loss": -31.70570182800293, "global_step": 34228, "epoch": 282} {"train_loss": -31.1379451751709, "global_step": 34229, "epoch": 282} {"train_loss": -32.009727478027344, "global_step": 34230, "epoch": 282} {"train_loss": -32.12868118286133, "global_step": 34231, "epoch": 282} {"train_loss": -32.08039474487305, "global_step": 34232, "epoch": 282} {"train_loss": -32.210182189941406, "global_step": 34233, "epoch": 282} {"train_loss": -32.28101348876953, "global_step": 34234, "epoch": 282} {"train_loss": -32.425559997558594, "global_step": 34235, "epoch": 282} {"train_loss": -32.441993713378906, "global_step": 34236, "epoch": 282} {"train_loss": -32.41609573364258, "global_step": 34237, "epoch": 282} {"train_loss": -32.18842315673828, "global_step": 34238, "epoch": 282} {"train_loss": -32.30955123901367, "global_step": 34239, "epoch": 282} {"train_loss": -32.26662063598633, "global_step": 34240, "epoch": 282} {"train_loss": -32.7051887512207, "global_step": 34241, "epoch": 282} {"train_loss": -31.116558145885627, "global_step": 34242, "epoch": 282, "val_loss": 2465030.5} {"train_loss": -32.860382080078125, "global_step": 34243, "epoch": 283} {"train_loss": -32.448829650878906, "global_step": 34244, "epoch": 283} {"train_loss": -32.75593948364258, "global_step": 34245, "epoch": 283} {"train_loss": -32.849815368652344, "global_step": 34246, "epoch": 283} {"train_loss": -32.60697555541992, "global_step": 34247, "epoch": 283} {"train_loss": -33.103004455566406, "global_step": 34248, "epoch": 283} {"train_loss": -32.755855560302734, "global_step": 34249, "epoch": 283} {"train_loss": -32.624691009521484, "global_step": 34250, "epoch": 283} {"train_loss": -33.0758056640625, "global_step": 34251, "epoch": 283} {"train_loss": -32.999176025390625, "global_step": 34252, "epoch": 283} {"train_loss": -32.781124114990234, "global_step": 34253, "epoch": 283} {"train_loss": -32.9088020324707, "global_step": 34254, "epoch": 283} {"train_loss": -33.411991119384766, "global_step": 34255, "epoch": 283} {"train_loss": -32.0528564453125, "global_step": 34256, "epoch": 283} {"train_loss": -32.59693145751953, "global_step": 34257, "epoch": 283} {"train_loss": -33.06520080566406, "global_step": 34258, "epoch": 283} {"train_loss": -32.994903564453125, "global_step": 34259, "epoch": 283} {"train_loss": -32.72626495361328, "global_step": 34260, "epoch": 283} {"train_loss": -32.90341567993164, "global_step": 34261, "epoch": 283} {"train_loss": -33.07171630859375, "global_step": 34262, "epoch": 283} {"train_loss": -32.64702224731445, "global_step": 34263, "epoch": 283} {"train_loss": -33.020503997802734, "global_step": 34264, "epoch": 283} {"train_loss": -32.67927169799805, "global_step": 34265, "epoch": 283} {"train_loss": -32.011962890625, "global_step": 34266, "epoch": 283} {"train_loss": -31.693328857421875, "global_step": 34267, "epoch": 283} {"train_loss": -32.31482696533203, "global_step": 34268, "epoch": 283} {"train_loss": -32.383174896240234, "global_step": 34269, "epoch": 283} {"train_loss": -32.14985275268555, "global_step": 34270, "epoch": 283} {"train_loss": -32.37496566772461, "global_step": 34271, "epoch": 283} {"train_loss": -32.205406188964844, "global_step": 34272, "epoch": 283} {"train_loss": -31.2774658203125, "global_step": 34273, "epoch": 283} {"train_loss": -31.947193145751953, "global_step": 34274, "epoch": 283} {"train_loss": -32.211647033691406, "global_step": 34275, "epoch": 283} {"train_loss": -32.46474075317383, "global_step": 34276, "epoch": 283} {"train_loss": -32.466163635253906, "global_step": 34277, "epoch": 283} {"train_loss": -29.661060333251953, "global_step": 34278, "epoch": 283} {"train_loss": -31.494873046875, "global_step": 34279, "epoch": 283} {"train_loss": -31.05596351623535, "global_step": 34280, "epoch": 283} {"train_loss": -31.213613510131836, "global_step": 34281, "epoch": 283} {"train_loss": -31.787612915039062, "global_step": 34282, "epoch": 283} {"train_loss": -32.616092681884766, "global_step": 34283, "epoch": 283} {"train_loss": -32.20265579223633, "global_step": 34284, "epoch": 283} {"train_loss": -31.87066078186035, "global_step": 34285, "epoch": 283} {"train_loss": -32.09273147583008, "global_step": 34286, "epoch": 283} {"train_loss": -31.31902503967285, "global_step": 34287, "epoch": 283} {"train_loss": -32.3376579284668, "global_step": 34288, "epoch": 283} {"train_loss": -31.48000144958496, "global_step": 34289, "epoch": 283} {"train_loss": -30.3376407623291, "global_step": 34290, "epoch": 283} {"train_loss": -30.547712326049805, "global_step": 34291, "epoch": 283} {"train_loss": -31.672704696655273, "global_step": 34292, "epoch": 283} {"train_loss": -32.13772201538086, "global_step": 34293, "epoch": 283} {"train_loss": -31.314041137695312, "global_step": 34294, "epoch": 283} {"train_loss": -31.65879249572754, "global_step": 34295, "epoch": 283} {"train_loss": -31.91718864440918, "global_step": 34296, "epoch": 283} {"train_loss": -32.31631851196289, "global_step": 34297, "epoch": 283} {"train_loss": -32.320716857910156, "global_step": 34298, "epoch": 283} {"train_loss": -32.0364875793457, "global_step": 34299, "epoch": 283} {"train_loss": -32.31159973144531, "global_step": 34300, "epoch": 283} {"train_loss": -32.468135833740234, "global_step": 34301, "epoch": 283} {"train_loss": -32.46613693237305, "global_step": 34302, "epoch": 283} {"train_loss": -31.702314376831055, "global_step": 34303, "epoch": 283} {"train_loss": -32.3935661315918, "global_step": 34304, "epoch": 283} {"train_loss": -32.532230377197266, "global_step": 34305, "epoch": 283} {"train_loss": -32.144771575927734, "global_step": 34306, "epoch": 283} {"train_loss": -32.824317932128906, "global_step": 34307, "epoch": 283} {"train_loss": -32.65133285522461, "global_step": 34308, "epoch": 283} {"train_loss": -32.60089111328125, "global_step": 34309, "epoch": 283} {"train_loss": -32.98591232299805, "global_step": 34310, "epoch": 283} {"train_loss": -32.107704162597656, "global_step": 34311, "epoch": 283} {"train_loss": -30.106689453125, "global_step": 34312, "epoch": 283} {"train_loss": -32.183101654052734, "global_step": 34313, "epoch": 283} {"train_loss": -32.698238372802734, "global_step": 34314, "epoch": 283} {"train_loss": -32.43428421020508, "global_step": 34315, "epoch": 283} {"train_loss": -32.07568359375, "global_step": 34316, "epoch": 283} {"train_loss": -33.09275817871094, "global_step": 34317, "epoch": 283} {"train_loss": -31.578113555908203, "global_step": 34318, "epoch": 283} {"train_loss": -32.86753463745117, "global_step": 34319, "epoch": 283} {"train_loss": -32.751495361328125, "global_step": 34320, "epoch": 283} {"train_loss": -32.67757034301758, "global_step": 34321, "epoch": 283} {"train_loss": -32.600067138671875, "global_step": 34322, "epoch": 283} {"train_loss": -32.1746826171875, "global_step": 34323, "epoch": 283} {"train_loss": -33.35512924194336, "global_step": 34324, "epoch": 283} {"train_loss": -31.91506004333496, "global_step": 34325, "epoch": 283} {"train_loss": -32.946773529052734, "global_step": 34326, "epoch": 283} {"train_loss": -31.66596794128418, "global_step": 34327, "epoch": 283} {"train_loss": -32.98127365112305, "global_step": 34328, "epoch": 283} {"train_loss": -32.19817352294922, "global_step": 34329, "epoch": 283} {"train_loss": -32.97356033325195, "global_step": 34330, "epoch": 283} {"train_loss": -32.57197952270508, "global_step": 34331, "epoch": 283} {"train_loss": -33.11600112915039, "global_step": 34332, "epoch": 283} {"train_loss": -33.58515930175781, "global_step": 34333, "epoch": 283} {"train_loss": -33.63294219970703, "global_step": 34334, "epoch": 283} {"train_loss": -33.32547378540039, "global_step": 34335, "epoch": 283} {"train_loss": -33.837257385253906, "global_step": 34336, "epoch": 283} {"train_loss": -33.097747802734375, "global_step": 34337, "epoch": 283} {"train_loss": -33.766456604003906, "global_step": 34338, "epoch": 283} {"train_loss": -33.307464599609375, "global_step": 34339, "epoch": 283} {"train_loss": -33.888912200927734, "global_step": 34340, "epoch": 283} {"train_loss": -33.41749572753906, "global_step": 34341, "epoch": 283} {"train_loss": -33.670570373535156, "global_step": 34342, "epoch": 283} {"train_loss": -33.35187530517578, "global_step": 34343, "epoch": 283} {"train_loss": -32.3465576171875, "global_step": 34344, "epoch": 283} {"train_loss": -33.22601318359375, "global_step": 34345, "epoch": 283} {"train_loss": -33.929115295410156, "global_step": 34346, "epoch": 283} {"train_loss": -33.0866813659668, "global_step": 34347, "epoch": 283} {"train_loss": -33.05339813232422, "global_step": 34348, "epoch": 283} {"train_loss": -33.425846099853516, "global_step": 34349, "epoch": 283} {"train_loss": -32.212059020996094, "global_step": 34350, "epoch": 283} {"train_loss": -32.653499603271484, "global_step": 34351, "epoch": 283} {"train_loss": -32.265499114990234, "global_step": 34352, "epoch": 283} {"train_loss": -33.390132904052734, "global_step": 34353, "epoch": 283} {"train_loss": -32.644752502441406, "global_step": 34354, "epoch": 283} {"train_loss": -33.02341842651367, "global_step": 34355, "epoch": 283} {"train_loss": -32.08774948120117, "global_step": 34356, "epoch": 283} {"train_loss": -33.07576370239258, "global_step": 34357, "epoch": 283} {"train_loss": -32.40495681762695, "global_step": 34358, "epoch": 283} {"train_loss": -32.67380905151367, "global_step": 34359, "epoch": 283} {"train_loss": -32.772003173828125, "global_step": 34360, "epoch": 283} {"train_loss": -32.9206428527832, "global_step": 34361, "epoch": 283} {"train_loss": -33.2242546081543, "global_step": 34362, "epoch": 283} {"train_loss": -32.48912603204901, "global_step": 34363, "epoch": 283, "val_loss": 2526892.25} {"train_loss": -32.475215911865234, "global_step": 34364, "epoch": 284} {"train_loss": -32.7944221496582, "global_step": 34365, "epoch": 284} {"train_loss": -32.39191436767578, "global_step": 34366, "epoch": 284} {"train_loss": -31.57716941833496, "global_step": 34367, "epoch": 284} {"train_loss": -33.3713264465332, "global_step": 34368, "epoch": 284} {"train_loss": -33.044315338134766, "global_step": 34369, "epoch": 284} {"train_loss": -32.626399993896484, "global_step": 34370, "epoch": 284} {"train_loss": -32.12248611450195, "global_step": 34371, "epoch": 284} {"train_loss": -33.310176849365234, "global_step": 34372, "epoch": 284} {"train_loss": -32.77637481689453, "global_step": 34373, "epoch": 284} {"train_loss": -32.31107711791992, "global_step": 34374, "epoch": 284} {"train_loss": -32.164302825927734, "global_step": 34375, "epoch": 284} {"train_loss": -32.84407424926758, "global_step": 34376, "epoch": 284} {"train_loss": -33.097530364990234, "global_step": 34377, "epoch": 284} {"train_loss": -32.99375534057617, "global_step": 34378, "epoch": 284} {"train_loss": -32.2419548034668, "global_step": 34379, "epoch": 284} {"train_loss": -33.22796630859375, "global_step": 34380, "epoch": 284} {"train_loss": -31.661407470703125, "global_step": 34381, "epoch": 284} {"train_loss": -30.830121994018555, "global_step": 34382, "epoch": 284} {"train_loss": -31.57599449157715, "global_step": 34383, "epoch": 284} {"train_loss": -32.74327850341797, "global_step": 34384, "epoch": 284} {"train_loss": -31.893590927124023, "global_step": 34385, "epoch": 284} {"train_loss": -30.735177993774414, "global_step": 34386, "epoch": 284} {"train_loss": -31.224151611328125, "global_step": 34387, "epoch": 284} {"train_loss": -30.100845336914062, "global_step": 34388, "epoch": 284} {"train_loss": -31.54486656188965, "global_step": 34389, "epoch": 284} {"train_loss": -32.247032165527344, "global_step": 34390, "epoch": 284} {"train_loss": -30.74652099609375, "global_step": 34391, "epoch": 284} {"train_loss": -31.42469596862793, "global_step": 34392, "epoch": 284} {"train_loss": -32.060302734375, "global_step": 34393, "epoch": 284} {"train_loss": -31.598358154296875, "global_step": 34394, "epoch": 284} {"train_loss": -31.285863876342773, "global_step": 34395, "epoch": 284} {"train_loss": -31.757287979125977, "global_step": 34396, "epoch": 284} {"train_loss": -32.23612594604492, "global_step": 34397, "epoch": 284} {"train_loss": -32.56132125854492, "global_step": 34398, "epoch": 284} {"train_loss": -32.74758529663086, "global_step": 34399, "epoch": 284} {"train_loss": -31.34882164001465, "global_step": 34400, "epoch": 284} {"train_loss": -32.49892044067383, "global_step": 34401, "epoch": 284} {"train_loss": -32.045955657958984, "global_step": 34402, "epoch": 284} {"train_loss": -31.968557357788086, "global_step": 34403, "epoch": 284} {"train_loss": -32.60956954956055, "global_step": 34404, "epoch": 284} {"train_loss": -32.58901596069336, "global_step": 34405, "epoch": 284} {"train_loss": -32.590267181396484, "global_step": 34406, "epoch": 284} {"train_loss": -32.85213851928711, "global_step": 34407, "epoch": 284} {"train_loss": -32.80202102661133, "global_step": 34408, "epoch": 284} {"train_loss": -32.92377853393555, "global_step": 34409, "epoch": 284} {"train_loss": -33.42009735107422, "global_step": 34410, "epoch": 284} {"train_loss": -32.46553421020508, "global_step": 34411, "epoch": 284} {"train_loss": -32.45515060424805, "global_step": 34412, "epoch": 284} {"train_loss": -33.29551315307617, "global_step": 34413, "epoch": 284} {"train_loss": -32.611812591552734, "global_step": 34414, "epoch": 284} {"train_loss": -33.357818603515625, "global_step": 34415, "epoch": 284} {"train_loss": -32.686920166015625, "global_step": 34416, "epoch": 284} {"train_loss": -33.33529281616211, "global_step": 34417, "epoch": 284} {"train_loss": -33.17502212524414, "global_step": 34418, "epoch": 284} {"train_loss": -33.384639739990234, "global_step": 34419, "epoch": 284} {"train_loss": -32.99935531616211, "global_step": 34420, "epoch": 284} {"train_loss": -32.3458366394043, "global_step": 34421, "epoch": 284} {"train_loss": -33.28511428833008, "global_step": 34422, "epoch": 284} {"train_loss": -33.79144287109375, "global_step": 34423, "epoch": 284} {"train_loss": -33.32081985473633, "global_step": 34424, "epoch": 284} {"train_loss": -33.40138626098633, "global_step": 34425, "epoch": 284} {"train_loss": -33.553466796875, "global_step": 34426, "epoch": 284} {"train_loss": -33.2940673828125, "global_step": 34427, "epoch": 284} {"train_loss": -33.53398513793945, "global_step": 34428, "epoch": 284} {"train_loss": -33.1149787902832, "global_step": 34429, "epoch": 284} {"train_loss": -32.893898010253906, "global_step": 34430, "epoch": 284} {"train_loss": -33.733707427978516, "global_step": 34431, "epoch": 284} {"train_loss": -33.814064025878906, "global_step": 34432, "epoch": 284} {"train_loss": -33.91134262084961, "global_step": 34433, "epoch": 284} {"train_loss": -33.655914306640625, "global_step": 34434, "epoch": 284} {"train_loss": -33.34600830078125, "global_step": 34435, "epoch": 284} {"train_loss": -33.1922721862793, "global_step": 34436, "epoch": 284} {"train_loss": -34.288936614990234, "global_step": 34437, "epoch": 284} {"train_loss": -33.51385498046875, "global_step": 34438, "epoch": 284} {"train_loss": -33.26921463012695, "global_step": 34439, "epoch": 284} {"train_loss": -33.594642639160156, "global_step": 34440, "epoch": 284} {"train_loss": -32.271705627441406, "global_step": 34441, "epoch": 284} {"train_loss": -33.5400276184082, "global_step": 34442, "epoch": 284} {"train_loss": -33.723655700683594, "global_step": 34443, "epoch": 284} {"train_loss": -34.01502227783203, "global_step": 34444, "epoch": 284} {"train_loss": -33.837127685546875, "global_step": 34445, "epoch": 284} {"train_loss": -33.6235466003418, "global_step": 34446, "epoch": 284} {"train_loss": -34.29499053955078, "global_step": 34447, "epoch": 284} {"train_loss": -33.49055099487305, "global_step": 34448, "epoch": 284} {"train_loss": -33.40610885620117, "global_step": 34449, "epoch": 284} {"train_loss": -32.42571258544922, "global_step": 34450, "epoch": 284} {"train_loss": -33.97296142578125, "global_step": 34451, "epoch": 284} {"train_loss": -34.0306510925293, "global_step": 34452, "epoch": 284} {"train_loss": -33.4705696105957, "global_step": 34453, "epoch": 284} {"train_loss": -31.756799697875977, "global_step": 34454, "epoch": 284} {"train_loss": -27.737873077392578, "global_step": 34455, "epoch": 284} {"train_loss": -26.353717803955078, "global_step": 34456, "epoch": 284} {"train_loss": -27.105010986328125, "global_step": 34457, "epoch": 284} {"train_loss": -29.759923934936523, "global_step": 34458, "epoch": 284} {"train_loss": -30.941503524780273, "global_step": 34459, "epoch": 284} {"train_loss": -29.602514266967773, "global_step": 34460, "epoch": 284} {"train_loss": -32.54165267944336, "global_step": 34461, "epoch": 284} {"train_loss": -29.359344482421875, "global_step": 34462, "epoch": 284} {"train_loss": -32.0719108581543, "global_step": 34463, "epoch": 284} {"train_loss": -31.861438751220703, "global_step": 34464, "epoch": 284} {"train_loss": -32.43787384033203, "global_step": 34465, "epoch": 284} {"train_loss": -31.634235382080078, "global_step": 34466, "epoch": 284} {"train_loss": -32.88923645019531, "global_step": 34467, "epoch": 284} {"train_loss": -31.98237419128418, "global_step": 34468, "epoch": 284} {"train_loss": -32.611507415771484, "global_step": 34469, "epoch": 284} {"train_loss": -32.296329498291016, "global_step": 34470, "epoch": 284} {"train_loss": -32.48228073120117, "global_step": 34471, "epoch": 284} {"train_loss": -33.29397201538086, "global_step": 34472, "epoch": 284} {"train_loss": -32.89847946166992, "global_step": 34473, "epoch": 284} {"train_loss": -32.071388244628906, "global_step": 34474, "epoch": 284} {"train_loss": -32.589962005615234, "global_step": 34475, "epoch": 284} {"train_loss": -33.2662353515625, "global_step": 34476, "epoch": 284} {"train_loss": -32.24880599975586, "global_step": 34477, "epoch": 284} {"train_loss": -32.539852142333984, "global_step": 34478, "epoch": 284} {"train_loss": -33.27992630004883, "global_step": 34479, "epoch": 284} {"train_loss": -33.15416717529297, "global_step": 34480, "epoch": 284} {"train_loss": -32.844818115234375, "global_step": 34481, "epoch": 284} {"train_loss": -33.08121871948242, "global_step": 34482, "epoch": 284} {"train_loss": -32.469764709472656, "global_step": 34483, "epoch": 284} {"train_loss": -32.48013589401876, "global_step": 34484, "epoch": 284, "val_loss": 2588190.25} {"train_loss": -32.27388381958008, "global_step": 34485, "epoch": 285} {"train_loss": -33.35551452636719, "global_step": 34486, "epoch": 285} {"train_loss": -33.505714416503906, "global_step": 34487, "epoch": 285} {"train_loss": -32.892147064208984, "global_step": 34488, "epoch": 285} {"train_loss": -31.872182846069336, "global_step": 34489, "epoch": 285} {"train_loss": -31.60114860534668, "global_step": 34490, "epoch": 285} {"train_loss": -33.340789794921875, "global_step": 34491, "epoch": 285} {"train_loss": -33.02553939819336, "global_step": 34492, "epoch": 285} {"train_loss": -31.82337760925293, "global_step": 34493, "epoch": 285} {"train_loss": -31.809707641601562, "global_step": 34494, "epoch": 285} {"train_loss": -32.289737701416016, "global_step": 34495, "epoch": 285} {"train_loss": -32.48972702026367, "global_step": 34496, "epoch": 285} {"train_loss": -32.0898323059082, "global_step": 34497, "epoch": 285} {"train_loss": -33.5789794921875, "global_step": 34498, "epoch": 285} {"train_loss": -32.54093551635742, "global_step": 34499, "epoch": 285} {"train_loss": -32.894527435302734, "global_step": 34500, "epoch": 285} {"train_loss": -32.76082229614258, "global_step": 34501, "epoch": 285} {"train_loss": -31.84113883972168, "global_step": 34502, "epoch": 285} {"train_loss": -33.28424072265625, "global_step": 34503, "epoch": 285} {"train_loss": -32.309139251708984, "global_step": 34504, "epoch": 285} {"train_loss": -33.770668029785156, "global_step": 34505, "epoch": 285} {"train_loss": -33.47904586791992, "global_step": 34506, "epoch": 285} {"train_loss": -32.66062545776367, "global_step": 34507, "epoch": 285} {"train_loss": -33.460906982421875, "global_step": 34508, "epoch": 285} {"train_loss": -32.418094635009766, "global_step": 34509, "epoch": 285} {"train_loss": -33.292640686035156, "global_step": 34510, "epoch": 285} {"train_loss": -32.463104248046875, "global_step": 34511, "epoch": 285} {"train_loss": -33.62717819213867, "global_step": 34512, "epoch": 285} {"train_loss": -32.011775970458984, "global_step": 34513, "epoch": 285} {"train_loss": -33.60366439819336, "global_step": 34514, "epoch": 285} {"train_loss": -33.42856979370117, "global_step": 34515, "epoch": 285} {"train_loss": -33.48225784301758, "global_step": 34516, "epoch": 285} {"train_loss": -32.450347900390625, "global_step": 34517, "epoch": 285} {"train_loss": -33.09316635131836, "global_step": 34518, "epoch": 285} {"train_loss": -32.22333908081055, "global_step": 34519, "epoch": 285} {"train_loss": -32.148345947265625, "global_step": 34520, "epoch": 285} {"train_loss": -29.97137451171875, "global_step": 34521, "epoch": 285} {"train_loss": -30.61861228942871, "global_step": 34522, "epoch": 285} {"train_loss": -29.110387802124023, "global_step": 34523, "epoch": 285} {"train_loss": -28.340051651000977, "global_step": 34524, "epoch": 285} {"train_loss": -29.249380111694336, "global_step": 34525, "epoch": 285} {"train_loss": -31.732831954956055, "global_step": 34526, "epoch": 285} {"train_loss": -31.958328247070312, "global_step": 34527, "epoch": 285} {"train_loss": -30.4468994140625, "global_step": 34528, "epoch": 285} {"train_loss": -31.716527938842773, "global_step": 34529, "epoch": 285} {"train_loss": -32.89377975463867, "global_step": 34530, "epoch": 285} {"train_loss": -31.283756256103516, "global_step": 34531, "epoch": 285} {"train_loss": -31.8283634185791, "global_step": 34532, "epoch": 285} {"train_loss": -32.16645431518555, "global_step": 34533, "epoch": 285} {"train_loss": -32.30393600463867, "global_step": 34534, "epoch": 285} {"train_loss": -31.880084991455078, "global_step": 34535, "epoch": 285} {"train_loss": -30.75189208984375, "global_step": 34536, "epoch": 285} {"train_loss": -32.313987731933594, "global_step": 34537, "epoch": 285} {"train_loss": -32.30991744995117, "global_step": 34538, "epoch": 285} {"train_loss": -31.662275314331055, "global_step": 34539, "epoch": 285} {"train_loss": -32.2507438659668, "global_step": 34540, "epoch": 285} {"train_loss": -32.026824951171875, "global_step": 34541, "epoch": 285} {"train_loss": -31.355335235595703, "global_step": 34542, "epoch": 285} {"train_loss": -32.2335319519043, "global_step": 34543, "epoch": 285} {"train_loss": -32.2104377746582, "global_step": 34544, "epoch": 285} {"train_loss": -32.47454833984375, "global_step": 34545, "epoch": 285} {"train_loss": -32.63740158081055, "global_step": 34546, "epoch": 285} {"train_loss": -32.742469787597656, "global_step": 34547, "epoch": 285} {"train_loss": -32.578163146972656, "global_step": 34548, "epoch": 285} {"train_loss": -33.1931266784668, "global_step": 34549, "epoch": 285} {"train_loss": -32.83308792114258, "global_step": 34550, "epoch": 285} {"train_loss": -32.58216857910156, "global_step": 34551, "epoch": 285} {"train_loss": -33.12030029296875, "global_step": 34552, "epoch": 285} {"train_loss": -33.150020599365234, "global_step": 34553, "epoch": 285} {"train_loss": -33.2564582824707, "global_step": 34554, "epoch": 285} {"train_loss": -33.35767364501953, "global_step": 34555, "epoch": 285} {"train_loss": -33.02850341796875, "global_step": 34556, "epoch": 285} {"train_loss": -33.221160888671875, "global_step": 34557, "epoch": 285} {"train_loss": -32.827754974365234, "global_step": 34558, "epoch": 285} {"train_loss": -32.99477767944336, "global_step": 34559, "epoch": 285} {"train_loss": -33.686336517333984, "global_step": 34560, "epoch": 285} {"train_loss": -33.38602828979492, "global_step": 34561, "epoch": 285} {"train_loss": -33.192134857177734, "global_step": 34562, "epoch": 285} {"train_loss": -33.53757095336914, "global_step": 34563, "epoch": 285} {"train_loss": -33.37496566772461, "global_step": 34564, "epoch": 285} {"train_loss": -33.86147689819336, "global_step": 34565, "epoch": 285} {"train_loss": -33.88290023803711, "global_step": 34566, "epoch": 285} {"train_loss": -33.97514724731445, "global_step": 34567, "epoch": 285} {"train_loss": -33.7951774597168, "global_step": 34568, "epoch": 285} {"train_loss": -33.729286193847656, "global_step": 34569, "epoch": 285} {"train_loss": -33.7971305847168, "global_step": 34570, "epoch": 285} {"train_loss": -34.183902740478516, "global_step": 34571, "epoch": 285} {"train_loss": -33.996551513671875, "global_step": 34572, "epoch": 285} {"train_loss": -34.03189468383789, "global_step": 34573, "epoch": 285} {"train_loss": -33.4361572265625, "global_step": 34574, "epoch": 285} {"train_loss": -34.31246566772461, "global_step": 34575, "epoch": 285} {"train_loss": -34.008636474609375, "global_step": 34576, "epoch": 285} {"train_loss": -34.391334533691406, "global_step": 34577, "epoch": 285} {"train_loss": -33.11613082885742, "global_step": 34578, "epoch": 285} {"train_loss": -34.42005920410156, "global_step": 34579, "epoch": 285} {"train_loss": -33.5704460144043, "global_step": 34580, "epoch": 285} {"train_loss": -33.86945724487305, "global_step": 34581, "epoch": 285} {"train_loss": -33.723487854003906, "global_step": 34582, "epoch": 285} {"train_loss": -33.46450424194336, "global_step": 34583, "epoch": 285} {"train_loss": -34.09586715698242, "global_step": 34584, "epoch": 285} {"train_loss": -33.98124313354492, "global_step": 34585, "epoch": 285} {"train_loss": -33.38630676269531, "global_step": 34586, "epoch": 285} {"train_loss": -33.89992904663086, "global_step": 34587, "epoch": 285} {"train_loss": -34.37058639526367, "global_step": 34588, "epoch": 285} {"train_loss": -34.133033752441406, "global_step": 34589, "epoch": 285} {"train_loss": -33.68681716918945, "global_step": 34590, "epoch": 285} {"train_loss": -32.6724739074707, "global_step": 34591, "epoch": 285} {"train_loss": -34.23006057739258, "global_step": 34592, "epoch": 285} {"train_loss": -34.01449203491211, "global_step": 34593, "epoch": 285} {"train_loss": -33.472469329833984, "global_step": 34594, "epoch": 285} {"train_loss": -33.5279426574707, "global_step": 34595, "epoch": 285} {"train_loss": -32.90278244018555, "global_step": 34596, "epoch": 285} {"train_loss": -32.42567825317383, "global_step": 34597, "epoch": 285} {"train_loss": -32.35799789428711, "global_step": 34598, "epoch": 285} {"train_loss": -32.59316635131836, "global_step": 34599, "epoch": 285} {"train_loss": -31.402912139892578, "global_step": 34600, "epoch": 285} {"train_loss": -31.06776237487793, "global_step": 34601, "epoch": 285} {"train_loss": -28.1712589263916, "global_step": 34602, "epoch": 285} {"train_loss": -23.627689361572266, "global_step": 34603, "epoch": 285} {"train_loss": -19.645709991455078, "global_step": 34604, "epoch": 285} {"train_loss": -32.49461101500456, "global_step": 34605, "epoch": 285, "val_loss": 2605599.0} {"train_loss": -32.1396484375, "global_step": 34606, "epoch": 286} {"train_loss": -28.6004695892334, "global_step": 34607, "epoch": 286} {"train_loss": -31.691925048828125, "global_step": 34608, "epoch": 286} {"train_loss": -30.00880241394043, "global_step": 34609, "epoch": 286} {"train_loss": -32.672298431396484, "global_step": 34610, "epoch": 286} {"train_loss": -30.998258590698242, "global_step": 34611, "epoch": 286} {"train_loss": -32.531639099121094, "global_step": 34612, "epoch": 286} {"train_loss": -32.125732421875, "global_step": 34613, "epoch": 286} {"train_loss": -32.40653610229492, "global_step": 34614, "epoch": 286} {"train_loss": -32.777767181396484, "global_step": 34615, "epoch": 286} {"train_loss": -31.85498046875, "global_step": 34616, "epoch": 286} {"train_loss": -31.62466812133789, "global_step": 34617, "epoch": 286} {"train_loss": -33.03121566772461, "global_step": 34618, "epoch": 286} {"train_loss": -31.52252197265625, "global_step": 34619, "epoch": 286} {"train_loss": -32.50654602050781, "global_step": 34620, "epoch": 286} {"train_loss": -33.04973602294922, "global_step": 34621, "epoch": 286} {"train_loss": -31.34197998046875, "global_step": 34622, "epoch": 286} {"train_loss": -32.40839767456055, "global_step": 34623, "epoch": 286} {"train_loss": -32.09262466430664, "global_step": 34624, "epoch": 286} {"train_loss": -32.52052307128906, "global_step": 34625, "epoch": 286} {"train_loss": -32.1894645690918, "global_step": 34626, "epoch": 286} {"train_loss": -32.62453079223633, "global_step": 34627, "epoch": 286} {"train_loss": -31.84396743774414, "global_step": 34628, "epoch": 286} {"train_loss": -31.96343421936035, "global_step": 34629, "epoch": 286} {"train_loss": -31.047988891601562, "global_step": 34630, "epoch": 286} {"train_loss": -31.157224655151367, "global_step": 34631, "epoch": 286} {"train_loss": -32.21798324584961, "global_step": 34632, "epoch": 286} {"train_loss": -31.238540649414062, "global_step": 34633, "epoch": 286} {"train_loss": -32.72475814819336, "global_step": 34634, "epoch": 286} {"train_loss": -32.30781173706055, "global_step": 34635, "epoch": 286} {"train_loss": -32.44501495361328, "global_step": 34636, "epoch": 286} {"train_loss": -31.43893814086914, "global_step": 34637, "epoch": 286} {"train_loss": -32.08720779418945, "global_step": 34638, "epoch": 286} {"train_loss": -32.74860763549805, "global_step": 34639, "epoch": 286} {"train_loss": -32.5914306640625, "global_step": 34640, "epoch": 286} {"train_loss": -32.44747543334961, "global_step": 34641, "epoch": 286} {"train_loss": -32.6031608581543, "global_step": 34642, "epoch": 286} {"train_loss": -32.436038970947266, "global_step": 34643, "epoch": 286} {"train_loss": -32.36180877685547, "global_step": 34644, "epoch": 286} {"train_loss": -32.84383010864258, "global_step": 34645, "epoch": 286} {"train_loss": -32.657264709472656, "global_step": 34646, "epoch": 286} {"train_loss": -33.19667434692383, "global_step": 34647, "epoch": 286} {"train_loss": -33.195472717285156, "global_step": 34648, "epoch": 286} {"train_loss": -32.662418365478516, "global_step": 34649, "epoch": 286} {"train_loss": -32.582759857177734, "global_step": 34650, "epoch": 286} {"train_loss": -33.04669189453125, "global_step": 34651, "epoch": 286} {"train_loss": -32.87575912475586, "global_step": 34652, "epoch": 286} {"train_loss": -33.506526947021484, "global_step": 34653, "epoch": 286} {"train_loss": -32.79666519165039, "global_step": 34654, "epoch": 286} {"train_loss": -33.48485565185547, "global_step": 34655, "epoch": 286} {"train_loss": -33.41771697998047, "global_step": 34656, "epoch": 286} {"train_loss": -33.26182174682617, "global_step": 34657, "epoch": 286} {"train_loss": -33.21737289428711, "global_step": 34658, "epoch": 286} {"train_loss": -33.13683319091797, "global_step": 34659, "epoch": 286} {"train_loss": -32.98663330078125, "global_step": 34660, "epoch": 286} {"train_loss": -33.6082878112793, "global_step": 34661, "epoch": 286} {"train_loss": -32.419097900390625, "global_step": 34662, "epoch": 286} {"train_loss": -31.968048095703125, "global_step": 34663, "epoch": 286} {"train_loss": -32.74110794067383, "global_step": 34664, "epoch": 286} {"train_loss": -31.436201095581055, "global_step": 34665, "epoch": 286} {"train_loss": -33.17891311645508, "global_step": 34666, "epoch": 286} {"train_loss": -32.420570373535156, "global_step": 34667, "epoch": 286} {"train_loss": -32.321998596191406, "global_step": 34668, "epoch": 286} {"train_loss": -33.61506271362305, "global_step": 34669, "epoch": 286} {"train_loss": -32.40104293823242, "global_step": 34670, "epoch": 286} {"train_loss": -33.9499626159668, "global_step": 34671, "epoch": 286} {"train_loss": -32.9815673828125, "global_step": 34672, "epoch": 286} {"train_loss": -33.25678634643555, "global_step": 34673, "epoch": 286} {"train_loss": -33.49929428100586, "global_step": 34674, "epoch": 286} {"train_loss": -32.93699264526367, "global_step": 34675, "epoch": 286} {"train_loss": -33.61350631713867, "global_step": 34676, "epoch": 286} {"train_loss": -32.49594497680664, "global_step": 34677, "epoch": 286} {"train_loss": -33.41743087768555, "global_step": 34678, "epoch": 286} {"train_loss": -33.43595504760742, "global_step": 34679, "epoch": 286} {"train_loss": -33.47738265991211, "global_step": 34680, "epoch": 286} {"train_loss": -34.081329345703125, "global_step": 34681, "epoch": 286} {"train_loss": -33.95335006713867, "global_step": 34682, "epoch": 286} {"train_loss": -33.528926849365234, "global_step": 34683, "epoch": 286} {"train_loss": -33.626708984375, "global_step": 34684, "epoch": 286} {"train_loss": -33.4266357421875, "global_step": 34685, "epoch": 286} {"train_loss": -33.884246826171875, "global_step": 34686, "epoch": 286} {"train_loss": -33.982208251953125, "global_step": 34687, "epoch": 286} {"train_loss": -33.48604202270508, "global_step": 34688, "epoch": 286} {"train_loss": -33.684871673583984, "global_step": 34689, "epoch": 286} {"train_loss": -33.088897705078125, "global_step": 34690, "epoch": 286} {"train_loss": -33.188655853271484, "global_step": 34691, "epoch": 286} {"train_loss": -33.4401741027832, "global_step": 34692, "epoch": 286} {"train_loss": -33.285640716552734, "global_step": 34693, "epoch": 286} {"train_loss": -32.3547477722168, "global_step": 34694, "epoch": 286} {"train_loss": -32.8858528137207, "global_step": 34695, "epoch": 286} {"train_loss": -33.39899444580078, "global_step": 34696, "epoch": 286} {"train_loss": -33.54832077026367, "global_step": 34697, "epoch": 286} {"train_loss": -33.240665435791016, "global_step": 34698, "epoch": 286} {"train_loss": -32.734375, "global_step": 34699, "epoch": 286} {"train_loss": -31.519128799438477, "global_step": 34700, "epoch": 286} {"train_loss": -32.620338439941406, "global_step": 34701, "epoch": 286} {"train_loss": -32.87400436401367, "global_step": 34702, "epoch": 286} {"train_loss": -32.32273483276367, "global_step": 34703, "epoch": 286} {"train_loss": -32.565643310546875, "global_step": 34704, "epoch": 286} {"train_loss": -33.36687088012695, "global_step": 34705, "epoch": 286} {"train_loss": -33.164710998535156, "global_step": 34706, "epoch": 286} {"train_loss": -32.8580207824707, "global_step": 34707, "epoch": 286} {"train_loss": -31.36982536315918, "global_step": 34708, "epoch": 286} {"train_loss": -32.927581787109375, "global_step": 34709, "epoch": 286} {"train_loss": -33.01360321044922, "global_step": 34710, "epoch": 286} {"train_loss": -32.887020111083984, "global_step": 34711, "epoch": 286} {"train_loss": -32.538368225097656, "global_step": 34712, "epoch": 286} {"train_loss": -33.410762786865234, "global_step": 34713, "epoch": 286} {"train_loss": -33.28459548950195, "global_step": 34714, "epoch": 286} {"train_loss": -32.471229553222656, "global_step": 34715, "epoch": 286} {"train_loss": -32.206764221191406, "global_step": 34716, "epoch": 286} {"train_loss": -32.577186584472656, "global_step": 34717, "epoch": 286} {"train_loss": -32.79541778564453, "global_step": 34718, "epoch": 286} {"train_loss": -33.52963638305664, "global_step": 34719, "epoch": 286} {"train_loss": -33.421836853027344, "global_step": 34720, "epoch": 286} {"train_loss": -33.429779052734375, "global_step": 34721, "epoch": 286} {"train_loss": -33.67545700073242, "global_step": 34722, "epoch": 286} {"train_loss": -33.963497161865234, "global_step": 34723, "epoch": 286} {"train_loss": -33.76072311401367, "global_step": 34724, "epoch": 286} {"train_loss": -33.858943939208984, "global_step": 34725, "epoch": 286} {"train_loss": -32.74215603662916, "global_step": 34726, "epoch": 286, "val_loss": 2523397.0} {"train_loss": -33.92034912109375, "global_step": 34727, "epoch": 287} {"train_loss": -34.17085266113281, "global_step": 34728, "epoch": 287} {"train_loss": -33.66107177734375, "global_step": 34729, "epoch": 287} {"train_loss": -33.622249603271484, "global_step": 34730, "epoch": 287} {"train_loss": -33.63943099975586, "global_step": 34731, "epoch": 287} {"train_loss": -33.871395111083984, "global_step": 34732, "epoch": 287} {"train_loss": -33.636043548583984, "global_step": 34733, "epoch": 287} {"train_loss": -33.837947845458984, "global_step": 34734, "epoch": 287} {"train_loss": -33.99882888793945, "global_step": 34735, "epoch": 287} {"train_loss": -34.08109664916992, "global_step": 34736, "epoch": 287} {"train_loss": -34.1375732421875, "global_step": 34737, "epoch": 287} {"train_loss": -34.02449035644531, "global_step": 34738, "epoch": 287} {"train_loss": -34.172054290771484, "global_step": 34739, "epoch": 287} {"train_loss": -34.26359558105469, "global_step": 34740, "epoch": 287} {"train_loss": -34.537200927734375, "global_step": 34741, "epoch": 287} {"train_loss": -34.567291259765625, "global_step": 34742, "epoch": 287} {"train_loss": -34.61980056762695, "global_step": 34743, "epoch": 287} {"train_loss": -34.15147018432617, "global_step": 34744, "epoch": 287} {"train_loss": -33.674739837646484, "global_step": 34745, "epoch": 287} {"train_loss": -33.36421585083008, "global_step": 34746, "epoch": 287} {"train_loss": -31.965076446533203, "global_step": 34747, "epoch": 287} {"train_loss": -30.94671630859375, "global_step": 34748, "epoch": 287} {"train_loss": -27.51975440979004, "global_step": 34749, "epoch": 287} {"train_loss": -25.802526473999023, "global_step": 34750, "epoch": 287} {"train_loss": -29.65750503540039, "global_step": 34751, "epoch": 287} {"train_loss": -32.986602783203125, "global_step": 34752, "epoch": 287} {"train_loss": -32.07780075073242, "global_step": 34753, "epoch": 287} {"train_loss": -32.73798370361328, "global_step": 34754, "epoch": 287} {"train_loss": -33.35333251953125, "global_step": 34755, "epoch": 287} {"train_loss": -33.20127487182617, "global_step": 34756, "epoch": 287} {"train_loss": -34.023345947265625, "global_step": 34757, "epoch": 287} {"train_loss": -33.708465576171875, "global_step": 34758, "epoch": 287} {"train_loss": -32.94680404663086, "global_step": 34759, "epoch": 287} {"train_loss": -33.60871124267578, "global_step": 34760, "epoch": 287} {"train_loss": -33.48226547241211, "global_step": 34761, "epoch": 287} {"train_loss": -33.18760299682617, "global_step": 34762, "epoch": 287} {"train_loss": -29.779178619384766, "global_step": 34763, "epoch": 287} {"train_loss": -32.57524490356445, "global_step": 34764, "epoch": 287} {"train_loss": -33.64451217651367, "global_step": 34765, "epoch": 287} {"train_loss": -31.817157745361328, "global_step": 34766, "epoch": 287} {"train_loss": -33.24177551269531, "global_step": 34767, "epoch": 287} {"train_loss": -32.28635787963867, "global_step": 34768, "epoch": 287} {"train_loss": -33.586509704589844, "global_step": 34769, "epoch": 287} {"train_loss": -32.423851013183594, "global_step": 34770, "epoch": 287} {"train_loss": -32.47060775756836, "global_step": 34771, "epoch": 287} {"train_loss": -33.13826370239258, "global_step": 34772, "epoch": 287} {"train_loss": -33.531410217285156, "global_step": 34773, "epoch": 287} {"train_loss": -31.95584487915039, "global_step": 34774, "epoch": 287} {"train_loss": -33.387977600097656, "global_step": 34775, "epoch": 287} {"train_loss": -33.41157150268555, "global_step": 34776, "epoch": 287} {"train_loss": -33.21326446533203, "global_step": 34777, "epoch": 287} {"train_loss": -33.292236328125, "global_step": 34778, "epoch": 287} {"train_loss": -33.70168685913086, "global_step": 34779, "epoch": 287} {"train_loss": -33.32794952392578, "global_step": 34780, "epoch": 287} {"train_loss": -33.36684036254883, "global_step": 34781, "epoch": 287} {"train_loss": -32.984107971191406, "global_step": 34782, "epoch": 287} {"train_loss": -33.27606964111328, "global_step": 34783, "epoch": 287} {"train_loss": -33.872314453125, "global_step": 34784, "epoch": 287} {"train_loss": -33.32230758666992, "global_step": 34785, "epoch": 287} {"train_loss": -33.698455810546875, "global_step": 34786, "epoch": 287} {"train_loss": -33.273468017578125, "global_step": 34787, "epoch": 287} {"train_loss": -34.041542053222656, "global_step": 34788, "epoch": 287} {"train_loss": -34.11595153808594, "global_step": 34789, "epoch": 287} {"train_loss": -33.16664505004883, "global_step": 34790, "epoch": 287} {"train_loss": -33.7037353515625, "global_step": 34791, "epoch": 287} {"train_loss": -33.41475296020508, "global_step": 34792, "epoch": 287} {"train_loss": -34.19234085083008, "global_step": 34793, "epoch": 287} {"train_loss": -33.52570343017578, "global_step": 34794, "epoch": 287} {"train_loss": -33.04487991333008, "global_step": 34795, "epoch": 287} {"train_loss": -33.0882682800293, "global_step": 34796, "epoch": 287} {"train_loss": -32.648345947265625, "global_step": 34797, "epoch": 287} {"train_loss": -31.461271286010742, "global_step": 34798, "epoch": 287} {"train_loss": -29.659570693969727, "global_step": 34799, "epoch": 287} {"train_loss": -32.12139892578125, "global_step": 34800, "epoch": 287} {"train_loss": -33.42619705200195, "global_step": 34801, "epoch": 287} {"train_loss": -32.86236572265625, "global_step": 34802, "epoch": 287} {"train_loss": -32.09719467163086, "global_step": 34803, "epoch": 287} {"train_loss": -31.434499740600586, "global_step": 34804, "epoch": 287} {"train_loss": -32.724220275878906, "global_step": 34805, "epoch": 287} {"train_loss": -33.50505065917969, "global_step": 34806, "epoch": 287} {"train_loss": -32.55076599121094, "global_step": 34807, "epoch": 287} {"train_loss": -32.929500579833984, "global_step": 34808, "epoch": 287} {"train_loss": -33.518310546875, "global_step": 34809, "epoch": 287} {"train_loss": -33.414031982421875, "global_step": 34810, "epoch": 287} {"train_loss": -33.86511993408203, "global_step": 34811, "epoch": 287} {"train_loss": -33.684417724609375, "global_step": 34812, "epoch": 287} {"train_loss": -33.19771957397461, "global_step": 34813, "epoch": 287} {"train_loss": -34.36843490600586, "global_step": 34814, "epoch": 287} {"train_loss": -33.49726486206055, "global_step": 34815, "epoch": 287} {"train_loss": -33.85441970825195, "global_step": 34816, "epoch": 287} {"train_loss": -34.302852630615234, "global_step": 34817, "epoch": 287} {"train_loss": -33.908912658691406, "global_step": 34818, "epoch": 287} {"train_loss": -33.84510040283203, "global_step": 34819, "epoch": 287} {"train_loss": -33.84542465209961, "global_step": 34820, "epoch": 287} {"train_loss": -34.105106353759766, "global_step": 34821, "epoch": 287} {"train_loss": -33.8346061706543, "global_step": 34822, "epoch": 287} {"train_loss": -33.420467376708984, "global_step": 34823, "epoch": 287} {"train_loss": -33.858734130859375, "global_step": 34824, "epoch": 287} {"train_loss": -33.925262451171875, "global_step": 34825, "epoch": 287} {"train_loss": -33.73543167114258, "global_step": 34826, "epoch": 287} {"train_loss": -33.75599670410156, "global_step": 34827, "epoch": 287} {"train_loss": -33.52613067626953, "global_step": 34828, "epoch": 287} {"train_loss": -32.8789176940918, "global_step": 34829, "epoch": 287} {"train_loss": -32.40584945678711, "global_step": 34830, "epoch": 287} {"train_loss": -32.80747604370117, "global_step": 34831, "epoch": 287} {"train_loss": -33.48381423950195, "global_step": 34832, "epoch": 287} {"train_loss": -33.297607421875, "global_step": 34833, "epoch": 287} {"train_loss": -32.58198165893555, "global_step": 34834, "epoch": 287} {"train_loss": -32.846920013427734, "global_step": 34835, "epoch": 287} {"train_loss": -33.6098747253418, "global_step": 34836, "epoch": 287} {"train_loss": -33.395957946777344, "global_step": 34837, "epoch": 287} {"train_loss": -32.402523040771484, "global_step": 34838, "epoch": 287} {"train_loss": -33.03450012207031, "global_step": 34839, "epoch": 287} {"train_loss": -33.41768264770508, "global_step": 34840, "epoch": 287} {"train_loss": -32.41512680053711, "global_step": 34841, "epoch": 287} {"train_loss": -33.2142448425293, "global_step": 34842, "epoch": 287} {"train_loss": -32.60699462890625, "global_step": 34843, "epoch": 287} {"train_loss": -33.49875259399414, "global_step": 34844, "epoch": 287} {"train_loss": -32.4904670715332, "global_step": 34845, "epoch": 287} {"train_loss": -33.6993522644043, "global_step": 34846, "epoch": 287} {"train_loss": -33.12751919770044, "global_step": 34847, "epoch": 287, "val_loss": 2625421.25} {"train_loss": -32.9879035949707, "global_step": 34848, "epoch": 288} {"train_loss": -33.4575080871582, "global_step": 34849, "epoch": 288} {"train_loss": -33.2531852722168, "global_step": 34850, "epoch": 288} {"train_loss": -33.60691833496094, "global_step": 34851, "epoch": 288} {"train_loss": -33.77496337890625, "global_step": 34852, "epoch": 288} {"train_loss": -33.48980712890625, "global_step": 34853, "epoch": 288} {"train_loss": -33.8288688659668, "global_step": 34854, "epoch": 288} {"train_loss": -33.56249237060547, "global_step": 34855, "epoch": 288} {"train_loss": -33.84942626953125, "global_step": 34856, "epoch": 288} {"train_loss": -33.82856750488281, "global_step": 34857, "epoch": 288} {"train_loss": -33.50151824951172, "global_step": 34858, "epoch": 288} {"train_loss": -33.06602478027344, "global_step": 34859, "epoch": 288} {"train_loss": -33.80793762207031, "global_step": 34860, "epoch": 288} {"train_loss": -34.374507904052734, "global_step": 34861, "epoch": 288} {"train_loss": -33.354217529296875, "global_step": 34862, "epoch": 288} {"train_loss": -34.33076095581055, "global_step": 34863, "epoch": 288} {"train_loss": -34.494014739990234, "global_step": 34864, "epoch": 288} {"train_loss": -33.59830856323242, "global_step": 34865, "epoch": 288} {"train_loss": -33.744808197021484, "global_step": 34866, "epoch": 288} {"train_loss": -33.91316604614258, "global_step": 34867, "epoch": 288} {"train_loss": -34.35020446777344, "global_step": 34868, "epoch": 288} {"train_loss": -34.11188888549805, "global_step": 34869, "epoch": 288} {"train_loss": -33.953548431396484, "global_step": 34870, "epoch": 288} {"train_loss": -34.22768020629883, "global_step": 34871, "epoch": 288} {"train_loss": -34.298309326171875, "global_step": 34872, "epoch": 288} {"train_loss": -34.21952438354492, "global_step": 34873, "epoch": 288} {"train_loss": -34.56888961791992, "global_step": 34874, "epoch": 288} {"train_loss": -34.36281967163086, "global_step": 34875, "epoch": 288} {"train_loss": -34.33252716064453, "global_step": 34876, "epoch": 288} {"train_loss": -34.48780059814453, "global_step": 34877, "epoch": 288} {"train_loss": -34.711238861083984, "global_step": 34878, "epoch": 288} {"train_loss": -34.36353302001953, "global_step": 34879, "epoch": 288} {"train_loss": -34.551204681396484, "global_step": 34880, "epoch": 288} {"train_loss": -34.50399398803711, "global_step": 34881, "epoch": 288} {"train_loss": -34.42893981933594, "global_step": 34882, "epoch": 288} {"train_loss": -34.3062744140625, "global_step": 34883, "epoch": 288} {"train_loss": -34.10446548461914, "global_step": 34884, "epoch": 288} {"train_loss": -33.24494934082031, "global_step": 34885, "epoch": 288} {"train_loss": -28.340106964111328, "global_step": 34886, "epoch": 288} {"train_loss": -3.7691895961761475, "global_step": 34887, "epoch": 288} {"train_loss": 33.902339935302734, "global_step": 34888, "epoch": 288} {"train_loss": -9.31917667388916, "global_step": 34889, "epoch": 288} {"train_loss": -23.110641479492188, "global_step": 34890, "epoch": 288} {"train_loss": -27.81377601623535, "global_step": 34891, "epoch": 288} {"train_loss": -19.877470016479492, "global_step": 34892, "epoch": 288} {"train_loss": -32.23374938964844, "global_step": 34893, "epoch": 288} {"train_loss": -29.241168975830078, "global_step": 34894, "epoch": 288} {"train_loss": -26.789840698242188, "global_step": 34895, "epoch": 288} {"train_loss": -30.329736709594727, "global_step": 34896, "epoch": 288} {"train_loss": -32.48263168334961, "global_step": 34897, "epoch": 288} {"train_loss": -32.03106689453125, "global_step": 34898, "epoch": 288} {"train_loss": -30.874420166015625, "global_step": 34899, "epoch": 288} {"train_loss": -30.344125747680664, "global_step": 34900, "epoch": 288} {"train_loss": -30.777082443237305, "global_step": 34901, "epoch": 288} {"train_loss": -32.48807907104492, "global_step": 34902, "epoch": 288} {"train_loss": -32.69110870361328, "global_step": 34903, "epoch": 288} {"train_loss": -31.85068130493164, "global_step": 34904, "epoch": 288} {"train_loss": -31.88751220703125, "global_step": 34905, "epoch": 288} {"train_loss": -31.509973526000977, "global_step": 34906, "epoch": 288} {"train_loss": -32.187782287597656, "global_step": 34907, "epoch": 288} {"train_loss": -32.098628997802734, "global_step": 34908, "epoch": 288} {"train_loss": -32.24843215942383, "global_step": 34909, "epoch": 288} {"train_loss": -32.535091400146484, "global_step": 34910, "epoch": 288} {"train_loss": -32.57161331176758, "global_step": 34911, "epoch": 288} {"train_loss": -32.376678466796875, "global_step": 34912, "epoch": 288} {"train_loss": -32.32468795776367, "global_step": 34913, "epoch": 288} {"train_loss": -32.884910583496094, "global_step": 34914, "epoch": 288} {"train_loss": -32.51013946533203, "global_step": 34915, "epoch": 288} {"train_loss": -32.4219970703125, "global_step": 34916, "epoch": 288} {"train_loss": -32.94540023803711, "global_step": 34917, "epoch": 288} {"train_loss": -33.394744873046875, "global_step": 34918, "epoch": 288} {"train_loss": -33.00288009643555, "global_step": 34919, "epoch": 288} {"train_loss": -32.84096145629883, "global_step": 34920, "epoch": 288} {"train_loss": -33.13801956176758, "global_step": 34921, "epoch": 288} {"train_loss": -32.6792106628418, "global_step": 34922, "epoch": 288} {"train_loss": -33.10468673706055, "global_step": 34923, "epoch": 288} {"train_loss": -32.89949417114258, "global_step": 34924, "epoch": 288} {"train_loss": -33.160274505615234, "global_step": 34925, "epoch": 288} {"train_loss": -33.54195022583008, "global_step": 34926, "epoch": 288} {"train_loss": -33.7328987121582, "global_step": 34927, "epoch": 288} {"train_loss": -33.511775970458984, "global_step": 34928, "epoch": 288} {"train_loss": -33.800323486328125, "global_step": 34929, "epoch": 288} {"train_loss": -33.390560150146484, "global_step": 34930, "epoch": 288} {"train_loss": -33.54757308959961, "global_step": 34931, "epoch": 288} {"train_loss": -33.805110931396484, "global_step": 34932, "epoch": 288} {"train_loss": -33.19438934326172, "global_step": 34933, "epoch": 288} {"train_loss": -32.928409576416016, "global_step": 34934, "epoch": 288} {"train_loss": -33.72687530517578, "global_step": 34935, "epoch": 288} {"train_loss": -32.78456115722656, "global_step": 34936, "epoch": 288} {"train_loss": -32.8593864440918, "global_step": 34937, "epoch": 288} {"train_loss": -33.122554779052734, "global_step": 34938, "epoch": 288} {"train_loss": -32.63886642456055, "global_step": 34939, "epoch": 288} {"train_loss": -33.17403030395508, "global_step": 34940, "epoch": 288} {"train_loss": -33.10821533203125, "global_step": 34941, "epoch": 288} {"train_loss": -32.55461883544922, "global_step": 34942, "epoch": 288} {"train_loss": -33.215396881103516, "global_step": 34943, "epoch": 288} {"train_loss": -33.33484649658203, "global_step": 34944, "epoch": 288} {"train_loss": -32.297298431396484, "global_step": 34945, "epoch": 288} {"train_loss": -33.39958572387695, "global_step": 34946, "epoch": 288} {"train_loss": -32.176177978515625, "global_step": 34947, "epoch": 288} {"train_loss": -33.081451416015625, "global_step": 34948, "epoch": 288} {"train_loss": -32.847896575927734, "global_step": 34949, "epoch": 288} {"train_loss": -33.563629150390625, "global_step": 34950, "epoch": 288} {"train_loss": -33.13616943359375, "global_step": 34951, "epoch": 288} {"train_loss": -33.20455551147461, "global_step": 34952, "epoch": 288} {"train_loss": -33.14535140991211, "global_step": 34953, "epoch": 288} {"train_loss": -32.812721252441406, "global_step": 34954, "epoch": 288} {"train_loss": -33.186317443847656, "global_step": 34955, "epoch": 288} {"train_loss": -33.49080276489258, "global_step": 34956, "epoch": 288} {"train_loss": -33.03754806518555, "global_step": 34957, "epoch": 288} {"train_loss": -33.40993118286133, "global_step": 34958, "epoch": 288} {"train_loss": -32.828495025634766, "global_step": 34959, "epoch": 288} {"train_loss": -32.959564208984375, "global_step": 34960, "epoch": 288} {"train_loss": -30.481201171875, "global_step": 34961, "epoch": 288} {"train_loss": -22.391826629638672, "global_step": 34962, "epoch": 288} {"train_loss": -4.550961971282959, "global_step": 34963, "epoch": 288} {"train_loss": 38.195125579833984, "global_step": 34964, "epoch": 288} {"train_loss": 13.79248046875, "global_step": 34965, "epoch": 288} {"train_loss": -25.475706100463867, "global_step": 34966, "epoch": 288} {"train_loss": -8.339274406433105, "global_step": 34967, "epoch": 288} {"train_loss": -30.112052344093637, "global_step": 34968, "epoch": 288, "val_loss": 2536990.25} {"train_loss": -25.663908004760742, "global_step": 34969, "epoch": 289} {"train_loss": -21.121679306030273, "global_step": 34970, "epoch": 289} {"train_loss": -19.94374656677246, "global_step": 34971, "epoch": 289} {"train_loss": -29.887853622436523, "global_step": 34972, "epoch": 289} {"train_loss": -28.50398063659668, "global_step": 34973, "epoch": 289} {"train_loss": -27.19290542602539, "global_step": 34974, "epoch": 289} {"train_loss": -27.424535751342773, "global_step": 34975, "epoch": 289} {"train_loss": -26.041122436523438, "global_step": 34976, "epoch": 289} {"train_loss": -28.95185661315918, "global_step": 34977, "epoch": 289} {"train_loss": -29.73529624938965, "global_step": 34978, "epoch": 289} {"train_loss": -29.72348976135254, "global_step": 34979, "epoch": 289} {"train_loss": -29.9218692779541, "global_step": 34980, "epoch": 289} {"train_loss": -29.689685821533203, "global_step": 34981, "epoch": 289} {"train_loss": -28.76314353942871, "global_step": 34982, "epoch": 289} {"train_loss": -29.025104522705078, "global_step": 34983, "epoch": 289} {"train_loss": -29.49594497680664, "global_step": 34984, "epoch": 289} {"train_loss": -29.533588409423828, "global_step": 34985, "epoch": 289} {"train_loss": -30.192785263061523, "global_step": 34986, "epoch": 289} {"train_loss": -30.030609130859375, "global_step": 34987, "epoch": 289} {"train_loss": -30.443811416625977, "global_step": 34988, "epoch": 289} {"train_loss": -30.314260482788086, "global_step": 34989, "epoch": 289} {"train_loss": -30.04316520690918, "global_step": 34990, "epoch": 289} {"train_loss": -30.128711700439453, "global_step": 34991, "epoch": 289} {"train_loss": -30.17266273498535, "global_step": 34992, "epoch": 289} {"train_loss": -30.333038330078125, "global_step": 34993, "epoch": 289} {"train_loss": -30.158771514892578, "global_step": 34994, "epoch": 289} {"train_loss": -30.524587631225586, "global_step": 34995, "epoch": 289} {"train_loss": -30.70600700378418, "global_step": 34996, "epoch": 289} {"train_loss": -30.569122314453125, "global_step": 34997, "epoch": 289} {"train_loss": -30.97471046447754, "global_step": 34998, "epoch": 289} {"train_loss": -30.796972274780273, "global_step": 34999, "epoch": 289} {"train_loss": -31.213666915893555, "global_step": 35000, "epoch": 289} {"train_loss": -30.902509689331055, "global_step": 35001, "epoch": 289} {"train_loss": -30.997297286987305, "global_step": 35002, "epoch": 289} {"train_loss": -31.23727798461914, "global_step": 35003, "epoch": 289} {"train_loss": -30.97820472717285, "global_step": 35004, "epoch": 289} {"train_loss": -31.394346237182617, "global_step": 35005, "epoch": 289} {"train_loss": -31.20745849609375, "global_step": 35006, "epoch": 289} {"train_loss": -31.797077178955078, "global_step": 35007, "epoch": 289} {"train_loss": -31.474109649658203, "global_step": 35008, "epoch": 289} {"train_loss": -31.301467895507812, "global_step": 35009, "epoch": 289} {"train_loss": -31.814407348632812, "global_step": 35010, "epoch": 289} {"train_loss": -31.866931915283203, "global_step": 35011, "epoch": 289} {"train_loss": -31.51009178161621, "global_step": 35012, "epoch": 289} {"train_loss": -31.46661949157715, "global_step": 35013, "epoch": 289} {"train_loss": -32.01319122314453, "global_step": 35014, "epoch": 289} {"train_loss": -32.342872619628906, "global_step": 35015, "epoch": 289} {"train_loss": -32.06974411010742, "global_step": 35016, "epoch": 289} {"train_loss": -31.912799835205078, "global_step": 35017, "epoch": 289} {"train_loss": -32.20329666137695, "global_step": 35018, "epoch": 289} {"train_loss": -32.14260482788086, "global_step": 35019, "epoch": 289} {"train_loss": -32.51739501953125, "global_step": 35020, "epoch": 289} {"train_loss": -32.51969909667969, "global_step": 35021, "epoch": 289} {"train_loss": -32.17856979370117, "global_step": 35022, "epoch": 289} {"train_loss": -32.0882568359375, "global_step": 35023, "epoch": 289} {"train_loss": -32.33907699584961, "global_step": 35024, "epoch": 289} {"train_loss": -32.45895004272461, "global_step": 35025, "epoch": 289} {"train_loss": -32.1513557434082, "global_step": 35026, "epoch": 289} {"train_loss": -31.393781661987305, "global_step": 35027, "epoch": 289} {"train_loss": -32.1888542175293, "global_step": 35028, "epoch": 289} {"train_loss": -30.642108917236328, "global_step": 35029, "epoch": 289} {"train_loss": -28.14082145690918, "global_step": 35030, "epoch": 289} {"train_loss": -28.310211181640625, "global_step": 35031, "epoch": 289} {"train_loss": -28.744821548461914, "global_step": 35032, "epoch": 289} {"train_loss": -31.392578125, "global_step": 35033, "epoch": 289} {"train_loss": -29.002460479736328, "global_step": 35034, "epoch": 289} {"train_loss": -31.132587432861328, "global_step": 35035, "epoch": 289} {"train_loss": -30.567291259765625, "global_step": 35036, "epoch": 289} {"train_loss": -31.470746994018555, "global_step": 35037, "epoch": 289} {"train_loss": -30.698007583618164, "global_step": 35038, "epoch": 289} {"train_loss": -30.81081199645996, "global_step": 35039, "epoch": 289} {"train_loss": -31.56275749206543, "global_step": 35040, "epoch": 289} {"train_loss": -31.334814071655273, "global_step": 35041, "epoch": 289} {"train_loss": -31.40358543395996, "global_step": 35042, "epoch": 289} {"train_loss": -31.34793472290039, "global_step": 35043, "epoch": 289} {"train_loss": -31.76336097717285, "global_step": 35044, "epoch": 289} {"train_loss": -30.382675170898438, "global_step": 35045, "epoch": 289} {"train_loss": -31.42413330078125, "global_step": 35046, "epoch": 289} {"train_loss": -31.316953659057617, "global_step": 35047, "epoch": 289} {"train_loss": -31.556310653686523, "global_step": 35048, "epoch": 289} {"train_loss": -31.57111167907715, "global_step": 35049, "epoch": 289} {"train_loss": -31.565826416015625, "global_step": 35050, "epoch": 289} {"train_loss": -31.514265060424805, "global_step": 35051, "epoch": 289} {"train_loss": -31.85562515258789, "global_step": 35052, "epoch": 289} {"train_loss": -31.67255210876465, "global_step": 35053, "epoch": 289} {"train_loss": -31.88361930847168, "global_step": 35054, "epoch": 289} {"train_loss": -31.0895938873291, "global_step": 35055, "epoch": 289} {"train_loss": -32.20960235595703, "global_step": 35056, "epoch": 289} {"train_loss": -31.871353149414062, "global_step": 35057, "epoch": 289} {"train_loss": -32.03342819213867, "global_step": 35058, "epoch": 289} {"train_loss": -32.13213348388672, "global_step": 35059, "epoch": 289} {"train_loss": -31.73075294494629, "global_step": 35060, "epoch": 289} {"train_loss": -31.840133666992188, "global_step": 35061, "epoch": 289} {"train_loss": -32.31867980957031, "global_step": 35062, "epoch": 289} {"train_loss": -32.28663635253906, "global_step": 35063, "epoch": 289} {"train_loss": -32.04305648803711, "global_step": 35064, "epoch": 289} {"train_loss": -32.42900466918945, "global_step": 35065, "epoch": 289} {"train_loss": -31.973623275756836, "global_step": 35066, "epoch": 289} {"train_loss": -32.42047882080078, "global_step": 35067, "epoch": 289} {"train_loss": -32.143245697021484, "global_step": 35068, "epoch": 289} {"train_loss": -32.1578483581543, "global_step": 35069, "epoch": 289} {"train_loss": -32.558528900146484, "global_step": 35070, "epoch": 289} {"train_loss": -32.259212493896484, "global_step": 35071, "epoch": 289} {"train_loss": -31.942819595336914, "global_step": 35072, "epoch": 289} {"train_loss": -32.259429931640625, "global_step": 35073, "epoch": 289} {"train_loss": -31.744611740112305, "global_step": 35074, "epoch": 289} {"train_loss": -32.41122055053711, "global_step": 35075, "epoch": 289} {"train_loss": -31.6427059173584, "global_step": 35076, "epoch": 289} {"train_loss": -32.442081451416016, "global_step": 35077, "epoch": 289} {"train_loss": -32.399810791015625, "global_step": 35078, "epoch": 289} {"train_loss": -32.678138732910156, "global_step": 35079, "epoch": 289} {"train_loss": -32.437103271484375, "global_step": 35080, "epoch": 289} {"train_loss": -32.13652038574219, "global_step": 35081, "epoch": 289} {"train_loss": -30.608352661132812, "global_step": 35082, "epoch": 289} {"train_loss": -32.10230255126953, "global_step": 35083, "epoch": 289} {"train_loss": -32.13870620727539, "global_step": 35084, "epoch": 289} {"train_loss": -32.22738265991211, "global_step": 35085, "epoch": 289} {"train_loss": -32.14443588256836, "global_step": 35086, "epoch": 289} {"train_loss": -32.50640106201172, "global_step": 35087, "epoch": 289} {"train_loss": -32.532344818115234, "global_step": 35088, "epoch": 289} {"train_loss": -30.95188016339767, "global_step": 35089, "epoch": 289, "val_loss": 2592759.25} {"train_loss": -32.687652587890625, "global_step": 35090, "epoch": 290} {"train_loss": -32.323760986328125, "global_step": 35091, "epoch": 290} {"train_loss": -31.136693954467773, "global_step": 35092, "epoch": 290} {"train_loss": -31.618677139282227, "global_step": 35093, "epoch": 290} {"train_loss": -31.860248565673828, "global_step": 35094, "epoch": 290} {"train_loss": -32.09224319458008, "global_step": 35095, "epoch": 290} {"train_loss": -31.72611427307129, "global_step": 35096, "epoch": 290} {"train_loss": -32.058929443359375, "global_step": 35097, "epoch": 290} {"train_loss": -32.20577621459961, "global_step": 35098, "epoch": 290} {"train_loss": -32.41173553466797, "global_step": 35099, "epoch": 290} {"train_loss": -32.33623123168945, "global_step": 35100, "epoch": 290} {"train_loss": -32.44580841064453, "global_step": 35101, "epoch": 290} {"train_loss": -32.006385803222656, "global_step": 35102, "epoch": 290} {"train_loss": -32.79877471923828, "global_step": 35103, "epoch": 290} {"train_loss": -32.60976791381836, "global_step": 35104, "epoch": 290} {"train_loss": -32.44684600830078, "global_step": 35105, "epoch": 290} {"train_loss": -32.28715896606445, "global_step": 35106, "epoch": 290} {"train_loss": -32.8552360534668, "global_step": 35107, "epoch": 290} {"train_loss": -32.35888671875, "global_step": 35108, "epoch": 290} {"train_loss": -32.924503326416016, "global_step": 35109, "epoch": 290} {"train_loss": -32.58156204223633, "global_step": 35110, "epoch": 290} {"train_loss": -32.91627502441406, "global_step": 35111, "epoch": 290} {"train_loss": -32.75295639038086, "global_step": 35112, "epoch": 290} {"train_loss": -32.99459457397461, "global_step": 35113, "epoch": 290} {"train_loss": -32.04193878173828, "global_step": 35114, "epoch": 290} {"train_loss": -32.967323303222656, "global_step": 35115, "epoch": 290} {"train_loss": -32.913299560546875, "global_step": 35116, "epoch": 290} {"train_loss": -32.450923919677734, "global_step": 35117, "epoch": 290} {"train_loss": -31.50592041015625, "global_step": 35118, "epoch": 290} {"train_loss": -32.09262466430664, "global_step": 35119, "epoch": 290} {"train_loss": -32.62223434448242, "global_step": 35120, "epoch": 290} {"train_loss": -30.63861656188965, "global_step": 35121, "epoch": 290} {"train_loss": -32.55024337768555, "global_step": 35122, "epoch": 290} {"train_loss": -32.37574005126953, "global_step": 35123, "epoch": 290} {"train_loss": -31.505313873291016, "global_step": 35124, "epoch": 290} {"train_loss": -32.37224197387695, "global_step": 35125, "epoch": 290} {"train_loss": -32.27582931518555, "global_step": 35126, "epoch": 290} {"train_loss": -31.52997398376465, "global_step": 35127, "epoch": 290} {"train_loss": -31.886220932006836, "global_step": 35128, "epoch": 290} {"train_loss": -31.871341705322266, "global_step": 35129, "epoch": 290} {"train_loss": -31.9675235748291, "global_step": 35130, "epoch": 290} {"train_loss": -32.497581481933594, "global_step": 35131, "epoch": 290} {"train_loss": -32.048683166503906, "global_step": 35132, "epoch": 290} {"train_loss": -32.03609085083008, "global_step": 35133, "epoch": 290} {"train_loss": -32.51063537597656, "global_step": 35134, "epoch": 290} {"train_loss": -32.39191436767578, "global_step": 35135, "epoch": 290} {"train_loss": -32.537227630615234, "global_step": 35136, "epoch": 290} {"train_loss": -32.93557357788086, "global_step": 35137, "epoch": 290} {"train_loss": -32.27375793457031, "global_step": 35138, "epoch": 290} {"train_loss": -31.721450805664062, "global_step": 35139, "epoch": 290} {"train_loss": -31.54778480529785, "global_step": 35140, "epoch": 290} {"train_loss": -31.857635498046875, "global_step": 35141, "epoch": 290} {"train_loss": -32.40023422241211, "global_step": 35142, "epoch": 290} {"train_loss": -31.4451961517334, "global_step": 35143, "epoch": 290} {"train_loss": -32.467987060546875, "global_step": 35144, "epoch": 290} {"train_loss": -32.251136779785156, "global_step": 35145, "epoch": 290} {"train_loss": -31.689489364624023, "global_step": 35146, "epoch": 290} {"train_loss": -30.683725357055664, "global_step": 35147, "epoch": 290} {"train_loss": -30.62421989440918, "global_step": 35148, "epoch": 290} {"train_loss": -32.639434814453125, "global_step": 35149, "epoch": 290} {"train_loss": -32.365474700927734, "global_step": 35150, "epoch": 290} {"train_loss": -31.28177833557129, "global_step": 35151, "epoch": 290} {"train_loss": -31.266021728515625, "global_step": 35152, "epoch": 290} {"train_loss": -31.734853744506836, "global_step": 35153, "epoch": 290} {"train_loss": -32.17924118041992, "global_step": 35154, "epoch": 290} {"train_loss": -31.570026397705078, "global_step": 35155, "epoch": 290} {"train_loss": -31.950403213500977, "global_step": 35156, "epoch": 290} {"train_loss": -32.5521125793457, "global_step": 35157, "epoch": 290} {"train_loss": -31.835590362548828, "global_step": 35158, "epoch": 290} {"train_loss": -31.512409210205078, "global_step": 35159, "epoch": 290} {"train_loss": -32.58284378051758, "global_step": 35160, "epoch": 290} {"train_loss": -32.0374755859375, "global_step": 35161, "epoch": 290} {"train_loss": -32.2860107421875, "global_step": 35162, "epoch": 290} {"train_loss": -31.204299926757812, "global_step": 35163, "epoch": 290} {"train_loss": -31.936508178710938, "global_step": 35164, "epoch": 290} {"train_loss": -32.72459030151367, "global_step": 35165, "epoch": 290} {"train_loss": -32.035125732421875, "global_step": 35166, "epoch": 290} {"train_loss": -32.0150260925293, "global_step": 35167, "epoch": 290} {"train_loss": -32.385738372802734, "global_step": 35168, "epoch": 290} {"train_loss": -32.261871337890625, "global_step": 35169, "epoch": 290} {"train_loss": -32.251888275146484, "global_step": 35170, "epoch": 290} {"train_loss": -31.7200927734375, "global_step": 35171, "epoch": 290} {"train_loss": -32.961727142333984, "global_step": 35172, "epoch": 290} {"train_loss": -32.02885055541992, "global_step": 35173, "epoch": 290} {"train_loss": -32.578853607177734, "global_step": 35174, "epoch": 290} {"train_loss": -32.85232162475586, "global_step": 35175, "epoch": 290} {"train_loss": -32.379425048828125, "global_step": 35176, "epoch": 290} {"train_loss": -32.44498825073242, "global_step": 35177, "epoch": 290} {"train_loss": -32.09760665893555, "global_step": 35178, "epoch": 290} {"train_loss": -32.41897201538086, "global_step": 35179, "epoch": 290} {"train_loss": -32.530853271484375, "global_step": 35180, "epoch": 290} {"train_loss": -32.41009521484375, "global_step": 35181, "epoch": 290} {"train_loss": -32.82760238647461, "global_step": 35182, "epoch": 290} {"train_loss": -32.603050231933594, "global_step": 35183, "epoch": 290} {"train_loss": -32.783180236816406, "global_step": 35184, "epoch": 290} {"train_loss": -32.25210189819336, "global_step": 35185, "epoch": 290} {"train_loss": -32.827125549316406, "global_step": 35186, "epoch": 290} {"train_loss": -32.35270309448242, "global_step": 35187, "epoch": 290} {"train_loss": -32.769954681396484, "global_step": 35188, "epoch": 290} {"train_loss": -32.97282791137695, "global_step": 35189, "epoch": 290} {"train_loss": -32.89223861694336, "global_step": 35190, "epoch": 290} {"train_loss": -31.94900894165039, "global_step": 35191, "epoch": 290} {"train_loss": -32.332767486572266, "global_step": 35192, "epoch": 290} {"train_loss": -32.639278411865234, "global_step": 35193, "epoch": 290} {"train_loss": -32.46842575073242, "global_step": 35194, "epoch": 290} {"train_loss": -32.850868225097656, "global_step": 35195, "epoch": 290} {"train_loss": -31.919748306274414, "global_step": 35196, "epoch": 290} {"train_loss": -31.677600860595703, "global_step": 35197, "epoch": 290} {"train_loss": -31.8537540435791, "global_step": 35198, "epoch": 290} {"train_loss": -32.775760650634766, "global_step": 35199, "epoch": 290} {"train_loss": -32.17144775390625, "global_step": 35200, "epoch": 290} {"train_loss": -32.061744689941406, "global_step": 35201, "epoch": 290} {"train_loss": -31.808521270751953, "global_step": 35202, "epoch": 290} {"train_loss": -32.267974853515625, "global_step": 35203, "epoch": 290} {"train_loss": -32.68366622924805, "global_step": 35204, "epoch": 290} {"train_loss": -32.24799728393555, "global_step": 35205, "epoch": 290} {"train_loss": -32.33830642700195, "global_step": 35206, "epoch": 290} {"train_loss": -32.55506134033203, "global_step": 35207, "epoch": 290} {"train_loss": -32.54807662963867, "global_step": 35208, "epoch": 290} {"train_loss": -33.02503967285156, "global_step": 35209, "epoch": 290} {"train_loss": -32.233919269782454, "global_step": 35210, "epoch": 290, "val_loss": 2612806.75} {"train_loss": -32.61608123779297, "global_step": 35211, "epoch": 291} {"train_loss": -32.889617919921875, "global_step": 35212, "epoch": 291} {"train_loss": -32.48249053955078, "global_step": 35213, "epoch": 291} {"train_loss": -32.50260543823242, "global_step": 35214, "epoch": 291} {"train_loss": -33.209957122802734, "global_step": 35215, "epoch": 291} {"train_loss": -33.19923782348633, "global_step": 35216, "epoch": 291} {"train_loss": -32.34764099121094, "global_step": 35217, "epoch": 291} {"train_loss": -32.92615509033203, "global_step": 35218, "epoch": 291} {"train_loss": -31.234983444213867, "global_step": 35219, "epoch": 291} {"train_loss": -27.09247398376465, "global_step": 35220, "epoch": 291} {"train_loss": -21.52023696899414, "global_step": 35221, "epoch": 291} {"train_loss": -26.792835235595703, "global_step": 35222, "epoch": 291} {"train_loss": -32.99924850463867, "global_step": 35223, "epoch": 291} {"train_loss": -30.85713005065918, "global_step": 35224, "epoch": 291} {"train_loss": -32.13996505737305, "global_step": 35225, "epoch": 291} {"train_loss": -32.3532829284668, "global_step": 35226, "epoch": 291} {"train_loss": -31.535934448242188, "global_step": 35227, "epoch": 291} {"train_loss": -32.39402389526367, "global_step": 35228, "epoch": 291} {"train_loss": -32.931331634521484, "global_step": 35229, "epoch": 291} {"train_loss": -32.761390686035156, "global_step": 35230, "epoch": 291} {"train_loss": -32.746734619140625, "global_step": 35231, "epoch": 291} {"train_loss": -32.89651107788086, "global_step": 35232, "epoch": 291} {"train_loss": -33.00418472290039, "global_step": 35233, "epoch": 291} {"train_loss": -32.61465072631836, "global_step": 35234, "epoch": 291} {"train_loss": -32.961700439453125, "global_step": 35235, "epoch": 291} {"train_loss": -32.979957580566406, "global_step": 35236, "epoch": 291} {"train_loss": -32.8267707824707, "global_step": 35237, "epoch": 291} {"train_loss": -33.274688720703125, "global_step": 35238, "epoch": 291} {"train_loss": -32.80367660522461, "global_step": 35239, "epoch": 291} {"train_loss": -33.0050163269043, "global_step": 35240, "epoch": 291} {"train_loss": -33.12215805053711, "global_step": 35241, "epoch": 291} {"train_loss": -33.123695373535156, "global_step": 35242, "epoch": 291} {"train_loss": -33.303955078125, "global_step": 35243, "epoch": 291} {"train_loss": -32.887542724609375, "global_step": 35244, "epoch": 291} {"train_loss": -33.146751403808594, "global_step": 35245, "epoch": 291} {"train_loss": -33.30573654174805, "global_step": 35246, "epoch": 291} {"train_loss": -33.424495697021484, "global_step": 35247, "epoch": 291} {"train_loss": -33.51161575317383, "global_step": 35248, "epoch": 291} {"train_loss": -33.07515335083008, "global_step": 35249, "epoch": 291} {"train_loss": -33.79383087158203, "global_step": 35250, "epoch": 291} {"train_loss": -33.29336929321289, "global_step": 35251, "epoch": 291} {"train_loss": -33.4207878112793, "global_step": 35252, "epoch": 291} {"train_loss": -33.682003021240234, "global_step": 35253, "epoch": 291} {"train_loss": -33.13009262084961, "global_step": 35254, "epoch": 291} {"train_loss": -33.32429122924805, "global_step": 35255, "epoch": 291} {"train_loss": -33.40129470825195, "global_step": 35256, "epoch": 291} {"train_loss": -33.32012176513672, "global_step": 35257, "epoch": 291} {"train_loss": -33.42542266845703, "global_step": 35258, "epoch": 291} {"train_loss": -33.77490997314453, "global_step": 35259, "epoch": 291} {"train_loss": -33.84455108642578, "global_step": 35260, "epoch": 291} {"train_loss": -32.857666015625, "global_step": 35261, "epoch": 291} {"train_loss": -32.62077713012695, "global_step": 35262, "epoch": 291} {"train_loss": -32.64921188354492, "global_step": 35263, "epoch": 291} {"train_loss": -28.45295524597168, "global_step": 35264, "epoch": 291} {"train_loss": -21.99263572692871, "global_step": 35265, "epoch": 291} {"train_loss": -21.208011627197266, "global_step": 35266, "epoch": 291} {"train_loss": -21.638168334960938, "global_step": 35267, "epoch": 291} {"train_loss": -23.28269386291504, "global_step": 35268, "epoch": 291} {"train_loss": -22.273452758789062, "global_step": 35269, "epoch": 291} {"train_loss": -24.423925399780273, "global_step": 35270, "epoch": 291} {"train_loss": -27.232412338256836, "global_step": 35271, "epoch": 291} {"train_loss": -26.459964752197266, "global_step": 35272, "epoch": 291} {"train_loss": -28.38592529296875, "global_step": 35273, "epoch": 291} {"train_loss": -28.863983154296875, "global_step": 35274, "epoch": 291} {"train_loss": -28.9930477142334, "global_step": 35275, "epoch": 291} {"train_loss": -30.399484634399414, "global_step": 35276, "epoch": 291} {"train_loss": -29.73080825805664, "global_step": 35277, "epoch": 291} {"train_loss": -30.07504653930664, "global_step": 35278, "epoch": 291} {"train_loss": -30.93263053894043, "global_step": 35279, "epoch": 291} {"train_loss": -31.030065536499023, "global_step": 35280, "epoch": 291} {"train_loss": -30.808897018432617, "global_step": 35281, "epoch": 291} {"train_loss": -31.4791202545166, "global_step": 35282, "epoch": 291} {"train_loss": -31.807462692260742, "global_step": 35283, "epoch": 291} {"train_loss": -31.31978416442871, "global_step": 35284, "epoch": 291} {"train_loss": -32.111202239990234, "global_step": 35285, "epoch": 291} {"train_loss": -32.225765228271484, "global_step": 35286, "epoch": 291} {"train_loss": -32.31594467163086, "global_step": 35287, "epoch": 291} {"train_loss": -32.56756591796875, "global_step": 35288, "epoch": 291} {"train_loss": -31.755081176757812, "global_step": 35289, "epoch": 291} {"train_loss": -32.20138168334961, "global_step": 35290, "epoch": 291} {"train_loss": -32.6233024597168, "global_step": 35291, "epoch": 291} {"train_loss": -32.172874450683594, "global_step": 35292, "epoch": 291} {"train_loss": -32.174476623535156, "global_step": 35293, "epoch": 291} {"train_loss": -32.37540054321289, "global_step": 35294, "epoch": 291} {"train_loss": -32.53108215332031, "global_step": 35295, "epoch": 291} {"train_loss": -32.95602035522461, "global_step": 35296, "epoch": 291} {"train_loss": -32.88370895385742, "global_step": 35297, "epoch": 291} {"train_loss": -32.70809555053711, "global_step": 35298, "epoch": 291} {"train_loss": -32.83716583251953, "global_step": 35299, "epoch": 291} {"train_loss": -33.27653884887695, "global_step": 35300, "epoch": 291} {"train_loss": -33.08509826660156, "global_step": 35301, "epoch": 291} {"train_loss": -33.22065353393555, "global_step": 35302, "epoch": 291} {"train_loss": -33.10157775878906, "global_step": 35303, "epoch": 291} {"train_loss": -33.25876998901367, "global_step": 35304, "epoch": 291} {"train_loss": -33.25806427001953, "global_step": 35305, "epoch": 291} {"train_loss": -33.271297454833984, "global_step": 35306, "epoch": 291} {"train_loss": -33.62837219238281, "global_step": 35307, "epoch": 291} {"train_loss": -33.67007064819336, "global_step": 35308, "epoch": 291} {"train_loss": -33.69224166870117, "global_step": 35309, "epoch": 291} {"train_loss": -33.06303024291992, "global_step": 35310, "epoch": 291} {"train_loss": -33.38340377807617, "global_step": 35311, "epoch": 291} {"train_loss": -33.445770263671875, "global_step": 35312, "epoch": 291} {"train_loss": -32.928077697753906, "global_step": 35313, "epoch": 291} {"train_loss": -33.51331329345703, "global_step": 35314, "epoch": 291} {"train_loss": -33.09556198120117, "global_step": 35315, "epoch": 291} {"train_loss": -33.1944694519043, "global_step": 35316, "epoch": 291} {"train_loss": -32.963680267333984, "global_step": 35317, "epoch": 291} {"train_loss": -32.965309143066406, "global_step": 35318, "epoch": 291} {"train_loss": -33.10175704956055, "global_step": 35319, "epoch": 291} {"train_loss": -33.70277786254883, "global_step": 35320, "epoch": 291} {"train_loss": -32.4626579284668, "global_step": 35321, "epoch": 291} {"train_loss": -32.68281173706055, "global_step": 35322, "epoch": 291} {"train_loss": -32.604248046875, "global_step": 35323, "epoch": 291} {"train_loss": -33.783382415771484, "global_step": 35324, "epoch": 291} {"train_loss": -33.13694381713867, "global_step": 35325, "epoch": 291} {"train_loss": -32.540985107421875, "global_step": 35326, "epoch": 291} {"train_loss": -33.22782516479492, "global_step": 35327, "epoch": 291} {"train_loss": -32.92030334472656, "global_step": 35328, "epoch": 291} {"train_loss": -32.819679260253906, "global_step": 35329, "epoch": 291} {"train_loss": -32.03610610961914, "global_step": 35330, "epoch": 291} {"train_loss": -31.8031454480384, "global_step": 35331, "epoch": 291, "val_loss": 2702945.75} {"train_loss": -30.944259643554688, "global_step": 35332, "epoch": 292} {"train_loss": -32.47993850708008, "global_step": 35333, "epoch": 292} {"train_loss": -32.18104934692383, "global_step": 35334, "epoch": 292} {"train_loss": -29.444381713867188, "global_step": 35335, "epoch": 292} {"train_loss": -32.50832748413086, "global_step": 35336, "epoch": 292} {"train_loss": -29.299543380737305, "global_step": 35337, "epoch": 292} {"train_loss": -31.339094161987305, "global_step": 35338, "epoch": 292} {"train_loss": -28.971525192260742, "global_step": 35339, "epoch": 292} {"train_loss": -32.643218994140625, "global_step": 35340, "epoch": 292} {"train_loss": -31.033035278320312, "global_step": 35341, "epoch": 292} {"train_loss": -31.463397979736328, "global_step": 35342, "epoch": 292} {"train_loss": -32.552242279052734, "global_step": 35343, "epoch": 292} {"train_loss": -31.704084396362305, "global_step": 35344, "epoch": 292} {"train_loss": -30.644641876220703, "global_step": 35345, "epoch": 292} {"train_loss": -31.739654541015625, "global_step": 35346, "epoch": 292} {"train_loss": -32.656036376953125, "global_step": 35347, "epoch": 292} {"train_loss": -32.05877685546875, "global_step": 35348, "epoch": 292} {"train_loss": -32.87459945678711, "global_step": 35349, "epoch": 292} {"train_loss": -31.976978302001953, "global_step": 35350, "epoch": 292} {"train_loss": -32.874847412109375, "global_step": 35351, "epoch": 292} {"train_loss": -32.456905364990234, "global_step": 35352, "epoch": 292} {"train_loss": -32.7453727722168, "global_step": 35353, "epoch": 292} {"train_loss": -32.29035568237305, "global_step": 35354, "epoch": 292} {"train_loss": -32.960086822509766, "global_step": 35355, "epoch": 292} {"train_loss": -32.984169006347656, "global_step": 35356, "epoch": 292} {"train_loss": -33.14237594604492, "global_step": 35357, "epoch": 292} {"train_loss": -32.84577178955078, "global_step": 35358, "epoch": 292} {"train_loss": -33.410484313964844, "global_step": 35359, "epoch": 292} {"train_loss": -33.022430419921875, "global_step": 35360, "epoch": 292} {"train_loss": -32.85600280761719, "global_step": 35361, "epoch": 292} {"train_loss": -33.41072082519531, "global_step": 35362, "epoch": 292} {"train_loss": -32.987274169921875, "global_step": 35363, "epoch": 292} {"train_loss": -32.599796295166016, "global_step": 35364, "epoch": 292} {"train_loss": -33.3037223815918, "global_step": 35365, "epoch": 292} {"train_loss": -33.16133499145508, "global_step": 35366, "epoch": 292} {"train_loss": -33.3775520324707, "global_step": 35367, "epoch": 292} {"train_loss": -33.66788864135742, "global_step": 35368, "epoch": 292} {"train_loss": -33.46797561645508, "global_step": 35369, "epoch": 292} {"train_loss": -33.37063217163086, "global_step": 35370, "epoch": 292} {"train_loss": -33.09563064575195, "global_step": 35371, "epoch": 292} {"train_loss": -33.59773254394531, "global_step": 35372, "epoch": 292} {"train_loss": -33.828346252441406, "global_step": 35373, "epoch": 292} {"train_loss": -33.46548080444336, "global_step": 35374, "epoch": 292} {"train_loss": -33.76076889038086, "global_step": 35375, "epoch": 292} {"train_loss": -33.67908477783203, "global_step": 35376, "epoch": 292} {"train_loss": -33.70652389526367, "global_step": 35377, "epoch": 292} {"train_loss": -34.02174758911133, "global_step": 35378, "epoch": 292} {"train_loss": -33.30559158325195, "global_step": 35379, "epoch": 292} {"train_loss": -33.728267669677734, "global_step": 35380, "epoch": 292} {"train_loss": -33.79465866088867, "global_step": 35381, "epoch": 292} {"train_loss": -33.760719299316406, "global_step": 35382, "epoch": 292} {"train_loss": -33.514644622802734, "global_step": 35383, "epoch": 292} {"train_loss": -33.464271545410156, "global_step": 35384, "epoch": 292} {"train_loss": -34.25891876220703, "global_step": 35385, "epoch": 292} {"train_loss": -33.70415115356445, "global_step": 35386, "epoch": 292} {"train_loss": -33.85294723510742, "global_step": 35387, "epoch": 292} {"train_loss": -34.27729034423828, "global_step": 35388, "epoch": 292} {"train_loss": -33.912723541259766, "global_step": 35389, "epoch": 292} {"train_loss": -33.488426208496094, "global_step": 35390, "epoch": 292} {"train_loss": -33.5325813293457, "global_step": 35391, "epoch": 292} {"train_loss": -34.2859001159668, "global_step": 35392, "epoch": 292} {"train_loss": -33.32792663574219, "global_step": 35393, "epoch": 292} {"train_loss": -32.88932800292969, "global_step": 35394, "epoch": 292} {"train_loss": -33.354217529296875, "global_step": 35395, "epoch": 292} {"train_loss": -33.90339279174805, "global_step": 35396, "epoch": 292} {"train_loss": -33.04072189331055, "global_step": 35397, "epoch": 292} {"train_loss": -33.64259719848633, "global_step": 35398, "epoch": 292} {"train_loss": -32.273292541503906, "global_step": 35399, "epoch": 292} {"train_loss": -32.87321853637695, "global_step": 35400, "epoch": 292} {"train_loss": -33.990203857421875, "global_step": 35401, "epoch": 292} {"train_loss": -32.42890930175781, "global_step": 35402, "epoch": 292} {"train_loss": -32.23209762573242, "global_step": 35403, "epoch": 292} {"train_loss": -33.96717071533203, "global_step": 35404, "epoch": 292} {"train_loss": -32.344478607177734, "global_step": 35405, "epoch": 292} {"train_loss": -33.884342193603516, "global_step": 35406, "epoch": 292} {"train_loss": -32.1346321105957, "global_step": 35407, "epoch": 292} {"train_loss": -33.69560623168945, "global_step": 35408, "epoch": 292} {"train_loss": -32.34910583496094, "global_step": 35409, "epoch": 292} {"train_loss": -33.51112747192383, "global_step": 35410, "epoch": 292} {"train_loss": -33.46225357055664, "global_step": 35411, "epoch": 292} {"train_loss": -33.52306365966797, "global_step": 35412, "epoch": 292} {"train_loss": -33.457763671875, "global_step": 35413, "epoch": 292} {"train_loss": -33.18013000488281, "global_step": 35414, "epoch": 292} {"train_loss": -33.035213470458984, "global_step": 35415, "epoch": 292} {"train_loss": -32.65328598022461, "global_step": 35416, "epoch": 292} {"train_loss": -33.4047737121582, "global_step": 35417, "epoch": 292} {"train_loss": -32.0700798034668, "global_step": 35418, "epoch": 292} {"train_loss": -32.29848098754883, "global_step": 35419, "epoch": 292} {"train_loss": -32.15388107299805, "global_step": 35420, "epoch": 292} {"train_loss": -30.02931022644043, "global_step": 35421, "epoch": 292} {"train_loss": -27.467853546142578, "global_step": 35422, "epoch": 292} {"train_loss": -32.974605560302734, "global_step": 35423, "epoch": 292} {"train_loss": -24.959157943725586, "global_step": 35424, "epoch": 292} {"train_loss": -29.850360870361328, "global_step": 35425, "epoch": 292} {"train_loss": -31.28655433654785, "global_step": 35426, "epoch": 292} {"train_loss": -22.452857971191406, "global_step": 35427, "epoch": 292} {"train_loss": -32.60618209838867, "global_step": 35428, "epoch": 292} {"train_loss": -27.12360954284668, "global_step": 35429, "epoch": 292} {"train_loss": -31.266834259033203, "global_step": 35430, "epoch": 292} {"train_loss": -29.64923667907715, "global_step": 35431, "epoch": 292} {"train_loss": -32.50735092163086, "global_step": 35432, "epoch": 292} {"train_loss": -29.741165161132812, "global_step": 35433, "epoch": 292} {"train_loss": -32.388729095458984, "global_step": 35434, "epoch": 292} {"train_loss": -31.30828857421875, "global_step": 35435, "epoch": 292} {"train_loss": -31.255361557006836, "global_step": 35436, "epoch": 292} {"train_loss": -32.85493087768555, "global_step": 35437, "epoch": 292} {"train_loss": -32.27144241333008, "global_step": 35438, "epoch": 292} {"train_loss": -31.893335342407227, "global_step": 35439, "epoch": 292} {"train_loss": -31.80620765686035, "global_step": 35440, "epoch": 292} {"train_loss": -32.689510345458984, "global_step": 35441, "epoch": 292} {"train_loss": -32.57041549682617, "global_step": 35442, "epoch": 292} {"train_loss": -32.472320556640625, "global_step": 35443, "epoch": 292} {"train_loss": -32.7592887878418, "global_step": 35444, "epoch": 292} {"train_loss": -32.58661651611328, "global_step": 35445, "epoch": 292} {"train_loss": -33.03817367553711, "global_step": 35446, "epoch": 292} {"train_loss": -32.51772689819336, "global_step": 35447, "epoch": 292} {"train_loss": -32.45146942138672, "global_step": 35448, "epoch": 292} {"train_loss": -32.98728561401367, "global_step": 35449, "epoch": 292} {"train_loss": -33.11960983276367, "global_step": 35450, "epoch": 292} {"train_loss": -32.97064971923828, "global_step": 35451, "epoch": 292} {"train_loss": -32.442412825655346, "global_step": 35452, "epoch": 292, "val_loss": 2434168.0} {"train_loss": -33.2862548828125, "global_step": 35453, "epoch": 293} {"train_loss": -33.67752456665039, "global_step": 35454, "epoch": 293} {"train_loss": -32.96769714355469, "global_step": 35455, "epoch": 293} {"train_loss": -33.492919921875, "global_step": 35456, "epoch": 293} {"train_loss": -32.734771728515625, "global_step": 35457, "epoch": 293} {"train_loss": -33.38679122924805, "global_step": 35458, "epoch": 293} {"train_loss": -33.29829025268555, "global_step": 35459, "epoch": 293} {"train_loss": -33.36639404296875, "global_step": 35460, "epoch": 293} {"train_loss": -33.4765739440918, "global_step": 35461, "epoch": 293} {"train_loss": -33.86609649658203, "global_step": 35462, "epoch": 293} {"train_loss": -33.57464599609375, "global_step": 35463, "epoch": 293} {"train_loss": -33.77353286743164, "global_step": 35464, "epoch": 293} {"train_loss": -33.45068359375, "global_step": 35465, "epoch": 293} {"train_loss": -33.7791862487793, "global_step": 35466, "epoch": 293} {"train_loss": -33.64170837402344, "global_step": 35467, "epoch": 293} {"train_loss": -33.97727584838867, "global_step": 35468, "epoch": 293} {"train_loss": -33.501949310302734, "global_step": 35469, "epoch": 293} {"train_loss": -33.858795166015625, "global_step": 35470, "epoch": 293} {"train_loss": -33.90987777709961, "global_step": 35471, "epoch": 293} {"train_loss": -33.6097526550293, "global_step": 35472, "epoch": 293} {"train_loss": -34.20752716064453, "global_step": 35473, "epoch": 293} {"train_loss": -33.15911865234375, "global_step": 35474, "epoch": 293} {"train_loss": -33.97368240356445, "global_step": 35475, "epoch": 293} {"train_loss": -33.98125076293945, "global_step": 35476, "epoch": 293} {"train_loss": -33.58950424194336, "global_step": 35477, "epoch": 293} {"train_loss": -33.60288619995117, "global_step": 35478, "epoch": 293} {"train_loss": -33.549129486083984, "global_step": 35479, "epoch": 293} {"train_loss": -33.901973724365234, "global_step": 35480, "epoch": 293} {"train_loss": -33.68801498413086, "global_step": 35481, "epoch": 293} {"train_loss": -33.90570831298828, "global_step": 35482, "epoch": 293} {"train_loss": -33.71258544921875, "global_step": 35483, "epoch": 293} {"train_loss": -34.09526062011719, "global_step": 35484, "epoch": 293} {"train_loss": -34.02708053588867, "global_step": 35485, "epoch": 293} {"train_loss": -33.12074279785156, "global_step": 35486, "epoch": 293} {"train_loss": -33.544921875, "global_step": 35487, "epoch": 293} {"train_loss": -33.71064376831055, "global_step": 35488, "epoch": 293} {"train_loss": -34.07188415527344, "global_step": 35489, "epoch": 293} {"train_loss": -33.50419616699219, "global_step": 35490, "epoch": 293} {"train_loss": -33.78321838378906, "global_step": 35491, "epoch": 293} {"train_loss": -34.01285934448242, "global_step": 35492, "epoch": 293} {"train_loss": -34.0456428527832, "global_step": 35493, "epoch": 293} {"train_loss": -33.7598876953125, "global_step": 35494, "epoch": 293} {"train_loss": -33.94793701171875, "global_step": 35495, "epoch": 293} {"train_loss": -33.96503448486328, "global_step": 35496, "epoch": 293} {"train_loss": -33.4989013671875, "global_step": 35497, "epoch": 293} {"train_loss": -34.22711181640625, "global_step": 35498, "epoch": 293} {"train_loss": -34.34612274169922, "global_step": 35499, "epoch": 293} {"train_loss": -33.99497604370117, "global_step": 35500, "epoch": 293} {"train_loss": -34.28287887573242, "global_step": 35501, "epoch": 293} {"train_loss": -33.83312225341797, "global_step": 35502, "epoch": 293} {"train_loss": -34.369319915771484, "global_step": 35503, "epoch": 293} {"train_loss": -34.29652404785156, "global_step": 35504, "epoch": 293} {"train_loss": -33.83048629760742, "global_step": 35505, "epoch": 293} {"train_loss": -33.35559844970703, "global_step": 35506, "epoch": 293} {"train_loss": -33.221431732177734, "global_step": 35507, "epoch": 293} {"train_loss": -32.34150314331055, "global_step": 35508, "epoch": 293} {"train_loss": -33.881038665771484, "global_step": 35509, "epoch": 293} {"train_loss": -34.03940963745117, "global_step": 35510, "epoch": 293} {"train_loss": -34.078426361083984, "global_step": 35511, "epoch": 293} {"train_loss": -34.242408752441406, "global_step": 35512, "epoch": 293} {"train_loss": -33.87546920776367, "global_step": 35513, "epoch": 293} {"train_loss": -34.43259811401367, "global_step": 35514, "epoch": 293} {"train_loss": -33.58942794799805, "global_step": 35515, "epoch": 293} {"train_loss": -34.315250396728516, "global_step": 35516, "epoch": 293} {"train_loss": -34.15818405151367, "global_step": 35517, "epoch": 293} {"train_loss": -33.563758850097656, "global_step": 35518, "epoch": 293} {"train_loss": -34.37940216064453, "global_step": 35519, "epoch": 293} {"train_loss": -33.96503829956055, "global_step": 35520, "epoch": 293} {"train_loss": -33.417701721191406, "global_step": 35521, "epoch": 293} {"train_loss": -34.058258056640625, "global_step": 35522, "epoch": 293} {"train_loss": -34.41442108154297, "global_step": 35523, "epoch": 293} {"train_loss": -34.02101516723633, "global_step": 35524, "epoch": 293} {"train_loss": -33.26563262939453, "global_step": 35525, "epoch": 293} {"train_loss": -32.02667999267578, "global_step": 35526, "epoch": 293} {"train_loss": -27.04705810546875, "global_step": 35527, "epoch": 293} {"train_loss": -18.83258628845215, "global_step": 35528, "epoch": 293} {"train_loss": -15.94975757598877, "global_step": 35529, "epoch": 293} {"train_loss": -25.81557273864746, "global_step": 35530, "epoch": 293} {"train_loss": -33.52228546142578, "global_step": 35531, "epoch": 293} {"train_loss": -28.245609283447266, "global_step": 35532, "epoch": 293} {"train_loss": -29.78192138671875, "global_step": 35533, "epoch": 293} {"train_loss": -30.008359909057617, "global_step": 35534, "epoch": 293} {"train_loss": -29.53614616394043, "global_step": 35535, "epoch": 293} {"train_loss": -30.67447853088379, "global_step": 35536, "epoch": 293} {"train_loss": -31.589704513549805, "global_step": 35537, "epoch": 293} {"train_loss": -28.6165714263916, "global_step": 35538, "epoch": 293} {"train_loss": -32.50972366333008, "global_step": 35539, "epoch": 293} {"train_loss": -30.318561553955078, "global_step": 35540, "epoch": 293} {"train_loss": -32.238521575927734, "global_step": 35541, "epoch": 293} {"train_loss": -32.16782760620117, "global_step": 35542, "epoch": 293} {"train_loss": -30.926008224487305, "global_step": 35543, "epoch": 293} {"train_loss": -33.56490707397461, "global_step": 35544, "epoch": 293} {"train_loss": -32.13410568237305, "global_step": 35545, "epoch": 293} {"train_loss": -31.522052764892578, "global_step": 35546, "epoch": 293} {"train_loss": -33.1117057800293, "global_step": 35547, "epoch": 293} {"train_loss": -32.540950775146484, "global_step": 35548, "epoch": 293} {"train_loss": -31.874719619750977, "global_step": 35549, "epoch": 293} {"train_loss": -33.0519905090332, "global_step": 35550, "epoch": 293} {"train_loss": -32.9174690246582, "global_step": 35551, "epoch": 293} {"train_loss": -32.468482971191406, "global_step": 35552, "epoch": 293} {"train_loss": -32.490028381347656, "global_step": 35553, "epoch": 293} {"train_loss": -33.06752014160156, "global_step": 35554, "epoch": 293} {"train_loss": -32.935237884521484, "global_step": 35555, "epoch": 293} {"train_loss": -33.03609848022461, "global_step": 35556, "epoch": 293} {"train_loss": -32.92951202392578, "global_step": 35557, "epoch": 293} {"train_loss": -33.24949264526367, "global_step": 35558, "epoch": 293} {"train_loss": -32.934749603271484, "global_step": 35559, "epoch": 293} {"train_loss": -33.6920051574707, "global_step": 35560, "epoch": 293} {"train_loss": -33.91982650756836, "global_step": 35561, "epoch": 293} {"train_loss": -33.62751388549805, "global_step": 35562, "epoch": 293} {"train_loss": -33.479610443115234, "global_step": 35563, "epoch": 293} {"train_loss": -33.73231887817383, "global_step": 35564, "epoch": 293} {"train_loss": -33.72371292114258, "global_step": 35565, "epoch": 293} {"train_loss": -33.81126022338867, "global_step": 35566, "epoch": 293} {"train_loss": -33.79121017456055, "global_step": 35567, "epoch": 293} {"train_loss": -33.85002517700195, "global_step": 35568, "epoch": 293} {"train_loss": -33.555091857910156, "global_step": 35569, "epoch": 293} {"train_loss": -33.99021530151367, "global_step": 35570, "epoch": 293} {"train_loss": -33.656734466552734, "global_step": 35571, "epoch": 293} {"train_loss": -33.91701126098633, "global_step": 35572, "epoch": 293} {"train_loss": -32.90395433252508, "global_step": 35573, "epoch": 293, "val_loss": 2316566.25} {"train_loss": -33.9366455078125, "global_step": 35574, "epoch": 294} {"train_loss": -33.813079833984375, "global_step": 35575, "epoch": 294} {"train_loss": -33.61652755737305, "global_step": 35576, "epoch": 294} {"train_loss": -33.781402587890625, "global_step": 35577, "epoch": 294} {"train_loss": -33.6213493347168, "global_step": 35578, "epoch": 294} {"train_loss": -33.92264175415039, "global_step": 35579, "epoch": 294} {"train_loss": -33.85354232788086, "global_step": 35580, "epoch": 294} {"train_loss": -33.89711380004883, "global_step": 35581, "epoch": 294} {"train_loss": -33.9067497253418, "global_step": 35582, "epoch": 294} {"train_loss": -33.19508743286133, "global_step": 35583, "epoch": 294} {"train_loss": -33.85836410522461, "global_step": 35584, "epoch": 294} {"train_loss": -33.83559799194336, "global_step": 35585, "epoch": 294} {"train_loss": -34.260292053222656, "global_step": 35586, "epoch": 294} {"train_loss": -33.36664962768555, "global_step": 35587, "epoch": 294} {"train_loss": -32.96982955932617, "global_step": 35588, "epoch": 294} {"train_loss": -33.28456497192383, "global_step": 35589, "epoch": 294} {"train_loss": -33.913917541503906, "global_step": 35590, "epoch": 294} {"train_loss": -33.04635238647461, "global_step": 35591, "epoch": 294} {"train_loss": -33.75040817260742, "global_step": 35592, "epoch": 294} {"train_loss": -34.067047119140625, "global_step": 35593, "epoch": 294} {"train_loss": -33.987457275390625, "global_step": 35594, "epoch": 294} {"train_loss": -32.30475616455078, "global_step": 35595, "epoch": 294} {"train_loss": -33.048370361328125, "global_step": 35596, "epoch": 294} {"train_loss": -33.0682373046875, "global_step": 35597, "epoch": 294} {"train_loss": -33.391963958740234, "global_step": 35598, "epoch": 294} {"train_loss": -34.098388671875, "global_step": 35599, "epoch": 294} {"train_loss": -32.83597946166992, "global_step": 35600, "epoch": 294} {"train_loss": -33.12086486816406, "global_step": 35601, "epoch": 294} {"train_loss": -33.394676208496094, "global_step": 35602, "epoch": 294} {"train_loss": -32.82136917114258, "global_step": 35603, "epoch": 294} {"train_loss": -32.97998046875, "global_step": 35604, "epoch": 294} {"train_loss": -33.356689453125, "global_step": 35605, "epoch": 294} {"train_loss": -33.49910354614258, "global_step": 35606, "epoch": 294} {"train_loss": -33.35671615600586, "global_step": 35607, "epoch": 294} {"train_loss": -33.399635314941406, "global_step": 35608, "epoch": 294} {"train_loss": -33.4868278503418, "global_step": 35609, "epoch": 294} {"train_loss": -33.023983001708984, "global_step": 35610, "epoch": 294} {"train_loss": -33.59548568725586, "global_step": 35611, "epoch": 294} {"train_loss": -33.884803771972656, "global_step": 35612, "epoch": 294} {"train_loss": -33.28541564941406, "global_step": 35613, "epoch": 294} {"train_loss": -33.33582305908203, "global_step": 35614, "epoch": 294} {"train_loss": -33.64756393432617, "global_step": 35615, "epoch": 294} {"train_loss": -33.85352325439453, "global_step": 35616, "epoch": 294} {"train_loss": -33.76388168334961, "global_step": 35617, "epoch": 294} {"train_loss": -33.774932861328125, "global_step": 35618, "epoch": 294} {"train_loss": -33.71906280517578, "global_step": 35619, "epoch": 294} {"train_loss": -34.16523361206055, "global_step": 35620, "epoch": 294} {"train_loss": -33.87668991088867, "global_step": 35621, "epoch": 294} {"train_loss": -33.604347229003906, "global_step": 35622, "epoch": 294} {"train_loss": -33.83311080932617, "global_step": 35623, "epoch": 294} {"train_loss": -34.17002487182617, "global_step": 35624, "epoch": 294} {"train_loss": -33.712623596191406, "global_step": 35625, "epoch": 294} {"train_loss": -33.48973083496094, "global_step": 35626, "epoch": 294} {"train_loss": -32.26140594482422, "global_step": 35627, "epoch": 294} {"train_loss": -32.4643669128418, "global_step": 35628, "epoch": 294} {"train_loss": -32.296905517578125, "global_step": 35629, "epoch": 294} {"train_loss": -32.82466506958008, "global_step": 35630, "epoch": 294} {"train_loss": -32.991302490234375, "global_step": 35631, "epoch": 294} {"train_loss": -33.13209533691406, "global_step": 35632, "epoch": 294} {"train_loss": -33.65814971923828, "global_step": 35633, "epoch": 294} {"train_loss": -33.02301788330078, "global_step": 35634, "epoch": 294} {"train_loss": -32.52163314819336, "global_step": 35635, "epoch": 294} {"train_loss": -31.61427879333496, "global_step": 35636, "epoch": 294} {"train_loss": -33.0741081237793, "global_step": 35637, "epoch": 294} {"train_loss": -33.52439498901367, "global_step": 35638, "epoch": 294} {"train_loss": -34.1254997253418, "global_step": 35639, "epoch": 294} {"train_loss": -33.18321990966797, "global_step": 35640, "epoch": 294} {"train_loss": -33.572959899902344, "global_step": 35641, "epoch": 294} {"train_loss": -33.91248321533203, "global_step": 35642, "epoch": 294} {"train_loss": -34.28347396850586, "global_step": 35643, "epoch": 294} {"train_loss": -33.861305236816406, "global_step": 35644, "epoch": 294} {"train_loss": -34.31638717651367, "global_step": 35645, "epoch": 294} {"train_loss": -33.76214599609375, "global_step": 35646, "epoch": 294} {"train_loss": -34.097530364990234, "global_step": 35647, "epoch": 294} {"train_loss": -33.8230094909668, "global_step": 35648, "epoch": 294} {"train_loss": -34.043880462646484, "global_step": 35649, "epoch": 294} {"train_loss": -34.18143081665039, "global_step": 35650, "epoch": 294} {"train_loss": -34.23926544189453, "global_step": 35651, "epoch": 294} {"train_loss": -34.29270553588867, "global_step": 35652, "epoch": 294} {"train_loss": -34.59365463256836, "global_step": 35653, "epoch": 294} {"train_loss": -33.7336540222168, "global_step": 35654, "epoch": 294} {"train_loss": -34.15681838989258, "global_step": 35655, "epoch": 294} {"train_loss": -33.97040557861328, "global_step": 35656, "epoch": 294} {"train_loss": -33.77163314819336, "global_step": 35657, "epoch": 294} {"train_loss": -34.10557174682617, "global_step": 35658, "epoch": 294} {"train_loss": -33.608333587646484, "global_step": 35659, "epoch": 294} {"train_loss": -33.6025390625, "global_step": 35660, "epoch": 294} {"train_loss": -33.764137268066406, "global_step": 35661, "epoch": 294} {"train_loss": -34.06017303466797, "global_step": 35662, "epoch": 294} {"train_loss": -34.210548400878906, "global_step": 35663, "epoch": 294} {"train_loss": -33.3756217956543, "global_step": 35664, "epoch": 294} {"train_loss": -32.949005126953125, "global_step": 35665, "epoch": 294} {"train_loss": -30.97956657409668, "global_step": 35666, "epoch": 294} {"train_loss": -30.540510177612305, "global_step": 35667, "epoch": 294} {"train_loss": -32.253963470458984, "global_step": 35668, "epoch": 294} {"train_loss": -32.827293395996094, "global_step": 35669, "epoch": 294} {"train_loss": -32.81538772583008, "global_step": 35670, "epoch": 294} {"train_loss": -32.68296432495117, "global_step": 35671, "epoch": 294} {"train_loss": -32.43485641479492, "global_step": 35672, "epoch": 294} {"train_loss": -32.951942443847656, "global_step": 35673, "epoch": 294} {"train_loss": -33.35673522949219, "global_step": 35674, "epoch": 294} {"train_loss": -32.256595611572266, "global_step": 35675, "epoch": 294} {"train_loss": -32.87543487548828, "global_step": 35676, "epoch": 294} {"train_loss": -33.12687301635742, "global_step": 35677, "epoch": 294} {"train_loss": -33.898841857910156, "global_step": 35678, "epoch": 294} {"train_loss": -31.961145401000977, "global_step": 35679, "epoch": 294} {"train_loss": -33.8639030456543, "global_step": 35680, "epoch": 294} {"train_loss": -33.204261779785156, "global_step": 35681, "epoch": 294} {"train_loss": -33.360355377197266, "global_step": 35682, "epoch": 294} {"train_loss": -33.81574630737305, "global_step": 35683, "epoch": 294} {"train_loss": -33.249324798583984, "global_step": 35684, "epoch": 294} {"train_loss": -34.085235595703125, "global_step": 35685, "epoch": 294} {"train_loss": -33.1582145690918, "global_step": 35686, "epoch": 294} {"train_loss": -33.75813674926758, "global_step": 35687, "epoch": 294} {"train_loss": -32.99188995361328, "global_step": 35688, "epoch": 294} {"train_loss": -33.591949462890625, "global_step": 35689, "epoch": 294} {"train_loss": -33.6826286315918, "global_step": 35690, "epoch": 294} {"train_loss": -33.567291259765625, "global_step": 35691, "epoch": 294} {"train_loss": -33.430545806884766, "global_step": 35692, "epoch": 294} {"train_loss": -33.343624114990234, "global_step": 35693, "epoch": 294} {"train_loss": -33.43264111605558, "global_step": 35694, "epoch": 294, "val_loss": 2520551.25} {"train_loss": -33.853294372558594, "global_step": 35695, "epoch": 295} {"train_loss": -33.46587371826172, "global_step": 35696, "epoch": 295} {"train_loss": -33.0246467590332, "global_step": 35697, "epoch": 295} {"train_loss": -33.732337951660156, "global_step": 35698, "epoch": 295} {"train_loss": -33.9164924621582, "global_step": 35699, "epoch": 295} {"train_loss": -33.813209533691406, "global_step": 35700, "epoch": 295} {"train_loss": -32.85187911987305, "global_step": 35701, "epoch": 295} {"train_loss": -33.9105110168457, "global_step": 35702, "epoch": 295} {"train_loss": -34.23046875, "global_step": 35703, "epoch": 295} {"train_loss": -34.04655075073242, "global_step": 35704, "epoch": 295} {"train_loss": -33.42188262939453, "global_step": 35705, "epoch": 295} {"train_loss": -33.72273635864258, "global_step": 35706, "epoch": 295} {"train_loss": -34.355403900146484, "global_step": 35707, "epoch": 295} {"train_loss": -34.282691955566406, "global_step": 35708, "epoch": 295} {"train_loss": -34.2332878112793, "global_step": 35709, "epoch": 295} {"train_loss": -33.606117248535156, "global_step": 35710, "epoch": 295} {"train_loss": -34.17424774169922, "global_step": 35711, "epoch": 295} {"train_loss": -33.60103988647461, "global_step": 35712, "epoch": 295} {"train_loss": -34.09444808959961, "global_step": 35713, "epoch": 295} {"train_loss": -33.81110382080078, "global_step": 35714, "epoch": 295} {"train_loss": -34.306121826171875, "global_step": 35715, "epoch": 295} {"train_loss": -34.24258041381836, "global_step": 35716, "epoch": 295} {"train_loss": -34.38540267944336, "global_step": 35717, "epoch": 295} {"train_loss": -34.09807205200195, "global_step": 35718, "epoch": 295} {"train_loss": -34.66830062866211, "global_step": 35719, "epoch": 295} {"train_loss": -33.65630340576172, "global_step": 35720, "epoch": 295} {"train_loss": -34.5755729675293, "global_step": 35721, "epoch": 295} {"train_loss": -33.974464416503906, "global_step": 35722, "epoch": 295} {"train_loss": -33.47832107543945, "global_step": 35723, "epoch": 295} {"train_loss": -33.304805755615234, "global_step": 35724, "epoch": 295} {"train_loss": -32.90707015991211, "global_step": 35725, "epoch": 295} {"train_loss": -32.87594223022461, "global_step": 35726, "epoch": 295} {"train_loss": -34.39091110229492, "global_step": 35727, "epoch": 295} {"train_loss": -32.95331954956055, "global_step": 35728, "epoch": 295} {"train_loss": -33.96704864501953, "global_step": 35729, "epoch": 295} {"train_loss": -34.254695892333984, "global_step": 35730, "epoch": 295} {"train_loss": -34.12311935424805, "global_step": 35731, "epoch": 295} {"train_loss": -33.87255096435547, "global_step": 35732, "epoch": 295} {"train_loss": -33.95949935913086, "global_step": 35733, "epoch": 295} {"train_loss": -34.08370590209961, "global_step": 35734, "epoch": 295} {"train_loss": -33.81311798095703, "global_step": 35735, "epoch": 295} {"train_loss": -34.578800201416016, "global_step": 35736, "epoch": 295} {"train_loss": -33.65879440307617, "global_step": 35737, "epoch": 295} {"train_loss": -32.6785774230957, "global_step": 35738, "epoch": 295} {"train_loss": -32.98240280151367, "global_step": 35739, "epoch": 295} {"train_loss": -34.2778205871582, "global_step": 35740, "epoch": 295} {"train_loss": -32.681007385253906, "global_step": 35741, "epoch": 295} {"train_loss": -31.858154296875, "global_step": 35742, "epoch": 295} {"train_loss": -31.31745719909668, "global_step": 35743, "epoch": 295} {"train_loss": -33.46926498413086, "global_step": 35744, "epoch": 295} {"train_loss": -32.62112045288086, "global_step": 35745, "epoch": 295} {"train_loss": -30.72873878479004, "global_step": 35746, "epoch": 295} {"train_loss": -31.655441284179688, "global_step": 35747, "epoch": 295} {"train_loss": -31.7718505859375, "global_step": 35748, "epoch": 295} {"train_loss": -31.428380966186523, "global_step": 35749, "epoch": 295} {"train_loss": -31.911401748657227, "global_step": 35750, "epoch": 295} {"train_loss": -32.44181442260742, "global_step": 35751, "epoch": 295} {"train_loss": -33.6813850402832, "global_step": 35752, "epoch": 295} {"train_loss": -32.01323318481445, "global_step": 35753, "epoch": 295} {"train_loss": -32.427650451660156, "global_step": 35754, "epoch": 295} {"train_loss": -33.648441314697266, "global_step": 35755, "epoch": 295} {"train_loss": -33.02798843383789, "global_step": 35756, "epoch": 295} {"train_loss": -33.13243865966797, "global_step": 35757, "epoch": 295} {"train_loss": -33.70236587524414, "global_step": 35758, "epoch": 295} {"train_loss": -33.572322845458984, "global_step": 35759, "epoch": 295} {"train_loss": -33.749237060546875, "global_step": 35760, "epoch": 295} {"train_loss": -33.963470458984375, "global_step": 35761, "epoch": 295} {"train_loss": -33.9390983581543, "global_step": 35762, "epoch": 295} {"train_loss": -34.338050842285156, "global_step": 35763, "epoch": 295} {"train_loss": -33.65339279174805, "global_step": 35764, "epoch": 295} {"train_loss": -33.8269157409668, "global_step": 35765, "epoch": 295} {"train_loss": -34.13957977294922, "global_step": 35766, "epoch": 295} {"train_loss": -34.22573471069336, "global_step": 35767, "epoch": 295} {"train_loss": -33.80183029174805, "global_step": 35768, "epoch": 295} {"train_loss": -34.175682067871094, "global_step": 35769, "epoch": 295} {"train_loss": -34.15104293823242, "global_step": 35770, "epoch": 295} {"train_loss": -34.189483642578125, "global_step": 35771, "epoch": 295} {"train_loss": -34.45357894897461, "global_step": 35772, "epoch": 295} {"train_loss": -33.60978317260742, "global_step": 35773, "epoch": 295} {"train_loss": -34.35710906982422, "global_step": 35774, "epoch": 295} {"train_loss": -33.790340423583984, "global_step": 35775, "epoch": 295} {"train_loss": -33.85416793823242, "global_step": 35776, "epoch": 295} {"train_loss": -34.17047119140625, "global_step": 35777, "epoch": 295} {"train_loss": -33.88373947143555, "global_step": 35778, "epoch": 295} {"train_loss": -34.2786750793457, "global_step": 35779, "epoch": 295} {"train_loss": -34.416561126708984, "global_step": 35780, "epoch": 295} {"train_loss": -33.65430450439453, "global_step": 35781, "epoch": 295} {"train_loss": -34.328182220458984, "global_step": 35782, "epoch": 295} {"train_loss": -34.21969223022461, "global_step": 35783, "epoch": 295} {"train_loss": -34.66756820678711, "global_step": 35784, "epoch": 295} {"train_loss": -34.4097900390625, "global_step": 35785, "epoch": 295} {"train_loss": -34.70413589477539, "global_step": 35786, "epoch": 295} {"train_loss": -34.86368942260742, "global_step": 35787, "epoch": 295} {"train_loss": -34.487220764160156, "global_step": 35788, "epoch": 295} {"train_loss": -34.71437454223633, "global_step": 35789, "epoch": 295} {"train_loss": -34.3942985534668, "global_step": 35790, "epoch": 295} {"train_loss": -34.80842590332031, "global_step": 35791, "epoch": 295} {"train_loss": -34.64833068847656, "global_step": 35792, "epoch": 295} {"train_loss": -35.07373046875, "global_step": 35793, "epoch": 295} {"train_loss": -34.90154266357422, "global_step": 35794, "epoch": 295} {"train_loss": -34.570098876953125, "global_step": 35795, "epoch": 295} {"train_loss": -34.589111328125, "global_step": 35796, "epoch": 295} {"train_loss": -35.03984832763672, "global_step": 35797, "epoch": 295} {"train_loss": -34.168182373046875, "global_step": 35798, "epoch": 295} {"train_loss": -34.650413513183594, "global_step": 35799, "epoch": 295} {"train_loss": -34.363094329833984, "global_step": 35800, "epoch": 295} {"train_loss": -34.32706832885742, "global_step": 35801, "epoch": 295} {"train_loss": -34.568397521972656, "global_step": 35802, "epoch": 295} {"train_loss": -34.273345947265625, "global_step": 35803, "epoch": 295} {"train_loss": -33.439910888671875, "global_step": 35804, "epoch": 295} {"train_loss": -31.993200302124023, "global_step": 35805, "epoch": 295} {"train_loss": -32.86318588256836, "global_step": 35806, "epoch": 295} {"train_loss": -34.0191764831543, "global_step": 35807, "epoch": 295} {"train_loss": -32.95823287963867, "global_step": 35808, "epoch": 295} {"train_loss": -33.43341827392578, "global_step": 35809, "epoch": 295} {"train_loss": -33.42409133911133, "global_step": 35810, "epoch": 295} {"train_loss": -33.05929183959961, "global_step": 35811, "epoch": 295} {"train_loss": -33.878414154052734, "global_step": 35812, "epoch": 295} {"train_loss": -34.07076644897461, "global_step": 35813, "epoch": 295} {"train_loss": -34.07218551635742, "global_step": 35814, "epoch": 295} {"train_loss": -33.7510540386862, "global_step": 35815, "epoch": 295, "val_loss": 2579314.0} {"train_loss": -34.213966369628906, "global_step": 35816, "epoch": 296} {"train_loss": -34.3871955871582, "global_step": 35817, "epoch": 296} {"train_loss": -34.17259216308594, "global_step": 35818, "epoch": 296} {"train_loss": -34.25539779663086, "global_step": 35819, "epoch": 296} {"train_loss": -34.378414154052734, "global_step": 35820, "epoch": 296} {"train_loss": -34.85880661010742, "global_step": 35821, "epoch": 296} {"train_loss": -34.463104248046875, "global_step": 35822, "epoch": 296} {"train_loss": -34.34463882446289, "global_step": 35823, "epoch": 296} {"train_loss": -34.48724365234375, "global_step": 35824, "epoch": 296} {"train_loss": -34.42731475830078, "global_step": 35825, "epoch": 296} {"train_loss": -34.611602783203125, "global_step": 35826, "epoch": 296} {"train_loss": -34.79785919189453, "global_step": 35827, "epoch": 296} {"train_loss": -34.34109115600586, "global_step": 35828, "epoch": 296} {"train_loss": -34.47532653808594, "global_step": 35829, "epoch": 296} {"train_loss": -34.02956771850586, "global_step": 35830, "epoch": 296} {"train_loss": -34.6994743347168, "global_step": 35831, "epoch": 296} {"train_loss": -34.71177291870117, "global_step": 35832, "epoch": 296} {"train_loss": -33.95476531982422, "global_step": 35833, "epoch": 296} {"train_loss": -34.0646858215332, "global_step": 35834, "epoch": 296} {"train_loss": -34.25992965698242, "global_step": 35835, "epoch": 296} {"train_loss": -34.69990539550781, "global_step": 35836, "epoch": 296} {"train_loss": -35.09235763549805, "global_step": 35837, "epoch": 296} {"train_loss": -33.897377014160156, "global_step": 35838, "epoch": 296} {"train_loss": -34.262489318847656, "global_step": 35839, "epoch": 296} {"train_loss": -34.80823516845703, "global_step": 35840, "epoch": 296} {"train_loss": -34.91414260864258, "global_step": 35841, "epoch": 296} {"train_loss": -33.958003997802734, "global_step": 35842, "epoch": 296} {"train_loss": -33.97764587402344, "global_step": 35843, "epoch": 296} {"train_loss": -34.788726806640625, "global_step": 35844, "epoch": 296} {"train_loss": -34.09440994262695, "global_step": 35845, "epoch": 296} {"train_loss": -34.07724380493164, "global_step": 35846, "epoch": 296} {"train_loss": -35.07659149169922, "global_step": 35847, "epoch": 296} {"train_loss": -34.45985412597656, "global_step": 35848, "epoch": 296} {"train_loss": -34.88272476196289, "global_step": 35849, "epoch": 296} {"train_loss": -34.49569320678711, "global_step": 35850, "epoch": 296} {"train_loss": -33.883480072021484, "global_step": 35851, "epoch": 296} {"train_loss": -35.12518310546875, "global_step": 35852, "epoch": 296} {"train_loss": -34.29729080200195, "global_step": 35853, "epoch": 296} {"train_loss": -34.36527633666992, "global_step": 35854, "epoch": 296} {"train_loss": -33.76808166503906, "global_step": 35855, "epoch": 296} {"train_loss": -32.14008712768555, "global_step": 35856, "epoch": 296} {"train_loss": -28.711828231811523, "global_step": 35857, "epoch": 296} {"train_loss": -24.7027645111084, "global_step": 35858, "epoch": 296} {"train_loss": -24.238956451416016, "global_step": 35859, "epoch": 296} {"train_loss": -24.856937408447266, "global_step": 35860, "epoch": 296} {"train_loss": -23.666824340820312, "global_step": 35861, "epoch": 296} {"train_loss": -24.582441329956055, "global_step": 35862, "epoch": 296} {"train_loss": -25.452863693237305, "global_step": 35863, "epoch": 296} {"train_loss": -25.574024200439453, "global_step": 35864, "epoch": 296} {"train_loss": -25.985523223876953, "global_step": 35865, "epoch": 296} {"train_loss": -24.98311424255371, "global_step": 35866, "epoch": 296} {"train_loss": -25.395811080932617, "global_step": 35867, "epoch": 296} {"train_loss": -27.060956954956055, "global_step": 35868, "epoch": 296} {"train_loss": -26.477828979492188, "global_step": 35869, "epoch": 296} {"train_loss": -29.513031005859375, "global_step": 35870, "epoch": 296} {"train_loss": -27.6640625, "global_step": 35871, "epoch": 296} {"train_loss": -27.50233268737793, "global_step": 35872, "epoch": 296} {"train_loss": -28.145267486572266, "global_step": 35873, "epoch": 296} {"train_loss": -27.785724639892578, "global_step": 35874, "epoch": 296} {"train_loss": -27.883874893188477, "global_step": 35875, "epoch": 296} {"train_loss": -26.057397842407227, "global_step": 35876, "epoch": 296} {"train_loss": -26.13602638244629, "global_step": 35877, "epoch": 296} {"train_loss": -25.934595108032227, "global_step": 35878, "epoch": 296} {"train_loss": -29.056623458862305, "global_step": 35879, "epoch": 296} {"train_loss": -26.68049430847168, "global_step": 35880, "epoch": 296} {"train_loss": -28.928503036499023, "global_step": 35881, "epoch": 296} {"train_loss": -27.616849899291992, "global_step": 35882, "epoch": 296} {"train_loss": -29.480085372924805, "global_step": 35883, "epoch": 296} {"train_loss": -28.082477569580078, "global_step": 35884, "epoch": 296} {"train_loss": -29.811115264892578, "global_step": 35885, "epoch": 296} {"train_loss": -28.987186431884766, "global_step": 35886, "epoch": 296} {"train_loss": -29.768400192260742, "global_step": 35887, "epoch": 296} {"train_loss": -29.023778915405273, "global_step": 35888, "epoch": 296} {"train_loss": -30.331876754760742, "global_step": 35889, "epoch": 296} {"train_loss": -29.24561882019043, "global_step": 35890, "epoch": 296} {"train_loss": -29.61982536315918, "global_step": 35891, "epoch": 296} {"train_loss": -25.8571834564209, "global_step": 35892, "epoch": 296} {"train_loss": -26.92941665649414, "global_step": 35893, "epoch": 296} {"train_loss": -24.892467498779297, "global_step": 35894, "epoch": 296} {"train_loss": -20.331836700439453, "global_step": 35895, "epoch": 296} {"train_loss": -26.489282608032227, "global_step": 35896, "epoch": 296} {"train_loss": -24.616750717163086, "global_step": 35897, "epoch": 296} {"train_loss": -28.772497177124023, "global_step": 35898, "epoch": 296} {"train_loss": -25.423063278198242, "global_step": 35899, "epoch": 296} {"train_loss": -28.24884605407715, "global_step": 35900, "epoch": 296} {"train_loss": -28.40357780456543, "global_step": 35901, "epoch": 296} {"train_loss": -27.804540634155273, "global_step": 35902, "epoch": 296} {"train_loss": -27.950204849243164, "global_step": 35903, "epoch": 296} {"train_loss": -29.109333038330078, "global_step": 35904, "epoch": 296} {"train_loss": -29.162353515625, "global_step": 35905, "epoch": 296} {"train_loss": -28.326162338256836, "global_step": 35906, "epoch": 296} {"train_loss": -28.88983726501465, "global_step": 35907, "epoch": 296} {"train_loss": -29.48369789123535, "global_step": 35908, "epoch": 296} {"train_loss": -29.2702693939209, "global_step": 35909, "epoch": 296} {"train_loss": -29.583160400390625, "global_step": 35910, "epoch": 296} {"train_loss": -29.698841094970703, "global_step": 35911, "epoch": 296} {"train_loss": -29.366830825805664, "global_step": 35912, "epoch": 296} {"train_loss": -29.67832374572754, "global_step": 35913, "epoch": 296} {"train_loss": -29.261539459228516, "global_step": 35914, "epoch": 296} {"train_loss": -29.603199005126953, "global_step": 35915, "epoch": 296} {"train_loss": -30.326221466064453, "global_step": 35916, "epoch": 296} {"train_loss": -30.06076431274414, "global_step": 35917, "epoch": 296} {"train_loss": -30.040075302124023, "global_step": 35918, "epoch": 296} {"train_loss": -29.8872127532959, "global_step": 35919, "epoch": 296} {"train_loss": -29.918073654174805, "global_step": 35920, "epoch": 296} {"train_loss": -29.571395874023438, "global_step": 35921, "epoch": 296} {"train_loss": -30.021020889282227, "global_step": 35922, "epoch": 296} {"train_loss": -30.329330444335938, "global_step": 35923, "epoch": 296} {"train_loss": -30.84331703186035, "global_step": 35924, "epoch": 296} {"train_loss": -30.287113189697266, "global_step": 35925, "epoch": 296} {"train_loss": -30.464981079101562, "global_step": 35926, "epoch": 296} {"train_loss": -31.17563247680664, "global_step": 35927, "epoch": 296} {"train_loss": -31.034032821655273, "global_step": 35928, "epoch": 296} {"train_loss": -31.102649688720703, "global_step": 35929, "epoch": 296} {"train_loss": -30.038440704345703, "global_step": 35930, "epoch": 296} {"train_loss": -30.289642333984375, "global_step": 35931, "epoch": 296} {"train_loss": -31.3754940032959, "global_step": 35932, "epoch": 296} {"train_loss": -30.574371337890625, "global_step": 35933, "epoch": 296} {"train_loss": -30.76572608947754, "global_step": 35934, "epoch": 296} {"train_loss": -31.726428985595703, "global_step": 35935, "epoch": 296} {"train_loss": -30.341029285399383, "global_step": 35936, "epoch": 296, "val_loss": 2491713.75} {"train_loss": -31.334074020385742, "global_step": 35937, "epoch": 297} {"train_loss": -30.3316593170166, "global_step": 35938, "epoch": 297} {"train_loss": -30.211181640625, "global_step": 35939, "epoch": 297} {"train_loss": -31.839935302734375, "global_step": 35940, "epoch": 297} {"train_loss": -29.17823600769043, "global_step": 35941, "epoch": 297} {"train_loss": -31.991979598999023, "global_step": 35942, "epoch": 297} {"train_loss": -30.67488670349121, "global_step": 35943, "epoch": 297} {"train_loss": -32.332122802734375, "global_step": 35944, "epoch": 297} {"train_loss": -31.54999351501465, "global_step": 35945, "epoch": 297} {"train_loss": -31.335968017578125, "global_step": 35946, "epoch": 297} {"train_loss": -32.671417236328125, "global_step": 35947, "epoch": 297} {"train_loss": -32.74188995361328, "global_step": 35948, "epoch": 297} {"train_loss": -32.218994140625, "global_step": 35949, "epoch": 297} {"train_loss": -33.770668029785156, "global_step": 35950, "epoch": 297} {"train_loss": -33.897003173828125, "global_step": 35951, "epoch": 297} {"train_loss": -33.757354736328125, "global_step": 35952, "epoch": 297} {"train_loss": -33.32994079589844, "global_step": 35953, "epoch": 297} {"train_loss": -33.09965133666992, "global_step": 35954, "epoch": 297} {"train_loss": -33.33661651611328, "global_step": 35955, "epoch": 297} {"train_loss": -33.52387237548828, "global_step": 35956, "epoch": 297} {"train_loss": -33.076026916503906, "global_step": 35957, "epoch": 297} {"train_loss": -33.71849822998047, "global_step": 35958, "epoch": 297} {"train_loss": -33.8050422668457, "global_step": 35959, "epoch": 297} {"train_loss": -33.979732513427734, "global_step": 35960, "epoch": 297} {"train_loss": -33.82634353637695, "global_step": 35961, "epoch": 297} {"train_loss": -34.264869689941406, "global_step": 35962, "epoch": 297} {"train_loss": -33.20529556274414, "global_step": 35963, "epoch": 297} {"train_loss": -32.3198356628418, "global_step": 35964, "epoch": 297} {"train_loss": -32.45626449584961, "global_step": 35965, "epoch": 297} {"train_loss": -34.10700607299805, "global_step": 35966, "epoch": 297} {"train_loss": -34.55143356323242, "global_step": 35967, "epoch": 297} {"train_loss": -33.77122116088867, "global_step": 35968, "epoch": 297} {"train_loss": -33.25722122192383, "global_step": 35969, "epoch": 297} {"train_loss": -32.46973419189453, "global_step": 35970, "epoch": 297} {"train_loss": -32.99319076538086, "global_step": 35971, "epoch": 297} {"train_loss": -32.47426986694336, "global_step": 35972, "epoch": 297} {"train_loss": -33.21683883666992, "global_step": 35973, "epoch": 297} {"train_loss": -33.82101058959961, "global_step": 35974, "epoch": 297} {"train_loss": -31.63344383239746, "global_step": 35975, "epoch": 297} {"train_loss": -33.51641845703125, "global_step": 35976, "epoch": 297} {"train_loss": -33.641658782958984, "global_step": 35977, "epoch": 297} {"train_loss": -33.07748031616211, "global_step": 35978, "epoch": 297} {"train_loss": -32.661476135253906, "global_step": 35979, "epoch": 297} {"train_loss": -33.0462646484375, "global_step": 35980, "epoch": 297} {"train_loss": -32.559322357177734, "global_step": 35981, "epoch": 297} {"train_loss": -31.856164932250977, "global_step": 35982, "epoch": 297} {"train_loss": -33.58431625366211, "global_step": 35983, "epoch": 297} {"train_loss": -32.961158752441406, "global_step": 35984, "epoch": 297} {"train_loss": -33.68160629272461, "global_step": 35985, "epoch": 297} {"train_loss": -33.58225631713867, "global_step": 35986, "epoch": 297} {"train_loss": -33.74761962890625, "global_step": 35987, "epoch": 297} {"train_loss": -34.596038818359375, "global_step": 35988, "epoch": 297} {"train_loss": -33.067848205566406, "global_step": 35989, "epoch": 297} {"train_loss": -34.09370803833008, "global_step": 35990, "epoch": 297} {"train_loss": -33.251007080078125, "global_step": 35991, "epoch": 297} {"train_loss": -33.436683654785156, "global_step": 35992, "epoch": 297} {"train_loss": -33.31402587890625, "global_step": 35993, "epoch": 297} {"train_loss": -33.921783447265625, "global_step": 35994, "epoch": 297} {"train_loss": -31.592041015625, "global_step": 35995, "epoch": 297} {"train_loss": -32.36494445800781, "global_step": 35996, "epoch": 297} {"train_loss": -33.355926513671875, "global_step": 35997, "epoch": 297} {"train_loss": -32.353660583496094, "global_step": 35998, "epoch": 297} {"train_loss": -32.5416259765625, "global_step": 35999, "epoch": 297} {"train_loss": -32.10121536254883, "global_step": 36000, "epoch": 297} {"train_loss": -32.54804611206055, "global_step": 36001, "epoch": 297} {"train_loss": -32.96083450317383, "global_step": 36002, "epoch": 297} {"train_loss": -33.18044662475586, "global_step": 36003, "epoch": 297} {"train_loss": -33.17107009887695, "global_step": 36004, "epoch": 297} {"train_loss": -33.768611907958984, "global_step": 36005, "epoch": 297} {"train_loss": -32.68782043457031, "global_step": 36006, "epoch": 297} {"train_loss": -32.73768615722656, "global_step": 36007, "epoch": 297} {"train_loss": -33.73699951171875, "global_step": 36008, "epoch": 297} {"train_loss": -32.94559860229492, "global_step": 36009, "epoch": 297} {"train_loss": -33.999000549316406, "global_step": 36010, "epoch": 297} {"train_loss": -33.377689361572266, "global_step": 36011, "epoch": 297} {"train_loss": -33.84126281738281, "global_step": 36012, "epoch": 297} {"train_loss": -33.77877426147461, "global_step": 36013, "epoch": 297} {"train_loss": -33.79938507080078, "global_step": 36014, "epoch": 297} {"train_loss": -33.76052474975586, "global_step": 36015, "epoch": 297} {"train_loss": -33.78040313720703, "global_step": 36016, "epoch": 297} {"train_loss": -33.59959030151367, "global_step": 36017, "epoch": 297} {"train_loss": -33.97178268432617, "global_step": 36018, "epoch": 297} {"train_loss": -34.26943588256836, "global_step": 36019, "epoch": 297} {"train_loss": -33.874603271484375, "global_step": 36020, "epoch": 297} {"train_loss": -33.875640869140625, "global_step": 36021, "epoch": 297} {"train_loss": -34.245887756347656, "global_step": 36022, "epoch": 297} {"train_loss": -33.548213958740234, "global_step": 36023, "epoch": 297} {"train_loss": -33.8619499206543, "global_step": 36024, "epoch": 297} {"train_loss": -33.596275329589844, "global_step": 36025, "epoch": 297} {"train_loss": -34.234710693359375, "global_step": 36026, "epoch": 297} {"train_loss": -33.90421676635742, "global_step": 36027, "epoch": 297} {"train_loss": -34.22486114501953, "global_step": 36028, "epoch": 297} {"train_loss": -34.3863410949707, "global_step": 36029, "epoch": 297} {"train_loss": -34.03365707397461, "global_step": 36030, "epoch": 297} {"train_loss": -34.14136505126953, "global_step": 36031, "epoch": 297} {"train_loss": -34.0062141418457, "global_step": 36032, "epoch": 297} {"train_loss": -33.971832275390625, "global_step": 36033, "epoch": 297} {"train_loss": -33.67677688598633, "global_step": 36034, "epoch": 297} {"train_loss": -33.93619155883789, "global_step": 36035, "epoch": 297} {"train_loss": -34.28553009033203, "global_step": 36036, "epoch": 297} {"train_loss": -34.32719039916992, "global_step": 36037, "epoch": 297} {"train_loss": -34.630306243896484, "global_step": 36038, "epoch": 297} {"train_loss": -34.37983322143555, "global_step": 36039, "epoch": 297} {"train_loss": -34.17647171020508, "global_step": 36040, "epoch": 297} {"train_loss": -33.83919906616211, "global_step": 36041, "epoch": 297} {"train_loss": -33.58890914916992, "global_step": 36042, "epoch": 297} {"train_loss": -34.894046783447266, "global_step": 36043, "epoch": 297} {"train_loss": -34.28522491455078, "global_step": 36044, "epoch": 297} {"train_loss": -32.016693115234375, "global_step": 36045, "epoch": 297} {"train_loss": -29.40622329711914, "global_step": 36046, "epoch": 297} {"train_loss": -27.207616806030273, "global_step": 36047, "epoch": 297} {"train_loss": -27.696048736572266, "global_step": 36048, "epoch": 297} {"train_loss": -30.91718864440918, "global_step": 36049, "epoch": 297} {"train_loss": -33.336753845214844, "global_step": 36050, "epoch": 297} {"train_loss": -30.555316925048828, "global_step": 36051, "epoch": 297} {"train_loss": -30.052200317382812, "global_step": 36052, "epoch": 297} {"train_loss": -28.861658096313477, "global_step": 36053, "epoch": 297} {"train_loss": -30.8554744720459, "global_step": 36054, "epoch": 297} {"train_loss": -30.97283363342285, "global_step": 36055, "epoch": 297} {"train_loss": -32.70966720581055, "global_step": 36056, "epoch": 297} {"train_loss": -32.954459844541944, "global_step": 36057, "epoch": 297, "val_loss": 2673091.0} {"train_loss": -31.4000244140625, "global_step": 36058, "epoch": 298} {"train_loss": -32.999176025390625, "global_step": 36059, "epoch": 298} {"train_loss": -31.466796875, "global_step": 36060, "epoch": 298} {"train_loss": -33.01912307739258, "global_step": 36061, "epoch": 298} {"train_loss": -32.720821380615234, "global_step": 36062, "epoch": 298} {"train_loss": -32.557106018066406, "global_step": 36063, "epoch": 298} {"train_loss": -31.779027938842773, "global_step": 36064, "epoch": 298} {"train_loss": -33.02337646484375, "global_step": 36065, "epoch": 298} {"train_loss": -31.5949649810791, "global_step": 36066, "epoch": 298} {"train_loss": -32.63456344604492, "global_step": 36067, "epoch": 298} {"train_loss": -32.9627799987793, "global_step": 36068, "epoch": 298} {"train_loss": -32.39616012573242, "global_step": 36069, "epoch": 298} {"train_loss": -32.996299743652344, "global_step": 36070, "epoch": 298} {"train_loss": -32.677005767822266, "global_step": 36071, "epoch": 298} {"train_loss": -33.21632385253906, "global_step": 36072, "epoch": 298} {"train_loss": -33.39147186279297, "global_step": 36073, "epoch": 298} {"train_loss": -33.185420989990234, "global_step": 36074, "epoch": 298} {"train_loss": -33.735897064208984, "global_step": 36075, "epoch": 298} {"train_loss": -33.289154052734375, "global_step": 36076, "epoch": 298} {"train_loss": -33.48924255371094, "global_step": 36077, "epoch": 298} {"train_loss": -33.567115783691406, "global_step": 36078, "epoch": 298} {"train_loss": -33.356746673583984, "global_step": 36079, "epoch": 298} {"train_loss": -33.837310791015625, "global_step": 36080, "epoch": 298} {"train_loss": -33.84868240356445, "global_step": 36081, "epoch": 298} {"train_loss": -33.69393539428711, "global_step": 36082, "epoch": 298} {"train_loss": -33.8715705871582, "global_step": 36083, "epoch": 298} {"train_loss": -33.238338470458984, "global_step": 36084, "epoch": 298} {"train_loss": -33.72457504272461, "global_step": 36085, "epoch": 298} {"train_loss": -33.88345718383789, "global_step": 36086, "epoch": 298} {"train_loss": -33.6187744140625, "global_step": 36087, "epoch": 298} {"train_loss": -33.53057861328125, "global_step": 36088, "epoch": 298} {"train_loss": -34.00432586669922, "global_step": 36089, "epoch": 298} {"train_loss": -33.55769729614258, "global_step": 36090, "epoch": 298} {"train_loss": -33.75815200805664, "global_step": 36091, "epoch": 298} {"train_loss": -34.19901657104492, "global_step": 36092, "epoch": 298} {"train_loss": -34.07631301879883, "global_step": 36093, "epoch": 298} {"train_loss": -33.608272552490234, "global_step": 36094, "epoch": 298} {"train_loss": -33.080501556396484, "global_step": 36095, "epoch": 298} {"train_loss": -33.827571868896484, "global_step": 36096, "epoch": 298} {"train_loss": -33.98163604736328, "global_step": 36097, "epoch": 298} {"train_loss": -34.36782455444336, "global_step": 36098, "epoch": 298} {"train_loss": -33.7448844909668, "global_step": 36099, "epoch": 298} {"train_loss": -34.33478927612305, "global_step": 36100, "epoch": 298} {"train_loss": -34.6120719909668, "global_step": 36101, "epoch": 298} {"train_loss": -34.44354248046875, "global_step": 36102, "epoch": 298} {"train_loss": -34.409759521484375, "global_step": 36103, "epoch": 298} {"train_loss": -33.809635162353516, "global_step": 36104, "epoch": 298} {"train_loss": -33.07827377319336, "global_step": 36105, "epoch": 298} {"train_loss": -34.10149002075195, "global_step": 36106, "epoch": 298} {"train_loss": -34.760414123535156, "global_step": 36107, "epoch": 298} {"train_loss": -33.069271087646484, "global_step": 36108, "epoch": 298} {"train_loss": -32.57741165161133, "global_step": 36109, "epoch": 298} {"train_loss": -34.54826354980469, "global_step": 36110, "epoch": 298} {"train_loss": -34.4129753112793, "global_step": 36111, "epoch": 298} {"train_loss": -33.40576171875, "global_step": 36112, "epoch": 298} {"train_loss": -33.26579666137695, "global_step": 36113, "epoch": 298} {"train_loss": -34.4425163269043, "global_step": 36114, "epoch": 298} {"train_loss": -34.0830078125, "global_step": 36115, "epoch": 298} {"train_loss": -33.73200607299805, "global_step": 36116, "epoch": 298} {"train_loss": -34.37786865234375, "global_step": 36117, "epoch": 298} {"train_loss": -33.89762878417969, "global_step": 36118, "epoch": 298} {"train_loss": -33.777748107910156, "global_step": 36119, "epoch": 298} {"train_loss": -33.808834075927734, "global_step": 36120, "epoch": 298} {"train_loss": -33.61652755737305, "global_step": 36121, "epoch": 298} {"train_loss": -33.58077621459961, "global_step": 36122, "epoch": 298} {"train_loss": -33.166656494140625, "global_step": 36123, "epoch": 298} {"train_loss": -32.366172790527344, "global_step": 36124, "epoch": 298} {"train_loss": -33.769771575927734, "global_step": 36125, "epoch": 298} {"train_loss": -34.686954498291016, "global_step": 36126, "epoch": 298} {"train_loss": -33.896461486816406, "global_step": 36127, "epoch": 298} {"train_loss": -34.154090881347656, "global_step": 36128, "epoch": 298} {"train_loss": -33.24601364135742, "global_step": 36129, "epoch": 298} {"train_loss": -34.390438079833984, "global_step": 36130, "epoch": 298} {"train_loss": -34.20048904418945, "global_step": 36131, "epoch": 298} {"train_loss": -34.23759841918945, "global_step": 36132, "epoch": 298} {"train_loss": -34.233726501464844, "global_step": 36133, "epoch": 298} {"train_loss": -34.10513687133789, "global_step": 36134, "epoch": 298} {"train_loss": -33.14649200439453, "global_step": 36135, "epoch": 298} {"train_loss": -33.83802032470703, "global_step": 36136, "epoch": 298} {"train_loss": -33.87026596069336, "global_step": 36137, "epoch": 298} {"train_loss": -34.35050582885742, "global_step": 36138, "epoch": 298} {"train_loss": -33.7966194152832, "global_step": 36139, "epoch": 298} {"train_loss": -34.2176628112793, "global_step": 36140, "epoch": 298} {"train_loss": -33.39415740966797, "global_step": 36141, "epoch": 298} {"train_loss": -34.54146957397461, "global_step": 36142, "epoch": 298} {"train_loss": -33.88666534423828, "global_step": 36143, "epoch": 298} {"train_loss": -34.055171966552734, "global_step": 36144, "epoch": 298} {"train_loss": -33.48702621459961, "global_step": 36145, "epoch": 298} {"train_loss": -33.805908203125, "global_step": 36146, "epoch": 298} {"train_loss": -34.04453659057617, "global_step": 36147, "epoch": 298} {"train_loss": -33.550167083740234, "global_step": 36148, "epoch": 298} {"train_loss": -33.745506286621094, "global_step": 36149, "epoch": 298} {"train_loss": -33.94535446166992, "global_step": 36150, "epoch": 298} {"train_loss": -33.63331985473633, "global_step": 36151, "epoch": 298} {"train_loss": -34.04693603515625, "global_step": 36152, "epoch": 298} {"train_loss": -33.518218994140625, "global_step": 36153, "epoch": 298} {"train_loss": -33.90266036987305, "global_step": 36154, "epoch": 298} {"train_loss": -32.38750076293945, "global_step": 36155, "epoch": 298} {"train_loss": -33.30249786376953, "global_step": 36156, "epoch": 298} {"train_loss": -32.85092544555664, "global_step": 36157, "epoch": 298} {"train_loss": -32.38957977294922, "global_step": 36158, "epoch": 298} {"train_loss": -33.79157638549805, "global_step": 36159, "epoch": 298} {"train_loss": -34.55389404296875, "global_step": 36160, "epoch": 298} {"train_loss": -33.47906494140625, "global_step": 36161, "epoch": 298} {"train_loss": -32.90468215942383, "global_step": 36162, "epoch": 298} {"train_loss": -33.15086364746094, "global_step": 36163, "epoch": 298} {"train_loss": -32.55100631713867, "global_step": 36164, "epoch": 298} {"train_loss": -33.111351013183594, "global_step": 36165, "epoch": 298} {"train_loss": -32.170013427734375, "global_step": 36166, "epoch": 298} {"train_loss": -33.11490249633789, "global_step": 36167, "epoch": 298} {"train_loss": -33.268306732177734, "global_step": 36168, "epoch": 298} {"train_loss": -33.55554962158203, "global_step": 36169, "epoch": 298} {"train_loss": -31.55634880065918, "global_step": 36170, "epoch": 298} {"train_loss": -33.94419479370117, "global_step": 36171, "epoch": 298} {"train_loss": -33.17791748046875, "global_step": 36172, "epoch": 298} {"train_loss": -31.892658233642578, "global_step": 36173, "epoch": 298} {"train_loss": -34.46989059448242, "global_step": 36174, "epoch": 298} {"train_loss": -33.43869400024414, "global_step": 36175, "epoch": 298} {"train_loss": -33.04972457885742, "global_step": 36176, "epoch": 298} {"train_loss": -33.62434005737305, "global_step": 36177, "epoch": 298} {"train_loss": -33.51280623822173, "global_step": 36178, "epoch": 298, "val_loss": 2499216.25} {"train_loss": -33.1635856628418, "global_step": 36179, "epoch": 299} {"train_loss": -32.6669921875, "global_step": 36180, "epoch": 299} {"train_loss": -33.91091537475586, "global_step": 36181, "epoch": 299} {"train_loss": -33.592811584472656, "global_step": 36182, "epoch": 299} {"train_loss": -32.6694450378418, "global_step": 36183, "epoch": 299} {"train_loss": -32.702919006347656, "global_step": 36184, "epoch": 299} {"train_loss": -33.73844528198242, "global_step": 36185, "epoch": 299} {"train_loss": -32.996551513671875, "global_step": 36186, "epoch": 299} {"train_loss": -33.12722396850586, "global_step": 36187, "epoch": 299} {"train_loss": -33.59156799316406, "global_step": 36188, "epoch": 299} {"train_loss": -34.778602600097656, "global_step": 36189, "epoch": 299} {"train_loss": -32.8338623046875, "global_step": 36190, "epoch": 299} {"train_loss": -31.670495986938477, "global_step": 36191, "epoch": 299} {"train_loss": -30.655725479125977, "global_step": 36192, "epoch": 299} {"train_loss": -33.899513244628906, "global_step": 36193, "epoch": 299} {"train_loss": -32.31916427612305, "global_step": 36194, "epoch": 299} {"train_loss": -32.7730827331543, "global_step": 36195, "epoch": 299} {"train_loss": -31.541961669921875, "global_step": 36196, "epoch": 299} {"train_loss": -33.50667953491211, "global_step": 36197, "epoch": 299} {"train_loss": -31.254047393798828, "global_step": 36198, "epoch": 299} {"train_loss": -33.618282318115234, "global_step": 36199, "epoch": 299} {"train_loss": -32.258480072021484, "global_step": 36200, "epoch": 299} {"train_loss": -30.989912033081055, "global_step": 36201, "epoch": 299} {"train_loss": -30.943023681640625, "global_step": 36202, "epoch": 299} {"train_loss": -30.05360221862793, "global_step": 36203, "epoch": 299} {"train_loss": -31.70941162109375, "global_step": 36204, "epoch": 299} {"train_loss": -27.558887481689453, "global_step": 36205, "epoch": 299} {"train_loss": -30.576780319213867, "global_step": 36206, "epoch": 299} {"train_loss": -26.94631004333496, "global_step": 36207, "epoch": 299} {"train_loss": -27.46880531311035, "global_step": 36208, "epoch": 299} {"train_loss": -27.58601951599121, "global_step": 36209, "epoch": 299} {"train_loss": -26.965564727783203, "global_step": 36210, "epoch": 299} {"train_loss": -27.435688018798828, "global_step": 36211, "epoch": 299} {"train_loss": -27.718448638916016, "global_step": 36212, "epoch": 299} {"train_loss": -28.296890258789062, "global_step": 36213, "epoch": 299} {"train_loss": -28.39093589782715, "global_step": 36214, "epoch": 299} {"train_loss": -28.513019561767578, "global_step": 36215, "epoch": 299} {"train_loss": -28.874547958374023, "global_step": 36216, "epoch": 299} {"train_loss": -29.089094161987305, "global_step": 36217, "epoch": 299} {"train_loss": -29.338764190673828, "global_step": 36218, "epoch": 299} {"train_loss": -29.309911727905273, "global_step": 36219, "epoch": 299} {"train_loss": -29.140445709228516, "global_step": 36220, "epoch": 299} {"train_loss": -29.57444190979004, "global_step": 36221, "epoch": 299} {"train_loss": -29.957244873046875, "global_step": 36222, "epoch": 299} {"train_loss": -30.56235122680664, "global_step": 36223, "epoch": 299} {"train_loss": -30.59791374206543, "global_step": 36224, "epoch": 299} {"train_loss": -28.91873550415039, "global_step": 36225, "epoch": 299} {"train_loss": -22.89470863342285, "global_step": 36226, "epoch": 299} {"train_loss": -17.516956329345703, "global_step": 36227, "epoch": 299} {"train_loss": -25.64335060119629, "global_step": 36228, "epoch": 299} {"train_loss": -11.860346794128418, "global_step": 36229, "epoch": 299} {"train_loss": -25.771270751953125, "global_step": 36230, "epoch": 299} {"train_loss": -24.419902801513672, "global_step": 36231, "epoch": 299} {"train_loss": -27.574127197265625, "global_step": 36232, "epoch": 299} {"train_loss": -27.88917350769043, "global_step": 36233, "epoch": 299} {"train_loss": -29.4736385345459, "global_step": 36234, "epoch": 299} {"train_loss": -28.479358673095703, "global_step": 36235, "epoch": 299} {"train_loss": -28.029394149780273, "global_step": 36236, "epoch": 299} {"train_loss": -29.88563346862793, "global_step": 36237, "epoch": 299} {"train_loss": -30.30939292907715, "global_step": 36238, "epoch": 299} {"train_loss": -29.105789184570312, "global_step": 36239, "epoch": 299} {"train_loss": -28.924625396728516, "global_step": 36240, "epoch": 299} {"train_loss": -29.431604385375977, "global_step": 36241, "epoch": 299} {"train_loss": -30.218353271484375, "global_step": 36242, "epoch": 299} {"train_loss": -30.3170166015625, "global_step": 36243, "epoch": 299} {"train_loss": -30.570270538330078, "global_step": 36244, "epoch": 299} {"train_loss": -29.615955352783203, "global_step": 36245, "epoch": 299} {"train_loss": -29.768890380859375, "global_step": 36246, "epoch": 299} {"train_loss": -29.49057960510254, "global_step": 36247, "epoch": 299} {"train_loss": -28.030500411987305, "global_step": 36248, "epoch": 299} {"train_loss": -22.367645263671875, "global_step": 36249, "epoch": 299} {"train_loss": -19.81475830078125, "global_step": 36250, "epoch": 299} {"train_loss": -30.617109298706055, "global_step": 36251, "epoch": 299} {"train_loss": -23.494871139526367, "global_step": 36252, "epoch": 299} {"train_loss": -29.669485092163086, "global_step": 36253, "epoch": 299} {"train_loss": -26.772357940673828, "global_step": 36254, "epoch": 299} {"train_loss": -27.60479736328125, "global_step": 36255, "epoch": 299} {"train_loss": -29.940460205078125, "global_step": 36256, "epoch": 299} {"train_loss": -28.19988441467285, "global_step": 36257, "epoch": 299} {"train_loss": -27.475263595581055, "global_step": 36258, "epoch": 299} {"train_loss": -29.2519474029541, "global_step": 36259, "epoch": 299} {"train_loss": -29.82771110534668, "global_step": 36260, "epoch": 299} {"train_loss": -28.90228843688965, "global_step": 36261, "epoch": 299} {"train_loss": -28.94462013244629, "global_step": 36262, "epoch": 299} {"train_loss": -29.189605712890625, "global_step": 36263, "epoch": 299} {"train_loss": -28.73138999938965, "global_step": 36264, "epoch": 299} {"train_loss": -27.656036376953125, "global_step": 36265, "epoch": 299} {"train_loss": -29.572290420532227, "global_step": 36266, "epoch": 299} {"train_loss": -29.68168067932129, "global_step": 36267, "epoch": 299} {"train_loss": -29.21541404724121, "global_step": 36268, "epoch": 299} {"train_loss": -30.116073608398438, "global_step": 36269, "epoch": 299} {"train_loss": -30.252887725830078, "global_step": 36270, "epoch": 299} {"train_loss": -30.544570922851562, "global_step": 36271, "epoch": 299} {"train_loss": -30.594690322875977, "global_step": 36272, "epoch": 299} {"train_loss": -30.589948654174805, "global_step": 36273, "epoch": 299} {"train_loss": -30.220218658447266, "global_step": 36274, "epoch": 299} {"train_loss": -30.393239974975586, "global_step": 36275, "epoch": 299} {"train_loss": -30.92683219909668, "global_step": 36276, "epoch": 299} {"train_loss": -30.087055206298828, "global_step": 36277, "epoch": 299} {"train_loss": -29.506338119506836, "global_step": 36278, "epoch": 299} {"train_loss": -28.776803970336914, "global_step": 36279, "epoch": 299} {"train_loss": -27.75969886779785, "global_step": 36280, "epoch": 299} {"train_loss": -29.32842445373535, "global_step": 36281, "epoch": 299} {"train_loss": -31.474740982055664, "global_step": 36282, "epoch": 299} {"train_loss": -30.6113224029541, "global_step": 36283, "epoch": 299} {"train_loss": -30.926416397094727, "global_step": 36284, "epoch": 299} {"train_loss": -30.644697189331055, "global_step": 36285, "epoch": 299} {"train_loss": -30.840320587158203, "global_step": 36286, "epoch": 299} {"train_loss": -30.6688175201416, "global_step": 36287, "epoch": 299} {"train_loss": -31.2198486328125, "global_step": 36288, "epoch": 299} {"train_loss": -31.06549644470215, "global_step": 36289, "epoch": 299} {"train_loss": -31.12700843811035, "global_step": 36290, "epoch": 299} {"train_loss": -30.875762939453125, "global_step": 36291, "epoch": 299} {"train_loss": -31.14234733581543, "global_step": 36292, "epoch": 299} {"train_loss": -31.2937068939209, "global_step": 36293, "epoch": 299} {"train_loss": -31.05426597595215, "global_step": 36294, "epoch": 299} {"train_loss": -31.480533599853516, "global_step": 36295, "epoch": 299} {"train_loss": -31.804819107055664, "global_step": 36296, "epoch": 299} {"train_loss": -31.669279098510742, "global_step": 36297, "epoch": 299} {"train_loss": -31.814682006835938, "global_step": 36298, "epoch": 299} {"train_loss": -29.605757729081084, "global_step": 36299, "epoch": 299, "val_loss": 2541573.0} {"train_loss": -31.6932315826416, "global_step": 36300, "epoch": 300} {"train_loss": -31.92058753967285, "global_step": 36301, "epoch": 300} {"train_loss": -31.94598960876465, "global_step": 36302, "epoch": 300} {"train_loss": -32.18012619018555, "global_step": 36303, "epoch": 300} {"train_loss": -32.2965202331543, "global_step": 36304, "epoch": 300} {"train_loss": -32.0202522277832, "global_step": 36305, "epoch": 300} {"train_loss": -32.457786560058594, "global_step": 36306, "epoch": 300} {"train_loss": -32.30751419067383, "global_step": 36307, "epoch": 300} {"train_loss": -32.24586868286133, "global_step": 36308, "epoch": 300} {"train_loss": -31.842132568359375, "global_step": 36309, "epoch": 300} {"train_loss": -31.574934005737305, "global_step": 36310, "epoch": 300} {"train_loss": -28.221952438354492, "global_step": 36311, "epoch": 300} {"train_loss": -24.228818893432617, "global_step": 36312, "epoch": 300} {"train_loss": -28.168798446655273, "global_step": 36313, "epoch": 300} {"train_loss": -31.587661743164062, "global_step": 36314, "epoch": 300} {"train_loss": -29.287961959838867, "global_step": 36315, "epoch": 300} {"train_loss": -32.04237365722656, "global_step": 36316, "epoch": 300} {"train_loss": -30.668781280517578, "global_step": 36317, "epoch": 300} {"train_loss": -31.936676025390625, "global_step": 36318, "epoch": 300} {"train_loss": -31.678152084350586, "global_step": 36319, "epoch": 300} {"train_loss": -31.596302032470703, "global_step": 36320, "epoch": 300} {"train_loss": -31.496784210205078, "global_step": 36321, "epoch": 300} {"train_loss": -32.626155853271484, "global_step": 36322, "epoch": 300} {"train_loss": -31.714935302734375, "global_step": 36323, "epoch": 300} {"train_loss": -31.462860107421875, "global_step": 36324, "epoch": 300} {"train_loss": -32.17116928100586, "global_step": 36325, "epoch": 300} {"train_loss": -32.14058303833008, "global_step": 36326, "epoch": 300} {"train_loss": -30.185993194580078, "global_step": 36327, "epoch": 300} {"train_loss": -25.451467514038086, "global_step": 36328, "epoch": 300} {"train_loss": -20.9913387298584, "global_step": 36329, "epoch": 300} {"train_loss": -31.618261337280273, "global_step": 36330, "epoch": 300} {"train_loss": -28.01226806640625, "global_step": 36331, "epoch": 300} {"train_loss": -32.022544860839844, "global_step": 36332, "epoch": 300} {"train_loss": -28.904356002807617, "global_step": 36333, "epoch": 300} {"train_loss": -32.03046798706055, "global_step": 36334, "epoch": 300} {"train_loss": -31.50798988342285, "global_step": 36335, "epoch": 300} {"train_loss": -30.756567001342773, "global_step": 36336, "epoch": 300} {"train_loss": -31.830982208251953, "global_step": 36337, "epoch": 300} {"train_loss": -31.817718505859375, "global_step": 36338, "epoch": 300} {"train_loss": -31.120901107788086, "global_step": 36339, "epoch": 300} {"train_loss": -31.027236938476562, "global_step": 36340, "epoch": 300} {"train_loss": -31.954700469970703, "global_step": 36341, "epoch": 300} {"train_loss": -31.01369285583496, "global_step": 36342, "epoch": 300} {"train_loss": -29.468799591064453, "global_step": 36343, "epoch": 300} {"train_loss": -28.247241973876953, "global_step": 36344, "epoch": 300} {"train_loss": -29.015771865844727, "global_step": 36345, "epoch": 300} {"train_loss": -31.73467445373535, "global_step": 36346, "epoch": 300} {"train_loss": -31.551694869995117, "global_step": 36347, "epoch": 300} {"train_loss": -31.29718589782715, "global_step": 36348, "epoch": 300} {"train_loss": -31.388235092163086, "global_step": 36349, "epoch": 300} {"train_loss": -31.908063888549805, "global_step": 36350, "epoch": 300} {"train_loss": -32.01792526245117, "global_step": 36351, "epoch": 300} {"train_loss": -31.99014663696289, "global_step": 36352, "epoch": 300} {"train_loss": -31.401294708251953, "global_step": 36353, "epoch": 300} {"train_loss": -31.801008224487305, "global_step": 36354, "epoch": 300} {"train_loss": -32.134891510009766, "global_step": 36355, "epoch": 300} {"train_loss": -31.90008544921875, "global_step": 36356, "epoch": 300} {"train_loss": -31.826887130737305, "global_step": 36357, "epoch": 300} {"train_loss": -32.207027435302734, "global_step": 36358, "epoch": 300} {"train_loss": -31.841882705688477, "global_step": 36359, "epoch": 300} {"train_loss": -32.26180648803711, "global_step": 36360, "epoch": 300} {"train_loss": -32.088653564453125, "global_step": 36361, "epoch": 300} {"train_loss": -32.13527297973633, "global_step": 36362, "epoch": 300} {"train_loss": -32.2065315246582, "global_step": 36363, "epoch": 300} {"train_loss": -32.276851654052734, "global_step": 36364, "epoch": 300} {"train_loss": -32.0735969543457, "global_step": 36365, "epoch": 300} {"train_loss": -32.20119094848633, "global_step": 36366, "epoch": 300} {"train_loss": -32.477294921875, "global_step": 36367, "epoch": 300} {"train_loss": -32.4522819519043, "global_step": 36368, "epoch": 300} {"train_loss": -32.70124435424805, "global_step": 36369, "epoch": 300} {"train_loss": -32.424983978271484, "global_step": 36370, "epoch": 300} {"train_loss": -32.425201416015625, "global_step": 36371, "epoch": 300} {"train_loss": -32.91959762573242, "global_step": 36372, "epoch": 300} {"train_loss": -33.0379524230957, "global_step": 36373, "epoch": 300} {"train_loss": -32.69379806518555, "global_step": 36374, "epoch": 300} {"train_loss": -32.35136032104492, "global_step": 36375, "epoch": 300} {"train_loss": -32.362430572509766, "global_step": 36376, "epoch": 300} {"train_loss": -31.59956169128418, "global_step": 36377, "epoch": 300} {"train_loss": -27.690967559814453, "global_step": 36378, "epoch": 300} {"train_loss": -21.245464324951172, "global_step": 36379, "epoch": 300} {"train_loss": -19.184377670288086, "global_step": 36380, "epoch": 300} {"train_loss": -32.63566970825195, "global_step": 36381, "epoch": 300} {"train_loss": -27.1610164642334, "global_step": 36382, "epoch": 300} {"train_loss": -33.06105422973633, "global_step": 36383, "epoch": 300} {"train_loss": -28.28215980529785, "global_step": 36384, "epoch": 300} {"train_loss": -32.00966262817383, "global_step": 36385, "epoch": 300} {"train_loss": -32.1066780090332, "global_step": 36386, "epoch": 300} {"train_loss": -30.276132583618164, "global_step": 36387, "epoch": 300} {"train_loss": -31.7205867767334, "global_step": 36388, "epoch": 300} {"train_loss": -32.695350646972656, "global_step": 36389, "epoch": 300} {"train_loss": -31.94407081604004, "global_step": 36390, "epoch": 300} {"train_loss": -31.29648208618164, "global_step": 36391, "epoch": 300} {"train_loss": -32.24345779418945, "global_step": 36392, "epoch": 300} {"train_loss": -32.65837478637695, "global_step": 36393, "epoch": 300} {"train_loss": -32.38132858276367, "global_step": 36394, "epoch": 300} {"train_loss": -31.616708755493164, "global_step": 36395, "epoch": 300} {"train_loss": -32.831233978271484, "global_step": 36396, "epoch": 300} {"train_loss": -32.61524200439453, "global_step": 36397, "epoch": 300} {"train_loss": -32.77478790283203, "global_step": 36398, "epoch": 300} {"train_loss": -32.541831970214844, "global_step": 36399, "epoch": 300} {"train_loss": -32.147727966308594, "global_step": 36400, "epoch": 300} {"train_loss": -32.358314514160156, "global_step": 36401, "epoch": 300} {"train_loss": -33.36563491821289, "global_step": 36402, "epoch": 300} {"train_loss": -32.5327262878418, "global_step": 36403, "epoch": 300} {"train_loss": -32.90073013305664, "global_step": 36404, "epoch": 300} {"train_loss": -32.7070198059082, "global_step": 36405, "epoch": 300} {"train_loss": -32.09729766845703, "global_step": 36406, "epoch": 300} {"train_loss": -32.26520919799805, "global_step": 36407, "epoch": 300} {"train_loss": -32.78898239135742, "global_step": 36408, "epoch": 300} {"train_loss": -31.101667404174805, "global_step": 36409, "epoch": 300} {"train_loss": -29.272687911987305, "global_step": 36410, "epoch": 300} {"train_loss": -30.243921279907227, "global_step": 36411, "epoch": 300} {"train_loss": -30.149063110351562, "global_step": 36412, "epoch": 300} {"train_loss": -29.532230377197266, "global_step": 36413, "epoch": 300} {"train_loss": -32.04841995239258, "global_step": 36414, "epoch": 300} {"train_loss": -31.507221221923828, "global_step": 36415, "epoch": 300} {"train_loss": -31.1048641204834, "global_step": 36416, "epoch": 300} {"train_loss": -29.74356460571289, "global_step": 36417, "epoch": 300} {"train_loss": -32.04214096069336, "global_step": 36418, "epoch": 300} {"train_loss": -32.9294548034668, "global_step": 36419, "epoch": 300} {"train_loss": -31.189737130787748, "global_step": 36420, "epoch": 300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2551844.25} {"train_loss": -32.52983474731445, "global_step": 36421, "epoch": 301} {"train_loss": -32.04584884643555, "global_step": 36422, "epoch": 301} {"train_loss": -32.346153259277344, "global_step": 36423, "epoch": 301} {"train_loss": -31.62885093688965, "global_step": 36424, "epoch": 301} {"train_loss": -31.93768310546875, "global_step": 36425, "epoch": 301} {"train_loss": -31.784204483032227, "global_step": 36426, "epoch": 301} {"train_loss": -32.034027099609375, "global_step": 36427, "epoch": 301} {"train_loss": -32.65673065185547, "global_step": 36428, "epoch": 301} {"train_loss": -32.33317184448242, "global_step": 36429, "epoch": 301} {"train_loss": -30.4648494720459, "global_step": 36430, "epoch": 301} {"train_loss": -31.549457550048828, "global_step": 36431, "epoch": 301} {"train_loss": -32.37237548828125, "global_step": 36432, "epoch": 301} {"train_loss": -30.260639190673828, "global_step": 36433, "epoch": 301} {"train_loss": -30.333097457885742, "global_step": 36434, "epoch": 301} {"train_loss": -32.198360443115234, "global_step": 36435, "epoch": 301} {"train_loss": -30.37888526916504, "global_step": 36436, "epoch": 301} {"train_loss": -32.360958099365234, "global_step": 36437, "epoch": 301} {"train_loss": -31.15593910217285, "global_step": 36438, "epoch": 301} {"train_loss": -32.184871673583984, "global_step": 36439, "epoch": 301} {"train_loss": -31.63836669921875, "global_step": 36440, "epoch": 301} {"train_loss": -32.44462203979492, "global_step": 36441, "epoch": 301} {"train_loss": -32.371192932128906, "global_step": 36442, "epoch": 301} {"train_loss": -31.946996688842773, "global_step": 36443, "epoch": 301} {"train_loss": -32.1837158203125, "global_step": 36444, "epoch": 301} {"train_loss": -31.57470703125, "global_step": 36445, "epoch": 301} {"train_loss": -32.57928466796875, "global_step": 36446, "epoch": 301} {"train_loss": -31.97361183166504, "global_step": 36447, "epoch": 301} {"train_loss": -31.978687286376953, "global_step": 36448, "epoch": 301} {"train_loss": -32.74204635620117, "global_step": 36449, "epoch": 301} {"train_loss": -31.79007911682129, "global_step": 36450, "epoch": 301} {"train_loss": -32.62823486328125, "global_step": 36451, "epoch": 301} {"train_loss": -32.075111389160156, "global_step": 36452, "epoch": 301} {"train_loss": -32.53899002075195, "global_step": 36453, "epoch": 301} {"train_loss": -32.59873580932617, "global_step": 36454, "epoch": 301} {"train_loss": -32.3352165222168, "global_step": 36455, "epoch": 301} {"train_loss": -32.635963439941406, "global_step": 36456, "epoch": 301} {"train_loss": -32.87300109863281, "global_step": 36457, "epoch": 301} {"train_loss": -32.743133544921875, "global_step": 36458, "epoch": 301} {"train_loss": -32.80953598022461, "global_step": 36459, "epoch": 301} {"train_loss": -32.985939025878906, "global_step": 36460, "epoch": 301} {"train_loss": -32.809932708740234, "global_step": 36461, "epoch": 301} {"train_loss": -32.57480239868164, "global_step": 36462, "epoch": 301} {"train_loss": -32.6500129699707, "global_step": 36463, "epoch": 301} {"train_loss": -32.30228805541992, "global_step": 36464, "epoch": 301} {"train_loss": -32.33851623535156, "global_step": 36465, "epoch": 301} {"train_loss": -32.231300354003906, "global_step": 36466, "epoch": 301} {"train_loss": -33.2217903137207, "global_step": 36467, "epoch": 301} {"train_loss": -32.43715286254883, "global_step": 36468, "epoch": 301} {"train_loss": -32.41804885864258, "global_step": 36469, "epoch": 301} {"train_loss": -33.25159454345703, "global_step": 36470, "epoch": 301} {"train_loss": -32.96024703979492, "global_step": 36471, "epoch": 301} {"train_loss": -32.41950988769531, "global_step": 36472, "epoch": 301} {"train_loss": -31.08662223815918, "global_step": 36473, "epoch": 301} {"train_loss": -30.296157836914062, "global_step": 36474, "epoch": 301} {"train_loss": -31.59284019470215, "global_step": 36475, "epoch": 301} {"train_loss": -33.45024490356445, "global_step": 36476, "epoch": 301} {"train_loss": -32.230953216552734, "global_step": 36477, "epoch": 301} {"train_loss": -31.73504638671875, "global_step": 36478, "epoch": 301} {"train_loss": -31.573896408081055, "global_step": 36479, "epoch": 301} {"train_loss": -27.152082443237305, "global_step": 36480, "epoch": 301} {"train_loss": -14.7806978225708, "global_step": 36481, "epoch": 301} {"train_loss": -18.221105575561523, "global_step": 36482, "epoch": 301} {"train_loss": -32.80546188354492, "global_step": 36483, "epoch": 301} {"train_loss": -24.507099151611328, "global_step": 36484, "epoch": 301} {"train_loss": -32.90822982788086, "global_step": 36485, "epoch": 301} {"train_loss": -29.131671905517578, "global_step": 36486, "epoch": 301} {"train_loss": -30.705209732055664, "global_step": 36487, "epoch": 301} {"train_loss": -32.67670822143555, "global_step": 36488, "epoch": 301} {"train_loss": -30.9774169921875, "global_step": 36489, "epoch": 301} {"train_loss": -31.301422119140625, "global_step": 36490, "epoch": 301} {"train_loss": -32.899147033691406, "global_step": 36491, "epoch": 301} {"train_loss": -32.41585159301758, "global_step": 36492, "epoch": 301} {"train_loss": -31.412738800048828, "global_step": 36493, "epoch": 301} {"train_loss": -31.758228302001953, "global_step": 36494, "epoch": 301} {"train_loss": -32.1020393371582, "global_step": 36495, "epoch": 301} {"train_loss": -32.51849365234375, "global_step": 36496, "epoch": 301} {"train_loss": -32.362491607666016, "global_step": 36497, "epoch": 301} {"train_loss": -31.4632511138916, "global_step": 36498, "epoch": 301} {"train_loss": -32.45884323120117, "global_step": 36499, "epoch": 301} {"train_loss": -32.10676956176758, "global_step": 36500, "epoch": 301} {"train_loss": -33.06085205078125, "global_step": 36501, "epoch": 301} {"train_loss": -32.207977294921875, "global_step": 36502, "epoch": 301} {"train_loss": -33.025569915771484, "global_step": 36503, "epoch": 301} {"train_loss": -32.34910202026367, "global_step": 36504, "epoch": 301} {"train_loss": -32.1112060546875, "global_step": 36505, "epoch": 301} {"train_loss": -32.55561065673828, "global_step": 36506, "epoch": 301} {"train_loss": -32.22114562988281, "global_step": 36507, "epoch": 301} {"train_loss": -32.91518020629883, "global_step": 36508, "epoch": 301} {"train_loss": -32.001625061035156, "global_step": 36509, "epoch": 301} {"train_loss": -32.90161895751953, "global_step": 36510, "epoch": 301} {"train_loss": -32.167030334472656, "global_step": 36511, "epoch": 301} {"train_loss": -32.618568420410156, "global_step": 36512, "epoch": 301} {"train_loss": -32.950721740722656, "global_step": 36513, "epoch": 301} {"train_loss": -33.05221176147461, "global_step": 36514, "epoch": 301} {"train_loss": -33.039363861083984, "global_step": 36515, "epoch": 301} {"train_loss": -32.755577087402344, "global_step": 36516, "epoch": 301} {"train_loss": -33.011226654052734, "global_step": 36517, "epoch": 301} {"train_loss": -33.11387634277344, "global_step": 36518, "epoch": 301} {"train_loss": -33.0617790222168, "global_step": 36519, "epoch": 301} {"train_loss": -33.34341049194336, "global_step": 36520, "epoch": 301} {"train_loss": -33.43931198120117, "global_step": 36521, "epoch": 301} {"train_loss": -33.291015625, "global_step": 36522, "epoch": 301} {"train_loss": -32.65808868408203, "global_step": 36523, "epoch": 301} {"train_loss": -33.22480392456055, "global_step": 36524, "epoch": 301} {"train_loss": -32.98642349243164, "global_step": 36525, "epoch": 301} {"train_loss": -32.20808029174805, "global_step": 36526, "epoch": 301} {"train_loss": -31.240808486938477, "global_step": 36527, "epoch": 301} {"train_loss": -32.87172317504883, "global_step": 36528, "epoch": 301} {"train_loss": -32.345863342285156, "global_step": 36529, "epoch": 301} {"train_loss": -31.531274795532227, "global_step": 36530, "epoch": 301} {"train_loss": -32.50660705566406, "global_step": 36531, "epoch": 301} {"train_loss": -32.492034912109375, "global_step": 36532, "epoch": 301} {"train_loss": -30.668420791625977, "global_step": 36533, "epoch": 301} {"train_loss": -31.04669761657715, "global_step": 36534, "epoch": 301} {"train_loss": -31.523712158203125, "global_step": 36535, "epoch": 301} {"train_loss": -32.439022064208984, "global_step": 36536, "epoch": 301} {"train_loss": -32.85178756713867, "global_step": 36537, "epoch": 301} {"train_loss": -31.682233810424805, "global_step": 36538, "epoch": 301} {"train_loss": -32.47844314575195, "global_step": 36539, "epoch": 301} {"train_loss": -32.469974517822266, "global_step": 36540, "epoch": 301} {"train_loss": -31.863341331481934, "global_step": 36541, "epoch": 301, "val_loss": 2489924.25} {"train_loss": -32.87236404418945, "global_step": 36542, "epoch": 302} {"train_loss": -31.876373291015625, "global_step": 36543, "epoch": 302} {"train_loss": -32.98548126220703, "global_step": 36544, "epoch": 302} {"train_loss": -32.6673698425293, "global_step": 36545, "epoch": 302} {"train_loss": -31.782230377197266, "global_step": 36546, "epoch": 302} {"train_loss": -32.030879974365234, "global_step": 36547, "epoch": 302} {"train_loss": -31.842870712280273, "global_step": 36548, "epoch": 302} {"train_loss": -31.560712814331055, "global_step": 36549, "epoch": 302} {"train_loss": -31.536314010620117, "global_step": 36550, "epoch": 302} {"train_loss": -30.40018081665039, "global_step": 36551, "epoch": 302} {"train_loss": -27.630481719970703, "global_step": 36552, "epoch": 302} {"train_loss": -22.44060707092285, "global_step": 36553, "epoch": 302} {"train_loss": -20.925745010375977, "global_step": 36554, "epoch": 302} {"train_loss": -31.18414878845215, "global_step": 36555, "epoch": 302} {"train_loss": -28.23994255065918, "global_step": 36556, "epoch": 302} {"train_loss": -30.482282638549805, "global_step": 36557, "epoch": 302} {"train_loss": -29.04255485534668, "global_step": 36558, "epoch": 302} {"train_loss": -32.35321044921875, "global_step": 36559, "epoch": 302} {"train_loss": -30.06422233581543, "global_step": 36560, "epoch": 302} {"train_loss": -30.91301918029785, "global_step": 36561, "epoch": 302} {"train_loss": -32.074432373046875, "global_step": 36562, "epoch": 302} {"train_loss": -28.516504287719727, "global_step": 36563, "epoch": 302} {"train_loss": -30.796133041381836, "global_step": 36564, "epoch": 302} {"train_loss": -28.320709228515625, "global_step": 36565, "epoch": 302} {"train_loss": -27.03390884399414, "global_step": 36566, "epoch": 302} {"train_loss": -29.453510284423828, "global_step": 36567, "epoch": 302} {"train_loss": -26.325897216796875, "global_step": 36568, "epoch": 302} {"train_loss": -30.092529296875, "global_step": 36569, "epoch": 302} {"train_loss": -29.686325073242188, "global_step": 36570, "epoch": 302} {"train_loss": -30.224029541015625, "global_step": 36571, "epoch": 302} {"train_loss": -30.0626220703125, "global_step": 36572, "epoch": 302} {"train_loss": -29.414554595947266, "global_step": 36573, "epoch": 302} {"train_loss": -31.803197860717773, "global_step": 36574, "epoch": 302} {"train_loss": -31.303930282592773, "global_step": 36575, "epoch": 302} {"train_loss": -29.136388778686523, "global_step": 36576, "epoch": 302} {"train_loss": -31.335163116455078, "global_step": 36577, "epoch": 302} {"train_loss": -31.763446807861328, "global_step": 36578, "epoch": 302} {"train_loss": -31.201435089111328, "global_step": 36579, "epoch": 302} {"train_loss": -31.672758102416992, "global_step": 36580, "epoch": 302} {"train_loss": -32.09513473510742, "global_step": 36581, "epoch": 302} {"train_loss": -32.4244499206543, "global_step": 36582, "epoch": 302} {"train_loss": -31.227161407470703, "global_step": 36583, "epoch": 302} {"train_loss": -31.80462646484375, "global_step": 36584, "epoch": 302} {"train_loss": -32.12699890136719, "global_step": 36585, "epoch": 302} {"train_loss": -32.610042572021484, "global_step": 36586, "epoch": 302} {"train_loss": -32.251461029052734, "global_step": 36587, "epoch": 302} {"train_loss": -32.20757293701172, "global_step": 36588, "epoch": 302} {"train_loss": -31.94112205505371, "global_step": 36589, "epoch": 302} {"train_loss": -32.1817512512207, "global_step": 36590, "epoch": 302} {"train_loss": -32.78409194946289, "global_step": 36591, "epoch": 302} {"train_loss": -32.51857376098633, "global_step": 36592, "epoch": 302} {"train_loss": -32.59076690673828, "global_step": 36593, "epoch": 302} {"train_loss": -32.36268997192383, "global_step": 36594, "epoch": 302} {"train_loss": -32.41520309448242, "global_step": 36595, "epoch": 302} {"train_loss": -32.91267013549805, "global_step": 36596, "epoch": 302} {"train_loss": -32.69561004638672, "global_step": 36597, "epoch": 302} {"train_loss": -32.957786560058594, "global_step": 36598, "epoch": 302} {"train_loss": -32.696041107177734, "global_step": 36599, "epoch": 302} {"train_loss": -32.78071975708008, "global_step": 36600, "epoch": 302} {"train_loss": -32.81174850463867, "global_step": 36601, "epoch": 302} {"train_loss": -33.144142150878906, "global_step": 36602, "epoch": 302} {"train_loss": -33.06873321533203, "global_step": 36603, "epoch": 302} {"train_loss": -33.6883659362793, "global_step": 36604, "epoch": 302} {"train_loss": -33.69045639038086, "global_step": 36605, "epoch": 302} {"train_loss": -33.23008728027344, "global_step": 36606, "epoch": 302} {"train_loss": -33.09705352783203, "global_step": 36607, "epoch": 302} {"train_loss": -32.39078903198242, "global_step": 36608, "epoch": 302} {"train_loss": -32.057472229003906, "global_step": 36609, "epoch": 302} {"train_loss": -28.36260986328125, "global_step": 36610, "epoch": 302} {"train_loss": -18.55913734436035, "global_step": 36611, "epoch": 302} {"train_loss": -17.671039581298828, "global_step": 36612, "epoch": 302} {"train_loss": -32.001949310302734, "global_step": 36613, "epoch": 302} {"train_loss": -25.982336044311523, "global_step": 36614, "epoch": 302} {"train_loss": -31.591909408569336, "global_step": 36615, "epoch": 302} {"train_loss": -26.55927085876465, "global_step": 36616, "epoch": 302} {"train_loss": -32.445194244384766, "global_step": 36617, "epoch": 302} {"train_loss": -29.455881118774414, "global_step": 36618, "epoch": 302} {"train_loss": -29.88434410095215, "global_step": 36619, "epoch": 302} {"train_loss": -29.2376766204834, "global_step": 36620, "epoch": 302} {"train_loss": -29.46022605895996, "global_step": 36621, "epoch": 302} {"train_loss": -31.103551864624023, "global_step": 36622, "epoch": 302} {"train_loss": -30.699548721313477, "global_step": 36623, "epoch": 302} {"train_loss": -28.04436683654785, "global_step": 36624, "epoch": 302} {"train_loss": -29.521926879882812, "global_step": 36625, "epoch": 302} {"train_loss": -31.272993087768555, "global_step": 36626, "epoch": 302} {"train_loss": -27.28303337097168, "global_step": 36627, "epoch": 302} {"train_loss": -30.557294845581055, "global_step": 36628, "epoch": 302} {"train_loss": -29.69333839416504, "global_step": 36629, "epoch": 302} {"train_loss": -29.137470245361328, "global_step": 36630, "epoch": 302} {"train_loss": -29.6671142578125, "global_step": 36631, "epoch": 302} {"train_loss": -30.587873458862305, "global_step": 36632, "epoch": 302} {"train_loss": -28.8629207611084, "global_step": 36633, "epoch": 302} {"train_loss": -30.059539794921875, "global_step": 36634, "epoch": 302} {"train_loss": -30.233936309814453, "global_step": 36635, "epoch": 302} {"train_loss": -28.560544967651367, "global_step": 36636, "epoch": 302} {"train_loss": -29.991195678710938, "global_step": 36637, "epoch": 302} {"train_loss": -29.45907974243164, "global_step": 36638, "epoch": 302} {"train_loss": -29.63518714904785, "global_step": 36639, "epoch": 302} {"train_loss": -30.070398330688477, "global_step": 36640, "epoch": 302} {"train_loss": -30.963232040405273, "global_step": 36641, "epoch": 302} {"train_loss": -31.08621597290039, "global_step": 36642, "epoch": 302} {"train_loss": -30.884796142578125, "global_step": 36643, "epoch": 302} {"train_loss": -30.50562858581543, "global_step": 36644, "epoch": 302} {"train_loss": -30.908300399780273, "global_step": 36645, "epoch": 302} {"train_loss": -30.991132736206055, "global_step": 36646, "epoch": 302} {"train_loss": -30.937047958374023, "global_step": 36647, "epoch": 302} {"train_loss": -31.262134552001953, "global_step": 36648, "epoch": 302} {"train_loss": -28.227447509765625, "global_step": 36649, "epoch": 302} {"train_loss": -31.19379234313965, "global_step": 36650, "epoch": 302} {"train_loss": -30.730030059814453, "global_step": 36651, "epoch": 302} {"train_loss": -30.39165687561035, "global_step": 36652, "epoch": 302} {"train_loss": -31.125818252563477, "global_step": 36653, "epoch": 302} {"train_loss": -31.16485595703125, "global_step": 36654, "epoch": 302} {"train_loss": -30.842899322509766, "global_step": 36655, "epoch": 302} {"train_loss": -30.39692497253418, "global_step": 36656, "epoch": 302} {"train_loss": -30.693845748901367, "global_step": 36657, "epoch": 302} {"train_loss": -31.275495529174805, "global_step": 36658, "epoch": 302} {"train_loss": -31.496963500976562, "global_step": 36659, "epoch": 302} {"train_loss": -31.287433624267578, "global_step": 36660, "epoch": 302} {"train_loss": -29.691221237182617, "global_step": 36661, "epoch": 302} {"train_loss": -30.50302957897344, "global_step": 36662, "epoch": 302, "val_loss": 2627458.0} {"train_loss": -31.51799964904785, "global_step": 36663, "epoch": 303} {"train_loss": -30.061145782470703, "global_step": 36664, "epoch": 303} {"train_loss": -31.087793350219727, "global_step": 36665, "epoch": 303} {"train_loss": -31.381744384765625, "global_step": 36666, "epoch": 303} {"train_loss": -31.767337799072266, "global_step": 36667, "epoch": 303} {"train_loss": -31.023542404174805, "global_step": 36668, "epoch": 303} {"train_loss": -32.1034049987793, "global_step": 36669, "epoch": 303} {"train_loss": -31.794403076171875, "global_step": 36670, "epoch": 303} {"train_loss": -31.743803024291992, "global_step": 36671, "epoch": 303} {"train_loss": -31.988744735717773, "global_step": 36672, "epoch": 303} {"train_loss": -31.493366241455078, "global_step": 36673, "epoch": 303} {"train_loss": -31.778711318969727, "global_step": 36674, "epoch": 303} {"train_loss": -31.73334312438965, "global_step": 36675, "epoch": 303} {"train_loss": -32.02854537963867, "global_step": 36676, "epoch": 303} {"train_loss": -32.312530517578125, "global_step": 36677, "epoch": 303} {"train_loss": -32.264129638671875, "global_step": 36678, "epoch": 303} {"train_loss": -32.196292877197266, "global_step": 36679, "epoch": 303} {"train_loss": -32.01861572265625, "global_step": 36680, "epoch": 303} {"train_loss": -32.109066009521484, "global_step": 36681, "epoch": 303} {"train_loss": -32.57643508911133, "global_step": 36682, "epoch": 303} {"train_loss": -32.64655685424805, "global_step": 36683, "epoch": 303} {"train_loss": -32.2741584777832, "global_step": 36684, "epoch": 303} {"train_loss": -32.83659744262695, "global_step": 36685, "epoch": 303} {"train_loss": -32.685211181640625, "global_step": 36686, "epoch": 303} {"train_loss": -32.656986236572266, "global_step": 36687, "epoch": 303} {"train_loss": -33.20859909057617, "global_step": 36688, "epoch": 303} {"train_loss": -33.204524993896484, "global_step": 36689, "epoch": 303} {"train_loss": -33.11770248413086, "global_step": 36690, "epoch": 303} {"train_loss": -33.392822265625, "global_step": 36691, "epoch": 303} {"train_loss": -33.20887756347656, "global_step": 36692, "epoch": 303} {"train_loss": -33.17604446411133, "global_step": 36693, "epoch": 303} {"train_loss": -33.44364929199219, "global_step": 36694, "epoch": 303} {"train_loss": -33.586395263671875, "global_step": 36695, "epoch": 303} {"train_loss": -33.48826217651367, "global_step": 36696, "epoch": 303} {"train_loss": -33.45085525512695, "global_step": 36697, "epoch": 303} {"train_loss": -33.505882263183594, "global_step": 36698, "epoch": 303} {"train_loss": -33.922908782958984, "global_step": 36699, "epoch": 303} {"train_loss": -33.59435272216797, "global_step": 36700, "epoch": 303} {"train_loss": -33.735198974609375, "global_step": 36701, "epoch": 303} {"train_loss": -33.98911666870117, "global_step": 36702, "epoch": 303} {"train_loss": -33.75164794921875, "global_step": 36703, "epoch": 303} {"train_loss": -33.71010208129883, "global_step": 36704, "epoch": 303} {"train_loss": -33.676963806152344, "global_step": 36705, "epoch": 303} {"train_loss": -33.72763442993164, "global_step": 36706, "epoch": 303} {"train_loss": -34.14836502075195, "global_step": 36707, "epoch": 303} {"train_loss": -34.23550033569336, "global_step": 36708, "epoch": 303} {"train_loss": -33.92086410522461, "global_step": 36709, "epoch": 303} {"train_loss": -34.24044418334961, "global_step": 36710, "epoch": 303} {"train_loss": -33.90675354003906, "global_step": 36711, "epoch": 303} {"train_loss": -34.1795539855957, "global_step": 36712, "epoch": 303} {"train_loss": -34.13726806640625, "global_step": 36713, "epoch": 303} {"train_loss": -33.55536651611328, "global_step": 36714, "epoch": 303} {"train_loss": -34.50791549682617, "global_step": 36715, "epoch": 303} {"train_loss": -34.45554733276367, "global_step": 36716, "epoch": 303} {"train_loss": -33.51597213745117, "global_step": 36717, "epoch": 303} {"train_loss": -34.06104278564453, "global_step": 36718, "epoch": 303} {"train_loss": -34.2743034362793, "global_step": 36719, "epoch": 303} {"train_loss": -32.959651947021484, "global_step": 36720, "epoch": 303} {"train_loss": -30.017303466796875, "global_step": 36721, "epoch": 303} {"train_loss": -18.880264282226562, "global_step": 36722, "epoch": 303} {"train_loss": 5.250229358673096, "global_step": 36723, "epoch": 303} {"train_loss": -17.886917114257812, "global_step": 36724, "epoch": 303} {"train_loss": -27.984466552734375, "global_step": 36725, "epoch": 303} {"train_loss": -27.635099411010742, "global_step": 36726, "epoch": 303} {"train_loss": -27.318395614624023, "global_step": 36727, "epoch": 303} {"train_loss": -32.25703048706055, "global_step": 36728, "epoch": 303} {"train_loss": -27.54121971130371, "global_step": 36729, "epoch": 303} {"train_loss": -31.010908126831055, "global_step": 36730, "epoch": 303} {"train_loss": -32.42887496948242, "global_step": 36731, "epoch": 303} {"train_loss": -30.087060928344727, "global_step": 36732, "epoch": 303} {"train_loss": -30.274612426757812, "global_step": 36733, "epoch": 303} {"train_loss": -30.593847274780273, "global_step": 36734, "epoch": 303} {"train_loss": -31.826007843017578, "global_step": 36735, "epoch": 303} {"train_loss": -31.67742347717285, "global_step": 36736, "epoch": 303} {"train_loss": -30.039968490600586, "global_step": 36737, "epoch": 303} {"train_loss": -31.4759464263916, "global_step": 36738, "epoch": 303} {"train_loss": -31.82086753845215, "global_step": 36739, "epoch": 303} {"train_loss": -32.29154586791992, "global_step": 36740, "epoch": 303} {"train_loss": -29.003477096557617, "global_step": 36741, "epoch": 303} {"train_loss": -31.955900192260742, "global_step": 36742, "epoch": 303} {"train_loss": -29.345285415649414, "global_step": 36743, "epoch": 303} {"train_loss": -30.83233070373535, "global_step": 36744, "epoch": 303} {"train_loss": -31.747343063354492, "global_step": 36745, "epoch": 303} {"train_loss": -31.866926193237305, "global_step": 36746, "epoch": 303} {"train_loss": -32.35224151611328, "global_step": 36747, "epoch": 303} {"train_loss": -31.371164321899414, "global_step": 36748, "epoch": 303} {"train_loss": -31.161787033081055, "global_step": 36749, "epoch": 303} {"train_loss": -29.1599178314209, "global_step": 36750, "epoch": 303} {"train_loss": -31.200178146362305, "global_step": 36751, "epoch": 303} {"train_loss": -31.954626083374023, "global_step": 36752, "epoch": 303} {"train_loss": -31.26116371154785, "global_step": 36753, "epoch": 303} {"train_loss": -31.558380126953125, "global_step": 36754, "epoch": 303} {"train_loss": -31.510663986206055, "global_step": 36755, "epoch": 303} {"train_loss": -31.226476669311523, "global_step": 36756, "epoch": 303} {"train_loss": -31.52052116394043, "global_step": 36757, "epoch": 303} {"train_loss": -29.797269821166992, "global_step": 36758, "epoch": 303} {"train_loss": -31.338342666625977, "global_step": 36759, "epoch": 303} {"train_loss": -31.55389404296875, "global_step": 36760, "epoch": 303} {"train_loss": -31.51190185546875, "global_step": 36761, "epoch": 303} {"train_loss": -31.248687744140625, "global_step": 36762, "epoch": 303} {"train_loss": -31.356552124023438, "global_step": 36763, "epoch": 303} {"train_loss": -31.317106246948242, "global_step": 36764, "epoch": 303} {"train_loss": -32.07557678222656, "global_step": 36765, "epoch": 303} {"train_loss": -31.807641983032227, "global_step": 36766, "epoch": 303} {"train_loss": -31.66939353942871, "global_step": 36767, "epoch": 303} {"train_loss": -31.24649429321289, "global_step": 36768, "epoch": 303} {"train_loss": -32.143402099609375, "global_step": 36769, "epoch": 303} {"train_loss": -32.15653610229492, "global_step": 36770, "epoch": 303} {"train_loss": -32.02244567871094, "global_step": 36771, "epoch": 303} {"train_loss": -32.1004638671875, "global_step": 36772, "epoch": 303} {"train_loss": -31.675962448120117, "global_step": 36773, "epoch": 303} {"train_loss": -32.081764221191406, "global_step": 36774, "epoch": 303} {"train_loss": -32.20769119262695, "global_step": 36775, "epoch": 303} {"train_loss": -32.35481643676758, "global_step": 36776, "epoch": 303} {"train_loss": -31.8051700592041, "global_step": 36777, "epoch": 303} {"train_loss": -32.40888595581055, "global_step": 36778, "epoch": 303} {"train_loss": -32.980323791503906, "global_step": 36779, "epoch": 303} {"train_loss": -32.76139831542969, "global_step": 36780, "epoch": 303} {"train_loss": -32.65752410888672, "global_step": 36781, "epoch": 303} {"train_loss": -32.78470993041992, "global_step": 36782, "epoch": 303} {"train_loss": -31.554299011703364, "global_step": 36783, "epoch": 303, "val_loss": 2596090.0} {"train_loss": -32.170562744140625, "global_step": 36784, "epoch": 304} {"train_loss": -32.570980072021484, "global_step": 36785, "epoch": 304} {"train_loss": -32.9614143371582, "global_step": 36786, "epoch": 304} {"train_loss": -32.68680953979492, "global_step": 36787, "epoch": 304} {"train_loss": -32.77090072631836, "global_step": 36788, "epoch": 304} {"train_loss": -32.793312072753906, "global_step": 36789, "epoch": 304} {"train_loss": -32.42298126220703, "global_step": 36790, "epoch": 304} {"train_loss": -32.24715042114258, "global_step": 36791, "epoch": 304} {"train_loss": -32.73637008666992, "global_step": 36792, "epoch": 304} {"train_loss": -32.154541015625, "global_step": 36793, "epoch": 304} {"train_loss": -33.31986618041992, "global_step": 36794, "epoch": 304} {"train_loss": -32.90913772583008, "global_step": 36795, "epoch": 304} {"train_loss": -32.811275482177734, "global_step": 36796, "epoch": 304} {"train_loss": -32.3585319519043, "global_step": 36797, "epoch": 304} {"train_loss": -33.01585006713867, "global_step": 36798, "epoch": 304} {"train_loss": -33.48358154296875, "global_step": 36799, "epoch": 304} {"train_loss": -33.35185623168945, "global_step": 36800, "epoch": 304} {"train_loss": -32.67108917236328, "global_step": 36801, "epoch": 304} {"train_loss": -32.82173156738281, "global_step": 36802, "epoch": 304} {"train_loss": -33.1496696472168, "global_step": 36803, "epoch": 304} {"train_loss": -33.15438461303711, "global_step": 36804, "epoch": 304} {"train_loss": -33.06938934326172, "global_step": 36805, "epoch": 304} {"train_loss": -31.523056030273438, "global_step": 36806, "epoch": 304} {"train_loss": -32.3933219909668, "global_step": 36807, "epoch": 304} {"train_loss": -31.52483558654785, "global_step": 36808, "epoch": 304} {"train_loss": -30.885238647460938, "global_step": 36809, "epoch": 304} {"train_loss": -30.6630916595459, "global_step": 36810, "epoch": 304} {"train_loss": -30.2523136138916, "global_step": 36811, "epoch": 304} {"train_loss": -31.553634643554688, "global_step": 36812, "epoch": 304} {"train_loss": -32.473262786865234, "global_step": 36813, "epoch": 304} {"train_loss": -31.83329200744629, "global_step": 36814, "epoch": 304} {"train_loss": -33.1699104309082, "global_step": 36815, "epoch": 304} {"train_loss": -32.54449462890625, "global_step": 36816, "epoch": 304} {"train_loss": -30.0498104095459, "global_step": 36817, "epoch": 304} {"train_loss": -31.420135498046875, "global_step": 36818, "epoch": 304} {"train_loss": -33.29402160644531, "global_step": 36819, "epoch": 304} {"train_loss": -32.06177520751953, "global_step": 36820, "epoch": 304} {"train_loss": -31.749774932861328, "global_step": 36821, "epoch": 304} {"train_loss": -32.3879508972168, "global_step": 36822, "epoch": 304} {"train_loss": -33.349266052246094, "global_step": 36823, "epoch": 304} {"train_loss": -32.77582931518555, "global_step": 36824, "epoch": 304} {"train_loss": -33.1352424621582, "global_step": 36825, "epoch": 304} {"train_loss": -32.225276947021484, "global_step": 36826, "epoch": 304} {"train_loss": -33.24054718017578, "global_step": 36827, "epoch": 304} {"train_loss": -32.2464714050293, "global_step": 36828, "epoch": 304} {"train_loss": -33.739112854003906, "global_step": 36829, "epoch": 304} {"train_loss": -32.89033126831055, "global_step": 36830, "epoch": 304} {"train_loss": -32.11980438232422, "global_step": 36831, "epoch": 304} {"train_loss": -31.534942626953125, "global_step": 36832, "epoch": 304} {"train_loss": -32.674598693847656, "global_step": 36833, "epoch": 304} {"train_loss": -32.30893325805664, "global_step": 36834, "epoch": 304} {"train_loss": -32.94160842895508, "global_step": 36835, "epoch": 304} {"train_loss": -32.779388427734375, "global_step": 36836, "epoch": 304} {"train_loss": -32.67434310913086, "global_step": 36837, "epoch": 304} {"train_loss": -32.067039489746094, "global_step": 36838, "epoch": 304} {"train_loss": -31.91742515563965, "global_step": 36839, "epoch": 304} {"train_loss": -31.43896484375, "global_step": 36840, "epoch": 304} {"train_loss": -32.060787200927734, "global_step": 36841, "epoch": 304} {"train_loss": -31.873090744018555, "global_step": 36842, "epoch": 304} {"train_loss": -31.78509521484375, "global_step": 36843, "epoch": 304} {"train_loss": -32.16709518432617, "global_step": 36844, "epoch": 304} {"train_loss": -31.90895652770996, "global_step": 36845, "epoch": 304} {"train_loss": -29.315784454345703, "global_step": 36846, "epoch": 304} {"train_loss": -29.198123931884766, "global_step": 36847, "epoch": 304} {"train_loss": -28.116485595703125, "global_step": 36848, "epoch": 304} {"train_loss": -30.45794677734375, "global_step": 36849, "epoch": 304} {"train_loss": -32.64374923706055, "global_step": 36850, "epoch": 304} {"train_loss": -31.718847274780273, "global_step": 36851, "epoch": 304} {"train_loss": -29.856775283813477, "global_step": 36852, "epoch": 304} {"train_loss": -31.647058486938477, "global_step": 36853, "epoch": 304} {"train_loss": -32.60680389404297, "global_step": 36854, "epoch": 304} {"train_loss": -31.453893661499023, "global_step": 36855, "epoch": 304} {"train_loss": -31.697595596313477, "global_step": 36856, "epoch": 304} {"train_loss": -31.80853271484375, "global_step": 36857, "epoch": 304} {"train_loss": -31.297887802124023, "global_step": 36858, "epoch": 304} {"train_loss": -31.970752716064453, "global_step": 36859, "epoch": 304} {"train_loss": -31.260290145874023, "global_step": 36860, "epoch": 304} {"train_loss": -31.643972396850586, "global_step": 36861, "epoch": 304} {"train_loss": -31.4904727935791, "global_step": 36862, "epoch": 304} {"train_loss": -31.927539825439453, "global_step": 36863, "epoch": 304} {"train_loss": -32.169776916503906, "global_step": 36864, "epoch": 304} {"train_loss": -31.509836196899414, "global_step": 36865, "epoch": 304} {"train_loss": -32.173519134521484, "global_step": 36866, "epoch": 304} {"train_loss": -31.88319206237793, "global_step": 36867, "epoch": 304} {"train_loss": -32.24098205566406, "global_step": 36868, "epoch": 304} {"train_loss": -31.523162841796875, "global_step": 36869, "epoch": 304} {"train_loss": -32.16215133666992, "global_step": 36870, "epoch": 304} {"train_loss": -32.5200309753418, "global_step": 36871, "epoch": 304} {"train_loss": -31.983203887939453, "global_step": 36872, "epoch": 304} {"train_loss": -32.226234436035156, "global_step": 36873, "epoch": 304} {"train_loss": -32.439735412597656, "global_step": 36874, "epoch": 304} {"train_loss": -32.408843994140625, "global_step": 36875, "epoch": 304} {"train_loss": -32.24050521850586, "global_step": 36876, "epoch": 304} {"train_loss": -32.39527130126953, "global_step": 36877, "epoch": 304} {"train_loss": -32.582359313964844, "global_step": 36878, "epoch": 304} {"train_loss": -32.7154655456543, "global_step": 36879, "epoch": 304} {"train_loss": -32.60685729980469, "global_step": 36880, "epoch": 304} {"train_loss": -32.552494049072266, "global_step": 36881, "epoch": 304} {"train_loss": -32.33515930175781, "global_step": 36882, "epoch": 304} {"train_loss": -32.69292449951172, "global_step": 36883, "epoch": 304} {"train_loss": -32.5566520690918, "global_step": 36884, "epoch": 304} {"train_loss": -32.62917709350586, "global_step": 36885, "epoch": 304} {"train_loss": -32.12617874145508, "global_step": 36886, "epoch": 304} {"train_loss": -32.05550003051758, "global_step": 36887, "epoch": 304} {"train_loss": -32.99794387817383, "global_step": 36888, "epoch": 304} {"train_loss": -32.806190490722656, "global_step": 36889, "epoch": 304} {"train_loss": -31.927820205688477, "global_step": 36890, "epoch": 304} {"train_loss": -32.384613037109375, "global_step": 36891, "epoch": 304} {"train_loss": -32.82288360595703, "global_step": 36892, "epoch": 304} {"train_loss": -33.23723220825195, "global_step": 36893, "epoch": 304} {"train_loss": -32.567569732666016, "global_step": 36894, "epoch": 304} {"train_loss": -32.60378646850586, "global_step": 36895, "epoch": 304} {"train_loss": -33.227176666259766, "global_step": 36896, "epoch": 304} {"train_loss": -32.72241973876953, "global_step": 36897, "epoch": 304} {"train_loss": -31.202543258666992, "global_step": 36898, "epoch": 304} {"train_loss": -32.331851959228516, "global_step": 36899, "epoch": 304} {"train_loss": -33.651607513427734, "global_step": 36900, "epoch": 304} {"train_loss": -32.471527099609375, "global_step": 36901, "epoch": 304} {"train_loss": -32.329254150390625, "global_step": 36902, "epoch": 304} {"train_loss": -33.56119918823242, "global_step": 36903, "epoch": 304} {"train_loss": -32.21304739014176, "global_step": 36904, "epoch": 304, "val_loss": 2518765.0} {"train_loss": -33.52657699584961, "global_step": 36905, "epoch": 305} {"train_loss": -32.863094329833984, "global_step": 36906, "epoch": 305} {"train_loss": -33.86205291748047, "global_step": 36907, "epoch": 305} {"train_loss": -33.33994674682617, "global_step": 36908, "epoch": 305} {"train_loss": -33.14034652709961, "global_step": 36909, "epoch": 305} {"train_loss": -33.59135818481445, "global_step": 36910, "epoch": 305} {"train_loss": -33.617889404296875, "global_step": 36911, "epoch": 305} {"train_loss": -33.2513542175293, "global_step": 36912, "epoch": 305} {"train_loss": -33.045875549316406, "global_step": 36913, "epoch": 305} {"train_loss": -34.113624572753906, "global_step": 36914, "epoch": 305} {"train_loss": -33.02212142944336, "global_step": 36915, "epoch": 305} {"train_loss": -32.67363357543945, "global_step": 36916, "epoch": 305} {"train_loss": -33.25661849975586, "global_step": 36917, "epoch": 305} {"train_loss": -33.5394401550293, "global_step": 36918, "epoch": 305} {"train_loss": -32.37819290161133, "global_step": 36919, "epoch": 305} {"train_loss": -33.46541976928711, "global_step": 36920, "epoch": 305} {"train_loss": -33.63874053955078, "global_step": 36921, "epoch": 305} {"train_loss": -33.78770065307617, "global_step": 36922, "epoch": 305} {"train_loss": -34.044677734375, "global_step": 36923, "epoch": 305} {"train_loss": -33.8857536315918, "global_step": 36924, "epoch": 305} {"train_loss": -33.74553680419922, "global_step": 36925, "epoch": 305} {"train_loss": -33.30832290649414, "global_step": 36926, "epoch": 305} {"train_loss": -33.5947380065918, "global_step": 36927, "epoch": 305} {"train_loss": -34.04166793823242, "global_step": 36928, "epoch": 305} {"train_loss": -32.12092590332031, "global_step": 36929, "epoch": 305} {"train_loss": -31.74033546447754, "global_step": 36930, "epoch": 305} {"train_loss": -33.107666015625, "global_step": 36931, "epoch": 305} {"train_loss": -33.43407440185547, "global_step": 36932, "epoch": 305} {"train_loss": -32.47536849975586, "global_step": 36933, "epoch": 305} {"train_loss": -33.084346771240234, "global_step": 36934, "epoch": 305} {"train_loss": -32.64039993286133, "global_step": 36935, "epoch": 305} {"train_loss": -32.36845016479492, "global_step": 36936, "epoch": 305} {"train_loss": -32.43130874633789, "global_step": 36937, "epoch": 305} {"train_loss": -32.24674606323242, "global_step": 36938, "epoch": 305} {"train_loss": -31.5855712890625, "global_step": 36939, "epoch": 305} {"train_loss": -31.912500381469727, "global_step": 36940, "epoch": 305} {"train_loss": -31.903430938720703, "global_step": 36941, "epoch": 305} {"train_loss": -29.8924617767334, "global_step": 36942, "epoch": 305} {"train_loss": -31.002979278564453, "global_step": 36943, "epoch": 305} {"train_loss": -31.970050811767578, "global_step": 36944, "epoch": 305} {"train_loss": -27.172199249267578, "global_step": 36945, "epoch": 305} {"train_loss": -32.17185592651367, "global_step": 36946, "epoch": 305} {"train_loss": -29.873334884643555, "global_step": 36947, "epoch": 305} {"train_loss": -32.54501724243164, "global_step": 36948, "epoch": 305} {"train_loss": -30.374792098999023, "global_step": 36949, "epoch": 305} {"train_loss": -31.610319137573242, "global_step": 36950, "epoch": 305} {"train_loss": -31.57037925720215, "global_step": 36951, "epoch": 305} {"train_loss": -30.9721622467041, "global_step": 36952, "epoch": 305} {"train_loss": -32.004329681396484, "global_step": 36953, "epoch": 305} {"train_loss": -30.881139755249023, "global_step": 36954, "epoch": 305} {"train_loss": -31.012226104736328, "global_step": 36955, "epoch": 305} {"train_loss": -31.042524337768555, "global_step": 36956, "epoch": 305} {"train_loss": -29.874906539916992, "global_step": 36957, "epoch": 305} {"train_loss": -29.759063720703125, "global_step": 36958, "epoch": 305} {"train_loss": -31.765466690063477, "global_step": 36959, "epoch": 305} {"train_loss": -31.504575729370117, "global_step": 36960, "epoch": 305} {"train_loss": -31.336566925048828, "global_step": 36961, "epoch": 305} {"train_loss": -29.7819766998291, "global_step": 36962, "epoch": 305} {"train_loss": -31.208362579345703, "global_step": 36963, "epoch": 305} {"train_loss": -30.723281860351562, "global_step": 36964, "epoch": 305} {"train_loss": -29.022205352783203, "global_step": 36965, "epoch": 305} {"train_loss": -30.343351364135742, "global_step": 36966, "epoch": 305} {"train_loss": -29.630538940429688, "global_step": 36967, "epoch": 305} {"train_loss": -30.187332153320312, "global_step": 36968, "epoch": 305} {"train_loss": -27.748397827148438, "global_step": 36969, "epoch": 305} {"train_loss": -29.666746139526367, "global_step": 36970, "epoch": 305} {"train_loss": -31.05510902404785, "global_step": 36971, "epoch": 305} {"train_loss": -30.417158126831055, "global_step": 36972, "epoch": 305} {"train_loss": -28.1029109954834, "global_step": 36973, "epoch": 305} {"train_loss": -31.7215576171875, "global_step": 36974, "epoch": 305} {"train_loss": -30.809125900268555, "global_step": 36975, "epoch": 305} {"train_loss": -31.150466918945312, "global_step": 36976, "epoch": 305} {"train_loss": -28.58917808532715, "global_step": 36977, "epoch": 305} {"train_loss": -28.56317710876465, "global_step": 36978, "epoch": 305} {"train_loss": -29.73042869567871, "global_step": 36979, "epoch": 305} {"train_loss": -30.37257194519043, "global_step": 36980, "epoch": 305} {"train_loss": -30.4805965423584, "global_step": 36981, "epoch": 305} {"train_loss": -30.721729278564453, "global_step": 36982, "epoch": 305} {"train_loss": -29.23231315612793, "global_step": 36983, "epoch": 305} {"train_loss": -28.806869506835938, "global_step": 36984, "epoch": 305} {"train_loss": -30.684412002563477, "global_step": 36985, "epoch": 305} {"train_loss": -31.451690673828125, "global_step": 36986, "epoch": 305} {"train_loss": -30.34330177307129, "global_step": 36987, "epoch": 305} {"train_loss": -29.83332633972168, "global_step": 36988, "epoch": 305} {"train_loss": -31.485578536987305, "global_step": 36989, "epoch": 305} {"train_loss": -30.529132843017578, "global_step": 36990, "epoch": 305} {"train_loss": -31.435028076171875, "global_step": 36991, "epoch": 305} {"train_loss": -31.42127799987793, "global_step": 36992, "epoch": 305} {"train_loss": -27.97075843811035, "global_step": 36993, "epoch": 305} {"train_loss": -31.190433502197266, "global_step": 36994, "epoch": 305} {"train_loss": -30.899463653564453, "global_step": 36995, "epoch": 305} {"train_loss": -31.02924919128418, "global_step": 36996, "epoch": 305} {"train_loss": -31.1263370513916, "global_step": 36997, "epoch": 305} {"train_loss": -30.222631454467773, "global_step": 36998, "epoch": 305} {"train_loss": -31.6241455078125, "global_step": 36999, "epoch": 305} {"train_loss": -31.65787124633789, "global_step": 37000, "epoch": 305} {"train_loss": -31.31426429748535, "global_step": 37001, "epoch": 305} {"train_loss": -31.688962936401367, "global_step": 37002, "epoch": 305} {"train_loss": -31.560102462768555, "global_step": 37003, "epoch": 305} {"train_loss": -31.976593017578125, "global_step": 37004, "epoch": 305} {"train_loss": -32.21978759765625, "global_step": 37005, "epoch": 305} {"train_loss": -31.94862174987793, "global_step": 37006, "epoch": 305} {"train_loss": -31.452001571655273, "global_step": 37007, "epoch": 305} {"train_loss": -31.028339385986328, "global_step": 37008, "epoch": 305} {"train_loss": -32.176048278808594, "global_step": 37009, "epoch": 305} {"train_loss": -31.65631103515625, "global_step": 37010, "epoch": 305} {"train_loss": -32.31962203979492, "global_step": 37011, "epoch": 305} {"train_loss": -32.20454406738281, "global_step": 37012, "epoch": 305} {"train_loss": -31.84486198425293, "global_step": 37013, "epoch": 305} {"train_loss": -32.219966888427734, "global_step": 37014, "epoch": 305} {"train_loss": -32.20015335083008, "global_step": 37015, "epoch": 305} {"train_loss": -32.46366500854492, "global_step": 37016, "epoch": 305} {"train_loss": -32.41960906982422, "global_step": 37017, "epoch": 305} {"train_loss": -32.04571533203125, "global_step": 37018, "epoch": 305} {"train_loss": -32.63967514038086, "global_step": 37019, "epoch": 305} {"train_loss": -32.28622055053711, "global_step": 37020, "epoch": 305} {"train_loss": -32.19769287109375, "global_step": 37021, "epoch": 305} {"train_loss": -33.00155258178711, "global_step": 37022, "epoch": 305} {"train_loss": -32.67767333984375, "global_step": 37023, "epoch": 305} {"train_loss": -33.001853942871094, "global_step": 37024, "epoch": 305} {"train_loss": -31.626962157320385, "global_step": 37025, "epoch": 305, "val_loss": 2457487.25} {"train_loss": -33.056270599365234, "global_step": 37026, "epoch": 306} {"train_loss": -32.8862419128418, "global_step": 37027, "epoch": 306} {"train_loss": -32.9369010925293, "global_step": 37028, "epoch": 306} {"train_loss": -32.6871223449707, "global_step": 37029, "epoch": 306} {"train_loss": -33.38700866699219, "global_step": 37030, "epoch": 306} {"train_loss": -33.311614990234375, "global_step": 37031, "epoch": 306} {"train_loss": -33.09348678588867, "global_step": 37032, "epoch": 306} {"train_loss": -33.077083587646484, "global_step": 37033, "epoch": 306} {"train_loss": -32.07513427734375, "global_step": 37034, "epoch": 306} {"train_loss": -30.951391220092773, "global_step": 37035, "epoch": 306} {"train_loss": -31.188535690307617, "global_step": 37036, "epoch": 306} {"train_loss": -32.832672119140625, "global_step": 37037, "epoch": 306} {"train_loss": -33.334903717041016, "global_step": 37038, "epoch": 306} {"train_loss": -30.690542221069336, "global_step": 37039, "epoch": 306} {"train_loss": -28.148975372314453, "global_step": 37040, "epoch": 306} {"train_loss": -30.1812744140625, "global_step": 37041, "epoch": 306} {"train_loss": -33.19045639038086, "global_step": 37042, "epoch": 306} {"train_loss": -31.38433837890625, "global_step": 37043, "epoch": 306} {"train_loss": -32.309661865234375, "global_step": 37044, "epoch": 306} {"train_loss": -33.60376739501953, "global_step": 37045, "epoch": 306} {"train_loss": -32.403709411621094, "global_step": 37046, "epoch": 306} {"train_loss": -33.40694046020508, "global_step": 37047, "epoch": 306} {"train_loss": -32.588558197021484, "global_step": 37048, "epoch": 306} {"train_loss": -34.04841995239258, "global_step": 37049, "epoch": 306} {"train_loss": -32.98899459838867, "global_step": 37050, "epoch": 306} {"train_loss": -33.92089080810547, "global_step": 37051, "epoch": 306} {"train_loss": -33.12285232543945, "global_step": 37052, "epoch": 306} {"train_loss": -33.80717849731445, "global_step": 37053, "epoch": 306} {"train_loss": -33.602481842041016, "global_step": 37054, "epoch": 306} {"train_loss": -33.56745529174805, "global_step": 37055, "epoch": 306} {"train_loss": -33.821044921875, "global_step": 37056, "epoch": 306} {"train_loss": -33.499053955078125, "global_step": 37057, "epoch": 306} {"train_loss": -33.30825424194336, "global_step": 37058, "epoch": 306} {"train_loss": -33.8772087097168, "global_step": 37059, "epoch": 306} {"train_loss": -33.831153869628906, "global_step": 37060, "epoch": 306} {"train_loss": -33.61040115356445, "global_step": 37061, "epoch": 306} {"train_loss": -34.077796936035156, "global_step": 37062, "epoch": 306} {"train_loss": -33.89284896850586, "global_step": 37063, "epoch": 306} {"train_loss": -34.177635192871094, "global_step": 37064, "epoch": 306} {"train_loss": -34.0463752746582, "global_step": 37065, "epoch": 306} {"train_loss": -34.2226676940918, "global_step": 37066, "epoch": 306} {"train_loss": -33.6722297668457, "global_step": 37067, "epoch": 306} {"train_loss": -33.94279098510742, "global_step": 37068, "epoch": 306} {"train_loss": -33.39785385131836, "global_step": 37069, "epoch": 306} {"train_loss": -33.863502502441406, "global_step": 37070, "epoch": 306} {"train_loss": -34.07468795776367, "global_step": 37071, "epoch": 306} {"train_loss": -33.260406494140625, "global_step": 37072, "epoch": 306} {"train_loss": -33.82291793823242, "global_step": 37073, "epoch": 306} {"train_loss": -34.08395004272461, "global_step": 37074, "epoch": 306} {"train_loss": -33.50895309448242, "global_step": 37075, "epoch": 306} {"train_loss": -33.8447265625, "global_step": 37076, "epoch": 306} {"train_loss": -33.60590362548828, "global_step": 37077, "epoch": 306} {"train_loss": -33.61299514770508, "global_step": 37078, "epoch": 306} {"train_loss": -33.84846115112305, "global_step": 37079, "epoch": 306} {"train_loss": -33.11739730834961, "global_step": 37080, "epoch": 306} {"train_loss": -33.4869384765625, "global_step": 37081, "epoch": 306} {"train_loss": -33.24222946166992, "global_step": 37082, "epoch": 306} {"train_loss": -32.59490966796875, "global_step": 37083, "epoch": 306} {"train_loss": -32.989654541015625, "global_step": 37084, "epoch": 306} {"train_loss": -33.07648849487305, "global_step": 37085, "epoch": 306} {"train_loss": -32.774017333984375, "global_step": 37086, "epoch": 306} {"train_loss": -31.819019317626953, "global_step": 37087, "epoch": 306} {"train_loss": -31.775836944580078, "global_step": 37088, "epoch": 306} {"train_loss": -31.200885772705078, "global_step": 37089, "epoch": 306} {"train_loss": -23.167112350463867, "global_step": 37090, "epoch": 306} {"train_loss": -19.647594451904297, "global_step": 37091, "epoch": 306} {"train_loss": -27.907636642456055, "global_step": 37092, "epoch": 306} {"train_loss": -30.723785400390625, "global_step": 37093, "epoch": 306} {"train_loss": -28.596881866455078, "global_step": 37094, "epoch": 306} {"train_loss": -31.851886749267578, "global_step": 37095, "epoch": 306} {"train_loss": -29.876256942749023, "global_step": 37096, "epoch": 306} {"train_loss": -31.17823600769043, "global_step": 37097, "epoch": 306} {"train_loss": -31.687768936157227, "global_step": 37098, "epoch": 306} {"train_loss": -30.251916885375977, "global_step": 37099, "epoch": 306} {"train_loss": -32.017024993896484, "global_step": 37100, "epoch": 306} {"train_loss": -32.09181594848633, "global_step": 37101, "epoch": 306} {"train_loss": -30.93234634399414, "global_step": 37102, "epoch": 306} {"train_loss": -31.959821701049805, "global_step": 37103, "epoch": 306} {"train_loss": -32.23291015625, "global_step": 37104, "epoch": 306} {"train_loss": -31.939987182617188, "global_step": 37105, "epoch": 306} {"train_loss": -31.651208877563477, "global_step": 37106, "epoch": 306} {"train_loss": -31.924137115478516, "global_step": 37107, "epoch": 306} {"train_loss": -31.710920333862305, "global_step": 37108, "epoch": 306} {"train_loss": -32.70473861694336, "global_step": 37109, "epoch": 306} {"train_loss": -30.92510414123535, "global_step": 37110, "epoch": 306} {"train_loss": -32.765594482421875, "global_step": 37111, "epoch": 306} {"train_loss": -31.504907608032227, "global_step": 37112, "epoch": 306} {"train_loss": -31.57745933532715, "global_step": 37113, "epoch": 306} {"train_loss": -32.611236572265625, "global_step": 37114, "epoch": 306} {"train_loss": -32.178035736083984, "global_step": 37115, "epoch": 306} {"train_loss": -32.62369918823242, "global_step": 37116, "epoch": 306} {"train_loss": -32.95185852050781, "global_step": 37117, "epoch": 306} {"train_loss": -32.319156646728516, "global_step": 37118, "epoch": 306} {"train_loss": -32.41267776489258, "global_step": 37119, "epoch": 306} {"train_loss": -32.64394760131836, "global_step": 37120, "epoch": 306} {"train_loss": -32.4625129699707, "global_step": 37121, "epoch": 306} {"train_loss": -32.71038818359375, "global_step": 37122, "epoch": 306} {"train_loss": -33.50217819213867, "global_step": 37123, "epoch": 306} {"train_loss": -32.8675422668457, "global_step": 37124, "epoch": 306} {"train_loss": -33.11689758300781, "global_step": 37125, "epoch": 306} {"train_loss": -33.36383819580078, "global_step": 37126, "epoch": 306} {"train_loss": -33.250484466552734, "global_step": 37127, "epoch": 306} {"train_loss": -33.0589714050293, "global_step": 37128, "epoch": 306} {"train_loss": -32.81789779663086, "global_step": 37129, "epoch": 306} {"train_loss": -33.60760498046875, "global_step": 37130, "epoch": 306} {"train_loss": -33.1385383605957, "global_step": 37131, "epoch": 306} {"train_loss": -33.55570602416992, "global_step": 37132, "epoch": 306} {"train_loss": -33.458045959472656, "global_step": 37133, "epoch": 306} {"train_loss": -33.434444427490234, "global_step": 37134, "epoch": 306} {"train_loss": -33.11945724487305, "global_step": 37135, "epoch": 306} {"train_loss": -32.87981414794922, "global_step": 37136, "epoch": 306} {"train_loss": -31.824344635009766, "global_step": 37137, "epoch": 306} {"train_loss": -30.828466415405273, "global_step": 37138, "epoch": 306} {"train_loss": -29.041833877563477, "global_step": 37139, "epoch": 306} {"train_loss": -26.738004684448242, "global_step": 37140, "epoch": 306} {"train_loss": -25.727224349975586, "global_step": 37141, "epoch": 306} {"train_loss": -29.77874755859375, "global_step": 37142, "epoch": 306} {"train_loss": -33.1530647277832, "global_step": 37143, "epoch": 306} {"train_loss": -31.43682289123535, "global_step": 37144, "epoch": 306} {"train_loss": -30.41948890686035, "global_step": 37145, "epoch": 306} {"train_loss": -32.28075180368975, "global_step": 37146, "epoch": 306, "val_loss": 2693713.75} {"train_loss": -30.56977653503418, "global_step": 37147, "epoch": 307} {"train_loss": -32.61430740356445, "global_step": 37148, "epoch": 307} {"train_loss": -31.114599227905273, "global_step": 37149, "epoch": 307} {"train_loss": -32.913490295410156, "global_step": 37150, "epoch": 307} {"train_loss": -31.8320255279541, "global_step": 37151, "epoch": 307} {"train_loss": -32.28443145751953, "global_step": 37152, "epoch": 307} {"train_loss": -31.516782760620117, "global_step": 37153, "epoch": 307} {"train_loss": -32.850318908691406, "global_step": 37154, "epoch": 307} {"train_loss": -31.593265533447266, "global_step": 37155, "epoch": 307} {"train_loss": -32.7686653137207, "global_step": 37156, "epoch": 307} {"train_loss": -32.183815002441406, "global_step": 37157, "epoch": 307} {"train_loss": -32.50630187988281, "global_step": 37158, "epoch": 307} {"train_loss": -32.12458038330078, "global_step": 37159, "epoch": 307} {"train_loss": -31.446609497070312, "global_step": 37160, "epoch": 307} {"train_loss": -33.30106735229492, "global_step": 37161, "epoch": 307} {"train_loss": -31.727750778198242, "global_step": 37162, "epoch": 307} {"train_loss": -32.85302734375, "global_step": 37163, "epoch": 307} {"train_loss": -32.1611328125, "global_step": 37164, "epoch": 307} {"train_loss": -32.050514221191406, "global_step": 37165, "epoch": 307} {"train_loss": -32.74619674682617, "global_step": 37166, "epoch": 307} {"train_loss": -32.583595275878906, "global_step": 37167, "epoch": 307} {"train_loss": -32.00592041015625, "global_step": 37168, "epoch": 307} {"train_loss": -32.06976318359375, "global_step": 37169, "epoch": 307} {"train_loss": -32.53790283203125, "global_step": 37170, "epoch": 307} {"train_loss": -30.647003173828125, "global_step": 37171, "epoch": 307} {"train_loss": -31.207517623901367, "global_step": 37172, "epoch": 307} {"train_loss": -32.32647705078125, "global_step": 37173, "epoch": 307} {"train_loss": -32.23474884033203, "global_step": 37174, "epoch": 307} {"train_loss": -31.964651107788086, "global_step": 37175, "epoch": 307} {"train_loss": -31.915708541870117, "global_step": 37176, "epoch": 307} {"train_loss": -31.751890182495117, "global_step": 37177, "epoch": 307} {"train_loss": -32.40811538696289, "global_step": 37178, "epoch": 307} {"train_loss": -31.230329513549805, "global_step": 37179, "epoch": 307} {"train_loss": -31.2950496673584, "global_step": 37180, "epoch": 307} {"train_loss": -32.75529098510742, "global_step": 37181, "epoch": 307} {"train_loss": -32.36334228515625, "global_step": 37182, "epoch": 307} {"train_loss": -32.54508590698242, "global_step": 37183, "epoch": 307} {"train_loss": -32.40583419799805, "global_step": 37184, "epoch": 307} {"train_loss": -32.46631622314453, "global_step": 37185, "epoch": 307} {"train_loss": -32.31987380981445, "global_step": 37186, "epoch": 307} {"train_loss": -32.55841827392578, "global_step": 37187, "epoch": 307} {"train_loss": -32.59827423095703, "global_step": 37188, "epoch": 307} {"train_loss": -32.83812713623047, "global_step": 37189, "epoch": 307} {"train_loss": -32.485992431640625, "global_step": 37190, "epoch": 307} {"train_loss": -32.48139572143555, "global_step": 37191, "epoch": 307} {"train_loss": -32.47977828979492, "global_step": 37192, "epoch": 307} {"train_loss": -31.55608558654785, "global_step": 37193, "epoch": 307} {"train_loss": -32.13147735595703, "global_step": 37194, "epoch": 307} {"train_loss": -32.097259521484375, "global_step": 37195, "epoch": 307} {"train_loss": -32.535369873046875, "global_step": 37196, "epoch": 307} {"train_loss": -32.778621673583984, "global_step": 37197, "epoch": 307} {"train_loss": -33.19132614135742, "global_step": 37198, "epoch": 307} {"train_loss": -32.59668731689453, "global_step": 37199, "epoch": 307} {"train_loss": -32.320953369140625, "global_step": 37200, "epoch": 307} {"train_loss": -32.21029281616211, "global_step": 37201, "epoch": 307} {"train_loss": -32.50733184814453, "global_step": 37202, "epoch": 307} {"train_loss": -31.905155181884766, "global_step": 37203, "epoch": 307} {"train_loss": -31.887235641479492, "global_step": 37204, "epoch": 307} {"train_loss": -31.919971466064453, "global_step": 37205, "epoch": 307} {"train_loss": -33.355926513671875, "global_step": 37206, "epoch": 307} {"train_loss": -32.574703216552734, "global_step": 37207, "epoch": 307} {"train_loss": -30.7676944732666, "global_step": 37208, "epoch": 307} {"train_loss": -32.30215835571289, "global_step": 37209, "epoch": 307} {"train_loss": -32.99025344848633, "global_step": 37210, "epoch": 307} {"train_loss": -31.999740600585938, "global_step": 37211, "epoch": 307} {"train_loss": -32.010169982910156, "global_step": 37212, "epoch": 307} {"train_loss": -33.32658386230469, "global_step": 37213, "epoch": 307} {"train_loss": -32.04375076293945, "global_step": 37214, "epoch": 307} {"train_loss": -32.99391555786133, "global_step": 37215, "epoch": 307} {"train_loss": -32.96308898925781, "global_step": 37216, "epoch": 307} {"train_loss": -32.30072784423828, "global_step": 37217, "epoch": 307} {"train_loss": -33.0104866027832, "global_step": 37218, "epoch": 307} {"train_loss": -32.97364807128906, "global_step": 37219, "epoch": 307} {"train_loss": -33.31867218017578, "global_step": 37220, "epoch": 307} {"train_loss": -33.023555755615234, "global_step": 37221, "epoch": 307} {"train_loss": -32.90452575683594, "global_step": 37222, "epoch": 307} {"train_loss": -33.396236419677734, "global_step": 37223, "epoch": 307} {"train_loss": -33.22288513183594, "global_step": 37224, "epoch": 307} {"train_loss": -33.37446975708008, "global_step": 37225, "epoch": 307} {"train_loss": -33.20731735229492, "global_step": 37226, "epoch": 307} {"train_loss": -32.97359085083008, "global_step": 37227, "epoch": 307} {"train_loss": -33.317684173583984, "global_step": 37228, "epoch": 307} {"train_loss": -33.049407958984375, "global_step": 37229, "epoch": 307} {"train_loss": -33.59176254272461, "global_step": 37230, "epoch": 307} {"train_loss": -32.87192153930664, "global_step": 37231, "epoch": 307} {"train_loss": -32.66764450073242, "global_step": 37232, "epoch": 307} {"train_loss": -33.66819381713867, "global_step": 37233, "epoch": 307} {"train_loss": -33.85416793823242, "global_step": 37234, "epoch": 307} {"train_loss": -34.00059127807617, "global_step": 37235, "epoch": 307} {"train_loss": -33.42820358276367, "global_step": 37236, "epoch": 307} {"train_loss": -33.60956573486328, "global_step": 37237, "epoch": 307} {"train_loss": -33.80082321166992, "global_step": 37238, "epoch": 307} {"train_loss": -33.69636154174805, "global_step": 37239, "epoch": 307} {"train_loss": -34.096702575683594, "global_step": 37240, "epoch": 307} {"train_loss": -33.76201629638672, "global_step": 37241, "epoch": 307} {"train_loss": -32.9659538269043, "global_step": 37242, "epoch": 307} {"train_loss": -34.4683952331543, "global_step": 37243, "epoch": 307} {"train_loss": -33.80514907836914, "global_step": 37244, "epoch": 307} {"train_loss": -33.775306701660156, "global_step": 37245, "epoch": 307} {"train_loss": -34.26991653442383, "global_step": 37246, "epoch": 307} {"train_loss": -34.3756217956543, "global_step": 37247, "epoch": 307} {"train_loss": -33.938697814941406, "global_step": 37248, "epoch": 307} {"train_loss": -33.31612777709961, "global_step": 37249, "epoch": 307} {"train_loss": -32.801849365234375, "global_step": 37250, "epoch": 307} {"train_loss": -34.230438232421875, "global_step": 37251, "epoch": 307} {"train_loss": -33.95105743408203, "global_step": 37252, "epoch": 307} {"train_loss": -33.531490325927734, "global_step": 37253, "epoch": 307} {"train_loss": -34.30406951904297, "global_step": 37254, "epoch": 307} {"train_loss": -33.687774658203125, "global_step": 37255, "epoch": 307} {"train_loss": -33.836761474609375, "global_step": 37256, "epoch": 307} {"train_loss": -33.09109115600586, "global_step": 37257, "epoch": 307} {"train_loss": -33.43943405151367, "global_step": 37258, "epoch": 307} {"train_loss": -33.736167907714844, "global_step": 37259, "epoch": 307} {"train_loss": -33.8076057434082, "global_step": 37260, "epoch": 307} {"train_loss": -33.67129135131836, "global_step": 37261, "epoch": 307} {"train_loss": -33.914608001708984, "global_step": 37262, "epoch": 307} {"train_loss": -33.73861312866211, "global_step": 37263, "epoch": 307} {"train_loss": -33.42939376831055, "global_step": 37264, "epoch": 307} {"train_loss": -33.75735092163086, "global_step": 37265, "epoch": 307} {"train_loss": -33.95744323730469, "global_step": 37266, "epoch": 307} {"train_loss": -32.78467200413223, "global_step": 37267, "epoch": 307, "val_loss": 2614067.25} {"train_loss": -33.496517181396484, "global_step": 37268, "epoch": 308} {"train_loss": -33.48369598388672, "global_step": 37269, "epoch": 308} {"train_loss": -34.37166976928711, "global_step": 37270, "epoch": 308} {"train_loss": -33.13947677612305, "global_step": 37271, "epoch": 308} {"train_loss": -33.169586181640625, "global_step": 37272, "epoch": 308} {"train_loss": -34.021209716796875, "global_step": 37273, "epoch": 308} {"train_loss": -32.10709762573242, "global_step": 37274, "epoch": 308} {"train_loss": -31.28168296813965, "global_step": 37275, "epoch": 308} {"train_loss": -33.89518356323242, "global_step": 37276, "epoch": 308} {"train_loss": -32.57208251953125, "global_step": 37277, "epoch": 308} {"train_loss": -33.37582015991211, "global_step": 37278, "epoch": 308} {"train_loss": -32.99550247192383, "global_step": 37279, "epoch": 308} {"train_loss": -30.576526641845703, "global_step": 37280, "epoch": 308} {"train_loss": -33.94094467163086, "global_step": 37281, "epoch": 308} {"train_loss": -32.162086486816406, "global_step": 37282, "epoch": 308} {"train_loss": -32.13776779174805, "global_step": 37283, "epoch": 308} {"train_loss": -33.6797981262207, "global_step": 37284, "epoch": 308} {"train_loss": -32.338111877441406, "global_step": 37285, "epoch": 308} {"train_loss": -33.055213928222656, "global_step": 37286, "epoch": 308} {"train_loss": -32.411293029785156, "global_step": 37287, "epoch": 308} {"train_loss": -33.206172943115234, "global_step": 37288, "epoch": 308} {"train_loss": -32.84273910522461, "global_step": 37289, "epoch": 308} {"train_loss": -33.17317581176758, "global_step": 37290, "epoch": 308} {"train_loss": -32.93085861206055, "global_step": 37291, "epoch": 308} {"train_loss": -32.51079177856445, "global_step": 37292, "epoch": 308} {"train_loss": -32.95347213745117, "global_step": 37293, "epoch": 308} {"train_loss": -31.89739990234375, "global_step": 37294, "epoch": 308} {"train_loss": -33.020015716552734, "global_step": 37295, "epoch": 308} {"train_loss": -32.77362823486328, "global_step": 37296, "epoch": 308} {"train_loss": -32.47658920288086, "global_step": 37297, "epoch": 308} {"train_loss": -32.48275375366211, "global_step": 37298, "epoch": 308} {"train_loss": -32.212032318115234, "global_step": 37299, "epoch": 308} {"train_loss": -33.09391403198242, "global_step": 37300, "epoch": 308} {"train_loss": -32.7023811340332, "global_step": 37301, "epoch": 308} {"train_loss": -32.648468017578125, "global_step": 37302, "epoch": 308} {"train_loss": -33.5088996887207, "global_step": 37303, "epoch": 308} {"train_loss": -32.92877197265625, "global_step": 37304, "epoch": 308} {"train_loss": -32.70484161376953, "global_step": 37305, "epoch": 308} {"train_loss": -33.02192306518555, "global_step": 37306, "epoch": 308} {"train_loss": -33.15142822265625, "global_step": 37307, "epoch": 308} {"train_loss": -33.12482833862305, "global_step": 37308, "epoch": 308} {"train_loss": -32.4152946472168, "global_step": 37309, "epoch": 308} {"train_loss": -30.310155868530273, "global_step": 37310, "epoch": 308} {"train_loss": -30.060956954956055, "global_step": 37311, "epoch": 308} {"train_loss": -28.876785278320312, "global_step": 37312, "epoch": 308} {"train_loss": -32.327693939208984, "global_step": 37313, "epoch": 308} {"train_loss": -32.67464828491211, "global_step": 37314, "epoch": 308} {"train_loss": -31.471784591674805, "global_step": 37315, "epoch": 308} {"train_loss": -32.84938430786133, "global_step": 37316, "epoch": 308} {"train_loss": -32.72970199584961, "global_step": 37317, "epoch": 308} {"train_loss": -32.43746566772461, "global_step": 37318, "epoch": 308} {"train_loss": -32.37320327758789, "global_step": 37319, "epoch": 308} {"train_loss": -32.865394592285156, "global_step": 37320, "epoch": 308} {"train_loss": -33.6699104309082, "global_step": 37321, "epoch": 308} {"train_loss": -32.09999465942383, "global_step": 37322, "epoch": 308} {"train_loss": -33.19306182861328, "global_step": 37323, "epoch": 308} {"train_loss": -32.825538635253906, "global_step": 37324, "epoch": 308} {"train_loss": -33.148433685302734, "global_step": 37325, "epoch": 308} {"train_loss": -33.37002182006836, "global_step": 37326, "epoch": 308} {"train_loss": -33.37736511230469, "global_step": 37327, "epoch": 308} {"train_loss": -33.02643585205078, "global_step": 37328, "epoch": 308} {"train_loss": -33.41962814331055, "global_step": 37329, "epoch": 308} {"train_loss": -33.11305618286133, "global_step": 37330, "epoch": 308} {"train_loss": -33.66633224487305, "global_step": 37331, "epoch": 308} {"train_loss": -32.9200553894043, "global_step": 37332, "epoch": 308} {"train_loss": -32.877906799316406, "global_step": 37333, "epoch": 308} {"train_loss": -33.246864318847656, "global_step": 37334, "epoch": 308} {"train_loss": -33.29423141479492, "global_step": 37335, "epoch": 308} {"train_loss": -34.0831413269043, "global_step": 37336, "epoch": 308} {"train_loss": -33.25696563720703, "global_step": 37337, "epoch": 308} {"train_loss": -33.02350997924805, "global_step": 37338, "epoch": 308} {"train_loss": -33.17696762084961, "global_step": 37339, "epoch": 308} {"train_loss": -34.261837005615234, "global_step": 37340, "epoch": 308} {"train_loss": -33.013160705566406, "global_step": 37341, "epoch": 308} {"train_loss": -33.296199798583984, "global_step": 37342, "epoch": 308} {"train_loss": -33.70064163208008, "global_step": 37343, "epoch": 308} {"train_loss": -33.728797912597656, "global_step": 37344, "epoch": 308} {"train_loss": -33.76702117919922, "global_step": 37345, "epoch": 308} {"train_loss": -33.680633544921875, "global_step": 37346, "epoch": 308} {"train_loss": -33.55332946777344, "global_step": 37347, "epoch": 308} {"train_loss": -33.64814376831055, "global_step": 37348, "epoch": 308} {"train_loss": -34.04335403442383, "global_step": 37349, "epoch": 308} {"train_loss": -34.454158782958984, "global_step": 37350, "epoch": 308} {"train_loss": -33.4130859375, "global_step": 37351, "epoch": 308} {"train_loss": -33.32143783569336, "global_step": 37352, "epoch": 308} {"train_loss": -33.11478042602539, "global_step": 37353, "epoch": 308} {"train_loss": -33.36670684814453, "global_step": 37354, "epoch": 308} {"train_loss": -33.85467529296875, "global_step": 37355, "epoch": 308} {"train_loss": -33.5504264831543, "global_step": 37356, "epoch": 308} {"train_loss": -33.7928581237793, "global_step": 37357, "epoch": 308} {"train_loss": -32.81507110595703, "global_step": 37358, "epoch": 308} {"train_loss": -33.274314880371094, "global_step": 37359, "epoch": 308} {"train_loss": -34.21346664428711, "global_step": 37360, "epoch": 308} {"train_loss": -33.79612350463867, "global_step": 37361, "epoch": 308} {"train_loss": -33.30290603637695, "global_step": 37362, "epoch": 308} {"train_loss": -32.831398010253906, "global_step": 37363, "epoch": 308} {"train_loss": -33.5472526550293, "global_step": 37364, "epoch": 308} {"train_loss": -33.72538375854492, "global_step": 37365, "epoch": 308} {"train_loss": -33.7846565246582, "global_step": 37366, "epoch": 308} {"train_loss": -33.28998947143555, "global_step": 37367, "epoch": 308} {"train_loss": -34.223628997802734, "global_step": 37368, "epoch": 308} {"train_loss": -33.63783264160156, "global_step": 37369, "epoch": 308} {"train_loss": -34.08662796020508, "global_step": 37370, "epoch": 308} {"train_loss": -34.1596565246582, "global_step": 37371, "epoch": 308} {"train_loss": -34.15678024291992, "global_step": 37372, "epoch": 308} {"train_loss": -33.98014450073242, "global_step": 37373, "epoch": 308} {"train_loss": -33.95808029174805, "global_step": 37374, "epoch": 308} {"train_loss": -33.15838623046875, "global_step": 37375, "epoch": 308} {"train_loss": -34.38574981689453, "global_step": 37376, "epoch": 308} {"train_loss": -33.201698303222656, "global_step": 37377, "epoch": 308} {"train_loss": -34.15998077392578, "global_step": 37378, "epoch": 308} {"train_loss": -34.328460693359375, "global_step": 37379, "epoch": 308} {"train_loss": -34.544044494628906, "global_step": 37380, "epoch": 308} {"train_loss": -34.14585494995117, "global_step": 37381, "epoch": 308} {"train_loss": -33.79907989501953, "global_step": 37382, "epoch": 308} {"train_loss": -34.0727653503418, "global_step": 37383, "epoch": 308} {"train_loss": -33.93804931640625, "global_step": 37384, "epoch": 308} {"train_loss": -33.52443313598633, "global_step": 37385, "epoch": 308} {"train_loss": -34.39616012573242, "global_step": 37386, "epoch": 308} {"train_loss": -34.330230712890625, "global_step": 37387, "epoch": 308} {"train_loss": -33.17660856641029, "global_step": 37388, "epoch": 308, "val_loss": 2639967.0} {"train_loss": -34.332603454589844, "global_step": 37389, "epoch": 309} {"train_loss": -34.10211181640625, "global_step": 37390, "epoch": 309} {"train_loss": -33.95027542114258, "global_step": 37391, "epoch": 309} {"train_loss": -33.86623001098633, "global_step": 37392, "epoch": 309} {"train_loss": -33.93653106689453, "global_step": 37393, "epoch": 309} {"train_loss": -34.41679000854492, "global_step": 37394, "epoch": 309} {"train_loss": -34.76697540283203, "global_step": 37395, "epoch": 309} {"train_loss": -34.29627227783203, "global_step": 37396, "epoch": 309} {"train_loss": -33.899024963378906, "global_step": 37397, "epoch": 309} {"train_loss": -34.52144241333008, "global_step": 37398, "epoch": 309} {"train_loss": -34.60821533203125, "global_step": 37399, "epoch": 309} {"train_loss": -34.653377532958984, "global_step": 37400, "epoch": 309} {"train_loss": -34.5146484375, "global_step": 37401, "epoch": 309} {"train_loss": -33.87327194213867, "global_step": 37402, "epoch": 309} {"train_loss": -33.7247200012207, "global_step": 37403, "epoch": 309} {"train_loss": -34.21295166015625, "global_step": 37404, "epoch": 309} {"train_loss": -32.29863357543945, "global_step": 37405, "epoch": 309} {"train_loss": -30.462121963500977, "global_step": 37406, "epoch": 309} {"train_loss": -23.062063217163086, "global_step": 37407, "epoch": 309} {"train_loss": -7.396331787109375, "global_step": 37408, "epoch": 309} {"train_loss": -10.026615142822266, "global_step": 37409, "epoch": 309} {"train_loss": -32.089595794677734, "global_step": 37410, "epoch": 309} {"train_loss": -20.223413467407227, "global_step": 37411, "epoch": 309} {"train_loss": -25.89512062072754, "global_step": 37412, "epoch": 309} {"train_loss": -21.90184211730957, "global_step": 37413, "epoch": 309} {"train_loss": -31.110061645507812, "global_step": 37414, "epoch": 309} {"train_loss": -26.38372230529785, "global_step": 37415, "epoch": 309} {"train_loss": -26.675373077392578, "global_step": 37416, "epoch": 309} {"train_loss": -31.340009689331055, "global_step": 37417, "epoch": 309} {"train_loss": -29.977407455444336, "global_step": 37418, "epoch": 309} {"train_loss": -27.377294540405273, "global_step": 37419, "epoch": 309} {"train_loss": -30.334272384643555, "global_step": 37420, "epoch": 309} {"train_loss": -31.752105712890625, "global_step": 37421, "epoch": 309} {"train_loss": -31.28376579284668, "global_step": 37422, "epoch": 309} {"train_loss": -30.576587677001953, "global_step": 37423, "epoch": 309} {"train_loss": -29.663013458251953, "global_step": 37424, "epoch": 309} {"train_loss": -31.531396865844727, "global_step": 37425, "epoch": 309} {"train_loss": -31.127704620361328, "global_step": 37426, "epoch": 309} {"train_loss": -31.794301986694336, "global_step": 37427, "epoch": 309} {"train_loss": -31.537687301635742, "global_step": 37428, "epoch": 309} {"train_loss": -30.7313289642334, "global_step": 37429, "epoch": 309} {"train_loss": -31.48103904724121, "global_step": 37430, "epoch": 309} {"train_loss": -31.360015869140625, "global_step": 37431, "epoch": 309} {"train_loss": -31.822345733642578, "global_step": 37432, "epoch": 309} {"train_loss": -31.791837692260742, "global_step": 37433, "epoch": 309} {"train_loss": -32.2971305847168, "global_step": 37434, "epoch": 309} {"train_loss": -32.133033752441406, "global_step": 37435, "epoch": 309} {"train_loss": -32.31147003173828, "global_step": 37436, "epoch": 309} {"train_loss": -32.17947006225586, "global_step": 37437, "epoch": 309} {"train_loss": -32.031272888183594, "global_step": 37438, "epoch": 309} {"train_loss": -32.10993576049805, "global_step": 37439, "epoch": 309} {"train_loss": -32.129940032958984, "global_step": 37440, "epoch": 309} {"train_loss": -32.20216751098633, "global_step": 37441, "epoch": 309} {"train_loss": -32.4222297668457, "global_step": 37442, "epoch": 309} {"train_loss": -32.53422164916992, "global_step": 37443, "epoch": 309} {"train_loss": -32.31643295288086, "global_step": 37444, "epoch": 309} {"train_loss": -32.49314880371094, "global_step": 37445, "epoch": 309} {"train_loss": -32.55592346191406, "global_step": 37446, "epoch": 309} {"train_loss": -32.95344161987305, "global_step": 37447, "epoch": 309} {"train_loss": -32.770320892333984, "global_step": 37448, "epoch": 309} {"train_loss": -32.684112548828125, "global_step": 37449, "epoch": 309} {"train_loss": -32.740169525146484, "global_step": 37450, "epoch": 309} {"train_loss": -32.4934196472168, "global_step": 37451, "epoch": 309} {"train_loss": -33.00068283081055, "global_step": 37452, "epoch": 309} {"train_loss": -32.80725860595703, "global_step": 37453, "epoch": 309} {"train_loss": -33.07872009277344, "global_step": 37454, "epoch": 309} {"train_loss": -33.03186798095703, "global_step": 37455, "epoch": 309} {"train_loss": -33.211910247802734, "global_step": 37456, "epoch": 309} {"train_loss": -33.1168212890625, "global_step": 37457, "epoch": 309} {"train_loss": -33.440242767333984, "global_step": 37458, "epoch": 309} {"train_loss": -33.616249084472656, "global_step": 37459, "epoch": 309} {"train_loss": -33.47307586669922, "global_step": 37460, "epoch": 309} {"train_loss": -33.51218795776367, "global_step": 37461, "epoch": 309} {"train_loss": -32.963226318359375, "global_step": 37462, "epoch": 309} {"train_loss": -32.893978118896484, "global_step": 37463, "epoch": 309} {"train_loss": -32.83256149291992, "global_step": 37464, "epoch": 309} {"train_loss": -32.74276351928711, "global_step": 37465, "epoch": 309} {"train_loss": -33.52090072631836, "global_step": 37466, "epoch": 309} {"train_loss": -33.51093292236328, "global_step": 37467, "epoch": 309} {"train_loss": -33.10177230834961, "global_step": 37468, "epoch": 309} {"train_loss": -33.480709075927734, "global_step": 37469, "epoch": 309} {"train_loss": -33.785926818847656, "global_step": 37470, "epoch": 309} {"train_loss": -32.8994026184082, "global_step": 37471, "epoch": 309} {"train_loss": -33.22751998901367, "global_step": 37472, "epoch": 309} {"train_loss": -33.68117904663086, "global_step": 37473, "epoch": 309} {"train_loss": -33.813961029052734, "global_step": 37474, "epoch": 309} {"train_loss": -33.144805908203125, "global_step": 37475, "epoch": 309} {"train_loss": -33.1942138671875, "global_step": 37476, "epoch": 309} {"train_loss": -30.98792839050293, "global_step": 37477, "epoch": 309} {"train_loss": -31.07330322265625, "global_step": 37478, "epoch": 309} {"train_loss": -28.404569625854492, "global_step": 37479, "epoch": 309} {"train_loss": -27.840192794799805, "global_step": 37480, "epoch": 309} {"train_loss": -29.687158584594727, "global_step": 37481, "epoch": 309} {"train_loss": -31.398962020874023, "global_step": 37482, "epoch": 309} {"train_loss": -29.5070858001709, "global_step": 37483, "epoch": 309} {"train_loss": -30.380529403686523, "global_step": 37484, "epoch": 309} {"train_loss": -31.00037956237793, "global_step": 37485, "epoch": 309} {"train_loss": -29.559280395507812, "global_step": 37486, "epoch": 309} {"train_loss": -29.037750244140625, "global_step": 37487, "epoch": 309} {"train_loss": -30.77937889099121, "global_step": 37488, "epoch": 309} {"train_loss": -28.722333908081055, "global_step": 37489, "epoch": 309} {"train_loss": -28.287378311157227, "global_step": 37490, "epoch": 309} {"train_loss": -30.81272315979004, "global_step": 37491, "epoch": 309} {"train_loss": -29.285776138305664, "global_step": 37492, "epoch": 309} {"train_loss": -31.690698623657227, "global_step": 37493, "epoch": 309} {"train_loss": -30.640121459960938, "global_step": 37494, "epoch": 309} {"train_loss": -30.244577407836914, "global_step": 37495, "epoch": 309} {"train_loss": -30.406030654907227, "global_step": 37496, "epoch": 309} {"train_loss": -30.590368270874023, "global_step": 37497, "epoch": 309} {"train_loss": -31.124174118041992, "global_step": 37498, "epoch": 309} {"train_loss": -31.377103805541992, "global_step": 37499, "epoch": 309} {"train_loss": -31.40815544128418, "global_step": 37500, "epoch": 309} {"train_loss": -30.963287353515625, "global_step": 37501, "epoch": 309} {"train_loss": -31.40950584411621, "global_step": 37502, "epoch": 309} {"train_loss": -31.558828353881836, "global_step": 37503, "epoch": 309} {"train_loss": -31.73459815979004, "global_step": 37504, "epoch": 309} {"train_loss": -31.290456771850586, "global_step": 37505, "epoch": 309} {"train_loss": -31.45383071899414, "global_step": 37506, "epoch": 309} {"train_loss": -31.759153366088867, "global_step": 37507, "epoch": 309} {"train_loss": -31.780170440673828, "global_step": 37508, "epoch": 309} {"train_loss": -31.259142000813128, "global_step": 37509, "epoch": 309, "val_loss": 2629867.25} {"train_loss": -31.624557495117188, "global_step": 37510, "epoch": 310} {"train_loss": -31.780029296875, "global_step": 37511, "epoch": 310} {"train_loss": -32.454830169677734, "global_step": 37512, "epoch": 310} {"train_loss": -31.94775390625, "global_step": 37513, "epoch": 310} {"train_loss": -32.08376693725586, "global_step": 37514, "epoch": 310} {"train_loss": -32.07289505004883, "global_step": 37515, "epoch": 310} {"train_loss": -31.754302978515625, "global_step": 37516, "epoch": 310} {"train_loss": -32.06748580932617, "global_step": 37517, "epoch": 310} {"train_loss": -32.46438217163086, "global_step": 37518, "epoch": 310} {"train_loss": -32.440059661865234, "global_step": 37519, "epoch": 310} {"train_loss": -32.44131088256836, "global_step": 37520, "epoch": 310} {"train_loss": -32.59428787231445, "global_step": 37521, "epoch": 310} {"train_loss": -32.360042572021484, "global_step": 37522, "epoch": 310} {"train_loss": -31.69269371032715, "global_step": 37523, "epoch": 310} {"train_loss": -31.966543197631836, "global_step": 37524, "epoch": 310} {"train_loss": -30.360998153686523, "global_step": 37525, "epoch": 310} {"train_loss": -31.334396362304688, "global_step": 37526, "epoch": 310} {"train_loss": -31.512561798095703, "global_step": 37527, "epoch": 310} {"train_loss": -29.14356803894043, "global_step": 37528, "epoch": 310} {"train_loss": -30.597822189331055, "global_step": 37529, "epoch": 310} {"train_loss": -32.47889709472656, "global_step": 37530, "epoch": 310} {"train_loss": -31.14178466796875, "global_step": 37531, "epoch": 310} {"train_loss": -32.42585372924805, "global_step": 37532, "epoch": 310} {"train_loss": -31.690099716186523, "global_step": 37533, "epoch": 310} {"train_loss": -32.29244613647461, "global_step": 37534, "epoch": 310} {"train_loss": -32.4501953125, "global_step": 37535, "epoch": 310} {"train_loss": -31.88958740234375, "global_step": 37536, "epoch": 310} {"train_loss": -32.05604934692383, "global_step": 37537, "epoch": 310} {"train_loss": -31.599374771118164, "global_step": 37538, "epoch": 310} {"train_loss": -32.47149658203125, "global_step": 37539, "epoch": 310} {"train_loss": -32.681514739990234, "global_step": 37540, "epoch": 310} {"train_loss": -32.25661087036133, "global_step": 37541, "epoch": 310} {"train_loss": -33.11143112182617, "global_step": 37542, "epoch": 310} {"train_loss": -33.02400588989258, "global_step": 37543, "epoch": 310} {"train_loss": -32.824317932128906, "global_step": 37544, "epoch": 310} {"train_loss": -32.934661865234375, "global_step": 37545, "epoch": 310} {"train_loss": -33.65200424194336, "global_step": 37546, "epoch": 310} {"train_loss": -32.81385803222656, "global_step": 37547, "epoch": 310} {"train_loss": -33.21430587768555, "global_step": 37548, "epoch": 310} {"train_loss": -32.99303436279297, "global_step": 37549, "epoch": 310} {"train_loss": -33.3754768371582, "global_step": 37550, "epoch": 310} {"train_loss": -33.280120849609375, "global_step": 37551, "epoch": 310} {"train_loss": -33.321533203125, "global_step": 37552, "epoch": 310} {"train_loss": -33.30727767944336, "global_step": 37553, "epoch": 310} {"train_loss": -32.70541000366211, "global_step": 37554, "epoch": 310} {"train_loss": -29.079700469970703, "global_step": 37555, "epoch": 310} {"train_loss": -22.099464416503906, "global_step": 37556, "epoch": 310} {"train_loss": -22.34370994567871, "global_step": 37557, "epoch": 310} {"train_loss": -28.73089027404785, "global_step": 37558, "epoch": 310} {"train_loss": -32.5268669128418, "global_step": 37559, "epoch": 310} {"train_loss": -30.309213638305664, "global_step": 37560, "epoch": 310} {"train_loss": -32.394222259521484, "global_step": 37561, "epoch": 310} {"train_loss": -32.10979080200195, "global_step": 37562, "epoch": 310} {"train_loss": -32.763214111328125, "global_step": 37563, "epoch": 310} {"train_loss": -32.25386047363281, "global_step": 37564, "epoch": 310} {"train_loss": -33.279640197753906, "global_step": 37565, "epoch": 310} {"train_loss": -32.48061752319336, "global_step": 37566, "epoch": 310} {"train_loss": -33.060699462890625, "global_step": 37567, "epoch": 310} {"train_loss": -32.777923583984375, "global_step": 37568, "epoch": 310} {"train_loss": -32.241580963134766, "global_step": 37569, "epoch": 310} {"train_loss": -33.00163269042969, "global_step": 37570, "epoch": 310} {"train_loss": -33.22280502319336, "global_step": 37571, "epoch": 310} {"train_loss": -32.72100830078125, "global_step": 37572, "epoch": 310} {"train_loss": -33.36884307861328, "global_step": 37573, "epoch": 310} {"train_loss": -33.32463836669922, "global_step": 37574, "epoch": 310} {"train_loss": -33.13079833984375, "global_step": 37575, "epoch": 310} {"train_loss": -33.12406539916992, "global_step": 37576, "epoch": 310} {"train_loss": -33.398189544677734, "global_step": 37577, "epoch": 310} {"train_loss": -33.41374969482422, "global_step": 37578, "epoch": 310} {"train_loss": -32.90903854370117, "global_step": 37579, "epoch": 310} {"train_loss": -33.16679763793945, "global_step": 37580, "epoch": 310} {"train_loss": -33.785614013671875, "global_step": 37581, "epoch": 310} {"train_loss": -33.25189971923828, "global_step": 37582, "epoch": 310} {"train_loss": -33.420650482177734, "global_step": 37583, "epoch": 310} {"train_loss": -33.49606704711914, "global_step": 37584, "epoch": 310} {"train_loss": -33.41813278198242, "global_step": 37585, "epoch": 310} {"train_loss": -33.72220993041992, "global_step": 37586, "epoch": 310} {"train_loss": -33.43248748779297, "global_step": 37587, "epoch": 310} {"train_loss": -33.55792999267578, "global_step": 37588, "epoch": 310} {"train_loss": -33.18387985229492, "global_step": 37589, "epoch": 310} {"train_loss": -33.61942672729492, "global_step": 37590, "epoch": 310} {"train_loss": -33.638938903808594, "global_step": 37591, "epoch": 310} {"train_loss": -33.7513427734375, "global_step": 37592, "epoch": 310} {"train_loss": -33.70904541015625, "global_step": 37593, "epoch": 310} {"train_loss": -33.72657012939453, "global_step": 37594, "epoch": 310} {"train_loss": -33.51134490966797, "global_step": 37595, "epoch": 310} {"train_loss": -34.024574279785156, "global_step": 37596, "epoch": 310} {"train_loss": -33.86274337768555, "global_step": 37597, "epoch": 310} {"train_loss": -33.4993782043457, "global_step": 37598, "epoch": 310} {"train_loss": -32.94563674926758, "global_step": 37599, "epoch": 310} {"train_loss": -32.79793167114258, "global_step": 37600, "epoch": 310} {"train_loss": -31.172168731689453, "global_step": 37601, "epoch": 310} {"train_loss": -28.836023330688477, "global_step": 37602, "epoch": 310} {"train_loss": -28.90423583984375, "global_step": 37603, "epoch": 310} {"train_loss": -29.3421688079834, "global_step": 37604, "epoch": 310} {"train_loss": -32.38688278198242, "global_step": 37605, "epoch": 310} {"train_loss": -33.19636154174805, "global_step": 37606, "epoch": 310} {"train_loss": -31.847644805908203, "global_step": 37607, "epoch": 310} {"train_loss": -31.350727081298828, "global_step": 37608, "epoch": 310} {"train_loss": -31.81760597229004, "global_step": 37609, "epoch": 310} {"train_loss": -30.600683212280273, "global_step": 37610, "epoch": 310} {"train_loss": -27.600574493408203, "global_step": 37611, "epoch": 310} {"train_loss": -27.264453887939453, "global_step": 37612, "epoch": 310} {"train_loss": -28.34683609008789, "global_step": 37613, "epoch": 310} {"train_loss": -32.492034912109375, "global_step": 37614, "epoch": 310} {"train_loss": -30.734785079956055, "global_step": 37615, "epoch": 310} {"train_loss": -32.829280853271484, "global_step": 37616, "epoch": 310} {"train_loss": -31.176549911499023, "global_step": 37617, "epoch": 310} {"train_loss": -33.00075912475586, "global_step": 37618, "epoch": 310} {"train_loss": -31.132888793945312, "global_step": 37619, "epoch": 310} {"train_loss": -32.78644561767578, "global_step": 37620, "epoch": 310} {"train_loss": -31.825708389282227, "global_step": 37621, "epoch": 310} {"train_loss": -32.19021224975586, "global_step": 37622, "epoch": 310} {"train_loss": -32.12030029296875, "global_step": 37623, "epoch": 310} {"train_loss": -31.454870223999023, "global_step": 37624, "epoch": 310} {"train_loss": -32.12302780151367, "global_step": 37625, "epoch": 310} {"train_loss": -32.3682975769043, "global_step": 37626, "epoch": 310} {"train_loss": -32.46029281616211, "global_step": 37627, "epoch": 310} {"train_loss": -33.11083984375, "global_step": 37628, "epoch": 310} {"train_loss": -32.60288619995117, "global_step": 37629, "epoch": 310} {"train_loss": -32.1022422096946, "global_step": 37630, "epoch": 310, "val_loss": 2668730.0} {"train_loss": -32.66682815551758, "global_step": 37631, "epoch": 311} {"train_loss": -32.80127716064453, "global_step": 37632, "epoch": 311} {"train_loss": -32.6434440612793, "global_step": 37633, "epoch": 311} {"train_loss": -33.1702995300293, "global_step": 37634, "epoch": 311} {"train_loss": -33.13100051879883, "global_step": 37635, "epoch": 311} {"train_loss": -32.928890228271484, "global_step": 37636, "epoch": 311} {"train_loss": -32.95493698120117, "global_step": 37637, "epoch": 311} {"train_loss": -32.95085144042969, "global_step": 37638, "epoch": 311} {"train_loss": -33.51358413696289, "global_step": 37639, "epoch": 311} {"train_loss": -33.286067962646484, "global_step": 37640, "epoch": 311} {"train_loss": -33.08423614501953, "global_step": 37641, "epoch": 311} {"train_loss": -33.55152130126953, "global_step": 37642, "epoch": 311} {"train_loss": -33.50905990600586, "global_step": 37643, "epoch": 311} {"train_loss": -33.50322341918945, "global_step": 37644, "epoch": 311} {"train_loss": -33.50971603393555, "global_step": 37645, "epoch": 311} {"train_loss": -33.73543930053711, "global_step": 37646, "epoch": 311} {"train_loss": -33.397674560546875, "global_step": 37647, "epoch": 311} {"train_loss": -33.86264419555664, "global_step": 37648, "epoch": 311} {"train_loss": -33.697261810302734, "global_step": 37649, "epoch": 311} {"train_loss": -33.72555160522461, "global_step": 37650, "epoch": 311} {"train_loss": -33.8885612487793, "global_step": 37651, "epoch": 311} {"train_loss": -33.715152740478516, "global_step": 37652, "epoch": 311} {"train_loss": -33.809967041015625, "global_step": 37653, "epoch": 311} {"train_loss": -33.58087158203125, "global_step": 37654, "epoch": 311} {"train_loss": -33.52712631225586, "global_step": 37655, "epoch": 311} {"train_loss": -33.773738861083984, "global_step": 37656, "epoch": 311} {"train_loss": -33.9538688659668, "global_step": 37657, "epoch": 311} {"train_loss": -34.22574234008789, "global_step": 37658, "epoch": 311} {"train_loss": -33.90052032470703, "global_step": 37659, "epoch": 311} {"train_loss": -34.003170013427734, "global_step": 37660, "epoch": 311} {"train_loss": -33.87650680541992, "global_step": 37661, "epoch": 311} {"train_loss": -34.29011917114258, "global_step": 37662, "epoch": 311} {"train_loss": -34.1515007019043, "global_step": 37663, "epoch": 311} {"train_loss": -34.05544662475586, "global_step": 37664, "epoch": 311} {"train_loss": -34.04494857788086, "global_step": 37665, "epoch": 311} {"train_loss": -34.00733947753906, "global_step": 37666, "epoch": 311} {"train_loss": -34.31376266479492, "global_step": 37667, "epoch": 311} {"train_loss": -33.65620040893555, "global_step": 37668, "epoch": 311} {"train_loss": -33.3375129699707, "global_step": 37669, "epoch": 311} {"train_loss": -33.471248626708984, "global_step": 37670, "epoch": 311} {"train_loss": -33.812599182128906, "global_step": 37671, "epoch": 311} {"train_loss": -34.24416732788086, "global_step": 37672, "epoch": 311} {"train_loss": -32.539390563964844, "global_step": 37673, "epoch": 311} {"train_loss": -33.85095977783203, "global_step": 37674, "epoch": 311} {"train_loss": -33.45960998535156, "global_step": 37675, "epoch": 311} {"train_loss": -33.5573844909668, "global_step": 37676, "epoch": 311} {"train_loss": -34.29655838012695, "global_step": 37677, "epoch": 311} {"train_loss": -33.498870849609375, "global_step": 37678, "epoch": 311} {"train_loss": -33.99192428588867, "global_step": 37679, "epoch": 311} {"train_loss": -33.61361312866211, "global_step": 37680, "epoch": 311} {"train_loss": -33.74390411376953, "global_step": 37681, "epoch": 311} {"train_loss": -34.33340072631836, "global_step": 37682, "epoch": 311} {"train_loss": -33.676021575927734, "global_step": 37683, "epoch": 311} {"train_loss": -34.208251953125, "global_step": 37684, "epoch": 311} {"train_loss": -34.14994430541992, "global_step": 37685, "epoch": 311} {"train_loss": -34.150943756103516, "global_step": 37686, "epoch": 311} {"train_loss": -33.984169006347656, "global_step": 37687, "epoch": 311} {"train_loss": -34.297237396240234, "global_step": 37688, "epoch": 311} {"train_loss": -34.56758499145508, "global_step": 37689, "epoch": 311} {"train_loss": -34.37032699584961, "global_step": 37690, "epoch": 311} {"train_loss": -34.45180892944336, "global_step": 37691, "epoch": 311} {"train_loss": -34.52991485595703, "global_step": 37692, "epoch": 311} {"train_loss": -34.269691467285156, "global_step": 37693, "epoch": 311} {"train_loss": -34.05085372924805, "global_step": 37694, "epoch": 311} {"train_loss": -34.048309326171875, "global_step": 37695, "epoch": 311} {"train_loss": -34.1696891784668, "global_step": 37696, "epoch": 311} {"train_loss": -33.08597946166992, "global_step": 37697, "epoch": 311} {"train_loss": -33.94757080078125, "global_step": 37698, "epoch": 311} {"train_loss": -33.4694938659668, "global_step": 37699, "epoch": 311} {"train_loss": -33.33994674682617, "global_step": 37700, "epoch": 311} {"train_loss": -33.24238204956055, "global_step": 37701, "epoch": 311} {"train_loss": -34.20166778564453, "global_step": 37702, "epoch": 311} {"train_loss": -34.278621673583984, "global_step": 37703, "epoch": 311} {"train_loss": -34.349605560302734, "global_step": 37704, "epoch": 311} {"train_loss": -34.57817459106445, "global_step": 37705, "epoch": 311} {"train_loss": -33.570343017578125, "global_step": 37706, "epoch": 311} {"train_loss": -32.6668701171875, "global_step": 37707, "epoch": 311} {"train_loss": -34.66929626464844, "global_step": 37708, "epoch": 311} {"train_loss": -34.044307708740234, "global_step": 37709, "epoch": 311} {"train_loss": -34.23574447631836, "global_step": 37710, "epoch": 311} {"train_loss": -34.00962448120117, "global_step": 37711, "epoch": 311} {"train_loss": -34.06791305541992, "global_step": 37712, "epoch": 311} {"train_loss": -32.19382858276367, "global_step": 37713, "epoch": 311} {"train_loss": -33.307044982910156, "global_step": 37714, "epoch": 311} {"train_loss": -31.6531925201416, "global_step": 37715, "epoch": 311} {"train_loss": -31.615798950195312, "global_step": 37716, "epoch": 311} {"train_loss": -29.794763565063477, "global_step": 37717, "epoch": 311} {"train_loss": -27.09735679626465, "global_step": 37718, "epoch": 311} {"train_loss": -19.189455032348633, "global_step": 37719, "epoch": 311} {"train_loss": -11.31843090057373, "global_step": 37720, "epoch": 311} {"train_loss": -19.757810592651367, "global_step": 37721, "epoch": 311} {"train_loss": -31.218103408813477, "global_step": 37722, "epoch": 311} {"train_loss": -24.30329704284668, "global_step": 37723, "epoch": 311} {"train_loss": -31.764148712158203, "global_step": 37724, "epoch": 311} {"train_loss": -27.1984920501709, "global_step": 37725, "epoch": 311} {"train_loss": -32.1014518737793, "global_step": 37726, "epoch": 311} {"train_loss": -30.341720581054688, "global_step": 37727, "epoch": 311} {"train_loss": -29.696659088134766, "global_step": 37728, "epoch": 311} {"train_loss": -32.678890228271484, "global_step": 37729, "epoch": 311} {"train_loss": -31.74845314025879, "global_step": 37730, "epoch": 311} {"train_loss": -30.596485137939453, "global_step": 37731, "epoch": 311} {"train_loss": -30.901077270507812, "global_step": 37732, "epoch": 311} {"train_loss": -32.0095329284668, "global_step": 37733, "epoch": 311} {"train_loss": -30.553268432617188, "global_step": 37734, "epoch": 311} {"train_loss": -31.86002540588379, "global_step": 37735, "epoch": 311} {"train_loss": -32.398841857910156, "global_step": 37736, "epoch": 311} {"train_loss": -30.67628288269043, "global_step": 37737, "epoch": 311} {"train_loss": -30.715646743774414, "global_step": 37738, "epoch": 311} {"train_loss": -32.49951934814453, "global_step": 37739, "epoch": 311} {"train_loss": -32.114410400390625, "global_step": 37740, "epoch": 311} {"train_loss": -32.69808578491211, "global_step": 37741, "epoch": 311} {"train_loss": -32.174583435058594, "global_step": 37742, "epoch": 311} {"train_loss": -32.17150115966797, "global_step": 37743, "epoch": 311} {"train_loss": -32.68978500366211, "global_step": 37744, "epoch": 311} {"train_loss": -32.19948196411133, "global_step": 37745, "epoch": 311} {"train_loss": -32.2662239074707, "global_step": 37746, "epoch": 311} {"train_loss": -32.39037322998047, "global_step": 37747, "epoch": 311} {"train_loss": -32.475406646728516, "global_step": 37748, "epoch": 311} {"train_loss": -32.92246627807617, "global_step": 37749, "epoch": 311} {"train_loss": -32.92783737182617, "global_step": 37750, "epoch": 311} {"train_loss": -32.62413515926393, "global_step": 37751, "epoch": 311, "val_loss": 2499752.75} {"train_loss": -32.725406646728516, "global_step": 37752, "epoch": 312} {"train_loss": -32.91664123535156, "global_step": 37753, "epoch": 312} {"train_loss": -32.97909164428711, "global_step": 37754, "epoch": 312} {"train_loss": -32.185302734375, "global_step": 37755, "epoch": 312} {"train_loss": -33.06098175048828, "global_step": 37756, "epoch": 312} {"train_loss": -33.23927688598633, "global_step": 37757, "epoch": 312} {"train_loss": -32.86393356323242, "global_step": 37758, "epoch": 312} {"train_loss": -32.615535736083984, "global_step": 37759, "epoch": 312} {"train_loss": -32.99257278442383, "global_step": 37760, "epoch": 312} {"train_loss": -33.25569152832031, "global_step": 37761, "epoch": 312} {"train_loss": -33.12034225463867, "global_step": 37762, "epoch": 312} {"train_loss": -33.45038986206055, "global_step": 37763, "epoch": 312} {"train_loss": -33.80717849731445, "global_step": 37764, "epoch": 312} {"train_loss": -33.04995346069336, "global_step": 37765, "epoch": 312} {"train_loss": -32.75763702392578, "global_step": 37766, "epoch": 312} {"train_loss": -33.02173614501953, "global_step": 37767, "epoch": 312} {"train_loss": -33.26300811767578, "global_step": 37768, "epoch": 312} {"train_loss": -32.583457946777344, "global_step": 37769, "epoch": 312} {"train_loss": -33.09356689453125, "global_step": 37770, "epoch": 312} {"train_loss": -33.49684524536133, "global_step": 37771, "epoch": 312} {"train_loss": -33.70402526855469, "global_step": 37772, "epoch": 312} {"train_loss": -33.6364860534668, "global_step": 37773, "epoch": 312} {"train_loss": -33.71424102783203, "global_step": 37774, "epoch": 312} {"train_loss": -33.473838806152344, "global_step": 37775, "epoch": 312} {"train_loss": -33.837318420410156, "global_step": 37776, "epoch": 312} {"train_loss": -33.72220993041992, "global_step": 37777, "epoch": 312} {"train_loss": -33.94934844970703, "global_step": 37778, "epoch": 312} {"train_loss": -33.57427978515625, "global_step": 37779, "epoch": 312} {"train_loss": -33.02427291870117, "global_step": 37780, "epoch": 312} {"train_loss": -32.924781799316406, "global_step": 37781, "epoch": 312} {"train_loss": -34.194393157958984, "global_step": 37782, "epoch": 312} {"train_loss": -34.08059310913086, "global_step": 37783, "epoch": 312} {"train_loss": -33.586891174316406, "global_step": 37784, "epoch": 312} {"train_loss": -34.335514068603516, "global_step": 37785, "epoch": 312} {"train_loss": -33.818721771240234, "global_step": 37786, "epoch": 312} {"train_loss": -34.057003021240234, "global_step": 37787, "epoch": 312} {"train_loss": -33.41978073120117, "global_step": 37788, "epoch": 312} {"train_loss": -33.52156448364258, "global_step": 37789, "epoch": 312} {"train_loss": -34.021629333496094, "global_step": 37790, "epoch": 312} {"train_loss": -32.85698318481445, "global_step": 37791, "epoch": 312} {"train_loss": -31.76145362854004, "global_step": 37792, "epoch": 312} {"train_loss": -31.029434204101562, "global_step": 37793, "epoch": 312} {"train_loss": -29.604278564453125, "global_step": 37794, "epoch": 312} {"train_loss": -29.264867782592773, "global_step": 37795, "epoch": 312} {"train_loss": -31.270963668823242, "global_step": 37796, "epoch": 312} {"train_loss": -33.37575149536133, "global_step": 37797, "epoch": 312} {"train_loss": -31.988037109375, "global_step": 37798, "epoch": 312} {"train_loss": -32.88666534423828, "global_step": 37799, "epoch": 312} {"train_loss": -33.46500778198242, "global_step": 37800, "epoch": 312} {"train_loss": -32.35465621948242, "global_step": 37801, "epoch": 312} {"train_loss": -32.65143966674805, "global_step": 37802, "epoch": 312} {"train_loss": -31.71782875061035, "global_step": 37803, "epoch": 312} {"train_loss": -33.17003631591797, "global_step": 37804, "epoch": 312} {"train_loss": -32.70061111450195, "global_step": 37805, "epoch": 312} {"train_loss": -32.870155334472656, "global_step": 37806, "epoch": 312} {"train_loss": -32.631309509277344, "global_step": 37807, "epoch": 312} {"train_loss": -32.055335998535156, "global_step": 37808, "epoch": 312} {"train_loss": -32.86439514160156, "global_step": 37809, "epoch": 312} {"train_loss": -32.90769577026367, "global_step": 37810, "epoch": 312} {"train_loss": -31.421545028686523, "global_step": 37811, "epoch": 312} {"train_loss": -28.287113189697266, "global_step": 37812, "epoch": 312} {"train_loss": -32.99675750732422, "global_step": 37813, "epoch": 312} {"train_loss": -31.09639549255371, "global_step": 37814, "epoch": 312} {"train_loss": -30.585285186767578, "global_step": 37815, "epoch": 312} {"train_loss": -28.465803146362305, "global_step": 37816, "epoch": 312} {"train_loss": -31.814199447631836, "global_step": 37817, "epoch": 312} {"train_loss": -27.677927017211914, "global_step": 37818, "epoch": 312} {"train_loss": -30.802978515625, "global_step": 37819, "epoch": 312} {"train_loss": -31.0037841796875, "global_step": 37820, "epoch": 312} {"train_loss": -31.849990844726562, "global_step": 37821, "epoch": 312} {"train_loss": -31.8968563079834, "global_step": 37822, "epoch": 312} {"train_loss": -26.34083366394043, "global_step": 37823, "epoch": 312} {"train_loss": -30.020416259765625, "global_step": 37824, "epoch": 312} {"train_loss": -30.925390243530273, "global_step": 37825, "epoch": 312} {"train_loss": -30.553028106689453, "global_step": 37826, "epoch": 312} {"train_loss": -27.804550170898438, "global_step": 37827, "epoch": 312} {"train_loss": -27.753131866455078, "global_step": 37828, "epoch": 312} {"train_loss": -31.4671630859375, "global_step": 37829, "epoch": 312} {"train_loss": -31.213184356689453, "global_step": 37830, "epoch": 312} {"train_loss": -31.263513565063477, "global_step": 37831, "epoch": 312} {"train_loss": -29.9207706451416, "global_step": 37832, "epoch": 312} {"train_loss": -30.864288330078125, "global_step": 37833, "epoch": 312} {"train_loss": -30.253026962280273, "global_step": 37834, "epoch": 312} {"train_loss": -31.302001953125, "global_step": 37835, "epoch": 312} {"train_loss": -31.13234519958496, "global_step": 37836, "epoch": 312} {"train_loss": -30.991079330444336, "global_step": 37837, "epoch": 312} {"train_loss": -31.404342651367188, "global_step": 37838, "epoch": 312} {"train_loss": -31.137588500976562, "global_step": 37839, "epoch": 312} {"train_loss": -31.021350860595703, "global_step": 37840, "epoch": 312} {"train_loss": -31.939228057861328, "global_step": 37841, "epoch": 312} {"train_loss": -31.42561149597168, "global_step": 37842, "epoch": 312} {"train_loss": -31.951990127563477, "global_step": 37843, "epoch": 312} {"train_loss": -31.992502212524414, "global_step": 37844, "epoch": 312} {"train_loss": -31.901569366455078, "global_step": 37845, "epoch": 312} {"train_loss": -31.913105010986328, "global_step": 37846, "epoch": 312} {"train_loss": -31.999378204345703, "global_step": 37847, "epoch": 312} {"train_loss": -31.338871002197266, "global_step": 37848, "epoch": 312} {"train_loss": -32.12992477416992, "global_step": 37849, "epoch": 312} {"train_loss": -32.178951263427734, "global_step": 37850, "epoch": 312} {"train_loss": -31.737201690673828, "global_step": 37851, "epoch": 312} {"train_loss": -32.31244659423828, "global_step": 37852, "epoch": 312} {"train_loss": -32.46608352661133, "global_step": 37853, "epoch": 312} {"train_loss": -32.603214263916016, "global_step": 37854, "epoch": 312} {"train_loss": -32.15232467651367, "global_step": 37855, "epoch": 312} {"train_loss": -32.329437255859375, "global_step": 37856, "epoch": 312} {"train_loss": -32.65913009643555, "global_step": 37857, "epoch": 312} {"train_loss": -32.5139045715332, "global_step": 37858, "epoch": 312} {"train_loss": -32.92774200439453, "global_step": 37859, "epoch": 312} {"train_loss": -33.2026481628418, "global_step": 37860, "epoch": 312} {"train_loss": -32.71843338012695, "global_step": 37861, "epoch": 312} {"train_loss": -32.78367233276367, "global_step": 37862, "epoch": 312} {"train_loss": -32.5838508605957, "global_step": 37863, "epoch": 312} {"train_loss": -33.0875358581543, "global_step": 37864, "epoch": 312} {"train_loss": -32.41433334350586, "global_step": 37865, "epoch": 312} {"train_loss": -32.6722297668457, "global_step": 37866, "epoch": 312} {"train_loss": -32.7237434387207, "global_step": 37867, "epoch": 312} {"train_loss": -32.08626937866211, "global_step": 37868, "epoch": 312} {"train_loss": -32.626747131347656, "global_step": 37869, "epoch": 312} {"train_loss": -33.4359130859375, "global_step": 37870, "epoch": 312} {"train_loss": -33.27129364013672, "global_step": 37871, "epoch": 312} {"train_loss": -32.18723246676863, "global_step": 37872, "epoch": 312, "val_loss": 2582191.5} {"train_loss": -31.93035888671875, "global_step": 37873, "epoch": 313} {"train_loss": -30.121967315673828, "global_step": 37874, "epoch": 313} {"train_loss": -27.97922134399414, "global_step": 37875, "epoch": 313} {"train_loss": -30.286609649658203, "global_step": 37876, "epoch": 313} {"train_loss": -32.44961929321289, "global_step": 37877, "epoch": 313} {"train_loss": -32.68111038208008, "global_step": 37878, "epoch": 313} {"train_loss": -32.922298431396484, "global_step": 37879, "epoch": 313} {"train_loss": -32.72751998901367, "global_step": 37880, "epoch": 313} {"train_loss": -33.30119705200195, "global_step": 37881, "epoch": 313} {"train_loss": -33.269195556640625, "global_step": 37882, "epoch": 313} {"train_loss": -33.590816497802734, "global_step": 37883, "epoch": 313} {"train_loss": -33.262306213378906, "global_step": 37884, "epoch": 313} {"train_loss": -33.31354904174805, "global_step": 37885, "epoch": 313} {"train_loss": -33.36417770385742, "global_step": 37886, "epoch": 313} {"train_loss": -32.967533111572266, "global_step": 37887, "epoch": 313} {"train_loss": -33.63402557373047, "global_step": 37888, "epoch": 313} {"train_loss": -32.647212982177734, "global_step": 37889, "epoch": 313} {"train_loss": -33.419525146484375, "global_step": 37890, "epoch": 313} {"train_loss": -34.054656982421875, "global_step": 37891, "epoch": 313} {"train_loss": -33.518062591552734, "global_step": 37892, "epoch": 313} {"train_loss": -32.977046966552734, "global_step": 37893, "epoch": 313} {"train_loss": -33.85398483276367, "global_step": 37894, "epoch": 313} {"train_loss": -34.06129455566406, "global_step": 37895, "epoch": 313} {"train_loss": -33.40351867675781, "global_step": 37896, "epoch": 313} {"train_loss": -34.40669631958008, "global_step": 37897, "epoch": 313} {"train_loss": -33.2412223815918, "global_step": 37898, "epoch": 313} {"train_loss": -34.357723236083984, "global_step": 37899, "epoch": 313} {"train_loss": -34.02688217163086, "global_step": 37900, "epoch": 313} {"train_loss": -34.358333587646484, "global_step": 37901, "epoch": 313} {"train_loss": -34.030120849609375, "global_step": 37902, "epoch": 313} {"train_loss": -34.30385208129883, "global_step": 37903, "epoch": 313} {"train_loss": -33.89243698120117, "global_step": 37904, "epoch": 313} {"train_loss": -34.695457458496094, "global_step": 37905, "epoch": 313} {"train_loss": -34.31427001953125, "global_step": 37906, "epoch": 313} {"train_loss": -34.75304412841797, "global_step": 37907, "epoch": 313} {"train_loss": -34.292449951171875, "global_step": 37908, "epoch": 313} {"train_loss": -34.45845031738281, "global_step": 37909, "epoch": 313} {"train_loss": -34.63057327270508, "global_step": 37910, "epoch": 313} {"train_loss": -34.044586181640625, "global_step": 37911, "epoch": 313} {"train_loss": -34.099395751953125, "global_step": 37912, "epoch": 313} {"train_loss": -32.70866775512695, "global_step": 37913, "epoch": 313} {"train_loss": -32.49911117553711, "global_step": 37914, "epoch": 313} {"train_loss": -34.473812103271484, "global_step": 37915, "epoch": 313} {"train_loss": -32.19842529296875, "global_step": 37916, "epoch": 313} {"train_loss": -33.6811408996582, "global_step": 37917, "epoch": 313} {"train_loss": -32.111961364746094, "global_step": 37918, "epoch": 313} {"train_loss": -34.02899169921875, "global_step": 37919, "epoch": 313} {"train_loss": -33.22287368774414, "global_step": 37920, "epoch": 313} {"train_loss": -32.2856559753418, "global_step": 37921, "epoch": 313} {"train_loss": -34.070167541503906, "global_step": 37922, "epoch": 313} {"train_loss": -32.868282318115234, "global_step": 37923, "epoch": 313} {"train_loss": -33.82939529418945, "global_step": 37924, "epoch": 313} {"train_loss": -33.807247161865234, "global_step": 37925, "epoch": 313} {"train_loss": -32.51536560058594, "global_step": 37926, "epoch": 313} {"train_loss": -31.8049373626709, "global_step": 37927, "epoch": 313} {"train_loss": -31.145750045776367, "global_step": 37928, "epoch": 313} {"train_loss": -32.48804473876953, "global_step": 37929, "epoch": 313} {"train_loss": -33.385318756103516, "global_step": 37930, "epoch": 313} {"train_loss": -33.514808654785156, "global_step": 37931, "epoch": 313} {"train_loss": -32.3232307434082, "global_step": 37932, "epoch": 313} {"train_loss": -32.50810623168945, "global_step": 37933, "epoch": 313} {"train_loss": -33.679019927978516, "global_step": 37934, "epoch": 313} {"train_loss": -33.270626068115234, "global_step": 37935, "epoch": 313} {"train_loss": -33.5802116394043, "global_step": 37936, "epoch": 313} {"train_loss": -33.93267822265625, "global_step": 37937, "epoch": 313} {"train_loss": -33.67841339111328, "global_step": 37938, "epoch": 313} {"train_loss": -33.37223815917969, "global_step": 37939, "epoch": 313} {"train_loss": -33.72368240356445, "global_step": 37940, "epoch": 313} {"train_loss": -33.784095764160156, "global_step": 37941, "epoch": 313} {"train_loss": -32.899986267089844, "global_step": 37942, "epoch": 313} {"train_loss": -33.805213928222656, "global_step": 37943, "epoch": 313} {"train_loss": -34.05475997924805, "global_step": 37944, "epoch": 313} {"train_loss": -33.957069396972656, "global_step": 37945, "epoch": 313} {"train_loss": -33.59591293334961, "global_step": 37946, "epoch": 313} {"train_loss": -34.308040618896484, "global_step": 37947, "epoch": 313} {"train_loss": -34.0297966003418, "global_step": 37948, "epoch": 313} {"train_loss": -34.1508674621582, "global_step": 37949, "epoch": 313} {"train_loss": -33.5387077331543, "global_step": 37950, "epoch": 313} {"train_loss": -34.09520721435547, "global_step": 37951, "epoch": 313} {"train_loss": -34.22245788574219, "global_step": 37952, "epoch": 313} {"train_loss": -33.65678024291992, "global_step": 37953, "epoch": 313} {"train_loss": -33.788490295410156, "global_step": 37954, "epoch": 313} {"train_loss": -34.29442596435547, "global_step": 37955, "epoch": 313} {"train_loss": -33.791255950927734, "global_step": 37956, "epoch": 313} {"train_loss": -33.41785430908203, "global_step": 37957, "epoch": 313} {"train_loss": -34.31180953979492, "global_step": 37958, "epoch": 313} {"train_loss": -34.204349517822266, "global_step": 37959, "epoch": 313} {"train_loss": -33.744728088378906, "global_step": 37960, "epoch": 313} {"train_loss": -34.20265197753906, "global_step": 37961, "epoch": 313} {"train_loss": -33.99348068237305, "global_step": 37962, "epoch": 313} {"train_loss": -34.456966400146484, "global_step": 37963, "epoch": 313} {"train_loss": -33.935237884521484, "global_step": 37964, "epoch": 313} {"train_loss": -34.25807571411133, "global_step": 37965, "epoch": 313} {"train_loss": -34.1879768371582, "global_step": 37966, "epoch": 313} {"train_loss": -34.20368576049805, "global_step": 37967, "epoch": 313} {"train_loss": -34.43312072753906, "global_step": 37968, "epoch": 313} {"train_loss": -34.54633712768555, "global_step": 37969, "epoch": 313} {"train_loss": -34.12185287475586, "global_step": 37970, "epoch": 313} {"train_loss": -33.58290481567383, "global_step": 37971, "epoch": 313} {"train_loss": -34.27439498901367, "global_step": 37972, "epoch": 313} {"train_loss": -34.51622772216797, "global_step": 37973, "epoch": 313} {"train_loss": -34.13550567626953, "global_step": 37974, "epoch": 313} {"train_loss": -32.843170166015625, "global_step": 37975, "epoch": 313} {"train_loss": -32.384639739990234, "global_step": 37976, "epoch": 313} {"train_loss": -32.40943908691406, "global_step": 37977, "epoch": 313} {"train_loss": -34.58210372924805, "global_step": 37978, "epoch": 313} {"train_loss": -33.952789306640625, "global_step": 37979, "epoch": 313} {"train_loss": -33.09769821166992, "global_step": 37980, "epoch": 313} {"train_loss": -34.18551254272461, "global_step": 37981, "epoch": 313} {"train_loss": -33.59702682495117, "global_step": 37982, "epoch": 313} {"train_loss": -33.32763671875, "global_step": 37983, "epoch": 313} {"train_loss": -33.87333297729492, "global_step": 37984, "epoch": 313} {"train_loss": -33.17262649536133, "global_step": 37985, "epoch": 313} {"train_loss": -33.8017463684082, "global_step": 37986, "epoch": 313} {"train_loss": -34.00696563720703, "global_step": 37987, "epoch": 313} {"train_loss": -33.77465057373047, "global_step": 37988, "epoch": 313} {"train_loss": -34.87520217895508, "global_step": 37989, "epoch": 313} {"train_loss": -33.962554931640625, "global_step": 37990, "epoch": 313} {"train_loss": -33.27357864379883, "global_step": 37991, "epoch": 313} {"train_loss": -33.323699951171875, "global_step": 37992, "epoch": 313} {"train_loss": -33.51259638258248, "global_step": 37993, "epoch": 313, "val_loss": 2534607.5} {"train_loss": -33.03141784667969, "global_step": 37994, "epoch": 314} {"train_loss": -34.180908203125, "global_step": 37995, "epoch": 314} {"train_loss": -32.41713333129883, "global_step": 37996, "epoch": 314} {"train_loss": -33.635379791259766, "global_step": 37997, "epoch": 314} {"train_loss": -32.4868278503418, "global_step": 37998, "epoch": 314} {"train_loss": -33.437538146972656, "global_step": 37999, "epoch": 314} {"train_loss": -33.2032585144043, "global_step": 38000, "epoch": 314} {"train_loss": -33.71550369262695, "global_step": 38001, "epoch": 314} {"train_loss": -33.41596603393555, "global_step": 38002, "epoch": 314} {"train_loss": -33.91987991333008, "global_step": 38003, "epoch": 314} {"train_loss": -33.340396881103516, "global_step": 38004, "epoch": 314} {"train_loss": -33.691585540771484, "global_step": 38005, "epoch": 314} {"train_loss": -33.76620101928711, "global_step": 38006, "epoch": 314} {"train_loss": -32.95215606689453, "global_step": 38007, "epoch": 314} {"train_loss": -33.1713752746582, "global_step": 38008, "epoch": 314} {"train_loss": -32.75750732421875, "global_step": 38009, "epoch": 314} {"train_loss": -33.21228790283203, "global_step": 38010, "epoch": 314} {"train_loss": -34.00736618041992, "global_step": 38011, "epoch": 314} {"train_loss": -32.92993927001953, "global_step": 38012, "epoch": 314} {"train_loss": -32.974666595458984, "global_step": 38013, "epoch": 314} {"train_loss": -32.29578399658203, "global_step": 38014, "epoch": 314} {"train_loss": -32.6505126953125, "global_step": 38015, "epoch": 314} {"train_loss": -33.80537033081055, "global_step": 38016, "epoch": 314} {"train_loss": -33.6995964050293, "global_step": 38017, "epoch": 314} {"train_loss": -34.05714797973633, "global_step": 38018, "epoch": 314} {"train_loss": -33.566619873046875, "global_step": 38019, "epoch": 314} {"train_loss": -34.068695068359375, "global_step": 38020, "epoch": 314} {"train_loss": -33.15596389770508, "global_step": 38021, "epoch": 314} {"train_loss": -33.8852424621582, "global_step": 38022, "epoch": 314} {"train_loss": -33.80371856689453, "global_step": 38023, "epoch": 314} {"train_loss": -33.552703857421875, "global_step": 38024, "epoch": 314} {"train_loss": -34.369842529296875, "global_step": 38025, "epoch": 314} {"train_loss": -33.6221809387207, "global_step": 38026, "epoch": 314} {"train_loss": -34.05964279174805, "global_step": 38027, "epoch": 314} {"train_loss": -34.029293060302734, "global_step": 38028, "epoch": 314} {"train_loss": -34.7549934387207, "global_step": 38029, "epoch": 314} {"train_loss": -34.070884704589844, "global_step": 38030, "epoch": 314} {"train_loss": -34.14471435546875, "global_step": 38031, "epoch": 314} {"train_loss": -34.45032501220703, "global_step": 38032, "epoch": 314} {"train_loss": -33.76677703857422, "global_step": 38033, "epoch": 314} {"train_loss": -34.3267707824707, "global_step": 38034, "epoch": 314} {"train_loss": -34.12045669555664, "global_step": 38035, "epoch": 314} {"train_loss": -33.91152572631836, "global_step": 38036, "epoch": 314} {"train_loss": -31.8887996673584, "global_step": 38037, "epoch": 314} {"train_loss": -25.546371459960938, "global_step": 38038, "epoch": 314} {"train_loss": -14.918008804321289, "global_step": 38039, "epoch": 314} {"train_loss": -2.4495816230773926, "global_step": 38040, "epoch": 314} {"train_loss": -14.102951049804688, "global_step": 38041, "epoch": 314} {"train_loss": -30.222003936767578, "global_step": 38042, "epoch": 314} {"train_loss": -21.59675407409668, "global_step": 38043, "epoch": 314} {"train_loss": -32.43619155883789, "global_step": 38044, "epoch": 314} {"train_loss": -26.167932510375977, "global_step": 38045, "epoch": 314} {"train_loss": -28.668859481811523, "global_step": 38046, "epoch": 314} {"train_loss": -31.99163246154785, "global_step": 38047, "epoch": 314} {"train_loss": -29.059921264648438, "global_step": 38048, "epoch": 314} {"train_loss": -30.422082901000977, "global_step": 38049, "epoch": 314} {"train_loss": -31.570322036743164, "global_step": 38050, "epoch": 314} {"train_loss": -32.707977294921875, "global_step": 38051, "epoch": 314} {"train_loss": -30.699237823486328, "global_step": 38052, "epoch": 314} {"train_loss": -32.051612854003906, "global_step": 38053, "epoch": 314} {"train_loss": -31.392175674438477, "global_step": 38054, "epoch": 314} {"train_loss": -33.08557891845703, "global_step": 38055, "epoch": 314} {"train_loss": -31.796222686767578, "global_step": 38056, "epoch": 314} {"train_loss": -32.25727462768555, "global_step": 38057, "epoch": 314} {"train_loss": -32.01334762573242, "global_step": 38058, "epoch": 314} {"train_loss": -32.6739387512207, "global_step": 38059, "epoch": 314} {"train_loss": -33.03508758544922, "global_step": 38060, "epoch": 314} {"train_loss": -31.564294815063477, "global_step": 38061, "epoch": 314} {"train_loss": -32.88877487182617, "global_step": 38062, "epoch": 314} {"train_loss": -32.432464599609375, "global_step": 38063, "epoch": 314} {"train_loss": -32.530364990234375, "global_step": 38064, "epoch": 314} {"train_loss": -33.06406784057617, "global_step": 38065, "epoch": 314} {"train_loss": -32.50641632080078, "global_step": 38066, "epoch": 314} {"train_loss": -33.548519134521484, "global_step": 38067, "epoch": 314} {"train_loss": -32.76571273803711, "global_step": 38068, "epoch": 314} {"train_loss": -33.053646087646484, "global_step": 38069, "epoch": 314} {"train_loss": -33.042694091796875, "global_step": 38070, "epoch": 314} {"train_loss": -33.08491134643555, "global_step": 38071, "epoch": 314} {"train_loss": -33.2899284362793, "global_step": 38072, "epoch": 314} {"train_loss": -33.09395980834961, "global_step": 38073, "epoch": 314} {"train_loss": -33.165035247802734, "global_step": 38074, "epoch": 314} {"train_loss": -33.08234786987305, "global_step": 38075, "epoch": 314} {"train_loss": -32.81523132324219, "global_step": 38076, "epoch": 314} {"train_loss": -33.13882827758789, "global_step": 38077, "epoch": 314} {"train_loss": -32.59815216064453, "global_step": 38078, "epoch": 314} {"train_loss": -33.21381759643555, "global_step": 38079, "epoch": 314} {"train_loss": -32.19071578979492, "global_step": 38080, "epoch": 314} {"train_loss": -33.00967025756836, "global_step": 38081, "epoch": 314} {"train_loss": -32.9846076965332, "global_step": 38082, "epoch": 314} {"train_loss": -33.4998779296875, "global_step": 38083, "epoch": 314} {"train_loss": -33.49444580078125, "global_step": 38084, "epoch": 314} {"train_loss": -32.82611083984375, "global_step": 38085, "epoch": 314} {"train_loss": -33.4034309387207, "global_step": 38086, "epoch": 314} {"train_loss": -33.485984802246094, "global_step": 38087, "epoch": 314} {"train_loss": -33.566219329833984, "global_step": 38088, "epoch": 314} {"train_loss": -33.75996017456055, "global_step": 38089, "epoch": 314} {"train_loss": -33.42634582519531, "global_step": 38090, "epoch": 314} {"train_loss": -33.489051818847656, "global_step": 38091, "epoch": 314} {"train_loss": -33.57605743408203, "global_step": 38092, "epoch": 314} {"train_loss": -33.081695556640625, "global_step": 38093, "epoch": 314} {"train_loss": -34.13653564453125, "global_step": 38094, "epoch": 314} {"train_loss": -33.138771057128906, "global_step": 38095, "epoch": 314} {"train_loss": -33.104896545410156, "global_step": 38096, "epoch": 314} {"train_loss": -33.33835220336914, "global_step": 38097, "epoch": 314} {"train_loss": -33.44993591308594, "global_step": 38098, "epoch": 314} {"train_loss": -33.69154739379883, "global_step": 38099, "epoch": 314} {"train_loss": -33.05866622924805, "global_step": 38100, "epoch": 314} {"train_loss": -33.62667465209961, "global_step": 38101, "epoch": 314} {"train_loss": -33.41926956176758, "global_step": 38102, "epoch": 314} {"train_loss": -32.944190979003906, "global_step": 38103, "epoch": 314} {"train_loss": -33.622772216796875, "global_step": 38104, "epoch": 314} {"train_loss": -33.358272552490234, "global_step": 38105, "epoch": 314} {"train_loss": -32.99738693237305, "global_step": 38106, "epoch": 314} {"train_loss": -33.648048400878906, "global_step": 38107, "epoch": 314} {"train_loss": -32.646663665771484, "global_step": 38108, "epoch": 314} {"train_loss": -33.60887145996094, "global_step": 38109, "epoch": 314} {"train_loss": -32.6182975769043, "global_step": 38110, "epoch": 314} {"train_loss": -33.52041244506836, "global_step": 38111, "epoch": 314} {"train_loss": -32.625362396240234, "global_step": 38112, "epoch": 314} {"train_loss": -32.580230712890625, "global_step": 38113, "epoch": 314} {"train_loss": -32.27093786838626, "global_step": 38114, "epoch": 314, "val_loss": 2724636.0} {"train_loss": -29.729022979736328, "global_step": 38115, "epoch": 315} {"train_loss": -26.840543746948242, "global_step": 38116, "epoch": 315} {"train_loss": -19.8431453704834, "global_step": 38117, "epoch": 315} {"train_loss": -24.979570388793945, "global_step": 38118, "epoch": 315} {"train_loss": -32.816375732421875, "global_step": 38119, "epoch": 315} {"train_loss": -25.370267868041992, "global_step": 38120, "epoch": 315} {"train_loss": -30.077152252197266, "global_step": 38121, "epoch": 315} {"train_loss": -28.68222427368164, "global_step": 38122, "epoch": 315} {"train_loss": -29.32465171813965, "global_step": 38123, "epoch": 315} {"train_loss": -30.010541915893555, "global_step": 38124, "epoch": 315} {"train_loss": -32.40625, "global_step": 38125, "epoch": 315} {"train_loss": -29.542896270751953, "global_step": 38126, "epoch": 315} {"train_loss": -32.47690200805664, "global_step": 38127, "epoch": 315} {"train_loss": -30.9239444732666, "global_step": 38128, "epoch": 315} {"train_loss": -31.658252716064453, "global_step": 38129, "epoch": 315} {"train_loss": -33.447017669677734, "global_step": 38130, "epoch": 315} {"train_loss": -32.199405670166016, "global_step": 38131, "epoch": 315} {"train_loss": -32.0704460144043, "global_step": 38132, "epoch": 315} {"train_loss": -33.3055305480957, "global_step": 38133, "epoch": 315} {"train_loss": -33.181880950927734, "global_step": 38134, "epoch": 315} {"train_loss": -32.671775817871094, "global_step": 38135, "epoch": 315} {"train_loss": -33.035736083984375, "global_step": 38136, "epoch": 315} {"train_loss": -33.30275344848633, "global_step": 38137, "epoch": 315} {"train_loss": -32.45070266723633, "global_step": 38138, "epoch": 315} {"train_loss": -33.14163589477539, "global_step": 38139, "epoch": 315} {"train_loss": -32.86387634277344, "global_step": 38140, "epoch": 315} {"train_loss": -32.702144622802734, "global_step": 38141, "epoch": 315} {"train_loss": -33.20804214477539, "global_step": 38142, "epoch": 315} {"train_loss": -33.39154815673828, "global_step": 38143, "epoch": 315} {"train_loss": -33.332271575927734, "global_step": 38144, "epoch": 315} {"train_loss": -33.60204315185547, "global_step": 38145, "epoch": 315} {"train_loss": -32.97081756591797, "global_step": 38146, "epoch": 315} {"train_loss": -33.61470031738281, "global_step": 38147, "epoch": 315} {"train_loss": -32.865718841552734, "global_step": 38148, "epoch": 315} {"train_loss": -33.30120849609375, "global_step": 38149, "epoch": 315} {"train_loss": -33.442222595214844, "global_step": 38150, "epoch": 315} {"train_loss": -33.780879974365234, "global_step": 38151, "epoch": 315} {"train_loss": -33.316314697265625, "global_step": 38152, "epoch": 315} {"train_loss": -33.76226806640625, "global_step": 38153, "epoch": 315} {"train_loss": -33.251373291015625, "global_step": 38154, "epoch": 315} {"train_loss": -33.409706115722656, "global_step": 38155, "epoch": 315} {"train_loss": -33.31203079223633, "global_step": 38156, "epoch": 315} {"train_loss": -33.56449508666992, "global_step": 38157, "epoch": 315} {"train_loss": -33.6537971496582, "global_step": 38158, "epoch": 315} {"train_loss": -33.87946701049805, "global_step": 38159, "epoch": 315} {"train_loss": -33.77217483520508, "global_step": 38160, "epoch": 315} {"train_loss": -33.71894454956055, "global_step": 38161, "epoch": 315} {"train_loss": -33.60627365112305, "global_step": 38162, "epoch": 315} {"train_loss": -32.613075256347656, "global_step": 38163, "epoch": 315} {"train_loss": -33.211544036865234, "global_step": 38164, "epoch": 315} {"train_loss": -33.4876708984375, "global_step": 38165, "epoch": 315} {"train_loss": -34.13257598876953, "global_step": 38166, "epoch": 315} {"train_loss": -33.229305267333984, "global_step": 38167, "epoch": 315} {"train_loss": -33.355770111083984, "global_step": 38168, "epoch": 315} {"train_loss": -33.53386688232422, "global_step": 38169, "epoch": 315} {"train_loss": -33.54561996459961, "global_step": 38170, "epoch": 315} {"train_loss": -33.471065521240234, "global_step": 38171, "epoch": 315} {"train_loss": -33.3231315612793, "global_step": 38172, "epoch": 315} {"train_loss": -33.83705520629883, "global_step": 38173, "epoch": 315} {"train_loss": -32.67292022705078, "global_step": 38174, "epoch": 315} {"train_loss": -33.79301834106445, "global_step": 38175, "epoch": 315} {"train_loss": -32.8555908203125, "global_step": 38176, "epoch": 315} {"train_loss": -31.5190486907959, "global_step": 38177, "epoch": 315} {"train_loss": -31.76093864440918, "global_step": 38178, "epoch": 315} {"train_loss": -31.317962646484375, "global_step": 38179, "epoch": 315} {"train_loss": -31.204975128173828, "global_step": 38180, "epoch": 315} {"train_loss": -31.450708389282227, "global_step": 38181, "epoch": 315} {"train_loss": -32.166717529296875, "global_step": 38182, "epoch": 315} {"train_loss": -32.871299743652344, "global_step": 38183, "epoch": 315} {"train_loss": -33.58866500854492, "global_step": 38184, "epoch": 315} {"train_loss": -33.423336029052734, "global_step": 38185, "epoch": 315} {"train_loss": -32.74138259887695, "global_step": 38186, "epoch": 315} {"train_loss": -32.81781005859375, "global_step": 38187, "epoch": 315} {"train_loss": -32.27206039428711, "global_step": 38188, "epoch": 315} {"train_loss": -32.10457992553711, "global_step": 38189, "epoch": 315} {"train_loss": -33.39323806762695, "global_step": 38190, "epoch": 315} {"train_loss": -32.79819869995117, "global_step": 38191, "epoch": 315} {"train_loss": -32.82069396972656, "global_step": 38192, "epoch": 315} {"train_loss": -32.14461135864258, "global_step": 38193, "epoch": 315} {"train_loss": -33.56610107421875, "global_step": 38194, "epoch": 315} {"train_loss": -31.75359535217285, "global_step": 38195, "epoch": 315} {"train_loss": -32.7608757019043, "global_step": 38196, "epoch": 315} {"train_loss": -31.290185928344727, "global_step": 38197, "epoch": 315} {"train_loss": -32.933284759521484, "global_step": 38198, "epoch": 315} {"train_loss": -29.680801391601562, "global_step": 38199, "epoch": 315} {"train_loss": -31.679412841796875, "global_step": 38200, "epoch": 315} {"train_loss": -32.68321990966797, "global_step": 38201, "epoch": 315} {"train_loss": -31.934289932250977, "global_step": 38202, "epoch": 315} {"train_loss": -32.4387092590332, "global_step": 38203, "epoch": 315} {"train_loss": -32.09002685546875, "global_step": 38204, "epoch": 315} {"train_loss": -32.490081787109375, "global_step": 38205, "epoch": 315} {"train_loss": -32.447017669677734, "global_step": 38206, "epoch": 315} {"train_loss": -32.576576232910156, "global_step": 38207, "epoch": 315} {"train_loss": -32.296295166015625, "global_step": 38208, "epoch": 315} {"train_loss": -32.03923416137695, "global_step": 38209, "epoch": 315} {"train_loss": -32.709228515625, "global_step": 38210, "epoch": 315} {"train_loss": -32.30961227416992, "global_step": 38211, "epoch": 315} {"train_loss": -32.684783935546875, "global_step": 38212, "epoch": 315} {"train_loss": -32.493595123291016, "global_step": 38213, "epoch": 315} {"train_loss": -32.17733383178711, "global_step": 38214, "epoch": 315} {"train_loss": -32.5838508605957, "global_step": 38215, "epoch": 315} {"train_loss": -32.14009475708008, "global_step": 38216, "epoch": 315} {"train_loss": -32.330726623535156, "global_step": 38217, "epoch": 315} {"train_loss": -32.645362854003906, "global_step": 38218, "epoch": 315} {"train_loss": -33.214263916015625, "global_step": 38219, "epoch": 315} {"train_loss": -32.82560348510742, "global_step": 38220, "epoch": 315} {"train_loss": -33.14305114746094, "global_step": 38221, "epoch": 315} {"train_loss": -33.28657150268555, "global_step": 38222, "epoch": 315} {"train_loss": -32.9217414855957, "global_step": 38223, "epoch": 315} {"train_loss": -32.95575714111328, "global_step": 38224, "epoch": 315} {"train_loss": -32.94123077392578, "global_step": 38225, "epoch": 315} {"train_loss": -33.16426467895508, "global_step": 38226, "epoch": 315} {"train_loss": -33.5985221862793, "global_step": 38227, "epoch": 315} {"train_loss": -33.041927337646484, "global_step": 38228, "epoch": 315} {"train_loss": -33.17827224731445, "global_step": 38229, "epoch": 315} {"train_loss": -33.247032165527344, "global_step": 38230, "epoch": 315} {"train_loss": -32.36680221557617, "global_step": 38231, "epoch": 315} {"train_loss": -32.861915588378906, "global_step": 38232, "epoch": 315} {"train_loss": -33.26015853881836, "global_step": 38233, "epoch": 315} {"train_loss": -33.3171501159668, "global_step": 38234, "epoch": 315} {"train_loss": -32.38590330328823, "global_step": 38235, "epoch": 315, "val_loss": 2626850.25} {"train_loss": -33.00954818725586, "global_step": 38236, "epoch": 316} {"train_loss": -33.570594787597656, "global_step": 38237, "epoch": 316} {"train_loss": -33.02986526489258, "global_step": 38238, "epoch": 316} {"train_loss": -32.98958969116211, "global_step": 38239, "epoch": 316} {"train_loss": -32.34797286987305, "global_step": 38240, "epoch": 316} {"train_loss": -32.520790100097656, "global_step": 38241, "epoch": 316} {"train_loss": -32.49320602416992, "global_step": 38242, "epoch": 316} {"train_loss": -32.917842864990234, "global_step": 38243, "epoch": 316} {"train_loss": -33.15814971923828, "global_step": 38244, "epoch": 316} {"train_loss": -33.17764663696289, "global_step": 38245, "epoch": 316} {"train_loss": -33.0975341796875, "global_step": 38246, "epoch": 316} {"train_loss": -33.02688217163086, "global_step": 38247, "epoch": 316} {"train_loss": -33.60419464111328, "global_step": 38248, "epoch": 316} {"train_loss": -31.7786808013916, "global_step": 38249, "epoch": 316} {"train_loss": -33.87234115600586, "global_step": 38250, "epoch": 316} {"train_loss": -32.8272819519043, "global_step": 38251, "epoch": 316} {"train_loss": -33.38215255737305, "global_step": 38252, "epoch": 316} {"train_loss": -33.24168014526367, "global_step": 38253, "epoch": 316} {"train_loss": -32.39365768432617, "global_step": 38254, "epoch": 316} {"train_loss": -33.84926986694336, "global_step": 38255, "epoch": 316} {"train_loss": -33.57596206665039, "global_step": 38256, "epoch": 316} {"train_loss": -33.64219284057617, "global_step": 38257, "epoch": 316} {"train_loss": -33.71852493286133, "global_step": 38258, "epoch": 316} {"train_loss": -33.29048538208008, "global_step": 38259, "epoch": 316} {"train_loss": -33.23945236206055, "global_step": 38260, "epoch": 316} {"train_loss": -33.273834228515625, "global_step": 38261, "epoch": 316} {"train_loss": -33.6389045715332, "global_step": 38262, "epoch": 316} {"train_loss": -33.32727813720703, "global_step": 38263, "epoch": 316} {"train_loss": -33.84373092651367, "global_step": 38264, "epoch": 316} {"train_loss": -33.46501159667969, "global_step": 38265, "epoch": 316} {"train_loss": -33.83307647705078, "global_step": 38266, "epoch": 316} {"train_loss": -33.50883102416992, "global_step": 38267, "epoch": 316} {"train_loss": -33.81377029418945, "global_step": 38268, "epoch": 316} {"train_loss": -33.44553756713867, "global_step": 38269, "epoch": 316} {"train_loss": -34.05739974975586, "global_step": 38270, "epoch": 316} {"train_loss": -34.342193603515625, "global_step": 38271, "epoch": 316} {"train_loss": -33.899288177490234, "global_step": 38272, "epoch": 316} {"train_loss": -34.16347885131836, "global_step": 38273, "epoch": 316} {"train_loss": -34.4133186340332, "global_step": 38274, "epoch": 316} {"train_loss": -34.28607177734375, "global_step": 38275, "epoch": 316} {"train_loss": -34.12061309814453, "global_step": 38276, "epoch": 316} {"train_loss": -34.38338851928711, "global_step": 38277, "epoch": 316} {"train_loss": -34.284934997558594, "global_step": 38278, "epoch": 316} {"train_loss": -34.554100036621094, "global_step": 38279, "epoch": 316} {"train_loss": -34.42487716674805, "global_step": 38280, "epoch": 316} {"train_loss": -34.366634368896484, "global_step": 38281, "epoch": 316} {"train_loss": -34.179779052734375, "global_step": 38282, "epoch": 316} {"train_loss": -34.2724494934082, "global_step": 38283, "epoch": 316} {"train_loss": -34.258174896240234, "global_step": 38284, "epoch": 316} {"train_loss": -34.66726303100586, "global_step": 38285, "epoch": 316} {"train_loss": -34.61838150024414, "global_step": 38286, "epoch": 316} {"train_loss": -34.07950973510742, "global_step": 38287, "epoch": 316} {"train_loss": -33.9550895690918, "global_step": 38288, "epoch": 316} {"train_loss": -34.24143981933594, "global_step": 38289, "epoch": 316} {"train_loss": -34.9567756652832, "global_step": 38290, "epoch": 316} {"train_loss": -34.4278564453125, "global_step": 38291, "epoch": 316} {"train_loss": -34.7418212890625, "global_step": 38292, "epoch": 316} {"train_loss": -33.770267486572266, "global_step": 38293, "epoch": 316} {"train_loss": -34.26882553100586, "global_step": 38294, "epoch": 316} {"train_loss": -33.97468185424805, "global_step": 38295, "epoch": 316} {"train_loss": -32.60738754272461, "global_step": 38296, "epoch": 316} {"train_loss": -33.3546142578125, "global_step": 38297, "epoch": 316} {"train_loss": -32.548580169677734, "global_step": 38298, "epoch": 316} {"train_loss": -33.33683395385742, "global_step": 38299, "epoch": 316} {"train_loss": -33.35799026489258, "global_step": 38300, "epoch": 316} {"train_loss": -32.810386657714844, "global_step": 38301, "epoch": 316} {"train_loss": -33.281959533691406, "global_step": 38302, "epoch": 316} {"train_loss": -34.46444320678711, "global_step": 38303, "epoch": 316} {"train_loss": -33.20054244995117, "global_step": 38304, "epoch": 316} {"train_loss": -33.81992721557617, "global_step": 38305, "epoch": 316} {"train_loss": -34.23307418823242, "global_step": 38306, "epoch": 316} {"train_loss": -33.5500602722168, "global_step": 38307, "epoch": 316} {"train_loss": -33.545753479003906, "global_step": 38308, "epoch": 316} {"train_loss": -33.68518829345703, "global_step": 38309, "epoch": 316} {"train_loss": -34.238067626953125, "global_step": 38310, "epoch": 316} {"train_loss": -33.19272232055664, "global_step": 38311, "epoch": 316} {"train_loss": -33.778804779052734, "global_step": 38312, "epoch": 316} {"train_loss": -33.72575759887695, "global_step": 38313, "epoch": 316} {"train_loss": -33.72414779663086, "global_step": 38314, "epoch": 316} {"train_loss": -33.62350082397461, "global_step": 38315, "epoch": 316} {"train_loss": -33.33408737182617, "global_step": 38316, "epoch": 316} {"train_loss": -33.87541580200195, "global_step": 38317, "epoch": 316} {"train_loss": -33.751075744628906, "global_step": 38318, "epoch": 316} {"train_loss": -33.5374641418457, "global_step": 38319, "epoch": 316} {"train_loss": -33.916255950927734, "global_step": 38320, "epoch": 316} {"train_loss": -33.44350051879883, "global_step": 38321, "epoch": 316} {"train_loss": -32.72822189331055, "global_step": 38322, "epoch": 316} {"train_loss": -30.93914794921875, "global_step": 38323, "epoch": 316} {"train_loss": -32.119110107421875, "global_step": 38324, "epoch": 316} {"train_loss": -27.518421173095703, "global_step": 38325, "epoch": 316} {"train_loss": -33.26546859741211, "global_step": 38326, "epoch": 316} {"train_loss": -30.660058975219727, "global_step": 38327, "epoch": 316} {"train_loss": -33.4110107421875, "global_step": 38328, "epoch": 316} {"train_loss": -31.258142471313477, "global_step": 38329, "epoch": 316} {"train_loss": -31.749835968017578, "global_step": 38330, "epoch": 316} {"train_loss": -33.24879837036133, "global_step": 38331, "epoch": 316} {"train_loss": -30.690418243408203, "global_step": 38332, "epoch": 316} {"train_loss": -33.17503356933594, "global_step": 38333, "epoch": 316} {"train_loss": -31.8299503326416, "global_step": 38334, "epoch": 316} {"train_loss": -32.32929611206055, "global_step": 38335, "epoch": 316} {"train_loss": -31.30197525024414, "global_step": 38336, "epoch": 316} {"train_loss": -31.7060546875, "global_step": 38337, "epoch": 316} {"train_loss": -32.396705627441406, "global_step": 38338, "epoch": 316} {"train_loss": -31.8167781829834, "global_step": 38339, "epoch": 316} {"train_loss": -33.25608444213867, "global_step": 38340, "epoch": 316} {"train_loss": -32.64093017578125, "global_step": 38341, "epoch": 316} {"train_loss": -33.3637580871582, "global_step": 38342, "epoch": 316} {"train_loss": -32.78402328491211, "global_step": 38343, "epoch": 316} {"train_loss": -32.2408447265625, "global_step": 38344, "epoch": 316} {"train_loss": -33.346351623535156, "global_step": 38345, "epoch": 316} {"train_loss": -32.63652038574219, "global_step": 38346, "epoch": 316} {"train_loss": -33.360443115234375, "global_step": 38347, "epoch": 316} {"train_loss": -32.957210540771484, "global_step": 38348, "epoch": 316} {"train_loss": -32.576934814453125, "global_step": 38349, "epoch": 316} {"train_loss": -32.865806579589844, "global_step": 38350, "epoch": 316} {"train_loss": -33.304344177246094, "global_step": 38351, "epoch": 316} {"train_loss": -33.28774642944336, "global_step": 38352, "epoch": 316} {"train_loss": -33.16167449951172, "global_step": 38353, "epoch": 316} {"train_loss": -33.36729049682617, "global_step": 38354, "epoch": 316} {"train_loss": -30.948108673095703, "global_step": 38355, "epoch": 316} {"train_loss": -33.26378781342309, "global_step": 38356, "epoch": 316, "val_loss": 2642589.0} {"train_loss": -33.89289474487305, "global_step": 38357, "epoch": 317} {"train_loss": -33.306495666503906, "global_step": 38358, "epoch": 317} {"train_loss": -33.19470977783203, "global_step": 38359, "epoch": 317} {"train_loss": -34.00618362426758, "global_step": 38360, "epoch": 317} {"train_loss": -33.4638671875, "global_step": 38361, "epoch": 317} {"train_loss": -33.235164642333984, "global_step": 38362, "epoch": 317} {"train_loss": -33.59348678588867, "global_step": 38363, "epoch": 317} {"train_loss": -33.4478874206543, "global_step": 38364, "epoch": 317} {"train_loss": -32.89969253540039, "global_step": 38365, "epoch": 317} {"train_loss": -32.98542404174805, "global_step": 38366, "epoch": 317} {"train_loss": -33.70927429199219, "global_step": 38367, "epoch": 317} {"train_loss": -33.44753646850586, "global_step": 38368, "epoch": 317} {"train_loss": -33.30778121948242, "global_step": 38369, "epoch": 317} {"train_loss": -32.939117431640625, "global_step": 38370, "epoch": 317} {"train_loss": -33.62190628051758, "global_step": 38371, "epoch": 317} {"train_loss": -33.300140380859375, "global_step": 38372, "epoch": 317} {"train_loss": -33.862648010253906, "global_step": 38373, "epoch": 317} {"train_loss": -33.88928985595703, "global_step": 38374, "epoch": 317} {"train_loss": -34.04841232299805, "global_step": 38375, "epoch": 317} {"train_loss": -34.27704620361328, "global_step": 38376, "epoch": 317} {"train_loss": -33.88460922241211, "global_step": 38377, "epoch": 317} {"train_loss": -33.640899658203125, "global_step": 38378, "epoch": 317} {"train_loss": -33.84912109375, "global_step": 38379, "epoch": 317} {"train_loss": -34.4322509765625, "global_step": 38380, "epoch": 317} {"train_loss": -34.060401916503906, "global_step": 38381, "epoch": 317} {"train_loss": -33.55326461791992, "global_step": 38382, "epoch": 317} {"train_loss": -33.65412521362305, "global_step": 38383, "epoch": 317} {"train_loss": -34.02891159057617, "global_step": 38384, "epoch": 317} {"train_loss": -34.12200927734375, "global_step": 38385, "epoch": 317} {"train_loss": -34.2629508972168, "global_step": 38386, "epoch": 317} {"train_loss": -33.76212692260742, "global_step": 38387, "epoch": 317} {"train_loss": -33.83677673339844, "global_step": 38388, "epoch": 317} {"train_loss": -34.45646286010742, "global_step": 38389, "epoch": 317} {"train_loss": -34.075347900390625, "global_step": 38390, "epoch": 317} {"train_loss": -34.237998962402344, "global_step": 38391, "epoch": 317} {"train_loss": -34.40830612182617, "global_step": 38392, "epoch": 317} {"train_loss": -34.5357551574707, "global_step": 38393, "epoch": 317} {"train_loss": -34.649009704589844, "global_step": 38394, "epoch": 317} {"train_loss": -34.519710540771484, "global_step": 38395, "epoch": 317} {"train_loss": -34.697166442871094, "global_step": 38396, "epoch": 317} {"train_loss": -34.64960861206055, "global_step": 38397, "epoch": 317} {"train_loss": -34.5443000793457, "global_step": 38398, "epoch": 317} {"train_loss": -32.987361907958984, "global_step": 38399, "epoch": 317} {"train_loss": -33.74311447143555, "global_step": 38400, "epoch": 317} {"train_loss": -33.48088073730469, "global_step": 38401, "epoch": 317} {"train_loss": -33.016822814941406, "global_step": 38402, "epoch": 317} {"train_loss": -33.96171569824219, "global_step": 38403, "epoch": 317} {"train_loss": -34.31904602050781, "global_step": 38404, "epoch": 317} {"train_loss": -34.55721664428711, "global_step": 38405, "epoch": 317} {"train_loss": -33.37812042236328, "global_step": 38406, "epoch": 317} {"train_loss": -32.98371505737305, "global_step": 38407, "epoch": 317} {"train_loss": -33.066585540771484, "global_step": 38408, "epoch": 317} {"train_loss": -33.42629623413086, "global_step": 38409, "epoch": 317} {"train_loss": -33.633602142333984, "global_step": 38410, "epoch": 317} {"train_loss": -34.36719512939453, "global_step": 38411, "epoch": 317} {"train_loss": -32.153133392333984, "global_step": 38412, "epoch": 317} {"train_loss": -32.314697265625, "global_step": 38413, "epoch": 317} {"train_loss": -33.6479377746582, "global_step": 38414, "epoch": 317} {"train_loss": -33.10091781616211, "global_step": 38415, "epoch": 317} {"train_loss": -34.47391891479492, "global_step": 38416, "epoch": 317} {"train_loss": -33.1217041015625, "global_step": 38417, "epoch": 317} {"train_loss": -32.5660285949707, "global_step": 38418, "epoch": 317} {"train_loss": -33.6519660949707, "global_step": 38419, "epoch": 317} {"train_loss": -34.013572692871094, "global_step": 38420, "epoch": 317} {"train_loss": -33.27924728393555, "global_step": 38421, "epoch": 317} {"train_loss": -33.47024154663086, "global_step": 38422, "epoch": 317} {"train_loss": -33.841060638427734, "global_step": 38423, "epoch": 317} {"train_loss": -33.1925163269043, "global_step": 38424, "epoch": 317} {"train_loss": -33.80782699584961, "global_step": 38425, "epoch": 317} {"train_loss": -33.89870834350586, "global_step": 38426, "epoch": 317} {"train_loss": -33.98640441894531, "global_step": 38427, "epoch": 317} {"train_loss": -32.7900276184082, "global_step": 38428, "epoch": 317} {"train_loss": -34.04024124145508, "global_step": 38429, "epoch": 317} {"train_loss": -31.91645622253418, "global_step": 38430, "epoch": 317} {"train_loss": -33.7065544128418, "global_step": 38431, "epoch": 317} {"train_loss": -34.004638671875, "global_step": 38432, "epoch": 317} {"train_loss": -33.279273986816406, "global_step": 38433, "epoch": 317} {"train_loss": -33.8670539855957, "global_step": 38434, "epoch": 317} {"train_loss": -33.89868927001953, "global_step": 38435, "epoch": 317} {"train_loss": -33.523841857910156, "global_step": 38436, "epoch": 317} {"train_loss": -33.42053985595703, "global_step": 38437, "epoch": 317} {"train_loss": -32.36391067504883, "global_step": 38438, "epoch": 317} {"train_loss": -33.279388427734375, "global_step": 38439, "epoch": 317} {"train_loss": -33.341651916503906, "global_step": 38440, "epoch": 317} {"train_loss": -32.816898345947266, "global_step": 38441, "epoch": 317} {"train_loss": -33.554908752441406, "global_step": 38442, "epoch": 317} {"train_loss": -32.83807373046875, "global_step": 38443, "epoch": 317} {"train_loss": -30.80878257751465, "global_step": 38444, "epoch": 317} {"train_loss": -31.107572555541992, "global_step": 38445, "epoch": 317} {"train_loss": -29.253164291381836, "global_step": 38446, "epoch": 317} {"train_loss": -29.582416534423828, "global_step": 38447, "epoch": 317} {"train_loss": -31.9265079498291, "global_step": 38448, "epoch": 317} {"train_loss": -32.71209716796875, "global_step": 38449, "epoch": 317} {"train_loss": -32.72710037231445, "global_step": 38450, "epoch": 317} {"train_loss": -31.786550521850586, "global_step": 38451, "epoch": 317} {"train_loss": -31.717496871948242, "global_step": 38452, "epoch": 317} {"train_loss": -33.84113693237305, "global_step": 38453, "epoch": 317} {"train_loss": -32.453651428222656, "global_step": 38454, "epoch": 317} {"train_loss": -32.534278869628906, "global_step": 38455, "epoch": 317} {"train_loss": -33.262508392333984, "global_step": 38456, "epoch": 317} {"train_loss": -33.49119567871094, "global_step": 38457, "epoch": 317} {"train_loss": -32.35777282714844, "global_step": 38458, "epoch": 317} {"train_loss": -33.549293518066406, "global_step": 38459, "epoch": 317} {"train_loss": -33.21965408325195, "global_step": 38460, "epoch": 317} {"train_loss": -33.42196273803711, "global_step": 38461, "epoch": 317} {"train_loss": -33.95048141479492, "global_step": 38462, "epoch": 317} {"train_loss": -32.59243392944336, "global_step": 38463, "epoch": 317} {"train_loss": -33.68197250366211, "global_step": 38464, "epoch": 317} {"train_loss": -33.18514633178711, "global_step": 38465, "epoch": 317} {"train_loss": -32.937801361083984, "global_step": 38466, "epoch": 317} {"train_loss": -32.98114776611328, "global_step": 38467, "epoch": 317} {"train_loss": -32.484222412109375, "global_step": 38468, "epoch": 317} {"train_loss": -34.33271408081055, "global_step": 38469, "epoch": 317} {"train_loss": -33.392967224121094, "global_step": 38470, "epoch": 317} {"train_loss": -33.935848236083984, "global_step": 38471, "epoch": 317} {"train_loss": -34.11233139038086, "global_step": 38472, "epoch": 317} {"train_loss": -34.17477035522461, "global_step": 38473, "epoch": 317} {"train_loss": -34.20332336425781, "global_step": 38474, "epoch": 317} {"train_loss": -34.107173919677734, "global_step": 38475, "epoch": 317} {"train_loss": -34.13890838623047, "global_step": 38476, "epoch": 317} {"train_loss": -33.411302125158386, "global_step": 38477, "epoch": 317, "val_loss": 2469920.0} {"train_loss": -33.970603942871094, "global_step": 38478, "epoch": 318} {"train_loss": -34.15000534057617, "global_step": 38479, "epoch": 318} {"train_loss": -34.07849884033203, "global_step": 38480, "epoch": 318} {"train_loss": -34.121788024902344, "global_step": 38481, "epoch": 318} {"train_loss": -34.7346305847168, "global_step": 38482, "epoch": 318} {"train_loss": -33.922847747802734, "global_step": 38483, "epoch": 318} {"train_loss": -34.69222640991211, "global_step": 38484, "epoch": 318} {"train_loss": -34.25482940673828, "global_step": 38485, "epoch": 318} {"train_loss": -34.120330810546875, "global_step": 38486, "epoch": 318} {"train_loss": -34.647586822509766, "global_step": 38487, "epoch": 318} {"train_loss": -34.71483612060547, "global_step": 38488, "epoch": 318} {"train_loss": -34.78383255004883, "global_step": 38489, "epoch": 318} {"train_loss": -35.03413772583008, "global_step": 38490, "epoch": 318} {"train_loss": -34.334747314453125, "global_step": 38491, "epoch": 318} {"train_loss": -34.82023620605469, "global_step": 38492, "epoch": 318} {"train_loss": -34.05826950073242, "global_step": 38493, "epoch": 318} {"train_loss": -34.11100769042969, "global_step": 38494, "epoch": 318} {"train_loss": -34.2774543762207, "global_step": 38495, "epoch": 318} {"train_loss": -33.96249008178711, "global_step": 38496, "epoch": 318} {"train_loss": -33.9331169128418, "global_step": 38497, "epoch": 318} {"train_loss": -34.239383697509766, "global_step": 38498, "epoch": 318} {"train_loss": -34.332340240478516, "global_step": 38499, "epoch": 318} {"train_loss": -34.24126434326172, "global_step": 38500, "epoch": 318} {"train_loss": -34.38375473022461, "global_step": 38501, "epoch": 318} {"train_loss": -34.28807067871094, "global_step": 38502, "epoch": 318} {"train_loss": -34.61206817626953, "global_step": 38503, "epoch": 318} {"train_loss": -34.462867736816406, "global_step": 38504, "epoch": 318} {"train_loss": -34.87746810913086, "global_step": 38505, "epoch": 318} {"train_loss": -32.615211486816406, "global_step": 38506, "epoch": 318} {"train_loss": -33.91545104980469, "global_step": 38507, "epoch": 318} {"train_loss": -34.23305892944336, "global_step": 38508, "epoch": 318} {"train_loss": -34.5594596862793, "global_step": 38509, "epoch": 318} {"train_loss": -34.43991470336914, "global_step": 38510, "epoch": 318} {"train_loss": -34.287811279296875, "global_step": 38511, "epoch": 318} {"train_loss": -34.3475456237793, "global_step": 38512, "epoch": 318} {"train_loss": -34.028011322021484, "global_step": 38513, "epoch": 318} {"train_loss": -33.75954818725586, "global_step": 38514, "epoch": 318} {"train_loss": -34.527896881103516, "global_step": 38515, "epoch": 318} {"train_loss": -33.912193298339844, "global_step": 38516, "epoch": 318} {"train_loss": -33.7523078918457, "global_step": 38517, "epoch": 318} {"train_loss": -34.254188537597656, "global_step": 38518, "epoch": 318} {"train_loss": -32.33956527709961, "global_step": 38519, "epoch": 318} {"train_loss": -30.310575485229492, "global_step": 38520, "epoch": 318} {"train_loss": -27.494964599609375, "global_step": 38521, "epoch": 318} {"train_loss": -27.199338912963867, "global_step": 38522, "epoch": 318} {"train_loss": -32.03789138793945, "global_step": 38523, "epoch": 318} {"train_loss": -34.10767364501953, "global_step": 38524, "epoch": 318} {"train_loss": -32.5507698059082, "global_step": 38525, "epoch": 318} {"train_loss": -31.887128829956055, "global_step": 38526, "epoch": 318} {"train_loss": -32.86357879638672, "global_step": 38527, "epoch": 318} {"train_loss": -31.95525550842285, "global_step": 38528, "epoch": 318} {"train_loss": -33.57364273071289, "global_step": 38529, "epoch": 318} {"train_loss": -31.963088989257812, "global_step": 38530, "epoch": 318} {"train_loss": -32.625762939453125, "global_step": 38531, "epoch": 318} {"train_loss": -31.953229904174805, "global_step": 38532, "epoch": 318} {"train_loss": -33.99456787109375, "global_step": 38533, "epoch": 318} {"train_loss": -33.407562255859375, "global_step": 38534, "epoch": 318} {"train_loss": -33.68468475341797, "global_step": 38535, "epoch": 318} {"train_loss": -32.72488021850586, "global_step": 38536, "epoch": 318} {"train_loss": -32.58799362182617, "global_step": 38537, "epoch": 318} {"train_loss": -33.552799224853516, "global_step": 38538, "epoch": 318} {"train_loss": -34.132537841796875, "global_step": 38539, "epoch": 318} {"train_loss": -33.350196838378906, "global_step": 38540, "epoch": 318} {"train_loss": -33.94636535644531, "global_step": 38541, "epoch": 318} {"train_loss": -33.768035888671875, "global_step": 38542, "epoch": 318} {"train_loss": -34.2227783203125, "global_step": 38543, "epoch": 318} {"train_loss": -33.24550247192383, "global_step": 38544, "epoch": 318} {"train_loss": -33.540283203125, "global_step": 38545, "epoch": 318} {"train_loss": -32.89303970336914, "global_step": 38546, "epoch": 318} {"train_loss": -33.01845932006836, "global_step": 38547, "epoch": 318} {"train_loss": -33.4233512878418, "global_step": 38548, "epoch": 318} {"train_loss": -33.3370246887207, "global_step": 38549, "epoch": 318} {"train_loss": -33.459815979003906, "global_step": 38550, "epoch": 318} {"train_loss": -33.29013442993164, "global_step": 38551, "epoch": 318} {"train_loss": -33.52187728881836, "global_step": 38552, "epoch": 318} {"train_loss": -32.79008483886719, "global_step": 38553, "epoch": 318} {"train_loss": -33.31234359741211, "global_step": 38554, "epoch": 318} {"train_loss": -34.27972412109375, "global_step": 38555, "epoch": 318} {"train_loss": -34.102989196777344, "global_step": 38556, "epoch": 318} {"train_loss": -33.656288146972656, "global_step": 38557, "epoch": 318} {"train_loss": -33.30913162231445, "global_step": 38558, "epoch": 318} {"train_loss": -32.11802291870117, "global_step": 38559, "epoch": 318} {"train_loss": -32.419185638427734, "global_step": 38560, "epoch": 318} {"train_loss": -33.38945388793945, "global_step": 38561, "epoch": 318} {"train_loss": -33.99721145629883, "global_step": 38562, "epoch": 318} {"train_loss": -34.14350891113281, "global_step": 38563, "epoch": 318} {"train_loss": -33.741981506347656, "global_step": 38564, "epoch": 318} {"train_loss": -34.503623962402344, "global_step": 38565, "epoch": 318} {"train_loss": -34.63715744018555, "global_step": 38566, "epoch": 318} {"train_loss": -34.36345291137695, "global_step": 38567, "epoch": 318} {"train_loss": -33.173213958740234, "global_step": 38568, "epoch": 318} {"train_loss": -33.89674758911133, "global_step": 38569, "epoch": 318} {"train_loss": -33.850040435791016, "global_step": 38570, "epoch": 318} {"train_loss": -34.151790618896484, "global_step": 38571, "epoch": 318} {"train_loss": -34.4625129699707, "global_step": 38572, "epoch": 318} {"train_loss": -34.02497482299805, "global_step": 38573, "epoch": 318} {"train_loss": -34.04084396362305, "global_step": 38574, "epoch": 318} {"train_loss": -34.29903793334961, "global_step": 38575, "epoch": 318} {"train_loss": -34.45180892944336, "global_step": 38576, "epoch": 318} {"train_loss": -33.71582794189453, "global_step": 38577, "epoch": 318} {"train_loss": -34.75834274291992, "global_step": 38578, "epoch": 318} {"train_loss": -33.98774337768555, "global_step": 38579, "epoch": 318} {"train_loss": -33.87923049926758, "global_step": 38580, "epoch": 318} {"train_loss": -34.691036224365234, "global_step": 38581, "epoch": 318} {"train_loss": -33.969337463378906, "global_step": 38582, "epoch": 318} {"train_loss": -35.20552444458008, "global_step": 38583, "epoch": 318} {"train_loss": -33.923038482666016, "global_step": 38584, "epoch": 318} {"train_loss": -34.2861328125, "global_step": 38585, "epoch": 318} {"train_loss": -34.09267044067383, "global_step": 38586, "epoch": 318} {"train_loss": -34.42506790161133, "global_step": 38587, "epoch": 318} {"train_loss": -34.240474700927734, "global_step": 38588, "epoch": 318} {"train_loss": -35.01682662963867, "global_step": 38589, "epoch": 318} {"train_loss": -34.8834114074707, "global_step": 38590, "epoch": 318} {"train_loss": -34.45967483520508, "global_step": 38591, "epoch": 318} {"train_loss": -33.828792572021484, "global_step": 38592, "epoch": 318} {"train_loss": -34.20683288574219, "global_step": 38593, "epoch": 318} {"train_loss": -33.37273025512695, "global_step": 38594, "epoch": 318} {"train_loss": -33.565372467041016, "global_step": 38595, "epoch": 318} {"train_loss": -34.2369384765625, "global_step": 38596, "epoch": 318} {"train_loss": -34.32878112792969, "global_step": 38597, "epoch": 318} {"train_loss": -33.723571667001266, "global_step": 38598, "epoch": 318, "val_loss": 2530307.0} {"train_loss": -34.13628005981445, "global_step": 38599, "epoch": 319} {"train_loss": -34.29301452636719, "global_step": 38600, "epoch": 319} {"train_loss": -34.75791931152344, "global_step": 38601, "epoch": 319} {"train_loss": -33.97334671020508, "global_step": 38602, "epoch": 319} {"train_loss": -33.41372299194336, "global_step": 38603, "epoch": 319} {"train_loss": -33.81966018676758, "global_step": 38604, "epoch": 319} {"train_loss": -33.4586067199707, "global_step": 38605, "epoch": 319} {"train_loss": -34.28771209716797, "global_step": 38606, "epoch": 319} {"train_loss": -34.07993698120117, "global_step": 38607, "epoch": 319} {"train_loss": -31.139379501342773, "global_step": 38608, "epoch": 319} {"train_loss": -28.273923873901367, "global_step": 38609, "epoch": 319} {"train_loss": -29.493427276611328, "global_step": 38610, "epoch": 319} {"train_loss": -33.54033279418945, "global_step": 38611, "epoch": 319} {"train_loss": -31.590362548828125, "global_step": 38612, "epoch": 319} {"train_loss": -29.28995704650879, "global_step": 38613, "epoch": 319} {"train_loss": -29.603830337524414, "global_step": 38614, "epoch": 319} {"train_loss": -33.14918899536133, "global_step": 38615, "epoch": 319} {"train_loss": -31.347761154174805, "global_step": 38616, "epoch": 319} {"train_loss": -30.750946044921875, "global_step": 38617, "epoch": 319} {"train_loss": -32.155723571777344, "global_step": 38618, "epoch": 319} {"train_loss": -31.223072052001953, "global_step": 38619, "epoch": 319} {"train_loss": -32.51685333251953, "global_step": 38620, "epoch": 319} {"train_loss": -32.709754943847656, "global_step": 38621, "epoch": 319} {"train_loss": -32.3860969543457, "global_step": 38622, "epoch": 319} {"train_loss": -32.71383285522461, "global_step": 38623, "epoch": 319} {"train_loss": -32.90999984741211, "global_step": 38624, "epoch": 319} {"train_loss": -32.69147872924805, "global_step": 38625, "epoch": 319} {"train_loss": -33.301326751708984, "global_step": 38626, "epoch": 319} {"train_loss": -32.588470458984375, "global_step": 38627, "epoch": 319} {"train_loss": -32.42975616455078, "global_step": 38628, "epoch": 319} {"train_loss": -33.667598724365234, "global_step": 38629, "epoch": 319} {"train_loss": -32.47792434692383, "global_step": 38630, "epoch": 319} {"train_loss": -33.172367095947266, "global_step": 38631, "epoch": 319} {"train_loss": -33.371543884277344, "global_step": 38632, "epoch": 319} {"train_loss": -33.39942169189453, "global_step": 38633, "epoch": 319} {"train_loss": -33.921722412109375, "global_step": 38634, "epoch": 319} {"train_loss": -31.968719482421875, "global_step": 38635, "epoch": 319} {"train_loss": -33.623939514160156, "global_step": 38636, "epoch": 319} {"train_loss": -32.722957611083984, "global_step": 38637, "epoch": 319} {"train_loss": -33.002220153808594, "global_step": 38638, "epoch": 319} {"train_loss": -33.14822006225586, "global_step": 38639, "epoch": 319} {"train_loss": -33.86806869506836, "global_step": 38640, "epoch": 319} {"train_loss": -33.778987884521484, "global_step": 38641, "epoch": 319} {"train_loss": -33.91720199584961, "global_step": 38642, "epoch": 319} {"train_loss": -33.40481185913086, "global_step": 38643, "epoch": 319} {"train_loss": -33.94770431518555, "global_step": 38644, "epoch": 319} {"train_loss": -33.96458053588867, "global_step": 38645, "epoch": 319} {"train_loss": -34.24378204345703, "global_step": 38646, "epoch": 319} {"train_loss": -33.89537048339844, "global_step": 38647, "epoch": 319} {"train_loss": -33.83846664428711, "global_step": 38648, "epoch": 319} {"train_loss": -33.39068603515625, "global_step": 38649, "epoch": 319} {"train_loss": -33.24647903442383, "global_step": 38650, "epoch": 319} {"train_loss": -33.48430633544922, "global_step": 38651, "epoch": 319} {"train_loss": -33.95039749145508, "global_step": 38652, "epoch": 319} {"train_loss": -34.16211700439453, "global_step": 38653, "epoch": 319} {"train_loss": -34.05138397216797, "global_step": 38654, "epoch": 319} {"train_loss": -34.32545471191406, "global_step": 38655, "epoch": 319} {"train_loss": -34.200767517089844, "global_step": 38656, "epoch": 319} {"train_loss": -33.97386169433594, "global_step": 38657, "epoch": 319} {"train_loss": -34.31015396118164, "global_step": 38658, "epoch": 319} {"train_loss": -34.14436340332031, "global_step": 38659, "epoch": 319} {"train_loss": -34.20172119140625, "global_step": 38660, "epoch": 319} {"train_loss": -34.47993087768555, "global_step": 38661, "epoch": 319} {"train_loss": -33.886138916015625, "global_step": 38662, "epoch": 319} {"train_loss": -34.03169631958008, "global_step": 38663, "epoch": 319} {"train_loss": -33.833744049072266, "global_step": 38664, "epoch": 319} {"train_loss": -34.394466400146484, "global_step": 38665, "epoch": 319} {"train_loss": -34.204689025878906, "global_step": 38666, "epoch": 319} {"train_loss": -33.894371032714844, "global_step": 38667, "epoch": 319} {"train_loss": -33.37800216674805, "global_step": 38668, "epoch": 319} {"train_loss": -34.329734802246094, "global_step": 38669, "epoch": 319} {"train_loss": -33.6075439453125, "global_step": 38670, "epoch": 319} {"train_loss": -33.53773880004883, "global_step": 38671, "epoch": 319} {"train_loss": -33.98030471801758, "global_step": 38672, "epoch": 319} {"train_loss": -33.7268180847168, "global_step": 38673, "epoch": 319} {"train_loss": -34.37384033203125, "global_step": 38674, "epoch": 319} {"train_loss": -34.06536865234375, "global_step": 38675, "epoch": 319} {"train_loss": -33.817501068115234, "global_step": 38676, "epoch": 319} {"train_loss": -34.360687255859375, "global_step": 38677, "epoch": 319} {"train_loss": -33.57255935668945, "global_step": 38678, "epoch": 319} {"train_loss": -33.52630615234375, "global_step": 38679, "epoch": 319} {"train_loss": -30.194915771484375, "global_step": 38680, "epoch": 319} {"train_loss": -25.00033950805664, "global_step": 38681, "epoch": 319} {"train_loss": -25.891271591186523, "global_step": 38682, "epoch": 319} {"train_loss": -28.041528701782227, "global_step": 38683, "epoch": 319} {"train_loss": -32.36153030395508, "global_step": 38684, "epoch": 319} {"train_loss": -31.97859001159668, "global_step": 38685, "epoch": 319} {"train_loss": -31.699941635131836, "global_step": 38686, "epoch": 319} {"train_loss": -33.5252799987793, "global_step": 38687, "epoch": 319} {"train_loss": -32.57533645629883, "global_step": 38688, "epoch": 319} {"train_loss": -32.97648239135742, "global_step": 38689, "epoch": 319} {"train_loss": -33.589176177978516, "global_step": 38690, "epoch": 319} {"train_loss": -33.51465606689453, "global_step": 38691, "epoch": 319} {"train_loss": -33.44271469116211, "global_step": 38692, "epoch": 319} {"train_loss": -32.92026901245117, "global_step": 38693, "epoch": 319} {"train_loss": -31.4881591796875, "global_step": 38694, "epoch": 319} {"train_loss": -33.75326156616211, "global_step": 38695, "epoch": 319} {"train_loss": -33.245235443115234, "global_step": 38696, "epoch": 319} {"train_loss": -34.00917434692383, "global_step": 38697, "epoch": 319} {"train_loss": -33.23942184448242, "global_step": 38698, "epoch": 319} {"train_loss": -34.029296875, "global_step": 38699, "epoch": 319} {"train_loss": -33.96183395385742, "global_step": 38700, "epoch": 319} {"train_loss": -34.26432418823242, "global_step": 38701, "epoch": 319} {"train_loss": -34.27347183227539, "global_step": 38702, "epoch": 319} {"train_loss": -33.735626220703125, "global_step": 38703, "epoch": 319} {"train_loss": -34.25715637207031, "global_step": 38704, "epoch": 319} {"train_loss": -34.30786895751953, "global_step": 38705, "epoch": 319} {"train_loss": -34.1803092956543, "global_step": 38706, "epoch": 319} {"train_loss": -33.68169021606445, "global_step": 38707, "epoch": 319} {"train_loss": -33.67545700073242, "global_step": 38708, "epoch": 319} {"train_loss": -34.059261322021484, "global_step": 38709, "epoch": 319} {"train_loss": -34.248260498046875, "global_step": 38710, "epoch": 319} {"train_loss": -33.803253173828125, "global_step": 38711, "epoch": 319} {"train_loss": -34.35931396484375, "global_step": 38712, "epoch": 319} {"train_loss": -34.00831604003906, "global_step": 38713, "epoch": 319} {"train_loss": -33.44651412963867, "global_step": 38714, "epoch": 319} {"train_loss": -34.38718032836914, "global_step": 38715, "epoch": 319} {"train_loss": -34.130672454833984, "global_step": 38716, "epoch": 319} {"train_loss": -34.43636703491211, "global_step": 38717, "epoch": 319} {"train_loss": -34.199886322021484, "global_step": 38718, "epoch": 319} {"train_loss": -33.157516652887516, "global_step": 38719, "epoch": 319, "val_loss": 2455268.75} {"train_loss": -33.109352111816406, "global_step": 38720, "epoch": 320} {"train_loss": -30.763586044311523, "global_step": 38721, "epoch": 320} {"train_loss": -29.78028678894043, "global_step": 38722, "epoch": 320} {"train_loss": -27.997543334960938, "global_step": 38723, "epoch": 320} {"train_loss": -26.725027084350586, "global_step": 38724, "epoch": 320} {"train_loss": -31.00800132751465, "global_step": 38725, "epoch": 320} {"train_loss": -33.04542541503906, "global_step": 38726, "epoch": 320} {"train_loss": -32.64616012573242, "global_step": 38727, "epoch": 320} {"train_loss": -33.35321807861328, "global_step": 38728, "epoch": 320} {"train_loss": -32.4681510925293, "global_step": 38729, "epoch": 320} {"train_loss": -31.64676856994629, "global_step": 38730, "epoch": 320} {"train_loss": -34.18512725830078, "global_step": 38731, "epoch": 320} {"train_loss": -32.68488693237305, "global_step": 38732, "epoch": 320} {"train_loss": -33.718929290771484, "global_step": 38733, "epoch": 320} {"train_loss": -32.52427291870117, "global_step": 38734, "epoch": 320} {"train_loss": -33.7008056640625, "global_step": 38735, "epoch": 320} {"train_loss": -32.66627883911133, "global_step": 38736, "epoch": 320} {"train_loss": -32.978031158447266, "global_step": 38737, "epoch": 320} {"train_loss": -33.572505950927734, "global_step": 38738, "epoch": 320} {"train_loss": -33.24534225463867, "global_step": 38739, "epoch": 320} {"train_loss": -32.85836410522461, "global_step": 38740, "epoch": 320} {"train_loss": -32.650203704833984, "global_step": 38741, "epoch": 320} {"train_loss": -33.70011520385742, "global_step": 38742, "epoch": 320} {"train_loss": -32.70689010620117, "global_step": 38743, "epoch": 320} {"train_loss": -32.53654861450195, "global_step": 38744, "epoch": 320} {"train_loss": -33.97883987426758, "global_step": 38745, "epoch": 320} {"train_loss": -32.50679016113281, "global_step": 38746, "epoch": 320} {"train_loss": -32.53388595581055, "global_step": 38747, "epoch": 320} {"train_loss": -32.807891845703125, "global_step": 38748, "epoch": 320} {"train_loss": -32.96112823486328, "global_step": 38749, "epoch": 320} {"train_loss": -30.6744384765625, "global_step": 38750, "epoch": 320} {"train_loss": -29.09528923034668, "global_step": 38751, "epoch": 320} {"train_loss": -29.676252365112305, "global_step": 38752, "epoch": 320} {"train_loss": -25.161405563354492, "global_step": 38753, "epoch": 320} {"train_loss": -31.14166259765625, "global_step": 38754, "epoch": 320} {"train_loss": -28.80763053894043, "global_step": 38755, "epoch": 320} {"train_loss": -29.72059440612793, "global_step": 38756, "epoch": 320} {"train_loss": -28.45330810546875, "global_step": 38757, "epoch": 320} {"train_loss": -30.335498809814453, "global_step": 38758, "epoch": 320} {"train_loss": -29.92742347717285, "global_step": 38759, "epoch": 320} {"train_loss": -31.6165828704834, "global_step": 38760, "epoch": 320} {"train_loss": -29.59451675415039, "global_step": 38761, "epoch": 320} {"train_loss": -30.338455200195312, "global_step": 38762, "epoch": 320} {"train_loss": -31.6409912109375, "global_step": 38763, "epoch": 320} {"train_loss": -31.230966567993164, "global_step": 38764, "epoch": 320} {"train_loss": -32.44350051879883, "global_step": 38765, "epoch": 320} {"train_loss": -31.654233932495117, "global_step": 38766, "epoch": 320} {"train_loss": -31.006887435913086, "global_step": 38767, "epoch": 320} {"train_loss": -30.752731323242188, "global_step": 38768, "epoch": 320} {"train_loss": -31.773773193359375, "global_step": 38769, "epoch": 320} {"train_loss": -31.738882064819336, "global_step": 38770, "epoch": 320} {"train_loss": -31.648483276367188, "global_step": 38771, "epoch": 320} {"train_loss": -31.851438522338867, "global_step": 38772, "epoch": 320} {"train_loss": -31.873498916625977, "global_step": 38773, "epoch": 320} {"train_loss": -32.07137680053711, "global_step": 38774, "epoch": 320} {"train_loss": -31.726186752319336, "global_step": 38775, "epoch": 320} {"train_loss": -32.132442474365234, "global_step": 38776, "epoch": 320} {"train_loss": -32.2552375793457, "global_step": 38777, "epoch": 320} {"train_loss": -32.21452331542969, "global_step": 38778, "epoch": 320} {"train_loss": -32.36103439331055, "global_step": 38779, "epoch": 320} {"train_loss": -32.15876388549805, "global_step": 38780, "epoch": 320} {"train_loss": -32.680397033691406, "global_step": 38781, "epoch": 320} {"train_loss": -32.391780853271484, "global_step": 38782, "epoch": 320} {"train_loss": -32.07363510131836, "global_step": 38783, "epoch": 320} {"train_loss": -32.3692741394043, "global_step": 38784, "epoch": 320} {"train_loss": -31.879409790039062, "global_step": 38785, "epoch": 320} {"train_loss": -32.879329681396484, "global_step": 38786, "epoch": 320} {"train_loss": -32.683650970458984, "global_step": 38787, "epoch": 320} {"train_loss": -32.82301330566406, "global_step": 38788, "epoch": 320} {"train_loss": -32.69645690917969, "global_step": 38789, "epoch": 320} {"train_loss": -32.23990249633789, "global_step": 38790, "epoch": 320} {"train_loss": -32.170963287353516, "global_step": 38791, "epoch": 320} {"train_loss": -33.128997802734375, "global_step": 38792, "epoch": 320} {"train_loss": -33.31056213378906, "global_step": 38793, "epoch": 320} {"train_loss": -32.980064392089844, "global_step": 38794, "epoch": 320} {"train_loss": -32.86444091796875, "global_step": 38795, "epoch": 320} {"train_loss": -32.9056282043457, "global_step": 38796, "epoch": 320} {"train_loss": -32.54309844970703, "global_step": 38797, "epoch": 320} {"train_loss": -32.56895065307617, "global_step": 38798, "epoch": 320} {"train_loss": -31.966693878173828, "global_step": 38799, "epoch": 320} {"train_loss": -31.909204483032227, "global_step": 38800, "epoch": 320} {"train_loss": -32.58002471923828, "global_step": 38801, "epoch": 320} {"train_loss": -33.14829635620117, "global_step": 38802, "epoch": 320} {"train_loss": -32.98161697387695, "global_step": 38803, "epoch": 320} {"train_loss": -32.476505279541016, "global_step": 38804, "epoch": 320} {"train_loss": -31.528079986572266, "global_step": 38805, "epoch": 320} {"train_loss": -33.25249099731445, "global_step": 38806, "epoch": 320} {"train_loss": -33.728981018066406, "global_step": 38807, "epoch": 320} {"train_loss": -33.060035705566406, "global_step": 38808, "epoch": 320} {"train_loss": -33.47353744506836, "global_step": 38809, "epoch": 320} {"train_loss": -33.011260986328125, "global_step": 38810, "epoch": 320} {"train_loss": -33.55183029174805, "global_step": 38811, "epoch": 320} {"train_loss": -33.72799301147461, "global_step": 38812, "epoch": 320} {"train_loss": -33.81037521362305, "global_step": 38813, "epoch": 320} {"train_loss": -33.144344329833984, "global_step": 38814, "epoch": 320} {"train_loss": -33.76815414428711, "global_step": 38815, "epoch": 320} {"train_loss": -33.96302032470703, "global_step": 38816, "epoch": 320} {"train_loss": -33.76205062866211, "global_step": 38817, "epoch": 320} {"train_loss": -33.2581787109375, "global_step": 38818, "epoch": 320} {"train_loss": -33.842472076416016, "global_step": 38819, "epoch": 320} {"train_loss": -33.4775390625, "global_step": 38820, "epoch": 320} {"train_loss": -33.97220993041992, "global_step": 38821, "epoch": 320} {"train_loss": -34.13362503051758, "global_step": 38822, "epoch": 320} {"train_loss": -34.13935470581055, "global_step": 38823, "epoch": 320} {"train_loss": -33.79585647583008, "global_step": 38824, "epoch": 320} {"train_loss": -32.879676818847656, "global_step": 38825, "epoch": 320} {"train_loss": -34.03224563598633, "global_step": 38826, "epoch": 320} {"train_loss": -33.73248291015625, "global_step": 38827, "epoch": 320} {"train_loss": -34.0207633972168, "global_step": 38828, "epoch": 320} {"train_loss": -34.097652435302734, "global_step": 38829, "epoch": 320} {"train_loss": -34.14743423461914, "global_step": 38830, "epoch": 320} {"train_loss": -34.2095832824707, "global_step": 38831, "epoch": 320} {"train_loss": -34.2469367980957, "global_step": 38832, "epoch": 320} {"train_loss": -34.117530822753906, "global_step": 38833, "epoch": 320} {"train_loss": -33.945091247558594, "global_step": 38834, "epoch": 320} {"train_loss": -34.016780853271484, "global_step": 38835, "epoch": 320} {"train_loss": -33.104736328125, "global_step": 38836, "epoch": 320} {"train_loss": -34.16120529174805, "global_step": 38837, "epoch": 320} {"train_loss": -32.96415328979492, "global_step": 38838, "epoch": 320} {"train_loss": -33.60479736328125, "global_step": 38839, "epoch": 320} {"train_loss": -32.41375527500121, "global_step": 38840, "epoch": 320, "val_loss": 2568753.25} {"train_loss": -32.55202102661133, "global_step": 38841, "epoch": 321} {"train_loss": -21.079721450805664, "global_step": 38842, "epoch": 321} {"train_loss": -30.617080688476562, "global_step": 38843, "epoch": 321} {"train_loss": -32.853065490722656, "global_step": 38844, "epoch": 321} {"train_loss": -27.213972091674805, "global_step": 38845, "epoch": 321} {"train_loss": -26.21040916442871, "global_step": 38846, "epoch": 321} {"train_loss": -27.4891357421875, "global_step": 38847, "epoch": 321} {"train_loss": -24.467309951782227, "global_step": 38848, "epoch": 321} {"train_loss": -24.86386489868164, "global_step": 38849, "epoch": 321} {"train_loss": -28.451242446899414, "global_step": 38850, "epoch": 321} {"train_loss": -29.705961227416992, "global_step": 38851, "epoch": 321} {"train_loss": -28.232603073120117, "global_step": 38852, "epoch": 321} {"train_loss": -29.57301139831543, "global_step": 38853, "epoch": 321} {"train_loss": -29.82551383972168, "global_step": 38854, "epoch": 321} {"train_loss": -29.09792137145996, "global_step": 38855, "epoch": 321} {"train_loss": -28.4034423828125, "global_step": 38856, "epoch": 321} {"train_loss": -28.835012435913086, "global_step": 38857, "epoch": 321} {"train_loss": -31.502050399780273, "global_step": 38858, "epoch": 321} {"train_loss": -29.347070693969727, "global_step": 38859, "epoch": 321} {"train_loss": -31.0465087890625, "global_step": 38860, "epoch": 321} {"train_loss": -29.33827018737793, "global_step": 38861, "epoch": 321} {"train_loss": -30.355167388916016, "global_step": 38862, "epoch": 321} {"train_loss": -29.695240020751953, "global_step": 38863, "epoch": 321} {"train_loss": -30.526330947875977, "global_step": 38864, "epoch": 321} {"train_loss": -30.005659103393555, "global_step": 38865, "epoch": 321} {"train_loss": -30.938093185424805, "global_step": 38866, "epoch": 321} {"train_loss": -30.489599227905273, "global_step": 38867, "epoch": 321} {"train_loss": -30.947858810424805, "global_step": 38868, "epoch": 321} {"train_loss": -30.207462310791016, "global_step": 38869, "epoch": 321} {"train_loss": -31.5408935546875, "global_step": 38870, "epoch": 321} {"train_loss": -31.18863868713379, "global_step": 38871, "epoch": 321} {"train_loss": -31.268451690673828, "global_step": 38872, "epoch": 321} {"train_loss": -31.82822036743164, "global_step": 38873, "epoch": 321} {"train_loss": -31.751068115234375, "global_step": 38874, "epoch": 321} {"train_loss": -31.218408584594727, "global_step": 38875, "epoch": 321} {"train_loss": -31.552631378173828, "global_step": 38876, "epoch": 321} {"train_loss": -31.53948974609375, "global_step": 38877, "epoch": 321} {"train_loss": -31.752416610717773, "global_step": 38878, "epoch": 321} {"train_loss": -31.5964298248291, "global_step": 38879, "epoch": 321} {"train_loss": -31.417724609375, "global_step": 38880, "epoch": 321} {"train_loss": -31.48691749572754, "global_step": 38881, "epoch": 321} {"train_loss": -31.9464111328125, "global_step": 38882, "epoch": 321} {"train_loss": -32.00347137451172, "global_step": 38883, "epoch": 321} {"train_loss": -31.872406005859375, "global_step": 38884, "epoch": 321} {"train_loss": -31.995901107788086, "global_step": 38885, "epoch": 321} {"train_loss": -32.4034538269043, "global_step": 38886, "epoch": 321} {"train_loss": -32.18879318237305, "global_step": 38887, "epoch": 321} {"train_loss": -32.48214340209961, "global_step": 38888, "epoch": 321} {"train_loss": -32.52421188354492, "global_step": 38889, "epoch": 321} {"train_loss": -31.956430435180664, "global_step": 38890, "epoch": 321} {"train_loss": -32.536720275878906, "global_step": 38891, "epoch": 321} {"train_loss": -32.45084762573242, "global_step": 38892, "epoch": 321} {"train_loss": -32.82985305786133, "global_step": 38893, "epoch": 321} {"train_loss": -32.72300338745117, "global_step": 38894, "epoch": 321} {"train_loss": -32.75758743286133, "global_step": 38895, "epoch": 321} {"train_loss": -32.10639572143555, "global_step": 38896, "epoch": 321} {"train_loss": -32.8243522644043, "global_step": 38897, "epoch": 321} {"train_loss": -32.93357467651367, "global_step": 38898, "epoch": 321} {"train_loss": -33.07611846923828, "global_step": 38899, "epoch": 321} {"train_loss": -32.778621673583984, "global_step": 38900, "epoch": 321} {"train_loss": -32.6160888671875, "global_step": 38901, "epoch": 321} {"train_loss": -32.461700439453125, "global_step": 38902, "epoch": 321} {"train_loss": -32.85592269897461, "global_step": 38903, "epoch": 321} {"train_loss": -33.16443634033203, "global_step": 38904, "epoch": 321} {"train_loss": -32.91341018676758, "global_step": 38905, "epoch": 321} {"train_loss": -33.819332122802734, "global_step": 38906, "epoch": 321} {"train_loss": -33.117835998535156, "global_step": 38907, "epoch": 321} {"train_loss": -33.531002044677734, "global_step": 38908, "epoch": 321} {"train_loss": -33.23482894897461, "global_step": 38909, "epoch": 321} {"train_loss": -33.35402297973633, "global_step": 38910, "epoch": 321} {"train_loss": -32.73185729980469, "global_step": 38911, "epoch": 321} {"train_loss": -31.799142837524414, "global_step": 38912, "epoch": 321} {"train_loss": -30.0887508392334, "global_step": 38913, "epoch": 321} {"train_loss": -24.353492736816406, "global_step": 38914, "epoch": 321} {"train_loss": -19.925994873046875, "global_step": 38915, "epoch": 321} {"train_loss": -22.38568687438965, "global_step": 38916, "epoch": 321} {"train_loss": -29.463621139526367, "global_step": 38917, "epoch": 321} {"train_loss": -32.27023696899414, "global_step": 38918, "epoch": 321} {"train_loss": -30.448047637939453, "global_step": 38919, "epoch": 321} {"train_loss": -32.15275955200195, "global_step": 38920, "epoch": 321} {"train_loss": -30.315643310546875, "global_step": 38921, "epoch": 321} {"train_loss": -32.10744857788086, "global_step": 38922, "epoch": 321} {"train_loss": -31.766620635986328, "global_step": 38923, "epoch": 321} {"train_loss": -32.349239349365234, "global_step": 38924, "epoch": 321} {"train_loss": -32.96592330932617, "global_step": 38925, "epoch": 321} {"train_loss": -32.16614532470703, "global_step": 38926, "epoch": 321} {"train_loss": -33.2324333190918, "global_step": 38927, "epoch": 321} {"train_loss": -32.69957733154297, "global_step": 38928, "epoch": 321} {"train_loss": -32.95547103881836, "global_step": 38929, "epoch": 321} {"train_loss": -33.573219299316406, "global_step": 38930, "epoch": 321} {"train_loss": -32.961341857910156, "global_step": 38931, "epoch": 321} {"train_loss": -33.15801239013672, "global_step": 38932, "epoch": 321} {"train_loss": -33.71314239501953, "global_step": 38933, "epoch": 321} {"train_loss": -32.816890716552734, "global_step": 38934, "epoch": 321} {"train_loss": -33.64005661010742, "global_step": 38935, "epoch": 321} {"train_loss": -32.660491943359375, "global_step": 38936, "epoch": 321} {"train_loss": -32.372859954833984, "global_step": 38937, "epoch": 321} {"train_loss": -33.9387092590332, "global_step": 38938, "epoch": 321} {"train_loss": -33.55255126953125, "global_step": 38939, "epoch": 321} {"train_loss": -33.75094223022461, "global_step": 38940, "epoch": 321} {"train_loss": -33.74317932128906, "global_step": 38941, "epoch": 321} {"train_loss": -33.10346603393555, "global_step": 38942, "epoch": 321} {"train_loss": -33.87665557861328, "global_step": 38943, "epoch": 321} {"train_loss": -33.11234664916992, "global_step": 38944, "epoch": 321} {"train_loss": -33.2109260559082, "global_step": 38945, "epoch": 321} {"train_loss": -33.681854248046875, "global_step": 38946, "epoch": 321} {"train_loss": -33.8006706237793, "global_step": 38947, "epoch": 321} {"train_loss": -33.3389778137207, "global_step": 38948, "epoch": 321} {"train_loss": -33.97930908203125, "global_step": 38949, "epoch": 321} {"train_loss": -33.80833053588867, "global_step": 38950, "epoch": 321} {"train_loss": -33.99320602416992, "global_step": 38951, "epoch": 321} {"train_loss": -34.18986129760742, "global_step": 38952, "epoch": 321} {"train_loss": -34.06373977661133, "global_step": 38953, "epoch": 321} {"train_loss": -34.13377380371094, "global_step": 38954, "epoch": 321} {"train_loss": -33.18621063232422, "global_step": 38955, "epoch": 321} {"train_loss": -33.789188385009766, "global_step": 38956, "epoch": 321} {"train_loss": -33.890621185302734, "global_step": 38957, "epoch": 321} {"train_loss": -33.71033477783203, "global_step": 38958, "epoch": 321} {"train_loss": -34.28431701660156, "global_step": 38959, "epoch": 321} {"train_loss": -33.61483383178711, "global_step": 38960, "epoch": 321} {"train_loss": -31.57277181325865, "global_step": 38961, "epoch": 321, "val_loss": 2543277.0} {"train_loss": -33.1102294921875, "global_step": 38962, "epoch": 322} {"train_loss": -33.82661819458008, "global_step": 38963, "epoch": 322} {"train_loss": -33.4687385559082, "global_step": 38964, "epoch": 322} {"train_loss": -32.96763229370117, "global_step": 38965, "epoch": 322} {"train_loss": -34.46232986450195, "global_step": 38966, "epoch": 322} {"train_loss": -33.77565002441406, "global_step": 38967, "epoch": 322} {"train_loss": -32.42938232421875, "global_step": 38968, "epoch": 322} {"train_loss": -34.207157135009766, "global_step": 38969, "epoch": 322} {"train_loss": -33.75120162963867, "global_step": 38970, "epoch": 322} {"train_loss": -33.906585693359375, "global_step": 38971, "epoch": 322} {"train_loss": -33.578338623046875, "global_step": 38972, "epoch": 322} {"train_loss": -33.447975158691406, "global_step": 38973, "epoch": 322} {"train_loss": -33.243675231933594, "global_step": 38974, "epoch": 322} {"train_loss": -33.94851303100586, "global_step": 38975, "epoch": 322} {"train_loss": -33.7823486328125, "global_step": 38976, "epoch": 322} {"train_loss": -33.81882858276367, "global_step": 38977, "epoch": 322} {"train_loss": -33.16291809082031, "global_step": 38978, "epoch": 322} {"train_loss": -33.74700927734375, "global_step": 38979, "epoch": 322} {"train_loss": -33.2260856628418, "global_step": 38980, "epoch": 322} {"train_loss": -33.025634765625, "global_step": 38981, "epoch": 322} {"train_loss": -32.17259979248047, "global_step": 38982, "epoch": 322} {"train_loss": -32.477996826171875, "global_step": 38983, "epoch": 322} {"train_loss": -33.76758575439453, "global_step": 38984, "epoch": 322} {"train_loss": -33.635963439941406, "global_step": 38985, "epoch": 322} {"train_loss": -33.15132141113281, "global_step": 38986, "epoch": 322} {"train_loss": -33.063175201416016, "global_step": 38987, "epoch": 322} {"train_loss": -33.17537307739258, "global_step": 38988, "epoch": 322} {"train_loss": -33.616485595703125, "global_step": 38989, "epoch": 322} {"train_loss": -32.77622604370117, "global_step": 38990, "epoch": 322} {"train_loss": -33.6522102355957, "global_step": 38991, "epoch": 322} {"train_loss": -33.54836654663086, "global_step": 38992, "epoch": 322} {"train_loss": -33.30819320678711, "global_step": 38993, "epoch": 322} {"train_loss": -33.603878021240234, "global_step": 38994, "epoch": 322} {"train_loss": -33.009952545166016, "global_step": 38995, "epoch": 322} {"train_loss": -32.570777893066406, "global_step": 38996, "epoch": 322} {"train_loss": -32.10966491699219, "global_step": 38997, "epoch": 322} {"train_loss": -33.020206451416016, "global_step": 38998, "epoch": 322} {"train_loss": -33.00653076171875, "global_step": 38999, "epoch": 322} {"train_loss": -33.47412872314453, "global_step": 39000, "epoch": 322} {"train_loss": -33.565067291259766, "global_step": 39001, "epoch": 322} {"train_loss": -32.9356803894043, "global_step": 39002, "epoch": 322} {"train_loss": -33.32845687866211, "global_step": 39003, "epoch": 322} {"train_loss": -33.53156661987305, "global_step": 39004, "epoch": 322} {"train_loss": -33.15720748901367, "global_step": 39005, "epoch": 322} {"train_loss": -33.22793197631836, "global_step": 39006, "epoch": 322} {"train_loss": -33.702239990234375, "global_step": 39007, "epoch": 322} {"train_loss": -32.137447357177734, "global_step": 39008, "epoch": 322} {"train_loss": -32.424842834472656, "global_step": 39009, "epoch": 322} {"train_loss": -33.382904052734375, "global_step": 39010, "epoch": 322} {"train_loss": -33.7658576965332, "global_step": 39011, "epoch": 322} {"train_loss": -34.270973205566406, "global_step": 39012, "epoch": 322} {"train_loss": -33.520668029785156, "global_step": 39013, "epoch": 322} {"train_loss": -32.944217681884766, "global_step": 39014, "epoch": 322} {"train_loss": -32.77142333984375, "global_step": 39015, "epoch": 322} {"train_loss": -33.868614196777344, "global_step": 39016, "epoch": 322} {"train_loss": -34.22231674194336, "global_step": 39017, "epoch": 322} {"train_loss": -33.49736022949219, "global_step": 39018, "epoch": 322} {"train_loss": -33.756771087646484, "global_step": 39019, "epoch": 322} {"train_loss": -33.09809875488281, "global_step": 39020, "epoch": 322} {"train_loss": -33.42500686645508, "global_step": 39021, "epoch": 322} {"train_loss": -34.13505935668945, "global_step": 39022, "epoch": 322} {"train_loss": -33.166439056396484, "global_step": 39023, "epoch": 322} {"train_loss": -32.8998908996582, "global_step": 39024, "epoch": 322} {"train_loss": -33.44417190551758, "global_step": 39025, "epoch": 322} {"train_loss": -33.69013214111328, "global_step": 39026, "epoch": 322} {"train_loss": -33.886566162109375, "global_step": 39027, "epoch": 322} {"train_loss": -33.26336669921875, "global_step": 39028, "epoch": 322} {"train_loss": -33.13661193847656, "global_step": 39029, "epoch": 322} {"train_loss": -34.453704833984375, "global_step": 39030, "epoch": 322} {"train_loss": -33.69907760620117, "global_step": 39031, "epoch": 322} {"train_loss": -34.429317474365234, "global_step": 39032, "epoch": 322} {"train_loss": -34.181941986083984, "global_step": 39033, "epoch": 322} {"train_loss": -33.713314056396484, "global_step": 39034, "epoch": 322} {"train_loss": -34.31044387817383, "global_step": 39035, "epoch": 322} {"train_loss": -34.219451904296875, "global_step": 39036, "epoch": 322} {"train_loss": -33.96596908569336, "global_step": 39037, "epoch": 322} {"train_loss": -34.16697311401367, "global_step": 39038, "epoch": 322} {"train_loss": -34.532955169677734, "global_step": 39039, "epoch": 322} {"train_loss": -33.31654357910156, "global_step": 39040, "epoch": 322} {"train_loss": -32.677486419677734, "global_step": 39041, "epoch": 322} {"train_loss": -30.895843505859375, "global_step": 39042, "epoch": 322} {"train_loss": -31.947437286376953, "global_step": 39043, "epoch": 322} {"train_loss": -34.02580642700195, "global_step": 39044, "epoch": 322} {"train_loss": -34.04914093017578, "global_step": 39045, "epoch": 322} {"train_loss": -33.621307373046875, "global_step": 39046, "epoch": 322} {"train_loss": -32.503936767578125, "global_step": 39047, "epoch": 322} {"train_loss": -33.27122116088867, "global_step": 39048, "epoch": 322} {"train_loss": -34.300838470458984, "global_step": 39049, "epoch": 322} {"train_loss": -33.64548110961914, "global_step": 39050, "epoch": 322} {"train_loss": -33.5368537902832, "global_step": 39051, "epoch": 322} {"train_loss": -34.67089080810547, "global_step": 39052, "epoch": 322} {"train_loss": -33.13444900512695, "global_step": 39053, "epoch": 322} {"train_loss": -34.494476318359375, "global_step": 39054, "epoch": 322} {"train_loss": -34.42301559448242, "global_step": 39055, "epoch": 322} {"train_loss": -33.95709991455078, "global_step": 39056, "epoch": 322} {"train_loss": -34.42213439941406, "global_step": 39057, "epoch": 322} {"train_loss": -34.40156936645508, "global_step": 39058, "epoch": 322} {"train_loss": -34.33734893798828, "global_step": 39059, "epoch": 322} {"train_loss": -34.27995681762695, "global_step": 39060, "epoch": 322} {"train_loss": -34.05663299560547, "global_step": 39061, "epoch": 322} {"train_loss": -34.67341995239258, "global_step": 39062, "epoch": 322} {"train_loss": -33.50507354736328, "global_step": 39063, "epoch": 322} {"train_loss": -33.50844955444336, "global_step": 39064, "epoch": 322} {"train_loss": -33.96114730834961, "global_step": 39065, "epoch": 322} {"train_loss": -32.9874153137207, "global_step": 39066, "epoch": 322} {"train_loss": -34.464969635009766, "global_step": 39067, "epoch": 322} {"train_loss": -33.654415130615234, "global_step": 39068, "epoch": 322} {"train_loss": -34.15118408203125, "global_step": 39069, "epoch": 322} {"train_loss": -34.36730194091797, "global_step": 39070, "epoch": 322} {"train_loss": -34.435245513916016, "global_step": 39071, "epoch": 322} {"train_loss": -33.986114501953125, "global_step": 39072, "epoch": 322} {"train_loss": -34.28385543823242, "global_step": 39073, "epoch": 322} {"train_loss": -34.692684173583984, "global_step": 39074, "epoch": 322} {"train_loss": -34.49943161010742, "global_step": 39075, "epoch": 322} {"train_loss": -34.36782455444336, "global_step": 39076, "epoch": 322} {"train_loss": -34.37625503540039, "global_step": 39077, "epoch": 322} {"train_loss": -33.83561706542969, "global_step": 39078, "epoch": 322} {"train_loss": -34.087703704833984, "global_step": 39079, "epoch": 322} {"train_loss": -34.70869445800781, "global_step": 39080, "epoch": 322} {"train_loss": -34.40067672729492, "global_step": 39081, "epoch": 322} {"train_loss": -33.614999629249255, "global_step": 39082, "epoch": 322, "val_loss": 2375198.75} {"train_loss": -34.843448638916016, "global_step": 39083, "epoch": 323} {"train_loss": -34.71700668334961, "global_step": 39084, "epoch": 323} {"train_loss": -34.88636779785156, "global_step": 39085, "epoch": 323} {"train_loss": -34.94350814819336, "global_step": 39086, "epoch": 323} {"train_loss": -34.60066223144531, "global_step": 39087, "epoch": 323} {"train_loss": -34.5091667175293, "global_step": 39088, "epoch": 323} {"train_loss": -32.09859085083008, "global_step": 39089, "epoch": 323} {"train_loss": -29.79999351501465, "global_step": 39090, "epoch": 323} {"train_loss": -25.372150421142578, "global_step": 39091, "epoch": 323} {"train_loss": -23.00312042236328, "global_step": 39092, "epoch": 323} {"train_loss": -31.718107223510742, "global_step": 39093, "epoch": 323} {"train_loss": -31.732574462890625, "global_step": 39094, "epoch": 323} {"train_loss": -32.30049514770508, "global_step": 39095, "epoch": 323} {"train_loss": -32.15719223022461, "global_step": 39096, "epoch": 323} {"train_loss": -33.4056282043457, "global_step": 39097, "epoch": 323} {"train_loss": -32.5019416809082, "global_step": 39098, "epoch": 323} {"train_loss": -33.9796028137207, "global_step": 39099, "epoch": 323} {"train_loss": -32.859493255615234, "global_step": 39100, "epoch": 323} {"train_loss": -33.67020034790039, "global_step": 39101, "epoch": 323} {"train_loss": -33.40072250366211, "global_step": 39102, "epoch": 323} {"train_loss": -32.85179138183594, "global_step": 39103, "epoch": 323} {"train_loss": -33.479713439941406, "global_step": 39104, "epoch": 323} {"train_loss": -33.41901779174805, "global_step": 39105, "epoch": 323} {"train_loss": -33.11628341674805, "global_step": 39106, "epoch": 323} {"train_loss": -33.636104583740234, "global_step": 39107, "epoch": 323} {"train_loss": -34.15133285522461, "global_step": 39108, "epoch": 323} {"train_loss": -33.84299850463867, "global_step": 39109, "epoch": 323} {"train_loss": -33.977500915527344, "global_step": 39110, "epoch": 323} {"train_loss": -33.313201904296875, "global_step": 39111, "epoch": 323} {"train_loss": -33.18024444580078, "global_step": 39112, "epoch": 323} {"train_loss": -33.486202239990234, "global_step": 39113, "epoch": 323} {"train_loss": -33.73378372192383, "global_step": 39114, "epoch": 323} {"train_loss": -33.748626708984375, "global_step": 39115, "epoch": 323} {"train_loss": -33.52155303955078, "global_step": 39116, "epoch": 323} {"train_loss": -33.35694122314453, "global_step": 39117, "epoch": 323} {"train_loss": -34.08127975463867, "global_step": 39118, "epoch": 323} {"train_loss": -33.297813415527344, "global_step": 39119, "epoch": 323} {"train_loss": -32.944793701171875, "global_step": 39120, "epoch": 323} {"train_loss": -32.75808334350586, "global_step": 39121, "epoch": 323} {"train_loss": -33.06715774536133, "global_step": 39122, "epoch": 323} {"train_loss": -33.11782455444336, "global_step": 39123, "epoch": 323} {"train_loss": -33.352046966552734, "global_step": 39124, "epoch": 323} {"train_loss": -33.258121490478516, "global_step": 39125, "epoch": 323} {"train_loss": -34.09682846069336, "global_step": 39126, "epoch": 323} {"train_loss": -33.72902297973633, "global_step": 39127, "epoch": 323} {"train_loss": -33.19472122192383, "global_step": 39128, "epoch": 323} {"train_loss": -33.588775634765625, "global_step": 39129, "epoch": 323} {"train_loss": -33.2088508605957, "global_step": 39130, "epoch": 323} {"train_loss": -33.7655029296875, "global_step": 39131, "epoch": 323} {"train_loss": -33.700347900390625, "global_step": 39132, "epoch": 323} {"train_loss": -33.5695915222168, "global_step": 39133, "epoch": 323} {"train_loss": -32.75926971435547, "global_step": 39134, "epoch": 323} {"train_loss": -32.3330192565918, "global_step": 39135, "epoch": 323} {"train_loss": -33.47664260864258, "global_step": 39136, "epoch": 323} {"train_loss": -33.856056213378906, "global_step": 39137, "epoch": 323} {"train_loss": -33.507568359375, "global_step": 39138, "epoch": 323} {"train_loss": -33.08640670776367, "global_step": 39139, "epoch": 323} {"train_loss": -33.325130462646484, "global_step": 39140, "epoch": 323} {"train_loss": -33.31181335449219, "global_step": 39141, "epoch": 323} {"train_loss": -33.668418884277344, "global_step": 39142, "epoch": 323} {"train_loss": -33.84791946411133, "global_step": 39143, "epoch": 323} {"train_loss": -33.447967529296875, "global_step": 39144, "epoch": 323} {"train_loss": -34.06313705444336, "global_step": 39145, "epoch": 323} {"train_loss": -33.596866607666016, "global_step": 39146, "epoch": 323} {"train_loss": -33.95092010498047, "global_step": 39147, "epoch": 323} {"train_loss": -33.613861083984375, "global_step": 39148, "epoch": 323} {"train_loss": -34.10631561279297, "global_step": 39149, "epoch": 323} {"train_loss": -33.932891845703125, "global_step": 39150, "epoch": 323} {"train_loss": -34.15739059448242, "global_step": 39151, "epoch": 323} {"train_loss": -32.7210693359375, "global_step": 39152, "epoch": 323} {"train_loss": -33.60445022583008, "global_step": 39153, "epoch": 323} {"train_loss": -34.318626403808594, "global_step": 39154, "epoch": 323} {"train_loss": -34.384700775146484, "global_step": 39155, "epoch": 323} {"train_loss": -33.3079719543457, "global_step": 39156, "epoch": 323} {"train_loss": -33.377071380615234, "global_step": 39157, "epoch": 323} {"train_loss": -32.99526596069336, "global_step": 39158, "epoch": 323} {"train_loss": -32.99908447265625, "global_step": 39159, "epoch": 323} {"train_loss": -33.44600296020508, "global_step": 39160, "epoch": 323} {"train_loss": -33.50291061401367, "global_step": 39161, "epoch": 323} {"train_loss": -33.868324279785156, "global_step": 39162, "epoch": 323} {"train_loss": -32.108089447021484, "global_step": 39163, "epoch": 323} {"train_loss": -31.81085777282715, "global_step": 39164, "epoch": 323} {"train_loss": -32.74339294433594, "global_step": 39165, "epoch": 323} {"train_loss": -34.01743698120117, "global_step": 39166, "epoch": 323} {"train_loss": -33.61439895629883, "global_step": 39167, "epoch": 323} {"train_loss": -31.902700424194336, "global_step": 39168, "epoch": 323} {"train_loss": -31.32676124572754, "global_step": 39169, "epoch": 323} {"train_loss": -34.1955680847168, "global_step": 39170, "epoch": 323} {"train_loss": -32.03730010986328, "global_step": 39171, "epoch": 323} {"train_loss": -32.03374481201172, "global_step": 39172, "epoch": 323} {"train_loss": -33.91510009765625, "global_step": 39173, "epoch": 323} {"train_loss": -33.08217239379883, "global_step": 39174, "epoch": 323} {"train_loss": -32.411231994628906, "global_step": 39175, "epoch": 323} {"train_loss": -33.420406341552734, "global_step": 39176, "epoch": 323} {"train_loss": -33.10834884643555, "global_step": 39177, "epoch": 323} {"train_loss": -32.63326644897461, "global_step": 39178, "epoch": 323} {"train_loss": -32.43900680541992, "global_step": 39179, "epoch": 323} {"train_loss": -33.63846969604492, "global_step": 39180, "epoch": 323} {"train_loss": -33.827083587646484, "global_step": 39181, "epoch": 323} {"train_loss": -32.82731628417969, "global_step": 39182, "epoch": 323} {"train_loss": -32.83564376831055, "global_step": 39183, "epoch": 323} {"train_loss": -34.09912872314453, "global_step": 39184, "epoch": 323} {"train_loss": -32.69503402709961, "global_step": 39185, "epoch": 323} {"train_loss": -32.65393829345703, "global_step": 39186, "epoch": 323} {"train_loss": -33.835731506347656, "global_step": 39187, "epoch": 323} {"train_loss": -33.387752532958984, "global_step": 39188, "epoch": 323} {"train_loss": -33.46022415161133, "global_step": 39189, "epoch": 323} {"train_loss": -33.72179412841797, "global_step": 39190, "epoch": 323} {"train_loss": -32.9481086730957, "global_step": 39191, "epoch": 323} {"train_loss": -33.1047248840332, "global_step": 39192, "epoch": 323} {"train_loss": -34.121437072753906, "global_step": 39193, "epoch": 323} {"train_loss": -33.212833404541016, "global_step": 39194, "epoch": 323} {"train_loss": -33.585235595703125, "global_step": 39195, "epoch": 323} {"train_loss": -33.8575439453125, "global_step": 39196, "epoch": 323} {"train_loss": -34.01243209838867, "global_step": 39197, "epoch": 323} {"train_loss": -33.928001403808594, "global_step": 39198, "epoch": 323} {"train_loss": -32.69525146484375, "global_step": 39199, "epoch": 323} {"train_loss": -32.655738830566406, "global_step": 39200, "epoch": 323} {"train_loss": -32.41520309448242, "global_step": 39201, "epoch": 323} {"train_loss": -32.29220199584961, "global_step": 39202, "epoch": 323} {"train_loss": -33.14882866410184, "global_step": 39203, "epoch": 323, "val_loss": 2589187.75} {"train_loss": -31.454710006713867, "global_step": 39204, "epoch": 324} {"train_loss": -31.6534423828125, "global_step": 39205, "epoch": 324} {"train_loss": -30.056476593017578, "global_step": 39206, "epoch": 324} {"train_loss": -31.358173370361328, "global_step": 39207, "epoch": 324} {"train_loss": -26.1322078704834, "global_step": 39208, "epoch": 324} {"train_loss": -30.22991943359375, "global_step": 39209, "epoch": 324} {"train_loss": -30.985794067382812, "global_step": 39210, "epoch": 324} {"train_loss": -26.756351470947266, "global_step": 39211, "epoch": 324} {"train_loss": -31.221006393432617, "global_step": 39212, "epoch": 324} {"train_loss": -29.683645248413086, "global_step": 39213, "epoch": 324} {"train_loss": -33.437320709228516, "global_step": 39214, "epoch": 324} {"train_loss": -30.45505714416504, "global_step": 39215, "epoch": 324} {"train_loss": -33.469356536865234, "global_step": 39216, "epoch": 324} {"train_loss": -32.4372444152832, "global_step": 39217, "epoch": 324} {"train_loss": -32.324371337890625, "global_step": 39218, "epoch": 324} {"train_loss": -32.77036666870117, "global_step": 39219, "epoch": 324} {"train_loss": -33.72407150268555, "global_step": 39220, "epoch": 324} {"train_loss": -32.79936218261719, "global_step": 39221, "epoch": 324} {"train_loss": -33.429988861083984, "global_step": 39222, "epoch": 324} {"train_loss": -33.600318908691406, "global_step": 39223, "epoch": 324} {"train_loss": -33.52985382080078, "global_step": 39224, "epoch": 324} {"train_loss": -33.6058235168457, "global_step": 39225, "epoch": 324} {"train_loss": -33.094364166259766, "global_step": 39226, "epoch": 324} {"train_loss": -33.85243606567383, "global_step": 39227, "epoch": 324} {"train_loss": -33.81069564819336, "global_step": 39228, "epoch": 324} {"train_loss": -33.953895568847656, "global_step": 39229, "epoch": 324} {"train_loss": -33.53536605834961, "global_step": 39230, "epoch": 324} {"train_loss": -33.988037109375, "global_step": 39231, "epoch": 324} {"train_loss": -34.301753997802734, "global_step": 39232, "epoch": 324} {"train_loss": -34.093284606933594, "global_step": 39233, "epoch": 324} {"train_loss": -34.371891021728516, "global_step": 39234, "epoch": 324} {"train_loss": -34.31690979003906, "global_step": 39235, "epoch": 324} {"train_loss": -33.714168548583984, "global_step": 39236, "epoch": 324} {"train_loss": -34.45895004272461, "global_step": 39237, "epoch": 324} {"train_loss": -34.394920349121094, "global_step": 39238, "epoch": 324} {"train_loss": -33.757083892822266, "global_step": 39239, "epoch": 324} {"train_loss": -34.3363151550293, "global_step": 39240, "epoch": 324} {"train_loss": -33.93900680541992, "global_step": 39241, "epoch": 324} {"train_loss": -34.21787643432617, "global_step": 39242, "epoch": 324} {"train_loss": -33.92557907104492, "global_step": 39243, "epoch": 324} {"train_loss": -33.962074279785156, "global_step": 39244, "epoch": 324} {"train_loss": -33.69708251953125, "global_step": 39245, "epoch": 324} {"train_loss": -34.27431869506836, "global_step": 39246, "epoch": 324} {"train_loss": -33.27829360961914, "global_step": 39247, "epoch": 324} {"train_loss": -34.159706115722656, "global_step": 39248, "epoch": 324} {"train_loss": -34.32817459106445, "global_step": 39249, "epoch": 324} {"train_loss": -33.25693893432617, "global_step": 39250, "epoch": 324} {"train_loss": -33.77817153930664, "global_step": 39251, "epoch": 324} {"train_loss": -34.44429397583008, "global_step": 39252, "epoch": 324} {"train_loss": -33.610107421875, "global_step": 39253, "epoch": 324} {"train_loss": -33.44599151611328, "global_step": 39254, "epoch": 324} {"train_loss": -33.96928024291992, "global_step": 39255, "epoch": 324} {"train_loss": -32.55057907104492, "global_step": 39256, "epoch": 324} {"train_loss": -32.283203125, "global_step": 39257, "epoch": 324} {"train_loss": -32.935882568359375, "global_step": 39258, "epoch": 324} {"train_loss": -34.0622673034668, "global_step": 39259, "epoch": 324} {"train_loss": -32.23798370361328, "global_step": 39260, "epoch": 324} {"train_loss": -32.34778594970703, "global_step": 39261, "epoch": 324} {"train_loss": -33.314735412597656, "global_step": 39262, "epoch": 324} {"train_loss": -32.80260467529297, "global_step": 39263, "epoch": 324} {"train_loss": -32.616756439208984, "global_step": 39264, "epoch": 324} {"train_loss": -32.989437103271484, "global_step": 39265, "epoch": 324} {"train_loss": -32.873165130615234, "global_step": 39266, "epoch": 324} {"train_loss": -33.62544631958008, "global_step": 39267, "epoch": 324} {"train_loss": -31.979679107666016, "global_step": 39268, "epoch": 324} {"train_loss": -31.531064987182617, "global_step": 39269, "epoch": 324} {"train_loss": -30.28525161743164, "global_step": 39270, "epoch": 324} {"train_loss": -31.06974220275879, "global_step": 39271, "epoch": 324} {"train_loss": -32.10283660888672, "global_step": 39272, "epoch": 324} {"train_loss": -32.18262481689453, "global_step": 39273, "epoch": 324} {"train_loss": -31.958642959594727, "global_step": 39274, "epoch": 324} {"train_loss": -32.33789825439453, "global_step": 39275, "epoch": 324} {"train_loss": -32.765663146972656, "global_step": 39276, "epoch": 324} {"train_loss": -31.8497257232666, "global_step": 39277, "epoch": 324} {"train_loss": -32.2834587097168, "global_step": 39278, "epoch": 324} {"train_loss": -33.36117935180664, "global_step": 39279, "epoch": 324} {"train_loss": -32.540382385253906, "global_step": 39280, "epoch": 324} {"train_loss": -32.792110443115234, "global_step": 39281, "epoch": 324} {"train_loss": -33.01051712036133, "global_step": 39282, "epoch": 324} {"train_loss": -32.47111892700195, "global_step": 39283, "epoch": 324} {"train_loss": -33.33809280395508, "global_step": 39284, "epoch": 324} {"train_loss": -32.787025451660156, "global_step": 39285, "epoch": 324} {"train_loss": -33.4057731628418, "global_step": 39286, "epoch": 324} {"train_loss": -32.63536071777344, "global_step": 39287, "epoch": 324} {"train_loss": -33.43398666381836, "global_step": 39288, "epoch": 324} {"train_loss": -33.14625930786133, "global_step": 39289, "epoch": 324} {"train_loss": -33.49569320678711, "global_step": 39290, "epoch": 324} {"train_loss": -32.912147521972656, "global_step": 39291, "epoch": 324} {"train_loss": -33.62124252319336, "global_step": 39292, "epoch": 324} {"train_loss": -33.826839447021484, "global_step": 39293, "epoch": 324} {"train_loss": -33.082637786865234, "global_step": 39294, "epoch": 324} {"train_loss": -33.007869720458984, "global_step": 39295, "epoch": 324} {"train_loss": -33.274471282958984, "global_step": 39296, "epoch": 324} {"train_loss": -33.267677307128906, "global_step": 39297, "epoch": 324} {"train_loss": -33.894065856933594, "global_step": 39298, "epoch": 324} {"train_loss": -33.533966064453125, "global_step": 39299, "epoch": 324} {"train_loss": -33.913360595703125, "global_step": 39300, "epoch": 324} {"train_loss": -33.493873596191406, "global_step": 39301, "epoch": 324} {"train_loss": -33.428993225097656, "global_step": 39302, "epoch": 324} {"train_loss": -33.450592041015625, "global_step": 39303, "epoch": 324} {"train_loss": -33.695552825927734, "global_step": 39304, "epoch": 324} {"train_loss": -33.55045700073242, "global_step": 39305, "epoch": 324} {"train_loss": -33.13040542602539, "global_step": 39306, "epoch": 324} {"train_loss": -33.34827423095703, "global_step": 39307, "epoch": 324} {"train_loss": -34.05661392211914, "global_step": 39308, "epoch": 324} {"train_loss": -34.12517166137695, "global_step": 39309, "epoch": 324} {"train_loss": -34.45682907104492, "global_step": 39310, "epoch": 324} {"train_loss": -33.85152053833008, "global_step": 39311, "epoch": 324} {"train_loss": -34.203163146972656, "global_step": 39312, "epoch": 324} {"train_loss": -34.35110092163086, "global_step": 39313, "epoch": 324} {"train_loss": -34.214454650878906, "global_step": 39314, "epoch": 324} {"train_loss": -33.91158676147461, "global_step": 39315, "epoch": 324} {"train_loss": -34.8185920715332, "global_step": 39316, "epoch": 324} {"train_loss": -34.234127044677734, "global_step": 39317, "epoch": 324} {"train_loss": -34.429561614990234, "global_step": 39318, "epoch": 324} {"train_loss": -34.52915573120117, "global_step": 39319, "epoch": 324} {"train_loss": -34.07802963256836, "global_step": 39320, "epoch": 324} {"train_loss": -33.2081184387207, "global_step": 39321, "epoch": 324} {"train_loss": -32.85989761352539, "global_step": 39322, "epoch": 324} {"train_loss": -31.82960319519043, "global_step": 39323, "epoch": 324} {"train_loss": -33.039662952265466, "global_step": 39324, "epoch": 324, "val_loss": 2524197.0} {"train_loss": -30.30801773071289, "global_step": 39325, "epoch": 325} {"train_loss": -32.277523040771484, "global_step": 39326, "epoch": 325} {"train_loss": -34.605690002441406, "global_step": 39327, "epoch": 325} {"train_loss": -33.269927978515625, "global_step": 39328, "epoch": 325} {"train_loss": -32.85153579711914, "global_step": 39329, "epoch": 325} {"train_loss": -34.453060150146484, "global_step": 39330, "epoch": 325} {"train_loss": -34.57941818237305, "global_step": 39331, "epoch": 325} {"train_loss": -33.277000427246094, "global_step": 39332, "epoch": 325} {"train_loss": -32.38496780395508, "global_step": 39333, "epoch": 325} {"train_loss": -32.86649703979492, "global_step": 39334, "epoch": 325} {"train_loss": -32.870262145996094, "global_step": 39335, "epoch": 325} {"train_loss": -32.187557220458984, "global_step": 39336, "epoch": 325} {"train_loss": -34.37397003173828, "global_step": 39337, "epoch": 325} {"train_loss": -33.12862777709961, "global_step": 39338, "epoch": 325} {"train_loss": -32.4626579284668, "global_step": 39339, "epoch": 325} {"train_loss": -33.774784088134766, "global_step": 39340, "epoch": 325} {"train_loss": -31.796445846557617, "global_step": 39341, "epoch": 325} {"train_loss": -32.594200134277344, "global_step": 39342, "epoch": 325} {"train_loss": -32.95906448364258, "global_step": 39343, "epoch": 325} {"train_loss": -34.08046340942383, "global_step": 39344, "epoch": 325} {"train_loss": -33.000038146972656, "global_step": 39345, "epoch": 325} {"train_loss": -32.858375549316406, "global_step": 39346, "epoch": 325} {"train_loss": -32.80569076538086, "global_step": 39347, "epoch": 325} {"train_loss": -33.94415283203125, "global_step": 39348, "epoch": 325} {"train_loss": -32.74542236328125, "global_step": 39349, "epoch": 325} {"train_loss": -32.108089447021484, "global_step": 39350, "epoch": 325} {"train_loss": -33.67255783081055, "global_step": 39351, "epoch": 325} {"train_loss": -33.494781494140625, "global_step": 39352, "epoch": 325} {"train_loss": -32.60791015625, "global_step": 39353, "epoch": 325} {"train_loss": -33.55664825439453, "global_step": 39354, "epoch": 325} {"train_loss": -31.861343383789062, "global_step": 39355, "epoch": 325} {"train_loss": -31.936620712280273, "global_step": 39356, "epoch": 325} {"train_loss": -33.64448165893555, "global_step": 39357, "epoch": 325} {"train_loss": -33.64252853393555, "global_step": 39358, "epoch": 325} {"train_loss": -33.12556076049805, "global_step": 39359, "epoch": 325} {"train_loss": -33.07726287841797, "global_step": 39360, "epoch": 325} {"train_loss": -33.663177490234375, "global_step": 39361, "epoch": 325} {"train_loss": -33.32558822631836, "global_step": 39362, "epoch": 325} {"train_loss": -33.225154876708984, "global_step": 39363, "epoch": 325} {"train_loss": -32.78985595703125, "global_step": 39364, "epoch": 325} {"train_loss": -33.56660461425781, "global_step": 39365, "epoch": 325} {"train_loss": -33.868751525878906, "global_step": 39366, "epoch": 325} {"train_loss": -33.47504425048828, "global_step": 39367, "epoch": 325} {"train_loss": -33.27457809448242, "global_step": 39368, "epoch": 325} {"train_loss": -32.7675895690918, "global_step": 39369, "epoch": 325} {"train_loss": -33.2404670715332, "global_step": 39370, "epoch": 325} {"train_loss": -34.116939544677734, "global_step": 39371, "epoch": 325} {"train_loss": -33.79047393798828, "global_step": 39372, "epoch": 325} {"train_loss": -33.71966552734375, "global_step": 39373, "epoch": 325} {"train_loss": -33.370582580566406, "global_step": 39374, "epoch": 325} {"train_loss": -33.62625503540039, "global_step": 39375, "epoch": 325} {"train_loss": -34.268898010253906, "global_step": 39376, "epoch": 325} {"train_loss": -33.440216064453125, "global_step": 39377, "epoch": 325} {"train_loss": -33.66061019897461, "global_step": 39378, "epoch": 325} {"train_loss": -33.81631088256836, "global_step": 39379, "epoch": 325} {"train_loss": -33.648258209228516, "global_step": 39380, "epoch": 325} {"train_loss": -34.000858306884766, "global_step": 39381, "epoch": 325} {"train_loss": -34.129573822021484, "global_step": 39382, "epoch": 325} {"train_loss": -33.991737365722656, "global_step": 39383, "epoch": 325} {"train_loss": -33.56707763671875, "global_step": 39384, "epoch": 325} {"train_loss": -34.15534591674805, "global_step": 39385, "epoch": 325} {"train_loss": -33.79656982421875, "global_step": 39386, "epoch": 325} {"train_loss": -33.381004333496094, "global_step": 39387, "epoch": 325} {"train_loss": -34.0191764831543, "global_step": 39388, "epoch": 325} {"train_loss": -33.97801971435547, "global_step": 39389, "epoch": 325} {"train_loss": -34.197879791259766, "global_step": 39390, "epoch": 325} {"train_loss": -33.98427200317383, "global_step": 39391, "epoch": 325} {"train_loss": -33.96639633178711, "global_step": 39392, "epoch": 325} {"train_loss": -34.03947067260742, "global_step": 39393, "epoch": 325} {"train_loss": -34.037715911865234, "global_step": 39394, "epoch": 325} {"train_loss": -34.7102165222168, "global_step": 39395, "epoch": 325} {"train_loss": -34.172607421875, "global_step": 39396, "epoch": 325} {"train_loss": -34.784725189208984, "global_step": 39397, "epoch": 325} {"train_loss": -34.062076568603516, "global_step": 39398, "epoch": 325} {"train_loss": -34.24995040893555, "global_step": 39399, "epoch": 325} {"train_loss": -33.61341094970703, "global_step": 39400, "epoch": 325} {"train_loss": -35.08527755737305, "global_step": 39401, "epoch": 325} {"train_loss": -34.79831314086914, "global_step": 39402, "epoch": 325} {"train_loss": -34.46409225463867, "global_step": 39403, "epoch": 325} {"train_loss": -34.791751861572266, "global_step": 39404, "epoch": 325} {"train_loss": -34.89765167236328, "global_step": 39405, "epoch": 325} {"train_loss": -35.0211296081543, "global_step": 39406, "epoch": 325} {"train_loss": -34.90268325805664, "global_step": 39407, "epoch": 325} {"train_loss": -34.68220901489258, "global_step": 39408, "epoch": 325} {"train_loss": -33.91672897338867, "global_step": 39409, "epoch": 325} {"train_loss": -33.28642654418945, "global_step": 39410, "epoch": 325} {"train_loss": -31.1053524017334, "global_step": 39411, "epoch": 325} {"train_loss": -23.685720443725586, "global_step": 39412, "epoch": 325} {"train_loss": -5.402284622192383, "global_step": 39413, "epoch": 325} {"train_loss": -2.308640241622925, "global_step": 39414, "epoch": 325} {"train_loss": -24.080846786499023, "global_step": 39415, "epoch": 325} {"train_loss": -28.571393966674805, "global_step": 39416, "epoch": 325} {"train_loss": -25.978200912475586, "global_step": 39417, "epoch": 325} {"train_loss": -28.5469913482666, "global_step": 39418, "epoch": 325} {"train_loss": -32.17594909667969, "global_step": 39419, "epoch": 325} {"train_loss": -26.991125106811523, "global_step": 39420, "epoch": 325} {"train_loss": -28.3494930267334, "global_step": 39421, "epoch": 325} {"train_loss": -31.9393367767334, "global_step": 39422, "epoch": 325} {"train_loss": -29.535842895507812, "global_step": 39423, "epoch": 325} {"train_loss": -28.245615005493164, "global_step": 39424, "epoch": 325} {"train_loss": -31.372730255126953, "global_step": 39425, "epoch": 325} {"train_loss": -32.23653793334961, "global_step": 39426, "epoch": 325} {"train_loss": -32.01791000366211, "global_step": 39427, "epoch": 325} {"train_loss": -29.938507080078125, "global_step": 39428, "epoch": 325} {"train_loss": -31.945844650268555, "global_step": 39429, "epoch": 325} {"train_loss": -32.29402542114258, "global_step": 39430, "epoch": 325} {"train_loss": -32.13685607910156, "global_step": 39431, "epoch": 325} {"train_loss": -31.931196212768555, "global_step": 39432, "epoch": 325} {"train_loss": -32.27664566040039, "global_step": 39433, "epoch": 325} {"train_loss": -31.8257999420166, "global_step": 39434, "epoch": 325} {"train_loss": -32.12601852416992, "global_step": 39435, "epoch": 325} {"train_loss": -32.62185287475586, "global_step": 39436, "epoch": 325} {"train_loss": -32.72318649291992, "global_step": 39437, "epoch": 325} {"train_loss": -32.56320571899414, "global_step": 39438, "epoch": 325} {"train_loss": -32.093807220458984, "global_step": 39439, "epoch": 325} {"train_loss": -32.2933349609375, "global_step": 39440, "epoch": 325} {"train_loss": -31.823637008666992, "global_step": 39441, "epoch": 325} {"train_loss": -32.68095779418945, "global_step": 39442, "epoch": 325} {"train_loss": -32.82988739013672, "global_step": 39443, "epoch": 325} {"train_loss": -32.73037338256836, "global_step": 39444, "epoch": 325} {"train_loss": -32.302922956214466, "global_step": 39445, "epoch": 325, "val_loss": 2701137.25} {"train_loss": -32.5566520690918, "global_step": 39446, "epoch": 326} {"train_loss": -32.693965911865234, "global_step": 39447, "epoch": 326} {"train_loss": -32.537384033203125, "global_step": 39448, "epoch": 326} {"train_loss": -32.161800384521484, "global_step": 39449, "epoch": 326} {"train_loss": -32.73728561401367, "global_step": 39450, "epoch": 326} {"train_loss": -33.389564514160156, "global_step": 39451, "epoch": 326} {"train_loss": -33.2890510559082, "global_step": 39452, "epoch": 326} {"train_loss": -33.071041107177734, "global_step": 39453, "epoch": 326} {"train_loss": -33.316734313964844, "global_step": 39454, "epoch": 326} {"train_loss": -32.47303009033203, "global_step": 39455, "epoch": 326} {"train_loss": -33.361507415771484, "global_step": 39456, "epoch": 326} {"train_loss": -33.290157318115234, "global_step": 39457, "epoch": 326} {"train_loss": -32.694427490234375, "global_step": 39458, "epoch": 326} {"train_loss": -33.06740951538086, "global_step": 39459, "epoch": 326} {"train_loss": -33.70771408081055, "global_step": 39460, "epoch": 326} {"train_loss": -32.456520080566406, "global_step": 39461, "epoch": 326} {"train_loss": -33.15003204345703, "global_step": 39462, "epoch": 326} {"train_loss": -32.540096282958984, "global_step": 39463, "epoch": 326} {"train_loss": -33.16366195678711, "global_step": 39464, "epoch": 326} {"train_loss": -33.794830322265625, "global_step": 39465, "epoch": 326} {"train_loss": -33.452579498291016, "global_step": 39466, "epoch": 326} {"train_loss": -33.22554016113281, "global_step": 39467, "epoch": 326} {"train_loss": -33.74808883666992, "global_step": 39468, "epoch": 326} {"train_loss": -33.194820404052734, "global_step": 39469, "epoch": 326} {"train_loss": -33.30000305175781, "global_step": 39470, "epoch": 326} {"train_loss": -34.10288619995117, "global_step": 39471, "epoch": 326} {"train_loss": -33.47116470336914, "global_step": 39472, "epoch": 326} {"train_loss": -34.13381576538086, "global_step": 39473, "epoch": 326} {"train_loss": -33.5821533203125, "global_step": 39474, "epoch": 326} {"train_loss": -34.34082794189453, "global_step": 39475, "epoch": 326} {"train_loss": -33.58546829223633, "global_step": 39476, "epoch": 326} {"train_loss": -34.41785430908203, "global_step": 39477, "epoch": 326} {"train_loss": -33.52397537231445, "global_step": 39478, "epoch": 326} {"train_loss": -34.00297164916992, "global_step": 39479, "epoch": 326} {"train_loss": -34.151893615722656, "global_step": 39480, "epoch": 326} {"train_loss": -33.998046875, "global_step": 39481, "epoch": 326} {"train_loss": -33.179908752441406, "global_step": 39482, "epoch": 326} {"train_loss": -32.95481491088867, "global_step": 39483, "epoch": 326} {"train_loss": -32.775672912597656, "global_step": 39484, "epoch": 326} {"train_loss": -31.76267433166504, "global_step": 39485, "epoch": 326} {"train_loss": -31.263065338134766, "global_step": 39486, "epoch": 326} {"train_loss": -30.552112579345703, "global_step": 39487, "epoch": 326} {"train_loss": -28.118488311767578, "global_step": 39488, "epoch": 326} {"train_loss": -25.079320907592773, "global_step": 39489, "epoch": 326} {"train_loss": -30.160446166992188, "global_step": 39490, "epoch": 326} {"train_loss": -33.360504150390625, "global_step": 39491, "epoch": 326} {"train_loss": -27.9139461517334, "global_step": 39492, "epoch": 326} {"train_loss": -33.81547164916992, "global_step": 39493, "epoch": 326} {"train_loss": -26.281213760375977, "global_step": 39494, "epoch": 326} {"train_loss": -33.097633361816406, "global_step": 39495, "epoch": 326} {"train_loss": -30.076404571533203, "global_step": 39496, "epoch": 326} {"train_loss": -33.69843292236328, "global_step": 39497, "epoch": 326} {"train_loss": -31.701257705688477, "global_step": 39498, "epoch": 326} {"train_loss": -33.28239440917969, "global_step": 39499, "epoch": 326} {"train_loss": -32.57529830932617, "global_step": 39500, "epoch": 326} {"train_loss": -33.42008590698242, "global_step": 39501, "epoch": 326} {"train_loss": -33.450653076171875, "global_step": 39502, "epoch": 326} {"train_loss": -32.240234375, "global_step": 39503, "epoch": 326} {"train_loss": -33.7367057800293, "global_step": 39504, "epoch": 326} {"train_loss": -32.598628997802734, "global_step": 39505, "epoch": 326} {"train_loss": -32.504459381103516, "global_step": 39506, "epoch": 326} {"train_loss": -33.42311477661133, "global_step": 39507, "epoch": 326} {"train_loss": -32.986122131347656, "global_step": 39508, "epoch": 326} {"train_loss": -33.562530517578125, "global_step": 39509, "epoch": 326} {"train_loss": -33.755245208740234, "global_step": 39510, "epoch": 326} {"train_loss": -33.61748123168945, "global_step": 39511, "epoch": 326} {"train_loss": -33.349613189697266, "global_step": 39512, "epoch": 326} {"train_loss": -33.10793685913086, "global_step": 39513, "epoch": 326} {"train_loss": -33.506736755371094, "global_step": 39514, "epoch": 326} {"train_loss": -33.887901306152344, "global_step": 39515, "epoch": 326} {"train_loss": -33.64960861206055, "global_step": 39516, "epoch": 326} {"train_loss": -33.00973129272461, "global_step": 39517, "epoch": 326} {"train_loss": -34.103363037109375, "global_step": 39518, "epoch": 326} {"train_loss": -33.59387969970703, "global_step": 39519, "epoch": 326} {"train_loss": -33.434383392333984, "global_step": 39520, "epoch": 326} {"train_loss": -33.79364776611328, "global_step": 39521, "epoch": 326} {"train_loss": -34.20073699951172, "global_step": 39522, "epoch": 326} {"train_loss": -33.83393478393555, "global_step": 39523, "epoch": 326} {"train_loss": -34.03029251098633, "global_step": 39524, "epoch": 326} {"train_loss": -33.965675354003906, "global_step": 39525, "epoch": 326} {"train_loss": -33.617103576660156, "global_step": 39526, "epoch": 326} {"train_loss": -33.79845428466797, "global_step": 39527, "epoch": 326} {"train_loss": -33.70986557006836, "global_step": 39528, "epoch": 326} {"train_loss": -33.9940299987793, "global_step": 39529, "epoch": 326} {"train_loss": -33.754329681396484, "global_step": 39530, "epoch": 326} {"train_loss": -33.66781234741211, "global_step": 39531, "epoch": 326} {"train_loss": -33.55066680908203, "global_step": 39532, "epoch": 326} {"train_loss": -33.70426559448242, "global_step": 39533, "epoch": 326} {"train_loss": -32.761539459228516, "global_step": 39534, "epoch": 326} {"train_loss": -30.721817016601562, "global_step": 39535, "epoch": 326} {"train_loss": -27.43019676208496, "global_step": 39536, "epoch": 326} {"train_loss": -34.05963897705078, "global_step": 39537, "epoch": 326} {"train_loss": -30.164417266845703, "global_step": 39538, "epoch": 326} {"train_loss": -33.17403793334961, "global_step": 39539, "epoch": 326} {"train_loss": -29.71653175354004, "global_step": 39540, "epoch": 326} {"train_loss": -32.778076171875, "global_step": 39541, "epoch": 326} {"train_loss": -32.31906509399414, "global_step": 39542, "epoch": 326} {"train_loss": -31.854196548461914, "global_step": 39543, "epoch": 326} {"train_loss": -33.779476165771484, "global_step": 39544, "epoch": 326} {"train_loss": -33.400081634521484, "global_step": 39545, "epoch": 326} {"train_loss": -32.43854904174805, "global_step": 39546, "epoch": 326} {"train_loss": -33.425533294677734, "global_step": 39547, "epoch": 326} {"train_loss": -33.929847717285156, "global_step": 39548, "epoch": 326} {"train_loss": -33.99283218383789, "global_step": 39549, "epoch": 326} {"train_loss": -33.51426696777344, "global_step": 39550, "epoch": 326} {"train_loss": -33.72621536254883, "global_step": 39551, "epoch": 326} {"train_loss": -33.464351654052734, "global_step": 39552, "epoch": 326} {"train_loss": -33.53487777709961, "global_step": 39553, "epoch": 326} {"train_loss": -33.56862258911133, "global_step": 39554, "epoch": 326} {"train_loss": -33.1510124206543, "global_step": 39555, "epoch": 326} {"train_loss": -32.879390716552734, "global_step": 39556, "epoch": 326} {"train_loss": -33.60308837890625, "global_step": 39557, "epoch": 326} {"train_loss": -34.362831115722656, "global_step": 39558, "epoch": 326} {"train_loss": -34.3607177734375, "global_step": 39559, "epoch": 326} {"train_loss": -33.77949142456055, "global_step": 39560, "epoch": 326} {"train_loss": -33.61528015136719, "global_step": 39561, "epoch": 326} {"train_loss": -33.522613525390625, "global_step": 39562, "epoch": 326} {"train_loss": -34.119544982910156, "global_step": 39563, "epoch": 326} {"train_loss": -33.9873046875, "global_step": 39564, "epoch": 326} {"train_loss": -34.0831184387207, "global_step": 39565, "epoch": 326} {"train_loss": -32.948845161879355, "global_step": 39566, "epoch": 326, "val_loss": 2583216.25} {"train_loss": -33.92416000366211, "global_step": 39567, "epoch": 327} {"train_loss": -32.90742111206055, "global_step": 39568, "epoch": 327} {"train_loss": -31.820829391479492, "global_step": 39569, "epoch": 327} {"train_loss": -30.886289596557617, "global_step": 39570, "epoch": 327} {"train_loss": -30.295080184936523, "global_step": 39571, "epoch": 327} {"train_loss": -32.201900482177734, "global_step": 39572, "epoch": 327} {"train_loss": -33.90138244628906, "global_step": 39573, "epoch": 327} {"train_loss": -32.467960357666016, "global_step": 39574, "epoch": 327} {"train_loss": -32.52845001220703, "global_step": 39575, "epoch": 327} {"train_loss": -33.38825607299805, "global_step": 39576, "epoch": 327} {"train_loss": -32.52254867553711, "global_step": 39577, "epoch": 327} {"train_loss": -33.49395751953125, "global_step": 39578, "epoch": 327} {"train_loss": -32.808040618896484, "global_step": 39579, "epoch": 327} {"train_loss": -33.3783073425293, "global_step": 39580, "epoch": 327} {"train_loss": -33.64335250854492, "global_step": 39581, "epoch": 327} {"train_loss": -32.131221771240234, "global_step": 39582, "epoch": 327} {"train_loss": -32.37998580932617, "global_step": 39583, "epoch": 327} {"train_loss": -32.81517791748047, "global_step": 39584, "epoch": 327} {"train_loss": -32.19538879394531, "global_step": 39585, "epoch": 327} {"train_loss": -31.652196884155273, "global_step": 39586, "epoch": 327} {"train_loss": -32.12167739868164, "global_step": 39587, "epoch": 327} {"train_loss": -32.552093505859375, "global_step": 39588, "epoch": 327} {"train_loss": -32.84382247924805, "global_step": 39589, "epoch": 327} {"train_loss": -32.5570068359375, "global_step": 39590, "epoch": 327} {"train_loss": -32.8192024230957, "global_step": 39591, "epoch": 327} {"train_loss": -33.226924896240234, "global_step": 39592, "epoch": 327} {"train_loss": -33.16617965698242, "global_step": 39593, "epoch": 327} {"train_loss": -33.473506927490234, "global_step": 39594, "epoch": 327} {"train_loss": -33.186153411865234, "global_step": 39595, "epoch": 327} {"train_loss": -33.5885124206543, "global_step": 39596, "epoch": 327} {"train_loss": -33.50313949584961, "global_step": 39597, "epoch": 327} {"train_loss": -33.908782958984375, "global_step": 39598, "epoch": 327} {"train_loss": -33.95671844482422, "global_step": 39599, "epoch": 327} {"train_loss": -32.8944206237793, "global_step": 39600, "epoch": 327} {"train_loss": -33.993770599365234, "global_step": 39601, "epoch": 327} {"train_loss": -32.919185638427734, "global_step": 39602, "epoch": 327} {"train_loss": -33.534080505371094, "global_step": 39603, "epoch": 327} {"train_loss": -34.34221267700195, "global_step": 39604, "epoch": 327} {"train_loss": -34.178871154785156, "global_step": 39605, "epoch": 327} {"train_loss": -33.523651123046875, "global_step": 39606, "epoch": 327} {"train_loss": -34.03852462768555, "global_step": 39607, "epoch": 327} {"train_loss": -33.71839904785156, "global_step": 39608, "epoch": 327} {"train_loss": -34.0333251953125, "global_step": 39609, "epoch": 327} {"train_loss": -34.58062744140625, "global_step": 39610, "epoch": 327} {"train_loss": -34.212886810302734, "global_step": 39611, "epoch": 327} {"train_loss": -34.280029296875, "global_step": 39612, "epoch": 327} {"train_loss": -34.3536262512207, "global_step": 39613, "epoch": 327} {"train_loss": -33.81024169921875, "global_step": 39614, "epoch": 327} {"train_loss": -34.47901153564453, "global_step": 39615, "epoch": 327} {"train_loss": -34.06096267700195, "global_step": 39616, "epoch": 327} {"train_loss": -34.01371383666992, "global_step": 39617, "epoch": 327} {"train_loss": -34.717872619628906, "global_step": 39618, "epoch": 327} {"train_loss": -34.39069366455078, "global_step": 39619, "epoch": 327} {"train_loss": -34.48160934448242, "global_step": 39620, "epoch": 327} {"train_loss": -34.52344512939453, "global_step": 39621, "epoch": 327} {"train_loss": -34.865028381347656, "global_step": 39622, "epoch": 327} {"train_loss": -34.65755081176758, "global_step": 39623, "epoch": 327} {"train_loss": -34.78121566772461, "global_step": 39624, "epoch": 327} {"train_loss": -34.416622161865234, "global_step": 39625, "epoch": 327} {"train_loss": -34.75346755981445, "global_step": 39626, "epoch": 327} {"train_loss": -34.898555755615234, "global_step": 39627, "epoch": 327} {"train_loss": -34.4510383605957, "global_step": 39628, "epoch": 327} {"train_loss": -34.887542724609375, "global_step": 39629, "epoch": 327} {"train_loss": -33.33414840698242, "global_step": 39630, "epoch": 327} {"train_loss": -34.07678985595703, "global_step": 39631, "epoch": 327} {"train_loss": -34.554386138916016, "global_step": 39632, "epoch": 327} {"train_loss": -35.105159759521484, "global_step": 39633, "epoch": 327} {"train_loss": -34.740264892578125, "global_step": 39634, "epoch": 327} {"train_loss": -33.860321044921875, "global_step": 39635, "epoch": 327} {"train_loss": -34.23845291137695, "global_step": 39636, "epoch": 327} {"train_loss": -34.409645080566406, "global_step": 39637, "epoch": 327} {"train_loss": -33.881736755371094, "global_step": 39638, "epoch": 327} {"train_loss": -34.36497116088867, "global_step": 39639, "epoch": 327} {"train_loss": -34.84067916870117, "global_step": 39640, "epoch": 327} {"train_loss": -34.286563873291016, "global_step": 39641, "epoch": 327} {"train_loss": -33.991878509521484, "global_step": 39642, "epoch": 327} {"train_loss": -31.650827407836914, "global_step": 39643, "epoch": 327} {"train_loss": -29.401580810546875, "global_step": 39644, "epoch": 327} {"train_loss": -33.35348892211914, "global_step": 39645, "epoch": 327} {"train_loss": -31.87164878845215, "global_step": 39646, "epoch": 327} {"train_loss": -33.242950439453125, "global_step": 39647, "epoch": 327} {"train_loss": -32.6717643737793, "global_step": 39648, "epoch": 327} {"train_loss": -33.9985466003418, "global_step": 39649, "epoch": 327} {"train_loss": -31.1533145904541, "global_step": 39650, "epoch": 327} {"train_loss": -33.8358039855957, "global_step": 39651, "epoch": 327} {"train_loss": -32.3458137512207, "global_step": 39652, "epoch": 327} {"train_loss": -32.84012985229492, "global_step": 39653, "epoch": 327} {"train_loss": -32.7810173034668, "global_step": 39654, "epoch": 327} {"train_loss": -31.843250274658203, "global_step": 39655, "epoch": 327} {"train_loss": -32.742366790771484, "global_step": 39656, "epoch": 327} {"train_loss": -32.11817932128906, "global_step": 39657, "epoch": 327} {"train_loss": -30.634740829467773, "global_step": 39658, "epoch": 327} {"train_loss": -28.042570114135742, "global_step": 39659, "epoch": 327} {"train_loss": -30.890405654907227, "global_step": 39660, "epoch": 327} {"train_loss": -33.53446578979492, "global_step": 39661, "epoch": 327} {"train_loss": -30.15128517150879, "global_step": 39662, "epoch": 327} {"train_loss": -30.66425895690918, "global_step": 39663, "epoch": 327} {"train_loss": -33.33610916137695, "global_step": 39664, "epoch": 327} {"train_loss": -30.96735954284668, "global_step": 39665, "epoch": 327} {"train_loss": -33.430110931396484, "global_step": 39666, "epoch": 327} {"train_loss": -31.73847770690918, "global_step": 39667, "epoch": 327} {"train_loss": -32.468849182128906, "global_step": 39668, "epoch": 327} {"train_loss": -32.416805267333984, "global_step": 39669, "epoch": 327} {"train_loss": -33.99648666381836, "global_step": 39670, "epoch": 327} {"train_loss": -32.99337387084961, "global_step": 39671, "epoch": 327} {"train_loss": -33.65910720825195, "global_step": 39672, "epoch": 327} {"train_loss": -33.5616569519043, "global_step": 39673, "epoch": 327} {"train_loss": -33.24636459350586, "global_step": 39674, "epoch": 327} {"train_loss": -33.90987014770508, "global_step": 39675, "epoch": 327} {"train_loss": -33.19582748413086, "global_step": 39676, "epoch": 327} {"train_loss": -33.34365463256836, "global_step": 39677, "epoch": 327} {"train_loss": -33.6137580871582, "global_step": 39678, "epoch": 327} {"train_loss": -33.3600959777832, "global_step": 39679, "epoch": 327} {"train_loss": -33.65360641479492, "global_step": 39680, "epoch": 327} {"train_loss": -33.473995208740234, "global_step": 39681, "epoch": 327} {"train_loss": -33.84247589111328, "global_step": 39682, "epoch": 327} {"train_loss": -33.59765625, "global_step": 39683, "epoch": 327} {"train_loss": -34.14797592163086, "global_step": 39684, "epoch": 327} {"train_loss": -33.50373458862305, "global_step": 39685, "epoch": 327} {"train_loss": -33.6215934753418, "global_step": 39686, "epoch": 327} {"train_loss": -33.24550184139535, "global_step": 39687, "epoch": 327, "val_loss": 2621909.25} {"train_loss": -33.61500930786133, "global_step": 39688, "epoch": 328} {"train_loss": -33.66850280761719, "global_step": 39689, "epoch": 328} {"train_loss": -34.00508499145508, "global_step": 39690, "epoch": 328} {"train_loss": -34.06433868408203, "global_step": 39691, "epoch": 328} {"train_loss": -33.46669387817383, "global_step": 39692, "epoch": 328} {"train_loss": -33.25068664550781, "global_step": 39693, "epoch": 328} {"train_loss": -33.0687370300293, "global_step": 39694, "epoch": 328} {"train_loss": -33.866153717041016, "global_step": 39695, "epoch": 328} {"train_loss": -34.379642486572266, "global_step": 39696, "epoch": 328} {"train_loss": -32.059757232666016, "global_step": 39697, "epoch": 328} {"train_loss": -31.196258544921875, "global_step": 39698, "epoch": 328} {"train_loss": -32.42594528198242, "global_step": 39699, "epoch": 328} {"train_loss": -34.126277923583984, "global_step": 39700, "epoch": 328} {"train_loss": -32.66533660888672, "global_step": 39701, "epoch": 328} {"train_loss": -31.201221466064453, "global_step": 39702, "epoch": 328} {"train_loss": -34.15615463256836, "global_step": 39703, "epoch": 328} {"train_loss": -34.21015930175781, "global_step": 39704, "epoch": 328} {"train_loss": -33.23800277709961, "global_step": 39705, "epoch": 328} {"train_loss": -34.61094284057617, "global_step": 39706, "epoch": 328} {"train_loss": -34.06937789916992, "global_step": 39707, "epoch": 328} {"train_loss": -34.66986846923828, "global_step": 39708, "epoch": 328} {"train_loss": -33.972633361816406, "global_step": 39709, "epoch": 328} {"train_loss": -34.19517135620117, "global_step": 39710, "epoch": 328} {"train_loss": -33.603485107421875, "global_step": 39711, "epoch": 328} {"train_loss": -29.980422973632812, "global_step": 39712, "epoch": 328} {"train_loss": -32.36433029174805, "global_step": 39713, "epoch": 328} {"train_loss": -27.86203384399414, "global_step": 39714, "epoch": 328} {"train_loss": -27.864837646484375, "global_step": 39715, "epoch": 328} {"train_loss": -28.717330932617188, "global_step": 39716, "epoch": 328} {"train_loss": -31.962738037109375, "global_step": 39717, "epoch": 328} {"train_loss": -31.355615615844727, "global_step": 39718, "epoch": 328} {"train_loss": -30.887094497680664, "global_step": 39719, "epoch": 328} {"train_loss": -29.655237197875977, "global_step": 39720, "epoch": 328} {"train_loss": -32.219329833984375, "global_step": 39721, "epoch": 328} {"train_loss": -31.633031845092773, "global_step": 39722, "epoch": 328} {"train_loss": -30.37601661682129, "global_step": 39723, "epoch": 328} {"train_loss": -31.269062042236328, "global_step": 39724, "epoch": 328} {"train_loss": -30.779891967773438, "global_step": 39725, "epoch": 328} {"train_loss": -31.947980880737305, "global_step": 39726, "epoch": 328} {"train_loss": -31.9700927734375, "global_step": 39727, "epoch": 328} {"train_loss": -31.69292640686035, "global_step": 39728, "epoch": 328} {"train_loss": -31.5728759765625, "global_step": 39729, "epoch": 328} {"train_loss": -31.48084831237793, "global_step": 39730, "epoch": 328} {"train_loss": -31.45013427734375, "global_step": 39731, "epoch": 328} {"train_loss": -32.238704681396484, "global_step": 39732, "epoch": 328} {"train_loss": -32.466644287109375, "global_step": 39733, "epoch": 328} {"train_loss": -32.19983673095703, "global_step": 39734, "epoch": 328} {"train_loss": -31.773996353149414, "global_step": 39735, "epoch": 328} {"train_loss": -32.1508903503418, "global_step": 39736, "epoch": 328} {"train_loss": -32.55863571166992, "global_step": 39737, "epoch": 328} {"train_loss": -32.622615814208984, "global_step": 39738, "epoch": 328} {"train_loss": -30.528888702392578, "global_step": 39739, "epoch": 328} {"train_loss": -32.398345947265625, "global_step": 39740, "epoch": 328} {"train_loss": -32.038795471191406, "global_step": 39741, "epoch": 328} {"train_loss": -32.271881103515625, "global_step": 39742, "epoch": 328} {"train_loss": -31.8054141998291, "global_step": 39743, "epoch": 328} {"train_loss": -32.79868698120117, "global_step": 39744, "epoch": 328} {"train_loss": -32.71549606323242, "global_step": 39745, "epoch": 328} {"train_loss": -32.703983306884766, "global_step": 39746, "epoch": 328} {"train_loss": -32.69527816772461, "global_step": 39747, "epoch": 328} {"train_loss": -33.11187744140625, "global_step": 39748, "epoch": 328} {"train_loss": -33.227149963378906, "global_step": 39749, "epoch": 328} {"train_loss": -32.88690185546875, "global_step": 39750, "epoch": 328} {"train_loss": -33.190338134765625, "global_step": 39751, "epoch": 328} {"train_loss": -33.17121124267578, "global_step": 39752, "epoch": 328} {"train_loss": -32.9764289855957, "global_step": 39753, "epoch": 328} {"train_loss": -32.8927001953125, "global_step": 39754, "epoch": 328} {"train_loss": -33.294002532958984, "global_step": 39755, "epoch": 328} {"train_loss": -33.52199172973633, "global_step": 39756, "epoch": 328} {"train_loss": -33.28163528442383, "global_step": 39757, "epoch": 328} {"train_loss": -33.43125534057617, "global_step": 39758, "epoch": 328} {"train_loss": -33.674049377441406, "global_step": 39759, "epoch": 328} {"train_loss": -33.558441162109375, "global_step": 39760, "epoch": 328} {"train_loss": -33.7843132019043, "global_step": 39761, "epoch": 328} {"train_loss": -34.01713180541992, "global_step": 39762, "epoch": 328} {"train_loss": -34.04154586791992, "global_step": 39763, "epoch": 328} {"train_loss": -33.15177917480469, "global_step": 39764, "epoch": 328} {"train_loss": -33.198326110839844, "global_step": 39765, "epoch": 328} {"train_loss": -34.1855583190918, "global_step": 39766, "epoch": 328} {"train_loss": -33.70075607299805, "global_step": 39767, "epoch": 328} {"train_loss": -34.31697463989258, "global_step": 39768, "epoch": 328} {"train_loss": -33.89360046386719, "global_step": 39769, "epoch": 328} {"train_loss": -33.707305908203125, "global_step": 39770, "epoch": 328} {"train_loss": -33.55183792114258, "global_step": 39771, "epoch": 328} {"train_loss": -34.66438674926758, "global_step": 39772, "epoch": 328} {"train_loss": -34.3734245300293, "global_step": 39773, "epoch": 328} {"train_loss": -34.70998764038086, "global_step": 39774, "epoch": 328} {"train_loss": -34.46405029296875, "global_step": 39775, "epoch": 328} {"train_loss": -33.4935417175293, "global_step": 39776, "epoch": 328} {"train_loss": -34.05923080444336, "global_step": 39777, "epoch": 328} {"train_loss": -34.37449264526367, "global_step": 39778, "epoch": 328} {"train_loss": -34.48060607910156, "global_step": 39779, "epoch": 328} {"train_loss": -34.415401458740234, "global_step": 39780, "epoch": 328} {"train_loss": -34.15590286254883, "global_step": 39781, "epoch": 328} {"train_loss": -32.54785919189453, "global_step": 39782, "epoch": 328} {"train_loss": -31.018136978149414, "global_step": 39783, "epoch": 328} {"train_loss": -28.31064796447754, "global_step": 39784, "epoch": 328} {"train_loss": -27.171600341796875, "global_step": 39785, "epoch": 328} {"train_loss": -23.50452995300293, "global_step": 39786, "epoch": 328} {"train_loss": -22.79598045349121, "global_step": 39787, "epoch": 328} {"train_loss": -24.07111930847168, "global_step": 39788, "epoch": 328} {"train_loss": -21.8561954498291, "global_step": 39789, "epoch": 328} {"train_loss": -22.755990982055664, "global_step": 39790, "epoch": 328} {"train_loss": -29.029605865478516, "global_step": 39791, "epoch": 328} {"train_loss": -31.21858787536621, "global_step": 39792, "epoch": 328} {"train_loss": -30.526931762695312, "global_step": 39793, "epoch": 328} {"train_loss": -31.69695472717285, "global_step": 39794, "epoch": 328} {"train_loss": -29.822742462158203, "global_step": 39795, "epoch": 328} {"train_loss": -31.18586540222168, "global_step": 39796, "epoch": 328} {"train_loss": -30.522846221923828, "global_step": 39797, "epoch": 328} {"train_loss": -31.22275161743164, "global_step": 39798, "epoch": 328} {"train_loss": -32.41030502319336, "global_step": 39799, "epoch": 328} {"train_loss": -31.49649429321289, "global_step": 39800, "epoch": 328} {"train_loss": -31.679340362548828, "global_step": 39801, "epoch": 328} {"train_loss": -32.24959182739258, "global_step": 39802, "epoch": 328} {"train_loss": -32.691585540771484, "global_step": 39803, "epoch": 328} {"train_loss": -31.454320907592773, "global_step": 39804, "epoch": 328} {"train_loss": -32.753746032714844, "global_step": 39805, "epoch": 328} {"train_loss": -32.05596923828125, "global_step": 39806, "epoch": 328} {"train_loss": -32.48868942260742, "global_step": 39807, "epoch": 328} {"train_loss": -32.104323789107895, "global_step": 39808, "epoch": 328, "val_loss": 2611724.75} {"train_loss": -32.22892761230469, "global_step": 39809, "epoch": 329} {"train_loss": -32.44684982299805, "global_step": 39810, "epoch": 329} {"train_loss": -33.35256576538086, "global_step": 39811, "epoch": 329} {"train_loss": -32.40470504760742, "global_step": 39812, "epoch": 329} {"train_loss": -32.95127487182617, "global_step": 39813, "epoch": 329} {"train_loss": -33.29560852050781, "global_step": 39814, "epoch": 329} {"train_loss": -32.70942306518555, "global_step": 39815, "epoch": 329} {"train_loss": -33.22368621826172, "global_step": 39816, "epoch": 329} {"train_loss": -32.9553108215332, "global_step": 39817, "epoch": 329} {"train_loss": -32.7464485168457, "global_step": 39818, "epoch": 329} {"train_loss": -33.31047439575195, "global_step": 39819, "epoch": 329} {"train_loss": -33.82203674316406, "global_step": 39820, "epoch": 329} {"train_loss": -33.363250732421875, "global_step": 39821, "epoch": 329} {"train_loss": -33.18581771850586, "global_step": 39822, "epoch": 329} {"train_loss": -32.36113357543945, "global_step": 39823, "epoch": 329} {"train_loss": -33.594600677490234, "global_step": 39824, "epoch": 329} {"train_loss": -33.254512786865234, "global_step": 39825, "epoch": 329} {"train_loss": -32.502437591552734, "global_step": 39826, "epoch": 329} {"train_loss": -31.078582763671875, "global_step": 39827, "epoch": 329} {"train_loss": -31.973875045776367, "global_step": 39828, "epoch": 329} {"train_loss": -32.877349853515625, "global_step": 39829, "epoch": 329} {"train_loss": -33.354339599609375, "global_step": 39830, "epoch": 329} {"train_loss": -32.351314544677734, "global_step": 39831, "epoch": 329} {"train_loss": -32.21208572387695, "global_step": 39832, "epoch": 329} {"train_loss": -33.186946868896484, "global_step": 39833, "epoch": 329} {"train_loss": -33.797760009765625, "global_step": 39834, "epoch": 329} {"train_loss": -33.28913116455078, "global_step": 39835, "epoch": 329} {"train_loss": -32.838783264160156, "global_step": 39836, "epoch": 329} {"train_loss": -32.79712677001953, "global_step": 39837, "epoch": 329} {"train_loss": -33.216373443603516, "global_step": 39838, "epoch": 329} {"train_loss": -33.10624313354492, "global_step": 39839, "epoch": 329} {"train_loss": -33.40818405151367, "global_step": 39840, "epoch": 329} {"train_loss": -33.49842071533203, "global_step": 39841, "epoch": 329} {"train_loss": -32.71224594116211, "global_step": 39842, "epoch": 329} {"train_loss": -33.53886413574219, "global_step": 39843, "epoch": 329} {"train_loss": -33.39455032348633, "global_step": 39844, "epoch": 329} {"train_loss": -33.36812973022461, "global_step": 39845, "epoch": 329} {"train_loss": -33.85272979736328, "global_step": 39846, "epoch": 329} {"train_loss": -33.70740509033203, "global_step": 39847, "epoch": 329} {"train_loss": -33.72096633911133, "global_step": 39848, "epoch": 329} {"train_loss": -32.79361343383789, "global_step": 39849, "epoch": 329} {"train_loss": -33.66309356689453, "global_step": 39850, "epoch": 329} {"train_loss": -33.53762435913086, "global_step": 39851, "epoch": 329} {"train_loss": -33.416378021240234, "global_step": 39852, "epoch": 329} {"train_loss": -33.835914611816406, "global_step": 39853, "epoch": 329} {"train_loss": -33.93852996826172, "global_step": 39854, "epoch": 329} {"train_loss": -34.140106201171875, "global_step": 39855, "epoch": 329} {"train_loss": -34.287940979003906, "global_step": 39856, "epoch": 329} {"train_loss": -33.816551208496094, "global_step": 39857, "epoch": 329} {"train_loss": -33.863643646240234, "global_step": 39858, "epoch": 329} {"train_loss": -33.93556594848633, "global_step": 39859, "epoch": 329} {"train_loss": -34.1681022644043, "global_step": 39860, "epoch": 329} {"train_loss": -33.72385787963867, "global_step": 39861, "epoch": 329} {"train_loss": -33.91465377807617, "global_step": 39862, "epoch": 329} {"train_loss": -34.41929244995117, "global_step": 39863, "epoch": 329} {"train_loss": -34.40517044067383, "global_step": 39864, "epoch": 329} {"train_loss": -34.013797760009766, "global_step": 39865, "epoch": 329} {"train_loss": -34.226497650146484, "global_step": 39866, "epoch": 329} {"train_loss": -34.032894134521484, "global_step": 39867, "epoch": 329} {"train_loss": -34.177886962890625, "global_step": 39868, "epoch": 329} {"train_loss": -33.672176361083984, "global_step": 39869, "epoch": 329} {"train_loss": -34.41486740112305, "global_step": 39870, "epoch": 329} {"train_loss": -33.865596771240234, "global_step": 39871, "epoch": 329} {"train_loss": -34.64332962036133, "global_step": 39872, "epoch": 329} {"train_loss": -33.47517013549805, "global_step": 39873, "epoch": 329} {"train_loss": -34.57455062866211, "global_step": 39874, "epoch": 329} {"train_loss": -33.304901123046875, "global_step": 39875, "epoch": 329} {"train_loss": -32.413570404052734, "global_step": 39876, "epoch": 329} {"train_loss": -32.29100799560547, "global_step": 39877, "epoch": 329} {"train_loss": -33.65324020385742, "global_step": 39878, "epoch": 329} {"train_loss": -32.89760208129883, "global_step": 39879, "epoch": 329} {"train_loss": -33.957698822021484, "global_step": 39880, "epoch": 329} {"train_loss": -32.46747970581055, "global_step": 39881, "epoch": 329} {"train_loss": -33.651763916015625, "global_step": 39882, "epoch": 329} {"train_loss": -33.586490631103516, "global_step": 39883, "epoch": 329} {"train_loss": -32.54486083984375, "global_step": 39884, "epoch": 329} {"train_loss": -33.797359466552734, "global_step": 39885, "epoch": 329} {"train_loss": -33.61311340332031, "global_step": 39886, "epoch": 329} {"train_loss": -33.45568084716797, "global_step": 39887, "epoch": 329} {"train_loss": -33.7886848449707, "global_step": 39888, "epoch": 329} {"train_loss": -34.02068328857422, "global_step": 39889, "epoch": 329} {"train_loss": -33.09886932373047, "global_step": 39890, "epoch": 329} {"train_loss": -33.217220306396484, "global_step": 39891, "epoch": 329} {"train_loss": -32.513916015625, "global_step": 39892, "epoch": 329} {"train_loss": -32.902259826660156, "global_step": 39893, "epoch": 329} {"train_loss": -33.09455871582031, "global_step": 39894, "epoch": 329} {"train_loss": -31.87306022644043, "global_step": 39895, "epoch": 329} {"train_loss": -30.970687866210938, "global_step": 39896, "epoch": 329} {"train_loss": -31.55889892578125, "global_step": 39897, "epoch": 329} {"train_loss": -31.969877243041992, "global_step": 39898, "epoch": 329} {"train_loss": -31.791772842407227, "global_step": 39899, "epoch": 329} {"train_loss": -31.1754207611084, "global_step": 39900, "epoch": 329} {"train_loss": -32.78223419189453, "global_step": 39901, "epoch": 329} {"train_loss": -32.46369552612305, "global_step": 39902, "epoch": 329} {"train_loss": -31.45570182800293, "global_step": 39903, "epoch": 329} {"train_loss": -33.03345489501953, "global_step": 39904, "epoch": 329} {"train_loss": -32.69538116455078, "global_step": 39905, "epoch": 329} {"train_loss": -30.158857345581055, "global_step": 39906, "epoch": 329} {"train_loss": -30.984054565429688, "global_step": 39907, "epoch": 329} {"train_loss": -31.854537963867188, "global_step": 39908, "epoch": 329} {"train_loss": -32.2304573059082, "global_step": 39909, "epoch": 329} {"train_loss": -32.13621139526367, "global_step": 39910, "epoch": 329} {"train_loss": -32.959938049316406, "global_step": 39911, "epoch": 329} {"train_loss": -33.344181060791016, "global_step": 39912, "epoch": 329} {"train_loss": -32.33770751953125, "global_step": 39913, "epoch": 329} {"train_loss": -32.305564880371094, "global_step": 39914, "epoch": 329} {"train_loss": -32.61558151245117, "global_step": 39915, "epoch": 329} {"train_loss": -32.11812973022461, "global_step": 39916, "epoch": 329} {"train_loss": -32.129852294921875, "global_step": 39917, "epoch": 329} {"train_loss": -32.49080276489258, "global_step": 39918, "epoch": 329} {"train_loss": -33.22166061401367, "global_step": 39919, "epoch": 329} {"train_loss": -33.04673385620117, "global_step": 39920, "epoch": 329} {"train_loss": -32.96916961669922, "global_step": 39921, "epoch": 329} {"train_loss": -33.143409729003906, "global_step": 39922, "epoch": 329} {"train_loss": -32.90879440307617, "global_step": 39923, "epoch": 329} {"train_loss": -33.53938293457031, "global_step": 39924, "epoch": 329} {"train_loss": -33.38017654418945, "global_step": 39925, "epoch": 329} {"train_loss": -33.71387481689453, "global_step": 39926, "epoch": 329} {"train_loss": -33.908203125, "global_step": 39927, "epoch": 329} {"train_loss": -33.85105895996094, "global_step": 39928, "epoch": 329} {"train_loss": -33.10157994987551, "global_step": 39929, "epoch": 329, "val_loss": 2659777.0} {"train_loss": -33.95863723754883, "global_step": 39930, "epoch": 330} {"train_loss": -33.795440673828125, "global_step": 39931, "epoch": 330} {"train_loss": -34.19603729248047, "global_step": 39932, "epoch": 330} {"train_loss": -33.27347946166992, "global_step": 39933, "epoch": 330} {"train_loss": -34.245052337646484, "global_step": 39934, "epoch": 330} {"train_loss": -33.96446990966797, "global_step": 39935, "epoch": 330} {"train_loss": -34.098140716552734, "global_step": 39936, "epoch": 330} {"train_loss": -34.488861083984375, "global_step": 39937, "epoch": 330} {"train_loss": -34.296443939208984, "global_step": 39938, "epoch": 330} {"train_loss": -34.28916549682617, "global_step": 39939, "epoch": 330} {"train_loss": -33.9478874206543, "global_step": 39940, "epoch": 330} {"train_loss": -34.440711975097656, "global_step": 39941, "epoch": 330} {"train_loss": -34.356868743896484, "global_step": 39942, "epoch": 330} {"train_loss": -34.53078842163086, "global_step": 39943, "epoch": 330} {"train_loss": -34.66204833984375, "global_step": 39944, "epoch": 330} {"train_loss": -34.11342239379883, "global_step": 39945, "epoch": 330} {"train_loss": -34.68955612182617, "global_step": 39946, "epoch": 330} {"train_loss": -34.634437561035156, "global_step": 39947, "epoch": 330} {"train_loss": -34.85971450805664, "global_step": 39948, "epoch": 330} {"train_loss": -34.575439453125, "global_step": 39949, "epoch": 330} {"train_loss": -35.09074020385742, "global_step": 39950, "epoch": 330} {"train_loss": -34.86064529418945, "global_step": 39951, "epoch": 330} {"train_loss": -34.849727630615234, "global_step": 39952, "epoch": 330} {"train_loss": -34.88225555419922, "global_step": 39953, "epoch": 330} {"train_loss": -35.2029914855957, "global_step": 39954, "epoch": 330} {"train_loss": -34.94808578491211, "global_step": 39955, "epoch": 330} {"train_loss": -35.0395622253418, "global_step": 39956, "epoch": 330} {"train_loss": -34.973567962646484, "global_step": 39957, "epoch": 330} {"train_loss": -34.342750549316406, "global_step": 39958, "epoch": 330} {"train_loss": -33.41665267944336, "global_step": 39959, "epoch": 330} {"train_loss": -32.9439811706543, "global_step": 39960, "epoch": 330} {"train_loss": -32.55402755737305, "global_step": 39961, "epoch": 330} {"train_loss": -34.05989456176758, "global_step": 39962, "epoch": 330} {"train_loss": -34.695552825927734, "global_step": 39963, "epoch": 330} {"train_loss": -35.19984817504883, "global_step": 39964, "epoch": 330} {"train_loss": -33.54848098754883, "global_step": 39965, "epoch": 330} {"train_loss": -32.86810302734375, "global_step": 39966, "epoch": 330} {"train_loss": -33.4431266784668, "global_step": 39967, "epoch": 330} {"train_loss": -34.08134078979492, "global_step": 39968, "epoch": 330} {"train_loss": -34.22815704345703, "global_step": 39969, "epoch": 330} {"train_loss": -33.37700271606445, "global_step": 39970, "epoch": 330} {"train_loss": -34.1070442199707, "global_step": 39971, "epoch": 330} {"train_loss": -35.419715881347656, "global_step": 39972, "epoch": 330} {"train_loss": -34.45208740234375, "global_step": 39973, "epoch": 330} {"train_loss": -34.50050735473633, "global_step": 39974, "epoch": 330} {"train_loss": -34.48568344116211, "global_step": 39975, "epoch": 330} {"train_loss": -34.49231719970703, "global_step": 39976, "epoch": 330} {"train_loss": -34.51577377319336, "global_step": 39977, "epoch": 330} {"train_loss": -34.23821258544922, "global_step": 39978, "epoch": 330} {"train_loss": -33.33293151855469, "global_step": 39979, "epoch": 330} {"train_loss": -35.12163543701172, "global_step": 39980, "epoch": 330} {"train_loss": -34.36553192138672, "global_step": 39981, "epoch": 330} {"train_loss": -33.84856033325195, "global_step": 39982, "epoch": 330} {"train_loss": -33.74189376831055, "global_step": 39983, "epoch": 330} {"train_loss": -33.9519157409668, "global_step": 39984, "epoch": 330} {"train_loss": -33.852989196777344, "global_step": 39985, "epoch": 330} {"train_loss": -29.386972427368164, "global_step": 39986, "epoch": 330} {"train_loss": -24.012720108032227, "global_step": 39987, "epoch": 330} {"train_loss": -16.373701095581055, "global_step": 39988, "epoch": 330} {"train_loss": -18.42866325378418, "global_step": 39989, "epoch": 330} {"train_loss": -32.10859298706055, "global_step": 39990, "epoch": 330} {"train_loss": -27.2452449798584, "global_step": 39991, "epoch": 330} {"train_loss": -33.00486373901367, "global_step": 39992, "epoch": 330} {"train_loss": -30.240549087524414, "global_step": 39993, "epoch": 330} {"train_loss": -33.48944091796875, "global_step": 39994, "epoch": 330} {"train_loss": -32.261810302734375, "global_step": 39995, "epoch": 330} {"train_loss": -31.992883682250977, "global_step": 39996, "epoch": 330} {"train_loss": -32.39870071411133, "global_step": 39997, "epoch": 330} {"train_loss": -33.15476989746094, "global_step": 39998, "epoch": 330} {"train_loss": -32.522254943847656, "global_step": 39999, "epoch": 330} {"train_loss": -33.588661193847656, "global_step": 40000, "epoch": 330} {"train_loss": -33.068763732910156, "global_step": 40001, "epoch": 330} {"train_loss": -33.26151657104492, "global_step": 40002, "epoch": 330} {"train_loss": -32.46215057373047, "global_step": 40003, "epoch": 330} {"train_loss": -33.81757736206055, "global_step": 40004, "epoch": 330} {"train_loss": -33.62437438964844, "global_step": 40005, "epoch": 330} {"train_loss": -33.60146713256836, "global_step": 40006, "epoch": 330} {"train_loss": -33.679996490478516, "global_step": 40007, "epoch": 330} {"train_loss": -33.412147521972656, "global_step": 40008, "epoch": 330} {"train_loss": -33.80843734741211, "global_step": 40009, "epoch": 330} {"train_loss": -34.20602035522461, "global_step": 40010, "epoch": 330} {"train_loss": -33.341094970703125, "global_step": 40011, "epoch": 330} {"train_loss": -34.04501724243164, "global_step": 40012, "epoch": 330} {"train_loss": -33.457401275634766, "global_step": 40013, "epoch": 330} {"train_loss": -34.00128936767578, "global_step": 40014, "epoch": 330} {"train_loss": -33.99121856689453, "global_step": 40015, "epoch": 330} {"train_loss": -34.210819244384766, "global_step": 40016, "epoch": 330} {"train_loss": -34.37553024291992, "global_step": 40017, "epoch": 330} {"train_loss": -33.55525588989258, "global_step": 40018, "epoch": 330} {"train_loss": -34.14909362792969, "global_step": 40019, "epoch": 330} {"train_loss": -34.22733688354492, "global_step": 40020, "epoch": 330} {"train_loss": -34.0518684387207, "global_step": 40021, "epoch": 330} {"train_loss": -33.9345817565918, "global_step": 40022, "epoch": 330} {"train_loss": -34.04602813720703, "global_step": 40023, "epoch": 330} {"train_loss": -33.934326171875, "global_step": 40024, "epoch": 330} {"train_loss": -34.46788024902344, "global_step": 40025, "epoch": 330} {"train_loss": -33.81806945800781, "global_step": 40026, "epoch": 330} {"train_loss": -34.411739349365234, "global_step": 40027, "epoch": 330} {"train_loss": -33.457557678222656, "global_step": 40028, "epoch": 330} {"train_loss": -34.21106719970703, "global_step": 40029, "epoch": 330} {"train_loss": -33.938724517822266, "global_step": 40030, "epoch": 330} {"train_loss": -34.063079833984375, "global_step": 40031, "epoch": 330} {"train_loss": -34.36573791503906, "global_step": 40032, "epoch": 330} {"train_loss": -33.64515686035156, "global_step": 40033, "epoch": 330} {"train_loss": -34.01618576049805, "global_step": 40034, "epoch": 330} {"train_loss": -32.9779167175293, "global_step": 40035, "epoch": 330} {"train_loss": -31.936878204345703, "global_step": 40036, "epoch": 330} {"train_loss": -29.848108291625977, "global_step": 40037, "epoch": 330} {"train_loss": -29.15106201171875, "global_step": 40038, "epoch": 330} {"train_loss": -27.4733829498291, "global_step": 40039, "epoch": 330} {"train_loss": -27.73529624938965, "global_step": 40040, "epoch": 330} {"train_loss": -30.341617584228516, "global_step": 40041, "epoch": 330} {"train_loss": -33.43906784057617, "global_step": 40042, "epoch": 330} {"train_loss": -31.486841201782227, "global_step": 40043, "epoch": 330} {"train_loss": -33.24382019042969, "global_step": 40044, "epoch": 330} {"train_loss": -31.487817764282227, "global_step": 40045, "epoch": 330} {"train_loss": -33.733428955078125, "global_step": 40046, "epoch": 330} {"train_loss": -30.8518123626709, "global_step": 40047, "epoch": 330} {"train_loss": -33.034149169921875, "global_step": 40048, "epoch": 330} {"train_loss": -32.50110626220703, "global_step": 40049, "epoch": 330} {"train_loss": -33.15599200351179, "global_step": 40050, "epoch": 330, "val_loss": 2605606.25} {"train_loss": -32.6886100769043, "global_step": 40051, "epoch": 331} {"train_loss": -33.85194778442383, "global_step": 40052, "epoch": 331} {"train_loss": -33.60676574707031, "global_step": 40053, "epoch": 331} {"train_loss": -33.04841613769531, "global_step": 40054, "epoch": 331} {"train_loss": -33.41515350341797, "global_step": 40055, "epoch": 331} {"train_loss": -33.4790153503418, "global_step": 40056, "epoch": 331} {"train_loss": -33.72354507446289, "global_step": 40057, "epoch": 331} {"train_loss": -33.86676788330078, "global_step": 40058, "epoch": 331} {"train_loss": -33.88580322265625, "global_step": 40059, "epoch": 331} {"train_loss": -33.740333557128906, "global_step": 40060, "epoch": 331} {"train_loss": -33.75697326660156, "global_step": 40061, "epoch": 331} {"train_loss": -33.881263732910156, "global_step": 40062, "epoch": 331} {"train_loss": -33.834346771240234, "global_step": 40063, "epoch": 331} {"train_loss": -34.06902313232422, "global_step": 40064, "epoch": 331} {"train_loss": -33.67509078979492, "global_step": 40065, "epoch": 331} {"train_loss": -33.909915924072266, "global_step": 40066, "epoch": 331} {"train_loss": -33.47628402709961, "global_step": 40067, "epoch": 331} {"train_loss": -33.880271911621094, "global_step": 40068, "epoch": 331} {"train_loss": -34.43707275390625, "global_step": 40069, "epoch": 331} {"train_loss": -34.316158294677734, "global_step": 40070, "epoch": 331} {"train_loss": -34.53116989135742, "global_step": 40071, "epoch": 331} {"train_loss": -33.92943572998047, "global_step": 40072, "epoch": 331} {"train_loss": -33.98792266845703, "global_step": 40073, "epoch": 331} {"train_loss": -34.179439544677734, "global_step": 40074, "epoch": 331} {"train_loss": -34.162384033203125, "global_step": 40075, "epoch": 331} {"train_loss": -33.86897659301758, "global_step": 40076, "epoch": 331} {"train_loss": -34.691131591796875, "global_step": 40077, "epoch": 331} {"train_loss": -33.91102981567383, "global_step": 40078, "epoch": 331} {"train_loss": -34.044708251953125, "global_step": 40079, "epoch": 331} {"train_loss": -34.5846061706543, "global_step": 40080, "epoch": 331} {"train_loss": -34.74979782104492, "global_step": 40081, "epoch": 331} {"train_loss": -34.341773986816406, "global_step": 40082, "epoch": 331} {"train_loss": -33.12370681762695, "global_step": 40083, "epoch": 331} {"train_loss": -32.774566650390625, "global_step": 40084, "epoch": 331} {"train_loss": -31.778430938720703, "global_step": 40085, "epoch": 331} {"train_loss": -27.083587646484375, "global_step": 40086, "epoch": 331} {"train_loss": -19.987112045288086, "global_step": 40087, "epoch": 331} {"train_loss": -17.601428985595703, "global_step": 40088, "epoch": 331} {"train_loss": -27.41969108581543, "global_step": 40089, "epoch": 331} {"train_loss": -32.63887405395508, "global_step": 40090, "epoch": 331} {"train_loss": -27.61933708190918, "global_step": 40091, "epoch": 331} {"train_loss": -33.802650451660156, "global_step": 40092, "epoch": 331} {"train_loss": -29.967798233032227, "global_step": 40093, "epoch": 331} {"train_loss": -33.370216369628906, "global_step": 40094, "epoch": 331} {"train_loss": -31.677661895751953, "global_step": 40095, "epoch": 331} {"train_loss": -32.266845703125, "global_step": 40096, "epoch": 331} {"train_loss": -33.493709564208984, "global_step": 40097, "epoch": 331} {"train_loss": -32.90067672729492, "global_step": 40098, "epoch": 331} {"train_loss": -33.11979293823242, "global_step": 40099, "epoch": 331} {"train_loss": -33.74905014038086, "global_step": 40100, "epoch": 331} {"train_loss": -33.41327667236328, "global_step": 40101, "epoch": 331} {"train_loss": -32.74055099487305, "global_step": 40102, "epoch": 331} {"train_loss": -33.683589935302734, "global_step": 40103, "epoch": 331} {"train_loss": -33.69548416137695, "global_step": 40104, "epoch": 331} {"train_loss": -33.49452590942383, "global_step": 40105, "epoch": 331} {"train_loss": -33.70045852661133, "global_step": 40106, "epoch": 331} {"train_loss": -34.01436996459961, "global_step": 40107, "epoch": 331} {"train_loss": -33.36848831176758, "global_step": 40108, "epoch": 331} {"train_loss": -33.07171630859375, "global_step": 40109, "epoch": 331} {"train_loss": -33.700740814208984, "global_step": 40110, "epoch": 331} {"train_loss": -33.62765121459961, "global_step": 40111, "epoch": 331} {"train_loss": -33.57404327392578, "global_step": 40112, "epoch": 331} {"train_loss": -33.025081634521484, "global_step": 40113, "epoch": 331} {"train_loss": -32.598731994628906, "global_step": 40114, "epoch": 331} {"train_loss": -34.00344467163086, "global_step": 40115, "epoch": 331} {"train_loss": -32.74974060058594, "global_step": 40116, "epoch": 331} {"train_loss": -33.574005126953125, "global_step": 40117, "epoch": 331} {"train_loss": -33.37701416015625, "global_step": 40118, "epoch": 331} {"train_loss": -33.811317443847656, "global_step": 40119, "epoch": 331} {"train_loss": -33.82484817504883, "global_step": 40120, "epoch": 331} {"train_loss": -33.65043258666992, "global_step": 40121, "epoch": 331} {"train_loss": -34.19608688354492, "global_step": 40122, "epoch": 331} {"train_loss": -33.75346755981445, "global_step": 40123, "epoch": 331} {"train_loss": -33.91081619262695, "global_step": 40124, "epoch": 331} {"train_loss": -34.323307037353516, "global_step": 40125, "epoch": 331} {"train_loss": -33.42836380004883, "global_step": 40126, "epoch": 331} {"train_loss": -34.217525482177734, "global_step": 40127, "epoch": 331} {"train_loss": -34.05914306640625, "global_step": 40128, "epoch": 331} {"train_loss": -34.0883674621582, "global_step": 40129, "epoch": 331} {"train_loss": -34.39892578125, "global_step": 40130, "epoch": 331} {"train_loss": -34.39986038208008, "global_step": 40131, "epoch": 331} {"train_loss": -34.18830490112305, "global_step": 40132, "epoch": 331} {"train_loss": -34.527191162109375, "global_step": 40133, "epoch": 331} {"train_loss": -32.942726135253906, "global_step": 40134, "epoch": 331} {"train_loss": -33.46306228637695, "global_step": 40135, "epoch": 331} {"train_loss": -32.950477600097656, "global_step": 40136, "epoch": 331} {"train_loss": -33.41744613647461, "global_step": 40137, "epoch": 331} {"train_loss": -34.347625732421875, "global_step": 40138, "epoch": 331} {"train_loss": -33.45919418334961, "global_step": 40139, "epoch": 331} {"train_loss": -33.971988677978516, "global_step": 40140, "epoch": 331} {"train_loss": -34.59614181518555, "global_step": 40141, "epoch": 331} {"train_loss": -34.17338180541992, "global_step": 40142, "epoch": 331} {"train_loss": -34.15945053100586, "global_step": 40143, "epoch": 331} {"train_loss": -33.6799430847168, "global_step": 40144, "epoch": 331} {"train_loss": -34.085330963134766, "global_step": 40145, "epoch": 331} {"train_loss": -33.61613845825195, "global_step": 40146, "epoch": 331} {"train_loss": -34.09382247924805, "global_step": 40147, "epoch": 331} {"train_loss": -34.5799674987793, "global_step": 40148, "epoch": 331} {"train_loss": -33.69697570800781, "global_step": 40149, "epoch": 331} {"train_loss": -34.448944091796875, "global_step": 40150, "epoch": 331} {"train_loss": -33.554866790771484, "global_step": 40151, "epoch": 331} {"train_loss": -33.675838470458984, "global_step": 40152, "epoch": 331} {"train_loss": -32.79835891723633, "global_step": 40153, "epoch": 331} {"train_loss": -33.958534240722656, "global_step": 40154, "epoch": 331} {"train_loss": -33.91761779785156, "global_step": 40155, "epoch": 331} {"train_loss": -33.192359924316406, "global_step": 40156, "epoch": 331} {"train_loss": -33.95026779174805, "global_step": 40157, "epoch": 331} {"train_loss": -33.784767150878906, "global_step": 40158, "epoch": 331} {"train_loss": -33.7685432434082, "global_step": 40159, "epoch": 331} {"train_loss": -33.96657943725586, "global_step": 40160, "epoch": 331} {"train_loss": -33.13386154174805, "global_step": 40161, "epoch": 331} {"train_loss": -34.09885787963867, "global_step": 40162, "epoch": 331} {"train_loss": -33.77022933959961, "global_step": 40163, "epoch": 331} {"train_loss": -33.48208999633789, "global_step": 40164, "epoch": 331} {"train_loss": -34.24299240112305, "global_step": 40165, "epoch": 331} {"train_loss": -32.60715866088867, "global_step": 40166, "epoch": 331} {"train_loss": -34.0894889831543, "global_step": 40167, "epoch": 331} {"train_loss": -33.716793060302734, "global_step": 40168, "epoch": 331} {"train_loss": -34.3595085144043, "global_step": 40169, "epoch": 331} {"train_loss": -33.66090774536133, "global_step": 40170, "epoch": 331} {"train_loss": -33.269105863965244, "global_step": 40171, "epoch": 331, "val_loss": 2700598.0} {"train_loss": -33.96384811401367, "global_step": 40172, "epoch": 332} {"train_loss": -33.9459114074707, "global_step": 40173, "epoch": 332} {"train_loss": -34.269344329833984, "global_step": 40174, "epoch": 332} {"train_loss": -33.79914474487305, "global_step": 40175, "epoch": 332} {"train_loss": -33.60371398925781, "global_step": 40176, "epoch": 332} {"train_loss": -34.366695404052734, "global_step": 40177, "epoch": 332} {"train_loss": -33.45101547241211, "global_step": 40178, "epoch": 332} {"train_loss": -34.163665771484375, "global_step": 40179, "epoch": 332} {"train_loss": -34.29838180541992, "global_step": 40180, "epoch": 332} {"train_loss": -33.803646087646484, "global_step": 40181, "epoch": 332} {"train_loss": -34.161651611328125, "global_step": 40182, "epoch": 332} {"train_loss": -34.521568298339844, "global_step": 40183, "epoch": 332} {"train_loss": -34.12551498413086, "global_step": 40184, "epoch": 332} {"train_loss": -33.71201705932617, "global_step": 40185, "epoch": 332} {"train_loss": -34.551639556884766, "global_step": 40186, "epoch": 332} {"train_loss": -34.45185089111328, "global_step": 40187, "epoch": 332} {"train_loss": -34.36723327636719, "global_step": 40188, "epoch": 332} {"train_loss": -34.26398468017578, "global_step": 40189, "epoch": 332} {"train_loss": -34.6112174987793, "global_step": 40190, "epoch": 332} {"train_loss": -34.655853271484375, "global_step": 40191, "epoch": 332} {"train_loss": -34.69403839111328, "global_step": 40192, "epoch": 332} {"train_loss": -34.120086669921875, "global_step": 40193, "epoch": 332} {"train_loss": -34.817378997802734, "global_step": 40194, "epoch": 332} {"train_loss": -34.81905746459961, "global_step": 40195, "epoch": 332} {"train_loss": -34.533973693847656, "global_step": 40196, "epoch": 332} {"train_loss": -34.2609977722168, "global_step": 40197, "epoch": 332} {"train_loss": -34.75114822387695, "global_step": 40198, "epoch": 332} {"train_loss": -34.8070182800293, "global_step": 40199, "epoch": 332} {"train_loss": -34.562068939208984, "global_step": 40200, "epoch": 332} {"train_loss": -34.12861633300781, "global_step": 40201, "epoch": 332} {"train_loss": -34.44430923461914, "global_step": 40202, "epoch": 332} {"train_loss": -34.27041244506836, "global_step": 40203, "epoch": 332} {"train_loss": -35.23830032348633, "global_step": 40204, "epoch": 332} {"train_loss": -33.094234466552734, "global_step": 40205, "epoch": 332} {"train_loss": -33.5401611328125, "global_step": 40206, "epoch": 332} {"train_loss": -34.432838439941406, "global_step": 40207, "epoch": 332} {"train_loss": -33.13055419921875, "global_step": 40208, "epoch": 332} {"train_loss": -34.31039047241211, "global_step": 40209, "epoch": 332} {"train_loss": -33.387874603271484, "global_step": 40210, "epoch": 332} {"train_loss": -34.2818717956543, "global_step": 40211, "epoch": 332} {"train_loss": -33.46733093261719, "global_step": 40212, "epoch": 332} {"train_loss": -32.552207946777344, "global_step": 40213, "epoch": 332} {"train_loss": -33.78217315673828, "global_step": 40214, "epoch": 332} {"train_loss": -33.14327621459961, "global_step": 40215, "epoch": 332} {"train_loss": -32.95930099487305, "global_step": 40216, "epoch": 332} {"train_loss": -32.51017379760742, "global_step": 40217, "epoch": 332} {"train_loss": -32.81748962402344, "global_step": 40218, "epoch": 332} {"train_loss": -34.40332794189453, "global_step": 40219, "epoch": 332} {"train_loss": -33.24167251586914, "global_step": 40220, "epoch": 332} {"train_loss": -33.86542510986328, "global_step": 40221, "epoch": 332} {"train_loss": -34.671600341796875, "global_step": 40222, "epoch": 332} {"train_loss": -34.09534454345703, "global_step": 40223, "epoch": 332} {"train_loss": -33.15043640136719, "global_step": 40224, "epoch": 332} {"train_loss": -33.61552429199219, "global_step": 40225, "epoch": 332} {"train_loss": -33.23358154296875, "global_step": 40226, "epoch": 332} {"train_loss": -32.80491638183594, "global_step": 40227, "epoch": 332} {"train_loss": -33.89429473876953, "global_step": 40228, "epoch": 332} {"train_loss": -34.11490249633789, "global_step": 40229, "epoch": 332} {"train_loss": -33.87538528442383, "global_step": 40230, "epoch": 332} {"train_loss": -34.56345748901367, "global_step": 40231, "epoch": 332} {"train_loss": -33.83100128173828, "global_step": 40232, "epoch": 332} {"train_loss": -34.28608322143555, "global_step": 40233, "epoch": 332} {"train_loss": -33.92887878417969, "global_step": 40234, "epoch": 332} {"train_loss": -33.894649505615234, "global_step": 40235, "epoch": 332} {"train_loss": -33.65510177612305, "global_step": 40236, "epoch": 332} {"train_loss": -33.70751953125, "global_step": 40237, "epoch": 332} {"train_loss": -34.36145782470703, "global_step": 40238, "epoch": 332} {"train_loss": -33.95281219482422, "global_step": 40239, "epoch": 332} {"train_loss": -32.2542610168457, "global_step": 40240, "epoch": 332} {"train_loss": -32.21629333496094, "global_step": 40241, "epoch": 332} {"train_loss": -34.24445724487305, "global_step": 40242, "epoch": 332} {"train_loss": -34.42818832397461, "global_step": 40243, "epoch": 332} {"train_loss": -33.9755973815918, "global_step": 40244, "epoch": 332} {"train_loss": -34.52974319458008, "global_step": 40245, "epoch": 332} {"train_loss": -34.2337646484375, "global_step": 40246, "epoch": 332} {"train_loss": -34.17207717895508, "global_step": 40247, "epoch": 332} {"train_loss": -34.60539627075195, "global_step": 40248, "epoch": 332} {"train_loss": -34.85029602050781, "global_step": 40249, "epoch": 332} {"train_loss": -34.2320671081543, "global_step": 40250, "epoch": 332} {"train_loss": -34.551368713378906, "global_step": 40251, "epoch": 332} {"train_loss": -34.47907638549805, "global_step": 40252, "epoch": 332} {"train_loss": -34.90177536010742, "global_step": 40253, "epoch": 332} {"train_loss": -34.78468704223633, "global_step": 40254, "epoch": 332} {"train_loss": -35.30392837524414, "global_step": 40255, "epoch": 332} {"train_loss": -34.1550407409668, "global_step": 40256, "epoch": 332} {"train_loss": -34.839141845703125, "global_step": 40257, "epoch": 332} {"train_loss": -34.73930358886719, "global_step": 40258, "epoch": 332} {"train_loss": -33.889095306396484, "global_step": 40259, "epoch": 332} {"train_loss": -34.48613739013672, "global_step": 40260, "epoch": 332} {"train_loss": -33.962154388427734, "global_step": 40261, "epoch": 332} {"train_loss": -34.250911712646484, "global_step": 40262, "epoch": 332} {"train_loss": -33.17169189453125, "global_step": 40263, "epoch": 332} {"train_loss": -33.53377151489258, "global_step": 40264, "epoch": 332} {"train_loss": -34.50641632080078, "global_step": 40265, "epoch": 332} {"train_loss": -33.782501220703125, "global_step": 40266, "epoch": 332} {"train_loss": -33.906795501708984, "global_step": 40267, "epoch": 332} {"train_loss": -34.36672592163086, "global_step": 40268, "epoch": 332} {"train_loss": -33.06547927856445, "global_step": 40269, "epoch": 332} {"train_loss": -34.420188903808594, "global_step": 40270, "epoch": 332} {"train_loss": -33.79901885986328, "global_step": 40271, "epoch": 332} {"train_loss": -34.210235595703125, "global_step": 40272, "epoch": 332} {"train_loss": -34.41830062866211, "global_step": 40273, "epoch": 332} {"train_loss": -34.30527877807617, "global_step": 40274, "epoch": 332} {"train_loss": -34.41020965576172, "global_step": 40275, "epoch": 332} {"train_loss": -34.19277572631836, "global_step": 40276, "epoch": 332} {"train_loss": -33.614280700683594, "global_step": 40277, "epoch": 332} {"train_loss": -34.465553283691406, "global_step": 40278, "epoch": 332} {"train_loss": -34.3945426940918, "global_step": 40279, "epoch": 332} {"train_loss": -33.5493278503418, "global_step": 40280, "epoch": 332} {"train_loss": -34.32816696166992, "global_step": 40281, "epoch": 332} {"train_loss": -34.18030548095703, "global_step": 40282, "epoch": 332} {"train_loss": -32.558406829833984, "global_step": 40283, "epoch": 332} {"train_loss": -29.90972328186035, "global_step": 40284, "epoch": 332} {"train_loss": -31.876630783081055, "global_step": 40285, "epoch": 332} {"train_loss": -31.74787712097168, "global_step": 40286, "epoch": 332} {"train_loss": -32.21601104736328, "global_step": 40287, "epoch": 332} {"train_loss": -32.799713134765625, "global_step": 40288, "epoch": 332} {"train_loss": -32.72483825683594, "global_step": 40289, "epoch": 332} {"train_loss": -33.43817138671875, "global_step": 40290, "epoch": 332} {"train_loss": -31.19349479675293, "global_step": 40291, "epoch": 332} {"train_loss": -33.90314357536884, "global_step": 40292, "epoch": 332, "val_loss": 2602212.75} {"train_loss": -33.5371208190918, "global_step": 40293, "epoch": 333} {"train_loss": -31.706317901611328, "global_step": 40294, "epoch": 333} {"train_loss": -32.648868560791016, "global_step": 40295, "epoch": 333} {"train_loss": -33.021854400634766, "global_step": 40296, "epoch": 333} {"train_loss": -31.71119499206543, "global_step": 40297, "epoch": 333} {"train_loss": -32.13865661621094, "global_step": 40298, "epoch": 333} {"train_loss": -32.484893798828125, "global_step": 40299, "epoch": 333} {"train_loss": -32.581787109375, "global_step": 40300, "epoch": 333} {"train_loss": -32.17033004760742, "global_step": 40301, "epoch": 333} {"train_loss": -32.254032135009766, "global_step": 40302, "epoch": 333} {"train_loss": -31.13482666015625, "global_step": 40303, "epoch": 333} {"train_loss": -33.147071838378906, "global_step": 40304, "epoch": 333} {"train_loss": -32.45975875854492, "global_step": 40305, "epoch": 333} {"train_loss": -31.9156494140625, "global_step": 40306, "epoch": 333} {"train_loss": -31.970102310180664, "global_step": 40307, "epoch": 333} {"train_loss": -31.765066146850586, "global_step": 40308, "epoch": 333} {"train_loss": -31.815948486328125, "global_step": 40309, "epoch": 333} {"train_loss": -32.68429183959961, "global_step": 40310, "epoch": 333} {"train_loss": -33.5811653137207, "global_step": 40311, "epoch": 333} {"train_loss": -32.231361389160156, "global_step": 40312, "epoch": 333} {"train_loss": -32.27915954589844, "global_step": 40313, "epoch": 333} {"train_loss": -31.3369083404541, "global_step": 40314, "epoch": 333} {"train_loss": -33.32662582397461, "global_step": 40315, "epoch": 333} {"train_loss": -32.77911376953125, "global_step": 40316, "epoch": 333} {"train_loss": -33.28257369995117, "global_step": 40317, "epoch": 333} {"train_loss": -33.189762115478516, "global_step": 40318, "epoch": 333} {"train_loss": -33.33314895629883, "global_step": 40319, "epoch": 333} {"train_loss": -32.96140670776367, "global_step": 40320, "epoch": 333} {"train_loss": -33.474483489990234, "global_step": 40321, "epoch": 333} {"train_loss": -33.44089889526367, "global_step": 40322, "epoch": 333} {"train_loss": -33.62359619140625, "global_step": 40323, "epoch": 333} {"train_loss": -33.28831100463867, "global_step": 40324, "epoch": 333} {"train_loss": -33.72058868408203, "global_step": 40325, "epoch": 333} {"train_loss": -33.34606170654297, "global_step": 40326, "epoch": 333} {"train_loss": -33.8136100769043, "global_step": 40327, "epoch": 333} {"train_loss": -33.87605667114258, "global_step": 40328, "epoch": 333} {"train_loss": -33.79885482788086, "global_step": 40329, "epoch": 333} {"train_loss": -33.59050369262695, "global_step": 40330, "epoch": 333} {"train_loss": -33.833473205566406, "global_step": 40331, "epoch": 333} {"train_loss": -34.10719680786133, "global_step": 40332, "epoch": 333} {"train_loss": -34.15594482421875, "global_step": 40333, "epoch": 333} {"train_loss": -34.13380432128906, "global_step": 40334, "epoch": 333} {"train_loss": -34.478275299072266, "global_step": 40335, "epoch": 333} {"train_loss": -34.18445587158203, "global_step": 40336, "epoch": 333} {"train_loss": -34.34797286987305, "global_step": 40337, "epoch": 333} {"train_loss": -33.46955490112305, "global_step": 40338, "epoch": 333} {"train_loss": -34.167724609375, "global_step": 40339, "epoch": 333} {"train_loss": -34.49349594116211, "global_step": 40340, "epoch": 333} {"train_loss": -34.2590217590332, "global_step": 40341, "epoch": 333} {"train_loss": -34.60681915283203, "global_step": 40342, "epoch": 333} {"train_loss": -34.0871696472168, "global_step": 40343, "epoch": 333} {"train_loss": -34.59586715698242, "global_step": 40344, "epoch": 333} {"train_loss": -34.139068603515625, "global_step": 40345, "epoch": 333} {"train_loss": -33.93867111206055, "global_step": 40346, "epoch": 333} {"train_loss": -33.830116271972656, "global_step": 40347, "epoch": 333} {"train_loss": -34.76617431640625, "global_step": 40348, "epoch": 333} {"train_loss": -35.060386657714844, "global_step": 40349, "epoch": 333} {"train_loss": -35.124935150146484, "global_step": 40350, "epoch": 333} {"train_loss": -34.30579376220703, "global_step": 40351, "epoch": 333} {"train_loss": -33.927791595458984, "global_step": 40352, "epoch": 333} {"train_loss": -33.00297164916992, "global_step": 40353, "epoch": 333} {"train_loss": -33.398189544677734, "global_step": 40354, "epoch": 333} {"train_loss": -32.43965148925781, "global_step": 40355, "epoch": 333} {"train_loss": -28.553451538085938, "global_step": 40356, "epoch": 333} {"train_loss": -24.364046096801758, "global_step": 40357, "epoch": 333} {"train_loss": -30.541568756103516, "global_step": 40358, "epoch": 333} {"train_loss": -34.706180572509766, "global_step": 40359, "epoch": 333} {"train_loss": -31.71685791015625, "global_step": 40360, "epoch": 333} {"train_loss": -32.32427978515625, "global_step": 40361, "epoch": 333} {"train_loss": -34.38681411743164, "global_step": 40362, "epoch": 333} {"train_loss": -31.77267837524414, "global_step": 40363, "epoch": 333} {"train_loss": -33.81190872192383, "global_step": 40364, "epoch": 333} {"train_loss": -33.67036056518555, "global_step": 40365, "epoch": 333} {"train_loss": -34.137386322021484, "global_step": 40366, "epoch": 333} {"train_loss": -34.467952728271484, "global_step": 40367, "epoch": 333} {"train_loss": -34.37958908081055, "global_step": 40368, "epoch": 333} {"train_loss": -34.38932418823242, "global_step": 40369, "epoch": 333} {"train_loss": -34.423152923583984, "global_step": 40370, "epoch": 333} {"train_loss": -34.459529876708984, "global_step": 40371, "epoch": 333} {"train_loss": -34.82307052612305, "global_step": 40372, "epoch": 333} {"train_loss": -34.7451057434082, "global_step": 40373, "epoch": 333} {"train_loss": -34.776275634765625, "global_step": 40374, "epoch": 333} {"train_loss": -34.57378005981445, "global_step": 40375, "epoch": 333} {"train_loss": -34.572052001953125, "global_step": 40376, "epoch": 333} {"train_loss": -35.08001708984375, "global_step": 40377, "epoch": 333} {"train_loss": -34.51423263549805, "global_step": 40378, "epoch": 333} {"train_loss": -34.794002532958984, "global_step": 40379, "epoch": 333} {"train_loss": -34.35519027709961, "global_step": 40380, "epoch": 333} {"train_loss": -33.758460998535156, "global_step": 40381, "epoch": 333} {"train_loss": -33.92879867553711, "global_step": 40382, "epoch": 333} {"train_loss": -34.34961700439453, "global_step": 40383, "epoch": 333} {"train_loss": -32.11651611328125, "global_step": 40384, "epoch": 333} {"train_loss": -30.972253799438477, "global_step": 40385, "epoch": 333} {"train_loss": -32.77580642700195, "global_step": 40386, "epoch": 333} {"train_loss": -33.11288070678711, "global_step": 40387, "epoch": 333} {"train_loss": -33.72216796875, "global_step": 40388, "epoch": 333} {"train_loss": -34.0552978515625, "global_step": 40389, "epoch": 333} {"train_loss": -34.45830154418945, "global_step": 40390, "epoch": 333} {"train_loss": -33.70172119140625, "global_step": 40391, "epoch": 333} {"train_loss": -32.494747161865234, "global_step": 40392, "epoch": 333} {"train_loss": -32.4986572265625, "global_step": 40393, "epoch": 333} {"train_loss": -32.88369369506836, "global_step": 40394, "epoch": 333} {"train_loss": -32.97182846069336, "global_step": 40395, "epoch": 333} {"train_loss": -30.92376136779785, "global_step": 40396, "epoch": 333} {"train_loss": -28.34640884399414, "global_step": 40397, "epoch": 333} {"train_loss": -29.730688095092773, "global_step": 40398, "epoch": 333} {"train_loss": -30.957660675048828, "global_step": 40399, "epoch": 333} {"train_loss": -33.1743278503418, "global_step": 40400, "epoch": 333} {"train_loss": -31.74309730529785, "global_step": 40401, "epoch": 333} {"train_loss": -30.7034912109375, "global_step": 40402, "epoch": 333} {"train_loss": -33.786495208740234, "global_step": 40403, "epoch": 333} {"train_loss": -31.6649112701416, "global_step": 40404, "epoch": 333} {"train_loss": -33.4300651550293, "global_step": 40405, "epoch": 333} {"train_loss": -32.90304183959961, "global_step": 40406, "epoch": 333} {"train_loss": -32.706764221191406, "global_step": 40407, "epoch": 333} {"train_loss": -32.287628173828125, "global_step": 40408, "epoch": 333} {"train_loss": -32.7787971496582, "global_step": 40409, "epoch": 333} {"train_loss": -32.466732025146484, "global_step": 40410, "epoch": 333} {"train_loss": -32.97603988647461, "global_step": 40411, "epoch": 333} {"train_loss": -32.3231315612793, "global_step": 40412, "epoch": 333} {"train_loss": -33.11402640855017, "global_step": 40413, "epoch": 333, "val_loss": 2505753.75} {"train_loss": -32.30404281616211, "global_step": 40414, "epoch": 334} {"train_loss": -31.574512481689453, "global_step": 40415, "epoch": 334} {"train_loss": -33.019691467285156, "global_step": 40416, "epoch": 334} {"train_loss": -29.989049911499023, "global_step": 40417, "epoch": 334} {"train_loss": -32.93484878540039, "global_step": 40418, "epoch": 334} {"train_loss": -32.41115951538086, "global_step": 40419, "epoch": 334} {"train_loss": -31.732070922851562, "global_step": 40420, "epoch": 334} {"train_loss": -33.64569091796875, "global_step": 40421, "epoch": 334} {"train_loss": -33.365028381347656, "global_step": 40422, "epoch": 334} {"train_loss": -32.53123092651367, "global_step": 40423, "epoch": 334} {"train_loss": -32.969703674316406, "global_step": 40424, "epoch": 334} {"train_loss": -34.02104568481445, "global_step": 40425, "epoch": 334} {"train_loss": -33.16512680053711, "global_step": 40426, "epoch": 334} {"train_loss": -32.8099250793457, "global_step": 40427, "epoch": 334} {"train_loss": -33.7259635925293, "global_step": 40428, "epoch": 334} {"train_loss": -34.32101058959961, "global_step": 40429, "epoch": 334} {"train_loss": -33.771785736083984, "global_step": 40430, "epoch": 334} {"train_loss": -33.72359848022461, "global_step": 40431, "epoch": 334} {"train_loss": -33.980751037597656, "global_step": 40432, "epoch": 334} {"train_loss": -34.370460510253906, "global_step": 40433, "epoch": 334} {"train_loss": -34.301883697509766, "global_step": 40434, "epoch": 334} {"train_loss": -34.50511932373047, "global_step": 40435, "epoch": 334} {"train_loss": -34.441436767578125, "global_step": 40436, "epoch": 334} {"train_loss": -34.30644607543945, "global_step": 40437, "epoch": 334} {"train_loss": -34.416072845458984, "global_step": 40438, "epoch": 334} {"train_loss": -34.33231735229492, "global_step": 40439, "epoch": 334} {"train_loss": -34.34138107299805, "global_step": 40440, "epoch": 334} {"train_loss": -34.7547492980957, "global_step": 40441, "epoch": 334} {"train_loss": -34.4267578125, "global_step": 40442, "epoch": 334} {"train_loss": -34.50699996948242, "global_step": 40443, "epoch": 334} {"train_loss": -34.328617095947266, "global_step": 40444, "epoch": 334} {"train_loss": -34.90087890625, "global_step": 40445, "epoch": 334} {"train_loss": -34.55623245239258, "global_step": 40446, "epoch": 334} {"train_loss": -34.862239837646484, "global_step": 40447, "epoch": 334} {"train_loss": -34.96338653564453, "global_step": 40448, "epoch": 334} {"train_loss": -34.7930908203125, "global_step": 40449, "epoch": 334} {"train_loss": -34.912452697753906, "global_step": 40450, "epoch": 334} {"train_loss": -34.12022018432617, "global_step": 40451, "epoch": 334} {"train_loss": -34.89604187011719, "global_step": 40452, "epoch": 334} {"train_loss": -33.66504669189453, "global_step": 40453, "epoch": 334} {"train_loss": -34.34187316894531, "global_step": 40454, "epoch": 334} {"train_loss": -34.926998138427734, "global_step": 40455, "epoch": 334} {"train_loss": -33.47280502319336, "global_step": 40456, "epoch": 334} {"train_loss": -33.570945739746094, "global_step": 40457, "epoch": 334} {"train_loss": -35.01888656616211, "global_step": 40458, "epoch": 334} {"train_loss": -32.13984298706055, "global_step": 40459, "epoch": 334} {"train_loss": -31.807321548461914, "global_step": 40460, "epoch": 334} {"train_loss": -31.930078506469727, "global_step": 40461, "epoch": 334} {"train_loss": -32.66780471801758, "global_step": 40462, "epoch": 334} {"train_loss": -33.49928283691406, "global_step": 40463, "epoch": 334} {"train_loss": -33.94336700439453, "global_step": 40464, "epoch": 334} {"train_loss": -34.089046478271484, "global_step": 40465, "epoch": 334} {"train_loss": -33.76055145263672, "global_step": 40466, "epoch": 334} {"train_loss": -33.838558197021484, "global_step": 40467, "epoch": 334} {"train_loss": -34.343387603759766, "global_step": 40468, "epoch": 334} {"train_loss": -34.05707550048828, "global_step": 40469, "epoch": 334} {"train_loss": -34.25640869140625, "global_step": 40470, "epoch": 334} {"train_loss": -34.10884475708008, "global_step": 40471, "epoch": 334} {"train_loss": -34.01318359375, "global_step": 40472, "epoch": 334} {"train_loss": -33.9749641418457, "global_step": 40473, "epoch": 334} {"train_loss": -34.6508674621582, "global_step": 40474, "epoch": 334} {"train_loss": -34.57332229614258, "global_step": 40475, "epoch": 334} {"train_loss": -34.660091400146484, "global_step": 40476, "epoch": 334} {"train_loss": -34.3880729675293, "global_step": 40477, "epoch": 334} {"train_loss": -34.749122619628906, "global_step": 40478, "epoch": 334} {"train_loss": -34.34547805786133, "global_step": 40479, "epoch": 334} {"train_loss": -34.23536682128906, "global_step": 40480, "epoch": 334} {"train_loss": -34.31394577026367, "global_step": 40481, "epoch": 334} {"train_loss": -34.969905853271484, "global_step": 40482, "epoch": 334} {"train_loss": -34.898902893066406, "global_step": 40483, "epoch": 334} {"train_loss": -34.246856689453125, "global_step": 40484, "epoch": 334} {"train_loss": -33.740333557128906, "global_step": 40485, "epoch": 334} {"train_loss": -32.814979553222656, "global_step": 40486, "epoch": 334} {"train_loss": -31.137704849243164, "global_step": 40487, "epoch": 334} {"train_loss": -29.613861083984375, "global_step": 40488, "epoch": 334} {"train_loss": -32.70260238647461, "global_step": 40489, "epoch": 334} {"train_loss": -34.6198844909668, "global_step": 40490, "epoch": 334} {"train_loss": -32.83304977416992, "global_step": 40491, "epoch": 334} {"train_loss": -31.98958396911621, "global_step": 40492, "epoch": 334} {"train_loss": -32.405426025390625, "global_step": 40493, "epoch": 334} {"train_loss": -32.85547637939453, "global_step": 40494, "epoch": 334} {"train_loss": -33.19565963745117, "global_step": 40495, "epoch": 334} {"train_loss": -33.11106491088867, "global_step": 40496, "epoch": 334} {"train_loss": -32.72249984741211, "global_step": 40497, "epoch": 334} {"train_loss": -31.160226821899414, "global_step": 40498, "epoch": 334} {"train_loss": -31.07204246520996, "global_step": 40499, "epoch": 334} {"train_loss": -33.109615325927734, "global_step": 40500, "epoch": 334} {"train_loss": -31.954334259033203, "global_step": 40501, "epoch": 334} {"train_loss": -30.538925170898438, "global_step": 40502, "epoch": 334} {"train_loss": -33.562557220458984, "global_step": 40503, "epoch": 334} {"train_loss": -32.38566589355469, "global_step": 40504, "epoch": 334} {"train_loss": -32.238216400146484, "global_step": 40505, "epoch": 334} {"train_loss": -33.888214111328125, "global_step": 40506, "epoch": 334} {"train_loss": -34.551265716552734, "global_step": 40507, "epoch": 334} {"train_loss": -33.382930755615234, "global_step": 40508, "epoch": 334} {"train_loss": -33.68912124633789, "global_step": 40509, "epoch": 334} {"train_loss": -33.6353645324707, "global_step": 40510, "epoch": 334} {"train_loss": -34.33864212036133, "global_step": 40511, "epoch": 334} {"train_loss": -34.90214157104492, "global_step": 40512, "epoch": 334} {"train_loss": -34.52131271362305, "global_step": 40513, "epoch": 334} {"train_loss": -34.831092834472656, "global_step": 40514, "epoch": 334} {"train_loss": -34.16457748413086, "global_step": 40515, "epoch": 334} {"train_loss": -34.524417877197266, "global_step": 40516, "epoch": 334} {"train_loss": -34.4667854309082, "global_step": 40517, "epoch": 334} {"train_loss": -35.01372146606445, "global_step": 40518, "epoch": 334} {"train_loss": -34.86823654174805, "global_step": 40519, "epoch": 334} {"train_loss": -34.40010452270508, "global_step": 40520, "epoch": 334} {"train_loss": -34.65765380859375, "global_step": 40521, "epoch": 334} {"train_loss": -34.77499008178711, "global_step": 40522, "epoch": 334} {"train_loss": -33.75494384765625, "global_step": 40523, "epoch": 334} {"train_loss": -34.4006233215332, "global_step": 40524, "epoch": 334} {"train_loss": -34.715755462646484, "global_step": 40525, "epoch": 334} {"train_loss": -34.54460144042969, "global_step": 40526, "epoch": 334} {"train_loss": -33.5910530090332, "global_step": 40527, "epoch": 334} {"train_loss": -32.19890594482422, "global_step": 40528, "epoch": 334} {"train_loss": -33.467830657958984, "global_step": 40529, "epoch": 334} {"train_loss": -33.367916107177734, "global_step": 40530, "epoch": 334} {"train_loss": -34.39911651611328, "global_step": 40531, "epoch": 334} {"train_loss": -34.0498046875, "global_step": 40532, "epoch": 334} {"train_loss": -33.7789306640625, "global_step": 40533, "epoch": 334} {"train_loss": -33.681121589723695, "global_step": 40534, "epoch": 334, "val_loss": 2444948.75} {"train_loss": -32.57843017578125, "global_step": 40535, "epoch": 335} {"train_loss": -32.425621032714844, "global_step": 40536, "epoch": 335} {"train_loss": -32.68873977661133, "global_step": 40537, "epoch": 335} {"train_loss": -32.4552001953125, "global_step": 40538, "epoch": 335} {"train_loss": -28.750385284423828, "global_step": 40539, "epoch": 335} {"train_loss": -29.655805587768555, "global_step": 40540, "epoch": 335} {"train_loss": -26.659698486328125, "global_step": 40541, "epoch": 335} {"train_loss": -20.501953125, "global_step": 40542, "epoch": 335} {"train_loss": -28.02631187438965, "global_step": 40543, "epoch": 335} {"train_loss": -32.468902587890625, "global_step": 40544, "epoch": 335} {"train_loss": -28.547216415405273, "global_step": 40545, "epoch": 335} {"train_loss": -28.555572509765625, "global_step": 40546, "epoch": 335} {"train_loss": -31.321426391601562, "global_step": 40547, "epoch": 335} {"train_loss": -27.81971549987793, "global_step": 40548, "epoch": 335} {"train_loss": -31.050968170166016, "global_step": 40549, "epoch": 335} {"train_loss": -30.197052001953125, "global_step": 40550, "epoch": 335} {"train_loss": -33.12307357788086, "global_step": 40551, "epoch": 335} {"train_loss": -31.302841186523438, "global_step": 40552, "epoch": 335} {"train_loss": -32.39565658569336, "global_step": 40553, "epoch": 335} {"train_loss": -31.670557022094727, "global_step": 40554, "epoch": 335} {"train_loss": -31.48260498046875, "global_step": 40555, "epoch": 335} {"train_loss": -32.33903121948242, "global_step": 40556, "epoch": 335} {"train_loss": -32.00665283203125, "global_step": 40557, "epoch": 335} {"train_loss": -32.68644714355469, "global_step": 40558, "epoch": 335} {"train_loss": -32.86434555053711, "global_step": 40559, "epoch": 335} {"train_loss": -32.18059158325195, "global_step": 40560, "epoch": 335} {"train_loss": -32.27443313598633, "global_step": 40561, "epoch": 335} {"train_loss": -32.33856964111328, "global_step": 40562, "epoch": 335} {"train_loss": -32.93241882324219, "global_step": 40563, "epoch": 335} {"train_loss": -32.7837028503418, "global_step": 40564, "epoch": 335} {"train_loss": -32.42346954345703, "global_step": 40565, "epoch": 335} {"train_loss": -33.184871673583984, "global_step": 40566, "epoch": 335} {"train_loss": -33.043270111083984, "global_step": 40567, "epoch": 335} {"train_loss": -33.26782989501953, "global_step": 40568, "epoch": 335} {"train_loss": -32.994300842285156, "global_step": 40569, "epoch": 335} {"train_loss": -33.26717758178711, "global_step": 40570, "epoch": 335} {"train_loss": -33.19683837890625, "global_step": 40571, "epoch": 335} {"train_loss": -33.15424346923828, "global_step": 40572, "epoch": 335} {"train_loss": -33.467464447021484, "global_step": 40573, "epoch": 335} {"train_loss": -33.506134033203125, "global_step": 40574, "epoch": 335} {"train_loss": -33.54458236694336, "global_step": 40575, "epoch": 335} {"train_loss": -33.292781829833984, "global_step": 40576, "epoch": 335} {"train_loss": -33.52179718017578, "global_step": 40577, "epoch": 335} {"train_loss": -33.72893142700195, "global_step": 40578, "epoch": 335} {"train_loss": -33.43951416015625, "global_step": 40579, "epoch": 335} {"train_loss": -33.82506561279297, "global_step": 40580, "epoch": 335} {"train_loss": -33.49271774291992, "global_step": 40581, "epoch": 335} {"train_loss": -33.85567855834961, "global_step": 40582, "epoch": 335} {"train_loss": -34.1179313659668, "global_step": 40583, "epoch": 335} {"train_loss": -33.76554489135742, "global_step": 40584, "epoch": 335} {"train_loss": -34.02549362182617, "global_step": 40585, "epoch": 335} {"train_loss": -33.85443115234375, "global_step": 40586, "epoch": 335} {"train_loss": -34.15108108520508, "global_step": 40587, "epoch": 335} {"train_loss": -34.234371185302734, "global_step": 40588, "epoch": 335} {"train_loss": -34.00960159301758, "global_step": 40589, "epoch": 335} {"train_loss": -33.51753234863281, "global_step": 40590, "epoch": 335} {"train_loss": -34.18916702270508, "global_step": 40591, "epoch": 335} {"train_loss": -34.332149505615234, "global_step": 40592, "epoch": 335} {"train_loss": -34.336544036865234, "global_step": 40593, "epoch": 335} {"train_loss": -34.470455169677734, "global_step": 40594, "epoch": 335} {"train_loss": -34.195526123046875, "global_step": 40595, "epoch": 335} {"train_loss": -34.08639907836914, "global_step": 40596, "epoch": 335} {"train_loss": -33.910247802734375, "global_step": 40597, "epoch": 335} {"train_loss": -34.526363372802734, "global_step": 40598, "epoch": 335} {"train_loss": -34.3481559753418, "global_step": 40599, "epoch": 335} {"train_loss": -33.856964111328125, "global_step": 40600, "epoch": 335} {"train_loss": -34.19898223876953, "global_step": 40601, "epoch": 335} {"train_loss": -34.07111740112305, "global_step": 40602, "epoch": 335} {"train_loss": -30.929248809814453, "global_step": 40603, "epoch": 335} {"train_loss": -33.646820068359375, "global_step": 40604, "epoch": 335} {"train_loss": -31.774831771850586, "global_step": 40605, "epoch": 335} {"train_loss": -30.997949600219727, "global_step": 40606, "epoch": 335} {"train_loss": -28.7088565826416, "global_step": 40607, "epoch": 335} {"train_loss": -6.586219787597656, "global_step": 40608, "epoch": 335} {"train_loss": 50.6376953125, "global_step": 40609, "epoch": 335} {"train_loss": 25.389806747436523, "global_step": 40610, "epoch": 335} {"train_loss": -26.142614364624023, "global_step": 40611, "epoch": 335} {"train_loss": -7.361821174621582, "global_step": 40612, "epoch": 335} {"train_loss": -16.213619232177734, "global_step": 40613, "epoch": 335} {"train_loss": -30.195642471313477, "global_step": 40614, "epoch": 335} {"train_loss": -17.033193588256836, "global_step": 40615, "epoch": 335} {"train_loss": -20.0440616607666, "global_step": 40616, "epoch": 335} {"train_loss": -31.229772567749023, "global_step": 40617, "epoch": 335} {"train_loss": -29.9158935546875, "global_step": 40618, "epoch": 335} {"train_loss": -27.22208023071289, "global_step": 40619, "epoch": 335} {"train_loss": -27.063932418823242, "global_step": 40620, "epoch": 335} {"train_loss": -27.866657257080078, "global_step": 40621, "epoch": 335} {"train_loss": -30.28680419921875, "global_step": 40622, "epoch": 335} {"train_loss": -31.841049194335938, "global_step": 40623, "epoch": 335} {"train_loss": -31.741662979125977, "global_step": 40624, "epoch": 335} {"train_loss": -30.164859771728516, "global_step": 40625, "epoch": 335} {"train_loss": -30.474716186523438, "global_step": 40626, "epoch": 335} {"train_loss": -30.43116569519043, "global_step": 40627, "epoch": 335} {"train_loss": -30.76352882385254, "global_step": 40628, "epoch": 335} {"train_loss": -31.24314308166504, "global_step": 40629, "epoch": 335} {"train_loss": -31.528486251831055, "global_step": 40630, "epoch": 335} {"train_loss": -32.06889724731445, "global_step": 40631, "epoch": 335} {"train_loss": -32.00349807739258, "global_step": 40632, "epoch": 335} {"train_loss": -31.124670028686523, "global_step": 40633, "epoch": 335} {"train_loss": -31.688634872436523, "global_step": 40634, "epoch": 335} {"train_loss": -31.010705947875977, "global_step": 40635, "epoch": 335} {"train_loss": -31.495092391967773, "global_step": 40636, "epoch": 335} {"train_loss": -31.571975708007812, "global_step": 40637, "epoch": 335} {"train_loss": -31.995014190673828, "global_step": 40638, "epoch": 335} {"train_loss": -32.298641204833984, "global_step": 40639, "epoch": 335} {"train_loss": -32.19301986694336, "global_step": 40640, "epoch": 335} {"train_loss": -32.392417907714844, "global_step": 40641, "epoch": 335} {"train_loss": -32.15181350708008, "global_step": 40642, "epoch": 335} {"train_loss": -32.362361907958984, "global_step": 40643, "epoch": 335} {"train_loss": -32.5621452331543, "global_step": 40644, "epoch": 335} {"train_loss": -32.57501983642578, "global_step": 40645, "epoch": 335} {"train_loss": -32.586402893066406, "global_step": 40646, "epoch": 335} {"train_loss": -32.31393051147461, "global_step": 40647, "epoch": 335} {"train_loss": -32.072174072265625, "global_step": 40648, "epoch": 335} {"train_loss": -32.355255126953125, "global_step": 40649, "epoch": 335} {"train_loss": -32.72559356689453, "global_step": 40650, "epoch": 335} {"train_loss": -32.64639663696289, "global_step": 40651, "epoch": 335} {"train_loss": -32.850555419921875, "global_step": 40652, "epoch": 335} {"train_loss": -32.921119689941406, "global_step": 40653, "epoch": 335} {"train_loss": -32.97514343261719, "global_step": 40654, "epoch": 335} {"train_loss": -30.08180395236685, "global_step": 40655, "epoch": 335, "val_loss": 2538747.25} {"train_loss": -33.09206008911133, "global_step": 40656, "epoch": 336} {"train_loss": -33.01884841918945, "global_step": 40657, "epoch": 336} {"train_loss": -32.961849212646484, "global_step": 40658, "epoch": 336} {"train_loss": -33.30768966674805, "global_step": 40659, "epoch": 336} {"train_loss": -33.3656005859375, "global_step": 40660, "epoch": 336} {"train_loss": -32.887062072753906, "global_step": 40661, "epoch": 336} {"train_loss": -33.493953704833984, "global_step": 40662, "epoch": 336} {"train_loss": -33.45307540893555, "global_step": 40663, "epoch": 336} {"train_loss": -33.28047561645508, "global_step": 40664, "epoch": 336} {"train_loss": -33.69667434692383, "global_step": 40665, "epoch": 336} {"train_loss": -33.61589050292969, "global_step": 40666, "epoch": 336} {"train_loss": -33.623165130615234, "global_step": 40667, "epoch": 336} {"train_loss": -33.5196533203125, "global_step": 40668, "epoch": 336} {"train_loss": -33.264766693115234, "global_step": 40669, "epoch": 336} {"train_loss": -33.414947509765625, "global_step": 40670, "epoch": 336} {"train_loss": -33.77618408203125, "global_step": 40671, "epoch": 336} {"train_loss": -34.01853561401367, "global_step": 40672, "epoch": 336} {"train_loss": -32.96132278442383, "global_step": 40673, "epoch": 336} {"train_loss": -34.106605529785156, "global_step": 40674, "epoch": 336} {"train_loss": -33.598060607910156, "global_step": 40675, "epoch": 336} {"train_loss": -33.71709060668945, "global_step": 40676, "epoch": 336} {"train_loss": -33.596858978271484, "global_step": 40677, "epoch": 336} {"train_loss": -33.5695915222168, "global_step": 40678, "epoch": 336} {"train_loss": -33.80132293701172, "global_step": 40679, "epoch": 336} {"train_loss": -32.80210494995117, "global_step": 40680, "epoch": 336} {"train_loss": -33.95418930053711, "global_step": 40681, "epoch": 336} {"train_loss": -33.39681625366211, "global_step": 40682, "epoch": 336} {"train_loss": -33.1090202331543, "global_step": 40683, "epoch": 336} {"train_loss": -32.51034927368164, "global_step": 40684, "epoch": 336} {"train_loss": -33.018333435058594, "global_step": 40685, "epoch": 336} {"train_loss": -33.34098434448242, "global_step": 40686, "epoch": 336} {"train_loss": -33.2280387878418, "global_step": 40687, "epoch": 336} {"train_loss": -33.787052154541016, "global_step": 40688, "epoch": 336} {"train_loss": -33.02560043334961, "global_step": 40689, "epoch": 336} {"train_loss": -33.38555908203125, "global_step": 40690, "epoch": 336} {"train_loss": -32.395381927490234, "global_step": 40691, "epoch": 336} {"train_loss": -33.10972213745117, "global_step": 40692, "epoch": 336} {"train_loss": -33.44558334350586, "global_step": 40693, "epoch": 336} {"train_loss": -33.4061164855957, "global_step": 40694, "epoch": 336} {"train_loss": -33.2276496887207, "global_step": 40695, "epoch": 336} {"train_loss": -30.658044815063477, "global_step": 40696, "epoch": 336} {"train_loss": -32.906673431396484, "global_step": 40697, "epoch": 336} {"train_loss": -32.97023391723633, "global_step": 40698, "epoch": 336} {"train_loss": -32.19790267944336, "global_step": 40699, "epoch": 336} {"train_loss": -31.950489044189453, "global_step": 40700, "epoch": 336} {"train_loss": -30.964258193969727, "global_step": 40701, "epoch": 336} {"train_loss": -32.08948516845703, "global_step": 40702, "epoch": 336} {"train_loss": -32.39326858520508, "global_step": 40703, "epoch": 336} {"train_loss": -31.753101348876953, "global_step": 40704, "epoch": 336} {"train_loss": -31.41167640686035, "global_step": 40705, "epoch": 336} {"train_loss": -28.27052116394043, "global_step": 40706, "epoch": 336} {"train_loss": -30.047460556030273, "global_step": 40707, "epoch": 336} {"train_loss": -30.673124313354492, "global_step": 40708, "epoch": 336} {"train_loss": -32.3712158203125, "global_step": 40709, "epoch": 336} {"train_loss": -31.94721794128418, "global_step": 40710, "epoch": 336} {"train_loss": -31.1431827545166, "global_step": 40711, "epoch": 336} {"train_loss": -31.052270889282227, "global_step": 40712, "epoch": 336} {"train_loss": -32.60342025756836, "global_step": 40713, "epoch": 336} {"train_loss": -31.878522872924805, "global_step": 40714, "epoch": 336} {"train_loss": -30.8391170501709, "global_step": 40715, "epoch": 336} {"train_loss": -32.77753448486328, "global_step": 40716, "epoch": 336} {"train_loss": -32.0368537902832, "global_step": 40717, "epoch": 336} {"train_loss": -31.315216064453125, "global_step": 40718, "epoch": 336} {"train_loss": -31.85407066345215, "global_step": 40719, "epoch": 336} {"train_loss": -32.123199462890625, "global_step": 40720, "epoch": 336} {"train_loss": -33.06013107299805, "global_step": 40721, "epoch": 336} {"train_loss": -33.06064987182617, "global_step": 40722, "epoch": 336} {"train_loss": -32.225799560546875, "global_step": 40723, "epoch": 336} {"train_loss": -32.80453872680664, "global_step": 40724, "epoch": 336} {"train_loss": -32.77960205078125, "global_step": 40725, "epoch": 336} {"train_loss": -32.9371337890625, "global_step": 40726, "epoch": 336} {"train_loss": -32.226715087890625, "global_step": 40727, "epoch": 336} {"train_loss": -32.478092193603516, "global_step": 40728, "epoch": 336} {"train_loss": -33.16659927368164, "global_step": 40729, "epoch": 336} {"train_loss": -32.71739959716797, "global_step": 40730, "epoch": 336} {"train_loss": -32.62855911254883, "global_step": 40731, "epoch": 336} {"train_loss": -32.74283981323242, "global_step": 40732, "epoch": 336} {"train_loss": -33.03675079345703, "global_step": 40733, "epoch": 336} {"train_loss": -32.9415283203125, "global_step": 40734, "epoch": 336} {"train_loss": -33.201168060302734, "global_step": 40735, "epoch": 336} {"train_loss": -32.932491302490234, "global_step": 40736, "epoch": 336} {"train_loss": -32.895198822021484, "global_step": 40737, "epoch": 336} {"train_loss": -33.186927795410156, "global_step": 40738, "epoch": 336} {"train_loss": -32.62644577026367, "global_step": 40739, "epoch": 336} {"train_loss": -31.915679931640625, "global_step": 40740, "epoch": 336} {"train_loss": -32.261322021484375, "global_step": 40741, "epoch": 336} {"train_loss": -32.9671745300293, "global_step": 40742, "epoch": 336} {"train_loss": -33.46274948120117, "global_step": 40743, "epoch": 336} {"train_loss": -33.091426849365234, "global_step": 40744, "epoch": 336} {"train_loss": -33.274391174316406, "global_step": 40745, "epoch": 336} {"train_loss": -33.28081130981445, "global_step": 40746, "epoch": 336} {"train_loss": -33.3945198059082, "global_step": 40747, "epoch": 336} {"train_loss": -33.13454818725586, "global_step": 40748, "epoch": 336} {"train_loss": -33.62765121459961, "global_step": 40749, "epoch": 336} {"train_loss": -33.744930267333984, "global_step": 40750, "epoch": 336} {"train_loss": -33.54423141479492, "global_step": 40751, "epoch": 336} {"train_loss": -33.9794807434082, "global_step": 40752, "epoch": 336} {"train_loss": -34.06353759765625, "global_step": 40753, "epoch": 336} {"train_loss": -33.808998107910156, "global_step": 40754, "epoch": 336} {"train_loss": -34.26234817504883, "global_step": 40755, "epoch": 336} {"train_loss": -34.09210968017578, "global_step": 40756, "epoch": 336} {"train_loss": -34.204063415527344, "global_step": 40757, "epoch": 336} {"train_loss": -34.2361946105957, "global_step": 40758, "epoch": 336} {"train_loss": -34.41185760498047, "global_step": 40759, "epoch": 336} {"train_loss": -34.3913459777832, "global_step": 40760, "epoch": 336} {"train_loss": -34.4123420715332, "global_step": 40761, "epoch": 336} {"train_loss": -34.642059326171875, "global_step": 40762, "epoch": 336} {"train_loss": -34.22936248779297, "global_step": 40763, "epoch": 336} {"train_loss": -33.654747009277344, "global_step": 40764, "epoch": 336} {"train_loss": -32.84204864501953, "global_step": 40765, "epoch": 336} {"train_loss": -31.98994255065918, "global_step": 40766, "epoch": 336} {"train_loss": -29.212982177734375, "global_step": 40767, "epoch": 336} {"train_loss": -25.762128829956055, "global_step": 40768, "epoch": 336} {"train_loss": -26.44118309020996, "global_step": 40769, "epoch": 336} {"train_loss": -33.48342514038086, "global_step": 40770, "epoch": 336} {"train_loss": -30.362287521362305, "global_step": 40771, "epoch": 336} {"train_loss": -26.808795928955078, "global_step": 40772, "epoch": 336} {"train_loss": -33.186580657958984, "global_step": 40773, "epoch": 336} {"train_loss": -28.3822021484375, "global_step": 40774, "epoch": 336} {"train_loss": -33.3663215637207, "global_step": 40775, "epoch": 336} {"train_loss": -32.671135106362584, "global_step": 40776, "epoch": 336, "val_loss": 2475941.25} {"train_loss": -33.70072555541992, "global_step": 40777, "epoch": 337} {"train_loss": -31.988554000854492, "global_step": 40778, "epoch": 337} {"train_loss": -32.883663177490234, "global_step": 40779, "epoch": 337} {"train_loss": -33.70685577392578, "global_step": 40780, "epoch": 337} {"train_loss": -32.95618438720703, "global_step": 40781, "epoch": 337} {"train_loss": -32.67901611328125, "global_step": 40782, "epoch": 337} {"train_loss": -33.44437789916992, "global_step": 40783, "epoch": 337} {"train_loss": -32.94265365600586, "global_step": 40784, "epoch": 337} {"train_loss": -33.036895751953125, "global_step": 40785, "epoch": 337} {"train_loss": -33.293678283691406, "global_step": 40786, "epoch": 337} {"train_loss": -33.30564498901367, "global_step": 40787, "epoch": 337} {"train_loss": -33.197574615478516, "global_step": 40788, "epoch": 337} {"train_loss": -33.43790817260742, "global_step": 40789, "epoch": 337} {"train_loss": -33.97480392456055, "global_step": 40790, "epoch": 337} {"train_loss": -33.77540969848633, "global_step": 40791, "epoch": 337} {"train_loss": -33.519466400146484, "global_step": 40792, "epoch": 337} {"train_loss": -33.32053756713867, "global_step": 40793, "epoch": 337} {"train_loss": -32.4666862487793, "global_step": 40794, "epoch": 337} {"train_loss": -32.31806564331055, "global_step": 40795, "epoch": 337} {"train_loss": -33.545936584472656, "global_step": 40796, "epoch": 337} {"train_loss": -33.385250091552734, "global_step": 40797, "epoch": 337} {"train_loss": -33.030338287353516, "global_step": 40798, "epoch": 337} {"train_loss": -33.1862678527832, "global_step": 40799, "epoch": 337} {"train_loss": -33.43841552734375, "global_step": 40800, "epoch": 337} {"train_loss": -33.04279708862305, "global_step": 40801, "epoch": 337} {"train_loss": -33.58234405517578, "global_step": 40802, "epoch": 337} {"train_loss": -33.4669303894043, "global_step": 40803, "epoch": 337} {"train_loss": -33.447261810302734, "global_step": 40804, "epoch": 337} {"train_loss": -33.725704193115234, "global_step": 40805, "epoch": 337} {"train_loss": -33.37000274658203, "global_step": 40806, "epoch": 337} {"train_loss": -33.814453125, "global_step": 40807, "epoch": 337} {"train_loss": -33.45860290527344, "global_step": 40808, "epoch": 337} {"train_loss": -33.549842834472656, "global_step": 40809, "epoch": 337} {"train_loss": -33.712642669677734, "global_step": 40810, "epoch": 337} {"train_loss": -33.226863861083984, "global_step": 40811, "epoch": 337} {"train_loss": -33.224830627441406, "global_step": 40812, "epoch": 337} {"train_loss": -34.072269439697266, "global_step": 40813, "epoch": 337} {"train_loss": -33.02082443237305, "global_step": 40814, "epoch": 337} {"train_loss": -32.73062515258789, "global_step": 40815, "epoch": 337} {"train_loss": -33.78519058227539, "global_step": 40816, "epoch": 337} {"train_loss": -33.163055419921875, "global_step": 40817, "epoch": 337} {"train_loss": -33.01982879638672, "global_step": 40818, "epoch": 337} {"train_loss": -33.115516662597656, "global_step": 40819, "epoch": 337} {"train_loss": -31.941177368164062, "global_step": 40820, "epoch": 337} {"train_loss": -33.19326400756836, "global_step": 40821, "epoch": 337} {"train_loss": -33.56740951538086, "global_step": 40822, "epoch": 337} {"train_loss": -32.64638137817383, "global_step": 40823, "epoch": 337} {"train_loss": -33.43184280395508, "global_step": 40824, "epoch": 337} {"train_loss": -31.508955001831055, "global_step": 40825, "epoch": 337} {"train_loss": -33.981109619140625, "global_step": 40826, "epoch": 337} {"train_loss": -32.380306243896484, "global_step": 40827, "epoch": 337} {"train_loss": -34.07871627807617, "global_step": 40828, "epoch": 337} {"train_loss": -33.722774505615234, "global_step": 40829, "epoch": 337} {"train_loss": -33.34749984741211, "global_step": 40830, "epoch": 337} {"train_loss": -34.4168586730957, "global_step": 40831, "epoch": 337} {"train_loss": -33.17953109741211, "global_step": 40832, "epoch": 337} {"train_loss": -33.95260238647461, "global_step": 40833, "epoch": 337} {"train_loss": -33.697235107421875, "global_step": 40834, "epoch": 337} {"train_loss": -32.553035736083984, "global_step": 40835, "epoch": 337} {"train_loss": -34.090919494628906, "global_step": 40836, "epoch": 337} {"train_loss": -33.49152755737305, "global_step": 40837, "epoch": 337} {"train_loss": -33.74048614501953, "global_step": 40838, "epoch": 337} {"train_loss": -34.100830078125, "global_step": 40839, "epoch": 337} {"train_loss": -33.768001556396484, "global_step": 40840, "epoch": 337} {"train_loss": -32.33454513549805, "global_step": 40841, "epoch": 337} {"train_loss": -34.06727981567383, "global_step": 40842, "epoch": 337} {"train_loss": -33.3550910949707, "global_step": 40843, "epoch": 337} {"train_loss": -34.05842590332031, "global_step": 40844, "epoch": 337} {"train_loss": -33.381591796875, "global_step": 40845, "epoch": 337} {"train_loss": -33.853206634521484, "global_step": 40846, "epoch": 337} {"train_loss": -32.600006103515625, "global_step": 40847, "epoch": 337} {"train_loss": -33.46039962768555, "global_step": 40848, "epoch": 337} {"train_loss": -31.564783096313477, "global_step": 40849, "epoch": 337} {"train_loss": -30.298267364501953, "global_step": 40850, "epoch": 337} {"train_loss": -26.003997802734375, "global_step": 40851, "epoch": 337} {"train_loss": -30.644153594970703, "global_step": 40852, "epoch": 337} {"train_loss": -25.337865829467773, "global_step": 40853, "epoch": 337} {"train_loss": -25.81841468811035, "global_step": 40854, "epoch": 337} {"train_loss": -25.79249382019043, "global_step": 40855, "epoch": 337} {"train_loss": -25.460845947265625, "global_step": 40856, "epoch": 337} {"train_loss": -25.830652236938477, "global_step": 40857, "epoch": 337} {"train_loss": -26.24403190612793, "global_step": 40858, "epoch": 337} {"train_loss": -26.500152587890625, "global_step": 40859, "epoch": 337} {"train_loss": -27.079986572265625, "global_step": 40860, "epoch": 337} {"train_loss": -26.916961669921875, "global_step": 40861, "epoch": 337} {"train_loss": -28.642175674438477, "global_step": 40862, "epoch": 337} {"train_loss": -29.432083129882812, "global_step": 40863, "epoch": 337} {"train_loss": -28.631229400634766, "global_step": 40864, "epoch": 337} {"train_loss": -28.798009872436523, "global_step": 40865, "epoch": 337} {"train_loss": -27.006820678710938, "global_step": 40866, "epoch": 337} {"train_loss": -16.18922233581543, "global_step": 40867, "epoch": 337} {"train_loss": -26.7895450592041, "global_step": 40868, "epoch": 337} {"train_loss": -26.229272842407227, "global_step": 40869, "epoch": 337} {"train_loss": -29.30036735534668, "global_step": 40870, "epoch": 337} {"train_loss": -27.149566650390625, "global_step": 40871, "epoch": 337} {"train_loss": -29.48538589477539, "global_step": 40872, "epoch": 337} {"train_loss": -29.65924072265625, "global_step": 40873, "epoch": 337} {"train_loss": -26.582965850830078, "global_step": 40874, "epoch": 337} {"train_loss": -28.713275909423828, "global_step": 40875, "epoch": 337} {"train_loss": -30.700910568237305, "global_step": 40876, "epoch": 337} {"train_loss": -29.601865768432617, "global_step": 40877, "epoch": 337} {"train_loss": -30.3200626373291, "global_step": 40878, "epoch": 337} {"train_loss": -30.3634090423584, "global_step": 40879, "epoch": 337} {"train_loss": -30.202014923095703, "global_step": 40880, "epoch": 337} {"train_loss": -30.868070602416992, "global_step": 40881, "epoch": 337} {"train_loss": -29.00715446472168, "global_step": 40882, "epoch": 337} {"train_loss": -23.537120819091797, "global_step": 40883, "epoch": 337} {"train_loss": -22.006330490112305, "global_step": 40884, "epoch": 337} {"train_loss": -28.740863800048828, "global_step": 40885, "epoch": 337} {"train_loss": -21.05209732055664, "global_step": 40886, "epoch": 337} {"train_loss": -23.426740646362305, "global_step": 40887, "epoch": 337} {"train_loss": -30.243000030517578, "global_step": 40888, "epoch": 337} {"train_loss": -23.88701820373535, "global_step": 40889, "epoch": 337} {"train_loss": -28.424896240234375, "global_step": 40890, "epoch": 337} {"train_loss": -30.511808395385742, "global_step": 40891, "epoch": 337} {"train_loss": -28.62302589416504, "global_step": 40892, "epoch": 337} {"train_loss": -28.28278923034668, "global_step": 40893, "epoch": 337} {"train_loss": -30.03447914123535, "global_step": 40894, "epoch": 337} {"train_loss": -30.597375869750977, "global_step": 40895, "epoch": 337} {"train_loss": -30.478179931640625, "global_step": 40896, "epoch": 337} {"train_loss": -31.050419641920357, "global_step": 40897, "epoch": 337, "val_loss": 2595908.5} {"train_loss": -30.277822494506836, "global_step": 40898, "epoch": 338} {"train_loss": -29.891864776611328, "global_step": 40899, "epoch": 338} {"train_loss": -30.327062606811523, "global_step": 40900, "epoch": 338} {"train_loss": -30.68369483947754, "global_step": 40901, "epoch": 338} {"train_loss": -31.001026153564453, "global_step": 40902, "epoch": 338} {"train_loss": -31.2447509765625, "global_step": 40903, "epoch": 338} {"train_loss": -30.73076820373535, "global_step": 40904, "epoch": 338} {"train_loss": -30.892133712768555, "global_step": 40905, "epoch": 338} {"train_loss": -31.0262508392334, "global_step": 40906, "epoch": 338} {"train_loss": -30.718368530273438, "global_step": 40907, "epoch": 338} {"train_loss": -30.806793212890625, "global_step": 40908, "epoch": 338} {"train_loss": -30.553861618041992, "global_step": 40909, "epoch": 338} {"train_loss": -31.61322593688965, "global_step": 40910, "epoch": 338} {"train_loss": -31.21079444885254, "global_step": 40911, "epoch": 338} {"train_loss": -28.06693458557129, "global_step": 40912, "epoch": 338} {"train_loss": -32.0586051940918, "global_step": 40913, "epoch": 338} {"train_loss": -27.85027503967285, "global_step": 40914, "epoch": 338} {"train_loss": -32.0457649230957, "global_step": 40915, "epoch": 338} {"train_loss": -27.795331954956055, "global_step": 40916, "epoch": 338} {"train_loss": -31.65399169921875, "global_step": 40917, "epoch": 338} {"train_loss": -30.97275161743164, "global_step": 40918, "epoch": 338} {"train_loss": -31.76259422302246, "global_step": 40919, "epoch": 338} {"train_loss": -31.42915153503418, "global_step": 40920, "epoch": 338} {"train_loss": -30.846715927124023, "global_step": 40921, "epoch": 338} {"train_loss": -31.261743545532227, "global_step": 40922, "epoch": 338} {"train_loss": -31.226612091064453, "global_step": 40923, "epoch": 338} {"train_loss": -30.82366371154785, "global_step": 40924, "epoch": 338} {"train_loss": -27.276411056518555, "global_step": 40925, "epoch": 338} {"train_loss": -27.413593292236328, "global_step": 40926, "epoch": 338} {"train_loss": -32.04570007324219, "global_step": 40927, "epoch": 338} {"train_loss": -29.716781616210938, "global_step": 40928, "epoch": 338} {"train_loss": -31.306644439697266, "global_step": 40929, "epoch": 338} {"train_loss": -30.848358154296875, "global_step": 40930, "epoch": 338} {"train_loss": -31.7529354095459, "global_step": 40931, "epoch": 338} {"train_loss": -32.476600646972656, "global_step": 40932, "epoch": 338} {"train_loss": -31.481779098510742, "global_step": 40933, "epoch": 338} {"train_loss": -32.52097702026367, "global_step": 40934, "epoch": 338} {"train_loss": -32.73188018798828, "global_step": 40935, "epoch": 338} {"train_loss": -32.01459503173828, "global_step": 40936, "epoch": 338} {"train_loss": -32.682918548583984, "global_step": 40937, "epoch": 338} {"train_loss": -33.18778991699219, "global_step": 40938, "epoch": 338} {"train_loss": -32.45033645629883, "global_step": 40939, "epoch": 338} {"train_loss": -32.49087142944336, "global_step": 40940, "epoch": 338} {"train_loss": -33.38009262084961, "global_step": 40941, "epoch": 338} {"train_loss": -33.57793045043945, "global_step": 40942, "epoch": 338} {"train_loss": -33.3161735534668, "global_step": 40943, "epoch": 338} {"train_loss": -32.90861129760742, "global_step": 40944, "epoch": 338} {"train_loss": -33.54416275024414, "global_step": 40945, "epoch": 338} {"train_loss": -33.5302619934082, "global_step": 40946, "epoch": 338} {"train_loss": -34.04948043823242, "global_step": 40947, "epoch": 338} {"train_loss": -33.65406036376953, "global_step": 40948, "epoch": 338} {"train_loss": -32.874263763427734, "global_step": 40949, "epoch": 338} {"train_loss": -33.553401947021484, "global_step": 40950, "epoch": 338} {"train_loss": -33.830387115478516, "global_step": 40951, "epoch": 338} {"train_loss": -34.038604736328125, "global_step": 40952, "epoch": 338} {"train_loss": -33.997920989990234, "global_step": 40953, "epoch": 338} {"train_loss": -34.08535385131836, "global_step": 40954, "epoch": 338} {"train_loss": -33.70450210571289, "global_step": 40955, "epoch": 338} {"train_loss": -33.474029541015625, "global_step": 40956, "epoch": 338} {"train_loss": -33.914554595947266, "global_step": 40957, "epoch": 338} {"train_loss": -34.06483840942383, "global_step": 40958, "epoch": 338} {"train_loss": -34.146148681640625, "global_step": 40959, "epoch": 338} {"train_loss": -34.10506057739258, "global_step": 40960, "epoch": 338} {"train_loss": -33.980133056640625, "global_step": 40961, "epoch": 338} {"train_loss": -33.80483627319336, "global_step": 40962, "epoch": 338} {"train_loss": -34.49311065673828, "global_step": 40963, "epoch": 338} {"train_loss": -33.46914291381836, "global_step": 40964, "epoch": 338} {"train_loss": -33.5507926940918, "global_step": 40965, "epoch": 338} {"train_loss": -34.39506149291992, "global_step": 40966, "epoch": 338} {"train_loss": -34.118324279785156, "global_step": 40967, "epoch": 338} {"train_loss": -33.5549201965332, "global_step": 40968, "epoch": 338} {"train_loss": -34.03093338012695, "global_step": 40969, "epoch": 338} {"train_loss": -34.06825637817383, "global_step": 40970, "epoch": 338} {"train_loss": -33.520503997802734, "global_step": 40971, "epoch": 338} {"train_loss": -33.877967834472656, "global_step": 40972, "epoch": 338} {"train_loss": -32.52877426147461, "global_step": 40973, "epoch": 338} {"train_loss": -33.47248077392578, "global_step": 40974, "epoch": 338} {"train_loss": -33.49903106689453, "global_step": 40975, "epoch": 338} {"train_loss": -33.62543869018555, "global_step": 40976, "epoch": 338} {"train_loss": -33.82332229614258, "global_step": 40977, "epoch": 338} {"train_loss": -34.175498962402344, "global_step": 40978, "epoch": 338} {"train_loss": -34.2674446105957, "global_step": 40979, "epoch": 338} {"train_loss": -34.16947555541992, "global_step": 40980, "epoch": 338} {"train_loss": -33.90603256225586, "global_step": 40981, "epoch": 338} {"train_loss": -33.5407600402832, "global_step": 40982, "epoch": 338} {"train_loss": -33.24160385131836, "global_step": 40983, "epoch": 338} {"train_loss": -33.37935256958008, "global_step": 40984, "epoch": 338} {"train_loss": -34.27836227416992, "global_step": 40985, "epoch": 338} {"train_loss": -33.86408615112305, "global_step": 40986, "epoch": 338} {"train_loss": -33.41472244262695, "global_step": 40987, "epoch": 338} {"train_loss": -33.769630432128906, "global_step": 40988, "epoch": 338} {"train_loss": -33.55446243286133, "global_step": 40989, "epoch": 338} {"train_loss": -33.11152267456055, "global_step": 40990, "epoch": 338} {"train_loss": -32.80584716796875, "global_step": 40991, "epoch": 338} {"train_loss": -32.98247528076172, "global_step": 40992, "epoch": 338} {"train_loss": -33.51418685913086, "global_step": 40993, "epoch": 338} {"train_loss": -33.9804573059082, "global_step": 40994, "epoch": 338} {"train_loss": -32.77359390258789, "global_step": 40995, "epoch": 338} {"train_loss": -33.824241638183594, "global_step": 40996, "epoch": 338} {"train_loss": -34.10444259643555, "global_step": 40997, "epoch": 338} {"train_loss": -33.24056625366211, "global_step": 40998, "epoch": 338} {"train_loss": -34.027523040771484, "global_step": 40999, "epoch": 338} {"train_loss": -33.78971862792969, "global_step": 41000, "epoch": 338} {"train_loss": -33.5693473815918, "global_step": 41001, "epoch": 338} {"train_loss": -33.50160598754883, "global_step": 41002, "epoch": 338} {"train_loss": -33.887081146240234, "global_step": 41003, "epoch": 338} {"train_loss": -33.932098388671875, "global_step": 41004, "epoch": 338} {"train_loss": -33.97141647338867, "global_step": 41005, "epoch": 338} {"train_loss": -34.13663864135742, "global_step": 41006, "epoch": 338} {"train_loss": -34.322837829589844, "global_step": 41007, "epoch": 338} {"train_loss": -34.394073486328125, "global_step": 41008, "epoch": 338} {"train_loss": -33.824947357177734, "global_step": 41009, "epoch": 338} {"train_loss": -34.421356201171875, "global_step": 41010, "epoch": 338} {"train_loss": -34.22935104370117, "global_step": 41011, "epoch": 338} {"train_loss": -34.32229232788086, "global_step": 41012, "epoch": 338} {"train_loss": -34.498023986816406, "global_step": 41013, "epoch": 338} {"train_loss": -34.06881332397461, "global_step": 41014, "epoch": 338} {"train_loss": -34.3096923828125, "global_step": 41015, "epoch": 338} {"train_loss": -34.432403564453125, "global_step": 41016, "epoch": 338} {"train_loss": -34.33561325073242, "global_step": 41017, "epoch": 338} {"train_loss": -32.78652780706232, "global_step": 41018, "epoch": 338, "val_loss": 2536332.75} {"train_loss": -34.528865814208984, "global_step": 41019, "epoch": 339} {"train_loss": -34.624908447265625, "global_step": 41020, "epoch": 339} {"train_loss": -34.10496139526367, "global_step": 41021, "epoch": 339} {"train_loss": -34.550655364990234, "global_step": 41022, "epoch": 339} {"train_loss": -34.33992385864258, "global_step": 41023, "epoch": 339} {"train_loss": -34.1679573059082, "global_step": 41024, "epoch": 339} {"train_loss": -34.38140869140625, "global_step": 41025, "epoch": 339} {"train_loss": -34.39379119873047, "global_step": 41026, "epoch": 339} {"train_loss": -34.3032341003418, "global_step": 41027, "epoch": 339} {"train_loss": -34.1735725402832, "global_step": 41028, "epoch": 339} {"train_loss": -34.48556137084961, "global_step": 41029, "epoch": 339} {"train_loss": -33.9017219543457, "global_step": 41030, "epoch": 339} {"train_loss": -34.29339599609375, "global_step": 41031, "epoch": 339} {"train_loss": -33.08054733276367, "global_step": 41032, "epoch": 339} {"train_loss": -31.7493839263916, "global_step": 41033, "epoch": 339} {"train_loss": -32.74055099487305, "global_step": 41034, "epoch": 339} {"train_loss": -34.500083923339844, "global_step": 41035, "epoch": 339} {"train_loss": -33.68343734741211, "global_step": 41036, "epoch": 339} {"train_loss": -33.7036247253418, "global_step": 41037, "epoch": 339} {"train_loss": -33.18757247924805, "global_step": 41038, "epoch": 339} {"train_loss": -32.851531982421875, "global_step": 41039, "epoch": 339} {"train_loss": -34.11396026611328, "global_step": 41040, "epoch": 339} {"train_loss": -34.51576614379883, "global_step": 41041, "epoch": 339} {"train_loss": -33.76129150390625, "global_step": 41042, "epoch": 339} {"train_loss": -32.12212371826172, "global_step": 41043, "epoch": 339} {"train_loss": -34.2686767578125, "global_step": 41044, "epoch": 339} {"train_loss": -34.12614822387695, "global_step": 41045, "epoch": 339} {"train_loss": -34.40815734863281, "global_step": 41046, "epoch": 339} {"train_loss": -34.19338607788086, "global_step": 41047, "epoch": 339} {"train_loss": -34.20682907104492, "global_step": 41048, "epoch": 339} {"train_loss": -34.73813247680664, "global_step": 41049, "epoch": 339} {"train_loss": -34.454891204833984, "global_step": 41050, "epoch": 339} {"train_loss": -34.742610931396484, "global_step": 41051, "epoch": 339} {"train_loss": -34.5572395324707, "global_step": 41052, "epoch": 339} {"train_loss": -34.983516693115234, "global_step": 41053, "epoch": 339} {"train_loss": -35.02973556518555, "global_step": 41054, "epoch": 339} {"train_loss": -34.80076217651367, "global_step": 41055, "epoch": 339} {"train_loss": -34.458858489990234, "global_step": 41056, "epoch": 339} {"train_loss": -34.699851989746094, "global_step": 41057, "epoch": 339} {"train_loss": -34.89408493041992, "global_step": 41058, "epoch": 339} {"train_loss": -34.910003662109375, "global_step": 41059, "epoch": 339} {"train_loss": -34.54951095581055, "global_step": 41060, "epoch": 339} {"train_loss": -34.270111083984375, "global_step": 41061, "epoch": 339} {"train_loss": -34.612300872802734, "global_step": 41062, "epoch": 339} {"train_loss": -34.07242202758789, "global_step": 41063, "epoch": 339} {"train_loss": -34.73240280151367, "global_step": 41064, "epoch": 339} {"train_loss": -34.57561111450195, "global_step": 41065, "epoch": 339} {"train_loss": -33.513362884521484, "global_step": 41066, "epoch": 339} {"train_loss": -32.783668518066406, "global_step": 41067, "epoch": 339} {"train_loss": -33.44243240356445, "global_step": 41068, "epoch": 339} {"train_loss": -33.305908203125, "global_step": 41069, "epoch": 339} {"train_loss": -30.91645622253418, "global_step": 41070, "epoch": 339} {"train_loss": -29.15321159362793, "global_step": 41071, "epoch": 339} {"train_loss": -22.76137351989746, "global_step": 41072, "epoch": 339} {"train_loss": -24.657602310180664, "global_step": 41073, "epoch": 339} {"train_loss": -28.51936149597168, "global_step": 41074, "epoch": 339} {"train_loss": -26.384912490844727, "global_step": 41075, "epoch": 339} {"train_loss": -28.2927188873291, "global_step": 41076, "epoch": 339} {"train_loss": -29.4747371673584, "global_step": 41077, "epoch": 339} {"train_loss": -28.448978424072266, "global_step": 41078, "epoch": 339} {"train_loss": -29.721662521362305, "global_step": 41079, "epoch": 339} {"train_loss": -28.70452880859375, "global_step": 41080, "epoch": 339} {"train_loss": -28.828657150268555, "global_step": 41081, "epoch": 339} {"train_loss": -29.930585861206055, "global_step": 41082, "epoch": 339} {"train_loss": -30.19703483581543, "global_step": 41083, "epoch": 339} {"train_loss": -29.8691349029541, "global_step": 41084, "epoch": 339} {"train_loss": -30.32293128967285, "global_step": 41085, "epoch": 339} {"train_loss": -30.016651153564453, "global_step": 41086, "epoch": 339} {"train_loss": -30.116422653198242, "global_step": 41087, "epoch": 339} {"train_loss": -30.769250869750977, "global_step": 41088, "epoch": 339} {"train_loss": -30.621601104736328, "global_step": 41089, "epoch": 339} {"train_loss": -31.338077545166016, "global_step": 41090, "epoch": 339} {"train_loss": -30.584583282470703, "global_step": 41091, "epoch": 339} {"train_loss": -30.189382553100586, "global_step": 41092, "epoch": 339} {"train_loss": -21.25855255126953, "global_step": 41093, "epoch": 339} {"train_loss": -1.3679296970367432, "global_step": 41094, "epoch": 339} {"train_loss": -30.6959171295166, "global_step": 41095, "epoch": 339} {"train_loss": -13.560256958007812, "global_step": 41096, "epoch": 339} {"train_loss": -31.784698486328125, "global_step": 41097, "epoch": 339} {"train_loss": -22.346616744995117, "global_step": 41098, "epoch": 339} {"train_loss": -26.695301055908203, "global_step": 41099, "epoch": 339} {"train_loss": -31.32988929748535, "global_step": 41100, "epoch": 339} {"train_loss": -28.85965919494629, "global_step": 41101, "epoch": 339} {"train_loss": -27.459110260009766, "global_step": 41102, "epoch": 339} {"train_loss": -29.782608032226562, "global_step": 41103, "epoch": 339} {"train_loss": -31.5872745513916, "global_step": 41104, "epoch": 339} {"train_loss": -31.31879234313965, "global_step": 41105, "epoch": 339} {"train_loss": -29.79781150817871, "global_step": 41106, "epoch": 339} {"train_loss": -30.15559196472168, "global_step": 41107, "epoch": 339} {"train_loss": -30.895950317382812, "global_step": 41108, "epoch": 339} {"train_loss": -31.432798385620117, "global_step": 41109, "epoch": 339} {"train_loss": -31.47635841369629, "global_step": 41110, "epoch": 339} {"train_loss": -31.170007705688477, "global_step": 41111, "epoch": 339} {"train_loss": -28.35268211364746, "global_step": 41112, "epoch": 339} {"train_loss": -19.205814361572266, "global_step": 41113, "epoch": 339} {"train_loss": -19.673294067382812, "global_step": 41114, "epoch": 339} {"train_loss": -25.864013671875, "global_step": 41115, "epoch": 339} {"train_loss": -19.867565155029297, "global_step": 41116, "epoch": 339} {"train_loss": -23.052658081054688, "global_step": 41117, "epoch": 339} {"train_loss": -30.420413970947266, "global_step": 41118, "epoch": 339} {"train_loss": -25.347440719604492, "global_step": 41119, "epoch": 339} {"train_loss": -25.804914474487305, "global_step": 41120, "epoch": 339} {"train_loss": -30.227588653564453, "global_step": 41121, "epoch": 339} {"train_loss": -30.05047607421875, "global_step": 41122, "epoch": 339} {"train_loss": -28.66080093383789, "global_step": 41123, "epoch": 339} {"train_loss": -27.9965877532959, "global_step": 41124, "epoch": 339} {"train_loss": -30.055377960205078, "global_step": 41125, "epoch": 339} {"train_loss": -30.454687118530273, "global_step": 41126, "epoch": 339} {"train_loss": -31.57550048828125, "global_step": 41127, "epoch": 339} {"train_loss": -31.281492233276367, "global_step": 41128, "epoch": 339} {"train_loss": -30.9683780670166, "global_step": 41129, "epoch": 339} {"train_loss": -31.091171264648438, "global_step": 41130, "epoch": 339} {"train_loss": -30.76906394958496, "global_step": 41131, "epoch": 339} {"train_loss": -30.6359806060791, "global_step": 41132, "epoch": 339} {"train_loss": -31.3814754486084, "global_step": 41133, "epoch": 339} {"train_loss": -31.227935791015625, "global_step": 41134, "epoch": 339} {"train_loss": -31.544458389282227, "global_step": 41135, "epoch": 339} {"train_loss": -31.580307006835938, "global_step": 41136, "epoch": 339} {"train_loss": -31.09328269958496, "global_step": 41137, "epoch": 339} {"train_loss": -32.169918060302734, "global_step": 41138, "epoch": 339} {"train_loss": -30.782699019455713, "global_step": 41139, "epoch": 339, "val_loss": 2505186.75} {"train_loss": -32.27278518676758, "global_step": 41140, "epoch": 340} {"train_loss": -32.12390899658203, "global_step": 41141, "epoch": 340} {"train_loss": -31.67824363708496, "global_step": 41142, "epoch": 340} {"train_loss": -31.596561431884766, "global_step": 41143, "epoch": 340} {"train_loss": -32.119869232177734, "global_step": 41144, "epoch": 340} {"train_loss": -32.0303840637207, "global_step": 41145, "epoch": 340} {"train_loss": -32.771018981933594, "global_step": 41146, "epoch": 340} {"train_loss": -32.04362487792969, "global_step": 41147, "epoch": 340} {"train_loss": -32.26658248901367, "global_step": 41148, "epoch": 340} {"train_loss": -32.57861328125, "global_step": 41149, "epoch": 340} {"train_loss": -32.53477096557617, "global_step": 41150, "epoch": 340} {"train_loss": -32.74412155151367, "global_step": 41151, "epoch": 340} {"train_loss": -32.506900787353516, "global_step": 41152, "epoch": 340} {"train_loss": -32.448097229003906, "global_step": 41153, "epoch": 340} {"train_loss": -32.2535514831543, "global_step": 41154, "epoch": 340} {"train_loss": -32.3399772644043, "global_step": 41155, "epoch": 340} {"train_loss": -32.4415397644043, "global_step": 41156, "epoch": 340} {"train_loss": -32.047977447509766, "global_step": 41157, "epoch": 340} {"train_loss": -33.142784118652344, "global_step": 41158, "epoch": 340} {"train_loss": -33.17361831665039, "global_step": 41159, "epoch": 340} {"train_loss": -32.8849983215332, "global_step": 41160, "epoch": 340} {"train_loss": -32.9109992980957, "global_step": 41161, "epoch": 340} {"train_loss": -30.963708877563477, "global_step": 41162, "epoch": 340} {"train_loss": -32.8698616027832, "global_step": 41163, "epoch": 340} {"train_loss": -33.22764205932617, "global_step": 41164, "epoch": 340} {"train_loss": -32.133766174316406, "global_step": 41165, "epoch": 340} {"train_loss": -31.714771270751953, "global_step": 41166, "epoch": 340} {"train_loss": -32.20899963378906, "global_step": 41167, "epoch": 340} {"train_loss": -32.88893508911133, "global_step": 41168, "epoch": 340} {"train_loss": -32.11574935913086, "global_step": 41169, "epoch": 340} {"train_loss": -32.57823944091797, "global_step": 41170, "epoch": 340} {"train_loss": -32.74748229980469, "global_step": 41171, "epoch": 340} {"train_loss": -32.00725555419922, "global_step": 41172, "epoch": 340} {"train_loss": -32.25301742553711, "global_step": 41173, "epoch": 340} {"train_loss": -32.73971176147461, "global_step": 41174, "epoch": 340} {"train_loss": -33.339473724365234, "global_step": 41175, "epoch": 340} {"train_loss": -33.13717269897461, "global_step": 41176, "epoch": 340} {"train_loss": -32.68717575073242, "global_step": 41177, "epoch": 340} {"train_loss": -32.9401741027832, "global_step": 41178, "epoch": 340} {"train_loss": -33.1728401184082, "global_step": 41179, "epoch": 340} {"train_loss": -32.953857421875, "global_step": 41180, "epoch": 340} {"train_loss": -29.02251625061035, "global_step": 41181, "epoch": 340} {"train_loss": -29.632709503173828, "global_step": 41182, "epoch": 340} {"train_loss": -32.45304489135742, "global_step": 41183, "epoch": 340} {"train_loss": -32.5092887878418, "global_step": 41184, "epoch": 340} {"train_loss": -32.496238708496094, "global_step": 41185, "epoch": 340} {"train_loss": -32.186614990234375, "global_step": 41186, "epoch": 340} {"train_loss": -32.51655197143555, "global_step": 41187, "epoch": 340} {"train_loss": -32.18659591674805, "global_step": 41188, "epoch": 340} {"train_loss": -32.4146842956543, "global_step": 41189, "epoch": 340} {"train_loss": -32.81937026977539, "global_step": 41190, "epoch": 340} {"train_loss": -29.839263916015625, "global_step": 41191, "epoch": 340} {"train_loss": -32.28449630737305, "global_step": 41192, "epoch": 340} {"train_loss": -33.06895065307617, "global_step": 41193, "epoch": 340} {"train_loss": -32.142147064208984, "global_step": 41194, "epoch": 340} {"train_loss": -31.444793701171875, "global_step": 41195, "epoch": 340} {"train_loss": -30.72588539123535, "global_step": 41196, "epoch": 340} {"train_loss": -28.76731300354004, "global_step": 41197, "epoch": 340} {"train_loss": -32.38493347167969, "global_step": 41198, "epoch": 340} {"train_loss": -31.338972091674805, "global_step": 41199, "epoch": 340} {"train_loss": -32.057613372802734, "global_step": 41200, "epoch": 340} {"train_loss": -31.35330581665039, "global_step": 41201, "epoch": 340} {"train_loss": -32.12392807006836, "global_step": 41202, "epoch": 340} {"train_loss": -31.863285064697266, "global_step": 41203, "epoch": 340} {"train_loss": -32.45630645751953, "global_step": 41204, "epoch": 340} {"train_loss": -32.28318405151367, "global_step": 41205, "epoch": 340} {"train_loss": -32.919857025146484, "global_step": 41206, "epoch": 340} {"train_loss": -32.42849349975586, "global_step": 41207, "epoch": 340} {"train_loss": -33.01253890991211, "global_step": 41208, "epoch": 340} {"train_loss": -32.699851989746094, "global_step": 41209, "epoch": 340} {"train_loss": -32.87593078613281, "global_step": 41210, "epoch": 340} {"train_loss": -33.173763275146484, "global_step": 41211, "epoch": 340} {"train_loss": -32.96522903442383, "global_step": 41212, "epoch": 340} {"train_loss": -32.00509262084961, "global_step": 41213, "epoch": 340} {"train_loss": -31.814985275268555, "global_step": 41214, "epoch": 340} {"train_loss": -32.8950309753418, "global_step": 41215, "epoch": 340} {"train_loss": -32.491249084472656, "global_step": 41216, "epoch": 340} {"train_loss": -32.0248908996582, "global_step": 41217, "epoch": 340} {"train_loss": -33.53939437866211, "global_step": 41218, "epoch": 340} {"train_loss": -32.921112060546875, "global_step": 41219, "epoch": 340} {"train_loss": -33.12199020385742, "global_step": 41220, "epoch": 340} {"train_loss": -32.735694885253906, "global_step": 41221, "epoch": 340} {"train_loss": -33.52348709106445, "global_step": 41222, "epoch": 340} {"train_loss": -33.207027435302734, "global_step": 41223, "epoch": 340} {"train_loss": -33.092071533203125, "global_step": 41224, "epoch": 340} {"train_loss": -33.53683090209961, "global_step": 41225, "epoch": 340} {"train_loss": -33.5327033996582, "global_step": 41226, "epoch": 340} {"train_loss": -34.1037712097168, "global_step": 41227, "epoch": 340} {"train_loss": -33.72011947631836, "global_step": 41228, "epoch": 340} {"train_loss": -33.38434982299805, "global_step": 41229, "epoch": 340} {"train_loss": -33.838722229003906, "global_step": 41230, "epoch": 340} {"train_loss": -32.87501907348633, "global_step": 41231, "epoch": 340} {"train_loss": -33.548824310302734, "global_step": 41232, "epoch": 340} {"train_loss": -34.10233688354492, "global_step": 41233, "epoch": 340} {"train_loss": -34.143592834472656, "global_step": 41234, "epoch": 340} {"train_loss": -34.17740249633789, "global_step": 41235, "epoch": 340} {"train_loss": -34.14915084838867, "global_step": 41236, "epoch": 340} {"train_loss": -33.9923210144043, "global_step": 41237, "epoch": 340} {"train_loss": -34.261146545410156, "global_step": 41238, "epoch": 340} {"train_loss": -34.1317253112793, "global_step": 41239, "epoch": 340} {"train_loss": -33.32600021362305, "global_step": 41240, "epoch": 340} {"train_loss": -34.34758377075195, "global_step": 41241, "epoch": 340} {"train_loss": -34.288326263427734, "global_step": 41242, "epoch": 340} {"train_loss": -34.43174362182617, "global_step": 41243, "epoch": 340} {"train_loss": -33.99098587036133, "global_step": 41244, "epoch": 340} {"train_loss": -33.94692611694336, "global_step": 41245, "epoch": 340} {"train_loss": -34.00330352783203, "global_step": 41246, "epoch": 340} {"train_loss": -33.98659133911133, "global_step": 41247, "epoch": 340} {"train_loss": -33.65877151489258, "global_step": 41248, "epoch": 340} {"train_loss": -33.90373611450195, "global_step": 41249, "epoch": 340} {"train_loss": -34.380706787109375, "global_step": 41250, "epoch": 340} {"train_loss": -33.94907760620117, "global_step": 41251, "epoch": 340} {"train_loss": -34.70454025268555, "global_step": 41252, "epoch": 340} {"train_loss": -34.388206481933594, "global_step": 41253, "epoch": 340} {"train_loss": -34.142860412597656, "global_step": 41254, "epoch": 340} {"train_loss": -34.08840560913086, "global_step": 41255, "epoch": 340} {"train_loss": -33.96513748168945, "global_step": 41256, "epoch": 340} {"train_loss": -33.32330322265625, "global_step": 41257, "epoch": 340} {"train_loss": -33.40891647338867, "global_step": 41258, "epoch": 340} {"train_loss": -34.17060470581055, "global_step": 41259, "epoch": 340} {"train_loss": -32.80457458811358, "global_step": 41260, "epoch": 340, "val_loss": 2632864.25} {"train_loss": -34.25972366333008, "global_step": 41261, "epoch": 341} {"train_loss": -33.872314453125, "global_step": 41262, "epoch": 341} {"train_loss": -33.635467529296875, "global_step": 41263, "epoch": 341} {"train_loss": -34.949825286865234, "global_step": 41264, "epoch": 341} {"train_loss": -33.491756439208984, "global_step": 41265, "epoch": 341} {"train_loss": -34.05130386352539, "global_step": 41266, "epoch": 341} {"train_loss": -34.67852783203125, "global_step": 41267, "epoch": 341} {"train_loss": -32.62058639526367, "global_step": 41268, "epoch": 341} {"train_loss": -32.49473190307617, "global_step": 41269, "epoch": 341} {"train_loss": -32.71845245361328, "global_step": 41270, "epoch": 341} {"train_loss": -26.533613204956055, "global_step": 41271, "epoch": 341} {"train_loss": -30.70574951171875, "global_step": 41272, "epoch": 341} {"train_loss": -25.72391700744629, "global_step": 41273, "epoch": 341} {"train_loss": -28.951040267944336, "global_step": 41274, "epoch": 341} {"train_loss": -24.642658233642578, "global_step": 41275, "epoch": 341} {"train_loss": -25.799142837524414, "global_step": 41276, "epoch": 341} {"train_loss": -20.453754425048828, "global_step": 41277, "epoch": 341} {"train_loss": -28.0671443939209, "global_step": 41278, "epoch": 341} {"train_loss": -30.87163734436035, "global_step": 41279, "epoch": 341} {"train_loss": -28.402151107788086, "global_step": 41280, "epoch": 341} {"train_loss": -31.615558624267578, "global_step": 41281, "epoch": 341} {"train_loss": -29.889907836914062, "global_step": 41282, "epoch": 341} {"train_loss": -31.294891357421875, "global_step": 41283, "epoch": 341} {"train_loss": -30.940185546875, "global_step": 41284, "epoch": 341} {"train_loss": -32.16202926635742, "global_step": 41285, "epoch": 341} {"train_loss": -30.83772087097168, "global_step": 41286, "epoch": 341} {"train_loss": -32.00200653076172, "global_step": 41287, "epoch": 341} {"train_loss": -32.19285202026367, "global_step": 41288, "epoch": 341} {"train_loss": -31.820636749267578, "global_step": 41289, "epoch": 341} {"train_loss": -32.12433624267578, "global_step": 41290, "epoch": 341} {"train_loss": -32.769142150878906, "global_step": 41291, "epoch": 341} {"train_loss": -32.006900787353516, "global_step": 41292, "epoch": 341} {"train_loss": -32.366371154785156, "global_step": 41293, "epoch": 341} {"train_loss": -32.52031707763672, "global_step": 41294, "epoch": 341} {"train_loss": -32.520172119140625, "global_step": 41295, "epoch": 341} {"train_loss": -32.88642501831055, "global_step": 41296, "epoch": 341} {"train_loss": -32.6741828918457, "global_step": 41297, "epoch": 341} {"train_loss": -32.4198112487793, "global_step": 41298, "epoch": 341} {"train_loss": -32.622467041015625, "global_step": 41299, "epoch": 341} {"train_loss": -32.963714599609375, "global_step": 41300, "epoch": 341} {"train_loss": -33.02277374267578, "global_step": 41301, "epoch": 341} {"train_loss": -33.051082611083984, "global_step": 41302, "epoch": 341} {"train_loss": -33.06854248046875, "global_step": 41303, "epoch": 341} {"train_loss": -32.73969650268555, "global_step": 41304, "epoch": 341} {"train_loss": -32.85917282104492, "global_step": 41305, "epoch": 341} {"train_loss": -33.3455924987793, "global_step": 41306, "epoch": 341} {"train_loss": -33.265785217285156, "global_step": 41307, "epoch": 341} {"train_loss": -33.46992111206055, "global_step": 41308, "epoch": 341} {"train_loss": -33.532752990722656, "global_step": 41309, "epoch": 341} {"train_loss": -33.30583572387695, "global_step": 41310, "epoch": 341} {"train_loss": -33.33330154418945, "global_step": 41311, "epoch": 341} {"train_loss": -33.46906280517578, "global_step": 41312, "epoch": 341} {"train_loss": -33.72563171386719, "global_step": 41313, "epoch": 341} {"train_loss": -33.249755859375, "global_step": 41314, "epoch": 341} {"train_loss": -33.33850860595703, "global_step": 41315, "epoch": 341} {"train_loss": -33.95024871826172, "global_step": 41316, "epoch": 341} {"train_loss": -33.74968338012695, "global_step": 41317, "epoch": 341} {"train_loss": -34.092506408691406, "global_step": 41318, "epoch": 341} {"train_loss": -34.0484733581543, "global_step": 41319, "epoch": 341} {"train_loss": -33.71438217163086, "global_step": 41320, "epoch": 341} {"train_loss": -33.94330978393555, "global_step": 41321, "epoch": 341} {"train_loss": -34.16566848754883, "global_step": 41322, "epoch": 341} {"train_loss": -34.2191047668457, "global_step": 41323, "epoch": 341} {"train_loss": -34.14143753051758, "global_step": 41324, "epoch": 341} {"train_loss": -34.38521194458008, "global_step": 41325, "epoch": 341} {"train_loss": -33.76040267944336, "global_step": 41326, "epoch": 341} {"train_loss": -33.715118408203125, "global_step": 41327, "epoch": 341} {"train_loss": -33.849674224853516, "global_step": 41328, "epoch": 341} {"train_loss": -34.73246765136719, "global_step": 41329, "epoch": 341} {"train_loss": -34.13524627685547, "global_step": 41330, "epoch": 341} {"train_loss": -34.2651481628418, "global_step": 41331, "epoch": 341} {"train_loss": -34.55510330200195, "global_step": 41332, "epoch": 341} {"train_loss": -34.77378463745117, "global_step": 41333, "epoch": 341} {"train_loss": -34.66866683959961, "global_step": 41334, "epoch": 341} {"train_loss": -34.2924919128418, "global_step": 41335, "epoch": 341} {"train_loss": -34.1688346862793, "global_step": 41336, "epoch": 341} {"train_loss": -33.89044952392578, "global_step": 41337, "epoch": 341} {"train_loss": -34.081241607666016, "global_step": 41338, "epoch": 341} {"train_loss": -33.373905181884766, "global_step": 41339, "epoch": 341} {"train_loss": -33.78947830200195, "global_step": 41340, "epoch": 341} {"train_loss": -34.89971923828125, "global_step": 41341, "epoch": 341} {"train_loss": -34.182979583740234, "global_step": 41342, "epoch": 341} {"train_loss": -33.07654571533203, "global_step": 41343, "epoch": 341} {"train_loss": -32.538902282714844, "global_step": 41344, "epoch": 341} {"train_loss": -34.23584747314453, "global_step": 41345, "epoch": 341} {"train_loss": -33.048580169677734, "global_step": 41346, "epoch": 341} {"train_loss": -32.4185676574707, "global_step": 41347, "epoch": 341} {"train_loss": -33.39288330078125, "global_step": 41348, "epoch": 341} {"train_loss": -34.1348762512207, "global_step": 41349, "epoch": 341} {"train_loss": -33.7853889465332, "global_step": 41350, "epoch": 341} {"train_loss": -33.886085510253906, "global_step": 41351, "epoch": 341} {"train_loss": -34.81848907470703, "global_step": 41352, "epoch": 341} {"train_loss": -34.607337951660156, "global_step": 41353, "epoch": 341} {"train_loss": -34.17556381225586, "global_step": 41354, "epoch": 341} {"train_loss": -34.798309326171875, "global_step": 41355, "epoch": 341} {"train_loss": -34.37183380126953, "global_step": 41356, "epoch": 341} {"train_loss": -34.82682800292969, "global_step": 41357, "epoch": 341} {"train_loss": -34.66777801513672, "global_step": 41358, "epoch": 341} {"train_loss": -33.55131530761719, "global_step": 41359, "epoch": 341} {"train_loss": -34.85552215576172, "global_step": 41360, "epoch": 341} {"train_loss": -34.417362213134766, "global_step": 41361, "epoch": 341} {"train_loss": -34.627376556396484, "global_step": 41362, "epoch": 341} {"train_loss": -34.52315902709961, "global_step": 41363, "epoch": 341} {"train_loss": -34.85710525512695, "global_step": 41364, "epoch": 341} {"train_loss": -34.852603912353516, "global_step": 41365, "epoch": 341} {"train_loss": -34.74589538574219, "global_step": 41366, "epoch": 341} {"train_loss": -34.67995071411133, "global_step": 41367, "epoch": 341} {"train_loss": -34.64272689819336, "global_step": 41368, "epoch": 341} {"train_loss": -34.66728973388672, "global_step": 41369, "epoch": 341} {"train_loss": -34.5167236328125, "global_step": 41370, "epoch": 341} {"train_loss": -33.77411651611328, "global_step": 41371, "epoch": 341} {"train_loss": -34.550411224365234, "global_step": 41372, "epoch": 341} {"train_loss": -34.45642852783203, "global_step": 41373, "epoch": 341} {"train_loss": -34.684810638427734, "global_step": 41374, "epoch": 341} {"train_loss": -34.48853302001953, "global_step": 41375, "epoch": 341} {"train_loss": -33.864009857177734, "global_step": 41376, "epoch": 341} {"train_loss": -35.03236389160156, "global_step": 41377, "epoch": 341} {"train_loss": -34.289546966552734, "global_step": 41378, "epoch": 341} {"train_loss": -34.24917221069336, "global_step": 41379, "epoch": 341} {"train_loss": -33.68996810913086, "global_step": 41380, "epoch": 341} {"train_loss": -33.082352756468715, "global_step": 41381, "epoch": 341, "val_loss": 2596489.75} {"train_loss": -34.758636474609375, "global_step": 41382, "epoch": 342} {"train_loss": -34.390785217285156, "global_step": 41383, "epoch": 342} {"train_loss": -34.198909759521484, "global_step": 41384, "epoch": 342} {"train_loss": -33.7531623840332, "global_step": 41385, "epoch": 342} {"train_loss": -34.59076690673828, "global_step": 41386, "epoch": 342} {"train_loss": -33.874549865722656, "global_step": 41387, "epoch": 342} {"train_loss": -34.116722106933594, "global_step": 41388, "epoch": 342} {"train_loss": -33.986106872558594, "global_step": 41389, "epoch": 342} {"train_loss": -34.54039764404297, "global_step": 41390, "epoch": 342} {"train_loss": -34.179046630859375, "global_step": 41391, "epoch": 342} {"train_loss": -34.54621124267578, "global_step": 41392, "epoch": 342} {"train_loss": -34.94856643676758, "global_step": 41393, "epoch": 342} {"train_loss": -34.45699691772461, "global_step": 41394, "epoch": 342} {"train_loss": -34.57783126831055, "global_step": 41395, "epoch": 342} {"train_loss": -33.99470901489258, "global_step": 41396, "epoch": 342} {"train_loss": -34.56804275512695, "global_step": 41397, "epoch": 342} {"train_loss": -33.80930709838867, "global_step": 41398, "epoch": 342} {"train_loss": -31.8725643157959, "global_step": 41399, "epoch": 342} {"train_loss": -34.21129608154297, "global_step": 41400, "epoch": 342} {"train_loss": -34.36343765258789, "global_step": 41401, "epoch": 342} {"train_loss": -34.85188674926758, "global_step": 41402, "epoch": 342} {"train_loss": -34.93159103393555, "global_step": 41403, "epoch": 342} {"train_loss": -34.888427734375, "global_step": 41404, "epoch": 342} {"train_loss": -34.544921875, "global_step": 41405, "epoch": 342} {"train_loss": -34.406036376953125, "global_step": 41406, "epoch": 342} {"train_loss": -34.86859130859375, "global_step": 41407, "epoch": 342} {"train_loss": -35.04214096069336, "global_step": 41408, "epoch": 342} {"train_loss": -35.0595817565918, "global_step": 41409, "epoch": 342} {"train_loss": -34.65443801879883, "global_step": 41410, "epoch": 342} {"train_loss": -34.70984649658203, "global_step": 41411, "epoch": 342} {"train_loss": -34.82780075073242, "global_step": 41412, "epoch": 342} {"train_loss": -34.564273834228516, "global_step": 41413, "epoch": 342} {"train_loss": -35.010677337646484, "global_step": 41414, "epoch": 342} {"train_loss": -34.530364990234375, "global_step": 41415, "epoch": 342} {"train_loss": -33.749755859375, "global_step": 41416, "epoch": 342} {"train_loss": -30.937849044799805, "global_step": 41417, "epoch": 342} {"train_loss": -21.39483642578125, "global_step": 41418, "epoch": 342} {"train_loss": 2.8293728828430176, "global_step": 41419, "epoch": 342} {"train_loss": 19.563077926635742, "global_step": 41420, "epoch": 342} {"train_loss": -31.2462158203125, "global_step": 41421, "epoch": 342} {"train_loss": -7.772263526916504, "global_step": 41422, "epoch": 342} {"train_loss": -31.2955265045166, "global_step": 41423, "epoch": 342} {"train_loss": -12.804858207702637, "global_step": 41424, "epoch": 342} {"train_loss": -31.791906356811523, "global_step": 41425, "epoch": 342} {"train_loss": -28.392120361328125, "global_step": 41426, "epoch": 342} {"train_loss": -23.370929718017578, "global_step": 41427, "epoch": 342} {"train_loss": -29.800079345703125, "global_step": 41428, "epoch": 342} {"train_loss": -32.39484786987305, "global_step": 41429, "epoch": 342} {"train_loss": -30.131864547729492, "global_step": 41430, "epoch": 342} {"train_loss": -28.93889808654785, "global_step": 41431, "epoch": 342} {"train_loss": -30.3138484954834, "global_step": 41432, "epoch": 342} {"train_loss": -32.762596130371094, "global_step": 41433, "epoch": 342} {"train_loss": -32.140472412109375, "global_step": 41434, "epoch": 342} {"train_loss": -32.94482421875, "global_step": 41435, "epoch": 342} {"train_loss": -31.299224853515625, "global_step": 41436, "epoch": 342} {"train_loss": -31.19654655456543, "global_step": 41437, "epoch": 342} {"train_loss": -32.04098129272461, "global_step": 41438, "epoch": 342} {"train_loss": -32.53251647949219, "global_step": 41439, "epoch": 342} {"train_loss": -32.28228759765625, "global_step": 41440, "epoch": 342} {"train_loss": -32.593048095703125, "global_step": 41441, "epoch": 342} {"train_loss": -32.84495162963867, "global_step": 41442, "epoch": 342} {"train_loss": -32.79026794433594, "global_step": 41443, "epoch": 342} {"train_loss": -32.758419036865234, "global_step": 41444, "epoch": 342} {"train_loss": -32.876953125, "global_step": 41445, "epoch": 342} {"train_loss": -32.91926574707031, "global_step": 41446, "epoch": 342} {"train_loss": -33.05024337768555, "global_step": 41447, "epoch": 342} {"train_loss": -32.911373138427734, "global_step": 41448, "epoch": 342} {"train_loss": -33.61323165893555, "global_step": 41449, "epoch": 342} {"train_loss": -33.53945541381836, "global_step": 41450, "epoch": 342} {"train_loss": -33.562530517578125, "global_step": 41451, "epoch": 342} {"train_loss": -32.966033935546875, "global_step": 41452, "epoch": 342} {"train_loss": -33.55660629272461, "global_step": 41453, "epoch": 342} {"train_loss": -33.620140075683594, "global_step": 41454, "epoch": 342} {"train_loss": -33.62002944946289, "global_step": 41455, "epoch": 342} {"train_loss": -33.712501525878906, "global_step": 41456, "epoch": 342} {"train_loss": -33.52083206176758, "global_step": 41457, "epoch": 342} {"train_loss": -34.040061950683594, "global_step": 41458, "epoch": 342} {"train_loss": -33.658451080322266, "global_step": 41459, "epoch": 342} {"train_loss": -33.64327621459961, "global_step": 41460, "epoch": 342} {"train_loss": -33.846092224121094, "global_step": 41461, "epoch": 342} {"train_loss": -34.0994987487793, "global_step": 41462, "epoch": 342} {"train_loss": -33.729095458984375, "global_step": 41463, "epoch": 342} {"train_loss": -34.062538146972656, "global_step": 41464, "epoch": 342} {"train_loss": -33.4251823425293, "global_step": 41465, "epoch": 342} {"train_loss": -34.51233673095703, "global_step": 41466, "epoch": 342} {"train_loss": -33.772518157958984, "global_step": 41467, "epoch": 342} {"train_loss": -33.83028793334961, "global_step": 41468, "epoch": 342} {"train_loss": -34.35969924926758, "global_step": 41469, "epoch": 342} {"train_loss": -34.39243698120117, "global_step": 41470, "epoch": 342} {"train_loss": -34.5181770324707, "global_step": 41471, "epoch": 342} {"train_loss": -34.25828170776367, "global_step": 41472, "epoch": 342} {"train_loss": -34.4011344909668, "global_step": 41473, "epoch": 342} {"train_loss": -34.33309555053711, "global_step": 41474, "epoch": 342} {"train_loss": -34.310550689697266, "global_step": 41475, "epoch": 342} {"train_loss": -34.28193283081055, "global_step": 41476, "epoch": 342} {"train_loss": -34.16496658325195, "global_step": 41477, "epoch": 342} {"train_loss": -34.45596694946289, "global_step": 41478, "epoch": 342} {"train_loss": -33.96265411376953, "global_step": 41479, "epoch": 342} {"train_loss": -34.43359375, "global_step": 41480, "epoch": 342} {"train_loss": -33.940799713134766, "global_step": 41481, "epoch": 342} {"train_loss": -34.592254638671875, "global_step": 41482, "epoch": 342} {"train_loss": -34.4824333190918, "global_step": 41483, "epoch": 342} {"train_loss": -34.19524383544922, "global_step": 41484, "epoch": 342} {"train_loss": -34.22553253173828, "global_step": 41485, "epoch": 342} {"train_loss": -34.101104736328125, "global_step": 41486, "epoch": 342} {"train_loss": -33.31279754638672, "global_step": 41487, "epoch": 342} {"train_loss": -32.481685638427734, "global_step": 41488, "epoch": 342} {"train_loss": -31.24531364440918, "global_step": 41489, "epoch": 342} {"train_loss": -31.074338912963867, "global_step": 41490, "epoch": 342} {"train_loss": -32.80567169189453, "global_step": 41491, "epoch": 342} {"train_loss": -31.3073787689209, "global_step": 41492, "epoch": 342} {"train_loss": -32.87895202636719, "global_step": 41493, "epoch": 342} {"train_loss": -32.82642364501953, "global_step": 41494, "epoch": 342} {"train_loss": -32.19866943359375, "global_step": 41495, "epoch": 342} {"train_loss": -30.94687271118164, "global_step": 41496, "epoch": 342} {"train_loss": -31.256330490112305, "global_step": 41497, "epoch": 342} {"train_loss": -31.65504264831543, "global_step": 41498, "epoch": 342} {"train_loss": -32.1225700378418, "global_step": 41499, "epoch": 342} {"train_loss": -30.404333114624023, "global_step": 41500, "epoch": 342} {"train_loss": -29.977710723876953, "global_step": 41501, "epoch": 342} {"train_loss": -31.998279630645246, "global_step": 41502, "epoch": 342, "val_loss": 2419257.25} {"train_loss": -31.77412223815918, "global_step": 41503, "epoch": 343} {"train_loss": -31.202014923095703, "global_step": 41504, "epoch": 343} {"train_loss": -32.59414291381836, "global_step": 41505, "epoch": 343} {"train_loss": -32.0700798034668, "global_step": 41506, "epoch": 343} {"train_loss": -32.17613220214844, "global_step": 41507, "epoch": 343} {"train_loss": -32.07777786254883, "global_step": 41508, "epoch": 343} {"train_loss": -32.10700225830078, "global_step": 41509, "epoch": 343} {"train_loss": -32.60136032104492, "global_step": 41510, "epoch": 343} {"train_loss": -32.512489318847656, "global_step": 41511, "epoch": 343} {"train_loss": -32.44361114501953, "global_step": 41512, "epoch": 343} {"train_loss": -32.4588737487793, "global_step": 41513, "epoch": 343} {"train_loss": -32.020530700683594, "global_step": 41514, "epoch": 343} {"train_loss": -32.254451751708984, "global_step": 41515, "epoch": 343} {"train_loss": -32.83281326293945, "global_step": 41516, "epoch": 343} {"train_loss": -32.322139739990234, "global_step": 41517, "epoch": 343} {"train_loss": -30.199390411376953, "global_step": 41518, "epoch": 343} {"train_loss": -30.692106246948242, "global_step": 41519, "epoch": 343} {"train_loss": -30.389301300048828, "global_step": 41520, "epoch": 343} {"train_loss": -30.227813720703125, "global_step": 41521, "epoch": 343} {"train_loss": -31.3946475982666, "global_step": 41522, "epoch": 343} {"train_loss": -29.064294815063477, "global_step": 41523, "epoch": 343} {"train_loss": -31.003820419311523, "global_step": 41524, "epoch": 343} {"train_loss": -31.213882446289062, "global_step": 41525, "epoch": 343} {"train_loss": -30.942428588867188, "global_step": 41526, "epoch": 343} {"train_loss": -32.264312744140625, "global_step": 41527, "epoch": 343} {"train_loss": -31.801733016967773, "global_step": 41528, "epoch": 343} {"train_loss": -32.33626174926758, "global_step": 41529, "epoch": 343} {"train_loss": -31.699491500854492, "global_step": 41530, "epoch": 343} {"train_loss": -32.689849853515625, "global_step": 41531, "epoch": 343} {"train_loss": -31.726825714111328, "global_step": 41532, "epoch": 343} {"train_loss": -31.856653213500977, "global_step": 41533, "epoch": 343} {"train_loss": -31.95688247680664, "global_step": 41534, "epoch": 343} {"train_loss": -32.9082145690918, "global_step": 41535, "epoch": 343} {"train_loss": -32.22813034057617, "global_step": 41536, "epoch": 343} {"train_loss": -32.68172836303711, "global_step": 41537, "epoch": 343} {"train_loss": -32.55817413330078, "global_step": 41538, "epoch": 343} {"train_loss": -32.731788635253906, "global_step": 41539, "epoch": 343} {"train_loss": -33.372955322265625, "global_step": 41540, "epoch": 343} {"train_loss": -33.26955795288086, "global_step": 41541, "epoch": 343} {"train_loss": -32.9588737487793, "global_step": 41542, "epoch": 343} {"train_loss": -33.082889556884766, "global_step": 41543, "epoch": 343} {"train_loss": -33.27350616455078, "global_step": 41544, "epoch": 343} {"train_loss": -32.9898796081543, "global_step": 41545, "epoch": 343} {"train_loss": -33.342529296875, "global_step": 41546, "epoch": 343} {"train_loss": -33.536964416503906, "global_step": 41547, "epoch": 343} {"train_loss": -33.414119720458984, "global_step": 41548, "epoch": 343} {"train_loss": -33.39160919189453, "global_step": 41549, "epoch": 343} {"train_loss": -33.15975570678711, "global_step": 41550, "epoch": 343} {"train_loss": -33.685546875, "global_step": 41551, "epoch": 343} {"train_loss": -33.74486541748047, "global_step": 41552, "epoch": 343} {"train_loss": -33.85897445678711, "global_step": 41553, "epoch": 343} {"train_loss": -33.671016693115234, "global_step": 41554, "epoch": 343} {"train_loss": -33.86293411254883, "global_step": 41555, "epoch": 343} {"train_loss": -33.89033889770508, "global_step": 41556, "epoch": 343} {"train_loss": -32.68370819091797, "global_step": 41557, "epoch": 343} {"train_loss": -33.89661407470703, "global_step": 41558, "epoch": 343} {"train_loss": -34.41012191772461, "global_step": 41559, "epoch": 343} {"train_loss": -33.7594108581543, "global_step": 41560, "epoch": 343} {"train_loss": -33.86118698120117, "global_step": 41561, "epoch": 343} {"train_loss": -33.409481048583984, "global_step": 41562, "epoch": 343} {"train_loss": -34.03679275512695, "global_step": 41563, "epoch": 343} {"train_loss": -34.22808837890625, "global_step": 41564, "epoch": 343} {"train_loss": -33.96506881713867, "global_step": 41565, "epoch": 343} {"train_loss": -34.01057815551758, "global_step": 41566, "epoch": 343} {"train_loss": -34.199066162109375, "global_step": 41567, "epoch": 343} {"train_loss": -34.09519577026367, "global_step": 41568, "epoch": 343} {"train_loss": -34.46644592285156, "global_step": 41569, "epoch": 343} {"train_loss": -34.66459274291992, "global_step": 41570, "epoch": 343} {"train_loss": -34.37061309814453, "global_step": 41571, "epoch": 343} {"train_loss": -34.87166213989258, "global_step": 41572, "epoch": 343} {"train_loss": -33.20024108886719, "global_step": 41573, "epoch": 343} {"train_loss": -31.985761642456055, "global_step": 41574, "epoch": 343} {"train_loss": -34.153717041015625, "global_step": 41575, "epoch": 343} {"train_loss": -34.59025955200195, "global_step": 41576, "epoch": 343} {"train_loss": -34.198055267333984, "global_step": 41577, "epoch": 343} {"train_loss": -33.93305206298828, "global_step": 41578, "epoch": 343} {"train_loss": -34.2346305847168, "global_step": 41579, "epoch": 343} {"train_loss": -34.164920806884766, "global_step": 41580, "epoch": 343} {"train_loss": -32.9782829284668, "global_step": 41581, "epoch": 343} {"train_loss": -32.890384674072266, "global_step": 41582, "epoch": 343} {"train_loss": -33.76030349731445, "global_step": 41583, "epoch": 343} {"train_loss": -34.109859466552734, "global_step": 41584, "epoch": 343} {"train_loss": -33.66059494018555, "global_step": 41585, "epoch": 343} {"train_loss": -33.16718673706055, "global_step": 41586, "epoch": 343} {"train_loss": -33.754459381103516, "global_step": 41587, "epoch": 343} {"train_loss": -33.36887741088867, "global_step": 41588, "epoch": 343} {"train_loss": -33.95645523071289, "global_step": 41589, "epoch": 343} {"train_loss": -32.13740158081055, "global_step": 41590, "epoch": 343} {"train_loss": -33.8538818359375, "global_step": 41591, "epoch": 343} {"train_loss": -32.37785720825195, "global_step": 41592, "epoch": 343} {"train_loss": -31.531591415405273, "global_step": 41593, "epoch": 343} {"train_loss": -33.617530822753906, "global_step": 41594, "epoch": 343} {"train_loss": -33.2320556640625, "global_step": 41595, "epoch": 343} {"train_loss": -32.87299728393555, "global_step": 41596, "epoch": 343} {"train_loss": -33.31364822387695, "global_step": 41597, "epoch": 343} {"train_loss": -33.65970993041992, "global_step": 41598, "epoch": 343} {"train_loss": -32.57160949707031, "global_step": 41599, "epoch": 343} {"train_loss": -31.284299850463867, "global_step": 41600, "epoch": 343} {"train_loss": -32.63429641723633, "global_step": 41601, "epoch": 343} {"train_loss": -32.74104690551758, "global_step": 41602, "epoch": 343} {"train_loss": -29.78608512878418, "global_step": 41603, "epoch": 343} {"train_loss": -31.430570602416992, "global_step": 41604, "epoch": 343} {"train_loss": -31.643360137939453, "global_step": 41605, "epoch": 343} {"train_loss": -32.75416946411133, "global_step": 41606, "epoch": 343} {"train_loss": -30.659423828125, "global_step": 41607, "epoch": 343} {"train_loss": -30.974796295166016, "global_step": 41608, "epoch": 343} {"train_loss": -31.331613540649414, "global_step": 41609, "epoch": 343} {"train_loss": -33.087303161621094, "global_step": 41610, "epoch": 343} {"train_loss": -31.53046226501465, "global_step": 41611, "epoch": 343} {"train_loss": -32.37443923950195, "global_step": 41612, "epoch": 343} {"train_loss": -31.389097213745117, "global_step": 41613, "epoch": 343} {"train_loss": -31.074020385742188, "global_step": 41614, "epoch": 343} {"train_loss": -32.54380798339844, "global_step": 41615, "epoch": 343} {"train_loss": -33.14449691772461, "global_step": 41616, "epoch": 343} {"train_loss": -32.48899841308594, "global_step": 41617, "epoch": 343} {"train_loss": -32.737098693847656, "global_step": 41618, "epoch": 343} {"train_loss": -32.82423782348633, "global_step": 41619, "epoch": 343} {"train_loss": -33.294219970703125, "global_step": 41620, "epoch": 343} {"train_loss": -32.75127410888672, "global_step": 41621, "epoch": 343} {"train_loss": -32.35966110229492, "global_step": 41622, "epoch": 343} {"train_loss": -32.75002645066947, "global_step": 41623, "epoch": 343, "val_loss": 2659085.75} {"train_loss": -33.017337799072266, "global_step": 41624, "epoch": 344} {"train_loss": -33.381351470947266, "global_step": 41625, "epoch": 344} {"train_loss": -32.19234848022461, "global_step": 41626, "epoch": 344} {"train_loss": -32.923397064208984, "global_step": 41627, "epoch": 344} {"train_loss": -33.08317184448242, "global_step": 41628, "epoch": 344} {"train_loss": -32.828529357910156, "global_step": 41629, "epoch": 344} {"train_loss": -33.497291564941406, "global_step": 41630, "epoch": 344} {"train_loss": -32.78802490234375, "global_step": 41631, "epoch": 344} {"train_loss": -33.15039825439453, "global_step": 41632, "epoch": 344} {"train_loss": -32.590728759765625, "global_step": 41633, "epoch": 344} {"train_loss": -33.692138671875, "global_step": 41634, "epoch": 344} {"train_loss": -33.182167053222656, "global_step": 41635, "epoch": 344} {"train_loss": -33.69594192504883, "global_step": 41636, "epoch": 344} {"train_loss": -33.692779541015625, "global_step": 41637, "epoch": 344} {"train_loss": -33.436279296875, "global_step": 41638, "epoch": 344} {"train_loss": -33.673091888427734, "global_step": 41639, "epoch": 344} {"train_loss": -33.852447509765625, "global_step": 41640, "epoch": 344} {"train_loss": -33.861610412597656, "global_step": 41641, "epoch": 344} {"train_loss": -33.70225143432617, "global_step": 41642, "epoch": 344} {"train_loss": -32.59281539916992, "global_step": 41643, "epoch": 344} {"train_loss": -33.68463134765625, "global_step": 41644, "epoch": 344} {"train_loss": -34.02436065673828, "global_step": 41645, "epoch": 344} {"train_loss": -33.53560256958008, "global_step": 41646, "epoch": 344} {"train_loss": -34.15861892700195, "global_step": 41647, "epoch": 344} {"train_loss": -34.07582473754883, "global_step": 41648, "epoch": 344} {"train_loss": -34.20962142944336, "global_step": 41649, "epoch": 344} {"train_loss": -34.21026611328125, "global_step": 41650, "epoch": 344} {"train_loss": -33.646846771240234, "global_step": 41651, "epoch": 344} {"train_loss": -34.0832633972168, "global_step": 41652, "epoch": 344} {"train_loss": -34.477943420410156, "global_step": 41653, "epoch": 344} {"train_loss": -34.31183624267578, "global_step": 41654, "epoch": 344} {"train_loss": -34.26728057861328, "global_step": 41655, "epoch": 344} {"train_loss": -34.47683334350586, "global_step": 41656, "epoch": 344} {"train_loss": -34.49702835083008, "global_step": 41657, "epoch": 344} {"train_loss": -34.439422607421875, "global_step": 41658, "epoch": 344} {"train_loss": -34.3748893737793, "global_step": 41659, "epoch": 344} {"train_loss": -34.396297454833984, "global_step": 41660, "epoch": 344} {"train_loss": -34.22569274902344, "global_step": 41661, "epoch": 344} {"train_loss": -34.54379653930664, "global_step": 41662, "epoch": 344} {"train_loss": -33.52858352661133, "global_step": 41663, "epoch": 344} {"train_loss": -34.37324142456055, "global_step": 41664, "epoch": 344} {"train_loss": -34.1437873840332, "global_step": 41665, "epoch": 344} {"train_loss": -34.147274017333984, "global_step": 41666, "epoch": 344} {"train_loss": -34.83677291870117, "global_step": 41667, "epoch": 344} {"train_loss": -34.093727111816406, "global_step": 41668, "epoch": 344} {"train_loss": -34.57688522338867, "global_step": 41669, "epoch": 344} {"train_loss": -34.52218246459961, "global_step": 41670, "epoch": 344} {"train_loss": -34.500240325927734, "global_step": 41671, "epoch": 344} {"train_loss": -34.493431091308594, "global_step": 41672, "epoch": 344} {"train_loss": -34.88285827636719, "global_step": 41673, "epoch": 344} {"train_loss": -34.95249557495117, "global_step": 41674, "epoch": 344} {"train_loss": -34.76836013793945, "global_step": 41675, "epoch": 344} {"train_loss": -33.80702209472656, "global_step": 41676, "epoch": 344} {"train_loss": -34.90391540527344, "global_step": 41677, "epoch": 344} {"train_loss": -34.24189376831055, "global_step": 41678, "epoch": 344} {"train_loss": -34.18765640258789, "global_step": 41679, "epoch": 344} {"train_loss": -33.90351486206055, "global_step": 41680, "epoch": 344} {"train_loss": -34.98869323730469, "global_step": 41681, "epoch": 344} {"train_loss": -34.65822219848633, "global_step": 41682, "epoch": 344} {"train_loss": -34.36210632324219, "global_step": 41683, "epoch": 344} {"train_loss": -33.99570846557617, "global_step": 41684, "epoch": 344} {"train_loss": -33.77806854248047, "global_step": 41685, "epoch": 344} {"train_loss": -34.355430603027344, "global_step": 41686, "epoch": 344} {"train_loss": -34.16567611694336, "global_step": 41687, "epoch": 344} {"train_loss": -30.86823081970215, "global_step": 41688, "epoch": 344} {"train_loss": -29.2100830078125, "global_step": 41689, "epoch": 344} {"train_loss": -27.886920928955078, "global_step": 41690, "epoch": 344} {"train_loss": -28.221221923828125, "global_step": 41691, "epoch": 344} {"train_loss": -32.57533645629883, "global_step": 41692, "epoch": 344} {"train_loss": -24.5092716217041, "global_step": 41693, "epoch": 344} {"train_loss": -25.635543823242188, "global_step": 41694, "epoch": 344} {"train_loss": -30.1420841217041, "global_step": 41695, "epoch": 344} {"train_loss": -26.463586807250977, "global_step": 41696, "epoch": 344} {"train_loss": -32.39400100708008, "global_step": 41697, "epoch": 344} {"train_loss": -29.383743286132812, "global_step": 41698, "epoch": 344} {"train_loss": -30.058338165283203, "global_step": 41699, "epoch": 344} {"train_loss": -27.159265518188477, "global_step": 41700, "epoch": 344} {"train_loss": -31.53412437438965, "global_step": 41701, "epoch": 344} {"train_loss": -29.686710357666016, "global_step": 41702, "epoch": 344} {"train_loss": -30.12446403503418, "global_step": 41703, "epoch": 344} {"train_loss": -32.14188766479492, "global_step": 41704, "epoch": 344} {"train_loss": -31.723783493041992, "global_step": 41705, "epoch": 344} {"train_loss": -30.478612899780273, "global_step": 41706, "epoch": 344} {"train_loss": -31.48940086364746, "global_step": 41707, "epoch": 344} {"train_loss": -31.737735748291016, "global_step": 41708, "epoch": 344} {"train_loss": -31.523223876953125, "global_step": 41709, "epoch": 344} {"train_loss": -32.37411117553711, "global_step": 41710, "epoch": 344} {"train_loss": -32.09291076660156, "global_step": 41711, "epoch": 344} {"train_loss": -31.85658073425293, "global_step": 41712, "epoch": 344} {"train_loss": -31.983963012695312, "global_step": 41713, "epoch": 344} {"train_loss": -32.531219482421875, "global_step": 41714, "epoch": 344} {"train_loss": -31.743255615234375, "global_step": 41715, "epoch": 344} {"train_loss": -32.54475021362305, "global_step": 41716, "epoch": 344} {"train_loss": -32.21334457397461, "global_step": 41717, "epoch": 344} {"train_loss": -32.376319885253906, "global_step": 41718, "epoch": 344} {"train_loss": -32.7094841003418, "global_step": 41719, "epoch": 344} {"train_loss": -32.2905387878418, "global_step": 41720, "epoch": 344} {"train_loss": -32.734676361083984, "global_step": 41721, "epoch": 344} {"train_loss": -32.472408294677734, "global_step": 41722, "epoch": 344} {"train_loss": -32.98580551147461, "global_step": 41723, "epoch": 344} {"train_loss": -32.65859603881836, "global_step": 41724, "epoch": 344} {"train_loss": -32.90665054321289, "global_step": 41725, "epoch": 344} {"train_loss": -33.65645217895508, "global_step": 41726, "epoch": 344} {"train_loss": -33.10188674926758, "global_step": 41727, "epoch": 344} {"train_loss": -33.531436920166016, "global_step": 41728, "epoch": 344} {"train_loss": -33.1989860534668, "global_step": 41729, "epoch": 344} {"train_loss": -32.7905387878418, "global_step": 41730, "epoch": 344} {"train_loss": -33.26428985595703, "global_step": 41731, "epoch": 344} {"train_loss": -33.17695236206055, "global_step": 41732, "epoch": 344} {"train_loss": -33.584877014160156, "global_step": 41733, "epoch": 344} {"train_loss": -33.53208541870117, "global_step": 41734, "epoch": 344} {"train_loss": -33.71279525756836, "global_step": 41735, "epoch": 344} {"train_loss": -34.12575912475586, "global_step": 41736, "epoch": 344} {"train_loss": -33.580665588378906, "global_step": 41737, "epoch": 344} {"train_loss": -33.53721618652344, "global_step": 41738, "epoch": 344} {"train_loss": -33.96088790893555, "global_step": 41739, "epoch": 344} {"train_loss": -33.91449737548828, "global_step": 41740, "epoch": 344} {"train_loss": -33.897987365722656, "global_step": 41741, "epoch": 344} {"train_loss": -33.96232986450195, "global_step": 41742, "epoch": 344} {"train_loss": -34.125938415527344, "global_step": 41743, "epoch": 344} {"train_loss": -32.941250241492405, "global_step": 41744, "epoch": 344, "val_loss": 2596356.25} {"train_loss": -33.935909271240234, "global_step": 41745, "epoch": 345} {"train_loss": -33.74238967895508, "global_step": 41746, "epoch": 345} {"train_loss": -33.92957305908203, "global_step": 41747, "epoch": 345} {"train_loss": -34.55540084838867, "global_step": 41748, "epoch": 345} {"train_loss": -34.350833892822266, "global_step": 41749, "epoch": 345} {"train_loss": -34.5136604309082, "global_step": 41750, "epoch": 345} {"train_loss": -34.367183685302734, "global_step": 41751, "epoch": 345} {"train_loss": -34.201053619384766, "global_step": 41752, "epoch": 345} {"train_loss": -34.89422607421875, "global_step": 41753, "epoch": 345} {"train_loss": -34.56400680541992, "global_step": 41754, "epoch": 345} {"train_loss": -34.962921142578125, "global_step": 41755, "epoch": 345} {"train_loss": -34.70405960083008, "global_step": 41756, "epoch": 345} {"train_loss": -34.409175872802734, "global_step": 41757, "epoch": 345} {"train_loss": -34.38252639770508, "global_step": 41758, "epoch": 345} {"train_loss": -34.76570129394531, "global_step": 41759, "epoch": 345} {"train_loss": -35.1022834777832, "global_step": 41760, "epoch": 345} {"train_loss": -34.252803802490234, "global_step": 41761, "epoch": 345} {"train_loss": -34.66178512573242, "global_step": 41762, "epoch": 345} {"train_loss": -34.88910675048828, "global_step": 41763, "epoch": 345} {"train_loss": -35.15997314453125, "global_step": 41764, "epoch": 345} {"train_loss": -35.01997756958008, "global_step": 41765, "epoch": 345} {"train_loss": -35.339813232421875, "global_step": 41766, "epoch": 345} {"train_loss": -34.995174407958984, "global_step": 41767, "epoch": 345} {"train_loss": -35.15768814086914, "global_step": 41768, "epoch": 345} {"train_loss": -35.10653305053711, "global_step": 41769, "epoch": 345} {"train_loss": -34.5003776550293, "global_step": 41770, "epoch": 345} {"train_loss": -34.345333099365234, "global_step": 41771, "epoch": 345} {"train_loss": -35.22920608520508, "global_step": 41772, "epoch": 345} {"train_loss": -35.0880012512207, "global_step": 41773, "epoch": 345} {"train_loss": -34.8061637878418, "global_step": 41774, "epoch": 345} {"train_loss": -34.29572296142578, "global_step": 41775, "epoch": 345} {"train_loss": -34.24469757080078, "global_step": 41776, "epoch": 345} {"train_loss": -34.89521408081055, "global_step": 41777, "epoch": 345} {"train_loss": -35.57484817504883, "global_step": 41778, "epoch": 345} {"train_loss": -33.585994720458984, "global_step": 41779, "epoch": 345} {"train_loss": -30.73423194885254, "global_step": 41780, "epoch": 345} {"train_loss": -30.742639541625977, "global_step": 41781, "epoch": 345} {"train_loss": -32.515594482421875, "global_step": 41782, "epoch": 345} {"train_loss": -29.41927146911621, "global_step": 41783, "epoch": 345} {"train_loss": -33.07838439941406, "global_step": 41784, "epoch": 345} {"train_loss": -27.195362091064453, "global_step": 41785, "epoch": 345} {"train_loss": -26.5194091796875, "global_step": 41786, "epoch": 345} {"train_loss": -27.208545684814453, "global_step": 41787, "epoch": 345} {"train_loss": -26.877592086791992, "global_step": 41788, "epoch": 345} {"train_loss": -27.222522735595703, "global_step": 41789, "epoch": 345} {"train_loss": -26.202253341674805, "global_step": 41790, "epoch": 345} {"train_loss": -29.152631759643555, "global_step": 41791, "epoch": 345} {"train_loss": -25.960763931274414, "global_step": 41792, "epoch": 345} {"train_loss": -27.00094985961914, "global_step": 41793, "epoch": 345} {"train_loss": -26.131072998046875, "global_step": 41794, "epoch": 345} {"train_loss": -19.796586990356445, "global_step": 41795, "epoch": 345} {"train_loss": -27.7219181060791, "global_step": 41796, "epoch": 345} {"train_loss": -24.039670944213867, "global_step": 41797, "epoch": 345} {"train_loss": -26.019287109375, "global_step": 41798, "epoch": 345} {"train_loss": -28.75667381286621, "global_step": 41799, "epoch": 345} {"train_loss": -25.3998966217041, "global_step": 41800, "epoch": 345} {"train_loss": -28.693435668945312, "global_step": 41801, "epoch": 345} {"train_loss": -28.749719619750977, "global_step": 41802, "epoch": 345} {"train_loss": -28.15506935119629, "global_step": 41803, "epoch": 345} {"train_loss": -27.790359497070312, "global_step": 41804, "epoch": 345} {"train_loss": -29.408151626586914, "global_step": 41805, "epoch": 345} {"train_loss": -29.03671646118164, "global_step": 41806, "epoch": 345} {"train_loss": -30.032068252563477, "global_step": 41807, "epoch": 345} {"train_loss": -29.333444595336914, "global_step": 41808, "epoch": 345} {"train_loss": -29.975570678710938, "global_step": 41809, "epoch": 345} {"train_loss": -30.95795249938965, "global_step": 41810, "epoch": 345} {"train_loss": -30.51633644104004, "global_step": 41811, "epoch": 345} {"train_loss": -30.875646591186523, "global_step": 41812, "epoch": 345} {"train_loss": -31.18073081970215, "global_step": 41813, "epoch": 345} {"train_loss": -31.48866844177246, "global_step": 41814, "epoch": 345} {"train_loss": -31.346847534179688, "global_step": 41815, "epoch": 345} {"train_loss": -31.61565589904785, "global_step": 41816, "epoch": 345} {"train_loss": -31.59577751159668, "global_step": 41817, "epoch": 345} {"train_loss": -31.922895431518555, "global_step": 41818, "epoch": 345} {"train_loss": -32.09199142456055, "global_step": 41819, "epoch": 345} {"train_loss": -32.03475570678711, "global_step": 41820, "epoch": 345} {"train_loss": -32.659175872802734, "global_step": 41821, "epoch": 345} {"train_loss": -32.38265609741211, "global_step": 41822, "epoch": 345} {"train_loss": -31.9729061126709, "global_step": 41823, "epoch": 345} {"train_loss": -30.666400909423828, "global_step": 41824, "epoch": 345} {"train_loss": -29.817596435546875, "global_step": 41825, "epoch": 345} {"train_loss": -32.23125076293945, "global_step": 41826, "epoch": 345} {"train_loss": -31.976856231689453, "global_step": 41827, "epoch": 345} {"train_loss": -32.1005744934082, "global_step": 41828, "epoch": 345} {"train_loss": -32.587581634521484, "global_step": 41829, "epoch": 345} {"train_loss": -31.258710861206055, "global_step": 41830, "epoch": 345} {"train_loss": -29.4465274810791, "global_step": 41831, "epoch": 345} {"train_loss": -16.454849243164062, "global_step": 41832, "epoch": 345} {"train_loss": -7.983525276184082, "global_step": 41833, "epoch": 345} {"train_loss": -30.523059844970703, "global_step": 41834, "epoch": 345} {"train_loss": -21.611364364624023, "global_step": 41835, "epoch": 345} {"train_loss": -32.63612747192383, "global_step": 41836, "epoch": 345} {"train_loss": -26.009748458862305, "global_step": 41837, "epoch": 345} {"train_loss": -28.055164337158203, "global_step": 41838, "epoch": 345} {"train_loss": -32.50429153442383, "global_step": 41839, "epoch": 345} {"train_loss": -29.45009422302246, "global_step": 41840, "epoch": 345} {"train_loss": -29.027896881103516, "global_step": 41841, "epoch": 345} {"train_loss": -31.22308349609375, "global_step": 41842, "epoch": 345} {"train_loss": -32.32285690307617, "global_step": 41843, "epoch": 345} {"train_loss": -31.262205123901367, "global_step": 41844, "epoch": 345} {"train_loss": -30.621572494506836, "global_step": 41845, "epoch": 345} {"train_loss": -31.117389678955078, "global_step": 41846, "epoch": 345} {"train_loss": -32.036922454833984, "global_step": 41847, "epoch": 345} {"train_loss": -32.68667221069336, "global_step": 41848, "epoch": 345} {"train_loss": -32.12296676635742, "global_step": 41849, "epoch": 345} {"train_loss": -31.419147491455078, "global_step": 41850, "epoch": 345} {"train_loss": -32.14572525024414, "global_step": 41851, "epoch": 345} {"train_loss": -31.642255783081055, "global_step": 41852, "epoch": 345} {"train_loss": -27.167449951171875, "global_step": 41853, "epoch": 345} {"train_loss": -32.0855598449707, "global_step": 41854, "epoch": 345} {"train_loss": -32.055755615234375, "global_step": 41855, "epoch": 345} {"train_loss": -31.908300399780273, "global_step": 41856, "epoch": 345} {"train_loss": -30.8051700592041, "global_step": 41857, "epoch": 345} {"train_loss": -30.79867935180664, "global_step": 41858, "epoch": 345} {"train_loss": -32.59879684448242, "global_step": 41859, "epoch": 345} {"train_loss": -31.848203659057617, "global_step": 41860, "epoch": 345} {"train_loss": -31.200244903564453, "global_step": 41861, "epoch": 345} {"train_loss": -31.991180419921875, "global_step": 41862, "epoch": 345} {"train_loss": -32.04179763793945, "global_step": 41863, "epoch": 345} {"train_loss": -30.695409774780273, "global_step": 41864, "epoch": 345} {"train_loss": -31.022726208710473, "global_step": 41865, "epoch": 345, "val_loss": 2333545.75} {"train_loss": -31.038043975830078, "global_step": 41866, "epoch": 346} {"train_loss": -31.96180534362793, "global_step": 41867, "epoch": 346} {"train_loss": -31.995275497436523, "global_step": 41868, "epoch": 346} {"train_loss": -31.688861846923828, "global_step": 41869, "epoch": 346} {"train_loss": -32.12431716918945, "global_step": 41870, "epoch": 346} {"train_loss": -31.9620304107666, "global_step": 41871, "epoch": 346} {"train_loss": -31.155710220336914, "global_step": 41872, "epoch": 346} {"train_loss": -32.06221389770508, "global_step": 41873, "epoch": 346} {"train_loss": -31.41971778869629, "global_step": 41874, "epoch": 346} {"train_loss": -31.55792236328125, "global_step": 41875, "epoch": 346} {"train_loss": -32.28658676147461, "global_step": 41876, "epoch": 346} {"train_loss": -31.65237808227539, "global_step": 41877, "epoch": 346} {"train_loss": -31.410375595092773, "global_step": 41878, "epoch": 346} {"train_loss": -32.17829132080078, "global_step": 41879, "epoch": 346} {"train_loss": -32.1141242980957, "global_step": 41880, "epoch": 346} {"train_loss": -32.04200744628906, "global_step": 41881, "epoch": 346} {"train_loss": -32.11745834350586, "global_step": 41882, "epoch": 346} {"train_loss": -31.19000816345215, "global_step": 41883, "epoch": 346} {"train_loss": -31.961816787719727, "global_step": 41884, "epoch": 346} {"train_loss": -32.034915924072266, "global_step": 41885, "epoch": 346} {"train_loss": -32.678985595703125, "global_step": 41886, "epoch": 346} {"train_loss": -32.09856033325195, "global_step": 41887, "epoch": 346} {"train_loss": -32.09027862548828, "global_step": 41888, "epoch": 346} {"train_loss": -32.5771484375, "global_step": 41889, "epoch": 346} {"train_loss": -31.78179359436035, "global_step": 41890, "epoch": 346} {"train_loss": -31.97833824157715, "global_step": 41891, "epoch": 346} {"train_loss": -32.71891403198242, "global_step": 41892, "epoch": 346} {"train_loss": -32.56329345703125, "global_step": 41893, "epoch": 346} {"train_loss": -32.39934539794922, "global_step": 41894, "epoch": 346} {"train_loss": -33.05318832397461, "global_step": 41895, "epoch": 346} {"train_loss": -33.26041793823242, "global_step": 41896, "epoch": 346} {"train_loss": -32.705989837646484, "global_step": 41897, "epoch": 346} {"train_loss": -32.52861404418945, "global_step": 41898, "epoch": 346} {"train_loss": -32.5878791809082, "global_step": 41899, "epoch": 346} {"train_loss": -32.95941925048828, "global_step": 41900, "epoch": 346} {"train_loss": -32.7112922668457, "global_step": 41901, "epoch": 346} {"train_loss": -33.12458801269531, "global_step": 41902, "epoch": 346} {"train_loss": -32.8092041015625, "global_step": 41903, "epoch": 346} {"train_loss": -32.29635238647461, "global_step": 41904, "epoch": 346} {"train_loss": -32.66569900512695, "global_step": 41905, "epoch": 346} {"train_loss": -32.94084548950195, "global_step": 41906, "epoch": 346} {"train_loss": -33.04901123046875, "global_step": 41907, "epoch": 346} {"train_loss": -33.24705123901367, "global_step": 41908, "epoch": 346} {"train_loss": -32.43017578125, "global_step": 41909, "epoch": 346} {"train_loss": -33.506011962890625, "global_step": 41910, "epoch": 346} {"train_loss": -33.26469802856445, "global_step": 41911, "epoch": 346} {"train_loss": -33.12302780151367, "global_step": 41912, "epoch": 346} {"train_loss": -32.44800567626953, "global_step": 41913, "epoch": 346} {"train_loss": -32.00857162475586, "global_step": 41914, "epoch": 346} {"train_loss": -29.580297470092773, "global_step": 41915, "epoch": 346} {"train_loss": -16.524673461914062, "global_step": 41916, "epoch": 346} {"train_loss": 3.976095676422119, "global_step": 41917, "epoch": 346} {"train_loss": -28.62360191345215, "global_step": 41918, "epoch": 346} {"train_loss": -6.150091648101807, "global_step": 41919, "epoch": 346} {"train_loss": -31.815845489501953, "global_step": 41920, "epoch": 346} {"train_loss": -17.021575927734375, "global_step": 41921, "epoch": 346} {"train_loss": -23.66839599609375, "global_step": 41922, "epoch": 346} {"train_loss": -30.486886978149414, "global_step": 41923, "epoch": 346} {"train_loss": -26.061227798461914, "global_step": 41924, "epoch": 346} {"train_loss": -24.722646713256836, "global_step": 41925, "epoch": 346} {"train_loss": -29.552106857299805, "global_step": 41926, "epoch": 346} {"train_loss": -31.834192276000977, "global_step": 41927, "epoch": 346} {"train_loss": -29.0628662109375, "global_step": 41928, "epoch": 346} {"train_loss": -29.548654556274414, "global_step": 41929, "epoch": 346} {"train_loss": -30.030719757080078, "global_step": 41930, "epoch": 346} {"train_loss": -30.575225830078125, "global_step": 41931, "epoch": 346} {"train_loss": -31.366962432861328, "global_step": 41932, "epoch": 346} {"train_loss": -31.509992599487305, "global_step": 41933, "epoch": 346} {"train_loss": -31.484577178955078, "global_step": 41934, "epoch": 346} {"train_loss": -30.98785400390625, "global_step": 41935, "epoch": 346} {"train_loss": -31.185733795166016, "global_step": 41936, "epoch": 346} {"train_loss": -29.92124366760254, "global_step": 41937, "epoch": 346} {"train_loss": -31.36383056640625, "global_step": 41938, "epoch": 346} {"train_loss": -31.822772979736328, "global_step": 41939, "epoch": 346} {"train_loss": -31.767547607421875, "global_step": 41940, "epoch": 346} {"train_loss": -31.930191040039062, "global_step": 41941, "epoch": 346} {"train_loss": -32.12985610961914, "global_step": 41942, "epoch": 346} {"train_loss": -32.41194152832031, "global_step": 41943, "epoch": 346} {"train_loss": -32.1807861328125, "global_step": 41944, "epoch": 346} {"train_loss": -31.983068466186523, "global_step": 41945, "epoch": 346} {"train_loss": -31.807214736938477, "global_step": 41946, "epoch": 346} {"train_loss": -31.85040283203125, "global_step": 41947, "epoch": 346} {"train_loss": -32.28962707519531, "global_step": 41948, "epoch": 346} {"train_loss": -32.483154296875, "global_step": 41949, "epoch": 346} {"train_loss": -32.51215362548828, "global_step": 41950, "epoch": 346} {"train_loss": -32.49025344848633, "global_step": 41951, "epoch": 346} {"train_loss": -32.63956832885742, "global_step": 41952, "epoch": 346} {"train_loss": -31.01220703125, "global_step": 41953, "epoch": 346} {"train_loss": -32.262332916259766, "global_step": 41954, "epoch": 346} {"train_loss": -32.739933013916016, "global_step": 41955, "epoch": 346} {"train_loss": -32.43130111694336, "global_step": 41956, "epoch": 346} {"train_loss": -32.210540771484375, "global_step": 41957, "epoch": 346} {"train_loss": -31.995229721069336, "global_step": 41958, "epoch": 346} {"train_loss": -31.910078048706055, "global_step": 41959, "epoch": 346} {"train_loss": -32.8193473815918, "global_step": 41960, "epoch": 346} {"train_loss": -32.48680877685547, "global_step": 41961, "epoch": 346} {"train_loss": -32.235897064208984, "global_step": 41962, "epoch": 346} {"train_loss": -32.8313102722168, "global_step": 41963, "epoch": 346} {"train_loss": -32.50762939453125, "global_step": 41964, "epoch": 346} {"train_loss": -31.973983764648438, "global_step": 41965, "epoch": 346} {"train_loss": -31.86701011657715, "global_step": 41966, "epoch": 346} {"train_loss": -31.40064811706543, "global_step": 41967, "epoch": 346} {"train_loss": -30.48370361328125, "global_step": 41968, "epoch": 346} {"train_loss": -31.892972946166992, "global_step": 41969, "epoch": 346} {"train_loss": -33.180233001708984, "global_step": 41970, "epoch": 346} {"train_loss": -32.00212478637695, "global_step": 41971, "epoch": 346} {"train_loss": -32.04127883911133, "global_step": 41972, "epoch": 346} {"train_loss": -32.42869567871094, "global_step": 41973, "epoch": 346} {"train_loss": -32.205379486083984, "global_step": 41974, "epoch": 346} {"train_loss": -31.664142608642578, "global_step": 41975, "epoch": 346} {"train_loss": -32.36105728149414, "global_step": 41976, "epoch": 346} {"train_loss": -31.62517738342285, "global_step": 41977, "epoch": 346} {"train_loss": -32.672157287597656, "global_step": 41978, "epoch": 346} {"train_loss": -31.3868350982666, "global_step": 41979, "epoch": 346} {"train_loss": -32.46274948120117, "global_step": 41980, "epoch": 346} {"train_loss": -32.72809982299805, "global_step": 41981, "epoch": 346} {"train_loss": -32.05612564086914, "global_step": 41982, "epoch": 346} {"train_loss": -33.184635162353516, "global_step": 41983, "epoch": 346} {"train_loss": -32.3535041809082, "global_step": 41984, "epoch": 346} {"train_loss": -32.563232421875, "global_step": 41985, "epoch": 346} {"train_loss": -31.056372067159856, "global_step": 41986, "epoch": 346, "val_loss": 2401195.25} {"train_loss": -32.5732307434082, "global_step": 41987, "epoch": 347} {"train_loss": -32.437835693359375, "global_step": 41988, "epoch": 347} {"train_loss": -32.51507568359375, "global_step": 41989, "epoch": 347} {"train_loss": -32.42403793334961, "global_step": 41990, "epoch": 347} {"train_loss": -32.54655075073242, "global_step": 41991, "epoch": 347} {"train_loss": -32.056758880615234, "global_step": 41992, "epoch": 347} {"train_loss": -32.38544464111328, "global_step": 41993, "epoch": 347} {"train_loss": -31.57953453063965, "global_step": 41994, "epoch": 347} {"train_loss": -31.3807315826416, "global_step": 41995, "epoch": 347} {"train_loss": -30.68536949157715, "global_step": 41996, "epoch": 347} {"train_loss": -31.305973052978516, "global_step": 41997, "epoch": 347} {"train_loss": -30.9495906829834, "global_step": 41998, "epoch": 347} {"train_loss": -32.727333068847656, "global_step": 41999, "epoch": 347} {"train_loss": -32.5547981262207, "global_step": 42000, "epoch": 347} {"train_loss": -32.08919906616211, "global_step": 42001, "epoch": 347} {"train_loss": -30.66228675842285, "global_step": 42002, "epoch": 347} {"train_loss": -31.734079360961914, "global_step": 42003, "epoch": 347} {"train_loss": -32.571571350097656, "global_step": 42004, "epoch": 347} {"train_loss": -32.48850631713867, "global_step": 42005, "epoch": 347} {"train_loss": -31.198450088500977, "global_step": 42006, "epoch": 347} {"train_loss": -32.2739372253418, "global_step": 42007, "epoch": 347} {"train_loss": -33.14888381958008, "global_step": 42008, "epoch": 347} {"train_loss": -31.124753952026367, "global_step": 42009, "epoch": 347} {"train_loss": -31.773008346557617, "global_step": 42010, "epoch": 347} {"train_loss": -33.2430534362793, "global_step": 42011, "epoch": 347} {"train_loss": -32.00544357299805, "global_step": 42012, "epoch": 347} {"train_loss": -32.28974151611328, "global_step": 42013, "epoch": 347} {"train_loss": -33.021629333496094, "global_step": 42014, "epoch": 347} {"train_loss": -32.09419250488281, "global_step": 42015, "epoch": 347} {"train_loss": -33.437660217285156, "global_step": 42016, "epoch": 347} {"train_loss": -32.97150421142578, "global_step": 42017, "epoch": 347} {"train_loss": -32.94118881225586, "global_step": 42018, "epoch": 347} {"train_loss": -33.21337890625, "global_step": 42019, "epoch": 347} {"train_loss": -32.78749084472656, "global_step": 42020, "epoch": 347} {"train_loss": -33.26302719116211, "global_step": 42021, "epoch": 347} {"train_loss": -33.077392578125, "global_step": 42022, "epoch": 347} {"train_loss": -32.93742752075195, "global_step": 42023, "epoch": 347} {"train_loss": -33.11014938354492, "global_step": 42024, "epoch": 347} {"train_loss": -32.94772720336914, "global_step": 42025, "epoch": 347} {"train_loss": -33.1963996887207, "global_step": 42026, "epoch": 347} {"train_loss": -33.50825500488281, "global_step": 42027, "epoch": 347} {"train_loss": -32.527645111083984, "global_step": 42028, "epoch": 347} {"train_loss": -32.666934967041016, "global_step": 42029, "epoch": 347} {"train_loss": -32.80778121948242, "global_step": 42030, "epoch": 347} {"train_loss": -33.02827453613281, "global_step": 42031, "epoch": 347} {"train_loss": -33.506439208984375, "global_step": 42032, "epoch": 347} {"train_loss": -32.80952072143555, "global_step": 42033, "epoch": 347} {"train_loss": -33.55559158325195, "global_step": 42034, "epoch": 347} {"train_loss": -33.24928665161133, "global_step": 42035, "epoch": 347} {"train_loss": -32.7911376953125, "global_step": 42036, "epoch": 347} {"train_loss": -32.977291107177734, "global_step": 42037, "epoch": 347} {"train_loss": -33.515438079833984, "global_step": 42038, "epoch": 347} {"train_loss": -33.06196975708008, "global_step": 42039, "epoch": 347} {"train_loss": -32.8976936340332, "global_step": 42040, "epoch": 347} {"train_loss": -33.27120590209961, "global_step": 42041, "epoch": 347} {"train_loss": -33.34108352661133, "global_step": 42042, "epoch": 347} {"train_loss": -32.85802459716797, "global_step": 42043, "epoch": 347} {"train_loss": -33.398006439208984, "global_step": 42044, "epoch": 347} {"train_loss": -32.5265998840332, "global_step": 42045, "epoch": 347} {"train_loss": -33.06563186645508, "global_step": 42046, "epoch": 347} {"train_loss": -32.63161849975586, "global_step": 42047, "epoch": 347} {"train_loss": -32.0648193359375, "global_step": 42048, "epoch": 347} {"train_loss": -30.058929443359375, "global_step": 42049, "epoch": 347} {"train_loss": -26.64453125, "global_step": 42050, "epoch": 347} {"train_loss": -26.821577072143555, "global_step": 42051, "epoch": 347} {"train_loss": -29.632328033447266, "global_step": 42052, "epoch": 347} {"train_loss": -26.6297664642334, "global_step": 42053, "epoch": 347} {"train_loss": -30.10359001159668, "global_step": 42054, "epoch": 347} {"train_loss": -29.375869750976562, "global_step": 42055, "epoch": 347} {"train_loss": -31.605976104736328, "global_step": 42056, "epoch": 347} {"train_loss": -28.943866729736328, "global_step": 42057, "epoch": 347} {"train_loss": -31.537841796875, "global_step": 42058, "epoch": 347} {"train_loss": -30.999059677124023, "global_step": 42059, "epoch": 347} {"train_loss": -31.491331100463867, "global_step": 42060, "epoch": 347} {"train_loss": -30.669971466064453, "global_step": 42061, "epoch": 347} {"train_loss": -31.208044052124023, "global_step": 42062, "epoch": 347} {"train_loss": -30.898731231689453, "global_step": 42063, "epoch": 347} {"train_loss": -32.06254959106445, "global_step": 42064, "epoch": 347} {"train_loss": -31.001148223876953, "global_step": 42065, "epoch": 347} {"train_loss": -31.371479034423828, "global_step": 42066, "epoch": 347} {"train_loss": -31.582244873046875, "global_step": 42067, "epoch": 347} {"train_loss": -31.7065372467041, "global_step": 42068, "epoch": 347} {"train_loss": -31.713214874267578, "global_step": 42069, "epoch": 347} {"train_loss": -32.0719108581543, "global_step": 42070, "epoch": 347} {"train_loss": -31.648550033569336, "global_step": 42071, "epoch": 347} {"train_loss": -31.586395263671875, "global_step": 42072, "epoch": 347} {"train_loss": -31.823400497436523, "global_step": 42073, "epoch": 347} {"train_loss": -32.57894515991211, "global_step": 42074, "epoch": 347} {"train_loss": -32.38833236694336, "global_step": 42075, "epoch": 347} {"train_loss": -32.74473190307617, "global_step": 42076, "epoch": 347} {"train_loss": -32.48973083496094, "global_step": 42077, "epoch": 347} {"train_loss": -31.920297622680664, "global_step": 42078, "epoch": 347} {"train_loss": -32.24990463256836, "global_step": 42079, "epoch": 347} {"train_loss": -32.74224853515625, "global_step": 42080, "epoch": 347} {"train_loss": -32.403785705566406, "global_step": 42081, "epoch": 347} {"train_loss": -32.92854690551758, "global_step": 42082, "epoch": 347} {"train_loss": -32.67271041870117, "global_step": 42083, "epoch": 347} {"train_loss": -31.98902702331543, "global_step": 42084, "epoch": 347} {"train_loss": -32.7059440612793, "global_step": 42085, "epoch": 347} {"train_loss": -32.67094802856445, "global_step": 42086, "epoch": 347} {"train_loss": -32.702022552490234, "global_step": 42087, "epoch": 347} {"train_loss": -32.524757385253906, "global_step": 42088, "epoch": 347} {"train_loss": -32.75742721557617, "global_step": 42089, "epoch": 347} {"train_loss": -33.089359283447266, "global_step": 42090, "epoch": 347} {"train_loss": -32.894561767578125, "global_step": 42091, "epoch": 347} {"train_loss": -33.23006820678711, "global_step": 42092, "epoch": 347} {"train_loss": -32.632354736328125, "global_step": 42093, "epoch": 347} {"train_loss": -33.207759857177734, "global_step": 42094, "epoch": 347} {"train_loss": -32.096153259277344, "global_step": 42095, "epoch": 347} {"train_loss": -32.3957633972168, "global_step": 42096, "epoch": 347} {"train_loss": -33.288387298583984, "global_step": 42097, "epoch": 347} {"train_loss": -32.22134017944336, "global_step": 42098, "epoch": 347} {"train_loss": -33.19758605957031, "global_step": 42099, "epoch": 347} {"train_loss": -32.989139556884766, "global_step": 42100, "epoch": 347} {"train_loss": -32.3756217956543, "global_step": 42101, "epoch": 347} {"train_loss": -32.49135971069336, "global_step": 42102, "epoch": 347} {"train_loss": -29.28025245666504, "global_step": 42103, "epoch": 347} {"train_loss": -23.826955795288086, "global_step": 42104, "epoch": 347} {"train_loss": -20.997236251831055, "global_step": 42105, "epoch": 347} {"train_loss": -30.095312118530273, "global_step": 42106, "epoch": 347} {"train_loss": -31.93724728418776, "global_step": 42107, "epoch": 347, "val_loss": 2338205.25} {"train_loss": -28.288522720336914, "global_step": 42108, "epoch": 348} {"train_loss": -32.672637939453125, "global_step": 42109, "epoch": 348} {"train_loss": -29.537403106689453, "global_step": 42110, "epoch": 348} {"train_loss": -31.407419204711914, "global_step": 42111, "epoch": 348} {"train_loss": -31.108572006225586, "global_step": 42112, "epoch": 348} {"train_loss": -31.175573348999023, "global_step": 42113, "epoch": 348} {"train_loss": -33.115440368652344, "global_step": 42114, "epoch": 348} {"train_loss": -30.37505531311035, "global_step": 42115, "epoch": 348} {"train_loss": -32.63507843017578, "global_step": 42116, "epoch": 348} {"train_loss": -28.2210636138916, "global_step": 42117, "epoch": 348} {"train_loss": -31.79107093811035, "global_step": 42118, "epoch": 348} {"train_loss": -32.18361282348633, "global_step": 42119, "epoch": 348} {"train_loss": -32.545806884765625, "global_step": 42120, "epoch": 348} {"train_loss": -32.32268142700195, "global_step": 42121, "epoch": 348} {"train_loss": -28.82472038269043, "global_step": 42122, "epoch": 348} {"train_loss": -31.783618927001953, "global_step": 42123, "epoch": 348} {"train_loss": -32.616024017333984, "global_step": 42124, "epoch": 348} {"train_loss": -32.315921783447266, "global_step": 42125, "epoch": 348} {"train_loss": -32.146949768066406, "global_step": 42126, "epoch": 348} {"train_loss": -29.8662109375, "global_step": 42127, "epoch": 348} {"train_loss": -32.49406814575195, "global_step": 42128, "epoch": 348} {"train_loss": -31.021039962768555, "global_step": 42129, "epoch": 348} {"train_loss": -32.15240478515625, "global_step": 42130, "epoch": 348} {"train_loss": -32.11137771606445, "global_step": 42131, "epoch": 348} {"train_loss": -32.48069381713867, "global_step": 42132, "epoch": 348} {"train_loss": -32.520511627197266, "global_step": 42133, "epoch": 348} {"train_loss": -32.708778381347656, "global_step": 42134, "epoch": 348} {"train_loss": -30.858551025390625, "global_step": 42135, "epoch": 348} {"train_loss": -32.291011810302734, "global_step": 42136, "epoch": 348} {"train_loss": -31.85699462890625, "global_step": 42137, "epoch": 348} {"train_loss": -30.8984375, "global_step": 42138, "epoch": 348} {"train_loss": -31.931848526000977, "global_step": 42139, "epoch": 348} {"train_loss": -31.900876998901367, "global_step": 42140, "epoch": 348} {"train_loss": -32.370452880859375, "global_step": 42141, "epoch": 348} {"train_loss": -32.91971969604492, "global_step": 42142, "epoch": 348} {"train_loss": -32.50311279296875, "global_step": 42143, "epoch": 348} {"train_loss": -32.51587677001953, "global_step": 42144, "epoch": 348} {"train_loss": -32.54264450073242, "global_step": 42145, "epoch": 348} {"train_loss": -32.839988708496094, "global_step": 42146, "epoch": 348} {"train_loss": -32.332881927490234, "global_step": 42147, "epoch": 348} {"train_loss": -32.17350769042969, "global_step": 42148, "epoch": 348} {"train_loss": -32.02888107299805, "global_step": 42149, "epoch": 348} {"train_loss": -32.06137466430664, "global_step": 42150, "epoch": 348} {"train_loss": -32.78813171386719, "global_step": 42151, "epoch": 348} {"train_loss": -32.440643310546875, "global_step": 42152, "epoch": 348} {"train_loss": -32.214027404785156, "global_step": 42153, "epoch": 348} {"train_loss": -31.965576171875, "global_step": 42154, "epoch": 348} {"train_loss": -32.106971740722656, "global_step": 42155, "epoch": 348} {"train_loss": -33.13644790649414, "global_step": 42156, "epoch": 348} {"train_loss": -33.423255920410156, "global_step": 42157, "epoch": 348} {"train_loss": -32.95024490356445, "global_step": 42158, "epoch": 348} {"train_loss": -32.25593185424805, "global_step": 42159, "epoch": 348} {"train_loss": -33.23963165283203, "global_step": 42160, "epoch": 348} {"train_loss": -33.574684143066406, "global_step": 42161, "epoch": 348} {"train_loss": -33.10227584838867, "global_step": 42162, "epoch": 348} {"train_loss": -33.1919059753418, "global_step": 42163, "epoch": 348} {"train_loss": -33.19013214111328, "global_step": 42164, "epoch": 348} {"train_loss": -33.3206901550293, "global_step": 42165, "epoch": 348} {"train_loss": -33.779335021972656, "global_step": 42166, "epoch": 348} {"train_loss": -33.58442306518555, "global_step": 42167, "epoch": 348} {"train_loss": -33.477108001708984, "global_step": 42168, "epoch": 348} {"train_loss": -33.975765228271484, "global_step": 42169, "epoch": 348} {"train_loss": -33.93354034423828, "global_step": 42170, "epoch": 348} {"train_loss": -33.34225845336914, "global_step": 42171, "epoch": 348} {"train_loss": -33.80256271362305, "global_step": 42172, "epoch": 348} {"train_loss": -33.843719482421875, "global_step": 42173, "epoch": 348} {"train_loss": -33.93077087402344, "global_step": 42174, "epoch": 348} {"train_loss": -34.12116622924805, "global_step": 42175, "epoch": 348} {"train_loss": -34.1676139831543, "global_step": 42176, "epoch": 348} {"train_loss": -33.92498016357422, "global_step": 42177, "epoch": 348} {"train_loss": -33.9776496887207, "global_step": 42178, "epoch": 348} {"train_loss": -32.8054313659668, "global_step": 42179, "epoch": 348} {"train_loss": -30.279382705688477, "global_step": 42180, "epoch": 348} {"train_loss": -33.431270599365234, "global_step": 42181, "epoch": 348} {"train_loss": -34.11323165893555, "global_step": 42182, "epoch": 348} {"train_loss": -33.55001449584961, "global_step": 42183, "epoch": 348} {"train_loss": -33.25173568725586, "global_step": 42184, "epoch": 348} {"train_loss": -34.2357063293457, "global_step": 42185, "epoch": 348} {"train_loss": -33.3658561706543, "global_step": 42186, "epoch": 348} {"train_loss": -33.11729049682617, "global_step": 42187, "epoch": 348} {"train_loss": -33.5849723815918, "global_step": 42188, "epoch": 348} {"train_loss": -32.314857482910156, "global_step": 42189, "epoch": 348} {"train_loss": -29.799365997314453, "global_step": 42190, "epoch": 348} {"train_loss": -20.27179527282715, "global_step": 42191, "epoch": 348} {"train_loss": -7.958215236663818, "global_step": 42192, "epoch": 348} {"train_loss": -27.004186630249023, "global_step": 42193, "epoch": 348} {"train_loss": -27.710784912109375, "global_step": 42194, "epoch": 348} {"train_loss": -26.99295997619629, "global_step": 42195, "epoch": 348} {"train_loss": -28.37665367126465, "global_step": 42196, "epoch": 348} {"train_loss": -30.6021785736084, "global_step": 42197, "epoch": 348} {"train_loss": -27.6573429107666, "global_step": 42198, "epoch": 348} {"train_loss": -32.843990325927734, "global_step": 42199, "epoch": 348} {"train_loss": -31.619409561157227, "global_step": 42200, "epoch": 348} {"train_loss": -30.817520141601562, "global_step": 42201, "epoch": 348} {"train_loss": -32.69953536987305, "global_step": 42202, "epoch": 348} {"train_loss": -32.98626708984375, "global_step": 42203, "epoch": 348} {"train_loss": -31.48505210876465, "global_step": 42204, "epoch": 348} {"train_loss": -32.15705490112305, "global_step": 42205, "epoch": 348} {"train_loss": -33.04036331176758, "global_step": 42206, "epoch": 348} {"train_loss": -32.91896438598633, "global_step": 42207, "epoch": 348} {"train_loss": -32.33425521850586, "global_step": 42208, "epoch": 348} {"train_loss": -32.851646423339844, "global_step": 42209, "epoch": 348} {"train_loss": -32.97671127319336, "global_step": 42210, "epoch": 348} {"train_loss": -33.00722885131836, "global_step": 42211, "epoch": 348} {"train_loss": -33.63508224487305, "global_step": 42212, "epoch": 348} {"train_loss": -33.086185455322266, "global_step": 42213, "epoch": 348} {"train_loss": -33.115509033203125, "global_step": 42214, "epoch": 348} {"train_loss": -32.526641845703125, "global_step": 42215, "epoch": 348} {"train_loss": -33.45039749145508, "global_step": 42216, "epoch": 348} {"train_loss": -33.693580627441406, "global_step": 42217, "epoch": 348} {"train_loss": -33.234535217285156, "global_step": 42218, "epoch": 348} {"train_loss": -33.43337631225586, "global_step": 42219, "epoch": 348} {"train_loss": -33.36981201171875, "global_step": 42220, "epoch": 348} {"train_loss": -32.82672882080078, "global_step": 42221, "epoch": 348} {"train_loss": -33.66105651855469, "global_step": 42222, "epoch": 348} {"train_loss": -33.615203857421875, "global_step": 42223, "epoch": 348} {"train_loss": -33.42835235595703, "global_step": 42224, "epoch": 348} {"train_loss": -33.065486907958984, "global_step": 42225, "epoch": 348} {"train_loss": -33.38371276855469, "global_step": 42226, "epoch": 348} {"train_loss": -33.25923538208008, "global_step": 42227, "epoch": 348} {"train_loss": -32.027309650231985, "global_step": 42228, "epoch": 348, "val_loss": 2483649.0} {"train_loss": -32.78792953491211, "global_step": 42229, "epoch": 349} {"train_loss": -31.72934341430664, "global_step": 42230, "epoch": 349} {"train_loss": -31.293272018432617, "global_step": 42231, "epoch": 349} {"train_loss": -32.7789306640625, "global_step": 42232, "epoch": 349} {"train_loss": -32.8685302734375, "global_step": 42233, "epoch": 349} {"train_loss": -30.931970596313477, "global_step": 42234, "epoch": 349} {"train_loss": -32.50985336303711, "global_step": 42235, "epoch": 349} {"train_loss": -33.14210891723633, "global_step": 42236, "epoch": 349} {"train_loss": -30.176279067993164, "global_step": 42237, "epoch": 349} {"train_loss": -29.361175537109375, "global_step": 42238, "epoch": 349} {"train_loss": -32.013023376464844, "global_step": 42239, "epoch": 349} {"train_loss": -30.506372451782227, "global_step": 42240, "epoch": 349} {"train_loss": -31.805646896362305, "global_step": 42241, "epoch": 349} {"train_loss": -31.770666122436523, "global_step": 42242, "epoch": 349} {"train_loss": -31.599756240844727, "global_step": 42243, "epoch": 349} {"train_loss": -31.740421295166016, "global_step": 42244, "epoch": 349} {"train_loss": -32.021907806396484, "global_step": 42245, "epoch": 349} {"train_loss": -32.88915252685547, "global_step": 42246, "epoch": 349} {"train_loss": -29.099609375, "global_step": 42247, "epoch": 349} {"train_loss": -31.110898971557617, "global_step": 42248, "epoch": 349} {"train_loss": -30.639795303344727, "global_step": 42249, "epoch": 349} {"train_loss": -31.172260284423828, "global_step": 42250, "epoch": 349} {"train_loss": -30.602100372314453, "global_step": 42251, "epoch": 349} {"train_loss": -31.97614860534668, "global_step": 42252, "epoch": 349} {"train_loss": -32.346923828125, "global_step": 42253, "epoch": 349} {"train_loss": -32.16115188598633, "global_step": 42254, "epoch": 349} {"train_loss": -32.08639144897461, "global_step": 42255, "epoch": 349} {"train_loss": -31.906225204467773, "global_step": 42256, "epoch": 349} {"train_loss": -32.142822265625, "global_step": 42257, "epoch": 349} {"train_loss": -32.205318450927734, "global_step": 42258, "epoch": 349} {"train_loss": -32.485511779785156, "global_step": 42259, "epoch": 349} {"train_loss": -32.24958038330078, "global_step": 42260, "epoch": 349} {"train_loss": -32.50993728637695, "global_step": 42261, "epoch": 349} {"train_loss": -32.596336364746094, "global_step": 42262, "epoch": 349} {"train_loss": -32.421260833740234, "global_step": 42263, "epoch": 349} {"train_loss": -32.54273223876953, "global_step": 42264, "epoch": 349} {"train_loss": -32.8376350402832, "global_step": 42265, "epoch": 349} {"train_loss": -33.06980514526367, "global_step": 42266, "epoch": 349} {"train_loss": -32.656612396240234, "global_step": 42267, "epoch": 349} {"train_loss": -32.50064468383789, "global_step": 42268, "epoch": 349} {"train_loss": -32.803070068359375, "global_step": 42269, "epoch": 349} {"train_loss": -32.69700622558594, "global_step": 42270, "epoch": 349} {"train_loss": -32.77036666870117, "global_step": 42271, "epoch": 349} {"train_loss": -32.996009826660156, "global_step": 42272, "epoch": 349} {"train_loss": -33.10417175292969, "global_step": 42273, "epoch": 349} {"train_loss": -32.99909210205078, "global_step": 42274, "epoch": 349} {"train_loss": -33.38624954223633, "global_step": 42275, "epoch": 349} {"train_loss": -33.16401290893555, "global_step": 42276, "epoch": 349} {"train_loss": -33.32527160644531, "global_step": 42277, "epoch": 349} {"train_loss": -32.835445404052734, "global_step": 42278, "epoch": 349} {"train_loss": -33.26628875732422, "global_step": 42279, "epoch": 349} {"train_loss": -33.12653732299805, "global_step": 42280, "epoch": 349} {"train_loss": -33.002742767333984, "global_step": 42281, "epoch": 349} {"train_loss": -33.282386779785156, "global_step": 42282, "epoch": 349} {"train_loss": -33.42205810546875, "global_step": 42283, "epoch": 349} {"train_loss": -33.49120330810547, "global_step": 42284, "epoch": 349} {"train_loss": -33.52815628051758, "global_step": 42285, "epoch": 349} {"train_loss": -33.321563720703125, "global_step": 42286, "epoch": 349} {"train_loss": -33.5129508972168, "global_step": 42287, "epoch": 349} {"train_loss": -33.8073616027832, "global_step": 42288, "epoch": 349} {"train_loss": -33.76905059814453, "global_step": 42289, "epoch": 349} {"train_loss": -33.82581329345703, "global_step": 42290, "epoch": 349} {"train_loss": -33.70417404174805, "global_step": 42291, "epoch": 349} {"train_loss": -33.503021240234375, "global_step": 42292, "epoch": 349} {"train_loss": -33.86438751220703, "global_step": 42293, "epoch": 349} {"train_loss": -33.82596206665039, "global_step": 42294, "epoch": 349} {"train_loss": -33.09929656982422, "global_step": 42295, "epoch": 349} {"train_loss": -33.94136428833008, "global_step": 42296, "epoch": 349} {"train_loss": -33.94712829589844, "global_step": 42297, "epoch": 349} {"train_loss": -32.896705627441406, "global_step": 42298, "epoch": 349} {"train_loss": -33.879249572753906, "global_step": 42299, "epoch": 349} {"train_loss": -32.95490264892578, "global_step": 42300, "epoch": 349} {"train_loss": -30.7697811126709, "global_step": 42301, "epoch": 349} {"train_loss": -32.80251693725586, "global_step": 42302, "epoch": 349} {"train_loss": -31.527908325195312, "global_step": 42303, "epoch": 349} {"train_loss": -31.10200309753418, "global_step": 42304, "epoch": 349} {"train_loss": -32.10185623168945, "global_step": 42305, "epoch": 349} {"train_loss": -31.843626022338867, "global_step": 42306, "epoch": 349} {"train_loss": -33.54418182373047, "global_step": 42307, "epoch": 349} {"train_loss": -33.21651077270508, "global_step": 42308, "epoch": 349} {"train_loss": -32.472076416015625, "global_step": 42309, "epoch": 349} {"train_loss": -32.770965576171875, "global_step": 42310, "epoch": 349} {"train_loss": -33.312477111816406, "global_step": 42311, "epoch": 349} {"train_loss": -33.610687255859375, "global_step": 42312, "epoch": 349} {"train_loss": -32.25334548950195, "global_step": 42313, "epoch": 349} {"train_loss": -33.46060562133789, "global_step": 42314, "epoch": 349} {"train_loss": -33.659114837646484, "global_step": 42315, "epoch": 349} {"train_loss": -33.30544662475586, "global_step": 42316, "epoch": 349} {"train_loss": -33.32758712768555, "global_step": 42317, "epoch": 349} {"train_loss": -33.883243560791016, "global_step": 42318, "epoch": 349} {"train_loss": -33.531776428222656, "global_step": 42319, "epoch": 349} {"train_loss": -34.039756774902344, "global_step": 42320, "epoch": 349} {"train_loss": -33.897850036621094, "global_step": 42321, "epoch": 349} {"train_loss": -34.100494384765625, "global_step": 42322, "epoch": 349} {"train_loss": -34.325557708740234, "global_step": 42323, "epoch": 349} {"train_loss": -34.03738021850586, "global_step": 42324, "epoch": 349} {"train_loss": -34.17001724243164, "global_step": 42325, "epoch": 349} {"train_loss": -34.091190338134766, "global_step": 42326, "epoch": 349} {"train_loss": -33.7237548828125, "global_step": 42327, "epoch": 349} {"train_loss": -33.91801452636719, "global_step": 42328, "epoch": 349} {"train_loss": -34.449005126953125, "global_step": 42329, "epoch": 349} {"train_loss": -33.931236267089844, "global_step": 42330, "epoch": 349} {"train_loss": -33.55160140991211, "global_step": 42331, "epoch": 349} {"train_loss": -33.27153396606445, "global_step": 42332, "epoch": 349} {"train_loss": -33.77728271484375, "global_step": 42333, "epoch": 349} {"train_loss": -33.77765655517578, "global_step": 42334, "epoch": 349} {"train_loss": -34.53806686401367, "global_step": 42335, "epoch": 349} {"train_loss": -34.00777053833008, "global_step": 42336, "epoch": 349} {"train_loss": -33.202518463134766, "global_step": 42337, "epoch": 349} {"train_loss": -32.78541946411133, "global_step": 42338, "epoch": 349} {"train_loss": -33.512969970703125, "global_step": 42339, "epoch": 349} {"train_loss": -34.388118743896484, "global_step": 42340, "epoch": 349} {"train_loss": -32.868446350097656, "global_step": 42341, "epoch": 349} {"train_loss": -33.45144271850586, "global_step": 42342, "epoch": 349} {"train_loss": -34.32160568237305, "global_step": 42343, "epoch": 349} {"train_loss": -33.121482849121094, "global_step": 42344, "epoch": 349} {"train_loss": -33.36488723754883, "global_step": 42345, "epoch": 349} {"train_loss": -33.81370162963867, "global_step": 42346, "epoch": 349} {"train_loss": -33.43509292602539, "global_step": 42347, "epoch": 349} {"train_loss": -34.01412582397461, "global_step": 42348, "epoch": 349} {"train_loss": -32.88253213551419, "global_step": 42349, "epoch": 349, "val_loss": 2503582.0} {"train_loss": -34.04110336303711, "global_step": 42350, "epoch": 350} {"train_loss": -33.91969680786133, "global_step": 42351, "epoch": 350} {"train_loss": -34.031864166259766, "global_step": 42352, "epoch": 350} {"train_loss": -33.705902099609375, "global_step": 42353, "epoch": 350} {"train_loss": -34.33494186401367, "global_step": 42354, "epoch": 350} {"train_loss": -34.36032485961914, "global_step": 42355, "epoch": 350} {"train_loss": -34.747310638427734, "global_step": 42356, "epoch": 350} {"train_loss": -34.3256950378418, "global_step": 42357, "epoch": 350} {"train_loss": -34.48617172241211, "global_step": 42358, "epoch": 350} {"train_loss": -34.3189582824707, "global_step": 42359, "epoch": 350} {"train_loss": -34.2690544128418, "global_step": 42360, "epoch": 350} {"train_loss": -34.85016632080078, "global_step": 42361, "epoch": 350} {"train_loss": -34.542415618896484, "global_step": 42362, "epoch": 350} {"train_loss": -34.248146057128906, "global_step": 42363, "epoch": 350} {"train_loss": -34.343772888183594, "global_step": 42364, "epoch": 350} {"train_loss": -34.556495666503906, "global_step": 42365, "epoch": 350} {"train_loss": -34.82207107543945, "global_step": 42366, "epoch": 350} {"train_loss": -34.87351989746094, "global_step": 42367, "epoch": 350} {"train_loss": -34.61802291870117, "global_step": 42368, "epoch": 350} {"train_loss": -34.60896682739258, "global_step": 42369, "epoch": 350} {"train_loss": -34.863380432128906, "global_step": 42370, "epoch": 350} {"train_loss": -34.594234466552734, "global_step": 42371, "epoch": 350} {"train_loss": -34.1866569519043, "global_step": 42372, "epoch": 350} {"train_loss": -34.61601257324219, "global_step": 42373, "epoch": 350} {"train_loss": -34.441688537597656, "global_step": 42374, "epoch": 350} {"train_loss": -34.05764389038086, "global_step": 42375, "epoch": 350} {"train_loss": -33.53392028808594, "global_step": 42376, "epoch": 350} {"train_loss": -33.59578323364258, "global_step": 42377, "epoch": 350} {"train_loss": -31.47530174255371, "global_step": 42378, "epoch": 350} {"train_loss": -32.20921325683594, "global_step": 42379, "epoch": 350} {"train_loss": -31.40960121154785, "global_step": 42380, "epoch": 350} {"train_loss": -31.3762149810791, "global_step": 42381, "epoch": 350} {"train_loss": -32.821197509765625, "global_step": 42382, "epoch": 350} {"train_loss": -33.11391830444336, "global_step": 42383, "epoch": 350} {"train_loss": -34.581478118896484, "global_step": 42384, "epoch": 350} {"train_loss": -33.14714813232422, "global_step": 42385, "epoch": 350} {"train_loss": -33.767513275146484, "global_step": 42386, "epoch": 350} {"train_loss": -33.07322692871094, "global_step": 42387, "epoch": 350} {"train_loss": -33.2761344909668, "global_step": 42388, "epoch": 350} {"train_loss": -34.69233322143555, "global_step": 42389, "epoch": 350} {"train_loss": -33.71706008911133, "global_step": 42390, "epoch": 350} {"train_loss": -33.63041305541992, "global_step": 42391, "epoch": 350} {"train_loss": -33.887977600097656, "global_step": 42392, "epoch": 350} {"train_loss": -34.28071594238281, "global_step": 42393, "epoch": 350} {"train_loss": -34.24491500854492, "global_step": 42394, "epoch": 350} {"train_loss": -34.39131546020508, "global_step": 42395, "epoch": 350} {"train_loss": -34.62284469604492, "global_step": 42396, "epoch": 350} {"train_loss": -33.49911117553711, "global_step": 42397, "epoch": 350} {"train_loss": -33.859962463378906, "global_step": 42398, "epoch": 350} {"train_loss": -33.64480972290039, "global_step": 42399, "epoch": 350} {"train_loss": -33.924224853515625, "global_step": 42400, "epoch": 350} {"train_loss": -34.26948165893555, "global_step": 42401, "epoch": 350} {"train_loss": -34.03495407104492, "global_step": 42402, "epoch": 350} {"train_loss": -34.26540756225586, "global_step": 42403, "epoch": 350} {"train_loss": -34.122283935546875, "global_step": 42404, "epoch": 350} {"train_loss": -34.9338264465332, "global_step": 42405, "epoch": 350} {"train_loss": -34.11273193359375, "global_step": 42406, "epoch": 350} {"train_loss": -34.29242706298828, "global_step": 42407, "epoch": 350} {"train_loss": -34.404693603515625, "global_step": 42408, "epoch": 350} {"train_loss": -33.88595199584961, "global_step": 42409, "epoch": 350} {"train_loss": -33.82802963256836, "global_step": 42410, "epoch": 350} {"train_loss": -34.058380126953125, "global_step": 42411, "epoch": 350} {"train_loss": -34.21272277832031, "global_step": 42412, "epoch": 350} {"train_loss": -34.13187789916992, "global_step": 42413, "epoch": 350} {"train_loss": -34.57554244995117, "global_step": 42414, "epoch": 350} {"train_loss": -34.383480072021484, "global_step": 42415, "epoch": 350} {"train_loss": -34.81439971923828, "global_step": 42416, "epoch": 350} {"train_loss": -34.14670944213867, "global_step": 42417, "epoch": 350} {"train_loss": -33.59839630126953, "global_step": 42418, "epoch": 350} {"train_loss": -33.84980392456055, "global_step": 42419, "epoch": 350} {"train_loss": -34.42808151245117, "global_step": 42420, "epoch": 350} {"train_loss": -33.8634147644043, "global_step": 42421, "epoch": 350} {"train_loss": -33.63642501831055, "global_step": 42422, "epoch": 350} {"train_loss": -32.65987777709961, "global_step": 42423, "epoch": 350} {"train_loss": -32.76304244995117, "global_step": 42424, "epoch": 350} {"train_loss": -32.26266098022461, "global_step": 42425, "epoch": 350} {"train_loss": -31.46835708618164, "global_step": 42426, "epoch": 350} {"train_loss": -32.185951232910156, "global_step": 42427, "epoch": 350} {"train_loss": -33.94389724731445, "global_step": 42428, "epoch": 350} {"train_loss": -32.12996292114258, "global_step": 42429, "epoch": 350} {"train_loss": -32.54315185546875, "global_step": 42430, "epoch": 350} {"train_loss": -34.38642883300781, "global_step": 42431, "epoch": 350} {"train_loss": -33.608333587646484, "global_step": 42432, "epoch": 350} {"train_loss": -34.23673629760742, "global_step": 42433, "epoch": 350} {"train_loss": -33.67850875854492, "global_step": 42434, "epoch": 350} {"train_loss": -34.41527557373047, "global_step": 42435, "epoch": 350} {"train_loss": -34.594242095947266, "global_step": 42436, "epoch": 350} {"train_loss": -34.32530975341797, "global_step": 42437, "epoch": 350} {"train_loss": -34.20640182495117, "global_step": 42438, "epoch": 350} {"train_loss": -34.270294189453125, "global_step": 42439, "epoch": 350} {"train_loss": -34.10919952392578, "global_step": 42440, "epoch": 350} {"train_loss": -34.2303581237793, "global_step": 42441, "epoch": 350} {"train_loss": -34.86909866333008, "global_step": 42442, "epoch": 350} {"train_loss": -33.6609001159668, "global_step": 42443, "epoch": 350} {"train_loss": -34.11019515991211, "global_step": 42444, "epoch": 350} {"train_loss": -33.7855339050293, "global_step": 42445, "epoch": 350} {"train_loss": -34.3409423828125, "global_step": 42446, "epoch": 350} {"train_loss": -34.114559173583984, "global_step": 42447, "epoch": 350} {"train_loss": -34.77267074584961, "global_step": 42448, "epoch": 350} {"train_loss": -34.95920944213867, "global_step": 42449, "epoch": 350} {"train_loss": -34.61910629272461, "global_step": 42450, "epoch": 350} {"train_loss": -35.0909423828125, "global_step": 42451, "epoch": 350} {"train_loss": -34.72252655029297, "global_step": 42452, "epoch": 350} {"train_loss": -34.75757598876953, "global_step": 42453, "epoch": 350} {"train_loss": -34.17203903198242, "global_step": 42454, "epoch": 350} {"train_loss": -33.694610595703125, "global_step": 42455, "epoch": 350} {"train_loss": -34.37889862060547, "global_step": 42456, "epoch": 350} {"train_loss": -33.79252624511719, "global_step": 42457, "epoch": 350} {"train_loss": -34.671688079833984, "global_step": 42458, "epoch": 350} {"train_loss": -33.73904037475586, "global_step": 42459, "epoch": 350} {"train_loss": -34.48002243041992, "global_step": 42460, "epoch": 350} {"train_loss": -33.550655364990234, "global_step": 42461, "epoch": 350} {"train_loss": -34.581905364990234, "global_step": 42462, "epoch": 350} {"train_loss": -33.31220626831055, "global_step": 42463, "epoch": 350} {"train_loss": -34.52712631225586, "global_step": 42464, "epoch": 350} {"train_loss": -34.0595703125, "global_step": 42465, "epoch": 350} {"train_loss": -34.47600173950195, "global_step": 42466, "epoch": 350} {"train_loss": -33.26278305053711, "global_step": 42467, "epoch": 350} {"train_loss": -34.38970947265625, "global_step": 42468, "epoch": 350} {"train_loss": -32.911163330078125, "global_step": 42469, "epoch": 350} {"train_loss": -33.965791292427, "global_step": 42470, "epoch": 350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2386767.0} {"train_loss": -33.60395812988281, "global_step": 42471, "epoch": 351} {"train_loss": -33.51979446411133, "global_step": 42472, "epoch": 351} {"train_loss": -32.89760971069336, "global_step": 42473, "epoch": 351} {"train_loss": -33.529659271240234, "global_step": 42474, "epoch": 351} {"train_loss": -31.226224899291992, "global_step": 42475, "epoch": 351} {"train_loss": -30.52212905883789, "global_step": 42476, "epoch": 351} {"train_loss": -30.359277725219727, "global_step": 42477, "epoch": 351} {"train_loss": -31.87483787536621, "global_step": 42478, "epoch": 351} {"train_loss": -32.34366989135742, "global_step": 42479, "epoch": 351} {"train_loss": -33.14919662475586, "global_step": 42480, "epoch": 351} {"train_loss": -33.64964294433594, "global_step": 42481, "epoch": 351} {"train_loss": -33.731204986572266, "global_step": 42482, "epoch": 351} {"train_loss": -33.292572021484375, "global_step": 42483, "epoch": 351} {"train_loss": -33.943599700927734, "global_step": 42484, "epoch": 351} {"train_loss": -32.7085075378418, "global_step": 42485, "epoch": 351} {"train_loss": -33.298309326171875, "global_step": 42486, "epoch": 351} {"train_loss": -34.12752914428711, "global_step": 42487, "epoch": 351} {"train_loss": -34.389225006103516, "global_step": 42488, "epoch": 351} {"train_loss": -33.24861526489258, "global_step": 42489, "epoch": 351} {"train_loss": -33.76787185668945, "global_step": 42490, "epoch": 351} {"train_loss": -34.34959030151367, "global_step": 42491, "epoch": 351} {"train_loss": -33.930667877197266, "global_step": 42492, "epoch": 351} {"train_loss": -34.22346115112305, "global_step": 42493, "epoch": 351} {"train_loss": -34.1572380065918, "global_step": 42494, "epoch": 351} {"train_loss": -34.14852523803711, "global_step": 42495, "epoch": 351} {"train_loss": -34.047607421875, "global_step": 42496, "epoch": 351} {"train_loss": -34.08030319213867, "global_step": 42497, "epoch": 351} {"train_loss": -34.142669677734375, "global_step": 42498, "epoch": 351} {"train_loss": -34.185791015625, "global_step": 42499, "epoch": 351} {"train_loss": -33.444217681884766, "global_step": 42500, "epoch": 351} {"train_loss": -34.147911071777344, "global_step": 42501, "epoch": 351} {"train_loss": -34.052730560302734, "global_step": 42502, "epoch": 351} {"train_loss": -34.37411117553711, "global_step": 42503, "epoch": 351} {"train_loss": -34.230506896972656, "global_step": 42504, "epoch": 351} {"train_loss": -34.4068717956543, "global_step": 42505, "epoch": 351} {"train_loss": -33.937416076660156, "global_step": 42506, "epoch": 351} {"train_loss": -33.807674407958984, "global_step": 42507, "epoch": 351} {"train_loss": -34.14674758911133, "global_step": 42508, "epoch": 351} {"train_loss": -34.11823272705078, "global_step": 42509, "epoch": 351} {"train_loss": -34.83232116699219, "global_step": 42510, "epoch": 351} {"train_loss": -33.80504608154297, "global_step": 42511, "epoch": 351} {"train_loss": -33.75491714477539, "global_step": 42512, "epoch": 351} {"train_loss": -33.64413070678711, "global_step": 42513, "epoch": 351} {"train_loss": -33.409873962402344, "global_step": 42514, "epoch": 351} {"train_loss": -33.727561950683594, "global_step": 42515, "epoch": 351} {"train_loss": -34.72590255737305, "global_step": 42516, "epoch": 351} {"train_loss": -34.042205810546875, "global_step": 42517, "epoch": 351} {"train_loss": -35.195350646972656, "global_step": 42518, "epoch": 351} {"train_loss": -34.30292510986328, "global_step": 42519, "epoch": 351} {"train_loss": -35.055755615234375, "global_step": 42520, "epoch": 351} {"train_loss": -34.53336715698242, "global_step": 42521, "epoch": 351} {"train_loss": -34.619693756103516, "global_step": 42522, "epoch": 351} {"train_loss": -34.5448112487793, "global_step": 42523, "epoch": 351} {"train_loss": -34.34818649291992, "global_step": 42524, "epoch": 351} {"train_loss": -34.263580322265625, "global_step": 42525, "epoch": 351} {"train_loss": -33.71470260620117, "global_step": 42526, "epoch": 351} {"train_loss": -32.971900939941406, "global_step": 42527, "epoch": 351} {"train_loss": -33.17097854614258, "global_step": 42528, "epoch": 351} {"train_loss": -32.67204284667969, "global_step": 42529, "epoch": 351} {"train_loss": -33.06936264038086, "global_step": 42530, "epoch": 351} {"train_loss": -34.655303955078125, "global_step": 42531, "epoch": 351} {"train_loss": -34.37026596069336, "global_step": 42532, "epoch": 351} {"train_loss": -33.90262985229492, "global_step": 42533, "epoch": 351} {"train_loss": -33.82313919067383, "global_step": 42534, "epoch": 351} {"train_loss": -34.25614547729492, "global_step": 42535, "epoch": 351} {"train_loss": -33.85001754760742, "global_step": 42536, "epoch": 351} {"train_loss": -33.3997688293457, "global_step": 42537, "epoch": 351} {"train_loss": -33.87468338012695, "global_step": 42538, "epoch": 351} {"train_loss": -32.771881103515625, "global_step": 42539, "epoch": 351} {"train_loss": -33.437957763671875, "global_step": 42540, "epoch": 351} {"train_loss": -32.62667465209961, "global_step": 42541, "epoch": 351} {"train_loss": -31.5105037689209, "global_step": 42542, "epoch": 351} {"train_loss": -33.10087966918945, "global_step": 42543, "epoch": 351} {"train_loss": -33.42094039916992, "global_step": 42544, "epoch": 351} {"train_loss": -33.63948059082031, "global_step": 42545, "epoch": 351} {"train_loss": -34.721893310546875, "global_step": 42546, "epoch": 351} {"train_loss": -33.632118225097656, "global_step": 42547, "epoch": 351} {"train_loss": -33.42934799194336, "global_step": 42548, "epoch": 351} {"train_loss": -34.22412109375, "global_step": 42549, "epoch": 351} {"train_loss": -34.04131317138672, "global_step": 42550, "epoch": 351} {"train_loss": -33.227596282958984, "global_step": 42551, "epoch": 351} {"train_loss": -34.61420440673828, "global_step": 42552, "epoch": 351} {"train_loss": -34.8519287109375, "global_step": 42553, "epoch": 351} {"train_loss": -34.09128952026367, "global_step": 42554, "epoch": 351} {"train_loss": -34.83417892456055, "global_step": 42555, "epoch": 351} {"train_loss": -35.03981399536133, "global_step": 42556, "epoch": 351} {"train_loss": -34.71026611328125, "global_step": 42557, "epoch": 351} {"train_loss": -34.617794036865234, "global_step": 42558, "epoch": 351} {"train_loss": -34.43851852416992, "global_step": 42559, "epoch": 351} {"train_loss": -34.72595977783203, "global_step": 42560, "epoch": 351} {"train_loss": -34.76217269897461, "global_step": 42561, "epoch": 351} {"train_loss": -34.653743743896484, "global_step": 42562, "epoch": 351} {"train_loss": -33.96334457397461, "global_step": 42563, "epoch": 351} {"train_loss": -34.49761962890625, "global_step": 42564, "epoch": 351} {"train_loss": -34.54682540893555, "global_step": 42565, "epoch": 351} {"train_loss": -34.429542541503906, "global_step": 42566, "epoch": 351} {"train_loss": -34.86800765991211, "global_step": 42567, "epoch": 351} {"train_loss": -34.52171325683594, "global_step": 42568, "epoch": 351} {"train_loss": -33.83250045776367, "global_step": 42569, "epoch": 351} {"train_loss": -34.78938293457031, "global_step": 42570, "epoch": 351} {"train_loss": -34.62262725830078, "global_step": 42571, "epoch": 351} {"train_loss": -33.67287063598633, "global_step": 42572, "epoch": 351} {"train_loss": -34.78177261352539, "global_step": 42573, "epoch": 351} {"train_loss": -34.53520965576172, "global_step": 42574, "epoch": 351} {"train_loss": -33.58446502685547, "global_step": 42575, "epoch": 351} {"train_loss": -34.55765914916992, "global_step": 42576, "epoch": 351} {"train_loss": -34.10731887817383, "global_step": 42577, "epoch": 351} {"train_loss": -34.455074310302734, "global_step": 42578, "epoch": 351} {"train_loss": -34.502288818359375, "global_step": 42579, "epoch": 351} {"train_loss": -34.67588424682617, "global_step": 42580, "epoch": 351} {"train_loss": -34.23948669433594, "global_step": 42581, "epoch": 351} {"train_loss": -35.37063217163086, "global_step": 42582, "epoch": 351} {"train_loss": -34.840457916259766, "global_step": 42583, "epoch": 351} {"train_loss": -33.992218017578125, "global_step": 42584, "epoch": 351} {"train_loss": -32.85920715332031, "global_step": 42585, "epoch": 351} {"train_loss": -34.85514450073242, "global_step": 42586, "epoch": 351} {"train_loss": -33.191287994384766, "global_step": 42587, "epoch": 351} {"train_loss": -32.79664993286133, "global_step": 42588, "epoch": 351} {"train_loss": -32.410003662109375, "global_step": 42589, "epoch": 351} {"train_loss": -31.418731689453125, "global_step": 42590, "epoch": 351} {"train_loss": -33.841416414118996, "global_step": 42591, "epoch": 351, "val_loss": 2563804.75} {"train_loss": -32.84778594970703, "global_step": 42592, "epoch": 352} {"train_loss": -33.54302978515625, "global_step": 42593, "epoch": 352} {"train_loss": -33.42672348022461, "global_step": 42594, "epoch": 352} {"train_loss": -31.71015739440918, "global_step": 42595, "epoch": 352} {"train_loss": -34.16010665893555, "global_step": 42596, "epoch": 352} {"train_loss": -33.90885543823242, "global_step": 42597, "epoch": 352} {"train_loss": -32.586891174316406, "global_step": 42598, "epoch": 352} {"train_loss": -34.13518524169922, "global_step": 42599, "epoch": 352} {"train_loss": -33.757572174072266, "global_step": 42600, "epoch": 352} {"train_loss": -32.88563537597656, "global_step": 42601, "epoch": 352} {"train_loss": -32.63898849487305, "global_step": 42602, "epoch": 352} {"train_loss": -30.505706787109375, "global_step": 42603, "epoch": 352} {"train_loss": -32.65027618408203, "global_step": 42604, "epoch": 352} {"train_loss": -34.099727630615234, "global_step": 42605, "epoch": 352} {"train_loss": -33.684627532958984, "global_step": 42606, "epoch": 352} {"train_loss": -34.21258544921875, "global_step": 42607, "epoch": 352} {"train_loss": -33.466331481933594, "global_step": 42608, "epoch": 352} {"train_loss": -34.27212142944336, "global_step": 42609, "epoch": 352} {"train_loss": -33.66739273071289, "global_step": 42610, "epoch": 352} {"train_loss": -33.37263107299805, "global_step": 42611, "epoch": 352} {"train_loss": -33.466217041015625, "global_step": 42612, "epoch": 352} {"train_loss": -34.492225646972656, "global_step": 42613, "epoch": 352} {"train_loss": -33.52408981323242, "global_step": 42614, "epoch": 352} {"train_loss": -34.47150802612305, "global_step": 42615, "epoch": 352} {"train_loss": -34.184871673583984, "global_step": 42616, "epoch": 352} {"train_loss": -34.634029388427734, "global_step": 42617, "epoch": 352} {"train_loss": -34.0750846862793, "global_step": 42618, "epoch": 352} {"train_loss": -34.62815475463867, "global_step": 42619, "epoch": 352} {"train_loss": -34.76108932495117, "global_step": 42620, "epoch": 352} {"train_loss": -34.31376266479492, "global_step": 42621, "epoch": 352} {"train_loss": -34.52252960205078, "global_step": 42622, "epoch": 352} {"train_loss": -35.176239013671875, "global_step": 42623, "epoch": 352} {"train_loss": -34.52840805053711, "global_step": 42624, "epoch": 352} {"train_loss": -34.40217971801758, "global_step": 42625, "epoch": 352} {"train_loss": -34.960079193115234, "global_step": 42626, "epoch": 352} {"train_loss": -34.62921142578125, "global_step": 42627, "epoch": 352} {"train_loss": -34.32017135620117, "global_step": 42628, "epoch": 352} {"train_loss": -33.713897705078125, "global_step": 42629, "epoch": 352} {"train_loss": -33.66868209838867, "global_step": 42630, "epoch": 352} {"train_loss": -33.695465087890625, "global_step": 42631, "epoch": 352} {"train_loss": -34.58450698852539, "global_step": 42632, "epoch": 352} {"train_loss": -34.765377044677734, "global_step": 42633, "epoch": 352} {"train_loss": -34.795894622802734, "global_step": 42634, "epoch": 352} {"train_loss": -33.42656326293945, "global_step": 42635, "epoch": 352} {"train_loss": -34.36907958984375, "global_step": 42636, "epoch": 352} {"train_loss": -34.38277053833008, "global_step": 42637, "epoch": 352} {"train_loss": -35.392024993896484, "global_step": 42638, "epoch": 352} {"train_loss": -34.8565788269043, "global_step": 42639, "epoch": 352} {"train_loss": -34.67119216918945, "global_step": 42640, "epoch": 352} {"train_loss": -35.17266082763672, "global_step": 42641, "epoch": 352} {"train_loss": -34.77593231201172, "global_step": 42642, "epoch": 352} {"train_loss": -35.38508987426758, "global_step": 42643, "epoch": 352} {"train_loss": -34.500953674316406, "global_step": 42644, "epoch": 352} {"train_loss": -34.9326286315918, "global_step": 42645, "epoch": 352} {"train_loss": -35.25143051147461, "global_step": 42646, "epoch": 352} {"train_loss": -35.19558334350586, "global_step": 42647, "epoch": 352} {"train_loss": -34.36663818359375, "global_step": 42648, "epoch": 352} {"train_loss": -34.67518997192383, "global_step": 42649, "epoch": 352} {"train_loss": -34.89754867553711, "global_step": 42650, "epoch": 352} {"train_loss": -34.650203704833984, "global_step": 42651, "epoch": 352} {"train_loss": -35.2747917175293, "global_step": 42652, "epoch": 352} {"train_loss": -35.50086212158203, "global_step": 42653, "epoch": 352} {"train_loss": -34.31342315673828, "global_step": 42654, "epoch": 352} {"train_loss": -34.503849029541016, "global_step": 42655, "epoch": 352} {"train_loss": -34.35651779174805, "global_step": 42656, "epoch": 352} {"train_loss": -34.47837829589844, "global_step": 42657, "epoch": 352} {"train_loss": -34.565128326416016, "global_step": 42658, "epoch": 352} {"train_loss": -35.047569274902344, "global_step": 42659, "epoch": 352} {"train_loss": -35.020320892333984, "global_step": 42660, "epoch": 352} {"train_loss": -34.77854537963867, "global_step": 42661, "epoch": 352} {"train_loss": -34.31069564819336, "global_step": 42662, "epoch": 352} {"train_loss": -33.79513168334961, "global_step": 42663, "epoch": 352} {"train_loss": -34.0561408996582, "global_step": 42664, "epoch": 352} {"train_loss": -33.88004684448242, "global_step": 42665, "epoch": 352} {"train_loss": -34.96049880981445, "global_step": 42666, "epoch": 352} {"train_loss": -35.09987258911133, "global_step": 42667, "epoch": 352} {"train_loss": -34.18120193481445, "global_step": 42668, "epoch": 352} {"train_loss": -34.157379150390625, "global_step": 42669, "epoch": 352} {"train_loss": -33.954402923583984, "global_step": 42670, "epoch": 352} {"train_loss": -32.98018264770508, "global_step": 42671, "epoch": 352} {"train_loss": -33.01367950439453, "global_step": 42672, "epoch": 352} {"train_loss": -34.332942962646484, "global_step": 42673, "epoch": 352} {"train_loss": -33.27090072631836, "global_step": 42674, "epoch": 352} {"train_loss": -32.3044319152832, "global_step": 42675, "epoch": 352} {"train_loss": -34.252864837646484, "global_step": 42676, "epoch": 352} {"train_loss": -33.82247543334961, "global_step": 42677, "epoch": 352} {"train_loss": -31.228885650634766, "global_step": 42678, "epoch": 352} {"train_loss": -33.979854583740234, "global_step": 42679, "epoch": 352} {"train_loss": -29.817602157592773, "global_step": 42680, "epoch": 352} {"train_loss": -32.42446517944336, "global_step": 42681, "epoch": 352} {"train_loss": -28.297821044921875, "global_step": 42682, "epoch": 352} {"train_loss": -26.812124252319336, "global_step": 42683, "epoch": 352} {"train_loss": -26.091693878173828, "global_step": 42684, "epoch": 352} {"train_loss": -26.268875122070312, "global_step": 42685, "epoch": 352} {"train_loss": -28.506305694580078, "global_step": 42686, "epoch": 352} {"train_loss": -30.077871322631836, "global_step": 42687, "epoch": 352} {"train_loss": -27.719465255737305, "global_step": 42688, "epoch": 352} {"train_loss": -28.293222427368164, "global_step": 42689, "epoch": 352} {"train_loss": -29.7370662689209, "global_step": 42690, "epoch": 352} {"train_loss": -29.06149673461914, "global_step": 42691, "epoch": 352} {"train_loss": -27.968469619750977, "global_step": 42692, "epoch": 352} {"train_loss": -30.15729331970215, "global_step": 42693, "epoch": 352} {"train_loss": -30.019224166870117, "global_step": 42694, "epoch": 352} {"train_loss": -30.35104751586914, "global_step": 42695, "epoch": 352} {"train_loss": -31.141956329345703, "global_step": 42696, "epoch": 352} {"train_loss": -30.228851318359375, "global_step": 42697, "epoch": 352} {"train_loss": -30.88457679748535, "global_step": 42698, "epoch": 352} {"train_loss": -31.13905143737793, "global_step": 42699, "epoch": 352} {"train_loss": -31.054784774780273, "global_step": 42700, "epoch": 352} {"train_loss": -32.08869552612305, "global_step": 42701, "epoch": 352} {"train_loss": -31.90168571472168, "global_step": 42702, "epoch": 352} {"train_loss": -31.851078033447266, "global_step": 42703, "epoch": 352} {"train_loss": -32.42424392700195, "global_step": 42704, "epoch": 352} {"train_loss": -32.71441650390625, "global_step": 42705, "epoch": 352} {"train_loss": -32.222835540771484, "global_step": 42706, "epoch": 352} {"train_loss": -32.97212219238281, "global_step": 42707, "epoch": 352} {"train_loss": -32.308284759521484, "global_step": 42708, "epoch": 352} {"train_loss": -33.160316467285156, "global_step": 42709, "epoch": 352} {"train_loss": -32.998714447021484, "global_step": 42710, "epoch": 352} {"train_loss": -33.52861785888672, "global_step": 42711, "epoch": 352} {"train_loss": -33.13406655808126, "global_step": 42712, "epoch": 352, "val_loss": 2488856.25} {"train_loss": -33.85453796386719, "global_step": 42713, "epoch": 353} {"train_loss": -33.35886764526367, "global_step": 42714, "epoch": 353} {"train_loss": -34.1230583190918, "global_step": 42715, "epoch": 353} {"train_loss": -33.98751449584961, "global_step": 42716, "epoch": 353} {"train_loss": -34.00982666015625, "global_step": 42717, "epoch": 353} {"train_loss": -34.4096794128418, "global_step": 42718, "epoch": 353} {"train_loss": -34.36572265625, "global_step": 42719, "epoch": 353} {"train_loss": -34.67792892456055, "global_step": 42720, "epoch": 353} {"train_loss": -34.3621711730957, "global_step": 42721, "epoch": 353} {"train_loss": -34.55322265625, "global_step": 42722, "epoch": 353} {"train_loss": -34.591854095458984, "global_step": 42723, "epoch": 353} {"train_loss": -34.680904388427734, "global_step": 42724, "epoch": 353} {"train_loss": -34.946075439453125, "global_step": 42725, "epoch": 353} {"train_loss": -33.93418502807617, "global_step": 42726, "epoch": 353} {"train_loss": -33.30784606933594, "global_step": 42727, "epoch": 353} {"train_loss": -31.892820358276367, "global_step": 42728, "epoch": 353} {"train_loss": -32.14387893676758, "global_step": 42729, "epoch": 353} {"train_loss": -32.98970413208008, "global_step": 42730, "epoch": 353} {"train_loss": -33.418575286865234, "global_step": 42731, "epoch": 353} {"train_loss": -32.98673629760742, "global_step": 42732, "epoch": 353} {"train_loss": -33.56637191772461, "global_step": 42733, "epoch": 353} {"train_loss": -33.356807708740234, "global_step": 42734, "epoch": 353} {"train_loss": -31.04368019104004, "global_step": 42735, "epoch": 353} {"train_loss": -27.3328857421875, "global_step": 42736, "epoch": 353} {"train_loss": -32.00338363647461, "global_step": 42737, "epoch": 353} {"train_loss": -32.213924407958984, "global_step": 42738, "epoch": 353} {"train_loss": -29.683700561523438, "global_step": 42739, "epoch": 353} {"train_loss": -32.65627670288086, "global_step": 42740, "epoch": 353} {"train_loss": -32.79636001586914, "global_step": 42741, "epoch": 353} {"train_loss": -29.97442626953125, "global_step": 42742, "epoch": 353} {"train_loss": -33.389156341552734, "global_step": 42743, "epoch": 353} {"train_loss": -31.616479873657227, "global_step": 42744, "epoch": 353} {"train_loss": -31.607065200805664, "global_step": 42745, "epoch": 353} {"train_loss": -33.149169921875, "global_step": 42746, "epoch": 353} {"train_loss": -31.695173263549805, "global_step": 42747, "epoch": 353} {"train_loss": -32.82275390625, "global_step": 42748, "epoch": 353} {"train_loss": -33.167633056640625, "global_step": 42749, "epoch": 353} {"train_loss": -33.221588134765625, "global_step": 42750, "epoch": 353} {"train_loss": -33.202735900878906, "global_step": 42751, "epoch": 353} {"train_loss": -33.33762741088867, "global_step": 42752, "epoch": 353} {"train_loss": -33.03860855102539, "global_step": 42753, "epoch": 353} {"train_loss": -33.41096115112305, "global_step": 42754, "epoch": 353} {"train_loss": -33.34686279296875, "global_step": 42755, "epoch": 353} {"train_loss": -33.91848373413086, "global_step": 42756, "epoch": 353} {"train_loss": -33.458229064941406, "global_step": 42757, "epoch": 353} {"train_loss": -33.66508865356445, "global_step": 42758, "epoch": 353} {"train_loss": -33.85257339477539, "global_step": 42759, "epoch": 353} {"train_loss": -33.990875244140625, "global_step": 42760, "epoch": 353} {"train_loss": -33.97719192504883, "global_step": 42761, "epoch": 353} {"train_loss": -34.10449981689453, "global_step": 42762, "epoch": 353} {"train_loss": -33.994869232177734, "global_step": 42763, "epoch": 353} {"train_loss": -33.95072937011719, "global_step": 42764, "epoch": 353} {"train_loss": -34.2717170715332, "global_step": 42765, "epoch": 353} {"train_loss": -34.23802185058594, "global_step": 42766, "epoch": 353} {"train_loss": -34.13508224487305, "global_step": 42767, "epoch": 353} {"train_loss": -34.4577751159668, "global_step": 42768, "epoch": 353} {"train_loss": -34.443511962890625, "global_step": 42769, "epoch": 353} {"train_loss": -34.05568313598633, "global_step": 42770, "epoch": 353} {"train_loss": -34.560604095458984, "global_step": 42771, "epoch": 353} {"train_loss": -34.64925765991211, "global_step": 42772, "epoch": 353} {"train_loss": -34.195735931396484, "global_step": 42773, "epoch": 353} {"train_loss": -34.41853713989258, "global_step": 42774, "epoch": 353} {"train_loss": -34.68828201293945, "global_step": 42775, "epoch": 353} {"train_loss": -34.84395980834961, "global_step": 42776, "epoch": 353} {"train_loss": -34.09144973754883, "global_step": 42777, "epoch": 353} {"train_loss": -34.56696701049805, "global_step": 42778, "epoch": 353} {"train_loss": -34.56833267211914, "global_step": 42779, "epoch": 353} {"train_loss": -34.611480712890625, "global_step": 42780, "epoch": 353} {"train_loss": -34.3612060546875, "global_step": 42781, "epoch": 353} {"train_loss": -34.82674026489258, "global_step": 42782, "epoch": 353} {"train_loss": -34.68001937866211, "global_step": 42783, "epoch": 353} {"train_loss": -34.85749435424805, "global_step": 42784, "epoch": 353} {"train_loss": -34.63159942626953, "global_step": 42785, "epoch": 353} {"train_loss": -34.96807861328125, "global_step": 42786, "epoch": 353} {"train_loss": -34.50455856323242, "global_step": 42787, "epoch": 353} {"train_loss": -34.32008743286133, "global_step": 42788, "epoch": 353} {"train_loss": -35.23060989379883, "global_step": 42789, "epoch": 353} {"train_loss": -34.16107177734375, "global_step": 42790, "epoch": 353} {"train_loss": -34.629302978515625, "global_step": 42791, "epoch": 353} {"train_loss": -34.5335578918457, "global_step": 42792, "epoch": 353} {"train_loss": -34.211788177490234, "global_step": 42793, "epoch": 353} {"train_loss": -34.50883102416992, "global_step": 42794, "epoch": 353} {"train_loss": -34.56037139892578, "global_step": 42795, "epoch": 353} {"train_loss": -34.776180267333984, "global_step": 42796, "epoch": 353} {"train_loss": -35.047584533691406, "global_step": 42797, "epoch": 353} {"train_loss": -34.91963577270508, "global_step": 42798, "epoch": 353} {"train_loss": -34.385108947753906, "global_step": 42799, "epoch": 353} {"train_loss": -34.52582931518555, "global_step": 42800, "epoch": 353} {"train_loss": -34.43867111206055, "global_step": 42801, "epoch": 353} {"train_loss": -34.04914474487305, "global_step": 42802, "epoch": 353} {"train_loss": -34.03362274169922, "global_step": 42803, "epoch": 353} {"train_loss": -31.886510848999023, "global_step": 42804, "epoch": 353} {"train_loss": -31.47650718688965, "global_step": 42805, "epoch": 353} {"train_loss": -32.3065299987793, "global_step": 42806, "epoch": 353} {"train_loss": -32.88856887817383, "global_step": 42807, "epoch": 353} {"train_loss": -33.806819915771484, "global_step": 42808, "epoch": 353} {"train_loss": -34.73865509033203, "global_step": 42809, "epoch": 353} {"train_loss": -33.30133819580078, "global_step": 42810, "epoch": 353} {"train_loss": -29.122461318969727, "global_step": 42811, "epoch": 353} {"train_loss": -23.9736385345459, "global_step": 42812, "epoch": 353} {"train_loss": -28.776845932006836, "global_step": 42813, "epoch": 353} {"train_loss": -31.057397842407227, "global_step": 42814, "epoch": 353} {"train_loss": -29.52874183654785, "global_step": 42815, "epoch": 353} {"train_loss": -31.614477157592773, "global_step": 42816, "epoch": 353} {"train_loss": -33.27633285522461, "global_step": 42817, "epoch": 353} {"train_loss": -31.9028377532959, "global_step": 42818, "epoch": 353} {"train_loss": -33.966041564941406, "global_step": 42819, "epoch": 353} {"train_loss": -32.866004943847656, "global_step": 42820, "epoch": 353} {"train_loss": -33.480106353759766, "global_step": 42821, "epoch": 353} {"train_loss": -32.54955291748047, "global_step": 42822, "epoch": 353} {"train_loss": -33.59418487548828, "global_step": 42823, "epoch": 353} {"train_loss": -33.582435607910156, "global_step": 42824, "epoch": 353} {"train_loss": -34.30325698852539, "global_step": 42825, "epoch": 353} {"train_loss": -33.74579620361328, "global_step": 42826, "epoch": 353} {"train_loss": -34.104949951171875, "global_step": 42827, "epoch": 353} {"train_loss": -34.460166931152344, "global_step": 42828, "epoch": 353} {"train_loss": -34.03567123413086, "global_step": 42829, "epoch": 353} {"train_loss": -34.321529388427734, "global_step": 42830, "epoch": 353} {"train_loss": -34.319705963134766, "global_step": 42831, "epoch": 353} {"train_loss": -34.67639923095703, "global_step": 42832, "epoch": 353} {"train_loss": -33.44519102868955, "global_step": 42833, "epoch": 353, "val_loss": 2432655.0} {"train_loss": -34.28095245361328, "global_step": 42834, "epoch": 354} {"train_loss": -34.57535934448242, "global_step": 42835, "epoch": 354} {"train_loss": -34.05297088623047, "global_step": 42836, "epoch": 354} {"train_loss": -34.8106575012207, "global_step": 42837, "epoch": 354} {"train_loss": -34.41847610473633, "global_step": 42838, "epoch": 354} {"train_loss": -34.581634521484375, "global_step": 42839, "epoch": 354} {"train_loss": -34.15812683105469, "global_step": 42840, "epoch": 354} {"train_loss": -34.14724349975586, "global_step": 42841, "epoch": 354} {"train_loss": -34.33820724487305, "global_step": 42842, "epoch": 354} {"train_loss": -34.440338134765625, "global_step": 42843, "epoch": 354} {"train_loss": -34.05479049682617, "global_step": 42844, "epoch": 354} {"train_loss": -33.893856048583984, "global_step": 42845, "epoch": 354} {"train_loss": -33.90940856933594, "global_step": 42846, "epoch": 354} {"train_loss": -35.022579193115234, "global_step": 42847, "epoch": 354} {"train_loss": -34.63956832885742, "global_step": 42848, "epoch": 354} {"train_loss": -34.257869720458984, "global_step": 42849, "epoch": 354} {"train_loss": -34.88594055175781, "global_step": 42850, "epoch": 354} {"train_loss": -33.82587432861328, "global_step": 42851, "epoch": 354} {"train_loss": -34.76780319213867, "global_step": 42852, "epoch": 354} {"train_loss": -34.50297164916992, "global_step": 42853, "epoch": 354} {"train_loss": -34.474464416503906, "global_step": 42854, "epoch": 354} {"train_loss": -33.81679916381836, "global_step": 42855, "epoch": 354} {"train_loss": -33.65443801879883, "global_step": 42856, "epoch": 354} {"train_loss": -34.72311019897461, "global_step": 42857, "epoch": 354} {"train_loss": -34.90278244018555, "global_step": 42858, "epoch": 354} {"train_loss": -33.93671417236328, "global_step": 42859, "epoch": 354} {"train_loss": -34.34896469116211, "global_step": 42860, "epoch": 354} {"train_loss": -34.46151351928711, "global_step": 42861, "epoch": 354} {"train_loss": -34.3056640625, "global_step": 42862, "epoch": 354} {"train_loss": -34.60947036743164, "global_step": 42863, "epoch": 354} {"train_loss": -34.53743362426758, "global_step": 42864, "epoch": 354} {"train_loss": -34.20183181762695, "global_step": 42865, "epoch": 354} {"train_loss": -33.87827682495117, "global_step": 42866, "epoch": 354} {"train_loss": -33.142127990722656, "global_step": 42867, "epoch": 354} {"train_loss": -34.800846099853516, "global_step": 42868, "epoch": 354} {"train_loss": -33.185951232910156, "global_step": 42869, "epoch": 354} {"train_loss": -33.41804504394531, "global_step": 42870, "epoch": 354} {"train_loss": -33.850067138671875, "global_step": 42871, "epoch": 354} {"train_loss": -34.109432220458984, "global_step": 42872, "epoch": 354} {"train_loss": -33.88656234741211, "global_step": 42873, "epoch": 354} {"train_loss": -32.07976150512695, "global_step": 42874, "epoch": 354} {"train_loss": -32.95045852661133, "global_step": 42875, "epoch": 354} {"train_loss": -33.14168930053711, "global_step": 42876, "epoch": 354} {"train_loss": -30.62835693359375, "global_step": 42877, "epoch": 354} {"train_loss": -33.76318359375, "global_step": 42878, "epoch": 354} {"train_loss": -33.55213165283203, "global_step": 42879, "epoch": 354} {"train_loss": -33.44062423706055, "global_step": 42880, "epoch": 354} {"train_loss": -30.833784103393555, "global_step": 42881, "epoch": 354} {"train_loss": -32.9755744934082, "global_step": 42882, "epoch": 354} {"train_loss": -31.22477149963379, "global_step": 42883, "epoch": 354} {"train_loss": -29.11358070373535, "global_step": 42884, "epoch": 354} {"train_loss": -25.93345069885254, "global_step": 42885, "epoch": 354} {"train_loss": -28.934118270874023, "global_step": 42886, "epoch": 354} {"train_loss": -30.94378089904785, "global_step": 42887, "epoch": 354} {"train_loss": -30.474029541015625, "global_step": 42888, "epoch": 354} {"train_loss": -31.21101951599121, "global_step": 42889, "epoch": 354} {"train_loss": -31.078622817993164, "global_step": 42890, "epoch": 354} {"train_loss": -32.00095748901367, "global_step": 42891, "epoch": 354} {"train_loss": -32.89986801147461, "global_step": 42892, "epoch": 354} {"train_loss": -31.020111083984375, "global_step": 42893, "epoch": 354} {"train_loss": -32.3490104675293, "global_step": 42894, "epoch": 354} {"train_loss": -32.484397888183594, "global_step": 42895, "epoch": 354} {"train_loss": -31.372180938720703, "global_step": 42896, "epoch": 354} {"train_loss": -30.22934341430664, "global_step": 42897, "epoch": 354} {"train_loss": -31.74176597595215, "global_step": 42898, "epoch": 354} {"train_loss": -31.871057510375977, "global_step": 42899, "epoch": 354} {"train_loss": -32.24827194213867, "global_step": 42900, "epoch": 354} {"train_loss": -32.27347946166992, "global_step": 42901, "epoch": 354} {"train_loss": -32.74814224243164, "global_step": 42902, "epoch": 354} {"train_loss": -31.87440299987793, "global_step": 42903, "epoch": 354} {"train_loss": -33.043758392333984, "global_step": 42904, "epoch": 354} {"train_loss": -32.268592834472656, "global_step": 42905, "epoch": 354} {"train_loss": -33.180091857910156, "global_step": 42906, "epoch": 354} {"train_loss": -32.3702392578125, "global_step": 42907, "epoch": 354} {"train_loss": -32.89852523803711, "global_step": 42908, "epoch": 354} {"train_loss": -33.19303894042969, "global_step": 42909, "epoch": 354} {"train_loss": -32.919742584228516, "global_step": 42910, "epoch": 354} {"train_loss": -32.672603607177734, "global_step": 42911, "epoch": 354} {"train_loss": -32.43389129638672, "global_step": 42912, "epoch": 354} {"train_loss": -33.43974685668945, "global_step": 42913, "epoch": 354} {"train_loss": -32.86980056762695, "global_step": 42914, "epoch": 354} {"train_loss": -33.42323303222656, "global_step": 42915, "epoch": 354} {"train_loss": -33.49300765991211, "global_step": 42916, "epoch": 354} {"train_loss": -33.5724983215332, "global_step": 42917, "epoch": 354} {"train_loss": -33.69388961791992, "global_step": 42918, "epoch": 354} {"train_loss": -33.83464813232422, "global_step": 42919, "epoch": 354} {"train_loss": -33.18708801269531, "global_step": 42920, "epoch": 354} {"train_loss": -33.8394775390625, "global_step": 42921, "epoch": 354} {"train_loss": -33.625701904296875, "global_step": 42922, "epoch": 354} {"train_loss": -33.828731536865234, "global_step": 42923, "epoch": 354} {"train_loss": -34.169342041015625, "global_step": 42924, "epoch": 354} {"train_loss": -34.385414123535156, "global_step": 42925, "epoch": 354} {"train_loss": -34.27918243408203, "global_step": 42926, "epoch": 354} {"train_loss": -34.1184196472168, "global_step": 42927, "epoch": 354} {"train_loss": -34.58843994140625, "global_step": 42928, "epoch": 354} {"train_loss": -34.484466552734375, "global_step": 42929, "epoch": 354} {"train_loss": -34.60791015625, "global_step": 42930, "epoch": 354} {"train_loss": -34.356502532958984, "global_step": 42931, "epoch": 354} {"train_loss": -34.459205627441406, "global_step": 42932, "epoch": 354} {"train_loss": -34.50175094604492, "global_step": 42933, "epoch": 354} {"train_loss": -34.6199951171875, "global_step": 42934, "epoch": 354} {"train_loss": -34.57699966430664, "global_step": 42935, "epoch": 354} {"train_loss": -34.46968460083008, "global_step": 42936, "epoch": 354} {"train_loss": -34.801361083984375, "global_step": 42937, "epoch": 354} {"train_loss": -34.79907989501953, "global_step": 42938, "epoch": 354} {"train_loss": -35.1723747253418, "global_step": 42939, "epoch": 354} {"train_loss": -34.75048828125, "global_step": 42940, "epoch": 354} {"train_loss": -35.27177047729492, "global_step": 42941, "epoch": 354} {"train_loss": -34.614013671875, "global_step": 42942, "epoch": 354} {"train_loss": -34.78773880004883, "global_step": 42943, "epoch": 354} {"train_loss": -35.07477569580078, "global_step": 42944, "epoch": 354} {"train_loss": -34.88511276245117, "global_step": 42945, "epoch": 354} {"train_loss": -35.288185119628906, "global_step": 42946, "epoch": 354} {"train_loss": -35.131526947021484, "global_step": 42947, "epoch": 354} {"train_loss": -35.22712326049805, "global_step": 42948, "epoch": 354} {"train_loss": -35.83108139038086, "global_step": 42949, "epoch": 354} {"train_loss": -35.234378814697266, "global_step": 42950, "epoch": 354} {"train_loss": -35.204490661621094, "global_step": 42951, "epoch": 354} {"train_loss": -35.681610107421875, "global_step": 42952, "epoch": 354} {"train_loss": -35.22491455078125, "global_step": 42953, "epoch": 354} {"train_loss": -33.561184922525705, "global_step": 42954, "epoch": 354, "val_loss": 2526742.75} {"train_loss": -35.604976654052734, "global_step": 42955, "epoch": 355} {"train_loss": -35.6384162902832, "global_step": 42956, "epoch": 355} {"train_loss": -34.811031341552734, "global_step": 42957, "epoch": 355} {"train_loss": -35.54622268676758, "global_step": 42958, "epoch": 355} {"train_loss": -35.391090393066406, "global_step": 42959, "epoch": 355} {"train_loss": -35.497474670410156, "global_step": 42960, "epoch": 355} {"train_loss": -35.346397399902344, "global_step": 42961, "epoch": 355} {"train_loss": -35.39153289794922, "global_step": 42962, "epoch": 355} {"train_loss": -35.27961730957031, "global_step": 42963, "epoch": 355} {"train_loss": -34.1416015625, "global_step": 42964, "epoch": 355} {"train_loss": -31.100040435791016, "global_step": 42965, "epoch": 355} {"train_loss": -23.28387451171875, "global_step": 42966, "epoch": 355} {"train_loss": -4.984822750091553, "global_step": 42967, "epoch": 355} {"train_loss": -14.383386611938477, "global_step": 42968, "epoch": 355} {"train_loss": -26.119094848632812, "global_step": 42969, "epoch": 355} {"train_loss": -24.835960388183594, "global_step": 42970, "epoch": 355} {"train_loss": -18.937732696533203, "global_step": 42971, "epoch": 355} {"train_loss": -16.482925415039062, "global_step": 42972, "epoch": 355} {"train_loss": -25.848495483398438, "global_step": 42973, "epoch": 355} {"train_loss": -23.649158477783203, "global_step": 42974, "epoch": 355} {"train_loss": -25.699766159057617, "global_step": 42975, "epoch": 355} {"train_loss": -31.59119987487793, "global_step": 42976, "epoch": 355} {"train_loss": -29.613605499267578, "global_step": 42977, "epoch": 355} {"train_loss": -29.396249771118164, "global_step": 42978, "epoch": 355} {"train_loss": -28.64312171936035, "global_step": 42979, "epoch": 355} {"train_loss": -29.195743560791016, "global_step": 42980, "epoch": 355} {"train_loss": -31.78252601623535, "global_step": 42981, "epoch": 355} {"train_loss": -31.3631591796875, "global_step": 42982, "epoch": 355} {"train_loss": -32.42511749267578, "global_step": 42983, "epoch": 355} {"train_loss": -31.62192153930664, "global_step": 42984, "epoch": 355} {"train_loss": -31.541311264038086, "global_step": 42985, "epoch": 355} {"train_loss": -31.901269912719727, "global_step": 42986, "epoch": 355} {"train_loss": -31.190454483032227, "global_step": 42987, "epoch": 355} {"train_loss": -31.684545516967773, "global_step": 42988, "epoch": 355} {"train_loss": -32.180580139160156, "global_step": 42989, "epoch": 355} {"train_loss": -31.962875366210938, "global_step": 42990, "epoch": 355} {"train_loss": -32.30080795288086, "global_step": 42991, "epoch": 355} {"train_loss": -32.28477096557617, "global_step": 42992, "epoch": 355} {"train_loss": -32.51179504394531, "global_step": 42993, "epoch": 355} {"train_loss": -32.493499755859375, "global_step": 42994, "epoch": 355} {"train_loss": -32.33626937866211, "global_step": 42995, "epoch": 355} {"train_loss": -32.82355880737305, "global_step": 42996, "epoch": 355} {"train_loss": -32.53126907348633, "global_step": 42997, "epoch": 355} {"train_loss": -32.651527404785156, "global_step": 42998, "epoch": 355} {"train_loss": -32.50032043457031, "global_step": 42999, "epoch": 355} {"train_loss": -32.39368438720703, "global_step": 43000, "epoch": 355} {"train_loss": -32.962432861328125, "global_step": 43001, "epoch": 355} {"train_loss": -32.5589599609375, "global_step": 43002, "epoch": 355} {"train_loss": -32.810096740722656, "global_step": 43003, "epoch": 355} {"train_loss": -32.86298370361328, "global_step": 43004, "epoch": 355} {"train_loss": -33.1152458190918, "global_step": 43005, "epoch": 355} {"train_loss": -33.175086975097656, "global_step": 43006, "epoch": 355} {"train_loss": -32.97578811645508, "global_step": 43007, "epoch": 355} {"train_loss": -33.40480041503906, "global_step": 43008, "epoch": 355} {"train_loss": -33.42597198486328, "global_step": 43009, "epoch": 355} {"train_loss": -33.36888885498047, "global_step": 43010, "epoch": 355} {"train_loss": -33.21465301513672, "global_step": 43011, "epoch": 355} {"train_loss": -33.668243408203125, "global_step": 43012, "epoch": 355} {"train_loss": -33.440006256103516, "global_step": 43013, "epoch": 355} {"train_loss": -33.49418640136719, "global_step": 43014, "epoch": 355} {"train_loss": -33.26774215698242, "global_step": 43015, "epoch": 355} {"train_loss": -33.54085922241211, "global_step": 43016, "epoch": 355} {"train_loss": -33.881343841552734, "global_step": 43017, "epoch": 355} {"train_loss": -33.70716094970703, "global_step": 43018, "epoch": 355} {"train_loss": -33.68047332763672, "global_step": 43019, "epoch": 355} {"train_loss": -33.56647872924805, "global_step": 43020, "epoch": 355} {"train_loss": -32.9862060546875, "global_step": 43021, "epoch": 355} {"train_loss": -33.54314041137695, "global_step": 43022, "epoch": 355} {"train_loss": -33.616512298583984, "global_step": 43023, "epoch": 355} {"train_loss": -33.656429290771484, "global_step": 43024, "epoch": 355} {"train_loss": -33.75551986694336, "global_step": 43025, "epoch": 355} {"train_loss": -34.01015853881836, "global_step": 43026, "epoch": 355} {"train_loss": -33.52775573730469, "global_step": 43027, "epoch": 355} {"train_loss": -33.7686653137207, "global_step": 43028, "epoch": 355} {"train_loss": -33.838191986083984, "global_step": 43029, "epoch": 355} {"train_loss": -33.70399856567383, "global_step": 43030, "epoch": 355} {"train_loss": -33.079345703125, "global_step": 43031, "epoch": 355} {"train_loss": -33.28622055053711, "global_step": 43032, "epoch": 355} {"train_loss": -32.68854904174805, "global_step": 43033, "epoch": 355} {"train_loss": -33.6288948059082, "global_step": 43034, "epoch": 355} {"train_loss": -33.814327239990234, "global_step": 43035, "epoch": 355} {"train_loss": -33.83277130126953, "global_step": 43036, "epoch": 355} {"train_loss": -34.17706298828125, "global_step": 43037, "epoch": 355} {"train_loss": -33.24142074584961, "global_step": 43038, "epoch": 355} {"train_loss": -33.17599105834961, "global_step": 43039, "epoch": 355} {"train_loss": -32.10691452026367, "global_step": 43040, "epoch": 355} {"train_loss": -30.620929718017578, "global_step": 43041, "epoch": 355} {"train_loss": -30.66705322265625, "global_step": 43042, "epoch": 355} {"train_loss": -29.687488555908203, "global_step": 43043, "epoch": 355} {"train_loss": -33.32699203491211, "global_step": 43044, "epoch": 355} {"train_loss": -33.01814270019531, "global_step": 43045, "epoch": 355} {"train_loss": -30.2540340423584, "global_step": 43046, "epoch": 355} {"train_loss": -32.28834915161133, "global_step": 43047, "epoch": 355} {"train_loss": -33.2432975769043, "global_step": 43048, "epoch": 355} {"train_loss": -32.80766296386719, "global_step": 43049, "epoch": 355} {"train_loss": -33.0712776184082, "global_step": 43050, "epoch": 355} {"train_loss": -33.7264289855957, "global_step": 43051, "epoch": 355} {"train_loss": -33.19094467163086, "global_step": 43052, "epoch": 355} {"train_loss": -33.18220901489258, "global_step": 43053, "epoch": 355} {"train_loss": -33.36906051635742, "global_step": 43054, "epoch": 355} {"train_loss": -32.921546936035156, "global_step": 43055, "epoch": 355} {"train_loss": -33.6257209777832, "global_step": 43056, "epoch": 355} {"train_loss": -33.4812126159668, "global_step": 43057, "epoch": 355} {"train_loss": -33.03944778442383, "global_step": 43058, "epoch": 355} {"train_loss": -33.80710983276367, "global_step": 43059, "epoch": 355} {"train_loss": -33.29975509643555, "global_step": 43060, "epoch": 355} {"train_loss": -33.593502044677734, "global_step": 43061, "epoch": 355} {"train_loss": -33.19721603393555, "global_step": 43062, "epoch": 355} {"train_loss": -33.82856369018555, "global_step": 43063, "epoch": 355} {"train_loss": -33.77793884277344, "global_step": 43064, "epoch": 355} {"train_loss": -33.515682220458984, "global_step": 43065, "epoch": 355} {"train_loss": -34.25893020629883, "global_step": 43066, "epoch": 355} {"train_loss": -33.82241439819336, "global_step": 43067, "epoch": 355} {"train_loss": -34.18561553955078, "global_step": 43068, "epoch": 355} {"train_loss": -33.54779052734375, "global_step": 43069, "epoch": 355} {"train_loss": -34.087398529052734, "global_step": 43070, "epoch": 355} {"train_loss": -34.17475509643555, "global_step": 43071, "epoch": 355} {"train_loss": -34.180397033691406, "global_step": 43072, "epoch": 355} {"train_loss": -33.972782135009766, "global_step": 43073, "epoch": 355} {"train_loss": -34.19275665283203, "global_step": 43074, "epoch": 355} {"train_loss": -32.031766335826276, "global_step": 43075, "epoch": 355, "val_loss": 2480983.75} {"train_loss": -33.88002395629883, "global_step": 43076, "epoch": 356} {"train_loss": -33.81254196166992, "global_step": 43077, "epoch": 356} {"train_loss": -34.14113998413086, "global_step": 43078, "epoch": 356} {"train_loss": -33.638267517089844, "global_step": 43079, "epoch": 356} {"train_loss": -34.15058135986328, "global_step": 43080, "epoch": 356} {"train_loss": -33.9775390625, "global_step": 43081, "epoch": 356} {"train_loss": -34.324073791503906, "global_step": 43082, "epoch": 356} {"train_loss": -34.32932662963867, "global_step": 43083, "epoch": 356} {"train_loss": -34.62184143066406, "global_step": 43084, "epoch": 356} {"train_loss": -34.46920394897461, "global_step": 43085, "epoch": 356} {"train_loss": -33.700531005859375, "global_step": 43086, "epoch": 356} {"train_loss": -34.128150939941406, "global_step": 43087, "epoch": 356} {"train_loss": -34.304344177246094, "global_step": 43088, "epoch": 356} {"train_loss": -32.496986389160156, "global_step": 43089, "epoch": 356} {"train_loss": -33.40088653564453, "global_step": 43090, "epoch": 356} {"train_loss": -32.97602081298828, "global_step": 43091, "epoch": 356} {"train_loss": -26.391584396362305, "global_step": 43092, "epoch": 356} {"train_loss": -25.827545166015625, "global_step": 43093, "epoch": 356} {"train_loss": -31.232269287109375, "global_step": 43094, "epoch": 356} {"train_loss": -33.138946533203125, "global_step": 43095, "epoch": 356} {"train_loss": -30.2720890045166, "global_step": 43096, "epoch": 356} {"train_loss": -34.309452056884766, "global_step": 43097, "epoch": 356} {"train_loss": -31.912403106689453, "global_step": 43098, "epoch": 356} {"train_loss": -35.07577896118164, "global_step": 43099, "epoch": 356} {"train_loss": -33.14122009277344, "global_step": 43100, "epoch": 356} {"train_loss": -33.986873626708984, "global_step": 43101, "epoch": 356} {"train_loss": -34.788917541503906, "global_step": 43102, "epoch": 356} {"train_loss": -34.21836853027344, "global_step": 43103, "epoch": 356} {"train_loss": -34.18501663208008, "global_step": 43104, "epoch": 356} {"train_loss": -33.69036102294922, "global_step": 43105, "epoch": 356} {"train_loss": -33.996063232421875, "global_step": 43106, "epoch": 356} {"train_loss": -33.69035339355469, "global_step": 43107, "epoch": 356} {"train_loss": -32.57646942138672, "global_step": 43108, "epoch": 356} {"train_loss": -32.61891555786133, "global_step": 43109, "epoch": 356} {"train_loss": -32.99496078491211, "global_step": 43110, "epoch": 356} {"train_loss": -32.669288635253906, "global_step": 43111, "epoch": 356} {"train_loss": -31.801044464111328, "global_step": 43112, "epoch": 356} {"train_loss": -30.215290069580078, "global_step": 43113, "epoch": 356} {"train_loss": -31.054336547851562, "global_step": 43114, "epoch": 356} {"train_loss": -28.02947998046875, "global_step": 43115, "epoch": 356} {"train_loss": -21.652082443237305, "global_step": 43116, "epoch": 356} {"train_loss": -22.801877975463867, "global_step": 43117, "epoch": 356} {"train_loss": -31.2279052734375, "global_step": 43118, "epoch": 356} {"train_loss": -28.808399200439453, "global_step": 43119, "epoch": 356} {"train_loss": -26.06064224243164, "global_step": 43120, "epoch": 356} {"train_loss": -32.585655212402344, "global_step": 43121, "epoch": 356} {"train_loss": -28.1707820892334, "global_step": 43122, "epoch": 356} {"train_loss": -32.64625930786133, "global_step": 43123, "epoch": 356} {"train_loss": -28.223453521728516, "global_step": 43124, "epoch": 356} {"train_loss": -30.45265769958496, "global_step": 43125, "epoch": 356} {"train_loss": -28.027021408081055, "global_step": 43126, "epoch": 356} {"train_loss": -31.879663467407227, "global_step": 43127, "epoch": 356} {"train_loss": -28.29668617248535, "global_step": 43128, "epoch": 356} {"train_loss": -30.11018180847168, "global_step": 43129, "epoch": 356} {"train_loss": -30.591772079467773, "global_step": 43130, "epoch": 356} {"train_loss": -28.717315673828125, "global_step": 43131, "epoch": 356} {"train_loss": -28.49875259399414, "global_step": 43132, "epoch": 356} {"train_loss": -29.860578536987305, "global_step": 43133, "epoch": 356} {"train_loss": -29.56671142578125, "global_step": 43134, "epoch": 356} {"train_loss": -31.88079261779785, "global_step": 43135, "epoch": 356} {"train_loss": -31.322778701782227, "global_step": 43136, "epoch": 356} {"train_loss": -30.382116317749023, "global_step": 43137, "epoch": 356} {"train_loss": -31.66012954711914, "global_step": 43138, "epoch": 356} {"train_loss": -30.964094161987305, "global_step": 43139, "epoch": 356} {"train_loss": -31.266372680664062, "global_step": 43140, "epoch": 356} {"train_loss": -31.133136749267578, "global_step": 43141, "epoch": 356} {"train_loss": -31.78411293029785, "global_step": 43142, "epoch": 356} {"train_loss": -31.929471969604492, "global_step": 43143, "epoch": 356} {"train_loss": -31.564054489135742, "global_step": 43144, "epoch": 356} {"train_loss": -32.089290618896484, "global_step": 43145, "epoch": 356} {"train_loss": -32.50175094604492, "global_step": 43146, "epoch": 356} {"train_loss": -32.144691467285156, "global_step": 43147, "epoch": 356} {"train_loss": -31.937246322631836, "global_step": 43148, "epoch": 356} {"train_loss": -32.07054901123047, "global_step": 43149, "epoch": 356} {"train_loss": -32.43125915527344, "global_step": 43150, "epoch": 356} {"train_loss": -32.208377838134766, "global_step": 43151, "epoch": 356} {"train_loss": -32.30451202392578, "global_step": 43152, "epoch": 356} {"train_loss": -32.638145446777344, "global_step": 43153, "epoch": 356} {"train_loss": -32.0079345703125, "global_step": 43154, "epoch": 356} {"train_loss": -32.44936752319336, "global_step": 43155, "epoch": 356} {"train_loss": -32.337921142578125, "global_step": 43156, "epoch": 356} {"train_loss": -32.71046829223633, "global_step": 43157, "epoch": 356} {"train_loss": -32.842506408691406, "global_step": 43158, "epoch": 356} {"train_loss": -33.24074935913086, "global_step": 43159, "epoch": 356} {"train_loss": -32.84420394897461, "global_step": 43160, "epoch": 356} {"train_loss": -32.8775520324707, "global_step": 43161, "epoch": 356} {"train_loss": -33.032894134521484, "global_step": 43162, "epoch": 356} {"train_loss": -33.46384811401367, "global_step": 43163, "epoch": 356} {"train_loss": -33.051734924316406, "global_step": 43164, "epoch": 356} {"train_loss": -33.06568145751953, "global_step": 43165, "epoch": 356} {"train_loss": -32.87975311279297, "global_step": 43166, "epoch": 356} {"train_loss": -33.6728630065918, "global_step": 43167, "epoch": 356} {"train_loss": -33.04865264892578, "global_step": 43168, "epoch": 356} {"train_loss": -33.55622482299805, "global_step": 43169, "epoch": 356} {"train_loss": -33.27081298828125, "global_step": 43170, "epoch": 356} {"train_loss": -33.44361877441406, "global_step": 43171, "epoch": 356} {"train_loss": -33.5299186706543, "global_step": 43172, "epoch": 356} {"train_loss": -33.604183197021484, "global_step": 43173, "epoch": 356} {"train_loss": -33.75515365600586, "global_step": 43174, "epoch": 356} {"train_loss": -33.34217834472656, "global_step": 43175, "epoch": 356} {"train_loss": -33.9676628112793, "global_step": 43176, "epoch": 356} {"train_loss": -33.99897384643555, "global_step": 43177, "epoch": 356} {"train_loss": -33.93833541870117, "global_step": 43178, "epoch": 356} {"train_loss": -33.90421676635742, "global_step": 43179, "epoch": 356} {"train_loss": -34.1418342590332, "global_step": 43180, "epoch": 356} {"train_loss": -34.2691535949707, "global_step": 43181, "epoch": 356} {"train_loss": -34.20991897583008, "global_step": 43182, "epoch": 356} {"train_loss": -34.40106964111328, "global_step": 43183, "epoch": 356} {"train_loss": -34.23818588256836, "global_step": 43184, "epoch": 356} {"train_loss": -33.96342086791992, "global_step": 43185, "epoch": 356} {"train_loss": -33.281009674072266, "global_step": 43186, "epoch": 356} {"train_loss": -31.946125030517578, "global_step": 43187, "epoch": 356} {"train_loss": -30.460737228393555, "global_step": 43188, "epoch": 356} {"train_loss": -28.845258712768555, "global_step": 43189, "epoch": 356} {"train_loss": -27.76797866821289, "global_step": 43190, "epoch": 356} {"train_loss": -32.28947830200195, "global_step": 43191, "epoch": 356} {"train_loss": -34.099239349365234, "global_step": 43192, "epoch": 356} {"train_loss": -31.631092071533203, "global_step": 43193, "epoch": 356} {"train_loss": -33.39740753173828, "global_step": 43194, "epoch": 356} {"train_loss": -33.56028366088867, "global_step": 43195, "epoch": 356} {"train_loss": -32.1170971137433, "global_step": 43196, "epoch": 356, "val_loss": 2444701.0} {"train_loss": -33.91986083984375, "global_step": 43197, "epoch": 357} {"train_loss": -32.59125900268555, "global_step": 43198, "epoch": 357} {"train_loss": -33.284915924072266, "global_step": 43199, "epoch": 357} {"train_loss": -33.661624908447266, "global_step": 43200, "epoch": 357} {"train_loss": -33.89482498168945, "global_step": 43201, "epoch": 357} {"train_loss": -32.562923431396484, "global_step": 43202, "epoch": 357} {"train_loss": -32.94591522216797, "global_step": 43203, "epoch": 357} {"train_loss": -33.306396484375, "global_step": 43204, "epoch": 357} {"train_loss": -31.835235595703125, "global_step": 43205, "epoch": 357} {"train_loss": -32.386627197265625, "global_step": 43206, "epoch": 357} {"train_loss": -33.9285888671875, "global_step": 43207, "epoch": 357} {"train_loss": -32.42366027832031, "global_step": 43208, "epoch": 357} {"train_loss": -31.4327449798584, "global_step": 43209, "epoch": 357} {"train_loss": -32.02630615234375, "global_step": 43210, "epoch": 357} {"train_loss": -31.238788604736328, "global_step": 43211, "epoch": 357} {"train_loss": -32.8065071105957, "global_step": 43212, "epoch": 357} {"train_loss": -33.507904052734375, "global_step": 43213, "epoch": 357} {"train_loss": -30.9281063079834, "global_step": 43214, "epoch": 357} {"train_loss": -32.039058685302734, "global_step": 43215, "epoch": 357} {"train_loss": -33.54092025756836, "global_step": 43216, "epoch": 357} {"train_loss": -32.6310920715332, "global_step": 43217, "epoch": 357} {"train_loss": -31.0633487701416, "global_step": 43218, "epoch": 357} {"train_loss": -33.1020393371582, "global_step": 43219, "epoch": 357} {"train_loss": -32.969703674316406, "global_step": 43220, "epoch": 357} {"train_loss": -32.70690155029297, "global_step": 43221, "epoch": 357} {"train_loss": -33.379234313964844, "global_step": 43222, "epoch": 357} {"train_loss": -32.810150146484375, "global_step": 43223, "epoch": 357} {"train_loss": -33.78853225708008, "global_step": 43224, "epoch": 357} {"train_loss": -33.554229736328125, "global_step": 43225, "epoch": 357} {"train_loss": -33.97787094116211, "global_step": 43226, "epoch": 357} {"train_loss": -33.633209228515625, "global_step": 43227, "epoch": 357} {"train_loss": -33.96738815307617, "global_step": 43228, "epoch": 357} {"train_loss": -34.28535079956055, "global_step": 43229, "epoch": 357} {"train_loss": -33.7630729675293, "global_step": 43230, "epoch": 357} {"train_loss": -34.10961151123047, "global_step": 43231, "epoch": 357} {"train_loss": -33.59406661987305, "global_step": 43232, "epoch": 357} {"train_loss": -34.239295959472656, "global_step": 43233, "epoch": 357} {"train_loss": -33.759071350097656, "global_step": 43234, "epoch": 357} {"train_loss": -33.557838439941406, "global_step": 43235, "epoch": 357} {"train_loss": -33.67940139770508, "global_step": 43236, "epoch": 357} {"train_loss": -34.28874588012695, "global_step": 43237, "epoch": 357} {"train_loss": -33.20503616333008, "global_step": 43238, "epoch": 357} {"train_loss": -33.99080276489258, "global_step": 43239, "epoch": 357} {"train_loss": -33.54981994628906, "global_step": 43240, "epoch": 357} {"train_loss": -33.06298828125, "global_step": 43241, "epoch": 357} {"train_loss": -32.895790100097656, "global_step": 43242, "epoch": 357} {"train_loss": -33.35893249511719, "global_step": 43243, "epoch": 357} {"train_loss": -33.691200256347656, "global_step": 43244, "epoch": 357} {"train_loss": -34.11077117919922, "global_step": 43245, "epoch": 357} {"train_loss": -33.75836181640625, "global_step": 43246, "epoch": 357} {"train_loss": -34.27839660644531, "global_step": 43247, "epoch": 357} {"train_loss": -33.90616989135742, "global_step": 43248, "epoch": 357} {"train_loss": -34.61503982543945, "global_step": 43249, "epoch": 357} {"train_loss": -33.851436614990234, "global_step": 43250, "epoch": 357} {"train_loss": -33.988677978515625, "global_step": 43251, "epoch": 357} {"train_loss": -34.26082229614258, "global_step": 43252, "epoch": 357} {"train_loss": -34.51824951171875, "global_step": 43253, "epoch": 357} {"train_loss": -34.1749267578125, "global_step": 43254, "epoch": 357} {"train_loss": -34.056453704833984, "global_step": 43255, "epoch": 357} {"train_loss": -34.68513107299805, "global_step": 43256, "epoch": 357} {"train_loss": -34.898536682128906, "global_step": 43257, "epoch": 357} {"train_loss": -34.579402923583984, "global_step": 43258, "epoch": 357} {"train_loss": -34.70061111450195, "global_step": 43259, "epoch": 357} {"train_loss": -34.4533576965332, "global_step": 43260, "epoch": 357} {"train_loss": -34.648983001708984, "global_step": 43261, "epoch": 357} {"train_loss": -34.9580192565918, "global_step": 43262, "epoch": 357} {"train_loss": -34.62480163574219, "global_step": 43263, "epoch": 357} {"train_loss": -34.8773078918457, "global_step": 43264, "epoch": 357} {"train_loss": -34.26188278198242, "global_step": 43265, "epoch": 357} {"train_loss": -34.614540100097656, "global_step": 43266, "epoch": 357} {"train_loss": -34.55977249145508, "global_step": 43267, "epoch": 357} {"train_loss": -35.05946350097656, "global_step": 43268, "epoch": 357} {"train_loss": -34.979923248291016, "global_step": 43269, "epoch": 357} {"train_loss": -35.141456604003906, "global_step": 43270, "epoch": 357} {"train_loss": -35.14143371582031, "global_step": 43271, "epoch": 357} {"train_loss": -34.95023727416992, "global_step": 43272, "epoch": 357} {"train_loss": -35.14807891845703, "global_step": 43273, "epoch": 357} {"train_loss": -34.99440383911133, "global_step": 43274, "epoch": 357} {"train_loss": -35.03580856323242, "global_step": 43275, "epoch": 357} {"train_loss": -35.13290023803711, "global_step": 43276, "epoch": 357} {"train_loss": -34.6888427734375, "global_step": 43277, "epoch": 357} {"train_loss": -35.28664016723633, "global_step": 43278, "epoch": 357} {"train_loss": -35.11899948120117, "global_step": 43279, "epoch": 357} {"train_loss": -35.13443374633789, "global_step": 43280, "epoch": 357} {"train_loss": -35.43940353393555, "global_step": 43281, "epoch": 357} {"train_loss": -35.53129959106445, "global_step": 43282, "epoch": 357} {"train_loss": -34.98767852783203, "global_step": 43283, "epoch": 357} {"train_loss": -34.80318832397461, "global_step": 43284, "epoch": 357} {"train_loss": -34.99659729003906, "global_step": 43285, "epoch": 357} {"train_loss": -35.34413528442383, "global_step": 43286, "epoch": 357} {"train_loss": -34.98651885986328, "global_step": 43287, "epoch": 357} {"train_loss": -34.259735107421875, "global_step": 43288, "epoch": 357} {"train_loss": -34.96900177001953, "global_step": 43289, "epoch": 357} {"train_loss": -35.21038055419922, "global_step": 43290, "epoch": 357} {"train_loss": -34.73403549194336, "global_step": 43291, "epoch": 357} {"train_loss": -34.12422561645508, "global_step": 43292, "epoch": 357} {"train_loss": -34.8559684753418, "global_step": 43293, "epoch": 357} {"train_loss": -34.435970306396484, "global_step": 43294, "epoch": 357} {"train_loss": -34.108097076416016, "global_step": 43295, "epoch": 357} {"train_loss": -35.01157760620117, "global_step": 43296, "epoch": 357} {"train_loss": -34.82351303100586, "global_step": 43297, "epoch": 357} {"train_loss": -34.65191650390625, "global_step": 43298, "epoch": 357} {"train_loss": -33.698585510253906, "global_step": 43299, "epoch": 357} {"train_loss": -33.867164611816406, "global_step": 43300, "epoch": 357} {"train_loss": -33.137386322021484, "global_step": 43301, "epoch": 357} {"train_loss": -33.203460693359375, "global_step": 43302, "epoch": 357} {"train_loss": -33.457576751708984, "global_step": 43303, "epoch": 357} {"train_loss": -32.84739685058594, "global_step": 43304, "epoch": 357} {"train_loss": -32.78946304321289, "global_step": 43305, "epoch": 357} {"train_loss": -34.82099151611328, "global_step": 43306, "epoch": 357} {"train_loss": -34.00889587402344, "global_step": 43307, "epoch": 357} {"train_loss": -33.663909912109375, "global_step": 43308, "epoch": 357} {"train_loss": -34.75663375854492, "global_step": 43309, "epoch": 357} {"train_loss": -32.90146255493164, "global_step": 43310, "epoch": 357} {"train_loss": -34.24050521850586, "global_step": 43311, "epoch": 357} {"train_loss": -33.375118255615234, "global_step": 43312, "epoch": 357} {"train_loss": -32.49755096435547, "global_step": 43313, "epoch": 357} {"train_loss": -32.63029861450195, "global_step": 43314, "epoch": 357} {"train_loss": -33.6241340637207, "global_step": 43315, "epoch": 357} {"train_loss": -33.34011459350586, "global_step": 43316, "epoch": 357} {"train_loss": -33.89851844409281, "global_step": 43317, "epoch": 357, "val_loss": 2519907.25} {"train_loss": -34.45690155029297, "global_step": 43318, "epoch": 358} {"train_loss": -33.28942108154297, "global_step": 43319, "epoch": 358} {"train_loss": -34.28651809692383, "global_step": 43320, "epoch": 358} {"train_loss": -33.83370590209961, "global_step": 43321, "epoch": 358} {"train_loss": -34.03193283081055, "global_step": 43322, "epoch": 358} {"train_loss": -32.469970703125, "global_step": 43323, "epoch": 358} {"train_loss": -34.04155349731445, "global_step": 43324, "epoch": 358} {"train_loss": -33.88944625854492, "global_step": 43325, "epoch": 358} {"train_loss": -32.6386604309082, "global_step": 43326, "epoch": 358} {"train_loss": -26.565832138061523, "global_step": 43327, "epoch": 358} {"train_loss": -32.668365478515625, "global_step": 43328, "epoch": 358} {"train_loss": -33.25068283081055, "global_step": 43329, "epoch": 358} {"train_loss": -32.42593765258789, "global_step": 43330, "epoch": 358} {"train_loss": -32.559627532958984, "global_step": 43331, "epoch": 358} {"train_loss": -32.49831008911133, "global_step": 43332, "epoch": 358} {"train_loss": -32.07734298706055, "global_step": 43333, "epoch": 358} {"train_loss": -32.42361068725586, "global_step": 43334, "epoch": 358} {"train_loss": -33.1636962890625, "global_step": 43335, "epoch": 358} {"train_loss": -31.468570709228516, "global_step": 43336, "epoch": 358} {"train_loss": -32.68596267700195, "global_step": 43337, "epoch": 358} {"train_loss": -32.691619873046875, "global_step": 43338, "epoch": 358} {"train_loss": -33.52768325805664, "global_step": 43339, "epoch": 358} {"train_loss": -33.745635986328125, "global_step": 43340, "epoch": 358} {"train_loss": -30.339139938354492, "global_step": 43341, "epoch": 358} {"train_loss": -31.3834285736084, "global_step": 43342, "epoch": 358} {"train_loss": -32.60519790649414, "global_step": 43343, "epoch": 358} {"train_loss": -32.8893928527832, "global_step": 43344, "epoch": 358} {"train_loss": -32.84404373168945, "global_step": 43345, "epoch": 358} {"train_loss": -33.09731674194336, "global_step": 43346, "epoch": 358} {"train_loss": -33.760555267333984, "global_step": 43347, "epoch": 358} {"train_loss": -33.31499481201172, "global_step": 43348, "epoch": 358} {"train_loss": -33.383453369140625, "global_step": 43349, "epoch": 358} {"train_loss": -33.435890197753906, "global_step": 43350, "epoch": 358} {"train_loss": -33.655189514160156, "global_step": 43351, "epoch": 358} {"train_loss": -34.32419967651367, "global_step": 43352, "epoch": 358} {"train_loss": -33.378902435302734, "global_step": 43353, "epoch": 358} {"train_loss": -33.154476165771484, "global_step": 43354, "epoch": 358} {"train_loss": -33.917236328125, "global_step": 43355, "epoch": 358} {"train_loss": -34.14101028442383, "global_step": 43356, "epoch": 358} {"train_loss": -33.906654357910156, "global_step": 43357, "epoch": 358} {"train_loss": -34.30107498168945, "global_step": 43358, "epoch": 358} {"train_loss": -34.03091049194336, "global_step": 43359, "epoch": 358} {"train_loss": -34.155033111572266, "global_step": 43360, "epoch": 358} {"train_loss": -33.8217887878418, "global_step": 43361, "epoch": 358} {"train_loss": -33.999324798583984, "global_step": 43362, "epoch": 358} {"train_loss": -33.74531173706055, "global_step": 43363, "epoch": 358} {"train_loss": -34.39376449584961, "global_step": 43364, "epoch": 358} {"train_loss": -33.440547943115234, "global_step": 43365, "epoch": 358} {"train_loss": -34.31014633178711, "global_step": 43366, "epoch": 358} {"train_loss": -34.39601135253906, "global_step": 43367, "epoch": 358} {"train_loss": -34.36684799194336, "global_step": 43368, "epoch": 358} {"train_loss": -34.124000549316406, "global_step": 43369, "epoch": 358} {"train_loss": -34.495582580566406, "global_step": 43370, "epoch": 358} {"train_loss": -34.542171478271484, "global_step": 43371, "epoch": 358} {"train_loss": -34.12738037109375, "global_step": 43372, "epoch": 358} {"train_loss": -34.80796813964844, "global_step": 43373, "epoch": 358} {"train_loss": -34.174800872802734, "global_step": 43374, "epoch": 358} {"train_loss": -34.89451217651367, "global_step": 43375, "epoch": 358} {"train_loss": -34.00016403198242, "global_step": 43376, "epoch": 358} {"train_loss": -34.80674362182617, "global_step": 43377, "epoch": 358} {"train_loss": -34.970008850097656, "global_step": 43378, "epoch": 358} {"train_loss": -34.38886642456055, "global_step": 43379, "epoch": 358} {"train_loss": -33.9525146484375, "global_step": 43380, "epoch": 358} {"train_loss": -34.40373992919922, "global_step": 43381, "epoch": 358} {"train_loss": -34.80482482910156, "global_step": 43382, "epoch": 358} {"train_loss": -34.920135498046875, "global_step": 43383, "epoch": 358} {"train_loss": -34.8549690246582, "global_step": 43384, "epoch": 358} {"train_loss": -34.776405334472656, "global_step": 43385, "epoch": 358} {"train_loss": -34.627132415771484, "global_step": 43386, "epoch": 358} {"train_loss": -34.86912155151367, "global_step": 43387, "epoch": 358} {"train_loss": -34.974300384521484, "global_step": 43388, "epoch": 358} {"train_loss": -34.009029388427734, "global_step": 43389, "epoch": 358} {"train_loss": -31.879663467407227, "global_step": 43390, "epoch": 358} {"train_loss": -33.662044525146484, "global_step": 43391, "epoch": 358} {"train_loss": -33.45468521118164, "global_step": 43392, "epoch": 358} {"train_loss": -33.329505920410156, "global_step": 43393, "epoch": 358} {"train_loss": -34.951690673828125, "global_step": 43394, "epoch": 358} {"train_loss": -35.13008499145508, "global_step": 43395, "epoch": 358} {"train_loss": -34.428550720214844, "global_step": 43396, "epoch": 358} {"train_loss": -34.0065803527832, "global_step": 43397, "epoch": 358} {"train_loss": -35.10493087768555, "global_step": 43398, "epoch": 358} {"train_loss": -35.64023971557617, "global_step": 43399, "epoch": 358} {"train_loss": -34.579524993896484, "global_step": 43400, "epoch": 358} {"train_loss": -34.986854553222656, "global_step": 43401, "epoch": 358} {"train_loss": -35.11104202270508, "global_step": 43402, "epoch": 358} {"train_loss": -35.680049896240234, "global_step": 43403, "epoch": 358} {"train_loss": -35.10588455200195, "global_step": 43404, "epoch": 358} {"train_loss": -34.741817474365234, "global_step": 43405, "epoch": 358} {"train_loss": -34.928924560546875, "global_step": 43406, "epoch": 358} {"train_loss": -35.42609405517578, "global_step": 43407, "epoch": 358} {"train_loss": -34.740562438964844, "global_step": 43408, "epoch": 358} {"train_loss": -34.635108947753906, "global_step": 43409, "epoch": 358} {"train_loss": -34.92493438720703, "global_step": 43410, "epoch": 358} {"train_loss": -34.74309539794922, "global_step": 43411, "epoch": 358} {"train_loss": -35.44301986694336, "global_step": 43412, "epoch": 358} {"train_loss": -35.360225677490234, "global_step": 43413, "epoch": 358} {"train_loss": -35.04852294921875, "global_step": 43414, "epoch": 358} {"train_loss": -35.42622756958008, "global_step": 43415, "epoch": 358} {"train_loss": -34.916717529296875, "global_step": 43416, "epoch": 358} {"train_loss": -35.06431198120117, "global_step": 43417, "epoch": 358} {"train_loss": -34.905494689941406, "global_step": 43418, "epoch": 358} {"train_loss": -34.341800689697266, "global_step": 43419, "epoch": 358} {"train_loss": -32.553218841552734, "global_step": 43420, "epoch": 358} {"train_loss": -33.8927116394043, "global_step": 43421, "epoch": 358} {"train_loss": -33.267852783203125, "global_step": 43422, "epoch": 358} {"train_loss": -30.404752731323242, "global_step": 43423, "epoch": 358} {"train_loss": -34.96135330200195, "global_step": 43424, "epoch": 358} {"train_loss": -35.164546966552734, "global_step": 43425, "epoch": 358} {"train_loss": -33.67258834838867, "global_step": 43426, "epoch": 358} {"train_loss": -30.710851669311523, "global_step": 43427, "epoch": 358} {"train_loss": -34.86918258666992, "global_step": 43428, "epoch": 358} {"train_loss": -32.34741973876953, "global_step": 43429, "epoch": 358} {"train_loss": -32.15946578979492, "global_step": 43430, "epoch": 358} {"train_loss": -32.59865951538086, "global_step": 43431, "epoch": 358} {"train_loss": -32.572139739990234, "global_step": 43432, "epoch": 358} {"train_loss": -32.3148078918457, "global_step": 43433, "epoch": 358} {"train_loss": -33.30125045776367, "global_step": 43434, "epoch": 358} {"train_loss": -32.326961517333984, "global_step": 43435, "epoch": 358} {"train_loss": -34.11236572265625, "global_step": 43436, "epoch": 358} {"train_loss": -33.488887786865234, "global_step": 43437, "epoch": 358} {"train_loss": -33.78020534042484, "global_step": 43438, "epoch": 358, "val_loss": 2615409.0} {"train_loss": -34.03483200073242, "global_step": 43439, "epoch": 359} {"train_loss": -32.1138916015625, "global_step": 43440, "epoch": 359} {"train_loss": -33.55751037597656, "global_step": 43441, "epoch": 359} {"train_loss": -31.996118545532227, "global_step": 43442, "epoch": 359} {"train_loss": -34.0322380065918, "global_step": 43443, "epoch": 359} {"train_loss": -30.728912353515625, "global_step": 43444, "epoch": 359} {"train_loss": -30.8510684967041, "global_step": 43445, "epoch": 359} {"train_loss": -31.642663955688477, "global_step": 43446, "epoch": 359} {"train_loss": -31.873865127563477, "global_step": 43447, "epoch": 359} {"train_loss": -31.489755630493164, "global_step": 43448, "epoch": 359} {"train_loss": -31.179594039916992, "global_step": 43449, "epoch": 359} {"train_loss": -29.65445327758789, "global_step": 43450, "epoch": 359} {"train_loss": -31.514760971069336, "global_step": 43451, "epoch": 359} {"train_loss": -31.662626266479492, "global_step": 43452, "epoch": 359} {"train_loss": -32.71336364746094, "global_step": 43453, "epoch": 359} {"train_loss": -33.54874801635742, "global_step": 43454, "epoch": 359} {"train_loss": -33.22216033935547, "global_step": 43455, "epoch": 359} {"train_loss": -32.22821044921875, "global_step": 43456, "epoch": 359} {"train_loss": -33.41726303100586, "global_step": 43457, "epoch": 359} {"train_loss": -33.48421859741211, "global_step": 43458, "epoch": 359} {"train_loss": -33.70539474487305, "global_step": 43459, "epoch": 359} {"train_loss": -33.5273551940918, "global_step": 43460, "epoch": 359} {"train_loss": -33.26615524291992, "global_step": 43461, "epoch": 359} {"train_loss": -34.23154830932617, "global_step": 43462, "epoch": 359} {"train_loss": -33.974578857421875, "global_step": 43463, "epoch": 359} {"train_loss": -34.228702545166016, "global_step": 43464, "epoch": 359} {"train_loss": -34.0330696105957, "global_step": 43465, "epoch": 359} {"train_loss": -34.32143783569336, "global_step": 43466, "epoch": 359} {"train_loss": -34.78622055053711, "global_step": 43467, "epoch": 359} {"train_loss": -34.65806198120117, "global_step": 43468, "epoch": 359} {"train_loss": -34.13203430175781, "global_step": 43469, "epoch": 359} {"train_loss": -34.3326301574707, "global_step": 43470, "epoch": 359} {"train_loss": -33.99155807495117, "global_step": 43471, "epoch": 359} {"train_loss": -34.64298629760742, "global_step": 43472, "epoch": 359} {"train_loss": -34.36055374145508, "global_step": 43473, "epoch": 359} {"train_loss": -34.35805892944336, "global_step": 43474, "epoch": 359} {"train_loss": -34.29276657104492, "global_step": 43475, "epoch": 359} {"train_loss": -34.10818099975586, "global_step": 43476, "epoch": 359} {"train_loss": -33.44517135620117, "global_step": 43477, "epoch": 359} {"train_loss": -32.929988861083984, "global_step": 43478, "epoch": 359} {"train_loss": -34.73008728027344, "global_step": 43479, "epoch": 359} {"train_loss": -34.466094970703125, "global_step": 43480, "epoch": 359} {"train_loss": -34.72119140625, "global_step": 43481, "epoch": 359} {"train_loss": -34.426395416259766, "global_step": 43482, "epoch": 359} {"train_loss": -34.09828567504883, "global_step": 43483, "epoch": 359} {"train_loss": -33.80402755737305, "global_step": 43484, "epoch": 359} {"train_loss": -33.53306198120117, "global_step": 43485, "epoch": 359} {"train_loss": -34.30682373046875, "global_step": 43486, "epoch": 359} {"train_loss": -35.06051254272461, "global_step": 43487, "epoch": 359} {"train_loss": -34.855953216552734, "global_step": 43488, "epoch": 359} {"train_loss": -34.1580810546875, "global_step": 43489, "epoch": 359} {"train_loss": -35.17947006225586, "global_step": 43490, "epoch": 359} {"train_loss": -34.7781867980957, "global_step": 43491, "epoch": 359} {"train_loss": -33.688392639160156, "global_step": 43492, "epoch": 359} {"train_loss": -33.757362365722656, "global_step": 43493, "epoch": 359} {"train_loss": -34.74050521850586, "global_step": 43494, "epoch": 359} {"train_loss": -35.07762908935547, "global_step": 43495, "epoch": 359} {"train_loss": -34.14303207397461, "global_step": 43496, "epoch": 359} {"train_loss": -34.671539306640625, "global_step": 43497, "epoch": 359} {"train_loss": -35.13418197631836, "global_step": 43498, "epoch": 359} {"train_loss": -34.8848876953125, "global_step": 43499, "epoch": 359} {"train_loss": -34.4809455871582, "global_step": 43500, "epoch": 359} {"train_loss": -34.8291130065918, "global_step": 43501, "epoch": 359} {"train_loss": -34.7739372253418, "global_step": 43502, "epoch": 359} {"train_loss": -34.896392822265625, "global_step": 43503, "epoch": 359} {"train_loss": -35.54287338256836, "global_step": 43504, "epoch": 359} {"train_loss": -35.11487579345703, "global_step": 43505, "epoch": 359} {"train_loss": -35.644466400146484, "global_step": 43506, "epoch": 359} {"train_loss": -35.31844711303711, "global_step": 43507, "epoch": 359} {"train_loss": -35.47631072998047, "global_step": 43508, "epoch": 359} {"train_loss": -35.51648712158203, "global_step": 43509, "epoch": 359} {"train_loss": -34.93495559692383, "global_step": 43510, "epoch": 359} {"train_loss": -34.75501251220703, "global_step": 43511, "epoch": 359} {"train_loss": -35.26682662963867, "global_step": 43512, "epoch": 359} {"train_loss": -34.594390869140625, "global_step": 43513, "epoch": 359} {"train_loss": -34.694759368896484, "global_step": 43514, "epoch": 359} {"train_loss": -34.257667541503906, "global_step": 43515, "epoch": 359} {"train_loss": -34.192386627197266, "global_step": 43516, "epoch": 359} {"train_loss": -34.71406936645508, "global_step": 43517, "epoch": 359} {"train_loss": -35.23476791381836, "global_step": 43518, "epoch": 359} {"train_loss": -34.228912353515625, "global_step": 43519, "epoch": 359} {"train_loss": -34.3358154296875, "global_step": 43520, "epoch": 359} {"train_loss": -32.96014404296875, "global_step": 43521, "epoch": 359} {"train_loss": -34.97943115234375, "global_step": 43522, "epoch": 359} {"train_loss": -35.03379440307617, "global_step": 43523, "epoch": 359} {"train_loss": -33.17195510864258, "global_step": 43524, "epoch": 359} {"train_loss": -34.90366744995117, "global_step": 43525, "epoch": 359} {"train_loss": -35.89809799194336, "global_step": 43526, "epoch": 359} {"train_loss": -34.07588195800781, "global_step": 43527, "epoch": 359} {"train_loss": -34.04631042480469, "global_step": 43528, "epoch": 359} {"train_loss": -35.01620101928711, "global_step": 43529, "epoch": 359} {"train_loss": -33.90594482421875, "global_step": 43530, "epoch": 359} {"train_loss": -31.931732177734375, "global_step": 43531, "epoch": 359} {"train_loss": -34.53992462158203, "global_step": 43532, "epoch": 359} {"train_loss": -33.280452728271484, "global_step": 43533, "epoch": 359} {"train_loss": -30.330724716186523, "global_step": 43534, "epoch": 359} {"train_loss": -28.95560646057129, "global_step": 43535, "epoch": 359} {"train_loss": -26.707921981811523, "global_step": 43536, "epoch": 359} {"train_loss": -16.050857543945312, "global_step": 43537, "epoch": 359} {"train_loss": -21.608266830444336, "global_step": 43538, "epoch": 359} {"train_loss": -2.6129722595214844, "global_step": 43539, "epoch": 359} {"train_loss": -29.559635162353516, "global_step": 43540, "epoch": 359} {"train_loss": -19.75726318359375, "global_step": 43541, "epoch": 359} {"train_loss": -27.454334259033203, "global_step": 43542, "epoch": 359} {"train_loss": -27.03700065612793, "global_step": 43543, "epoch": 359} {"train_loss": -26.170425415039062, "global_step": 43544, "epoch": 359} {"train_loss": -26.586511611938477, "global_step": 43545, "epoch": 359} {"train_loss": -27.353321075439453, "global_step": 43546, "epoch": 359} {"train_loss": -24.584148406982422, "global_step": 43547, "epoch": 359} {"train_loss": -28.425861358642578, "global_step": 43548, "epoch": 359} {"train_loss": -26.920734405517578, "global_step": 43549, "epoch": 359} {"train_loss": -28.23453712463379, "global_step": 43550, "epoch": 359} {"train_loss": -27.99648094177246, "global_step": 43551, "epoch": 359} {"train_loss": -28.67725944519043, "global_step": 43552, "epoch": 359} {"train_loss": -29.618061065673828, "global_step": 43553, "epoch": 359} {"train_loss": -29.395925521850586, "global_step": 43554, "epoch": 359} {"train_loss": -29.294082641601562, "global_step": 43555, "epoch": 359} {"train_loss": -29.902936935424805, "global_step": 43556, "epoch": 359} {"train_loss": -29.983667373657227, "global_step": 43557, "epoch": 359} {"train_loss": -30.1348934173584, "global_step": 43558, "epoch": 359} {"train_loss": -32.312699420393, "global_step": 43559, "epoch": 359, "val_loss": 2599654.25} {"train_loss": -30.09368896484375, "global_step": 43560, "epoch": 360} {"train_loss": -29.94524574279785, "global_step": 43561, "epoch": 360} {"train_loss": -30.941762924194336, "global_step": 43562, "epoch": 360} {"train_loss": -30.511274337768555, "global_step": 43563, "epoch": 360} {"train_loss": -31.037988662719727, "global_step": 43564, "epoch": 360} {"train_loss": -30.95399284362793, "global_step": 43565, "epoch": 360} {"train_loss": -31.24643898010254, "global_step": 43566, "epoch": 360} {"train_loss": -31.127395629882812, "global_step": 43567, "epoch": 360} {"train_loss": -32.038970947265625, "global_step": 43568, "epoch": 360} {"train_loss": -31.58455467224121, "global_step": 43569, "epoch": 360} {"train_loss": -31.702011108398438, "global_step": 43570, "epoch": 360} {"train_loss": -32.04902267456055, "global_step": 43571, "epoch": 360} {"train_loss": -31.932373046875, "global_step": 43572, "epoch": 360} {"train_loss": -32.29431915283203, "global_step": 43573, "epoch": 360} {"train_loss": -32.506832122802734, "global_step": 43574, "epoch": 360} {"train_loss": -32.65412521362305, "global_step": 43575, "epoch": 360} {"train_loss": -32.809696197509766, "global_step": 43576, "epoch": 360} {"train_loss": -32.62495040893555, "global_step": 43577, "epoch": 360} {"train_loss": -32.84693145751953, "global_step": 43578, "epoch": 360} {"train_loss": -33.0613899230957, "global_step": 43579, "epoch": 360} {"train_loss": -32.81399917602539, "global_step": 43580, "epoch": 360} {"train_loss": -33.10404586791992, "global_step": 43581, "epoch": 360} {"train_loss": -33.400115966796875, "global_step": 43582, "epoch": 360} {"train_loss": -33.416866302490234, "global_step": 43583, "epoch": 360} {"train_loss": -33.31903076171875, "global_step": 43584, "epoch": 360} {"train_loss": -33.68943405151367, "global_step": 43585, "epoch": 360} {"train_loss": -33.707210540771484, "global_step": 43586, "epoch": 360} {"train_loss": -33.75099563598633, "global_step": 43587, "epoch": 360} {"train_loss": -33.855159759521484, "global_step": 43588, "epoch": 360} {"train_loss": -33.862457275390625, "global_step": 43589, "epoch": 360} {"train_loss": -33.94491195678711, "global_step": 43590, "epoch": 360} {"train_loss": -34.14085006713867, "global_step": 43591, "epoch": 360} {"train_loss": -34.49684524536133, "global_step": 43592, "epoch": 360} {"train_loss": -34.1506462097168, "global_step": 43593, "epoch": 360} {"train_loss": -34.39516067504883, "global_step": 43594, "epoch": 360} {"train_loss": -34.11091995239258, "global_step": 43595, "epoch": 360} {"train_loss": -34.24641418457031, "global_step": 43596, "epoch": 360} {"train_loss": -34.531105041503906, "global_step": 43597, "epoch": 360} {"train_loss": -34.533302307128906, "global_step": 43598, "epoch": 360} {"train_loss": -33.92817306518555, "global_step": 43599, "epoch": 360} {"train_loss": -33.543155670166016, "global_step": 43600, "epoch": 360} {"train_loss": -34.020015716552734, "global_step": 43601, "epoch": 360} {"train_loss": -34.57874298095703, "global_step": 43602, "epoch": 360} {"train_loss": -34.26423263549805, "global_step": 43603, "epoch": 360} {"train_loss": -34.41219711303711, "global_step": 43604, "epoch": 360} {"train_loss": -34.63492965698242, "global_step": 43605, "epoch": 360} {"train_loss": -34.608436584472656, "global_step": 43606, "epoch": 360} {"train_loss": -34.22121047973633, "global_step": 43607, "epoch": 360} {"train_loss": -34.350860595703125, "global_step": 43608, "epoch": 360} {"train_loss": -34.02357482910156, "global_step": 43609, "epoch": 360} {"train_loss": -30.81654167175293, "global_step": 43610, "epoch": 360} {"train_loss": -18.922897338867188, "global_step": 43611, "epoch": 360} {"train_loss": 6.5245680809021, "global_step": 43612, "epoch": 360} {"train_loss": -19.565534591674805, "global_step": 43613, "epoch": 360} {"train_loss": -22.7115478515625, "global_step": 43614, "epoch": 360} {"train_loss": -27.027729034423828, "global_step": 43615, "epoch": 360} {"train_loss": -24.07754898071289, "global_step": 43616, "epoch": 360} {"train_loss": -31.451581954956055, "global_step": 43617, "epoch": 360} {"train_loss": -25.787012100219727, "global_step": 43618, "epoch": 360} {"train_loss": -30.352893829345703, "global_step": 43619, "epoch": 360} {"train_loss": -31.148096084594727, "global_step": 43620, "epoch": 360} {"train_loss": -29.201953887939453, "global_step": 43621, "epoch": 360} {"train_loss": -32.26084518432617, "global_step": 43622, "epoch": 360} {"train_loss": -30.718469619750977, "global_step": 43623, "epoch": 360} {"train_loss": -29.99322509765625, "global_step": 43624, "epoch": 360} {"train_loss": -31.578617095947266, "global_step": 43625, "epoch": 360} {"train_loss": -33.18098068237305, "global_step": 43626, "epoch": 360} {"train_loss": -32.00947952270508, "global_step": 43627, "epoch": 360} {"train_loss": -31.66952896118164, "global_step": 43628, "epoch": 360} {"train_loss": -31.80330467224121, "global_step": 43629, "epoch": 360} {"train_loss": -32.703590393066406, "global_step": 43630, "epoch": 360} {"train_loss": -32.12494659423828, "global_step": 43631, "epoch": 360} {"train_loss": -32.41371536254883, "global_step": 43632, "epoch": 360} {"train_loss": -32.72755813598633, "global_step": 43633, "epoch": 360} {"train_loss": -32.65647506713867, "global_step": 43634, "epoch": 360} {"train_loss": -32.752197265625, "global_step": 43635, "epoch": 360} {"train_loss": -32.693572998046875, "global_step": 43636, "epoch": 360} {"train_loss": -32.916656494140625, "global_step": 43637, "epoch": 360} {"train_loss": -33.3394889831543, "global_step": 43638, "epoch": 360} {"train_loss": -33.123661041259766, "global_step": 43639, "epoch": 360} {"train_loss": -33.374114990234375, "global_step": 43640, "epoch": 360} {"train_loss": -33.05451583862305, "global_step": 43641, "epoch": 360} {"train_loss": -33.37321090698242, "global_step": 43642, "epoch": 360} {"train_loss": -33.246620178222656, "global_step": 43643, "epoch": 360} {"train_loss": -33.13582992553711, "global_step": 43644, "epoch": 360} {"train_loss": -33.15558624267578, "global_step": 43645, "epoch": 360} {"train_loss": -33.64719772338867, "global_step": 43646, "epoch": 360} {"train_loss": -33.297821044921875, "global_step": 43647, "epoch": 360} {"train_loss": -33.76877975463867, "global_step": 43648, "epoch": 360} {"train_loss": -33.27101516723633, "global_step": 43649, "epoch": 360} {"train_loss": -33.581050872802734, "global_step": 43650, "epoch": 360} {"train_loss": -33.87185287475586, "global_step": 43651, "epoch": 360} {"train_loss": -33.965965270996094, "global_step": 43652, "epoch": 360} {"train_loss": -34.05410385131836, "global_step": 43653, "epoch": 360} {"train_loss": -33.86774826049805, "global_step": 43654, "epoch": 360} {"train_loss": -33.87968444824219, "global_step": 43655, "epoch": 360} {"train_loss": -34.11321258544922, "global_step": 43656, "epoch": 360} {"train_loss": -34.023311614990234, "global_step": 43657, "epoch": 360} {"train_loss": -34.434715270996094, "global_step": 43658, "epoch": 360} {"train_loss": -34.051570892333984, "global_step": 43659, "epoch": 360} {"train_loss": -33.86990737915039, "global_step": 43660, "epoch": 360} {"train_loss": -32.924564361572266, "global_step": 43661, "epoch": 360} {"train_loss": -31.62076759338379, "global_step": 43662, "epoch": 360} {"train_loss": -28.811481475830078, "global_step": 43663, "epoch": 360} {"train_loss": -19.87465476989746, "global_step": 43664, "epoch": 360} {"train_loss": -13.625389099121094, "global_step": 43665, "epoch": 360} {"train_loss": -25.161518096923828, "global_step": 43666, "epoch": 360} {"train_loss": -22.696823120117188, "global_step": 43667, "epoch": 360} {"train_loss": -29.6239070892334, "global_step": 43668, "epoch": 360} {"train_loss": -24.665943145751953, "global_step": 43669, "epoch": 360} {"train_loss": -32.011417388916016, "global_step": 43670, "epoch": 360} {"train_loss": -25.660375595092773, "global_step": 43671, "epoch": 360} {"train_loss": -31.073017120361328, "global_step": 43672, "epoch": 360} {"train_loss": -32.073787689208984, "global_step": 43673, "epoch": 360} {"train_loss": -28.83498191833496, "global_step": 43674, "epoch": 360} {"train_loss": -31.153417587280273, "global_step": 43675, "epoch": 360} {"train_loss": -32.05376052856445, "global_step": 43676, "epoch": 360} {"train_loss": -31.462371826171875, "global_step": 43677, "epoch": 360} {"train_loss": -31.211084365844727, "global_step": 43678, "epoch": 360} {"train_loss": -32.01718521118164, "global_step": 43679, "epoch": 360} {"train_loss": -31.366617821464853, "global_step": 43680, "epoch": 360, "val_loss": 2583980.75} {"train_loss": -32.753658294677734, "global_step": 43681, "epoch": 361} {"train_loss": -31.7480411529541, "global_step": 43682, "epoch": 361} {"train_loss": -31.777997970581055, "global_step": 43683, "epoch": 361} {"train_loss": -32.22437286376953, "global_step": 43684, "epoch": 361} {"train_loss": -32.464656829833984, "global_step": 43685, "epoch": 361} {"train_loss": -32.81913375854492, "global_step": 43686, "epoch": 361} {"train_loss": -32.14579391479492, "global_step": 43687, "epoch": 361} {"train_loss": -32.38771438598633, "global_step": 43688, "epoch": 361} {"train_loss": -32.89419937133789, "global_step": 43689, "epoch": 361} {"train_loss": -32.885986328125, "global_step": 43690, "epoch": 361} {"train_loss": -32.93938446044922, "global_step": 43691, "epoch": 361} {"train_loss": -32.85825729370117, "global_step": 43692, "epoch": 361} {"train_loss": -32.69983673095703, "global_step": 43693, "epoch": 361} {"train_loss": -32.988521575927734, "global_step": 43694, "epoch": 361} {"train_loss": -32.78654098510742, "global_step": 43695, "epoch": 361} {"train_loss": -33.14714431762695, "global_step": 43696, "epoch": 361} {"train_loss": -33.356414794921875, "global_step": 43697, "epoch": 361} {"train_loss": -32.93610763549805, "global_step": 43698, "epoch": 361} {"train_loss": -32.73432922363281, "global_step": 43699, "epoch": 361} {"train_loss": -32.50325012207031, "global_step": 43700, "epoch": 361} {"train_loss": -32.6303825378418, "global_step": 43701, "epoch": 361} {"train_loss": -32.275203704833984, "global_step": 43702, "epoch": 361} {"train_loss": -32.7132453918457, "global_step": 43703, "epoch": 361} {"train_loss": -33.21235275268555, "global_step": 43704, "epoch": 361} {"train_loss": -33.412078857421875, "global_step": 43705, "epoch": 361} {"train_loss": -33.406158447265625, "global_step": 43706, "epoch": 361} {"train_loss": -33.19523239135742, "global_step": 43707, "epoch": 361} {"train_loss": -31.808935165405273, "global_step": 43708, "epoch": 361} {"train_loss": -30.181249618530273, "global_step": 43709, "epoch": 361} {"train_loss": -29.07120704650879, "global_step": 43710, "epoch": 361} {"train_loss": -30.811847686767578, "global_step": 43711, "epoch": 361} {"train_loss": -33.681583404541016, "global_step": 43712, "epoch": 361} {"train_loss": -31.868988037109375, "global_step": 43713, "epoch": 361} {"train_loss": -32.49135971069336, "global_step": 43714, "epoch": 361} {"train_loss": -33.08539581298828, "global_step": 43715, "epoch": 361} {"train_loss": -32.09739685058594, "global_step": 43716, "epoch": 361} {"train_loss": -33.21643829345703, "global_step": 43717, "epoch": 361} {"train_loss": -33.665836334228516, "global_step": 43718, "epoch": 361} {"train_loss": -33.398441314697266, "global_step": 43719, "epoch": 361} {"train_loss": -33.44306945800781, "global_step": 43720, "epoch": 361} {"train_loss": -32.21397018432617, "global_step": 43721, "epoch": 361} {"train_loss": -32.30732345581055, "global_step": 43722, "epoch": 361} {"train_loss": -31.857343673706055, "global_step": 43723, "epoch": 361} {"train_loss": -32.828826904296875, "global_step": 43724, "epoch": 361} {"train_loss": -32.80813217163086, "global_step": 43725, "epoch": 361} {"train_loss": -34.156375885009766, "global_step": 43726, "epoch": 361} {"train_loss": -33.507259368896484, "global_step": 43727, "epoch": 361} {"train_loss": -32.88657760620117, "global_step": 43728, "epoch": 361} {"train_loss": -32.58329391479492, "global_step": 43729, "epoch": 361} {"train_loss": -33.559200286865234, "global_step": 43730, "epoch": 361} {"train_loss": -32.99114227294922, "global_step": 43731, "epoch": 361} {"train_loss": -30.864770889282227, "global_step": 43732, "epoch": 361} {"train_loss": -31.75611686706543, "global_step": 43733, "epoch": 361} {"train_loss": -33.343544006347656, "global_step": 43734, "epoch": 361} {"train_loss": -32.454532623291016, "global_step": 43735, "epoch": 361} {"train_loss": -31.185148239135742, "global_step": 43736, "epoch": 361} {"train_loss": -33.6185188293457, "global_step": 43737, "epoch": 361} {"train_loss": -32.1987419128418, "global_step": 43738, "epoch": 361} {"train_loss": -32.5660400390625, "global_step": 43739, "epoch": 361} {"train_loss": -33.748958587646484, "global_step": 43740, "epoch": 361} {"train_loss": -33.14420700073242, "global_step": 43741, "epoch": 361} {"train_loss": -33.85264205932617, "global_step": 43742, "epoch": 361} {"train_loss": -33.51936721801758, "global_step": 43743, "epoch": 361} {"train_loss": -33.26951217651367, "global_step": 43744, "epoch": 361} {"train_loss": -33.39191436767578, "global_step": 43745, "epoch": 361} {"train_loss": -33.91893768310547, "global_step": 43746, "epoch": 361} {"train_loss": -33.79273223876953, "global_step": 43747, "epoch": 361} {"train_loss": -33.74940872192383, "global_step": 43748, "epoch": 361} {"train_loss": -34.04928970336914, "global_step": 43749, "epoch": 361} {"train_loss": -33.4681396484375, "global_step": 43750, "epoch": 361} {"train_loss": -33.64585494995117, "global_step": 43751, "epoch": 361} {"train_loss": -33.776668548583984, "global_step": 43752, "epoch": 361} {"train_loss": -33.60187530517578, "global_step": 43753, "epoch": 361} {"train_loss": -34.15032958984375, "global_step": 43754, "epoch": 361} {"train_loss": -33.81435775756836, "global_step": 43755, "epoch": 361} {"train_loss": -33.25938415527344, "global_step": 43756, "epoch": 361} {"train_loss": -34.127498626708984, "global_step": 43757, "epoch": 361} {"train_loss": -32.4575080871582, "global_step": 43758, "epoch": 361} {"train_loss": -33.70041275024414, "global_step": 43759, "epoch": 361} {"train_loss": -32.68116760253906, "global_step": 43760, "epoch": 361} {"train_loss": -30.05274772644043, "global_step": 43761, "epoch": 361} {"train_loss": -32.6573600769043, "global_step": 43762, "epoch": 361} {"train_loss": -31.417104721069336, "global_step": 43763, "epoch": 361} {"train_loss": -32.52195358276367, "global_step": 43764, "epoch": 361} {"train_loss": -32.577266693115234, "global_step": 43765, "epoch": 361} {"train_loss": -31.950992584228516, "global_step": 43766, "epoch": 361} {"train_loss": -33.915740966796875, "global_step": 43767, "epoch": 361} {"train_loss": -31.384740829467773, "global_step": 43768, "epoch": 361} {"train_loss": -33.89170455932617, "global_step": 43769, "epoch": 361} {"train_loss": -33.300907135009766, "global_step": 43770, "epoch": 361} {"train_loss": -33.245784759521484, "global_step": 43771, "epoch": 361} {"train_loss": -32.5004768371582, "global_step": 43772, "epoch": 361} {"train_loss": -32.55213165283203, "global_step": 43773, "epoch": 361} {"train_loss": -32.577247619628906, "global_step": 43774, "epoch": 361} {"train_loss": -32.86323165893555, "global_step": 43775, "epoch": 361} {"train_loss": -33.6008186340332, "global_step": 43776, "epoch": 361} {"train_loss": -33.11811065673828, "global_step": 43777, "epoch": 361} {"train_loss": -32.85050582885742, "global_step": 43778, "epoch": 361} {"train_loss": -33.72713088989258, "global_step": 43779, "epoch": 361} {"train_loss": -33.9242057800293, "global_step": 43780, "epoch": 361} {"train_loss": -33.18976974487305, "global_step": 43781, "epoch": 361} {"train_loss": -33.5367431640625, "global_step": 43782, "epoch": 361} {"train_loss": -33.2021598815918, "global_step": 43783, "epoch": 361} {"train_loss": -33.28481674194336, "global_step": 43784, "epoch": 361} {"train_loss": -33.79218673706055, "global_step": 43785, "epoch": 361} {"train_loss": -33.60438919067383, "global_step": 43786, "epoch": 361} {"train_loss": -34.19755554199219, "global_step": 43787, "epoch": 361} {"train_loss": -33.43303680419922, "global_step": 43788, "epoch": 361} {"train_loss": -33.22798156738281, "global_step": 43789, "epoch": 361} {"train_loss": -33.59809875488281, "global_step": 43790, "epoch": 361} {"train_loss": -33.25033187866211, "global_step": 43791, "epoch": 361} {"train_loss": -31.68409538269043, "global_step": 43792, "epoch": 361} {"train_loss": -32.30253982543945, "global_step": 43793, "epoch": 361} {"train_loss": -29.017927169799805, "global_step": 43794, "epoch": 361} {"train_loss": -29.279001235961914, "global_step": 43795, "epoch": 361} {"train_loss": -33.99061965942383, "global_step": 43796, "epoch": 361} {"train_loss": -30.834915161132812, "global_step": 43797, "epoch": 361} {"train_loss": -31.40897560119629, "global_step": 43798, "epoch": 361} {"train_loss": -32.82341384887695, "global_step": 43799, "epoch": 361} {"train_loss": -33.399105072021484, "global_step": 43800, "epoch": 361} {"train_loss": -32.792882178440564, "global_step": 43801, "epoch": 361, "val_loss": 2542681.5} {"train_loss": -33.387752532958984, "global_step": 43802, "epoch": 362} {"train_loss": -32.946006774902344, "global_step": 43803, "epoch": 362} {"train_loss": -32.8447380065918, "global_step": 43804, "epoch": 362} {"train_loss": -29.636091232299805, "global_step": 43805, "epoch": 362} {"train_loss": -15.428155899047852, "global_step": 43806, "epoch": 362} {"train_loss": 10.256213188171387, "global_step": 43807, "epoch": 362} {"train_loss": -16.588979721069336, "global_step": 43808, "epoch": 362} {"train_loss": -27.980010986328125, "global_step": 43809, "epoch": 362} {"train_loss": -25.14360809326172, "global_step": 43810, "epoch": 362} {"train_loss": -24.112442016601562, "global_step": 43811, "epoch": 362} {"train_loss": -31.791629791259766, "global_step": 43812, "epoch": 362} {"train_loss": -24.638120651245117, "global_step": 43813, "epoch": 362} {"train_loss": -30.268085479736328, "global_step": 43814, "epoch": 362} {"train_loss": -32.48667526245117, "global_step": 43815, "epoch": 362} {"train_loss": -29.832111358642578, "global_step": 43816, "epoch": 362} {"train_loss": -30.229053497314453, "global_step": 43817, "epoch": 362} {"train_loss": -32.234344482421875, "global_step": 43818, "epoch": 362} {"train_loss": -32.89768600463867, "global_step": 43819, "epoch": 362} {"train_loss": -32.06654739379883, "global_step": 43820, "epoch": 362} {"train_loss": -31.153003692626953, "global_step": 43821, "epoch": 362} {"train_loss": -31.699405670166016, "global_step": 43822, "epoch": 362} {"train_loss": -32.48921203613281, "global_step": 43823, "epoch": 362} {"train_loss": -33.24756622314453, "global_step": 43824, "epoch": 362} {"train_loss": -33.048519134521484, "global_step": 43825, "epoch": 362} {"train_loss": -32.35597610473633, "global_step": 43826, "epoch": 362} {"train_loss": -32.2203483581543, "global_step": 43827, "epoch": 362} {"train_loss": -32.45455551147461, "global_step": 43828, "epoch": 362} {"train_loss": -32.83824157714844, "global_step": 43829, "epoch": 362} {"train_loss": -33.2509880065918, "global_step": 43830, "epoch": 362} {"train_loss": -33.03435134887695, "global_step": 43831, "epoch": 362} {"train_loss": -33.12600326538086, "global_step": 43832, "epoch": 362} {"train_loss": -32.91218185424805, "global_step": 43833, "epoch": 362} {"train_loss": -32.890071868896484, "global_step": 43834, "epoch": 362} {"train_loss": -33.06400680541992, "global_step": 43835, "epoch": 362} {"train_loss": -33.03129196166992, "global_step": 43836, "epoch": 362} {"train_loss": -33.63195037841797, "global_step": 43837, "epoch": 362} {"train_loss": -33.73004150390625, "global_step": 43838, "epoch": 362} {"train_loss": -33.05513000488281, "global_step": 43839, "epoch": 362} {"train_loss": -33.67942428588867, "global_step": 43840, "epoch": 362} {"train_loss": -33.65497589111328, "global_step": 43841, "epoch": 362} {"train_loss": -33.45682907104492, "global_step": 43842, "epoch": 362} {"train_loss": -33.473487854003906, "global_step": 43843, "epoch": 362} {"train_loss": -33.50879669189453, "global_step": 43844, "epoch": 362} {"train_loss": -33.737220764160156, "global_step": 43845, "epoch": 362} {"train_loss": -33.58863067626953, "global_step": 43846, "epoch": 362} {"train_loss": -33.6431884765625, "global_step": 43847, "epoch": 362} {"train_loss": -33.51917266845703, "global_step": 43848, "epoch": 362} {"train_loss": -33.58842086791992, "global_step": 43849, "epoch": 362} {"train_loss": -33.473751068115234, "global_step": 43850, "epoch": 362} {"train_loss": -32.97775650024414, "global_step": 43851, "epoch": 362} {"train_loss": -33.14259719848633, "global_step": 43852, "epoch": 362} {"train_loss": -33.90147399902344, "global_step": 43853, "epoch": 362} {"train_loss": -34.06388854980469, "global_step": 43854, "epoch": 362} {"train_loss": -33.70248794555664, "global_step": 43855, "epoch": 362} {"train_loss": -33.94801712036133, "global_step": 43856, "epoch": 362} {"train_loss": -33.74827194213867, "global_step": 43857, "epoch": 362} {"train_loss": -33.860321044921875, "global_step": 43858, "epoch": 362} {"train_loss": -33.794105529785156, "global_step": 43859, "epoch": 362} {"train_loss": -34.02030563354492, "global_step": 43860, "epoch": 362} {"train_loss": -33.62543869018555, "global_step": 43861, "epoch": 362} {"train_loss": -33.907318115234375, "global_step": 43862, "epoch": 362} {"train_loss": -34.177345275878906, "global_step": 43863, "epoch": 362} {"train_loss": -34.25419235229492, "global_step": 43864, "epoch": 362} {"train_loss": -34.16545486450195, "global_step": 43865, "epoch": 362} {"train_loss": -33.918540954589844, "global_step": 43866, "epoch": 362} {"train_loss": -34.155982971191406, "global_step": 43867, "epoch": 362} {"train_loss": -34.3973388671875, "global_step": 43868, "epoch": 362} {"train_loss": -34.28390121459961, "global_step": 43869, "epoch": 362} {"train_loss": -34.11821746826172, "global_step": 43870, "epoch": 362} {"train_loss": -33.745052337646484, "global_step": 43871, "epoch": 362} {"train_loss": -34.238399505615234, "global_step": 43872, "epoch": 362} {"train_loss": -34.102848052978516, "global_step": 43873, "epoch": 362} {"train_loss": -33.80667495727539, "global_step": 43874, "epoch": 362} {"train_loss": -34.275054931640625, "global_step": 43875, "epoch": 362} {"train_loss": -34.805152893066406, "global_step": 43876, "epoch": 362} {"train_loss": -34.70186996459961, "global_step": 43877, "epoch": 362} {"train_loss": -34.33063888549805, "global_step": 43878, "epoch": 362} {"train_loss": -34.48626708984375, "global_step": 43879, "epoch": 362} {"train_loss": -34.10401916503906, "global_step": 43880, "epoch": 362} {"train_loss": -34.56661605834961, "global_step": 43881, "epoch": 362} {"train_loss": -34.48981475830078, "global_step": 43882, "epoch": 362} {"train_loss": -34.41386413574219, "global_step": 43883, "epoch": 362} {"train_loss": -34.42979049682617, "global_step": 43884, "epoch": 362} {"train_loss": -34.1778678894043, "global_step": 43885, "epoch": 362} {"train_loss": -34.085243225097656, "global_step": 43886, "epoch": 362} {"train_loss": -33.5743293762207, "global_step": 43887, "epoch": 362} {"train_loss": -32.96880340576172, "global_step": 43888, "epoch": 362} {"train_loss": -32.287078857421875, "global_step": 43889, "epoch": 362} {"train_loss": -31.05916404724121, "global_step": 43890, "epoch": 362} {"train_loss": -27.147748947143555, "global_step": 43891, "epoch": 362} {"train_loss": -28.58786392211914, "global_step": 43892, "epoch": 362} {"train_loss": -33.11338424682617, "global_step": 43893, "epoch": 362} {"train_loss": -31.887319564819336, "global_step": 43894, "epoch": 362} {"train_loss": -31.89655113220215, "global_step": 43895, "epoch": 362} {"train_loss": -33.95964431762695, "global_step": 43896, "epoch": 362} {"train_loss": -32.41166305541992, "global_step": 43897, "epoch": 362} {"train_loss": -33.951324462890625, "global_step": 43898, "epoch": 362} {"train_loss": -32.59690475463867, "global_step": 43899, "epoch": 362} {"train_loss": -33.0992317199707, "global_step": 43900, "epoch": 362} {"train_loss": -33.45842742919922, "global_step": 43901, "epoch": 362} {"train_loss": -32.59845733642578, "global_step": 43902, "epoch": 362} {"train_loss": -33.615779876708984, "global_step": 43903, "epoch": 362} {"train_loss": -32.21035385131836, "global_step": 43904, "epoch": 362} {"train_loss": -34.15627670288086, "global_step": 43905, "epoch": 362} {"train_loss": -32.73514175415039, "global_step": 43906, "epoch": 362} {"train_loss": -33.37166213989258, "global_step": 43907, "epoch": 362} {"train_loss": -33.028846740722656, "global_step": 43908, "epoch": 362} {"train_loss": -33.62448501586914, "global_step": 43909, "epoch": 362} {"train_loss": -33.474830627441406, "global_step": 43910, "epoch": 362} {"train_loss": -33.39543533325195, "global_step": 43911, "epoch": 362} {"train_loss": -33.36715316772461, "global_step": 43912, "epoch": 362} {"train_loss": -33.442928314208984, "global_step": 43913, "epoch": 362} {"train_loss": -33.82809829711914, "global_step": 43914, "epoch": 362} {"train_loss": -33.421058654785156, "global_step": 43915, "epoch": 362} {"train_loss": -33.69338607788086, "global_step": 43916, "epoch": 362} {"train_loss": -34.073604583740234, "global_step": 43917, "epoch": 362} {"train_loss": -33.58695983886719, "global_step": 43918, "epoch": 362} {"train_loss": -34.390716552734375, "global_step": 43919, "epoch": 362} {"train_loss": -33.81391143798828, "global_step": 43920, "epoch": 362} {"train_loss": -33.8257942199707, "global_step": 43921, "epoch": 362} {"train_loss": -32.30959210514037, "global_step": 43922, "epoch": 362, "val_loss": 2530717.5} {"train_loss": -33.79514694213867, "global_step": 43923, "epoch": 363} {"train_loss": -34.237274169921875, "global_step": 43924, "epoch": 363} {"train_loss": -34.00783920288086, "global_step": 43925, "epoch": 363} {"train_loss": -33.4233512878418, "global_step": 43926, "epoch": 363} {"train_loss": -34.284000396728516, "global_step": 43927, "epoch": 363} {"train_loss": -33.77384567260742, "global_step": 43928, "epoch": 363} {"train_loss": -33.8734245300293, "global_step": 43929, "epoch": 363} {"train_loss": -33.930416107177734, "global_step": 43930, "epoch": 363} {"train_loss": -34.22119903564453, "global_step": 43931, "epoch": 363} {"train_loss": -34.271507263183594, "global_step": 43932, "epoch": 363} {"train_loss": -34.18689727783203, "global_step": 43933, "epoch": 363} {"train_loss": -34.22356414794922, "global_step": 43934, "epoch": 363} {"train_loss": -34.318031311035156, "global_step": 43935, "epoch": 363} {"train_loss": -34.36749267578125, "global_step": 43936, "epoch": 363} {"train_loss": -34.54560089111328, "global_step": 43937, "epoch": 363} {"train_loss": -34.435791015625, "global_step": 43938, "epoch": 363} {"train_loss": -34.30963897705078, "global_step": 43939, "epoch": 363} {"train_loss": -33.92333984375, "global_step": 43940, "epoch": 363} {"train_loss": -34.58367156982422, "global_step": 43941, "epoch": 363} {"train_loss": -34.65398025512695, "global_step": 43942, "epoch": 363} {"train_loss": -34.73336410522461, "global_step": 43943, "epoch": 363} {"train_loss": -34.72880554199219, "global_step": 43944, "epoch": 363} {"train_loss": -34.159950256347656, "global_step": 43945, "epoch": 363} {"train_loss": -34.764522552490234, "global_step": 43946, "epoch": 363} {"train_loss": -34.80710983276367, "global_step": 43947, "epoch": 363} {"train_loss": -34.706398010253906, "global_step": 43948, "epoch": 363} {"train_loss": -34.832576751708984, "global_step": 43949, "epoch": 363} {"train_loss": -34.872833251953125, "global_step": 43950, "epoch": 363} {"train_loss": -34.67100143432617, "global_step": 43951, "epoch": 363} {"train_loss": -34.97591781616211, "global_step": 43952, "epoch": 363} {"train_loss": -34.767127990722656, "global_step": 43953, "epoch": 363} {"train_loss": -34.56882858276367, "global_step": 43954, "epoch": 363} {"train_loss": -34.544830322265625, "global_step": 43955, "epoch": 363} {"train_loss": -34.78291702270508, "global_step": 43956, "epoch": 363} {"train_loss": -34.572898864746094, "global_step": 43957, "epoch": 363} {"train_loss": -34.95370864868164, "global_step": 43958, "epoch": 363} {"train_loss": -34.9218864440918, "global_step": 43959, "epoch": 363} {"train_loss": -34.78806686401367, "global_step": 43960, "epoch": 363} {"train_loss": -34.374366760253906, "global_step": 43961, "epoch": 363} {"train_loss": -34.644004821777344, "global_step": 43962, "epoch": 363} {"train_loss": -34.63039779663086, "global_step": 43963, "epoch": 363} {"train_loss": -35.083614349365234, "global_step": 43964, "epoch": 363} {"train_loss": -34.60677719116211, "global_step": 43965, "epoch": 363} {"train_loss": -34.411590576171875, "global_step": 43966, "epoch": 363} {"train_loss": -32.61085510253906, "global_step": 43967, "epoch": 363} {"train_loss": -23.50799560546875, "global_step": 43968, "epoch": 363} {"train_loss": 11.496330261230469, "global_step": 43969, "epoch": 363} {"train_loss": 23.438358306884766, "global_step": 43970, "epoch": 363} {"train_loss": -27.67451286315918, "global_step": 43971, "epoch": 363} {"train_loss": -9.826637268066406, "global_step": 43972, "epoch": 363} {"train_loss": -30.113889694213867, "global_step": 43973, "epoch": 363} {"train_loss": -17.62836265563965, "global_step": 43974, "epoch": 363} {"train_loss": -28.4385929107666, "global_step": 43975, "epoch": 363} {"train_loss": -30.906097412109375, "global_step": 43976, "epoch": 363} {"train_loss": -25.50221824645996, "global_step": 43977, "epoch": 363} {"train_loss": -26.38178062438965, "global_step": 43978, "epoch": 363} {"train_loss": -31.84467887878418, "global_step": 43979, "epoch": 363} {"train_loss": -30.82912254333496, "global_step": 43980, "epoch": 363} {"train_loss": -29.93463134765625, "global_step": 43981, "epoch": 363} {"train_loss": -28.82513427734375, "global_step": 43982, "epoch": 363} {"train_loss": -31.32880973815918, "global_step": 43983, "epoch": 363} {"train_loss": -32.054012298583984, "global_step": 43984, "epoch": 363} {"train_loss": -32.287662506103516, "global_step": 43985, "epoch": 363} {"train_loss": -31.206470489501953, "global_step": 43986, "epoch": 363} {"train_loss": -31.19447898864746, "global_step": 43987, "epoch": 363} {"train_loss": -31.0971736907959, "global_step": 43988, "epoch": 363} {"train_loss": -31.28523063659668, "global_step": 43989, "epoch": 363} {"train_loss": -32.43474197387695, "global_step": 43990, "epoch": 363} {"train_loss": -32.526119232177734, "global_step": 43991, "epoch": 363} {"train_loss": -31.954870223999023, "global_step": 43992, "epoch": 363} {"train_loss": -32.403377532958984, "global_step": 43993, "epoch": 363} {"train_loss": -32.41537857055664, "global_step": 43994, "epoch": 363} {"train_loss": -31.711353302001953, "global_step": 43995, "epoch": 363} {"train_loss": -31.446502685546875, "global_step": 43996, "epoch": 363} {"train_loss": -32.43092727661133, "global_step": 43997, "epoch": 363} {"train_loss": -32.64015197753906, "global_step": 43998, "epoch": 363} {"train_loss": -32.1453971862793, "global_step": 43999, "epoch": 363} {"train_loss": -32.70058822631836, "global_step": 44000, "epoch": 363} {"train_loss": -32.40639114379883, "global_step": 44001, "epoch": 363} {"train_loss": -32.44764709472656, "global_step": 44002, "epoch": 363} {"train_loss": -32.71308898925781, "global_step": 44003, "epoch": 363} {"train_loss": -32.60218048095703, "global_step": 44004, "epoch": 363} {"train_loss": -32.73002624511719, "global_step": 44005, "epoch": 363} {"train_loss": -32.98434829711914, "global_step": 44006, "epoch": 363} {"train_loss": -33.3717155456543, "global_step": 44007, "epoch": 363} {"train_loss": -32.89875411987305, "global_step": 44008, "epoch": 363} {"train_loss": -33.10377883911133, "global_step": 44009, "epoch": 363} {"train_loss": -32.78494644165039, "global_step": 44010, "epoch": 363} {"train_loss": -33.60219955444336, "global_step": 44011, "epoch": 363} {"train_loss": -33.31343078613281, "global_step": 44012, "epoch": 363} {"train_loss": -33.33418655395508, "global_step": 44013, "epoch": 363} {"train_loss": -33.64896774291992, "global_step": 44014, "epoch": 363} {"train_loss": -33.17531204223633, "global_step": 44015, "epoch": 363} {"train_loss": -33.71992874145508, "global_step": 44016, "epoch": 363} {"train_loss": -33.37983322143555, "global_step": 44017, "epoch": 363} {"train_loss": -34.091426849365234, "global_step": 44018, "epoch": 363} {"train_loss": -33.7406120300293, "global_step": 44019, "epoch": 363} {"train_loss": -33.52421188354492, "global_step": 44020, "epoch": 363} {"train_loss": -34.06325912475586, "global_step": 44021, "epoch": 363} {"train_loss": -33.49410629272461, "global_step": 44022, "epoch": 363} {"train_loss": -34.34644317626953, "global_step": 44023, "epoch": 363} {"train_loss": -34.134300231933594, "global_step": 44024, "epoch": 363} {"train_loss": -33.7104606628418, "global_step": 44025, "epoch": 363} {"train_loss": -33.7601432800293, "global_step": 44026, "epoch": 363} {"train_loss": -33.721561431884766, "global_step": 44027, "epoch": 363} {"train_loss": -33.83850860595703, "global_step": 44028, "epoch": 363} {"train_loss": -33.978370666503906, "global_step": 44029, "epoch": 363} {"train_loss": -34.1789436340332, "global_step": 44030, "epoch": 363} {"train_loss": -34.26846694946289, "global_step": 44031, "epoch": 363} {"train_loss": -34.014503479003906, "global_step": 44032, "epoch": 363} {"train_loss": -34.43703842163086, "global_step": 44033, "epoch": 363} {"train_loss": -34.225860595703125, "global_step": 44034, "epoch": 363} {"train_loss": -34.24363327026367, "global_step": 44035, "epoch": 363} {"train_loss": -33.98594665527344, "global_step": 44036, "epoch": 363} {"train_loss": -34.05477523803711, "global_step": 44037, "epoch": 363} {"train_loss": -34.07722854614258, "global_step": 44038, "epoch": 363} {"train_loss": -34.28059005737305, "global_step": 44039, "epoch": 363} {"train_loss": -33.29372787475586, "global_step": 44040, "epoch": 363} {"train_loss": -33.214820861816406, "global_step": 44041, "epoch": 363} {"train_loss": -33.90788650512695, "global_step": 44042, "epoch": 363} {"train_loss": -32.03304595001473, "global_step": 44043, "epoch": 363, "val_loss": 2618684.75} {"train_loss": -34.3819694519043, "global_step": 44044, "epoch": 364} {"train_loss": -33.51350402832031, "global_step": 44045, "epoch": 364} {"train_loss": -34.06939697265625, "global_step": 44046, "epoch": 364} {"train_loss": -33.8250846862793, "global_step": 44047, "epoch": 364} {"train_loss": -33.73014831542969, "global_step": 44048, "epoch": 364} {"train_loss": -34.32923126220703, "global_step": 44049, "epoch": 364} {"train_loss": -33.540550231933594, "global_step": 44050, "epoch": 364} {"train_loss": -34.275177001953125, "global_step": 44051, "epoch": 364} {"train_loss": -34.394287109375, "global_step": 44052, "epoch": 364} {"train_loss": -34.322181701660156, "global_step": 44053, "epoch": 364} {"train_loss": -34.261268615722656, "global_step": 44054, "epoch": 364} {"train_loss": -34.084693908691406, "global_step": 44055, "epoch": 364} {"train_loss": -34.09552764892578, "global_step": 44056, "epoch": 364} {"train_loss": -34.3824577331543, "global_step": 44057, "epoch": 364} {"train_loss": -31.65389060974121, "global_step": 44058, "epoch": 364} {"train_loss": -33.326690673828125, "global_step": 44059, "epoch": 364} {"train_loss": -32.601531982421875, "global_step": 44060, "epoch": 364} {"train_loss": -33.2623405456543, "global_step": 44061, "epoch": 364} {"train_loss": -33.345306396484375, "global_step": 44062, "epoch": 364} {"train_loss": -33.4699592590332, "global_step": 44063, "epoch": 364} {"train_loss": -34.14030075073242, "global_step": 44064, "epoch": 364} {"train_loss": -33.35576248168945, "global_step": 44065, "epoch": 364} {"train_loss": -34.270904541015625, "global_step": 44066, "epoch": 364} {"train_loss": -33.66279220581055, "global_step": 44067, "epoch": 364} {"train_loss": -33.79395294189453, "global_step": 44068, "epoch": 364} {"train_loss": -33.608333587646484, "global_step": 44069, "epoch": 364} {"train_loss": -33.37751770019531, "global_step": 44070, "epoch": 364} {"train_loss": -33.596614837646484, "global_step": 44071, "epoch": 364} {"train_loss": -33.718631744384766, "global_step": 44072, "epoch": 364} {"train_loss": -34.44334030151367, "global_step": 44073, "epoch": 364} {"train_loss": -34.08968734741211, "global_step": 44074, "epoch": 364} {"train_loss": -33.65584182739258, "global_step": 44075, "epoch": 364} {"train_loss": -32.10028839111328, "global_step": 44076, "epoch": 364} {"train_loss": -34.056819915771484, "global_step": 44077, "epoch": 364} {"train_loss": -33.955196380615234, "global_step": 44078, "epoch": 364} {"train_loss": -33.910667419433594, "global_step": 44079, "epoch": 364} {"train_loss": -32.61005783081055, "global_step": 44080, "epoch": 364} {"train_loss": -33.69390869140625, "global_step": 44081, "epoch": 364} {"train_loss": -33.473915100097656, "global_step": 44082, "epoch": 364} {"train_loss": -34.25213623046875, "global_step": 44083, "epoch": 364} {"train_loss": -34.208473205566406, "global_step": 44084, "epoch": 364} {"train_loss": -33.62220764160156, "global_step": 44085, "epoch": 364} {"train_loss": -33.68077850341797, "global_step": 44086, "epoch": 364} {"train_loss": -33.75167465209961, "global_step": 44087, "epoch": 364} {"train_loss": -34.095985412597656, "global_step": 44088, "epoch": 364} {"train_loss": -33.8121223449707, "global_step": 44089, "epoch": 364} {"train_loss": -33.87140655517578, "global_step": 44090, "epoch": 364} {"train_loss": -33.77363204956055, "global_step": 44091, "epoch": 364} {"train_loss": -34.264183044433594, "global_step": 44092, "epoch": 364} {"train_loss": -33.91350173950195, "global_step": 44093, "epoch": 364} {"train_loss": -33.0871696472168, "global_step": 44094, "epoch": 364} {"train_loss": -33.51696014404297, "global_step": 44095, "epoch": 364} {"train_loss": -33.488983154296875, "global_step": 44096, "epoch": 364} {"train_loss": -31.89104652404785, "global_step": 44097, "epoch": 364} {"train_loss": -34.13368606567383, "global_step": 44098, "epoch": 364} {"train_loss": -34.27845001220703, "global_step": 44099, "epoch": 364} {"train_loss": -33.64455795288086, "global_step": 44100, "epoch": 364} {"train_loss": -33.1858024597168, "global_step": 44101, "epoch": 364} {"train_loss": -32.604427337646484, "global_step": 44102, "epoch": 364} {"train_loss": -32.59868240356445, "global_step": 44103, "epoch": 364} {"train_loss": -33.254268646240234, "global_step": 44104, "epoch": 364} {"train_loss": -33.78205871582031, "global_step": 44105, "epoch": 364} {"train_loss": -33.732295989990234, "global_step": 44106, "epoch": 364} {"train_loss": -32.4813346862793, "global_step": 44107, "epoch": 364} {"train_loss": -33.760276794433594, "global_step": 44108, "epoch": 364} {"train_loss": -33.23155212402344, "global_step": 44109, "epoch": 364} {"train_loss": -32.722938537597656, "global_step": 44110, "epoch": 364} {"train_loss": -32.2452507019043, "global_step": 44111, "epoch": 364} {"train_loss": -32.194332122802734, "global_step": 44112, "epoch": 364} {"train_loss": -33.05043411254883, "global_step": 44113, "epoch": 364} {"train_loss": -32.20644760131836, "global_step": 44114, "epoch": 364} {"train_loss": -32.36548614501953, "global_step": 44115, "epoch": 364} {"train_loss": -30.733123779296875, "global_step": 44116, "epoch": 364} {"train_loss": -31.095518112182617, "global_step": 44117, "epoch": 364} {"train_loss": -30.400266647338867, "global_step": 44118, "epoch": 364} {"train_loss": -31.82256507873535, "global_step": 44119, "epoch": 364} {"train_loss": -33.03554916381836, "global_step": 44120, "epoch": 364} {"train_loss": -30.9428768157959, "global_step": 44121, "epoch": 364} {"train_loss": -31.999536514282227, "global_step": 44122, "epoch": 364} {"train_loss": -30.65654945373535, "global_step": 44123, "epoch": 364} {"train_loss": -30.561370849609375, "global_step": 44124, "epoch": 364} {"train_loss": -31.089933395385742, "global_step": 44125, "epoch": 364} {"train_loss": -31.15065574645996, "global_step": 44126, "epoch": 364} {"train_loss": -30.813913345336914, "global_step": 44127, "epoch": 364} {"train_loss": -32.18983459472656, "global_step": 44128, "epoch": 364} {"train_loss": -31.89777946472168, "global_step": 44129, "epoch": 364} {"train_loss": -31.08273696899414, "global_step": 44130, "epoch": 364} {"train_loss": -31.50043296813965, "global_step": 44131, "epoch": 364} {"train_loss": -31.93427085876465, "global_step": 44132, "epoch": 364} {"train_loss": -30.97492027282715, "global_step": 44133, "epoch": 364} {"train_loss": -31.146696090698242, "global_step": 44134, "epoch": 364} {"train_loss": -31.716039657592773, "global_step": 44135, "epoch": 364} {"train_loss": -31.82855224609375, "global_step": 44136, "epoch": 364} {"train_loss": -31.30878257751465, "global_step": 44137, "epoch": 364} {"train_loss": -31.9487361907959, "global_step": 44138, "epoch": 364} {"train_loss": -32.042152404785156, "global_step": 44139, "epoch": 364} {"train_loss": -32.52830123901367, "global_step": 44140, "epoch": 364} {"train_loss": -32.55340576171875, "global_step": 44141, "epoch": 364} {"train_loss": -32.04890060424805, "global_step": 44142, "epoch": 364} {"train_loss": -32.55176544189453, "global_step": 44143, "epoch": 364} {"train_loss": -32.5970344543457, "global_step": 44144, "epoch": 364} {"train_loss": -32.37632369995117, "global_step": 44145, "epoch": 364} {"train_loss": -31.52975845336914, "global_step": 44146, "epoch": 364} {"train_loss": -32.651668548583984, "global_step": 44147, "epoch": 364} {"train_loss": -33.044410705566406, "global_step": 44148, "epoch": 364} {"train_loss": -31.755117416381836, "global_step": 44149, "epoch": 364} {"train_loss": -31.82822036743164, "global_step": 44150, "epoch": 364} {"train_loss": -32.59082794189453, "global_step": 44151, "epoch": 364} {"train_loss": -32.03346633911133, "global_step": 44152, "epoch": 364} {"train_loss": -32.23008728027344, "global_step": 44153, "epoch": 364} {"train_loss": -33.340999603271484, "global_step": 44154, "epoch": 364} {"train_loss": -32.86662292480469, "global_step": 44155, "epoch": 364} {"train_loss": -32.397579193115234, "global_step": 44156, "epoch": 364} {"train_loss": -33.11611557006836, "global_step": 44157, "epoch": 364} {"train_loss": -32.271087646484375, "global_step": 44158, "epoch": 364} {"train_loss": -33.038387298583984, "global_step": 44159, "epoch": 364} {"train_loss": -33.22517776489258, "global_step": 44160, "epoch": 364} {"train_loss": -32.1034049987793, "global_step": 44161, "epoch": 364} {"train_loss": -31.928598403930664, "global_step": 44162, "epoch": 364} {"train_loss": -31.830053329467773, "global_step": 44163, "epoch": 364} {"train_loss": -32.893376500153344, "global_step": 44164, "epoch": 364, "val_loss": 2953611.75} {"train_loss": -33.362571716308594, "global_step": 44165, "epoch": 365} {"train_loss": -33.30132293701172, "global_step": 44166, "epoch": 365} {"train_loss": -32.796142578125, "global_step": 44167, "epoch": 365} {"train_loss": -32.134700775146484, "global_step": 44168, "epoch": 365} {"train_loss": -33.18479919433594, "global_step": 44169, "epoch": 365} {"train_loss": -33.69416427612305, "global_step": 44170, "epoch": 365} {"train_loss": -33.44521713256836, "global_step": 44171, "epoch": 365} {"train_loss": -33.48723602294922, "global_step": 44172, "epoch": 365} {"train_loss": -33.05439376831055, "global_step": 44173, "epoch": 365} {"train_loss": -32.92146682739258, "global_step": 44174, "epoch": 365} {"train_loss": -32.500953674316406, "global_step": 44175, "epoch": 365} {"train_loss": -33.102935791015625, "global_step": 44176, "epoch": 365} {"train_loss": -33.78137969970703, "global_step": 44177, "epoch": 365} {"train_loss": -33.609161376953125, "global_step": 44178, "epoch": 365} {"train_loss": -33.33565139770508, "global_step": 44179, "epoch": 365} {"train_loss": -33.397178649902344, "global_step": 44180, "epoch": 365} {"train_loss": -33.7884635925293, "global_step": 44181, "epoch": 365} {"train_loss": -33.55216598510742, "global_step": 44182, "epoch": 365} {"train_loss": -33.7010612487793, "global_step": 44183, "epoch": 365} {"train_loss": -33.996864318847656, "global_step": 44184, "epoch": 365} {"train_loss": -34.39147186279297, "global_step": 44185, "epoch": 365} {"train_loss": -33.83393478393555, "global_step": 44186, "epoch": 365} {"train_loss": -33.98884201049805, "global_step": 44187, "epoch": 365} {"train_loss": -33.736793518066406, "global_step": 44188, "epoch": 365} {"train_loss": -34.219844818115234, "global_step": 44189, "epoch": 365} {"train_loss": -34.122528076171875, "global_step": 44190, "epoch": 365} {"train_loss": -34.24110794067383, "global_step": 44191, "epoch": 365} {"train_loss": -34.31504440307617, "global_step": 44192, "epoch": 365} {"train_loss": -34.23793411254883, "global_step": 44193, "epoch": 365} {"train_loss": -34.294490814208984, "global_step": 44194, "epoch": 365} {"train_loss": -34.7152214050293, "global_step": 44195, "epoch": 365} {"train_loss": -34.73124313354492, "global_step": 44196, "epoch": 365} {"train_loss": -34.437225341796875, "global_step": 44197, "epoch": 365} {"train_loss": -34.364479064941406, "global_step": 44198, "epoch": 365} {"train_loss": -34.129573822021484, "global_step": 44199, "epoch": 365} {"train_loss": -34.679718017578125, "global_step": 44200, "epoch": 365} {"train_loss": -34.357391357421875, "global_step": 44201, "epoch": 365} {"train_loss": -34.69438552856445, "global_step": 44202, "epoch": 365} {"train_loss": -34.24494552612305, "global_step": 44203, "epoch": 365} {"train_loss": -34.537086486816406, "global_step": 44204, "epoch": 365} {"train_loss": -34.2870979309082, "global_step": 44205, "epoch": 365} {"train_loss": -34.95627975463867, "global_step": 44206, "epoch": 365} {"train_loss": -34.27889633178711, "global_step": 44207, "epoch": 365} {"train_loss": -33.4384880065918, "global_step": 44208, "epoch": 365} {"train_loss": -32.96849060058594, "global_step": 44209, "epoch": 365} {"train_loss": -31.561725616455078, "global_step": 44210, "epoch": 365} {"train_loss": -32.65486145019531, "global_step": 44211, "epoch": 365} {"train_loss": -34.6098747253418, "global_step": 44212, "epoch": 365} {"train_loss": -32.30995559692383, "global_step": 44213, "epoch": 365} {"train_loss": -33.044002532958984, "global_step": 44214, "epoch": 365} {"train_loss": -34.21632766723633, "global_step": 44215, "epoch": 365} {"train_loss": -34.67739486694336, "global_step": 44216, "epoch": 365} {"train_loss": -33.911739349365234, "global_step": 44217, "epoch": 365} {"train_loss": -31.917871475219727, "global_step": 44218, "epoch": 365} {"train_loss": -34.7473030090332, "global_step": 44219, "epoch": 365} {"train_loss": -33.76551055908203, "global_step": 44220, "epoch": 365} {"train_loss": -27.390827178955078, "global_step": 44221, "epoch": 365} {"train_loss": -24.343624114990234, "global_step": 44222, "epoch": 365} {"train_loss": -32.97265625, "global_step": 44223, "epoch": 365} {"train_loss": -26.51654624938965, "global_step": 44224, "epoch": 365} {"train_loss": -26.45599937438965, "global_step": 44225, "epoch": 365} {"train_loss": -29.68536949157715, "global_step": 44226, "epoch": 365} {"train_loss": -32.1053581237793, "global_step": 44227, "epoch": 365} {"train_loss": -27.836156845092773, "global_step": 44228, "epoch": 365} {"train_loss": -30.871234893798828, "global_step": 44229, "epoch": 365} {"train_loss": -31.384729385375977, "global_step": 44230, "epoch": 365} {"train_loss": -31.267614364624023, "global_step": 44231, "epoch": 365} {"train_loss": -31.181379318237305, "global_step": 44232, "epoch": 365} {"train_loss": -32.37328338623047, "global_step": 44233, "epoch": 365} {"train_loss": -33.20396041870117, "global_step": 44234, "epoch": 365} {"train_loss": -32.6501579284668, "global_step": 44235, "epoch": 365} {"train_loss": -32.173744201660156, "global_step": 44236, "epoch": 365} {"train_loss": -30.927549362182617, "global_step": 44237, "epoch": 365} {"train_loss": -32.6515007019043, "global_step": 44238, "epoch": 365} {"train_loss": -32.260345458984375, "global_step": 44239, "epoch": 365} {"train_loss": -33.0572624206543, "global_step": 44240, "epoch": 365} {"train_loss": -33.02454376220703, "global_step": 44241, "epoch": 365} {"train_loss": -33.16761016845703, "global_step": 44242, "epoch": 365} {"train_loss": -32.75709915161133, "global_step": 44243, "epoch": 365} {"train_loss": -32.886714935302734, "global_step": 44244, "epoch": 365} {"train_loss": -32.840843200683594, "global_step": 44245, "epoch": 365} {"train_loss": -32.09246826171875, "global_step": 44246, "epoch": 365} {"train_loss": -33.31753158569336, "global_step": 44247, "epoch": 365} {"train_loss": -32.82002258300781, "global_step": 44248, "epoch": 365} {"train_loss": -32.61081314086914, "global_step": 44249, "epoch": 365} {"train_loss": -33.70747756958008, "global_step": 44250, "epoch": 365} {"train_loss": -31.783191680908203, "global_step": 44251, "epoch": 365} {"train_loss": -33.31574630737305, "global_step": 44252, "epoch": 365} {"train_loss": -33.76543426513672, "global_step": 44253, "epoch": 365} {"train_loss": -31.34549331665039, "global_step": 44254, "epoch": 365} {"train_loss": -32.34071731567383, "global_step": 44255, "epoch": 365} {"train_loss": -33.47126388549805, "global_step": 44256, "epoch": 365} {"train_loss": -33.74160385131836, "global_step": 44257, "epoch": 365} {"train_loss": -33.17372131347656, "global_step": 44258, "epoch": 365} {"train_loss": -33.06757736206055, "global_step": 44259, "epoch": 365} {"train_loss": -33.9069938659668, "global_step": 44260, "epoch": 365} {"train_loss": -33.130401611328125, "global_step": 44261, "epoch": 365} {"train_loss": -33.78237533569336, "global_step": 44262, "epoch": 365} {"train_loss": -33.4818000793457, "global_step": 44263, "epoch": 365} {"train_loss": -33.472991943359375, "global_step": 44264, "epoch": 365} {"train_loss": -32.90717315673828, "global_step": 44265, "epoch": 365} {"train_loss": -33.657344818115234, "global_step": 44266, "epoch": 365} {"train_loss": -33.83127975463867, "global_step": 44267, "epoch": 365} {"train_loss": -32.94214630126953, "global_step": 44268, "epoch": 365} {"train_loss": -33.833370208740234, "global_step": 44269, "epoch": 365} {"train_loss": -33.060420989990234, "global_step": 44270, "epoch": 365} {"train_loss": -33.72731018066406, "global_step": 44271, "epoch": 365} {"train_loss": -33.0446662902832, "global_step": 44272, "epoch": 365} {"train_loss": -32.25599670410156, "global_step": 44273, "epoch": 365} {"train_loss": -33.62541198730469, "global_step": 44274, "epoch": 365} {"train_loss": -33.68819808959961, "global_step": 44275, "epoch": 365} {"train_loss": -34.19196319580078, "global_step": 44276, "epoch": 365} {"train_loss": -33.98305892944336, "global_step": 44277, "epoch": 365} {"train_loss": -33.699031829833984, "global_step": 44278, "epoch": 365} {"train_loss": -33.829345703125, "global_step": 44279, "epoch": 365} {"train_loss": -33.72788619995117, "global_step": 44280, "epoch": 365} {"train_loss": -33.926021575927734, "global_step": 44281, "epoch": 365} {"train_loss": -34.18545150756836, "global_step": 44282, "epoch": 365} {"train_loss": -34.65925216674805, "global_step": 44283, "epoch": 365} {"train_loss": -33.433868408203125, "global_step": 44284, "epoch": 365} {"train_loss": -33.05742905356667, "global_step": 44285, "epoch": 365, "val_loss": 2586619.25} {"train_loss": -33.870479583740234, "global_step": 44286, "epoch": 366} {"train_loss": -34.2017707824707, "global_step": 44287, "epoch": 366} {"train_loss": -33.8113899230957, "global_step": 44288, "epoch": 366} {"train_loss": -33.87174606323242, "global_step": 44289, "epoch": 366} {"train_loss": -33.721832275390625, "global_step": 44290, "epoch": 366} {"train_loss": -33.573516845703125, "global_step": 44291, "epoch": 366} {"train_loss": -34.43906784057617, "global_step": 44292, "epoch": 366} {"train_loss": -34.694976806640625, "global_step": 44293, "epoch": 366} {"train_loss": -34.45048522949219, "global_step": 44294, "epoch": 366} {"train_loss": -34.0661506652832, "global_step": 44295, "epoch": 366} {"train_loss": -33.697181701660156, "global_step": 44296, "epoch": 366} {"train_loss": -33.8829231262207, "global_step": 44297, "epoch": 366} {"train_loss": -32.32966995239258, "global_step": 44298, "epoch": 366} {"train_loss": -28.73079490661621, "global_step": 44299, "epoch": 366} {"train_loss": -33.87788772583008, "global_step": 44300, "epoch": 366} {"train_loss": -30.847204208374023, "global_step": 44301, "epoch": 366} {"train_loss": -32.995296478271484, "global_step": 44302, "epoch": 366} {"train_loss": -33.293006896972656, "global_step": 44303, "epoch": 366} {"train_loss": -34.57882308959961, "global_step": 44304, "epoch": 366} {"train_loss": -33.124263763427734, "global_step": 44305, "epoch": 366} {"train_loss": -30.724409103393555, "global_step": 44306, "epoch": 366} {"train_loss": -27.778818130493164, "global_step": 44307, "epoch": 366} {"train_loss": -29.794363021850586, "global_step": 44308, "epoch": 366} {"train_loss": -33.77647018432617, "global_step": 44309, "epoch": 366} {"train_loss": -32.03152084350586, "global_step": 44310, "epoch": 366} {"train_loss": -32.8030891418457, "global_step": 44311, "epoch": 366} {"train_loss": -33.40867233276367, "global_step": 44312, "epoch": 366} {"train_loss": -32.86576461791992, "global_step": 44313, "epoch": 366} {"train_loss": -33.44857406616211, "global_step": 44314, "epoch": 366} {"train_loss": -32.79129409790039, "global_step": 44315, "epoch": 366} {"train_loss": -33.8523063659668, "global_step": 44316, "epoch": 366} {"train_loss": -33.67353439331055, "global_step": 44317, "epoch": 366} {"train_loss": -33.133033752441406, "global_step": 44318, "epoch": 366} {"train_loss": -33.651031494140625, "global_step": 44319, "epoch": 366} {"train_loss": -33.137115478515625, "global_step": 44320, "epoch": 366} {"train_loss": -33.72536087036133, "global_step": 44321, "epoch": 366} {"train_loss": -33.654701232910156, "global_step": 44322, "epoch": 366} {"train_loss": -34.00740432739258, "global_step": 44323, "epoch": 366} {"train_loss": -34.023799896240234, "global_step": 44324, "epoch": 366} {"train_loss": -33.20419692993164, "global_step": 44325, "epoch": 366} {"train_loss": -34.654659271240234, "global_step": 44326, "epoch": 366} {"train_loss": -34.03037643432617, "global_step": 44327, "epoch": 366} {"train_loss": -33.69691467285156, "global_step": 44328, "epoch": 366} {"train_loss": -34.252384185791016, "global_step": 44329, "epoch": 366} {"train_loss": -34.09162139892578, "global_step": 44330, "epoch": 366} {"train_loss": -34.660945892333984, "global_step": 44331, "epoch": 366} {"train_loss": -33.92218780517578, "global_step": 44332, "epoch": 366} {"train_loss": -34.34617233276367, "global_step": 44333, "epoch": 366} {"train_loss": -33.97980880737305, "global_step": 44334, "epoch": 366} {"train_loss": -34.38302230834961, "global_step": 44335, "epoch": 366} {"train_loss": -34.396217346191406, "global_step": 44336, "epoch": 366} {"train_loss": -34.017913818359375, "global_step": 44337, "epoch": 366} {"train_loss": -33.442996978759766, "global_step": 44338, "epoch": 366} {"train_loss": -34.75466537475586, "global_step": 44339, "epoch": 366} {"train_loss": -33.62529754638672, "global_step": 44340, "epoch": 366} {"train_loss": -33.641849517822266, "global_step": 44341, "epoch": 366} {"train_loss": -33.9281005859375, "global_step": 44342, "epoch": 366} {"train_loss": -34.158878326416016, "global_step": 44343, "epoch": 366} {"train_loss": -34.09892272949219, "global_step": 44344, "epoch": 366} {"train_loss": -33.8575553894043, "global_step": 44345, "epoch": 366} {"train_loss": -33.87191390991211, "global_step": 44346, "epoch": 366} {"train_loss": -34.24949645996094, "global_step": 44347, "epoch": 366} {"train_loss": -33.82969284057617, "global_step": 44348, "epoch": 366} {"train_loss": -33.86568832397461, "global_step": 44349, "epoch": 366} {"train_loss": -34.95121383666992, "global_step": 44350, "epoch": 366} {"train_loss": -34.30823516845703, "global_step": 44351, "epoch": 366} {"train_loss": -33.97698974609375, "global_step": 44352, "epoch": 366} {"train_loss": -33.95888900756836, "global_step": 44353, "epoch": 366} {"train_loss": -33.64280700683594, "global_step": 44354, "epoch": 366} {"train_loss": -33.63853073120117, "global_step": 44355, "epoch": 366} {"train_loss": -33.16255569458008, "global_step": 44356, "epoch": 366} {"train_loss": -34.115482330322266, "global_step": 44357, "epoch": 366} {"train_loss": -33.413429260253906, "global_step": 44358, "epoch": 366} {"train_loss": -33.7911376953125, "global_step": 44359, "epoch": 366} {"train_loss": -33.30617904663086, "global_step": 44360, "epoch": 366} {"train_loss": -34.321285247802734, "global_step": 44361, "epoch": 366} {"train_loss": -33.733821868896484, "global_step": 44362, "epoch": 366} {"train_loss": -34.584930419921875, "global_step": 44363, "epoch": 366} {"train_loss": -33.52545166015625, "global_step": 44364, "epoch": 366} {"train_loss": -33.934017181396484, "global_step": 44365, "epoch": 366} {"train_loss": -32.86335754394531, "global_step": 44366, "epoch": 366} {"train_loss": -33.78150939941406, "global_step": 44367, "epoch": 366} {"train_loss": -34.560970306396484, "global_step": 44368, "epoch": 366} {"train_loss": -34.285335540771484, "global_step": 44369, "epoch": 366} {"train_loss": -34.439048767089844, "global_step": 44370, "epoch": 366} {"train_loss": -34.15498733520508, "global_step": 44371, "epoch": 366} {"train_loss": -34.093379974365234, "global_step": 44372, "epoch": 366} {"train_loss": -34.12316131591797, "global_step": 44373, "epoch": 366} {"train_loss": -34.53911209106445, "global_step": 44374, "epoch": 366} {"train_loss": -33.98612976074219, "global_step": 44375, "epoch": 366} {"train_loss": -34.83197021484375, "global_step": 44376, "epoch": 366} {"train_loss": -34.64528274536133, "global_step": 44377, "epoch": 366} {"train_loss": -34.5168342590332, "global_step": 44378, "epoch": 366} {"train_loss": -34.271053314208984, "global_step": 44379, "epoch": 366} {"train_loss": -34.95024490356445, "global_step": 44380, "epoch": 366} {"train_loss": -32.618465423583984, "global_step": 44381, "epoch": 366} {"train_loss": -34.59303665161133, "global_step": 44382, "epoch": 366} {"train_loss": -34.56154251098633, "global_step": 44383, "epoch": 366} {"train_loss": -33.946311950683594, "global_step": 44384, "epoch": 366} {"train_loss": -34.600399017333984, "global_step": 44385, "epoch": 366} {"train_loss": -34.812068939208984, "global_step": 44386, "epoch": 366} {"train_loss": -34.534175872802734, "global_step": 44387, "epoch": 366} {"train_loss": -34.40606689453125, "global_step": 44388, "epoch": 366} {"train_loss": -33.717403411865234, "global_step": 44389, "epoch": 366} {"train_loss": -34.29072189331055, "global_step": 44390, "epoch": 366} {"train_loss": -34.83070373535156, "global_step": 44391, "epoch": 366} {"train_loss": -34.306575775146484, "global_step": 44392, "epoch": 366} {"train_loss": -34.504493713378906, "global_step": 44393, "epoch": 366} {"train_loss": -34.538143157958984, "global_step": 44394, "epoch": 366} {"train_loss": -34.9487419128418, "global_step": 44395, "epoch": 366} {"train_loss": -34.75700759887695, "global_step": 44396, "epoch": 366} {"train_loss": -33.856788635253906, "global_step": 44397, "epoch": 366} {"train_loss": -34.5132942199707, "global_step": 44398, "epoch": 366} {"train_loss": -32.518463134765625, "global_step": 44399, "epoch": 366} {"train_loss": -34.66265869140625, "global_step": 44400, "epoch": 366} {"train_loss": -34.71323776245117, "global_step": 44401, "epoch": 366} {"train_loss": -33.838340759277344, "global_step": 44402, "epoch": 366} {"train_loss": -33.81732940673828, "global_step": 44403, "epoch": 366} {"train_loss": -34.91365432739258, "global_step": 44404, "epoch": 366} {"train_loss": -34.720638275146484, "global_step": 44405, "epoch": 366} {"train_loss": -33.79765810060107, "global_step": 44406, "epoch": 366, "val_loss": 2451469.75} {"train_loss": -34.57047653198242, "global_step": 44407, "epoch": 367} {"train_loss": -34.33324432373047, "global_step": 44408, "epoch": 367} {"train_loss": -34.082454681396484, "global_step": 44409, "epoch": 367} {"train_loss": -34.257869720458984, "global_step": 44410, "epoch": 367} {"train_loss": -34.094886779785156, "global_step": 44411, "epoch": 367} {"train_loss": -34.046630859375, "global_step": 44412, "epoch": 367} {"train_loss": -33.95066452026367, "global_step": 44413, "epoch": 367} {"train_loss": -34.75093460083008, "global_step": 44414, "epoch": 367} {"train_loss": -33.50337600708008, "global_step": 44415, "epoch": 367} {"train_loss": -34.11997604370117, "global_step": 44416, "epoch": 367} {"train_loss": -34.14201354980469, "global_step": 44417, "epoch": 367} {"train_loss": -34.30672836303711, "global_step": 44418, "epoch": 367} {"train_loss": -33.997371673583984, "global_step": 44419, "epoch": 367} {"train_loss": -34.98615264892578, "global_step": 44420, "epoch": 367} {"train_loss": -34.305599212646484, "global_step": 44421, "epoch": 367} {"train_loss": -34.1729736328125, "global_step": 44422, "epoch": 367} {"train_loss": -32.784828186035156, "global_step": 44423, "epoch": 367} {"train_loss": -27.952106475830078, "global_step": 44424, "epoch": 367} {"train_loss": -18.40584373474121, "global_step": 44425, "epoch": 367} {"train_loss": 2.9780776500701904, "global_step": 44426, "epoch": 367} {"train_loss": -26.055953979492188, "global_step": 44427, "epoch": 367} {"train_loss": -27.2838134765625, "global_step": 44428, "epoch": 367} {"train_loss": -24.889236450195312, "global_step": 44429, "epoch": 367} {"train_loss": -28.83344841003418, "global_step": 44430, "epoch": 367} {"train_loss": -27.991546630859375, "global_step": 44431, "epoch": 367} {"train_loss": -28.473474502563477, "global_step": 44432, "epoch": 367} {"train_loss": -32.486663818359375, "global_step": 44433, "epoch": 367} {"train_loss": -29.47173500061035, "global_step": 44434, "epoch": 367} {"train_loss": -31.5985107421875, "global_step": 44435, "epoch": 367} {"train_loss": -33.02828598022461, "global_step": 44436, "epoch": 367} {"train_loss": -31.729822158813477, "global_step": 44437, "epoch": 367} {"train_loss": -31.668909072875977, "global_step": 44438, "epoch": 367} {"train_loss": -33.08342361450195, "global_step": 44439, "epoch": 367} {"train_loss": -33.0361328125, "global_step": 44440, "epoch": 367} {"train_loss": -32.779075622558594, "global_step": 44441, "epoch": 367} {"train_loss": -32.73801803588867, "global_step": 44442, "epoch": 367} {"train_loss": -33.23044204711914, "global_step": 44443, "epoch": 367} {"train_loss": -33.05866622924805, "global_step": 44444, "epoch": 367} {"train_loss": -32.76441192626953, "global_step": 44445, "epoch": 367} {"train_loss": -33.155364990234375, "global_step": 44446, "epoch": 367} {"train_loss": -33.83198165893555, "global_step": 44447, "epoch": 367} {"train_loss": -33.792457580566406, "global_step": 44448, "epoch": 367} {"train_loss": -33.60567855834961, "global_step": 44449, "epoch": 367} {"train_loss": -33.50032424926758, "global_step": 44450, "epoch": 367} {"train_loss": -33.293006896972656, "global_step": 44451, "epoch": 367} {"train_loss": -33.97541427612305, "global_step": 44452, "epoch": 367} {"train_loss": -33.62751770019531, "global_step": 44453, "epoch": 367} {"train_loss": -33.7592887878418, "global_step": 44454, "epoch": 367} {"train_loss": -33.41024398803711, "global_step": 44455, "epoch": 367} {"train_loss": -33.7176513671875, "global_step": 44456, "epoch": 367} {"train_loss": -33.61855697631836, "global_step": 44457, "epoch": 367} {"train_loss": -34.445831298828125, "global_step": 44458, "epoch": 367} {"train_loss": -34.21764373779297, "global_step": 44459, "epoch": 367} {"train_loss": -34.08465576171875, "global_step": 44460, "epoch": 367} {"train_loss": -34.23979187011719, "global_step": 44461, "epoch": 367} {"train_loss": -33.5244026184082, "global_step": 44462, "epoch": 367} {"train_loss": -34.300228118896484, "global_step": 44463, "epoch": 367} {"train_loss": -34.37704086303711, "global_step": 44464, "epoch": 367} {"train_loss": -34.2581787109375, "global_step": 44465, "epoch": 367} {"train_loss": -33.44451141357422, "global_step": 44466, "epoch": 367} {"train_loss": -34.73183822631836, "global_step": 44467, "epoch": 367} {"train_loss": -33.87102127075195, "global_step": 44468, "epoch": 367} {"train_loss": -34.624656677246094, "global_step": 44469, "epoch": 367} {"train_loss": -34.551673889160156, "global_step": 44470, "epoch": 367} {"train_loss": -34.513668060302734, "global_step": 44471, "epoch": 367} {"train_loss": -33.822654724121094, "global_step": 44472, "epoch": 367} {"train_loss": -34.54014205932617, "global_step": 44473, "epoch": 367} {"train_loss": -34.97288131713867, "global_step": 44474, "epoch": 367} {"train_loss": -34.52769088745117, "global_step": 44475, "epoch": 367} {"train_loss": -34.217811584472656, "global_step": 44476, "epoch": 367} {"train_loss": -34.59178924560547, "global_step": 44477, "epoch": 367} {"train_loss": -34.78977584838867, "global_step": 44478, "epoch": 367} {"train_loss": -34.31177520751953, "global_step": 44479, "epoch": 367} {"train_loss": -34.62529373168945, "global_step": 44480, "epoch": 367} {"train_loss": -34.64097213745117, "global_step": 44481, "epoch": 367} {"train_loss": -34.911476135253906, "global_step": 44482, "epoch": 367} {"train_loss": -34.395668029785156, "global_step": 44483, "epoch": 367} {"train_loss": -34.5521354675293, "global_step": 44484, "epoch": 367} {"train_loss": -34.22075653076172, "global_step": 44485, "epoch": 367} {"train_loss": -34.51679992675781, "global_step": 44486, "epoch": 367} {"train_loss": -34.45330810546875, "global_step": 44487, "epoch": 367} {"train_loss": -34.5184440612793, "global_step": 44488, "epoch": 367} {"train_loss": -34.210514068603516, "global_step": 44489, "epoch": 367} {"train_loss": -34.24647521972656, "global_step": 44490, "epoch": 367} {"train_loss": -33.6826171875, "global_step": 44491, "epoch": 367} {"train_loss": -33.96553421020508, "global_step": 44492, "epoch": 367} {"train_loss": -34.537837982177734, "global_step": 44493, "epoch": 367} {"train_loss": -34.6835823059082, "global_step": 44494, "epoch": 367} {"train_loss": -34.39004135131836, "global_step": 44495, "epoch": 367} {"train_loss": -33.691139221191406, "global_step": 44496, "epoch": 367} {"train_loss": -32.587284088134766, "global_step": 44497, "epoch": 367} {"train_loss": -32.87435531616211, "global_step": 44498, "epoch": 367} {"train_loss": -32.8349494934082, "global_step": 44499, "epoch": 367} {"train_loss": -32.452735900878906, "global_step": 44500, "epoch": 367} {"train_loss": -33.71596908569336, "global_step": 44501, "epoch": 367} {"train_loss": -35.06581497192383, "global_step": 44502, "epoch": 367} {"train_loss": -32.56277084350586, "global_step": 44503, "epoch": 367} {"train_loss": -33.934608459472656, "global_step": 44504, "epoch": 367} {"train_loss": -34.09457015991211, "global_step": 44505, "epoch": 367} {"train_loss": -32.578739166259766, "global_step": 44506, "epoch": 367} {"train_loss": -33.02478790283203, "global_step": 44507, "epoch": 367} {"train_loss": -33.837158203125, "global_step": 44508, "epoch": 367} {"train_loss": -34.02592086791992, "global_step": 44509, "epoch": 367} {"train_loss": -33.8857307434082, "global_step": 44510, "epoch": 367} {"train_loss": -33.95783233642578, "global_step": 44511, "epoch": 367} {"train_loss": -34.21699142456055, "global_step": 44512, "epoch": 367} {"train_loss": -32.80308532714844, "global_step": 44513, "epoch": 367} {"train_loss": -33.640926361083984, "global_step": 44514, "epoch": 367} {"train_loss": -34.7193489074707, "global_step": 44515, "epoch": 367} {"train_loss": -34.19154739379883, "global_step": 44516, "epoch": 367} {"train_loss": -34.1228141784668, "global_step": 44517, "epoch": 367} {"train_loss": -34.36851119995117, "global_step": 44518, "epoch": 367} {"train_loss": -34.09614181518555, "global_step": 44519, "epoch": 367} {"train_loss": -34.73627853393555, "global_step": 44520, "epoch": 367} {"train_loss": -34.34917068481445, "global_step": 44521, "epoch": 367} {"train_loss": -33.95240020751953, "global_step": 44522, "epoch": 367} {"train_loss": -33.72899627685547, "global_step": 44523, "epoch": 367} {"train_loss": -33.9802131652832, "global_step": 44524, "epoch": 367} {"train_loss": -34.50950241088867, "global_step": 44525, "epoch": 367} {"train_loss": -34.34614181518555, "global_step": 44526, "epoch": 367} {"train_loss": -33.03830608060537, "global_step": 44527, "epoch": 367, "val_loss": 2387257.75} {"train_loss": -34.375709533691406, "global_step": 44528, "epoch": 368} {"train_loss": -33.3780403137207, "global_step": 44529, "epoch": 368} {"train_loss": -34.8197021484375, "global_step": 44530, "epoch": 368} {"train_loss": -33.88845443725586, "global_step": 44531, "epoch": 368} {"train_loss": -34.22370147705078, "global_step": 44532, "epoch": 368} {"train_loss": -34.60294723510742, "global_step": 44533, "epoch": 368} {"train_loss": -34.521583557128906, "global_step": 44534, "epoch": 368} {"train_loss": -33.81319046020508, "global_step": 44535, "epoch": 368} {"train_loss": -32.46262741088867, "global_step": 44536, "epoch": 368} {"train_loss": -34.031951904296875, "global_step": 44537, "epoch": 368} {"train_loss": -33.8016471862793, "global_step": 44538, "epoch": 368} {"train_loss": -33.764678955078125, "global_step": 44539, "epoch": 368} {"train_loss": -34.26737594604492, "global_step": 44540, "epoch": 368} {"train_loss": -32.82835388183594, "global_step": 44541, "epoch": 368} {"train_loss": -33.174659729003906, "global_step": 44542, "epoch": 368} {"train_loss": -33.567344665527344, "global_step": 44543, "epoch": 368} {"train_loss": -33.04587936401367, "global_step": 44544, "epoch": 368} {"train_loss": -32.59656524658203, "global_step": 44545, "epoch": 368} {"train_loss": -33.17841720581055, "global_step": 44546, "epoch": 368} {"train_loss": -32.82393264770508, "global_step": 44547, "epoch": 368} {"train_loss": -32.41115951538086, "global_step": 44548, "epoch": 368} {"train_loss": -33.275936126708984, "global_step": 44549, "epoch": 368} {"train_loss": -32.9586296081543, "global_step": 44550, "epoch": 368} {"train_loss": -33.30598449707031, "global_step": 44551, "epoch": 368} {"train_loss": -33.82399368286133, "global_step": 44552, "epoch": 368} {"train_loss": -32.47357940673828, "global_step": 44553, "epoch": 368} {"train_loss": -33.125614166259766, "global_step": 44554, "epoch": 368} {"train_loss": -31.545791625976562, "global_step": 44555, "epoch": 368} {"train_loss": -33.24956512451172, "global_step": 44556, "epoch": 368} {"train_loss": -32.9942741394043, "global_step": 44557, "epoch": 368} {"train_loss": -33.7928466796875, "global_step": 44558, "epoch": 368} {"train_loss": -32.54047775268555, "global_step": 44559, "epoch": 368} {"train_loss": -32.5317268371582, "global_step": 44560, "epoch": 368} {"train_loss": -33.37244415283203, "global_step": 44561, "epoch": 368} {"train_loss": -32.990962982177734, "global_step": 44562, "epoch": 368} {"train_loss": -33.60356140136719, "global_step": 44563, "epoch": 368} {"train_loss": -30.731191635131836, "global_step": 44564, "epoch": 368} {"train_loss": -32.60945510864258, "global_step": 44565, "epoch": 368} {"train_loss": -32.9238166809082, "global_step": 44566, "epoch": 368} {"train_loss": -33.661598205566406, "global_step": 44567, "epoch": 368} {"train_loss": -32.895973205566406, "global_step": 44568, "epoch": 368} {"train_loss": -33.24873733520508, "global_step": 44569, "epoch": 368} {"train_loss": -33.413822174072266, "global_step": 44570, "epoch": 368} {"train_loss": -33.409027099609375, "global_step": 44571, "epoch": 368} {"train_loss": -33.14119338989258, "global_step": 44572, "epoch": 368} {"train_loss": -30.8504638671875, "global_step": 44573, "epoch": 368} {"train_loss": -33.52238464355469, "global_step": 44574, "epoch": 368} {"train_loss": -33.50729751586914, "global_step": 44575, "epoch": 368} {"train_loss": -31.983570098876953, "global_step": 44576, "epoch": 368} {"train_loss": -32.86906051635742, "global_step": 44577, "epoch": 368} {"train_loss": -33.7926139831543, "global_step": 44578, "epoch": 368} {"train_loss": -32.4418830871582, "global_step": 44579, "epoch": 368} {"train_loss": -33.59906768798828, "global_step": 44580, "epoch": 368} {"train_loss": -34.17269515991211, "global_step": 44581, "epoch": 368} {"train_loss": -33.206764221191406, "global_step": 44582, "epoch": 368} {"train_loss": -32.483154296875, "global_step": 44583, "epoch": 368} {"train_loss": -33.51892852783203, "global_step": 44584, "epoch": 368} {"train_loss": -32.70545959472656, "global_step": 44585, "epoch": 368} {"train_loss": -34.11328125, "global_step": 44586, "epoch": 368} {"train_loss": -33.04288864135742, "global_step": 44587, "epoch": 368} {"train_loss": -33.73944854736328, "global_step": 44588, "epoch": 368} {"train_loss": -33.56594467163086, "global_step": 44589, "epoch": 368} {"train_loss": -33.44735336303711, "global_step": 44590, "epoch": 368} {"train_loss": -33.5646858215332, "global_step": 44591, "epoch": 368} {"train_loss": -32.96514892578125, "global_step": 44592, "epoch": 368} {"train_loss": -34.2943115234375, "global_step": 44593, "epoch": 368} {"train_loss": -33.761112213134766, "global_step": 44594, "epoch": 368} {"train_loss": -33.94611740112305, "global_step": 44595, "epoch": 368} {"train_loss": -34.11599349975586, "global_step": 44596, "epoch": 368} {"train_loss": -33.66412353515625, "global_step": 44597, "epoch": 368} {"train_loss": -33.35940170288086, "global_step": 44598, "epoch": 368} {"train_loss": -33.63705062866211, "global_step": 44599, "epoch": 368} {"train_loss": -33.811981201171875, "global_step": 44600, "epoch": 368} {"train_loss": -32.025962829589844, "global_step": 44601, "epoch": 368} {"train_loss": -32.975337982177734, "global_step": 44602, "epoch": 368} {"train_loss": -34.581111907958984, "global_step": 44603, "epoch": 368} {"train_loss": -33.96845626831055, "global_step": 44604, "epoch": 368} {"train_loss": -34.502113342285156, "global_step": 44605, "epoch": 368} {"train_loss": -34.1872444152832, "global_step": 44606, "epoch": 368} {"train_loss": -33.31831741333008, "global_step": 44607, "epoch": 368} {"train_loss": -33.95829772949219, "global_step": 44608, "epoch": 368} {"train_loss": -33.836788177490234, "global_step": 44609, "epoch": 368} {"train_loss": -33.899105072021484, "global_step": 44610, "epoch": 368} {"train_loss": -34.58552551269531, "global_step": 44611, "epoch": 368} {"train_loss": -34.35190963745117, "global_step": 44612, "epoch": 368} {"train_loss": -33.74087905883789, "global_step": 44613, "epoch": 368} {"train_loss": -34.69734191894531, "global_step": 44614, "epoch": 368} {"train_loss": -34.18238067626953, "global_step": 44615, "epoch": 368} {"train_loss": -32.89372634887695, "global_step": 44616, "epoch": 368} {"train_loss": -34.31856155395508, "global_step": 44617, "epoch": 368} {"train_loss": -34.99415969848633, "global_step": 44618, "epoch": 368} {"train_loss": -34.33837890625, "global_step": 44619, "epoch": 368} {"train_loss": -33.7570915222168, "global_step": 44620, "epoch": 368} {"train_loss": -34.82941436767578, "global_step": 44621, "epoch": 368} {"train_loss": -34.30842971801758, "global_step": 44622, "epoch": 368} {"train_loss": -34.01426315307617, "global_step": 44623, "epoch": 368} {"train_loss": -34.056339263916016, "global_step": 44624, "epoch": 368} {"train_loss": -34.543495178222656, "global_step": 44625, "epoch": 368} {"train_loss": -34.93794631958008, "global_step": 44626, "epoch": 368} {"train_loss": -35.1799201965332, "global_step": 44627, "epoch": 368} {"train_loss": -34.50948715209961, "global_step": 44628, "epoch": 368} {"train_loss": -34.60866928100586, "global_step": 44629, "epoch": 368} {"train_loss": -34.658111572265625, "global_step": 44630, "epoch": 368} {"train_loss": -34.4623908996582, "global_step": 44631, "epoch": 368} {"train_loss": -35.210227966308594, "global_step": 44632, "epoch": 368} {"train_loss": -34.69810104370117, "global_step": 44633, "epoch": 368} {"train_loss": -35.038150787353516, "global_step": 44634, "epoch": 368} {"train_loss": -33.10315704345703, "global_step": 44635, "epoch": 368} {"train_loss": -34.08675765991211, "global_step": 44636, "epoch": 368} {"train_loss": -32.56307601928711, "global_step": 44637, "epoch": 368} {"train_loss": -33.651344299316406, "global_step": 44638, "epoch": 368} {"train_loss": -33.95331954956055, "global_step": 44639, "epoch": 368} {"train_loss": -34.43319320678711, "global_step": 44640, "epoch": 368} {"train_loss": -33.475643157958984, "global_step": 44641, "epoch": 368} {"train_loss": -32.94386291503906, "global_step": 44642, "epoch": 368} {"train_loss": -34.03227615356445, "global_step": 44643, "epoch": 368} {"train_loss": -34.55758285522461, "global_step": 44644, "epoch": 368} {"train_loss": -33.16741180419922, "global_step": 44645, "epoch": 368} {"train_loss": -33.251617431640625, "global_step": 44646, "epoch": 368} {"train_loss": -33.3548698425293, "global_step": 44647, "epoch": 368} {"train_loss": -33.59709774364125, "global_step": 44648, "epoch": 368, "val_loss": 2541688.25} {"train_loss": -33.043678283691406, "global_step": 44649, "epoch": 369} {"train_loss": -33.07466506958008, "global_step": 44650, "epoch": 369} {"train_loss": -31.284515380859375, "global_step": 44651, "epoch": 369} {"train_loss": -30.862653732299805, "global_step": 44652, "epoch": 369} {"train_loss": -33.238285064697266, "global_step": 44653, "epoch": 369} {"train_loss": -32.40855026245117, "global_step": 44654, "epoch": 369} {"train_loss": -32.388153076171875, "global_step": 44655, "epoch": 369} {"train_loss": -31.11151123046875, "global_step": 44656, "epoch": 369} {"train_loss": -32.24658966064453, "global_step": 44657, "epoch": 369} {"train_loss": -32.972816467285156, "global_step": 44658, "epoch": 369} {"train_loss": -33.241878509521484, "global_step": 44659, "epoch": 369} {"train_loss": -32.538612365722656, "global_step": 44660, "epoch": 369} {"train_loss": -33.935791015625, "global_step": 44661, "epoch": 369} {"train_loss": -33.37837600708008, "global_step": 44662, "epoch": 369} {"train_loss": -33.2702751159668, "global_step": 44663, "epoch": 369} {"train_loss": -32.87630844116211, "global_step": 44664, "epoch": 369} {"train_loss": -33.37059783935547, "global_step": 44665, "epoch": 369} {"train_loss": -33.48851013183594, "global_step": 44666, "epoch": 369} {"train_loss": -33.84836196899414, "global_step": 44667, "epoch": 369} {"train_loss": -33.5404052734375, "global_step": 44668, "epoch": 369} {"train_loss": -33.593505859375, "global_step": 44669, "epoch": 369} {"train_loss": -33.95151901245117, "global_step": 44670, "epoch": 369} {"train_loss": -33.735538482666016, "global_step": 44671, "epoch": 369} {"train_loss": -33.76523971557617, "global_step": 44672, "epoch": 369} {"train_loss": -34.323848724365234, "global_step": 44673, "epoch": 369} {"train_loss": -31.162195205688477, "global_step": 44674, "epoch": 369} {"train_loss": -34.12714767456055, "global_step": 44675, "epoch": 369} {"train_loss": -33.92832565307617, "global_step": 44676, "epoch": 369} {"train_loss": -32.520912170410156, "global_step": 44677, "epoch": 369} {"train_loss": -34.07716751098633, "global_step": 44678, "epoch": 369} {"train_loss": -34.07621383666992, "global_step": 44679, "epoch": 369} {"train_loss": -34.03914260864258, "global_step": 44680, "epoch": 369} {"train_loss": -33.05139923095703, "global_step": 44681, "epoch": 369} {"train_loss": -34.6197395324707, "global_step": 44682, "epoch": 369} {"train_loss": -34.49941635131836, "global_step": 44683, "epoch": 369} {"train_loss": -33.89200973510742, "global_step": 44684, "epoch": 369} {"train_loss": -33.357357025146484, "global_step": 44685, "epoch": 369} {"train_loss": -34.2143440246582, "global_step": 44686, "epoch": 369} {"train_loss": -34.33120346069336, "global_step": 44687, "epoch": 369} {"train_loss": -34.81924057006836, "global_step": 44688, "epoch": 369} {"train_loss": -34.16307830810547, "global_step": 44689, "epoch": 369} {"train_loss": -33.467403411865234, "global_step": 44690, "epoch": 369} {"train_loss": -34.8067512512207, "global_step": 44691, "epoch": 369} {"train_loss": -34.1748161315918, "global_step": 44692, "epoch": 369} {"train_loss": -34.6851921081543, "global_step": 44693, "epoch": 369} {"train_loss": -33.79754638671875, "global_step": 44694, "epoch": 369} {"train_loss": -34.07250213623047, "global_step": 44695, "epoch": 369} {"train_loss": -33.803443908691406, "global_step": 44696, "epoch": 369} {"train_loss": -34.02783966064453, "global_step": 44697, "epoch": 369} {"train_loss": -34.86168670654297, "global_step": 44698, "epoch": 369} {"train_loss": -34.1954345703125, "global_step": 44699, "epoch": 369} {"train_loss": -33.969600677490234, "global_step": 44700, "epoch": 369} {"train_loss": -34.39889144897461, "global_step": 44701, "epoch": 369} {"train_loss": -33.89436340332031, "global_step": 44702, "epoch": 369} {"train_loss": -31.128854751586914, "global_step": 44703, "epoch": 369} {"train_loss": -29.34547996520996, "global_step": 44704, "epoch": 369} {"train_loss": -29.754703521728516, "global_step": 44705, "epoch": 369} {"train_loss": -32.70595169067383, "global_step": 44706, "epoch": 369} {"train_loss": -34.57543182373047, "global_step": 44707, "epoch": 369} {"train_loss": -32.28428268432617, "global_step": 44708, "epoch": 369} {"train_loss": -34.03580856323242, "global_step": 44709, "epoch": 369} {"train_loss": -33.271480560302734, "global_step": 44710, "epoch": 369} {"train_loss": -32.14674758911133, "global_step": 44711, "epoch": 369} {"train_loss": -34.211483001708984, "global_step": 44712, "epoch": 369} {"train_loss": -31.662216186523438, "global_step": 44713, "epoch": 369} {"train_loss": -34.43561935424805, "global_step": 44714, "epoch": 369} {"train_loss": -33.29480743408203, "global_step": 44715, "epoch": 369} {"train_loss": -34.18192672729492, "global_step": 44716, "epoch": 369} {"train_loss": -33.43202590942383, "global_step": 44717, "epoch": 369} {"train_loss": -33.88772964477539, "global_step": 44718, "epoch": 369} {"train_loss": -34.64530563354492, "global_step": 44719, "epoch": 369} {"train_loss": -34.014801025390625, "global_step": 44720, "epoch": 369} {"train_loss": -34.643489837646484, "global_step": 44721, "epoch": 369} {"train_loss": -34.00302505493164, "global_step": 44722, "epoch": 369} {"train_loss": -33.522193908691406, "global_step": 44723, "epoch": 369} {"train_loss": -34.17622756958008, "global_step": 44724, "epoch": 369} {"train_loss": -34.63169479370117, "global_step": 44725, "epoch": 369} {"train_loss": -33.66842269897461, "global_step": 44726, "epoch": 369} {"train_loss": -33.806175231933594, "global_step": 44727, "epoch": 369} {"train_loss": -33.37407684326172, "global_step": 44728, "epoch": 369} {"train_loss": -33.138763427734375, "global_step": 44729, "epoch": 369} {"train_loss": -33.64316177368164, "global_step": 44730, "epoch": 369} {"train_loss": -33.34670639038086, "global_step": 44731, "epoch": 369} {"train_loss": -33.901432037353516, "global_step": 44732, "epoch": 369} {"train_loss": -32.23835372924805, "global_step": 44733, "epoch": 369} {"train_loss": -33.865936279296875, "global_step": 44734, "epoch": 369} {"train_loss": -34.23439407348633, "global_step": 44735, "epoch": 369} {"train_loss": -34.07865524291992, "global_step": 44736, "epoch": 369} {"train_loss": -34.69485855102539, "global_step": 44737, "epoch": 369} {"train_loss": -33.412330627441406, "global_step": 44738, "epoch": 369} {"train_loss": -34.42745590209961, "global_step": 44739, "epoch": 369} {"train_loss": -34.475006103515625, "global_step": 44740, "epoch": 369} {"train_loss": -33.98382568359375, "global_step": 44741, "epoch": 369} {"train_loss": -34.13209915161133, "global_step": 44742, "epoch": 369} {"train_loss": -33.7712516784668, "global_step": 44743, "epoch": 369} {"train_loss": -34.38935852050781, "global_step": 44744, "epoch": 369} {"train_loss": -33.84274673461914, "global_step": 44745, "epoch": 369} {"train_loss": -34.554412841796875, "global_step": 44746, "epoch": 369} {"train_loss": -34.47169876098633, "global_step": 44747, "epoch": 369} {"train_loss": -33.73698043823242, "global_step": 44748, "epoch": 369} {"train_loss": -34.48955154418945, "global_step": 44749, "epoch": 369} {"train_loss": -34.43608474731445, "global_step": 44750, "epoch": 369} {"train_loss": -34.79653549194336, "global_step": 44751, "epoch": 369} {"train_loss": -33.739463806152344, "global_step": 44752, "epoch": 369} {"train_loss": -34.810543060302734, "global_step": 44753, "epoch": 369} {"train_loss": -34.30290985107422, "global_step": 44754, "epoch": 369} {"train_loss": -34.10732650756836, "global_step": 44755, "epoch": 369} {"train_loss": -34.471961975097656, "global_step": 44756, "epoch": 369} {"train_loss": -31.772146224975586, "global_step": 44757, "epoch": 369} {"train_loss": -33.30062484741211, "global_step": 44758, "epoch": 369} {"train_loss": -33.163818359375, "global_step": 44759, "epoch": 369} {"train_loss": -32.19955825805664, "global_step": 44760, "epoch": 369} {"train_loss": -32.28778839111328, "global_step": 44761, "epoch": 369} {"train_loss": -29.449960708618164, "global_step": 44762, "epoch": 369} {"train_loss": -32.11845016479492, "global_step": 44763, "epoch": 369} {"train_loss": -30.546823501586914, "global_step": 44764, "epoch": 369} {"train_loss": -31.32930564880371, "global_step": 44765, "epoch": 369} {"train_loss": -31.595579147338867, "global_step": 44766, "epoch": 369} {"train_loss": -31.688922882080078, "global_step": 44767, "epoch": 369} {"train_loss": -32.87473678588867, "global_step": 44768, "epoch": 369} {"train_loss": -33.41194955179514, "global_step": 44769, "epoch": 369, "val_loss": 2769388.75} {"train_loss": -32.46467971801758, "global_step": 44770, "epoch": 370} {"train_loss": -32.228309631347656, "global_step": 44771, "epoch": 370} {"train_loss": -31.220722198486328, "global_step": 44772, "epoch": 370} {"train_loss": -31.44089126586914, "global_step": 44773, "epoch": 370} {"train_loss": -30.529376983642578, "global_step": 44774, "epoch": 370} {"train_loss": -32.50228500366211, "global_step": 44775, "epoch": 370} {"train_loss": -30.467227935791016, "global_step": 44776, "epoch": 370} {"train_loss": -31.099027633666992, "global_step": 44777, "epoch": 370} {"train_loss": -29.407886505126953, "global_step": 44778, "epoch": 370} {"train_loss": -30.04183006286621, "global_step": 44779, "epoch": 370} {"train_loss": -31.6270751953125, "global_step": 44780, "epoch": 370} {"train_loss": -33.710330963134766, "global_step": 44781, "epoch": 370} {"train_loss": -32.087501525878906, "global_step": 44782, "epoch": 370} {"train_loss": -31.80938148498535, "global_step": 44783, "epoch": 370} {"train_loss": -32.953338623046875, "global_step": 44784, "epoch": 370} {"train_loss": -32.216915130615234, "global_step": 44785, "epoch": 370} {"train_loss": -32.9803466796875, "global_step": 44786, "epoch": 370} {"train_loss": -32.88636016845703, "global_step": 44787, "epoch": 370} {"train_loss": -32.702003479003906, "global_step": 44788, "epoch": 370} {"train_loss": -33.64931869506836, "global_step": 44789, "epoch": 370} {"train_loss": -33.123233795166016, "global_step": 44790, "epoch": 370} {"train_loss": -33.4222412109375, "global_step": 44791, "epoch": 370} {"train_loss": -32.729610443115234, "global_step": 44792, "epoch": 370} {"train_loss": -33.79710006713867, "global_step": 44793, "epoch": 370} {"train_loss": -34.058467864990234, "global_step": 44794, "epoch": 370} {"train_loss": -32.98982620239258, "global_step": 44795, "epoch": 370} {"train_loss": -33.326454162597656, "global_step": 44796, "epoch": 370} {"train_loss": -33.66096878051758, "global_step": 44797, "epoch": 370} {"train_loss": -33.83174133300781, "global_step": 44798, "epoch": 370} {"train_loss": -33.61536407470703, "global_step": 44799, "epoch": 370} {"train_loss": -33.324337005615234, "global_step": 44800, "epoch": 370} {"train_loss": -33.60725402832031, "global_step": 44801, "epoch": 370} {"train_loss": -33.65822219848633, "global_step": 44802, "epoch": 370} {"train_loss": -33.34198760986328, "global_step": 44803, "epoch": 370} {"train_loss": -33.501853942871094, "global_step": 44804, "epoch": 370} {"train_loss": -33.32267761230469, "global_step": 44805, "epoch": 370} {"train_loss": -34.312191009521484, "global_step": 44806, "epoch": 370} {"train_loss": -34.01783752441406, "global_step": 44807, "epoch": 370} {"train_loss": -34.03480911254883, "global_step": 44808, "epoch": 370} {"train_loss": -34.866329193115234, "global_step": 44809, "epoch": 370} {"train_loss": -33.975196838378906, "global_step": 44810, "epoch": 370} {"train_loss": -34.595550537109375, "global_step": 44811, "epoch": 370} {"train_loss": -34.69855880737305, "global_step": 44812, "epoch": 370} {"train_loss": -34.41748046875, "global_step": 44813, "epoch": 370} {"train_loss": -34.07861328125, "global_step": 44814, "epoch": 370} {"train_loss": -35.0659294128418, "global_step": 44815, "epoch": 370} {"train_loss": -34.76966857910156, "global_step": 44816, "epoch": 370} {"train_loss": -34.28261947631836, "global_step": 44817, "epoch": 370} {"train_loss": -35.09199142456055, "global_step": 44818, "epoch": 370} {"train_loss": -35.12416076660156, "global_step": 44819, "epoch": 370} {"train_loss": -35.27892303466797, "global_step": 44820, "epoch": 370} {"train_loss": -35.08079528808594, "global_step": 44821, "epoch": 370} {"train_loss": -34.90203857421875, "global_step": 44822, "epoch": 370} {"train_loss": -34.759674072265625, "global_step": 44823, "epoch": 370} {"train_loss": -35.50989532470703, "global_step": 44824, "epoch": 370} {"train_loss": -34.9074821472168, "global_step": 44825, "epoch": 370} {"train_loss": -35.317169189453125, "global_step": 44826, "epoch": 370} {"train_loss": -35.11284255981445, "global_step": 44827, "epoch": 370} {"train_loss": -35.13557434082031, "global_step": 44828, "epoch": 370} {"train_loss": -34.9957389831543, "global_step": 44829, "epoch": 370} {"train_loss": -34.916282653808594, "global_step": 44830, "epoch": 370} {"train_loss": -34.90266799926758, "global_step": 44831, "epoch": 370} {"train_loss": -35.31452941894531, "global_step": 44832, "epoch": 370} {"train_loss": -35.11436080932617, "global_step": 44833, "epoch": 370} {"train_loss": -35.26694869995117, "global_step": 44834, "epoch": 370} {"train_loss": -35.53214645385742, "global_step": 44835, "epoch": 370} {"train_loss": -35.08149337768555, "global_step": 44836, "epoch": 370} {"train_loss": -35.57163619995117, "global_step": 44837, "epoch": 370} {"train_loss": -35.41724395751953, "global_step": 44838, "epoch": 370} {"train_loss": -35.04568862915039, "global_step": 44839, "epoch": 370} {"train_loss": -35.53853988647461, "global_step": 44840, "epoch": 370} {"train_loss": -34.901485443115234, "global_step": 44841, "epoch": 370} {"train_loss": -34.94997024536133, "global_step": 44842, "epoch": 370} {"train_loss": -34.5848388671875, "global_step": 44843, "epoch": 370} {"train_loss": -33.34593963623047, "global_step": 44844, "epoch": 370} {"train_loss": -35.1893310546875, "global_step": 44845, "epoch": 370} {"train_loss": -34.86244583129883, "global_step": 44846, "epoch": 370} {"train_loss": -33.91079330444336, "global_step": 44847, "epoch": 370} {"train_loss": -33.2417106628418, "global_step": 44848, "epoch": 370} {"train_loss": -33.938411712646484, "global_step": 44849, "epoch": 370} {"train_loss": -34.36516189575195, "global_step": 44850, "epoch": 370} {"train_loss": -30.496124267578125, "global_step": 44851, "epoch": 370} {"train_loss": -24.306364059448242, "global_step": 44852, "epoch": 370} {"train_loss": -18.195362091064453, "global_step": 44853, "epoch": 370} {"train_loss": -18.603017807006836, "global_step": 44854, "epoch": 370} {"train_loss": -34.07003402709961, "global_step": 44855, "epoch": 370} {"train_loss": -25.64630699157715, "global_step": 44856, "epoch": 370} {"train_loss": -32.785926818847656, "global_step": 44857, "epoch": 370} {"train_loss": -27.745502471923828, "global_step": 44858, "epoch": 370} {"train_loss": -31.539106369018555, "global_step": 44859, "epoch": 370} {"train_loss": -30.508329391479492, "global_step": 44860, "epoch": 370} {"train_loss": -30.81568717956543, "global_step": 44861, "epoch": 370} {"train_loss": -33.333553314208984, "global_step": 44862, "epoch": 370} {"train_loss": -32.403995513916016, "global_step": 44863, "epoch": 370} {"train_loss": -31.00957679748535, "global_step": 44864, "epoch": 370} {"train_loss": -31.558401107788086, "global_step": 44865, "epoch": 370} {"train_loss": -32.36112594604492, "global_step": 44866, "epoch": 370} {"train_loss": -32.43450927734375, "global_step": 44867, "epoch": 370} {"train_loss": -32.150909423828125, "global_step": 44868, "epoch": 370} {"train_loss": -32.330867767333984, "global_step": 44869, "epoch": 370} {"train_loss": -32.762943267822266, "global_step": 44870, "epoch": 370} {"train_loss": -32.9374885559082, "global_step": 44871, "epoch": 370} {"train_loss": -32.583274841308594, "global_step": 44872, "epoch": 370} {"train_loss": -32.58844757080078, "global_step": 44873, "epoch": 370} {"train_loss": -33.0485725402832, "global_step": 44874, "epoch": 370} {"train_loss": -33.26909255981445, "global_step": 44875, "epoch": 370} {"train_loss": -33.8327751159668, "global_step": 44876, "epoch": 370} {"train_loss": -33.47379684448242, "global_step": 44877, "epoch": 370} {"train_loss": -33.00921630859375, "global_step": 44878, "epoch": 370} {"train_loss": -33.058631896972656, "global_step": 44879, "epoch": 370} {"train_loss": -32.83359909057617, "global_step": 44880, "epoch": 370} {"train_loss": -33.444576263427734, "global_step": 44881, "epoch": 370} {"train_loss": -33.75479507446289, "global_step": 44882, "epoch": 370} {"train_loss": -34.00631332397461, "global_step": 44883, "epoch": 370} {"train_loss": -33.409271240234375, "global_step": 44884, "epoch": 370} {"train_loss": -33.30222702026367, "global_step": 44885, "epoch": 370} {"train_loss": -33.592628479003906, "global_step": 44886, "epoch": 370} {"train_loss": -33.89488220214844, "global_step": 44887, "epoch": 370} {"train_loss": -33.898963928222656, "global_step": 44888, "epoch": 370} {"train_loss": -34.227203369140625, "global_step": 44889, "epoch": 370} {"train_loss": -33.070602905651754, "global_step": 44890, "epoch": 370, "val_loss": 2606314.25} {"train_loss": -33.73329162597656, "global_step": 44891, "epoch": 371} {"train_loss": -34.22683334350586, "global_step": 44892, "epoch": 371} {"train_loss": -33.73841094970703, "global_step": 44893, "epoch": 371} {"train_loss": -34.369873046875, "global_step": 44894, "epoch": 371} {"train_loss": -34.042057037353516, "global_step": 44895, "epoch": 371} {"train_loss": -34.61647415161133, "global_step": 44896, "epoch": 371} {"train_loss": -34.11323928833008, "global_step": 44897, "epoch": 371} {"train_loss": -34.30332565307617, "global_step": 44898, "epoch": 371} {"train_loss": -34.26035690307617, "global_step": 44899, "epoch": 371} {"train_loss": -34.20718765258789, "global_step": 44900, "epoch": 371} {"train_loss": -34.00027847290039, "global_step": 44901, "epoch": 371} {"train_loss": -34.7439079284668, "global_step": 44902, "epoch": 371} {"train_loss": -34.64680862426758, "global_step": 44903, "epoch": 371} {"train_loss": -34.3815803527832, "global_step": 44904, "epoch": 371} {"train_loss": -35.01060104370117, "global_step": 44905, "epoch": 371} {"train_loss": -35.20630645751953, "global_step": 44906, "epoch": 371} {"train_loss": -34.849037170410156, "global_step": 44907, "epoch": 371} {"train_loss": -34.72860336303711, "global_step": 44908, "epoch": 371} {"train_loss": -35.0158576965332, "global_step": 44909, "epoch": 371} {"train_loss": -34.6813850402832, "global_step": 44910, "epoch": 371} {"train_loss": -34.86184310913086, "global_step": 44911, "epoch": 371} {"train_loss": -35.00495529174805, "global_step": 44912, "epoch": 371} {"train_loss": -34.63019561767578, "global_step": 44913, "epoch": 371} {"train_loss": -33.65060043334961, "global_step": 44914, "epoch": 371} {"train_loss": -33.0064582824707, "global_step": 44915, "epoch": 371} {"train_loss": -32.72166061401367, "global_step": 44916, "epoch": 371} {"train_loss": -33.63685989379883, "global_step": 44917, "epoch": 371} {"train_loss": -33.0803337097168, "global_step": 44918, "epoch": 371} {"train_loss": -34.11333084106445, "global_step": 44919, "epoch": 371} {"train_loss": -34.99079513549805, "global_step": 44920, "epoch": 371} {"train_loss": -34.9915885925293, "global_step": 44921, "epoch": 371} {"train_loss": -34.761573791503906, "global_step": 44922, "epoch": 371} {"train_loss": -32.686767578125, "global_step": 44923, "epoch": 371} {"train_loss": -34.07046127319336, "global_step": 44924, "epoch": 371} {"train_loss": -34.43801498413086, "global_step": 44925, "epoch": 371} {"train_loss": -34.38904571533203, "global_step": 44926, "epoch": 371} {"train_loss": -34.9230842590332, "global_step": 44927, "epoch": 371} {"train_loss": -33.90522766113281, "global_step": 44928, "epoch": 371} {"train_loss": -34.56356430053711, "global_step": 44929, "epoch": 371} {"train_loss": -33.94609451293945, "global_step": 44930, "epoch": 371} {"train_loss": -34.50789260864258, "global_step": 44931, "epoch": 371} {"train_loss": -33.677001953125, "global_step": 44932, "epoch": 371} {"train_loss": -33.350250244140625, "global_step": 44933, "epoch": 371} {"train_loss": -33.60036087036133, "global_step": 44934, "epoch": 371} {"train_loss": -34.82838821411133, "global_step": 44935, "epoch": 371} {"train_loss": -33.865478515625, "global_step": 44936, "epoch": 371} {"train_loss": -32.45513153076172, "global_step": 44937, "epoch": 371} {"train_loss": -31.957422256469727, "global_step": 44938, "epoch": 371} {"train_loss": -33.93712615966797, "global_step": 44939, "epoch": 371} {"train_loss": -32.29940414428711, "global_step": 44940, "epoch": 371} {"train_loss": -33.075927734375, "global_step": 44941, "epoch": 371} {"train_loss": -34.25336456298828, "global_step": 44942, "epoch": 371} {"train_loss": -32.28559112548828, "global_step": 44943, "epoch": 371} {"train_loss": -33.37190246582031, "global_step": 44944, "epoch": 371} {"train_loss": -32.87520217895508, "global_step": 44945, "epoch": 371} {"train_loss": -32.7512092590332, "global_step": 44946, "epoch": 371} {"train_loss": -33.179927825927734, "global_step": 44947, "epoch": 371} {"train_loss": -33.87107467651367, "global_step": 44948, "epoch": 371} {"train_loss": -33.671607971191406, "global_step": 44949, "epoch": 371} {"train_loss": -33.742610931396484, "global_step": 44950, "epoch": 371} {"train_loss": -32.66774368286133, "global_step": 44951, "epoch": 371} {"train_loss": -32.32416915893555, "global_step": 44952, "epoch": 371} {"train_loss": -33.563392639160156, "global_step": 44953, "epoch": 371} {"train_loss": -34.00374984741211, "global_step": 44954, "epoch": 371} {"train_loss": -33.612850189208984, "global_step": 44955, "epoch": 371} {"train_loss": -32.31877517700195, "global_step": 44956, "epoch": 371} {"train_loss": -32.67254638671875, "global_step": 44957, "epoch": 371} {"train_loss": -32.34064865112305, "global_step": 44958, "epoch": 371} {"train_loss": -33.70750045776367, "global_step": 44959, "epoch": 371} {"train_loss": -34.25031661987305, "global_step": 44960, "epoch": 371} {"train_loss": -34.17244338989258, "global_step": 44961, "epoch": 371} {"train_loss": -33.4408073425293, "global_step": 44962, "epoch": 371} {"train_loss": -33.92442321777344, "global_step": 44963, "epoch": 371} {"train_loss": -33.615875244140625, "global_step": 44964, "epoch": 371} {"train_loss": -33.11484909057617, "global_step": 44965, "epoch": 371} {"train_loss": -33.654457092285156, "global_step": 44966, "epoch": 371} {"train_loss": -33.86603927612305, "global_step": 44967, "epoch": 371} {"train_loss": -33.48206329345703, "global_step": 44968, "epoch": 371} {"train_loss": -32.924537658691406, "global_step": 44969, "epoch": 371} {"train_loss": -33.787879943847656, "global_step": 44970, "epoch": 371} {"train_loss": -33.6677360534668, "global_step": 44971, "epoch": 371} {"train_loss": -34.47650909423828, "global_step": 44972, "epoch": 371} {"train_loss": -33.49201202392578, "global_step": 44973, "epoch": 371} {"train_loss": -34.19905090332031, "global_step": 44974, "epoch": 371} {"train_loss": -33.98649597167969, "global_step": 44975, "epoch": 371} {"train_loss": -33.93074417114258, "global_step": 44976, "epoch": 371} {"train_loss": -33.982215881347656, "global_step": 44977, "epoch": 371} {"train_loss": -33.4318733215332, "global_step": 44978, "epoch": 371} {"train_loss": -33.83289337158203, "global_step": 44979, "epoch": 371} {"train_loss": -31.168088912963867, "global_step": 44980, "epoch": 371} {"train_loss": -33.27519989013672, "global_step": 44981, "epoch": 371} {"train_loss": -33.50624465942383, "global_step": 44982, "epoch": 371} {"train_loss": -32.996299743652344, "global_step": 44983, "epoch": 371} {"train_loss": -32.787261962890625, "global_step": 44984, "epoch": 371} {"train_loss": -32.849605560302734, "global_step": 44985, "epoch": 371} {"train_loss": -33.898040771484375, "global_step": 44986, "epoch": 371} {"train_loss": -33.7280158996582, "global_step": 44987, "epoch": 371} {"train_loss": -34.32905197143555, "global_step": 44988, "epoch": 371} {"train_loss": -33.08588790893555, "global_step": 44989, "epoch": 371} {"train_loss": -33.161128997802734, "global_step": 44990, "epoch": 371} {"train_loss": -32.80228805541992, "global_step": 44991, "epoch": 371} {"train_loss": -33.57543182373047, "global_step": 44992, "epoch": 371} {"train_loss": -34.16352081298828, "global_step": 44993, "epoch": 371} {"train_loss": -34.41139221191406, "global_step": 44994, "epoch": 371} {"train_loss": -34.601844787597656, "global_step": 44995, "epoch": 371} {"train_loss": -33.045127868652344, "global_step": 44996, "epoch": 371} {"train_loss": -33.79827117919922, "global_step": 44997, "epoch": 371} {"train_loss": -33.213375091552734, "global_step": 44998, "epoch": 371} {"train_loss": -34.91048812866211, "global_step": 44999, "epoch": 371} {"train_loss": -33.99065017700195, "global_step": 45000, "epoch": 371} {"train_loss": -32.27138900756836, "global_step": 45001, "epoch": 371} {"train_loss": -34.38053512573242, "global_step": 45002, "epoch": 371} {"train_loss": -34.6308479309082, "global_step": 45003, "epoch": 371} {"train_loss": -34.27324295043945, "global_step": 45004, "epoch": 371} {"train_loss": -32.558448791503906, "global_step": 45005, "epoch": 371} {"train_loss": -30.267093658447266, "global_step": 45006, "epoch": 371} {"train_loss": -33.030879974365234, "global_step": 45007, "epoch": 371} {"train_loss": -34.3798942565918, "global_step": 45008, "epoch": 371} {"train_loss": -31.711811065673828, "global_step": 45009, "epoch": 371} {"train_loss": -30.699817657470703, "global_step": 45010, "epoch": 371} {"train_loss": -33.69161142396533, "global_step": 45011, "epoch": 371, "val_loss": 2585297.0} {"train_loss": -33.753662109375, "global_step": 45012, "epoch": 372} {"train_loss": -34.19004440307617, "global_step": 45013, "epoch": 372} {"train_loss": -31.865966796875, "global_step": 45014, "epoch": 372} {"train_loss": -33.76711654663086, "global_step": 45015, "epoch": 372} {"train_loss": -33.86634063720703, "global_step": 45016, "epoch": 372} {"train_loss": -32.1542854309082, "global_step": 45017, "epoch": 372} {"train_loss": -33.12242889404297, "global_step": 45018, "epoch": 372} {"train_loss": -34.04207992553711, "global_step": 45019, "epoch": 372} {"train_loss": -34.240234375, "global_step": 45020, "epoch": 372} {"train_loss": -33.47705078125, "global_step": 45021, "epoch": 372} {"train_loss": -33.73978805541992, "global_step": 45022, "epoch": 372} {"train_loss": -33.89917755126953, "global_step": 45023, "epoch": 372} {"train_loss": -33.873294830322266, "global_step": 45024, "epoch": 372} {"train_loss": -33.1125602722168, "global_step": 45025, "epoch": 372} {"train_loss": -33.524147033691406, "global_step": 45026, "epoch": 372} {"train_loss": -33.50851058959961, "global_step": 45027, "epoch": 372} {"train_loss": -33.10910415649414, "global_step": 45028, "epoch": 372} {"train_loss": -34.33094024658203, "global_step": 45029, "epoch": 372} {"train_loss": -34.232521057128906, "global_step": 45030, "epoch": 372} {"train_loss": -33.72734832763672, "global_step": 45031, "epoch": 372} {"train_loss": -34.13135528564453, "global_step": 45032, "epoch": 372} {"train_loss": -34.097869873046875, "global_step": 45033, "epoch": 372} {"train_loss": -33.80836868286133, "global_step": 45034, "epoch": 372} {"train_loss": -33.7366828918457, "global_step": 45035, "epoch": 372} {"train_loss": -34.15264129638672, "global_step": 45036, "epoch": 372} {"train_loss": -34.62480163574219, "global_step": 45037, "epoch": 372} {"train_loss": -33.693782806396484, "global_step": 45038, "epoch": 372} {"train_loss": -32.73617172241211, "global_step": 45039, "epoch": 372} {"train_loss": -33.69492721557617, "global_step": 45040, "epoch": 372} {"train_loss": -34.11420822143555, "global_step": 45041, "epoch": 372} {"train_loss": -33.93636703491211, "global_step": 45042, "epoch": 372} {"train_loss": -33.910152435302734, "global_step": 45043, "epoch": 372} {"train_loss": -34.14268493652344, "global_step": 45044, "epoch": 372} {"train_loss": -34.224212646484375, "global_step": 45045, "epoch": 372} {"train_loss": -34.656490325927734, "global_step": 45046, "epoch": 372} {"train_loss": -34.28731155395508, "global_step": 45047, "epoch": 372} {"train_loss": -32.46184158325195, "global_step": 45048, "epoch": 372} {"train_loss": -32.86467742919922, "global_step": 45049, "epoch": 372} {"train_loss": -34.176185607910156, "global_step": 45050, "epoch": 372} {"train_loss": -34.29151916503906, "global_step": 45051, "epoch": 372} {"train_loss": -34.22915267944336, "global_step": 45052, "epoch": 372} {"train_loss": -33.85001754760742, "global_step": 45053, "epoch": 372} {"train_loss": -34.02286148071289, "global_step": 45054, "epoch": 372} {"train_loss": -34.35441589355469, "global_step": 45055, "epoch": 372} {"train_loss": -35.2393798828125, "global_step": 45056, "epoch": 372} {"train_loss": -34.466514587402344, "global_step": 45057, "epoch": 372} {"train_loss": -34.18302536010742, "global_step": 45058, "epoch": 372} {"train_loss": -35.269710540771484, "global_step": 45059, "epoch": 372} {"train_loss": -34.7693977355957, "global_step": 45060, "epoch": 372} {"train_loss": -33.95949172973633, "global_step": 45061, "epoch": 372} {"train_loss": -32.85457992553711, "global_step": 45062, "epoch": 372} {"train_loss": -35.02427291870117, "global_step": 45063, "epoch": 372} {"train_loss": -34.220680236816406, "global_step": 45064, "epoch": 372} {"train_loss": -33.7188835144043, "global_step": 45065, "epoch": 372} {"train_loss": -32.606571197509766, "global_step": 45066, "epoch": 372} {"train_loss": -34.64418411254883, "global_step": 45067, "epoch": 372} {"train_loss": -34.636383056640625, "global_step": 45068, "epoch": 372} {"train_loss": -34.1340217590332, "global_step": 45069, "epoch": 372} {"train_loss": -35.21064758300781, "global_step": 45070, "epoch": 372} {"train_loss": -34.9327278137207, "global_step": 45071, "epoch": 372} {"train_loss": -34.81148910522461, "global_step": 45072, "epoch": 372} {"train_loss": -34.6103401184082, "global_step": 45073, "epoch": 372} {"train_loss": -35.21210861206055, "global_step": 45074, "epoch": 372} {"train_loss": -35.080379486083984, "global_step": 45075, "epoch": 372} {"train_loss": -35.43824005126953, "global_step": 45076, "epoch": 372} {"train_loss": -35.024593353271484, "global_step": 45077, "epoch": 372} {"train_loss": -34.53122329711914, "global_step": 45078, "epoch": 372} {"train_loss": -34.86520004272461, "global_step": 45079, "epoch": 372} {"train_loss": -35.10723876953125, "global_step": 45080, "epoch": 372} {"train_loss": -34.41597366333008, "global_step": 45081, "epoch": 372} {"train_loss": -35.12494659423828, "global_step": 45082, "epoch": 372} {"train_loss": -34.90867233276367, "global_step": 45083, "epoch": 372} {"train_loss": -35.37478256225586, "global_step": 45084, "epoch": 372} {"train_loss": -34.74861526489258, "global_step": 45085, "epoch": 372} {"train_loss": -35.31205368041992, "global_step": 45086, "epoch": 372} {"train_loss": -34.78447341918945, "global_step": 45087, "epoch": 372} {"train_loss": -35.142578125, "global_step": 45088, "epoch": 372} {"train_loss": -35.10141372680664, "global_step": 45089, "epoch": 372} {"train_loss": -35.0699348449707, "global_step": 45090, "epoch": 372} {"train_loss": -35.74409866333008, "global_step": 45091, "epoch": 372} {"train_loss": -34.84663009643555, "global_step": 45092, "epoch": 372} {"train_loss": -34.634521484375, "global_step": 45093, "epoch": 372} {"train_loss": -34.722896575927734, "global_step": 45094, "epoch": 372} {"train_loss": -34.31338882446289, "global_step": 45095, "epoch": 372} {"train_loss": -34.16591262817383, "global_step": 45096, "epoch": 372} {"train_loss": -34.4028434753418, "global_step": 45097, "epoch": 372} {"train_loss": -34.47673797607422, "global_step": 45098, "epoch": 372} {"train_loss": -34.89521408081055, "global_step": 45099, "epoch": 372} {"train_loss": -35.6504020690918, "global_step": 45100, "epoch": 372} {"train_loss": -35.863304138183594, "global_step": 45101, "epoch": 372} {"train_loss": -35.50128936767578, "global_step": 45102, "epoch": 372} {"train_loss": -35.937252044677734, "global_step": 45103, "epoch": 372} {"train_loss": -35.59566116333008, "global_step": 45104, "epoch": 372} {"train_loss": -34.538639068603516, "global_step": 45105, "epoch": 372} {"train_loss": -32.945430755615234, "global_step": 45106, "epoch": 372} {"train_loss": -32.638484954833984, "global_step": 45107, "epoch": 372} {"train_loss": -32.68205642700195, "global_step": 45108, "epoch": 372} {"train_loss": -33.047882080078125, "global_step": 45109, "epoch": 372} {"train_loss": -34.223487854003906, "global_step": 45110, "epoch": 372} {"train_loss": -33.829246520996094, "global_step": 45111, "epoch": 372} {"train_loss": -34.47172164916992, "global_step": 45112, "epoch": 372} {"train_loss": -35.149131774902344, "global_step": 45113, "epoch": 372} {"train_loss": -33.98601150512695, "global_step": 45114, "epoch": 372} {"train_loss": -34.8552360534668, "global_step": 45115, "epoch": 372} {"train_loss": -34.404273986816406, "global_step": 45116, "epoch": 372} {"train_loss": -34.59393310546875, "global_step": 45117, "epoch": 372} {"train_loss": -35.10780715942383, "global_step": 45118, "epoch": 372} {"train_loss": -35.101173400878906, "global_step": 45119, "epoch": 372} {"train_loss": -34.23908615112305, "global_step": 45120, "epoch": 372} {"train_loss": -33.537166595458984, "global_step": 45121, "epoch": 372} {"train_loss": -33.298500061035156, "global_step": 45122, "epoch": 372} {"train_loss": -31.301950454711914, "global_step": 45123, "epoch": 372} {"train_loss": -32.00869369506836, "global_step": 45124, "epoch": 372} {"train_loss": -33.478477478027344, "global_step": 45125, "epoch": 372} {"train_loss": -34.58453369140625, "global_step": 45126, "epoch": 372} {"train_loss": -32.89429473876953, "global_step": 45127, "epoch": 372} {"train_loss": -33.62453842163086, "global_step": 45128, "epoch": 372} {"train_loss": -35.222652435302734, "global_step": 45129, "epoch": 372} {"train_loss": -32.7601432800293, "global_step": 45130, "epoch": 372} {"train_loss": -31.9325008392334, "global_step": 45131, "epoch": 372} {"train_loss": -34.172212490365524, "global_step": 45132, "epoch": 372, "val_loss": 2551090.75} {"train_loss": -33.682098388671875, "global_step": 45133, "epoch": 373} {"train_loss": -32.09264373779297, "global_step": 45134, "epoch": 373} {"train_loss": -32.99605178833008, "global_step": 45135, "epoch": 373} {"train_loss": -33.288551330566406, "global_step": 45136, "epoch": 373} {"train_loss": -33.98218536376953, "global_step": 45137, "epoch": 373} {"train_loss": -34.440277099609375, "global_step": 45138, "epoch": 373} {"train_loss": -32.50251007080078, "global_step": 45139, "epoch": 373} {"train_loss": -33.73971176147461, "global_step": 45140, "epoch": 373} {"train_loss": -34.8186149597168, "global_step": 45141, "epoch": 373} {"train_loss": -33.576576232910156, "global_step": 45142, "epoch": 373} {"train_loss": -34.03736114501953, "global_step": 45143, "epoch": 373} {"train_loss": -33.9961051940918, "global_step": 45144, "epoch": 373} {"train_loss": -34.249725341796875, "global_step": 45145, "epoch": 373} {"train_loss": -33.86283493041992, "global_step": 45146, "epoch": 373} {"train_loss": -33.923763275146484, "global_step": 45147, "epoch": 373} {"train_loss": -33.39755630493164, "global_step": 45148, "epoch": 373} {"train_loss": -34.40864181518555, "global_step": 45149, "epoch": 373} {"train_loss": -34.095252990722656, "global_step": 45150, "epoch": 373} {"train_loss": -33.77342224121094, "global_step": 45151, "epoch": 373} {"train_loss": -32.96212387084961, "global_step": 45152, "epoch": 373} {"train_loss": -34.47621536254883, "global_step": 45153, "epoch": 373} {"train_loss": -33.68880844116211, "global_step": 45154, "epoch": 373} {"train_loss": -34.1677360534668, "global_step": 45155, "epoch": 373} {"train_loss": -33.000614166259766, "global_step": 45156, "epoch": 373} {"train_loss": -34.17562484741211, "global_step": 45157, "epoch": 373} {"train_loss": -34.06012725830078, "global_step": 45158, "epoch": 373} {"train_loss": -33.570823669433594, "global_step": 45159, "epoch": 373} {"train_loss": -34.009674072265625, "global_step": 45160, "epoch": 373} {"train_loss": -34.179664611816406, "global_step": 45161, "epoch": 373} {"train_loss": -34.67192840576172, "global_step": 45162, "epoch": 373} {"train_loss": -32.841312408447266, "global_step": 45163, "epoch": 373} {"train_loss": -33.888999938964844, "global_step": 45164, "epoch": 373} {"train_loss": -33.85850143432617, "global_step": 45165, "epoch": 373} {"train_loss": -34.66902542114258, "global_step": 45166, "epoch": 373} {"train_loss": -33.68140411376953, "global_step": 45167, "epoch": 373} {"train_loss": -33.865509033203125, "global_step": 45168, "epoch": 373} {"train_loss": -33.37094497680664, "global_step": 45169, "epoch": 373} {"train_loss": -34.36040115356445, "global_step": 45170, "epoch": 373} {"train_loss": -34.08943557739258, "global_step": 45171, "epoch": 373} {"train_loss": -34.11842727661133, "global_step": 45172, "epoch": 373} {"train_loss": -33.743160247802734, "global_step": 45173, "epoch": 373} {"train_loss": -33.62788772583008, "global_step": 45174, "epoch": 373} {"train_loss": -34.19626998901367, "global_step": 45175, "epoch": 373} {"train_loss": -33.35261154174805, "global_step": 45176, "epoch": 373} {"train_loss": -34.24496841430664, "global_step": 45177, "epoch": 373} {"train_loss": -34.38911819458008, "global_step": 45178, "epoch": 373} {"train_loss": -33.92588424682617, "global_step": 45179, "epoch": 373} {"train_loss": -33.82936096191406, "global_step": 45180, "epoch": 373} {"train_loss": -33.34619140625, "global_step": 45181, "epoch": 373} {"train_loss": -34.233699798583984, "global_step": 45182, "epoch": 373} {"train_loss": -34.90217590332031, "global_step": 45183, "epoch": 373} {"train_loss": -33.6854362487793, "global_step": 45184, "epoch": 373} {"train_loss": -33.35151290893555, "global_step": 45185, "epoch": 373} {"train_loss": -34.231136322021484, "global_step": 45186, "epoch": 373} {"train_loss": -34.37301254272461, "global_step": 45187, "epoch": 373} {"train_loss": -33.32074737548828, "global_step": 45188, "epoch": 373} {"train_loss": -33.74825668334961, "global_step": 45189, "epoch": 373} {"train_loss": -33.391265869140625, "global_step": 45190, "epoch": 373} {"train_loss": -34.2921142578125, "global_step": 45191, "epoch": 373} {"train_loss": -33.22831344604492, "global_step": 45192, "epoch": 373} {"train_loss": -30.871870040893555, "global_step": 45193, "epoch": 373} {"train_loss": -30.62282371520996, "global_step": 45194, "epoch": 373} {"train_loss": -31.968000411987305, "global_step": 45195, "epoch": 373} {"train_loss": -34.22465896606445, "global_step": 45196, "epoch": 373} {"train_loss": -34.50019454956055, "global_step": 45197, "epoch": 373} {"train_loss": -34.27151107788086, "global_step": 45198, "epoch": 373} {"train_loss": -34.573970794677734, "global_step": 45199, "epoch": 373} {"train_loss": -34.441341400146484, "global_step": 45200, "epoch": 373} {"train_loss": -33.68310546875, "global_step": 45201, "epoch": 373} {"train_loss": -34.63817596435547, "global_step": 45202, "epoch": 373} {"train_loss": -34.930660247802734, "global_step": 45203, "epoch": 373} {"train_loss": -33.664432525634766, "global_step": 45204, "epoch": 373} {"train_loss": -34.16172790527344, "global_step": 45205, "epoch": 373} {"train_loss": -33.72378158569336, "global_step": 45206, "epoch": 373} {"train_loss": -34.72346878051758, "global_step": 45207, "epoch": 373} {"train_loss": -34.2906494140625, "global_step": 45208, "epoch": 373} {"train_loss": -33.8769645690918, "global_step": 45209, "epoch": 373} {"train_loss": -33.95277404785156, "global_step": 45210, "epoch": 373} {"train_loss": -34.41550827026367, "global_step": 45211, "epoch": 373} {"train_loss": -34.254966735839844, "global_step": 45212, "epoch": 373} {"train_loss": -34.78288650512695, "global_step": 45213, "epoch": 373} {"train_loss": -34.04112243652344, "global_step": 45214, "epoch": 373} {"train_loss": -33.85653305053711, "global_step": 45215, "epoch": 373} {"train_loss": -34.29208755493164, "global_step": 45216, "epoch": 373} {"train_loss": -33.89657211303711, "global_step": 45217, "epoch": 373} {"train_loss": -34.435142517089844, "global_step": 45218, "epoch": 373} {"train_loss": -34.4896354675293, "global_step": 45219, "epoch": 373} {"train_loss": -33.92742156982422, "global_step": 45220, "epoch": 373} {"train_loss": -33.60184860229492, "global_step": 45221, "epoch": 373} {"train_loss": -34.529659271240234, "global_step": 45222, "epoch": 373} {"train_loss": -35.15302658081055, "global_step": 45223, "epoch": 373} {"train_loss": -33.92600631713867, "global_step": 45224, "epoch": 373} {"train_loss": -34.67377853393555, "global_step": 45225, "epoch": 373} {"train_loss": -34.71053695678711, "global_step": 45226, "epoch": 373} {"train_loss": -34.725791931152344, "global_step": 45227, "epoch": 373} {"train_loss": -34.605899810791016, "global_step": 45228, "epoch": 373} {"train_loss": -33.353546142578125, "global_step": 45229, "epoch": 373} {"train_loss": -33.93064498901367, "global_step": 45230, "epoch": 373} {"train_loss": -33.6925163269043, "global_step": 45231, "epoch": 373} {"train_loss": -32.05056381225586, "global_step": 45232, "epoch": 373} {"train_loss": -30.3642635345459, "global_step": 45233, "epoch": 373} {"train_loss": -30.859588623046875, "global_step": 45234, "epoch": 373} {"train_loss": -32.981075286865234, "global_step": 45235, "epoch": 373} {"train_loss": -33.94521713256836, "global_step": 45236, "epoch": 373} {"train_loss": -34.0201530456543, "global_step": 45237, "epoch": 373} {"train_loss": -32.12030029296875, "global_step": 45238, "epoch": 373} {"train_loss": -32.92881774902344, "global_step": 45239, "epoch": 373} {"train_loss": -34.06138610839844, "global_step": 45240, "epoch": 373} {"train_loss": -33.59604263305664, "global_step": 45241, "epoch": 373} {"train_loss": -33.1478271484375, "global_step": 45242, "epoch": 373} {"train_loss": -34.10701370239258, "global_step": 45243, "epoch": 373} {"train_loss": -33.990779876708984, "global_step": 45244, "epoch": 373} {"train_loss": -33.16850662231445, "global_step": 45245, "epoch": 373} {"train_loss": -33.9885139465332, "global_step": 45246, "epoch": 373} {"train_loss": -33.68500518798828, "global_step": 45247, "epoch": 373} {"train_loss": -34.06734848022461, "global_step": 45248, "epoch": 373} {"train_loss": -33.99477767944336, "global_step": 45249, "epoch": 373} {"train_loss": -33.71962356567383, "global_step": 45250, "epoch": 373} {"train_loss": -34.339027404785156, "global_step": 45251, "epoch": 373} {"train_loss": -34.076393127441406, "global_step": 45252, "epoch": 373} {"train_loss": -33.79908878547101, "global_step": 45253, "epoch": 373, "val_loss": 2573913.25} {"train_loss": -34.55093002319336, "global_step": 45254, "epoch": 374} {"train_loss": -34.559669494628906, "global_step": 45255, "epoch": 374} {"train_loss": -34.240386962890625, "global_step": 45256, "epoch": 374} {"train_loss": -34.286067962646484, "global_step": 45257, "epoch": 374} {"train_loss": -31.861236572265625, "global_step": 45258, "epoch": 374} {"train_loss": -34.00691223144531, "global_step": 45259, "epoch": 374} {"train_loss": -33.63663864135742, "global_step": 45260, "epoch": 374} {"train_loss": -33.60969161987305, "global_step": 45261, "epoch": 374} {"train_loss": -34.00105667114258, "global_step": 45262, "epoch": 374} {"train_loss": -33.583274841308594, "global_step": 45263, "epoch": 374} {"train_loss": -34.63391876220703, "global_step": 45264, "epoch": 374} {"train_loss": -33.59370803833008, "global_step": 45265, "epoch": 374} {"train_loss": -34.04111862182617, "global_step": 45266, "epoch": 374} {"train_loss": -34.00606918334961, "global_step": 45267, "epoch": 374} {"train_loss": -33.43209457397461, "global_step": 45268, "epoch": 374} {"train_loss": -30.47879981994629, "global_step": 45269, "epoch": 374} {"train_loss": -27.483657836914062, "global_step": 45270, "epoch": 374} {"train_loss": -29.13929557800293, "global_step": 45271, "epoch": 374} {"train_loss": -33.017433166503906, "global_step": 45272, "epoch": 374} {"train_loss": -33.163570404052734, "global_step": 45273, "epoch": 374} {"train_loss": -32.255096435546875, "global_step": 45274, "epoch": 374} {"train_loss": -33.84287643432617, "global_step": 45275, "epoch": 374} {"train_loss": -33.62064743041992, "global_step": 45276, "epoch": 374} {"train_loss": -33.248382568359375, "global_step": 45277, "epoch": 374} {"train_loss": -34.40228271484375, "global_step": 45278, "epoch": 374} {"train_loss": -32.555728912353516, "global_step": 45279, "epoch": 374} {"train_loss": -33.723541259765625, "global_step": 45280, "epoch": 374} {"train_loss": -33.43518829345703, "global_step": 45281, "epoch": 374} {"train_loss": -34.36013412475586, "global_step": 45282, "epoch": 374} {"train_loss": -34.07307815551758, "global_step": 45283, "epoch": 374} {"train_loss": -34.18428421020508, "global_step": 45284, "epoch": 374} {"train_loss": -34.249732971191406, "global_step": 45285, "epoch": 374} {"train_loss": -33.52602767944336, "global_step": 45286, "epoch": 374} {"train_loss": -34.34575271606445, "global_step": 45287, "epoch": 374} {"train_loss": -34.669654846191406, "global_step": 45288, "epoch": 374} {"train_loss": -34.13981246948242, "global_step": 45289, "epoch": 374} {"train_loss": -33.91419982910156, "global_step": 45290, "epoch": 374} {"train_loss": -34.43489456176758, "global_step": 45291, "epoch": 374} {"train_loss": -34.43118667602539, "global_step": 45292, "epoch": 374} {"train_loss": -34.33296203613281, "global_step": 45293, "epoch": 374} {"train_loss": -34.15198516845703, "global_step": 45294, "epoch": 374} {"train_loss": -34.19093704223633, "global_step": 45295, "epoch": 374} {"train_loss": -33.74003219604492, "global_step": 45296, "epoch": 374} {"train_loss": -33.466957092285156, "global_step": 45297, "epoch": 374} {"train_loss": -33.841636657714844, "global_step": 45298, "epoch": 374} {"train_loss": -33.43578338623047, "global_step": 45299, "epoch": 374} {"train_loss": -34.4663200378418, "global_step": 45300, "epoch": 374} {"train_loss": -33.88047409057617, "global_step": 45301, "epoch": 374} {"train_loss": -34.13676834106445, "global_step": 45302, "epoch": 374} {"train_loss": -34.06150436401367, "global_step": 45303, "epoch": 374} {"train_loss": -34.072914123535156, "global_step": 45304, "epoch": 374} {"train_loss": -33.369903564453125, "global_step": 45305, "epoch": 374} {"train_loss": -34.102352142333984, "global_step": 45306, "epoch": 374} {"train_loss": -33.755523681640625, "global_step": 45307, "epoch": 374} {"train_loss": -34.21854782104492, "global_step": 45308, "epoch": 374} {"train_loss": -34.275917053222656, "global_step": 45309, "epoch": 374} {"train_loss": -33.89744186401367, "global_step": 45310, "epoch": 374} {"train_loss": -25.182907104492188, "global_step": 45311, "epoch": 374} {"train_loss": -33.937904357910156, "global_step": 45312, "epoch": 374} {"train_loss": -33.2642707824707, "global_step": 45313, "epoch": 374} {"train_loss": -33.834938049316406, "global_step": 45314, "epoch": 374} {"train_loss": -32.16297149658203, "global_step": 45315, "epoch": 374} {"train_loss": -31.41468620300293, "global_step": 45316, "epoch": 374} {"train_loss": -32.21824264526367, "global_step": 45317, "epoch": 374} {"train_loss": -33.267616271972656, "global_step": 45318, "epoch": 374} {"train_loss": -32.64087677001953, "global_step": 45319, "epoch": 374} {"train_loss": -34.01658248901367, "global_step": 45320, "epoch": 374} {"train_loss": -33.69137954711914, "global_step": 45321, "epoch": 374} {"train_loss": -33.20858383178711, "global_step": 45322, "epoch": 374} {"train_loss": -32.2021369934082, "global_step": 45323, "epoch": 374} {"train_loss": -32.16233825683594, "global_step": 45324, "epoch": 374} {"train_loss": -33.34552764892578, "global_step": 45325, "epoch": 374} {"train_loss": -33.04048538208008, "global_step": 45326, "epoch": 374} {"train_loss": -32.43859100341797, "global_step": 45327, "epoch": 374} {"train_loss": -34.13724899291992, "global_step": 45328, "epoch": 374} {"train_loss": -33.512386322021484, "global_step": 45329, "epoch": 374} {"train_loss": -32.0379638671875, "global_step": 45330, "epoch": 374} {"train_loss": -33.3347282409668, "global_step": 45331, "epoch": 374} {"train_loss": -33.1663703918457, "global_step": 45332, "epoch": 374} {"train_loss": -33.877899169921875, "global_step": 45333, "epoch": 374} {"train_loss": -32.85364532470703, "global_step": 45334, "epoch": 374} {"train_loss": -33.07707214355469, "global_step": 45335, "epoch": 374} {"train_loss": -33.891151428222656, "global_step": 45336, "epoch": 374} {"train_loss": -33.013973236083984, "global_step": 45337, "epoch": 374} {"train_loss": -33.06116485595703, "global_step": 45338, "epoch": 374} {"train_loss": -33.923255920410156, "global_step": 45339, "epoch": 374} {"train_loss": -33.68424987792969, "global_step": 45340, "epoch": 374} {"train_loss": -33.63322067260742, "global_step": 45341, "epoch": 374} {"train_loss": -34.11652374267578, "global_step": 45342, "epoch": 374} {"train_loss": -34.35708999633789, "global_step": 45343, "epoch": 374} {"train_loss": -34.04472732543945, "global_step": 45344, "epoch": 374} {"train_loss": -34.16878128051758, "global_step": 45345, "epoch": 374} {"train_loss": -34.3163948059082, "global_step": 45346, "epoch": 374} {"train_loss": -34.730316162109375, "global_step": 45347, "epoch": 374} {"train_loss": -34.317813873291016, "global_step": 45348, "epoch": 374} {"train_loss": -34.56432342529297, "global_step": 45349, "epoch": 374} {"train_loss": -35.00288009643555, "global_step": 45350, "epoch": 374} {"train_loss": -34.708534240722656, "global_step": 45351, "epoch": 374} {"train_loss": -35.02451705932617, "global_step": 45352, "epoch": 374} {"train_loss": -34.81974792480469, "global_step": 45353, "epoch": 374} {"train_loss": -34.949642181396484, "global_step": 45354, "epoch": 374} {"train_loss": -34.81758499145508, "global_step": 45355, "epoch": 374} {"train_loss": -34.865047454833984, "global_step": 45356, "epoch": 374} {"train_loss": -34.878196716308594, "global_step": 45357, "epoch": 374} {"train_loss": -35.029945373535156, "global_step": 45358, "epoch": 374} {"train_loss": -35.20102310180664, "global_step": 45359, "epoch": 374} {"train_loss": -34.92365646362305, "global_step": 45360, "epoch": 374} {"train_loss": -35.084415435791016, "global_step": 45361, "epoch": 374} {"train_loss": -34.96887969970703, "global_step": 45362, "epoch": 374} {"train_loss": -35.40766525268555, "global_step": 45363, "epoch": 374} {"train_loss": -35.593570709228516, "global_step": 45364, "epoch": 374} {"train_loss": -35.40308380126953, "global_step": 45365, "epoch": 374} {"train_loss": -35.112037658691406, "global_step": 45366, "epoch": 374} {"train_loss": -35.36956024169922, "global_step": 45367, "epoch": 374} {"train_loss": -35.77132797241211, "global_step": 45368, "epoch": 374} {"train_loss": -35.40729904174805, "global_step": 45369, "epoch": 374} {"train_loss": -35.098731994628906, "global_step": 45370, "epoch": 374} {"train_loss": -35.40606689453125, "global_step": 45371, "epoch": 374} {"train_loss": -34.4403190612793, "global_step": 45372, "epoch": 374} {"train_loss": -33.85035705566406, "global_step": 45373, "epoch": 374} {"train_loss": -33.76337229515895, "global_step": 45374, "epoch": 374, "val_loss": 2538999.25} {"train_loss": -34.540828704833984, "global_step": 45375, "epoch": 375} {"train_loss": -34.9044075012207, "global_step": 45376, "epoch": 375} {"train_loss": -33.544586181640625, "global_step": 45377, "epoch": 375} {"train_loss": -33.7365608215332, "global_step": 45378, "epoch": 375} {"train_loss": -34.744903564453125, "global_step": 45379, "epoch": 375} {"train_loss": -33.199031829833984, "global_step": 45380, "epoch": 375} {"train_loss": -33.83319091796875, "global_step": 45381, "epoch": 375} {"train_loss": -33.81948471069336, "global_step": 45382, "epoch": 375} {"train_loss": -32.836673736572266, "global_step": 45383, "epoch": 375} {"train_loss": -32.934444427490234, "global_step": 45384, "epoch": 375} {"train_loss": -32.500545501708984, "global_step": 45385, "epoch": 375} {"train_loss": -32.08236312866211, "global_step": 45386, "epoch": 375} {"train_loss": -31.917387008666992, "global_step": 45387, "epoch": 375} {"train_loss": -27.604400634765625, "global_step": 45388, "epoch": 375} {"train_loss": -30.21424674987793, "global_step": 45389, "epoch": 375} {"train_loss": -27.612838745117188, "global_step": 45390, "epoch": 375} {"train_loss": -30.948373794555664, "global_step": 45391, "epoch": 375} {"train_loss": -27.04908561706543, "global_step": 45392, "epoch": 375} {"train_loss": -33.47982406616211, "global_step": 45393, "epoch": 375} {"train_loss": -29.343860626220703, "global_step": 45394, "epoch": 375} {"train_loss": -33.59373092651367, "global_step": 45395, "epoch": 375} {"train_loss": -32.62928009033203, "global_step": 45396, "epoch": 375} {"train_loss": -33.13804244995117, "global_step": 45397, "epoch": 375} {"train_loss": -32.910194396972656, "global_step": 45398, "epoch": 375} {"train_loss": -33.33827590942383, "global_step": 45399, "epoch": 375} {"train_loss": -34.133636474609375, "global_step": 45400, "epoch": 375} {"train_loss": -33.482627868652344, "global_step": 45401, "epoch": 375} {"train_loss": -31.924758911132812, "global_step": 45402, "epoch": 375} {"train_loss": -33.74140548706055, "global_step": 45403, "epoch": 375} {"train_loss": -33.53887176513672, "global_step": 45404, "epoch": 375} {"train_loss": -33.95819854736328, "global_step": 45405, "epoch": 375} {"train_loss": -34.58883285522461, "global_step": 45406, "epoch": 375} {"train_loss": -33.70946502685547, "global_step": 45407, "epoch": 375} {"train_loss": -33.48433303833008, "global_step": 45408, "epoch": 375} {"train_loss": -34.3291130065918, "global_step": 45409, "epoch": 375} {"train_loss": -34.24898147583008, "global_step": 45410, "epoch": 375} {"train_loss": -33.77622985839844, "global_step": 45411, "epoch": 375} {"train_loss": -33.59878921508789, "global_step": 45412, "epoch": 375} {"train_loss": -33.158782958984375, "global_step": 45413, "epoch": 375} {"train_loss": -34.67311096191406, "global_step": 45414, "epoch": 375} {"train_loss": -33.66120147705078, "global_step": 45415, "epoch": 375} {"train_loss": -34.45868682861328, "global_step": 45416, "epoch": 375} {"train_loss": -34.10819625854492, "global_step": 45417, "epoch": 375} {"train_loss": -34.69038391113281, "global_step": 45418, "epoch": 375} {"train_loss": -34.88959503173828, "global_step": 45419, "epoch": 375} {"train_loss": -34.36824035644531, "global_step": 45420, "epoch": 375} {"train_loss": -34.24056625366211, "global_step": 45421, "epoch": 375} {"train_loss": -34.86225128173828, "global_step": 45422, "epoch": 375} {"train_loss": -34.60767364501953, "global_step": 45423, "epoch": 375} {"train_loss": -33.85127258300781, "global_step": 45424, "epoch": 375} {"train_loss": -34.1787223815918, "global_step": 45425, "epoch": 375} {"train_loss": -34.45627975463867, "global_step": 45426, "epoch": 375} {"train_loss": -34.762908935546875, "global_step": 45427, "epoch": 375} {"train_loss": -34.8090934753418, "global_step": 45428, "epoch": 375} {"train_loss": -33.949737548828125, "global_step": 45429, "epoch": 375} {"train_loss": -33.08130645751953, "global_step": 45430, "epoch": 375} {"train_loss": -34.36948776245117, "global_step": 45431, "epoch": 375} {"train_loss": -34.22764205932617, "global_step": 45432, "epoch": 375} {"train_loss": -34.6141242980957, "global_step": 45433, "epoch": 375} {"train_loss": -34.332759857177734, "global_step": 45434, "epoch": 375} {"train_loss": -34.64622116088867, "global_step": 45435, "epoch": 375} {"train_loss": -35.06589889526367, "global_step": 45436, "epoch": 375} {"train_loss": -34.106895446777344, "global_step": 45437, "epoch": 375} {"train_loss": -34.796024322509766, "global_step": 45438, "epoch": 375} {"train_loss": -34.58624267578125, "global_step": 45439, "epoch": 375} {"train_loss": -35.33521270751953, "global_step": 45440, "epoch": 375} {"train_loss": -35.02134323120117, "global_step": 45441, "epoch": 375} {"train_loss": -33.78977584838867, "global_step": 45442, "epoch": 375} {"train_loss": -34.28377914428711, "global_step": 45443, "epoch": 375} {"train_loss": -35.06986999511719, "global_step": 45444, "epoch": 375} {"train_loss": -35.48624801635742, "global_step": 45445, "epoch": 375} {"train_loss": -35.08396530151367, "global_step": 45446, "epoch": 375} {"train_loss": -35.155887603759766, "global_step": 45447, "epoch": 375} {"train_loss": -35.23194122314453, "global_step": 45448, "epoch": 375} {"train_loss": -34.19814682006836, "global_step": 45449, "epoch": 375} {"train_loss": -34.100677490234375, "global_step": 45450, "epoch": 375} {"train_loss": -33.65726852416992, "global_step": 45451, "epoch": 375} {"train_loss": -34.67250442504883, "global_step": 45452, "epoch": 375} {"train_loss": -35.078399658203125, "global_step": 45453, "epoch": 375} {"train_loss": -34.857147216796875, "global_step": 45454, "epoch": 375} {"train_loss": -34.28167724609375, "global_step": 45455, "epoch": 375} {"train_loss": -33.84794998168945, "global_step": 45456, "epoch": 375} {"train_loss": -34.467655181884766, "global_step": 45457, "epoch": 375} {"train_loss": -34.39046096801758, "global_step": 45458, "epoch": 375} {"train_loss": -34.0905647277832, "global_step": 45459, "epoch": 375} {"train_loss": -34.937618255615234, "global_step": 45460, "epoch": 375} {"train_loss": -33.59492874145508, "global_step": 45461, "epoch": 375} {"train_loss": -33.131107330322266, "global_step": 45462, "epoch": 375} {"train_loss": -34.59772872924805, "global_step": 45463, "epoch": 375} {"train_loss": -34.592533111572266, "global_step": 45464, "epoch": 375} {"train_loss": -33.983734130859375, "global_step": 45465, "epoch": 375} {"train_loss": -31.9158992767334, "global_step": 45466, "epoch": 375} {"train_loss": -33.362178802490234, "global_step": 45467, "epoch": 375} {"train_loss": -34.36495590209961, "global_step": 45468, "epoch": 375} {"train_loss": -33.844398498535156, "global_step": 45469, "epoch": 375} {"train_loss": -32.201419830322266, "global_step": 45470, "epoch": 375} {"train_loss": -31.984664916992188, "global_step": 45471, "epoch": 375} {"train_loss": -32.43425369262695, "global_step": 45472, "epoch": 375} {"train_loss": -34.358062744140625, "global_step": 45473, "epoch": 375} {"train_loss": -34.642574310302734, "global_step": 45474, "epoch": 375} {"train_loss": -32.284950256347656, "global_step": 45475, "epoch": 375} {"train_loss": -33.64483642578125, "global_step": 45476, "epoch": 375} {"train_loss": -33.65460968017578, "global_step": 45477, "epoch": 375} {"train_loss": -33.43451690673828, "global_step": 45478, "epoch": 375} {"train_loss": -33.51469039916992, "global_step": 45479, "epoch": 375} {"train_loss": -35.275264739990234, "global_step": 45480, "epoch": 375} {"train_loss": -33.60274124145508, "global_step": 45481, "epoch": 375} {"train_loss": -34.377281188964844, "global_step": 45482, "epoch": 375} {"train_loss": -34.33635330200195, "global_step": 45483, "epoch": 375} {"train_loss": -34.095726013183594, "global_step": 45484, "epoch": 375} {"train_loss": -34.54116439819336, "global_step": 45485, "epoch": 375} {"train_loss": -33.827877044677734, "global_step": 45486, "epoch": 375} {"train_loss": -32.894649505615234, "global_step": 45487, "epoch": 375} {"train_loss": -34.72822570800781, "global_step": 45488, "epoch": 375} {"train_loss": -33.9237174987793, "global_step": 45489, "epoch": 375} {"train_loss": -34.624446868896484, "global_step": 45490, "epoch": 375} {"train_loss": -33.994991302490234, "global_step": 45491, "epoch": 375} {"train_loss": -35.17292404174805, "global_step": 45492, "epoch": 375} {"train_loss": -34.72015380859375, "global_step": 45493, "epoch": 375} {"train_loss": -34.408424377441406, "global_step": 45494, "epoch": 375} {"train_loss": -33.75079208563182, "global_step": 45495, "epoch": 375, "val_loss": 2594576.25} {"train_loss": -34.171058654785156, "global_step": 45496, "epoch": 376} {"train_loss": -34.310428619384766, "global_step": 45497, "epoch": 376} {"train_loss": -34.402042388916016, "global_step": 45498, "epoch": 376} {"train_loss": -33.35584259033203, "global_step": 45499, "epoch": 376} {"train_loss": -35.10853958129883, "global_step": 45500, "epoch": 376} {"train_loss": -33.658687591552734, "global_step": 45501, "epoch": 376} {"train_loss": -34.84291458129883, "global_step": 45502, "epoch": 376} {"train_loss": -34.293975830078125, "global_step": 45503, "epoch": 376} {"train_loss": -35.46765899658203, "global_step": 45504, "epoch": 376} {"train_loss": -34.79365158081055, "global_step": 45505, "epoch": 376} {"train_loss": -35.02861785888672, "global_step": 45506, "epoch": 376} {"train_loss": -34.49779510498047, "global_step": 45507, "epoch": 376} {"train_loss": -34.89131164550781, "global_step": 45508, "epoch": 376} {"train_loss": -33.05134201049805, "global_step": 45509, "epoch": 376} {"train_loss": -34.55376052856445, "global_step": 45510, "epoch": 376} {"train_loss": -34.376399993896484, "global_step": 45511, "epoch": 376} {"train_loss": -34.08749771118164, "global_step": 45512, "epoch": 376} {"train_loss": -34.41069412231445, "global_step": 45513, "epoch": 376} {"train_loss": -34.35139083862305, "global_step": 45514, "epoch": 376} {"train_loss": -34.8212890625, "global_step": 45515, "epoch": 376} {"train_loss": -35.07963562011719, "global_step": 45516, "epoch": 376} {"train_loss": -35.14606857299805, "global_step": 45517, "epoch": 376} {"train_loss": -35.319984436035156, "global_step": 45518, "epoch": 376} {"train_loss": -35.51070785522461, "global_step": 45519, "epoch": 376} {"train_loss": -34.25584030151367, "global_step": 45520, "epoch": 376} {"train_loss": -35.291561126708984, "global_step": 45521, "epoch": 376} {"train_loss": -34.95399856567383, "global_step": 45522, "epoch": 376} {"train_loss": -35.1478271484375, "global_step": 45523, "epoch": 376} {"train_loss": -35.2334098815918, "global_step": 45524, "epoch": 376} {"train_loss": -34.91667938232422, "global_step": 45525, "epoch": 376} {"train_loss": -35.275917053222656, "global_step": 45526, "epoch": 376} {"train_loss": -34.962860107421875, "global_step": 45527, "epoch": 376} {"train_loss": -34.27888107299805, "global_step": 45528, "epoch": 376} {"train_loss": -35.241546630859375, "global_step": 45529, "epoch": 376} {"train_loss": -35.23124313354492, "global_step": 45530, "epoch": 376} {"train_loss": -34.916748046875, "global_step": 45531, "epoch": 376} {"train_loss": -35.84944534301758, "global_step": 45532, "epoch": 376} {"train_loss": -34.51173782348633, "global_step": 45533, "epoch": 376} {"train_loss": -34.685420989990234, "global_step": 45534, "epoch": 376} {"train_loss": -35.63594436645508, "global_step": 45535, "epoch": 376} {"train_loss": -34.777191162109375, "global_step": 45536, "epoch": 376} {"train_loss": -34.99907302856445, "global_step": 45537, "epoch": 376} {"train_loss": -35.36050033569336, "global_step": 45538, "epoch": 376} {"train_loss": -35.68292236328125, "global_step": 45539, "epoch": 376} {"train_loss": -35.32670211791992, "global_step": 45540, "epoch": 376} {"train_loss": -34.82418441772461, "global_step": 45541, "epoch": 376} {"train_loss": -33.298248291015625, "global_step": 45542, "epoch": 376} {"train_loss": -31.93398094177246, "global_step": 45543, "epoch": 376} {"train_loss": -28.394559860229492, "global_step": 45544, "epoch": 376} {"train_loss": -34.715850830078125, "global_step": 45545, "epoch": 376} {"train_loss": -34.79656982421875, "global_step": 45546, "epoch": 376} {"train_loss": -31.61341667175293, "global_step": 45547, "epoch": 376} {"train_loss": -34.49715805053711, "global_step": 45548, "epoch": 376} {"train_loss": -34.72481918334961, "global_step": 45549, "epoch": 376} {"train_loss": -33.030296325683594, "global_step": 45550, "epoch": 376} {"train_loss": -35.22591781616211, "global_step": 45551, "epoch": 376} {"train_loss": -31.571680068969727, "global_step": 45552, "epoch": 376} {"train_loss": -32.03224563598633, "global_step": 45553, "epoch": 376} {"train_loss": -31.741125106811523, "global_step": 45554, "epoch": 376} {"train_loss": -30.97849464416504, "global_step": 45555, "epoch": 376} {"train_loss": -34.718326568603516, "global_step": 45556, "epoch": 376} {"train_loss": -33.13901901245117, "global_step": 45557, "epoch": 376} {"train_loss": -32.86894226074219, "global_step": 45558, "epoch": 376} {"train_loss": -33.616573333740234, "global_step": 45559, "epoch": 376} {"train_loss": -34.71442794799805, "global_step": 45560, "epoch": 376} {"train_loss": -32.34763717651367, "global_step": 45561, "epoch": 376} {"train_loss": -33.534523010253906, "global_step": 45562, "epoch": 376} {"train_loss": -34.16767501831055, "global_step": 45563, "epoch": 376} {"train_loss": -32.84202194213867, "global_step": 45564, "epoch": 376} {"train_loss": -32.30881881713867, "global_step": 45565, "epoch": 376} {"train_loss": -34.281639099121094, "global_step": 45566, "epoch": 376} {"train_loss": -34.00232696533203, "global_step": 45567, "epoch": 376} {"train_loss": -33.16537857055664, "global_step": 45568, "epoch": 376} {"train_loss": -35.132083892822266, "global_step": 45569, "epoch": 376} {"train_loss": -33.69233322143555, "global_step": 45570, "epoch": 376} {"train_loss": -34.24934768676758, "global_step": 45571, "epoch": 376} {"train_loss": -34.627044677734375, "global_step": 45572, "epoch": 376} {"train_loss": -34.01457214355469, "global_step": 45573, "epoch": 376} {"train_loss": -34.3600959777832, "global_step": 45574, "epoch": 376} {"train_loss": -34.55340576171875, "global_step": 45575, "epoch": 376} {"train_loss": -34.419734954833984, "global_step": 45576, "epoch": 376} {"train_loss": -34.92795181274414, "global_step": 45577, "epoch": 376} {"train_loss": -35.118438720703125, "global_step": 45578, "epoch": 376} {"train_loss": -34.66836166381836, "global_step": 45579, "epoch": 376} {"train_loss": -34.40296173095703, "global_step": 45580, "epoch": 376} {"train_loss": -34.03477478027344, "global_step": 45581, "epoch": 376} {"train_loss": -32.96390914916992, "global_step": 45582, "epoch": 376} {"train_loss": -30.4403018951416, "global_step": 45583, "epoch": 376} {"train_loss": -30.169431686401367, "global_step": 45584, "epoch": 376} {"train_loss": -34.64021682739258, "global_step": 45585, "epoch": 376} {"train_loss": -33.31599044799805, "global_step": 45586, "epoch": 376} {"train_loss": -27.94807243347168, "global_step": 45587, "epoch": 376} {"train_loss": -31.459009170532227, "global_step": 45588, "epoch": 376} {"train_loss": -23.563077926635742, "global_step": 45589, "epoch": 376} {"train_loss": -23.500537872314453, "global_step": 45590, "epoch": 376} {"train_loss": -33.73908615112305, "global_step": 45591, "epoch": 376} {"train_loss": -27.236215591430664, "global_step": 45592, "epoch": 376} {"train_loss": -27.043893814086914, "global_step": 45593, "epoch": 376} {"train_loss": -30.20318603515625, "global_step": 45594, "epoch": 376} {"train_loss": -31.42913818359375, "global_step": 45595, "epoch": 376} {"train_loss": -30.63649559020996, "global_step": 45596, "epoch": 376} {"train_loss": -34.083412170410156, "global_step": 45597, "epoch": 376} {"train_loss": -31.68727684020996, "global_step": 45598, "epoch": 376} {"train_loss": -34.21242141723633, "global_step": 45599, "epoch": 376} {"train_loss": -33.13582992553711, "global_step": 45600, "epoch": 376} {"train_loss": -33.6673698425293, "global_step": 45601, "epoch": 376} {"train_loss": -34.26731491088867, "global_step": 45602, "epoch": 376} {"train_loss": -33.460906982421875, "global_step": 45603, "epoch": 376} {"train_loss": -34.356449127197266, "global_step": 45604, "epoch": 376} {"train_loss": -34.29289245605469, "global_step": 45605, "epoch": 376} {"train_loss": -33.81728744506836, "global_step": 45606, "epoch": 376} {"train_loss": -34.670166015625, "global_step": 45607, "epoch": 376} {"train_loss": -34.581871032714844, "global_step": 45608, "epoch": 376} {"train_loss": -34.81489181518555, "global_step": 45609, "epoch": 376} {"train_loss": -34.637264251708984, "global_step": 45610, "epoch": 376} {"train_loss": -34.47492218017578, "global_step": 45611, "epoch": 376} {"train_loss": -34.91899490356445, "global_step": 45612, "epoch": 376} {"train_loss": -34.65607833862305, "global_step": 45613, "epoch": 376} {"train_loss": -34.92350387573242, "global_step": 45614, "epoch": 376} {"train_loss": -35.170719146728516, "global_step": 45615, "epoch": 376} {"train_loss": -33.69181658216744, "global_step": 45616, "epoch": 376, "val_loss": 2614372.25} {"train_loss": -35.21814727783203, "global_step": 45617, "epoch": 377} {"train_loss": -34.638336181640625, "global_step": 45618, "epoch": 377} {"train_loss": -34.69297409057617, "global_step": 45619, "epoch": 377} {"train_loss": -34.580528259277344, "global_step": 45620, "epoch": 377} {"train_loss": -34.09614562988281, "global_step": 45621, "epoch": 377} {"train_loss": -34.568241119384766, "global_step": 45622, "epoch": 377} {"train_loss": -34.5222282409668, "global_step": 45623, "epoch": 377} {"train_loss": -34.22898483276367, "global_step": 45624, "epoch": 377} {"train_loss": -35.167991638183594, "global_step": 45625, "epoch": 377} {"train_loss": -34.751220703125, "global_step": 45626, "epoch": 377} {"train_loss": -34.08466339111328, "global_step": 45627, "epoch": 377} {"train_loss": -34.55642318725586, "global_step": 45628, "epoch": 377} {"train_loss": -34.723052978515625, "global_step": 45629, "epoch": 377} {"train_loss": -34.33818435668945, "global_step": 45630, "epoch": 377} {"train_loss": -34.40496826171875, "global_step": 45631, "epoch": 377} {"train_loss": -34.987281799316406, "global_step": 45632, "epoch": 377} {"train_loss": -34.58490753173828, "global_step": 45633, "epoch": 377} {"train_loss": -35.51342010498047, "global_step": 45634, "epoch": 377} {"train_loss": -34.29734420776367, "global_step": 45635, "epoch": 377} {"train_loss": -34.761558532714844, "global_step": 45636, "epoch": 377} {"train_loss": -34.423362731933594, "global_step": 45637, "epoch": 377} {"train_loss": -34.78218460083008, "global_step": 45638, "epoch": 377} {"train_loss": -34.39323425292969, "global_step": 45639, "epoch": 377} {"train_loss": -34.80715560913086, "global_step": 45640, "epoch": 377} {"train_loss": -34.864410400390625, "global_step": 45641, "epoch": 377} {"train_loss": -35.0343017578125, "global_step": 45642, "epoch": 377} {"train_loss": -34.4162483215332, "global_step": 45643, "epoch": 377} {"train_loss": -34.54935836791992, "global_step": 45644, "epoch": 377} {"train_loss": -34.384273529052734, "global_step": 45645, "epoch": 377} {"train_loss": -35.04805374145508, "global_step": 45646, "epoch": 377} {"train_loss": -34.523231506347656, "global_step": 45647, "epoch": 377} {"train_loss": -34.22593688964844, "global_step": 45648, "epoch": 377} {"train_loss": -34.535743713378906, "global_step": 45649, "epoch": 377} {"train_loss": -35.056087493896484, "global_step": 45650, "epoch": 377} {"train_loss": -34.40021514892578, "global_step": 45651, "epoch": 377} {"train_loss": -31.583724975585938, "global_step": 45652, "epoch": 377} {"train_loss": -30.121992111206055, "global_step": 45653, "epoch": 377} {"train_loss": -33.1414909362793, "global_step": 45654, "epoch": 377} {"train_loss": -28.025287628173828, "global_step": 45655, "epoch": 377} {"train_loss": -28.8978214263916, "global_step": 45656, "epoch": 377} {"train_loss": -28.968961715698242, "global_step": 45657, "epoch": 377} {"train_loss": -28.518146514892578, "global_step": 45658, "epoch": 377} {"train_loss": -29.74177360534668, "global_step": 45659, "epoch": 377} {"train_loss": -29.2509708404541, "global_step": 45660, "epoch": 377} {"train_loss": -29.9387264251709, "global_step": 45661, "epoch": 377} {"train_loss": -30.378320693969727, "global_step": 45662, "epoch": 377} {"train_loss": -29.59793472290039, "global_step": 45663, "epoch": 377} {"train_loss": -30.94117546081543, "global_step": 45664, "epoch": 377} {"train_loss": -31.484577178955078, "global_step": 45665, "epoch": 377} {"train_loss": -31.0185546875, "global_step": 45666, "epoch": 377} {"train_loss": -31.061813354492188, "global_step": 45667, "epoch": 377} {"train_loss": -31.344757080078125, "global_step": 45668, "epoch": 377} {"train_loss": -31.556964874267578, "global_step": 45669, "epoch": 377} {"train_loss": -32.035640716552734, "global_step": 45670, "epoch": 377} {"train_loss": -32.02479934692383, "global_step": 45671, "epoch": 377} {"train_loss": -32.080318450927734, "global_step": 45672, "epoch": 377} {"train_loss": -32.34111404418945, "global_step": 45673, "epoch": 377} {"train_loss": -32.9047966003418, "global_step": 45674, "epoch": 377} {"train_loss": -32.905616760253906, "global_step": 45675, "epoch": 377} {"train_loss": -32.924564361572266, "global_step": 45676, "epoch": 377} {"train_loss": -32.71200180053711, "global_step": 45677, "epoch": 377} {"train_loss": -33.253841400146484, "global_step": 45678, "epoch": 377} {"train_loss": -33.34945297241211, "global_step": 45679, "epoch": 377} {"train_loss": -32.91103744506836, "global_step": 45680, "epoch": 377} {"train_loss": -32.21424102783203, "global_step": 45681, "epoch": 377} {"train_loss": -29.563268661499023, "global_step": 45682, "epoch": 377} {"train_loss": -25.626798629760742, "global_step": 45683, "epoch": 377} {"train_loss": -29.52742576599121, "global_step": 45684, "epoch": 377} {"train_loss": -33.97164535522461, "global_step": 45685, "epoch": 377} {"train_loss": -30.17913818359375, "global_step": 45686, "epoch": 377} {"train_loss": -33.00590133666992, "global_step": 45687, "epoch": 377} {"train_loss": -29.426355361938477, "global_step": 45688, "epoch": 377} {"train_loss": -20.638954162597656, "global_step": 45689, "epoch": 377} {"train_loss": -24.707889556884766, "global_step": 45690, "epoch": 377} {"train_loss": -28.36931800842285, "global_step": 45691, "epoch": 377} {"train_loss": -27.404266357421875, "global_step": 45692, "epoch": 377} {"train_loss": -28.160614013671875, "global_step": 45693, "epoch": 377} {"train_loss": -31.315113067626953, "global_step": 45694, "epoch": 377} {"train_loss": -30.270315170288086, "global_step": 45695, "epoch": 377} {"train_loss": -31.03425407409668, "global_step": 45696, "epoch": 377} {"train_loss": -31.969614028930664, "global_step": 45697, "epoch": 377} {"train_loss": -30.42085075378418, "global_step": 45698, "epoch": 377} {"train_loss": -30.93779945373535, "global_step": 45699, "epoch": 377} {"train_loss": -32.26496124267578, "global_step": 45700, "epoch": 377} {"train_loss": -32.62689208984375, "global_step": 45701, "epoch": 377} {"train_loss": -31.96236228942871, "global_step": 45702, "epoch": 377} {"train_loss": -31.99542236328125, "global_step": 45703, "epoch": 377} {"train_loss": -32.39447021484375, "global_step": 45704, "epoch": 377} {"train_loss": -32.70355987548828, "global_step": 45705, "epoch": 377} {"train_loss": -32.56476974487305, "global_step": 45706, "epoch": 377} {"train_loss": -31.88492774963379, "global_step": 45707, "epoch": 377} {"train_loss": -32.397525787353516, "global_step": 45708, "epoch": 377} {"train_loss": -32.20070266723633, "global_step": 45709, "epoch": 377} {"train_loss": -32.571044921875, "global_step": 45710, "epoch": 377} {"train_loss": -32.9384880065918, "global_step": 45711, "epoch": 377} {"train_loss": -32.9984245300293, "global_step": 45712, "epoch": 377} {"train_loss": -32.7656364440918, "global_step": 45713, "epoch": 377} {"train_loss": -32.7209587097168, "global_step": 45714, "epoch": 377} {"train_loss": -30.75504493713379, "global_step": 45715, "epoch": 377} {"train_loss": -28.687488555908203, "global_step": 45716, "epoch": 377} {"train_loss": -27.11872673034668, "global_step": 45717, "epoch": 377} {"train_loss": -28.383893966674805, "global_step": 45718, "epoch": 377} {"train_loss": -31.31180191040039, "global_step": 45719, "epoch": 377} {"train_loss": -31.652313232421875, "global_step": 45720, "epoch": 377} {"train_loss": -30.524789810180664, "global_step": 45721, "epoch": 377} {"train_loss": -31.918415069580078, "global_step": 45722, "epoch": 377} {"train_loss": -32.604644775390625, "global_step": 45723, "epoch": 377} {"train_loss": -32.3347053527832, "global_step": 45724, "epoch": 377} {"train_loss": -32.70461654663086, "global_step": 45725, "epoch": 377} {"train_loss": -31.979450225830078, "global_step": 45726, "epoch": 377} {"train_loss": -33.3574333190918, "global_step": 45727, "epoch": 377} {"train_loss": -31.835031509399414, "global_step": 45728, "epoch": 377} {"train_loss": -32.82195281982422, "global_step": 45729, "epoch": 377} {"train_loss": -32.5737419128418, "global_step": 45730, "epoch": 377} {"train_loss": -33.20264434814453, "global_step": 45731, "epoch": 377} {"train_loss": -32.715694427490234, "global_step": 45732, "epoch": 377} {"train_loss": -33.46574401855469, "global_step": 45733, "epoch": 377} {"train_loss": -33.02902603149414, "global_step": 45734, "epoch": 377} {"train_loss": -33.486328125, "global_step": 45735, "epoch": 377} {"train_loss": -33.30289840698242, "global_step": 45736, "epoch": 377} {"train_loss": -32.202794114420236, "global_step": 45737, "epoch": 377, "val_loss": 2657402.25} {"train_loss": -33.31768035888672, "global_step": 45738, "epoch": 378} {"train_loss": -33.37834548950195, "global_step": 45739, "epoch": 378} {"train_loss": -33.45436096191406, "global_step": 45740, "epoch": 378} {"train_loss": -33.58041000366211, "global_step": 45741, "epoch": 378} {"train_loss": -33.6378173828125, "global_step": 45742, "epoch": 378} {"train_loss": -33.40864944458008, "global_step": 45743, "epoch": 378} {"train_loss": -33.316688537597656, "global_step": 45744, "epoch": 378} {"train_loss": -33.821773529052734, "global_step": 45745, "epoch": 378} {"train_loss": -33.67439651489258, "global_step": 45746, "epoch": 378} {"train_loss": -34.04592514038086, "global_step": 45747, "epoch": 378} {"train_loss": -33.53619384765625, "global_step": 45748, "epoch": 378} {"train_loss": -34.15111541748047, "global_step": 45749, "epoch": 378} {"train_loss": -34.01466369628906, "global_step": 45750, "epoch": 378} {"train_loss": -34.18111038208008, "global_step": 45751, "epoch": 378} {"train_loss": -33.68238067626953, "global_step": 45752, "epoch": 378} {"train_loss": -33.74386215209961, "global_step": 45753, "epoch": 378} {"train_loss": -33.479183197021484, "global_step": 45754, "epoch": 378} {"train_loss": -32.3258171081543, "global_step": 45755, "epoch": 378} {"train_loss": -32.4595947265625, "global_step": 45756, "epoch": 378} {"train_loss": -33.73135757446289, "global_step": 45757, "epoch": 378} {"train_loss": -34.16413497924805, "global_step": 45758, "epoch": 378} {"train_loss": -33.98940658569336, "global_step": 45759, "epoch": 378} {"train_loss": -34.03303909301758, "global_step": 45760, "epoch": 378} {"train_loss": -34.45138168334961, "global_step": 45761, "epoch": 378} {"train_loss": -34.74310302734375, "global_step": 45762, "epoch": 378} {"train_loss": -34.248924255371094, "global_step": 45763, "epoch": 378} {"train_loss": -34.690589904785156, "global_step": 45764, "epoch": 378} {"train_loss": -34.137062072753906, "global_step": 45765, "epoch": 378} {"train_loss": -34.31716537475586, "global_step": 45766, "epoch": 378} {"train_loss": -34.58934783935547, "global_step": 45767, "epoch": 378} {"train_loss": -34.38445281982422, "global_step": 45768, "epoch": 378} {"train_loss": -34.41543197631836, "global_step": 45769, "epoch": 378} {"train_loss": -34.050479888916016, "global_step": 45770, "epoch": 378} {"train_loss": -34.143672943115234, "global_step": 45771, "epoch": 378} {"train_loss": -33.8631706237793, "global_step": 45772, "epoch": 378} {"train_loss": -33.60176467895508, "global_step": 45773, "epoch": 378} {"train_loss": -32.69226837158203, "global_step": 45774, "epoch": 378} {"train_loss": -35.0325813293457, "global_step": 45775, "epoch": 378} {"train_loss": -34.03737258911133, "global_step": 45776, "epoch": 378} {"train_loss": -34.60688400268555, "global_step": 45777, "epoch": 378} {"train_loss": -34.2027587890625, "global_step": 45778, "epoch": 378} {"train_loss": -33.67251205444336, "global_step": 45779, "epoch": 378} {"train_loss": -31.519128799438477, "global_step": 45780, "epoch": 378} {"train_loss": -26.526731491088867, "global_step": 45781, "epoch": 378} {"train_loss": -22.536558151245117, "global_step": 45782, "epoch": 378} {"train_loss": -32.61004638671875, "global_step": 45783, "epoch": 378} {"train_loss": -32.061649322509766, "global_step": 45784, "epoch": 378} {"train_loss": -29.601276397705078, "global_step": 45785, "epoch": 378} {"train_loss": -32.5208625793457, "global_step": 45786, "epoch": 378} {"train_loss": -28.80010414123535, "global_step": 45787, "epoch": 378} {"train_loss": -28.567626953125, "global_step": 45788, "epoch": 378} {"train_loss": -30.385684967041016, "global_step": 45789, "epoch": 378} {"train_loss": -31.8642520904541, "global_step": 45790, "epoch": 378} {"train_loss": -32.605987548828125, "global_step": 45791, "epoch": 378} {"train_loss": -31.22254753112793, "global_step": 45792, "epoch": 378} {"train_loss": -32.29313278198242, "global_step": 45793, "epoch": 378} {"train_loss": -31.945697784423828, "global_step": 45794, "epoch": 378} {"train_loss": -34.193023681640625, "global_step": 45795, "epoch": 378} {"train_loss": -32.393184661865234, "global_step": 45796, "epoch": 378} {"train_loss": -33.83113098144531, "global_step": 45797, "epoch": 378} {"train_loss": -33.345401763916016, "global_step": 45798, "epoch": 378} {"train_loss": -34.21030807495117, "global_step": 45799, "epoch": 378} {"train_loss": -33.270233154296875, "global_step": 45800, "epoch": 378} {"train_loss": -33.698219299316406, "global_step": 45801, "epoch": 378} {"train_loss": -34.236244201660156, "global_step": 45802, "epoch": 378} {"train_loss": -34.0005989074707, "global_step": 45803, "epoch": 378} {"train_loss": -34.20906448364258, "global_step": 45804, "epoch": 378} {"train_loss": -33.567996978759766, "global_step": 45805, "epoch": 378} {"train_loss": -33.23725128173828, "global_step": 45806, "epoch": 378} {"train_loss": -33.82990646362305, "global_step": 45807, "epoch": 378} {"train_loss": -33.30302047729492, "global_step": 45808, "epoch": 378} {"train_loss": -32.28927230834961, "global_step": 45809, "epoch": 378} {"train_loss": -31.615447998046875, "global_step": 45810, "epoch": 378} {"train_loss": -32.5980224609375, "global_step": 45811, "epoch": 378} {"train_loss": -33.799007415771484, "global_step": 45812, "epoch": 378} {"train_loss": -33.098121643066406, "global_step": 45813, "epoch": 378} {"train_loss": -31.024185180664062, "global_step": 45814, "epoch": 378} {"train_loss": -31.143842697143555, "global_step": 45815, "epoch": 378} {"train_loss": -31.78729248046875, "global_step": 45816, "epoch": 378} {"train_loss": -28.659332275390625, "global_step": 45817, "epoch": 378} {"train_loss": -30.521997451782227, "global_step": 45818, "epoch": 378} {"train_loss": -31.023426055908203, "global_step": 45819, "epoch": 378} {"train_loss": -33.61461639404297, "global_step": 45820, "epoch": 378} {"train_loss": -32.6532096862793, "global_step": 45821, "epoch": 378} {"train_loss": -33.50215530395508, "global_step": 45822, "epoch": 378} {"train_loss": -33.397491455078125, "global_step": 45823, "epoch": 378} {"train_loss": -32.93337631225586, "global_step": 45824, "epoch": 378} {"train_loss": -33.156829833984375, "global_step": 45825, "epoch": 378} {"train_loss": -32.88999557495117, "global_step": 45826, "epoch": 378} {"train_loss": -33.97026443481445, "global_step": 45827, "epoch": 378} {"train_loss": -32.87715530395508, "global_step": 45828, "epoch": 378} {"train_loss": -33.81463623046875, "global_step": 45829, "epoch": 378} {"train_loss": -33.45752716064453, "global_step": 45830, "epoch": 378} {"train_loss": -33.156978607177734, "global_step": 45831, "epoch": 378} {"train_loss": -33.35512924194336, "global_step": 45832, "epoch": 378} {"train_loss": -33.66851043701172, "global_step": 45833, "epoch": 378} {"train_loss": -33.53435134887695, "global_step": 45834, "epoch": 378} {"train_loss": -33.96487045288086, "global_step": 45835, "epoch": 378} {"train_loss": -33.54631423950195, "global_step": 45836, "epoch": 378} {"train_loss": -33.99641418457031, "global_step": 45837, "epoch": 378} {"train_loss": -33.75661849975586, "global_step": 45838, "epoch": 378} {"train_loss": -34.031185150146484, "global_step": 45839, "epoch": 378} {"train_loss": -33.611351013183594, "global_step": 45840, "epoch": 378} {"train_loss": -34.073890686035156, "global_step": 45841, "epoch": 378} {"train_loss": -34.170284271240234, "global_step": 45842, "epoch": 378} {"train_loss": -33.659053802490234, "global_step": 45843, "epoch": 378} {"train_loss": -34.04277038574219, "global_step": 45844, "epoch": 378} {"train_loss": -33.57967758178711, "global_step": 45845, "epoch": 378} {"train_loss": -33.77489471435547, "global_step": 45846, "epoch": 378} {"train_loss": -33.78999710083008, "global_step": 45847, "epoch": 378} {"train_loss": -33.69881820678711, "global_step": 45848, "epoch": 378} {"train_loss": -33.61642074584961, "global_step": 45849, "epoch": 378} {"train_loss": -33.8232536315918, "global_step": 45850, "epoch": 378} {"train_loss": -32.97591781616211, "global_step": 45851, "epoch": 378} {"train_loss": -34.122467041015625, "global_step": 45852, "epoch": 378} {"train_loss": -33.4443359375, "global_step": 45853, "epoch": 378} {"train_loss": -32.627742767333984, "global_step": 45854, "epoch": 378} {"train_loss": -33.10276412963867, "global_step": 45855, "epoch": 378} {"train_loss": -34.21721267700195, "global_step": 45856, "epoch": 378} {"train_loss": -34.46565628051758, "global_step": 45857, "epoch": 378} {"train_loss": -33.10959603175644, "global_step": 45858, "epoch": 378, "val_loss": 2712059.25} {"train_loss": -34.2281379699707, "global_step": 45859, "epoch": 379} {"train_loss": -33.475337982177734, "global_step": 45860, "epoch": 379} {"train_loss": -32.6385612487793, "global_step": 45861, "epoch": 379} {"train_loss": -34.27625274658203, "global_step": 45862, "epoch": 379} {"train_loss": -33.33363723754883, "global_step": 45863, "epoch": 379} {"train_loss": -34.70985794067383, "global_step": 45864, "epoch": 379} {"train_loss": -34.06136703491211, "global_step": 45865, "epoch": 379} {"train_loss": -34.57359313964844, "global_step": 45866, "epoch": 379} {"train_loss": -34.54319381713867, "global_step": 45867, "epoch": 379} {"train_loss": -34.64194869995117, "global_step": 45868, "epoch": 379} {"train_loss": -34.54820251464844, "global_step": 45869, "epoch": 379} {"train_loss": -34.99106979370117, "global_step": 45870, "epoch": 379} {"train_loss": -34.36376953125, "global_step": 45871, "epoch": 379} {"train_loss": -34.578773498535156, "global_step": 45872, "epoch": 379} {"train_loss": -34.66191482543945, "global_step": 45873, "epoch": 379} {"train_loss": -34.70803451538086, "global_step": 45874, "epoch": 379} {"train_loss": -34.385292053222656, "global_step": 45875, "epoch": 379} {"train_loss": -34.62150192260742, "global_step": 45876, "epoch": 379} {"train_loss": -35.023712158203125, "global_step": 45877, "epoch": 379} {"train_loss": -34.58325958251953, "global_step": 45878, "epoch": 379} {"train_loss": -35.03385543823242, "global_step": 45879, "epoch": 379} {"train_loss": -34.7130012512207, "global_step": 45880, "epoch": 379} {"train_loss": -34.755489349365234, "global_step": 45881, "epoch": 379} {"train_loss": -34.78727340698242, "global_step": 45882, "epoch": 379} {"train_loss": -35.10399627685547, "global_step": 45883, "epoch": 379} {"train_loss": -35.073570251464844, "global_step": 45884, "epoch": 379} {"train_loss": -35.248077392578125, "global_step": 45885, "epoch": 379} {"train_loss": -35.12720489501953, "global_step": 45886, "epoch": 379} {"train_loss": -34.71316909790039, "global_step": 45887, "epoch": 379} {"train_loss": -35.423248291015625, "global_step": 45888, "epoch": 379} {"train_loss": -35.02263641357422, "global_step": 45889, "epoch": 379} {"train_loss": -35.139034271240234, "global_step": 45890, "epoch": 379} {"train_loss": -33.48170852661133, "global_step": 45891, "epoch": 379} {"train_loss": -32.1761589050293, "global_step": 45892, "epoch": 379} {"train_loss": -32.94868469238281, "global_step": 45893, "epoch": 379} {"train_loss": -32.954036712646484, "global_step": 45894, "epoch": 379} {"train_loss": -33.0770263671875, "global_step": 45895, "epoch": 379} {"train_loss": -30.894575119018555, "global_step": 45896, "epoch": 379} {"train_loss": -24.04337501525879, "global_step": 45897, "epoch": 379} {"train_loss": -25.550188064575195, "global_step": 45898, "epoch": 379} {"train_loss": -35.060665130615234, "global_step": 45899, "epoch": 379} {"train_loss": -26.3812313079834, "global_step": 45900, "epoch": 379} {"train_loss": -30.7850284576416, "global_step": 45901, "epoch": 379} {"train_loss": -33.47982406616211, "global_step": 45902, "epoch": 379} {"train_loss": -32.40658950805664, "global_step": 45903, "epoch": 379} {"train_loss": -32.65398025512695, "global_step": 45904, "epoch": 379} {"train_loss": -32.120792388916016, "global_step": 45905, "epoch": 379} {"train_loss": -32.79604721069336, "global_step": 45906, "epoch": 379} {"train_loss": -33.85689163208008, "global_step": 45907, "epoch": 379} {"train_loss": -33.267765045166016, "global_step": 45908, "epoch": 379} {"train_loss": -33.55462646484375, "global_step": 45909, "epoch": 379} {"train_loss": -34.33720016479492, "global_step": 45910, "epoch": 379} {"train_loss": -33.4555778503418, "global_step": 45911, "epoch": 379} {"train_loss": -33.586299896240234, "global_step": 45912, "epoch": 379} {"train_loss": -34.087799072265625, "global_step": 45913, "epoch": 379} {"train_loss": -33.85247802734375, "global_step": 45914, "epoch": 379} {"train_loss": -33.38578414916992, "global_step": 45915, "epoch": 379} {"train_loss": -34.575008392333984, "global_step": 45916, "epoch": 379} {"train_loss": -34.20748519897461, "global_step": 45917, "epoch": 379} {"train_loss": -34.1396484375, "global_step": 45918, "epoch": 379} {"train_loss": -33.956451416015625, "global_step": 45919, "epoch": 379} {"train_loss": -34.211647033691406, "global_step": 45920, "epoch": 379} {"train_loss": -34.5373649597168, "global_step": 45921, "epoch": 379} {"train_loss": -34.47054672241211, "global_step": 45922, "epoch": 379} {"train_loss": -34.39829635620117, "global_step": 45923, "epoch": 379} {"train_loss": -33.956878662109375, "global_step": 45924, "epoch": 379} {"train_loss": -34.636104583740234, "global_step": 45925, "epoch": 379} {"train_loss": -33.947906494140625, "global_step": 45926, "epoch": 379} {"train_loss": -34.8545036315918, "global_step": 45927, "epoch": 379} {"train_loss": -33.9527587890625, "global_step": 45928, "epoch": 379} {"train_loss": -34.73276138305664, "global_step": 45929, "epoch": 379} {"train_loss": -34.855045318603516, "global_step": 45930, "epoch": 379} {"train_loss": -35.101314544677734, "global_step": 45931, "epoch": 379} {"train_loss": -34.65583038330078, "global_step": 45932, "epoch": 379} {"train_loss": -35.020118713378906, "global_step": 45933, "epoch": 379} {"train_loss": -32.259159088134766, "global_step": 45934, "epoch": 379} {"train_loss": -33.64730453491211, "global_step": 45935, "epoch": 379} {"train_loss": -34.689998626708984, "global_step": 45936, "epoch": 379} {"train_loss": -34.42721176147461, "global_step": 45937, "epoch": 379} {"train_loss": -34.072998046875, "global_step": 45938, "epoch": 379} {"train_loss": -33.909828186035156, "global_step": 45939, "epoch": 379} {"train_loss": -34.52434158325195, "global_step": 45940, "epoch": 379} {"train_loss": -34.45013427734375, "global_step": 45941, "epoch": 379} {"train_loss": -34.360294342041016, "global_step": 45942, "epoch": 379} {"train_loss": -34.85542297363281, "global_step": 45943, "epoch": 379} {"train_loss": -34.37554931640625, "global_step": 45944, "epoch": 379} {"train_loss": -34.46819305419922, "global_step": 45945, "epoch": 379} {"train_loss": -34.557395935058594, "global_step": 45946, "epoch": 379} {"train_loss": -35.0180778503418, "global_step": 45947, "epoch": 379} {"train_loss": -34.32316207885742, "global_step": 45948, "epoch": 379} {"train_loss": -33.843772888183594, "global_step": 45949, "epoch": 379} {"train_loss": -33.717105865478516, "global_step": 45950, "epoch": 379} {"train_loss": -33.1961555480957, "global_step": 45951, "epoch": 379} {"train_loss": -33.853450775146484, "global_step": 45952, "epoch": 379} {"train_loss": -33.666900634765625, "global_step": 45953, "epoch": 379} {"train_loss": -34.32337188720703, "global_step": 45954, "epoch": 379} {"train_loss": -33.10435104370117, "global_step": 45955, "epoch": 379} {"train_loss": -31.87113380432129, "global_step": 45956, "epoch": 379} {"train_loss": -27.86767578125, "global_step": 45957, "epoch": 379} {"train_loss": -21.63643455505371, "global_step": 45958, "epoch": 379} {"train_loss": -26.048120498657227, "global_step": 45959, "epoch": 379} {"train_loss": -33.558902740478516, "global_step": 45960, "epoch": 379} {"train_loss": -28.429296493530273, "global_step": 45961, "epoch": 379} {"train_loss": -33.780696868896484, "global_step": 45962, "epoch": 379} {"train_loss": -30.379072189331055, "global_step": 45963, "epoch": 379} {"train_loss": -33.35280227661133, "global_step": 45964, "epoch": 379} {"train_loss": -29.880929946899414, "global_step": 45965, "epoch": 379} {"train_loss": -34.27299880981445, "global_step": 45966, "epoch": 379} {"train_loss": -32.21112060546875, "global_step": 45967, "epoch": 379} {"train_loss": -33.30206298828125, "global_step": 45968, "epoch": 379} {"train_loss": -32.916107177734375, "global_step": 45969, "epoch": 379} {"train_loss": -32.573020935058594, "global_step": 45970, "epoch": 379} {"train_loss": -32.806514739990234, "global_step": 45971, "epoch": 379} {"train_loss": -32.87709045410156, "global_step": 45972, "epoch": 379} {"train_loss": -33.4509162902832, "global_step": 45973, "epoch": 379} {"train_loss": -32.921504974365234, "global_step": 45974, "epoch": 379} {"train_loss": -33.476985931396484, "global_step": 45975, "epoch": 379} {"train_loss": -33.74497604370117, "global_step": 45976, "epoch": 379} {"train_loss": -33.399192810058594, "global_step": 45977, "epoch": 379} {"train_loss": -33.825374603271484, "global_step": 45978, "epoch": 379} {"train_loss": -33.411381540219644, "global_step": 45979, "epoch": 379, "val_loss": 2646054.0} {"train_loss": -34.00419235229492, "global_step": 45980, "epoch": 380} {"train_loss": -34.3953742980957, "global_step": 45981, "epoch": 380} {"train_loss": -33.538753509521484, "global_step": 45982, "epoch": 380} {"train_loss": -33.731868743896484, "global_step": 45983, "epoch": 380} {"train_loss": -33.87575912475586, "global_step": 45984, "epoch": 380} {"train_loss": -33.936729431152344, "global_step": 45985, "epoch": 380} {"train_loss": -33.715572357177734, "global_step": 45986, "epoch": 380} {"train_loss": -34.176666259765625, "global_step": 45987, "epoch": 380} {"train_loss": -34.16410446166992, "global_step": 45988, "epoch": 380} {"train_loss": -33.9630241394043, "global_step": 45989, "epoch": 380} {"train_loss": -34.03299331665039, "global_step": 45990, "epoch": 380} {"train_loss": -33.82862091064453, "global_step": 45991, "epoch": 380} {"train_loss": -34.05907440185547, "global_step": 45992, "epoch": 380} {"train_loss": -34.1260871887207, "global_step": 45993, "epoch": 380} {"train_loss": -34.636898040771484, "global_step": 45994, "epoch": 380} {"train_loss": -34.74939727783203, "global_step": 45995, "epoch": 380} {"train_loss": -34.287689208984375, "global_step": 45996, "epoch": 380} {"train_loss": -34.46013259887695, "global_step": 45997, "epoch": 380} {"train_loss": -34.27682113647461, "global_step": 45998, "epoch": 380} {"train_loss": -33.259185791015625, "global_step": 45999, "epoch": 380} {"train_loss": -33.79669952392578, "global_step": 46000, "epoch": 380} {"train_loss": -33.76599884033203, "global_step": 46001, "epoch": 380} {"train_loss": -32.76836013793945, "global_step": 46002, "epoch": 380} {"train_loss": -33.6961784362793, "global_step": 46003, "epoch": 380} {"train_loss": -33.84558868408203, "global_step": 46004, "epoch": 380} {"train_loss": -32.43681716918945, "global_step": 46005, "epoch": 380} {"train_loss": -32.76082229614258, "global_step": 46006, "epoch": 380} {"train_loss": -32.663631439208984, "global_step": 46007, "epoch": 380} {"train_loss": -33.726112365722656, "global_step": 46008, "epoch": 380} {"train_loss": -33.0344352722168, "global_step": 46009, "epoch": 380} {"train_loss": -31.42876625061035, "global_step": 46010, "epoch": 380} {"train_loss": -31.721607208251953, "global_step": 46011, "epoch": 380} {"train_loss": -32.76201248168945, "global_step": 46012, "epoch": 380} {"train_loss": -31.69196891784668, "global_step": 46013, "epoch": 380} {"train_loss": -31.51590347290039, "global_step": 46014, "epoch": 380} {"train_loss": -32.3775749206543, "global_step": 46015, "epoch": 380} {"train_loss": -31.515100479125977, "global_step": 46016, "epoch": 380} {"train_loss": -32.436073303222656, "global_step": 46017, "epoch": 380} {"train_loss": -31.531827926635742, "global_step": 46018, "epoch": 380} {"train_loss": -29.329999923706055, "global_step": 46019, "epoch": 380} {"train_loss": -30.87623405456543, "global_step": 46020, "epoch": 380} {"train_loss": -32.46316146850586, "global_step": 46021, "epoch": 380} {"train_loss": -32.03396224975586, "global_step": 46022, "epoch": 380} {"train_loss": -29.142337799072266, "global_step": 46023, "epoch": 380} {"train_loss": -32.75968551635742, "global_step": 46024, "epoch": 380} {"train_loss": -30.185882568359375, "global_step": 46025, "epoch": 380} {"train_loss": -32.95744705200195, "global_step": 46026, "epoch": 380} {"train_loss": -31.620824813842773, "global_step": 46027, "epoch": 380} {"train_loss": -30.985233306884766, "global_step": 46028, "epoch": 380} {"train_loss": -32.343421936035156, "global_step": 46029, "epoch": 380} {"train_loss": -31.767316818237305, "global_step": 46030, "epoch": 380} {"train_loss": -30.911100387573242, "global_step": 46031, "epoch": 380} {"train_loss": -32.944759368896484, "global_step": 46032, "epoch": 380} {"train_loss": -29.771738052368164, "global_step": 46033, "epoch": 380} {"train_loss": -31.863073348999023, "global_step": 46034, "epoch": 380} {"train_loss": -32.41872024536133, "global_step": 46035, "epoch": 380} {"train_loss": -31.98377799987793, "global_step": 46036, "epoch": 380} {"train_loss": -29.271398544311523, "global_step": 46037, "epoch": 380} {"train_loss": -31.282495498657227, "global_step": 46038, "epoch": 380} {"train_loss": -31.48174476623535, "global_step": 46039, "epoch": 380} {"train_loss": -32.51121139526367, "global_step": 46040, "epoch": 380} {"train_loss": -32.15456008911133, "global_step": 46041, "epoch": 380} {"train_loss": -31.626386642456055, "global_step": 46042, "epoch": 380} {"train_loss": -32.40810775756836, "global_step": 46043, "epoch": 380} {"train_loss": -30.691495895385742, "global_step": 46044, "epoch": 380} {"train_loss": -32.16523742675781, "global_step": 46045, "epoch": 380} {"train_loss": -32.1341667175293, "global_step": 46046, "epoch": 380} {"train_loss": -32.4684944152832, "global_step": 46047, "epoch": 380} {"train_loss": -31.760251998901367, "global_step": 46048, "epoch": 380} {"train_loss": -31.06377601623535, "global_step": 46049, "epoch": 380} {"train_loss": -32.28392791748047, "global_step": 46050, "epoch": 380} {"train_loss": -31.8624324798584, "global_step": 46051, "epoch": 380} {"train_loss": -32.13127517700195, "global_step": 46052, "epoch": 380} {"train_loss": -32.558677673339844, "global_step": 46053, "epoch": 380} {"train_loss": -32.66841125488281, "global_step": 46054, "epoch": 380} {"train_loss": -33.36988067626953, "global_step": 46055, "epoch": 380} {"train_loss": -32.6967658996582, "global_step": 46056, "epoch": 380} {"train_loss": -32.143470764160156, "global_step": 46057, "epoch": 380} {"train_loss": -32.672088623046875, "global_step": 46058, "epoch": 380} {"train_loss": -32.99646759033203, "global_step": 46059, "epoch": 380} {"train_loss": -33.45040512084961, "global_step": 46060, "epoch": 380} {"train_loss": -31.85540199279785, "global_step": 46061, "epoch": 380} {"train_loss": -32.11617660522461, "global_step": 46062, "epoch": 380} {"train_loss": -33.01814270019531, "global_step": 46063, "epoch": 380} {"train_loss": -33.532833099365234, "global_step": 46064, "epoch": 380} {"train_loss": -32.729366302490234, "global_step": 46065, "epoch": 380} {"train_loss": -33.41660690307617, "global_step": 46066, "epoch": 380} {"train_loss": -33.301509857177734, "global_step": 46067, "epoch": 380} {"train_loss": -33.7039680480957, "global_step": 46068, "epoch": 380} {"train_loss": -33.277156829833984, "global_step": 46069, "epoch": 380} {"train_loss": -33.52362823486328, "global_step": 46070, "epoch": 380} {"train_loss": -33.722557067871094, "global_step": 46071, "epoch": 380} {"train_loss": -33.841915130615234, "global_step": 46072, "epoch": 380} {"train_loss": -33.9842643737793, "global_step": 46073, "epoch": 380} {"train_loss": -33.840476989746094, "global_step": 46074, "epoch": 380} {"train_loss": -33.75157165527344, "global_step": 46075, "epoch": 380} {"train_loss": -33.96142578125, "global_step": 46076, "epoch": 380} {"train_loss": -33.61048126220703, "global_step": 46077, "epoch": 380} {"train_loss": -34.09989547729492, "global_step": 46078, "epoch": 380} {"train_loss": -33.78022384643555, "global_step": 46079, "epoch": 380} {"train_loss": -33.3065071105957, "global_step": 46080, "epoch": 380} {"train_loss": -31.91657829284668, "global_step": 46081, "epoch": 380} {"train_loss": -31.132062911987305, "global_step": 46082, "epoch": 380} {"train_loss": -30.627826690673828, "global_step": 46083, "epoch": 380} {"train_loss": -33.77401351928711, "global_step": 46084, "epoch": 380} {"train_loss": -33.611839294433594, "global_step": 46085, "epoch": 380} {"train_loss": -30.70711326599121, "global_step": 46086, "epoch": 380} {"train_loss": -33.74557113647461, "global_step": 46087, "epoch": 380} {"train_loss": -32.478878021240234, "global_step": 46088, "epoch": 380} {"train_loss": -32.862464904785156, "global_step": 46089, "epoch": 380} {"train_loss": -33.9398307800293, "global_step": 46090, "epoch": 380} {"train_loss": -33.40009689331055, "global_step": 46091, "epoch": 380} {"train_loss": -33.874393463134766, "global_step": 46092, "epoch": 380} {"train_loss": -33.944480895996094, "global_step": 46093, "epoch": 380} {"train_loss": -33.9105224609375, "global_step": 46094, "epoch": 380} {"train_loss": -33.964599609375, "global_step": 46095, "epoch": 380} {"train_loss": -33.48102951049805, "global_step": 46096, "epoch": 380} {"train_loss": -34.593746185302734, "global_step": 46097, "epoch": 380} {"train_loss": -34.45708084106445, "global_step": 46098, "epoch": 380} {"train_loss": -34.24696731567383, "global_step": 46099, "epoch": 380} {"train_loss": -32.81533154574308, "global_step": 46100, "epoch": 380, "val_loss": 2624432.0} {"train_loss": -34.079132080078125, "global_step": 46101, "epoch": 381} {"train_loss": -34.25553512573242, "global_step": 46102, "epoch": 381} {"train_loss": -34.5136833190918, "global_step": 46103, "epoch": 381} {"train_loss": -34.45960235595703, "global_step": 46104, "epoch": 381} {"train_loss": -34.350318908691406, "global_step": 46105, "epoch": 381} {"train_loss": -35.14689636230469, "global_step": 46106, "epoch": 381} {"train_loss": -34.38532257080078, "global_step": 46107, "epoch": 381} {"train_loss": -35.238555908203125, "global_step": 46108, "epoch": 381} {"train_loss": -34.7662239074707, "global_step": 46109, "epoch": 381} {"train_loss": -34.31806564331055, "global_step": 46110, "epoch": 381} {"train_loss": -34.9517936706543, "global_step": 46111, "epoch": 381} {"train_loss": -33.871212005615234, "global_step": 46112, "epoch": 381} {"train_loss": -34.42632293701172, "global_step": 46113, "epoch": 381} {"train_loss": -34.75094985961914, "global_step": 46114, "epoch": 381} {"train_loss": -34.53158950805664, "global_step": 46115, "epoch": 381} {"train_loss": -32.63960647583008, "global_step": 46116, "epoch": 381} {"train_loss": -31.186826705932617, "global_step": 46117, "epoch": 381} {"train_loss": -29.266061782836914, "global_step": 46118, "epoch": 381} {"train_loss": -31.638141632080078, "global_step": 46119, "epoch": 381} {"train_loss": -35.283775329589844, "global_step": 46120, "epoch": 381} {"train_loss": -32.87722396850586, "global_step": 46121, "epoch": 381} {"train_loss": -33.909488677978516, "global_step": 46122, "epoch": 381} {"train_loss": -34.47014236450195, "global_step": 46123, "epoch": 381} {"train_loss": -33.8738899230957, "global_step": 46124, "epoch": 381} {"train_loss": -30.842620849609375, "global_step": 46125, "epoch": 381} {"train_loss": -33.697486877441406, "global_step": 46126, "epoch": 381} {"train_loss": -31.361249923706055, "global_step": 46127, "epoch": 381} {"train_loss": -28.780609130859375, "global_step": 46128, "epoch": 381} {"train_loss": -33.95929718017578, "global_step": 46129, "epoch": 381} {"train_loss": -31.82684898376465, "global_step": 46130, "epoch": 381} {"train_loss": -34.5854377746582, "global_step": 46131, "epoch": 381} {"train_loss": -33.568241119384766, "global_step": 46132, "epoch": 381} {"train_loss": -33.65485382080078, "global_step": 46133, "epoch": 381} {"train_loss": -33.917503356933594, "global_step": 46134, "epoch": 381} {"train_loss": -34.21372604370117, "global_step": 46135, "epoch": 381} {"train_loss": -32.86460494995117, "global_step": 46136, "epoch": 381} {"train_loss": -33.967342376708984, "global_step": 46137, "epoch": 381} {"train_loss": -33.710079193115234, "global_step": 46138, "epoch": 381} {"train_loss": -33.88090896606445, "global_step": 46139, "epoch": 381} {"train_loss": -33.99443435668945, "global_step": 46140, "epoch": 381} {"train_loss": -34.59995651245117, "global_step": 46141, "epoch": 381} {"train_loss": -34.26300048828125, "global_step": 46142, "epoch": 381} {"train_loss": -34.23231887817383, "global_step": 46143, "epoch": 381} {"train_loss": -34.22736740112305, "global_step": 46144, "epoch": 381} {"train_loss": -33.675880432128906, "global_step": 46145, "epoch": 381} {"train_loss": -34.59705352783203, "global_step": 46146, "epoch": 381} {"train_loss": -34.721282958984375, "global_step": 46147, "epoch": 381} {"train_loss": -34.742469787597656, "global_step": 46148, "epoch": 381} {"train_loss": -33.954524993896484, "global_step": 46149, "epoch": 381} {"train_loss": -34.74095916748047, "global_step": 46150, "epoch": 381} {"train_loss": -34.50873947143555, "global_step": 46151, "epoch": 381} {"train_loss": -34.7568473815918, "global_step": 46152, "epoch": 381} {"train_loss": -34.96998596191406, "global_step": 46153, "epoch": 381} {"train_loss": -34.69812774658203, "global_step": 46154, "epoch": 381} {"train_loss": -34.58222579956055, "global_step": 46155, "epoch": 381} {"train_loss": -35.381465911865234, "global_step": 46156, "epoch": 381} {"train_loss": -34.68867111206055, "global_step": 46157, "epoch": 381} {"train_loss": -34.60563278198242, "global_step": 46158, "epoch": 381} {"train_loss": -35.211151123046875, "global_step": 46159, "epoch": 381} {"train_loss": -35.1170768737793, "global_step": 46160, "epoch": 381} {"train_loss": -34.823028564453125, "global_step": 46161, "epoch": 381} {"train_loss": -35.45337677001953, "global_step": 46162, "epoch": 381} {"train_loss": -34.63687515258789, "global_step": 46163, "epoch": 381} {"train_loss": -35.74739074707031, "global_step": 46164, "epoch": 381} {"train_loss": -35.268653869628906, "global_step": 46165, "epoch": 381} {"train_loss": -34.73198318481445, "global_step": 46166, "epoch": 381} {"train_loss": -35.2547492980957, "global_step": 46167, "epoch": 381} {"train_loss": -34.979888916015625, "global_step": 46168, "epoch": 381} {"train_loss": -34.30028533935547, "global_step": 46169, "epoch": 381} {"train_loss": -33.35287857055664, "global_step": 46170, "epoch": 381} {"train_loss": -26.910663604736328, "global_step": 46171, "epoch": 381} {"train_loss": -14.930005073547363, "global_step": 46172, "epoch": 381} {"train_loss": -6.525154113769531, "global_step": 46173, "epoch": 381} {"train_loss": -32.50602340698242, "global_step": 46174, "epoch": 381} {"train_loss": -20.99481201171875, "global_step": 46175, "epoch": 381} {"train_loss": -28.923858642578125, "global_step": 46176, "epoch": 381} {"train_loss": -27.019287109375, "global_step": 46177, "epoch": 381} {"train_loss": -33.35649490356445, "global_step": 46178, "epoch": 381} {"train_loss": -28.793745040893555, "global_step": 46179, "epoch": 381} {"train_loss": -32.09259796142578, "global_step": 46180, "epoch": 381} {"train_loss": -33.65104293823242, "global_step": 46181, "epoch": 381} {"train_loss": -31.649219512939453, "global_step": 46182, "epoch": 381} {"train_loss": -31.18836784362793, "global_step": 46183, "epoch": 381} {"train_loss": -33.55410385131836, "global_step": 46184, "epoch": 381} {"train_loss": -34.04545211791992, "global_step": 46185, "epoch": 381} {"train_loss": -32.57423782348633, "global_step": 46186, "epoch": 381} {"train_loss": -32.54338455200195, "global_step": 46187, "epoch": 381} {"train_loss": -32.63486862182617, "global_step": 46188, "epoch": 381} {"train_loss": -33.80530548095703, "global_step": 46189, "epoch": 381} {"train_loss": -34.17083740234375, "global_step": 46190, "epoch": 381} {"train_loss": -33.4986686706543, "global_step": 46191, "epoch": 381} {"train_loss": -32.98134994506836, "global_step": 46192, "epoch": 381} {"train_loss": -33.484134674072266, "global_step": 46193, "epoch": 381} {"train_loss": -34.41082763671875, "global_step": 46194, "epoch": 381} {"train_loss": -33.540462493896484, "global_step": 46195, "epoch": 381} {"train_loss": -33.9449348449707, "global_step": 46196, "epoch": 381} {"train_loss": -34.36181640625, "global_step": 46197, "epoch": 381} {"train_loss": -33.80099105834961, "global_step": 46198, "epoch": 381} {"train_loss": -33.42253875732422, "global_step": 46199, "epoch": 381} {"train_loss": -34.25038146972656, "global_step": 46200, "epoch": 381} {"train_loss": -33.868064880371094, "global_step": 46201, "epoch": 381} {"train_loss": -34.72344970703125, "global_step": 46202, "epoch": 381} {"train_loss": -33.784423828125, "global_step": 46203, "epoch": 381} {"train_loss": -33.07100296020508, "global_step": 46204, "epoch": 381} {"train_loss": -33.64348220825195, "global_step": 46205, "epoch": 381} {"train_loss": -33.11234664916992, "global_step": 46206, "epoch": 381} {"train_loss": -33.02698516845703, "global_step": 46207, "epoch": 381} {"train_loss": -32.79608917236328, "global_step": 46208, "epoch": 381} {"train_loss": -30.570959091186523, "global_step": 46209, "epoch": 381} {"train_loss": -30.0845890045166, "global_step": 46210, "epoch": 381} {"train_loss": -32.24768829345703, "global_step": 46211, "epoch": 381} {"train_loss": -33.167640686035156, "global_step": 46212, "epoch": 381} {"train_loss": -31.32620620727539, "global_step": 46213, "epoch": 381} {"train_loss": -31.669050216674805, "global_step": 46214, "epoch": 381} {"train_loss": -34.25644302368164, "global_step": 46215, "epoch": 381} {"train_loss": -31.9346981048584, "global_step": 46216, "epoch": 381} {"train_loss": -33.99887466430664, "global_step": 46217, "epoch": 381} {"train_loss": -32.4249153137207, "global_step": 46218, "epoch": 381} {"train_loss": -33.87990951538086, "global_step": 46219, "epoch": 381} {"train_loss": -33.9427490234375, "global_step": 46220, "epoch": 381} {"train_loss": -33.004105820143515, "global_step": 46221, "epoch": 381, "val_loss": 2678910.75} {"train_loss": -33.137447357177734, "global_step": 46222, "epoch": 382} {"train_loss": -33.961936950683594, "global_step": 46223, "epoch": 382} {"train_loss": -33.349456787109375, "global_step": 46224, "epoch": 382} {"train_loss": -34.441871643066406, "global_step": 46225, "epoch": 382} {"train_loss": -34.09844970703125, "global_step": 46226, "epoch": 382} {"train_loss": -33.36509323120117, "global_step": 46227, "epoch": 382} {"train_loss": -34.18354034423828, "global_step": 46228, "epoch": 382} {"train_loss": -31.867292404174805, "global_step": 46229, "epoch": 382} {"train_loss": -33.16398620605469, "global_step": 46230, "epoch": 382} {"train_loss": -32.98848342895508, "global_step": 46231, "epoch": 382} {"train_loss": -33.79256057739258, "global_step": 46232, "epoch": 382} {"train_loss": -33.252235412597656, "global_step": 46233, "epoch": 382} {"train_loss": -33.287269592285156, "global_step": 46234, "epoch": 382} {"train_loss": -33.148799896240234, "global_step": 46235, "epoch": 382} {"train_loss": -32.40433120727539, "global_step": 46236, "epoch": 382} {"train_loss": -34.29022979736328, "global_step": 46237, "epoch": 382} {"train_loss": -33.22701644897461, "global_step": 46238, "epoch": 382} {"train_loss": -33.25289535522461, "global_step": 46239, "epoch": 382} {"train_loss": -33.290855407714844, "global_step": 46240, "epoch": 382} {"train_loss": -33.2765998840332, "global_step": 46241, "epoch": 382} {"train_loss": -34.011436462402344, "global_step": 46242, "epoch": 382} {"train_loss": -32.97579574584961, "global_step": 46243, "epoch": 382} {"train_loss": -33.847713470458984, "global_step": 46244, "epoch": 382} {"train_loss": -33.09930419921875, "global_step": 46245, "epoch": 382} {"train_loss": -32.633872985839844, "global_step": 46246, "epoch": 382} {"train_loss": -28.436079025268555, "global_step": 46247, "epoch": 382} {"train_loss": -25.088651657104492, "global_step": 46248, "epoch": 382} {"train_loss": -26.045312881469727, "global_step": 46249, "epoch": 382} {"train_loss": -33.201751708984375, "global_step": 46250, "epoch": 382} {"train_loss": -29.833181381225586, "global_step": 46251, "epoch": 382} {"train_loss": -31.4593448638916, "global_step": 46252, "epoch": 382} {"train_loss": -32.5884895324707, "global_step": 46253, "epoch": 382} {"train_loss": -31.622970581054688, "global_step": 46254, "epoch": 382} {"train_loss": -33.310482025146484, "global_step": 46255, "epoch": 382} {"train_loss": -32.12553787231445, "global_step": 46256, "epoch": 382} {"train_loss": -32.78831100463867, "global_step": 46257, "epoch": 382} {"train_loss": -33.4016227722168, "global_step": 46258, "epoch": 382} {"train_loss": -32.98648452758789, "global_step": 46259, "epoch": 382} {"train_loss": -33.35419464111328, "global_step": 46260, "epoch": 382} {"train_loss": -33.16042709350586, "global_step": 46261, "epoch": 382} {"train_loss": -33.27981185913086, "global_step": 46262, "epoch": 382} {"train_loss": -33.29987716674805, "global_step": 46263, "epoch": 382} {"train_loss": -33.4610595703125, "global_step": 46264, "epoch": 382} {"train_loss": -33.748592376708984, "global_step": 46265, "epoch": 382} {"train_loss": -33.629093170166016, "global_step": 46266, "epoch": 382} {"train_loss": -34.07052230834961, "global_step": 46267, "epoch": 382} {"train_loss": -33.23003005981445, "global_step": 46268, "epoch": 382} {"train_loss": -33.27451705932617, "global_step": 46269, "epoch": 382} {"train_loss": -33.85244369506836, "global_step": 46270, "epoch": 382} {"train_loss": -32.91213607788086, "global_step": 46271, "epoch": 382} {"train_loss": -32.93765640258789, "global_step": 46272, "epoch": 382} {"train_loss": -33.74848556518555, "global_step": 46273, "epoch": 382} {"train_loss": -33.67841720581055, "global_step": 46274, "epoch": 382} {"train_loss": -32.57338333129883, "global_step": 46275, "epoch": 382} {"train_loss": -33.73789978027344, "global_step": 46276, "epoch": 382} {"train_loss": -32.64653015136719, "global_step": 46277, "epoch": 382} {"train_loss": -33.601741790771484, "global_step": 46278, "epoch": 382} {"train_loss": -32.569252014160156, "global_step": 46279, "epoch": 382} {"train_loss": -33.47181701660156, "global_step": 46280, "epoch": 382} {"train_loss": -32.21249008178711, "global_step": 46281, "epoch": 382} {"train_loss": -32.83790969848633, "global_step": 46282, "epoch": 382} {"train_loss": -32.50180435180664, "global_step": 46283, "epoch": 382} {"train_loss": -31.7747859954834, "global_step": 46284, "epoch": 382} {"train_loss": -32.02165603637695, "global_step": 46285, "epoch": 382} {"train_loss": -31.09271812438965, "global_step": 46286, "epoch": 382} {"train_loss": -32.0596809387207, "global_step": 46287, "epoch": 382} {"train_loss": -32.23922348022461, "global_step": 46288, "epoch": 382} {"train_loss": -31.382673263549805, "global_step": 46289, "epoch": 382} {"train_loss": -32.565711975097656, "global_step": 46290, "epoch": 382} {"train_loss": -31.051010131835938, "global_step": 46291, "epoch": 382} {"train_loss": -31.758441925048828, "global_step": 46292, "epoch": 382} {"train_loss": -33.26681137084961, "global_step": 46293, "epoch": 382} {"train_loss": -32.92292404174805, "global_step": 46294, "epoch": 382} {"train_loss": -31.754383087158203, "global_step": 46295, "epoch": 382} {"train_loss": -33.17625045776367, "global_step": 46296, "epoch": 382} {"train_loss": -33.72811508178711, "global_step": 46297, "epoch": 382} {"train_loss": -32.582305908203125, "global_step": 46298, "epoch": 382} {"train_loss": -32.695316314697266, "global_step": 46299, "epoch": 382} {"train_loss": -32.89223098754883, "global_step": 46300, "epoch": 382} {"train_loss": -33.32706832885742, "global_step": 46301, "epoch": 382} {"train_loss": -33.25893783569336, "global_step": 46302, "epoch": 382} {"train_loss": -33.238739013671875, "global_step": 46303, "epoch": 382} {"train_loss": -33.588401794433594, "global_step": 46304, "epoch": 382} {"train_loss": -33.674808502197266, "global_step": 46305, "epoch": 382} {"train_loss": -33.1201286315918, "global_step": 46306, "epoch": 382} {"train_loss": -33.44020080566406, "global_step": 46307, "epoch": 382} {"train_loss": -33.41649627685547, "global_step": 46308, "epoch": 382} {"train_loss": -32.900550842285156, "global_step": 46309, "epoch": 382} {"train_loss": -33.41896438598633, "global_step": 46310, "epoch": 382} {"train_loss": -34.20841598510742, "global_step": 46311, "epoch": 382} {"train_loss": -31.5906925201416, "global_step": 46312, "epoch": 382} {"train_loss": -33.862789154052734, "global_step": 46313, "epoch": 382} {"train_loss": -33.089820861816406, "global_step": 46314, "epoch": 382} {"train_loss": -33.00313949584961, "global_step": 46315, "epoch": 382} {"train_loss": -33.135860443115234, "global_step": 46316, "epoch": 382} {"train_loss": -33.869789123535156, "global_step": 46317, "epoch": 382} {"train_loss": -33.38711166381836, "global_step": 46318, "epoch": 382} {"train_loss": -33.142696380615234, "global_step": 46319, "epoch": 382} {"train_loss": -33.32301712036133, "global_step": 46320, "epoch": 382} {"train_loss": -32.22727584838867, "global_step": 46321, "epoch": 382} {"train_loss": -34.11214828491211, "global_step": 46322, "epoch": 382} {"train_loss": -33.3613166809082, "global_step": 46323, "epoch": 382} {"train_loss": -32.621883392333984, "global_step": 46324, "epoch": 382} {"train_loss": -33.63562774658203, "global_step": 46325, "epoch": 382} {"train_loss": -33.97046661376953, "global_step": 46326, "epoch": 382} {"train_loss": -33.053741455078125, "global_step": 46327, "epoch": 382} {"train_loss": -33.22251892089844, "global_step": 46328, "epoch": 382} {"train_loss": -34.2000846862793, "global_step": 46329, "epoch": 382} {"train_loss": -33.771400451660156, "global_step": 46330, "epoch": 382} {"train_loss": -33.67427444458008, "global_step": 46331, "epoch": 382} {"train_loss": -33.75771713256836, "global_step": 46332, "epoch": 382} {"train_loss": -33.399349212646484, "global_step": 46333, "epoch": 382} {"train_loss": -34.11922836303711, "global_step": 46334, "epoch": 382} {"train_loss": -33.60091781616211, "global_step": 46335, "epoch": 382} {"train_loss": -33.924251556396484, "global_step": 46336, "epoch": 382} {"train_loss": -33.69063186645508, "global_step": 46337, "epoch": 382} {"train_loss": -32.54254150390625, "global_step": 46338, "epoch": 382} {"train_loss": -32.98467254638672, "global_step": 46339, "epoch": 382} {"train_loss": -33.07661056518555, "global_step": 46340, "epoch": 382} {"train_loss": -34.27656936645508, "global_step": 46341, "epoch": 382} {"train_loss": -32.95497471833032, "global_step": 46342, "epoch": 382, "val_loss": 2576889.0} {"train_loss": -33.91714096069336, "global_step": 46343, "epoch": 383} {"train_loss": -34.53744125366211, "global_step": 46344, "epoch": 383} {"train_loss": -34.28817367553711, "global_step": 46345, "epoch": 383} {"train_loss": -33.638301849365234, "global_step": 46346, "epoch": 383} {"train_loss": -34.44863510131836, "global_step": 46347, "epoch": 383} {"train_loss": -34.07139205932617, "global_step": 46348, "epoch": 383} {"train_loss": -33.28632354736328, "global_step": 46349, "epoch": 383} {"train_loss": -33.96635055541992, "global_step": 46350, "epoch": 383} {"train_loss": -34.2431755065918, "global_step": 46351, "epoch": 383} {"train_loss": -33.62510681152344, "global_step": 46352, "epoch": 383} {"train_loss": -34.44051742553711, "global_step": 46353, "epoch": 383} {"train_loss": -34.47758865356445, "global_step": 46354, "epoch": 383} {"train_loss": -34.23954391479492, "global_step": 46355, "epoch": 383} {"train_loss": -34.63631820678711, "global_step": 46356, "epoch": 383} {"train_loss": -32.982051849365234, "global_step": 46357, "epoch": 383} {"train_loss": -34.3397331237793, "global_step": 46358, "epoch": 383} {"train_loss": -34.90238571166992, "global_step": 46359, "epoch": 383} {"train_loss": -33.72809982299805, "global_step": 46360, "epoch": 383} {"train_loss": -33.46989059448242, "global_step": 46361, "epoch": 383} {"train_loss": -33.539573669433594, "global_step": 46362, "epoch": 383} {"train_loss": -33.76785659790039, "global_step": 46363, "epoch": 383} {"train_loss": -34.401710510253906, "global_step": 46364, "epoch": 383} {"train_loss": -33.84841537475586, "global_step": 46365, "epoch": 383} {"train_loss": -33.88450241088867, "global_step": 46366, "epoch": 383} {"train_loss": -34.32851028442383, "global_step": 46367, "epoch": 383} {"train_loss": -34.1602783203125, "global_step": 46368, "epoch": 383} {"train_loss": -34.19679641723633, "global_step": 46369, "epoch": 383} {"train_loss": -34.273807525634766, "global_step": 46370, "epoch": 383} {"train_loss": -34.2465705871582, "global_step": 46371, "epoch": 383} {"train_loss": -34.75977325439453, "global_step": 46372, "epoch": 383} {"train_loss": -33.840911865234375, "global_step": 46373, "epoch": 383} {"train_loss": -33.2164306640625, "global_step": 46374, "epoch": 383} {"train_loss": -34.40151596069336, "global_step": 46375, "epoch": 383} {"train_loss": -29.78925895690918, "global_step": 46376, "epoch": 383} {"train_loss": -33.83496856689453, "global_step": 46377, "epoch": 383} {"train_loss": -32.487579345703125, "global_step": 46378, "epoch": 383} {"train_loss": -31.463720321655273, "global_step": 46379, "epoch": 383} {"train_loss": -29.4716854095459, "global_step": 46380, "epoch": 383} {"train_loss": -27.494482040405273, "global_step": 46381, "epoch": 383} {"train_loss": -32.45771408081055, "global_step": 46382, "epoch": 383} {"train_loss": -33.871089935302734, "global_step": 46383, "epoch": 383} {"train_loss": -31.772079467773438, "global_step": 46384, "epoch": 383} {"train_loss": -31.46516990661621, "global_step": 46385, "epoch": 383} {"train_loss": -32.8948860168457, "global_step": 46386, "epoch": 383} {"train_loss": -30.420215606689453, "global_step": 46387, "epoch": 383} {"train_loss": -33.86069869995117, "global_step": 46388, "epoch": 383} {"train_loss": -31.817169189453125, "global_step": 46389, "epoch": 383} {"train_loss": -33.019386291503906, "global_step": 46390, "epoch": 383} {"train_loss": -32.136627197265625, "global_step": 46391, "epoch": 383} {"train_loss": -32.41254425048828, "global_step": 46392, "epoch": 383} {"train_loss": -31.613697052001953, "global_step": 46393, "epoch": 383} {"train_loss": -31.5096492767334, "global_step": 46394, "epoch": 383} {"train_loss": -31.840620040893555, "global_step": 46395, "epoch": 383} {"train_loss": -32.776031494140625, "global_step": 46396, "epoch": 383} {"train_loss": -33.17793273925781, "global_step": 46397, "epoch": 383} {"train_loss": -31.834760665893555, "global_step": 46398, "epoch": 383} {"train_loss": -32.7536506652832, "global_step": 46399, "epoch": 383} {"train_loss": -32.92020797729492, "global_step": 46400, "epoch": 383} {"train_loss": -32.903499603271484, "global_step": 46401, "epoch": 383} {"train_loss": -32.95661544799805, "global_step": 46402, "epoch": 383} {"train_loss": -32.7519416809082, "global_step": 46403, "epoch": 383} {"train_loss": -32.742374420166016, "global_step": 46404, "epoch": 383} {"train_loss": -32.84315872192383, "global_step": 46405, "epoch": 383} {"train_loss": -32.58854293823242, "global_step": 46406, "epoch": 383} {"train_loss": -33.50118637084961, "global_step": 46407, "epoch": 383} {"train_loss": -33.357398986816406, "global_step": 46408, "epoch": 383} {"train_loss": -33.206172943115234, "global_step": 46409, "epoch": 383} {"train_loss": -32.9974250793457, "global_step": 46410, "epoch": 383} {"train_loss": -33.06887435913086, "global_step": 46411, "epoch": 383} {"train_loss": -33.581031799316406, "global_step": 46412, "epoch": 383} {"train_loss": -33.81867599487305, "global_step": 46413, "epoch": 383} {"train_loss": -33.80831527709961, "global_step": 46414, "epoch": 383} {"train_loss": -33.2063102722168, "global_step": 46415, "epoch": 383} {"train_loss": -33.316802978515625, "global_step": 46416, "epoch": 383} {"train_loss": -34.010433197021484, "global_step": 46417, "epoch": 383} {"train_loss": -33.90296173095703, "global_step": 46418, "epoch": 383} {"train_loss": -33.512760162353516, "global_step": 46419, "epoch": 383} {"train_loss": -32.733436584472656, "global_step": 46420, "epoch": 383} {"train_loss": -34.14491271972656, "global_step": 46421, "epoch": 383} {"train_loss": -34.06405258178711, "global_step": 46422, "epoch": 383} {"train_loss": -33.97960662841797, "global_step": 46423, "epoch": 383} {"train_loss": -33.98672103881836, "global_step": 46424, "epoch": 383} {"train_loss": -33.58285140991211, "global_step": 46425, "epoch": 383} {"train_loss": -33.5926513671875, "global_step": 46426, "epoch": 383} {"train_loss": -32.925201416015625, "global_step": 46427, "epoch": 383} {"train_loss": -32.83723068237305, "global_step": 46428, "epoch": 383} {"train_loss": -32.8218994140625, "global_step": 46429, "epoch": 383} {"train_loss": -32.40385818481445, "global_step": 46430, "epoch": 383} {"train_loss": -33.20510482788086, "global_step": 46431, "epoch": 383} {"train_loss": -33.87909698486328, "global_step": 46432, "epoch": 383} {"train_loss": -33.3760871887207, "global_step": 46433, "epoch": 383} {"train_loss": -31.373687744140625, "global_step": 46434, "epoch": 383} {"train_loss": -33.0799560546875, "global_step": 46435, "epoch": 383} {"train_loss": -34.10578536987305, "global_step": 46436, "epoch": 383} {"train_loss": -32.56024169921875, "global_step": 46437, "epoch": 383} {"train_loss": -32.14600372314453, "global_step": 46438, "epoch": 383} {"train_loss": -33.5352668762207, "global_step": 46439, "epoch": 383} {"train_loss": -31.511505126953125, "global_step": 46440, "epoch": 383} {"train_loss": -33.218257904052734, "global_step": 46441, "epoch": 383} {"train_loss": -33.731475830078125, "global_step": 46442, "epoch": 383} {"train_loss": -33.52361297607422, "global_step": 46443, "epoch": 383} {"train_loss": -34.005531311035156, "global_step": 46444, "epoch": 383} {"train_loss": -33.715309143066406, "global_step": 46445, "epoch": 383} {"train_loss": -34.10327911376953, "global_step": 46446, "epoch": 383} {"train_loss": -33.00398635864258, "global_step": 46447, "epoch": 383} {"train_loss": -34.374481201171875, "global_step": 46448, "epoch": 383} {"train_loss": -34.05292510986328, "global_step": 46449, "epoch": 383} {"train_loss": -34.767059326171875, "global_step": 46450, "epoch": 383} {"train_loss": -34.340301513671875, "global_step": 46451, "epoch": 383} {"train_loss": -34.46616744995117, "global_step": 46452, "epoch": 383} {"train_loss": -34.39216995239258, "global_step": 46453, "epoch": 383} {"train_loss": -34.55841064453125, "global_step": 46454, "epoch": 383} {"train_loss": -34.60810852050781, "global_step": 46455, "epoch": 383} {"train_loss": -34.84234619140625, "global_step": 46456, "epoch": 383} {"train_loss": -34.977195739746094, "global_step": 46457, "epoch": 383} {"train_loss": -34.57773971557617, "global_step": 46458, "epoch": 383} {"train_loss": -35.11369323730469, "global_step": 46459, "epoch": 383} {"train_loss": -34.77162551879883, "global_step": 46460, "epoch": 383} {"train_loss": -34.37568664550781, "global_step": 46461, "epoch": 383} {"train_loss": -35.09919357299805, "global_step": 46462, "epoch": 383} {"train_loss": -33.395367047018254, "global_step": 46463, "epoch": 383, "val_loss": 2606620.0} {"train_loss": -35.08181381225586, "global_step": 46464, "epoch": 384} {"train_loss": -34.77595138549805, "global_step": 46465, "epoch": 384} {"train_loss": -34.87844467163086, "global_step": 46466, "epoch": 384} {"train_loss": -35.371829986572266, "global_step": 46467, "epoch": 384} {"train_loss": -34.97895431518555, "global_step": 46468, "epoch": 384} {"train_loss": -35.51543045043945, "global_step": 46469, "epoch": 384} {"train_loss": -34.381744384765625, "global_step": 46470, "epoch": 384} {"train_loss": -32.15506362915039, "global_step": 46471, "epoch": 384} {"train_loss": -30.646520614624023, "global_step": 46472, "epoch": 384} {"train_loss": -35.041770935058594, "global_step": 46473, "epoch": 384} {"train_loss": -31.35980796813965, "global_step": 46474, "epoch": 384} {"train_loss": -34.128841400146484, "global_step": 46475, "epoch": 384} {"train_loss": -31.410085678100586, "global_step": 46476, "epoch": 384} {"train_loss": -35.23673629760742, "global_step": 46477, "epoch": 384} {"train_loss": -32.67765426635742, "global_step": 46478, "epoch": 384} {"train_loss": -34.44318389892578, "global_step": 46479, "epoch": 384} {"train_loss": -34.46324157714844, "global_step": 46480, "epoch": 384} {"train_loss": -33.06101608276367, "global_step": 46481, "epoch": 384} {"train_loss": -33.82135772705078, "global_step": 46482, "epoch": 384} {"train_loss": -35.5478401184082, "global_step": 46483, "epoch": 384} {"train_loss": -33.778202056884766, "global_step": 46484, "epoch": 384} {"train_loss": -33.93436813354492, "global_step": 46485, "epoch": 384} {"train_loss": -32.61008834838867, "global_step": 46486, "epoch": 384} {"train_loss": -31.634008407592773, "global_step": 46487, "epoch": 384} {"train_loss": -31.837127685546875, "global_step": 46488, "epoch": 384} {"train_loss": -30.46087646484375, "global_step": 46489, "epoch": 384} {"train_loss": -31.967626571655273, "global_step": 46490, "epoch": 384} {"train_loss": -33.59547805786133, "global_step": 46491, "epoch": 384} {"train_loss": -33.90253448486328, "global_step": 46492, "epoch": 384} {"train_loss": -32.368072509765625, "global_step": 46493, "epoch": 384} {"train_loss": -32.9191780090332, "global_step": 46494, "epoch": 384} {"train_loss": -34.12222671508789, "global_step": 46495, "epoch": 384} {"train_loss": -32.53866958618164, "global_step": 46496, "epoch": 384} {"train_loss": -33.482601165771484, "global_step": 46497, "epoch": 384} {"train_loss": -34.46095275878906, "global_step": 46498, "epoch": 384} {"train_loss": -33.52900695800781, "global_step": 46499, "epoch": 384} {"train_loss": -33.977352142333984, "global_step": 46500, "epoch": 384} {"train_loss": -32.50909423828125, "global_step": 46501, "epoch": 384} {"train_loss": -33.9420280456543, "global_step": 46502, "epoch": 384} {"train_loss": -33.74934768676758, "global_step": 46503, "epoch": 384} {"train_loss": -34.91815948486328, "global_step": 46504, "epoch": 384} {"train_loss": -33.122074127197266, "global_step": 46505, "epoch": 384} {"train_loss": -34.0398063659668, "global_step": 46506, "epoch": 384} {"train_loss": -34.29691696166992, "global_step": 46507, "epoch": 384} {"train_loss": -33.5316276550293, "global_step": 46508, "epoch": 384} {"train_loss": -34.175418853759766, "global_step": 46509, "epoch": 384} {"train_loss": -34.09955596923828, "global_step": 46510, "epoch": 384} {"train_loss": -33.971656799316406, "global_step": 46511, "epoch": 384} {"train_loss": -33.757625579833984, "global_step": 46512, "epoch": 384} {"train_loss": -34.003108978271484, "global_step": 46513, "epoch": 384} {"train_loss": -33.79035568237305, "global_step": 46514, "epoch": 384} {"train_loss": -34.18620681762695, "global_step": 46515, "epoch": 384} {"train_loss": -34.361732482910156, "global_step": 46516, "epoch": 384} {"train_loss": -34.57474136352539, "global_step": 46517, "epoch": 384} {"train_loss": -33.91080856323242, "global_step": 46518, "epoch": 384} {"train_loss": -34.051448822021484, "global_step": 46519, "epoch": 384} {"train_loss": -35.047176361083984, "global_step": 46520, "epoch": 384} {"train_loss": -34.216434478759766, "global_step": 46521, "epoch": 384} {"train_loss": -34.23868179321289, "global_step": 46522, "epoch": 384} {"train_loss": -34.934814453125, "global_step": 46523, "epoch": 384} {"train_loss": -34.182960510253906, "global_step": 46524, "epoch": 384} {"train_loss": -34.609832763671875, "global_step": 46525, "epoch": 384} {"train_loss": -34.9059944152832, "global_step": 46526, "epoch": 384} {"train_loss": -34.09463119506836, "global_step": 46527, "epoch": 384} {"train_loss": -34.501220703125, "global_step": 46528, "epoch": 384} {"train_loss": -35.11995315551758, "global_step": 46529, "epoch": 384} {"train_loss": -35.12568283081055, "global_step": 46530, "epoch": 384} {"train_loss": -34.90132522583008, "global_step": 46531, "epoch": 384} {"train_loss": -34.800899505615234, "global_step": 46532, "epoch": 384} {"train_loss": -35.02538299560547, "global_step": 46533, "epoch": 384} {"train_loss": -35.23136520385742, "global_step": 46534, "epoch": 384} {"train_loss": -34.7235221862793, "global_step": 46535, "epoch": 384} {"train_loss": -35.0352668762207, "global_step": 46536, "epoch": 384} {"train_loss": -35.24784851074219, "global_step": 46537, "epoch": 384} {"train_loss": -34.98174285888672, "global_step": 46538, "epoch": 384} {"train_loss": -35.649078369140625, "global_step": 46539, "epoch": 384} {"train_loss": -34.96493911743164, "global_step": 46540, "epoch": 384} {"train_loss": -34.36003875732422, "global_step": 46541, "epoch": 384} {"train_loss": -35.215816497802734, "global_step": 46542, "epoch": 384} {"train_loss": -35.010955810546875, "global_step": 46543, "epoch": 384} {"train_loss": -34.9710578918457, "global_step": 46544, "epoch": 384} {"train_loss": -35.205474853515625, "global_step": 46545, "epoch": 384} {"train_loss": -35.566558837890625, "global_step": 46546, "epoch": 384} {"train_loss": -35.29060745239258, "global_step": 46547, "epoch": 384} {"train_loss": -35.28963088989258, "global_step": 46548, "epoch": 384} {"train_loss": -35.4907112121582, "global_step": 46549, "epoch": 384} {"train_loss": -35.124839782714844, "global_step": 46550, "epoch": 384} {"train_loss": -35.54926681518555, "global_step": 46551, "epoch": 384} {"train_loss": -34.90690231323242, "global_step": 46552, "epoch": 384} {"train_loss": -35.10763168334961, "global_step": 46553, "epoch": 384} {"train_loss": -35.588661193847656, "global_step": 46554, "epoch": 384} {"train_loss": -34.67861557006836, "global_step": 46555, "epoch": 384} {"train_loss": -33.435428619384766, "global_step": 46556, "epoch": 384} {"train_loss": -27.942102432250977, "global_step": 46557, "epoch": 384} {"train_loss": -6.203216075897217, "global_step": 46558, "epoch": 384} {"train_loss": 20.664316177368164, "global_step": 46559, "epoch": 384} {"train_loss": -7.4403228759765625, "global_step": 46560, "epoch": 384} {"train_loss": -16.247888565063477, "global_step": 46561, "epoch": 384} {"train_loss": -15.130459785461426, "global_step": 46562, "epoch": 384} {"train_loss": -23.245969772338867, "global_step": 46563, "epoch": 384} {"train_loss": -26.474945068359375, "global_step": 46564, "epoch": 384} {"train_loss": -20.515941619873047, "global_step": 46565, "epoch": 384} {"train_loss": -27.449193954467773, "global_step": 46566, "epoch": 384} {"train_loss": -30.123798370361328, "global_step": 46567, "epoch": 384} {"train_loss": -29.789810180664062, "global_step": 46568, "epoch": 384} {"train_loss": -28.397354125976562, "global_step": 46569, "epoch": 384} {"train_loss": -27.81292152404785, "global_step": 46570, "epoch": 384} {"train_loss": -32.066036224365234, "global_step": 46571, "epoch": 384} {"train_loss": -30.5030574798584, "global_step": 46572, "epoch": 384} {"train_loss": -31.9284725189209, "global_step": 46573, "epoch": 384} {"train_loss": -31.144826889038086, "global_step": 46574, "epoch": 384} {"train_loss": -28.92091178894043, "global_step": 46575, "epoch": 384} {"train_loss": -30.303241729736328, "global_step": 46576, "epoch": 384} {"train_loss": -31.90167808532715, "global_step": 46577, "epoch": 384} {"train_loss": -32.473323822021484, "global_step": 46578, "epoch": 384} {"train_loss": -32.43061447143555, "global_step": 46579, "epoch": 384} {"train_loss": -32.52545928955078, "global_step": 46580, "epoch": 384} {"train_loss": -32.15033721923828, "global_step": 46581, "epoch": 384} {"train_loss": -32.382598876953125, "global_step": 46582, "epoch": 384} {"train_loss": -32.265010833740234, "global_step": 46583, "epoch": 384} {"train_loss": -32.1229733908472, "global_step": 46584, "epoch": 384, "val_loss": 2667782.75} {"train_loss": -32.84855270385742, "global_step": 46585, "epoch": 385} {"train_loss": -32.77091598510742, "global_step": 46586, "epoch": 385} {"train_loss": -33.10456466674805, "global_step": 46587, "epoch": 385} {"train_loss": -33.14201736450195, "global_step": 46588, "epoch": 385} {"train_loss": -33.12374496459961, "global_step": 46589, "epoch": 385} {"train_loss": -32.33349609375, "global_step": 46590, "epoch": 385} {"train_loss": -33.219635009765625, "global_step": 46591, "epoch": 385} {"train_loss": -32.80591583251953, "global_step": 46592, "epoch": 385} {"train_loss": -32.90684509277344, "global_step": 46593, "epoch": 385} {"train_loss": -32.91016387939453, "global_step": 46594, "epoch": 385} {"train_loss": -33.07230758666992, "global_step": 46595, "epoch": 385} {"train_loss": -33.1485481262207, "global_step": 46596, "epoch": 385} {"train_loss": -32.90827560424805, "global_step": 46597, "epoch": 385} {"train_loss": -33.46397018432617, "global_step": 46598, "epoch": 385} {"train_loss": -33.26642990112305, "global_step": 46599, "epoch": 385} {"train_loss": -33.431610107421875, "global_step": 46600, "epoch": 385} {"train_loss": -33.203182220458984, "global_step": 46601, "epoch": 385} {"train_loss": -33.46575164794922, "global_step": 46602, "epoch": 385} {"train_loss": -33.60744857788086, "global_step": 46603, "epoch": 385} {"train_loss": -33.78507995605469, "global_step": 46604, "epoch": 385} {"train_loss": -33.6150016784668, "global_step": 46605, "epoch": 385} {"train_loss": -33.685970306396484, "global_step": 46606, "epoch": 385} {"train_loss": -33.910194396972656, "global_step": 46607, "epoch": 385} {"train_loss": -33.919063568115234, "global_step": 46608, "epoch": 385} {"train_loss": -33.8406982421875, "global_step": 46609, "epoch": 385} {"train_loss": -34.05582809448242, "global_step": 46610, "epoch": 385} {"train_loss": -33.81531524658203, "global_step": 46611, "epoch": 385} {"train_loss": -33.834468841552734, "global_step": 46612, "epoch": 385} {"train_loss": -34.29407501220703, "global_step": 46613, "epoch": 385} {"train_loss": -34.21773910522461, "global_step": 46614, "epoch": 385} {"train_loss": -34.32979202270508, "global_step": 46615, "epoch": 385} {"train_loss": -34.3162841796875, "global_step": 46616, "epoch": 385} {"train_loss": -34.684871673583984, "global_step": 46617, "epoch": 385} {"train_loss": -34.32064437866211, "global_step": 46618, "epoch": 385} {"train_loss": -34.54185104370117, "global_step": 46619, "epoch": 385} {"train_loss": -34.6183967590332, "global_step": 46620, "epoch": 385} {"train_loss": -33.36491775512695, "global_step": 46621, "epoch": 385} {"train_loss": -34.39588928222656, "global_step": 46622, "epoch": 385} {"train_loss": -34.5971794128418, "global_step": 46623, "epoch": 385} {"train_loss": -34.336673736572266, "global_step": 46624, "epoch": 385} {"train_loss": -34.379486083984375, "global_step": 46625, "epoch": 385} {"train_loss": -34.8046989440918, "global_step": 46626, "epoch": 385} {"train_loss": -34.47607421875, "global_step": 46627, "epoch": 385} {"train_loss": -34.621063232421875, "global_step": 46628, "epoch": 385} {"train_loss": -34.150108337402344, "global_step": 46629, "epoch": 385} {"train_loss": -34.305908203125, "global_step": 46630, "epoch": 385} {"train_loss": -34.912227630615234, "global_step": 46631, "epoch": 385} {"train_loss": -34.60978317260742, "global_step": 46632, "epoch": 385} {"train_loss": -34.5205192565918, "global_step": 46633, "epoch": 385} {"train_loss": -34.36988830566406, "global_step": 46634, "epoch": 385} {"train_loss": -32.8211784362793, "global_step": 46635, "epoch": 385} {"train_loss": -33.64664840698242, "global_step": 46636, "epoch": 385} {"train_loss": -33.14968490600586, "global_step": 46637, "epoch": 385} {"train_loss": -29.8986873626709, "global_step": 46638, "epoch": 385} {"train_loss": -31.00492286682129, "global_step": 46639, "epoch": 385} {"train_loss": -30.651594161987305, "global_step": 46640, "epoch": 385} {"train_loss": -28.924829483032227, "global_step": 46641, "epoch": 385} {"train_loss": -33.683773040771484, "global_step": 46642, "epoch": 385} {"train_loss": -32.10788345336914, "global_step": 46643, "epoch": 385} {"train_loss": -32.626399993896484, "global_step": 46644, "epoch": 385} {"train_loss": -32.58086013793945, "global_step": 46645, "epoch": 385} {"train_loss": -31.99086570739746, "global_step": 46646, "epoch": 385} {"train_loss": -33.400970458984375, "global_step": 46647, "epoch": 385} {"train_loss": -33.78310775756836, "global_step": 46648, "epoch": 385} {"train_loss": -32.2170295715332, "global_step": 46649, "epoch": 385} {"train_loss": -33.89667892456055, "global_step": 46650, "epoch": 385} {"train_loss": -33.650726318359375, "global_step": 46651, "epoch": 385} {"train_loss": -32.632564544677734, "global_step": 46652, "epoch": 385} {"train_loss": -33.42681121826172, "global_step": 46653, "epoch": 385} {"train_loss": -33.97301483154297, "global_step": 46654, "epoch": 385} {"train_loss": -32.5198860168457, "global_step": 46655, "epoch": 385} {"train_loss": -33.03622055053711, "global_step": 46656, "epoch": 385} {"train_loss": -33.832149505615234, "global_step": 46657, "epoch": 385} {"train_loss": -34.01874542236328, "global_step": 46658, "epoch": 385} {"train_loss": -32.419795989990234, "global_step": 46659, "epoch": 385} {"train_loss": -33.75928497314453, "global_step": 46660, "epoch": 385} {"train_loss": -33.343746185302734, "global_step": 46661, "epoch": 385} {"train_loss": -33.6177864074707, "global_step": 46662, "epoch": 385} {"train_loss": -33.34408187866211, "global_step": 46663, "epoch": 385} {"train_loss": -33.18386459350586, "global_step": 46664, "epoch": 385} {"train_loss": -33.51325225830078, "global_step": 46665, "epoch": 385} {"train_loss": -33.15602493286133, "global_step": 46666, "epoch": 385} {"train_loss": -33.022422790527344, "global_step": 46667, "epoch": 385} {"train_loss": -33.51963424682617, "global_step": 46668, "epoch": 385} {"train_loss": -34.215755462646484, "global_step": 46669, "epoch": 385} {"train_loss": -33.592262268066406, "global_step": 46670, "epoch": 385} {"train_loss": -33.49949645996094, "global_step": 46671, "epoch": 385} {"train_loss": -32.790504455566406, "global_step": 46672, "epoch": 385} {"train_loss": -34.27240753173828, "global_step": 46673, "epoch": 385} {"train_loss": -32.76985168457031, "global_step": 46674, "epoch": 385} {"train_loss": -32.3416748046875, "global_step": 46675, "epoch": 385} {"train_loss": -33.2491569519043, "global_step": 46676, "epoch": 385} {"train_loss": -34.11879348754883, "global_step": 46677, "epoch": 385} {"train_loss": -34.1146240234375, "global_step": 46678, "epoch": 385} {"train_loss": -33.4528923034668, "global_step": 46679, "epoch": 385} {"train_loss": -34.245235443115234, "global_step": 46680, "epoch": 385} {"train_loss": -33.8784065246582, "global_step": 46681, "epoch": 385} {"train_loss": -33.970367431640625, "global_step": 46682, "epoch": 385} {"train_loss": -34.463680267333984, "global_step": 46683, "epoch": 385} {"train_loss": -34.240478515625, "global_step": 46684, "epoch": 385} {"train_loss": -33.947601318359375, "global_step": 46685, "epoch": 385} {"train_loss": -34.22746658325195, "global_step": 46686, "epoch": 385} {"train_loss": -33.5465202331543, "global_step": 46687, "epoch": 385} {"train_loss": -34.30056381225586, "global_step": 46688, "epoch": 385} {"train_loss": -33.65397262573242, "global_step": 46689, "epoch": 385} {"train_loss": -33.52536392211914, "global_step": 46690, "epoch": 385} {"train_loss": -33.66266632080078, "global_step": 46691, "epoch": 385} {"train_loss": -34.414791107177734, "global_step": 46692, "epoch": 385} {"train_loss": -34.16473388671875, "global_step": 46693, "epoch": 385} {"train_loss": -34.41096115112305, "global_step": 46694, "epoch": 385} {"train_loss": -34.61428451538086, "global_step": 46695, "epoch": 385} {"train_loss": -34.16360092163086, "global_step": 46696, "epoch": 385} {"train_loss": -34.41748046875, "global_step": 46697, "epoch": 385} {"train_loss": -34.493526458740234, "global_step": 46698, "epoch": 385} {"train_loss": -34.5759391784668, "global_step": 46699, "epoch": 385} {"train_loss": -34.78993606567383, "global_step": 46700, "epoch": 385} {"train_loss": -34.15447998046875, "global_step": 46701, "epoch": 385} {"train_loss": -34.492286682128906, "global_step": 46702, "epoch": 385} {"train_loss": -34.65653610229492, "global_step": 46703, "epoch": 385} {"train_loss": -34.76408004760742, "global_step": 46704, "epoch": 385} {"train_loss": -33.59689342088936, "global_step": 46705, "epoch": 385, "val_loss": 2634491.75} {"train_loss": -33.68391799926758, "global_step": 46706, "epoch": 386} {"train_loss": -34.90168380737305, "global_step": 46707, "epoch": 386} {"train_loss": -34.232177734375, "global_step": 46708, "epoch": 386} {"train_loss": -34.349063873291016, "global_step": 46709, "epoch": 386} {"train_loss": -33.54655075073242, "global_step": 46710, "epoch": 386} {"train_loss": -34.69977951049805, "global_step": 46711, "epoch": 386} {"train_loss": -34.36814498901367, "global_step": 46712, "epoch": 386} {"train_loss": -34.8333625793457, "global_step": 46713, "epoch": 386} {"train_loss": -34.58230209350586, "global_step": 46714, "epoch": 386} {"train_loss": -34.002071380615234, "global_step": 46715, "epoch": 386} {"train_loss": -34.563995361328125, "global_step": 46716, "epoch": 386} {"train_loss": -34.7699089050293, "global_step": 46717, "epoch": 386} {"train_loss": -34.31742477416992, "global_step": 46718, "epoch": 386} {"train_loss": -34.171417236328125, "global_step": 46719, "epoch": 386} {"train_loss": -34.116798400878906, "global_step": 46720, "epoch": 386} {"train_loss": -33.12003707885742, "global_step": 46721, "epoch": 386} {"train_loss": -34.64216613769531, "global_step": 46722, "epoch": 386} {"train_loss": -33.79887008666992, "global_step": 46723, "epoch": 386} {"train_loss": -33.68728256225586, "global_step": 46724, "epoch": 386} {"train_loss": -34.26658630371094, "global_step": 46725, "epoch": 386} {"train_loss": -34.163021087646484, "global_step": 46726, "epoch": 386} {"train_loss": -30.55262565612793, "global_step": 46727, "epoch": 386} {"train_loss": -29.07281494140625, "global_step": 46728, "epoch": 386} {"train_loss": -24.37034034729004, "global_step": 46729, "epoch": 386} {"train_loss": -20.376901626586914, "global_step": 46730, "epoch": 386} {"train_loss": -11.314610481262207, "global_step": 46731, "epoch": 386} {"train_loss": -14.572253227233887, "global_step": 46732, "epoch": 386} {"train_loss": -31.45014762878418, "global_step": 46733, "epoch": 386} {"train_loss": -24.994556427001953, "global_step": 46734, "epoch": 386} {"train_loss": -32.0760612487793, "global_step": 46735, "epoch": 386} {"train_loss": -29.3354549407959, "global_step": 46736, "epoch": 386} {"train_loss": -33.2314338684082, "global_step": 46737, "epoch": 386} {"train_loss": -29.034381866455078, "global_step": 46738, "epoch": 386} {"train_loss": -31.43937110900879, "global_step": 46739, "epoch": 386} {"train_loss": -31.787073135375977, "global_step": 46740, "epoch": 386} {"train_loss": -31.41468620300293, "global_step": 46741, "epoch": 386} {"train_loss": -32.58256912231445, "global_step": 46742, "epoch": 386} {"train_loss": -33.18403244018555, "global_step": 46743, "epoch": 386} {"train_loss": -32.47705841064453, "global_step": 46744, "epoch": 386} {"train_loss": -32.055999755859375, "global_step": 46745, "epoch": 386} {"train_loss": -32.75080108642578, "global_step": 46746, "epoch": 386} {"train_loss": -32.837703704833984, "global_step": 46747, "epoch": 386} {"train_loss": -32.77809524536133, "global_step": 46748, "epoch": 386} {"train_loss": -32.99502182006836, "global_step": 46749, "epoch": 386} {"train_loss": -33.15378952026367, "global_step": 46750, "epoch": 386} {"train_loss": -32.8158073425293, "global_step": 46751, "epoch": 386} {"train_loss": -33.35913848876953, "global_step": 46752, "epoch": 386} {"train_loss": -32.43952178955078, "global_step": 46753, "epoch": 386} {"train_loss": -32.93613815307617, "global_step": 46754, "epoch": 386} {"train_loss": -32.764495849609375, "global_step": 46755, "epoch": 386} {"train_loss": -33.45724105834961, "global_step": 46756, "epoch": 386} {"train_loss": -33.35600662231445, "global_step": 46757, "epoch": 386} {"train_loss": -33.16318893432617, "global_step": 46758, "epoch": 386} {"train_loss": -33.182369232177734, "global_step": 46759, "epoch": 386} {"train_loss": -32.4421501159668, "global_step": 46760, "epoch": 386} {"train_loss": -33.218849182128906, "global_step": 46761, "epoch": 386} {"train_loss": -33.59564971923828, "global_step": 46762, "epoch": 386} {"train_loss": -33.13007736206055, "global_step": 46763, "epoch": 386} {"train_loss": -32.950801849365234, "global_step": 46764, "epoch": 386} {"train_loss": -33.433258056640625, "global_step": 46765, "epoch": 386} {"train_loss": -33.19808578491211, "global_step": 46766, "epoch": 386} {"train_loss": -32.530120849609375, "global_step": 46767, "epoch": 386} {"train_loss": -33.86469650268555, "global_step": 46768, "epoch": 386} {"train_loss": -33.947052001953125, "global_step": 46769, "epoch": 386} {"train_loss": -33.326454162597656, "global_step": 46770, "epoch": 386} {"train_loss": -34.032222747802734, "global_step": 46771, "epoch": 386} {"train_loss": -32.72614669799805, "global_step": 46772, "epoch": 386} {"train_loss": -33.59024429321289, "global_step": 46773, "epoch": 386} {"train_loss": -33.846336364746094, "global_step": 46774, "epoch": 386} {"train_loss": -34.1740837097168, "global_step": 46775, "epoch": 386} {"train_loss": -33.83230972290039, "global_step": 46776, "epoch": 386} {"train_loss": -34.23385238647461, "global_step": 46777, "epoch": 386} {"train_loss": -34.28440856933594, "global_step": 46778, "epoch": 386} {"train_loss": -34.13624954223633, "global_step": 46779, "epoch": 386} {"train_loss": -33.96113204956055, "global_step": 46780, "epoch": 386} {"train_loss": -34.24821090698242, "global_step": 46781, "epoch": 386} {"train_loss": -33.53829574584961, "global_step": 46782, "epoch": 386} {"train_loss": -33.83061599731445, "global_step": 46783, "epoch": 386} {"train_loss": -34.2177734375, "global_step": 46784, "epoch": 386} {"train_loss": -34.288185119628906, "global_step": 46785, "epoch": 386} {"train_loss": -34.24245834350586, "global_step": 46786, "epoch": 386} {"train_loss": -34.33749008178711, "global_step": 46787, "epoch": 386} {"train_loss": -34.39760208129883, "global_step": 46788, "epoch": 386} {"train_loss": -34.040252685546875, "global_step": 46789, "epoch": 386} {"train_loss": -34.360740661621094, "global_step": 46790, "epoch": 386} {"train_loss": -34.02830123901367, "global_step": 46791, "epoch": 386} {"train_loss": -34.55532455444336, "global_step": 46792, "epoch": 386} {"train_loss": -33.326416015625, "global_step": 46793, "epoch": 386} {"train_loss": -34.17449951171875, "global_step": 46794, "epoch": 386} {"train_loss": -34.299354553222656, "global_step": 46795, "epoch": 386} {"train_loss": -34.3936767578125, "global_step": 46796, "epoch": 386} {"train_loss": -34.97291564941406, "global_step": 46797, "epoch": 386} {"train_loss": -34.29448318481445, "global_step": 46798, "epoch": 386} {"train_loss": -34.43477249145508, "global_step": 46799, "epoch": 386} {"train_loss": -34.16189193725586, "global_step": 46800, "epoch": 386} {"train_loss": -34.48815155029297, "global_step": 46801, "epoch": 386} {"train_loss": -35.0197868347168, "global_step": 46802, "epoch": 386} {"train_loss": -34.60619354248047, "global_step": 46803, "epoch": 386} {"train_loss": -34.594398498535156, "global_step": 46804, "epoch": 386} {"train_loss": -34.698909759521484, "global_step": 46805, "epoch": 386} {"train_loss": -34.040924072265625, "global_step": 46806, "epoch": 386} {"train_loss": -34.496604919433594, "global_step": 46807, "epoch": 386} {"train_loss": -35.27821350097656, "global_step": 46808, "epoch": 386} {"train_loss": -34.77613067626953, "global_step": 46809, "epoch": 386} {"train_loss": -33.764076232910156, "global_step": 46810, "epoch": 386} {"train_loss": -33.37649154663086, "global_step": 46811, "epoch": 386} {"train_loss": -34.66178894042969, "global_step": 46812, "epoch": 386} {"train_loss": -32.237281799316406, "global_step": 46813, "epoch": 386} {"train_loss": -34.149471282958984, "global_step": 46814, "epoch": 386} {"train_loss": -33.539649963378906, "global_step": 46815, "epoch": 386} {"train_loss": -34.18292236328125, "global_step": 46816, "epoch": 386} {"train_loss": -33.079708099365234, "global_step": 46817, "epoch": 386} {"train_loss": -33.759559631347656, "global_step": 46818, "epoch": 386} {"train_loss": -33.45725631713867, "global_step": 46819, "epoch": 386} {"train_loss": -32.983192443847656, "global_step": 46820, "epoch": 386} {"train_loss": -34.74163818359375, "global_step": 46821, "epoch": 386} {"train_loss": -33.37721252441406, "global_step": 46822, "epoch": 386} {"train_loss": -33.85498046875, "global_step": 46823, "epoch": 386} {"train_loss": -34.14174270629883, "global_step": 46824, "epoch": 386} {"train_loss": -33.88255310058594, "global_step": 46825, "epoch": 386} {"train_loss": -32.97372278891319, "global_step": 46826, "epoch": 386, "val_loss": 2568545.25} {"train_loss": -33.79664611816406, "global_step": 46827, "epoch": 387} {"train_loss": -33.968170166015625, "global_step": 46828, "epoch": 387} {"train_loss": -33.91395950317383, "global_step": 46829, "epoch": 387} {"train_loss": -34.440120697021484, "global_step": 46830, "epoch": 387} {"train_loss": -33.898277282714844, "global_step": 46831, "epoch": 387} {"train_loss": -34.3360481262207, "global_step": 46832, "epoch": 387} {"train_loss": -33.54218673706055, "global_step": 46833, "epoch": 387} {"train_loss": -31.74036979675293, "global_step": 46834, "epoch": 387} {"train_loss": -31.945959091186523, "global_step": 46835, "epoch": 387} {"train_loss": -33.075469970703125, "global_step": 46836, "epoch": 387} {"train_loss": -33.038326263427734, "global_step": 46837, "epoch": 387} {"train_loss": -32.92670440673828, "global_step": 46838, "epoch": 387} {"train_loss": -33.72529983520508, "global_step": 46839, "epoch": 387} {"train_loss": -32.93855667114258, "global_step": 46840, "epoch": 387} {"train_loss": -33.157833099365234, "global_step": 46841, "epoch": 387} {"train_loss": -33.940773010253906, "global_step": 46842, "epoch": 387} {"train_loss": -31.566802978515625, "global_step": 46843, "epoch": 387} {"train_loss": -33.062679290771484, "global_step": 46844, "epoch": 387} {"train_loss": -33.66712188720703, "global_step": 46845, "epoch": 387} {"train_loss": -34.050758361816406, "global_step": 46846, "epoch": 387} {"train_loss": -33.60427474975586, "global_step": 46847, "epoch": 387} {"train_loss": -33.31970977783203, "global_step": 46848, "epoch": 387} {"train_loss": -33.97914505004883, "global_step": 46849, "epoch": 387} {"train_loss": -34.01731872558594, "global_step": 46850, "epoch": 387} {"train_loss": -32.71577835083008, "global_step": 46851, "epoch": 387} {"train_loss": -34.43130874633789, "global_step": 46852, "epoch": 387} {"train_loss": -33.12565231323242, "global_step": 46853, "epoch": 387} {"train_loss": -34.3226318359375, "global_step": 46854, "epoch": 387} {"train_loss": -33.3121452331543, "global_step": 46855, "epoch": 387} {"train_loss": -34.003944396972656, "global_step": 46856, "epoch": 387} {"train_loss": -33.602970123291016, "global_step": 46857, "epoch": 387} {"train_loss": -34.381996154785156, "global_step": 46858, "epoch": 387} {"train_loss": -33.9279670715332, "global_step": 46859, "epoch": 387} {"train_loss": -34.0135498046875, "global_step": 46860, "epoch": 387} {"train_loss": -34.029945373535156, "global_step": 46861, "epoch": 387} {"train_loss": -33.40883255004883, "global_step": 46862, "epoch": 387} {"train_loss": -33.7765007019043, "global_step": 46863, "epoch": 387} {"train_loss": -34.04133224487305, "global_step": 46864, "epoch": 387} {"train_loss": -34.54451370239258, "global_step": 46865, "epoch": 387} {"train_loss": -34.75714874267578, "global_step": 46866, "epoch": 387} {"train_loss": -33.82390213012695, "global_step": 46867, "epoch": 387} {"train_loss": -34.34138107299805, "global_step": 46868, "epoch": 387} {"train_loss": -34.73850631713867, "global_step": 46869, "epoch": 387} {"train_loss": -34.36247253417969, "global_step": 46870, "epoch": 387} {"train_loss": -34.08662033081055, "global_step": 46871, "epoch": 387} {"train_loss": -33.966487884521484, "global_step": 46872, "epoch": 387} {"train_loss": -32.53893280029297, "global_step": 46873, "epoch": 387} {"train_loss": -31.07131004333496, "global_step": 46874, "epoch": 387} {"train_loss": -27.104068756103516, "global_step": 46875, "epoch": 387} {"train_loss": -20.18459129333496, "global_step": 46876, "epoch": 387} {"train_loss": -20.341596603393555, "global_step": 46877, "epoch": 387} {"train_loss": -34.5337028503418, "global_step": 46878, "epoch": 387} {"train_loss": -26.14544105529785, "global_step": 46879, "epoch": 387} {"train_loss": -31.3359375, "global_step": 46880, "epoch": 387} {"train_loss": -31.154752731323242, "global_step": 46881, "epoch": 387} {"train_loss": -33.18282699584961, "global_step": 46882, "epoch": 387} {"train_loss": -30.868589401245117, "global_step": 46883, "epoch": 387} {"train_loss": -34.118553161621094, "global_step": 46884, "epoch": 387} {"train_loss": -31.21857261657715, "global_step": 46885, "epoch": 387} {"train_loss": -34.11507797241211, "global_step": 46886, "epoch": 387} {"train_loss": -33.65180969238281, "global_step": 46887, "epoch": 387} {"train_loss": -32.064552307128906, "global_step": 46888, "epoch": 387} {"train_loss": -34.24517059326172, "global_step": 46889, "epoch": 387} {"train_loss": -32.43243408203125, "global_step": 46890, "epoch": 387} {"train_loss": -33.70744323730469, "global_step": 46891, "epoch": 387} {"train_loss": -33.76536560058594, "global_step": 46892, "epoch": 387} {"train_loss": -33.81831359863281, "global_step": 46893, "epoch": 387} {"train_loss": -33.88685607910156, "global_step": 46894, "epoch": 387} {"train_loss": -33.563846588134766, "global_step": 46895, "epoch": 387} {"train_loss": -34.472225189208984, "global_step": 46896, "epoch": 387} {"train_loss": -34.232051849365234, "global_step": 46897, "epoch": 387} {"train_loss": -34.3017692565918, "global_step": 46898, "epoch": 387} {"train_loss": -34.72654342651367, "global_step": 46899, "epoch": 387} {"train_loss": -34.43687438964844, "global_step": 46900, "epoch": 387} {"train_loss": -34.0767707824707, "global_step": 46901, "epoch": 387} {"train_loss": -34.43790817260742, "global_step": 46902, "epoch": 387} {"train_loss": -34.76066207885742, "global_step": 46903, "epoch": 387} {"train_loss": -34.506195068359375, "global_step": 46904, "epoch": 387} {"train_loss": -34.61941146850586, "global_step": 46905, "epoch": 387} {"train_loss": -34.77456283569336, "global_step": 46906, "epoch": 387} {"train_loss": -34.79970932006836, "global_step": 46907, "epoch": 387} {"train_loss": -34.716068267822266, "global_step": 46908, "epoch": 387} {"train_loss": -34.82894515991211, "global_step": 46909, "epoch": 387} {"train_loss": -34.6446533203125, "global_step": 46910, "epoch": 387} {"train_loss": -34.75679397583008, "global_step": 46911, "epoch": 387} {"train_loss": -34.93040466308594, "global_step": 46912, "epoch": 387} {"train_loss": -35.26723861694336, "global_step": 46913, "epoch": 387} {"train_loss": -35.14917755126953, "global_step": 46914, "epoch": 387} {"train_loss": -34.77802276611328, "global_step": 46915, "epoch": 387} {"train_loss": -35.04891586303711, "global_step": 46916, "epoch": 387} {"train_loss": -34.7980842590332, "global_step": 46917, "epoch": 387} {"train_loss": -35.39357376098633, "global_step": 46918, "epoch": 387} {"train_loss": -34.7851676940918, "global_step": 46919, "epoch": 387} {"train_loss": -35.56537628173828, "global_step": 46920, "epoch": 387} {"train_loss": -35.215641021728516, "global_step": 46921, "epoch": 387} {"train_loss": -35.51572036743164, "global_step": 46922, "epoch": 387} {"train_loss": -35.098873138427734, "global_step": 46923, "epoch": 387} {"train_loss": -34.72877883911133, "global_step": 46924, "epoch": 387} {"train_loss": -35.06370162963867, "global_step": 46925, "epoch": 387} {"train_loss": -34.35206985473633, "global_step": 46926, "epoch": 387} {"train_loss": -34.94523620605469, "global_step": 46927, "epoch": 387} {"train_loss": -34.42168045043945, "global_step": 46928, "epoch": 387} {"train_loss": -34.32697296142578, "global_step": 46929, "epoch": 387} {"train_loss": -33.97609329223633, "global_step": 46930, "epoch": 387} {"train_loss": -34.17098617553711, "global_step": 46931, "epoch": 387} {"train_loss": -35.0456428527832, "global_step": 46932, "epoch": 387} {"train_loss": -34.36350631713867, "global_step": 46933, "epoch": 387} {"train_loss": -34.543792724609375, "global_step": 46934, "epoch": 387} {"train_loss": -35.12824630737305, "global_step": 46935, "epoch": 387} {"train_loss": -34.99275588989258, "global_step": 46936, "epoch": 387} {"train_loss": -34.26871871948242, "global_step": 46937, "epoch": 387} {"train_loss": -35.13880157470703, "global_step": 46938, "epoch": 387} {"train_loss": -34.8065185546875, "global_step": 46939, "epoch": 387} {"train_loss": -34.759151458740234, "global_step": 46940, "epoch": 387} {"train_loss": -34.864990234375, "global_step": 46941, "epoch": 387} {"train_loss": -34.461055755615234, "global_step": 46942, "epoch": 387} {"train_loss": -35.17546463012695, "global_step": 46943, "epoch": 387} {"train_loss": -33.82719421386719, "global_step": 46944, "epoch": 387} {"train_loss": -34.233360290527344, "global_step": 46945, "epoch": 387} {"train_loss": -34.306121826171875, "global_step": 46946, "epoch": 387} {"train_loss": -33.65926659008688, "global_step": 46947, "epoch": 387, "val_loss": 2649356.5} {"train_loss": -33.773536682128906, "global_step": 46948, "epoch": 388} {"train_loss": -34.70515060424805, "global_step": 46949, "epoch": 388} {"train_loss": -33.79560470581055, "global_step": 46950, "epoch": 388} {"train_loss": -32.48318862915039, "global_step": 46951, "epoch": 388} {"train_loss": -33.157955169677734, "global_step": 46952, "epoch": 388} {"train_loss": -34.75944137573242, "global_step": 46953, "epoch": 388} {"train_loss": -33.83913803100586, "global_step": 46954, "epoch": 388} {"train_loss": -33.321041107177734, "global_step": 46955, "epoch": 388} {"train_loss": -34.56244659423828, "global_step": 46956, "epoch": 388} {"train_loss": -34.138702392578125, "global_step": 46957, "epoch": 388} {"train_loss": -33.30131530761719, "global_step": 46958, "epoch": 388} {"train_loss": -34.492366790771484, "global_step": 46959, "epoch": 388} {"train_loss": -34.039161682128906, "global_step": 46960, "epoch": 388} {"train_loss": -34.63345718383789, "global_step": 46961, "epoch": 388} {"train_loss": -34.28551483154297, "global_step": 46962, "epoch": 388} {"train_loss": -34.00422286987305, "global_step": 46963, "epoch": 388} {"train_loss": -34.854095458984375, "global_step": 46964, "epoch": 388} {"train_loss": -33.73807907104492, "global_step": 46965, "epoch": 388} {"train_loss": -35.067440032958984, "global_step": 46966, "epoch": 388} {"train_loss": -34.665733337402344, "global_step": 46967, "epoch": 388} {"train_loss": -34.775840759277344, "global_step": 46968, "epoch": 388} {"train_loss": -34.90430450439453, "global_step": 46969, "epoch": 388} {"train_loss": -34.906402587890625, "global_step": 46970, "epoch": 388} {"train_loss": -34.905235290527344, "global_step": 46971, "epoch": 388} {"train_loss": -34.90592956542969, "global_step": 46972, "epoch": 388} {"train_loss": -34.66121292114258, "global_step": 46973, "epoch": 388} {"train_loss": -34.68328857421875, "global_step": 46974, "epoch": 388} {"train_loss": -34.6540412902832, "global_step": 46975, "epoch": 388} {"train_loss": -34.58231735229492, "global_step": 46976, "epoch": 388} {"train_loss": -35.013519287109375, "global_step": 46977, "epoch": 388} {"train_loss": -34.59321594238281, "global_step": 46978, "epoch": 388} {"train_loss": -35.06572341918945, "global_step": 46979, "epoch": 388} {"train_loss": -34.45859909057617, "global_step": 46980, "epoch": 388} {"train_loss": -34.8405647277832, "global_step": 46981, "epoch": 388} {"train_loss": -34.86862564086914, "global_step": 46982, "epoch": 388} {"train_loss": -35.26311492919922, "global_step": 46983, "epoch": 388} {"train_loss": -35.5172119140625, "global_step": 46984, "epoch": 388} {"train_loss": -34.70412826538086, "global_step": 46985, "epoch": 388} {"train_loss": -35.495975494384766, "global_step": 46986, "epoch": 388} {"train_loss": -35.087703704833984, "global_step": 46987, "epoch": 388} {"train_loss": -35.489845275878906, "global_step": 46988, "epoch": 388} {"train_loss": -35.10610580444336, "global_step": 46989, "epoch": 388} {"train_loss": -35.40813064575195, "global_step": 46990, "epoch": 388} {"train_loss": -35.3702392578125, "global_step": 46991, "epoch": 388} {"train_loss": -35.39765548706055, "global_step": 46992, "epoch": 388} {"train_loss": -35.108489990234375, "global_step": 46993, "epoch": 388} {"train_loss": -35.46274948120117, "global_step": 46994, "epoch": 388} {"train_loss": -35.90424346923828, "global_step": 46995, "epoch": 388} {"train_loss": -34.90067672729492, "global_step": 46996, "epoch": 388} {"train_loss": -34.664058685302734, "global_step": 46997, "epoch": 388} {"train_loss": -34.554744720458984, "global_step": 46998, "epoch": 388} {"train_loss": -33.126461029052734, "global_step": 46999, "epoch": 388} {"train_loss": -32.045928955078125, "global_step": 47000, "epoch": 388} {"train_loss": -32.14190673828125, "global_step": 47001, "epoch": 388} {"train_loss": -31.365814208984375, "global_step": 47002, "epoch": 388} {"train_loss": -31.01506996154785, "global_step": 47003, "epoch": 388} {"train_loss": -33.911415100097656, "global_step": 47004, "epoch": 388} {"train_loss": -34.80477523803711, "global_step": 47005, "epoch": 388} {"train_loss": -32.96084976196289, "global_step": 47006, "epoch": 388} {"train_loss": -34.053829193115234, "global_step": 47007, "epoch": 388} {"train_loss": -34.074378967285156, "global_step": 47008, "epoch": 388} {"train_loss": -32.5798454284668, "global_step": 47009, "epoch": 388} {"train_loss": -34.1417121887207, "global_step": 47010, "epoch": 388} {"train_loss": -34.0102424621582, "global_step": 47011, "epoch": 388} {"train_loss": -34.103023529052734, "global_step": 47012, "epoch": 388} {"train_loss": -33.81987380981445, "global_step": 47013, "epoch": 388} {"train_loss": -32.81047821044922, "global_step": 47014, "epoch": 388} {"train_loss": -35.18138885498047, "global_step": 47015, "epoch": 388} {"train_loss": -33.15237045288086, "global_step": 47016, "epoch": 388} {"train_loss": -34.89786911010742, "global_step": 47017, "epoch": 388} {"train_loss": -33.71978759765625, "global_step": 47018, "epoch": 388} {"train_loss": -34.357215881347656, "global_step": 47019, "epoch": 388} {"train_loss": -34.3941535949707, "global_step": 47020, "epoch": 388} {"train_loss": -33.97949981689453, "global_step": 47021, "epoch": 388} {"train_loss": -34.62184524536133, "global_step": 47022, "epoch": 388} {"train_loss": -34.2432975769043, "global_step": 47023, "epoch": 388} {"train_loss": -30.47918701171875, "global_step": 47024, "epoch": 388} {"train_loss": -33.4957160949707, "global_step": 47025, "epoch": 388} {"train_loss": -31.51441764831543, "global_step": 47026, "epoch": 388} {"train_loss": -27.3111515045166, "global_step": 47027, "epoch": 388} {"train_loss": -35.04558181762695, "global_step": 47028, "epoch": 388} {"train_loss": -30.899188995361328, "global_step": 47029, "epoch": 388} {"train_loss": -34.57375717163086, "global_step": 47030, "epoch": 388} {"train_loss": -33.65766143798828, "global_step": 47031, "epoch": 388} {"train_loss": -33.4022102355957, "global_step": 47032, "epoch": 388} {"train_loss": -34.094783782958984, "global_step": 47033, "epoch": 388} {"train_loss": -34.697113037109375, "global_step": 47034, "epoch": 388} {"train_loss": -33.808223724365234, "global_step": 47035, "epoch": 388} {"train_loss": -34.43744659423828, "global_step": 47036, "epoch": 388} {"train_loss": -35.00991439819336, "global_step": 47037, "epoch": 388} {"train_loss": -34.626312255859375, "global_step": 47038, "epoch": 388} {"train_loss": -34.82637405395508, "global_step": 47039, "epoch": 388} {"train_loss": -34.17583465576172, "global_step": 47040, "epoch": 388} {"train_loss": -35.26546859741211, "global_step": 47041, "epoch": 388} {"train_loss": -35.00740051269531, "global_step": 47042, "epoch": 388} {"train_loss": -34.46689987182617, "global_step": 47043, "epoch": 388} {"train_loss": -35.150611877441406, "global_step": 47044, "epoch": 388} {"train_loss": -34.96480178833008, "global_step": 47045, "epoch": 388} {"train_loss": -34.785606384277344, "global_step": 47046, "epoch": 388} {"train_loss": -35.414825439453125, "global_step": 47047, "epoch": 388} {"train_loss": -34.467220306396484, "global_step": 47048, "epoch": 388} {"train_loss": -35.164310455322266, "global_step": 47049, "epoch": 388} {"train_loss": -34.32654571533203, "global_step": 47050, "epoch": 388} {"train_loss": -35.21406173706055, "global_step": 47051, "epoch": 388} {"train_loss": -34.44052505493164, "global_step": 47052, "epoch": 388} {"train_loss": -34.8378791809082, "global_step": 47053, "epoch": 388} {"train_loss": -35.63166046142578, "global_step": 47054, "epoch": 388} {"train_loss": -35.624202728271484, "global_step": 47055, "epoch": 388} {"train_loss": -34.821128845214844, "global_step": 47056, "epoch": 388} {"train_loss": -35.149173736572266, "global_step": 47057, "epoch": 388} {"train_loss": -34.77601623535156, "global_step": 47058, "epoch": 388} {"train_loss": -35.3325309753418, "global_step": 47059, "epoch": 388} {"train_loss": -34.85675048828125, "global_step": 47060, "epoch": 388} {"train_loss": -35.1423454284668, "global_step": 47061, "epoch": 388} {"train_loss": -34.74394607543945, "global_step": 47062, "epoch": 388} {"train_loss": -34.61414337158203, "global_step": 47063, "epoch": 388} {"train_loss": -35.22821807861328, "global_step": 47064, "epoch": 388} {"train_loss": -34.86420822143555, "global_step": 47065, "epoch": 388} {"train_loss": -34.79759979248047, "global_step": 47066, "epoch": 388} {"train_loss": -35.028480529785156, "global_step": 47067, "epoch": 388} {"train_loss": -34.30621219666536, "global_step": 47068, "epoch": 388, "val_loss": 2688256.0} {"train_loss": -33.856422424316406, "global_step": 47069, "epoch": 389} {"train_loss": -33.91301727294922, "global_step": 47070, "epoch": 389} {"train_loss": -34.889892578125, "global_step": 47071, "epoch": 389} {"train_loss": -35.067752838134766, "global_step": 47072, "epoch": 389} {"train_loss": -35.00547409057617, "global_step": 47073, "epoch": 389} {"train_loss": -34.72943115234375, "global_step": 47074, "epoch": 389} {"train_loss": -35.04384994506836, "global_step": 47075, "epoch": 389} {"train_loss": -34.537601470947266, "global_step": 47076, "epoch": 389} {"train_loss": -35.02184295654297, "global_step": 47077, "epoch": 389} {"train_loss": -35.43553161621094, "global_step": 47078, "epoch": 389} {"train_loss": -35.089542388916016, "global_step": 47079, "epoch": 389} {"train_loss": -34.997745513916016, "global_step": 47080, "epoch": 389} {"train_loss": -34.779151916503906, "global_step": 47081, "epoch": 389} {"train_loss": -34.28237533569336, "global_step": 47082, "epoch": 389} {"train_loss": -35.390602111816406, "global_step": 47083, "epoch": 389} {"train_loss": -34.387840270996094, "global_step": 47084, "epoch": 389} {"train_loss": -35.50484085083008, "global_step": 47085, "epoch": 389} {"train_loss": -34.64358139038086, "global_step": 47086, "epoch": 389} {"train_loss": -35.28969955444336, "global_step": 47087, "epoch": 389} {"train_loss": -34.9530143737793, "global_step": 47088, "epoch": 389} {"train_loss": -35.555721282958984, "global_step": 47089, "epoch": 389} {"train_loss": -35.024635314941406, "global_step": 47090, "epoch": 389} {"train_loss": -34.90483856201172, "global_step": 47091, "epoch": 389} {"train_loss": -35.3222541809082, "global_step": 47092, "epoch": 389} {"train_loss": -34.551692962646484, "global_step": 47093, "epoch": 389} {"train_loss": -35.48209762573242, "global_step": 47094, "epoch": 389} {"train_loss": -35.29958724975586, "global_step": 47095, "epoch": 389} {"train_loss": -35.408172607421875, "global_step": 47096, "epoch": 389} {"train_loss": -35.515708923339844, "global_step": 47097, "epoch": 389} {"train_loss": -35.51829528808594, "global_step": 47098, "epoch": 389} {"train_loss": -35.074851989746094, "global_step": 47099, "epoch": 389} {"train_loss": -35.713531494140625, "global_step": 47100, "epoch": 389} {"train_loss": -35.0893440246582, "global_step": 47101, "epoch": 389} {"train_loss": -35.36258316040039, "global_step": 47102, "epoch": 389} {"train_loss": -35.34483337402344, "global_step": 47103, "epoch": 389} {"train_loss": -34.55524444580078, "global_step": 47104, "epoch": 389} {"train_loss": -35.5333366394043, "global_step": 47105, "epoch": 389} {"train_loss": -35.52659225463867, "global_step": 47106, "epoch": 389} {"train_loss": -34.57448196411133, "global_step": 47107, "epoch": 389} {"train_loss": -34.882225036621094, "global_step": 47108, "epoch": 389} {"train_loss": -33.58933639526367, "global_step": 47109, "epoch": 389} {"train_loss": -32.56403732299805, "global_step": 47110, "epoch": 389} {"train_loss": -29.768152236938477, "global_step": 47111, "epoch": 389} {"train_loss": -28.551624298095703, "global_step": 47112, "epoch": 389} {"train_loss": -27.993133544921875, "global_step": 47113, "epoch": 389} {"train_loss": -31.805194854736328, "global_step": 47114, "epoch": 389} {"train_loss": -33.75415802001953, "global_step": 47115, "epoch": 389} {"train_loss": -31.98162269592285, "global_step": 47116, "epoch": 389} {"train_loss": -31.393375396728516, "global_step": 47117, "epoch": 389} {"train_loss": -34.37934494018555, "global_step": 47118, "epoch": 389} {"train_loss": -31.816251754760742, "global_step": 47119, "epoch": 389} {"train_loss": -34.37135696411133, "global_step": 47120, "epoch": 389} {"train_loss": -32.84141159057617, "global_step": 47121, "epoch": 389} {"train_loss": -29.36532974243164, "global_step": 47122, "epoch": 389} {"train_loss": -32.97745895385742, "global_step": 47123, "epoch": 389} {"train_loss": -33.729949951171875, "global_step": 47124, "epoch": 389} {"train_loss": -33.34674835205078, "global_step": 47125, "epoch": 389} {"train_loss": -33.7917594909668, "global_step": 47126, "epoch": 389} {"train_loss": -33.26124954223633, "global_step": 47127, "epoch": 389} {"train_loss": -32.74491882324219, "global_step": 47128, "epoch": 389} {"train_loss": -32.429683685302734, "global_step": 47129, "epoch": 389} {"train_loss": -33.39216232299805, "global_step": 47130, "epoch": 389} {"train_loss": -34.13460159301758, "global_step": 47131, "epoch": 389} {"train_loss": -32.22907638549805, "global_step": 47132, "epoch": 389} {"train_loss": -33.562400817871094, "global_step": 47133, "epoch": 389} {"train_loss": -33.29629135131836, "global_step": 47134, "epoch": 389} {"train_loss": -33.43503952026367, "global_step": 47135, "epoch": 389} {"train_loss": -31.6354923248291, "global_step": 47136, "epoch": 389} {"train_loss": -31.843297958374023, "global_step": 47137, "epoch": 389} {"train_loss": -34.16676330566406, "global_step": 47138, "epoch": 389} {"train_loss": -33.544158935546875, "global_step": 47139, "epoch": 389} {"train_loss": -33.335750579833984, "global_step": 47140, "epoch": 389} {"train_loss": -33.050987243652344, "global_step": 47141, "epoch": 389} {"train_loss": -33.178462982177734, "global_step": 47142, "epoch": 389} {"train_loss": -33.81462478637695, "global_step": 47143, "epoch": 389} {"train_loss": -33.957366943359375, "global_step": 47144, "epoch": 389} {"train_loss": -34.23086166381836, "global_step": 47145, "epoch": 389} {"train_loss": -34.084537506103516, "global_step": 47146, "epoch": 389} {"train_loss": -34.10422897338867, "global_step": 47147, "epoch": 389} {"train_loss": -33.71393966674805, "global_step": 47148, "epoch": 389} {"train_loss": -33.818634033203125, "global_step": 47149, "epoch": 389} {"train_loss": -34.19417190551758, "global_step": 47150, "epoch": 389} {"train_loss": -34.325191497802734, "global_step": 47151, "epoch": 389} {"train_loss": -34.1997184753418, "global_step": 47152, "epoch": 389} {"train_loss": -34.03207778930664, "global_step": 47153, "epoch": 389} {"train_loss": -34.18152618408203, "global_step": 47154, "epoch": 389} {"train_loss": -34.360774993896484, "global_step": 47155, "epoch": 389} {"train_loss": -34.371273040771484, "global_step": 47156, "epoch": 389} {"train_loss": -34.619319915771484, "global_step": 47157, "epoch": 389} {"train_loss": -34.180294036865234, "global_step": 47158, "epoch": 389} {"train_loss": -34.12867736816406, "global_step": 47159, "epoch": 389} {"train_loss": -34.314083099365234, "global_step": 47160, "epoch": 389} {"train_loss": -34.402503967285156, "global_step": 47161, "epoch": 389} {"train_loss": -34.392356872558594, "global_step": 47162, "epoch": 389} {"train_loss": -34.827579498291016, "global_step": 47163, "epoch": 389} {"train_loss": -34.625770568847656, "global_step": 47164, "epoch": 389} {"train_loss": -34.90713882446289, "global_step": 47165, "epoch": 389} {"train_loss": -34.4722785949707, "global_step": 47166, "epoch": 389} {"train_loss": -33.964698791503906, "global_step": 47167, "epoch": 389} {"train_loss": -34.57073974609375, "global_step": 47168, "epoch": 389} {"train_loss": -34.44417190551758, "global_step": 47169, "epoch": 389} {"train_loss": -34.7834587097168, "global_step": 47170, "epoch": 389} {"train_loss": -33.472896575927734, "global_step": 47171, "epoch": 389} {"train_loss": -34.73653030395508, "global_step": 47172, "epoch": 389} {"train_loss": -33.9932975769043, "global_step": 47173, "epoch": 389} {"train_loss": -33.95856857299805, "global_step": 47174, "epoch": 389} {"train_loss": -32.919464111328125, "global_step": 47175, "epoch": 389} {"train_loss": -33.533756256103516, "global_step": 47176, "epoch": 389} {"train_loss": -32.974464416503906, "global_step": 47177, "epoch": 389} {"train_loss": -34.171939849853516, "global_step": 47178, "epoch": 389} {"train_loss": -32.860206604003906, "global_step": 47179, "epoch": 389} {"train_loss": -32.603759765625, "global_step": 47180, "epoch": 389} {"train_loss": -32.152896881103516, "global_step": 47181, "epoch": 389} {"train_loss": -32.130733489990234, "global_step": 47182, "epoch": 389} {"train_loss": -29.110700607299805, "global_step": 47183, "epoch": 389} {"train_loss": -29.71904945373535, "global_step": 47184, "epoch": 389} {"train_loss": -28.033239364624023, "global_step": 47185, "epoch": 389} {"train_loss": -26.4605712890625, "global_step": 47186, "epoch": 389} {"train_loss": -31.787954330444336, "global_step": 47187, "epoch": 389} {"train_loss": -33.318092346191406, "global_step": 47188, "epoch": 389} {"train_loss": -33.69043481054385, "global_step": 47189, "epoch": 389, "val_loss": 2581281.5} {"train_loss": -33.77301025390625, "global_step": 47190, "epoch": 390} {"train_loss": -32.170936584472656, "global_step": 47191, "epoch": 390} {"train_loss": -33.29094314575195, "global_step": 47192, "epoch": 390} {"train_loss": -33.627540588378906, "global_step": 47193, "epoch": 390} {"train_loss": -32.76356887817383, "global_step": 47194, "epoch": 390} {"train_loss": -34.1895637512207, "global_step": 47195, "epoch": 390} {"train_loss": -33.681819915771484, "global_step": 47196, "epoch": 390} {"train_loss": -34.03145980834961, "global_step": 47197, "epoch": 390} {"train_loss": -34.0677375793457, "global_step": 47198, "epoch": 390} {"train_loss": -33.93482971191406, "global_step": 47199, "epoch": 390} {"train_loss": -34.66000747680664, "global_step": 47200, "epoch": 390} {"train_loss": -34.644588470458984, "global_step": 47201, "epoch": 390} {"train_loss": -35.0713005065918, "global_step": 47202, "epoch": 390} {"train_loss": -34.20682907104492, "global_step": 47203, "epoch": 390} {"train_loss": -35.2573127746582, "global_step": 47204, "epoch": 390} {"train_loss": -35.23228073120117, "global_step": 47205, "epoch": 390} {"train_loss": -34.82548141479492, "global_step": 47206, "epoch": 390} {"train_loss": -35.459354400634766, "global_step": 47207, "epoch": 390} {"train_loss": -35.49785614013672, "global_step": 47208, "epoch": 390} {"train_loss": -35.14081954956055, "global_step": 47209, "epoch": 390} {"train_loss": -34.777122497558594, "global_step": 47210, "epoch": 390} {"train_loss": -35.69519805908203, "global_step": 47211, "epoch": 390} {"train_loss": -34.98725891113281, "global_step": 47212, "epoch": 390} {"train_loss": -35.130706787109375, "global_step": 47213, "epoch": 390} {"train_loss": -35.21720886230469, "global_step": 47214, "epoch": 390} {"train_loss": -35.28292465209961, "global_step": 47215, "epoch": 390} {"train_loss": -35.31532669067383, "global_step": 47216, "epoch": 390} {"train_loss": -35.26249313354492, "global_step": 47217, "epoch": 390} {"train_loss": -35.52786636352539, "global_step": 47218, "epoch": 390} {"train_loss": -35.359188079833984, "global_step": 47219, "epoch": 390} {"train_loss": -34.97746658325195, "global_step": 47220, "epoch": 390} {"train_loss": -34.563716888427734, "global_step": 47221, "epoch": 390} {"train_loss": -33.6274299621582, "global_step": 47222, "epoch": 390} {"train_loss": -34.29534149169922, "global_step": 47223, "epoch": 390} {"train_loss": -34.23210144042969, "global_step": 47224, "epoch": 390} {"train_loss": -34.122840881347656, "global_step": 47225, "epoch": 390} {"train_loss": -33.04391860961914, "global_step": 47226, "epoch": 390} {"train_loss": -34.86317825317383, "global_step": 47227, "epoch": 390} {"train_loss": -34.835941314697266, "global_step": 47228, "epoch": 390} {"train_loss": -34.5341796875, "global_step": 47229, "epoch": 390} {"train_loss": -35.194862365722656, "global_step": 47230, "epoch": 390} {"train_loss": -35.23187255859375, "global_step": 47231, "epoch": 390} {"train_loss": -34.612098693847656, "global_step": 47232, "epoch": 390} {"train_loss": -34.85343933105469, "global_step": 47233, "epoch": 390} {"train_loss": -35.244232177734375, "global_step": 47234, "epoch": 390} {"train_loss": -34.499698638916016, "global_step": 47235, "epoch": 390} {"train_loss": -35.118587493896484, "global_step": 47236, "epoch": 390} {"train_loss": -35.23155975341797, "global_step": 47237, "epoch": 390} {"train_loss": -34.604408264160156, "global_step": 47238, "epoch": 390} {"train_loss": -35.389137268066406, "global_step": 47239, "epoch": 390} {"train_loss": -35.72772979736328, "global_step": 47240, "epoch": 390} {"train_loss": -35.08313751220703, "global_step": 47241, "epoch": 390} {"train_loss": -35.164852142333984, "global_step": 47242, "epoch": 390} {"train_loss": -35.05713653564453, "global_step": 47243, "epoch": 390} {"train_loss": -35.12722396850586, "global_step": 47244, "epoch": 390} {"train_loss": -33.96255111694336, "global_step": 47245, "epoch": 390} {"train_loss": -34.145362854003906, "global_step": 47246, "epoch": 390} {"train_loss": -33.37726593017578, "global_step": 47247, "epoch": 390} {"train_loss": -34.70661163330078, "global_step": 47248, "epoch": 390} {"train_loss": -33.91791915893555, "global_step": 47249, "epoch": 390} {"train_loss": -33.848934173583984, "global_step": 47250, "epoch": 390} {"train_loss": -33.99912643432617, "global_step": 47251, "epoch": 390} {"train_loss": -33.45268630981445, "global_step": 47252, "epoch": 390} {"train_loss": -33.443824768066406, "global_step": 47253, "epoch": 390} {"train_loss": -33.809356689453125, "global_step": 47254, "epoch": 390} {"train_loss": -33.30097198486328, "global_step": 47255, "epoch": 390} {"train_loss": -33.363014221191406, "global_step": 47256, "epoch": 390} {"train_loss": -34.5501823425293, "global_step": 47257, "epoch": 390} {"train_loss": -35.193359375, "global_step": 47258, "epoch": 390} {"train_loss": -35.17494201660156, "global_step": 47259, "epoch": 390} {"train_loss": -34.962806701660156, "global_step": 47260, "epoch": 390} {"train_loss": -34.80971908569336, "global_step": 47261, "epoch": 390} {"train_loss": -34.58388137817383, "global_step": 47262, "epoch": 390} {"train_loss": -35.03497314453125, "global_step": 47263, "epoch": 390} {"train_loss": -34.34321212768555, "global_step": 47264, "epoch": 390} {"train_loss": -32.8652458190918, "global_step": 47265, "epoch": 390} {"train_loss": -34.661102294921875, "global_step": 47266, "epoch": 390} {"train_loss": -34.45039749145508, "global_step": 47267, "epoch": 390} {"train_loss": -34.90389633178711, "global_step": 47268, "epoch": 390} {"train_loss": -35.012001037597656, "global_step": 47269, "epoch": 390} {"train_loss": -34.35676574707031, "global_step": 47270, "epoch": 390} {"train_loss": -33.990020751953125, "global_step": 47271, "epoch": 390} {"train_loss": -32.872039794921875, "global_step": 47272, "epoch": 390} {"train_loss": -30.16352653503418, "global_step": 47273, "epoch": 390} {"train_loss": -26.61640739440918, "global_step": 47274, "epoch": 390} {"train_loss": -30.370771408081055, "global_step": 47275, "epoch": 390} {"train_loss": -34.75347137451172, "global_step": 47276, "epoch": 390} {"train_loss": -34.618141174316406, "global_step": 47277, "epoch": 390} {"train_loss": -33.22663116455078, "global_step": 47278, "epoch": 390} {"train_loss": -34.937164306640625, "global_step": 47279, "epoch": 390} {"train_loss": -34.4863395690918, "global_step": 47280, "epoch": 390} {"train_loss": -34.69767761230469, "global_step": 47281, "epoch": 390} {"train_loss": -35.25415802001953, "global_step": 47282, "epoch": 390} {"train_loss": -34.55839157104492, "global_step": 47283, "epoch": 390} {"train_loss": -35.44472885131836, "global_step": 47284, "epoch": 390} {"train_loss": -35.0638313293457, "global_step": 47285, "epoch": 390} {"train_loss": -35.687740325927734, "global_step": 47286, "epoch": 390} {"train_loss": -34.974735260009766, "global_step": 47287, "epoch": 390} {"train_loss": -35.34468460083008, "global_step": 47288, "epoch": 390} {"train_loss": -35.519527435302734, "global_step": 47289, "epoch": 390} {"train_loss": -34.94475173950195, "global_step": 47290, "epoch": 390} {"train_loss": -35.58320999145508, "global_step": 47291, "epoch": 390} {"train_loss": -35.02418899536133, "global_step": 47292, "epoch": 390} {"train_loss": -35.5730094909668, "global_step": 47293, "epoch": 390} {"train_loss": -35.29793167114258, "global_step": 47294, "epoch": 390} {"train_loss": -35.139217376708984, "global_step": 47295, "epoch": 390} {"train_loss": -35.278961181640625, "global_step": 47296, "epoch": 390} {"train_loss": -35.5286979675293, "global_step": 47297, "epoch": 390} {"train_loss": -35.22058868408203, "global_step": 47298, "epoch": 390} {"train_loss": -35.331871032714844, "global_step": 47299, "epoch": 390} {"train_loss": -36.019447326660156, "global_step": 47300, "epoch": 390} {"train_loss": -35.60398483276367, "global_step": 47301, "epoch": 390} {"train_loss": -35.68778610229492, "global_step": 47302, "epoch": 390} {"train_loss": -35.3577766418457, "global_step": 47303, "epoch": 390} {"train_loss": -36.001644134521484, "global_step": 47304, "epoch": 390} {"train_loss": -36.06173324584961, "global_step": 47305, "epoch": 390} {"train_loss": -34.223934173583984, "global_step": 47306, "epoch": 390} {"train_loss": -34.939510345458984, "global_step": 47307, "epoch": 390} {"train_loss": -35.22272872924805, "global_step": 47308, "epoch": 390} {"train_loss": -34.937782287597656, "global_step": 47309, "epoch": 390} {"train_loss": -34.56497364201822, "global_step": 47310, "epoch": 390, "val_loss": 2443900.25} {"train_loss": -34.25874710083008, "global_step": 47311, "epoch": 391} {"train_loss": -34.41608810424805, "global_step": 47312, "epoch": 391} {"train_loss": -35.907649993896484, "global_step": 47313, "epoch": 391} {"train_loss": -33.75038528442383, "global_step": 47314, "epoch": 391} {"train_loss": -34.595584869384766, "global_step": 47315, "epoch": 391} {"train_loss": -35.0775260925293, "global_step": 47316, "epoch": 391} {"train_loss": -34.648658752441406, "global_step": 47317, "epoch": 391} {"train_loss": -34.92396926879883, "global_step": 47318, "epoch": 391} {"train_loss": -35.284828186035156, "global_step": 47319, "epoch": 391} {"train_loss": -34.897525787353516, "global_step": 47320, "epoch": 391} {"train_loss": -33.25603485107422, "global_step": 47321, "epoch": 391} {"train_loss": -34.55230712890625, "global_step": 47322, "epoch": 391} {"train_loss": -35.48945236206055, "global_step": 47323, "epoch": 391} {"train_loss": -34.54595947265625, "global_step": 47324, "epoch": 391} {"train_loss": -31.72072410583496, "global_step": 47325, "epoch": 391} {"train_loss": -32.025779724121094, "global_step": 47326, "epoch": 391} {"train_loss": -33.74422836303711, "global_step": 47327, "epoch": 391} {"train_loss": -35.00032424926758, "global_step": 47328, "epoch": 391} {"train_loss": -34.773658752441406, "global_step": 47329, "epoch": 391} {"train_loss": -34.028656005859375, "global_step": 47330, "epoch": 391} {"train_loss": -35.07613754272461, "global_step": 47331, "epoch": 391} {"train_loss": -35.35894775390625, "global_step": 47332, "epoch": 391} {"train_loss": -34.14750289916992, "global_step": 47333, "epoch": 391} {"train_loss": -34.04167556762695, "global_step": 47334, "epoch": 391} {"train_loss": -35.374969482421875, "global_step": 47335, "epoch": 391} {"train_loss": -33.203895568847656, "global_step": 47336, "epoch": 391} {"train_loss": -35.34918975830078, "global_step": 47337, "epoch": 391} {"train_loss": -35.39329147338867, "global_step": 47338, "epoch": 391} {"train_loss": -34.18345260620117, "global_step": 47339, "epoch": 391} {"train_loss": -34.592041015625, "global_step": 47340, "epoch": 391} {"train_loss": -35.34769058227539, "global_step": 47341, "epoch": 391} {"train_loss": -34.79511260986328, "global_step": 47342, "epoch": 391} {"train_loss": -34.32783126831055, "global_step": 47343, "epoch": 391} {"train_loss": -35.0456657409668, "global_step": 47344, "epoch": 391} {"train_loss": -35.1314811706543, "global_step": 47345, "epoch": 391} {"train_loss": -35.094173431396484, "global_step": 47346, "epoch": 391} {"train_loss": -34.81764602661133, "global_step": 47347, "epoch": 391} {"train_loss": -34.484737396240234, "global_step": 47348, "epoch": 391} {"train_loss": -34.93049240112305, "global_step": 47349, "epoch": 391} {"train_loss": -34.70633316040039, "global_step": 47350, "epoch": 391} {"train_loss": -35.1937370300293, "global_step": 47351, "epoch": 391} {"train_loss": -35.29896926879883, "global_step": 47352, "epoch": 391} {"train_loss": -34.69572830200195, "global_step": 47353, "epoch": 391} {"train_loss": -34.73213577270508, "global_step": 47354, "epoch": 391} {"train_loss": -34.79025650024414, "global_step": 47355, "epoch": 391} {"train_loss": -35.42790603637695, "global_step": 47356, "epoch": 391} {"train_loss": -35.3892936706543, "global_step": 47357, "epoch": 391} {"train_loss": -35.458431243896484, "global_step": 47358, "epoch": 391} {"train_loss": -34.82599639892578, "global_step": 47359, "epoch": 391} {"train_loss": -34.7806510925293, "global_step": 47360, "epoch": 391} {"train_loss": -34.83845901489258, "global_step": 47361, "epoch": 391} {"train_loss": -34.456966400146484, "global_step": 47362, "epoch": 391} {"train_loss": -34.89193344116211, "global_step": 47363, "epoch": 391} {"train_loss": -35.18265914916992, "global_step": 47364, "epoch": 391} {"train_loss": -34.47195053100586, "global_step": 47365, "epoch": 391} {"train_loss": -35.14411544799805, "global_step": 47366, "epoch": 391} {"train_loss": -35.46407699584961, "global_step": 47367, "epoch": 391} {"train_loss": -34.237098693847656, "global_step": 47368, "epoch": 391} {"train_loss": -33.341487884521484, "global_step": 47369, "epoch": 391} {"train_loss": -31.5033016204834, "global_step": 47370, "epoch": 391} {"train_loss": -34.28139114379883, "global_step": 47371, "epoch": 391} {"train_loss": -28.439579010009766, "global_step": 47372, "epoch": 391} {"train_loss": -30.817127227783203, "global_step": 47373, "epoch": 391} {"train_loss": -29.592453002929688, "global_step": 47374, "epoch": 391} {"train_loss": -31.769184112548828, "global_step": 47375, "epoch": 391} {"train_loss": -28.49721336364746, "global_step": 47376, "epoch": 391} {"train_loss": -33.172035217285156, "global_step": 47377, "epoch": 391} {"train_loss": -31.496862411499023, "global_step": 47378, "epoch": 391} {"train_loss": -32.51998519897461, "global_step": 47379, "epoch": 391} {"train_loss": -33.0074577331543, "global_step": 47380, "epoch": 391} {"train_loss": -32.2953987121582, "global_step": 47381, "epoch": 391} {"train_loss": -31.848896026611328, "global_step": 47382, "epoch": 391} {"train_loss": -34.05435562133789, "global_step": 47383, "epoch": 391} {"train_loss": -32.73310470581055, "global_step": 47384, "epoch": 391} {"train_loss": -31.5638370513916, "global_step": 47385, "epoch": 391} {"train_loss": -33.253074645996094, "global_step": 47386, "epoch": 391} {"train_loss": -33.28007888793945, "global_step": 47387, "epoch": 391} {"train_loss": -34.12274932861328, "global_step": 47388, "epoch": 391} {"train_loss": -34.126590728759766, "global_step": 47389, "epoch": 391} {"train_loss": -33.1491813659668, "global_step": 47390, "epoch": 391} {"train_loss": -33.88071823120117, "global_step": 47391, "epoch": 391} {"train_loss": -32.70317459106445, "global_step": 47392, "epoch": 391} {"train_loss": -33.98050308227539, "global_step": 47393, "epoch": 391} {"train_loss": -33.39046096801758, "global_step": 47394, "epoch": 391} {"train_loss": -34.73005294799805, "global_step": 47395, "epoch": 391} {"train_loss": -34.2009391784668, "global_step": 47396, "epoch": 391} {"train_loss": -34.20286178588867, "global_step": 47397, "epoch": 391} {"train_loss": -34.47722625732422, "global_step": 47398, "epoch": 391} {"train_loss": -34.64385223388672, "global_step": 47399, "epoch": 391} {"train_loss": -34.339508056640625, "global_step": 47400, "epoch": 391} {"train_loss": -34.65684127807617, "global_step": 47401, "epoch": 391} {"train_loss": -34.67238235473633, "global_step": 47402, "epoch": 391} {"train_loss": -35.006004333496094, "global_step": 47403, "epoch": 391} {"train_loss": -34.679786682128906, "global_step": 47404, "epoch": 391} {"train_loss": -35.04016876220703, "global_step": 47405, "epoch": 391} {"train_loss": -34.68548583984375, "global_step": 47406, "epoch": 391} {"train_loss": -34.16569137573242, "global_step": 47407, "epoch": 391} {"train_loss": -35.102081298828125, "global_step": 47408, "epoch": 391} {"train_loss": -35.157958984375, "global_step": 47409, "epoch": 391} {"train_loss": -34.7021598815918, "global_step": 47410, "epoch": 391} {"train_loss": -34.82178497314453, "global_step": 47411, "epoch": 391} {"train_loss": -34.19985580444336, "global_step": 47412, "epoch": 391} {"train_loss": -35.07081604003906, "global_step": 47413, "epoch": 391} {"train_loss": -35.26364517211914, "global_step": 47414, "epoch": 391} {"train_loss": -34.68143844604492, "global_step": 47415, "epoch": 391} {"train_loss": -35.15345764160156, "global_step": 47416, "epoch": 391} {"train_loss": -34.6853141784668, "global_step": 47417, "epoch": 391} {"train_loss": -34.83572006225586, "global_step": 47418, "epoch": 391} {"train_loss": -34.61298370361328, "global_step": 47419, "epoch": 391} {"train_loss": -34.8245849609375, "global_step": 47420, "epoch": 391} {"train_loss": -35.00272750854492, "global_step": 47421, "epoch": 391} {"train_loss": -34.79619216918945, "global_step": 47422, "epoch": 391} {"train_loss": -34.9359016418457, "global_step": 47423, "epoch": 391} {"train_loss": -34.874691009521484, "global_step": 47424, "epoch": 391} {"train_loss": -34.83170700073242, "global_step": 47425, "epoch": 391} {"train_loss": -33.890804290771484, "global_step": 47426, "epoch": 391} {"train_loss": -34.515743255615234, "global_step": 47427, "epoch": 391} {"train_loss": -35.24691390991211, "global_step": 47428, "epoch": 391} {"train_loss": -34.63197708129883, "global_step": 47429, "epoch": 391} {"train_loss": -34.04233169555664, "global_step": 47430, "epoch": 391} {"train_loss": -34.18953161003176, "global_step": 47431, "epoch": 391, "val_loss": 2588630.25} {"train_loss": -35.3477897644043, "global_step": 47432, "epoch": 392} {"train_loss": -33.5485725402832, "global_step": 47433, "epoch": 392} {"train_loss": -33.68574905395508, "global_step": 47434, "epoch": 392} {"train_loss": -34.33625793457031, "global_step": 47435, "epoch": 392} {"train_loss": -34.737789154052734, "global_step": 47436, "epoch": 392} {"train_loss": -34.58220291137695, "global_step": 47437, "epoch": 392} {"train_loss": -33.03549575805664, "global_step": 47438, "epoch": 392} {"train_loss": -33.447357177734375, "global_step": 47439, "epoch": 392} {"train_loss": -33.120296478271484, "global_step": 47440, "epoch": 392} {"train_loss": -31.944181442260742, "global_step": 47441, "epoch": 392} {"train_loss": -32.588497161865234, "global_step": 47442, "epoch": 392} {"train_loss": -33.349365234375, "global_step": 47443, "epoch": 392} {"train_loss": -34.571136474609375, "global_step": 47444, "epoch": 392} {"train_loss": -34.13835525512695, "global_step": 47445, "epoch": 392} {"train_loss": -33.0589714050293, "global_step": 47446, "epoch": 392} {"train_loss": -33.564971923828125, "global_step": 47447, "epoch": 392} {"train_loss": -34.385719299316406, "global_step": 47448, "epoch": 392} {"train_loss": -34.33140182495117, "global_step": 47449, "epoch": 392} {"train_loss": -33.388641357421875, "global_step": 47450, "epoch": 392} {"train_loss": -33.4864616394043, "global_step": 47451, "epoch": 392} {"train_loss": -33.78339385986328, "global_step": 47452, "epoch": 392} {"train_loss": -32.809654235839844, "global_step": 47453, "epoch": 392} {"train_loss": -33.996063232421875, "global_step": 47454, "epoch": 392} {"train_loss": -34.74331283569336, "global_step": 47455, "epoch": 392} {"train_loss": -34.40243911743164, "global_step": 47456, "epoch": 392} {"train_loss": -34.26362609863281, "global_step": 47457, "epoch": 392} {"train_loss": -34.10415267944336, "global_step": 47458, "epoch": 392} {"train_loss": -34.56190490722656, "global_step": 47459, "epoch": 392} {"train_loss": -33.89015579223633, "global_step": 47460, "epoch": 392} {"train_loss": -33.99093246459961, "global_step": 47461, "epoch": 392} {"train_loss": -33.96499252319336, "global_step": 47462, "epoch": 392} {"train_loss": -33.889381408691406, "global_step": 47463, "epoch": 392} {"train_loss": -33.85029983520508, "global_step": 47464, "epoch": 392} {"train_loss": -33.65876388549805, "global_step": 47465, "epoch": 392} {"train_loss": -34.06597900390625, "global_step": 47466, "epoch": 392} {"train_loss": -34.3114128112793, "global_step": 47467, "epoch": 392} {"train_loss": -34.25349807739258, "global_step": 47468, "epoch": 392} {"train_loss": -34.647911071777344, "global_step": 47469, "epoch": 392} {"train_loss": -34.10795211791992, "global_step": 47470, "epoch": 392} {"train_loss": -34.63227462768555, "global_step": 47471, "epoch": 392} {"train_loss": -34.18475341796875, "global_step": 47472, "epoch": 392} {"train_loss": -34.04319763183594, "global_step": 47473, "epoch": 392} {"train_loss": -34.14667892456055, "global_step": 47474, "epoch": 392} {"train_loss": -34.91927719116211, "global_step": 47475, "epoch": 392} {"train_loss": -34.61995315551758, "global_step": 47476, "epoch": 392} {"train_loss": -34.393924713134766, "global_step": 47477, "epoch": 392} {"train_loss": -34.26577377319336, "global_step": 47478, "epoch": 392} {"train_loss": -34.60995864868164, "global_step": 47479, "epoch": 392} {"train_loss": -34.39969253540039, "global_step": 47480, "epoch": 392} {"train_loss": -34.516029357910156, "global_step": 47481, "epoch": 392} {"train_loss": -34.66007995605469, "global_step": 47482, "epoch": 392} {"train_loss": -34.419639587402344, "global_step": 47483, "epoch": 392} {"train_loss": -34.13521957397461, "global_step": 47484, "epoch": 392} {"train_loss": -33.34864044189453, "global_step": 47485, "epoch": 392} {"train_loss": -34.209754943847656, "global_step": 47486, "epoch": 392} {"train_loss": -34.74235534667969, "global_step": 47487, "epoch": 392} {"train_loss": -35.48076248168945, "global_step": 47488, "epoch": 392} {"train_loss": -34.80658721923828, "global_step": 47489, "epoch": 392} {"train_loss": -35.40979766845703, "global_step": 47490, "epoch": 392} {"train_loss": -35.05781173706055, "global_step": 47491, "epoch": 392} {"train_loss": -35.21479797363281, "global_step": 47492, "epoch": 392} {"train_loss": -34.206787109375, "global_step": 47493, "epoch": 392} {"train_loss": -33.789146423339844, "global_step": 47494, "epoch": 392} {"train_loss": -33.99774932861328, "global_step": 47495, "epoch": 392} {"train_loss": -35.270877838134766, "global_step": 47496, "epoch": 392} {"train_loss": -35.20958709716797, "global_step": 47497, "epoch": 392} {"train_loss": -34.46070861816406, "global_step": 47498, "epoch": 392} {"train_loss": -34.02718734741211, "global_step": 47499, "epoch": 392} {"train_loss": -35.39646530151367, "global_step": 47500, "epoch": 392} {"train_loss": -34.52669906616211, "global_step": 47501, "epoch": 392} {"train_loss": -32.70901870727539, "global_step": 47502, "epoch": 392} {"train_loss": -31.817960739135742, "global_step": 47503, "epoch": 392} {"train_loss": -33.7374382019043, "global_step": 47504, "epoch": 392} {"train_loss": -34.76533126831055, "global_step": 47505, "epoch": 392} {"train_loss": -32.950782775878906, "global_step": 47506, "epoch": 392} {"train_loss": -32.85282516479492, "global_step": 47507, "epoch": 392} {"train_loss": -35.43581771850586, "global_step": 47508, "epoch": 392} {"train_loss": -34.47837448120117, "global_step": 47509, "epoch": 392} {"train_loss": -31.785160064697266, "global_step": 47510, "epoch": 392} {"train_loss": -31.752613067626953, "global_step": 47511, "epoch": 392} {"train_loss": -34.350467681884766, "global_step": 47512, "epoch": 392} {"train_loss": -34.4305419921875, "global_step": 47513, "epoch": 392} {"train_loss": -33.135677337646484, "global_step": 47514, "epoch": 392} {"train_loss": -33.2310676574707, "global_step": 47515, "epoch": 392} {"train_loss": -35.21586227416992, "global_step": 47516, "epoch": 392} {"train_loss": -34.69367599487305, "global_step": 47517, "epoch": 392} {"train_loss": -33.74806594848633, "global_step": 47518, "epoch": 392} {"train_loss": -35.46721649169922, "global_step": 47519, "epoch": 392} {"train_loss": -35.432411193847656, "global_step": 47520, "epoch": 392} {"train_loss": -35.287994384765625, "global_step": 47521, "epoch": 392} {"train_loss": -35.660736083984375, "global_step": 47522, "epoch": 392} {"train_loss": -35.5632438659668, "global_step": 47523, "epoch": 392} {"train_loss": -35.38709259033203, "global_step": 47524, "epoch": 392} {"train_loss": -34.95130920410156, "global_step": 47525, "epoch": 392} {"train_loss": -34.81943893432617, "global_step": 47526, "epoch": 392} {"train_loss": -35.539791107177734, "global_step": 47527, "epoch": 392} {"train_loss": -35.59360885620117, "global_step": 47528, "epoch": 392} {"train_loss": -35.985862731933594, "global_step": 47529, "epoch": 392} {"train_loss": -35.57213592529297, "global_step": 47530, "epoch": 392} {"train_loss": -34.91350173950195, "global_step": 47531, "epoch": 392} {"train_loss": -35.21620178222656, "global_step": 47532, "epoch": 392} {"train_loss": -35.2490348815918, "global_step": 47533, "epoch": 392} {"train_loss": -34.845855712890625, "global_step": 47534, "epoch": 392} {"train_loss": -34.9218864440918, "global_step": 47535, "epoch": 392} {"train_loss": -33.49591064453125, "global_step": 47536, "epoch": 392} {"train_loss": -30.61244010925293, "global_step": 47537, "epoch": 392} {"train_loss": -28.83852195739746, "global_step": 47538, "epoch": 392} {"train_loss": -31.01490592956543, "global_step": 47539, "epoch": 392} {"train_loss": -33.1747932434082, "global_step": 47540, "epoch": 392} {"train_loss": -34.462528228759766, "global_step": 47541, "epoch": 392} {"train_loss": -34.8726921081543, "global_step": 47542, "epoch": 392} {"train_loss": -33.479164123535156, "global_step": 47543, "epoch": 392} {"train_loss": -34.18732452392578, "global_step": 47544, "epoch": 392} {"train_loss": -34.390193939208984, "global_step": 47545, "epoch": 392} {"train_loss": -32.930328369140625, "global_step": 47546, "epoch": 392} {"train_loss": -34.723594665527344, "global_step": 47547, "epoch": 392} {"train_loss": -33.889404296875, "global_step": 47548, "epoch": 392} {"train_loss": -34.0998420715332, "global_step": 47549, "epoch": 392} {"train_loss": -33.931129455566406, "global_step": 47550, "epoch": 392} {"train_loss": -33.486934661865234, "global_step": 47551, "epoch": 392} {"train_loss": -34.131073644338564, "global_step": 47552, "epoch": 392, "val_loss": 2551416.0} {"train_loss": -33.56249237060547, "global_step": 47553, "epoch": 393} {"train_loss": -32.50550079345703, "global_step": 47554, "epoch": 393} {"train_loss": -33.60234069824219, "global_step": 47555, "epoch": 393} {"train_loss": -34.18075180053711, "global_step": 47556, "epoch": 393} {"train_loss": -33.638511657714844, "global_step": 47557, "epoch": 393} {"train_loss": -34.42497253417969, "global_step": 47558, "epoch": 393} {"train_loss": -34.13763427734375, "global_step": 47559, "epoch": 393} {"train_loss": -34.77180099487305, "global_step": 47560, "epoch": 393} {"train_loss": -33.93144607543945, "global_step": 47561, "epoch": 393} {"train_loss": -35.024078369140625, "global_step": 47562, "epoch": 393} {"train_loss": -34.30381393432617, "global_step": 47563, "epoch": 393} {"train_loss": -34.2686767578125, "global_step": 47564, "epoch": 393} {"train_loss": -34.71552658081055, "global_step": 47565, "epoch": 393} {"train_loss": -34.880924224853516, "global_step": 47566, "epoch": 393} {"train_loss": -34.786312103271484, "global_step": 47567, "epoch": 393} {"train_loss": -35.21860885620117, "global_step": 47568, "epoch": 393} {"train_loss": -35.24612045288086, "global_step": 47569, "epoch": 393} {"train_loss": -35.10050582885742, "global_step": 47570, "epoch": 393} {"train_loss": -35.29390335083008, "global_step": 47571, "epoch": 393} {"train_loss": -35.255470275878906, "global_step": 47572, "epoch": 393} {"train_loss": -35.22653579711914, "global_step": 47573, "epoch": 393} {"train_loss": -35.44720458984375, "global_step": 47574, "epoch": 393} {"train_loss": -35.10575485229492, "global_step": 47575, "epoch": 393} {"train_loss": -35.28028106689453, "global_step": 47576, "epoch": 393} {"train_loss": -35.64801788330078, "global_step": 47577, "epoch": 393} {"train_loss": -35.419647216796875, "global_step": 47578, "epoch": 393} {"train_loss": -35.24855422973633, "global_step": 47579, "epoch": 393} {"train_loss": -35.56793212890625, "global_step": 47580, "epoch": 393} {"train_loss": -35.383766174316406, "global_step": 47581, "epoch": 393} {"train_loss": -34.935909271240234, "global_step": 47582, "epoch": 393} {"train_loss": -35.54095458984375, "global_step": 47583, "epoch": 393} {"train_loss": -35.368812561035156, "global_step": 47584, "epoch": 393} {"train_loss": -35.282901763916016, "global_step": 47585, "epoch": 393} {"train_loss": -35.7973747253418, "global_step": 47586, "epoch": 393} {"train_loss": -35.852996826171875, "global_step": 47587, "epoch": 393} {"train_loss": -35.60791015625, "global_step": 47588, "epoch": 393} {"train_loss": -35.90533447265625, "global_step": 47589, "epoch": 393} {"train_loss": -35.65159606933594, "global_step": 47590, "epoch": 393} {"train_loss": -35.548316955566406, "global_step": 47591, "epoch": 393} {"train_loss": -35.47929763793945, "global_step": 47592, "epoch": 393} {"train_loss": -35.41779327392578, "global_step": 47593, "epoch": 393} {"train_loss": -35.7349853515625, "global_step": 47594, "epoch": 393} {"train_loss": -35.84418869018555, "global_step": 47595, "epoch": 393} {"train_loss": -36.24058532714844, "global_step": 47596, "epoch": 393} {"train_loss": -35.586605072021484, "global_step": 47597, "epoch": 393} {"train_loss": -35.813072204589844, "global_step": 47598, "epoch": 393} {"train_loss": -35.24922561645508, "global_step": 47599, "epoch": 393} {"train_loss": -34.1479606628418, "global_step": 47600, "epoch": 393} {"train_loss": -35.376739501953125, "global_step": 47601, "epoch": 393} {"train_loss": -35.1749267578125, "global_step": 47602, "epoch": 393} {"train_loss": -35.512611389160156, "global_step": 47603, "epoch": 393} {"train_loss": -35.117591857910156, "global_step": 47604, "epoch": 393} {"train_loss": -35.56264114379883, "global_step": 47605, "epoch": 393} {"train_loss": -35.45427322387695, "global_step": 47606, "epoch": 393} {"train_loss": -35.76656723022461, "global_step": 47607, "epoch": 393} {"train_loss": -35.09014892578125, "global_step": 47608, "epoch": 393} {"train_loss": -33.44989776611328, "global_step": 47609, "epoch": 393} {"train_loss": -31.173688888549805, "global_step": 47610, "epoch": 393} {"train_loss": -33.16625213623047, "global_step": 47611, "epoch": 393} {"train_loss": -34.315982818603516, "global_step": 47612, "epoch": 393} {"train_loss": -34.517879486083984, "global_step": 47613, "epoch": 393} {"train_loss": -34.00299835205078, "global_step": 47614, "epoch": 393} {"train_loss": -34.329586029052734, "global_step": 47615, "epoch": 393} {"train_loss": -34.2242317199707, "global_step": 47616, "epoch": 393} {"train_loss": -33.089351654052734, "global_step": 47617, "epoch": 393} {"train_loss": -33.762638092041016, "global_step": 47618, "epoch": 393} {"train_loss": -32.97157669067383, "global_step": 47619, "epoch": 393} {"train_loss": -33.85165023803711, "global_step": 47620, "epoch": 393} {"train_loss": -33.4886589050293, "global_step": 47621, "epoch": 393} {"train_loss": -33.53718185424805, "global_step": 47622, "epoch": 393} {"train_loss": -34.80128860473633, "global_step": 47623, "epoch": 393} {"train_loss": -34.07235336303711, "global_step": 47624, "epoch": 393} {"train_loss": -33.401214599609375, "global_step": 47625, "epoch": 393} {"train_loss": -35.157814025878906, "global_step": 47626, "epoch": 393} {"train_loss": -33.12886047363281, "global_step": 47627, "epoch": 393} {"train_loss": -30.83942222595215, "global_step": 47628, "epoch": 393} {"train_loss": -34.241634368896484, "global_step": 47629, "epoch": 393} {"train_loss": -34.35599899291992, "global_step": 47630, "epoch": 393} {"train_loss": -33.595062255859375, "global_step": 47631, "epoch": 393} {"train_loss": -33.53462600708008, "global_step": 47632, "epoch": 393} {"train_loss": -35.53985595703125, "global_step": 47633, "epoch": 393} {"train_loss": -34.44442367553711, "global_step": 47634, "epoch": 393} {"train_loss": -34.362823486328125, "global_step": 47635, "epoch": 393} {"train_loss": -34.86865997314453, "global_step": 47636, "epoch": 393} {"train_loss": -34.73337936401367, "global_step": 47637, "epoch": 393} {"train_loss": -34.98331832885742, "global_step": 47638, "epoch": 393} {"train_loss": -34.62750244140625, "global_step": 47639, "epoch": 393} {"train_loss": -34.82894515991211, "global_step": 47640, "epoch": 393} {"train_loss": -32.62822341918945, "global_step": 47641, "epoch": 393} {"train_loss": -34.70096969604492, "global_step": 47642, "epoch": 393} {"train_loss": -34.4421272277832, "global_step": 47643, "epoch": 393} {"train_loss": -34.64828109741211, "global_step": 47644, "epoch": 393} {"train_loss": -34.148189544677734, "global_step": 47645, "epoch": 393} {"train_loss": -33.52882385253906, "global_step": 47646, "epoch": 393} {"train_loss": -32.67137908935547, "global_step": 47647, "epoch": 393} {"train_loss": -34.49332809448242, "global_step": 47648, "epoch": 393} {"train_loss": -33.5363883972168, "global_step": 47649, "epoch": 393} {"train_loss": -33.167442321777344, "global_step": 47650, "epoch": 393} {"train_loss": -33.86463165283203, "global_step": 47651, "epoch": 393} {"train_loss": -34.472408294677734, "global_step": 47652, "epoch": 393} {"train_loss": -34.852325439453125, "global_step": 47653, "epoch": 393} {"train_loss": -34.01551818847656, "global_step": 47654, "epoch": 393} {"train_loss": -34.021514892578125, "global_step": 47655, "epoch": 393} {"train_loss": -33.67097091674805, "global_step": 47656, "epoch": 393} {"train_loss": -34.87775802612305, "global_step": 47657, "epoch": 393} {"train_loss": -33.0585823059082, "global_step": 47658, "epoch": 393} {"train_loss": -33.333709716796875, "global_step": 47659, "epoch": 393} {"train_loss": -33.73884963989258, "global_step": 47660, "epoch": 393} {"train_loss": -34.624427795410156, "global_step": 47661, "epoch": 393} {"train_loss": -32.85702133178711, "global_step": 47662, "epoch": 393} {"train_loss": -33.8302001953125, "global_step": 47663, "epoch": 393} {"train_loss": -34.74325180053711, "global_step": 47664, "epoch": 393} {"train_loss": -33.42057418823242, "global_step": 47665, "epoch": 393} {"train_loss": -34.64918518066406, "global_step": 47666, "epoch": 393} {"train_loss": -33.094703674316406, "global_step": 47667, "epoch": 393} {"train_loss": -34.44338607788086, "global_step": 47668, "epoch": 393} {"train_loss": -34.2797737121582, "global_step": 47669, "epoch": 393} {"train_loss": -33.563270568847656, "global_step": 47670, "epoch": 393} {"train_loss": -33.83567428588867, "global_step": 47671, "epoch": 393} {"train_loss": -33.8637580871582, "global_step": 47672, "epoch": 393} {"train_loss": -34.46139195339739, "global_step": 47673, "epoch": 393, "val_loss": 2496183.75} {"train_loss": -34.01999282836914, "global_step": 47674, "epoch": 394} {"train_loss": -34.9012565612793, "global_step": 47675, "epoch": 394} {"train_loss": -34.08871841430664, "global_step": 47676, "epoch": 394} {"train_loss": -34.1148796081543, "global_step": 47677, "epoch": 394} {"train_loss": -34.15393829345703, "global_step": 47678, "epoch": 394} {"train_loss": -33.47365951538086, "global_step": 47679, "epoch": 394} {"train_loss": -32.72907638549805, "global_step": 47680, "epoch": 394} {"train_loss": -34.65574264526367, "global_step": 47681, "epoch": 394} {"train_loss": -33.92756271362305, "global_step": 47682, "epoch": 394} {"train_loss": -33.222312927246094, "global_step": 47683, "epoch": 394} {"train_loss": -34.62665939331055, "global_step": 47684, "epoch": 394} {"train_loss": -34.448665618896484, "global_step": 47685, "epoch": 394} {"train_loss": -34.2018928527832, "global_step": 47686, "epoch": 394} {"train_loss": -34.536251068115234, "global_step": 47687, "epoch": 394} {"train_loss": -34.313743591308594, "global_step": 47688, "epoch": 394} {"train_loss": -34.21216583251953, "global_step": 47689, "epoch": 394} {"train_loss": -33.683197021484375, "global_step": 47690, "epoch": 394} {"train_loss": -34.30611038208008, "global_step": 47691, "epoch": 394} {"train_loss": -33.738250732421875, "global_step": 47692, "epoch": 394} {"train_loss": -33.24116134643555, "global_step": 47693, "epoch": 394} {"train_loss": -30.926420211791992, "global_step": 47694, "epoch": 394} {"train_loss": -30.333728790283203, "global_step": 47695, "epoch": 394} {"train_loss": -30.78724479675293, "global_step": 47696, "epoch": 394} {"train_loss": -27.818836212158203, "global_step": 47697, "epoch": 394} {"train_loss": -33.43817138671875, "global_step": 47698, "epoch": 394} {"train_loss": -29.319732666015625, "global_step": 47699, "epoch": 394} {"train_loss": -30.801197052001953, "global_step": 47700, "epoch": 394} {"train_loss": -32.20587921142578, "global_step": 47701, "epoch": 394} {"train_loss": -31.954792022705078, "global_step": 47702, "epoch": 394} {"train_loss": -32.9919548034668, "global_step": 47703, "epoch": 394} {"train_loss": -34.025917053222656, "global_step": 47704, "epoch": 394} {"train_loss": -33.222442626953125, "global_step": 47705, "epoch": 394} {"train_loss": -33.054046630859375, "global_step": 47706, "epoch": 394} {"train_loss": -32.91364288330078, "global_step": 47707, "epoch": 394} {"train_loss": -32.923397064208984, "global_step": 47708, "epoch": 394} {"train_loss": -34.42728805541992, "global_step": 47709, "epoch": 394} {"train_loss": -34.35488510131836, "global_step": 47710, "epoch": 394} {"train_loss": -34.542171478271484, "global_step": 47711, "epoch": 394} {"train_loss": -34.182289123535156, "global_step": 47712, "epoch": 394} {"train_loss": -34.372802734375, "global_step": 47713, "epoch": 394} {"train_loss": -34.41450119018555, "global_step": 47714, "epoch": 394} {"train_loss": -34.854339599609375, "global_step": 47715, "epoch": 394} {"train_loss": -34.33357620239258, "global_step": 47716, "epoch": 394} {"train_loss": -34.72175979614258, "global_step": 47717, "epoch": 394} {"train_loss": -35.039737701416016, "global_step": 47718, "epoch": 394} {"train_loss": -34.2221794128418, "global_step": 47719, "epoch": 394} {"train_loss": -34.52093505859375, "global_step": 47720, "epoch": 394} {"train_loss": -35.00764083862305, "global_step": 47721, "epoch": 394} {"train_loss": -33.831111907958984, "global_step": 47722, "epoch": 394} {"train_loss": -33.865272521972656, "global_step": 47723, "epoch": 394} {"train_loss": -34.61092758178711, "global_step": 47724, "epoch": 394} {"train_loss": -34.29342269897461, "global_step": 47725, "epoch": 394} {"train_loss": -35.20676803588867, "global_step": 47726, "epoch": 394} {"train_loss": -34.46366500854492, "global_step": 47727, "epoch": 394} {"train_loss": -34.04447555541992, "global_step": 47728, "epoch": 394} {"train_loss": -34.28243637084961, "global_step": 47729, "epoch": 394} {"train_loss": -34.73439407348633, "global_step": 47730, "epoch": 394} {"train_loss": -34.56119918823242, "global_step": 47731, "epoch": 394} {"train_loss": -34.23590850830078, "global_step": 47732, "epoch": 394} {"train_loss": -35.80597686767578, "global_step": 47733, "epoch": 394} {"train_loss": -34.613548278808594, "global_step": 47734, "epoch": 394} {"train_loss": -34.872657775878906, "global_step": 47735, "epoch": 394} {"train_loss": -35.29032516479492, "global_step": 47736, "epoch": 394} {"train_loss": -34.72760009765625, "global_step": 47737, "epoch": 394} {"train_loss": -35.3005256652832, "global_step": 47738, "epoch": 394} {"train_loss": -35.518062591552734, "global_step": 47739, "epoch": 394} {"train_loss": -35.28678894042969, "global_step": 47740, "epoch": 394} {"train_loss": -35.8350944519043, "global_step": 47741, "epoch": 394} {"train_loss": -35.604671478271484, "global_step": 47742, "epoch": 394} {"train_loss": -35.250457763671875, "global_step": 47743, "epoch": 394} {"train_loss": -35.57038116455078, "global_step": 47744, "epoch": 394} {"train_loss": -35.635677337646484, "global_step": 47745, "epoch": 394} {"train_loss": -35.16118240356445, "global_step": 47746, "epoch": 394} {"train_loss": -34.99946212768555, "global_step": 47747, "epoch": 394} {"train_loss": -36.000179290771484, "global_step": 47748, "epoch": 394} {"train_loss": -35.65938949584961, "global_step": 47749, "epoch": 394} {"train_loss": -35.360958099365234, "global_step": 47750, "epoch": 394} {"train_loss": -35.53084945678711, "global_step": 47751, "epoch": 394} {"train_loss": -35.76810836791992, "global_step": 47752, "epoch": 394} {"train_loss": -35.741695404052734, "global_step": 47753, "epoch": 394} {"train_loss": -34.91376876831055, "global_step": 47754, "epoch": 394} {"train_loss": -35.090721130371094, "global_step": 47755, "epoch": 394} {"train_loss": -33.92471694946289, "global_step": 47756, "epoch": 394} {"train_loss": -32.70376205444336, "global_step": 47757, "epoch": 394} {"train_loss": -30.729360580444336, "global_step": 47758, "epoch": 394} {"train_loss": -31.8712158203125, "global_step": 47759, "epoch": 394} {"train_loss": -31.300886154174805, "global_step": 47760, "epoch": 394} {"train_loss": -33.69472885131836, "global_step": 47761, "epoch": 394} {"train_loss": -33.107696533203125, "global_step": 47762, "epoch": 394} {"train_loss": -33.7890625, "global_step": 47763, "epoch": 394} {"train_loss": -33.291282653808594, "global_step": 47764, "epoch": 394} {"train_loss": -32.62501907348633, "global_step": 47765, "epoch": 394} {"train_loss": -34.19781494140625, "global_step": 47766, "epoch": 394} {"train_loss": -33.30964279174805, "global_step": 47767, "epoch": 394} {"train_loss": -33.564109802246094, "global_step": 47768, "epoch": 394} {"train_loss": -35.6761589050293, "global_step": 47769, "epoch": 394} {"train_loss": -34.76922607421875, "global_step": 47770, "epoch": 394} {"train_loss": -34.79658889770508, "global_step": 47771, "epoch": 394} {"train_loss": -35.42122268676758, "global_step": 47772, "epoch": 394} {"train_loss": -33.66915512084961, "global_step": 47773, "epoch": 394} {"train_loss": -34.08280563354492, "global_step": 47774, "epoch": 394} {"train_loss": -33.5545768737793, "global_step": 47775, "epoch": 394} {"train_loss": -32.94264602661133, "global_step": 47776, "epoch": 394} {"train_loss": -33.89386749267578, "global_step": 47777, "epoch": 394} {"train_loss": -33.4681510925293, "global_step": 47778, "epoch": 394} {"train_loss": -32.914730072021484, "global_step": 47779, "epoch": 394} {"train_loss": -34.43709945678711, "global_step": 47780, "epoch": 394} {"train_loss": -34.09368896484375, "global_step": 47781, "epoch": 394} {"train_loss": -32.209815979003906, "global_step": 47782, "epoch": 394} {"train_loss": -34.21645736694336, "global_step": 47783, "epoch": 394} {"train_loss": -34.6306266784668, "global_step": 47784, "epoch": 394} {"train_loss": -34.63935470581055, "global_step": 47785, "epoch": 394} {"train_loss": -35.0926399230957, "global_step": 47786, "epoch": 394} {"train_loss": -34.958038330078125, "global_step": 47787, "epoch": 394} {"train_loss": -34.82621383666992, "global_step": 47788, "epoch": 394} {"train_loss": -34.69926834106445, "global_step": 47789, "epoch": 394} {"train_loss": -35.05777359008789, "global_step": 47790, "epoch": 394} {"train_loss": -35.42934036254883, "global_step": 47791, "epoch": 394} {"train_loss": -35.43235778808594, "global_step": 47792, "epoch": 394} {"train_loss": -35.51924514770508, "global_step": 47793, "epoch": 394} {"train_loss": -34.056126113765494, "global_step": 47794, "epoch": 394, "val_loss": 2707241.25} {"train_loss": -32.96600341796875, "global_step": 47795, "epoch": 395} {"train_loss": -34.79920196533203, "global_step": 47796, "epoch": 395} {"train_loss": -35.56203842163086, "global_step": 47797, "epoch": 395} {"train_loss": -34.78629684448242, "global_step": 47798, "epoch": 395} {"train_loss": -34.53398132324219, "global_step": 47799, "epoch": 395} {"train_loss": -34.774627685546875, "global_step": 47800, "epoch": 395} {"train_loss": -35.559173583984375, "global_step": 47801, "epoch": 395} {"train_loss": -34.79064178466797, "global_step": 47802, "epoch": 395} {"train_loss": -34.52118682861328, "global_step": 47803, "epoch": 395} {"train_loss": -34.80970001220703, "global_step": 47804, "epoch": 395} {"train_loss": -33.680904388427734, "global_step": 47805, "epoch": 395} {"train_loss": -34.71784591674805, "global_step": 47806, "epoch": 395} {"train_loss": -35.514129638671875, "global_step": 47807, "epoch": 395} {"train_loss": -35.10690689086914, "global_step": 47808, "epoch": 395} {"train_loss": -34.404296875, "global_step": 47809, "epoch": 395} {"train_loss": -35.26423263549805, "global_step": 47810, "epoch": 395} {"train_loss": -34.47835922241211, "global_step": 47811, "epoch": 395} {"train_loss": -34.773109436035156, "global_step": 47812, "epoch": 395} {"train_loss": -34.477291107177734, "global_step": 47813, "epoch": 395} {"train_loss": -34.64482498168945, "global_step": 47814, "epoch": 395} {"train_loss": -35.21796417236328, "global_step": 47815, "epoch": 395} {"train_loss": -35.29061508178711, "global_step": 47816, "epoch": 395} {"train_loss": -35.18830108642578, "global_step": 47817, "epoch": 395} {"train_loss": -35.0407600402832, "global_step": 47818, "epoch": 395} {"train_loss": -34.85200119018555, "global_step": 47819, "epoch": 395} {"train_loss": -34.28940963745117, "global_step": 47820, "epoch": 395} {"train_loss": -35.19409942626953, "global_step": 47821, "epoch": 395} {"train_loss": -34.70261764526367, "global_step": 47822, "epoch": 395} {"train_loss": -34.17862319946289, "global_step": 47823, "epoch": 395} {"train_loss": -34.878944396972656, "global_step": 47824, "epoch": 395} {"train_loss": -32.14091873168945, "global_step": 47825, "epoch": 395} {"train_loss": -34.70778274536133, "global_step": 47826, "epoch": 395} {"train_loss": -35.24248123168945, "global_step": 47827, "epoch": 395} {"train_loss": -34.726356506347656, "global_step": 47828, "epoch": 395} {"train_loss": -34.87590789794922, "global_step": 47829, "epoch": 395} {"train_loss": -34.21944808959961, "global_step": 47830, "epoch": 395} {"train_loss": -34.2129020690918, "global_step": 47831, "epoch": 395} {"train_loss": -33.9832763671875, "global_step": 47832, "epoch": 395} {"train_loss": -34.21614456176758, "global_step": 47833, "epoch": 395} {"train_loss": -35.29962158203125, "global_step": 47834, "epoch": 395} {"train_loss": -33.696868896484375, "global_step": 47835, "epoch": 395} {"train_loss": -34.770599365234375, "global_step": 47836, "epoch": 395} {"train_loss": -34.180519104003906, "global_step": 47837, "epoch": 395} {"train_loss": -34.938961029052734, "global_step": 47838, "epoch": 395} {"train_loss": -33.57971954345703, "global_step": 47839, "epoch": 395} {"train_loss": -33.646034240722656, "global_step": 47840, "epoch": 395} {"train_loss": -34.02272415161133, "global_step": 47841, "epoch": 395} {"train_loss": -33.74748611450195, "global_step": 47842, "epoch": 395} {"train_loss": -34.56856155395508, "global_step": 47843, "epoch": 395} {"train_loss": -32.87156295776367, "global_step": 47844, "epoch": 395} {"train_loss": -34.55302047729492, "global_step": 47845, "epoch": 395} {"train_loss": -33.074214935302734, "global_step": 47846, "epoch": 395} {"train_loss": -33.57918167114258, "global_step": 47847, "epoch": 395} {"train_loss": -34.301822662353516, "global_step": 47848, "epoch": 395} {"train_loss": -33.89631271362305, "global_step": 47849, "epoch": 395} {"train_loss": -32.83740997314453, "global_step": 47850, "epoch": 395} {"train_loss": -34.123897552490234, "global_step": 47851, "epoch": 395} {"train_loss": -34.165313720703125, "global_step": 47852, "epoch": 395} {"train_loss": -34.583248138427734, "global_step": 47853, "epoch": 395} {"train_loss": -31.3620548248291, "global_step": 47854, "epoch": 395} {"train_loss": -31.89443016052246, "global_step": 47855, "epoch": 395} {"train_loss": -32.49037170410156, "global_step": 47856, "epoch": 395} {"train_loss": -34.38759231567383, "global_step": 47857, "epoch": 395} {"train_loss": -34.3795166015625, "global_step": 47858, "epoch": 395} {"train_loss": -34.130062103271484, "global_step": 47859, "epoch": 395} {"train_loss": -33.4491081237793, "global_step": 47860, "epoch": 395} {"train_loss": -33.44647979736328, "global_step": 47861, "epoch": 395} {"train_loss": -34.27497482299805, "global_step": 47862, "epoch": 395} {"train_loss": -34.607845306396484, "global_step": 47863, "epoch": 395} {"train_loss": -34.499351501464844, "global_step": 47864, "epoch": 395} {"train_loss": -34.6889762878418, "global_step": 47865, "epoch": 395} {"train_loss": -34.77492141723633, "global_step": 47866, "epoch": 395} {"train_loss": -34.11027145385742, "global_step": 47867, "epoch": 395} {"train_loss": -34.42631149291992, "global_step": 47868, "epoch": 395} {"train_loss": -35.04902267456055, "global_step": 47869, "epoch": 395} {"train_loss": -34.710670471191406, "global_step": 47870, "epoch": 395} {"train_loss": -34.61470031738281, "global_step": 47871, "epoch": 395} {"train_loss": -34.81337356567383, "global_step": 47872, "epoch": 395} {"train_loss": -34.33280944824219, "global_step": 47873, "epoch": 395} {"train_loss": -34.84322738647461, "global_step": 47874, "epoch": 395} {"train_loss": -35.08870315551758, "global_step": 47875, "epoch": 395} {"train_loss": -34.65328598022461, "global_step": 47876, "epoch": 395} {"train_loss": -35.2811164855957, "global_step": 47877, "epoch": 395} {"train_loss": -34.876564025878906, "global_step": 47878, "epoch": 395} {"train_loss": -34.51626968383789, "global_step": 47879, "epoch": 395} {"train_loss": -34.979347229003906, "global_step": 47880, "epoch": 395} {"train_loss": -35.455848693847656, "global_step": 47881, "epoch": 395} {"train_loss": -34.66781234741211, "global_step": 47882, "epoch": 395} {"train_loss": -35.12506866455078, "global_step": 47883, "epoch": 395} {"train_loss": -35.36854934692383, "global_step": 47884, "epoch": 395} {"train_loss": -34.688106536865234, "global_step": 47885, "epoch": 395} {"train_loss": -34.82633590698242, "global_step": 47886, "epoch": 395} {"train_loss": -35.05588150024414, "global_step": 47887, "epoch": 395} {"train_loss": -34.981895446777344, "global_step": 47888, "epoch": 395} {"train_loss": -35.717403411865234, "global_step": 47889, "epoch": 395} {"train_loss": -35.19843673706055, "global_step": 47890, "epoch": 395} {"train_loss": -35.425071716308594, "global_step": 47891, "epoch": 395} {"train_loss": -34.97360610961914, "global_step": 47892, "epoch": 395} {"train_loss": -34.09942626953125, "global_step": 47893, "epoch": 395} {"train_loss": -31.8985595703125, "global_step": 47894, "epoch": 395} {"train_loss": -30.68476676940918, "global_step": 47895, "epoch": 395} {"train_loss": -30.956756591796875, "global_step": 47896, "epoch": 395} {"train_loss": -31.5943660736084, "global_step": 47897, "epoch": 395} {"train_loss": -33.917842864990234, "global_step": 47898, "epoch": 395} {"train_loss": -32.95691680908203, "global_step": 47899, "epoch": 395} {"train_loss": -32.476318359375, "global_step": 47900, "epoch": 395} {"train_loss": -33.920467376708984, "global_step": 47901, "epoch": 395} {"train_loss": -34.40349197387695, "global_step": 47902, "epoch": 395} {"train_loss": -34.26231002807617, "global_step": 47903, "epoch": 395} {"train_loss": -35.349769592285156, "global_step": 47904, "epoch": 395} {"train_loss": -34.216522216796875, "global_step": 47905, "epoch": 395} {"train_loss": -35.376827239990234, "global_step": 47906, "epoch": 395} {"train_loss": -35.39509582519531, "global_step": 47907, "epoch": 395} {"train_loss": -34.34177780151367, "global_step": 47908, "epoch": 395} {"train_loss": -33.83066940307617, "global_step": 47909, "epoch": 395} {"train_loss": -35.1050910949707, "global_step": 47910, "epoch": 395} {"train_loss": -33.729000091552734, "global_step": 47911, "epoch": 395} {"train_loss": -34.06658172607422, "global_step": 47912, "epoch": 395} {"train_loss": -32.92488479614258, "global_step": 47913, "epoch": 395} {"train_loss": -34.90447235107422, "global_step": 47914, "epoch": 395} {"train_loss": -34.313000261291, "global_step": 47915, "epoch": 395, "val_loss": 2588743.0} {"train_loss": -34.96842575073242, "global_step": 47916, "epoch": 396} {"train_loss": -34.845672607421875, "global_step": 47917, "epoch": 396} {"train_loss": -32.6484375, "global_step": 47918, "epoch": 396} {"train_loss": -34.899715423583984, "global_step": 47919, "epoch": 396} {"train_loss": -34.67799758911133, "global_step": 47920, "epoch": 396} {"train_loss": -34.798194885253906, "global_step": 47921, "epoch": 396} {"train_loss": -34.009578704833984, "global_step": 47922, "epoch": 396} {"train_loss": -33.30728530883789, "global_step": 47923, "epoch": 396} {"train_loss": -34.0812873840332, "global_step": 47924, "epoch": 396} {"train_loss": -34.80401611328125, "global_step": 47925, "epoch": 396} {"train_loss": -34.725826263427734, "global_step": 47926, "epoch": 396} {"train_loss": -33.76064682006836, "global_step": 47927, "epoch": 396} {"train_loss": -34.52724075317383, "global_step": 47928, "epoch": 396} {"train_loss": -35.021060943603516, "global_step": 47929, "epoch": 396} {"train_loss": -34.51137924194336, "global_step": 47930, "epoch": 396} {"train_loss": -34.22298812866211, "global_step": 47931, "epoch": 396} {"train_loss": -35.003944396972656, "global_step": 47932, "epoch": 396} {"train_loss": -34.312801361083984, "global_step": 47933, "epoch": 396} {"train_loss": -34.529109954833984, "global_step": 47934, "epoch": 396} {"train_loss": -34.4721565246582, "global_step": 47935, "epoch": 396} {"train_loss": -34.90930938720703, "global_step": 47936, "epoch": 396} {"train_loss": -34.42715072631836, "global_step": 47937, "epoch": 396} {"train_loss": -34.81307601928711, "global_step": 47938, "epoch": 396} {"train_loss": -35.46885299682617, "global_step": 47939, "epoch": 396} {"train_loss": -35.534236907958984, "global_step": 47940, "epoch": 396} {"train_loss": -35.04136276245117, "global_step": 47941, "epoch": 396} {"train_loss": -35.648719787597656, "global_step": 47942, "epoch": 396} {"train_loss": -35.06007766723633, "global_step": 47943, "epoch": 396} {"train_loss": -34.87576675415039, "global_step": 47944, "epoch": 396} {"train_loss": -34.48781967163086, "global_step": 47945, "epoch": 396} {"train_loss": -34.64264678955078, "global_step": 47946, "epoch": 396} {"train_loss": -35.199623107910156, "global_step": 47947, "epoch": 396} {"train_loss": -34.761863708496094, "global_step": 47948, "epoch": 396} {"train_loss": -34.75436019897461, "global_step": 47949, "epoch": 396} {"train_loss": -32.5439567565918, "global_step": 47950, "epoch": 396} {"train_loss": -30.784133911132812, "global_step": 47951, "epoch": 396} {"train_loss": -29.510793685913086, "global_step": 47952, "epoch": 396} {"train_loss": -31.2716007232666, "global_step": 47953, "epoch": 396} {"train_loss": -34.056488037109375, "global_step": 47954, "epoch": 396} {"train_loss": -34.11138153076172, "global_step": 47955, "epoch": 396} {"train_loss": -32.31964111328125, "global_step": 47956, "epoch": 396} {"train_loss": -34.108760833740234, "global_step": 47957, "epoch": 396} {"train_loss": -33.955753326416016, "global_step": 47958, "epoch": 396} {"train_loss": -33.153133392333984, "global_step": 47959, "epoch": 396} {"train_loss": -34.41953659057617, "global_step": 47960, "epoch": 396} {"train_loss": -31.840436935424805, "global_step": 47961, "epoch": 396} {"train_loss": -29.42179298400879, "global_step": 47962, "epoch": 396} {"train_loss": -31.979772567749023, "global_step": 47963, "epoch": 396} {"train_loss": -34.04994583129883, "global_step": 47964, "epoch": 396} {"train_loss": -33.80044174194336, "global_step": 47965, "epoch": 396} {"train_loss": -33.39244079589844, "global_step": 47966, "epoch": 396} {"train_loss": -32.99959945678711, "global_step": 47967, "epoch": 396} {"train_loss": -33.787353515625, "global_step": 47968, "epoch": 396} {"train_loss": -34.335079193115234, "global_step": 47969, "epoch": 396} {"train_loss": -34.62377166748047, "global_step": 47970, "epoch": 396} {"train_loss": -34.18378448486328, "global_step": 47971, "epoch": 396} {"train_loss": -34.08078384399414, "global_step": 47972, "epoch": 396} {"train_loss": -34.2899284362793, "global_step": 47973, "epoch": 396} {"train_loss": -33.99848175048828, "global_step": 47974, "epoch": 396} {"train_loss": -34.672969818115234, "global_step": 47975, "epoch": 396} {"train_loss": -34.40731430053711, "global_step": 47976, "epoch": 396} {"train_loss": -34.3693733215332, "global_step": 47977, "epoch": 396} {"train_loss": -34.704811096191406, "global_step": 47978, "epoch": 396} {"train_loss": -34.88605880737305, "global_step": 47979, "epoch": 396} {"train_loss": -34.56636428833008, "global_step": 47980, "epoch": 396} {"train_loss": -34.83718490600586, "global_step": 47981, "epoch": 396} {"train_loss": -35.093929290771484, "global_step": 47982, "epoch": 396} {"train_loss": -35.17938995361328, "global_step": 47983, "epoch": 396} {"train_loss": -34.45768356323242, "global_step": 47984, "epoch": 396} {"train_loss": -34.5084114074707, "global_step": 47985, "epoch": 396} {"train_loss": -35.000526428222656, "global_step": 47986, "epoch": 396} {"train_loss": -34.84086227416992, "global_step": 47987, "epoch": 396} {"train_loss": -34.77498245239258, "global_step": 47988, "epoch": 396} {"train_loss": -35.136810302734375, "global_step": 47989, "epoch": 396} {"train_loss": -35.225433349609375, "global_step": 47990, "epoch": 396} {"train_loss": -34.90373611450195, "global_step": 47991, "epoch": 396} {"train_loss": -34.083763122558594, "global_step": 47992, "epoch": 396} {"train_loss": -35.22417068481445, "global_step": 47993, "epoch": 396} {"train_loss": -35.617820739746094, "global_step": 47994, "epoch": 396} {"train_loss": -35.15116500854492, "global_step": 47995, "epoch": 396} {"train_loss": -35.260231018066406, "global_step": 47996, "epoch": 396} {"train_loss": -34.73463821411133, "global_step": 47997, "epoch": 396} {"train_loss": -35.430335998535156, "global_step": 47998, "epoch": 396} {"train_loss": -35.37785720825195, "global_step": 47999, "epoch": 396} {"train_loss": -35.62656784057617, "global_step": 48000, "epoch": 396} {"train_loss": -35.857967376708984, "global_step": 48001, "epoch": 396} {"train_loss": -36.03591537475586, "global_step": 48002, "epoch": 396} {"train_loss": -35.67704772949219, "global_step": 48003, "epoch": 396} {"train_loss": -35.432716369628906, "global_step": 48004, "epoch": 396} {"train_loss": -35.62974166870117, "global_step": 48005, "epoch": 396} {"train_loss": -35.705177307128906, "global_step": 48006, "epoch": 396} {"train_loss": -36.05807113647461, "global_step": 48007, "epoch": 396} {"train_loss": -35.602394104003906, "global_step": 48008, "epoch": 396} {"train_loss": -35.86593246459961, "global_step": 48009, "epoch": 396} {"train_loss": -36.107601165771484, "global_step": 48010, "epoch": 396} {"train_loss": -36.26779556274414, "global_step": 48011, "epoch": 396} {"train_loss": -35.8905029296875, "global_step": 48012, "epoch": 396} {"train_loss": -36.437705993652344, "global_step": 48013, "epoch": 396} {"train_loss": -36.34172439575195, "global_step": 48014, "epoch": 396} {"train_loss": -36.11747360229492, "global_step": 48015, "epoch": 396} {"train_loss": -35.954097747802734, "global_step": 48016, "epoch": 396} {"train_loss": -36.09815979003906, "global_step": 48017, "epoch": 396} {"train_loss": -36.06289291381836, "global_step": 48018, "epoch": 396} {"train_loss": -35.21699142456055, "global_step": 48019, "epoch": 396} {"train_loss": -35.635276794433594, "global_step": 48020, "epoch": 396} {"train_loss": -34.43001174926758, "global_step": 48021, "epoch": 396} {"train_loss": -31.852609634399414, "global_step": 48022, "epoch": 396} {"train_loss": -27.9405460357666, "global_step": 48023, "epoch": 396} {"train_loss": -13.861777305603027, "global_step": 48024, "epoch": 396} {"train_loss": 0.3186963200569153, "global_step": 48025, "epoch": 396} {"train_loss": -24.85883903503418, "global_step": 48026, "epoch": 396} {"train_loss": -26.05011558532715, "global_step": 48027, "epoch": 396} {"train_loss": -30.8387508392334, "global_step": 48028, "epoch": 396} {"train_loss": -24.74711036682129, "global_step": 48029, "epoch": 396} {"train_loss": -33.31191635131836, "global_step": 48030, "epoch": 396} {"train_loss": -27.87043571472168, "global_step": 48031, "epoch": 396} {"train_loss": -30.048980712890625, "global_step": 48032, "epoch": 396} {"train_loss": -33.686988830566406, "global_step": 48033, "epoch": 396} {"train_loss": -31.080093383789062, "global_step": 48034, "epoch": 396} {"train_loss": -31.330835342407227, "global_step": 48035, "epoch": 396} {"train_loss": -33.60473891082874, "global_step": 48036, "epoch": 396, "val_loss": 2567990.25} {"train_loss": -33.88874053955078, "global_step": 48037, "epoch": 397} {"train_loss": -32.38142776489258, "global_step": 48038, "epoch": 397} {"train_loss": -32.63485336303711, "global_step": 48039, "epoch": 397} {"train_loss": -33.29864501953125, "global_step": 48040, "epoch": 397} {"train_loss": -34.248897552490234, "global_step": 48041, "epoch": 397} {"train_loss": -34.5026969909668, "global_step": 48042, "epoch": 397} {"train_loss": -33.40499496459961, "global_step": 48043, "epoch": 397} {"train_loss": -33.59873580932617, "global_step": 48044, "epoch": 397} {"train_loss": -33.79825973510742, "global_step": 48045, "epoch": 397} {"train_loss": -34.413291931152344, "global_step": 48046, "epoch": 397} {"train_loss": -34.0179328918457, "global_step": 48047, "epoch": 397} {"train_loss": -34.41748809814453, "global_step": 48048, "epoch": 397} {"train_loss": -34.05190658569336, "global_step": 48049, "epoch": 397} {"train_loss": -33.91865158081055, "global_step": 48050, "epoch": 397} {"train_loss": -34.35784149169922, "global_step": 48051, "epoch": 397} {"train_loss": -34.7144889831543, "global_step": 48052, "epoch": 397} {"train_loss": -34.17365264892578, "global_step": 48053, "epoch": 397} {"train_loss": -34.78579330444336, "global_step": 48054, "epoch": 397} {"train_loss": -34.50821304321289, "global_step": 48055, "epoch": 397} {"train_loss": -34.69036865234375, "global_step": 48056, "epoch": 397} {"train_loss": -34.09415817260742, "global_step": 48057, "epoch": 397} {"train_loss": -35.305015563964844, "global_step": 48058, "epoch": 397} {"train_loss": -34.697811126708984, "global_step": 48059, "epoch": 397} {"train_loss": -35.179298400878906, "global_step": 48060, "epoch": 397} {"train_loss": -35.18128967285156, "global_step": 48061, "epoch": 397} {"train_loss": -35.05111312866211, "global_step": 48062, "epoch": 397} {"train_loss": -35.24419021606445, "global_step": 48063, "epoch": 397} {"train_loss": -35.04323959350586, "global_step": 48064, "epoch": 397} {"train_loss": -35.18388748168945, "global_step": 48065, "epoch": 397} {"train_loss": -34.989990234375, "global_step": 48066, "epoch": 397} {"train_loss": -34.96743392944336, "global_step": 48067, "epoch": 397} {"train_loss": -35.141475677490234, "global_step": 48068, "epoch": 397} {"train_loss": -35.04104995727539, "global_step": 48069, "epoch": 397} {"train_loss": -35.09137725830078, "global_step": 48070, "epoch": 397} {"train_loss": -35.1959342956543, "global_step": 48071, "epoch": 397} {"train_loss": -34.55171585083008, "global_step": 48072, "epoch": 397} {"train_loss": -34.612369537353516, "global_step": 48073, "epoch": 397} {"train_loss": -35.02451705932617, "global_step": 48074, "epoch": 397} {"train_loss": -34.96385955810547, "global_step": 48075, "epoch": 397} {"train_loss": -35.06241989135742, "global_step": 48076, "epoch": 397} {"train_loss": -35.10612869262695, "global_step": 48077, "epoch": 397} {"train_loss": -34.400047302246094, "global_step": 48078, "epoch": 397} {"train_loss": -33.54567337036133, "global_step": 48079, "epoch": 397} {"train_loss": -31.952306747436523, "global_step": 48080, "epoch": 397} {"train_loss": -32.180843353271484, "global_step": 48081, "epoch": 397} {"train_loss": -32.31555938720703, "global_step": 48082, "epoch": 397} {"train_loss": -34.89068603515625, "global_step": 48083, "epoch": 397} {"train_loss": -34.034481048583984, "global_step": 48084, "epoch": 397} {"train_loss": -34.4068489074707, "global_step": 48085, "epoch": 397} {"train_loss": -34.696407318115234, "global_step": 48086, "epoch": 397} {"train_loss": -34.76364517211914, "global_step": 48087, "epoch": 397} {"train_loss": -34.47169876098633, "global_step": 48088, "epoch": 397} {"train_loss": -34.887386322021484, "global_step": 48089, "epoch": 397} {"train_loss": -34.3014030456543, "global_step": 48090, "epoch": 397} {"train_loss": -34.485904693603516, "global_step": 48091, "epoch": 397} {"train_loss": -34.00786209106445, "global_step": 48092, "epoch": 397} {"train_loss": -33.92557907104492, "global_step": 48093, "epoch": 397} {"train_loss": -34.93244934082031, "global_step": 48094, "epoch": 397} {"train_loss": -34.75971603393555, "global_step": 48095, "epoch": 397} {"train_loss": -35.0513801574707, "global_step": 48096, "epoch": 397} {"train_loss": -34.466331481933594, "global_step": 48097, "epoch": 397} {"train_loss": -35.34091567993164, "global_step": 48098, "epoch": 397} {"train_loss": -35.143760681152344, "global_step": 48099, "epoch": 397} {"train_loss": -35.44275665283203, "global_step": 48100, "epoch": 397} {"train_loss": -35.414974212646484, "global_step": 48101, "epoch": 397} {"train_loss": -34.79277038574219, "global_step": 48102, "epoch": 397} {"train_loss": -34.991512298583984, "global_step": 48103, "epoch": 397} {"train_loss": -34.30501937866211, "global_step": 48104, "epoch": 397} {"train_loss": -34.640506744384766, "global_step": 48105, "epoch": 397} {"train_loss": -34.95000076293945, "global_step": 48106, "epoch": 397} {"train_loss": -34.10392761230469, "global_step": 48107, "epoch": 397} {"train_loss": -33.85596466064453, "global_step": 48108, "epoch": 397} {"train_loss": -34.27784729003906, "global_step": 48109, "epoch": 397} {"train_loss": -34.04076385498047, "global_step": 48110, "epoch": 397} {"train_loss": -33.4450798034668, "global_step": 48111, "epoch": 397} {"train_loss": -32.104705810546875, "global_step": 48112, "epoch": 397} {"train_loss": -31.625410079956055, "global_step": 48113, "epoch": 397} {"train_loss": -33.00736618041992, "global_step": 48114, "epoch": 397} {"train_loss": -34.588050842285156, "global_step": 48115, "epoch": 397} {"train_loss": -33.58382797241211, "global_step": 48116, "epoch": 397} {"train_loss": -34.00617218017578, "global_step": 48117, "epoch": 397} {"train_loss": -35.04740524291992, "global_step": 48118, "epoch": 397} {"train_loss": -34.86848831176758, "global_step": 48119, "epoch": 397} {"train_loss": -34.42573547363281, "global_step": 48120, "epoch": 397} {"train_loss": -35.138092041015625, "global_step": 48121, "epoch": 397} {"train_loss": -34.92995834350586, "global_step": 48122, "epoch": 397} {"train_loss": -35.235443115234375, "global_step": 48123, "epoch": 397} {"train_loss": -34.502925872802734, "global_step": 48124, "epoch": 397} {"train_loss": -34.56171417236328, "global_step": 48125, "epoch": 397} {"train_loss": -34.64047622680664, "global_step": 48126, "epoch": 397} {"train_loss": -34.80986404418945, "global_step": 48127, "epoch": 397} {"train_loss": -34.99723434448242, "global_step": 48128, "epoch": 397} {"train_loss": -35.24516677856445, "global_step": 48129, "epoch": 397} {"train_loss": -34.82902145385742, "global_step": 48130, "epoch": 397} {"train_loss": -34.4012336730957, "global_step": 48131, "epoch": 397} {"train_loss": -34.7374153137207, "global_step": 48132, "epoch": 397} {"train_loss": -35.36269760131836, "global_step": 48133, "epoch": 397} {"train_loss": -35.260101318359375, "global_step": 48134, "epoch": 397} {"train_loss": -35.204994201660156, "global_step": 48135, "epoch": 397} {"train_loss": -34.70815658569336, "global_step": 48136, "epoch": 397} {"train_loss": -34.724178314208984, "global_step": 48137, "epoch": 397} {"train_loss": -35.474971771240234, "global_step": 48138, "epoch": 397} {"train_loss": -35.383056640625, "global_step": 48139, "epoch": 397} {"train_loss": -33.81071472167969, "global_step": 48140, "epoch": 397} {"train_loss": -34.1363525390625, "global_step": 48141, "epoch": 397} {"train_loss": -35.09963607788086, "global_step": 48142, "epoch": 397} {"train_loss": -33.330806732177734, "global_step": 48143, "epoch": 397} {"train_loss": -31.902347564697266, "global_step": 48144, "epoch": 397} {"train_loss": -29.127958297729492, "global_step": 48145, "epoch": 397} {"train_loss": -31.29134178161621, "global_step": 48146, "epoch": 397} {"train_loss": -35.11996078491211, "global_step": 48147, "epoch": 397} {"train_loss": -32.6087760925293, "global_step": 48148, "epoch": 397} {"train_loss": -33.933528900146484, "global_step": 48149, "epoch": 397} {"train_loss": -33.80294418334961, "global_step": 48150, "epoch": 397} {"train_loss": -33.338531494140625, "global_step": 48151, "epoch": 397} {"train_loss": -34.787349700927734, "global_step": 48152, "epoch": 397} {"train_loss": -33.789283752441406, "global_step": 48153, "epoch": 397} {"train_loss": -34.46455001831055, "global_step": 48154, "epoch": 397} {"train_loss": -34.86875534057617, "global_step": 48155, "epoch": 397} {"train_loss": -34.37415313720703, "global_step": 48156, "epoch": 397} {"train_loss": -34.33282379276496, "global_step": 48157, "epoch": 397, "val_loss": 2513983.5} {"train_loss": -34.6368293762207, "global_step": 48158, "epoch": 398} {"train_loss": -34.370452880859375, "global_step": 48159, "epoch": 398} {"train_loss": -34.975746154785156, "global_step": 48160, "epoch": 398} {"train_loss": -34.72118377685547, "global_step": 48161, "epoch": 398} {"train_loss": -34.47062301635742, "global_step": 48162, "epoch": 398} {"train_loss": -34.83895492553711, "global_step": 48163, "epoch": 398} {"train_loss": -34.61747360229492, "global_step": 48164, "epoch": 398} {"train_loss": -34.504798889160156, "global_step": 48165, "epoch": 398} {"train_loss": -34.647274017333984, "global_step": 48166, "epoch": 398} {"train_loss": -35.085567474365234, "global_step": 48167, "epoch": 398} {"train_loss": -34.9644889831543, "global_step": 48168, "epoch": 398} {"train_loss": -34.925960540771484, "global_step": 48169, "epoch": 398} {"train_loss": -35.25864791870117, "global_step": 48170, "epoch": 398} {"train_loss": -35.23661422729492, "global_step": 48171, "epoch": 398} {"train_loss": -34.90720748901367, "global_step": 48172, "epoch": 398} {"train_loss": -35.061119079589844, "global_step": 48173, "epoch": 398} {"train_loss": -34.95055389404297, "global_step": 48174, "epoch": 398} {"train_loss": -33.86798858642578, "global_step": 48175, "epoch": 398} {"train_loss": -35.157752990722656, "global_step": 48176, "epoch": 398} {"train_loss": -35.3643913269043, "global_step": 48177, "epoch": 398} {"train_loss": -33.62538528442383, "global_step": 48178, "epoch": 398} {"train_loss": -33.659942626953125, "global_step": 48179, "epoch": 398} {"train_loss": -34.6723747253418, "global_step": 48180, "epoch": 398} {"train_loss": -34.0087890625, "global_step": 48181, "epoch": 398} {"train_loss": -33.73744583129883, "global_step": 48182, "epoch": 398} {"train_loss": -34.56294631958008, "global_step": 48183, "epoch": 398} {"train_loss": -34.930294036865234, "global_step": 48184, "epoch": 398} {"train_loss": -33.91694259643555, "global_step": 48185, "epoch": 398} {"train_loss": -34.6408576965332, "global_step": 48186, "epoch": 398} {"train_loss": -34.6395378112793, "global_step": 48187, "epoch": 398} {"train_loss": -34.62858963012695, "global_step": 48188, "epoch": 398} {"train_loss": -34.939491271972656, "global_step": 48189, "epoch": 398} {"train_loss": -34.82495880126953, "global_step": 48190, "epoch": 398} {"train_loss": -34.2784423828125, "global_step": 48191, "epoch": 398} {"train_loss": -34.732818603515625, "global_step": 48192, "epoch": 398} {"train_loss": -34.813079833984375, "global_step": 48193, "epoch": 398} {"train_loss": -35.02805709838867, "global_step": 48194, "epoch": 398} {"train_loss": -34.967647552490234, "global_step": 48195, "epoch": 398} {"train_loss": -34.9199104309082, "global_step": 48196, "epoch": 398} {"train_loss": -34.98152160644531, "global_step": 48197, "epoch": 398} {"train_loss": -35.04085159301758, "global_step": 48198, "epoch": 398} {"train_loss": -34.312435150146484, "global_step": 48199, "epoch": 398} {"train_loss": -35.277687072753906, "global_step": 48200, "epoch": 398} {"train_loss": -34.76169967651367, "global_step": 48201, "epoch": 398} {"train_loss": -33.422000885009766, "global_step": 48202, "epoch": 398} {"train_loss": -34.3089714050293, "global_step": 48203, "epoch": 398} {"train_loss": -34.68055725097656, "global_step": 48204, "epoch": 398} {"train_loss": -34.069637298583984, "global_step": 48205, "epoch": 398} {"train_loss": -34.78460693359375, "global_step": 48206, "epoch": 398} {"train_loss": -34.99070358276367, "global_step": 48207, "epoch": 398} {"train_loss": -34.15803146362305, "global_step": 48208, "epoch": 398} {"train_loss": -30.909976959228516, "global_step": 48209, "epoch": 398} {"train_loss": -23.27422523498535, "global_step": 48210, "epoch": 398} {"train_loss": -7.12332010269165, "global_step": 48211, "epoch": 398} {"train_loss": -10.041084289550781, "global_step": 48212, "epoch": 398} {"train_loss": -31.58711051940918, "global_step": 48213, "epoch": 398} {"train_loss": -27.23821449279785, "global_step": 48214, "epoch": 398} {"train_loss": -30.100208282470703, "global_step": 48215, "epoch": 398} {"train_loss": -28.39202308654785, "global_step": 48216, "epoch": 398} {"train_loss": -32.621517181396484, "global_step": 48217, "epoch": 398} {"train_loss": -29.2279052734375, "global_step": 48218, "epoch": 398} {"train_loss": -33.0618896484375, "global_step": 48219, "epoch": 398} {"train_loss": -32.59807586669922, "global_step": 48220, "epoch": 398} {"train_loss": -28.714147567749023, "global_step": 48221, "epoch": 398} {"train_loss": -32.772193908691406, "global_step": 48222, "epoch": 398} {"train_loss": -33.30710220336914, "global_step": 48223, "epoch": 398} {"train_loss": -29.3574161529541, "global_step": 48224, "epoch": 398} {"train_loss": -32.518829345703125, "global_step": 48225, "epoch": 398} {"train_loss": -32.91538619995117, "global_step": 48226, "epoch": 398} {"train_loss": -33.31215286254883, "global_step": 48227, "epoch": 398} {"train_loss": -32.62537384033203, "global_step": 48228, "epoch": 398} {"train_loss": -31.946659088134766, "global_step": 48229, "epoch": 398} {"train_loss": -32.992828369140625, "global_step": 48230, "epoch": 398} {"train_loss": -33.65740203857422, "global_step": 48231, "epoch": 398} {"train_loss": -33.35464859008789, "global_step": 48232, "epoch": 398} {"train_loss": -32.56714630126953, "global_step": 48233, "epoch": 398} {"train_loss": -32.48176193237305, "global_step": 48234, "epoch": 398} {"train_loss": -32.45215606689453, "global_step": 48235, "epoch": 398} {"train_loss": -33.277042388916016, "global_step": 48236, "epoch": 398} {"train_loss": -32.980010986328125, "global_step": 48237, "epoch": 398} {"train_loss": -31.893301010131836, "global_step": 48238, "epoch": 398} {"train_loss": -33.221553802490234, "global_step": 48239, "epoch": 398} {"train_loss": -33.18647384643555, "global_step": 48240, "epoch": 398} {"train_loss": -33.3519287109375, "global_step": 48241, "epoch": 398} {"train_loss": -33.39754867553711, "global_step": 48242, "epoch": 398} {"train_loss": -33.5026741027832, "global_step": 48243, "epoch": 398} {"train_loss": -33.283687591552734, "global_step": 48244, "epoch": 398} {"train_loss": -33.53866195678711, "global_step": 48245, "epoch": 398} {"train_loss": -33.3830680847168, "global_step": 48246, "epoch": 398} {"train_loss": -33.67243957519531, "global_step": 48247, "epoch": 398} {"train_loss": -32.97648239135742, "global_step": 48248, "epoch": 398} {"train_loss": -33.85282516479492, "global_step": 48249, "epoch": 398} {"train_loss": -34.51972579956055, "global_step": 48250, "epoch": 398} {"train_loss": -33.49458694458008, "global_step": 48251, "epoch": 398} {"train_loss": -33.88286209106445, "global_step": 48252, "epoch": 398} {"train_loss": -34.19236755371094, "global_step": 48253, "epoch": 398} {"train_loss": -33.12580108642578, "global_step": 48254, "epoch": 398} {"train_loss": -34.29230880737305, "global_step": 48255, "epoch": 398} {"train_loss": -33.73236083984375, "global_step": 48256, "epoch": 398} {"train_loss": -33.72459030151367, "global_step": 48257, "epoch": 398} {"train_loss": -33.21564865112305, "global_step": 48258, "epoch": 398} {"train_loss": -34.41223907470703, "global_step": 48259, "epoch": 398} {"train_loss": -33.972347259521484, "global_step": 48260, "epoch": 398} {"train_loss": -33.62492752075195, "global_step": 48261, "epoch": 398} {"train_loss": -34.44559860229492, "global_step": 48262, "epoch": 398} {"train_loss": -34.35701370239258, "global_step": 48263, "epoch": 398} {"train_loss": -34.21635818481445, "global_step": 48264, "epoch": 398} {"train_loss": -34.5640754699707, "global_step": 48265, "epoch": 398} {"train_loss": -34.50223922729492, "global_step": 48266, "epoch": 398} {"train_loss": -34.473182678222656, "global_step": 48267, "epoch": 398} {"train_loss": -33.90338897705078, "global_step": 48268, "epoch": 398} {"train_loss": -34.28858184814453, "global_step": 48269, "epoch": 398} {"train_loss": -34.732967376708984, "global_step": 48270, "epoch": 398} {"train_loss": -34.66256332397461, "global_step": 48271, "epoch": 398} {"train_loss": -35.110172271728516, "global_step": 48272, "epoch": 398} {"train_loss": -34.688720703125, "global_step": 48273, "epoch": 398} {"train_loss": -34.28190994262695, "global_step": 48274, "epoch": 398} {"train_loss": -33.24967575073242, "global_step": 48275, "epoch": 398} {"train_loss": -34.60969924926758, "global_step": 48276, "epoch": 398} {"train_loss": -34.53449249267578, "global_step": 48277, "epoch": 398} {"train_loss": -33.26442498214974, "global_step": 48278, "epoch": 398, "val_loss": 2603732.0} {"train_loss": -33.5294075012207, "global_step": 48279, "epoch": 399} {"train_loss": -34.458309173583984, "global_step": 48280, "epoch": 399} {"train_loss": -34.73725509643555, "global_step": 48281, "epoch": 399} {"train_loss": -34.107601165771484, "global_step": 48282, "epoch": 399} {"train_loss": -34.95050811767578, "global_step": 48283, "epoch": 399} {"train_loss": -34.37997055053711, "global_step": 48284, "epoch": 399} {"train_loss": -34.11946105957031, "global_step": 48285, "epoch": 399} {"train_loss": -34.71294021606445, "global_step": 48286, "epoch": 399} {"train_loss": -33.650787353515625, "global_step": 48287, "epoch": 399} {"train_loss": -34.24949264526367, "global_step": 48288, "epoch": 399} {"train_loss": -27.841257095336914, "global_step": 48289, "epoch": 399} {"train_loss": -32.274986267089844, "global_step": 48290, "epoch": 399} {"train_loss": -34.811580657958984, "global_step": 48291, "epoch": 399} {"train_loss": -34.44627380371094, "global_step": 48292, "epoch": 399} {"train_loss": -33.2329216003418, "global_step": 48293, "epoch": 399} {"train_loss": -33.27112579345703, "global_step": 48294, "epoch": 399} {"train_loss": -34.17603302001953, "global_step": 48295, "epoch": 399} {"train_loss": -33.85950469970703, "global_step": 48296, "epoch": 399} {"train_loss": -33.69575500488281, "global_step": 48297, "epoch": 399} {"train_loss": -34.13824462890625, "global_step": 48298, "epoch": 399} {"train_loss": -33.61195373535156, "global_step": 48299, "epoch": 399} {"train_loss": -30.99322509765625, "global_step": 48300, "epoch": 399} {"train_loss": -33.15570068359375, "global_step": 48301, "epoch": 399} {"train_loss": -33.98908615112305, "global_step": 48302, "epoch": 399} {"train_loss": -34.04534912109375, "global_step": 48303, "epoch": 399} {"train_loss": -29.44964599609375, "global_step": 48304, "epoch": 399} {"train_loss": -33.896976470947266, "global_step": 48305, "epoch": 399} {"train_loss": -33.9720344543457, "global_step": 48306, "epoch": 399} {"train_loss": -33.980464935302734, "global_step": 48307, "epoch": 399} {"train_loss": -32.83051300048828, "global_step": 48308, "epoch": 399} {"train_loss": -33.53355407714844, "global_step": 48309, "epoch": 399} {"train_loss": -33.909217834472656, "global_step": 48310, "epoch": 399} {"train_loss": -32.5073356628418, "global_step": 48311, "epoch": 399} {"train_loss": -33.612831115722656, "global_step": 48312, "epoch": 399} {"train_loss": -33.57258605957031, "global_step": 48313, "epoch": 399} {"train_loss": -33.19630813598633, "global_step": 48314, "epoch": 399} {"train_loss": -33.63944625854492, "global_step": 48315, "epoch": 399} {"train_loss": -34.07512664794922, "global_step": 48316, "epoch": 399} {"train_loss": -33.96986770629883, "global_step": 48317, "epoch": 399} {"train_loss": -32.153724670410156, "global_step": 48318, "epoch": 399} {"train_loss": -33.242977142333984, "global_step": 48319, "epoch": 399} {"train_loss": -33.23994827270508, "global_step": 48320, "epoch": 399} {"train_loss": -33.46421432495117, "global_step": 48321, "epoch": 399} {"train_loss": -33.5196533203125, "global_step": 48322, "epoch": 399} {"train_loss": -34.32929229736328, "global_step": 48323, "epoch": 399} {"train_loss": -33.84831619262695, "global_step": 48324, "epoch": 399} {"train_loss": -33.58634567260742, "global_step": 48325, "epoch": 399} {"train_loss": -33.4570426940918, "global_step": 48326, "epoch": 399} {"train_loss": -33.50482940673828, "global_step": 48327, "epoch": 399} {"train_loss": -34.17246627807617, "global_step": 48328, "epoch": 399} {"train_loss": -32.14715576171875, "global_step": 48329, "epoch": 399} {"train_loss": -32.93557357788086, "global_step": 48330, "epoch": 399} {"train_loss": -33.595741271972656, "global_step": 48331, "epoch": 399} {"train_loss": -32.548091888427734, "global_step": 48332, "epoch": 399} {"train_loss": -31.87190055847168, "global_step": 48333, "epoch": 399} {"train_loss": -25.950796127319336, "global_step": 48334, "epoch": 399} {"train_loss": -30.33953857421875, "global_step": 48335, "epoch": 399} {"train_loss": -31.900836944580078, "global_step": 48336, "epoch": 399} {"train_loss": -33.74745559692383, "global_step": 48337, "epoch": 399} {"train_loss": -31.286163330078125, "global_step": 48338, "epoch": 399} {"train_loss": -32.35932540893555, "global_step": 48339, "epoch": 399} {"train_loss": -31.08624267578125, "global_step": 48340, "epoch": 399} {"train_loss": -30.415613174438477, "global_step": 48341, "epoch": 399} {"train_loss": -31.410552978515625, "global_step": 48342, "epoch": 399} {"train_loss": -32.0244026184082, "global_step": 48343, "epoch": 399} {"train_loss": -33.166683197021484, "global_step": 48344, "epoch": 399} {"train_loss": -31.308568954467773, "global_step": 48345, "epoch": 399} {"train_loss": -31.595325469970703, "global_step": 48346, "epoch": 399} {"train_loss": -33.04852294921875, "global_step": 48347, "epoch": 399} {"train_loss": -31.616500854492188, "global_step": 48348, "epoch": 399} {"train_loss": -32.4964599609375, "global_step": 48349, "epoch": 399} {"train_loss": -33.12005615234375, "global_step": 48350, "epoch": 399} {"train_loss": -31.927570343017578, "global_step": 48351, "epoch": 399} {"train_loss": -33.71177291870117, "global_step": 48352, "epoch": 399} {"train_loss": -32.41577911376953, "global_step": 48353, "epoch": 399} {"train_loss": -32.33122253417969, "global_step": 48354, "epoch": 399} {"train_loss": -33.344661712646484, "global_step": 48355, "epoch": 399} {"train_loss": -32.951934814453125, "global_step": 48356, "epoch": 399} {"train_loss": -33.44664001464844, "global_step": 48357, "epoch": 399} {"train_loss": -31.964887619018555, "global_step": 48358, "epoch": 399} {"train_loss": -33.172847747802734, "global_step": 48359, "epoch": 399} {"train_loss": -33.22520065307617, "global_step": 48360, "epoch": 399} {"train_loss": -33.608272552490234, "global_step": 48361, "epoch": 399} {"train_loss": -33.56074142456055, "global_step": 48362, "epoch": 399} {"train_loss": -33.663387298583984, "global_step": 48363, "epoch": 399} {"train_loss": -34.08403778076172, "global_step": 48364, "epoch": 399} {"train_loss": -34.15903854370117, "global_step": 48365, "epoch": 399} {"train_loss": -33.8886604309082, "global_step": 48366, "epoch": 399} {"train_loss": -33.92204666137695, "global_step": 48367, "epoch": 399} {"train_loss": -34.508277893066406, "global_step": 48368, "epoch": 399} {"train_loss": -32.885921478271484, "global_step": 48369, "epoch": 399} {"train_loss": -34.1048469543457, "global_step": 48370, "epoch": 399} {"train_loss": -34.315547943115234, "global_step": 48371, "epoch": 399} {"train_loss": -33.5556755065918, "global_step": 48372, "epoch": 399} {"train_loss": -34.244869232177734, "global_step": 48373, "epoch": 399} {"train_loss": -34.11995315551758, "global_step": 48374, "epoch": 399} {"train_loss": -34.04294967651367, "global_step": 48375, "epoch": 399} {"train_loss": -34.518760681152344, "global_step": 48376, "epoch": 399} {"train_loss": -33.0794563293457, "global_step": 48377, "epoch": 399} {"train_loss": -33.5391845703125, "global_step": 48378, "epoch": 399} {"train_loss": -33.28164291381836, "global_step": 48379, "epoch": 399} {"train_loss": -34.57965087890625, "global_step": 48380, "epoch": 399} {"train_loss": -31.34211540222168, "global_step": 48381, "epoch": 399} {"train_loss": -33.907745361328125, "global_step": 48382, "epoch": 399} {"train_loss": -34.21195602416992, "global_step": 48383, "epoch": 399} {"train_loss": -34.60531234741211, "global_step": 48384, "epoch": 399} {"train_loss": -34.19293975830078, "global_step": 48385, "epoch": 399} {"train_loss": -34.76852035522461, "global_step": 48386, "epoch": 399} {"train_loss": -34.46249771118164, "global_step": 48387, "epoch": 399} {"train_loss": -34.42971420288086, "global_step": 48388, "epoch": 399} {"train_loss": -34.62262725830078, "global_step": 48389, "epoch": 399} {"train_loss": -34.04128646850586, "global_step": 48390, "epoch": 399} {"train_loss": -34.769466400146484, "global_step": 48391, "epoch": 399} {"train_loss": -34.91280746459961, "global_step": 48392, "epoch": 399} {"train_loss": -35.164852142333984, "global_step": 48393, "epoch": 399} {"train_loss": -35.165748596191406, "global_step": 48394, "epoch": 399} {"train_loss": -35.12107467651367, "global_step": 48395, "epoch": 399} {"train_loss": -35.23830032348633, "global_step": 48396, "epoch": 399} {"train_loss": -35.1455078125, "global_step": 48397, "epoch": 399} {"train_loss": -34.9927864074707, "global_step": 48398, "epoch": 399} {"train_loss": -33.368902364053014, "global_step": 48399, "epoch": 399, "val_loss": 2549517.75} {"train_loss": -35.439632415771484, "global_step": 48400, "epoch": 400} {"train_loss": -35.509517669677734, "global_step": 48401, "epoch": 400} {"train_loss": -35.01762008666992, "global_step": 48402, "epoch": 400} {"train_loss": -35.75929641723633, "global_step": 48403, "epoch": 400} {"train_loss": -35.307674407958984, "global_step": 48404, "epoch": 400} {"train_loss": -35.369483947753906, "global_step": 48405, "epoch": 400} {"train_loss": -34.7625732421875, "global_step": 48406, "epoch": 400} {"train_loss": -35.26011276245117, "global_step": 48407, "epoch": 400} {"train_loss": -35.57959747314453, "global_step": 48408, "epoch": 400} {"train_loss": -35.642425537109375, "global_step": 48409, "epoch": 400} {"train_loss": -34.92403793334961, "global_step": 48410, "epoch": 400} {"train_loss": -36.12510299682617, "global_step": 48411, "epoch": 400} {"train_loss": -35.93162155151367, "global_step": 48412, "epoch": 400} {"train_loss": -35.118446350097656, "global_step": 48413, "epoch": 400} {"train_loss": -35.67457962036133, "global_step": 48414, "epoch": 400} {"train_loss": -35.393707275390625, "global_step": 48415, "epoch": 400} {"train_loss": -35.31221389770508, "global_step": 48416, "epoch": 400} {"train_loss": -35.81429672241211, "global_step": 48417, "epoch": 400} {"train_loss": -35.54750442504883, "global_step": 48418, "epoch": 400} {"train_loss": -35.39055252075195, "global_step": 48419, "epoch": 400} {"train_loss": -35.608482360839844, "global_step": 48420, "epoch": 400} {"train_loss": -34.32420349121094, "global_step": 48421, "epoch": 400} {"train_loss": -35.745361328125, "global_step": 48422, "epoch": 400} {"train_loss": -35.54249954223633, "global_step": 48423, "epoch": 400} {"train_loss": -35.29094696044922, "global_step": 48424, "epoch": 400} {"train_loss": -35.365089416503906, "global_step": 48425, "epoch": 400} {"train_loss": -33.79411697387695, "global_step": 48426, "epoch": 400} {"train_loss": -33.95951461791992, "global_step": 48427, "epoch": 400} {"train_loss": -33.986629486083984, "global_step": 48428, "epoch": 400} {"train_loss": -35.10857009887695, "global_step": 48429, "epoch": 400} {"train_loss": -35.64550018310547, "global_step": 48430, "epoch": 400} {"train_loss": -33.9088134765625, "global_step": 48431, "epoch": 400} {"train_loss": -35.000579833984375, "global_step": 48432, "epoch": 400} {"train_loss": -34.661678314208984, "global_step": 48433, "epoch": 400} {"train_loss": -35.130794525146484, "global_step": 48434, "epoch": 400} {"train_loss": -33.97692108154297, "global_step": 48435, "epoch": 400} {"train_loss": -34.3481559753418, "global_step": 48436, "epoch": 400} {"train_loss": -33.4552116394043, "global_step": 48437, "epoch": 400} {"train_loss": -34.59453201293945, "global_step": 48438, "epoch": 400} {"train_loss": -34.47079086303711, "global_step": 48439, "epoch": 400} {"train_loss": -32.98005294799805, "global_step": 48440, "epoch": 400} {"train_loss": -33.28785705566406, "global_step": 48441, "epoch": 400} {"train_loss": -34.01346969604492, "global_step": 48442, "epoch": 400} {"train_loss": -34.312232971191406, "global_step": 48443, "epoch": 400} {"train_loss": -32.532745361328125, "global_step": 48444, "epoch": 400} {"train_loss": -34.51966094970703, "global_step": 48445, "epoch": 400} {"train_loss": -34.70621109008789, "global_step": 48446, "epoch": 400} {"train_loss": -32.99397277832031, "global_step": 48447, "epoch": 400} {"train_loss": -34.12874221801758, "global_step": 48448, "epoch": 400} {"train_loss": -34.62856674194336, "global_step": 48449, "epoch": 400} {"train_loss": -34.908992767333984, "global_step": 48450, "epoch": 400} {"train_loss": -34.391658782958984, "global_step": 48451, "epoch": 400} {"train_loss": -34.535884857177734, "global_step": 48452, "epoch": 400} {"train_loss": -33.63808059692383, "global_step": 48453, "epoch": 400} {"train_loss": -34.44332504272461, "global_step": 48454, "epoch": 400} {"train_loss": -35.301021575927734, "global_step": 48455, "epoch": 400} {"train_loss": -34.060420989990234, "global_step": 48456, "epoch": 400} {"train_loss": -32.83304977416992, "global_step": 48457, "epoch": 400} {"train_loss": -33.61220932006836, "global_step": 48458, "epoch": 400} {"train_loss": -34.97367858886719, "global_step": 48459, "epoch": 400} {"train_loss": -34.623470306396484, "global_step": 48460, "epoch": 400} {"train_loss": -34.671321868896484, "global_step": 48461, "epoch": 400} {"train_loss": -34.915069580078125, "global_step": 48462, "epoch": 400} {"train_loss": -34.63411331176758, "global_step": 48463, "epoch": 400} {"train_loss": -34.886165618896484, "global_step": 48464, "epoch": 400} {"train_loss": -33.90705490112305, "global_step": 48465, "epoch": 400} {"train_loss": -35.57185363769531, "global_step": 48466, "epoch": 400} {"train_loss": -33.5705680847168, "global_step": 48467, "epoch": 400} {"train_loss": -35.130794525146484, "global_step": 48468, "epoch": 400} {"train_loss": -35.19278335571289, "global_step": 48469, "epoch": 400} {"train_loss": -34.83025360107422, "global_step": 48470, "epoch": 400} {"train_loss": -35.099037170410156, "global_step": 48471, "epoch": 400} {"train_loss": -35.541805267333984, "global_step": 48472, "epoch": 400} {"train_loss": -35.05851745605469, "global_step": 48473, "epoch": 400} {"train_loss": -34.9208984375, "global_step": 48474, "epoch": 400} {"train_loss": -35.317298889160156, "global_step": 48475, "epoch": 400} {"train_loss": -35.13008499145508, "global_step": 48476, "epoch": 400} {"train_loss": -35.06876754760742, "global_step": 48477, "epoch": 400} {"train_loss": -35.2080192565918, "global_step": 48478, "epoch": 400} {"train_loss": -35.68911361694336, "global_step": 48479, "epoch": 400} {"train_loss": -35.77307891845703, "global_step": 48480, "epoch": 400} {"train_loss": -35.78345489501953, "global_step": 48481, "epoch": 400} {"train_loss": -35.3625602722168, "global_step": 48482, "epoch": 400} {"train_loss": -34.814727783203125, "global_step": 48483, "epoch": 400} {"train_loss": -35.29637908935547, "global_step": 48484, "epoch": 400} {"train_loss": -35.12824630737305, "global_step": 48485, "epoch": 400} {"train_loss": -34.93858337402344, "global_step": 48486, "epoch": 400} {"train_loss": -34.703861236572266, "global_step": 48487, "epoch": 400} {"train_loss": -34.23515701293945, "global_step": 48488, "epoch": 400} {"train_loss": -34.3384895324707, "global_step": 48489, "epoch": 400} {"train_loss": -35.208168029785156, "global_step": 48490, "epoch": 400} {"train_loss": -35.35385513305664, "global_step": 48491, "epoch": 400} {"train_loss": -34.29777145385742, "global_step": 48492, "epoch": 400} {"train_loss": -34.507041931152344, "global_step": 48493, "epoch": 400} {"train_loss": -34.17551803588867, "global_step": 48494, "epoch": 400} {"train_loss": -33.393028259277344, "global_step": 48495, "epoch": 400} {"train_loss": -32.58797836303711, "global_step": 48496, "epoch": 400} {"train_loss": -32.927085876464844, "global_step": 48497, "epoch": 400} {"train_loss": -35.37360382080078, "global_step": 48498, "epoch": 400} {"train_loss": -34.881587982177734, "global_step": 48499, "epoch": 400} {"train_loss": -32.63990020751953, "global_step": 48500, "epoch": 400} {"train_loss": -31.603790283203125, "global_step": 48501, "epoch": 400} {"train_loss": -34.13444900512695, "global_step": 48502, "epoch": 400} {"train_loss": -35.505165100097656, "global_step": 48503, "epoch": 400} {"train_loss": -32.35734939575195, "global_step": 48504, "epoch": 400} {"train_loss": -30.10205078125, "global_step": 48505, "epoch": 400} {"train_loss": -34.37781524658203, "global_step": 48506, "epoch": 400} {"train_loss": -34.04415512084961, "global_step": 48507, "epoch": 400} {"train_loss": -31.941511154174805, "global_step": 48508, "epoch": 400} {"train_loss": -34.030765533447266, "global_step": 48509, "epoch": 400} {"train_loss": -34.82389450073242, "global_step": 48510, "epoch": 400} {"train_loss": -33.8642578125, "global_step": 48511, "epoch": 400} {"train_loss": -34.42381286621094, "global_step": 48512, "epoch": 400} {"train_loss": -34.63298034667969, "global_step": 48513, "epoch": 400} {"train_loss": -34.3155632019043, "global_step": 48514, "epoch": 400} {"train_loss": -35.378562927246094, "global_step": 48515, "epoch": 400} {"train_loss": -34.01760482788086, "global_step": 48516, "epoch": 400} {"train_loss": -32.52532958984375, "global_step": 48517, "epoch": 400} {"train_loss": -34.59587478637695, "global_step": 48518, "epoch": 400} {"train_loss": -33.77744674682617, "global_step": 48519, "epoch": 400} {"train_loss": -34.57720012507163, "global_step": 48520, "epoch": 400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2524765.25} {"train_loss": -34.19950485229492, "global_step": 48521, "epoch": 401} {"train_loss": -34.971351623535156, "global_step": 48522, "epoch": 401} {"train_loss": -34.648170471191406, "global_step": 48523, "epoch": 401} {"train_loss": -34.421348571777344, "global_step": 48524, "epoch": 401} {"train_loss": -34.76082992553711, "global_step": 48525, "epoch": 401} {"train_loss": -34.980838775634766, "global_step": 48526, "epoch": 401} {"train_loss": -35.009490966796875, "global_step": 48527, "epoch": 401} {"train_loss": -34.229820251464844, "global_step": 48528, "epoch": 401} {"train_loss": -35.28559875488281, "global_step": 48529, "epoch": 401} {"train_loss": -34.83443069458008, "global_step": 48530, "epoch": 401} {"train_loss": -35.30897903442383, "global_step": 48531, "epoch": 401} {"train_loss": -35.133888244628906, "global_step": 48532, "epoch": 401} {"train_loss": -35.355201721191406, "global_step": 48533, "epoch": 401} {"train_loss": -34.6351203918457, "global_step": 48534, "epoch": 401} {"train_loss": -35.51536560058594, "global_step": 48535, "epoch": 401} {"train_loss": -35.05536651611328, "global_step": 48536, "epoch": 401} {"train_loss": -35.24863815307617, "global_step": 48537, "epoch": 401} {"train_loss": -35.048011779785156, "global_step": 48538, "epoch": 401} {"train_loss": -34.1680793762207, "global_step": 48539, "epoch": 401} {"train_loss": -35.58232116699219, "global_step": 48540, "epoch": 401} {"train_loss": -34.89156723022461, "global_step": 48541, "epoch": 401} {"train_loss": -35.111854553222656, "global_step": 48542, "epoch": 401} {"train_loss": -34.24794387817383, "global_step": 48543, "epoch": 401} {"train_loss": -35.39517593383789, "global_step": 48544, "epoch": 401} {"train_loss": -35.55561447143555, "global_step": 48545, "epoch": 401} {"train_loss": -35.17298126220703, "global_step": 48546, "epoch": 401} {"train_loss": -35.642520904541016, "global_step": 48547, "epoch": 401} {"train_loss": -35.427974700927734, "global_step": 48548, "epoch": 401} {"train_loss": -35.35780715942383, "global_step": 48549, "epoch": 401} {"train_loss": -35.83094024658203, "global_step": 48550, "epoch": 401} {"train_loss": -35.73767852783203, "global_step": 48551, "epoch": 401} {"train_loss": -35.08747100830078, "global_step": 48552, "epoch": 401} {"train_loss": -35.89091110229492, "global_step": 48553, "epoch": 401} {"train_loss": -35.63026428222656, "global_step": 48554, "epoch": 401} {"train_loss": -35.42313766479492, "global_step": 48555, "epoch": 401} {"train_loss": -35.86676788330078, "global_step": 48556, "epoch": 401} {"train_loss": -35.25429153442383, "global_step": 48557, "epoch": 401} {"train_loss": -35.84769821166992, "global_step": 48558, "epoch": 401} {"train_loss": -35.62889862060547, "global_step": 48559, "epoch": 401} {"train_loss": -33.63098907470703, "global_step": 48560, "epoch": 401} {"train_loss": -35.190486907958984, "global_step": 48561, "epoch": 401} {"train_loss": -34.329627990722656, "global_step": 48562, "epoch": 401} {"train_loss": -35.50642776489258, "global_step": 48563, "epoch": 401} {"train_loss": -33.1650276184082, "global_step": 48564, "epoch": 401} {"train_loss": -30.7512264251709, "global_step": 48565, "epoch": 401} {"train_loss": -35.05387496948242, "global_step": 48566, "epoch": 401} {"train_loss": -34.621089935302734, "global_step": 48567, "epoch": 401} {"train_loss": -34.49325942993164, "global_step": 48568, "epoch": 401} {"train_loss": -34.46368408203125, "global_step": 48569, "epoch": 401} {"train_loss": -35.70093536376953, "global_step": 48570, "epoch": 401} {"train_loss": -34.305908203125, "global_step": 48571, "epoch": 401} {"train_loss": -35.42275619506836, "global_step": 48572, "epoch": 401} {"train_loss": -34.460506439208984, "global_step": 48573, "epoch": 401} {"train_loss": -34.378196716308594, "global_step": 48574, "epoch": 401} {"train_loss": -35.23429489135742, "global_step": 48575, "epoch": 401} {"train_loss": -35.51665115356445, "global_step": 48576, "epoch": 401} {"train_loss": -35.4671516418457, "global_step": 48577, "epoch": 401} {"train_loss": -34.79136276245117, "global_step": 48578, "epoch": 401} {"train_loss": -35.231109619140625, "global_step": 48579, "epoch": 401} {"train_loss": -35.335811614990234, "global_step": 48580, "epoch": 401} {"train_loss": -35.75337600708008, "global_step": 48581, "epoch": 401} {"train_loss": -35.341251373291016, "global_step": 48582, "epoch": 401} {"train_loss": -35.655635833740234, "global_step": 48583, "epoch": 401} {"train_loss": -35.262664794921875, "global_step": 48584, "epoch": 401} {"train_loss": -34.96687698364258, "global_step": 48585, "epoch": 401} {"train_loss": -34.94221496582031, "global_step": 48586, "epoch": 401} {"train_loss": -34.29111862182617, "global_step": 48587, "epoch": 401} {"train_loss": -34.585296630859375, "global_step": 48588, "epoch": 401} {"train_loss": -33.71514129638672, "global_step": 48589, "epoch": 401} {"train_loss": -34.904449462890625, "global_step": 48590, "epoch": 401} {"train_loss": -34.798152923583984, "global_step": 48591, "epoch": 401} {"train_loss": -35.14023971557617, "global_step": 48592, "epoch": 401} {"train_loss": -34.08600997924805, "global_step": 48593, "epoch": 401} {"train_loss": -35.02307891845703, "global_step": 48594, "epoch": 401} {"train_loss": -35.333717346191406, "global_step": 48595, "epoch": 401} {"train_loss": -35.36658477783203, "global_step": 48596, "epoch": 401} {"train_loss": -35.61550521850586, "global_step": 48597, "epoch": 401} {"train_loss": -34.94975280761719, "global_step": 48598, "epoch": 401} {"train_loss": -35.86227035522461, "global_step": 48599, "epoch": 401} {"train_loss": -35.791622161865234, "global_step": 48600, "epoch": 401} {"train_loss": -35.48333740234375, "global_step": 48601, "epoch": 401} {"train_loss": -35.820556640625, "global_step": 48602, "epoch": 401} {"train_loss": -35.32160568237305, "global_step": 48603, "epoch": 401} {"train_loss": -34.418148040771484, "global_step": 48604, "epoch": 401} {"train_loss": -35.367835998535156, "global_step": 48605, "epoch": 401} {"train_loss": -35.76299285888672, "global_step": 48606, "epoch": 401} {"train_loss": -34.9507942199707, "global_step": 48607, "epoch": 401} {"train_loss": -34.909488677978516, "global_step": 48608, "epoch": 401} {"train_loss": -35.08945846557617, "global_step": 48609, "epoch": 401} {"train_loss": -35.47661209106445, "global_step": 48610, "epoch": 401} {"train_loss": -34.898216247558594, "global_step": 48611, "epoch": 401} {"train_loss": -35.272193908691406, "global_step": 48612, "epoch": 401} {"train_loss": -34.56031036376953, "global_step": 48613, "epoch": 401} {"train_loss": -35.61627960205078, "global_step": 48614, "epoch": 401} {"train_loss": -34.21761703491211, "global_step": 48615, "epoch": 401} {"train_loss": -32.893611907958984, "global_step": 48616, "epoch": 401} {"train_loss": -35.26754379272461, "global_step": 48617, "epoch": 401} {"train_loss": -34.20698165893555, "global_step": 48618, "epoch": 401} {"train_loss": -34.1242790222168, "global_step": 48619, "epoch": 401} {"train_loss": -31.09043312072754, "global_step": 48620, "epoch": 401} {"train_loss": -32.358882904052734, "global_step": 48621, "epoch": 401} {"train_loss": -32.63727951049805, "global_step": 48622, "epoch": 401} {"train_loss": -32.884796142578125, "global_step": 48623, "epoch": 401} {"train_loss": -34.54324722290039, "global_step": 48624, "epoch": 401} {"train_loss": -34.034584045410156, "global_step": 48625, "epoch": 401} {"train_loss": -33.81013870239258, "global_step": 48626, "epoch": 401} {"train_loss": -33.41984176635742, "global_step": 48627, "epoch": 401} {"train_loss": -34.323856353759766, "global_step": 48628, "epoch": 401} {"train_loss": -33.258602142333984, "global_step": 48629, "epoch": 401} {"train_loss": -35.016597747802734, "global_step": 48630, "epoch": 401} {"train_loss": -33.895381927490234, "global_step": 48631, "epoch": 401} {"train_loss": -33.9298095703125, "global_step": 48632, "epoch": 401} {"train_loss": -35.42765426635742, "global_step": 48633, "epoch": 401} {"train_loss": -33.047481536865234, "global_step": 48634, "epoch": 401} {"train_loss": -35.023189544677734, "global_step": 48635, "epoch": 401} {"train_loss": -34.58970260620117, "global_step": 48636, "epoch": 401} {"train_loss": -35.32717514038086, "global_step": 48637, "epoch": 401} {"train_loss": -34.99233627319336, "global_step": 48638, "epoch": 401} {"train_loss": -34.98869705200195, "global_step": 48639, "epoch": 401} {"train_loss": -35.63926315307617, "global_step": 48640, "epoch": 401} {"train_loss": -34.80998545244706, "global_step": 48641, "epoch": 401, "val_loss": 2590760.75} {"train_loss": -35.40057373046875, "global_step": 48642, "epoch": 402} {"train_loss": -35.304359436035156, "global_step": 48643, "epoch": 402} {"train_loss": -34.52597427368164, "global_step": 48644, "epoch": 402} {"train_loss": -35.62195587158203, "global_step": 48645, "epoch": 402} {"train_loss": -34.29648208618164, "global_step": 48646, "epoch": 402} {"train_loss": -35.2062873840332, "global_step": 48647, "epoch": 402} {"train_loss": -35.52075958251953, "global_step": 48648, "epoch": 402} {"train_loss": -35.45920944213867, "global_step": 48649, "epoch": 402} {"train_loss": -35.4163703918457, "global_step": 48650, "epoch": 402} {"train_loss": -34.9183349609375, "global_step": 48651, "epoch": 402} {"train_loss": -35.24082565307617, "global_step": 48652, "epoch": 402} {"train_loss": -33.00296401977539, "global_step": 48653, "epoch": 402} {"train_loss": -35.30160140991211, "global_step": 48654, "epoch": 402} {"train_loss": -35.261234283447266, "global_step": 48655, "epoch": 402} {"train_loss": -35.0991325378418, "global_step": 48656, "epoch": 402} {"train_loss": -36.009830474853516, "global_step": 48657, "epoch": 402} {"train_loss": -34.98940658569336, "global_step": 48658, "epoch": 402} {"train_loss": -35.442813873291016, "global_step": 48659, "epoch": 402} {"train_loss": -35.72475814819336, "global_step": 48660, "epoch": 402} {"train_loss": -35.8084716796875, "global_step": 48661, "epoch": 402} {"train_loss": -35.76194381713867, "global_step": 48662, "epoch": 402} {"train_loss": -34.93355941772461, "global_step": 48663, "epoch": 402} {"train_loss": -35.73931884765625, "global_step": 48664, "epoch": 402} {"train_loss": -35.9560661315918, "global_step": 48665, "epoch": 402} {"train_loss": -34.61696243286133, "global_step": 48666, "epoch": 402} {"train_loss": -35.85421371459961, "global_step": 48667, "epoch": 402} {"train_loss": -35.59010696411133, "global_step": 48668, "epoch": 402} {"train_loss": -35.919307708740234, "global_step": 48669, "epoch": 402} {"train_loss": -36.3070182800293, "global_step": 48670, "epoch": 402} {"train_loss": -35.506893157958984, "global_step": 48671, "epoch": 402} {"train_loss": -35.6585807800293, "global_step": 48672, "epoch": 402} {"train_loss": -35.41905975341797, "global_step": 48673, "epoch": 402} {"train_loss": -35.440277099609375, "global_step": 48674, "epoch": 402} {"train_loss": -36.20785903930664, "global_step": 48675, "epoch": 402} {"train_loss": -35.841827392578125, "global_step": 48676, "epoch": 402} {"train_loss": -35.73563766479492, "global_step": 48677, "epoch": 402} {"train_loss": -34.78279113769531, "global_step": 48678, "epoch": 402} {"train_loss": -35.48814392089844, "global_step": 48679, "epoch": 402} {"train_loss": -35.35132598876953, "global_step": 48680, "epoch": 402} {"train_loss": -35.191715240478516, "global_step": 48681, "epoch": 402} {"train_loss": -34.843265533447266, "global_step": 48682, "epoch": 402} {"train_loss": -34.18711853027344, "global_step": 48683, "epoch": 402} {"train_loss": -33.52136993408203, "global_step": 48684, "epoch": 402} {"train_loss": -31.402759552001953, "global_step": 48685, "epoch": 402} {"train_loss": -33.1291389465332, "global_step": 48686, "epoch": 402} {"train_loss": -33.57876205444336, "global_step": 48687, "epoch": 402} {"train_loss": -34.73289108276367, "global_step": 48688, "epoch": 402} {"train_loss": -34.5489501953125, "global_step": 48689, "epoch": 402} {"train_loss": -33.302425384521484, "global_step": 48690, "epoch": 402} {"train_loss": -32.54730987548828, "global_step": 48691, "epoch": 402} {"train_loss": -34.87579345703125, "global_step": 48692, "epoch": 402} {"train_loss": -32.826805114746094, "global_step": 48693, "epoch": 402} {"train_loss": -35.27787399291992, "global_step": 48694, "epoch": 402} {"train_loss": -33.144248962402344, "global_step": 48695, "epoch": 402} {"train_loss": -32.55541229248047, "global_step": 48696, "epoch": 402} {"train_loss": -33.06655502319336, "global_step": 48697, "epoch": 402} {"train_loss": -33.86909866333008, "global_step": 48698, "epoch": 402} {"train_loss": -34.64936447143555, "global_step": 48699, "epoch": 402} {"train_loss": -35.07267379760742, "global_step": 48700, "epoch": 402} {"train_loss": -33.0443229675293, "global_step": 48701, "epoch": 402} {"train_loss": -34.71756362915039, "global_step": 48702, "epoch": 402} {"train_loss": -35.04724884033203, "global_step": 48703, "epoch": 402} {"train_loss": -33.11420822143555, "global_step": 48704, "epoch": 402} {"train_loss": -31.7115421295166, "global_step": 48705, "epoch": 402} {"train_loss": -33.98647689819336, "global_step": 48706, "epoch": 402} {"train_loss": -33.04217529296875, "global_step": 48707, "epoch": 402} {"train_loss": -32.46852493286133, "global_step": 48708, "epoch": 402} {"train_loss": -34.56964874267578, "global_step": 48709, "epoch": 402} {"train_loss": -32.69828414916992, "global_step": 48710, "epoch": 402} {"train_loss": -32.45166015625, "global_step": 48711, "epoch": 402} {"train_loss": -33.24855422973633, "global_step": 48712, "epoch": 402} {"train_loss": -32.12770462036133, "global_step": 48713, "epoch": 402} {"train_loss": -31.68889808654785, "global_step": 48714, "epoch": 402} {"train_loss": -33.131290435791016, "global_step": 48715, "epoch": 402} {"train_loss": -33.60076904296875, "global_step": 48716, "epoch": 402} {"train_loss": -33.72806930541992, "global_step": 48717, "epoch": 402} {"train_loss": -32.47761535644531, "global_step": 48718, "epoch": 402} {"train_loss": -32.00505447387695, "global_step": 48719, "epoch": 402} {"train_loss": -32.8946418762207, "global_step": 48720, "epoch": 402} {"train_loss": -32.693485260009766, "global_step": 48721, "epoch": 402} {"train_loss": -33.096309661865234, "global_step": 48722, "epoch": 402} {"train_loss": -32.21928405761719, "global_step": 48723, "epoch": 402} {"train_loss": -31.30580711364746, "global_step": 48724, "epoch": 402} {"train_loss": -33.33005905151367, "global_step": 48725, "epoch": 402} {"train_loss": -34.247703552246094, "global_step": 48726, "epoch": 402} {"train_loss": -32.999534606933594, "global_step": 48727, "epoch": 402} {"train_loss": -32.61952590942383, "global_step": 48728, "epoch": 402} {"train_loss": -33.252132415771484, "global_step": 48729, "epoch": 402} {"train_loss": -34.04254913330078, "global_step": 48730, "epoch": 402} {"train_loss": -33.482269287109375, "global_step": 48731, "epoch": 402} {"train_loss": -32.8367805480957, "global_step": 48732, "epoch": 402} {"train_loss": -33.8415641784668, "global_step": 48733, "epoch": 402} {"train_loss": -34.1768798828125, "global_step": 48734, "epoch": 402} {"train_loss": -33.93745803833008, "global_step": 48735, "epoch": 402} {"train_loss": -33.993438720703125, "global_step": 48736, "epoch": 402} {"train_loss": -33.58926010131836, "global_step": 48737, "epoch": 402} {"train_loss": -33.36027145385742, "global_step": 48738, "epoch": 402} {"train_loss": -34.20833206176758, "global_step": 48739, "epoch": 402} {"train_loss": -34.659584045410156, "global_step": 48740, "epoch": 402} {"train_loss": -34.478511810302734, "global_step": 48741, "epoch": 402} {"train_loss": -33.33275604248047, "global_step": 48742, "epoch": 402} {"train_loss": -34.4090576171875, "global_step": 48743, "epoch": 402} {"train_loss": -34.3978271484375, "global_step": 48744, "epoch": 402} {"train_loss": -34.47294235229492, "global_step": 48745, "epoch": 402} {"train_loss": -34.863441467285156, "global_step": 48746, "epoch": 402} {"train_loss": -34.36567687988281, "global_step": 48747, "epoch": 402} {"train_loss": -34.654273986816406, "global_step": 48748, "epoch": 402} {"train_loss": -34.861724853515625, "global_step": 48749, "epoch": 402} {"train_loss": -35.02518844604492, "global_step": 48750, "epoch": 402} {"train_loss": -33.3819694519043, "global_step": 48751, "epoch": 402} {"train_loss": -34.076778411865234, "global_step": 48752, "epoch": 402} {"train_loss": -35.082496643066406, "global_step": 48753, "epoch": 402} {"train_loss": -34.79755401611328, "global_step": 48754, "epoch": 402} {"train_loss": -34.815914154052734, "global_step": 48755, "epoch": 402} {"train_loss": -34.998756408691406, "global_step": 48756, "epoch": 402} {"train_loss": -34.25305938720703, "global_step": 48757, "epoch": 402} {"train_loss": -34.31803512573242, "global_step": 48758, "epoch": 402} {"train_loss": -34.16398239135742, "global_step": 48759, "epoch": 402} {"train_loss": -34.397560119628906, "global_step": 48760, "epoch": 402} {"train_loss": -34.82685470581055, "global_step": 48761, "epoch": 402} {"train_loss": -34.25417682553126, "global_step": 48762, "epoch": 402, "val_loss": 2578570.5} {"train_loss": -34.51295852661133, "global_step": 48763, "epoch": 403} {"train_loss": -34.43783187866211, "global_step": 48764, "epoch": 403} {"train_loss": -34.498619079589844, "global_step": 48765, "epoch": 403} {"train_loss": -35.226009368896484, "global_step": 48766, "epoch": 403} {"train_loss": -35.397438049316406, "global_step": 48767, "epoch": 403} {"train_loss": -34.85801315307617, "global_step": 48768, "epoch": 403} {"train_loss": -35.17379379272461, "global_step": 48769, "epoch": 403} {"train_loss": -35.5080680847168, "global_step": 48770, "epoch": 403} {"train_loss": -35.267112731933594, "global_step": 48771, "epoch": 403} {"train_loss": -35.10457992553711, "global_step": 48772, "epoch": 403} {"train_loss": -35.25910186767578, "global_step": 48773, "epoch": 403} {"train_loss": -35.48663330078125, "global_step": 48774, "epoch": 403} {"train_loss": -34.79641342163086, "global_step": 48775, "epoch": 403} {"train_loss": -33.909217834472656, "global_step": 48776, "epoch": 403} {"train_loss": -33.93706130981445, "global_step": 48777, "epoch": 403} {"train_loss": -33.06709671020508, "global_step": 48778, "epoch": 403} {"train_loss": -35.00295639038086, "global_step": 48779, "epoch": 403} {"train_loss": -33.514137268066406, "global_step": 48780, "epoch": 403} {"train_loss": -33.706756591796875, "global_step": 48781, "epoch": 403} {"train_loss": -34.52865219116211, "global_step": 48782, "epoch": 403} {"train_loss": -33.4063606262207, "global_step": 48783, "epoch": 403} {"train_loss": -35.55891799926758, "global_step": 48784, "epoch": 403} {"train_loss": -33.0335807800293, "global_step": 48785, "epoch": 403} {"train_loss": -33.30615997314453, "global_step": 48786, "epoch": 403} {"train_loss": -34.59493637084961, "global_step": 48787, "epoch": 403} {"train_loss": -35.10982131958008, "global_step": 48788, "epoch": 403} {"train_loss": -34.73118209838867, "global_step": 48789, "epoch": 403} {"train_loss": -34.30525207519531, "global_step": 48790, "epoch": 403} {"train_loss": -34.023475646972656, "global_step": 48791, "epoch": 403} {"train_loss": -34.93230056762695, "global_step": 48792, "epoch": 403} {"train_loss": -34.91300582885742, "global_step": 48793, "epoch": 403} {"train_loss": -35.22871780395508, "global_step": 48794, "epoch": 403} {"train_loss": -34.91562271118164, "global_step": 48795, "epoch": 403} {"train_loss": -34.102455139160156, "global_step": 48796, "epoch": 403} {"train_loss": -34.64413070678711, "global_step": 48797, "epoch": 403} {"train_loss": -35.64898681640625, "global_step": 48798, "epoch": 403} {"train_loss": -35.4299201965332, "global_step": 48799, "epoch": 403} {"train_loss": -34.197418212890625, "global_step": 48800, "epoch": 403} {"train_loss": -34.538307189941406, "global_step": 48801, "epoch": 403} {"train_loss": -34.94637680053711, "global_step": 48802, "epoch": 403} {"train_loss": -34.40081787109375, "global_step": 48803, "epoch": 403} {"train_loss": -36.05373001098633, "global_step": 48804, "epoch": 403} {"train_loss": -35.52164840698242, "global_step": 48805, "epoch": 403} {"train_loss": -34.640724182128906, "global_step": 48806, "epoch": 403} {"train_loss": -33.8718376159668, "global_step": 48807, "epoch": 403} {"train_loss": -35.857784271240234, "global_step": 48808, "epoch": 403} {"train_loss": -35.5196647644043, "global_step": 48809, "epoch": 403} {"train_loss": -33.39992141723633, "global_step": 48810, "epoch": 403} {"train_loss": -33.56744384765625, "global_step": 48811, "epoch": 403} {"train_loss": -34.98927688598633, "global_step": 48812, "epoch": 403} {"train_loss": -35.09235382080078, "global_step": 48813, "epoch": 403} {"train_loss": -34.83390808105469, "global_step": 48814, "epoch": 403} {"train_loss": -35.619503021240234, "global_step": 48815, "epoch": 403} {"train_loss": -35.916717529296875, "global_step": 48816, "epoch": 403} {"train_loss": -35.24594497680664, "global_step": 48817, "epoch": 403} {"train_loss": -34.80735397338867, "global_step": 48818, "epoch": 403} {"train_loss": -35.8768424987793, "global_step": 48819, "epoch": 403} {"train_loss": -35.016475677490234, "global_step": 48820, "epoch": 403} {"train_loss": -35.457366943359375, "global_step": 48821, "epoch": 403} {"train_loss": -35.38511657714844, "global_step": 48822, "epoch": 403} {"train_loss": -35.20155715942383, "global_step": 48823, "epoch": 403} {"train_loss": -35.40593338012695, "global_step": 48824, "epoch": 403} {"train_loss": -35.15155029296875, "global_step": 48825, "epoch": 403} {"train_loss": -34.272151947021484, "global_step": 48826, "epoch": 403} {"train_loss": -35.700016021728516, "global_step": 48827, "epoch": 403} {"train_loss": -35.07503890991211, "global_step": 48828, "epoch": 403} {"train_loss": -35.39162063598633, "global_step": 48829, "epoch": 403} {"train_loss": -35.47658920288086, "global_step": 48830, "epoch": 403} {"train_loss": -34.2667121887207, "global_step": 48831, "epoch": 403} {"train_loss": -34.77842330932617, "global_step": 48832, "epoch": 403} {"train_loss": -35.30824661254883, "global_step": 48833, "epoch": 403} {"train_loss": -35.83205795288086, "global_step": 48834, "epoch": 403} {"train_loss": -33.68545150756836, "global_step": 48835, "epoch": 403} {"train_loss": -33.66120147705078, "global_step": 48836, "epoch": 403} {"train_loss": -34.38062286376953, "global_step": 48837, "epoch": 403} {"train_loss": -34.896114349365234, "global_step": 48838, "epoch": 403} {"train_loss": -33.30717086791992, "global_step": 48839, "epoch": 403} {"train_loss": -32.622833251953125, "global_step": 48840, "epoch": 403} {"train_loss": -33.73992919921875, "global_step": 48841, "epoch": 403} {"train_loss": -33.34333801269531, "global_step": 48842, "epoch": 403} {"train_loss": -32.957271575927734, "global_step": 48843, "epoch": 403} {"train_loss": -33.78548812866211, "global_step": 48844, "epoch": 403} {"train_loss": -33.96592330932617, "global_step": 48845, "epoch": 403} {"train_loss": -33.538368225097656, "global_step": 48846, "epoch": 403} {"train_loss": -35.04787826538086, "global_step": 48847, "epoch": 403} {"train_loss": -33.583003997802734, "global_step": 48848, "epoch": 403} {"train_loss": -34.10999298095703, "global_step": 48849, "epoch": 403} {"train_loss": -34.314430236816406, "global_step": 48850, "epoch": 403} {"train_loss": -34.06987380981445, "global_step": 48851, "epoch": 403} {"train_loss": -33.629085540771484, "global_step": 48852, "epoch": 403} {"train_loss": -34.02861404418945, "global_step": 48853, "epoch": 403} {"train_loss": -34.27484893798828, "global_step": 48854, "epoch": 403} {"train_loss": -34.26210021972656, "global_step": 48855, "epoch": 403} {"train_loss": -35.08951187133789, "global_step": 48856, "epoch": 403} {"train_loss": -34.964393615722656, "global_step": 48857, "epoch": 403} {"train_loss": -34.91851806640625, "global_step": 48858, "epoch": 403} {"train_loss": -35.19621276855469, "global_step": 48859, "epoch": 403} {"train_loss": -35.125579833984375, "global_step": 48860, "epoch": 403} {"train_loss": -34.587684631347656, "global_step": 48861, "epoch": 403} {"train_loss": -35.29815673828125, "global_step": 48862, "epoch": 403} {"train_loss": -34.99115753173828, "global_step": 48863, "epoch": 403} {"train_loss": -34.616119384765625, "global_step": 48864, "epoch": 403} {"train_loss": -34.81911849975586, "global_step": 48865, "epoch": 403} {"train_loss": -34.84324264526367, "global_step": 48866, "epoch": 403} {"train_loss": -35.00603103637695, "global_step": 48867, "epoch": 403} {"train_loss": -35.21700668334961, "global_step": 48868, "epoch": 403} {"train_loss": -35.2852783203125, "global_step": 48869, "epoch": 403} {"train_loss": -35.70619583129883, "global_step": 48870, "epoch": 403} {"train_loss": -35.21146774291992, "global_step": 48871, "epoch": 403} {"train_loss": -34.91535568237305, "global_step": 48872, "epoch": 403} {"train_loss": -35.01996612548828, "global_step": 48873, "epoch": 403} {"train_loss": -34.955657958984375, "global_step": 48874, "epoch": 403} {"train_loss": -35.676063537597656, "global_step": 48875, "epoch": 403} {"train_loss": -35.03672409057617, "global_step": 48876, "epoch": 403} {"train_loss": -35.775020599365234, "global_step": 48877, "epoch": 403} {"train_loss": -35.521785736083984, "global_step": 48878, "epoch": 403} {"train_loss": -35.651119232177734, "global_step": 48879, "epoch": 403} {"train_loss": -35.45925521850586, "global_step": 48880, "epoch": 403} {"train_loss": -35.44758987426758, "global_step": 48881, "epoch": 403} {"train_loss": -36.12319564819336, "global_step": 48882, "epoch": 403} {"train_loss": -34.749012970727335, "global_step": 48883, "epoch": 403, "val_loss": 2572388.25} {"train_loss": -35.319252014160156, "global_step": 48884, "epoch": 404} {"train_loss": -35.07575607299805, "global_step": 48885, "epoch": 404} {"train_loss": -33.548622131347656, "global_step": 48886, "epoch": 404} {"train_loss": -30.508878707885742, "global_step": 48887, "epoch": 404} {"train_loss": -27.00606346130371, "global_step": 48888, "epoch": 404} {"train_loss": -28.962726593017578, "global_step": 48889, "epoch": 404} {"train_loss": -34.35402297973633, "global_step": 48890, "epoch": 404} {"train_loss": -33.481380462646484, "global_step": 48891, "epoch": 404} {"train_loss": -31.588184356689453, "global_step": 48892, "epoch": 404} {"train_loss": -33.83403778076172, "global_step": 48893, "epoch": 404} {"train_loss": -33.084449768066406, "global_step": 48894, "epoch": 404} {"train_loss": -32.98432540893555, "global_step": 48895, "epoch": 404} {"train_loss": -34.80127716064453, "global_step": 48896, "epoch": 404} {"train_loss": -33.08806228637695, "global_step": 48897, "epoch": 404} {"train_loss": -35.34023666381836, "global_step": 48898, "epoch": 404} {"train_loss": -32.627777099609375, "global_step": 48899, "epoch": 404} {"train_loss": -35.352291107177734, "global_step": 48900, "epoch": 404} {"train_loss": -33.71063995361328, "global_step": 48901, "epoch": 404} {"train_loss": -34.201507568359375, "global_step": 48902, "epoch": 404} {"train_loss": -35.49953079223633, "global_step": 48903, "epoch": 404} {"train_loss": -34.38421630859375, "global_step": 48904, "epoch": 404} {"train_loss": -35.37533187866211, "global_step": 48905, "epoch": 404} {"train_loss": -34.36417770385742, "global_step": 48906, "epoch": 404} {"train_loss": -35.389068603515625, "global_step": 48907, "epoch": 404} {"train_loss": -35.005348205566406, "global_step": 48908, "epoch": 404} {"train_loss": -34.656185150146484, "global_step": 48909, "epoch": 404} {"train_loss": -35.947505950927734, "global_step": 48910, "epoch": 404} {"train_loss": -34.86558532714844, "global_step": 48911, "epoch": 404} {"train_loss": -35.610897064208984, "global_step": 48912, "epoch": 404} {"train_loss": -35.312068939208984, "global_step": 48913, "epoch": 404} {"train_loss": -35.168304443359375, "global_step": 48914, "epoch": 404} {"train_loss": -35.05134582519531, "global_step": 48915, "epoch": 404} {"train_loss": -35.18746566772461, "global_step": 48916, "epoch": 404} {"train_loss": -35.7745246887207, "global_step": 48917, "epoch": 404} {"train_loss": -35.788726806640625, "global_step": 48918, "epoch": 404} {"train_loss": -35.99195098876953, "global_step": 48919, "epoch": 404} {"train_loss": -35.361263275146484, "global_step": 48920, "epoch": 404} {"train_loss": -35.95560073852539, "global_step": 48921, "epoch": 404} {"train_loss": -35.45277786254883, "global_step": 48922, "epoch": 404} {"train_loss": -35.242469787597656, "global_step": 48923, "epoch": 404} {"train_loss": -35.63702392578125, "global_step": 48924, "epoch": 404} {"train_loss": -35.209983825683594, "global_step": 48925, "epoch": 404} {"train_loss": -35.385128021240234, "global_step": 48926, "epoch": 404} {"train_loss": -35.71247863769531, "global_step": 48927, "epoch": 404} {"train_loss": -35.81170654296875, "global_step": 48928, "epoch": 404} {"train_loss": -35.777069091796875, "global_step": 48929, "epoch": 404} {"train_loss": -35.28059005737305, "global_step": 48930, "epoch": 404} {"train_loss": -35.11444091796875, "global_step": 48931, "epoch": 404} {"train_loss": -35.581172943115234, "global_step": 48932, "epoch": 404} {"train_loss": -35.92991256713867, "global_step": 48933, "epoch": 404} {"train_loss": -35.79158401489258, "global_step": 48934, "epoch": 404} {"train_loss": -35.01013946533203, "global_step": 48935, "epoch": 404} {"train_loss": -34.937965393066406, "global_step": 48936, "epoch": 404} {"train_loss": -33.99154281616211, "global_step": 48937, "epoch": 404} {"train_loss": -33.813629150390625, "global_step": 48938, "epoch": 404} {"train_loss": -31.640668869018555, "global_step": 48939, "epoch": 404} {"train_loss": -27.169031143188477, "global_step": 48940, "epoch": 404} {"train_loss": -25.011838912963867, "global_step": 48941, "epoch": 404} {"train_loss": -28.477832794189453, "global_step": 48942, "epoch": 404} {"train_loss": -31.32587242126465, "global_step": 48943, "epoch": 404} {"train_loss": -35.27543258666992, "global_step": 48944, "epoch": 404} {"train_loss": -29.442279815673828, "global_step": 48945, "epoch": 404} {"train_loss": -33.38138198852539, "global_step": 48946, "epoch": 404} {"train_loss": -34.26039123535156, "global_step": 48947, "epoch": 404} {"train_loss": -33.76109313964844, "global_step": 48948, "epoch": 404} {"train_loss": -34.113121032714844, "global_step": 48949, "epoch": 404} {"train_loss": -34.35094451904297, "global_step": 48950, "epoch": 404} {"train_loss": -34.447265625, "global_step": 48951, "epoch": 404} {"train_loss": -34.9061393737793, "global_step": 48952, "epoch": 404} {"train_loss": -34.521724700927734, "global_step": 48953, "epoch": 404} {"train_loss": -34.668785095214844, "global_step": 48954, "epoch": 404} {"train_loss": -34.41246032714844, "global_step": 48955, "epoch": 404} {"train_loss": -34.1776237487793, "global_step": 48956, "epoch": 404} {"train_loss": -34.17327880859375, "global_step": 48957, "epoch": 404} {"train_loss": -34.16085433959961, "global_step": 48958, "epoch": 404} {"train_loss": -33.84999465942383, "global_step": 48959, "epoch": 404} {"train_loss": -33.95753860473633, "global_step": 48960, "epoch": 404} {"train_loss": -34.68366622924805, "global_step": 48961, "epoch": 404} {"train_loss": -35.24711990356445, "global_step": 48962, "epoch": 404} {"train_loss": -34.470760345458984, "global_step": 48963, "epoch": 404} {"train_loss": -33.21380615234375, "global_step": 48964, "epoch": 404} {"train_loss": -31.796728134155273, "global_step": 48965, "epoch": 404} {"train_loss": -34.06694412231445, "global_step": 48966, "epoch": 404} {"train_loss": -34.86035919189453, "global_step": 48967, "epoch": 404} {"train_loss": -32.11163330078125, "global_step": 48968, "epoch": 404} {"train_loss": -32.973785400390625, "global_step": 48969, "epoch": 404} {"train_loss": -35.26560592651367, "global_step": 48970, "epoch": 404} {"train_loss": -34.29030990600586, "global_step": 48971, "epoch": 404} {"train_loss": -34.937740325927734, "global_step": 48972, "epoch": 404} {"train_loss": -35.264705657958984, "global_step": 48973, "epoch": 404} {"train_loss": -34.805538177490234, "global_step": 48974, "epoch": 404} {"train_loss": -35.48305130004883, "global_step": 48975, "epoch": 404} {"train_loss": -34.84518051147461, "global_step": 48976, "epoch": 404} {"train_loss": -35.453857421875, "global_step": 48977, "epoch": 404} {"train_loss": -34.40309524536133, "global_step": 48978, "epoch": 404} {"train_loss": -35.48015213012695, "global_step": 48979, "epoch": 404} {"train_loss": -35.83378601074219, "global_step": 48980, "epoch": 404} {"train_loss": -35.70254135131836, "global_step": 48981, "epoch": 404} {"train_loss": -35.38291549682617, "global_step": 48982, "epoch": 404} {"train_loss": -35.581459045410156, "global_step": 48983, "epoch": 404} {"train_loss": -35.84247589111328, "global_step": 48984, "epoch": 404} {"train_loss": -35.84760284423828, "global_step": 48985, "epoch": 404} {"train_loss": -35.32039260864258, "global_step": 48986, "epoch": 404} {"train_loss": -35.980712890625, "global_step": 48987, "epoch": 404} {"train_loss": -35.49653244018555, "global_step": 48988, "epoch": 404} {"train_loss": -35.632789611816406, "global_step": 48989, "epoch": 404} {"train_loss": -35.21577835083008, "global_step": 48990, "epoch": 404} {"train_loss": -35.92325210571289, "global_step": 48991, "epoch": 404} {"train_loss": -35.76978302001953, "global_step": 48992, "epoch": 404} {"train_loss": -35.19590377807617, "global_step": 48993, "epoch": 404} {"train_loss": -36.03193283081055, "global_step": 48994, "epoch": 404} {"train_loss": -36.02106857299805, "global_step": 48995, "epoch": 404} {"train_loss": -35.979183197021484, "global_step": 48996, "epoch": 404} {"train_loss": -35.86052322387695, "global_step": 48997, "epoch": 404} {"train_loss": -36.32306671142578, "global_step": 48998, "epoch": 404} {"train_loss": -35.87519073486328, "global_step": 48999, "epoch": 404} {"train_loss": -35.8943977355957, "global_step": 49000, "epoch": 404} {"train_loss": -36.0374641418457, "global_step": 49001, "epoch": 404} {"train_loss": -35.586097717285156, "global_step": 49002, "epoch": 404} {"train_loss": -35.42434310913086, "global_step": 49003, "epoch": 404} {"train_loss": -34.44382506756743, "global_step": 49004, "epoch": 404, "val_loss": 2572940.75} {"train_loss": -36.153228759765625, "global_step": 49005, "epoch": 405} {"train_loss": -36.11455154418945, "global_step": 49006, "epoch": 405} {"train_loss": -35.920955657958984, "global_step": 49007, "epoch": 405} {"train_loss": -34.95762634277344, "global_step": 49008, "epoch": 405} {"train_loss": -35.51508712768555, "global_step": 49009, "epoch": 405} {"train_loss": -35.30134201049805, "global_step": 49010, "epoch": 405} {"train_loss": -35.71070098876953, "global_step": 49011, "epoch": 405} {"train_loss": -36.072853088378906, "global_step": 49012, "epoch": 405} {"train_loss": -35.56338119506836, "global_step": 49013, "epoch": 405} {"train_loss": -34.03538131713867, "global_step": 49014, "epoch": 405} {"train_loss": -34.508338928222656, "global_step": 49015, "epoch": 405} {"train_loss": -32.708831787109375, "global_step": 49016, "epoch": 405} {"train_loss": -33.62827682495117, "global_step": 49017, "epoch": 405} {"train_loss": -35.184268951416016, "global_step": 49018, "epoch": 405} {"train_loss": -32.12031936645508, "global_step": 49019, "epoch": 405} {"train_loss": -34.15810775756836, "global_step": 49020, "epoch": 405} {"train_loss": -32.30359649658203, "global_step": 49021, "epoch": 405} {"train_loss": -33.617794036865234, "global_step": 49022, "epoch": 405} {"train_loss": -34.387550354003906, "global_step": 49023, "epoch": 405} {"train_loss": -34.83614730834961, "global_step": 49024, "epoch": 405} {"train_loss": -33.132015228271484, "global_step": 49025, "epoch": 405} {"train_loss": -33.86249542236328, "global_step": 49026, "epoch": 405} {"train_loss": -32.15397262573242, "global_step": 49027, "epoch": 405} {"train_loss": -33.3433952331543, "global_step": 49028, "epoch": 405} {"train_loss": -32.8726921081543, "global_step": 49029, "epoch": 405} {"train_loss": -33.77589797973633, "global_step": 49030, "epoch": 405} {"train_loss": -34.41893768310547, "global_step": 49031, "epoch": 405} {"train_loss": -33.15340805053711, "global_step": 49032, "epoch": 405} {"train_loss": -33.21737289428711, "global_step": 49033, "epoch": 405} {"train_loss": -34.024532318115234, "global_step": 49034, "epoch": 405} {"train_loss": -34.08304977416992, "global_step": 49035, "epoch": 405} {"train_loss": -34.24886703491211, "global_step": 49036, "epoch": 405} {"train_loss": -34.629150390625, "global_step": 49037, "epoch": 405} {"train_loss": -33.9085807800293, "global_step": 49038, "epoch": 405} {"train_loss": -34.38236618041992, "global_step": 49039, "epoch": 405} {"train_loss": -33.988319396972656, "global_step": 49040, "epoch": 405} {"train_loss": -33.44972610473633, "global_step": 49041, "epoch": 405} {"train_loss": -34.95389175415039, "global_step": 49042, "epoch": 405} {"train_loss": -34.12447738647461, "global_step": 49043, "epoch": 405} {"train_loss": -34.52618408203125, "global_step": 49044, "epoch": 405} {"train_loss": -33.535701751708984, "global_step": 49045, "epoch": 405} {"train_loss": -34.56040573120117, "global_step": 49046, "epoch": 405} {"train_loss": -34.642127990722656, "global_step": 49047, "epoch": 405} {"train_loss": -34.6814079284668, "global_step": 49048, "epoch": 405} {"train_loss": -34.640384674072266, "global_step": 49049, "epoch": 405} {"train_loss": -34.73816680908203, "global_step": 49050, "epoch": 405} {"train_loss": -34.88640213012695, "global_step": 49051, "epoch": 405} {"train_loss": -35.158321380615234, "global_step": 49052, "epoch": 405} {"train_loss": -34.7554817199707, "global_step": 49053, "epoch": 405} {"train_loss": -34.362037658691406, "global_step": 49054, "epoch": 405} {"train_loss": -34.841068267822266, "global_step": 49055, "epoch": 405} {"train_loss": -34.72419738769531, "global_step": 49056, "epoch": 405} {"train_loss": -35.176063537597656, "global_step": 49057, "epoch": 405} {"train_loss": -35.013458251953125, "global_step": 49058, "epoch": 405} {"train_loss": -35.1737174987793, "global_step": 49059, "epoch": 405} {"train_loss": -35.52952194213867, "global_step": 49060, "epoch": 405} {"train_loss": -35.28944778442383, "global_step": 49061, "epoch": 405} {"train_loss": -35.2844123840332, "global_step": 49062, "epoch": 405} {"train_loss": -35.31901168823242, "global_step": 49063, "epoch": 405} {"train_loss": -35.253902435302734, "global_step": 49064, "epoch": 405} {"train_loss": -34.727237701416016, "global_step": 49065, "epoch": 405} {"train_loss": -35.263736724853516, "global_step": 49066, "epoch": 405} {"train_loss": -35.45732498168945, "global_step": 49067, "epoch": 405} {"train_loss": -35.444881439208984, "global_step": 49068, "epoch": 405} {"train_loss": -34.84743118286133, "global_step": 49069, "epoch": 405} {"train_loss": -35.32011795043945, "global_step": 49070, "epoch": 405} {"train_loss": -34.488075256347656, "global_step": 49071, "epoch": 405} {"train_loss": -33.90385055541992, "global_step": 49072, "epoch": 405} {"train_loss": -33.48109817504883, "global_step": 49073, "epoch": 405} {"train_loss": -33.373992919921875, "global_step": 49074, "epoch": 405} {"train_loss": -34.59074020385742, "global_step": 49075, "epoch": 405} {"train_loss": -35.42052459716797, "global_step": 49076, "epoch": 405} {"train_loss": -35.16608810424805, "global_step": 49077, "epoch": 405} {"train_loss": -34.92079544067383, "global_step": 49078, "epoch": 405} {"train_loss": -35.148529052734375, "global_step": 49079, "epoch": 405} {"train_loss": -35.63981246948242, "global_step": 49080, "epoch": 405} {"train_loss": -35.8602409362793, "global_step": 49081, "epoch": 405} {"train_loss": -34.94965744018555, "global_step": 49082, "epoch": 405} {"train_loss": -35.384193420410156, "global_step": 49083, "epoch": 405} {"train_loss": -35.847564697265625, "global_step": 49084, "epoch": 405} {"train_loss": -34.955440521240234, "global_step": 49085, "epoch": 405} {"train_loss": -34.25202178955078, "global_step": 49086, "epoch": 405} {"train_loss": -35.56107711791992, "global_step": 49087, "epoch": 405} {"train_loss": -35.882667541503906, "global_step": 49088, "epoch": 405} {"train_loss": -34.651119232177734, "global_step": 49089, "epoch": 405} {"train_loss": -35.827392578125, "global_step": 49090, "epoch": 405} {"train_loss": -36.095436096191406, "global_step": 49091, "epoch": 405} {"train_loss": -36.23323440551758, "global_step": 49092, "epoch": 405} {"train_loss": -36.35103988647461, "global_step": 49093, "epoch": 405} {"train_loss": -35.32061767578125, "global_step": 49094, "epoch": 405} {"train_loss": -35.48348617553711, "global_step": 49095, "epoch": 405} {"train_loss": -35.88201904296875, "global_step": 49096, "epoch": 405} {"train_loss": -36.09994888305664, "global_step": 49097, "epoch": 405} {"train_loss": -36.20528793334961, "global_step": 49098, "epoch": 405} {"train_loss": -35.93138122558594, "global_step": 49099, "epoch": 405} {"train_loss": -35.66875076293945, "global_step": 49100, "epoch": 405} {"train_loss": -34.420509338378906, "global_step": 49101, "epoch": 405} {"train_loss": -33.79631805419922, "global_step": 49102, "epoch": 405} {"train_loss": -33.27574157714844, "global_step": 49103, "epoch": 405} {"train_loss": -33.48732376098633, "global_step": 49104, "epoch": 405} {"train_loss": -35.30866622924805, "global_step": 49105, "epoch": 405} {"train_loss": -35.890926361083984, "global_step": 49106, "epoch": 405} {"train_loss": -35.399383544921875, "global_step": 49107, "epoch": 405} {"train_loss": -35.97004318237305, "global_step": 49108, "epoch": 405} {"train_loss": -35.589962005615234, "global_step": 49109, "epoch": 405} {"train_loss": -34.97652053833008, "global_step": 49110, "epoch": 405} {"train_loss": -35.3731689453125, "global_step": 49111, "epoch": 405} {"train_loss": -33.873756408691406, "global_step": 49112, "epoch": 405} {"train_loss": -33.8465690612793, "global_step": 49113, "epoch": 405} {"train_loss": -32.773250579833984, "global_step": 49114, "epoch": 405} {"train_loss": -32.84352111816406, "global_step": 49115, "epoch": 405} {"train_loss": -33.653228759765625, "global_step": 49116, "epoch": 405} {"train_loss": -33.28013229370117, "global_step": 49117, "epoch": 405} {"train_loss": -34.5509147644043, "global_step": 49118, "epoch": 405} {"train_loss": -34.85869216918945, "global_step": 49119, "epoch": 405} {"train_loss": -33.6538200378418, "global_step": 49120, "epoch": 405} {"train_loss": -34.62502670288086, "global_step": 49121, "epoch": 405} {"train_loss": -33.73634719848633, "global_step": 49122, "epoch": 405} {"train_loss": -34.67841339111328, "global_step": 49123, "epoch": 405} {"train_loss": -35.816749572753906, "global_step": 49124, "epoch": 405} {"train_loss": -34.683033084081224, "global_step": 49125, "epoch": 405, "val_loss": 2643142.25} {"train_loss": -33.60991287231445, "global_step": 49126, "epoch": 406} {"train_loss": -33.91300582885742, "global_step": 49127, "epoch": 406} {"train_loss": -35.08955001831055, "global_step": 49128, "epoch": 406} {"train_loss": -32.733245849609375, "global_step": 49129, "epoch": 406} {"train_loss": -33.08013153076172, "global_step": 49130, "epoch": 406} {"train_loss": -33.25957489013672, "global_step": 49131, "epoch": 406} {"train_loss": -31.27947998046875, "global_step": 49132, "epoch": 406} {"train_loss": -33.577919006347656, "global_step": 49133, "epoch": 406} {"train_loss": -34.42523193359375, "global_step": 49134, "epoch": 406} {"train_loss": -34.38857650756836, "global_step": 49135, "epoch": 406} {"train_loss": -34.39834213256836, "global_step": 49136, "epoch": 406} {"train_loss": -34.8583869934082, "global_step": 49137, "epoch": 406} {"train_loss": -35.27016067504883, "global_step": 49138, "epoch": 406} {"train_loss": -35.07953643798828, "global_step": 49139, "epoch": 406} {"train_loss": -35.464813232421875, "global_step": 49140, "epoch": 406} {"train_loss": -34.93825149536133, "global_step": 49141, "epoch": 406} {"train_loss": -35.347469329833984, "global_step": 49142, "epoch": 406} {"train_loss": -35.254451751708984, "global_step": 49143, "epoch": 406} {"train_loss": -35.59975814819336, "global_step": 49144, "epoch": 406} {"train_loss": -35.42082595825195, "global_step": 49145, "epoch": 406} {"train_loss": -35.41594314575195, "global_step": 49146, "epoch": 406} {"train_loss": -35.647499084472656, "global_step": 49147, "epoch": 406} {"train_loss": -35.92792892456055, "global_step": 49148, "epoch": 406} {"train_loss": -35.352577209472656, "global_step": 49149, "epoch": 406} {"train_loss": -35.45166778564453, "global_step": 49150, "epoch": 406} {"train_loss": -36.10897445678711, "global_step": 49151, "epoch": 406} {"train_loss": -35.821781158447266, "global_step": 49152, "epoch": 406} {"train_loss": -35.44965744018555, "global_step": 49153, "epoch": 406} {"train_loss": -35.308631896972656, "global_step": 49154, "epoch": 406} {"train_loss": -35.842159271240234, "global_step": 49155, "epoch": 406} {"train_loss": -35.844696044921875, "global_step": 49156, "epoch": 406} {"train_loss": -36.27219772338867, "global_step": 49157, "epoch": 406} {"train_loss": -35.93016052246094, "global_step": 49158, "epoch": 406} {"train_loss": -35.586822509765625, "global_step": 49159, "epoch": 406} {"train_loss": -36.04694747924805, "global_step": 49160, "epoch": 406} {"train_loss": -35.7800407409668, "global_step": 49161, "epoch": 406} {"train_loss": -35.238887786865234, "global_step": 49162, "epoch": 406} {"train_loss": -36.094276428222656, "global_step": 49163, "epoch": 406} {"train_loss": -35.360504150390625, "global_step": 49164, "epoch": 406} {"train_loss": -35.132198333740234, "global_step": 49165, "epoch": 406} {"train_loss": -36.025794982910156, "global_step": 49166, "epoch": 406} {"train_loss": -36.310787200927734, "global_step": 49167, "epoch": 406} {"train_loss": -36.31199264526367, "global_step": 49168, "epoch": 406} {"train_loss": -34.851478576660156, "global_step": 49169, "epoch": 406} {"train_loss": -36.003440856933594, "global_step": 49170, "epoch": 406} {"train_loss": -36.12681198120117, "global_step": 49171, "epoch": 406} {"train_loss": -35.87061309814453, "global_step": 49172, "epoch": 406} {"train_loss": -35.704837799072266, "global_step": 49173, "epoch": 406} {"train_loss": -35.6411247253418, "global_step": 49174, "epoch": 406} {"train_loss": -35.58836364746094, "global_step": 49175, "epoch": 406} {"train_loss": -36.29291534423828, "global_step": 49176, "epoch": 406} {"train_loss": -34.76023483276367, "global_step": 49177, "epoch": 406} {"train_loss": -35.68740463256836, "global_step": 49178, "epoch": 406} {"train_loss": -33.56684112548828, "global_step": 49179, "epoch": 406} {"train_loss": -34.99433517456055, "global_step": 49180, "epoch": 406} {"train_loss": -34.47636795043945, "global_step": 49181, "epoch": 406} {"train_loss": -34.1870231628418, "global_step": 49182, "epoch": 406} {"train_loss": -34.22764587402344, "global_step": 49183, "epoch": 406} {"train_loss": -31.88947105407715, "global_step": 49184, "epoch": 406} {"train_loss": -29.545135498046875, "global_step": 49185, "epoch": 406} {"train_loss": -31.97405433654785, "global_step": 49186, "epoch": 406} {"train_loss": -32.91965866088867, "global_step": 49187, "epoch": 406} {"train_loss": -32.86021041870117, "global_step": 49188, "epoch": 406} {"train_loss": -30.761795043945312, "global_step": 49189, "epoch": 406} {"train_loss": -31.616666793823242, "global_step": 49190, "epoch": 406} {"train_loss": -33.135555267333984, "global_step": 49191, "epoch": 406} {"train_loss": -34.503456115722656, "global_step": 49192, "epoch": 406} {"train_loss": -31.75604248046875, "global_step": 49193, "epoch": 406} {"train_loss": -32.83024215698242, "global_step": 49194, "epoch": 406} {"train_loss": -32.74396896362305, "global_step": 49195, "epoch": 406} {"train_loss": -34.04840850830078, "global_step": 49196, "epoch": 406} {"train_loss": -33.96999740600586, "global_step": 49197, "epoch": 406} {"train_loss": -34.265506744384766, "global_step": 49198, "epoch": 406} {"train_loss": -33.7409553527832, "global_step": 49199, "epoch": 406} {"train_loss": -34.64702606201172, "global_step": 49200, "epoch": 406} {"train_loss": -35.45052719116211, "global_step": 49201, "epoch": 406} {"train_loss": -33.589229583740234, "global_step": 49202, "epoch": 406} {"train_loss": -34.673526763916016, "global_step": 49203, "epoch": 406} {"train_loss": -34.77423095703125, "global_step": 49204, "epoch": 406} {"train_loss": -34.84897232055664, "global_step": 49205, "epoch": 406} {"train_loss": -33.99943923950195, "global_step": 49206, "epoch": 406} {"train_loss": -34.2508430480957, "global_step": 49207, "epoch": 406} {"train_loss": -34.662818908691406, "global_step": 49208, "epoch": 406} {"train_loss": -34.33913803100586, "global_step": 49209, "epoch": 406} {"train_loss": -35.26061248779297, "global_step": 49210, "epoch": 406} {"train_loss": -34.56965255737305, "global_step": 49211, "epoch": 406} {"train_loss": -35.38234329223633, "global_step": 49212, "epoch": 406} {"train_loss": -35.121070861816406, "global_step": 49213, "epoch": 406} {"train_loss": -34.69477081298828, "global_step": 49214, "epoch": 406} {"train_loss": -35.13176727294922, "global_step": 49215, "epoch": 406} {"train_loss": -35.024349212646484, "global_step": 49216, "epoch": 406} {"train_loss": -34.82204818725586, "global_step": 49217, "epoch": 406} {"train_loss": -34.73476791381836, "global_step": 49218, "epoch": 406} {"train_loss": -35.3928108215332, "global_step": 49219, "epoch": 406} {"train_loss": -35.249874114990234, "global_step": 49220, "epoch": 406} {"train_loss": -35.26323318481445, "global_step": 49221, "epoch": 406} {"train_loss": -34.7852668762207, "global_step": 49222, "epoch": 406} {"train_loss": -35.4752082824707, "global_step": 49223, "epoch": 406} {"train_loss": -35.42430877685547, "global_step": 49224, "epoch": 406} {"train_loss": -35.142330169677734, "global_step": 49225, "epoch": 406} {"train_loss": -34.292816162109375, "global_step": 49226, "epoch": 406} {"train_loss": -35.001094818115234, "global_step": 49227, "epoch": 406} {"train_loss": -35.41567611694336, "global_step": 49228, "epoch": 406} {"train_loss": -35.56254196166992, "global_step": 49229, "epoch": 406} {"train_loss": -34.99934387207031, "global_step": 49230, "epoch": 406} {"train_loss": -35.736202239990234, "global_step": 49231, "epoch": 406} {"train_loss": -35.6081657409668, "global_step": 49232, "epoch": 406} {"train_loss": -35.13698959350586, "global_step": 49233, "epoch": 406} {"train_loss": -36.06482696533203, "global_step": 49234, "epoch": 406} {"train_loss": -35.3409309387207, "global_step": 49235, "epoch": 406} {"train_loss": -35.844783782958984, "global_step": 49236, "epoch": 406} {"train_loss": -35.773597717285156, "global_step": 49237, "epoch": 406} {"train_loss": -35.615272521972656, "global_step": 49238, "epoch": 406} {"train_loss": -35.94977569580078, "global_step": 49239, "epoch": 406} {"train_loss": -35.66193771362305, "global_step": 49240, "epoch": 406} {"train_loss": -35.35072326660156, "global_step": 49241, "epoch": 406} {"train_loss": -34.93821334838867, "global_step": 49242, "epoch": 406} {"train_loss": -36.164005279541016, "global_step": 49243, "epoch": 406} {"train_loss": -35.80231475830078, "global_step": 49244, "epoch": 406} {"train_loss": -35.9298210144043, "global_step": 49245, "epoch": 406} {"train_loss": -34.80916048475533, "global_step": 49246, "epoch": 406, "val_loss": 2594497.25} {"train_loss": -34.39631271362305, "global_step": 49247, "epoch": 407} {"train_loss": -35.34098434448242, "global_step": 49248, "epoch": 407} {"train_loss": -33.882930755615234, "global_step": 49249, "epoch": 407} {"train_loss": -36.13097381591797, "global_step": 49250, "epoch": 407} {"train_loss": -35.50344467163086, "global_step": 49251, "epoch": 407} {"train_loss": -34.526432037353516, "global_step": 49252, "epoch": 407} {"train_loss": -35.666236877441406, "global_step": 49253, "epoch": 407} {"train_loss": -35.92537307739258, "global_step": 49254, "epoch": 407} {"train_loss": -33.86908721923828, "global_step": 49255, "epoch": 407} {"train_loss": -34.22418212890625, "global_step": 49256, "epoch": 407} {"train_loss": -35.678062438964844, "global_step": 49257, "epoch": 407} {"train_loss": -35.87873840332031, "global_step": 49258, "epoch": 407} {"train_loss": -35.37395095825195, "global_step": 49259, "epoch": 407} {"train_loss": -35.87791061401367, "global_step": 49260, "epoch": 407} {"train_loss": -36.1811637878418, "global_step": 49261, "epoch": 407} {"train_loss": -34.99530792236328, "global_step": 49262, "epoch": 407} {"train_loss": -35.372352600097656, "global_step": 49263, "epoch": 407} {"train_loss": -36.09225082397461, "global_step": 49264, "epoch": 407} {"train_loss": -35.56541061401367, "global_step": 49265, "epoch": 407} {"train_loss": -34.07221221923828, "global_step": 49266, "epoch": 407} {"train_loss": -32.429229736328125, "global_step": 49267, "epoch": 407} {"train_loss": -32.00703048706055, "global_step": 49268, "epoch": 407} {"train_loss": -34.00333786010742, "global_step": 49269, "epoch": 407} {"train_loss": -34.31205749511719, "global_step": 49270, "epoch": 407} {"train_loss": -33.830421447753906, "global_step": 49271, "epoch": 407} {"train_loss": -34.82783508300781, "global_step": 49272, "epoch": 407} {"train_loss": -34.900386810302734, "global_step": 49273, "epoch": 407} {"train_loss": -33.986724853515625, "global_step": 49274, "epoch": 407} {"train_loss": -35.39681625366211, "global_step": 49275, "epoch": 407} {"train_loss": -34.69565963745117, "global_step": 49276, "epoch": 407} {"train_loss": -34.904876708984375, "global_step": 49277, "epoch": 407} {"train_loss": -34.9661979675293, "global_step": 49278, "epoch": 407} {"train_loss": -35.045963287353516, "global_step": 49279, "epoch": 407} {"train_loss": -34.74363327026367, "global_step": 49280, "epoch": 407} {"train_loss": -35.05965805053711, "global_step": 49281, "epoch": 407} {"train_loss": -35.732208251953125, "global_step": 49282, "epoch": 407} {"train_loss": -35.4055061340332, "global_step": 49283, "epoch": 407} {"train_loss": -34.92649459838867, "global_step": 49284, "epoch": 407} {"train_loss": -35.33376693725586, "global_step": 49285, "epoch": 407} {"train_loss": -35.7907829284668, "global_step": 49286, "epoch": 407} {"train_loss": -35.92288589477539, "global_step": 49287, "epoch": 407} {"train_loss": -35.436004638671875, "global_step": 49288, "epoch": 407} {"train_loss": -34.9804573059082, "global_step": 49289, "epoch": 407} {"train_loss": -35.772151947021484, "global_step": 49290, "epoch": 407} {"train_loss": -35.622352600097656, "global_step": 49291, "epoch": 407} {"train_loss": -35.65095138549805, "global_step": 49292, "epoch": 407} {"train_loss": -35.9517936706543, "global_step": 49293, "epoch": 407} {"train_loss": -34.91141891479492, "global_step": 49294, "epoch": 407} {"train_loss": -35.29830551147461, "global_step": 49295, "epoch": 407} {"train_loss": -35.330928802490234, "global_step": 49296, "epoch": 407} {"train_loss": -36.24054718017578, "global_step": 49297, "epoch": 407} {"train_loss": -35.08637237548828, "global_step": 49298, "epoch": 407} {"train_loss": -35.67344284057617, "global_step": 49299, "epoch": 407} {"train_loss": -35.92866897583008, "global_step": 49300, "epoch": 407} {"train_loss": -35.31797790527344, "global_step": 49301, "epoch": 407} {"train_loss": -35.46648406982422, "global_step": 49302, "epoch": 407} {"train_loss": -34.61653137207031, "global_step": 49303, "epoch": 407} {"train_loss": -35.81338119506836, "global_step": 49304, "epoch": 407} {"train_loss": -34.02841567993164, "global_step": 49305, "epoch": 407} {"train_loss": -34.948909759521484, "global_step": 49306, "epoch": 407} {"train_loss": -35.57322311401367, "global_step": 49307, "epoch": 407} {"train_loss": -34.25643539428711, "global_step": 49308, "epoch": 407} {"train_loss": -32.61806106567383, "global_step": 49309, "epoch": 407} {"train_loss": -33.48114776611328, "global_step": 49310, "epoch": 407} {"train_loss": -33.46092987060547, "global_step": 49311, "epoch": 407} {"train_loss": -33.29471206665039, "global_step": 49312, "epoch": 407} {"train_loss": -32.8224983215332, "global_step": 49313, "epoch": 407} {"train_loss": -33.63360595703125, "global_step": 49314, "epoch": 407} {"train_loss": -33.105384826660156, "global_step": 49315, "epoch": 407} {"train_loss": -33.16572189331055, "global_step": 49316, "epoch": 407} {"train_loss": -33.542335510253906, "global_step": 49317, "epoch": 407} {"train_loss": -34.41876220703125, "global_step": 49318, "epoch": 407} {"train_loss": -33.65261459350586, "global_step": 49319, "epoch": 407} {"train_loss": -34.3459358215332, "global_step": 49320, "epoch": 407} {"train_loss": -35.08163070678711, "global_step": 49321, "epoch": 407} {"train_loss": -34.93584442138672, "global_step": 49322, "epoch": 407} {"train_loss": -33.93819808959961, "global_step": 49323, "epoch": 407} {"train_loss": -34.69513702392578, "global_step": 49324, "epoch": 407} {"train_loss": -34.19422149658203, "global_step": 49325, "epoch": 407} {"train_loss": -34.880645751953125, "global_step": 49326, "epoch": 407} {"train_loss": -34.70600891113281, "global_step": 49327, "epoch": 407} {"train_loss": -35.15768051147461, "global_step": 49328, "epoch": 407} {"train_loss": -34.85357666015625, "global_step": 49329, "epoch": 407} {"train_loss": -34.41086196899414, "global_step": 49330, "epoch": 407} {"train_loss": -34.842140197753906, "global_step": 49331, "epoch": 407} {"train_loss": -34.697959899902344, "global_step": 49332, "epoch": 407} {"train_loss": -34.39701461791992, "global_step": 49333, "epoch": 407} {"train_loss": -35.18817138671875, "global_step": 49334, "epoch": 407} {"train_loss": -35.503395080566406, "global_step": 49335, "epoch": 407} {"train_loss": -34.49549102783203, "global_step": 49336, "epoch": 407} {"train_loss": -34.26947021484375, "global_step": 49337, "epoch": 407} {"train_loss": -34.96870040893555, "global_step": 49338, "epoch": 407} {"train_loss": -35.29985427856445, "global_step": 49339, "epoch": 407} {"train_loss": -32.80631637573242, "global_step": 49340, "epoch": 407} {"train_loss": -34.84446334838867, "global_step": 49341, "epoch": 407} {"train_loss": -35.09468460083008, "global_step": 49342, "epoch": 407} {"train_loss": -35.36845397949219, "global_step": 49343, "epoch": 407} {"train_loss": -33.77741622924805, "global_step": 49344, "epoch": 407} {"train_loss": -34.275325775146484, "global_step": 49345, "epoch": 407} {"train_loss": -34.347625732421875, "global_step": 49346, "epoch": 407} {"train_loss": -28.947717666625977, "global_step": 49347, "epoch": 407} {"train_loss": -33.744564056396484, "global_step": 49348, "epoch": 407} {"train_loss": -33.30153274536133, "global_step": 49349, "epoch": 407} {"train_loss": -34.13648986816406, "global_step": 49350, "epoch": 407} {"train_loss": -33.715919494628906, "global_step": 49351, "epoch": 407} {"train_loss": -32.78054428100586, "global_step": 49352, "epoch": 407} {"train_loss": -32.4864387512207, "global_step": 49353, "epoch": 407} {"train_loss": -34.64240646362305, "global_step": 49354, "epoch": 407} {"train_loss": -34.62258529663086, "global_step": 49355, "epoch": 407} {"train_loss": -33.720947265625, "global_step": 49356, "epoch": 407} {"train_loss": -32.34672927856445, "global_step": 49357, "epoch": 407} {"train_loss": -34.74018478393555, "global_step": 49358, "epoch": 407} {"train_loss": -34.81348419189453, "global_step": 49359, "epoch": 407} {"train_loss": -33.01517868041992, "global_step": 49360, "epoch": 407} {"train_loss": -33.973567962646484, "global_step": 49361, "epoch": 407} {"train_loss": -35.10403823852539, "global_step": 49362, "epoch": 407} {"train_loss": -34.627925872802734, "global_step": 49363, "epoch": 407} {"train_loss": -35.3330078125, "global_step": 49364, "epoch": 407} {"train_loss": -34.69259262084961, "global_step": 49365, "epoch": 407} {"train_loss": -35.223228454589844, "global_step": 49366, "epoch": 407} {"train_loss": -34.61640654319574, "global_step": 49367, "epoch": 407, "val_loss": 2637638.0} {"train_loss": -35.00288009643555, "global_step": 49368, "epoch": 408} {"train_loss": -35.09894561767578, "global_step": 49369, "epoch": 408} {"train_loss": -35.290130615234375, "global_step": 49370, "epoch": 408} {"train_loss": -35.081661224365234, "global_step": 49371, "epoch": 408} {"train_loss": -34.87630081176758, "global_step": 49372, "epoch": 408} {"train_loss": -34.953128814697266, "global_step": 49373, "epoch": 408} {"train_loss": -35.459354400634766, "global_step": 49374, "epoch": 408} {"train_loss": -35.09690475463867, "global_step": 49375, "epoch": 408} {"train_loss": -35.30567932128906, "global_step": 49376, "epoch": 408} {"train_loss": -34.52595520019531, "global_step": 49377, "epoch": 408} {"train_loss": -32.81462478637695, "global_step": 49378, "epoch": 408} {"train_loss": -27.090702056884766, "global_step": 49379, "epoch": 408} {"train_loss": -15.079745292663574, "global_step": 49380, "epoch": 408} {"train_loss": -7.951014995574951, "global_step": 49381, "epoch": 408} {"train_loss": -28.767980575561523, "global_step": 49382, "epoch": 408} {"train_loss": -28.910200119018555, "global_step": 49383, "epoch": 408} {"train_loss": -30.01844596862793, "global_step": 49384, "epoch": 408} {"train_loss": -32.0452766418457, "global_step": 49385, "epoch": 408} {"train_loss": -34.19913864135742, "global_step": 49386, "epoch": 408} {"train_loss": -32.37038040161133, "global_step": 49387, "epoch": 408} {"train_loss": -35.08695602416992, "global_step": 49388, "epoch": 408} {"train_loss": -33.930049896240234, "global_step": 49389, "epoch": 408} {"train_loss": -33.26765441894531, "global_step": 49390, "epoch": 408} {"train_loss": -34.86811447143555, "global_step": 49391, "epoch": 408} {"train_loss": -34.49174118041992, "global_step": 49392, "epoch": 408} {"train_loss": -33.97243881225586, "global_step": 49393, "epoch": 408} {"train_loss": -34.77448654174805, "global_step": 49394, "epoch": 408} {"train_loss": -35.01008987426758, "global_step": 49395, "epoch": 408} {"train_loss": -34.59699249267578, "global_step": 49396, "epoch": 408} {"train_loss": -34.645198822021484, "global_step": 49397, "epoch": 408} {"train_loss": -35.13911056518555, "global_step": 49398, "epoch": 408} {"train_loss": -35.307106018066406, "global_step": 49399, "epoch": 408} {"train_loss": -35.1661491394043, "global_step": 49400, "epoch": 408} {"train_loss": -34.987701416015625, "global_step": 49401, "epoch": 408} {"train_loss": -35.3975944519043, "global_step": 49402, "epoch": 408} {"train_loss": -35.00333786010742, "global_step": 49403, "epoch": 408} {"train_loss": -35.44050216674805, "global_step": 49404, "epoch": 408} {"train_loss": -35.33376693725586, "global_step": 49405, "epoch": 408} {"train_loss": -35.62701416015625, "global_step": 49406, "epoch": 408} {"train_loss": -35.710784912109375, "global_step": 49407, "epoch": 408} {"train_loss": -35.862823486328125, "global_step": 49408, "epoch": 408} {"train_loss": -35.32915115356445, "global_step": 49409, "epoch": 408} {"train_loss": -35.19680404663086, "global_step": 49410, "epoch": 408} {"train_loss": -35.83126449584961, "global_step": 49411, "epoch": 408} {"train_loss": -35.83761215209961, "global_step": 49412, "epoch": 408} {"train_loss": -35.7493896484375, "global_step": 49413, "epoch": 408} {"train_loss": -35.35708236694336, "global_step": 49414, "epoch": 408} {"train_loss": -35.67850875854492, "global_step": 49415, "epoch": 408} {"train_loss": -35.91436004638672, "global_step": 49416, "epoch": 408} {"train_loss": -35.806251525878906, "global_step": 49417, "epoch": 408} {"train_loss": -35.705810546875, "global_step": 49418, "epoch": 408} {"train_loss": -35.15554428100586, "global_step": 49419, "epoch": 408} {"train_loss": -36.04647445678711, "global_step": 49420, "epoch": 408} {"train_loss": -35.735687255859375, "global_step": 49421, "epoch": 408} {"train_loss": -35.07342529296875, "global_step": 49422, "epoch": 408} {"train_loss": -35.128231048583984, "global_step": 49423, "epoch": 408} {"train_loss": -34.42318344116211, "global_step": 49424, "epoch": 408} {"train_loss": -35.313758850097656, "global_step": 49425, "epoch": 408} {"train_loss": -35.322235107421875, "global_step": 49426, "epoch": 408} {"train_loss": -35.155635833740234, "global_step": 49427, "epoch": 408} {"train_loss": -34.37260818481445, "global_step": 49428, "epoch": 408} {"train_loss": -35.10114288330078, "global_step": 49429, "epoch": 408} {"train_loss": -35.237117767333984, "global_step": 49430, "epoch": 408} {"train_loss": -35.43634033203125, "global_step": 49431, "epoch": 408} {"train_loss": -34.09379196166992, "global_step": 49432, "epoch": 408} {"train_loss": -34.30946731567383, "global_step": 49433, "epoch": 408} {"train_loss": -31.985807418823242, "global_step": 49434, "epoch": 408} {"train_loss": -30.955453872680664, "global_step": 49435, "epoch": 408} {"train_loss": -29.770679473876953, "global_step": 49436, "epoch": 408} {"train_loss": -25.9901123046875, "global_step": 49437, "epoch": 408} {"train_loss": -25.21515464782715, "global_step": 49438, "epoch": 408} {"train_loss": -33.62227249145508, "global_step": 49439, "epoch": 408} {"train_loss": -33.67726135253906, "global_step": 49440, "epoch": 408} {"train_loss": -31.61594581604004, "global_step": 49441, "epoch": 408} {"train_loss": -34.699031829833984, "global_step": 49442, "epoch": 408} {"train_loss": -33.177467346191406, "global_step": 49443, "epoch": 408} {"train_loss": -34.555843353271484, "global_step": 49444, "epoch": 408} {"train_loss": -33.60501480102539, "global_step": 49445, "epoch": 408} {"train_loss": -34.20264434814453, "global_step": 49446, "epoch": 408} {"train_loss": -34.14071273803711, "global_step": 49447, "epoch": 408} {"train_loss": -34.44269943237305, "global_step": 49448, "epoch": 408} {"train_loss": -33.332088470458984, "global_step": 49449, "epoch": 408} {"train_loss": -34.76295852661133, "global_step": 49450, "epoch": 408} {"train_loss": -34.01897048950195, "global_step": 49451, "epoch": 408} {"train_loss": -34.788917541503906, "global_step": 49452, "epoch": 408} {"train_loss": -35.033695220947266, "global_step": 49453, "epoch": 408} {"train_loss": -34.96384811401367, "global_step": 49454, "epoch": 408} {"train_loss": -35.262691497802734, "global_step": 49455, "epoch": 408} {"train_loss": -34.846065521240234, "global_step": 49456, "epoch": 408} {"train_loss": -35.30452346801758, "global_step": 49457, "epoch": 408} {"train_loss": -34.23629379272461, "global_step": 49458, "epoch": 408} {"train_loss": -35.06654739379883, "global_step": 49459, "epoch": 408} {"train_loss": -35.34273910522461, "global_step": 49460, "epoch": 408} {"train_loss": -35.26215744018555, "global_step": 49461, "epoch": 408} {"train_loss": -35.45345687866211, "global_step": 49462, "epoch": 408} {"train_loss": -35.20423126220703, "global_step": 49463, "epoch": 408} {"train_loss": -35.75074005126953, "global_step": 49464, "epoch": 408} {"train_loss": -35.1803092956543, "global_step": 49465, "epoch": 408} {"train_loss": -35.65438461303711, "global_step": 49466, "epoch": 408} {"train_loss": -35.14585876464844, "global_step": 49467, "epoch": 408} {"train_loss": -35.4349365234375, "global_step": 49468, "epoch": 408} {"train_loss": -35.181800842285156, "global_step": 49469, "epoch": 408} {"train_loss": -34.878963470458984, "global_step": 49470, "epoch": 408} {"train_loss": -34.53742599487305, "global_step": 49471, "epoch": 408} {"train_loss": -34.78080368041992, "global_step": 49472, "epoch": 408} {"train_loss": -34.81367874145508, "global_step": 49473, "epoch": 408} {"train_loss": -35.30515670776367, "global_step": 49474, "epoch": 408} {"train_loss": -35.27890396118164, "global_step": 49475, "epoch": 408} {"train_loss": -35.30328369140625, "global_step": 49476, "epoch": 408} {"train_loss": -34.9557991027832, "global_step": 49477, "epoch": 408} {"train_loss": -34.99979782104492, "global_step": 49478, "epoch": 408} {"train_loss": -35.49711608886719, "global_step": 49479, "epoch": 408} {"train_loss": -34.835243225097656, "global_step": 49480, "epoch": 408} {"train_loss": -35.28634262084961, "global_step": 49481, "epoch": 408} {"train_loss": -34.96177291870117, "global_step": 49482, "epoch": 408} {"train_loss": -33.304786682128906, "global_step": 49483, "epoch": 408} {"train_loss": -28.358020782470703, "global_step": 49484, "epoch": 408} {"train_loss": -18.258710861206055, "global_step": 49485, "epoch": 408} {"train_loss": -22.1414852142334, "global_step": 49486, "epoch": 408} {"train_loss": -32.52666473388672, "global_step": 49487, "epoch": 408} {"train_loss": -33.67372623553946, "global_step": 49488, "epoch": 408, "val_loss": 2685584.25} {"train_loss": -30.324844360351562, "global_step": 49489, "epoch": 409} {"train_loss": -34.94765853881836, "global_step": 49490, "epoch": 409} {"train_loss": -33.99443054199219, "global_step": 49491, "epoch": 409} {"train_loss": -33.73918914794922, "global_step": 49492, "epoch": 409} {"train_loss": -34.5933837890625, "global_step": 49493, "epoch": 409} {"train_loss": -33.3344841003418, "global_step": 49494, "epoch": 409} {"train_loss": -33.94594192504883, "global_step": 49495, "epoch": 409} {"train_loss": -34.64359664916992, "global_step": 49496, "epoch": 409} {"train_loss": -33.95340347290039, "global_step": 49497, "epoch": 409} {"train_loss": -34.948768615722656, "global_step": 49498, "epoch": 409} {"train_loss": -34.839332580566406, "global_step": 49499, "epoch": 409} {"train_loss": -34.769203186035156, "global_step": 49500, "epoch": 409} {"train_loss": -34.08876419067383, "global_step": 49501, "epoch": 409} {"train_loss": -34.910247802734375, "global_step": 49502, "epoch": 409} {"train_loss": -34.92441177368164, "global_step": 49503, "epoch": 409} {"train_loss": -34.6900520324707, "global_step": 49504, "epoch": 409} {"train_loss": -34.66965866088867, "global_step": 49505, "epoch": 409} {"train_loss": -34.516353607177734, "global_step": 49506, "epoch": 409} {"train_loss": -34.61146926879883, "global_step": 49507, "epoch": 409} {"train_loss": -34.79085922241211, "global_step": 49508, "epoch": 409} {"train_loss": -34.90635299682617, "global_step": 49509, "epoch": 409} {"train_loss": -35.27070236206055, "global_step": 49510, "epoch": 409} {"train_loss": -35.20830154418945, "global_step": 49511, "epoch": 409} {"train_loss": -35.45596694946289, "global_step": 49512, "epoch": 409} {"train_loss": -35.14461135864258, "global_step": 49513, "epoch": 409} {"train_loss": -35.06245803833008, "global_step": 49514, "epoch": 409} {"train_loss": -35.168243408203125, "global_step": 49515, "epoch": 409} {"train_loss": -35.0547981262207, "global_step": 49516, "epoch": 409} {"train_loss": -35.31825637817383, "global_step": 49517, "epoch": 409} {"train_loss": -35.47114944458008, "global_step": 49518, "epoch": 409} {"train_loss": -34.870025634765625, "global_step": 49519, "epoch": 409} {"train_loss": -35.19334030151367, "global_step": 49520, "epoch": 409} {"train_loss": -35.24605178833008, "global_step": 49521, "epoch": 409} {"train_loss": -35.17641830444336, "global_step": 49522, "epoch": 409} {"train_loss": -35.2172737121582, "global_step": 49523, "epoch": 409} {"train_loss": -35.31398010253906, "global_step": 49524, "epoch": 409} {"train_loss": -35.278411865234375, "global_step": 49525, "epoch": 409} {"train_loss": -35.356536865234375, "global_step": 49526, "epoch": 409} {"train_loss": -34.22982406616211, "global_step": 49527, "epoch": 409} {"train_loss": -34.159698486328125, "global_step": 49528, "epoch": 409} {"train_loss": -33.49334716796875, "global_step": 49529, "epoch": 409} {"train_loss": -28.9682559967041, "global_step": 49530, "epoch": 409} {"train_loss": -21.26689910888672, "global_step": 49531, "epoch": 409} {"train_loss": -18.628873825073242, "global_step": 49532, "epoch": 409} {"train_loss": -33.799068450927734, "global_step": 49533, "epoch": 409} {"train_loss": -27.946399688720703, "global_step": 49534, "epoch": 409} {"train_loss": -34.858394622802734, "global_step": 49535, "epoch": 409} {"train_loss": -29.598834991455078, "global_step": 49536, "epoch": 409} {"train_loss": -33.20675277709961, "global_step": 49537, "epoch": 409} {"train_loss": -33.40748977661133, "global_step": 49538, "epoch": 409} {"train_loss": -34.14130401611328, "global_step": 49539, "epoch": 409} {"train_loss": -33.642005920410156, "global_step": 49540, "epoch": 409} {"train_loss": -34.78174591064453, "global_step": 49541, "epoch": 409} {"train_loss": -34.0719108581543, "global_step": 49542, "epoch": 409} {"train_loss": -34.39906692504883, "global_step": 49543, "epoch": 409} {"train_loss": -34.55378341674805, "global_step": 49544, "epoch": 409} {"train_loss": -35.21049118041992, "global_step": 49545, "epoch": 409} {"train_loss": -34.42965316772461, "global_step": 49546, "epoch": 409} {"train_loss": -34.52219772338867, "global_step": 49547, "epoch": 409} {"train_loss": -34.57150650024414, "global_step": 49548, "epoch": 409} {"train_loss": -35.22207260131836, "global_step": 49549, "epoch": 409} {"train_loss": -34.7228889465332, "global_step": 49550, "epoch": 409} {"train_loss": -34.56892013549805, "global_step": 49551, "epoch": 409} {"train_loss": -35.34984588623047, "global_step": 49552, "epoch": 409} {"train_loss": -35.33137893676758, "global_step": 49553, "epoch": 409} {"train_loss": -35.017147064208984, "global_step": 49554, "epoch": 409} {"train_loss": -35.068973541259766, "global_step": 49555, "epoch": 409} {"train_loss": -35.1216926574707, "global_step": 49556, "epoch": 409} {"train_loss": -35.40576171875, "global_step": 49557, "epoch": 409} {"train_loss": -35.166786193847656, "global_step": 49558, "epoch": 409} {"train_loss": -35.09394836425781, "global_step": 49559, "epoch": 409} {"train_loss": -35.266780853271484, "global_step": 49560, "epoch": 409} {"train_loss": -35.0523567199707, "global_step": 49561, "epoch": 409} {"train_loss": -35.39094924926758, "global_step": 49562, "epoch": 409} {"train_loss": -34.6272087097168, "global_step": 49563, "epoch": 409} {"train_loss": -33.599945068359375, "global_step": 49564, "epoch": 409} {"train_loss": -35.14341354370117, "global_step": 49565, "epoch": 409} {"train_loss": -34.876739501953125, "global_step": 49566, "epoch": 409} {"train_loss": -34.871482849121094, "global_step": 49567, "epoch": 409} {"train_loss": -34.80816650390625, "global_step": 49568, "epoch": 409} {"train_loss": -34.2659912109375, "global_step": 49569, "epoch": 409} {"train_loss": -34.676918029785156, "global_step": 49570, "epoch": 409} {"train_loss": -34.55369186401367, "global_step": 49571, "epoch": 409} {"train_loss": -35.3141975402832, "global_step": 49572, "epoch": 409} {"train_loss": -34.62580490112305, "global_step": 49573, "epoch": 409} {"train_loss": -35.403255462646484, "global_step": 49574, "epoch": 409} {"train_loss": -33.9903564453125, "global_step": 49575, "epoch": 409} {"train_loss": -34.63991928100586, "global_step": 49576, "epoch": 409} {"train_loss": -34.977447509765625, "global_step": 49577, "epoch": 409} {"train_loss": -35.070125579833984, "global_step": 49578, "epoch": 409} {"train_loss": -34.97625732421875, "global_step": 49579, "epoch": 409} {"train_loss": -35.13436508178711, "global_step": 49580, "epoch": 409} {"train_loss": -33.810264587402344, "global_step": 49581, "epoch": 409} {"train_loss": -34.93153762817383, "global_step": 49582, "epoch": 409} {"train_loss": -34.68180465698242, "global_step": 49583, "epoch": 409} {"train_loss": -35.54320526123047, "global_step": 49584, "epoch": 409} {"train_loss": -34.9337158203125, "global_step": 49585, "epoch": 409} {"train_loss": -34.973079681396484, "global_step": 49586, "epoch": 409} {"train_loss": -35.13727951049805, "global_step": 49587, "epoch": 409} {"train_loss": -35.13045883178711, "global_step": 49588, "epoch": 409} {"train_loss": -35.56801223754883, "global_step": 49589, "epoch": 409} {"train_loss": -35.32366943359375, "global_step": 49590, "epoch": 409} {"train_loss": -35.60503005981445, "global_step": 49591, "epoch": 409} {"train_loss": -35.65677261352539, "global_step": 49592, "epoch": 409} {"train_loss": -35.42045211791992, "global_step": 49593, "epoch": 409} {"train_loss": -35.969764709472656, "global_step": 49594, "epoch": 409} {"train_loss": -35.267333984375, "global_step": 49595, "epoch": 409} {"train_loss": -36.05070877075195, "global_step": 49596, "epoch": 409} {"train_loss": -35.619102478027344, "global_step": 49597, "epoch": 409} {"train_loss": -35.32009506225586, "global_step": 49598, "epoch": 409} {"train_loss": -35.62742614746094, "global_step": 49599, "epoch": 409} {"train_loss": -35.231361389160156, "global_step": 49600, "epoch": 409} {"train_loss": -34.80821990966797, "global_step": 49601, "epoch": 409} {"train_loss": -33.384883880615234, "global_step": 49602, "epoch": 409} {"train_loss": -28.991422653198242, "global_step": 49603, "epoch": 409} {"train_loss": -25.560413360595703, "global_step": 49604, "epoch": 409} {"train_loss": -30.7728271484375, "global_step": 49605, "epoch": 409} {"train_loss": -35.399349212646484, "global_step": 49606, "epoch": 409} {"train_loss": -32.329002380371094, "global_step": 49607, "epoch": 409} {"train_loss": -32.804725646972656, "global_step": 49608, "epoch": 409} {"train_loss": -34.21163314630177, "global_step": 49609, "epoch": 409, "val_loss": 2604171.75} {"train_loss": -33.49894332885742, "global_step": 49610, "epoch": 410} {"train_loss": -35.17267990112305, "global_step": 49611, "epoch": 410} {"train_loss": -35.09385681152344, "global_step": 49612, "epoch": 410} {"train_loss": -34.53615188598633, "global_step": 49613, "epoch": 410} {"train_loss": -35.308135986328125, "global_step": 49614, "epoch": 410} {"train_loss": -34.71718978881836, "global_step": 49615, "epoch": 410} {"train_loss": -35.44458770751953, "global_step": 49616, "epoch": 410} {"train_loss": -34.96268081665039, "global_step": 49617, "epoch": 410} {"train_loss": -34.63735580444336, "global_step": 49618, "epoch": 410} {"train_loss": -35.772743225097656, "global_step": 49619, "epoch": 410} {"train_loss": -34.86227035522461, "global_step": 49620, "epoch": 410} {"train_loss": -35.57002639770508, "global_step": 49621, "epoch": 410} {"train_loss": -34.67737579345703, "global_step": 49622, "epoch": 410} {"train_loss": -35.991878509521484, "global_step": 49623, "epoch": 410} {"train_loss": -35.28831100463867, "global_step": 49624, "epoch": 410} {"train_loss": -34.91213607788086, "global_step": 49625, "epoch": 410} {"train_loss": -35.18465805053711, "global_step": 49626, "epoch": 410} {"train_loss": -35.12860870361328, "global_step": 49627, "epoch": 410} {"train_loss": -35.65121078491211, "global_step": 49628, "epoch": 410} {"train_loss": -35.45256042480469, "global_step": 49629, "epoch": 410} {"train_loss": -35.4871940612793, "global_step": 49630, "epoch": 410} {"train_loss": -35.073219299316406, "global_step": 49631, "epoch": 410} {"train_loss": -35.79880905151367, "global_step": 49632, "epoch": 410} {"train_loss": -35.43170166015625, "global_step": 49633, "epoch": 410} {"train_loss": -35.59089279174805, "global_step": 49634, "epoch": 410} {"train_loss": -36.31528854370117, "global_step": 49635, "epoch": 410} {"train_loss": -34.8289794921875, "global_step": 49636, "epoch": 410} {"train_loss": -35.771400451660156, "global_step": 49637, "epoch": 410} {"train_loss": -35.86682891845703, "global_step": 49638, "epoch": 410} {"train_loss": -36.181819915771484, "global_step": 49639, "epoch": 410} {"train_loss": -35.979122161865234, "global_step": 49640, "epoch": 410} {"train_loss": -35.34524154663086, "global_step": 49641, "epoch": 410} {"train_loss": -35.634464263916016, "global_step": 49642, "epoch": 410} {"train_loss": -34.801456451416016, "global_step": 49643, "epoch": 410} {"train_loss": -35.103389739990234, "global_step": 49644, "epoch": 410} {"train_loss": -34.53876876831055, "global_step": 49645, "epoch": 410} {"train_loss": -33.03556442260742, "global_step": 49646, "epoch": 410} {"train_loss": -34.33877182006836, "global_step": 49647, "epoch": 410} {"train_loss": -34.94599533081055, "global_step": 49648, "epoch": 410} {"train_loss": -33.869625091552734, "global_step": 49649, "epoch": 410} {"train_loss": -33.647769927978516, "global_step": 49650, "epoch": 410} {"train_loss": -35.450252532958984, "global_step": 49651, "epoch": 410} {"train_loss": -33.82960510253906, "global_step": 49652, "epoch": 410} {"train_loss": -35.1279411315918, "global_step": 49653, "epoch": 410} {"train_loss": -33.3420295715332, "global_step": 49654, "epoch": 410} {"train_loss": -35.503211975097656, "global_step": 49655, "epoch": 410} {"train_loss": -34.68452072143555, "global_step": 49656, "epoch": 410} {"train_loss": -34.499446868896484, "global_step": 49657, "epoch": 410} {"train_loss": -34.132652282714844, "global_step": 49658, "epoch": 410} {"train_loss": -35.36939239501953, "global_step": 49659, "epoch": 410} {"train_loss": -34.844268798828125, "global_step": 49660, "epoch": 410} {"train_loss": -34.99612045288086, "global_step": 49661, "epoch": 410} {"train_loss": -34.66921615600586, "global_step": 49662, "epoch": 410} {"train_loss": -34.999366760253906, "global_step": 49663, "epoch": 410} {"train_loss": -35.10818099975586, "global_step": 49664, "epoch": 410} {"train_loss": -35.14279556274414, "global_step": 49665, "epoch": 410} {"train_loss": -35.265743255615234, "global_step": 49666, "epoch": 410} {"train_loss": -35.1288948059082, "global_step": 49667, "epoch": 410} {"train_loss": -34.9631462097168, "global_step": 49668, "epoch": 410} {"train_loss": -35.38444137573242, "global_step": 49669, "epoch": 410} {"train_loss": -35.722084045410156, "global_step": 49670, "epoch": 410} {"train_loss": -35.440338134765625, "global_step": 49671, "epoch": 410} {"train_loss": -35.17390823364258, "global_step": 49672, "epoch": 410} {"train_loss": -35.99026870727539, "global_step": 49673, "epoch": 410} {"train_loss": -35.729164123535156, "global_step": 49674, "epoch": 410} {"train_loss": -35.212982177734375, "global_step": 49675, "epoch": 410} {"train_loss": -35.733089447021484, "global_step": 49676, "epoch": 410} {"train_loss": -35.376766204833984, "global_step": 49677, "epoch": 410} {"train_loss": -35.42625045776367, "global_step": 49678, "epoch": 410} {"train_loss": -35.2287483215332, "global_step": 49679, "epoch": 410} {"train_loss": -35.70545196533203, "global_step": 49680, "epoch": 410} {"train_loss": -36.017330169677734, "global_step": 49681, "epoch": 410} {"train_loss": -35.34687042236328, "global_step": 49682, "epoch": 410} {"train_loss": -35.81463623046875, "global_step": 49683, "epoch": 410} {"train_loss": -36.25693893432617, "global_step": 49684, "epoch": 410} {"train_loss": -35.32528305053711, "global_step": 49685, "epoch": 410} {"train_loss": -36.107845306396484, "global_step": 49686, "epoch": 410} {"train_loss": -34.85053253173828, "global_step": 49687, "epoch": 410} {"train_loss": -35.946327209472656, "global_step": 49688, "epoch": 410} {"train_loss": -35.56840133666992, "global_step": 49689, "epoch": 410} {"train_loss": -33.63932418823242, "global_step": 49690, "epoch": 410} {"train_loss": -35.25383377075195, "global_step": 49691, "epoch": 410} {"train_loss": -35.6096076965332, "global_step": 49692, "epoch": 410} {"train_loss": -32.2542610168457, "global_step": 49693, "epoch": 410} {"train_loss": -34.93648910522461, "global_step": 49694, "epoch": 410} {"train_loss": -33.90884780883789, "global_step": 49695, "epoch": 410} {"train_loss": -34.73579788208008, "global_step": 49696, "epoch": 410} {"train_loss": -33.56269454956055, "global_step": 49697, "epoch": 410} {"train_loss": -33.05953598022461, "global_step": 49698, "epoch": 410} {"train_loss": -34.03157043457031, "global_step": 49699, "epoch": 410} {"train_loss": -34.462398529052734, "global_step": 49700, "epoch": 410} {"train_loss": -32.303653717041016, "global_step": 49701, "epoch": 410} {"train_loss": -32.74420166015625, "global_step": 49702, "epoch": 410} {"train_loss": -31.58997917175293, "global_step": 49703, "epoch": 410} {"train_loss": -33.46528625488281, "global_step": 49704, "epoch": 410} {"train_loss": -29.97861671447754, "global_step": 49705, "epoch": 410} {"train_loss": -27.24542808532715, "global_step": 49706, "epoch": 410} {"train_loss": -32.86759948730469, "global_step": 49707, "epoch": 410} {"train_loss": -32.834651947021484, "global_step": 49708, "epoch": 410} {"train_loss": -30.207197189331055, "global_step": 49709, "epoch": 410} {"train_loss": -29.6452579498291, "global_step": 49710, "epoch": 410} {"train_loss": -32.745208740234375, "global_step": 49711, "epoch": 410} {"train_loss": -33.198360443115234, "global_step": 49712, "epoch": 410} {"train_loss": -32.87706756591797, "global_step": 49713, "epoch": 410} {"train_loss": -30.430341720581055, "global_step": 49714, "epoch": 410} {"train_loss": -19.7249813079834, "global_step": 49715, "epoch": 410} {"train_loss": -29.10702896118164, "global_step": 49716, "epoch": 410} {"train_loss": -31.041522979736328, "global_step": 49717, "epoch": 410} {"train_loss": -13.643203735351562, "global_step": 49718, "epoch": 410} {"train_loss": -28.5081729888916, "global_step": 49719, "epoch": 410} {"train_loss": -24.548749923706055, "global_step": 49720, "epoch": 410} {"train_loss": -28.21930503845215, "global_step": 49721, "epoch": 410} {"train_loss": -28.687047958374023, "global_step": 49722, "epoch": 410} {"train_loss": -27.45489501953125, "global_step": 49723, "epoch": 410} {"train_loss": -31.7626895904541, "global_step": 49724, "epoch": 410} {"train_loss": -28.105295181274414, "global_step": 49725, "epoch": 410} {"train_loss": -29.170398712158203, "global_step": 49726, "epoch": 410} {"train_loss": -29.083255767822266, "global_step": 49727, "epoch": 410} {"train_loss": -30.528898239135742, "global_step": 49728, "epoch": 410} {"train_loss": -28.77387046813965, "global_step": 49729, "epoch": 410} {"train_loss": -33.61806043514535, "global_step": 49730, "epoch": 410, "val_loss": 2599635.25} {"train_loss": -29.520444869995117, "global_step": 49731, "epoch": 411} {"train_loss": -30.261554718017578, "global_step": 49732, "epoch": 411} {"train_loss": -29.102375030517578, "global_step": 49733, "epoch": 411} {"train_loss": -30.47842788696289, "global_step": 49734, "epoch": 411} {"train_loss": -30.01315689086914, "global_step": 49735, "epoch": 411} {"train_loss": -31.099130630493164, "global_step": 49736, "epoch": 411} {"train_loss": -31.022703170776367, "global_step": 49737, "epoch": 411} {"train_loss": -31.193891525268555, "global_step": 49738, "epoch": 411} {"train_loss": -30.63852310180664, "global_step": 49739, "epoch": 411} {"train_loss": -30.873640060424805, "global_step": 49740, "epoch": 411} {"train_loss": -31.297819137573242, "global_step": 49741, "epoch": 411} {"train_loss": -31.273284912109375, "global_step": 49742, "epoch": 411} {"train_loss": -31.3756103515625, "global_step": 49743, "epoch": 411} {"train_loss": -31.749975204467773, "global_step": 49744, "epoch": 411} {"train_loss": -31.51772117614746, "global_step": 49745, "epoch": 411} {"train_loss": -32.06276321411133, "global_step": 49746, "epoch": 411} {"train_loss": -27.109617233276367, "global_step": 49747, "epoch": 411} {"train_loss": -31.1685848236084, "global_step": 49748, "epoch": 411} {"train_loss": -31.65997886657715, "global_step": 49749, "epoch": 411} {"train_loss": -30.581701278686523, "global_step": 49750, "epoch": 411} {"train_loss": -32.15623092651367, "global_step": 49751, "epoch": 411} {"train_loss": -26.290281295776367, "global_step": 49752, "epoch": 411} {"train_loss": -32.17094039916992, "global_step": 49753, "epoch": 411} {"train_loss": -31.90555191040039, "global_step": 49754, "epoch": 411} {"train_loss": -31.930044174194336, "global_step": 49755, "epoch": 411} {"train_loss": -32.45095443725586, "global_step": 49756, "epoch": 411} {"train_loss": -31.84527587890625, "global_step": 49757, "epoch": 411} {"train_loss": -32.369258880615234, "global_step": 49758, "epoch": 411} {"train_loss": -31.609344482421875, "global_step": 49759, "epoch": 411} {"train_loss": -31.87345314025879, "global_step": 49760, "epoch": 411} {"train_loss": -32.497188568115234, "global_step": 49761, "epoch": 411} {"train_loss": -32.40533447265625, "global_step": 49762, "epoch": 411} {"train_loss": -26.307371139526367, "global_step": 49763, "epoch": 411} {"train_loss": -32.80060958862305, "global_step": 49764, "epoch": 411} {"train_loss": -32.92091751098633, "global_step": 49765, "epoch": 411} {"train_loss": -32.59404373168945, "global_step": 49766, "epoch": 411} {"train_loss": -33.07374572753906, "global_step": 49767, "epoch": 411} {"train_loss": -32.953338623046875, "global_step": 49768, "epoch": 411} {"train_loss": -33.20532989501953, "global_step": 49769, "epoch": 411} {"train_loss": -33.03178024291992, "global_step": 49770, "epoch": 411} {"train_loss": -32.57017135620117, "global_step": 49771, "epoch": 411} {"train_loss": -31.55625343322754, "global_step": 49772, "epoch": 411} {"train_loss": -33.04322052001953, "global_step": 49773, "epoch": 411} {"train_loss": -33.035926818847656, "global_step": 49774, "epoch": 411} {"train_loss": -33.449119567871094, "global_step": 49775, "epoch": 411} {"train_loss": -33.00934600830078, "global_step": 49776, "epoch": 411} {"train_loss": -33.147796630859375, "global_step": 49777, "epoch": 411} {"train_loss": -33.07444381713867, "global_step": 49778, "epoch": 411} {"train_loss": -33.95852279663086, "global_step": 49779, "epoch": 411} {"train_loss": -33.0168342590332, "global_step": 49780, "epoch": 411} {"train_loss": -33.171669006347656, "global_step": 49781, "epoch": 411} {"train_loss": -33.5398063659668, "global_step": 49782, "epoch": 411} {"train_loss": -33.122589111328125, "global_step": 49783, "epoch": 411} {"train_loss": -33.760658264160156, "global_step": 49784, "epoch": 411} {"train_loss": -33.28675079345703, "global_step": 49785, "epoch": 411} {"train_loss": -33.974178314208984, "global_step": 49786, "epoch": 411} {"train_loss": -33.00284957885742, "global_step": 49787, "epoch": 411} {"train_loss": -33.46653366088867, "global_step": 49788, "epoch": 411} {"train_loss": -33.83254623413086, "global_step": 49789, "epoch": 411} {"train_loss": -33.44639205932617, "global_step": 49790, "epoch": 411} {"train_loss": -34.001426696777344, "global_step": 49791, "epoch": 411} {"train_loss": -33.46997833251953, "global_step": 49792, "epoch": 411} {"train_loss": -33.9672966003418, "global_step": 49793, "epoch": 411} {"train_loss": -33.73836135864258, "global_step": 49794, "epoch": 411} {"train_loss": -34.45530319213867, "global_step": 49795, "epoch": 411} {"train_loss": -33.96458053588867, "global_step": 49796, "epoch": 411} {"train_loss": -33.970821380615234, "global_step": 49797, "epoch": 411} {"train_loss": -34.38838577270508, "global_step": 49798, "epoch": 411} {"train_loss": -34.7440299987793, "global_step": 49799, "epoch": 411} {"train_loss": -34.4573974609375, "global_step": 49800, "epoch": 411} {"train_loss": -34.79096221923828, "global_step": 49801, "epoch": 411} {"train_loss": -34.25443649291992, "global_step": 49802, "epoch": 411} {"train_loss": -34.30473709106445, "global_step": 49803, "epoch": 411} {"train_loss": -34.70174789428711, "global_step": 49804, "epoch": 411} {"train_loss": -34.909420013427734, "global_step": 49805, "epoch": 411} {"train_loss": -34.7492790222168, "global_step": 49806, "epoch": 411} {"train_loss": -34.4509162902832, "global_step": 49807, "epoch": 411} {"train_loss": -34.31842803955078, "global_step": 49808, "epoch": 411} {"train_loss": -34.29037094116211, "global_step": 49809, "epoch": 411} {"train_loss": -34.484161376953125, "global_step": 49810, "epoch": 411} {"train_loss": -34.9912109375, "global_step": 49811, "epoch": 411} {"train_loss": -35.1800651550293, "global_step": 49812, "epoch": 411} {"train_loss": -34.78532028198242, "global_step": 49813, "epoch": 411} {"train_loss": -34.23756790161133, "global_step": 49814, "epoch": 411} {"train_loss": -34.44608688354492, "global_step": 49815, "epoch": 411} {"train_loss": -34.795738220214844, "global_step": 49816, "epoch": 411} {"train_loss": -34.82540512084961, "global_step": 49817, "epoch": 411} {"train_loss": -34.88608932495117, "global_step": 49818, "epoch": 411} {"train_loss": -34.63884735107422, "global_step": 49819, "epoch": 411} {"train_loss": -35.28127670288086, "global_step": 49820, "epoch": 411} {"train_loss": -35.14729690551758, "global_step": 49821, "epoch": 411} {"train_loss": -35.75221633911133, "global_step": 49822, "epoch": 411} {"train_loss": -35.27671432495117, "global_step": 49823, "epoch": 411} {"train_loss": -35.68708419799805, "global_step": 49824, "epoch": 411} {"train_loss": -35.65155029296875, "global_step": 49825, "epoch": 411} {"train_loss": -35.286991119384766, "global_step": 49826, "epoch": 411} {"train_loss": -35.40078353881836, "global_step": 49827, "epoch": 411} {"train_loss": -35.55527114868164, "global_step": 49828, "epoch": 411} {"train_loss": -35.32472610473633, "global_step": 49829, "epoch": 411} {"train_loss": -35.61635971069336, "global_step": 49830, "epoch": 411} {"train_loss": -35.184532165527344, "global_step": 49831, "epoch": 411} {"train_loss": -33.25080490112305, "global_step": 49832, "epoch": 411} {"train_loss": -31.421527862548828, "global_step": 49833, "epoch": 411} {"train_loss": -26.333032608032227, "global_step": 49834, "epoch": 411} {"train_loss": -14.653185844421387, "global_step": 49835, "epoch": 411} {"train_loss": -9.793734550476074, "global_step": 49836, "epoch": 411} {"train_loss": -30.690038681030273, "global_step": 49837, "epoch": 411} {"train_loss": -32.32257843017578, "global_step": 49838, "epoch": 411} {"train_loss": -30.56450843811035, "global_step": 49839, "epoch": 411} {"train_loss": -33.84554672241211, "global_step": 49840, "epoch": 411} {"train_loss": -33.12788772583008, "global_step": 49841, "epoch": 411} {"train_loss": -32.1732063293457, "global_step": 49842, "epoch": 411} {"train_loss": -34.45624923706055, "global_step": 49843, "epoch": 411} {"train_loss": -32.628273010253906, "global_step": 49844, "epoch": 411} {"train_loss": -34.4610710144043, "global_step": 49845, "epoch": 411} {"train_loss": -34.62593460083008, "global_step": 49846, "epoch": 411} {"train_loss": -33.67171096801758, "global_step": 49847, "epoch": 411} {"train_loss": -34.3205451965332, "global_step": 49848, "epoch": 411} {"train_loss": -34.602081298828125, "global_step": 49849, "epoch": 411} {"train_loss": -34.01283264160156, "global_step": 49850, "epoch": 411} {"train_loss": -32.67881142797549, "global_step": 49851, "epoch": 411, "val_loss": 2717920.25} {"train_loss": -34.39634323120117, "global_step": 49852, "epoch": 412} {"train_loss": -34.740543365478516, "global_step": 49853, "epoch": 412} {"train_loss": -33.7821159362793, "global_step": 49854, "epoch": 412} {"train_loss": -34.93550491333008, "global_step": 49855, "epoch": 412} {"train_loss": -34.88460159301758, "global_step": 49856, "epoch": 412} {"train_loss": -34.704063415527344, "global_step": 49857, "epoch": 412} {"train_loss": -34.546241760253906, "global_step": 49858, "epoch": 412} {"train_loss": -34.81443405151367, "global_step": 49859, "epoch": 412} {"train_loss": -34.880374908447266, "global_step": 49860, "epoch": 412} {"train_loss": -34.996917724609375, "global_step": 49861, "epoch": 412} {"train_loss": -35.33539962768555, "global_step": 49862, "epoch": 412} {"train_loss": -34.75926208496094, "global_step": 49863, "epoch": 412} {"train_loss": -34.847900390625, "global_step": 49864, "epoch": 412} {"train_loss": -34.510257720947266, "global_step": 49865, "epoch": 412} {"train_loss": -34.954471588134766, "global_step": 49866, "epoch": 412} {"train_loss": -35.24846267700195, "global_step": 49867, "epoch": 412} {"train_loss": -35.36781692504883, "global_step": 49868, "epoch": 412} {"train_loss": -34.525814056396484, "global_step": 49869, "epoch": 412} {"train_loss": -34.3547477722168, "global_step": 49870, "epoch": 412} {"train_loss": -34.717586517333984, "global_step": 49871, "epoch": 412} {"train_loss": -34.81484603881836, "global_step": 49872, "epoch": 412} {"train_loss": -34.41891098022461, "global_step": 49873, "epoch": 412} {"train_loss": -34.35955047607422, "global_step": 49874, "epoch": 412} {"train_loss": -34.28125762939453, "global_step": 49875, "epoch": 412} {"train_loss": -33.55592346191406, "global_step": 49876, "epoch": 412} {"train_loss": -35.11216735839844, "global_step": 49877, "epoch": 412} {"train_loss": -35.1999397277832, "global_step": 49878, "epoch": 412} {"train_loss": -33.63039779663086, "global_step": 49879, "epoch": 412} {"train_loss": -31.6268310546875, "global_step": 49880, "epoch": 412} {"train_loss": -30.598541259765625, "global_step": 49881, "epoch": 412} {"train_loss": -32.597225189208984, "global_step": 49882, "epoch": 412} {"train_loss": -33.5943717956543, "global_step": 49883, "epoch": 412} {"train_loss": -31.868738174438477, "global_step": 49884, "epoch": 412} {"train_loss": -25.733200073242188, "global_step": 49885, "epoch": 412} {"train_loss": -27.200300216674805, "global_step": 49886, "epoch": 412} {"train_loss": -33.131046295166016, "global_step": 49887, "epoch": 412} {"train_loss": -32.12551498413086, "global_step": 49888, "epoch": 412} {"train_loss": -31.29562759399414, "global_step": 49889, "epoch": 412} {"train_loss": -33.10271072387695, "global_step": 49890, "epoch": 412} {"train_loss": -32.903079986572266, "global_step": 49891, "epoch": 412} {"train_loss": -33.8149528503418, "global_step": 49892, "epoch": 412} {"train_loss": -32.66959762573242, "global_step": 49893, "epoch": 412} {"train_loss": -34.083045959472656, "global_step": 49894, "epoch": 412} {"train_loss": -33.70751953125, "global_step": 49895, "epoch": 412} {"train_loss": -32.350948333740234, "global_step": 49896, "epoch": 412} {"train_loss": -34.39387130737305, "global_step": 49897, "epoch": 412} {"train_loss": -32.828468322753906, "global_step": 49898, "epoch": 412} {"train_loss": -34.082801818847656, "global_step": 49899, "epoch": 412} {"train_loss": -33.62441635131836, "global_step": 49900, "epoch": 412} {"train_loss": -34.015380859375, "global_step": 49901, "epoch": 412} {"train_loss": -33.4342155456543, "global_step": 49902, "epoch": 412} {"train_loss": -33.7486457824707, "global_step": 49903, "epoch": 412} {"train_loss": -33.52356719970703, "global_step": 49904, "epoch": 412} {"train_loss": -33.45829391479492, "global_step": 49905, "epoch": 412} {"train_loss": -34.06940841674805, "global_step": 49906, "epoch": 412} {"train_loss": -34.48666763305664, "global_step": 49907, "epoch": 412} {"train_loss": -29.961181640625, "global_step": 49908, "epoch": 412} {"train_loss": -33.12617492675781, "global_step": 49909, "epoch": 412} {"train_loss": -33.877193450927734, "global_step": 49910, "epoch": 412} {"train_loss": -32.652626037597656, "global_step": 49911, "epoch": 412} {"train_loss": -33.27842712402344, "global_step": 49912, "epoch": 412} {"train_loss": -32.77075958251953, "global_step": 49913, "epoch": 412} {"train_loss": -32.46736526489258, "global_step": 49914, "epoch": 412} {"train_loss": -33.072078704833984, "global_step": 49915, "epoch": 412} {"train_loss": -34.159881591796875, "global_step": 49916, "epoch": 412} {"train_loss": -34.266536712646484, "global_step": 49917, "epoch": 412} {"train_loss": -33.92923355102539, "global_step": 49918, "epoch": 412} {"train_loss": -33.65792465209961, "global_step": 49919, "epoch": 412} {"train_loss": -34.297794342041016, "global_step": 49920, "epoch": 412} {"train_loss": -33.84619140625, "global_step": 49921, "epoch": 412} {"train_loss": -33.56816482543945, "global_step": 49922, "epoch": 412} {"train_loss": -33.671051025390625, "global_step": 49923, "epoch": 412} {"train_loss": -34.036556243896484, "global_step": 49924, "epoch": 412} {"train_loss": -34.6447868347168, "global_step": 49925, "epoch": 412} {"train_loss": -34.380828857421875, "global_step": 49926, "epoch": 412} {"train_loss": -33.66352081298828, "global_step": 49927, "epoch": 412} {"train_loss": -34.18508529663086, "global_step": 49928, "epoch": 412} {"train_loss": -34.29885482788086, "global_step": 49929, "epoch": 412} {"train_loss": -32.70416259765625, "global_step": 49930, "epoch": 412} {"train_loss": -33.8421630859375, "global_step": 49931, "epoch": 412} {"train_loss": -34.1974983215332, "global_step": 49932, "epoch": 412} {"train_loss": -33.904640197753906, "global_step": 49933, "epoch": 412} {"train_loss": -34.60496139526367, "global_step": 49934, "epoch": 412} {"train_loss": -34.19386672973633, "global_step": 49935, "epoch": 412} {"train_loss": -33.814125061035156, "global_step": 49936, "epoch": 412} {"train_loss": -33.57381820678711, "global_step": 49937, "epoch": 412} {"train_loss": -34.462562561035156, "global_step": 49938, "epoch": 412} {"train_loss": -33.51076889038086, "global_step": 49939, "epoch": 412} {"train_loss": -34.36886215209961, "global_step": 49940, "epoch": 412} {"train_loss": -34.28939437866211, "global_step": 49941, "epoch": 412} {"train_loss": -34.213741302490234, "global_step": 49942, "epoch": 412} {"train_loss": -33.53862762451172, "global_step": 49943, "epoch": 412} {"train_loss": -34.417205810546875, "global_step": 49944, "epoch": 412} {"train_loss": -34.007869720458984, "global_step": 49945, "epoch": 412} {"train_loss": -34.55453109741211, "global_step": 49946, "epoch": 412} {"train_loss": -35.099365234375, "global_step": 49947, "epoch": 412} {"train_loss": -34.48312759399414, "global_step": 49948, "epoch": 412} {"train_loss": -34.60914993286133, "global_step": 49949, "epoch": 412} {"train_loss": -34.8885612487793, "global_step": 49950, "epoch": 412} {"train_loss": -35.11830520629883, "global_step": 49951, "epoch": 412} {"train_loss": -34.89306640625, "global_step": 49952, "epoch": 412} {"train_loss": -34.80536651611328, "global_step": 49953, "epoch": 412} {"train_loss": -35.494869232177734, "global_step": 49954, "epoch": 412} {"train_loss": -35.27851486206055, "global_step": 49955, "epoch": 412} {"train_loss": -35.130062103271484, "global_step": 49956, "epoch": 412} {"train_loss": -34.95673751831055, "global_step": 49957, "epoch": 412} {"train_loss": -35.069271087646484, "global_step": 49958, "epoch": 412} {"train_loss": -35.18735885620117, "global_step": 49959, "epoch": 412} {"train_loss": -34.87223434448242, "global_step": 49960, "epoch": 412} {"train_loss": -35.19037628173828, "global_step": 49961, "epoch": 412} {"train_loss": -35.09867477416992, "global_step": 49962, "epoch": 412} {"train_loss": -34.31553268432617, "global_step": 49963, "epoch": 412} {"train_loss": -34.927268981933594, "global_step": 49964, "epoch": 412} {"train_loss": -35.1511344909668, "global_step": 49965, "epoch": 412} {"train_loss": -35.163211822509766, "global_step": 49966, "epoch": 412} {"train_loss": -35.28391647338867, "global_step": 49967, "epoch": 412} {"train_loss": -35.37111282348633, "global_step": 49968, "epoch": 412} {"train_loss": -35.26011276245117, "global_step": 49969, "epoch": 412} {"train_loss": -35.264156341552734, "global_step": 49970, "epoch": 412} {"train_loss": -34.89949417114258, "global_step": 49971, "epoch": 412} {"train_loss": -33.96448242565817, "global_step": 49972, "epoch": 412, "val_loss": 2616073.25} {"train_loss": -34.75822830200195, "global_step": 49973, "epoch": 413} {"train_loss": -35.49066925048828, "global_step": 49974, "epoch": 413} {"train_loss": -34.59397506713867, "global_step": 49975, "epoch": 413} {"train_loss": -34.892333984375, "global_step": 49976, "epoch": 413} {"train_loss": -35.480674743652344, "global_step": 49977, "epoch": 413} {"train_loss": -35.37440490722656, "global_step": 49978, "epoch": 413} {"train_loss": -35.14571762084961, "global_step": 49979, "epoch": 413} {"train_loss": -35.400936126708984, "global_step": 49980, "epoch": 413} {"train_loss": -35.282222747802734, "global_step": 49981, "epoch": 413} {"train_loss": -35.06291580200195, "global_step": 49982, "epoch": 413} {"train_loss": -35.36239242553711, "global_step": 49983, "epoch": 413} {"train_loss": -33.419715881347656, "global_step": 49984, "epoch": 413} {"train_loss": -35.13712692260742, "global_step": 49985, "epoch": 413} {"train_loss": -35.067195892333984, "global_step": 49986, "epoch": 413} {"train_loss": -34.0527458190918, "global_step": 49987, "epoch": 413} {"train_loss": -32.248748779296875, "global_step": 49988, "epoch": 413} {"train_loss": -35.02360153198242, "global_step": 49989, "epoch": 413} {"train_loss": -34.83705520629883, "global_step": 49990, "epoch": 413} {"train_loss": -35.45711898803711, "global_step": 49991, "epoch": 413} {"train_loss": -35.2059211730957, "global_step": 49992, "epoch": 413} {"train_loss": -33.61037826538086, "global_step": 49993, "epoch": 413} {"train_loss": -35.0942497253418, "global_step": 49994, "epoch": 413} {"train_loss": -34.2232666015625, "global_step": 49995, "epoch": 413} {"train_loss": -34.04814147949219, "global_step": 49996, "epoch": 413} {"train_loss": -34.75102615356445, "global_step": 49997, "epoch": 413} {"train_loss": -34.09336853027344, "global_step": 49998, "epoch": 413} {"train_loss": -33.53403854370117, "global_step": 49999, "epoch": 413} {"train_loss": -34.65425491333008, "global_step": 50000, "epoch": 413} {"train_loss": -34.872737884521484, "global_step": 50001, "epoch": 413} {"train_loss": -34.8096809387207, "global_step": 50002, "epoch": 413} {"train_loss": -35.11025619506836, "global_step": 50003, "epoch": 413} {"train_loss": -34.594947814941406, "global_step": 50004, "epoch": 413} {"train_loss": -35.04735565185547, "global_step": 50005, "epoch": 413} {"train_loss": -35.37384033203125, "global_step": 50006, "epoch": 413} {"train_loss": -35.516170501708984, "global_step": 50007, "epoch": 413} {"train_loss": -35.345699310302734, "global_step": 50008, "epoch": 413} {"train_loss": -35.497047424316406, "global_step": 50009, "epoch": 413} {"train_loss": -35.822811126708984, "global_step": 50010, "epoch": 413} {"train_loss": -35.88831329345703, "global_step": 50011, "epoch": 413} {"train_loss": -35.342132568359375, "global_step": 50012, "epoch": 413} {"train_loss": -35.505062103271484, "global_step": 50013, "epoch": 413} {"train_loss": -35.22243881225586, "global_step": 50014, "epoch": 413} {"train_loss": -35.62064743041992, "global_step": 50015, "epoch": 413} {"train_loss": -34.745033264160156, "global_step": 50016, "epoch": 413} {"train_loss": -35.329952239990234, "global_step": 50017, "epoch": 413} {"train_loss": -35.392364501953125, "global_step": 50018, "epoch": 413} {"train_loss": -35.67232894897461, "global_step": 50019, "epoch": 413} {"train_loss": -34.650360107421875, "global_step": 50020, "epoch": 413} {"train_loss": -34.915771484375, "global_step": 50021, "epoch": 413} {"train_loss": -34.97304153442383, "global_step": 50022, "epoch": 413} {"train_loss": -34.38264846801758, "global_step": 50023, "epoch": 413} {"train_loss": -34.26173400878906, "global_step": 50024, "epoch": 413} {"train_loss": -35.66489791870117, "global_step": 50025, "epoch": 413} {"train_loss": -34.43903732299805, "global_step": 50026, "epoch": 413} {"train_loss": -35.08811950683594, "global_step": 50027, "epoch": 413} {"train_loss": -33.68629837036133, "global_step": 50028, "epoch": 413} {"train_loss": -32.97212600708008, "global_step": 50029, "epoch": 413} {"train_loss": -29.52386474609375, "global_step": 50030, "epoch": 413} {"train_loss": -33.89016342163086, "global_step": 50031, "epoch": 413} {"train_loss": -32.772029876708984, "global_step": 50032, "epoch": 413} {"train_loss": -34.39611053466797, "global_step": 50033, "epoch": 413} {"train_loss": -34.22369384765625, "global_step": 50034, "epoch": 413} {"train_loss": -32.2141227722168, "global_step": 50035, "epoch": 413} {"train_loss": -35.32032012939453, "global_step": 50036, "epoch": 413} {"train_loss": -33.783721923828125, "global_step": 50037, "epoch": 413} {"train_loss": -33.126399993896484, "global_step": 50038, "epoch": 413} {"train_loss": -35.56432342529297, "global_step": 50039, "epoch": 413} {"train_loss": -34.14034652709961, "global_step": 50040, "epoch": 413} {"train_loss": -34.85393142700195, "global_step": 50041, "epoch": 413} {"train_loss": -34.55585861206055, "global_step": 50042, "epoch": 413} {"train_loss": -34.871822357177734, "global_step": 50043, "epoch": 413} {"train_loss": -35.76314926147461, "global_step": 50044, "epoch": 413} {"train_loss": -35.12301254272461, "global_step": 50045, "epoch": 413} {"train_loss": -35.0866813659668, "global_step": 50046, "epoch": 413} {"train_loss": -35.66018295288086, "global_step": 50047, "epoch": 413} {"train_loss": -35.58014678955078, "global_step": 50048, "epoch": 413} {"train_loss": -35.396724700927734, "global_step": 50049, "epoch": 413} {"train_loss": -35.6088981628418, "global_step": 50050, "epoch": 413} {"train_loss": -35.44184494018555, "global_step": 50051, "epoch": 413} {"train_loss": -35.05154037475586, "global_step": 50052, "epoch": 413} {"train_loss": -35.87578201293945, "global_step": 50053, "epoch": 413} {"train_loss": -35.91740036010742, "global_step": 50054, "epoch": 413} {"train_loss": -34.885467529296875, "global_step": 50055, "epoch": 413} {"train_loss": -35.92456817626953, "global_step": 50056, "epoch": 413} {"train_loss": -35.49748229980469, "global_step": 50057, "epoch": 413} {"train_loss": -34.85396957397461, "global_step": 50058, "epoch": 413} {"train_loss": -35.38166427612305, "global_step": 50059, "epoch": 413} {"train_loss": -34.22646713256836, "global_step": 50060, "epoch": 413} {"train_loss": -35.229248046875, "global_step": 50061, "epoch": 413} {"train_loss": -35.29646682739258, "global_step": 50062, "epoch": 413} {"train_loss": -34.93504333496094, "global_step": 50063, "epoch": 413} {"train_loss": -35.25526809692383, "global_step": 50064, "epoch": 413} {"train_loss": -34.604225158691406, "global_step": 50065, "epoch": 413} {"train_loss": -34.766212463378906, "global_step": 50066, "epoch": 413} {"train_loss": -35.03397750854492, "global_step": 50067, "epoch": 413} {"train_loss": -34.616973876953125, "global_step": 50068, "epoch": 413} {"train_loss": -35.78712844848633, "global_step": 50069, "epoch": 413} {"train_loss": -34.7507438659668, "global_step": 50070, "epoch": 413} {"train_loss": -34.88790512084961, "global_step": 50071, "epoch": 413} {"train_loss": -34.381290435791016, "global_step": 50072, "epoch": 413} {"train_loss": -35.53957748413086, "global_step": 50073, "epoch": 413} {"train_loss": -34.47687911987305, "global_step": 50074, "epoch": 413} {"train_loss": -35.20859146118164, "global_step": 50075, "epoch": 413} {"train_loss": -34.703125, "global_step": 50076, "epoch": 413} {"train_loss": -35.0046501159668, "global_step": 50077, "epoch": 413} {"train_loss": -35.32950973510742, "global_step": 50078, "epoch": 413} {"train_loss": -34.99070358276367, "global_step": 50079, "epoch": 413} {"train_loss": -34.53999328613281, "global_step": 50080, "epoch": 413} {"train_loss": -34.58553695678711, "global_step": 50081, "epoch": 413} {"train_loss": -33.871334075927734, "global_step": 50082, "epoch": 413} {"train_loss": -35.48006820678711, "global_step": 50083, "epoch": 413} {"train_loss": -35.622650146484375, "global_step": 50084, "epoch": 413} {"train_loss": -35.39577865600586, "global_step": 50085, "epoch": 413} {"train_loss": -34.528480529785156, "global_step": 50086, "epoch": 413} {"train_loss": -35.13601303100586, "global_step": 50087, "epoch": 413} {"train_loss": -35.529170989990234, "global_step": 50088, "epoch": 413} {"train_loss": -34.88351821899414, "global_step": 50089, "epoch": 413} {"train_loss": -34.75584030151367, "global_step": 50090, "epoch": 413} {"train_loss": -34.8529052734375, "global_step": 50091, "epoch": 413} {"train_loss": -35.326690673828125, "global_step": 50092, "epoch": 413} {"train_loss": -34.842420467660446, "global_step": 50093, "epoch": 413, "val_loss": 2381140.0} {"train_loss": -34.96451950073242, "global_step": 50094, "epoch": 414} {"train_loss": -33.5659294128418, "global_step": 50095, "epoch": 414} {"train_loss": -35.526588439941406, "global_step": 50096, "epoch": 414} {"train_loss": -34.11414337158203, "global_step": 50097, "epoch": 414} {"train_loss": -34.61756134033203, "global_step": 50098, "epoch": 414} {"train_loss": -34.21085739135742, "global_step": 50099, "epoch": 414} {"train_loss": -33.91255569458008, "global_step": 50100, "epoch": 414} {"train_loss": -34.255279541015625, "global_step": 50101, "epoch": 414} {"train_loss": -34.927650451660156, "global_step": 50102, "epoch": 414} {"train_loss": -35.209815979003906, "global_step": 50103, "epoch": 414} {"train_loss": -33.46694564819336, "global_step": 50104, "epoch": 414} {"train_loss": -33.91755294799805, "global_step": 50105, "epoch": 414} {"train_loss": -33.78432083129883, "global_step": 50106, "epoch": 414} {"train_loss": -34.056819915771484, "global_step": 50107, "epoch": 414} {"train_loss": -34.82379150390625, "global_step": 50108, "epoch": 414} {"train_loss": -35.04368209838867, "global_step": 50109, "epoch": 414} {"train_loss": -34.08361053466797, "global_step": 50110, "epoch": 414} {"train_loss": -35.000099182128906, "global_step": 50111, "epoch": 414} {"train_loss": -34.96992111206055, "global_step": 50112, "epoch": 414} {"train_loss": -32.06904983520508, "global_step": 50113, "epoch": 414} {"train_loss": -34.71142578125, "global_step": 50114, "epoch": 414} {"train_loss": -34.94187545776367, "global_step": 50115, "epoch": 414} {"train_loss": -32.494163513183594, "global_step": 50116, "epoch": 414} {"train_loss": -34.320953369140625, "global_step": 50117, "epoch": 414} {"train_loss": -35.36700439453125, "global_step": 50118, "epoch": 414} {"train_loss": -29.175586700439453, "global_step": 50119, "epoch": 414} {"train_loss": -34.09600830078125, "global_step": 50120, "epoch": 414} {"train_loss": -34.59574508666992, "global_step": 50121, "epoch": 414} {"train_loss": -34.155662536621094, "global_step": 50122, "epoch": 414} {"train_loss": -34.125022888183594, "global_step": 50123, "epoch": 414} {"train_loss": -34.8463249206543, "global_step": 50124, "epoch": 414} {"train_loss": -35.347225189208984, "global_step": 50125, "epoch": 414} {"train_loss": -34.60799026489258, "global_step": 50126, "epoch": 414} {"train_loss": -34.19593811035156, "global_step": 50127, "epoch": 414} {"train_loss": -35.20515823364258, "global_step": 50128, "epoch": 414} {"train_loss": -35.14808654785156, "global_step": 50129, "epoch": 414} {"train_loss": -34.68450164794922, "global_step": 50130, "epoch": 414} {"train_loss": -35.08669662475586, "global_step": 50131, "epoch": 414} {"train_loss": -33.02024459838867, "global_step": 50132, "epoch": 414} {"train_loss": -33.79215621948242, "global_step": 50133, "epoch": 414} {"train_loss": -35.802120208740234, "global_step": 50134, "epoch": 414} {"train_loss": -34.9511833190918, "global_step": 50135, "epoch": 414} {"train_loss": -35.51015090942383, "global_step": 50136, "epoch": 414} {"train_loss": -35.2918815612793, "global_step": 50137, "epoch": 414} {"train_loss": -34.925350189208984, "global_step": 50138, "epoch": 414} {"train_loss": -35.186927795410156, "global_step": 50139, "epoch": 414} {"train_loss": -35.09479522705078, "global_step": 50140, "epoch": 414} {"train_loss": -35.05790328979492, "global_step": 50141, "epoch": 414} {"train_loss": -35.2473258972168, "global_step": 50142, "epoch": 414} {"train_loss": -35.642642974853516, "global_step": 50143, "epoch": 414} {"train_loss": -35.585205078125, "global_step": 50144, "epoch": 414} {"train_loss": -35.624305725097656, "global_step": 50145, "epoch": 414} {"train_loss": -35.73173522949219, "global_step": 50146, "epoch": 414} {"train_loss": -35.5096435546875, "global_step": 50147, "epoch": 414} {"train_loss": -35.221885681152344, "global_step": 50148, "epoch": 414} {"train_loss": -35.38955307006836, "global_step": 50149, "epoch": 414} {"train_loss": -35.22745895385742, "global_step": 50150, "epoch": 414} {"train_loss": -35.03030014038086, "global_step": 50151, "epoch": 414} {"train_loss": -35.401123046875, "global_step": 50152, "epoch": 414} {"train_loss": -35.15241622924805, "global_step": 50153, "epoch": 414} {"train_loss": -35.0330924987793, "global_step": 50154, "epoch": 414} {"train_loss": -35.61618423461914, "global_step": 50155, "epoch": 414} {"train_loss": -34.79778289794922, "global_step": 50156, "epoch": 414} {"train_loss": -33.288265228271484, "global_step": 50157, "epoch": 414} {"train_loss": -26.569580078125, "global_step": 50158, "epoch": 414} {"train_loss": -15.773782730102539, "global_step": 50159, "epoch": 414} {"train_loss": -21.975780487060547, "global_step": 50160, "epoch": 414} {"train_loss": -31.2142276763916, "global_step": 50161, "epoch": 414} {"train_loss": -34.465965270996094, "global_step": 50162, "epoch": 414} {"train_loss": -33.0562744140625, "global_step": 50163, "epoch": 414} {"train_loss": -34.515785217285156, "global_step": 50164, "epoch": 414} {"train_loss": -35.172542572021484, "global_step": 50165, "epoch": 414} {"train_loss": -34.14229202270508, "global_step": 50166, "epoch": 414} {"train_loss": -34.277381896972656, "global_step": 50167, "epoch": 414} {"train_loss": -35.441246032714844, "global_step": 50168, "epoch": 414} {"train_loss": -34.96943664550781, "global_step": 50169, "epoch": 414} {"train_loss": -35.268165588378906, "global_step": 50170, "epoch": 414} {"train_loss": -34.83841323852539, "global_step": 50171, "epoch": 414} {"train_loss": -35.306541442871094, "global_step": 50172, "epoch": 414} {"train_loss": -34.445953369140625, "global_step": 50173, "epoch": 414} {"train_loss": -35.44435119628906, "global_step": 50174, "epoch": 414} {"train_loss": -35.29237747192383, "global_step": 50175, "epoch": 414} {"train_loss": -35.41108703613281, "global_step": 50176, "epoch": 414} {"train_loss": -35.304473876953125, "global_step": 50177, "epoch": 414} {"train_loss": -35.526668548583984, "global_step": 50178, "epoch": 414} {"train_loss": -35.77560043334961, "global_step": 50179, "epoch": 414} {"train_loss": -35.913082122802734, "global_step": 50180, "epoch": 414} {"train_loss": -35.131893157958984, "global_step": 50181, "epoch": 414} {"train_loss": -35.2180290222168, "global_step": 50182, "epoch": 414} {"train_loss": -35.47553253173828, "global_step": 50183, "epoch": 414} {"train_loss": -35.43036651611328, "global_step": 50184, "epoch": 414} {"train_loss": -34.59294509887695, "global_step": 50185, "epoch": 414} {"train_loss": -34.65858840942383, "global_step": 50186, "epoch": 414} {"train_loss": -35.55968475341797, "global_step": 50187, "epoch": 414} {"train_loss": -35.44335174560547, "global_step": 50188, "epoch": 414} {"train_loss": -35.7279167175293, "global_step": 50189, "epoch": 414} {"train_loss": -35.116424560546875, "global_step": 50190, "epoch": 414} {"train_loss": -35.44475173950195, "global_step": 50191, "epoch": 414} {"train_loss": -34.97092819213867, "global_step": 50192, "epoch": 414} {"train_loss": -34.469173431396484, "global_step": 50193, "epoch": 414} {"train_loss": -35.3956413269043, "global_step": 50194, "epoch": 414} {"train_loss": -36.156795501708984, "global_step": 50195, "epoch": 414} {"train_loss": -35.45661544799805, "global_step": 50196, "epoch": 414} {"train_loss": -35.27787399291992, "global_step": 50197, "epoch": 414} {"train_loss": -34.86810302734375, "global_step": 50198, "epoch": 414} {"train_loss": -35.215606689453125, "global_step": 50199, "epoch": 414} {"train_loss": -34.78179931640625, "global_step": 50200, "epoch": 414} {"train_loss": -35.63678741455078, "global_step": 50201, "epoch": 414} {"train_loss": -36.114845275878906, "global_step": 50202, "epoch": 414} {"train_loss": -35.41898727416992, "global_step": 50203, "epoch": 414} {"train_loss": -35.042964935302734, "global_step": 50204, "epoch": 414} {"train_loss": -35.26813888549805, "global_step": 50205, "epoch": 414} {"train_loss": -34.72575759887695, "global_step": 50206, "epoch": 414} {"train_loss": -35.39601516723633, "global_step": 50207, "epoch": 414} {"train_loss": -36.079769134521484, "global_step": 50208, "epoch": 414} {"train_loss": -36.01451873779297, "global_step": 50209, "epoch": 414} {"train_loss": -35.66206741333008, "global_step": 50210, "epoch": 414} {"train_loss": -35.7006721496582, "global_step": 50211, "epoch": 414} {"train_loss": -36.05807113647461, "global_step": 50212, "epoch": 414} {"train_loss": -35.867889404296875, "global_step": 50213, "epoch": 414} {"train_loss": -34.538242876037096, "global_step": 50214, "epoch": 414, "val_loss": 2586955.75} {"train_loss": -36.02260971069336, "global_step": 50215, "epoch": 415} {"train_loss": -35.460205078125, "global_step": 50216, "epoch": 415} {"train_loss": -35.779296875, "global_step": 50217, "epoch": 415} {"train_loss": -35.971004486083984, "global_step": 50218, "epoch": 415} {"train_loss": -35.62861251831055, "global_step": 50219, "epoch": 415} {"train_loss": -35.80320739746094, "global_step": 50220, "epoch": 415} {"train_loss": -34.89390563964844, "global_step": 50221, "epoch": 415} {"train_loss": -33.64543914794922, "global_step": 50222, "epoch": 415} {"train_loss": -31.11024284362793, "global_step": 50223, "epoch": 415} {"train_loss": -27.49395751953125, "global_step": 50224, "epoch": 415} {"train_loss": -29.106613159179688, "global_step": 50225, "epoch": 415} {"train_loss": -34.7188720703125, "global_step": 50226, "epoch": 415} {"train_loss": -33.766170501708984, "global_step": 50227, "epoch": 415} {"train_loss": -28.66892433166504, "global_step": 50228, "epoch": 415} {"train_loss": -33.96725082397461, "global_step": 50229, "epoch": 415} {"train_loss": -33.66695785522461, "global_step": 50230, "epoch": 415} {"train_loss": -34.279212951660156, "global_step": 50231, "epoch": 415} {"train_loss": -34.862972259521484, "global_step": 50232, "epoch": 415} {"train_loss": -32.372493743896484, "global_step": 50233, "epoch": 415} {"train_loss": -34.115638732910156, "global_step": 50234, "epoch": 415} {"train_loss": -34.08192443847656, "global_step": 50235, "epoch": 415} {"train_loss": -35.2012939453125, "global_step": 50236, "epoch": 415} {"train_loss": -34.920833587646484, "global_step": 50237, "epoch": 415} {"train_loss": -33.746978759765625, "global_step": 50238, "epoch": 415} {"train_loss": -35.29853820800781, "global_step": 50239, "epoch": 415} {"train_loss": -34.81071853637695, "global_step": 50240, "epoch": 415} {"train_loss": -35.269134521484375, "global_step": 50241, "epoch": 415} {"train_loss": -35.11864471435547, "global_step": 50242, "epoch": 415} {"train_loss": -34.17995071411133, "global_step": 50243, "epoch": 415} {"train_loss": -35.61895751953125, "global_step": 50244, "epoch": 415} {"train_loss": -35.21416091918945, "global_step": 50245, "epoch": 415} {"train_loss": -34.5135612487793, "global_step": 50246, "epoch": 415} {"train_loss": -35.4525032043457, "global_step": 50247, "epoch": 415} {"train_loss": -35.3710823059082, "global_step": 50248, "epoch": 415} {"train_loss": -35.328887939453125, "global_step": 50249, "epoch": 415} {"train_loss": -35.968055725097656, "global_step": 50250, "epoch": 415} {"train_loss": -35.390892028808594, "global_step": 50251, "epoch": 415} {"train_loss": -35.97368240356445, "global_step": 50252, "epoch": 415} {"train_loss": -35.23223114013672, "global_step": 50253, "epoch": 415} {"train_loss": -35.817832946777344, "global_step": 50254, "epoch": 415} {"train_loss": -35.991241455078125, "global_step": 50255, "epoch": 415} {"train_loss": -36.03373336791992, "global_step": 50256, "epoch": 415} {"train_loss": -35.91961669921875, "global_step": 50257, "epoch": 415} {"train_loss": -35.68653106689453, "global_step": 50258, "epoch": 415} {"train_loss": -35.47833251953125, "global_step": 50259, "epoch": 415} {"train_loss": -35.335208892822266, "global_step": 50260, "epoch": 415} {"train_loss": -34.99861526489258, "global_step": 50261, "epoch": 415} {"train_loss": -35.877288818359375, "global_step": 50262, "epoch": 415} {"train_loss": -35.96136474609375, "global_step": 50263, "epoch": 415} {"train_loss": -35.19915771484375, "global_step": 50264, "epoch": 415} {"train_loss": -35.47085189819336, "global_step": 50265, "epoch": 415} {"train_loss": -35.56657028198242, "global_step": 50266, "epoch": 415} {"train_loss": -35.8499870300293, "global_step": 50267, "epoch": 415} {"train_loss": -34.06367111206055, "global_step": 50268, "epoch": 415} {"train_loss": -35.543792724609375, "global_step": 50269, "epoch": 415} {"train_loss": -34.65365982055664, "global_step": 50270, "epoch": 415} {"train_loss": -35.91706848144531, "global_step": 50271, "epoch": 415} {"train_loss": -34.246910095214844, "global_step": 50272, "epoch": 415} {"train_loss": -34.49414825439453, "global_step": 50273, "epoch": 415} {"train_loss": -34.056427001953125, "global_step": 50274, "epoch": 415} {"train_loss": -34.17042922973633, "global_step": 50275, "epoch": 415} {"train_loss": -34.262298583984375, "global_step": 50276, "epoch": 415} {"train_loss": -34.18999099731445, "global_step": 50277, "epoch": 415} {"train_loss": -34.6702880859375, "global_step": 50278, "epoch": 415} {"train_loss": -34.83591842651367, "global_step": 50279, "epoch": 415} {"train_loss": -34.3957405090332, "global_step": 50280, "epoch": 415} {"train_loss": -34.06856918334961, "global_step": 50281, "epoch": 415} {"train_loss": -34.91482162475586, "global_step": 50282, "epoch": 415} {"train_loss": -34.722389221191406, "global_step": 50283, "epoch": 415} {"train_loss": -35.12438201904297, "global_step": 50284, "epoch": 415} {"train_loss": -34.474483489990234, "global_step": 50285, "epoch": 415} {"train_loss": -34.69038009643555, "global_step": 50286, "epoch": 415} {"train_loss": -32.215858459472656, "global_step": 50287, "epoch": 415} {"train_loss": -31.676855087280273, "global_step": 50288, "epoch": 415} {"train_loss": -30.479145050048828, "global_step": 50289, "epoch": 415} {"train_loss": -33.53182601928711, "global_step": 50290, "epoch": 415} {"train_loss": -34.31315231323242, "global_step": 50291, "epoch": 415} {"train_loss": -33.90278625488281, "global_step": 50292, "epoch": 415} {"train_loss": -32.9665641784668, "global_step": 50293, "epoch": 415} {"train_loss": -34.143314361572266, "global_step": 50294, "epoch": 415} {"train_loss": -34.99721908569336, "global_step": 50295, "epoch": 415} {"train_loss": -33.51210403442383, "global_step": 50296, "epoch": 415} {"train_loss": -35.20223617553711, "global_step": 50297, "epoch": 415} {"train_loss": -34.37800216674805, "global_step": 50298, "epoch": 415} {"train_loss": -34.74365234375, "global_step": 50299, "epoch": 415} {"train_loss": -34.175472259521484, "global_step": 50300, "epoch": 415} {"train_loss": -33.806880950927734, "global_step": 50301, "epoch": 415} {"train_loss": -35.17116165161133, "global_step": 50302, "epoch": 415} {"train_loss": -34.0875358581543, "global_step": 50303, "epoch": 415} {"train_loss": -34.646549224853516, "global_step": 50304, "epoch": 415} {"train_loss": -34.307552337646484, "global_step": 50305, "epoch": 415} {"train_loss": -34.16382598876953, "global_step": 50306, "epoch": 415} {"train_loss": -35.193111419677734, "global_step": 50307, "epoch": 415} {"train_loss": -34.16111755371094, "global_step": 50308, "epoch": 415} {"train_loss": -34.91658401489258, "global_step": 50309, "epoch": 415} {"train_loss": -34.88410568237305, "global_step": 50310, "epoch": 415} {"train_loss": -35.61922073364258, "global_step": 50311, "epoch": 415} {"train_loss": -35.31356430053711, "global_step": 50312, "epoch": 415} {"train_loss": -35.69276809692383, "global_step": 50313, "epoch": 415} {"train_loss": -35.42361068725586, "global_step": 50314, "epoch": 415} {"train_loss": -35.887813568115234, "global_step": 50315, "epoch": 415} {"train_loss": -35.288787841796875, "global_step": 50316, "epoch": 415} {"train_loss": -35.99303436279297, "global_step": 50317, "epoch": 415} {"train_loss": -35.39774703979492, "global_step": 50318, "epoch": 415} {"train_loss": -35.69342041015625, "global_step": 50319, "epoch": 415} {"train_loss": -35.91668701171875, "global_step": 50320, "epoch": 415} {"train_loss": -36.08062744140625, "global_step": 50321, "epoch": 415} {"train_loss": -36.10118103027344, "global_step": 50322, "epoch": 415} {"train_loss": -35.9687385559082, "global_step": 50323, "epoch": 415} {"train_loss": -35.929420471191406, "global_step": 50324, "epoch": 415} {"train_loss": -36.32063293457031, "global_step": 50325, "epoch": 415} {"train_loss": -35.36845779418945, "global_step": 50326, "epoch": 415} {"train_loss": -36.473873138427734, "global_step": 50327, "epoch": 415} {"train_loss": -36.02592086791992, "global_step": 50328, "epoch": 415} {"train_loss": -36.12272262573242, "global_step": 50329, "epoch": 415} {"train_loss": -36.38201904296875, "global_step": 50330, "epoch": 415} {"train_loss": -34.9355354309082, "global_step": 50331, "epoch": 415} {"train_loss": -36.462310791015625, "global_step": 50332, "epoch": 415} {"train_loss": -36.34743881225586, "global_step": 50333, "epoch": 415} {"train_loss": -35.806270599365234, "global_step": 50334, "epoch": 415} {"train_loss": -34.77401214788768, "global_step": 50335, "epoch": 415, "val_loss": 2651524.25} {"train_loss": -36.01426696777344, "global_step": 50336, "epoch": 416} {"train_loss": -36.008880615234375, "global_step": 50337, "epoch": 416} {"train_loss": -35.93391036987305, "global_step": 50338, "epoch": 416} {"train_loss": -35.82270812988281, "global_step": 50339, "epoch": 416} {"train_loss": -35.78834915161133, "global_step": 50340, "epoch": 416} {"train_loss": -36.58529281616211, "global_step": 50341, "epoch": 416} {"train_loss": -33.82978057861328, "global_step": 50342, "epoch": 416} {"train_loss": -35.702392578125, "global_step": 50343, "epoch": 416} {"train_loss": -34.65277862548828, "global_step": 50344, "epoch": 416} {"train_loss": -34.043922424316406, "global_step": 50345, "epoch": 416} {"train_loss": -33.336849212646484, "global_step": 50346, "epoch": 416} {"train_loss": -34.32412338256836, "global_step": 50347, "epoch": 416} {"train_loss": -35.3089485168457, "global_step": 50348, "epoch": 416} {"train_loss": -33.54021072387695, "global_step": 50349, "epoch": 416} {"train_loss": -35.72773361206055, "global_step": 50350, "epoch": 416} {"train_loss": -35.475948333740234, "global_step": 50351, "epoch": 416} {"train_loss": -28.875085830688477, "global_step": 50352, "epoch": 416} {"train_loss": -31.6601505279541, "global_step": 50353, "epoch": 416} {"train_loss": -35.29065704345703, "global_step": 50354, "epoch": 416} {"train_loss": -33.79289627075195, "global_step": 50355, "epoch": 416} {"train_loss": -32.7152214050293, "global_step": 50356, "epoch": 416} {"train_loss": -30.875110626220703, "global_step": 50357, "epoch": 416} {"train_loss": -31.75347328186035, "global_step": 50358, "epoch": 416} {"train_loss": -30.925617218017578, "global_step": 50359, "epoch": 416} {"train_loss": -33.736793518066406, "global_step": 50360, "epoch": 416} {"train_loss": -33.66205596923828, "global_step": 50361, "epoch": 416} {"train_loss": -33.025856018066406, "global_step": 50362, "epoch": 416} {"train_loss": -33.99034881591797, "global_step": 50363, "epoch": 416} {"train_loss": -28.703840255737305, "global_step": 50364, "epoch": 416} {"train_loss": -33.0702018737793, "global_step": 50365, "epoch": 416} {"train_loss": -33.754241943359375, "global_step": 50366, "epoch": 416} {"train_loss": -32.50847244262695, "global_step": 50367, "epoch": 416} {"train_loss": -32.18728256225586, "global_step": 50368, "epoch": 416} {"train_loss": -32.93791580200195, "global_step": 50369, "epoch": 416} {"train_loss": -33.208126068115234, "global_step": 50370, "epoch": 416} {"train_loss": -31.36216163635254, "global_step": 50371, "epoch": 416} {"train_loss": -34.0244255065918, "global_step": 50372, "epoch": 416} {"train_loss": -31.35581398010254, "global_step": 50373, "epoch": 416} {"train_loss": -31.9323673248291, "global_step": 50374, "epoch": 416} {"train_loss": -33.59981918334961, "global_step": 50375, "epoch": 416} {"train_loss": -31.466257095336914, "global_step": 50376, "epoch": 416} {"train_loss": -33.5128059387207, "global_step": 50377, "epoch": 416} {"train_loss": -32.70195770263672, "global_step": 50378, "epoch": 416} {"train_loss": -33.16533660888672, "global_step": 50379, "epoch": 416} {"train_loss": -32.58527755737305, "global_step": 50380, "epoch": 416} {"train_loss": -33.295082092285156, "global_step": 50381, "epoch": 416} {"train_loss": -32.54153823852539, "global_step": 50382, "epoch": 416} {"train_loss": -33.620811462402344, "global_step": 50383, "epoch": 416} {"train_loss": -33.35404968261719, "global_step": 50384, "epoch": 416} {"train_loss": -33.8503532409668, "global_step": 50385, "epoch": 416} {"train_loss": -33.148231506347656, "global_step": 50386, "epoch": 416} {"train_loss": -33.43739700317383, "global_step": 50387, "epoch": 416} {"train_loss": -33.35757064819336, "global_step": 50388, "epoch": 416} {"train_loss": -33.45731735229492, "global_step": 50389, "epoch": 416} {"train_loss": -33.35526657104492, "global_step": 50390, "epoch": 416} {"train_loss": -33.6723747253418, "global_step": 50391, "epoch": 416} {"train_loss": -34.372222900390625, "global_step": 50392, "epoch": 416} {"train_loss": -34.3448600769043, "global_step": 50393, "epoch": 416} {"train_loss": -34.30263137817383, "global_step": 50394, "epoch": 416} {"train_loss": -34.776939392089844, "global_step": 50395, "epoch": 416} {"train_loss": -33.863033294677734, "global_step": 50396, "epoch": 416} {"train_loss": -34.556331634521484, "global_step": 50397, "epoch": 416} {"train_loss": -34.4359016418457, "global_step": 50398, "epoch": 416} {"train_loss": -34.79026412963867, "global_step": 50399, "epoch": 416} {"train_loss": -34.87852096557617, "global_step": 50400, "epoch": 416} {"train_loss": -34.003028869628906, "global_step": 50401, "epoch": 416} {"train_loss": -34.992000579833984, "global_step": 50402, "epoch": 416} {"train_loss": -33.98458480834961, "global_step": 50403, "epoch": 416} {"train_loss": -35.1251106262207, "global_step": 50404, "epoch": 416} {"train_loss": -34.967037200927734, "global_step": 50405, "epoch": 416} {"train_loss": -34.509334564208984, "global_step": 50406, "epoch": 416} {"train_loss": -34.69716262817383, "global_step": 50407, "epoch": 416} {"train_loss": -34.548091888427734, "global_step": 50408, "epoch": 416} {"train_loss": -34.774539947509766, "global_step": 50409, "epoch": 416} {"train_loss": -34.82369613647461, "global_step": 50410, "epoch": 416} {"train_loss": -34.934452056884766, "global_step": 50411, "epoch": 416} {"train_loss": -34.503814697265625, "global_step": 50412, "epoch": 416} {"train_loss": -34.79989242553711, "global_step": 50413, "epoch": 416} {"train_loss": -34.146480560302734, "global_step": 50414, "epoch": 416} {"train_loss": -34.435760498046875, "global_step": 50415, "epoch": 416} {"train_loss": -35.09401321411133, "global_step": 50416, "epoch": 416} {"train_loss": -35.08241653442383, "global_step": 50417, "epoch": 416} {"train_loss": -33.322059631347656, "global_step": 50418, "epoch": 416} {"train_loss": -33.0103645324707, "global_step": 50419, "epoch": 416} {"train_loss": -33.263282775878906, "global_step": 50420, "epoch": 416} {"train_loss": -33.84091567993164, "global_step": 50421, "epoch": 416} {"train_loss": -34.37442398071289, "global_step": 50422, "epoch": 416} {"train_loss": -35.05038070678711, "global_step": 50423, "epoch": 416} {"train_loss": -35.343223571777344, "global_step": 50424, "epoch": 416} {"train_loss": -35.20927810668945, "global_step": 50425, "epoch": 416} {"train_loss": -34.42075729370117, "global_step": 50426, "epoch": 416} {"train_loss": -35.2145881652832, "global_step": 50427, "epoch": 416} {"train_loss": -35.671363830566406, "global_step": 50428, "epoch": 416} {"train_loss": -34.785682678222656, "global_step": 50429, "epoch": 416} {"train_loss": -35.7708740234375, "global_step": 50430, "epoch": 416} {"train_loss": -35.4313850402832, "global_step": 50431, "epoch": 416} {"train_loss": -34.895477294921875, "global_step": 50432, "epoch": 416} {"train_loss": -35.028324127197266, "global_step": 50433, "epoch": 416} {"train_loss": -34.44388961791992, "global_step": 50434, "epoch": 416} {"train_loss": -33.577247619628906, "global_step": 50435, "epoch": 416} {"train_loss": -30.03287696838379, "global_step": 50436, "epoch": 416} {"train_loss": -27.838525772094727, "global_step": 50437, "epoch": 416} {"train_loss": -26.847360610961914, "global_step": 50438, "epoch": 416} {"train_loss": -28.88382339477539, "global_step": 50439, "epoch": 416} {"train_loss": -34.2027702331543, "global_step": 50440, "epoch": 416} {"train_loss": -34.971370697021484, "global_step": 50441, "epoch": 416} {"train_loss": -32.71310806274414, "global_step": 50442, "epoch": 416} {"train_loss": -34.9383659362793, "global_step": 50443, "epoch": 416} {"train_loss": -34.22956085205078, "global_step": 50444, "epoch": 416} {"train_loss": -35.08496856689453, "global_step": 50445, "epoch": 416} {"train_loss": -34.57358932495117, "global_step": 50446, "epoch": 416} {"train_loss": -34.87260055541992, "global_step": 50447, "epoch": 416} {"train_loss": -34.92234420776367, "global_step": 50448, "epoch": 416} {"train_loss": -35.397884368896484, "global_step": 50449, "epoch": 416} {"train_loss": -34.54499435424805, "global_step": 50450, "epoch": 416} {"train_loss": -35.760433197021484, "global_step": 50451, "epoch": 416} {"train_loss": -35.24735641479492, "global_step": 50452, "epoch": 416} {"train_loss": -35.03413772583008, "global_step": 50453, "epoch": 416} {"train_loss": -35.29620361328125, "global_step": 50454, "epoch": 416} {"train_loss": -35.01898193359375, "global_step": 50455, "epoch": 416} {"train_loss": -33.886123672989775, "global_step": 50456, "epoch": 416, "val_loss": 2661744.25} {"train_loss": -35.44928741455078, "global_step": 50457, "epoch": 417} {"train_loss": -34.57756423950195, "global_step": 50458, "epoch": 417} {"train_loss": -35.18789291381836, "global_step": 50459, "epoch": 417} {"train_loss": -35.8277473449707, "global_step": 50460, "epoch": 417} {"train_loss": -35.78767013549805, "global_step": 50461, "epoch": 417} {"train_loss": -34.879058837890625, "global_step": 50462, "epoch": 417} {"train_loss": -35.631893157958984, "global_step": 50463, "epoch": 417} {"train_loss": -35.8322639465332, "global_step": 50464, "epoch": 417} {"train_loss": -34.767086029052734, "global_step": 50465, "epoch": 417} {"train_loss": -34.732521057128906, "global_step": 50466, "epoch": 417} {"train_loss": -35.31298828125, "global_step": 50467, "epoch": 417} {"train_loss": -35.877220153808594, "global_step": 50468, "epoch": 417} {"train_loss": -34.49690628051758, "global_step": 50469, "epoch": 417} {"train_loss": -33.33998107910156, "global_step": 50470, "epoch": 417} {"train_loss": -32.206703186035156, "global_step": 50471, "epoch": 417} {"train_loss": -31.766233444213867, "global_step": 50472, "epoch": 417} {"train_loss": -35.14641189575195, "global_step": 50473, "epoch": 417} {"train_loss": -35.1446533203125, "global_step": 50474, "epoch": 417} {"train_loss": -33.975250244140625, "global_step": 50475, "epoch": 417} {"train_loss": -35.3746452331543, "global_step": 50476, "epoch": 417} {"train_loss": -34.379638671875, "global_step": 50477, "epoch": 417} {"train_loss": -35.59872817993164, "global_step": 50478, "epoch": 417} {"train_loss": -34.6749382019043, "global_step": 50479, "epoch": 417} {"train_loss": -35.579315185546875, "global_step": 50480, "epoch": 417} {"train_loss": -35.243709564208984, "global_step": 50481, "epoch": 417} {"train_loss": -35.66754913330078, "global_step": 50482, "epoch": 417} {"train_loss": -35.4638786315918, "global_step": 50483, "epoch": 417} {"train_loss": -35.52638626098633, "global_step": 50484, "epoch": 417} {"train_loss": -35.14678192138672, "global_step": 50485, "epoch": 417} {"train_loss": -35.8961296081543, "global_step": 50486, "epoch": 417} {"train_loss": -35.16532516479492, "global_step": 50487, "epoch": 417} {"train_loss": -35.84097671508789, "global_step": 50488, "epoch": 417} {"train_loss": -35.80439376831055, "global_step": 50489, "epoch": 417} {"train_loss": -35.65071487426758, "global_step": 50490, "epoch": 417} {"train_loss": -35.77436447143555, "global_step": 50491, "epoch": 417} {"train_loss": -34.81147003173828, "global_step": 50492, "epoch": 417} {"train_loss": -34.711578369140625, "global_step": 50493, "epoch": 417} {"train_loss": -34.10493087768555, "global_step": 50494, "epoch": 417} {"train_loss": -34.287261962890625, "global_step": 50495, "epoch": 417} {"train_loss": -32.21853256225586, "global_step": 50496, "epoch": 417} {"train_loss": -34.29230499267578, "global_step": 50497, "epoch": 417} {"train_loss": -35.35445022583008, "global_step": 50498, "epoch": 417} {"train_loss": -34.503604888916016, "global_step": 50499, "epoch": 417} {"train_loss": -33.141334533691406, "global_step": 50500, "epoch": 417} {"train_loss": -32.42709732055664, "global_step": 50501, "epoch": 417} {"train_loss": -33.85020065307617, "global_step": 50502, "epoch": 417} {"train_loss": -35.42655944824219, "global_step": 50503, "epoch": 417} {"train_loss": -32.30447006225586, "global_step": 50504, "epoch": 417} {"train_loss": -30.427799224853516, "global_step": 50505, "epoch": 417} {"train_loss": -33.793914794921875, "global_step": 50506, "epoch": 417} {"train_loss": -35.12650680541992, "global_step": 50507, "epoch": 417} {"train_loss": -32.194435119628906, "global_step": 50508, "epoch": 417} {"train_loss": -34.31291198730469, "global_step": 50509, "epoch": 417} {"train_loss": -35.19804763793945, "global_step": 50510, "epoch": 417} {"train_loss": -34.18277359008789, "global_step": 50511, "epoch": 417} {"train_loss": -35.3870849609375, "global_step": 50512, "epoch": 417} {"train_loss": -34.272308349609375, "global_step": 50513, "epoch": 417} {"train_loss": -34.242252349853516, "global_step": 50514, "epoch": 417} {"train_loss": -35.13277053833008, "global_step": 50515, "epoch": 417} {"train_loss": -35.18343734741211, "global_step": 50516, "epoch": 417} {"train_loss": -35.53657913208008, "global_step": 50517, "epoch": 417} {"train_loss": -35.717952728271484, "global_step": 50518, "epoch": 417} {"train_loss": -35.21525192260742, "global_step": 50519, "epoch": 417} {"train_loss": -35.733619689941406, "global_step": 50520, "epoch": 417} {"train_loss": -34.87922286987305, "global_step": 50521, "epoch": 417} {"train_loss": -35.78028106689453, "global_step": 50522, "epoch": 417} {"train_loss": -35.657264709472656, "global_step": 50523, "epoch": 417} {"train_loss": -35.082027435302734, "global_step": 50524, "epoch": 417} {"train_loss": -35.66787338256836, "global_step": 50525, "epoch": 417} {"train_loss": -35.121917724609375, "global_step": 50526, "epoch": 417} {"train_loss": -35.36996078491211, "global_step": 50527, "epoch": 417} {"train_loss": -35.271480560302734, "global_step": 50528, "epoch": 417} {"train_loss": -35.07157516479492, "global_step": 50529, "epoch": 417} {"train_loss": -35.80712890625, "global_step": 50530, "epoch": 417} {"train_loss": -35.521705627441406, "global_step": 50531, "epoch": 417} {"train_loss": -35.91220474243164, "global_step": 50532, "epoch": 417} {"train_loss": -36.10801696777344, "global_step": 50533, "epoch": 417} {"train_loss": -35.13764572143555, "global_step": 50534, "epoch": 417} {"train_loss": -36.071041107177734, "global_step": 50535, "epoch": 417} {"train_loss": -35.8951530456543, "global_step": 50536, "epoch": 417} {"train_loss": -35.61802291870117, "global_step": 50537, "epoch": 417} {"train_loss": -36.31560516357422, "global_step": 50538, "epoch": 417} {"train_loss": -35.48154830932617, "global_step": 50539, "epoch": 417} {"train_loss": -35.7969970703125, "global_step": 50540, "epoch": 417} {"train_loss": -35.89219284057617, "global_step": 50541, "epoch": 417} {"train_loss": -35.45280075073242, "global_step": 50542, "epoch": 417} {"train_loss": -35.93379211425781, "global_step": 50543, "epoch": 417} {"train_loss": -35.867225646972656, "global_step": 50544, "epoch": 417} {"train_loss": -36.0327033996582, "global_step": 50545, "epoch": 417} {"train_loss": -36.18037033081055, "global_step": 50546, "epoch": 417} {"train_loss": -35.940040588378906, "global_step": 50547, "epoch": 417} {"train_loss": -35.87953567504883, "global_step": 50548, "epoch": 417} {"train_loss": -36.40427780151367, "global_step": 50549, "epoch": 417} {"train_loss": -35.47624969482422, "global_step": 50550, "epoch": 417} {"train_loss": -36.344234466552734, "global_step": 50551, "epoch": 417} {"train_loss": -36.409095764160156, "global_step": 50552, "epoch": 417} {"train_loss": -35.98259353637695, "global_step": 50553, "epoch": 417} {"train_loss": -36.71682357788086, "global_step": 50554, "epoch": 417} {"train_loss": -36.09136962890625, "global_step": 50555, "epoch": 417} {"train_loss": -36.0484504699707, "global_step": 50556, "epoch": 417} {"train_loss": -36.335174560546875, "global_step": 50557, "epoch": 417} {"train_loss": -36.10902786254883, "global_step": 50558, "epoch": 417} {"train_loss": -35.31055450439453, "global_step": 50559, "epoch": 417} {"train_loss": -35.92043685913086, "global_step": 50560, "epoch": 417} {"train_loss": -36.246986389160156, "global_step": 50561, "epoch": 417} {"train_loss": -35.78179931640625, "global_step": 50562, "epoch": 417} {"train_loss": -34.06551742553711, "global_step": 50563, "epoch": 417} {"train_loss": -36.128116607666016, "global_step": 50564, "epoch": 417} {"train_loss": -34.52241134643555, "global_step": 50565, "epoch": 417} {"train_loss": -33.572784423828125, "global_step": 50566, "epoch": 417} {"train_loss": -35.99428939819336, "global_step": 50567, "epoch": 417} {"train_loss": -34.754085540771484, "global_step": 50568, "epoch": 417} {"train_loss": -33.55437088012695, "global_step": 50569, "epoch": 417} {"train_loss": -35.025062561035156, "global_step": 50570, "epoch": 417} {"train_loss": -35.621212005615234, "global_step": 50571, "epoch": 417} {"train_loss": -33.95362091064453, "global_step": 50572, "epoch": 417} {"train_loss": -33.526832580566406, "global_step": 50573, "epoch": 417} {"train_loss": -33.87767028808594, "global_step": 50574, "epoch": 417} {"train_loss": -32.98535919189453, "global_step": 50575, "epoch": 417} {"train_loss": -32.814971923828125, "global_step": 50576, "epoch": 417} {"train_loss": -35.03386343018082, "global_step": 50577, "epoch": 417, "val_loss": 2647794.75} {"train_loss": -34.44668197631836, "global_step": 50578, "epoch": 418} {"train_loss": -33.056514739990234, "global_step": 50579, "epoch": 418} {"train_loss": -30.481637954711914, "global_step": 50580, "epoch": 418} {"train_loss": -31.37298011779785, "global_step": 50581, "epoch": 418} {"train_loss": -33.59693145751953, "global_step": 50582, "epoch": 418} {"train_loss": -35.430267333984375, "global_step": 50583, "epoch": 418} {"train_loss": -32.97246170043945, "global_step": 50584, "epoch": 418} {"train_loss": -34.522789001464844, "global_step": 50585, "epoch": 418} {"train_loss": -34.98795700073242, "global_step": 50586, "epoch": 418} {"train_loss": -34.84357452392578, "global_step": 50587, "epoch": 418} {"train_loss": -35.535064697265625, "global_step": 50588, "epoch": 418} {"train_loss": -35.39741897583008, "global_step": 50589, "epoch": 418} {"train_loss": -35.50772476196289, "global_step": 50590, "epoch": 418} {"train_loss": -35.51975631713867, "global_step": 50591, "epoch": 418} {"train_loss": -35.83762741088867, "global_step": 50592, "epoch": 418} {"train_loss": -34.98500061035156, "global_step": 50593, "epoch": 418} {"train_loss": -35.520713806152344, "global_step": 50594, "epoch": 418} {"train_loss": -35.782344818115234, "global_step": 50595, "epoch": 418} {"train_loss": -35.739620208740234, "global_step": 50596, "epoch": 418} {"train_loss": -35.466217041015625, "global_step": 50597, "epoch": 418} {"train_loss": -35.54468536376953, "global_step": 50598, "epoch": 418} {"train_loss": -35.26713180541992, "global_step": 50599, "epoch": 418} {"train_loss": -35.0618782043457, "global_step": 50600, "epoch": 418} {"train_loss": -35.5108757019043, "global_step": 50601, "epoch": 418} {"train_loss": -36.04364776611328, "global_step": 50602, "epoch": 418} {"train_loss": -35.1828727722168, "global_step": 50603, "epoch": 418} {"train_loss": -35.64471435546875, "global_step": 50604, "epoch": 418} {"train_loss": -35.93595886230469, "global_step": 50605, "epoch": 418} {"train_loss": -36.31787109375, "global_step": 50606, "epoch": 418} {"train_loss": -35.68214416503906, "global_step": 50607, "epoch": 418} {"train_loss": -36.111915588378906, "global_step": 50608, "epoch": 418} {"train_loss": -36.41166305541992, "global_step": 50609, "epoch": 418} {"train_loss": -36.44875717163086, "global_step": 50610, "epoch": 418} {"train_loss": -35.791019439697266, "global_step": 50611, "epoch": 418} {"train_loss": -36.17204666137695, "global_step": 50612, "epoch": 418} {"train_loss": -35.6335563659668, "global_step": 50613, "epoch": 418} {"train_loss": -36.02378463745117, "global_step": 50614, "epoch": 418} {"train_loss": -36.1915168762207, "global_step": 50615, "epoch": 418} {"train_loss": -36.03489303588867, "global_step": 50616, "epoch": 418} {"train_loss": -36.1650390625, "global_step": 50617, "epoch": 418} {"train_loss": -36.40648651123047, "global_step": 50618, "epoch": 418} {"train_loss": -35.646785736083984, "global_step": 50619, "epoch": 418} {"train_loss": -35.146514892578125, "global_step": 50620, "epoch": 418} {"train_loss": -34.87360763549805, "global_step": 50621, "epoch": 418} {"train_loss": -33.35987854003906, "global_step": 50622, "epoch": 418} {"train_loss": -32.406341552734375, "global_step": 50623, "epoch": 418} {"train_loss": -33.874202728271484, "global_step": 50624, "epoch": 418} {"train_loss": -35.758270263671875, "global_step": 50625, "epoch": 418} {"train_loss": -31.0869197845459, "global_step": 50626, "epoch": 418} {"train_loss": -28.553442001342773, "global_step": 50627, "epoch": 418} {"train_loss": -24.92792320251465, "global_step": 50628, "epoch": 418} {"train_loss": -28.72791862487793, "global_step": 50629, "epoch": 418} {"train_loss": -30.398401260375977, "global_step": 50630, "epoch": 418} {"train_loss": -32.15657424926758, "global_step": 50631, "epoch": 418} {"train_loss": -34.637969970703125, "global_step": 50632, "epoch": 418} {"train_loss": -33.59061813354492, "global_step": 50633, "epoch": 418} {"train_loss": -33.03321075439453, "global_step": 50634, "epoch": 418} {"train_loss": -34.91339111328125, "global_step": 50635, "epoch": 418} {"train_loss": -32.87482833862305, "global_step": 50636, "epoch": 418} {"train_loss": -34.6464729309082, "global_step": 50637, "epoch": 418} {"train_loss": -33.96167755126953, "global_step": 50638, "epoch": 418} {"train_loss": -34.73079299926758, "global_step": 50639, "epoch": 418} {"train_loss": -34.94059753417969, "global_step": 50640, "epoch": 418} {"train_loss": -34.588356018066406, "global_step": 50641, "epoch": 418} {"train_loss": -35.32841873168945, "global_step": 50642, "epoch": 418} {"train_loss": -35.27523422241211, "global_step": 50643, "epoch": 418} {"train_loss": -35.23765182495117, "global_step": 50644, "epoch": 418} {"train_loss": -34.52842330932617, "global_step": 50645, "epoch": 418} {"train_loss": -36.15963363647461, "global_step": 50646, "epoch": 418} {"train_loss": -35.15607833862305, "global_step": 50647, "epoch": 418} {"train_loss": -35.87359619140625, "global_step": 50648, "epoch": 418} {"train_loss": -34.992122650146484, "global_step": 50649, "epoch": 418} {"train_loss": -35.605987548828125, "global_step": 50650, "epoch": 418} {"train_loss": -35.7485466003418, "global_step": 50651, "epoch": 418} {"train_loss": -35.60770797729492, "global_step": 50652, "epoch": 418} {"train_loss": -35.82536697387695, "global_step": 50653, "epoch": 418} {"train_loss": -35.864532470703125, "global_step": 50654, "epoch": 418} {"train_loss": -35.03430938720703, "global_step": 50655, "epoch": 418} {"train_loss": -35.18142318725586, "global_step": 50656, "epoch": 418} {"train_loss": -35.168487548828125, "global_step": 50657, "epoch": 418} {"train_loss": -35.62481689453125, "global_step": 50658, "epoch": 418} {"train_loss": -35.34571075439453, "global_step": 50659, "epoch": 418} {"train_loss": -34.92332077026367, "global_step": 50660, "epoch": 418} {"train_loss": -34.996429443359375, "global_step": 50661, "epoch": 418} {"train_loss": -34.844268798828125, "global_step": 50662, "epoch": 418} {"train_loss": -35.688480377197266, "global_step": 50663, "epoch": 418} {"train_loss": -35.720455169677734, "global_step": 50664, "epoch": 418} {"train_loss": -36.302860260009766, "global_step": 50665, "epoch": 418} {"train_loss": -36.03969192504883, "global_step": 50666, "epoch": 418} {"train_loss": -36.080665588378906, "global_step": 50667, "epoch": 418} {"train_loss": -35.857818603515625, "global_step": 50668, "epoch": 418} {"train_loss": -35.858856201171875, "global_step": 50669, "epoch": 418} {"train_loss": -35.8077507019043, "global_step": 50670, "epoch": 418} {"train_loss": -35.95002365112305, "global_step": 50671, "epoch": 418} {"train_loss": -36.28169631958008, "global_step": 50672, "epoch": 418} {"train_loss": -36.196563720703125, "global_step": 50673, "epoch": 418} {"train_loss": -36.2380485534668, "global_step": 50674, "epoch": 418} {"train_loss": -36.0293083190918, "global_step": 50675, "epoch": 418} {"train_loss": -35.8719596862793, "global_step": 50676, "epoch": 418} {"train_loss": -36.18072509765625, "global_step": 50677, "epoch": 418} {"train_loss": -36.13680648803711, "global_step": 50678, "epoch": 418} {"train_loss": -36.13654327392578, "global_step": 50679, "epoch": 418} {"train_loss": -35.965389251708984, "global_step": 50680, "epoch": 418} {"train_loss": -35.92985916137695, "global_step": 50681, "epoch": 418} {"train_loss": -36.308692932128906, "global_step": 50682, "epoch": 418} {"train_loss": -36.406978607177734, "global_step": 50683, "epoch": 418} {"train_loss": -35.86954116821289, "global_step": 50684, "epoch": 418} {"train_loss": -36.71387481689453, "global_step": 50685, "epoch": 418} {"train_loss": -36.49949264526367, "global_step": 50686, "epoch": 418} {"train_loss": -35.89863204956055, "global_step": 50687, "epoch": 418} {"train_loss": -35.842586517333984, "global_step": 50688, "epoch": 418} {"train_loss": -34.167083740234375, "global_step": 50689, "epoch": 418} {"train_loss": -33.92513656616211, "global_step": 50690, "epoch": 418} {"train_loss": -33.97380447387695, "global_step": 50691, "epoch": 418} {"train_loss": -33.846832275390625, "global_step": 50692, "epoch": 418} {"train_loss": -32.50328826904297, "global_step": 50693, "epoch": 418} {"train_loss": -34.76824951171875, "global_step": 50694, "epoch": 418} {"train_loss": -35.23416519165039, "global_step": 50695, "epoch": 418} {"train_loss": -34.41508102416992, "global_step": 50696, "epoch": 418} {"train_loss": -34.93605041503906, "global_step": 50697, "epoch": 418} {"train_loss": -34.935498560755704, "global_step": 50698, "epoch": 418, "val_loss": 2642722.25} {"train_loss": -35.260616302490234, "global_step": 50699, "epoch": 419} {"train_loss": -34.68132400512695, "global_step": 50700, "epoch": 419} {"train_loss": -35.32533645629883, "global_step": 50701, "epoch": 419} {"train_loss": -34.789337158203125, "global_step": 50702, "epoch": 419} {"train_loss": -36.04542922973633, "global_step": 50703, "epoch": 419} {"train_loss": -35.1018180847168, "global_step": 50704, "epoch": 419} {"train_loss": -34.77126693725586, "global_step": 50705, "epoch": 419} {"train_loss": -31.574832916259766, "global_step": 50706, "epoch": 419} {"train_loss": -34.8608512878418, "global_step": 50707, "epoch": 419} {"train_loss": -34.9310188293457, "global_step": 50708, "epoch": 419} {"train_loss": -34.39902877807617, "global_step": 50709, "epoch": 419} {"train_loss": -34.62098693847656, "global_step": 50710, "epoch": 419} {"train_loss": -34.85987854003906, "global_step": 50711, "epoch": 419} {"train_loss": -4.885433197021484, "global_step": 50712, "epoch": 419} {"train_loss": -33.55342102050781, "global_step": 50713, "epoch": 419} {"train_loss": -13.105814933776855, "global_step": 50714, "epoch": 419} {"train_loss": -29.65753746032715, "global_step": 50715, "epoch": 419} {"train_loss": -27.36404800415039, "global_step": 50716, "epoch": 419} {"train_loss": -29.762109756469727, "global_step": 50717, "epoch": 419} {"train_loss": -28.98798942565918, "global_step": 50718, "epoch": 419} {"train_loss": -27.8867130279541, "global_step": 50719, "epoch": 419} {"train_loss": -27.838773727416992, "global_step": 50720, "epoch": 419} {"train_loss": -29.127424240112305, "global_step": 50721, "epoch": 419} {"train_loss": -31.128843307495117, "global_step": 50722, "epoch": 419} {"train_loss": -29.256183624267578, "global_step": 50723, "epoch": 419} {"train_loss": -30.203418731689453, "global_step": 50724, "epoch": 419} {"train_loss": -31.100589752197266, "global_step": 50725, "epoch": 419} {"train_loss": -30.72847557067871, "global_step": 50726, "epoch": 419} {"train_loss": -29.9823055267334, "global_step": 50727, "epoch": 419} {"train_loss": -31.402185440063477, "global_step": 50728, "epoch": 419} {"train_loss": -31.976932525634766, "global_step": 50729, "epoch": 419} {"train_loss": -31.468454360961914, "global_step": 50730, "epoch": 419} {"train_loss": -30.796667098999023, "global_step": 50731, "epoch": 419} {"train_loss": -32.26079559326172, "global_step": 50732, "epoch": 419} {"train_loss": -30.541614532470703, "global_step": 50733, "epoch": 419} {"train_loss": -32.10567855834961, "global_step": 50734, "epoch": 419} {"train_loss": -31.788440704345703, "global_step": 50735, "epoch": 419} {"train_loss": -31.946393966674805, "global_step": 50736, "epoch": 419} {"train_loss": -32.33246994018555, "global_step": 50737, "epoch": 419} {"train_loss": -32.3621711730957, "global_step": 50738, "epoch": 419} {"train_loss": -32.083168029785156, "global_step": 50739, "epoch": 419} {"train_loss": -32.513587951660156, "global_step": 50740, "epoch": 419} {"train_loss": -32.05147171020508, "global_step": 50741, "epoch": 419} {"train_loss": -32.25771713256836, "global_step": 50742, "epoch": 419} {"train_loss": -32.716060638427734, "global_step": 50743, "epoch": 419} {"train_loss": -32.69641876220703, "global_step": 50744, "epoch": 419} {"train_loss": -32.2536506652832, "global_step": 50745, "epoch": 419} {"train_loss": -33.13294219970703, "global_step": 50746, "epoch": 419} {"train_loss": -33.22472381591797, "global_step": 50747, "epoch": 419} {"train_loss": -32.78963088989258, "global_step": 50748, "epoch": 419} {"train_loss": -32.8266716003418, "global_step": 50749, "epoch": 419} {"train_loss": -32.53550720214844, "global_step": 50750, "epoch": 419} {"train_loss": -32.07884979248047, "global_step": 50751, "epoch": 419} {"train_loss": -32.50765609741211, "global_step": 50752, "epoch": 419} {"train_loss": -33.71798324584961, "global_step": 50753, "epoch": 419} {"train_loss": -33.111236572265625, "global_step": 50754, "epoch": 419} {"train_loss": -33.43113708496094, "global_step": 50755, "epoch": 419} {"train_loss": -33.70176315307617, "global_step": 50756, "epoch": 419} {"train_loss": -33.518165588378906, "global_step": 50757, "epoch": 419} {"train_loss": -32.80238342285156, "global_step": 50758, "epoch": 419} {"train_loss": -33.98842239379883, "global_step": 50759, "epoch": 419} {"train_loss": -33.1262321472168, "global_step": 50760, "epoch": 419} {"train_loss": -33.8907470703125, "global_step": 50761, "epoch": 419} {"train_loss": -34.00349807739258, "global_step": 50762, "epoch": 419} {"train_loss": -34.39413833618164, "global_step": 50763, "epoch": 419} {"train_loss": -33.41218948364258, "global_step": 50764, "epoch": 419} {"train_loss": -34.166603088378906, "global_step": 50765, "epoch": 419} {"train_loss": -34.086360931396484, "global_step": 50766, "epoch": 419} {"train_loss": -34.00980758666992, "global_step": 50767, "epoch": 419} {"train_loss": -34.07293701171875, "global_step": 50768, "epoch": 419} {"train_loss": -34.446617126464844, "global_step": 50769, "epoch": 419} {"train_loss": -34.7071418762207, "global_step": 50770, "epoch": 419} {"train_loss": -34.42173385620117, "global_step": 50771, "epoch": 419} {"train_loss": -34.28567123413086, "global_step": 50772, "epoch": 419} {"train_loss": -34.5105094909668, "global_step": 50773, "epoch": 419} {"train_loss": -34.127567291259766, "global_step": 50774, "epoch": 419} {"train_loss": -34.033138275146484, "global_step": 50775, "epoch": 419} {"train_loss": -34.74393844604492, "global_step": 50776, "epoch": 419} {"train_loss": -34.34511184692383, "global_step": 50777, "epoch": 419} {"train_loss": -34.68150329589844, "global_step": 50778, "epoch": 419} {"train_loss": -35.11445236206055, "global_step": 50779, "epoch": 419} {"train_loss": -34.60095977783203, "global_step": 50780, "epoch": 419} {"train_loss": -34.43812561035156, "global_step": 50781, "epoch": 419} {"train_loss": -34.69371795654297, "global_step": 50782, "epoch": 419} {"train_loss": -33.71770095825195, "global_step": 50783, "epoch": 419} {"train_loss": -32.51295852661133, "global_step": 50784, "epoch": 419} {"train_loss": -29.838134765625, "global_step": 50785, "epoch": 419} {"train_loss": -21.0728816986084, "global_step": 50786, "epoch": 419} {"train_loss": -12.907190322875977, "global_step": 50787, "epoch": 419} {"train_loss": -9.485869407653809, "global_step": 50788, "epoch": 419} {"train_loss": -31.525476455688477, "global_step": 50789, "epoch": 419} {"train_loss": -27.871423721313477, "global_step": 50790, "epoch": 419} {"train_loss": -31.29463005065918, "global_step": 50791, "epoch": 419} {"train_loss": -30.634265899658203, "global_step": 50792, "epoch": 419} {"train_loss": -32.7952995300293, "global_step": 50793, "epoch": 419} {"train_loss": -31.14896583557129, "global_step": 50794, "epoch": 419} {"train_loss": -34.41826248168945, "global_step": 50795, "epoch": 419} {"train_loss": -31.951635360717773, "global_step": 50796, "epoch": 419} {"train_loss": -32.924591064453125, "global_step": 50797, "epoch": 419} {"train_loss": -34.74325180053711, "global_step": 50798, "epoch": 419} {"train_loss": -33.44694519042969, "global_step": 50799, "epoch": 419} {"train_loss": -33.05294418334961, "global_step": 50800, "epoch": 419} {"train_loss": -34.294097900390625, "global_step": 50801, "epoch": 419} {"train_loss": -34.10517120361328, "global_step": 50802, "epoch": 419} {"train_loss": -33.55903244018555, "global_step": 50803, "epoch": 419} {"train_loss": -34.16310501098633, "global_step": 50804, "epoch": 419} {"train_loss": -34.84147644042969, "global_step": 50805, "epoch": 419} {"train_loss": -33.8115348815918, "global_step": 50806, "epoch": 419} {"train_loss": -34.02415084838867, "global_step": 50807, "epoch": 419} {"train_loss": -34.72407150268555, "global_step": 50808, "epoch": 419} {"train_loss": -33.71165084838867, "global_step": 50809, "epoch": 419} {"train_loss": -34.505126953125, "global_step": 50810, "epoch": 419} {"train_loss": -34.37712478637695, "global_step": 50811, "epoch": 419} {"train_loss": -34.019046783447266, "global_step": 50812, "epoch": 419} {"train_loss": -35.05488204956055, "global_step": 50813, "epoch": 419} {"train_loss": -34.412811279296875, "global_step": 50814, "epoch": 419} {"train_loss": -34.575923919677734, "global_step": 50815, "epoch": 419} {"train_loss": -34.704463958740234, "global_step": 50816, "epoch": 419} {"train_loss": -34.30349349975586, "global_step": 50817, "epoch": 419} {"train_loss": -35.48594284057617, "global_step": 50818, "epoch": 419} {"train_loss": -32.16500717352245, "global_step": 50819, "epoch": 419, "val_loss": 2657297.0} {"train_loss": -34.97942352294922, "global_step": 50820, "epoch": 420} {"train_loss": -34.7193489074707, "global_step": 50821, "epoch": 420} {"train_loss": -35.04935836791992, "global_step": 50822, "epoch": 420} {"train_loss": -34.78757858276367, "global_step": 50823, "epoch": 420} {"train_loss": -35.3111686706543, "global_step": 50824, "epoch": 420} {"train_loss": -35.35927200317383, "global_step": 50825, "epoch": 420} {"train_loss": -35.526947021484375, "global_step": 50826, "epoch": 420} {"train_loss": -35.64195251464844, "global_step": 50827, "epoch": 420} {"train_loss": -35.412689208984375, "global_step": 50828, "epoch": 420} {"train_loss": -35.04174041748047, "global_step": 50829, "epoch": 420} {"train_loss": -35.1953125, "global_step": 50830, "epoch": 420} {"train_loss": -35.555145263671875, "global_step": 50831, "epoch": 420} {"train_loss": -35.55820846557617, "global_step": 50832, "epoch": 420} {"train_loss": -35.3188362121582, "global_step": 50833, "epoch": 420} {"train_loss": -35.457157135009766, "global_step": 50834, "epoch": 420} {"train_loss": -35.681514739990234, "global_step": 50835, "epoch": 420} {"train_loss": -35.441070556640625, "global_step": 50836, "epoch": 420} {"train_loss": -34.9640998840332, "global_step": 50837, "epoch": 420} {"train_loss": -35.14051055908203, "global_step": 50838, "epoch": 420} {"train_loss": -36.01893997192383, "global_step": 50839, "epoch": 420} {"train_loss": -34.77194595336914, "global_step": 50840, "epoch": 420} {"train_loss": -34.75871276855469, "global_step": 50841, "epoch": 420} {"train_loss": -34.95235061645508, "global_step": 50842, "epoch": 420} {"train_loss": -34.37207794189453, "global_step": 50843, "epoch": 420} {"train_loss": -34.006980895996094, "global_step": 50844, "epoch": 420} {"train_loss": -32.19926452636719, "global_step": 50845, "epoch": 420} {"train_loss": -25.6694278717041, "global_step": 50846, "epoch": 420} {"train_loss": -17.421140670776367, "global_step": 50847, "epoch": 420} {"train_loss": -16.388185501098633, "global_step": 50848, "epoch": 420} {"train_loss": -31.559167861938477, "global_step": 50849, "epoch": 420} {"train_loss": -25.673437118530273, "global_step": 50850, "epoch": 420} {"train_loss": -29.65260124206543, "global_step": 50851, "epoch": 420} {"train_loss": -30.259321212768555, "global_step": 50852, "epoch": 420} {"train_loss": -31.448572158813477, "global_step": 50853, "epoch": 420} {"train_loss": -29.289581298828125, "global_step": 50854, "epoch": 420} {"train_loss": -34.414798736572266, "global_step": 50855, "epoch": 420} {"train_loss": -32.30117416381836, "global_step": 50856, "epoch": 420} {"train_loss": -31.7457332611084, "global_step": 50857, "epoch": 420} {"train_loss": -33.72587203979492, "global_step": 50858, "epoch": 420} {"train_loss": -33.62331771850586, "global_step": 50859, "epoch": 420} {"train_loss": -31.948577880859375, "global_step": 50860, "epoch": 420} {"train_loss": -33.36785888671875, "global_step": 50861, "epoch": 420} {"train_loss": -34.01282501220703, "global_step": 50862, "epoch": 420} {"train_loss": -34.11165237426758, "global_step": 50863, "epoch": 420} {"train_loss": -32.88335037231445, "global_step": 50864, "epoch": 420} {"train_loss": -34.069236755371094, "global_step": 50865, "epoch": 420} {"train_loss": -34.26505661010742, "global_step": 50866, "epoch": 420} {"train_loss": -34.174190521240234, "global_step": 50867, "epoch": 420} {"train_loss": -34.12763214111328, "global_step": 50868, "epoch": 420} {"train_loss": -33.72645950317383, "global_step": 50869, "epoch": 420} {"train_loss": -34.00861740112305, "global_step": 50870, "epoch": 420} {"train_loss": -34.483123779296875, "global_step": 50871, "epoch": 420} {"train_loss": -34.64622497558594, "global_step": 50872, "epoch": 420} {"train_loss": -33.986568450927734, "global_step": 50873, "epoch": 420} {"train_loss": -34.544498443603516, "global_step": 50874, "epoch": 420} {"train_loss": -34.35320281982422, "global_step": 50875, "epoch": 420} {"train_loss": -34.148773193359375, "global_step": 50876, "epoch": 420} {"train_loss": -34.8425407409668, "global_step": 50877, "epoch": 420} {"train_loss": -34.603633880615234, "global_step": 50878, "epoch": 420} {"train_loss": -34.60934066772461, "global_step": 50879, "epoch": 420} {"train_loss": -34.34121322631836, "global_step": 50880, "epoch": 420} {"train_loss": -33.94126510620117, "global_step": 50881, "epoch": 420} {"train_loss": -34.389259338378906, "global_step": 50882, "epoch": 420} {"train_loss": -35.02142333984375, "global_step": 50883, "epoch": 420} {"train_loss": -35.015350341796875, "global_step": 50884, "epoch": 420} {"train_loss": -34.17803955078125, "global_step": 50885, "epoch": 420} {"train_loss": -34.7338981628418, "global_step": 50886, "epoch": 420} {"train_loss": -34.43369674682617, "global_step": 50887, "epoch": 420} {"train_loss": -34.74565887451172, "global_step": 50888, "epoch": 420} {"train_loss": -34.56951904296875, "global_step": 50889, "epoch": 420} {"train_loss": -35.02337646484375, "global_step": 50890, "epoch": 420} {"train_loss": -34.78690719604492, "global_step": 50891, "epoch": 420} {"train_loss": -34.3538818359375, "global_step": 50892, "epoch": 420} {"train_loss": -34.457130432128906, "global_step": 50893, "epoch": 420} {"train_loss": -34.257930755615234, "global_step": 50894, "epoch": 420} {"train_loss": -34.33341598510742, "global_step": 50895, "epoch": 420} {"train_loss": -35.34584426879883, "global_step": 50896, "epoch": 420} {"train_loss": -34.884056091308594, "global_step": 50897, "epoch": 420} {"train_loss": -34.89406967163086, "global_step": 50898, "epoch": 420} {"train_loss": -34.23115921020508, "global_step": 50899, "epoch": 420} {"train_loss": -34.017513275146484, "global_step": 50900, "epoch": 420} {"train_loss": -33.025291442871094, "global_step": 50901, "epoch": 420} {"train_loss": -33.51280212402344, "global_step": 50902, "epoch": 420} {"train_loss": -35.092586517333984, "global_step": 50903, "epoch": 420} {"train_loss": -35.11845016479492, "global_step": 50904, "epoch": 420} {"train_loss": -33.44304275512695, "global_step": 50905, "epoch": 420} {"train_loss": -32.14014434814453, "global_step": 50906, "epoch": 420} {"train_loss": -32.32892990112305, "global_step": 50907, "epoch": 420} {"train_loss": -34.621612548828125, "global_step": 50908, "epoch": 420} {"train_loss": -33.51754379272461, "global_step": 50909, "epoch": 420} {"train_loss": -33.30222702026367, "global_step": 50910, "epoch": 420} {"train_loss": -35.4860954284668, "global_step": 50911, "epoch": 420} {"train_loss": -33.415374755859375, "global_step": 50912, "epoch": 420} {"train_loss": -34.52413558959961, "global_step": 50913, "epoch": 420} {"train_loss": -34.44992446899414, "global_step": 50914, "epoch": 420} {"train_loss": -34.30733871459961, "global_step": 50915, "epoch": 420} {"train_loss": -34.4337158203125, "global_step": 50916, "epoch": 420} {"train_loss": -35.1903076171875, "global_step": 50917, "epoch": 420} {"train_loss": -34.196502685546875, "global_step": 50918, "epoch": 420} {"train_loss": -34.88702392578125, "global_step": 50919, "epoch": 420} {"train_loss": -34.563507080078125, "global_step": 50920, "epoch": 420} {"train_loss": -35.204463958740234, "global_step": 50921, "epoch": 420} {"train_loss": -35.00093078613281, "global_step": 50922, "epoch": 420} {"train_loss": -34.69317626953125, "global_step": 50923, "epoch": 420} {"train_loss": -34.683998107910156, "global_step": 50924, "epoch": 420} {"train_loss": -34.28913879394531, "global_step": 50925, "epoch": 420} {"train_loss": -34.819732666015625, "global_step": 50926, "epoch": 420} {"train_loss": -35.1805534362793, "global_step": 50927, "epoch": 420} {"train_loss": -34.99164962768555, "global_step": 50928, "epoch": 420} {"train_loss": -35.243743896484375, "global_step": 50929, "epoch": 420} {"train_loss": -34.84429931640625, "global_step": 50930, "epoch": 420} {"train_loss": -35.090667724609375, "global_step": 50931, "epoch": 420} {"train_loss": -35.19447708129883, "global_step": 50932, "epoch": 420} {"train_loss": -35.81467056274414, "global_step": 50933, "epoch": 420} {"train_loss": -35.068241119384766, "global_step": 50934, "epoch": 420} {"train_loss": -35.20376205444336, "global_step": 50935, "epoch": 420} {"train_loss": -35.65108871459961, "global_step": 50936, "epoch": 420} {"train_loss": -35.528194427490234, "global_step": 50937, "epoch": 420} {"train_loss": -35.39774703979492, "global_step": 50938, "epoch": 420} {"train_loss": -34.94671630859375, "global_step": 50939, "epoch": 420} {"train_loss": -33.925962763384355, "global_step": 50940, "epoch": 420, "val_loss": 2696797.0} {"train_loss": -34.7108154296875, "global_step": 50941, "epoch": 421} {"train_loss": -34.623653411865234, "global_step": 50942, "epoch": 421} {"train_loss": -34.896949768066406, "global_step": 50943, "epoch": 421} {"train_loss": -34.869873046875, "global_step": 50944, "epoch": 421} {"train_loss": -35.04903793334961, "global_step": 50945, "epoch": 421} {"train_loss": -34.14962387084961, "global_step": 50946, "epoch": 421} {"train_loss": -35.058837890625, "global_step": 50947, "epoch": 421} {"train_loss": -34.73185348510742, "global_step": 50948, "epoch": 421} {"train_loss": -34.22718811035156, "global_step": 50949, "epoch": 421} {"train_loss": -35.2286262512207, "global_step": 50950, "epoch": 421} {"train_loss": -34.5985107421875, "global_step": 50951, "epoch": 421} {"train_loss": -35.44477844238281, "global_step": 50952, "epoch": 421} {"train_loss": -34.268157958984375, "global_step": 50953, "epoch": 421} {"train_loss": -34.45526885986328, "global_step": 50954, "epoch": 421} {"train_loss": -34.59370422363281, "global_step": 50955, "epoch": 421} {"train_loss": -34.5406379699707, "global_step": 50956, "epoch": 421} {"train_loss": -34.34849166870117, "global_step": 50957, "epoch": 421} {"train_loss": -34.981422424316406, "global_step": 50958, "epoch": 421} {"train_loss": -35.68585968017578, "global_step": 50959, "epoch": 421} {"train_loss": -34.37128448486328, "global_step": 50960, "epoch": 421} {"train_loss": -34.81791305541992, "global_step": 50961, "epoch": 421} {"train_loss": -35.45314407348633, "global_step": 50962, "epoch": 421} {"train_loss": -35.005104064941406, "global_step": 50963, "epoch": 421} {"train_loss": -35.16219711303711, "global_step": 50964, "epoch": 421} {"train_loss": -34.938114166259766, "global_step": 50965, "epoch": 421} {"train_loss": -35.37869644165039, "global_step": 50966, "epoch": 421} {"train_loss": -35.19623947143555, "global_step": 50967, "epoch": 421} {"train_loss": -35.070213317871094, "global_step": 50968, "epoch": 421} {"train_loss": -34.95595169067383, "global_step": 50969, "epoch": 421} {"train_loss": -35.30665969848633, "global_step": 50970, "epoch": 421} {"train_loss": -35.588626861572266, "global_step": 50971, "epoch": 421} {"train_loss": -35.40633010864258, "global_step": 50972, "epoch": 421} {"train_loss": -35.48664855957031, "global_step": 50973, "epoch": 421} {"train_loss": -35.326255798339844, "global_step": 50974, "epoch": 421} {"train_loss": -35.10983657836914, "global_step": 50975, "epoch": 421} {"train_loss": -35.27851104736328, "global_step": 50976, "epoch": 421} {"train_loss": -35.64131546020508, "global_step": 50977, "epoch": 421} {"train_loss": -35.035118103027344, "global_step": 50978, "epoch": 421} {"train_loss": -34.041748046875, "global_step": 50979, "epoch": 421} {"train_loss": -34.26039123535156, "global_step": 50980, "epoch": 421} {"train_loss": -32.43293380737305, "global_step": 50981, "epoch": 421} {"train_loss": -32.371341705322266, "global_step": 50982, "epoch": 421} {"train_loss": -35.341732025146484, "global_step": 50983, "epoch": 421} {"train_loss": -33.8125114440918, "global_step": 50984, "epoch": 421} {"train_loss": -35.0797119140625, "global_step": 50985, "epoch": 421} {"train_loss": -34.03264236450195, "global_step": 50986, "epoch": 421} {"train_loss": -34.72447204589844, "global_step": 50987, "epoch": 421} {"train_loss": -35.1218147277832, "global_step": 50988, "epoch": 421} {"train_loss": -34.620758056640625, "global_step": 50989, "epoch": 421} {"train_loss": -34.82648849487305, "global_step": 50990, "epoch": 421} {"train_loss": -35.22144317626953, "global_step": 50991, "epoch": 421} {"train_loss": -34.61023712158203, "global_step": 50992, "epoch": 421} {"train_loss": -33.99580001831055, "global_step": 50993, "epoch": 421} {"train_loss": -33.75827407836914, "global_step": 50994, "epoch": 421} {"train_loss": -33.501548767089844, "global_step": 50995, "epoch": 421} {"train_loss": -33.3863410949707, "global_step": 50996, "epoch": 421} {"train_loss": -34.253658294677734, "global_step": 50997, "epoch": 421} {"train_loss": -34.0159797668457, "global_step": 50998, "epoch": 421} {"train_loss": -34.15340805053711, "global_step": 50999, "epoch": 421} {"train_loss": -33.9097900390625, "global_step": 51000, "epoch": 421} {"train_loss": -34.444923400878906, "global_step": 51001, "epoch": 421} {"train_loss": -33.89488220214844, "global_step": 51002, "epoch": 421} {"train_loss": -34.0174674987793, "global_step": 51003, "epoch": 421} {"train_loss": -34.444984436035156, "global_step": 51004, "epoch": 421} {"train_loss": -33.419002532958984, "global_step": 51005, "epoch": 421} {"train_loss": -34.404903411865234, "global_step": 51006, "epoch": 421} {"train_loss": -34.484500885009766, "global_step": 51007, "epoch": 421} {"train_loss": -33.678192138671875, "global_step": 51008, "epoch": 421} {"train_loss": -34.389156341552734, "global_step": 51009, "epoch": 421} {"train_loss": -33.95328140258789, "global_step": 51010, "epoch": 421} {"train_loss": -34.97908401489258, "global_step": 51011, "epoch": 421} {"train_loss": -34.861942291259766, "global_step": 51012, "epoch": 421} {"train_loss": -35.276153564453125, "global_step": 51013, "epoch": 421} {"train_loss": -34.338321685791016, "global_step": 51014, "epoch": 421} {"train_loss": -34.83278274536133, "global_step": 51015, "epoch": 421} {"train_loss": -34.712799072265625, "global_step": 51016, "epoch": 421} {"train_loss": -35.41049575805664, "global_step": 51017, "epoch": 421} {"train_loss": -35.060211181640625, "global_step": 51018, "epoch": 421} {"train_loss": -34.799381256103516, "global_step": 51019, "epoch": 421} {"train_loss": -34.615901947021484, "global_step": 51020, "epoch": 421} {"train_loss": -35.35170364379883, "global_step": 51021, "epoch": 421} {"train_loss": -35.204280853271484, "global_step": 51022, "epoch": 421} {"train_loss": -34.7357292175293, "global_step": 51023, "epoch": 421} {"train_loss": -35.30592727661133, "global_step": 51024, "epoch": 421} {"train_loss": -35.398990631103516, "global_step": 51025, "epoch": 421} {"train_loss": -35.29859161376953, "global_step": 51026, "epoch": 421} {"train_loss": -35.582698822021484, "global_step": 51027, "epoch": 421} {"train_loss": -35.375972747802734, "global_step": 51028, "epoch": 421} {"train_loss": -35.239288330078125, "global_step": 51029, "epoch": 421} {"train_loss": -35.86096954345703, "global_step": 51030, "epoch": 421} {"train_loss": -35.57462692260742, "global_step": 51031, "epoch": 421} {"train_loss": -35.45359420776367, "global_step": 51032, "epoch": 421} {"train_loss": -35.32407760620117, "global_step": 51033, "epoch": 421} {"train_loss": -35.56207275390625, "global_step": 51034, "epoch": 421} {"train_loss": -35.76898956298828, "global_step": 51035, "epoch": 421} {"train_loss": -35.82908248901367, "global_step": 51036, "epoch": 421} {"train_loss": -35.41189193725586, "global_step": 51037, "epoch": 421} {"train_loss": -35.95551681518555, "global_step": 51038, "epoch": 421} {"train_loss": -35.77512741088867, "global_step": 51039, "epoch": 421} {"train_loss": -35.930145263671875, "global_step": 51040, "epoch": 421} {"train_loss": -35.400489807128906, "global_step": 51041, "epoch": 421} {"train_loss": -35.45574188232422, "global_step": 51042, "epoch": 421} {"train_loss": -35.34292221069336, "global_step": 51043, "epoch": 421} {"train_loss": -35.52421951293945, "global_step": 51044, "epoch": 421} {"train_loss": -35.61885452270508, "global_step": 51045, "epoch": 421} {"train_loss": -35.92167282104492, "global_step": 51046, "epoch": 421} {"train_loss": -36.199424743652344, "global_step": 51047, "epoch": 421} {"train_loss": -35.83753204345703, "global_step": 51048, "epoch": 421} {"train_loss": -36.2086296081543, "global_step": 51049, "epoch": 421} {"train_loss": -35.78357696533203, "global_step": 51050, "epoch": 421} {"train_loss": -35.96804428100586, "global_step": 51051, "epoch": 421} {"train_loss": -36.268985748291016, "global_step": 51052, "epoch": 421} {"train_loss": -35.87031555175781, "global_step": 51053, "epoch": 421} {"train_loss": -35.99625778198242, "global_step": 51054, "epoch": 421} {"train_loss": -36.32950973510742, "global_step": 51055, "epoch": 421} {"train_loss": -36.336692810058594, "global_step": 51056, "epoch": 421} {"train_loss": -36.20882797241211, "global_step": 51057, "epoch": 421} {"train_loss": -35.38018798828125, "global_step": 51058, "epoch": 421} {"train_loss": -35.723487854003906, "global_step": 51059, "epoch": 421} {"train_loss": -34.86775207519531, "global_step": 51060, "epoch": 421} {"train_loss": -34.96981783149656, "global_step": 51061, "epoch": 421, "val_loss": 2666628.25} {"train_loss": -32.5335693359375, "global_step": 51062, "epoch": 422} {"train_loss": -26.615528106689453, "global_step": 51063, "epoch": 422} {"train_loss": -24.341577529907227, "global_step": 51064, "epoch": 422} {"train_loss": -28.835357666015625, "global_step": 51065, "epoch": 422} {"train_loss": -34.66907501220703, "global_step": 51066, "epoch": 422} {"train_loss": -31.511945724487305, "global_step": 51067, "epoch": 422} {"train_loss": -32.03507995605469, "global_step": 51068, "epoch": 422} {"train_loss": -33.84334945678711, "global_step": 51069, "epoch": 422} {"train_loss": -34.0416374206543, "global_step": 51070, "epoch": 422} {"train_loss": -33.736995697021484, "global_step": 51071, "epoch": 422} {"train_loss": -33.78828048706055, "global_step": 51072, "epoch": 422} {"train_loss": -33.66395950317383, "global_step": 51073, "epoch": 422} {"train_loss": -34.73876190185547, "global_step": 51074, "epoch": 422} {"train_loss": -34.283546447753906, "global_step": 51075, "epoch": 422} {"train_loss": -35.28789138793945, "global_step": 51076, "epoch": 422} {"train_loss": -34.388851165771484, "global_step": 51077, "epoch": 422} {"train_loss": -35.2251091003418, "global_step": 51078, "epoch": 422} {"train_loss": -34.99055862426758, "global_step": 51079, "epoch": 422} {"train_loss": -34.796836853027344, "global_step": 51080, "epoch": 422} {"train_loss": -35.14420700073242, "global_step": 51081, "epoch": 422} {"train_loss": -35.15827178955078, "global_step": 51082, "epoch": 422} {"train_loss": -35.15488815307617, "global_step": 51083, "epoch": 422} {"train_loss": -34.7220573425293, "global_step": 51084, "epoch": 422} {"train_loss": -34.90135955810547, "global_step": 51085, "epoch": 422} {"train_loss": -35.15926742553711, "global_step": 51086, "epoch": 422} {"train_loss": -35.045310974121094, "global_step": 51087, "epoch": 422} {"train_loss": -34.277767181396484, "global_step": 51088, "epoch": 422} {"train_loss": -35.299346923828125, "global_step": 51089, "epoch": 422} {"train_loss": -35.51165008544922, "global_step": 51090, "epoch": 422} {"train_loss": -35.34016036987305, "global_step": 51091, "epoch": 422} {"train_loss": -35.81345748901367, "global_step": 51092, "epoch": 422} {"train_loss": -35.885189056396484, "global_step": 51093, "epoch": 422} {"train_loss": -35.436851501464844, "global_step": 51094, "epoch": 422} {"train_loss": -35.58266830444336, "global_step": 51095, "epoch": 422} {"train_loss": -35.36959457397461, "global_step": 51096, "epoch": 422} {"train_loss": -35.82414627075195, "global_step": 51097, "epoch": 422} {"train_loss": -35.101253509521484, "global_step": 51098, "epoch": 422} {"train_loss": -35.738121032714844, "global_step": 51099, "epoch": 422} {"train_loss": -35.354976654052734, "global_step": 51100, "epoch": 422} {"train_loss": -35.11104965209961, "global_step": 51101, "epoch": 422} {"train_loss": -34.783470153808594, "global_step": 51102, "epoch": 422} {"train_loss": -35.73212814331055, "global_step": 51103, "epoch": 422} {"train_loss": -35.680030822753906, "global_step": 51104, "epoch": 422} {"train_loss": -35.83688735961914, "global_step": 51105, "epoch": 422} {"train_loss": -36.019195556640625, "global_step": 51106, "epoch": 422} {"train_loss": -35.438148498535156, "global_step": 51107, "epoch": 422} {"train_loss": -35.83313751220703, "global_step": 51108, "epoch": 422} {"train_loss": -35.524627685546875, "global_step": 51109, "epoch": 422} {"train_loss": -35.615352630615234, "global_step": 51110, "epoch": 422} {"train_loss": -35.56705856323242, "global_step": 51111, "epoch": 422} {"train_loss": -34.477291107177734, "global_step": 51112, "epoch": 422} {"train_loss": -34.98114776611328, "global_step": 51113, "epoch": 422} {"train_loss": -34.13776779174805, "global_step": 51114, "epoch": 422} {"train_loss": -33.18003463745117, "global_step": 51115, "epoch": 422} {"train_loss": -35.11023712158203, "global_step": 51116, "epoch": 422} {"train_loss": -35.02250289916992, "global_step": 51117, "epoch": 422} {"train_loss": -32.96683883666992, "global_step": 51118, "epoch": 422} {"train_loss": -34.05919647216797, "global_step": 51119, "epoch": 422} {"train_loss": -35.222164154052734, "global_step": 51120, "epoch": 422} {"train_loss": -33.98228073120117, "global_step": 51121, "epoch": 422} {"train_loss": -33.15970230102539, "global_step": 51122, "epoch": 422} {"train_loss": -35.312042236328125, "global_step": 51123, "epoch": 422} {"train_loss": -34.42924880981445, "global_step": 51124, "epoch": 422} {"train_loss": -34.906551361083984, "global_step": 51125, "epoch": 422} {"train_loss": -33.61664581298828, "global_step": 51126, "epoch": 422} {"train_loss": -34.1081657409668, "global_step": 51127, "epoch": 422} {"train_loss": -33.22876739501953, "global_step": 51128, "epoch": 422} {"train_loss": -33.79238510131836, "global_step": 51129, "epoch": 422} {"train_loss": -33.81524658203125, "global_step": 51130, "epoch": 422} {"train_loss": -33.930267333984375, "global_step": 51131, "epoch": 422} {"train_loss": -33.43561553955078, "global_step": 51132, "epoch": 422} {"train_loss": -32.00320053100586, "global_step": 51133, "epoch": 422} {"train_loss": -30.753610610961914, "global_step": 51134, "epoch": 422} {"train_loss": -32.56997299194336, "global_step": 51135, "epoch": 422} {"train_loss": -29.361175537109375, "global_step": 51136, "epoch": 422} {"train_loss": -21.866708755493164, "global_step": 51137, "epoch": 422} {"train_loss": -28.202880859375, "global_step": 51138, "epoch": 422} {"train_loss": -9.556278228759766, "global_step": 51139, "epoch": 422} {"train_loss": 8.291511535644531, "global_step": 51140, "epoch": 422} {"train_loss": -1.488211989402771, "global_step": 51141, "epoch": 422} {"train_loss": -30.017179489135742, "global_step": 51142, "epoch": 422} {"train_loss": 22.117618560791016, "global_step": 51143, "epoch": 422} {"train_loss": -8.322842597961426, "global_step": 51144, "epoch": 422} {"train_loss": -31.490758895874023, "global_step": 51145, "epoch": 422} {"train_loss": -25.835973739624023, "global_step": 51146, "epoch": 422} {"train_loss": -16.480497360229492, "global_step": 51147, "epoch": 422} {"train_loss": -10.234628677368164, "global_step": 51148, "epoch": 422} {"train_loss": -26.5489444732666, "global_step": 51149, "epoch": 422} {"train_loss": -29.713468551635742, "global_step": 51150, "epoch": 422} {"train_loss": -31.99812126159668, "global_step": 51151, "epoch": 422} {"train_loss": -32.695411682128906, "global_step": 51152, "epoch": 422} {"train_loss": -32.010406494140625, "global_step": 51153, "epoch": 422} {"train_loss": -29.75623893737793, "global_step": 51154, "epoch": 422} {"train_loss": -31.307418823242188, "global_step": 51155, "epoch": 422} {"train_loss": -29.737985610961914, "global_step": 51156, "epoch": 422} {"train_loss": -28.966367721557617, "global_step": 51157, "epoch": 422} {"train_loss": -30.666196823120117, "global_step": 51158, "epoch": 422} {"train_loss": -30.475305557250977, "global_step": 51159, "epoch": 422} {"train_loss": -31.4328670501709, "global_step": 51160, "epoch": 422} {"train_loss": -32.011470794677734, "global_step": 51161, "epoch": 422} {"train_loss": -32.12142562866211, "global_step": 51162, "epoch": 422} {"train_loss": -32.029541015625, "global_step": 51163, "epoch": 422} {"train_loss": -33.021507263183594, "global_step": 51164, "epoch": 422} {"train_loss": -33.2093505859375, "global_step": 51165, "epoch": 422} {"train_loss": -32.8787841796875, "global_step": 51166, "epoch": 422} {"train_loss": -32.444393157958984, "global_step": 51167, "epoch": 422} {"train_loss": -33.25057601928711, "global_step": 51168, "epoch": 422} {"train_loss": -32.84185791015625, "global_step": 51169, "epoch": 422} {"train_loss": -33.233314514160156, "global_step": 51170, "epoch": 422} {"train_loss": -33.10345458984375, "global_step": 51171, "epoch": 422} {"train_loss": -33.35475540161133, "global_step": 51172, "epoch": 422} {"train_loss": -33.245357513427734, "global_step": 51173, "epoch": 422} {"train_loss": -33.39141845703125, "global_step": 51174, "epoch": 422} {"train_loss": -33.83545684814453, "global_step": 51175, "epoch": 422} {"train_loss": -33.60068893432617, "global_step": 51176, "epoch": 422} {"train_loss": -33.97658920288086, "global_step": 51177, "epoch": 422} {"train_loss": -33.994075775146484, "global_step": 51178, "epoch": 422} {"train_loss": -33.7667121887207, "global_step": 51179, "epoch": 422} {"train_loss": -33.79792404174805, "global_step": 51180, "epoch": 422} {"train_loss": -33.69182205200195, "global_step": 51181, "epoch": 422} {"train_loss": -31.493331092448273, "global_step": 51182, "epoch": 422, "val_loss": 2653563.0} {"train_loss": -34.25989532470703, "global_step": 51183, "epoch": 423} {"train_loss": -34.40595626831055, "global_step": 51184, "epoch": 423} {"train_loss": -33.41753005981445, "global_step": 51185, "epoch": 423} {"train_loss": -34.356117248535156, "global_step": 51186, "epoch": 423} {"train_loss": -34.26798629760742, "global_step": 51187, "epoch": 423} {"train_loss": -34.697113037109375, "global_step": 51188, "epoch": 423} {"train_loss": -34.20539474487305, "global_step": 51189, "epoch": 423} {"train_loss": -34.96661376953125, "global_step": 51190, "epoch": 423} {"train_loss": -35.16632843017578, "global_step": 51191, "epoch": 423} {"train_loss": -34.64213562011719, "global_step": 51192, "epoch": 423} {"train_loss": -34.82670593261719, "global_step": 51193, "epoch": 423} {"train_loss": -34.72990036010742, "global_step": 51194, "epoch": 423} {"train_loss": -34.68728256225586, "global_step": 51195, "epoch": 423} {"train_loss": -35.219764709472656, "global_step": 51196, "epoch": 423} {"train_loss": -35.37949752807617, "global_step": 51197, "epoch": 423} {"train_loss": -35.003273010253906, "global_step": 51198, "epoch": 423} {"train_loss": -35.194183349609375, "global_step": 51199, "epoch": 423} {"train_loss": -35.10311508178711, "global_step": 51200, "epoch": 423} {"train_loss": -34.502235412597656, "global_step": 51201, "epoch": 423} {"train_loss": -35.17360305786133, "global_step": 51202, "epoch": 423} {"train_loss": -35.49840545654297, "global_step": 51203, "epoch": 423} {"train_loss": -35.196773529052734, "global_step": 51204, "epoch": 423} {"train_loss": -35.633846282958984, "global_step": 51205, "epoch": 423} {"train_loss": -35.0615234375, "global_step": 51206, "epoch": 423} {"train_loss": -35.5962028503418, "global_step": 51207, "epoch": 423} {"train_loss": -35.59444046020508, "global_step": 51208, "epoch": 423} {"train_loss": -35.590728759765625, "global_step": 51209, "epoch": 423} {"train_loss": -35.526588439941406, "global_step": 51210, "epoch": 423} {"train_loss": -36.17814254760742, "global_step": 51211, "epoch": 423} {"train_loss": -35.18544387817383, "global_step": 51212, "epoch": 423} {"train_loss": -34.547088623046875, "global_step": 51213, "epoch": 423} {"train_loss": -35.49288558959961, "global_step": 51214, "epoch": 423} {"train_loss": -35.62173080444336, "global_step": 51215, "epoch": 423} {"train_loss": -35.569496154785156, "global_step": 51216, "epoch": 423} {"train_loss": -35.69717025756836, "global_step": 51217, "epoch": 423} {"train_loss": -35.47291564941406, "global_step": 51218, "epoch": 423} {"train_loss": -35.78152084350586, "global_step": 51219, "epoch": 423} {"train_loss": -34.878746032714844, "global_step": 51220, "epoch": 423} {"train_loss": -33.60662841796875, "global_step": 51221, "epoch": 423} {"train_loss": -34.61237716674805, "global_step": 51222, "epoch": 423} {"train_loss": -35.50849151611328, "global_step": 51223, "epoch": 423} {"train_loss": -35.82326126098633, "global_step": 51224, "epoch": 423} {"train_loss": -35.48575973510742, "global_step": 51225, "epoch": 423} {"train_loss": -34.65348434448242, "global_step": 51226, "epoch": 423} {"train_loss": -32.67409896850586, "global_step": 51227, "epoch": 423} {"train_loss": -31.42664909362793, "global_step": 51228, "epoch": 423} {"train_loss": -33.982059478759766, "global_step": 51229, "epoch": 423} {"train_loss": -34.88829040527344, "global_step": 51230, "epoch": 423} {"train_loss": -33.82157516479492, "global_step": 51231, "epoch": 423} {"train_loss": -34.65439987182617, "global_step": 51232, "epoch": 423} {"train_loss": -33.636104583740234, "global_step": 51233, "epoch": 423} {"train_loss": -34.7953987121582, "global_step": 51234, "epoch": 423} {"train_loss": -34.798797607421875, "global_step": 51235, "epoch": 423} {"train_loss": -34.61044692993164, "global_step": 51236, "epoch": 423} {"train_loss": -34.527626037597656, "global_step": 51237, "epoch": 423} {"train_loss": -35.125648498535156, "global_step": 51238, "epoch": 423} {"train_loss": -34.913230895996094, "global_step": 51239, "epoch": 423} {"train_loss": -33.889381408691406, "global_step": 51240, "epoch": 423} {"train_loss": -33.9588508605957, "global_step": 51241, "epoch": 423} {"train_loss": -34.092220306396484, "global_step": 51242, "epoch": 423} {"train_loss": -35.006771087646484, "global_step": 51243, "epoch": 423} {"train_loss": -33.67920684814453, "global_step": 51244, "epoch": 423} {"train_loss": -33.84544372558594, "global_step": 51245, "epoch": 423} {"train_loss": -34.77620315551758, "global_step": 51246, "epoch": 423} {"train_loss": -35.562984466552734, "global_step": 51247, "epoch": 423} {"train_loss": -33.62656784057617, "global_step": 51248, "epoch": 423} {"train_loss": -32.91875076293945, "global_step": 51249, "epoch": 423} {"train_loss": -33.160987854003906, "global_step": 51250, "epoch": 423} {"train_loss": -34.86488723754883, "global_step": 51251, "epoch": 423} {"train_loss": -34.7988395690918, "global_step": 51252, "epoch": 423} {"train_loss": -34.425106048583984, "global_step": 51253, "epoch": 423} {"train_loss": -35.22823715209961, "global_step": 51254, "epoch": 423} {"train_loss": -35.158016204833984, "global_step": 51255, "epoch": 423} {"train_loss": -34.62481689453125, "global_step": 51256, "epoch": 423} {"train_loss": -35.59404754638672, "global_step": 51257, "epoch": 423} {"train_loss": -35.23607635498047, "global_step": 51258, "epoch": 423} {"train_loss": -35.77654266357422, "global_step": 51259, "epoch": 423} {"train_loss": -35.336151123046875, "global_step": 51260, "epoch": 423} {"train_loss": -35.1762580871582, "global_step": 51261, "epoch": 423} {"train_loss": -35.214149475097656, "global_step": 51262, "epoch": 423} {"train_loss": -35.6572265625, "global_step": 51263, "epoch": 423} {"train_loss": -35.02873611450195, "global_step": 51264, "epoch": 423} {"train_loss": -35.53160095214844, "global_step": 51265, "epoch": 423} {"train_loss": -35.660377502441406, "global_step": 51266, "epoch": 423} {"train_loss": -34.8111457824707, "global_step": 51267, "epoch": 423} {"train_loss": -35.21120834350586, "global_step": 51268, "epoch": 423} {"train_loss": -35.00516891479492, "global_step": 51269, "epoch": 423} {"train_loss": -34.32496643066406, "global_step": 51270, "epoch": 423} {"train_loss": -34.63429641723633, "global_step": 51271, "epoch": 423} {"train_loss": -35.267879486083984, "global_step": 51272, "epoch": 423} {"train_loss": -35.19350051879883, "global_step": 51273, "epoch": 423} {"train_loss": -34.31120681762695, "global_step": 51274, "epoch": 423} {"train_loss": -33.359981536865234, "global_step": 51275, "epoch": 423} {"train_loss": -33.5687255859375, "global_step": 51276, "epoch": 423} {"train_loss": -33.72896194458008, "global_step": 51277, "epoch": 423} {"train_loss": -33.3148078918457, "global_step": 51278, "epoch": 423} {"train_loss": -34.23916244506836, "global_step": 51279, "epoch": 423} {"train_loss": -35.2155876159668, "global_step": 51280, "epoch": 423} {"train_loss": -32.48897933959961, "global_step": 51281, "epoch": 423} {"train_loss": -29.34442710876465, "global_step": 51282, "epoch": 423} {"train_loss": -27.39985466003418, "global_step": 51283, "epoch": 423} {"train_loss": -28.8786563873291, "global_step": 51284, "epoch": 423} {"train_loss": -35.05604934692383, "global_step": 51285, "epoch": 423} {"train_loss": -32.15317916870117, "global_step": 51286, "epoch": 423} {"train_loss": -28.532550811767578, "global_step": 51287, "epoch": 423} {"train_loss": -34.4720458984375, "global_step": 51288, "epoch": 423} {"train_loss": -30.02667236328125, "global_step": 51289, "epoch": 423} {"train_loss": -32.30827713012695, "global_step": 51290, "epoch": 423} {"train_loss": -33.375911712646484, "global_step": 51291, "epoch": 423} {"train_loss": -33.848079681396484, "global_step": 51292, "epoch": 423} {"train_loss": -33.3487434387207, "global_step": 51293, "epoch": 423} {"train_loss": -34.09397506713867, "global_step": 51294, "epoch": 423} {"train_loss": -31.879613876342773, "global_step": 51295, "epoch": 423} {"train_loss": -33.548667907714844, "global_step": 51296, "epoch": 423} {"train_loss": -33.842803955078125, "global_step": 51297, "epoch": 423} {"train_loss": -34.43496322631836, "global_step": 51298, "epoch": 423} {"train_loss": -34.50242233276367, "global_step": 51299, "epoch": 423} {"train_loss": -33.38528823852539, "global_step": 51300, "epoch": 423} {"train_loss": -34.817420959472656, "global_step": 51301, "epoch": 423} {"train_loss": -34.29704666137695, "global_step": 51302, "epoch": 423} {"train_loss": -34.34937341548195, "global_step": 51303, "epoch": 423, "val_loss": 2599403.5} {"train_loss": -34.92124557495117, "global_step": 51304, "epoch": 424} {"train_loss": -34.272056579589844, "global_step": 51305, "epoch": 424} {"train_loss": -34.520931243896484, "global_step": 51306, "epoch": 424} {"train_loss": -34.281368255615234, "global_step": 51307, "epoch": 424} {"train_loss": -34.24467468261719, "global_step": 51308, "epoch": 424} {"train_loss": -34.95370101928711, "global_step": 51309, "epoch": 424} {"train_loss": -34.68506622314453, "global_step": 51310, "epoch": 424} {"train_loss": -34.83905792236328, "global_step": 51311, "epoch": 424} {"train_loss": -34.82121276855469, "global_step": 51312, "epoch": 424} {"train_loss": -35.140254974365234, "global_step": 51313, "epoch": 424} {"train_loss": -34.926971435546875, "global_step": 51314, "epoch": 424} {"train_loss": -35.09487533569336, "global_step": 51315, "epoch": 424} {"train_loss": -35.04122543334961, "global_step": 51316, "epoch": 424} {"train_loss": -34.99168014526367, "global_step": 51317, "epoch": 424} {"train_loss": -35.48653793334961, "global_step": 51318, "epoch": 424} {"train_loss": -35.35722732543945, "global_step": 51319, "epoch": 424} {"train_loss": -35.409847259521484, "global_step": 51320, "epoch": 424} {"train_loss": -35.66666793823242, "global_step": 51321, "epoch": 424} {"train_loss": -35.46967697143555, "global_step": 51322, "epoch": 424} {"train_loss": -34.95216369628906, "global_step": 51323, "epoch": 424} {"train_loss": -35.180938720703125, "global_step": 51324, "epoch": 424} {"train_loss": -35.12007522583008, "global_step": 51325, "epoch": 424} {"train_loss": -35.757259368896484, "global_step": 51326, "epoch": 424} {"train_loss": -35.66575241088867, "global_step": 51327, "epoch": 424} {"train_loss": -35.083099365234375, "global_step": 51328, "epoch": 424} {"train_loss": -34.15634536743164, "global_step": 51329, "epoch": 424} {"train_loss": -32.812557220458984, "global_step": 51330, "epoch": 424} {"train_loss": -32.047340393066406, "global_step": 51331, "epoch": 424} {"train_loss": -32.869232177734375, "global_step": 51332, "epoch": 424} {"train_loss": -33.81832504272461, "global_step": 51333, "epoch": 424} {"train_loss": -35.251800537109375, "global_step": 51334, "epoch": 424} {"train_loss": -35.34641647338867, "global_step": 51335, "epoch": 424} {"train_loss": -34.14565658569336, "global_step": 51336, "epoch": 424} {"train_loss": -33.425270080566406, "global_step": 51337, "epoch": 424} {"train_loss": -34.384674072265625, "global_step": 51338, "epoch": 424} {"train_loss": -35.17824935913086, "global_step": 51339, "epoch": 424} {"train_loss": -33.761329650878906, "global_step": 51340, "epoch": 424} {"train_loss": -34.000274658203125, "global_step": 51341, "epoch": 424} {"train_loss": -33.693199157714844, "global_step": 51342, "epoch": 424} {"train_loss": -34.2342414855957, "global_step": 51343, "epoch": 424} {"train_loss": -34.921844482421875, "global_step": 51344, "epoch": 424} {"train_loss": -33.628936767578125, "global_step": 51345, "epoch": 424} {"train_loss": -32.683143615722656, "global_step": 51346, "epoch": 424} {"train_loss": -32.29784393310547, "global_step": 51347, "epoch": 424} {"train_loss": -35.271854400634766, "global_step": 51348, "epoch": 424} {"train_loss": -33.363861083984375, "global_step": 51349, "epoch": 424} {"train_loss": -34.12461471557617, "global_step": 51350, "epoch": 424} {"train_loss": -34.90300750732422, "global_step": 51351, "epoch": 424} {"train_loss": -34.60047912597656, "global_step": 51352, "epoch": 424} {"train_loss": -34.860225677490234, "global_step": 51353, "epoch": 424} {"train_loss": -35.6056022644043, "global_step": 51354, "epoch": 424} {"train_loss": -34.88200759887695, "global_step": 51355, "epoch": 424} {"train_loss": -35.39974594116211, "global_step": 51356, "epoch": 424} {"train_loss": -34.502723693847656, "global_step": 51357, "epoch": 424} {"train_loss": -35.057708740234375, "global_step": 51358, "epoch": 424} {"train_loss": -34.872859954833984, "global_step": 51359, "epoch": 424} {"train_loss": -34.69942092895508, "global_step": 51360, "epoch": 424} {"train_loss": -34.967708587646484, "global_step": 51361, "epoch": 424} {"train_loss": -34.82221603393555, "global_step": 51362, "epoch": 424} {"train_loss": -35.23788833618164, "global_step": 51363, "epoch": 424} {"train_loss": -34.10987854003906, "global_step": 51364, "epoch": 424} {"train_loss": -35.381778717041016, "global_step": 51365, "epoch": 424} {"train_loss": -35.60651397705078, "global_step": 51366, "epoch": 424} {"train_loss": -34.661155700683594, "global_step": 51367, "epoch": 424} {"train_loss": -34.79933166503906, "global_step": 51368, "epoch": 424} {"train_loss": -35.776790618896484, "global_step": 51369, "epoch": 424} {"train_loss": -35.3431510925293, "global_step": 51370, "epoch": 424} {"train_loss": -35.16887283325195, "global_step": 51371, "epoch": 424} {"train_loss": -35.901058197021484, "global_step": 51372, "epoch": 424} {"train_loss": -34.72434616088867, "global_step": 51373, "epoch": 424} {"train_loss": -35.03328323364258, "global_step": 51374, "epoch": 424} {"train_loss": -35.80427932739258, "global_step": 51375, "epoch": 424} {"train_loss": -34.805416107177734, "global_step": 51376, "epoch": 424} {"train_loss": -34.860477447509766, "global_step": 51377, "epoch": 424} {"train_loss": -34.99696731567383, "global_step": 51378, "epoch": 424} {"train_loss": -34.478126525878906, "global_step": 51379, "epoch": 424} {"train_loss": -35.96372985839844, "global_step": 51380, "epoch": 424} {"train_loss": -35.88178253173828, "global_step": 51381, "epoch": 424} {"train_loss": -34.42220687866211, "global_step": 51382, "epoch": 424} {"train_loss": -34.428138732910156, "global_step": 51383, "epoch": 424} {"train_loss": -33.69281768798828, "global_step": 51384, "epoch": 424} {"train_loss": -32.924537658691406, "global_step": 51385, "epoch": 424} {"train_loss": -33.84101867675781, "global_step": 51386, "epoch": 424} {"train_loss": -35.00257110595703, "global_step": 51387, "epoch": 424} {"train_loss": -35.41628646850586, "global_step": 51388, "epoch": 424} {"train_loss": -34.813838958740234, "global_step": 51389, "epoch": 424} {"train_loss": -35.30093002319336, "global_step": 51390, "epoch": 424} {"train_loss": -33.59840774536133, "global_step": 51391, "epoch": 424} {"train_loss": -34.95989227294922, "global_step": 51392, "epoch": 424} {"train_loss": -35.236167907714844, "global_step": 51393, "epoch": 424} {"train_loss": -34.559417724609375, "global_step": 51394, "epoch": 424} {"train_loss": -35.01801681518555, "global_step": 51395, "epoch": 424} {"train_loss": -35.078834533691406, "global_step": 51396, "epoch": 424} {"train_loss": -35.12367248535156, "global_step": 51397, "epoch": 424} {"train_loss": -34.64425277709961, "global_step": 51398, "epoch": 424} {"train_loss": -35.780147552490234, "global_step": 51399, "epoch": 424} {"train_loss": -35.1745719909668, "global_step": 51400, "epoch": 424} {"train_loss": -35.62329864501953, "global_step": 51401, "epoch": 424} {"train_loss": -35.40346908569336, "global_step": 51402, "epoch": 424} {"train_loss": -35.701778411865234, "global_step": 51403, "epoch": 424} {"train_loss": -34.9576301574707, "global_step": 51404, "epoch": 424} {"train_loss": -35.93134307861328, "global_step": 51405, "epoch": 424} {"train_loss": -35.60970687866211, "global_step": 51406, "epoch": 424} {"train_loss": -35.288570404052734, "global_step": 51407, "epoch": 424} {"train_loss": -35.10367202758789, "global_step": 51408, "epoch": 424} {"train_loss": -35.80282974243164, "global_step": 51409, "epoch": 424} {"train_loss": -35.213260650634766, "global_step": 51410, "epoch": 424} {"train_loss": -34.67317581176758, "global_step": 51411, "epoch": 424} {"train_loss": -35.70693588256836, "global_step": 51412, "epoch": 424} {"train_loss": -35.4012451171875, "global_step": 51413, "epoch": 424} {"train_loss": -35.04312515258789, "global_step": 51414, "epoch": 424} {"train_loss": -34.93242645263672, "global_step": 51415, "epoch": 424} {"train_loss": -35.468631744384766, "global_step": 51416, "epoch": 424} {"train_loss": -35.796051025390625, "global_step": 51417, "epoch": 424} {"train_loss": -35.02970504760742, "global_step": 51418, "epoch": 424} {"train_loss": -35.23613739013672, "global_step": 51419, "epoch": 424} {"train_loss": -35.293209075927734, "global_step": 51420, "epoch": 424} {"train_loss": -34.63043212890625, "global_step": 51421, "epoch": 424} {"train_loss": -34.55582809448242, "global_step": 51422, "epoch": 424} {"train_loss": -33.56397247314453, "global_step": 51423, "epoch": 424} {"train_loss": -34.79238133391073, "global_step": 51424, "epoch": 424, "val_loss": 2674505.0} {"train_loss": -31.002334594726562, "global_step": 51425, "epoch": 425} {"train_loss": -32.63338088989258, "global_step": 51426, "epoch": 425} {"train_loss": -35.41579055786133, "global_step": 51427, "epoch": 425} {"train_loss": -34.7642936706543, "global_step": 51428, "epoch": 425} {"train_loss": -34.32633590698242, "global_step": 51429, "epoch": 425} {"train_loss": -35.07711410522461, "global_step": 51430, "epoch": 425} {"train_loss": -35.31167984008789, "global_step": 51431, "epoch": 425} {"train_loss": -34.54719924926758, "global_step": 51432, "epoch": 425} {"train_loss": -32.8745002746582, "global_step": 51433, "epoch": 425} {"train_loss": -34.15067672729492, "global_step": 51434, "epoch": 425} {"train_loss": -33.67822265625, "global_step": 51435, "epoch": 425} {"train_loss": -34.62413024902344, "global_step": 51436, "epoch": 425} {"train_loss": -34.956363677978516, "global_step": 51437, "epoch": 425} {"train_loss": -34.17408752441406, "global_step": 51438, "epoch": 425} {"train_loss": -34.62400817871094, "global_step": 51439, "epoch": 425} {"train_loss": -35.05982208251953, "global_step": 51440, "epoch": 425} {"train_loss": -34.61825180053711, "global_step": 51441, "epoch": 425} {"train_loss": -34.66010284423828, "global_step": 51442, "epoch": 425} {"train_loss": -34.62876510620117, "global_step": 51443, "epoch": 425} {"train_loss": -35.35619354248047, "global_step": 51444, "epoch": 425} {"train_loss": -34.650054931640625, "global_step": 51445, "epoch": 425} {"train_loss": -35.233489990234375, "global_step": 51446, "epoch": 425} {"train_loss": -34.995479583740234, "global_step": 51447, "epoch": 425} {"train_loss": -35.3807373046875, "global_step": 51448, "epoch": 425} {"train_loss": -35.3850212097168, "global_step": 51449, "epoch": 425} {"train_loss": -34.5938835144043, "global_step": 51450, "epoch": 425} {"train_loss": -34.96883773803711, "global_step": 51451, "epoch": 425} {"train_loss": -34.94554901123047, "global_step": 51452, "epoch": 425} {"train_loss": -36.19411849975586, "global_step": 51453, "epoch": 425} {"train_loss": -35.35542678833008, "global_step": 51454, "epoch": 425} {"train_loss": -35.36886215209961, "global_step": 51455, "epoch": 425} {"train_loss": -35.62209701538086, "global_step": 51456, "epoch": 425} {"train_loss": -35.340736389160156, "global_step": 51457, "epoch": 425} {"train_loss": -35.500343322753906, "global_step": 51458, "epoch": 425} {"train_loss": -35.77853775024414, "global_step": 51459, "epoch": 425} {"train_loss": -35.7613525390625, "global_step": 51460, "epoch": 425} {"train_loss": -35.74012756347656, "global_step": 51461, "epoch": 425} {"train_loss": -35.47553634643555, "global_step": 51462, "epoch": 425} {"train_loss": -35.38486862182617, "global_step": 51463, "epoch": 425} {"train_loss": -34.173866271972656, "global_step": 51464, "epoch": 425} {"train_loss": -34.855690002441406, "global_step": 51465, "epoch": 425} {"train_loss": -35.666561126708984, "global_step": 51466, "epoch": 425} {"train_loss": -35.515663146972656, "global_step": 51467, "epoch": 425} {"train_loss": -34.953033447265625, "global_step": 51468, "epoch": 425} {"train_loss": -35.54812240600586, "global_step": 51469, "epoch": 425} {"train_loss": -34.47536849975586, "global_step": 51470, "epoch": 425} {"train_loss": -35.61020278930664, "global_step": 51471, "epoch": 425} {"train_loss": -34.7321891784668, "global_step": 51472, "epoch": 425} {"train_loss": -35.16078567504883, "global_step": 51473, "epoch": 425} {"train_loss": -35.05475997924805, "global_step": 51474, "epoch": 425} {"train_loss": -33.94242858886719, "global_step": 51475, "epoch": 425} {"train_loss": -34.99831771850586, "global_step": 51476, "epoch": 425} {"train_loss": -35.54618453979492, "global_step": 51477, "epoch": 425} {"train_loss": -34.15880584716797, "global_step": 51478, "epoch": 425} {"train_loss": -34.21578598022461, "global_step": 51479, "epoch": 425} {"train_loss": -34.50970458984375, "global_step": 51480, "epoch": 425} {"train_loss": -34.81294631958008, "global_step": 51481, "epoch": 425} {"train_loss": -34.21055221557617, "global_step": 51482, "epoch": 425} {"train_loss": -31.098236083984375, "global_step": 51483, "epoch": 425} {"train_loss": -34.90910720825195, "global_step": 51484, "epoch": 425} {"train_loss": -33.484046936035156, "global_step": 51485, "epoch": 425} {"train_loss": -33.618324279785156, "global_step": 51486, "epoch": 425} {"train_loss": -33.76360321044922, "global_step": 51487, "epoch": 425} {"train_loss": -32.20963668823242, "global_step": 51488, "epoch": 425} {"train_loss": -34.639217376708984, "global_step": 51489, "epoch": 425} {"train_loss": -33.18935775756836, "global_step": 51490, "epoch": 425} {"train_loss": -32.99015808105469, "global_step": 51491, "epoch": 425} {"train_loss": -34.384254455566406, "global_step": 51492, "epoch": 425} {"train_loss": -34.040523529052734, "global_step": 51493, "epoch": 425} {"train_loss": -34.91587448120117, "global_step": 51494, "epoch": 425} {"train_loss": -34.09169006347656, "global_step": 51495, "epoch": 425} {"train_loss": -33.34695053100586, "global_step": 51496, "epoch": 425} {"train_loss": -34.375179290771484, "global_step": 51497, "epoch": 425} {"train_loss": -34.122047424316406, "global_step": 51498, "epoch": 425} {"train_loss": -34.18270492553711, "global_step": 51499, "epoch": 425} {"train_loss": -34.41329574584961, "global_step": 51500, "epoch": 425} {"train_loss": -34.404232025146484, "global_step": 51501, "epoch": 425} {"train_loss": -34.841156005859375, "global_step": 51502, "epoch": 425} {"train_loss": -35.12688064575195, "global_step": 51503, "epoch": 425} {"train_loss": -35.06862258911133, "global_step": 51504, "epoch": 425} {"train_loss": -35.33500289916992, "global_step": 51505, "epoch": 425} {"train_loss": -34.63368606567383, "global_step": 51506, "epoch": 425} {"train_loss": -35.140037536621094, "global_step": 51507, "epoch": 425} {"train_loss": -35.381980895996094, "global_step": 51508, "epoch": 425} {"train_loss": -35.30224609375, "global_step": 51509, "epoch": 425} {"train_loss": -34.98177719116211, "global_step": 51510, "epoch": 425} {"train_loss": -35.11289596557617, "global_step": 51511, "epoch": 425} {"train_loss": -35.640785217285156, "global_step": 51512, "epoch": 425} {"train_loss": -35.20640182495117, "global_step": 51513, "epoch": 425} {"train_loss": -35.342926025390625, "global_step": 51514, "epoch": 425} {"train_loss": -35.47595977783203, "global_step": 51515, "epoch": 425} {"train_loss": -35.54664611816406, "global_step": 51516, "epoch": 425} {"train_loss": -35.10808181762695, "global_step": 51517, "epoch": 425} {"train_loss": -35.454200744628906, "global_step": 51518, "epoch": 425} {"train_loss": -35.60169219970703, "global_step": 51519, "epoch": 425} {"train_loss": -35.74755859375, "global_step": 51520, "epoch": 425} {"train_loss": -35.891456604003906, "global_step": 51521, "epoch": 425} {"train_loss": -35.57194137573242, "global_step": 51522, "epoch": 425} {"train_loss": -35.629817962646484, "global_step": 51523, "epoch": 425} {"train_loss": -36.32057571411133, "global_step": 51524, "epoch": 425} {"train_loss": -35.40134811401367, "global_step": 51525, "epoch": 425} {"train_loss": -34.774044036865234, "global_step": 51526, "epoch": 425} {"train_loss": -35.853851318359375, "global_step": 51527, "epoch": 425} {"train_loss": -35.64919662475586, "global_step": 51528, "epoch": 425} {"train_loss": -35.562049865722656, "global_step": 51529, "epoch": 425} {"train_loss": -35.19669723510742, "global_step": 51530, "epoch": 425} {"train_loss": -34.87837219238281, "global_step": 51531, "epoch": 425} {"train_loss": -35.14506912231445, "global_step": 51532, "epoch": 425} {"train_loss": -35.172183990478516, "global_step": 51533, "epoch": 425} {"train_loss": -34.96760177612305, "global_step": 51534, "epoch": 425} {"train_loss": -34.65519714355469, "global_step": 51535, "epoch": 425} {"train_loss": -35.9372673034668, "global_step": 51536, "epoch": 425} {"train_loss": -35.25565719604492, "global_step": 51537, "epoch": 425} {"train_loss": -35.08313751220703, "global_step": 51538, "epoch": 425} {"train_loss": -35.18119430541992, "global_step": 51539, "epoch": 425} {"train_loss": -34.77381896972656, "global_step": 51540, "epoch": 425} {"train_loss": -33.67353439331055, "global_step": 51541, "epoch": 425} {"train_loss": -34.09845733642578, "global_step": 51542, "epoch": 425} {"train_loss": -32.67451858520508, "global_step": 51543, "epoch": 425} {"train_loss": -33.49903869628906, "global_step": 51544, "epoch": 425} {"train_loss": -34.7604680967725, "global_step": 51545, "epoch": 425, "val_loss": 2554429.0} {"train_loss": -30.791181564331055, "global_step": 51546, "epoch": 426} {"train_loss": -32.744415283203125, "global_step": 51547, "epoch": 426} {"train_loss": -34.1535758972168, "global_step": 51548, "epoch": 426} {"train_loss": -32.08266830444336, "global_step": 51549, "epoch": 426} {"train_loss": -32.11323928833008, "global_step": 51550, "epoch": 426} {"train_loss": -30.006362915039062, "global_step": 51551, "epoch": 426} {"train_loss": -35.83283615112305, "global_step": 51552, "epoch": 426} {"train_loss": -32.81148910522461, "global_step": 51553, "epoch": 426} {"train_loss": -35.1272087097168, "global_step": 51554, "epoch": 426} {"train_loss": -33.59296417236328, "global_step": 51555, "epoch": 426} {"train_loss": -35.268516540527344, "global_step": 51556, "epoch": 426} {"train_loss": -33.11465072631836, "global_step": 51557, "epoch": 426} {"train_loss": -35.78279495239258, "global_step": 51558, "epoch": 426} {"train_loss": -34.41195297241211, "global_step": 51559, "epoch": 426} {"train_loss": -35.64954376220703, "global_step": 51560, "epoch": 426} {"train_loss": -34.351959228515625, "global_step": 51561, "epoch": 426} {"train_loss": -35.083343505859375, "global_step": 51562, "epoch": 426} {"train_loss": -35.09955978393555, "global_step": 51563, "epoch": 426} {"train_loss": -35.53140640258789, "global_step": 51564, "epoch": 426} {"train_loss": -35.25895309448242, "global_step": 51565, "epoch": 426} {"train_loss": -35.498104095458984, "global_step": 51566, "epoch": 426} {"train_loss": -35.368892669677734, "global_step": 51567, "epoch": 426} {"train_loss": -33.09413146972656, "global_step": 51568, "epoch": 426} {"train_loss": -35.75602340698242, "global_step": 51569, "epoch": 426} {"train_loss": -35.1789665222168, "global_step": 51570, "epoch": 426} {"train_loss": -35.30459213256836, "global_step": 51571, "epoch": 426} {"train_loss": -35.1553955078125, "global_step": 51572, "epoch": 426} {"train_loss": -35.643550872802734, "global_step": 51573, "epoch": 426} {"train_loss": -34.925140380859375, "global_step": 51574, "epoch": 426} {"train_loss": -34.990657806396484, "global_step": 51575, "epoch": 426} {"train_loss": -35.64812088012695, "global_step": 51576, "epoch": 426} {"train_loss": -35.58543014526367, "global_step": 51577, "epoch": 426} {"train_loss": -35.656246185302734, "global_step": 51578, "epoch": 426} {"train_loss": -36.13825607299805, "global_step": 51579, "epoch": 426} {"train_loss": -35.46210861206055, "global_step": 51580, "epoch": 426} {"train_loss": -35.6888542175293, "global_step": 51581, "epoch": 426} {"train_loss": -35.05623245239258, "global_step": 51582, "epoch": 426} {"train_loss": -34.340877532958984, "global_step": 51583, "epoch": 426} {"train_loss": -35.90983581542969, "global_step": 51584, "epoch": 426} {"train_loss": -35.918304443359375, "global_step": 51585, "epoch": 426} {"train_loss": -35.99277877807617, "global_step": 51586, "epoch": 426} {"train_loss": -35.57728958129883, "global_step": 51587, "epoch": 426} {"train_loss": -35.40496826171875, "global_step": 51588, "epoch": 426} {"train_loss": -35.44758987426758, "global_step": 51589, "epoch": 426} {"train_loss": -35.75068283081055, "global_step": 51590, "epoch": 426} {"train_loss": -35.474708557128906, "global_step": 51591, "epoch": 426} {"train_loss": -34.92556381225586, "global_step": 51592, "epoch": 426} {"train_loss": -33.88067626953125, "global_step": 51593, "epoch": 426} {"train_loss": -34.275691986083984, "global_step": 51594, "epoch": 426} {"train_loss": -36.223514556884766, "global_step": 51595, "epoch": 426} {"train_loss": -35.19221878051758, "global_step": 51596, "epoch": 426} {"train_loss": -35.92996597290039, "global_step": 51597, "epoch": 426} {"train_loss": -34.88140869140625, "global_step": 51598, "epoch": 426} {"train_loss": -34.43683624267578, "global_step": 51599, "epoch": 426} {"train_loss": -34.76046371459961, "global_step": 51600, "epoch": 426} {"train_loss": -35.3951416015625, "global_step": 51601, "epoch": 426} {"train_loss": -35.23154830932617, "global_step": 51602, "epoch": 426} {"train_loss": -35.03524398803711, "global_step": 51603, "epoch": 426} {"train_loss": -35.34687042236328, "global_step": 51604, "epoch": 426} {"train_loss": -35.79822540283203, "global_step": 51605, "epoch": 426} {"train_loss": -34.76981735229492, "global_step": 51606, "epoch": 426} {"train_loss": -35.842620849609375, "global_step": 51607, "epoch": 426} {"train_loss": -35.00405502319336, "global_step": 51608, "epoch": 426} {"train_loss": -35.72681427001953, "global_step": 51609, "epoch": 426} {"train_loss": -35.03217697143555, "global_step": 51610, "epoch": 426} {"train_loss": -35.50336837768555, "global_step": 51611, "epoch": 426} {"train_loss": -36.17086410522461, "global_step": 51612, "epoch": 426} {"train_loss": -34.087215423583984, "global_step": 51613, "epoch": 426} {"train_loss": -33.83818435668945, "global_step": 51614, "epoch": 426} {"train_loss": -35.08063507080078, "global_step": 51615, "epoch": 426} {"train_loss": -36.125953674316406, "global_step": 51616, "epoch": 426} {"train_loss": -34.180179595947266, "global_step": 51617, "epoch": 426} {"train_loss": -34.94316482543945, "global_step": 51618, "epoch": 426} {"train_loss": -34.91106033325195, "global_step": 51619, "epoch": 426} {"train_loss": -35.17646026611328, "global_step": 51620, "epoch": 426} {"train_loss": -35.409114837646484, "global_step": 51621, "epoch": 426} {"train_loss": -35.15180587768555, "global_step": 51622, "epoch": 426} {"train_loss": -35.482723236083984, "global_step": 51623, "epoch": 426} {"train_loss": -34.621803283691406, "global_step": 51624, "epoch": 426} {"train_loss": -35.68513870239258, "global_step": 51625, "epoch": 426} {"train_loss": -34.0564079284668, "global_step": 51626, "epoch": 426} {"train_loss": -35.090721130371094, "global_step": 51627, "epoch": 426} {"train_loss": -34.96546173095703, "global_step": 51628, "epoch": 426} {"train_loss": -35.660682678222656, "global_step": 51629, "epoch": 426} {"train_loss": -32.78642654418945, "global_step": 51630, "epoch": 426} {"train_loss": -31.578298568725586, "global_step": 51631, "epoch": 426} {"train_loss": -34.98136520385742, "global_step": 51632, "epoch": 426} {"train_loss": -35.56045150756836, "global_step": 51633, "epoch": 426} {"train_loss": -34.710205078125, "global_step": 51634, "epoch": 426} {"train_loss": -35.19536209106445, "global_step": 51635, "epoch": 426} {"train_loss": -35.80686569213867, "global_step": 51636, "epoch": 426} {"train_loss": -35.168670654296875, "global_step": 51637, "epoch": 426} {"train_loss": -34.331356048583984, "global_step": 51638, "epoch": 426} {"train_loss": -35.144691467285156, "global_step": 51639, "epoch": 426} {"train_loss": -35.795162200927734, "global_step": 51640, "epoch": 426} {"train_loss": -36.19546127319336, "global_step": 51641, "epoch": 426} {"train_loss": -35.46662139892578, "global_step": 51642, "epoch": 426} {"train_loss": -35.473323822021484, "global_step": 51643, "epoch": 426} {"train_loss": -36.051876068115234, "global_step": 51644, "epoch": 426} {"train_loss": -35.644039154052734, "global_step": 51645, "epoch": 426} {"train_loss": -35.861576080322266, "global_step": 51646, "epoch": 426} {"train_loss": -35.7304573059082, "global_step": 51647, "epoch": 426} {"train_loss": -35.9759635925293, "global_step": 51648, "epoch": 426} {"train_loss": -35.50320816040039, "global_step": 51649, "epoch": 426} {"train_loss": -35.91990661621094, "global_step": 51650, "epoch": 426} {"train_loss": -35.48582077026367, "global_step": 51651, "epoch": 426} {"train_loss": -36.16279983520508, "global_step": 51652, "epoch": 426} {"train_loss": -35.96770477294922, "global_step": 51653, "epoch": 426} {"train_loss": -36.032264709472656, "global_step": 51654, "epoch": 426} {"train_loss": -35.34711837768555, "global_step": 51655, "epoch": 426} {"train_loss": -35.28278732299805, "global_step": 51656, "epoch": 426} {"train_loss": -36.002952575683594, "global_step": 51657, "epoch": 426} {"train_loss": -35.77381896972656, "global_step": 51658, "epoch": 426} {"train_loss": -35.15382766723633, "global_step": 51659, "epoch": 426} {"train_loss": -35.81637954711914, "global_step": 51660, "epoch": 426} {"train_loss": -35.4720573425293, "global_step": 51661, "epoch": 426} {"train_loss": -35.7154655456543, "global_step": 51662, "epoch": 426} {"train_loss": -34.08388900756836, "global_step": 51663, "epoch": 426} {"train_loss": -32.26430130004883, "global_step": 51664, "epoch": 426} {"train_loss": -32.455562591552734, "global_step": 51665, "epoch": 426} {"train_loss": -34.9705038464759, "global_step": 51666, "epoch": 426, "val_loss": 2638195.0} {"train_loss": -33.165077209472656, "global_step": 51667, "epoch": 427} {"train_loss": -31.7476863861084, "global_step": 51668, "epoch": 427} {"train_loss": -35.365840911865234, "global_step": 51669, "epoch": 427} {"train_loss": -33.5597038269043, "global_step": 51670, "epoch": 427} {"train_loss": -33.232810974121094, "global_step": 51671, "epoch": 427} {"train_loss": -32.62314987182617, "global_step": 51672, "epoch": 427} {"train_loss": -34.38811111450195, "global_step": 51673, "epoch": 427} {"train_loss": -34.132164001464844, "global_step": 51674, "epoch": 427} {"train_loss": -34.72675704956055, "global_step": 51675, "epoch": 427} {"train_loss": -34.064910888671875, "global_step": 51676, "epoch": 427} {"train_loss": -34.71489334106445, "global_step": 51677, "epoch": 427} {"train_loss": -34.828609466552734, "global_step": 51678, "epoch": 427} {"train_loss": -34.893959045410156, "global_step": 51679, "epoch": 427} {"train_loss": -34.27279281616211, "global_step": 51680, "epoch": 427} {"train_loss": -34.79256057739258, "global_step": 51681, "epoch": 427} {"train_loss": -34.61381530761719, "global_step": 51682, "epoch": 427} {"train_loss": -35.17916488647461, "global_step": 51683, "epoch": 427} {"train_loss": -33.93535232543945, "global_step": 51684, "epoch": 427} {"train_loss": -34.78583526611328, "global_step": 51685, "epoch": 427} {"train_loss": -34.65093994140625, "global_step": 51686, "epoch": 427} {"train_loss": -34.737728118896484, "global_step": 51687, "epoch": 427} {"train_loss": -35.510929107666016, "global_step": 51688, "epoch": 427} {"train_loss": -34.826904296875, "global_step": 51689, "epoch": 427} {"train_loss": -34.84933090209961, "global_step": 51690, "epoch": 427} {"train_loss": -35.27997589111328, "global_step": 51691, "epoch": 427} {"train_loss": -35.144649505615234, "global_step": 51692, "epoch": 427} {"train_loss": -34.63600158691406, "global_step": 51693, "epoch": 427} {"train_loss": -35.6751594543457, "global_step": 51694, "epoch": 427} {"train_loss": -34.790443420410156, "global_step": 51695, "epoch": 427} {"train_loss": -34.40106201171875, "global_step": 51696, "epoch": 427} {"train_loss": -35.46290969848633, "global_step": 51697, "epoch": 427} {"train_loss": -35.17853546142578, "global_step": 51698, "epoch": 427} {"train_loss": -34.400421142578125, "global_step": 51699, "epoch": 427} {"train_loss": -35.35579299926758, "global_step": 51700, "epoch": 427} {"train_loss": -34.568267822265625, "global_step": 51701, "epoch": 427} {"train_loss": -34.45574188232422, "global_step": 51702, "epoch": 427} {"train_loss": -35.914485931396484, "global_step": 51703, "epoch": 427} {"train_loss": -35.399723052978516, "global_step": 51704, "epoch": 427} {"train_loss": -34.941383361816406, "global_step": 51705, "epoch": 427} {"train_loss": -36.13705062866211, "global_step": 51706, "epoch": 427} {"train_loss": -35.12837219238281, "global_step": 51707, "epoch": 427} {"train_loss": -33.33035659790039, "global_step": 51708, "epoch": 427} {"train_loss": -34.0020637512207, "global_step": 51709, "epoch": 427} {"train_loss": -34.172847747802734, "global_step": 51710, "epoch": 427} {"train_loss": -34.03231430053711, "global_step": 51711, "epoch": 427} {"train_loss": -35.29115295410156, "global_step": 51712, "epoch": 427} {"train_loss": -35.28656005859375, "global_step": 51713, "epoch": 427} {"train_loss": -33.39924621582031, "global_step": 51714, "epoch": 427} {"train_loss": -34.7159538269043, "global_step": 51715, "epoch": 427} {"train_loss": -35.3646354675293, "global_step": 51716, "epoch": 427} {"train_loss": -34.55582809448242, "global_step": 51717, "epoch": 427} {"train_loss": -35.09200668334961, "global_step": 51718, "epoch": 427} {"train_loss": -35.14496612548828, "global_step": 51719, "epoch": 427} {"train_loss": -35.34197235107422, "global_step": 51720, "epoch": 427} {"train_loss": -35.01522445678711, "global_step": 51721, "epoch": 427} {"train_loss": -35.42146301269531, "global_step": 51722, "epoch": 427} {"train_loss": -35.482757568359375, "global_step": 51723, "epoch": 427} {"train_loss": -35.81840515136719, "global_step": 51724, "epoch": 427} {"train_loss": -34.77141571044922, "global_step": 51725, "epoch": 427} {"train_loss": -33.94709014892578, "global_step": 51726, "epoch": 427} {"train_loss": -33.79375076293945, "global_step": 51727, "epoch": 427} {"train_loss": -35.411861419677734, "global_step": 51728, "epoch": 427} {"train_loss": -35.80515670776367, "global_step": 51729, "epoch": 427} {"train_loss": -34.771400451660156, "global_step": 51730, "epoch": 427} {"train_loss": -34.371822357177734, "global_step": 51731, "epoch": 427} {"train_loss": -35.48658752441406, "global_step": 51732, "epoch": 427} {"train_loss": -35.721797943115234, "global_step": 51733, "epoch": 427} {"train_loss": -35.4078369140625, "global_step": 51734, "epoch": 427} {"train_loss": -35.548248291015625, "global_step": 51735, "epoch": 427} {"train_loss": -35.46222686767578, "global_step": 51736, "epoch": 427} {"train_loss": -35.35622787475586, "global_step": 51737, "epoch": 427} {"train_loss": -35.87649154663086, "global_step": 51738, "epoch": 427} {"train_loss": -35.752437591552734, "global_step": 51739, "epoch": 427} {"train_loss": -35.78050231933594, "global_step": 51740, "epoch": 427} {"train_loss": -36.054988861083984, "global_step": 51741, "epoch": 427} {"train_loss": -35.438087463378906, "global_step": 51742, "epoch": 427} {"train_loss": -36.1519660949707, "global_step": 51743, "epoch": 427} {"train_loss": -35.819393157958984, "global_step": 51744, "epoch": 427} {"train_loss": -35.15993118286133, "global_step": 51745, "epoch": 427} {"train_loss": -36.35748291015625, "global_step": 51746, "epoch": 427} {"train_loss": -35.73066711425781, "global_step": 51747, "epoch": 427} {"train_loss": -34.920082092285156, "global_step": 51748, "epoch": 427} {"train_loss": -34.63748550415039, "global_step": 51749, "epoch": 427} {"train_loss": -34.40973663330078, "global_step": 51750, "epoch": 427} {"train_loss": -33.1599006652832, "global_step": 51751, "epoch": 427} {"train_loss": -31.64788246154785, "global_step": 51752, "epoch": 427} {"train_loss": -27.60037612915039, "global_step": 51753, "epoch": 427} {"train_loss": -31.656522750854492, "global_step": 51754, "epoch": 427} {"train_loss": -23.135650634765625, "global_step": 51755, "epoch": 427} {"train_loss": -18.29878807067871, "global_step": 51756, "epoch": 427} {"train_loss": -26.439111709594727, "global_step": 51757, "epoch": 427} {"train_loss": -20.320804595947266, "global_step": 51758, "epoch": 427} {"train_loss": -25.69571876525879, "global_step": 51759, "epoch": 427} {"train_loss": -25.333744049072266, "global_step": 51760, "epoch": 427} {"train_loss": -23.288528442382812, "global_step": 51761, "epoch": 427} {"train_loss": -26.784381866455078, "global_step": 51762, "epoch": 427} {"train_loss": -25.938440322875977, "global_step": 51763, "epoch": 427} {"train_loss": -23.986188888549805, "global_step": 51764, "epoch": 427} {"train_loss": -26.74273681640625, "global_step": 51765, "epoch": 427} {"train_loss": -25.802900314331055, "global_step": 51766, "epoch": 427} {"train_loss": -26.33847999572754, "global_step": 51767, "epoch": 427} {"train_loss": -26.77569580078125, "global_step": 51768, "epoch": 427} {"train_loss": -26.627155303955078, "global_step": 51769, "epoch": 427} {"train_loss": -26.964496612548828, "global_step": 51770, "epoch": 427} {"train_loss": -28.513538360595703, "global_step": 51771, "epoch": 427} {"train_loss": -30.0517520904541, "global_step": 51772, "epoch": 427} {"train_loss": -28.172901153564453, "global_step": 51773, "epoch": 427} {"train_loss": -27.916601181030273, "global_step": 51774, "epoch": 427} {"train_loss": -27.0440673828125, "global_step": 51775, "epoch": 427} {"train_loss": -29.07806968688965, "global_step": 51776, "epoch": 427} {"train_loss": -29.04697036743164, "global_step": 51777, "epoch": 427} {"train_loss": -30.687963485717773, "global_step": 51778, "epoch": 427} {"train_loss": -29.733749389648438, "global_step": 51779, "epoch": 427} {"train_loss": -30.31439208984375, "global_step": 51780, "epoch": 427} {"train_loss": -30.15234375, "global_step": 51781, "epoch": 427} {"train_loss": -30.76076316833496, "global_step": 51782, "epoch": 427} {"train_loss": -30.3555850982666, "global_step": 51783, "epoch": 427} {"train_loss": -28.9300537109375, "global_step": 51784, "epoch": 427} {"train_loss": -26.953765869140625, "global_step": 51785, "epoch": 427} {"train_loss": -30.425220489501953, "global_step": 51786, "epoch": 427} {"train_loss": -32.64450323877256, "global_step": 51787, "epoch": 427, "val_loss": 2608621.75} {"train_loss": -28.392765045166016, "global_step": 51788, "epoch": 428} {"train_loss": -28.313634872436523, "global_step": 51789, "epoch": 428} {"train_loss": -31.84046745300293, "global_step": 51790, "epoch": 428} {"train_loss": -28.437997817993164, "global_step": 51791, "epoch": 428} {"train_loss": -31.131982803344727, "global_step": 51792, "epoch": 428} {"train_loss": -30.472822189331055, "global_step": 51793, "epoch": 428} {"train_loss": -31.204788208007812, "global_step": 51794, "epoch": 428} {"train_loss": -31.82013511657715, "global_step": 51795, "epoch": 428} {"train_loss": -32.5030403137207, "global_step": 51796, "epoch": 428} {"train_loss": -31.056737899780273, "global_step": 51797, "epoch": 428} {"train_loss": -31.12518882751465, "global_step": 51798, "epoch": 428} {"train_loss": -31.704675674438477, "global_step": 51799, "epoch": 428} {"train_loss": -31.886096954345703, "global_step": 51800, "epoch": 428} {"train_loss": -32.1572151184082, "global_step": 51801, "epoch": 428} {"train_loss": -32.38798904418945, "global_step": 51802, "epoch": 428} {"train_loss": -32.10067367553711, "global_step": 51803, "epoch": 428} {"train_loss": -32.10761260986328, "global_step": 51804, "epoch": 428} {"train_loss": -32.019256591796875, "global_step": 51805, "epoch": 428} {"train_loss": -32.24225616455078, "global_step": 51806, "epoch": 428} {"train_loss": -32.50777053833008, "global_step": 51807, "epoch": 428} {"train_loss": -32.51665115356445, "global_step": 51808, "epoch": 428} {"train_loss": -31.271595001220703, "global_step": 51809, "epoch": 428} {"train_loss": -29.302404403686523, "global_step": 51810, "epoch": 428} {"train_loss": -29.145898818969727, "global_step": 51811, "epoch": 428} {"train_loss": -32.45222091674805, "global_step": 51812, "epoch": 428} {"train_loss": -30.64790153503418, "global_step": 51813, "epoch": 428} {"train_loss": -30.136005401611328, "global_step": 51814, "epoch": 428} {"train_loss": -21.525440216064453, "global_step": 51815, "epoch": 428} {"train_loss": -25.943017959594727, "global_step": 51816, "epoch": 428} {"train_loss": -28.97523307800293, "global_step": 51817, "epoch": 428} {"train_loss": -28.396841049194336, "global_step": 51818, "epoch": 428} {"train_loss": -29.918787002563477, "global_step": 51819, "epoch": 428} {"train_loss": -29.585968017578125, "global_step": 51820, "epoch": 428} {"train_loss": -30.797483444213867, "global_step": 51821, "epoch": 428} {"train_loss": -28.955991744995117, "global_step": 51822, "epoch": 428} {"train_loss": -31.142730712890625, "global_step": 51823, "epoch": 428} {"train_loss": -29.836294174194336, "global_step": 51824, "epoch": 428} {"train_loss": -29.980789184570312, "global_step": 51825, "epoch": 428} {"train_loss": -32.116600036621094, "global_step": 51826, "epoch": 428} {"train_loss": -30.80826187133789, "global_step": 51827, "epoch": 428} {"train_loss": -31.55767250061035, "global_step": 51828, "epoch": 428} {"train_loss": -31.2622013092041, "global_step": 51829, "epoch": 428} {"train_loss": -31.644336700439453, "global_step": 51830, "epoch": 428} {"train_loss": -31.511173248291016, "global_step": 51831, "epoch": 428} {"train_loss": -31.67036247253418, "global_step": 51832, "epoch": 428} {"train_loss": -32.33683395385742, "global_step": 51833, "epoch": 428} {"train_loss": -32.183326721191406, "global_step": 51834, "epoch": 428} {"train_loss": -31.876209259033203, "global_step": 51835, "epoch": 428} {"train_loss": -32.0554313659668, "global_step": 51836, "epoch": 428} {"train_loss": -31.781057357788086, "global_step": 51837, "epoch": 428} {"train_loss": -32.194496154785156, "global_step": 51838, "epoch": 428} {"train_loss": -31.022647857666016, "global_step": 51839, "epoch": 428} {"train_loss": -26.540882110595703, "global_step": 51840, "epoch": 428} {"train_loss": -26.995258331298828, "global_step": 51841, "epoch": 428} {"train_loss": -32.79539108276367, "global_step": 51842, "epoch": 428} {"train_loss": -28.54888343811035, "global_step": 51843, "epoch": 428} {"train_loss": -32.98906707763672, "global_step": 51844, "epoch": 428} {"train_loss": -30.781641006469727, "global_step": 51845, "epoch": 428} {"train_loss": -32.762046813964844, "global_step": 51846, "epoch": 428} {"train_loss": -32.2451057434082, "global_step": 51847, "epoch": 428} {"train_loss": -31.722900390625, "global_step": 51848, "epoch": 428} {"train_loss": -33.108970642089844, "global_step": 51849, "epoch": 428} {"train_loss": -32.15488815307617, "global_step": 51850, "epoch": 428} {"train_loss": -32.39057159423828, "global_step": 51851, "epoch": 428} {"train_loss": -32.99078369140625, "global_step": 51852, "epoch": 428} {"train_loss": -32.8016242980957, "global_step": 51853, "epoch": 428} {"train_loss": -32.55150604248047, "global_step": 51854, "epoch": 428} {"train_loss": -32.86886215209961, "global_step": 51855, "epoch": 428} {"train_loss": -33.35957336425781, "global_step": 51856, "epoch": 428} {"train_loss": -32.968223571777344, "global_step": 51857, "epoch": 428} {"train_loss": -32.71315383911133, "global_step": 51858, "epoch": 428} {"train_loss": -32.689022064208984, "global_step": 51859, "epoch": 428} {"train_loss": -32.19552230834961, "global_step": 51860, "epoch": 428} {"train_loss": -30.956335067749023, "global_step": 51861, "epoch": 428} {"train_loss": -32.27500534057617, "global_step": 51862, "epoch": 428} {"train_loss": -33.85193634033203, "global_step": 51863, "epoch": 428} {"train_loss": -33.06941223144531, "global_step": 51864, "epoch": 428} {"train_loss": -33.10386276245117, "global_step": 51865, "epoch": 428} {"train_loss": -33.99797058105469, "global_step": 51866, "epoch": 428} {"train_loss": -33.33102035522461, "global_step": 51867, "epoch": 428} {"train_loss": -33.64656448364258, "global_step": 51868, "epoch": 428} {"train_loss": -33.71279525756836, "global_step": 51869, "epoch": 428} {"train_loss": -33.598873138427734, "global_step": 51870, "epoch": 428} {"train_loss": -33.13190841674805, "global_step": 51871, "epoch": 428} {"train_loss": -33.76634979248047, "global_step": 51872, "epoch": 428} {"train_loss": -33.7247200012207, "global_step": 51873, "epoch": 428} {"train_loss": -32.55625534057617, "global_step": 51874, "epoch": 428} {"train_loss": -31.72932243347168, "global_step": 51875, "epoch": 428} {"train_loss": -30.142118453979492, "global_step": 51876, "epoch": 428} {"train_loss": -31.6031494140625, "global_step": 51877, "epoch": 428} {"train_loss": -33.80929183959961, "global_step": 51878, "epoch": 428} {"train_loss": -32.88673400878906, "global_step": 51879, "epoch": 428} {"train_loss": -33.40221405029297, "global_step": 51880, "epoch": 428} {"train_loss": -32.96577453613281, "global_step": 51881, "epoch": 428} {"train_loss": -33.36467361450195, "global_step": 51882, "epoch": 428} {"train_loss": -33.59291458129883, "global_step": 51883, "epoch": 428} {"train_loss": -33.74045944213867, "global_step": 51884, "epoch": 428} {"train_loss": -33.89954376220703, "global_step": 51885, "epoch": 428} {"train_loss": -33.639278411865234, "global_step": 51886, "epoch": 428} {"train_loss": -32.926666259765625, "global_step": 51887, "epoch": 428} {"train_loss": -31.946304321289062, "global_step": 51888, "epoch": 428} {"train_loss": -29.915668487548828, "global_step": 51889, "epoch": 428} {"train_loss": -31.94849967956543, "global_step": 51890, "epoch": 428} {"train_loss": -33.591949462890625, "global_step": 51891, "epoch": 428} {"train_loss": -31.911422729492188, "global_step": 51892, "epoch": 428} {"train_loss": -33.15983963012695, "global_step": 51893, "epoch": 428} {"train_loss": -32.5251579284668, "global_step": 51894, "epoch": 428} {"train_loss": -33.339839935302734, "global_step": 51895, "epoch": 428} {"train_loss": -32.99315643310547, "global_step": 51896, "epoch": 428} {"train_loss": -32.47268295288086, "global_step": 51897, "epoch": 428} {"train_loss": -32.78797912597656, "global_step": 51898, "epoch": 428} {"train_loss": -34.44557571411133, "global_step": 51899, "epoch": 428} {"train_loss": -33.56903076171875, "global_step": 51900, "epoch": 428} {"train_loss": -33.677371978759766, "global_step": 51901, "epoch": 428} {"train_loss": -33.83506393432617, "global_step": 51902, "epoch": 428} {"train_loss": -33.1700439453125, "global_step": 51903, "epoch": 428} {"train_loss": -32.96392822265625, "global_step": 51904, "epoch": 428} {"train_loss": -29.058902740478516, "global_step": 51905, "epoch": 428} {"train_loss": -12.878381729125977, "global_step": 51906, "epoch": 428} {"train_loss": -24.847454071044922, "global_step": 51907, "epoch": 428} {"train_loss": -31.53706323607894, "global_step": 51908, "epoch": 428, "val_loss": 2653907.0} {"train_loss": -24.3012638092041, "global_step": 51909, "epoch": 429} {"train_loss": -29.401479721069336, "global_step": 51910, "epoch": 429} {"train_loss": -27.986902236938477, "global_step": 51911, "epoch": 429} {"train_loss": -29.797500610351562, "global_step": 51912, "epoch": 429} {"train_loss": -33.07182312011719, "global_step": 51913, "epoch": 429} {"train_loss": -30.464527130126953, "global_step": 51914, "epoch": 429} {"train_loss": -31.325773239135742, "global_step": 51915, "epoch": 429} {"train_loss": -31.956140518188477, "global_step": 51916, "epoch": 429} {"train_loss": -33.901485443115234, "global_step": 51917, "epoch": 429} {"train_loss": -32.17920684814453, "global_step": 51918, "epoch": 429} {"train_loss": -32.4320182800293, "global_step": 51919, "epoch": 429} {"train_loss": -32.49311447143555, "global_step": 51920, "epoch": 429} {"train_loss": -34.00930404663086, "global_step": 51921, "epoch": 429} {"train_loss": -33.40655517578125, "global_step": 51922, "epoch": 429} {"train_loss": -33.009796142578125, "global_step": 51923, "epoch": 429} {"train_loss": -32.8156852722168, "global_step": 51924, "epoch": 429} {"train_loss": -33.43812942504883, "global_step": 51925, "epoch": 429} {"train_loss": -33.99528884887695, "global_step": 51926, "epoch": 429} {"train_loss": -33.892372131347656, "global_step": 51927, "epoch": 429} {"train_loss": -34.02745056152344, "global_step": 51928, "epoch": 429} {"train_loss": -33.4356575012207, "global_step": 51929, "epoch": 429} {"train_loss": -33.670528411865234, "global_step": 51930, "epoch": 429} {"train_loss": -33.723392486572266, "global_step": 51931, "epoch": 429} {"train_loss": -33.99137496948242, "global_step": 51932, "epoch": 429} {"train_loss": -34.2635498046875, "global_step": 51933, "epoch": 429} {"train_loss": -33.8650016784668, "global_step": 51934, "epoch": 429} {"train_loss": -33.669151306152344, "global_step": 51935, "epoch": 429} {"train_loss": -34.03123092651367, "global_step": 51936, "epoch": 429} {"train_loss": -34.2686767578125, "global_step": 51937, "epoch": 429} {"train_loss": -34.337135314941406, "global_step": 51938, "epoch": 429} {"train_loss": -34.57668685913086, "global_step": 51939, "epoch": 429} {"train_loss": -34.21147537231445, "global_step": 51940, "epoch": 429} {"train_loss": -33.794403076171875, "global_step": 51941, "epoch": 429} {"train_loss": -33.81453323364258, "global_step": 51942, "epoch": 429} {"train_loss": -34.05548858642578, "global_step": 51943, "epoch": 429} {"train_loss": -34.443695068359375, "global_step": 51944, "epoch": 429} {"train_loss": -34.774658203125, "global_step": 51945, "epoch": 429} {"train_loss": -34.46365737915039, "global_step": 51946, "epoch": 429} {"train_loss": -34.22575759887695, "global_step": 51947, "epoch": 429} {"train_loss": -34.63053512573242, "global_step": 51948, "epoch": 429} {"train_loss": -33.95646286010742, "global_step": 51949, "epoch": 429} {"train_loss": -33.97576141357422, "global_step": 51950, "epoch": 429} {"train_loss": -32.1933479309082, "global_step": 51951, "epoch": 429} {"train_loss": -28.928272247314453, "global_step": 51952, "epoch": 429} {"train_loss": -25.432401657104492, "global_step": 51953, "epoch": 429} {"train_loss": -30.54157066345215, "global_step": 51954, "epoch": 429} {"train_loss": -27.814990997314453, "global_step": 51955, "epoch": 429} {"train_loss": -24.846220016479492, "global_step": 51956, "epoch": 429} {"train_loss": -31.565942764282227, "global_step": 51957, "epoch": 429} {"train_loss": -30.795576095581055, "global_step": 51958, "epoch": 429} {"train_loss": -32.19416809082031, "global_step": 51959, "epoch": 429} {"train_loss": -33.826229095458984, "global_step": 51960, "epoch": 429} {"train_loss": -31.701690673828125, "global_step": 51961, "epoch": 429} {"train_loss": -33.2075309753418, "global_step": 51962, "epoch": 429} {"train_loss": -32.9454231262207, "global_step": 51963, "epoch": 429} {"train_loss": -33.25638961791992, "global_step": 51964, "epoch": 429} {"train_loss": -32.87300491333008, "global_step": 51965, "epoch": 429} {"train_loss": -33.59623336791992, "global_step": 51966, "epoch": 429} {"train_loss": -33.619895935058594, "global_step": 51967, "epoch": 429} {"train_loss": -32.99190139770508, "global_step": 51968, "epoch": 429} {"train_loss": -33.96213912963867, "global_step": 51969, "epoch": 429} {"train_loss": -33.54531478881836, "global_step": 51970, "epoch": 429} {"train_loss": -33.90158462524414, "global_step": 51971, "epoch": 429} {"train_loss": -33.628807067871094, "global_step": 51972, "epoch": 429} {"train_loss": -33.972225189208984, "global_step": 51973, "epoch": 429} {"train_loss": -33.381954193115234, "global_step": 51974, "epoch": 429} {"train_loss": -34.24005889892578, "global_step": 51975, "epoch": 429} {"train_loss": -33.783966064453125, "global_step": 51976, "epoch": 429} {"train_loss": -33.86979293823242, "global_step": 51977, "epoch": 429} {"train_loss": -33.98096466064453, "global_step": 51978, "epoch": 429} {"train_loss": -34.22407913208008, "global_step": 51979, "epoch": 429} {"train_loss": -34.00981140136719, "global_step": 51980, "epoch": 429} {"train_loss": -34.19921875, "global_step": 51981, "epoch": 429} {"train_loss": -33.444183349609375, "global_step": 51982, "epoch": 429} {"train_loss": -33.71212387084961, "global_step": 51983, "epoch": 429} {"train_loss": -34.37717056274414, "global_step": 51984, "epoch": 429} {"train_loss": -34.346675872802734, "global_step": 51985, "epoch": 429} {"train_loss": -34.22181701660156, "global_step": 51986, "epoch": 429} {"train_loss": -34.19485092163086, "global_step": 51987, "epoch": 429} {"train_loss": -33.83952713012695, "global_step": 51988, "epoch": 429} {"train_loss": -33.376861572265625, "global_step": 51989, "epoch": 429} {"train_loss": -31.789052963256836, "global_step": 51990, "epoch": 429} {"train_loss": -27.281198501586914, "global_step": 51991, "epoch": 429} {"train_loss": -21.986282348632812, "global_step": 51992, "epoch": 429} {"train_loss": -31.65041160583496, "global_step": 51993, "epoch": 429} {"train_loss": -30.427444458007812, "global_step": 51994, "epoch": 429} {"train_loss": -28.976245880126953, "global_step": 51995, "epoch": 429} {"train_loss": -32.5649528503418, "global_step": 51996, "epoch": 429} {"train_loss": -32.95180892944336, "global_step": 51997, "epoch": 429} {"train_loss": -32.27614212036133, "global_step": 51998, "epoch": 429} {"train_loss": -32.73661422729492, "global_step": 51999, "epoch": 429} {"train_loss": -30.02496910095215, "global_step": 52000, "epoch": 429} {"train_loss": -32.82781982421875, "global_step": 52001, "epoch": 429} {"train_loss": -33.88814163208008, "global_step": 52002, "epoch": 429} {"train_loss": -30.899518966674805, "global_step": 52003, "epoch": 429} {"train_loss": -32.94213104248047, "global_step": 52004, "epoch": 429} {"train_loss": -33.67524337768555, "global_step": 52005, "epoch": 429} {"train_loss": -32.819915771484375, "global_step": 52006, "epoch": 429} {"train_loss": -33.30331039428711, "global_step": 52007, "epoch": 429} {"train_loss": -33.850257873535156, "global_step": 52008, "epoch": 429} {"train_loss": -33.9566764831543, "global_step": 52009, "epoch": 429} {"train_loss": -33.84925079345703, "global_step": 52010, "epoch": 429} {"train_loss": -33.8543815612793, "global_step": 52011, "epoch": 429} {"train_loss": -33.86930465698242, "global_step": 52012, "epoch": 429} {"train_loss": -34.12070846557617, "global_step": 52013, "epoch": 429} {"train_loss": -33.89519119262695, "global_step": 52014, "epoch": 429} {"train_loss": -34.04043960571289, "global_step": 52015, "epoch": 429} {"train_loss": -33.674678802490234, "global_step": 52016, "epoch": 429} {"train_loss": -34.58480453491211, "global_step": 52017, "epoch": 429} {"train_loss": -34.308162689208984, "global_step": 52018, "epoch": 429} {"train_loss": -34.18910598754883, "global_step": 52019, "epoch": 429} {"train_loss": -34.435428619384766, "global_step": 52020, "epoch": 429} {"train_loss": -34.267372131347656, "global_step": 52021, "epoch": 429} {"train_loss": -34.09290313720703, "global_step": 52022, "epoch": 429} {"train_loss": -34.6361198425293, "global_step": 52023, "epoch": 429} {"train_loss": -34.31380081176758, "global_step": 52024, "epoch": 429} {"train_loss": -33.639129638671875, "global_step": 52025, "epoch": 429} {"train_loss": -33.619869232177734, "global_step": 52026, "epoch": 429} {"train_loss": -33.969329833984375, "global_step": 52027, "epoch": 429} {"train_loss": -34.91514587402344, "global_step": 52028, "epoch": 429} {"train_loss": -32.86297416687012, "global_step": 52029, "epoch": 429, "val_loss": 2629506.0} {"train_loss": -34.89349365234375, "global_step": 52030, "epoch": 430} {"train_loss": -34.86935043334961, "global_step": 52031, "epoch": 430} {"train_loss": -34.86777877807617, "global_step": 52032, "epoch": 430} {"train_loss": -34.76143264770508, "global_step": 52033, "epoch": 430} {"train_loss": -34.93557357788086, "global_step": 52034, "epoch": 430} {"train_loss": -34.88684844970703, "global_step": 52035, "epoch": 430} {"train_loss": -34.97071075439453, "global_step": 52036, "epoch": 430} {"train_loss": -35.63083267211914, "global_step": 52037, "epoch": 430} {"train_loss": -35.25977325439453, "global_step": 52038, "epoch": 430} {"train_loss": -35.1025505065918, "global_step": 52039, "epoch": 430} {"train_loss": -35.06986999511719, "global_step": 52040, "epoch": 430} {"train_loss": -35.043861389160156, "global_step": 52041, "epoch": 430} {"train_loss": -34.87057113647461, "global_step": 52042, "epoch": 430} {"train_loss": -34.37574005126953, "global_step": 52043, "epoch": 430} {"train_loss": -34.90534973144531, "global_step": 52044, "epoch": 430} {"train_loss": -34.82518005371094, "global_step": 52045, "epoch": 430} {"train_loss": -34.738380432128906, "global_step": 52046, "epoch": 430} {"train_loss": -29.50300407409668, "global_step": 52047, "epoch": 430} {"train_loss": -26.57236671447754, "global_step": 52048, "epoch": 430} {"train_loss": -30.188785552978516, "global_step": 52049, "epoch": 430} {"train_loss": -19.14569854736328, "global_step": 52050, "epoch": 430} {"train_loss": -24.84657096862793, "global_step": 52051, "epoch": 430} {"train_loss": -32.31093978881836, "global_step": 52052, "epoch": 430} {"train_loss": -27.068256378173828, "global_step": 52053, "epoch": 430} {"train_loss": -26.492773056030273, "global_step": 52054, "epoch": 430} {"train_loss": -30.293689727783203, "global_step": 52055, "epoch": 430} {"train_loss": -31.64661979675293, "global_step": 52056, "epoch": 430} {"train_loss": -25.07481575012207, "global_step": 52057, "epoch": 430} {"train_loss": -31.518299102783203, "global_step": 52058, "epoch": 430} {"train_loss": -31.174121856689453, "global_step": 52059, "epoch": 430} {"train_loss": -31.370513916015625, "global_step": 52060, "epoch": 430} {"train_loss": -33.26826095581055, "global_step": 52061, "epoch": 430} {"train_loss": -33.165184020996094, "global_step": 52062, "epoch": 430} {"train_loss": -31.8413028717041, "global_step": 52063, "epoch": 430} {"train_loss": -30.1532039642334, "global_step": 52064, "epoch": 430} {"train_loss": -30.191741943359375, "global_step": 52065, "epoch": 430} {"train_loss": -32.02189254760742, "global_step": 52066, "epoch": 430} {"train_loss": -31.76019287109375, "global_step": 52067, "epoch": 430} {"train_loss": -27.984830856323242, "global_step": 52068, "epoch": 430} {"train_loss": -31.108068466186523, "global_step": 52069, "epoch": 430} {"train_loss": -24.217618942260742, "global_step": 52070, "epoch": 430} {"train_loss": -29.436725616455078, "global_step": 52071, "epoch": 430} {"train_loss": -32.41226577758789, "global_step": 52072, "epoch": 430} {"train_loss": -31.250415802001953, "global_step": 52073, "epoch": 430} {"train_loss": -31.191986083984375, "global_step": 52074, "epoch": 430} {"train_loss": -30.6898250579834, "global_step": 52075, "epoch": 430} {"train_loss": -31.69280433654785, "global_step": 52076, "epoch": 430} {"train_loss": -30.755542755126953, "global_step": 52077, "epoch": 430} {"train_loss": -31.07901954650879, "global_step": 52078, "epoch": 430} {"train_loss": -31.58965492248535, "global_step": 52079, "epoch": 430} {"train_loss": -32.70590591430664, "global_step": 52080, "epoch": 430} {"train_loss": -31.926054000854492, "global_step": 52081, "epoch": 430} {"train_loss": -32.25572967529297, "global_step": 52082, "epoch": 430} {"train_loss": -32.55544662475586, "global_step": 52083, "epoch": 430} {"train_loss": -32.4415168762207, "global_step": 52084, "epoch": 430} {"train_loss": -32.10763168334961, "global_step": 52085, "epoch": 430} {"train_loss": -32.72724533081055, "global_step": 52086, "epoch": 430} {"train_loss": -31.790481567382812, "global_step": 52087, "epoch": 430} {"train_loss": -33.162662506103516, "global_step": 52088, "epoch": 430} {"train_loss": -32.42666244506836, "global_step": 52089, "epoch": 430} {"train_loss": -32.7087516784668, "global_step": 52090, "epoch": 430} {"train_loss": -32.73869323730469, "global_step": 52091, "epoch": 430} {"train_loss": -32.89008712768555, "global_step": 52092, "epoch": 430} {"train_loss": -32.771907806396484, "global_step": 52093, "epoch": 430} {"train_loss": -33.17932891845703, "global_step": 52094, "epoch": 430} {"train_loss": -33.15251159667969, "global_step": 52095, "epoch": 430} {"train_loss": -32.92969512939453, "global_step": 52096, "epoch": 430} {"train_loss": -33.08890914916992, "global_step": 52097, "epoch": 430} {"train_loss": -33.057125091552734, "global_step": 52098, "epoch": 430} {"train_loss": -33.01100540161133, "global_step": 52099, "epoch": 430} {"train_loss": -33.5439567565918, "global_step": 52100, "epoch": 430} {"train_loss": -33.56476593017578, "global_step": 52101, "epoch": 430} {"train_loss": -33.02155685424805, "global_step": 52102, "epoch": 430} {"train_loss": -32.8424186706543, "global_step": 52103, "epoch": 430} {"train_loss": -33.74869918823242, "global_step": 52104, "epoch": 430} {"train_loss": -33.879329681396484, "global_step": 52105, "epoch": 430} {"train_loss": -33.690528869628906, "global_step": 52106, "epoch": 430} {"train_loss": -33.756717681884766, "global_step": 52107, "epoch": 430} {"train_loss": -34.02327346801758, "global_step": 52108, "epoch": 430} {"train_loss": -33.964210510253906, "global_step": 52109, "epoch": 430} {"train_loss": -34.088069915771484, "global_step": 52110, "epoch": 430} {"train_loss": -34.304134368896484, "global_step": 52111, "epoch": 430} {"train_loss": -33.98199462890625, "global_step": 52112, "epoch": 430} {"train_loss": -34.20787811279297, "global_step": 52113, "epoch": 430} {"train_loss": -34.47719955444336, "global_step": 52114, "epoch": 430} {"train_loss": -34.31570053100586, "global_step": 52115, "epoch": 430} {"train_loss": -34.272151947021484, "global_step": 52116, "epoch": 430} {"train_loss": -34.00812530517578, "global_step": 52117, "epoch": 430} {"train_loss": -33.6276969909668, "global_step": 52118, "epoch": 430} {"train_loss": -32.310523986816406, "global_step": 52119, "epoch": 430} {"train_loss": -20.73224639892578, "global_step": 52120, "epoch": 430} {"train_loss": 4.475637912750244, "global_step": 52121, "epoch": 430} {"train_loss": -8.458174705505371, "global_step": 52122, "epoch": 430} {"train_loss": -32.97228240966797, "global_step": 52123, "epoch": 430} {"train_loss": -19.70513343811035, "global_step": 52124, "epoch": 430} {"train_loss": -32.19758987426758, "global_step": 52125, "epoch": 430} {"train_loss": -27.718908309936523, "global_step": 52126, "epoch": 430} {"train_loss": -27.049280166625977, "global_step": 52127, "epoch": 430} {"train_loss": -33.24653244018555, "global_step": 52128, "epoch": 430} {"train_loss": -30.670408248901367, "global_step": 52129, "epoch": 430} {"train_loss": -28.682157516479492, "global_step": 52130, "epoch": 430} {"train_loss": -31.436628341674805, "global_step": 52131, "epoch": 430} {"train_loss": -32.80755615234375, "global_step": 52132, "epoch": 430} {"train_loss": -31.401325225830078, "global_step": 52133, "epoch": 430} {"train_loss": -31.064794540405273, "global_step": 52134, "epoch": 430} {"train_loss": -31.9168758392334, "global_step": 52135, "epoch": 430} {"train_loss": -32.72978591918945, "global_step": 52136, "epoch": 430} {"train_loss": -33.121639251708984, "global_step": 52137, "epoch": 430} {"train_loss": -31.927337646484375, "global_step": 52138, "epoch": 430} {"train_loss": -32.22041320800781, "global_step": 52139, "epoch": 430} {"train_loss": -33.02930450439453, "global_step": 52140, "epoch": 430} {"train_loss": -33.613197326660156, "global_step": 52141, "epoch": 430} {"train_loss": -33.5015754699707, "global_step": 52142, "epoch": 430} {"train_loss": -33.22571563720703, "global_step": 52143, "epoch": 430} {"train_loss": -32.310272216796875, "global_step": 52144, "epoch": 430} {"train_loss": -32.92922592163086, "global_step": 52145, "epoch": 430} {"train_loss": -33.52296447753906, "global_step": 52146, "epoch": 430} {"train_loss": -33.2226676940918, "global_step": 52147, "epoch": 430} {"train_loss": -33.729408264160156, "global_step": 52148, "epoch": 430} {"train_loss": -33.12229537963867, "global_step": 52149, "epoch": 430} {"train_loss": -31.55181746443441, "global_step": 52150, "epoch": 430, "val_loss": 2616771.75} {"train_loss": -33.759239196777344, "global_step": 52151, "epoch": 431} {"train_loss": -33.820125579833984, "global_step": 52152, "epoch": 431} {"train_loss": -34.04016876220703, "global_step": 52153, "epoch": 431} {"train_loss": -34.066253662109375, "global_step": 52154, "epoch": 431} {"train_loss": -33.80817413330078, "global_step": 52155, "epoch": 431} {"train_loss": -33.99184799194336, "global_step": 52156, "epoch": 431} {"train_loss": -34.111785888671875, "global_step": 52157, "epoch": 431} {"train_loss": -33.83570098876953, "global_step": 52158, "epoch": 431} {"train_loss": -34.08332443237305, "global_step": 52159, "epoch": 431} {"train_loss": -34.427040100097656, "global_step": 52160, "epoch": 431} {"train_loss": -34.319541931152344, "global_step": 52161, "epoch": 431} {"train_loss": -34.460205078125, "global_step": 52162, "epoch": 431} {"train_loss": -34.39265441894531, "global_step": 52163, "epoch": 431} {"train_loss": -34.70374298095703, "global_step": 52164, "epoch": 431} {"train_loss": -34.38615417480469, "global_step": 52165, "epoch": 431} {"train_loss": -34.282012939453125, "global_step": 52166, "epoch": 431} {"train_loss": -34.63893508911133, "global_step": 52167, "epoch": 431} {"train_loss": -34.74195861816406, "global_step": 52168, "epoch": 431} {"train_loss": -34.86006546020508, "global_step": 52169, "epoch": 431} {"train_loss": -34.846492767333984, "global_step": 52170, "epoch": 431} {"train_loss": -34.390228271484375, "global_step": 52171, "epoch": 431} {"train_loss": -34.97233963012695, "global_step": 52172, "epoch": 431} {"train_loss": -34.64947509765625, "global_step": 52173, "epoch": 431} {"train_loss": -34.38604736328125, "global_step": 52174, "epoch": 431} {"train_loss": -35.073028564453125, "global_step": 52175, "epoch": 431} {"train_loss": -34.77464294433594, "global_step": 52176, "epoch": 431} {"train_loss": -34.57728958129883, "global_step": 52177, "epoch": 431} {"train_loss": -34.947566986083984, "global_step": 52178, "epoch": 431} {"train_loss": -35.33890914916992, "global_step": 52179, "epoch": 431} {"train_loss": -34.857872009277344, "global_step": 52180, "epoch": 431} {"train_loss": -34.6307373046875, "global_step": 52181, "epoch": 431} {"train_loss": -35.016902923583984, "global_step": 52182, "epoch": 431} {"train_loss": -34.94080352783203, "global_step": 52183, "epoch": 431} {"train_loss": -35.20513153076172, "global_step": 52184, "epoch": 431} {"train_loss": -35.06989669799805, "global_step": 52185, "epoch": 431} {"train_loss": -34.91071701049805, "global_step": 52186, "epoch": 431} {"train_loss": -34.014713287353516, "global_step": 52187, "epoch": 431} {"train_loss": -28.2745304107666, "global_step": 52188, "epoch": 431} {"train_loss": -17.367952346801758, "global_step": 52189, "epoch": 431} {"train_loss": -18.886110305786133, "global_step": 52190, "epoch": 431} {"train_loss": -29.551279067993164, "global_step": 52191, "epoch": 431} {"train_loss": -32.5698127746582, "global_step": 52192, "epoch": 431} {"train_loss": -29.356048583984375, "global_step": 52193, "epoch": 431} {"train_loss": -33.48795700073242, "global_step": 52194, "epoch": 431} {"train_loss": -31.23807716369629, "global_step": 52195, "epoch": 431} {"train_loss": -32.708797454833984, "global_step": 52196, "epoch": 431} {"train_loss": -32.05868148803711, "global_step": 52197, "epoch": 431} {"train_loss": -33.34450912475586, "global_step": 52198, "epoch": 431} {"train_loss": -30.475248336791992, "global_step": 52199, "epoch": 431} {"train_loss": -33.86037063598633, "global_step": 52200, "epoch": 431} {"train_loss": -30.570606231689453, "global_step": 52201, "epoch": 431} {"train_loss": -33.91554641723633, "global_step": 52202, "epoch": 431} {"train_loss": -32.21382522583008, "global_step": 52203, "epoch": 431} {"train_loss": -32.57999801635742, "global_step": 52204, "epoch": 431} {"train_loss": -33.75299835205078, "global_step": 52205, "epoch": 431} {"train_loss": -31.87994956970215, "global_step": 52206, "epoch": 431} {"train_loss": -33.338008880615234, "global_step": 52207, "epoch": 431} {"train_loss": -34.10902786254883, "global_step": 52208, "epoch": 431} {"train_loss": -33.98750686645508, "global_step": 52209, "epoch": 431} {"train_loss": -33.493896484375, "global_step": 52210, "epoch": 431} {"train_loss": -33.92193603515625, "global_step": 52211, "epoch": 431} {"train_loss": -34.453025817871094, "global_step": 52212, "epoch": 431} {"train_loss": -34.18334197998047, "global_step": 52213, "epoch": 431} {"train_loss": -33.14033126831055, "global_step": 52214, "epoch": 431} {"train_loss": -33.415775299072266, "global_step": 52215, "epoch": 431} {"train_loss": -34.170528411865234, "global_step": 52216, "epoch": 431} {"train_loss": -34.294586181640625, "global_step": 52217, "epoch": 431} {"train_loss": -33.14516830444336, "global_step": 52218, "epoch": 431} {"train_loss": -34.040687561035156, "global_step": 52219, "epoch": 431} {"train_loss": -34.38552474975586, "global_step": 52220, "epoch": 431} {"train_loss": -33.823760986328125, "global_step": 52221, "epoch": 431} {"train_loss": -33.076778411865234, "global_step": 52222, "epoch": 431} {"train_loss": -32.48189926147461, "global_step": 52223, "epoch": 431} {"train_loss": -31.96683120727539, "global_step": 52224, "epoch": 431} {"train_loss": -30.681745529174805, "global_step": 52225, "epoch": 431} {"train_loss": -30.907262802124023, "global_step": 52226, "epoch": 431} {"train_loss": -32.962318420410156, "global_step": 52227, "epoch": 431} {"train_loss": -33.2996940612793, "global_step": 52228, "epoch": 431} {"train_loss": -31.921873092651367, "global_step": 52229, "epoch": 431} {"train_loss": -32.66853332519531, "global_step": 52230, "epoch": 431} {"train_loss": -34.40483856201172, "global_step": 52231, "epoch": 431} {"train_loss": -32.562347412109375, "global_step": 52232, "epoch": 431} {"train_loss": -32.97346878051758, "global_step": 52233, "epoch": 431} {"train_loss": -34.3858757019043, "global_step": 52234, "epoch": 431} {"train_loss": -33.54310607910156, "global_step": 52235, "epoch": 431} {"train_loss": -34.19710922241211, "global_step": 52236, "epoch": 431} {"train_loss": -32.982730865478516, "global_step": 52237, "epoch": 431} {"train_loss": -33.74983596801758, "global_step": 52238, "epoch": 431} {"train_loss": -33.720191955566406, "global_step": 52239, "epoch": 431} {"train_loss": -33.98761749267578, "global_step": 52240, "epoch": 431} {"train_loss": -33.51062774658203, "global_step": 52241, "epoch": 431} {"train_loss": -34.29726791381836, "global_step": 52242, "epoch": 431} {"train_loss": -33.799251556396484, "global_step": 52243, "epoch": 431} {"train_loss": -34.1608772277832, "global_step": 52244, "epoch": 431} {"train_loss": -34.332305908203125, "global_step": 52245, "epoch": 431} {"train_loss": -33.98106002807617, "global_step": 52246, "epoch": 431} {"train_loss": -34.01030349731445, "global_step": 52247, "epoch": 431} {"train_loss": -33.9242057800293, "global_step": 52248, "epoch": 431} {"train_loss": -34.365386962890625, "global_step": 52249, "epoch": 431} {"train_loss": -34.200050354003906, "global_step": 52250, "epoch": 431} {"train_loss": -34.59087371826172, "global_step": 52251, "epoch": 431} {"train_loss": -34.285133361816406, "global_step": 52252, "epoch": 431} {"train_loss": -34.462642669677734, "global_step": 52253, "epoch": 431} {"train_loss": -34.18522262573242, "global_step": 52254, "epoch": 431} {"train_loss": -34.210655212402344, "global_step": 52255, "epoch": 431} {"train_loss": -34.91809844970703, "global_step": 52256, "epoch": 431} {"train_loss": -34.12668991088867, "global_step": 52257, "epoch": 431} {"train_loss": -34.42352294921875, "global_step": 52258, "epoch": 431} {"train_loss": -34.97080993652344, "global_step": 52259, "epoch": 431} {"train_loss": -34.06254196166992, "global_step": 52260, "epoch": 431} {"train_loss": -34.76814651489258, "global_step": 52261, "epoch": 431} {"train_loss": -34.53129959106445, "global_step": 52262, "epoch": 431} {"train_loss": -34.609718322753906, "global_step": 52263, "epoch": 431} {"train_loss": -34.81100082397461, "global_step": 52264, "epoch": 431} {"train_loss": -34.98896026611328, "global_step": 52265, "epoch": 431} {"train_loss": -35.18533706665039, "global_step": 52266, "epoch": 431} {"train_loss": -35.44103240966797, "global_step": 52267, "epoch": 431} {"train_loss": -34.838436126708984, "global_step": 52268, "epoch": 431} {"train_loss": -34.9587287902832, "global_step": 52269, "epoch": 431} {"train_loss": -35.1983528137207, "global_step": 52270, "epoch": 431} {"train_loss": -33.537527825221545, "global_step": 52271, "epoch": 431, "val_loss": 2613609.25} {"train_loss": -31.709264755249023, "global_step": 52272, "epoch": 432} {"train_loss": -25.9765567779541, "global_step": 52273, "epoch": 432} {"train_loss": -30.05392837524414, "global_step": 52274, "epoch": 432} {"train_loss": -33.7192268371582, "global_step": 52275, "epoch": 432} {"train_loss": -33.4008903503418, "global_step": 52276, "epoch": 432} {"train_loss": -33.7104606628418, "global_step": 52277, "epoch": 432} {"train_loss": -33.4804801940918, "global_step": 52278, "epoch": 432} {"train_loss": -32.234535217285156, "global_step": 52279, "epoch": 432} {"train_loss": -34.08201217651367, "global_step": 52280, "epoch": 432} {"train_loss": -34.647987365722656, "global_step": 52281, "epoch": 432} {"train_loss": -33.418907165527344, "global_step": 52282, "epoch": 432} {"train_loss": -34.4482536315918, "global_step": 52283, "epoch": 432} {"train_loss": -34.7828483581543, "global_step": 52284, "epoch": 432} {"train_loss": -34.60159683227539, "global_step": 52285, "epoch": 432} {"train_loss": -34.16659164428711, "global_step": 52286, "epoch": 432} {"train_loss": -34.69538497924805, "global_step": 52287, "epoch": 432} {"train_loss": -34.95540237426758, "global_step": 52288, "epoch": 432} {"train_loss": -34.48781204223633, "global_step": 52289, "epoch": 432} {"train_loss": -34.3157958984375, "global_step": 52290, "epoch": 432} {"train_loss": -35.18112564086914, "global_step": 52291, "epoch": 432} {"train_loss": -35.20746994018555, "global_step": 52292, "epoch": 432} {"train_loss": -34.81805419921875, "global_step": 52293, "epoch": 432} {"train_loss": -34.679359436035156, "global_step": 52294, "epoch": 432} {"train_loss": -34.89802169799805, "global_step": 52295, "epoch": 432} {"train_loss": -35.14152908325195, "global_step": 52296, "epoch": 432} {"train_loss": -35.472686767578125, "global_step": 52297, "epoch": 432} {"train_loss": -35.10519027709961, "global_step": 52298, "epoch": 432} {"train_loss": -34.93980026245117, "global_step": 52299, "epoch": 432} {"train_loss": -35.368099212646484, "global_step": 52300, "epoch": 432} {"train_loss": -35.09739303588867, "global_step": 52301, "epoch": 432} {"train_loss": -35.040863037109375, "global_step": 52302, "epoch": 432} {"train_loss": -34.29817581176758, "global_step": 52303, "epoch": 432} {"train_loss": -35.07501983642578, "global_step": 52304, "epoch": 432} {"train_loss": -34.64515686035156, "global_step": 52305, "epoch": 432} {"train_loss": -34.73139572143555, "global_step": 52306, "epoch": 432} {"train_loss": -35.06666946411133, "global_step": 52307, "epoch": 432} {"train_loss": -34.87364959716797, "global_step": 52308, "epoch": 432} {"train_loss": -35.24858474731445, "global_step": 52309, "epoch": 432} {"train_loss": -34.948238372802734, "global_step": 52310, "epoch": 432} {"train_loss": -33.603240966796875, "global_step": 52311, "epoch": 432} {"train_loss": -31.66912269592285, "global_step": 52312, "epoch": 432} {"train_loss": -20.530256271362305, "global_step": 52313, "epoch": 432} {"train_loss": 14.31326961517334, "global_step": 52314, "epoch": 432} {"train_loss": -6.33388614654541, "global_step": 52315, "epoch": 432} {"train_loss": -27.069711685180664, "global_step": 52316, "epoch": 432} {"train_loss": -15.668701171875, "global_step": 52317, "epoch": 432} {"train_loss": -21.38437843322754, "global_step": 52318, "epoch": 432} {"train_loss": -28.471073150634766, "global_step": 52319, "epoch": 432} {"train_loss": -18.601682662963867, "global_step": 52320, "epoch": 432} {"train_loss": -29.71763038635254, "global_step": 52321, "epoch": 432} {"train_loss": -32.09930419921875, "global_step": 52322, "epoch": 432} {"train_loss": -27.048986434936523, "global_step": 52323, "epoch": 432} {"train_loss": -26.271814346313477, "global_step": 52324, "epoch": 432} {"train_loss": -30.674285888671875, "global_step": 52325, "epoch": 432} {"train_loss": -33.212154388427734, "global_step": 52326, "epoch": 432} {"train_loss": -32.365997314453125, "global_step": 52327, "epoch": 432} {"train_loss": -30.667810440063477, "global_step": 52328, "epoch": 432} {"train_loss": -30.2495174407959, "global_step": 52329, "epoch": 432} {"train_loss": -32.015235900878906, "global_step": 52330, "epoch": 432} {"train_loss": -32.49153518676758, "global_step": 52331, "epoch": 432} {"train_loss": -32.94312286376953, "global_step": 52332, "epoch": 432} {"train_loss": -32.633575439453125, "global_step": 52333, "epoch": 432} {"train_loss": -32.378780364990234, "global_step": 52334, "epoch": 432} {"train_loss": -32.37168884277344, "global_step": 52335, "epoch": 432} {"train_loss": -32.22713088989258, "global_step": 52336, "epoch": 432} {"train_loss": -32.55915451049805, "global_step": 52337, "epoch": 432} {"train_loss": -32.47901153564453, "global_step": 52338, "epoch": 432} {"train_loss": -33.098751068115234, "global_step": 52339, "epoch": 432} {"train_loss": -33.2844123840332, "global_step": 52340, "epoch": 432} {"train_loss": -33.55997848510742, "global_step": 52341, "epoch": 432} {"train_loss": -32.97571563720703, "global_step": 52342, "epoch": 432} {"train_loss": -33.22139358520508, "global_step": 52343, "epoch": 432} {"train_loss": -33.3774528503418, "global_step": 52344, "epoch": 432} {"train_loss": -33.31421661376953, "global_step": 52345, "epoch": 432} {"train_loss": -33.39667510986328, "global_step": 52346, "epoch": 432} {"train_loss": -33.66410446166992, "global_step": 52347, "epoch": 432} {"train_loss": -33.99045944213867, "global_step": 52348, "epoch": 432} {"train_loss": -33.443572998046875, "global_step": 52349, "epoch": 432} {"train_loss": -33.917991638183594, "global_step": 52350, "epoch": 432} {"train_loss": -34.123687744140625, "global_step": 52351, "epoch": 432} {"train_loss": -33.82402038574219, "global_step": 52352, "epoch": 432} {"train_loss": -33.854461669921875, "global_step": 52353, "epoch": 432} {"train_loss": -34.114654541015625, "global_step": 52354, "epoch": 432} {"train_loss": -34.30721664428711, "global_step": 52355, "epoch": 432} {"train_loss": -34.04039764404297, "global_step": 52356, "epoch": 432} {"train_loss": -34.2043571472168, "global_step": 52357, "epoch": 432} {"train_loss": -34.422149658203125, "global_step": 52358, "epoch": 432} {"train_loss": -33.96975326538086, "global_step": 52359, "epoch": 432} {"train_loss": -34.33076858520508, "global_step": 52360, "epoch": 432} {"train_loss": -34.233943939208984, "global_step": 52361, "epoch": 432} {"train_loss": -34.69318771362305, "global_step": 52362, "epoch": 432} {"train_loss": -34.641929626464844, "global_step": 52363, "epoch": 432} {"train_loss": -34.52729415893555, "global_step": 52364, "epoch": 432} {"train_loss": -34.86098861694336, "global_step": 52365, "epoch": 432} {"train_loss": -34.588958740234375, "global_step": 52366, "epoch": 432} {"train_loss": -34.756282806396484, "global_step": 52367, "epoch": 432} {"train_loss": -34.665950775146484, "global_step": 52368, "epoch": 432} {"train_loss": -34.70426559448242, "global_step": 52369, "epoch": 432} {"train_loss": -34.26316452026367, "global_step": 52370, "epoch": 432} {"train_loss": -34.68624496459961, "global_step": 52371, "epoch": 432} {"train_loss": -34.92464065551758, "global_step": 52372, "epoch": 432} {"train_loss": -34.5495491027832, "global_step": 52373, "epoch": 432} {"train_loss": -34.592430114746094, "global_step": 52374, "epoch": 432} {"train_loss": -34.702877044677734, "global_step": 52375, "epoch": 432} {"train_loss": -35.098628997802734, "global_step": 52376, "epoch": 432} {"train_loss": -35.01570510864258, "global_step": 52377, "epoch": 432} {"train_loss": -34.831966400146484, "global_step": 52378, "epoch": 432} {"train_loss": -34.9515495300293, "global_step": 52379, "epoch": 432} {"train_loss": -35.22813034057617, "global_step": 52380, "epoch": 432} {"train_loss": -35.34039306640625, "global_step": 52381, "epoch": 432} {"train_loss": -34.75527572631836, "global_step": 52382, "epoch": 432} {"train_loss": -34.64079666137695, "global_step": 52383, "epoch": 432} {"train_loss": -33.6687126159668, "global_step": 52384, "epoch": 432} {"train_loss": -31.384252548217773, "global_step": 52385, "epoch": 432} {"train_loss": -31.322158813476562, "global_step": 52386, "epoch": 432} {"train_loss": -32.9119987487793, "global_step": 52387, "epoch": 432} {"train_loss": -34.82664108276367, "global_step": 52388, "epoch": 432} {"train_loss": -34.03135299682617, "global_step": 52389, "epoch": 432} {"train_loss": -34.15334701538086, "global_step": 52390, "epoch": 432} {"train_loss": -34.57638168334961, "global_step": 52391, "epoch": 432} {"train_loss": -32.47712710672174, "global_step": 52392, "epoch": 432, "val_loss": 2738901.75} {"train_loss": -34.57558059692383, "global_step": 52393, "epoch": 433} {"train_loss": -35.27509307861328, "global_step": 52394, "epoch": 433} {"train_loss": -33.64066696166992, "global_step": 52395, "epoch": 433} {"train_loss": -34.34845733642578, "global_step": 52396, "epoch": 433} {"train_loss": -34.24279022216797, "global_step": 52397, "epoch": 433} {"train_loss": -31.47334098815918, "global_step": 52398, "epoch": 433} {"train_loss": -34.35542297363281, "global_step": 52399, "epoch": 433} {"train_loss": -34.48698043823242, "global_step": 52400, "epoch": 433} {"train_loss": -33.778072357177734, "global_step": 52401, "epoch": 433} {"train_loss": -33.50994873046875, "global_step": 52402, "epoch": 433} {"train_loss": -33.216434478759766, "global_step": 52403, "epoch": 433} {"train_loss": -33.835567474365234, "global_step": 52404, "epoch": 433} {"train_loss": -33.81568145751953, "global_step": 52405, "epoch": 433} {"train_loss": -30.65679359436035, "global_step": 52406, "epoch": 433} {"train_loss": -32.47137451171875, "global_step": 52407, "epoch": 433} {"train_loss": -30.7420654296875, "global_step": 52408, "epoch": 433} {"train_loss": -31.635717391967773, "global_step": 52409, "epoch": 433} {"train_loss": -29.24956703186035, "global_step": 52410, "epoch": 433} {"train_loss": -29.449234008789062, "global_step": 52411, "epoch": 433} {"train_loss": -29.746885299682617, "global_step": 52412, "epoch": 433} {"train_loss": -32.841590881347656, "global_step": 52413, "epoch": 433} {"train_loss": -29.471424102783203, "global_step": 52414, "epoch": 433} {"train_loss": -33.277099609375, "global_step": 52415, "epoch": 433} {"train_loss": -30.086130142211914, "global_step": 52416, "epoch": 433} {"train_loss": -31.411579132080078, "global_step": 52417, "epoch": 433} {"train_loss": -30.757389068603516, "global_step": 52418, "epoch": 433} {"train_loss": -31.14472770690918, "global_step": 52419, "epoch": 433} {"train_loss": -29.569684982299805, "global_step": 52420, "epoch": 433} {"train_loss": -30.8525447845459, "global_step": 52421, "epoch": 433} {"train_loss": -25.915332794189453, "global_step": 52422, "epoch": 433} {"train_loss": -31.475812911987305, "global_step": 52423, "epoch": 433} {"train_loss": -31.926837921142578, "global_step": 52424, "epoch": 433} {"train_loss": -30.078962326049805, "global_step": 52425, "epoch": 433} {"train_loss": -31.522558212280273, "global_step": 52426, "epoch": 433} {"train_loss": -30.365217208862305, "global_step": 52427, "epoch": 433} {"train_loss": -31.4987735748291, "global_step": 52428, "epoch": 433} {"train_loss": -31.882862091064453, "global_step": 52429, "epoch": 433} {"train_loss": -31.309370040893555, "global_step": 52430, "epoch": 433} {"train_loss": -30.087066650390625, "global_step": 52431, "epoch": 433} {"train_loss": -30.799474716186523, "global_step": 52432, "epoch": 433} {"train_loss": -31.394367218017578, "global_step": 52433, "epoch": 433} {"train_loss": -29.852649688720703, "global_step": 52434, "epoch": 433} {"train_loss": -31.235998153686523, "global_step": 52435, "epoch": 433} {"train_loss": -31.447223663330078, "global_step": 52436, "epoch": 433} {"train_loss": -31.593475341796875, "global_step": 52437, "epoch": 433} {"train_loss": -30.37568473815918, "global_step": 52438, "epoch": 433} {"train_loss": -31.461856842041016, "global_step": 52439, "epoch": 433} {"train_loss": -32.157386779785156, "global_step": 52440, "epoch": 433} {"train_loss": -31.88679313659668, "global_step": 52441, "epoch": 433} {"train_loss": -30.198362350463867, "global_step": 52442, "epoch": 433} {"train_loss": -31.721982955932617, "global_step": 52443, "epoch": 433} {"train_loss": -31.653608322143555, "global_step": 52444, "epoch": 433} {"train_loss": -30.953100204467773, "global_step": 52445, "epoch": 433} {"train_loss": -31.6357421875, "global_step": 52446, "epoch": 433} {"train_loss": -32.44639205932617, "global_step": 52447, "epoch": 433} {"train_loss": -32.04222869873047, "global_step": 52448, "epoch": 433} {"train_loss": -32.28010177612305, "global_step": 52449, "epoch": 433} {"train_loss": -32.22290802001953, "global_step": 52450, "epoch": 433} {"train_loss": -31.8612117767334, "global_step": 52451, "epoch": 433} {"train_loss": -32.231388092041016, "global_step": 52452, "epoch": 433} {"train_loss": -32.187862396240234, "global_step": 52453, "epoch": 433} {"train_loss": -32.63796615600586, "global_step": 52454, "epoch": 433} {"train_loss": -32.92959213256836, "global_step": 52455, "epoch": 433} {"train_loss": -32.68618392944336, "global_step": 52456, "epoch": 433} {"train_loss": -32.89475631713867, "global_step": 52457, "epoch": 433} {"train_loss": -33.06892776489258, "global_step": 52458, "epoch": 433} {"train_loss": -32.93263626098633, "global_step": 52459, "epoch": 433} {"train_loss": -33.027137756347656, "global_step": 52460, "epoch": 433} {"train_loss": -33.048519134521484, "global_step": 52461, "epoch": 433} {"train_loss": -33.30885696411133, "global_step": 52462, "epoch": 433} {"train_loss": -33.1314811706543, "global_step": 52463, "epoch": 433} {"train_loss": -33.336212158203125, "global_step": 52464, "epoch": 433} {"train_loss": -32.32926940917969, "global_step": 52465, "epoch": 433} {"train_loss": -32.28336715698242, "global_step": 52466, "epoch": 433} {"train_loss": -32.896873474121094, "global_step": 52467, "epoch": 433} {"train_loss": -33.516658782958984, "global_step": 52468, "epoch": 433} {"train_loss": -33.83222579956055, "global_step": 52469, "epoch": 433} {"train_loss": -33.3897590637207, "global_step": 52470, "epoch": 433} {"train_loss": -32.92086410522461, "global_step": 52471, "epoch": 433} {"train_loss": -33.20241928100586, "global_step": 52472, "epoch": 433} {"train_loss": -33.73574447631836, "global_step": 52473, "epoch": 433} {"train_loss": -33.60061264038086, "global_step": 52474, "epoch": 433} {"train_loss": -33.655452728271484, "global_step": 52475, "epoch": 433} {"train_loss": -33.57033157348633, "global_step": 52476, "epoch": 433} {"train_loss": -33.9747314453125, "global_step": 52477, "epoch": 433} {"train_loss": -33.96116638183594, "global_step": 52478, "epoch": 433} {"train_loss": -33.71723175048828, "global_step": 52479, "epoch": 433} {"train_loss": -33.575496673583984, "global_step": 52480, "epoch": 433} {"train_loss": -33.94000244140625, "global_step": 52481, "epoch": 433} {"train_loss": -33.9271240234375, "global_step": 52482, "epoch": 433} {"train_loss": -34.03730392456055, "global_step": 52483, "epoch": 433} {"train_loss": -33.5385856628418, "global_step": 52484, "epoch": 433} {"train_loss": -33.63346481323242, "global_step": 52485, "epoch": 433} {"train_loss": -33.73234558105469, "global_step": 52486, "epoch": 433} {"train_loss": -33.4346809387207, "global_step": 52487, "epoch": 433} {"train_loss": -34.07351303100586, "global_step": 52488, "epoch": 433} {"train_loss": -34.080238342285156, "global_step": 52489, "epoch": 433} {"train_loss": -34.03774642944336, "global_step": 52490, "epoch": 433} {"train_loss": -34.43025588989258, "global_step": 52491, "epoch": 433} {"train_loss": -34.539066314697266, "global_step": 52492, "epoch": 433} {"train_loss": -34.52616500854492, "global_step": 52493, "epoch": 433} {"train_loss": -34.45831298828125, "global_step": 52494, "epoch": 433} {"train_loss": -34.74278259277344, "global_step": 52495, "epoch": 433} {"train_loss": -34.536720275878906, "global_step": 52496, "epoch": 433} {"train_loss": -34.560760498046875, "global_step": 52497, "epoch": 433} {"train_loss": -34.166683197021484, "global_step": 52498, "epoch": 433} {"train_loss": -34.51051330566406, "global_step": 52499, "epoch": 433} {"train_loss": -33.97243881225586, "global_step": 52500, "epoch": 433} {"train_loss": -33.963436126708984, "global_step": 52501, "epoch": 433} {"train_loss": -33.52970504760742, "global_step": 52502, "epoch": 433} {"train_loss": -34.58624267578125, "global_step": 52503, "epoch": 433} {"train_loss": -35.20562744140625, "global_step": 52504, "epoch": 433} {"train_loss": -34.52360153198242, "global_step": 52505, "epoch": 433} {"train_loss": -33.64825439453125, "global_step": 52506, "epoch": 433} {"train_loss": -33.19371795654297, "global_step": 52507, "epoch": 433} {"train_loss": -32.68697738647461, "global_step": 52508, "epoch": 433} {"train_loss": -34.418067932128906, "global_step": 52509, "epoch": 433} {"train_loss": -35.11965560913086, "global_step": 52510, "epoch": 433} {"train_loss": -34.533851623535156, "global_step": 52511, "epoch": 433} {"train_loss": -33.440208435058594, "global_step": 52512, "epoch": 433} {"train_loss": -32.69087635387074, "global_step": 52513, "epoch": 433, "val_loss": 2712522.75} {"train_loss": -33.8018684387207, "global_step": 52514, "epoch": 434} {"train_loss": -35.39942932128906, "global_step": 52515, "epoch": 434} {"train_loss": -34.50208282470703, "global_step": 52516, "epoch": 434} {"train_loss": -34.20903396606445, "global_step": 52517, "epoch": 434} {"train_loss": -35.39706039428711, "global_step": 52518, "epoch": 434} {"train_loss": -34.64083480834961, "global_step": 52519, "epoch": 434} {"train_loss": -35.26002502441406, "global_step": 52520, "epoch": 434} {"train_loss": -35.474910736083984, "global_step": 52521, "epoch": 434} {"train_loss": -35.42123031616211, "global_step": 52522, "epoch": 434} {"train_loss": -35.36946487426758, "global_step": 52523, "epoch": 434} {"train_loss": -35.10429000854492, "global_step": 52524, "epoch": 434} {"train_loss": -35.55866622924805, "global_step": 52525, "epoch": 434} {"train_loss": -35.13674545288086, "global_step": 52526, "epoch": 434} {"train_loss": -35.29417037963867, "global_step": 52527, "epoch": 434} {"train_loss": -35.1905403137207, "global_step": 52528, "epoch": 434} {"train_loss": -35.12982940673828, "global_step": 52529, "epoch": 434} {"train_loss": -35.43553161621094, "global_step": 52530, "epoch": 434} {"train_loss": -35.336700439453125, "global_step": 52531, "epoch": 434} {"train_loss": -35.19089126586914, "global_step": 52532, "epoch": 434} {"train_loss": -35.632598876953125, "global_step": 52533, "epoch": 434} {"train_loss": -35.931156158447266, "global_step": 52534, "epoch": 434} {"train_loss": -35.433448791503906, "global_step": 52535, "epoch": 434} {"train_loss": -35.20465850830078, "global_step": 52536, "epoch": 434} {"train_loss": -35.74495315551758, "global_step": 52537, "epoch": 434} {"train_loss": -34.779823303222656, "global_step": 52538, "epoch": 434} {"train_loss": -35.160072326660156, "global_step": 52539, "epoch": 434} {"train_loss": -35.674556732177734, "global_step": 52540, "epoch": 434} {"train_loss": -35.7896842956543, "global_step": 52541, "epoch": 434} {"train_loss": -35.72243881225586, "global_step": 52542, "epoch": 434} {"train_loss": -35.416595458984375, "global_step": 52543, "epoch": 434} {"train_loss": -35.08777618408203, "global_step": 52544, "epoch": 434} {"train_loss": -35.6211051940918, "global_step": 52545, "epoch": 434} {"train_loss": -35.4344482421875, "global_step": 52546, "epoch": 434} {"train_loss": -34.854881286621094, "global_step": 52547, "epoch": 434} {"train_loss": -35.82094192504883, "global_step": 52548, "epoch": 434} {"train_loss": -35.57417678833008, "global_step": 52549, "epoch": 434} {"train_loss": -34.05019760131836, "global_step": 52550, "epoch": 434} {"train_loss": -33.71418380737305, "global_step": 52551, "epoch": 434} {"train_loss": -34.23790740966797, "global_step": 52552, "epoch": 434} {"train_loss": -32.91621017456055, "global_step": 52553, "epoch": 434} {"train_loss": -34.3609733581543, "global_step": 52554, "epoch": 434} {"train_loss": -34.43889236450195, "global_step": 52555, "epoch": 434} {"train_loss": -33.2983283996582, "global_step": 52556, "epoch": 434} {"train_loss": -34.78084945678711, "global_step": 52557, "epoch": 434} {"train_loss": -32.95270919799805, "global_step": 52558, "epoch": 434} {"train_loss": -32.46351623535156, "global_step": 52559, "epoch": 434} {"train_loss": -34.47536087036133, "global_step": 52560, "epoch": 434} {"train_loss": -34.76513671875, "global_step": 52561, "epoch": 434} {"train_loss": -33.03898239135742, "global_step": 52562, "epoch": 434} {"train_loss": -33.972328186035156, "global_step": 52563, "epoch": 434} {"train_loss": -33.68688201904297, "global_step": 52564, "epoch": 434} {"train_loss": -33.811397552490234, "global_step": 52565, "epoch": 434} {"train_loss": -34.44257736206055, "global_step": 52566, "epoch": 434} {"train_loss": -33.21073913574219, "global_step": 52567, "epoch": 434} {"train_loss": -32.82845687866211, "global_step": 52568, "epoch": 434} {"train_loss": -33.092994689941406, "global_step": 52569, "epoch": 434} {"train_loss": -33.4457893371582, "global_step": 52570, "epoch": 434} {"train_loss": -32.45941925048828, "global_step": 52571, "epoch": 434} {"train_loss": -32.18778610229492, "global_step": 52572, "epoch": 434} {"train_loss": -34.639957427978516, "global_step": 52573, "epoch": 434} {"train_loss": -32.05833435058594, "global_step": 52574, "epoch": 434} {"train_loss": -32.81458282470703, "global_step": 52575, "epoch": 434} {"train_loss": -34.15625, "global_step": 52576, "epoch": 434} {"train_loss": -34.05673599243164, "global_step": 52577, "epoch": 434} {"train_loss": -33.400604248046875, "global_step": 52578, "epoch": 434} {"train_loss": -33.43482208251953, "global_step": 52579, "epoch": 434} {"train_loss": -33.92277908325195, "global_step": 52580, "epoch": 434} {"train_loss": -33.22864532470703, "global_step": 52581, "epoch": 434} {"train_loss": -33.89852523803711, "global_step": 52582, "epoch": 434} {"train_loss": -33.8662109375, "global_step": 52583, "epoch": 434} {"train_loss": -33.970497131347656, "global_step": 52584, "epoch": 434} {"train_loss": -34.255496978759766, "global_step": 52585, "epoch": 434} {"train_loss": -31.158283233642578, "global_step": 52586, "epoch": 434} {"train_loss": -33.197689056396484, "global_step": 52587, "epoch": 434} {"train_loss": -34.36994171142578, "global_step": 52588, "epoch": 434} {"train_loss": -34.16718673706055, "global_step": 52589, "epoch": 434} {"train_loss": -33.475521087646484, "global_step": 52590, "epoch": 434} {"train_loss": -34.055198669433594, "global_step": 52591, "epoch": 434} {"train_loss": -34.1946907043457, "global_step": 52592, "epoch": 434} {"train_loss": -33.280704498291016, "global_step": 52593, "epoch": 434} {"train_loss": -32.94197082519531, "global_step": 52594, "epoch": 434} {"train_loss": -34.6303596496582, "global_step": 52595, "epoch": 434} {"train_loss": -34.16472244262695, "global_step": 52596, "epoch": 434} {"train_loss": -34.05374526977539, "global_step": 52597, "epoch": 434} {"train_loss": -34.069374084472656, "global_step": 52598, "epoch": 434} {"train_loss": -34.169090270996094, "global_step": 52599, "epoch": 434} {"train_loss": -34.10292434692383, "global_step": 52600, "epoch": 434} {"train_loss": -33.86505126953125, "global_step": 52601, "epoch": 434} {"train_loss": -32.70998764038086, "global_step": 52602, "epoch": 434} {"train_loss": -33.58436584472656, "global_step": 52603, "epoch": 434} {"train_loss": -34.13993453979492, "global_step": 52604, "epoch": 434} {"train_loss": -33.0717658996582, "global_step": 52605, "epoch": 434} {"train_loss": -34.304649353027344, "global_step": 52606, "epoch": 434} {"train_loss": -33.20197677612305, "global_step": 52607, "epoch": 434} {"train_loss": -32.6060676574707, "global_step": 52608, "epoch": 434} {"train_loss": -33.9301872253418, "global_step": 52609, "epoch": 434} {"train_loss": -34.36117935180664, "global_step": 52610, "epoch": 434} {"train_loss": -33.503448486328125, "global_step": 52611, "epoch": 434} {"train_loss": -34.13924026489258, "global_step": 52612, "epoch": 434} {"train_loss": -34.09595489501953, "global_step": 52613, "epoch": 434} {"train_loss": -34.916500091552734, "global_step": 52614, "epoch": 434} {"train_loss": -34.131832122802734, "global_step": 52615, "epoch": 434} {"train_loss": -33.92770004272461, "global_step": 52616, "epoch": 434} {"train_loss": -34.265533447265625, "global_step": 52617, "epoch": 434} {"train_loss": -34.68980026245117, "global_step": 52618, "epoch": 434} {"train_loss": -33.61675262451172, "global_step": 52619, "epoch": 434} {"train_loss": -33.51539993286133, "global_step": 52620, "epoch": 434} {"train_loss": -33.432125091552734, "global_step": 52621, "epoch": 434} {"train_loss": -34.503662109375, "global_step": 52622, "epoch": 434} {"train_loss": -34.670799255371094, "global_step": 52623, "epoch": 434} {"train_loss": -33.74382400512695, "global_step": 52624, "epoch": 434} {"train_loss": -32.76994705200195, "global_step": 52625, "epoch": 434} {"train_loss": -32.518924713134766, "global_step": 52626, "epoch": 434} {"train_loss": -33.62038040161133, "global_step": 52627, "epoch": 434} {"train_loss": -34.72365188598633, "global_step": 52628, "epoch": 434} {"train_loss": -33.300392150878906, "global_step": 52629, "epoch": 434} {"train_loss": -33.9457893371582, "global_step": 52630, "epoch": 434} {"train_loss": -34.50021743774414, "global_step": 52631, "epoch": 434} {"train_loss": -34.651939392089844, "global_step": 52632, "epoch": 434} {"train_loss": -34.219139099121094, "global_step": 52633, "epoch": 434} {"train_loss": -34.20032526441842, "global_step": 52634, "epoch": 434, "val_loss": 2672039.0} {"train_loss": -34.7992057800293, "global_step": 52635, "epoch": 435} {"train_loss": -34.37607955932617, "global_step": 52636, "epoch": 435} {"train_loss": -34.65207290649414, "global_step": 52637, "epoch": 435} {"train_loss": -35.03214645385742, "global_step": 52638, "epoch": 435} {"train_loss": -34.34780502319336, "global_step": 52639, "epoch": 435} {"train_loss": -35.14243698120117, "global_step": 52640, "epoch": 435} {"train_loss": -34.7138786315918, "global_step": 52641, "epoch": 435} {"train_loss": -35.109561920166016, "global_step": 52642, "epoch": 435} {"train_loss": -35.033416748046875, "global_step": 52643, "epoch": 435} {"train_loss": -35.20821762084961, "global_step": 52644, "epoch": 435} {"train_loss": -35.287353515625, "global_step": 52645, "epoch": 435} {"train_loss": -34.92979049682617, "global_step": 52646, "epoch": 435} {"train_loss": -35.436073303222656, "global_step": 52647, "epoch": 435} {"train_loss": -35.19980239868164, "global_step": 52648, "epoch": 435} {"train_loss": -35.12166213989258, "global_step": 52649, "epoch": 435} {"train_loss": -35.706642150878906, "global_step": 52650, "epoch": 435} {"train_loss": -35.82411193847656, "global_step": 52651, "epoch": 435} {"train_loss": -35.49968338012695, "global_step": 52652, "epoch": 435} {"train_loss": -35.85062789916992, "global_step": 52653, "epoch": 435} {"train_loss": -36.044883728027344, "global_step": 52654, "epoch": 435} {"train_loss": -35.72917556762695, "global_step": 52655, "epoch": 435} {"train_loss": -35.84572982788086, "global_step": 52656, "epoch": 435} {"train_loss": -35.50394821166992, "global_step": 52657, "epoch": 435} {"train_loss": -35.29461669921875, "global_step": 52658, "epoch": 435} {"train_loss": -35.42902374267578, "global_step": 52659, "epoch": 435} {"train_loss": -35.18964767456055, "global_step": 52660, "epoch": 435} {"train_loss": -35.91503143310547, "global_step": 52661, "epoch": 435} {"train_loss": -35.27131271362305, "global_step": 52662, "epoch": 435} {"train_loss": -35.140872955322266, "global_step": 52663, "epoch": 435} {"train_loss": -35.38987350463867, "global_step": 52664, "epoch": 435} {"train_loss": -34.68476486206055, "global_step": 52665, "epoch": 435} {"train_loss": -34.41743469238281, "global_step": 52666, "epoch": 435} {"train_loss": -32.740684509277344, "global_step": 52667, "epoch": 435} {"train_loss": -29.40655517578125, "global_step": 52668, "epoch": 435} {"train_loss": -27.27753257751465, "global_step": 52669, "epoch": 435} {"train_loss": -33.79191207885742, "global_step": 52670, "epoch": 435} {"train_loss": -35.25532150268555, "global_step": 52671, "epoch": 435} {"train_loss": -31.560468673706055, "global_step": 52672, "epoch": 435} {"train_loss": -34.1126708984375, "global_step": 52673, "epoch": 435} {"train_loss": -34.04888916015625, "global_step": 52674, "epoch": 435} {"train_loss": -31.123929977416992, "global_step": 52675, "epoch": 435} {"train_loss": -35.16205978393555, "global_step": 52676, "epoch": 435} {"train_loss": -32.812713623046875, "global_step": 52677, "epoch": 435} {"train_loss": -34.99448776245117, "global_step": 52678, "epoch": 435} {"train_loss": -32.868526458740234, "global_step": 52679, "epoch": 435} {"train_loss": -34.18362045288086, "global_step": 52680, "epoch": 435} {"train_loss": -35.214534759521484, "global_step": 52681, "epoch": 435} {"train_loss": -34.17670822143555, "global_step": 52682, "epoch": 435} {"train_loss": -34.447425842285156, "global_step": 52683, "epoch": 435} {"train_loss": -34.68324661254883, "global_step": 52684, "epoch": 435} {"train_loss": -34.81504440307617, "global_step": 52685, "epoch": 435} {"train_loss": -35.22849655151367, "global_step": 52686, "epoch": 435} {"train_loss": -34.76675796508789, "global_step": 52687, "epoch": 435} {"train_loss": -35.01444625854492, "global_step": 52688, "epoch": 435} {"train_loss": -35.380123138427734, "global_step": 52689, "epoch": 435} {"train_loss": -35.41744613647461, "global_step": 52690, "epoch": 435} {"train_loss": -35.05257034301758, "global_step": 52691, "epoch": 435} {"train_loss": -34.94286346435547, "global_step": 52692, "epoch": 435} {"train_loss": -35.57670211791992, "global_step": 52693, "epoch": 435} {"train_loss": -35.01385498046875, "global_step": 52694, "epoch": 435} {"train_loss": -35.27838134765625, "global_step": 52695, "epoch": 435} {"train_loss": -35.26655197143555, "global_step": 52696, "epoch": 435} {"train_loss": -35.25852584838867, "global_step": 52697, "epoch": 435} {"train_loss": -35.580589294433594, "global_step": 52698, "epoch": 435} {"train_loss": -35.0257682800293, "global_step": 52699, "epoch": 435} {"train_loss": -35.011619567871094, "global_step": 52700, "epoch": 435} {"train_loss": -35.1715087890625, "global_step": 52701, "epoch": 435} {"train_loss": -34.96186065673828, "global_step": 52702, "epoch": 435} {"train_loss": -35.48303985595703, "global_step": 52703, "epoch": 435} {"train_loss": -35.176631927490234, "global_step": 52704, "epoch": 435} {"train_loss": -35.35595703125, "global_step": 52705, "epoch": 435} {"train_loss": -34.3648567199707, "global_step": 52706, "epoch": 435} {"train_loss": -34.5021858215332, "global_step": 52707, "epoch": 435} {"train_loss": -33.930206298828125, "global_step": 52708, "epoch": 435} {"train_loss": -28.16133689880371, "global_step": 52709, "epoch": 435} {"train_loss": -25.501243591308594, "global_step": 52710, "epoch": 435} {"train_loss": -27.072406768798828, "global_step": 52711, "epoch": 435} {"train_loss": -16.787946701049805, "global_step": 52712, "epoch": 435} {"train_loss": -33.45799255371094, "global_step": 52713, "epoch": 435} {"train_loss": -28.096242904663086, "global_step": 52714, "epoch": 435} {"train_loss": -29.62860107421875, "global_step": 52715, "epoch": 435} {"train_loss": -33.21710968017578, "global_step": 52716, "epoch": 435} {"train_loss": -32.57429122924805, "global_step": 52717, "epoch": 435} {"train_loss": -33.452880859375, "global_step": 52718, "epoch": 435} {"train_loss": -28.442230224609375, "global_step": 52719, "epoch": 435} {"train_loss": -33.9749870300293, "global_step": 52720, "epoch": 435} {"train_loss": -33.48771286010742, "global_step": 52721, "epoch": 435} {"train_loss": -32.30397415161133, "global_step": 52722, "epoch": 435} {"train_loss": -32.39482498168945, "global_step": 52723, "epoch": 435} {"train_loss": -30.98591423034668, "global_step": 52724, "epoch": 435} {"train_loss": -32.28387451171875, "global_step": 52725, "epoch": 435} {"train_loss": -33.449974060058594, "global_step": 52726, "epoch": 435} {"train_loss": -33.01792526245117, "global_step": 52727, "epoch": 435} {"train_loss": -33.442745208740234, "global_step": 52728, "epoch": 435} {"train_loss": -31.412708282470703, "global_step": 52729, "epoch": 435} {"train_loss": -32.910789489746094, "global_step": 52730, "epoch": 435} {"train_loss": -32.999874114990234, "global_step": 52731, "epoch": 435} {"train_loss": -34.014373779296875, "global_step": 52732, "epoch": 435} {"train_loss": -33.42832565307617, "global_step": 52733, "epoch": 435} {"train_loss": -33.50336837768555, "global_step": 52734, "epoch": 435} {"train_loss": -33.901851654052734, "global_step": 52735, "epoch": 435} {"train_loss": -33.931610107421875, "global_step": 52736, "epoch": 435} {"train_loss": -34.37204360961914, "global_step": 52737, "epoch": 435} {"train_loss": -34.31647872924805, "global_step": 52738, "epoch": 435} {"train_loss": -33.820953369140625, "global_step": 52739, "epoch": 435} {"train_loss": -34.082977294921875, "global_step": 52740, "epoch": 435} {"train_loss": -34.13979721069336, "global_step": 52741, "epoch": 435} {"train_loss": -34.16844177246094, "global_step": 52742, "epoch": 435} {"train_loss": -32.57609176635742, "global_step": 52743, "epoch": 435} {"train_loss": -34.19532775878906, "global_step": 52744, "epoch": 435} {"train_loss": -34.33226013183594, "global_step": 52745, "epoch": 435} {"train_loss": -34.66506576538086, "global_step": 52746, "epoch": 435} {"train_loss": -34.57229995727539, "global_step": 52747, "epoch": 435} {"train_loss": -33.60405349731445, "global_step": 52748, "epoch": 435} {"train_loss": -34.34541702270508, "global_step": 52749, "epoch": 435} {"train_loss": -34.78831100463867, "global_step": 52750, "epoch": 435} {"train_loss": -34.5404052734375, "global_step": 52751, "epoch": 435} {"train_loss": -34.67940902709961, "global_step": 52752, "epoch": 435} {"train_loss": -34.90726852416992, "global_step": 52753, "epoch": 435} {"train_loss": -34.542213439941406, "global_step": 52754, "epoch": 435} {"train_loss": -33.85231202495985, "global_step": 52755, "epoch": 435, "val_loss": 2598118.25} {"train_loss": -35.10347366333008, "global_step": 52756, "epoch": 436} {"train_loss": -34.84562301635742, "global_step": 52757, "epoch": 436} {"train_loss": -33.68463134765625, "global_step": 52758, "epoch": 436} {"train_loss": -34.748634338378906, "global_step": 52759, "epoch": 436} {"train_loss": -35.341064453125, "global_step": 52760, "epoch": 436} {"train_loss": -34.44344711303711, "global_step": 52761, "epoch": 436} {"train_loss": -35.04069137573242, "global_step": 52762, "epoch": 436} {"train_loss": -34.67491149902344, "global_step": 52763, "epoch": 436} {"train_loss": -34.08673858642578, "global_step": 52764, "epoch": 436} {"train_loss": -34.43153762817383, "global_step": 52765, "epoch": 436} {"train_loss": -34.67362594604492, "global_step": 52766, "epoch": 436} {"train_loss": -34.661441802978516, "global_step": 52767, "epoch": 436} {"train_loss": -34.719520568847656, "global_step": 52768, "epoch": 436} {"train_loss": -34.5129508972168, "global_step": 52769, "epoch": 436} {"train_loss": -30.25884437561035, "global_step": 52770, "epoch": 436} {"train_loss": -34.37367630004883, "global_step": 52771, "epoch": 436} {"train_loss": -35.046600341796875, "global_step": 52772, "epoch": 436} {"train_loss": -34.015628814697266, "global_step": 52773, "epoch": 436} {"train_loss": -33.61677169799805, "global_step": 52774, "epoch": 436} {"train_loss": -33.191253662109375, "global_step": 52775, "epoch": 436} {"train_loss": -33.8152961730957, "global_step": 52776, "epoch": 436} {"train_loss": -33.6225700378418, "global_step": 52777, "epoch": 436} {"train_loss": -31.3394718170166, "global_step": 52778, "epoch": 436} {"train_loss": -33.757781982421875, "global_step": 52779, "epoch": 436} {"train_loss": -32.87504577636719, "global_step": 52780, "epoch": 436} {"train_loss": -31.687255859375, "global_step": 52781, "epoch": 436} {"train_loss": -33.2739372253418, "global_step": 52782, "epoch": 436} {"train_loss": -32.9043083190918, "global_step": 52783, "epoch": 436} {"train_loss": -34.286685943603516, "global_step": 52784, "epoch": 436} {"train_loss": -31.653913497924805, "global_step": 52785, "epoch": 436} {"train_loss": -33.17240905761719, "global_step": 52786, "epoch": 436} {"train_loss": -32.732540130615234, "global_step": 52787, "epoch": 436} {"train_loss": -33.441646575927734, "global_step": 52788, "epoch": 436} {"train_loss": -33.84078598022461, "global_step": 52789, "epoch": 436} {"train_loss": -33.52184295654297, "global_step": 52790, "epoch": 436} {"train_loss": -33.30373764038086, "global_step": 52791, "epoch": 436} {"train_loss": -33.52507400512695, "global_step": 52792, "epoch": 436} {"train_loss": -32.239784240722656, "global_step": 52793, "epoch": 436} {"train_loss": -33.8936767578125, "global_step": 52794, "epoch": 436} {"train_loss": -33.69422149658203, "global_step": 52795, "epoch": 436} {"train_loss": -32.07490158081055, "global_step": 52796, "epoch": 436} {"train_loss": -33.9521484375, "global_step": 52797, "epoch": 436} {"train_loss": -33.75112533569336, "global_step": 52798, "epoch": 436} {"train_loss": -34.04226303100586, "global_step": 52799, "epoch": 436} {"train_loss": -34.50421905517578, "global_step": 52800, "epoch": 436} {"train_loss": -34.181724548339844, "global_step": 52801, "epoch": 436} {"train_loss": -34.23986053466797, "global_step": 52802, "epoch": 436} {"train_loss": -34.29024887084961, "global_step": 52803, "epoch": 436} {"train_loss": -33.8028450012207, "global_step": 52804, "epoch": 436} {"train_loss": -33.44660186767578, "global_step": 52805, "epoch": 436} {"train_loss": -34.35398483276367, "global_step": 52806, "epoch": 436} {"train_loss": -34.516727447509766, "global_step": 52807, "epoch": 436} {"train_loss": -33.68901443481445, "global_step": 52808, "epoch": 436} {"train_loss": -34.524166107177734, "global_step": 52809, "epoch": 436} {"train_loss": -34.48965835571289, "global_step": 52810, "epoch": 436} {"train_loss": -34.563392639160156, "global_step": 52811, "epoch": 436} {"train_loss": -34.5574836730957, "global_step": 52812, "epoch": 436} {"train_loss": -34.08906173706055, "global_step": 52813, "epoch": 436} {"train_loss": -34.02006912231445, "global_step": 52814, "epoch": 436} {"train_loss": -34.23622512817383, "global_step": 52815, "epoch": 436} {"train_loss": -34.50373077392578, "global_step": 52816, "epoch": 436} {"train_loss": -35.0150032043457, "global_step": 52817, "epoch": 436} {"train_loss": -34.80226516723633, "global_step": 52818, "epoch": 436} {"train_loss": -34.37537384033203, "global_step": 52819, "epoch": 436} {"train_loss": -34.978546142578125, "global_step": 52820, "epoch": 436} {"train_loss": -34.84432601928711, "global_step": 52821, "epoch": 436} {"train_loss": -34.60518264770508, "global_step": 52822, "epoch": 436} {"train_loss": -34.69021224975586, "global_step": 52823, "epoch": 436} {"train_loss": -34.84360885620117, "global_step": 52824, "epoch": 436} {"train_loss": -34.68240737915039, "global_step": 52825, "epoch": 436} {"train_loss": -34.97005081176758, "global_step": 52826, "epoch": 436} {"train_loss": -34.38595199584961, "global_step": 52827, "epoch": 436} {"train_loss": -35.29728698730469, "global_step": 52828, "epoch": 436} {"train_loss": -34.99732208251953, "global_step": 52829, "epoch": 436} {"train_loss": -35.4088249206543, "global_step": 52830, "epoch": 436} {"train_loss": -35.360435485839844, "global_step": 52831, "epoch": 436} {"train_loss": -35.54407501220703, "global_step": 52832, "epoch": 436} {"train_loss": -34.816017150878906, "global_step": 52833, "epoch": 436} {"train_loss": -34.83881378173828, "global_step": 52834, "epoch": 436} {"train_loss": -35.04292678833008, "global_step": 52835, "epoch": 436} {"train_loss": -34.1806755065918, "global_step": 52836, "epoch": 436} {"train_loss": -33.77112579345703, "global_step": 52837, "epoch": 436} {"train_loss": -33.06965255737305, "global_step": 52838, "epoch": 436} {"train_loss": -34.14052200317383, "global_step": 52839, "epoch": 436} {"train_loss": -35.11751937866211, "global_step": 52840, "epoch": 436} {"train_loss": -35.5295524597168, "global_step": 52841, "epoch": 436} {"train_loss": -35.798194885253906, "global_step": 52842, "epoch": 436} {"train_loss": -35.34400177001953, "global_step": 52843, "epoch": 436} {"train_loss": -35.3593864440918, "global_step": 52844, "epoch": 436} {"train_loss": -34.262367248535156, "global_step": 52845, "epoch": 436} {"train_loss": -32.42110824584961, "global_step": 52846, "epoch": 436} {"train_loss": -31.111303329467773, "global_step": 52847, "epoch": 436} {"train_loss": -34.120845794677734, "global_step": 52848, "epoch": 436} {"train_loss": -35.02122116088867, "global_step": 52849, "epoch": 436} {"train_loss": -32.971309661865234, "global_step": 52850, "epoch": 436} {"train_loss": -33.8994255065918, "global_step": 52851, "epoch": 436} {"train_loss": -35.5267333984375, "global_step": 52852, "epoch": 436} {"train_loss": -34.24872970581055, "global_step": 52853, "epoch": 436} {"train_loss": -33.48087692260742, "global_step": 52854, "epoch": 436} {"train_loss": -34.7939567565918, "global_step": 52855, "epoch": 436} {"train_loss": -33.83706283569336, "global_step": 52856, "epoch": 436} {"train_loss": -34.93296432495117, "global_step": 52857, "epoch": 436} {"train_loss": -35.0899543762207, "global_step": 52858, "epoch": 436} {"train_loss": -34.72750473022461, "global_step": 52859, "epoch": 436} {"train_loss": -34.6185417175293, "global_step": 52860, "epoch": 436} {"train_loss": -33.809574127197266, "global_step": 52861, "epoch": 436} {"train_loss": -34.76412582397461, "global_step": 52862, "epoch": 436} {"train_loss": -35.665035247802734, "global_step": 52863, "epoch": 436} {"train_loss": -35.50101852416992, "global_step": 52864, "epoch": 436} {"train_loss": -35.505550384521484, "global_step": 52865, "epoch": 436} {"train_loss": -34.684139251708984, "global_step": 52866, "epoch": 436} {"train_loss": -35.32343673706055, "global_step": 52867, "epoch": 436} {"train_loss": -34.4504508972168, "global_step": 52868, "epoch": 436} {"train_loss": -35.8439826965332, "global_step": 52869, "epoch": 436} {"train_loss": -34.99319076538086, "global_step": 52870, "epoch": 436} {"train_loss": -35.124183654785156, "global_step": 52871, "epoch": 436} {"train_loss": -35.80315017700195, "global_step": 52872, "epoch": 436} {"train_loss": -35.17824172973633, "global_step": 52873, "epoch": 436} {"train_loss": -35.12942123413086, "global_step": 52874, "epoch": 436} {"train_loss": -35.673240661621094, "global_step": 52875, "epoch": 436} {"train_loss": -34.269387394928735, "global_step": 52876, "epoch": 436, "val_loss": 2592592.25} {"train_loss": -35.6230354309082, "global_step": 52877, "epoch": 437} {"train_loss": -35.03389358520508, "global_step": 52878, "epoch": 437} {"train_loss": -35.43503952026367, "global_step": 52879, "epoch": 437} {"train_loss": -35.809383392333984, "global_step": 52880, "epoch": 437} {"train_loss": -35.568687438964844, "global_step": 52881, "epoch": 437} {"train_loss": -35.96717834472656, "global_step": 52882, "epoch": 437} {"train_loss": -35.93979263305664, "global_step": 52883, "epoch": 437} {"train_loss": -35.751380920410156, "global_step": 52884, "epoch": 437} {"train_loss": -35.8051872253418, "global_step": 52885, "epoch": 437} {"train_loss": -35.85451126098633, "global_step": 52886, "epoch": 437} {"train_loss": -35.5955810546875, "global_step": 52887, "epoch": 437} {"train_loss": -35.880706787109375, "global_step": 52888, "epoch": 437} {"train_loss": -35.20643997192383, "global_step": 52889, "epoch": 437} {"train_loss": -35.78400802612305, "global_step": 52890, "epoch": 437} {"train_loss": -35.88612747192383, "global_step": 52891, "epoch": 437} {"train_loss": -35.74858093261719, "global_step": 52892, "epoch": 437} {"train_loss": -35.99300765991211, "global_step": 52893, "epoch": 437} {"train_loss": -35.095497131347656, "global_step": 52894, "epoch": 437} {"train_loss": -35.28447341918945, "global_step": 52895, "epoch": 437} {"train_loss": -36.369415283203125, "global_step": 52896, "epoch": 437} {"train_loss": -35.736148834228516, "global_step": 52897, "epoch": 437} {"train_loss": -34.05155563354492, "global_step": 52898, "epoch": 437} {"train_loss": -33.391178131103516, "global_step": 52899, "epoch": 437} {"train_loss": -32.73582077026367, "global_step": 52900, "epoch": 437} {"train_loss": -31.033981323242188, "global_step": 52901, "epoch": 437} {"train_loss": -30.893783569335938, "global_step": 52902, "epoch": 437} {"train_loss": -32.932952880859375, "global_step": 52903, "epoch": 437} {"train_loss": -34.61204147338867, "global_step": 52904, "epoch": 437} {"train_loss": -32.44120407104492, "global_step": 52905, "epoch": 437} {"train_loss": -28.953369140625, "global_step": 52906, "epoch": 437} {"train_loss": -32.4669189453125, "global_step": 52907, "epoch": 437} {"train_loss": -34.914306640625, "global_step": 52908, "epoch": 437} {"train_loss": -34.1413459777832, "global_step": 52909, "epoch": 437} {"train_loss": -33.57246017456055, "global_step": 52910, "epoch": 437} {"train_loss": -34.650489807128906, "global_step": 52911, "epoch": 437} {"train_loss": -34.21360397338867, "global_step": 52912, "epoch": 437} {"train_loss": -33.91738510131836, "global_step": 52913, "epoch": 437} {"train_loss": -34.623870849609375, "global_step": 52914, "epoch": 437} {"train_loss": -33.000274658203125, "global_step": 52915, "epoch": 437} {"train_loss": -34.92728805541992, "global_step": 52916, "epoch": 437} {"train_loss": -34.854061126708984, "global_step": 52917, "epoch": 437} {"train_loss": -34.70246505737305, "global_step": 52918, "epoch": 437} {"train_loss": -34.65815353393555, "global_step": 52919, "epoch": 437} {"train_loss": -33.7824592590332, "global_step": 52920, "epoch": 437} {"train_loss": -34.2156982421875, "global_step": 52921, "epoch": 437} {"train_loss": -35.16652297973633, "global_step": 52922, "epoch": 437} {"train_loss": -33.103328704833984, "global_step": 52923, "epoch": 437} {"train_loss": -34.58393096923828, "global_step": 52924, "epoch": 437} {"train_loss": -33.38734817504883, "global_step": 52925, "epoch": 437} {"train_loss": -34.79817581176758, "global_step": 52926, "epoch": 437} {"train_loss": -34.86930465698242, "global_step": 52927, "epoch": 437} {"train_loss": -33.341705322265625, "global_step": 52928, "epoch": 437} {"train_loss": -34.173240661621094, "global_step": 52929, "epoch": 437} {"train_loss": -34.69350051879883, "global_step": 52930, "epoch": 437} {"train_loss": -34.42818832397461, "global_step": 52931, "epoch": 437} {"train_loss": -34.37845993041992, "global_step": 52932, "epoch": 437} {"train_loss": -34.4830322265625, "global_step": 52933, "epoch": 437} {"train_loss": -34.64582824707031, "global_step": 52934, "epoch": 437} {"train_loss": -33.88778305053711, "global_step": 52935, "epoch": 437} {"train_loss": -34.4042854309082, "global_step": 52936, "epoch": 437} {"train_loss": -34.68160629272461, "global_step": 52937, "epoch": 437} {"train_loss": -34.726314544677734, "global_step": 52938, "epoch": 437} {"train_loss": -35.406959533691406, "global_step": 52939, "epoch": 437} {"train_loss": -34.36640548706055, "global_step": 52940, "epoch": 437} {"train_loss": -34.81767272949219, "global_step": 52941, "epoch": 437} {"train_loss": -35.59323501586914, "global_step": 52942, "epoch": 437} {"train_loss": -34.45777893066406, "global_step": 52943, "epoch": 437} {"train_loss": -34.11782455444336, "global_step": 52944, "epoch": 437} {"train_loss": -34.94742965698242, "global_step": 52945, "epoch": 437} {"train_loss": -34.56288528442383, "global_step": 52946, "epoch": 437} {"train_loss": -35.114540100097656, "global_step": 52947, "epoch": 437} {"train_loss": -34.762603759765625, "global_step": 52948, "epoch": 437} {"train_loss": -34.753387451171875, "global_step": 52949, "epoch": 437} {"train_loss": -35.371795654296875, "global_step": 52950, "epoch": 437} {"train_loss": -35.087615966796875, "global_step": 52951, "epoch": 437} {"train_loss": -35.45785140991211, "global_step": 52952, "epoch": 437} {"train_loss": -34.83772659301758, "global_step": 52953, "epoch": 437} {"train_loss": -35.82581329345703, "global_step": 52954, "epoch": 437} {"train_loss": -35.421932220458984, "global_step": 52955, "epoch": 437} {"train_loss": -34.89398956298828, "global_step": 52956, "epoch": 437} {"train_loss": -35.540618896484375, "global_step": 52957, "epoch": 437} {"train_loss": -35.02293395996094, "global_step": 52958, "epoch": 437} {"train_loss": -35.298587799072266, "global_step": 52959, "epoch": 437} {"train_loss": -35.142250061035156, "global_step": 52960, "epoch": 437} {"train_loss": -35.120391845703125, "global_step": 52961, "epoch": 437} {"train_loss": -35.594139099121094, "global_step": 52962, "epoch": 437} {"train_loss": -35.46065902709961, "global_step": 52963, "epoch": 437} {"train_loss": -35.6893310546875, "global_step": 52964, "epoch": 437} {"train_loss": -34.812843322753906, "global_step": 52965, "epoch": 437} {"train_loss": -35.26052474975586, "global_step": 52966, "epoch": 437} {"train_loss": -34.79474639892578, "global_step": 52967, "epoch": 437} {"train_loss": -32.8627815246582, "global_step": 52968, "epoch": 437} {"train_loss": -33.871150970458984, "global_step": 52969, "epoch": 437} {"train_loss": -33.748023986816406, "global_step": 52970, "epoch": 437} {"train_loss": -33.9273796081543, "global_step": 52971, "epoch": 437} {"train_loss": -33.86879348754883, "global_step": 52972, "epoch": 437} {"train_loss": -34.19782638549805, "global_step": 52973, "epoch": 437} {"train_loss": -34.102230072021484, "global_step": 52974, "epoch": 437} {"train_loss": -34.609195709228516, "global_step": 52975, "epoch": 437} {"train_loss": -35.460906982421875, "global_step": 52976, "epoch": 437} {"train_loss": -34.95940399169922, "global_step": 52977, "epoch": 437} {"train_loss": -34.786983489990234, "global_step": 52978, "epoch": 437} {"train_loss": -36.141357421875, "global_step": 52979, "epoch": 437} {"train_loss": -34.99323654174805, "global_step": 52980, "epoch": 437} {"train_loss": -35.03090286254883, "global_step": 52981, "epoch": 437} {"train_loss": -35.8408203125, "global_step": 52982, "epoch": 437} {"train_loss": -35.08369827270508, "global_step": 52983, "epoch": 437} {"train_loss": -35.21567916870117, "global_step": 52984, "epoch": 437} {"train_loss": -35.67325973510742, "global_step": 52985, "epoch": 437} {"train_loss": -35.908241271972656, "global_step": 52986, "epoch": 437} {"train_loss": -35.658809661865234, "global_step": 52987, "epoch": 437} {"train_loss": -35.79863739013672, "global_step": 52988, "epoch": 437} {"train_loss": -35.9249153137207, "global_step": 52989, "epoch": 437} {"train_loss": -36.28334426879883, "global_step": 52990, "epoch": 437} {"train_loss": -35.865081787109375, "global_step": 52991, "epoch": 437} {"train_loss": -36.272151947021484, "global_step": 52992, "epoch": 437} {"train_loss": -35.737060546875, "global_step": 52993, "epoch": 437} {"train_loss": -35.369842529296875, "global_step": 52994, "epoch": 437} {"train_loss": -36.33683395385742, "global_step": 52995, "epoch": 437} {"train_loss": -36.324371337890625, "global_step": 52996, "epoch": 437} {"train_loss": -34.79589705033736, "global_step": 52997, "epoch": 437, "val_loss": 2588190.75} {"train_loss": -35.52809524536133, "global_step": 52998, "epoch": 438} {"train_loss": -35.858123779296875, "global_step": 52999, "epoch": 438} {"train_loss": -35.6799430847168, "global_step": 53000, "epoch": 438} {"train_loss": -35.88499069213867, "global_step": 53001, "epoch": 438} {"train_loss": -35.952449798583984, "global_step": 53002, "epoch": 438} {"train_loss": -35.986507415771484, "global_step": 53003, "epoch": 438} {"train_loss": -34.969566345214844, "global_step": 53004, "epoch": 438} {"train_loss": -35.790992736816406, "global_step": 53005, "epoch": 438} {"train_loss": -35.74565505981445, "global_step": 53006, "epoch": 438} {"train_loss": -35.67512130737305, "global_step": 53007, "epoch": 438} {"train_loss": -36.01225280761719, "global_step": 53008, "epoch": 438} {"train_loss": -35.85010528564453, "global_step": 53009, "epoch": 438} {"train_loss": -34.03567123413086, "global_step": 53010, "epoch": 438} {"train_loss": -35.74919509887695, "global_step": 53011, "epoch": 438} {"train_loss": -36.30320358276367, "global_step": 53012, "epoch": 438} {"train_loss": -36.202327728271484, "global_step": 53013, "epoch": 438} {"train_loss": -36.31943893432617, "global_step": 53014, "epoch": 438} {"train_loss": -35.62255096435547, "global_step": 53015, "epoch": 438} {"train_loss": -35.998374938964844, "global_step": 53016, "epoch": 438} {"train_loss": -36.20353317260742, "global_step": 53017, "epoch": 438} {"train_loss": -36.15892791748047, "global_step": 53018, "epoch": 438} {"train_loss": -36.46273422241211, "global_step": 53019, "epoch": 438} {"train_loss": -36.184967041015625, "global_step": 53020, "epoch": 438} {"train_loss": -35.851959228515625, "global_step": 53021, "epoch": 438} {"train_loss": -36.309146881103516, "global_step": 53022, "epoch": 438} {"train_loss": -35.445804595947266, "global_step": 53023, "epoch": 438} {"train_loss": -35.56570053100586, "global_step": 53024, "epoch": 438} {"train_loss": -35.908817291259766, "global_step": 53025, "epoch": 438} {"train_loss": -35.96116256713867, "global_step": 53026, "epoch": 438} {"train_loss": -36.293701171875, "global_step": 53027, "epoch": 438} {"train_loss": -35.89530944824219, "global_step": 53028, "epoch": 438} {"train_loss": -35.51645278930664, "global_step": 53029, "epoch": 438} {"train_loss": -35.00307846069336, "global_step": 53030, "epoch": 438} {"train_loss": -34.76034164428711, "global_step": 53031, "epoch": 438} {"train_loss": -34.49953079223633, "global_step": 53032, "epoch": 438} {"train_loss": -35.03456497192383, "global_step": 53033, "epoch": 438} {"train_loss": -34.9729118347168, "global_step": 53034, "epoch": 438} {"train_loss": -21.974470138549805, "global_step": 53035, "epoch": 438} {"train_loss": -33.06106185913086, "global_step": 53036, "epoch": 438} {"train_loss": -32.577003479003906, "global_step": 53037, "epoch": 438} {"train_loss": -21.134977340698242, "global_step": 53038, "epoch": 438} {"train_loss": -13.730006217956543, "global_step": 53039, "epoch": 438} {"train_loss": -15.907519340515137, "global_step": 53040, "epoch": 438} {"train_loss": -10.726229667663574, "global_step": 53041, "epoch": 438} {"train_loss": -27.070714950561523, "global_step": 53042, "epoch": 438} {"train_loss": -21.80792236328125, "global_step": 53043, "epoch": 438} {"train_loss": -23.354612350463867, "global_step": 53044, "epoch": 438} {"train_loss": -23.86043930053711, "global_step": 53045, "epoch": 438} {"train_loss": -29.260061264038086, "global_step": 53046, "epoch": 438} {"train_loss": -23.314685821533203, "global_step": 53047, "epoch": 438} {"train_loss": -29.04559326171875, "global_step": 53048, "epoch": 438} {"train_loss": -27.53435707092285, "global_step": 53049, "epoch": 438} {"train_loss": -25.417783737182617, "global_step": 53050, "epoch": 438} {"train_loss": -31.45293617248535, "global_step": 53051, "epoch": 438} {"train_loss": -29.270883560180664, "global_step": 53052, "epoch": 438} {"train_loss": -30.24869728088379, "global_step": 53053, "epoch": 438} {"train_loss": -30.376800537109375, "global_step": 53054, "epoch": 438} {"train_loss": -31.563953399658203, "global_step": 53055, "epoch": 438} {"train_loss": -30.553022384643555, "global_step": 53056, "epoch": 438} {"train_loss": -30.74506187438965, "global_step": 53057, "epoch": 438} {"train_loss": -32.243064880371094, "global_step": 53058, "epoch": 438} {"train_loss": -31.699811935424805, "global_step": 53059, "epoch": 438} {"train_loss": -31.733997344970703, "global_step": 53060, "epoch": 438} {"train_loss": -31.67494773864746, "global_step": 53061, "epoch": 438} {"train_loss": -32.14237976074219, "global_step": 53062, "epoch": 438} {"train_loss": -31.921228408813477, "global_step": 53063, "epoch": 438} {"train_loss": -31.5631160736084, "global_step": 53064, "epoch": 438} {"train_loss": -32.2845344543457, "global_step": 53065, "epoch": 438} {"train_loss": -32.15813064575195, "global_step": 53066, "epoch": 438} {"train_loss": -32.47615432739258, "global_step": 53067, "epoch": 438} {"train_loss": -32.248207092285156, "global_step": 53068, "epoch": 438} {"train_loss": -31.87409782409668, "global_step": 53069, "epoch": 438} {"train_loss": -32.84070587158203, "global_step": 53070, "epoch": 438} {"train_loss": -32.881439208984375, "global_step": 53071, "epoch": 438} {"train_loss": -32.22671127319336, "global_step": 53072, "epoch": 438} {"train_loss": -32.9239616394043, "global_step": 53073, "epoch": 438} {"train_loss": -32.99751663208008, "global_step": 53074, "epoch": 438} {"train_loss": -32.9222526550293, "global_step": 53075, "epoch": 438} {"train_loss": -32.7978630065918, "global_step": 53076, "epoch": 438} {"train_loss": -33.168697357177734, "global_step": 53077, "epoch": 438} {"train_loss": -33.215938568115234, "global_step": 53078, "epoch": 438} {"train_loss": -32.375545501708984, "global_step": 53079, "epoch": 438} {"train_loss": -33.266544342041016, "global_step": 53080, "epoch": 438} {"train_loss": -33.119468688964844, "global_step": 53081, "epoch": 438} {"train_loss": -33.03550720214844, "global_step": 53082, "epoch": 438} {"train_loss": -33.45158767700195, "global_step": 53083, "epoch": 438} {"train_loss": -33.37104415893555, "global_step": 53084, "epoch": 438} {"train_loss": -33.501949310302734, "global_step": 53085, "epoch": 438} {"train_loss": -33.12044906616211, "global_step": 53086, "epoch": 438} {"train_loss": -33.28535079956055, "global_step": 53087, "epoch": 438} {"train_loss": -33.66189193725586, "global_step": 53088, "epoch": 438} {"train_loss": -33.43029022216797, "global_step": 53089, "epoch": 438} {"train_loss": -33.795406341552734, "global_step": 53090, "epoch": 438} {"train_loss": -33.18925094604492, "global_step": 53091, "epoch": 438} {"train_loss": -33.567012786865234, "global_step": 53092, "epoch": 438} {"train_loss": -33.55369567871094, "global_step": 53093, "epoch": 438} {"train_loss": -33.703304290771484, "global_step": 53094, "epoch": 438} {"train_loss": -33.95000076293945, "global_step": 53095, "epoch": 438} {"train_loss": -33.897422790527344, "global_step": 53096, "epoch": 438} {"train_loss": -34.143619537353516, "global_step": 53097, "epoch": 438} {"train_loss": -34.025569915771484, "global_step": 53098, "epoch": 438} {"train_loss": -33.917701721191406, "global_step": 53099, "epoch": 438} {"train_loss": -33.954586029052734, "global_step": 53100, "epoch": 438} {"train_loss": -34.405731201171875, "global_step": 53101, "epoch": 438} {"train_loss": -34.148860931396484, "global_step": 53102, "epoch": 438} {"train_loss": -34.11600875854492, "global_step": 53103, "epoch": 438} {"train_loss": -33.96057891845703, "global_step": 53104, "epoch": 438} {"train_loss": -34.30120086669922, "global_step": 53105, "epoch": 438} {"train_loss": -34.18426513671875, "global_step": 53106, "epoch": 438} {"train_loss": -34.64712142944336, "global_step": 53107, "epoch": 438} {"train_loss": -34.55659866333008, "global_step": 53108, "epoch": 438} {"train_loss": -34.52531814575195, "global_step": 53109, "epoch": 438} {"train_loss": -34.409969329833984, "global_step": 53110, "epoch": 438} {"train_loss": -34.48484420776367, "global_step": 53111, "epoch": 438} {"train_loss": -34.69619369506836, "global_step": 53112, "epoch": 438} {"train_loss": -34.636356353759766, "global_step": 53113, "epoch": 438} {"train_loss": -34.75370788574219, "global_step": 53114, "epoch": 438} {"train_loss": -34.58758544921875, "global_step": 53115, "epoch": 438} {"train_loss": -35.058448791503906, "global_step": 53116, "epoch": 438} {"train_loss": -34.9654655456543, "global_step": 53117, "epoch": 438} {"train_loss": -32.675527801198406, "global_step": 53118, "epoch": 438, "val_loss": 2628343.75} {"train_loss": -34.94303512573242, "global_step": 53119, "epoch": 439} {"train_loss": -35.194244384765625, "global_step": 53120, "epoch": 439} {"train_loss": -35.282676696777344, "global_step": 53121, "epoch": 439} {"train_loss": -35.090545654296875, "global_step": 53122, "epoch": 439} {"train_loss": -35.09682846069336, "global_step": 53123, "epoch": 439} {"train_loss": -33.77042007446289, "global_step": 53124, "epoch": 439} {"train_loss": -33.74833679199219, "global_step": 53125, "epoch": 439} {"train_loss": -33.788639068603516, "global_step": 53126, "epoch": 439} {"train_loss": -35.08091354370117, "global_step": 53127, "epoch": 439} {"train_loss": -35.46725082397461, "global_step": 53128, "epoch": 439} {"train_loss": -34.42281723022461, "global_step": 53129, "epoch": 439} {"train_loss": -31.85699462890625, "global_step": 53130, "epoch": 439} {"train_loss": -30.25711441040039, "global_step": 53131, "epoch": 439} {"train_loss": -30.489667892456055, "global_step": 53132, "epoch": 439} {"train_loss": -30.409713745117188, "global_step": 53133, "epoch": 439} {"train_loss": -33.721649169921875, "global_step": 53134, "epoch": 439} {"train_loss": -34.627235412597656, "global_step": 53135, "epoch": 439} {"train_loss": -31.908130645751953, "global_step": 53136, "epoch": 439} {"train_loss": -33.49394607543945, "global_step": 53137, "epoch": 439} {"train_loss": -34.90857696533203, "global_step": 53138, "epoch": 439} {"train_loss": -32.862144470214844, "global_step": 53139, "epoch": 439} {"train_loss": -34.20811080932617, "global_step": 53140, "epoch": 439} {"train_loss": -33.52676010131836, "global_step": 53141, "epoch": 439} {"train_loss": -33.304622650146484, "global_step": 53142, "epoch": 439} {"train_loss": -34.60988235473633, "global_step": 53143, "epoch": 439} {"train_loss": -34.1559944152832, "global_step": 53144, "epoch": 439} {"train_loss": -35.309242248535156, "global_step": 53145, "epoch": 439} {"train_loss": -33.86223220825195, "global_step": 53146, "epoch": 439} {"train_loss": -34.79160690307617, "global_step": 53147, "epoch": 439} {"train_loss": -34.336727142333984, "global_step": 53148, "epoch": 439} {"train_loss": -34.69291687011719, "global_step": 53149, "epoch": 439} {"train_loss": -34.57124710083008, "global_step": 53150, "epoch": 439} {"train_loss": -34.54938507080078, "global_step": 53151, "epoch": 439} {"train_loss": -34.93294906616211, "global_step": 53152, "epoch": 439} {"train_loss": -35.190914154052734, "global_step": 53153, "epoch": 439} {"train_loss": -34.41304397583008, "global_step": 53154, "epoch": 439} {"train_loss": -35.72316360473633, "global_step": 53155, "epoch": 439} {"train_loss": -35.28737258911133, "global_step": 53156, "epoch": 439} {"train_loss": -35.11056137084961, "global_step": 53157, "epoch": 439} {"train_loss": -35.15260314941406, "global_step": 53158, "epoch": 439} {"train_loss": -35.06889724731445, "global_step": 53159, "epoch": 439} {"train_loss": -35.561824798583984, "global_step": 53160, "epoch": 439} {"train_loss": -35.57806396484375, "global_step": 53161, "epoch": 439} {"train_loss": -35.71613311767578, "global_step": 53162, "epoch": 439} {"train_loss": -35.957576751708984, "global_step": 53163, "epoch": 439} {"train_loss": -35.46813201904297, "global_step": 53164, "epoch": 439} {"train_loss": -35.20425033569336, "global_step": 53165, "epoch": 439} {"train_loss": -35.35673522949219, "global_step": 53166, "epoch": 439} {"train_loss": -34.9729118347168, "global_step": 53167, "epoch": 439} {"train_loss": -35.11045837402344, "global_step": 53168, "epoch": 439} {"train_loss": -35.677734375, "global_step": 53169, "epoch": 439} {"train_loss": -35.85744857788086, "global_step": 53170, "epoch": 439} {"train_loss": -35.612735748291016, "global_step": 53171, "epoch": 439} {"train_loss": -35.929622650146484, "global_step": 53172, "epoch": 439} {"train_loss": -35.43408203125, "global_step": 53173, "epoch": 439} {"train_loss": -35.53750228881836, "global_step": 53174, "epoch": 439} {"train_loss": -35.69960403442383, "global_step": 53175, "epoch": 439} {"train_loss": -35.803157806396484, "global_step": 53176, "epoch": 439} {"train_loss": -35.88689041137695, "global_step": 53177, "epoch": 439} {"train_loss": -35.80558395385742, "global_step": 53178, "epoch": 439} {"train_loss": -35.2419319152832, "global_step": 53179, "epoch": 439} {"train_loss": -34.99856185913086, "global_step": 53180, "epoch": 439} {"train_loss": -35.027618408203125, "global_step": 53181, "epoch": 439} {"train_loss": -35.05317306518555, "global_step": 53182, "epoch": 439} {"train_loss": -35.85382080078125, "global_step": 53183, "epoch": 439} {"train_loss": -36.1584587097168, "global_step": 53184, "epoch": 439} {"train_loss": -35.665042877197266, "global_step": 53185, "epoch": 439} {"train_loss": -35.91324996948242, "global_step": 53186, "epoch": 439} {"train_loss": -36.094398498535156, "global_step": 53187, "epoch": 439} {"train_loss": -35.50941467285156, "global_step": 53188, "epoch": 439} {"train_loss": -33.27128982543945, "global_step": 53189, "epoch": 439} {"train_loss": -28.35259437561035, "global_step": 53190, "epoch": 439} {"train_loss": -20.615007400512695, "global_step": 53191, "epoch": 439} {"train_loss": -15.388340950012207, "global_step": 53192, "epoch": 439} {"train_loss": -28.364164352416992, "global_step": 53193, "epoch": 439} {"train_loss": -34.451969146728516, "global_step": 53194, "epoch": 439} {"train_loss": -30.919666290283203, "global_step": 53195, "epoch": 439} {"train_loss": -34.077674865722656, "global_step": 53196, "epoch": 439} {"train_loss": -32.47404098510742, "global_step": 53197, "epoch": 439} {"train_loss": -32.94039535522461, "global_step": 53198, "epoch": 439} {"train_loss": -34.1983757019043, "global_step": 53199, "epoch": 439} {"train_loss": -33.597286224365234, "global_step": 53200, "epoch": 439} {"train_loss": -35.21090316772461, "global_step": 53201, "epoch": 439} {"train_loss": -34.439666748046875, "global_step": 53202, "epoch": 439} {"train_loss": -34.17311477661133, "global_step": 53203, "epoch": 439} {"train_loss": -34.76299285888672, "global_step": 53204, "epoch": 439} {"train_loss": -34.46215057373047, "global_step": 53205, "epoch": 439} {"train_loss": -34.54269790649414, "global_step": 53206, "epoch": 439} {"train_loss": -34.88603591918945, "global_step": 53207, "epoch": 439} {"train_loss": -35.22015380859375, "global_step": 53208, "epoch": 439} {"train_loss": -35.31362533569336, "global_step": 53209, "epoch": 439} {"train_loss": -35.46075439453125, "global_step": 53210, "epoch": 439} {"train_loss": -35.1373176574707, "global_step": 53211, "epoch": 439} {"train_loss": -35.14603042602539, "global_step": 53212, "epoch": 439} {"train_loss": -35.534149169921875, "global_step": 53213, "epoch": 439} {"train_loss": -35.222015380859375, "global_step": 53214, "epoch": 439} {"train_loss": -35.169952392578125, "global_step": 53215, "epoch": 439} {"train_loss": -35.19219970703125, "global_step": 53216, "epoch": 439} {"train_loss": -35.5089225769043, "global_step": 53217, "epoch": 439} {"train_loss": -35.35783004760742, "global_step": 53218, "epoch": 439} {"train_loss": -35.26265335083008, "global_step": 53219, "epoch": 439} {"train_loss": -35.42271041870117, "global_step": 53220, "epoch": 439} {"train_loss": -35.747562408447266, "global_step": 53221, "epoch": 439} {"train_loss": -35.66643142700195, "global_step": 53222, "epoch": 439} {"train_loss": -35.673519134521484, "global_step": 53223, "epoch": 439} {"train_loss": -35.30722427368164, "global_step": 53224, "epoch": 439} {"train_loss": -35.47577667236328, "global_step": 53225, "epoch": 439} {"train_loss": -35.16632080078125, "global_step": 53226, "epoch": 439} {"train_loss": -35.3939208984375, "global_step": 53227, "epoch": 439} {"train_loss": -34.53947830200195, "global_step": 53228, "epoch": 439} {"train_loss": -35.34684371948242, "global_step": 53229, "epoch": 439} {"train_loss": -35.4384880065918, "global_step": 53230, "epoch": 439} {"train_loss": -34.84819412231445, "global_step": 53231, "epoch": 439} {"train_loss": -34.83112716674805, "global_step": 53232, "epoch": 439} {"train_loss": -35.447669982910156, "global_step": 53233, "epoch": 439} {"train_loss": -35.4986686706543, "global_step": 53234, "epoch": 439} {"train_loss": -35.80842208862305, "global_step": 53235, "epoch": 439} {"train_loss": -34.48023223876953, "global_step": 53236, "epoch": 439} {"train_loss": -34.77534866333008, "global_step": 53237, "epoch": 439} {"train_loss": -35.469146728515625, "global_step": 53238, "epoch": 439} {"train_loss": -34.39287993533552, "global_step": 53239, "epoch": 439, "val_loss": 2567064.75} {"train_loss": -34.66333770751953, "global_step": 53240, "epoch": 440} {"train_loss": -34.941749572753906, "global_step": 53241, "epoch": 440} {"train_loss": -35.32265853881836, "global_step": 53242, "epoch": 440} {"train_loss": -28.8586483001709, "global_step": 53243, "epoch": 440} {"train_loss": -35.035858154296875, "global_step": 53244, "epoch": 440} {"train_loss": -35.08967590332031, "global_step": 53245, "epoch": 440} {"train_loss": -34.56676483154297, "global_step": 53246, "epoch": 440} {"train_loss": -33.90098190307617, "global_step": 53247, "epoch": 440} {"train_loss": -34.54134750366211, "global_step": 53248, "epoch": 440} {"train_loss": -34.799163818359375, "global_step": 53249, "epoch": 440} {"train_loss": -34.1148567199707, "global_step": 53250, "epoch": 440} {"train_loss": -35.495574951171875, "global_step": 53251, "epoch": 440} {"train_loss": -34.36672592163086, "global_step": 53252, "epoch": 440} {"train_loss": -35.5091438293457, "global_step": 53253, "epoch": 440} {"train_loss": -33.50172424316406, "global_step": 53254, "epoch": 440} {"train_loss": -34.74999237060547, "global_step": 53255, "epoch": 440} {"train_loss": -35.159297943115234, "global_step": 53256, "epoch": 440} {"train_loss": -34.77595138549805, "global_step": 53257, "epoch": 440} {"train_loss": -34.55595016479492, "global_step": 53258, "epoch": 440} {"train_loss": -34.88376998901367, "global_step": 53259, "epoch": 440} {"train_loss": -35.43172073364258, "global_step": 53260, "epoch": 440} {"train_loss": -35.48930740356445, "global_step": 53261, "epoch": 440} {"train_loss": -34.72657012939453, "global_step": 53262, "epoch": 440} {"train_loss": -33.97444534301758, "global_step": 53263, "epoch": 440} {"train_loss": -34.12544631958008, "global_step": 53264, "epoch": 440} {"train_loss": -35.17255401611328, "global_step": 53265, "epoch": 440} {"train_loss": -34.973907470703125, "global_step": 53266, "epoch": 440} {"train_loss": -34.976478576660156, "global_step": 53267, "epoch": 440} {"train_loss": -35.16191482543945, "global_step": 53268, "epoch": 440} {"train_loss": -35.151798248291016, "global_step": 53269, "epoch": 440} {"train_loss": -35.400062561035156, "global_step": 53270, "epoch": 440} {"train_loss": -34.86503982543945, "global_step": 53271, "epoch": 440} {"train_loss": -35.2667350769043, "global_step": 53272, "epoch": 440} {"train_loss": -33.598873138427734, "global_step": 53273, "epoch": 440} {"train_loss": -34.98249053955078, "global_step": 53274, "epoch": 440} {"train_loss": -34.34486770629883, "global_step": 53275, "epoch": 440} {"train_loss": -35.2100715637207, "global_step": 53276, "epoch": 440} {"train_loss": -34.7220573425293, "global_step": 53277, "epoch": 440} {"train_loss": -35.127742767333984, "global_step": 53278, "epoch": 440} {"train_loss": -34.77132034301758, "global_step": 53279, "epoch": 440} {"train_loss": -34.97109603881836, "global_step": 53280, "epoch": 440} {"train_loss": -35.42557907104492, "global_step": 53281, "epoch": 440} {"train_loss": -35.05582046508789, "global_step": 53282, "epoch": 440} {"train_loss": -35.3370475769043, "global_step": 53283, "epoch": 440} {"train_loss": -34.65011215209961, "global_step": 53284, "epoch": 440} {"train_loss": -35.245941162109375, "global_step": 53285, "epoch": 440} {"train_loss": -34.63311004638672, "global_step": 53286, "epoch": 440} {"train_loss": -34.15309524536133, "global_step": 53287, "epoch": 440} {"train_loss": -34.96619415283203, "global_step": 53288, "epoch": 440} {"train_loss": -35.26682662963867, "global_step": 53289, "epoch": 440} {"train_loss": -34.61002731323242, "global_step": 53290, "epoch": 440} {"train_loss": -34.327754974365234, "global_step": 53291, "epoch": 440} {"train_loss": -34.31294631958008, "global_step": 53292, "epoch": 440} {"train_loss": -34.62702178955078, "global_step": 53293, "epoch": 440} {"train_loss": -33.96718215942383, "global_step": 53294, "epoch": 440} {"train_loss": -33.52845001220703, "global_step": 53295, "epoch": 440} {"train_loss": -35.39583969116211, "global_step": 53296, "epoch": 440} {"train_loss": -33.29478073120117, "global_step": 53297, "epoch": 440} {"train_loss": -33.299598693847656, "global_step": 53298, "epoch": 440} {"train_loss": -34.62493896484375, "global_step": 53299, "epoch": 440} {"train_loss": -33.24204635620117, "global_step": 53300, "epoch": 440} {"train_loss": -33.99664306640625, "global_step": 53301, "epoch": 440} {"train_loss": -31.5862979888916, "global_step": 53302, "epoch": 440} {"train_loss": -28.013452529907227, "global_step": 53303, "epoch": 440} {"train_loss": -33.505062103271484, "global_step": 53304, "epoch": 440} {"train_loss": -32.56926345825195, "global_step": 53305, "epoch": 440} {"train_loss": -31.708913803100586, "global_step": 53306, "epoch": 440} {"train_loss": -33.42336654663086, "global_step": 53307, "epoch": 440} {"train_loss": -34.24369812011719, "global_step": 53308, "epoch": 440} {"train_loss": -29.728910446166992, "global_step": 53309, "epoch": 440} {"train_loss": -33.6076774597168, "global_step": 53310, "epoch": 440} {"train_loss": -33.19809341430664, "global_step": 53311, "epoch": 440} {"train_loss": -31.49006462097168, "global_step": 53312, "epoch": 440} {"train_loss": -34.246917724609375, "global_step": 53313, "epoch": 440} {"train_loss": -32.361324310302734, "global_step": 53314, "epoch": 440} {"train_loss": -33.190956115722656, "global_step": 53315, "epoch": 440} {"train_loss": -34.238861083984375, "global_step": 53316, "epoch": 440} {"train_loss": -32.28129196166992, "global_step": 53317, "epoch": 440} {"train_loss": -33.6646614074707, "global_step": 53318, "epoch": 440} {"train_loss": -34.61772537231445, "global_step": 53319, "epoch": 440} {"train_loss": -32.686058044433594, "global_step": 53320, "epoch": 440} {"train_loss": -33.9549560546875, "global_step": 53321, "epoch": 440} {"train_loss": -30.228036880493164, "global_step": 53322, "epoch": 440} {"train_loss": -33.12469482421875, "global_step": 53323, "epoch": 440} {"train_loss": -29.269916534423828, "global_step": 53324, "epoch": 440} {"train_loss": -19.33377456665039, "global_step": 53325, "epoch": 440} {"train_loss": -31.830005645751953, "global_step": 53326, "epoch": 440} {"train_loss": -26.561120986938477, "global_step": 53327, "epoch": 440} {"train_loss": -12.417671203613281, "global_step": 53328, "epoch": 440} {"train_loss": -28.731433868408203, "global_step": 53329, "epoch": 440} {"train_loss": -27.520612716674805, "global_step": 53330, "epoch": 440} {"train_loss": -26.339139938354492, "global_step": 53331, "epoch": 440} {"train_loss": -24.108741760253906, "global_step": 53332, "epoch": 440} {"train_loss": -27.01594352722168, "global_step": 53333, "epoch": 440} {"train_loss": -28.523757934570312, "global_step": 53334, "epoch": 440} {"train_loss": -27.194440841674805, "global_step": 53335, "epoch": 440} {"train_loss": -26.373645782470703, "global_step": 53336, "epoch": 440} {"train_loss": -28.62476921081543, "global_step": 53337, "epoch": 440} {"train_loss": -27.7163143157959, "global_step": 53338, "epoch": 440} {"train_loss": -28.82843589782715, "global_step": 53339, "epoch": 440} {"train_loss": -30.35711097717285, "global_step": 53340, "epoch": 440} {"train_loss": -29.670194625854492, "global_step": 53341, "epoch": 440} {"train_loss": -30.440656661987305, "global_step": 53342, "epoch": 440} {"train_loss": -28.620563507080078, "global_step": 53343, "epoch": 440} {"train_loss": -29.41083335876465, "global_step": 53344, "epoch": 440} {"train_loss": -29.388647079467773, "global_step": 53345, "epoch": 440} {"train_loss": -28.654504776000977, "global_step": 53346, "epoch": 440} {"train_loss": -30.08941650390625, "global_step": 53347, "epoch": 440} {"train_loss": -30.328535079956055, "global_step": 53348, "epoch": 440} {"train_loss": -30.440597534179688, "global_step": 53349, "epoch": 440} {"train_loss": -30.22942543029785, "global_step": 53350, "epoch": 440} {"train_loss": -29.860830307006836, "global_step": 53351, "epoch": 440} {"train_loss": -30.411230087280273, "global_step": 53352, "epoch": 440} {"train_loss": -30.961139678955078, "global_step": 53353, "epoch": 440} {"train_loss": -30.728591918945312, "global_step": 53354, "epoch": 440} {"train_loss": -31.138381958007812, "global_step": 53355, "epoch": 440} {"train_loss": -30.778409957885742, "global_step": 53356, "epoch": 440} {"train_loss": -31.118213653564453, "global_step": 53357, "epoch": 440} {"train_loss": -31.25955581665039, "global_step": 53358, "epoch": 440} {"train_loss": -30.952957153320312, "global_step": 53359, "epoch": 440} {"train_loss": -32.393292419181385, "global_step": 53360, "epoch": 440, "val_loss": 2553994.5} {"train_loss": -31.218149185180664, "global_step": 53361, "epoch": 441} {"train_loss": -30.50962257385254, "global_step": 53362, "epoch": 441} {"train_loss": -31.59462547302246, "global_step": 53363, "epoch": 441} {"train_loss": -31.832868576049805, "global_step": 53364, "epoch": 441} {"train_loss": -31.921979904174805, "global_step": 53365, "epoch": 441} {"train_loss": -31.747364044189453, "global_step": 53366, "epoch": 441} {"train_loss": -31.832141876220703, "global_step": 53367, "epoch": 441} {"train_loss": -32.020843505859375, "global_step": 53368, "epoch": 441} {"train_loss": -32.04185104370117, "global_step": 53369, "epoch": 441} {"train_loss": -31.834869384765625, "global_step": 53370, "epoch": 441} {"train_loss": -32.65788269042969, "global_step": 53371, "epoch": 441} {"train_loss": -32.00564956665039, "global_step": 53372, "epoch": 441} {"train_loss": -32.515647888183594, "global_step": 53373, "epoch": 441} {"train_loss": -32.12771987915039, "global_step": 53374, "epoch": 441} {"train_loss": -32.0453987121582, "global_step": 53375, "epoch": 441} {"train_loss": -32.52456283569336, "global_step": 53376, "epoch": 441} {"train_loss": -32.69411087036133, "global_step": 53377, "epoch": 441} {"train_loss": -32.861854553222656, "global_step": 53378, "epoch": 441} {"train_loss": -33.18267822265625, "global_step": 53379, "epoch": 441} {"train_loss": -32.642486572265625, "global_step": 53380, "epoch": 441} {"train_loss": -32.67447280883789, "global_step": 53381, "epoch": 441} {"train_loss": -32.83637619018555, "global_step": 53382, "epoch": 441} {"train_loss": -32.69960403442383, "global_step": 53383, "epoch": 441} {"train_loss": -33.11758804321289, "global_step": 53384, "epoch": 441} {"train_loss": -32.869930267333984, "global_step": 53385, "epoch": 441} {"train_loss": -33.107818603515625, "global_step": 53386, "epoch": 441} {"train_loss": -32.672847747802734, "global_step": 53387, "epoch": 441} {"train_loss": -33.67499542236328, "global_step": 53388, "epoch": 441} {"train_loss": -33.34090805053711, "global_step": 53389, "epoch": 441} {"train_loss": -32.676605224609375, "global_step": 53390, "epoch": 441} {"train_loss": -33.0596923828125, "global_step": 53391, "epoch": 441} {"train_loss": -33.1090087890625, "global_step": 53392, "epoch": 441} {"train_loss": -33.29939651489258, "global_step": 53393, "epoch": 441} {"train_loss": -33.8783073425293, "global_step": 53394, "epoch": 441} {"train_loss": -33.62165832519531, "global_step": 53395, "epoch": 441} {"train_loss": -33.375877380371094, "global_step": 53396, "epoch": 441} {"train_loss": -33.13712692260742, "global_step": 53397, "epoch": 441} {"train_loss": -33.61359786987305, "global_step": 53398, "epoch": 441} {"train_loss": -33.234031677246094, "global_step": 53399, "epoch": 441} {"train_loss": -33.37271499633789, "global_step": 53400, "epoch": 441} {"train_loss": -33.5632438659668, "global_step": 53401, "epoch": 441} {"train_loss": -34.31692123413086, "global_step": 53402, "epoch": 441} {"train_loss": -33.85053253173828, "global_step": 53403, "epoch": 441} {"train_loss": -33.852718353271484, "global_step": 53404, "epoch": 441} {"train_loss": -33.743995666503906, "global_step": 53405, "epoch": 441} {"train_loss": -33.45326614379883, "global_step": 53406, "epoch": 441} {"train_loss": -34.0771598815918, "global_step": 53407, "epoch": 441} {"train_loss": -34.027557373046875, "global_step": 53408, "epoch": 441} {"train_loss": -34.484169006347656, "global_step": 53409, "epoch": 441} {"train_loss": -34.216609954833984, "global_step": 53410, "epoch": 441} {"train_loss": -34.387046813964844, "global_step": 53411, "epoch": 441} {"train_loss": -33.067562103271484, "global_step": 53412, "epoch": 441} {"train_loss": -34.062381744384766, "global_step": 53413, "epoch": 441} {"train_loss": -34.379920959472656, "global_step": 53414, "epoch": 441} {"train_loss": -34.08867263793945, "global_step": 53415, "epoch": 441} {"train_loss": -34.80318069458008, "global_step": 53416, "epoch": 441} {"train_loss": -34.72011947631836, "global_step": 53417, "epoch": 441} {"train_loss": -34.52827835083008, "global_step": 53418, "epoch": 441} {"train_loss": -34.75878143310547, "global_step": 53419, "epoch": 441} {"train_loss": -34.35837936401367, "global_step": 53420, "epoch": 441} {"train_loss": -34.923316955566406, "global_step": 53421, "epoch": 441} {"train_loss": -34.92474365234375, "global_step": 53422, "epoch": 441} {"train_loss": -34.87602233886719, "global_step": 53423, "epoch": 441} {"train_loss": -34.800777435302734, "global_step": 53424, "epoch": 441} {"train_loss": -34.62294006347656, "global_step": 53425, "epoch": 441} {"train_loss": -34.87896728515625, "global_step": 53426, "epoch": 441} {"train_loss": -34.639007568359375, "global_step": 53427, "epoch": 441} {"train_loss": -35.20492935180664, "global_step": 53428, "epoch": 441} {"train_loss": -34.66336441040039, "global_step": 53429, "epoch": 441} {"train_loss": -35.412269592285156, "global_step": 53430, "epoch": 441} {"train_loss": -35.05794143676758, "global_step": 53431, "epoch": 441} {"train_loss": -35.25520706176758, "global_step": 53432, "epoch": 441} {"train_loss": -35.050140380859375, "global_step": 53433, "epoch": 441} {"train_loss": -35.1779670715332, "global_step": 53434, "epoch": 441} {"train_loss": -35.0634880065918, "global_step": 53435, "epoch": 441} {"train_loss": -35.162105560302734, "global_step": 53436, "epoch": 441} {"train_loss": -35.453975677490234, "global_step": 53437, "epoch": 441} {"train_loss": -34.97364807128906, "global_step": 53438, "epoch": 441} {"train_loss": -34.821510314941406, "global_step": 53439, "epoch": 441} {"train_loss": -35.27206039428711, "global_step": 53440, "epoch": 441} {"train_loss": -35.68283462524414, "global_step": 53441, "epoch": 441} {"train_loss": -35.403934478759766, "global_step": 53442, "epoch": 441} {"train_loss": -34.79802322387695, "global_step": 53443, "epoch": 441} {"train_loss": -34.5584716796875, "global_step": 53444, "epoch": 441} {"train_loss": -34.617977142333984, "global_step": 53445, "epoch": 441} {"train_loss": -35.707393646240234, "global_step": 53446, "epoch": 441} {"train_loss": -35.53420639038086, "global_step": 53447, "epoch": 441} {"train_loss": -35.452266693115234, "global_step": 53448, "epoch": 441} {"train_loss": -35.56343460083008, "global_step": 53449, "epoch": 441} {"train_loss": -35.50936508178711, "global_step": 53450, "epoch": 441} {"train_loss": -35.66072463989258, "global_step": 53451, "epoch": 441} {"train_loss": -35.21371841430664, "global_step": 53452, "epoch": 441} {"train_loss": -35.29075241088867, "global_step": 53453, "epoch": 441} {"train_loss": -35.572669982910156, "global_step": 53454, "epoch": 441} {"train_loss": -35.28281021118164, "global_step": 53455, "epoch": 441} {"train_loss": -35.454750061035156, "global_step": 53456, "epoch": 441} {"train_loss": -34.520668029785156, "global_step": 53457, "epoch": 441} {"train_loss": -33.571956634521484, "global_step": 53458, "epoch": 441} {"train_loss": -34.655555725097656, "global_step": 53459, "epoch": 441} {"train_loss": -33.7677116394043, "global_step": 53460, "epoch": 441} {"train_loss": -32.93618392944336, "global_step": 53461, "epoch": 441} {"train_loss": -33.47392654418945, "global_step": 53462, "epoch": 441} {"train_loss": -28.569860458374023, "global_step": 53463, "epoch": 441} {"train_loss": -22.929630279541016, "global_step": 53464, "epoch": 441} {"train_loss": -21.89626121520996, "global_step": 53465, "epoch": 441} {"train_loss": -25.393884658813477, "global_step": 53466, "epoch": 441} {"train_loss": -23.98146629333496, "global_step": 53467, "epoch": 441} {"train_loss": -25.50508689880371, "global_step": 53468, "epoch": 441} {"train_loss": -30.22420310974121, "global_step": 53469, "epoch": 441} {"train_loss": -25.551559448242188, "global_step": 53470, "epoch": 441} {"train_loss": -31.3712215423584, "global_step": 53471, "epoch": 441} {"train_loss": -27.76226806640625, "global_step": 53472, "epoch": 441} {"train_loss": -31.238815307617188, "global_step": 53473, "epoch": 441} {"train_loss": -29.847671508789062, "global_step": 53474, "epoch": 441} {"train_loss": -31.809350967407227, "global_step": 53475, "epoch": 441} {"train_loss": -32.14875030517578, "global_step": 53476, "epoch": 441} {"train_loss": -32.686309814453125, "global_step": 53477, "epoch": 441} {"train_loss": -32.22450637817383, "global_step": 53478, "epoch": 441} {"train_loss": -34.33051300048828, "global_step": 53479, "epoch": 441} {"train_loss": -31.12123680114746, "global_step": 53480, "epoch": 441} {"train_loss": -33.127871584301154, "global_step": 53481, "epoch": 441, "val_loss": 2570878.25} {"train_loss": -32.6030158996582, "global_step": 53482, "epoch": 442} {"train_loss": -33.339759826660156, "global_step": 53483, "epoch": 442} {"train_loss": -33.80262756347656, "global_step": 53484, "epoch": 442} {"train_loss": -33.19347381591797, "global_step": 53485, "epoch": 442} {"train_loss": -33.506996154785156, "global_step": 53486, "epoch": 442} {"train_loss": -33.66180419921875, "global_step": 53487, "epoch": 442} {"train_loss": -33.3436393737793, "global_step": 53488, "epoch": 442} {"train_loss": -34.267555236816406, "global_step": 53489, "epoch": 442} {"train_loss": -34.255611419677734, "global_step": 53490, "epoch": 442} {"train_loss": -33.85171890258789, "global_step": 53491, "epoch": 442} {"train_loss": -34.37677764892578, "global_step": 53492, "epoch": 442} {"train_loss": -34.152713775634766, "global_step": 53493, "epoch": 442} {"train_loss": -34.51493453979492, "global_step": 53494, "epoch": 442} {"train_loss": -34.62263107299805, "global_step": 53495, "epoch": 442} {"train_loss": -33.959102630615234, "global_step": 53496, "epoch": 442} {"train_loss": -34.489288330078125, "global_step": 53497, "epoch": 442} {"train_loss": -34.81324768066406, "global_step": 53498, "epoch": 442} {"train_loss": -34.73263168334961, "global_step": 53499, "epoch": 442} {"train_loss": -34.731475830078125, "global_step": 53500, "epoch": 442} {"train_loss": -34.712158203125, "global_step": 53501, "epoch": 442} {"train_loss": -35.021385192871094, "global_step": 53502, "epoch": 442} {"train_loss": -35.32865524291992, "global_step": 53503, "epoch": 442} {"train_loss": -35.23603820800781, "global_step": 53504, "epoch": 442} {"train_loss": -35.12017822265625, "global_step": 53505, "epoch": 442} {"train_loss": -35.158905029296875, "global_step": 53506, "epoch": 442} {"train_loss": -35.371742248535156, "global_step": 53507, "epoch": 442} {"train_loss": -35.32841110229492, "global_step": 53508, "epoch": 442} {"train_loss": -35.16395950317383, "global_step": 53509, "epoch": 442} {"train_loss": -34.93729782104492, "global_step": 53510, "epoch": 442} {"train_loss": -35.15871810913086, "global_step": 53511, "epoch": 442} {"train_loss": -35.766563415527344, "global_step": 53512, "epoch": 442} {"train_loss": -35.528236389160156, "global_step": 53513, "epoch": 442} {"train_loss": -35.25783157348633, "global_step": 53514, "epoch": 442} {"train_loss": -35.64144515991211, "global_step": 53515, "epoch": 442} {"train_loss": -35.824039459228516, "global_step": 53516, "epoch": 442} {"train_loss": -35.714134216308594, "global_step": 53517, "epoch": 442} {"train_loss": -35.82556915283203, "global_step": 53518, "epoch": 442} {"train_loss": -36.1337890625, "global_step": 53519, "epoch": 442} {"train_loss": -35.50620651245117, "global_step": 53520, "epoch": 442} {"train_loss": -35.416053771972656, "global_step": 53521, "epoch": 442} {"train_loss": -35.85358810424805, "global_step": 53522, "epoch": 442} {"train_loss": -35.81963348388672, "global_step": 53523, "epoch": 442} {"train_loss": -35.946937561035156, "global_step": 53524, "epoch": 442} {"train_loss": -35.443904876708984, "global_step": 53525, "epoch": 442} {"train_loss": -35.77024459838867, "global_step": 53526, "epoch": 442} {"train_loss": -35.6317253112793, "global_step": 53527, "epoch": 442} {"train_loss": -35.84877395629883, "global_step": 53528, "epoch": 442} {"train_loss": -35.56905746459961, "global_step": 53529, "epoch": 442} {"train_loss": -35.20882797241211, "global_step": 53530, "epoch": 442} {"train_loss": -33.59133529663086, "global_step": 53531, "epoch": 442} {"train_loss": -33.17070388793945, "global_step": 53532, "epoch": 442} {"train_loss": -35.012176513671875, "global_step": 53533, "epoch": 442} {"train_loss": -35.88880920410156, "global_step": 53534, "epoch": 442} {"train_loss": -35.103675842285156, "global_step": 53535, "epoch": 442} {"train_loss": -34.093231201171875, "global_step": 53536, "epoch": 442} {"train_loss": -35.146976470947266, "global_step": 53537, "epoch": 442} {"train_loss": -35.88387680053711, "global_step": 53538, "epoch": 442} {"train_loss": -35.2392692565918, "global_step": 53539, "epoch": 442} {"train_loss": -34.948089599609375, "global_step": 53540, "epoch": 442} {"train_loss": -34.754310607910156, "global_step": 53541, "epoch": 442} {"train_loss": -34.51925277709961, "global_step": 53542, "epoch": 442} {"train_loss": -34.67280197143555, "global_step": 53543, "epoch": 442} {"train_loss": -31.749561309814453, "global_step": 53544, "epoch": 442} {"train_loss": -31.48126792907715, "global_step": 53545, "epoch": 442} {"train_loss": -31.82606315612793, "global_step": 53546, "epoch": 442} {"train_loss": -32.51850128173828, "global_step": 53547, "epoch": 442} {"train_loss": -33.59343719482422, "global_step": 53548, "epoch": 442} {"train_loss": -35.34518051147461, "global_step": 53549, "epoch": 442} {"train_loss": -35.498111724853516, "global_step": 53550, "epoch": 442} {"train_loss": -32.90536880493164, "global_step": 53551, "epoch": 442} {"train_loss": -34.07644271850586, "global_step": 53552, "epoch": 442} {"train_loss": -35.42757034301758, "global_step": 53553, "epoch": 442} {"train_loss": -34.5374870300293, "global_step": 53554, "epoch": 442} {"train_loss": -34.5528678894043, "global_step": 53555, "epoch": 442} {"train_loss": -35.1410026550293, "global_step": 53556, "epoch": 442} {"train_loss": -33.32063674926758, "global_step": 53557, "epoch": 442} {"train_loss": -35.390159606933594, "global_step": 53558, "epoch": 442} {"train_loss": -33.5271110534668, "global_step": 53559, "epoch": 442} {"train_loss": -34.956478118896484, "global_step": 53560, "epoch": 442} {"train_loss": -33.68685531616211, "global_step": 53561, "epoch": 442} {"train_loss": -34.779781341552734, "global_step": 53562, "epoch": 442} {"train_loss": -34.79680252075195, "global_step": 53563, "epoch": 442} {"train_loss": -34.463134765625, "global_step": 53564, "epoch": 442} {"train_loss": -34.9895133972168, "global_step": 53565, "epoch": 442} {"train_loss": -34.65397262573242, "global_step": 53566, "epoch": 442} {"train_loss": -34.901397705078125, "global_step": 53567, "epoch": 442} {"train_loss": -35.377254486083984, "global_step": 53568, "epoch": 442} {"train_loss": -34.763607025146484, "global_step": 53569, "epoch": 442} {"train_loss": -34.6135139465332, "global_step": 53570, "epoch": 442} {"train_loss": -35.27145004272461, "global_step": 53571, "epoch": 442} {"train_loss": -34.67571258544922, "global_step": 53572, "epoch": 442} {"train_loss": -35.08655548095703, "global_step": 53573, "epoch": 442} {"train_loss": -35.23795700073242, "global_step": 53574, "epoch": 442} {"train_loss": -34.7654914855957, "global_step": 53575, "epoch": 442} {"train_loss": -35.513763427734375, "global_step": 53576, "epoch": 442} {"train_loss": -34.82020568847656, "global_step": 53577, "epoch": 442} {"train_loss": -35.611915588378906, "global_step": 53578, "epoch": 442} {"train_loss": -35.184749603271484, "global_step": 53579, "epoch": 442} {"train_loss": -35.967891693115234, "global_step": 53580, "epoch": 442} {"train_loss": -35.432952880859375, "global_step": 53581, "epoch": 442} {"train_loss": -35.27054977416992, "global_step": 53582, "epoch": 442} {"train_loss": -35.368621826171875, "global_step": 53583, "epoch": 442} {"train_loss": -34.620967864990234, "global_step": 53584, "epoch": 442} {"train_loss": -34.9425048828125, "global_step": 53585, "epoch": 442} {"train_loss": -35.587894439697266, "global_step": 53586, "epoch": 442} {"train_loss": -35.737117767333984, "global_step": 53587, "epoch": 442} {"train_loss": -35.01371383666992, "global_step": 53588, "epoch": 442} {"train_loss": -35.30949020385742, "global_step": 53589, "epoch": 442} {"train_loss": -35.52539825439453, "global_step": 53590, "epoch": 442} {"train_loss": -35.113616943359375, "global_step": 53591, "epoch": 442} {"train_loss": -35.48701858520508, "global_step": 53592, "epoch": 442} {"train_loss": -35.58726119995117, "global_step": 53593, "epoch": 442} {"train_loss": -35.84292221069336, "global_step": 53594, "epoch": 442} {"train_loss": -35.89408493041992, "global_step": 53595, "epoch": 442} {"train_loss": -35.66750717163086, "global_step": 53596, "epoch": 442} {"train_loss": -35.77424240112305, "global_step": 53597, "epoch": 442} {"train_loss": -35.7837028503418, "global_step": 53598, "epoch": 442} {"train_loss": -35.66256332397461, "global_step": 53599, "epoch": 442} {"train_loss": -35.7581787109375, "global_step": 53600, "epoch": 442} {"train_loss": -35.636817932128906, "global_step": 53601, "epoch": 442} {"train_loss": -34.86744683636122, "global_step": 53602, "epoch": 442, "val_loss": 2504805.75} {"train_loss": -35.28657150268555, "global_step": 53603, "epoch": 443} {"train_loss": -36.10679626464844, "global_step": 53604, "epoch": 443} {"train_loss": -36.45487594604492, "global_step": 53605, "epoch": 443} {"train_loss": -36.301918029785156, "global_step": 53606, "epoch": 443} {"train_loss": -36.050113677978516, "global_step": 53607, "epoch": 443} {"train_loss": -36.39435958862305, "global_step": 53608, "epoch": 443} {"train_loss": -36.03083801269531, "global_step": 53609, "epoch": 443} {"train_loss": -36.235748291015625, "global_step": 53610, "epoch": 443} {"train_loss": -36.485721588134766, "global_step": 53611, "epoch": 443} {"train_loss": -35.926666259765625, "global_step": 53612, "epoch": 443} {"train_loss": -36.31290817260742, "global_step": 53613, "epoch": 443} {"train_loss": -36.35517120361328, "global_step": 53614, "epoch": 443} {"train_loss": -36.4433479309082, "global_step": 53615, "epoch": 443} {"train_loss": -36.271095275878906, "global_step": 53616, "epoch": 443} {"train_loss": -36.52932357788086, "global_step": 53617, "epoch": 443} {"train_loss": -36.16495132446289, "global_step": 53618, "epoch": 443} {"train_loss": -36.33850860595703, "global_step": 53619, "epoch": 443} {"train_loss": -36.248836517333984, "global_step": 53620, "epoch": 443} {"train_loss": -36.72565841674805, "global_step": 53621, "epoch": 443} {"train_loss": -36.57569885253906, "global_step": 53622, "epoch": 443} {"train_loss": -37.069183349609375, "global_step": 53623, "epoch": 443} {"train_loss": -36.08552551269531, "global_step": 53624, "epoch": 443} {"train_loss": -36.696624755859375, "global_step": 53625, "epoch": 443} {"train_loss": -35.842159271240234, "global_step": 53626, "epoch": 443} {"train_loss": -35.556060791015625, "global_step": 53627, "epoch": 443} {"train_loss": -36.073482513427734, "global_step": 53628, "epoch": 443} {"train_loss": -36.18925476074219, "global_step": 53629, "epoch": 443} {"train_loss": -36.100738525390625, "global_step": 53630, "epoch": 443} {"train_loss": -35.2707633972168, "global_step": 53631, "epoch": 443} {"train_loss": -36.10380172729492, "global_step": 53632, "epoch": 443} {"train_loss": -36.1463623046875, "global_step": 53633, "epoch": 443} {"train_loss": -35.414878845214844, "global_step": 53634, "epoch": 443} {"train_loss": -35.28449630737305, "global_step": 53635, "epoch": 443} {"train_loss": -36.12900924682617, "global_step": 53636, "epoch": 443} {"train_loss": -35.206748962402344, "global_step": 53637, "epoch": 443} {"train_loss": -35.12635040283203, "global_step": 53638, "epoch": 443} {"train_loss": -34.81587600708008, "global_step": 53639, "epoch": 443} {"train_loss": -35.905975341796875, "global_step": 53640, "epoch": 443} {"train_loss": -35.01612854003906, "global_step": 53641, "epoch": 443} {"train_loss": -34.389530181884766, "global_step": 53642, "epoch": 443} {"train_loss": -35.57149887084961, "global_step": 53643, "epoch": 443} {"train_loss": -35.283203125, "global_step": 53644, "epoch": 443} {"train_loss": -35.566532135009766, "global_step": 53645, "epoch": 443} {"train_loss": -35.72907638549805, "global_step": 53646, "epoch": 443} {"train_loss": -33.37751388549805, "global_step": 53647, "epoch": 443} {"train_loss": -34.49265670776367, "global_step": 53648, "epoch": 443} {"train_loss": -33.27994918823242, "global_step": 53649, "epoch": 443} {"train_loss": -33.51398849487305, "global_step": 53650, "epoch": 443} {"train_loss": -30.275802612304688, "global_step": 53651, "epoch": 443} {"train_loss": -29.216571807861328, "global_step": 53652, "epoch": 443} {"train_loss": -30.017780303955078, "global_step": 53653, "epoch": 443} {"train_loss": -31.937707901000977, "global_step": 53654, "epoch": 443} {"train_loss": -34.760616302490234, "global_step": 53655, "epoch": 443} {"train_loss": -33.882118225097656, "global_step": 53656, "epoch": 443} {"train_loss": -34.0503044128418, "global_step": 53657, "epoch": 443} {"train_loss": -33.930233001708984, "global_step": 53658, "epoch": 443} {"train_loss": -34.76456832885742, "global_step": 53659, "epoch": 443} {"train_loss": -33.21449279785156, "global_step": 53660, "epoch": 443} {"train_loss": -34.741878509521484, "global_step": 53661, "epoch": 443} {"train_loss": -33.99653244018555, "global_step": 53662, "epoch": 443} {"train_loss": -35.54877471923828, "global_step": 53663, "epoch": 443} {"train_loss": -33.4072151184082, "global_step": 53664, "epoch": 443} {"train_loss": -35.23822784423828, "global_step": 53665, "epoch": 443} {"train_loss": -34.163917541503906, "global_step": 53666, "epoch": 443} {"train_loss": -35.261199951171875, "global_step": 53667, "epoch": 443} {"train_loss": -34.73530197143555, "global_step": 53668, "epoch": 443} {"train_loss": -35.43729782104492, "global_step": 53669, "epoch": 443} {"train_loss": -35.02606201171875, "global_step": 53670, "epoch": 443} {"train_loss": -34.79719161987305, "global_step": 53671, "epoch": 443} {"train_loss": -34.68091583251953, "global_step": 53672, "epoch": 443} {"train_loss": -34.02669906616211, "global_step": 53673, "epoch": 443} {"train_loss": -35.58631134033203, "global_step": 53674, "epoch": 443} {"train_loss": -34.311012268066406, "global_step": 53675, "epoch": 443} {"train_loss": -35.57147216796875, "global_step": 53676, "epoch": 443} {"train_loss": -34.286739349365234, "global_step": 53677, "epoch": 443} {"train_loss": -35.483802795410156, "global_step": 53678, "epoch": 443} {"train_loss": -35.6537971496582, "global_step": 53679, "epoch": 443} {"train_loss": -35.13162612915039, "global_step": 53680, "epoch": 443} {"train_loss": -35.88015365600586, "global_step": 53681, "epoch": 443} {"train_loss": -35.001075744628906, "global_step": 53682, "epoch": 443} {"train_loss": -35.82284164428711, "global_step": 53683, "epoch": 443} {"train_loss": -35.41203689575195, "global_step": 53684, "epoch": 443} {"train_loss": -36.011146545410156, "global_step": 53685, "epoch": 443} {"train_loss": -33.70237350463867, "global_step": 53686, "epoch": 443} {"train_loss": -35.00580596923828, "global_step": 53687, "epoch": 443} {"train_loss": -35.33018112182617, "global_step": 53688, "epoch": 443} {"train_loss": -35.722259521484375, "global_step": 53689, "epoch": 443} {"train_loss": -36.213871002197266, "global_step": 53690, "epoch": 443} {"train_loss": -34.98495101928711, "global_step": 53691, "epoch": 443} {"train_loss": -35.24677658081055, "global_step": 53692, "epoch": 443} {"train_loss": -35.75938034057617, "global_step": 53693, "epoch": 443} {"train_loss": -35.64551544189453, "global_step": 53694, "epoch": 443} {"train_loss": -35.88662338256836, "global_step": 53695, "epoch": 443} {"train_loss": -35.9974479675293, "global_step": 53696, "epoch": 443} {"train_loss": -35.7536735534668, "global_step": 53697, "epoch": 443} {"train_loss": -36.15007400512695, "global_step": 53698, "epoch": 443} {"train_loss": -35.7464599609375, "global_step": 53699, "epoch": 443} {"train_loss": -35.426937103271484, "global_step": 53700, "epoch": 443} {"train_loss": -35.00611877441406, "global_step": 53701, "epoch": 443} {"train_loss": -36.29438018798828, "global_step": 53702, "epoch": 443} {"train_loss": -35.79585647583008, "global_step": 53703, "epoch": 443} {"train_loss": -35.15077590942383, "global_step": 53704, "epoch": 443} {"train_loss": -35.402034759521484, "global_step": 53705, "epoch": 443} {"train_loss": -35.56450653076172, "global_step": 53706, "epoch": 443} {"train_loss": -35.27549362182617, "global_step": 53707, "epoch": 443} {"train_loss": -36.45710372924805, "global_step": 53708, "epoch": 443} {"train_loss": -36.18534469604492, "global_step": 53709, "epoch": 443} {"train_loss": -36.024898529052734, "global_step": 53710, "epoch": 443} {"train_loss": -35.8162956237793, "global_step": 53711, "epoch": 443} {"train_loss": -35.8132438659668, "global_step": 53712, "epoch": 443} {"train_loss": -36.00783920288086, "global_step": 53713, "epoch": 443} {"train_loss": -35.77336502075195, "global_step": 53714, "epoch": 443} {"train_loss": -35.49483871459961, "global_step": 53715, "epoch": 443} {"train_loss": -35.00969696044922, "global_step": 53716, "epoch": 443} {"train_loss": -28.880407333374023, "global_step": 53717, "epoch": 443} {"train_loss": -12.817410469055176, "global_step": 53718, "epoch": 443} {"train_loss": 4.159684658050537, "global_step": 53719, "epoch": 443} {"train_loss": -19.906965255737305, "global_step": 53720, "epoch": 443} {"train_loss": -33.158939361572266, "global_step": 53721, "epoch": 443} {"train_loss": -25.9742431640625, "global_step": 53722, "epoch": 443} {"train_loss": -34.47043254552794, "global_step": 53723, "epoch": 443, "val_loss": 2609967.25} {"train_loss": -29.442325592041016, "global_step": 53724, "epoch": 444} {"train_loss": -33.263790130615234, "global_step": 53725, "epoch": 444} {"train_loss": -34.773067474365234, "global_step": 53726, "epoch": 444} {"train_loss": -32.066558837890625, "global_step": 53727, "epoch": 444} {"train_loss": -35.49421310424805, "global_step": 53728, "epoch": 444} {"train_loss": -34.53510284423828, "global_step": 53729, "epoch": 444} {"train_loss": -33.70402145385742, "global_step": 53730, "epoch": 444} {"train_loss": -34.84308624267578, "global_step": 53731, "epoch": 444} {"train_loss": -34.95388412475586, "global_step": 53732, "epoch": 444} {"train_loss": -34.69464111328125, "global_step": 53733, "epoch": 444} {"train_loss": -34.4493293762207, "global_step": 53734, "epoch": 444} {"train_loss": -35.310096740722656, "global_step": 53735, "epoch": 444} {"train_loss": -35.32293701171875, "global_step": 53736, "epoch": 444} {"train_loss": -35.18404769897461, "global_step": 53737, "epoch": 444} {"train_loss": -35.002723693847656, "global_step": 53738, "epoch": 444} {"train_loss": -35.24013137817383, "global_step": 53739, "epoch": 444} {"train_loss": -35.40449142456055, "global_step": 53740, "epoch": 444} {"train_loss": -35.29945373535156, "global_step": 53741, "epoch": 444} {"train_loss": -35.3901481628418, "global_step": 53742, "epoch": 444} {"train_loss": -35.44292068481445, "global_step": 53743, "epoch": 444} {"train_loss": -35.00129318237305, "global_step": 53744, "epoch": 444} {"train_loss": -35.591861724853516, "global_step": 53745, "epoch": 444} {"train_loss": -35.36138916015625, "global_step": 53746, "epoch": 444} {"train_loss": -35.70912551879883, "global_step": 53747, "epoch": 444} {"train_loss": -35.2204475402832, "global_step": 53748, "epoch": 444} {"train_loss": -35.540340423583984, "global_step": 53749, "epoch": 444} {"train_loss": -35.75008773803711, "global_step": 53750, "epoch": 444} {"train_loss": -35.70637893676758, "global_step": 53751, "epoch": 444} {"train_loss": -36.35427474975586, "global_step": 53752, "epoch": 444} {"train_loss": -36.12915802001953, "global_step": 53753, "epoch": 444} {"train_loss": -35.863399505615234, "global_step": 53754, "epoch": 444} {"train_loss": -35.99315643310547, "global_step": 53755, "epoch": 444} {"train_loss": -35.76758575439453, "global_step": 53756, "epoch": 444} {"train_loss": -36.25849914550781, "global_step": 53757, "epoch": 444} {"train_loss": -36.173519134521484, "global_step": 53758, "epoch": 444} {"train_loss": -36.154109954833984, "global_step": 53759, "epoch": 444} {"train_loss": -36.03616714477539, "global_step": 53760, "epoch": 444} {"train_loss": -36.14838790893555, "global_step": 53761, "epoch": 444} {"train_loss": -36.12040328979492, "global_step": 53762, "epoch": 444} {"train_loss": -35.95433044433594, "global_step": 53763, "epoch": 444} {"train_loss": -36.21503448486328, "global_step": 53764, "epoch": 444} {"train_loss": -34.35115051269531, "global_step": 53765, "epoch": 444} {"train_loss": -35.597049713134766, "global_step": 53766, "epoch": 444} {"train_loss": -35.462066650390625, "global_step": 53767, "epoch": 444} {"train_loss": -36.06679916381836, "global_step": 53768, "epoch": 444} {"train_loss": -36.1620979309082, "global_step": 53769, "epoch": 444} {"train_loss": -35.6004524230957, "global_step": 53770, "epoch": 444} {"train_loss": -35.9207649230957, "global_step": 53771, "epoch": 444} {"train_loss": -35.915550231933594, "global_step": 53772, "epoch": 444} {"train_loss": -35.641937255859375, "global_step": 53773, "epoch": 444} {"train_loss": -36.46153259277344, "global_step": 53774, "epoch": 444} {"train_loss": -36.33127975463867, "global_step": 53775, "epoch": 444} {"train_loss": -35.09305953979492, "global_step": 53776, "epoch": 444} {"train_loss": -34.5788459777832, "global_step": 53777, "epoch": 444} {"train_loss": -35.75756072998047, "global_step": 53778, "epoch": 444} {"train_loss": -34.8556022644043, "global_step": 53779, "epoch": 444} {"train_loss": -34.258541107177734, "global_step": 53780, "epoch": 444} {"train_loss": -34.30572509765625, "global_step": 53781, "epoch": 444} {"train_loss": -33.38711166381836, "global_step": 53782, "epoch": 444} {"train_loss": -33.94520950317383, "global_step": 53783, "epoch": 444} {"train_loss": -34.97676086425781, "global_step": 53784, "epoch": 444} {"train_loss": -34.298099517822266, "global_step": 53785, "epoch": 444} {"train_loss": -34.74656295776367, "global_step": 53786, "epoch": 444} {"train_loss": -36.06306457519531, "global_step": 53787, "epoch": 444} {"train_loss": -34.66843795776367, "global_step": 53788, "epoch": 444} {"train_loss": -35.0925178527832, "global_step": 53789, "epoch": 444} {"train_loss": -33.01079559326172, "global_step": 53790, "epoch": 444} {"train_loss": -33.43059539794922, "global_step": 53791, "epoch": 444} {"train_loss": -35.37534713745117, "global_step": 53792, "epoch": 444} {"train_loss": -34.878456115722656, "global_step": 53793, "epoch": 444} {"train_loss": -35.16181182861328, "global_step": 53794, "epoch": 444} {"train_loss": -33.905948638916016, "global_step": 53795, "epoch": 444} {"train_loss": -35.3291130065918, "global_step": 53796, "epoch": 444} {"train_loss": -33.975990295410156, "global_step": 53797, "epoch": 444} {"train_loss": -34.8601188659668, "global_step": 53798, "epoch": 444} {"train_loss": -34.95579528808594, "global_step": 53799, "epoch": 444} {"train_loss": -35.65683364868164, "global_step": 53800, "epoch": 444} {"train_loss": -34.78847122192383, "global_step": 53801, "epoch": 444} {"train_loss": -34.92840576171875, "global_step": 53802, "epoch": 444} {"train_loss": -34.064849853515625, "global_step": 53803, "epoch": 444} {"train_loss": -34.80451583862305, "global_step": 53804, "epoch": 444} {"train_loss": -34.736228942871094, "global_step": 53805, "epoch": 444} {"train_loss": -33.73922348022461, "global_step": 53806, "epoch": 444} {"train_loss": -34.37147903442383, "global_step": 53807, "epoch": 444} {"train_loss": -34.626625061035156, "global_step": 53808, "epoch": 444} {"train_loss": -32.88581085205078, "global_step": 53809, "epoch": 444} {"train_loss": -31.046842575073242, "global_step": 53810, "epoch": 444} {"train_loss": -28.834768295288086, "global_step": 53811, "epoch": 444} {"train_loss": -32.73560333251953, "global_step": 53812, "epoch": 444} {"train_loss": -33.69336700439453, "global_step": 53813, "epoch": 444} {"train_loss": -34.44667434692383, "global_step": 53814, "epoch": 444} {"train_loss": -32.42781448364258, "global_step": 53815, "epoch": 444} {"train_loss": -32.85163497924805, "global_step": 53816, "epoch": 444} {"train_loss": -34.396278381347656, "global_step": 53817, "epoch": 444} {"train_loss": -33.5670280456543, "global_step": 53818, "epoch": 444} {"train_loss": -33.53139114379883, "global_step": 53819, "epoch": 444} {"train_loss": -33.78536605834961, "global_step": 53820, "epoch": 444} {"train_loss": -34.690303802490234, "global_step": 53821, "epoch": 444} {"train_loss": -33.6171760559082, "global_step": 53822, "epoch": 444} {"train_loss": -34.787567138671875, "global_step": 53823, "epoch": 444} {"train_loss": -35.03740692138672, "global_step": 53824, "epoch": 444} {"train_loss": -34.0490608215332, "global_step": 53825, "epoch": 444} {"train_loss": -35.17932891845703, "global_step": 53826, "epoch": 444} {"train_loss": -34.04517364501953, "global_step": 53827, "epoch": 444} {"train_loss": -35.12528610229492, "global_step": 53828, "epoch": 444} {"train_loss": -35.205623626708984, "global_step": 53829, "epoch": 444} {"train_loss": -35.000457763671875, "global_step": 53830, "epoch": 444} {"train_loss": -34.94472122192383, "global_step": 53831, "epoch": 444} {"train_loss": -34.90264892578125, "global_step": 53832, "epoch": 444} {"train_loss": -35.184078216552734, "global_step": 53833, "epoch": 444} {"train_loss": -34.48615646362305, "global_step": 53834, "epoch": 444} {"train_loss": -35.81299591064453, "global_step": 53835, "epoch": 444} {"train_loss": -34.69259262084961, "global_step": 53836, "epoch": 444} {"train_loss": -35.33749008178711, "global_step": 53837, "epoch": 444} {"train_loss": -35.017250061035156, "global_step": 53838, "epoch": 444} {"train_loss": -35.689292907714844, "global_step": 53839, "epoch": 444} {"train_loss": -35.03214645385742, "global_step": 53840, "epoch": 444} {"train_loss": -35.31928634643555, "global_step": 53841, "epoch": 444} {"train_loss": -35.331783294677734, "global_step": 53842, "epoch": 444} {"train_loss": -34.87003707885742, "global_step": 53843, "epoch": 444} {"train_loss": -34.811991037416064, "global_step": 53844, "epoch": 444, "val_loss": 2595037.25} {"train_loss": -35.8475456237793, "global_step": 53845, "epoch": 445} {"train_loss": -35.70344543457031, "global_step": 53846, "epoch": 445} {"train_loss": -35.83698654174805, "global_step": 53847, "epoch": 445} {"train_loss": -35.8189811706543, "global_step": 53848, "epoch": 445} {"train_loss": -35.866886138916016, "global_step": 53849, "epoch": 445} {"train_loss": -35.67844009399414, "global_step": 53850, "epoch": 445} {"train_loss": -35.69207763671875, "global_step": 53851, "epoch": 445} {"train_loss": -36.35175704956055, "global_step": 53852, "epoch": 445} {"train_loss": -35.79159927368164, "global_step": 53853, "epoch": 445} {"train_loss": -35.61040115356445, "global_step": 53854, "epoch": 445} {"train_loss": -33.902828216552734, "global_step": 53855, "epoch": 445} {"train_loss": -30.456933975219727, "global_step": 53856, "epoch": 445} {"train_loss": -18.70745849609375, "global_step": 53857, "epoch": 445} {"train_loss": -15.357690811157227, "global_step": 53858, "epoch": 445} {"train_loss": -31.858428955078125, "global_step": 53859, "epoch": 445} {"train_loss": -31.440601348876953, "global_step": 53860, "epoch": 445} {"train_loss": -27.455780029296875, "global_step": 53861, "epoch": 445} {"train_loss": -33.12928009033203, "global_step": 53862, "epoch": 445} {"train_loss": -29.283985137939453, "global_step": 53863, "epoch": 445} {"train_loss": -33.88987350463867, "global_step": 53864, "epoch": 445} {"train_loss": -31.470991134643555, "global_step": 53865, "epoch": 445} {"train_loss": -33.852500915527344, "global_step": 53866, "epoch": 445} {"train_loss": -33.024959564208984, "global_step": 53867, "epoch": 445} {"train_loss": -33.09672164916992, "global_step": 53868, "epoch": 445} {"train_loss": -34.1574821472168, "global_step": 53869, "epoch": 445} {"train_loss": -34.35117721557617, "global_step": 53870, "epoch": 445} {"train_loss": -32.90896224975586, "global_step": 53871, "epoch": 445} {"train_loss": -34.81783676147461, "global_step": 53872, "epoch": 445} {"train_loss": -33.97016525268555, "global_step": 53873, "epoch": 445} {"train_loss": -34.545989990234375, "global_step": 53874, "epoch": 445} {"train_loss": -34.814857482910156, "global_step": 53875, "epoch": 445} {"train_loss": -34.87745666503906, "global_step": 53876, "epoch": 445} {"train_loss": -34.73359680175781, "global_step": 53877, "epoch": 445} {"train_loss": -35.08395767211914, "global_step": 53878, "epoch": 445} {"train_loss": -35.28176498413086, "global_step": 53879, "epoch": 445} {"train_loss": -35.18305206298828, "global_step": 53880, "epoch": 445} {"train_loss": -34.853816986083984, "global_step": 53881, "epoch": 445} {"train_loss": -35.09092330932617, "global_step": 53882, "epoch": 445} {"train_loss": -34.8789176940918, "global_step": 53883, "epoch": 445} {"train_loss": -35.01154327392578, "global_step": 53884, "epoch": 445} {"train_loss": -35.314353942871094, "global_step": 53885, "epoch": 445} {"train_loss": -35.70960235595703, "global_step": 53886, "epoch": 445} {"train_loss": -35.55506134033203, "global_step": 53887, "epoch": 445} {"train_loss": -35.76740646362305, "global_step": 53888, "epoch": 445} {"train_loss": -34.9248046875, "global_step": 53889, "epoch": 445} {"train_loss": -35.84382247924805, "global_step": 53890, "epoch": 445} {"train_loss": -35.6593132019043, "global_step": 53891, "epoch": 445} {"train_loss": -35.52637481689453, "global_step": 53892, "epoch": 445} {"train_loss": -35.74869918823242, "global_step": 53893, "epoch": 445} {"train_loss": -35.73958206176758, "global_step": 53894, "epoch": 445} {"train_loss": -35.723934173583984, "global_step": 53895, "epoch": 445} {"train_loss": -35.635005950927734, "global_step": 53896, "epoch": 445} {"train_loss": -35.59800720214844, "global_step": 53897, "epoch": 445} {"train_loss": -35.832340240478516, "global_step": 53898, "epoch": 445} {"train_loss": -36.01813888549805, "global_step": 53899, "epoch": 445} {"train_loss": -35.41461181640625, "global_step": 53900, "epoch": 445} {"train_loss": -35.48285675048828, "global_step": 53901, "epoch": 445} {"train_loss": -35.77909469604492, "global_step": 53902, "epoch": 445} {"train_loss": -36.13410186767578, "global_step": 53903, "epoch": 445} {"train_loss": -35.960811614990234, "global_step": 53904, "epoch": 445} {"train_loss": -35.554100036621094, "global_step": 53905, "epoch": 445} {"train_loss": -35.81960678100586, "global_step": 53906, "epoch": 445} {"train_loss": -35.84488296508789, "global_step": 53907, "epoch": 445} {"train_loss": -36.40366744995117, "global_step": 53908, "epoch": 445} {"train_loss": -35.84321212768555, "global_step": 53909, "epoch": 445} {"train_loss": -36.08890914916992, "global_step": 53910, "epoch": 445} {"train_loss": -35.4886360168457, "global_step": 53911, "epoch": 445} {"train_loss": -36.24093246459961, "global_step": 53912, "epoch": 445} {"train_loss": -36.46256637573242, "global_step": 53913, "epoch": 445} {"train_loss": -35.92838668823242, "global_step": 53914, "epoch": 445} {"train_loss": -35.69856643676758, "global_step": 53915, "epoch": 445} {"train_loss": -36.10483932495117, "global_step": 53916, "epoch": 445} {"train_loss": -35.52509307861328, "global_step": 53917, "epoch": 445} {"train_loss": -35.17735290527344, "global_step": 53918, "epoch": 445} {"train_loss": -35.639747619628906, "global_step": 53919, "epoch": 445} {"train_loss": -35.71270751953125, "global_step": 53920, "epoch": 445} {"train_loss": -35.94729232788086, "global_step": 53921, "epoch": 445} {"train_loss": -34.987892150878906, "global_step": 53922, "epoch": 445} {"train_loss": -34.110816955566406, "global_step": 53923, "epoch": 445} {"train_loss": -34.75509262084961, "global_step": 53924, "epoch": 445} {"train_loss": -36.19618225097656, "global_step": 53925, "epoch": 445} {"train_loss": -35.16935729980469, "global_step": 53926, "epoch": 445} {"train_loss": -34.262481689453125, "global_step": 53927, "epoch": 445} {"train_loss": -35.528114318847656, "global_step": 53928, "epoch": 445} {"train_loss": -36.05731964111328, "global_step": 53929, "epoch": 445} {"train_loss": -34.941810607910156, "global_step": 53930, "epoch": 445} {"train_loss": -35.22026443481445, "global_step": 53931, "epoch": 445} {"train_loss": -36.23336410522461, "global_step": 53932, "epoch": 445} {"train_loss": -35.29926681518555, "global_step": 53933, "epoch": 445} {"train_loss": -35.88344955444336, "global_step": 53934, "epoch": 445} {"train_loss": -35.39671325683594, "global_step": 53935, "epoch": 445} {"train_loss": -35.56885528564453, "global_step": 53936, "epoch": 445} {"train_loss": -36.0369758605957, "global_step": 53937, "epoch": 445} {"train_loss": -35.852012634277344, "global_step": 53938, "epoch": 445} {"train_loss": -35.697532653808594, "global_step": 53939, "epoch": 445} {"train_loss": -35.542110443115234, "global_step": 53940, "epoch": 445} {"train_loss": -35.8204345703125, "global_step": 53941, "epoch": 445} {"train_loss": -35.85282897949219, "global_step": 53942, "epoch": 445} {"train_loss": -35.49647903442383, "global_step": 53943, "epoch": 445} {"train_loss": -36.16831588745117, "global_step": 53944, "epoch": 445} {"train_loss": -35.702850341796875, "global_step": 53945, "epoch": 445} {"train_loss": -36.3980598449707, "global_step": 53946, "epoch": 445} {"train_loss": -35.83430099487305, "global_step": 53947, "epoch": 445} {"train_loss": -36.38888931274414, "global_step": 53948, "epoch": 445} {"train_loss": -35.468204498291016, "global_step": 53949, "epoch": 445} {"train_loss": -36.104740142822266, "global_step": 53950, "epoch": 445} {"train_loss": -35.611427307128906, "global_step": 53951, "epoch": 445} {"train_loss": -35.76026153564453, "global_step": 53952, "epoch": 445} {"train_loss": -35.4542350769043, "global_step": 53953, "epoch": 445} {"train_loss": -35.164466857910156, "global_step": 53954, "epoch": 445} {"train_loss": -35.16090774536133, "global_step": 53955, "epoch": 445} {"train_loss": -34.671424865722656, "global_step": 53956, "epoch": 445} {"train_loss": -34.36975860595703, "global_step": 53957, "epoch": 445} {"train_loss": -34.69411087036133, "global_step": 53958, "epoch": 445} {"train_loss": -32.92412185668945, "global_step": 53959, "epoch": 445} {"train_loss": -31.97173500061035, "global_step": 53960, "epoch": 445} {"train_loss": -33.82772445678711, "global_step": 53961, "epoch": 445} {"train_loss": -34.412986755371094, "global_step": 53962, "epoch": 445} {"train_loss": -35.65061950683594, "global_step": 53963, "epoch": 445} {"train_loss": -35.69565200805664, "global_step": 53964, "epoch": 445} {"train_loss": -34.73874352195046, "global_step": 53965, "epoch": 445, "val_loss": 2470687.25} {"train_loss": -34.32175827026367, "global_step": 53966, "epoch": 446} {"train_loss": -35.54863357543945, "global_step": 53967, "epoch": 446} {"train_loss": -34.68134689331055, "global_step": 53968, "epoch": 446} {"train_loss": -34.71125030517578, "global_step": 53969, "epoch": 446} {"train_loss": -35.9193000793457, "global_step": 53970, "epoch": 446} {"train_loss": -35.15351486206055, "global_step": 53971, "epoch": 446} {"train_loss": -35.82719039916992, "global_step": 53972, "epoch": 446} {"train_loss": -35.69094467163086, "global_step": 53973, "epoch": 446} {"train_loss": -35.21323013305664, "global_step": 53974, "epoch": 446} {"train_loss": -35.98842239379883, "global_step": 53975, "epoch": 446} {"train_loss": -35.73722839355469, "global_step": 53976, "epoch": 446} {"train_loss": -35.14656448364258, "global_step": 53977, "epoch": 446} {"train_loss": -36.179317474365234, "global_step": 53978, "epoch": 446} {"train_loss": -35.672607421875, "global_step": 53979, "epoch": 446} {"train_loss": -36.074398040771484, "global_step": 53980, "epoch": 446} {"train_loss": -35.569149017333984, "global_step": 53981, "epoch": 446} {"train_loss": -35.8759880065918, "global_step": 53982, "epoch": 446} {"train_loss": -35.55139923095703, "global_step": 53983, "epoch": 446} {"train_loss": -36.0028076171875, "global_step": 53984, "epoch": 446} {"train_loss": -35.99625778198242, "global_step": 53985, "epoch": 446} {"train_loss": -35.750709533691406, "global_step": 53986, "epoch": 446} {"train_loss": -36.121826171875, "global_step": 53987, "epoch": 446} {"train_loss": -36.17795944213867, "global_step": 53988, "epoch": 446} {"train_loss": -35.71670150756836, "global_step": 53989, "epoch": 446} {"train_loss": -36.359291076660156, "global_step": 53990, "epoch": 446} {"train_loss": -34.98671340942383, "global_step": 53991, "epoch": 446} {"train_loss": -35.70426559448242, "global_step": 53992, "epoch": 446} {"train_loss": -36.198787689208984, "global_step": 53993, "epoch": 446} {"train_loss": -36.0399055480957, "global_step": 53994, "epoch": 446} {"train_loss": -35.566314697265625, "global_step": 53995, "epoch": 446} {"train_loss": -36.22465896606445, "global_step": 53996, "epoch": 446} {"train_loss": -36.113243103027344, "global_step": 53997, "epoch": 446} {"train_loss": -35.89765548706055, "global_step": 53998, "epoch": 446} {"train_loss": -35.69369888305664, "global_step": 53999, "epoch": 446} {"train_loss": -35.97078323364258, "global_step": 54000, "epoch": 446} {"train_loss": -34.789974212646484, "global_step": 54001, "epoch": 446} {"train_loss": -35.738216400146484, "global_step": 54002, "epoch": 446} {"train_loss": -36.07081985473633, "global_step": 54003, "epoch": 446} {"train_loss": -35.837276458740234, "global_step": 54004, "epoch": 446} {"train_loss": -36.11205291748047, "global_step": 54005, "epoch": 446} {"train_loss": -35.66913604736328, "global_step": 54006, "epoch": 446} {"train_loss": -35.66588592529297, "global_step": 54007, "epoch": 446} {"train_loss": -35.83778762817383, "global_step": 54008, "epoch": 446} {"train_loss": -36.25895309448242, "global_step": 54009, "epoch": 446} {"train_loss": -36.10503387451172, "global_step": 54010, "epoch": 446} {"train_loss": -36.26578140258789, "global_step": 54011, "epoch": 446} {"train_loss": -36.139312744140625, "global_step": 54012, "epoch": 446} {"train_loss": -35.449066162109375, "global_step": 54013, "epoch": 446} {"train_loss": -36.46274948120117, "global_step": 54014, "epoch": 446} {"train_loss": -35.884769439697266, "global_step": 54015, "epoch": 446} {"train_loss": -35.53263473510742, "global_step": 54016, "epoch": 446} {"train_loss": -36.27693557739258, "global_step": 54017, "epoch": 446} {"train_loss": -35.922576904296875, "global_step": 54018, "epoch": 446} {"train_loss": -34.22444534301758, "global_step": 54019, "epoch": 446} {"train_loss": -35.64793395996094, "global_step": 54020, "epoch": 446} {"train_loss": -35.705726623535156, "global_step": 54021, "epoch": 446} {"train_loss": -35.18326187133789, "global_step": 54022, "epoch": 446} {"train_loss": -33.4061164855957, "global_step": 54023, "epoch": 446} {"train_loss": -33.241798400878906, "global_step": 54024, "epoch": 446} {"train_loss": -34.65776824951172, "global_step": 54025, "epoch": 446} {"train_loss": -33.9295768737793, "global_step": 54026, "epoch": 446} {"train_loss": -33.15531539916992, "global_step": 54027, "epoch": 446} {"train_loss": -33.0290641784668, "global_step": 54028, "epoch": 446} {"train_loss": -32.8835334777832, "global_step": 54029, "epoch": 446} {"train_loss": -35.1866569519043, "global_step": 54030, "epoch": 446} {"train_loss": -28.62721061706543, "global_step": 54031, "epoch": 446} {"train_loss": -27.557830810546875, "global_step": 54032, "epoch": 446} {"train_loss": -32.81770706176758, "global_step": 54033, "epoch": 446} {"train_loss": -29.88905143737793, "global_step": 54034, "epoch": 446} {"train_loss": -31.551422119140625, "global_step": 54035, "epoch": 446} {"train_loss": -35.14794921875, "global_step": 54036, "epoch": 446} {"train_loss": -32.33420944213867, "global_step": 54037, "epoch": 446} {"train_loss": -33.89204788208008, "global_step": 54038, "epoch": 446} {"train_loss": -35.58295822143555, "global_step": 54039, "epoch": 446} {"train_loss": -34.37412643432617, "global_step": 54040, "epoch": 446} {"train_loss": -34.9734001159668, "global_step": 54041, "epoch": 446} {"train_loss": -35.16189956665039, "global_step": 54042, "epoch": 446} {"train_loss": -34.597015380859375, "global_step": 54043, "epoch": 446} {"train_loss": -34.27838134765625, "global_step": 54044, "epoch": 446} {"train_loss": -35.693031311035156, "global_step": 54045, "epoch": 446} {"train_loss": -34.96537399291992, "global_step": 54046, "epoch": 446} {"train_loss": -34.810447692871094, "global_step": 54047, "epoch": 446} {"train_loss": -35.043663024902344, "global_step": 54048, "epoch": 446} {"train_loss": -35.388885498046875, "global_step": 54049, "epoch": 446} {"train_loss": -35.661598205566406, "global_step": 54050, "epoch": 446} {"train_loss": -35.53962707519531, "global_step": 54051, "epoch": 446} {"train_loss": -34.93656539916992, "global_step": 54052, "epoch": 446} {"train_loss": -35.82003402709961, "global_step": 54053, "epoch": 446} {"train_loss": -36.03113555908203, "global_step": 54054, "epoch": 446} {"train_loss": -35.69580841064453, "global_step": 54055, "epoch": 446} {"train_loss": -35.26140594482422, "global_step": 54056, "epoch": 446} {"train_loss": -35.728431701660156, "global_step": 54057, "epoch": 446} {"train_loss": -34.587154388427734, "global_step": 54058, "epoch": 446} {"train_loss": -35.61501693725586, "global_step": 54059, "epoch": 446} {"train_loss": -35.413631439208984, "global_step": 54060, "epoch": 446} {"train_loss": -35.33550262451172, "global_step": 54061, "epoch": 446} {"train_loss": -35.738380432128906, "global_step": 54062, "epoch": 446} {"train_loss": -35.3319206237793, "global_step": 54063, "epoch": 446} {"train_loss": -35.75094985961914, "global_step": 54064, "epoch": 446} {"train_loss": -35.17157745361328, "global_step": 54065, "epoch": 446} {"train_loss": -34.85105514526367, "global_step": 54066, "epoch": 446} {"train_loss": -35.51052474975586, "global_step": 54067, "epoch": 446} {"train_loss": -32.327117919921875, "global_step": 54068, "epoch": 446} {"train_loss": -35.452178955078125, "global_step": 54069, "epoch": 446} {"train_loss": -34.51852798461914, "global_step": 54070, "epoch": 446} {"train_loss": -27.310672760009766, "global_step": 54071, "epoch": 446} {"train_loss": -33.74457931518555, "global_step": 54072, "epoch": 446} {"train_loss": -32.53152847290039, "global_step": 54073, "epoch": 446} {"train_loss": -28.026519775390625, "global_step": 54074, "epoch": 446} {"train_loss": -30.429645538330078, "global_step": 54075, "epoch": 446} {"train_loss": -30.944883346557617, "global_step": 54076, "epoch": 446} {"train_loss": -28.6195068359375, "global_step": 54077, "epoch": 446} {"train_loss": -26.962635040283203, "global_step": 54078, "epoch": 446} {"train_loss": -29.36859703063965, "global_step": 54079, "epoch": 446} {"train_loss": -28.689260482788086, "global_step": 54080, "epoch": 446} {"train_loss": -29.55118179321289, "global_step": 54081, "epoch": 446} {"train_loss": -28.194772720336914, "global_step": 54082, "epoch": 446} {"train_loss": -31.923675537109375, "global_step": 54083, "epoch": 446} {"train_loss": -31.375757217407227, "global_step": 54084, "epoch": 446} {"train_loss": -32.8293571472168, "global_step": 54085, "epoch": 446} {"train_loss": -34.41389028691063, "global_step": 54086, "epoch": 446, "val_loss": 2727368.5} {"train_loss": -32.520172119140625, "global_step": 54087, "epoch": 447} {"train_loss": -32.20524978637695, "global_step": 54088, "epoch": 447} {"train_loss": -31.876434326171875, "global_step": 54089, "epoch": 447} {"train_loss": -32.929962158203125, "global_step": 54090, "epoch": 447} {"train_loss": -33.190853118896484, "global_step": 54091, "epoch": 447} {"train_loss": -32.05897903442383, "global_step": 54092, "epoch": 447} {"train_loss": -33.202430725097656, "global_step": 54093, "epoch": 447} {"train_loss": -32.922218322753906, "global_step": 54094, "epoch": 447} {"train_loss": -32.97890090942383, "global_step": 54095, "epoch": 447} {"train_loss": -32.37659454345703, "global_step": 54096, "epoch": 447} {"train_loss": -33.54399490356445, "global_step": 54097, "epoch": 447} {"train_loss": -33.51778030395508, "global_step": 54098, "epoch": 447} {"train_loss": -33.46455001831055, "global_step": 54099, "epoch": 447} {"train_loss": -33.42625045776367, "global_step": 54100, "epoch": 447} {"train_loss": -33.5597038269043, "global_step": 54101, "epoch": 447} {"train_loss": -34.00438690185547, "global_step": 54102, "epoch": 447} {"train_loss": -33.90031433105469, "global_step": 54103, "epoch": 447} {"train_loss": -33.06545639038086, "global_step": 54104, "epoch": 447} {"train_loss": -33.5513916015625, "global_step": 54105, "epoch": 447} {"train_loss": -33.872291564941406, "global_step": 54106, "epoch": 447} {"train_loss": -33.29752731323242, "global_step": 54107, "epoch": 447} {"train_loss": -34.31987762451172, "global_step": 54108, "epoch": 447} {"train_loss": -33.9734992980957, "global_step": 54109, "epoch": 447} {"train_loss": -34.23429870605469, "global_step": 54110, "epoch": 447} {"train_loss": -34.13856887817383, "global_step": 54111, "epoch": 447} {"train_loss": -34.081581115722656, "global_step": 54112, "epoch": 447} {"train_loss": -34.57990264892578, "global_step": 54113, "epoch": 447} {"train_loss": -34.43470001220703, "global_step": 54114, "epoch": 447} {"train_loss": -34.21810531616211, "global_step": 54115, "epoch": 447} {"train_loss": -34.494361877441406, "global_step": 54116, "epoch": 447} {"train_loss": -34.806976318359375, "global_step": 54117, "epoch": 447} {"train_loss": -35.205562591552734, "global_step": 54118, "epoch": 447} {"train_loss": -34.9217414855957, "global_step": 54119, "epoch": 447} {"train_loss": -34.663856506347656, "global_step": 54120, "epoch": 447} {"train_loss": -34.824424743652344, "global_step": 54121, "epoch": 447} {"train_loss": -35.1895637512207, "global_step": 54122, "epoch": 447} {"train_loss": -35.1042594909668, "global_step": 54123, "epoch": 447} {"train_loss": -35.390193939208984, "global_step": 54124, "epoch": 447} {"train_loss": -34.9569206237793, "global_step": 54125, "epoch": 447} {"train_loss": -35.52161407470703, "global_step": 54126, "epoch": 447} {"train_loss": -35.396663665771484, "global_step": 54127, "epoch": 447} {"train_loss": -35.180702209472656, "global_step": 54128, "epoch": 447} {"train_loss": -35.228790283203125, "global_step": 54129, "epoch": 447} {"train_loss": -35.23527145385742, "global_step": 54130, "epoch": 447} {"train_loss": -35.563758850097656, "global_step": 54131, "epoch": 447} {"train_loss": -35.60102081298828, "global_step": 54132, "epoch": 447} {"train_loss": -35.495967864990234, "global_step": 54133, "epoch": 447} {"train_loss": -35.48114013671875, "global_step": 54134, "epoch": 447} {"train_loss": -35.56597900390625, "global_step": 54135, "epoch": 447} {"train_loss": -35.64359664916992, "global_step": 54136, "epoch": 447} {"train_loss": -35.87056350708008, "global_step": 54137, "epoch": 447} {"train_loss": -35.71371078491211, "global_step": 54138, "epoch": 447} {"train_loss": -35.861083984375, "global_step": 54139, "epoch": 447} {"train_loss": -35.37351989746094, "global_step": 54140, "epoch": 447} {"train_loss": -35.72919845581055, "global_step": 54141, "epoch": 447} {"train_loss": -36.005550384521484, "global_step": 54142, "epoch": 447} {"train_loss": -35.25257110595703, "global_step": 54143, "epoch": 447} {"train_loss": -35.26418685913086, "global_step": 54144, "epoch": 447} {"train_loss": -35.72109603881836, "global_step": 54145, "epoch": 447} {"train_loss": -35.9304084777832, "global_step": 54146, "epoch": 447} {"train_loss": -35.51527786254883, "global_step": 54147, "epoch": 447} {"train_loss": -34.91947555541992, "global_step": 54148, "epoch": 447} {"train_loss": -35.53502655029297, "global_step": 54149, "epoch": 447} {"train_loss": -35.91367721557617, "global_step": 54150, "epoch": 447} {"train_loss": -35.609535217285156, "global_step": 54151, "epoch": 447} {"train_loss": -34.93083572387695, "global_step": 54152, "epoch": 447} {"train_loss": -33.13973617553711, "global_step": 54153, "epoch": 447} {"train_loss": -31.067731857299805, "global_step": 54154, "epoch": 447} {"train_loss": -35.98493194580078, "global_step": 54155, "epoch": 447} {"train_loss": -35.09181213378906, "global_step": 54156, "epoch": 447} {"train_loss": -34.6328010559082, "global_step": 54157, "epoch": 447} {"train_loss": -35.20920181274414, "global_step": 54158, "epoch": 447} {"train_loss": -35.46782302856445, "global_step": 54159, "epoch": 447} {"train_loss": -35.71552658081055, "global_step": 54160, "epoch": 447} {"train_loss": -35.98167037963867, "global_step": 54161, "epoch": 447} {"train_loss": -35.302146911621094, "global_step": 54162, "epoch": 447} {"train_loss": -35.44730758666992, "global_step": 54163, "epoch": 447} {"train_loss": -34.96758270263672, "global_step": 54164, "epoch": 447} {"train_loss": -36.49092483520508, "global_step": 54165, "epoch": 447} {"train_loss": -36.180294036865234, "global_step": 54166, "epoch": 447} {"train_loss": -35.85862350463867, "global_step": 54167, "epoch": 447} {"train_loss": -35.446285247802734, "global_step": 54168, "epoch": 447} {"train_loss": -36.01644515991211, "global_step": 54169, "epoch": 447} {"train_loss": -36.47551345825195, "global_step": 54170, "epoch": 447} {"train_loss": -36.509822845458984, "global_step": 54171, "epoch": 447} {"train_loss": -35.697505950927734, "global_step": 54172, "epoch": 447} {"train_loss": -35.20686340332031, "global_step": 54173, "epoch": 447} {"train_loss": -35.477203369140625, "global_step": 54174, "epoch": 447} {"train_loss": -35.78337860107422, "global_step": 54175, "epoch": 447} {"train_loss": -35.65198516845703, "global_step": 54176, "epoch": 447} {"train_loss": -35.48256301879883, "global_step": 54177, "epoch": 447} {"train_loss": -35.281864166259766, "global_step": 54178, "epoch": 447} {"train_loss": -34.491485595703125, "global_step": 54179, "epoch": 447} {"train_loss": -34.048919677734375, "global_step": 54180, "epoch": 447} {"train_loss": -34.79888916015625, "global_step": 54181, "epoch": 447} {"train_loss": -34.35308837890625, "global_step": 54182, "epoch": 447} {"train_loss": -32.47640609741211, "global_step": 54183, "epoch": 447} {"train_loss": -32.721099853515625, "global_step": 54184, "epoch": 447} {"train_loss": -34.6817512512207, "global_step": 54185, "epoch": 447} {"train_loss": -34.70315170288086, "global_step": 54186, "epoch": 447} {"train_loss": -34.964752197265625, "global_step": 54187, "epoch": 447} {"train_loss": -35.01493453979492, "global_step": 54188, "epoch": 447} {"train_loss": -34.996273040771484, "global_step": 54189, "epoch": 447} {"train_loss": -35.269832611083984, "global_step": 54190, "epoch": 447} {"train_loss": -35.80497360229492, "global_step": 54191, "epoch": 447} {"train_loss": -35.519527435302734, "global_step": 54192, "epoch": 447} {"train_loss": -34.20924758911133, "global_step": 54193, "epoch": 447} {"train_loss": -35.031410217285156, "global_step": 54194, "epoch": 447} {"train_loss": -35.287940979003906, "global_step": 54195, "epoch": 447} {"train_loss": -34.061397552490234, "global_step": 54196, "epoch": 447} {"train_loss": -35.14402770996094, "global_step": 54197, "epoch": 447} {"train_loss": -35.928096771240234, "global_step": 54198, "epoch": 447} {"train_loss": -33.74321365356445, "global_step": 54199, "epoch": 447} {"train_loss": -35.44790267944336, "global_step": 54200, "epoch": 447} {"train_loss": -35.97968673706055, "global_step": 54201, "epoch": 447} {"train_loss": -35.31647872924805, "global_step": 54202, "epoch": 447} {"train_loss": -34.7092399597168, "global_step": 54203, "epoch": 447} {"train_loss": -35.93681716918945, "global_step": 54204, "epoch": 447} {"train_loss": -35.14480209350586, "global_step": 54205, "epoch": 447} {"train_loss": -35.14861297607422, "global_step": 54206, "epoch": 447} {"train_loss": -34.7855705229704, "global_step": 54207, "epoch": 447, "val_loss": 2563864.75} {"train_loss": -35.28867721557617, "global_step": 54208, "epoch": 448} {"train_loss": -35.36656951904297, "global_step": 54209, "epoch": 448} {"train_loss": -36.31492233276367, "global_step": 54210, "epoch": 448} {"train_loss": -35.693668365478516, "global_step": 54211, "epoch": 448} {"train_loss": -36.03758239746094, "global_step": 54212, "epoch": 448} {"train_loss": -36.19240951538086, "global_step": 54213, "epoch": 448} {"train_loss": -36.185813903808594, "global_step": 54214, "epoch": 448} {"train_loss": -36.30373764038086, "global_step": 54215, "epoch": 448} {"train_loss": -35.915374755859375, "global_step": 54216, "epoch": 448} {"train_loss": -35.04594039916992, "global_step": 54217, "epoch": 448} {"train_loss": -36.36730194091797, "global_step": 54218, "epoch": 448} {"train_loss": -35.96003341674805, "global_step": 54219, "epoch": 448} {"train_loss": -36.012603759765625, "global_step": 54220, "epoch": 448} {"train_loss": -36.177268981933594, "global_step": 54221, "epoch": 448} {"train_loss": -36.54227066040039, "global_step": 54222, "epoch": 448} {"train_loss": -36.76009750366211, "global_step": 54223, "epoch": 448} {"train_loss": -36.2266845703125, "global_step": 54224, "epoch": 448} {"train_loss": -36.17423629760742, "global_step": 54225, "epoch": 448} {"train_loss": -36.539241790771484, "global_step": 54226, "epoch": 448} {"train_loss": -36.45288848876953, "global_step": 54227, "epoch": 448} {"train_loss": -35.898597717285156, "global_step": 54228, "epoch": 448} {"train_loss": -35.49276351928711, "global_step": 54229, "epoch": 448} {"train_loss": -35.525909423828125, "global_step": 54230, "epoch": 448} {"train_loss": -35.2957649230957, "global_step": 54231, "epoch": 448} {"train_loss": -34.23566818237305, "global_step": 54232, "epoch": 448} {"train_loss": -35.0729866027832, "global_step": 54233, "epoch": 448} {"train_loss": -34.98977279663086, "global_step": 54234, "epoch": 448} {"train_loss": -32.066654205322266, "global_step": 54235, "epoch": 448} {"train_loss": -30.24530601501465, "global_step": 54236, "epoch": 448} {"train_loss": -28.75254249572754, "global_step": 54237, "epoch": 448} {"train_loss": -24.393016815185547, "global_step": 54238, "epoch": 448} {"train_loss": -27.960311889648438, "global_step": 54239, "epoch": 448} {"train_loss": -35.0852165222168, "global_step": 54240, "epoch": 448} {"train_loss": -30.158740997314453, "global_step": 54241, "epoch": 448} {"train_loss": -32.23202133178711, "global_step": 54242, "epoch": 448} {"train_loss": -34.19221115112305, "global_step": 54243, "epoch": 448} {"train_loss": -32.724708557128906, "global_step": 54244, "epoch": 448} {"train_loss": -34.763301849365234, "global_step": 54245, "epoch": 448} {"train_loss": -33.88346481323242, "global_step": 54246, "epoch": 448} {"train_loss": -34.487335205078125, "global_step": 54247, "epoch": 448} {"train_loss": -33.44505310058594, "global_step": 54248, "epoch": 448} {"train_loss": -34.8961181640625, "global_step": 54249, "epoch": 448} {"train_loss": -34.11464309692383, "global_step": 54250, "epoch": 448} {"train_loss": -34.50698471069336, "global_step": 54251, "epoch": 448} {"train_loss": -35.14210891723633, "global_step": 54252, "epoch": 448} {"train_loss": -35.00483703613281, "global_step": 54253, "epoch": 448} {"train_loss": -35.055381774902344, "global_step": 54254, "epoch": 448} {"train_loss": -35.33204650878906, "global_step": 54255, "epoch": 448} {"train_loss": -34.46345520019531, "global_step": 54256, "epoch": 448} {"train_loss": -35.41151809692383, "global_step": 54257, "epoch": 448} {"train_loss": -35.11421585083008, "global_step": 54258, "epoch": 448} {"train_loss": -35.6440544128418, "global_step": 54259, "epoch": 448} {"train_loss": -34.77180099487305, "global_step": 54260, "epoch": 448} {"train_loss": -35.437557220458984, "global_step": 54261, "epoch": 448} {"train_loss": -35.43941116333008, "global_step": 54262, "epoch": 448} {"train_loss": -35.66327667236328, "global_step": 54263, "epoch": 448} {"train_loss": -35.64835739135742, "global_step": 54264, "epoch": 448} {"train_loss": -35.368377685546875, "global_step": 54265, "epoch": 448} {"train_loss": -35.27411651611328, "global_step": 54266, "epoch": 448} {"train_loss": -36.007572174072266, "global_step": 54267, "epoch": 448} {"train_loss": -35.82901382446289, "global_step": 54268, "epoch": 448} {"train_loss": -36.222076416015625, "global_step": 54269, "epoch": 448} {"train_loss": -36.005367279052734, "global_step": 54270, "epoch": 448} {"train_loss": -36.03818893432617, "global_step": 54271, "epoch": 448} {"train_loss": -36.10134506225586, "global_step": 54272, "epoch": 448} {"train_loss": -36.20792770385742, "global_step": 54273, "epoch": 448} {"train_loss": -36.06202697753906, "global_step": 54274, "epoch": 448} {"train_loss": -35.91218185424805, "global_step": 54275, "epoch": 448} {"train_loss": -35.965484619140625, "global_step": 54276, "epoch": 448} {"train_loss": -36.1276969909668, "global_step": 54277, "epoch": 448} {"train_loss": -36.06806182861328, "global_step": 54278, "epoch": 448} {"train_loss": -36.54877853393555, "global_step": 54279, "epoch": 448} {"train_loss": -36.325828552246094, "global_step": 54280, "epoch": 448} {"train_loss": -36.2929573059082, "global_step": 54281, "epoch": 448} {"train_loss": -36.231544494628906, "global_step": 54282, "epoch": 448} {"train_loss": -36.407527923583984, "global_step": 54283, "epoch": 448} {"train_loss": -36.62421798706055, "global_step": 54284, "epoch": 448} {"train_loss": -36.64065170288086, "global_step": 54285, "epoch": 448} {"train_loss": -36.205909729003906, "global_step": 54286, "epoch": 448} {"train_loss": -36.680397033691406, "global_step": 54287, "epoch": 448} {"train_loss": -36.1910514831543, "global_step": 54288, "epoch": 448} {"train_loss": -35.31657791137695, "global_step": 54289, "epoch": 448} {"train_loss": -33.87165451049805, "global_step": 54290, "epoch": 448} {"train_loss": -33.05460739135742, "global_step": 54291, "epoch": 448} {"train_loss": -33.24302673339844, "global_step": 54292, "epoch": 448} {"train_loss": -33.7142448425293, "global_step": 54293, "epoch": 448} {"train_loss": -34.20619583129883, "global_step": 54294, "epoch": 448} {"train_loss": -35.37973403930664, "global_step": 54295, "epoch": 448} {"train_loss": -35.5452766418457, "global_step": 54296, "epoch": 448} {"train_loss": -36.31239700317383, "global_step": 54297, "epoch": 448} {"train_loss": -36.408260345458984, "global_step": 54298, "epoch": 448} {"train_loss": -36.02486801147461, "global_step": 54299, "epoch": 448} {"train_loss": -36.29903030395508, "global_step": 54300, "epoch": 448} {"train_loss": -36.3442497253418, "global_step": 54301, "epoch": 448} {"train_loss": -35.86553955078125, "global_step": 54302, "epoch": 448} {"train_loss": -36.68947982788086, "global_step": 54303, "epoch": 448} {"train_loss": -36.51516342163086, "global_step": 54304, "epoch": 448} {"train_loss": -35.863861083984375, "global_step": 54305, "epoch": 448} {"train_loss": -36.52085494995117, "global_step": 54306, "epoch": 448} {"train_loss": -36.23063278198242, "global_step": 54307, "epoch": 448} {"train_loss": -36.39460372924805, "global_step": 54308, "epoch": 448} {"train_loss": -36.05710983276367, "global_step": 54309, "epoch": 448} {"train_loss": -35.66144561767578, "global_step": 54310, "epoch": 448} {"train_loss": -35.70445251464844, "global_step": 54311, "epoch": 448} {"train_loss": -34.91476058959961, "global_step": 54312, "epoch": 448} {"train_loss": -35.429298400878906, "global_step": 54313, "epoch": 448} {"train_loss": -36.54425048828125, "global_step": 54314, "epoch": 448} {"train_loss": -36.250118255615234, "global_step": 54315, "epoch": 448} {"train_loss": -35.61777114868164, "global_step": 54316, "epoch": 448} {"train_loss": -36.00189208984375, "global_step": 54317, "epoch": 448} {"train_loss": -36.26845932006836, "global_step": 54318, "epoch": 448} {"train_loss": -35.998043060302734, "global_step": 54319, "epoch": 448} {"train_loss": -36.598934173583984, "global_step": 54320, "epoch": 448} {"train_loss": -36.28601837158203, "global_step": 54321, "epoch": 448} {"train_loss": -36.470069885253906, "global_step": 54322, "epoch": 448} {"train_loss": -36.204856872558594, "global_step": 54323, "epoch": 448} {"train_loss": -36.13859939575195, "global_step": 54324, "epoch": 448} {"train_loss": -36.59980392456055, "global_step": 54325, "epoch": 448} {"train_loss": -35.851200103759766, "global_step": 54326, "epoch": 448} {"train_loss": -36.16124725341797, "global_step": 54327, "epoch": 448} {"train_loss": -35.30316489984181, "global_step": 54328, "epoch": 448, "val_loss": 2646104.0} {"train_loss": -33.78066635131836, "global_step": 54329, "epoch": 449} {"train_loss": -30.999963760375977, "global_step": 54330, "epoch": 449} {"train_loss": -36.288204193115234, "global_step": 54331, "epoch": 449} {"train_loss": -35.32236862182617, "global_step": 54332, "epoch": 449} {"train_loss": -33.275699615478516, "global_step": 54333, "epoch": 449} {"train_loss": -34.62593460083008, "global_step": 54334, "epoch": 449} {"train_loss": -34.759517669677734, "global_step": 54335, "epoch": 449} {"train_loss": -33.90122604370117, "global_step": 54336, "epoch": 449} {"train_loss": -32.8001823425293, "global_step": 54337, "epoch": 449} {"train_loss": -32.048370361328125, "global_step": 54338, "epoch": 449} {"train_loss": -32.53068161010742, "global_step": 54339, "epoch": 449} {"train_loss": -32.151222229003906, "global_step": 54340, "epoch": 449} {"train_loss": -32.428035736083984, "global_step": 54341, "epoch": 449} {"train_loss": -34.17116165161133, "global_step": 54342, "epoch": 449} {"train_loss": -34.50766372680664, "global_step": 54343, "epoch": 449} {"train_loss": -32.72097396850586, "global_step": 54344, "epoch": 449} {"train_loss": -31.109811782836914, "global_step": 54345, "epoch": 449} {"train_loss": -35.463809967041016, "global_step": 54346, "epoch": 449} {"train_loss": -33.91270446777344, "global_step": 54347, "epoch": 449} {"train_loss": -33.936988830566406, "global_step": 54348, "epoch": 449} {"train_loss": -35.29865264892578, "global_step": 54349, "epoch": 449} {"train_loss": -34.141902923583984, "global_step": 54350, "epoch": 449} {"train_loss": -35.81825637817383, "global_step": 54351, "epoch": 449} {"train_loss": -34.10718536376953, "global_step": 54352, "epoch": 449} {"train_loss": -33.53392028808594, "global_step": 54353, "epoch": 449} {"train_loss": -35.040462493896484, "global_step": 54354, "epoch": 449} {"train_loss": -34.70471954345703, "global_step": 54355, "epoch": 449} {"train_loss": -35.274288177490234, "global_step": 54356, "epoch": 449} {"train_loss": -35.02779006958008, "global_step": 54357, "epoch": 449} {"train_loss": -35.31889724731445, "global_step": 54358, "epoch": 449} {"train_loss": -32.539424896240234, "global_step": 54359, "epoch": 449} {"train_loss": -35.61210250854492, "global_step": 54360, "epoch": 449} {"train_loss": -35.34273147583008, "global_step": 54361, "epoch": 449} {"train_loss": -35.68119430541992, "global_step": 54362, "epoch": 449} {"train_loss": -34.940589904785156, "global_step": 54363, "epoch": 449} {"train_loss": -35.306365966796875, "global_step": 54364, "epoch": 449} {"train_loss": -35.24091720581055, "global_step": 54365, "epoch": 449} {"train_loss": -35.29207229614258, "global_step": 54366, "epoch": 449} {"train_loss": -35.37002944946289, "global_step": 54367, "epoch": 449} {"train_loss": -35.68180465698242, "global_step": 54368, "epoch": 449} {"train_loss": -35.323333740234375, "global_step": 54369, "epoch": 449} {"train_loss": -35.471458435058594, "global_step": 54370, "epoch": 449} {"train_loss": -35.07455825805664, "global_step": 54371, "epoch": 449} {"train_loss": -35.51565170288086, "global_step": 54372, "epoch": 449} {"train_loss": -35.27790069580078, "global_step": 54373, "epoch": 449} {"train_loss": -35.25776290893555, "global_step": 54374, "epoch": 449} {"train_loss": -35.607147216796875, "global_step": 54375, "epoch": 449} {"train_loss": -35.718936920166016, "global_step": 54376, "epoch": 449} {"train_loss": -35.56949234008789, "global_step": 54377, "epoch": 449} {"train_loss": -35.532203674316406, "global_step": 54378, "epoch": 449} {"train_loss": -35.69466018676758, "global_step": 54379, "epoch": 449} {"train_loss": -35.59965133666992, "global_step": 54380, "epoch": 449} {"train_loss": -35.96595001220703, "global_step": 54381, "epoch": 449} {"train_loss": -34.347816467285156, "global_step": 54382, "epoch": 449} {"train_loss": -35.707008361816406, "global_step": 54383, "epoch": 449} {"train_loss": -35.58579635620117, "global_step": 54384, "epoch": 449} {"train_loss": -35.61441421508789, "global_step": 54385, "epoch": 449} {"train_loss": -35.6358642578125, "global_step": 54386, "epoch": 449} {"train_loss": -36.18441390991211, "global_step": 54387, "epoch": 449} {"train_loss": -36.15483474731445, "global_step": 54388, "epoch": 449} {"train_loss": -35.52286148071289, "global_step": 54389, "epoch": 449} {"train_loss": -35.75844192504883, "global_step": 54390, "epoch": 449} {"train_loss": -36.02404022216797, "global_step": 54391, "epoch": 449} {"train_loss": -35.79276657104492, "global_step": 54392, "epoch": 449} {"train_loss": -35.41665267944336, "global_step": 54393, "epoch": 449} {"train_loss": -36.3803596496582, "global_step": 54394, "epoch": 449} {"train_loss": -35.65156555175781, "global_step": 54395, "epoch": 449} {"train_loss": -36.04324722290039, "global_step": 54396, "epoch": 449} {"train_loss": -36.2811164855957, "global_step": 54397, "epoch": 449} {"train_loss": -35.77614974975586, "global_step": 54398, "epoch": 449} {"train_loss": -36.28276443481445, "global_step": 54399, "epoch": 449} {"train_loss": -36.09766387939453, "global_step": 54400, "epoch": 449} {"train_loss": -36.20134353637695, "global_step": 54401, "epoch": 449} {"train_loss": -36.672401428222656, "global_step": 54402, "epoch": 449} {"train_loss": -36.13645935058594, "global_step": 54403, "epoch": 449} {"train_loss": -36.61473846435547, "global_step": 54404, "epoch": 449} {"train_loss": -35.90194320678711, "global_step": 54405, "epoch": 449} {"train_loss": -36.5645866394043, "global_step": 54406, "epoch": 449} {"train_loss": -36.7425651550293, "global_step": 54407, "epoch": 449} {"train_loss": -36.46804428100586, "global_step": 54408, "epoch": 449} {"train_loss": -36.381561279296875, "global_step": 54409, "epoch": 449} {"train_loss": -35.95820617675781, "global_step": 54410, "epoch": 449} {"train_loss": -36.498779296875, "global_step": 54411, "epoch": 449} {"train_loss": -35.9048957824707, "global_step": 54412, "epoch": 449} {"train_loss": -36.41620635986328, "global_step": 54413, "epoch": 449} {"train_loss": -35.97355651855469, "global_step": 54414, "epoch": 449} {"train_loss": -33.287227630615234, "global_step": 54415, "epoch": 449} {"train_loss": -35.7725830078125, "global_step": 54416, "epoch": 449} {"train_loss": -35.94387435913086, "global_step": 54417, "epoch": 449} {"train_loss": -35.6372184753418, "global_step": 54418, "epoch": 449} {"train_loss": -36.158843994140625, "global_step": 54419, "epoch": 449} {"train_loss": -35.76075744628906, "global_step": 54420, "epoch": 449} {"train_loss": -35.414974212646484, "global_step": 54421, "epoch": 449} {"train_loss": -35.4004020690918, "global_step": 54422, "epoch": 449} {"train_loss": -36.2823600769043, "global_step": 54423, "epoch": 449} {"train_loss": -36.16168975830078, "global_step": 54424, "epoch": 449} {"train_loss": -34.41054916381836, "global_step": 54425, "epoch": 449} {"train_loss": -34.24528121948242, "global_step": 54426, "epoch": 449} {"train_loss": -35.218196868896484, "global_step": 54427, "epoch": 449} {"train_loss": -34.92120361328125, "global_step": 54428, "epoch": 449} {"train_loss": -34.42131805419922, "global_step": 54429, "epoch": 449} {"train_loss": -33.613616943359375, "global_step": 54430, "epoch": 449} {"train_loss": -34.29867172241211, "global_step": 54431, "epoch": 449} {"train_loss": -35.69618606567383, "global_step": 54432, "epoch": 449} {"train_loss": -35.70540237426758, "global_step": 54433, "epoch": 449} {"train_loss": -35.63949203491211, "global_step": 54434, "epoch": 449} {"train_loss": -35.31725311279297, "global_step": 54435, "epoch": 449} {"train_loss": -35.45528030395508, "global_step": 54436, "epoch": 449} {"train_loss": -35.5413818359375, "global_step": 54437, "epoch": 449} {"train_loss": -35.98857498168945, "global_step": 54438, "epoch": 449} {"train_loss": -35.48000717163086, "global_step": 54439, "epoch": 449} {"train_loss": -35.55450439453125, "global_step": 54440, "epoch": 449} {"train_loss": -34.432472229003906, "global_step": 54441, "epoch": 449} {"train_loss": -36.050697326660156, "global_step": 54442, "epoch": 449} {"train_loss": -34.12112045288086, "global_step": 54443, "epoch": 449} {"train_loss": -35.4488410949707, "global_step": 54444, "epoch": 449} {"train_loss": -35.40293502807617, "global_step": 54445, "epoch": 449} {"train_loss": -35.9067497253418, "global_step": 54446, "epoch": 449} {"train_loss": -35.115596771240234, "global_step": 54447, "epoch": 449} {"train_loss": -33.37009811401367, "global_step": 54448, "epoch": 449} {"train_loss": -35.13269809060846, "global_step": 54449, "epoch": 449, "val_loss": 2671025.0} {"train_loss": -35.298011779785156, "global_step": 54450, "epoch": 450} {"train_loss": -35.266056060791016, "global_step": 54451, "epoch": 450} {"train_loss": -33.14080810546875, "global_step": 54452, "epoch": 450} {"train_loss": -34.983612060546875, "global_step": 54453, "epoch": 450} {"train_loss": -32.787899017333984, "global_step": 54454, "epoch": 450} {"train_loss": -34.26229476928711, "global_step": 54455, "epoch": 450} {"train_loss": -34.00211715698242, "global_step": 54456, "epoch": 450} {"train_loss": -33.506614685058594, "global_step": 54457, "epoch": 450} {"train_loss": -34.291847229003906, "global_step": 54458, "epoch": 450} {"train_loss": -34.218849182128906, "global_step": 54459, "epoch": 450} {"train_loss": -33.75077438354492, "global_step": 54460, "epoch": 450} {"train_loss": -34.6087646484375, "global_step": 54461, "epoch": 450} {"train_loss": -34.285430908203125, "global_step": 54462, "epoch": 450} {"train_loss": -33.07844924926758, "global_step": 54463, "epoch": 450} {"train_loss": -33.44511032104492, "global_step": 54464, "epoch": 450} {"train_loss": -33.323848724365234, "global_step": 54465, "epoch": 450} {"train_loss": -33.3714599609375, "global_step": 54466, "epoch": 450} {"train_loss": -34.184059143066406, "global_step": 54467, "epoch": 450} {"train_loss": -35.1960334777832, "global_step": 54468, "epoch": 450} {"train_loss": -33.33402633666992, "global_step": 54469, "epoch": 450} {"train_loss": -34.402488708496094, "global_step": 54470, "epoch": 450} {"train_loss": -30.159305572509766, "global_step": 54471, "epoch": 450} {"train_loss": -32.91794967651367, "global_step": 54472, "epoch": 450} {"train_loss": -34.3356819152832, "global_step": 54473, "epoch": 450} {"train_loss": -33.35874938964844, "global_step": 54474, "epoch": 450} {"train_loss": -34.37841033935547, "global_step": 54475, "epoch": 450} {"train_loss": -31.7714786529541, "global_step": 54476, "epoch": 450} {"train_loss": -34.514190673828125, "global_step": 54477, "epoch": 450} {"train_loss": -34.84368896484375, "global_step": 54478, "epoch": 450} {"train_loss": -33.70139694213867, "global_step": 54479, "epoch": 450} {"train_loss": -33.49339294433594, "global_step": 54480, "epoch": 450} {"train_loss": -32.49827575683594, "global_step": 54481, "epoch": 450} {"train_loss": -34.315242767333984, "global_step": 54482, "epoch": 450} {"train_loss": -34.12879943847656, "global_step": 54483, "epoch": 450} {"train_loss": -33.873817443847656, "global_step": 54484, "epoch": 450} {"train_loss": -33.32808303833008, "global_step": 54485, "epoch": 450} {"train_loss": -34.90018844604492, "global_step": 54486, "epoch": 450} {"train_loss": -34.65389633178711, "global_step": 54487, "epoch": 450} {"train_loss": -32.71322250366211, "global_step": 54488, "epoch": 450} {"train_loss": -34.39582061767578, "global_step": 54489, "epoch": 450} {"train_loss": -34.80070114135742, "global_step": 54490, "epoch": 450} {"train_loss": -34.497840881347656, "global_step": 54491, "epoch": 450} {"train_loss": -34.12009811401367, "global_step": 54492, "epoch": 450} {"train_loss": -34.9140739440918, "global_step": 54493, "epoch": 450} {"train_loss": -34.556884765625, "global_step": 54494, "epoch": 450} {"train_loss": -34.89493179321289, "global_step": 54495, "epoch": 450} {"train_loss": -34.7526969909668, "global_step": 54496, "epoch": 450} {"train_loss": -35.031044006347656, "global_step": 54497, "epoch": 450} {"train_loss": -34.66938400268555, "global_step": 54498, "epoch": 450} {"train_loss": -34.350791931152344, "global_step": 54499, "epoch": 450} {"train_loss": -34.35455322265625, "global_step": 54500, "epoch": 450} {"train_loss": -34.22749328613281, "global_step": 54501, "epoch": 450} {"train_loss": -34.655879974365234, "global_step": 54502, "epoch": 450} {"train_loss": -33.4005241394043, "global_step": 54503, "epoch": 450} {"train_loss": -34.964508056640625, "global_step": 54504, "epoch": 450} {"train_loss": -34.35232162475586, "global_step": 54505, "epoch": 450} {"train_loss": -35.13813400268555, "global_step": 54506, "epoch": 450} {"train_loss": -34.68135452270508, "global_step": 54507, "epoch": 450} {"train_loss": -34.989105224609375, "global_step": 54508, "epoch": 450} {"train_loss": -35.20393371582031, "global_step": 54509, "epoch": 450} {"train_loss": -34.66392135620117, "global_step": 54510, "epoch": 450} {"train_loss": -35.339595794677734, "global_step": 54511, "epoch": 450} {"train_loss": -34.752540588378906, "global_step": 54512, "epoch": 450} {"train_loss": -33.39821243286133, "global_step": 54513, "epoch": 450} {"train_loss": -33.30168914794922, "global_step": 54514, "epoch": 450} {"train_loss": -34.00856399536133, "global_step": 54515, "epoch": 450} {"train_loss": -35.061702728271484, "global_step": 54516, "epoch": 450} {"train_loss": -35.02510070800781, "global_step": 54517, "epoch": 450} {"train_loss": -34.408668518066406, "global_step": 54518, "epoch": 450} {"train_loss": -35.5607795715332, "global_step": 54519, "epoch": 450} {"train_loss": -35.36650085449219, "global_step": 54520, "epoch": 450} {"train_loss": -35.55754089355469, "global_step": 54521, "epoch": 450} {"train_loss": -35.02582931518555, "global_step": 54522, "epoch": 450} {"train_loss": -35.527587890625, "global_step": 54523, "epoch": 450} {"train_loss": -35.76184844970703, "global_step": 54524, "epoch": 450} {"train_loss": -35.10015106201172, "global_step": 54525, "epoch": 450} {"train_loss": -35.5921745300293, "global_step": 54526, "epoch": 450} {"train_loss": -35.508819580078125, "global_step": 54527, "epoch": 450} {"train_loss": -35.14691162109375, "global_step": 54528, "epoch": 450} {"train_loss": -34.51507568359375, "global_step": 54529, "epoch": 450} {"train_loss": -34.96437072753906, "global_step": 54530, "epoch": 450} {"train_loss": -34.832515716552734, "global_step": 54531, "epoch": 450} {"train_loss": -34.885868072509766, "global_step": 54532, "epoch": 450} {"train_loss": -35.86351013183594, "global_step": 54533, "epoch": 450} {"train_loss": -35.377593994140625, "global_step": 54534, "epoch": 450} {"train_loss": -34.76016616821289, "global_step": 54535, "epoch": 450} {"train_loss": -34.697017669677734, "global_step": 54536, "epoch": 450} {"train_loss": -35.50327682495117, "global_step": 54537, "epoch": 450} {"train_loss": -35.864261627197266, "global_step": 54538, "epoch": 450} {"train_loss": -35.784828186035156, "global_step": 54539, "epoch": 450} {"train_loss": -34.6017951965332, "global_step": 54540, "epoch": 450} {"train_loss": -32.168209075927734, "global_step": 54541, "epoch": 450} {"train_loss": -33.035186767578125, "global_step": 54542, "epoch": 450} {"train_loss": -34.10780334472656, "global_step": 54543, "epoch": 450} {"train_loss": -34.00934600830078, "global_step": 54544, "epoch": 450} {"train_loss": -34.40745162963867, "global_step": 54545, "epoch": 450} {"train_loss": -35.4741325378418, "global_step": 54546, "epoch": 450} {"train_loss": -35.22096252441406, "global_step": 54547, "epoch": 450} {"train_loss": -34.62081527709961, "global_step": 54548, "epoch": 450} {"train_loss": -34.58634567260742, "global_step": 54549, "epoch": 450} {"train_loss": -34.92570114135742, "global_step": 54550, "epoch": 450} {"train_loss": -33.054443359375, "global_step": 54551, "epoch": 450} {"train_loss": -34.08756637573242, "global_step": 54552, "epoch": 450} {"train_loss": -35.459495544433594, "global_step": 54553, "epoch": 450} {"train_loss": -35.183162689208984, "global_step": 54554, "epoch": 450} {"train_loss": -34.007205963134766, "global_step": 54555, "epoch": 450} {"train_loss": -34.23512649536133, "global_step": 54556, "epoch": 450} {"train_loss": -35.82333755493164, "global_step": 54557, "epoch": 450} {"train_loss": -34.46175003051758, "global_step": 54558, "epoch": 450} {"train_loss": -34.001949310302734, "global_step": 54559, "epoch": 450} {"train_loss": -35.78142547607422, "global_step": 54560, "epoch": 450} {"train_loss": -35.547515869140625, "global_step": 54561, "epoch": 450} {"train_loss": -33.98049545288086, "global_step": 54562, "epoch": 450} {"train_loss": -35.13558578491211, "global_step": 54563, "epoch": 450} {"train_loss": -34.8828239440918, "global_step": 54564, "epoch": 450} {"train_loss": -34.695552825927734, "global_step": 54565, "epoch": 450} {"train_loss": -34.4462890625, "global_step": 54566, "epoch": 450} {"train_loss": -33.596473693847656, "global_step": 54567, "epoch": 450} {"train_loss": -34.23674011230469, "global_step": 54568, "epoch": 450} {"train_loss": -35.639400482177734, "global_step": 54569, "epoch": 450} {"train_loss": -34.429159006796596, "global_step": 54570, "epoch": 450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 0.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 2809476.25} {"train_loss": -34.00394821166992, "global_step": 54571, "epoch": 451} {"train_loss": -34.97793197631836, "global_step": 54572, "epoch": 451} {"train_loss": -33.93172836303711, "global_step": 54573, "epoch": 451} {"train_loss": -32.566017150878906, "global_step": 54574, "epoch": 451} {"train_loss": -34.5779914855957, "global_step": 54575, "epoch": 451} {"train_loss": -33.127593994140625, "global_step": 54576, "epoch": 451} {"train_loss": -34.86228561401367, "global_step": 54577, "epoch": 451} {"train_loss": -33.492855072021484, "global_step": 54578, "epoch": 451} {"train_loss": -33.653724670410156, "global_step": 54579, "epoch": 451} {"train_loss": -34.42544937133789, "global_step": 54580, "epoch": 451} {"train_loss": -34.37006378173828, "global_step": 54581, "epoch": 451} {"train_loss": -33.01889419555664, "global_step": 54582, "epoch": 451} {"train_loss": -34.75991439819336, "global_step": 54583, "epoch": 451} {"train_loss": -34.4759635925293, "global_step": 54584, "epoch": 451} {"train_loss": -31.196502685546875, "global_step": 54585, "epoch": 451} {"train_loss": -32.715301513671875, "global_step": 54586, "epoch": 451} {"train_loss": -32.842262268066406, "global_step": 54587, "epoch": 451} {"train_loss": -32.25846862792969, "global_step": 54588, "epoch": 451} {"train_loss": -33.48837661743164, "global_step": 54589, "epoch": 451} {"train_loss": -33.386043548583984, "global_step": 54590, "epoch": 451} {"train_loss": -34.3646125793457, "global_step": 54591, "epoch": 451} {"train_loss": -32.354549407958984, "global_step": 54592, "epoch": 451} {"train_loss": -33.729461669921875, "global_step": 54593, "epoch": 451} {"train_loss": -33.853607177734375, "global_step": 54594, "epoch": 451} {"train_loss": -33.24580001831055, "global_step": 54595, "epoch": 451} {"train_loss": -34.61934280395508, "global_step": 54596, "epoch": 451} {"train_loss": -35.45113754272461, "global_step": 54597, "epoch": 451} {"train_loss": -33.81919479370117, "global_step": 54598, "epoch": 451} {"train_loss": -34.18430709838867, "global_step": 54599, "epoch": 451} {"train_loss": -34.87691879272461, "global_step": 54600, "epoch": 451} {"train_loss": -34.87089920043945, "global_step": 54601, "epoch": 451} {"train_loss": -35.39790725708008, "global_step": 54602, "epoch": 451} {"train_loss": -35.11008834838867, "global_step": 54603, "epoch": 451} {"train_loss": -34.19591522216797, "global_step": 54604, "epoch": 451} {"train_loss": -34.04514694213867, "global_step": 54605, "epoch": 451} {"train_loss": -34.988826751708984, "global_step": 54606, "epoch": 451} {"train_loss": -34.91393280029297, "global_step": 54607, "epoch": 451} {"train_loss": -34.6537971496582, "global_step": 54608, "epoch": 451} {"train_loss": -34.485443115234375, "global_step": 54609, "epoch": 451} {"train_loss": -34.870731353759766, "global_step": 54610, "epoch": 451} {"train_loss": -35.0321159362793, "global_step": 54611, "epoch": 451} {"train_loss": -34.23516845703125, "global_step": 54612, "epoch": 451} {"train_loss": -34.48075485229492, "global_step": 54613, "epoch": 451} {"train_loss": -35.213558197021484, "global_step": 54614, "epoch": 451} {"train_loss": -34.26401901245117, "global_step": 54615, "epoch": 451} {"train_loss": -35.084251403808594, "global_step": 54616, "epoch": 451} {"train_loss": -35.60647201538086, "global_step": 54617, "epoch": 451} {"train_loss": -34.76912307739258, "global_step": 54618, "epoch": 451} {"train_loss": -35.28207015991211, "global_step": 54619, "epoch": 451} {"train_loss": -34.79026412963867, "global_step": 54620, "epoch": 451} {"train_loss": -36.04410934448242, "global_step": 54621, "epoch": 451} {"train_loss": -35.15066146850586, "global_step": 54622, "epoch": 451} {"train_loss": -35.14286422729492, "global_step": 54623, "epoch": 451} {"train_loss": -34.66261672973633, "global_step": 54624, "epoch": 451} {"train_loss": -35.376888275146484, "global_step": 54625, "epoch": 451} {"train_loss": -34.98550796508789, "global_step": 54626, "epoch": 451} {"train_loss": -35.504554748535156, "global_step": 54627, "epoch": 451} {"train_loss": -35.57179641723633, "global_step": 54628, "epoch": 451} {"train_loss": -35.22660446166992, "global_step": 54629, "epoch": 451} {"train_loss": -35.2867317199707, "global_step": 54630, "epoch": 451} {"train_loss": -35.457393646240234, "global_step": 54631, "epoch": 451} {"train_loss": -35.39630889892578, "global_step": 54632, "epoch": 451} {"train_loss": -34.78057861328125, "global_step": 54633, "epoch": 451} {"train_loss": -34.4126091003418, "global_step": 54634, "epoch": 451} {"train_loss": -34.51759719848633, "global_step": 54635, "epoch": 451} {"train_loss": -35.446041107177734, "global_step": 54636, "epoch": 451} {"train_loss": -35.7540168762207, "global_step": 54637, "epoch": 451} {"train_loss": -34.4593620300293, "global_step": 54638, "epoch": 451} {"train_loss": -34.66843795776367, "global_step": 54639, "epoch": 451} {"train_loss": -34.61379623413086, "global_step": 54640, "epoch": 451} {"train_loss": -33.3016242980957, "global_step": 54641, "epoch": 451} {"train_loss": -33.4042854309082, "global_step": 54642, "epoch": 451} {"train_loss": -33.0411491394043, "global_step": 54643, "epoch": 451} {"train_loss": -34.60093688964844, "global_step": 54644, "epoch": 451} {"train_loss": -34.96201705932617, "global_step": 54645, "epoch": 451} {"train_loss": -34.413543701171875, "global_step": 54646, "epoch": 451} {"train_loss": -34.75455093383789, "global_step": 54647, "epoch": 451} {"train_loss": -35.18783187866211, "global_step": 54648, "epoch": 451} {"train_loss": -34.578651428222656, "global_step": 54649, "epoch": 451} {"train_loss": -34.9493408203125, "global_step": 54650, "epoch": 451} {"train_loss": -34.83380889892578, "global_step": 54651, "epoch": 451} {"train_loss": -33.81322479248047, "global_step": 54652, "epoch": 451} {"train_loss": -34.82426071166992, "global_step": 54653, "epoch": 451} {"train_loss": -34.404197692871094, "global_step": 54654, "epoch": 451} {"train_loss": -34.70747756958008, "global_step": 54655, "epoch": 451} {"train_loss": -34.18537521362305, "global_step": 54656, "epoch": 451} {"train_loss": -34.87397003173828, "global_step": 54657, "epoch": 451} {"train_loss": -35.526119232177734, "global_step": 54658, "epoch": 451} {"train_loss": -34.7786979675293, "global_step": 54659, "epoch": 451} {"train_loss": -34.97846603393555, "global_step": 54660, "epoch": 451} {"train_loss": -34.99776077270508, "global_step": 54661, "epoch": 451} {"train_loss": -35.509822845458984, "global_step": 54662, "epoch": 451} {"train_loss": -35.544921875, "global_step": 54663, "epoch": 451} {"train_loss": -35.0450553894043, "global_step": 54664, "epoch": 451} {"train_loss": -34.86655807495117, "global_step": 54665, "epoch": 451} {"train_loss": -35.74626541137695, "global_step": 54666, "epoch": 451} {"train_loss": -32.97359085083008, "global_step": 54667, "epoch": 451} {"train_loss": -31.404560089111328, "global_step": 54668, "epoch": 451} {"train_loss": -28.611536026000977, "global_step": 54669, "epoch": 451} {"train_loss": -26.590299606323242, "global_step": 54670, "epoch": 451} {"train_loss": -34.28987503051758, "global_step": 54671, "epoch": 451} {"train_loss": -34.737178802490234, "global_step": 54672, "epoch": 451} {"train_loss": -31.713485717773438, "global_step": 54673, "epoch": 451} {"train_loss": -34.08061599731445, "global_step": 54674, "epoch": 451} {"train_loss": -34.544921875, "global_step": 54675, "epoch": 451} {"train_loss": -33.12346649169922, "global_step": 54676, "epoch": 451} {"train_loss": -34.4300422668457, "global_step": 54677, "epoch": 451} {"train_loss": -34.692474365234375, "global_step": 54678, "epoch": 451} {"train_loss": -34.7666130065918, "global_step": 54679, "epoch": 451} {"train_loss": -34.67736053466797, "global_step": 54680, "epoch": 451} {"train_loss": -35.1132698059082, "global_step": 54681, "epoch": 451} {"train_loss": -34.904293060302734, "global_step": 54682, "epoch": 451} {"train_loss": -34.330299377441406, "global_step": 54683, "epoch": 451} {"train_loss": -34.48237991333008, "global_step": 54684, "epoch": 451} {"train_loss": -34.79946517944336, "global_step": 54685, "epoch": 451} {"train_loss": -33.80110549926758, "global_step": 54686, "epoch": 451} {"train_loss": -34.72245407104492, "global_step": 54687, "epoch": 451} {"train_loss": -35.75020217895508, "global_step": 54688, "epoch": 451} {"train_loss": -35.227394104003906, "global_step": 54689, "epoch": 451} {"train_loss": -34.94633102416992, "global_step": 54690, "epoch": 451} {"train_loss": -34.35632538598431, "global_step": 54691, "epoch": 451, "val_loss": 2478923.0} {"train_loss": -35.229244232177734, "global_step": 54692, "epoch": 452} {"train_loss": -35.87368392944336, "global_step": 54693, "epoch": 452} {"train_loss": -36.09830856323242, "global_step": 54694, "epoch": 452} {"train_loss": -35.7077751159668, "global_step": 54695, "epoch": 452} {"train_loss": -35.72844314575195, "global_step": 54696, "epoch": 452} {"train_loss": -35.682674407958984, "global_step": 54697, "epoch": 452} {"train_loss": -36.017066955566406, "global_step": 54698, "epoch": 452} {"train_loss": -36.27093505859375, "global_step": 54699, "epoch": 452} {"train_loss": -34.2816276550293, "global_step": 54700, "epoch": 452} {"train_loss": -35.856483459472656, "global_step": 54701, "epoch": 452} {"train_loss": -35.72623825073242, "global_step": 54702, "epoch": 452} {"train_loss": -36.557861328125, "global_step": 54703, "epoch": 452} {"train_loss": -35.746456146240234, "global_step": 54704, "epoch": 452} {"train_loss": -35.954933166503906, "global_step": 54705, "epoch": 452} {"train_loss": -36.00663375854492, "global_step": 54706, "epoch": 452} {"train_loss": -35.690696716308594, "global_step": 54707, "epoch": 452} {"train_loss": -36.0491828918457, "global_step": 54708, "epoch": 452} {"train_loss": -36.337745666503906, "global_step": 54709, "epoch": 452} {"train_loss": -36.27125930786133, "global_step": 54710, "epoch": 452} {"train_loss": -36.168521881103516, "global_step": 54711, "epoch": 452} {"train_loss": -36.58013916015625, "global_step": 54712, "epoch": 452} {"train_loss": -35.906185150146484, "global_step": 54713, "epoch": 452} {"train_loss": -35.952064514160156, "global_step": 54714, "epoch": 452} {"train_loss": -34.8920783996582, "global_step": 54715, "epoch": 452} {"train_loss": -33.25409698486328, "global_step": 54716, "epoch": 452} {"train_loss": -34.30595397949219, "global_step": 54717, "epoch": 452} {"train_loss": -34.97719955444336, "global_step": 54718, "epoch": 452} {"train_loss": -35.09632110595703, "global_step": 54719, "epoch": 452} {"train_loss": -32.29094696044922, "global_step": 54720, "epoch": 452} {"train_loss": -35.093658447265625, "global_step": 54721, "epoch": 452} {"train_loss": -31.5601749420166, "global_step": 54722, "epoch": 452} {"train_loss": -32.936954498291016, "global_step": 54723, "epoch": 452} {"train_loss": -33.702613830566406, "global_step": 54724, "epoch": 452} {"train_loss": -35.784847259521484, "global_step": 54725, "epoch": 452} {"train_loss": -32.640625, "global_step": 54726, "epoch": 452} {"train_loss": -34.23701858520508, "global_step": 54727, "epoch": 452} {"train_loss": -33.99673080444336, "global_step": 54728, "epoch": 452} {"train_loss": -33.91022872924805, "global_step": 54729, "epoch": 452} {"train_loss": -34.38934326171875, "global_step": 54730, "epoch": 452} {"train_loss": -36.335594177246094, "global_step": 54731, "epoch": 452} {"train_loss": -34.46479034423828, "global_step": 54732, "epoch": 452} {"train_loss": -34.30189895629883, "global_step": 54733, "epoch": 452} {"train_loss": -35.56879425048828, "global_step": 54734, "epoch": 452} {"train_loss": -34.851112365722656, "global_step": 54735, "epoch": 452} {"train_loss": -35.074462890625, "global_step": 54736, "epoch": 452} {"train_loss": -36.39127731323242, "global_step": 54737, "epoch": 452} {"train_loss": -35.114776611328125, "global_step": 54738, "epoch": 452} {"train_loss": -36.05170822143555, "global_step": 54739, "epoch": 452} {"train_loss": -35.56757354736328, "global_step": 54740, "epoch": 452} {"train_loss": -35.9149055480957, "global_step": 54741, "epoch": 452} {"train_loss": -36.629112243652344, "global_step": 54742, "epoch": 452} {"train_loss": -35.81821823120117, "global_step": 54743, "epoch": 452} {"train_loss": -35.6327018737793, "global_step": 54744, "epoch": 452} {"train_loss": -36.539833068847656, "global_step": 54745, "epoch": 452} {"train_loss": -35.370361328125, "global_step": 54746, "epoch": 452} {"train_loss": -36.432796478271484, "global_step": 54747, "epoch": 452} {"train_loss": -36.561279296875, "global_step": 54748, "epoch": 452} {"train_loss": -36.041168212890625, "global_step": 54749, "epoch": 452} {"train_loss": -36.56926345825195, "global_step": 54750, "epoch": 452} {"train_loss": -36.2171516418457, "global_step": 54751, "epoch": 452} {"train_loss": -36.04710006713867, "global_step": 54752, "epoch": 452} {"train_loss": -36.41669845581055, "global_step": 54753, "epoch": 452} {"train_loss": -36.85184860229492, "global_step": 54754, "epoch": 452} {"train_loss": -36.09223175048828, "global_step": 54755, "epoch": 452} {"train_loss": -35.92501449584961, "global_step": 54756, "epoch": 452} {"train_loss": -36.520111083984375, "global_step": 54757, "epoch": 452} {"train_loss": -35.608314514160156, "global_step": 54758, "epoch": 452} {"train_loss": -36.13017654418945, "global_step": 54759, "epoch": 452} {"train_loss": -36.443214416503906, "global_step": 54760, "epoch": 452} {"train_loss": -35.356815338134766, "global_step": 54761, "epoch": 452} {"train_loss": -35.081783294677734, "global_step": 54762, "epoch": 452} {"train_loss": -35.658111572265625, "global_step": 54763, "epoch": 452} {"train_loss": -33.81589126586914, "global_step": 54764, "epoch": 452} {"train_loss": -35.335933685302734, "global_step": 54765, "epoch": 452} {"train_loss": -34.665340423583984, "global_step": 54766, "epoch": 452} {"train_loss": -35.83928298950195, "global_step": 54767, "epoch": 452} {"train_loss": -36.23823547363281, "global_step": 54768, "epoch": 452} {"train_loss": -35.77519607543945, "global_step": 54769, "epoch": 452} {"train_loss": -36.599952697753906, "global_step": 54770, "epoch": 452} {"train_loss": -35.91981506347656, "global_step": 54771, "epoch": 452} {"train_loss": -36.714935302734375, "global_step": 54772, "epoch": 452} {"train_loss": -35.83893585205078, "global_step": 54773, "epoch": 452} {"train_loss": -36.09566879272461, "global_step": 54774, "epoch": 452} {"train_loss": -35.96357345581055, "global_step": 54775, "epoch": 452} {"train_loss": -35.098201751708984, "global_step": 54776, "epoch": 452} {"train_loss": -35.33549499511719, "global_step": 54777, "epoch": 452} {"train_loss": -35.15793991088867, "global_step": 54778, "epoch": 452} {"train_loss": -34.43159103393555, "global_step": 54779, "epoch": 452} {"train_loss": -35.325042724609375, "global_step": 54780, "epoch": 452} {"train_loss": -35.844757080078125, "global_step": 54781, "epoch": 452} {"train_loss": -35.58280563354492, "global_step": 54782, "epoch": 452} {"train_loss": -35.791324615478516, "global_step": 54783, "epoch": 452} {"train_loss": -33.69697189331055, "global_step": 54784, "epoch": 452} {"train_loss": -35.13608932495117, "global_step": 54785, "epoch": 452} {"train_loss": -32.43252182006836, "global_step": 54786, "epoch": 452} {"train_loss": -34.0760612487793, "global_step": 54787, "epoch": 452} {"train_loss": -35.58597946166992, "global_step": 54788, "epoch": 452} {"train_loss": -35.06327438354492, "global_step": 54789, "epoch": 452} {"train_loss": -35.06052017211914, "global_step": 54790, "epoch": 452} {"train_loss": -34.555904388427734, "global_step": 54791, "epoch": 452} {"train_loss": -35.051513671875, "global_step": 54792, "epoch": 452} {"train_loss": -34.97591781616211, "global_step": 54793, "epoch": 452} {"train_loss": -35.257598876953125, "global_step": 54794, "epoch": 452} {"train_loss": -34.305824279785156, "global_step": 54795, "epoch": 452} {"train_loss": -34.12154006958008, "global_step": 54796, "epoch": 452} {"train_loss": -32.013187408447266, "global_step": 54797, "epoch": 452} {"train_loss": -31.623336791992188, "global_step": 54798, "epoch": 452} {"train_loss": -33.62877655029297, "global_step": 54799, "epoch": 452} {"train_loss": -32.88869857788086, "global_step": 54800, "epoch": 452} {"train_loss": -35.15174865722656, "global_step": 54801, "epoch": 452} {"train_loss": -33.3148078918457, "global_step": 54802, "epoch": 452} {"train_loss": -33.06598663330078, "global_step": 54803, "epoch": 452} {"train_loss": -33.15324401855469, "global_step": 54804, "epoch": 452} {"train_loss": -33.875160217285156, "global_step": 54805, "epoch": 452} {"train_loss": -33.68531036376953, "global_step": 54806, "epoch": 452} {"train_loss": -33.815948486328125, "global_step": 54807, "epoch": 452} {"train_loss": -34.41139221191406, "global_step": 54808, "epoch": 452} {"train_loss": -34.363948822021484, "global_step": 54809, "epoch": 452} {"train_loss": -34.74593734741211, "global_step": 54810, "epoch": 452} {"train_loss": -35.0062255859375, "global_step": 54811, "epoch": 452} {"train_loss": -35.136818294682776, "global_step": 54812, "epoch": 452, "val_loss": 2495897.5} {"train_loss": -35.43408966064453, "global_step": 54813, "epoch": 453} {"train_loss": -35.40924835205078, "global_step": 54814, "epoch": 453} {"train_loss": -35.43702697753906, "global_step": 54815, "epoch": 453} {"train_loss": -35.5359001159668, "global_step": 54816, "epoch": 453} {"train_loss": -35.220516204833984, "global_step": 54817, "epoch": 453} {"train_loss": -34.89753341674805, "global_step": 54818, "epoch": 453} {"train_loss": -35.10157012939453, "global_step": 54819, "epoch": 453} {"train_loss": -35.02553176879883, "global_step": 54820, "epoch": 453} {"train_loss": -35.795005798339844, "global_step": 54821, "epoch": 453} {"train_loss": -35.777156829833984, "global_step": 54822, "epoch": 453} {"train_loss": -35.87900924682617, "global_step": 54823, "epoch": 453} {"train_loss": -35.44452667236328, "global_step": 54824, "epoch": 453} {"train_loss": -35.660579681396484, "global_step": 54825, "epoch": 453} {"train_loss": -35.496273040771484, "global_step": 54826, "epoch": 453} {"train_loss": -35.606136322021484, "global_step": 54827, "epoch": 453} {"train_loss": -35.88734436035156, "global_step": 54828, "epoch": 453} {"train_loss": -36.00422286987305, "global_step": 54829, "epoch": 453} {"train_loss": -36.189300537109375, "global_step": 54830, "epoch": 453} {"train_loss": -35.921566009521484, "global_step": 54831, "epoch": 453} {"train_loss": -36.200443267822266, "global_step": 54832, "epoch": 453} {"train_loss": -35.368255615234375, "global_step": 54833, "epoch": 453} {"train_loss": -36.15684127807617, "global_step": 54834, "epoch": 453} {"train_loss": -36.117408752441406, "global_step": 54835, "epoch": 453} {"train_loss": -36.009769439697266, "global_step": 54836, "epoch": 453} {"train_loss": -36.11375045776367, "global_step": 54837, "epoch": 453} {"train_loss": -36.615447998046875, "global_step": 54838, "epoch": 453} {"train_loss": -36.3387565612793, "global_step": 54839, "epoch": 453} {"train_loss": -36.39449691772461, "global_step": 54840, "epoch": 453} {"train_loss": -36.23390197753906, "global_step": 54841, "epoch": 453} {"train_loss": -36.0407829284668, "global_step": 54842, "epoch": 453} {"train_loss": -35.990211486816406, "global_step": 54843, "epoch": 453} {"train_loss": -36.44154357910156, "global_step": 54844, "epoch": 453} {"train_loss": -36.6746711730957, "global_step": 54845, "epoch": 453} {"train_loss": -36.50349807739258, "global_step": 54846, "epoch": 453} {"train_loss": -36.75813674926758, "global_step": 54847, "epoch": 453} {"train_loss": -36.217010498046875, "global_step": 54848, "epoch": 453} {"train_loss": -35.65060806274414, "global_step": 54849, "epoch": 453} {"train_loss": -35.36970901489258, "global_step": 54850, "epoch": 453} {"train_loss": -35.97324752807617, "global_step": 54851, "epoch": 453} {"train_loss": -35.05801010131836, "global_step": 54852, "epoch": 453} {"train_loss": -35.21371078491211, "global_step": 54853, "epoch": 453} {"train_loss": -35.45263671875, "global_step": 54854, "epoch": 453} {"train_loss": -35.89619827270508, "global_step": 54855, "epoch": 453} {"train_loss": -35.07759475708008, "global_step": 54856, "epoch": 453} {"train_loss": -33.71991729736328, "global_step": 54857, "epoch": 453} {"train_loss": -31.78223991394043, "global_step": 54858, "epoch": 453} {"train_loss": -27.224218368530273, "global_step": 54859, "epoch": 453} {"train_loss": -21.582782745361328, "global_step": 54860, "epoch": 453} {"train_loss": -25.12137794494629, "global_step": 54861, "epoch": 453} {"train_loss": -33.3245735168457, "global_step": 54862, "epoch": 453} {"train_loss": -28.389392852783203, "global_step": 54863, "epoch": 453} {"train_loss": -35.890899658203125, "global_step": 54864, "epoch": 453} {"train_loss": -30.811933517456055, "global_step": 54865, "epoch": 453} {"train_loss": -34.83174514770508, "global_step": 54866, "epoch": 453} {"train_loss": -32.18955993652344, "global_step": 54867, "epoch": 453} {"train_loss": -34.127742767333984, "global_step": 54868, "epoch": 453} {"train_loss": -35.21073532104492, "global_step": 54869, "epoch": 453} {"train_loss": -33.835289001464844, "global_step": 54870, "epoch": 453} {"train_loss": -34.97697830200195, "global_step": 54871, "epoch": 453} {"train_loss": -35.9932975769043, "global_step": 54872, "epoch": 453} {"train_loss": -34.51799011230469, "global_step": 54873, "epoch": 453} {"train_loss": -35.27360916137695, "global_step": 54874, "epoch": 453} {"train_loss": -35.72329330444336, "global_step": 54875, "epoch": 453} {"train_loss": -35.75459671020508, "global_step": 54876, "epoch": 453} {"train_loss": -35.3706169128418, "global_step": 54877, "epoch": 453} {"train_loss": -35.31088638305664, "global_step": 54878, "epoch": 453} {"train_loss": -35.69138717651367, "global_step": 54879, "epoch": 453} {"train_loss": -35.91289138793945, "global_step": 54880, "epoch": 453} {"train_loss": -35.2985725402832, "global_step": 54881, "epoch": 453} {"train_loss": -35.815521240234375, "global_step": 54882, "epoch": 453} {"train_loss": -35.37446975708008, "global_step": 54883, "epoch": 453} {"train_loss": -36.13206481933594, "global_step": 54884, "epoch": 453} {"train_loss": -35.748130798339844, "global_step": 54885, "epoch": 453} {"train_loss": -35.596824645996094, "global_step": 54886, "epoch": 453} {"train_loss": -35.783145904541016, "global_step": 54887, "epoch": 453} {"train_loss": -35.4010124206543, "global_step": 54888, "epoch": 453} {"train_loss": -36.4123649597168, "global_step": 54889, "epoch": 453} {"train_loss": -35.347232818603516, "global_step": 54890, "epoch": 453} {"train_loss": -35.5346794128418, "global_step": 54891, "epoch": 453} {"train_loss": -36.05341720581055, "global_step": 54892, "epoch": 453} {"train_loss": -36.11936569213867, "global_step": 54893, "epoch": 453} {"train_loss": -36.26374816894531, "global_step": 54894, "epoch": 453} {"train_loss": -35.71701431274414, "global_step": 54895, "epoch": 453} {"train_loss": -35.72704315185547, "global_step": 54896, "epoch": 453} {"train_loss": -36.05804443359375, "global_step": 54897, "epoch": 453} {"train_loss": -35.808406829833984, "global_step": 54898, "epoch": 453} {"train_loss": -36.012569427490234, "global_step": 54899, "epoch": 453} {"train_loss": -35.63269805908203, "global_step": 54900, "epoch": 453} {"train_loss": -34.63738250732422, "global_step": 54901, "epoch": 453} {"train_loss": -31.00440788269043, "global_step": 54902, "epoch": 453} {"train_loss": -26.28725242614746, "global_step": 54903, "epoch": 453} {"train_loss": -26.913818359375, "global_step": 54904, "epoch": 453} {"train_loss": -35.497894287109375, "global_step": 54905, "epoch": 453} {"train_loss": -33.30405807495117, "global_step": 54906, "epoch": 453} {"train_loss": -34.202308654785156, "global_step": 54907, "epoch": 453} {"train_loss": -34.51258087158203, "global_step": 54908, "epoch": 453} {"train_loss": -34.1303825378418, "global_step": 54909, "epoch": 453} {"train_loss": -34.43674850463867, "global_step": 54910, "epoch": 453} {"train_loss": -34.222537994384766, "global_step": 54911, "epoch": 453} {"train_loss": -35.72304916381836, "global_step": 54912, "epoch": 453} {"train_loss": -34.989070892333984, "global_step": 54913, "epoch": 453} {"train_loss": -34.967506408691406, "global_step": 54914, "epoch": 453} {"train_loss": -35.49149703979492, "global_step": 54915, "epoch": 453} {"train_loss": -35.07170486450195, "global_step": 54916, "epoch": 453} {"train_loss": -34.99748992919922, "global_step": 54917, "epoch": 453} {"train_loss": -35.59550094604492, "global_step": 54918, "epoch": 453} {"train_loss": -35.357826232910156, "global_step": 54919, "epoch": 453} {"train_loss": -35.27267074584961, "global_step": 54920, "epoch": 453} {"train_loss": -35.06808090209961, "global_step": 54921, "epoch": 453} {"train_loss": -35.63170623779297, "global_step": 54922, "epoch": 453} {"train_loss": -35.71846008300781, "global_step": 54923, "epoch": 453} {"train_loss": -35.13692092895508, "global_step": 54924, "epoch": 453} {"train_loss": -34.21529769897461, "global_step": 54925, "epoch": 453} {"train_loss": -34.664306640625, "global_step": 54926, "epoch": 453} {"train_loss": -34.28044509887695, "global_step": 54927, "epoch": 453} {"train_loss": -35.408935546875, "global_step": 54928, "epoch": 453} {"train_loss": -35.7410888671875, "global_step": 54929, "epoch": 453} {"train_loss": -34.54667282104492, "global_step": 54930, "epoch": 453} {"train_loss": -33.8162956237793, "global_step": 54931, "epoch": 453} {"train_loss": -35.0810546875, "global_step": 54932, "epoch": 453} {"train_loss": -34.838799027372, "global_step": 54933, "epoch": 453, "val_loss": 2567575.0} {"train_loss": -35.227081298828125, "global_step": 54934, "epoch": 454} {"train_loss": -34.56759262084961, "global_step": 54935, "epoch": 454} {"train_loss": -34.62467956542969, "global_step": 54936, "epoch": 454} {"train_loss": -35.794273376464844, "global_step": 54937, "epoch": 454} {"train_loss": -35.27318572998047, "global_step": 54938, "epoch": 454} {"train_loss": -35.14381790161133, "global_step": 54939, "epoch": 454} {"train_loss": -35.7604866027832, "global_step": 54940, "epoch": 454} {"train_loss": -33.22275924682617, "global_step": 54941, "epoch": 454} {"train_loss": -33.64628219604492, "global_step": 54942, "epoch": 454} {"train_loss": -35.739479064941406, "global_step": 54943, "epoch": 454} {"train_loss": -34.78375244140625, "global_step": 54944, "epoch": 454} {"train_loss": -34.8128547668457, "global_step": 54945, "epoch": 454} {"train_loss": -34.864051818847656, "global_step": 54946, "epoch": 454} {"train_loss": -34.885921478271484, "global_step": 54947, "epoch": 454} {"train_loss": -34.1701545715332, "global_step": 54948, "epoch": 454} {"train_loss": -34.1313591003418, "global_step": 54949, "epoch": 454} {"train_loss": -35.30012893676758, "global_step": 54950, "epoch": 454} {"train_loss": -33.908016204833984, "global_step": 54951, "epoch": 454} {"train_loss": -34.944000244140625, "global_step": 54952, "epoch": 454} {"train_loss": -34.88233184814453, "global_step": 54953, "epoch": 454} {"train_loss": -34.23812484741211, "global_step": 54954, "epoch": 454} {"train_loss": -35.896629333496094, "global_step": 54955, "epoch": 454} {"train_loss": -35.21256637573242, "global_step": 54956, "epoch": 454} {"train_loss": -35.363033294677734, "global_step": 54957, "epoch": 454} {"train_loss": -35.79890441894531, "global_step": 54958, "epoch": 454} {"train_loss": -35.5295295715332, "global_step": 54959, "epoch": 454} {"train_loss": -35.25989532470703, "global_step": 54960, "epoch": 454} {"train_loss": -35.80447006225586, "global_step": 54961, "epoch": 454} {"train_loss": -35.55790328979492, "global_step": 54962, "epoch": 454} {"train_loss": -36.071685791015625, "global_step": 54963, "epoch": 454} {"train_loss": -36.11587142944336, "global_step": 54964, "epoch": 454} {"train_loss": -35.16617965698242, "global_step": 54965, "epoch": 454} {"train_loss": -36.14600372314453, "global_step": 54966, "epoch": 454} {"train_loss": -35.86198425292969, "global_step": 54967, "epoch": 454} {"train_loss": -35.76454544067383, "global_step": 54968, "epoch": 454} {"train_loss": -36.14039611816406, "global_step": 54969, "epoch": 454} {"train_loss": -36.381072998046875, "global_step": 54970, "epoch": 454} {"train_loss": -35.67989730834961, "global_step": 54971, "epoch": 454} {"train_loss": -35.741371154785156, "global_step": 54972, "epoch": 454} {"train_loss": -35.326629638671875, "global_step": 54973, "epoch": 454} {"train_loss": -35.468326568603516, "global_step": 54974, "epoch": 454} {"train_loss": -34.954612731933594, "global_step": 54975, "epoch": 454} {"train_loss": -33.97893524169922, "global_step": 54976, "epoch": 454} {"train_loss": -30.834644317626953, "global_step": 54977, "epoch": 454} {"train_loss": -29.495237350463867, "global_step": 54978, "epoch": 454} {"train_loss": -23.191617965698242, "global_step": 54979, "epoch": 454} {"train_loss": -13.964434623718262, "global_step": 54980, "epoch": 454} {"train_loss": -21.063573837280273, "global_step": 54981, "epoch": 454} {"train_loss": -35.729827880859375, "global_step": 54982, "epoch": 454} {"train_loss": -27.54054069519043, "global_step": 54983, "epoch": 454} {"train_loss": -34.72224044799805, "global_step": 54984, "epoch": 454} {"train_loss": -31.11701011657715, "global_step": 54985, "epoch": 454} {"train_loss": -34.244415283203125, "global_step": 54986, "epoch": 454} {"train_loss": -33.0520133972168, "global_step": 54987, "epoch": 454} {"train_loss": -32.357215881347656, "global_step": 54988, "epoch": 454} {"train_loss": -34.30631637573242, "global_step": 54989, "epoch": 454} {"train_loss": -33.852874755859375, "global_step": 54990, "epoch": 454} {"train_loss": -33.580223083496094, "global_step": 54991, "epoch": 454} {"train_loss": -35.37522888183594, "global_step": 54992, "epoch": 454} {"train_loss": -34.270652770996094, "global_step": 54993, "epoch": 454} {"train_loss": -34.06025314331055, "global_step": 54994, "epoch": 454} {"train_loss": -34.72365188598633, "global_step": 54995, "epoch": 454} {"train_loss": -34.73564529418945, "global_step": 54996, "epoch": 454} {"train_loss": -34.25608444213867, "global_step": 54997, "epoch": 454} {"train_loss": -34.39583969116211, "global_step": 54998, "epoch": 454} {"train_loss": -35.17571258544922, "global_step": 54999, "epoch": 454} {"train_loss": -34.91180419921875, "global_step": 55000, "epoch": 454} {"train_loss": -34.79092788696289, "global_step": 55001, "epoch": 454} {"train_loss": -34.875244140625, "global_step": 55002, "epoch": 454} {"train_loss": -35.57589340209961, "global_step": 55003, "epoch": 454} {"train_loss": -35.30931091308594, "global_step": 55004, "epoch": 454} {"train_loss": -35.94710922241211, "global_step": 55005, "epoch": 454} {"train_loss": -34.84139633178711, "global_step": 55006, "epoch": 454} {"train_loss": -35.349220275878906, "global_step": 55007, "epoch": 454} {"train_loss": -35.48957061767578, "global_step": 55008, "epoch": 454} {"train_loss": -35.497840881347656, "global_step": 55009, "epoch": 454} {"train_loss": -35.407936096191406, "global_step": 55010, "epoch": 454} {"train_loss": -35.72456359863281, "global_step": 55011, "epoch": 454} {"train_loss": -35.90290832519531, "global_step": 55012, "epoch": 454} {"train_loss": -35.6994743347168, "global_step": 55013, "epoch": 454} {"train_loss": -36.03364944458008, "global_step": 55014, "epoch": 454} {"train_loss": -35.96739196777344, "global_step": 55015, "epoch": 454} {"train_loss": -36.038848876953125, "global_step": 55016, "epoch": 454} {"train_loss": -36.06856918334961, "global_step": 55017, "epoch": 454} {"train_loss": -36.064796447753906, "global_step": 55018, "epoch": 454} {"train_loss": -36.33755111694336, "global_step": 55019, "epoch": 454} {"train_loss": -36.29317855834961, "global_step": 55020, "epoch": 454} {"train_loss": -36.277198791503906, "global_step": 55021, "epoch": 454} {"train_loss": -36.439449310302734, "global_step": 55022, "epoch": 454} {"train_loss": -36.27704620361328, "global_step": 55023, "epoch": 454} {"train_loss": -36.34124755859375, "global_step": 55024, "epoch": 454} {"train_loss": -36.434322357177734, "global_step": 55025, "epoch": 454} {"train_loss": -36.5712776184082, "global_step": 55026, "epoch": 454} {"train_loss": -36.566951751708984, "global_step": 55027, "epoch": 454} {"train_loss": -36.70934295654297, "global_step": 55028, "epoch": 454} {"train_loss": -36.53190612792969, "global_step": 55029, "epoch": 454} {"train_loss": -36.6500358581543, "global_step": 55030, "epoch": 454} {"train_loss": -36.84475326538086, "global_step": 55031, "epoch": 454} {"train_loss": -36.564353942871094, "global_step": 55032, "epoch": 454} {"train_loss": -36.72880554199219, "global_step": 55033, "epoch": 454} {"train_loss": -36.29367446899414, "global_step": 55034, "epoch": 454} {"train_loss": -36.60822296142578, "global_step": 55035, "epoch": 454} {"train_loss": -36.3691291809082, "global_step": 55036, "epoch": 454} {"train_loss": -36.62142562866211, "global_step": 55037, "epoch": 454} {"train_loss": -36.78475570678711, "global_step": 55038, "epoch": 454} {"train_loss": -36.39649963378906, "global_step": 55039, "epoch": 454} {"train_loss": -36.15541458129883, "global_step": 55040, "epoch": 454} {"train_loss": -36.12617111206055, "global_step": 55041, "epoch": 454} {"train_loss": -36.29833221435547, "global_step": 55042, "epoch": 454} {"train_loss": -36.377105712890625, "global_step": 55043, "epoch": 454} {"train_loss": -36.4290885925293, "global_step": 55044, "epoch": 454} {"train_loss": -34.102561950683594, "global_step": 55045, "epoch": 454} {"train_loss": -27.995542526245117, "global_step": 55046, "epoch": 454} {"train_loss": -26.289627075195312, "global_step": 55047, "epoch": 454} {"train_loss": -29.495849609375, "global_step": 55048, "epoch": 454} {"train_loss": -32.78886032104492, "global_step": 55049, "epoch": 454} {"train_loss": -25.427515029907227, "global_step": 55050, "epoch": 454} {"train_loss": -23.688756942749023, "global_step": 55051, "epoch": 454} {"train_loss": -20.11555290222168, "global_step": 55052, "epoch": 454} {"train_loss": -34.43528747558594, "global_step": 55053, "epoch": 454} {"train_loss": -34.28094478481072, "global_step": 55054, "epoch": 454, "val_loss": 2693159.0} {"train_loss": -33.42926025390625, "global_step": 55055, "epoch": 455} {"train_loss": -33.20171356201172, "global_step": 55056, "epoch": 455} {"train_loss": -33.0304069519043, "global_step": 55057, "epoch": 455} {"train_loss": -32.7205696105957, "global_step": 55058, "epoch": 455} {"train_loss": -33.9748420715332, "global_step": 55059, "epoch": 455} {"train_loss": -32.256622314453125, "global_step": 55060, "epoch": 455} {"train_loss": -34.94490432739258, "global_step": 55061, "epoch": 455} {"train_loss": -33.63475036621094, "global_step": 55062, "epoch": 455} {"train_loss": -33.910430908203125, "global_step": 55063, "epoch": 455} {"train_loss": -34.60215377807617, "global_step": 55064, "epoch": 455} {"train_loss": -34.26636505126953, "global_step": 55065, "epoch": 455} {"train_loss": -34.54917907714844, "global_step": 55066, "epoch": 455} {"train_loss": -34.26538848876953, "global_step": 55067, "epoch": 455} {"train_loss": -34.10835647583008, "global_step": 55068, "epoch": 455} {"train_loss": -35.320308685302734, "global_step": 55069, "epoch": 455} {"train_loss": -35.15898513793945, "global_step": 55070, "epoch": 455} {"train_loss": -34.88349914550781, "global_step": 55071, "epoch": 455} {"train_loss": -35.105133056640625, "global_step": 55072, "epoch": 455} {"train_loss": -35.50794982910156, "global_step": 55073, "epoch": 455} {"train_loss": -35.292701721191406, "global_step": 55074, "epoch": 455} {"train_loss": -35.459449768066406, "global_step": 55075, "epoch": 455} {"train_loss": -35.451690673828125, "global_step": 55076, "epoch": 455} {"train_loss": -35.52886962890625, "global_step": 55077, "epoch": 455} {"train_loss": -35.617469787597656, "global_step": 55078, "epoch": 455} {"train_loss": -35.4793586730957, "global_step": 55079, "epoch": 455} {"train_loss": -35.5174446105957, "global_step": 55080, "epoch": 455} {"train_loss": -35.73985290527344, "global_step": 55081, "epoch": 455} {"train_loss": -35.78504180908203, "global_step": 55082, "epoch": 455} {"train_loss": -35.45695495605469, "global_step": 55083, "epoch": 455} {"train_loss": -35.908145904541016, "global_step": 55084, "epoch": 455} {"train_loss": -35.68074417114258, "global_step": 55085, "epoch": 455} {"train_loss": -35.733463287353516, "global_step": 55086, "epoch": 455} {"train_loss": -36.0355224609375, "global_step": 55087, "epoch": 455} {"train_loss": -35.939056396484375, "global_step": 55088, "epoch": 455} {"train_loss": -35.5087890625, "global_step": 55089, "epoch": 455} {"train_loss": -36.0578727722168, "global_step": 55090, "epoch": 455} {"train_loss": -35.90153884887695, "global_step": 55091, "epoch": 455} {"train_loss": -35.89655303955078, "global_step": 55092, "epoch": 455} {"train_loss": -35.43111801147461, "global_step": 55093, "epoch": 455} {"train_loss": -35.54619216918945, "global_step": 55094, "epoch": 455} {"train_loss": -35.724647521972656, "global_step": 55095, "epoch": 455} {"train_loss": -35.081573486328125, "global_step": 55096, "epoch": 455} {"train_loss": -35.739139556884766, "global_step": 55097, "epoch": 455} {"train_loss": -36.35882568359375, "global_step": 55098, "epoch": 455} {"train_loss": -34.79055404663086, "global_step": 55099, "epoch": 455} {"train_loss": -32.87559127807617, "global_step": 55100, "epoch": 455} {"train_loss": -35.17753219604492, "global_step": 55101, "epoch": 455} {"train_loss": -34.80359649658203, "global_step": 55102, "epoch": 455} {"train_loss": -31.45696449279785, "global_step": 55103, "epoch": 455} {"train_loss": -35.796443939208984, "global_step": 55104, "epoch": 455} {"train_loss": -31.798383712768555, "global_step": 55105, "epoch": 455} {"train_loss": -35.18427276611328, "global_step": 55106, "epoch": 455} {"train_loss": -33.6081657409668, "global_step": 55107, "epoch": 455} {"train_loss": -36.1677131652832, "global_step": 55108, "epoch": 455} {"train_loss": -33.648193359375, "global_step": 55109, "epoch": 455} {"train_loss": -34.767513275146484, "global_step": 55110, "epoch": 455} {"train_loss": -33.68246078491211, "global_step": 55111, "epoch": 455} {"train_loss": -35.200679779052734, "global_step": 55112, "epoch": 455} {"train_loss": -34.4674186706543, "global_step": 55113, "epoch": 455} {"train_loss": -34.76115798950195, "global_step": 55114, "epoch": 455} {"train_loss": -35.42641830444336, "global_step": 55115, "epoch": 455} {"train_loss": -34.08662414550781, "global_step": 55116, "epoch": 455} {"train_loss": -33.68962478637695, "global_step": 55117, "epoch": 455} {"train_loss": -33.070587158203125, "global_step": 55118, "epoch": 455} {"train_loss": -33.99605941772461, "global_step": 55119, "epoch": 455} {"train_loss": -34.42881393432617, "global_step": 55120, "epoch": 455} {"train_loss": -34.66727066040039, "global_step": 55121, "epoch": 455} {"train_loss": -34.916900634765625, "global_step": 55122, "epoch": 455} {"train_loss": -31.8248291015625, "global_step": 55123, "epoch": 455} {"train_loss": -33.674774169921875, "global_step": 55124, "epoch": 455} {"train_loss": -33.68467330932617, "global_step": 55125, "epoch": 455} {"train_loss": -35.39945602416992, "global_step": 55126, "epoch": 455} {"train_loss": -34.97380828857422, "global_step": 55127, "epoch": 455} {"train_loss": -34.47977828979492, "global_step": 55128, "epoch": 455} {"train_loss": -35.30079650878906, "global_step": 55129, "epoch": 455} {"train_loss": -35.06924057006836, "global_step": 55130, "epoch": 455} {"train_loss": -34.967227935791016, "global_step": 55131, "epoch": 455} {"train_loss": -35.275657653808594, "global_step": 55132, "epoch": 455} {"train_loss": -35.16422653198242, "global_step": 55133, "epoch": 455} {"train_loss": -34.5235481262207, "global_step": 55134, "epoch": 455} {"train_loss": -35.74430465698242, "global_step": 55135, "epoch": 455} {"train_loss": -35.02360916137695, "global_step": 55136, "epoch": 455} {"train_loss": -35.11346435546875, "global_step": 55137, "epoch": 455} {"train_loss": -35.62705612182617, "global_step": 55138, "epoch": 455} {"train_loss": -35.574302673339844, "global_step": 55139, "epoch": 455} {"train_loss": -35.756202697753906, "global_step": 55140, "epoch": 455} {"train_loss": -36.080806732177734, "global_step": 55141, "epoch": 455} {"train_loss": -35.504615783691406, "global_step": 55142, "epoch": 455} {"train_loss": -35.88648223876953, "global_step": 55143, "epoch": 455} {"train_loss": -35.45964431762695, "global_step": 55144, "epoch": 455} {"train_loss": -35.312347412109375, "global_step": 55145, "epoch": 455} {"train_loss": -35.494197845458984, "global_step": 55146, "epoch": 455} {"train_loss": -35.83921813964844, "global_step": 55147, "epoch": 455} {"train_loss": -35.94797897338867, "global_step": 55148, "epoch": 455} {"train_loss": -35.56740188598633, "global_step": 55149, "epoch": 455} {"train_loss": -35.319000244140625, "global_step": 55150, "epoch": 455} {"train_loss": -34.401390075683594, "global_step": 55151, "epoch": 455} {"train_loss": -32.85993576049805, "global_step": 55152, "epoch": 455} {"train_loss": -34.32057571411133, "global_step": 55153, "epoch": 455} {"train_loss": -35.300750732421875, "global_step": 55154, "epoch": 455} {"train_loss": -33.82495880126953, "global_step": 55155, "epoch": 455} {"train_loss": -31.67559814453125, "global_step": 55156, "epoch": 455} {"train_loss": -32.485740661621094, "global_step": 55157, "epoch": 455} {"train_loss": -35.3056640625, "global_step": 55158, "epoch": 455} {"train_loss": -34.74082565307617, "global_step": 55159, "epoch": 455} {"train_loss": -33.45515060424805, "global_step": 55160, "epoch": 455} {"train_loss": -35.98292922973633, "global_step": 55161, "epoch": 455} {"train_loss": -33.71673583984375, "global_step": 55162, "epoch": 455} {"train_loss": -34.42474365234375, "global_step": 55163, "epoch": 455} {"train_loss": -35.43668746948242, "global_step": 55164, "epoch": 455} {"train_loss": -34.799495697021484, "global_step": 55165, "epoch": 455} {"train_loss": -35.63679504394531, "global_step": 55166, "epoch": 455} {"train_loss": -35.37520217895508, "global_step": 55167, "epoch": 455} {"train_loss": -35.559120178222656, "global_step": 55168, "epoch": 455} {"train_loss": -35.80622863769531, "global_step": 55169, "epoch": 455} {"train_loss": -35.623592376708984, "global_step": 55170, "epoch": 455} {"train_loss": -35.622596740722656, "global_step": 55171, "epoch": 455} {"train_loss": -35.656768798828125, "global_step": 55172, "epoch": 455} {"train_loss": -36.35800552368164, "global_step": 55173, "epoch": 455} {"train_loss": -36.04946517944336, "global_step": 55174, "epoch": 455} {"train_loss": -34.8556560484831, "global_step": 55175, "epoch": 455, "val_loss": 2605918.75} {"train_loss": -36.228355407714844, "global_step": 55176, "epoch": 456} {"train_loss": -36.691829681396484, "global_step": 55177, "epoch": 456} {"train_loss": -36.09723663330078, "global_step": 55178, "epoch": 456} {"train_loss": -36.539676666259766, "global_step": 55179, "epoch": 456} {"train_loss": -36.320030212402344, "global_step": 55180, "epoch": 456} {"train_loss": -36.40084457397461, "global_step": 55181, "epoch": 456} {"train_loss": -36.53571701049805, "global_step": 55182, "epoch": 456} {"train_loss": -36.69587326049805, "global_step": 55183, "epoch": 456} {"train_loss": -36.784095764160156, "global_step": 55184, "epoch": 456} {"train_loss": -36.49283981323242, "global_step": 55185, "epoch": 456} {"train_loss": -36.83445358276367, "global_step": 55186, "epoch": 456} {"train_loss": -36.29724884033203, "global_step": 55187, "epoch": 456} {"train_loss": -36.87282943725586, "global_step": 55188, "epoch": 456} {"train_loss": -36.66272735595703, "global_step": 55189, "epoch": 456} {"train_loss": -36.8424186706543, "global_step": 55190, "epoch": 456} {"train_loss": -36.88386917114258, "global_step": 55191, "epoch": 456} {"train_loss": -36.5279426574707, "global_step": 55192, "epoch": 456} {"train_loss": -36.79271697998047, "global_step": 55193, "epoch": 456} {"train_loss": -37.164180755615234, "global_step": 55194, "epoch": 456} {"train_loss": -36.459163665771484, "global_step": 55195, "epoch": 456} {"train_loss": -36.93348693847656, "global_step": 55196, "epoch": 456} {"train_loss": -36.937355041503906, "global_step": 55197, "epoch": 456} {"train_loss": -36.3586311340332, "global_step": 55198, "epoch": 456} {"train_loss": -36.97816848754883, "global_step": 55199, "epoch": 456} {"train_loss": -36.324195861816406, "global_step": 55200, "epoch": 456} {"train_loss": -36.8285026550293, "global_step": 55201, "epoch": 456} {"train_loss": -36.63320541381836, "global_step": 55202, "epoch": 456} {"train_loss": -36.80173110961914, "global_step": 55203, "epoch": 456} {"train_loss": -36.87355422973633, "global_step": 55204, "epoch": 456} {"train_loss": -36.94961166381836, "global_step": 55205, "epoch": 456} {"train_loss": -37.089210510253906, "global_step": 55206, "epoch": 456} {"train_loss": -35.90150833129883, "global_step": 55207, "epoch": 456} {"train_loss": -35.211517333984375, "global_step": 55208, "epoch": 456} {"train_loss": -35.63621139526367, "global_step": 55209, "epoch": 456} {"train_loss": -36.41612243652344, "global_step": 55210, "epoch": 456} {"train_loss": -36.652191162109375, "global_step": 55211, "epoch": 456} {"train_loss": -35.62960433959961, "global_step": 55212, "epoch": 456} {"train_loss": -34.33676528930664, "global_step": 55213, "epoch": 456} {"train_loss": -36.33814239501953, "global_step": 55214, "epoch": 456} {"train_loss": -35.72589874267578, "global_step": 55215, "epoch": 456} {"train_loss": -35.12028884887695, "global_step": 55216, "epoch": 456} {"train_loss": -37.05172348022461, "global_step": 55217, "epoch": 456} {"train_loss": -35.910091400146484, "global_step": 55218, "epoch": 456} {"train_loss": -35.72237777709961, "global_step": 55219, "epoch": 456} {"train_loss": -36.564552307128906, "global_step": 55220, "epoch": 456} {"train_loss": -35.46352767944336, "global_step": 55221, "epoch": 456} {"train_loss": -36.74668502807617, "global_step": 55222, "epoch": 456} {"train_loss": -36.349281311035156, "global_step": 55223, "epoch": 456} {"train_loss": -36.90025329589844, "global_step": 55224, "epoch": 456} {"train_loss": -36.609127044677734, "global_step": 55225, "epoch": 456} {"train_loss": -36.503536224365234, "global_step": 55226, "epoch": 456} {"train_loss": -36.72187042236328, "global_step": 55227, "epoch": 456} {"train_loss": -36.66654586791992, "global_step": 55228, "epoch": 456} {"train_loss": -36.69098663330078, "global_step": 55229, "epoch": 456} {"train_loss": -36.501338958740234, "global_step": 55230, "epoch": 456} {"train_loss": -36.657047271728516, "global_step": 55231, "epoch": 456} {"train_loss": -36.81427764892578, "global_step": 55232, "epoch": 456} {"train_loss": -36.78447341918945, "global_step": 55233, "epoch": 456} {"train_loss": -36.347412109375, "global_step": 55234, "epoch": 456} {"train_loss": -36.23210525512695, "global_step": 55235, "epoch": 456} {"train_loss": -37.046730041503906, "global_step": 55236, "epoch": 456} {"train_loss": -36.46609878540039, "global_step": 55237, "epoch": 456} {"train_loss": -35.75727081298828, "global_step": 55238, "epoch": 456} {"train_loss": -36.67041015625, "global_step": 55239, "epoch": 456} {"train_loss": -36.6209831237793, "global_step": 55240, "epoch": 456} {"train_loss": -36.77534103393555, "global_step": 55241, "epoch": 456} {"train_loss": -36.384578704833984, "global_step": 55242, "epoch": 456} {"train_loss": -36.64909744262695, "global_step": 55243, "epoch": 456} {"train_loss": -36.194549560546875, "global_step": 55244, "epoch": 456} {"train_loss": -36.66030502319336, "global_step": 55245, "epoch": 456} {"train_loss": -36.80067825317383, "global_step": 55246, "epoch": 456} {"train_loss": -35.75031280517578, "global_step": 55247, "epoch": 456} {"train_loss": -34.62124252319336, "global_step": 55248, "epoch": 456} {"train_loss": -35.703407287597656, "global_step": 55249, "epoch": 456} {"train_loss": -36.09036636352539, "global_step": 55250, "epoch": 456} {"train_loss": -36.36039352416992, "global_step": 55251, "epoch": 456} {"train_loss": -36.305091857910156, "global_step": 55252, "epoch": 456} {"train_loss": -36.344696044921875, "global_step": 55253, "epoch": 456} {"train_loss": -35.79063034057617, "global_step": 55254, "epoch": 456} {"train_loss": -34.642147064208984, "global_step": 55255, "epoch": 456} {"train_loss": -36.23486328125, "global_step": 55256, "epoch": 456} {"train_loss": -36.385955810546875, "global_step": 55257, "epoch": 456} {"train_loss": -36.68071365356445, "global_step": 55258, "epoch": 456} {"train_loss": -35.908233642578125, "global_step": 55259, "epoch": 456} {"train_loss": -35.40877914428711, "global_step": 55260, "epoch": 456} {"train_loss": -36.39352035522461, "global_step": 55261, "epoch": 456} {"train_loss": -36.277366638183594, "global_step": 55262, "epoch": 456} {"train_loss": -35.247127532958984, "global_step": 55263, "epoch": 456} {"train_loss": -35.42391586303711, "global_step": 55264, "epoch": 456} {"train_loss": -34.35968780517578, "global_step": 55265, "epoch": 456} {"train_loss": -33.97455978393555, "global_step": 55266, "epoch": 456} {"train_loss": -31.845458984375, "global_step": 55267, "epoch": 456} {"train_loss": -32.455230712890625, "global_step": 55268, "epoch": 456} {"train_loss": -34.65052032470703, "global_step": 55269, "epoch": 456} {"train_loss": -36.17976760864258, "global_step": 55270, "epoch": 456} {"train_loss": -33.987239837646484, "global_step": 55271, "epoch": 456} {"train_loss": -30.65353775024414, "global_step": 55272, "epoch": 456} {"train_loss": -34.631099700927734, "global_step": 55273, "epoch": 456} {"train_loss": -35.7900390625, "global_step": 55274, "epoch": 456} {"train_loss": -34.87276077270508, "global_step": 55275, "epoch": 456} {"train_loss": -35.830013275146484, "global_step": 55276, "epoch": 456} {"train_loss": -35.823665618896484, "global_step": 55277, "epoch": 456} {"train_loss": -35.274192810058594, "global_step": 55278, "epoch": 456} {"train_loss": -36.17780303955078, "global_step": 55279, "epoch": 456} {"train_loss": -36.06917953491211, "global_step": 55280, "epoch": 456} {"train_loss": -35.47522735595703, "global_step": 55281, "epoch": 456} {"train_loss": -35.23381423950195, "global_step": 55282, "epoch": 456} {"train_loss": -35.5633430480957, "global_step": 55283, "epoch": 456} {"train_loss": -35.51869201660156, "global_step": 55284, "epoch": 456} {"train_loss": -35.72087860107422, "global_step": 55285, "epoch": 456} {"train_loss": -35.77387619018555, "global_step": 55286, "epoch": 456} {"train_loss": -35.84455490112305, "global_step": 55287, "epoch": 456} {"train_loss": -36.02324295043945, "global_step": 55288, "epoch": 456} {"train_loss": -36.193363189697266, "global_step": 55289, "epoch": 456} {"train_loss": -36.671165466308594, "global_step": 55290, "epoch": 456} {"train_loss": -35.88214111328125, "global_step": 55291, "epoch": 456} {"train_loss": -36.67877197265625, "global_step": 55292, "epoch": 456} {"train_loss": -35.909156799316406, "global_step": 55293, "epoch": 456} {"train_loss": -36.80501174926758, "global_step": 55294, "epoch": 456} {"train_loss": -36.24352264404297, "global_step": 55295, "epoch": 456} {"train_loss": -36.06271359152045, "global_step": 55296, "epoch": 456, "val_loss": 2617544.75} {"train_loss": -35.804466247558594, "global_step": 55297, "epoch": 457} {"train_loss": -36.691856384277344, "global_step": 55298, "epoch": 457} {"train_loss": -35.9204216003418, "global_step": 55299, "epoch": 457} {"train_loss": -36.92197799682617, "global_step": 55300, "epoch": 457} {"train_loss": -36.53434371948242, "global_step": 55301, "epoch": 457} {"train_loss": -36.443817138671875, "global_step": 55302, "epoch": 457} {"train_loss": -35.94063186645508, "global_step": 55303, "epoch": 457} {"train_loss": -34.88230514526367, "global_step": 55304, "epoch": 457} {"train_loss": -33.493953704833984, "global_step": 55305, "epoch": 457} {"train_loss": -31.364896774291992, "global_step": 55306, "epoch": 457} {"train_loss": -30.533878326416016, "global_step": 55307, "epoch": 457} {"train_loss": -33.98084259033203, "global_step": 55308, "epoch": 457} {"train_loss": -36.75178909301758, "global_step": 55309, "epoch": 457} {"train_loss": -34.98629379272461, "global_step": 55310, "epoch": 457} {"train_loss": -35.05780792236328, "global_step": 55311, "epoch": 457} {"train_loss": -35.82822799682617, "global_step": 55312, "epoch": 457} {"train_loss": -35.20331573486328, "global_step": 55313, "epoch": 457} {"train_loss": -34.97474670410156, "global_step": 55314, "epoch": 457} {"train_loss": -35.25312042236328, "global_step": 55315, "epoch": 457} {"train_loss": -34.44808578491211, "global_step": 55316, "epoch": 457} {"train_loss": -36.098915100097656, "global_step": 55317, "epoch": 457} {"train_loss": -35.20581817626953, "global_step": 55318, "epoch": 457} {"train_loss": -34.284786224365234, "global_step": 55319, "epoch": 457} {"train_loss": -35.791419982910156, "global_step": 55320, "epoch": 457} {"train_loss": -36.0570068359375, "global_step": 55321, "epoch": 457} {"train_loss": -34.07503128051758, "global_step": 55322, "epoch": 457} {"train_loss": -33.30036544799805, "global_step": 55323, "epoch": 457} {"train_loss": -35.3250846862793, "global_step": 55324, "epoch": 457} {"train_loss": -35.52928924560547, "global_step": 55325, "epoch": 457} {"train_loss": -32.49031448364258, "global_step": 55326, "epoch": 457} {"train_loss": -33.93696212768555, "global_step": 55327, "epoch": 457} {"train_loss": -35.00080490112305, "global_step": 55328, "epoch": 457} {"train_loss": -33.25323486328125, "global_step": 55329, "epoch": 457} {"train_loss": -35.15694808959961, "global_step": 55330, "epoch": 457} {"train_loss": -34.70685958862305, "global_step": 55331, "epoch": 457} {"train_loss": -32.32607650756836, "global_step": 55332, "epoch": 457} {"train_loss": -35.55073165893555, "global_step": 55333, "epoch": 457} {"train_loss": -35.10525131225586, "global_step": 55334, "epoch": 457} {"train_loss": -35.00213623046875, "global_step": 55335, "epoch": 457} {"train_loss": -35.16360092163086, "global_step": 55336, "epoch": 457} {"train_loss": -34.88923263549805, "global_step": 55337, "epoch": 457} {"train_loss": -36.15194320678711, "global_step": 55338, "epoch": 457} {"train_loss": -35.33087921142578, "global_step": 55339, "epoch": 457} {"train_loss": -36.103546142578125, "global_step": 55340, "epoch": 457} {"train_loss": -36.066246032714844, "global_step": 55341, "epoch": 457} {"train_loss": -35.767669677734375, "global_step": 55342, "epoch": 457} {"train_loss": -36.23662185668945, "global_step": 55343, "epoch": 457} {"train_loss": -36.138729095458984, "global_step": 55344, "epoch": 457} {"train_loss": -35.966941833496094, "global_step": 55345, "epoch": 457} {"train_loss": -36.2926025390625, "global_step": 55346, "epoch": 457} {"train_loss": -35.341026306152344, "global_step": 55347, "epoch": 457} {"train_loss": -36.43632125854492, "global_step": 55348, "epoch": 457} {"train_loss": -35.649295806884766, "global_step": 55349, "epoch": 457} {"train_loss": -35.87846374511719, "global_step": 55350, "epoch": 457} {"train_loss": -35.71397018432617, "global_step": 55351, "epoch": 457} {"train_loss": -36.048091888427734, "global_step": 55352, "epoch": 457} {"train_loss": -36.03310775756836, "global_step": 55353, "epoch": 457} {"train_loss": -36.32051467895508, "global_step": 55354, "epoch": 457} {"train_loss": -36.21409225463867, "global_step": 55355, "epoch": 457} {"train_loss": -36.17828369140625, "global_step": 55356, "epoch": 457} {"train_loss": -36.378902435302734, "global_step": 55357, "epoch": 457} {"train_loss": -35.51970291137695, "global_step": 55358, "epoch": 457} {"train_loss": -36.20640182495117, "global_step": 55359, "epoch": 457} {"train_loss": -35.68798065185547, "global_step": 55360, "epoch": 457} {"train_loss": -36.36407470703125, "global_step": 55361, "epoch": 457} {"train_loss": -36.23631286621094, "global_step": 55362, "epoch": 457} {"train_loss": -36.007598876953125, "global_step": 55363, "epoch": 457} {"train_loss": -36.525848388671875, "global_step": 55364, "epoch": 457} {"train_loss": -36.62063217163086, "global_step": 55365, "epoch": 457} {"train_loss": -36.308624267578125, "global_step": 55366, "epoch": 457} {"train_loss": -36.49201202392578, "global_step": 55367, "epoch": 457} {"train_loss": -36.60799789428711, "global_step": 55368, "epoch": 457} {"train_loss": -36.49026870727539, "global_step": 55369, "epoch": 457} {"train_loss": -36.80073928833008, "global_step": 55370, "epoch": 457} {"train_loss": -36.65393829345703, "global_step": 55371, "epoch": 457} {"train_loss": -36.558135986328125, "global_step": 55372, "epoch": 457} {"train_loss": -36.596778869628906, "global_step": 55373, "epoch": 457} {"train_loss": -36.903839111328125, "global_step": 55374, "epoch": 457} {"train_loss": -35.95085525512695, "global_step": 55375, "epoch": 457} {"train_loss": -36.8094367980957, "global_step": 55376, "epoch": 457} {"train_loss": -36.96442794799805, "global_step": 55377, "epoch": 457} {"train_loss": -36.823829650878906, "global_step": 55378, "epoch": 457} {"train_loss": -36.67847442626953, "global_step": 55379, "epoch": 457} {"train_loss": -36.73300552368164, "global_step": 55380, "epoch": 457} {"train_loss": -36.14151382446289, "global_step": 55381, "epoch": 457} {"train_loss": -36.02708435058594, "global_step": 55382, "epoch": 457} {"train_loss": -36.509639739990234, "global_step": 55383, "epoch": 457} {"train_loss": -36.22153854370117, "global_step": 55384, "epoch": 457} {"train_loss": -35.83134078979492, "global_step": 55385, "epoch": 457} {"train_loss": -37.007869720458984, "global_step": 55386, "epoch": 457} {"train_loss": -36.7442512512207, "global_step": 55387, "epoch": 457} {"train_loss": -36.117733001708984, "global_step": 55388, "epoch": 457} {"train_loss": -36.618682861328125, "global_step": 55389, "epoch": 457} {"train_loss": -37.13201141357422, "global_step": 55390, "epoch": 457} {"train_loss": -36.092899322509766, "global_step": 55391, "epoch": 457} {"train_loss": -36.880374908447266, "global_step": 55392, "epoch": 457} {"train_loss": -36.93302536010742, "global_step": 55393, "epoch": 457} {"train_loss": -35.82075500488281, "global_step": 55394, "epoch": 457} {"train_loss": -35.76512908935547, "global_step": 55395, "epoch": 457} {"train_loss": -35.79207992553711, "global_step": 55396, "epoch": 457} {"train_loss": -35.825477600097656, "global_step": 55397, "epoch": 457} {"train_loss": -35.20564651489258, "global_step": 55398, "epoch": 457} {"train_loss": -35.06130599975586, "global_step": 55399, "epoch": 457} {"train_loss": -34.5986442565918, "global_step": 55400, "epoch": 457} {"train_loss": -32.83913803100586, "global_step": 55401, "epoch": 457} {"train_loss": -27.697803497314453, "global_step": 55402, "epoch": 457} {"train_loss": -29.836225509643555, "global_step": 55403, "epoch": 457} {"train_loss": -35.727027893066406, "global_step": 55404, "epoch": 457} {"train_loss": -33.35768508911133, "global_step": 55405, "epoch": 457} {"train_loss": -32.307804107666016, "global_step": 55406, "epoch": 457} {"train_loss": -34.8852653503418, "global_step": 55407, "epoch": 457} {"train_loss": -32.8333625793457, "global_step": 55408, "epoch": 457} {"train_loss": -32.98969268798828, "global_step": 55409, "epoch": 457} {"train_loss": -34.316829681396484, "global_step": 55410, "epoch": 457} {"train_loss": -33.947017669677734, "global_step": 55411, "epoch": 457} {"train_loss": -33.69175338745117, "global_step": 55412, "epoch": 457} {"train_loss": -31.026214599609375, "global_step": 55413, "epoch": 457} {"train_loss": -12.256216049194336, "global_step": 55414, "epoch": 457} {"train_loss": -31.941495895385742, "global_step": 55415, "epoch": 457} {"train_loss": -28.66680908203125, "global_step": 55416, "epoch": 457} {"train_loss": -35.032985056727384, "global_step": 55417, "epoch": 457, "val_loss": 2702201.75} {"train_loss": -25.92854881286621, "global_step": 55418, "epoch": 458} {"train_loss": -28.42792320251465, "global_step": 55419, "epoch": 458} {"train_loss": -30.3607120513916, "global_step": 55420, "epoch": 458} {"train_loss": -26.16217041015625, "global_step": 55421, "epoch": 458} {"train_loss": -15.785880088806152, "global_step": 55422, "epoch": 458} {"train_loss": -30.38629150390625, "global_step": 55423, "epoch": 458} {"train_loss": -24.36676788330078, "global_step": 55424, "epoch": 458} {"train_loss": -29.894622802734375, "global_step": 55425, "epoch": 458} {"train_loss": -30.862335205078125, "global_step": 55426, "epoch": 458} {"train_loss": -30.074432373046875, "global_step": 55427, "epoch": 458} {"train_loss": -26.478179931640625, "global_step": 55428, "epoch": 458} {"train_loss": -29.71880531311035, "global_step": 55429, "epoch": 458} {"train_loss": -28.384687423706055, "global_step": 55430, "epoch": 458} {"train_loss": -25.795730590820312, "global_step": 55431, "epoch": 458} {"train_loss": -30.021894454956055, "global_step": 55432, "epoch": 458} {"train_loss": -29.428380966186523, "global_step": 55433, "epoch": 458} {"train_loss": -30.614500045776367, "global_step": 55434, "epoch": 458} {"train_loss": -31.53705406188965, "global_step": 55435, "epoch": 458} {"train_loss": -31.26019859313965, "global_step": 55436, "epoch": 458} {"train_loss": -29.217519760131836, "global_step": 55437, "epoch": 458} {"train_loss": -28.1784610748291, "global_step": 55438, "epoch": 458} {"train_loss": -30.329938888549805, "global_step": 55439, "epoch": 458} {"train_loss": -30.454208374023438, "global_step": 55440, "epoch": 458} {"train_loss": -31.04060173034668, "global_step": 55441, "epoch": 458} {"train_loss": -31.15309715270996, "global_step": 55442, "epoch": 458} {"train_loss": -31.36054801940918, "global_step": 55443, "epoch": 458} {"train_loss": -30.978601455688477, "global_step": 55444, "epoch": 458} {"train_loss": -30.217283248901367, "global_step": 55445, "epoch": 458} {"train_loss": -31.383045196533203, "global_step": 55446, "epoch": 458} {"train_loss": -31.716794967651367, "global_step": 55447, "epoch": 458} {"train_loss": -32.0482292175293, "global_step": 55448, "epoch": 458} {"train_loss": -31.332212448120117, "global_step": 55449, "epoch": 458} {"train_loss": -32.48759078979492, "global_step": 55450, "epoch": 458} {"train_loss": -31.565317153930664, "global_step": 55451, "epoch": 458} {"train_loss": -31.776281356811523, "global_step": 55452, "epoch": 458} {"train_loss": -33.041378021240234, "global_step": 55453, "epoch": 458} {"train_loss": -31.986108779907227, "global_step": 55454, "epoch": 458} {"train_loss": -30.91058349609375, "global_step": 55455, "epoch": 458} {"train_loss": -32.41429901123047, "global_step": 55456, "epoch": 458} {"train_loss": -32.61518096923828, "global_step": 55457, "epoch": 458} {"train_loss": -32.52918243408203, "global_step": 55458, "epoch": 458} {"train_loss": -32.469234466552734, "global_step": 55459, "epoch": 458} {"train_loss": -32.750465393066406, "global_step": 55460, "epoch": 458} {"train_loss": -32.47803497314453, "global_step": 55461, "epoch": 458} {"train_loss": -32.27628707885742, "global_step": 55462, "epoch": 458} {"train_loss": -32.651527404785156, "global_step": 55463, "epoch": 458} {"train_loss": -33.14179611206055, "global_step": 55464, "epoch": 458} {"train_loss": -32.5070686340332, "global_step": 55465, "epoch": 458} {"train_loss": -32.52039337158203, "global_step": 55466, "epoch": 458} {"train_loss": -32.73450469970703, "global_step": 55467, "epoch": 458} {"train_loss": -33.017181396484375, "global_step": 55468, "epoch": 458} {"train_loss": -33.33383560180664, "global_step": 55469, "epoch": 458} {"train_loss": -33.37841796875, "global_step": 55470, "epoch": 458} {"train_loss": -33.3561897277832, "global_step": 55471, "epoch": 458} {"train_loss": -32.95606231689453, "global_step": 55472, "epoch": 458} {"train_loss": -33.147884368896484, "global_step": 55473, "epoch": 458} {"train_loss": -33.60627365112305, "global_step": 55474, "epoch": 458} {"train_loss": -33.7672119140625, "global_step": 55475, "epoch": 458} {"train_loss": -33.83421325683594, "global_step": 55476, "epoch": 458} {"train_loss": -34.56533432006836, "global_step": 55477, "epoch": 458} {"train_loss": -33.85249710083008, "global_step": 55478, "epoch": 458} {"train_loss": -33.471588134765625, "global_step": 55479, "epoch": 458} {"train_loss": -33.599422454833984, "global_step": 55480, "epoch": 458} {"train_loss": -33.66040802001953, "global_step": 55481, "epoch": 458} {"train_loss": -33.91297149658203, "global_step": 55482, "epoch": 458} {"train_loss": -34.450618743896484, "global_step": 55483, "epoch": 458} {"train_loss": -33.43644332885742, "global_step": 55484, "epoch": 458} {"train_loss": -34.37561798095703, "global_step": 55485, "epoch": 458} {"train_loss": -34.5901985168457, "global_step": 55486, "epoch": 458} {"train_loss": -34.21794891357422, "global_step": 55487, "epoch": 458} {"train_loss": -34.48968505859375, "global_step": 55488, "epoch": 458} {"train_loss": -34.818946838378906, "global_step": 55489, "epoch": 458} {"train_loss": -34.938873291015625, "global_step": 55490, "epoch": 458} {"train_loss": -34.50239944458008, "global_step": 55491, "epoch": 458} {"train_loss": -34.6402587890625, "global_step": 55492, "epoch": 458} {"train_loss": -34.51578140258789, "global_step": 55493, "epoch": 458} {"train_loss": -34.751888275146484, "global_step": 55494, "epoch": 458} {"train_loss": -34.145206451416016, "global_step": 55495, "epoch": 458} {"train_loss": -34.6870002746582, "global_step": 55496, "epoch": 458} {"train_loss": -35.028358459472656, "global_step": 55497, "epoch": 458} {"train_loss": -34.83347702026367, "global_step": 55498, "epoch": 458} {"train_loss": -35.289608001708984, "global_step": 55499, "epoch": 458} {"train_loss": -34.52592468261719, "global_step": 55500, "epoch": 458} {"train_loss": -35.32007598876953, "global_step": 55501, "epoch": 458} {"train_loss": -35.20849609375, "global_step": 55502, "epoch": 458} {"train_loss": -34.84455490112305, "global_step": 55503, "epoch": 458} {"train_loss": -34.725494384765625, "global_step": 55504, "epoch": 458} {"train_loss": -33.670982360839844, "global_step": 55505, "epoch": 458} {"train_loss": -35.13660430908203, "global_step": 55506, "epoch": 458} {"train_loss": -34.693756103515625, "global_step": 55507, "epoch": 458} {"train_loss": -34.9613037109375, "global_step": 55508, "epoch": 458} {"train_loss": -34.41140365600586, "global_step": 55509, "epoch": 458} {"train_loss": -35.19774627685547, "global_step": 55510, "epoch": 458} {"train_loss": -35.499114990234375, "global_step": 55511, "epoch": 458} {"train_loss": -35.25741195678711, "global_step": 55512, "epoch": 458} {"train_loss": -35.02259826660156, "global_step": 55513, "epoch": 458} {"train_loss": -34.6451416015625, "global_step": 55514, "epoch": 458} {"train_loss": -34.797203063964844, "global_step": 55515, "epoch": 458} {"train_loss": -35.97617721557617, "global_step": 55516, "epoch": 458} {"train_loss": -35.18480682373047, "global_step": 55517, "epoch": 458} {"train_loss": -35.4870491027832, "global_step": 55518, "epoch": 458} {"train_loss": -35.483882904052734, "global_step": 55519, "epoch": 458} {"train_loss": -35.34089660644531, "global_step": 55520, "epoch": 458} {"train_loss": -35.60049057006836, "global_step": 55521, "epoch": 458} {"train_loss": -35.333126068115234, "global_step": 55522, "epoch": 458} {"train_loss": -35.404781341552734, "global_step": 55523, "epoch": 458} {"train_loss": -35.373348236083984, "global_step": 55524, "epoch": 458} {"train_loss": -35.780696868896484, "global_step": 55525, "epoch": 458} {"train_loss": -34.94614791870117, "global_step": 55526, "epoch": 458} {"train_loss": -35.85774612426758, "global_step": 55527, "epoch": 458} {"train_loss": -34.895450592041016, "global_step": 55528, "epoch": 458} {"train_loss": -34.3764762878418, "global_step": 55529, "epoch": 458} {"train_loss": -33.613582611083984, "global_step": 55530, "epoch": 458} {"train_loss": -32.7001838684082, "global_step": 55531, "epoch": 458} {"train_loss": -34.95165252685547, "global_step": 55532, "epoch": 458} {"train_loss": -35.95303726196289, "global_step": 55533, "epoch": 458} {"train_loss": -34.35697937011719, "global_step": 55534, "epoch": 458} {"train_loss": -32.15906524658203, "global_step": 55535, "epoch": 458} {"train_loss": -30.783353805541992, "global_step": 55536, "epoch": 458} {"train_loss": -33.52717590332031, "global_step": 55537, "epoch": 458} {"train_loss": -32.772586121046835, "global_step": 55538, "epoch": 458, "val_loss": 2561606.25} {"train_loss": -33.85480499267578, "global_step": 55539, "epoch": 459} {"train_loss": -34.906253814697266, "global_step": 55540, "epoch": 459} {"train_loss": -35.496124267578125, "global_step": 55541, "epoch": 459} {"train_loss": -33.91522216796875, "global_step": 55542, "epoch": 459} {"train_loss": -35.36125183105469, "global_step": 55543, "epoch": 459} {"train_loss": -35.28324508666992, "global_step": 55544, "epoch": 459} {"train_loss": -34.84029769897461, "global_step": 55545, "epoch": 459} {"train_loss": -35.360260009765625, "global_step": 55546, "epoch": 459} {"train_loss": -35.285736083984375, "global_step": 55547, "epoch": 459} {"train_loss": -35.306636810302734, "global_step": 55548, "epoch": 459} {"train_loss": -35.3120231628418, "global_step": 55549, "epoch": 459} {"train_loss": -35.49794387817383, "global_step": 55550, "epoch": 459} {"train_loss": -35.69944763183594, "global_step": 55551, "epoch": 459} {"train_loss": -35.644012451171875, "global_step": 55552, "epoch": 459} {"train_loss": -36.03223419189453, "global_step": 55553, "epoch": 459} {"train_loss": -35.40976333618164, "global_step": 55554, "epoch": 459} {"train_loss": -36.085784912109375, "global_step": 55555, "epoch": 459} {"train_loss": -36.16289138793945, "global_step": 55556, "epoch": 459} {"train_loss": -35.69755172729492, "global_step": 55557, "epoch": 459} {"train_loss": -35.41415023803711, "global_step": 55558, "epoch": 459} {"train_loss": -35.99965286254883, "global_step": 55559, "epoch": 459} {"train_loss": -36.0999870300293, "global_step": 55560, "epoch": 459} {"train_loss": -35.92176055908203, "global_step": 55561, "epoch": 459} {"train_loss": -36.278846740722656, "global_step": 55562, "epoch": 459} {"train_loss": -36.37739562988281, "global_step": 55563, "epoch": 459} {"train_loss": -36.42585372924805, "global_step": 55564, "epoch": 459} {"train_loss": -36.93523025512695, "global_step": 55565, "epoch": 459} {"train_loss": -36.64179611206055, "global_step": 55566, "epoch": 459} {"train_loss": -35.6408576965332, "global_step": 55567, "epoch": 459} {"train_loss": -36.12025451660156, "global_step": 55568, "epoch": 459} {"train_loss": -36.916378021240234, "global_step": 55569, "epoch": 459} {"train_loss": -36.10624694824219, "global_step": 55570, "epoch": 459} {"train_loss": -37.05453109741211, "global_step": 55571, "epoch": 459} {"train_loss": -36.7775993347168, "global_step": 55572, "epoch": 459} {"train_loss": -37.07662582397461, "global_step": 55573, "epoch": 459} {"train_loss": -36.98305892944336, "global_step": 55574, "epoch": 459} {"train_loss": -36.88886642456055, "global_step": 55575, "epoch": 459} {"train_loss": -36.42182159423828, "global_step": 55576, "epoch": 459} {"train_loss": -36.83643341064453, "global_step": 55577, "epoch": 459} {"train_loss": -36.905548095703125, "global_step": 55578, "epoch": 459} {"train_loss": -36.11226272583008, "global_step": 55579, "epoch": 459} {"train_loss": -37.02579116821289, "global_step": 55580, "epoch": 459} {"train_loss": -36.55615234375, "global_step": 55581, "epoch": 459} {"train_loss": -35.848697662353516, "global_step": 55582, "epoch": 459} {"train_loss": -35.97297286987305, "global_step": 55583, "epoch": 459} {"train_loss": -36.2686882019043, "global_step": 55584, "epoch": 459} {"train_loss": -37.04490280151367, "global_step": 55585, "epoch": 459} {"train_loss": -36.665992736816406, "global_step": 55586, "epoch": 459} {"train_loss": -36.194889068603516, "global_step": 55587, "epoch": 459} {"train_loss": -36.00457763671875, "global_step": 55588, "epoch": 459} {"train_loss": -33.84043502807617, "global_step": 55589, "epoch": 459} {"train_loss": -31.17119789123535, "global_step": 55590, "epoch": 459} {"train_loss": -27.490436553955078, "global_step": 55591, "epoch": 459} {"train_loss": -24.766033172607422, "global_step": 55592, "epoch": 459} {"train_loss": -32.491180419921875, "global_step": 55593, "epoch": 459} {"train_loss": -34.59294509887695, "global_step": 55594, "epoch": 459} {"train_loss": -29.691577911376953, "global_step": 55595, "epoch": 459} {"train_loss": -33.95538330078125, "global_step": 55596, "epoch": 459} {"train_loss": -34.30738830566406, "global_step": 55597, "epoch": 459} {"train_loss": -34.002132415771484, "global_step": 55598, "epoch": 459} {"train_loss": -34.1844367980957, "global_step": 55599, "epoch": 459} {"train_loss": -33.493385314941406, "global_step": 55600, "epoch": 459} {"train_loss": -35.85177230834961, "global_step": 55601, "epoch": 459} {"train_loss": -34.03827667236328, "global_step": 55602, "epoch": 459} {"train_loss": -35.02043151855469, "global_step": 55603, "epoch": 459} {"train_loss": -35.041988372802734, "global_step": 55604, "epoch": 459} {"train_loss": -34.84542465209961, "global_step": 55605, "epoch": 459} {"train_loss": -35.06797409057617, "global_step": 55606, "epoch": 459} {"train_loss": -35.17036819458008, "global_step": 55607, "epoch": 459} {"train_loss": -35.59441375732422, "global_step": 55608, "epoch": 459} {"train_loss": -35.0049934387207, "global_step": 55609, "epoch": 459} {"train_loss": -35.63332748413086, "global_step": 55610, "epoch": 459} {"train_loss": -35.736507415771484, "global_step": 55611, "epoch": 459} {"train_loss": -35.353572845458984, "global_step": 55612, "epoch": 459} {"train_loss": -36.125797271728516, "global_step": 55613, "epoch": 459} {"train_loss": -35.628780364990234, "global_step": 55614, "epoch": 459} {"train_loss": -35.52912521362305, "global_step": 55615, "epoch": 459} {"train_loss": -34.96134567260742, "global_step": 55616, "epoch": 459} {"train_loss": -36.00269317626953, "global_step": 55617, "epoch": 459} {"train_loss": -35.95295715332031, "global_step": 55618, "epoch": 459} {"train_loss": -35.727317810058594, "global_step": 55619, "epoch": 459} {"train_loss": -36.183956146240234, "global_step": 55620, "epoch": 459} {"train_loss": -36.010616302490234, "global_step": 55621, "epoch": 459} {"train_loss": -35.270118713378906, "global_step": 55622, "epoch": 459} {"train_loss": -35.42934036254883, "global_step": 55623, "epoch": 459} {"train_loss": -36.05111312866211, "global_step": 55624, "epoch": 459} {"train_loss": -35.93447494506836, "global_step": 55625, "epoch": 459} {"train_loss": -35.192787170410156, "global_step": 55626, "epoch": 459} {"train_loss": -35.500770568847656, "global_step": 55627, "epoch": 459} {"train_loss": -36.454132080078125, "global_step": 55628, "epoch": 459} {"train_loss": -35.866058349609375, "global_step": 55629, "epoch": 459} {"train_loss": -35.96771240234375, "global_step": 55630, "epoch": 459} {"train_loss": -35.56351852416992, "global_step": 55631, "epoch": 459} {"train_loss": -34.87937545776367, "global_step": 55632, "epoch": 459} {"train_loss": -34.92598342895508, "global_step": 55633, "epoch": 459} {"train_loss": -34.0999641418457, "global_step": 55634, "epoch": 459} {"train_loss": -35.20631790161133, "global_step": 55635, "epoch": 459} {"train_loss": -36.422607421875, "global_step": 55636, "epoch": 459} {"train_loss": -36.138336181640625, "global_step": 55637, "epoch": 459} {"train_loss": -36.058021545410156, "global_step": 55638, "epoch": 459} {"train_loss": -36.22493362426758, "global_step": 55639, "epoch": 459} {"train_loss": -36.58754348754883, "global_step": 55640, "epoch": 459} {"train_loss": -36.02417755126953, "global_step": 55641, "epoch": 459} {"train_loss": -36.04905319213867, "global_step": 55642, "epoch": 459} {"train_loss": -35.53902053833008, "global_step": 55643, "epoch": 459} {"train_loss": -36.197853088378906, "global_step": 55644, "epoch": 459} {"train_loss": -35.20565414428711, "global_step": 55645, "epoch": 459} {"train_loss": -34.791255950927734, "global_step": 55646, "epoch": 459} {"train_loss": -35.80189895629883, "global_step": 55647, "epoch": 459} {"train_loss": -36.262367248535156, "global_step": 55648, "epoch": 459} {"train_loss": -35.028411865234375, "global_step": 55649, "epoch": 459} {"train_loss": -35.51205825805664, "global_step": 55650, "epoch": 459} {"train_loss": -35.04136657714844, "global_step": 55651, "epoch": 459} {"train_loss": -35.116554260253906, "global_step": 55652, "epoch": 459} {"train_loss": -36.31635284423828, "global_step": 55653, "epoch": 459} {"train_loss": -35.801631927490234, "global_step": 55654, "epoch": 459} {"train_loss": -36.19513702392578, "global_step": 55655, "epoch": 459} {"train_loss": -36.329750061035156, "global_step": 55656, "epoch": 459} {"train_loss": -35.78683090209961, "global_step": 55657, "epoch": 459} {"train_loss": -35.05250930786133, "global_step": 55658, "epoch": 459} {"train_loss": -35.41428963211942, "global_step": 55659, "epoch": 459, "val_loss": 2591595.0} {"train_loss": -36.223785400390625, "global_step": 55660, "epoch": 460} {"train_loss": -35.037757873535156, "global_step": 55661, "epoch": 460} {"train_loss": -36.375057220458984, "global_step": 55662, "epoch": 460} {"train_loss": -35.426612854003906, "global_step": 55663, "epoch": 460} {"train_loss": -35.673011779785156, "global_step": 55664, "epoch": 460} {"train_loss": -35.16389465332031, "global_step": 55665, "epoch": 460} {"train_loss": -36.08867263793945, "global_step": 55666, "epoch": 460} {"train_loss": -35.965118408203125, "global_step": 55667, "epoch": 460} {"train_loss": -36.18363571166992, "global_step": 55668, "epoch": 460} {"train_loss": -35.3034782409668, "global_step": 55669, "epoch": 460} {"train_loss": -33.39136505126953, "global_step": 55670, "epoch": 460} {"train_loss": -36.07973098754883, "global_step": 55671, "epoch": 460} {"train_loss": -35.25455856323242, "global_step": 55672, "epoch": 460} {"train_loss": -35.45356750488281, "global_step": 55673, "epoch": 460} {"train_loss": -36.158870697021484, "global_step": 55674, "epoch": 460} {"train_loss": -35.41053771972656, "global_step": 55675, "epoch": 460} {"train_loss": -33.77565383911133, "global_step": 55676, "epoch": 460} {"train_loss": -34.37733840942383, "global_step": 55677, "epoch": 460} {"train_loss": -36.02755355834961, "global_step": 55678, "epoch": 460} {"train_loss": -35.68502426147461, "global_step": 55679, "epoch": 460} {"train_loss": -35.87124252319336, "global_step": 55680, "epoch": 460} {"train_loss": -35.90476608276367, "global_step": 55681, "epoch": 460} {"train_loss": -34.19104766845703, "global_step": 55682, "epoch": 460} {"train_loss": -36.12152099609375, "global_step": 55683, "epoch": 460} {"train_loss": -35.91813278198242, "global_step": 55684, "epoch": 460} {"train_loss": -34.86712646484375, "global_step": 55685, "epoch": 460} {"train_loss": -35.69564437866211, "global_step": 55686, "epoch": 460} {"train_loss": -36.793357849121094, "global_step": 55687, "epoch": 460} {"train_loss": -35.38762283325195, "global_step": 55688, "epoch": 460} {"train_loss": -36.255096435546875, "global_step": 55689, "epoch": 460} {"train_loss": -36.22651290893555, "global_step": 55690, "epoch": 460} {"train_loss": -36.66521072387695, "global_step": 55691, "epoch": 460} {"train_loss": -35.545467376708984, "global_step": 55692, "epoch": 460} {"train_loss": -35.08972930908203, "global_step": 55693, "epoch": 460} {"train_loss": -35.09489440917969, "global_step": 55694, "epoch": 460} {"train_loss": -36.138526916503906, "global_step": 55695, "epoch": 460} {"train_loss": -35.95566177368164, "global_step": 55696, "epoch": 460} {"train_loss": -35.49385070800781, "global_step": 55697, "epoch": 460} {"train_loss": -36.556640625, "global_step": 55698, "epoch": 460} {"train_loss": -34.86085510253906, "global_step": 55699, "epoch": 460} {"train_loss": -35.645633697509766, "global_step": 55700, "epoch": 460} {"train_loss": -35.70916748046875, "global_step": 55701, "epoch": 460} {"train_loss": -35.803436279296875, "global_step": 55702, "epoch": 460} {"train_loss": -33.99619674682617, "global_step": 55703, "epoch": 460} {"train_loss": -36.41608810424805, "global_step": 55704, "epoch": 460} {"train_loss": -35.11172103881836, "global_step": 55705, "epoch": 460} {"train_loss": -36.21148681640625, "global_step": 55706, "epoch": 460} {"train_loss": -35.52119827270508, "global_step": 55707, "epoch": 460} {"train_loss": -35.773555755615234, "global_step": 55708, "epoch": 460} {"train_loss": -36.09237289428711, "global_step": 55709, "epoch": 460} {"train_loss": -34.533843994140625, "global_step": 55710, "epoch": 460} {"train_loss": -35.42937469482422, "global_step": 55711, "epoch": 460} {"train_loss": -34.186702728271484, "global_step": 55712, "epoch": 460} {"train_loss": -35.4205436706543, "global_step": 55713, "epoch": 460} {"train_loss": -36.30702590942383, "global_step": 55714, "epoch": 460} {"train_loss": -36.00336837768555, "global_step": 55715, "epoch": 460} {"train_loss": -34.169490814208984, "global_step": 55716, "epoch": 460} {"train_loss": -34.002410888671875, "global_step": 55717, "epoch": 460} {"train_loss": -33.995628356933594, "global_step": 55718, "epoch": 460} {"train_loss": -35.10093688964844, "global_step": 55719, "epoch": 460} {"train_loss": -34.77259063720703, "global_step": 55720, "epoch": 460} {"train_loss": -34.92787551879883, "global_step": 55721, "epoch": 460} {"train_loss": -35.42056655883789, "global_step": 55722, "epoch": 460} {"train_loss": -34.48501205444336, "global_step": 55723, "epoch": 460} {"train_loss": -35.55038833618164, "global_step": 55724, "epoch": 460} {"train_loss": -35.555702209472656, "global_step": 55725, "epoch": 460} {"train_loss": -35.167503356933594, "global_step": 55726, "epoch": 460} {"train_loss": -36.23408126831055, "global_step": 55727, "epoch": 460} {"train_loss": -35.135005950927734, "global_step": 55728, "epoch": 460} {"train_loss": -35.03190231323242, "global_step": 55729, "epoch": 460} {"train_loss": -35.90891647338867, "global_step": 55730, "epoch": 460} {"train_loss": -35.00972366333008, "global_step": 55731, "epoch": 460} {"train_loss": -35.71568298339844, "global_step": 55732, "epoch": 460} {"train_loss": -35.34901809692383, "global_step": 55733, "epoch": 460} {"train_loss": -36.17116928100586, "global_step": 55734, "epoch": 460} {"train_loss": -35.736690521240234, "global_step": 55735, "epoch": 460} {"train_loss": -35.51271438598633, "global_step": 55736, "epoch": 460} {"train_loss": -36.32061767578125, "global_step": 55737, "epoch": 460} {"train_loss": -35.56624984741211, "global_step": 55738, "epoch": 460} {"train_loss": -35.79357147216797, "global_step": 55739, "epoch": 460} {"train_loss": -36.23568344116211, "global_step": 55740, "epoch": 460} {"train_loss": -34.28872299194336, "global_step": 55741, "epoch": 460} {"train_loss": -35.38433837890625, "global_step": 55742, "epoch": 460} {"train_loss": -35.65507125854492, "global_step": 55743, "epoch": 460} {"train_loss": -34.778560638427734, "global_step": 55744, "epoch": 460} {"train_loss": -35.58768844604492, "global_step": 55745, "epoch": 460} {"train_loss": -35.04420852661133, "global_step": 55746, "epoch": 460} {"train_loss": -35.57912063598633, "global_step": 55747, "epoch": 460} {"train_loss": -36.36792755126953, "global_step": 55748, "epoch": 460} {"train_loss": -35.35595703125, "global_step": 55749, "epoch": 460} {"train_loss": -35.4978141784668, "global_step": 55750, "epoch": 460} {"train_loss": -36.106773376464844, "global_step": 55751, "epoch": 460} {"train_loss": -35.1655387878418, "global_step": 55752, "epoch": 460} {"train_loss": -36.19868850708008, "global_step": 55753, "epoch": 460} {"train_loss": -35.72075271606445, "global_step": 55754, "epoch": 460} {"train_loss": -35.9210090637207, "global_step": 55755, "epoch": 460} {"train_loss": -36.053401947021484, "global_step": 55756, "epoch": 460} {"train_loss": -35.14207077026367, "global_step": 55757, "epoch": 460} {"train_loss": -36.2250862121582, "global_step": 55758, "epoch": 460} {"train_loss": -35.81997299194336, "global_step": 55759, "epoch": 460} {"train_loss": -35.132347106933594, "global_step": 55760, "epoch": 460} {"train_loss": -36.06954574584961, "global_step": 55761, "epoch": 460} {"train_loss": -35.93798828125, "global_step": 55762, "epoch": 460} {"train_loss": -35.954959869384766, "global_step": 55763, "epoch": 460} {"train_loss": -35.73786163330078, "global_step": 55764, "epoch": 460} {"train_loss": -35.888423919677734, "global_step": 55765, "epoch": 460} {"train_loss": -34.81547164916992, "global_step": 55766, "epoch": 460} {"train_loss": -35.24637985229492, "global_step": 55767, "epoch": 460} {"train_loss": -35.37952423095703, "global_step": 55768, "epoch": 460} {"train_loss": -35.45327377319336, "global_step": 55769, "epoch": 460} {"train_loss": -36.2342414855957, "global_step": 55770, "epoch": 460} {"train_loss": -34.85355758666992, "global_step": 55771, "epoch": 460} {"train_loss": -33.46419906616211, "global_step": 55772, "epoch": 460} {"train_loss": -34.737274169921875, "global_step": 55773, "epoch": 460} {"train_loss": -31.69917869567871, "global_step": 55774, "epoch": 460} {"train_loss": -26.902912139892578, "global_step": 55775, "epoch": 460} {"train_loss": -12.376866340637207, "global_step": 55776, "epoch": 460} {"train_loss": 19.640026092529297, "global_step": 55777, "epoch": 460} {"train_loss": -1.7904748916625977, "global_step": 55778, "epoch": 460} {"train_loss": -34.25583267211914, "global_step": 55779, "epoch": 460} {"train_loss": -34.289498132122446, "global_step": 55780, "epoch": 460, "val_loss": 2572704.5} {"train_loss": -33.17616653442383, "global_step": 55781, "epoch": 461} {"train_loss": -27.270782470703125, "global_step": 55782, "epoch": 461} {"train_loss": -27.40168571472168, "global_step": 55783, "epoch": 461} {"train_loss": -32.92268753051758, "global_step": 55784, "epoch": 461} {"train_loss": -28.977603912353516, "global_step": 55785, "epoch": 461} {"train_loss": -28.5023193359375, "global_step": 55786, "epoch": 461} {"train_loss": -33.18937301635742, "global_step": 55787, "epoch": 461} {"train_loss": -32.74393844604492, "global_step": 55788, "epoch": 461} {"train_loss": -29.950519561767578, "global_step": 55789, "epoch": 461} {"train_loss": -32.43104934692383, "global_step": 55790, "epoch": 461} {"train_loss": -32.829750061035156, "global_step": 55791, "epoch": 461} {"train_loss": -33.1528205871582, "global_step": 55792, "epoch": 461} {"train_loss": -32.631866455078125, "global_step": 55793, "epoch": 461} {"train_loss": -30.8153076171875, "global_step": 55794, "epoch": 461} {"train_loss": -32.4295654296875, "global_step": 55795, "epoch": 461} {"train_loss": -33.723182678222656, "global_step": 55796, "epoch": 461} {"train_loss": -32.916839599609375, "global_step": 55797, "epoch": 461} {"train_loss": -33.06639862060547, "global_step": 55798, "epoch": 461} {"train_loss": -32.85995101928711, "global_step": 55799, "epoch": 461} {"train_loss": -32.91984939575195, "global_step": 55800, "epoch": 461} {"train_loss": -33.60573959350586, "global_step": 55801, "epoch": 461} {"train_loss": -33.8658561706543, "global_step": 55802, "epoch": 461} {"train_loss": -33.14742660522461, "global_step": 55803, "epoch": 461} {"train_loss": -33.37200927734375, "global_step": 55804, "epoch": 461} {"train_loss": -33.37274932861328, "global_step": 55805, "epoch": 461} {"train_loss": -34.011165618896484, "global_step": 55806, "epoch": 461} {"train_loss": -33.665992736816406, "global_step": 55807, "epoch": 461} {"train_loss": -34.586334228515625, "global_step": 55808, "epoch": 461} {"train_loss": -33.90944290161133, "global_step": 55809, "epoch": 461} {"train_loss": -34.22930145263672, "global_step": 55810, "epoch": 461} {"train_loss": -34.031768798828125, "global_step": 55811, "epoch": 461} {"train_loss": -34.47228240966797, "global_step": 55812, "epoch": 461} {"train_loss": -34.48414993286133, "global_step": 55813, "epoch": 461} {"train_loss": -34.690589904785156, "global_step": 55814, "epoch": 461} {"train_loss": -34.89907455444336, "global_step": 55815, "epoch": 461} {"train_loss": -33.961402893066406, "global_step": 55816, "epoch": 461} {"train_loss": -34.46041488647461, "global_step": 55817, "epoch": 461} {"train_loss": -34.85712432861328, "global_step": 55818, "epoch": 461} {"train_loss": -34.38444900512695, "global_step": 55819, "epoch": 461} {"train_loss": -35.03384017944336, "global_step": 55820, "epoch": 461} {"train_loss": -35.105167388916016, "global_step": 55821, "epoch": 461} {"train_loss": -35.140316009521484, "global_step": 55822, "epoch": 461} {"train_loss": -35.07216262817383, "global_step": 55823, "epoch": 461} {"train_loss": -34.750633239746094, "global_step": 55824, "epoch": 461} {"train_loss": -35.16109848022461, "global_step": 55825, "epoch": 461} {"train_loss": -35.2090950012207, "global_step": 55826, "epoch": 461} {"train_loss": -34.776832580566406, "global_step": 55827, "epoch": 461} {"train_loss": -35.706417083740234, "global_step": 55828, "epoch": 461} {"train_loss": -35.06972122192383, "global_step": 55829, "epoch": 461} {"train_loss": -35.20306396484375, "global_step": 55830, "epoch": 461} {"train_loss": -35.12041091918945, "global_step": 55831, "epoch": 461} {"train_loss": -35.528533935546875, "global_step": 55832, "epoch": 461} {"train_loss": -35.55928421020508, "global_step": 55833, "epoch": 461} {"train_loss": -35.604183197021484, "global_step": 55834, "epoch": 461} {"train_loss": -35.72941970825195, "global_step": 55835, "epoch": 461} {"train_loss": -35.713340759277344, "global_step": 55836, "epoch": 461} {"train_loss": -35.54052734375, "global_step": 55837, "epoch": 461} {"train_loss": -35.64065170288086, "global_step": 55838, "epoch": 461} {"train_loss": -35.64670944213867, "global_step": 55839, "epoch": 461} {"train_loss": -35.84304428100586, "global_step": 55840, "epoch": 461} {"train_loss": -35.95925521850586, "global_step": 55841, "epoch": 461} {"train_loss": -35.88113021850586, "global_step": 55842, "epoch": 461} {"train_loss": -35.81234359741211, "global_step": 55843, "epoch": 461} {"train_loss": -35.99686813354492, "global_step": 55844, "epoch": 461} {"train_loss": -35.62971115112305, "global_step": 55845, "epoch": 461} {"train_loss": -35.9023323059082, "global_step": 55846, "epoch": 461} {"train_loss": -36.015079498291016, "global_step": 55847, "epoch": 461} {"train_loss": -36.432193756103516, "global_step": 55848, "epoch": 461} {"train_loss": -36.233970642089844, "global_step": 55849, "epoch": 461} {"train_loss": -36.138671875, "global_step": 55850, "epoch": 461} {"train_loss": -36.59726333618164, "global_step": 55851, "epoch": 461} {"train_loss": -36.07168960571289, "global_step": 55852, "epoch": 461} {"train_loss": -36.3287353515625, "global_step": 55853, "epoch": 461} {"train_loss": -36.21912384033203, "global_step": 55854, "epoch": 461} {"train_loss": -36.296932220458984, "global_step": 55855, "epoch": 461} {"train_loss": -36.61603546142578, "global_step": 55856, "epoch": 461} {"train_loss": -36.23847198486328, "global_step": 55857, "epoch": 461} {"train_loss": -36.50519561767578, "global_step": 55858, "epoch": 461} {"train_loss": -36.194671630859375, "global_step": 55859, "epoch": 461} {"train_loss": -36.40243148803711, "global_step": 55860, "epoch": 461} {"train_loss": -35.69265365600586, "global_step": 55861, "epoch": 461} {"train_loss": -36.0427360534668, "global_step": 55862, "epoch": 461} {"train_loss": -35.79412841796875, "global_step": 55863, "epoch": 461} {"train_loss": -36.08550262451172, "global_step": 55864, "epoch": 461} {"train_loss": -35.25338363647461, "global_step": 55865, "epoch": 461} {"train_loss": -34.08277130126953, "global_step": 55866, "epoch": 461} {"train_loss": -32.14060592651367, "global_step": 55867, "epoch": 461} {"train_loss": -32.907711029052734, "global_step": 55868, "epoch": 461} {"train_loss": -35.14704513549805, "global_step": 55869, "epoch": 461} {"train_loss": -36.68258285522461, "global_step": 55870, "epoch": 461} {"train_loss": -35.6484375, "global_step": 55871, "epoch": 461} {"train_loss": -35.63480758666992, "global_step": 55872, "epoch": 461} {"train_loss": -36.56576156616211, "global_step": 55873, "epoch": 461} {"train_loss": -34.79409408569336, "global_step": 55874, "epoch": 461} {"train_loss": -35.30942916870117, "global_step": 55875, "epoch": 461} {"train_loss": -36.20026779174805, "global_step": 55876, "epoch": 461} {"train_loss": -34.580665588378906, "global_step": 55877, "epoch": 461} {"train_loss": -35.26259994506836, "global_step": 55878, "epoch": 461} {"train_loss": -35.97666549682617, "global_step": 55879, "epoch": 461} {"train_loss": -34.612361907958984, "global_step": 55880, "epoch": 461} {"train_loss": -34.6683235168457, "global_step": 55881, "epoch": 461} {"train_loss": -32.21445083618164, "global_step": 55882, "epoch": 461} {"train_loss": -32.36643981933594, "global_step": 55883, "epoch": 461} {"train_loss": -33.51557540893555, "global_step": 55884, "epoch": 461} {"train_loss": -34.550777435302734, "global_step": 55885, "epoch": 461} {"train_loss": -34.75453567504883, "global_step": 55886, "epoch": 461} {"train_loss": -32.808509826660156, "global_step": 55887, "epoch": 461} {"train_loss": -33.808773040771484, "global_step": 55888, "epoch": 461} {"train_loss": -34.7441291809082, "global_step": 55889, "epoch": 461} {"train_loss": -34.21722412109375, "global_step": 55890, "epoch": 461} {"train_loss": -33.21912384033203, "global_step": 55891, "epoch": 461} {"train_loss": -33.627071380615234, "global_step": 55892, "epoch": 461} {"train_loss": -35.382720947265625, "global_step": 55893, "epoch": 461} {"train_loss": -35.06458282470703, "global_step": 55894, "epoch": 461} {"train_loss": -34.1250114440918, "global_step": 55895, "epoch": 461} {"train_loss": -34.72221755981445, "global_step": 55896, "epoch": 461} {"train_loss": -35.75023651123047, "global_step": 55897, "epoch": 461} {"train_loss": -34.13325881958008, "global_step": 55898, "epoch": 461} {"train_loss": -35.24460983276367, "global_step": 55899, "epoch": 461} {"train_loss": -35.34064865112305, "global_step": 55900, "epoch": 461} {"train_loss": -34.47152191351268, "global_step": 55901, "epoch": 461, "val_loss": 2689381.5} {"train_loss": -35.51996994018555, "global_step": 55902, "epoch": 462} {"train_loss": -34.83674240112305, "global_step": 55903, "epoch": 462} {"train_loss": -34.93806838989258, "global_step": 55904, "epoch": 462} {"train_loss": -35.5044059753418, "global_step": 55905, "epoch": 462} {"train_loss": -34.5065803527832, "global_step": 55906, "epoch": 462} {"train_loss": -35.625057220458984, "global_step": 55907, "epoch": 462} {"train_loss": -34.83628463745117, "global_step": 55908, "epoch": 462} {"train_loss": -35.188255310058594, "global_step": 55909, "epoch": 462} {"train_loss": -33.126220703125, "global_step": 55910, "epoch": 462} {"train_loss": -35.20551681518555, "global_step": 55911, "epoch": 462} {"train_loss": -33.97125244140625, "global_step": 55912, "epoch": 462} {"train_loss": -35.02512741088867, "global_step": 55913, "epoch": 462} {"train_loss": -34.332496643066406, "global_step": 55914, "epoch": 462} {"train_loss": -34.14626693725586, "global_step": 55915, "epoch": 462} {"train_loss": -34.10353469848633, "global_step": 55916, "epoch": 462} {"train_loss": -34.09100341796875, "global_step": 55917, "epoch": 462} {"train_loss": -33.42133331298828, "global_step": 55918, "epoch": 462} {"train_loss": -33.516136169433594, "global_step": 55919, "epoch": 462} {"train_loss": -33.505615234375, "global_step": 55920, "epoch": 462} {"train_loss": -34.95087814331055, "global_step": 55921, "epoch": 462} {"train_loss": -32.9031982421875, "global_step": 55922, "epoch": 462} {"train_loss": -35.298065185546875, "global_step": 55923, "epoch": 462} {"train_loss": -33.91034698486328, "global_step": 55924, "epoch": 462} {"train_loss": -35.23603439331055, "global_step": 55925, "epoch": 462} {"train_loss": -35.42573165893555, "global_step": 55926, "epoch": 462} {"train_loss": -34.161598205566406, "global_step": 55927, "epoch": 462} {"train_loss": -34.66958236694336, "global_step": 55928, "epoch": 462} {"train_loss": -35.18605422973633, "global_step": 55929, "epoch": 462} {"train_loss": -35.46230697631836, "global_step": 55930, "epoch": 462} {"train_loss": -34.819068908691406, "global_step": 55931, "epoch": 462} {"train_loss": -35.904571533203125, "global_step": 55932, "epoch": 462} {"train_loss": -34.74457931518555, "global_step": 55933, "epoch": 462} {"train_loss": -34.7480354309082, "global_step": 55934, "epoch": 462} {"train_loss": -34.84620666503906, "global_step": 55935, "epoch": 462} {"train_loss": -35.899169921875, "global_step": 55936, "epoch": 462} {"train_loss": -35.483551025390625, "global_step": 55937, "epoch": 462} {"train_loss": -35.41499710083008, "global_step": 55938, "epoch": 462} {"train_loss": -35.745906829833984, "global_step": 55939, "epoch": 462} {"train_loss": -35.77769088745117, "global_step": 55940, "epoch": 462} {"train_loss": -35.63582992553711, "global_step": 55941, "epoch": 462} {"train_loss": -35.36806869506836, "global_step": 55942, "epoch": 462} {"train_loss": -35.537391662597656, "global_step": 55943, "epoch": 462} {"train_loss": -35.48736572265625, "global_step": 55944, "epoch": 462} {"train_loss": -35.531524658203125, "global_step": 55945, "epoch": 462} {"train_loss": -35.64503860473633, "global_step": 55946, "epoch": 462} {"train_loss": -35.72249984741211, "global_step": 55947, "epoch": 462} {"train_loss": -34.61072540283203, "global_step": 55948, "epoch": 462} {"train_loss": -35.2276725769043, "global_step": 55949, "epoch": 462} {"train_loss": -35.085662841796875, "global_step": 55950, "epoch": 462} {"train_loss": -35.716651916503906, "global_step": 55951, "epoch": 462} {"train_loss": -34.772830963134766, "global_step": 55952, "epoch": 462} {"train_loss": -35.161312103271484, "global_step": 55953, "epoch": 462} {"train_loss": -35.370513916015625, "global_step": 55954, "epoch": 462} {"train_loss": -35.72185134887695, "global_step": 55955, "epoch": 462} {"train_loss": -35.58464431762695, "global_step": 55956, "epoch": 462} {"train_loss": -36.350181579589844, "global_step": 55957, "epoch": 462} {"train_loss": -35.7779541015625, "global_step": 55958, "epoch": 462} {"train_loss": -34.92291259765625, "global_step": 55959, "epoch": 462} {"train_loss": -36.444557189941406, "global_step": 55960, "epoch": 462} {"train_loss": -35.579139709472656, "global_step": 55961, "epoch": 462} {"train_loss": -35.56708526611328, "global_step": 55962, "epoch": 462} {"train_loss": -36.3172607421875, "global_step": 55963, "epoch": 462} {"train_loss": -32.93278884887695, "global_step": 55964, "epoch": 462} {"train_loss": -35.804012298583984, "global_step": 55965, "epoch": 462} {"train_loss": -35.23044967651367, "global_step": 55966, "epoch": 462} {"train_loss": -35.07963943481445, "global_step": 55967, "epoch": 462} {"train_loss": -36.30930709838867, "global_step": 55968, "epoch": 462} {"train_loss": -35.327606201171875, "global_step": 55969, "epoch": 462} {"train_loss": -36.21370315551758, "global_step": 55970, "epoch": 462} {"train_loss": -35.98760986328125, "global_step": 55971, "epoch": 462} {"train_loss": -35.91950225830078, "global_step": 55972, "epoch": 462} {"train_loss": -34.735469818115234, "global_step": 55973, "epoch": 462} {"train_loss": -35.15180587768555, "global_step": 55974, "epoch": 462} {"train_loss": -36.009254455566406, "global_step": 55975, "epoch": 462} {"train_loss": -35.348365783691406, "global_step": 55976, "epoch": 462} {"train_loss": -35.101375579833984, "global_step": 55977, "epoch": 462} {"train_loss": -35.757835388183594, "global_step": 55978, "epoch": 462} {"train_loss": -35.29987716674805, "global_step": 55979, "epoch": 462} {"train_loss": -35.59920120239258, "global_step": 55980, "epoch": 462} {"train_loss": -34.471153259277344, "global_step": 55981, "epoch": 462} {"train_loss": -36.05320358276367, "global_step": 55982, "epoch": 462} {"train_loss": -35.528804779052734, "global_step": 55983, "epoch": 462} {"train_loss": -34.874080657958984, "global_step": 55984, "epoch": 462} {"train_loss": -36.107994079589844, "global_step": 55985, "epoch": 462} {"train_loss": -35.64173889160156, "global_step": 55986, "epoch": 462} {"train_loss": -35.07137680053711, "global_step": 55987, "epoch": 462} {"train_loss": -35.88405227661133, "global_step": 55988, "epoch": 462} {"train_loss": -35.47845458984375, "global_step": 55989, "epoch": 462} {"train_loss": -34.5423583984375, "global_step": 55990, "epoch": 462} {"train_loss": -35.69430160522461, "global_step": 55991, "epoch": 462} {"train_loss": -35.587623596191406, "global_step": 55992, "epoch": 462} {"train_loss": -34.93092727661133, "global_step": 55993, "epoch": 462} {"train_loss": -32.73867416381836, "global_step": 55994, "epoch": 462} {"train_loss": -33.783321380615234, "global_step": 55995, "epoch": 462} {"train_loss": -31.298431396484375, "global_step": 55996, "epoch": 462} {"train_loss": -30.856201171875, "global_step": 55997, "epoch": 462} {"train_loss": -32.08702850341797, "global_step": 55998, "epoch": 462} {"train_loss": -33.99294662475586, "global_step": 55999, "epoch": 462} {"train_loss": -31.49810218811035, "global_step": 56000, "epoch": 462} {"train_loss": -32.78208923339844, "global_step": 56001, "epoch": 462} {"train_loss": -34.86766052246094, "global_step": 56002, "epoch": 462} {"train_loss": -32.318939208984375, "global_step": 56003, "epoch": 462} {"train_loss": -31.792200088500977, "global_step": 56004, "epoch": 462} {"train_loss": -31.173816680908203, "global_step": 56005, "epoch": 462} {"train_loss": -35.137176513671875, "global_step": 56006, "epoch": 462} {"train_loss": -33.137046813964844, "global_step": 56007, "epoch": 462} {"train_loss": -33.0242805480957, "global_step": 56008, "epoch": 462} {"train_loss": -33.398921966552734, "global_step": 56009, "epoch": 462} {"train_loss": -32.75860595703125, "global_step": 56010, "epoch": 462} {"train_loss": -31.618371963500977, "global_step": 56011, "epoch": 462} {"train_loss": -33.04063034057617, "global_step": 56012, "epoch": 462} {"train_loss": -34.1180534362793, "global_step": 56013, "epoch": 462} {"train_loss": -34.18562316894531, "global_step": 56014, "epoch": 462} {"train_loss": -33.04011154174805, "global_step": 56015, "epoch": 462} {"train_loss": -33.614662170410156, "global_step": 56016, "epoch": 462} {"train_loss": -34.92403030395508, "global_step": 56017, "epoch": 462} {"train_loss": -33.12355422973633, "global_step": 56018, "epoch": 462} {"train_loss": -32.72663497924805, "global_step": 56019, "epoch": 462} {"train_loss": -33.54948806762695, "global_step": 56020, "epoch": 462} {"train_loss": -33.789371490478516, "global_step": 56021, "epoch": 462} {"train_loss": -34.639636410169366, "global_step": 56022, "epoch": 462, "val_loss": 2517580.75} {"train_loss": -32.82461166381836, "global_step": 56023, "epoch": 463} {"train_loss": -33.69993591308594, "global_step": 56024, "epoch": 463} {"train_loss": -33.44258499145508, "global_step": 56025, "epoch": 463} {"train_loss": -33.286041259765625, "global_step": 56026, "epoch": 463} {"train_loss": -34.44743728637695, "global_step": 56027, "epoch": 463} {"train_loss": -33.689537048339844, "global_step": 56028, "epoch": 463} {"train_loss": -33.88117218017578, "global_step": 56029, "epoch": 463} {"train_loss": -33.674190521240234, "global_step": 56030, "epoch": 463} {"train_loss": -32.75813293457031, "global_step": 56031, "epoch": 463} {"train_loss": -33.614112854003906, "global_step": 56032, "epoch": 463} {"train_loss": -33.751617431640625, "global_step": 56033, "epoch": 463} {"train_loss": -34.080780029296875, "global_step": 56034, "epoch": 463} {"train_loss": -31.51832389831543, "global_step": 56035, "epoch": 463} {"train_loss": -33.93547821044922, "global_step": 56036, "epoch": 463} {"train_loss": -34.32246017456055, "global_step": 56037, "epoch": 463} {"train_loss": -34.363258361816406, "global_step": 56038, "epoch": 463} {"train_loss": -34.5482292175293, "global_step": 56039, "epoch": 463} {"train_loss": -34.667755126953125, "global_step": 56040, "epoch": 463} {"train_loss": -34.482975006103516, "global_step": 56041, "epoch": 463} {"train_loss": -35.06574249267578, "global_step": 56042, "epoch": 463} {"train_loss": -34.1667366027832, "global_step": 56043, "epoch": 463} {"train_loss": -35.00397491455078, "global_step": 56044, "epoch": 463} {"train_loss": -34.364967346191406, "global_step": 56045, "epoch": 463} {"train_loss": -34.42291259765625, "global_step": 56046, "epoch": 463} {"train_loss": -34.91816329956055, "global_step": 56047, "epoch": 463} {"train_loss": -34.9390869140625, "global_step": 56048, "epoch": 463} {"train_loss": -32.762908935546875, "global_step": 56049, "epoch": 463} {"train_loss": -34.84853744506836, "global_step": 56050, "epoch": 463} {"train_loss": -34.628211975097656, "global_step": 56051, "epoch": 463} {"train_loss": -34.500484466552734, "global_step": 56052, "epoch": 463} {"train_loss": -34.82756423950195, "global_step": 56053, "epoch": 463} {"train_loss": -35.23179244995117, "global_step": 56054, "epoch": 463} {"train_loss": -35.47773361206055, "global_step": 56055, "epoch": 463} {"train_loss": -34.806461334228516, "global_step": 56056, "epoch": 463} {"train_loss": -34.810489654541016, "global_step": 56057, "epoch": 463} {"train_loss": -35.50022506713867, "global_step": 56058, "epoch": 463} {"train_loss": -35.16331100463867, "global_step": 56059, "epoch": 463} {"train_loss": -35.543846130371094, "global_step": 56060, "epoch": 463} {"train_loss": -35.11983871459961, "global_step": 56061, "epoch": 463} {"train_loss": -35.51455307006836, "global_step": 56062, "epoch": 463} {"train_loss": -35.47646713256836, "global_step": 56063, "epoch": 463} {"train_loss": -34.86549758911133, "global_step": 56064, "epoch": 463} {"train_loss": -35.18022537231445, "global_step": 56065, "epoch": 463} {"train_loss": -35.321632385253906, "global_step": 56066, "epoch": 463} {"train_loss": -35.60740280151367, "global_step": 56067, "epoch": 463} {"train_loss": -35.00883483886719, "global_step": 56068, "epoch": 463} {"train_loss": -35.173431396484375, "global_step": 56069, "epoch": 463} {"train_loss": -35.87517547607422, "global_step": 56070, "epoch": 463} {"train_loss": -35.2884521484375, "global_step": 56071, "epoch": 463} {"train_loss": -35.68028259277344, "global_step": 56072, "epoch": 463} {"train_loss": -35.39299392700195, "global_step": 56073, "epoch": 463} {"train_loss": -35.913841247558594, "global_step": 56074, "epoch": 463} {"train_loss": -35.67546463012695, "global_step": 56075, "epoch": 463} {"train_loss": -35.80951690673828, "global_step": 56076, "epoch": 463} {"train_loss": -36.034088134765625, "global_step": 56077, "epoch": 463} {"train_loss": -35.90576934814453, "global_step": 56078, "epoch": 463} {"train_loss": -35.931190490722656, "global_step": 56079, "epoch": 463} {"train_loss": -35.878875732421875, "global_step": 56080, "epoch": 463} {"train_loss": -36.08552932739258, "global_step": 56081, "epoch": 463} {"train_loss": -35.92141342163086, "global_step": 56082, "epoch": 463} {"train_loss": -35.98051071166992, "global_step": 56083, "epoch": 463} {"train_loss": -35.84587478637695, "global_step": 56084, "epoch": 463} {"train_loss": -36.0275993347168, "global_step": 56085, "epoch": 463} {"train_loss": -36.229698181152344, "global_step": 56086, "epoch": 463} {"train_loss": -36.34782791137695, "global_step": 56087, "epoch": 463} {"train_loss": -36.2671012878418, "global_step": 56088, "epoch": 463} {"train_loss": -36.75494384765625, "global_step": 56089, "epoch": 463} {"train_loss": -36.111572265625, "global_step": 56090, "epoch": 463} {"train_loss": -36.626800537109375, "global_step": 56091, "epoch": 463} {"train_loss": -36.260623931884766, "global_step": 56092, "epoch": 463} {"train_loss": -36.45317840576172, "global_step": 56093, "epoch": 463} {"train_loss": -36.57538986206055, "global_step": 56094, "epoch": 463} {"train_loss": -36.01442337036133, "global_step": 56095, "epoch": 463} {"train_loss": -36.094295501708984, "global_step": 56096, "epoch": 463} {"train_loss": -35.953956604003906, "global_step": 56097, "epoch": 463} {"train_loss": -33.913299560546875, "global_step": 56098, "epoch": 463} {"train_loss": -32.580989837646484, "global_step": 56099, "epoch": 463} {"train_loss": -28.934656143188477, "global_step": 56100, "epoch": 463} {"train_loss": -23.152225494384766, "global_step": 56101, "epoch": 463} {"train_loss": -26.448713302612305, "global_step": 56102, "epoch": 463} {"train_loss": -35.207942962646484, "global_step": 56103, "epoch": 463} {"train_loss": -32.82101821899414, "global_step": 56104, "epoch": 463} {"train_loss": -29.293670654296875, "global_step": 56105, "epoch": 463} {"train_loss": -35.01490020751953, "global_step": 56106, "epoch": 463} {"train_loss": -31.23298454284668, "global_step": 56107, "epoch": 463} {"train_loss": -34.29989242553711, "global_step": 56108, "epoch": 463} {"train_loss": -33.672080993652344, "global_step": 56109, "epoch": 463} {"train_loss": -31.901330947875977, "global_step": 56110, "epoch": 463} {"train_loss": -33.704017639160156, "global_step": 56111, "epoch": 463} {"train_loss": -34.80547332763672, "global_step": 56112, "epoch": 463} {"train_loss": -33.44599533081055, "global_step": 56113, "epoch": 463} {"train_loss": -34.689754486083984, "global_step": 56114, "epoch": 463} {"train_loss": -32.998573303222656, "global_step": 56115, "epoch": 463} {"train_loss": -33.68062973022461, "global_step": 56116, "epoch": 463} {"train_loss": -32.46381759643555, "global_step": 56117, "epoch": 463} {"train_loss": -34.28010559082031, "global_step": 56118, "epoch": 463} {"train_loss": -30.470712661743164, "global_step": 56119, "epoch": 463} {"train_loss": -33.53168487548828, "global_step": 56120, "epoch": 463} {"train_loss": -34.58888244628906, "global_step": 56121, "epoch": 463} {"train_loss": -33.76735305786133, "global_step": 56122, "epoch": 463} {"train_loss": -34.597232818603516, "global_step": 56123, "epoch": 463} {"train_loss": -34.263919830322266, "global_step": 56124, "epoch": 463} {"train_loss": -34.320159912109375, "global_step": 56125, "epoch": 463} {"train_loss": -34.74912643432617, "global_step": 56126, "epoch": 463} {"train_loss": -34.27311706542969, "global_step": 56127, "epoch": 463} {"train_loss": -34.6275520324707, "global_step": 56128, "epoch": 463} {"train_loss": -34.769412994384766, "global_step": 56129, "epoch": 463} {"train_loss": -35.164466857910156, "global_step": 56130, "epoch": 463} {"train_loss": -35.068294525146484, "global_step": 56131, "epoch": 463} {"train_loss": -35.072662353515625, "global_step": 56132, "epoch": 463} {"train_loss": -33.94654846191406, "global_step": 56133, "epoch": 463} {"train_loss": -35.51428985595703, "global_step": 56134, "epoch": 463} {"train_loss": -35.5904655456543, "global_step": 56135, "epoch": 463} {"train_loss": -35.3538932800293, "global_step": 56136, "epoch": 463} {"train_loss": -34.69810104370117, "global_step": 56137, "epoch": 463} {"train_loss": -35.65813064575195, "global_step": 56138, "epoch": 463} {"train_loss": -35.44149398803711, "global_step": 56139, "epoch": 463} {"train_loss": -35.550472259521484, "global_step": 56140, "epoch": 463} {"train_loss": -35.38792037963867, "global_step": 56141, "epoch": 463} {"train_loss": -35.65739822387695, "global_step": 56142, "epoch": 463} {"train_loss": -34.49880994055882, "global_step": 56143, "epoch": 463, "val_loss": 2590636.75} {"train_loss": -35.82844543457031, "global_step": 56144, "epoch": 464} {"train_loss": -35.36518478393555, "global_step": 56145, "epoch": 464} {"train_loss": -35.11701583862305, "global_step": 56146, "epoch": 464} {"train_loss": -35.259090423583984, "global_step": 56147, "epoch": 464} {"train_loss": -35.11440658569336, "global_step": 56148, "epoch": 464} {"train_loss": -35.3531494140625, "global_step": 56149, "epoch": 464} {"train_loss": -35.46244430541992, "global_step": 56150, "epoch": 464} {"train_loss": -34.760719299316406, "global_step": 56151, "epoch": 464} {"train_loss": -34.25973129272461, "global_step": 56152, "epoch": 464} {"train_loss": -34.338287353515625, "global_step": 56153, "epoch": 464} {"train_loss": -31.176925659179688, "global_step": 56154, "epoch": 464} {"train_loss": -24.461809158325195, "global_step": 56155, "epoch": 464} {"train_loss": -19.390625, "global_step": 56156, "epoch": 464} {"train_loss": -23.80403709411621, "global_step": 56157, "epoch": 464} {"train_loss": -32.799922943115234, "global_step": 56158, "epoch": 464} {"train_loss": -34.29643249511719, "global_step": 56159, "epoch": 464} {"train_loss": -31.937360763549805, "global_step": 56160, "epoch": 464} {"train_loss": -34.99575424194336, "global_step": 56161, "epoch": 464} {"train_loss": -33.054195404052734, "global_step": 56162, "epoch": 464} {"train_loss": -34.851444244384766, "global_step": 56163, "epoch": 464} {"train_loss": -33.82275390625, "global_step": 56164, "epoch": 464} {"train_loss": -35.059932708740234, "global_step": 56165, "epoch": 464} {"train_loss": -34.483245849609375, "global_step": 56166, "epoch": 464} {"train_loss": -34.877010345458984, "global_step": 56167, "epoch": 464} {"train_loss": -34.876094818115234, "global_step": 56168, "epoch": 464} {"train_loss": -34.730224609375, "global_step": 56169, "epoch": 464} {"train_loss": -34.382816314697266, "global_step": 56170, "epoch": 464} {"train_loss": -34.15447998046875, "global_step": 56171, "epoch": 464} {"train_loss": -35.472267150878906, "global_step": 56172, "epoch": 464} {"train_loss": -35.32312774658203, "global_step": 56173, "epoch": 464} {"train_loss": -34.72639083862305, "global_step": 56174, "epoch": 464} {"train_loss": -33.92667770385742, "global_step": 56175, "epoch": 464} {"train_loss": -34.8465576171875, "global_step": 56176, "epoch": 464} {"train_loss": -34.07596969604492, "global_step": 56177, "epoch": 464} {"train_loss": -35.83460235595703, "global_step": 56178, "epoch": 464} {"train_loss": -33.13486862182617, "global_step": 56179, "epoch": 464} {"train_loss": -34.676021575927734, "global_step": 56180, "epoch": 464} {"train_loss": -34.42440414428711, "global_step": 56181, "epoch": 464} {"train_loss": -34.806182861328125, "global_step": 56182, "epoch": 464} {"train_loss": -35.401092529296875, "global_step": 56183, "epoch": 464} {"train_loss": -35.2866096496582, "global_step": 56184, "epoch": 464} {"train_loss": -34.8003044128418, "global_step": 56185, "epoch": 464} {"train_loss": -34.65004348754883, "global_step": 56186, "epoch": 464} {"train_loss": -34.92049789428711, "global_step": 56187, "epoch": 464} {"train_loss": -35.42580032348633, "global_step": 56188, "epoch": 464} {"train_loss": -34.09783935546875, "global_step": 56189, "epoch": 464} {"train_loss": -34.60287094116211, "global_step": 56190, "epoch": 464} {"train_loss": -34.66015625, "global_step": 56191, "epoch": 464} {"train_loss": -35.46409225463867, "global_step": 56192, "epoch": 464} {"train_loss": -34.2049674987793, "global_step": 56193, "epoch": 464} {"train_loss": -35.104286193847656, "global_step": 56194, "epoch": 464} {"train_loss": -34.361637115478516, "global_step": 56195, "epoch": 464} {"train_loss": -34.994144439697266, "global_step": 56196, "epoch": 464} {"train_loss": -35.419795989990234, "global_step": 56197, "epoch": 464} {"train_loss": -35.2097282409668, "global_step": 56198, "epoch": 464} {"train_loss": -34.899078369140625, "global_step": 56199, "epoch": 464} {"train_loss": -35.072547912597656, "global_step": 56200, "epoch": 464} {"train_loss": -34.986019134521484, "global_step": 56201, "epoch": 464} {"train_loss": -35.41333770751953, "global_step": 56202, "epoch": 464} {"train_loss": -34.83600616455078, "global_step": 56203, "epoch": 464} {"train_loss": -35.79677200317383, "global_step": 56204, "epoch": 464} {"train_loss": -34.780067443847656, "global_step": 56205, "epoch": 464} {"train_loss": -35.35152053833008, "global_step": 56206, "epoch": 464} {"train_loss": -33.89004135131836, "global_step": 56207, "epoch": 464} {"train_loss": -34.897499084472656, "global_step": 56208, "epoch": 464} {"train_loss": -34.36918258666992, "global_step": 56209, "epoch": 464} {"train_loss": -34.84774398803711, "global_step": 56210, "epoch": 464} {"train_loss": -35.077552795410156, "global_step": 56211, "epoch": 464} {"train_loss": -34.288551330566406, "global_step": 56212, "epoch": 464} {"train_loss": -35.83429718017578, "global_step": 56213, "epoch": 464} {"train_loss": -35.683013916015625, "global_step": 56214, "epoch": 464} {"train_loss": -35.108375549316406, "global_step": 56215, "epoch": 464} {"train_loss": -35.93175506591797, "global_step": 56216, "epoch": 464} {"train_loss": -34.95231246948242, "global_step": 56217, "epoch": 464} {"train_loss": -35.77194595336914, "global_step": 56218, "epoch": 464} {"train_loss": -35.813148498535156, "global_step": 56219, "epoch": 464} {"train_loss": -35.871212005615234, "global_step": 56220, "epoch": 464} {"train_loss": -35.836669921875, "global_step": 56221, "epoch": 464} {"train_loss": -36.01077651977539, "global_step": 56222, "epoch": 464} {"train_loss": -35.72266387939453, "global_step": 56223, "epoch": 464} {"train_loss": -35.982666015625, "global_step": 56224, "epoch": 464} {"train_loss": -35.21059799194336, "global_step": 56225, "epoch": 464} {"train_loss": -36.04371643066406, "global_step": 56226, "epoch": 464} {"train_loss": -35.96422576904297, "global_step": 56227, "epoch": 464} {"train_loss": -35.923763275146484, "global_step": 56228, "epoch": 464} {"train_loss": -35.52851104736328, "global_step": 56229, "epoch": 464} {"train_loss": -35.85694885253906, "global_step": 56230, "epoch": 464} {"train_loss": -36.21114730834961, "global_step": 56231, "epoch": 464} {"train_loss": -36.375545501708984, "global_step": 56232, "epoch": 464} {"train_loss": -35.55781173706055, "global_step": 56233, "epoch": 464} {"train_loss": -35.71058654785156, "global_step": 56234, "epoch": 464} {"train_loss": -36.06734085083008, "global_step": 56235, "epoch": 464} {"train_loss": -36.238975524902344, "global_step": 56236, "epoch": 464} {"train_loss": -35.575801849365234, "global_step": 56237, "epoch": 464} {"train_loss": -35.4208984375, "global_step": 56238, "epoch": 464} {"train_loss": -35.995079040527344, "global_step": 56239, "epoch": 464} {"train_loss": -36.62805938720703, "global_step": 56240, "epoch": 464} {"train_loss": -35.653446197509766, "global_step": 56241, "epoch": 464} {"train_loss": -36.07755661010742, "global_step": 56242, "epoch": 464} {"train_loss": -34.59775924682617, "global_step": 56243, "epoch": 464} {"train_loss": -35.505916595458984, "global_step": 56244, "epoch": 464} {"train_loss": -36.52871322631836, "global_step": 56245, "epoch": 464} {"train_loss": -35.853389739990234, "global_step": 56246, "epoch": 464} {"train_loss": -36.019283294677734, "global_step": 56247, "epoch": 464} {"train_loss": -35.5858039855957, "global_step": 56248, "epoch": 464} {"train_loss": -35.159481048583984, "global_step": 56249, "epoch": 464} {"train_loss": -34.40339279174805, "global_step": 56250, "epoch": 464} {"train_loss": -33.5012321472168, "global_step": 56251, "epoch": 464} {"train_loss": -34.23122787475586, "global_step": 56252, "epoch": 464} {"train_loss": -30.429838180541992, "global_step": 56253, "epoch": 464} {"train_loss": -26.00630760192871, "global_step": 56254, "epoch": 464} {"train_loss": -32.11997985839844, "global_step": 56255, "epoch": 464} {"train_loss": -34.33158493041992, "global_step": 56256, "epoch": 464} {"train_loss": -32.43046951293945, "global_step": 56257, "epoch": 464} {"train_loss": -31.084882736206055, "global_step": 56258, "epoch": 464} {"train_loss": -33.906646728515625, "global_step": 56259, "epoch": 464} {"train_loss": -32.52309036254883, "global_step": 56260, "epoch": 464} {"train_loss": -33.68933868408203, "global_step": 56261, "epoch": 464} {"train_loss": -32.572418212890625, "global_step": 56262, "epoch": 464} {"train_loss": -33.66378402709961, "global_step": 56263, "epoch": 464} {"train_loss": -34.4613731951753, "global_step": 56264, "epoch": 464, "val_loss": 2595275.5} {"train_loss": -33.45756912231445, "global_step": 56265, "epoch": 465} {"train_loss": -31.18305015563965, "global_step": 56266, "epoch": 465} {"train_loss": -32.47470474243164, "global_step": 56267, "epoch": 465} {"train_loss": -33.6411018371582, "global_step": 56268, "epoch": 465} {"train_loss": -33.6489372253418, "global_step": 56269, "epoch": 465} {"train_loss": -34.026214599609375, "global_step": 56270, "epoch": 465} {"train_loss": -33.065677642822266, "global_step": 56271, "epoch": 465} {"train_loss": -30.643980026245117, "global_step": 56272, "epoch": 465} {"train_loss": -34.33414840698242, "global_step": 56273, "epoch": 465} {"train_loss": -33.679595947265625, "global_step": 56274, "epoch": 465} {"train_loss": -32.86832809448242, "global_step": 56275, "epoch": 465} {"train_loss": -33.48649978637695, "global_step": 56276, "epoch": 465} {"train_loss": -34.114402770996094, "global_step": 56277, "epoch": 465} {"train_loss": -34.20580291748047, "global_step": 56278, "epoch": 465} {"train_loss": -34.568519592285156, "global_step": 56279, "epoch": 465} {"train_loss": -34.08832931518555, "global_step": 56280, "epoch": 465} {"train_loss": -34.581050872802734, "global_step": 56281, "epoch": 465} {"train_loss": -33.84159469604492, "global_step": 56282, "epoch": 465} {"train_loss": -34.56808853149414, "global_step": 56283, "epoch": 465} {"train_loss": -34.5897216796875, "global_step": 56284, "epoch": 465} {"train_loss": -32.52299880981445, "global_step": 56285, "epoch": 465} {"train_loss": -33.63045883178711, "global_step": 56286, "epoch": 465} {"train_loss": -34.52787399291992, "global_step": 56287, "epoch": 465} {"train_loss": -34.288394927978516, "global_step": 56288, "epoch": 465} {"train_loss": -34.47249221801758, "global_step": 56289, "epoch": 465} {"train_loss": -34.895965576171875, "global_step": 56290, "epoch": 465} {"train_loss": -35.184600830078125, "global_step": 56291, "epoch": 465} {"train_loss": -34.85575485229492, "global_step": 56292, "epoch": 465} {"train_loss": -34.62301254272461, "global_step": 56293, "epoch": 465} {"train_loss": -35.0865592956543, "global_step": 56294, "epoch": 465} {"train_loss": -35.08747482299805, "global_step": 56295, "epoch": 465} {"train_loss": -34.82197952270508, "global_step": 56296, "epoch": 465} {"train_loss": -34.908302307128906, "global_step": 56297, "epoch": 465} {"train_loss": -34.95448303222656, "global_step": 56298, "epoch": 465} {"train_loss": -35.02090072631836, "global_step": 56299, "epoch": 465} {"train_loss": -35.32782745361328, "global_step": 56300, "epoch": 465} {"train_loss": -35.36972427368164, "global_step": 56301, "epoch": 465} {"train_loss": -35.47576904296875, "global_step": 56302, "epoch": 465} {"train_loss": -35.221309661865234, "global_step": 56303, "epoch": 465} {"train_loss": -35.49338150024414, "global_step": 56304, "epoch": 465} {"train_loss": -35.55451583862305, "global_step": 56305, "epoch": 465} {"train_loss": -35.83210754394531, "global_step": 56306, "epoch": 465} {"train_loss": -35.98899459838867, "global_step": 56307, "epoch": 465} {"train_loss": -35.38778305053711, "global_step": 56308, "epoch": 465} {"train_loss": -35.32787322998047, "global_step": 56309, "epoch": 465} {"train_loss": -35.773414611816406, "global_step": 56310, "epoch": 465} {"train_loss": -35.89065170288086, "global_step": 56311, "epoch": 465} {"train_loss": -34.53965377807617, "global_step": 56312, "epoch": 465} {"train_loss": -35.98772430419922, "global_step": 56313, "epoch": 465} {"train_loss": -35.4936408996582, "global_step": 56314, "epoch": 465} {"train_loss": -35.93470001220703, "global_step": 56315, "epoch": 465} {"train_loss": -35.99079132080078, "global_step": 56316, "epoch": 465} {"train_loss": -35.60322189331055, "global_step": 56317, "epoch": 465} {"train_loss": -36.089210510253906, "global_step": 56318, "epoch": 465} {"train_loss": -35.90211486816406, "global_step": 56319, "epoch": 465} {"train_loss": -36.35367965698242, "global_step": 56320, "epoch": 465} {"train_loss": -35.94599533081055, "global_step": 56321, "epoch": 465} {"train_loss": -36.41276550292969, "global_step": 56322, "epoch": 465} {"train_loss": -35.85004425048828, "global_step": 56323, "epoch": 465} {"train_loss": -36.19059371948242, "global_step": 56324, "epoch": 465} {"train_loss": -36.147071838378906, "global_step": 56325, "epoch": 465} {"train_loss": -35.497859954833984, "global_step": 56326, "epoch": 465} {"train_loss": -36.207942962646484, "global_step": 56327, "epoch": 465} {"train_loss": -36.390323638916016, "global_step": 56328, "epoch": 465} {"train_loss": -36.003292083740234, "global_step": 56329, "epoch": 465} {"train_loss": -36.39815139770508, "global_step": 56330, "epoch": 465} {"train_loss": -36.1424674987793, "global_step": 56331, "epoch": 465} {"train_loss": -36.74395751953125, "global_step": 56332, "epoch": 465} {"train_loss": -36.65462112426758, "global_step": 56333, "epoch": 465} {"train_loss": -36.498348236083984, "global_step": 56334, "epoch": 465} {"train_loss": -36.144989013671875, "global_step": 56335, "epoch": 465} {"train_loss": -36.18315505981445, "global_step": 56336, "epoch": 465} {"train_loss": -36.90275955200195, "global_step": 56337, "epoch": 465} {"train_loss": -34.982940673828125, "global_step": 56338, "epoch": 465} {"train_loss": -36.55857467651367, "global_step": 56339, "epoch": 465} {"train_loss": -35.966522216796875, "global_step": 56340, "epoch": 465} {"train_loss": -35.851165771484375, "global_step": 56341, "epoch": 465} {"train_loss": -36.78178787231445, "global_step": 56342, "epoch": 465} {"train_loss": -36.57072830200195, "global_step": 56343, "epoch": 465} {"train_loss": -36.4640007019043, "global_step": 56344, "epoch": 465} {"train_loss": -36.727657318115234, "global_step": 56345, "epoch": 465} {"train_loss": -36.73997116088867, "global_step": 56346, "epoch": 465} {"train_loss": -36.91389846801758, "global_step": 56347, "epoch": 465} {"train_loss": -36.15486526489258, "global_step": 56348, "epoch": 465} {"train_loss": -36.387691497802734, "global_step": 56349, "epoch": 465} {"train_loss": -37.07670974731445, "global_step": 56350, "epoch": 465} {"train_loss": -36.4699821472168, "global_step": 56351, "epoch": 465} {"train_loss": -36.36488342285156, "global_step": 56352, "epoch": 465} {"train_loss": -36.13874435424805, "global_step": 56353, "epoch": 465} {"train_loss": -36.401222229003906, "global_step": 56354, "epoch": 465} {"train_loss": -36.87226104736328, "global_step": 56355, "epoch": 465} {"train_loss": -36.51239013671875, "global_step": 56356, "epoch": 465} {"train_loss": -35.45088577270508, "global_step": 56357, "epoch": 465} {"train_loss": -36.24348831176758, "global_step": 56358, "epoch": 465} {"train_loss": -35.65902328491211, "global_step": 56359, "epoch": 465} {"train_loss": -35.32906723022461, "global_step": 56360, "epoch": 465} {"train_loss": -33.37302780151367, "global_step": 56361, "epoch": 465} {"train_loss": -33.491817474365234, "global_step": 56362, "epoch": 465} {"train_loss": -32.379737854003906, "global_step": 56363, "epoch": 465} {"train_loss": -30.95026969909668, "global_step": 56364, "epoch": 465} {"train_loss": -31.4006404876709, "global_step": 56365, "epoch": 465} {"train_loss": -31.160261154174805, "global_step": 56366, "epoch": 465} {"train_loss": -33.41748809814453, "global_step": 56367, "epoch": 465} {"train_loss": -31.880523681640625, "global_step": 56368, "epoch": 465} {"train_loss": -28.500640869140625, "global_step": 56369, "epoch": 465} {"train_loss": -30.292856216430664, "global_step": 56370, "epoch": 465} {"train_loss": -33.34328842163086, "global_step": 56371, "epoch": 465} {"train_loss": -30.684350967407227, "global_step": 56372, "epoch": 465} {"train_loss": -34.71639633178711, "global_step": 56373, "epoch": 465} {"train_loss": -31.486072540283203, "global_step": 56374, "epoch": 465} {"train_loss": -33.75165939331055, "global_step": 56375, "epoch": 465} {"train_loss": -33.1939811706543, "global_step": 56376, "epoch": 465} {"train_loss": -35.281002044677734, "global_step": 56377, "epoch": 465} {"train_loss": -34.2286491394043, "global_step": 56378, "epoch": 465} {"train_loss": -33.94364929199219, "global_step": 56379, "epoch": 465} {"train_loss": -34.999061584472656, "global_step": 56380, "epoch": 465} {"train_loss": -34.88783264160156, "global_step": 56381, "epoch": 465} {"train_loss": -34.50527572631836, "global_step": 56382, "epoch": 465} {"train_loss": -33.976966857910156, "global_step": 56383, "epoch": 465} {"train_loss": -34.07619094848633, "global_step": 56384, "epoch": 465} {"train_loss": -34.82889971457237, "global_step": 56385, "epoch": 465, "val_loss": 2551647.25} {"train_loss": -35.710487365722656, "global_step": 56386, "epoch": 466} {"train_loss": -34.048397064208984, "global_step": 56387, "epoch": 466} {"train_loss": -34.74253463745117, "global_step": 56388, "epoch": 466} {"train_loss": -33.51333236694336, "global_step": 56389, "epoch": 466} {"train_loss": -35.0801887512207, "global_step": 56390, "epoch": 466} {"train_loss": -34.92959976196289, "global_step": 56391, "epoch": 466} {"train_loss": -35.47439193725586, "global_step": 56392, "epoch": 466} {"train_loss": -35.589847564697266, "global_step": 56393, "epoch": 466} {"train_loss": -35.23937225341797, "global_step": 56394, "epoch": 466} {"train_loss": -35.18070602416992, "global_step": 56395, "epoch": 466} {"train_loss": -34.94224548339844, "global_step": 56396, "epoch": 466} {"train_loss": -35.11882019042969, "global_step": 56397, "epoch": 466} {"train_loss": -35.07969284057617, "global_step": 56398, "epoch": 466} {"train_loss": -33.815406799316406, "global_step": 56399, "epoch": 466} {"train_loss": -34.189083099365234, "global_step": 56400, "epoch": 466} {"train_loss": -34.52486801147461, "global_step": 56401, "epoch": 466} {"train_loss": -34.60787582397461, "global_step": 56402, "epoch": 466} {"train_loss": -35.31516647338867, "global_step": 56403, "epoch": 466} {"train_loss": -34.51839828491211, "global_step": 56404, "epoch": 466} {"train_loss": -35.438961029052734, "global_step": 56405, "epoch": 466} {"train_loss": -35.232948303222656, "global_step": 56406, "epoch": 466} {"train_loss": -35.30575180053711, "global_step": 56407, "epoch": 466} {"train_loss": -34.61151885986328, "global_step": 56408, "epoch": 466} {"train_loss": -35.17681121826172, "global_step": 56409, "epoch": 466} {"train_loss": -35.36775588989258, "global_step": 56410, "epoch": 466} {"train_loss": -34.37168502807617, "global_step": 56411, "epoch": 466} {"train_loss": -33.63745880126953, "global_step": 56412, "epoch": 466} {"train_loss": -35.201045989990234, "global_step": 56413, "epoch": 466} {"train_loss": -34.84774398803711, "global_step": 56414, "epoch": 466} {"train_loss": -34.89349365234375, "global_step": 56415, "epoch": 466} {"train_loss": -35.14658737182617, "global_step": 56416, "epoch": 466} {"train_loss": -35.38011169433594, "global_step": 56417, "epoch": 466} {"train_loss": -35.635406494140625, "global_step": 56418, "epoch": 466} {"train_loss": -35.45670700073242, "global_step": 56419, "epoch": 466} {"train_loss": -35.05129623413086, "global_step": 56420, "epoch": 466} {"train_loss": -35.25925827026367, "global_step": 56421, "epoch": 466} {"train_loss": -35.32625198364258, "global_step": 56422, "epoch": 466} {"train_loss": -35.2418212890625, "global_step": 56423, "epoch": 466} {"train_loss": -35.52254867553711, "global_step": 56424, "epoch": 466} {"train_loss": -34.014137268066406, "global_step": 56425, "epoch": 466} {"train_loss": -33.17837142944336, "global_step": 56426, "epoch": 466} {"train_loss": -31.794260025024414, "global_step": 56427, "epoch": 466} {"train_loss": -31.55230140686035, "global_step": 56428, "epoch": 466} {"train_loss": -32.116756439208984, "global_step": 56429, "epoch": 466} {"train_loss": -35.231536865234375, "global_step": 56430, "epoch": 466} {"train_loss": -35.9969596862793, "global_step": 56431, "epoch": 466} {"train_loss": -33.91132736206055, "global_step": 56432, "epoch": 466} {"train_loss": -34.755001068115234, "global_step": 56433, "epoch": 466} {"train_loss": -36.11416244506836, "global_step": 56434, "epoch": 466} {"train_loss": -35.06864547729492, "global_step": 56435, "epoch": 466} {"train_loss": -35.81622314453125, "global_step": 56436, "epoch": 466} {"train_loss": -35.83405685424805, "global_step": 56437, "epoch": 466} {"train_loss": -36.05950164794922, "global_step": 56438, "epoch": 466} {"train_loss": -36.08694839477539, "global_step": 56439, "epoch": 466} {"train_loss": -36.199974060058594, "global_step": 56440, "epoch": 466} {"train_loss": -36.314697265625, "global_step": 56441, "epoch": 466} {"train_loss": -36.29960250854492, "global_step": 56442, "epoch": 466} {"train_loss": -36.043792724609375, "global_step": 56443, "epoch": 466} {"train_loss": -35.69014358520508, "global_step": 56444, "epoch": 466} {"train_loss": -36.33512496948242, "global_step": 56445, "epoch": 466} {"train_loss": -35.917579650878906, "global_step": 56446, "epoch": 466} {"train_loss": -36.5096435546875, "global_step": 56447, "epoch": 466} {"train_loss": -36.32780456542969, "global_step": 56448, "epoch": 466} {"train_loss": -36.44983673095703, "global_step": 56449, "epoch": 466} {"train_loss": -35.88926315307617, "global_step": 56450, "epoch": 466} {"train_loss": -36.15471649169922, "global_step": 56451, "epoch": 466} {"train_loss": -36.3513069152832, "global_step": 56452, "epoch": 466} {"train_loss": -36.984676361083984, "global_step": 56453, "epoch": 466} {"train_loss": -36.36396408081055, "global_step": 56454, "epoch": 466} {"train_loss": -36.53116989135742, "global_step": 56455, "epoch": 466} {"train_loss": -36.87186050415039, "global_step": 56456, "epoch": 466} {"train_loss": -36.68852615356445, "global_step": 56457, "epoch": 466} {"train_loss": -36.53098678588867, "global_step": 56458, "epoch": 466} {"train_loss": -35.21662521362305, "global_step": 56459, "epoch": 466} {"train_loss": -33.23089599609375, "global_step": 56460, "epoch": 466} {"train_loss": -29.692716598510742, "global_step": 56461, "epoch": 466} {"train_loss": -26.7529354095459, "global_step": 56462, "epoch": 466} {"train_loss": -28.33649253845215, "global_step": 56463, "epoch": 466} {"train_loss": -35.9488410949707, "global_step": 56464, "epoch": 466} {"train_loss": -32.0091552734375, "global_step": 56465, "epoch": 466} {"train_loss": -31.158145904541016, "global_step": 56466, "epoch": 466} {"train_loss": -35.1908073425293, "global_step": 56467, "epoch": 466} {"train_loss": -31.927204132080078, "global_step": 56468, "epoch": 466} {"train_loss": -35.599552154541016, "global_step": 56469, "epoch": 466} {"train_loss": -33.15091323852539, "global_step": 56470, "epoch": 466} {"train_loss": -35.789794921875, "global_step": 56471, "epoch": 466} {"train_loss": -34.43745040893555, "global_step": 56472, "epoch": 466} {"train_loss": -35.593379974365234, "global_step": 56473, "epoch": 466} {"train_loss": -36.160945892333984, "global_step": 56474, "epoch": 466} {"train_loss": -35.31667709350586, "global_step": 56475, "epoch": 466} {"train_loss": -35.87272262573242, "global_step": 56476, "epoch": 466} {"train_loss": -35.135494232177734, "global_step": 56477, "epoch": 466} {"train_loss": -34.93132781982422, "global_step": 56478, "epoch": 466} {"train_loss": -35.53554153442383, "global_step": 56479, "epoch": 466} {"train_loss": -35.95489501953125, "global_step": 56480, "epoch": 466} {"train_loss": -35.60774612426758, "global_step": 56481, "epoch": 466} {"train_loss": -35.951229095458984, "global_step": 56482, "epoch": 466} {"train_loss": -35.69886016845703, "global_step": 56483, "epoch": 466} {"train_loss": -35.70580291748047, "global_step": 56484, "epoch": 466} {"train_loss": -35.95783615112305, "global_step": 56485, "epoch": 466} {"train_loss": -35.495548248291016, "global_step": 56486, "epoch": 466} {"train_loss": -36.217220306396484, "global_step": 56487, "epoch": 466} {"train_loss": -36.4819450378418, "global_step": 56488, "epoch": 466} {"train_loss": -36.256439208984375, "global_step": 56489, "epoch": 466} {"train_loss": -36.607391357421875, "global_step": 56490, "epoch": 466} {"train_loss": -36.015071868896484, "global_step": 56491, "epoch": 466} {"train_loss": -36.14335250854492, "global_step": 56492, "epoch": 466} {"train_loss": -36.444976806640625, "global_step": 56493, "epoch": 466} {"train_loss": -36.456424713134766, "global_step": 56494, "epoch": 466} {"train_loss": -36.65604019165039, "global_step": 56495, "epoch": 466} {"train_loss": -36.615264892578125, "global_step": 56496, "epoch": 466} {"train_loss": -35.59981155395508, "global_step": 56497, "epoch": 466} {"train_loss": -36.571170806884766, "global_step": 56498, "epoch": 466} {"train_loss": -36.18891525268555, "global_step": 56499, "epoch": 466} {"train_loss": -36.584312438964844, "global_step": 56500, "epoch": 466} {"train_loss": -37.01080322265625, "global_step": 56501, "epoch": 466} {"train_loss": -36.387969970703125, "global_step": 56502, "epoch": 466} {"train_loss": -36.52440643310547, "global_step": 56503, "epoch": 466} {"train_loss": -36.138118743896484, "global_step": 56504, "epoch": 466} {"train_loss": -36.238685607910156, "global_step": 56505, "epoch": 466} {"train_loss": -35.175647057777596, "global_step": 56506, "epoch": 466, "val_loss": 2505784.0} {"train_loss": -36.273681640625, "global_step": 56507, "epoch": 467} {"train_loss": -35.605743408203125, "global_step": 56508, "epoch": 467} {"train_loss": -36.2712516784668, "global_step": 56509, "epoch": 467} {"train_loss": -36.37425231933594, "global_step": 56510, "epoch": 467} {"train_loss": -36.76322937011719, "global_step": 56511, "epoch": 467} {"train_loss": -36.25821304321289, "global_step": 56512, "epoch": 467} {"train_loss": -36.423728942871094, "global_step": 56513, "epoch": 467} {"train_loss": -36.52606964111328, "global_step": 56514, "epoch": 467} {"train_loss": -36.757328033447266, "global_step": 56515, "epoch": 467} {"train_loss": -35.97193145751953, "global_step": 56516, "epoch": 467} {"train_loss": -36.375244140625, "global_step": 56517, "epoch": 467} {"train_loss": -35.8337516784668, "global_step": 56518, "epoch": 467} {"train_loss": -36.59999084472656, "global_step": 56519, "epoch": 467} {"train_loss": -36.07562255859375, "global_step": 56520, "epoch": 467} {"train_loss": -36.11445617675781, "global_step": 56521, "epoch": 467} {"train_loss": -34.52227783203125, "global_step": 56522, "epoch": 467} {"train_loss": -32.60067367553711, "global_step": 56523, "epoch": 467} {"train_loss": -31.043439865112305, "global_step": 56524, "epoch": 467} {"train_loss": -29.876174926757812, "global_step": 56525, "epoch": 467} {"train_loss": -27.348804473876953, "global_step": 56526, "epoch": 467} {"train_loss": -23.310293197631836, "global_step": 56527, "epoch": 467} {"train_loss": -30.330488204956055, "global_step": 56528, "epoch": 467} {"train_loss": -32.93038558959961, "global_step": 56529, "epoch": 467} {"train_loss": -30.57582664489746, "global_step": 56530, "epoch": 467} {"train_loss": -35.69427490234375, "global_step": 56531, "epoch": 467} {"train_loss": -30.608184814453125, "global_step": 56532, "epoch": 467} {"train_loss": -35.24483871459961, "global_step": 56533, "epoch": 467} {"train_loss": -32.33933639526367, "global_step": 56534, "epoch": 467} {"train_loss": -34.89484786987305, "global_step": 56535, "epoch": 467} {"train_loss": -32.21123504638672, "global_step": 56536, "epoch": 467} {"train_loss": -35.00715255737305, "global_step": 56537, "epoch": 467} {"train_loss": -32.786415100097656, "global_step": 56538, "epoch": 467} {"train_loss": -34.93378829956055, "global_step": 56539, "epoch": 467} {"train_loss": -34.9351921081543, "global_step": 56540, "epoch": 467} {"train_loss": -34.03791427612305, "global_step": 56541, "epoch": 467} {"train_loss": -35.20759582519531, "global_step": 56542, "epoch": 467} {"train_loss": -33.2878532409668, "global_step": 56543, "epoch": 467} {"train_loss": -34.729000091552734, "global_step": 56544, "epoch": 467} {"train_loss": -35.71017074584961, "global_step": 56545, "epoch": 467} {"train_loss": -33.98143005371094, "global_step": 56546, "epoch": 467} {"train_loss": -35.045406341552734, "global_step": 56547, "epoch": 467} {"train_loss": -35.92302322387695, "global_step": 56548, "epoch": 467} {"train_loss": -34.434120178222656, "global_step": 56549, "epoch": 467} {"train_loss": -34.973960876464844, "global_step": 56550, "epoch": 467} {"train_loss": -35.53583908081055, "global_step": 56551, "epoch": 467} {"train_loss": -35.76800537109375, "global_step": 56552, "epoch": 467} {"train_loss": -34.27968215942383, "global_step": 56553, "epoch": 467} {"train_loss": -34.895408630371094, "global_step": 56554, "epoch": 467} {"train_loss": -34.4992790222168, "global_step": 56555, "epoch": 467} {"train_loss": -35.03466796875, "global_step": 56556, "epoch": 467} {"train_loss": -34.61697769165039, "global_step": 56557, "epoch": 467} {"train_loss": -35.13996887207031, "global_step": 56558, "epoch": 467} {"train_loss": -35.12932205200195, "global_step": 56559, "epoch": 467} {"train_loss": -34.488243103027344, "global_step": 56560, "epoch": 467} {"train_loss": -34.534637451171875, "global_step": 56561, "epoch": 467} {"train_loss": -35.30144500732422, "global_step": 56562, "epoch": 467} {"train_loss": -35.846824645996094, "global_step": 56563, "epoch": 467} {"train_loss": -35.3575553894043, "global_step": 56564, "epoch": 467} {"train_loss": -34.23629379272461, "global_step": 56565, "epoch": 467} {"train_loss": -35.11002731323242, "global_step": 56566, "epoch": 467} {"train_loss": -35.35427474975586, "global_step": 56567, "epoch": 467} {"train_loss": -36.0044059753418, "global_step": 56568, "epoch": 467} {"train_loss": -35.441036224365234, "global_step": 56569, "epoch": 467} {"train_loss": -36.34810256958008, "global_step": 56570, "epoch": 467} {"train_loss": -35.60215377807617, "global_step": 56571, "epoch": 467} {"train_loss": -35.14373779296875, "global_step": 56572, "epoch": 467} {"train_loss": -35.127296447753906, "global_step": 56573, "epoch": 467} {"train_loss": -34.945369720458984, "global_step": 56574, "epoch": 467} {"train_loss": -36.333255767822266, "global_step": 56575, "epoch": 467} {"train_loss": -35.61143112182617, "global_step": 56576, "epoch": 467} {"train_loss": -36.147216796875, "global_step": 56577, "epoch": 467} {"train_loss": -35.926063537597656, "global_step": 56578, "epoch": 467} {"train_loss": -36.585365295410156, "global_step": 56579, "epoch": 467} {"train_loss": -36.23016357421875, "global_step": 56580, "epoch": 467} {"train_loss": -35.548828125, "global_step": 56581, "epoch": 467} {"train_loss": -36.166934967041016, "global_step": 56582, "epoch": 467} {"train_loss": -36.29758834838867, "global_step": 56583, "epoch": 467} {"train_loss": -35.6055908203125, "global_step": 56584, "epoch": 467} {"train_loss": -36.27328109741211, "global_step": 56585, "epoch": 467} {"train_loss": -36.03277587890625, "global_step": 56586, "epoch": 467} {"train_loss": -36.1838264465332, "global_step": 56587, "epoch": 467} {"train_loss": -35.959228515625, "global_step": 56588, "epoch": 467} {"train_loss": -35.97397994995117, "global_step": 56589, "epoch": 467} {"train_loss": -35.997535705566406, "global_step": 56590, "epoch": 467} {"train_loss": -36.43515396118164, "global_step": 56591, "epoch": 467} {"train_loss": -35.741493225097656, "global_step": 56592, "epoch": 467} {"train_loss": -35.77651596069336, "global_step": 56593, "epoch": 467} {"train_loss": -35.816017150878906, "global_step": 56594, "epoch": 467} {"train_loss": -35.14397430419922, "global_step": 56595, "epoch": 467} {"train_loss": -35.09044647216797, "global_step": 56596, "epoch": 467} {"train_loss": -35.45199203491211, "global_step": 56597, "epoch": 467} {"train_loss": -35.939659118652344, "global_step": 56598, "epoch": 467} {"train_loss": -36.41148376464844, "global_step": 56599, "epoch": 467} {"train_loss": -36.38248825073242, "global_step": 56600, "epoch": 467} {"train_loss": -34.06592559814453, "global_step": 56601, "epoch": 467} {"train_loss": -36.09850311279297, "global_step": 56602, "epoch": 467} {"train_loss": -36.612403869628906, "global_step": 56603, "epoch": 467} {"train_loss": -35.097042083740234, "global_step": 56604, "epoch": 467} {"train_loss": -35.065711975097656, "global_step": 56605, "epoch": 467} {"train_loss": -36.05967330932617, "global_step": 56606, "epoch": 467} {"train_loss": -35.58819580078125, "global_step": 56607, "epoch": 467} {"train_loss": -35.844085693359375, "global_step": 56608, "epoch": 467} {"train_loss": -35.43709945678711, "global_step": 56609, "epoch": 467} {"train_loss": -35.592159271240234, "global_step": 56610, "epoch": 467} {"train_loss": -35.25593185424805, "global_step": 56611, "epoch": 467} {"train_loss": -36.5060920715332, "global_step": 56612, "epoch": 467} {"train_loss": -35.57964324951172, "global_step": 56613, "epoch": 467} {"train_loss": -36.281768798828125, "global_step": 56614, "epoch": 467} {"train_loss": -34.31769561767578, "global_step": 56615, "epoch": 467} {"train_loss": -35.03355026245117, "global_step": 56616, "epoch": 467} {"train_loss": -35.65613555908203, "global_step": 56617, "epoch": 467} {"train_loss": -36.01823806762695, "global_step": 56618, "epoch": 467} {"train_loss": -34.19921112060547, "global_step": 56619, "epoch": 467} {"train_loss": -35.50117874145508, "global_step": 56620, "epoch": 467} {"train_loss": -34.994361877441406, "global_step": 56621, "epoch": 467} {"train_loss": -33.16431427001953, "global_step": 56622, "epoch": 467} {"train_loss": -34.624176025390625, "global_step": 56623, "epoch": 467} {"train_loss": -32.256263732910156, "global_step": 56624, "epoch": 467} {"train_loss": -33.099700927734375, "global_step": 56625, "epoch": 467} {"train_loss": -33.3623161315918, "global_step": 56626, "epoch": 467} {"train_loss": -34.931478705287965, "global_step": 56627, "epoch": 467, "val_loss": 2425240.0} {"train_loss": -34.74620819091797, "global_step": 56628, "epoch": 468} {"train_loss": -34.037532806396484, "global_step": 56629, "epoch": 468} {"train_loss": -35.16295623779297, "global_step": 56630, "epoch": 468} {"train_loss": -35.052391052246094, "global_step": 56631, "epoch": 468} {"train_loss": -35.49276351928711, "global_step": 56632, "epoch": 468} {"train_loss": -34.05704879760742, "global_step": 56633, "epoch": 468} {"train_loss": -36.14654541015625, "global_step": 56634, "epoch": 468} {"train_loss": -35.233116149902344, "global_step": 56635, "epoch": 468} {"train_loss": -35.84660720825195, "global_step": 56636, "epoch": 468} {"train_loss": -35.49406051635742, "global_step": 56637, "epoch": 468} {"train_loss": -35.175960540771484, "global_step": 56638, "epoch": 468} {"train_loss": -36.21672439575195, "global_step": 56639, "epoch": 468} {"train_loss": -35.9258918762207, "global_step": 56640, "epoch": 468} {"train_loss": -35.98896408081055, "global_step": 56641, "epoch": 468} {"train_loss": -35.42603302001953, "global_step": 56642, "epoch": 468} {"train_loss": -35.313846588134766, "global_step": 56643, "epoch": 468} {"train_loss": -35.844722747802734, "global_step": 56644, "epoch": 468} {"train_loss": -35.768592834472656, "global_step": 56645, "epoch": 468} {"train_loss": -36.38206100463867, "global_step": 56646, "epoch": 468} {"train_loss": -35.6995735168457, "global_step": 56647, "epoch": 468} {"train_loss": -36.079647064208984, "global_step": 56648, "epoch": 468} {"train_loss": -35.69329833984375, "global_step": 56649, "epoch": 468} {"train_loss": -36.0546989440918, "global_step": 56650, "epoch": 468} {"train_loss": -36.14376449584961, "global_step": 56651, "epoch": 468} {"train_loss": -35.17259979248047, "global_step": 56652, "epoch": 468} {"train_loss": -36.20203399658203, "global_step": 56653, "epoch": 468} {"train_loss": -36.12984085083008, "global_step": 56654, "epoch": 468} {"train_loss": -36.15359878540039, "global_step": 56655, "epoch": 468} {"train_loss": -35.006446838378906, "global_step": 56656, "epoch": 468} {"train_loss": -36.34368896484375, "global_step": 56657, "epoch": 468} {"train_loss": -35.48086166381836, "global_step": 56658, "epoch": 468} {"train_loss": -35.60142135620117, "global_step": 56659, "epoch": 468} {"train_loss": -35.2159309387207, "global_step": 56660, "epoch": 468} {"train_loss": -35.643280029296875, "global_step": 56661, "epoch": 468} {"train_loss": -36.384193420410156, "global_step": 56662, "epoch": 468} {"train_loss": -36.188331604003906, "global_step": 56663, "epoch": 468} {"train_loss": -36.57268524169922, "global_step": 56664, "epoch": 468} {"train_loss": -36.565120697021484, "global_step": 56665, "epoch": 468} {"train_loss": -36.356109619140625, "global_step": 56666, "epoch": 468} {"train_loss": -36.3156852722168, "global_step": 56667, "epoch": 468} {"train_loss": -35.87673568725586, "global_step": 56668, "epoch": 468} {"train_loss": -36.839256286621094, "global_step": 56669, "epoch": 468} {"train_loss": -36.15528106689453, "global_step": 56670, "epoch": 468} {"train_loss": -36.31856918334961, "global_step": 56671, "epoch": 468} {"train_loss": -36.83951950073242, "global_step": 56672, "epoch": 468} {"train_loss": -36.49192428588867, "global_step": 56673, "epoch": 468} {"train_loss": -36.40098190307617, "global_step": 56674, "epoch": 468} {"train_loss": -36.02518844604492, "global_step": 56675, "epoch": 468} {"train_loss": -35.99567794799805, "global_step": 56676, "epoch": 468} {"train_loss": -36.16698455810547, "global_step": 56677, "epoch": 468} {"train_loss": -36.87850570678711, "global_step": 56678, "epoch": 468} {"train_loss": -35.78944396972656, "global_step": 56679, "epoch": 468} {"train_loss": -36.590423583984375, "global_step": 56680, "epoch": 468} {"train_loss": -36.53047561645508, "global_step": 56681, "epoch": 468} {"train_loss": -36.25401306152344, "global_step": 56682, "epoch": 468} {"train_loss": -36.36945724487305, "global_step": 56683, "epoch": 468} {"train_loss": -36.14600372314453, "global_step": 56684, "epoch": 468} {"train_loss": -36.11548614501953, "global_step": 56685, "epoch": 468} {"train_loss": -36.59160614013672, "global_step": 56686, "epoch": 468} {"train_loss": -34.84299850463867, "global_step": 56687, "epoch": 468} {"train_loss": -33.114498138427734, "global_step": 56688, "epoch": 468} {"train_loss": -35.911041259765625, "global_step": 56689, "epoch": 468} {"train_loss": -35.965789794921875, "global_step": 56690, "epoch": 468} {"train_loss": -36.747318267822266, "global_step": 56691, "epoch": 468} {"train_loss": -36.623291015625, "global_step": 56692, "epoch": 468} {"train_loss": -34.99319839477539, "global_step": 56693, "epoch": 468} {"train_loss": -36.35270309448242, "global_step": 56694, "epoch": 468} {"train_loss": -36.449214935302734, "global_step": 56695, "epoch": 468} {"train_loss": -36.722145080566406, "global_step": 56696, "epoch": 468} {"train_loss": -36.07136154174805, "global_step": 56697, "epoch": 468} {"train_loss": -36.6658821105957, "global_step": 56698, "epoch": 468} {"train_loss": -36.20598602294922, "global_step": 56699, "epoch": 468} {"train_loss": -36.15892028808594, "global_step": 56700, "epoch": 468} {"train_loss": -34.78242111206055, "global_step": 56701, "epoch": 468} {"train_loss": -35.84128952026367, "global_step": 56702, "epoch": 468} {"train_loss": -35.31011962890625, "global_step": 56703, "epoch": 468} {"train_loss": -35.8234977722168, "global_step": 56704, "epoch": 468} {"train_loss": -36.30531692504883, "global_step": 56705, "epoch": 468} {"train_loss": -33.01580810546875, "global_step": 56706, "epoch": 468} {"train_loss": -33.39638900756836, "global_step": 56707, "epoch": 468} {"train_loss": -32.43766403198242, "global_step": 56708, "epoch": 468} {"train_loss": -35.754638671875, "global_step": 56709, "epoch": 468} {"train_loss": -31.225305557250977, "global_step": 56710, "epoch": 468} {"train_loss": -33.675811767578125, "global_step": 56711, "epoch": 468} {"train_loss": -31.454715728759766, "global_step": 56712, "epoch": 468} {"train_loss": -34.41950607299805, "global_step": 56713, "epoch": 468} {"train_loss": -28.96442222595215, "global_step": 56714, "epoch": 468} {"train_loss": -36.23942184448242, "global_step": 56715, "epoch": 468} {"train_loss": -31.372190475463867, "global_step": 56716, "epoch": 468} {"train_loss": -34.51191329956055, "global_step": 56717, "epoch": 468} {"train_loss": -35.239376068115234, "global_step": 56718, "epoch": 468} {"train_loss": -31.865894317626953, "global_step": 56719, "epoch": 468} {"train_loss": -35.126277923583984, "global_step": 56720, "epoch": 468} {"train_loss": -33.41840362548828, "global_step": 56721, "epoch": 468} {"train_loss": -34.12740707397461, "global_step": 56722, "epoch": 468} {"train_loss": -35.26888656616211, "global_step": 56723, "epoch": 468} {"train_loss": -34.7624626159668, "global_step": 56724, "epoch": 468} {"train_loss": -35.009769439697266, "global_step": 56725, "epoch": 468} {"train_loss": -35.047096252441406, "global_step": 56726, "epoch": 468} {"train_loss": -33.58714294433594, "global_step": 56727, "epoch": 468} {"train_loss": -34.457069396972656, "global_step": 56728, "epoch": 468} {"train_loss": -35.41302490234375, "global_step": 56729, "epoch": 468} {"train_loss": -35.0964469909668, "global_step": 56730, "epoch": 468} {"train_loss": -33.79240036010742, "global_step": 56731, "epoch": 468} {"train_loss": -35.71547317504883, "global_step": 56732, "epoch": 468} {"train_loss": -34.77279281616211, "global_step": 56733, "epoch": 468} {"train_loss": -34.77204513549805, "global_step": 56734, "epoch": 468} {"train_loss": -35.33868408203125, "global_step": 56735, "epoch": 468} {"train_loss": -34.69044876098633, "global_step": 56736, "epoch": 468} {"train_loss": -34.818336486816406, "global_step": 56737, "epoch": 468} {"train_loss": -35.940616607666016, "global_step": 56738, "epoch": 468} {"train_loss": -33.81569290161133, "global_step": 56739, "epoch": 468} {"train_loss": -35.09127426147461, "global_step": 56740, "epoch": 468} {"train_loss": -35.4611701965332, "global_step": 56741, "epoch": 468} {"train_loss": -35.308815002441406, "global_step": 56742, "epoch": 468} {"train_loss": -35.7169303894043, "global_step": 56743, "epoch": 468} {"train_loss": -34.83866500854492, "global_step": 56744, "epoch": 468} {"train_loss": -34.82980728149414, "global_step": 56745, "epoch": 468} {"train_loss": -35.662113189697266, "global_step": 56746, "epoch": 468} {"train_loss": -35.058292388916016, "global_step": 56747, "epoch": 468} {"train_loss": -35.329064345556844, "global_step": 56748, "epoch": 468, "val_loss": 2474510.5} {"train_loss": -35.899417877197266, "global_step": 56749, "epoch": 469} {"train_loss": -35.1234016418457, "global_step": 56750, "epoch": 469} {"train_loss": -34.8539924621582, "global_step": 56751, "epoch": 469} {"train_loss": -35.92594528198242, "global_step": 56752, "epoch": 469} {"train_loss": -35.03644943237305, "global_step": 56753, "epoch": 469} {"train_loss": -35.03642654418945, "global_step": 56754, "epoch": 469} {"train_loss": -35.7129020690918, "global_step": 56755, "epoch": 469} {"train_loss": -35.391292572021484, "global_step": 56756, "epoch": 469} {"train_loss": -35.79680252075195, "global_step": 56757, "epoch": 469} {"train_loss": -35.37821578979492, "global_step": 56758, "epoch": 469} {"train_loss": -35.89385986328125, "global_step": 56759, "epoch": 469} {"train_loss": -36.380489349365234, "global_step": 56760, "epoch": 469} {"train_loss": -35.505062103271484, "global_step": 56761, "epoch": 469} {"train_loss": -35.30350875854492, "global_step": 56762, "epoch": 469} {"train_loss": -36.08315658569336, "global_step": 56763, "epoch": 469} {"train_loss": -36.544918060302734, "global_step": 56764, "epoch": 469} {"train_loss": -35.86098861694336, "global_step": 56765, "epoch": 469} {"train_loss": -35.839351654052734, "global_step": 56766, "epoch": 469} {"train_loss": -36.24252700805664, "global_step": 56767, "epoch": 469} {"train_loss": -36.4115104675293, "global_step": 56768, "epoch": 469} {"train_loss": -35.68886184692383, "global_step": 56769, "epoch": 469} {"train_loss": -36.183349609375, "global_step": 56770, "epoch": 469} {"train_loss": -36.04130172729492, "global_step": 56771, "epoch": 469} {"train_loss": -33.31728744506836, "global_step": 56772, "epoch": 469} {"train_loss": -35.79731750488281, "global_step": 56773, "epoch": 469} {"train_loss": -36.02487564086914, "global_step": 56774, "epoch": 469} {"train_loss": -36.349220275878906, "global_step": 56775, "epoch": 469} {"train_loss": -36.62030029296875, "global_step": 56776, "epoch": 469} {"train_loss": -36.090797424316406, "global_step": 56777, "epoch": 469} {"train_loss": -36.602725982666016, "global_step": 56778, "epoch": 469} {"train_loss": -36.48017120361328, "global_step": 56779, "epoch": 469} {"train_loss": -36.20978546142578, "global_step": 56780, "epoch": 469} {"train_loss": -36.09493637084961, "global_step": 56781, "epoch": 469} {"train_loss": -35.97676467895508, "global_step": 56782, "epoch": 469} {"train_loss": -36.01410675048828, "global_step": 56783, "epoch": 469} {"train_loss": -36.11106491088867, "global_step": 56784, "epoch": 469} {"train_loss": -35.959136962890625, "global_step": 56785, "epoch": 469} {"train_loss": -36.1095085144043, "global_step": 56786, "epoch": 469} {"train_loss": -36.25396728515625, "global_step": 56787, "epoch": 469} {"train_loss": -36.497840881347656, "global_step": 56788, "epoch": 469} {"train_loss": -36.48927307128906, "global_step": 56789, "epoch": 469} {"train_loss": -36.72040557861328, "global_step": 56790, "epoch": 469} {"train_loss": -36.23845672607422, "global_step": 56791, "epoch": 469} {"train_loss": -35.50593185424805, "global_step": 56792, "epoch": 469} {"train_loss": -34.29898452758789, "global_step": 56793, "epoch": 469} {"train_loss": -32.45867919921875, "global_step": 56794, "epoch": 469} {"train_loss": -30.838586807250977, "global_step": 56795, "epoch": 469} {"train_loss": -31.831378936767578, "global_step": 56796, "epoch": 469} {"train_loss": -32.94721984863281, "global_step": 56797, "epoch": 469} {"train_loss": -33.06169509887695, "global_step": 56798, "epoch": 469} {"train_loss": -32.722434997558594, "global_step": 56799, "epoch": 469} {"train_loss": -30.530797958374023, "global_step": 56800, "epoch": 469} {"train_loss": -29.293371200561523, "global_step": 56801, "epoch": 469} {"train_loss": -31.560287475585938, "global_step": 56802, "epoch": 469} {"train_loss": -33.73014831542969, "global_step": 56803, "epoch": 469} {"train_loss": -34.937355041503906, "global_step": 56804, "epoch": 469} {"train_loss": -33.09305191040039, "global_step": 56805, "epoch": 469} {"train_loss": -33.73218536376953, "global_step": 56806, "epoch": 469} {"train_loss": -35.07536697387695, "global_step": 56807, "epoch": 469} {"train_loss": -33.309146881103516, "global_step": 56808, "epoch": 469} {"train_loss": -34.24787521362305, "global_step": 56809, "epoch": 469} {"train_loss": -34.54752731323242, "global_step": 56810, "epoch": 469} {"train_loss": -34.28125762939453, "global_step": 56811, "epoch": 469} {"train_loss": -34.37336349487305, "global_step": 56812, "epoch": 469} {"train_loss": -34.43388366699219, "global_step": 56813, "epoch": 469} {"train_loss": -34.84993362426758, "global_step": 56814, "epoch": 469} {"train_loss": -35.19246292114258, "global_step": 56815, "epoch": 469} {"train_loss": -35.80792236328125, "global_step": 56816, "epoch": 469} {"train_loss": -34.925697326660156, "global_step": 56817, "epoch": 469} {"train_loss": -35.428192138671875, "global_step": 56818, "epoch": 469} {"train_loss": -34.925384521484375, "global_step": 56819, "epoch": 469} {"train_loss": -35.950592041015625, "global_step": 56820, "epoch": 469} {"train_loss": -35.11672592163086, "global_step": 56821, "epoch": 469} {"train_loss": -35.552242279052734, "global_step": 56822, "epoch": 469} {"train_loss": -34.38856887817383, "global_step": 56823, "epoch": 469} {"train_loss": -35.80499267578125, "global_step": 56824, "epoch": 469} {"train_loss": -35.76358413696289, "global_step": 56825, "epoch": 469} {"train_loss": -35.38779067993164, "global_step": 56826, "epoch": 469} {"train_loss": -35.166873931884766, "global_step": 56827, "epoch": 469} {"train_loss": -36.04777908325195, "global_step": 56828, "epoch": 469} {"train_loss": -35.628875732421875, "global_step": 56829, "epoch": 469} {"train_loss": -35.635887145996094, "global_step": 56830, "epoch": 469} {"train_loss": -36.15528106689453, "global_step": 56831, "epoch": 469} {"train_loss": -36.11253356933594, "global_step": 56832, "epoch": 469} {"train_loss": -36.12519073486328, "global_step": 56833, "epoch": 469} {"train_loss": -36.166603088378906, "global_step": 56834, "epoch": 469} {"train_loss": -36.37075424194336, "global_step": 56835, "epoch": 469} {"train_loss": -36.033634185791016, "global_step": 56836, "epoch": 469} {"train_loss": -36.09645462036133, "global_step": 56837, "epoch": 469} {"train_loss": -35.188331604003906, "global_step": 56838, "epoch": 469} {"train_loss": -36.243473052978516, "global_step": 56839, "epoch": 469} {"train_loss": -35.64531326293945, "global_step": 56840, "epoch": 469} {"train_loss": -35.865325927734375, "global_step": 56841, "epoch": 469} {"train_loss": -35.93400573730469, "global_step": 56842, "epoch": 469} {"train_loss": -36.2970085144043, "global_step": 56843, "epoch": 469} {"train_loss": -34.45199203491211, "global_step": 56844, "epoch": 469} {"train_loss": -35.840492248535156, "global_step": 56845, "epoch": 469} {"train_loss": -35.88039779663086, "global_step": 56846, "epoch": 469} {"train_loss": -36.221248626708984, "global_step": 56847, "epoch": 469} {"train_loss": -36.00300979614258, "global_step": 56848, "epoch": 469} {"train_loss": -35.22222900390625, "global_step": 56849, "epoch": 469} {"train_loss": -34.968502044677734, "global_step": 56850, "epoch": 469} {"train_loss": -32.58302688598633, "global_step": 56851, "epoch": 469} {"train_loss": -35.90090560913086, "global_step": 56852, "epoch": 469} {"train_loss": -35.79888153076172, "global_step": 56853, "epoch": 469} {"train_loss": -35.8028450012207, "global_step": 56854, "epoch": 469} {"train_loss": -35.512813568115234, "global_step": 56855, "epoch": 469} {"train_loss": -35.30995559692383, "global_step": 56856, "epoch": 469} {"train_loss": -35.91669845581055, "global_step": 56857, "epoch": 469} {"train_loss": -35.1776123046875, "global_step": 56858, "epoch": 469} {"train_loss": -35.31919479370117, "global_step": 56859, "epoch": 469} {"train_loss": -36.051021575927734, "global_step": 56860, "epoch": 469} {"train_loss": -36.07735824584961, "global_step": 56861, "epoch": 469} {"train_loss": -36.12776565551758, "global_step": 56862, "epoch": 469} {"train_loss": -35.69057846069336, "global_step": 56863, "epoch": 469} {"train_loss": -35.294002532958984, "global_step": 56864, "epoch": 469} {"train_loss": -35.175540924072266, "global_step": 56865, "epoch": 469} {"train_loss": -36.064125061035156, "global_step": 56866, "epoch": 469} {"train_loss": -36.50759506225586, "global_step": 56867, "epoch": 469} {"train_loss": -35.755958557128906, "global_step": 56868, "epoch": 469} {"train_loss": -35.284954086808135, "global_step": 56869, "epoch": 469, "val_loss": 2468143.0} {"train_loss": -35.97249984741211, "global_step": 56870, "epoch": 470} {"train_loss": -36.15479278564453, "global_step": 56871, "epoch": 470} {"train_loss": -36.17853546142578, "global_step": 56872, "epoch": 470} {"train_loss": -35.58724594116211, "global_step": 56873, "epoch": 470} {"train_loss": -36.13991928100586, "global_step": 56874, "epoch": 470} {"train_loss": -36.405574798583984, "global_step": 56875, "epoch": 470} {"train_loss": -35.269256591796875, "global_step": 56876, "epoch": 470} {"train_loss": -35.847740173339844, "global_step": 56877, "epoch": 470} {"train_loss": -36.05386734008789, "global_step": 56878, "epoch": 470} {"train_loss": -36.406349182128906, "global_step": 56879, "epoch": 470} {"train_loss": -34.562965393066406, "global_step": 56880, "epoch": 470} {"train_loss": -36.06217575073242, "global_step": 56881, "epoch": 470} {"train_loss": -35.435237884521484, "global_step": 56882, "epoch": 470} {"train_loss": -36.47271728515625, "global_step": 56883, "epoch": 470} {"train_loss": -35.39385986328125, "global_step": 56884, "epoch": 470} {"train_loss": -34.98198318481445, "global_step": 56885, "epoch": 470} {"train_loss": -36.43731689453125, "global_step": 56886, "epoch": 470} {"train_loss": -36.5943489074707, "global_step": 56887, "epoch": 470} {"train_loss": -36.83926010131836, "global_step": 56888, "epoch": 470} {"train_loss": -36.0744743347168, "global_step": 56889, "epoch": 470} {"train_loss": -34.75343704223633, "global_step": 56890, "epoch": 470} {"train_loss": -34.781951904296875, "global_step": 56891, "epoch": 470} {"train_loss": -35.37972640991211, "global_step": 56892, "epoch": 470} {"train_loss": -35.05567169189453, "global_step": 56893, "epoch": 470} {"train_loss": -34.64990234375, "global_step": 56894, "epoch": 470} {"train_loss": -33.39885711669922, "global_step": 56895, "epoch": 470} {"train_loss": -35.29271697998047, "global_step": 56896, "epoch": 470} {"train_loss": -35.42686462402344, "global_step": 56897, "epoch": 470} {"train_loss": -34.47734451293945, "global_step": 56898, "epoch": 470} {"train_loss": -34.78327178955078, "global_step": 56899, "epoch": 470} {"train_loss": -35.11642837524414, "global_step": 56900, "epoch": 470} {"train_loss": -34.761932373046875, "global_step": 56901, "epoch": 470} {"train_loss": -34.45805740356445, "global_step": 56902, "epoch": 470} {"train_loss": -34.669490814208984, "global_step": 56903, "epoch": 470} {"train_loss": -34.87144088745117, "global_step": 56904, "epoch": 470} {"train_loss": -34.19471740722656, "global_step": 56905, "epoch": 470} {"train_loss": -33.47642135620117, "global_step": 56906, "epoch": 470} {"train_loss": -34.39167022705078, "global_step": 56907, "epoch": 470} {"train_loss": -34.84040451049805, "global_step": 56908, "epoch": 470} {"train_loss": -30.565271377563477, "global_step": 56909, "epoch": 470} {"train_loss": -35.266639709472656, "global_step": 56910, "epoch": 470} {"train_loss": -34.68111038208008, "global_step": 56911, "epoch": 470} {"train_loss": -33.916969299316406, "global_step": 56912, "epoch": 470} {"train_loss": -33.50996780395508, "global_step": 56913, "epoch": 470} {"train_loss": -32.39702224731445, "global_step": 56914, "epoch": 470} {"train_loss": -33.14752197265625, "global_step": 56915, "epoch": 470} {"train_loss": -33.62296676635742, "global_step": 56916, "epoch": 470} {"train_loss": -32.47560501098633, "global_step": 56917, "epoch": 470} {"train_loss": -31.910785675048828, "global_step": 56918, "epoch": 470} {"train_loss": -32.98784255981445, "global_step": 56919, "epoch": 470} {"train_loss": -32.99393844604492, "global_step": 56920, "epoch": 470} {"train_loss": -33.917266845703125, "global_step": 56921, "epoch": 470} {"train_loss": -34.29822540283203, "global_step": 56922, "epoch": 470} {"train_loss": -32.96358871459961, "global_step": 56923, "epoch": 470} {"train_loss": -34.735469818115234, "global_step": 56924, "epoch": 470} {"train_loss": -31.55238151550293, "global_step": 56925, "epoch": 470} {"train_loss": -33.28530502319336, "global_step": 56926, "epoch": 470} {"train_loss": -34.220890045166016, "global_step": 56927, "epoch": 470} {"train_loss": -34.09101867675781, "global_step": 56928, "epoch": 470} {"train_loss": -34.826358795166016, "global_step": 56929, "epoch": 470} {"train_loss": -35.2164306640625, "global_step": 56930, "epoch": 470} {"train_loss": -35.045040130615234, "global_step": 56931, "epoch": 470} {"train_loss": -33.509925842285156, "global_step": 56932, "epoch": 470} {"train_loss": -34.363765716552734, "global_step": 56933, "epoch": 470} {"train_loss": -33.393531799316406, "global_step": 56934, "epoch": 470} {"train_loss": -34.13051223754883, "global_step": 56935, "epoch": 470} {"train_loss": -34.301265716552734, "global_step": 56936, "epoch": 470} {"train_loss": -34.45746994018555, "global_step": 56937, "epoch": 470} {"train_loss": -34.340606689453125, "global_step": 56938, "epoch": 470} {"train_loss": -34.83639144897461, "global_step": 56939, "epoch": 470} {"train_loss": -35.17784881591797, "global_step": 56940, "epoch": 470} {"train_loss": -34.78664016723633, "global_step": 56941, "epoch": 470} {"train_loss": -34.60310745239258, "global_step": 56942, "epoch": 470} {"train_loss": -34.10990905761719, "global_step": 56943, "epoch": 470} {"train_loss": -34.84828567504883, "global_step": 56944, "epoch": 470} {"train_loss": -34.52132034301758, "global_step": 56945, "epoch": 470} {"train_loss": -35.07780838012695, "global_step": 56946, "epoch": 470} {"train_loss": -34.06313705444336, "global_step": 56947, "epoch": 470} {"train_loss": -34.06769943237305, "global_step": 56948, "epoch": 470} {"train_loss": -34.60498809814453, "global_step": 56949, "epoch": 470} {"train_loss": -33.86842727661133, "global_step": 56950, "epoch": 470} {"train_loss": -34.26795196533203, "global_step": 56951, "epoch": 470} {"train_loss": -30.80740737915039, "global_step": 56952, "epoch": 470} {"train_loss": -30.92902946472168, "global_step": 56953, "epoch": 470} {"train_loss": -34.90636444091797, "global_step": 56954, "epoch": 470} {"train_loss": -33.96453857421875, "global_step": 56955, "epoch": 470} {"train_loss": -33.861976623535156, "global_step": 56956, "epoch": 470} {"train_loss": -34.71539306640625, "global_step": 56957, "epoch": 470} {"train_loss": -35.15523910522461, "global_step": 56958, "epoch": 470} {"train_loss": -33.965633392333984, "global_step": 56959, "epoch": 470} {"train_loss": -34.1187744140625, "global_step": 56960, "epoch": 470} {"train_loss": -35.52764892578125, "global_step": 56961, "epoch": 470} {"train_loss": -35.53961181640625, "global_step": 56962, "epoch": 470} {"train_loss": -34.97573471069336, "global_step": 56963, "epoch": 470} {"train_loss": -35.96000289916992, "global_step": 56964, "epoch": 470} {"train_loss": -35.70852279663086, "global_step": 56965, "epoch": 470} {"train_loss": -35.566097259521484, "global_step": 56966, "epoch": 470} {"train_loss": -35.50387191772461, "global_step": 56967, "epoch": 470} {"train_loss": -35.82117462158203, "global_step": 56968, "epoch": 470} {"train_loss": -36.17578125, "global_step": 56969, "epoch": 470} {"train_loss": -35.422119140625, "global_step": 56970, "epoch": 470} {"train_loss": -35.67963790893555, "global_step": 56971, "epoch": 470} {"train_loss": -35.70956802368164, "global_step": 56972, "epoch": 470} {"train_loss": -36.139278411865234, "global_step": 56973, "epoch": 470} {"train_loss": -35.97785186767578, "global_step": 56974, "epoch": 470} {"train_loss": -35.96804428100586, "global_step": 56975, "epoch": 470} {"train_loss": -36.16606140136719, "global_step": 56976, "epoch": 470} {"train_loss": -35.866355895996094, "global_step": 56977, "epoch": 470} {"train_loss": -35.890377044677734, "global_step": 56978, "epoch": 470} {"train_loss": -36.07468795776367, "global_step": 56979, "epoch": 470} {"train_loss": -35.96474838256836, "global_step": 56980, "epoch": 470} {"train_loss": -36.41062545776367, "global_step": 56981, "epoch": 470} {"train_loss": -36.608795166015625, "global_step": 56982, "epoch": 470} {"train_loss": -36.275081634521484, "global_step": 56983, "epoch": 470} {"train_loss": -36.28748321533203, "global_step": 56984, "epoch": 470} {"train_loss": -36.08770751953125, "global_step": 56985, "epoch": 470} {"train_loss": -35.884376525878906, "global_step": 56986, "epoch": 470} {"train_loss": -36.58748245239258, "global_step": 56987, "epoch": 470} {"train_loss": -35.925689697265625, "global_step": 56988, "epoch": 470} {"train_loss": -36.05260467529297, "global_step": 56989, "epoch": 470} {"train_loss": -34.85316998505395, "global_step": 56990, "epoch": 470, "val_loss": 2526482.75} {"train_loss": -36.33405303955078, "global_step": 56991, "epoch": 471} {"train_loss": -36.357872009277344, "global_step": 56992, "epoch": 471} {"train_loss": -36.47578430175781, "global_step": 56993, "epoch": 471} {"train_loss": -36.65339279174805, "global_step": 56994, "epoch": 471} {"train_loss": -36.36659622192383, "global_step": 56995, "epoch": 471} {"train_loss": -36.150814056396484, "global_step": 56996, "epoch": 471} {"train_loss": -36.11577606201172, "global_step": 56997, "epoch": 471} {"train_loss": -36.15473175048828, "global_step": 56998, "epoch": 471} {"train_loss": -35.558414459228516, "global_step": 56999, "epoch": 471} {"train_loss": -34.355796813964844, "global_step": 57000, "epoch": 471} {"train_loss": -32.883995056152344, "global_step": 57001, "epoch": 471} {"train_loss": -28.859975814819336, "global_step": 57002, "epoch": 471} {"train_loss": -24.18672752380371, "global_step": 57003, "epoch": 471} {"train_loss": -25.812936782836914, "global_step": 57004, "epoch": 471} {"train_loss": -32.3322639465332, "global_step": 57005, "epoch": 471} {"train_loss": -35.041629791259766, "global_step": 57006, "epoch": 471} {"train_loss": -31.8915958404541, "global_step": 57007, "epoch": 471} {"train_loss": -34.608375549316406, "global_step": 57008, "epoch": 471} {"train_loss": -35.21023178100586, "global_step": 57009, "epoch": 471} {"train_loss": -34.757904052734375, "global_step": 57010, "epoch": 471} {"train_loss": -34.68668746948242, "global_step": 57011, "epoch": 471} {"train_loss": -33.11123275756836, "global_step": 57012, "epoch": 471} {"train_loss": -35.85944747924805, "global_step": 57013, "epoch": 471} {"train_loss": -35.443275451660156, "global_step": 57014, "epoch": 471} {"train_loss": -36.22869110107422, "global_step": 57015, "epoch": 471} {"train_loss": -35.87675094604492, "global_step": 57016, "epoch": 471} {"train_loss": -36.06455612182617, "global_step": 57017, "epoch": 471} {"train_loss": -34.340606689453125, "global_step": 57018, "epoch": 471} {"train_loss": -35.965476989746094, "global_step": 57019, "epoch": 471} {"train_loss": -36.3902702331543, "global_step": 57020, "epoch": 471} {"train_loss": -32.867977142333984, "global_step": 57021, "epoch": 471} {"train_loss": -36.34254455566406, "global_step": 57022, "epoch": 471} {"train_loss": -35.78778076171875, "global_step": 57023, "epoch": 471} {"train_loss": -30.821996688842773, "global_step": 57024, "epoch": 471} {"train_loss": -35.20461654663086, "global_step": 57025, "epoch": 471} {"train_loss": -35.52157211303711, "global_step": 57026, "epoch": 471} {"train_loss": -34.557064056396484, "global_step": 57027, "epoch": 471} {"train_loss": -32.21989059448242, "global_step": 57028, "epoch": 471} {"train_loss": -32.45899200439453, "global_step": 57029, "epoch": 471} {"train_loss": -35.850093841552734, "global_step": 57030, "epoch": 471} {"train_loss": -34.76393508911133, "global_step": 57031, "epoch": 471} {"train_loss": -35.42617416381836, "global_step": 57032, "epoch": 471} {"train_loss": -34.419456481933594, "global_step": 57033, "epoch": 471} {"train_loss": -34.35260772705078, "global_step": 57034, "epoch": 471} {"train_loss": -33.06997299194336, "global_step": 57035, "epoch": 471} {"train_loss": -28.685232162475586, "global_step": 57036, "epoch": 471} {"train_loss": -34.40681076049805, "global_step": 57037, "epoch": 471} {"train_loss": -31.341867446899414, "global_step": 57038, "epoch": 471} {"train_loss": -34.77494430541992, "global_step": 57039, "epoch": 471} {"train_loss": -32.8773307800293, "global_step": 57040, "epoch": 471} {"train_loss": -34.69364547729492, "global_step": 57041, "epoch": 471} {"train_loss": -34.39460754394531, "global_step": 57042, "epoch": 471} {"train_loss": -34.28889846801758, "global_step": 57043, "epoch": 471} {"train_loss": -34.31859588623047, "global_step": 57044, "epoch": 471} {"train_loss": -31.590702056884766, "global_step": 57045, "epoch": 471} {"train_loss": -33.35785675048828, "global_step": 57046, "epoch": 471} {"train_loss": -34.21915817260742, "global_step": 57047, "epoch": 471} {"train_loss": -33.936126708984375, "global_step": 57048, "epoch": 471} {"train_loss": -34.51164627075195, "global_step": 57049, "epoch": 471} {"train_loss": -34.500457763671875, "global_step": 57050, "epoch": 471} {"train_loss": -33.860618591308594, "global_step": 57051, "epoch": 471} {"train_loss": -34.43968200683594, "global_step": 57052, "epoch": 471} {"train_loss": -34.124237060546875, "global_step": 57053, "epoch": 471} {"train_loss": -35.140296936035156, "global_step": 57054, "epoch": 471} {"train_loss": -34.06509780883789, "global_step": 57055, "epoch": 471} {"train_loss": -34.974788665771484, "global_step": 57056, "epoch": 471} {"train_loss": -33.869991302490234, "global_step": 57057, "epoch": 471} {"train_loss": -34.87886047363281, "global_step": 57058, "epoch": 471} {"train_loss": -34.284202575683594, "global_step": 57059, "epoch": 471} {"train_loss": -35.235511779785156, "global_step": 57060, "epoch": 471} {"train_loss": -34.3691291809082, "global_step": 57061, "epoch": 471} {"train_loss": -34.241275787353516, "global_step": 57062, "epoch": 471} {"train_loss": -35.5984001159668, "global_step": 57063, "epoch": 471} {"train_loss": -34.2506103515625, "global_step": 57064, "epoch": 471} {"train_loss": -34.72266387939453, "global_step": 57065, "epoch": 471} {"train_loss": -34.79893112182617, "global_step": 57066, "epoch": 471} {"train_loss": -34.882076263427734, "global_step": 57067, "epoch": 471} {"train_loss": -35.43098068237305, "global_step": 57068, "epoch": 471} {"train_loss": -35.73649597167969, "global_step": 57069, "epoch": 471} {"train_loss": -35.56795883178711, "global_step": 57070, "epoch": 471} {"train_loss": -35.44806671142578, "global_step": 57071, "epoch": 471} {"train_loss": -35.52227783203125, "global_step": 57072, "epoch": 471} {"train_loss": -35.60349655151367, "global_step": 57073, "epoch": 471} {"train_loss": -35.693851470947266, "global_step": 57074, "epoch": 471} {"train_loss": -35.56760787963867, "global_step": 57075, "epoch": 471} {"train_loss": -35.88491439819336, "global_step": 57076, "epoch": 471} {"train_loss": -36.287628173828125, "global_step": 57077, "epoch": 471} {"train_loss": -35.66816329956055, "global_step": 57078, "epoch": 471} {"train_loss": -34.79606628417969, "global_step": 57079, "epoch": 471} {"train_loss": -33.80575180053711, "global_step": 57080, "epoch": 471} {"train_loss": -34.56248474121094, "global_step": 57081, "epoch": 471} {"train_loss": -35.10624313354492, "global_step": 57082, "epoch": 471} {"train_loss": -35.68891143798828, "global_step": 57083, "epoch": 471} {"train_loss": -36.1091423034668, "global_step": 57084, "epoch": 471} {"train_loss": -35.94682693481445, "global_step": 57085, "epoch": 471} {"train_loss": -34.80358123779297, "global_step": 57086, "epoch": 471} {"train_loss": -35.369293212890625, "global_step": 57087, "epoch": 471} {"train_loss": -33.51449203491211, "global_step": 57088, "epoch": 471} {"train_loss": -33.790138244628906, "global_step": 57089, "epoch": 471} {"train_loss": -34.00349044799805, "global_step": 57090, "epoch": 471} {"train_loss": -33.30744171142578, "global_step": 57091, "epoch": 471} {"train_loss": -34.10551834106445, "global_step": 57092, "epoch": 471} {"train_loss": -35.908111572265625, "global_step": 57093, "epoch": 471} {"train_loss": -35.428367614746094, "global_step": 57094, "epoch": 471} {"train_loss": -35.05093002319336, "global_step": 57095, "epoch": 471} {"train_loss": -34.715354919433594, "global_step": 57096, "epoch": 471} {"train_loss": -35.48734664916992, "global_step": 57097, "epoch": 471} {"train_loss": -34.969722747802734, "global_step": 57098, "epoch": 471} {"train_loss": -35.201168060302734, "global_step": 57099, "epoch": 471} {"train_loss": -34.828094482421875, "global_step": 57100, "epoch": 471} {"train_loss": -35.24219512939453, "global_step": 57101, "epoch": 471} {"train_loss": -35.198036193847656, "global_step": 57102, "epoch": 471} {"train_loss": -34.154212951660156, "global_step": 57103, "epoch": 471} {"train_loss": -35.9966926574707, "global_step": 57104, "epoch": 471} {"train_loss": -34.4809684753418, "global_step": 57105, "epoch": 471} {"train_loss": -33.487823486328125, "global_step": 57106, "epoch": 471} {"train_loss": -35.501060485839844, "global_step": 57107, "epoch": 471} {"train_loss": -33.16170883178711, "global_step": 57108, "epoch": 471} {"train_loss": -35.636070251464844, "global_step": 57109, "epoch": 471} {"train_loss": -34.61432647705078, "global_step": 57110, "epoch": 471} {"train_loss": -34.507580575864175, "global_step": 57111, "epoch": 471, "val_loss": 2518448.25} {"train_loss": -31.9985408782959, "global_step": 57112, "epoch": 472} {"train_loss": -34.40778732299805, "global_step": 57113, "epoch": 472} {"train_loss": -34.59678649902344, "global_step": 57114, "epoch": 472} {"train_loss": -34.21218490600586, "global_step": 57115, "epoch": 472} {"train_loss": -33.602596282958984, "global_step": 57116, "epoch": 472} {"train_loss": -35.540313720703125, "global_step": 57117, "epoch": 472} {"train_loss": -34.583499908447266, "global_step": 57118, "epoch": 472} {"train_loss": -35.06199264526367, "global_step": 57119, "epoch": 472} {"train_loss": -35.94497299194336, "global_step": 57120, "epoch": 472} {"train_loss": -33.867706298828125, "global_step": 57121, "epoch": 472} {"train_loss": -35.06134796142578, "global_step": 57122, "epoch": 472} {"train_loss": -36.007293701171875, "global_step": 57123, "epoch": 472} {"train_loss": -35.201229095458984, "global_step": 57124, "epoch": 472} {"train_loss": -35.428436279296875, "global_step": 57125, "epoch": 472} {"train_loss": -35.89512252807617, "global_step": 57126, "epoch": 472} {"train_loss": -35.28599166870117, "global_step": 57127, "epoch": 472} {"train_loss": -35.89323043823242, "global_step": 57128, "epoch": 472} {"train_loss": -35.47587203979492, "global_step": 57129, "epoch": 472} {"train_loss": -35.97370147705078, "global_step": 57130, "epoch": 472} {"train_loss": -35.737693786621094, "global_step": 57131, "epoch": 472} {"train_loss": -35.68488693237305, "global_step": 57132, "epoch": 472} {"train_loss": -36.720176696777344, "global_step": 57133, "epoch": 472} {"train_loss": -34.780147552490234, "global_step": 57134, "epoch": 472} {"train_loss": -36.02864456176758, "global_step": 57135, "epoch": 472} {"train_loss": -36.5389404296875, "global_step": 57136, "epoch": 472} {"train_loss": -36.29281234741211, "global_step": 57137, "epoch": 472} {"train_loss": -36.400142669677734, "global_step": 57138, "epoch": 472} {"train_loss": -35.06218338012695, "global_step": 57139, "epoch": 472} {"train_loss": -33.94988250732422, "global_step": 57140, "epoch": 472} {"train_loss": -31.88291358947754, "global_step": 57141, "epoch": 472} {"train_loss": -30.597578048706055, "global_step": 57142, "epoch": 472} {"train_loss": -34.27235794067383, "global_step": 57143, "epoch": 472} {"train_loss": -36.438087463378906, "global_step": 57144, "epoch": 472} {"train_loss": -34.992584228515625, "global_step": 57145, "epoch": 472} {"train_loss": -34.25484848022461, "global_step": 57146, "epoch": 472} {"train_loss": -35.86478805541992, "global_step": 57147, "epoch": 472} {"train_loss": -36.504215240478516, "global_step": 57148, "epoch": 472} {"train_loss": -35.419612884521484, "global_step": 57149, "epoch": 472} {"train_loss": -36.12388229370117, "global_step": 57150, "epoch": 472} {"train_loss": -36.58474349975586, "global_step": 57151, "epoch": 472} {"train_loss": -35.619537353515625, "global_step": 57152, "epoch": 472} {"train_loss": -36.4868049621582, "global_step": 57153, "epoch": 472} {"train_loss": -35.77362823486328, "global_step": 57154, "epoch": 472} {"train_loss": -36.54597091674805, "global_step": 57155, "epoch": 472} {"train_loss": -35.42713165283203, "global_step": 57156, "epoch": 472} {"train_loss": -36.02582550048828, "global_step": 57157, "epoch": 472} {"train_loss": -36.21403121948242, "global_step": 57158, "epoch": 472} {"train_loss": -36.17411422729492, "global_step": 57159, "epoch": 472} {"train_loss": -36.192684173583984, "global_step": 57160, "epoch": 472} {"train_loss": -36.14760971069336, "global_step": 57161, "epoch": 472} {"train_loss": -36.423744201660156, "global_step": 57162, "epoch": 472} {"train_loss": -36.15327072143555, "global_step": 57163, "epoch": 472} {"train_loss": -36.7121467590332, "global_step": 57164, "epoch": 472} {"train_loss": -36.478363037109375, "global_step": 57165, "epoch": 472} {"train_loss": -35.97904586791992, "global_step": 57166, "epoch": 472} {"train_loss": -36.396827697753906, "global_step": 57167, "epoch": 472} {"train_loss": -36.0716667175293, "global_step": 57168, "epoch": 472} {"train_loss": -36.2186393737793, "global_step": 57169, "epoch": 472} {"train_loss": -36.4273567199707, "global_step": 57170, "epoch": 472} {"train_loss": -36.80750274658203, "global_step": 57171, "epoch": 472} {"train_loss": -35.79388427734375, "global_step": 57172, "epoch": 472} {"train_loss": -36.40055465698242, "global_step": 57173, "epoch": 472} {"train_loss": -35.8842658996582, "global_step": 57174, "epoch": 472} {"train_loss": -36.525230407714844, "global_step": 57175, "epoch": 472} {"train_loss": -36.68333435058594, "global_step": 57176, "epoch": 472} {"train_loss": -36.349422454833984, "global_step": 57177, "epoch": 472} {"train_loss": -35.81572341918945, "global_step": 57178, "epoch": 472} {"train_loss": -36.1318473815918, "global_step": 57179, "epoch": 472} {"train_loss": -36.763240814208984, "global_step": 57180, "epoch": 472} {"train_loss": -35.75120162963867, "global_step": 57181, "epoch": 472} {"train_loss": -36.523006439208984, "global_step": 57182, "epoch": 472} {"train_loss": -36.160579681396484, "global_step": 57183, "epoch": 472} {"train_loss": -36.14272689819336, "global_step": 57184, "epoch": 472} {"train_loss": -35.16015625, "global_step": 57185, "epoch": 472} {"train_loss": -36.486846923828125, "global_step": 57186, "epoch": 472} {"train_loss": -36.10459518432617, "global_step": 57187, "epoch": 472} {"train_loss": -35.805084228515625, "global_step": 57188, "epoch": 472} {"train_loss": -35.81852340698242, "global_step": 57189, "epoch": 472} {"train_loss": -36.00232696533203, "global_step": 57190, "epoch": 472} {"train_loss": -35.55207443237305, "global_step": 57191, "epoch": 472} {"train_loss": -35.364192962646484, "global_step": 57192, "epoch": 472} {"train_loss": -36.14384841918945, "global_step": 57193, "epoch": 472} {"train_loss": -36.54632568359375, "global_step": 57194, "epoch": 472} {"train_loss": -36.04072189331055, "global_step": 57195, "epoch": 472} {"train_loss": -35.974159240722656, "global_step": 57196, "epoch": 472} {"train_loss": -35.9288444519043, "global_step": 57197, "epoch": 472} {"train_loss": -36.20431137084961, "global_step": 57198, "epoch": 472} {"train_loss": -34.917335510253906, "global_step": 57199, "epoch": 472} {"train_loss": -34.55554962158203, "global_step": 57200, "epoch": 472} {"train_loss": -36.8922233581543, "global_step": 57201, "epoch": 472} {"train_loss": -35.60394287109375, "global_step": 57202, "epoch": 472} {"train_loss": -35.8818359375, "global_step": 57203, "epoch": 472} {"train_loss": -35.98175811767578, "global_step": 57204, "epoch": 472} {"train_loss": -35.7496452331543, "global_step": 57205, "epoch": 472} {"train_loss": -35.39632034301758, "global_step": 57206, "epoch": 472} {"train_loss": -35.032649993896484, "global_step": 57207, "epoch": 472} {"train_loss": -35.20119857788086, "global_step": 57208, "epoch": 472} {"train_loss": -35.334754943847656, "global_step": 57209, "epoch": 472} {"train_loss": -34.30129623413086, "global_step": 57210, "epoch": 472} {"train_loss": -32.7736930847168, "global_step": 57211, "epoch": 472} {"train_loss": -35.478755950927734, "global_step": 57212, "epoch": 472} {"train_loss": -36.306243896484375, "global_step": 57213, "epoch": 472} {"train_loss": -35.314815521240234, "global_step": 57214, "epoch": 472} {"train_loss": -33.45161437988281, "global_step": 57215, "epoch": 472} {"train_loss": -35.274024963378906, "global_step": 57216, "epoch": 472} {"train_loss": -34.6852912902832, "global_step": 57217, "epoch": 472} {"train_loss": -34.1396598815918, "global_step": 57218, "epoch": 472} {"train_loss": -36.01708221435547, "global_step": 57219, "epoch": 472} {"train_loss": -35.5509033203125, "global_step": 57220, "epoch": 472} {"train_loss": -35.1805534362793, "global_step": 57221, "epoch": 472} {"train_loss": -35.98310089111328, "global_step": 57222, "epoch": 472} {"train_loss": -35.175655364990234, "global_step": 57223, "epoch": 472} {"train_loss": -36.10523223876953, "global_step": 57224, "epoch": 472} {"train_loss": -35.91530990600586, "global_step": 57225, "epoch": 472} {"train_loss": -35.14667510986328, "global_step": 57226, "epoch": 472} {"train_loss": -36.6362419128418, "global_step": 57227, "epoch": 472} {"train_loss": -35.8157958984375, "global_step": 57228, "epoch": 472} {"train_loss": -36.18024826049805, "global_step": 57229, "epoch": 472} {"train_loss": -35.989681243896484, "global_step": 57230, "epoch": 472} {"train_loss": -35.89754104614258, "global_step": 57231, "epoch": 472} {"train_loss": -35.58101144900992, "global_step": 57232, "epoch": 472, "val_loss": 2555485.25} {"train_loss": -36.20708465576172, "global_step": 57233, "epoch": 473} {"train_loss": -36.0648307800293, "global_step": 57234, "epoch": 473} {"train_loss": -35.6392936706543, "global_step": 57235, "epoch": 473} {"train_loss": -35.27755355834961, "global_step": 57236, "epoch": 473} {"train_loss": -36.10868453979492, "global_step": 57237, "epoch": 473} {"train_loss": -34.53453826904297, "global_step": 57238, "epoch": 473} {"train_loss": -35.20493698120117, "global_step": 57239, "epoch": 473} {"train_loss": -35.755435943603516, "global_step": 57240, "epoch": 473} {"train_loss": -36.21745681762695, "global_step": 57241, "epoch": 473} {"train_loss": -35.51518249511719, "global_step": 57242, "epoch": 473} {"train_loss": -35.745548248291016, "global_step": 57243, "epoch": 473} {"train_loss": -36.000526428222656, "global_step": 57244, "epoch": 473} {"train_loss": -36.54941940307617, "global_step": 57245, "epoch": 473} {"train_loss": -35.247684478759766, "global_step": 57246, "epoch": 473} {"train_loss": -36.16119384765625, "global_step": 57247, "epoch": 473} {"train_loss": -36.09170150756836, "global_step": 57248, "epoch": 473} {"train_loss": -36.024810791015625, "global_step": 57249, "epoch": 473} {"train_loss": -35.21345520019531, "global_step": 57250, "epoch": 473} {"train_loss": -35.00756072998047, "global_step": 57251, "epoch": 473} {"train_loss": -36.01272964477539, "global_step": 57252, "epoch": 473} {"train_loss": -34.8971061706543, "global_step": 57253, "epoch": 473} {"train_loss": -33.9154167175293, "global_step": 57254, "epoch": 473} {"train_loss": -34.25728225708008, "global_step": 57255, "epoch": 473} {"train_loss": -35.026527404785156, "global_step": 57256, "epoch": 473} {"train_loss": -35.991031646728516, "global_step": 57257, "epoch": 473} {"train_loss": -34.85696029663086, "global_step": 57258, "epoch": 473} {"train_loss": -35.564064025878906, "global_step": 57259, "epoch": 473} {"train_loss": -36.0196418762207, "global_step": 57260, "epoch": 473} {"train_loss": -34.94941711425781, "global_step": 57261, "epoch": 473} {"train_loss": -35.35799789428711, "global_step": 57262, "epoch": 473} {"train_loss": -35.828914642333984, "global_step": 57263, "epoch": 473} {"train_loss": -34.35483169555664, "global_step": 57264, "epoch": 473} {"train_loss": -35.3622932434082, "global_step": 57265, "epoch": 473} {"train_loss": -35.44041442871094, "global_step": 57266, "epoch": 473} {"train_loss": -34.2733268737793, "global_step": 57267, "epoch": 473} {"train_loss": -32.81535339355469, "global_step": 57268, "epoch": 473} {"train_loss": -32.98530960083008, "global_step": 57269, "epoch": 473} {"train_loss": -30.883594512939453, "global_step": 57270, "epoch": 473} {"train_loss": -31.94768714904785, "global_step": 57271, "epoch": 473} {"train_loss": -34.29774856567383, "global_step": 57272, "epoch": 473} {"train_loss": -36.19449996948242, "global_step": 57273, "epoch": 473} {"train_loss": -33.955360412597656, "global_step": 57274, "epoch": 473} {"train_loss": -33.37327194213867, "global_step": 57275, "epoch": 473} {"train_loss": -35.6418342590332, "global_step": 57276, "epoch": 473} {"train_loss": -35.3268928527832, "global_step": 57277, "epoch": 473} {"train_loss": -32.17975997924805, "global_step": 57278, "epoch": 473} {"train_loss": -35.75778579711914, "global_step": 57279, "epoch": 473} {"train_loss": -35.487117767333984, "global_step": 57280, "epoch": 473} {"train_loss": -35.76308822631836, "global_step": 57281, "epoch": 473} {"train_loss": -35.270748138427734, "global_step": 57282, "epoch": 473} {"train_loss": -35.82221221923828, "global_step": 57283, "epoch": 473} {"train_loss": -35.80824661254883, "global_step": 57284, "epoch": 473} {"train_loss": -34.82001495361328, "global_step": 57285, "epoch": 473} {"train_loss": -36.061187744140625, "global_step": 57286, "epoch": 473} {"train_loss": -35.264522552490234, "global_step": 57287, "epoch": 473} {"train_loss": -34.95726776123047, "global_step": 57288, "epoch": 473} {"train_loss": -36.11997604370117, "global_step": 57289, "epoch": 473} {"train_loss": -35.57926559448242, "global_step": 57290, "epoch": 473} {"train_loss": -34.087623596191406, "global_step": 57291, "epoch": 473} {"train_loss": -35.74955368041992, "global_step": 57292, "epoch": 473} {"train_loss": -35.92574691772461, "global_step": 57293, "epoch": 473} {"train_loss": -35.91664505004883, "global_step": 57294, "epoch": 473} {"train_loss": -34.749725341796875, "global_step": 57295, "epoch": 473} {"train_loss": -35.52242660522461, "global_step": 57296, "epoch": 473} {"train_loss": -35.44758605957031, "global_step": 57297, "epoch": 473} {"train_loss": -35.64695358276367, "global_step": 57298, "epoch": 473} {"train_loss": -36.184326171875, "global_step": 57299, "epoch": 473} {"train_loss": -35.22393798828125, "global_step": 57300, "epoch": 473} {"train_loss": -34.41450119018555, "global_step": 57301, "epoch": 473} {"train_loss": -35.957149505615234, "global_step": 57302, "epoch": 473} {"train_loss": -35.65070724487305, "global_step": 57303, "epoch": 473} {"train_loss": -36.039947509765625, "global_step": 57304, "epoch": 473} {"train_loss": -35.2856330871582, "global_step": 57305, "epoch": 473} {"train_loss": -35.74784469604492, "global_step": 57306, "epoch": 473} {"train_loss": -35.53182601928711, "global_step": 57307, "epoch": 473} {"train_loss": -35.271156311035156, "global_step": 57308, "epoch": 473} {"train_loss": -34.60966110229492, "global_step": 57309, "epoch": 473} {"train_loss": -35.80228805541992, "global_step": 57310, "epoch": 473} {"train_loss": -35.26487350463867, "global_step": 57311, "epoch": 473} {"train_loss": -34.83604049682617, "global_step": 57312, "epoch": 473} {"train_loss": -35.979339599609375, "global_step": 57313, "epoch": 473} {"train_loss": -36.0983772277832, "global_step": 57314, "epoch": 473} {"train_loss": -35.847900390625, "global_step": 57315, "epoch": 473} {"train_loss": -35.764766693115234, "global_step": 57316, "epoch": 473} {"train_loss": -36.283546447753906, "global_step": 57317, "epoch": 473} {"train_loss": -35.464046478271484, "global_step": 57318, "epoch": 473} {"train_loss": -36.420223236083984, "global_step": 57319, "epoch": 473} {"train_loss": -36.13581466674805, "global_step": 57320, "epoch": 473} {"train_loss": -35.979248046875, "global_step": 57321, "epoch": 473} {"train_loss": -36.005271911621094, "global_step": 57322, "epoch": 473} {"train_loss": -36.26213073730469, "global_step": 57323, "epoch": 473} {"train_loss": -36.35383987426758, "global_step": 57324, "epoch": 473} {"train_loss": -36.510414123535156, "global_step": 57325, "epoch": 473} {"train_loss": -36.45085906982422, "global_step": 57326, "epoch": 473} {"train_loss": -36.12881088256836, "global_step": 57327, "epoch": 473} {"train_loss": -36.123104095458984, "global_step": 57328, "epoch": 473} {"train_loss": -35.95420455932617, "global_step": 57329, "epoch": 473} {"train_loss": -36.1538200378418, "global_step": 57330, "epoch": 473} {"train_loss": -35.78398513793945, "global_step": 57331, "epoch": 473} {"train_loss": -35.43684768676758, "global_step": 57332, "epoch": 473} {"train_loss": -35.0403938293457, "global_step": 57333, "epoch": 473} {"train_loss": -35.76904296875, "global_step": 57334, "epoch": 473} {"train_loss": -35.6911506652832, "global_step": 57335, "epoch": 473} {"train_loss": -36.5012092590332, "global_step": 57336, "epoch": 473} {"train_loss": -35.600276947021484, "global_step": 57337, "epoch": 473} {"train_loss": -36.266597747802734, "global_step": 57338, "epoch": 473} {"train_loss": -34.209285736083984, "global_step": 57339, "epoch": 473} {"train_loss": -36.26237106323242, "global_step": 57340, "epoch": 473} {"train_loss": -36.29749298095703, "global_step": 57341, "epoch": 473} {"train_loss": -36.25857162475586, "global_step": 57342, "epoch": 473} {"train_loss": -35.8484001159668, "global_step": 57343, "epoch": 473} {"train_loss": -36.228084564208984, "global_step": 57344, "epoch": 473} {"train_loss": -36.68342971801758, "global_step": 57345, "epoch": 473} {"train_loss": -36.3028450012207, "global_step": 57346, "epoch": 473} {"train_loss": -36.71308898925781, "global_step": 57347, "epoch": 473} {"train_loss": -36.11552047729492, "global_step": 57348, "epoch": 473} {"train_loss": -34.4886360168457, "global_step": 57349, "epoch": 473} {"train_loss": -36.0472412109375, "global_step": 57350, "epoch": 473} {"train_loss": -36.37095260620117, "global_step": 57351, "epoch": 473} {"train_loss": -35.346981048583984, "global_step": 57352, "epoch": 473} {"train_loss": -35.46472235750561, "global_step": 57353, "epoch": 473, "val_loss": 2548909.25} {"train_loss": -34.27492904663086, "global_step": 57354, "epoch": 474} {"train_loss": -34.90302658081055, "global_step": 57355, "epoch": 474} {"train_loss": -35.50587844848633, "global_step": 57356, "epoch": 474} {"train_loss": -35.30385971069336, "global_step": 57357, "epoch": 474} {"train_loss": -35.87055206298828, "global_step": 57358, "epoch": 474} {"train_loss": -35.372982025146484, "global_step": 57359, "epoch": 474} {"train_loss": -35.07809066772461, "global_step": 57360, "epoch": 474} {"train_loss": -35.838584899902344, "global_step": 57361, "epoch": 474} {"train_loss": -36.403358459472656, "global_step": 57362, "epoch": 474} {"train_loss": -35.393394470214844, "global_step": 57363, "epoch": 474} {"train_loss": -35.308929443359375, "global_step": 57364, "epoch": 474} {"train_loss": -35.91015625, "global_step": 57365, "epoch": 474} {"train_loss": -35.354148864746094, "global_step": 57366, "epoch": 474} {"train_loss": -33.41507339477539, "global_step": 57367, "epoch": 474} {"train_loss": -34.06834030151367, "global_step": 57368, "epoch": 474} {"train_loss": -35.205162048339844, "global_step": 57369, "epoch": 474} {"train_loss": -34.18048095703125, "global_step": 57370, "epoch": 474} {"train_loss": -34.853389739990234, "global_step": 57371, "epoch": 474} {"train_loss": -34.2410888671875, "global_step": 57372, "epoch": 474} {"train_loss": -33.94904327392578, "global_step": 57373, "epoch": 474} {"train_loss": -34.366905212402344, "global_step": 57374, "epoch": 474} {"train_loss": -33.77185821533203, "global_step": 57375, "epoch": 474} {"train_loss": -35.10538864135742, "global_step": 57376, "epoch": 474} {"train_loss": -34.82437515258789, "global_step": 57377, "epoch": 474} {"train_loss": -34.8958740234375, "global_step": 57378, "epoch": 474} {"train_loss": -35.69511795043945, "global_step": 57379, "epoch": 474} {"train_loss": -35.34942626953125, "global_step": 57380, "epoch": 474} {"train_loss": -35.79401397705078, "global_step": 57381, "epoch": 474} {"train_loss": -35.535247802734375, "global_step": 57382, "epoch": 474} {"train_loss": -34.68549728393555, "global_step": 57383, "epoch": 474} {"train_loss": -35.98891067504883, "global_step": 57384, "epoch": 474} {"train_loss": -35.26816940307617, "global_step": 57385, "epoch": 474} {"train_loss": -34.6280517578125, "global_step": 57386, "epoch": 474} {"train_loss": -35.39065933227539, "global_step": 57387, "epoch": 474} {"train_loss": -35.27690887451172, "global_step": 57388, "epoch": 474} {"train_loss": -35.852027893066406, "global_step": 57389, "epoch": 474} {"train_loss": -35.100303649902344, "global_step": 57390, "epoch": 474} {"train_loss": -35.62776184082031, "global_step": 57391, "epoch": 474} {"train_loss": -35.21184158325195, "global_step": 57392, "epoch": 474} {"train_loss": -35.85805130004883, "global_step": 57393, "epoch": 474} {"train_loss": -35.983848571777344, "global_step": 57394, "epoch": 474} {"train_loss": -35.923309326171875, "global_step": 57395, "epoch": 474} {"train_loss": -35.92988204956055, "global_step": 57396, "epoch": 474} {"train_loss": -35.386558532714844, "global_step": 57397, "epoch": 474} {"train_loss": -35.85245132446289, "global_step": 57398, "epoch": 474} {"train_loss": -35.164520263671875, "global_step": 57399, "epoch": 474} {"train_loss": -35.90391159057617, "global_step": 57400, "epoch": 474} {"train_loss": -36.30202865600586, "global_step": 57401, "epoch": 474} {"train_loss": -35.58192825317383, "global_step": 57402, "epoch": 474} {"train_loss": -36.17806625366211, "global_step": 57403, "epoch": 474} {"train_loss": -36.53469467163086, "global_step": 57404, "epoch": 474} {"train_loss": -36.17866897583008, "global_step": 57405, "epoch": 474} {"train_loss": -35.922542572021484, "global_step": 57406, "epoch": 474} {"train_loss": -35.31707000732422, "global_step": 57407, "epoch": 474} {"train_loss": -35.11104965209961, "global_step": 57408, "epoch": 474} {"train_loss": -32.161720275878906, "global_step": 57409, "epoch": 474} {"train_loss": -28.719833374023438, "global_step": 57410, "epoch": 474} {"train_loss": -26.39069175720215, "global_step": 57411, "epoch": 474} {"train_loss": -27.197011947631836, "global_step": 57412, "epoch": 474} {"train_loss": -34.36480712890625, "global_step": 57413, "epoch": 474} {"train_loss": -34.52902603149414, "global_step": 57414, "epoch": 474} {"train_loss": -35.065364837646484, "global_step": 57415, "epoch": 474} {"train_loss": -34.40348434448242, "global_step": 57416, "epoch": 474} {"train_loss": -36.048980712890625, "global_step": 57417, "epoch": 474} {"train_loss": -34.945777893066406, "global_step": 57418, "epoch": 474} {"train_loss": -35.65998840332031, "global_step": 57419, "epoch": 474} {"train_loss": -35.37726974487305, "global_step": 57420, "epoch": 474} {"train_loss": -35.3429069519043, "global_step": 57421, "epoch": 474} {"train_loss": -35.86054992675781, "global_step": 57422, "epoch": 474} {"train_loss": -35.03867721557617, "global_step": 57423, "epoch": 474} {"train_loss": -35.687049865722656, "global_step": 57424, "epoch": 474} {"train_loss": -35.31010055541992, "global_step": 57425, "epoch": 474} {"train_loss": -35.77208709716797, "global_step": 57426, "epoch": 474} {"train_loss": -36.063331604003906, "global_step": 57427, "epoch": 474} {"train_loss": -35.655487060546875, "global_step": 57428, "epoch": 474} {"train_loss": -35.92954635620117, "global_step": 57429, "epoch": 474} {"train_loss": -36.462005615234375, "global_step": 57430, "epoch": 474} {"train_loss": -36.0150260925293, "global_step": 57431, "epoch": 474} {"train_loss": -36.35137939453125, "global_step": 57432, "epoch": 474} {"train_loss": -36.545047760009766, "global_step": 57433, "epoch": 474} {"train_loss": -36.5804443359375, "global_step": 57434, "epoch": 474} {"train_loss": -36.278167724609375, "global_step": 57435, "epoch": 474} {"train_loss": -36.28723907470703, "global_step": 57436, "epoch": 474} {"train_loss": -36.22990798950195, "global_step": 57437, "epoch": 474} {"train_loss": -36.43378829956055, "global_step": 57438, "epoch": 474} {"train_loss": -36.41722869873047, "global_step": 57439, "epoch": 474} {"train_loss": -37.107173919677734, "global_step": 57440, "epoch": 474} {"train_loss": -36.2110481262207, "global_step": 57441, "epoch": 474} {"train_loss": -36.2443733215332, "global_step": 57442, "epoch": 474} {"train_loss": -36.03239059448242, "global_step": 57443, "epoch": 474} {"train_loss": -34.04862594604492, "global_step": 57444, "epoch": 474} {"train_loss": -33.73480987548828, "global_step": 57445, "epoch": 474} {"train_loss": -32.40962600708008, "global_step": 57446, "epoch": 474} {"train_loss": -31.040771484375, "global_step": 57447, "epoch": 474} {"train_loss": -31.786497116088867, "global_step": 57448, "epoch": 474} {"train_loss": -35.32444381713867, "global_step": 57449, "epoch": 474} {"train_loss": -36.8697624206543, "global_step": 57450, "epoch": 474} {"train_loss": -34.65851974487305, "global_step": 57451, "epoch": 474} {"train_loss": -35.65642547607422, "global_step": 57452, "epoch": 474} {"train_loss": -36.375545501708984, "global_step": 57453, "epoch": 474} {"train_loss": -35.31278610229492, "global_step": 57454, "epoch": 474} {"train_loss": -36.76481246948242, "global_step": 57455, "epoch": 474} {"train_loss": -35.340877532958984, "global_step": 57456, "epoch": 474} {"train_loss": -36.56709671020508, "global_step": 57457, "epoch": 474} {"train_loss": -36.65810012817383, "global_step": 57458, "epoch": 474} {"train_loss": -36.76182174682617, "global_step": 57459, "epoch": 474} {"train_loss": -36.8498649597168, "global_step": 57460, "epoch": 474} {"train_loss": -36.77246856689453, "global_step": 57461, "epoch": 474} {"train_loss": -36.3668098449707, "global_step": 57462, "epoch": 474} {"train_loss": -36.88616943359375, "global_step": 57463, "epoch": 474} {"train_loss": -35.85768508911133, "global_step": 57464, "epoch": 474} {"train_loss": -36.301918029785156, "global_step": 57465, "epoch": 474} {"train_loss": -36.602169036865234, "global_step": 57466, "epoch": 474} {"train_loss": -36.98862838745117, "global_step": 57467, "epoch": 474} {"train_loss": -35.9658203125, "global_step": 57468, "epoch": 474} {"train_loss": -36.520687103271484, "global_step": 57469, "epoch": 474} {"train_loss": -36.58060836791992, "global_step": 57470, "epoch": 474} {"train_loss": -36.68831253051758, "global_step": 57471, "epoch": 474} {"train_loss": -34.411529541015625, "global_step": 57472, "epoch": 474} {"train_loss": -36.10895919799805, "global_step": 57473, "epoch": 474} {"train_loss": -35.286884796520894, "global_step": 57474, "epoch": 474, "val_loss": 2485369.75} {"train_loss": -36.960567474365234, "global_step": 57475, "epoch": 475} {"train_loss": -36.14799880981445, "global_step": 57476, "epoch": 475} {"train_loss": -36.089759826660156, "global_step": 57477, "epoch": 475} {"train_loss": -35.077392578125, "global_step": 57478, "epoch": 475} {"train_loss": -34.1412239074707, "global_step": 57479, "epoch": 475} {"train_loss": -35.735633850097656, "global_step": 57480, "epoch": 475} {"train_loss": -36.095882415771484, "global_step": 57481, "epoch": 475} {"train_loss": -35.1767578125, "global_step": 57482, "epoch": 475} {"train_loss": -37.00984573364258, "global_step": 57483, "epoch": 475} {"train_loss": -36.28286361694336, "global_step": 57484, "epoch": 475} {"train_loss": -35.224578857421875, "global_step": 57485, "epoch": 475} {"train_loss": -35.83711624145508, "global_step": 57486, "epoch": 475} {"train_loss": -35.46670913696289, "global_step": 57487, "epoch": 475} {"train_loss": -35.562049865722656, "global_step": 57488, "epoch": 475} {"train_loss": -32.15543746948242, "global_step": 57489, "epoch": 475} {"train_loss": -29.489599227905273, "global_step": 57490, "epoch": 475} {"train_loss": -26.892541885375977, "global_step": 57491, "epoch": 475} {"train_loss": -30.542322158813477, "global_step": 57492, "epoch": 475} {"train_loss": -35.83960723876953, "global_step": 57493, "epoch": 475} {"train_loss": -31.726337432861328, "global_step": 57494, "epoch": 475} {"train_loss": -34.7108154296875, "global_step": 57495, "epoch": 475} {"train_loss": -33.9678955078125, "global_step": 57496, "epoch": 475} {"train_loss": -33.32558822631836, "global_step": 57497, "epoch": 475} {"train_loss": -35.148048400878906, "global_step": 57498, "epoch": 475} {"train_loss": -32.253780364990234, "global_step": 57499, "epoch": 475} {"train_loss": -35.15133285522461, "global_step": 57500, "epoch": 475} {"train_loss": -34.492977142333984, "global_step": 57501, "epoch": 475} {"train_loss": -34.300472259521484, "global_step": 57502, "epoch": 475} {"train_loss": -34.57281494140625, "global_step": 57503, "epoch": 475} {"train_loss": -33.898494720458984, "global_step": 57504, "epoch": 475} {"train_loss": -35.63020706176758, "global_step": 57505, "epoch": 475} {"train_loss": -34.658538818359375, "global_step": 57506, "epoch": 475} {"train_loss": -34.91718673706055, "global_step": 57507, "epoch": 475} {"train_loss": -35.02850341796875, "global_step": 57508, "epoch": 475} {"train_loss": -35.06886672973633, "global_step": 57509, "epoch": 475} {"train_loss": -34.90852737426758, "global_step": 57510, "epoch": 475} {"train_loss": -34.930580139160156, "global_step": 57511, "epoch": 475} {"train_loss": -34.66677474975586, "global_step": 57512, "epoch": 475} {"train_loss": -32.60879135131836, "global_step": 57513, "epoch": 475} {"train_loss": -34.68027877807617, "global_step": 57514, "epoch": 475} {"train_loss": -36.15376281738281, "global_step": 57515, "epoch": 475} {"train_loss": -34.236167907714844, "global_step": 57516, "epoch": 475} {"train_loss": -34.810035705566406, "global_step": 57517, "epoch": 475} {"train_loss": -35.20756530761719, "global_step": 57518, "epoch": 475} {"train_loss": -35.28413772583008, "global_step": 57519, "epoch": 475} {"train_loss": -35.580810546875, "global_step": 57520, "epoch": 475} {"train_loss": -35.766902923583984, "global_step": 57521, "epoch": 475} {"train_loss": -36.0455207824707, "global_step": 57522, "epoch": 475} {"train_loss": -35.54670333862305, "global_step": 57523, "epoch": 475} {"train_loss": -36.062007904052734, "global_step": 57524, "epoch": 475} {"train_loss": -35.5018196105957, "global_step": 57525, "epoch": 475} {"train_loss": -35.78737258911133, "global_step": 57526, "epoch": 475} {"train_loss": -35.27348709106445, "global_step": 57527, "epoch": 475} {"train_loss": -35.8513298034668, "global_step": 57528, "epoch": 475} {"train_loss": -35.945919036865234, "global_step": 57529, "epoch": 475} {"train_loss": -36.050697326660156, "global_step": 57530, "epoch": 475} {"train_loss": -35.833492279052734, "global_step": 57531, "epoch": 475} {"train_loss": -35.604793548583984, "global_step": 57532, "epoch": 475} {"train_loss": -35.739830017089844, "global_step": 57533, "epoch": 475} {"train_loss": -35.72285079956055, "global_step": 57534, "epoch": 475} {"train_loss": -35.386837005615234, "global_step": 57535, "epoch": 475} {"train_loss": -35.9268798828125, "global_step": 57536, "epoch": 475} {"train_loss": -36.29281997680664, "global_step": 57537, "epoch": 475} {"train_loss": -35.48283767700195, "global_step": 57538, "epoch": 475} {"train_loss": -35.58991622924805, "global_step": 57539, "epoch": 475} {"train_loss": -35.7242431640625, "global_step": 57540, "epoch": 475} {"train_loss": -35.994876861572266, "global_step": 57541, "epoch": 475} {"train_loss": -36.23466110229492, "global_step": 57542, "epoch": 475} {"train_loss": -36.50587844848633, "global_step": 57543, "epoch": 475} {"train_loss": -36.059383392333984, "global_step": 57544, "epoch": 475} {"train_loss": -36.23115158081055, "global_step": 57545, "epoch": 475} {"train_loss": -34.82528305053711, "global_step": 57546, "epoch": 475} {"train_loss": -35.93872833251953, "global_step": 57547, "epoch": 475} {"train_loss": -36.1611442565918, "global_step": 57548, "epoch": 475} {"train_loss": -36.4729118347168, "global_step": 57549, "epoch": 475} {"train_loss": -36.84619903564453, "global_step": 57550, "epoch": 475} {"train_loss": -35.71162796020508, "global_step": 57551, "epoch": 475} {"train_loss": -35.007015228271484, "global_step": 57552, "epoch": 475} {"train_loss": -36.46735763549805, "global_step": 57553, "epoch": 475} {"train_loss": -35.18732452392578, "global_step": 57554, "epoch": 475} {"train_loss": -33.68865203857422, "global_step": 57555, "epoch": 475} {"train_loss": -35.192134857177734, "global_step": 57556, "epoch": 475} {"train_loss": -33.89396286010742, "global_step": 57557, "epoch": 475} {"train_loss": -34.9994010925293, "global_step": 57558, "epoch": 475} {"train_loss": -34.68550491333008, "global_step": 57559, "epoch": 475} {"train_loss": -34.16782760620117, "global_step": 57560, "epoch": 475} {"train_loss": -34.95621109008789, "global_step": 57561, "epoch": 475} {"train_loss": -36.22197341918945, "global_step": 57562, "epoch": 475} {"train_loss": -34.96821212768555, "global_step": 57563, "epoch": 475} {"train_loss": -35.60600662231445, "global_step": 57564, "epoch": 475} {"train_loss": -34.66856002807617, "global_step": 57565, "epoch": 475} {"train_loss": -36.18910598754883, "global_step": 57566, "epoch": 475} {"train_loss": -34.90088653564453, "global_step": 57567, "epoch": 475} {"train_loss": -34.702308654785156, "global_step": 57568, "epoch": 475} {"train_loss": -35.1572151184082, "global_step": 57569, "epoch": 475} {"train_loss": -36.561336517333984, "global_step": 57570, "epoch": 475} {"train_loss": -34.6989631652832, "global_step": 57571, "epoch": 475} {"train_loss": -36.0385856628418, "global_step": 57572, "epoch": 475} {"train_loss": -35.664920806884766, "global_step": 57573, "epoch": 475} {"train_loss": -35.1887321472168, "global_step": 57574, "epoch": 475} {"train_loss": -36.02888107299805, "global_step": 57575, "epoch": 475} {"train_loss": -34.647422790527344, "global_step": 57576, "epoch": 475} {"train_loss": -34.45414733886719, "global_step": 57577, "epoch": 475} {"train_loss": -36.278926849365234, "global_step": 57578, "epoch": 475} {"train_loss": -35.17824935913086, "global_step": 57579, "epoch": 475} {"train_loss": -36.30343246459961, "global_step": 57580, "epoch": 475} {"train_loss": -34.01952362060547, "global_step": 57581, "epoch": 475} {"train_loss": -36.306087493896484, "global_step": 57582, "epoch": 475} {"train_loss": -34.70180130004883, "global_step": 57583, "epoch": 475} {"train_loss": -35.596343994140625, "global_step": 57584, "epoch": 475} {"train_loss": -35.850250244140625, "global_step": 57585, "epoch": 475} {"train_loss": -35.4061164855957, "global_step": 57586, "epoch": 475} {"train_loss": -34.6346321105957, "global_step": 57587, "epoch": 475} {"train_loss": -36.0208854675293, "global_step": 57588, "epoch": 475} {"train_loss": -34.008827209472656, "global_step": 57589, "epoch": 475} {"train_loss": -34.21798324584961, "global_step": 57590, "epoch": 475} {"train_loss": -31.935693740844727, "global_step": 57591, "epoch": 475} {"train_loss": -29.79578971862793, "global_step": 57592, "epoch": 475} {"train_loss": -27.069055557250977, "global_step": 57593, "epoch": 475} {"train_loss": -29.378576278686523, "global_step": 57594, "epoch": 475} {"train_loss": -34.908942466925, "global_step": 57595, "epoch": 475, "val_loss": 2506898.5} {"train_loss": -33.5128059387207, "global_step": 57596, "epoch": 476} {"train_loss": -32.03445053100586, "global_step": 57597, "epoch": 476} {"train_loss": -31.092731475830078, "global_step": 57598, "epoch": 476} {"train_loss": -33.81191635131836, "global_step": 57599, "epoch": 476} {"train_loss": -33.49650955200195, "global_step": 57600, "epoch": 476} {"train_loss": -34.99163818359375, "global_step": 57601, "epoch": 476} {"train_loss": -31.95355224609375, "global_step": 57602, "epoch": 476} {"train_loss": -33.72178268432617, "global_step": 57603, "epoch": 476} {"train_loss": -34.8392448425293, "global_step": 57604, "epoch": 476} {"train_loss": -34.920040130615234, "global_step": 57605, "epoch": 476} {"train_loss": -33.85366439819336, "global_step": 57606, "epoch": 476} {"train_loss": -35.3376579284668, "global_step": 57607, "epoch": 476} {"train_loss": -34.38734817504883, "global_step": 57608, "epoch": 476} {"train_loss": -35.05308532714844, "global_step": 57609, "epoch": 476} {"train_loss": -34.573482513427734, "global_step": 57610, "epoch": 476} {"train_loss": -34.79653549194336, "global_step": 57611, "epoch": 476} {"train_loss": -35.21946334838867, "global_step": 57612, "epoch": 476} {"train_loss": -35.3871955871582, "global_step": 57613, "epoch": 476} {"train_loss": -35.39970016479492, "global_step": 57614, "epoch": 476} {"train_loss": -35.42580795288086, "global_step": 57615, "epoch": 476} {"train_loss": -35.53475570678711, "global_step": 57616, "epoch": 476} {"train_loss": -35.12582015991211, "global_step": 57617, "epoch": 476} {"train_loss": -34.68553161621094, "global_step": 57618, "epoch": 476} {"train_loss": -35.71787643432617, "global_step": 57619, "epoch": 476} {"train_loss": -36.09465408325195, "global_step": 57620, "epoch": 476} {"train_loss": -34.91268539428711, "global_step": 57621, "epoch": 476} {"train_loss": -35.08356475830078, "global_step": 57622, "epoch": 476} {"train_loss": -34.54207229614258, "global_step": 57623, "epoch": 476} {"train_loss": -35.87252426147461, "global_step": 57624, "epoch": 476} {"train_loss": -36.039669036865234, "global_step": 57625, "epoch": 476} {"train_loss": -35.37679672241211, "global_step": 57626, "epoch": 476} {"train_loss": -36.04112243652344, "global_step": 57627, "epoch": 476} {"train_loss": -35.605384826660156, "global_step": 57628, "epoch": 476} {"train_loss": -35.514251708984375, "global_step": 57629, "epoch": 476} {"train_loss": -36.03743362426758, "global_step": 57630, "epoch": 476} {"train_loss": -36.0228157043457, "global_step": 57631, "epoch": 476} {"train_loss": -35.7161865234375, "global_step": 57632, "epoch": 476} {"train_loss": -36.215396881103516, "global_step": 57633, "epoch": 476} {"train_loss": -36.22654342651367, "global_step": 57634, "epoch": 476} {"train_loss": -35.259246826171875, "global_step": 57635, "epoch": 476} {"train_loss": -35.93378448486328, "global_step": 57636, "epoch": 476} {"train_loss": -36.29679870605469, "global_step": 57637, "epoch": 476} {"train_loss": -35.877166748046875, "global_step": 57638, "epoch": 476} {"train_loss": -35.846954345703125, "global_step": 57639, "epoch": 476} {"train_loss": -36.54948425292969, "global_step": 57640, "epoch": 476} {"train_loss": -36.64516067504883, "global_step": 57641, "epoch": 476} {"train_loss": -36.62699508666992, "global_step": 57642, "epoch": 476} {"train_loss": -36.302093505859375, "global_step": 57643, "epoch": 476} {"train_loss": -35.88419723510742, "global_step": 57644, "epoch": 476} {"train_loss": -36.617374420166016, "global_step": 57645, "epoch": 476} {"train_loss": -36.44868469238281, "global_step": 57646, "epoch": 476} {"train_loss": -36.58567428588867, "global_step": 57647, "epoch": 476} {"train_loss": -36.314510345458984, "global_step": 57648, "epoch": 476} {"train_loss": -36.968536376953125, "global_step": 57649, "epoch": 476} {"train_loss": -35.78922653198242, "global_step": 57650, "epoch": 476} {"train_loss": -36.53615951538086, "global_step": 57651, "epoch": 476} {"train_loss": -36.78165817260742, "global_step": 57652, "epoch": 476} {"train_loss": -36.16115951538086, "global_step": 57653, "epoch": 476} {"train_loss": -36.62421798706055, "global_step": 57654, "epoch": 476} {"train_loss": -36.35630798339844, "global_step": 57655, "epoch": 476} {"train_loss": -36.66499710083008, "global_step": 57656, "epoch": 476} {"train_loss": -36.72270965576172, "global_step": 57657, "epoch": 476} {"train_loss": -36.65753173828125, "global_step": 57658, "epoch": 476} {"train_loss": -35.68178176879883, "global_step": 57659, "epoch": 476} {"train_loss": -36.325374603271484, "global_step": 57660, "epoch": 476} {"train_loss": -36.045936584472656, "global_step": 57661, "epoch": 476} {"train_loss": -36.53535079956055, "global_step": 57662, "epoch": 476} {"train_loss": -36.675086975097656, "global_step": 57663, "epoch": 476} {"train_loss": -36.35721969604492, "global_step": 57664, "epoch": 476} {"train_loss": -36.102474212646484, "global_step": 57665, "epoch": 476} {"train_loss": -35.659576416015625, "global_step": 57666, "epoch": 476} {"train_loss": -32.723934173583984, "global_step": 57667, "epoch": 476} {"train_loss": -24.451744079589844, "global_step": 57668, "epoch": 476} {"train_loss": -18.31462860107422, "global_step": 57669, "epoch": 476} {"train_loss": -23.21577262878418, "global_step": 57670, "epoch": 476} {"train_loss": -35.39581298828125, "global_step": 57671, "epoch": 476} {"train_loss": -29.298599243164062, "global_step": 57672, "epoch": 476} {"train_loss": -27.474180221557617, "global_step": 57673, "epoch": 476} {"train_loss": -35.37385559082031, "global_step": 57674, "epoch": 476} {"train_loss": -31.675704956054688, "global_step": 57675, "epoch": 476} {"train_loss": -34.82469940185547, "global_step": 57676, "epoch": 476} {"train_loss": -34.201690673828125, "global_step": 57677, "epoch": 476} {"train_loss": -33.60951232910156, "global_step": 57678, "epoch": 476} {"train_loss": -36.28679275512695, "global_step": 57679, "epoch": 476} {"train_loss": -33.42667007446289, "global_step": 57680, "epoch": 476} {"train_loss": -36.2271842956543, "global_step": 57681, "epoch": 476} {"train_loss": -34.518428802490234, "global_step": 57682, "epoch": 476} {"train_loss": -35.473426818847656, "global_step": 57683, "epoch": 476} {"train_loss": -35.377925872802734, "global_step": 57684, "epoch": 476} {"train_loss": -35.74654769897461, "global_step": 57685, "epoch": 476} {"train_loss": -35.2811279296875, "global_step": 57686, "epoch": 476} {"train_loss": -36.228858947753906, "global_step": 57687, "epoch": 476} {"train_loss": -35.734500885009766, "global_step": 57688, "epoch": 476} {"train_loss": -35.94111251831055, "global_step": 57689, "epoch": 476} {"train_loss": -36.17549514770508, "global_step": 57690, "epoch": 476} {"train_loss": -36.29055404663086, "global_step": 57691, "epoch": 476} {"train_loss": -35.83826446533203, "global_step": 57692, "epoch": 476} {"train_loss": -35.87987518310547, "global_step": 57693, "epoch": 476} {"train_loss": -36.5415153503418, "global_step": 57694, "epoch": 476} {"train_loss": -36.14216613769531, "global_step": 57695, "epoch": 476} {"train_loss": -35.85578536987305, "global_step": 57696, "epoch": 476} {"train_loss": -35.2530403137207, "global_step": 57697, "epoch": 476} {"train_loss": -36.191383361816406, "global_step": 57698, "epoch": 476} {"train_loss": -36.20134353637695, "global_step": 57699, "epoch": 476} {"train_loss": -36.27946090698242, "global_step": 57700, "epoch": 476} {"train_loss": -36.24860382080078, "global_step": 57701, "epoch": 476} {"train_loss": -36.284889221191406, "global_step": 57702, "epoch": 476} {"train_loss": -35.99922561645508, "global_step": 57703, "epoch": 476} {"train_loss": -34.63743209838867, "global_step": 57704, "epoch": 476} {"train_loss": -35.48826599121094, "global_step": 57705, "epoch": 476} {"train_loss": -36.09543228149414, "global_step": 57706, "epoch": 476} {"train_loss": -35.638423919677734, "global_step": 57707, "epoch": 476} {"train_loss": -35.987056732177734, "global_step": 57708, "epoch": 476} {"train_loss": -35.27341842651367, "global_step": 57709, "epoch": 476} {"train_loss": -36.200435638427734, "global_step": 57710, "epoch": 476} {"train_loss": -36.600013732910156, "global_step": 57711, "epoch": 476} {"train_loss": -36.6073112487793, "global_step": 57712, "epoch": 476} {"train_loss": -36.433868408203125, "global_step": 57713, "epoch": 476} {"train_loss": -36.80462646484375, "global_step": 57714, "epoch": 476} {"train_loss": -36.881412506103516, "global_step": 57715, "epoch": 476} {"train_loss": -35.09928402230759, "global_step": 57716, "epoch": 476, "val_loss": 2510220.25} {"train_loss": -36.6754035949707, "global_step": 57717, "epoch": 477} {"train_loss": -36.24750900268555, "global_step": 57718, "epoch": 477} {"train_loss": -36.50393295288086, "global_step": 57719, "epoch": 477} {"train_loss": -36.7620849609375, "global_step": 57720, "epoch": 477} {"train_loss": -35.718170166015625, "global_step": 57721, "epoch": 477} {"train_loss": -36.23965072631836, "global_step": 57722, "epoch": 477} {"train_loss": -36.636226654052734, "global_step": 57723, "epoch": 477} {"train_loss": -36.71102523803711, "global_step": 57724, "epoch": 477} {"train_loss": -36.982723236083984, "global_step": 57725, "epoch": 477} {"train_loss": -36.382080078125, "global_step": 57726, "epoch": 477} {"train_loss": -36.493831634521484, "global_step": 57727, "epoch": 477} {"train_loss": -35.7764778137207, "global_step": 57728, "epoch": 477} {"train_loss": -36.7032356262207, "global_step": 57729, "epoch": 477} {"train_loss": -35.94626998901367, "global_step": 57730, "epoch": 477} {"train_loss": -35.44442367553711, "global_step": 57731, "epoch": 477} {"train_loss": -35.00202560424805, "global_step": 57732, "epoch": 477} {"train_loss": -35.8905143737793, "global_step": 57733, "epoch": 477} {"train_loss": -35.96929931640625, "global_step": 57734, "epoch": 477} {"train_loss": -36.501197814941406, "global_step": 57735, "epoch": 477} {"train_loss": -35.7601318359375, "global_step": 57736, "epoch": 477} {"train_loss": -33.51353073120117, "global_step": 57737, "epoch": 477} {"train_loss": -32.93548583984375, "global_step": 57738, "epoch": 477} {"train_loss": -33.43758773803711, "global_step": 57739, "epoch": 477} {"train_loss": -35.09061813354492, "global_step": 57740, "epoch": 477} {"train_loss": -34.5750846862793, "global_step": 57741, "epoch": 477} {"train_loss": -30.253793716430664, "global_step": 57742, "epoch": 477} {"train_loss": -33.846046447753906, "global_step": 57743, "epoch": 477} {"train_loss": -34.12588119506836, "global_step": 57744, "epoch": 477} {"train_loss": -36.00835418701172, "global_step": 57745, "epoch": 477} {"train_loss": -34.4780158996582, "global_step": 57746, "epoch": 477} {"train_loss": -35.26164627075195, "global_step": 57747, "epoch": 477} {"train_loss": -35.747432708740234, "global_step": 57748, "epoch": 477} {"train_loss": -34.512020111083984, "global_step": 57749, "epoch": 477} {"train_loss": -36.363338470458984, "global_step": 57750, "epoch": 477} {"train_loss": -35.604793548583984, "global_step": 57751, "epoch": 477} {"train_loss": -34.31026077270508, "global_step": 57752, "epoch": 477} {"train_loss": -33.21855163574219, "global_step": 57753, "epoch": 477} {"train_loss": -35.97817611694336, "global_step": 57754, "epoch": 477} {"train_loss": -34.15620803833008, "global_step": 57755, "epoch": 477} {"train_loss": -35.48723602294922, "global_step": 57756, "epoch": 477} {"train_loss": -33.801551818847656, "global_step": 57757, "epoch": 477} {"train_loss": -35.442745208740234, "global_step": 57758, "epoch": 477} {"train_loss": -34.6834602355957, "global_step": 57759, "epoch": 477} {"train_loss": -35.02116012573242, "global_step": 57760, "epoch": 477} {"train_loss": -32.63262176513672, "global_step": 57761, "epoch": 477} {"train_loss": -34.32673645019531, "global_step": 57762, "epoch": 477} {"train_loss": -34.96730422973633, "global_step": 57763, "epoch": 477} {"train_loss": -34.27357482910156, "global_step": 57764, "epoch": 477} {"train_loss": -33.949073791503906, "global_step": 57765, "epoch": 477} {"train_loss": -34.69593048095703, "global_step": 57766, "epoch": 477} {"train_loss": -33.746620178222656, "global_step": 57767, "epoch": 477} {"train_loss": -35.38240051269531, "global_step": 57768, "epoch": 477} {"train_loss": -34.647335052490234, "global_step": 57769, "epoch": 477} {"train_loss": -35.657257080078125, "global_step": 57770, "epoch": 477} {"train_loss": -33.90690231323242, "global_step": 57771, "epoch": 477} {"train_loss": -33.91134262084961, "global_step": 57772, "epoch": 477} {"train_loss": -30.543310165405273, "global_step": 57773, "epoch": 477} {"train_loss": -25.065044403076172, "global_step": 57774, "epoch": 477} {"train_loss": -28.119352340698242, "global_step": 57775, "epoch": 477} {"train_loss": -34.115501403808594, "global_step": 57776, "epoch": 477} {"train_loss": -33.5869026184082, "global_step": 57777, "epoch": 477} {"train_loss": -26.25864028930664, "global_step": 57778, "epoch": 477} {"train_loss": -32.395870208740234, "global_step": 57779, "epoch": 477} {"train_loss": -34.56622314453125, "global_step": 57780, "epoch": 477} {"train_loss": -33.81877517700195, "global_step": 57781, "epoch": 477} {"train_loss": -34.90930938720703, "global_step": 57782, "epoch": 477} {"train_loss": -34.59969711303711, "global_step": 57783, "epoch": 477} {"train_loss": -34.01942825317383, "global_step": 57784, "epoch": 477} {"train_loss": -34.735191345214844, "global_step": 57785, "epoch": 477} {"train_loss": -34.16096878051758, "global_step": 57786, "epoch": 477} {"train_loss": -34.84077835083008, "global_step": 57787, "epoch": 477} {"train_loss": -35.113338470458984, "global_step": 57788, "epoch": 477} {"train_loss": -34.644622802734375, "global_step": 57789, "epoch": 477} {"train_loss": -34.88279342651367, "global_step": 57790, "epoch": 477} {"train_loss": -34.6762580871582, "global_step": 57791, "epoch": 477} {"train_loss": -34.7811164855957, "global_step": 57792, "epoch": 477} {"train_loss": -35.786495208740234, "global_step": 57793, "epoch": 477} {"train_loss": -34.29340744018555, "global_step": 57794, "epoch": 477} {"train_loss": -35.20998764038086, "global_step": 57795, "epoch": 477} {"train_loss": -35.37578582763672, "global_step": 57796, "epoch": 477} {"train_loss": -34.82981491088867, "global_step": 57797, "epoch": 477} {"train_loss": -35.171138763427734, "global_step": 57798, "epoch": 477} {"train_loss": -35.881126403808594, "global_step": 57799, "epoch": 477} {"train_loss": -35.27066421508789, "global_step": 57800, "epoch": 477} {"train_loss": -35.84611129760742, "global_step": 57801, "epoch": 477} {"train_loss": -35.60869216918945, "global_step": 57802, "epoch": 477} {"train_loss": -35.43190002441406, "global_step": 57803, "epoch": 477} {"train_loss": -35.59517288208008, "global_step": 57804, "epoch": 477} {"train_loss": -35.82466506958008, "global_step": 57805, "epoch": 477} {"train_loss": -36.20184326171875, "global_step": 57806, "epoch": 477} {"train_loss": -35.93262481689453, "global_step": 57807, "epoch": 477} {"train_loss": -36.12775802612305, "global_step": 57808, "epoch": 477} {"train_loss": -36.201717376708984, "global_step": 57809, "epoch": 477} {"train_loss": -35.80194091796875, "global_step": 57810, "epoch": 477} {"train_loss": -35.85547637939453, "global_step": 57811, "epoch": 477} {"train_loss": -35.362003326416016, "global_step": 57812, "epoch": 477} {"train_loss": -35.7952995300293, "global_step": 57813, "epoch": 477} {"train_loss": -36.31256103515625, "global_step": 57814, "epoch": 477} {"train_loss": -35.89054489135742, "global_step": 57815, "epoch": 477} {"train_loss": -36.22011947631836, "global_step": 57816, "epoch": 477} {"train_loss": -35.57646560668945, "global_step": 57817, "epoch": 477} {"train_loss": -36.42987060546875, "global_step": 57818, "epoch": 477} {"train_loss": -36.08320617675781, "global_step": 57819, "epoch": 477} {"train_loss": -36.315513610839844, "global_step": 57820, "epoch": 477} {"train_loss": -36.47095489501953, "global_step": 57821, "epoch": 477} {"train_loss": -35.89235305786133, "global_step": 57822, "epoch": 477} {"train_loss": -36.07050323486328, "global_step": 57823, "epoch": 477} {"train_loss": -36.63827133178711, "global_step": 57824, "epoch": 477} {"train_loss": -35.803279876708984, "global_step": 57825, "epoch": 477} {"train_loss": -36.56184768676758, "global_step": 57826, "epoch": 477} {"train_loss": -36.39129638671875, "global_step": 57827, "epoch": 477} {"train_loss": -36.312843322753906, "global_step": 57828, "epoch": 477} {"train_loss": -35.7667350769043, "global_step": 57829, "epoch": 477} {"train_loss": -36.718040466308594, "global_step": 57830, "epoch": 477} {"train_loss": -34.4256477355957, "global_step": 57831, "epoch": 477} {"train_loss": -35.784393310546875, "global_step": 57832, "epoch": 477} {"train_loss": -35.9942512512207, "global_step": 57833, "epoch": 477} {"train_loss": -35.30084991455078, "global_step": 57834, "epoch": 477} {"train_loss": -34.96647262573242, "global_step": 57835, "epoch": 477} {"train_loss": -33.39501953125, "global_step": 57836, "epoch": 477} {"train_loss": -34.96132863257542, "global_step": 57837, "epoch": 477, "val_loss": 2614869.0} {"train_loss": -33.67692565917969, "global_step": 57838, "epoch": 478} {"train_loss": -35.37911605834961, "global_step": 57839, "epoch": 478} {"train_loss": -35.9633903503418, "global_step": 57840, "epoch": 478} {"train_loss": -35.095577239990234, "global_step": 57841, "epoch": 478} {"train_loss": -35.81087112426758, "global_step": 57842, "epoch": 478} {"train_loss": -32.8616943359375, "global_step": 57843, "epoch": 478} {"train_loss": -35.496585845947266, "global_step": 57844, "epoch": 478} {"train_loss": -35.16351318359375, "global_step": 57845, "epoch": 478} {"train_loss": -35.84556198120117, "global_step": 57846, "epoch": 478} {"train_loss": -35.50013732910156, "global_step": 57847, "epoch": 478} {"train_loss": -35.37908935546875, "global_step": 57848, "epoch": 478} {"train_loss": -34.97537612915039, "global_step": 57849, "epoch": 478} {"train_loss": -35.478065490722656, "global_step": 57850, "epoch": 478} {"train_loss": -35.710838317871094, "global_step": 57851, "epoch": 478} {"train_loss": -34.730342864990234, "global_step": 57852, "epoch": 478} {"train_loss": -34.976600646972656, "global_step": 57853, "epoch": 478} {"train_loss": -34.9841423034668, "global_step": 57854, "epoch": 478} {"train_loss": -35.43596649169922, "global_step": 57855, "epoch": 478} {"train_loss": -35.39866256713867, "global_step": 57856, "epoch": 478} {"train_loss": -35.5372314453125, "global_step": 57857, "epoch": 478} {"train_loss": -34.87321853637695, "global_step": 57858, "epoch": 478} {"train_loss": -35.60079574584961, "global_step": 57859, "epoch": 478} {"train_loss": -35.079166412353516, "global_step": 57860, "epoch": 478} {"train_loss": -35.50215148925781, "global_step": 57861, "epoch": 478} {"train_loss": -34.9791259765625, "global_step": 57862, "epoch": 478} {"train_loss": -35.96356201171875, "global_step": 57863, "epoch": 478} {"train_loss": -36.07601547241211, "global_step": 57864, "epoch": 478} {"train_loss": -36.08098220825195, "global_step": 57865, "epoch": 478} {"train_loss": -35.674468994140625, "global_step": 57866, "epoch": 478} {"train_loss": -35.66469955444336, "global_step": 57867, "epoch": 478} {"train_loss": -36.195186614990234, "global_step": 57868, "epoch": 478} {"train_loss": -36.251564025878906, "global_step": 57869, "epoch": 478} {"train_loss": -35.719783782958984, "global_step": 57870, "epoch": 478} {"train_loss": -36.12892532348633, "global_step": 57871, "epoch": 478} {"train_loss": -35.765933990478516, "global_step": 57872, "epoch": 478} {"train_loss": -36.10287094116211, "global_step": 57873, "epoch": 478} {"train_loss": -35.24488830566406, "global_step": 57874, "epoch": 478} {"train_loss": -34.92681121826172, "global_step": 57875, "epoch": 478} {"train_loss": -35.435157775878906, "global_step": 57876, "epoch": 478} {"train_loss": -35.26931381225586, "global_step": 57877, "epoch": 478} {"train_loss": -36.0931510925293, "global_step": 57878, "epoch": 478} {"train_loss": -35.323970794677734, "global_step": 57879, "epoch": 478} {"train_loss": -35.60957336425781, "global_step": 57880, "epoch": 478} {"train_loss": -35.605812072753906, "global_step": 57881, "epoch": 478} {"train_loss": -35.793609619140625, "global_step": 57882, "epoch": 478} {"train_loss": -36.01681137084961, "global_step": 57883, "epoch": 478} {"train_loss": -36.403236389160156, "global_step": 57884, "epoch": 478} {"train_loss": -35.55810546875, "global_step": 57885, "epoch": 478} {"train_loss": -35.473384857177734, "global_step": 57886, "epoch": 478} {"train_loss": -36.05656433105469, "global_step": 57887, "epoch": 478} {"train_loss": -36.218570709228516, "global_step": 57888, "epoch": 478} {"train_loss": -35.31277847290039, "global_step": 57889, "epoch": 478} {"train_loss": -35.838417053222656, "global_step": 57890, "epoch": 478} {"train_loss": -35.61246871948242, "global_step": 57891, "epoch": 478} {"train_loss": -36.41923141479492, "global_step": 57892, "epoch": 478} {"train_loss": -34.763427734375, "global_step": 57893, "epoch": 478} {"train_loss": -35.452056884765625, "global_step": 57894, "epoch": 478} {"train_loss": -36.277076721191406, "global_step": 57895, "epoch": 478} {"train_loss": -35.22067642211914, "global_step": 57896, "epoch": 478} {"train_loss": -35.525997161865234, "global_step": 57897, "epoch": 478} {"train_loss": -36.316261291503906, "global_step": 57898, "epoch": 478} {"train_loss": -34.700828552246094, "global_step": 57899, "epoch": 478} {"train_loss": -35.829532623291016, "global_step": 57900, "epoch": 478} {"train_loss": -35.95878601074219, "global_step": 57901, "epoch": 478} {"train_loss": -35.308837890625, "global_step": 57902, "epoch": 478} {"train_loss": -35.977054595947266, "global_step": 57903, "epoch": 478} {"train_loss": -36.21664047241211, "global_step": 57904, "epoch": 478} {"train_loss": -36.62704086303711, "global_step": 57905, "epoch": 478} {"train_loss": -35.912601470947266, "global_step": 57906, "epoch": 478} {"train_loss": -35.58388137817383, "global_step": 57907, "epoch": 478} {"train_loss": -36.04185104370117, "global_step": 57908, "epoch": 478} {"train_loss": -36.00338363647461, "global_step": 57909, "epoch": 478} {"train_loss": -36.2753791809082, "global_step": 57910, "epoch": 478} {"train_loss": -36.17605209350586, "global_step": 57911, "epoch": 478} {"train_loss": -36.76945495605469, "global_step": 57912, "epoch": 478} {"train_loss": -36.41682815551758, "global_step": 57913, "epoch": 478} {"train_loss": -36.43590545654297, "global_step": 57914, "epoch": 478} {"train_loss": -36.37427520751953, "global_step": 57915, "epoch": 478} {"train_loss": -36.44795227050781, "global_step": 57916, "epoch": 478} {"train_loss": -35.95927810668945, "global_step": 57917, "epoch": 478} {"train_loss": -36.151790618896484, "global_step": 57918, "epoch": 478} {"train_loss": -36.580963134765625, "global_step": 57919, "epoch": 478} {"train_loss": -36.231483459472656, "global_step": 57920, "epoch": 478} {"train_loss": -36.33193588256836, "global_step": 57921, "epoch": 478} {"train_loss": -36.26351547241211, "global_step": 57922, "epoch": 478} {"train_loss": -35.29706573486328, "global_step": 57923, "epoch": 478} {"train_loss": -35.724884033203125, "global_step": 57924, "epoch": 478} {"train_loss": -36.22758102416992, "global_step": 57925, "epoch": 478} {"train_loss": -36.48796463012695, "global_step": 57926, "epoch": 478} {"train_loss": -34.807586669921875, "global_step": 57927, "epoch": 478} {"train_loss": -34.659149169921875, "global_step": 57928, "epoch": 478} {"train_loss": -36.881996154785156, "global_step": 57929, "epoch": 478} {"train_loss": -33.82009506225586, "global_step": 57930, "epoch": 478} {"train_loss": -36.56205368041992, "global_step": 57931, "epoch": 478} {"train_loss": -35.165122985839844, "global_step": 57932, "epoch": 478} {"train_loss": -34.58476257324219, "global_step": 57933, "epoch": 478} {"train_loss": -36.05356979370117, "global_step": 57934, "epoch": 478} {"train_loss": -33.758644104003906, "global_step": 57935, "epoch": 478} {"train_loss": -36.40650177001953, "global_step": 57936, "epoch": 478} {"train_loss": -36.305477142333984, "global_step": 57937, "epoch": 478} {"train_loss": -34.97402572631836, "global_step": 57938, "epoch": 478} {"train_loss": -35.421382904052734, "global_step": 57939, "epoch": 478} {"train_loss": -34.72883224487305, "global_step": 57940, "epoch": 478} {"train_loss": -36.13793182373047, "global_step": 57941, "epoch": 478} {"train_loss": -34.6318244934082, "global_step": 57942, "epoch": 478} {"train_loss": -35.9395866394043, "global_step": 57943, "epoch": 478} {"train_loss": -36.03298568725586, "global_step": 57944, "epoch": 478} {"train_loss": -36.33477783203125, "global_step": 57945, "epoch": 478} {"train_loss": -36.554298400878906, "global_step": 57946, "epoch": 478} {"train_loss": -36.41529846191406, "global_step": 57947, "epoch": 478} {"train_loss": -34.783485412597656, "global_step": 57948, "epoch": 478} {"train_loss": -36.307777404785156, "global_step": 57949, "epoch": 478} {"train_loss": -35.39435958862305, "global_step": 57950, "epoch": 478} {"train_loss": -35.75714111328125, "global_step": 57951, "epoch": 478} {"train_loss": -34.1802978515625, "global_step": 57952, "epoch": 478} {"train_loss": -34.71586990356445, "global_step": 57953, "epoch": 478} {"train_loss": -35.834129333496094, "global_step": 57954, "epoch": 478} {"train_loss": -35.250091552734375, "global_step": 57955, "epoch": 478} {"train_loss": -34.84975051879883, "global_step": 57956, "epoch": 478} {"train_loss": -34.63424301147461, "global_step": 57957, "epoch": 478} {"train_loss": -35.622059246725286, "global_step": 57958, "epoch": 478, "val_loss": 2529425.75} {"train_loss": -35.137298583984375, "global_step": 57959, "epoch": 479} {"train_loss": -34.72004318237305, "global_step": 57960, "epoch": 479} {"train_loss": -34.933773040771484, "global_step": 57961, "epoch": 479} {"train_loss": -32.89374923706055, "global_step": 57962, "epoch": 479} {"train_loss": -33.393310546875, "global_step": 57963, "epoch": 479} {"train_loss": -34.55769348144531, "global_step": 57964, "epoch": 479} {"train_loss": -35.96698760986328, "global_step": 57965, "epoch": 479} {"train_loss": -33.89053726196289, "global_step": 57966, "epoch": 479} {"train_loss": -33.906005859375, "global_step": 57967, "epoch": 479} {"train_loss": -35.85179901123047, "global_step": 57968, "epoch": 479} {"train_loss": -35.43496322631836, "global_step": 57969, "epoch": 479} {"train_loss": -35.38375473022461, "global_step": 57970, "epoch": 479} {"train_loss": -34.651206970214844, "global_step": 57971, "epoch": 479} {"train_loss": -36.28094482421875, "global_step": 57972, "epoch": 479} {"train_loss": -35.46866989135742, "global_step": 57973, "epoch": 479} {"train_loss": -35.97303009033203, "global_step": 57974, "epoch": 479} {"train_loss": -36.411460876464844, "global_step": 57975, "epoch": 479} {"train_loss": -35.78589630126953, "global_step": 57976, "epoch": 479} {"train_loss": -35.65339279174805, "global_step": 57977, "epoch": 479} {"train_loss": -35.7917366027832, "global_step": 57978, "epoch": 479} {"train_loss": -35.6219596862793, "global_step": 57979, "epoch": 479} {"train_loss": -35.584896087646484, "global_step": 57980, "epoch": 479} {"train_loss": -36.17655563354492, "global_step": 57981, "epoch": 479} {"train_loss": -35.558223724365234, "global_step": 57982, "epoch": 479} {"train_loss": -35.8021240234375, "global_step": 57983, "epoch": 479} {"train_loss": -36.650569915771484, "global_step": 57984, "epoch": 479} {"train_loss": -36.28351974487305, "global_step": 57985, "epoch": 479} {"train_loss": -36.234432220458984, "global_step": 57986, "epoch": 479} {"train_loss": -36.199222564697266, "global_step": 57987, "epoch": 479} {"train_loss": -36.149024963378906, "global_step": 57988, "epoch": 479} {"train_loss": -35.995418548583984, "global_step": 57989, "epoch": 479} {"train_loss": -36.30939865112305, "global_step": 57990, "epoch": 479} {"train_loss": -36.45055389404297, "global_step": 57991, "epoch": 479} {"train_loss": -35.3410530090332, "global_step": 57992, "epoch": 479} {"train_loss": -36.505645751953125, "global_step": 57993, "epoch": 479} {"train_loss": -36.540836334228516, "global_step": 57994, "epoch": 479} {"train_loss": -35.72650146484375, "global_step": 57995, "epoch": 479} {"train_loss": -36.78570556640625, "global_step": 57996, "epoch": 479} {"train_loss": -36.835845947265625, "global_step": 57997, "epoch": 479} {"train_loss": -36.80910873413086, "global_step": 57998, "epoch": 479} {"train_loss": -36.72283172607422, "global_step": 57999, "epoch": 479} {"train_loss": -36.90665817260742, "global_step": 58000, "epoch": 479} {"train_loss": -36.63491439819336, "global_step": 58001, "epoch": 479} {"train_loss": -36.64370346069336, "global_step": 58002, "epoch": 479} {"train_loss": -36.73843002319336, "global_step": 58003, "epoch": 479} {"train_loss": -36.80658721923828, "global_step": 58004, "epoch": 479} {"train_loss": -36.67439270019531, "global_step": 58005, "epoch": 479} {"train_loss": -36.701759338378906, "global_step": 58006, "epoch": 479} {"train_loss": -36.9564323425293, "global_step": 58007, "epoch": 479} {"train_loss": -35.92258834838867, "global_step": 58008, "epoch": 479} {"train_loss": -36.81403732299805, "global_step": 58009, "epoch": 479} {"train_loss": -36.41769027709961, "global_step": 58010, "epoch": 479} {"train_loss": -35.307498931884766, "global_step": 58011, "epoch": 479} {"train_loss": -34.55766677856445, "global_step": 58012, "epoch": 479} {"train_loss": -32.59357452392578, "global_step": 58013, "epoch": 479} {"train_loss": -30.938817977905273, "global_step": 58014, "epoch": 479} {"train_loss": -31.42853355407715, "global_step": 58015, "epoch": 479} {"train_loss": -23.65732192993164, "global_step": 58016, "epoch": 479} {"train_loss": -19.217248916625977, "global_step": 58017, "epoch": 479} {"train_loss": -27.11868667602539, "global_step": 58018, "epoch": 479} {"train_loss": -35.06513977050781, "global_step": 58019, "epoch": 479} {"train_loss": -26.594470977783203, "global_step": 58020, "epoch": 479} {"train_loss": -34.42523193359375, "global_step": 58021, "epoch": 479} {"train_loss": -30.995319366455078, "global_step": 58022, "epoch": 479} {"train_loss": -34.44377136230469, "global_step": 58023, "epoch": 479} {"train_loss": -32.35554885864258, "global_step": 58024, "epoch": 479} {"train_loss": -35.01575469970703, "global_step": 58025, "epoch": 479} {"train_loss": -33.18971252441406, "global_step": 58026, "epoch": 479} {"train_loss": -35.60400390625, "global_step": 58027, "epoch": 479} {"train_loss": -34.43172836303711, "global_step": 58028, "epoch": 479} {"train_loss": -34.1361198425293, "global_step": 58029, "epoch": 479} {"train_loss": -34.904293060302734, "global_step": 58030, "epoch": 479} {"train_loss": -35.00849151611328, "global_step": 58031, "epoch": 479} {"train_loss": -34.57676696777344, "global_step": 58032, "epoch": 479} {"train_loss": -35.95269775390625, "global_step": 58033, "epoch": 479} {"train_loss": -35.271949768066406, "global_step": 58034, "epoch": 479} {"train_loss": -35.488765716552734, "global_step": 58035, "epoch": 479} {"train_loss": -36.11973571777344, "global_step": 58036, "epoch": 479} {"train_loss": -35.835208892822266, "global_step": 58037, "epoch": 479} {"train_loss": -35.406673431396484, "global_step": 58038, "epoch": 479} {"train_loss": -35.59084701538086, "global_step": 58039, "epoch": 479} {"train_loss": -35.84223175048828, "global_step": 58040, "epoch": 479} {"train_loss": -35.34428405761719, "global_step": 58041, "epoch": 479} {"train_loss": -34.89432907104492, "global_step": 58042, "epoch": 479} {"train_loss": -36.20443344116211, "global_step": 58043, "epoch": 479} {"train_loss": -35.84678268432617, "global_step": 58044, "epoch": 479} {"train_loss": -35.66010665893555, "global_step": 58045, "epoch": 479} {"train_loss": -36.11067581176758, "global_step": 58046, "epoch": 479} {"train_loss": -36.052978515625, "global_step": 58047, "epoch": 479} {"train_loss": -35.45341110229492, "global_step": 58048, "epoch": 479} {"train_loss": -34.806941986083984, "global_step": 58049, "epoch": 479} {"train_loss": -35.409271240234375, "global_step": 58050, "epoch": 479} {"train_loss": -35.093292236328125, "global_step": 58051, "epoch": 479} {"train_loss": -34.39081573486328, "global_step": 58052, "epoch": 479} {"train_loss": -35.17759323120117, "global_step": 58053, "epoch": 479} {"train_loss": -36.68589401245117, "global_step": 58054, "epoch": 479} {"train_loss": -35.261356353759766, "global_step": 58055, "epoch": 479} {"train_loss": -34.5297966003418, "global_step": 58056, "epoch": 479} {"train_loss": -36.36640167236328, "global_step": 58057, "epoch": 479} {"train_loss": -34.092132568359375, "global_step": 58058, "epoch": 479} {"train_loss": -34.569732666015625, "global_step": 58059, "epoch": 479} {"train_loss": -36.07941436767578, "global_step": 58060, "epoch": 479} {"train_loss": -32.945369720458984, "global_step": 58061, "epoch": 479} {"train_loss": -35.968807220458984, "global_step": 58062, "epoch": 479} {"train_loss": -36.133766174316406, "global_step": 58063, "epoch": 479} {"train_loss": -34.80295944213867, "global_step": 58064, "epoch": 479} {"train_loss": -35.86443328857422, "global_step": 58065, "epoch": 479} {"train_loss": -35.689735412597656, "global_step": 58066, "epoch": 479} {"train_loss": -34.98784637451172, "global_step": 58067, "epoch": 479} {"train_loss": -35.443214416503906, "global_step": 58068, "epoch": 479} {"train_loss": -35.62940216064453, "global_step": 58069, "epoch": 479} {"train_loss": -35.77777099609375, "global_step": 58070, "epoch": 479} {"train_loss": -35.42385482788086, "global_step": 58071, "epoch": 479} {"train_loss": -36.04694747924805, "global_step": 58072, "epoch": 479} {"train_loss": -34.93685531616211, "global_step": 58073, "epoch": 479} {"train_loss": -35.97524642944336, "global_step": 58074, "epoch": 479} {"train_loss": -35.37336349487305, "global_step": 58075, "epoch": 479} {"train_loss": -35.883460998535156, "global_step": 58076, "epoch": 479} {"train_loss": -35.766117095947266, "global_step": 58077, "epoch": 479} {"train_loss": -36.19462203979492, "global_step": 58078, "epoch": 479} {"train_loss": -35.03245211829824, "global_step": 58079, "epoch": 479, "val_loss": 2616598.0} {"train_loss": -34.679439544677734, "global_step": 58080, "epoch": 480} {"train_loss": -33.34872055053711, "global_step": 58081, "epoch": 480} {"train_loss": -32.05013656616211, "global_step": 58082, "epoch": 480} {"train_loss": -33.7480583190918, "global_step": 58083, "epoch": 480} {"train_loss": -36.05521774291992, "global_step": 58084, "epoch": 480} {"train_loss": -33.938785552978516, "global_step": 58085, "epoch": 480} {"train_loss": -28.123743057250977, "global_step": 58086, "epoch": 480} {"train_loss": -22.467790603637695, "global_step": 58087, "epoch": 480} {"train_loss": -35.15171432495117, "global_step": 58088, "epoch": 480} {"train_loss": -30.107168197631836, "global_step": 58089, "epoch": 480} {"train_loss": -31.733625411987305, "global_step": 58090, "epoch": 480} {"train_loss": -32.53916549682617, "global_step": 58091, "epoch": 480} {"train_loss": -29.68128776550293, "global_step": 58092, "epoch": 480} {"train_loss": -34.757625579833984, "global_step": 58093, "epoch": 480} {"train_loss": -31.596044540405273, "global_step": 58094, "epoch": 480} {"train_loss": -34.204402923583984, "global_step": 58095, "epoch": 480} {"train_loss": -33.040260314941406, "global_step": 58096, "epoch": 480} {"train_loss": -33.644840240478516, "global_step": 58097, "epoch": 480} {"train_loss": -32.7711067199707, "global_step": 58098, "epoch": 480} {"train_loss": -25.803869247436523, "global_step": 58099, "epoch": 480} {"train_loss": -34.770301818847656, "global_step": 58100, "epoch": 480} {"train_loss": -33.2962760925293, "global_step": 58101, "epoch": 480} {"train_loss": -33.36012649536133, "global_step": 58102, "epoch": 480} {"train_loss": -33.74556350708008, "global_step": 58103, "epoch": 480} {"train_loss": -33.996315002441406, "global_step": 58104, "epoch": 480} {"train_loss": -34.474979400634766, "global_step": 58105, "epoch": 480} {"train_loss": -33.524940490722656, "global_step": 58106, "epoch": 480} {"train_loss": -33.41788864135742, "global_step": 58107, "epoch": 480} {"train_loss": -31.914539337158203, "global_step": 58108, "epoch": 480} {"train_loss": -34.62947463989258, "global_step": 58109, "epoch": 480} {"train_loss": -33.65521240234375, "global_step": 58110, "epoch": 480} {"train_loss": -34.73668670654297, "global_step": 58111, "epoch": 480} {"train_loss": -34.74074935913086, "global_step": 58112, "epoch": 480} {"train_loss": -34.00918197631836, "global_step": 58113, "epoch": 480} {"train_loss": -32.698707580566406, "global_step": 58114, "epoch": 480} {"train_loss": -34.75309371948242, "global_step": 58115, "epoch": 480} {"train_loss": -34.48514938354492, "global_step": 58116, "epoch": 480} {"train_loss": -34.26799392700195, "global_step": 58117, "epoch": 480} {"train_loss": -34.72290802001953, "global_step": 58118, "epoch": 480} {"train_loss": -32.26805114746094, "global_step": 58119, "epoch": 480} {"train_loss": -33.93560791015625, "global_step": 58120, "epoch": 480} {"train_loss": -34.792667388916016, "global_step": 58121, "epoch": 480} {"train_loss": -34.16638946533203, "global_step": 58122, "epoch": 480} {"train_loss": -34.41925811767578, "global_step": 58123, "epoch": 480} {"train_loss": -35.04240417480469, "global_step": 58124, "epoch": 480} {"train_loss": -35.04669952392578, "global_step": 58125, "epoch": 480} {"train_loss": -34.91333770751953, "global_step": 58126, "epoch": 480} {"train_loss": -34.7720947265625, "global_step": 58127, "epoch": 480} {"train_loss": -34.62531280517578, "global_step": 58128, "epoch": 480} {"train_loss": -33.9777717590332, "global_step": 58129, "epoch": 480} {"train_loss": -34.87616729736328, "global_step": 58130, "epoch": 480} {"train_loss": -35.12255859375, "global_step": 58131, "epoch": 480} {"train_loss": -34.51771545410156, "global_step": 58132, "epoch": 480} {"train_loss": -35.01766586303711, "global_step": 58133, "epoch": 480} {"train_loss": -34.99985885620117, "global_step": 58134, "epoch": 480} {"train_loss": -35.223812103271484, "global_step": 58135, "epoch": 480} {"train_loss": -34.58604431152344, "global_step": 58136, "epoch": 480} {"train_loss": -34.9637565612793, "global_step": 58137, "epoch": 480} {"train_loss": -35.43575668334961, "global_step": 58138, "epoch": 480} {"train_loss": -35.29257583618164, "global_step": 58139, "epoch": 480} {"train_loss": -35.83171463012695, "global_step": 58140, "epoch": 480} {"train_loss": -35.66509246826172, "global_step": 58141, "epoch": 480} {"train_loss": -35.75349044799805, "global_step": 58142, "epoch": 480} {"train_loss": -35.35811233520508, "global_step": 58143, "epoch": 480} {"train_loss": -35.82321548461914, "global_step": 58144, "epoch": 480} {"train_loss": -34.99494552612305, "global_step": 58145, "epoch": 480} {"train_loss": -35.76604461669922, "global_step": 58146, "epoch": 480} {"train_loss": -35.73820495605469, "global_step": 58147, "epoch": 480} {"train_loss": -35.417537689208984, "global_step": 58148, "epoch": 480} {"train_loss": -35.83169174194336, "global_step": 58149, "epoch": 480} {"train_loss": -35.99501419067383, "global_step": 58150, "epoch": 480} {"train_loss": -34.19301223754883, "global_step": 58151, "epoch": 480} {"train_loss": -35.67672348022461, "global_step": 58152, "epoch": 480} {"train_loss": -35.15350341796875, "global_step": 58153, "epoch": 480} {"train_loss": -35.07518005371094, "global_step": 58154, "epoch": 480} {"train_loss": -35.55329513549805, "global_step": 58155, "epoch": 480} {"train_loss": -35.71509552001953, "global_step": 58156, "epoch": 480} {"train_loss": -35.43256378173828, "global_step": 58157, "epoch": 480} {"train_loss": -35.5612907409668, "global_step": 58158, "epoch": 480} {"train_loss": -35.42695999145508, "global_step": 58159, "epoch": 480} {"train_loss": -34.35974884033203, "global_step": 58160, "epoch": 480} {"train_loss": -35.22431564331055, "global_step": 58161, "epoch": 480} {"train_loss": -35.51865768432617, "global_step": 58162, "epoch": 480} {"train_loss": -35.87868881225586, "global_step": 58163, "epoch": 480} {"train_loss": -35.2991943359375, "global_step": 58164, "epoch": 480} {"train_loss": -34.79072952270508, "global_step": 58165, "epoch": 480} {"train_loss": -36.2263069152832, "global_step": 58166, "epoch": 480} {"train_loss": -36.06429672241211, "global_step": 58167, "epoch": 480} {"train_loss": -35.973941802978516, "global_step": 58168, "epoch": 480} {"train_loss": -35.448402404785156, "global_step": 58169, "epoch": 480} {"train_loss": -35.889564514160156, "global_step": 58170, "epoch": 480} {"train_loss": -35.91672897338867, "global_step": 58171, "epoch": 480} {"train_loss": -36.10028839111328, "global_step": 58172, "epoch": 480} {"train_loss": -36.0474967956543, "global_step": 58173, "epoch": 480} {"train_loss": -36.08828353881836, "global_step": 58174, "epoch": 480} {"train_loss": -36.19807052612305, "global_step": 58175, "epoch": 480} {"train_loss": -36.65830612182617, "global_step": 58176, "epoch": 480} {"train_loss": -36.043914794921875, "global_step": 58177, "epoch": 480} {"train_loss": -36.25010299682617, "global_step": 58178, "epoch": 480} {"train_loss": -36.02707290649414, "global_step": 58179, "epoch": 480} {"train_loss": -35.62477493286133, "global_step": 58180, "epoch": 480} {"train_loss": -35.83787155151367, "global_step": 58181, "epoch": 480} {"train_loss": -36.3046989440918, "global_step": 58182, "epoch": 480} {"train_loss": -36.07902145385742, "global_step": 58183, "epoch": 480} {"train_loss": -36.187252044677734, "global_step": 58184, "epoch": 480} {"train_loss": -34.4052848815918, "global_step": 58185, "epoch": 480} {"train_loss": -36.53745651245117, "global_step": 58186, "epoch": 480} {"train_loss": -35.28797149658203, "global_step": 58187, "epoch": 480} {"train_loss": -35.03494644165039, "global_step": 58188, "epoch": 480} {"train_loss": -34.430137634277344, "global_step": 58189, "epoch": 480} {"train_loss": -35.817169189453125, "global_step": 58190, "epoch": 480} {"train_loss": -34.6700439453125, "global_step": 58191, "epoch": 480} {"train_loss": -34.89374923706055, "global_step": 58192, "epoch": 480} {"train_loss": -36.096961975097656, "global_step": 58193, "epoch": 480} {"train_loss": -34.872554779052734, "global_step": 58194, "epoch": 480} {"train_loss": -34.48586654663086, "global_step": 58195, "epoch": 480} {"train_loss": -35.97287368774414, "global_step": 58196, "epoch": 480} {"train_loss": -33.786720275878906, "global_step": 58197, "epoch": 480} {"train_loss": -35.43746566772461, "global_step": 58198, "epoch": 480} {"train_loss": -36.24123764038086, "global_step": 58199, "epoch": 480} {"train_loss": -34.50660343012534, "global_step": 58200, "epoch": 480, "val_loss": 2584401.0} {"train_loss": -35.991119384765625, "global_step": 58201, "epoch": 481} {"train_loss": -34.36770248413086, "global_step": 58202, "epoch": 481} {"train_loss": -35.85627746582031, "global_step": 58203, "epoch": 481} {"train_loss": -36.017269134521484, "global_step": 58204, "epoch": 481} {"train_loss": -32.05870819091797, "global_step": 58205, "epoch": 481} {"train_loss": -35.062129974365234, "global_step": 58206, "epoch": 481} {"train_loss": -35.634090423583984, "global_step": 58207, "epoch": 481} {"train_loss": -35.4119987487793, "global_step": 58208, "epoch": 481} {"train_loss": -35.8508415222168, "global_step": 58209, "epoch": 481} {"train_loss": -34.8050651550293, "global_step": 58210, "epoch": 481} {"train_loss": -35.03242874145508, "global_step": 58211, "epoch": 481} {"train_loss": -35.35085678100586, "global_step": 58212, "epoch": 481} {"train_loss": -35.90025329589844, "global_step": 58213, "epoch": 481} {"train_loss": -35.75858688354492, "global_step": 58214, "epoch": 481} {"train_loss": -35.70418930053711, "global_step": 58215, "epoch": 481} {"train_loss": -35.3839225769043, "global_step": 58216, "epoch": 481} {"train_loss": -34.32798385620117, "global_step": 58217, "epoch": 481} {"train_loss": -35.68939971923828, "global_step": 58218, "epoch": 481} {"train_loss": -35.86762619018555, "global_step": 58219, "epoch": 481} {"train_loss": -35.40768814086914, "global_step": 58220, "epoch": 481} {"train_loss": -35.8411979675293, "global_step": 58221, "epoch": 481} {"train_loss": -35.783748626708984, "global_step": 58222, "epoch": 481} {"train_loss": -35.788177490234375, "global_step": 58223, "epoch": 481} {"train_loss": -35.5771369934082, "global_step": 58224, "epoch": 481} {"train_loss": -35.743656158447266, "global_step": 58225, "epoch": 481} {"train_loss": -35.94411087036133, "global_step": 58226, "epoch": 481} {"train_loss": -36.21272277832031, "global_step": 58227, "epoch": 481} {"train_loss": -35.999969482421875, "global_step": 58228, "epoch": 481} {"train_loss": -34.874263763427734, "global_step": 58229, "epoch": 481} {"train_loss": -35.51493453979492, "global_step": 58230, "epoch": 481} {"train_loss": -35.52607345581055, "global_step": 58231, "epoch": 481} {"train_loss": -35.877376556396484, "global_step": 58232, "epoch": 481} {"train_loss": -36.382789611816406, "global_step": 58233, "epoch": 481} {"train_loss": -36.56178665161133, "global_step": 58234, "epoch": 481} {"train_loss": -36.53524398803711, "global_step": 58235, "epoch": 481} {"train_loss": -36.54096221923828, "global_step": 58236, "epoch": 481} {"train_loss": -36.406211853027344, "global_step": 58237, "epoch": 481} {"train_loss": -36.6381721496582, "global_step": 58238, "epoch": 481} {"train_loss": -36.99982833862305, "global_step": 58239, "epoch": 481} {"train_loss": -36.161903381347656, "global_step": 58240, "epoch": 481} {"train_loss": -36.50715255737305, "global_step": 58241, "epoch": 481} {"train_loss": -36.735469818115234, "global_step": 58242, "epoch": 481} {"train_loss": -36.77943420410156, "global_step": 58243, "epoch": 481} {"train_loss": -35.790340423583984, "global_step": 58244, "epoch": 481} {"train_loss": -36.41804885864258, "global_step": 58245, "epoch": 481} {"train_loss": -35.53818130493164, "global_step": 58246, "epoch": 481} {"train_loss": -36.90482711791992, "global_step": 58247, "epoch": 481} {"train_loss": -36.708309173583984, "global_step": 58248, "epoch": 481} {"train_loss": -36.83156204223633, "global_step": 58249, "epoch": 481} {"train_loss": -37.336570739746094, "global_step": 58250, "epoch": 481} {"train_loss": -37.123512268066406, "global_step": 58251, "epoch": 481} {"train_loss": -37.17929458618164, "global_step": 58252, "epoch": 481} {"train_loss": -36.7406120300293, "global_step": 58253, "epoch": 481} {"train_loss": -37.14809036254883, "global_step": 58254, "epoch": 481} {"train_loss": -37.02360153198242, "global_step": 58255, "epoch": 481} {"train_loss": -37.213191986083984, "global_step": 58256, "epoch": 481} {"train_loss": -37.08500289916992, "global_step": 58257, "epoch": 481} {"train_loss": -36.26636505126953, "global_step": 58258, "epoch": 481} {"train_loss": -36.67586135864258, "global_step": 58259, "epoch": 481} {"train_loss": -36.0220832824707, "global_step": 58260, "epoch": 481} {"train_loss": -35.08601760864258, "global_step": 58261, "epoch": 481} {"train_loss": -35.64344024658203, "global_step": 58262, "epoch": 481} {"train_loss": -36.86821746826172, "global_step": 58263, "epoch": 481} {"train_loss": -37.18423080444336, "global_step": 58264, "epoch": 481} {"train_loss": -37.45188522338867, "global_step": 58265, "epoch": 481} {"train_loss": -36.71704864501953, "global_step": 58266, "epoch": 481} {"train_loss": -36.06108093261719, "global_step": 58267, "epoch": 481} {"train_loss": -36.68033981323242, "global_step": 58268, "epoch": 481} {"train_loss": -36.11655807495117, "global_step": 58269, "epoch": 481} {"train_loss": -36.31095886230469, "global_step": 58270, "epoch": 481} {"train_loss": -36.560543060302734, "global_step": 58271, "epoch": 481} {"train_loss": -37.1529426574707, "global_step": 58272, "epoch": 481} {"train_loss": -35.4564323425293, "global_step": 58273, "epoch": 481} {"train_loss": -35.43551254272461, "global_step": 58274, "epoch": 481} {"train_loss": -34.71087646484375, "global_step": 58275, "epoch": 481} {"train_loss": -36.5252571105957, "global_step": 58276, "epoch": 481} {"train_loss": -35.167781829833984, "global_step": 58277, "epoch": 481} {"train_loss": -35.71930694580078, "global_step": 58278, "epoch": 481} {"train_loss": -33.74310302734375, "global_step": 58279, "epoch": 481} {"train_loss": -34.251441955566406, "global_step": 58280, "epoch": 481} {"train_loss": -32.170902252197266, "global_step": 58281, "epoch": 481} {"train_loss": -27.388891220092773, "global_step": 58282, "epoch": 481} {"train_loss": -8.501142501831055, "global_step": 58283, "epoch": 481} {"train_loss": -1.8934059143066406, "global_step": 58284, "epoch": 481} {"train_loss": -27.521991729736328, "global_step": 58285, "epoch": 481} {"train_loss": -27.582605361938477, "global_step": 58286, "epoch": 481} {"train_loss": -24.693984985351562, "global_step": 58287, "epoch": 481} {"train_loss": -31.273115158081055, "global_step": 58288, "epoch": 481} {"train_loss": -31.557096481323242, "global_step": 58289, "epoch": 481} {"train_loss": -28.5552978515625, "global_step": 58290, "epoch": 481} {"train_loss": -35.42879867553711, "global_step": 58291, "epoch": 481} {"train_loss": -30.544286727905273, "global_step": 58292, "epoch": 481} {"train_loss": -32.4053840637207, "global_step": 58293, "epoch": 481} {"train_loss": -34.697994232177734, "global_step": 58294, "epoch": 481} {"train_loss": -33.980751037597656, "global_step": 58295, "epoch": 481} {"train_loss": -33.17554473876953, "global_step": 58296, "epoch": 481} {"train_loss": -35.28121566772461, "global_step": 58297, "epoch": 481} {"train_loss": -35.626739501953125, "global_step": 58298, "epoch": 481} {"train_loss": -34.99138259887695, "global_step": 58299, "epoch": 481} {"train_loss": -34.67525863647461, "global_step": 58300, "epoch": 481} {"train_loss": -35.16611862182617, "global_step": 58301, "epoch": 481} {"train_loss": -35.27932357788086, "global_step": 58302, "epoch": 481} {"train_loss": -35.55392074584961, "global_step": 58303, "epoch": 481} {"train_loss": -34.8363151550293, "global_step": 58304, "epoch": 481} {"train_loss": -34.97431564331055, "global_step": 58305, "epoch": 481} {"train_loss": -35.10480880737305, "global_step": 58306, "epoch": 481} {"train_loss": -35.44095993041992, "global_step": 58307, "epoch": 481} {"train_loss": -35.982139587402344, "global_step": 58308, "epoch": 481} {"train_loss": -35.390262603759766, "global_step": 58309, "epoch": 481} {"train_loss": -34.88179397583008, "global_step": 58310, "epoch": 481} {"train_loss": -35.73419952392578, "global_step": 58311, "epoch": 481} {"train_loss": -35.99376678466797, "global_step": 58312, "epoch": 481} {"train_loss": -36.028995513916016, "global_step": 58313, "epoch": 481} {"train_loss": -34.84287643432617, "global_step": 58314, "epoch": 481} {"train_loss": -35.502498626708984, "global_step": 58315, "epoch": 481} {"train_loss": -35.96934509277344, "global_step": 58316, "epoch": 481} {"train_loss": -35.5543212890625, "global_step": 58317, "epoch": 481} {"train_loss": -35.90380859375, "global_step": 58318, "epoch": 481} {"train_loss": -36.0055046081543, "global_step": 58319, "epoch": 481} {"train_loss": -35.777427673339844, "global_step": 58320, "epoch": 481} {"train_loss": -34.76990647749467, "global_step": 58321, "epoch": 481, "val_loss": 2654433.0} {"train_loss": -35.93863296508789, "global_step": 58322, "epoch": 482} {"train_loss": -36.22659683227539, "global_step": 58323, "epoch": 482} {"train_loss": -36.20307540893555, "global_step": 58324, "epoch": 482} {"train_loss": -36.26157760620117, "global_step": 58325, "epoch": 482} {"train_loss": -36.077720642089844, "global_step": 58326, "epoch": 482} {"train_loss": -35.80493927001953, "global_step": 58327, "epoch": 482} {"train_loss": -36.210567474365234, "global_step": 58328, "epoch": 482} {"train_loss": -35.737335205078125, "global_step": 58329, "epoch": 482} {"train_loss": -35.82233810424805, "global_step": 58330, "epoch": 482} {"train_loss": -35.96971893310547, "global_step": 58331, "epoch": 482} {"train_loss": -35.670379638671875, "global_step": 58332, "epoch": 482} {"train_loss": -35.595436096191406, "global_step": 58333, "epoch": 482} {"train_loss": -36.1145133972168, "global_step": 58334, "epoch": 482} {"train_loss": -36.69300079345703, "global_step": 58335, "epoch": 482} {"train_loss": -35.930419921875, "global_step": 58336, "epoch": 482} {"train_loss": -36.38751220703125, "global_step": 58337, "epoch": 482} {"train_loss": -36.57562255859375, "global_step": 58338, "epoch": 482} {"train_loss": -36.500465393066406, "global_step": 58339, "epoch": 482} {"train_loss": -36.59286880493164, "global_step": 58340, "epoch": 482} {"train_loss": -36.420345306396484, "global_step": 58341, "epoch": 482} {"train_loss": -36.675167083740234, "global_step": 58342, "epoch": 482} {"train_loss": -36.954376220703125, "global_step": 58343, "epoch": 482} {"train_loss": -36.51272201538086, "global_step": 58344, "epoch": 482} {"train_loss": -36.58549880981445, "global_step": 58345, "epoch": 482} {"train_loss": -36.271175384521484, "global_step": 58346, "epoch": 482} {"train_loss": -36.02132797241211, "global_step": 58347, "epoch": 482} {"train_loss": -36.206214904785156, "global_step": 58348, "epoch": 482} {"train_loss": -35.821624755859375, "global_step": 58349, "epoch": 482} {"train_loss": -35.233062744140625, "global_step": 58350, "epoch": 482} {"train_loss": -35.389404296875, "global_step": 58351, "epoch": 482} {"train_loss": -36.06928253173828, "global_step": 58352, "epoch": 482} {"train_loss": -36.138404846191406, "global_step": 58353, "epoch": 482} {"train_loss": -35.42826461791992, "global_step": 58354, "epoch": 482} {"train_loss": -34.30670928955078, "global_step": 58355, "epoch": 482} {"train_loss": -33.584774017333984, "global_step": 58356, "epoch": 482} {"train_loss": -34.78937530517578, "global_step": 58357, "epoch": 482} {"train_loss": -36.19812774658203, "global_step": 58358, "epoch": 482} {"train_loss": -35.184547424316406, "global_step": 58359, "epoch": 482} {"train_loss": -33.680938720703125, "global_step": 58360, "epoch": 482} {"train_loss": -30.296735763549805, "global_step": 58361, "epoch": 482} {"train_loss": -33.17573165893555, "global_step": 58362, "epoch": 482} {"train_loss": -34.39812088012695, "global_step": 58363, "epoch": 482} {"train_loss": -35.703765869140625, "global_step": 58364, "epoch": 482} {"train_loss": -35.116695404052734, "global_step": 58365, "epoch": 482} {"train_loss": -32.53456497192383, "global_step": 58366, "epoch": 482} {"train_loss": -34.94318771362305, "global_step": 58367, "epoch": 482} {"train_loss": -35.15914535522461, "global_step": 58368, "epoch": 482} {"train_loss": -34.389686584472656, "global_step": 58369, "epoch": 482} {"train_loss": -34.40432357788086, "global_step": 58370, "epoch": 482} {"train_loss": -35.50271224975586, "global_step": 58371, "epoch": 482} {"train_loss": -34.15188980102539, "global_step": 58372, "epoch": 482} {"train_loss": -33.65949630737305, "global_step": 58373, "epoch": 482} {"train_loss": -32.3839225769043, "global_step": 58374, "epoch": 482} {"train_loss": -34.500823974609375, "global_step": 58375, "epoch": 482} {"train_loss": -35.78909683227539, "global_step": 58376, "epoch": 482} {"train_loss": -34.750186920166016, "global_step": 58377, "epoch": 482} {"train_loss": -33.880958557128906, "global_step": 58378, "epoch": 482} {"train_loss": -34.931190490722656, "global_step": 58379, "epoch": 482} {"train_loss": -35.1738166809082, "global_step": 58380, "epoch": 482} {"train_loss": -35.7116584777832, "global_step": 58381, "epoch": 482} {"train_loss": -34.21678924560547, "global_step": 58382, "epoch": 482} {"train_loss": -35.05129623413086, "global_step": 58383, "epoch": 482} {"train_loss": -35.57272720336914, "global_step": 58384, "epoch": 482} {"train_loss": -35.86168670654297, "global_step": 58385, "epoch": 482} {"train_loss": -35.39072799682617, "global_step": 58386, "epoch": 482} {"train_loss": -35.51967239379883, "global_step": 58387, "epoch": 482} {"train_loss": -36.22886276245117, "global_step": 58388, "epoch": 482} {"train_loss": -35.596534729003906, "global_step": 58389, "epoch": 482} {"train_loss": -36.50592041015625, "global_step": 58390, "epoch": 482} {"train_loss": -35.87007141113281, "global_step": 58391, "epoch": 482} {"train_loss": -35.99454879760742, "global_step": 58392, "epoch": 482} {"train_loss": -36.32444381713867, "global_step": 58393, "epoch": 482} {"train_loss": -36.040340423583984, "global_step": 58394, "epoch": 482} {"train_loss": -35.739723205566406, "global_step": 58395, "epoch": 482} {"train_loss": -36.270694732666016, "global_step": 58396, "epoch": 482} {"train_loss": -36.17024230957031, "global_step": 58397, "epoch": 482} {"train_loss": -36.13652038574219, "global_step": 58398, "epoch": 482} {"train_loss": -36.272274017333984, "global_step": 58399, "epoch": 482} {"train_loss": -36.42718505859375, "global_step": 58400, "epoch": 482} {"train_loss": -36.3602409362793, "global_step": 58401, "epoch": 482} {"train_loss": -35.839046478271484, "global_step": 58402, "epoch": 482} {"train_loss": -36.02805709838867, "global_step": 58403, "epoch": 482} {"train_loss": -36.36465072631836, "global_step": 58404, "epoch": 482} {"train_loss": -36.173892974853516, "global_step": 58405, "epoch": 482} {"train_loss": -36.31765365600586, "global_step": 58406, "epoch": 482} {"train_loss": -36.7260627746582, "global_step": 58407, "epoch": 482} {"train_loss": -36.72134017944336, "global_step": 58408, "epoch": 482} {"train_loss": -35.97840881347656, "global_step": 58409, "epoch": 482} {"train_loss": -36.89152145385742, "global_step": 58410, "epoch": 482} {"train_loss": -36.54243469238281, "global_step": 58411, "epoch": 482} {"train_loss": -36.3740119934082, "global_step": 58412, "epoch": 482} {"train_loss": -36.81631088256836, "global_step": 58413, "epoch": 482} {"train_loss": -36.592987060546875, "global_step": 58414, "epoch": 482} {"train_loss": -36.549652099609375, "global_step": 58415, "epoch": 482} {"train_loss": -36.692142486572266, "global_step": 58416, "epoch": 482} {"train_loss": -36.11214065551758, "global_step": 58417, "epoch": 482} {"train_loss": -36.09823989868164, "global_step": 58418, "epoch": 482} {"train_loss": -36.499244689941406, "global_step": 58419, "epoch": 482} {"train_loss": -36.769073486328125, "global_step": 58420, "epoch": 482} {"train_loss": -35.86757278442383, "global_step": 58421, "epoch": 482} {"train_loss": -35.161067962646484, "global_step": 58422, "epoch": 482} {"train_loss": -36.45752716064453, "global_step": 58423, "epoch": 482} {"train_loss": -34.93643569946289, "global_step": 58424, "epoch": 482} {"train_loss": -34.11223220825195, "global_step": 58425, "epoch": 482} {"train_loss": -35.89604949951172, "global_step": 58426, "epoch": 482} {"train_loss": -34.69382095336914, "global_step": 58427, "epoch": 482} {"train_loss": -35.400848388671875, "global_step": 58428, "epoch": 482} {"train_loss": -35.28083038330078, "global_step": 58429, "epoch": 482} {"train_loss": -34.38448715209961, "global_step": 58430, "epoch": 482} {"train_loss": -35.27585220336914, "global_step": 58431, "epoch": 482} {"train_loss": -34.619544982910156, "global_step": 58432, "epoch": 482} {"train_loss": -34.48098373413086, "global_step": 58433, "epoch": 482} {"train_loss": -34.89442825317383, "global_step": 58434, "epoch": 482} {"train_loss": -34.45046615600586, "global_step": 58435, "epoch": 482} {"train_loss": -33.2093620300293, "global_step": 58436, "epoch": 482} {"train_loss": -33.82322311401367, "global_step": 58437, "epoch": 482} {"train_loss": -33.19875717163086, "global_step": 58438, "epoch": 482} {"train_loss": -32.37672805786133, "global_step": 58439, "epoch": 482} {"train_loss": -33.125404357910156, "global_step": 58440, "epoch": 482} {"train_loss": -33.020240783691406, "global_step": 58441, "epoch": 482} {"train_loss": -35.382118461545836, "global_step": 58442, "epoch": 482, "val_loss": 2666424.0} {"train_loss": -32.15938186645508, "global_step": 58443, "epoch": 483} {"train_loss": -33.4065055847168, "global_step": 58444, "epoch": 483} {"train_loss": -31.1757869720459, "global_step": 58445, "epoch": 483} {"train_loss": -32.009456634521484, "global_step": 58446, "epoch": 483} {"train_loss": -31.06903076171875, "global_step": 58447, "epoch": 483} {"train_loss": -30.555479049682617, "global_step": 58448, "epoch": 483} {"train_loss": -31.894018173217773, "global_step": 58449, "epoch": 483} {"train_loss": -30.065275192260742, "global_step": 58450, "epoch": 483} {"train_loss": -31.745450973510742, "global_step": 58451, "epoch": 483} {"train_loss": -31.972625732421875, "global_step": 58452, "epoch": 483} {"train_loss": -30.913684844970703, "global_step": 58453, "epoch": 483} {"train_loss": -31.97694206237793, "global_step": 58454, "epoch": 483} {"train_loss": -32.450923919677734, "global_step": 58455, "epoch": 483} {"train_loss": -33.545650482177734, "global_step": 58456, "epoch": 483} {"train_loss": -32.30857467651367, "global_step": 58457, "epoch": 483} {"train_loss": -31.316242218017578, "global_step": 58458, "epoch": 483} {"train_loss": -33.29655075073242, "global_step": 58459, "epoch": 483} {"train_loss": -32.43476104736328, "global_step": 58460, "epoch": 483} {"train_loss": -32.84524917602539, "global_step": 58461, "epoch": 483} {"train_loss": -33.178157806396484, "global_step": 58462, "epoch": 483} {"train_loss": -29.55683708190918, "global_step": 58463, "epoch": 483} {"train_loss": -30.269269943237305, "global_step": 58464, "epoch": 483} {"train_loss": -33.470760345458984, "global_step": 58465, "epoch": 483} {"train_loss": -32.594825744628906, "global_step": 58466, "epoch": 483} {"train_loss": -32.92344665527344, "global_step": 58467, "epoch": 483} {"train_loss": -32.40766906738281, "global_step": 58468, "epoch": 483} {"train_loss": -31.560840606689453, "global_step": 58469, "epoch": 483} {"train_loss": -33.391788482666016, "global_step": 58470, "epoch": 483} {"train_loss": -32.57430648803711, "global_step": 58471, "epoch": 483} {"train_loss": -33.79336166381836, "global_step": 58472, "epoch": 483} {"train_loss": -33.35279083251953, "global_step": 58473, "epoch": 483} {"train_loss": -33.19199752807617, "global_step": 58474, "epoch": 483} {"train_loss": -32.322505950927734, "global_step": 58475, "epoch": 483} {"train_loss": -31.12757682800293, "global_step": 58476, "epoch": 483} {"train_loss": -32.853614807128906, "global_step": 58477, "epoch": 483} {"train_loss": -33.45779800415039, "global_step": 58478, "epoch": 483} {"train_loss": -32.674560546875, "global_step": 58479, "epoch": 483} {"train_loss": -33.843772888183594, "global_step": 58480, "epoch": 483} {"train_loss": -33.43181610107422, "global_step": 58481, "epoch": 483} {"train_loss": -33.96955490112305, "global_step": 58482, "epoch": 483} {"train_loss": -33.23871612548828, "global_step": 58483, "epoch": 483} {"train_loss": -33.260684967041016, "global_step": 58484, "epoch": 483} {"train_loss": -34.331356048583984, "global_step": 58485, "epoch": 483} {"train_loss": -34.039215087890625, "global_step": 58486, "epoch": 483} {"train_loss": -34.06672286987305, "global_step": 58487, "epoch": 483} {"train_loss": -33.98130416870117, "global_step": 58488, "epoch": 483} {"train_loss": -33.5589485168457, "global_step": 58489, "epoch": 483} {"train_loss": -34.10211181640625, "global_step": 58490, "epoch": 483} {"train_loss": -34.6492919921875, "global_step": 58491, "epoch": 483} {"train_loss": -33.182403564453125, "global_step": 58492, "epoch": 483} {"train_loss": -33.88603591918945, "global_step": 58493, "epoch": 483} {"train_loss": -34.42158889770508, "global_step": 58494, "epoch": 483} {"train_loss": -34.47500228881836, "global_step": 58495, "epoch": 483} {"train_loss": -34.28127670288086, "global_step": 58496, "epoch": 483} {"train_loss": -35.028621673583984, "global_step": 58497, "epoch": 483} {"train_loss": -34.52498245239258, "global_step": 58498, "epoch": 483} {"train_loss": -34.48012924194336, "global_step": 58499, "epoch": 483} {"train_loss": -34.95444869995117, "global_step": 58500, "epoch": 483} {"train_loss": -34.8228759765625, "global_step": 58501, "epoch": 483} {"train_loss": -35.015987396240234, "global_step": 58502, "epoch": 483} {"train_loss": -35.335174560546875, "global_step": 58503, "epoch": 483} {"train_loss": -35.52130126953125, "global_step": 58504, "epoch": 483} {"train_loss": -34.91904830932617, "global_step": 58505, "epoch": 483} {"train_loss": -34.54376220703125, "global_step": 58506, "epoch": 483} {"train_loss": -35.54941177368164, "global_step": 58507, "epoch": 483} {"train_loss": -34.93570327758789, "global_step": 58508, "epoch": 483} {"train_loss": -35.23173141479492, "global_step": 58509, "epoch": 483} {"train_loss": -35.29302978515625, "global_step": 58510, "epoch": 483} {"train_loss": -35.174354553222656, "global_step": 58511, "epoch": 483} {"train_loss": -35.428375244140625, "global_step": 58512, "epoch": 483} {"train_loss": -35.2105827331543, "global_step": 58513, "epoch": 483} {"train_loss": -35.434696197509766, "global_step": 58514, "epoch": 483} {"train_loss": -35.59579086303711, "global_step": 58515, "epoch": 483} {"train_loss": -36.025360107421875, "global_step": 58516, "epoch": 483} {"train_loss": -35.83079147338867, "global_step": 58517, "epoch": 483} {"train_loss": -35.94529342651367, "global_step": 58518, "epoch": 483} {"train_loss": -35.63176345825195, "global_step": 58519, "epoch": 483} {"train_loss": -35.8141975402832, "global_step": 58520, "epoch": 483} {"train_loss": -35.9901008605957, "global_step": 58521, "epoch": 483} {"train_loss": -35.78396224975586, "global_step": 58522, "epoch": 483} {"train_loss": -35.607357025146484, "global_step": 58523, "epoch": 483} {"train_loss": -35.6273078918457, "global_step": 58524, "epoch": 483} {"train_loss": -36.15825271606445, "global_step": 58525, "epoch": 483} {"train_loss": -36.27814865112305, "global_step": 58526, "epoch": 483} {"train_loss": -36.22391891479492, "global_step": 58527, "epoch": 483} {"train_loss": -35.774024963378906, "global_step": 58528, "epoch": 483} {"train_loss": -34.7300910949707, "global_step": 58529, "epoch": 483} {"train_loss": -34.78792953491211, "global_step": 58530, "epoch": 483} {"train_loss": -34.085479736328125, "global_step": 58531, "epoch": 483} {"train_loss": -34.765316009521484, "global_step": 58532, "epoch": 483} {"train_loss": -35.25338363647461, "global_step": 58533, "epoch": 483} {"train_loss": -35.38243865966797, "global_step": 58534, "epoch": 483} {"train_loss": -36.09859085083008, "global_step": 58535, "epoch": 483} {"train_loss": -35.80182647705078, "global_step": 58536, "epoch": 483} {"train_loss": -36.31413650512695, "global_step": 58537, "epoch": 483} {"train_loss": -36.465171813964844, "global_step": 58538, "epoch": 483} {"train_loss": -36.586669921875, "global_step": 58539, "epoch": 483} {"train_loss": -36.396461486816406, "global_step": 58540, "epoch": 483} {"train_loss": -36.120933532714844, "global_step": 58541, "epoch": 483} {"train_loss": -35.41028594970703, "global_step": 58542, "epoch": 483} {"train_loss": -34.67525863647461, "global_step": 58543, "epoch": 483} {"train_loss": -33.60282897949219, "global_step": 58544, "epoch": 483} {"train_loss": -34.82062911987305, "global_step": 58545, "epoch": 483} {"train_loss": -35.87590408325195, "global_step": 58546, "epoch": 483} {"train_loss": -36.87259292602539, "global_step": 58547, "epoch": 483} {"train_loss": -35.755611419677734, "global_step": 58548, "epoch": 483} {"train_loss": -36.25263595581055, "global_step": 58549, "epoch": 483} {"train_loss": -36.579994201660156, "global_step": 58550, "epoch": 483} {"train_loss": -35.603187561035156, "global_step": 58551, "epoch": 483} {"train_loss": -35.80564880371094, "global_step": 58552, "epoch": 483} {"train_loss": -35.53828811645508, "global_step": 58553, "epoch": 483} {"train_loss": -34.38532638549805, "global_step": 58554, "epoch": 483} {"train_loss": -35.659812927246094, "global_step": 58555, "epoch": 483} {"train_loss": -35.172489166259766, "global_step": 58556, "epoch": 483} {"train_loss": -34.42407989501953, "global_step": 58557, "epoch": 483} {"train_loss": -35.07107162475586, "global_step": 58558, "epoch": 483} {"train_loss": -33.04997634887695, "global_step": 58559, "epoch": 483} {"train_loss": -27.490497589111328, "global_step": 58560, "epoch": 483} {"train_loss": -24.762474060058594, "global_step": 58561, "epoch": 483} {"train_loss": -25.601633071899414, "global_step": 58562, "epoch": 483} {"train_loss": -33.98577729532541, "global_step": 58563, "epoch": 483, "val_loss": 2613207.0} {"train_loss": -31.81158447265625, "global_step": 58564, "epoch": 484} {"train_loss": -32.923927307128906, "global_step": 58565, "epoch": 484} {"train_loss": -32.08766555786133, "global_step": 58566, "epoch": 484} {"train_loss": -33.912445068359375, "global_step": 58567, "epoch": 484} {"train_loss": -32.53013229370117, "global_step": 58568, "epoch": 484} {"train_loss": -34.589656829833984, "global_step": 58569, "epoch": 484} {"train_loss": -34.470245361328125, "global_step": 58570, "epoch": 484} {"train_loss": -34.26162338256836, "global_step": 58571, "epoch": 484} {"train_loss": -34.82509994506836, "global_step": 58572, "epoch": 484} {"train_loss": -29.908056259155273, "global_step": 58573, "epoch": 484} {"train_loss": -33.22494125366211, "global_step": 58574, "epoch": 484} {"train_loss": -33.48293685913086, "global_step": 58575, "epoch": 484} {"train_loss": -34.2876091003418, "global_step": 58576, "epoch": 484} {"train_loss": -33.67017364501953, "global_step": 58577, "epoch": 484} {"train_loss": -34.5521240234375, "global_step": 58578, "epoch": 484} {"train_loss": -34.81655502319336, "global_step": 58579, "epoch": 484} {"train_loss": -34.35203552246094, "global_step": 58580, "epoch": 484} {"train_loss": -34.56635284423828, "global_step": 58581, "epoch": 484} {"train_loss": -34.84119415283203, "global_step": 58582, "epoch": 484} {"train_loss": -34.443050384521484, "global_step": 58583, "epoch": 484} {"train_loss": -35.09235382080078, "global_step": 58584, "epoch": 484} {"train_loss": -34.015586853027344, "global_step": 58585, "epoch": 484} {"train_loss": -34.34123611450195, "global_step": 58586, "epoch": 484} {"train_loss": -34.713165283203125, "global_step": 58587, "epoch": 484} {"train_loss": -35.243473052978516, "global_step": 58588, "epoch": 484} {"train_loss": -34.60880661010742, "global_step": 58589, "epoch": 484} {"train_loss": -34.51752471923828, "global_step": 58590, "epoch": 484} {"train_loss": -34.958526611328125, "global_step": 58591, "epoch": 484} {"train_loss": -35.08592987060547, "global_step": 58592, "epoch": 484} {"train_loss": -34.99351501464844, "global_step": 58593, "epoch": 484} {"train_loss": -35.07960510253906, "global_step": 58594, "epoch": 484} {"train_loss": -35.008827209472656, "global_step": 58595, "epoch": 484} {"train_loss": -34.549739837646484, "global_step": 58596, "epoch": 484} {"train_loss": -34.40826416015625, "global_step": 58597, "epoch": 484} {"train_loss": -35.04121398925781, "global_step": 58598, "epoch": 484} {"train_loss": -34.82726287841797, "global_step": 58599, "epoch": 484} {"train_loss": -35.5493278503418, "global_step": 58600, "epoch": 484} {"train_loss": -35.34540939331055, "global_step": 58601, "epoch": 484} {"train_loss": -35.43412399291992, "global_step": 58602, "epoch": 484} {"train_loss": -35.73637771606445, "global_step": 58603, "epoch": 484} {"train_loss": -35.41273498535156, "global_step": 58604, "epoch": 484} {"train_loss": -35.183380126953125, "global_step": 58605, "epoch": 484} {"train_loss": -34.972408294677734, "global_step": 58606, "epoch": 484} {"train_loss": -35.30325698852539, "global_step": 58607, "epoch": 484} {"train_loss": -35.242897033691406, "global_step": 58608, "epoch": 484} {"train_loss": -35.363311767578125, "global_step": 58609, "epoch": 484} {"train_loss": -36.01984405517578, "global_step": 58610, "epoch": 484} {"train_loss": -35.5665397644043, "global_step": 58611, "epoch": 484} {"train_loss": -35.65327072143555, "global_step": 58612, "epoch": 484} {"train_loss": -35.56005096435547, "global_step": 58613, "epoch": 484} {"train_loss": -35.89788818359375, "global_step": 58614, "epoch": 484} {"train_loss": -35.699066162109375, "global_step": 58615, "epoch": 484} {"train_loss": -35.65501022338867, "global_step": 58616, "epoch": 484} {"train_loss": -36.0943717956543, "global_step": 58617, "epoch": 484} {"train_loss": -35.46684646606445, "global_step": 58618, "epoch": 484} {"train_loss": -36.000911712646484, "global_step": 58619, "epoch": 484} {"train_loss": -35.409420013427734, "global_step": 58620, "epoch": 484} {"train_loss": -35.771785736083984, "global_step": 58621, "epoch": 484} {"train_loss": -35.88283920288086, "global_step": 58622, "epoch": 484} {"train_loss": -36.05286407470703, "global_step": 58623, "epoch": 484} {"train_loss": -35.95656967163086, "global_step": 58624, "epoch": 484} {"train_loss": -35.82601547241211, "global_step": 58625, "epoch": 484} {"train_loss": -35.21242904663086, "global_step": 58626, "epoch": 484} {"train_loss": -36.0742301940918, "global_step": 58627, "epoch": 484} {"train_loss": -36.11299514770508, "global_step": 58628, "epoch": 484} {"train_loss": -34.22357177734375, "global_step": 58629, "epoch": 484} {"train_loss": -32.9368896484375, "global_step": 58630, "epoch": 484} {"train_loss": -32.70463943481445, "global_step": 58631, "epoch": 484} {"train_loss": -35.517059326171875, "global_step": 58632, "epoch": 484} {"train_loss": -33.523311614990234, "global_step": 58633, "epoch": 484} {"train_loss": -34.624210357666016, "global_step": 58634, "epoch": 484} {"train_loss": -35.59940719604492, "global_step": 58635, "epoch": 484} {"train_loss": -34.76656723022461, "global_step": 58636, "epoch": 484} {"train_loss": -35.32098388671875, "global_step": 58637, "epoch": 484} {"train_loss": -35.60154342651367, "global_step": 58638, "epoch": 484} {"train_loss": -35.61182403564453, "global_step": 58639, "epoch": 484} {"train_loss": -35.976318359375, "global_step": 58640, "epoch": 484} {"train_loss": -35.49769973754883, "global_step": 58641, "epoch": 484} {"train_loss": -35.94292449951172, "global_step": 58642, "epoch": 484} {"train_loss": -36.05082702636719, "global_step": 58643, "epoch": 484} {"train_loss": -35.98066329956055, "global_step": 58644, "epoch": 484} {"train_loss": -36.21017074584961, "global_step": 58645, "epoch": 484} {"train_loss": -36.54307174682617, "global_step": 58646, "epoch": 484} {"train_loss": -36.18914794921875, "global_step": 58647, "epoch": 484} {"train_loss": -35.75642776489258, "global_step": 58648, "epoch": 484} {"train_loss": -36.85103225708008, "global_step": 58649, "epoch": 484} {"train_loss": -36.31965255737305, "global_step": 58650, "epoch": 484} {"train_loss": -36.51762771606445, "global_step": 58651, "epoch": 484} {"train_loss": -36.37255859375, "global_step": 58652, "epoch": 484} {"train_loss": -36.5920295715332, "global_step": 58653, "epoch": 484} {"train_loss": -36.87715530395508, "global_step": 58654, "epoch": 484} {"train_loss": -36.5931282043457, "global_step": 58655, "epoch": 484} {"train_loss": -36.685970306396484, "global_step": 58656, "epoch": 484} {"train_loss": -36.6212272644043, "global_step": 58657, "epoch": 484} {"train_loss": -36.53059387207031, "global_step": 58658, "epoch": 484} {"train_loss": -36.47544479370117, "global_step": 58659, "epoch": 484} {"train_loss": -36.67814636230469, "global_step": 58660, "epoch": 484} {"train_loss": -36.8561897277832, "global_step": 58661, "epoch": 484} {"train_loss": -36.443824768066406, "global_step": 58662, "epoch": 484} {"train_loss": -36.47626495361328, "global_step": 58663, "epoch": 484} {"train_loss": -35.57378387451172, "global_step": 58664, "epoch": 484} {"train_loss": -36.82786178588867, "global_step": 58665, "epoch": 484} {"train_loss": -36.372047424316406, "global_step": 58666, "epoch": 484} {"train_loss": -36.55428695678711, "global_step": 58667, "epoch": 484} {"train_loss": -36.58893966674805, "global_step": 58668, "epoch": 484} {"train_loss": -36.49515151977539, "global_step": 58669, "epoch": 484} {"train_loss": -37.04874801635742, "global_step": 58670, "epoch": 484} {"train_loss": -37.19997787475586, "global_step": 58671, "epoch": 484} {"train_loss": -36.4372444152832, "global_step": 58672, "epoch": 484} {"train_loss": -35.68743133544922, "global_step": 58673, "epoch": 484} {"train_loss": -35.20524215698242, "global_step": 58674, "epoch": 484} {"train_loss": -33.27142333984375, "global_step": 58675, "epoch": 484} {"train_loss": -29.454303741455078, "global_step": 58676, "epoch": 484} {"train_loss": -30.927032470703125, "global_step": 58677, "epoch": 484} {"train_loss": -34.371212005615234, "global_step": 58678, "epoch": 484} {"train_loss": -25.2030086517334, "global_step": 58679, "epoch": 484} {"train_loss": -31.990188598632812, "global_step": 58680, "epoch": 484} {"train_loss": -33.92043685913086, "global_step": 58681, "epoch": 484} {"train_loss": -30.525665283203125, "global_step": 58682, "epoch": 484} {"train_loss": -30.129194259643555, "global_step": 58683, "epoch": 484} {"train_loss": -34.9278938514142, "global_step": 58684, "epoch": 484, "val_loss": 2572073.25} {"train_loss": -33.37285614013672, "global_step": 58685, "epoch": 485} {"train_loss": -24.89374542236328, "global_step": 58686, "epoch": 485} {"train_loss": -35.029998779296875, "global_step": 58687, "epoch": 485} {"train_loss": -29.1385555267334, "global_step": 58688, "epoch": 485} {"train_loss": -29.397241592407227, "global_step": 58689, "epoch": 485} {"train_loss": -34.414276123046875, "global_step": 58690, "epoch": 485} {"train_loss": -31.918928146362305, "global_step": 58691, "epoch": 485} {"train_loss": -35.15632629394531, "global_step": 58692, "epoch": 485} {"train_loss": -32.284603118896484, "global_step": 58693, "epoch": 485} {"train_loss": -34.88491439819336, "global_step": 58694, "epoch": 485} {"train_loss": -33.76835632324219, "global_step": 58695, "epoch": 485} {"train_loss": -34.60405349731445, "global_step": 58696, "epoch": 485} {"train_loss": -34.474037170410156, "global_step": 58697, "epoch": 485} {"train_loss": -33.93971633911133, "global_step": 58698, "epoch": 485} {"train_loss": -35.191619873046875, "global_step": 58699, "epoch": 485} {"train_loss": -34.37205123901367, "global_step": 58700, "epoch": 485} {"train_loss": -35.37672805786133, "global_step": 58701, "epoch": 485} {"train_loss": -35.10677719116211, "global_step": 58702, "epoch": 485} {"train_loss": -34.518436431884766, "global_step": 58703, "epoch": 485} {"train_loss": -35.123863220214844, "global_step": 58704, "epoch": 485} {"train_loss": -34.97629928588867, "global_step": 58705, "epoch": 485} {"train_loss": -35.52755355834961, "global_step": 58706, "epoch": 485} {"train_loss": -35.42068099975586, "global_step": 58707, "epoch": 485} {"train_loss": -35.23075485229492, "global_step": 58708, "epoch": 485} {"train_loss": -36.030853271484375, "global_step": 58709, "epoch": 485} {"train_loss": -35.402652740478516, "global_step": 58710, "epoch": 485} {"train_loss": -35.169158935546875, "global_step": 58711, "epoch": 485} {"train_loss": -36.07682418823242, "global_step": 58712, "epoch": 485} {"train_loss": -35.74442672729492, "global_step": 58713, "epoch": 485} {"train_loss": -35.95388412475586, "global_step": 58714, "epoch": 485} {"train_loss": -35.739295959472656, "global_step": 58715, "epoch": 485} {"train_loss": -35.505340576171875, "global_step": 58716, "epoch": 485} {"train_loss": -35.870704650878906, "global_step": 58717, "epoch": 485} {"train_loss": -35.93915557861328, "global_step": 58718, "epoch": 485} {"train_loss": -35.803741455078125, "global_step": 58719, "epoch": 485} {"train_loss": -35.8922233581543, "global_step": 58720, "epoch": 485} {"train_loss": -36.131988525390625, "global_step": 58721, "epoch": 485} {"train_loss": -36.10270690917969, "global_step": 58722, "epoch": 485} {"train_loss": -36.39524459838867, "global_step": 58723, "epoch": 485} {"train_loss": -36.339839935302734, "global_step": 58724, "epoch": 485} {"train_loss": -36.4116096496582, "global_step": 58725, "epoch": 485} {"train_loss": -36.35304641723633, "global_step": 58726, "epoch": 485} {"train_loss": -36.58740234375, "global_step": 58727, "epoch": 485} {"train_loss": -36.16709518432617, "global_step": 58728, "epoch": 485} {"train_loss": -36.58692932128906, "global_step": 58729, "epoch": 485} {"train_loss": -36.042938232421875, "global_step": 58730, "epoch": 485} {"train_loss": -36.19670104980469, "global_step": 58731, "epoch": 485} {"train_loss": -36.383304595947266, "global_step": 58732, "epoch": 485} {"train_loss": -36.714534759521484, "global_step": 58733, "epoch": 485} {"train_loss": -36.856849670410156, "global_step": 58734, "epoch": 485} {"train_loss": -36.59575653076172, "global_step": 58735, "epoch": 485} {"train_loss": -36.37784194946289, "global_step": 58736, "epoch": 485} {"train_loss": -36.51295852661133, "global_step": 58737, "epoch": 485} {"train_loss": -36.80434036254883, "global_step": 58738, "epoch": 485} {"train_loss": -36.8912239074707, "global_step": 58739, "epoch": 485} {"train_loss": -36.65769577026367, "global_step": 58740, "epoch": 485} {"train_loss": -36.65665817260742, "global_step": 58741, "epoch": 485} {"train_loss": -36.888179779052734, "global_step": 58742, "epoch": 485} {"train_loss": -37.34098434448242, "global_step": 58743, "epoch": 485} {"train_loss": -36.156368255615234, "global_step": 58744, "epoch": 485} {"train_loss": -36.55158996582031, "global_step": 58745, "epoch": 485} {"train_loss": -36.92739486694336, "global_step": 58746, "epoch": 485} {"train_loss": -36.73957061767578, "global_step": 58747, "epoch": 485} {"train_loss": -36.65546417236328, "global_step": 58748, "epoch": 485} {"train_loss": -36.51604080200195, "global_step": 58749, "epoch": 485} {"train_loss": -37.37434005737305, "global_step": 58750, "epoch": 485} {"train_loss": -37.26640701293945, "global_step": 58751, "epoch": 485} {"train_loss": -36.80217742919922, "global_step": 58752, "epoch": 485} {"train_loss": -36.94266891479492, "global_step": 58753, "epoch": 485} {"train_loss": -37.37843704223633, "global_step": 58754, "epoch": 485} {"train_loss": -36.29050064086914, "global_step": 58755, "epoch": 485} {"train_loss": -36.50146484375, "global_step": 58756, "epoch": 485} {"train_loss": -36.58973693847656, "global_step": 58757, "epoch": 485} {"train_loss": -36.9614372253418, "global_step": 58758, "epoch": 485} {"train_loss": -36.05115509033203, "global_step": 58759, "epoch": 485} {"train_loss": -35.14255905151367, "global_step": 58760, "epoch": 485} {"train_loss": -36.55139923095703, "global_step": 58761, "epoch": 485} {"train_loss": -37.08713150024414, "global_step": 58762, "epoch": 485} {"train_loss": -35.88199996948242, "global_step": 58763, "epoch": 485} {"train_loss": -36.207611083984375, "global_step": 58764, "epoch": 485} {"train_loss": -36.951656341552734, "global_step": 58765, "epoch": 485} {"train_loss": -35.91848373413086, "global_step": 58766, "epoch": 485} {"train_loss": -35.25617980957031, "global_step": 58767, "epoch": 485} {"train_loss": -35.376338958740234, "global_step": 58768, "epoch": 485} {"train_loss": -34.263126373291016, "global_step": 58769, "epoch": 485} {"train_loss": -35.12361145019531, "global_step": 58770, "epoch": 485} {"train_loss": -33.89619445800781, "global_step": 58771, "epoch": 485} {"train_loss": -35.723663330078125, "global_step": 58772, "epoch": 485} {"train_loss": -33.72817611694336, "global_step": 58773, "epoch": 485} {"train_loss": -34.47376251220703, "global_step": 58774, "epoch": 485} {"train_loss": -33.73396682739258, "global_step": 58775, "epoch": 485} {"train_loss": -33.53071212768555, "global_step": 58776, "epoch": 485} {"train_loss": -34.62040328979492, "global_step": 58777, "epoch": 485} {"train_loss": -34.780879974365234, "global_step": 58778, "epoch": 485} {"train_loss": -31.623703002929688, "global_step": 58779, "epoch": 485} {"train_loss": -33.70615768432617, "global_step": 58780, "epoch": 485} {"train_loss": -29.413986206054688, "global_step": 58781, "epoch": 485} {"train_loss": -32.8505859375, "global_step": 58782, "epoch": 485} {"train_loss": -36.08404541015625, "global_step": 58783, "epoch": 485} {"train_loss": -33.706790924072266, "global_step": 58784, "epoch": 485} {"train_loss": -35.152488708496094, "global_step": 58785, "epoch": 485} {"train_loss": -35.66753005981445, "global_step": 58786, "epoch": 485} {"train_loss": -35.6143913269043, "global_step": 58787, "epoch": 485} {"train_loss": -35.58266830444336, "global_step": 58788, "epoch": 485} {"train_loss": -36.23043441772461, "global_step": 58789, "epoch": 485} {"train_loss": -35.5302734375, "global_step": 58790, "epoch": 485} {"train_loss": -35.95289611816406, "global_step": 58791, "epoch": 485} {"train_loss": -35.351558685302734, "global_step": 58792, "epoch": 485} {"train_loss": -36.26691818237305, "global_step": 58793, "epoch": 485} {"train_loss": -35.7912712097168, "global_step": 58794, "epoch": 485} {"train_loss": -35.787174224853516, "global_step": 58795, "epoch": 485} {"train_loss": -36.54098892211914, "global_step": 58796, "epoch": 485} {"train_loss": -36.285518646240234, "global_step": 58797, "epoch": 485} {"train_loss": -36.2891845703125, "global_step": 58798, "epoch": 485} {"train_loss": -36.09836196899414, "global_step": 58799, "epoch": 485} {"train_loss": -36.41495895385742, "global_step": 58800, "epoch": 485} {"train_loss": -36.17194747924805, "global_step": 58801, "epoch": 485} {"train_loss": -36.399166107177734, "global_step": 58802, "epoch": 485} {"train_loss": -36.3585319519043, "global_step": 58803, "epoch": 485} {"train_loss": -36.711238861083984, "global_step": 58804, "epoch": 485} {"train_loss": -35.43139845477648, "global_step": 58805, "epoch": 485, "val_loss": 2605236.75} {"train_loss": -36.80662155151367, "global_step": 58806, "epoch": 486} {"train_loss": -36.69730758666992, "global_step": 58807, "epoch": 486} {"train_loss": -36.547386169433594, "global_step": 58808, "epoch": 486} {"train_loss": -36.56085968017578, "global_step": 58809, "epoch": 486} {"train_loss": -36.56294631958008, "global_step": 58810, "epoch": 486} {"train_loss": -36.756378173828125, "global_step": 58811, "epoch": 486} {"train_loss": -36.97783279418945, "global_step": 58812, "epoch": 486} {"train_loss": -36.78522872924805, "global_step": 58813, "epoch": 486} {"train_loss": -36.2738037109375, "global_step": 58814, "epoch": 486} {"train_loss": -35.94004821777344, "global_step": 58815, "epoch": 486} {"train_loss": -36.68265151977539, "global_step": 58816, "epoch": 486} {"train_loss": -36.39476013183594, "global_step": 58817, "epoch": 486} {"train_loss": -36.64642333984375, "global_step": 58818, "epoch": 486} {"train_loss": -35.726619720458984, "global_step": 58819, "epoch": 486} {"train_loss": -33.362525939941406, "global_step": 58820, "epoch": 486} {"train_loss": -30.1352596282959, "global_step": 58821, "epoch": 486} {"train_loss": -23.7501277923584, "global_step": 58822, "epoch": 486} {"train_loss": -25.087326049804688, "global_step": 58823, "epoch": 486} {"train_loss": -33.20677185058594, "global_step": 58824, "epoch": 486} {"train_loss": -36.16750717163086, "global_step": 58825, "epoch": 486} {"train_loss": -32.230995178222656, "global_step": 58826, "epoch": 486} {"train_loss": -35.80916976928711, "global_step": 58827, "epoch": 486} {"train_loss": -34.56565475463867, "global_step": 58828, "epoch": 486} {"train_loss": -35.425270080566406, "global_step": 58829, "epoch": 486} {"train_loss": -34.81898880004883, "global_step": 58830, "epoch": 486} {"train_loss": -36.07319259643555, "global_step": 58831, "epoch": 486} {"train_loss": -35.84357452392578, "global_step": 58832, "epoch": 486} {"train_loss": -35.40957260131836, "global_step": 58833, "epoch": 486} {"train_loss": -35.60207748413086, "global_step": 58834, "epoch": 486} {"train_loss": -35.42534255981445, "global_step": 58835, "epoch": 486} {"train_loss": -33.82404327392578, "global_step": 58836, "epoch": 486} {"train_loss": -35.94737243652344, "global_step": 58837, "epoch": 486} {"train_loss": -35.271602630615234, "global_step": 58838, "epoch": 486} {"train_loss": -34.11715316772461, "global_step": 58839, "epoch": 486} {"train_loss": -35.33362579345703, "global_step": 58840, "epoch": 486} {"train_loss": -34.53889083862305, "global_step": 58841, "epoch": 486} {"train_loss": -36.543888092041016, "global_step": 58842, "epoch": 486} {"train_loss": -35.777015686035156, "global_step": 58843, "epoch": 486} {"train_loss": -35.06827926635742, "global_step": 58844, "epoch": 486} {"train_loss": -35.67416000366211, "global_step": 58845, "epoch": 486} {"train_loss": -35.579463958740234, "global_step": 58846, "epoch": 486} {"train_loss": -26.2406005859375, "global_step": 58847, "epoch": 486} {"train_loss": -33.58964157104492, "global_step": 58848, "epoch": 486} {"train_loss": -34.19495391845703, "global_step": 58849, "epoch": 486} {"train_loss": -33.73042678833008, "global_step": 58850, "epoch": 486} {"train_loss": -32.19819259643555, "global_step": 58851, "epoch": 486} {"train_loss": -35.23540115356445, "global_step": 58852, "epoch": 486} {"train_loss": -33.802913665771484, "global_step": 58853, "epoch": 486} {"train_loss": -35.22277069091797, "global_step": 58854, "epoch": 486} {"train_loss": -33.75161361694336, "global_step": 58855, "epoch": 486} {"train_loss": -34.248661041259766, "global_step": 58856, "epoch": 486} {"train_loss": -34.350624084472656, "global_step": 58857, "epoch": 486} {"train_loss": -34.10857391357422, "global_step": 58858, "epoch": 486} {"train_loss": -35.35271072387695, "global_step": 58859, "epoch": 486} {"train_loss": -33.85652542114258, "global_step": 58860, "epoch": 486} {"train_loss": -34.661285400390625, "global_step": 58861, "epoch": 486} {"train_loss": -34.975582122802734, "global_step": 58862, "epoch": 486} {"train_loss": -34.4031982421875, "global_step": 58863, "epoch": 486} {"train_loss": -35.41420364379883, "global_step": 58864, "epoch": 486} {"train_loss": -35.271854400634766, "global_step": 58865, "epoch": 486} {"train_loss": -34.944644927978516, "global_step": 58866, "epoch": 486} {"train_loss": -34.95530319213867, "global_step": 58867, "epoch": 486} {"train_loss": -34.294551849365234, "global_step": 58868, "epoch": 486} {"train_loss": -35.621578216552734, "global_step": 58869, "epoch": 486} {"train_loss": -35.31611633300781, "global_step": 58870, "epoch": 486} {"train_loss": -35.111019134521484, "global_step": 58871, "epoch": 486} {"train_loss": -35.167518615722656, "global_step": 58872, "epoch": 486} {"train_loss": -35.1824836730957, "global_step": 58873, "epoch": 486} {"train_loss": -35.46802520751953, "global_step": 58874, "epoch": 486} {"train_loss": -35.8228759765625, "global_step": 58875, "epoch": 486} {"train_loss": -35.81105422973633, "global_step": 58876, "epoch": 486} {"train_loss": -35.57074737548828, "global_step": 58877, "epoch": 486} {"train_loss": -35.91975402832031, "global_step": 58878, "epoch": 486} {"train_loss": -35.941890716552734, "global_step": 58879, "epoch": 486} {"train_loss": -35.93241500854492, "global_step": 58880, "epoch": 486} {"train_loss": -36.260921478271484, "global_step": 58881, "epoch": 486} {"train_loss": -36.03272247314453, "global_step": 58882, "epoch": 486} {"train_loss": -36.01290512084961, "global_step": 58883, "epoch": 486} {"train_loss": -36.32902908325195, "global_step": 58884, "epoch": 486} {"train_loss": -35.83153533935547, "global_step": 58885, "epoch": 486} {"train_loss": -35.73441696166992, "global_step": 58886, "epoch": 486} {"train_loss": -36.15302658081055, "global_step": 58887, "epoch": 486} {"train_loss": -36.387298583984375, "global_step": 58888, "epoch": 486} {"train_loss": -36.19668197631836, "global_step": 58889, "epoch": 486} {"train_loss": -36.70692825317383, "global_step": 58890, "epoch": 486} {"train_loss": -36.471771240234375, "global_step": 58891, "epoch": 486} {"train_loss": -36.367794036865234, "global_step": 58892, "epoch": 486} {"train_loss": -36.269771575927734, "global_step": 58893, "epoch": 486} {"train_loss": -36.264705657958984, "global_step": 58894, "epoch": 486} {"train_loss": -36.19277572631836, "global_step": 58895, "epoch": 486} {"train_loss": -36.492977142333984, "global_step": 58896, "epoch": 486} {"train_loss": -36.0495719909668, "global_step": 58897, "epoch": 486} {"train_loss": -36.613704681396484, "global_step": 58898, "epoch": 486} {"train_loss": -36.839046478271484, "global_step": 58899, "epoch": 486} {"train_loss": -36.358577728271484, "global_step": 58900, "epoch": 486} {"train_loss": -36.62117385864258, "global_step": 58901, "epoch": 486} {"train_loss": -36.48272705078125, "global_step": 58902, "epoch": 486} {"train_loss": -36.64837646484375, "global_step": 58903, "epoch": 486} {"train_loss": -36.53022384643555, "global_step": 58904, "epoch": 486} {"train_loss": -36.2802734375, "global_step": 58905, "epoch": 486} {"train_loss": -36.75751876831055, "global_step": 58906, "epoch": 486} {"train_loss": -36.73530960083008, "global_step": 58907, "epoch": 486} {"train_loss": -36.70579147338867, "global_step": 58908, "epoch": 486} {"train_loss": -36.99526596069336, "global_step": 58909, "epoch": 486} {"train_loss": -35.587642669677734, "global_step": 58910, "epoch": 486} {"train_loss": -35.808990478515625, "global_step": 58911, "epoch": 486} {"train_loss": -36.33037185668945, "global_step": 58912, "epoch": 486} {"train_loss": -34.44562530517578, "global_step": 58913, "epoch": 486} {"train_loss": -31.58379554748535, "global_step": 58914, "epoch": 486} {"train_loss": -31.382797241210938, "global_step": 58915, "epoch": 486} {"train_loss": -33.76336669921875, "global_step": 58916, "epoch": 486} {"train_loss": -36.73115539550781, "global_step": 58917, "epoch": 486} {"train_loss": -35.6923713684082, "global_step": 58918, "epoch": 486} {"train_loss": -32.940128326416016, "global_step": 58919, "epoch": 486} {"train_loss": -27.55759620666504, "global_step": 58920, "epoch": 486} {"train_loss": -15.82299518585205, "global_step": 58921, "epoch": 486} {"train_loss": -17.390249252319336, "global_step": 58922, "epoch": 486} {"train_loss": -20.109928131103516, "global_step": 58923, "epoch": 486} {"train_loss": -34.815040588378906, "global_step": 58924, "epoch": 486} {"train_loss": -24.730113983154297, "global_step": 58925, "epoch": 486} {"train_loss": -34.5089157908416, "global_step": 58926, "epoch": 486, "val_loss": 2312798.0} {"train_loss": -32.30308151245117, "global_step": 58927, "epoch": 487} {"train_loss": -30.43857765197754, "global_step": 58928, "epoch": 487} {"train_loss": -32.92104721069336, "global_step": 58929, "epoch": 487} {"train_loss": -33.539833068847656, "global_step": 58930, "epoch": 487} {"train_loss": -32.012752532958984, "global_step": 58931, "epoch": 487} {"train_loss": -34.7171745300293, "global_step": 58932, "epoch": 487} {"train_loss": -33.23103713989258, "global_step": 58933, "epoch": 487} {"train_loss": -34.35263442993164, "global_step": 58934, "epoch": 487} {"train_loss": -34.22323226928711, "global_step": 58935, "epoch": 487} {"train_loss": -34.30826950073242, "global_step": 58936, "epoch": 487} {"train_loss": -34.6085205078125, "global_step": 58937, "epoch": 487} {"train_loss": -34.81742477416992, "global_step": 58938, "epoch": 487} {"train_loss": -34.269405364990234, "global_step": 58939, "epoch": 487} {"train_loss": -35.08567428588867, "global_step": 58940, "epoch": 487} {"train_loss": -34.89752960205078, "global_step": 58941, "epoch": 487} {"train_loss": -35.11465072631836, "global_step": 58942, "epoch": 487} {"train_loss": -35.25727462768555, "global_step": 58943, "epoch": 487} {"train_loss": -34.9266357421875, "global_step": 58944, "epoch": 487} {"train_loss": -35.3747673034668, "global_step": 58945, "epoch": 487} {"train_loss": -35.23421859741211, "global_step": 58946, "epoch": 487} {"train_loss": -35.0015754699707, "global_step": 58947, "epoch": 487} {"train_loss": -35.50293731689453, "global_step": 58948, "epoch": 487} {"train_loss": -35.727569580078125, "global_step": 58949, "epoch": 487} {"train_loss": -35.26581954956055, "global_step": 58950, "epoch": 487} {"train_loss": -35.89777755737305, "global_step": 58951, "epoch": 487} {"train_loss": -35.89974594116211, "global_step": 58952, "epoch": 487} {"train_loss": -35.83899688720703, "global_step": 58953, "epoch": 487} {"train_loss": -35.8608512878418, "global_step": 58954, "epoch": 487} {"train_loss": -35.60183334350586, "global_step": 58955, "epoch": 487} {"train_loss": -35.64484786987305, "global_step": 58956, "epoch": 487} {"train_loss": -35.60225296020508, "global_step": 58957, "epoch": 487} {"train_loss": -35.97499465942383, "global_step": 58958, "epoch": 487} {"train_loss": -36.00459289550781, "global_step": 58959, "epoch": 487} {"train_loss": -35.959991455078125, "global_step": 58960, "epoch": 487} {"train_loss": -36.357749938964844, "global_step": 58961, "epoch": 487} {"train_loss": -35.7906379699707, "global_step": 58962, "epoch": 487} {"train_loss": -35.90946960449219, "global_step": 58963, "epoch": 487} {"train_loss": -36.35642623901367, "global_step": 58964, "epoch": 487} {"train_loss": -36.08608627319336, "global_step": 58965, "epoch": 487} {"train_loss": -36.0057487487793, "global_step": 58966, "epoch": 487} {"train_loss": -36.26142501831055, "global_step": 58967, "epoch": 487} {"train_loss": -36.1099853515625, "global_step": 58968, "epoch": 487} {"train_loss": -36.75423049926758, "global_step": 58969, "epoch": 487} {"train_loss": -36.220848083496094, "global_step": 58970, "epoch": 487} {"train_loss": -36.749446868896484, "global_step": 58971, "epoch": 487} {"train_loss": -36.5842399597168, "global_step": 58972, "epoch": 487} {"train_loss": -36.0475959777832, "global_step": 58973, "epoch": 487} {"train_loss": -36.712799072265625, "global_step": 58974, "epoch": 487} {"train_loss": -36.933258056640625, "global_step": 58975, "epoch": 487} {"train_loss": -36.567378997802734, "global_step": 58976, "epoch": 487} {"train_loss": -36.670772552490234, "global_step": 58977, "epoch": 487} {"train_loss": -36.7194709777832, "global_step": 58978, "epoch": 487} {"train_loss": -36.90291976928711, "global_step": 58979, "epoch": 487} {"train_loss": -36.622920989990234, "global_step": 58980, "epoch": 487} {"train_loss": -36.90159225463867, "global_step": 58981, "epoch": 487} {"train_loss": -36.025047302246094, "global_step": 58982, "epoch": 487} {"train_loss": -36.940242767333984, "global_step": 58983, "epoch": 487} {"train_loss": -37.16106033325195, "global_step": 58984, "epoch": 487} {"train_loss": -36.82147979736328, "global_step": 58985, "epoch": 487} {"train_loss": -36.818965911865234, "global_step": 58986, "epoch": 487} {"train_loss": -36.78882598876953, "global_step": 58987, "epoch": 487} {"train_loss": -36.5549201965332, "global_step": 58988, "epoch": 487} {"train_loss": -36.71350860595703, "global_step": 58989, "epoch": 487} {"train_loss": -36.63787841796875, "global_step": 58990, "epoch": 487} {"train_loss": -36.6958122253418, "global_step": 58991, "epoch": 487} {"train_loss": -36.07124710083008, "global_step": 58992, "epoch": 487} {"train_loss": -36.477901458740234, "global_step": 58993, "epoch": 487} {"train_loss": -36.12179183959961, "global_step": 58994, "epoch": 487} {"train_loss": -35.74403762817383, "global_step": 58995, "epoch": 487} {"train_loss": -32.84382247924805, "global_step": 58996, "epoch": 487} {"train_loss": -32.94886016845703, "global_step": 58997, "epoch": 487} {"train_loss": -34.8232536315918, "global_step": 58998, "epoch": 487} {"train_loss": -35.395957946777344, "global_step": 58999, "epoch": 487} {"train_loss": -32.82196044921875, "global_step": 59000, "epoch": 487} {"train_loss": -34.04261016845703, "global_step": 59001, "epoch": 487} {"train_loss": -35.11562728881836, "global_step": 59002, "epoch": 487} {"train_loss": -34.087562561035156, "global_step": 59003, "epoch": 487} {"train_loss": -32.96165084838867, "global_step": 59004, "epoch": 487} {"train_loss": -34.180137634277344, "global_step": 59005, "epoch": 487} {"train_loss": -32.252227783203125, "global_step": 59006, "epoch": 487} {"train_loss": -34.41944122314453, "global_step": 59007, "epoch": 487} {"train_loss": -34.27383804321289, "global_step": 59008, "epoch": 487} {"train_loss": -33.85893630981445, "global_step": 59009, "epoch": 487} {"train_loss": -34.51308822631836, "global_step": 59010, "epoch": 487} {"train_loss": -33.67981719970703, "global_step": 59011, "epoch": 487} {"train_loss": -34.67753982543945, "global_step": 59012, "epoch": 487} {"train_loss": -35.31838607788086, "global_step": 59013, "epoch": 487} {"train_loss": -32.863582611083984, "global_step": 59014, "epoch": 487} {"train_loss": -32.889888763427734, "global_step": 59015, "epoch": 487} {"train_loss": -35.11906433105469, "global_step": 59016, "epoch": 487} {"train_loss": -32.81818389892578, "global_step": 59017, "epoch": 487} {"train_loss": -33.984798431396484, "global_step": 59018, "epoch": 487} {"train_loss": -35.13618087768555, "global_step": 59019, "epoch": 487} {"train_loss": -34.80134201049805, "global_step": 59020, "epoch": 487} {"train_loss": -34.71113204956055, "global_step": 59021, "epoch": 487} {"train_loss": -35.33266830444336, "global_step": 59022, "epoch": 487} {"train_loss": -35.340267181396484, "global_step": 59023, "epoch": 487} {"train_loss": -35.53999710083008, "global_step": 59024, "epoch": 487} {"train_loss": -35.410552978515625, "global_step": 59025, "epoch": 487} {"train_loss": -35.464088439941406, "global_step": 59026, "epoch": 487} {"train_loss": -34.54851150512695, "global_step": 59027, "epoch": 487} {"train_loss": -35.25997543334961, "global_step": 59028, "epoch": 487} {"train_loss": -35.47259521484375, "global_step": 59029, "epoch": 487} {"train_loss": -35.840694427490234, "global_step": 59030, "epoch": 487} {"train_loss": -35.70235061645508, "global_step": 59031, "epoch": 487} {"train_loss": -35.404258728027344, "global_step": 59032, "epoch": 487} {"train_loss": -35.696815490722656, "global_step": 59033, "epoch": 487} {"train_loss": -36.17300033569336, "global_step": 59034, "epoch": 487} {"train_loss": -35.5395622253418, "global_step": 59035, "epoch": 487} {"train_loss": -35.9605598449707, "global_step": 59036, "epoch": 487} {"train_loss": -36.494049072265625, "global_step": 59037, "epoch": 487} {"train_loss": -36.23920440673828, "global_step": 59038, "epoch": 487} {"train_loss": -36.583858489990234, "global_step": 59039, "epoch": 487} {"train_loss": -35.78868103027344, "global_step": 59040, "epoch": 487} {"train_loss": -36.13874435424805, "global_step": 59041, "epoch": 487} {"train_loss": -36.245330810546875, "global_step": 59042, "epoch": 487} {"train_loss": -36.475467681884766, "global_step": 59043, "epoch": 487} {"train_loss": -36.11349868774414, "global_step": 59044, "epoch": 487} {"train_loss": -36.566471099853516, "global_step": 59045, "epoch": 487} {"train_loss": -36.11355209350586, "global_step": 59046, "epoch": 487} {"train_loss": -35.32675604386763, "global_step": 59047, "epoch": 487, "val_loss": 2462358.0} {"train_loss": -36.76677322387695, "global_step": 59048, "epoch": 488} {"train_loss": -36.474159240722656, "global_step": 59049, "epoch": 488} {"train_loss": -36.3967399597168, "global_step": 59050, "epoch": 488} {"train_loss": -36.667198181152344, "global_step": 59051, "epoch": 488} {"train_loss": -36.59638214111328, "global_step": 59052, "epoch": 488} {"train_loss": -36.215335845947266, "global_step": 59053, "epoch": 488} {"train_loss": -36.2819938659668, "global_step": 59054, "epoch": 488} {"train_loss": -35.806495666503906, "global_step": 59055, "epoch": 488} {"train_loss": -35.46157455444336, "global_step": 59056, "epoch": 488} {"train_loss": -35.4395866394043, "global_step": 59057, "epoch": 488} {"train_loss": -36.39575958251953, "global_step": 59058, "epoch": 488} {"train_loss": -36.64799118041992, "global_step": 59059, "epoch": 488} {"train_loss": -37.1074104309082, "global_step": 59060, "epoch": 488} {"train_loss": -36.38767623901367, "global_step": 59061, "epoch": 488} {"train_loss": -35.01719284057617, "global_step": 59062, "epoch": 488} {"train_loss": -35.356231689453125, "global_step": 59063, "epoch": 488} {"train_loss": -36.676692962646484, "global_step": 59064, "epoch": 488} {"train_loss": -36.852455139160156, "global_step": 59065, "epoch": 488} {"train_loss": -36.00086975097656, "global_step": 59066, "epoch": 488} {"train_loss": -35.858375549316406, "global_step": 59067, "epoch": 488} {"train_loss": -36.389404296875, "global_step": 59068, "epoch": 488} {"train_loss": -36.361202239990234, "global_step": 59069, "epoch": 488} {"train_loss": -36.54957580566406, "global_step": 59070, "epoch": 488} {"train_loss": -35.5517692565918, "global_step": 59071, "epoch": 488} {"train_loss": -35.78512191772461, "global_step": 59072, "epoch": 488} {"train_loss": -35.855308532714844, "global_step": 59073, "epoch": 488} {"train_loss": -37.21419906616211, "global_step": 59074, "epoch": 488} {"train_loss": -35.83744812011719, "global_step": 59075, "epoch": 488} {"train_loss": -36.3919563293457, "global_step": 59076, "epoch": 488} {"train_loss": -36.26043701171875, "global_step": 59077, "epoch": 488} {"train_loss": -36.76921463012695, "global_step": 59078, "epoch": 488} {"train_loss": -36.3422737121582, "global_step": 59079, "epoch": 488} {"train_loss": -36.26495361328125, "global_step": 59080, "epoch": 488} {"train_loss": -36.5178337097168, "global_step": 59081, "epoch": 488} {"train_loss": -36.387935638427734, "global_step": 59082, "epoch": 488} {"train_loss": -37.1180305480957, "global_step": 59083, "epoch": 488} {"train_loss": -36.33108139038086, "global_step": 59084, "epoch": 488} {"train_loss": -36.71613693237305, "global_step": 59085, "epoch": 488} {"train_loss": -36.44255828857422, "global_step": 59086, "epoch": 488} {"train_loss": -36.201297760009766, "global_step": 59087, "epoch": 488} {"train_loss": -37.040157318115234, "global_step": 59088, "epoch": 488} {"train_loss": -37.061988830566406, "global_step": 59089, "epoch": 488} {"train_loss": -36.558013916015625, "global_step": 59090, "epoch": 488} {"train_loss": -36.6118278503418, "global_step": 59091, "epoch": 488} {"train_loss": -36.33727264404297, "global_step": 59092, "epoch": 488} {"train_loss": -36.66141891479492, "global_step": 59093, "epoch": 488} {"train_loss": -36.93191909790039, "global_step": 59094, "epoch": 488} {"train_loss": -35.96467208862305, "global_step": 59095, "epoch": 488} {"train_loss": -36.70144271850586, "global_step": 59096, "epoch": 488} {"train_loss": -35.96696853637695, "global_step": 59097, "epoch": 488} {"train_loss": -35.43624496459961, "global_step": 59098, "epoch": 488} {"train_loss": -36.21921920776367, "global_step": 59099, "epoch": 488} {"train_loss": -36.15843963623047, "global_step": 59100, "epoch": 488} {"train_loss": -36.853485107421875, "global_step": 59101, "epoch": 488} {"train_loss": -36.03110885620117, "global_step": 59102, "epoch": 488} {"train_loss": -35.694679260253906, "global_step": 59103, "epoch": 488} {"train_loss": -35.93450927734375, "global_step": 59104, "epoch": 488} {"train_loss": -35.812660217285156, "global_step": 59105, "epoch": 488} {"train_loss": -35.252113342285156, "global_step": 59106, "epoch": 488} {"train_loss": -36.343536376953125, "global_step": 59107, "epoch": 488} {"train_loss": -35.29199981689453, "global_step": 59108, "epoch": 488} {"train_loss": -36.31108093261719, "global_step": 59109, "epoch": 488} {"train_loss": -34.90238571166992, "global_step": 59110, "epoch": 488} {"train_loss": -35.698028564453125, "global_step": 59111, "epoch": 488} {"train_loss": -36.52588653564453, "global_step": 59112, "epoch": 488} {"train_loss": -36.501033782958984, "global_step": 59113, "epoch": 488} {"train_loss": -36.18903732299805, "global_step": 59114, "epoch": 488} {"train_loss": -36.28757858276367, "global_step": 59115, "epoch": 488} {"train_loss": -36.45152282714844, "global_step": 59116, "epoch": 488} {"train_loss": -36.57719802856445, "global_step": 59117, "epoch": 488} {"train_loss": -36.740455627441406, "global_step": 59118, "epoch": 488} {"train_loss": -36.602203369140625, "global_step": 59119, "epoch": 488} {"train_loss": -36.97378158569336, "global_step": 59120, "epoch": 488} {"train_loss": -37.45540237426758, "global_step": 59121, "epoch": 488} {"train_loss": -36.80042266845703, "global_step": 59122, "epoch": 488} {"train_loss": -37.04775619506836, "global_step": 59123, "epoch": 488} {"train_loss": -36.76686096191406, "global_step": 59124, "epoch": 488} {"train_loss": -36.6119270324707, "global_step": 59125, "epoch": 488} {"train_loss": -36.102455139160156, "global_step": 59126, "epoch": 488} {"train_loss": -35.8603630065918, "global_step": 59127, "epoch": 488} {"train_loss": -35.6220703125, "global_step": 59128, "epoch": 488} {"train_loss": -34.74269485473633, "global_step": 59129, "epoch": 488} {"train_loss": -33.47666549682617, "global_step": 59130, "epoch": 488} {"train_loss": -31.218463897705078, "global_step": 59131, "epoch": 488} {"train_loss": -36.450992584228516, "global_step": 59132, "epoch": 488} {"train_loss": -35.954891204833984, "global_step": 59133, "epoch": 488} {"train_loss": -33.31905746459961, "global_step": 59134, "epoch": 488} {"train_loss": -33.93944549560547, "global_step": 59135, "epoch": 488} {"train_loss": -36.60554122924805, "global_step": 59136, "epoch": 488} {"train_loss": -36.25994873046875, "global_step": 59137, "epoch": 488} {"train_loss": -34.66883850097656, "global_step": 59138, "epoch": 488} {"train_loss": -36.13014221191406, "global_step": 59139, "epoch": 488} {"train_loss": -36.589664459228516, "global_step": 59140, "epoch": 488} {"train_loss": -35.08485794067383, "global_step": 59141, "epoch": 488} {"train_loss": -36.34820556640625, "global_step": 59142, "epoch": 488} {"train_loss": -36.05371856689453, "global_step": 59143, "epoch": 488} {"train_loss": -36.38372802734375, "global_step": 59144, "epoch": 488} {"train_loss": -36.94927215576172, "global_step": 59145, "epoch": 488} {"train_loss": -36.12773513793945, "global_step": 59146, "epoch": 488} {"train_loss": -36.2864875793457, "global_step": 59147, "epoch": 488} {"train_loss": -36.65897750854492, "global_step": 59148, "epoch": 488} {"train_loss": -36.449825286865234, "global_step": 59149, "epoch": 488} {"train_loss": -36.49721908569336, "global_step": 59150, "epoch": 488} {"train_loss": -36.87213134765625, "global_step": 59151, "epoch": 488} {"train_loss": -35.972686767578125, "global_step": 59152, "epoch": 488} {"train_loss": -36.48313522338867, "global_step": 59153, "epoch": 488} {"train_loss": -36.8691520690918, "global_step": 59154, "epoch": 488} {"train_loss": -35.74592971801758, "global_step": 59155, "epoch": 488} {"train_loss": -33.972713470458984, "global_step": 59156, "epoch": 488} {"train_loss": -36.28229904174805, "global_step": 59157, "epoch": 488} {"train_loss": -35.521240234375, "global_step": 59158, "epoch": 488} {"train_loss": -32.93319320678711, "global_step": 59159, "epoch": 488} {"train_loss": -35.7359733581543, "global_step": 59160, "epoch": 488} {"train_loss": -33.275177001953125, "global_step": 59161, "epoch": 488} {"train_loss": -34.77972412109375, "global_step": 59162, "epoch": 488} {"train_loss": -34.41609573364258, "global_step": 59163, "epoch": 488} {"train_loss": -35.68359375, "global_step": 59164, "epoch": 488} {"train_loss": -34.15837860107422, "global_step": 59165, "epoch": 488} {"train_loss": -31.632598876953125, "global_step": 59166, "epoch": 488} {"train_loss": -36.342159271240234, "global_step": 59167, "epoch": 488} {"train_loss": -35.98085157536278, "global_step": 59168, "epoch": 488, "val_loss": 2489892.0} {"train_loss": -30.73243522644043, "global_step": 59169, "epoch": 489} {"train_loss": -36.342098236083984, "global_step": 59170, "epoch": 489} {"train_loss": -32.574703216552734, "global_step": 59171, "epoch": 489} {"train_loss": -34.13838577270508, "global_step": 59172, "epoch": 489} {"train_loss": -36.078914642333984, "global_step": 59173, "epoch": 489} {"train_loss": -35.83774185180664, "global_step": 59174, "epoch": 489} {"train_loss": -35.822532653808594, "global_step": 59175, "epoch": 489} {"train_loss": -35.50357437133789, "global_step": 59176, "epoch": 489} {"train_loss": -35.137939453125, "global_step": 59177, "epoch": 489} {"train_loss": -36.0743408203125, "global_step": 59178, "epoch": 489} {"train_loss": -36.064666748046875, "global_step": 59179, "epoch": 489} {"train_loss": -35.77605056762695, "global_step": 59180, "epoch": 489} {"train_loss": -35.40024948120117, "global_step": 59181, "epoch": 489} {"train_loss": -35.79677963256836, "global_step": 59182, "epoch": 489} {"train_loss": -36.06370162963867, "global_step": 59183, "epoch": 489} {"train_loss": -35.76277542114258, "global_step": 59184, "epoch": 489} {"train_loss": -36.37580490112305, "global_step": 59185, "epoch": 489} {"train_loss": -35.11553955078125, "global_step": 59186, "epoch": 489} {"train_loss": -35.772300720214844, "global_step": 59187, "epoch": 489} {"train_loss": -36.11704635620117, "global_step": 59188, "epoch": 489} {"train_loss": -36.03096008300781, "global_step": 59189, "epoch": 489} {"train_loss": -36.13570022583008, "global_step": 59190, "epoch": 489} {"train_loss": -36.39790725708008, "global_step": 59191, "epoch": 489} {"train_loss": -36.57594299316406, "global_step": 59192, "epoch": 489} {"train_loss": -36.608238220214844, "global_step": 59193, "epoch": 489} {"train_loss": -36.672916412353516, "global_step": 59194, "epoch": 489} {"train_loss": -36.81999588012695, "global_step": 59195, "epoch": 489} {"train_loss": -36.541168212890625, "global_step": 59196, "epoch": 489} {"train_loss": -36.70551300048828, "global_step": 59197, "epoch": 489} {"train_loss": -36.891937255859375, "global_step": 59198, "epoch": 489} {"train_loss": -36.158782958984375, "global_step": 59199, "epoch": 489} {"train_loss": -36.273921966552734, "global_step": 59200, "epoch": 489} {"train_loss": -37.019775390625, "global_step": 59201, "epoch": 489} {"train_loss": -36.70139694213867, "global_step": 59202, "epoch": 489} {"train_loss": -36.3736686706543, "global_step": 59203, "epoch": 489} {"train_loss": -36.62630081176758, "global_step": 59204, "epoch": 489} {"train_loss": -36.14951705932617, "global_step": 59205, "epoch": 489} {"train_loss": -36.7745475769043, "global_step": 59206, "epoch": 489} {"train_loss": -36.974056243896484, "global_step": 59207, "epoch": 489} {"train_loss": -36.71053695678711, "global_step": 59208, "epoch": 489} {"train_loss": -36.85917282104492, "global_step": 59209, "epoch": 489} {"train_loss": -36.955013275146484, "global_step": 59210, "epoch": 489} {"train_loss": -37.01870346069336, "global_step": 59211, "epoch": 489} {"train_loss": -37.216651916503906, "global_step": 59212, "epoch": 489} {"train_loss": -36.83979034423828, "global_step": 59213, "epoch": 489} {"train_loss": -36.560970306396484, "global_step": 59214, "epoch": 489} {"train_loss": -37.02922058105469, "global_step": 59215, "epoch": 489} {"train_loss": -36.13337326049805, "global_step": 59216, "epoch": 489} {"train_loss": -36.85175323486328, "global_step": 59217, "epoch": 489} {"train_loss": -37.01862716674805, "global_step": 59218, "epoch": 489} {"train_loss": -35.44990921020508, "global_step": 59219, "epoch": 489} {"train_loss": -36.16447830200195, "global_step": 59220, "epoch": 489} {"train_loss": -36.58648681640625, "global_step": 59221, "epoch": 489} {"train_loss": -36.31043243408203, "global_step": 59222, "epoch": 489} {"train_loss": -36.06678009033203, "global_step": 59223, "epoch": 489} {"train_loss": -36.40535354614258, "global_step": 59224, "epoch": 489} {"train_loss": -36.340206146240234, "global_step": 59225, "epoch": 489} {"train_loss": -35.655616760253906, "global_step": 59226, "epoch": 489} {"train_loss": -35.72647476196289, "global_step": 59227, "epoch": 489} {"train_loss": -36.59814453125, "global_step": 59228, "epoch": 489} {"train_loss": -36.367244720458984, "global_step": 59229, "epoch": 489} {"train_loss": -35.510353088378906, "global_step": 59230, "epoch": 489} {"train_loss": -36.934993743896484, "global_step": 59231, "epoch": 489} {"train_loss": -35.955726623535156, "global_step": 59232, "epoch": 489} {"train_loss": -34.802398681640625, "global_step": 59233, "epoch": 489} {"train_loss": -35.21408462524414, "global_step": 59234, "epoch": 489} {"train_loss": -35.28725814819336, "global_step": 59235, "epoch": 489} {"train_loss": -36.636470794677734, "global_step": 59236, "epoch": 489} {"train_loss": -34.038726806640625, "global_step": 59237, "epoch": 489} {"train_loss": -34.30947494506836, "global_step": 59238, "epoch": 489} {"train_loss": -33.26331329345703, "global_step": 59239, "epoch": 489} {"train_loss": -34.52202224731445, "global_step": 59240, "epoch": 489} {"train_loss": -36.14925765991211, "global_step": 59241, "epoch": 489} {"train_loss": -34.43189239501953, "global_step": 59242, "epoch": 489} {"train_loss": -34.42118453979492, "global_step": 59243, "epoch": 489} {"train_loss": -35.2957649230957, "global_step": 59244, "epoch": 489} {"train_loss": -34.45231246948242, "global_step": 59245, "epoch": 489} {"train_loss": -35.60567855834961, "global_step": 59246, "epoch": 489} {"train_loss": -34.42778015136719, "global_step": 59247, "epoch": 489} {"train_loss": -36.35427474975586, "global_step": 59248, "epoch": 489} {"train_loss": -34.346343994140625, "global_step": 59249, "epoch": 489} {"train_loss": -36.14785385131836, "global_step": 59250, "epoch": 489} {"train_loss": -35.563053131103516, "global_step": 59251, "epoch": 489} {"train_loss": -35.60908126831055, "global_step": 59252, "epoch": 489} {"train_loss": -36.516910552978516, "global_step": 59253, "epoch": 489} {"train_loss": -34.97832107543945, "global_step": 59254, "epoch": 489} {"train_loss": -36.47103500366211, "global_step": 59255, "epoch": 489} {"train_loss": -35.970726013183594, "global_step": 59256, "epoch": 489} {"train_loss": -36.05730056762695, "global_step": 59257, "epoch": 489} {"train_loss": -36.544273376464844, "global_step": 59258, "epoch": 489} {"train_loss": -36.39058303833008, "global_step": 59259, "epoch": 489} {"train_loss": -36.20234298706055, "global_step": 59260, "epoch": 489} {"train_loss": -36.713191986083984, "global_step": 59261, "epoch": 489} {"train_loss": -36.78841018676758, "global_step": 59262, "epoch": 489} {"train_loss": -36.74851608276367, "global_step": 59263, "epoch": 489} {"train_loss": -36.623382568359375, "global_step": 59264, "epoch": 489} {"train_loss": -36.71888732910156, "global_step": 59265, "epoch": 489} {"train_loss": -36.62990951538086, "global_step": 59266, "epoch": 489} {"train_loss": -36.74270248413086, "global_step": 59267, "epoch": 489} {"train_loss": -36.66592025756836, "global_step": 59268, "epoch": 489} {"train_loss": -36.92664337158203, "global_step": 59269, "epoch": 489} {"train_loss": -37.1079216003418, "global_step": 59270, "epoch": 489} {"train_loss": -36.85792922973633, "global_step": 59271, "epoch": 489} {"train_loss": -37.17591094970703, "global_step": 59272, "epoch": 489} {"train_loss": -37.160247802734375, "global_step": 59273, "epoch": 489} {"train_loss": -37.16624450683594, "global_step": 59274, "epoch": 489} {"train_loss": -37.0345344543457, "global_step": 59275, "epoch": 489} {"train_loss": -37.490840911865234, "global_step": 59276, "epoch": 489} {"train_loss": -37.2495002746582, "global_step": 59277, "epoch": 489} {"train_loss": -36.92216110229492, "global_step": 59278, "epoch": 489} {"train_loss": -37.37213897705078, "global_step": 59279, "epoch": 489} {"train_loss": -37.37955093383789, "global_step": 59280, "epoch": 489} {"train_loss": -36.650184631347656, "global_step": 59281, "epoch": 489} {"train_loss": -34.309566497802734, "global_step": 59282, "epoch": 489} {"train_loss": -32.738189697265625, "global_step": 59283, "epoch": 489} {"train_loss": -33.15617752075195, "global_step": 59284, "epoch": 489} {"train_loss": -34.18345642089844, "global_step": 59285, "epoch": 489} {"train_loss": -35.84371566772461, "global_step": 59286, "epoch": 489} {"train_loss": -36.77669143676758, "global_step": 59287, "epoch": 489} {"train_loss": -33.496429443359375, "global_step": 59288, "epoch": 489} {"train_loss": -35.97494514717543, "global_step": 59289, "epoch": 489, "val_loss": 2461544.25} {"train_loss": -36.87978744506836, "global_step": 59290, "epoch": 490} {"train_loss": -30.50852394104004, "global_step": 59291, "epoch": 490} {"train_loss": -37.04457092285156, "global_step": 59292, "epoch": 490} {"train_loss": -31.855085372924805, "global_step": 59293, "epoch": 490} {"train_loss": -32.42681884765625, "global_step": 59294, "epoch": 490} {"train_loss": -36.40597152709961, "global_step": 59295, "epoch": 490} {"train_loss": -32.011817932128906, "global_step": 59296, "epoch": 490} {"train_loss": -35.78118896484375, "global_step": 59297, "epoch": 490} {"train_loss": -34.376617431640625, "global_step": 59298, "epoch": 490} {"train_loss": -33.245582580566406, "global_step": 59299, "epoch": 490} {"train_loss": -34.41032409667969, "global_step": 59300, "epoch": 490} {"train_loss": -32.48735427856445, "global_step": 59301, "epoch": 490} {"train_loss": -35.6683464050293, "global_step": 59302, "epoch": 490} {"train_loss": -34.22019577026367, "global_step": 59303, "epoch": 490} {"train_loss": -35.92963790893555, "global_step": 59304, "epoch": 490} {"train_loss": -33.91279220581055, "global_step": 59305, "epoch": 490} {"train_loss": -36.31887435913086, "global_step": 59306, "epoch": 490} {"train_loss": -35.3519172668457, "global_step": 59307, "epoch": 490} {"train_loss": -34.14132308959961, "global_step": 59308, "epoch": 490} {"train_loss": -36.61568069458008, "global_step": 59309, "epoch": 490} {"train_loss": -34.844970703125, "global_step": 59310, "epoch": 490} {"train_loss": -36.22981262207031, "global_step": 59311, "epoch": 490} {"train_loss": -35.74821090698242, "global_step": 59312, "epoch": 490} {"train_loss": -36.5484504699707, "global_step": 59313, "epoch": 490} {"train_loss": -36.28603744506836, "global_step": 59314, "epoch": 490} {"train_loss": -36.37009048461914, "global_step": 59315, "epoch": 490} {"train_loss": -36.1577033996582, "global_step": 59316, "epoch": 490} {"train_loss": -36.76810073852539, "global_step": 59317, "epoch": 490} {"train_loss": -36.77266311645508, "global_step": 59318, "epoch": 490} {"train_loss": -36.7637939453125, "global_step": 59319, "epoch": 490} {"train_loss": -36.61876678466797, "global_step": 59320, "epoch": 490} {"train_loss": -36.781253814697266, "global_step": 59321, "epoch": 490} {"train_loss": -36.92836380004883, "global_step": 59322, "epoch": 490} {"train_loss": -36.499263763427734, "global_step": 59323, "epoch": 490} {"train_loss": -36.339332580566406, "global_step": 59324, "epoch": 490} {"train_loss": -36.85069274902344, "global_step": 59325, "epoch": 490} {"train_loss": -36.98733901977539, "global_step": 59326, "epoch": 490} {"train_loss": -36.68666076660156, "global_step": 59327, "epoch": 490} {"train_loss": -36.241512298583984, "global_step": 59328, "epoch": 490} {"train_loss": -36.21949768066406, "global_step": 59329, "epoch": 490} {"train_loss": -37.25471878051758, "global_step": 59330, "epoch": 490} {"train_loss": -37.0555534362793, "global_step": 59331, "epoch": 490} {"train_loss": -36.100765228271484, "global_step": 59332, "epoch": 490} {"train_loss": -36.7238883972168, "global_step": 59333, "epoch": 490} {"train_loss": -37.40336990356445, "global_step": 59334, "epoch": 490} {"train_loss": -36.74086380004883, "global_step": 59335, "epoch": 490} {"train_loss": -34.94321823120117, "global_step": 59336, "epoch": 490} {"train_loss": -33.84189987182617, "global_step": 59337, "epoch": 490} {"train_loss": -36.06776809692383, "global_step": 59338, "epoch": 490} {"train_loss": -36.23786926269531, "global_step": 59339, "epoch": 490} {"train_loss": -33.544647216796875, "global_step": 59340, "epoch": 490} {"train_loss": -34.3033332824707, "global_step": 59341, "epoch": 490} {"train_loss": -36.10248565673828, "global_step": 59342, "epoch": 490} {"train_loss": -34.54157257080078, "global_step": 59343, "epoch": 490} {"train_loss": -33.52703857421875, "global_step": 59344, "epoch": 490} {"train_loss": -36.724552154541016, "global_step": 59345, "epoch": 490} {"train_loss": -34.426021575927734, "global_step": 59346, "epoch": 490} {"train_loss": -35.564449310302734, "global_step": 59347, "epoch": 490} {"train_loss": -36.70701217651367, "global_step": 59348, "epoch": 490} {"train_loss": -35.61458969116211, "global_step": 59349, "epoch": 490} {"train_loss": -37.14216232299805, "global_step": 59350, "epoch": 490} {"train_loss": -35.50520706176758, "global_step": 59351, "epoch": 490} {"train_loss": -36.65840530395508, "global_step": 59352, "epoch": 490} {"train_loss": -36.90159225463867, "global_step": 59353, "epoch": 490} {"train_loss": -36.945003509521484, "global_step": 59354, "epoch": 490} {"train_loss": -36.04037857055664, "global_step": 59355, "epoch": 490} {"train_loss": -36.77230453491211, "global_step": 59356, "epoch": 490} {"train_loss": -36.49405288696289, "global_step": 59357, "epoch": 490} {"train_loss": -36.72720718383789, "global_step": 59358, "epoch": 490} {"train_loss": -36.320613861083984, "global_step": 59359, "epoch": 490} {"train_loss": -36.33262252807617, "global_step": 59360, "epoch": 490} {"train_loss": -37.07477951049805, "global_step": 59361, "epoch": 490} {"train_loss": -36.956329345703125, "global_step": 59362, "epoch": 490} {"train_loss": -36.69220733642578, "global_step": 59363, "epoch": 490} {"train_loss": -36.14376449584961, "global_step": 59364, "epoch": 490} {"train_loss": -36.58335494995117, "global_step": 59365, "epoch": 490} {"train_loss": -35.67925262451172, "global_step": 59366, "epoch": 490} {"train_loss": -36.7572021484375, "global_step": 59367, "epoch": 490} {"train_loss": -36.9666862487793, "global_step": 59368, "epoch": 490} {"train_loss": -36.425350189208984, "global_step": 59369, "epoch": 490} {"train_loss": -35.3176383972168, "global_step": 59370, "epoch": 490} {"train_loss": -34.40966796875, "global_step": 59371, "epoch": 490} {"train_loss": -34.14918899536133, "global_step": 59372, "epoch": 490} {"train_loss": -36.055091857910156, "global_step": 59373, "epoch": 490} {"train_loss": -36.13150405883789, "global_step": 59374, "epoch": 490} {"train_loss": -35.972373962402344, "global_step": 59375, "epoch": 490} {"train_loss": -34.1571159362793, "global_step": 59376, "epoch": 490} {"train_loss": -34.71455001831055, "global_step": 59377, "epoch": 490} {"train_loss": -34.21636962890625, "global_step": 59378, "epoch": 490} {"train_loss": -34.289398193359375, "global_step": 59379, "epoch": 490} {"train_loss": -36.557613372802734, "global_step": 59380, "epoch": 490} {"train_loss": -34.7146110534668, "global_step": 59381, "epoch": 490} {"train_loss": -33.561737060546875, "global_step": 59382, "epoch": 490} {"train_loss": -34.77337646484375, "global_step": 59383, "epoch": 490} {"train_loss": -35.724464416503906, "global_step": 59384, "epoch": 490} {"train_loss": -35.549041748046875, "global_step": 59385, "epoch": 490} {"train_loss": -36.45133590698242, "global_step": 59386, "epoch": 490} {"train_loss": -36.10166549682617, "global_step": 59387, "epoch": 490} {"train_loss": -36.43012619018555, "global_step": 59388, "epoch": 490} {"train_loss": -36.18879699707031, "global_step": 59389, "epoch": 490} {"train_loss": -36.434627532958984, "global_step": 59390, "epoch": 490} {"train_loss": -35.996299743652344, "global_step": 59391, "epoch": 490} {"train_loss": -35.501708984375, "global_step": 59392, "epoch": 490} {"train_loss": -36.61643600463867, "global_step": 59393, "epoch": 490} {"train_loss": -36.069698333740234, "global_step": 59394, "epoch": 490} {"train_loss": -35.872589111328125, "global_step": 59395, "epoch": 490} {"train_loss": -36.94102478027344, "global_step": 59396, "epoch": 490} {"train_loss": -36.271522521972656, "global_step": 59397, "epoch": 490} {"train_loss": -35.895687103271484, "global_step": 59398, "epoch": 490} {"train_loss": -37.0013542175293, "global_step": 59399, "epoch": 490} {"train_loss": -36.592952728271484, "global_step": 59400, "epoch": 490} {"train_loss": -36.491397857666016, "global_step": 59401, "epoch": 490} {"train_loss": -36.861183166503906, "global_step": 59402, "epoch": 490} {"train_loss": -36.92768096923828, "global_step": 59403, "epoch": 490} {"train_loss": -37.188568115234375, "global_step": 59404, "epoch": 490} {"train_loss": -36.4666633605957, "global_step": 59405, "epoch": 490} {"train_loss": -36.99216842651367, "global_step": 59406, "epoch": 490} {"train_loss": -37.1549072265625, "global_step": 59407, "epoch": 490} {"train_loss": -37.48366165161133, "global_step": 59408, "epoch": 490} {"train_loss": -36.51642608642578, "global_step": 59409, "epoch": 490} {"train_loss": -35.84020100743317, "global_step": 59410, "epoch": 490, "val_loss": 2486157.25} {"train_loss": -37.04909133911133, "global_step": 59411, "epoch": 491} {"train_loss": -37.1944694519043, "global_step": 59412, "epoch": 491} {"train_loss": -37.23041915893555, "global_step": 59413, "epoch": 491} {"train_loss": -37.30844497680664, "global_step": 59414, "epoch": 491} {"train_loss": -37.48362350463867, "global_step": 59415, "epoch": 491} {"train_loss": -37.34742736816406, "global_step": 59416, "epoch": 491} {"train_loss": -37.31026840209961, "global_step": 59417, "epoch": 491} {"train_loss": -37.3577766418457, "global_step": 59418, "epoch": 491} {"train_loss": -37.42289352416992, "global_step": 59419, "epoch": 491} {"train_loss": -37.4514045715332, "global_step": 59420, "epoch": 491} {"train_loss": -37.34218978881836, "global_step": 59421, "epoch": 491} {"train_loss": -37.61237716674805, "global_step": 59422, "epoch": 491} {"train_loss": -37.284156799316406, "global_step": 59423, "epoch": 491} {"train_loss": -37.000221252441406, "global_step": 59424, "epoch": 491} {"train_loss": -37.128639221191406, "global_step": 59425, "epoch": 491} {"train_loss": -37.21564865112305, "global_step": 59426, "epoch": 491} {"train_loss": -37.37569808959961, "global_step": 59427, "epoch": 491} {"train_loss": -37.82138442993164, "global_step": 59428, "epoch": 491} {"train_loss": -37.22894287109375, "global_step": 59429, "epoch": 491} {"train_loss": -37.3930549621582, "global_step": 59430, "epoch": 491} {"train_loss": -37.396724700927734, "global_step": 59431, "epoch": 491} {"train_loss": -37.8663330078125, "global_step": 59432, "epoch": 491} {"train_loss": -37.717201232910156, "global_step": 59433, "epoch": 491} {"train_loss": -38.0188102722168, "global_step": 59434, "epoch": 491} {"train_loss": -37.84926986694336, "global_step": 59435, "epoch": 491} {"train_loss": -38.02289962768555, "global_step": 59436, "epoch": 491} {"train_loss": -37.637813568115234, "global_step": 59437, "epoch": 491} {"train_loss": -37.703346252441406, "global_step": 59438, "epoch": 491} {"train_loss": -37.36417007446289, "global_step": 59439, "epoch": 491} {"train_loss": -37.19373321533203, "global_step": 59440, "epoch": 491} {"train_loss": -37.10976791381836, "global_step": 59441, "epoch": 491} {"train_loss": -37.03129959106445, "global_step": 59442, "epoch": 491} {"train_loss": -37.33328628540039, "global_step": 59443, "epoch": 491} {"train_loss": -37.37226486206055, "global_step": 59444, "epoch": 491} {"train_loss": -36.303462982177734, "global_step": 59445, "epoch": 491} {"train_loss": -33.14113998413086, "global_step": 59446, "epoch": 491} {"train_loss": -34.9014778137207, "global_step": 59447, "epoch": 491} {"train_loss": -36.851192474365234, "global_step": 59448, "epoch": 491} {"train_loss": -35.552772521972656, "global_step": 59449, "epoch": 491} {"train_loss": -37.15198516845703, "global_step": 59450, "epoch": 491} {"train_loss": -36.73606491088867, "global_step": 59451, "epoch": 491} {"train_loss": -36.492523193359375, "global_step": 59452, "epoch": 491} {"train_loss": -36.1927375793457, "global_step": 59453, "epoch": 491} {"train_loss": -36.8892936706543, "global_step": 59454, "epoch": 491} {"train_loss": -35.7389030456543, "global_step": 59455, "epoch": 491} {"train_loss": -36.562007904052734, "global_step": 59456, "epoch": 491} {"train_loss": -34.065711975097656, "global_step": 59457, "epoch": 491} {"train_loss": -35.9222526550293, "global_step": 59458, "epoch": 491} {"train_loss": -35.116981506347656, "global_step": 59459, "epoch": 491} {"train_loss": -35.72860336303711, "global_step": 59460, "epoch": 491} {"train_loss": -33.96631622314453, "global_step": 59461, "epoch": 491} {"train_loss": -35.9979248046875, "global_step": 59462, "epoch": 491} {"train_loss": -35.0872917175293, "global_step": 59463, "epoch": 491} {"train_loss": -34.85247039794922, "global_step": 59464, "epoch": 491} {"train_loss": -35.962581634521484, "global_step": 59465, "epoch": 491} {"train_loss": -36.00876998901367, "global_step": 59466, "epoch": 491} {"train_loss": -36.00748062133789, "global_step": 59467, "epoch": 491} {"train_loss": -36.797061920166016, "global_step": 59468, "epoch": 491} {"train_loss": -35.105018615722656, "global_step": 59469, "epoch": 491} {"train_loss": -36.417171478271484, "global_step": 59470, "epoch": 491} {"train_loss": -35.37810516357422, "global_step": 59471, "epoch": 491} {"train_loss": -36.10165023803711, "global_step": 59472, "epoch": 491} {"train_loss": -36.613182067871094, "global_step": 59473, "epoch": 491} {"train_loss": -36.14384841918945, "global_step": 59474, "epoch": 491} {"train_loss": -36.37992477416992, "global_step": 59475, "epoch": 491} {"train_loss": -36.886104583740234, "global_step": 59476, "epoch": 491} {"train_loss": -35.765995025634766, "global_step": 59477, "epoch": 491} {"train_loss": -36.1356315612793, "global_step": 59478, "epoch": 491} {"train_loss": -36.8905029296875, "global_step": 59479, "epoch": 491} {"train_loss": -34.839942932128906, "global_step": 59480, "epoch": 491} {"train_loss": -35.28127670288086, "global_step": 59481, "epoch": 491} {"train_loss": -35.10749435424805, "global_step": 59482, "epoch": 491} {"train_loss": -34.95104217529297, "global_step": 59483, "epoch": 491} {"train_loss": -34.66526412963867, "global_step": 59484, "epoch": 491} {"train_loss": -35.495399475097656, "global_step": 59485, "epoch": 491} {"train_loss": -36.33296203613281, "global_step": 59486, "epoch": 491} {"train_loss": -35.60955047607422, "global_step": 59487, "epoch": 491} {"train_loss": -35.5439453125, "global_step": 59488, "epoch": 491} {"train_loss": -35.804134368896484, "global_step": 59489, "epoch": 491} {"train_loss": -35.635986328125, "global_step": 59490, "epoch": 491} {"train_loss": -33.734046936035156, "global_step": 59491, "epoch": 491} {"train_loss": -35.50385284423828, "global_step": 59492, "epoch": 491} {"train_loss": -36.738765716552734, "global_step": 59493, "epoch": 491} {"train_loss": -35.55044937133789, "global_step": 59494, "epoch": 491} {"train_loss": -33.5206413269043, "global_step": 59495, "epoch": 491} {"train_loss": -35.79907989501953, "global_step": 59496, "epoch": 491} {"train_loss": -36.0565299987793, "global_step": 59497, "epoch": 491} {"train_loss": -33.81982421875, "global_step": 59498, "epoch": 491} {"train_loss": -33.77863693237305, "global_step": 59499, "epoch": 491} {"train_loss": -35.51412582397461, "global_step": 59500, "epoch": 491} {"train_loss": -35.57621383666992, "global_step": 59501, "epoch": 491} {"train_loss": -34.992610931396484, "global_step": 59502, "epoch": 491} {"train_loss": -36.69009017944336, "global_step": 59503, "epoch": 491} {"train_loss": -35.298858642578125, "global_step": 59504, "epoch": 491} {"train_loss": -36.119380950927734, "global_step": 59505, "epoch": 491} {"train_loss": -36.24483871459961, "global_step": 59506, "epoch": 491} {"train_loss": -34.99839401245117, "global_step": 59507, "epoch": 491} {"train_loss": -36.388118743896484, "global_step": 59508, "epoch": 491} {"train_loss": -35.56709289550781, "global_step": 59509, "epoch": 491} {"train_loss": -33.752010345458984, "global_step": 59510, "epoch": 491} {"train_loss": -34.95524215698242, "global_step": 59511, "epoch": 491} {"train_loss": -35.47507858276367, "global_step": 59512, "epoch": 491} {"train_loss": -35.338043212890625, "global_step": 59513, "epoch": 491} {"train_loss": -35.756038665771484, "global_step": 59514, "epoch": 491} {"train_loss": -36.10759353637695, "global_step": 59515, "epoch": 491} {"train_loss": -35.1635856628418, "global_step": 59516, "epoch": 491} {"train_loss": -36.684295654296875, "global_step": 59517, "epoch": 491} {"train_loss": -36.57086944580078, "global_step": 59518, "epoch": 491} {"train_loss": -35.5604248046875, "global_step": 59519, "epoch": 491} {"train_loss": -36.400421142578125, "global_step": 59520, "epoch": 491} {"train_loss": -37.314537048339844, "global_step": 59521, "epoch": 491} {"train_loss": -35.991004943847656, "global_step": 59522, "epoch": 491} {"train_loss": -37.06849670410156, "global_step": 59523, "epoch": 491} {"train_loss": -36.782005310058594, "global_step": 59524, "epoch": 491} {"train_loss": -36.735862731933594, "global_step": 59525, "epoch": 491} {"train_loss": -36.87514877319336, "global_step": 59526, "epoch": 491} {"train_loss": -36.724647521972656, "global_step": 59527, "epoch": 491} {"train_loss": -37.09944534301758, "global_step": 59528, "epoch": 491} {"train_loss": -36.51418685913086, "global_step": 59529, "epoch": 491} {"train_loss": -36.93307113647461, "global_step": 59530, "epoch": 491} {"train_loss": -36.24964293172537, "global_step": 59531, "epoch": 491, "val_loss": 2529864.75} {"train_loss": -36.91184616088867, "global_step": 59532, "epoch": 492} {"train_loss": -37.087825775146484, "global_step": 59533, "epoch": 492} {"train_loss": -37.31963348388672, "global_step": 59534, "epoch": 492} {"train_loss": -37.32319259643555, "global_step": 59535, "epoch": 492} {"train_loss": -37.69517135620117, "global_step": 59536, "epoch": 492} {"train_loss": -37.57205581665039, "global_step": 59537, "epoch": 492} {"train_loss": -37.26338577270508, "global_step": 59538, "epoch": 492} {"train_loss": -37.811729431152344, "global_step": 59539, "epoch": 492} {"train_loss": -37.55668258666992, "global_step": 59540, "epoch": 492} {"train_loss": -37.6079216003418, "global_step": 59541, "epoch": 492} {"train_loss": -37.577083587646484, "global_step": 59542, "epoch": 492} {"train_loss": -37.05047607421875, "global_step": 59543, "epoch": 492} {"train_loss": -36.640281677246094, "global_step": 59544, "epoch": 492} {"train_loss": -34.055423736572266, "global_step": 59545, "epoch": 492} {"train_loss": -29.233259201049805, "global_step": 59546, "epoch": 492} {"train_loss": -35.414730072021484, "global_step": 59547, "epoch": 492} {"train_loss": -36.99128341674805, "global_step": 59548, "epoch": 492} {"train_loss": -35.517024993896484, "global_step": 59549, "epoch": 492} {"train_loss": -34.921905517578125, "global_step": 59550, "epoch": 492} {"train_loss": -37.21700668334961, "global_step": 59551, "epoch": 492} {"train_loss": -36.3217887878418, "global_step": 59552, "epoch": 492} {"train_loss": -36.20058059692383, "global_step": 59553, "epoch": 492} {"train_loss": -37.138729095458984, "global_step": 59554, "epoch": 492} {"train_loss": -37.14658737182617, "global_step": 59555, "epoch": 492} {"train_loss": -36.424903869628906, "global_step": 59556, "epoch": 492} {"train_loss": -35.7459831237793, "global_step": 59557, "epoch": 492} {"train_loss": -37.288963317871094, "global_step": 59558, "epoch": 492} {"train_loss": -35.954254150390625, "global_step": 59559, "epoch": 492} {"train_loss": -34.40862274169922, "global_step": 59560, "epoch": 492} {"train_loss": -34.637718200683594, "global_step": 59561, "epoch": 492} {"train_loss": -34.6912727355957, "global_step": 59562, "epoch": 492} {"train_loss": -34.957088470458984, "global_step": 59563, "epoch": 492} {"train_loss": -34.495643615722656, "global_step": 59564, "epoch": 492} {"train_loss": -34.8750114440918, "global_step": 59565, "epoch": 492} {"train_loss": -34.961849212646484, "global_step": 59566, "epoch": 492} {"train_loss": -36.03725814819336, "global_step": 59567, "epoch": 492} {"train_loss": -35.996368408203125, "global_step": 59568, "epoch": 492} {"train_loss": -34.95603561401367, "global_step": 59569, "epoch": 492} {"train_loss": -35.57048416137695, "global_step": 59570, "epoch": 492} {"train_loss": -37.2289924621582, "global_step": 59571, "epoch": 492} {"train_loss": -36.2148323059082, "global_step": 59572, "epoch": 492} {"train_loss": -35.731746673583984, "global_step": 59573, "epoch": 492} {"train_loss": -36.728614807128906, "global_step": 59574, "epoch": 492} {"train_loss": -36.6716423034668, "global_step": 59575, "epoch": 492} {"train_loss": -36.63137435913086, "global_step": 59576, "epoch": 492} {"train_loss": -36.97810745239258, "global_step": 59577, "epoch": 492} {"train_loss": -36.666168212890625, "global_step": 59578, "epoch": 492} {"train_loss": -36.7386589050293, "global_step": 59579, "epoch": 492} {"train_loss": -36.82786178588867, "global_step": 59580, "epoch": 492} {"train_loss": -37.18973922729492, "global_step": 59581, "epoch": 492} {"train_loss": -36.77252960205078, "global_step": 59582, "epoch": 492} {"train_loss": -37.02854537963867, "global_step": 59583, "epoch": 492} {"train_loss": -36.73331832885742, "global_step": 59584, "epoch": 492} {"train_loss": -37.126461029052734, "global_step": 59585, "epoch": 492} {"train_loss": -37.261436462402344, "global_step": 59586, "epoch": 492} {"train_loss": -37.23768997192383, "global_step": 59587, "epoch": 492} {"train_loss": -37.18474197387695, "global_step": 59588, "epoch": 492} {"train_loss": -36.42918014526367, "global_step": 59589, "epoch": 492} {"train_loss": -37.45026397705078, "global_step": 59590, "epoch": 492} {"train_loss": -36.84577941894531, "global_step": 59591, "epoch": 492} {"train_loss": -36.82339096069336, "global_step": 59592, "epoch": 492} {"train_loss": -37.42604446411133, "global_step": 59593, "epoch": 492} {"train_loss": -36.84321212768555, "global_step": 59594, "epoch": 492} {"train_loss": -37.142791748046875, "global_step": 59595, "epoch": 492} {"train_loss": -37.49568557739258, "global_step": 59596, "epoch": 492} {"train_loss": -37.52067565917969, "global_step": 59597, "epoch": 492} {"train_loss": -37.04482650756836, "global_step": 59598, "epoch": 492} {"train_loss": -37.48232650756836, "global_step": 59599, "epoch": 492} {"train_loss": -37.4100227355957, "global_step": 59600, "epoch": 492} {"train_loss": -37.186893463134766, "global_step": 59601, "epoch": 492} {"train_loss": -37.37422561645508, "global_step": 59602, "epoch": 492} {"train_loss": -37.75969314575195, "global_step": 59603, "epoch": 492} {"train_loss": -37.44643020629883, "global_step": 59604, "epoch": 492} {"train_loss": -37.06327438354492, "global_step": 59605, "epoch": 492} {"train_loss": -37.441219329833984, "global_step": 59606, "epoch": 492} {"train_loss": -37.53090286254883, "global_step": 59607, "epoch": 492} {"train_loss": -37.294281005859375, "global_step": 59608, "epoch": 492} {"train_loss": -36.1096305847168, "global_step": 59609, "epoch": 492} {"train_loss": -34.895511627197266, "global_step": 59610, "epoch": 492} {"train_loss": -31.56183433532715, "global_step": 59611, "epoch": 492} {"train_loss": -28.0125675201416, "global_step": 59612, "epoch": 492} {"train_loss": -33.369144439697266, "global_step": 59613, "epoch": 492} {"train_loss": -33.18833541870117, "global_step": 59614, "epoch": 492} {"train_loss": -34.74345779418945, "global_step": 59615, "epoch": 492} {"train_loss": -35.05593490600586, "global_step": 59616, "epoch": 492} {"train_loss": -31.736560821533203, "global_step": 59617, "epoch": 492} {"train_loss": -34.368499755859375, "global_step": 59618, "epoch": 492} {"train_loss": -32.04262161254883, "global_step": 59619, "epoch": 492} {"train_loss": -31.791584014892578, "global_step": 59620, "epoch": 492} {"train_loss": -31.973907470703125, "global_step": 59621, "epoch": 492} {"train_loss": -18.84639549255371, "global_step": 59622, "epoch": 492} {"train_loss": -30.545246124267578, "global_step": 59623, "epoch": 492} {"train_loss": -31.187854766845703, "global_step": 59624, "epoch": 492} {"train_loss": -26.4555606842041, "global_step": 59625, "epoch": 492} {"train_loss": -30.836462020874023, "global_step": 59626, "epoch": 492} {"train_loss": -31.79094886779785, "global_step": 59627, "epoch": 492} {"train_loss": -26.12788963317871, "global_step": 59628, "epoch": 492} {"train_loss": -29.314512252807617, "global_step": 59629, "epoch": 492} {"train_loss": -30.047697067260742, "global_step": 59630, "epoch": 492} {"train_loss": -29.20696449279785, "global_step": 59631, "epoch": 492} {"train_loss": -32.05912399291992, "global_step": 59632, "epoch": 492} {"train_loss": -32.75454330444336, "global_step": 59633, "epoch": 492} {"train_loss": -31.835803985595703, "global_step": 59634, "epoch": 492} {"train_loss": -31.82669448852539, "global_step": 59635, "epoch": 492} {"train_loss": -29.952672958374023, "global_step": 59636, "epoch": 492} {"train_loss": -31.165510177612305, "global_step": 59637, "epoch": 492} {"train_loss": -30.66265296936035, "global_step": 59638, "epoch": 492} {"train_loss": -31.718505859375, "global_step": 59639, "epoch": 492} {"train_loss": -32.4654655456543, "global_step": 59640, "epoch": 492} {"train_loss": -33.09610366821289, "global_step": 59641, "epoch": 492} {"train_loss": -32.7952995300293, "global_step": 59642, "epoch": 492} {"train_loss": -33.53480911254883, "global_step": 59643, "epoch": 492} {"train_loss": -33.32744216918945, "global_step": 59644, "epoch": 492} {"train_loss": -33.45724105834961, "global_step": 59645, "epoch": 492} {"train_loss": -33.62248611450195, "global_step": 59646, "epoch": 492} {"train_loss": -33.649940490722656, "global_step": 59647, "epoch": 492} {"train_loss": -33.65129852294922, "global_step": 59648, "epoch": 492} {"train_loss": -33.83765411376953, "global_step": 59649, "epoch": 492} {"train_loss": -34.210914611816406, "global_step": 59650, "epoch": 492} {"train_loss": -34.40681457519531, "global_step": 59651, "epoch": 492} {"train_loss": -34.846260922014224, "global_step": 59652, "epoch": 492, "val_loss": 2374593.75} {"train_loss": -34.36423873901367, "global_step": 59653, "epoch": 493} {"train_loss": -34.1904411315918, "global_step": 59654, "epoch": 493} {"train_loss": -34.5964241027832, "global_step": 59655, "epoch": 493} {"train_loss": -34.96551513671875, "global_step": 59656, "epoch": 493} {"train_loss": -34.72779083251953, "global_step": 59657, "epoch": 493} {"train_loss": -34.31901168823242, "global_step": 59658, "epoch": 493} {"train_loss": -34.555328369140625, "global_step": 59659, "epoch": 493} {"train_loss": -34.94865417480469, "global_step": 59660, "epoch": 493} {"train_loss": -35.07374572753906, "global_step": 59661, "epoch": 493} {"train_loss": -35.21270751953125, "global_step": 59662, "epoch": 493} {"train_loss": -34.803314208984375, "global_step": 59663, "epoch": 493} {"train_loss": -35.46856689453125, "global_step": 59664, "epoch": 493} {"train_loss": -35.018436431884766, "global_step": 59665, "epoch": 493} {"train_loss": -35.62462615966797, "global_step": 59666, "epoch": 493} {"train_loss": -35.2120246887207, "global_step": 59667, "epoch": 493} {"train_loss": -35.49882888793945, "global_step": 59668, "epoch": 493} {"train_loss": -35.445125579833984, "global_step": 59669, "epoch": 493} {"train_loss": -35.440059661865234, "global_step": 59670, "epoch": 493} {"train_loss": -35.72937774658203, "global_step": 59671, "epoch": 493} {"train_loss": -35.61556625366211, "global_step": 59672, "epoch": 493} {"train_loss": -35.4869270324707, "global_step": 59673, "epoch": 493} {"train_loss": -35.65046310424805, "global_step": 59674, "epoch": 493} {"train_loss": -35.35210037231445, "global_step": 59675, "epoch": 493} {"train_loss": -36.03723907470703, "global_step": 59676, "epoch": 493} {"train_loss": -35.84205627441406, "global_step": 59677, "epoch": 493} {"train_loss": -35.4348030090332, "global_step": 59678, "epoch": 493} {"train_loss": -36.16576385498047, "global_step": 59679, "epoch": 493} {"train_loss": -35.59128952026367, "global_step": 59680, "epoch": 493} {"train_loss": -36.06239318847656, "global_step": 59681, "epoch": 493} {"train_loss": -36.51458740234375, "global_step": 59682, "epoch": 493} {"train_loss": -36.1904411315918, "global_step": 59683, "epoch": 493} {"train_loss": -36.045162200927734, "global_step": 59684, "epoch": 493} {"train_loss": -36.68635940551758, "global_step": 59685, "epoch": 493} {"train_loss": -36.4399528503418, "global_step": 59686, "epoch": 493} {"train_loss": -36.64227294921875, "global_step": 59687, "epoch": 493} {"train_loss": -36.75189208984375, "global_step": 59688, "epoch": 493} {"train_loss": -36.87274932861328, "global_step": 59689, "epoch": 493} {"train_loss": -36.77080154418945, "global_step": 59690, "epoch": 493} {"train_loss": -36.79256057739258, "global_step": 59691, "epoch": 493} {"train_loss": -36.667152404785156, "global_step": 59692, "epoch": 493} {"train_loss": -36.61150360107422, "global_step": 59693, "epoch": 493} {"train_loss": -36.60547637939453, "global_step": 59694, "epoch": 493} {"train_loss": -36.5658073425293, "global_step": 59695, "epoch": 493} {"train_loss": -36.74562454223633, "global_step": 59696, "epoch": 493} {"train_loss": -36.69387435913086, "global_step": 59697, "epoch": 493} {"train_loss": -36.884342193603516, "global_step": 59698, "epoch": 493} {"train_loss": -36.72806167602539, "global_step": 59699, "epoch": 493} {"train_loss": -36.70888900756836, "global_step": 59700, "epoch": 493} {"train_loss": -36.879573822021484, "global_step": 59701, "epoch": 493} {"train_loss": -37.05921936035156, "global_step": 59702, "epoch": 493} {"train_loss": -37.14680862426758, "global_step": 59703, "epoch": 493} {"train_loss": -36.57468795776367, "global_step": 59704, "epoch": 493} {"train_loss": -36.91657257080078, "global_step": 59705, "epoch": 493} {"train_loss": -36.79977035522461, "global_step": 59706, "epoch": 493} {"train_loss": -36.68891143798828, "global_step": 59707, "epoch": 493} {"train_loss": -37.51729202270508, "global_step": 59708, "epoch": 493} {"train_loss": -36.58559036254883, "global_step": 59709, "epoch": 493} {"train_loss": -36.75471496582031, "global_step": 59710, "epoch": 493} {"train_loss": -36.08074188232422, "global_step": 59711, "epoch": 493} {"train_loss": -35.600379943847656, "global_step": 59712, "epoch": 493} {"train_loss": -36.325904846191406, "global_step": 59713, "epoch": 493} {"train_loss": -36.83411407470703, "global_step": 59714, "epoch": 493} {"train_loss": -36.661495208740234, "global_step": 59715, "epoch": 493} {"train_loss": -36.57234191894531, "global_step": 59716, "epoch": 493} {"train_loss": -37.1286735534668, "global_step": 59717, "epoch": 493} {"train_loss": -36.65055465698242, "global_step": 59718, "epoch": 493} {"train_loss": -35.221954345703125, "global_step": 59719, "epoch": 493} {"train_loss": -34.66144943237305, "global_step": 59720, "epoch": 493} {"train_loss": -33.945980072021484, "global_step": 59721, "epoch": 493} {"train_loss": -34.261070251464844, "global_step": 59722, "epoch": 493} {"train_loss": -35.724361419677734, "global_step": 59723, "epoch": 493} {"train_loss": -36.58451461791992, "global_step": 59724, "epoch": 493} {"train_loss": -35.28597640991211, "global_step": 59725, "epoch": 493} {"train_loss": -32.86591339111328, "global_step": 59726, "epoch": 493} {"train_loss": -33.4383659362793, "global_step": 59727, "epoch": 493} {"train_loss": -36.779022216796875, "global_step": 59728, "epoch": 493} {"train_loss": -37.17689514160156, "global_step": 59729, "epoch": 493} {"train_loss": -36.219478607177734, "global_step": 59730, "epoch": 493} {"train_loss": -36.38592529296875, "global_step": 59731, "epoch": 493} {"train_loss": -36.6808967590332, "global_step": 59732, "epoch": 493} {"train_loss": -35.64556884765625, "global_step": 59733, "epoch": 493} {"train_loss": -36.752655029296875, "global_step": 59734, "epoch": 493} {"train_loss": -36.550350189208984, "global_step": 59735, "epoch": 493} {"train_loss": -36.00962448120117, "global_step": 59736, "epoch": 493} {"train_loss": -36.89316940307617, "global_step": 59737, "epoch": 493} {"train_loss": -36.47041702270508, "global_step": 59738, "epoch": 493} {"train_loss": -36.09431457519531, "global_step": 59739, "epoch": 493} {"train_loss": -36.379974365234375, "global_step": 59740, "epoch": 493} {"train_loss": -36.1853141784668, "global_step": 59741, "epoch": 493} {"train_loss": -36.93418502807617, "global_step": 59742, "epoch": 493} {"train_loss": -36.02788162231445, "global_step": 59743, "epoch": 493} {"train_loss": -36.30451583862305, "global_step": 59744, "epoch": 493} {"train_loss": -35.361793518066406, "global_step": 59745, "epoch": 493} {"train_loss": -35.77528762817383, "global_step": 59746, "epoch": 493} {"train_loss": -36.19106674194336, "global_step": 59747, "epoch": 493} {"train_loss": -36.77828598022461, "global_step": 59748, "epoch": 493} {"train_loss": -35.69849395751953, "global_step": 59749, "epoch": 493} {"train_loss": -35.06393051147461, "global_step": 59750, "epoch": 493} {"train_loss": -34.53470230102539, "global_step": 59751, "epoch": 493} {"train_loss": -36.64249038696289, "global_step": 59752, "epoch": 493} {"train_loss": -35.88328170776367, "global_step": 59753, "epoch": 493} {"train_loss": -34.817970275878906, "global_step": 59754, "epoch": 493} {"train_loss": -35.00272750854492, "global_step": 59755, "epoch": 493} {"train_loss": -35.12431335449219, "global_step": 59756, "epoch": 493} {"train_loss": -35.47462844848633, "global_step": 59757, "epoch": 493} {"train_loss": -34.3430290222168, "global_step": 59758, "epoch": 493} {"train_loss": -35.504940032958984, "global_step": 59759, "epoch": 493} {"train_loss": -35.894683837890625, "global_step": 59760, "epoch": 493} {"train_loss": -35.533668518066406, "global_step": 59761, "epoch": 493} {"train_loss": -34.05820846557617, "global_step": 59762, "epoch": 493} {"train_loss": -34.43195724487305, "global_step": 59763, "epoch": 493} {"train_loss": -36.319576263427734, "global_step": 59764, "epoch": 493} {"train_loss": -35.93696975708008, "global_step": 59765, "epoch": 493} {"train_loss": -36.351356506347656, "global_step": 59766, "epoch": 493} {"train_loss": -36.20698165893555, "global_step": 59767, "epoch": 493} {"train_loss": -34.306884765625, "global_step": 59768, "epoch": 493} {"train_loss": -34.79656219482422, "global_step": 59769, "epoch": 493} {"train_loss": -35.46875, "global_step": 59770, "epoch": 493} {"train_loss": -34.17505645751953, "global_step": 59771, "epoch": 493} {"train_loss": -34.52482986450195, "global_step": 59772, "epoch": 493} {"train_loss": -35.84417875936209, "global_step": 59773, "epoch": 493, "val_loss": 3103095.75} {"train_loss": -34.69489669799805, "global_step": 59774, "epoch": 494} {"train_loss": -32.026153564453125, "global_step": 59775, "epoch": 494} {"train_loss": -33.88076400756836, "global_step": 59776, "epoch": 494} {"train_loss": -36.078582763671875, "global_step": 59777, "epoch": 494} {"train_loss": -34.44765853881836, "global_step": 59778, "epoch": 494} {"train_loss": -32.359580993652344, "global_step": 59779, "epoch": 494} {"train_loss": -30.5806941986084, "global_step": 59780, "epoch": 494} {"train_loss": -35.274375915527344, "global_step": 59781, "epoch": 494} {"train_loss": -34.700347900390625, "global_step": 59782, "epoch": 494} {"train_loss": -35.049015045166016, "global_step": 59783, "epoch": 494} {"train_loss": -32.89362335205078, "global_step": 59784, "epoch": 494} {"train_loss": -35.36491775512695, "global_step": 59785, "epoch": 494} {"train_loss": -34.606292724609375, "global_step": 59786, "epoch": 494} {"train_loss": -33.888694763183594, "global_step": 59787, "epoch": 494} {"train_loss": -33.595516204833984, "global_step": 59788, "epoch": 494} {"train_loss": -34.73247146606445, "global_step": 59789, "epoch": 494} {"train_loss": -33.66300582885742, "global_step": 59790, "epoch": 494} {"train_loss": -33.97636032104492, "global_step": 59791, "epoch": 494} {"train_loss": -32.95956039428711, "global_step": 59792, "epoch": 494} {"train_loss": -35.89522171020508, "global_step": 59793, "epoch": 494} {"train_loss": -34.453975677490234, "global_step": 59794, "epoch": 494} {"train_loss": -34.52254867553711, "global_step": 59795, "epoch": 494} {"train_loss": -34.07021713256836, "global_step": 59796, "epoch": 494} {"train_loss": -35.436424255371094, "global_step": 59797, "epoch": 494} {"train_loss": -35.2087516784668, "global_step": 59798, "epoch": 494} {"train_loss": -35.292335510253906, "global_step": 59799, "epoch": 494} {"train_loss": -35.49586868286133, "global_step": 59800, "epoch": 494} {"train_loss": -35.55017852783203, "global_step": 59801, "epoch": 494} {"train_loss": -35.40795135498047, "global_step": 59802, "epoch": 494} {"train_loss": -35.202903747558594, "global_step": 59803, "epoch": 494} {"train_loss": -35.58193588256836, "global_step": 59804, "epoch": 494} {"train_loss": -34.666961669921875, "global_step": 59805, "epoch": 494} {"train_loss": -35.18290328979492, "global_step": 59806, "epoch": 494} {"train_loss": -35.00419235229492, "global_step": 59807, "epoch": 494} {"train_loss": -35.91535568237305, "global_step": 59808, "epoch": 494} {"train_loss": -35.37602615356445, "global_step": 59809, "epoch": 494} {"train_loss": -35.807838439941406, "global_step": 59810, "epoch": 494} {"train_loss": -36.1715087890625, "global_step": 59811, "epoch": 494} {"train_loss": -35.35171127319336, "global_step": 59812, "epoch": 494} {"train_loss": -35.49161911010742, "global_step": 59813, "epoch": 494} {"train_loss": -35.83150863647461, "global_step": 59814, "epoch": 494} {"train_loss": -35.96510314941406, "global_step": 59815, "epoch": 494} {"train_loss": -35.325599670410156, "global_step": 59816, "epoch": 494} {"train_loss": -35.78896713256836, "global_step": 59817, "epoch": 494} {"train_loss": -36.05394744873047, "global_step": 59818, "epoch": 494} {"train_loss": -36.37962341308594, "global_step": 59819, "epoch": 494} {"train_loss": -36.30337142944336, "global_step": 59820, "epoch": 494} {"train_loss": -36.09303283691406, "global_step": 59821, "epoch": 494} {"train_loss": -36.451229095458984, "global_step": 59822, "epoch": 494} {"train_loss": -36.50180435180664, "global_step": 59823, "epoch": 494} {"train_loss": -36.09876251220703, "global_step": 59824, "epoch": 494} {"train_loss": -36.44038009643555, "global_step": 59825, "epoch": 494} {"train_loss": -36.457759857177734, "global_step": 59826, "epoch": 494} {"train_loss": -36.540767669677734, "global_step": 59827, "epoch": 494} {"train_loss": -36.439849853515625, "global_step": 59828, "epoch": 494} {"train_loss": -36.18043899536133, "global_step": 59829, "epoch": 494} {"train_loss": -36.25925827026367, "global_step": 59830, "epoch": 494} {"train_loss": -36.32267379760742, "global_step": 59831, "epoch": 494} {"train_loss": -36.25919723510742, "global_step": 59832, "epoch": 494} {"train_loss": -36.65324020385742, "global_step": 59833, "epoch": 494} {"train_loss": -36.71230697631836, "global_step": 59834, "epoch": 494} {"train_loss": -36.72534942626953, "global_step": 59835, "epoch": 494} {"train_loss": -36.37432861328125, "global_step": 59836, "epoch": 494} {"train_loss": -35.79946517944336, "global_step": 59837, "epoch": 494} {"train_loss": -35.29825973510742, "global_step": 59838, "epoch": 494} {"train_loss": -35.28428268432617, "global_step": 59839, "epoch": 494} {"train_loss": -35.9893913269043, "global_step": 59840, "epoch": 494} {"train_loss": -36.3817138671875, "global_step": 59841, "epoch": 494} {"train_loss": -35.458412170410156, "global_step": 59842, "epoch": 494} {"train_loss": -32.93170928955078, "global_step": 59843, "epoch": 494} {"train_loss": -30.694665908813477, "global_step": 59844, "epoch": 494} {"train_loss": -36.03105926513672, "global_step": 59845, "epoch": 494} {"train_loss": -35.30876922607422, "global_step": 59846, "epoch": 494} {"train_loss": -31.72315788269043, "global_step": 59847, "epoch": 494} {"train_loss": -33.96443557739258, "global_step": 59848, "epoch": 494} {"train_loss": -36.210811614990234, "global_step": 59849, "epoch": 494} {"train_loss": -32.80139923095703, "global_step": 59850, "epoch": 494} {"train_loss": -35.09165573120117, "global_step": 59851, "epoch": 494} {"train_loss": -35.59687042236328, "global_step": 59852, "epoch": 494} {"train_loss": -34.09859085083008, "global_step": 59853, "epoch": 494} {"train_loss": -35.5073356628418, "global_step": 59854, "epoch": 494} {"train_loss": -34.20038986206055, "global_step": 59855, "epoch": 494} {"train_loss": -34.5665168762207, "global_step": 59856, "epoch": 494} {"train_loss": -35.07478332519531, "global_step": 59857, "epoch": 494} {"train_loss": -35.84480285644531, "global_step": 59858, "epoch": 494} {"train_loss": -34.26264572143555, "global_step": 59859, "epoch": 494} {"train_loss": -35.947147369384766, "global_step": 59860, "epoch": 494} {"train_loss": -35.0701789855957, "global_step": 59861, "epoch": 494} {"train_loss": -35.64223861694336, "global_step": 59862, "epoch": 494} {"train_loss": -35.826751708984375, "global_step": 59863, "epoch": 494} {"train_loss": -35.7047233581543, "global_step": 59864, "epoch": 494} {"train_loss": -36.201416015625, "global_step": 59865, "epoch": 494} {"train_loss": -36.198177337646484, "global_step": 59866, "epoch": 494} {"train_loss": -36.20594024658203, "global_step": 59867, "epoch": 494} {"train_loss": -36.34467697143555, "global_step": 59868, "epoch": 494} {"train_loss": -35.910213470458984, "global_step": 59869, "epoch": 494} {"train_loss": -34.479618072509766, "global_step": 59870, "epoch": 494} {"train_loss": -33.82854080200195, "global_step": 59871, "epoch": 494} {"train_loss": -30.526681900024414, "global_step": 59872, "epoch": 494} {"train_loss": -32.54055404663086, "global_step": 59873, "epoch": 494} {"train_loss": -34.07147216796875, "global_step": 59874, "epoch": 494} {"train_loss": -36.069129943847656, "global_step": 59875, "epoch": 494} {"train_loss": -35.99164962768555, "global_step": 59876, "epoch": 494} {"train_loss": -35.087947845458984, "global_step": 59877, "epoch": 494} {"train_loss": -35.96665573120117, "global_step": 59878, "epoch": 494} {"train_loss": -36.22346878051758, "global_step": 59879, "epoch": 494} {"train_loss": -35.75537872314453, "global_step": 59880, "epoch": 494} {"train_loss": -35.31598663330078, "global_step": 59881, "epoch": 494} {"train_loss": -36.88138961791992, "global_step": 59882, "epoch": 494} {"train_loss": -36.106056213378906, "global_step": 59883, "epoch": 494} {"train_loss": -36.106197357177734, "global_step": 59884, "epoch": 494} {"train_loss": -36.75996017456055, "global_step": 59885, "epoch": 494} {"train_loss": -36.23462677001953, "global_step": 59886, "epoch": 494} {"train_loss": -36.03989791870117, "global_step": 59887, "epoch": 494} {"train_loss": -36.21395492553711, "global_step": 59888, "epoch": 494} {"train_loss": -36.34852981567383, "global_step": 59889, "epoch": 494} {"train_loss": -36.28723907470703, "global_step": 59890, "epoch": 494} {"train_loss": -37.07072067260742, "global_step": 59891, "epoch": 494} {"train_loss": -36.697235107421875, "global_step": 59892, "epoch": 494} {"train_loss": -36.26893997192383, "global_step": 59893, "epoch": 494} {"train_loss": -35.26725214177912, "global_step": 59894, "epoch": 494, "val_loss": 2576744.75} {"train_loss": -37.00831985473633, "global_step": 59895, "epoch": 495} {"train_loss": -36.81775665283203, "global_step": 59896, "epoch": 495} {"train_loss": -36.90064239501953, "global_step": 59897, "epoch": 495} {"train_loss": -37.0402946472168, "global_step": 59898, "epoch": 495} {"train_loss": -37.086421966552734, "global_step": 59899, "epoch": 495} {"train_loss": -36.670928955078125, "global_step": 59900, "epoch": 495} {"train_loss": -36.93160629272461, "global_step": 59901, "epoch": 495} {"train_loss": -35.81421661376953, "global_step": 59902, "epoch": 495} {"train_loss": -37.013771057128906, "global_step": 59903, "epoch": 495} {"train_loss": -36.29841995239258, "global_step": 59904, "epoch": 495} {"train_loss": -35.467933654785156, "global_step": 59905, "epoch": 495} {"train_loss": -35.727657318115234, "global_step": 59906, "epoch": 495} {"train_loss": -36.271209716796875, "global_step": 59907, "epoch": 495} {"train_loss": -36.12721633911133, "global_step": 59908, "epoch": 495} {"train_loss": -36.169960021972656, "global_step": 59909, "epoch": 495} {"train_loss": -35.8575553894043, "global_step": 59910, "epoch": 495} {"train_loss": -36.49457931518555, "global_step": 59911, "epoch": 495} {"train_loss": -35.895992279052734, "global_step": 59912, "epoch": 495} {"train_loss": -35.33765411376953, "global_step": 59913, "epoch": 495} {"train_loss": -35.50002670288086, "global_step": 59914, "epoch": 495} {"train_loss": -35.51791763305664, "global_step": 59915, "epoch": 495} {"train_loss": -35.34700393676758, "global_step": 59916, "epoch": 495} {"train_loss": -33.350746154785156, "global_step": 59917, "epoch": 495} {"train_loss": -36.176971435546875, "global_step": 59918, "epoch": 495} {"train_loss": -34.9458122253418, "global_step": 59919, "epoch": 495} {"train_loss": -35.31390380859375, "global_step": 59920, "epoch": 495} {"train_loss": -35.77058029174805, "global_step": 59921, "epoch": 495} {"train_loss": -34.54384231567383, "global_step": 59922, "epoch": 495} {"train_loss": -36.0026741027832, "global_step": 59923, "epoch": 495} {"train_loss": -34.86703109741211, "global_step": 59924, "epoch": 495} {"train_loss": -35.21784210205078, "global_step": 59925, "epoch": 495} {"train_loss": -35.714332580566406, "global_step": 59926, "epoch": 495} {"train_loss": -34.065853118896484, "global_step": 59927, "epoch": 495} {"train_loss": -36.3392448425293, "global_step": 59928, "epoch": 495} {"train_loss": -34.866783142089844, "global_step": 59929, "epoch": 495} {"train_loss": -35.82444763183594, "global_step": 59930, "epoch": 495} {"train_loss": -34.7157096862793, "global_step": 59931, "epoch": 495} {"train_loss": -36.5449333190918, "global_step": 59932, "epoch": 495} {"train_loss": -35.425148010253906, "global_step": 59933, "epoch": 495} {"train_loss": -36.382381439208984, "global_step": 59934, "epoch": 495} {"train_loss": -36.08271408081055, "global_step": 59935, "epoch": 495} {"train_loss": -36.26591873168945, "global_step": 59936, "epoch": 495} {"train_loss": -36.2330322265625, "global_step": 59937, "epoch": 495} {"train_loss": -35.41527557373047, "global_step": 59938, "epoch": 495} {"train_loss": -36.8838996887207, "global_step": 59939, "epoch": 495} {"train_loss": -36.23396301269531, "global_step": 59940, "epoch": 495} {"train_loss": -36.970611572265625, "global_step": 59941, "epoch": 495} {"train_loss": -36.56715774536133, "global_step": 59942, "epoch": 495} {"train_loss": -36.630897521972656, "global_step": 59943, "epoch": 495} {"train_loss": -37.02213668823242, "global_step": 59944, "epoch": 495} {"train_loss": -37.143917083740234, "global_step": 59945, "epoch": 495} {"train_loss": -36.75816345214844, "global_step": 59946, "epoch": 495} {"train_loss": -36.89155960083008, "global_step": 59947, "epoch": 495} {"train_loss": -36.563594818115234, "global_step": 59948, "epoch": 495} {"train_loss": -36.88030242919922, "global_step": 59949, "epoch": 495} {"train_loss": -36.88654708862305, "global_step": 59950, "epoch": 495} {"train_loss": -36.81301498413086, "global_step": 59951, "epoch": 495} {"train_loss": -36.926143646240234, "global_step": 59952, "epoch": 495} {"train_loss": -36.50344467163086, "global_step": 59953, "epoch": 495} {"train_loss": -36.630409240722656, "global_step": 59954, "epoch": 495} {"train_loss": -37.007015228271484, "global_step": 59955, "epoch": 495} {"train_loss": -37.661643981933594, "global_step": 59956, "epoch": 495} {"train_loss": -37.118228912353516, "global_step": 59957, "epoch": 495} {"train_loss": -36.67018508911133, "global_step": 59958, "epoch": 495} {"train_loss": -36.09531784057617, "global_step": 59959, "epoch": 495} {"train_loss": -35.17338943481445, "global_step": 59960, "epoch": 495} {"train_loss": -32.999237060546875, "global_step": 59961, "epoch": 495} {"train_loss": -28.799915313720703, "global_step": 59962, "epoch": 495} {"train_loss": -32.43307113647461, "global_step": 59963, "epoch": 495} {"train_loss": -26.631250381469727, "global_step": 59964, "epoch": 495} {"train_loss": 4.508326530456543, "global_step": 59965, "epoch": 495} {"train_loss": -26.73064613342285, "global_step": 59966, "epoch": 495} {"train_loss": -5.894298553466797, "global_step": 59967, "epoch": 495} {"train_loss": -21.059795379638672, "global_step": 59968, "epoch": 495} {"train_loss": -27.070058822631836, "global_step": 59969, "epoch": 495} {"train_loss": -16.406082153320312, "global_step": 59970, "epoch": 495} {"train_loss": -21.44437026977539, "global_step": 59971, "epoch": 495} {"train_loss": -28.369104385375977, "global_step": 59972, "epoch": 495} {"train_loss": -27.63295555114746, "global_step": 59973, "epoch": 495} {"train_loss": -25.316373825073242, "global_step": 59974, "epoch": 495} {"train_loss": -25.069225311279297, "global_step": 59975, "epoch": 495} {"train_loss": -25.302352905273438, "global_step": 59976, "epoch": 495} {"train_loss": -29.2523193359375, "global_step": 59977, "epoch": 495} {"train_loss": -29.705163955688477, "global_step": 59978, "epoch": 495} {"train_loss": -29.843708038330078, "global_step": 59979, "epoch": 495} {"train_loss": -28.896894454956055, "global_step": 59980, "epoch": 495} {"train_loss": -28.807453155517578, "global_step": 59981, "epoch": 495} {"train_loss": -28.629133224487305, "global_step": 59982, "epoch": 495} {"train_loss": -29.953378677368164, "global_step": 59983, "epoch": 495} {"train_loss": -28.880029678344727, "global_step": 59984, "epoch": 495} {"train_loss": -31.912946701049805, "global_step": 59985, "epoch": 495} {"train_loss": -30.49349021911621, "global_step": 59986, "epoch": 495} {"train_loss": -31.0827693939209, "global_step": 59987, "epoch": 495} {"train_loss": -31.069211959838867, "global_step": 59988, "epoch": 495} {"train_loss": -30.594690322875977, "global_step": 59989, "epoch": 495} {"train_loss": -31.057449340820312, "global_step": 59990, "epoch": 495} {"train_loss": -31.21717643737793, "global_step": 59991, "epoch": 495} {"train_loss": -32.119564056396484, "global_step": 59992, "epoch": 495} {"train_loss": -31.63996696472168, "global_step": 59993, "epoch": 495} {"train_loss": -31.490650177001953, "global_step": 59994, "epoch": 495} {"train_loss": -32.058685302734375, "global_step": 59995, "epoch": 495} {"train_loss": -29.3780460357666, "global_step": 59996, "epoch": 495} {"train_loss": -25.87298583984375, "global_step": 59997, "epoch": 495} {"train_loss": -31.85201072692871, "global_step": 59998, "epoch": 495} {"train_loss": -28.757970809936523, "global_step": 59999, "epoch": 495} {"train_loss": -30.740461349487305, "global_step": 60000, "epoch": 495} {"train_loss": -27.621774673461914, "global_step": 60001, "epoch": 495} {"train_loss": -31.737218856811523, "global_step": 60002, "epoch": 495} {"train_loss": -31.58478355407715, "global_step": 60003, "epoch": 495} {"train_loss": -31.366750717163086, "global_step": 60004, "epoch": 495} {"train_loss": -31.753864288330078, "global_step": 60005, "epoch": 495} {"train_loss": -32.54364776611328, "global_step": 60006, "epoch": 495} {"train_loss": -31.105146408081055, "global_step": 60007, "epoch": 495} {"train_loss": -32.370975494384766, "global_step": 60008, "epoch": 495} {"train_loss": -32.013671875, "global_step": 60009, "epoch": 495} {"train_loss": -31.23432731628418, "global_step": 60010, "epoch": 495} {"train_loss": -28.756345748901367, "global_step": 60011, "epoch": 495} {"train_loss": -28.173797607421875, "global_step": 60012, "epoch": 495} {"train_loss": -32.790340423583984, "global_step": 60013, "epoch": 495} {"train_loss": -30.2569580078125, "global_step": 60014, "epoch": 495} {"train_loss": -32.58577506798358, "global_step": 60015, "epoch": 495, "val_loss": 2589048.25} {"train_loss": -32.15291976928711, "global_step": 60016, "epoch": 496} {"train_loss": -32.389888763427734, "global_step": 60017, "epoch": 496} {"train_loss": -33.1275634765625, "global_step": 60018, "epoch": 496} {"train_loss": -32.4390754699707, "global_step": 60019, "epoch": 496} {"train_loss": -32.78022766113281, "global_step": 60020, "epoch": 496} {"train_loss": -33.007545471191406, "global_step": 60021, "epoch": 496} {"train_loss": -32.823577880859375, "global_step": 60022, "epoch": 496} {"train_loss": -33.09574508666992, "global_step": 60023, "epoch": 496} {"train_loss": -32.73398971557617, "global_step": 60024, "epoch": 496} {"train_loss": -32.929046630859375, "global_step": 60025, "epoch": 496} {"train_loss": -32.5371208190918, "global_step": 60026, "epoch": 496} {"train_loss": -31.929950714111328, "global_step": 60027, "epoch": 496} {"train_loss": -32.02982711791992, "global_step": 60028, "epoch": 496} {"train_loss": -33.43389892578125, "global_step": 60029, "epoch": 496} {"train_loss": -33.01908493041992, "global_step": 60030, "epoch": 496} {"train_loss": -32.060203552246094, "global_step": 60031, "epoch": 496} {"train_loss": -28.4573917388916, "global_step": 60032, "epoch": 496} {"train_loss": -21.96755027770996, "global_step": 60033, "epoch": 496} {"train_loss": -30.721643447875977, "global_step": 60034, "epoch": 496} {"train_loss": -28.558069229125977, "global_step": 60035, "epoch": 496} {"train_loss": -31.730146408081055, "global_step": 60036, "epoch": 496} {"train_loss": -29.095632553100586, "global_step": 60037, "epoch": 496} {"train_loss": -33.19926071166992, "global_step": 60038, "epoch": 496} {"train_loss": -29.528213500976562, "global_step": 60039, "epoch": 496} {"train_loss": -32.63054656982422, "global_step": 60040, "epoch": 496} {"train_loss": -32.28078842163086, "global_step": 60041, "epoch": 496} {"train_loss": -31.891845703125, "global_step": 60042, "epoch": 496} {"train_loss": -31.1070556640625, "global_step": 60043, "epoch": 496} {"train_loss": -32.50095748901367, "global_step": 60044, "epoch": 496} {"train_loss": -32.49449920654297, "global_step": 60045, "epoch": 496} {"train_loss": -31.30853271484375, "global_step": 60046, "epoch": 496} {"train_loss": -27.488462448120117, "global_step": 60047, "epoch": 496} {"train_loss": -18.892431259155273, "global_step": 60048, "epoch": 496} {"train_loss": -30.8110408782959, "global_step": 60049, "epoch": 496} {"train_loss": -27.419055938720703, "global_step": 60050, "epoch": 496} {"train_loss": -31.931461334228516, "global_step": 60051, "epoch": 496} {"train_loss": -28.209497451782227, "global_step": 60052, "epoch": 496} {"train_loss": -32.23733139038086, "global_step": 60053, "epoch": 496} {"train_loss": -31.5906925201416, "global_step": 60054, "epoch": 496} {"train_loss": -29.4697322845459, "global_step": 60055, "epoch": 496} {"train_loss": -32.292293548583984, "global_step": 60056, "epoch": 496} {"train_loss": -31.79740333557129, "global_step": 60057, "epoch": 496} {"train_loss": -31.776838302612305, "global_step": 60058, "epoch": 496} {"train_loss": -32.73372268676758, "global_step": 60059, "epoch": 496} {"train_loss": -32.56769943237305, "global_step": 60060, "epoch": 496} {"train_loss": -32.407047271728516, "global_step": 60061, "epoch": 496} {"train_loss": -32.39006423950195, "global_step": 60062, "epoch": 496} {"train_loss": -32.33189010620117, "global_step": 60063, "epoch": 496} {"train_loss": -32.8421745300293, "global_step": 60064, "epoch": 496} {"train_loss": -32.73336410522461, "global_step": 60065, "epoch": 496} {"train_loss": -32.70283126831055, "global_step": 60066, "epoch": 496} {"train_loss": -32.47532653808594, "global_step": 60067, "epoch": 496} {"train_loss": -32.585296630859375, "global_step": 60068, "epoch": 496} {"train_loss": -32.869686126708984, "global_step": 60069, "epoch": 496} {"train_loss": -33.424713134765625, "global_step": 60070, "epoch": 496} {"train_loss": -33.11723709106445, "global_step": 60071, "epoch": 496} {"train_loss": -32.865230560302734, "global_step": 60072, "epoch": 496} {"train_loss": -33.44814682006836, "global_step": 60073, "epoch": 496} {"train_loss": -33.5645866394043, "global_step": 60074, "epoch": 496} {"train_loss": -33.36711502075195, "global_step": 60075, "epoch": 496} {"train_loss": -32.82697677612305, "global_step": 60076, "epoch": 496} {"train_loss": -33.88752365112305, "global_step": 60077, "epoch": 496} {"train_loss": -33.574134826660156, "global_step": 60078, "epoch": 496} {"train_loss": -34.019142150878906, "global_step": 60079, "epoch": 496} {"train_loss": -34.10847473144531, "global_step": 60080, "epoch": 496} {"train_loss": -33.70406723022461, "global_step": 60081, "epoch": 496} {"train_loss": -33.86749267578125, "global_step": 60082, "epoch": 496} {"train_loss": -33.84016418457031, "global_step": 60083, "epoch": 496} {"train_loss": -33.9365119934082, "global_step": 60084, "epoch": 496} {"train_loss": -33.96992874145508, "global_step": 60085, "epoch": 496} {"train_loss": -33.644691467285156, "global_step": 60086, "epoch": 496} {"train_loss": -34.18989181518555, "global_step": 60087, "epoch": 496} {"train_loss": -34.17988967895508, "global_step": 60088, "epoch": 496} {"train_loss": -34.375118255615234, "global_step": 60089, "epoch": 496} {"train_loss": -34.2370719909668, "global_step": 60090, "epoch": 496} {"train_loss": -34.384117126464844, "global_step": 60091, "epoch": 496} {"train_loss": -34.56028747558594, "global_step": 60092, "epoch": 496} {"train_loss": -33.7273063659668, "global_step": 60093, "epoch": 496} {"train_loss": -29.111425399780273, "global_step": 60094, "epoch": 496} {"train_loss": -8.968347549438477, "global_step": 60095, "epoch": 496} {"train_loss": -21.110877990722656, "global_step": 60096, "epoch": 496} {"train_loss": -23.6729679107666, "global_step": 60097, "epoch": 496} {"train_loss": -27.916486740112305, "global_step": 60098, "epoch": 496} {"train_loss": -22.990076065063477, "global_step": 60099, "epoch": 496} {"train_loss": -32.48752975463867, "global_step": 60100, "epoch": 496} {"train_loss": -26.148807525634766, "global_step": 60101, "epoch": 496} {"train_loss": -28.437088012695312, "global_step": 60102, "epoch": 496} {"train_loss": -32.7911491394043, "global_step": 60103, "epoch": 496} {"train_loss": -32.33223342895508, "global_step": 60104, "epoch": 496} {"train_loss": -30.40639305114746, "global_step": 60105, "epoch": 496} {"train_loss": -31.262664794921875, "global_step": 60106, "epoch": 496} {"train_loss": -32.65669631958008, "global_step": 60107, "epoch": 496} {"train_loss": -32.86318588256836, "global_step": 60108, "epoch": 496} {"train_loss": -32.73381042480469, "global_step": 60109, "epoch": 496} {"train_loss": -32.03998947143555, "global_step": 60110, "epoch": 496} {"train_loss": -32.44035339355469, "global_step": 60111, "epoch": 496} {"train_loss": -33.51710510253906, "global_step": 60112, "epoch": 496} {"train_loss": -34.00098419189453, "global_step": 60113, "epoch": 496} {"train_loss": -32.98061752319336, "global_step": 60114, "epoch": 496} {"train_loss": -32.50497055053711, "global_step": 60115, "epoch": 496} {"train_loss": -32.403839111328125, "global_step": 60116, "epoch": 496} {"train_loss": -32.98897933959961, "global_step": 60117, "epoch": 496} {"train_loss": -33.235626220703125, "global_step": 60118, "epoch": 496} {"train_loss": -33.152854919433594, "global_step": 60119, "epoch": 496} {"train_loss": -33.845848083496094, "global_step": 60120, "epoch": 496} {"train_loss": -33.045597076416016, "global_step": 60121, "epoch": 496} {"train_loss": -33.34846878051758, "global_step": 60122, "epoch": 496} {"train_loss": -33.63580322265625, "global_step": 60123, "epoch": 496} {"train_loss": -33.1701545715332, "global_step": 60124, "epoch": 496} {"train_loss": -34.08612823486328, "global_step": 60125, "epoch": 496} {"train_loss": -33.180274963378906, "global_step": 60126, "epoch": 496} {"train_loss": -33.34358215332031, "global_step": 60127, "epoch": 496} {"train_loss": -33.34154510498047, "global_step": 60128, "epoch": 496} {"train_loss": -33.96033477783203, "global_step": 60129, "epoch": 496} {"train_loss": -33.58087921142578, "global_step": 60130, "epoch": 496} {"train_loss": -33.508975982666016, "global_step": 60131, "epoch": 496} {"train_loss": -33.791107177734375, "global_step": 60132, "epoch": 496} {"train_loss": -33.723506927490234, "global_step": 60133, "epoch": 496} {"train_loss": -33.91796875, "global_step": 60134, "epoch": 496} {"train_loss": -34.05302047729492, "global_step": 60135, "epoch": 496} {"train_loss": -31.820775654690326, "global_step": 60136, "epoch": 496, "val_loss": 2655853.0} {"train_loss": -33.97647476196289, "global_step": 60137, "epoch": 497} {"train_loss": -33.806312561035156, "global_step": 60138, "epoch": 497} {"train_loss": -33.87498092651367, "global_step": 60139, "epoch": 497} {"train_loss": -34.18617630004883, "global_step": 60140, "epoch": 497} {"train_loss": -33.59756851196289, "global_step": 60141, "epoch": 497} {"train_loss": -33.381256103515625, "global_step": 60142, "epoch": 497} {"train_loss": -33.8213996887207, "global_step": 60143, "epoch": 497} {"train_loss": -33.244014739990234, "global_step": 60144, "epoch": 497} {"train_loss": -30.70588493347168, "global_step": 60145, "epoch": 497} {"train_loss": -29.557214736938477, "global_step": 60146, "epoch": 497} {"train_loss": -33.846675872802734, "global_step": 60147, "epoch": 497} {"train_loss": -28.807769775390625, "global_step": 60148, "epoch": 497} {"train_loss": -30.848783493041992, "global_step": 60149, "epoch": 497} {"train_loss": -28.897220611572266, "global_step": 60150, "epoch": 497} {"train_loss": -33.695953369140625, "global_step": 60151, "epoch": 497} {"train_loss": -31.00784683227539, "global_step": 60152, "epoch": 497} {"train_loss": -33.53229904174805, "global_step": 60153, "epoch": 497} {"train_loss": -32.33298873901367, "global_step": 60154, "epoch": 497} {"train_loss": -33.6760368347168, "global_step": 60155, "epoch": 497} {"train_loss": -33.16501998901367, "global_step": 60156, "epoch": 497} {"train_loss": -32.77734375, "global_step": 60157, "epoch": 497} {"train_loss": -33.67522430419922, "global_step": 60158, "epoch": 497} {"train_loss": -34.093170166015625, "global_step": 60159, "epoch": 497} {"train_loss": -32.67021942138672, "global_step": 60160, "epoch": 497} {"train_loss": -34.65230941772461, "global_step": 60161, "epoch": 497} {"train_loss": -34.0257568359375, "global_step": 60162, "epoch": 497} {"train_loss": -33.16102981567383, "global_step": 60163, "epoch": 497} {"train_loss": -33.91755294799805, "global_step": 60164, "epoch": 497} {"train_loss": -34.08943176269531, "global_step": 60165, "epoch": 497} {"train_loss": -33.52793502807617, "global_step": 60166, "epoch": 497} {"train_loss": -32.982730865478516, "global_step": 60167, "epoch": 497} {"train_loss": -32.971187591552734, "global_step": 60168, "epoch": 497} {"train_loss": -34.15998458862305, "global_step": 60169, "epoch": 497} {"train_loss": -33.91318893432617, "global_step": 60170, "epoch": 497} {"train_loss": -34.062740325927734, "global_step": 60171, "epoch": 497} {"train_loss": -32.65287780761719, "global_step": 60172, "epoch": 497} {"train_loss": -33.39222717285156, "global_step": 60173, "epoch": 497} {"train_loss": -33.32891845703125, "global_step": 60174, "epoch": 497} {"train_loss": -33.41462707519531, "global_step": 60175, "epoch": 497} {"train_loss": -33.308101654052734, "global_step": 60176, "epoch": 497} {"train_loss": -33.54997634887695, "global_step": 60177, "epoch": 497} {"train_loss": -34.44207763671875, "global_step": 60178, "epoch": 497} {"train_loss": -34.72184371948242, "global_step": 60179, "epoch": 497} {"train_loss": -34.1644401550293, "global_step": 60180, "epoch": 497} {"train_loss": -34.05137252807617, "global_step": 60181, "epoch": 497} {"train_loss": -34.47621536254883, "global_step": 60182, "epoch": 497} {"train_loss": -34.12123489379883, "global_step": 60183, "epoch": 497} {"train_loss": -34.0615234375, "global_step": 60184, "epoch": 497} {"train_loss": -34.63396453857422, "global_step": 60185, "epoch": 497} {"train_loss": -34.760162353515625, "global_step": 60186, "epoch": 497} {"train_loss": -34.02781677246094, "global_step": 60187, "epoch": 497} {"train_loss": -34.36213302612305, "global_step": 60188, "epoch": 497} {"train_loss": -34.169185638427734, "global_step": 60189, "epoch": 497} {"train_loss": -33.79730987548828, "global_step": 60190, "epoch": 497} {"train_loss": -34.207244873046875, "global_step": 60191, "epoch": 497} {"train_loss": -34.48244857788086, "global_step": 60192, "epoch": 497} {"train_loss": -24.870840072631836, "global_step": 60193, "epoch": 497} {"train_loss": -33.81174850463867, "global_step": 60194, "epoch": 497} {"train_loss": -33.65153121948242, "global_step": 60195, "epoch": 497} {"train_loss": -24.755762100219727, "global_step": 60196, "epoch": 497} {"train_loss": -31.369754791259766, "global_step": 60197, "epoch": 497} {"train_loss": -30.28515625, "global_step": 60198, "epoch": 497} {"train_loss": -31.922571182250977, "global_step": 60199, "epoch": 497} {"train_loss": -32.88724899291992, "global_step": 60200, "epoch": 497} {"train_loss": -32.20529556274414, "global_step": 60201, "epoch": 497} {"train_loss": -30.233325958251953, "global_step": 60202, "epoch": 497} {"train_loss": -30.537206649780273, "global_step": 60203, "epoch": 497} {"train_loss": -31.49848747253418, "global_step": 60204, "epoch": 497} {"train_loss": -30.543659210205078, "global_step": 60205, "epoch": 497} {"train_loss": -29.82258415222168, "global_step": 60206, "epoch": 497} {"train_loss": -32.94647216796875, "global_step": 60207, "epoch": 497} {"train_loss": -33.042213439941406, "global_step": 60208, "epoch": 497} {"train_loss": -30.96184730529785, "global_step": 60209, "epoch": 497} {"train_loss": -32.54297637939453, "global_step": 60210, "epoch": 497} {"train_loss": -33.14179611206055, "global_step": 60211, "epoch": 497} {"train_loss": -29.586135864257812, "global_step": 60212, "epoch": 497} {"train_loss": -32.946922302246094, "global_step": 60213, "epoch": 497} {"train_loss": -32.51682662963867, "global_step": 60214, "epoch": 497} {"train_loss": -32.14326095581055, "global_step": 60215, "epoch": 497} {"train_loss": -32.85155487060547, "global_step": 60216, "epoch": 497} {"train_loss": -30.9174747467041, "global_step": 60217, "epoch": 497} {"train_loss": -32.28455352783203, "global_step": 60218, "epoch": 497} {"train_loss": -31.286630630493164, "global_step": 60219, "epoch": 497} {"train_loss": -32.82057571411133, "global_step": 60220, "epoch": 497} {"train_loss": -32.30952072143555, "global_step": 60221, "epoch": 497} {"train_loss": -32.6185417175293, "global_step": 60222, "epoch": 497} {"train_loss": -30.998868942260742, "global_step": 60223, "epoch": 497} {"train_loss": -31.391345977783203, "global_step": 60224, "epoch": 497} {"train_loss": -31.852991104125977, "global_step": 60225, "epoch": 497} {"train_loss": -31.359975814819336, "global_step": 60226, "epoch": 497} {"train_loss": -32.34658432006836, "global_step": 60227, "epoch": 497} {"train_loss": -33.12752914428711, "global_step": 60228, "epoch": 497} {"train_loss": -31.78118324279785, "global_step": 60229, "epoch": 497} {"train_loss": -32.26049041748047, "global_step": 60230, "epoch": 497} {"train_loss": -32.66514587402344, "global_step": 60231, "epoch": 497} {"train_loss": -31.320226669311523, "global_step": 60232, "epoch": 497} {"train_loss": -33.35710906982422, "global_step": 60233, "epoch": 497} {"train_loss": -28.005664825439453, "global_step": 60234, "epoch": 497} {"train_loss": -32.925777435302734, "global_step": 60235, "epoch": 497} {"train_loss": -32.58270263671875, "global_step": 60236, "epoch": 497} {"train_loss": -33.32075500488281, "global_step": 60237, "epoch": 497} {"train_loss": -31.820697784423828, "global_step": 60238, "epoch": 497} {"train_loss": -32.81742858886719, "global_step": 60239, "epoch": 497} {"train_loss": -31.530323028564453, "global_step": 60240, "epoch": 497} {"train_loss": -31.985736846923828, "global_step": 60241, "epoch": 497} {"train_loss": -32.69346618652344, "global_step": 60242, "epoch": 497} {"train_loss": -32.73195266723633, "global_step": 60243, "epoch": 497} {"train_loss": -31.657922744750977, "global_step": 60244, "epoch": 497} {"train_loss": -32.63290023803711, "global_step": 60245, "epoch": 497} {"train_loss": -30.713193893432617, "global_step": 60246, "epoch": 497} {"train_loss": -31.741392135620117, "global_step": 60247, "epoch": 497} {"train_loss": -31.902820587158203, "global_step": 60248, "epoch": 497} {"train_loss": -33.284114837646484, "global_step": 60249, "epoch": 497} {"train_loss": -33.31831359863281, "global_step": 60250, "epoch": 497} {"train_loss": -32.31240463256836, "global_step": 60251, "epoch": 497} {"train_loss": -32.252174377441406, "global_step": 60252, "epoch": 497} {"train_loss": -32.6963996887207, "global_step": 60253, "epoch": 497} {"train_loss": -33.18981170654297, "global_step": 60254, "epoch": 497} {"train_loss": -32.688987731933594, "global_step": 60255, "epoch": 497} {"train_loss": -33.180145263671875, "global_step": 60256, "epoch": 497} {"train_loss": -32.551332804782334, "global_step": 60257, "epoch": 497, "val_loss": 2581204.25} {"train_loss": -31.89208984375, "global_step": 60258, "epoch": 498} {"train_loss": -32.5126838684082, "global_step": 60259, "epoch": 498} {"train_loss": -32.1832160949707, "global_step": 60260, "epoch": 498} {"train_loss": -32.45918655395508, "global_step": 60261, "epoch": 498} {"train_loss": -32.60358428955078, "global_step": 60262, "epoch": 498} {"train_loss": -32.209598541259766, "global_step": 60263, "epoch": 498} {"train_loss": -33.07146072387695, "global_step": 60264, "epoch": 498} {"train_loss": -33.6876335144043, "global_step": 60265, "epoch": 498} {"train_loss": -32.786956787109375, "global_step": 60266, "epoch": 498} {"train_loss": -32.705745697021484, "global_step": 60267, "epoch": 498} {"train_loss": -33.74858856201172, "global_step": 60268, "epoch": 498} {"train_loss": -33.4412956237793, "global_step": 60269, "epoch": 498} {"train_loss": -32.402618408203125, "global_step": 60270, "epoch": 498} {"train_loss": -31.057220458984375, "global_step": 60271, "epoch": 498} {"train_loss": -33.372859954833984, "global_step": 60272, "epoch": 498} {"train_loss": -33.88912582397461, "global_step": 60273, "epoch": 498} {"train_loss": -33.666595458984375, "global_step": 60274, "epoch": 498} {"train_loss": -33.59126663208008, "global_step": 60275, "epoch": 498} {"train_loss": -33.82455062866211, "global_step": 60276, "epoch": 498} {"train_loss": -33.91109848022461, "global_step": 60277, "epoch": 498} {"train_loss": -34.15913009643555, "global_step": 60278, "epoch": 498} {"train_loss": -33.30218505859375, "global_step": 60279, "epoch": 498} {"train_loss": -34.1154670715332, "global_step": 60280, "epoch": 498} {"train_loss": -33.74686813354492, "global_step": 60281, "epoch": 498} {"train_loss": -34.29157638549805, "global_step": 60282, "epoch": 498} {"train_loss": -34.35797119140625, "global_step": 60283, "epoch": 498} {"train_loss": -34.27798080444336, "global_step": 60284, "epoch": 498} {"train_loss": -34.32302474975586, "global_step": 60285, "epoch": 498} {"train_loss": -34.01791763305664, "global_step": 60286, "epoch": 498} {"train_loss": -34.55681610107422, "global_step": 60287, "epoch": 498} {"train_loss": -34.43658447265625, "global_step": 60288, "epoch": 498} {"train_loss": -34.46138000488281, "global_step": 60289, "epoch": 498} {"train_loss": -34.33799362182617, "global_step": 60290, "epoch": 498} {"train_loss": -34.70359420776367, "global_step": 60291, "epoch": 498} {"train_loss": -34.59729766845703, "global_step": 60292, "epoch": 498} {"train_loss": -33.858001708984375, "global_step": 60293, "epoch": 498} {"train_loss": -34.783790588378906, "global_step": 60294, "epoch": 498} {"train_loss": -34.07340621948242, "global_step": 60295, "epoch": 498} {"train_loss": -34.61247634887695, "global_step": 60296, "epoch": 498} {"train_loss": -34.75254821777344, "global_step": 60297, "epoch": 498} {"train_loss": -34.51066589355469, "global_step": 60298, "epoch": 498} {"train_loss": -34.317684173583984, "global_step": 60299, "epoch": 498} {"train_loss": -32.73594284057617, "global_step": 60300, "epoch": 498} {"train_loss": -28.963815689086914, "global_step": 60301, "epoch": 498} {"train_loss": -23.494428634643555, "global_step": 60302, "epoch": 498} {"train_loss": -19.882183074951172, "global_step": 60303, "epoch": 498} {"train_loss": -34.016822814941406, "global_step": 60304, "epoch": 498} {"train_loss": -27.035131454467773, "global_step": 60305, "epoch": 498} {"train_loss": -33.85333251953125, "global_step": 60306, "epoch": 498} {"train_loss": -28.947717666625977, "global_step": 60307, "epoch": 498} {"train_loss": -34.10759353637695, "global_step": 60308, "epoch": 498} {"train_loss": -29.5821590423584, "global_step": 60309, "epoch": 498} {"train_loss": -31.731311798095703, "global_step": 60310, "epoch": 498} {"train_loss": -33.89812469482422, "global_step": 60311, "epoch": 498} {"train_loss": -32.43098068237305, "global_step": 60312, "epoch": 498} {"train_loss": -33.2958984375, "global_step": 60313, "epoch": 498} {"train_loss": -34.160213470458984, "global_step": 60314, "epoch": 498} {"train_loss": -33.850616455078125, "global_step": 60315, "epoch": 498} {"train_loss": -29.732120513916016, "global_step": 60316, "epoch": 498} {"train_loss": -33.02910232543945, "global_step": 60317, "epoch": 498} {"train_loss": -34.629310607910156, "global_step": 60318, "epoch": 498} {"train_loss": -33.83305740356445, "global_step": 60319, "epoch": 498} {"train_loss": -32.04381561279297, "global_step": 60320, "epoch": 498} {"train_loss": -29.5566349029541, "global_step": 60321, "epoch": 498} {"train_loss": -34.489009857177734, "global_step": 60322, "epoch": 498} {"train_loss": -33.42495346069336, "global_step": 60323, "epoch": 498} {"train_loss": -33.90966796875, "global_step": 60324, "epoch": 498} {"train_loss": -33.82123947143555, "global_step": 60325, "epoch": 498} {"train_loss": -32.803382873535156, "global_step": 60326, "epoch": 498} {"train_loss": -33.478309631347656, "global_step": 60327, "epoch": 498} {"train_loss": -33.655757904052734, "global_step": 60328, "epoch": 498} {"train_loss": -33.37388229370117, "global_step": 60329, "epoch": 498} {"train_loss": -33.09815979003906, "global_step": 60330, "epoch": 498} {"train_loss": -33.882469177246094, "global_step": 60331, "epoch": 498} {"train_loss": -33.67335510253906, "global_step": 60332, "epoch": 498} {"train_loss": -34.042884826660156, "global_step": 60333, "epoch": 498} {"train_loss": -33.13541793823242, "global_step": 60334, "epoch": 498} {"train_loss": -33.464210510253906, "global_step": 60335, "epoch": 498} {"train_loss": -33.96929168701172, "global_step": 60336, "epoch": 498} {"train_loss": -33.927913665771484, "global_step": 60337, "epoch": 498} {"train_loss": -34.61724853515625, "global_step": 60338, "epoch": 498} {"train_loss": -34.26968765258789, "global_step": 60339, "epoch": 498} {"train_loss": -33.57688903808594, "global_step": 60340, "epoch": 498} {"train_loss": -33.95954132080078, "global_step": 60341, "epoch": 498} {"train_loss": -33.54175567626953, "global_step": 60342, "epoch": 498} {"train_loss": -33.26972198486328, "global_step": 60343, "epoch": 498} {"train_loss": -34.61579513549805, "global_step": 60344, "epoch": 498} {"train_loss": -33.83857727050781, "global_step": 60345, "epoch": 498} {"train_loss": -34.45559310913086, "global_step": 60346, "epoch": 498} {"train_loss": -34.47648239135742, "global_step": 60347, "epoch": 498} {"train_loss": -34.32893371582031, "global_step": 60348, "epoch": 498} {"train_loss": -34.61713409423828, "global_step": 60349, "epoch": 498} {"train_loss": -34.7723503112793, "global_step": 60350, "epoch": 498} {"train_loss": -34.2276611328125, "global_step": 60351, "epoch": 498} {"train_loss": -34.75511932373047, "global_step": 60352, "epoch": 498} {"train_loss": -35.015655517578125, "global_step": 60353, "epoch": 498} {"train_loss": -34.609901428222656, "global_step": 60354, "epoch": 498} {"train_loss": -34.80298614501953, "global_step": 60355, "epoch": 498} {"train_loss": -34.888336181640625, "global_step": 60356, "epoch": 498} {"train_loss": -35.139129638671875, "global_step": 60357, "epoch": 498} {"train_loss": -35.11690902709961, "global_step": 60358, "epoch": 498} {"train_loss": -34.840755462646484, "global_step": 60359, "epoch": 498} {"train_loss": -34.82207107543945, "global_step": 60360, "epoch": 498} {"train_loss": -34.74170684814453, "global_step": 60361, "epoch": 498} {"train_loss": -34.84159469604492, "global_step": 60362, "epoch": 498} {"train_loss": -34.94633102416992, "global_step": 60363, "epoch": 498} {"train_loss": -35.687408447265625, "global_step": 60364, "epoch": 498} {"train_loss": -35.15110397338867, "global_step": 60365, "epoch": 498} {"train_loss": -34.62392807006836, "global_step": 60366, "epoch": 498} {"train_loss": -35.623817443847656, "global_step": 60367, "epoch": 498} {"train_loss": -35.21185302734375, "global_step": 60368, "epoch": 498} {"train_loss": -35.136966705322266, "global_step": 60369, "epoch": 498} {"train_loss": -35.3952751159668, "global_step": 60370, "epoch": 498} {"train_loss": -35.36487579345703, "global_step": 60371, "epoch": 498} {"train_loss": -35.653961181640625, "global_step": 60372, "epoch": 498} {"train_loss": -35.10238265991211, "global_step": 60373, "epoch": 498} {"train_loss": -35.384857177734375, "global_step": 60374, "epoch": 498} {"train_loss": -34.94752883911133, "global_step": 60375, "epoch": 498} {"train_loss": -35.55855178833008, "global_step": 60376, "epoch": 498} {"train_loss": -34.97701644897461, "global_step": 60377, "epoch": 498} {"train_loss": -33.581926109377015, "global_step": 60378, "epoch": 498, "val_loss": 2637762.0} {"train_loss": -34.63679122924805, "global_step": 60379, "epoch": 499} {"train_loss": -34.1015625, "global_step": 60380, "epoch": 499} {"train_loss": -33.384891510009766, "global_step": 60381, "epoch": 499} {"train_loss": -35.32407760620117, "global_step": 60382, "epoch": 499} {"train_loss": -35.77446365356445, "global_step": 60383, "epoch": 499} {"train_loss": -35.85426330566406, "global_step": 60384, "epoch": 499} {"train_loss": -35.476741790771484, "global_step": 60385, "epoch": 499} {"train_loss": -35.13902282714844, "global_step": 60386, "epoch": 499} {"train_loss": -35.04738998413086, "global_step": 60387, "epoch": 499} {"train_loss": -36.04789352416992, "global_step": 60388, "epoch": 499} {"train_loss": -33.703330993652344, "global_step": 60389, "epoch": 499} {"train_loss": -35.19718551635742, "global_step": 60390, "epoch": 499} {"train_loss": -34.97493362426758, "global_step": 60391, "epoch": 499} {"train_loss": -35.181636810302734, "global_step": 60392, "epoch": 499} {"train_loss": -34.375160217285156, "global_step": 60393, "epoch": 499} {"train_loss": -35.17484664916992, "global_step": 60394, "epoch": 499} {"train_loss": -34.382198333740234, "global_step": 60395, "epoch": 499} {"train_loss": -33.50702667236328, "global_step": 60396, "epoch": 499} {"train_loss": -35.19208526611328, "global_step": 60397, "epoch": 499} {"train_loss": -32.230445861816406, "global_step": 60398, "epoch": 499} {"train_loss": -35.605003356933594, "global_step": 60399, "epoch": 499} {"train_loss": -34.42058181762695, "global_step": 60400, "epoch": 499} {"train_loss": -34.821903228759766, "global_step": 60401, "epoch": 499} {"train_loss": -34.37160873413086, "global_step": 60402, "epoch": 499} {"train_loss": -35.38105010986328, "global_step": 60403, "epoch": 499} {"train_loss": -34.12038803100586, "global_step": 60404, "epoch": 499} {"train_loss": -33.825408935546875, "global_step": 60405, "epoch": 499} {"train_loss": -33.79657745361328, "global_step": 60406, "epoch": 499} {"train_loss": -34.5297966003418, "global_step": 60407, "epoch": 499} {"train_loss": -34.79907989501953, "global_step": 60408, "epoch": 499} {"train_loss": -32.5400276184082, "global_step": 60409, "epoch": 499} {"train_loss": -34.79488754272461, "global_step": 60410, "epoch": 499} {"train_loss": -32.71804428100586, "global_step": 60411, "epoch": 499} {"train_loss": -33.228492736816406, "global_step": 60412, "epoch": 499} {"train_loss": -34.94692611694336, "global_step": 60413, "epoch": 499} {"train_loss": -32.75814437866211, "global_step": 60414, "epoch": 499} {"train_loss": -33.81024169921875, "global_step": 60415, "epoch": 499} {"train_loss": -33.357330322265625, "global_step": 60416, "epoch": 499} {"train_loss": -34.11025619506836, "global_step": 60417, "epoch": 499} {"train_loss": -34.05652618408203, "global_step": 60418, "epoch": 499} {"train_loss": -34.59387969970703, "global_step": 60419, "epoch": 499} {"train_loss": -34.459651947021484, "global_step": 60420, "epoch": 499} {"train_loss": -33.531036376953125, "global_step": 60421, "epoch": 499} {"train_loss": -31.934080123901367, "global_step": 60422, "epoch": 499} {"train_loss": -33.159339904785156, "global_step": 60423, "epoch": 499} {"train_loss": -33.616146087646484, "global_step": 60424, "epoch": 499} {"train_loss": -33.48883056640625, "global_step": 60425, "epoch": 499} {"train_loss": -33.173240661621094, "global_step": 60426, "epoch": 499} {"train_loss": -34.77912139892578, "global_step": 60427, "epoch": 499} {"train_loss": -32.1428337097168, "global_step": 60428, "epoch": 499} {"train_loss": -34.595314025878906, "global_step": 60429, "epoch": 499} {"train_loss": -34.094905853271484, "global_step": 60430, "epoch": 499} {"train_loss": -34.573089599609375, "global_step": 60431, "epoch": 499} {"train_loss": -33.89326858520508, "global_step": 60432, "epoch": 499} {"train_loss": -34.47516632080078, "global_step": 60433, "epoch": 499} {"train_loss": -33.47796630859375, "global_step": 60434, "epoch": 499} {"train_loss": -34.32914352416992, "global_step": 60435, "epoch": 499} {"train_loss": -33.83376693725586, "global_step": 60436, "epoch": 499} {"train_loss": -34.42677307128906, "global_step": 60437, "epoch": 499} {"train_loss": -33.89680862426758, "global_step": 60438, "epoch": 499} {"train_loss": -35.23432159423828, "global_step": 60439, "epoch": 499} {"train_loss": -35.50557327270508, "global_step": 60440, "epoch": 499} {"train_loss": -34.097225189208984, "global_step": 60441, "epoch": 499} {"train_loss": -34.69993209838867, "global_step": 60442, "epoch": 499} {"train_loss": -34.493408203125, "global_step": 60443, "epoch": 499} {"train_loss": -34.28689193725586, "global_step": 60444, "epoch": 499} {"train_loss": -34.37428283691406, "global_step": 60445, "epoch": 499} {"train_loss": -35.419734954833984, "global_step": 60446, "epoch": 499} {"train_loss": -34.74576950073242, "global_step": 60447, "epoch": 499} {"train_loss": -34.655025482177734, "global_step": 60448, "epoch": 499} {"train_loss": -35.60789108276367, "global_step": 60449, "epoch": 499} {"train_loss": -35.464717864990234, "global_step": 60450, "epoch": 499} {"train_loss": -35.144649505615234, "global_step": 60451, "epoch": 499} {"train_loss": -35.67389678955078, "global_step": 60452, "epoch": 499} {"train_loss": -35.60804748535156, "global_step": 60453, "epoch": 499} {"train_loss": -35.56099319458008, "global_step": 60454, "epoch": 499} {"train_loss": -35.0771484375, "global_step": 60455, "epoch": 499} {"train_loss": -35.26028823852539, "global_step": 60456, "epoch": 499} {"train_loss": -35.73825454711914, "global_step": 60457, "epoch": 499} {"train_loss": -35.29970169067383, "global_step": 60458, "epoch": 499} {"train_loss": -35.39632797241211, "global_step": 60459, "epoch": 499} {"train_loss": -35.417510986328125, "global_step": 60460, "epoch": 499} {"train_loss": -33.47866439819336, "global_step": 60461, "epoch": 499} {"train_loss": -28.294879913330078, "global_step": 60462, "epoch": 499} {"train_loss": -22.301408767700195, "global_step": 60463, "epoch": 499} {"train_loss": -23.19257926940918, "global_step": 60464, "epoch": 499} {"train_loss": -34.98224639892578, "global_step": 60465, "epoch": 499} {"train_loss": -28.47617530822754, "global_step": 60466, "epoch": 499} {"train_loss": -32.9759635925293, "global_step": 60467, "epoch": 499} {"train_loss": -30.270353317260742, "global_step": 60468, "epoch": 499} {"train_loss": -34.12177658081055, "global_step": 60469, "epoch": 499} {"train_loss": -31.261917114257812, "global_step": 60470, "epoch": 499} {"train_loss": -34.5029411315918, "global_step": 60471, "epoch": 499} {"train_loss": -31.799331665039062, "global_step": 60472, "epoch": 499} {"train_loss": -34.914119720458984, "global_step": 60473, "epoch": 499} {"train_loss": -33.93540573120117, "global_step": 60474, "epoch": 499} {"train_loss": -33.70015335083008, "global_step": 60475, "epoch": 499} {"train_loss": -34.59922409057617, "global_step": 60476, "epoch": 499} {"train_loss": -33.65631103515625, "global_step": 60477, "epoch": 499} {"train_loss": -34.509029388427734, "global_step": 60478, "epoch": 499} {"train_loss": -34.15874099731445, "global_step": 60479, "epoch": 499} {"train_loss": -34.6901969909668, "global_step": 60480, "epoch": 499} {"train_loss": -34.46940994262695, "global_step": 60481, "epoch": 499} {"train_loss": -34.46236038208008, "global_step": 60482, "epoch": 499} {"train_loss": -35.56356430053711, "global_step": 60483, "epoch": 499} {"train_loss": -34.88186264038086, "global_step": 60484, "epoch": 499} {"train_loss": -34.68660354614258, "global_step": 60485, "epoch": 499} {"train_loss": -35.36240768432617, "global_step": 60486, "epoch": 499} {"train_loss": -34.658321380615234, "global_step": 60487, "epoch": 499} {"train_loss": -34.83366012573242, "global_step": 60488, "epoch": 499} {"train_loss": -35.22343826293945, "global_step": 60489, "epoch": 499} {"train_loss": -35.5059700012207, "global_step": 60490, "epoch": 499} {"train_loss": -35.38652420043945, "global_step": 60491, "epoch": 499} {"train_loss": -35.48035430908203, "global_step": 60492, "epoch": 499} {"train_loss": -35.63151931762695, "global_step": 60493, "epoch": 499} {"train_loss": -35.46438217163086, "global_step": 60494, "epoch": 499} {"train_loss": -35.8353271484375, "global_step": 60495, "epoch": 499} {"train_loss": -35.29780197143555, "global_step": 60496, "epoch": 499} {"train_loss": -35.75086212158203, "global_step": 60497, "epoch": 499} {"train_loss": -35.976280212402344, "global_step": 60498, "epoch": 499} {"train_loss": -34.182702639871394, "global_step": 60499, "epoch": 499, "val_loss": 2504152.25} {"train_loss": -35.87156295776367, "global_step": 60500, "epoch": 500} {"train_loss": -36.14382553100586, "global_step": 60501, "epoch": 500} {"train_loss": -34.89631652832031, "global_step": 60502, "epoch": 500} {"train_loss": -36.26606369018555, "global_step": 60503, "epoch": 500} {"train_loss": -36.08308029174805, "global_step": 60504, "epoch": 500} {"train_loss": -35.42964553833008, "global_step": 60505, "epoch": 500} {"train_loss": -36.01374816894531, "global_step": 60506, "epoch": 500} {"train_loss": -36.160194396972656, "global_step": 60507, "epoch": 500} {"train_loss": -35.67327880859375, "global_step": 60508, "epoch": 500} {"train_loss": -34.258392333984375, "global_step": 60509, "epoch": 500} {"train_loss": -36.178260803222656, "global_step": 60510, "epoch": 500} {"train_loss": -35.434051513671875, "global_step": 60511, "epoch": 500} {"train_loss": -36.20771789550781, "global_step": 60512, "epoch": 500} {"train_loss": -35.944679260253906, "global_step": 60513, "epoch": 500} {"train_loss": -35.23604202270508, "global_step": 60514, "epoch": 500} {"train_loss": -35.034942626953125, "global_step": 60515, "epoch": 500} {"train_loss": -35.13767623901367, "global_step": 60516, "epoch": 500} {"train_loss": -34.607330322265625, "global_step": 60517, "epoch": 500} {"train_loss": -33.97904586791992, "global_step": 60518, "epoch": 500} {"train_loss": -35.40407943725586, "global_step": 60519, "epoch": 500} {"train_loss": -35.44401168823242, "global_step": 60520, "epoch": 500} {"train_loss": -35.03197479248047, "global_step": 60521, "epoch": 500} {"train_loss": -35.58860397338867, "global_step": 60522, "epoch": 500} {"train_loss": -34.98626708984375, "global_step": 60523, "epoch": 500} {"train_loss": -33.79408264160156, "global_step": 60524, "epoch": 500} {"train_loss": -34.1246223449707, "global_step": 60525, "epoch": 500} {"train_loss": -34.7794303894043, "global_step": 60526, "epoch": 500} {"train_loss": -36.57522964477539, "global_step": 60527, "epoch": 500} {"train_loss": -33.73183059692383, "global_step": 60528, "epoch": 500} {"train_loss": -33.33097457885742, "global_step": 60529, "epoch": 500} {"train_loss": -32.82638168334961, "global_step": 60530, "epoch": 500} {"train_loss": -33.235870361328125, "global_step": 60531, "epoch": 500} {"train_loss": -35.597599029541016, "global_step": 60532, "epoch": 500} {"train_loss": -32.98290252685547, "global_step": 60533, "epoch": 500} {"train_loss": -34.631446838378906, "global_step": 60534, "epoch": 500} {"train_loss": -32.71569061279297, "global_step": 60535, "epoch": 500} {"train_loss": -34.82991409301758, "global_step": 60536, "epoch": 500} {"train_loss": -34.24678039550781, "global_step": 60537, "epoch": 500} {"train_loss": -34.012168884277344, "global_step": 60538, "epoch": 500} {"train_loss": -34.34766387939453, "global_step": 60539, "epoch": 500} {"train_loss": -35.390132904052734, "global_step": 60540, "epoch": 500} {"train_loss": -34.69286346435547, "global_step": 60541, "epoch": 500} {"train_loss": -34.509891510009766, "global_step": 60542, "epoch": 500} {"train_loss": -35.294151306152344, "global_step": 60543, "epoch": 500} {"train_loss": -35.697265625, "global_step": 60544, "epoch": 500} {"train_loss": -35.05434799194336, "global_step": 60545, "epoch": 500} {"train_loss": -35.08723068237305, "global_step": 60546, "epoch": 500} {"train_loss": -35.24713897705078, "global_step": 60547, "epoch": 500} {"train_loss": -35.34855270385742, "global_step": 60548, "epoch": 500} {"train_loss": -34.56992721557617, "global_step": 60549, "epoch": 500} {"train_loss": -34.00773239135742, "global_step": 60550, "epoch": 500} {"train_loss": -35.301387786865234, "global_step": 60551, "epoch": 500} {"train_loss": -34.91571807861328, "global_step": 60552, "epoch": 500} {"train_loss": -34.89540481567383, "global_step": 60553, "epoch": 500} {"train_loss": -35.02910232543945, "global_step": 60554, "epoch": 500} {"train_loss": -34.83934783935547, "global_step": 60555, "epoch": 500} {"train_loss": -34.73383331298828, "global_step": 60556, "epoch": 500} {"train_loss": -34.8925895690918, "global_step": 60557, "epoch": 500} {"train_loss": -34.54220199584961, "global_step": 60558, "epoch": 500} {"train_loss": -35.133697509765625, "global_step": 60559, "epoch": 500} {"train_loss": -33.68410873413086, "global_step": 60560, "epoch": 500} {"train_loss": -31.8715877532959, "global_step": 60561, "epoch": 500} {"train_loss": -28.321460723876953, "global_step": 60562, "epoch": 500} {"train_loss": -18.4547119140625, "global_step": 60563, "epoch": 500} {"train_loss": -16.72052001953125, "global_step": 60564, "epoch": 500} {"train_loss": -34.95623779296875, "global_step": 60565, "epoch": 500} {"train_loss": -24.4995174407959, "global_step": 60566, "epoch": 500} {"train_loss": -32.275230407714844, "global_step": 60567, "epoch": 500} {"train_loss": -27.682159423828125, "global_step": 60568, "epoch": 500} {"train_loss": -33.3084831237793, "global_step": 60569, "epoch": 500} {"train_loss": -28.2705078125, "global_step": 60570, "epoch": 500} {"train_loss": -34.06147384643555, "global_step": 60571, "epoch": 500} {"train_loss": -31.856414794921875, "global_step": 60572, "epoch": 500} {"train_loss": -32.02836990356445, "global_step": 60573, "epoch": 500} {"train_loss": -33.88980484008789, "global_step": 60574, "epoch": 500} {"train_loss": -33.11749267578125, "global_step": 60575, "epoch": 500} {"train_loss": -33.29254913330078, "global_step": 60576, "epoch": 500} {"train_loss": -34.58224868774414, "global_step": 60577, "epoch": 500} {"train_loss": -33.37873840332031, "global_step": 60578, "epoch": 500} {"train_loss": -33.39400863647461, "global_step": 60579, "epoch": 500} {"train_loss": -33.3779411315918, "global_step": 60580, "epoch": 500} {"train_loss": -34.299434661865234, "global_step": 60581, "epoch": 500} {"train_loss": -34.50307083129883, "global_step": 60582, "epoch": 500} {"train_loss": -34.08302688598633, "global_step": 60583, "epoch": 500} {"train_loss": -34.14190673828125, "global_step": 60584, "epoch": 500} {"train_loss": -34.64542770385742, "global_step": 60585, "epoch": 500} {"train_loss": -34.4207763671875, "global_step": 60586, "epoch": 500} {"train_loss": -34.62607192993164, "global_step": 60587, "epoch": 500} {"train_loss": -34.7047233581543, "global_step": 60588, "epoch": 500} {"train_loss": -34.70866775512695, "global_step": 60589, "epoch": 500} {"train_loss": -34.63130569458008, "global_step": 60590, "epoch": 500} {"train_loss": -34.91282653808594, "global_step": 60591, "epoch": 500} {"train_loss": -34.68893051147461, "global_step": 60592, "epoch": 500} {"train_loss": -34.86541748046875, "global_step": 60593, "epoch": 500} {"train_loss": -35.13139724731445, "global_step": 60594, "epoch": 500} {"train_loss": -35.07231521606445, "global_step": 60595, "epoch": 500} {"train_loss": -34.8714485168457, "global_step": 60596, "epoch": 500} {"train_loss": -34.522178649902344, "global_step": 60597, "epoch": 500} {"train_loss": -34.748313903808594, "global_step": 60598, "epoch": 500} {"train_loss": -35.55232238769531, "global_step": 60599, "epoch": 500} {"train_loss": -35.60099411010742, "global_step": 60600, "epoch": 500} {"train_loss": -35.01628494262695, "global_step": 60601, "epoch": 500} {"train_loss": -35.62113952636719, "global_step": 60602, "epoch": 500} {"train_loss": -35.277503967285156, "global_step": 60603, "epoch": 500} {"train_loss": -35.235530853271484, "global_step": 60604, "epoch": 500} {"train_loss": -35.317413330078125, "global_step": 60605, "epoch": 500} {"train_loss": -35.54880142211914, "global_step": 60606, "epoch": 500} {"train_loss": -35.80360794067383, "global_step": 60607, "epoch": 500} {"train_loss": -35.28231430053711, "global_step": 60608, "epoch": 500} {"train_loss": -35.53190231323242, "global_step": 60609, "epoch": 500} {"train_loss": -35.51527786254883, "global_step": 60610, "epoch": 500} {"train_loss": -35.45888900756836, "global_step": 60611, "epoch": 500} {"train_loss": -35.635169982910156, "global_step": 60612, "epoch": 500} {"train_loss": -35.113731384277344, "global_step": 60613, "epoch": 500} {"train_loss": -35.43197250366211, "global_step": 60614, "epoch": 500} {"train_loss": -35.73408889770508, "global_step": 60615, "epoch": 500} {"train_loss": -35.52253341674805, "global_step": 60616, "epoch": 500} {"train_loss": -35.30719757080078, "global_step": 60617, "epoch": 500} {"train_loss": -35.44919204711914, "global_step": 60618, "epoch": 500} {"train_loss": -35.47677230834961, "global_step": 60619, "epoch": 500} {"train_loss": -34.23895547409688, "global_step": 60620, "epoch": 500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2517439.25} {"train_loss": -35.80158615112305, "global_step": 60621, "epoch": 501} {"train_loss": -36.25826644897461, "global_step": 60622, "epoch": 501} {"train_loss": -34.49314498901367, "global_step": 60623, "epoch": 501} {"train_loss": -35.532470703125, "global_step": 60624, "epoch": 501} {"train_loss": -36.24361801147461, "global_step": 60625, "epoch": 501} {"train_loss": -35.196685791015625, "global_step": 60626, "epoch": 501} {"train_loss": -35.56411361694336, "global_step": 60627, "epoch": 501} {"train_loss": -35.24580764770508, "global_step": 60628, "epoch": 501} {"train_loss": -35.993892669677734, "global_step": 60629, "epoch": 501} {"train_loss": -35.71078109741211, "global_step": 60630, "epoch": 501} {"train_loss": -36.49937438964844, "global_step": 60631, "epoch": 501} {"train_loss": -35.76406478881836, "global_step": 60632, "epoch": 501} {"train_loss": -35.8537483215332, "global_step": 60633, "epoch": 501} {"train_loss": -35.26736831665039, "global_step": 60634, "epoch": 501} {"train_loss": -36.11576461791992, "global_step": 60635, "epoch": 501} {"train_loss": -34.92219924926758, "global_step": 60636, "epoch": 501} {"train_loss": -36.07479476928711, "global_step": 60637, "epoch": 501} {"train_loss": -36.2083854675293, "global_step": 60638, "epoch": 501} {"train_loss": -35.499332427978516, "global_step": 60639, "epoch": 501} {"train_loss": -35.70156478881836, "global_step": 60640, "epoch": 501} {"train_loss": -36.13419723510742, "global_step": 60641, "epoch": 501} {"train_loss": -35.853179931640625, "global_step": 60642, "epoch": 501} {"train_loss": -34.76319122314453, "global_step": 60643, "epoch": 501} {"train_loss": -34.58645248413086, "global_step": 60644, "epoch": 501} {"train_loss": -32.815826416015625, "global_step": 60645, "epoch": 501} {"train_loss": -31.92217445373535, "global_step": 60646, "epoch": 501} {"train_loss": -26.976531982421875, "global_step": 60647, "epoch": 501} {"train_loss": -26.310346603393555, "global_step": 60648, "epoch": 501} {"train_loss": -32.5571174621582, "global_step": 60649, "epoch": 501} {"train_loss": -29.553918838500977, "global_step": 60650, "epoch": 501} {"train_loss": -23.42669105529785, "global_step": 60651, "epoch": 501} {"train_loss": -27.416717529296875, "global_step": 60652, "epoch": 501} {"train_loss": -26.470550537109375, "global_step": 60653, "epoch": 501} {"train_loss": -30.83803367614746, "global_step": 60654, "epoch": 501} {"train_loss": -29.617212295532227, "global_step": 60655, "epoch": 501} {"train_loss": -32.55997848510742, "global_step": 60656, "epoch": 501} {"train_loss": -29.263776779174805, "global_step": 60657, "epoch": 501} {"train_loss": -34.50257110595703, "global_step": 60658, "epoch": 501} {"train_loss": -30.256986618041992, "global_step": 60659, "epoch": 501} {"train_loss": -32.994789123535156, "global_step": 60660, "epoch": 501} {"train_loss": -34.27812576293945, "global_step": 60661, "epoch": 501} {"train_loss": -32.535736083984375, "global_step": 60662, "epoch": 501} {"train_loss": -33.343135833740234, "global_step": 60663, "epoch": 501} {"train_loss": -33.47517013549805, "global_step": 60664, "epoch": 501} {"train_loss": -34.082332611083984, "global_step": 60665, "epoch": 501} {"train_loss": -34.39374923706055, "global_step": 60666, "epoch": 501} {"train_loss": -34.62372970581055, "global_step": 60667, "epoch": 501} {"train_loss": -33.97451400756836, "global_step": 60668, "epoch": 501} {"train_loss": -34.20928955078125, "global_step": 60669, "epoch": 501} {"train_loss": -34.87858200073242, "global_step": 60670, "epoch": 501} {"train_loss": -33.93204879760742, "global_step": 60671, "epoch": 501} {"train_loss": -34.383304595947266, "global_step": 60672, "epoch": 501} {"train_loss": -34.28548049926758, "global_step": 60673, "epoch": 501} {"train_loss": -33.260169982910156, "global_step": 60674, "epoch": 501} {"train_loss": -34.15135192871094, "global_step": 60675, "epoch": 501} {"train_loss": -34.0305061340332, "global_step": 60676, "epoch": 501} {"train_loss": -33.966796875, "global_step": 60677, "epoch": 501} {"train_loss": -35.22092819213867, "global_step": 60678, "epoch": 501} {"train_loss": -34.269466400146484, "global_step": 60679, "epoch": 501} {"train_loss": -34.34113693237305, "global_step": 60680, "epoch": 501} {"train_loss": -35.154090881347656, "global_step": 60681, "epoch": 501} {"train_loss": -34.69582748413086, "global_step": 60682, "epoch": 501} {"train_loss": -34.37268829345703, "global_step": 60683, "epoch": 501} {"train_loss": -34.48250198364258, "global_step": 60684, "epoch": 501} {"train_loss": -35.12522506713867, "global_step": 60685, "epoch": 501} {"train_loss": -34.6043815612793, "global_step": 60686, "epoch": 501} {"train_loss": -34.9965705871582, "global_step": 60687, "epoch": 501} {"train_loss": -35.030784606933594, "global_step": 60688, "epoch": 501} {"train_loss": -34.928199768066406, "global_step": 60689, "epoch": 501} {"train_loss": -35.45085525512695, "global_step": 60690, "epoch": 501} {"train_loss": -35.251285552978516, "global_step": 60691, "epoch": 501} {"train_loss": -35.09645080566406, "global_step": 60692, "epoch": 501} {"train_loss": -35.004554748535156, "global_step": 60693, "epoch": 501} {"train_loss": -35.06144714355469, "global_step": 60694, "epoch": 501} {"train_loss": -35.49558639526367, "global_step": 60695, "epoch": 501} {"train_loss": -35.14706039428711, "global_step": 60696, "epoch": 501} {"train_loss": -34.37055206298828, "global_step": 60697, "epoch": 501} {"train_loss": -35.02436447143555, "global_step": 60698, "epoch": 501} {"train_loss": -35.607582092285156, "global_step": 60699, "epoch": 501} {"train_loss": -35.176753997802734, "global_step": 60700, "epoch": 501} {"train_loss": -35.36079025268555, "global_step": 60701, "epoch": 501} {"train_loss": -35.143917083740234, "global_step": 60702, "epoch": 501} {"train_loss": -35.89115524291992, "global_step": 60703, "epoch": 501} {"train_loss": -34.9119987487793, "global_step": 60704, "epoch": 501} {"train_loss": -34.442298889160156, "global_step": 60705, "epoch": 501} {"train_loss": -34.708492279052734, "global_step": 60706, "epoch": 501} {"train_loss": -35.499305725097656, "global_step": 60707, "epoch": 501} {"train_loss": -35.625831604003906, "global_step": 60708, "epoch": 501} {"train_loss": -35.6498908996582, "global_step": 60709, "epoch": 501} {"train_loss": -35.31352996826172, "global_step": 60710, "epoch": 501} {"train_loss": -34.33729553222656, "global_step": 60711, "epoch": 501} {"train_loss": -36.02363204956055, "global_step": 60712, "epoch": 501} {"train_loss": -35.6656494140625, "global_step": 60713, "epoch": 501} {"train_loss": -35.34410858154297, "global_step": 60714, "epoch": 501} {"train_loss": -35.56345748901367, "global_step": 60715, "epoch": 501} {"train_loss": -34.92948532104492, "global_step": 60716, "epoch": 501} {"train_loss": -35.037384033203125, "global_step": 60717, "epoch": 501} {"train_loss": -33.30352783203125, "global_step": 60718, "epoch": 501} {"train_loss": -35.359466552734375, "global_step": 60719, "epoch": 501} {"train_loss": -34.360328674316406, "global_step": 60720, "epoch": 501} {"train_loss": -35.51206970214844, "global_step": 60721, "epoch": 501} {"train_loss": -34.02590560913086, "global_step": 60722, "epoch": 501} {"train_loss": -35.38795852661133, "global_step": 60723, "epoch": 501} {"train_loss": -34.85115432739258, "global_step": 60724, "epoch": 501} {"train_loss": -34.214698791503906, "global_step": 60725, "epoch": 501} {"train_loss": -35.16811752319336, "global_step": 60726, "epoch": 501} {"train_loss": -35.071075439453125, "global_step": 60727, "epoch": 501} {"train_loss": -35.7255744934082, "global_step": 60728, "epoch": 501} {"train_loss": -34.667724609375, "global_step": 60729, "epoch": 501} {"train_loss": -35.59031295776367, "global_step": 60730, "epoch": 501} {"train_loss": -33.40895462036133, "global_step": 60731, "epoch": 501} {"train_loss": -35.953102111816406, "global_step": 60732, "epoch": 501} {"train_loss": -34.997535705566406, "global_step": 60733, "epoch": 501} {"train_loss": -34.794925689697266, "global_step": 60734, "epoch": 501} {"train_loss": -35.60214614868164, "global_step": 60735, "epoch": 501} {"train_loss": -36.32330322265625, "global_step": 60736, "epoch": 501} {"train_loss": -35.31122589111328, "global_step": 60737, "epoch": 501} {"train_loss": -35.37493896484375, "global_step": 60738, "epoch": 501} {"train_loss": -35.09760665893555, "global_step": 60739, "epoch": 501} {"train_loss": -34.84321975708008, "global_step": 60740, "epoch": 501} {"train_loss": -34.33284062787521, "global_step": 60741, "epoch": 501, "val_loss": 2537353.75} {"train_loss": -34.47076416015625, "global_step": 60742, "epoch": 502} {"train_loss": -34.94611740112305, "global_step": 60743, "epoch": 502} {"train_loss": -35.594058990478516, "global_step": 60744, "epoch": 502} {"train_loss": -35.2979621887207, "global_step": 60745, "epoch": 502} {"train_loss": -34.89445495605469, "global_step": 60746, "epoch": 502} {"train_loss": -35.565242767333984, "global_step": 60747, "epoch": 502} {"train_loss": -35.42021942138672, "global_step": 60748, "epoch": 502} {"train_loss": -34.472686767578125, "global_step": 60749, "epoch": 502} {"train_loss": -35.680397033691406, "global_step": 60750, "epoch": 502} {"train_loss": -36.30513381958008, "global_step": 60751, "epoch": 502} {"train_loss": -34.40675735473633, "global_step": 60752, "epoch": 502} {"train_loss": -35.72581100463867, "global_step": 60753, "epoch": 502} {"train_loss": -35.656593322753906, "global_step": 60754, "epoch": 502} {"train_loss": -35.60982894897461, "global_step": 60755, "epoch": 502} {"train_loss": -34.231510162353516, "global_step": 60756, "epoch": 502} {"train_loss": -30.484302520751953, "global_step": 60757, "epoch": 502} {"train_loss": -23.908649444580078, "global_step": 60758, "epoch": 502} {"train_loss": -15.61913776397705, "global_step": 60759, "epoch": 502} {"train_loss": -22.428159713745117, "global_step": 60760, "epoch": 502} {"train_loss": -34.37984848022461, "global_step": 60761, "epoch": 502} {"train_loss": -25.07620620727539, "global_step": 60762, "epoch": 502} {"train_loss": -35.11817932128906, "global_step": 60763, "epoch": 502} {"train_loss": -29.308103561401367, "global_step": 60764, "epoch": 502} {"train_loss": -35.277713775634766, "global_step": 60765, "epoch": 502} {"train_loss": -31.3397274017334, "global_step": 60766, "epoch": 502} {"train_loss": -33.54386520385742, "global_step": 60767, "epoch": 502} {"train_loss": -33.59397888183594, "global_step": 60768, "epoch": 502} {"train_loss": -32.566497802734375, "global_step": 60769, "epoch": 502} {"train_loss": -34.96466827392578, "global_step": 60770, "epoch": 502} {"train_loss": -34.5977668762207, "global_step": 60771, "epoch": 502} {"train_loss": -33.590728759765625, "global_step": 60772, "epoch": 502} {"train_loss": -35.248477935791016, "global_step": 60773, "epoch": 502} {"train_loss": -35.282222747802734, "global_step": 60774, "epoch": 502} {"train_loss": -34.46397018432617, "global_step": 60775, "epoch": 502} {"train_loss": -34.92387008666992, "global_step": 60776, "epoch": 502} {"train_loss": -35.82955551147461, "global_step": 60777, "epoch": 502} {"train_loss": -34.382347106933594, "global_step": 60778, "epoch": 502} {"train_loss": -34.08768844604492, "global_step": 60779, "epoch": 502} {"train_loss": -35.093475341796875, "global_step": 60780, "epoch": 502} {"train_loss": -35.28003692626953, "global_step": 60781, "epoch": 502} {"train_loss": -33.994651794433594, "global_step": 60782, "epoch": 502} {"train_loss": -35.42739486694336, "global_step": 60783, "epoch": 502} {"train_loss": -35.58443069458008, "global_step": 60784, "epoch": 502} {"train_loss": -35.31891632080078, "global_step": 60785, "epoch": 502} {"train_loss": -35.4790153503418, "global_step": 60786, "epoch": 502} {"train_loss": -34.89536666870117, "global_step": 60787, "epoch": 502} {"train_loss": -35.66785430908203, "global_step": 60788, "epoch": 502} {"train_loss": -35.598358154296875, "global_step": 60789, "epoch": 502} {"train_loss": -35.60302734375, "global_step": 60790, "epoch": 502} {"train_loss": -35.76923370361328, "global_step": 60791, "epoch": 502} {"train_loss": -35.679656982421875, "global_step": 60792, "epoch": 502} {"train_loss": -35.97158432006836, "global_step": 60793, "epoch": 502} {"train_loss": -35.22214126586914, "global_step": 60794, "epoch": 502} {"train_loss": -35.42399215698242, "global_step": 60795, "epoch": 502} {"train_loss": -36.066856384277344, "global_step": 60796, "epoch": 502} {"train_loss": -35.85007858276367, "global_step": 60797, "epoch": 502} {"train_loss": -36.64129638671875, "global_step": 60798, "epoch": 502} {"train_loss": -36.013179779052734, "global_step": 60799, "epoch": 502} {"train_loss": -36.167842864990234, "global_step": 60800, "epoch": 502} {"train_loss": -36.05054473876953, "global_step": 60801, "epoch": 502} {"train_loss": -35.38261795043945, "global_step": 60802, "epoch": 502} {"train_loss": -36.32094955444336, "global_step": 60803, "epoch": 502} {"train_loss": -36.43955612182617, "global_step": 60804, "epoch": 502} {"train_loss": -36.36176300048828, "global_step": 60805, "epoch": 502} {"train_loss": -36.504058837890625, "global_step": 60806, "epoch": 502} {"train_loss": -36.4761962890625, "global_step": 60807, "epoch": 502} {"train_loss": -36.530853271484375, "global_step": 60808, "epoch": 502} {"train_loss": -36.40060043334961, "global_step": 60809, "epoch": 502} {"train_loss": -36.23630905151367, "global_step": 60810, "epoch": 502} {"train_loss": -36.595088958740234, "global_step": 60811, "epoch": 502} {"train_loss": -36.7254753112793, "global_step": 60812, "epoch": 502} {"train_loss": -36.236019134521484, "global_step": 60813, "epoch": 502} {"train_loss": -36.018253326416016, "global_step": 60814, "epoch": 502} {"train_loss": -36.368080139160156, "global_step": 60815, "epoch": 502} {"train_loss": -36.95100784301758, "global_step": 60816, "epoch": 502} {"train_loss": -36.038421630859375, "global_step": 60817, "epoch": 502} {"train_loss": -33.81543731689453, "global_step": 60818, "epoch": 502} {"train_loss": -32.60107421875, "global_step": 60819, "epoch": 502} {"train_loss": -33.154518127441406, "global_step": 60820, "epoch": 502} {"train_loss": -33.566890716552734, "global_step": 60821, "epoch": 502} {"train_loss": -34.94940948486328, "global_step": 60822, "epoch": 502} {"train_loss": -34.06447982788086, "global_step": 60823, "epoch": 502} {"train_loss": -32.72371292114258, "global_step": 60824, "epoch": 502} {"train_loss": -31.51783561706543, "global_step": 60825, "epoch": 502} {"train_loss": -31.842008590698242, "global_step": 60826, "epoch": 502} {"train_loss": -33.214229583740234, "global_step": 60827, "epoch": 502} {"train_loss": -34.780792236328125, "global_step": 60828, "epoch": 502} {"train_loss": -32.534915924072266, "global_step": 60829, "epoch": 502} {"train_loss": -32.314205169677734, "global_step": 60830, "epoch": 502} {"train_loss": -32.30984115600586, "global_step": 60831, "epoch": 502} {"train_loss": -33.363441467285156, "global_step": 60832, "epoch": 502} {"train_loss": -29.794544219970703, "global_step": 60833, "epoch": 502} {"train_loss": -33.34370040893555, "global_step": 60834, "epoch": 502} {"train_loss": -30.263864517211914, "global_step": 60835, "epoch": 502} {"train_loss": -33.257972717285156, "global_step": 60836, "epoch": 502} {"train_loss": -32.862831115722656, "global_step": 60837, "epoch": 502} {"train_loss": -33.44330596923828, "global_step": 60838, "epoch": 502} {"train_loss": -32.63372039794922, "global_step": 60839, "epoch": 502} {"train_loss": -33.47993850708008, "global_step": 60840, "epoch": 502} {"train_loss": -34.431209564208984, "global_step": 60841, "epoch": 502} {"train_loss": -33.75193405151367, "global_step": 60842, "epoch": 502} {"train_loss": -33.24880599975586, "global_step": 60843, "epoch": 502} {"train_loss": -33.03327178955078, "global_step": 60844, "epoch": 502} {"train_loss": -35.09307098388672, "global_step": 60845, "epoch": 502} {"train_loss": -34.6403923034668, "global_step": 60846, "epoch": 502} {"train_loss": -34.39553451538086, "global_step": 60847, "epoch": 502} {"train_loss": -33.64735794067383, "global_step": 60848, "epoch": 502} {"train_loss": -34.92136001586914, "global_step": 60849, "epoch": 502} {"train_loss": -34.08964157104492, "global_step": 60850, "epoch": 502} {"train_loss": -35.25885772705078, "global_step": 60851, "epoch": 502} {"train_loss": -34.45748519897461, "global_step": 60852, "epoch": 502} {"train_loss": -34.518646240234375, "global_step": 60853, "epoch": 502} {"train_loss": -34.35834884643555, "global_step": 60854, "epoch": 502} {"train_loss": -34.8167724609375, "global_step": 60855, "epoch": 502} {"train_loss": -34.38563537597656, "global_step": 60856, "epoch": 502} {"train_loss": -35.15039825439453, "global_step": 60857, "epoch": 502} {"train_loss": -34.66193771362305, "global_step": 60858, "epoch": 502} {"train_loss": -35.537899017333984, "global_step": 60859, "epoch": 502} {"train_loss": -35.11605453491211, "global_step": 60860, "epoch": 502} {"train_loss": -35.103477478027344, "global_step": 60861, "epoch": 502} {"train_loss": -34.20225497316723, "global_step": 60862, "epoch": 502, "val_loss": 2633384.25} {"train_loss": -35.15945053100586, "global_step": 60863, "epoch": 503} {"train_loss": -35.29609680175781, "global_step": 60864, "epoch": 503} {"train_loss": -35.079341888427734, "global_step": 60865, "epoch": 503} {"train_loss": -35.61940383911133, "global_step": 60866, "epoch": 503} {"train_loss": -34.560848236083984, "global_step": 60867, "epoch": 503} {"train_loss": -34.89583969116211, "global_step": 60868, "epoch": 503} {"train_loss": -34.93390655517578, "global_step": 60869, "epoch": 503} {"train_loss": -34.66875076293945, "global_step": 60870, "epoch": 503} {"train_loss": -34.66058349609375, "global_step": 60871, "epoch": 503} {"train_loss": -35.67489242553711, "global_step": 60872, "epoch": 503} {"train_loss": -35.47235870361328, "global_step": 60873, "epoch": 503} {"train_loss": -34.57574462890625, "global_step": 60874, "epoch": 503} {"train_loss": -34.90096664428711, "global_step": 60875, "epoch": 503} {"train_loss": -35.59475326538086, "global_step": 60876, "epoch": 503} {"train_loss": -35.677547454833984, "global_step": 60877, "epoch": 503} {"train_loss": -35.70069122314453, "global_step": 60878, "epoch": 503} {"train_loss": -34.987117767333984, "global_step": 60879, "epoch": 503} {"train_loss": -34.857276916503906, "global_step": 60880, "epoch": 503} {"train_loss": -35.67474365234375, "global_step": 60881, "epoch": 503} {"train_loss": -34.89229202270508, "global_step": 60882, "epoch": 503} {"train_loss": -35.27069091796875, "global_step": 60883, "epoch": 503} {"train_loss": -33.08793258666992, "global_step": 60884, "epoch": 503} {"train_loss": -35.45514678955078, "global_step": 60885, "epoch": 503} {"train_loss": -35.68727493286133, "global_step": 60886, "epoch": 503} {"train_loss": -34.35067367553711, "global_step": 60887, "epoch": 503} {"train_loss": -34.986263275146484, "global_step": 60888, "epoch": 503} {"train_loss": -34.84303665161133, "global_step": 60889, "epoch": 503} {"train_loss": -33.95869827270508, "global_step": 60890, "epoch": 503} {"train_loss": -35.51467514038086, "global_step": 60891, "epoch": 503} {"train_loss": -35.60202407836914, "global_step": 60892, "epoch": 503} {"train_loss": -33.65470886230469, "global_step": 60893, "epoch": 503} {"train_loss": -35.0753288269043, "global_step": 60894, "epoch": 503} {"train_loss": -35.27125930786133, "global_step": 60895, "epoch": 503} {"train_loss": -34.160884857177734, "global_step": 60896, "epoch": 503} {"train_loss": -35.22308349609375, "global_step": 60897, "epoch": 503} {"train_loss": -34.26393508911133, "global_step": 60898, "epoch": 503} {"train_loss": -32.98966598510742, "global_step": 60899, "epoch": 503} {"train_loss": -34.344993591308594, "global_step": 60900, "epoch": 503} {"train_loss": -34.8649787902832, "global_step": 60901, "epoch": 503} {"train_loss": -34.948516845703125, "global_step": 60902, "epoch": 503} {"train_loss": -33.65767288208008, "global_step": 60903, "epoch": 503} {"train_loss": -32.48369598388672, "global_step": 60904, "epoch": 503} {"train_loss": -31.632253646850586, "global_step": 60905, "epoch": 503} {"train_loss": -32.58967971801758, "global_step": 60906, "epoch": 503} {"train_loss": -35.353111267089844, "global_step": 60907, "epoch": 503} {"train_loss": -33.5670166015625, "global_step": 60908, "epoch": 503} {"train_loss": -32.77158737182617, "global_step": 60909, "epoch": 503} {"train_loss": -35.41252517700195, "global_step": 60910, "epoch": 503} {"train_loss": -35.24653244018555, "global_step": 60911, "epoch": 503} {"train_loss": -34.22187805175781, "global_step": 60912, "epoch": 503} {"train_loss": -34.7923698425293, "global_step": 60913, "epoch": 503} {"train_loss": -34.729427337646484, "global_step": 60914, "epoch": 503} {"train_loss": -34.537899017333984, "global_step": 60915, "epoch": 503} {"train_loss": -35.334083557128906, "global_step": 60916, "epoch": 503} {"train_loss": -34.74549865722656, "global_step": 60917, "epoch": 503} {"train_loss": -34.898468017578125, "global_step": 60918, "epoch": 503} {"train_loss": -35.34064865112305, "global_step": 60919, "epoch": 503} {"train_loss": -34.20119094848633, "global_step": 60920, "epoch": 503} {"train_loss": -35.900447845458984, "global_step": 60921, "epoch": 503} {"train_loss": -35.22663497924805, "global_step": 60922, "epoch": 503} {"train_loss": -34.76362228393555, "global_step": 60923, "epoch": 503} {"train_loss": -35.543067932128906, "global_step": 60924, "epoch": 503} {"train_loss": -34.789794921875, "global_step": 60925, "epoch": 503} {"train_loss": -35.78475570678711, "global_step": 60926, "epoch": 503} {"train_loss": -35.584716796875, "global_step": 60927, "epoch": 503} {"train_loss": -35.504737854003906, "global_step": 60928, "epoch": 503} {"train_loss": -35.842559814453125, "global_step": 60929, "epoch": 503} {"train_loss": -35.40730667114258, "global_step": 60930, "epoch": 503} {"train_loss": -35.35364532470703, "global_step": 60931, "epoch": 503} {"train_loss": -35.57585525512695, "global_step": 60932, "epoch": 503} {"train_loss": -35.752105712890625, "global_step": 60933, "epoch": 503} {"train_loss": -35.940155029296875, "global_step": 60934, "epoch": 503} {"train_loss": -35.928466796875, "global_step": 60935, "epoch": 503} {"train_loss": -36.10158920288086, "global_step": 60936, "epoch": 503} {"train_loss": -36.06624984741211, "global_step": 60937, "epoch": 503} {"train_loss": -35.64420700073242, "global_step": 60938, "epoch": 503} {"train_loss": -36.28152084350586, "global_step": 60939, "epoch": 503} {"train_loss": -35.980224609375, "global_step": 60940, "epoch": 503} {"train_loss": -36.03620147705078, "global_step": 60941, "epoch": 503} {"train_loss": -36.38357162475586, "global_step": 60942, "epoch": 503} {"train_loss": -36.42450714111328, "global_step": 60943, "epoch": 503} {"train_loss": -36.11500930786133, "global_step": 60944, "epoch": 503} {"train_loss": -35.700096130371094, "global_step": 60945, "epoch": 503} {"train_loss": -36.25115966796875, "global_step": 60946, "epoch": 503} {"train_loss": -35.0357780456543, "global_step": 60947, "epoch": 503} {"train_loss": -35.383399963378906, "global_step": 60948, "epoch": 503} {"train_loss": -36.146453857421875, "global_step": 60949, "epoch": 503} {"train_loss": -36.17159652709961, "global_step": 60950, "epoch": 503} {"train_loss": -32.7674674987793, "global_step": 60951, "epoch": 503} {"train_loss": -30.612852096557617, "global_step": 60952, "epoch": 503} {"train_loss": -30.177631378173828, "global_step": 60953, "epoch": 503} {"train_loss": -33.50517654418945, "global_step": 60954, "epoch": 503} {"train_loss": -35.77299118041992, "global_step": 60955, "epoch": 503} {"train_loss": -34.21519470214844, "global_step": 60956, "epoch": 503} {"train_loss": -31.617380142211914, "global_step": 60957, "epoch": 503} {"train_loss": -33.51121139526367, "global_step": 60958, "epoch": 503} {"train_loss": -33.36347961425781, "global_step": 60959, "epoch": 503} {"train_loss": -30.426313400268555, "global_step": 60960, "epoch": 503} {"train_loss": -33.58610153198242, "global_step": 60961, "epoch": 503} {"train_loss": -33.55720138549805, "global_step": 60962, "epoch": 503} {"train_loss": -32.388999938964844, "global_step": 60963, "epoch": 503} {"train_loss": -32.884193420410156, "global_step": 60964, "epoch": 503} {"train_loss": -30.34161376953125, "global_step": 60965, "epoch": 503} {"train_loss": -34.212982177734375, "global_step": 60966, "epoch": 503} {"train_loss": -33.83802032470703, "global_step": 60967, "epoch": 503} {"train_loss": -34.89633560180664, "global_step": 60968, "epoch": 503} {"train_loss": -33.704490661621094, "global_step": 60969, "epoch": 503} {"train_loss": -33.47919464111328, "global_step": 60970, "epoch": 503} {"train_loss": -34.982242584228516, "global_step": 60971, "epoch": 503} {"train_loss": -34.12966537475586, "global_step": 60972, "epoch": 503} {"train_loss": -33.99171447753906, "global_step": 60973, "epoch": 503} {"train_loss": -34.14919662475586, "global_step": 60974, "epoch": 503} {"train_loss": -33.09640121459961, "global_step": 60975, "epoch": 503} {"train_loss": -34.17783737182617, "global_step": 60976, "epoch": 503} {"train_loss": -33.91939926147461, "global_step": 60977, "epoch": 503} {"train_loss": -34.75700378417969, "global_step": 60978, "epoch": 503} {"train_loss": -34.32278060913086, "global_step": 60979, "epoch": 503} {"train_loss": -33.49647903442383, "global_step": 60980, "epoch": 503} {"train_loss": -34.612361907958984, "global_step": 60981, "epoch": 503} {"train_loss": -34.23796081542969, "global_step": 60982, "epoch": 503} {"train_loss": -34.60526363908752, "global_step": 60983, "epoch": 503, "val_loss": 2698857.25} {"train_loss": -32.468055725097656, "global_step": 60984, "epoch": 504} {"train_loss": -34.42226028442383, "global_step": 60985, "epoch": 504} {"train_loss": -30.361984252929688, "global_step": 60986, "epoch": 504} {"train_loss": -33.18166732788086, "global_step": 60987, "epoch": 504} {"train_loss": -34.35783386230469, "global_step": 60988, "epoch": 504} {"train_loss": -32.77325439453125, "global_step": 60989, "epoch": 504} {"train_loss": -33.37419891357422, "global_step": 60990, "epoch": 504} {"train_loss": -34.42362594604492, "global_step": 60991, "epoch": 504} {"train_loss": -34.12076187133789, "global_step": 60992, "epoch": 504} {"train_loss": -34.6062126159668, "global_step": 60993, "epoch": 504} {"train_loss": -34.1358757019043, "global_step": 60994, "epoch": 504} {"train_loss": -34.35398483276367, "global_step": 60995, "epoch": 504} {"train_loss": -33.87390899658203, "global_step": 60996, "epoch": 504} {"train_loss": -34.300819396972656, "global_step": 60997, "epoch": 504} {"train_loss": -34.900978088378906, "global_step": 60998, "epoch": 504} {"train_loss": -34.37746810913086, "global_step": 60999, "epoch": 504} {"train_loss": -35.201263427734375, "global_step": 61000, "epoch": 504} {"train_loss": -34.9157600402832, "global_step": 61001, "epoch": 504} {"train_loss": -34.86798095703125, "global_step": 61002, "epoch": 504} {"train_loss": -34.698577880859375, "global_step": 61003, "epoch": 504} {"train_loss": -33.36975860595703, "global_step": 61004, "epoch": 504} {"train_loss": -34.604270935058594, "global_step": 61005, "epoch": 504} {"train_loss": -34.254398345947266, "global_step": 61006, "epoch": 504} {"train_loss": -34.301937103271484, "global_step": 61007, "epoch": 504} {"train_loss": -35.208099365234375, "global_step": 61008, "epoch": 504} {"train_loss": -34.718379974365234, "global_step": 61009, "epoch": 504} {"train_loss": -34.714656829833984, "global_step": 61010, "epoch": 504} {"train_loss": -34.75309371948242, "global_step": 61011, "epoch": 504} {"train_loss": -34.162696838378906, "global_step": 61012, "epoch": 504} {"train_loss": -34.56075668334961, "global_step": 61013, "epoch": 504} {"train_loss": -35.062313079833984, "global_step": 61014, "epoch": 504} {"train_loss": -34.266029357910156, "global_step": 61015, "epoch": 504} {"train_loss": -35.17450714111328, "global_step": 61016, "epoch": 504} {"train_loss": -35.35856246948242, "global_step": 61017, "epoch": 504} {"train_loss": -34.39081573486328, "global_step": 61018, "epoch": 504} {"train_loss": -35.0288200378418, "global_step": 61019, "epoch": 504} {"train_loss": -34.9517707824707, "global_step": 61020, "epoch": 504} {"train_loss": -35.09557342529297, "global_step": 61021, "epoch": 504} {"train_loss": -34.647335052490234, "global_step": 61022, "epoch": 504} {"train_loss": -34.007389068603516, "global_step": 61023, "epoch": 504} {"train_loss": -34.300418853759766, "global_step": 61024, "epoch": 504} {"train_loss": -35.29917526245117, "global_step": 61025, "epoch": 504} {"train_loss": -34.91933059692383, "global_step": 61026, "epoch": 504} {"train_loss": -35.04309844970703, "global_step": 61027, "epoch": 504} {"train_loss": -35.30807876586914, "global_step": 61028, "epoch": 504} {"train_loss": -35.285797119140625, "global_step": 61029, "epoch": 504} {"train_loss": -35.68668746948242, "global_step": 61030, "epoch": 504} {"train_loss": -35.4556999206543, "global_step": 61031, "epoch": 504} {"train_loss": -35.7407341003418, "global_step": 61032, "epoch": 504} {"train_loss": -35.814266204833984, "global_step": 61033, "epoch": 504} {"train_loss": -35.40796661376953, "global_step": 61034, "epoch": 504} {"train_loss": -35.6803092956543, "global_step": 61035, "epoch": 504} {"train_loss": -36.09511184692383, "global_step": 61036, "epoch": 504} {"train_loss": -36.209999084472656, "global_step": 61037, "epoch": 504} {"train_loss": -35.80389404296875, "global_step": 61038, "epoch": 504} {"train_loss": -35.916622161865234, "global_step": 61039, "epoch": 504} {"train_loss": -36.24469757080078, "global_step": 61040, "epoch": 504} {"train_loss": -35.83608627319336, "global_step": 61041, "epoch": 504} {"train_loss": -35.2775764465332, "global_step": 61042, "epoch": 504} {"train_loss": -36.13344955444336, "global_step": 61043, "epoch": 504} {"train_loss": -36.05877685546875, "global_step": 61044, "epoch": 504} {"train_loss": -36.045021057128906, "global_step": 61045, "epoch": 504} {"train_loss": -35.72982406616211, "global_step": 61046, "epoch": 504} {"train_loss": -35.91476821899414, "global_step": 61047, "epoch": 504} {"train_loss": -35.89141082763672, "global_step": 61048, "epoch": 504} {"train_loss": -35.65289306640625, "global_step": 61049, "epoch": 504} {"train_loss": -35.15558624267578, "global_step": 61050, "epoch": 504} {"train_loss": -34.01175308227539, "global_step": 61051, "epoch": 504} {"train_loss": -32.655662536621094, "global_step": 61052, "epoch": 504} {"train_loss": -32.08877944946289, "global_step": 61053, "epoch": 504} {"train_loss": -34.39506149291992, "global_step": 61054, "epoch": 504} {"train_loss": -34.68734359741211, "global_step": 61055, "epoch": 504} {"train_loss": -35.16752243041992, "global_step": 61056, "epoch": 504} {"train_loss": -35.29045486450195, "global_step": 61057, "epoch": 504} {"train_loss": -35.12473678588867, "global_step": 61058, "epoch": 504} {"train_loss": -35.8597526550293, "global_step": 61059, "epoch": 504} {"train_loss": -36.50320053100586, "global_step": 61060, "epoch": 504} {"train_loss": -36.008399963378906, "global_step": 61061, "epoch": 504} {"train_loss": -35.758792877197266, "global_step": 61062, "epoch": 504} {"train_loss": -36.55073165893555, "global_step": 61063, "epoch": 504} {"train_loss": -36.78467559814453, "global_step": 61064, "epoch": 504} {"train_loss": -36.17591857910156, "global_step": 61065, "epoch": 504} {"train_loss": -34.850677490234375, "global_step": 61066, "epoch": 504} {"train_loss": -36.31209945678711, "global_step": 61067, "epoch": 504} {"train_loss": -35.76234817504883, "global_step": 61068, "epoch": 504} {"train_loss": -36.033321380615234, "global_step": 61069, "epoch": 504} {"train_loss": -35.863826751708984, "global_step": 61070, "epoch": 504} {"train_loss": -35.90523147583008, "global_step": 61071, "epoch": 504} {"train_loss": -35.55089569091797, "global_step": 61072, "epoch": 504} {"train_loss": -34.356964111328125, "global_step": 61073, "epoch": 504} {"train_loss": -35.546199798583984, "global_step": 61074, "epoch": 504} {"train_loss": -34.18111801147461, "global_step": 61075, "epoch": 504} {"train_loss": -35.45473861694336, "global_step": 61076, "epoch": 504} {"train_loss": -33.964900970458984, "global_step": 61077, "epoch": 504} {"train_loss": -35.27558135986328, "global_step": 61078, "epoch": 504} {"train_loss": -33.28861618041992, "global_step": 61079, "epoch": 504} {"train_loss": -30.20890235900879, "global_step": 61080, "epoch": 504} {"train_loss": -27.143112182617188, "global_step": 61081, "epoch": 504} {"train_loss": -31.80765724182129, "global_step": 61082, "epoch": 504} {"train_loss": -35.37744140625, "global_step": 61083, "epoch": 504} {"train_loss": -35.669857025146484, "global_step": 61084, "epoch": 504} {"train_loss": -33.31187057495117, "global_step": 61085, "epoch": 504} {"train_loss": -33.78190231323242, "global_step": 61086, "epoch": 504} {"train_loss": -34.4096565246582, "global_step": 61087, "epoch": 504} {"train_loss": -34.15236282348633, "global_step": 61088, "epoch": 504} {"train_loss": -30.71787452697754, "global_step": 61089, "epoch": 504} {"train_loss": -34.24177169799805, "global_step": 61090, "epoch": 504} {"train_loss": -34.182796478271484, "global_step": 61091, "epoch": 504} {"train_loss": -32.90203094482422, "global_step": 61092, "epoch": 504} {"train_loss": -33.880245208740234, "global_step": 61093, "epoch": 504} {"train_loss": -32.87214279174805, "global_step": 61094, "epoch": 504} {"train_loss": -34.175865173339844, "global_step": 61095, "epoch": 504} {"train_loss": -33.621070861816406, "global_step": 61096, "epoch": 504} {"train_loss": -33.863929748535156, "global_step": 61097, "epoch": 504} {"train_loss": -32.22117614746094, "global_step": 61098, "epoch": 504} {"train_loss": -31.896154403686523, "global_step": 61099, "epoch": 504} {"train_loss": -34.14250564575195, "global_step": 61100, "epoch": 504} {"train_loss": -33.72581100463867, "global_step": 61101, "epoch": 504} {"train_loss": -34.378509521484375, "global_step": 61102, "epoch": 504} {"train_loss": -34.10753631591797, "global_step": 61103, "epoch": 504} {"train_loss": -34.583480645802396, "global_step": 61104, "epoch": 504, "val_loss": 2628189.25} {"train_loss": -33.53791427612305, "global_step": 61105, "epoch": 505} {"train_loss": -34.772579193115234, "global_step": 61106, "epoch": 505} {"train_loss": -34.61795425415039, "global_step": 61107, "epoch": 505} {"train_loss": -33.82169723510742, "global_step": 61108, "epoch": 505} {"train_loss": -33.51179885864258, "global_step": 61109, "epoch": 505} {"train_loss": -33.79390335083008, "global_step": 61110, "epoch": 505} {"train_loss": -33.187564849853516, "global_step": 61111, "epoch": 505} {"train_loss": -34.47443389892578, "global_step": 61112, "epoch": 505} {"train_loss": -34.88111114501953, "global_step": 61113, "epoch": 505} {"train_loss": -34.87907409667969, "global_step": 61114, "epoch": 505} {"train_loss": -35.09926223754883, "global_step": 61115, "epoch": 505} {"train_loss": -34.898921966552734, "global_step": 61116, "epoch": 505} {"train_loss": -34.84332275390625, "global_step": 61117, "epoch": 505} {"train_loss": -35.273338317871094, "global_step": 61118, "epoch": 505} {"train_loss": -34.898193359375, "global_step": 61119, "epoch": 505} {"train_loss": -35.42100143432617, "global_step": 61120, "epoch": 505} {"train_loss": -35.365089416503906, "global_step": 61121, "epoch": 505} {"train_loss": -34.23994064331055, "global_step": 61122, "epoch": 505} {"train_loss": -35.2913932800293, "global_step": 61123, "epoch": 505} {"train_loss": -34.732112884521484, "global_step": 61124, "epoch": 505} {"train_loss": -35.326690673828125, "global_step": 61125, "epoch": 505} {"train_loss": -35.469661712646484, "global_step": 61126, "epoch": 505} {"train_loss": -35.50189971923828, "global_step": 61127, "epoch": 505} {"train_loss": -35.34457015991211, "global_step": 61128, "epoch": 505} {"train_loss": -35.320220947265625, "global_step": 61129, "epoch": 505} {"train_loss": -35.075355529785156, "global_step": 61130, "epoch": 505} {"train_loss": -34.27079391479492, "global_step": 61131, "epoch": 505} {"train_loss": -34.84542465209961, "global_step": 61132, "epoch": 505} {"train_loss": -34.56429672241211, "global_step": 61133, "epoch": 505} {"train_loss": -35.928524017333984, "global_step": 61134, "epoch": 505} {"train_loss": -34.75958251953125, "global_step": 61135, "epoch": 505} {"train_loss": -35.71333312988281, "global_step": 61136, "epoch": 505} {"train_loss": -35.576934814453125, "global_step": 61137, "epoch": 505} {"train_loss": -34.99992752075195, "global_step": 61138, "epoch": 505} {"train_loss": -35.466609954833984, "global_step": 61139, "epoch": 505} {"train_loss": -35.70846939086914, "global_step": 61140, "epoch": 505} {"train_loss": -35.49678421020508, "global_step": 61141, "epoch": 505} {"train_loss": -36.2661247253418, "global_step": 61142, "epoch": 505} {"train_loss": -35.763336181640625, "global_step": 61143, "epoch": 505} {"train_loss": -35.99585723876953, "global_step": 61144, "epoch": 505} {"train_loss": -35.365623474121094, "global_step": 61145, "epoch": 505} {"train_loss": -36.263126373291016, "global_step": 61146, "epoch": 505} {"train_loss": -35.94488525390625, "global_step": 61147, "epoch": 505} {"train_loss": -36.437862396240234, "global_step": 61148, "epoch": 505} {"train_loss": -35.65690231323242, "global_step": 61149, "epoch": 505} {"train_loss": -36.49956130981445, "global_step": 61150, "epoch": 505} {"train_loss": -36.19647979736328, "global_step": 61151, "epoch": 505} {"train_loss": -36.27874755859375, "global_step": 61152, "epoch": 505} {"train_loss": -35.981510162353516, "global_step": 61153, "epoch": 505} {"train_loss": -36.35649108886719, "global_step": 61154, "epoch": 505} {"train_loss": -36.47723388671875, "global_step": 61155, "epoch": 505} {"train_loss": -36.59806442260742, "global_step": 61156, "epoch": 505} {"train_loss": -36.52250289916992, "global_step": 61157, "epoch": 505} {"train_loss": -36.73472213745117, "global_step": 61158, "epoch": 505} {"train_loss": -36.544700622558594, "global_step": 61159, "epoch": 505} {"train_loss": -36.864742279052734, "global_step": 61160, "epoch": 505} {"train_loss": -36.79411697387695, "global_step": 61161, "epoch": 505} {"train_loss": -36.464473724365234, "global_step": 61162, "epoch": 505} {"train_loss": -35.67512130737305, "global_step": 61163, "epoch": 505} {"train_loss": -36.01884841918945, "global_step": 61164, "epoch": 505} {"train_loss": -36.446685791015625, "global_step": 61165, "epoch": 505} {"train_loss": -36.86179733276367, "global_step": 61166, "epoch": 505} {"train_loss": -36.50442123413086, "global_step": 61167, "epoch": 505} {"train_loss": -35.42021560668945, "global_step": 61168, "epoch": 505} {"train_loss": -33.92387008666992, "global_step": 61169, "epoch": 505} {"train_loss": -34.06342315673828, "global_step": 61170, "epoch": 505} {"train_loss": -35.88328170776367, "global_step": 61171, "epoch": 505} {"train_loss": -36.474571228027344, "global_step": 61172, "epoch": 505} {"train_loss": -36.53789138793945, "global_step": 61173, "epoch": 505} {"train_loss": -35.366127014160156, "global_step": 61174, "epoch": 505} {"train_loss": -35.09687423706055, "global_step": 61175, "epoch": 505} {"train_loss": -34.076263427734375, "global_step": 61176, "epoch": 505} {"train_loss": -36.04322052001953, "global_step": 61177, "epoch": 505} {"train_loss": -35.37406539916992, "global_step": 61178, "epoch": 505} {"train_loss": -33.66639709472656, "global_step": 61179, "epoch": 505} {"train_loss": -34.9446907043457, "global_step": 61180, "epoch": 505} {"train_loss": -36.76430130004883, "global_step": 61181, "epoch": 505} {"train_loss": -35.02896499633789, "global_step": 61182, "epoch": 505} {"train_loss": -33.45319366455078, "global_step": 61183, "epoch": 505} {"train_loss": -34.21590805053711, "global_step": 61184, "epoch": 505} {"train_loss": -34.98396682739258, "global_step": 61185, "epoch": 505} {"train_loss": -35.96086120605469, "global_step": 61186, "epoch": 505} {"train_loss": -34.1690559387207, "global_step": 61187, "epoch": 505} {"train_loss": -34.56349563598633, "global_step": 61188, "epoch": 505} {"train_loss": -35.1846809387207, "global_step": 61189, "epoch": 505} {"train_loss": -33.93870162963867, "global_step": 61190, "epoch": 505} {"train_loss": -35.27351760864258, "global_step": 61191, "epoch": 505} {"train_loss": -35.82240676879883, "global_step": 61192, "epoch": 505} {"train_loss": -35.839439392089844, "global_step": 61193, "epoch": 505} {"train_loss": -35.94418716430664, "global_step": 61194, "epoch": 505} {"train_loss": -36.064064025878906, "global_step": 61195, "epoch": 505} {"train_loss": -35.06166458129883, "global_step": 61196, "epoch": 505} {"train_loss": -35.900333404541016, "global_step": 61197, "epoch": 505} {"train_loss": -35.72227096557617, "global_step": 61198, "epoch": 505} {"train_loss": -35.70509338378906, "global_step": 61199, "epoch": 505} {"train_loss": -34.75727844238281, "global_step": 61200, "epoch": 505} {"train_loss": -36.57141876220703, "global_step": 61201, "epoch": 505} {"train_loss": -35.56093978881836, "global_step": 61202, "epoch": 505} {"train_loss": -36.13874816894531, "global_step": 61203, "epoch": 505} {"train_loss": -34.642696380615234, "global_step": 61204, "epoch": 505} {"train_loss": -35.564453125, "global_step": 61205, "epoch": 505} {"train_loss": -35.2424201965332, "global_step": 61206, "epoch": 505} {"train_loss": -34.09371566772461, "global_step": 61207, "epoch": 505} {"train_loss": -35.375831604003906, "global_step": 61208, "epoch": 505} {"train_loss": -35.74517822265625, "global_step": 61209, "epoch": 505} {"train_loss": -33.8604850769043, "global_step": 61210, "epoch": 505} {"train_loss": -34.871639251708984, "global_step": 61211, "epoch": 505} {"train_loss": -35.829498291015625, "global_step": 61212, "epoch": 505} {"train_loss": -33.96967315673828, "global_step": 61213, "epoch": 505} {"train_loss": -36.05141067504883, "global_step": 61214, "epoch": 505} {"train_loss": -35.141963958740234, "global_step": 61215, "epoch": 505} {"train_loss": -35.496337890625, "global_step": 61216, "epoch": 505} {"train_loss": -35.052120208740234, "global_step": 61217, "epoch": 505} {"train_loss": -35.45320510864258, "global_step": 61218, "epoch": 505} {"train_loss": -35.97478103637695, "global_step": 61219, "epoch": 505} {"train_loss": -35.96828842163086, "global_step": 61220, "epoch": 505} {"train_loss": -36.0162353515625, "global_step": 61221, "epoch": 505} {"train_loss": -35.73002243041992, "global_step": 61222, "epoch": 505} {"train_loss": -35.39226531982422, "global_step": 61223, "epoch": 505} {"train_loss": -35.84170150756836, "global_step": 61224, "epoch": 505} {"train_loss": -35.37453337740307, "global_step": 61225, "epoch": 505, "val_loss": 2568405.25} {"train_loss": -35.33513259887695, "global_step": 61226, "epoch": 506} {"train_loss": -35.3917236328125, "global_step": 61227, "epoch": 506} {"train_loss": -36.08323287963867, "global_step": 61228, "epoch": 506} {"train_loss": -34.71046829223633, "global_step": 61229, "epoch": 506} {"train_loss": -34.641395568847656, "global_step": 61230, "epoch": 506} {"train_loss": -34.08639144897461, "global_step": 61231, "epoch": 506} {"train_loss": -35.937835693359375, "global_step": 61232, "epoch": 506} {"train_loss": -35.80715560913086, "global_step": 61233, "epoch": 506} {"train_loss": -33.830074310302734, "global_step": 61234, "epoch": 506} {"train_loss": -35.331939697265625, "global_step": 61235, "epoch": 506} {"train_loss": -34.112525939941406, "global_step": 61236, "epoch": 506} {"train_loss": -32.96944808959961, "global_step": 61237, "epoch": 506} {"train_loss": -30.94293785095215, "global_step": 61238, "epoch": 506} {"train_loss": -32.240108489990234, "global_step": 61239, "epoch": 506} {"train_loss": -34.73590850830078, "global_step": 61240, "epoch": 506} {"train_loss": -31.822778701782227, "global_step": 61241, "epoch": 506} {"train_loss": -33.675899505615234, "global_step": 61242, "epoch": 506} {"train_loss": -33.40651321411133, "global_step": 61243, "epoch": 506} {"train_loss": -34.75461959838867, "global_step": 61244, "epoch": 506} {"train_loss": -32.002079010009766, "global_step": 61245, "epoch": 506} {"train_loss": -33.09554672241211, "global_step": 61246, "epoch": 506} {"train_loss": -35.74441146850586, "global_step": 61247, "epoch": 506} {"train_loss": -35.06892395019531, "global_step": 61248, "epoch": 506} {"train_loss": -35.11094284057617, "global_step": 61249, "epoch": 506} {"train_loss": -34.738826751708984, "global_step": 61250, "epoch": 506} {"train_loss": -34.66157150268555, "global_step": 61251, "epoch": 506} {"train_loss": -29.316858291625977, "global_step": 61252, "epoch": 506} {"train_loss": -35.635353088378906, "global_step": 61253, "epoch": 506} {"train_loss": -35.019752502441406, "global_step": 61254, "epoch": 506} {"train_loss": -34.783103942871094, "global_step": 61255, "epoch": 506} {"train_loss": -34.7305793762207, "global_step": 61256, "epoch": 506} {"train_loss": -35.052520751953125, "global_step": 61257, "epoch": 506} {"train_loss": -32.574371337890625, "global_step": 61258, "epoch": 506} {"train_loss": -31.92959976196289, "global_step": 61259, "epoch": 506} {"train_loss": -34.08329391479492, "global_step": 61260, "epoch": 506} {"train_loss": -34.871273040771484, "global_step": 61261, "epoch": 506} {"train_loss": -34.40871047973633, "global_step": 61262, "epoch": 506} {"train_loss": -35.394474029541016, "global_step": 61263, "epoch": 506} {"train_loss": -34.559608459472656, "global_step": 61264, "epoch": 506} {"train_loss": -34.966041564941406, "global_step": 61265, "epoch": 506} {"train_loss": -34.47673797607422, "global_step": 61266, "epoch": 506} {"train_loss": -32.65688705444336, "global_step": 61267, "epoch": 506} {"train_loss": -34.896724700927734, "global_step": 61268, "epoch": 506} {"train_loss": -33.60200119018555, "global_step": 61269, "epoch": 506} {"train_loss": -34.58646774291992, "global_step": 61270, "epoch": 506} {"train_loss": -34.76762008666992, "global_step": 61271, "epoch": 506} {"train_loss": -34.65199661254883, "global_step": 61272, "epoch": 506} {"train_loss": -34.53828811645508, "global_step": 61273, "epoch": 506} {"train_loss": -34.30259323120117, "global_step": 61274, "epoch": 506} {"train_loss": -34.3077278137207, "global_step": 61275, "epoch": 506} {"train_loss": -34.780086517333984, "global_step": 61276, "epoch": 506} {"train_loss": -34.17096710205078, "global_step": 61277, "epoch": 506} {"train_loss": -34.34110641479492, "global_step": 61278, "epoch": 506} {"train_loss": -33.36774826049805, "global_step": 61279, "epoch": 506} {"train_loss": -33.7428092956543, "global_step": 61280, "epoch": 506} {"train_loss": -35.54669952392578, "global_step": 61281, "epoch": 506} {"train_loss": -34.565147399902344, "global_step": 61282, "epoch": 506} {"train_loss": -34.969078063964844, "global_step": 61283, "epoch": 506} {"train_loss": -35.05489730834961, "global_step": 61284, "epoch": 506} {"train_loss": -34.013885498046875, "global_step": 61285, "epoch": 506} {"train_loss": -35.56459045410156, "global_step": 61286, "epoch": 506} {"train_loss": -33.936458587646484, "global_step": 61287, "epoch": 506} {"train_loss": -35.53487777709961, "global_step": 61288, "epoch": 506} {"train_loss": -35.81052017211914, "global_step": 61289, "epoch": 506} {"train_loss": -35.64896774291992, "global_step": 61290, "epoch": 506} {"train_loss": -34.417091369628906, "global_step": 61291, "epoch": 506} {"train_loss": -35.28766632080078, "global_step": 61292, "epoch": 506} {"train_loss": -35.14908218383789, "global_step": 61293, "epoch": 506} {"train_loss": -34.205726623535156, "global_step": 61294, "epoch": 506} {"train_loss": -34.90840148925781, "global_step": 61295, "epoch": 506} {"train_loss": -35.17552947998047, "global_step": 61296, "epoch": 506} {"train_loss": -35.369720458984375, "global_step": 61297, "epoch": 506} {"train_loss": -35.76695251464844, "global_step": 61298, "epoch": 506} {"train_loss": -35.93856430053711, "global_step": 61299, "epoch": 506} {"train_loss": -35.84322738647461, "global_step": 61300, "epoch": 506} {"train_loss": -35.65293502807617, "global_step": 61301, "epoch": 506} {"train_loss": -35.810604095458984, "global_step": 61302, "epoch": 506} {"train_loss": -34.6760368347168, "global_step": 61303, "epoch": 506} {"train_loss": -35.648536682128906, "global_step": 61304, "epoch": 506} {"train_loss": -35.80450439453125, "global_step": 61305, "epoch": 506} {"train_loss": -35.751853942871094, "global_step": 61306, "epoch": 506} {"train_loss": -35.98622131347656, "global_step": 61307, "epoch": 506} {"train_loss": -35.3577766418457, "global_step": 61308, "epoch": 506} {"train_loss": -36.285438537597656, "global_step": 61309, "epoch": 506} {"train_loss": -36.103919982910156, "global_step": 61310, "epoch": 506} {"train_loss": -35.79759979248047, "global_step": 61311, "epoch": 506} {"train_loss": -34.793880462646484, "global_step": 61312, "epoch": 506} {"train_loss": -34.48240280151367, "global_step": 61313, "epoch": 506} {"train_loss": -33.70471954345703, "global_step": 61314, "epoch": 506} {"train_loss": -35.12702178955078, "global_step": 61315, "epoch": 506} {"train_loss": -36.40754318237305, "global_step": 61316, "epoch": 506} {"train_loss": -35.96479415893555, "global_step": 61317, "epoch": 506} {"train_loss": -35.340450286865234, "global_step": 61318, "epoch": 506} {"train_loss": -35.77018356323242, "global_step": 61319, "epoch": 506} {"train_loss": -35.52570724487305, "global_step": 61320, "epoch": 506} {"train_loss": -34.32857894897461, "global_step": 61321, "epoch": 506} {"train_loss": -34.63886642456055, "global_step": 61322, "epoch": 506} {"train_loss": -34.697391510009766, "global_step": 61323, "epoch": 506} {"train_loss": -35.26691818237305, "global_step": 61324, "epoch": 506} {"train_loss": -35.38228988647461, "global_step": 61325, "epoch": 506} {"train_loss": -35.10974884033203, "global_step": 61326, "epoch": 506} {"train_loss": -34.24863052368164, "global_step": 61327, "epoch": 506} {"train_loss": -35.5161018371582, "global_step": 61328, "epoch": 506} {"train_loss": -36.484764099121094, "global_step": 61329, "epoch": 506} {"train_loss": -35.62949752807617, "global_step": 61330, "epoch": 506} {"train_loss": -35.5224723815918, "global_step": 61331, "epoch": 506} {"train_loss": -35.699790954589844, "global_step": 61332, "epoch": 506} {"train_loss": -35.668006896972656, "global_step": 61333, "epoch": 506} {"train_loss": -34.6611328125, "global_step": 61334, "epoch": 506} {"train_loss": -36.394901275634766, "global_step": 61335, "epoch": 506} {"train_loss": -36.25118637084961, "global_step": 61336, "epoch": 506} {"train_loss": -35.484920501708984, "global_step": 61337, "epoch": 506} {"train_loss": -36.381317138671875, "global_step": 61338, "epoch": 506} {"train_loss": -36.31122589111328, "global_step": 61339, "epoch": 506} {"train_loss": -36.61532211303711, "global_step": 61340, "epoch": 506} {"train_loss": -36.28278732299805, "global_step": 61341, "epoch": 506} {"train_loss": -36.608821868896484, "global_step": 61342, "epoch": 506} {"train_loss": -35.88843536376953, "global_step": 61343, "epoch": 506} {"train_loss": -35.74078369140625, "global_step": 61344, "epoch": 506} {"train_loss": -34.88213348388672, "global_step": 61345, "epoch": 506} {"train_loss": -34.87488734032497, "global_step": 61346, "epoch": 506, "val_loss": 2591523.25} {"train_loss": -36.69986343383789, "global_step": 61347, "epoch": 507} {"train_loss": -35.9195671081543, "global_step": 61348, "epoch": 507} {"train_loss": -35.743011474609375, "global_step": 61349, "epoch": 507} {"train_loss": -35.887508392333984, "global_step": 61350, "epoch": 507} {"train_loss": -36.40125274658203, "global_step": 61351, "epoch": 507} {"train_loss": -34.36553955078125, "global_step": 61352, "epoch": 507} {"train_loss": -35.06814193725586, "global_step": 61353, "epoch": 507} {"train_loss": -35.305789947509766, "global_step": 61354, "epoch": 507} {"train_loss": -34.918331146240234, "global_step": 61355, "epoch": 507} {"train_loss": -35.060115814208984, "global_step": 61356, "epoch": 507} {"train_loss": -32.980873107910156, "global_step": 61357, "epoch": 507} {"train_loss": -30.055524826049805, "global_step": 61358, "epoch": 507} {"train_loss": -20.61318016052246, "global_step": 61359, "epoch": 507} {"train_loss": -4.94373083114624, "global_step": 61360, "epoch": 507} {"train_loss": -24.38918113708496, "global_step": 61361, "epoch": 507} {"train_loss": -29.876352310180664, "global_step": 61362, "epoch": 507} {"train_loss": -21.67799949645996, "global_step": 61363, "epoch": 507} {"train_loss": -31.100500106811523, "global_step": 61364, "epoch": 507} {"train_loss": -28.0986385345459, "global_step": 61365, "epoch": 507} {"train_loss": -29.107763290405273, "global_step": 61366, "epoch": 507} {"train_loss": -34.05408477783203, "global_step": 61367, "epoch": 507} {"train_loss": -27.538883209228516, "global_step": 61368, "epoch": 507} {"train_loss": -29.802398681640625, "global_step": 61369, "epoch": 507} {"train_loss": -34.77326583862305, "global_step": 61370, "epoch": 507} {"train_loss": -30.40389060974121, "global_step": 61371, "epoch": 507} {"train_loss": -32.1290397644043, "global_step": 61372, "epoch": 507} {"train_loss": -33.55958557128906, "global_step": 61373, "epoch": 507} {"train_loss": -34.044219970703125, "global_step": 61374, "epoch": 507} {"train_loss": -33.12348556518555, "global_step": 61375, "epoch": 507} {"train_loss": -34.14377975463867, "global_step": 61376, "epoch": 507} {"train_loss": -34.49650192260742, "global_step": 61377, "epoch": 507} {"train_loss": -34.87843704223633, "global_step": 61378, "epoch": 507} {"train_loss": -34.24868392944336, "global_step": 61379, "epoch": 507} {"train_loss": -31.91572380065918, "global_step": 61380, "epoch": 507} {"train_loss": -33.35954284667969, "global_step": 61381, "epoch": 507} {"train_loss": -34.68730163574219, "global_step": 61382, "epoch": 507} {"train_loss": -34.721466064453125, "global_step": 61383, "epoch": 507} {"train_loss": -34.73707962036133, "global_step": 61384, "epoch": 507} {"train_loss": -34.857845306396484, "global_step": 61385, "epoch": 507} {"train_loss": -34.727943420410156, "global_step": 61386, "epoch": 507} {"train_loss": -35.17879867553711, "global_step": 61387, "epoch": 507} {"train_loss": -34.203514099121094, "global_step": 61388, "epoch": 507} {"train_loss": -34.63235855102539, "global_step": 61389, "epoch": 507} {"train_loss": -34.626373291015625, "global_step": 61390, "epoch": 507} {"train_loss": -35.168968200683594, "global_step": 61391, "epoch": 507} {"train_loss": -35.45136260986328, "global_step": 61392, "epoch": 507} {"train_loss": -35.21442413330078, "global_step": 61393, "epoch": 507} {"train_loss": -35.355079650878906, "global_step": 61394, "epoch": 507} {"train_loss": -35.6520881652832, "global_step": 61395, "epoch": 507} {"train_loss": -34.82906723022461, "global_step": 61396, "epoch": 507} {"train_loss": -35.57929992675781, "global_step": 61397, "epoch": 507} {"train_loss": -35.080265045166016, "global_step": 61398, "epoch": 507} {"train_loss": -35.55109786987305, "global_step": 61399, "epoch": 507} {"train_loss": -35.61525344848633, "global_step": 61400, "epoch": 507} {"train_loss": -35.752437591552734, "global_step": 61401, "epoch": 507} {"train_loss": -35.743927001953125, "global_step": 61402, "epoch": 507} {"train_loss": -35.82905197143555, "global_step": 61403, "epoch": 507} {"train_loss": -35.60432052612305, "global_step": 61404, "epoch": 507} {"train_loss": -35.47116470336914, "global_step": 61405, "epoch": 507} {"train_loss": -35.782508850097656, "global_step": 61406, "epoch": 507} {"train_loss": -34.28089141845703, "global_step": 61407, "epoch": 507} {"train_loss": -35.832923889160156, "global_step": 61408, "epoch": 507} {"train_loss": -35.694786071777344, "global_step": 61409, "epoch": 507} {"train_loss": -33.3792610168457, "global_step": 61410, "epoch": 507} {"train_loss": -31.656238555908203, "global_step": 61411, "epoch": 507} {"train_loss": -34.98914337158203, "global_step": 61412, "epoch": 507} {"train_loss": -36.28772735595703, "global_step": 61413, "epoch": 507} {"train_loss": -32.50779342651367, "global_step": 61414, "epoch": 507} {"train_loss": -34.9722900390625, "global_step": 61415, "epoch": 507} {"train_loss": -34.82351303100586, "global_step": 61416, "epoch": 507} {"train_loss": -34.06280517578125, "global_step": 61417, "epoch": 507} {"train_loss": -35.247440338134766, "global_step": 61418, "epoch": 507} {"train_loss": -34.66981506347656, "global_step": 61419, "epoch": 507} {"train_loss": -35.0451774597168, "global_step": 61420, "epoch": 507} {"train_loss": -32.71352005004883, "global_step": 61421, "epoch": 507} {"train_loss": -34.93985366821289, "global_step": 61422, "epoch": 507} {"train_loss": -30.176305770874023, "global_step": 61423, "epoch": 507} {"train_loss": -33.1922721862793, "global_step": 61424, "epoch": 507} {"train_loss": -33.35063552856445, "global_step": 61425, "epoch": 507} {"train_loss": -30.822021484375, "global_step": 61426, "epoch": 507} {"train_loss": -32.06478500366211, "global_step": 61427, "epoch": 507} {"train_loss": -33.6406364440918, "global_step": 61428, "epoch": 507} {"train_loss": -35.13759994506836, "global_step": 61429, "epoch": 507} {"train_loss": -34.99176788330078, "global_step": 61430, "epoch": 507} {"train_loss": -33.63147735595703, "global_step": 61431, "epoch": 507} {"train_loss": -32.93250274658203, "global_step": 61432, "epoch": 507} {"train_loss": -34.08588409423828, "global_step": 61433, "epoch": 507} {"train_loss": -33.914825439453125, "global_step": 61434, "epoch": 507} {"train_loss": -32.02784729003906, "global_step": 61435, "epoch": 507} {"train_loss": -33.87759017944336, "global_step": 61436, "epoch": 507} {"train_loss": -34.615333557128906, "global_step": 61437, "epoch": 507} {"train_loss": -35.10459518432617, "global_step": 61438, "epoch": 507} {"train_loss": -34.686500549316406, "global_step": 61439, "epoch": 507} {"train_loss": -35.001033782958984, "global_step": 61440, "epoch": 507} {"train_loss": -34.51949691772461, "global_step": 61441, "epoch": 507} {"train_loss": -34.6030387878418, "global_step": 61442, "epoch": 507} {"train_loss": -34.19063949584961, "global_step": 61443, "epoch": 507} {"train_loss": -34.70862579345703, "global_step": 61444, "epoch": 507} {"train_loss": -35.3729362487793, "global_step": 61445, "epoch": 507} {"train_loss": -34.494869232177734, "global_step": 61446, "epoch": 507} {"train_loss": -34.381954193115234, "global_step": 61447, "epoch": 507} {"train_loss": -34.871551513671875, "global_step": 61448, "epoch": 507} {"train_loss": -34.69910430908203, "global_step": 61449, "epoch": 507} {"train_loss": -34.26013946533203, "global_step": 61450, "epoch": 507} {"train_loss": -35.00075149536133, "global_step": 61451, "epoch": 507} {"train_loss": -34.34124755859375, "global_step": 61452, "epoch": 507} {"train_loss": -33.779075622558594, "global_step": 61453, "epoch": 507} {"train_loss": -34.46110153198242, "global_step": 61454, "epoch": 507} {"train_loss": -33.853370666503906, "global_step": 61455, "epoch": 507} {"train_loss": -34.67305374145508, "global_step": 61456, "epoch": 507} {"train_loss": -35.154903411865234, "global_step": 61457, "epoch": 507} {"train_loss": -34.557613372802734, "global_step": 61458, "epoch": 507} {"train_loss": -35.23616027832031, "global_step": 61459, "epoch": 507} {"train_loss": -35.129085540771484, "global_step": 61460, "epoch": 507} {"train_loss": -34.70574951171875, "global_step": 61461, "epoch": 507} {"train_loss": -35.5879020690918, "global_step": 61462, "epoch": 507} {"train_loss": -35.43885803222656, "global_step": 61463, "epoch": 507} {"train_loss": -35.54287338256836, "global_step": 61464, "epoch": 507} {"train_loss": -34.418800354003906, "global_step": 61465, "epoch": 507} {"train_loss": -33.729896545410156, "global_step": 61466, "epoch": 507} {"train_loss": -33.645933951228116, "global_step": 61467, "epoch": 507, "val_loss": 2604204.0} {"train_loss": -34.998695373535156, "global_step": 61468, "epoch": 508} {"train_loss": -34.32219696044922, "global_step": 61469, "epoch": 508} {"train_loss": -34.9644889831543, "global_step": 61470, "epoch": 508} {"train_loss": -35.30939865112305, "global_step": 61471, "epoch": 508} {"train_loss": -35.55732345581055, "global_step": 61472, "epoch": 508} {"train_loss": -35.95960235595703, "global_step": 61473, "epoch": 508} {"train_loss": -35.80419158935547, "global_step": 61474, "epoch": 508} {"train_loss": -36.03703308105469, "global_step": 61475, "epoch": 508} {"train_loss": -33.720367431640625, "global_step": 61476, "epoch": 508} {"train_loss": -35.067230224609375, "global_step": 61477, "epoch": 508} {"train_loss": -35.451663970947266, "global_step": 61478, "epoch": 508} {"train_loss": -35.69060134887695, "global_step": 61479, "epoch": 508} {"train_loss": -35.784034729003906, "global_step": 61480, "epoch": 508} {"train_loss": -35.92391586303711, "global_step": 61481, "epoch": 508} {"train_loss": -35.78410720825195, "global_step": 61482, "epoch": 508} {"train_loss": -35.81284713745117, "global_step": 61483, "epoch": 508} {"train_loss": -35.05085372924805, "global_step": 61484, "epoch": 508} {"train_loss": -35.00126647949219, "global_step": 61485, "epoch": 508} {"train_loss": -35.17537307739258, "global_step": 61486, "epoch": 508} {"train_loss": -35.75428009033203, "global_step": 61487, "epoch": 508} {"train_loss": -35.73894119262695, "global_step": 61488, "epoch": 508} {"train_loss": -35.056915283203125, "global_step": 61489, "epoch": 508} {"train_loss": -35.70353317260742, "global_step": 61490, "epoch": 508} {"train_loss": -35.54311752319336, "global_step": 61491, "epoch": 508} {"train_loss": -35.70938491821289, "global_step": 61492, "epoch": 508} {"train_loss": -34.01316452026367, "global_step": 61493, "epoch": 508} {"train_loss": -32.995697021484375, "global_step": 61494, "epoch": 508} {"train_loss": -30.158262252807617, "global_step": 61495, "epoch": 508} {"train_loss": -25.449260711669922, "global_step": 61496, "epoch": 508} {"train_loss": -22.00672721862793, "global_step": 61497, "epoch": 508} {"train_loss": -20.81009292602539, "global_step": 61498, "epoch": 508} {"train_loss": -31.735462188720703, "global_step": 61499, "epoch": 508} {"train_loss": -32.8404541015625, "global_step": 61500, "epoch": 508} {"train_loss": -29.511072158813477, "global_step": 61501, "epoch": 508} {"train_loss": -34.32597732543945, "global_step": 61502, "epoch": 508} {"train_loss": -32.94502639770508, "global_step": 61503, "epoch": 508} {"train_loss": -33.81932830810547, "global_step": 61504, "epoch": 508} {"train_loss": -33.50031280517578, "global_step": 61505, "epoch": 508} {"train_loss": -33.84086227416992, "global_step": 61506, "epoch": 508} {"train_loss": -35.019126892089844, "global_step": 61507, "epoch": 508} {"train_loss": -34.04322052001953, "global_step": 61508, "epoch": 508} {"train_loss": -35.11812210083008, "global_step": 61509, "epoch": 508} {"train_loss": -34.651336669921875, "global_step": 61510, "epoch": 508} {"train_loss": -34.659523010253906, "global_step": 61511, "epoch": 508} {"train_loss": -35.136295318603516, "global_step": 61512, "epoch": 508} {"train_loss": -35.30320358276367, "global_step": 61513, "epoch": 508} {"train_loss": -34.24824142456055, "global_step": 61514, "epoch": 508} {"train_loss": -34.604156494140625, "global_step": 61515, "epoch": 508} {"train_loss": -35.014564514160156, "global_step": 61516, "epoch": 508} {"train_loss": -34.975826263427734, "global_step": 61517, "epoch": 508} {"train_loss": -35.6223030090332, "global_step": 61518, "epoch": 508} {"train_loss": -35.64374542236328, "global_step": 61519, "epoch": 508} {"train_loss": -34.90960693359375, "global_step": 61520, "epoch": 508} {"train_loss": -35.02192687988281, "global_step": 61521, "epoch": 508} {"train_loss": -35.50556564331055, "global_step": 61522, "epoch": 508} {"train_loss": -35.69608688354492, "global_step": 61523, "epoch": 508} {"train_loss": -35.6119384765625, "global_step": 61524, "epoch": 508} {"train_loss": -35.835445404052734, "global_step": 61525, "epoch": 508} {"train_loss": -35.17820739746094, "global_step": 61526, "epoch": 508} {"train_loss": -35.58756637573242, "global_step": 61527, "epoch": 508} {"train_loss": -35.34423065185547, "global_step": 61528, "epoch": 508} {"train_loss": -35.44733810424805, "global_step": 61529, "epoch": 508} {"train_loss": -35.98208236694336, "global_step": 61530, "epoch": 508} {"train_loss": -35.98234939575195, "global_step": 61531, "epoch": 508} {"train_loss": -35.655818939208984, "global_step": 61532, "epoch": 508} {"train_loss": -36.11814498901367, "global_step": 61533, "epoch": 508} {"train_loss": -35.872188568115234, "global_step": 61534, "epoch": 508} {"train_loss": -36.16170120239258, "global_step": 61535, "epoch": 508} {"train_loss": -36.31710433959961, "global_step": 61536, "epoch": 508} {"train_loss": -36.07416915893555, "global_step": 61537, "epoch": 508} {"train_loss": -34.90436935424805, "global_step": 61538, "epoch": 508} {"train_loss": -36.35605239868164, "global_step": 61539, "epoch": 508} {"train_loss": -35.92379379272461, "global_step": 61540, "epoch": 508} {"train_loss": -36.20478439331055, "global_step": 61541, "epoch": 508} {"train_loss": -35.97077941894531, "global_step": 61542, "epoch": 508} {"train_loss": -36.07234573364258, "global_step": 61543, "epoch": 508} {"train_loss": -35.1939811706543, "global_step": 61544, "epoch": 508} {"train_loss": -36.03237533569336, "global_step": 61545, "epoch": 508} {"train_loss": -35.97419357299805, "global_step": 61546, "epoch": 508} {"train_loss": -35.428558349609375, "global_step": 61547, "epoch": 508} {"train_loss": -35.285400390625, "global_step": 61548, "epoch": 508} {"train_loss": -35.78685760498047, "global_step": 61549, "epoch": 508} {"train_loss": -34.67156219482422, "global_step": 61550, "epoch": 508} {"train_loss": -35.39617919921875, "global_step": 61551, "epoch": 508} {"train_loss": -34.158634185791016, "global_step": 61552, "epoch": 508} {"train_loss": -33.75370407104492, "global_step": 61553, "epoch": 508} {"train_loss": -32.63755416870117, "global_step": 61554, "epoch": 508} {"train_loss": -34.56734085083008, "global_step": 61555, "epoch": 508} {"train_loss": -32.80147171020508, "global_step": 61556, "epoch": 508} {"train_loss": -33.91658020019531, "global_step": 61557, "epoch": 508} {"train_loss": -33.20589828491211, "global_step": 61558, "epoch": 508} {"train_loss": -33.95246505737305, "global_step": 61559, "epoch": 508} {"train_loss": -33.12858200073242, "global_step": 61560, "epoch": 508} {"train_loss": -33.75404357910156, "global_step": 61561, "epoch": 508} {"train_loss": -34.165645599365234, "global_step": 61562, "epoch": 508} {"train_loss": -34.41428756713867, "global_step": 61563, "epoch": 508} {"train_loss": -34.36599349975586, "global_step": 61564, "epoch": 508} {"train_loss": -34.993804931640625, "global_step": 61565, "epoch": 508} {"train_loss": -34.2552604675293, "global_step": 61566, "epoch": 508} {"train_loss": -33.94203567504883, "global_step": 61567, "epoch": 508} {"train_loss": -32.801265716552734, "global_step": 61568, "epoch": 508} {"train_loss": -34.83785629272461, "global_step": 61569, "epoch": 508} {"train_loss": -35.230220794677734, "global_step": 61570, "epoch": 508} {"train_loss": -35.245697021484375, "global_step": 61571, "epoch": 508} {"train_loss": -35.33372497558594, "global_step": 61572, "epoch": 508} {"train_loss": -35.01553726196289, "global_step": 61573, "epoch": 508} {"train_loss": -33.643096923828125, "global_step": 61574, "epoch": 508} {"train_loss": -34.577728271484375, "global_step": 61575, "epoch": 508} {"train_loss": -35.5036506652832, "global_step": 61576, "epoch": 508} {"train_loss": -34.62677001953125, "global_step": 61577, "epoch": 508} {"train_loss": -35.11434555053711, "global_step": 61578, "epoch": 508} {"train_loss": -34.67974853515625, "global_step": 61579, "epoch": 508} {"train_loss": -35.27580261230469, "global_step": 61580, "epoch": 508} {"train_loss": -35.19706726074219, "global_step": 61581, "epoch": 508} {"train_loss": -35.16482925415039, "global_step": 61582, "epoch": 508} {"train_loss": -35.05173873901367, "global_step": 61583, "epoch": 508} {"train_loss": -35.113101959228516, "global_step": 61584, "epoch": 508} {"train_loss": -35.78011703491211, "global_step": 61585, "epoch": 508} {"train_loss": -33.74592590332031, "global_step": 61586, "epoch": 508} {"train_loss": -35.42563247680664, "global_step": 61587, "epoch": 508} {"train_loss": -34.55774141737252, "global_step": 61588, "epoch": 508, "val_loss": 2560046.75} {"train_loss": -35.368133544921875, "global_step": 61589, "epoch": 509} {"train_loss": -33.149600982666016, "global_step": 61590, "epoch": 509} {"train_loss": -34.600704193115234, "global_step": 61591, "epoch": 509} {"train_loss": -34.380367279052734, "global_step": 61592, "epoch": 509} {"train_loss": -35.914581298828125, "global_step": 61593, "epoch": 509} {"train_loss": -34.46602249145508, "global_step": 61594, "epoch": 509} {"train_loss": -34.994667053222656, "global_step": 61595, "epoch": 509} {"train_loss": -34.18049240112305, "global_step": 61596, "epoch": 509} {"train_loss": -35.16086959838867, "global_step": 61597, "epoch": 509} {"train_loss": -35.07242202758789, "global_step": 61598, "epoch": 509} {"train_loss": -35.01544952392578, "global_step": 61599, "epoch": 509} {"train_loss": -34.93098068237305, "global_step": 61600, "epoch": 509} {"train_loss": -34.23868942260742, "global_step": 61601, "epoch": 509} {"train_loss": -35.220916748046875, "global_step": 61602, "epoch": 509} {"train_loss": -34.60334777832031, "global_step": 61603, "epoch": 509} {"train_loss": -32.966426849365234, "global_step": 61604, "epoch": 509} {"train_loss": -35.9181022644043, "global_step": 61605, "epoch": 509} {"train_loss": -35.03445053100586, "global_step": 61606, "epoch": 509} {"train_loss": -34.63574981689453, "global_step": 61607, "epoch": 509} {"train_loss": -35.20158767700195, "global_step": 61608, "epoch": 509} {"train_loss": -33.96915817260742, "global_step": 61609, "epoch": 509} {"train_loss": -34.72832107543945, "global_step": 61610, "epoch": 509} {"train_loss": -35.252784729003906, "global_step": 61611, "epoch": 509} {"train_loss": -35.73921203613281, "global_step": 61612, "epoch": 509} {"train_loss": -34.93156051635742, "global_step": 61613, "epoch": 509} {"train_loss": -34.685935974121094, "global_step": 61614, "epoch": 509} {"train_loss": -34.4065055847168, "global_step": 61615, "epoch": 509} {"train_loss": -35.09687423706055, "global_step": 61616, "epoch": 509} {"train_loss": -35.724365234375, "global_step": 61617, "epoch": 509} {"train_loss": -35.5146484375, "global_step": 61618, "epoch": 509} {"train_loss": -34.423431396484375, "global_step": 61619, "epoch": 509} {"train_loss": -34.85260009765625, "global_step": 61620, "epoch": 509} {"train_loss": -34.843624114990234, "global_step": 61621, "epoch": 509} {"train_loss": -35.266902923583984, "global_step": 61622, "epoch": 509} {"train_loss": -35.51323699951172, "global_step": 61623, "epoch": 509} {"train_loss": -35.521087646484375, "global_step": 61624, "epoch": 509} {"train_loss": -34.947845458984375, "global_step": 61625, "epoch": 509} {"train_loss": -34.43751907348633, "global_step": 61626, "epoch": 509} {"train_loss": -35.75334930419922, "global_step": 61627, "epoch": 509} {"train_loss": -34.436607360839844, "global_step": 61628, "epoch": 509} {"train_loss": -35.372310638427734, "global_step": 61629, "epoch": 509} {"train_loss": -35.249385833740234, "global_step": 61630, "epoch": 509} {"train_loss": -34.49970626831055, "global_step": 61631, "epoch": 509} {"train_loss": -34.70012283325195, "global_step": 61632, "epoch": 509} {"train_loss": -34.968257904052734, "global_step": 61633, "epoch": 509} {"train_loss": -35.30513381958008, "global_step": 61634, "epoch": 509} {"train_loss": -34.717926025390625, "global_step": 61635, "epoch": 509} {"train_loss": -33.77805709838867, "global_step": 61636, "epoch": 509} {"train_loss": -33.646324157714844, "global_step": 61637, "epoch": 509} {"train_loss": -34.66899108886719, "global_step": 61638, "epoch": 509} {"train_loss": -35.675384521484375, "global_step": 61639, "epoch": 509} {"train_loss": -35.212135314941406, "global_step": 61640, "epoch": 509} {"train_loss": -34.621063232421875, "global_step": 61641, "epoch": 509} {"train_loss": -34.57113265991211, "global_step": 61642, "epoch": 509} {"train_loss": -34.66762924194336, "global_step": 61643, "epoch": 509} {"train_loss": -34.38671112060547, "global_step": 61644, "epoch": 509} {"train_loss": -35.77248764038086, "global_step": 61645, "epoch": 509} {"train_loss": -35.44950866699219, "global_step": 61646, "epoch": 509} {"train_loss": -35.83632278442383, "global_step": 61647, "epoch": 509} {"train_loss": -35.39221954345703, "global_step": 61648, "epoch": 509} {"train_loss": -35.9434700012207, "global_step": 61649, "epoch": 509} {"train_loss": -36.168453216552734, "global_step": 61650, "epoch": 509} {"train_loss": -35.5734977722168, "global_step": 61651, "epoch": 509} {"train_loss": -35.3834228515625, "global_step": 61652, "epoch": 509} {"train_loss": -35.972572326660156, "global_step": 61653, "epoch": 509} {"train_loss": -36.072872161865234, "global_step": 61654, "epoch": 509} {"train_loss": -36.210575103759766, "global_step": 61655, "epoch": 509} {"train_loss": -36.05000686645508, "global_step": 61656, "epoch": 509} {"train_loss": -36.68110656738281, "global_step": 61657, "epoch": 509} {"train_loss": -36.61809158325195, "global_step": 61658, "epoch": 509} {"train_loss": -36.36556625366211, "global_step": 61659, "epoch": 509} {"train_loss": -36.333621978759766, "global_step": 61660, "epoch": 509} {"train_loss": -35.80146408081055, "global_step": 61661, "epoch": 509} {"train_loss": -36.62449264526367, "global_step": 61662, "epoch": 509} {"train_loss": -36.482662200927734, "global_step": 61663, "epoch": 509} {"train_loss": -36.23736572265625, "global_step": 61664, "epoch": 509} {"train_loss": -36.39907455444336, "global_step": 61665, "epoch": 509} {"train_loss": -35.39387893676758, "global_step": 61666, "epoch": 509} {"train_loss": -36.10026931762695, "global_step": 61667, "epoch": 509} {"train_loss": -35.3878173828125, "global_step": 61668, "epoch": 509} {"train_loss": -35.601043701171875, "global_step": 61669, "epoch": 509} {"train_loss": -36.083309173583984, "global_step": 61670, "epoch": 509} {"train_loss": -36.1896858215332, "global_step": 61671, "epoch": 509} {"train_loss": -36.559749603271484, "global_step": 61672, "epoch": 509} {"train_loss": -34.649658203125, "global_step": 61673, "epoch": 509} {"train_loss": -36.02227783203125, "global_step": 61674, "epoch": 509} {"train_loss": -36.65278244018555, "global_step": 61675, "epoch": 509} {"train_loss": -36.20859146118164, "global_step": 61676, "epoch": 509} {"train_loss": -36.70028305053711, "global_step": 61677, "epoch": 509} {"train_loss": -35.945640563964844, "global_step": 61678, "epoch": 509} {"train_loss": -36.17100143432617, "global_step": 61679, "epoch": 509} {"train_loss": -34.479103088378906, "global_step": 61680, "epoch": 509} {"train_loss": -36.13662338256836, "global_step": 61681, "epoch": 509} {"train_loss": -36.98284149169922, "global_step": 61682, "epoch": 509} {"train_loss": -36.21176528930664, "global_step": 61683, "epoch": 509} {"train_loss": -36.192291259765625, "global_step": 61684, "epoch": 509} {"train_loss": -35.993553161621094, "global_step": 61685, "epoch": 509} {"train_loss": -36.24601364135742, "global_step": 61686, "epoch": 509} {"train_loss": -35.838714599609375, "global_step": 61687, "epoch": 509} {"train_loss": -35.6738395690918, "global_step": 61688, "epoch": 509} {"train_loss": -31.44532585144043, "global_step": 61689, "epoch": 509} {"train_loss": -35.00396728515625, "global_step": 61690, "epoch": 509} {"train_loss": -35.02396774291992, "global_step": 61691, "epoch": 509} {"train_loss": -32.37382888793945, "global_step": 61692, "epoch": 509} {"train_loss": -32.94923782348633, "global_step": 61693, "epoch": 509} {"train_loss": -34.24504470825195, "global_step": 61694, "epoch": 509} {"train_loss": -32.42290496826172, "global_step": 61695, "epoch": 509} {"train_loss": -33.328861236572266, "global_step": 61696, "epoch": 509} {"train_loss": -32.840309143066406, "global_step": 61697, "epoch": 509} {"train_loss": -31.22706413269043, "global_step": 61698, "epoch": 509} {"train_loss": -32.40633010864258, "global_step": 61699, "epoch": 509} {"train_loss": -32.536800384521484, "global_step": 61700, "epoch": 509} {"train_loss": -34.24861145019531, "global_step": 61701, "epoch": 509} {"train_loss": -32.09138870239258, "global_step": 61702, "epoch": 509} {"train_loss": -32.478633880615234, "global_step": 61703, "epoch": 509} {"train_loss": -33.0880012512207, "global_step": 61704, "epoch": 509} {"train_loss": -33.124359130859375, "global_step": 61705, "epoch": 509} {"train_loss": -34.29706573486328, "global_step": 61706, "epoch": 509} {"train_loss": -34.10636901855469, "global_step": 61707, "epoch": 509} {"train_loss": -30.799890518188477, "global_step": 61708, "epoch": 509} {"train_loss": -34.94670021435446, "global_step": 61709, "epoch": 509, "val_loss": 2610485.75} {"train_loss": -33.68232345581055, "global_step": 61710, "epoch": 510} {"train_loss": -32.08409881591797, "global_step": 61711, "epoch": 510} {"train_loss": -33.083580017089844, "global_step": 61712, "epoch": 510} {"train_loss": -33.41032028198242, "global_step": 61713, "epoch": 510} {"train_loss": -33.87723159790039, "global_step": 61714, "epoch": 510} {"train_loss": -32.340877532958984, "global_step": 61715, "epoch": 510} {"train_loss": -34.73563766479492, "global_step": 61716, "epoch": 510} {"train_loss": -32.77560043334961, "global_step": 61717, "epoch": 510} {"train_loss": -34.157100677490234, "global_step": 61718, "epoch": 510} {"train_loss": -34.32784652709961, "global_step": 61719, "epoch": 510} {"train_loss": -34.316444396972656, "global_step": 61720, "epoch": 510} {"train_loss": -34.27916717529297, "global_step": 61721, "epoch": 510} {"train_loss": -34.406490325927734, "global_step": 61722, "epoch": 510} {"train_loss": -35.004188537597656, "global_step": 61723, "epoch": 510} {"train_loss": -34.59806442260742, "global_step": 61724, "epoch": 510} {"train_loss": -34.76193618774414, "global_step": 61725, "epoch": 510} {"train_loss": -34.50302505493164, "global_step": 61726, "epoch": 510} {"train_loss": -35.5881462097168, "global_step": 61727, "epoch": 510} {"train_loss": -34.583919525146484, "global_step": 61728, "epoch": 510} {"train_loss": -35.34695053100586, "global_step": 61729, "epoch": 510} {"train_loss": -35.07949447631836, "global_step": 61730, "epoch": 510} {"train_loss": -35.419044494628906, "global_step": 61731, "epoch": 510} {"train_loss": -35.10285568237305, "global_step": 61732, "epoch": 510} {"train_loss": -35.46267318725586, "global_step": 61733, "epoch": 510} {"train_loss": -35.504634857177734, "global_step": 61734, "epoch": 510} {"train_loss": -35.66572952270508, "global_step": 61735, "epoch": 510} {"train_loss": -35.52629470825195, "global_step": 61736, "epoch": 510} {"train_loss": -35.426841735839844, "global_step": 61737, "epoch": 510} {"train_loss": -35.980220794677734, "global_step": 61738, "epoch": 510} {"train_loss": -35.966522216796875, "global_step": 61739, "epoch": 510} {"train_loss": -36.08824157714844, "global_step": 61740, "epoch": 510} {"train_loss": -36.15102005004883, "global_step": 61741, "epoch": 510} {"train_loss": -35.714847564697266, "global_step": 61742, "epoch": 510} {"train_loss": -36.082157135009766, "global_step": 61743, "epoch": 510} {"train_loss": -36.010494232177734, "global_step": 61744, "epoch": 510} {"train_loss": -35.82207107543945, "global_step": 61745, "epoch": 510} {"train_loss": -36.0327262878418, "global_step": 61746, "epoch": 510} {"train_loss": -36.170562744140625, "global_step": 61747, "epoch": 510} {"train_loss": -36.36434555053711, "global_step": 61748, "epoch": 510} {"train_loss": -36.28602981567383, "global_step": 61749, "epoch": 510} {"train_loss": -36.30100631713867, "global_step": 61750, "epoch": 510} {"train_loss": -35.901851654052734, "global_step": 61751, "epoch": 510} {"train_loss": -36.7599983215332, "global_step": 61752, "epoch": 510} {"train_loss": -36.28425216674805, "global_step": 61753, "epoch": 510} {"train_loss": -36.4107666015625, "global_step": 61754, "epoch": 510} {"train_loss": -36.350830078125, "global_step": 61755, "epoch": 510} {"train_loss": -36.57012939453125, "global_step": 61756, "epoch": 510} {"train_loss": -36.64310073852539, "global_step": 61757, "epoch": 510} {"train_loss": -36.0332145690918, "global_step": 61758, "epoch": 510} {"train_loss": -36.84296798706055, "global_step": 61759, "epoch": 510} {"train_loss": -36.60019302368164, "global_step": 61760, "epoch": 510} {"train_loss": -36.076995849609375, "global_step": 61761, "epoch": 510} {"train_loss": -36.75374984741211, "global_step": 61762, "epoch": 510} {"train_loss": -36.548439025878906, "global_step": 61763, "epoch": 510} {"train_loss": -36.63834762573242, "global_step": 61764, "epoch": 510} {"train_loss": -36.5175666809082, "global_step": 61765, "epoch": 510} {"train_loss": -36.11165237426758, "global_step": 61766, "epoch": 510} {"train_loss": -34.7403564453125, "global_step": 61767, "epoch": 510} {"train_loss": -35.414947509765625, "global_step": 61768, "epoch": 510} {"train_loss": -35.2033576965332, "global_step": 61769, "epoch": 510} {"train_loss": -36.0309944152832, "global_step": 61770, "epoch": 510} {"train_loss": -36.61983871459961, "global_step": 61771, "epoch": 510} {"train_loss": -35.804359436035156, "global_step": 61772, "epoch": 510} {"train_loss": -35.391876220703125, "global_step": 61773, "epoch": 510} {"train_loss": -34.924720764160156, "global_step": 61774, "epoch": 510} {"train_loss": -35.15655517578125, "global_step": 61775, "epoch": 510} {"train_loss": -35.95078659057617, "global_step": 61776, "epoch": 510} {"train_loss": -35.74428939819336, "global_step": 61777, "epoch": 510} {"train_loss": -36.42799758911133, "global_step": 61778, "epoch": 510} {"train_loss": -36.448097229003906, "global_step": 61779, "epoch": 510} {"train_loss": -36.66919708251953, "global_step": 61780, "epoch": 510} {"train_loss": -36.628204345703125, "global_step": 61781, "epoch": 510} {"train_loss": -36.167537689208984, "global_step": 61782, "epoch": 510} {"train_loss": -36.15863800048828, "global_step": 61783, "epoch": 510} {"train_loss": -35.62260055541992, "global_step": 61784, "epoch": 510} {"train_loss": -35.6338996887207, "global_step": 61785, "epoch": 510} {"train_loss": -36.3800048828125, "global_step": 61786, "epoch": 510} {"train_loss": -36.6622200012207, "global_step": 61787, "epoch": 510} {"train_loss": -35.78738021850586, "global_step": 61788, "epoch": 510} {"train_loss": -36.81887435913086, "global_step": 61789, "epoch": 510} {"train_loss": -36.05678176879883, "global_step": 61790, "epoch": 510} {"train_loss": -36.3792610168457, "global_step": 61791, "epoch": 510} {"train_loss": -36.60299301147461, "global_step": 61792, "epoch": 510} {"train_loss": -35.323387145996094, "global_step": 61793, "epoch": 510} {"train_loss": -33.94178771972656, "global_step": 61794, "epoch": 510} {"train_loss": -33.849281311035156, "global_step": 61795, "epoch": 510} {"train_loss": -32.53757858276367, "global_step": 61796, "epoch": 510} {"train_loss": -33.28826904296875, "global_step": 61797, "epoch": 510} {"train_loss": -35.4614372253418, "global_step": 61798, "epoch": 510} {"train_loss": -33.896053314208984, "global_step": 61799, "epoch": 510} {"train_loss": -34.728729248046875, "global_step": 61800, "epoch": 510} {"train_loss": -32.85884094238281, "global_step": 61801, "epoch": 510} {"train_loss": -33.2217903137207, "global_step": 61802, "epoch": 510} {"train_loss": -36.16049575805664, "global_step": 61803, "epoch": 510} {"train_loss": -33.36798095703125, "global_step": 61804, "epoch": 510} {"train_loss": -34.7467041015625, "global_step": 61805, "epoch": 510} {"train_loss": -35.18476104736328, "global_step": 61806, "epoch": 510} {"train_loss": -34.71511459350586, "global_step": 61807, "epoch": 510} {"train_loss": -34.308467864990234, "global_step": 61808, "epoch": 510} {"train_loss": -35.48408889770508, "global_step": 61809, "epoch": 510} {"train_loss": -36.20410919189453, "global_step": 61810, "epoch": 510} {"train_loss": -35.509765625, "global_step": 61811, "epoch": 510} {"train_loss": -33.95956039428711, "global_step": 61812, "epoch": 510} {"train_loss": -35.165557861328125, "global_step": 61813, "epoch": 510} {"train_loss": -35.89174270629883, "global_step": 61814, "epoch": 510} {"train_loss": -36.18110275268555, "global_step": 61815, "epoch": 510} {"train_loss": -36.03083038330078, "global_step": 61816, "epoch": 510} {"train_loss": -35.93943786621094, "global_step": 61817, "epoch": 510} {"train_loss": -35.762229919433594, "global_step": 61818, "epoch": 510} {"train_loss": -35.52201461791992, "global_step": 61819, "epoch": 510} {"train_loss": -36.11460876464844, "global_step": 61820, "epoch": 510} {"train_loss": -35.58003616333008, "global_step": 61821, "epoch": 510} {"train_loss": -36.24997329711914, "global_step": 61822, "epoch": 510} {"train_loss": -35.902122497558594, "global_step": 61823, "epoch": 510} {"train_loss": -36.235633850097656, "global_step": 61824, "epoch": 510} {"train_loss": -35.28951644897461, "global_step": 61825, "epoch": 510} {"train_loss": -36.49601745605469, "global_step": 61826, "epoch": 510} {"train_loss": -36.44824981689453, "global_step": 61827, "epoch": 510} {"train_loss": -36.073951721191406, "global_step": 61828, "epoch": 510} {"train_loss": -36.040035247802734, "global_step": 61829, "epoch": 510} {"train_loss": -35.43979531280265, "global_step": 61830, "epoch": 510, "val_loss": 2600827.75} {"train_loss": -36.53791046142578, "global_step": 61831, "epoch": 511} {"train_loss": -36.24452590942383, "global_step": 61832, "epoch": 511} {"train_loss": -36.36646270751953, "global_step": 61833, "epoch": 511} {"train_loss": -36.55009841918945, "global_step": 61834, "epoch": 511} {"train_loss": -36.56968307495117, "global_step": 61835, "epoch": 511} {"train_loss": -36.416534423828125, "global_step": 61836, "epoch": 511} {"train_loss": -36.26946258544922, "global_step": 61837, "epoch": 511} {"train_loss": -36.148582458496094, "global_step": 61838, "epoch": 511} {"train_loss": -35.887393951416016, "global_step": 61839, "epoch": 511} {"train_loss": -35.85425567626953, "global_step": 61840, "epoch": 511} {"train_loss": -35.1243896484375, "global_step": 61841, "epoch": 511} {"train_loss": -35.808895111083984, "global_step": 61842, "epoch": 511} {"train_loss": -36.54923629760742, "global_step": 61843, "epoch": 511} {"train_loss": -36.67570114135742, "global_step": 61844, "epoch": 511} {"train_loss": -36.27161407470703, "global_step": 61845, "epoch": 511} {"train_loss": -35.879573822021484, "global_step": 61846, "epoch": 511} {"train_loss": -36.61677932739258, "global_step": 61847, "epoch": 511} {"train_loss": -36.520931243896484, "global_step": 61848, "epoch": 511} {"train_loss": -36.44308090209961, "global_step": 61849, "epoch": 511} {"train_loss": -36.39669418334961, "global_step": 61850, "epoch": 511} {"train_loss": -36.40593338012695, "global_step": 61851, "epoch": 511} {"train_loss": -35.98196029663086, "global_step": 61852, "epoch": 511} {"train_loss": -36.862361907958984, "global_step": 61853, "epoch": 511} {"train_loss": -35.6085090637207, "global_step": 61854, "epoch": 511} {"train_loss": -35.03574752807617, "global_step": 61855, "epoch": 511} {"train_loss": -34.94743728637695, "global_step": 61856, "epoch": 511} {"train_loss": -36.460933685302734, "global_step": 61857, "epoch": 511} {"train_loss": -33.75701904296875, "global_step": 61858, "epoch": 511} {"train_loss": -35.74485778808594, "global_step": 61859, "epoch": 511} {"train_loss": -35.722103118896484, "global_step": 61860, "epoch": 511} {"train_loss": -34.40845489501953, "global_step": 61861, "epoch": 511} {"train_loss": -33.420440673828125, "global_step": 61862, "epoch": 511} {"train_loss": -35.3413200378418, "global_step": 61863, "epoch": 511} {"train_loss": -35.88291549682617, "global_step": 61864, "epoch": 511} {"train_loss": -35.06764602661133, "global_step": 61865, "epoch": 511} {"train_loss": -35.1347541809082, "global_step": 61866, "epoch": 511} {"train_loss": -34.22003936767578, "global_step": 61867, "epoch": 511} {"train_loss": -36.5831298828125, "global_step": 61868, "epoch": 511} {"train_loss": -35.03649139404297, "global_step": 61869, "epoch": 511} {"train_loss": -35.708030700683594, "global_step": 61870, "epoch": 511} {"train_loss": -35.719112396240234, "global_step": 61871, "epoch": 511} {"train_loss": -35.15540313720703, "global_step": 61872, "epoch": 511} {"train_loss": -35.292388916015625, "global_step": 61873, "epoch": 511} {"train_loss": -35.328609466552734, "global_step": 61874, "epoch": 511} {"train_loss": -35.93085861206055, "global_step": 61875, "epoch": 511} {"train_loss": -35.75899887084961, "global_step": 61876, "epoch": 511} {"train_loss": -34.80035400390625, "global_step": 61877, "epoch": 511} {"train_loss": -34.403587341308594, "global_step": 61878, "epoch": 511} {"train_loss": -36.09046173095703, "global_step": 61879, "epoch": 511} {"train_loss": -36.589473724365234, "global_step": 61880, "epoch": 511} {"train_loss": -35.4213752746582, "global_step": 61881, "epoch": 511} {"train_loss": -35.556888580322266, "global_step": 61882, "epoch": 511} {"train_loss": -36.67795944213867, "global_step": 61883, "epoch": 511} {"train_loss": -35.445186614990234, "global_step": 61884, "epoch": 511} {"train_loss": -36.27092742919922, "global_step": 61885, "epoch": 511} {"train_loss": -36.131126403808594, "global_step": 61886, "epoch": 511} {"train_loss": -36.65255355834961, "global_step": 61887, "epoch": 511} {"train_loss": -36.249629974365234, "global_step": 61888, "epoch": 511} {"train_loss": -36.92589569091797, "global_step": 61889, "epoch": 511} {"train_loss": -35.600502014160156, "global_step": 61890, "epoch": 511} {"train_loss": -36.131656646728516, "global_step": 61891, "epoch": 511} {"train_loss": -36.83622360229492, "global_step": 61892, "epoch": 511} {"train_loss": -35.81892013549805, "global_step": 61893, "epoch": 511} {"train_loss": -36.43290328979492, "global_step": 61894, "epoch": 511} {"train_loss": -34.51648712158203, "global_step": 61895, "epoch": 511} {"train_loss": -34.92476272583008, "global_step": 61896, "epoch": 511} {"train_loss": -32.264095306396484, "global_step": 61897, "epoch": 511} {"train_loss": -31.9753360748291, "global_step": 61898, "epoch": 511} {"train_loss": -34.127986907958984, "global_step": 61899, "epoch": 511} {"train_loss": -36.34318542480469, "global_step": 61900, "epoch": 511} {"train_loss": -35.299285888671875, "global_step": 61901, "epoch": 511} {"train_loss": -34.636878967285156, "global_step": 61902, "epoch": 511} {"train_loss": -35.80110549926758, "global_step": 61903, "epoch": 511} {"train_loss": -35.95003128051758, "global_step": 61904, "epoch": 511} {"train_loss": -35.7818603515625, "global_step": 61905, "epoch": 511} {"train_loss": -36.747493743896484, "global_step": 61906, "epoch": 511} {"train_loss": -34.90104293823242, "global_step": 61907, "epoch": 511} {"train_loss": -35.13602828979492, "global_step": 61908, "epoch": 511} {"train_loss": -35.979957580566406, "global_step": 61909, "epoch": 511} {"train_loss": -35.774009704589844, "global_step": 61910, "epoch": 511} {"train_loss": -35.98141098022461, "global_step": 61911, "epoch": 511} {"train_loss": -36.36155319213867, "global_step": 61912, "epoch": 511} {"train_loss": -36.030120849609375, "global_step": 61913, "epoch": 511} {"train_loss": -35.6268196105957, "global_step": 61914, "epoch": 511} {"train_loss": -35.563377380371094, "global_step": 61915, "epoch": 511} {"train_loss": -35.62491989135742, "global_step": 61916, "epoch": 511} {"train_loss": -36.21038055419922, "global_step": 61917, "epoch": 511} {"train_loss": -35.6761589050293, "global_step": 61918, "epoch": 511} {"train_loss": -35.901058197021484, "global_step": 61919, "epoch": 511} {"train_loss": -35.63676452636719, "global_step": 61920, "epoch": 511} {"train_loss": -35.590301513671875, "global_step": 61921, "epoch": 511} {"train_loss": -35.91547775268555, "global_step": 61922, "epoch": 511} {"train_loss": -35.018611907958984, "global_step": 61923, "epoch": 511} {"train_loss": -35.86690902709961, "global_step": 61924, "epoch": 511} {"train_loss": -33.71772384643555, "global_step": 61925, "epoch": 511} {"train_loss": -35.94316482543945, "global_step": 61926, "epoch": 511} {"train_loss": -33.48701095581055, "global_step": 61927, "epoch": 511} {"train_loss": -34.6626091003418, "global_step": 61928, "epoch": 511} {"train_loss": -35.31199645996094, "global_step": 61929, "epoch": 511} {"train_loss": -33.07872772216797, "global_step": 61930, "epoch": 511} {"train_loss": -34.423702239990234, "global_step": 61931, "epoch": 511} {"train_loss": -34.93616485595703, "global_step": 61932, "epoch": 511} {"train_loss": -35.26353073120117, "global_step": 61933, "epoch": 511} {"train_loss": -34.360687255859375, "global_step": 61934, "epoch": 511} {"train_loss": -34.11343002319336, "global_step": 61935, "epoch": 511} {"train_loss": -33.9657096862793, "global_step": 61936, "epoch": 511} {"train_loss": -34.79291534423828, "global_step": 61937, "epoch": 511} {"train_loss": -34.20168685913086, "global_step": 61938, "epoch": 511} {"train_loss": -33.39415740966797, "global_step": 61939, "epoch": 511} {"train_loss": -34.01149368286133, "global_step": 61940, "epoch": 511} {"train_loss": -34.58440399169922, "global_step": 61941, "epoch": 511} {"train_loss": -33.3881721496582, "global_step": 61942, "epoch": 511} {"train_loss": -35.14533233642578, "global_step": 61943, "epoch": 511} {"train_loss": -33.4619140625, "global_step": 61944, "epoch": 511} {"train_loss": -33.427276611328125, "global_step": 61945, "epoch": 511} {"train_loss": -34.1644401550293, "global_step": 61946, "epoch": 511} {"train_loss": -34.28965377807617, "global_step": 61947, "epoch": 511} {"train_loss": -34.96397399902344, "global_step": 61948, "epoch": 511} {"train_loss": -34.691280364990234, "global_step": 61949, "epoch": 511} {"train_loss": -35.682586669921875, "global_step": 61950, "epoch": 511} {"train_loss": -35.3946746164117, "global_step": 61951, "epoch": 511, "val_loss": 2573170.75} {"train_loss": -34.989990234375, "global_step": 61952, "epoch": 512} {"train_loss": -34.88107681274414, "global_step": 61953, "epoch": 512} {"train_loss": -34.918270111083984, "global_step": 61954, "epoch": 512} {"train_loss": -34.719635009765625, "global_step": 61955, "epoch": 512} {"train_loss": -36.21487045288086, "global_step": 61956, "epoch": 512} {"train_loss": -35.754798889160156, "global_step": 61957, "epoch": 512} {"train_loss": -35.29924774169922, "global_step": 61958, "epoch": 512} {"train_loss": -35.6722412109375, "global_step": 61959, "epoch": 512} {"train_loss": -35.373779296875, "global_step": 61960, "epoch": 512} {"train_loss": -35.76178741455078, "global_step": 61961, "epoch": 512} {"train_loss": -35.802162170410156, "global_step": 61962, "epoch": 512} {"train_loss": -35.510135650634766, "global_step": 61963, "epoch": 512} {"train_loss": -35.911781311035156, "global_step": 61964, "epoch": 512} {"train_loss": -35.248313903808594, "global_step": 61965, "epoch": 512} {"train_loss": -36.318382263183594, "global_step": 61966, "epoch": 512} {"train_loss": -35.94223403930664, "global_step": 61967, "epoch": 512} {"train_loss": -36.156829833984375, "global_step": 61968, "epoch": 512} {"train_loss": -36.21151351928711, "global_step": 61969, "epoch": 512} {"train_loss": -35.619075775146484, "global_step": 61970, "epoch": 512} {"train_loss": -35.8719482421875, "global_step": 61971, "epoch": 512} {"train_loss": -34.940948486328125, "global_step": 61972, "epoch": 512} {"train_loss": -35.97550582885742, "global_step": 61973, "epoch": 512} {"train_loss": -36.37146759033203, "global_step": 61974, "epoch": 512} {"train_loss": -36.73903274536133, "global_step": 61975, "epoch": 512} {"train_loss": -36.255104064941406, "global_step": 61976, "epoch": 512} {"train_loss": -36.21671676635742, "global_step": 61977, "epoch": 512} {"train_loss": -36.71193313598633, "global_step": 61978, "epoch": 512} {"train_loss": -36.08646774291992, "global_step": 61979, "epoch": 512} {"train_loss": -36.65817642211914, "global_step": 61980, "epoch": 512} {"train_loss": -36.26582717895508, "global_step": 61981, "epoch": 512} {"train_loss": -36.43067169189453, "global_step": 61982, "epoch": 512} {"train_loss": -36.67225646972656, "global_step": 61983, "epoch": 512} {"train_loss": -36.629920959472656, "global_step": 61984, "epoch": 512} {"train_loss": -36.6054801940918, "global_step": 61985, "epoch": 512} {"train_loss": -36.19924545288086, "global_step": 61986, "epoch": 512} {"train_loss": -36.481624603271484, "global_step": 61987, "epoch": 512} {"train_loss": -36.88368225097656, "global_step": 61988, "epoch": 512} {"train_loss": -36.65236282348633, "global_step": 61989, "epoch": 512} {"train_loss": -36.772762298583984, "global_step": 61990, "epoch": 512} {"train_loss": -35.85274887084961, "global_step": 61991, "epoch": 512} {"train_loss": -35.27682113647461, "global_step": 61992, "epoch": 512} {"train_loss": -36.28948211669922, "global_step": 61993, "epoch": 512} {"train_loss": -36.50647735595703, "global_step": 61994, "epoch": 512} {"train_loss": -35.43737030029297, "global_step": 61995, "epoch": 512} {"train_loss": -33.597145080566406, "global_step": 61996, "epoch": 512} {"train_loss": -31.303043365478516, "global_step": 61997, "epoch": 512} {"train_loss": -30.350019454956055, "global_step": 61998, "epoch": 512} {"train_loss": -30.496612548828125, "global_step": 61999, "epoch": 512} {"train_loss": -31.67010498046875, "global_step": 62000, "epoch": 512} {"train_loss": -32.85670852661133, "global_step": 62001, "epoch": 512} {"train_loss": -34.828887939453125, "global_step": 62002, "epoch": 512} {"train_loss": -33.33468246459961, "global_step": 62003, "epoch": 512} {"train_loss": -33.01319885253906, "global_step": 62004, "epoch": 512} {"train_loss": -35.06746292114258, "global_step": 62005, "epoch": 512} {"train_loss": -33.88002395629883, "global_step": 62006, "epoch": 512} {"train_loss": -33.92928695678711, "global_step": 62007, "epoch": 512} {"train_loss": -36.2587776184082, "global_step": 62008, "epoch": 512} {"train_loss": -35.91120529174805, "global_step": 62009, "epoch": 512} {"train_loss": -36.23041915893555, "global_step": 62010, "epoch": 512} {"train_loss": -35.188533782958984, "global_step": 62011, "epoch": 512} {"train_loss": -33.70672607421875, "global_step": 62012, "epoch": 512} {"train_loss": -33.86425018310547, "global_step": 62013, "epoch": 512} {"train_loss": -33.07101058959961, "global_step": 62014, "epoch": 512} {"train_loss": -31.50661277770996, "global_step": 62015, "epoch": 512} {"train_loss": -35.78081130981445, "global_step": 62016, "epoch": 512} {"train_loss": -34.535701751708984, "global_step": 62017, "epoch": 512} {"train_loss": -35.12699890136719, "global_step": 62018, "epoch": 512} {"train_loss": -34.464073181152344, "global_step": 62019, "epoch": 512} {"train_loss": -35.80733871459961, "global_step": 62020, "epoch": 512} {"train_loss": -34.611751556396484, "global_step": 62021, "epoch": 512} {"train_loss": -35.33417510986328, "global_step": 62022, "epoch": 512} {"train_loss": -36.24139404296875, "global_step": 62023, "epoch": 512} {"train_loss": -35.417396545410156, "global_step": 62024, "epoch": 512} {"train_loss": -35.874351501464844, "global_step": 62025, "epoch": 512} {"train_loss": -36.03922653198242, "global_step": 62026, "epoch": 512} {"train_loss": -36.0447998046875, "global_step": 62027, "epoch": 512} {"train_loss": -35.33734130859375, "global_step": 62028, "epoch": 512} {"train_loss": -36.20663833618164, "global_step": 62029, "epoch": 512} {"train_loss": -35.3482551574707, "global_step": 62030, "epoch": 512} {"train_loss": -35.53489303588867, "global_step": 62031, "epoch": 512} {"train_loss": -36.18560791015625, "global_step": 62032, "epoch": 512} {"train_loss": -36.233192443847656, "global_step": 62033, "epoch": 512} {"train_loss": -35.93061447143555, "global_step": 62034, "epoch": 512} {"train_loss": -36.29165267944336, "global_step": 62035, "epoch": 512} {"train_loss": -35.409645080566406, "global_step": 62036, "epoch": 512} {"train_loss": -36.28758239746094, "global_step": 62037, "epoch": 512} {"train_loss": -35.439212799072266, "global_step": 62038, "epoch": 512} {"train_loss": -35.24302291870117, "global_step": 62039, "epoch": 512} {"train_loss": -35.9889030456543, "global_step": 62040, "epoch": 512} {"train_loss": -34.988006591796875, "global_step": 62041, "epoch": 512} {"train_loss": -32.961612701416016, "global_step": 62042, "epoch": 512} {"train_loss": -33.352447509765625, "global_step": 62043, "epoch": 512} {"train_loss": -35.776912689208984, "global_step": 62044, "epoch": 512} {"train_loss": -34.8148307800293, "global_step": 62045, "epoch": 512} {"train_loss": -32.78718948364258, "global_step": 62046, "epoch": 512} {"train_loss": -33.98224639892578, "global_step": 62047, "epoch": 512} {"train_loss": -33.74150466918945, "global_step": 62048, "epoch": 512} {"train_loss": -33.007259368896484, "global_step": 62049, "epoch": 512} {"train_loss": -33.3836669921875, "global_step": 62050, "epoch": 512} {"train_loss": -31.80274772644043, "global_step": 62051, "epoch": 512} {"train_loss": -34.1295166015625, "global_step": 62052, "epoch": 512} {"train_loss": -35.80164337158203, "global_step": 62053, "epoch": 512} {"train_loss": -32.961265563964844, "global_step": 62054, "epoch": 512} {"train_loss": -36.05147171020508, "global_step": 62055, "epoch": 512} {"train_loss": -35.335140228271484, "global_step": 62056, "epoch": 512} {"train_loss": -33.27090835571289, "global_step": 62057, "epoch": 512} {"train_loss": -35.849815368652344, "global_step": 62058, "epoch": 512} {"train_loss": -34.79314041137695, "global_step": 62059, "epoch": 512} {"train_loss": -34.33747863769531, "global_step": 62060, "epoch": 512} {"train_loss": -35.839111328125, "global_step": 62061, "epoch": 512} {"train_loss": -35.01176834106445, "global_step": 62062, "epoch": 512} {"train_loss": -32.480995178222656, "global_step": 62063, "epoch": 512} {"train_loss": -35.311439514160156, "global_step": 62064, "epoch": 512} {"train_loss": -36.150508880615234, "global_step": 62065, "epoch": 512} {"train_loss": -34.060176849365234, "global_step": 62066, "epoch": 512} {"train_loss": -35.20698165893555, "global_step": 62067, "epoch": 512} {"train_loss": -35.75504684448242, "global_step": 62068, "epoch": 512} {"train_loss": -35.113582611083984, "global_step": 62069, "epoch": 512} {"train_loss": -36.34082794189453, "global_step": 62070, "epoch": 512} {"train_loss": -35.58985137939453, "global_step": 62071, "epoch": 512} {"train_loss": -35.11845390067613, "global_step": 62072, "epoch": 512, "val_loss": 2695842.0} {"train_loss": -35.24853515625, "global_step": 62073, "epoch": 513} {"train_loss": -35.89484786987305, "global_step": 62074, "epoch": 513} {"train_loss": -35.4041862487793, "global_step": 62075, "epoch": 513} {"train_loss": -35.29768753051758, "global_step": 62076, "epoch": 513} {"train_loss": -35.47660446166992, "global_step": 62077, "epoch": 513} {"train_loss": -34.95246124267578, "global_step": 62078, "epoch": 513} {"train_loss": -35.261775970458984, "global_step": 62079, "epoch": 513} {"train_loss": -32.85819625854492, "global_step": 62080, "epoch": 513} {"train_loss": -34.664424896240234, "global_step": 62081, "epoch": 513} {"train_loss": -35.46481704711914, "global_step": 62082, "epoch": 513} {"train_loss": -34.35979080200195, "global_step": 62083, "epoch": 513} {"train_loss": -33.0134391784668, "global_step": 62084, "epoch": 513} {"train_loss": -33.901119232177734, "global_step": 62085, "epoch": 513} {"train_loss": -34.65678787231445, "global_step": 62086, "epoch": 513} {"train_loss": -34.8145751953125, "global_step": 62087, "epoch": 513} {"train_loss": -34.597137451171875, "global_step": 62088, "epoch": 513} {"train_loss": -35.39750289916992, "global_step": 62089, "epoch": 513} {"train_loss": -35.28593063354492, "global_step": 62090, "epoch": 513} {"train_loss": -34.45105743408203, "global_step": 62091, "epoch": 513} {"train_loss": -35.37934875488281, "global_step": 62092, "epoch": 513} {"train_loss": -35.79816436767578, "global_step": 62093, "epoch": 513} {"train_loss": -34.90841293334961, "global_step": 62094, "epoch": 513} {"train_loss": -35.94143295288086, "global_step": 62095, "epoch": 513} {"train_loss": -35.85268783569336, "global_step": 62096, "epoch": 513} {"train_loss": -35.685848236083984, "global_step": 62097, "epoch": 513} {"train_loss": -36.50242233276367, "global_step": 62098, "epoch": 513} {"train_loss": -35.88175582885742, "global_step": 62099, "epoch": 513} {"train_loss": -36.0694465637207, "global_step": 62100, "epoch": 513} {"train_loss": -35.294124603271484, "global_step": 62101, "epoch": 513} {"train_loss": -35.14027404785156, "global_step": 62102, "epoch": 513} {"train_loss": -35.23157501220703, "global_step": 62103, "epoch": 513} {"train_loss": -35.90851593017578, "global_step": 62104, "epoch": 513} {"train_loss": -35.60834884643555, "global_step": 62105, "epoch": 513} {"train_loss": -36.30561065673828, "global_step": 62106, "epoch": 513} {"train_loss": -36.08845138549805, "global_step": 62107, "epoch": 513} {"train_loss": -36.20692825317383, "global_step": 62108, "epoch": 513} {"train_loss": -36.33742141723633, "global_step": 62109, "epoch": 513} {"train_loss": -35.98319625854492, "global_step": 62110, "epoch": 513} {"train_loss": -36.381492614746094, "global_step": 62111, "epoch": 513} {"train_loss": -35.65436553955078, "global_step": 62112, "epoch": 513} {"train_loss": -36.428768157958984, "global_step": 62113, "epoch": 513} {"train_loss": -36.40242385864258, "global_step": 62114, "epoch": 513} {"train_loss": -35.78181838989258, "global_step": 62115, "epoch": 513} {"train_loss": -36.32362365722656, "global_step": 62116, "epoch": 513} {"train_loss": -35.997833251953125, "global_step": 62117, "epoch": 513} {"train_loss": -36.27086639404297, "global_step": 62118, "epoch": 513} {"train_loss": -35.029788970947266, "global_step": 62119, "epoch": 513} {"train_loss": -36.28380584716797, "global_step": 62120, "epoch": 513} {"train_loss": -35.8460578918457, "global_step": 62121, "epoch": 513} {"train_loss": -36.036293029785156, "global_step": 62122, "epoch": 513} {"train_loss": -34.67060470581055, "global_step": 62123, "epoch": 513} {"train_loss": -36.57234573364258, "global_step": 62124, "epoch": 513} {"train_loss": -36.849056243896484, "global_step": 62125, "epoch": 513} {"train_loss": -35.3776969909668, "global_step": 62126, "epoch": 513} {"train_loss": -36.38534164428711, "global_step": 62127, "epoch": 513} {"train_loss": -36.4749641418457, "global_step": 62128, "epoch": 513} {"train_loss": -36.129798889160156, "global_step": 62129, "epoch": 513} {"train_loss": -34.614315032958984, "global_step": 62130, "epoch": 513} {"train_loss": -35.314605712890625, "global_step": 62131, "epoch": 513} {"train_loss": -36.24403762817383, "global_step": 62132, "epoch": 513} {"train_loss": -34.99193572998047, "global_step": 62133, "epoch": 513} {"train_loss": -35.11625289916992, "global_step": 62134, "epoch": 513} {"train_loss": -35.92617416381836, "global_step": 62135, "epoch": 513} {"train_loss": -35.938987731933594, "global_step": 62136, "epoch": 513} {"train_loss": -35.94053649902344, "global_step": 62137, "epoch": 513} {"train_loss": -34.80200958251953, "global_step": 62138, "epoch": 513} {"train_loss": -36.89339065551758, "global_step": 62139, "epoch": 513} {"train_loss": -35.468353271484375, "global_step": 62140, "epoch": 513} {"train_loss": -34.59585189819336, "global_step": 62141, "epoch": 513} {"train_loss": -36.91264724731445, "global_step": 62142, "epoch": 513} {"train_loss": -35.09379196166992, "global_step": 62143, "epoch": 513} {"train_loss": -35.840755462646484, "global_step": 62144, "epoch": 513} {"train_loss": -36.64760971069336, "global_step": 62145, "epoch": 513} {"train_loss": -29.0594539642334, "global_step": 62146, "epoch": 513} {"train_loss": -33.56119918823242, "global_step": 62147, "epoch": 513} {"train_loss": -28.280059814453125, "global_step": 62148, "epoch": 513} {"train_loss": -25.751733779907227, "global_step": 62149, "epoch": 513} {"train_loss": -30.21009635925293, "global_step": 62150, "epoch": 513} {"train_loss": -28.233539581298828, "global_step": 62151, "epoch": 513} {"train_loss": -27.707965850830078, "global_step": 62152, "epoch": 513} {"train_loss": -28.407285690307617, "global_step": 62153, "epoch": 513} {"train_loss": -31.010211944580078, "global_step": 62154, "epoch": 513} {"train_loss": -33.75348663330078, "global_step": 62155, "epoch": 513} {"train_loss": -28.46406364440918, "global_step": 62156, "epoch": 513} {"train_loss": -31.04717445373535, "global_step": 62157, "epoch": 513} {"train_loss": -31.584457397460938, "global_step": 62158, "epoch": 513} {"train_loss": -28.950475692749023, "global_step": 62159, "epoch": 513} {"train_loss": -30.339374542236328, "global_step": 62160, "epoch": 513} {"train_loss": -33.86688995361328, "global_step": 62161, "epoch": 513} {"train_loss": -32.897735595703125, "global_step": 62162, "epoch": 513} {"train_loss": -32.273860931396484, "global_step": 62163, "epoch": 513} {"train_loss": -33.57767868041992, "global_step": 62164, "epoch": 513} {"train_loss": -32.65302276611328, "global_step": 62165, "epoch": 513} {"train_loss": -33.755523681640625, "global_step": 62166, "epoch": 513} {"train_loss": -31.7557430267334, "global_step": 62167, "epoch": 513} {"train_loss": -33.6558837890625, "global_step": 62168, "epoch": 513} {"train_loss": -31.010955810546875, "global_step": 62169, "epoch": 513} {"train_loss": -33.11732864379883, "global_step": 62170, "epoch": 513} {"train_loss": -32.78662872314453, "global_step": 62171, "epoch": 513} {"train_loss": -33.3796272277832, "global_step": 62172, "epoch": 513} {"train_loss": -32.998443603515625, "global_step": 62173, "epoch": 513} {"train_loss": -33.14463424682617, "global_step": 62174, "epoch": 513} {"train_loss": -33.42249298095703, "global_step": 62175, "epoch": 513} {"train_loss": -31.99237632751465, "global_step": 62176, "epoch": 513} {"train_loss": -33.703121185302734, "global_step": 62177, "epoch": 513} {"train_loss": -33.00248336791992, "global_step": 62178, "epoch": 513} {"train_loss": -33.95139694213867, "global_step": 62179, "epoch": 513} {"train_loss": -33.52714157104492, "global_step": 62180, "epoch": 513} {"train_loss": -34.11595153808594, "global_step": 62181, "epoch": 513} {"train_loss": -34.444210052490234, "global_step": 62182, "epoch": 513} {"train_loss": -34.06092071533203, "global_step": 62183, "epoch": 513} {"train_loss": -33.91593551635742, "global_step": 62184, "epoch": 513} {"train_loss": -33.63668441772461, "global_step": 62185, "epoch": 513} {"train_loss": -33.75868606567383, "global_step": 62186, "epoch": 513} {"train_loss": -33.653011322021484, "global_step": 62187, "epoch": 513} {"train_loss": -33.68476486206055, "global_step": 62188, "epoch": 513} {"train_loss": -33.30656051635742, "global_step": 62189, "epoch": 513} {"train_loss": -33.280426025390625, "global_step": 62190, "epoch": 513} {"train_loss": -34.21073532104492, "global_step": 62191, "epoch": 513} {"train_loss": -34.219268798828125, "global_step": 62192, "epoch": 513} {"train_loss": -34.24499018330219, "global_step": 62193, "epoch": 513, "val_loss": 2537687.0} {"train_loss": -34.669307708740234, "global_step": 62194, "epoch": 514} {"train_loss": -34.283870697021484, "global_step": 62195, "epoch": 514} {"train_loss": -34.25362014770508, "global_step": 62196, "epoch": 514} {"train_loss": -35.283809661865234, "global_step": 62197, "epoch": 514} {"train_loss": -34.90825271606445, "global_step": 62198, "epoch": 514} {"train_loss": -34.54555130004883, "global_step": 62199, "epoch": 514} {"train_loss": -35.16838455200195, "global_step": 62200, "epoch": 514} {"train_loss": -35.21234130859375, "global_step": 62201, "epoch": 514} {"train_loss": -34.983184814453125, "global_step": 62202, "epoch": 514} {"train_loss": -35.03400802612305, "global_step": 62203, "epoch": 514} {"train_loss": -35.09432601928711, "global_step": 62204, "epoch": 514} {"train_loss": -35.3986930847168, "global_step": 62205, "epoch": 514} {"train_loss": -35.18431091308594, "global_step": 62206, "epoch": 514} {"train_loss": -35.3385009765625, "global_step": 62207, "epoch": 514} {"train_loss": -34.98914337158203, "global_step": 62208, "epoch": 514} {"train_loss": -34.984859466552734, "global_step": 62209, "epoch": 514} {"train_loss": -35.52733612060547, "global_step": 62210, "epoch": 514} {"train_loss": -35.94474792480469, "global_step": 62211, "epoch": 514} {"train_loss": -35.783363342285156, "global_step": 62212, "epoch": 514} {"train_loss": -35.306880950927734, "global_step": 62213, "epoch": 514} {"train_loss": -35.767330169677734, "global_step": 62214, "epoch": 514} {"train_loss": -35.955780029296875, "global_step": 62215, "epoch": 514} {"train_loss": -35.87093734741211, "global_step": 62216, "epoch": 514} {"train_loss": -34.58282470703125, "global_step": 62217, "epoch": 514} {"train_loss": -35.74229049682617, "global_step": 62218, "epoch": 514} {"train_loss": -35.56660079956055, "global_step": 62219, "epoch": 514} {"train_loss": -35.41972732543945, "global_step": 62220, "epoch": 514} {"train_loss": -35.17524337768555, "global_step": 62221, "epoch": 514} {"train_loss": -36.06689453125, "global_step": 62222, "epoch": 514} {"train_loss": -35.715003967285156, "global_step": 62223, "epoch": 514} {"train_loss": -35.024253845214844, "global_step": 62224, "epoch": 514} {"train_loss": -35.446022033691406, "global_step": 62225, "epoch": 514} {"train_loss": -34.773529052734375, "global_step": 62226, "epoch": 514} {"train_loss": -35.4963264465332, "global_step": 62227, "epoch": 514} {"train_loss": -35.560245513916016, "global_step": 62228, "epoch": 514} {"train_loss": -35.42800521850586, "global_step": 62229, "epoch": 514} {"train_loss": -36.709022521972656, "global_step": 62230, "epoch": 514} {"train_loss": -36.42607498168945, "global_step": 62231, "epoch": 514} {"train_loss": -36.19398880004883, "global_step": 62232, "epoch": 514} {"train_loss": -36.39216995239258, "global_step": 62233, "epoch": 514} {"train_loss": -36.27915573120117, "global_step": 62234, "epoch": 514} {"train_loss": -35.92951583862305, "global_step": 62235, "epoch": 514} {"train_loss": -36.03471755981445, "global_step": 62236, "epoch": 514} {"train_loss": -35.26292037963867, "global_step": 62237, "epoch": 514} {"train_loss": -33.81904602050781, "global_step": 62238, "epoch": 514} {"train_loss": -31.225732803344727, "global_step": 62239, "epoch": 514} {"train_loss": -31.032764434814453, "global_step": 62240, "epoch": 514} {"train_loss": -32.49969482421875, "global_step": 62241, "epoch": 514} {"train_loss": -35.54476547241211, "global_step": 62242, "epoch": 514} {"train_loss": -34.841800689697266, "global_step": 62243, "epoch": 514} {"train_loss": -32.956966400146484, "global_step": 62244, "epoch": 514} {"train_loss": -36.05325698852539, "global_step": 62245, "epoch": 514} {"train_loss": -35.868797302246094, "global_step": 62246, "epoch": 514} {"train_loss": -35.81707763671875, "global_step": 62247, "epoch": 514} {"train_loss": -34.5385627746582, "global_step": 62248, "epoch": 514} {"train_loss": -35.7939453125, "global_step": 62249, "epoch": 514} {"train_loss": -36.13614273071289, "global_step": 62250, "epoch": 514} {"train_loss": -35.35700225830078, "global_step": 62251, "epoch": 514} {"train_loss": -35.062713623046875, "global_step": 62252, "epoch": 514} {"train_loss": -34.235755920410156, "global_step": 62253, "epoch": 514} {"train_loss": -35.4296989440918, "global_step": 62254, "epoch": 514} {"train_loss": -32.50800323486328, "global_step": 62255, "epoch": 514} {"train_loss": -30.302204132080078, "global_step": 62256, "epoch": 514} {"train_loss": -28.7104434967041, "global_step": 62257, "epoch": 514} {"train_loss": -30.07796287536621, "global_step": 62258, "epoch": 514} {"train_loss": -35.90009689331055, "global_step": 62259, "epoch": 514} {"train_loss": -33.939762115478516, "global_step": 62260, "epoch": 514} {"train_loss": -32.4911994934082, "global_step": 62261, "epoch": 514} {"train_loss": -34.32511901855469, "global_step": 62262, "epoch": 514} {"train_loss": -34.86611557006836, "global_step": 62263, "epoch": 514} {"train_loss": -33.333351135253906, "global_step": 62264, "epoch": 514} {"train_loss": -35.070186614990234, "global_step": 62265, "epoch": 514} {"train_loss": -34.12489700317383, "global_step": 62266, "epoch": 514} {"train_loss": -35.499507904052734, "global_step": 62267, "epoch": 514} {"train_loss": -34.13502883911133, "global_step": 62268, "epoch": 514} {"train_loss": -35.48621368408203, "global_step": 62269, "epoch": 514} {"train_loss": -35.04985427856445, "global_step": 62270, "epoch": 514} {"train_loss": -36.389488220214844, "global_step": 62271, "epoch": 514} {"train_loss": -35.60627365112305, "global_step": 62272, "epoch": 514} {"train_loss": -35.67780303955078, "global_step": 62273, "epoch": 514} {"train_loss": -34.82041931152344, "global_step": 62274, "epoch": 514} {"train_loss": -35.7440071105957, "global_step": 62275, "epoch": 514} {"train_loss": -35.267616271972656, "global_step": 62276, "epoch": 514} {"train_loss": -35.22991180419922, "global_step": 62277, "epoch": 514} {"train_loss": -35.43748092651367, "global_step": 62278, "epoch": 514} {"train_loss": -35.65494155883789, "global_step": 62279, "epoch": 514} {"train_loss": -36.173641204833984, "global_step": 62280, "epoch": 514} {"train_loss": -35.84942626953125, "global_step": 62281, "epoch": 514} {"train_loss": -35.29848861694336, "global_step": 62282, "epoch": 514} {"train_loss": -36.431915283203125, "global_step": 62283, "epoch": 514} {"train_loss": -36.29517364501953, "global_step": 62284, "epoch": 514} {"train_loss": -35.97162628173828, "global_step": 62285, "epoch": 514} {"train_loss": -36.76423263549805, "global_step": 62286, "epoch": 514} {"train_loss": -36.29322052001953, "global_step": 62287, "epoch": 514} {"train_loss": -36.1487922668457, "global_step": 62288, "epoch": 514} {"train_loss": -36.04399490356445, "global_step": 62289, "epoch": 514} {"train_loss": -36.16216278076172, "global_step": 62290, "epoch": 514} {"train_loss": -36.0208854675293, "global_step": 62291, "epoch": 514} {"train_loss": -35.6140022277832, "global_step": 62292, "epoch": 514} {"train_loss": -35.31711959838867, "global_step": 62293, "epoch": 514} {"train_loss": -33.42988967895508, "global_step": 62294, "epoch": 514} {"train_loss": -35.607269287109375, "global_step": 62295, "epoch": 514} {"train_loss": -35.695430755615234, "global_step": 62296, "epoch": 514} {"train_loss": -35.20597457885742, "global_step": 62297, "epoch": 514} {"train_loss": -35.97492980957031, "global_step": 62298, "epoch": 514} {"train_loss": -35.084571838378906, "global_step": 62299, "epoch": 514} {"train_loss": -35.853736877441406, "global_step": 62300, "epoch": 514} {"train_loss": -35.96577072143555, "global_step": 62301, "epoch": 514} {"train_loss": -35.50213623046875, "global_step": 62302, "epoch": 514} {"train_loss": -35.6275749206543, "global_step": 62303, "epoch": 514} {"train_loss": -35.85216522216797, "global_step": 62304, "epoch": 514} {"train_loss": -35.8140983581543, "global_step": 62305, "epoch": 514} {"train_loss": -36.174285888671875, "global_step": 62306, "epoch": 514} {"train_loss": -35.69755554199219, "global_step": 62307, "epoch": 514} {"train_loss": -36.23246383666992, "global_step": 62308, "epoch": 514} {"train_loss": -36.4995002746582, "global_step": 62309, "epoch": 514} {"train_loss": -35.76654815673828, "global_step": 62310, "epoch": 514} {"train_loss": -36.10514831542969, "global_step": 62311, "epoch": 514} {"train_loss": -37.03824996948242, "global_step": 62312, "epoch": 514} {"train_loss": -36.5037956237793, "global_step": 62313, "epoch": 514} {"train_loss": -35.17448080078629, "global_step": 62314, "epoch": 514, "val_loss": 2648496.25} {"train_loss": -36.5377082824707, "global_step": 62315, "epoch": 515} {"train_loss": -36.08796310424805, "global_step": 62316, "epoch": 515} {"train_loss": -36.30736541748047, "global_step": 62317, "epoch": 515} {"train_loss": -36.9560661315918, "global_step": 62318, "epoch": 515} {"train_loss": -36.45359420776367, "global_step": 62319, "epoch": 515} {"train_loss": -37.214359283447266, "global_step": 62320, "epoch": 515} {"train_loss": -36.13291549682617, "global_step": 62321, "epoch": 515} {"train_loss": -36.4415283203125, "global_step": 62322, "epoch": 515} {"train_loss": -35.93697738647461, "global_step": 62323, "epoch": 515} {"train_loss": -34.741249084472656, "global_step": 62324, "epoch": 515} {"train_loss": -31.47308349609375, "global_step": 62325, "epoch": 515} {"train_loss": -26.41617774963379, "global_step": 62326, "epoch": 515} {"train_loss": -27.75739097595215, "global_step": 62327, "epoch": 515} {"train_loss": -35.230499267578125, "global_step": 62328, "epoch": 515} {"train_loss": -32.90509796142578, "global_step": 62329, "epoch": 515} {"train_loss": -31.106115341186523, "global_step": 62330, "epoch": 515} {"train_loss": -36.389652252197266, "global_step": 62331, "epoch": 515} {"train_loss": -33.14418411254883, "global_step": 62332, "epoch": 515} {"train_loss": -35.76737594604492, "global_step": 62333, "epoch": 515} {"train_loss": -33.9901008605957, "global_step": 62334, "epoch": 515} {"train_loss": -35.489990234375, "global_step": 62335, "epoch": 515} {"train_loss": -35.1823616027832, "global_step": 62336, "epoch": 515} {"train_loss": -36.089595794677734, "global_step": 62337, "epoch": 515} {"train_loss": -35.64894485473633, "global_step": 62338, "epoch": 515} {"train_loss": -36.14005661010742, "global_step": 62339, "epoch": 515} {"train_loss": -35.1016731262207, "global_step": 62340, "epoch": 515} {"train_loss": -35.861663818359375, "global_step": 62341, "epoch": 515} {"train_loss": -36.128414154052734, "global_step": 62342, "epoch": 515} {"train_loss": -35.800682067871094, "global_step": 62343, "epoch": 515} {"train_loss": -36.52357864379883, "global_step": 62344, "epoch": 515} {"train_loss": -36.26347732543945, "global_step": 62345, "epoch": 515} {"train_loss": -36.0692024230957, "global_step": 62346, "epoch": 515} {"train_loss": -37.12575912475586, "global_step": 62347, "epoch": 515} {"train_loss": -36.06357955932617, "global_step": 62348, "epoch": 515} {"train_loss": -36.29462814331055, "global_step": 62349, "epoch": 515} {"train_loss": -36.7514762878418, "global_step": 62350, "epoch": 515} {"train_loss": -36.56281280517578, "global_step": 62351, "epoch": 515} {"train_loss": -36.7697868347168, "global_step": 62352, "epoch": 515} {"train_loss": -36.53619384765625, "global_step": 62353, "epoch": 515} {"train_loss": -36.341854095458984, "global_step": 62354, "epoch": 515} {"train_loss": -37.139442443847656, "global_step": 62355, "epoch": 515} {"train_loss": -35.8557243347168, "global_step": 62356, "epoch": 515} {"train_loss": -36.695472717285156, "global_step": 62357, "epoch": 515} {"train_loss": -36.567283630371094, "global_step": 62358, "epoch": 515} {"train_loss": -36.80674362182617, "global_step": 62359, "epoch": 515} {"train_loss": -37.05690383911133, "global_step": 62360, "epoch": 515} {"train_loss": -37.56620407104492, "global_step": 62361, "epoch": 515} {"train_loss": -36.89509963989258, "global_step": 62362, "epoch": 515} {"train_loss": -37.13728332519531, "global_step": 62363, "epoch": 515} {"train_loss": -36.787288665771484, "global_step": 62364, "epoch": 515} {"train_loss": -37.260963439941406, "global_step": 62365, "epoch": 515} {"train_loss": -36.69929122924805, "global_step": 62366, "epoch": 515} {"train_loss": -36.947021484375, "global_step": 62367, "epoch": 515} {"train_loss": -36.511512756347656, "global_step": 62368, "epoch": 515} {"train_loss": -37.10392379760742, "global_step": 62369, "epoch": 515} {"train_loss": -36.98642349243164, "global_step": 62370, "epoch": 515} {"train_loss": -36.81085968017578, "global_step": 62371, "epoch": 515} {"train_loss": -36.511695861816406, "global_step": 62372, "epoch": 515} {"train_loss": -36.493995666503906, "global_step": 62373, "epoch": 515} {"train_loss": -36.00211715698242, "global_step": 62374, "epoch": 515} {"train_loss": -35.638126373291016, "global_step": 62375, "epoch": 515} {"train_loss": -34.63399124145508, "global_step": 62376, "epoch": 515} {"train_loss": -35.38796615600586, "global_step": 62377, "epoch": 515} {"train_loss": -36.127933502197266, "global_step": 62378, "epoch": 515} {"train_loss": -35.841773986816406, "global_step": 62379, "epoch": 515} {"train_loss": -36.90194320678711, "global_step": 62380, "epoch": 515} {"train_loss": -35.41510772705078, "global_step": 62381, "epoch": 515} {"train_loss": -35.813899993896484, "global_step": 62382, "epoch": 515} {"train_loss": -32.47388458251953, "global_step": 62383, "epoch": 515} {"train_loss": -28.41847801208496, "global_step": 62384, "epoch": 515} {"train_loss": -29.080175399780273, "global_step": 62385, "epoch": 515} {"train_loss": -35.25365447998047, "global_step": 62386, "epoch": 515} {"train_loss": -34.4180908203125, "global_step": 62387, "epoch": 515} {"train_loss": -31.73677635192871, "global_step": 62388, "epoch": 515} {"train_loss": -33.40007400512695, "global_step": 62389, "epoch": 515} {"train_loss": -35.364315032958984, "global_step": 62390, "epoch": 515} {"train_loss": -33.181724548339844, "global_step": 62391, "epoch": 515} {"train_loss": -35.878475189208984, "global_step": 62392, "epoch": 515} {"train_loss": -33.513145446777344, "global_step": 62393, "epoch": 515} {"train_loss": -33.42274856567383, "global_step": 62394, "epoch": 515} {"train_loss": -35.27413558959961, "global_step": 62395, "epoch": 515} {"train_loss": -32.98344039916992, "global_step": 62396, "epoch": 515} {"train_loss": -34.422523498535156, "global_step": 62397, "epoch": 515} {"train_loss": -33.818885803222656, "global_step": 62398, "epoch": 515} {"train_loss": -34.8245964050293, "global_step": 62399, "epoch": 515} {"train_loss": -33.88226318359375, "global_step": 62400, "epoch": 515} {"train_loss": -35.99654006958008, "global_step": 62401, "epoch": 515} {"train_loss": -34.262237548828125, "global_step": 62402, "epoch": 515} {"train_loss": -35.3541374206543, "global_step": 62403, "epoch": 515} {"train_loss": -35.39741134643555, "global_step": 62404, "epoch": 515} {"train_loss": -35.56166076660156, "global_step": 62405, "epoch": 515} {"train_loss": -35.81943893432617, "global_step": 62406, "epoch": 515} {"train_loss": -35.26899719238281, "global_step": 62407, "epoch": 515} {"train_loss": -36.033180236816406, "global_step": 62408, "epoch": 515} {"train_loss": -35.505035400390625, "global_step": 62409, "epoch": 515} {"train_loss": -35.71399688720703, "global_step": 62410, "epoch": 515} {"train_loss": -36.190467834472656, "global_step": 62411, "epoch": 515} {"train_loss": -35.686763763427734, "global_step": 62412, "epoch": 515} {"train_loss": -36.09988021850586, "global_step": 62413, "epoch": 515} {"train_loss": -36.14634704589844, "global_step": 62414, "epoch": 515} {"train_loss": -36.44364929199219, "global_step": 62415, "epoch": 515} {"train_loss": -36.02522277832031, "global_step": 62416, "epoch": 515} {"train_loss": -36.51434326171875, "global_step": 62417, "epoch": 515} {"train_loss": -36.050296783447266, "global_step": 62418, "epoch": 515} {"train_loss": -36.616519927978516, "global_step": 62419, "epoch": 515} {"train_loss": -36.937171936035156, "global_step": 62420, "epoch": 515} {"train_loss": -36.48408889770508, "global_step": 62421, "epoch": 515} {"train_loss": -36.39124298095703, "global_step": 62422, "epoch": 515} {"train_loss": -36.73871612548828, "global_step": 62423, "epoch": 515} {"train_loss": -36.445411682128906, "global_step": 62424, "epoch": 515} {"train_loss": -36.17533493041992, "global_step": 62425, "epoch": 515} {"train_loss": -36.58052062988281, "global_step": 62426, "epoch": 515} {"train_loss": -36.8885498046875, "global_step": 62427, "epoch": 515} {"train_loss": -37.19041442871094, "global_step": 62428, "epoch": 515} {"train_loss": -36.74532699584961, "global_step": 62429, "epoch": 515} {"train_loss": -37.042720794677734, "global_step": 62430, "epoch": 515} {"train_loss": -36.97491455078125, "global_step": 62431, "epoch": 515} {"train_loss": -36.76821517944336, "global_step": 62432, "epoch": 515} {"train_loss": -37.025779724121094, "global_step": 62433, "epoch": 515} {"train_loss": -36.269081115722656, "global_step": 62434, "epoch": 515} {"train_loss": -35.53254321389947, "global_step": 62435, "epoch": 515, "val_loss": 2629675.25} {"train_loss": -37.010948181152344, "global_step": 62436, "epoch": 516} {"train_loss": -32.78028106689453, "global_step": 62437, "epoch": 516} {"train_loss": -36.174251556396484, "global_step": 62438, "epoch": 516} {"train_loss": -35.65547180175781, "global_step": 62439, "epoch": 516} {"train_loss": -35.17879867553711, "global_step": 62440, "epoch": 516} {"train_loss": -36.399452209472656, "global_step": 62441, "epoch": 516} {"train_loss": -35.050018310546875, "global_step": 62442, "epoch": 516} {"train_loss": -35.6677360534668, "global_step": 62443, "epoch": 516} {"train_loss": -35.044769287109375, "global_step": 62444, "epoch": 516} {"train_loss": -36.400447845458984, "global_step": 62445, "epoch": 516} {"train_loss": -36.64875030517578, "global_step": 62446, "epoch": 516} {"train_loss": -35.254695892333984, "global_step": 62447, "epoch": 516} {"train_loss": -36.304622650146484, "global_step": 62448, "epoch": 516} {"train_loss": -35.93665313720703, "global_step": 62449, "epoch": 516} {"train_loss": -36.404640197753906, "global_step": 62450, "epoch": 516} {"train_loss": -36.12455749511719, "global_step": 62451, "epoch": 516} {"train_loss": -36.60757064819336, "global_step": 62452, "epoch": 516} {"train_loss": -36.0868034362793, "global_step": 62453, "epoch": 516} {"train_loss": -35.972381591796875, "global_step": 62454, "epoch": 516} {"train_loss": -35.42393493652344, "global_step": 62455, "epoch": 516} {"train_loss": -35.615562438964844, "global_step": 62456, "epoch": 516} {"train_loss": -36.3038444519043, "global_step": 62457, "epoch": 516} {"train_loss": -34.779083251953125, "global_step": 62458, "epoch": 516} {"train_loss": -34.46699905395508, "global_step": 62459, "epoch": 516} {"train_loss": -32.2452507019043, "global_step": 62460, "epoch": 516} {"train_loss": -33.05678939819336, "global_step": 62461, "epoch": 516} {"train_loss": -35.64958190917969, "global_step": 62462, "epoch": 516} {"train_loss": -35.873939514160156, "global_step": 62463, "epoch": 516} {"train_loss": -32.748138427734375, "global_step": 62464, "epoch": 516} {"train_loss": -33.88003158569336, "global_step": 62465, "epoch": 516} {"train_loss": -36.415706634521484, "global_step": 62466, "epoch": 516} {"train_loss": -33.27192306518555, "global_step": 62467, "epoch": 516} {"train_loss": -35.87177276611328, "global_step": 62468, "epoch": 516} {"train_loss": -34.41249465942383, "global_step": 62469, "epoch": 516} {"train_loss": -35.725215911865234, "global_step": 62470, "epoch": 516} {"train_loss": -35.46268844604492, "global_step": 62471, "epoch": 516} {"train_loss": -35.907222747802734, "global_step": 62472, "epoch": 516} {"train_loss": -36.25020980834961, "global_step": 62473, "epoch": 516} {"train_loss": -35.42804718017578, "global_step": 62474, "epoch": 516} {"train_loss": -35.604095458984375, "global_step": 62475, "epoch": 516} {"train_loss": -34.02537155151367, "global_step": 62476, "epoch": 516} {"train_loss": -34.47589874267578, "global_step": 62477, "epoch": 516} {"train_loss": -34.79049301147461, "global_step": 62478, "epoch": 516} {"train_loss": -36.178646087646484, "global_step": 62479, "epoch": 516} {"train_loss": -36.46271896362305, "global_step": 62480, "epoch": 516} {"train_loss": -36.26618194580078, "global_step": 62481, "epoch": 516} {"train_loss": -36.352783203125, "global_step": 62482, "epoch": 516} {"train_loss": -36.3841667175293, "global_step": 62483, "epoch": 516} {"train_loss": -35.84531784057617, "global_step": 62484, "epoch": 516} {"train_loss": -36.05744552612305, "global_step": 62485, "epoch": 516} {"train_loss": -36.670127868652344, "global_step": 62486, "epoch": 516} {"train_loss": -35.381675720214844, "global_step": 62487, "epoch": 516} {"train_loss": -35.51406478881836, "global_step": 62488, "epoch": 516} {"train_loss": -36.85573959350586, "global_step": 62489, "epoch": 516} {"train_loss": -36.0694465637207, "global_step": 62490, "epoch": 516} {"train_loss": -36.47534942626953, "global_step": 62491, "epoch": 516} {"train_loss": -35.93989181518555, "global_step": 62492, "epoch": 516} {"train_loss": -34.91532516479492, "global_step": 62493, "epoch": 516} {"train_loss": -36.19169235229492, "global_step": 62494, "epoch": 516} {"train_loss": -36.241878509521484, "global_step": 62495, "epoch": 516} {"train_loss": -36.5016975402832, "global_step": 62496, "epoch": 516} {"train_loss": -36.49337387084961, "global_step": 62497, "epoch": 516} {"train_loss": -36.1898078918457, "global_step": 62498, "epoch": 516} {"train_loss": -35.78696060180664, "global_step": 62499, "epoch": 516} {"train_loss": -35.85154724121094, "global_step": 62500, "epoch": 516} {"train_loss": -36.497188568115234, "global_step": 62501, "epoch": 516} {"train_loss": -36.90147399902344, "global_step": 62502, "epoch": 516} {"train_loss": -36.304962158203125, "global_step": 62503, "epoch": 516} {"train_loss": -36.4160041809082, "global_step": 62504, "epoch": 516} {"train_loss": -36.54305648803711, "global_step": 62505, "epoch": 516} {"train_loss": -36.906768798828125, "global_step": 62506, "epoch": 516} {"train_loss": -36.96854782104492, "global_step": 62507, "epoch": 516} {"train_loss": -36.58109664916992, "global_step": 62508, "epoch": 516} {"train_loss": -36.62325668334961, "global_step": 62509, "epoch": 516} {"train_loss": -37.10820770263672, "global_step": 62510, "epoch": 516} {"train_loss": -36.817596435546875, "global_step": 62511, "epoch": 516} {"train_loss": -35.54104232788086, "global_step": 62512, "epoch": 516} {"train_loss": -34.86356735229492, "global_step": 62513, "epoch": 516} {"train_loss": -36.23807907104492, "global_step": 62514, "epoch": 516} {"train_loss": -36.829978942871094, "global_step": 62515, "epoch": 516} {"train_loss": -36.22349548339844, "global_step": 62516, "epoch": 516} {"train_loss": -36.36603546142578, "global_step": 62517, "epoch": 516} {"train_loss": -36.858055114746094, "global_step": 62518, "epoch": 516} {"train_loss": -36.752845764160156, "global_step": 62519, "epoch": 516} {"train_loss": -36.074195861816406, "global_step": 62520, "epoch": 516} {"train_loss": -34.63814926147461, "global_step": 62521, "epoch": 516} {"train_loss": -31.690549850463867, "global_step": 62522, "epoch": 516} {"train_loss": -31.418384552001953, "global_step": 62523, "epoch": 516} {"train_loss": -33.7240104675293, "global_step": 62524, "epoch": 516} {"train_loss": -36.824031829833984, "global_step": 62525, "epoch": 516} {"train_loss": -34.83780288696289, "global_step": 62526, "epoch": 516} {"train_loss": -33.81709671020508, "global_step": 62527, "epoch": 516} {"train_loss": -36.08735656738281, "global_step": 62528, "epoch": 516} {"train_loss": -35.91685104370117, "global_step": 62529, "epoch": 516} {"train_loss": -34.83043670654297, "global_step": 62530, "epoch": 516} {"train_loss": -36.74802780151367, "global_step": 62531, "epoch": 516} {"train_loss": -35.24215316772461, "global_step": 62532, "epoch": 516} {"train_loss": -35.01302719116211, "global_step": 62533, "epoch": 516} {"train_loss": -35.86494064331055, "global_step": 62534, "epoch": 516} {"train_loss": -35.78417205810547, "global_step": 62535, "epoch": 516} {"train_loss": -34.566627502441406, "global_step": 62536, "epoch": 516} {"train_loss": -35.61106491088867, "global_step": 62537, "epoch": 516} {"train_loss": -36.44337463378906, "global_step": 62538, "epoch": 516} {"train_loss": -36.543365478515625, "global_step": 62539, "epoch": 516} {"train_loss": -36.30237579345703, "global_step": 62540, "epoch": 516} {"train_loss": -36.945289611816406, "global_step": 62541, "epoch": 516} {"train_loss": -36.74739456176758, "global_step": 62542, "epoch": 516} {"train_loss": -36.27812576293945, "global_step": 62543, "epoch": 516} {"train_loss": -36.44195556640625, "global_step": 62544, "epoch": 516} {"train_loss": -35.75970458984375, "global_step": 62545, "epoch": 516} {"train_loss": -36.036685943603516, "global_step": 62546, "epoch": 516} {"train_loss": -36.10415267944336, "global_step": 62547, "epoch": 516} {"train_loss": -36.7401237487793, "global_step": 62548, "epoch": 516} {"train_loss": -36.58585739135742, "global_step": 62549, "epoch": 516} {"train_loss": -36.958099365234375, "global_step": 62550, "epoch": 516} {"train_loss": -36.55366516113281, "global_step": 62551, "epoch": 516} {"train_loss": -36.523250579833984, "global_step": 62552, "epoch": 516} {"train_loss": -37.004859924316406, "global_step": 62553, "epoch": 516} {"train_loss": -36.05883026123047, "global_step": 62554, "epoch": 516} {"train_loss": -36.94247055053711, "global_step": 62555, "epoch": 516} {"train_loss": -35.77253768857845, "global_step": 62556, "epoch": 516, "val_loss": 2472423.25} {"train_loss": -36.70893859863281, "global_step": 62557, "epoch": 517} {"train_loss": -36.784236907958984, "global_step": 62558, "epoch": 517} {"train_loss": -36.926177978515625, "global_step": 62559, "epoch": 517} {"train_loss": -36.73298263549805, "global_step": 62560, "epoch": 517} {"train_loss": -37.01587677001953, "global_step": 62561, "epoch": 517} {"train_loss": -36.82135009765625, "global_step": 62562, "epoch": 517} {"train_loss": -35.97245788574219, "global_step": 62563, "epoch": 517} {"train_loss": -36.75797653198242, "global_step": 62564, "epoch": 517} {"train_loss": -36.75629425048828, "global_step": 62565, "epoch": 517} {"train_loss": -35.4220085144043, "global_step": 62566, "epoch": 517} {"train_loss": -35.33028793334961, "global_step": 62567, "epoch": 517} {"train_loss": -36.35405731201172, "global_step": 62568, "epoch": 517} {"train_loss": -34.9842643737793, "global_step": 62569, "epoch": 517} {"train_loss": -35.5897216796875, "global_step": 62570, "epoch": 517} {"train_loss": -36.190460205078125, "global_step": 62571, "epoch": 517} {"train_loss": -36.76586151123047, "global_step": 62572, "epoch": 517} {"train_loss": -36.26820755004883, "global_step": 62573, "epoch": 517} {"train_loss": -36.65242004394531, "global_step": 62574, "epoch": 517} {"train_loss": -36.01443099975586, "global_step": 62575, "epoch": 517} {"train_loss": -36.46753692626953, "global_step": 62576, "epoch": 517} {"train_loss": -36.41660690307617, "global_step": 62577, "epoch": 517} {"train_loss": -36.76789474487305, "global_step": 62578, "epoch": 517} {"train_loss": -35.8885498046875, "global_step": 62579, "epoch": 517} {"train_loss": -36.4339714050293, "global_step": 62580, "epoch": 517} {"train_loss": -35.118324279785156, "global_step": 62581, "epoch": 517} {"train_loss": -34.77323532104492, "global_step": 62582, "epoch": 517} {"train_loss": -35.48952865600586, "global_step": 62583, "epoch": 517} {"train_loss": -34.84034729003906, "global_step": 62584, "epoch": 517} {"train_loss": -36.00957107543945, "global_step": 62585, "epoch": 517} {"train_loss": -37.305908203125, "global_step": 62586, "epoch": 517} {"train_loss": -36.51131820678711, "global_step": 62587, "epoch": 517} {"train_loss": -36.246604919433594, "global_step": 62588, "epoch": 517} {"train_loss": -35.549468994140625, "global_step": 62589, "epoch": 517} {"train_loss": -35.625850677490234, "global_step": 62590, "epoch": 517} {"train_loss": -36.11130905151367, "global_step": 62591, "epoch": 517} {"train_loss": -35.94785690307617, "global_step": 62592, "epoch": 517} {"train_loss": -35.88971710205078, "global_step": 62593, "epoch": 517} {"train_loss": -35.66558837890625, "global_step": 62594, "epoch": 517} {"train_loss": -36.202659606933594, "global_step": 62595, "epoch": 517} {"train_loss": -36.8934440612793, "global_step": 62596, "epoch": 517} {"train_loss": -34.39289093017578, "global_step": 62597, "epoch": 517} {"train_loss": -34.79315185546875, "global_step": 62598, "epoch": 517} {"train_loss": -36.16907501220703, "global_step": 62599, "epoch": 517} {"train_loss": -35.94141387939453, "global_step": 62600, "epoch": 517} {"train_loss": -35.331668853759766, "global_step": 62601, "epoch": 517} {"train_loss": -35.962154388427734, "global_step": 62602, "epoch": 517} {"train_loss": -36.02126693725586, "global_step": 62603, "epoch": 517} {"train_loss": -35.99916076660156, "global_step": 62604, "epoch": 517} {"train_loss": -36.342227935791016, "global_step": 62605, "epoch": 517} {"train_loss": -35.7121696472168, "global_step": 62606, "epoch": 517} {"train_loss": -37.02227783203125, "global_step": 62607, "epoch": 517} {"train_loss": -36.263404846191406, "global_step": 62608, "epoch": 517} {"train_loss": -37.094173431396484, "global_step": 62609, "epoch": 517} {"train_loss": -36.734657287597656, "global_step": 62610, "epoch": 517} {"train_loss": -36.919551849365234, "global_step": 62611, "epoch": 517} {"train_loss": -36.479496002197266, "global_step": 62612, "epoch": 517} {"train_loss": -36.94493103027344, "global_step": 62613, "epoch": 517} {"train_loss": -37.13320541381836, "global_step": 62614, "epoch": 517} {"train_loss": -36.9830436706543, "global_step": 62615, "epoch": 517} {"train_loss": -37.056331634521484, "global_step": 62616, "epoch": 517} {"train_loss": -37.034114837646484, "global_step": 62617, "epoch": 517} {"train_loss": -36.82102584838867, "global_step": 62618, "epoch": 517} {"train_loss": -37.30959701538086, "global_step": 62619, "epoch": 517} {"train_loss": -36.26292419433594, "global_step": 62620, "epoch": 517} {"train_loss": -36.60755157470703, "global_step": 62621, "epoch": 517} {"train_loss": -36.91719436645508, "global_step": 62622, "epoch": 517} {"train_loss": -35.53483200073242, "global_step": 62623, "epoch": 517} {"train_loss": -35.644134521484375, "global_step": 62624, "epoch": 517} {"train_loss": -35.836177825927734, "global_step": 62625, "epoch": 517} {"train_loss": -31.90960121154785, "global_step": 62626, "epoch": 517} {"train_loss": -26.40937614440918, "global_step": 62627, "epoch": 517} {"train_loss": -7.315832614898682, "global_step": 62628, "epoch": 517} {"train_loss": 7.7978997230529785, "global_step": 62629, "epoch": 517} {"train_loss": -32.0555419921875, "global_step": 62630, "epoch": 517} {"train_loss": -19.223752975463867, "global_step": 62631, "epoch": 517} {"train_loss": -28.762624740600586, "global_step": 62632, "epoch": 517} {"train_loss": -28.1839542388916, "global_step": 62633, "epoch": 517} {"train_loss": -34.16034698486328, "global_step": 62634, "epoch": 517} {"train_loss": -30.207494735717773, "global_step": 62635, "epoch": 517} {"train_loss": -34.10732650756836, "global_step": 62636, "epoch": 517} {"train_loss": -34.0257453918457, "global_step": 62637, "epoch": 517} {"train_loss": -32.242149353027344, "global_step": 62638, "epoch": 517} {"train_loss": -33.843502044677734, "global_step": 62639, "epoch": 517} {"train_loss": -35.75393295288086, "global_step": 62640, "epoch": 517} {"train_loss": -33.743709564208984, "global_step": 62641, "epoch": 517} {"train_loss": -34.45390701293945, "global_step": 62642, "epoch": 517} {"train_loss": -34.4890251159668, "global_step": 62643, "epoch": 517} {"train_loss": -35.3226203918457, "global_step": 62644, "epoch": 517} {"train_loss": -34.73215866088867, "global_step": 62645, "epoch": 517} {"train_loss": -34.47700881958008, "global_step": 62646, "epoch": 517} {"train_loss": -35.400794982910156, "global_step": 62647, "epoch": 517} {"train_loss": -35.620262145996094, "global_step": 62648, "epoch": 517} {"train_loss": -35.68358612060547, "global_step": 62649, "epoch": 517} {"train_loss": -35.6484375, "global_step": 62650, "epoch": 517} {"train_loss": -35.608184814453125, "global_step": 62651, "epoch": 517} {"train_loss": -35.7319450378418, "global_step": 62652, "epoch": 517} {"train_loss": -36.165164947509766, "global_step": 62653, "epoch": 517} {"train_loss": -35.6381721496582, "global_step": 62654, "epoch": 517} {"train_loss": -36.182373046875, "global_step": 62655, "epoch": 517} {"train_loss": -35.60479736328125, "global_step": 62656, "epoch": 517} {"train_loss": -35.96959686279297, "global_step": 62657, "epoch": 517} {"train_loss": -35.9158935546875, "global_step": 62658, "epoch": 517} {"train_loss": -36.51816940307617, "global_step": 62659, "epoch": 517} {"train_loss": -36.30472183227539, "global_step": 62660, "epoch": 517} {"train_loss": -36.12705612182617, "global_step": 62661, "epoch": 517} {"train_loss": -36.0001220703125, "global_step": 62662, "epoch": 517} {"train_loss": -36.24469757080078, "global_step": 62663, "epoch": 517} {"train_loss": -36.708431243896484, "global_step": 62664, "epoch": 517} {"train_loss": -36.293941497802734, "global_step": 62665, "epoch": 517} {"train_loss": -36.628170013427734, "global_step": 62666, "epoch": 517} {"train_loss": -36.61631774902344, "global_step": 62667, "epoch": 517} {"train_loss": -36.59457778930664, "global_step": 62668, "epoch": 517} {"train_loss": -36.48188018798828, "global_step": 62669, "epoch": 517} {"train_loss": -36.634674072265625, "global_step": 62670, "epoch": 517} {"train_loss": -36.76467514038086, "global_step": 62671, "epoch": 517} {"train_loss": -36.38752365112305, "global_step": 62672, "epoch": 517} {"train_loss": -36.8121452331543, "global_step": 62673, "epoch": 517} {"train_loss": -36.78825759887695, "global_step": 62674, "epoch": 517} {"train_loss": -36.68951416015625, "global_step": 62675, "epoch": 517} {"train_loss": -36.77022933959961, "global_step": 62676, "epoch": 517} {"train_loss": -34.96170620878866, "global_step": 62677, "epoch": 517, "val_loss": 2568331.0} {"train_loss": -37.01644515991211, "global_step": 62678, "epoch": 518} {"train_loss": -37.03386306762695, "global_step": 62679, "epoch": 518} {"train_loss": -37.20684814453125, "global_step": 62680, "epoch": 518} {"train_loss": -37.305904388427734, "global_step": 62681, "epoch": 518} {"train_loss": -37.38819885253906, "global_step": 62682, "epoch": 518} {"train_loss": -37.14805221557617, "global_step": 62683, "epoch": 518} {"train_loss": -37.334083557128906, "global_step": 62684, "epoch": 518} {"train_loss": -36.91787338256836, "global_step": 62685, "epoch": 518} {"train_loss": -37.5659065246582, "global_step": 62686, "epoch": 518} {"train_loss": -37.16975021362305, "global_step": 62687, "epoch": 518} {"train_loss": -37.410736083984375, "global_step": 62688, "epoch": 518} {"train_loss": -37.7152099609375, "global_step": 62689, "epoch": 518} {"train_loss": -37.25227355957031, "global_step": 62690, "epoch": 518} {"train_loss": -36.83016586303711, "global_step": 62691, "epoch": 518} {"train_loss": -36.99266815185547, "global_step": 62692, "epoch": 518} {"train_loss": -36.54285430908203, "global_step": 62693, "epoch": 518} {"train_loss": -36.65620040893555, "global_step": 62694, "epoch": 518} {"train_loss": -36.49704360961914, "global_step": 62695, "epoch": 518} {"train_loss": -35.244903564453125, "global_step": 62696, "epoch": 518} {"train_loss": -34.62324142456055, "global_step": 62697, "epoch": 518} {"train_loss": -33.165679931640625, "global_step": 62698, "epoch": 518} {"train_loss": -30.063201904296875, "global_step": 62699, "epoch": 518} {"train_loss": -28.875965118408203, "global_step": 62700, "epoch": 518} {"train_loss": -31.859760284423828, "global_step": 62701, "epoch": 518} {"train_loss": -34.89803695678711, "global_step": 62702, "epoch": 518} {"train_loss": -35.098182678222656, "global_step": 62703, "epoch": 518} {"train_loss": -34.82236862182617, "global_step": 62704, "epoch": 518} {"train_loss": -34.49020004272461, "global_step": 62705, "epoch": 518} {"train_loss": -35.18787384033203, "global_step": 62706, "epoch": 518} {"train_loss": -34.382442474365234, "global_step": 62707, "epoch": 518} {"train_loss": -34.72336196899414, "global_step": 62708, "epoch": 518} {"train_loss": -34.727638244628906, "global_step": 62709, "epoch": 518} {"train_loss": -35.924312591552734, "global_step": 62710, "epoch": 518} {"train_loss": -35.29271697998047, "global_step": 62711, "epoch": 518} {"train_loss": -35.69460678100586, "global_step": 62712, "epoch": 518} {"train_loss": -35.57598876953125, "global_step": 62713, "epoch": 518} {"train_loss": -35.184383392333984, "global_step": 62714, "epoch": 518} {"train_loss": -35.84689712524414, "global_step": 62715, "epoch": 518} {"train_loss": -36.25350570678711, "global_step": 62716, "epoch": 518} {"train_loss": -34.72347640991211, "global_step": 62717, "epoch": 518} {"train_loss": -35.96632385253906, "global_step": 62718, "epoch": 518} {"train_loss": -34.89453125, "global_step": 62719, "epoch": 518} {"train_loss": -35.46702194213867, "global_step": 62720, "epoch": 518} {"train_loss": -35.218353271484375, "global_step": 62721, "epoch": 518} {"train_loss": -34.84534454345703, "global_step": 62722, "epoch": 518} {"train_loss": -35.809967041015625, "global_step": 62723, "epoch": 518} {"train_loss": -35.160152435302734, "global_step": 62724, "epoch": 518} {"train_loss": -36.16740036010742, "global_step": 62725, "epoch": 518} {"train_loss": -36.22588348388672, "global_step": 62726, "epoch": 518} {"train_loss": -35.89931106567383, "global_step": 62727, "epoch": 518} {"train_loss": -36.22502517700195, "global_step": 62728, "epoch": 518} {"train_loss": -36.09664535522461, "global_step": 62729, "epoch": 518} {"train_loss": -35.90267562866211, "global_step": 62730, "epoch": 518} {"train_loss": -35.99036407470703, "global_step": 62731, "epoch": 518} {"train_loss": -35.6480827331543, "global_step": 62732, "epoch": 518} {"train_loss": -35.511444091796875, "global_step": 62733, "epoch": 518} {"train_loss": -35.99700927734375, "global_step": 62734, "epoch": 518} {"train_loss": -35.6364860534668, "global_step": 62735, "epoch": 518} {"train_loss": -35.45058822631836, "global_step": 62736, "epoch": 518} {"train_loss": -36.42304611206055, "global_step": 62737, "epoch": 518} {"train_loss": -36.04602813720703, "global_step": 62738, "epoch": 518} {"train_loss": -35.82874298095703, "global_step": 62739, "epoch": 518} {"train_loss": -35.90829086303711, "global_step": 62740, "epoch": 518} {"train_loss": -36.18811798095703, "global_step": 62741, "epoch": 518} {"train_loss": -35.7529296875, "global_step": 62742, "epoch": 518} {"train_loss": -35.54663848876953, "global_step": 62743, "epoch": 518} {"train_loss": -36.451385498046875, "global_step": 62744, "epoch": 518} {"train_loss": -35.54998779296875, "global_step": 62745, "epoch": 518} {"train_loss": -35.2336540222168, "global_step": 62746, "epoch": 518} {"train_loss": -34.10295104980469, "global_step": 62747, "epoch": 518} {"train_loss": -36.207279205322266, "global_step": 62748, "epoch": 518} {"train_loss": -34.33346176147461, "global_step": 62749, "epoch": 518} {"train_loss": -35.176082611083984, "global_step": 62750, "epoch": 518} {"train_loss": -35.24634552001953, "global_step": 62751, "epoch": 518} {"train_loss": -35.33442306518555, "global_step": 62752, "epoch": 518} {"train_loss": -35.23517608642578, "global_step": 62753, "epoch": 518} {"train_loss": -35.7946662902832, "global_step": 62754, "epoch": 518} {"train_loss": -36.562320709228516, "global_step": 62755, "epoch": 518} {"train_loss": -35.87311553955078, "global_step": 62756, "epoch": 518} {"train_loss": -36.05460739135742, "global_step": 62757, "epoch": 518} {"train_loss": -35.86825180053711, "global_step": 62758, "epoch": 518} {"train_loss": -35.61542892456055, "global_step": 62759, "epoch": 518} {"train_loss": -36.6256217956543, "global_step": 62760, "epoch": 518} {"train_loss": -36.485469818115234, "global_step": 62761, "epoch": 518} {"train_loss": -36.21454620361328, "global_step": 62762, "epoch": 518} {"train_loss": -36.504608154296875, "global_step": 62763, "epoch": 518} {"train_loss": -36.649078369140625, "global_step": 62764, "epoch": 518} {"train_loss": -36.37128448486328, "global_step": 62765, "epoch": 518} {"train_loss": -36.44518280029297, "global_step": 62766, "epoch": 518} {"train_loss": -36.43509292602539, "global_step": 62767, "epoch": 518} {"train_loss": -36.424560546875, "global_step": 62768, "epoch": 518} {"train_loss": -36.53071212768555, "global_step": 62769, "epoch": 518} {"train_loss": -36.76214599609375, "global_step": 62770, "epoch": 518} {"train_loss": -36.042564392089844, "global_step": 62771, "epoch": 518} {"train_loss": -36.598724365234375, "global_step": 62772, "epoch": 518} {"train_loss": -36.522274017333984, "global_step": 62773, "epoch": 518} {"train_loss": -37.022151947021484, "global_step": 62774, "epoch": 518} {"train_loss": -36.781166076660156, "global_step": 62775, "epoch": 518} {"train_loss": -36.6725959777832, "global_step": 62776, "epoch": 518} {"train_loss": -36.88241958618164, "global_step": 62777, "epoch": 518} {"train_loss": -35.8813591003418, "global_step": 62778, "epoch": 518} {"train_loss": -36.53317642211914, "global_step": 62779, "epoch": 518} {"train_loss": -36.55571365356445, "global_step": 62780, "epoch": 518} {"train_loss": -35.92483139038086, "global_step": 62781, "epoch": 518} {"train_loss": -36.470252990722656, "global_step": 62782, "epoch": 518} {"train_loss": -36.29330062866211, "global_step": 62783, "epoch": 518} {"train_loss": -36.313812255859375, "global_step": 62784, "epoch": 518} {"train_loss": -37.20490646362305, "global_step": 62785, "epoch": 518} {"train_loss": -36.633522033691406, "global_step": 62786, "epoch": 518} {"train_loss": -35.60305404663086, "global_step": 62787, "epoch": 518} {"train_loss": -36.98709487915039, "global_step": 62788, "epoch": 518} {"train_loss": -36.928260803222656, "global_step": 62789, "epoch": 518} {"train_loss": -36.7541618347168, "global_step": 62790, "epoch": 518} {"train_loss": -36.73298263549805, "global_step": 62791, "epoch": 518} {"train_loss": -36.77109909057617, "global_step": 62792, "epoch": 518} {"train_loss": -36.609107971191406, "global_step": 62793, "epoch": 518} {"train_loss": -36.7194938659668, "global_step": 62794, "epoch": 518} {"train_loss": -36.524471282958984, "global_step": 62795, "epoch": 518} {"train_loss": -36.69496536254883, "global_step": 62796, "epoch": 518} {"train_loss": -36.422950744628906, "global_step": 62797, "epoch": 518} {"train_loss": -35.935605577200896, "global_step": 62798, "epoch": 518, "val_loss": 2521444.0} {"train_loss": -36.72785568237305, "global_step": 62799, "epoch": 519} {"train_loss": -35.31012725830078, "global_step": 62800, "epoch": 519} {"train_loss": -35.07627487182617, "global_step": 62801, "epoch": 519} {"train_loss": -36.77167892456055, "global_step": 62802, "epoch": 519} {"train_loss": -35.53178405761719, "global_step": 62803, "epoch": 519} {"train_loss": -32.16189193725586, "global_step": 62804, "epoch": 519} {"train_loss": -31.447961807250977, "global_step": 62805, "epoch": 519} {"train_loss": -34.70342254638672, "global_step": 62806, "epoch": 519} {"train_loss": -34.41706466674805, "global_step": 62807, "epoch": 519} {"train_loss": -33.929622650146484, "global_step": 62808, "epoch": 519} {"train_loss": -31.415618896484375, "global_step": 62809, "epoch": 519} {"train_loss": -35.8499641418457, "global_step": 62810, "epoch": 519} {"train_loss": -34.17667770385742, "global_step": 62811, "epoch": 519} {"train_loss": -33.94795608520508, "global_step": 62812, "epoch": 519} {"train_loss": -30.70794677734375, "global_step": 62813, "epoch": 519} {"train_loss": -35.620723724365234, "global_step": 62814, "epoch": 519} {"train_loss": -32.6276741027832, "global_step": 62815, "epoch": 519} {"train_loss": -34.73270034790039, "global_step": 62816, "epoch": 519} {"train_loss": -33.900390625, "global_step": 62817, "epoch": 519} {"train_loss": -32.98093795776367, "global_step": 62818, "epoch": 519} {"train_loss": -35.322959899902344, "global_step": 62819, "epoch": 519} {"train_loss": -35.3000602722168, "global_step": 62820, "epoch": 519} {"train_loss": -34.777732849121094, "global_step": 62821, "epoch": 519} {"train_loss": -34.90108871459961, "global_step": 62822, "epoch": 519} {"train_loss": -33.78529739379883, "global_step": 62823, "epoch": 519} {"train_loss": -34.71479415893555, "global_step": 62824, "epoch": 519} {"train_loss": -35.112606048583984, "global_step": 62825, "epoch": 519} {"train_loss": -34.412410736083984, "global_step": 62826, "epoch": 519} {"train_loss": -34.61190414428711, "global_step": 62827, "epoch": 519} {"train_loss": -35.53316116333008, "global_step": 62828, "epoch": 519} {"train_loss": -34.735225677490234, "global_step": 62829, "epoch": 519} {"train_loss": -34.96952438354492, "global_step": 62830, "epoch": 519} {"train_loss": -34.82587814331055, "global_step": 62831, "epoch": 519} {"train_loss": -33.403560638427734, "global_step": 62832, "epoch": 519} {"train_loss": -33.86773681640625, "global_step": 62833, "epoch": 519} {"train_loss": -33.5245475769043, "global_step": 62834, "epoch": 519} {"train_loss": -34.289703369140625, "global_step": 62835, "epoch": 519} {"train_loss": -33.625240325927734, "global_step": 62836, "epoch": 519} {"train_loss": -35.512062072753906, "global_step": 62837, "epoch": 519} {"train_loss": -34.75041580200195, "global_step": 62838, "epoch": 519} {"train_loss": -33.6968879699707, "global_step": 62839, "epoch": 519} {"train_loss": -35.63796615600586, "global_step": 62840, "epoch": 519} {"train_loss": -35.23295211791992, "global_step": 62841, "epoch": 519} {"train_loss": -34.67507553100586, "global_step": 62842, "epoch": 519} {"train_loss": -34.57267761230469, "global_step": 62843, "epoch": 519} {"train_loss": -35.125770568847656, "global_step": 62844, "epoch": 519} {"train_loss": -34.68410110473633, "global_step": 62845, "epoch": 519} {"train_loss": -34.72758865356445, "global_step": 62846, "epoch": 519} {"train_loss": -35.37896728515625, "global_step": 62847, "epoch": 519} {"train_loss": -35.75606155395508, "global_step": 62848, "epoch": 519} {"train_loss": -35.7643928527832, "global_step": 62849, "epoch": 519} {"train_loss": -35.11068344116211, "global_step": 62850, "epoch": 519} {"train_loss": -35.34482955932617, "global_step": 62851, "epoch": 519} {"train_loss": -36.110286712646484, "global_step": 62852, "epoch": 519} {"train_loss": -36.27211380004883, "global_step": 62853, "epoch": 519} {"train_loss": -36.128299713134766, "global_step": 62854, "epoch": 519} {"train_loss": -35.97980880737305, "global_step": 62855, "epoch": 519} {"train_loss": -36.654052734375, "global_step": 62856, "epoch": 519} {"train_loss": -36.449459075927734, "global_step": 62857, "epoch": 519} {"train_loss": -34.82966995239258, "global_step": 62858, "epoch": 519} {"train_loss": -35.80659866333008, "global_step": 62859, "epoch": 519} {"train_loss": -36.469505310058594, "global_step": 62860, "epoch": 519} {"train_loss": -35.987030029296875, "global_step": 62861, "epoch": 519} {"train_loss": -35.52619934082031, "global_step": 62862, "epoch": 519} {"train_loss": -36.04765701293945, "global_step": 62863, "epoch": 519} {"train_loss": -36.378509521484375, "global_step": 62864, "epoch": 519} {"train_loss": -36.078739166259766, "global_step": 62865, "epoch": 519} {"train_loss": -36.39044952392578, "global_step": 62866, "epoch": 519} {"train_loss": -35.47129440307617, "global_step": 62867, "epoch": 519} {"train_loss": -35.65102005004883, "global_step": 62868, "epoch": 519} {"train_loss": -36.5634880065918, "global_step": 62869, "epoch": 519} {"train_loss": -36.13349533081055, "global_step": 62870, "epoch": 519} {"train_loss": -35.693634033203125, "global_step": 62871, "epoch": 519} {"train_loss": -36.405517578125, "global_step": 62872, "epoch": 519} {"train_loss": -35.88535690307617, "global_step": 62873, "epoch": 519} {"train_loss": -35.7235107421875, "global_step": 62874, "epoch": 519} {"train_loss": -35.88542938232422, "global_step": 62875, "epoch": 519} {"train_loss": -36.426483154296875, "global_step": 62876, "epoch": 519} {"train_loss": -36.70912551879883, "global_step": 62877, "epoch": 519} {"train_loss": -36.3228874206543, "global_step": 62878, "epoch": 519} {"train_loss": -34.83808898925781, "global_step": 62879, "epoch": 519} {"train_loss": -36.00580978393555, "global_step": 62880, "epoch": 519} {"train_loss": -35.484214782714844, "global_step": 62881, "epoch": 519} {"train_loss": -35.72585678100586, "global_step": 62882, "epoch": 519} {"train_loss": -35.89547348022461, "global_step": 62883, "epoch": 519} {"train_loss": -35.70863342285156, "global_step": 62884, "epoch": 519} {"train_loss": -36.16917037963867, "global_step": 62885, "epoch": 519} {"train_loss": -34.51136779785156, "global_step": 62886, "epoch": 519} {"train_loss": -36.26475143432617, "global_step": 62887, "epoch": 519} {"train_loss": -35.870845794677734, "global_step": 62888, "epoch": 519} {"train_loss": -36.05329513549805, "global_step": 62889, "epoch": 519} {"train_loss": -36.088809967041016, "global_step": 62890, "epoch": 519} {"train_loss": -35.55411148071289, "global_step": 62891, "epoch": 519} {"train_loss": -36.376895904541016, "global_step": 62892, "epoch": 519} {"train_loss": -36.188087463378906, "global_step": 62893, "epoch": 519} {"train_loss": -36.35036087036133, "global_step": 62894, "epoch": 519} {"train_loss": -35.708736419677734, "global_step": 62895, "epoch": 519} {"train_loss": -36.390098571777344, "global_step": 62896, "epoch": 519} {"train_loss": -36.099205017089844, "global_step": 62897, "epoch": 519} {"train_loss": -36.9354133605957, "global_step": 62898, "epoch": 519} {"train_loss": -36.12565231323242, "global_step": 62899, "epoch": 519} {"train_loss": -36.294677734375, "global_step": 62900, "epoch": 519} {"train_loss": -35.53786849975586, "global_step": 62901, "epoch": 519} {"train_loss": -36.22187042236328, "global_step": 62902, "epoch": 519} {"train_loss": -36.06135177612305, "global_step": 62903, "epoch": 519} {"train_loss": -36.89955520629883, "global_step": 62904, "epoch": 519} {"train_loss": -36.06573486328125, "global_step": 62905, "epoch": 519} {"train_loss": -35.367645263671875, "global_step": 62906, "epoch": 519} {"train_loss": -34.50601577758789, "global_step": 62907, "epoch": 519} {"train_loss": -33.39765548706055, "global_step": 62908, "epoch": 519} {"train_loss": -35.609344482421875, "global_step": 62909, "epoch": 519} {"train_loss": -34.902198791503906, "global_step": 62910, "epoch": 519} {"train_loss": -32.195159912109375, "global_step": 62911, "epoch": 519} {"train_loss": -32.20564651489258, "global_step": 62912, "epoch": 519} {"train_loss": -33.25332260131836, "global_step": 62913, "epoch": 519} {"train_loss": -34.50682830810547, "global_step": 62914, "epoch": 519} {"train_loss": -34.880577087402344, "global_step": 62915, "epoch": 519} {"train_loss": -35.4476318359375, "global_step": 62916, "epoch": 519} {"train_loss": -34.016761779785156, "global_step": 62917, "epoch": 519} {"train_loss": -35.34375, "global_step": 62918, "epoch": 519} {"train_loss": -35.18164997258462, "global_step": 62919, "epoch": 519, "val_loss": 2592406.25} {"train_loss": -36.06269454956055, "global_step": 62920, "epoch": 520} {"train_loss": -36.32094192504883, "global_step": 62921, "epoch": 520} {"train_loss": -35.14726257324219, "global_step": 62922, "epoch": 520} {"train_loss": -35.73606872558594, "global_step": 62923, "epoch": 520} {"train_loss": -36.14255905151367, "global_step": 62924, "epoch": 520} {"train_loss": -36.00818634033203, "global_step": 62925, "epoch": 520} {"train_loss": -36.281246185302734, "global_step": 62926, "epoch": 520} {"train_loss": -36.42524337768555, "global_step": 62927, "epoch": 520} {"train_loss": -35.926753997802734, "global_step": 62928, "epoch": 520} {"train_loss": -36.33441925048828, "global_step": 62929, "epoch": 520} {"train_loss": -36.0692024230957, "global_step": 62930, "epoch": 520} {"train_loss": -36.71687698364258, "global_step": 62931, "epoch": 520} {"train_loss": -36.22310256958008, "global_step": 62932, "epoch": 520} {"train_loss": -36.71400833129883, "global_step": 62933, "epoch": 520} {"train_loss": -35.657081604003906, "global_step": 62934, "epoch": 520} {"train_loss": -36.72663116455078, "global_step": 62935, "epoch": 520} {"train_loss": -36.913726806640625, "global_step": 62936, "epoch": 520} {"train_loss": -36.8756103515625, "global_step": 62937, "epoch": 520} {"train_loss": -36.65525436401367, "global_step": 62938, "epoch": 520} {"train_loss": -35.603763580322266, "global_step": 62939, "epoch": 520} {"train_loss": -36.6069221496582, "global_step": 62940, "epoch": 520} {"train_loss": -36.337928771972656, "global_step": 62941, "epoch": 520} {"train_loss": -36.75068283081055, "global_step": 62942, "epoch": 520} {"train_loss": -36.81206130981445, "global_step": 62943, "epoch": 520} {"train_loss": -35.27912521362305, "global_step": 62944, "epoch": 520} {"train_loss": -36.97013854980469, "global_step": 62945, "epoch": 520} {"train_loss": -36.74446487426758, "global_step": 62946, "epoch": 520} {"train_loss": -36.21261215209961, "global_step": 62947, "epoch": 520} {"train_loss": -36.09767532348633, "global_step": 62948, "epoch": 520} {"train_loss": -37.13866424560547, "global_step": 62949, "epoch": 520} {"train_loss": -36.88882064819336, "global_step": 62950, "epoch": 520} {"train_loss": -36.29581832885742, "global_step": 62951, "epoch": 520} {"train_loss": -37.09831619262695, "global_step": 62952, "epoch": 520} {"train_loss": -35.2859992980957, "global_step": 62953, "epoch": 520} {"train_loss": -36.39155960083008, "global_step": 62954, "epoch": 520} {"train_loss": -36.852108001708984, "global_step": 62955, "epoch": 520} {"train_loss": -36.38505172729492, "global_step": 62956, "epoch": 520} {"train_loss": -36.69586944580078, "global_step": 62957, "epoch": 520} {"train_loss": -36.086082458496094, "global_step": 62958, "epoch": 520} {"train_loss": -35.56484603881836, "global_step": 62959, "epoch": 520} {"train_loss": -36.9489860534668, "global_step": 62960, "epoch": 520} {"train_loss": -36.4584846496582, "global_step": 62961, "epoch": 520} {"train_loss": -37.05332565307617, "global_step": 62962, "epoch": 520} {"train_loss": -36.402076721191406, "global_step": 62963, "epoch": 520} {"train_loss": -36.83203887939453, "global_step": 62964, "epoch": 520} {"train_loss": -32.77413558959961, "global_step": 62965, "epoch": 520} {"train_loss": -36.86600875854492, "global_step": 62966, "epoch": 520} {"train_loss": -36.764163970947266, "global_step": 62967, "epoch": 520} {"train_loss": -36.059078216552734, "global_step": 62968, "epoch": 520} {"train_loss": -35.42507553100586, "global_step": 62969, "epoch": 520} {"train_loss": -36.776546478271484, "global_step": 62970, "epoch": 520} {"train_loss": -36.7740592956543, "global_step": 62971, "epoch": 520} {"train_loss": -35.46226119995117, "global_step": 62972, "epoch": 520} {"train_loss": -35.908050537109375, "global_step": 62973, "epoch": 520} {"train_loss": -36.45542526245117, "global_step": 62974, "epoch": 520} {"train_loss": -36.908538818359375, "global_step": 62975, "epoch": 520} {"train_loss": -36.45542526245117, "global_step": 62976, "epoch": 520} {"train_loss": -37.03384017944336, "global_step": 62977, "epoch": 520} {"train_loss": -36.60425567626953, "global_step": 62978, "epoch": 520} {"train_loss": -34.17075729370117, "global_step": 62979, "epoch": 520} {"train_loss": -36.17515182495117, "global_step": 62980, "epoch": 520} {"train_loss": -36.26449966430664, "global_step": 62981, "epoch": 520} {"train_loss": -36.66842269897461, "global_step": 62982, "epoch": 520} {"train_loss": -34.68833541870117, "global_step": 62983, "epoch": 520} {"train_loss": -36.04850769042969, "global_step": 62984, "epoch": 520} {"train_loss": -35.647674560546875, "global_step": 62985, "epoch": 520} {"train_loss": -34.88010787963867, "global_step": 62986, "epoch": 520} {"train_loss": -32.49011993408203, "global_step": 62987, "epoch": 520} {"train_loss": -33.65462112426758, "global_step": 62988, "epoch": 520} {"train_loss": -35.944313049316406, "global_step": 62989, "epoch": 520} {"train_loss": -34.49703598022461, "global_step": 62990, "epoch": 520} {"train_loss": -33.42422103881836, "global_step": 62991, "epoch": 520} {"train_loss": -35.33966827392578, "global_step": 62992, "epoch": 520} {"train_loss": -34.5434455871582, "global_step": 62993, "epoch": 520} {"train_loss": -34.64628219604492, "global_step": 62994, "epoch": 520} {"train_loss": -35.191986083984375, "global_step": 62995, "epoch": 520} {"train_loss": -34.177677154541016, "global_step": 62996, "epoch": 520} {"train_loss": -32.12885284423828, "global_step": 62997, "epoch": 520} {"train_loss": -35.05118942260742, "global_step": 62998, "epoch": 520} {"train_loss": -35.4461669921875, "global_step": 62999, "epoch": 520} {"train_loss": -34.36305618286133, "global_step": 63000, "epoch": 520} {"train_loss": -34.57304763793945, "global_step": 63001, "epoch": 520} {"train_loss": -30.7301082611084, "global_step": 63002, "epoch": 520} {"train_loss": -35.85157012939453, "global_step": 63003, "epoch": 520} {"train_loss": -33.902496337890625, "global_step": 63004, "epoch": 520} {"train_loss": -34.88007736206055, "global_step": 63005, "epoch": 520} {"train_loss": -33.46391296386719, "global_step": 63006, "epoch": 520} {"train_loss": -32.573299407958984, "global_step": 63007, "epoch": 520} {"train_loss": -35.49269104003906, "global_step": 63008, "epoch": 520} {"train_loss": -33.45954513549805, "global_step": 63009, "epoch": 520} {"train_loss": -33.96543884277344, "global_step": 63010, "epoch": 520} {"train_loss": -34.61265182495117, "global_step": 63011, "epoch": 520} {"train_loss": -33.42347717285156, "global_step": 63012, "epoch": 520} {"train_loss": -34.497440338134766, "global_step": 63013, "epoch": 520} {"train_loss": -33.87482452392578, "global_step": 63014, "epoch": 520} {"train_loss": -33.53403091430664, "global_step": 63015, "epoch": 520} {"train_loss": -34.90109634399414, "global_step": 63016, "epoch": 520} {"train_loss": -35.28260040283203, "global_step": 63017, "epoch": 520} {"train_loss": -34.526119232177734, "global_step": 63018, "epoch": 520} {"train_loss": -34.82966995239258, "global_step": 63019, "epoch": 520} {"train_loss": -35.241790771484375, "global_step": 63020, "epoch": 520} {"train_loss": -35.328948974609375, "global_step": 63021, "epoch": 520} {"train_loss": -35.463863372802734, "global_step": 63022, "epoch": 520} {"train_loss": -35.81911087036133, "global_step": 63023, "epoch": 520} {"train_loss": -36.026912689208984, "global_step": 63024, "epoch": 520} {"train_loss": -35.15998458862305, "global_step": 63025, "epoch": 520} {"train_loss": -35.68792724609375, "global_step": 63026, "epoch": 520} {"train_loss": -35.6966667175293, "global_step": 63027, "epoch": 520} {"train_loss": -35.254024505615234, "global_step": 63028, "epoch": 520} {"train_loss": -35.56496810913086, "global_step": 63029, "epoch": 520} {"train_loss": -35.83698272705078, "global_step": 63030, "epoch": 520} {"train_loss": -35.575984954833984, "global_step": 63031, "epoch": 520} {"train_loss": -35.69525909423828, "global_step": 63032, "epoch": 520} {"train_loss": -35.68035888671875, "global_step": 63033, "epoch": 520} {"train_loss": -36.2835693359375, "global_step": 63034, "epoch": 520} {"train_loss": -36.21803665161133, "global_step": 63035, "epoch": 520} {"train_loss": -36.16707229614258, "global_step": 63036, "epoch": 520} {"train_loss": -36.50975799560547, "global_step": 63037, "epoch": 520} {"train_loss": -36.035762786865234, "global_step": 63038, "epoch": 520} {"train_loss": -36.07207107543945, "global_step": 63039, "epoch": 520} {"train_loss": -35.609978998988126, "global_step": 63040, "epoch": 520, "val_loss": 2623311.25} {"train_loss": -37.097877502441406, "global_step": 63041, "epoch": 521} {"train_loss": -36.338008880615234, "global_step": 63042, "epoch": 521} {"train_loss": -36.07672882080078, "global_step": 63043, "epoch": 521} {"train_loss": -36.114986419677734, "global_step": 63044, "epoch": 521} {"train_loss": -37.103267669677734, "global_step": 63045, "epoch": 521} {"train_loss": -36.440608978271484, "global_step": 63046, "epoch": 521} {"train_loss": -35.52862548828125, "global_step": 63047, "epoch": 521} {"train_loss": -36.7549934387207, "global_step": 63048, "epoch": 521} {"train_loss": -36.6888427734375, "global_step": 63049, "epoch": 521} {"train_loss": -36.47620391845703, "global_step": 63050, "epoch": 521} {"train_loss": -36.49665451049805, "global_step": 63051, "epoch": 521} {"train_loss": -36.69426345825195, "global_step": 63052, "epoch": 521} {"train_loss": -36.95457077026367, "global_step": 63053, "epoch": 521} {"train_loss": -37.24386215209961, "global_step": 63054, "epoch": 521} {"train_loss": -35.85161590576172, "global_step": 63055, "epoch": 521} {"train_loss": -35.518436431884766, "global_step": 63056, "epoch": 521} {"train_loss": -34.718746185302734, "global_step": 63057, "epoch": 521} {"train_loss": -34.558101654052734, "global_step": 63058, "epoch": 521} {"train_loss": -34.48786544799805, "global_step": 63059, "epoch": 521} {"train_loss": -33.74402618408203, "global_step": 63060, "epoch": 521} {"train_loss": -32.99048614501953, "global_step": 63061, "epoch": 521} {"train_loss": -34.415740966796875, "global_step": 63062, "epoch": 521} {"train_loss": -35.16419219970703, "global_step": 63063, "epoch": 521} {"train_loss": -36.32053756713867, "global_step": 63064, "epoch": 521} {"train_loss": -36.230628967285156, "global_step": 63065, "epoch": 521} {"train_loss": -35.20655059814453, "global_step": 63066, "epoch": 521} {"train_loss": -36.86851119995117, "global_step": 63067, "epoch": 521} {"train_loss": -35.75181579589844, "global_step": 63068, "epoch": 521} {"train_loss": -35.34798049926758, "global_step": 63069, "epoch": 521} {"train_loss": -36.16562271118164, "global_step": 63070, "epoch": 521} {"train_loss": -37.00045394897461, "global_step": 63071, "epoch": 521} {"train_loss": -36.722164154052734, "global_step": 63072, "epoch": 521} {"train_loss": -36.972469329833984, "global_step": 63073, "epoch": 521} {"train_loss": -36.85077667236328, "global_step": 63074, "epoch": 521} {"train_loss": -36.95484161376953, "global_step": 63075, "epoch": 521} {"train_loss": -36.737979888916016, "global_step": 63076, "epoch": 521} {"train_loss": -36.11417770385742, "global_step": 63077, "epoch": 521} {"train_loss": -36.744075775146484, "global_step": 63078, "epoch": 521} {"train_loss": -36.64725112915039, "global_step": 63079, "epoch": 521} {"train_loss": -35.980892181396484, "global_step": 63080, "epoch": 521} {"train_loss": -37.2296142578125, "global_step": 63081, "epoch": 521} {"train_loss": -36.999794006347656, "global_step": 63082, "epoch": 521} {"train_loss": -35.98591232299805, "global_step": 63083, "epoch": 521} {"train_loss": -37.181793212890625, "global_step": 63084, "epoch": 521} {"train_loss": -36.8325309753418, "global_step": 63085, "epoch": 521} {"train_loss": -37.478511810302734, "global_step": 63086, "epoch": 521} {"train_loss": -36.862998962402344, "global_step": 63087, "epoch": 521} {"train_loss": -37.04478454589844, "global_step": 63088, "epoch": 521} {"train_loss": -36.675411224365234, "global_step": 63089, "epoch": 521} {"train_loss": -37.38509750366211, "global_step": 63090, "epoch": 521} {"train_loss": -35.483211517333984, "global_step": 63091, "epoch": 521} {"train_loss": -36.985382080078125, "global_step": 63092, "epoch": 521} {"train_loss": -36.40522766113281, "global_step": 63093, "epoch": 521} {"train_loss": -36.51163864135742, "global_step": 63094, "epoch": 521} {"train_loss": -35.90699005126953, "global_step": 63095, "epoch": 521} {"train_loss": -37.15340805053711, "global_step": 63096, "epoch": 521} {"train_loss": -36.67867660522461, "global_step": 63097, "epoch": 521} {"train_loss": -34.029884338378906, "global_step": 63098, "epoch": 521} {"train_loss": -32.50168228149414, "global_step": 63099, "epoch": 521} {"train_loss": -31.269855499267578, "global_step": 63100, "epoch": 521} {"train_loss": -34.19160079956055, "global_step": 63101, "epoch": 521} {"train_loss": -35.8225212097168, "global_step": 63102, "epoch": 521} {"train_loss": -31.622419357299805, "global_step": 63103, "epoch": 521} {"train_loss": -36.287872314453125, "global_step": 63104, "epoch": 521} {"train_loss": -36.18605422973633, "global_step": 63105, "epoch": 521} {"train_loss": -34.79233932495117, "global_step": 63106, "epoch": 521} {"train_loss": -34.66530990600586, "global_step": 63107, "epoch": 521} {"train_loss": -33.01118087768555, "global_step": 63108, "epoch": 521} {"train_loss": -35.59342575073242, "global_step": 63109, "epoch": 521} {"train_loss": -29.754308700561523, "global_step": 63110, "epoch": 521} {"train_loss": -33.98594284057617, "global_step": 63111, "epoch": 521} {"train_loss": -32.168548583984375, "global_step": 63112, "epoch": 521} {"train_loss": -33.47578811645508, "global_step": 63113, "epoch": 521} {"train_loss": -34.240020751953125, "global_step": 63114, "epoch": 521} {"train_loss": -35.04044723510742, "global_step": 63115, "epoch": 521} {"train_loss": -34.04340362548828, "global_step": 63116, "epoch": 521} {"train_loss": -34.60280227661133, "global_step": 63117, "epoch": 521} {"train_loss": -33.972007751464844, "global_step": 63118, "epoch": 521} {"train_loss": -34.084529876708984, "global_step": 63119, "epoch": 521} {"train_loss": -34.33938217163086, "global_step": 63120, "epoch": 521} {"train_loss": -34.71047592163086, "global_step": 63121, "epoch": 521} {"train_loss": -33.4941291809082, "global_step": 63122, "epoch": 521} {"train_loss": -33.77952194213867, "global_step": 63123, "epoch": 521} {"train_loss": -34.073936462402344, "global_step": 63124, "epoch": 521} {"train_loss": -34.352535247802734, "global_step": 63125, "epoch": 521} {"train_loss": -35.34908676147461, "global_step": 63126, "epoch": 521} {"train_loss": -35.23223114013672, "global_step": 63127, "epoch": 521} {"train_loss": -34.96378707885742, "global_step": 63128, "epoch": 521} {"train_loss": -35.005950927734375, "global_step": 63129, "epoch": 521} {"train_loss": -34.17264175415039, "global_step": 63130, "epoch": 521} {"train_loss": -35.20369338989258, "global_step": 63131, "epoch": 521} {"train_loss": -33.95870590209961, "global_step": 63132, "epoch": 521} {"train_loss": -35.976985931396484, "global_step": 63133, "epoch": 521} {"train_loss": -35.22306823730469, "global_step": 63134, "epoch": 521} {"train_loss": -34.776451110839844, "global_step": 63135, "epoch": 521} {"train_loss": -33.44789123535156, "global_step": 63136, "epoch": 521} {"train_loss": -35.03147506713867, "global_step": 63137, "epoch": 521} {"train_loss": -35.08217239379883, "global_step": 63138, "epoch": 521} {"train_loss": -35.241981506347656, "global_step": 63139, "epoch": 521} {"train_loss": -35.70430374145508, "global_step": 63140, "epoch": 521} {"train_loss": -35.359500885009766, "global_step": 63141, "epoch": 521} {"train_loss": -35.63505554199219, "global_step": 63142, "epoch": 521} {"train_loss": -35.12728500366211, "global_step": 63143, "epoch": 521} {"train_loss": -35.49494552612305, "global_step": 63144, "epoch": 521} {"train_loss": -35.526859283447266, "global_step": 63145, "epoch": 521} {"train_loss": -35.805171966552734, "global_step": 63146, "epoch": 521} {"train_loss": -36.57954788208008, "global_step": 63147, "epoch": 521} {"train_loss": -35.890926361083984, "global_step": 63148, "epoch": 521} {"train_loss": -35.591434478759766, "global_step": 63149, "epoch": 521} {"train_loss": -36.01200485229492, "global_step": 63150, "epoch": 521} {"train_loss": -36.33887481689453, "global_step": 63151, "epoch": 521} {"train_loss": -35.4169921875, "global_step": 63152, "epoch": 521} {"train_loss": -36.46087646484375, "global_step": 63153, "epoch": 521} {"train_loss": -36.82429122924805, "global_step": 63154, "epoch": 521} {"train_loss": -36.37508773803711, "global_step": 63155, "epoch": 521} {"train_loss": -36.53281784057617, "global_step": 63156, "epoch": 521} {"train_loss": -36.591793060302734, "global_step": 63157, "epoch": 521} {"train_loss": -36.984737396240234, "global_step": 63158, "epoch": 521} {"train_loss": -35.62864303588867, "global_step": 63159, "epoch": 521} {"train_loss": -35.42421340942383, "global_step": 63160, "epoch": 521} {"train_loss": -35.51938077437976, "global_step": 63161, "epoch": 521, "val_loss": 2649079.25} {"train_loss": -36.5911979675293, "global_step": 63162, "epoch": 522} {"train_loss": -37.06787109375, "global_step": 63163, "epoch": 522} {"train_loss": -36.550254821777344, "global_step": 63164, "epoch": 522} {"train_loss": -36.87001419067383, "global_step": 63165, "epoch": 522} {"train_loss": -36.51585006713867, "global_step": 63166, "epoch": 522} {"train_loss": -36.7261962890625, "global_step": 63167, "epoch": 522} {"train_loss": -36.97710418701172, "global_step": 63168, "epoch": 522} {"train_loss": -36.94792556762695, "global_step": 63169, "epoch": 522} {"train_loss": -36.70659255981445, "global_step": 63170, "epoch": 522} {"train_loss": -36.94196319580078, "global_step": 63171, "epoch": 522} {"train_loss": -36.73966598510742, "global_step": 63172, "epoch": 522} {"train_loss": -37.19009017944336, "global_step": 63173, "epoch": 522} {"train_loss": -36.4553337097168, "global_step": 63174, "epoch": 522} {"train_loss": -36.64445877075195, "global_step": 63175, "epoch": 522} {"train_loss": -36.871944427490234, "global_step": 63176, "epoch": 522} {"train_loss": -37.45362091064453, "global_step": 63177, "epoch": 522} {"train_loss": -36.84511184692383, "global_step": 63178, "epoch": 522} {"train_loss": -37.26433181762695, "global_step": 63179, "epoch": 522} {"train_loss": -36.96076583862305, "global_step": 63180, "epoch": 522} {"train_loss": -35.879676818847656, "global_step": 63181, "epoch": 522} {"train_loss": -32.71196365356445, "global_step": 63182, "epoch": 522} {"train_loss": -23.276531219482422, "global_step": 63183, "epoch": 522} {"train_loss": -16.21028709411621, "global_step": 63184, "epoch": 522} {"train_loss": 1.4471100568771362, "global_step": 63185, "epoch": 522} {"train_loss": 3.5090794563293457, "global_step": 63186, "epoch": 522} {"train_loss": -32.34049606323242, "global_step": 63187, "epoch": 522} {"train_loss": -16.158309936523438, "global_step": 63188, "epoch": 522} {"train_loss": -28.211130142211914, "global_step": 63189, "epoch": 522} {"train_loss": -27.248682022094727, "global_step": 63190, "epoch": 522} {"train_loss": -19.32779312133789, "global_step": 63191, "epoch": 522} {"train_loss": -34.770118713378906, "global_step": 63192, "epoch": 522} {"train_loss": -28.55482292175293, "global_step": 63193, "epoch": 522} {"train_loss": -27.242115020751953, "global_step": 63194, "epoch": 522} {"train_loss": -32.65256881713867, "global_step": 63195, "epoch": 522} {"train_loss": -32.10055160522461, "global_step": 63196, "epoch": 522} {"train_loss": -31.570295333862305, "global_step": 63197, "epoch": 522} {"train_loss": -31.209211349487305, "global_step": 63198, "epoch": 522} {"train_loss": -31.85420036315918, "global_step": 63199, "epoch": 522} {"train_loss": -32.95759201049805, "global_step": 63200, "epoch": 522} {"train_loss": -34.4233283996582, "global_step": 63201, "epoch": 522} {"train_loss": -34.09999084472656, "global_step": 63202, "epoch": 522} {"train_loss": -32.96326446533203, "global_step": 63203, "epoch": 522} {"train_loss": -33.47422409057617, "global_step": 63204, "epoch": 522} {"train_loss": -34.557430267333984, "global_step": 63205, "epoch": 522} {"train_loss": -34.37982177734375, "global_step": 63206, "epoch": 522} {"train_loss": -35.0271110534668, "global_step": 63207, "epoch": 522} {"train_loss": -35.0203971862793, "global_step": 63208, "epoch": 522} {"train_loss": -34.3481330871582, "global_step": 63209, "epoch": 522} {"train_loss": -34.60695266723633, "global_step": 63210, "epoch": 522} {"train_loss": -34.78474044799805, "global_step": 63211, "epoch": 522} {"train_loss": -35.25986862182617, "global_step": 63212, "epoch": 522} {"train_loss": -35.30773162841797, "global_step": 63213, "epoch": 522} {"train_loss": -34.53315353393555, "global_step": 63214, "epoch": 522} {"train_loss": -34.70758056640625, "global_step": 63215, "epoch": 522} {"train_loss": -34.848106384277344, "global_step": 63216, "epoch": 522} {"train_loss": -35.338592529296875, "global_step": 63217, "epoch": 522} {"train_loss": -35.4221305847168, "global_step": 63218, "epoch": 522} {"train_loss": -35.23787307739258, "global_step": 63219, "epoch": 522} {"train_loss": -35.47237014770508, "global_step": 63220, "epoch": 522} {"train_loss": -35.394439697265625, "global_step": 63221, "epoch": 522} {"train_loss": -35.360591888427734, "global_step": 63222, "epoch": 522} {"train_loss": -35.091426849365234, "global_step": 63223, "epoch": 522} {"train_loss": -35.32513427734375, "global_step": 63224, "epoch": 522} {"train_loss": -35.48257064819336, "global_step": 63225, "epoch": 522} {"train_loss": -35.6218376159668, "global_step": 63226, "epoch": 522} {"train_loss": -35.42560958862305, "global_step": 63227, "epoch": 522} {"train_loss": -35.63188552856445, "global_step": 63228, "epoch": 522} {"train_loss": -35.597530364990234, "global_step": 63229, "epoch": 522} {"train_loss": -35.32456588745117, "global_step": 63230, "epoch": 522} {"train_loss": -35.929325103759766, "global_step": 63231, "epoch": 522} {"train_loss": -35.77395248413086, "global_step": 63232, "epoch": 522} {"train_loss": -35.91238784790039, "global_step": 63233, "epoch": 522} {"train_loss": -36.16652297973633, "global_step": 63234, "epoch": 522} {"train_loss": -36.43131637573242, "global_step": 63235, "epoch": 522} {"train_loss": -36.043060302734375, "global_step": 63236, "epoch": 522} {"train_loss": -36.004249572753906, "global_step": 63237, "epoch": 522} {"train_loss": -35.61298751831055, "global_step": 63238, "epoch": 522} {"train_loss": -36.46637725830078, "global_step": 63239, "epoch": 522} {"train_loss": -36.3603515625, "global_step": 63240, "epoch": 522} {"train_loss": -36.36701965332031, "global_step": 63241, "epoch": 522} {"train_loss": -36.516258239746094, "global_step": 63242, "epoch": 522} {"train_loss": -36.213409423828125, "global_step": 63243, "epoch": 522} {"train_loss": -36.17695236206055, "global_step": 63244, "epoch": 522} {"train_loss": -36.5192756652832, "global_step": 63245, "epoch": 522} {"train_loss": -35.86841583251953, "global_step": 63246, "epoch": 522} {"train_loss": -36.21390151977539, "global_step": 63247, "epoch": 522} {"train_loss": -36.27021026611328, "global_step": 63248, "epoch": 522} {"train_loss": -32.901302337646484, "global_step": 63249, "epoch": 522} {"train_loss": -35.972999572753906, "global_step": 63250, "epoch": 522} {"train_loss": -36.53413391113281, "global_step": 63251, "epoch": 522} {"train_loss": -36.512603759765625, "global_step": 63252, "epoch": 522} {"train_loss": -36.37329864501953, "global_step": 63253, "epoch": 522} {"train_loss": -36.64714050292969, "global_step": 63254, "epoch": 522} {"train_loss": -35.52993392944336, "global_step": 63255, "epoch": 522} {"train_loss": -35.56368637084961, "global_step": 63256, "epoch": 522} {"train_loss": -35.549068450927734, "global_step": 63257, "epoch": 522} {"train_loss": -34.9375114440918, "global_step": 63258, "epoch": 522} {"train_loss": -34.843929290771484, "global_step": 63259, "epoch": 522} {"train_loss": -35.36469650268555, "global_step": 63260, "epoch": 522} {"train_loss": -35.75216293334961, "global_step": 63261, "epoch": 522} {"train_loss": -35.238792419433594, "global_step": 63262, "epoch": 522} {"train_loss": -35.443359375, "global_step": 63263, "epoch": 522} {"train_loss": -35.82450485229492, "global_step": 63264, "epoch": 522} {"train_loss": -34.05878448486328, "global_step": 63265, "epoch": 522} {"train_loss": -35.8044548034668, "global_step": 63266, "epoch": 522} {"train_loss": -35.76992416381836, "global_step": 63267, "epoch": 522} {"train_loss": -35.462677001953125, "global_step": 63268, "epoch": 522} {"train_loss": -35.448150634765625, "global_step": 63269, "epoch": 522} {"train_loss": -35.163631439208984, "global_step": 63270, "epoch": 522} {"train_loss": -36.34902572631836, "global_step": 63271, "epoch": 522} {"train_loss": -35.574432373046875, "global_step": 63272, "epoch": 522} {"train_loss": -33.484397888183594, "global_step": 63273, "epoch": 522} {"train_loss": -35.76716995239258, "global_step": 63274, "epoch": 522} {"train_loss": -36.18391799926758, "global_step": 63275, "epoch": 522} {"train_loss": -36.09884262084961, "global_step": 63276, "epoch": 522} {"train_loss": -35.92512893676758, "global_step": 63277, "epoch": 522} {"train_loss": -33.55042266845703, "global_step": 63278, "epoch": 522} {"train_loss": -31.484888076782227, "global_step": 63279, "epoch": 522} {"train_loss": -34.02912521362305, "global_step": 63280, "epoch": 522} {"train_loss": -33.613670349121094, "global_step": 63281, "epoch": 522} {"train_loss": -33.903553770593376, "global_step": 63282, "epoch": 522, "val_loss": 2630694.25} {"train_loss": -29.375579833984375, "global_step": 63283, "epoch": 523} {"train_loss": -32.069183349609375, "global_step": 63284, "epoch": 523} {"train_loss": -25.6898250579834, "global_step": 63285, "epoch": 523} {"train_loss": -20.852380752563477, "global_step": 63286, "epoch": 523} {"train_loss": -26.371200561523438, "global_step": 63287, "epoch": 523} {"train_loss": -21.03338050842285, "global_step": 63288, "epoch": 523} {"train_loss": -31.374298095703125, "global_step": 63289, "epoch": 523} {"train_loss": -26.545978546142578, "global_step": 63290, "epoch": 523} {"train_loss": -25.658802032470703, "global_step": 63291, "epoch": 523} {"train_loss": -30.441238403320312, "global_step": 63292, "epoch": 523} {"train_loss": -28.595050811767578, "global_step": 63293, "epoch": 523} {"train_loss": -31.2119140625, "global_step": 63294, "epoch": 523} {"train_loss": -32.634246826171875, "global_step": 63295, "epoch": 523} {"train_loss": -29.082853317260742, "global_step": 63296, "epoch": 523} {"train_loss": -32.11173629760742, "global_step": 63297, "epoch": 523} {"train_loss": -33.54937744140625, "global_step": 63298, "epoch": 523} {"train_loss": -32.861061096191406, "global_step": 63299, "epoch": 523} {"train_loss": -32.84519577026367, "global_step": 63300, "epoch": 523} {"train_loss": -32.3128547668457, "global_step": 63301, "epoch": 523} {"train_loss": -33.47996139526367, "global_step": 63302, "epoch": 523} {"train_loss": -32.30904769897461, "global_step": 63303, "epoch": 523} {"train_loss": -33.6082878112793, "global_step": 63304, "epoch": 523} {"train_loss": -33.111385345458984, "global_step": 63305, "epoch": 523} {"train_loss": -33.23399353027344, "global_step": 63306, "epoch": 523} {"train_loss": -33.26605224609375, "global_step": 63307, "epoch": 523} {"train_loss": -33.33649826049805, "global_step": 63308, "epoch": 523} {"train_loss": -34.00827407836914, "global_step": 63309, "epoch": 523} {"train_loss": -33.524169921875, "global_step": 63310, "epoch": 523} {"train_loss": -33.01583480834961, "global_step": 63311, "epoch": 523} {"train_loss": -33.72703170776367, "global_step": 63312, "epoch": 523} {"train_loss": -33.512264251708984, "global_step": 63313, "epoch": 523} {"train_loss": -34.242427825927734, "global_step": 63314, "epoch": 523} {"train_loss": -34.27968978881836, "global_step": 63315, "epoch": 523} {"train_loss": -34.251094818115234, "global_step": 63316, "epoch": 523} {"train_loss": -34.208370208740234, "global_step": 63317, "epoch": 523} {"train_loss": -34.43072509765625, "global_step": 63318, "epoch": 523} {"train_loss": -34.30294418334961, "global_step": 63319, "epoch": 523} {"train_loss": -34.934383392333984, "global_step": 63320, "epoch": 523} {"train_loss": -34.822078704833984, "global_step": 63321, "epoch": 523} {"train_loss": -34.7719612121582, "global_step": 63322, "epoch": 523} {"train_loss": -34.29873275756836, "global_step": 63323, "epoch": 523} {"train_loss": -34.87181091308594, "global_step": 63324, "epoch": 523} {"train_loss": -34.51018142700195, "global_step": 63325, "epoch": 523} {"train_loss": -34.85624313354492, "global_step": 63326, "epoch": 523} {"train_loss": -34.72260284423828, "global_step": 63327, "epoch": 523} {"train_loss": -34.4326286315918, "global_step": 63328, "epoch": 523} {"train_loss": -34.811458587646484, "global_step": 63329, "epoch": 523} {"train_loss": -34.92841720581055, "global_step": 63330, "epoch": 523} {"train_loss": -34.62440872192383, "global_step": 63331, "epoch": 523} {"train_loss": -35.194644927978516, "global_step": 63332, "epoch": 523} {"train_loss": -35.19301986694336, "global_step": 63333, "epoch": 523} {"train_loss": -35.16722869873047, "global_step": 63334, "epoch": 523} {"train_loss": -35.562965393066406, "global_step": 63335, "epoch": 523} {"train_loss": -35.10600280761719, "global_step": 63336, "epoch": 523} {"train_loss": -35.1407585144043, "global_step": 63337, "epoch": 523} {"train_loss": -35.30233383178711, "global_step": 63338, "epoch": 523} {"train_loss": -35.779754638671875, "global_step": 63339, "epoch": 523} {"train_loss": -35.50125503540039, "global_step": 63340, "epoch": 523} {"train_loss": -35.23269271850586, "global_step": 63341, "epoch": 523} {"train_loss": -35.281856536865234, "global_step": 63342, "epoch": 523} {"train_loss": -35.150238037109375, "global_step": 63343, "epoch": 523} {"train_loss": -35.77912521362305, "global_step": 63344, "epoch": 523} {"train_loss": -35.56543731689453, "global_step": 63345, "epoch": 523} {"train_loss": -35.930389404296875, "global_step": 63346, "epoch": 523} {"train_loss": -35.97322463989258, "global_step": 63347, "epoch": 523} {"train_loss": -35.64967346191406, "global_step": 63348, "epoch": 523} {"train_loss": -35.98679733276367, "global_step": 63349, "epoch": 523} {"train_loss": -35.79828643798828, "global_step": 63350, "epoch": 523} {"train_loss": -35.76746368408203, "global_step": 63351, "epoch": 523} {"train_loss": -36.1182975769043, "global_step": 63352, "epoch": 523} {"train_loss": -36.10196304321289, "global_step": 63353, "epoch": 523} {"train_loss": -35.777870178222656, "global_step": 63354, "epoch": 523} {"train_loss": -36.50732421875, "global_step": 63355, "epoch": 523} {"train_loss": -36.13161849975586, "global_step": 63356, "epoch": 523} {"train_loss": -36.16074752807617, "global_step": 63357, "epoch": 523} {"train_loss": -36.32607650756836, "global_step": 63358, "epoch": 523} {"train_loss": -36.03644561767578, "global_step": 63359, "epoch": 523} {"train_loss": -36.2184944152832, "global_step": 63360, "epoch": 523} {"train_loss": -36.483455657958984, "global_step": 63361, "epoch": 523} {"train_loss": -36.407833099365234, "global_step": 63362, "epoch": 523} {"train_loss": -36.19489669799805, "global_step": 63363, "epoch": 523} {"train_loss": -36.23200607299805, "global_step": 63364, "epoch": 523} {"train_loss": -36.26224899291992, "global_step": 63365, "epoch": 523} {"train_loss": -36.66286849975586, "global_step": 63366, "epoch": 523} {"train_loss": -36.3691520690918, "global_step": 63367, "epoch": 523} {"train_loss": -36.188419342041016, "global_step": 63368, "epoch": 523} {"train_loss": -36.64118194580078, "global_step": 63369, "epoch": 523} {"train_loss": -36.88116455078125, "global_step": 63370, "epoch": 523} {"train_loss": -36.46503829956055, "global_step": 63371, "epoch": 523} {"train_loss": -36.03589630126953, "global_step": 63372, "epoch": 523} {"train_loss": -36.18536376953125, "global_step": 63373, "epoch": 523} {"train_loss": -36.14744186401367, "global_step": 63374, "epoch": 523} {"train_loss": -35.78915023803711, "global_step": 63375, "epoch": 523} {"train_loss": -35.86100387573242, "global_step": 63376, "epoch": 523} {"train_loss": -35.07414627075195, "global_step": 63377, "epoch": 523} {"train_loss": -32.4755859375, "global_step": 63378, "epoch": 523} {"train_loss": -23.5414981842041, "global_step": 63379, "epoch": 523} {"train_loss": -4.084466457366943, "global_step": 63380, "epoch": 523} {"train_loss": -1.5053505897521973, "global_step": 63381, "epoch": 523} {"train_loss": -30.54570960998535, "global_step": 63382, "epoch": 523} {"train_loss": -22.12503433227539, "global_step": 63383, "epoch": 523} {"train_loss": -18.452123641967773, "global_step": 63384, "epoch": 523} {"train_loss": -31.71186637878418, "global_step": 63385, "epoch": 523} {"train_loss": -27.824420928955078, "global_step": 63386, "epoch": 523} {"train_loss": -30.38663673400879, "global_step": 63387, "epoch": 523} {"train_loss": -31.88226890563965, "global_step": 63388, "epoch": 523} {"train_loss": -31.776142120361328, "global_step": 63389, "epoch": 523} {"train_loss": -32.33354568481445, "global_step": 63390, "epoch": 523} {"train_loss": -34.36705017089844, "global_step": 63391, "epoch": 523} {"train_loss": -32.248291015625, "global_step": 63392, "epoch": 523} {"train_loss": -33.700992584228516, "global_step": 63393, "epoch": 523} {"train_loss": -34.93793487548828, "global_step": 63394, "epoch": 523} {"train_loss": -33.262413024902344, "global_step": 63395, "epoch": 523} {"train_loss": -33.64777374267578, "global_step": 63396, "epoch": 523} {"train_loss": -34.009647369384766, "global_step": 63397, "epoch": 523} {"train_loss": -34.330787658691406, "global_step": 63398, "epoch": 523} {"train_loss": -34.33973693847656, "global_step": 63399, "epoch": 523} {"train_loss": -34.1667594909668, "global_step": 63400, "epoch": 523} {"train_loss": -34.36383819580078, "global_step": 63401, "epoch": 523} {"train_loss": -34.75749588012695, "global_step": 63402, "epoch": 523} {"train_loss": -32.968610810839444, "global_step": 63403, "epoch": 523, "val_loss": 2605732.25} {"train_loss": -34.90043258666992, "global_step": 63404, "epoch": 524} {"train_loss": -34.75181198120117, "global_step": 63405, "epoch": 524} {"train_loss": -34.77579116821289, "global_step": 63406, "epoch": 524} {"train_loss": -34.75675582885742, "global_step": 63407, "epoch": 524} {"train_loss": -34.40623092651367, "global_step": 63408, "epoch": 524} {"train_loss": -35.03963088989258, "global_step": 63409, "epoch": 524} {"train_loss": -35.004356384277344, "global_step": 63410, "epoch": 524} {"train_loss": -35.2938117980957, "global_step": 63411, "epoch": 524} {"train_loss": -35.27558135986328, "global_step": 63412, "epoch": 524} {"train_loss": -35.335323333740234, "global_step": 63413, "epoch": 524} {"train_loss": -35.60634994506836, "global_step": 63414, "epoch": 524} {"train_loss": -35.45200729370117, "global_step": 63415, "epoch": 524} {"train_loss": -35.58320999145508, "global_step": 63416, "epoch": 524} {"train_loss": -35.26860427856445, "global_step": 63417, "epoch": 524} {"train_loss": -35.76166915893555, "global_step": 63418, "epoch": 524} {"train_loss": -35.645782470703125, "global_step": 63419, "epoch": 524} {"train_loss": -35.442108154296875, "global_step": 63420, "epoch": 524} {"train_loss": -35.489688873291016, "global_step": 63421, "epoch": 524} {"train_loss": -35.83243179321289, "global_step": 63422, "epoch": 524} {"train_loss": -35.55427932739258, "global_step": 63423, "epoch": 524} {"train_loss": -35.984920501708984, "global_step": 63424, "epoch": 524} {"train_loss": -35.73427963256836, "global_step": 63425, "epoch": 524} {"train_loss": -35.68268966674805, "global_step": 63426, "epoch": 524} {"train_loss": -36.01704025268555, "global_step": 63427, "epoch": 524} {"train_loss": -35.86843490600586, "global_step": 63428, "epoch": 524} {"train_loss": -36.04160690307617, "global_step": 63429, "epoch": 524} {"train_loss": -36.090755462646484, "global_step": 63430, "epoch": 524} {"train_loss": -36.05266189575195, "global_step": 63431, "epoch": 524} {"train_loss": -36.02643966674805, "global_step": 63432, "epoch": 524} {"train_loss": -35.3890266418457, "global_step": 63433, "epoch": 524} {"train_loss": -35.350791931152344, "global_step": 63434, "epoch": 524} {"train_loss": -35.717811584472656, "global_step": 63435, "epoch": 524} {"train_loss": -36.16645431518555, "global_step": 63436, "epoch": 524} {"train_loss": -36.48189163208008, "global_step": 63437, "epoch": 524} {"train_loss": -36.11797332763672, "global_step": 63438, "epoch": 524} {"train_loss": -35.676513671875, "global_step": 63439, "epoch": 524} {"train_loss": -36.13163375854492, "global_step": 63440, "epoch": 524} {"train_loss": -36.208187103271484, "global_step": 63441, "epoch": 524} {"train_loss": -35.791473388671875, "global_step": 63442, "epoch": 524} {"train_loss": -35.659122467041016, "global_step": 63443, "epoch": 524} {"train_loss": -36.35173034667969, "global_step": 63444, "epoch": 524} {"train_loss": -36.468605041503906, "global_step": 63445, "epoch": 524} {"train_loss": -35.82533645629883, "global_step": 63446, "epoch": 524} {"train_loss": -35.23204040527344, "global_step": 63447, "epoch": 524} {"train_loss": -34.753719329833984, "global_step": 63448, "epoch": 524} {"train_loss": -34.7376594543457, "global_step": 63449, "epoch": 524} {"train_loss": -34.93268966674805, "global_step": 63450, "epoch": 524} {"train_loss": -35.040531158447266, "global_step": 63451, "epoch": 524} {"train_loss": -35.61843490600586, "global_step": 63452, "epoch": 524} {"train_loss": -36.13302230834961, "global_step": 63453, "epoch": 524} {"train_loss": -36.0189323425293, "global_step": 63454, "epoch": 524} {"train_loss": -36.108604431152344, "global_step": 63455, "epoch": 524} {"train_loss": -36.385955810546875, "global_step": 63456, "epoch": 524} {"train_loss": -36.3070182800293, "global_step": 63457, "epoch": 524} {"train_loss": -36.17507553100586, "global_step": 63458, "epoch": 524} {"train_loss": -35.99219512939453, "global_step": 63459, "epoch": 524} {"train_loss": -36.112613677978516, "global_step": 63460, "epoch": 524} {"train_loss": -36.15033721923828, "global_step": 63461, "epoch": 524} {"train_loss": -36.57329177856445, "global_step": 63462, "epoch": 524} {"train_loss": -35.279781341552734, "global_step": 63463, "epoch": 524} {"train_loss": -35.851078033447266, "global_step": 63464, "epoch": 524} {"train_loss": -35.69529724121094, "global_step": 63465, "epoch": 524} {"train_loss": -36.33235549926758, "global_step": 63466, "epoch": 524} {"train_loss": -34.95119857788086, "global_step": 63467, "epoch": 524} {"train_loss": -36.091163635253906, "global_step": 63468, "epoch": 524} {"train_loss": -35.023651123046875, "global_step": 63469, "epoch": 524} {"train_loss": -33.574275970458984, "global_step": 63470, "epoch": 524} {"train_loss": -30.232961654663086, "global_step": 63471, "epoch": 524} {"train_loss": -29.574615478515625, "global_step": 63472, "epoch": 524} {"train_loss": -31.94550132751465, "global_step": 63473, "epoch": 524} {"train_loss": -36.211647033691406, "global_step": 63474, "epoch": 524} {"train_loss": -34.557735443115234, "global_step": 63475, "epoch": 524} {"train_loss": -34.46442794799805, "global_step": 63476, "epoch": 524} {"train_loss": -34.831298828125, "global_step": 63477, "epoch": 524} {"train_loss": -35.21303176879883, "global_step": 63478, "epoch": 524} {"train_loss": -34.23394775390625, "global_step": 63479, "epoch": 524} {"train_loss": -35.56697463989258, "global_step": 63480, "epoch": 524} {"train_loss": -34.496822357177734, "global_step": 63481, "epoch": 524} {"train_loss": -35.12995529174805, "global_step": 63482, "epoch": 524} {"train_loss": -35.04401397705078, "global_step": 63483, "epoch": 524} {"train_loss": -35.460933685302734, "global_step": 63484, "epoch": 524} {"train_loss": -35.173316955566406, "global_step": 63485, "epoch": 524} {"train_loss": -35.73670196533203, "global_step": 63486, "epoch": 524} {"train_loss": -35.167747497558594, "global_step": 63487, "epoch": 524} {"train_loss": -35.34237289428711, "global_step": 63488, "epoch": 524} {"train_loss": -35.31443786621094, "global_step": 63489, "epoch": 524} {"train_loss": -35.274166107177734, "global_step": 63490, "epoch": 524} {"train_loss": -36.16386795043945, "global_step": 63491, "epoch": 524} {"train_loss": -35.16432189941406, "global_step": 63492, "epoch": 524} {"train_loss": -36.250762939453125, "global_step": 63493, "epoch": 524} {"train_loss": -34.867977142333984, "global_step": 63494, "epoch": 524} {"train_loss": -36.036800384521484, "global_step": 63495, "epoch": 524} {"train_loss": -35.44099044799805, "global_step": 63496, "epoch": 524} {"train_loss": -35.42695999145508, "global_step": 63497, "epoch": 524} {"train_loss": -35.45785140991211, "global_step": 63498, "epoch": 524} {"train_loss": -35.80927658081055, "global_step": 63499, "epoch": 524} {"train_loss": -35.144405364990234, "global_step": 63500, "epoch": 524} {"train_loss": -35.47603988647461, "global_step": 63501, "epoch": 524} {"train_loss": -35.81196975708008, "global_step": 63502, "epoch": 524} {"train_loss": -35.89314270019531, "global_step": 63503, "epoch": 524} {"train_loss": -35.70943832397461, "global_step": 63504, "epoch": 524} {"train_loss": -35.8092155456543, "global_step": 63505, "epoch": 524} {"train_loss": -35.45277404785156, "global_step": 63506, "epoch": 524} {"train_loss": -35.961090087890625, "global_step": 63507, "epoch": 524} {"train_loss": -36.076229095458984, "global_step": 63508, "epoch": 524} {"train_loss": -36.39826583862305, "global_step": 63509, "epoch": 524} {"train_loss": -35.919105529785156, "global_step": 63510, "epoch": 524} {"train_loss": -36.010231018066406, "global_step": 63511, "epoch": 524} {"train_loss": -36.25041580200195, "global_step": 63512, "epoch": 524} {"train_loss": -36.93434143066406, "global_step": 63513, "epoch": 524} {"train_loss": -36.27683639526367, "global_step": 63514, "epoch": 524} {"train_loss": -36.44556427001953, "global_step": 63515, "epoch": 524} {"train_loss": -36.40886306762695, "global_step": 63516, "epoch": 524} {"train_loss": -36.70912170410156, "global_step": 63517, "epoch": 524} {"train_loss": -36.43144989013672, "global_step": 63518, "epoch": 524} {"train_loss": -36.13410186767578, "global_step": 63519, "epoch": 524} {"train_loss": -36.32253646850586, "global_step": 63520, "epoch": 524} {"train_loss": -36.04659652709961, "global_step": 63521, "epoch": 524} {"train_loss": -36.175540924072266, "global_step": 63522, "epoch": 524} {"train_loss": -36.15991973876953, "global_step": 63523, "epoch": 524} {"train_loss": -35.53024178497062, "global_step": 63524, "epoch": 524, "val_loss": 2590215.25} {"train_loss": -36.3254280090332, "global_step": 63525, "epoch": 525} {"train_loss": -36.16315841674805, "global_step": 63526, "epoch": 525} {"train_loss": -36.0997428894043, "global_step": 63527, "epoch": 525} {"train_loss": -36.95306396484375, "global_step": 63528, "epoch": 525} {"train_loss": -36.44895553588867, "global_step": 63529, "epoch": 525} {"train_loss": -36.26070785522461, "global_step": 63530, "epoch": 525} {"train_loss": -37.04810333251953, "global_step": 63531, "epoch": 525} {"train_loss": -35.62384796142578, "global_step": 63532, "epoch": 525} {"train_loss": -31.991485595703125, "global_step": 63533, "epoch": 525} {"train_loss": -34.095855712890625, "global_step": 63534, "epoch": 525} {"train_loss": -33.24730682373047, "global_step": 63535, "epoch": 525} {"train_loss": -31.977277755737305, "global_step": 63536, "epoch": 525} {"train_loss": -34.905677795410156, "global_step": 63537, "epoch": 525} {"train_loss": -33.29495620727539, "global_step": 63538, "epoch": 525} {"train_loss": -34.69776153564453, "global_step": 63539, "epoch": 525} {"train_loss": -34.641944885253906, "global_step": 63540, "epoch": 525} {"train_loss": -35.38134765625, "global_step": 63541, "epoch": 525} {"train_loss": -34.60597610473633, "global_step": 63542, "epoch": 525} {"train_loss": -36.75407028198242, "global_step": 63543, "epoch": 525} {"train_loss": -34.00606155395508, "global_step": 63544, "epoch": 525} {"train_loss": -35.766658782958984, "global_step": 63545, "epoch": 525} {"train_loss": -35.023834228515625, "global_step": 63546, "epoch": 525} {"train_loss": -35.367225646972656, "global_step": 63547, "epoch": 525} {"train_loss": -34.98957443237305, "global_step": 63548, "epoch": 525} {"train_loss": -35.47170639038086, "global_step": 63549, "epoch": 525} {"train_loss": -36.007659912109375, "global_step": 63550, "epoch": 525} {"train_loss": -35.4281120300293, "global_step": 63551, "epoch": 525} {"train_loss": -35.40665817260742, "global_step": 63552, "epoch": 525} {"train_loss": -34.983131408691406, "global_step": 63553, "epoch": 525} {"train_loss": -34.806522369384766, "global_step": 63554, "epoch": 525} {"train_loss": -35.629638671875, "global_step": 63555, "epoch": 525} {"train_loss": -36.17896270751953, "global_step": 63556, "epoch": 525} {"train_loss": -35.04544448852539, "global_step": 63557, "epoch": 525} {"train_loss": -35.6472282409668, "global_step": 63558, "epoch": 525} {"train_loss": -35.391685485839844, "global_step": 63559, "epoch": 525} {"train_loss": -35.33289337158203, "global_step": 63560, "epoch": 525} {"train_loss": -36.50127029418945, "global_step": 63561, "epoch": 525} {"train_loss": -36.030941009521484, "global_step": 63562, "epoch": 525} {"train_loss": -36.18255615234375, "global_step": 63563, "epoch": 525} {"train_loss": -34.822689056396484, "global_step": 63564, "epoch": 525} {"train_loss": -35.672725677490234, "global_step": 63565, "epoch": 525} {"train_loss": -36.03899383544922, "global_step": 63566, "epoch": 525} {"train_loss": -35.75686264038086, "global_step": 63567, "epoch": 525} {"train_loss": -36.28642654418945, "global_step": 63568, "epoch": 525} {"train_loss": -35.793006896972656, "global_step": 63569, "epoch": 525} {"train_loss": -35.87466049194336, "global_step": 63570, "epoch": 525} {"train_loss": -36.050086975097656, "global_step": 63571, "epoch": 525} {"train_loss": -35.910343170166016, "global_step": 63572, "epoch": 525} {"train_loss": -36.5025749206543, "global_step": 63573, "epoch": 525} {"train_loss": -36.098793029785156, "global_step": 63574, "epoch": 525} {"train_loss": -36.31901168823242, "global_step": 63575, "epoch": 525} {"train_loss": -36.278804779052734, "global_step": 63576, "epoch": 525} {"train_loss": -36.6802864074707, "global_step": 63577, "epoch": 525} {"train_loss": -36.46125411987305, "global_step": 63578, "epoch": 525} {"train_loss": -36.2213020324707, "global_step": 63579, "epoch": 525} {"train_loss": -36.00948715209961, "global_step": 63580, "epoch": 525} {"train_loss": -36.23516845703125, "global_step": 63581, "epoch": 525} {"train_loss": -35.791900634765625, "global_step": 63582, "epoch": 525} {"train_loss": -36.342750549316406, "global_step": 63583, "epoch": 525} {"train_loss": -35.886878967285156, "global_step": 63584, "epoch": 525} {"train_loss": -36.773433685302734, "global_step": 63585, "epoch": 525} {"train_loss": -36.691837310791016, "global_step": 63586, "epoch": 525} {"train_loss": -36.304195404052734, "global_step": 63587, "epoch": 525} {"train_loss": -35.825138092041016, "global_step": 63588, "epoch": 525} {"train_loss": -36.76424026489258, "global_step": 63589, "epoch": 525} {"train_loss": -36.066219329833984, "global_step": 63590, "epoch": 525} {"train_loss": -36.48316192626953, "global_step": 63591, "epoch": 525} {"train_loss": -34.00507736206055, "global_step": 63592, "epoch": 525} {"train_loss": -35.310665130615234, "global_step": 63593, "epoch": 525} {"train_loss": -36.324642181396484, "global_step": 63594, "epoch": 525} {"train_loss": -36.334896087646484, "global_step": 63595, "epoch": 525} {"train_loss": -33.14962387084961, "global_step": 63596, "epoch": 525} {"train_loss": -34.31973648071289, "global_step": 63597, "epoch": 525} {"train_loss": -33.29348373413086, "global_step": 63598, "epoch": 525} {"train_loss": -29.259296417236328, "global_step": 63599, "epoch": 525} {"train_loss": -32.2406120300293, "global_step": 63600, "epoch": 525} {"train_loss": -33.48746871948242, "global_step": 63601, "epoch": 525} {"train_loss": -31.3477783203125, "global_step": 63602, "epoch": 525} {"train_loss": -32.01995086669922, "global_step": 63603, "epoch": 525} {"train_loss": -29.01323890686035, "global_step": 63604, "epoch": 525} {"train_loss": -32.3988151550293, "global_step": 63605, "epoch": 525} {"train_loss": -34.745147705078125, "global_step": 63606, "epoch": 525} {"train_loss": -32.69021224975586, "global_step": 63607, "epoch": 525} {"train_loss": -24.394027709960938, "global_step": 63608, "epoch": 525} {"train_loss": -25.305957794189453, "global_step": 63609, "epoch": 525} {"train_loss": -34.03541946411133, "global_step": 63610, "epoch": 525} {"train_loss": -32.478355407714844, "global_step": 63611, "epoch": 525} {"train_loss": -30.835357666015625, "global_step": 63612, "epoch": 525} {"train_loss": -32.57558822631836, "global_step": 63613, "epoch": 525} {"train_loss": -32.2083854675293, "global_step": 63614, "epoch": 525} {"train_loss": -33.35659408569336, "global_step": 63615, "epoch": 525} {"train_loss": -32.27522659301758, "global_step": 63616, "epoch": 525} {"train_loss": -30.432514190673828, "global_step": 63617, "epoch": 525} {"train_loss": -29.83332633972168, "global_step": 63618, "epoch": 525} {"train_loss": -33.03888702392578, "global_step": 63619, "epoch": 525} {"train_loss": -33.128780364990234, "global_step": 63620, "epoch": 525} {"train_loss": -30.378095626831055, "global_step": 63621, "epoch": 525} {"train_loss": -31.00090980529785, "global_step": 63622, "epoch": 525} {"train_loss": -31.585926055908203, "global_step": 63623, "epoch": 525} {"train_loss": -32.87797927856445, "global_step": 63624, "epoch": 525} {"train_loss": -33.1203727722168, "global_step": 63625, "epoch": 525} {"train_loss": -32.19431686401367, "global_step": 63626, "epoch": 525} {"train_loss": -32.467464447021484, "global_step": 63627, "epoch": 525} {"train_loss": -32.289005279541016, "global_step": 63628, "epoch": 525} {"train_loss": -30.591184616088867, "global_step": 63629, "epoch": 525} {"train_loss": -32.252357482910156, "global_step": 63630, "epoch": 525} {"train_loss": -33.058135986328125, "global_step": 63631, "epoch": 525} {"train_loss": -33.53656768798828, "global_step": 63632, "epoch": 525} {"train_loss": -33.35963821411133, "global_step": 63633, "epoch": 525} {"train_loss": -33.144073486328125, "global_step": 63634, "epoch": 525} {"train_loss": -33.59991455078125, "global_step": 63635, "epoch": 525} {"train_loss": -33.01245880126953, "global_step": 63636, "epoch": 525} {"train_loss": -33.70774459838867, "global_step": 63637, "epoch": 525} {"train_loss": -33.108009338378906, "global_step": 63638, "epoch": 525} {"train_loss": -33.190547943115234, "global_step": 63639, "epoch": 525} {"train_loss": -34.299190521240234, "global_step": 63640, "epoch": 525} {"train_loss": -34.18600082397461, "global_step": 63641, "epoch": 525} {"train_loss": -33.967708587646484, "global_step": 63642, "epoch": 525} {"train_loss": -34.41796875, "global_step": 63643, "epoch": 525} {"train_loss": -33.68318176269531, "global_step": 63644, "epoch": 525} {"train_loss": -34.25417431918058, "global_step": 63645, "epoch": 525, "val_loss": 2548019.0} {"train_loss": -34.413700103759766, "global_step": 63646, "epoch": 526} {"train_loss": -33.7651252746582, "global_step": 63647, "epoch": 526} {"train_loss": -34.7511100769043, "global_step": 63648, "epoch": 526} {"train_loss": -34.1993293762207, "global_step": 63649, "epoch": 526} {"train_loss": -34.32233428955078, "global_step": 63650, "epoch": 526} {"train_loss": -34.324886322021484, "global_step": 63651, "epoch": 526} {"train_loss": -34.61665725708008, "global_step": 63652, "epoch": 526} {"train_loss": -34.529693603515625, "global_step": 63653, "epoch": 526} {"train_loss": -34.7572021484375, "global_step": 63654, "epoch": 526} {"train_loss": -34.65644073486328, "global_step": 63655, "epoch": 526} {"train_loss": -34.73249053955078, "global_step": 63656, "epoch": 526} {"train_loss": -34.4817008972168, "global_step": 63657, "epoch": 526} {"train_loss": -34.644508361816406, "global_step": 63658, "epoch": 526} {"train_loss": -34.65446853637695, "global_step": 63659, "epoch": 526} {"train_loss": -35.032527923583984, "global_step": 63660, "epoch": 526} {"train_loss": -34.94807052612305, "global_step": 63661, "epoch": 526} {"train_loss": -35.381690979003906, "global_step": 63662, "epoch": 526} {"train_loss": -34.99497604370117, "global_step": 63663, "epoch": 526} {"train_loss": -35.25855255126953, "global_step": 63664, "epoch": 526} {"train_loss": -35.18873977661133, "global_step": 63665, "epoch": 526} {"train_loss": -35.07442855834961, "global_step": 63666, "epoch": 526} {"train_loss": -34.440364837646484, "global_step": 63667, "epoch": 526} {"train_loss": -35.38969802856445, "global_step": 63668, "epoch": 526} {"train_loss": -34.95804977416992, "global_step": 63669, "epoch": 526} {"train_loss": -35.72266387939453, "global_step": 63670, "epoch": 526} {"train_loss": -35.57588577270508, "global_step": 63671, "epoch": 526} {"train_loss": -34.87697982788086, "global_step": 63672, "epoch": 526} {"train_loss": -35.20344543457031, "global_step": 63673, "epoch": 526} {"train_loss": -35.81303024291992, "global_step": 63674, "epoch": 526} {"train_loss": -35.65809631347656, "global_step": 63675, "epoch": 526} {"train_loss": -36.275421142578125, "global_step": 63676, "epoch": 526} {"train_loss": -35.718814849853516, "global_step": 63677, "epoch": 526} {"train_loss": -34.6671257019043, "global_step": 63678, "epoch": 526} {"train_loss": -36.14539337158203, "global_step": 63679, "epoch": 526} {"train_loss": -36.02127456665039, "global_step": 63680, "epoch": 526} {"train_loss": -36.140098571777344, "global_step": 63681, "epoch": 526} {"train_loss": -35.84383773803711, "global_step": 63682, "epoch": 526} {"train_loss": -36.260597229003906, "global_step": 63683, "epoch": 526} {"train_loss": -36.030330657958984, "global_step": 63684, "epoch": 526} {"train_loss": -36.18290328979492, "global_step": 63685, "epoch": 526} {"train_loss": -36.2261962890625, "global_step": 63686, "epoch": 526} {"train_loss": -36.14234924316406, "global_step": 63687, "epoch": 526} {"train_loss": -36.144561767578125, "global_step": 63688, "epoch": 526} {"train_loss": -36.300533294677734, "global_step": 63689, "epoch": 526} {"train_loss": -35.695396423339844, "global_step": 63690, "epoch": 526} {"train_loss": -36.32133865356445, "global_step": 63691, "epoch": 526} {"train_loss": -36.27437973022461, "global_step": 63692, "epoch": 526} {"train_loss": -36.15107727050781, "global_step": 63693, "epoch": 526} {"train_loss": -36.50852584838867, "global_step": 63694, "epoch": 526} {"train_loss": -36.21170425415039, "global_step": 63695, "epoch": 526} {"train_loss": -36.68488311767578, "global_step": 63696, "epoch": 526} {"train_loss": -34.87228012084961, "global_step": 63697, "epoch": 526} {"train_loss": -36.70135498046875, "global_step": 63698, "epoch": 526} {"train_loss": -36.14033126831055, "global_step": 63699, "epoch": 526} {"train_loss": -36.62698745727539, "global_step": 63700, "epoch": 526} {"train_loss": -35.79322814941406, "global_step": 63701, "epoch": 526} {"train_loss": -36.26447677612305, "global_step": 63702, "epoch": 526} {"train_loss": -36.10973358154297, "global_step": 63703, "epoch": 526} {"train_loss": -35.46652603149414, "global_step": 63704, "epoch": 526} {"train_loss": -36.35385513305664, "global_step": 63705, "epoch": 526} {"train_loss": -36.8496208190918, "global_step": 63706, "epoch": 526} {"train_loss": -36.353736877441406, "global_step": 63707, "epoch": 526} {"train_loss": -36.74154281616211, "global_step": 63708, "epoch": 526} {"train_loss": -36.45101547241211, "global_step": 63709, "epoch": 526} {"train_loss": -36.94580078125, "global_step": 63710, "epoch": 526} {"train_loss": -37.009700775146484, "global_step": 63711, "epoch": 526} {"train_loss": -36.637962341308594, "global_step": 63712, "epoch": 526} {"train_loss": -36.375633239746094, "global_step": 63713, "epoch": 526} {"train_loss": -36.71354293823242, "global_step": 63714, "epoch": 526} {"train_loss": -34.97629165649414, "global_step": 63715, "epoch": 526} {"train_loss": -37.21364212036133, "global_step": 63716, "epoch": 526} {"train_loss": -37.20466995239258, "global_step": 63717, "epoch": 526} {"train_loss": -36.6501350402832, "global_step": 63718, "epoch": 526} {"train_loss": -37.155181884765625, "global_step": 63719, "epoch": 526} {"train_loss": -37.36608123779297, "global_step": 63720, "epoch": 526} {"train_loss": -37.4219970703125, "global_step": 63721, "epoch": 526} {"train_loss": -37.119667053222656, "global_step": 63722, "epoch": 526} {"train_loss": -36.87773895263672, "global_step": 63723, "epoch": 526} {"train_loss": -37.04740524291992, "global_step": 63724, "epoch": 526} {"train_loss": -37.282596588134766, "global_step": 63725, "epoch": 526} {"train_loss": -37.16654586791992, "global_step": 63726, "epoch": 526} {"train_loss": -36.65474319458008, "global_step": 63727, "epoch": 526} {"train_loss": -36.50444412231445, "global_step": 63728, "epoch": 526} {"train_loss": -36.85762405395508, "global_step": 63729, "epoch": 526} {"train_loss": -37.03579330444336, "global_step": 63730, "epoch": 526} {"train_loss": -37.2557487487793, "global_step": 63731, "epoch": 526} {"train_loss": -37.58015823364258, "global_step": 63732, "epoch": 526} {"train_loss": -37.28977584838867, "global_step": 63733, "epoch": 526} {"train_loss": -37.6280403137207, "global_step": 63734, "epoch": 526} {"train_loss": -37.88632583618164, "global_step": 63735, "epoch": 526} {"train_loss": -37.44716262817383, "global_step": 63736, "epoch": 526} {"train_loss": -37.670326232910156, "global_step": 63737, "epoch": 526} {"train_loss": -37.61677169799805, "global_step": 63738, "epoch": 526} {"train_loss": -37.7553825378418, "global_step": 63739, "epoch": 526} {"train_loss": -37.270931243896484, "global_step": 63740, "epoch": 526} {"train_loss": -37.5859260559082, "global_step": 63741, "epoch": 526} {"train_loss": -37.21781539916992, "global_step": 63742, "epoch": 526} {"train_loss": -37.14714050292969, "global_step": 63743, "epoch": 526} {"train_loss": -37.63017654418945, "global_step": 63744, "epoch": 526} {"train_loss": -37.428585052490234, "global_step": 63745, "epoch": 526} {"train_loss": -36.426429748535156, "global_step": 63746, "epoch": 526} {"train_loss": -37.5189323425293, "global_step": 63747, "epoch": 526} {"train_loss": -36.77118682861328, "global_step": 63748, "epoch": 526} {"train_loss": -37.15352249145508, "global_step": 63749, "epoch": 526} {"train_loss": -37.153385162353516, "global_step": 63750, "epoch": 526} {"train_loss": -37.116363525390625, "global_step": 63751, "epoch": 526} {"train_loss": -36.7641716003418, "global_step": 63752, "epoch": 526} {"train_loss": -36.34212112426758, "global_step": 63753, "epoch": 526} {"train_loss": -37.23431396484375, "global_step": 63754, "epoch": 526} {"train_loss": -36.162113189697266, "global_step": 63755, "epoch": 526} {"train_loss": -35.11955261230469, "global_step": 63756, "epoch": 526} {"train_loss": -37.11298751831055, "global_step": 63757, "epoch": 526} {"train_loss": -35.34379577636719, "global_step": 63758, "epoch": 526} {"train_loss": -37.0010986328125, "global_step": 63759, "epoch": 526} {"train_loss": -35.39944076538086, "global_step": 63760, "epoch": 526} {"train_loss": -36.02395248413086, "global_step": 63761, "epoch": 526} {"train_loss": -34.16147232055664, "global_step": 63762, "epoch": 526} {"train_loss": -34.00216293334961, "global_step": 63763, "epoch": 526} {"train_loss": -34.644290924072266, "global_step": 63764, "epoch": 526} {"train_loss": -35.3718147277832, "global_step": 63765, "epoch": 526} {"train_loss": -36.120433712793776, "global_step": 63766, "epoch": 526, "val_loss": 2603995.75} {"train_loss": -33.643836975097656, "global_step": 63767, "epoch": 527} {"train_loss": -36.26534652709961, "global_step": 63768, "epoch": 527} {"train_loss": -36.47161865234375, "global_step": 63769, "epoch": 527} {"train_loss": -35.470149993896484, "global_step": 63770, "epoch": 527} {"train_loss": -35.0825080871582, "global_step": 63771, "epoch": 527} {"train_loss": -33.55116271972656, "global_step": 63772, "epoch": 527} {"train_loss": -32.660011291503906, "global_step": 63773, "epoch": 527} {"train_loss": -34.2868766784668, "global_step": 63774, "epoch": 527} {"train_loss": -34.98786544799805, "global_step": 63775, "epoch": 527} {"train_loss": -34.987056732177734, "global_step": 63776, "epoch": 527} {"train_loss": -35.35831832885742, "global_step": 63777, "epoch": 527} {"train_loss": -35.673736572265625, "global_step": 63778, "epoch": 527} {"train_loss": -35.08888626098633, "global_step": 63779, "epoch": 527} {"train_loss": -35.71320724487305, "global_step": 63780, "epoch": 527} {"train_loss": -36.281463623046875, "global_step": 63781, "epoch": 527} {"train_loss": -35.69268035888672, "global_step": 63782, "epoch": 527} {"train_loss": -35.503273010253906, "global_step": 63783, "epoch": 527} {"train_loss": -36.845916748046875, "global_step": 63784, "epoch": 527} {"train_loss": -35.83176803588867, "global_step": 63785, "epoch": 527} {"train_loss": -36.41115188598633, "global_step": 63786, "epoch": 527} {"train_loss": -36.21293640136719, "global_step": 63787, "epoch": 527} {"train_loss": -36.088314056396484, "global_step": 63788, "epoch": 527} {"train_loss": -36.574424743652344, "global_step": 63789, "epoch": 527} {"train_loss": -36.58919143676758, "global_step": 63790, "epoch": 527} {"train_loss": -36.97659683227539, "global_step": 63791, "epoch": 527} {"train_loss": -36.276275634765625, "global_step": 63792, "epoch": 527} {"train_loss": -36.92409133911133, "global_step": 63793, "epoch": 527} {"train_loss": -36.77392578125, "global_step": 63794, "epoch": 527} {"train_loss": -36.63511276245117, "global_step": 63795, "epoch": 527} {"train_loss": -36.40123748779297, "global_step": 63796, "epoch": 527} {"train_loss": -36.38393020629883, "global_step": 63797, "epoch": 527} {"train_loss": -35.97310256958008, "global_step": 63798, "epoch": 527} {"train_loss": -36.30924606323242, "global_step": 63799, "epoch": 527} {"train_loss": -35.91242599487305, "global_step": 63800, "epoch": 527} {"train_loss": -36.41655731201172, "global_step": 63801, "epoch": 527} {"train_loss": -36.71992111206055, "global_step": 63802, "epoch": 527} {"train_loss": -35.8692741394043, "global_step": 63803, "epoch": 527} {"train_loss": -36.71577072143555, "global_step": 63804, "epoch": 527} {"train_loss": -36.5457649230957, "global_step": 63805, "epoch": 527} {"train_loss": -35.607234954833984, "global_step": 63806, "epoch": 527} {"train_loss": -36.34806442260742, "global_step": 63807, "epoch": 527} {"train_loss": -36.46852493286133, "global_step": 63808, "epoch": 527} {"train_loss": -35.96232223510742, "global_step": 63809, "epoch": 527} {"train_loss": -35.99956130981445, "global_step": 63810, "epoch": 527} {"train_loss": -35.8313102722168, "global_step": 63811, "epoch": 527} {"train_loss": -35.608055114746094, "global_step": 63812, "epoch": 527} {"train_loss": -36.11566925048828, "global_step": 63813, "epoch": 527} {"train_loss": -36.4017333984375, "global_step": 63814, "epoch": 527} {"train_loss": -35.970401763916016, "global_step": 63815, "epoch": 527} {"train_loss": -36.8104362487793, "global_step": 63816, "epoch": 527} {"train_loss": -35.82375717163086, "global_step": 63817, "epoch": 527} {"train_loss": -34.64243698120117, "global_step": 63818, "epoch": 527} {"train_loss": -30.744312286376953, "global_step": 63819, "epoch": 527} {"train_loss": -34.15252685546875, "global_step": 63820, "epoch": 527} {"train_loss": -33.79803466796875, "global_step": 63821, "epoch": 527} {"train_loss": -34.83852005004883, "global_step": 63822, "epoch": 527} {"train_loss": -34.15214920043945, "global_step": 63823, "epoch": 527} {"train_loss": -36.38102340698242, "global_step": 63824, "epoch": 527} {"train_loss": -28.863927841186523, "global_step": 63825, "epoch": 527} {"train_loss": -33.90797805786133, "global_step": 63826, "epoch": 527} {"train_loss": -30.37274169921875, "global_step": 63827, "epoch": 527} {"train_loss": -32.944637298583984, "global_step": 63828, "epoch": 527} {"train_loss": -36.873287200927734, "global_step": 63829, "epoch": 527} {"train_loss": -33.533084869384766, "global_step": 63830, "epoch": 527} {"train_loss": -34.459381103515625, "global_step": 63831, "epoch": 527} {"train_loss": -34.051387786865234, "global_step": 63832, "epoch": 527} {"train_loss": -36.09127426147461, "global_step": 63833, "epoch": 527} {"train_loss": -35.17904281616211, "global_step": 63834, "epoch": 527} {"train_loss": -33.74457931518555, "global_step": 63835, "epoch": 527} {"train_loss": -33.155555725097656, "global_step": 63836, "epoch": 527} {"train_loss": -35.49456024169922, "global_step": 63837, "epoch": 527} {"train_loss": -35.6770133972168, "global_step": 63838, "epoch": 527} {"train_loss": -35.311012268066406, "global_step": 63839, "epoch": 527} {"train_loss": -35.549217224121094, "global_step": 63840, "epoch": 527} {"train_loss": -35.27500915527344, "global_step": 63841, "epoch": 527} {"train_loss": -36.30342483520508, "global_step": 63842, "epoch": 527} {"train_loss": -36.600677490234375, "global_step": 63843, "epoch": 527} {"train_loss": -36.38720703125, "global_step": 63844, "epoch": 527} {"train_loss": -35.659732818603516, "global_step": 63845, "epoch": 527} {"train_loss": -35.54970932006836, "global_step": 63846, "epoch": 527} {"train_loss": -35.230560302734375, "global_step": 63847, "epoch": 527} {"train_loss": -35.73574447631836, "global_step": 63848, "epoch": 527} {"train_loss": -35.86051559448242, "global_step": 63849, "epoch": 527} {"train_loss": -36.354888916015625, "global_step": 63850, "epoch": 527} {"train_loss": -35.705535888671875, "global_step": 63851, "epoch": 527} {"train_loss": -36.42306137084961, "global_step": 63852, "epoch": 527} {"train_loss": -35.56074905395508, "global_step": 63853, "epoch": 527} {"train_loss": -36.261592864990234, "global_step": 63854, "epoch": 527} {"train_loss": -35.87589645385742, "global_step": 63855, "epoch": 527} {"train_loss": -36.434627532958984, "global_step": 63856, "epoch": 527} {"train_loss": -36.0222053527832, "global_step": 63857, "epoch": 527} {"train_loss": -35.740234375, "global_step": 63858, "epoch": 527} {"train_loss": -36.81608963012695, "global_step": 63859, "epoch": 527} {"train_loss": -36.75140380859375, "global_step": 63860, "epoch": 527} {"train_loss": -36.39493179321289, "global_step": 63861, "epoch": 527} {"train_loss": -36.647216796875, "global_step": 63862, "epoch": 527} {"train_loss": -36.11206817626953, "global_step": 63863, "epoch": 527} {"train_loss": -37.19770050048828, "global_step": 63864, "epoch": 527} {"train_loss": -36.82003402709961, "global_step": 63865, "epoch": 527} {"train_loss": -36.41420364379883, "global_step": 63866, "epoch": 527} {"train_loss": -37.148048400878906, "global_step": 63867, "epoch": 527} {"train_loss": -36.93809127807617, "global_step": 63868, "epoch": 527} {"train_loss": -36.438575744628906, "global_step": 63869, "epoch": 527} {"train_loss": -36.54402160644531, "global_step": 63870, "epoch": 527} {"train_loss": -36.60007095336914, "global_step": 63871, "epoch": 527} {"train_loss": -36.85102081298828, "global_step": 63872, "epoch": 527} {"train_loss": -36.46290969848633, "global_step": 63873, "epoch": 527} {"train_loss": -36.604984283447266, "global_step": 63874, "epoch": 527} {"train_loss": -36.888580322265625, "global_step": 63875, "epoch": 527} {"train_loss": -36.602874755859375, "global_step": 63876, "epoch": 527} {"train_loss": -36.31316375732422, "global_step": 63877, "epoch": 527} {"train_loss": -36.525997161865234, "global_step": 63878, "epoch": 527} {"train_loss": -37.045013427734375, "global_step": 63879, "epoch": 527} {"train_loss": -36.90717697143555, "global_step": 63880, "epoch": 527} {"train_loss": -35.47813034057617, "global_step": 63881, "epoch": 527} {"train_loss": -36.6187858581543, "global_step": 63882, "epoch": 527} {"train_loss": -37.084129333496094, "global_step": 63883, "epoch": 527} {"train_loss": -36.21576690673828, "global_step": 63884, "epoch": 527} {"train_loss": -37.29834747314453, "global_step": 63885, "epoch": 527} {"train_loss": -36.14288330078125, "global_step": 63886, "epoch": 527} {"train_loss": -35.71619845618886, "global_step": 63887, "epoch": 527, "val_loss": 2670261.0} {"train_loss": -37.143165588378906, "global_step": 63888, "epoch": 528} {"train_loss": -37.01290512084961, "global_step": 63889, "epoch": 528} {"train_loss": -36.69242477416992, "global_step": 63890, "epoch": 528} {"train_loss": -36.07192611694336, "global_step": 63891, "epoch": 528} {"train_loss": -37.04818344116211, "global_step": 63892, "epoch": 528} {"train_loss": -35.660621643066406, "global_step": 63893, "epoch": 528} {"train_loss": -36.64309310913086, "global_step": 63894, "epoch": 528} {"train_loss": -35.752235412597656, "global_step": 63895, "epoch": 528} {"train_loss": -34.371822357177734, "global_step": 63896, "epoch": 528} {"train_loss": -34.764678955078125, "global_step": 63897, "epoch": 528} {"train_loss": -36.11411666870117, "global_step": 63898, "epoch": 528} {"train_loss": -35.2552490234375, "global_step": 63899, "epoch": 528} {"train_loss": -35.92996597290039, "global_step": 63900, "epoch": 528} {"train_loss": -35.361419677734375, "global_step": 63901, "epoch": 528} {"train_loss": -34.17969512939453, "global_step": 63902, "epoch": 528} {"train_loss": -33.10313034057617, "global_step": 63903, "epoch": 528} {"train_loss": -35.575531005859375, "global_step": 63904, "epoch": 528} {"train_loss": -36.068355560302734, "global_step": 63905, "epoch": 528} {"train_loss": -35.5252571105957, "global_step": 63906, "epoch": 528} {"train_loss": -34.92074203491211, "global_step": 63907, "epoch": 528} {"train_loss": -34.977596282958984, "global_step": 63908, "epoch": 528} {"train_loss": -35.40949630737305, "global_step": 63909, "epoch": 528} {"train_loss": -35.61371612548828, "global_step": 63910, "epoch": 528} {"train_loss": -24.648679733276367, "global_step": 63911, "epoch": 528} {"train_loss": -34.93347930908203, "global_step": 63912, "epoch": 528} {"train_loss": -34.850345611572266, "global_step": 63913, "epoch": 528} {"train_loss": -33.60211181640625, "global_step": 63914, "epoch": 528} {"train_loss": -35.0091552734375, "global_step": 63915, "epoch": 528} {"train_loss": -33.13839340209961, "global_step": 63916, "epoch": 528} {"train_loss": -33.10345458984375, "global_step": 63917, "epoch": 528} {"train_loss": -33.03218460083008, "global_step": 63918, "epoch": 528} {"train_loss": -34.354793548583984, "global_step": 63919, "epoch": 528} {"train_loss": -34.2025146484375, "global_step": 63920, "epoch": 528} {"train_loss": -34.22603225708008, "global_step": 63921, "epoch": 528} {"train_loss": -33.09634780883789, "global_step": 63922, "epoch": 528} {"train_loss": -31.182462692260742, "global_step": 63923, "epoch": 528} {"train_loss": -31.212427139282227, "global_step": 63924, "epoch": 528} {"train_loss": -32.181697845458984, "global_step": 63925, "epoch": 528} {"train_loss": -34.24918746948242, "global_step": 63926, "epoch": 528} {"train_loss": -33.74944305419922, "global_step": 63927, "epoch": 528} {"train_loss": -33.162776947021484, "global_step": 63928, "epoch": 528} {"train_loss": -34.42269515991211, "global_step": 63929, "epoch": 528} {"train_loss": -34.00676345825195, "global_step": 63930, "epoch": 528} {"train_loss": -29.486730575561523, "global_step": 63931, "epoch": 528} {"train_loss": -34.684669494628906, "global_step": 63932, "epoch": 528} {"train_loss": -32.770851135253906, "global_step": 63933, "epoch": 528} {"train_loss": -33.48905944824219, "global_step": 63934, "epoch": 528} {"train_loss": -34.16541290283203, "global_step": 63935, "epoch": 528} {"train_loss": -32.16933822631836, "global_step": 63936, "epoch": 528} {"train_loss": -34.735172271728516, "global_step": 63937, "epoch": 528} {"train_loss": -34.045372009277344, "global_step": 63938, "epoch": 528} {"train_loss": -33.310096740722656, "global_step": 63939, "epoch": 528} {"train_loss": -35.109649658203125, "global_step": 63940, "epoch": 528} {"train_loss": -33.979557037353516, "global_step": 63941, "epoch": 528} {"train_loss": -33.54500198364258, "global_step": 63942, "epoch": 528} {"train_loss": -33.16164016723633, "global_step": 63943, "epoch": 528} {"train_loss": -34.134559631347656, "global_step": 63944, "epoch": 528} {"train_loss": -34.37807083129883, "global_step": 63945, "epoch": 528} {"train_loss": -34.67240524291992, "global_step": 63946, "epoch": 528} {"train_loss": -33.84873962402344, "global_step": 63947, "epoch": 528} {"train_loss": -34.70113754272461, "global_step": 63948, "epoch": 528} {"train_loss": -34.658016204833984, "global_step": 63949, "epoch": 528} {"train_loss": -34.863399505615234, "global_step": 63950, "epoch": 528} {"train_loss": -35.02259826660156, "global_step": 63951, "epoch": 528} {"train_loss": -34.76105880737305, "global_step": 63952, "epoch": 528} {"train_loss": -34.8610954284668, "global_step": 63953, "epoch": 528} {"train_loss": -35.443153381347656, "global_step": 63954, "epoch": 528} {"train_loss": -34.87866973876953, "global_step": 63955, "epoch": 528} {"train_loss": -35.32548141479492, "global_step": 63956, "epoch": 528} {"train_loss": -35.377044677734375, "global_step": 63957, "epoch": 528} {"train_loss": -35.18660354614258, "global_step": 63958, "epoch": 528} {"train_loss": -34.95140075683594, "global_step": 63959, "epoch": 528} {"train_loss": -35.06340408325195, "global_step": 63960, "epoch": 528} {"train_loss": -34.37350082397461, "global_step": 63961, "epoch": 528} {"train_loss": -35.63943099975586, "global_step": 63962, "epoch": 528} {"train_loss": -34.70699691772461, "global_step": 63963, "epoch": 528} {"train_loss": -36.11223220825195, "global_step": 63964, "epoch": 528} {"train_loss": -35.09693145751953, "global_step": 63965, "epoch": 528} {"train_loss": -35.5792121887207, "global_step": 63966, "epoch": 528} {"train_loss": -34.93301010131836, "global_step": 63967, "epoch": 528} {"train_loss": -35.62123489379883, "global_step": 63968, "epoch": 528} {"train_loss": -35.740169525146484, "global_step": 63969, "epoch": 528} {"train_loss": -35.35686111450195, "global_step": 63970, "epoch": 528} {"train_loss": -36.152278900146484, "global_step": 63971, "epoch": 528} {"train_loss": -35.6870231628418, "global_step": 63972, "epoch": 528} {"train_loss": -35.748870849609375, "global_step": 63973, "epoch": 528} {"train_loss": -36.255043029785156, "global_step": 63974, "epoch": 528} {"train_loss": -36.11872100830078, "global_step": 63975, "epoch": 528} {"train_loss": -35.960533142089844, "global_step": 63976, "epoch": 528} {"train_loss": -35.925514221191406, "global_step": 63977, "epoch": 528} {"train_loss": -36.2828254699707, "global_step": 63978, "epoch": 528} {"train_loss": -36.38215255737305, "global_step": 63979, "epoch": 528} {"train_loss": -36.63261032104492, "global_step": 63980, "epoch": 528} {"train_loss": -36.0937614440918, "global_step": 63981, "epoch": 528} {"train_loss": -36.35702896118164, "global_step": 63982, "epoch": 528} {"train_loss": -36.689334869384766, "global_step": 63983, "epoch": 528} {"train_loss": -36.6455192565918, "global_step": 63984, "epoch": 528} {"train_loss": -35.839569091796875, "global_step": 63985, "epoch": 528} {"train_loss": -36.410404205322266, "global_step": 63986, "epoch": 528} {"train_loss": -36.456573486328125, "global_step": 63987, "epoch": 528} {"train_loss": -36.95768737792969, "global_step": 63988, "epoch": 528} {"train_loss": -36.87525939941406, "global_step": 63989, "epoch": 528} {"train_loss": -36.27787399291992, "global_step": 63990, "epoch": 528} {"train_loss": -35.27534103393555, "global_step": 63991, "epoch": 528} {"train_loss": -35.405372619628906, "global_step": 63992, "epoch": 528} {"train_loss": -34.89449691772461, "global_step": 63993, "epoch": 528} {"train_loss": -33.29036331176758, "global_step": 63994, "epoch": 528} {"train_loss": -21.78529167175293, "global_step": 63995, "epoch": 528} {"train_loss": 0.8437415957450867, "global_step": 63996, "epoch": 528} {"train_loss": 2.078533172607422, "global_step": 63997, "epoch": 528} {"train_loss": -33.583885192871094, "global_step": 63998, "epoch": 528} {"train_loss": -5.719559192657471, "global_step": 63999, "epoch": 528} {"train_loss": -33.95840072631836, "global_step": 64000, "epoch": 528} {"train_loss": -21.1865234375, "global_step": 64001, "epoch": 528} {"train_loss": -31.22846031188965, "global_step": 64002, "epoch": 528} {"train_loss": -29.791730880737305, "global_step": 64003, "epoch": 528} {"train_loss": -26.58550453186035, "global_step": 64004, "epoch": 528} {"train_loss": -34.66579818725586, "global_step": 64005, "epoch": 528} {"train_loss": -30.383319854736328, "global_step": 64006, "epoch": 528} {"train_loss": -29.602216720581055, "global_step": 64007, "epoch": 528} {"train_loss": -33.52171296767952, "global_step": 64008, "epoch": 528, "val_loss": 2499497.25} {"train_loss": -33.62009048461914, "global_step": 64009, "epoch": 529} {"train_loss": -30.33808708190918, "global_step": 64010, "epoch": 529} {"train_loss": -31.094268798828125, "global_step": 64011, "epoch": 529} {"train_loss": -35.265411376953125, "global_step": 64012, "epoch": 529} {"train_loss": -34.019920349121094, "global_step": 64013, "epoch": 529} {"train_loss": -33.38186264038086, "global_step": 64014, "epoch": 529} {"train_loss": -32.03772735595703, "global_step": 64015, "epoch": 529} {"train_loss": -34.457244873046875, "global_step": 64016, "epoch": 529} {"train_loss": -35.03923416137695, "global_step": 64017, "epoch": 529} {"train_loss": -34.6427001953125, "global_step": 64018, "epoch": 529} {"train_loss": -33.67013931274414, "global_step": 64019, "epoch": 529} {"train_loss": -34.060665130615234, "global_step": 64020, "epoch": 529} {"train_loss": -35.23747634887695, "global_step": 64021, "epoch": 529} {"train_loss": -34.725276947021484, "global_step": 64022, "epoch": 529} {"train_loss": -34.760231018066406, "global_step": 64023, "epoch": 529} {"train_loss": -35.23695755004883, "global_step": 64024, "epoch": 529} {"train_loss": -34.71649169921875, "global_step": 64025, "epoch": 529} {"train_loss": -35.108882904052734, "global_step": 64026, "epoch": 529} {"train_loss": -35.36886215209961, "global_step": 64027, "epoch": 529} {"train_loss": -35.5240364074707, "global_step": 64028, "epoch": 529} {"train_loss": -35.71560287475586, "global_step": 64029, "epoch": 529} {"train_loss": -35.46356964111328, "global_step": 64030, "epoch": 529} {"train_loss": -35.224853515625, "global_step": 64031, "epoch": 529} {"train_loss": -36.075653076171875, "global_step": 64032, "epoch": 529} {"train_loss": -35.842079162597656, "global_step": 64033, "epoch": 529} {"train_loss": -35.87960433959961, "global_step": 64034, "epoch": 529} {"train_loss": -35.859649658203125, "global_step": 64035, "epoch": 529} {"train_loss": -35.61542892456055, "global_step": 64036, "epoch": 529} {"train_loss": -35.85542678833008, "global_step": 64037, "epoch": 529} {"train_loss": -36.418846130371094, "global_step": 64038, "epoch": 529} {"train_loss": -36.3572998046875, "global_step": 64039, "epoch": 529} {"train_loss": -35.716793060302734, "global_step": 64040, "epoch": 529} {"train_loss": -36.0153923034668, "global_step": 64041, "epoch": 529} {"train_loss": -36.126251220703125, "global_step": 64042, "epoch": 529} {"train_loss": -35.999839782714844, "global_step": 64043, "epoch": 529} {"train_loss": -36.237850189208984, "global_step": 64044, "epoch": 529} {"train_loss": -36.05940628051758, "global_step": 64045, "epoch": 529} {"train_loss": -36.268096923828125, "global_step": 64046, "epoch": 529} {"train_loss": -36.496070861816406, "global_step": 64047, "epoch": 529} {"train_loss": -36.240501403808594, "global_step": 64048, "epoch": 529} {"train_loss": -36.33720016479492, "global_step": 64049, "epoch": 529} {"train_loss": -36.60251998901367, "global_step": 64050, "epoch": 529} {"train_loss": -36.63112258911133, "global_step": 64051, "epoch": 529} {"train_loss": -36.55585861206055, "global_step": 64052, "epoch": 529} {"train_loss": -36.5805549621582, "global_step": 64053, "epoch": 529} {"train_loss": -36.41289138793945, "global_step": 64054, "epoch": 529} {"train_loss": -36.92542266845703, "global_step": 64055, "epoch": 529} {"train_loss": -36.12514877319336, "global_step": 64056, "epoch": 529} {"train_loss": -36.420509338378906, "global_step": 64057, "epoch": 529} {"train_loss": -36.653594970703125, "global_step": 64058, "epoch": 529} {"train_loss": -36.947147369384766, "global_step": 64059, "epoch": 529} {"train_loss": -36.69249725341797, "global_step": 64060, "epoch": 529} {"train_loss": -36.73764419555664, "global_step": 64061, "epoch": 529} {"train_loss": -36.80731964111328, "global_step": 64062, "epoch": 529} {"train_loss": -36.863990783691406, "global_step": 64063, "epoch": 529} {"train_loss": -36.2095832824707, "global_step": 64064, "epoch": 529} {"train_loss": -36.60792922973633, "global_step": 64065, "epoch": 529} {"train_loss": -36.53076171875, "global_step": 64066, "epoch": 529} {"train_loss": -36.945709228515625, "global_step": 64067, "epoch": 529} {"train_loss": -37.12550735473633, "global_step": 64068, "epoch": 529} {"train_loss": -36.357177734375, "global_step": 64069, "epoch": 529} {"train_loss": -36.07529830932617, "global_step": 64070, "epoch": 529} {"train_loss": -35.88496017456055, "global_step": 64071, "epoch": 529} {"train_loss": -34.97319030761719, "global_step": 64072, "epoch": 529} {"train_loss": -33.69126892089844, "global_step": 64073, "epoch": 529} {"train_loss": -32.39338302612305, "global_step": 64074, "epoch": 529} {"train_loss": -33.762325286865234, "global_step": 64075, "epoch": 529} {"train_loss": -36.71268844604492, "global_step": 64076, "epoch": 529} {"train_loss": -35.91259002685547, "global_step": 64077, "epoch": 529} {"train_loss": -35.209896087646484, "global_step": 64078, "epoch": 529} {"train_loss": -35.8856086730957, "global_step": 64079, "epoch": 529} {"train_loss": -35.092994689941406, "global_step": 64080, "epoch": 529} {"train_loss": -36.21272659301758, "global_step": 64081, "epoch": 529} {"train_loss": -35.41938400268555, "global_step": 64082, "epoch": 529} {"train_loss": -35.5475959777832, "global_step": 64083, "epoch": 529} {"train_loss": -35.389991760253906, "global_step": 64084, "epoch": 529} {"train_loss": -35.89253234863281, "global_step": 64085, "epoch": 529} {"train_loss": -36.37046432495117, "global_step": 64086, "epoch": 529} {"train_loss": -36.504432678222656, "global_step": 64087, "epoch": 529} {"train_loss": -35.51937484741211, "global_step": 64088, "epoch": 529} {"train_loss": -34.641563415527344, "global_step": 64089, "epoch": 529} {"train_loss": -34.62124252319336, "global_step": 64090, "epoch": 529} {"train_loss": -35.244483947753906, "global_step": 64091, "epoch": 529} {"train_loss": -35.62656021118164, "global_step": 64092, "epoch": 529} {"train_loss": -34.912071228027344, "global_step": 64093, "epoch": 529} {"train_loss": -33.46719741821289, "global_step": 64094, "epoch": 529} {"train_loss": -34.851661682128906, "global_step": 64095, "epoch": 529} {"train_loss": -30.88629150390625, "global_step": 64096, "epoch": 529} {"train_loss": -32.4455680847168, "global_step": 64097, "epoch": 529} {"train_loss": -19.688718795776367, "global_step": 64098, "epoch": 529} {"train_loss": -25.017852783203125, "global_step": 64099, "epoch": 529} {"train_loss": -23.70667839050293, "global_step": 64100, "epoch": 529} {"train_loss": -30.087045669555664, "global_step": 64101, "epoch": 529} {"train_loss": -29.8133487701416, "global_step": 64102, "epoch": 529} {"train_loss": -30.360029220581055, "global_step": 64103, "epoch": 529} {"train_loss": -24.67842674255371, "global_step": 64104, "epoch": 529} {"train_loss": -31.261219024658203, "global_step": 64105, "epoch": 529} {"train_loss": -24.44767189025879, "global_step": 64106, "epoch": 529} {"train_loss": -30.599592208862305, "global_step": 64107, "epoch": 529} {"train_loss": -32.51566696166992, "global_step": 64108, "epoch": 529} {"train_loss": -32.0046272277832, "global_step": 64109, "epoch": 529} {"train_loss": -31.3075008392334, "global_step": 64110, "epoch": 529} {"train_loss": -32.212608337402344, "global_step": 64111, "epoch": 529} {"train_loss": -31.401479721069336, "global_step": 64112, "epoch": 529} {"train_loss": -31.49146842956543, "global_step": 64113, "epoch": 529} {"train_loss": -32.769927978515625, "global_step": 64114, "epoch": 529} {"train_loss": -33.07389450073242, "global_step": 64115, "epoch": 529} {"train_loss": -30.95757484436035, "global_step": 64116, "epoch": 529} {"train_loss": -33.53296661376953, "global_step": 64117, "epoch": 529} {"train_loss": -32.742130279541016, "global_step": 64118, "epoch": 529} {"train_loss": -32.9686393737793, "global_step": 64119, "epoch": 529} {"train_loss": -33.531219482421875, "global_step": 64120, "epoch": 529} {"train_loss": -33.015071868896484, "global_step": 64121, "epoch": 529} {"train_loss": -33.46261215209961, "global_step": 64122, "epoch": 529} {"train_loss": -33.50214385986328, "global_step": 64123, "epoch": 529} {"train_loss": -33.1916618347168, "global_step": 64124, "epoch": 529} {"train_loss": -33.42696762084961, "global_step": 64125, "epoch": 529} {"train_loss": -33.672298431396484, "global_step": 64126, "epoch": 529} {"train_loss": -33.699527740478516, "global_step": 64127, "epoch": 529} {"train_loss": -33.53369903564453, "global_step": 64128, "epoch": 529} {"train_loss": -34.21997752859573, "global_step": 64129, "epoch": 529, "val_loss": 2562356.0} {"train_loss": -33.55237579345703, "global_step": 64130, "epoch": 530} {"train_loss": -33.4329719543457, "global_step": 64131, "epoch": 530} {"train_loss": -33.855159759521484, "global_step": 64132, "epoch": 530} {"train_loss": -34.0023078918457, "global_step": 64133, "epoch": 530} {"train_loss": -33.524166107177734, "global_step": 64134, "epoch": 530} {"train_loss": -34.2234001159668, "global_step": 64135, "epoch": 530} {"train_loss": -33.93479537963867, "global_step": 64136, "epoch": 530} {"train_loss": -33.64685821533203, "global_step": 64137, "epoch": 530} {"train_loss": -34.33420944213867, "global_step": 64138, "epoch": 530} {"train_loss": -33.85905075073242, "global_step": 64139, "epoch": 530} {"train_loss": -34.225746154785156, "global_step": 64140, "epoch": 530} {"train_loss": -34.4780158996582, "global_step": 64141, "epoch": 530} {"train_loss": -34.15506362915039, "global_step": 64142, "epoch": 530} {"train_loss": -34.255889892578125, "global_step": 64143, "epoch": 530} {"train_loss": -33.9080924987793, "global_step": 64144, "epoch": 530} {"train_loss": -34.34648513793945, "global_step": 64145, "epoch": 530} {"train_loss": -34.72813034057617, "global_step": 64146, "epoch": 530} {"train_loss": -34.32843780517578, "global_step": 64147, "epoch": 530} {"train_loss": -34.13673400878906, "global_step": 64148, "epoch": 530} {"train_loss": -34.63954544067383, "global_step": 64149, "epoch": 530} {"train_loss": -34.679317474365234, "global_step": 64150, "epoch": 530} {"train_loss": -34.61125183105469, "global_step": 64151, "epoch": 530} {"train_loss": -34.895912170410156, "global_step": 64152, "epoch": 530} {"train_loss": -34.86286544799805, "global_step": 64153, "epoch": 530} {"train_loss": -34.66888427734375, "global_step": 64154, "epoch": 530} {"train_loss": -34.328773498535156, "global_step": 64155, "epoch": 530} {"train_loss": -34.420753479003906, "global_step": 64156, "epoch": 530} {"train_loss": -34.85154724121094, "global_step": 64157, "epoch": 530} {"train_loss": -35.07613754272461, "global_step": 64158, "epoch": 530} {"train_loss": -35.0251579284668, "global_step": 64159, "epoch": 530} {"train_loss": -35.24394226074219, "global_step": 64160, "epoch": 530} {"train_loss": -35.15560531616211, "global_step": 64161, "epoch": 530} {"train_loss": -34.97590255737305, "global_step": 64162, "epoch": 530} {"train_loss": -34.87522506713867, "global_step": 64163, "epoch": 530} {"train_loss": -35.3912239074707, "global_step": 64164, "epoch": 530} {"train_loss": -35.01285934448242, "global_step": 64165, "epoch": 530} {"train_loss": -35.547908782958984, "global_step": 64166, "epoch": 530} {"train_loss": -35.38884735107422, "global_step": 64167, "epoch": 530} {"train_loss": -35.288448333740234, "global_step": 64168, "epoch": 530} {"train_loss": -35.34393310546875, "global_step": 64169, "epoch": 530} {"train_loss": -34.86104202270508, "global_step": 64170, "epoch": 530} {"train_loss": -35.925411224365234, "global_step": 64171, "epoch": 530} {"train_loss": -35.05772018432617, "global_step": 64172, "epoch": 530} {"train_loss": -34.9844970703125, "global_step": 64173, "epoch": 530} {"train_loss": -35.86665344238281, "global_step": 64174, "epoch": 530} {"train_loss": -35.5077018737793, "global_step": 64175, "epoch": 530} {"train_loss": -35.23029708862305, "global_step": 64176, "epoch": 530} {"train_loss": -35.23127365112305, "global_step": 64177, "epoch": 530} {"train_loss": -32.88852310180664, "global_step": 64178, "epoch": 530} {"train_loss": -29.80209732055664, "global_step": 64179, "epoch": 530} {"train_loss": -29.89697265625, "global_step": 64180, "epoch": 530} {"train_loss": -28.12932777404785, "global_step": 64181, "epoch": 530} {"train_loss": -24.99765396118164, "global_step": 64182, "epoch": 530} {"train_loss": -26.667728424072266, "global_step": 64183, "epoch": 530} {"train_loss": -29.50632667541504, "global_step": 64184, "epoch": 530} {"train_loss": -35.14194107055664, "global_step": 64185, "epoch": 530} {"train_loss": -31.317462921142578, "global_step": 64186, "epoch": 530} {"train_loss": -32.87043380737305, "global_step": 64187, "epoch": 530} {"train_loss": -33.854835510253906, "global_step": 64188, "epoch": 530} {"train_loss": -32.646724700927734, "global_step": 64189, "epoch": 530} {"train_loss": -35.19557189941406, "global_step": 64190, "epoch": 530} {"train_loss": -32.53986740112305, "global_step": 64191, "epoch": 530} {"train_loss": -34.251644134521484, "global_step": 64192, "epoch": 530} {"train_loss": -33.91135787963867, "global_step": 64193, "epoch": 530} {"train_loss": -34.81787109375, "global_step": 64194, "epoch": 530} {"train_loss": -34.38859558105469, "global_step": 64195, "epoch": 530} {"train_loss": -35.57636642456055, "global_step": 64196, "epoch": 530} {"train_loss": -34.60182571411133, "global_step": 64197, "epoch": 530} {"train_loss": -35.02267074584961, "global_step": 64198, "epoch": 530} {"train_loss": -35.65053176879883, "global_step": 64199, "epoch": 530} {"train_loss": -35.777374267578125, "global_step": 64200, "epoch": 530} {"train_loss": -35.28078842163086, "global_step": 64201, "epoch": 530} {"train_loss": -35.68246078491211, "global_step": 64202, "epoch": 530} {"train_loss": -36.0039176940918, "global_step": 64203, "epoch": 530} {"train_loss": -35.83572769165039, "global_step": 64204, "epoch": 530} {"train_loss": -35.72408676147461, "global_step": 64205, "epoch": 530} {"train_loss": -35.93513107299805, "global_step": 64206, "epoch": 530} {"train_loss": -36.03377914428711, "global_step": 64207, "epoch": 530} {"train_loss": -35.285987854003906, "global_step": 64208, "epoch": 530} {"train_loss": -35.554527282714844, "global_step": 64209, "epoch": 530} {"train_loss": -35.51398849487305, "global_step": 64210, "epoch": 530} {"train_loss": -35.85777282714844, "global_step": 64211, "epoch": 530} {"train_loss": -35.685264587402344, "global_step": 64212, "epoch": 530} {"train_loss": -36.05414962768555, "global_step": 64213, "epoch": 530} {"train_loss": -36.07601547241211, "global_step": 64214, "epoch": 530} {"train_loss": -36.26619338989258, "global_step": 64215, "epoch": 530} {"train_loss": -36.067420959472656, "global_step": 64216, "epoch": 530} {"train_loss": -36.106746673583984, "global_step": 64217, "epoch": 530} {"train_loss": -36.51542663574219, "global_step": 64218, "epoch": 530} {"train_loss": -36.398799896240234, "global_step": 64219, "epoch": 530} {"train_loss": -36.16598129272461, "global_step": 64220, "epoch": 530} {"train_loss": -35.89449691772461, "global_step": 64221, "epoch": 530} {"train_loss": -36.36077880859375, "global_step": 64222, "epoch": 530} {"train_loss": -35.90052032470703, "global_step": 64223, "epoch": 530} {"train_loss": -36.50252914428711, "global_step": 64224, "epoch": 530} {"train_loss": -36.40251541137695, "global_step": 64225, "epoch": 530} {"train_loss": -36.131954193115234, "global_step": 64226, "epoch": 530} {"train_loss": -36.48845672607422, "global_step": 64227, "epoch": 530} {"train_loss": -36.4935417175293, "global_step": 64228, "epoch": 530} {"train_loss": -36.236141204833984, "global_step": 64229, "epoch": 530} {"train_loss": -36.69194412231445, "global_step": 64230, "epoch": 530} {"train_loss": -36.7055778503418, "global_step": 64231, "epoch": 530} {"train_loss": -36.131832122802734, "global_step": 64232, "epoch": 530} {"train_loss": -36.852508544921875, "global_step": 64233, "epoch": 530} {"train_loss": -36.11272048950195, "global_step": 64234, "epoch": 530} {"train_loss": -36.020999908447266, "global_step": 64235, "epoch": 530} {"train_loss": -36.436946868896484, "global_step": 64236, "epoch": 530} {"train_loss": -36.095924377441406, "global_step": 64237, "epoch": 530} {"train_loss": -35.51862716674805, "global_step": 64238, "epoch": 530} {"train_loss": -36.42363357543945, "global_step": 64239, "epoch": 530} {"train_loss": -36.42755126953125, "global_step": 64240, "epoch": 530} {"train_loss": -36.393123626708984, "global_step": 64241, "epoch": 530} {"train_loss": -36.4682731628418, "global_step": 64242, "epoch": 530} {"train_loss": -37.066810607910156, "global_step": 64243, "epoch": 530} {"train_loss": -36.72663497924805, "global_step": 64244, "epoch": 530} {"train_loss": -36.52291488647461, "global_step": 64245, "epoch": 530} {"train_loss": -35.72479248046875, "global_step": 64246, "epoch": 530} {"train_loss": -35.83683395385742, "global_step": 64247, "epoch": 530} {"train_loss": -34.59153366088867, "global_step": 64248, "epoch": 530} {"train_loss": -35.26833724975586, "global_step": 64249, "epoch": 530} {"train_loss": -34.84012014215643, "global_step": 64250, "epoch": 530, "val_loss": 2504171.25} {"train_loss": -31.646835327148438, "global_step": 64251, "epoch": 531} {"train_loss": -28.516992568969727, "global_step": 64252, "epoch": 531} {"train_loss": -14.14292049407959, "global_step": 64253, "epoch": 531} {"train_loss": 4.774393558502197, "global_step": 64254, "epoch": 531} {"train_loss": -19.360929489135742, "global_step": 64255, "epoch": 531} {"train_loss": -32.915462493896484, "global_step": 64256, "epoch": 531} {"train_loss": -24.670867919921875, "global_step": 64257, "epoch": 531} {"train_loss": -30.731689453125, "global_step": 64258, "epoch": 531} {"train_loss": -29.687458038330078, "global_step": 64259, "epoch": 531} {"train_loss": -30.5831241607666, "global_step": 64260, "epoch": 531} {"train_loss": -35.02677536010742, "global_step": 64261, "epoch": 531} {"train_loss": -32.752254486083984, "global_step": 64262, "epoch": 531} {"train_loss": -33.257015228271484, "global_step": 64263, "epoch": 531} {"train_loss": -34.5722770690918, "global_step": 64264, "epoch": 531} {"train_loss": -33.97590637207031, "global_step": 64265, "epoch": 531} {"train_loss": -33.909664154052734, "global_step": 64266, "epoch": 531} {"train_loss": -33.8133659362793, "global_step": 64267, "epoch": 531} {"train_loss": -35.21867752075195, "global_step": 64268, "epoch": 531} {"train_loss": -34.67131423950195, "global_step": 64269, "epoch": 531} {"train_loss": -34.32870864868164, "global_step": 64270, "epoch": 531} {"train_loss": -35.067867279052734, "global_step": 64271, "epoch": 531} {"train_loss": -35.17629623413086, "global_step": 64272, "epoch": 531} {"train_loss": -35.63778305053711, "global_step": 64273, "epoch": 531} {"train_loss": -34.98176193237305, "global_step": 64274, "epoch": 531} {"train_loss": -35.23410415649414, "global_step": 64275, "epoch": 531} {"train_loss": -35.24752426147461, "global_step": 64276, "epoch": 531} {"train_loss": -35.48110580444336, "global_step": 64277, "epoch": 531} {"train_loss": -35.43498992919922, "global_step": 64278, "epoch": 531} {"train_loss": -35.04079055786133, "global_step": 64279, "epoch": 531} {"train_loss": -34.79940414428711, "global_step": 64280, "epoch": 531} {"train_loss": -35.22783660888672, "global_step": 64281, "epoch": 531} {"train_loss": -35.75092315673828, "global_step": 64282, "epoch": 531} {"train_loss": -35.64788818359375, "global_step": 64283, "epoch": 531} {"train_loss": -35.799659729003906, "global_step": 64284, "epoch": 531} {"train_loss": -34.88218307495117, "global_step": 64285, "epoch": 531} {"train_loss": -35.54940414428711, "global_step": 64286, "epoch": 531} {"train_loss": -35.297908782958984, "global_step": 64287, "epoch": 531} {"train_loss": -36.189613342285156, "global_step": 64288, "epoch": 531} {"train_loss": -34.98643112182617, "global_step": 64289, "epoch": 531} {"train_loss": -35.07246398925781, "global_step": 64290, "epoch": 531} {"train_loss": -35.677467346191406, "global_step": 64291, "epoch": 531} {"train_loss": -35.30764389038086, "global_step": 64292, "epoch": 531} {"train_loss": -35.632476806640625, "global_step": 64293, "epoch": 531} {"train_loss": -35.81869125366211, "global_step": 64294, "epoch": 531} {"train_loss": -35.96807098388672, "global_step": 64295, "epoch": 531} {"train_loss": -35.65828323364258, "global_step": 64296, "epoch": 531} {"train_loss": -35.94386291503906, "global_step": 64297, "epoch": 531} {"train_loss": -36.2503776550293, "global_step": 64298, "epoch": 531} {"train_loss": -36.244483947753906, "global_step": 64299, "epoch": 531} {"train_loss": -36.299949645996094, "global_step": 64300, "epoch": 531} {"train_loss": -35.76148986816406, "global_step": 64301, "epoch": 531} {"train_loss": -36.05097961425781, "global_step": 64302, "epoch": 531} {"train_loss": -35.78363037109375, "global_step": 64303, "epoch": 531} {"train_loss": -36.33539962768555, "global_step": 64304, "epoch": 531} {"train_loss": -35.5909309387207, "global_step": 64305, "epoch": 531} {"train_loss": -36.6084098815918, "global_step": 64306, "epoch": 531} {"train_loss": -35.894935607910156, "global_step": 64307, "epoch": 531} {"train_loss": -36.1971435546875, "global_step": 64308, "epoch": 531} {"train_loss": -36.25723648071289, "global_step": 64309, "epoch": 531} {"train_loss": -36.4367561340332, "global_step": 64310, "epoch": 531} {"train_loss": -35.11054992675781, "global_step": 64311, "epoch": 531} {"train_loss": -35.754547119140625, "global_step": 64312, "epoch": 531} {"train_loss": -36.452972412109375, "global_step": 64313, "epoch": 531} {"train_loss": -35.134578704833984, "global_step": 64314, "epoch": 531} {"train_loss": -36.053924560546875, "global_step": 64315, "epoch": 531} {"train_loss": -35.80239486694336, "global_step": 64316, "epoch": 531} {"train_loss": -36.211944580078125, "global_step": 64317, "epoch": 531} {"train_loss": -36.3482551574707, "global_step": 64318, "epoch": 531} {"train_loss": -36.35171127319336, "global_step": 64319, "epoch": 531} {"train_loss": -36.60225296020508, "global_step": 64320, "epoch": 531} {"train_loss": -35.759254455566406, "global_step": 64321, "epoch": 531} {"train_loss": -35.959190368652344, "global_step": 64322, "epoch": 531} {"train_loss": -36.51399612426758, "global_step": 64323, "epoch": 531} {"train_loss": -35.940101623535156, "global_step": 64324, "epoch": 531} {"train_loss": -36.11128234863281, "global_step": 64325, "epoch": 531} {"train_loss": -36.5601921081543, "global_step": 64326, "epoch": 531} {"train_loss": -36.468360900878906, "global_step": 64327, "epoch": 531} {"train_loss": -36.77724838256836, "global_step": 64328, "epoch": 531} {"train_loss": -36.52457809448242, "global_step": 64329, "epoch": 531} {"train_loss": -36.13801193237305, "global_step": 64330, "epoch": 531} {"train_loss": -36.5523567199707, "global_step": 64331, "epoch": 531} {"train_loss": -35.92353439331055, "global_step": 64332, "epoch": 531} {"train_loss": -36.5864143371582, "global_step": 64333, "epoch": 531} {"train_loss": -36.341033935546875, "global_step": 64334, "epoch": 531} {"train_loss": -35.50051498413086, "global_step": 64335, "epoch": 531} {"train_loss": -36.01929473876953, "global_step": 64336, "epoch": 531} {"train_loss": -36.75672149658203, "global_step": 64337, "epoch": 531} {"train_loss": -35.91602325439453, "global_step": 64338, "epoch": 531} {"train_loss": -35.484981536865234, "global_step": 64339, "epoch": 531} {"train_loss": -36.45402908325195, "global_step": 64340, "epoch": 531} {"train_loss": -36.636043548583984, "global_step": 64341, "epoch": 531} {"train_loss": -33.91033935546875, "global_step": 64342, "epoch": 531} {"train_loss": -36.64200973510742, "global_step": 64343, "epoch": 531} {"train_loss": -36.03795623779297, "global_step": 64344, "epoch": 531} {"train_loss": -35.569122314453125, "global_step": 64345, "epoch": 531} {"train_loss": -24.92046356201172, "global_step": 64346, "epoch": 531} {"train_loss": -34.60761260986328, "global_step": 64347, "epoch": 531} {"train_loss": -30.816701889038086, "global_step": 64348, "epoch": 531} {"train_loss": -32.5119514465332, "global_step": 64349, "epoch": 531} {"train_loss": -21.413007736206055, "global_step": 64350, "epoch": 531} {"train_loss": -28.445051193237305, "global_step": 64351, "epoch": 531} {"train_loss": -29.83460807800293, "global_step": 64352, "epoch": 531} {"train_loss": -25.832693099975586, "global_step": 64353, "epoch": 531} {"train_loss": -32.1480827331543, "global_step": 64354, "epoch": 531} {"train_loss": -23.381847381591797, "global_step": 64355, "epoch": 531} {"train_loss": -29.37262535095215, "global_step": 64356, "epoch": 531} {"train_loss": -31.76255226135254, "global_step": 64357, "epoch": 531} {"train_loss": -29.19476318359375, "global_step": 64358, "epoch": 531} {"train_loss": -30.758686065673828, "global_step": 64359, "epoch": 531} {"train_loss": -31.7531681060791, "global_step": 64360, "epoch": 531} {"train_loss": -30.856033325195312, "global_step": 64361, "epoch": 531} {"train_loss": -30.616180419921875, "global_step": 64362, "epoch": 531} {"train_loss": -33.92816925048828, "global_step": 64363, "epoch": 531} {"train_loss": -32.63434982299805, "global_step": 64364, "epoch": 531} {"train_loss": -31.9654598236084, "global_step": 64365, "epoch": 531} {"train_loss": -31.000646591186523, "global_step": 64366, "epoch": 531} {"train_loss": -32.85114669799805, "global_step": 64367, "epoch": 531} {"train_loss": -31.744089126586914, "global_step": 64368, "epoch": 531} {"train_loss": -32.316959381103516, "global_step": 64369, "epoch": 531} {"train_loss": -32.90963363647461, "global_step": 64370, "epoch": 531} {"train_loss": -33.54350659472883, "global_step": 64371, "epoch": 531, "val_loss": 2691270.0} {"train_loss": -32.445613861083984, "global_step": 64372, "epoch": 532} {"train_loss": -33.01454544067383, "global_step": 64373, "epoch": 532} {"train_loss": -32.39337921142578, "global_step": 64374, "epoch": 532} {"train_loss": -32.970943450927734, "global_step": 64375, "epoch": 532} {"train_loss": -32.2717170715332, "global_step": 64376, "epoch": 532} {"train_loss": -32.704551696777344, "global_step": 64377, "epoch": 532} {"train_loss": -33.16228103637695, "global_step": 64378, "epoch": 532} {"train_loss": -32.968502044677734, "global_step": 64379, "epoch": 532} {"train_loss": -33.91059112548828, "global_step": 64380, "epoch": 532} {"train_loss": -33.19757843017578, "global_step": 64381, "epoch": 532} {"train_loss": -33.609615325927734, "global_step": 64382, "epoch": 532} {"train_loss": -33.61476516723633, "global_step": 64383, "epoch": 532} {"train_loss": -33.86475372314453, "global_step": 64384, "epoch": 532} {"train_loss": -33.36837387084961, "global_step": 64385, "epoch": 532} {"train_loss": -33.73427963256836, "global_step": 64386, "epoch": 532} {"train_loss": -33.761085510253906, "global_step": 64387, "epoch": 532} {"train_loss": -33.56063461303711, "global_step": 64388, "epoch": 532} {"train_loss": -32.489540100097656, "global_step": 64389, "epoch": 532} {"train_loss": -33.81541061401367, "global_step": 64390, "epoch": 532} {"train_loss": -33.27202224731445, "global_step": 64391, "epoch": 532} {"train_loss": -34.34211730957031, "global_step": 64392, "epoch": 532} {"train_loss": -33.89750289916992, "global_step": 64393, "epoch": 532} {"train_loss": -34.07429122924805, "global_step": 64394, "epoch": 532} {"train_loss": -34.78919219970703, "global_step": 64395, "epoch": 532} {"train_loss": -34.642059326171875, "global_step": 64396, "epoch": 532} {"train_loss": -34.648406982421875, "global_step": 64397, "epoch": 532} {"train_loss": -34.77494430541992, "global_step": 64398, "epoch": 532} {"train_loss": -34.655086517333984, "global_step": 64399, "epoch": 532} {"train_loss": -34.6693000793457, "global_step": 64400, "epoch": 532} {"train_loss": -34.38804244995117, "global_step": 64401, "epoch": 532} {"train_loss": -34.91850662231445, "global_step": 64402, "epoch": 532} {"train_loss": -34.83208084106445, "global_step": 64403, "epoch": 532} {"train_loss": -34.61085510253906, "global_step": 64404, "epoch": 532} {"train_loss": -34.80801010131836, "global_step": 64405, "epoch": 532} {"train_loss": -35.26240921020508, "global_step": 64406, "epoch": 532} {"train_loss": -35.26142501831055, "global_step": 64407, "epoch": 532} {"train_loss": -35.058956146240234, "global_step": 64408, "epoch": 532} {"train_loss": -35.125526428222656, "global_step": 64409, "epoch": 532} {"train_loss": -35.140506744384766, "global_step": 64410, "epoch": 532} {"train_loss": -35.037933349609375, "global_step": 64411, "epoch": 532} {"train_loss": -35.45498275756836, "global_step": 64412, "epoch": 532} {"train_loss": -34.965267181396484, "global_step": 64413, "epoch": 532} {"train_loss": -35.40787887573242, "global_step": 64414, "epoch": 532} {"train_loss": -35.581912994384766, "global_step": 64415, "epoch": 532} {"train_loss": -35.138938903808594, "global_step": 64416, "epoch": 532} {"train_loss": -35.47298812866211, "global_step": 64417, "epoch": 532} {"train_loss": -35.45370101928711, "global_step": 64418, "epoch": 532} {"train_loss": -35.6463623046875, "global_step": 64419, "epoch": 532} {"train_loss": -35.573307037353516, "global_step": 64420, "epoch": 532} {"train_loss": -35.55501937866211, "global_step": 64421, "epoch": 532} {"train_loss": -35.12839889526367, "global_step": 64422, "epoch": 532} {"train_loss": -35.50246810913086, "global_step": 64423, "epoch": 532} {"train_loss": -35.31668472290039, "global_step": 64424, "epoch": 532} {"train_loss": -35.73944091796875, "global_step": 64425, "epoch": 532} {"train_loss": -35.82570266723633, "global_step": 64426, "epoch": 532} {"train_loss": -35.8282470703125, "global_step": 64427, "epoch": 532} {"train_loss": -36.0321159362793, "global_step": 64428, "epoch": 532} {"train_loss": -35.8094482421875, "global_step": 64429, "epoch": 532} {"train_loss": -35.81587600708008, "global_step": 64430, "epoch": 532} {"train_loss": -36.4446907043457, "global_step": 64431, "epoch": 532} {"train_loss": -36.02357482910156, "global_step": 64432, "epoch": 532} {"train_loss": -36.41109085083008, "global_step": 64433, "epoch": 532} {"train_loss": -36.22761917114258, "global_step": 64434, "epoch": 532} {"train_loss": -36.23014450073242, "global_step": 64435, "epoch": 532} {"train_loss": -36.252803802490234, "global_step": 64436, "epoch": 532} {"train_loss": -36.04111862182617, "global_step": 64437, "epoch": 532} {"train_loss": -36.20119857788086, "global_step": 64438, "epoch": 532} {"train_loss": -36.10158157348633, "global_step": 64439, "epoch": 532} {"train_loss": -36.21305465698242, "global_step": 64440, "epoch": 532} {"train_loss": -36.41341018676758, "global_step": 64441, "epoch": 532} {"train_loss": -36.5095329284668, "global_step": 64442, "epoch": 532} {"train_loss": -36.388221740722656, "global_step": 64443, "epoch": 532} {"train_loss": -36.57547378540039, "global_step": 64444, "epoch": 532} {"train_loss": -36.24888610839844, "global_step": 64445, "epoch": 532} {"train_loss": -36.15314865112305, "global_step": 64446, "epoch": 532} {"train_loss": -36.09547424316406, "global_step": 64447, "epoch": 532} {"train_loss": -35.97671127319336, "global_step": 64448, "epoch": 532} {"train_loss": -34.755584716796875, "global_step": 64449, "epoch": 532} {"train_loss": -34.46165084838867, "global_step": 64450, "epoch": 532} {"train_loss": -31.139331817626953, "global_step": 64451, "epoch": 532} {"train_loss": -28.032323837280273, "global_step": 64452, "epoch": 532} {"train_loss": -16.582626342773438, "global_step": 64453, "epoch": 532} {"train_loss": -7.963305950164795, "global_step": 64454, "epoch": 532} {"train_loss": -28.853612899780273, "global_step": 64455, "epoch": 532} {"train_loss": -33.05967330932617, "global_step": 64456, "epoch": 532} {"train_loss": -25.26902198791504, "global_step": 64457, "epoch": 532} {"train_loss": -34.03593826293945, "global_step": 64458, "epoch": 532} {"train_loss": -30.766494750976562, "global_step": 64459, "epoch": 532} {"train_loss": -33.99357223510742, "global_step": 64460, "epoch": 532} {"train_loss": -31.036575317382812, "global_step": 64461, "epoch": 532} {"train_loss": -34.21697998046875, "global_step": 64462, "epoch": 532} {"train_loss": -33.0533561706543, "global_step": 64463, "epoch": 532} {"train_loss": -30.942707061767578, "global_step": 64464, "epoch": 532} {"train_loss": -33.307926177978516, "global_step": 64465, "epoch": 532} {"train_loss": -33.59270095825195, "global_step": 64466, "epoch": 532} {"train_loss": -33.8859977722168, "global_step": 64467, "epoch": 532} {"train_loss": -34.5775260925293, "global_step": 64468, "epoch": 532} {"train_loss": -33.09258270263672, "global_step": 64469, "epoch": 532} {"train_loss": -34.29365921020508, "global_step": 64470, "epoch": 532} {"train_loss": -33.96271896362305, "global_step": 64471, "epoch": 532} {"train_loss": -33.4852180480957, "global_step": 64472, "epoch": 532} {"train_loss": -33.99392318725586, "global_step": 64473, "epoch": 532} {"train_loss": -34.37822341918945, "global_step": 64474, "epoch": 532} {"train_loss": -33.3580436706543, "global_step": 64475, "epoch": 532} {"train_loss": -33.39924240112305, "global_step": 64476, "epoch": 532} {"train_loss": -35.07166290283203, "global_step": 64477, "epoch": 532} {"train_loss": -34.294612884521484, "global_step": 64478, "epoch": 532} {"train_loss": -35.14536666870117, "global_step": 64479, "epoch": 532} {"train_loss": -33.73805236816406, "global_step": 64480, "epoch": 532} {"train_loss": -35.242515563964844, "global_step": 64481, "epoch": 532} {"train_loss": -33.9490966796875, "global_step": 64482, "epoch": 532} {"train_loss": -34.63767623901367, "global_step": 64483, "epoch": 532} {"train_loss": -35.141761779785156, "global_step": 64484, "epoch": 532} {"train_loss": -34.696556091308594, "global_step": 64485, "epoch": 532} {"train_loss": -35.1911506652832, "global_step": 64486, "epoch": 532} {"train_loss": -35.53642654418945, "global_step": 64487, "epoch": 532} {"train_loss": -35.739051818847656, "global_step": 64488, "epoch": 532} {"train_loss": -35.26205062866211, "global_step": 64489, "epoch": 532} {"train_loss": -35.04998779296875, "global_step": 64490, "epoch": 532} {"train_loss": -35.96405029296875, "global_step": 64491, "epoch": 532} {"train_loss": -34.056155003792, "global_step": 64492, "epoch": 532, "val_loss": 2423431.75} {"train_loss": -35.302608489990234, "global_step": 64493, "epoch": 533} {"train_loss": -35.83583450317383, "global_step": 64494, "epoch": 533} {"train_loss": -35.46659469604492, "global_step": 64495, "epoch": 533} {"train_loss": -35.81149673461914, "global_step": 64496, "epoch": 533} {"train_loss": -35.68692398071289, "global_step": 64497, "epoch": 533} {"train_loss": -36.29020309448242, "global_step": 64498, "epoch": 533} {"train_loss": -35.97459030151367, "global_step": 64499, "epoch": 533} {"train_loss": -35.9443244934082, "global_step": 64500, "epoch": 533} {"train_loss": -36.10881423950195, "global_step": 64501, "epoch": 533} {"train_loss": -35.90354919433594, "global_step": 64502, "epoch": 533} {"train_loss": -36.023319244384766, "global_step": 64503, "epoch": 533} {"train_loss": -36.20090866088867, "global_step": 64504, "epoch": 533} {"train_loss": -36.43577194213867, "global_step": 64505, "epoch": 533} {"train_loss": -36.101219177246094, "global_step": 64506, "epoch": 533} {"train_loss": -36.06353759765625, "global_step": 64507, "epoch": 533} {"train_loss": -36.043453216552734, "global_step": 64508, "epoch": 533} {"train_loss": -36.3753776550293, "global_step": 64509, "epoch": 533} {"train_loss": -36.79806137084961, "global_step": 64510, "epoch": 533} {"train_loss": -36.71698760986328, "global_step": 64511, "epoch": 533} {"train_loss": -36.66654586791992, "global_step": 64512, "epoch": 533} {"train_loss": -36.34444808959961, "global_step": 64513, "epoch": 533} {"train_loss": -35.80862808227539, "global_step": 64514, "epoch": 533} {"train_loss": -36.596466064453125, "global_step": 64515, "epoch": 533} {"train_loss": -36.3966178894043, "global_step": 64516, "epoch": 533} {"train_loss": -36.963741302490234, "global_step": 64517, "epoch": 533} {"train_loss": -37.01607894897461, "global_step": 64518, "epoch": 533} {"train_loss": -36.49300765991211, "global_step": 64519, "epoch": 533} {"train_loss": -36.676876068115234, "global_step": 64520, "epoch": 533} {"train_loss": -36.59616470336914, "global_step": 64521, "epoch": 533} {"train_loss": -36.805877685546875, "global_step": 64522, "epoch": 533} {"train_loss": -36.943580627441406, "global_step": 64523, "epoch": 533} {"train_loss": -36.67739486694336, "global_step": 64524, "epoch": 533} {"train_loss": -36.912601470947266, "global_step": 64525, "epoch": 533} {"train_loss": -36.94012451171875, "global_step": 64526, "epoch": 533} {"train_loss": -36.382511138916016, "global_step": 64527, "epoch": 533} {"train_loss": -37.109580993652344, "global_step": 64528, "epoch": 533} {"train_loss": -36.3839111328125, "global_step": 64529, "epoch": 533} {"train_loss": -35.8141975402832, "global_step": 64530, "epoch": 533} {"train_loss": -37.03811264038086, "global_step": 64531, "epoch": 533} {"train_loss": -36.794185638427734, "global_step": 64532, "epoch": 533} {"train_loss": -37.18311309814453, "global_step": 64533, "epoch": 533} {"train_loss": -37.26241683959961, "global_step": 64534, "epoch": 533} {"train_loss": -37.08218765258789, "global_step": 64535, "epoch": 533} {"train_loss": -36.88375473022461, "global_step": 64536, "epoch": 533} {"train_loss": -37.02960968017578, "global_step": 64537, "epoch": 533} {"train_loss": -36.06509017944336, "global_step": 64538, "epoch": 533} {"train_loss": -36.94765853881836, "global_step": 64539, "epoch": 533} {"train_loss": -36.6364860534668, "global_step": 64540, "epoch": 533} {"train_loss": -36.776790618896484, "global_step": 64541, "epoch": 533} {"train_loss": -37.13833236694336, "global_step": 64542, "epoch": 533} {"train_loss": -36.185455322265625, "global_step": 64543, "epoch": 533} {"train_loss": -36.03494644165039, "global_step": 64544, "epoch": 533} {"train_loss": -37.245479583740234, "global_step": 64545, "epoch": 533} {"train_loss": -36.48110580444336, "global_step": 64546, "epoch": 533} {"train_loss": -35.73735427856445, "global_step": 64547, "epoch": 533} {"train_loss": -35.0450553894043, "global_step": 64548, "epoch": 533} {"train_loss": -36.640411376953125, "global_step": 64549, "epoch": 533} {"train_loss": -36.354347229003906, "global_step": 64550, "epoch": 533} {"train_loss": -35.14614486694336, "global_step": 64551, "epoch": 533} {"train_loss": -35.015647888183594, "global_step": 64552, "epoch": 533} {"train_loss": -36.242916107177734, "global_step": 64553, "epoch": 533} {"train_loss": -33.2561149597168, "global_step": 64554, "epoch": 533} {"train_loss": -35.230892181396484, "global_step": 64555, "epoch": 533} {"train_loss": -35.9615478515625, "global_step": 64556, "epoch": 533} {"train_loss": -35.67493438720703, "global_step": 64557, "epoch": 533} {"train_loss": -35.78617477416992, "global_step": 64558, "epoch": 533} {"train_loss": -35.16575241088867, "global_step": 64559, "epoch": 533} {"train_loss": -35.66421127319336, "global_step": 64560, "epoch": 533} {"train_loss": -33.64677429199219, "global_step": 64561, "epoch": 533} {"train_loss": -34.64296340942383, "global_step": 64562, "epoch": 533} {"train_loss": -35.54551696777344, "global_step": 64563, "epoch": 533} {"train_loss": -34.573333740234375, "global_step": 64564, "epoch": 533} {"train_loss": -34.664466857910156, "global_step": 64565, "epoch": 533} {"train_loss": -35.64045715332031, "global_step": 64566, "epoch": 533} {"train_loss": -33.423336029052734, "global_step": 64567, "epoch": 533} {"train_loss": -34.56098556518555, "global_step": 64568, "epoch": 533} {"train_loss": -35.76638412475586, "global_step": 64569, "epoch": 533} {"train_loss": -34.223236083984375, "global_step": 64570, "epoch": 533} {"train_loss": -36.10146713256836, "global_step": 64571, "epoch": 533} {"train_loss": -34.8213005065918, "global_step": 64572, "epoch": 533} {"train_loss": -35.545406341552734, "global_step": 64573, "epoch": 533} {"train_loss": -35.28948974609375, "global_step": 64574, "epoch": 533} {"train_loss": -35.2482795715332, "global_step": 64575, "epoch": 533} {"train_loss": -36.132293701171875, "global_step": 64576, "epoch": 533} {"train_loss": -35.86432647705078, "global_step": 64577, "epoch": 533} {"train_loss": -35.63758087158203, "global_step": 64578, "epoch": 533} {"train_loss": -34.83561325073242, "global_step": 64579, "epoch": 533} {"train_loss": -36.18854904174805, "global_step": 64580, "epoch": 533} {"train_loss": -36.09197998046875, "global_step": 64581, "epoch": 533} {"train_loss": -35.61161804199219, "global_step": 64582, "epoch": 533} {"train_loss": -36.727203369140625, "global_step": 64583, "epoch": 533} {"train_loss": -36.51552200317383, "global_step": 64584, "epoch": 533} {"train_loss": -36.16804885864258, "global_step": 64585, "epoch": 533} {"train_loss": -36.604652404785156, "global_step": 64586, "epoch": 533} {"train_loss": -36.073211669921875, "global_step": 64587, "epoch": 533} {"train_loss": -36.472347259521484, "global_step": 64588, "epoch": 533} {"train_loss": -35.00043487548828, "global_step": 64589, "epoch": 533} {"train_loss": -36.6858024597168, "global_step": 64590, "epoch": 533} {"train_loss": -35.55207443237305, "global_step": 64591, "epoch": 533} {"train_loss": -36.35791778564453, "global_step": 64592, "epoch": 533} {"train_loss": -36.630374908447266, "global_step": 64593, "epoch": 533} {"train_loss": -36.14826583862305, "global_step": 64594, "epoch": 533} {"train_loss": -36.15793991088867, "global_step": 64595, "epoch": 533} {"train_loss": -36.93088912963867, "global_step": 64596, "epoch": 533} {"train_loss": -36.67320251464844, "global_step": 64597, "epoch": 533} {"train_loss": -36.81685256958008, "global_step": 64598, "epoch": 533} {"train_loss": -36.40583801269531, "global_step": 64599, "epoch": 533} {"train_loss": -36.79624557495117, "global_step": 64600, "epoch": 533} {"train_loss": -36.15694046020508, "global_step": 64601, "epoch": 533} {"train_loss": -36.983219146728516, "global_step": 64602, "epoch": 533} {"train_loss": -36.57768249511719, "global_step": 64603, "epoch": 533} {"train_loss": -37.062660217285156, "global_step": 64604, "epoch": 533} {"train_loss": -36.36037063598633, "global_step": 64605, "epoch": 533} {"train_loss": -37.10078048706055, "global_step": 64606, "epoch": 533} {"train_loss": -36.65418243408203, "global_step": 64607, "epoch": 533} {"train_loss": -36.91115951538086, "global_step": 64608, "epoch": 533} {"train_loss": -36.383872985839844, "global_step": 64609, "epoch": 533} {"train_loss": -35.53080368041992, "global_step": 64610, "epoch": 533} {"train_loss": -36.326171875, "global_step": 64611, "epoch": 533} {"train_loss": -36.521881103515625, "global_step": 64612, "epoch": 533} {"train_loss": -36.12069339594565, "global_step": 64613, "epoch": 533, "val_loss": 2433441.0} {"train_loss": -37.17068099975586, "global_step": 64614, "epoch": 534} {"train_loss": -36.79235076904297, "global_step": 64615, "epoch": 534} {"train_loss": -37.109989166259766, "global_step": 64616, "epoch": 534} {"train_loss": -35.8248405456543, "global_step": 64617, "epoch": 534} {"train_loss": -36.91472244262695, "global_step": 64618, "epoch": 534} {"train_loss": -36.71987533569336, "global_step": 64619, "epoch": 534} {"train_loss": -36.8904914855957, "global_step": 64620, "epoch": 534} {"train_loss": -37.205020904541016, "global_step": 64621, "epoch": 534} {"train_loss": -36.931026458740234, "global_step": 64622, "epoch": 534} {"train_loss": -36.896480560302734, "global_step": 64623, "epoch": 534} {"train_loss": -36.93168258666992, "global_step": 64624, "epoch": 534} {"train_loss": -37.03086471557617, "global_step": 64625, "epoch": 534} {"train_loss": -37.13815689086914, "global_step": 64626, "epoch": 534} {"train_loss": -37.37713623046875, "global_step": 64627, "epoch": 534} {"train_loss": -37.39057922363281, "global_step": 64628, "epoch": 534} {"train_loss": -36.93571090698242, "global_step": 64629, "epoch": 534} {"train_loss": -37.26777267456055, "global_step": 64630, "epoch": 534} {"train_loss": -36.86112594604492, "global_step": 64631, "epoch": 534} {"train_loss": -36.912696838378906, "global_step": 64632, "epoch": 534} {"train_loss": -36.552146911621094, "global_step": 64633, "epoch": 534} {"train_loss": -36.94550323486328, "global_step": 64634, "epoch": 534} {"train_loss": -35.24348068237305, "global_step": 64635, "epoch": 534} {"train_loss": -35.560951232910156, "global_step": 64636, "epoch": 534} {"train_loss": -36.2668571472168, "global_step": 64637, "epoch": 534} {"train_loss": -34.009788513183594, "global_step": 64638, "epoch": 534} {"train_loss": -37.218868255615234, "global_step": 64639, "epoch": 534} {"train_loss": -35.68323516845703, "global_step": 64640, "epoch": 534} {"train_loss": -36.555580139160156, "global_step": 64641, "epoch": 534} {"train_loss": -34.4193229675293, "global_step": 64642, "epoch": 534} {"train_loss": -36.09259796142578, "global_step": 64643, "epoch": 534} {"train_loss": -35.627681732177734, "global_step": 64644, "epoch": 534} {"train_loss": -36.27046203613281, "global_step": 64645, "epoch": 534} {"train_loss": -35.31266403198242, "global_step": 64646, "epoch": 534} {"train_loss": -34.7676887512207, "global_step": 64647, "epoch": 534} {"train_loss": -34.013336181640625, "global_step": 64648, "epoch": 534} {"train_loss": -36.81917953491211, "global_step": 64649, "epoch": 534} {"train_loss": -35.87318801879883, "global_step": 64650, "epoch": 534} {"train_loss": -33.47908020019531, "global_step": 64651, "epoch": 534} {"train_loss": -27.779296875, "global_step": 64652, "epoch": 534} {"train_loss": -29.174535751342773, "global_step": 64653, "epoch": 534} {"train_loss": -36.842445373535156, "global_step": 64654, "epoch": 534} {"train_loss": -29.858739852905273, "global_step": 64655, "epoch": 534} {"train_loss": -32.861724853515625, "global_step": 64656, "epoch": 534} {"train_loss": -35.84495162963867, "global_step": 64657, "epoch": 534} {"train_loss": -32.89299011230469, "global_step": 64658, "epoch": 534} {"train_loss": -36.2401008605957, "global_step": 64659, "epoch": 534} {"train_loss": -34.114009857177734, "global_step": 64660, "epoch": 534} {"train_loss": -36.37265396118164, "global_step": 64661, "epoch": 534} {"train_loss": -34.100643157958984, "global_step": 64662, "epoch": 534} {"train_loss": -36.454524993896484, "global_step": 64663, "epoch": 534} {"train_loss": -34.95234298706055, "global_step": 64664, "epoch": 534} {"train_loss": -36.70309066772461, "global_step": 64665, "epoch": 534} {"train_loss": -35.29376983642578, "global_step": 64666, "epoch": 534} {"train_loss": -36.7033805847168, "global_step": 64667, "epoch": 534} {"train_loss": -35.22587966918945, "global_step": 64668, "epoch": 534} {"train_loss": -36.710235595703125, "global_step": 64669, "epoch": 534} {"train_loss": -35.495792388916016, "global_step": 64670, "epoch": 534} {"train_loss": -36.595821380615234, "global_step": 64671, "epoch": 534} {"train_loss": -36.274356842041016, "global_step": 64672, "epoch": 534} {"train_loss": -36.7596435546875, "global_step": 64673, "epoch": 534} {"train_loss": -36.757957458496094, "global_step": 64674, "epoch": 534} {"train_loss": -36.762386322021484, "global_step": 64675, "epoch": 534} {"train_loss": -37.09637451171875, "global_step": 64676, "epoch": 534} {"train_loss": -36.28266525268555, "global_step": 64677, "epoch": 534} {"train_loss": -36.96106719970703, "global_step": 64678, "epoch": 534} {"train_loss": -36.66484451293945, "global_step": 64679, "epoch": 534} {"train_loss": -36.58642578125, "global_step": 64680, "epoch": 534} {"train_loss": -36.88932418823242, "global_step": 64681, "epoch": 534} {"train_loss": -37.04701614379883, "global_step": 64682, "epoch": 534} {"train_loss": -36.970062255859375, "global_step": 64683, "epoch": 534} {"train_loss": -36.798736572265625, "global_step": 64684, "epoch": 534} {"train_loss": -36.66622543334961, "global_step": 64685, "epoch": 534} {"train_loss": -37.410614013671875, "global_step": 64686, "epoch": 534} {"train_loss": -36.93754577636719, "global_step": 64687, "epoch": 534} {"train_loss": -36.8477897644043, "global_step": 64688, "epoch": 534} {"train_loss": -36.84031295776367, "global_step": 64689, "epoch": 534} {"train_loss": -37.1768798828125, "global_step": 64690, "epoch": 534} {"train_loss": -37.43735885620117, "global_step": 64691, "epoch": 534} {"train_loss": -36.2471809387207, "global_step": 64692, "epoch": 534} {"train_loss": -36.25974655151367, "global_step": 64693, "epoch": 534} {"train_loss": -37.124027252197266, "global_step": 64694, "epoch": 534} {"train_loss": -36.822349548339844, "global_step": 64695, "epoch": 534} {"train_loss": -36.97230911254883, "global_step": 64696, "epoch": 534} {"train_loss": -35.006195068359375, "global_step": 64697, "epoch": 534} {"train_loss": -36.63849639892578, "global_step": 64698, "epoch": 534} {"train_loss": -35.6234245300293, "global_step": 64699, "epoch": 534} {"train_loss": -36.023048400878906, "global_step": 64700, "epoch": 534} {"train_loss": -35.46186065673828, "global_step": 64701, "epoch": 534} {"train_loss": -36.06199645996094, "global_step": 64702, "epoch": 534} {"train_loss": -36.29591369628906, "global_step": 64703, "epoch": 534} {"train_loss": -36.29448699951172, "global_step": 64704, "epoch": 534} {"train_loss": -36.83900451660156, "global_step": 64705, "epoch": 534} {"train_loss": -36.55903244018555, "global_step": 64706, "epoch": 534} {"train_loss": -36.55654525756836, "global_step": 64707, "epoch": 534} {"train_loss": -36.930809020996094, "global_step": 64708, "epoch": 534} {"train_loss": -36.59407043457031, "global_step": 64709, "epoch": 534} {"train_loss": -35.43428421020508, "global_step": 64710, "epoch": 534} {"train_loss": -34.73086166381836, "global_step": 64711, "epoch": 534} {"train_loss": -33.771217346191406, "global_step": 64712, "epoch": 534} {"train_loss": -36.372230529785156, "global_step": 64713, "epoch": 534} {"train_loss": -36.590087890625, "global_step": 64714, "epoch": 534} {"train_loss": -35.77492904663086, "global_step": 64715, "epoch": 534} {"train_loss": -36.282047271728516, "global_step": 64716, "epoch": 534} {"train_loss": -36.01340866088867, "global_step": 64717, "epoch": 534} {"train_loss": -36.2944450378418, "global_step": 64718, "epoch": 534} {"train_loss": -35.440425872802734, "global_step": 64719, "epoch": 534} {"train_loss": -34.960968017578125, "global_step": 64720, "epoch": 534} {"train_loss": -37.07450485229492, "global_step": 64721, "epoch": 534} {"train_loss": -35.520599365234375, "global_step": 64722, "epoch": 534} {"train_loss": -33.913875579833984, "global_step": 64723, "epoch": 534} {"train_loss": -34.11796188354492, "global_step": 64724, "epoch": 534} {"train_loss": -34.43239212036133, "global_step": 64725, "epoch": 534} {"train_loss": -35.764007568359375, "global_step": 64726, "epoch": 534} {"train_loss": -35.39280700683594, "global_step": 64727, "epoch": 534} {"train_loss": -35.365299224853516, "global_step": 64728, "epoch": 534} {"train_loss": -36.55495071411133, "global_step": 64729, "epoch": 534} {"train_loss": -35.294837951660156, "global_step": 64730, "epoch": 534} {"train_loss": -35.475425720214844, "global_step": 64731, "epoch": 534} {"train_loss": -36.20331573486328, "global_step": 64732, "epoch": 534} {"train_loss": -35.88228988647461, "global_step": 64733, "epoch": 534} {"train_loss": -35.94909478810208, "global_step": 64734, "epoch": 534, "val_loss": 2423149.25} {"train_loss": -35.77743148803711, "global_step": 64735, "epoch": 535} {"train_loss": -36.70978927612305, "global_step": 64736, "epoch": 535} {"train_loss": -36.581417083740234, "global_step": 64737, "epoch": 535} {"train_loss": -36.400943756103516, "global_step": 64738, "epoch": 535} {"train_loss": -36.29506301879883, "global_step": 64739, "epoch": 535} {"train_loss": -36.66936111450195, "global_step": 64740, "epoch": 535} {"train_loss": -36.877498626708984, "global_step": 64741, "epoch": 535} {"train_loss": -36.90547561645508, "global_step": 64742, "epoch": 535} {"train_loss": -37.081417083740234, "global_step": 64743, "epoch": 535} {"train_loss": -36.79376220703125, "global_step": 64744, "epoch": 535} {"train_loss": -36.736995697021484, "global_step": 64745, "epoch": 535} {"train_loss": -37.18732833862305, "global_step": 64746, "epoch": 535} {"train_loss": -37.25080490112305, "global_step": 64747, "epoch": 535} {"train_loss": -37.444313049316406, "global_step": 64748, "epoch": 535} {"train_loss": -37.08262252807617, "global_step": 64749, "epoch": 535} {"train_loss": -37.26064682006836, "global_step": 64750, "epoch": 535} {"train_loss": -37.54185104370117, "global_step": 64751, "epoch": 535} {"train_loss": -37.12163543701172, "global_step": 64752, "epoch": 535} {"train_loss": -37.14262390136719, "global_step": 64753, "epoch": 535} {"train_loss": -37.27778244018555, "global_step": 64754, "epoch": 535} {"train_loss": -37.49388885498047, "global_step": 64755, "epoch": 535} {"train_loss": -37.22870635986328, "global_step": 64756, "epoch": 535} {"train_loss": -36.88654708862305, "global_step": 64757, "epoch": 535} {"train_loss": -36.86374282836914, "global_step": 64758, "epoch": 535} {"train_loss": -37.60397720336914, "global_step": 64759, "epoch": 535} {"train_loss": -37.649993896484375, "global_step": 64760, "epoch": 535} {"train_loss": -37.48088455200195, "global_step": 64761, "epoch": 535} {"train_loss": -37.095088958740234, "global_step": 64762, "epoch": 535} {"train_loss": -37.65488815307617, "global_step": 64763, "epoch": 535} {"train_loss": -37.84278106689453, "global_step": 64764, "epoch": 535} {"train_loss": -36.73452377319336, "global_step": 64765, "epoch": 535} {"train_loss": -36.57163619995117, "global_step": 64766, "epoch": 535} {"train_loss": -37.339542388916016, "global_step": 64767, "epoch": 535} {"train_loss": -37.484920501708984, "global_step": 64768, "epoch": 535} {"train_loss": -36.98273468017578, "global_step": 64769, "epoch": 535} {"train_loss": -36.601539611816406, "global_step": 64770, "epoch": 535} {"train_loss": -36.33243942260742, "global_step": 64771, "epoch": 535} {"train_loss": -37.55923080444336, "global_step": 64772, "epoch": 535} {"train_loss": -37.0002326965332, "global_step": 64773, "epoch": 535} {"train_loss": -35.70184326171875, "global_step": 64774, "epoch": 535} {"train_loss": -36.54458999633789, "global_step": 64775, "epoch": 535} {"train_loss": -37.348655700683594, "global_step": 64776, "epoch": 535} {"train_loss": -37.141292572021484, "global_step": 64777, "epoch": 535} {"train_loss": -35.959896087646484, "global_step": 64778, "epoch": 535} {"train_loss": -36.33269119262695, "global_step": 64779, "epoch": 535} {"train_loss": -37.3738899230957, "global_step": 64780, "epoch": 535} {"train_loss": -37.27545166015625, "global_step": 64781, "epoch": 535} {"train_loss": -36.07088851928711, "global_step": 64782, "epoch": 535} {"train_loss": -35.9066162109375, "global_step": 64783, "epoch": 535} {"train_loss": -37.361446380615234, "global_step": 64784, "epoch": 535} {"train_loss": -36.947811126708984, "global_step": 64785, "epoch": 535} {"train_loss": -36.74958038330078, "global_step": 64786, "epoch": 535} {"train_loss": -37.91756820678711, "global_step": 64787, "epoch": 535} {"train_loss": -37.653411865234375, "global_step": 64788, "epoch": 535} {"train_loss": -36.30015182495117, "global_step": 64789, "epoch": 535} {"train_loss": -34.459529876708984, "global_step": 64790, "epoch": 535} {"train_loss": -31.938953399658203, "global_step": 64791, "epoch": 535} {"train_loss": -31.311803817749023, "global_step": 64792, "epoch": 535} {"train_loss": -35.969215393066406, "global_step": 64793, "epoch": 535} {"train_loss": -35.53156661987305, "global_step": 64794, "epoch": 535} {"train_loss": -34.81039047241211, "global_step": 64795, "epoch": 535} {"train_loss": -35.625701904296875, "global_step": 64796, "epoch": 535} {"train_loss": -35.411865234375, "global_step": 64797, "epoch": 535} {"train_loss": -37.05857849121094, "global_step": 64798, "epoch": 535} {"train_loss": -34.088253021240234, "global_step": 64799, "epoch": 535} {"train_loss": -36.55741500854492, "global_step": 64800, "epoch": 535} {"train_loss": -35.777557373046875, "global_step": 64801, "epoch": 535} {"train_loss": -34.89384078979492, "global_step": 64802, "epoch": 535} {"train_loss": -35.33502197265625, "global_step": 64803, "epoch": 535} {"train_loss": -36.42316818237305, "global_step": 64804, "epoch": 535} {"train_loss": -35.00429153442383, "global_step": 64805, "epoch": 535} {"train_loss": -35.72107696533203, "global_step": 64806, "epoch": 535} {"train_loss": -36.21247863769531, "global_step": 64807, "epoch": 535} {"train_loss": -34.862030029296875, "global_step": 64808, "epoch": 535} {"train_loss": -36.35807800292969, "global_step": 64809, "epoch": 535} {"train_loss": -35.68599319458008, "global_step": 64810, "epoch": 535} {"train_loss": -35.56832504272461, "global_step": 64811, "epoch": 535} {"train_loss": -37.062496185302734, "global_step": 64812, "epoch": 535} {"train_loss": -35.396331787109375, "global_step": 64813, "epoch": 535} {"train_loss": -36.84408187866211, "global_step": 64814, "epoch": 535} {"train_loss": -34.5211181640625, "global_step": 64815, "epoch": 535} {"train_loss": -35.86176300048828, "global_step": 64816, "epoch": 535} {"train_loss": -36.544281005859375, "global_step": 64817, "epoch": 535} {"train_loss": -35.75230026245117, "global_step": 64818, "epoch": 535} {"train_loss": -36.4921989440918, "global_step": 64819, "epoch": 535} {"train_loss": -35.694091796875, "global_step": 64820, "epoch": 535} {"train_loss": -36.45920944213867, "global_step": 64821, "epoch": 535} {"train_loss": -35.51213455200195, "global_step": 64822, "epoch": 535} {"train_loss": -36.582454681396484, "global_step": 64823, "epoch": 535} {"train_loss": -36.20253372192383, "global_step": 64824, "epoch": 535} {"train_loss": -36.133140563964844, "global_step": 64825, "epoch": 535} {"train_loss": -36.887813568115234, "global_step": 64826, "epoch": 535} {"train_loss": -36.55322265625, "global_step": 64827, "epoch": 535} {"train_loss": -36.342098236083984, "global_step": 64828, "epoch": 535} {"train_loss": -36.16730499267578, "global_step": 64829, "epoch": 535} {"train_loss": -36.40937423706055, "global_step": 64830, "epoch": 535} {"train_loss": -37.121891021728516, "global_step": 64831, "epoch": 535} {"train_loss": -36.3763427734375, "global_step": 64832, "epoch": 535} {"train_loss": -36.44240951538086, "global_step": 64833, "epoch": 535} {"train_loss": -36.712196350097656, "global_step": 64834, "epoch": 535} {"train_loss": -37.11211013793945, "global_step": 64835, "epoch": 535} {"train_loss": -36.92208480834961, "global_step": 64836, "epoch": 535} {"train_loss": -36.87526321411133, "global_step": 64837, "epoch": 535} {"train_loss": -37.42183303833008, "global_step": 64838, "epoch": 535} {"train_loss": -36.398868560791016, "global_step": 64839, "epoch": 535} {"train_loss": -37.304805755615234, "global_step": 64840, "epoch": 535} {"train_loss": -37.14657211303711, "global_step": 64841, "epoch": 535} {"train_loss": -36.60807418823242, "global_step": 64842, "epoch": 535} {"train_loss": -36.98116683959961, "global_step": 64843, "epoch": 535} {"train_loss": -36.79035568237305, "global_step": 64844, "epoch": 535} {"train_loss": -37.2546501159668, "global_step": 64845, "epoch": 535} {"train_loss": -36.53438949584961, "global_step": 64846, "epoch": 535} {"train_loss": -36.6142463684082, "global_step": 64847, "epoch": 535} {"train_loss": -37.19857406616211, "global_step": 64848, "epoch": 535} {"train_loss": -36.3851432800293, "global_step": 64849, "epoch": 535} {"train_loss": -37.25566101074219, "global_step": 64850, "epoch": 535} {"train_loss": -36.592594146728516, "global_step": 64851, "epoch": 535} {"train_loss": -35.96603012084961, "global_step": 64852, "epoch": 535} {"train_loss": -37.47406005859375, "global_step": 64853, "epoch": 535} {"train_loss": -36.04612731933594, "global_step": 64854, "epoch": 535} {"train_loss": -36.49508438425616, "global_step": 64855, "epoch": 535, "val_loss": 2479595.75} {"train_loss": -37.17683029174805, "global_step": 64856, "epoch": 536} {"train_loss": -37.09585189819336, "global_step": 64857, "epoch": 536} {"train_loss": -36.435508728027344, "global_step": 64858, "epoch": 536} {"train_loss": -37.71857833862305, "global_step": 64859, "epoch": 536} {"train_loss": -36.656734466552734, "global_step": 64860, "epoch": 536} {"train_loss": -37.210391998291016, "global_step": 64861, "epoch": 536} {"train_loss": -36.49334716796875, "global_step": 64862, "epoch": 536} {"train_loss": -37.70578384399414, "global_step": 64863, "epoch": 536} {"train_loss": -36.983795166015625, "global_step": 64864, "epoch": 536} {"train_loss": -37.15192413330078, "global_step": 64865, "epoch": 536} {"train_loss": -37.67765426635742, "global_step": 64866, "epoch": 536} {"train_loss": -36.72698974609375, "global_step": 64867, "epoch": 536} {"train_loss": -37.8589973449707, "global_step": 64868, "epoch": 536} {"train_loss": -36.97194290161133, "global_step": 64869, "epoch": 536} {"train_loss": -36.949256896972656, "global_step": 64870, "epoch": 536} {"train_loss": -37.41635513305664, "global_step": 64871, "epoch": 536} {"train_loss": -37.84568405151367, "global_step": 64872, "epoch": 536} {"train_loss": -37.151668548583984, "global_step": 64873, "epoch": 536} {"train_loss": -36.9625129699707, "global_step": 64874, "epoch": 536} {"train_loss": -37.199119567871094, "global_step": 64875, "epoch": 536} {"train_loss": -37.18040084838867, "global_step": 64876, "epoch": 536} {"train_loss": -36.41543197631836, "global_step": 64877, "epoch": 536} {"train_loss": -34.82558822631836, "global_step": 64878, "epoch": 536} {"train_loss": -30.926761627197266, "global_step": 64879, "epoch": 536} {"train_loss": -36.79082107543945, "global_step": 64880, "epoch": 536} {"train_loss": -27.45654296875, "global_step": 64881, "epoch": 536} {"train_loss": 8.238175392150879, "global_step": 64882, "epoch": 536} {"train_loss": 21.405048370361328, "global_step": 64883, "epoch": 536} {"train_loss": 64.5937728881836, "global_step": 64884, "epoch": 536} {"train_loss": 42.806209564208984, "global_step": 64885, "epoch": 536} {"train_loss": 51.50387191772461, "global_step": 64886, "epoch": 536} {"train_loss": -22.80521011352539, "global_step": 64887, "epoch": 536} {"train_loss": 5.226319789886475, "global_step": 64888, "epoch": 536} {"train_loss": 14.219449043273926, "global_step": 64889, "epoch": 536} {"train_loss": -11.493212699890137, "global_step": 64890, "epoch": 536} {"train_loss": -20.124164581298828, "global_step": 64891, "epoch": 536} {"train_loss": -17.548368453979492, "global_step": 64892, "epoch": 536} {"train_loss": -17.76875877380371, "global_step": 64893, "epoch": 536} {"train_loss": -13.462666511535645, "global_step": 64894, "epoch": 536} {"train_loss": -16.580286026000977, "global_step": 64895, "epoch": 536} {"train_loss": -21.72303581237793, "global_step": 64896, "epoch": 536} {"train_loss": -23.73296546936035, "global_step": 64897, "epoch": 536} {"train_loss": -24.268049240112305, "global_step": 64898, "epoch": 536} {"train_loss": -24.19171142578125, "global_step": 64899, "epoch": 536} {"train_loss": -24.775943756103516, "global_step": 64900, "epoch": 536} {"train_loss": -24.861392974853516, "global_step": 64901, "epoch": 536} {"train_loss": -24.958274841308594, "global_step": 64902, "epoch": 536} {"train_loss": -25.23933219909668, "global_step": 64903, "epoch": 536} {"train_loss": -24.921388626098633, "global_step": 64904, "epoch": 536} {"train_loss": -26.009342193603516, "global_step": 64905, "epoch": 536} {"train_loss": -26.198652267456055, "global_step": 64906, "epoch": 536} {"train_loss": -26.752744674682617, "global_step": 64907, "epoch": 536} {"train_loss": -27.358057022094727, "global_step": 64908, "epoch": 536} {"train_loss": -27.489110946655273, "global_step": 64909, "epoch": 536} {"train_loss": -27.343435287475586, "global_step": 64910, "epoch": 536} {"train_loss": -26.999515533447266, "global_step": 64911, "epoch": 536} {"train_loss": -27.762441635131836, "global_step": 64912, "epoch": 536} {"train_loss": -28.070722579956055, "global_step": 64913, "epoch": 536} {"train_loss": -28.01043701171875, "global_step": 64914, "epoch": 536} {"train_loss": -28.658246994018555, "global_step": 64915, "epoch": 536} {"train_loss": -28.94794273376465, "global_step": 64916, "epoch": 536} {"train_loss": -29.22266960144043, "global_step": 64917, "epoch": 536} {"train_loss": -29.616132736206055, "global_step": 64918, "epoch": 536} {"train_loss": -30.019916534423828, "global_step": 64919, "epoch": 536} {"train_loss": -29.588851928710938, "global_step": 64920, "epoch": 536} {"train_loss": -30.016559600830078, "global_step": 64921, "epoch": 536} {"train_loss": -30.353910446166992, "global_step": 64922, "epoch": 536} {"train_loss": -29.906824111938477, "global_step": 64923, "epoch": 536} {"train_loss": -30.01374626159668, "global_step": 64924, "epoch": 536} {"train_loss": -28.767324447631836, "global_step": 64925, "epoch": 536} {"train_loss": -25.545347213745117, "global_step": 64926, "epoch": 536} {"train_loss": -28.679410934448242, "global_step": 64927, "epoch": 536} {"train_loss": -30.36945152282715, "global_step": 64928, "epoch": 536} {"train_loss": -29.237207412719727, "global_step": 64929, "epoch": 536} {"train_loss": -30.70600700378418, "global_step": 64930, "epoch": 536} {"train_loss": -29.7325382232666, "global_step": 64931, "epoch": 536} {"train_loss": -30.00543785095215, "global_step": 64932, "epoch": 536} {"train_loss": -31.07769203186035, "global_step": 64933, "epoch": 536} {"train_loss": -30.245084762573242, "global_step": 64934, "epoch": 536} {"train_loss": -32.04048538208008, "global_step": 64935, "epoch": 536} {"train_loss": -31.516138076782227, "global_step": 64936, "epoch": 536} {"train_loss": -30.993885040283203, "global_step": 64937, "epoch": 536} {"train_loss": -31.582366943359375, "global_step": 64938, "epoch": 536} {"train_loss": -31.499921798706055, "global_step": 64939, "epoch": 536} {"train_loss": -29.82940673828125, "global_step": 64940, "epoch": 536} {"train_loss": -29.589599609375, "global_step": 64941, "epoch": 536} {"train_loss": -31.740234375, "global_step": 64942, "epoch": 536} {"train_loss": -30.663694381713867, "global_step": 64943, "epoch": 536} {"train_loss": -31.700000762939453, "global_step": 64944, "epoch": 536} {"train_loss": -31.882801055908203, "global_step": 64945, "epoch": 536} {"train_loss": -31.943378448486328, "global_step": 64946, "epoch": 536} {"train_loss": -31.92390251159668, "global_step": 64947, "epoch": 536} {"train_loss": -31.58905029296875, "global_step": 64948, "epoch": 536} {"train_loss": -30.947967529296875, "global_step": 64949, "epoch": 536} {"train_loss": -31.08916664123535, "global_step": 64950, "epoch": 536} {"train_loss": -31.988744735717773, "global_step": 64951, "epoch": 536} {"train_loss": -31.681659698486328, "global_step": 64952, "epoch": 536} {"train_loss": -31.2039852142334, "global_step": 64953, "epoch": 536} {"train_loss": -32.68276596069336, "global_step": 64954, "epoch": 536} {"train_loss": -32.03020095825195, "global_step": 64955, "epoch": 536} {"train_loss": -31.91364097595215, "global_step": 64956, "epoch": 536} {"train_loss": -32.39496612548828, "global_step": 64957, "epoch": 536} {"train_loss": -32.35268783569336, "global_step": 64958, "epoch": 536} {"train_loss": -32.592864990234375, "global_step": 64959, "epoch": 536} {"train_loss": -33.22140884399414, "global_step": 64960, "epoch": 536} {"train_loss": -32.59739303588867, "global_step": 64961, "epoch": 536} {"train_loss": -33.04096603393555, "global_step": 64962, "epoch": 536} {"train_loss": -33.00379180908203, "global_step": 64963, "epoch": 536} {"train_loss": -33.02067947387695, "global_step": 64964, "epoch": 536} {"train_loss": -32.40796661376953, "global_step": 64965, "epoch": 536} {"train_loss": -29.7280216217041, "global_step": 64966, "epoch": 536} {"train_loss": -20.125396728515625, "global_step": 64967, "epoch": 536} {"train_loss": -25.086944580078125, "global_step": 64968, "epoch": 536} {"train_loss": -32.52983093261719, "global_step": 64969, "epoch": 536} {"train_loss": -28.19748306274414, "global_step": 64970, "epoch": 536} {"train_loss": -31.840356826782227, "global_step": 64971, "epoch": 536} {"train_loss": -30.445236206054688, "global_step": 64972, "epoch": 536} {"train_loss": -30.101301193237305, "global_step": 64973, "epoch": 536} {"train_loss": -33.008907318115234, "global_step": 64974, "epoch": 536} {"train_loss": -29.450769424438477, "global_step": 64975, "epoch": 536} {"train_loss": -26.854189064877094, "global_step": 64976, "epoch": 536, "val_loss": 2470360.0} {"train_loss": -31.782196044921875, "global_step": 64977, "epoch": 537} {"train_loss": -30.709558486938477, "global_step": 64978, "epoch": 537} {"train_loss": -32.05021286010742, "global_step": 64979, "epoch": 537} {"train_loss": -32.752384185791016, "global_step": 64980, "epoch": 537} {"train_loss": -32.07985305786133, "global_step": 64981, "epoch": 537} {"train_loss": -32.41547393798828, "global_step": 64982, "epoch": 537} {"train_loss": -32.760772705078125, "global_step": 64983, "epoch": 537} {"train_loss": -33.0362434387207, "global_step": 64984, "epoch": 537} {"train_loss": -32.151668548583984, "global_step": 64985, "epoch": 537} {"train_loss": -31.68316078186035, "global_step": 64986, "epoch": 537} {"train_loss": -33.18282699584961, "global_step": 64987, "epoch": 537} {"train_loss": -32.145751953125, "global_step": 64988, "epoch": 537} {"train_loss": -33.0994987487793, "global_step": 64989, "epoch": 537} {"train_loss": -32.10343933105469, "global_step": 64990, "epoch": 537} {"train_loss": -33.16236877441406, "global_step": 64991, "epoch": 537} {"train_loss": -33.28435134887695, "global_step": 64992, "epoch": 537} {"train_loss": -33.0726203918457, "global_step": 64993, "epoch": 537} {"train_loss": -33.591896057128906, "global_step": 64994, "epoch": 537} {"train_loss": -33.06282043457031, "global_step": 64995, "epoch": 537} {"train_loss": -30.727741241455078, "global_step": 64996, "epoch": 537} {"train_loss": -24.933944702148438, "global_step": 64997, "epoch": 537} {"train_loss": -23.70265769958496, "global_step": 64998, "epoch": 537} {"train_loss": -31.430822372436523, "global_step": 64999, "epoch": 537} {"train_loss": -28.4813175201416, "global_step": 65000, "epoch": 537} {"train_loss": -30.81791114807129, "global_step": 65001, "epoch": 537} {"train_loss": -29.77682876586914, "global_step": 65002, "epoch": 537} {"train_loss": -32.61252212524414, "global_step": 65003, "epoch": 537} {"train_loss": -28.941370010375977, "global_step": 65004, "epoch": 537} {"train_loss": -32.4683723449707, "global_step": 65005, "epoch": 537} {"train_loss": -30.591461181640625, "global_step": 65006, "epoch": 537} {"train_loss": -31.71706199645996, "global_step": 65007, "epoch": 537} {"train_loss": -32.32636642456055, "global_step": 65008, "epoch": 537} {"train_loss": -31.41254997253418, "global_step": 65009, "epoch": 537} {"train_loss": -31.863605499267578, "global_step": 65010, "epoch": 537} {"train_loss": -32.96879959106445, "global_step": 65011, "epoch": 537} {"train_loss": -32.54355239868164, "global_step": 65012, "epoch": 537} {"train_loss": -31.930112838745117, "global_step": 65013, "epoch": 537} {"train_loss": -32.67672348022461, "global_step": 65014, "epoch": 537} {"train_loss": -32.80340576171875, "global_step": 65015, "epoch": 537} {"train_loss": -32.414791107177734, "global_step": 65016, "epoch": 537} {"train_loss": -32.9212760925293, "global_step": 65017, "epoch": 537} {"train_loss": -32.839656829833984, "global_step": 65018, "epoch": 537} {"train_loss": -32.7243766784668, "global_step": 65019, "epoch": 537} {"train_loss": -32.96303176879883, "global_step": 65020, "epoch": 537} {"train_loss": -33.0916633605957, "global_step": 65021, "epoch": 537} {"train_loss": -32.82597732543945, "global_step": 65022, "epoch": 537} {"train_loss": -32.57062530517578, "global_step": 65023, "epoch": 537} {"train_loss": -32.246761322021484, "global_step": 65024, "epoch": 537} {"train_loss": -32.15131759643555, "global_step": 65025, "epoch": 537} {"train_loss": -32.15973663330078, "global_step": 65026, "epoch": 537} {"train_loss": -33.50665283203125, "global_step": 65027, "epoch": 537} {"train_loss": -33.07841491699219, "global_step": 65028, "epoch": 537} {"train_loss": -32.680904388427734, "global_step": 65029, "epoch": 537} {"train_loss": -32.58130645751953, "global_step": 65030, "epoch": 537} {"train_loss": -33.91086959838867, "global_step": 65031, "epoch": 537} {"train_loss": -32.512123107910156, "global_step": 65032, "epoch": 537} {"train_loss": -32.73345947265625, "global_step": 65033, "epoch": 537} {"train_loss": -33.96615219116211, "global_step": 65034, "epoch": 537} {"train_loss": -32.578392028808594, "global_step": 65035, "epoch": 537} {"train_loss": -33.64162826538086, "global_step": 65036, "epoch": 537} {"train_loss": -32.79651641845703, "global_step": 65037, "epoch": 537} {"train_loss": -33.1159782409668, "global_step": 65038, "epoch": 537} {"train_loss": -33.07963180541992, "global_step": 65039, "epoch": 537} {"train_loss": -32.88682174682617, "global_step": 65040, "epoch": 537} {"train_loss": -32.82086944580078, "global_step": 65041, "epoch": 537} {"train_loss": -32.39742660522461, "global_step": 65042, "epoch": 537} {"train_loss": -33.097286224365234, "global_step": 65043, "epoch": 537} {"train_loss": -33.38786697387695, "global_step": 65044, "epoch": 537} {"train_loss": -33.6638069152832, "global_step": 65045, "epoch": 537} {"train_loss": -33.5467643737793, "global_step": 65046, "epoch": 537} {"train_loss": -33.37549591064453, "global_step": 65047, "epoch": 537} {"train_loss": -33.95979690551758, "global_step": 65048, "epoch": 537} {"train_loss": -33.35260009765625, "global_step": 65049, "epoch": 537} {"train_loss": -33.19623947143555, "global_step": 65050, "epoch": 537} {"train_loss": -33.922664642333984, "global_step": 65051, "epoch": 537} {"train_loss": -33.649009704589844, "global_step": 65052, "epoch": 537} {"train_loss": -33.658538818359375, "global_step": 65053, "epoch": 537} {"train_loss": -33.926124572753906, "global_step": 65054, "epoch": 537} {"train_loss": -33.37331771850586, "global_step": 65055, "epoch": 537} {"train_loss": -33.317134857177734, "global_step": 65056, "epoch": 537} {"train_loss": -33.7100944519043, "global_step": 65057, "epoch": 537} {"train_loss": -33.64826583862305, "global_step": 65058, "epoch": 537} {"train_loss": -34.24951934814453, "global_step": 65059, "epoch": 537} {"train_loss": -33.722442626953125, "global_step": 65060, "epoch": 537} {"train_loss": -33.94184112548828, "global_step": 65061, "epoch": 537} {"train_loss": -33.838680267333984, "global_step": 65062, "epoch": 537} {"train_loss": -33.95659637451172, "global_step": 65063, "epoch": 537} {"train_loss": -33.934181213378906, "global_step": 65064, "epoch": 537} {"train_loss": -33.7086296081543, "global_step": 65065, "epoch": 537} {"train_loss": -33.81449508666992, "global_step": 65066, "epoch": 537} {"train_loss": -33.77946472167969, "global_step": 65067, "epoch": 537} {"train_loss": -33.99801254272461, "global_step": 65068, "epoch": 537} {"train_loss": -34.0216064453125, "global_step": 65069, "epoch": 537} {"train_loss": -33.878414154052734, "global_step": 65070, "epoch": 537} {"train_loss": -33.5776481628418, "global_step": 65071, "epoch": 537} {"train_loss": -34.5198860168457, "global_step": 65072, "epoch": 537} {"train_loss": -33.64419174194336, "global_step": 65073, "epoch": 537} {"train_loss": -33.76105499267578, "global_step": 65074, "epoch": 537} {"train_loss": -34.50667953491211, "global_step": 65075, "epoch": 537} {"train_loss": -33.3653678894043, "global_step": 65076, "epoch": 537} {"train_loss": -34.032958984375, "global_step": 65077, "epoch": 537} {"train_loss": -33.95501708984375, "global_step": 65078, "epoch": 537} {"train_loss": -32.73981475830078, "global_step": 65079, "epoch": 537} {"train_loss": -32.935062408447266, "global_step": 65080, "epoch": 537} {"train_loss": -33.67694854736328, "global_step": 65081, "epoch": 537} {"train_loss": -31.969562530517578, "global_step": 65082, "epoch": 537} {"train_loss": -33.953975677490234, "global_step": 65083, "epoch": 537} {"train_loss": -33.544952392578125, "global_step": 65084, "epoch": 537} {"train_loss": -33.8933219909668, "global_step": 65085, "epoch": 537} {"train_loss": -33.82358932495117, "global_step": 65086, "epoch": 537} {"train_loss": -34.04183578491211, "global_step": 65087, "epoch": 537} {"train_loss": -34.08143997192383, "global_step": 65088, "epoch": 537} {"train_loss": -33.900665283203125, "global_step": 65089, "epoch": 537} {"train_loss": -34.37869644165039, "global_step": 65090, "epoch": 537} {"train_loss": -34.788150787353516, "global_step": 65091, "epoch": 537} {"train_loss": -34.08883285522461, "global_step": 65092, "epoch": 537} {"train_loss": -33.71112823486328, "global_step": 65093, "epoch": 537} {"train_loss": -33.84609603881836, "global_step": 65094, "epoch": 537} {"train_loss": -34.53076934814453, "global_step": 65095, "epoch": 537} {"train_loss": -34.319435119628906, "global_step": 65096, "epoch": 537} {"train_loss": -32.8714647529539, "global_step": 65097, "epoch": 537, "val_loss": 2558070.75} {"train_loss": -34.80393981933594, "global_step": 65098, "epoch": 538} {"train_loss": -34.39933395385742, "global_step": 65099, "epoch": 538} {"train_loss": -34.7071533203125, "global_step": 65100, "epoch": 538} {"train_loss": -34.75115966796875, "global_step": 65101, "epoch": 538} {"train_loss": -34.787391662597656, "global_step": 65102, "epoch": 538} {"train_loss": -34.58114242553711, "global_step": 65103, "epoch": 538} {"train_loss": -33.37006759643555, "global_step": 65104, "epoch": 538} {"train_loss": -31.985809326171875, "global_step": 65105, "epoch": 538} {"train_loss": -31.30804443359375, "global_step": 65106, "epoch": 538} {"train_loss": -33.06887435913086, "global_step": 65107, "epoch": 538} {"train_loss": -34.449241638183594, "global_step": 65108, "epoch": 538} {"train_loss": -33.442989349365234, "global_step": 65109, "epoch": 538} {"train_loss": -33.32269287109375, "global_step": 65110, "epoch": 538} {"train_loss": -34.076351165771484, "global_step": 65111, "epoch": 538} {"train_loss": -34.42702865600586, "global_step": 65112, "epoch": 538} {"train_loss": -33.90491485595703, "global_step": 65113, "epoch": 538} {"train_loss": -34.749732971191406, "global_step": 65114, "epoch": 538} {"train_loss": -33.18342590332031, "global_step": 65115, "epoch": 538} {"train_loss": -34.43938064575195, "global_step": 65116, "epoch": 538} {"train_loss": -34.05070877075195, "global_step": 65117, "epoch": 538} {"train_loss": -34.173248291015625, "global_step": 65118, "epoch": 538} {"train_loss": -33.79824447631836, "global_step": 65119, "epoch": 538} {"train_loss": -33.55909729003906, "global_step": 65120, "epoch": 538} {"train_loss": -34.043174743652344, "global_step": 65121, "epoch": 538} {"train_loss": -33.684112548828125, "global_step": 65122, "epoch": 538} {"train_loss": -29.782583236694336, "global_step": 65123, "epoch": 538} {"train_loss": -34.310611724853516, "global_step": 65124, "epoch": 538} {"train_loss": -30.53326416015625, "global_step": 65125, "epoch": 538} {"train_loss": -33.57754135131836, "global_step": 65126, "epoch": 538} {"train_loss": -31.277135848999023, "global_step": 65127, "epoch": 538} {"train_loss": -26.518497467041016, "global_step": 65128, "epoch": 538} {"train_loss": -32.30259323120117, "global_step": 65129, "epoch": 538} {"train_loss": -27.110889434814453, "global_step": 65130, "epoch": 538} {"train_loss": -30.669599533081055, "global_step": 65131, "epoch": 538} {"train_loss": -31.737186431884766, "global_step": 65132, "epoch": 538} {"train_loss": -32.38667678833008, "global_step": 65133, "epoch": 538} {"train_loss": -27.335416793823242, "global_step": 65134, "epoch": 538} {"train_loss": -30.871688842773438, "global_step": 65135, "epoch": 538} {"train_loss": -31.74629020690918, "global_step": 65136, "epoch": 538} {"train_loss": -29.909347534179688, "global_step": 65137, "epoch": 538} {"train_loss": -31.408950805664062, "global_step": 65138, "epoch": 538} {"train_loss": -32.74552536010742, "global_step": 65139, "epoch": 538} {"train_loss": -30.422861099243164, "global_step": 65140, "epoch": 538} {"train_loss": -31.04938316345215, "global_step": 65141, "epoch": 538} {"train_loss": -30.594446182250977, "global_step": 65142, "epoch": 538} {"train_loss": -30.837726593017578, "global_step": 65143, "epoch": 538} {"train_loss": -31.85489273071289, "global_step": 65144, "epoch": 538} {"train_loss": -32.81099319458008, "global_step": 65145, "epoch": 538} {"train_loss": -31.487455368041992, "global_step": 65146, "epoch": 538} {"train_loss": -32.53336715698242, "global_step": 65147, "epoch": 538} {"train_loss": -31.55338478088379, "global_step": 65148, "epoch": 538} {"train_loss": -31.925281524658203, "global_step": 65149, "epoch": 538} {"train_loss": -32.56884765625, "global_step": 65150, "epoch": 538} {"train_loss": -32.16335678100586, "global_step": 65151, "epoch": 538} {"train_loss": -32.64929962158203, "global_step": 65152, "epoch": 538} {"train_loss": -31.776952743530273, "global_step": 65153, "epoch": 538} {"train_loss": -33.110321044921875, "global_step": 65154, "epoch": 538} {"train_loss": -33.287147521972656, "global_step": 65155, "epoch": 538} {"train_loss": -31.92535972595215, "global_step": 65156, "epoch": 538} {"train_loss": -32.816471099853516, "global_step": 65157, "epoch": 538} {"train_loss": -33.206111907958984, "global_step": 65158, "epoch": 538} {"train_loss": -32.80811309814453, "global_step": 65159, "epoch": 538} {"train_loss": -32.725154876708984, "global_step": 65160, "epoch": 538} {"train_loss": -32.2712516784668, "global_step": 65161, "epoch": 538} {"train_loss": -33.4432373046875, "global_step": 65162, "epoch": 538} {"train_loss": -33.61430740356445, "global_step": 65163, "epoch": 538} {"train_loss": -33.308448791503906, "global_step": 65164, "epoch": 538} {"train_loss": -33.345863342285156, "global_step": 65165, "epoch": 538} {"train_loss": -33.253963470458984, "global_step": 65166, "epoch": 538} {"train_loss": -33.5292854309082, "global_step": 65167, "epoch": 538} {"train_loss": -33.84312057495117, "global_step": 65168, "epoch": 538} {"train_loss": -33.488746643066406, "global_step": 65169, "epoch": 538} {"train_loss": -33.57072067260742, "global_step": 65170, "epoch": 538} {"train_loss": -34.266998291015625, "global_step": 65171, "epoch": 538} {"train_loss": -33.725093841552734, "global_step": 65172, "epoch": 538} {"train_loss": -34.04728317260742, "global_step": 65173, "epoch": 538} {"train_loss": -33.92157745361328, "global_step": 65174, "epoch": 538} {"train_loss": -33.88411331176758, "global_step": 65175, "epoch": 538} {"train_loss": -33.83683395385742, "global_step": 65176, "epoch": 538} {"train_loss": -33.65165328979492, "global_step": 65177, "epoch": 538} {"train_loss": -33.31049728393555, "global_step": 65178, "epoch": 538} {"train_loss": -33.54507064819336, "global_step": 65179, "epoch": 538} {"train_loss": -33.07173156738281, "global_step": 65180, "epoch": 538} {"train_loss": -32.886985778808594, "global_step": 65181, "epoch": 538} {"train_loss": -32.56142044067383, "global_step": 65182, "epoch": 538} {"train_loss": -31.916446685791016, "global_step": 65183, "epoch": 538} {"train_loss": -33.30366134643555, "global_step": 65184, "epoch": 538} {"train_loss": -33.88566970825195, "global_step": 65185, "epoch": 538} {"train_loss": -33.20859909057617, "global_step": 65186, "epoch": 538} {"train_loss": -32.625423431396484, "global_step": 65187, "epoch": 538} {"train_loss": -33.68267822265625, "global_step": 65188, "epoch": 538} {"train_loss": -34.22931671142578, "global_step": 65189, "epoch": 538} {"train_loss": -33.752498626708984, "global_step": 65190, "epoch": 538} {"train_loss": -33.775203704833984, "global_step": 65191, "epoch": 538} {"train_loss": -33.74534606933594, "global_step": 65192, "epoch": 538} {"train_loss": -33.27029037475586, "global_step": 65193, "epoch": 538} {"train_loss": -34.092166900634766, "global_step": 65194, "epoch": 538} {"train_loss": -33.975677490234375, "global_step": 65195, "epoch": 538} {"train_loss": -33.95158386230469, "global_step": 65196, "epoch": 538} {"train_loss": -34.625, "global_step": 65197, "epoch": 538} {"train_loss": -33.4812126159668, "global_step": 65198, "epoch": 538} {"train_loss": -34.44671630859375, "global_step": 65199, "epoch": 538} {"train_loss": -32.53125762939453, "global_step": 65200, "epoch": 538} {"train_loss": -33.30640411376953, "global_step": 65201, "epoch": 538} {"train_loss": -31.57769203186035, "global_step": 65202, "epoch": 538} {"train_loss": -34.36083221435547, "global_step": 65203, "epoch": 538} {"train_loss": -32.063533782958984, "global_step": 65204, "epoch": 538} {"train_loss": -33.83137893676758, "global_step": 65205, "epoch": 538} {"train_loss": -33.091064453125, "global_step": 65206, "epoch": 538} {"train_loss": -34.26203536987305, "global_step": 65207, "epoch": 538} {"train_loss": -34.30813217163086, "global_step": 65208, "epoch": 538} {"train_loss": -33.8996696472168, "global_step": 65209, "epoch": 538} {"train_loss": -34.699378967285156, "global_step": 65210, "epoch": 538} {"train_loss": -34.027976989746094, "global_step": 65211, "epoch": 538} {"train_loss": -34.195213317871094, "global_step": 65212, "epoch": 538} {"train_loss": -34.10561752319336, "global_step": 65213, "epoch": 538} {"train_loss": -34.54669189453125, "global_step": 65214, "epoch": 538} {"train_loss": -34.87871170043945, "global_step": 65215, "epoch": 538} {"train_loss": -34.4093017578125, "global_step": 65216, "epoch": 538} {"train_loss": -35.02716827392578, "global_step": 65217, "epoch": 538} {"train_loss": -33.03943118576176, "global_step": 65218, "epoch": 538, "val_loss": 2520897.25} {"train_loss": -34.48092269897461, "global_step": 65219, "epoch": 539} {"train_loss": -34.84309005737305, "global_step": 65220, "epoch": 539} {"train_loss": -34.78936767578125, "global_step": 65221, "epoch": 539} {"train_loss": -35.044166564941406, "global_step": 65222, "epoch": 539} {"train_loss": -34.54977035522461, "global_step": 65223, "epoch": 539} {"train_loss": -35.072471618652344, "global_step": 65224, "epoch": 539} {"train_loss": -35.45867919921875, "global_step": 65225, "epoch": 539} {"train_loss": -34.982933044433594, "global_step": 65226, "epoch": 539} {"train_loss": -34.9990348815918, "global_step": 65227, "epoch": 539} {"train_loss": -35.28418731689453, "global_step": 65228, "epoch": 539} {"train_loss": -34.96358108520508, "global_step": 65229, "epoch": 539} {"train_loss": -34.81343460083008, "global_step": 65230, "epoch": 539} {"train_loss": -34.8912467956543, "global_step": 65231, "epoch": 539} {"train_loss": -34.509918212890625, "global_step": 65232, "epoch": 539} {"train_loss": -33.51567840576172, "global_step": 65233, "epoch": 539} {"train_loss": -34.40999221801758, "global_step": 65234, "epoch": 539} {"train_loss": -35.01851272583008, "global_step": 65235, "epoch": 539} {"train_loss": -33.6006965637207, "global_step": 65236, "epoch": 539} {"train_loss": -31.940977096557617, "global_step": 65237, "epoch": 539} {"train_loss": -31.500791549682617, "global_step": 65238, "epoch": 539} {"train_loss": -34.734188079833984, "global_step": 65239, "epoch": 539} {"train_loss": -32.04362106323242, "global_step": 65240, "epoch": 539} {"train_loss": -30.78445816040039, "global_step": 65241, "epoch": 539} {"train_loss": -31.733922958374023, "global_step": 65242, "epoch": 539} {"train_loss": -32.18729782104492, "global_step": 65243, "epoch": 539} {"train_loss": -31.853559494018555, "global_step": 65244, "epoch": 539} {"train_loss": -25.882165908813477, "global_step": 65245, "epoch": 539} {"train_loss": -30.2275447845459, "global_step": 65246, "epoch": 539} {"train_loss": -30.236957550048828, "global_step": 65247, "epoch": 539} {"train_loss": -32.34716796875, "global_step": 65248, "epoch": 539} {"train_loss": -32.84527587890625, "global_step": 65249, "epoch": 539} {"train_loss": -32.427886962890625, "global_step": 65250, "epoch": 539} {"train_loss": -33.339019775390625, "global_step": 65251, "epoch": 539} {"train_loss": -33.45894241333008, "global_step": 65252, "epoch": 539} {"train_loss": -33.67946243286133, "global_step": 65253, "epoch": 539} {"train_loss": -33.38359069824219, "global_step": 65254, "epoch": 539} {"train_loss": -33.73774337768555, "global_step": 65255, "epoch": 539} {"train_loss": -33.44527816772461, "global_step": 65256, "epoch": 539} {"train_loss": -34.34046173095703, "global_step": 65257, "epoch": 539} {"train_loss": -34.097991943359375, "global_step": 65258, "epoch": 539} {"train_loss": -33.753475189208984, "global_step": 65259, "epoch": 539} {"train_loss": -34.28483200073242, "global_step": 65260, "epoch": 539} {"train_loss": -34.20473861694336, "global_step": 65261, "epoch": 539} {"train_loss": -34.07637023925781, "global_step": 65262, "epoch": 539} {"train_loss": -34.19914245605469, "global_step": 65263, "epoch": 539} {"train_loss": -34.53762435913086, "global_step": 65264, "epoch": 539} {"train_loss": -34.282806396484375, "global_step": 65265, "epoch": 539} {"train_loss": -34.41300582885742, "global_step": 65266, "epoch": 539} {"train_loss": -34.693363189697266, "global_step": 65267, "epoch": 539} {"train_loss": -34.4290657043457, "global_step": 65268, "epoch": 539} {"train_loss": -34.9291877746582, "global_step": 65269, "epoch": 539} {"train_loss": -34.614227294921875, "global_step": 65270, "epoch": 539} {"train_loss": -34.580265045166016, "global_step": 65271, "epoch": 539} {"train_loss": -34.726558685302734, "global_step": 65272, "epoch": 539} {"train_loss": -34.40413284301758, "global_step": 65273, "epoch": 539} {"train_loss": -34.74565505981445, "global_step": 65274, "epoch": 539} {"train_loss": -35.01383972167969, "global_step": 65275, "epoch": 539} {"train_loss": -35.057037353515625, "global_step": 65276, "epoch": 539} {"train_loss": -34.736846923828125, "global_step": 65277, "epoch": 539} {"train_loss": -34.87890625, "global_step": 65278, "epoch": 539} {"train_loss": -35.19026565551758, "global_step": 65279, "epoch": 539} {"train_loss": -35.055389404296875, "global_step": 65280, "epoch": 539} {"train_loss": -35.1256217956543, "global_step": 65281, "epoch": 539} {"train_loss": -34.65970993041992, "global_step": 65282, "epoch": 539} {"train_loss": -35.3247184753418, "global_step": 65283, "epoch": 539} {"train_loss": -35.27875518798828, "global_step": 65284, "epoch": 539} {"train_loss": -35.43867111206055, "global_step": 65285, "epoch": 539} {"train_loss": -35.020263671875, "global_step": 65286, "epoch": 539} {"train_loss": -35.1757926940918, "global_step": 65287, "epoch": 539} {"train_loss": -35.487831115722656, "global_step": 65288, "epoch": 539} {"train_loss": -35.236637115478516, "global_step": 65289, "epoch": 539} {"train_loss": -34.97590255737305, "global_step": 65290, "epoch": 539} {"train_loss": -35.588287353515625, "global_step": 65291, "epoch": 539} {"train_loss": -35.47615432739258, "global_step": 65292, "epoch": 539} {"train_loss": -36.28629684448242, "global_step": 65293, "epoch": 539} {"train_loss": -35.477088928222656, "global_step": 65294, "epoch": 539} {"train_loss": -35.94327926635742, "global_step": 65295, "epoch": 539} {"train_loss": -35.88800048828125, "global_step": 65296, "epoch": 539} {"train_loss": -35.381370544433594, "global_step": 65297, "epoch": 539} {"train_loss": -36.13240051269531, "global_step": 65298, "epoch": 539} {"train_loss": -35.87397384643555, "global_step": 65299, "epoch": 539} {"train_loss": -35.76056671142578, "global_step": 65300, "epoch": 539} {"train_loss": -35.8800048828125, "global_step": 65301, "epoch": 539} {"train_loss": -35.396827697753906, "global_step": 65302, "epoch": 539} {"train_loss": -35.263179779052734, "global_step": 65303, "epoch": 539} {"train_loss": -35.4583625793457, "global_step": 65304, "epoch": 539} {"train_loss": -34.96884536743164, "global_step": 65305, "epoch": 539} {"train_loss": -34.158180236816406, "global_step": 65306, "epoch": 539} {"train_loss": -35.06534194946289, "global_step": 65307, "epoch": 539} {"train_loss": -35.98665237426758, "global_step": 65308, "epoch": 539} {"train_loss": -35.49532699584961, "global_step": 65309, "epoch": 539} {"train_loss": -35.05481719970703, "global_step": 65310, "epoch": 539} {"train_loss": -35.69872283935547, "global_step": 65311, "epoch": 539} {"train_loss": -36.061500549316406, "global_step": 65312, "epoch": 539} {"train_loss": -34.87586212158203, "global_step": 65313, "epoch": 539} {"train_loss": -35.534095764160156, "global_step": 65314, "epoch": 539} {"train_loss": -35.65158462524414, "global_step": 65315, "epoch": 539} {"train_loss": -35.93412399291992, "global_step": 65316, "epoch": 539} {"train_loss": -35.92376708984375, "global_step": 65317, "epoch": 539} {"train_loss": -36.100276947021484, "global_step": 65318, "epoch": 539} {"train_loss": -36.205909729003906, "global_step": 65319, "epoch": 539} {"train_loss": -35.98196029663086, "global_step": 65320, "epoch": 539} {"train_loss": -35.91820526123047, "global_step": 65321, "epoch": 539} {"train_loss": -35.822784423828125, "global_step": 65322, "epoch": 539} {"train_loss": -35.99958038330078, "global_step": 65323, "epoch": 539} {"train_loss": -36.20664596557617, "global_step": 65324, "epoch": 539} {"train_loss": -35.95387649536133, "global_step": 65325, "epoch": 539} {"train_loss": -35.47346878051758, "global_step": 65326, "epoch": 539} {"train_loss": -35.31187057495117, "global_step": 65327, "epoch": 539} {"train_loss": -34.23124694824219, "global_step": 65328, "epoch": 539} {"train_loss": -33.826351165771484, "global_step": 65329, "epoch": 539} {"train_loss": -31.45647621154785, "global_step": 65330, "epoch": 539} {"train_loss": -31.08687400817871, "global_step": 65331, "epoch": 539} {"train_loss": -30.236703872680664, "global_step": 65332, "epoch": 539} {"train_loss": -33.168495178222656, "global_step": 65333, "epoch": 539} {"train_loss": -34.81329345703125, "global_step": 65334, "epoch": 539} {"train_loss": -34.73906326293945, "global_step": 65335, "epoch": 539} {"train_loss": -34.86879348754883, "global_step": 65336, "epoch": 539} {"train_loss": -34.34735107421875, "global_step": 65337, "epoch": 539} {"train_loss": -34.91386032104492, "global_step": 65338, "epoch": 539} {"train_loss": -34.466407854694964, "global_step": 65339, "epoch": 539, "val_loss": 2497874.25} {"train_loss": -35.065162658691406, "global_step": 65340, "epoch": 540} {"train_loss": -35.559383392333984, "global_step": 65341, "epoch": 540} {"train_loss": -35.33734893798828, "global_step": 65342, "epoch": 540} {"train_loss": -35.668670654296875, "global_step": 65343, "epoch": 540} {"train_loss": -35.3370475769043, "global_step": 65344, "epoch": 540} {"train_loss": -35.268775939941406, "global_step": 65345, "epoch": 540} {"train_loss": -34.75968551635742, "global_step": 65346, "epoch": 540} {"train_loss": -34.911624908447266, "global_step": 65347, "epoch": 540} {"train_loss": -34.82181930541992, "global_step": 65348, "epoch": 540} {"train_loss": -35.1656608581543, "global_step": 65349, "epoch": 540} {"train_loss": -34.4292106628418, "global_step": 65350, "epoch": 540} {"train_loss": -34.940799713134766, "global_step": 65351, "epoch": 540} {"train_loss": -35.7676887512207, "global_step": 65352, "epoch": 540} {"train_loss": -34.85039520263672, "global_step": 65353, "epoch": 540} {"train_loss": -34.36118698120117, "global_step": 65354, "epoch": 540} {"train_loss": -35.13361358642578, "global_step": 65355, "epoch": 540} {"train_loss": -35.26838302612305, "global_step": 65356, "epoch": 540} {"train_loss": -35.49616622924805, "global_step": 65357, "epoch": 540} {"train_loss": -35.21259689331055, "global_step": 65358, "epoch": 540} {"train_loss": -34.83207321166992, "global_step": 65359, "epoch": 540} {"train_loss": -34.58700180053711, "global_step": 65360, "epoch": 540} {"train_loss": -34.968505859375, "global_step": 65361, "epoch": 540} {"train_loss": -34.664859771728516, "global_step": 65362, "epoch": 540} {"train_loss": -35.2730712890625, "global_step": 65363, "epoch": 540} {"train_loss": -34.886898040771484, "global_step": 65364, "epoch": 540} {"train_loss": -34.49644088745117, "global_step": 65365, "epoch": 540} {"train_loss": -35.131874084472656, "global_step": 65366, "epoch": 540} {"train_loss": -34.7904167175293, "global_step": 65367, "epoch": 540} {"train_loss": -35.053688049316406, "global_step": 65368, "epoch": 540} {"train_loss": -34.983909606933594, "global_step": 65369, "epoch": 540} {"train_loss": -35.17256164550781, "global_step": 65370, "epoch": 540} {"train_loss": -35.63634490966797, "global_step": 65371, "epoch": 540} {"train_loss": -35.5988655090332, "global_step": 65372, "epoch": 540} {"train_loss": -35.38587188720703, "global_step": 65373, "epoch": 540} {"train_loss": -34.69977569580078, "global_step": 65374, "epoch": 540} {"train_loss": -34.70591354370117, "global_step": 65375, "epoch": 540} {"train_loss": -34.808982849121094, "global_step": 65376, "epoch": 540} {"train_loss": -35.41103744506836, "global_step": 65377, "epoch": 540} {"train_loss": -35.73995590209961, "global_step": 65378, "epoch": 540} {"train_loss": -35.48421859741211, "global_step": 65379, "epoch": 540} {"train_loss": -35.96954345703125, "global_step": 65380, "epoch": 540} {"train_loss": -35.281517028808594, "global_step": 65381, "epoch": 540} {"train_loss": -35.68817901611328, "global_step": 65382, "epoch": 540} {"train_loss": -35.76884078979492, "global_step": 65383, "epoch": 540} {"train_loss": -35.445655822753906, "global_step": 65384, "epoch": 540} {"train_loss": -35.50366973876953, "global_step": 65385, "epoch": 540} {"train_loss": -35.72066879272461, "global_step": 65386, "epoch": 540} {"train_loss": -35.43040084838867, "global_step": 65387, "epoch": 540} {"train_loss": -34.71274948120117, "global_step": 65388, "epoch": 540} {"train_loss": -35.81785202026367, "global_step": 65389, "epoch": 540} {"train_loss": -35.69266128540039, "global_step": 65390, "epoch": 540} {"train_loss": -35.50297927856445, "global_step": 65391, "epoch": 540} {"train_loss": -35.74212646484375, "global_step": 65392, "epoch": 540} {"train_loss": -35.87075424194336, "global_step": 65393, "epoch": 540} {"train_loss": -36.06098556518555, "global_step": 65394, "epoch": 540} {"train_loss": -36.2181510925293, "global_step": 65395, "epoch": 540} {"train_loss": -35.83372497558594, "global_step": 65396, "epoch": 540} {"train_loss": -36.10499954223633, "global_step": 65397, "epoch": 540} {"train_loss": -35.34461212158203, "global_step": 65398, "epoch": 540} {"train_loss": -36.137367248535156, "global_step": 65399, "epoch": 540} {"train_loss": -35.82050704956055, "global_step": 65400, "epoch": 540} {"train_loss": -35.129486083984375, "global_step": 65401, "epoch": 540} {"train_loss": -36.00228500366211, "global_step": 65402, "epoch": 540} {"train_loss": -36.23719024658203, "global_step": 65403, "epoch": 540} {"train_loss": -35.70928955078125, "global_step": 65404, "epoch": 540} {"train_loss": -35.095401763916016, "global_step": 65405, "epoch": 540} {"train_loss": -35.58552932739258, "global_step": 65406, "epoch": 540} {"train_loss": -36.275936126708984, "global_step": 65407, "epoch": 540} {"train_loss": -35.6739616394043, "global_step": 65408, "epoch": 540} {"train_loss": -35.187103271484375, "global_step": 65409, "epoch": 540} {"train_loss": -34.50178146362305, "global_step": 65410, "epoch": 540} {"train_loss": -32.93900680541992, "global_step": 65411, "epoch": 540} {"train_loss": -31.302291870117188, "global_step": 65412, "epoch": 540} {"train_loss": -32.6305046081543, "global_step": 65413, "epoch": 540} {"train_loss": -34.30124282836914, "global_step": 65414, "epoch": 540} {"train_loss": -35.252960205078125, "global_step": 65415, "epoch": 540} {"train_loss": -31.563175201416016, "global_step": 65416, "epoch": 540} {"train_loss": -29.860641479492188, "global_step": 65417, "epoch": 540} {"train_loss": -30.821563720703125, "global_step": 65418, "epoch": 540} {"train_loss": -34.97576904296875, "global_step": 65419, "epoch": 540} {"train_loss": -31.6568603515625, "global_step": 65420, "epoch": 540} {"train_loss": -31.748510360717773, "global_step": 65421, "epoch": 540} {"train_loss": -35.1433219909668, "global_step": 65422, "epoch": 540} {"train_loss": -32.934322357177734, "global_step": 65423, "epoch": 540} {"train_loss": -34.91695022583008, "global_step": 65424, "epoch": 540} {"train_loss": -34.08646011352539, "global_step": 65425, "epoch": 540} {"train_loss": -34.009910583496094, "global_step": 65426, "epoch": 540} {"train_loss": -34.05635452270508, "global_step": 65427, "epoch": 540} {"train_loss": -34.79047393798828, "global_step": 65428, "epoch": 540} {"train_loss": -34.7639274597168, "global_step": 65429, "epoch": 540} {"train_loss": -34.38286590576172, "global_step": 65430, "epoch": 540} {"train_loss": -34.820308685302734, "global_step": 65431, "epoch": 540} {"train_loss": -34.724769592285156, "global_step": 65432, "epoch": 540} {"train_loss": -35.628353118896484, "global_step": 65433, "epoch": 540} {"train_loss": -34.45034408569336, "global_step": 65434, "epoch": 540} {"train_loss": -34.58852767944336, "global_step": 65435, "epoch": 540} {"train_loss": -34.8687629699707, "global_step": 65436, "epoch": 540} {"train_loss": -34.86799240112305, "global_step": 65437, "epoch": 540} {"train_loss": -34.501827239990234, "global_step": 65438, "epoch": 540} {"train_loss": -34.74972152709961, "global_step": 65439, "epoch": 540} {"train_loss": -35.31111526489258, "global_step": 65440, "epoch": 540} {"train_loss": -35.25117111206055, "global_step": 65441, "epoch": 540} {"train_loss": -34.90334701538086, "global_step": 65442, "epoch": 540} {"train_loss": -34.402400970458984, "global_step": 65443, "epoch": 540} {"train_loss": -34.327247619628906, "global_step": 65444, "epoch": 540} {"train_loss": -34.769683837890625, "global_step": 65445, "epoch": 540} {"train_loss": -34.885921478271484, "global_step": 65446, "epoch": 540} {"train_loss": -34.98284912109375, "global_step": 65447, "epoch": 540} {"train_loss": -35.33397674560547, "global_step": 65448, "epoch": 540} {"train_loss": -35.10561752319336, "global_step": 65449, "epoch": 540} {"train_loss": -34.447906494140625, "global_step": 65450, "epoch": 540} {"train_loss": -33.71681594848633, "global_step": 65451, "epoch": 540} {"train_loss": -32.79607009887695, "global_step": 65452, "epoch": 540} {"train_loss": -35.3138313293457, "global_step": 65453, "epoch": 540} {"train_loss": -35.12103271484375, "global_step": 65454, "epoch": 540} {"train_loss": -34.39681625366211, "global_step": 65455, "epoch": 540} {"train_loss": -35.194332122802734, "global_step": 65456, "epoch": 540} {"train_loss": -35.1593132019043, "global_step": 65457, "epoch": 540} {"train_loss": -34.258663177490234, "global_step": 65458, "epoch": 540} {"train_loss": -35.59185791015625, "global_step": 65459, "epoch": 540} {"train_loss": -34.864726626183376, "global_step": 65460, "epoch": 540, "val_loss": 2482688.0} {"train_loss": -35.4197883605957, "global_step": 65461, "epoch": 541} {"train_loss": -34.91684341430664, "global_step": 65462, "epoch": 541} {"train_loss": -35.48723220825195, "global_step": 65463, "epoch": 541} {"train_loss": -35.491310119628906, "global_step": 65464, "epoch": 541} {"train_loss": -35.66041946411133, "global_step": 65465, "epoch": 541} {"train_loss": -36.0823974609375, "global_step": 65466, "epoch": 541} {"train_loss": -35.32550048828125, "global_step": 65467, "epoch": 541} {"train_loss": -35.682064056396484, "global_step": 65468, "epoch": 541} {"train_loss": -35.35501480102539, "global_step": 65469, "epoch": 541} {"train_loss": -34.533912658691406, "global_step": 65470, "epoch": 541} {"train_loss": -35.12319564819336, "global_step": 65471, "epoch": 541} {"train_loss": -35.3443489074707, "global_step": 65472, "epoch": 541} {"train_loss": -34.768856048583984, "global_step": 65473, "epoch": 541} {"train_loss": -35.54989242553711, "global_step": 65474, "epoch": 541} {"train_loss": -35.67741775512695, "global_step": 65475, "epoch": 541} {"train_loss": -35.74973678588867, "global_step": 65476, "epoch": 541} {"train_loss": -35.32898712158203, "global_step": 65477, "epoch": 541} {"train_loss": -35.36072540283203, "global_step": 65478, "epoch": 541} {"train_loss": -35.74604034423828, "global_step": 65479, "epoch": 541} {"train_loss": -35.5639762878418, "global_step": 65480, "epoch": 541} {"train_loss": -35.47658157348633, "global_step": 65481, "epoch": 541} {"train_loss": -35.016693115234375, "global_step": 65482, "epoch": 541} {"train_loss": -35.71090316772461, "global_step": 65483, "epoch": 541} {"train_loss": -35.13420104980469, "global_step": 65484, "epoch": 541} {"train_loss": -35.627376556396484, "global_step": 65485, "epoch": 541} {"train_loss": -36.0366325378418, "global_step": 65486, "epoch": 541} {"train_loss": -35.93750762939453, "global_step": 65487, "epoch": 541} {"train_loss": -36.045040130615234, "global_step": 65488, "epoch": 541} {"train_loss": -35.50667953491211, "global_step": 65489, "epoch": 541} {"train_loss": -35.649417877197266, "global_step": 65490, "epoch": 541} {"train_loss": -36.08486557006836, "global_step": 65491, "epoch": 541} {"train_loss": -35.76667404174805, "global_step": 65492, "epoch": 541} {"train_loss": -36.30159378051758, "global_step": 65493, "epoch": 541} {"train_loss": -35.67793273925781, "global_step": 65494, "epoch": 541} {"train_loss": -35.39799880981445, "global_step": 65495, "epoch": 541} {"train_loss": -35.87405014038086, "global_step": 65496, "epoch": 541} {"train_loss": -35.71136474609375, "global_step": 65497, "epoch": 541} {"train_loss": -36.27982711791992, "global_step": 65498, "epoch": 541} {"train_loss": -36.44108963012695, "global_step": 65499, "epoch": 541} {"train_loss": -35.590328216552734, "global_step": 65500, "epoch": 541} {"train_loss": -36.0986328125, "global_step": 65501, "epoch": 541} {"train_loss": -35.46881103515625, "global_step": 65502, "epoch": 541} {"train_loss": -35.904781341552734, "global_step": 65503, "epoch": 541} {"train_loss": -35.41554641723633, "global_step": 65504, "epoch": 541} {"train_loss": -36.5016975402832, "global_step": 65505, "epoch": 541} {"train_loss": -35.666133880615234, "global_step": 65506, "epoch": 541} {"train_loss": -35.97532272338867, "global_step": 65507, "epoch": 541} {"train_loss": -35.9679069519043, "global_step": 65508, "epoch": 541} {"train_loss": -35.92246627807617, "global_step": 65509, "epoch": 541} {"train_loss": -36.13813400268555, "global_step": 65510, "epoch": 541} {"train_loss": -36.08107376098633, "global_step": 65511, "epoch": 541} {"train_loss": -36.58944320678711, "global_step": 65512, "epoch": 541} {"train_loss": -36.44465255737305, "global_step": 65513, "epoch": 541} {"train_loss": -36.75510787963867, "global_step": 65514, "epoch": 541} {"train_loss": -36.412715911865234, "global_step": 65515, "epoch": 541} {"train_loss": -35.79899215698242, "global_step": 65516, "epoch": 541} {"train_loss": -36.81333923339844, "global_step": 65517, "epoch": 541} {"train_loss": -36.19110107421875, "global_step": 65518, "epoch": 541} {"train_loss": -35.9952392578125, "global_step": 65519, "epoch": 541} {"train_loss": -36.66106414794922, "global_step": 65520, "epoch": 541} {"train_loss": -36.76083755493164, "global_step": 65521, "epoch": 541} {"train_loss": -36.5708122253418, "global_step": 65522, "epoch": 541} {"train_loss": -36.321102142333984, "global_step": 65523, "epoch": 541} {"train_loss": -36.721473693847656, "global_step": 65524, "epoch": 541} {"train_loss": -35.85664749145508, "global_step": 65525, "epoch": 541} {"train_loss": -35.96560287475586, "global_step": 65526, "epoch": 541} {"train_loss": -35.89955520629883, "global_step": 65527, "epoch": 541} {"train_loss": -35.36903762817383, "global_step": 65528, "epoch": 541} {"train_loss": -36.47658920288086, "global_step": 65529, "epoch": 541} {"train_loss": -35.54926300048828, "global_step": 65530, "epoch": 541} {"train_loss": -36.3938102722168, "global_step": 65531, "epoch": 541} {"train_loss": -35.9040641784668, "global_step": 65532, "epoch": 541} {"train_loss": -35.61076354980469, "global_step": 65533, "epoch": 541} {"train_loss": -36.408573150634766, "global_step": 65534, "epoch": 541} {"train_loss": -35.11625289916992, "global_step": 65535, "epoch": 541} {"train_loss": -34.42330551147461, "global_step": 65536, "epoch": 541} {"train_loss": -32.200401306152344, "global_step": 65537, "epoch": 541} {"train_loss": -30.982685089111328, "global_step": 65538, "epoch": 541} {"train_loss": -32.857452392578125, "global_step": 65539, "epoch": 541} {"train_loss": -34.839473724365234, "global_step": 65540, "epoch": 541} {"train_loss": -35.836551666259766, "global_step": 65541, "epoch": 541} {"train_loss": -34.62641525268555, "global_step": 65542, "epoch": 541} {"train_loss": -33.144535064697266, "global_step": 65543, "epoch": 541} {"train_loss": -34.80934524536133, "global_step": 65544, "epoch": 541} {"train_loss": -35.39231491088867, "global_step": 65545, "epoch": 541} {"train_loss": -34.671566009521484, "global_step": 65546, "epoch": 541} {"train_loss": -35.31472396850586, "global_step": 65547, "epoch": 541} {"train_loss": -35.77294158935547, "global_step": 65548, "epoch": 541} {"train_loss": -35.95607376098633, "global_step": 65549, "epoch": 541} {"train_loss": -35.450679779052734, "global_step": 65550, "epoch": 541} {"train_loss": -35.24607467651367, "global_step": 65551, "epoch": 541} {"train_loss": -36.359588623046875, "global_step": 65552, "epoch": 541} {"train_loss": -35.74164581298828, "global_step": 65553, "epoch": 541} {"train_loss": -36.2621955871582, "global_step": 65554, "epoch": 541} {"train_loss": -35.70219039916992, "global_step": 65555, "epoch": 541} {"train_loss": -36.18649673461914, "global_step": 65556, "epoch": 541} {"train_loss": -36.16820526123047, "global_step": 65557, "epoch": 541} {"train_loss": -36.33024215698242, "global_step": 65558, "epoch": 541} {"train_loss": -35.76719665527344, "global_step": 65559, "epoch": 541} {"train_loss": -35.766700744628906, "global_step": 65560, "epoch": 541} {"train_loss": -35.76960372924805, "global_step": 65561, "epoch": 541} {"train_loss": -36.260169982910156, "global_step": 65562, "epoch": 541} {"train_loss": -36.28811264038086, "global_step": 65563, "epoch": 541} {"train_loss": -35.84920120239258, "global_step": 65564, "epoch": 541} {"train_loss": -36.5111198425293, "global_step": 65565, "epoch": 541} {"train_loss": -34.49725341796875, "global_step": 65566, "epoch": 541} {"train_loss": -36.376712799072266, "global_step": 65567, "epoch": 541} {"train_loss": -35.917579650878906, "global_step": 65568, "epoch": 541} {"train_loss": -36.395301818847656, "global_step": 65569, "epoch": 541} {"train_loss": -35.38649368286133, "global_step": 65570, "epoch": 541} {"train_loss": -36.06550979614258, "global_step": 65571, "epoch": 541} {"train_loss": -36.46669006347656, "global_step": 65572, "epoch": 541} {"train_loss": -36.27210235595703, "global_step": 65573, "epoch": 541} {"train_loss": -36.38641357421875, "global_step": 65574, "epoch": 541} {"train_loss": -36.46246337890625, "global_step": 65575, "epoch": 541} {"train_loss": -36.441192626953125, "global_step": 65576, "epoch": 541} {"train_loss": -36.4528923034668, "global_step": 65577, "epoch": 541} {"train_loss": -36.39128875732422, "global_step": 65578, "epoch": 541} {"train_loss": -36.045528411865234, "global_step": 65579, "epoch": 541} {"train_loss": -35.93379592895508, "global_step": 65580, "epoch": 541} {"train_loss": -35.7102810883325, "global_step": 65581, "epoch": 541, "val_loss": 2596752.25} {"train_loss": -35.08977127075195, "global_step": 65582, "epoch": 542} {"train_loss": -35.74312973022461, "global_step": 65583, "epoch": 542} {"train_loss": -35.93373107910156, "global_step": 65584, "epoch": 542} {"train_loss": -36.51070785522461, "global_step": 65585, "epoch": 542} {"train_loss": -36.34415817260742, "global_step": 65586, "epoch": 542} {"train_loss": -32.99873733520508, "global_step": 65587, "epoch": 542} {"train_loss": -31.79587173461914, "global_step": 65588, "epoch": 542} {"train_loss": -34.95798873901367, "global_step": 65589, "epoch": 542} {"train_loss": -35.09116744995117, "global_step": 65590, "epoch": 542} {"train_loss": -34.76751708984375, "global_step": 65591, "epoch": 542} {"train_loss": -33.1479606628418, "global_step": 65592, "epoch": 542} {"train_loss": -35.00458526611328, "global_step": 65593, "epoch": 542} {"train_loss": -35.40829086303711, "global_step": 65594, "epoch": 542} {"train_loss": -32.82710647583008, "global_step": 65595, "epoch": 542} {"train_loss": -35.12431335449219, "global_step": 65596, "epoch": 542} {"train_loss": -32.12990951538086, "global_step": 65597, "epoch": 542} {"train_loss": -34.40380096435547, "global_step": 65598, "epoch": 542} {"train_loss": -34.8109245300293, "global_step": 65599, "epoch": 542} {"train_loss": -33.46715545654297, "global_step": 65600, "epoch": 542} {"train_loss": -34.41898727416992, "global_step": 65601, "epoch": 542} {"train_loss": -34.552955627441406, "global_step": 65602, "epoch": 542} {"train_loss": -35.25880813598633, "global_step": 65603, "epoch": 542} {"train_loss": -34.62771224975586, "global_step": 65604, "epoch": 542} {"train_loss": -34.931396484375, "global_step": 65605, "epoch": 542} {"train_loss": -33.91592025756836, "global_step": 65606, "epoch": 542} {"train_loss": -34.715667724609375, "global_step": 65607, "epoch": 542} {"train_loss": -35.302001953125, "global_step": 65608, "epoch": 542} {"train_loss": -34.77366256713867, "global_step": 65609, "epoch": 542} {"train_loss": -35.040672302246094, "global_step": 65610, "epoch": 542} {"train_loss": -34.4698600769043, "global_step": 65611, "epoch": 542} {"train_loss": -34.82252502441406, "global_step": 65612, "epoch": 542} {"train_loss": -33.71342468261719, "global_step": 65613, "epoch": 542} {"train_loss": -34.4544563293457, "global_step": 65614, "epoch": 542} {"train_loss": -35.32340621948242, "global_step": 65615, "epoch": 542} {"train_loss": -34.88538360595703, "global_step": 65616, "epoch": 542} {"train_loss": -35.30707550048828, "global_step": 65617, "epoch": 542} {"train_loss": -35.28286361694336, "global_step": 65618, "epoch": 542} {"train_loss": -35.166046142578125, "global_step": 65619, "epoch": 542} {"train_loss": -35.402381896972656, "global_step": 65620, "epoch": 542} {"train_loss": -35.461769104003906, "global_step": 65621, "epoch": 542} {"train_loss": -35.26477813720703, "global_step": 65622, "epoch": 542} {"train_loss": -35.436405181884766, "global_step": 65623, "epoch": 542} {"train_loss": -35.4090690612793, "global_step": 65624, "epoch": 542} {"train_loss": -35.259151458740234, "global_step": 65625, "epoch": 542} {"train_loss": -35.90081024169922, "global_step": 65626, "epoch": 542} {"train_loss": -35.311187744140625, "global_step": 65627, "epoch": 542} {"train_loss": -35.4073371887207, "global_step": 65628, "epoch": 542} {"train_loss": -35.552677154541016, "global_step": 65629, "epoch": 542} {"train_loss": -35.281917572021484, "global_step": 65630, "epoch": 542} {"train_loss": -36.075138092041016, "global_step": 65631, "epoch": 542} {"train_loss": -35.41091537475586, "global_step": 65632, "epoch": 542} {"train_loss": -36.374202728271484, "global_step": 65633, "epoch": 542} {"train_loss": -35.94973373413086, "global_step": 65634, "epoch": 542} {"train_loss": -35.66547775268555, "global_step": 65635, "epoch": 542} {"train_loss": -36.434814453125, "global_step": 65636, "epoch": 542} {"train_loss": -35.408546447753906, "global_step": 65637, "epoch": 542} {"train_loss": -35.87468338012695, "global_step": 65638, "epoch": 542} {"train_loss": -36.26522445678711, "global_step": 65639, "epoch": 542} {"train_loss": -35.61227035522461, "global_step": 65640, "epoch": 542} {"train_loss": -36.16986083984375, "global_step": 65641, "epoch": 542} {"train_loss": -36.46516036987305, "global_step": 65642, "epoch": 542} {"train_loss": -36.096778869628906, "global_step": 65643, "epoch": 542} {"train_loss": -36.43282699584961, "global_step": 65644, "epoch": 542} {"train_loss": -36.410491943359375, "global_step": 65645, "epoch": 542} {"train_loss": -35.81303405761719, "global_step": 65646, "epoch": 542} {"train_loss": -36.43291091918945, "global_step": 65647, "epoch": 542} {"train_loss": -36.195621490478516, "global_step": 65648, "epoch": 542} {"train_loss": -36.15095901489258, "global_step": 65649, "epoch": 542} {"train_loss": -36.1894645690918, "global_step": 65650, "epoch": 542} {"train_loss": -34.191139221191406, "global_step": 65651, "epoch": 542} {"train_loss": -30.572751998901367, "global_step": 65652, "epoch": 542} {"train_loss": -24.33188247680664, "global_step": 65653, "epoch": 542} {"train_loss": -16.753461837768555, "global_step": 65654, "epoch": 542} {"train_loss": -22.984241485595703, "global_step": 65655, "epoch": 542} {"train_loss": -35.904232025146484, "global_step": 65656, "epoch": 542} {"train_loss": -29.555500030517578, "global_step": 65657, "epoch": 542} {"train_loss": -34.9832878112793, "global_step": 65658, "epoch": 542} {"train_loss": -30.916162490844727, "global_step": 65659, "epoch": 542} {"train_loss": -36.16400909423828, "global_step": 65660, "epoch": 542} {"train_loss": -32.42508316040039, "global_step": 65661, "epoch": 542} {"train_loss": -34.915809631347656, "global_step": 65662, "epoch": 542} {"train_loss": -33.991661071777344, "global_step": 65663, "epoch": 542} {"train_loss": -33.74374771118164, "global_step": 65664, "epoch": 542} {"train_loss": -35.35915756225586, "global_step": 65665, "epoch": 542} {"train_loss": -34.31522750854492, "global_step": 65666, "epoch": 542} {"train_loss": -34.92106246948242, "global_step": 65667, "epoch": 542} {"train_loss": -34.820037841796875, "global_step": 65668, "epoch": 542} {"train_loss": -35.58216094970703, "global_step": 65669, "epoch": 542} {"train_loss": -34.99728012084961, "global_step": 65670, "epoch": 542} {"train_loss": -35.624263763427734, "global_step": 65671, "epoch": 542} {"train_loss": -35.31019973754883, "global_step": 65672, "epoch": 542} {"train_loss": -35.89191436767578, "global_step": 65673, "epoch": 542} {"train_loss": -35.75126266479492, "global_step": 65674, "epoch": 542} {"train_loss": -36.030860900878906, "global_step": 65675, "epoch": 542} {"train_loss": -35.801021575927734, "global_step": 65676, "epoch": 542} {"train_loss": -36.27845764160156, "global_step": 65677, "epoch": 542} {"train_loss": -35.74272537231445, "global_step": 65678, "epoch": 542} {"train_loss": -36.082645416259766, "global_step": 65679, "epoch": 542} {"train_loss": -36.25170135498047, "global_step": 65680, "epoch": 542} {"train_loss": -35.892208099365234, "global_step": 65681, "epoch": 542} {"train_loss": -36.17353439331055, "global_step": 65682, "epoch": 542} {"train_loss": -36.30502700805664, "global_step": 65683, "epoch": 542} {"train_loss": -36.26405334472656, "global_step": 65684, "epoch": 542} {"train_loss": -36.10285568237305, "global_step": 65685, "epoch": 542} {"train_loss": -36.03873825073242, "global_step": 65686, "epoch": 542} {"train_loss": -35.89029312133789, "global_step": 65687, "epoch": 542} {"train_loss": -35.94327926635742, "global_step": 65688, "epoch": 542} {"train_loss": -35.8477897644043, "global_step": 65689, "epoch": 542} {"train_loss": -36.09646224975586, "global_step": 65690, "epoch": 542} {"train_loss": -35.789485931396484, "global_step": 65691, "epoch": 542} {"train_loss": -36.448280334472656, "global_step": 65692, "epoch": 542} {"train_loss": -36.4357795715332, "global_step": 65693, "epoch": 542} {"train_loss": -36.568546295166016, "global_step": 65694, "epoch": 542} {"train_loss": -36.448360443115234, "global_step": 65695, "epoch": 542} {"train_loss": -36.06893539428711, "global_step": 65696, "epoch": 542} {"train_loss": -35.37335968017578, "global_step": 65697, "epoch": 542} {"train_loss": -36.65389633178711, "global_step": 65698, "epoch": 542} {"train_loss": -36.18526840209961, "global_step": 65699, "epoch": 542} {"train_loss": -36.673248291015625, "global_step": 65700, "epoch": 542} {"train_loss": -34.81723403930664, "global_step": 65701, "epoch": 542} {"train_loss": -34.890879560108026, "global_step": 65702, "epoch": 542, "val_loss": 2555781.75} {"train_loss": -24.48979377746582, "global_step": 65703, "epoch": 543} {"train_loss": -34.634952545166016, "global_step": 65704, "epoch": 543} {"train_loss": -35.827449798583984, "global_step": 65705, "epoch": 543} {"train_loss": -34.373260498046875, "global_step": 65706, "epoch": 543} {"train_loss": -33.9042854309082, "global_step": 65707, "epoch": 543} {"train_loss": -36.1422119140625, "global_step": 65708, "epoch": 543} {"train_loss": -34.95743942260742, "global_step": 65709, "epoch": 543} {"train_loss": -33.70595932006836, "global_step": 65710, "epoch": 543} {"train_loss": -35.55037307739258, "global_step": 65711, "epoch": 543} {"train_loss": -34.86285400390625, "global_step": 65712, "epoch": 543} {"train_loss": -35.33191680908203, "global_step": 65713, "epoch": 543} {"train_loss": -35.644264221191406, "global_step": 65714, "epoch": 543} {"train_loss": -35.680946350097656, "global_step": 65715, "epoch": 543} {"train_loss": -35.60835647583008, "global_step": 65716, "epoch": 543} {"train_loss": -35.496944427490234, "global_step": 65717, "epoch": 543} {"train_loss": -35.460201263427734, "global_step": 65718, "epoch": 543} {"train_loss": -36.16785430908203, "global_step": 65719, "epoch": 543} {"train_loss": -35.468223571777344, "global_step": 65720, "epoch": 543} {"train_loss": -34.5698127746582, "global_step": 65721, "epoch": 543} {"train_loss": -34.53826141357422, "global_step": 65722, "epoch": 543} {"train_loss": -34.812232971191406, "global_step": 65723, "epoch": 543} {"train_loss": -34.460914611816406, "global_step": 65724, "epoch": 543} {"train_loss": -36.20992660522461, "global_step": 65725, "epoch": 543} {"train_loss": -35.34880447387695, "global_step": 65726, "epoch": 543} {"train_loss": -34.27178192138672, "global_step": 65727, "epoch": 543} {"train_loss": -34.667396545410156, "global_step": 65728, "epoch": 543} {"train_loss": -34.8172492980957, "global_step": 65729, "epoch": 543} {"train_loss": -35.700382232666016, "global_step": 65730, "epoch": 543} {"train_loss": -34.87186050415039, "global_step": 65731, "epoch": 543} {"train_loss": -34.75725173950195, "global_step": 65732, "epoch": 543} {"train_loss": -35.08396911621094, "global_step": 65733, "epoch": 543} {"train_loss": -34.571292877197266, "global_step": 65734, "epoch": 543} {"train_loss": -35.089271545410156, "global_step": 65735, "epoch": 543} {"train_loss": -35.27891159057617, "global_step": 65736, "epoch": 543} {"train_loss": -34.340065002441406, "global_step": 65737, "epoch": 543} {"train_loss": -35.416786193847656, "global_step": 65738, "epoch": 543} {"train_loss": -35.6572265625, "global_step": 65739, "epoch": 543} {"train_loss": -34.83372497558594, "global_step": 65740, "epoch": 543} {"train_loss": -33.51402282714844, "global_step": 65741, "epoch": 543} {"train_loss": -34.52479934692383, "global_step": 65742, "epoch": 543} {"train_loss": -36.30283737182617, "global_step": 65743, "epoch": 543} {"train_loss": -35.14208984375, "global_step": 65744, "epoch": 543} {"train_loss": -32.617164611816406, "global_step": 65745, "epoch": 543} {"train_loss": -35.71369552612305, "global_step": 65746, "epoch": 543} {"train_loss": -35.93650436401367, "global_step": 65747, "epoch": 543} {"train_loss": -35.53033447265625, "global_step": 65748, "epoch": 543} {"train_loss": -35.31363296508789, "global_step": 65749, "epoch": 543} {"train_loss": -35.77592468261719, "global_step": 65750, "epoch": 543} {"train_loss": -36.22249984741211, "global_step": 65751, "epoch": 543} {"train_loss": -36.11408996582031, "global_step": 65752, "epoch": 543} {"train_loss": -35.935791015625, "global_step": 65753, "epoch": 543} {"train_loss": -35.72013473510742, "global_step": 65754, "epoch": 543} {"train_loss": -36.098915100097656, "global_step": 65755, "epoch": 543} {"train_loss": -35.27730941772461, "global_step": 65756, "epoch": 543} {"train_loss": -35.2043571472168, "global_step": 65757, "epoch": 543} {"train_loss": -36.04983139038086, "global_step": 65758, "epoch": 543} {"train_loss": -36.3074951171875, "global_step": 65759, "epoch": 543} {"train_loss": -35.5567741394043, "global_step": 65760, "epoch": 543} {"train_loss": -34.74399948120117, "global_step": 65761, "epoch": 543} {"train_loss": -35.536128997802734, "global_step": 65762, "epoch": 543} {"train_loss": -35.25543212890625, "global_step": 65763, "epoch": 543} {"train_loss": -35.89154052734375, "global_step": 65764, "epoch": 543} {"train_loss": -35.16816329956055, "global_step": 65765, "epoch": 543} {"train_loss": -34.47060775756836, "global_step": 65766, "epoch": 543} {"train_loss": -34.927642822265625, "global_step": 65767, "epoch": 543} {"train_loss": -32.62847900390625, "global_step": 65768, "epoch": 543} {"train_loss": -34.65660095214844, "global_step": 65769, "epoch": 543} {"train_loss": -35.89806365966797, "global_step": 65770, "epoch": 543} {"train_loss": -35.74991989135742, "global_step": 65771, "epoch": 543} {"train_loss": -35.9700927734375, "global_step": 65772, "epoch": 543} {"train_loss": -35.503753662109375, "global_step": 65773, "epoch": 543} {"train_loss": -35.08079147338867, "global_step": 65774, "epoch": 543} {"train_loss": -35.88114547729492, "global_step": 65775, "epoch": 543} {"train_loss": -36.01328659057617, "global_step": 65776, "epoch": 543} {"train_loss": -36.14778137207031, "global_step": 65777, "epoch": 543} {"train_loss": -35.52220916748047, "global_step": 65778, "epoch": 543} {"train_loss": -36.0849494934082, "global_step": 65779, "epoch": 543} {"train_loss": -35.894554138183594, "global_step": 65780, "epoch": 543} {"train_loss": -35.90887451171875, "global_step": 65781, "epoch": 543} {"train_loss": -36.30296325683594, "global_step": 65782, "epoch": 543} {"train_loss": -35.7890739440918, "global_step": 65783, "epoch": 543} {"train_loss": -36.39308166503906, "global_step": 65784, "epoch": 543} {"train_loss": -35.94331741333008, "global_step": 65785, "epoch": 543} {"train_loss": -37.010459899902344, "global_step": 65786, "epoch": 543} {"train_loss": -35.44214630126953, "global_step": 65787, "epoch": 543} {"train_loss": -35.14094543457031, "global_step": 65788, "epoch": 543} {"train_loss": -35.519134521484375, "global_step": 65789, "epoch": 543} {"train_loss": -36.32978439331055, "global_step": 65790, "epoch": 543} {"train_loss": -35.55889129638672, "global_step": 65791, "epoch": 543} {"train_loss": -35.34493637084961, "global_step": 65792, "epoch": 543} {"train_loss": -36.29590606689453, "global_step": 65793, "epoch": 543} {"train_loss": -36.59638214111328, "global_step": 65794, "epoch": 543} {"train_loss": -36.560218811035156, "global_step": 65795, "epoch": 543} {"train_loss": -36.08931350708008, "global_step": 65796, "epoch": 543} {"train_loss": -35.387062072753906, "global_step": 65797, "epoch": 543} {"train_loss": -35.92502975463867, "global_step": 65798, "epoch": 543} {"train_loss": -35.5835075378418, "global_step": 65799, "epoch": 543} {"train_loss": -35.21908187866211, "global_step": 65800, "epoch": 543} {"train_loss": -35.6212158203125, "global_step": 65801, "epoch": 543} {"train_loss": -36.131866455078125, "global_step": 65802, "epoch": 543} {"train_loss": -35.883697509765625, "global_step": 65803, "epoch": 543} {"train_loss": -36.38484191894531, "global_step": 65804, "epoch": 543} {"train_loss": -34.82110595703125, "global_step": 65805, "epoch": 543} {"train_loss": -36.535282135009766, "global_step": 65806, "epoch": 543} {"train_loss": -35.733001708984375, "global_step": 65807, "epoch": 543} {"train_loss": -33.49678039550781, "global_step": 65808, "epoch": 543} {"train_loss": -35.431129455566406, "global_step": 65809, "epoch": 543} {"train_loss": -34.7347412109375, "global_step": 65810, "epoch": 543} {"train_loss": -34.70656204223633, "global_step": 65811, "epoch": 543} {"train_loss": -29.470947265625, "global_step": 65812, "epoch": 543} {"train_loss": -34.19319152832031, "global_step": 65813, "epoch": 543} {"train_loss": -32.44023513793945, "global_step": 65814, "epoch": 543} {"train_loss": -31.094970703125, "global_step": 65815, "epoch": 543} {"train_loss": -23.360422134399414, "global_step": 65816, "epoch": 543} {"train_loss": -30.10504150390625, "global_step": 65817, "epoch": 543} {"train_loss": -29.227725982666016, "global_step": 65818, "epoch": 543} {"train_loss": -32.77462387084961, "global_step": 65819, "epoch": 543} {"train_loss": -31.362319946289062, "global_step": 65820, "epoch": 543} {"train_loss": -32.31856918334961, "global_step": 65821, "epoch": 543} {"train_loss": -27.36356544494629, "global_step": 65822, "epoch": 543} {"train_loss": -34.779824075620034, "global_step": 65823, "epoch": 543, "val_loss": 2637624.0} {"train_loss": -31.447778701782227, "global_step": 65824, "epoch": 544} {"train_loss": -32.834938049316406, "global_step": 65825, "epoch": 544} {"train_loss": -32.25751876831055, "global_step": 65826, "epoch": 544} {"train_loss": -33.147281646728516, "global_step": 65827, "epoch": 544} {"train_loss": -31.063146591186523, "global_step": 65828, "epoch": 544} {"train_loss": -32.34629440307617, "global_step": 65829, "epoch": 544} {"train_loss": -32.431114196777344, "global_step": 65830, "epoch": 544} {"train_loss": -31.932477951049805, "global_step": 65831, "epoch": 544} {"train_loss": -32.222904205322266, "global_step": 65832, "epoch": 544} {"train_loss": -32.62434768676758, "global_step": 65833, "epoch": 544} {"train_loss": -33.9119987487793, "global_step": 65834, "epoch": 544} {"train_loss": -32.418697357177734, "global_step": 65835, "epoch": 544} {"train_loss": -33.211238861083984, "global_step": 65836, "epoch": 544} {"train_loss": -33.64014434814453, "global_step": 65837, "epoch": 544} {"train_loss": -33.288330078125, "global_step": 65838, "epoch": 544} {"train_loss": -33.69661331176758, "global_step": 65839, "epoch": 544} {"train_loss": -34.1081428527832, "global_step": 65840, "epoch": 544} {"train_loss": -33.38345718383789, "global_step": 65841, "epoch": 544} {"train_loss": -33.26669692993164, "global_step": 65842, "epoch": 544} {"train_loss": -34.08482360839844, "global_step": 65843, "epoch": 544} {"train_loss": -32.4415168762207, "global_step": 65844, "epoch": 544} {"train_loss": -34.389068603515625, "global_step": 65845, "epoch": 544} {"train_loss": -33.57487106323242, "global_step": 65846, "epoch": 544} {"train_loss": -33.86417007446289, "global_step": 65847, "epoch": 544} {"train_loss": -33.870521545410156, "global_step": 65848, "epoch": 544} {"train_loss": -34.22212600708008, "global_step": 65849, "epoch": 544} {"train_loss": -34.52635192871094, "global_step": 65850, "epoch": 544} {"train_loss": -34.26205062866211, "global_step": 65851, "epoch": 544} {"train_loss": -34.454917907714844, "global_step": 65852, "epoch": 544} {"train_loss": -34.9403190612793, "global_step": 65853, "epoch": 544} {"train_loss": -34.30221176147461, "global_step": 65854, "epoch": 544} {"train_loss": -34.343563079833984, "global_step": 65855, "epoch": 544} {"train_loss": -34.43488311767578, "global_step": 65856, "epoch": 544} {"train_loss": -34.74445724487305, "global_step": 65857, "epoch": 544} {"train_loss": -34.282623291015625, "global_step": 65858, "epoch": 544} {"train_loss": -34.80771255493164, "global_step": 65859, "epoch": 544} {"train_loss": -34.97764205932617, "global_step": 65860, "epoch": 544} {"train_loss": -34.85829162597656, "global_step": 65861, "epoch": 544} {"train_loss": -35.12982177734375, "global_step": 65862, "epoch": 544} {"train_loss": -34.98307418823242, "global_step": 65863, "epoch": 544} {"train_loss": -34.94089126586914, "global_step": 65864, "epoch": 544} {"train_loss": -34.96479415893555, "global_step": 65865, "epoch": 544} {"train_loss": -35.23256301879883, "global_step": 65866, "epoch": 544} {"train_loss": -35.506629943847656, "global_step": 65867, "epoch": 544} {"train_loss": -35.2886848449707, "global_step": 65868, "epoch": 544} {"train_loss": -34.99043655395508, "global_step": 65869, "epoch": 544} {"train_loss": -35.85224151611328, "global_step": 65870, "epoch": 544} {"train_loss": -35.06602478027344, "global_step": 65871, "epoch": 544} {"train_loss": -35.3101692199707, "global_step": 65872, "epoch": 544} {"train_loss": -35.212066650390625, "global_step": 65873, "epoch": 544} {"train_loss": -36.02438735961914, "global_step": 65874, "epoch": 544} {"train_loss": -35.4757194519043, "global_step": 65875, "epoch": 544} {"train_loss": -35.827945709228516, "global_step": 65876, "epoch": 544} {"train_loss": -36.137786865234375, "global_step": 65877, "epoch": 544} {"train_loss": -35.51198959350586, "global_step": 65878, "epoch": 544} {"train_loss": -35.325950622558594, "global_step": 65879, "epoch": 544} {"train_loss": -35.48682403564453, "global_step": 65880, "epoch": 544} {"train_loss": -35.61478805541992, "global_step": 65881, "epoch": 544} {"train_loss": -35.24528121948242, "global_step": 65882, "epoch": 544} {"train_loss": -35.71577072143555, "global_step": 65883, "epoch": 544} {"train_loss": -36.23361587524414, "global_step": 65884, "epoch": 544} {"train_loss": -35.483089447021484, "global_step": 65885, "epoch": 544} {"train_loss": -35.39608383178711, "global_step": 65886, "epoch": 544} {"train_loss": -36.216156005859375, "global_step": 65887, "epoch": 544} {"train_loss": -35.989131927490234, "global_step": 65888, "epoch": 544} {"train_loss": -35.6767578125, "global_step": 65889, "epoch": 544} {"train_loss": -35.963287353515625, "global_step": 65890, "epoch": 544} {"train_loss": -36.19453430175781, "global_step": 65891, "epoch": 544} {"train_loss": -35.72136306762695, "global_step": 65892, "epoch": 544} {"train_loss": -35.400150299072266, "global_step": 65893, "epoch": 544} {"train_loss": -35.79282760620117, "global_step": 65894, "epoch": 544} {"train_loss": -36.5120964050293, "global_step": 65895, "epoch": 544} {"train_loss": -36.713966369628906, "global_step": 65896, "epoch": 544} {"train_loss": -36.39463806152344, "global_step": 65897, "epoch": 544} {"train_loss": -36.393333435058594, "global_step": 65898, "epoch": 544} {"train_loss": -36.579803466796875, "global_step": 65899, "epoch": 544} {"train_loss": -36.117897033691406, "global_step": 65900, "epoch": 544} {"train_loss": -36.97701644897461, "global_step": 65901, "epoch": 544} {"train_loss": -36.40721130371094, "global_step": 65902, "epoch": 544} {"train_loss": -36.364986419677734, "global_step": 65903, "epoch": 544} {"train_loss": -36.597835540771484, "global_step": 65904, "epoch": 544} {"train_loss": -36.69727325439453, "global_step": 65905, "epoch": 544} {"train_loss": -36.477378845214844, "global_step": 65906, "epoch": 544} {"train_loss": -36.687068939208984, "global_step": 65907, "epoch": 544} {"train_loss": -36.967041015625, "global_step": 65908, "epoch": 544} {"train_loss": -36.971397399902344, "global_step": 65909, "epoch": 544} {"train_loss": -36.85136795043945, "global_step": 65910, "epoch": 544} {"train_loss": -36.657371520996094, "global_step": 65911, "epoch": 544} {"train_loss": -36.44029998779297, "global_step": 65912, "epoch": 544} {"train_loss": -37.30916976928711, "global_step": 65913, "epoch": 544} {"train_loss": -36.826168060302734, "global_step": 65914, "epoch": 544} {"train_loss": -37.003623962402344, "global_step": 65915, "epoch": 544} {"train_loss": -36.34418487548828, "global_step": 65916, "epoch": 544} {"train_loss": -36.890132904052734, "global_step": 65917, "epoch": 544} {"train_loss": -37.04237747192383, "global_step": 65918, "epoch": 544} {"train_loss": -37.122642517089844, "global_step": 65919, "epoch": 544} {"train_loss": -36.52923583984375, "global_step": 65920, "epoch": 544} {"train_loss": -36.40757751464844, "global_step": 65921, "epoch": 544} {"train_loss": -36.843929290771484, "global_step": 65922, "epoch": 544} {"train_loss": -36.0162467956543, "global_step": 65923, "epoch": 544} {"train_loss": -35.625816345214844, "global_step": 65924, "epoch": 544} {"train_loss": -33.3624267578125, "global_step": 65925, "epoch": 544} {"train_loss": -32.14070129394531, "global_step": 65926, "epoch": 544} {"train_loss": -30.23846435546875, "global_step": 65927, "epoch": 544} {"train_loss": -27.717817306518555, "global_step": 65928, "epoch": 544} {"train_loss": -28.33808708190918, "global_step": 65929, "epoch": 544} {"train_loss": -33.886695861816406, "global_step": 65930, "epoch": 544} {"train_loss": -34.37725830078125, "global_step": 65931, "epoch": 544} {"train_loss": -32.28398132324219, "global_step": 65932, "epoch": 544} {"train_loss": -31.610891342163086, "global_step": 65933, "epoch": 544} {"train_loss": -34.09413528442383, "global_step": 65934, "epoch": 544} {"train_loss": -33.92531967163086, "global_step": 65935, "epoch": 544} {"train_loss": -33.288875579833984, "global_step": 65936, "epoch": 544} {"train_loss": -32.81551742553711, "global_step": 65937, "epoch": 544} {"train_loss": -32.690975189208984, "global_step": 65938, "epoch": 544} {"train_loss": -34.88837814331055, "global_step": 65939, "epoch": 544} {"train_loss": -34.555171966552734, "global_step": 65940, "epoch": 544} {"train_loss": -34.61863327026367, "global_step": 65941, "epoch": 544} {"train_loss": -34.375301361083984, "global_step": 65942, "epoch": 544} {"train_loss": -35.7207145690918, "global_step": 65943, "epoch": 544} {"train_loss": -34.76349264728136, "global_step": 65944, "epoch": 544, "val_loss": 2510402.5} {"train_loss": -34.323238372802734, "global_step": 65945, "epoch": 545} {"train_loss": -35.64101791381836, "global_step": 65946, "epoch": 545} {"train_loss": -33.9561767578125, "global_step": 65947, "epoch": 545} {"train_loss": -35.989479064941406, "global_step": 65948, "epoch": 545} {"train_loss": -35.33675765991211, "global_step": 65949, "epoch": 545} {"train_loss": -35.47774124145508, "global_step": 65950, "epoch": 545} {"train_loss": -35.94571304321289, "global_step": 65951, "epoch": 545} {"train_loss": -35.463809967041016, "global_step": 65952, "epoch": 545} {"train_loss": -35.408416748046875, "global_step": 65953, "epoch": 545} {"train_loss": -36.091304779052734, "global_step": 65954, "epoch": 545} {"train_loss": -36.294395446777344, "global_step": 65955, "epoch": 545} {"train_loss": -35.736053466796875, "global_step": 65956, "epoch": 545} {"train_loss": -35.95494079589844, "global_step": 65957, "epoch": 545} {"train_loss": -35.52958297729492, "global_step": 65958, "epoch": 545} {"train_loss": -36.08747482299805, "global_step": 65959, "epoch": 545} {"train_loss": -35.95840072631836, "global_step": 65960, "epoch": 545} {"train_loss": -36.08919906616211, "global_step": 65961, "epoch": 545} {"train_loss": -36.05386734008789, "global_step": 65962, "epoch": 545} {"train_loss": -36.68581771850586, "global_step": 65963, "epoch": 545} {"train_loss": -35.910030364990234, "global_step": 65964, "epoch": 545} {"train_loss": -36.37114334106445, "global_step": 65965, "epoch": 545} {"train_loss": -36.68805694580078, "global_step": 65966, "epoch": 545} {"train_loss": -36.23713302612305, "global_step": 65967, "epoch": 545} {"train_loss": -36.079505920410156, "global_step": 65968, "epoch": 545} {"train_loss": -36.704097747802734, "global_step": 65969, "epoch": 545} {"train_loss": -36.87691879272461, "global_step": 65970, "epoch": 545} {"train_loss": -36.727970123291016, "global_step": 65971, "epoch": 545} {"train_loss": -36.7365608215332, "global_step": 65972, "epoch": 545} {"train_loss": -37.018829345703125, "global_step": 65973, "epoch": 545} {"train_loss": -37.05146408081055, "global_step": 65974, "epoch": 545} {"train_loss": -36.87177658081055, "global_step": 65975, "epoch": 545} {"train_loss": -36.736732482910156, "global_step": 65976, "epoch": 545} {"train_loss": -36.29555892944336, "global_step": 65977, "epoch": 545} {"train_loss": -36.197113037109375, "global_step": 65978, "epoch": 545} {"train_loss": -34.75283432006836, "global_step": 65979, "epoch": 545} {"train_loss": -30.384536743164062, "global_step": 65980, "epoch": 545} {"train_loss": -19.490060806274414, "global_step": 65981, "epoch": 545} {"train_loss": -25.23370933532715, "global_step": 65982, "epoch": 545} {"train_loss": -35.485843658447266, "global_step": 65983, "epoch": 545} {"train_loss": -29.049596786499023, "global_step": 65984, "epoch": 545} {"train_loss": -35.206233978271484, "global_step": 65985, "epoch": 545} {"train_loss": -29.986576080322266, "global_step": 65986, "epoch": 545} {"train_loss": -34.712440490722656, "global_step": 65987, "epoch": 545} {"train_loss": -31.04938316345215, "global_step": 65988, "epoch": 545} {"train_loss": -35.2631721496582, "global_step": 65989, "epoch": 545} {"train_loss": -35.060726165771484, "global_step": 65990, "epoch": 545} {"train_loss": -31.190826416015625, "global_step": 65991, "epoch": 545} {"train_loss": -34.38311767578125, "global_step": 65992, "epoch": 545} {"train_loss": -35.13737869262695, "global_step": 65993, "epoch": 545} {"train_loss": -34.625640869140625, "global_step": 65994, "epoch": 545} {"train_loss": -34.6285514831543, "global_step": 65995, "epoch": 545} {"train_loss": -35.310916900634766, "global_step": 65996, "epoch": 545} {"train_loss": -35.130916595458984, "global_step": 65997, "epoch": 545} {"train_loss": -35.790428161621094, "global_step": 65998, "epoch": 545} {"train_loss": -35.5556526184082, "global_step": 65999, "epoch": 545} {"train_loss": -35.444580078125, "global_step": 66000, "epoch": 545} {"train_loss": -35.3355827331543, "global_step": 66001, "epoch": 545} {"train_loss": -36.083221435546875, "global_step": 66002, "epoch": 545} {"train_loss": -35.490577697753906, "global_step": 66003, "epoch": 545} {"train_loss": -36.2623405456543, "global_step": 66004, "epoch": 545} {"train_loss": -35.84989929199219, "global_step": 66005, "epoch": 545} {"train_loss": -35.58512496948242, "global_step": 66006, "epoch": 545} {"train_loss": -36.13904571533203, "global_step": 66007, "epoch": 545} {"train_loss": -36.206722259521484, "global_step": 66008, "epoch": 545} {"train_loss": -35.894710540771484, "global_step": 66009, "epoch": 545} {"train_loss": -36.225460052490234, "global_step": 66010, "epoch": 545} {"train_loss": -36.18008041381836, "global_step": 66011, "epoch": 545} {"train_loss": -36.42306137084961, "global_step": 66012, "epoch": 545} {"train_loss": -35.56301498413086, "global_step": 66013, "epoch": 545} {"train_loss": -36.52664566040039, "global_step": 66014, "epoch": 545} {"train_loss": -36.301856994628906, "global_step": 66015, "epoch": 545} {"train_loss": -36.261138916015625, "global_step": 66016, "epoch": 545} {"train_loss": -35.3028564453125, "global_step": 66017, "epoch": 545} {"train_loss": -35.762611389160156, "global_step": 66018, "epoch": 545} {"train_loss": -35.35361862182617, "global_step": 66019, "epoch": 545} {"train_loss": -35.6317253112793, "global_step": 66020, "epoch": 545} {"train_loss": -36.162200927734375, "global_step": 66021, "epoch": 545} {"train_loss": -36.60599899291992, "global_step": 66022, "epoch": 545} {"train_loss": -36.59456253051758, "global_step": 66023, "epoch": 545} {"train_loss": -35.88345718383789, "global_step": 66024, "epoch": 545} {"train_loss": -34.69993209838867, "global_step": 66025, "epoch": 545} {"train_loss": -32.18260955810547, "global_step": 66026, "epoch": 545} {"train_loss": -30.8005428314209, "global_step": 66027, "epoch": 545} {"train_loss": -27.965864181518555, "global_step": 66028, "epoch": 545} {"train_loss": -28.36224365234375, "global_step": 66029, "epoch": 545} {"train_loss": -33.49330520629883, "global_step": 66030, "epoch": 545} {"train_loss": -32.97344207763672, "global_step": 66031, "epoch": 545} {"train_loss": -31.95551872253418, "global_step": 66032, "epoch": 545} {"train_loss": -34.61033248901367, "global_step": 66033, "epoch": 545} {"train_loss": -33.95589828491211, "global_step": 66034, "epoch": 545} {"train_loss": -33.99540328979492, "global_step": 66035, "epoch": 545} {"train_loss": -35.48476791381836, "global_step": 66036, "epoch": 545} {"train_loss": -34.73091506958008, "global_step": 66037, "epoch": 545} {"train_loss": -35.102210998535156, "global_step": 66038, "epoch": 545} {"train_loss": -34.95258712768555, "global_step": 66039, "epoch": 545} {"train_loss": -34.05050277709961, "global_step": 66040, "epoch": 545} {"train_loss": -33.64311218261719, "global_step": 66041, "epoch": 545} {"train_loss": -35.343727111816406, "global_step": 66042, "epoch": 545} {"train_loss": -34.815059661865234, "global_step": 66043, "epoch": 545} {"train_loss": -34.48726272583008, "global_step": 66044, "epoch": 545} {"train_loss": -34.57925033569336, "global_step": 66045, "epoch": 545} {"train_loss": -35.8289680480957, "global_step": 66046, "epoch": 545} {"train_loss": -36.058250427246094, "global_step": 66047, "epoch": 545} {"train_loss": -35.23673629760742, "global_step": 66048, "epoch": 545} {"train_loss": -36.013675689697266, "global_step": 66049, "epoch": 545} {"train_loss": -35.752986907958984, "global_step": 66050, "epoch": 545} {"train_loss": -35.96342086791992, "global_step": 66051, "epoch": 545} {"train_loss": -35.69971466064453, "global_step": 66052, "epoch": 545} {"train_loss": -36.2308349609375, "global_step": 66053, "epoch": 545} {"train_loss": -36.083282470703125, "global_step": 66054, "epoch": 545} {"train_loss": -36.2557258605957, "global_step": 66055, "epoch": 545} {"train_loss": -36.0330924987793, "global_step": 66056, "epoch": 545} {"train_loss": -36.32233428955078, "global_step": 66057, "epoch": 545} {"train_loss": -36.356300354003906, "global_step": 66058, "epoch": 545} {"train_loss": -36.5037841796875, "global_step": 66059, "epoch": 545} {"train_loss": -35.89044189453125, "global_step": 66060, "epoch": 545} {"train_loss": -36.348182678222656, "global_step": 66061, "epoch": 545} {"train_loss": -36.25020980834961, "global_step": 66062, "epoch": 545} {"train_loss": -36.53965377807617, "global_step": 66063, "epoch": 545} {"train_loss": -36.60249710083008, "global_step": 66064, "epoch": 545} {"train_loss": -35.02124185798582, "global_step": 66065, "epoch": 545, "val_loss": 2495208.5} {"train_loss": -36.47206497192383, "global_step": 66066, "epoch": 546} {"train_loss": -36.67831802368164, "global_step": 66067, "epoch": 546} {"train_loss": -36.21700668334961, "global_step": 66068, "epoch": 546} {"train_loss": -36.534019470214844, "global_step": 66069, "epoch": 546} {"train_loss": -36.78078842163086, "global_step": 66070, "epoch": 546} {"train_loss": -36.813663482666016, "global_step": 66071, "epoch": 546} {"train_loss": -36.75440216064453, "global_step": 66072, "epoch": 546} {"train_loss": -36.73347091674805, "global_step": 66073, "epoch": 546} {"train_loss": -36.73960494995117, "global_step": 66074, "epoch": 546} {"train_loss": -36.96525192260742, "global_step": 66075, "epoch": 546} {"train_loss": -36.423492431640625, "global_step": 66076, "epoch": 546} {"train_loss": -37.268402099609375, "global_step": 66077, "epoch": 546} {"train_loss": -36.354888916015625, "global_step": 66078, "epoch": 546} {"train_loss": -36.48508834838867, "global_step": 66079, "epoch": 546} {"train_loss": -36.43528366088867, "global_step": 66080, "epoch": 546} {"train_loss": -36.96500015258789, "global_step": 66081, "epoch": 546} {"train_loss": -35.61184310913086, "global_step": 66082, "epoch": 546} {"train_loss": -35.984771728515625, "global_step": 66083, "epoch": 546} {"train_loss": -35.7615852355957, "global_step": 66084, "epoch": 546} {"train_loss": -36.18971633911133, "global_step": 66085, "epoch": 546} {"train_loss": -36.68442916870117, "global_step": 66086, "epoch": 546} {"train_loss": -36.08027267456055, "global_step": 66087, "epoch": 546} {"train_loss": -35.4837760925293, "global_step": 66088, "epoch": 546} {"train_loss": -36.88639831542969, "global_step": 66089, "epoch": 546} {"train_loss": -35.35060501098633, "global_step": 66090, "epoch": 546} {"train_loss": -35.64607620239258, "global_step": 66091, "epoch": 546} {"train_loss": -36.674617767333984, "global_step": 66092, "epoch": 546} {"train_loss": -34.910003662109375, "global_step": 66093, "epoch": 546} {"train_loss": -35.44284439086914, "global_step": 66094, "epoch": 546} {"train_loss": -35.78867721557617, "global_step": 66095, "epoch": 546} {"train_loss": -35.88994216918945, "global_step": 66096, "epoch": 546} {"train_loss": -36.165157318115234, "global_step": 66097, "epoch": 546} {"train_loss": -36.06319808959961, "global_step": 66098, "epoch": 546} {"train_loss": -36.210567474365234, "global_step": 66099, "epoch": 546} {"train_loss": -32.30656051635742, "global_step": 66100, "epoch": 546} {"train_loss": -30.154541015625, "global_step": 66101, "epoch": 546} {"train_loss": -33.68384552001953, "global_step": 66102, "epoch": 546} {"train_loss": -35.88079071044922, "global_step": 66103, "epoch": 546} {"train_loss": -33.87111282348633, "global_step": 66104, "epoch": 546} {"train_loss": -34.69753646850586, "global_step": 66105, "epoch": 546} {"train_loss": -31.1971492767334, "global_step": 66106, "epoch": 546} {"train_loss": -33.10648727416992, "global_step": 66107, "epoch": 546} {"train_loss": -34.869720458984375, "global_step": 66108, "epoch": 546} {"train_loss": -34.526878356933594, "global_step": 66109, "epoch": 546} {"train_loss": -34.5472297668457, "global_step": 66110, "epoch": 546} {"train_loss": -34.22837448120117, "global_step": 66111, "epoch": 546} {"train_loss": -33.213890075683594, "global_step": 66112, "epoch": 546} {"train_loss": -32.92765426635742, "global_step": 66113, "epoch": 546} {"train_loss": -32.59015655517578, "global_step": 66114, "epoch": 546} {"train_loss": -31.634733200073242, "global_step": 66115, "epoch": 546} {"train_loss": -33.483497619628906, "global_step": 66116, "epoch": 546} {"train_loss": -35.7938232421875, "global_step": 66117, "epoch": 546} {"train_loss": -35.15798568725586, "global_step": 66118, "epoch": 546} {"train_loss": -35.2464714050293, "global_step": 66119, "epoch": 546} {"train_loss": -35.6251335144043, "global_step": 66120, "epoch": 546} {"train_loss": -34.65487289428711, "global_step": 66121, "epoch": 546} {"train_loss": -34.54676055908203, "global_step": 66122, "epoch": 546} {"train_loss": -35.376094818115234, "global_step": 66123, "epoch": 546} {"train_loss": -35.039432525634766, "global_step": 66124, "epoch": 546} {"train_loss": -34.73723220825195, "global_step": 66125, "epoch": 546} {"train_loss": -35.63897705078125, "global_step": 66126, "epoch": 546} {"train_loss": -35.46006393432617, "global_step": 66127, "epoch": 546} {"train_loss": -35.46052932739258, "global_step": 66128, "epoch": 546} {"train_loss": -34.900489807128906, "global_step": 66129, "epoch": 546} {"train_loss": -35.64849853515625, "global_step": 66130, "epoch": 546} {"train_loss": -33.73124313354492, "global_step": 66131, "epoch": 546} {"train_loss": -35.48960494995117, "global_step": 66132, "epoch": 546} {"train_loss": -35.44865036010742, "global_step": 66133, "epoch": 546} {"train_loss": -35.63025665283203, "global_step": 66134, "epoch": 546} {"train_loss": -36.08552932739258, "global_step": 66135, "epoch": 546} {"train_loss": -35.66965103149414, "global_step": 66136, "epoch": 546} {"train_loss": -36.04096984863281, "global_step": 66137, "epoch": 546} {"train_loss": -35.82379150390625, "global_step": 66138, "epoch": 546} {"train_loss": -35.90370559692383, "global_step": 66139, "epoch": 546} {"train_loss": -36.167625427246094, "global_step": 66140, "epoch": 546} {"train_loss": -36.076358795166016, "global_step": 66141, "epoch": 546} {"train_loss": -35.856021881103516, "global_step": 66142, "epoch": 546} {"train_loss": -36.31693649291992, "global_step": 66143, "epoch": 546} {"train_loss": -36.128353118896484, "global_step": 66144, "epoch": 546} {"train_loss": -35.85407257080078, "global_step": 66145, "epoch": 546} {"train_loss": -35.63864517211914, "global_step": 66146, "epoch": 546} {"train_loss": -36.10000228881836, "global_step": 66147, "epoch": 546} {"train_loss": -36.515167236328125, "global_step": 66148, "epoch": 546} {"train_loss": -36.0196647644043, "global_step": 66149, "epoch": 546} {"train_loss": -35.946441650390625, "global_step": 66150, "epoch": 546} {"train_loss": -36.10927963256836, "global_step": 66151, "epoch": 546} {"train_loss": -36.57567596435547, "global_step": 66152, "epoch": 546} {"train_loss": -35.7814826965332, "global_step": 66153, "epoch": 546} {"train_loss": -35.1193962097168, "global_step": 66154, "epoch": 546} {"train_loss": -35.41487121582031, "global_step": 66155, "epoch": 546} {"train_loss": -36.00092697143555, "global_step": 66156, "epoch": 546} {"train_loss": -36.65005111694336, "global_step": 66157, "epoch": 546} {"train_loss": -36.44590377807617, "global_step": 66158, "epoch": 546} {"train_loss": -36.10414123535156, "global_step": 66159, "epoch": 546} {"train_loss": -35.63867950439453, "global_step": 66160, "epoch": 546} {"train_loss": -34.96589279174805, "global_step": 66161, "epoch": 546} {"train_loss": -34.77592086791992, "global_step": 66162, "epoch": 546} {"train_loss": -36.49214553833008, "global_step": 66163, "epoch": 546} {"train_loss": -36.532405853271484, "global_step": 66164, "epoch": 546} {"train_loss": -35.58645248413086, "global_step": 66165, "epoch": 546} {"train_loss": -36.91512680053711, "global_step": 66166, "epoch": 546} {"train_loss": -36.80817794799805, "global_step": 66167, "epoch": 546} {"train_loss": -36.209041595458984, "global_step": 66168, "epoch": 546} {"train_loss": -35.61376953125, "global_step": 66169, "epoch": 546} {"train_loss": -36.27744674682617, "global_step": 66170, "epoch": 546} {"train_loss": -36.313636779785156, "global_step": 66171, "epoch": 546} {"train_loss": -36.106258392333984, "global_step": 66172, "epoch": 546} {"train_loss": -35.936458587646484, "global_step": 66173, "epoch": 546} {"train_loss": -36.30306625366211, "global_step": 66174, "epoch": 546} {"train_loss": -36.00431442260742, "global_step": 66175, "epoch": 546} {"train_loss": -37.045955657958984, "global_step": 66176, "epoch": 546} {"train_loss": -36.23407745361328, "global_step": 66177, "epoch": 546} {"train_loss": -36.44537353515625, "global_step": 66178, "epoch": 546} {"train_loss": -34.98786163330078, "global_step": 66179, "epoch": 546} {"train_loss": -35.536128997802734, "global_step": 66180, "epoch": 546} {"train_loss": -35.708736419677734, "global_step": 66181, "epoch": 546} {"train_loss": -34.850276947021484, "global_step": 66182, "epoch": 546} {"train_loss": -34.9460563659668, "global_step": 66183, "epoch": 546} {"train_loss": -34.97072982788086, "global_step": 66184, "epoch": 546} {"train_loss": -35.95941925048828, "global_step": 66185, "epoch": 546} {"train_loss": -35.54333158761017, "global_step": 66186, "epoch": 546, "val_loss": 2500460.0} {"train_loss": -32.38331985473633, "global_step": 66187, "epoch": 547} {"train_loss": -33.6201171875, "global_step": 66188, "epoch": 547} {"train_loss": -34.12440490722656, "global_step": 66189, "epoch": 547} {"train_loss": -35.07485580444336, "global_step": 66190, "epoch": 547} {"train_loss": -35.40800094604492, "global_step": 66191, "epoch": 547} {"train_loss": -33.5828742980957, "global_step": 66192, "epoch": 547} {"train_loss": -34.2561149597168, "global_step": 66193, "epoch": 547} {"train_loss": -33.97265625, "global_step": 66194, "epoch": 547} {"train_loss": -34.09663009643555, "global_step": 66195, "epoch": 547} {"train_loss": -34.30367660522461, "global_step": 66196, "epoch": 547} {"train_loss": -35.123146057128906, "global_step": 66197, "epoch": 547} {"train_loss": -36.14667510986328, "global_step": 66198, "epoch": 547} {"train_loss": -35.08769226074219, "global_step": 66199, "epoch": 547} {"train_loss": -35.389400482177734, "global_step": 66200, "epoch": 547} {"train_loss": -35.835750579833984, "global_step": 66201, "epoch": 547} {"train_loss": -36.380149841308594, "global_step": 66202, "epoch": 547} {"train_loss": -34.868770599365234, "global_step": 66203, "epoch": 547} {"train_loss": -35.88771438598633, "global_step": 66204, "epoch": 547} {"train_loss": -36.3642578125, "global_step": 66205, "epoch": 547} {"train_loss": -36.12871170043945, "global_step": 66206, "epoch": 547} {"train_loss": -35.892459869384766, "global_step": 66207, "epoch": 547} {"train_loss": -36.29933166503906, "global_step": 66208, "epoch": 547} {"train_loss": -36.2415771484375, "global_step": 66209, "epoch": 547} {"train_loss": -35.475929260253906, "global_step": 66210, "epoch": 547} {"train_loss": -36.15814208984375, "global_step": 66211, "epoch": 547} {"train_loss": -36.4239387512207, "global_step": 66212, "epoch": 547} {"train_loss": -35.688575744628906, "global_step": 66213, "epoch": 547} {"train_loss": -35.29281234741211, "global_step": 66214, "epoch": 547} {"train_loss": -36.3099479675293, "global_step": 66215, "epoch": 547} {"train_loss": -35.5808219909668, "global_step": 66216, "epoch": 547} {"train_loss": -35.72970199584961, "global_step": 66217, "epoch": 547} {"train_loss": -35.483699798583984, "global_step": 66218, "epoch": 547} {"train_loss": -36.16718673706055, "global_step": 66219, "epoch": 547} {"train_loss": -34.926971435546875, "global_step": 66220, "epoch": 547} {"train_loss": -36.49803161621094, "global_step": 66221, "epoch": 547} {"train_loss": -36.21980285644531, "global_step": 66222, "epoch": 547} {"train_loss": -35.13509750366211, "global_step": 66223, "epoch": 547} {"train_loss": -36.00620651245117, "global_step": 66224, "epoch": 547} {"train_loss": -36.01968002319336, "global_step": 66225, "epoch": 547} {"train_loss": -34.47599792480469, "global_step": 66226, "epoch": 547} {"train_loss": -35.9141960144043, "global_step": 66227, "epoch": 547} {"train_loss": -36.02408218383789, "global_step": 66228, "epoch": 547} {"train_loss": -35.22200012207031, "global_step": 66229, "epoch": 547} {"train_loss": -35.49150466918945, "global_step": 66230, "epoch": 547} {"train_loss": -33.66145324707031, "global_step": 66231, "epoch": 547} {"train_loss": -34.86647415161133, "global_step": 66232, "epoch": 547} {"train_loss": -35.29050827026367, "global_step": 66233, "epoch": 547} {"train_loss": -34.26447677612305, "global_step": 66234, "epoch": 547} {"train_loss": -32.448326110839844, "global_step": 66235, "epoch": 547} {"train_loss": -35.473445892333984, "global_step": 66236, "epoch": 547} {"train_loss": -35.79063034057617, "global_step": 66237, "epoch": 547} {"train_loss": -34.10578918457031, "global_step": 66238, "epoch": 547} {"train_loss": -34.206298828125, "global_step": 66239, "epoch": 547} {"train_loss": -34.048439025878906, "global_step": 66240, "epoch": 547} {"train_loss": -31.301679611206055, "global_step": 66241, "epoch": 547} {"train_loss": -33.012245178222656, "global_step": 66242, "epoch": 547} {"train_loss": -34.68870162963867, "global_step": 66243, "epoch": 547} {"train_loss": -32.12144088745117, "global_step": 66244, "epoch": 547} {"train_loss": -31.26604652404785, "global_step": 66245, "epoch": 547} {"train_loss": -30.03140640258789, "global_step": 66246, "epoch": 547} {"train_loss": -33.912445068359375, "global_step": 66247, "epoch": 547} {"train_loss": -31.505462646484375, "global_step": 66248, "epoch": 547} {"train_loss": -32.12430191040039, "global_step": 66249, "epoch": 547} {"train_loss": -32.430397033691406, "global_step": 66250, "epoch": 547} {"train_loss": -32.67899703979492, "global_step": 66251, "epoch": 547} {"train_loss": -34.409725189208984, "global_step": 66252, "epoch": 547} {"train_loss": -30.99785804748535, "global_step": 66253, "epoch": 547} {"train_loss": -32.44221115112305, "global_step": 66254, "epoch": 547} {"train_loss": -30.427581787109375, "global_step": 66255, "epoch": 547} {"train_loss": -32.58461380004883, "global_step": 66256, "epoch": 547} {"train_loss": -33.31568145751953, "global_step": 66257, "epoch": 547} {"train_loss": -32.21503448486328, "global_step": 66258, "epoch": 547} {"train_loss": -32.78843688964844, "global_step": 66259, "epoch": 547} {"train_loss": -33.0078010559082, "global_step": 66260, "epoch": 547} {"train_loss": -32.95774459838867, "global_step": 66261, "epoch": 547} {"train_loss": -33.07710647583008, "global_step": 66262, "epoch": 547} {"train_loss": -34.508148193359375, "global_step": 66263, "epoch": 547} {"train_loss": -34.19341278076172, "global_step": 66264, "epoch": 547} {"train_loss": -33.2199821472168, "global_step": 66265, "epoch": 547} {"train_loss": -35.1879768371582, "global_step": 66266, "epoch": 547} {"train_loss": -34.037750244140625, "global_step": 66267, "epoch": 547} {"train_loss": -34.542335510253906, "global_step": 66268, "epoch": 547} {"train_loss": -33.696590423583984, "global_step": 66269, "epoch": 547} {"train_loss": -34.79513168334961, "global_step": 66270, "epoch": 547} {"train_loss": -34.288482666015625, "global_step": 66271, "epoch": 547} {"train_loss": -34.910884857177734, "global_step": 66272, "epoch": 547} {"train_loss": -34.29301834106445, "global_step": 66273, "epoch": 547} {"train_loss": -33.826412200927734, "global_step": 66274, "epoch": 547} {"train_loss": -35.31992721557617, "global_step": 66275, "epoch": 547} {"train_loss": -34.852378845214844, "global_step": 66276, "epoch": 547} {"train_loss": -34.3807373046875, "global_step": 66277, "epoch": 547} {"train_loss": -34.784420013427734, "global_step": 66278, "epoch": 547} {"train_loss": -34.40684127807617, "global_step": 66279, "epoch": 547} {"train_loss": -35.102962493896484, "global_step": 66280, "epoch": 547} {"train_loss": -34.915443420410156, "global_step": 66281, "epoch": 547} {"train_loss": -34.233924865722656, "global_step": 66282, "epoch": 547} {"train_loss": -35.530487060546875, "global_step": 66283, "epoch": 547} {"train_loss": -34.46049499511719, "global_step": 66284, "epoch": 547} {"train_loss": -35.386138916015625, "global_step": 66285, "epoch": 547} {"train_loss": -35.18482971191406, "global_step": 66286, "epoch": 547} {"train_loss": -35.1270637512207, "global_step": 66287, "epoch": 547} {"train_loss": -35.29971694946289, "global_step": 66288, "epoch": 547} {"train_loss": -35.7518196105957, "global_step": 66289, "epoch": 547} {"train_loss": -35.61720657348633, "global_step": 66290, "epoch": 547} {"train_loss": -35.30464553833008, "global_step": 66291, "epoch": 547} {"train_loss": -34.33462142944336, "global_step": 66292, "epoch": 547} {"train_loss": -35.29597473144531, "global_step": 66293, "epoch": 547} {"train_loss": -35.65298080444336, "global_step": 66294, "epoch": 547} {"train_loss": -35.85249710083008, "global_step": 66295, "epoch": 547} {"train_loss": -35.03990173339844, "global_step": 66296, "epoch": 547} {"train_loss": -35.83331298828125, "global_step": 66297, "epoch": 547} {"train_loss": -36.012596130371094, "global_step": 66298, "epoch": 547} {"train_loss": -35.54384994506836, "global_step": 66299, "epoch": 547} {"train_loss": -36.245906829833984, "global_step": 66300, "epoch": 547} {"train_loss": -36.190093994140625, "global_step": 66301, "epoch": 547} {"train_loss": -36.10341262817383, "global_step": 66302, "epoch": 547} {"train_loss": -35.14148712158203, "global_step": 66303, "epoch": 547} {"train_loss": -36.0721549987793, "global_step": 66304, "epoch": 547} {"train_loss": -36.16253662109375, "global_step": 66305, "epoch": 547} {"train_loss": -36.69210433959961, "global_step": 66306, "epoch": 547} {"train_loss": -34.658623324938056, "global_step": 66307, "epoch": 547, "val_loss": 2470948.25} {"train_loss": -35.4465217590332, "global_step": 66308, "epoch": 548} {"train_loss": -35.96369934082031, "global_step": 66309, "epoch": 548} {"train_loss": -36.11928176879883, "global_step": 66310, "epoch": 548} {"train_loss": -36.85304641723633, "global_step": 66311, "epoch": 548} {"train_loss": -36.57760238647461, "global_step": 66312, "epoch": 548} {"train_loss": -36.65021896362305, "global_step": 66313, "epoch": 548} {"train_loss": -36.468345642089844, "global_step": 66314, "epoch": 548} {"train_loss": -36.73728561401367, "global_step": 66315, "epoch": 548} {"train_loss": -36.80881881713867, "global_step": 66316, "epoch": 548} {"train_loss": -36.618316650390625, "global_step": 66317, "epoch": 548} {"train_loss": -36.553863525390625, "global_step": 66318, "epoch": 548} {"train_loss": -35.77071762084961, "global_step": 66319, "epoch": 548} {"train_loss": -36.71528625488281, "global_step": 66320, "epoch": 548} {"train_loss": -36.64478302001953, "global_step": 66321, "epoch": 548} {"train_loss": -36.49908447265625, "global_step": 66322, "epoch": 548} {"train_loss": -34.49820327758789, "global_step": 66323, "epoch": 548} {"train_loss": -34.369869232177734, "global_step": 66324, "epoch": 548} {"train_loss": -36.765869140625, "global_step": 66325, "epoch": 548} {"train_loss": -35.578575134277344, "global_step": 66326, "epoch": 548} {"train_loss": -34.9299201965332, "global_step": 66327, "epoch": 548} {"train_loss": -36.00747299194336, "global_step": 66328, "epoch": 548} {"train_loss": -35.7331657409668, "global_step": 66329, "epoch": 548} {"train_loss": -35.46733474731445, "global_step": 66330, "epoch": 548} {"train_loss": -35.88912582397461, "global_step": 66331, "epoch": 548} {"train_loss": -36.88300323486328, "global_step": 66332, "epoch": 548} {"train_loss": -35.44142532348633, "global_step": 66333, "epoch": 548} {"train_loss": -34.807491302490234, "global_step": 66334, "epoch": 548} {"train_loss": -33.31534957885742, "global_step": 66335, "epoch": 548} {"train_loss": -35.64506912231445, "global_step": 66336, "epoch": 548} {"train_loss": -36.239356994628906, "global_step": 66337, "epoch": 548} {"train_loss": -36.585052490234375, "global_step": 66338, "epoch": 548} {"train_loss": -34.651241302490234, "global_step": 66339, "epoch": 548} {"train_loss": -34.59348678588867, "global_step": 66340, "epoch": 548} {"train_loss": -34.716224670410156, "global_step": 66341, "epoch": 548} {"train_loss": -35.441524505615234, "global_step": 66342, "epoch": 548} {"train_loss": -36.0455322265625, "global_step": 66343, "epoch": 548} {"train_loss": -34.69880294799805, "global_step": 66344, "epoch": 548} {"train_loss": -31.8336238861084, "global_step": 66345, "epoch": 548} {"train_loss": -29.539365768432617, "global_step": 66346, "epoch": 548} {"train_loss": -33.84431457519531, "global_step": 66347, "epoch": 548} {"train_loss": -36.62641525268555, "global_step": 66348, "epoch": 548} {"train_loss": -33.65578842163086, "global_step": 66349, "epoch": 548} {"train_loss": -35.632789611816406, "global_step": 66350, "epoch": 548} {"train_loss": -35.140254974365234, "global_step": 66351, "epoch": 548} {"train_loss": -31.7823543548584, "global_step": 66352, "epoch": 548} {"train_loss": -35.360321044921875, "global_step": 66353, "epoch": 548} {"train_loss": -33.4034309387207, "global_step": 66354, "epoch": 548} {"train_loss": -35.105690002441406, "global_step": 66355, "epoch": 548} {"train_loss": -32.61021423339844, "global_step": 66356, "epoch": 548} {"train_loss": -34.352149963378906, "global_step": 66357, "epoch": 548} {"train_loss": -35.82291030883789, "global_step": 66358, "epoch": 548} {"train_loss": -34.763023376464844, "global_step": 66359, "epoch": 548} {"train_loss": -35.55016326904297, "global_step": 66360, "epoch": 548} {"train_loss": -34.77294921875, "global_step": 66361, "epoch": 548} {"train_loss": -33.53562545776367, "global_step": 66362, "epoch": 548} {"train_loss": -35.05705642700195, "global_step": 66363, "epoch": 548} {"train_loss": -33.860103607177734, "global_step": 66364, "epoch": 548} {"train_loss": -35.349998474121094, "global_step": 66365, "epoch": 548} {"train_loss": -36.043739318847656, "global_step": 66366, "epoch": 548} {"train_loss": -35.36007308959961, "global_step": 66367, "epoch": 548} {"train_loss": -34.718807220458984, "global_step": 66368, "epoch": 548} {"train_loss": -35.940185546875, "global_step": 66369, "epoch": 548} {"train_loss": -35.88026428222656, "global_step": 66370, "epoch": 548} {"train_loss": -35.020751953125, "global_step": 66371, "epoch": 548} {"train_loss": -36.05927658081055, "global_step": 66372, "epoch": 548} {"train_loss": -36.63507843017578, "global_step": 66373, "epoch": 548} {"train_loss": -33.6624755859375, "global_step": 66374, "epoch": 548} {"train_loss": -36.44801330566406, "global_step": 66375, "epoch": 548} {"train_loss": -36.57789993286133, "global_step": 66376, "epoch": 548} {"train_loss": -36.569602966308594, "global_step": 66377, "epoch": 548} {"train_loss": -36.28963851928711, "global_step": 66378, "epoch": 548} {"train_loss": -35.93650436401367, "global_step": 66379, "epoch": 548} {"train_loss": -36.03849411010742, "global_step": 66380, "epoch": 548} {"train_loss": -36.24949264526367, "global_step": 66381, "epoch": 548} {"train_loss": -36.33793258666992, "global_step": 66382, "epoch": 548} {"train_loss": -24.484622955322266, "global_step": 66383, "epoch": 548} {"train_loss": -35.7538948059082, "global_step": 66384, "epoch": 548} {"train_loss": -33.69757080078125, "global_step": 66385, "epoch": 548} {"train_loss": -33.94099426269531, "global_step": 66386, "epoch": 548} {"train_loss": -33.764583587646484, "global_step": 66387, "epoch": 548} {"train_loss": -34.83213424682617, "global_step": 66388, "epoch": 548} {"train_loss": -34.06326675415039, "global_step": 66389, "epoch": 548} {"train_loss": -33.8546142578125, "global_step": 66390, "epoch": 548} {"train_loss": -35.42672348022461, "global_step": 66391, "epoch": 548} {"train_loss": -34.50550079345703, "global_step": 66392, "epoch": 548} {"train_loss": -35.20832061767578, "global_step": 66393, "epoch": 548} {"train_loss": -34.63908004760742, "global_step": 66394, "epoch": 548} {"train_loss": -35.092987060546875, "global_step": 66395, "epoch": 548} {"train_loss": -33.93036651611328, "global_step": 66396, "epoch": 548} {"train_loss": -34.252296447753906, "global_step": 66397, "epoch": 548} {"train_loss": -35.013824462890625, "global_step": 66398, "epoch": 548} {"train_loss": -34.34413528442383, "global_step": 66399, "epoch": 548} {"train_loss": -34.95853805541992, "global_step": 66400, "epoch": 548} {"train_loss": -34.020320892333984, "global_step": 66401, "epoch": 548} {"train_loss": -34.54193878173828, "global_step": 66402, "epoch": 548} {"train_loss": -35.85700225830078, "global_step": 66403, "epoch": 548} {"train_loss": -34.49007034301758, "global_step": 66404, "epoch": 548} {"train_loss": -35.526493072509766, "global_step": 66405, "epoch": 548} {"train_loss": -34.339508056640625, "global_step": 66406, "epoch": 548} {"train_loss": -34.092376708984375, "global_step": 66407, "epoch": 548} {"train_loss": -31.108692169189453, "global_step": 66408, "epoch": 548} {"train_loss": -34.94603729248047, "global_step": 66409, "epoch": 548} {"train_loss": -35.13984680175781, "global_step": 66410, "epoch": 548} {"train_loss": -34.54829025268555, "global_step": 66411, "epoch": 548} {"train_loss": -33.44947052001953, "global_step": 66412, "epoch": 548} {"train_loss": -35.58488845825195, "global_step": 66413, "epoch": 548} {"train_loss": -34.658363342285156, "global_step": 66414, "epoch": 548} {"train_loss": -34.39457321166992, "global_step": 66415, "epoch": 548} {"train_loss": -34.954097747802734, "global_step": 66416, "epoch": 548} {"train_loss": -35.236793518066406, "global_step": 66417, "epoch": 548} {"train_loss": -35.14811325073242, "global_step": 66418, "epoch": 548} {"train_loss": -35.318389892578125, "global_step": 66419, "epoch": 548} {"train_loss": -35.057247161865234, "global_step": 66420, "epoch": 548} {"train_loss": -35.47924041748047, "global_step": 66421, "epoch": 548} {"train_loss": -34.02421188354492, "global_step": 66422, "epoch": 548} {"train_loss": -34.91132736206055, "global_step": 66423, "epoch": 548} {"train_loss": -35.335662841796875, "global_step": 66424, "epoch": 548} {"train_loss": -35.57307052612305, "global_step": 66425, "epoch": 548} {"train_loss": -35.53676986694336, "global_step": 66426, "epoch": 548} {"train_loss": -35.658729553222656, "global_step": 66427, "epoch": 548} {"train_loss": -35.02843748045362, "global_step": 66428, "epoch": 548, "val_loss": 2561876.75} {"train_loss": -35.53078079223633, "global_step": 66429, "epoch": 549} {"train_loss": -36.21706771850586, "global_step": 66430, "epoch": 549} {"train_loss": -35.64478302001953, "global_step": 66431, "epoch": 549} {"train_loss": -35.727535247802734, "global_step": 66432, "epoch": 549} {"train_loss": -35.78120040893555, "global_step": 66433, "epoch": 549} {"train_loss": -35.86298751831055, "global_step": 66434, "epoch": 549} {"train_loss": -36.449195861816406, "global_step": 66435, "epoch": 549} {"train_loss": -35.64497756958008, "global_step": 66436, "epoch": 549} {"train_loss": -36.138954162597656, "global_step": 66437, "epoch": 549} {"train_loss": -36.13010787963867, "global_step": 66438, "epoch": 549} {"train_loss": -35.28995132446289, "global_step": 66439, "epoch": 549} {"train_loss": -36.15719223022461, "global_step": 66440, "epoch": 549} {"train_loss": -36.06353759765625, "global_step": 66441, "epoch": 549} {"train_loss": -36.36860275268555, "global_step": 66442, "epoch": 549} {"train_loss": -36.436561584472656, "global_step": 66443, "epoch": 549} {"train_loss": -36.24068069458008, "global_step": 66444, "epoch": 549} {"train_loss": -36.32375717163086, "global_step": 66445, "epoch": 549} {"train_loss": -36.775665283203125, "global_step": 66446, "epoch": 549} {"train_loss": -36.340667724609375, "global_step": 66447, "epoch": 549} {"train_loss": -36.360137939453125, "global_step": 66448, "epoch": 549} {"train_loss": -36.22722625732422, "global_step": 66449, "epoch": 549} {"train_loss": -36.21076202392578, "global_step": 66450, "epoch": 549} {"train_loss": -36.500911712646484, "global_step": 66451, "epoch": 549} {"train_loss": -36.18657302856445, "global_step": 66452, "epoch": 549} {"train_loss": -36.3268928527832, "global_step": 66453, "epoch": 549} {"train_loss": -36.90199279785156, "global_step": 66454, "epoch": 549} {"train_loss": -36.170780181884766, "global_step": 66455, "epoch": 549} {"train_loss": -36.17594528198242, "global_step": 66456, "epoch": 549} {"train_loss": -36.798954010009766, "global_step": 66457, "epoch": 549} {"train_loss": -35.58442306518555, "global_step": 66458, "epoch": 549} {"train_loss": -36.6937370300293, "global_step": 66459, "epoch": 549} {"train_loss": -36.26752853393555, "global_step": 66460, "epoch": 549} {"train_loss": -36.89620590209961, "global_step": 66461, "epoch": 549} {"train_loss": -35.208595275878906, "global_step": 66462, "epoch": 549} {"train_loss": -33.39496994018555, "global_step": 66463, "epoch": 549} {"train_loss": -30.176502227783203, "global_step": 66464, "epoch": 549} {"train_loss": -26.621994018554688, "global_step": 66465, "epoch": 549} {"train_loss": -24.368940353393555, "global_step": 66466, "epoch": 549} {"train_loss": -32.63955307006836, "global_step": 66467, "epoch": 549} {"train_loss": -36.3658447265625, "global_step": 66468, "epoch": 549} {"train_loss": -31.124897003173828, "global_step": 66469, "epoch": 549} {"train_loss": -32.74436569213867, "global_step": 66470, "epoch": 549} {"train_loss": -35.95321273803711, "global_step": 66471, "epoch": 549} {"train_loss": -34.0485725402832, "global_step": 66472, "epoch": 549} {"train_loss": -33.891998291015625, "global_step": 66473, "epoch": 549} {"train_loss": -34.21136474609375, "global_step": 66474, "epoch": 549} {"train_loss": -32.94630432128906, "global_step": 66475, "epoch": 549} {"train_loss": -31.230640411376953, "global_step": 66476, "epoch": 549} {"train_loss": -34.57933044433594, "global_step": 66477, "epoch": 549} {"train_loss": -34.61037826538086, "global_step": 66478, "epoch": 549} {"train_loss": -32.61005783081055, "global_step": 66479, "epoch": 549} {"train_loss": -34.240936279296875, "global_step": 66480, "epoch": 549} {"train_loss": -32.81947708129883, "global_step": 66481, "epoch": 549} {"train_loss": -34.2474365234375, "global_step": 66482, "epoch": 549} {"train_loss": -34.7140998840332, "global_step": 66483, "epoch": 549} {"train_loss": -33.000484466552734, "global_step": 66484, "epoch": 549} {"train_loss": -33.74597930908203, "global_step": 66485, "epoch": 549} {"train_loss": -33.96364974975586, "global_step": 66486, "epoch": 549} {"train_loss": -33.53019332885742, "global_step": 66487, "epoch": 549} {"train_loss": -34.0853271484375, "global_step": 66488, "epoch": 549} {"train_loss": -34.95046615600586, "global_step": 66489, "epoch": 549} {"train_loss": -33.6959342956543, "global_step": 66490, "epoch": 549} {"train_loss": -35.255672454833984, "global_step": 66491, "epoch": 549} {"train_loss": -35.74345016479492, "global_step": 66492, "epoch": 549} {"train_loss": -33.56650924682617, "global_step": 66493, "epoch": 549} {"train_loss": -36.13668441772461, "global_step": 66494, "epoch": 549} {"train_loss": -35.33787155151367, "global_step": 66495, "epoch": 549} {"train_loss": -34.02317428588867, "global_step": 66496, "epoch": 549} {"train_loss": -35.46990966796875, "global_step": 66497, "epoch": 549} {"train_loss": -36.02555465698242, "global_step": 66498, "epoch": 549} {"train_loss": -36.16713333129883, "global_step": 66499, "epoch": 549} {"train_loss": -35.09132766723633, "global_step": 66500, "epoch": 549} {"train_loss": -36.018375396728516, "global_step": 66501, "epoch": 549} {"train_loss": -35.75628662109375, "global_step": 66502, "epoch": 549} {"train_loss": -36.134857177734375, "global_step": 66503, "epoch": 549} {"train_loss": -36.03107452392578, "global_step": 66504, "epoch": 549} {"train_loss": -35.84787368774414, "global_step": 66505, "epoch": 549} {"train_loss": -36.48823165893555, "global_step": 66506, "epoch": 549} {"train_loss": -36.12913131713867, "global_step": 66507, "epoch": 549} {"train_loss": -35.62037658691406, "global_step": 66508, "epoch": 549} {"train_loss": -36.06827926635742, "global_step": 66509, "epoch": 549} {"train_loss": -36.87430953979492, "global_step": 66510, "epoch": 549} {"train_loss": -36.33625030517578, "global_step": 66511, "epoch": 549} {"train_loss": -36.01179122924805, "global_step": 66512, "epoch": 549} {"train_loss": -34.878841400146484, "global_step": 66513, "epoch": 549} {"train_loss": -36.590538024902344, "global_step": 66514, "epoch": 549} {"train_loss": -35.376747131347656, "global_step": 66515, "epoch": 549} {"train_loss": -36.555477142333984, "global_step": 66516, "epoch": 549} {"train_loss": -36.70198440551758, "global_step": 66517, "epoch": 549} {"train_loss": -35.64005661010742, "global_step": 66518, "epoch": 549} {"train_loss": -36.40109634399414, "global_step": 66519, "epoch": 549} {"train_loss": -36.38899612426758, "global_step": 66520, "epoch": 549} {"train_loss": -36.63728332519531, "global_step": 66521, "epoch": 549} {"train_loss": -36.4764518737793, "global_step": 66522, "epoch": 549} {"train_loss": -36.662841796875, "global_step": 66523, "epoch": 549} {"train_loss": -35.4692268371582, "global_step": 66524, "epoch": 549} {"train_loss": -36.04022216796875, "global_step": 66525, "epoch": 549} {"train_loss": -33.582332611083984, "global_step": 66526, "epoch": 549} {"train_loss": -34.660316467285156, "global_step": 66527, "epoch": 549} {"train_loss": -35.14680862426758, "global_step": 66528, "epoch": 549} {"train_loss": -36.20133972167969, "global_step": 66529, "epoch": 549} {"train_loss": -34.65882873535156, "global_step": 66530, "epoch": 549} {"train_loss": -35.299922943115234, "global_step": 66531, "epoch": 549} {"train_loss": -35.17080307006836, "global_step": 66532, "epoch": 549} {"train_loss": -35.92301559448242, "global_step": 66533, "epoch": 549} {"train_loss": -36.75505828857422, "global_step": 66534, "epoch": 549} {"train_loss": -36.235198974609375, "global_step": 66535, "epoch": 549} {"train_loss": -35.599403381347656, "global_step": 66536, "epoch": 549} {"train_loss": -34.92698287963867, "global_step": 66537, "epoch": 549} {"train_loss": -35.20463562011719, "global_step": 66538, "epoch": 549} {"train_loss": -36.340797424316406, "global_step": 66539, "epoch": 549} {"train_loss": -36.713436126708984, "global_step": 66540, "epoch": 549} {"train_loss": -36.61223602294922, "global_step": 66541, "epoch": 549} {"train_loss": -36.391353607177734, "global_step": 66542, "epoch": 549} {"train_loss": -36.67849349975586, "global_step": 66543, "epoch": 549} {"train_loss": -35.277339935302734, "global_step": 66544, "epoch": 549} {"train_loss": -36.086544036865234, "global_step": 66545, "epoch": 549} {"train_loss": -36.60367965698242, "global_step": 66546, "epoch": 549} {"train_loss": -36.65546798706055, "global_step": 66547, "epoch": 549} {"train_loss": -36.66769027709961, "global_step": 66548, "epoch": 549} {"train_loss": -35.26230225681273, "global_step": 66549, "epoch": 549, "val_loss": 2708579.75} {"train_loss": -36.34137725830078, "global_step": 66550, "epoch": 550} {"train_loss": -36.70528030395508, "global_step": 66551, "epoch": 550} {"train_loss": -36.25990295410156, "global_step": 66552, "epoch": 550} {"train_loss": -36.16530990600586, "global_step": 66553, "epoch": 550} {"train_loss": -34.541805267333984, "global_step": 66554, "epoch": 550} {"train_loss": -35.91970443725586, "global_step": 66555, "epoch": 550} {"train_loss": -36.1975212097168, "global_step": 66556, "epoch": 550} {"train_loss": -35.47196960449219, "global_step": 66557, "epoch": 550} {"train_loss": -32.36652374267578, "global_step": 66558, "epoch": 550} {"train_loss": -32.21491622924805, "global_step": 66559, "epoch": 550} {"train_loss": -36.0297737121582, "global_step": 66560, "epoch": 550} {"train_loss": -34.63410568237305, "global_step": 66561, "epoch": 550} {"train_loss": -29.52813720703125, "global_step": 66562, "epoch": 550} {"train_loss": -29.801618576049805, "global_step": 66563, "epoch": 550} {"train_loss": -36.36015701293945, "global_step": 66564, "epoch": 550} {"train_loss": -33.08933639526367, "global_step": 66565, "epoch": 550} {"train_loss": -32.18529510498047, "global_step": 66566, "epoch": 550} {"train_loss": -35.701595306396484, "global_step": 66567, "epoch": 550} {"train_loss": -32.98655319213867, "global_step": 66568, "epoch": 550} {"train_loss": -35.75651550292969, "global_step": 66569, "epoch": 550} {"train_loss": -32.13182067871094, "global_step": 66570, "epoch": 550} {"train_loss": -34.92799377441406, "global_step": 66571, "epoch": 550} {"train_loss": -34.88874816894531, "global_step": 66572, "epoch": 550} {"train_loss": -35.5085334777832, "global_step": 66573, "epoch": 550} {"train_loss": -29.52495765686035, "global_step": 66574, "epoch": 550} {"train_loss": -35.1985969543457, "global_step": 66575, "epoch": 550} {"train_loss": -34.898921966552734, "global_step": 66576, "epoch": 550} {"train_loss": -33.42084503173828, "global_step": 66577, "epoch": 550} {"train_loss": -30.595571517944336, "global_step": 66578, "epoch": 550} {"train_loss": -32.846893310546875, "global_step": 66579, "epoch": 550} {"train_loss": -32.13790512084961, "global_step": 66580, "epoch": 550} {"train_loss": -33.972900390625, "global_step": 66581, "epoch": 550} {"train_loss": -29.413074493408203, "global_step": 66582, "epoch": 550} {"train_loss": -34.378780364990234, "global_step": 66583, "epoch": 550} {"train_loss": -33.2818603515625, "global_step": 66584, "epoch": 550} {"train_loss": -33.472713470458984, "global_step": 66585, "epoch": 550} {"train_loss": -31.119632720947266, "global_step": 66586, "epoch": 550} {"train_loss": -33.96571731567383, "global_step": 66587, "epoch": 550} {"train_loss": -33.54276657104492, "global_step": 66588, "epoch": 550} {"train_loss": -34.94505310058594, "global_step": 66589, "epoch": 550} {"train_loss": -34.7349967956543, "global_step": 66590, "epoch": 550} {"train_loss": -34.49414825439453, "global_step": 66591, "epoch": 550} {"train_loss": -34.41358184814453, "global_step": 66592, "epoch": 550} {"train_loss": -34.989776611328125, "global_step": 66593, "epoch": 550} {"train_loss": -34.761558532714844, "global_step": 66594, "epoch": 550} {"train_loss": -34.42802047729492, "global_step": 66595, "epoch": 550} {"train_loss": -34.54840850830078, "global_step": 66596, "epoch": 550} {"train_loss": -35.237037658691406, "global_step": 66597, "epoch": 550} {"train_loss": -34.69512939453125, "global_step": 66598, "epoch": 550} {"train_loss": -31.474811553955078, "global_step": 66599, "epoch": 550} {"train_loss": -35.01456069946289, "global_step": 66600, "epoch": 550} {"train_loss": -34.540931701660156, "global_step": 66601, "epoch": 550} {"train_loss": -34.0091438293457, "global_step": 66602, "epoch": 550} {"train_loss": -32.721893310546875, "global_step": 66603, "epoch": 550} {"train_loss": -33.939178466796875, "global_step": 66604, "epoch": 550} {"train_loss": -35.097496032714844, "global_step": 66605, "epoch": 550} {"train_loss": -33.05093002319336, "global_step": 66606, "epoch": 550} {"train_loss": -35.5174560546875, "global_step": 66607, "epoch": 550} {"train_loss": -35.446834564208984, "global_step": 66608, "epoch": 550} {"train_loss": -35.399261474609375, "global_step": 66609, "epoch": 550} {"train_loss": -35.08266830444336, "global_step": 66610, "epoch": 550} {"train_loss": -35.18408203125, "global_step": 66611, "epoch": 550} {"train_loss": -35.146636962890625, "global_step": 66612, "epoch": 550} {"train_loss": -35.65597152709961, "global_step": 66613, "epoch": 550} {"train_loss": -35.778926849365234, "global_step": 66614, "epoch": 550} {"train_loss": -35.828731536865234, "global_step": 66615, "epoch": 550} {"train_loss": -34.92880630493164, "global_step": 66616, "epoch": 550} {"train_loss": -35.51594161987305, "global_step": 66617, "epoch": 550} {"train_loss": -35.67372131347656, "global_step": 66618, "epoch": 550} {"train_loss": -35.491302490234375, "global_step": 66619, "epoch": 550} {"train_loss": -35.38370895385742, "global_step": 66620, "epoch": 550} {"train_loss": -35.799983978271484, "global_step": 66621, "epoch": 550} {"train_loss": -35.91546630859375, "global_step": 66622, "epoch": 550} {"train_loss": -35.537078857421875, "global_step": 66623, "epoch": 550} {"train_loss": -36.18416213989258, "global_step": 66624, "epoch": 550} {"train_loss": -35.0068359375, "global_step": 66625, "epoch": 550} {"train_loss": -35.35186767578125, "global_step": 66626, "epoch": 550} {"train_loss": -35.22672653198242, "global_step": 66627, "epoch": 550} {"train_loss": -34.45484924316406, "global_step": 66628, "epoch": 550} {"train_loss": -36.086219787597656, "global_step": 66629, "epoch": 550} {"train_loss": -35.65574264526367, "global_step": 66630, "epoch": 550} {"train_loss": -35.89974594116211, "global_step": 66631, "epoch": 550} {"train_loss": -36.02378463745117, "global_step": 66632, "epoch": 550} {"train_loss": -36.09013366699219, "global_step": 66633, "epoch": 550} {"train_loss": -36.22517776489258, "global_step": 66634, "epoch": 550} {"train_loss": -35.15633773803711, "global_step": 66635, "epoch": 550} {"train_loss": -36.0943489074707, "global_step": 66636, "epoch": 550} {"train_loss": -36.33590316772461, "global_step": 66637, "epoch": 550} {"train_loss": -35.48348617553711, "global_step": 66638, "epoch": 550} {"train_loss": -35.830101013183594, "global_step": 66639, "epoch": 550} {"train_loss": -35.781978607177734, "global_step": 66640, "epoch": 550} {"train_loss": -35.41889953613281, "global_step": 66641, "epoch": 550} {"train_loss": -35.55141830444336, "global_step": 66642, "epoch": 550} {"train_loss": -35.622650146484375, "global_step": 66643, "epoch": 550} {"train_loss": -36.03276824951172, "global_step": 66644, "epoch": 550} {"train_loss": -36.145320892333984, "global_step": 66645, "epoch": 550} {"train_loss": -34.9694938659668, "global_step": 66646, "epoch": 550} {"train_loss": -34.87862014770508, "global_step": 66647, "epoch": 550} {"train_loss": -35.10614013671875, "global_step": 66648, "epoch": 550} {"train_loss": -35.9556999206543, "global_step": 66649, "epoch": 550} {"train_loss": -36.15583419799805, "global_step": 66650, "epoch": 550} {"train_loss": -36.535335540771484, "global_step": 66651, "epoch": 550} {"train_loss": -35.00505828857422, "global_step": 66652, "epoch": 550} {"train_loss": -34.94416427612305, "global_step": 66653, "epoch": 550} {"train_loss": -35.069732666015625, "global_step": 66654, "epoch": 550} {"train_loss": -36.00120162963867, "global_step": 66655, "epoch": 550} {"train_loss": -36.63050079345703, "global_step": 66656, "epoch": 550} {"train_loss": -35.4318962097168, "global_step": 66657, "epoch": 550} {"train_loss": -35.18510437011719, "global_step": 66658, "epoch": 550} {"train_loss": -35.6438102722168, "global_step": 66659, "epoch": 550} {"train_loss": -36.607540130615234, "global_step": 66660, "epoch": 550} {"train_loss": -36.27725601196289, "global_step": 66661, "epoch": 550} {"train_loss": -36.10505294799805, "global_step": 66662, "epoch": 550} {"train_loss": -35.913421630859375, "global_step": 66663, "epoch": 550} {"train_loss": -35.7423210144043, "global_step": 66664, "epoch": 550} {"train_loss": -36.02531814575195, "global_step": 66665, "epoch": 550} {"train_loss": -35.62675094604492, "global_step": 66666, "epoch": 550} {"train_loss": -35.352386474609375, "global_step": 66667, "epoch": 550} {"train_loss": -35.86912155151367, "global_step": 66668, "epoch": 550} {"train_loss": -35.007537841796875, "global_step": 66669, "epoch": 550} {"train_loss": -34.836499726476745, "global_step": 66670, "epoch": 550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2613153.25} {"train_loss": -35.12751007080078, "global_step": 66671, "epoch": 551} {"train_loss": -36.24479293823242, "global_step": 66672, "epoch": 551} {"train_loss": -35.302791595458984, "global_step": 66673, "epoch": 551} {"train_loss": -35.870052337646484, "global_step": 66674, "epoch": 551} {"train_loss": -35.32621383666992, "global_step": 66675, "epoch": 551} {"train_loss": -34.57119369506836, "global_step": 66676, "epoch": 551} {"train_loss": -36.14582443237305, "global_step": 66677, "epoch": 551} {"train_loss": -35.73826599121094, "global_step": 66678, "epoch": 551} {"train_loss": -35.482688903808594, "global_step": 66679, "epoch": 551} {"train_loss": -36.2280387878418, "global_step": 66680, "epoch": 551} {"train_loss": -36.13503646850586, "global_step": 66681, "epoch": 551} {"train_loss": -35.34339141845703, "global_step": 66682, "epoch": 551} {"train_loss": -35.361671447753906, "global_step": 66683, "epoch": 551} {"train_loss": -35.9871711730957, "global_step": 66684, "epoch": 551} {"train_loss": -35.82452392578125, "global_step": 66685, "epoch": 551} {"train_loss": -34.97271728515625, "global_step": 66686, "epoch": 551} {"train_loss": -36.03596115112305, "global_step": 66687, "epoch": 551} {"train_loss": -36.576351165771484, "global_step": 66688, "epoch": 551} {"train_loss": -36.089046478271484, "global_step": 66689, "epoch": 551} {"train_loss": -36.5355339050293, "global_step": 66690, "epoch": 551} {"train_loss": -35.966651916503906, "global_step": 66691, "epoch": 551} {"train_loss": -36.57301712036133, "global_step": 66692, "epoch": 551} {"train_loss": -36.03400421142578, "global_step": 66693, "epoch": 551} {"train_loss": -36.243621826171875, "global_step": 66694, "epoch": 551} {"train_loss": -33.813228607177734, "global_step": 66695, "epoch": 551} {"train_loss": -35.858638763427734, "global_step": 66696, "epoch": 551} {"train_loss": -36.23208236694336, "global_step": 66697, "epoch": 551} {"train_loss": -36.526649475097656, "global_step": 66698, "epoch": 551} {"train_loss": -36.57685470581055, "global_step": 66699, "epoch": 551} {"train_loss": -36.169166564941406, "global_step": 66700, "epoch": 551} {"train_loss": -36.27626419067383, "global_step": 66701, "epoch": 551} {"train_loss": -36.5631217956543, "global_step": 66702, "epoch": 551} {"train_loss": -35.850528717041016, "global_step": 66703, "epoch": 551} {"train_loss": -35.59383773803711, "global_step": 66704, "epoch": 551} {"train_loss": -36.3343505859375, "global_step": 66705, "epoch": 551} {"train_loss": -35.8377685546875, "global_step": 66706, "epoch": 551} {"train_loss": -36.39289474487305, "global_step": 66707, "epoch": 551} {"train_loss": -35.368492126464844, "global_step": 66708, "epoch": 551} {"train_loss": -29.156024932861328, "global_step": 66709, "epoch": 551} {"train_loss": -22.867719650268555, "global_step": 66710, "epoch": 551} {"train_loss": -6.922094821929932, "global_step": 66711, "epoch": 551} {"train_loss": -15.542132377624512, "global_step": 66712, "epoch": 551} {"train_loss": -33.312435150146484, "global_step": 66713, "epoch": 551} {"train_loss": -28.05423355102539, "global_step": 66714, "epoch": 551} {"train_loss": -29.5926570892334, "global_step": 66715, "epoch": 551} {"train_loss": -31.340377807617188, "global_step": 66716, "epoch": 551} {"train_loss": -33.86237335205078, "global_step": 66717, "epoch": 551} {"train_loss": -30.638446807861328, "global_step": 66718, "epoch": 551} {"train_loss": -35.323177337646484, "global_step": 66719, "epoch": 551} {"train_loss": -31.026926040649414, "global_step": 66720, "epoch": 551} {"train_loss": -32.50175857543945, "global_step": 66721, "epoch": 551} {"train_loss": -33.58645248413086, "global_step": 66722, "epoch": 551} {"train_loss": -32.481971740722656, "global_step": 66723, "epoch": 551} {"train_loss": -33.44363021850586, "global_step": 66724, "epoch": 551} {"train_loss": -34.279300689697266, "global_step": 66725, "epoch": 551} {"train_loss": -33.87443923950195, "global_step": 66726, "epoch": 551} {"train_loss": -33.59642791748047, "global_step": 66727, "epoch": 551} {"train_loss": -35.166282653808594, "global_step": 66728, "epoch": 551} {"train_loss": -34.786739349365234, "global_step": 66729, "epoch": 551} {"train_loss": -32.52702713012695, "global_step": 66730, "epoch": 551} {"train_loss": -34.90389633178711, "global_step": 66731, "epoch": 551} {"train_loss": -35.248382568359375, "global_step": 66732, "epoch": 551} {"train_loss": -35.08628845214844, "global_step": 66733, "epoch": 551} {"train_loss": -35.121700286865234, "global_step": 66734, "epoch": 551} {"train_loss": -35.39817810058594, "global_step": 66735, "epoch": 551} {"train_loss": -35.54093551635742, "global_step": 66736, "epoch": 551} {"train_loss": -35.23440170288086, "global_step": 66737, "epoch": 551} {"train_loss": -35.247989654541016, "global_step": 66738, "epoch": 551} {"train_loss": -35.3853645324707, "global_step": 66739, "epoch": 551} {"train_loss": -35.4041862487793, "global_step": 66740, "epoch": 551} {"train_loss": -35.84716796875, "global_step": 66741, "epoch": 551} {"train_loss": -35.24102020263672, "global_step": 66742, "epoch": 551} {"train_loss": -35.69306564331055, "global_step": 66743, "epoch": 551} {"train_loss": -35.572723388671875, "global_step": 66744, "epoch": 551} {"train_loss": -35.623809814453125, "global_step": 66745, "epoch": 551} {"train_loss": -35.95624923706055, "global_step": 66746, "epoch": 551} {"train_loss": -35.96812057495117, "global_step": 66747, "epoch": 551} {"train_loss": -35.78310775756836, "global_step": 66748, "epoch": 551} {"train_loss": -36.221248626708984, "global_step": 66749, "epoch": 551} {"train_loss": -36.19950485229492, "global_step": 66750, "epoch": 551} {"train_loss": -36.40707015991211, "global_step": 66751, "epoch": 551} {"train_loss": -31.709508895874023, "global_step": 66752, "epoch": 551} {"train_loss": -35.47502517700195, "global_step": 66753, "epoch": 551} {"train_loss": -35.91260528564453, "global_step": 66754, "epoch": 551} {"train_loss": -32.01375961303711, "global_step": 66755, "epoch": 551} {"train_loss": -36.1148796081543, "global_step": 66756, "epoch": 551} {"train_loss": -35.169429779052734, "global_step": 66757, "epoch": 551} {"train_loss": -33.62465286254883, "global_step": 66758, "epoch": 551} {"train_loss": -34.22136306762695, "global_step": 66759, "epoch": 551} {"train_loss": -35.79345703125, "global_step": 66760, "epoch": 551} {"train_loss": -34.857887268066406, "global_step": 66761, "epoch": 551} {"train_loss": -35.33287048339844, "global_step": 66762, "epoch": 551} {"train_loss": -33.88808059692383, "global_step": 66763, "epoch": 551} {"train_loss": -28.29461669921875, "global_step": 66764, "epoch": 551} {"train_loss": -31.993671417236328, "global_step": 66765, "epoch": 551} {"train_loss": -33.60614013671875, "global_step": 66766, "epoch": 551} {"train_loss": -34.58649826049805, "global_step": 66767, "epoch": 551} {"train_loss": -34.850677490234375, "global_step": 66768, "epoch": 551} {"train_loss": -34.29730224609375, "global_step": 66769, "epoch": 551} {"train_loss": -33.78626251220703, "global_step": 66770, "epoch": 551} {"train_loss": -34.988677978515625, "global_step": 66771, "epoch": 551} {"train_loss": -35.23440170288086, "global_step": 66772, "epoch": 551} {"train_loss": -34.967926025390625, "global_step": 66773, "epoch": 551} {"train_loss": -35.549015045166016, "global_step": 66774, "epoch": 551} {"train_loss": -34.88918685913086, "global_step": 66775, "epoch": 551} {"train_loss": -35.831031799316406, "global_step": 66776, "epoch": 551} {"train_loss": -35.244083404541016, "global_step": 66777, "epoch": 551} {"train_loss": -35.71356964111328, "global_step": 66778, "epoch": 551} {"train_loss": -35.054542541503906, "global_step": 66779, "epoch": 551} {"train_loss": -35.96696472167969, "global_step": 66780, "epoch": 551} {"train_loss": -35.8920783996582, "global_step": 66781, "epoch": 551} {"train_loss": -36.10340118408203, "global_step": 66782, "epoch": 551} {"train_loss": -35.89191436767578, "global_step": 66783, "epoch": 551} {"train_loss": -35.6276969909668, "global_step": 66784, "epoch": 551} {"train_loss": -35.10078430175781, "global_step": 66785, "epoch": 551} {"train_loss": -35.918704986572266, "global_step": 66786, "epoch": 551} {"train_loss": -35.17533493041992, "global_step": 66787, "epoch": 551} {"train_loss": -36.27410125732422, "global_step": 66788, "epoch": 551} {"train_loss": -36.040035247802734, "global_step": 66789, "epoch": 551} {"train_loss": -36.232662200927734, "global_step": 66790, "epoch": 551} {"train_loss": -34.44345194840234, "global_step": 66791, "epoch": 551, "val_loss": 2554585.75} {"train_loss": -36.044952392578125, "global_step": 66792, "epoch": 552} {"train_loss": -35.2303466796875, "global_step": 66793, "epoch": 552} {"train_loss": -36.20405197143555, "global_step": 66794, "epoch": 552} {"train_loss": -36.38045883178711, "global_step": 66795, "epoch": 552} {"train_loss": -36.63335037231445, "global_step": 66796, "epoch": 552} {"train_loss": -36.07425308227539, "global_step": 66797, "epoch": 552} {"train_loss": -36.16658020019531, "global_step": 66798, "epoch": 552} {"train_loss": -34.97724533081055, "global_step": 66799, "epoch": 552} {"train_loss": -35.69374465942383, "global_step": 66800, "epoch": 552} {"train_loss": -35.38758087158203, "global_step": 66801, "epoch": 552} {"train_loss": -36.165958404541016, "global_step": 66802, "epoch": 552} {"train_loss": -35.62491989135742, "global_step": 66803, "epoch": 552} {"train_loss": -36.111549377441406, "global_step": 66804, "epoch": 552} {"train_loss": -36.18001174926758, "global_step": 66805, "epoch": 552} {"train_loss": -35.810176849365234, "global_step": 66806, "epoch": 552} {"train_loss": -35.424774169921875, "global_step": 66807, "epoch": 552} {"train_loss": -36.35519790649414, "global_step": 66808, "epoch": 552} {"train_loss": -34.94722366333008, "global_step": 66809, "epoch": 552} {"train_loss": -35.692440032958984, "global_step": 66810, "epoch": 552} {"train_loss": -35.17142868041992, "global_step": 66811, "epoch": 552} {"train_loss": -34.97737503051758, "global_step": 66812, "epoch": 552} {"train_loss": -35.72724151611328, "global_step": 66813, "epoch": 552} {"train_loss": -36.59285354614258, "global_step": 66814, "epoch": 552} {"train_loss": -35.6905632019043, "global_step": 66815, "epoch": 552} {"train_loss": -36.20064163208008, "global_step": 66816, "epoch": 552} {"train_loss": -35.477745056152344, "global_step": 66817, "epoch": 552} {"train_loss": -36.63180160522461, "global_step": 66818, "epoch": 552} {"train_loss": -35.93115234375, "global_step": 66819, "epoch": 552} {"train_loss": -36.705379486083984, "global_step": 66820, "epoch": 552} {"train_loss": -36.00738525390625, "global_step": 66821, "epoch": 552} {"train_loss": -35.94356918334961, "global_step": 66822, "epoch": 552} {"train_loss": -36.68946838378906, "global_step": 66823, "epoch": 552} {"train_loss": -36.70527648925781, "global_step": 66824, "epoch": 552} {"train_loss": -36.40120315551758, "global_step": 66825, "epoch": 552} {"train_loss": -36.07240676879883, "global_step": 66826, "epoch": 552} {"train_loss": -36.51681137084961, "global_step": 66827, "epoch": 552} {"train_loss": -36.5616569519043, "global_step": 66828, "epoch": 552} {"train_loss": -36.58913803100586, "global_step": 66829, "epoch": 552} {"train_loss": -37.120147705078125, "global_step": 66830, "epoch": 552} {"train_loss": -35.71639633178711, "global_step": 66831, "epoch": 552} {"train_loss": -35.837974548339844, "global_step": 66832, "epoch": 552} {"train_loss": -35.97114944458008, "global_step": 66833, "epoch": 552} {"train_loss": -35.107234954833984, "global_step": 66834, "epoch": 552} {"train_loss": -36.18845748901367, "global_step": 66835, "epoch": 552} {"train_loss": -36.70166015625, "global_step": 66836, "epoch": 552} {"train_loss": -36.38102340698242, "global_step": 66837, "epoch": 552} {"train_loss": -35.506832122802734, "global_step": 66838, "epoch": 552} {"train_loss": -35.09872055053711, "global_step": 66839, "epoch": 552} {"train_loss": -34.98691940307617, "global_step": 66840, "epoch": 552} {"train_loss": -34.94314193725586, "global_step": 66841, "epoch": 552} {"train_loss": -35.75105285644531, "global_step": 66842, "epoch": 552} {"train_loss": -36.64430236816406, "global_step": 66843, "epoch": 552} {"train_loss": -34.32073211669922, "global_step": 66844, "epoch": 552} {"train_loss": -32.51303482055664, "global_step": 66845, "epoch": 552} {"train_loss": -27.733936309814453, "global_step": 66846, "epoch": 552} {"train_loss": -24.28997802734375, "global_step": 66847, "epoch": 552} {"train_loss": -31.519287109375, "global_step": 66848, "epoch": 552} {"train_loss": -35.4506950378418, "global_step": 66849, "epoch": 552} {"train_loss": -30.708478927612305, "global_step": 66850, "epoch": 552} {"train_loss": -35.47620391845703, "global_step": 66851, "epoch": 552} {"train_loss": -34.21444320678711, "global_step": 66852, "epoch": 552} {"train_loss": -33.619136810302734, "global_step": 66853, "epoch": 552} {"train_loss": -35.62158966064453, "global_step": 66854, "epoch": 552} {"train_loss": -33.63630294799805, "global_step": 66855, "epoch": 552} {"train_loss": -34.976654052734375, "global_step": 66856, "epoch": 552} {"train_loss": -34.754512786865234, "global_step": 66857, "epoch": 552} {"train_loss": -35.798858642578125, "global_step": 66858, "epoch": 552} {"train_loss": -34.52821731567383, "global_step": 66859, "epoch": 552} {"train_loss": -35.74257278442383, "global_step": 66860, "epoch": 552} {"train_loss": -34.7813835144043, "global_step": 66861, "epoch": 552} {"train_loss": -35.978153228759766, "global_step": 66862, "epoch": 552} {"train_loss": -35.264930725097656, "global_step": 66863, "epoch": 552} {"train_loss": -35.08805465698242, "global_step": 66864, "epoch": 552} {"train_loss": -35.38739776611328, "global_step": 66865, "epoch": 552} {"train_loss": -36.0776252746582, "global_step": 66866, "epoch": 552} {"train_loss": -35.31886672973633, "global_step": 66867, "epoch": 552} {"train_loss": -36.17936325073242, "global_step": 66868, "epoch": 552} {"train_loss": -35.494354248046875, "global_step": 66869, "epoch": 552} {"train_loss": -36.33266067504883, "global_step": 66870, "epoch": 552} {"train_loss": -35.68081283569336, "global_step": 66871, "epoch": 552} {"train_loss": -36.899757385253906, "global_step": 66872, "epoch": 552} {"train_loss": -35.60947799682617, "global_step": 66873, "epoch": 552} {"train_loss": -33.6058464050293, "global_step": 66874, "epoch": 552} {"train_loss": -35.90687942504883, "global_step": 66875, "epoch": 552} {"train_loss": -36.3693962097168, "global_step": 66876, "epoch": 552} {"train_loss": -35.60400390625, "global_step": 66877, "epoch": 552} {"train_loss": -36.308223724365234, "global_step": 66878, "epoch": 552} {"train_loss": -34.25872802734375, "global_step": 66879, "epoch": 552} {"train_loss": -34.3777961730957, "global_step": 66880, "epoch": 552} {"train_loss": -34.721004486083984, "global_step": 66881, "epoch": 552} {"train_loss": -35.50967025756836, "global_step": 66882, "epoch": 552} {"train_loss": -35.43877029418945, "global_step": 66883, "epoch": 552} {"train_loss": -35.31901931762695, "global_step": 66884, "epoch": 552} {"train_loss": -35.629608154296875, "global_step": 66885, "epoch": 552} {"train_loss": -35.29426956176758, "global_step": 66886, "epoch": 552} {"train_loss": -35.7592887878418, "global_step": 66887, "epoch": 552} {"train_loss": -34.97255325317383, "global_step": 66888, "epoch": 552} {"train_loss": -35.71891403198242, "global_step": 66889, "epoch": 552} {"train_loss": -35.6187629699707, "global_step": 66890, "epoch": 552} {"train_loss": -35.984371185302734, "global_step": 66891, "epoch": 552} {"train_loss": -35.39475631713867, "global_step": 66892, "epoch": 552} {"train_loss": -35.73332214355469, "global_step": 66893, "epoch": 552} {"train_loss": -33.918025970458984, "global_step": 66894, "epoch": 552} {"train_loss": -35.477134704589844, "global_step": 66895, "epoch": 552} {"train_loss": -35.5212516784668, "global_step": 66896, "epoch": 552} {"train_loss": -36.2424430847168, "global_step": 66897, "epoch": 552} {"train_loss": -35.306697845458984, "global_step": 66898, "epoch": 552} {"train_loss": -36.23341751098633, "global_step": 66899, "epoch": 552} {"train_loss": -35.50165557861328, "global_step": 66900, "epoch": 552} {"train_loss": -36.28428268432617, "global_step": 66901, "epoch": 552} {"train_loss": -35.83539962768555, "global_step": 66902, "epoch": 552} {"train_loss": -35.52602767944336, "global_step": 66903, "epoch": 552} {"train_loss": -36.38129425048828, "global_step": 66904, "epoch": 552} {"train_loss": -36.21039962768555, "global_step": 66905, "epoch": 552} {"train_loss": -36.574615478515625, "global_step": 66906, "epoch": 552} {"train_loss": -36.2494010925293, "global_step": 66907, "epoch": 552} {"train_loss": -36.24287033081055, "global_step": 66908, "epoch": 552} {"train_loss": -34.2697868347168, "global_step": 66909, "epoch": 552} {"train_loss": -36.43754959106445, "global_step": 66910, "epoch": 552} {"train_loss": -36.120609283447266, "global_step": 66911, "epoch": 552} {"train_loss": -35.42361212170814, "global_step": 66912, "epoch": 552, "val_loss": 2524047.25} {"train_loss": -35.677066802978516, "global_step": 66913, "epoch": 553} {"train_loss": -35.60799026489258, "global_step": 66914, "epoch": 553} {"train_loss": -35.61058807373047, "global_step": 66915, "epoch": 553} {"train_loss": -35.47446823120117, "global_step": 66916, "epoch": 553} {"train_loss": -36.52619934082031, "global_step": 66917, "epoch": 553} {"train_loss": -36.460693359375, "global_step": 66918, "epoch": 553} {"train_loss": -34.61785888671875, "global_step": 66919, "epoch": 553} {"train_loss": -35.54753494262695, "global_step": 66920, "epoch": 553} {"train_loss": -35.9186897277832, "global_step": 66921, "epoch": 553} {"train_loss": -36.17958450317383, "global_step": 66922, "epoch": 553} {"train_loss": -34.34870910644531, "global_step": 66923, "epoch": 553} {"train_loss": -36.50800704956055, "global_step": 66924, "epoch": 553} {"train_loss": -36.67024612426758, "global_step": 66925, "epoch": 553} {"train_loss": -36.879093170166016, "global_step": 66926, "epoch": 553} {"train_loss": -36.74115753173828, "global_step": 66927, "epoch": 553} {"train_loss": -36.3416748046875, "global_step": 66928, "epoch": 553} {"train_loss": -36.031532287597656, "global_step": 66929, "epoch": 553} {"train_loss": -36.13943099975586, "global_step": 66930, "epoch": 553} {"train_loss": -35.85634231567383, "global_step": 66931, "epoch": 553} {"train_loss": -36.14717483520508, "global_step": 66932, "epoch": 553} {"train_loss": -36.576778411865234, "global_step": 66933, "epoch": 553} {"train_loss": -36.30695343017578, "global_step": 66934, "epoch": 553} {"train_loss": -36.628536224365234, "global_step": 66935, "epoch": 553} {"train_loss": -36.26375961303711, "global_step": 66936, "epoch": 553} {"train_loss": -36.27749252319336, "global_step": 66937, "epoch": 553} {"train_loss": -35.96550369262695, "global_step": 66938, "epoch": 553} {"train_loss": -36.471893310546875, "global_step": 66939, "epoch": 553} {"train_loss": -36.90412139892578, "global_step": 66940, "epoch": 553} {"train_loss": -35.71208953857422, "global_step": 66941, "epoch": 553} {"train_loss": -36.055763244628906, "global_step": 66942, "epoch": 553} {"train_loss": -36.47319793701172, "global_step": 66943, "epoch": 553} {"train_loss": -35.80660629272461, "global_step": 66944, "epoch": 553} {"train_loss": -35.758419036865234, "global_step": 66945, "epoch": 553} {"train_loss": -35.708805084228516, "global_step": 66946, "epoch": 553} {"train_loss": -36.9012451171875, "global_step": 66947, "epoch": 553} {"train_loss": -35.16794967651367, "global_step": 66948, "epoch": 553} {"train_loss": -34.53034210205078, "global_step": 66949, "epoch": 553} {"train_loss": -36.09618377685547, "global_step": 66950, "epoch": 553} {"train_loss": -35.33064270019531, "global_step": 66951, "epoch": 553} {"train_loss": -35.9139518737793, "global_step": 66952, "epoch": 553} {"train_loss": -35.46616744995117, "global_step": 66953, "epoch": 553} {"train_loss": -36.72789764404297, "global_step": 66954, "epoch": 553} {"train_loss": -36.117130279541016, "global_step": 66955, "epoch": 553} {"train_loss": -35.87931442260742, "global_step": 66956, "epoch": 553} {"train_loss": -36.753047943115234, "global_step": 66957, "epoch": 553} {"train_loss": -36.541988372802734, "global_step": 66958, "epoch": 553} {"train_loss": -36.290225982666016, "global_step": 66959, "epoch": 553} {"train_loss": -36.47787094116211, "global_step": 66960, "epoch": 553} {"train_loss": -36.78557205200195, "global_step": 66961, "epoch": 553} {"train_loss": -36.94879913330078, "global_step": 66962, "epoch": 553} {"train_loss": -36.31730270385742, "global_step": 66963, "epoch": 553} {"train_loss": -36.8558349609375, "global_step": 66964, "epoch": 553} {"train_loss": -36.77806854248047, "global_step": 66965, "epoch": 553} {"train_loss": -35.83903121948242, "global_step": 66966, "epoch": 553} {"train_loss": -36.13405227661133, "global_step": 66967, "epoch": 553} {"train_loss": -36.56627655029297, "global_step": 66968, "epoch": 553} {"train_loss": -36.77729415893555, "global_step": 66969, "epoch": 553} {"train_loss": -36.2662353515625, "global_step": 66970, "epoch": 553} {"train_loss": -36.01918411254883, "global_step": 66971, "epoch": 553} {"train_loss": -33.80437088012695, "global_step": 66972, "epoch": 553} {"train_loss": -27.901111602783203, "global_step": 66973, "epoch": 553} {"train_loss": -33.40508270263672, "global_step": 66974, "epoch": 553} {"train_loss": -36.45219421386719, "global_step": 66975, "epoch": 553} {"train_loss": -35.348419189453125, "global_step": 66976, "epoch": 553} {"train_loss": -35.82600784301758, "global_step": 66977, "epoch": 553} {"train_loss": -34.26722717285156, "global_step": 66978, "epoch": 553} {"train_loss": -36.37954330444336, "global_step": 66979, "epoch": 553} {"train_loss": -35.861122131347656, "global_step": 66980, "epoch": 553} {"train_loss": -36.6954345703125, "global_step": 66981, "epoch": 553} {"train_loss": -36.6838264465332, "global_step": 66982, "epoch": 553} {"train_loss": -33.9558219909668, "global_step": 66983, "epoch": 553} {"train_loss": -36.46246337890625, "global_step": 66984, "epoch": 553} {"train_loss": -36.08192825317383, "global_step": 66985, "epoch": 553} {"train_loss": -35.22343063354492, "global_step": 66986, "epoch": 553} {"train_loss": -36.783973693847656, "global_step": 66987, "epoch": 553} {"train_loss": -36.32838821411133, "global_step": 66988, "epoch": 553} {"train_loss": -36.13190841674805, "global_step": 66989, "epoch": 553} {"train_loss": -35.40918731689453, "global_step": 66990, "epoch": 553} {"train_loss": -35.79951858520508, "global_step": 66991, "epoch": 553} {"train_loss": -35.70193099975586, "global_step": 66992, "epoch": 553} {"train_loss": -36.32234573364258, "global_step": 66993, "epoch": 553} {"train_loss": -35.215667724609375, "global_step": 66994, "epoch": 553} {"train_loss": -37.00176239013672, "global_step": 66995, "epoch": 553} {"train_loss": -36.743919372558594, "global_step": 66996, "epoch": 553} {"train_loss": -35.185340881347656, "global_step": 66997, "epoch": 553} {"train_loss": -36.52412796020508, "global_step": 66998, "epoch": 553} {"train_loss": -36.460853576660156, "global_step": 66999, "epoch": 553} {"train_loss": -35.24236297607422, "global_step": 67000, "epoch": 553} {"train_loss": -36.6973762512207, "global_step": 67001, "epoch": 553} {"train_loss": -36.7355842590332, "global_step": 67002, "epoch": 553} {"train_loss": -36.115386962890625, "global_step": 67003, "epoch": 553} {"train_loss": -36.89448165893555, "global_step": 67004, "epoch": 553} {"train_loss": -35.56704330444336, "global_step": 67005, "epoch": 553} {"train_loss": -36.32255172729492, "global_step": 67006, "epoch": 553} {"train_loss": -36.39083480834961, "global_step": 67007, "epoch": 553} {"train_loss": -36.78727340698242, "global_step": 67008, "epoch": 553} {"train_loss": -36.50600814819336, "global_step": 67009, "epoch": 553} {"train_loss": -34.7994384765625, "global_step": 67010, "epoch": 553} {"train_loss": -36.65877914428711, "global_step": 67011, "epoch": 553} {"train_loss": -36.79283142089844, "global_step": 67012, "epoch": 553} {"train_loss": -36.77987289428711, "global_step": 67013, "epoch": 553} {"train_loss": -36.1151237487793, "global_step": 67014, "epoch": 553} {"train_loss": -36.741004943847656, "global_step": 67015, "epoch": 553} {"train_loss": -36.65712356567383, "global_step": 67016, "epoch": 553} {"train_loss": -36.68001174926758, "global_step": 67017, "epoch": 553} {"train_loss": -36.38276290893555, "global_step": 67018, "epoch": 553} {"train_loss": -36.49617385864258, "global_step": 67019, "epoch": 553} {"train_loss": -36.33303451538086, "global_step": 67020, "epoch": 553} {"train_loss": -36.394798278808594, "global_step": 67021, "epoch": 553} {"train_loss": -35.40482711791992, "global_step": 67022, "epoch": 553} {"train_loss": -35.893131256103516, "global_step": 67023, "epoch": 553} {"train_loss": -36.19388961791992, "global_step": 67024, "epoch": 553} {"train_loss": -34.99686813354492, "global_step": 67025, "epoch": 553} {"train_loss": -36.377845764160156, "global_step": 67026, "epoch": 553} {"train_loss": -35.3488883972168, "global_step": 67027, "epoch": 553} {"train_loss": -35.39114761352539, "global_step": 67028, "epoch": 553} {"train_loss": -35.45794677734375, "global_step": 67029, "epoch": 553} {"train_loss": -35.75398635864258, "global_step": 67030, "epoch": 553} {"train_loss": -36.43278121948242, "global_step": 67031, "epoch": 553} {"train_loss": -35.1207275390625, "global_step": 67032, "epoch": 553} {"train_loss": -35.99007340108068, "global_step": 67033, "epoch": 553, "val_loss": 2725066.25} {"train_loss": -36.25977325439453, "global_step": 67034, "epoch": 554} {"train_loss": -36.9622917175293, "global_step": 67035, "epoch": 554} {"train_loss": -36.67700958251953, "global_step": 67036, "epoch": 554} {"train_loss": -35.25442123413086, "global_step": 67037, "epoch": 554} {"train_loss": -36.99586486816406, "global_step": 67038, "epoch": 554} {"train_loss": -36.64776611328125, "global_step": 67039, "epoch": 554} {"train_loss": -36.281341552734375, "global_step": 67040, "epoch": 554} {"train_loss": -36.030582427978516, "global_step": 67041, "epoch": 554} {"train_loss": -35.49551010131836, "global_step": 67042, "epoch": 554} {"train_loss": -35.79109573364258, "global_step": 67043, "epoch": 554} {"train_loss": -36.281593322753906, "global_step": 67044, "epoch": 554} {"train_loss": -36.42518997192383, "global_step": 67045, "epoch": 554} {"train_loss": -36.464515686035156, "global_step": 67046, "epoch": 554} {"train_loss": -35.940826416015625, "global_step": 67047, "epoch": 554} {"train_loss": -37.210636138916016, "global_step": 67048, "epoch": 554} {"train_loss": -35.25075912475586, "global_step": 67049, "epoch": 554} {"train_loss": -35.697357177734375, "global_step": 67050, "epoch": 554} {"train_loss": -36.4075813293457, "global_step": 67051, "epoch": 554} {"train_loss": -36.725582122802734, "global_step": 67052, "epoch": 554} {"train_loss": -36.6881103515625, "global_step": 67053, "epoch": 554} {"train_loss": -37.04657745361328, "global_step": 67054, "epoch": 554} {"train_loss": -36.03105926513672, "global_step": 67055, "epoch": 554} {"train_loss": -36.985015869140625, "global_step": 67056, "epoch": 554} {"train_loss": -37.62017822265625, "global_step": 67057, "epoch": 554} {"train_loss": -36.892364501953125, "global_step": 67058, "epoch": 554} {"train_loss": -36.36103057861328, "global_step": 67059, "epoch": 554} {"train_loss": -35.51312255859375, "global_step": 67060, "epoch": 554} {"train_loss": -36.09663009643555, "global_step": 67061, "epoch": 554} {"train_loss": -36.879634857177734, "global_step": 67062, "epoch": 554} {"train_loss": -37.32969284057617, "global_step": 67063, "epoch": 554} {"train_loss": -36.967525482177734, "global_step": 67064, "epoch": 554} {"train_loss": -37.08635330200195, "global_step": 67065, "epoch": 554} {"train_loss": -36.16437911987305, "global_step": 67066, "epoch": 554} {"train_loss": -36.213600158691406, "global_step": 67067, "epoch": 554} {"train_loss": -36.7353401184082, "global_step": 67068, "epoch": 554} {"train_loss": -35.9309196472168, "global_step": 67069, "epoch": 554} {"train_loss": -35.9090690612793, "global_step": 67070, "epoch": 554} {"train_loss": -36.413753509521484, "global_step": 67071, "epoch": 554} {"train_loss": -36.96602249145508, "global_step": 67072, "epoch": 554} {"train_loss": -34.95498275756836, "global_step": 67073, "epoch": 554} {"train_loss": -35.8919677734375, "global_step": 67074, "epoch": 554} {"train_loss": -34.888484954833984, "global_step": 67075, "epoch": 554} {"train_loss": -31.779539108276367, "global_step": 67076, "epoch": 554} {"train_loss": -23.5040283203125, "global_step": 67077, "epoch": 554} {"train_loss": -7.598281383514404, "global_step": 67078, "epoch": 554} {"train_loss": -19.446319580078125, "global_step": 67079, "epoch": 554} {"train_loss": -33.10844802856445, "global_step": 67080, "epoch": 554} {"train_loss": -24.364032745361328, "global_step": 67081, "epoch": 554} {"train_loss": -32.20056915283203, "global_step": 67082, "epoch": 554} {"train_loss": -29.258625030517578, "global_step": 67083, "epoch": 554} {"train_loss": -32.35261154174805, "global_step": 67084, "epoch": 554} {"train_loss": -30.380020141601562, "global_step": 67085, "epoch": 554} {"train_loss": -32.21799087524414, "global_step": 67086, "epoch": 554} {"train_loss": -31.98247718811035, "global_step": 67087, "epoch": 554} {"train_loss": -32.857521057128906, "global_step": 67088, "epoch": 554} {"train_loss": -32.22588348388672, "global_step": 67089, "epoch": 554} {"train_loss": -32.013580322265625, "global_step": 67090, "epoch": 554} {"train_loss": -33.01411437988281, "global_step": 67091, "epoch": 554} {"train_loss": -33.57672119140625, "global_step": 67092, "epoch": 554} {"train_loss": -34.502323150634766, "global_step": 67093, "epoch": 554} {"train_loss": -34.02513122558594, "global_step": 67094, "epoch": 554} {"train_loss": -34.62997055053711, "global_step": 67095, "epoch": 554} {"train_loss": -35.31096267700195, "global_step": 67096, "epoch": 554} {"train_loss": -34.90060043334961, "global_step": 67097, "epoch": 554} {"train_loss": -34.98686981201172, "global_step": 67098, "epoch": 554} {"train_loss": -35.93028259277344, "global_step": 67099, "epoch": 554} {"train_loss": -35.63437271118164, "global_step": 67100, "epoch": 554} {"train_loss": -35.87565994262695, "global_step": 67101, "epoch": 554} {"train_loss": -35.0009880065918, "global_step": 67102, "epoch": 554} {"train_loss": -35.48896026611328, "global_step": 67103, "epoch": 554} {"train_loss": -35.629058837890625, "global_step": 67104, "epoch": 554} {"train_loss": -35.99686813354492, "global_step": 67105, "epoch": 554} {"train_loss": -35.94729232788086, "global_step": 67106, "epoch": 554} {"train_loss": -35.64618682861328, "global_step": 67107, "epoch": 554} {"train_loss": -35.8907585144043, "global_step": 67108, "epoch": 554} {"train_loss": -36.384803771972656, "global_step": 67109, "epoch": 554} {"train_loss": -36.13619613647461, "global_step": 67110, "epoch": 554} {"train_loss": -36.08340072631836, "global_step": 67111, "epoch": 554} {"train_loss": -35.87332534790039, "global_step": 67112, "epoch": 554} {"train_loss": -35.82383346557617, "global_step": 67113, "epoch": 554} {"train_loss": -35.89027786254883, "global_step": 67114, "epoch": 554} {"train_loss": -36.52253341674805, "global_step": 67115, "epoch": 554} {"train_loss": -36.7413444519043, "global_step": 67116, "epoch": 554} {"train_loss": -36.71767807006836, "global_step": 67117, "epoch": 554} {"train_loss": -36.34299850463867, "global_step": 67118, "epoch": 554} {"train_loss": -36.73186111450195, "global_step": 67119, "epoch": 554} {"train_loss": -36.69610595703125, "global_step": 67120, "epoch": 554} {"train_loss": -36.33414077758789, "global_step": 67121, "epoch": 554} {"train_loss": -36.527191162109375, "global_step": 67122, "epoch": 554} {"train_loss": -36.27960205078125, "global_step": 67123, "epoch": 554} {"train_loss": -36.75544357299805, "global_step": 67124, "epoch": 554} {"train_loss": -36.640716552734375, "global_step": 67125, "epoch": 554} {"train_loss": -36.6999626159668, "global_step": 67126, "epoch": 554} {"train_loss": -36.76451110839844, "global_step": 67127, "epoch": 554} {"train_loss": -36.85805892944336, "global_step": 67128, "epoch": 554} {"train_loss": -36.86322021484375, "global_step": 67129, "epoch": 554} {"train_loss": -36.347164154052734, "global_step": 67130, "epoch": 554} {"train_loss": -36.42376708984375, "global_step": 67131, "epoch": 554} {"train_loss": -36.96770477294922, "global_step": 67132, "epoch": 554} {"train_loss": -36.01708221435547, "global_step": 67133, "epoch": 554} {"train_loss": -36.467185974121094, "global_step": 67134, "epoch": 554} {"train_loss": -36.91897201538086, "global_step": 67135, "epoch": 554} {"train_loss": -36.1602783203125, "global_step": 67136, "epoch": 554} {"train_loss": -36.14015579223633, "global_step": 67137, "epoch": 554} {"train_loss": -36.5706787109375, "global_step": 67138, "epoch": 554} {"train_loss": -36.628658294677734, "global_step": 67139, "epoch": 554} {"train_loss": -36.86332321166992, "global_step": 67140, "epoch": 554} {"train_loss": -36.714866638183594, "global_step": 67141, "epoch": 554} {"train_loss": -37.130287170410156, "global_step": 67142, "epoch": 554} {"train_loss": -36.834590911865234, "global_step": 67143, "epoch": 554} {"train_loss": -36.75084686279297, "global_step": 67144, "epoch": 554} {"train_loss": -37.24947738647461, "global_step": 67145, "epoch": 554} {"train_loss": -37.02242660522461, "global_step": 67146, "epoch": 554} {"train_loss": -37.08209228515625, "global_step": 67147, "epoch": 554} {"train_loss": -37.361297607421875, "global_step": 67148, "epoch": 554} {"train_loss": -37.01955795288086, "global_step": 67149, "epoch": 554} {"train_loss": -37.224178314208984, "global_step": 67150, "epoch": 554} {"train_loss": -36.960933685302734, "global_step": 67151, "epoch": 554} {"train_loss": -35.75214385986328, "global_step": 67152, "epoch": 554} {"train_loss": -34.03186798095703, "global_step": 67153, "epoch": 554} {"train_loss": -35.20633460667508, "global_step": 67154, "epoch": 554, "val_loss": 2531559.0} {"train_loss": -35.306800842285156, "global_step": 67155, "epoch": 555} {"train_loss": -36.733890533447266, "global_step": 67156, "epoch": 555} {"train_loss": -33.20896530151367, "global_step": 67157, "epoch": 555} {"train_loss": -28.20967674255371, "global_step": 67158, "epoch": 555} {"train_loss": -21.558534622192383, "global_step": 67159, "epoch": 555} {"train_loss": -31.150390625, "global_step": 67160, "epoch": 555} {"train_loss": -34.93610763549805, "global_step": 67161, "epoch": 555} {"train_loss": -27.484130859375, "global_step": 67162, "epoch": 555} {"train_loss": -33.628265380859375, "global_step": 67163, "epoch": 555} {"train_loss": -29.315814971923828, "global_step": 67164, "epoch": 555} {"train_loss": -33.3421516418457, "global_step": 67165, "epoch": 555} {"train_loss": -32.590877532958984, "global_step": 67166, "epoch": 555} {"train_loss": -35.47152328491211, "global_step": 67167, "epoch": 555} {"train_loss": -33.74842071533203, "global_step": 67168, "epoch": 555} {"train_loss": -33.64181137084961, "global_step": 67169, "epoch": 555} {"train_loss": -35.49897384643555, "global_step": 67170, "epoch": 555} {"train_loss": -34.00754928588867, "global_step": 67171, "epoch": 555} {"train_loss": -34.876380920410156, "global_step": 67172, "epoch": 555} {"train_loss": -34.70777130126953, "global_step": 67173, "epoch": 555} {"train_loss": -34.022865295410156, "global_step": 67174, "epoch": 555} {"train_loss": -34.784236907958984, "global_step": 67175, "epoch": 555} {"train_loss": -35.632328033447266, "global_step": 67176, "epoch": 555} {"train_loss": -33.81288528442383, "global_step": 67177, "epoch": 555} {"train_loss": -35.023311614990234, "global_step": 67178, "epoch": 555} {"train_loss": -35.328102111816406, "global_step": 67179, "epoch": 555} {"train_loss": -33.784149169921875, "global_step": 67180, "epoch": 555} {"train_loss": -34.992977142333984, "global_step": 67181, "epoch": 555} {"train_loss": -35.494380950927734, "global_step": 67182, "epoch": 555} {"train_loss": -35.56767272949219, "global_step": 67183, "epoch": 555} {"train_loss": -35.21449661254883, "global_step": 67184, "epoch": 555} {"train_loss": -35.66506576538086, "global_step": 67185, "epoch": 555} {"train_loss": -35.88495635986328, "global_step": 67186, "epoch": 555} {"train_loss": -35.509639739990234, "global_step": 67187, "epoch": 555} {"train_loss": -35.17873001098633, "global_step": 67188, "epoch": 555} {"train_loss": -36.059120178222656, "global_step": 67189, "epoch": 555} {"train_loss": -35.743507385253906, "global_step": 67190, "epoch": 555} {"train_loss": -35.44734573364258, "global_step": 67191, "epoch": 555} {"train_loss": -35.92847442626953, "global_step": 67192, "epoch": 555} {"train_loss": -36.074951171875, "global_step": 67193, "epoch": 555} {"train_loss": -36.4099006652832, "global_step": 67194, "epoch": 555} {"train_loss": -35.99042892456055, "global_step": 67195, "epoch": 555} {"train_loss": -36.483455657958984, "global_step": 67196, "epoch": 555} {"train_loss": -36.10042953491211, "global_step": 67197, "epoch": 555} {"train_loss": -36.59703826904297, "global_step": 67198, "epoch": 555} {"train_loss": -36.13507843017578, "global_step": 67199, "epoch": 555} {"train_loss": -36.1182975769043, "global_step": 67200, "epoch": 555} {"train_loss": -36.287933349609375, "global_step": 67201, "epoch": 555} {"train_loss": -36.19257736206055, "global_step": 67202, "epoch": 555} {"train_loss": -36.57527160644531, "global_step": 67203, "epoch": 555} {"train_loss": -36.47621154785156, "global_step": 67204, "epoch": 555} {"train_loss": -36.29561233520508, "global_step": 67205, "epoch": 555} {"train_loss": -36.00654220581055, "global_step": 67206, "epoch": 555} {"train_loss": -36.718379974365234, "global_step": 67207, "epoch": 555} {"train_loss": -36.612545013427734, "global_step": 67208, "epoch": 555} {"train_loss": -36.416748046875, "global_step": 67209, "epoch": 555} {"train_loss": -35.75173568725586, "global_step": 67210, "epoch": 555} {"train_loss": -36.625518798828125, "global_step": 67211, "epoch": 555} {"train_loss": -36.53390121459961, "global_step": 67212, "epoch": 555} {"train_loss": -36.090576171875, "global_step": 67213, "epoch": 555} {"train_loss": -36.54281234741211, "global_step": 67214, "epoch": 555} {"train_loss": -36.69327163696289, "global_step": 67215, "epoch": 555} {"train_loss": -37.014461517333984, "global_step": 67216, "epoch": 555} {"train_loss": -36.99020004272461, "global_step": 67217, "epoch": 555} {"train_loss": -37.30816650390625, "global_step": 67218, "epoch": 555} {"train_loss": -37.028472900390625, "global_step": 67219, "epoch": 555} {"train_loss": -36.776729583740234, "global_step": 67220, "epoch": 555} {"train_loss": -37.27206039428711, "global_step": 67221, "epoch": 555} {"train_loss": -37.04755783081055, "global_step": 67222, "epoch": 555} {"train_loss": -36.782264709472656, "global_step": 67223, "epoch": 555} {"train_loss": -37.05796432495117, "global_step": 67224, "epoch": 555} {"train_loss": -37.14208221435547, "global_step": 67225, "epoch": 555} {"train_loss": -36.889183044433594, "global_step": 67226, "epoch": 555} {"train_loss": -37.18675994873047, "global_step": 67227, "epoch": 555} {"train_loss": -37.40523147583008, "global_step": 67228, "epoch": 555} {"train_loss": -36.97518539428711, "global_step": 67229, "epoch": 555} {"train_loss": -36.894020080566406, "global_step": 67230, "epoch": 555} {"train_loss": -37.1462287902832, "global_step": 67231, "epoch": 555} {"train_loss": -37.489559173583984, "global_step": 67232, "epoch": 555} {"train_loss": -35.31975173950195, "global_step": 67233, "epoch": 555} {"train_loss": -36.37234115600586, "global_step": 67234, "epoch": 555} {"train_loss": -35.55012893676758, "global_step": 67235, "epoch": 555} {"train_loss": -33.38721466064453, "global_step": 67236, "epoch": 555} {"train_loss": -33.10694122314453, "global_step": 67237, "epoch": 555} {"train_loss": -34.059261322021484, "global_step": 67238, "epoch": 555} {"train_loss": -35.20209503173828, "global_step": 67239, "epoch": 555} {"train_loss": -34.3534049987793, "global_step": 67240, "epoch": 555} {"train_loss": -36.99916076660156, "global_step": 67241, "epoch": 555} {"train_loss": -34.4804573059082, "global_step": 67242, "epoch": 555} {"train_loss": -36.36774444580078, "global_step": 67243, "epoch": 555} {"train_loss": -35.57994079589844, "global_step": 67244, "epoch": 555} {"train_loss": -35.922569274902344, "global_step": 67245, "epoch": 555} {"train_loss": -36.90869140625, "global_step": 67246, "epoch": 555} {"train_loss": -35.308712005615234, "global_step": 67247, "epoch": 555} {"train_loss": -36.60587692260742, "global_step": 67248, "epoch": 555} {"train_loss": -36.15793991088867, "global_step": 67249, "epoch": 555} {"train_loss": -35.589149475097656, "global_step": 67250, "epoch": 555} {"train_loss": -36.32181930541992, "global_step": 67251, "epoch": 555} {"train_loss": -36.173301696777344, "global_step": 67252, "epoch": 555} {"train_loss": -35.92613983154297, "global_step": 67253, "epoch": 555} {"train_loss": -36.2973747253418, "global_step": 67254, "epoch": 555} {"train_loss": -35.964508056640625, "global_step": 67255, "epoch": 555} {"train_loss": -36.165889739990234, "global_step": 67256, "epoch": 555} {"train_loss": -36.341121673583984, "global_step": 67257, "epoch": 555} {"train_loss": -34.5272216796875, "global_step": 67258, "epoch": 555} {"train_loss": -36.24585723876953, "global_step": 67259, "epoch": 555} {"train_loss": -34.95720291137695, "global_step": 67260, "epoch": 555} {"train_loss": -35.0441780090332, "global_step": 67261, "epoch": 555} {"train_loss": -34.75260925292969, "global_step": 67262, "epoch": 555} {"train_loss": -35.59849166870117, "global_step": 67263, "epoch": 555} {"train_loss": -35.13520431518555, "global_step": 67264, "epoch": 555} {"train_loss": -32.94544219970703, "global_step": 67265, "epoch": 555} {"train_loss": -36.57080841064453, "global_step": 67266, "epoch": 555} {"train_loss": -35.609737396240234, "global_step": 67267, "epoch": 555} {"train_loss": -33.904964447021484, "global_step": 67268, "epoch": 555} {"train_loss": -31.727096557617188, "global_step": 67269, "epoch": 555} {"train_loss": -23.44656753540039, "global_step": 67270, "epoch": 555} {"train_loss": -20.406282424926758, "global_step": 67271, "epoch": 555} {"train_loss": -29.286962509155273, "global_step": 67272, "epoch": 555} {"train_loss": -35.41610336303711, "global_step": 67273, "epoch": 555} {"train_loss": -28.893848419189453, "global_step": 67274, "epoch": 555} {"train_loss": -35.004271325986245, "global_step": 67275, "epoch": 555, "val_loss": 2618601.0} {"train_loss": -33.13088607788086, "global_step": 67276, "epoch": 556} {"train_loss": -35.13112258911133, "global_step": 67277, "epoch": 556} {"train_loss": -33.37844467163086, "global_step": 67278, "epoch": 556} {"train_loss": -33.616615295410156, "global_step": 67279, "epoch": 556} {"train_loss": -33.7987174987793, "global_step": 67280, "epoch": 556} {"train_loss": -33.19452667236328, "global_step": 67281, "epoch": 556} {"train_loss": -35.073822021484375, "global_step": 67282, "epoch": 556} {"train_loss": -34.596290588378906, "global_step": 67283, "epoch": 556} {"train_loss": -33.9542236328125, "global_step": 67284, "epoch": 556} {"train_loss": -33.730648040771484, "global_step": 67285, "epoch": 556} {"train_loss": -34.24336242675781, "global_step": 67286, "epoch": 556} {"train_loss": -35.40263748168945, "global_step": 67287, "epoch": 556} {"train_loss": -34.99222183227539, "global_step": 67288, "epoch": 556} {"train_loss": -34.93246078491211, "global_step": 67289, "epoch": 556} {"train_loss": -35.21405792236328, "global_step": 67290, "epoch": 556} {"train_loss": -34.8192253112793, "global_step": 67291, "epoch": 556} {"train_loss": -34.557228088378906, "global_step": 67292, "epoch": 556} {"train_loss": -35.63515090942383, "global_step": 67293, "epoch": 556} {"train_loss": -35.89599609375, "global_step": 67294, "epoch": 556} {"train_loss": -35.8055305480957, "global_step": 67295, "epoch": 556} {"train_loss": -35.539573669433594, "global_step": 67296, "epoch": 556} {"train_loss": -34.4631462097168, "global_step": 67297, "epoch": 556} {"train_loss": -35.39839172363281, "global_step": 67298, "epoch": 556} {"train_loss": -36.287601470947266, "global_step": 67299, "epoch": 556} {"train_loss": -35.46821975708008, "global_step": 67300, "epoch": 556} {"train_loss": -35.3255729675293, "global_step": 67301, "epoch": 556} {"train_loss": -36.176536560058594, "global_step": 67302, "epoch": 556} {"train_loss": -36.201351165771484, "global_step": 67303, "epoch": 556} {"train_loss": -36.118743896484375, "global_step": 67304, "epoch": 556} {"train_loss": -36.213172912597656, "global_step": 67305, "epoch": 556} {"train_loss": -36.232810974121094, "global_step": 67306, "epoch": 556} {"train_loss": -35.850643157958984, "global_step": 67307, "epoch": 556} {"train_loss": -35.850975036621094, "global_step": 67308, "epoch": 556} {"train_loss": -36.07002258300781, "global_step": 67309, "epoch": 556} {"train_loss": -36.34416580200195, "global_step": 67310, "epoch": 556} {"train_loss": -36.24897766113281, "global_step": 67311, "epoch": 556} {"train_loss": -36.03340148925781, "global_step": 67312, "epoch": 556} {"train_loss": -36.48149490356445, "global_step": 67313, "epoch": 556} {"train_loss": -36.31474685668945, "global_step": 67314, "epoch": 556} {"train_loss": -36.512840270996094, "global_step": 67315, "epoch": 556} {"train_loss": -35.138465881347656, "global_step": 67316, "epoch": 556} {"train_loss": -36.06319808959961, "global_step": 67317, "epoch": 556} {"train_loss": -35.90743637084961, "global_step": 67318, "epoch": 556} {"train_loss": -36.09685134887695, "global_step": 67319, "epoch": 556} {"train_loss": -37.026737213134766, "global_step": 67320, "epoch": 556} {"train_loss": -36.45370101928711, "global_step": 67321, "epoch": 556} {"train_loss": -35.44743728637695, "global_step": 67322, "epoch": 556} {"train_loss": -36.22502136230469, "global_step": 67323, "epoch": 556} {"train_loss": -36.16107940673828, "global_step": 67324, "epoch": 556} {"train_loss": -36.600486755371094, "global_step": 67325, "epoch": 556} {"train_loss": -36.5554313659668, "global_step": 67326, "epoch": 556} {"train_loss": -36.82346725463867, "global_step": 67327, "epoch": 556} {"train_loss": -36.738990783691406, "global_step": 67328, "epoch": 556} {"train_loss": -36.79311752319336, "global_step": 67329, "epoch": 556} {"train_loss": -36.46809387207031, "global_step": 67330, "epoch": 556} {"train_loss": -37.2730598449707, "global_step": 67331, "epoch": 556} {"train_loss": -36.1876335144043, "global_step": 67332, "epoch": 556} {"train_loss": -36.20723342895508, "global_step": 67333, "epoch": 556} {"train_loss": -36.86894607543945, "global_step": 67334, "epoch": 556} {"train_loss": -37.24753952026367, "global_step": 67335, "epoch": 556} {"train_loss": -35.26443099975586, "global_step": 67336, "epoch": 556} {"train_loss": -35.745548248291016, "global_step": 67337, "epoch": 556} {"train_loss": -36.03762435913086, "global_step": 67338, "epoch": 556} {"train_loss": -37.13595199584961, "global_step": 67339, "epoch": 556} {"train_loss": -36.5213623046875, "global_step": 67340, "epoch": 556} {"train_loss": -33.8607292175293, "global_step": 67341, "epoch": 556} {"train_loss": -35.34331512451172, "global_step": 67342, "epoch": 556} {"train_loss": -36.7186279296875, "global_step": 67343, "epoch": 556} {"train_loss": -36.24477767944336, "global_step": 67344, "epoch": 556} {"train_loss": -34.35295486450195, "global_step": 67345, "epoch": 556} {"train_loss": -34.90657043457031, "global_step": 67346, "epoch": 556} {"train_loss": -35.6150016784668, "global_step": 67347, "epoch": 556} {"train_loss": -35.42460250854492, "global_step": 67348, "epoch": 556} {"train_loss": -35.20711135864258, "global_step": 67349, "epoch": 556} {"train_loss": -36.369075775146484, "global_step": 67350, "epoch": 556} {"train_loss": -36.94666290283203, "global_step": 67351, "epoch": 556} {"train_loss": -34.84900665283203, "global_step": 67352, "epoch": 556} {"train_loss": -35.85100173950195, "global_step": 67353, "epoch": 556} {"train_loss": -36.4819450378418, "global_step": 67354, "epoch": 556} {"train_loss": -36.5588493347168, "global_step": 67355, "epoch": 556} {"train_loss": -36.20090866088867, "global_step": 67356, "epoch": 556} {"train_loss": -34.641632080078125, "global_step": 67357, "epoch": 556} {"train_loss": -36.38978958129883, "global_step": 67358, "epoch": 556} {"train_loss": -36.51725387573242, "global_step": 67359, "epoch": 556} {"train_loss": -36.823570251464844, "global_step": 67360, "epoch": 556} {"train_loss": -36.78411865234375, "global_step": 67361, "epoch": 556} {"train_loss": -35.7507438659668, "global_step": 67362, "epoch": 556} {"train_loss": -36.353431701660156, "global_step": 67363, "epoch": 556} {"train_loss": -35.69378662109375, "global_step": 67364, "epoch": 556} {"train_loss": -36.31595993041992, "global_step": 67365, "epoch": 556} {"train_loss": -35.91425323486328, "global_step": 67366, "epoch": 556} {"train_loss": -36.26847457885742, "global_step": 67367, "epoch": 556} {"train_loss": -35.69083023071289, "global_step": 67368, "epoch": 556} {"train_loss": -36.41542434692383, "global_step": 67369, "epoch": 556} {"train_loss": -36.7051887512207, "global_step": 67370, "epoch": 556} {"train_loss": -36.242454528808594, "global_step": 67371, "epoch": 556} {"train_loss": -36.79295349121094, "global_step": 67372, "epoch": 556} {"train_loss": -36.9238166809082, "global_step": 67373, "epoch": 556} {"train_loss": -36.322021484375, "global_step": 67374, "epoch": 556} {"train_loss": -36.28794479370117, "global_step": 67375, "epoch": 556} {"train_loss": -35.79720687866211, "global_step": 67376, "epoch": 556} {"train_loss": -36.42687225341797, "global_step": 67377, "epoch": 556} {"train_loss": -35.43359375, "global_step": 67378, "epoch": 556} {"train_loss": -37.028194427490234, "global_step": 67379, "epoch": 556} {"train_loss": -36.83797836303711, "global_step": 67380, "epoch": 556} {"train_loss": -36.792781829833984, "global_step": 67381, "epoch": 556} {"train_loss": -36.166114807128906, "global_step": 67382, "epoch": 556} {"train_loss": -36.73857498168945, "global_step": 67383, "epoch": 556} {"train_loss": -36.88099670410156, "global_step": 67384, "epoch": 556} {"train_loss": -35.913185119628906, "global_step": 67385, "epoch": 556} {"train_loss": -36.49488067626953, "global_step": 67386, "epoch": 556} {"train_loss": -36.35658645629883, "global_step": 67387, "epoch": 556} {"train_loss": -36.466529846191406, "global_step": 67388, "epoch": 556} {"train_loss": -36.16010665893555, "global_step": 67389, "epoch": 556} {"train_loss": -36.54937744140625, "global_step": 67390, "epoch": 556} {"train_loss": -35.91151809692383, "global_step": 67391, "epoch": 556} {"train_loss": -34.009891510009766, "global_step": 67392, "epoch": 556} {"train_loss": -35.968441009521484, "global_step": 67393, "epoch": 556} {"train_loss": -35.04412078857422, "global_step": 67394, "epoch": 556} {"train_loss": -36.581024169921875, "global_step": 67395, "epoch": 556} {"train_loss": -35.861354386510925, "global_step": 67396, "epoch": 556, "val_loss": 2658730.25} {"train_loss": -35.91735076904297, "global_step": 67397, "epoch": 557} {"train_loss": -35.760040283203125, "global_step": 67398, "epoch": 557} {"train_loss": -35.80379867553711, "global_step": 67399, "epoch": 557} {"train_loss": -36.7295036315918, "global_step": 67400, "epoch": 557} {"train_loss": -36.074947357177734, "global_step": 67401, "epoch": 557} {"train_loss": -35.77872085571289, "global_step": 67402, "epoch": 557} {"train_loss": -36.719635009765625, "global_step": 67403, "epoch": 557} {"train_loss": -29.667102813720703, "global_step": 67404, "epoch": 557} {"train_loss": -36.31602096557617, "global_step": 67405, "epoch": 557} {"train_loss": -34.72402572631836, "global_step": 67406, "epoch": 557} {"train_loss": -34.534637451171875, "global_step": 67407, "epoch": 557} {"train_loss": -34.42933654785156, "global_step": 67408, "epoch": 557} {"train_loss": -34.35151290893555, "global_step": 67409, "epoch": 557} {"train_loss": -34.3005485534668, "global_step": 67410, "epoch": 557} {"train_loss": -34.71990966796875, "global_step": 67411, "epoch": 557} {"train_loss": -34.71309280395508, "global_step": 67412, "epoch": 557} {"train_loss": -32.436676025390625, "global_step": 67413, "epoch": 557} {"train_loss": -33.66778564453125, "global_step": 67414, "epoch": 557} {"train_loss": -34.359771728515625, "global_step": 67415, "epoch": 557} {"train_loss": -34.225826263427734, "global_step": 67416, "epoch": 557} {"train_loss": -34.795650482177734, "global_step": 67417, "epoch": 557} {"train_loss": -35.6203727722168, "global_step": 67418, "epoch": 557} {"train_loss": -35.213279724121094, "global_step": 67419, "epoch": 557} {"train_loss": -35.637359619140625, "global_step": 67420, "epoch": 557} {"train_loss": -34.05794906616211, "global_step": 67421, "epoch": 557} {"train_loss": -33.66746139526367, "global_step": 67422, "epoch": 557} {"train_loss": -34.0608024597168, "global_step": 67423, "epoch": 557} {"train_loss": -33.51639938354492, "global_step": 67424, "epoch": 557} {"train_loss": -32.24509811401367, "global_step": 67425, "epoch": 557} {"train_loss": -33.588714599609375, "global_step": 67426, "epoch": 557} {"train_loss": -32.039031982421875, "global_step": 67427, "epoch": 557} {"train_loss": -34.98994064331055, "global_step": 67428, "epoch": 557} {"train_loss": -33.24138259887695, "global_step": 67429, "epoch": 557} {"train_loss": -35.128170013427734, "global_step": 67430, "epoch": 557} {"train_loss": -35.5669059753418, "global_step": 67431, "epoch": 557} {"train_loss": -33.94686508178711, "global_step": 67432, "epoch": 557} {"train_loss": -36.10707092285156, "global_step": 67433, "epoch": 557} {"train_loss": -35.76554489135742, "global_step": 67434, "epoch": 557} {"train_loss": -34.88573455810547, "global_step": 67435, "epoch": 557} {"train_loss": -36.08147048950195, "global_step": 67436, "epoch": 557} {"train_loss": -35.83271408081055, "global_step": 67437, "epoch": 557} {"train_loss": -35.419921875, "global_step": 67438, "epoch": 557} {"train_loss": -35.24317169189453, "global_step": 67439, "epoch": 557} {"train_loss": -36.208251953125, "global_step": 67440, "epoch": 557} {"train_loss": -35.84107971191406, "global_step": 67441, "epoch": 557} {"train_loss": -35.648468017578125, "global_step": 67442, "epoch": 557} {"train_loss": -35.865047454833984, "global_step": 67443, "epoch": 557} {"train_loss": -35.897579193115234, "global_step": 67444, "epoch": 557} {"train_loss": -35.96002960205078, "global_step": 67445, "epoch": 557} {"train_loss": -36.13728713989258, "global_step": 67446, "epoch": 557} {"train_loss": -35.959266662597656, "global_step": 67447, "epoch": 557} {"train_loss": -35.62977600097656, "global_step": 67448, "epoch": 557} {"train_loss": -35.99508285522461, "global_step": 67449, "epoch": 557} {"train_loss": -36.551551818847656, "global_step": 67450, "epoch": 557} {"train_loss": -35.890987396240234, "global_step": 67451, "epoch": 557} {"train_loss": -36.47731399536133, "global_step": 67452, "epoch": 557} {"train_loss": -36.598628997802734, "global_step": 67453, "epoch": 557} {"train_loss": -36.169918060302734, "global_step": 67454, "epoch": 557} {"train_loss": -36.49723815917969, "global_step": 67455, "epoch": 557} {"train_loss": -36.650970458984375, "global_step": 67456, "epoch": 557} {"train_loss": -36.86897659301758, "global_step": 67457, "epoch": 557} {"train_loss": -36.44869613647461, "global_step": 67458, "epoch": 557} {"train_loss": -36.659019470214844, "global_step": 67459, "epoch": 557} {"train_loss": -36.733394622802734, "global_step": 67460, "epoch": 557} {"train_loss": -35.96799087524414, "global_step": 67461, "epoch": 557} {"train_loss": -36.91176986694336, "global_step": 67462, "epoch": 557} {"train_loss": -36.6276741027832, "global_step": 67463, "epoch": 557} {"train_loss": -36.688167572021484, "global_step": 67464, "epoch": 557} {"train_loss": -36.6978759765625, "global_step": 67465, "epoch": 557} {"train_loss": -37.03515625, "global_step": 67466, "epoch": 557} {"train_loss": -37.15450668334961, "global_step": 67467, "epoch": 557} {"train_loss": -37.395660400390625, "global_step": 67468, "epoch": 557} {"train_loss": -36.90714645385742, "global_step": 67469, "epoch": 557} {"train_loss": -36.18935775756836, "global_step": 67470, "epoch": 557} {"train_loss": -35.79871368408203, "global_step": 67471, "epoch": 557} {"train_loss": -35.495635986328125, "global_step": 67472, "epoch": 557} {"train_loss": -34.89619064331055, "global_step": 67473, "epoch": 557} {"train_loss": -34.72739791870117, "global_step": 67474, "epoch": 557} {"train_loss": -36.0875358581543, "global_step": 67475, "epoch": 557} {"train_loss": -36.93606948852539, "global_step": 67476, "epoch": 557} {"train_loss": -36.624061584472656, "global_step": 67477, "epoch": 557} {"train_loss": -36.367530822753906, "global_step": 67478, "epoch": 557} {"train_loss": -36.670921325683594, "global_step": 67479, "epoch": 557} {"train_loss": -37.037715911865234, "global_step": 67480, "epoch": 557} {"train_loss": -36.64023971557617, "global_step": 67481, "epoch": 557} {"train_loss": -35.94914627075195, "global_step": 67482, "epoch": 557} {"train_loss": -35.7561149597168, "global_step": 67483, "epoch": 557} {"train_loss": -35.815608978271484, "global_step": 67484, "epoch": 557} {"train_loss": -37.05146026611328, "global_step": 67485, "epoch": 557} {"train_loss": -37.20085144042969, "global_step": 67486, "epoch": 557} {"train_loss": -36.183876037597656, "global_step": 67487, "epoch": 557} {"train_loss": -37.28987503051758, "global_step": 67488, "epoch": 557} {"train_loss": -37.03106689453125, "global_step": 67489, "epoch": 557} {"train_loss": -37.4542236328125, "global_step": 67490, "epoch": 557} {"train_loss": -37.2262077331543, "global_step": 67491, "epoch": 557} {"train_loss": -37.74387741088867, "global_step": 67492, "epoch": 557} {"train_loss": -37.57726287841797, "global_step": 67493, "epoch": 557} {"train_loss": -37.4569206237793, "global_step": 67494, "epoch": 557} {"train_loss": -37.64809036254883, "global_step": 67495, "epoch": 557} {"train_loss": -36.93707275390625, "global_step": 67496, "epoch": 557} {"train_loss": -36.67237091064453, "global_step": 67497, "epoch": 557} {"train_loss": -35.86255645751953, "global_step": 67498, "epoch": 557} {"train_loss": -37.197383880615234, "global_step": 67499, "epoch": 557} {"train_loss": -37.310359954833984, "global_step": 67500, "epoch": 557} {"train_loss": -36.63160705566406, "global_step": 67501, "epoch": 557} {"train_loss": -36.97529983520508, "global_step": 67502, "epoch": 557} {"train_loss": -37.646209716796875, "global_step": 67503, "epoch": 557} {"train_loss": -36.67733383178711, "global_step": 67504, "epoch": 557} {"train_loss": -37.337196350097656, "global_step": 67505, "epoch": 557} {"train_loss": -37.35703659057617, "global_step": 67506, "epoch": 557} {"train_loss": -36.650291442871094, "global_step": 67507, "epoch": 557} {"train_loss": -36.193115234375, "global_step": 67508, "epoch": 557} {"train_loss": -37.06892013549805, "global_step": 67509, "epoch": 557} {"train_loss": -37.26970291137695, "global_step": 67510, "epoch": 557} {"train_loss": -36.445579528808594, "global_step": 67511, "epoch": 557} {"train_loss": -35.75661087036133, "global_step": 67512, "epoch": 557} {"train_loss": -34.07261657714844, "global_step": 67513, "epoch": 557} {"train_loss": -33.98626708984375, "global_step": 67514, "epoch": 557} {"train_loss": -33.39107131958008, "global_step": 67515, "epoch": 557} {"train_loss": -35.503448486328125, "global_step": 67516, "epoch": 557} {"train_loss": -35.8301779691838, "global_step": 67517, "epoch": 557, "val_loss": 2551020.75} {"train_loss": -37.31889343261719, "global_step": 67518, "epoch": 558} {"train_loss": -37.642147064208984, "global_step": 67519, "epoch": 558} {"train_loss": -37.594905853271484, "global_step": 67520, "epoch": 558} {"train_loss": -37.36491012573242, "global_step": 67521, "epoch": 558} {"train_loss": -37.05323028564453, "global_step": 67522, "epoch": 558} {"train_loss": -37.713287353515625, "global_step": 67523, "epoch": 558} {"train_loss": -37.13892364501953, "global_step": 67524, "epoch": 558} {"train_loss": -37.097286224365234, "global_step": 67525, "epoch": 558} {"train_loss": -36.98265838623047, "global_step": 67526, "epoch": 558} {"train_loss": -37.43134307861328, "global_step": 67527, "epoch": 558} {"train_loss": -36.684425354003906, "global_step": 67528, "epoch": 558} {"train_loss": -37.492469787597656, "global_step": 67529, "epoch": 558} {"train_loss": -36.936100006103516, "global_step": 67530, "epoch": 558} {"train_loss": -36.5003776550293, "global_step": 67531, "epoch": 558} {"train_loss": -35.99189376831055, "global_step": 67532, "epoch": 558} {"train_loss": -35.25006103515625, "global_step": 67533, "epoch": 558} {"train_loss": -34.961238861083984, "global_step": 67534, "epoch": 558} {"train_loss": -33.42955780029297, "global_step": 67535, "epoch": 558} {"train_loss": -33.11758041381836, "global_step": 67536, "epoch": 558} {"train_loss": -30.8028507232666, "global_step": 67537, "epoch": 558} {"train_loss": -31.937482833862305, "global_step": 67538, "epoch": 558} {"train_loss": -35.48717498779297, "global_step": 67539, "epoch": 558} {"train_loss": -30.030780792236328, "global_step": 67540, "epoch": 558} {"train_loss": -33.301753997802734, "global_step": 67541, "epoch": 558} {"train_loss": -35.85913848876953, "global_step": 67542, "epoch": 558} {"train_loss": -34.19234085083008, "global_step": 67543, "epoch": 558} {"train_loss": -35.16495132446289, "global_step": 67544, "epoch": 558} {"train_loss": -34.80833435058594, "global_step": 67545, "epoch": 558} {"train_loss": -36.657066345214844, "global_step": 67546, "epoch": 558} {"train_loss": -35.65068435668945, "global_step": 67547, "epoch": 558} {"train_loss": -34.391658782958984, "global_step": 67548, "epoch": 558} {"train_loss": -35.88990020751953, "global_step": 67549, "epoch": 558} {"train_loss": -35.34589767456055, "global_step": 67550, "epoch": 558} {"train_loss": -35.81679916381836, "global_step": 67551, "epoch": 558} {"train_loss": -36.29166793823242, "global_step": 67552, "epoch": 558} {"train_loss": -35.953975677490234, "global_step": 67553, "epoch": 558} {"train_loss": -35.349884033203125, "global_step": 67554, "epoch": 558} {"train_loss": -35.934234619140625, "global_step": 67555, "epoch": 558} {"train_loss": -35.55458450317383, "global_step": 67556, "epoch": 558} {"train_loss": -36.11256408691406, "global_step": 67557, "epoch": 558} {"train_loss": -36.54667663574219, "global_step": 67558, "epoch": 558} {"train_loss": -35.689720153808594, "global_step": 67559, "epoch": 558} {"train_loss": -36.032508850097656, "global_step": 67560, "epoch": 558} {"train_loss": -36.661231994628906, "global_step": 67561, "epoch": 558} {"train_loss": -36.22755432128906, "global_step": 67562, "epoch": 558} {"train_loss": -36.743621826171875, "global_step": 67563, "epoch": 558} {"train_loss": -36.7510986328125, "global_step": 67564, "epoch": 558} {"train_loss": -36.48910140991211, "global_step": 67565, "epoch": 558} {"train_loss": -36.35921096801758, "global_step": 67566, "epoch": 558} {"train_loss": -36.100379943847656, "global_step": 67567, "epoch": 558} {"train_loss": -36.72828674316406, "global_step": 67568, "epoch": 558} {"train_loss": -34.42771530151367, "global_step": 67569, "epoch": 558} {"train_loss": -36.65167999267578, "global_step": 67570, "epoch": 558} {"train_loss": -36.42006301879883, "global_step": 67571, "epoch": 558} {"train_loss": -35.73611068725586, "global_step": 67572, "epoch": 558} {"train_loss": -34.96863555908203, "global_step": 67573, "epoch": 558} {"train_loss": -36.82061767578125, "global_step": 67574, "epoch": 558} {"train_loss": -36.53644943237305, "global_step": 67575, "epoch": 558} {"train_loss": -35.492225646972656, "global_step": 67576, "epoch": 558} {"train_loss": -36.70737838745117, "global_step": 67577, "epoch": 558} {"train_loss": -36.14181137084961, "global_step": 67578, "epoch": 558} {"train_loss": -36.86448287963867, "global_step": 67579, "epoch": 558} {"train_loss": -36.655704498291016, "global_step": 67580, "epoch": 558} {"train_loss": -36.493167877197266, "global_step": 67581, "epoch": 558} {"train_loss": -36.62915802001953, "global_step": 67582, "epoch": 558} {"train_loss": -36.12001419067383, "global_step": 67583, "epoch": 558} {"train_loss": -36.12770462036133, "global_step": 67584, "epoch": 558} {"train_loss": -37.169185638427734, "global_step": 67585, "epoch": 558} {"train_loss": -36.67597961425781, "global_step": 67586, "epoch": 558} {"train_loss": -36.70579528808594, "global_step": 67587, "epoch": 558} {"train_loss": -36.798561096191406, "global_step": 67588, "epoch": 558} {"train_loss": -36.861785888671875, "global_step": 67589, "epoch": 558} {"train_loss": -36.91752243041992, "global_step": 67590, "epoch": 558} {"train_loss": -36.05281448364258, "global_step": 67591, "epoch": 558} {"train_loss": -37.353759765625, "global_step": 67592, "epoch": 558} {"train_loss": -35.622459411621094, "global_step": 67593, "epoch": 558} {"train_loss": -35.8076171875, "global_step": 67594, "epoch": 558} {"train_loss": -36.38792037963867, "global_step": 67595, "epoch": 558} {"train_loss": -35.80091094970703, "global_step": 67596, "epoch": 558} {"train_loss": -37.07611083984375, "global_step": 67597, "epoch": 558} {"train_loss": -36.505104064941406, "global_step": 67598, "epoch": 558} {"train_loss": -36.87841796875, "global_step": 67599, "epoch": 558} {"train_loss": -37.082271575927734, "global_step": 67600, "epoch": 558} {"train_loss": -36.36865234375, "global_step": 67601, "epoch": 558} {"train_loss": -36.402400970458984, "global_step": 67602, "epoch": 558} {"train_loss": -37.2467155456543, "global_step": 67603, "epoch": 558} {"train_loss": -37.09616470336914, "global_step": 67604, "epoch": 558} {"train_loss": -37.17483139038086, "global_step": 67605, "epoch": 558} {"train_loss": -36.470603942871094, "global_step": 67606, "epoch": 558} {"train_loss": -37.289390563964844, "global_step": 67607, "epoch": 558} {"train_loss": -37.33576583862305, "global_step": 67608, "epoch": 558} {"train_loss": -37.11177444458008, "global_step": 67609, "epoch": 558} {"train_loss": -36.1306037902832, "global_step": 67610, "epoch": 558} {"train_loss": -36.81755065917969, "global_step": 67611, "epoch": 558} {"train_loss": -37.519615173339844, "global_step": 67612, "epoch": 558} {"train_loss": -37.2321891784668, "global_step": 67613, "epoch": 558} {"train_loss": -37.275203704833984, "global_step": 67614, "epoch": 558} {"train_loss": -37.691707611083984, "global_step": 67615, "epoch": 558} {"train_loss": -36.902130126953125, "global_step": 67616, "epoch": 558} {"train_loss": -37.00089645385742, "global_step": 67617, "epoch": 558} {"train_loss": -36.90614700317383, "global_step": 67618, "epoch": 558} {"train_loss": -36.96044921875, "global_step": 67619, "epoch": 558} {"train_loss": -36.0649299621582, "global_step": 67620, "epoch": 558} {"train_loss": -36.7904052734375, "global_step": 67621, "epoch": 558} {"train_loss": -36.606685638427734, "global_step": 67622, "epoch": 558} {"train_loss": -37.5343132019043, "global_step": 67623, "epoch": 558} {"train_loss": -37.543087005615234, "global_step": 67624, "epoch": 558} {"train_loss": -37.28938674926758, "global_step": 67625, "epoch": 558} {"train_loss": -37.175148010253906, "global_step": 67626, "epoch": 558} {"train_loss": -37.13391876220703, "global_step": 67627, "epoch": 558} {"train_loss": -37.111568450927734, "global_step": 67628, "epoch": 558} {"train_loss": -37.19087600708008, "global_step": 67629, "epoch": 558} {"train_loss": -37.300933837890625, "global_step": 67630, "epoch": 558} {"train_loss": -35.99356460571289, "global_step": 67631, "epoch": 558} {"train_loss": -36.07503890991211, "global_step": 67632, "epoch": 558} {"train_loss": -35.8052978515625, "global_step": 67633, "epoch": 558} {"train_loss": -34.1186408996582, "global_step": 67634, "epoch": 558} {"train_loss": -26.842695236206055, "global_step": 67635, "epoch": 558} {"train_loss": -10.453554153442383, "global_step": 67636, "epoch": 558} {"train_loss": -7.626237392425537, "global_step": 67637, "epoch": 558} {"train_loss": -35.665540785828895, "global_step": 67638, "epoch": 558, "val_loss": 2533292.75} {"train_loss": -30.51910400390625, "global_step": 67639, "epoch": 559} {"train_loss": -28.50310707092285, "global_step": 67640, "epoch": 559} {"train_loss": -32.27999496459961, "global_step": 67641, "epoch": 559} {"train_loss": -30.996505737304688, "global_step": 67642, "epoch": 559} {"train_loss": -33.15532684326172, "global_step": 67643, "epoch": 559} {"train_loss": -32.71760177612305, "global_step": 67644, "epoch": 559} {"train_loss": -33.18636703491211, "global_step": 67645, "epoch": 559} {"train_loss": -34.44536209106445, "global_step": 67646, "epoch": 559} {"train_loss": -33.88896179199219, "global_step": 67647, "epoch": 559} {"train_loss": -33.73029708862305, "global_step": 67648, "epoch": 559} {"train_loss": -34.8814582824707, "global_step": 67649, "epoch": 559} {"train_loss": -33.36542510986328, "global_step": 67650, "epoch": 559} {"train_loss": -32.620399475097656, "global_step": 67651, "epoch": 559} {"train_loss": -35.59224319458008, "global_step": 67652, "epoch": 559} {"train_loss": -33.08614730834961, "global_step": 67653, "epoch": 559} {"train_loss": -32.88532638549805, "global_step": 67654, "epoch": 559} {"train_loss": -34.48336410522461, "global_step": 67655, "epoch": 559} {"train_loss": -35.53388214111328, "global_step": 67656, "epoch": 559} {"train_loss": -33.36402130126953, "global_step": 67657, "epoch": 559} {"train_loss": -34.707435607910156, "global_step": 67658, "epoch": 559} {"train_loss": -35.23418045043945, "global_step": 67659, "epoch": 559} {"train_loss": -33.917781829833984, "global_step": 67660, "epoch": 559} {"train_loss": -35.09450149536133, "global_step": 67661, "epoch": 559} {"train_loss": -34.25978469848633, "global_step": 67662, "epoch": 559} {"train_loss": -35.82497787475586, "global_step": 67663, "epoch": 559} {"train_loss": -35.45566177368164, "global_step": 67664, "epoch": 559} {"train_loss": -35.052730560302734, "global_step": 67665, "epoch": 559} {"train_loss": -35.09608840942383, "global_step": 67666, "epoch": 559} {"train_loss": -34.87358474731445, "global_step": 67667, "epoch": 559} {"train_loss": -34.490692138671875, "global_step": 67668, "epoch": 559} {"train_loss": -35.58723068237305, "global_step": 67669, "epoch": 559} {"train_loss": -35.367469787597656, "global_step": 67670, "epoch": 559} {"train_loss": -35.19846725463867, "global_step": 67671, "epoch": 559} {"train_loss": -35.234004974365234, "global_step": 67672, "epoch": 559} {"train_loss": -34.60529327392578, "global_step": 67673, "epoch": 559} {"train_loss": -35.36208724975586, "global_step": 67674, "epoch": 559} {"train_loss": -35.12067794799805, "global_step": 67675, "epoch": 559} {"train_loss": -35.34291076660156, "global_step": 67676, "epoch": 559} {"train_loss": -35.53205490112305, "global_step": 67677, "epoch": 559} {"train_loss": -35.433685302734375, "global_step": 67678, "epoch": 559} {"train_loss": -35.02976989746094, "global_step": 67679, "epoch": 559} {"train_loss": -34.558074951171875, "global_step": 67680, "epoch": 559} {"train_loss": -35.852272033691406, "global_step": 67681, "epoch": 559} {"train_loss": -34.76279830932617, "global_step": 67682, "epoch": 559} {"train_loss": -35.36611557006836, "global_step": 67683, "epoch": 559} {"train_loss": -35.75297927856445, "global_step": 67684, "epoch": 559} {"train_loss": -35.250457763671875, "global_step": 67685, "epoch": 559} {"train_loss": -36.091705322265625, "global_step": 67686, "epoch": 559} {"train_loss": -35.91487503051758, "global_step": 67687, "epoch": 559} {"train_loss": -35.71321105957031, "global_step": 67688, "epoch": 559} {"train_loss": -35.603511810302734, "global_step": 67689, "epoch": 559} {"train_loss": -36.372188568115234, "global_step": 67690, "epoch": 559} {"train_loss": -36.075653076171875, "global_step": 67691, "epoch": 559} {"train_loss": -36.43376922607422, "global_step": 67692, "epoch": 559} {"train_loss": -35.2227668762207, "global_step": 67693, "epoch": 559} {"train_loss": -34.602657318115234, "global_step": 67694, "epoch": 559} {"train_loss": -35.16102981567383, "global_step": 67695, "epoch": 559} {"train_loss": -36.34526062011719, "global_step": 67696, "epoch": 559} {"train_loss": -35.74835205078125, "global_step": 67697, "epoch": 559} {"train_loss": -35.40475082397461, "global_step": 67698, "epoch": 559} {"train_loss": -35.82358932495117, "global_step": 67699, "epoch": 559} {"train_loss": -35.8032341003418, "global_step": 67700, "epoch": 559} {"train_loss": -35.37892150878906, "global_step": 67701, "epoch": 559} {"train_loss": -35.557579040527344, "global_step": 67702, "epoch": 559} {"train_loss": -35.08321762084961, "global_step": 67703, "epoch": 559} {"train_loss": -35.11986541748047, "global_step": 67704, "epoch": 559} {"train_loss": -35.66749572753906, "global_step": 67705, "epoch": 559} {"train_loss": -36.2197380065918, "global_step": 67706, "epoch": 559} {"train_loss": -36.39418029785156, "global_step": 67707, "epoch": 559} {"train_loss": -35.6903190612793, "global_step": 67708, "epoch": 559} {"train_loss": -35.52773666381836, "global_step": 67709, "epoch": 559} {"train_loss": -35.949459075927734, "global_step": 67710, "epoch": 559} {"train_loss": -36.24797439575195, "global_step": 67711, "epoch": 559} {"train_loss": -36.42280197143555, "global_step": 67712, "epoch": 559} {"train_loss": -35.80963897705078, "global_step": 67713, "epoch": 559} {"train_loss": -36.111572265625, "global_step": 67714, "epoch": 559} {"train_loss": -35.853851318359375, "global_step": 67715, "epoch": 559} {"train_loss": -36.2243537902832, "global_step": 67716, "epoch": 559} {"train_loss": -35.28291702270508, "global_step": 67717, "epoch": 559} {"train_loss": -36.610530853271484, "global_step": 67718, "epoch": 559} {"train_loss": -36.391929626464844, "global_step": 67719, "epoch": 559} {"train_loss": -35.50614547729492, "global_step": 67720, "epoch": 559} {"train_loss": -34.77315902709961, "global_step": 67721, "epoch": 559} {"train_loss": -34.81801986694336, "global_step": 67722, "epoch": 559} {"train_loss": -36.59425735473633, "global_step": 67723, "epoch": 559} {"train_loss": -34.651424407958984, "global_step": 67724, "epoch": 559} {"train_loss": -31.784448623657227, "global_step": 67725, "epoch": 559} {"train_loss": -31.35793113708496, "global_step": 67726, "epoch": 559} {"train_loss": -33.505184173583984, "global_step": 67727, "epoch": 559} {"train_loss": -36.15541458129883, "global_step": 67728, "epoch": 559} {"train_loss": -35.32407760620117, "global_step": 67729, "epoch": 559} {"train_loss": -35.42374801635742, "global_step": 67730, "epoch": 559} {"train_loss": -36.1953239440918, "global_step": 67731, "epoch": 559} {"train_loss": -36.47684860229492, "global_step": 67732, "epoch": 559} {"train_loss": -35.48444366455078, "global_step": 67733, "epoch": 559} {"train_loss": -36.57784652709961, "global_step": 67734, "epoch": 559} {"train_loss": -36.218868255615234, "global_step": 67735, "epoch": 559} {"train_loss": -36.66621780395508, "global_step": 67736, "epoch": 559} {"train_loss": -36.77926254272461, "global_step": 67737, "epoch": 559} {"train_loss": -36.58475875854492, "global_step": 67738, "epoch": 559} {"train_loss": -36.39640808105469, "global_step": 67739, "epoch": 559} {"train_loss": -36.391536712646484, "global_step": 67740, "epoch": 559} {"train_loss": -36.47202682495117, "global_step": 67741, "epoch": 559} {"train_loss": -36.26996994018555, "global_step": 67742, "epoch": 559} {"train_loss": -36.50175476074219, "global_step": 67743, "epoch": 559} {"train_loss": -36.24102020263672, "global_step": 67744, "epoch": 559} {"train_loss": -36.36417007446289, "global_step": 67745, "epoch": 559} {"train_loss": -35.906776428222656, "global_step": 67746, "epoch": 559} {"train_loss": -36.41792297363281, "global_step": 67747, "epoch": 559} {"train_loss": -35.76782989501953, "global_step": 67748, "epoch": 559} {"train_loss": -34.288631439208984, "global_step": 67749, "epoch": 559} {"train_loss": -35.26353073120117, "global_step": 67750, "epoch": 559} {"train_loss": -36.18086624145508, "global_step": 67751, "epoch": 559} {"train_loss": -35.45595169067383, "global_step": 67752, "epoch": 559} {"train_loss": -35.52463150024414, "global_step": 67753, "epoch": 559} {"train_loss": -36.10853576660156, "global_step": 67754, "epoch": 559} {"train_loss": -36.14118576049805, "global_step": 67755, "epoch": 559} {"train_loss": -36.19292449951172, "global_step": 67756, "epoch": 559} {"train_loss": -36.1132926940918, "global_step": 67757, "epoch": 559} {"train_loss": -36.7475471496582, "global_step": 67758, "epoch": 559} {"train_loss": -35.19073194708706, "global_step": 67759, "epoch": 559, "val_loss": 2616044.0} {"train_loss": -35.559425354003906, "global_step": 67760, "epoch": 560} {"train_loss": -35.33091354370117, "global_step": 67761, "epoch": 560} {"train_loss": -35.03439712524414, "global_step": 67762, "epoch": 560} {"train_loss": -34.24824905395508, "global_step": 67763, "epoch": 560} {"train_loss": -35.67390823364258, "global_step": 67764, "epoch": 560} {"train_loss": -36.545387268066406, "global_step": 67765, "epoch": 560} {"train_loss": -36.14754867553711, "global_step": 67766, "epoch": 560} {"train_loss": -35.927757263183594, "global_step": 67767, "epoch": 560} {"train_loss": -35.9056282043457, "global_step": 67768, "epoch": 560} {"train_loss": -35.864959716796875, "global_step": 67769, "epoch": 560} {"train_loss": -36.405147552490234, "global_step": 67770, "epoch": 560} {"train_loss": -34.7972412109375, "global_step": 67771, "epoch": 560} {"train_loss": -35.29096603393555, "global_step": 67772, "epoch": 560} {"train_loss": -36.134918212890625, "global_step": 67773, "epoch": 560} {"train_loss": -35.383888244628906, "global_step": 67774, "epoch": 560} {"train_loss": -35.40814208984375, "global_step": 67775, "epoch": 560} {"train_loss": -35.88033676147461, "global_step": 67776, "epoch": 560} {"train_loss": -35.25710678100586, "global_step": 67777, "epoch": 560} {"train_loss": -36.783782958984375, "global_step": 67778, "epoch": 560} {"train_loss": -35.33479309082031, "global_step": 67779, "epoch": 560} {"train_loss": -35.58913803100586, "global_step": 67780, "epoch": 560} {"train_loss": -36.33684539794922, "global_step": 67781, "epoch": 560} {"train_loss": -36.07936477661133, "global_step": 67782, "epoch": 560} {"train_loss": -35.374847412109375, "global_step": 67783, "epoch": 560} {"train_loss": -36.20310592651367, "global_step": 67784, "epoch": 560} {"train_loss": -36.62997055053711, "global_step": 67785, "epoch": 560} {"train_loss": -36.28645706176758, "global_step": 67786, "epoch": 560} {"train_loss": -36.52888107299805, "global_step": 67787, "epoch": 560} {"train_loss": -36.77928161621094, "global_step": 67788, "epoch": 560} {"train_loss": -36.53074645996094, "global_step": 67789, "epoch": 560} {"train_loss": -36.306007385253906, "global_step": 67790, "epoch": 560} {"train_loss": -36.24553298950195, "global_step": 67791, "epoch": 560} {"train_loss": -36.25156784057617, "global_step": 67792, "epoch": 560} {"train_loss": -37.06205368041992, "global_step": 67793, "epoch": 560} {"train_loss": -36.20319747924805, "global_step": 67794, "epoch": 560} {"train_loss": -36.961204528808594, "global_step": 67795, "epoch": 560} {"train_loss": -36.769527435302734, "global_step": 67796, "epoch": 560} {"train_loss": -35.44288635253906, "global_step": 67797, "epoch": 560} {"train_loss": -36.390560150146484, "global_step": 67798, "epoch": 560} {"train_loss": -36.4141960144043, "global_step": 67799, "epoch": 560} {"train_loss": -37.1324462890625, "global_step": 67800, "epoch": 560} {"train_loss": -36.83651351928711, "global_step": 67801, "epoch": 560} {"train_loss": -37.236873626708984, "global_step": 67802, "epoch": 560} {"train_loss": -36.237640380859375, "global_step": 67803, "epoch": 560} {"train_loss": -36.994140625, "global_step": 67804, "epoch": 560} {"train_loss": -37.26654052734375, "global_step": 67805, "epoch": 560} {"train_loss": -36.23057174682617, "global_step": 67806, "epoch": 560} {"train_loss": -36.610496520996094, "global_step": 67807, "epoch": 560} {"train_loss": -36.481353759765625, "global_step": 67808, "epoch": 560} {"train_loss": -36.3303108215332, "global_step": 67809, "epoch": 560} {"train_loss": -36.44849395751953, "global_step": 67810, "epoch": 560} {"train_loss": -35.95021438598633, "global_step": 67811, "epoch": 560} {"train_loss": -36.2280387878418, "global_step": 67812, "epoch": 560} {"train_loss": -35.276466369628906, "global_step": 67813, "epoch": 560} {"train_loss": -35.32887268066406, "global_step": 67814, "epoch": 560} {"train_loss": -36.66758346557617, "global_step": 67815, "epoch": 560} {"train_loss": -36.33048629760742, "global_step": 67816, "epoch": 560} {"train_loss": -36.45748519897461, "global_step": 67817, "epoch": 560} {"train_loss": -36.480567932128906, "global_step": 67818, "epoch": 560} {"train_loss": -36.82450485229492, "global_step": 67819, "epoch": 560} {"train_loss": -36.67506790161133, "global_step": 67820, "epoch": 560} {"train_loss": -35.94350814819336, "global_step": 67821, "epoch": 560} {"train_loss": -36.18748092651367, "global_step": 67822, "epoch": 560} {"train_loss": -35.01906204223633, "global_step": 67823, "epoch": 560} {"train_loss": -34.743812561035156, "global_step": 67824, "epoch": 560} {"train_loss": -35.739437103271484, "global_step": 67825, "epoch": 560} {"train_loss": -36.55333709716797, "global_step": 67826, "epoch": 560} {"train_loss": -34.72071838378906, "global_step": 67827, "epoch": 560} {"train_loss": -36.14079284667969, "global_step": 67828, "epoch": 560} {"train_loss": -36.69295883178711, "global_step": 67829, "epoch": 560} {"train_loss": -35.03324508666992, "global_step": 67830, "epoch": 560} {"train_loss": -35.061729431152344, "global_step": 67831, "epoch": 560} {"train_loss": -34.929466247558594, "global_step": 67832, "epoch": 560} {"train_loss": -35.221839904785156, "global_step": 67833, "epoch": 560} {"train_loss": -35.82979202270508, "global_step": 67834, "epoch": 560} {"train_loss": -33.800376892089844, "global_step": 67835, "epoch": 560} {"train_loss": -35.87665939331055, "global_step": 67836, "epoch": 560} {"train_loss": -35.94161605834961, "global_step": 67837, "epoch": 560} {"train_loss": -35.78367233276367, "global_step": 67838, "epoch": 560} {"train_loss": -36.32834243774414, "global_step": 67839, "epoch": 560} {"train_loss": -35.36750030517578, "global_step": 67840, "epoch": 560} {"train_loss": -35.56283187866211, "global_step": 67841, "epoch": 560} {"train_loss": -35.14716720581055, "global_step": 67842, "epoch": 560} {"train_loss": -32.975406646728516, "global_step": 67843, "epoch": 560} {"train_loss": -35.04102325439453, "global_step": 67844, "epoch": 560} {"train_loss": -34.35897445678711, "global_step": 67845, "epoch": 560} {"train_loss": -34.876502990722656, "global_step": 67846, "epoch": 560} {"train_loss": -30.49861717224121, "global_step": 67847, "epoch": 560} {"train_loss": -30.563390731811523, "global_step": 67848, "epoch": 560} {"train_loss": -33.499874114990234, "global_step": 67849, "epoch": 560} {"train_loss": -31.632070541381836, "global_step": 67850, "epoch": 560} {"train_loss": -35.02854537963867, "global_step": 67851, "epoch": 560} {"train_loss": -31.147130966186523, "global_step": 67852, "epoch": 560} {"train_loss": -33.623043060302734, "global_step": 67853, "epoch": 560} {"train_loss": -34.001556396484375, "global_step": 67854, "epoch": 560} {"train_loss": -34.9510498046875, "global_step": 67855, "epoch": 560} {"train_loss": -33.116188049316406, "global_step": 67856, "epoch": 560} {"train_loss": -35.292999267578125, "global_step": 67857, "epoch": 560} {"train_loss": -34.160091400146484, "global_step": 67858, "epoch": 560} {"train_loss": -35.39198684692383, "global_step": 67859, "epoch": 560} {"train_loss": -34.69977569580078, "global_step": 67860, "epoch": 560} {"train_loss": -35.885677337646484, "global_step": 67861, "epoch": 560} {"train_loss": -33.77613067626953, "global_step": 67862, "epoch": 560} {"train_loss": -35.460899353027344, "global_step": 67863, "epoch": 560} {"train_loss": -34.74441909790039, "global_step": 67864, "epoch": 560} {"train_loss": -35.5130729675293, "global_step": 67865, "epoch": 560} {"train_loss": -35.414405822753906, "global_step": 67866, "epoch": 560} {"train_loss": -35.73816680908203, "global_step": 67867, "epoch": 560} {"train_loss": -35.20856475830078, "global_step": 67868, "epoch": 560} {"train_loss": -35.646236419677734, "global_step": 67869, "epoch": 560} {"train_loss": -36.305233001708984, "global_step": 67870, "epoch": 560} {"train_loss": -35.5952033996582, "global_step": 67871, "epoch": 560} {"train_loss": -35.805580139160156, "global_step": 67872, "epoch": 560} {"train_loss": -36.351131439208984, "global_step": 67873, "epoch": 560} {"train_loss": -36.73465347290039, "global_step": 67874, "epoch": 560} {"train_loss": -35.858516693115234, "global_step": 67875, "epoch": 560} {"train_loss": -36.843994140625, "global_step": 67876, "epoch": 560} {"train_loss": -36.452003479003906, "global_step": 67877, "epoch": 560} {"train_loss": -34.76326370239258, "global_step": 67878, "epoch": 560} {"train_loss": -36.31284713745117, "global_step": 67879, "epoch": 560} {"train_loss": -35.59294733725304, "global_step": 67880, "epoch": 560, "val_loss": 2632148.25} {"train_loss": -36.295711517333984, "global_step": 67881, "epoch": 561} {"train_loss": -36.62397003173828, "global_step": 67882, "epoch": 561} {"train_loss": -36.38346862792969, "global_step": 67883, "epoch": 561} {"train_loss": -36.5034294128418, "global_step": 67884, "epoch": 561} {"train_loss": -35.854164123535156, "global_step": 67885, "epoch": 561} {"train_loss": -36.978981018066406, "global_step": 67886, "epoch": 561} {"train_loss": -36.584510803222656, "global_step": 67887, "epoch": 561} {"train_loss": -36.26778030395508, "global_step": 67888, "epoch": 561} {"train_loss": -37.25407028198242, "global_step": 67889, "epoch": 561} {"train_loss": -37.06288528442383, "global_step": 67890, "epoch": 561} {"train_loss": -36.80317306518555, "global_step": 67891, "epoch": 561} {"train_loss": -37.215553283691406, "global_step": 67892, "epoch": 561} {"train_loss": -36.621490478515625, "global_step": 67893, "epoch": 561} {"train_loss": -36.24534225463867, "global_step": 67894, "epoch": 561} {"train_loss": -37.063785552978516, "global_step": 67895, "epoch": 561} {"train_loss": -37.10066604614258, "global_step": 67896, "epoch": 561} {"train_loss": -36.81039810180664, "global_step": 67897, "epoch": 561} {"train_loss": -36.787811279296875, "global_step": 67898, "epoch": 561} {"train_loss": -37.36997985839844, "global_step": 67899, "epoch": 561} {"train_loss": -37.53341293334961, "global_step": 67900, "epoch": 561} {"train_loss": -37.24305725097656, "global_step": 67901, "epoch": 561} {"train_loss": -36.820716857910156, "global_step": 67902, "epoch": 561} {"train_loss": -37.45359420776367, "global_step": 67903, "epoch": 561} {"train_loss": -37.247005462646484, "global_step": 67904, "epoch": 561} {"train_loss": -37.08415985107422, "global_step": 67905, "epoch": 561} {"train_loss": -36.639991760253906, "global_step": 67906, "epoch": 561} {"train_loss": -37.11554718017578, "global_step": 67907, "epoch": 561} {"train_loss": -37.380348205566406, "global_step": 67908, "epoch": 561} {"train_loss": -37.05256652832031, "global_step": 67909, "epoch": 561} {"train_loss": -36.475868225097656, "global_step": 67910, "epoch": 561} {"train_loss": -36.879390716552734, "global_step": 67911, "epoch": 561} {"train_loss": -35.875221252441406, "global_step": 67912, "epoch": 561} {"train_loss": -34.23249435424805, "global_step": 67913, "epoch": 561} {"train_loss": -30.402997970581055, "global_step": 67914, "epoch": 561} {"train_loss": -31.98914909362793, "global_step": 67915, "epoch": 561} {"train_loss": -36.44416427612305, "global_step": 67916, "epoch": 561} {"train_loss": -36.06568145751953, "global_step": 67917, "epoch": 561} {"train_loss": -32.104103088378906, "global_step": 67918, "epoch": 561} {"train_loss": -35.105796813964844, "global_step": 67919, "epoch": 561} {"train_loss": -35.494625091552734, "global_step": 67920, "epoch": 561} {"train_loss": -34.45687484741211, "global_step": 67921, "epoch": 561} {"train_loss": -36.93497848510742, "global_step": 67922, "epoch": 561} {"train_loss": -35.06875228881836, "global_step": 67923, "epoch": 561} {"train_loss": -34.6709098815918, "global_step": 67924, "epoch": 561} {"train_loss": -35.878963470458984, "global_step": 67925, "epoch": 561} {"train_loss": -34.6014289855957, "global_step": 67926, "epoch": 561} {"train_loss": -37.067386627197266, "global_step": 67927, "epoch": 561} {"train_loss": -32.455169677734375, "global_step": 67928, "epoch": 561} {"train_loss": -35.689937591552734, "global_step": 67929, "epoch": 561} {"train_loss": -34.131134033203125, "global_step": 67930, "epoch": 561} {"train_loss": -35.98862838745117, "global_step": 67931, "epoch": 561} {"train_loss": -34.49904251098633, "global_step": 67932, "epoch": 561} {"train_loss": -35.529083251953125, "global_step": 67933, "epoch": 561} {"train_loss": -35.23326873779297, "global_step": 67934, "epoch": 561} {"train_loss": -35.14890670776367, "global_step": 67935, "epoch": 561} {"train_loss": -34.12040328979492, "global_step": 67936, "epoch": 561} {"train_loss": -35.35482406616211, "global_step": 67937, "epoch": 561} {"train_loss": -33.86259841918945, "global_step": 67938, "epoch": 561} {"train_loss": -35.533660888671875, "global_step": 67939, "epoch": 561} {"train_loss": -35.96647644042969, "global_step": 67940, "epoch": 561} {"train_loss": -35.36444854736328, "global_step": 67941, "epoch": 561} {"train_loss": -34.02135467529297, "global_step": 67942, "epoch": 561} {"train_loss": -35.04010009765625, "global_step": 67943, "epoch": 561} {"train_loss": -35.96151351928711, "global_step": 67944, "epoch": 561} {"train_loss": -34.99247360229492, "global_step": 67945, "epoch": 561} {"train_loss": -33.99210739135742, "global_step": 67946, "epoch": 561} {"train_loss": -34.407989501953125, "global_step": 67947, "epoch": 561} {"train_loss": -34.74163055419922, "global_step": 67948, "epoch": 561} {"train_loss": -34.67045211791992, "global_step": 67949, "epoch": 561} {"train_loss": -33.59893798828125, "global_step": 67950, "epoch": 561} {"train_loss": -34.6478271484375, "global_step": 67951, "epoch": 561} {"train_loss": -34.31526184082031, "global_step": 67952, "epoch": 561} {"train_loss": -35.99557113647461, "global_step": 67953, "epoch": 561} {"train_loss": -35.13883590698242, "global_step": 67954, "epoch": 561} {"train_loss": -33.929168701171875, "global_step": 67955, "epoch": 561} {"train_loss": -34.33748245239258, "global_step": 67956, "epoch": 561} {"train_loss": -35.178627014160156, "global_step": 67957, "epoch": 561} {"train_loss": -36.042354583740234, "global_step": 67958, "epoch": 561} {"train_loss": -34.28763198852539, "global_step": 67959, "epoch": 561} {"train_loss": -34.571773529052734, "global_step": 67960, "epoch": 561} {"train_loss": -35.51044845581055, "global_step": 67961, "epoch": 561} {"train_loss": -34.15351486206055, "global_step": 67962, "epoch": 561} {"train_loss": -33.31766891479492, "global_step": 67963, "epoch": 561} {"train_loss": -35.28338623046875, "global_step": 67964, "epoch": 561} {"train_loss": -35.08824157714844, "global_step": 67965, "epoch": 561} {"train_loss": -33.524078369140625, "global_step": 67966, "epoch": 561} {"train_loss": -35.27720260620117, "global_step": 67967, "epoch": 561} {"train_loss": -35.347869873046875, "global_step": 67968, "epoch": 561} {"train_loss": -35.444454193115234, "global_step": 67969, "epoch": 561} {"train_loss": -35.47800827026367, "global_step": 67970, "epoch": 561} {"train_loss": -34.624820709228516, "global_step": 67971, "epoch": 561} {"train_loss": -35.520965576171875, "global_step": 67972, "epoch": 561} {"train_loss": -34.801082611083984, "global_step": 67973, "epoch": 561} {"train_loss": -36.65514373779297, "global_step": 67974, "epoch": 561} {"train_loss": -34.58273696899414, "global_step": 67975, "epoch": 561} {"train_loss": -36.4607048034668, "global_step": 67976, "epoch": 561} {"train_loss": -35.921138763427734, "global_step": 67977, "epoch": 561} {"train_loss": -35.990081787109375, "global_step": 67978, "epoch": 561} {"train_loss": -35.529170989990234, "global_step": 67979, "epoch": 561} {"train_loss": -36.52225875854492, "global_step": 67980, "epoch": 561} {"train_loss": -36.223236083984375, "global_step": 67981, "epoch": 561} {"train_loss": -35.8021354675293, "global_step": 67982, "epoch": 561} {"train_loss": -36.26446533203125, "global_step": 67983, "epoch": 561} {"train_loss": -36.39917755126953, "global_step": 67984, "epoch": 561} {"train_loss": -36.540340423583984, "global_step": 67985, "epoch": 561} {"train_loss": -36.546142578125, "global_step": 67986, "epoch": 561} {"train_loss": -36.66059494018555, "global_step": 67987, "epoch": 561} {"train_loss": -36.43072509765625, "global_step": 67988, "epoch": 561} {"train_loss": -36.82786178588867, "global_step": 67989, "epoch": 561} {"train_loss": -36.8800163269043, "global_step": 67990, "epoch": 561} {"train_loss": -36.419166564941406, "global_step": 67991, "epoch": 561} {"train_loss": -36.81142044067383, "global_step": 67992, "epoch": 561} {"train_loss": -36.785369873046875, "global_step": 67993, "epoch": 561} {"train_loss": -37.03450393676758, "global_step": 67994, "epoch": 561} {"train_loss": -37.10797882080078, "global_step": 67995, "epoch": 561} {"train_loss": -37.01654052734375, "global_step": 67996, "epoch": 561} {"train_loss": -36.92924880981445, "global_step": 67997, "epoch": 561} {"train_loss": -36.40240478515625, "global_step": 67998, "epoch": 561} {"train_loss": -37.49372482299805, "global_step": 67999, "epoch": 561} {"train_loss": -37.28508758544922, "global_step": 68000, "epoch": 561} {"train_loss": -35.736684941063245, "global_step": 68001, "epoch": 561, "val_loss": 2562956.75} {"train_loss": -37.3599853515625, "global_step": 68002, "epoch": 562} {"train_loss": -37.53114318847656, "global_step": 68003, "epoch": 562} {"train_loss": -37.63398361206055, "global_step": 68004, "epoch": 562} {"train_loss": -37.550689697265625, "global_step": 68005, "epoch": 562} {"train_loss": -37.36556625366211, "global_step": 68006, "epoch": 562} {"train_loss": -37.413631439208984, "global_step": 68007, "epoch": 562} {"train_loss": -37.93391036987305, "global_step": 68008, "epoch": 562} {"train_loss": -37.362770080566406, "global_step": 68009, "epoch": 562} {"train_loss": -37.333152770996094, "global_step": 68010, "epoch": 562} {"train_loss": -37.68489074707031, "global_step": 68011, "epoch": 562} {"train_loss": -37.6496467590332, "global_step": 68012, "epoch": 562} {"train_loss": -37.91053009033203, "global_step": 68013, "epoch": 562} {"train_loss": -37.72241973876953, "global_step": 68014, "epoch": 562} {"train_loss": -36.30961990356445, "global_step": 68015, "epoch": 562} {"train_loss": -37.664794921875, "global_step": 68016, "epoch": 562} {"train_loss": -37.03998947143555, "global_step": 68017, "epoch": 562} {"train_loss": -37.49567794799805, "global_step": 68018, "epoch": 562} {"train_loss": -37.69073486328125, "global_step": 68019, "epoch": 562} {"train_loss": -37.39958572387695, "global_step": 68020, "epoch": 562} {"train_loss": -37.566341400146484, "global_step": 68021, "epoch": 562} {"train_loss": -37.30312728881836, "global_step": 68022, "epoch": 562} {"train_loss": -36.7418098449707, "global_step": 68023, "epoch": 562} {"train_loss": -37.71796798706055, "global_step": 68024, "epoch": 562} {"train_loss": -36.8844108581543, "global_step": 68025, "epoch": 562} {"train_loss": -37.38140869140625, "global_step": 68026, "epoch": 562} {"train_loss": -37.60707473754883, "global_step": 68027, "epoch": 562} {"train_loss": -36.2103385925293, "global_step": 68028, "epoch": 562} {"train_loss": -36.84119415283203, "global_step": 68029, "epoch": 562} {"train_loss": -36.25162887573242, "global_step": 68030, "epoch": 562} {"train_loss": -35.90545654296875, "global_step": 68031, "epoch": 562} {"train_loss": -36.689735412597656, "global_step": 68032, "epoch": 562} {"train_loss": -37.60124588012695, "global_step": 68033, "epoch": 562} {"train_loss": -35.18925094604492, "global_step": 68034, "epoch": 562} {"train_loss": -34.675758361816406, "global_step": 68035, "epoch": 562} {"train_loss": -36.56299591064453, "global_step": 68036, "epoch": 562} {"train_loss": -36.74091720581055, "global_step": 68037, "epoch": 562} {"train_loss": -34.88998031616211, "global_step": 68038, "epoch": 562} {"train_loss": -35.9677619934082, "global_step": 68039, "epoch": 562} {"train_loss": -35.79169464111328, "global_step": 68040, "epoch": 562} {"train_loss": -34.83805465698242, "global_step": 68041, "epoch": 562} {"train_loss": -36.65443801879883, "global_step": 68042, "epoch": 562} {"train_loss": -36.29381561279297, "global_step": 68043, "epoch": 562} {"train_loss": -36.40692138671875, "global_step": 68044, "epoch": 562} {"train_loss": -35.231483459472656, "global_step": 68045, "epoch": 562} {"train_loss": -36.09587097167969, "global_step": 68046, "epoch": 562} {"train_loss": -35.12093734741211, "global_step": 68047, "epoch": 562} {"train_loss": -35.18511962890625, "global_step": 68048, "epoch": 562} {"train_loss": -34.96790313720703, "global_step": 68049, "epoch": 562} {"train_loss": -34.2005500793457, "global_step": 68050, "epoch": 562} {"train_loss": -34.45011520385742, "global_step": 68051, "epoch": 562} {"train_loss": -35.1517448425293, "global_step": 68052, "epoch": 562} {"train_loss": -36.00142288208008, "global_step": 68053, "epoch": 562} {"train_loss": -33.531105041503906, "global_step": 68054, "epoch": 562} {"train_loss": -36.1530876159668, "global_step": 68055, "epoch": 562} {"train_loss": -32.71162414550781, "global_step": 68056, "epoch": 562} {"train_loss": -36.328426361083984, "global_step": 68057, "epoch": 562} {"train_loss": -35.251220703125, "global_step": 68058, "epoch": 562} {"train_loss": -35.7763786315918, "global_step": 68059, "epoch": 562} {"train_loss": -35.84696578979492, "global_step": 68060, "epoch": 562} {"train_loss": -35.356510162353516, "global_step": 68061, "epoch": 562} {"train_loss": -36.34501647949219, "global_step": 68062, "epoch": 562} {"train_loss": -36.21492385864258, "global_step": 68063, "epoch": 562} {"train_loss": -36.257450103759766, "global_step": 68064, "epoch": 562} {"train_loss": -35.855438232421875, "global_step": 68065, "epoch": 562} {"train_loss": -36.375213623046875, "global_step": 68066, "epoch": 562} {"train_loss": -36.083675384521484, "global_step": 68067, "epoch": 562} {"train_loss": -36.3517951965332, "global_step": 68068, "epoch": 562} {"train_loss": -36.29059982299805, "global_step": 68069, "epoch": 562} {"train_loss": -36.2823600769043, "global_step": 68070, "epoch": 562} {"train_loss": -35.99258041381836, "global_step": 68071, "epoch": 562} {"train_loss": -36.840789794921875, "global_step": 68072, "epoch": 562} {"train_loss": -36.68300247192383, "global_step": 68073, "epoch": 562} {"train_loss": -36.78961181640625, "global_step": 68074, "epoch": 562} {"train_loss": -35.71831130981445, "global_step": 68075, "epoch": 562} {"train_loss": -36.60360336303711, "global_step": 68076, "epoch": 562} {"train_loss": -36.760467529296875, "global_step": 68077, "epoch": 562} {"train_loss": -36.48788070678711, "global_step": 68078, "epoch": 562} {"train_loss": -35.917503356933594, "global_step": 68079, "epoch": 562} {"train_loss": -36.40754318237305, "global_step": 68080, "epoch": 562} {"train_loss": -36.8094482421875, "global_step": 68081, "epoch": 562} {"train_loss": -36.859130859375, "global_step": 68082, "epoch": 562} {"train_loss": -36.65605926513672, "global_step": 68083, "epoch": 562} {"train_loss": -36.339229583740234, "global_step": 68084, "epoch": 562} {"train_loss": -35.80309295654297, "global_step": 68085, "epoch": 562} {"train_loss": -36.18918991088867, "global_step": 68086, "epoch": 562} {"train_loss": -36.871212005615234, "global_step": 68087, "epoch": 562} {"train_loss": -37.14484405517578, "global_step": 68088, "epoch": 562} {"train_loss": -36.924774169921875, "global_step": 68089, "epoch": 562} {"train_loss": -36.41497039794922, "global_step": 68090, "epoch": 562} {"train_loss": -36.26122283935547, "global_step": 68091, "epoch": 562} {"train_loss": -36.16816711425781, "global_step": 68092, "epoch": 562} {"train_loss": -35.442230224609375, "global_step": 68093, "epoch": 562} {"train_loss": -32.77845001220703, "global_step": 68094, "epoch": 562} {"train_loss": -28.661779403686523, "global_step": 68095, "epoch": 562} {"train_loss": -22.7592830657959, "global_step": 68096, "epoch": 562} {"train_loss": -25.6287784576416, "global_step": 68097, "epoch": 562} {"train_loss": -35.252784729003906, "global_step": 68098, "epoch": 562} {"train_loss": -35.17607879638672, "global_step": 68099, "epoch": 562} {"train_loss": -31.167510986328125, "global_step": 68100, "epoch": 562} {"train_loss": -36.25322723388672, "global_step": 68101, "epoch": 562} {"train_loss": -34.245914459228516, "global_step": 68102, "epoch": 562} {"train_loss": -34.67631149291992, "global_step": 68103, "epoch": 562} {"train_loss": -35.952022552490234, "global_step": 68104, "epoch": 562} {"train_loss": -34.51913833618164, "global_step": 68105, "epoch": 562} {"train_loss": -36.6059684753418, "global_step": 68106, "epoch": 562} {"train_loss": -34.31061935424805, "global_step": 68107, "epoch": 562} {"train_loss": -35.4296989440918, "global_step": 68108, "epoch": 562} {"train_loss": -35.819087982177734, "global_step": 68109, "epoch": 562} {"train_loss": -35.76975631713867, "global_step": 68110, "epoch": 562} {"train_loss": -36.70728302001953, "global_step": 68111, "epoch": 562} {"train_loss": -35.94932174682617, "global_step": 68112, "epoch": 562} {"train_loss": -36.32395553588867, "global_step": 68113, "epoch": 562} {"train_loss": -36.164608001708984, "global_step": 68114, "epoch": 562} {"train_loss": -37.366024017333984, "global_step": 68115, "epoch": 562} {"train_loss": -36.52958297729492, "global_step": 68116, "epoch": 562} {"train_loss": -36.53416061401367, "global_step": 68117, "epoch": 562} {"train_loss": -37.1767463684082, "global_step": 68118, "epoch": 562} {"train_loss": -36.472633361816406, "global_step": 68119, "epoch": 562} {"train_loss": -37.22220993041992, "global_step": 68120, "epoch": 562} {"train_loss": -36.78013229370117, "global_step": 68121, "epoch": 562} {"train_loss": -35.979087750773786, "global_step": 68122, "epoch": 562, "val_loss": 2537888.75} {"train_loss": -37.070003509521484, "global_step": 68123, "epoch": 563} {"train_loss": -36.52735900878906, "global_step": 68124, "epoch": 563} {"train_loss": -37.70988845825195, "global_step": 68125, "epoch": 563} {"train_loss": -37.265220642089844, "global_step": 68126, "epoch": 563} {"train_loss": -37.471588134765625, "global_step": 68127, "epoch": 563} {"train_loss": -37.370277404785156, "global_step": 68128, "epoch": 563} {"train_loss": -37.372982025146484, "global_step": 68129, "epoch": 563} {"train_loss": -37.05265808105469, "global_step": 68130, "epoch": 563} {"train_loss": -37.19240188598633, "global_step": 68131, "epoch": 563} {"train_loss": -37.78152084350586, "global_step": 68132, "epoch": 563} {"train_loss": -37.67371368408203, "global_step": 68133, "epoch": 563} {"train_loss": -37.717872619628906, "global_step": 68134, "epoch": 563} {"train_loss": -37.900489807128906, "global_step": 68135, "epoch": 563} {"train_loss": -37.833038330078125, "global_step": 68136, "epoch": 563} {"train_loss": -37.47892379760742, "global_step": 68137, "epoch": 563} {"train_loss": -37.68669509887695, "global_step": 68138, "epoch": 563} {"train_loss": -37.40085983276367, "global_step": 68139, "epoch": 563} {"train_loss": -36.67568588256836, "global_step": 68140, "epoch": 563} {"train_loss": -36.1239013671875, "global_step": 68141, "epoch": 563} {"train_loss": -36.36579513549805, "global_step": 68142, "epoch": 563} {"train_loss": -36.467342376708984, "global_step": 68143, "epoch": 563} {"train_loss": -37.426597595214844, "global_step": 68144, "epoch": 563} {"train_loss": -37.8594970703125, "global_step": 68145, "epoch": 563} {"train_loss": -36.82859420776367, "global_step": 68146, "epoch": 563} {"train_loss": -35.4171257019043, "global_step": 68147, "epoch": 563} {"train_loss": -36.27870559692383, "global_step": 68148, "epoch": 563} {"train_loss": -36.24897384643555, "global_step": 68149, "epoch": 563} {"train_loss": -36.07997131347656, "global_step": 68150, "epoch": 563} {"train_loss": -37.884193420410156, "global_step": 68151, "epoch": 563} {"train_loss": -35.79383087158203, "global_step": 68152, "epoch": 563} {"train_loss": -36.73876953125, "global_step": 68153, "epoch": 563} {"train_loss": -36.104618072509766, "global_step": 68154, "epoch": 563} {"train_loss": -36.5947265625, "global_step": 68155, "epoch": 563} {"train_loss": -36.942256927490234, "global_step": 68156, "epoch": 563} {"train_loss": -36.22744369506836, "global_step": 68157, "epoch": 563} {"train_loss": -33.23200225830078, "global_step": 68158, "epoch": 563} {"train_loss": -32.91328811645508, "global_step": 68159, "epoch": 563} {"train_loss": -33.83119201660156, "global_step": 68160, "epoch": 563} {"train_loss": -34.818904876708984, "global_step": 68161, "epoch": 563} {"train_loss": -33.9902458190918, "global_step": 68162, "epoch": 563} {"train_loss": -34.30418014526367, "global_step": 68163, "epoch": 563} {"train_loss": -33.73534393310547, "global_step": 68164, "epoch": 563} {"train_loss": -33.30282211303711, "global_step": 68165, "epoch": 563} {"train_loss": -32.13078689575195, "global_step": 68166, "epoch": 563} {"train_loss": -34.87685775756836, "global_step": 68167, "epoch": 563} {"train_loss": -34.653526306152344, "global_step": 68168, "epoch": 563} {"train_loss": -32.82453536987305, "global_step": 68169, "epoch": 563} {"train_loss": -33.025970458984375, "global_step": 68170, "epoch": 563} {"train_loss": -35.17035675048828, "global_step": 68171, "epoch": 563} {"train_loss": -32.790340423583984, "global_step": 68172, "epoch": 563} {"train_loss": -33.59207534790039, "global_step": 68173, "epoch": 563} {"train_loss": -35.37778854370117, "global_step": 68174, "epoch": 563} {"train_loss": -32.36091613769531, "global_step": 68175, "epoch": 563} {"train_loss": -34.9776725769043, "global_step": 68176, "epoch": 563} {"train_loss": -34.12789535522461, "global_step": 68177, "epoch": 563} {"train_loss": -34.076072692871094, "global_step": 68178, "epoch": 563} {"train_loss": -36.09294891357422, "global_step": 68179, "epoch": 563} {"train_loss": -34.415592193603516, "global_step": 68180, "epoch": 563} {"train_loss": -35.62307357788086, "global_step": 68181, "epoch": 563} {"train_loss": -34.657344818115234, "global_step": 68182, "epoch": 563} {"train_loss": -35.67552185058594, "global_step": 68183, "epoch": 563} {"train_loss": -35.7780876159668, "global_step": 68184, "epoch": 563} {"train_loss": -35.81770706176758, "global_step": 68185, "epoch": 563} {"train_loss": -35.959842681884766, "global_step": 68186, "epoch": 563} {"train_loss": -35.89266586303711, "global_step": 68187, "epoch": 563} {"train_loss": -36.448974609375, "global_step": 68188, "epoch": 563} {"train_loss": -35.99990463256836, "global_step": 68189, "epoch": 563} {"train_loss": -36.380531311035156, "global_step": 68190, "epoch": 563} {"train_loss": -35.71109390258789, "global_step": 68191, "epoch": 563} {"train_loss": -36.0013427734375, "global_step": 68192, "epoch": 563} {"train_loss": -36.57722854614258, "global_step": 68193, "epoch": 563} {"train_loss": -36.470211029052734, "global_step": 68194, "epoch": 563} {"train_loss": -36.563480377197266, "global_step": 68195, "epoch": 563} {"train_loss": -36.31869888305664, "global_step": 68196, "epoch": 563} {"train_loss": -36.661651611328125, "global_step": 68197, "epoch": 563} {"train_loss": -36.60358810424805, "global_step": 68198, "epoch": 563} {"train_loss": -36.74011993408203, "global_step": 68199, "epoch": 563} {"train_loss": -37.091129302978516, "global_step": 68200, "epoch": 563} {"train_loss": -36.80306625366211, "global_step": 68201, "epoch": 563} {"train_loss": -36.56875228881836, "global_step": 68202, "epoch": 563} {"train_loss": -35.7514762878418, "global_step": 68203, "epoch": 563} {"train_loss": -36.7030143737793, "global_step": 68204, "epoch": 563} {"train_loss": -37.06348419189453, "global_step": 68205, "epoch": 563} {"train_loss": -37.0386962890625, "global_step": 68206, "epoch": 563} {"train_loss": -37.2905387878418, "global_step": 68207, "epoch": 563} {"train_loss": -37.217037200927734, "global_step": 68208, "epoch": 563} {"train_loss": -37.29011917114258, "global_step": 68209, "epoch": 563} {"train_loss": -37.00639343261719, "global_step": 68210, "epoch": 563} {"train_loss": -36.972957611083984, "global_step": 68211, "epoch": 563} {"train_loss": -37.10688400268555, "global_step": 68212, "epoch": 563} {"train_loss": -36.99327087402344, "global_step": 68213, "epoch": 563} {"train_loss": -36.40053939819336, "global_step": 68214, "epoch": 563} {"train_loss": -37.261409759521484, "global_step": 68215, "epoch": 563} {"train_loss": -37.60129165649414, "global_step": 68216, "epoch": 563} {"train_loss": -37.19302749633789, "global_step": 68217, "epoch": 563} {"train_loss": -37.58070373535156, "global_step": 68218, "epoch": 563} {"train_loss": -37.50619125366211, "global_step": 68219, "epoch": 563} {"train_loss": -37.56513595581055, "global_step": 68220, "epoch": 563} {"train_loss": -36.78974533081055, "global_step": 68221, "epoch": 563} {"train_loss": -37.57973098754883, "global_step": 68222, "epoch": 563} {"train_loss": -37.082645416259766, "global_step": 68223, "epoch": 563} {"train_loss": -37.510231018066406, "global_step": 68224, "epoch": 563} {"train_loss": -36.904178619384766, "global_step": 68225, "epoch": 563} {"train_loss": -37.3465576171875, "global_step": 68226, "epoch": 563} {"train_loss": -37.63025665283203, "global_step": 68227, "epoch": 563} {"train_loss": -37.38208770751953, "global_step": 68228, "epoch": 563} {"train_loss": -37.65693664550781, "global_step": 68229, "epoch": 563} {"train_loss": -37.034297943115234, "global_step": 68230, "epoch": 563} {"train_loss": -37.087432861328125, "global_step": 68231, "epoch": 563} {"train_loss": -37.387020111083984, "global_step": 68232, "epoch": 563} {"train_loss": -37.486900329589844, "global_step": 68233, "epoch": 563} {"train_loss": -36.456172943115234, "global_step": 68234, "epoch": 563} {"train_loss": -37.99506759643555, "global_step": 68235, "epoch": 563} {"train_loss": -37.15240478515625, "global_step": 68236, "epoch": 563} {"train_loss": -37.065975189208984, "global_step": 68237, "epoch": 563} {"train_loss": -36.37750244140625, "global_step": 68238, "epoch": 563} {"train_loss": -37.57136917114258, "global_step": 68239, "epoch": 563} {"train_loss": -37.20541000366211, "global_step": 68240, "epoch": 563} {"train_loss": -37.1897087097168, "global_step": 68241, "epoch": 563} {"train_loss": -37.516868591308594, "global_step": 68242, "epoch": 563} {"train_loss": -36.33000192563396, "global_step": 68243, "epoch": 563, "val_loss": 2552176.25} {"train_loss": -37.71282958984375, "global_step": 68244, "epoch": 564} {"train_loss": -35.06047439575195, "global_step": 68245, "epoch": 564} {"train_loss": -37.08809280395508, "global_step": 68246, "epoch": 564} {"train_loss": -36.83376693725586, "global_step": 68247, "epoch": 564} {"train_loss": -37.08241271972656, "global_step": 68248, "epoch": 564} {"train_loss": -36.969234466552734, "global_step": 68249, "epoch": 564} {"train_loss": -36.047645568847656, "global_step": 68250, "epoch": 564} {"train_loss": -37.50840377807617, "global_step": 68251, "epoch": 564} {"train_loss": -36.73212814331055, "global_step": 68252, "epoch": 564} {"train_loss": -36.41823196411133, "global_step": 68253, "epoch": 564} {"train_loss": -35.139530181884766, "global_step": 68254, "epoch": 564} {"train_loss": -36.424072265625, "global_step": 68255, "epoch": 564} {"train_loss": -35.94863510131836, "global_step": 68256, "epoch": 564} {"train_loss": -36.40150451660156, "global_step": 68257, "epoch": 564} {"train_loss": -35.3979606628418, "global_step": 68258, "epoch": 564} {"train_loss": -35.382293701171875, "global_step": 68259, "epoch": 564} {"train_loss": -34.2747688293457, "global_step": 68260, "epoch": 564} {"train_loss": -37.26648712158203, "global_step": 68261, "epoch": 564} {"train_loss": -34.22040939331055, "global_step": 68262, "epoch": 564} {"train_loss": -34.51504135131836, "global_step": 68263, "epoch": 564} {"train_loss": -36.5323600769043, "global_step": 68264, "epoch": 564} {"train_loss": -34.85151672363281, "global_step": 68265, "epoch": 564} {"train_loss": -35.86910629272461, "global_step": 68266, "epoch": 564} {"train_loss": -35.01123809814453, "global_step": 68267, "epoch": 564} {"train_loss": -29.87226676940918, "global_step": 68268, "epoch": 564} {"train_loss": -35.3530158996582, "global_step": 68269, "epoch": 564} {"train_loss": -34.63544845581055, "global_step": 68270, "epoch": 564} {"train_loss": -32.24003982543945, "global_step": 68271, "epoch": 564} {"train_loss": -32.64330291748047, "global_step": 68272, "epoch": 564} {"train_loss": -27.789831161499023, "global_step": 68273, "epoch": 564} {"train_loss": -27.018543243408203, "global_step": 68274, "epoch": 564} {"train_loss": -32.78679275512695, "global_step": 68275, "epoch": 564} {"train_loss": -33.78794860839844, "global_step": 68276, "epoch": 564} {"train_loss": -24.484745025634766, "global_step": 68277, "epoch": 564} {"train_loss": -28.915109634399414, "global_step": 68278, "epoch": 564} {"train_loss": -34.37079620361328, "global_step": 68279, "epoch": 564} {"train_loss": -32.82743453979492, "global_step": 68280, "epoch": 564} {"train_loss": -34.69034957885742, "global_step": 68281, "epoch": 564} {"train_loss": -33.10907745361328, "global_step": 68282, "epoch": 564} {"train_loss": -32.837646484375, "global_step": 68283, "epoch": 564} {"train_loss": -34.12586975097656, "global_step": 68284, "epoch": 564} {"train_loss": -34.67982864379883, "global_step": 68285, "epoch": 564} {"train_loss": -34.40871047973633, "global_step": 68286, "epoch": 564} {"train_loss": -34.42911911010742, "global_step": 68287, "epoch": 564} {"train_loss": -36.02565383911133, "global_step": 68288, "epoch": 564} {"train_loss": -35.42905807495117, "global_step": 68289, "epoch": 564} {"train_loss": -34.95130920410156, "global_step": 68290, "epoch": 564} {"train_loss": -35.4940071105957, "global_step": 68291, "epoch": 564} {"train_loss": -35.124996185302734, "global_step": 68292, "epoch": 564} {"train_loss": -35.45536422729492, "global_step": 68293, "epoch": 564} {"train_loss": -35.1852912902832, "global_step": 68294, "epoch": 564} {"train_loss": -35.99984359741211, "global_step": 68295, "epoch": 564} {"train_loss": -35.60078048706055, "global_step": 68296, "epoch": 564} {"train_loss": -36.236915588378906, "global_step": 68297, "epoch": 564} {"train_loss": -35.848121643066406, "global_step": 68298, "epoch": 564} {"train_loss": -35.67546844482422, "global_step": 68299, "epoch": 564} {"train_loss": -36.16314697265625, "global_step": 68300, "epoch": 564} {"train_loss": -35.81584930419922, "global_step": 68301, "epoch": 564} {"train_loss": -36.12309646606445, "global_step": 68302, "epoch": 564} {"train_loss": -36.00349807739258, "global_step": 68303, "epoch": 564} {"train_loss": -36.39937973022461, "global_step": 68304, "epoch": 564} {"train_loss": -36.17110061645508, "global_step": 68305, "epoch": 564} {"train_loss": -36.4998893737793, "global_step": 68306, "epoch": 564} {"train_loss": -36.79634094238281, "global_step": 68307, "epoch": 564} {"train_loss": -35.9857292175293, "global_step": 68308, "epoch": 564} {"train_loss": -36.618324279785156, "global_step": 68309, "epoch": 564} {"train_loss": -36.422847747802734, "global_step": 68310, "epoch": 564} {"train_loss": -36.99455261230469, "global_step": 68311, "epoch": 564} {"train_loss": -36.878700256347656, "global_step": 68312, "epoch": 564} {"train_loss": -36.864234924316406, "global_step": 68313, "epoch": 564} {"train_loss": -36.726318359375, "global_step": 68314, "epoch": 564} {"train_loss": -36.77358627319336, "global_step": 68315, "epoch": 564} {"train_loss": -36.981292724609375, "global_step": 68316, "epoch": 564} {"train_loss": -36.663326263427734, "global_step": 68317, "epoch": 564} {"train_loss": -37.33099365234375, "global_step": 68318, "epoch": 564} {"train_loss": -37.22184371948242, "global_step": 68319, "epoch": 564} {"train_loss": -37.14198684692383, "global_step": 68320, "epoch": 564} {"train_loss": -36.76777267456055, "global_step": 68321, "epoch": 564} {"train_loss": -36.92687225341797, "global_step": 68322, "epoch": 564} {"train_loss": -36.93679428100586, "global_step": 68323, "epoch": 564} {"train_loss": -37.254940032958984, "global_step": 68324, "epoch": 564} {"train_loss": -37.27130889892578, "global_step": 68325, "epoch": 564} {"train_loss": -37.45733642578125, "global_step": 68326, "epoch": 564} {"train_loss": -37.77092361450195, "global_step": 68327, "epoch": 564} {"train_loss": -37.48019027709961, "global_step": 68328, "epoch": 564} {"train_loss": -37.7210807800293, "global_step": 68329, "epoch": 564} {"train_loss": -37.399742126464844, "global_step": 68330, "epoch": 564} {"train_loss": -37.668331146240234, "global_step": 68331, "epoch": 564} {"train_loss": -37.23308563232422, "global_step": 68332, "epoch": 564} {"train_loss": -37.341796875, "global_step": 68333, "epoch": 564} {"train_loss": -36.92716598510742, "global_step": 68334, "epoch": 564} {"train_loss": -37.55288314819336, "global_step": 68335, "epoch": 564} {"train_loss": -37.41733932495117, "global_step": 68336, "epoch": 564} {"train_loss": -37.00339889526367, "global_step": 68337, "epoch": 564} {"train_loss": -37.77779769897461, "global_step": 68338, "epoch": 564} {"train_loss": -37.22998809814453, "global_step": 68339, "epoch": 564} {"train_loss": -37.43832015991211, "global_step": 68340, "epoch": 564} {"train_loss": -37.81391143798828, "global_step": 68341, "epoch": 564} {"train_loss": -37.22786331176758, "global_step": 68342, "epoch": 564} {"train_loss": -37.35261917114258, "global_step": 68343, "epoch": 564} {"train_loss": -36.68052291870117, "global_step": 68344, "epoch": 564} {"train_loss": -36.793312072753906, "global_step": 68345, "epoch": 564} {"train_loss": -35.559295654296875, "global_step": 68346, "epoch": 564} {"train_loss": -35.3409309387207, "global_step": 68347, "epoch": 564} {"train_loss": -34.13581466674805, "global_step": 68348, "epoch": 564} {"train_loss": -33.5351676940918, "global_step": 68349, "epoch": 564} {"train_loss": -35.5030632019043, "global_step": 68350, "epoch": 564} {"train_loss": -37.3242073059082, "global_step": 68351, "epoch": 564} {"train_loss": -35.14265060424805, "global_step": 68352, "epoch": 564} {"train_loss": -34.397010803222656, "global_step": 68353, "epoch": 564} {"train_loss": -37.60361862182617, "global_step": 68354, "epoch": 564} {"train_loss": -36.24235916137695, "global_step": 68355, "epoch": 564} {"train_loss": -35.69016647338867, "global_step": 68356, "epoch": 564} {"train_loss": -36.67989730834961, "global_step": 68357, "epoch": 564} {"train_loss": -34.47382736206055, "global_step": 68358, "epoch": 564} {"train_loss": -33.65045928955078, "global_step": 68359, "epoch": 564} {"train_loss": -36.28289794921875, "global_step": 68360, "epoch": 564} {"train_loss": -36.31710433959961, "global_step": 68361, "epoch": 564} {"train_loss": -35.61251449584961, "global_step": 68362, "epoch": 564} {"train_loss": -35.430580139160156, "global_step": 68363, "epoch": 564} {"train_loss": -35.634830112299646, "global_step": 68364, "epoch": 564, "val_loss": 2589200.25} {"train_loss": -36.68452835083008, "global_step": 68365, "epoch": 565} {"train_loss": -35.33148956298828, "global_step": 68366, "epoch": 565} {"train_loss": -37.1971549987793, "global_step": 68367, "epoch": 565} {"train_loss": -35.72040939331055, "global_step": 68368, "epoch": 565} {"train_loss": -36.18872833251953, "global_step": 68369, "epoch": 565} {"train_loss": -36.16392135620117, "global_step": 68370, "epoch": 565} {"train_loss": -37.1090202331543, "global_step": 68371, "epoch": 565} {"train_loss": -35.61177062988281, "global_step": 68372, "epoch": 565} {"train_loss": -36.93833541870117, "global_step": 68373, "epoch": 565} {"train_loss": -35.487770080566406, "global_step": 68374, "epoch": 565} {"train_loss": -36.56942367553711, "global_step": 68375, "epoch": 565} {"train_loss": -36.865936279296875, "global_step": 68376, "epoch": 565} {"train_loss": -36.767486572265625, "global_step": 68377, "epoch": 565} {"train_loss": -36.78178024291992, "global_step": 68378, "epoch": 565} {"train_loss": -36.87543869018555, "global_step": 68379, "epoch": 565} {"train_loss": -36.95356369018555, "global_step": 68380, "epoch": 565} {"train_loss": -37.071285247802734, "global_step": 68381, "epoch": 565} {"train_loss": -37.45043182373047, "global_step": 68382, "epoch": 565} {"train_loss": -37.06038284301758, "global_step": 68383, "epoch": 565} {"train_loss": -37.084205627441406, "global_step": 68384, "epoch": 565} {"train_loss": -36.8619499206543, "global_step": 68385, "epoch": 565} {"train_loss": -37.06035614013672, "global_step": 68386, "epoch": 565} {"train_loss": -37.01898193359375, "global_step": 68387, "epoch": 565} {"train_loss": -37.7925910949707, "global_step": 68388, "epoch": 565} {"train_loss": -37.428321838378906, "global_step": 68389, "epoch": 565} {"train_loss": -37.38431167602539, "global_step": 68390, "epoch": 565} {"train_loss": -37.0871696472168, "global_step": 68391, "epoch": 565} {"train_loss": -37.2807731628418, "global_step": 68392, "epoch": 565} {"train_loss": -37.10993194580078, "global_step": 68393, "epoch": 565} {"train_loss": -35.63360595703125, "global_step": 68394, "epoch": 565} {"train_loss": -34.780948638916016, "global_step": 68395, "epoch": 565} {"train_loss": -34.418521881103516, "global_step": 68396, "epoch": 565} {"train_loss": -36.58293151855469, "global_step": 68397, "epoch": 565} {"train_loss": -37.54377365112305, "global_step": 68398, "epoch": 565} {"train_loss": -34.673126220703125, "global_step": 68399, "epoch": 565} {"train_loss": -31.0946102142334, "global_step": 68400, "epoch": 565} {"train_loss": -26.134092330932617, "global_step": 68401, "epoch": 565} {"train_loss": -31.733190536499023, "global_step": 68402, "epoch": 565} {"train_loss": -37.185699462890625, "global_step": 68403, "epoch": 565} {"train_loss": -36.1220703125, "global_step": 68404, "epoch": 565} {"train_loss": -35.05874252319336, "global_step": 68405, "epoch": 565} {"train_loss": -37.5349235534668, "global_step": 68406, "epoch": 565} {"train_loss": -35.62071228027344, "global_step": 68407, "epoch": 565} {"train_loss": -37.15077590942383, "global_step": 68408, "epoch": 565} {"train_loss": -35.42091369628906, "global_step": 68409, "epoch": 565} {"train_loss": -37.01462936401367, "global_step": 68410, "epoch": 565} {"train_loss": -36.34296798706055, "global_step": 68411, "epoch": 565} {"train_loss": -36.02769088745117, "global_step": 68412, "epoch": 565} {"train_loss": -36.190162658691406, "global_step": 68413, "epoch": 565} {"train_loss": -36.96631622314453, "global_step": 68414, "epoch": 565} {"train_loss": -36.49555587768555, "global_step": 68415, "epoch": 565} {"train_loss": -36.95443344116211, "global_step": 68416, "epoch": 565} {"train_loss": -36.33918380737305, "global_step": 68417, "epoch": 565} {"train_loss": -36.724971771240234, "global_step": 68418, "epoch": 565} {"train_loss": -35.33757019042969, "global_step": 68419, "epoch": 565} {"train_loss": -37.60590744018555, "global_step": 68420, "epoch": 565} {"train_loss": -36.41069412231445, "global_step": 68421, "epoch": 565} {"train_loss": -37.694610595703125, "global_step": 68422, "epoch": 565} {"train_loss": -36.59475326538086, "global_step": 68423, "epoch": 565} {"train_loss": -37.84990692138672, "global_step": 68424, "epoch": 565} {"train_loss": -36.55123519897461, "global_step": 68425, "epoch": 565} {"train_loss": -37.39347457885742, "global_step": 68426, "epoch": 565} {"train_loss": -37.26290512084961, "global_step": 68427, "epoch": 565} {"train_loss": -36.261619567871094, "global_step": 68428, "epoch": 565} {"train_loss": -37.7041130065918, "global_step": 68429, "epoch": 565} {"train_loss": -36.29282760620117, "global_step": 68430, "epoch": 565} {"train_loss": -37.62144088745117, "global_step": 68431, "epoch": 565} {"train_loss": -37.06766891479492, "global_step": 68432, "epoch": 565} {"train_loss": -37.5962028503418, "global_step": 68433, "epoch": 565} {"train_loss": -36.37696075439453, "global_step": 68434, "epoch": 565} {"train_loss": -38.024871826171875, "global_step": 68435, "epoch": 565} {"train_loss": -37.84623336791992, "global_step": 68436, "epoch": 565} {"train_loss": -37.215728759765625, "global_step": 68437, "epoch": 565} {"train_loss": -37.65153121948242, "global_step": 68438, "epoch": 565} {"train_loss": -37.43411636352539, "global_step": 68439, "epoch": 565} {"train_loss": -37.319488525390625, "global_step": 68440, "epoch": 565} {"train_loss": -37.60052490234375, "global_step": 68441, "epoch": 565} {"train_loss": -37.50254440307617, "global_step": 68442, "epoch": 565} {"train_loss": -37.782936096191406, "global_step": 68443, "epoch": 565} {"train_loss": -34.72355270385742, "global_step": 68444, "epoch": 565} {"train_loss": -37.103363037109375, "global_step": 68445, "epoch": 565} {"train_loss": -35.32809066772461, "global_step": 68446, "epoch": 565} {"train_loss": -36.791683197021484, "global_step": 68447, "epoch": 565} {"train_loss": -36.72730255126953, "global_step": 68448, "epoch": 565} {"train_loss": -36.34414291381836, "global_step": 68449, "epoch": 565} {"train_loss": -35.89870834350586, "global_step": 68450, "epoch": 565} {"train_loss": -37.170528411865234, "global_step": 68451, "epoch": 565} {"train_loss": -36.56645965576172, "global_step": 68452, "epoch": 565} {"train_loss": -36.57391357421875, "global_step": 68453, "epoch": 565} {"train_loss": -36.37472915649414, "global_step": 68454, "epoch": 565} {"train_loss": -35.18547439575195, "global_step": 68455, "epoch": 565} {"train_loss": -36.7025032043457, "global_step": 68456, "epoch": 565} {"train_loss": -36.69712829589844, "global_step": 68457, "epoch": 565} {"train_loss": -36.40458297729492, "global_step": 68458, "epoch": 565} {"train_loss": -36.7688102722168, "global_step": 68459, "epoch": 565} {"train_loss": -36.464717864990234, "global_step": 68460, "epoch": 565} {"train_loss": -36.69032287597656, "global_step": 68461, "epoch": 565} {"train_loss": -37.20903396606445, "global_step": 68462, "epoch": 565} {"train_loss": -32.97343063354492, "global_step": 68463, "epoch": 565} {"train_loss": -36.728397369384766, "global_step": 68464, "epoch": 565} {"train_loss": -36.993507385253906, "global_step": 68465, "epoch": 565} {"train_loss": -36.38869094848633, "global_step": 68466, "epoch": 565} {"train_loss": -36.97602462768555, "global_step": 68467, "epoch": 565} {"train_loss": -37.129451751708984, "global_step": 68468, "epoch": 565} {"train_loss": -36.985286712646484, "global_step": 68469, "epoch": 565} {"train_loss": -36.515846252441406, "global_step": 68470, "epoch": 565} {"train_loss": -36.17037582397461, "global_step": 68471, "epoch": 565} {"train_loss": -36.84384536743164, "global_step": 68472, "epoch": 565} {"train_loss": -35.72074508666992, "global_step": 68473, "epoch": 565} {"train_loss": -35.467681884765625, "global_step": 68474, "epoch": 565} {"train_loss": -35.7475471496582, "global_step": 68475, "epoch": 565} {"train_loss": -36.177101135253906, "global_step": 68476, "epoch": 565} {"train_loss": -36.09696578979492, "global_step": 68477, "epoch": 565} {"train_loss": -36.08230209350586, "global_step": 68478, "epoch": 565} {"train_loss": -36.86806869506836, "global_step": 68479, "epoch": 565} {"train_loss": -34.36148452758789, "global_step": 68480, "epoch": 565} {"train_loss": -35.96320724487305, "global_step": 68481, "epoch": 565} {"train_loss": -35.77842330932617, "global_step": 68482, "epoch": 565} {"train_loss": -36.36091613769531, "global_step": 68483, "epoch": 565} {"train_loss": -36.489322662353516, "global_step": 68484, "epoch": 565} {"train_loss": -36.404162083775546, "global_step": 68485, "epoch": 565, "val_loss": 2537881.25} {"train_loss": -36.6502571105957, "global_step": 68486, "epoch": 566} {"train_loss": -35.82481002807617, "global_step": 68487, "epoch": 566} {"train_loss": -36.1208610534668, "global_step": 68488, "epoch": 566} {"train_loss": -36.14313507080078, "global_step": 68489, "epoch": 566} {"train_loss": -35.7322998046875, "global_step": 68490, "epoch": 566} {"train_loss": -36.259700775146484, "global_step": 68491, "epoch": 566} {"train_loss": -34.57038116455078, "global_step": 68492, "epoch": 566} {"train_loss": -36.38674545288086, "global_step": 68493, "epoch": 566} {"train_loss": -37.28608322143555, "global_step": 68494, "epoch": 566} {"train_loss": -36.318782806396484, "global_step": 68495, "epoch": 566} {"train_loss": -35.82448196411133, "global_step": 68496, "epoch": 566} {"train_loss": -36.37763214111328, "global_step": 68497, "epoch": 566} {"train_loss": -36.54785919189453, "global_step": 68498, "epoch": 566} {"train_loss": -36.67280960083008, "global_step": 68499, "epoch": 566} {"train_loss": -36.00404739379883, "global_step": 68500, "epoch": 566} {"train_loss": -36.75630569458008, "global_step": 68501, "epoch": 566} {"train_loss": -36.256378173828125, "global_step": 68502, "epoch": 566} {"train_loss": -37.53421401977539, "global_step": 68503, "epoch": 566} {"train_loss": -36.96246337890625, "global_step": 68504, "epoch": 566} {"train_loss": -37.169456481933594, "global_step": 68505, "epoch": 566} {"train_loss": -37.9127082824707, "global_step": 68506, "epoch": 566} {"train_loss": -36.99092102050781, "global_step": 68507, "epoch": 566} {"train_loss": -36.94031524658203, "global_step": 68508, "epoch": 566} {"train_loss": -36.94065856933594, "global_step": 68509, "epoch": 566} {"train_loss": -37.1519660949707, "global_step": 68510, "epoch": 566} {"train_loss": -36.87599182128906, "global_step": 68511, "epoch": 566} {"train_loss": -37.21140670776367, "global_step": 68512, "epoch": 566} {"train_loss": -36.95185089111328, "global_step": 68513, "epoch": 566} {"train_loss": -36.39860534667969, "global_step": 68514, "epoch": 566} {"train_loss": -37.13810348510742, "global_step": 68515, "epoch": 566} {"train_loss": -37.508277893066406, "global_step": 68516, "epoch": 566} {"train_loss": -37.0406379699707, "global_step": 68517, "epoch": 566} {"train_loss": -37.11471176147461, "global_step": 68518, "epoch": 566} {"train_loss": -37.41530990600586, "global_step": 68519, "epoch": 566} {"train_loss": -37.072113037109375, "global_step": 68520, "epoch": 566} {"train_loss": -37.475276947021484, "global_step": 68521, "epoch": 566} {"train_loss": -36.79449462890625, "global_step": 68522, "epoch": 566} {"train_loss": -37.23714065551758, "global_step": 68523, "epoch": 566} {"train_loss": -37.296630859375, "global_step": 68524, "epoch": 566} {"train_loss": -37.58882522583008, "global_step": 68525, "epoch": 566} {"train_loss": -36.586544036865234, "global_step": 68526, "epoch": 566} {"train_loss": -36.24906921386719, "global_step": 68527, "epoch": 566} {"train_loss": -36.2510986328125, "global_step": 68528, "epoch": 566} {"train_loss": -36.09184646606445, "global_step": 68529, "epoch": 566} {"train_loss": -36.10628128051758, "global_step": 68530, "epoch": 566} {"train_loss": -37.06269836425781, "global_step": 68531, "epoch": 566} {"train_loss": -37.07763671875, "global_step": 68532, "epoch": 566} {"train_loss": -35.892234802246094, "global_step": 68533, "epoch": 566} {"train_loss": -33.453548431396484, "global_step": 68534, "epoch": 566} {"train_loss": -27.663793563842773, "global_step": 68535, "epoch": 566} {"train_loss": -20.01435089111328, "global_step": 68536, "epoch": 566} {"train_loss": -24.269872665405273, "global_step": 68537, "epoch": 566} {"train_loss": -36.35076904296875, "global_step": 68538, "epoch": 566} {"train_loss": -32.22588348388672, "global_step": 68539, "epoch": 566} {"train_loss": -30.94077491760254, "global_step": 68540, "epoch": 566} {"train_loss": -34.98188400268555, "global_step": 68541, "epoch": 566} {"train_loss": -31.77058982849121, "global_step": 68542, "epoch": 566} {"train_loss": -34.81095504760742, "global_step": 68543, "epoch": 566} {"train_loss": -33.82463836669922, "global_step": 68544, "epoch": 566} {"train_loss": -31.16958999633789, "global_step": 68545, "epoch": 566} {"train_loss": -35.19441604614258, "global_step": 68546, "epoch": 566} {"train_loss": -32.75457763671875, "global_step": 68547, "epoch": 566} {"train_loss": -34.964717864990234, "global_step": 68548, "epoch": 566} {"train_loss": -34.85092544555664, "global_step": 68549, "epoch": 566} {"train_loss": -34.2390251159668, "global_step": 68550, "epoch": 566} {"train_loss": -35.0203857421875, "global_step": 68551, "epoch": 566} {"train_loss": -35.81760025024414, "global_step": 68552, "epoch": 566} {"train_loss": -34.94939422607422, "global_step": 68553, "epoch": 566} {"train_loss": -35.89899826049805, "global_step": 68554, "epoch": 566} {"train_loss": -36.06301498413086, "global_step": 68555, "epoch": 566} {"train_loss": -34.239990234375, "global_step": 68556, "epoch": 566} {"train_loss": -33.33317565917969, "global_step": 68557, "epoch": 566} {"train_loss": -33.947357177734375, "global_step": 68558, "epoch": 566} {"train_loss": -33.846649169921875, "global_step": 68559, "epoch": 566} {"train_loss": -35.80377960205078, "global_step": 68560, "epoch": 566} {"train_loss": -34.18436050415039, "global_step": 68561, "epoch": 566} {"train_loss": -35.8228759765625, "global_step": 68562, "epoch": 566} {"train_loss": -34.088130950927734, "global_step": 68563, "epoch": 566} {"train_loss": -34.97272491455078, "global_step": 68564, "epoch": 566} {"train_loss": -34.36326599121094, "global_step": 68565, "epoch": 566} {"train_loss": -36.29299545288086, "global_step": 68566, "epoch": 566} {"train_loss": -35.47956085205078, "global_step": 68567, "epoch": 566} {"train_loss": -36.34449768066406, "global_step": 68568, "epoch": 566} {"train_loss": -35.449134826660156, "global_step": 68569, "epoch": 566} {"train_loss": -35.88169479370117, "global_step": 68570, "epoch": 566} {"train_loss": -36.20818328857422, "global_step": 68571, "epoch": 566} {"train_loss": -35.92353439331055, "global_step": 68572, "epoch": 566} {"train_loss": -35.66282272338867, "global_step": 68573, "epoch": 566} {"train_loss": -31.9978084564209, "global_step": 68574, "epoch": 566} {"train_loss": -36.33248519897461, "global_step": 68575, "epoch": 566} {"train_loss": -36.5864372253418, "global_step": 68576, "epoch": 566} {"train_loss": -34.07820510864258, "global_step": 68577, "epoch": 566} {"train_loss": -35.334835052490234, "global_step": 68578, "epoch": 566} {"train_loss": -35.922332763671875, "global_step": 68579, "epoch": 566} {"train_loss": -36.38129806518555, "global_step": 68580, "epoch": 566} {"train_loss": -35.67464828491211, "global_step": 68581, "epoch": 566} {"train_loss": -35.610443115234375, "global_step": 68582, "epoch": 566} {"train_loss": -35.38169479370117, "global_step": 68583, "epoch": 566} {"train_loss": -36.10891342163086, "global_step": 68584, "epoch": 566} {"train_loss": -36.119075775146484, "global_step": 68585, "epoch": 566} {"train_loss": -35.551795959472656, "global_step": 68586, "epoch": 566} {"train_loss": -34.87449264526367, "global_step": 68587, "epoch": 566} {"train_loss": -35.569271087646484, "global_step": 68588, "epoch": 566} {"train_loss": -35.807167053222656, "global_step": 68589, "epoch": 566} {"train_loss": -35.573097229003906, "global_step": 68590, "epoch": 566} {"train_loss": -36.28352355957031, "global_step": 68591, "epoch": 566} {"train_loss": -35.88490295410156, "global_step": 68592, "epoch": 566} {"train_loss": -32.55343246459961, "global_step": 68593, "epoch": 566} {"train_loss": -35.87191390991211, "global_step": 68594, "epoch": 566} {"train_loss": -35.410118103027344, "global_step": 68595, "epoch": 566} {"train_loss": -35.548309326171875, "global_step": 68596, "epoch": 566} {"train_loss": -35.979305267333984, "global_step": 68597, "epoch": 566} {"train_loss": -33.27395248413086, "global_step": 68598, "epoch": 566} {"train_loss": -35.18416213989258, "global_step": 68599, "epoch": 566} {"train_loss": -36.07088088989258, "global_step": 68600, "epoch": 566} {"train_loss": -36.13291549682617, "global_step": 68601, "epoch": 566} {"train_loss": -35.734901428222656, "global_step": 68602, "epoch": 566} {"train_loss": -34.43337631225586, "global_step": 68603, "epoch": 566} {"train_loss": -34.69839096069336, "global_step": 68604, "epoch": 566} {"train_loss": -33.688541412353516, "global_step": 68605, "epoch": 566} {"train_loss": -35.36059474156908, "global_step": 68606, "epoch": 566, "val_loss": 2637533.0} {"train_loss": -34.02876663208008, "global_step": 68607, "epoch": 567} {"train_loss": -35.16704177856445, "global_step": 68608, "epoch": 567} {"train_loss": -35.57173156738281, "global_step": 68609, "epoch": 567} {"train_loss": -35.446292877197266, "global_step": 68610, "epoch": 567} {"train_loss": -34.7655029296875, "global_step": 68611, "epoch": 567} {"train_loss": -33.19694137573242, "global_step": 68612, "epoch": 567} {"train_loss": -35.74471664428711, "global_step": 68613, "epoch": 567} {"train_loss": -35.50362014770508, "global_step": 68614, "epoch": 567} {"train_loss": -35.144596099853516, "global_step": 68615, "epoch": 567} {"train_loss": -34.79524230957031, "global_step": 68616, "epoch": 567} {"train_loss": -36.11017990112305, "global_step": 68617, "epoch": 567} {"train_loss": -34.979644775390625, "global_step": 68618, "epoch": 567} {"train_loss": -35.86767578125, "global_step": 68619, "epoch": 567} {"train_loss": -35.373287200927734, "global_step": 68620, "epoch": 567} {"train_loss": -35.78852462768555, "global_step": 68621, "epoch": 567} {"train_loss": -36.132625579833984, "global_step": 68622, "epoch": 567} {"train_loss": -35.6247444152832, "global_step": 68623, "epoch": 567} {"train_loss": -36.26424789428711, "global_step": 68624, "epoch": 567} {"train_loss": -36.066402435302734, "global_step": 68625, "epoch": 567} {"train_loss": -34.59174728393555, "global_step": 68626, "epoch": 567} {"train_loss": -35.72871017456055, "global_step": 68627, "epoch": 567} {"train_loss": -36.30967330932617, "global_step": 68628, "epoch": 567} {"train_loss": -35.77559280395508, "global_step": 68629, "epoch": 567} {"train_loss": -36.40311813354492, "global_step": 68630, "epoch": 567} {"train_loss": -35.83541488647461, "global_step": 68631, "epoch": 567} {"train_loss": -36.66328811645508, "global_step": 68632, "epoch": 567} {"train_loss": -35.84438705444336, "global_step": 68633, "epoch": 567} {"train_loss": -36.541481018066406, "global_step": 68634, "epoch": 567} {"train_loss": -36.24027633666992, "global_step": 68635, "epoch": 567} {"train_loss": -36.37006378173828, "global_step": 68636, "epoch": 567} {"train_loss": -36.78345489501953, "global_step": 68637, "epoch": 567} {"train_loss": -36.72207260131836, "global_step": 68638, "epoch": 567} {"train_loss": -36.23521041870117, "global_step": 68639, "epoch": 567} {"train_loss": -36.8372688293457, "global_step": 68640, "epoch": 567} {"train_loss": -35.793487548828125, "global_step": 68641, "epoch": 567} {"train_loss": -36.897701263427734, "global_step": 68642, "epoch": 567} {"train_loss": -36.487770080566406, "global_step": 68643, "epoch": 567} {"train_loss": -36.33002853393555, "global_step": 68644, "epoch": 567} {"train_loss": -36.51226806640625, "global_step": 68645, "epoch": 567} {"train_loss": -37.21596145629883, "global_step": 68646, "epoch": 567} {"train_loss": -36.76972961425781, "global_step": 68647, "epoch": 567} {"train_loss": -36.973854064941406, "global_step": 68648, "epoch": 567} {"train_loss": -36.6809196472168, "global_step": 68649, "epoch": 567} {"train_loss": -36.998199462890625, "global_step": 68650, "epoch": 567} {"train_loss": -36.490840911865234, "global_step": 68651, "epoch": 567} {"train_loss": -37.365352630615234, "global_step": 68652, "epoch": 567} {"train_loss": -36.95457458496094, "global_step": 68653, "epoch": 567} {"train_loss": -36.88679504394531, "global_step": 68654, "epoch": 567} {"train_loss": -37.29072189331055, "global_step": 68655, "epoch": 567} {"train_loss": -37.150203704833984, "global_step": 68656, "epoch": 567} {"train_loss": -37.53019332885742, "global_step": 68657, "epoch": 567} {"train_loss": -37.246742248535156, "global_step": 68658, "epoch": 567} {"train_loss": -36.9056396484375, "global_step": 68659, "epoch": 567} {"train_loss": -37.293426513671875, "global_step": 68660, "epoch": 567} {"train_loss": -36.82821273803711, "global_step": 68661, "epoch": 567} {"train_loss": -35.48210525512695, "global_step": 68662, "epoch": 567} {"train_loss": -36.75059127807617, "global_step": 68663, "epoch": 567} {"train_loss": -36.936927795410156, "global_step": 68664, "epoch": 567} {"train_loss": -37.08924102783203, "global_step": 68665, "epoch": 567} {"train_loss": -36.78416061401367, "global_step": 68666, "epoch": 567} {"train_loss": -36.89061737060547, "global_step": 68667, "epoch": 567} {"train_loss": -28.3230037689209, "global_step": 68668, "epoch": 567} {"train_loss": -34.52279281616211, "global_step": 68669, "epoch": 567} {"train_loss": -34.98094177246094, "global_step": 68670, "epoch": 567} {"train_loss": -31.03057289123535, "global_step": 68671, "epoch": 567} {"train_loss": -34.125362396240234, "global_step": 68672, "epoch": 567} {"train_loss": -35.59257125854492, "global_step": 68673, "epoch": 567} {"train_loss": -34.231266021728516, "global_step": 68674, "epoch": 567} {"train_loss": -31.498197555541992, "global_step": 68675, "epoch": 567} {"train_loss": -29.521406173706055, "global_step": 68676, "epoch": 567} {"train_loss": -35.1941032409668, "global_step": 68677, "epoch": 567} {"train_loss": -33.90349197387695, "global_step": 68678, "epoch": 567} {"train_loss": -30.31268310546875, "global_step": 68679, "epoch": 567} {"train_loss": -32.10541915893555, "global_step": 68680, "epoch": 567} {"train_loss": -34.86570358276367, "global_step": 68681, "epoch": 567} {"train_loss": -33.89003372192383, "global_step": 68682, "epoch": 567} {"train_loss": -32.8054084777832, "global_step": 68683, "epoch": 567} {"train_loss": -33.575443267822266, "global_step": 68684, "epoch": 567} {"train_loss": -33.17495346069336, "global_step": 68685, "epoch": 567} {"train_loss": -30.96192741394043, "global_step": 68686, "epoch": 567} {"train_loss": -34.395137786865234, "global_step": 68687, "epoch": 567} {"train_loss": -33.01925277709961, "global_step": 68688, "epoch": 567} {"train_loss": -35.14866256713867, "global_step": 68689, "epoch": 567} {"train_loss": -33.79729080200195, "global_step": 68690, "epoch": 567} {"train_loss": -34.093143463134766, "global_step": 68691, "epoch": 567} {"train_loss": -35.69919967651367, "global_step": 68692, "epoch": 567} {"train_loss": -35.116729736328125, "global_step": 68693, "epoch": 567} {"train_loss": -34.616085052490234, "global_step": 68694, "epoch": 567} {"train_loss": -32.34833526611328, "global_step": 68695, "epoch": 567} {"train_loss": -34.78985595703125, "global_step": 68696, "epoch": 567} {"train_loss": -34.20172882080078, "global_step": 68697, "epoch": 567} {"train_loss": -33.40302658081055, "global_step": 68698, "epoch": 567} {"train_loss": -34.68607711791992, "global_step": 68699, "epoch": 567} {"train_loss": -33.609493255615234, "global_step": 68700, "epoch": 567} {"train_loss": -34.57595443725586, "global_step": 68701, "epoch": 567} {"train_loss": -34.710689544677734, "global_step": 68702, "epoch": 567} {"train_loss": -34.25913619995117, "global_step": 68703, "epoch": 567} {"train_loss": -34.92527389526367, "global_step": 68704, "epoch": 567} {"train_loss": -34.979732513427734, "global_step": 68705, "epoch": 567} {"train_loss": -33.91184616088867, "global_step": 68706, "epoch": 567} {"train_loss": -35.16141891479492, "global_step": 68707, "epoch": 567} {"train_loss": -34.81808090209961, "global_step": 68708, "epoch": 567} {"train_loss": -35.10951232910156, "global_step": 68709, "epoch": 567} {"train_loss": -35.20012283325195, "global_step": 68710, "epoch": 567} {"train_loss": -35.09812927246094, "global_step": 68711, "epoch": 567} {"train_loss": -34.89144515991211, "global_step": 68712, "epoch": 567} {"train_loss": -34.54389190673828, "global_step": 68713, "epoch": 567} {"train_loss": -35.477691650390625, "global_step": 68714, "epoch": 567} {"train_loss": -34.81171417236328, "global_step": 68715, "epoch": 567} {"train_loss": -35.30881881713867, "global_step": 68716, "epoch": 567} {"train_loss": -34.762115478515625, "global_step": 68717, "epoch": 567} {"train_loss": -33.944801330566406, "global_step": 68718, "epoch": 567} {"train_loss": -35.17864227294922, "global_step": 68719, "epoch": 567} {"train_loss": -35.604705810546875, "global_step": 68720, "epoch": 567} {"train_loss": -35.15562057495117, "global_step": 68721, "epoch": 567} {"train_loss": -35.68569564819336, "global_step": 68722, "epoch": 567} {"train_loss": -35.94404602050781, "global_step": 68723, "epoch": 567} {"train_loss": -35.6318473815918, "global_step": 68724, "epoch": 567} {"train_loss": -35.4700927734375, "global_step": 68725, "epoch": 567} {"train_loss": -35.1970329284668, "global_step": 68726, "epoch": 567} {"train_loss": -35.19108800651613, "global_step": 68727, "epoch": 567, "val_loss": 2538729.75} {"train_loss": -35.58896255493164, "global_step": 68728, "epoch": 568} {"train_loss": -35.8346061706543, "global_step": 68729, "epoch": 568} {"train_loss": -36.149192810058594, "global_step": 68730, "epoch": 568} {"train_loss": -35.521968841552734, "global_step": 68731, "epoch": 568} {"train_loss": -35.84352493286133, "global_step": 68732, "epoch": 568} {"train_loss": -36.07453155517578, "global_step": 68733, "epoch": 568} {"train_loss": -36.48044967651367, "global_step": 68734, "epoch": 568} {"train_loss": -35.31392288208008, "global_step": 68735, "epoch": 568} {"train_loss": -35.7937126159668, "global_step": 68736, "epoch": 568} {"train_loss": -34.51582336425781, "global_step": 68737, "epoch": 568} {"train_loss": -36.25718688964844, "global_step": 68738, "epoch": 568} {"train_loss": -34.96043014526367, "global_step": 68739, "epoch": 568} {"train_loss": -35.7801628112793, "global_step": 68740, "epoch": 568} {"train_loss": -35.52555465698242, "global_step": 68741, "epoch": 568} {"train_loss": -36.70222473144531, "global_step": 68742, "epoch": 568} {"train_loss": -35.618282318115234, "global_step": 68743, "epoch": 568} {"train_loss": -36.054229736328125, "global_step": 68744, "epoch": 568} {"train_loss": -35.00265121459961, "global_step": 68745, "epoch": 568} {"train_loss": -36.0201416015625, "global_step": 68746, "epoch": 568} {"train_loss": -36.02049255371094, "global_step": 68747, "epoch": 568} {"train_loss": -36.034603118896484, "global_step": 68748, "epoch": 568} {"train_loss": -36.25263595581055, "global_step": 68749, "epoch": 568} {"train_loss": -36.72459030151367, "global_step": 68750, "epoch": 568} {"train_loss": -36.2533073425293, "global_step": 68751, "epoch": 568} {"train_loss": -34.248138427734375, "global_step": 68752, "epoch": 568} {"train_loss": -36.301513671875, "global_step": 68753, "epoch": 568} {"train_loss": -35.21434783935547, "global_step": 68754, "epoch": 568} {"train_loss": -36.447444915771484, "global_step": 68755, "epoch": 568} {"train_loss": -35.30683135986328, "global_step": 68756, "epoch": 568} {"train_loss": -36.43435287475586, "global_step": 68757, "epoch": 568} {"train_loss": -36.2189826965332, "global_step": 68758, "epoch": 568} {"train_loss": -34.65351104736328, "global_step": 68759, "epoch": 568} {"train_loss": -37.03993225097656, "global_step": 68760, "epoch": 568} {"train_loss": -34.27946090698242, "global_step": 68761, "epoch": 568} {"train_loss": -35.730831146240234, "global_step": 68762, "epoch": 568} {"train_loss": -36.148555755615234, "global_step": 68763, "epoch": 568} {"train_loss": -35.71540451049805, "global_step": 68764, "epoch": 568} {"train_loss": -36.42109298706055, "global_step": 68765, "epoch": 568} {"train_loss": -36.258338928222656, "global_step": 68766, "epoch": 568} {"train_loss": -36.07906723022461, "global_step": 68767, "epoch": 568} {"train_loss": -36.96303939819336, "global_step": 68768, "epoch": 568} {"train_loss": -36.32368469238281, "global_step": 68769, "epoch": 568} {"train_loss": -35.13576889038086, "global_step": 68770, "epoch": 568} {"train_loss": -36.36812973022461, "global_step": 68771, "epoch": 568} {"train_loss": -36.94578170776367, "global_step": 68772, "epoch": 568} {"train_loss": -36.4788932800293, "global_step": 68773, "epoch": 568} {"train_loss": -35.98188018798828, "global_step": 68774, "epoch": 568} {"train_loss": -36.727779388427734, "global_step": 68775, "epoch": 568} {"train_loss": -36.95841598510742, "global_step": 68776, "epoch": 568} {"train_loss": -36.83901596069336, "global_step": 68777, "epoch": 568} {"train_loss": -36.837890625, "global_step": 68778, "epoch": 568} {"train_loss": -37.09086227416992, "global_step": 68779, "epoch": 568} {"train_loss": -36.822486877441406, "global_step": 68780, "epoch": 568} {"train_loss": -37.33201217651367, "global_step": 68781, "epoch": 568} {"train_loss": -36.93941879272461, "global_step": 68782, "epoch": 568} {"train_loss": -37.35513687133789, "global_step": 68783, "epoch": 568} {"train_loss": -36.89155197143555, "global_step": 68784, "epoch": 568} {"train_loss": -37.70169448852539, "global_step": 68785, "epoch": 568} {"train_loss": -37.35293197631836, "global_step": 68786, "epoch": 568} {"train_loss": -36.84330368041992, "global_step": 68787, "epoch": 568} {"train_loss": -37.383968353271484, "global_step": 68788, "epoch": 568} {"train_loss": -37.487396240234375, "global_step": 68789, "epoch": 568} {"train_loss": -37.4209098815918, "global_step": 68790, "epoch": 568} {"train_loss": -36.04243469238281, "global_step": 68791, "epoch": 568} {"train_loss": -37.544307708740234, "global_step": 68792, "epoch": 568} {"train_loss": -36.9683837890625, "global_step": 68793, "epoch": 568} {"train_loss": -37.74296188354492, "global_step": 68794, "epoch": 568} {"train_loss": -37.67698287963867, "global_step": 68795, "epoch": 568} {"train_loss": -36.37655258178711, "global_step": 68796, "epoch": 568} {"train_loss": -36.8195686340332, "global_step": 68797, "epoch": 568} {"train_loss": -36.01858139038086, "global_step": 68798, "epoch": 568} {"train_loss": -35.96955490112305, "global_step": 68799, "epoch": 568} {"train_loss": -35.71770095825195, "global_step": 68800, "epoch": 568} {"train_loss": -35.1706657409668, "global_step": 68801, "epoch": 568} {"train_loss": -33.297607421875, "global_step": 68802, "epoch": 568} {"train_loss": -35.73052215576172, "global_step": 68803, "epoch": 568} {"train_loss": -35.94293975830078, "global_step": 68804, "epoch": 568} {"train_loss": -35.74711990356445, "global_step": 68805, "epoch": 568} {"train_loss": -36.431941986083984, "global_step": 68806, "epoch": 568} {"train_loss": -34.82080078125, "global_step": 68807, "epoch": 568} {"train_loss": -34.955047607421875, "global_step": 68808, "epoch": 568} {"train_loss": -35.779266357421875, "global_step": 68809, "epoch": 568} {"train_loss": -35.62196731567383, "global_step": 68810, "epoch": 568} {"train_loss": -36.36322784423828, "global_step": 68811, "epoch": 568} {"train_loss": -35.08391189575195, "global_step": 68812, "epoch": 568} {"train_loss": -35.45791244506836, "global_step": 68813, "epoch": 568} {"train_loss": -34.69121170043945, "global_step": 68814, "epoch": 568} {"train_loss": -33.9639778137207, "global_step": 68815, "epoch": 568} {"train_loss": -36.457088470458984, "global_step": 68816, "epoch": 568} {"train_loss": -36.68363952636719, "global_step": 68817, "epoch": 568} {"train_loss": -36.39777755737305, "global_step": 68818, "epoch": 568} {"train_loss": -34.93335723876953, "global_step": 68819, "epoch": 568} {"train_loss": -35.056640625, "global_step": 68820, "epoch": 568} {"train_loss": -34.630706787109375, "global_step": 68821, "epoch": 568} {"train_loss": -34.6634521484375, "global_step": 68822, "epoch": 568} {"train_loss": -35.997947692871094, "global_step": 68823, "epoch": 568} {"train_loss": -35.65652084350586, "global_step": 68824, "epoch": 568} {"train_loss": -35.2075309753418, "global_step": 68825, "epoch": 568} {"train_loss": -36.38254165649414, "global_step": 68826, "epoch": 568} {"train_loss": -36.76148986816406, "global_step": 68827, "epoch": 568} {"train_loss": -35.00638961791992, "global_step": 68828, "epoch": 568} {"train_loss": -36.22383499145508, "global_step": 68829, "epoch": 568} {"train_loss": -35.92743682861328, "global_step": 68830, "epoch": 568} {"train_loss": -36.70491409301758, "global_step": 68831, "epoch": 568} {"train_loss": -35.44108200073242, "global_step": 68832, "epoch": 568} {"train_loss": -36.45792770385742, "global_step": 68833, "epoch": 568} {"train_loss": -35.613155364990234, "global_step": 68834, "epoch": 568} {"train_loss": -33.2149658203125, "global_step": 68835, "epoch": 568} {"train_loss": -32.238487243652344, "global_step": 68836, "epoch": 568} {"train_loss": -28.21591567993164, "global_step": 68837, "epoch": 568} {"train_loss": -22.34158706665039, "global_step": 68838, "epoch": 568} {"train_loss": -31.43682861328125, "global_step": 68839, "epoch": 568} {"train_loss": -35.09101104736328, "global_step": 68840, "epoch": 568} {"train_loss": -30.652114868164062, "global_step": 68841, "epoch": 568} {"train_loss": -34.25932693481445, "global_step": 68842, "epoch": 568} {"train_loss": -32.7271842956543, "global_step": 68843, "epoch": 568} {"train_loss": -34.89139938354492, "global_step": 68844, "epoch": 568} {"train_loss": -33.63712692260742, "global_step": 68845, "epoch": 568} {"train_loss": -35.73729705810547, "global_step": 68846, "epoch": 568} {"train_loss": -34.47829818725586, "global_step": 68847, "epoch": 568} {"train_loss": -35.63275256826858, "global_step": 68848, "epoch": 568, "val_loss": 2881649.25} {"train_loss": -35.275814056396484, "global_step": 68849, "epoch": 569} {"train_loss": -34.90888214111328, "global_step": 68850, "epoch": 569} {"train_loss": -35.57094192504883, "global_step": 68851, "epoch": 569} {"train_loss": -35.7940788269043, "global_step": 68852, "epoch": 569} {"train_loss": -36.03048324584961, "global_step": 68853, "epoch": 569} {"train_loss": -35.90864944458008, "global_step": 68854, "epoch": 569} {"train_loss": -35.60354995727539, "global_step": 68855, "epoch": 569} {"train_loss": -35.53316879272461, "global_step": 68856, "epoch": 569} {"train_loss": -36.126548767089844, "global_step": 68857, "epoch": 569} {"train_loss": -36.614620208740234, "global_step": 68858, "epoch": 569} {"train_loss": -36.12567901611328, "global_step": 68859, "epoch": 569} {"train_loss": -36.43949508666992, "global_step": 68860, "epoch": 569} {"train_loss": -36.879756927490234, "global_step": 68861, "epoch": 569} {"train_loss": -36.130165100097656, "global_step": 68862, "epoch": 569} {"train_loss": -36.80892562866211, "global_step": 68863, "epoch": 569} {"train_loss": -35.75204086303711, "global_step": 68864, "epoch": 569} {"train_loss": -36.49785614013672, "global_step": 68865, "epoch": 569} {"train_loss": -37.19716262817383, "global_step": 68866, "epoch": 569} {"train_loss": -36.30084228515625, "global_step": 68867, "epoch": 569} {"train_loss": -36.66364669799805, "global_step": 68868, "epoch": 569} {"train_loss": -36.27454376220703, "global_step": 68869, "epoch": 569} {"train_loss": -37.10810470581055, "global_step": 68870, "epoch": 569} {"train_loss": -36.80501937866211, "global_step": 68871, "epoch": 569} {"train_loss": -36.647010803222656, "global_step": 68872, "epoch": 569} {"train_loss": -36.68894958496094, "global_step": 68873, "epoch": 569} {"train_loss": -36.49190902709961, "global_step": 68874, "epoch": 569} {"train_loss": -36.869571685791016, "global_step": 68875, "epoch": 569} {"train_loss": -36.60299301147461, "global_step": 68876, "epoch": 569} {"train_loss": -36.6784782409668, "global_step": 68877, "epoch": 569} {"train_loss": -36.42561340332031, "global_step": 68878, "epoch": 569} {"train_loss": -36.762969970703125, "global_step": 68879, "epoch": 569} {"train_loss": -37.05210494995117, "global_step": 68880, "epoch": 569} {"train_loss": -37.93635177612305, "global_step": 68881, "epoch": 569} {"train_loss": -37.16965103149414, "global_step": 68882, "epoch": 569} {"train_loss": -36.651710510253906, "global_step": 68883, "epoch": 569} {"train_loss": -36.67750930786133, "global_step": 68884, "epoch": 569} {"train_loss": -36.4128532409668, "global_step": 68885, "epoch": 569} {"train_loss": -36.91546630859375, "global_step": 68886, "epoch": 569} {"train_loss": -36.767879486083984, "global_step": 68887, "epoch": 569} {"train_loss": -36.780670166015625, "global_step": 68888, "epoch": 569} {"train_loss": -36.26052474975586, "global_step": 68889, "epoch": 569} {"train_loss": -36.248085021972656, "global_step": 68890, "epoch": 569} {"train_loss": -36.879878997802734, "global_step": 68891, "epoch": 569} {"train_loss": -37.03828430175781, "global_step": 68892, "epoch": 569} {"train_loss": -37.61469268798828, "global_step": 68893, "epoch": 569} {"train_loss": -37.25156784057617, "global_step": 68894, "epoch": 569} {"train_loss": -36.593502044677734, "global_step": 68895, "epoch": 569} {"train_loss": -35.755043029785156, "global_step": 68896, "epoch": 569} {"train_loss": -34.412601470947266, "global_step": 68897, "epoch": 569} {"train_loss": -33.17138671875, "global_step": 68898, "epoch": 569} {"train_loss": -29.895648956298828, "global_step": 68899, "epoch": 569} {"train_loss": -27.275943756103516, "global_step": 68900, "epoch": 569} {"train_loss": -26.037397384643555, "global_step": 68901, "epoch": 569} {"train_loss": -29.7474308013916, "global_step": 68902, "epoch": 569} {"train_loss": -36.047584533691406, "global_step": 68903, "epoch": 569} {"train_loss": -34.358070373535156, "global_step": 68904, "epoch": 569} {"train_loss": -31.901357650756836, "global_step": 68905, "epoch": 569} {"train_loss": -35.21538162231445, "global_step": 68906, "epoch": 569} {"train_loss": -35.70039749145508, "global_step": 68907, "epoch": 569} {"train_loss": -35.550838470458984, "global_step": 68908, "epoch": 569} {"train_loss": -34.99442672729492, "global_step": 68909, "epoch": 569} {"train_loss": -34.93073654174805, "global_step": 68910, "epoch": 569} {"train_loss": -35.35062026977539, "global_step": 68911, "epoch": 569} {"train_loss": -34.22114944458008, "global_step": 68912, "epoch": 569} {"train_loss": -33.457149505615234, "global_step": 68913, "epoch": 569} {"train_loss": -35.199127197265625, "global_step": 68914, "epoch": 569} {"train_loss": -31.840682983398438, "global_step": 68915, "epoch": 569} {"train_loss": -34.9726676940918, "global_step": 68916, "epoch": 569} {"train_loss": -34.179481506347656, "global_step": 68917, "epoch": 569} {"train_loss": -34.90962600708008, "global_step": 68918, "epoch": 569} {"train_loss": -34.786495208740234, "global_step": 68919, "epoch": 569} {"train_loss": -35.64817428588867, "global_step": 68920, "epoch": 569} {"train_loss": -34.811397552490234, "global_step": 68921, "epoch": 569} {"train_loss": -36.283451080322266, "global_step": 68922, "epoch": 569} {"train_loss": -35.39445877075195, "global_step": 68923, "epoch": 569} {"train_loss": -36.188716888427734, "global_step": 68924, "epoch": 569} {"train_loss": -31.521926879882812, "global_step": 68925, "epoch": 569} {"train_loss": -35.81078338623047, "global_step": 68926, "epoch": 569} {"train_loss": -35.93492889404297, "global_step": 68927, "epoch": 569} {"train_loss": -33.901145935058594, "global_step": 68928, "epoch": 569} {"train_loss": -35.04301834106445, "global_step": 68929, "epoch": 569} {"train_loss": -35.80343246459961, "global_step": 68930, "epoch": 569} {"train_loss": -35.891475677490234, "global_step": 68931, "epoch": 569} {"train_loss": -35.28718948364258, "global_step": 68932, "epoch": 569} {"train_loss": -28.33052635192871, "global_step": 68933, "epoch": 569} {"train_loss": -35.033748626708984, "global_step": 68934, "epoch": 569} {"train_loss": -34.5147819519043, "global_step": 68935, "epoch": 569} {"train_loss": -35.428855895996094, "global_step": 68936, "epoch": 569} {"train_loss": -35.378047943115234, "global_step": 68937, "epoch": 569} {"train_loss": -35.60129928588867, "global_step": 68938, "epoch": 569} {"train_loss": -35.17730712890625, "global_step": 68939, "epoch": 569} {"train_loss": -35.885963439941406, "global_step": 68940, "epoch": 569} {"train_loss": -34.356170654296875, "global_step": 68941, "epoch": 569} {"train_loss": -34.37844467163086, "global_step": 68942, "epoch": 569} {"train_loss": -36.2203369140625, "global_step": 68943, "epoch": 569} {"train_loss": -35.76692581176758, "global_step": 68944, "epoch": 569} {"train_loss": -35.85927963256836, "global_step": 68945, "epoch": 569} {"train_loss": -34.61587142944336, "global_step": 68946, "epoch": 569} {"train_loss": -33.88562774658203, "global_step": 68947, "epoch": 569} {"train_loss": -35.696651458740234, "global_step": 68948, "epoch": 569} {"train_loss": -34.1296501159668, "global_step": 68949, "epoch": 569} {"train_loss": -34.385154724121094, "global_step": 68950, "epoch": 569} {"train_loss": -34.85313415527344, "global_step": 68951, "epoch": 569} {"train_loss": -35.24256134033203, "global_step": 68952, "epoch": 569} {"train_loss": -35.97031784057617, "global_step": 68953, "epoch": 569} {"train_loss": -34.71818923950195, "global_step": 68954, "epoch": 569} {"train_loss": -36.12350845336914, "global_step": 68955, "epoch": 569} {"train_loss": -35.288970947265625, "global_step": 68956, "epoch": 569} {"train_loss": -35.62611770629883, "global_step": 68957, "epoch": 569} {"train_loss": -34.990230560302734, "global_step": 68958, "epoch": 569} {"train_loss": -34.87020492553711, "global_step": 68959, "epoch": 569} {"train_loss": -35.7354736328125, "global_step": 68960, "epoch": 569} {"train_loss": -35.99200439453125, "global_step": 68961, "epoch": 569} {"train_loss": -35.95673751831055, "global_step": 68962, "epoch": 569} {"train_loss": -34.88564682006836, "global_step": 68963, "epoch": 569} {"train_loss": -33.44273376464844, "global_step": 68964, "epoch": 569} {"train_loss": -35.814361572265625, "global_step": 68965, "epoch": 569} {"train_loss": -34.9527702331543, "global_step": 68966, "epoch": 569} {"train_loss": -35.132301330566406, "global_step": 68967, "epoch": 569} {"train_loss": -34.4683723449707, "global_step": 68968, "epoch": 569} {"train_loss": -35.28767161723996, "global_step": 68969, "epoch": 569, "val_loss": 2908406.0} {"train_loss": -35.62595748901367, "global_step": 68970, "epoch": 570} {"train_loss": -34.60649108886719, "global_step": 68971, "epoch": 570} {"train_loss": -36.10867691040039, "global_step": 68972, "epoch": 570} {"train_loss": -36.091182708740234, "global_step": 68973, "epoch": 570} {"train_loss": -34.49849319458008, "global_step": 68974, "epoch": 570} {"train_loss": -31.36847496032715, "global_step": 68975, "epoch": 570} {"train_loss": -30.85096549987793, "global_step": 68976, "epoch": 570} {"train_loss": -29.37342643737793, "global_step": 68977, "epoch": 570} {"train_loss": -34.105926513671875, "global_step": 68978, "epoch": 570} {"train_loss": -35.238868713378906, "global_step": 68979, "epoch": 570} {"train_loss": -32.034481048583984, "global_step": 68980, "epoch": 570} {"train_loss": -34.346492767333984, "global_step": 68981, "epoch": 570} {"train_loss": -35.71511459350586, "global_step": 68982, "epoch": 570} {"train_loss": -33.84846878051758, "global_step": 68983, "epoch": 570} {"train_loss": -35.77778244018555, "global_step": 68984, "epoch": 570} {"train_loss": -33.44733810424805, "global_step": 68985, "epoch": 570} {"train_loss": -33.66602325439453, "global_step": 68986, "epoch": 570} {"train_loss": -36.05402755737305, "global_step": 68987, "epoch": 570} {"train_loss": -34.0803337097168, "global_step": 68988, "epoch": 570} {"train_loss": -35.07988357543945, "global_step": 68989, "epoch": 570} {"train_loss": -35.57603073120117, "global_step": 68990, "epoch": 570} {"train_loss": -33.918800354003906, "global_step": 68991, "epoch": 570} {"train_loss": -36.0363655090332, "global_step": 68992, "epoch": 570} {"train_loss": -34.703834533691406, "global_step": 68993, "epoch": 570} {"train_loss": -36.109859466552734, "global_step": 68994, "epoch": 570} {"train_loss": -34.622901916503906, "global_step": 68995, "epoch": 570} {"train_loss": -34.91572952270508, "global_step": 68996, "epoch": 570} {"train_loss": -34.775848388671875, "global_step": 68997, "epoch": 570} {"train_loss": -35.33989334106445, "global_step": 68998, "epoch": 570} {"train_loss": -35.79180145263672, "global_step": 68999, "epoch": 570} {"train_loss": -34.74099349975586, "global_step": 69000, "epoch": 570} {"train_loss": -35.808650970458984, "global_step": 69001, "epoch": 570} {"train_loss": -35.16740798950195, "global_step": 69002, "epoch": 570} {"train_loss": -35.177608489990234, "global_step": 69003, "epoch": 570} {"train_loss": -36.50760269165039, "global_step": 69004, "epoch": 570} {"train_loss": -35.911930084228516, "global_step": 69005, "epoch": 570} {"train_loss": -35.88766098022461, "global_step": 69006, "epoch": 570} {"train_loss": -36.04461669921875, "global_step": 69007, "epoch": 570} {"train_loss": -35.396785736083984, "global_step": 69008, "epoch": 570} {"train_loss": -35.90372085571289, "global_step": 69009, "epoch": 570} {"train_loss": -36.333595275878906, "global_step": 69010, "epoch": 570} {"train_loss": -36.19948196411133, "global_step": 69011, "epoch": 570} {"train_loss": -36.5550651550293, "global_step": 69012, "epoch": 570} {"train_loss": -36.90747833251953, "global_step": 69013, "epoch": 570} {"train_loss": -36.110267639160156, "global_step": 69014, "epoch": 570} {"train_loss": -36.18213653564453, "global_step": 69015, "epoch": 570} {"train_loss": -36.15792465209961, "global_step": 69016, "epoch": 570} {"train_loss": -36.62153625488281, "global_step": 69017, "epoch": 570} {"train_loss": -35.42800521850586, "global_step": 69018, "epoch": 570} {"train_loss": -35.884674072265625, "global_step": 69019, "epoch": 570} {"train_loss": -36.9381217956543, "global_step": 69020, "epoch": 570} {"train_loss": -36.66417694091797, "global_step": 69021, "epoch": 570} {"train_loss": -36.43045425415039, "global_step": 69022, "epoch": 570} {"train_loss": -37.05726623535156, "global_step": 69023, "epoch": 570} {"train_loss": -36.91627883911133, "global_step": 69024, "epoch": 570} {"train_loss": -35.577083587646484, "global_step": 69025, "epoch": 570} {"train_loss": -36.56782913208008, "global_step": 69026, "epoch": 570} {"train_loss": -36.41424560546875, "global_step": 69027, "epoch": 570} {"train_loss": -36.491756439208984, "global_step": 69028, "epoch": 570} {"train_loss": -36.83378601074219, "global_step": 69029, "epoch": 570} {"train_loss": -36.196258544921875, "global_step": 69030, "epoch": 570} {"train_loss": -37.19514083862305, "global_step": 69031, "epoch": 570} {"train_loss": -36.980308532714844, "global_step": 69032, "epoch": 570} {"train_loss": -36.45125961303711, "global_step": 69033, "epoch": 570} {"train_loss": -36.90291213989258, "global_step": 69034, "epoch": 570} {"train_loss": -36.26852035522461, "global_step": 69035, "epoch": 570} {"train_loss": -36.89201736450195, "global_step": 69036, "epoch": 570} {"train_loss": -36.993839263916016, "global_step": 69037, "epoch": 570} {"train_loss": -35.906097412109375, "global_step": 69038, "epoch": 570} {"train_loss": -33.66292953491211, "global_step": 69039, "epoch": 570} {"train_loss": -36.54008483886719, "global_step": 69040, "epoch": 570} {"train_loss": -34.847198486328125, "global_step": 69041, "epoch": 570} {"train_loss": -34.31843948364258, "global_step": 69042, "epoch": 570} {"train_loss": -35.71651077270508, "global_step": 69043, "epoch": 570} {"train_loss": -34.926116943359375, "global_step": 69044, "epoch": 570} {"train_loss": -36.71676254272461, "global_step": 69045, "epoch": 570} {"train_loss": -36.60335922241211, "global_step": 69046, "epoch": 570} {"train_loss": -36.9600944519043, "global_step": 69047, "epoch": 570} {"train_loss": -36.48318099975586, "global_step": 69048, "epoch": 570} {"train_loss": -36.82575225830078, "global_step": 69049, "epoch": 570} {"train_loss": -36.26994705200195, "global_step": 69050, "epoch": 570} {"train_loss": -35.92995834350586, "global_step": 69051, "epoch": 570} {"train_loss": -36.4045524597168, "global_step": 69052, "epoch": 570} {"train_loss": -36.59674835205078, "global_step": 69053, "epoch": 570} {"train_loss": -35.5064811706543, "global_step": 69054, "epoch": 570} {"train_loss": -36.89285659790039, "global_step": 69055, "epoch": 570} {"train_loss": -36.74479293823242, "global_step": 69056, "epoch": 570} {"train_loss": -36.696388244628906, "global_step": 69057, "epoch": 570} {"train_loss": -37.159156799316406, "global_step": 69058, "epoch": 570} {"train_loss": -36.93901443481445, "global_step": 69059, "epoch": 570} {"train_loss": -36.24686813354492, "global_step": 69060, "epoch": 570} {"train_loss": -35.12114715576172, "global_step": 69061, "epoch": 570} {"train_loss": -35.5915641784668, "global_step": 69062, "epoch": 570} {"train_loss": -35.627593994140625, "global_step": 69063, "epoch": 570} {"train_loss": -31.635828018188477, "global_step": 69064, "epoch": 570} {"train_loss": -28.759057998657227, "global_step": 69065, "epoch": 570} {"train_loss": -32.45359420776367, "global_step": 69066, "epoch": 570} {"train_loss": -36.08442306518555, "global_step": 69067, "epoch": 570} {"train_loss": -32.210792541503906, "global_step": 69068, "epoch": 570} {"train_loss": -31.993993759155273, "global_step": 69069, "epoch": 570} {"train_loss": -35.7868537902832, "global_step": 69070, "epoch": 570} {"train_loss": -31.61592674255371, "global_step": 69071, "epoch": 570} {"train_loss": -33.26980209350586, "global_step": 69072, "epoch": 570} {"train_loss": -35.515380859375, "global_step": 69073, "epoch": 570} {"train_loss": -34.92879104614258, "global_step": 69074, "epoch": 570} {"train_loss": -35.963191986083984, "global_step": 69075, "epoch": 570} {"train_loss": -35.572265625, "global_step": 69076, "epoch": 570} {"train_loss": -36.388671875, "global_step": 69077, "epoch": 570} {"train_loss": -35.3818244934082, "global_step": 69078, "epoch": 570} {"train_loss": -36.2041130065918, "global_step": 69079, "epoch": 570} {"train_loss": -35.64016342163086, "global_step": 69080, "epoch": 570} {"train_loss": -36.0991325378418, "global_step": 69081, "epoch": 570} {"train_loss": -35.86417770385742, "global_step": 69082, "epoch": 570} {"train_loss": -36.09623336791992, "global_step": 69083, "epoch": 570} {"train_loss": -36.6101188659668, "global_step": 69084, "epoch": 570} {"train_loss": -36.104103088378906, "global_step": 69085, "epoch": 570} {"train_loss": -36.15928649902344, "global_step": 69086, "epoch": 570} {"train_loss": -36.67200469970703, "global_step": 69087, "epoch": 570} {"train_loss": -35.2581787109375, "global_step": 69088, "epoch": 570} {"train_loss": -36.548500061035156, "global_step": 69089, "epoch": 570} {"train_loss": -35.45909217960578, "global_step": 69090, "epoch": 570, "val_loss": 2596672.25} {"train_loss": -36.8321418762207, "global_step": 69091, "epoch": 571} {"train_loss": -35.76021957397461, "global_step": 69092, "epoch": 571} {"train_loss": -36.628170013427734, "global_step": 69093, "epoch": 571} {"train_loss": -36.108558654785156, "global_step": 69094, "epoch": 571} {"train_loss": -36.11090087890625, "global_step": 69095, "epoch": 571} {"train_loss": -36.691341400146484, "global_step": 69096, "epoch": 571} {"train_loss": -36.85200500488281, "global_step": 69097, "epoch": 571} {"train_loss": -34.33138656616211, "global_step": 69098, "epoch": 571} {"train_loss": -35.19560623168945, "global_step": 69099, "epoch": 571} {"train_loss": -36.5737419128418, "global_step": 69100, "epoch": 571} {"train_loss": -37.247432708740234, "global_step": 69101, "epoch": 571} {"train_loss": -36.96989822387695, "global_step": 69102, "epoch": 571} {"train_loss": -36.80978775024414, "global_step": 69103, "epoch": 571} {"train_loss": -36.942237854003906, "global_step": 69104, "epoch": 571} {"train_loss": -35.85749435424805, "global_step": 69105, "epoch": 571} {"train_loss": -36.82640838623047, "global_step": 69106, "epoch": 571} {"train_loss": -37.03235626220703, "global_step": 69107, "epoch": 571} {"train_loss": -36.87885284423828, "global_step": 69108, "epoch": 571} {"train_loss": -37.052734375, "global_step": 69109, "epoch": 571} {"train_loss": -37.28589630126953, "global_step": 69110, "epoch": 571} {"train_loss": -37.29343032836914, "global_step": 69111, "epoch": 571} {"train_loss": -37.08869934082031, "global_step": 69112, "epoch": 571} {"train_loss": -36.38334274291992, "global_step": 69113, "epoch": 571} {"train_loss": -36.753456115722656, "global_step": 69114, "epoch": 571} {"train_loss": -37.59477615356445, "global_step": 69115, "epoch": 571} {"train_loss": -36.99860763549805, "global_step": 69116, "epoch": 571} {"train_loss": -37.52744674682617, "global_step": 69117, "epoch": 571} {"train_loss": -36.92128372192383, "global_step": 69118, "epoch": 571} {"train_loss": -37.255043029785156, "global_step": 69119, "epoch": 571} {"train_loss": -37.2363166809082, "global_step": 69120, "epoch": 571} {"train_loss": -37.48931884765625, "global_step": 69121, "epoch": 571} {"train_loss": -37.22438049316406, "global_step": 69122, "epoch": 571} {"train_loss": -36.49671173095703, "global_step": 69123, "epoch": 571} {"train_loss": -33.238006591796875, "global_step": 69124, "epoch": 571} {"train_loss": -27.377643585205078, "global_step": 69125, "epoch": 571} {"train_loss": -10.58936595916748, "global_step": 69126, "epoch": 571} {"train_loss": -10.104290962219238, "global_step": 69127, "epoch": 571} {"train_loss": -36.29936599731445, "global_step": 69128, "epoch": 571} {"train_loss": -18.544584274291992, "global_step": 69129, "epoch": 571} {"train_loss": -26.9466495513916, "global_step": 69130, "epoch": 571} {"train_loss": -31.116580963134766, "global_step": 69131, "epoch": 571} {"train_loss": -29.434650421142578, "global_step": 69132, "epoch": 571} {"train_loss": -29.2603702545166, "global_step": 69133, "epoch": 571} {"train_loss": -33.363548278808594, "global_step": 69134, "epoch": 571} {"train_loss": -30.232166290283203, "global_step": 69135, "epoch": 571} {"train_loss": -34.573944091796875, "global_step": 69136, "epoch": 571} {"train_loss": -34.12110900878906, "global_step": 69137, "epoch": 571} {"train_loss": -31.952316284179688, "global_step": 69138, "epoch": 571} {"train_loss": -34.35847854614258, "global_step": 69139, "epoch": 571} {"train_loss": -35.82820510864258, "global_step": 69140, "epoch": 571} {"train_loss": -34.34719467163086, "global_step": 69141, "epoch": 571} {"train_loss": -34.48912811279297, "global_step": 69142, "epoch": 571} {"train_loss": -35.14274215698242, "global_step": 69143, "epoch": 571} {"train_loss": -36.05532455444336, "global_step": 69144, "epoch": 571} {"train_loss": -34.943077087402344, "global_step": 69145, "epoch": 571} {"train_loss": -35.08902359008789, "global_step": 69146, "epoch": 571} {"train_loss": -35.51184844970703, "global_step": 69147, "epoch": 571} {"train_loss": -35.61655807495117, "global_step": 69148, "epoch": 571} {"train_loss": -35.903350830078125, "global_step": 69149, "epoch": 571} {"train_loss": -35.77705383300781, "global_step": 69150, "epoch": 571} {"train_loss": -35.6870231628418, "global_step": 69151, "epoch": 571} {"train_loss": -35.51919174194336, "global_step": 69152, "epoch": 571} {"train_loss": -36.26527786254883, "global_step": 69153, "epoch": 571} {"train_loss": -35.81730270385742, "global_step": 69154, "epoch": 571} {"train_loss": -36.46771240234375, "global_step": 69155, "epoch": 571} {"train_loss": -36.20615768432617, "global_step": 69156, "epoch": 571} {"train_loss": -36.15272903442383, "global_step": 69157, "epoch": 571} {"train_loss": -36.44047164916992, "global_step": 69158, "epoch": 571} {"train_loss": -36.291603088378906, "global_step": 69159, "epoch": 571} {"train_loss": -36.5128288269043, "global_step": 69160, "epoch": 571} {"train_loss": -36.32345199584961, "global_step": 69161, "epoch": 571} {"train_loss": -36.41835403442383, "global_step": 69162, "epoch": 571} {"train_loss": -36.86125183105469, "global_step": 69163, "epoch": 571} {"train_loss": -36.52294921875, "global_step": 69164, "epoch": 571} {"train_loss": -36.507869720458984, "global_step": 69165, "epoch": 571} {"train_loss": -35.65872573852539, "global_step": 69166, "epoch": 571} {"train_loss": -36.774654388427734, "global_step": 69167, "epoch": 571} {"train_loss": -36.48276901245117, "global_step": 69168, "epoch": 571} {"train_loss": -36.409217834472656, "global_step": 69169, "epoch": 571} {"train_loss": -36.34428787231445, "global_step": 69170, "epoch": 571} {"train_loss": -36.81037902832031, "global_step": 69171, "epoch": 571} {"train_loss": -36.45729446411133, "global_step": 69172, "epoch": 571} {"train_loss": -36.90204620361328, "global_step": 69173, "epoch": 571} {"train_loss": -36.87468338012695, "global_step": 69174, "epoch": 571} {"train_loss": -36.81512451171875, "global_step": 69175, "epoch": 571} {"train_loss": -37.26229476928711, "global_step": 69176, "epoch": 571} {"train_loss": -37.47823715209961, "global_step": 69177, "epoch": 571} {"train_loss": -36.73637771606445, "global_step": 69178, "epoch": 571} {"train_loss": -36.94495391845703, "global_step": 69179, "epoch": 571} {"train_loss": -37.457008361816406, "global_step": 69180, "epoch": 571} {"train_loss": -37.08328628540039, "global_step": 69181, "epoch": 571} {"train_loss": -36.89466094970703, "global_step": 69182, "epoch": 571} {"train_loss": -37.06789779663086, "global_step": 69183, "epoch": 571} {"train_loss": -36.71352767944336, "global_step": 69184, "epoch": 571} {"train_loss": -37.367191314697266, "global_step": 69185, "epoch": 571} {"train_loss": -36.77480697631836, "global_step": 69186, "epoch": 571} {"train_loss": -37.19626235961914, "global_step": 69187, "epoch": 571} {"train_loss": -37.344242095947266, "global_step": 69188, "epoch": 571} {"train_loss": -37.263980865478516, "global_step": 69189, "epoch": 571} {"train_loss": -37.17375564575195, "global_step": 69190, "epoch": 571} {"train_loss": -37.44113540649414, "global_step": 69191, "epoch": 571} {"train_loss": -37.1184196472168, "global_step": 69192, "epoch": 571} {"train_loss": -37.10480499267578, "global_step": 69193, "epoch": 571} {"train_loss": -37.39042282104492, "global_step": 69194, "epoch": 571} {"train_loss": -37.44108963012695, "global_step": 69195, "epoch": 571} {"train_loss": -36.9527587890625, "global_step": 69196, "epoch": 571} {"train_loss": -36.36920166015625, "global_step": 69197, "epoch": 571} {"train_loss": -35.59328842163086, "global_step": 69198, "epoch": 571} {"train_loss": -35.66427230834961, "global_step": 69199, "epoch": 571} {"train_loss": -31.979333877563477, "global_step": 69200, "epoch": 571} {"train_loss": -24.57742691040039, "global_step": 69201, "epoch": 571} {"train_loss": -9.093131065368652, "global_step": 69202, "epoch": 571} {"train_loss": -7.317346096038818, "global_step": 69203, "epoch": 571} {"train_loss": -35.58891677856445, "global_step": 69204, "epoch": 571} {"train_loss": -22.98799705505371, "global_step": 69205, "epoch": 571} {"train_loss": -33.059085845947266, "global_step": 69206, "epoch": 571} {"train_loss": -27.132781982421875, "global_step": 69207, "epoch": 571} {"train_loss": -35.089962005615234, "global_step": 69208, "epoch": 571} {"train_loss": -28.439069747924805, "global_step": 69209, "epoch": 571} {"train_loss": -35.08243179321289, "global_step": 69210, "epoch": 571} {"train_loss": -34.5025964886689, "global_step": 69211, "epoch": 571, "val_loss": 2531617.75} {"train_loss": -31.34766960144043, "global_step": 69212, "epoch": 572} {"train_loss": -35.679595947265625, "global_step": 69213, "epoch": 572} {"train_loss": -34.400264739990234, "global_step": 69214, "epoch": 572} {"train_loss": -32.694393157958984, "global_step": 69215, "epoch": 572} {"train_loss": -35.66157150268555, "global_step": 69216, "epoch": 572} {"train_loss": -35.09583282470703, "global_step": 69217, "epoch": 572} {"train_loss": -34.37717819213867, "global_step": 69218, "epoch": 572} {"train_loss": -35.05097579956055, "global_step": 69219, "epoch": 572} {"train_loss": -35.963069915771484, "global_step": 69220, "epoch": 572} {"train_loss": -35.57552719116211, "global_step": 69221, "epoch": 572} {"train_loss": -35.398101806640625, "global_step": 69222, "epoch": 572} {"train_loss": -35.7010498046875, "global_step": 69223, "epoch": 572} {"train_loss": -35.854957580566406, "global_step": 69224, "epoch": 572} {"train_loss": -35.561038970947266, "global_step": 69225, "epoch": 572} {"train_loss": -35.69070053100586, "global_step": 69226, "epoch": 572} {"train_loss": -35.90147018432617, "global_step": 69227, "epoch": 572} {"train_loss": -35.81521224975586, "global_step": 69228, "epoch": 572} {"train_loss": -36.44588851928711, "global_step": 69229, "epoch": 572} {"train_loss": -35.740692138671875, "global_step": 69230, "epoch": 572} {"train_loss": -35.901573181152344, "global_step": 69231, "epoch": 572} {"train_loss": -36.0035514831543, "global_step": 69232, "epoch": 572} {"train_loss": -36.44881057739258, "global_step": 69233, "epoch": 572} {"train_loss": -36.85072708129883, "global_step": 69234, "epoch": 572} {"train_loss": -36.33944320678711, "global_step": 69235, "epoch": 572} {"train_loss": -36.341766357421875, "global_step": 69236, "epoch": 572} {"train_loss": -36.73849868774414, "global_step": 69237, "epoch": 572} {"train_loss": -36.5515251159668, "global_step": 69238, "epoch": 572} {"train_loss": -36.77714157104492, "global_step": 69239, "epoch": 572} {"train_loss": -36.54892349243164, "global_step": 69240, "epoch": 572} {"train_loss": -36.230987548828125, "global_step": 69241, "epoch": 572} {"train_loss": -37.21607971191406, "global_step": 69242, "epoch": 572} {"train_loss": -36.675498962402344, "global_step": 69243, "epoch": 572} {"train_loss": -36.68345260620117, "global_step": 69244, "epoch": 572} {"train_loss": -37.21879196166992, "global_step": 69245, "epoch": 572} {"train_loss": -36.738704681396484, "global_step": 69246, "epoch": 572} {"train_loss": -36.53095626831055, "global_step": 69247, "epoch": 572} {"train_loss": -36.85947799682617, "global_step": 69248, "epoch": 572} {"train_loss": -37.080562591552734, "global_step": 69249, "epoch": 572} {"train_loss": -37.030643463134766, "global_step": 69250, "epoch": 572} {"train_loss": -36.8517951965332, "global_step": 69251, "epoch": 572} {"train_loss": -36.66207504272461, "global_step": 69252, "epoch": 572} {"train_loss": -37.3456916809082, "global_step": 69253, "epoch": 572} {"train_loss": -37.21039581298828, "global_step": 69254, "epoch": 572} {"train_loss": -36.703216552734375, "global_step": 69255, "epoch": 572} {"train_loss": -36.5661735534668, "global_step": 69256, "epoch": 572} {"train_loss": -36.5072135925293, "global_step": 69257, "epoch": 572} {"train_loss": -35.527984619140625, "global_step": 69258, "epoch": 572} {"train_loss": -35.38802719116211, "global_step": 69259, "epoch": 572} {"train_loss": -36.19405746459961, "global_step": 69260, "epoch": 572} {"train_loss": -36.728668212890625, "global_step": 69261, "epoch": 572} {"train_loss": -36.10969161987305, "global_step": 69262, "epoch": 572} {"train_loss": -36.40447235107422, "global_step": 69263, "epoch": 572} {"train_loss": -35.381568908691406, "global_step": 69264, "epoch": 572} {"train_loss": -36.49995040893555, "global_step": 69265, "epoch": 572} {"train_loss": -35.589385986328125, "global_step": 69266, "epoch": 572} {"train_loss": -36.00709915161133, "global_step": 69267, "epoch": 572} {"train_loss": -33.96133804321289, "global_step": 69268, "epoch": 572} {"train_loss": -36.23727798461914, "global_step": 69269, "epoch": 572} {"train_loss": -35.565948486328125, "global_step": 69270, "epoch": 572} {"train_loss": -35.652034759521484, "global_step": 69271, "epoch": 572} {"train_loss": -36.355873107910156, "global_step": 69272, "epoch": 572} {"train_loss": -33.8442268371582, "global_step": 69273, "epoch": 572} {"train_loss": -34.40388870239258, "global_step": 69274, "epoch": 572} {"train_loss": -33.1228141784668, "global_step": 69275, "epoch": 572} {"train_loss": -35.562129974365234, "global_step": 69276, "epoch": 572} {"train_loss": -34.53021240234375, "global_step": 69277, "epoch": 572} {"train_loss": -32.94084930419922, "global_step": 69278, "epoch": 572} {"train_loss": -34.645870208740234, "global_step": 69279, "epoch": 572} {"train_loss": -35.58148193359375, "global_step": 69280, "epoch": 572} {"train_loss": -34.2668342590332, "global_step": 69281, "epoch": 572} {"train_loss": -34.454620361328125, "global_step": 69282, "epoch": 572} {"train_loss": -34.424583435058594, "global_step": 69283, "epoch": 572} {"train_loss": -36.11451721191406, "global_step": 69284, "epoch": 572} {"train_loss": -35.425411224365234, "global_step": 69285, "epoch": 572} {"train_loss": -35.08893966674805, "global_step": 69286, "epoch": 572} {"train_loss": -36.29142761230469, "global_step": 69287, "epoch": 572} {"train_loss": -35.60061264038086, "global_step": 69288, "epoch": 572} {"train_loss": -36.02345657348633, "global_step": 69289, "epoch": 572} {"train_loss": -35.73622131347656, "global_step": 69290, "epoch": 572} {"train_loss": -36.46388244628906, "global_step": 69291, "epoch": 572} {"train_loss": -36.09035110473633, "global_step": 69292, "epoch": 572} {"train_loss": -36.38528060913086, "global_step": 69293, "epoch": 572} {"train_loss": -36.100982666015625, "global_step": 69294, "epoch": 572} {"train_loss": -36.287681579589844, "global_step": 69295, "epoch": 572} {"train_loss": -34.48702621459961, "global_step": 69296, "epoch": 572} {"train_loss": -35.5396728515625, "global_step": 69297, "epoch": 572} {"train_loss": -35.770233154296875, "global_step": 69298, "epoch": 572} {"train_loss": -36.59599685668945, "global_step": 69299, "epoch": 572} {"train_loss": -35.59615707397461, "global_step": 69300, "epoch": 572} {"train_loss": -36.67158126831055, "global_step": 69301, "epoch": 572} {"train_loss": -35.76667022705078, "global_step": 69302, "epoch": 572} {"train_loss": -36.2696647644043, "global_step": 69303, "epoch": 572} {"train_loss": -35.970272064208984, "global_step": 69304, "epoch": 572} {"train_loss": -35.63256072998047, "global_step": 69305, "epoch": 572} {"train_loss": -36.109188079833984, "global_step": 69306, "epoch": 572} {"train_loss": -36.332611083984375, "global_step": 69307, "epoch": 572} {"train_loss": -35.76930618286133, "global_step": 69308, "epoch": 572} {"train_loss": -36.317989349365234, "global_step": 69309, "epoch": 572} {"train_loss": -37.13064193725586, "global_step": 69310, "epoch": 572} {"train_loss": -36.67658233642578, "global_step": 69311, "epoch": 572} {"train_loss": -36.24168014526367, "global_step": 69312, "epoch": 572} {"train_loss": -36.8325080871582, "global_step": 69313, "epoch": 572} {"train_loss": -37.011680603027344, "global_step": 69314, "epoch": 572} {"train_loss": -36.56303405761719, "global_step": 69315, "epoch": 572} {"train_loss": -36.63405227661133, "global_step": 69316, "epoch": 572} {"train_loss": -36.905914306640625, "global_step": 69317, "epoch": 572} {"train_loss": -36.79301071166992, "global_step": 69318, "epoch": 572} {"train_loss": -36.59223556518555, "global_step": 69319, "epoch": 572} {"train_loss": -36.07490921020508, "global_step": 69320, "epoch": 572} {"train_loss": -36.501399993896484, "global_step": 69321, "epoch": 572} {"train_loss": -36.62744140625, "global_step": 69322, "epoch": 572} {"train_loss": -36.529170989990234, "global_step": 69323, "epoch": 572} {"train_loss": -36.379878997802734, "global_step": 69324, "epoch": 572} {"train_loss": -37.254600524902344, "global_step": 69325, "epoch": 572} {"train_loss": -36.84754180908203, "global_step": 69326, "epoch": 572} {"train_loss": -36.29633712768555, "global_step": 69327, "epoch": 572} {"train_loss": -36.28643798828125, "global_step": 69328, "epoch": 572} {"train_loss": -37.061500549316406, "global_step": 69329, "epoch": 572} {"train_loss": -37.07365798950195, "global_step": 69330, "epoch": 572} {"train_loss": -36.00704574584961, "global_step": 69331, "epoch": 572} {"train_loss": -35.95190008809744, "global_step": 69332, "epoch": 572, "val_loss": 2668288.25} {"train_loss": -33.128273010253906, "global_step": 69333, "epoch": 573} {"train_loss": -30.0450382232666, "global_step": 69334, "epoch": 573} {"train_loss": -34.507659912109375, "global_step": 69335, "epoch": 573} {"train_loss": -36.463130950927734, "global_step": 69336, "epoch": 573} {"train_loss": -35.710975646972656, "global_step": 69337, "epoch": 573} {"train_loss": -36.076637268066406, "global_step": 69338, "epoch": 573} {"train_loss": -35.72883224487305, "global_step": 69339, "epoch": 573} {"train_loss": -35.2615966796875, "global_step": 69340, "epoch": 573} {"train_loss": -35.31048583984375, "global_step": 69341, "epoch": 573} {"train_loss": -34.20171356201172, "global_step": 69342, "epoch": 573} {"train_loss": -36.46356201171875, "global_step": 69343, "epoch": 573} {"train_loss": -36.471595764160156, "global_step": 69344, "epoch": 573} {"train_loss": -36.073890686035156, "global_step": 69345, "epoch": 573} {"train_loss": -35.5485954284668, "global_step": 69346, "epoch": 573} {"train_loss": -36.56049346923828, "global_step": 69347, "epoch": 573} {"train_loss": -33.41776657104492, "global_step": 69348, "epoch": 573} {"train_loss": -34.99464797973633, "global_step": 69349, "epoch": 573} {"train_loss": -35.9520149230957, "global_step": 69350, "epoch": 573} {"train_loss": -35.896114349365234, "global_step": 69351, "epoch": 573} {"train_loss": -36.74285888671875, "global_step": 69352, "epoch": 573} {"train_loss": -36.004573822021484, "global_step": 69353, "epoch": 573} {"train_loss": -35.65248107910156, "global_step": 69354, "epoch": 573} {"train_loss": -35.25447082519531, "global_step": 69355, "epoch": 573} {"train_loss": -36.90564727783203, "global_step": 69356, "epoch": 573} {"train_loss": -35.585140228271484, "global_step": 69357, "epoch": 573} {"train_loss": -36.006839752197266, "global_step": 69358, "epoch": 573} {"train_loss": -36.6987190246582, "global_step": 69359, "epoch": 573} {"train_loss": -36.447513580322266, "global_step": 69360, "epoch": 573} {"train_loss": -36.077999114990234, "global_step": 69361, "epoch": 573} {"train_loss": -36.531864166259766, "global_step": 69362, "epoch": 573} {"train_loss": -36.657039642333984, "global_step": 69363, "epoch": 573} {"train_loss": -36.17311477661133, "global_step": 69364, "epoch": 573} {"train_loss": -36.66953659057617, "global_step": 69365, "epoch": 573} {"train_loss": -36.413360595703125, "global_step": 69366, "epoch": 573} {"train_loss": -36.575191497802734, "global_step": 69367, "epoch": 573} {"train_loss": -35.94380187988281, "global_step": 69368, "epoch": 573} {"train_loss": -36.13864517211914, "global_step": 69369, "epoch": 573} {"train_loss": -36.11963653564453, "global_step": 69370, "epoch": 573} {"train_loss": -37.01388168334961, "global_step": 69371, "epoch": 573} {"train_loss": -36.10200500488281, "global_step": 69372, "epoch": 573} {"train_loss": -36.88153076171875, "global_step": 69373, "epoch": 573} {"train_loss": -37.19234848022461, "global_step": 69374, "epoch": 573} {"train_loss": -36.714412689208984, "global_step": 69375, "epoch": 573} {"train_loss": -36.302059173583984, "global_step": 69376, "epoch": 573} {"train_loss": -36.86435317993164, "global_step": 69377, "epoch": 573} {"train_loss": -36.6119499206543, "global_step": 69378, "epoch": 573} {"train_loss": -36.84538269042969, "global_step": 69379, "epoch": 573} {"train_loss": -37.06135940551758, "global_step": 69380, "epoch": 573} {"train_loss": -37.266822814941406, "global_step": 69381, "epoch": 573} {"train_loss": -37.13983917236328, "global_step": 69382, "epoch": 573} {"train_loss": -36.99982452392578, "global_step": 69383, "epoch": 573} {"train_loss": -35.25598907470703, "global_step": 69384, "epoch": 573} {"train_loss": -36.8429069519043, "global_step": 69385, "epoch": 573} {"train_loss": -36.57284164428711, "global_step": 69386, "epoch": 573} {"train_loss": -37.02090072631836, "global_step": 69387, "epoch": 573} {"train_loss": -35.47313690185547, "global_step": 69388, "epoch": 573} {"train_loss": -36.721126556396484, "global_step": 69389, "epoch": 573} {"train_loss": -36.22473907470703, "global_step": 69390, "epoch": 573} {"train_loss": -36.443668365478516, "global_step": 69391, "epoch": 573} {"train_loss": -34.49627685546875, "global_step": 69392, "epoch": 573} {"train_loss": -37.10174560546875, "global_step": 69393, "epoch": 573} {"train_loss": -37.0143928527832, "global_step": 69394, "epoch": 573} {"train_loss": -35.80990219116211, "global_step": 69395, "epoch": 573} {"train_loss": -32.93317794799805, "global_step": 69396, "epoch": 573} {"train_loss": -34.112709045410156, "global_step": 69397, "epoch": 573} {"train_loss": -31.885400772094727, "global_step": 69398, "epoch": 573} {"train_loss": -34.538936614990234, "global_step": 69399, "epoch": 573} {"train_loss": -33.96246337890625, "global_step": 69400, "epoch": 573} {"train_loss": -32.3068962097168, "global_step": 69401, "epoch": 573} {"train_loss": -33.203163146972656, "global_step": 69402, "epoch": 573} {"train_loss": -34.954505920410156, "global_step": 69403, "epoch": 573} {"train_loss": -34.792022705078125, "global_step": 69404, "epoch": 573} {"train_loss": -34.1020393371582, "global_step": 69405, "epoch": 573} {"train_loss": -33.65963363647461, "global_step": 69406, "epoch": 573} {"train_loss": -35.0118522644043, "global_step": 69407, "epoch": 573} {"train_loss": -34.250701904296875, "global_step": 69408, "epoch": 573} {"train_loss": -33.08599853515625, "global_step": 69409, "epoch": 573} {"train_loss": -35.643367767333984, "global_step": 69410, "epoch": 573} {"train_loss": -36.17523193359375, "global_step": 69411, "epoch": 573} {"train_loss": -35.111263275146484, "global_step": 69412, "epoch": 573} {"train_loss": -35.56402587890625, "global_step": 69413, "epoch": 573} {"train_loss": -35.571083068847656, "global_step": 69414, "epoch": 573} {"train_loss": -35.638221740722656, "global_step": 69415, "epoch": 573} {"train_loss": -35.9899787902832, "global_step": 69416, "epoch": 573} {"train_loss": -35.52354049682617, "global_step": 69417, "epoch": 573} {"train_loss": -36.004188537597656, "global_step": 69418, "epoch": 573} {"train_loss": -34.80464553833008, "global_step": 69419, "epoch": 573} {"train_loss": -35.287017822265625, "global_step": 69420, "epoch": 573} {"train_loss": -35.458492279052734, "global_step": 69421, "epoch": 573} {"train_loss": -35.8730583190918, "global_step": 69422, "epoch": 573} {"train_loss": -35.65924835205078, "global_step": 69423, "epoch": 573} {"train_loss": -36.06245040893555, "global_step": 69424, "epoch": 573} {"train_loss": -35.47856521606445, "global_step": 69425, "epoch": 573} {"train_loss": -36.103946685791016, "global_step": 69426, "epoch": 573} {"train_loss": -36.09883499145508, "global_step": 69427, "epoch": 573} {"train_loss": -35.66197204589844, "global_step": 69428, "epoch": 573} {"train_loss": -36.329803466796875, "global_step": 69429, "epoch": 573} {"train_loss": -36.670166015625, "global_step": 69430, "epoch": 573} {"train_loss": -35.996742248535156, "global_step": 69431, "epoch": 573} {"train_loss": -35.72770309448242, "global_step": 69432, "epoch": 573} {"train_loss": -36.11147689819336, "global_step": 69433, "epoch": 573} {"train_loss": -36.48394012451172, "global_step": 69434, "epoch": 573} {"train_loss": -36.08645248413086, "global_step": 69435, "epoch": 573} {"train_loss": -36.43204879760742, "global_step": 69436, "epoch": 573} {"train_loss": -35.978267669677734, "global_step": 69437, "epoch": 573} {"train_loss": -36.856170654296875, "global_step": 69438, "epoch": 573} {"train_loss": -36.317726135253906, "global_step": 69439, "epoch": 573} {"train_loss": -36.700740814208984, "global_step": 69440, "epoch": 573} {"train_loss": -36.3616828918457, "global_step": 69441, "epoch": 573} {"train_loss": -36.74674987792969, "global_step": 69442, "epoch": 573} {"train_loss": -36.02826690673828, "global_step": 69443, "epoch": 573} {"train_loss": -36.3298454284668, "global_step": 69444, "epoch": 573} {"train_loss": -36.947391510009766, "global_step": 69445, "epoch": 573} {"train_loss": -36.80830001831055, "global_step": 69446, "epoch": 573} {"train_loss": -36.75905227661133, "global_step": 69447, "epoch": 573} {"train_loss": -36.9968376159668, "global_step": 69448, "epoch": 573} {"train_loss": -36.402427673339844, "global_step": 69449, "epoch": 573} {"train_loss": -37.140296936035156, "global_step": 69450, "epoch": 573} {"train_loss": -36.80181884765625, "global_step": 69451, "epoch": 573} {"train_loss": -36.59536361694336, "global_step": 69452, "epoch": 573} {"train_loss": -35.811169774079126, "global_step": 69453, "epoch": 573, "val_loss": 2729433.0} {"train_loss": -36.814327239990234, "global_step": 69454, "epoch": 574} {"train_loss": -36.685699462890625, "global_step": 69455, "epoch": 574} {"train_loss": -37.212127685546875, "global_step": 69456, "epoch": 574} {"train_loss": -36.84112548828125, "global_step": 69457, "epoch": 574} {"train_loss": -37.3350944519043, "global_step": 69458, "epoch": 574} {"train_loss": -36.87945556640625, "global_step": 69459, "epoch": 574} {"train_loss": -37.297306060791016, "global_step": 69460, "epoch": 574} {"train_loss": -37.26721954345703, "global_step": 69461, "epoch": 574} {"train_loss": -37.09197998046875, "global_step": 69462, "epoch": 574} {"train_loss": -37.049861907958984, "global_step": 69463, "epoch": 574} {"train_loss": -37.81284713745117, "global_step": 69464, "epoch": 574} {"train_loss": -37.36948776245117, "global_step": 69465, "epoch": 574} {"train_loss": -36.969398498535156, "global_step": 69466, "epoch": 574} {"train_loss": -36.61991500854492, "global_step": 69467, "epoch": 574} {"train_loss": -37.37221145629883, "global_step": 69468, "epoch": 574} {"train_loss": -37.36093521118164, "global_step": 69469, "epoch": 574} {"train_loss": -37.593231201171875, "global_step": 69470, "epoch": 574} {"train_loss": -37.48084259033203, "global_step": 69471, "epoch": 574} {"train_loss": -37.820404052734375, "global_step": 69472, "epoch": 574} {"train_loss": -37.10138702392578, "global_step": 69473, "epoch": 574} {"train_loss": -37.20760726928711, "global_step": 69474, "epoch": 574} {"train_loss": -37.621826171875, "global_step": 69475, "epoch": 574} {"train_loss": -37.98291015625, "global_step": 69476, "epoch": 574} {"train_loss": -37.642677307128906, "global_step": 69477, "epoch": 574} {"train_loss": -37.171051025390625, "global_step": 69478, "epoch": 574} {"train_loss": -37.16141891479492, "global_step": 69479, "epoch": 574} {"train_loss": -37.3613395690918, "global_step": 69480, "epoch": 574} {"train_loss": -37.618377685546875, "global_step": 69481, "epoch": 574} {"train_loss": -37.219024658203125, "global_step": 69482, "epoch": 574} {"train_loss": -37.32733917236328, "global_step": 69483, "epoch": 574} {"train_loss": -37.28890609741211, "global_step": 69484, "epoch": 574} {"train_loss": -37.465396881103516, "global_step": 69485, "epoch": 574} {"train_loss": -36.59835433959961, "global_step": 69486, "epoch": 574} {"train_loss": -37.84210205078125, "global_step": 69487, "epoch": 574} {"train_loss": -37.46062469482422, "global_step": 69488, "epoch": 574} {"train_loss": -37.3836555480957, "global_step": 69489, "epoch": 574} {"train_loss": -37.934139251708984, "global_step": 69490, "epoch": 574} {"train_loss": -37.293094635009766, "global_step": 69491, "epoch": 574} {"train_loss": -37.29348373413086, "global_step": 69492, "epoch": 574} {"train_loss": -37.65172576904297, "global_step": 69493, "epoch": 574} {"train_loss": -36.86101150512695, "global_step": 69494, "epoch": 574} {"train_loss": -36.30081558227539, "global_step": 69495, "epoch": 574} {"train_loss": -37.46413803100586, "global_step": 69496, "epoch": 574} {"train_loss": -34.59047317504883, "global_step": 69497, "epoch": 574} {"train_loss": -35.34162521362305, "global_step": 69498, "epoch": 574} {"train_loss": -34.77408981323242, "global_step": 69499, "epoch": 574} {"train_loss": -35.45920181274414, "global_step": 69500, "epoch": 574} {"train_loss": -36.46229934692383, "global_step": 69501, "epoch": 574} {"train_loss": -35.367713928222656, "global_step": 69502, "epoch": 574} {"train_loss": -33.83572769165039, "global_step": 69503, "epoch": 574} {"train_loss": -33.060604095458984, "global_step": 69504, "epoch": 574} {"train_loss": -33.622314453125, "global_step": 69505, "epoch": 574} {"train_loss": -30.507963180541992, "global_step": 69506, "epoch": 574} {"train_loss": -29.449548721313477, "global_step": 69507, "epoch": 574} {"train_loss": -31.477689743041992, "global_step": 69508, "epoch": 574} {"train_loss": -35.34072494506836, "global_step": 69509, "epoch": 574} {"train_loss": -27.673004150390625, "global_step": 69510, "epoch": 574} {"train_loss": -30.883893966674805, "global_step": 69511, "epoch": 574} {"train_loss": -33.735008239746094, "global_step": 69512, "epoch": 574} {"train_loss": -32.286895751953125, "global_step": 69513, "epoch": 574} {"train_loss": -29.472930908203125, "global_step": 69514, "epoch": 574} {"train_loss": -31.9858455657959, "global_step": 69515, "epoch": 574} {"train_loss": -34.145423889160156, "global_step": 69516, "epoch": 574} {"train_loss": -35.338134765625, "global_step": 69517, "epoch": 574} {"train_loss": -34.54513168334961, "global_step": 69518, "epoch": 574} {"train_loss": -32.178340911865234, "global_step": 69519, "epoch": 574} {"train_loss": -34.29530715942383, "global_step": 69520, "epoch": 574} {"train_loss": -32.10197067260742, "global_step": 69521, "epoch": 574} {"train_loss": -33.725013732910156, "global_step": 69522, "epoch": 574} {"train_loss": -32.96206283569336, "global_step": 69523, "epoch": 574} {"train_loss": -35.261531829833984, "global_step": 69524, "epoch": 574} {"train_loss": -34.394771575927734, "global_step": 69525, "epoch": 574} {"train_loss": -35.16978073120117, "global_step": 69526, "epoch": 574} {"train_loss": -35.33435821533203, "global_step": 69527, "epoch": 574} {"train_loss": -33.80463790893555, "global_step": 69528, "epoch": 574} {"train_loss": -34.6721305847168, "global_step": 69529, "epoch": 574} {"train_loss": -32.608699798583984, "global_step": 69530, "epoch": 574} {"train_loss": -35.020896911621094, "global_step": 69531, "epoch": 574} {"train_loss": -34.89939498901367, "global_step": 69532, "epoch": 574} {"train_loss": -35.21805953979492, "global_step": 69533, "epoch": 574} {"train_loss": -35.48762130737305, "global_step": 69534, "epoch": 574} {"train_loss": -35.85306167602539, "global_step": 69535, "epoch": 574} {"train_loss": -35.68806076049805, "global_step": 69536, "epoch": 574} {"train_loss": -35.46772384643555, "global_step": 69537, "epoch": 574} {"train_loss": -35.0423469543457, "global_step": 69538, "epoch": 574} {"train_loss": -34.89177322387695, "global_step": 69539, "epoch": 574} {"train_loss": -35.6366081237793, "global_step": 69540, "epoch": 574} {"train_loss": -35.45487594604492, "global_step": 69541, "epoch": 574} {"train_loss": -35.50387191772461, "global_step": 69542, "epoch": 574} {"train_loss": -35.20857238769531, "global_step": 69543, "epoch": 574} {"train_loss": -36.220855712890625, "global_step": 69544, "epoch": 574} {"train_loss": -33.11765670776367, "global_step": 69545, "epoch": 574} {"train_loss": -35.873226165771484, "global_step": 69546, "epoch": 574} {"train_loss": -36.210262298583984, "global_step": 69547, "epoch": 574} {"train_loss": -35.77028274536133, "global_step": 69548, "epoch": 574} {"train_loss": -36.390254974365234, "global_step": 69549, "epoch": 574} {"train_loss": -36.1378059387207, "global_step": 69550, "epoch": 574} {"train_loss": -35.99594497680664, "global_step": 69551, "epoch": 574} {"train_loss": -36.32091522216797, "global_step": 69552, "epoch": 574} {"train_loss": -34.903724670410156, "global_step": 69553, "epoch": 574} {"train_loss": -35.992820739746094, "global_step": 69554, "epoch": 574} {"train_loss": -36.10860824584961, "global_step": 69555, "epoch": 574} {"train_loss": -36.330413818359375, "global_step": 69556, "epoch": 574} {"train_loss": -36.21000671386719, "global_step": 69557, "epoch": 574} {"train_loss": -36.62963104248047, "global_step": 69558, "epoch": 574} {"train_loss": -36.0181770324707, "global_step": 69559, "epoch": 574} {"train_loss": -36.591041564941406, "global_step": 69560, "epoch": 574} {"train_loss": -36.15642166137695, "global_step": 69561, "epoch": 574} {"train_loss": -36.67430114746094, "global_step": 69562, "epoch": 574} {"train_loss": -36.95619583129883, "global_step": 69563, "epoch": 574} {"train_loss": -36.73577880859375, "global_step": 69564, "epoch": 574} {"train_loss": -36.4012451171875, "global_step": 69565, "epoch": 574} {"train_loss": -36.70103454589844, "global_step": 69566, "epoch": 574} {"train_loss": -36.478919982910156, "global_step": 69567, "epoch": 574} {"train_loss": -37.11381912231445, "global_step": 69568, "epoch": 574} {"train_loss": -36.98777389526367, "global_step": 69569, "epoch": 574} {"train_loss": -36.86931610107422, "global_step": 69570, "epoch": 574} {"train_loss": -37.04592514038086, "global_step": 69571, "epoch": 574} {"train_loss": -36.64107131958008, "global_step": 69572, "epoch": 574} {"train_loss": -36.16782760620117, "global_step": 69573, "epoch": 574} {"train_loss": -35.73127101866667, "global_step": 69574, "epoch": 574, "val_loss": 2570708.25} {"train_loss": -36.715518951416016, "global_step": 69575, "epoch": 575} {"train_loss": -37.1053466796875, "global_step": 69576, "epoch": 575} {"train_loss": -37.48127365112305, "global_step": 69577, "epoch": 575} {"train_loss": -37.24645233154297, "global_step": 69578, "epoch": 575} {"train_loss": -36.958717346191406, "global_step": 69579, "epoch": 575} {"train_loss": -37.1049919128418, "global_step": 69580, "epoch": 575} {"train_loss": -36.38330078125, "global_step": 69581, "epoch": 575} {"train_loss": -37.1181755065918, "global_step": 69582, "epoch": 575} {"train_loss": -36.71390914916992, "global_step": 69583, "epoch": 575} {"train_loss": -37.50299835205078, "global_step": 69584, "epoch": 575} {"train_loss": -37.47256088256836, "global_step": 69585, "epoch": 575} {"train_loss": -36.50498962402344, "global_step": 69586, "epoch": 575} {"train_loss": -36.68661880493164, "global_step": 69587, "epoch": 575} {"train_loss": -37.56364059448242, "global_step": 69588, "epoch": 575} {"train_loss": -37.21036148071289, "global_step": 69589, "epoch": 575} {"train_loss": -36.95652770996094, "global_step": 69590, "epoch": 575} {"train_loss": -35.92522430419922, "global_step": 69591, "epoch": 575} {"train_loss": -36.52513122558594, "global_step": 69592, "epoch": 575} {"train_loss": -37.250118255615234, "global_step": 69593, "epoch": 575} {"train_loss": -37.42075729370117, "global_step": 69594, "epoch": 575} {"train_loss": -37.838905334472656, "global_step": 69595, "epoch": 575} {"train_loss": -37.21893310546875, "global_step": 69596, "epoch": 575} {"train_loss": -37.38010025024414, "global_step": 69597, "epoch": 575} {"train_loss": -36.281280517578125, "global_step": 69598, "epoch": 575} {"train_loss": -35.59026336669922, "global_step": 69599, "epoch": 575} {"train_loss": -34.71656799316406, "global_step": 69600, "epoch": 575} {"train_loss": -34.96099090576172, "global_step": 69601, "epoch": 575} {"train_loss": -35.038692474365234, "global_step": 69602, "epoch": 575} {"train_loss": -36.7473030090332, "global_step": 69603, "epoch": 575} {"train_loss": -37.324520111083984, "global_step": 69604, "epoch": 575} {"train_loss": -35.86820602416992, "global_step": 69605, "epoch": 575} {"train_loss": -36.60111618041992, "global_step": 69606, "epoch": 575} {"train_loss": -37.14815139770508, "global_step": 69607, "epoch": 575} {"train_loss": -37.759002685546875, "global_step": 69608, "epoch": 575} {"train_loss": -36.01168441772461, "global_step": 69609, "epoch": 575} {"train_loss": -35.82046127319336, "global_step": 69610, "epoch": 575} {"train_loss": -37.026039123535156, "global_step": 69611, "epoch": 575} {"train_loss": -37.27334213256836, "global_step": 69612, "epoch": 575} {"train_loss": -36.79167556762695, "global_step": 69613, "epoch": 575} {"train_loss": -37.03577423095703, "global_step": 69614, "epoch": 575} {"train_loss": -36.601863861083984, "global_step": 69615, "epoch": 575} {"train_loss": -35.833534240722656, "global_step": 69616, "epoch": 575} {"train_loss": -33.91594314575195, "global_step": 69617, "epoch": 575} {"train_loss": -35.30823516845703, "global_step": 69618, "epoch": 575} {"train_loss": -34.34037780761719, "global_step": 69619, "epoch": 575} {"train_loss": -37.27676010131836, "global_step": 69620, "epoch": 575} {"train_loss": -36.433170318603516, "global_step": 69621, "epoch": 575} {"train_loss": -34.77278518676758, "global_step": 69622, "epoch": 575} {"train_loss": -36.30323028564453, "global_step": 69623, "epoch": 575} {"train_loss": -32.8165283203125, "global_step": 69624, "epoch": 575} {"train_loss": -34.62882614135742, "global_step": 69625, "epoch": 575} {"train_loss": -35.902610778808594, "global_step": 69626, "epoch": 575} {"train_loss": -34.287071228027344, "global_step": 69627, "epoch": 575} {"train_loss": -36.28446578979492, "global_step": 69628, "epoch": 575} {"train_loss": -36.174922943115234, "global_step": 69629, "epoch": 575} {"train_loss": -35.364593505859375, "global_step": 69630, "epoch": 575} {"train_loss": -33.94047164916992, "global_step": 69631, "epoch": 575} {"train_loss": -36.0876579284668, "global_step": 69632, "epoch": 575} {"train_loss": -35.204750061035156, "global_step": 69633, "epoch": 575} {"train_loss": -34.05793380737305, "global_step": 69634, "epoch": 575} {"train_loss": -34.38135528564453, "global_step": 69635, "epoch": 575} {"train_loss": -36.1338996887207, "global_step": 69636, "epoch": 575} {"train_loss": -35.5146598815918, "global_step": 69637, "epoch": 575} {"train_loss": -33.82128143310547, "global_step": 69638, "epoch": 575} {"train_loss": -36.0970573425293, "global_step": 69639, "epoch": 575} {"train_loss": -35.69136047363281, "global_step": 69640, "epoch": 575} {"train_loss": -33.504371643066406, "global_step": 69641, "epoch": 575} {"train_loss": -36.628841400146484, "global_step": 69642, "epoch": 575} {"train_loss": -35.8204460144043, "global_step": 69643, "epoch": 575} {"train_loss": -36.272308349609375, "global_step": 69644, "epoch": 575} {"train_loss": -36.2998161315918, "global_step": 69645, "epoch": 575} {"train_loss": -36.88201904296875, "global_step": 69646, "epoch": 575} {"train_loss": -35.4425048828125, "global_step": 69647, "epoch": 575} {"train_loss": -36.8730583190918, "global_step": 69648, "epoch": 575} {"train_loss": -35.91860580444336, "global_step": 69649, "epoch": 575} {"train_loss": -36.78974151611328, "global_step": 69650, "epoch": 575} {"train_loss": -36.16621017456055, "global_step": 69651, "epoch": 575} {"train_loss": -36.31752395629883, "global_step": 69652, "epoch": 575} {"train_loss": -36.60298538208008, "global_step": 69653, "epoch": 575} {"train_loss": -36.89070510864258, "global_step": 69654, "epoch": 575} {"train_loss": -36.784576416015625, "global_step": 69655, "epoch": 575} {"train_loss": -36.5104866027832, "global_step": 69656, "epoch": 575} {"train_loss": -36.7522087097168, "global_step": 69657, "epoch": 575} {"train_loss": -37.0947151184082, "global_step": 69658, "epoch": 575} {"train_loss": -37.35659408569336, "global_step": 69659, "epoch": 575} {"train_loss": -36.82078170776367, "global_step": 69660, "epoch": 575} {"train_loss": -36.83102035522461, "global_step": 69661, "epoch": 575} {"train_loss": -37.12953567504883, "global_step": 69662, "epoch": 575} {"train_loss": -36.9066162109375, "global_step": 69663, "epoch": 575} {"train_loss": -36.93165588378906, "global_step": 69664, "epoch": 575} {"train_loss": -36.8192024230957, "global_step": 69665, "epoch": 575} {"train_loss": -36.91452407836914, "global_step": 69666, "epoch": 575} {"train_loss": -37.13285446166992, "global_step": 69667, "epoch": 575} {"train_loss": -37.49484634399414, "global_step": 69668, "epoch": 575} {"train_loss": -37.11148452758789, "global_step": 69669, "epoch": 575} {"train_loss": -37.276729583740234, "global_step": 69670, "epoch": 575} {"train_loss": -37.24392318725586, "global_step": 69671, "epoch": 575} {"train_loss": -37.65031814575195, "global_step": 69672, "epoch": 575} {"train_loss": -37.22716522216797, "global_step": 69673, "epoch": 575} {"train_loss": -37.27727508544922, "global_step": 69674, "epoch": 575} {"train_loss": -37.3311767578125, "global_step": 69675, "epoch": 575} {"train_loss": -37.782867431640625, "global_step": 69676, "epoch": 575} {"train_loss": -37.25780487060547, "global_step": 69677, "epoch": 575} {"train_loss": -37.92719268798828, "global_step": 69678, "epoch": 575} {"train_loss": -37.46624755859375, "global_step": 69679, "epoch": 575} {"train_loss": -37.55752182006836, "global_step": 69680, "epoch": 575} {"train_loss": -37.83083724975586, "global_step": 69681, "epoch": 575} {"train_loss": -37.367897033691406, "global_step": 69682, "epoch": 575} {"train_loss": -37.50037384033203, "global_step": 69683, "epoch": 575} {"train_loss": -37.833919525146484, "global_step": 69684, "epoch": 575} {"train_loss": -36.697288513183594, "global_step": 69685, "epoch": 575} {"train_loss": -36.76410675048828, "global_step": 69686, "epoch": 575} {"train_loss": -35.24789810180664, "global_step": 69687, "epoch": 575} {"train_loss": -33.178829193115234, "global_step": 69688, "epoch": 575} {"train_loss": -27.268522262573242, "global_step": 69689, "epoch": 575} {"train_loss": -26.29764175415039, "global_step": 69690, "epoch": 575} {"train_loss": -32.32460403442383, "global_step": 69691, "epoch": 575} {"train_loss": -36.832847595214844, "global_step": 69692, "epoch": 575} {"train_loss": -33.35988998413086, "global_step": 69693, "epoch": 575} {"train_loss": -34.61286163330078, "global_step": 69694, "epoch": 575} {"train_loss": -36.20309708335183, "global_step": 69695, "epoch": 575, "val_loss": 2578533.0} {"train_loss": -35.93572998046875, "global_step": 69696, "epoch": 576} {"train_loss": -34.47163009643555, "global_step": 69697, "epoch": 576} {"train_loss": -34.430267333984375, "global_step": 69698, "epoch": 576} {"train_loss": -36.63300704956055, "global_step": 69699, "epoch": 576} {"train_loss": -35.707088470458984, "global_step": 69700, "epoch": 576} {"train_loss": -36.62479782104492, "global_step": 69701, "epoch": 576} {"train_loss": -35.92607498168945, "global_step": 69702, "epoch": 576} {"train_loss": -37.21218490600586, "global_step": 69703, "epoch": 576} {"train_loss": -36.243797302246094, "global_step": 69704, "epoch": 576} {"train_loss": -37.1972770690918, "global_step": 69705, "epoch": 576} {"train_loss": -36.162994384765625, "global_step": 69706, "epoch": 576} {"train_loss": -37.43637466430664, "global_step": 69707, "epoch": 576} {"train_loss": -36.39296340942383, "global_step": 69708, "epoch": 576} {"train_loss": -36.58064651489258, "global_step": 69709, "epoch": 576} {"train_loss": -37.33486557006836, "global_step": 69710, "epoch": 576} {"train_loss": -36.78286361694336, "global_step": 69711, "epoch": 576} {"train_loss": -37.10578536987305, "global_step": 69712, "epoch": 576} {"train_loss": -37.294708251953125, "global_step": 69713, "epoch": 576} {"train_loss": -37.051761627197266, "global_step": 69714, "epoch": 576} {"train_loss": -37.30284881591797, "global_step": 69715, "epoch": 576} {"train_loss": -37.16498947143555, "global_step": 69716, "epoch": 576} {"train_loss": -36.547752380371094, "global_step": 69717, "epoch": 576} {"train_loss": -36.8944091796875, "global_step": 69718, "epoch": 576} {"train_loss": -36.0416145324707, "global_step": 69719, "epoch": 576} {"train_loss": -36.30777359008789, "global_step": 69720, "epoch": 576} {"train_loss": -36.4208984375, "global_step": 69721, "epoch": 576} {"train_loss": -36.89435958862305, "global_step": 69722, "epoch": 576} {"train_loss": -36.7687873840332, "global_step": 69723, "epoch": 576} {"train_loss": -37.22949981689453, "global_step": 69724, "epoch": 576} {"train_loss": -37.213436126708984, "global_step": 69725, "epoch": 576} {"train_loss": -36.863548278808594, "global_step": 69726, "epoch": 576} {"train_loss": -36.9005126953125, "global_step": 69727, "epoch": 576} {"train_loss": -37.174537658691406, "global_step": 69728, "epoch": 576} {"train_loss": -36.581146240234375, "global_step": 69729, "epoch": 576} {"train_loss": -36.94080352783203, "global_step": 69730, "epoch": 576} {"train_loss": -37.333274841308594, "global_step": 69731, "epoch": 576} {"train_loss": -37.07664108276367, "global_step": 69732, "epoch": 576} {"train_loss": -37.29450607299805, "global_step": 69733, "epoch": 576} {"train_loss": -37.1842041015625, "global_step": 69734, "epoch": 576} {"train_loss": -37.02579879760742, "global_step": 69735, "epoch": 576} {"train_loss": -37.70305633544922, "global_step": 69736, "epoch": 576} {"train_loss": -36.012489318847656, "global_step": 69737, "epoch": 576} {"train_loss": -37.29219436645508, "global_step": 69738, "epoch": 576} {"train_loss": -36.43117141723633, "global_step": 69739, "epoch": 576} {"train_loss": -37.224910736083984, "global_step": 69740, "epoch": 576} {"train_loss": -37.18382263183594, "global_step": 69741, "epoch": 576} {"train_loss": -36.59743881225586, "global_step": 69742, "epoch": 576} {"train_loss": -37.11549758911133, "global_step": 69743, "epoch": 576} {"train_loss": -36.0813102722168, "global_step": 69744, "epoch": 576} {"train_loss": -36.289974212646484, "global_step": 69745, "epoch": 576} {"train_loss": -37.36979293823242, "global_step": 69746, "epoch": 576} {"train_loss": -35.99666213989258, "global_step": 69747, "epoch": 576} {"train_loss": -35.98714828491211, "global_step": 69748, "epoch": 576} {"train_loss": -34.65857696533203, "global_step": 69749, "epoch": 576} {"train_loss": -28.705474853515625, "global_step": 69750, "epoch": 576} {"train_loss": -18.967695236206055, "global_step": 69751, "epoch": 576} {"train_loss": -20.515361785888672, "global_step": 69752, "epoch": 576} {"train_loss": -33.08253479003906, "global_step": 69753, "epoch": 576} {"train_loss": -35.0548210144043, "global_step": 69754, "epoch": 576} {"train_loss": -32.08674240112305, "global_step": 69755, "epoch": 576} {"train_loss": -34.32865524291992, "global_step": 69756, "epoch": 576} {"train_loss": -32.46853256225586, "global_step": 69757, "epoch": 576} {"train_loss": -32.10798263549805, "global_step": 69758, "epoch": 576} {"train_loss": -35.19900131225586, "global_step": 69759, "epoch": 576} {"train_loss": -35.42911911010742, "global_step": 69760, "epoch": 576} {"train_loss": -35.267311096191406, "global_step": 69761, "epoch": 576} {"train_loss": -34.76944351196289, "global_step": 69762, "epoch": 576} {"train_loss": -35.312374114990234, "global_step": 69763, "epoch": 576} {"train_loss": -35.006526947021484, "global_step": 69764, "epoch": 576} {"train_loss": -35.23828887939453, "global_step": 69765, "epoch": 576} {"train_loss": -34.546382904052734, "global_step": 69766, "epoch": 576} {"train_loss": -36.31400680541992, "global_step": 69767, "epoch": 576} {"train_loss": -35.070716857910156, "global_step": 69768, "epoch": 576} {"train_loss": -36.26496124267578, "global_step": 69769, "epoch": 576} {"train_loss": -35.73676300048828, "global_step": 69770, "epoch": 576} {"train_loss": -35.92910385131836, "global_step": 69771, "epoch": 576} {"train_loss": -36.32859420776367, "global_step": 69772, "epoch": 576} {"train_loss": -35.79981231689453, "global_step": 69773, "epoch": 576} {"train_loss": -35.457275390625, "global_step": 69774, "epoch": 576} {"train_loss": -36.41318893432617, "global_step": 69775, "epoch": 576} {"train_loss": -36.34158706665039, "global_step": 69776, "epoch": 576} {"train_loss": -36.21865463256836, "global_step": 69777, "epoch": 576} {"train_loss": -36.292030334472656, "global_step": 69778, "epoch": 576} {"train_loss": -36.01216506958008, "global_step": 69779, "epoch": 576} {"train_loss": -35.90496063232422, "global_step": 69780, "epoch": 576} {"train_loss": -36.87472152709961, "global_step": 69781, "epoch": 576} {"train_loss": -36.38468551635742, "global_step": 69782, "epoch": 576} {"train_loss": -35.6321907043457, "global_step": 69783, "epoch": 576} {"train_loss": -36.873111724853516, "global_step": 69784, "epoch": 576} {"train_loss": -36.56519317626953, "global_step": 69785, "epoch": 576} {"train_loss": -36.81881332397461, "global_step": 69786, "epoch": 576} {"train_loss": -35.87896728515625, "global_step": 69787, "epoch": 576} {"train_loss": -36.4197998046875, "global_step": 69788, "epoch": 576} {"train_loss": -36.586029052734375, "global_step": 69789, "epoch": 576} {"train_loss": -36.759613037109375, "global_step": 69790, "epoch": 576} {"train_loss": -36.41591262817383, "global_step": 69791, "epoch": 576} {"train_loss": -36.68709945678711, "global_step": 69792, "epoch": 576} {"train_loss": -36.69733428955078, "global_step": 69793, "epoch": 576} {"train_loss": -37.06928634643555, "global_step": 69794, "epoch": 576} {"train_loss": -36.795692443847656, "global_step": 69795, "epoch": 576} {"train_loss": -36.663368225097656, "global_step": 69796, "epoch": 576} {"train_loss": -36.926048278808594, "global_step": 69797, "epoch": 576} {"train_loss": -37.040313720703125, "global_step": 69798, "epoch": 576} {"train_loss": -36.27166748046875, "global_step": 69799, "epoch": 576} {"train_loss": -36.1042594909668, "global_step": 69800, "epoch": 576} {"train_loss": -36.724151611328125, "global_step": 69801, "epoch": 576} {"train_loss": -36.998592376708984, "global_step": 69802, "epoch": 576} {"train_loss": -36.42367172241211, "global_step": 69803, "epoch": 576} {"train_loss": -35.76475524902344, "global_step": 69804, "epoch": 576} {"train_loss": -35.77274703979492, "global_step": 69805, "epoch": 576} {"train_loss": -37.084896087646484, "global_step": 69806, "epoch": 576} {"train_loss": -37.14429473876953, "global_step": 69807, "epoch": 576} {"train_loss": -35.83419418334961, "global_step": 69808, "epoch": 576} {"train_loss": -34.402339935302734, "global_step": 69809, "epoch": 576} {"train_loss": -33.7071647644043, "global_step": 69810, "epoch": 576} {"train_loss": -35.4511604309082, "global_step": 69811, "epoch": 576} {"train_loss": -36.817298889160156, "global_step": 69812, "epoch": 576} {"train_loss": -37.69968795776367, "global_step": 69813, "epoch": 576} {"train_loss": -37.038177490234375, "global_step": 69814, "epoch": 576} {"train_loss": -36.938167572021484, "global_step": 69815, "epoch": 576} {"train_loss": -35.90618415706414, "global_step": 69816, "epoch": 576, "val_loss": 2599741.25} {"train_loss": -36.97612762451172, "global_step": 69817, "epoch": 577} {"train_loss": -37.144561767578125, "global_step": 69818, "epoch": 577} {"train_loss": -37.58414077758789, "global_step": 69819, "epoch": 577} {"train_loss": -37.68550491333008, "global_step": 69820, "epoch": 577} {"train_loss": -37.28790283203125, "global_step": 69821, "epoch": 577} {"train_loss": -37.4321403503418, "global_step": 69822, "epoch": 577} {"train_loss": -37.438472747802734, "global_step": 69823, "epoch": 577} {"train_loss": -37.5222282409668, "global_step": 69824, "epoch": 577} {"train_loss": -37.39790344238281, "global_step": 69825, "epoch": 577} {"train_loss": -37.80686950683594, "global_step": 69826, "epoch": 577} {"train_loss": -37.27760314941406, "global_step": 69827, "epoch": 577} {"train_loss": -37.81241226196289, "global_step": 69828, "epoch": 577} {"train_loss": -37.69002151489258, "global_step": 69829, "epoch": 577} {"train_loss": -37.18219757080078, "global_step": 69830, "epoch": 577} {"train_loss": -36.874664306640625, "global_step": 69831, "epoch": 577} {"train_loss": -37.25094223022461, "global_step": 69832, "epoch": 577} {"train_loss": -37.30898666381836, "global_step": 69833, "epoch": 577} {"train_loss": -37.30031204223633, "global_step": 69834, "epoch": 577} {"train_loss": -36.7729606628418, "global_step": 69835, "epoch": 577} {"train_loss": -37.43062973022461, "global_step": 69836, "epoch": 577} {"train_loss": -36.3411979675293, "global_step": 69837, "epoch": 577} {"train_loss": -34.93845748901367, "global_step": 69838, "epoch": 577} {"train_loss": -34.36604690551758, "global_step": 69839, "epoch": 577} {"train_loss": -35.285770416259766, "global_step": 69840, "epoch": 577} {"train_loss": -35.44995880126953, "global_step": 69841, "epoch": 577} {"train_loss": -36.142860412597656, "global_step": 69842, "epoch": 577} {"train_loss": -36.35601806640625, "global_step": 69843, "epoch": 577} {"train_loss": -33.34527587890625, "global_step": 69844, "epoch": 577} {"train_loss": -36.46360397338867, "global_step": 69845, "epoch": 577} {"train_loss": -36.56993865966797, "global_step": 69846, "epoch": 577} {"train_loss": -35.90655517578125, "global_step": 69847, "epoch": 577} {"train_loss": -36.81267166137695, "global_step": 69848, "epoch": 577} {"train_loss": -35.73316192626953, "global_step": 69849, "epoch": 577} {"train_loss": -37.489723205566406, "global_step": 69850, "epoch": 577} {"train_loss": -36.593605041503906, "global_step": 69851, "epoch": 577} {"train_loss": -36.61777877807617, "global_step": 69852, "epoch": 577} {"train_loss": -36.60908889770508, "global_step": 69853, "epoch": 577} {"train_loss": -28.726831436157227, "global_step": 69854, "epoch": 577} {"train_loss": -37.00762939453125, "global_step": 69855, "epoch": 577} {"train_loss": -33.486534118652344, "global_step": 69856, "epoch": 577} {"train_loss": -37.136775970458984, "global_step": 69857, "epoch": 577} {"train_loss": -36.736026763916016, "global_step": 69858, "epoch": 577} {"train_loss": -37.005287170410156, "global_step": 69859, "epoch": 577} {"train_loss": -36.79697799682617, "global_step": 69860, "epoch": 577} {"train_loss": -36.016883850097656, "global_step": 69861, "epoch": 577} {"train_loss": -36.6380500793457, "global_step": 69862, "epoch": 577} {"train_loss": -36.53534698486328, "global_step": 69863, "epoch": 577} {"train_loss": -36.101776123046875, "global_step": 69864, "epoch": 577} {"train_loss": -36.983638763427734, "global_step": 69865, "epoch": 577} {"train_loss": -36.43587112426758, "global_step": 69866, "epoch": 577} {"train_loss": -36.75667953491211, "global_step": 69867, "epoch": 577} {"train_loss": -37.327728271484375, "global_step": 69868, "epoch": 577} {"train_loss": -36.15235900878906, "global_step": 69869, "epoch": 577} {"train_loss": -36.7994384765625, "global_step": 69870, "epoch": 577} {"train_loss": -36.91530990600586, "global_step": 69871, "epoch": 577} {"train_loss": -36.83304977416992, "global_step": 69872, "epoch": 577} {"train_loss": -37.018524169921875, "global_step": 69873, "epoch": 577} {"train_loss": -37.27024459838867, "global_step": 69874, "epoch": 577} {"train_loss": -37.194705963134766, "global_step": 69875, "epoch": 577} {"train_loss": -36.766334533691406, "global_step": 69876, "epoch": 577} {"train_loss": -37.36302947998047, "global_step": 69877, "epoch": 577} {"train_loss": -37.042701721191406, "global_step": 69878, "epoch": 577} {"train_loss": -35.219520568847656, "global_step": 69879, "epoch": 577} {"train_loss": -36.14857482910156, "global_step": 69880, "epoch": 577} {"train_loss": -37.260040283203125, "global_step": 69881, "epoch": 577} {"train_loss": -36.36960983276367, "global_step": 69882, "epoch": 577} {"train_loss": -36.615447998046875, "global_step": 69883, "epoch": 577} {"train_loss": -36.06475067138672, "global_step": 69884, "epoch": 577} {"train_loss": -37.45915985107422, "global_step": 69885, "epoch": 577} {"train_loss": -36.06761169433594, "global_step": 69886, "epoch": 577} {"train_loss": -35.643310546875, "global_step": 69887, "epoch": 577} {"train_loss": -36.67607879638672, "global_step": 69888, "epoch": 577} {"train_loss": -36.80582809448242, "global_step": 69889, "epoch": 577} {"train_loss": -36.71257400512695, "global_step": 69890, "epoch": 577} {"train_loss": -35.72322463989258, "global_step": 69891, "epoch": 577} {"train_loss": -36.938411712646484, "global_step": 69892, "epoch": 577} {"train_loss": -36.98310852050781, "global_step": 69893, "epoch": 577} {"train_loss": -36.91171646118164, "global_step": 69894, "epoch": 577} {"train_loss": -36.23585891723633, "global_step": 69895, "epoch": 577} {"train_loss": -37.16425704956055, "global_step": 69896, "epoch": 577} {"train_loss": -37.01288986206055, "global_step": 69897, "epoch": 577} {"train_loss": -36.29993438720703, "global_step": 69898, "epoch": 577} {"train_loss": -35.584774017333984, "global_step": 69899, "epoch": 577} {"train_loss": -36.664119720458984, "global_step": 69900, "epoch": 577} {"train_loss": -36.99603271484375, "global_step": 69901, "epoch": 577} {"train_loss": -36.05997848510742, "global_step": 69902, "epoch": 577} {"train_loss": -30.331378936767578, "global_step": 69903, "epoch": 577} {"train_loss": -28.610685348510742, "global_step": 69904, "epoch": 577} {"train_loss": -35.2333984375, "global_step": 69905, "epoch": 577} {"train_loss": -35.93688201904297, "global_step": 69906, "epoch": 577} {"train_loss": -33.149410247802734, "global_step": 69907, "epoch": 577} {"train_loss": -34.60479736328125, "global_step": 69908, "epoch": 577} {"train_loss": -36.111385345458984, "global_step": 69909, "epoch": 577} {"train_loss": -36.17232894897461, "global_step": 69910, "epoch": 577} {"train_loss": -34.69852828979492, "global_step": 69911, "epoch": 577} {"train_loss": -35.42523193359375, "global_step": 69912, "epoch": 577} {"train_loss": -35.291542053222656, "global_step": 69913, "epoch": 577} {"train_loss": -35.730464935302734, "global_step": 69914, "epoch": 577} {"train_loss": -33.995697021484375, "global_step": 69915, "epoch": 577} {"train_loss": -35.94675827026367, "global_step": 69916, "epoch": 577} {"train_loss": -35.064083099365234, "global_step": 69917, "epoch": 577} {"train_loss": -35.950233459472656, "global_step": 69918, "epoch": 577} {"train_loss": -34.91743087768555, "global_step": 69919, "epoch": 577} {"train_loss": -36.98657989501953, "global_step": 69920, "epoch": 577} {"train_loss": -34.42115020751953, "global_step": 69921, "epoch": 577} {"train_loss": -36.40882110595703, "global_step": 69922, "epoch": 577} {"train_loss": -36.865272521972656, "global_step": 69923, "epoch": 577} {"train_loss": -35.003902435302734, "global_step": 69924, "epoch": 577} {"train_loss": -35.0131950378418, "global_step": 69925, "epoch": 577} {"train_loss": -36.64911651611328, "global_step": 69926, "epoch": 577} {"train_loss": -36.609527587890625, "global_step": 69927, "epoch": 577} {"train_loss": -37.04067611694336, "global_step": 69928, "epoch": 577} {"train_loss": -35.42488098144531, "global_step": 69929, "epoch": 577} {"train_loss": -37.090065002441406, "global_step": 69930, "epoch": 577} {"train_loss": -36.80417251586914, "global_step": 69931, "epoch": 577} {"train_loss": -37.132328033447266, "global_step": 69932, "epoch": 577} {"train_loss": -37.28825759887695, "global_step": 69933, "epoch": 577} {"train_loss": -36.363441467285156, "global_step": 69934, "epoch": 577} {"train_loss": -36.87174987792969, "global_step": 69935, "epoch": 577} {"train_loss": -36.74960708618164, "global_step": 69936, "epoch": 577} {"train_loss": -36.24500492190526, "global_step": 69937, "epoch": 577, "val_loss": 2558495.5} {"train_loss": -36.090572357177734, "global_step": 69938, "epoch": 578} {"train_loss": -36.67647933959961, "global_step": 69939, "epoch": 578} {"train_loss": -37.12726974487305, "global_step": 69940, "epoch": 578} {"train_loss": -36.837886810302734, "global_step": 69941, "epoch": 578} {"train_loss": -36.012359619140625, "global_step": 69942, "epoch": 578} {"train_loss": -36.921424865722656, "global_step": 69943, "epoch": 578} {"train_loss": -36.75638961791992, "global_step": 69944, "epoch": 578} {"train_loss": -36.19631576538086, "global_step": 69945, "epoch": 578} {"train_loss": -37.226348876953125, "global_step": 69946, "epoch": 578} {"train_loss": -37.24940872192383, "global_step": 69947, "epoch": 578} {"train_loss": -36.578067779541016, "global_step": 69948, "epoch": 578} {"train_loss": -37.11683654785156, "global_step": 69949, "epoch": 578} {"train_loss": -36.69697189331055, "global_step": 69950, "epoch": 578} {"train_loss": -37.09895706176758, "global_step": 69951, "epoch": 578} {"train_loss": -37.555294036865234, "global_step": 69952, "epoch": 578} {"train_loss": -36.424312591552734, "global_step": 69953, "epoch": 578} {"train_loss": -37.50914001464844, "global_step": 69954, "epoch": 578} {"train_loss": -36.53031921386719, "global_step": 69955, "epoch": 578} {"train_loss": -37.421607971191406, "global_step": 69956, "epoch": 578} {"train_loss": -37.622703552246094, "global_step": 69957, "epoch": 578} {"train_loss": -36.857479095458984, "global_step": 69958, "epoch": 578} {"train_loss": -37.11260986328125, "global_step": 69959, "epoch": 578} {"train_loss": -36.982051849365234, "global_step": 69960, "epoch": 578} {"train_loss": -36.19735336303711, "global_step": 69961, "epoch": 578} {"train_loss": -37.123680114746094, "global_step": 69962, "epoch": 578} {"train_loss": -35.15468978881836, "global_step": 69963, "epoch": 578} {"train_loss": -35.872161865234375, "global_step": 69964, "epoch": 578} {"train_loss": -35.25812530517578, "global_step": 69965, "epoch": 578} {"train_loss": -36.775352478027344, "global_step": 69966, "epoch": 578} {"train_loss": -35.7403564453125, "global_step": 69967, "epoch": 578} {"train_loss": -34.64449691772461, "global_step": 69968, "epoch": 578} {"train_loss": -35.06372833251953, "global_step": 69969, "epoch": 578} {"train_loss": -33.2987174987793, "global_step": 69970, "epoch": 578} {"train_loss": -35.2895622253418, "global_step": 69971, "epoch": 578} {"train_loss": -31.44061851501465, "global_step": 69972, "epoch": 578} {"train_loss": -29.76304054260254, "global_step": 69973, "epoch": 578} {"train_loss": -31.24688720703125, "global_step": 69974, "epoch": 578} {"train_loss": -34.3580322265625, "global_step": 69975, "epoch": 578} {"train_loss": -29.91218376159668, "global_step": 69976, "epoch": 578} {"train_loss": -29.198272705078125, "global_step": 69977, "epoch": 578} {"train_loss": -34.873016357421875, "global_step": 69978, "epoch": 578} {"train_loss": -32.38676071166992, "global_step": 69979, "epoch": 578} {"train_loss": -32.423439025878906, "global_step": 69980, "epoch": 578} {"train_loss": -32.67781448364258, "global_step": 69981, "epoch": 578} {"train_loss": -35.148929595947266, "global_step": 69982, "epoch": 578} {"train_loss": -31.243152618408203, "global_step": 69983, "epoch": 578} {"train_loss": -30.53968620300293, "global_step": 69984, "epoch": 578} {"train_loss": -32.522884368896484, "global_step": 69985, "epoch": 578} {"train_loss": -31.17214012145996, "global_step": 69986, "epoch": 578} {"train_loss": -32.689212799072266, "global_step": 69987, "epoch": 578} {"train_loss": -33.3109245300293, "global_step": 69988, "epoch": 578} {"train_loss": -33.37482833862305, "global_step": 69989, "epoch": 578} {"train_loss": -33.92878341674805, "global_step": 69990, "epoch": 578} {"train_loss": -34.244503021240234, "global_step": 69991, "epoch": 578} {"train_loss": -33.7038459777832, "global_step": 69992, "epoch": 578} {"train_loss": -34.705081939697266, "global_step": 69993, "epoch": 578} {"train_loss": -33.612037658691406, "global_step": 69994, "epoch": 578} {"train_loss": -33.87086868286133, "global_step": 69995, "epoch": 578} {"train_loss": -34.38778305053711, "global_step": 69996, "epoch": 578} {"train_loss": -33.769371032714844, "global_step": 69997, "epoch": 578} {"train_loss": -34.20924758911133, "global_step": 69998, "epoch": 578} {"train_loss": -34.90842819213867, "global_step": 69999, "epoch": 578} {"train_loss": -34.94147872924805, "global_step": 70000, "epoch": 578} {"train_loss": -34.60403060913086, "global_step": 70001, "epoch": 578} {"train_loss": -34.388221740722656, "global_step": 70002, "epoch": 578} {"train_loss": -34.55304718017578, "global_step": 70003, "epoch": 578} {"train_loss": -34.527442932128906, "global_step": 70004, "epoch": 578} {"train_loss": -31.940475463867188, "global_step": 70005, "epoch": 578} {"train_loss": -34.70766830444336, "global_step": 70006, "epoch": 578} {"train_loss": -34.609066009521484, "global_step": 70007, "epoch": 578} {"train_loss": -34.10527420043945, "global_step": 70008, "epoch": 578} {"train_loss": -35.25308609008789, "global_step": 70009, "epoch": 578} {"train_loss": -35.377174377441406, "global_step": 70010, "epoch": 578} {"train_loss": -34.848751068115234, "global_step": 70011, "epoch": 578} {"train_loss": -34.97325134277344, "global_step": 70012, "epoch": 578} {"train_loss": -35.481563568115234, "global_step": 70013, "epoch": 578} {"train_loss": -35.174354553222656, "global_step": 70014, "epoch": 578} {"train_loss": -35.070472717285156, "global_step": 70015, "epoch": 578} {"train_loss": -32.397064208984375, "global_step": 70016, "epoch": 578} {"train_loss": -35.736202239990234, "global_step": 70017, "epoch": 578} {"train_loss": -35.73922348022461, "global_step": 70018, "epoch": 578} {"train_loss": -35.73673629760742, "global_step": 70019, "epoch": 578} {"train_loss": -35.65340805053711, "global_step": 70020, "epoch": 578} {"train_loss": -35.48435592651367, "global_step": 70021, "epoch": 578} {"train_loss": -35.966121673583984, "global_step": 70022, "epoch": 578} {"train_loss": -35.56053161621094, "global_step": 70023, "epoch": 578} {"train_loss": -35.50105285644531, "global_step": 70024, "epoch": 578} {"train_loss": -35.80525588989258, "global_step": 70025, "epoch": 578} {"train_loss": -36.1673698425293, "global_step": 70026, "epoch": 578} {"train_loss": -35.608482360839844, "global_step": 70027, "epoch": 578} {"train_loss": -35.9700813293457, "global_step": 70028, "epoch": 578} {"train_loss": -35.878326416015625, "global_step": 70029, "epoch": 578} {"train_loss": -36.224815368652344, "global_step": 70030, "epoch": 578} {"train_loss": -36.22564697265625, "global_step": 70031, "epoch": 578} {"train_loss": -34.90450668334961, "global_step": 70032, "epoch": 578} {"train_loss": -36.05256271362305, "global_step": 70033, "epoch": 578} {"train_loss": -35.730552673339844, "global_step": 70034, "epoch": 578} {"train_loss": -36.2794189453125, "global_step": 70035, "epoch": 578} {"train_loss": -36.24440383911133, "global_step": 70036, "epoch": 578} {"train_loss": -35.27995300292969, "global_step": 70037, "epoch": 578} {"train_loss": -36.054317474365234, "global_step": 70038, "epoch": 578} {"train_loss": -35.626827239990234, "global_step": 70039, "epoch": 578} {"train_loss": -35.3744010925293, "global_step": 70040, "epoch": 578} {"train_loss": -35.94000244140625, "global_step": 70041, "epoch": 578} {"train_loss": -35.55931091308594, "global_step": 70042, "epoch": 578} {"train_loss": -35.9304084777832, "global_step": 70043, "epoch": 578} {"train_loss": -36.119483947753906, "global_step": 70044, "epoch": 578} {"train_loss": -35.09089279174805, "global_step": 70045, "epoch": 578} {"train_loss": -36.71512222290039, "global_step": 70046, "epoch": 578} {"train_loss": -35.37380599975586, "global_step": 70047, "epoch": 578} {"train_loss": -35.00444412231445, "global_step": 70048, "epoch": 578} {"train_loss": -35.7471923828125, "global_step": 70049, "epoch": 578} {"train_loss": -36.29981994628906, "global_step": 70050, "epoch": 578} {"train_loss": -37.01931381225586, "global_step": 70051, "epoch": 578} {"train_loss": -35.38030242919922, "global_step": 70052, "epoch": 578} {"train_loss": -36.77146530151367, "global_step": 70053, "epoch": 578} {"train_loss": -36.363155364990234, "global_step": 70054, "epoch": 578} {"train_loss": -37.06869125366211, "global_step": 70055, "epoch": 578} {"train_loss": -35.82295608520508, "global_step": 70056, "epoch": 578} {"train_loss": -37.12911605834961, "global_step": 70057, "epoch": 578} {"train_loss": -35.15588024233983, "global_step": 70058, "epoch": 578, "val_loss": 2582511.75} {"train_loss": -36.101951599121094, "global_step": 70059, "epoch": 579} {"train_loss": -36.789939880371094, "global_step": 70060, "epoch": 579} {"train_loss": -36.91974639892578, "global_step": 70061, "epoch": 579} {"train_loss": -37.29317855834961, "global_step": 70062, "epoch": 579} {"train_loss": -37.062068939208984, "global_step": 70063, "epoch": 579} {"train_loss": -37.371986389160156, "global_step": 70064, "epoch": 579} {"train_loss": -37.342018127441406, "global_step": 70065, "epoch": 579} {"train_loss": -37.495384216308594, "global_step": 70066, "epoch": 579} {"train_loss": -37.467220306396484, "global_step": 70067, "epoch": 579} {"train_loss": -37.40176010131836, "global_step": 70068, "epoch": 579} {"train_loss": -37.50640869140625, "global_step": 70069, "epoch": 579} {"train_loss": -37.61725997924805, "global_step": 70070, "epoch": 579} {"train_loss": -37.20112609863281, "global_step": 70071, "epoch": 579} {"train_loss": -37.72543716430664, "global_step": 70072, "epoch": 579} {"train_loss": -37.2887077331543, "global_step": 70073, "epoch": 579} {"train_loss": -37.62191390991211, "global_step": 70074, "epoch": 579} {"train_loss": -37.14500427246094, "global_step": 70075, "epoch": 579} {"train_loss": -36.443939208984375, "global_step": 70076, "epoch": 579} {"train_loss": -34.906063079833984, "global_step": 70077, "epoch": 579} {"train_loss": -33.989051818847656, "global_step": 70078, "epoch": 579} {"train_loss": -31.76230812072754, "global_step": 70079, "epoch": 579} {"train_loss": -32.39656448364258, "global_step": 70080, "epoch": 579} {"train_loss": -32.54941940307617, "global_step": 70081, "epoch": 579} {"train_loss": -30.58977699279785, "global_step": 70082, "epoch": 579} {"train_loss": -31.406335830688477, "global_step": 70083, "epoch": 579} {"train_loss": -36.83783721923828, "global_step": 70084, "epoch": 579} {"train_loss": -32.9412727355957, "global_step": 70085, "epoch": 579} {"train_loss": -30.876758575439453, "global_step": 70086, "epoch": 579} {"train_loss": -34.46562576293945, "global_step": 70087, "epoch": 579} {"train_loss": -36.6453857421875, "global_step": 70088, "epoch": 579} {"train_loss": -33.921688079833984, "global_step": 70089, "epoch": 579} {"train_loss": -35.722633361816406, "global_step": 70090, "epoch": 579} {"train_loss": -36.40774154663086, "global_step": 70091, "epoch": 579} {"train_loss": -35.255859375, "global_step": 70092, "epoch": 579} {"train_loss": -35.677162170410156, "global_step": 70093, "epoch": 579} {"train_loss": -36.62289810180664, "global_step": 70094, "epoch": 579} {"train_loss": -36.432212829589844, "global_step": 70095, "epoch": 579} {"train_loss": -36.694580078125, "global_step": 70096, "epoch": 579} {"train_loss": -35.720516204833984, "global_step": 70097, "epoch": 579} {"train_loss": -37.02954864501953, "global_step": 70098, "epoch": 579} {"train_loss": -36.545310974121094, "global_step": 70099, "epoch": 579} {"train_loss": -36.63299560546875, "global_step": 70100, "epoch": 579} {"train_loss": -36.66410446166992, "global_step": 70101, "epoch": 579} {"train_loss": -36.319374084472656, "global_step": 70102, "epoch": 579} {"train_loss": -36.327327728271484, "global_step": 70103, "epoch": 579} {"train_loss": -36.156272888183594, "global_step": 70104, "epoch": 579} {"train_loss": -36.678524017333984, "global_step": 70105, "epoch": 579} {"train_loss": -35.77407455444336, "global_step": 70106, "epoch": 579} {"train_loss": -37.29738998413086, "global_step": 70107, "epoch": 579} {"train_loss": -36.86726760864258, "global_step": 70108, "epoch": 579} {"train_loss": -36.70551300048828, "global_step": 70109, "epoch": 579} {"train_loss": -36.304229736328125, "global_step": 70110, "epoch": 579} {"train_loss": -36.63298034667969, "global_step": 70111, "epoch": 579} {"train_loss": -36.75252151489258, "global_step": 70112, "epoch": 579} {"train_loss": -36.7807502746582, "global_step": 70113, "epoch": 579} {"train_loss": -36.687198638916016, "global_step": 70114, "epoch": 579} {"train_loss": -36.8643913269043, "global_step": 70115, "epoch": 579} {"train_loss": -36.8950309753418, "global_step": 70116, "epoch": 579} {"train_loss": -36.70675277709961, "global_step": 70117, "epoch": 579} {"train_loss": -36.61518096923828, "global_step": 70118, "epoch": 579} {"train_loss": -36.92550277709961, "global_step": 70119, "epoch": 579} {"train_loss": -37.16533279418945, "global_step": 70120, "epoch": 579} {"train_loss": -37.41709518432617, "global_step": 70121, "epoch": 579} {"train_loss": -37.500186920166016, "global_step": 70122, "epoch": 579} {"train_loss": -37.41271209716797, "global_step": 70123, "epoch": 579} {"train_loss": -37.503570556640625, "global_step": 70124, "epoch": 579} {"train_loss": -37.33650207519531, "global_step": 70125, "epoch": 579} {"train_loss": -37.51493835449219, "global_step": 70126, "epoch": 579} {"train_loss": -37.02357864379883, "global_step": 70127, "epoch": 579} {"train_loss": -37.3045768737793, "global_step": 70128, "epoch": 579} {"train_loss": -37.41762161254883, "global_step": 70129, "epoch": 579} {"train_loss": -37.77553176879883, "global_step": 70130, "epoch": 579} {"train_loss": -36.88175582885742, "global_step": 70131, "epoch": 579} {"train_loss": -37.686439514160156, "global_step": 70132, "epoch": 579} {"train_loss": -37.53115463256836, "global_step": 70133, "epoch": 579} {"train_loss": -37.76752853393555, "global_step": 70134, "epoch": 579} {"train_loss": -37.5302848815918, "global_step": 70135, "epoch": 579} {"train_loss": -37.692596435546875, "global_step": 70136, "epoch": 579} {"train_loss": -37.303565979003906, "global_step": 70137, "epoch": 579} {"train_loss": -37.16840362548828, "global_step": 70138, "epoch": 579} {"train_loss": -37.278564453125, "global_step": 70139, "epoch": 579} {"train_loss": -36.926429748535156, "global_step": 70140, "epoch": 579} {"train_loss": -35.27833557128906, "global_step": 70141, "epoch": 579} {"train_loss": -35.7436408996582, "global_step": 70142, "epoch": 579} {"train_loss": -37.50250244140625, "global_step": 70143, "epoch": 579} {"train_loss": -36.53892517089844, "global_step": 70144, "epoch": 579} {"train_loss": -34.474342346191406, "global_step": 70145, "epoch": 579} {"train_loss": -30.49457359313965, "global_step": 70146, "epoch": 579} {"train_loss": -29.68735122680664, "global_step": 70147, "epoch": 579} {"train_loss": -26.990934371948242, "global_step": 70148, "epoch": 579} {"train_loss": -27.671844482421875, "global_step": 70149, "epoch": 579} {"train_loss": -29.822263717651367, "global_step": 70150, "epoch": 579} {"train_loss": -35.68160629272461, "global_step": 70151, "epoch": 579} {"train_loss": -33.12742233276367, "global_step": 70152, "epoch": 579} {"train_loss": -36.72519302368164, "global_step": 70153, "epoch": 579} {"train_loss": -35.07805252075195, "global_step": 70154, "epoch": 579} {"train_loss": -35.8765754699707, "global_step": 70155, "epoch": 579} {"train_loss": -35.974021911621094, "global_step": 70156, "epoch": 579} {"train_loss": -36.29579544067383, "global_step": 70157, "epoch": 579} {"train_loss": -36.121341705322266, "global_step": 70158, "epoch": 579} {"train_loss": -36.8451042175293, "global_step": 70159, "epoch": 579} {"train_loss": -36.077606201171875, "global_step": 70160, "epoch": 579} {"train_loss": -37.132511138916016, "global_step": 70161, "epoch": 579} {"train_loss": -37.28953170776367, "global_step": 70162, "epoch": 579} {"train_loss": -36.73838424682617, "global_step": 70163, "epoch": 579} {"train_loss": -37.10552978515625, "global_step": 70164, "epoch": 579} {"train_loss": -36.802433013916016, "global_step": 70165, "epoch": 579} {"train_loss": -36.98869323730469, "global_step": 70166, "epoch": 579} {"train_loss": -37.44388961791992, "global_step": 70167, "epoch": 579} {"train_loss": -36.666255950927734, "global_step": 70168, "epoch": 579} {"train_loss": -36.735313415527344, "global_step": 70169, "epoch": 579} {"train_loss": -37.61547088623047, "global_step": 70170, "epoch": 579} {"train_loss": -37.0073356628418, "global_step": 70171, "epoch": 579} {"train_loss": -37.57794952392578, "global_step": 70172, "epoch": 579} {"train_loss": -37.21363067626953, "global_step": 70173, "epoch": 579} {"train_loss": -37.4025764465332, "global_step": 70174, "epoch": 579} {"train_loss": -37.66218185424805, "global_step": 70175, "epoch": 579} {"train_loss": -37.01150131225586, "global_step": 70176, "epoch": 579} {"train_loss": -37.32345199584961, "global_step": 70177, "epoch": 579} {"train_loss": -37.08024215698242, "global_step": 70178, "epoch": 579} {"train_loss": -36.120696517061596, "global_step": 70179, "epoch": 579, "val_loss": 2581373.75} {"train_loss": -37.59058380126953, "global_step": 70180, "epoch": 580} {"train_loss": -36.69343948364258, "global_step": 70181, "epoch": 580} {"train_loss": -37.29719161987305, "global_step": 70182, "epoch": 580} {"train_loss": -37.172245025634766, "global_step": 70183, "epoch": 580} {"train_loss": -37.23307418823242, "global_step": 70184, "epoch": 580} {"train_loss": -37.311058044433594, "global_step": 70185, "epoch": 580} {"train_loss": -37.14201354980469, "global_step": 70186, "epoch": 580} {"train_loss": -37.66682052612305, "global_step": 70187, "epoch": 580} {"train_loss": -36.978614807128906, "global_step": 70188, "epoch": 580} {"train_loss": -37.86483383178711, "global_step": 70189, "epoch": 580} {"train_loss": -37.4553108215332, "global_step": 70190, "epoch": 580} {"train_loss": -37.501243591308594, "global_step": 70191, "epoch": 580} {"train_loss": -36.9929313659668, "global_step": 70192, "epoch": 580} {"train_loss": -37.436981201171875, "global_step": 70193, "epoch": 580} {"train_loss": -36.932350158691406, "global_step": 70194, "epoch": 580} {"train_loss": -37.544612884521484, "global_step": 70195, "epoch": 580} {"train_loss": -37.2396240234375, "global_step": 70196, "epoch": 580} {"train_loss": -37.11359786987305, "global_step": 70197, "epoch": 580} {"train_loss": -37.56230545043945, "global_step": 70198, "epoch": 580} {"train_loss": -37.11848068237305, "global_step": 70199, "epoch": 580} {"train_loss": -37.03778839111328, "global_step": 70200, "epoch": 580} {"train_loss": -37.7369384765625, "global_step": 70201, "epoch": 580} {"train_loss": -36.752342224121094, "global_step": 70202, "epoch": 580} {"train_loss": -37.46706008911133, "global_step": 70203, "epoch": 580} {"train_loss": -37.30540084838867, "global_step": 70204, "epoch": 580} {"train_loss": -37.1324462890625, "global_step": 70205, "epoch": 580} {"train_loss": -36.35346603393555, "global_step": 70206, "epoch": 580} {"train_loss": -34.06753921508789, "global_step": 70207, "epoch": 580} {"train_loss": -36.36246871948242, "global_step": 70208, "epoch": 580} {"train_loss": -36.84482955932617, "global_step": 70209, "epoch": 580} {"train_loss": -36.1682243347168, "global_step": 70210, "epoch": 580} {"train_loss": -36.2307243347168, "global_step": 70211, "epoch": 580} {"train_loss": -36.96746826171875, "global_step": 70212, "epoch": 580} {"train_loss": -35.30524826049805, "global_step": 70213, "epoch": 580} {"train_loss": -36.6500244140625, "global_step": 70214, "epoch": 580} {"train_loss": -36.29973602294922, "global_step": 70215, "epoch": 580} {"train_loss": -35.94691467285156, "global_step": 70216, "epoch": 580} {"train_loss": -35.5288200378418, "global_step": 70217, "epoch": 580} {"train_loss": -36.8136100769043, "global_step": 70218, "epoch": 580} {"train_loss": -35.82609939575195, "global_step": 70219, "epoch": 580} {"train_loss": -35.450557708740234, "global_step": 70220, "epoch": 580} {"train_loss": -34.40867233276367, "global_step": 70221, "epoch": 580} {"train_loss": -35.78077697753906, "global_step": 70222, "epoch": 580} {"train_loss": -35.305992126464844, "global_step": 70223, "epoch": 580} {"train_loss": -36.028587341308594, "global_step": 70224, "epoch": 580} {"train_loss": -35.899261474609375, "global_step": 70225, "epoch": 580} {"train_loss": -36.587196350097656, "global_step": 70226, "epoch": 580} {"train_loss": -36.032470703125, "global_step": 70227, "epoch": 580} {"train_loss": -36.1099853515625, "global_step": 70228, "epoch": 580} {"train_loss": -35.648685455322266, "global_step": 70229, "epoch": 580} {"train_loss": -36.05581283569336, "global_step": 70230, "epoch": 580} {"train_loss": -37.30953598022461, "global_step": 70231, "epoch": 580} {"train_loss": -36.00075912475586, "global_step": 70232, "epoch": 580} {"train_loss": -36.043373107910156, "global_step": 70233, "epoch": 580} {"train_loss": -35.62827682495117, "global_step": 70234, "epoch": 580} {"train_loss": -33.97004318237305, "global_step": 70235, "epoch": 580} {"train_loss": -31.374820709228516, "global_step": 70236, "epoch": 580} {"train_loss": -31.42535972595215, "global_step": 70237, "epoch": 580} {"train_loss": -35.293697357177734, "global_step": 70238, "epoch": 580} {"train_loss": -36.38200759887695, "global_step": 70239, "epoch": 580} {"train_loss": -33.69306564331055, "global_step": 70240, "epoch": 580} {"train_loss": -31.727018356323242, "global_step": 70241, "epoch": 580} {"train_loss": -35.68160629272461, "global_step": 70242, "epoch": 580} {"train_loss": -36.09943771362305, "global_step": 70243, "epoch": 580} {"train_loss": -34.0794792175293, "global_step": 70244, "epoch": 580} {"train_loss": -36.40522384643555, "global_step": 70245, "epoch": 580} {"train_loss": -35.44179916381836, "global_step": 70246, "epoch": 580} {"train_loss": -34.84572219848633, "global_step": 70247, "epoch": 580} {"train_loss": -34.07352828979492, "global_step": 70248, "epoch": 580} {"train_loss": -33.13473892211914, "global_step": 70249, "epoch": 580} {"train_loss": -37.06180191040039, "global_step": 70250, "epoch": 580} {"train_loss": -34.802345275878906, "global_step": 70251, "epoch": 580} {"train_loss": -36.6917610168457, "global_step": 70252, "epoch": 580} {"train_loss": -36.019561767578125, "global_step": 70253, "epoch": 580} {"train_loss": -36.38057327270508, "global_step": 70254, "epoch": 580} {"train_loss": -35.123165130615234, "global_step": 70255, "epoch": 580} {"train_loss": -36.41270065307617, "global_step": 70256, "epoch": 580} {"train_loss": -36.20917510986328, "global_step": 70257, "epoch": 580} {"train_loss": -36.39059066772461, "global_step": 70258, "epoch": 580} {"train_loss": -36.77649688720703, "global_step": 70259, "epoch": 580} {"train_loss": -36.54680252075195, "global_step": 70260, "epoch": 580} {"train_loss": -37.087039947509766, "global_step": 70261, "epoch": 580} {"train_loss": -36.58394241333008, "global_step": 70262, "epoch": 580} {"train_loss": -36.97222900390625, "global_step": 70263, "epoch": 580} {"train_loss": -36.81562042236328, "global_step": 70264, "epoch": 580} {"train_loss": -36.2159423828125, "global_step": 70265, "epoch": 580} {"train_loss": -36.26395797729492, "global_step": 70266, "epoch": 580} {"train_loss": -36.901611328125, "global_step": 70267, "epoch": 580} {"train_loss": -37.22756576538086, "global_step": 70268, "epoch": 580} {"train_loss": -36.28353500366211, "global_step": 70269, "epoch": 580} {"train_loss": -36.95771408081055, "global_step": 70270, "epoch": 580} {"train_loss": -37.03379440307617, "global_step": 70271, "epoch": 580} {"train_loss": -36.91740036010742, "global_step": 70272, "epoch": 580} {"train_loss": -36.73629379272461, "global_step": 70273, "epoch": 580} {"train_loss": -37.27862548828125, "global_step": 70274, "epoch": 580} {"train_loss": -36.92158508300781, "global_step": 70275, "epoch": 580} {"train_loss": -36.99604034423828, "global_step": 70276, "epoch": 580} {"train_loss": -37.07018280029297, "global_step": 70277, "epoch": 580} {"train_loss": -37.387725830078125, "global_step": 70278, "epoch": 580} {"train_loss": -36.93905258178711, "global_step": 70279, "epoch": 580} {"train_loss": -37.055763244628906, "global_step": 70280, "epoch": 580} {"train_loss": -37.46964645385742, "global_step": 70281, "epoch": 580} {"train_loss": -37.10055160522461, "global_step": 70282, "epoch": 580} {"train_loss": -36.1132926940918, "global_step": 70283, "epoch": 580} {"train_loss": -36.20930099487305, "global_step": 70284, "epoch": 580} {"train_loss": -35.51458740234375, "global_step": 70285, "epoch": 580} {"train_loss": -36.305973052978516, "global_step": 70286, "epoch": 580} {"train_loss": -36.71818161010742, "global_step": 70287, "epoch": 580} {"train_loss": -37.06610107421875, "global_step": 70288, "epoch": 580} {"train_loss": -35.98529815673828, "global_step": 70289, "epoch": 580} {"train_loss": -37.140159606933594, "global_step": 70290, "epoch": 580} {"train_loss": -37.00590133666992, "global_step": 70291, "epoch": 580} {"train_loss": -36.06135940551758, "global_step": 70292, "epoch": 580} {"train_loss": -37.298091888427734, "global_step": 70293, "epoch": 580} {"train_loss": -37.09027099609375, "global_step": 70294, "epoch": 580} {"train_loss": -37.53535461425781, "global_step": 70295, "epoch": 580} {"train_loss": -37.14051055908203, "global_step": 70296, "epoch": 580} {"train_loss": -35.7115592956543, "global_step": 70297, "epoch": 580} {"train_loss": -37.46944046020508, "global_step": 70298, "epoch": 580} {"train_loss": -36.22674560546875, "global_step": 70299, "epoch": 580} {"train_loss": -36.32689773937887, "global_step": 70300, "epoch": 580, "val_loss": 2765660.75} {"train_loss": -35.51047897338867, "global_step": 70301, "epoch": 581} {"train_loss": -35.5796012878418, "global_step": 70302, "epoch": 581} {"train_loss": -36.40537643432617, "global_step": 70303, "epoch": 581} {"train_loss": -35.35325241088867, "global_step": 70304, "epoch": 581} {"train_loss": -35.55634689331055, "global_step": 70305, "epoch": 581} {"train_loss": -36.245731353759766, "global_step": 70306, "epoch": 581} {"train_loss": -36.61399459838867, "global_step": 70307, "epoch": 581} {"train_loss": -37.17566680908203, "global_step": 70308, "epoch": 581} {"train_loss": -37.08980178833008, "global_step": 70309, "epoch": 581} {"train_loss": -36.44489669799805, "global_step": 70310, "epoch": 581} {"train_loss": -35.902984619140625, "global_step": 70311, "epoch": 581} {"train_loss": -36.73090362548828, "global_step": 70312, "epoch": 581} {"train_loss": -37.115501403808594, "global_step": 70313, "epoch": 581} {"train_loss": -36.99091339111328, "global_step": 70314, "epoch": 581} {"train_loss": -36.887569427490234, "global_step": 70315, "epoch": 581} {"train_loss": -36.28862380981445, "global_step": 70316, "epoch": 581} {"train_loss": -32.80320358276367, "global_step": 70317, "epoch": 581} {"train_loss": -37.30955123901367, "global_step": 70318, "epoch": 581} {"train_loss": -36.81474685668945, "global_step": 70319, "epoch": 581} {"train_loss": -36.349239349365234, "global_step": 70320, "epoch": 581} {"train_loss": -35.97969436645508, "global_step": 70321, "epoch": 581} {"train_loss": -36.44976806640625, "global_step": 70322, "epoch": 581} {"train_loss": -34.75821304321289, "global_step": 70323, "epoch": 581} {"train_loss": -35.7067985534668, "global_step": 70324, "epoch": 581} {"train_loss": -35.637081146240234, "global_step": 70325, "epoch": 581} {"train_loss": -36.25407791137695, "global_step": 70326, "epoch": 581} {"train_loss": -36.096649169921875, "global_step": 70327, "epoch": 581} {"train_loss": -36.157867431640625, "global_step": 70328, "epoch": 581} {"train_loss": -35.542083740234375, "global_step": 70329, "epoch": 581} {"train_loss": -37.056304931640625, "global_step": 70330, "epoch": 581} {"train_loss": -34.58389663696289, "global_step": 70331, "epoch": 581} {"train_loss": -36.3989372253418, "global_step": 70332, "epoch": 581} {"train_loss": -35.12984848022461, "global_step": 70333, "epoch": 581} {"train_loss": -36.22190856933594, "global_step": 70334, "epoch": 581} {"train_loss": -36.1449089050293, "global_step": 70335, "epoch": 581} {"train_loss": -34.64249038696289, "global_step": 70336, "epoch": 581} {"train_loss": -36.56776809692383, "global_step": 70337, "epoch": 581} {"train_loss": -36.6219367980957, "global_step": 70338, "epoch": 581} {"train_loss": -36.7413215637207, "global_step": 70339, "epoch": 581} {"train_loss": -34.768455505371094, "global_step": 70340, "epoch": 581} {"train_loss": -35.122982025146484, "global_step": 70341, "epoch": 581} {"train_loss": -36.8687629699707, "global_step": 70342, "epoch": 581} {"train_loss": -36.26978302001953, "global_step": 70343, "epoch": 581} {"train_loss": -35.40777587890625, "global_step": 70344, "epoch": 581} {"train_loss": -35.55987548828125, "global_step": 70345, "epoch": 581} {"train_loss": -35.35802459716797, "global_step": 70346, "epoch": 581} {"train_loss": -34.995479583740234, "global_step": 70347, "epoch": 581} {"train_loss": -37.08404541015625, "global_step": 70348, "epoch": 581} {"train_loss": -36.86172103881836, "global_step": 70349, "epoch": 581} {"train_loss": -36.7057991027832, "global_step": 70350, "epoch": 581} {"train_loss": -35.722930908203125, "global_step": 70351, "epoch": 581} {"train_loss": -35.437965393066406, "global_step": 70352, "epoch": 581} {"train_loss": -36.57532501220703, "global_step": 70353, "epoch": 581} {"train_loss": -36.4564323425293, "global_step": 70354, "epoch": 581} {"train_loss": -35.50668716430664, "global_step": 70355, "epoch": 581} {"train_loss": -37.21540451049805, "global_step": 70356, "epoch": 581} {"train_loss": -36.60160446166992, "global_step": 70357, "epoch": 581} {"train_loss": -35.33516311645508, "global_step": 70358, "epoch": 581} {"train_loss": -36.26063919067383, "global_step": 70359, "epoch": 581} {"train_loss": -37.20490646362305, "global_step": 70360, "epoch": 581} {"train_loss": -36.350608825683594, "global_step": 70361, "epoch": 581} {"train_loss": -36.624237060546875, "global_step": 70362, "epoch": 581} {"train_loss": -36.28499221801758, "global_step": 70363, "epoch": 581} {"train_loss": -36.77344512939453, "global_step": 70364, "epoch": 581} {"train_loss": -36.99961471557617, "global_step": 70365, "epoch": 581} {"train_loss": -36.6119499206543, "global_step": 70366, "epoch": 581} {"train_loss": -36.93647003173828, "global_step": 70367, "epoch": 581} {"train_loss": -36.52692413330078, "global_step": 70368, "epoch": 581} {"train_loss": -36.552520751953125, "global_step": 70369, "epoch": 581} {"train_loss": -37.41277313232422, "global_step": 70370, "epoch": 581} {"train_loss": -36.911346435546875, "global_step": 70371, "epoch": 581} {"train_loss": -36.5243034362793, "global_step": 70372, "epoch": 581} {"train_loss": -36.97364044189453, "global_step": 70373, "epoch": 581} {"train_loss": -37.47366714477539, "global_step": 70374, "epoch": 581} {"train_loss": -36.66741180419922, "global_step": 70375, "epoch": 581} {"train_loss": -36.47903060913086, "global_step": 70376, "epoch": 581} {"train_loss": -36.118656158447266, "global_step": 70377, "epoch": 581} {"train_loss": -36.6121940612793, "global_step": 70378, "epoch": 581} {"train_loss": -37.10517501831055, "global_step": 70379, "epoch": 581} {"train_loss": -37.17267608642578, "global_step": 70380, "epoch": 581} {"train_loss": -37.03190231323242, "global_step": 70381, "epoch": 581} {"train_loss": -36.77677917480469, "global_step": 70382, "epoch": 581} {"train_loss": -37.18862533569336, "global_step": 70383, "epoch": 581} {"train_loss": -37.16843032836914, "global_step": 70384, "epoch": 581} {"train_loss": -35.73850631713867, "global_step": 70385, "epoch": 581} {"train_loss": -36.71952438354492, "global_step": 70386, "epoch": 581} {"train_loss": -35.37163543701172, "global_step": 70387, "epoch": 581} {"train_loss": -34.17689895629883, "global_step": 70388, "epoch": 581} {"train_loss": -33.70459747314453, "global_step": 70389, "epoch": 581} {"train_loss": -33.00800323486328, "global_step": 70390, "epoch": 581} {"train_loss": -34.71506881713867, "global_step": 70391, "epoch": 581} {"train_loss": -36.95857620239258, "global_step": 70392, "epoch": 581} {"train_loss": -28.9132022857666, "global_step": 70393, "epoch": 581} {"train_loss": -30.509977340698242, "global_step": 70394, "epoch": 581} {"train_loss": -31.925878524780273, "global_step": 70395, "epoch": 581} {"train_loss": -34.410072326660156, "global_step": 70396, "epoch": 581} {"train_loss": -33.249244689941406, "global_step": 70397, "epoch": 581} {"train_loss": -31.948965072631836, "global_step": 70398, "epoch": 581} {"train_loss": -34.19295120239258, "global_step": 70399, "epoch": 581} {"train_loss": -34.69944381713867, "global_step": 70400, "epoch": 581} {"train_loss": -34.253108978271484, "global_step": 70401, "epoch": 581} {"train_loss": -31.548063278198242, "global_step": 70402, "epoch": 581} {"train_loss": -35.113521575927734, "global_step": 70403, "epoch": 581} {"train_loss": -32.75458908081055, "global_step": 70404, "epoch": 581} {"train_loss": -34.1880989074707, "global_step": 70405, "epoch": 581} {"train_loss": -36.16508102416992, "global_step": 70406, "epoch": 581} {"train_loss": -34.4118766784668, "global_step": 70407, "epoch": 581} {"train_loss": -32.75860595703125, "global_step": 70408, "epoch": 581} {"train_loss": -34.49399185180664, "global_step": 70409, "epoch": 581} {"train_loss": -33.98884963989258, "global_step": 70410, "epoch": 581} {"train_loss": -35.023780822753906, "global_step": 70411, "epoch": 581} {"train_loss": -35.59671401977539, "global_step": 70412, "epoch": 581} {"train_loss": -35.43361282348633, "global_step": 70413, "epoch": 581} {"train_loss": -35.07134246826172, "global_step": 70414, "epoch": 581} {"train_loss": -35.06888961791992, "global_step": 70415, "epoch": 581} {"train_loss": -34.2357177734375, "global_step": 70416, "epoch": 581} {"train_loss": -35.032955169677734, "global_step": 70417, "epoch": 581} {"train_loss": -35.25216293334961, "global_step": 70418, "epoch": 581} {"train_loss": -35.75728988647461, "global_step": 70419, "epoch": 581} {"train_loss": -34.894840240478516, "global_step": 70420, "epoch": 581} {"train_loss": -35.66522420142308, "global_step": 70421, "epoch": 581, "val_loss": 2596983.75} {"train_loss": -35.18163299560547, "global_step": 70422, "epoch": 582} {"train_loss": -35.68157196044922, "global_step": 70423, "epoch": 582} {"train_loss": -35.167110443115234, "global_step": 70424, "epoch": 582} {"train_loss": -35.381072998046875, "global_step": 70425, "epoch": 582} {"train_loss": -35.48402786254883, "global_step": 70426, "epoch": 582} {"train_loss": -34.97911071777344, "global_step": 70427, "epoch": 582} {"train_loss": -36.3430290222168, "global_step": 70428, "epoch": 582} {"train_loss": -35.478511810302734, "global_step": 70429, "epoch": 582} {"train_loss": -35.58808135986328, "global_step": 70430, "epoch": 582} {"train_loss": -36.60367965698242, "global_step": 70431, "epoch": 582} {"train_loss": -35.41506576538086, "global_step": 70432, "epoch": 582} {"train_loss": -36.47149658203125, "global_step": 70433, "epoch": 582} {"train_loss": -35.93619918823242, "global_step": 70434, "epoch": 582} {"train_loss": -36.83510971069336, "global_step": 70435, "epoch": 582} {"train_loss": -36.6277961730957, "global_step": 70436, "epoch": 582} {"train_loss": -35.90841293334961, "global_step": 70437, "epoch": 582} {"train_loss": -37.04469299316406, "global_step": 70438, "epoch": 582} {"train_loss": -36.50014877319336, "global_step": 70439, "epoch": 582} {"train_loss": -36.489017486572266, "global_step": 70440, "epoch": 582} {"train_loss": -36.98570251464844, "global_step": 70441, "epoch": 582} {"train_loss": -36.5740966796875, "global_step": 70442, "epoch": 582} {"train_loss": -36.73905563354492, "global_step": 70443, "epoch": 582} {"train_loss": -36.02692794799805, "global_step": 70444, "epoch": 582} {"train_loss": -36.28999710083008, "global_step": 70445, "epoch": 582} {"train_loss": -36.35383224487305, "global_step": 70446, "epoch": 582} {"train_loss": -36.99526596069336, "global_step": 70447, "epoch": 582} {"train_loss": -36.323299407958984, "global_step": 70448, "epoch": 582} {"train_loss": -36.74897384643555, "global_step": 70449, "epoch": 582} {"train_loss": -36.99412155151367, "global_step": 70450, "epoch": 582} {"train_loss": -37.52669906616211, "global_step": 70451, "epoch": 582} {"train_loss": -36.54810333251953, "global_step": 70452, "epoch": 582} {"train_loss": -37.298316955566406, "global_step": 70453, "epoch": 582} {"train_loss": -37.382816314697266, "global_step": 70454, "epoch": 582} {"train_loss": -37.62543869018555, "global_step": 70455, "epoch": 582} {"train_loss": -37.33779525756836, "global_step": 70456, "epoch": 582} {"train_loss": -37.61487579345703, "global_step": 70457, "epoch": 582} {"train_loss": -37.24585723876953, "global_step": 70458, "epoch": 582} {"train_loss": -37.146949768066406, "global_step": 70459, "epoch": 582} {"train_loss": -37.245296478271484, "global_step": 70460, "epoch": 582} {"train_loss": -37.77350997924805, "global_step": 70461, "epoch": 582} {"train_loss": -37.64484786987305, "global_step": 70462, "epoch": 582} {"train_loss": -37.567138671875, "global_step": 70463, "epoch": 582} {"train_loss": -37.46676254272461, "global_step": 70464, "epoch": 582} {"train_loss": -37.743412017822266, "global_step": 70465, "epoch": 582} {"train_loss": -37.27177047729492, "global_step": 70466, "epoch": 582} {"train_loss": -37.66809844970703, "global_step": 70467, "epoch": 582} {"train_loss": -37.41128158569336, "global_step": 70468, "epoch": 582} {"train_loss": -38.259132385253906, "global_step": 70469, "epoch": 582} {"train_loss": -37.44312286376953, "global_step": 70470, "epoch": 582} {"train_loss": -37.56120681762695, "global_step": 70471, "epoch": 582} {"train_loss": -37.852149963378906, "global_step": 70472, "epoch": 582} {"train_loss": -38.18068313598633, "global_step": 70473, "epoch": 582} {"train_loss": -37.75006103515625, "global_step": 70474, "epoch": 582} {"train_loss": -37.49839401245117, "global_step": 70475, "epoch": 582} {"train_loss": -36.4631462097168, "global_step": 70476, "epoch": 582} {"train_loss": -34.732452392578125, "global_step": 70477, "epoch": 582} {"train_loss": -31.54623794555664, "global_step": 70478, "epoch": 582} {"train_loss": -25.415557861328125, "global_step": 70479, "epoch": 582} {"train_loss": -23.833723068237305, "global_step": 70480, "epoch": 582} {"train_loss": -27.80352210998535, "global_step": 70481, "epoch": 582} {"train_loss": -31.574451446533203, "global_step": 70482, "epoch": 582} {"train_loss": -34.40497970581055, "global_step": 70483, "epoch": 582} {"train_loss": -34.546905517578125, "global_step": 70484, "epoch": 582} {"train_loss": -35.4451904296875, "global_step": 70485, "epoch": 582} {"train_loss": -33.951019287109375, "global_step": 70486, "epoch": 582} {"train_loss": -34.593013763427734, "global_step": 70487, "epoch": 582} {"train_loss": -35.39238357543945, "global_step": 70488, "epoch": 582} {"train_loss": -35.4747314453125, "global_step": 70489, "epoch": 582} {"train_loss": -33.5953254699707, "global_step": 70490, "epoch": 582} {"train_loss": -35.43973922729492, "global_step": 70491, "epoch": 582} {"train_loss": -34.04973220825195, "global_step": 70492, "epoch": 582} {"train_loss": -35.847389221191406, "global_step": 70493, "epoch": 582} {"train_loss": -36.18597412109375, "global_step": 70494, "epoch": 582} {"train_loss": -35.08003234863281, "global_step": 70495, "epoch": 582} {"train_loss": -34.81069564819336, "global_step": 70496, "epoch": 582} {"train_loss": -35.79597473144531, "global_step": 70497, "epoch": 582} {"train_loss": -35.74127960205078, "global_step": 70498, "epoch": 582} {"train_loss": -33.03473663330078, "global_step": 70499, "epoch": 582} {"train_loss": -34.947479248046875, "global_step": 70500, "epoch": 582} {"train_loss": -36.00647735595703, "global_step": 70501, "epoch": 582} {"train_loss": -36.12250900268555, "global_step": 70502, "epoch": 582} {"train_loss": -33.67196273803711, "global_step": 70503, "epoch": 582} {"train_loss": -35.91769790649414, "global_step": 70504, "epoch": 582} {"train_loss": -36.220760345458984, "global_step": 70505, "epoch": 582} {"train_loss": -34.175498962402344, "global_step": 70506, "epoch": 582} {"train_loss": -35.60568618774414, "global_step": 70507, "epoch": 582} {"train_loss": -34.86252975463867, "global_step": 70508, "epoch": 582} {"train_loss": -34.734283447265625, "global_step": 70509, "epoch": 582} {"train_loss": -27.483728408813477, "global_step": 70510, "epoch": 582} {"train_loss": -34.65418243408203, "global_step": 70511, "epoch": 582} {"train_loss": -34.69347381591797, "global_step": 70512, "epoch": 582} {"train_loss": -32.560707092285156, "global_step": 70513, "epoch": 582} {"train_loss": -33.81616973876953, "global_step": 70514, "epoch": 582} {"train_loss": -34.61979293823242, "global_step": 70515, "epoch": 582} {"train_loss": -34.41309356689453, "global_step": 70516, "epoch": 582} {"train_loss": -34.32200241088867, "global_step": 70517, "epoch": 582} {"train_loss": -35.385311126708984, "global_step": 70518, "epoch": 582} {"train_loss": -34.41854476928711, "global_step": 70519, "epoch": 582} {"train_loss": -34.083282470703125, "global_step": 70520, "epoch": 582} {"train_loss": -35.04738998413086, "global_step": 70521, "epoch": 582} {"train_loss": -34.37578582763672, "global_step": 70522, "epoch": 582} {"train_loss": -32.631038665771484, "global_step": 70523, "epoch": 582} {"train_loss": -35.134883880615234, "global_step": 70524, "epoch": 582} {"train_loss": -32.93736267089844, "global_step": 70525, "epoch": 582} {"train_loss": -35.0096435546875, "global_step": 70526, "epoch": 582} {"train_loss": -35.74869918823242, "global_step": 70527, "epoch": 582} {"train_loss": -35.54902267456055, "global_step": 70528, "epoch": 582} {"train_loss": -35.54755783081055, "global_step": 70529, "epoch": 582} {"train_loss": -36.23536682128906, "global_step": 70530, "epoch": 582} {"train_loss": -35.28373718261719, "global_step": 70531, "epoch": 582} {"train_loss": -35.22092819213867, "global_step": 70532, "epoch": 582} {"train_loss": -35.332332611083984, "global_step": 70533, "epoch": 582} {"train_loss": -35.228702545166016, "global_step": 70534, "epoch": 582} {"train_loss": -35.719825744628906, "global_step": 70535, "epoch": 582} {"train_loss": -35.189849853515625, "global_step": 70536, "epoch": 582} {"train_loss": -36.14473342895508, "global_step": 70537, "epoch": 582} {"train_loss": -35.76620101928711, "global_step": 70538, "epoch": 582} {"train_loss": -35.87858963012695, "global_step": 70539, "epoch": 582} {"train_loss": -35.809974670410156, "global_step": 70540, "epoch": 582} {"train_loss": -35.47581100463867, "global_step": 70541, "epoch": 582} {"train_loss": -35.45399631153453, "global_step": 70542, "epoch": 582, "val_loss": 2722951.5} {"train_loss": -35.55990219116211, "global_step": 70543, "epoch": 583} {"train_loss": -36.33432388305664, "global_step": 70544, "epoch": 583} {"train_loss": -35.967350006103516, "global_step": 70545, "epoch": 583} {"train_loss": -36.25398635864258, "global_step": 70546, "epoch": 583} {"train_loss": -36.21034622192383, "global_step": 70547, "epoch": 583} {"train_loss": -36.46721267700195, "global_step": 70548, "epoch": 583} {"train_loss": -36.37044906616211, "global_step": 70549, "epoch": 583} {"train_loss": -36.751102447509766, "global_step": 70550, "epoch": 583} {"train_loss": -36.578857421875, "global_step": 70551, "epoch": 583} {"train_loss": -36.24309158325195, "global_step": 70552, "epoch": 583} {"train_loss": -36.513153076171875, "global_step": 70553, "epoch": 583} {"train_loss": -36.8527946472168, "global_step": 70554, "epoch": 583} {"train_loss": -36.55224609375, "global_step": 70555, "epoch": 583} {"train_loss": -36.39516830444336, "global_step": 70556, "epoch": 583} {"train_loss": -36.30768585205078, "global_step": 70557, "epoch": 583} {"train_loss": -36.80924606323242, "global_step": 70558, "epoch": 583} {"train_loss": -36.87052536010742, "global_step": 70559, "epoch": 583} {"train_loss": -36.9599723815918, "global_step": 70560, "epoch": 583} {"train_loss": -37.25751495361328, "global_step": 70561, "epoch": 583} {"train_loss": -36.1926383972168, "global_step": 70562, "epoch": 583} {"train_loss": -36.4869384765625, "global_step": 70563, "epoch": 583} {"train_loss": -36.19806671142578, "global_step": 70564, "epoch": 583} {"train_loss": -36.00216293334961, "global_step": 70565, "epoch": 583} {"train_loss": -36.659183502197266, "global_step": 70566, "epoch": 583} {"train_loss": -36.27573776245117, "global_step": 70567, "epoch": 583} {"train_loss": -35.83047103881836, "global_step": 70568, "epoch": 583} {"train_loss": -35.14751052856445, "global_step": 70569, "epoch": 583} {"train_loss": -37.10920333862305, "global_step": 70570, "epoch": 583} {"train_loss": -37.2001838684082, "global_step": 70571, "epoch": 583} {"train_loss": -36.96135711669922, "global_step": 70572, "epoch": 583} {"train_loss": -37.70675277709961, "global_step": 70573, "epoch": 583} {"train_loss": -37.0083122253418, "global_step": 70574, "epoch": 583} {"train_loss": -37.38235092163086, "global_step": 70575, "epoch": 583} {"train_loss": -37.17707824707031, "global_step": 70576, "epoch": 583} {"train_loss": -37.54710006713867, "global_step": 70577, "epoch": 583} {"train_loss": -37.1378288269043, "global_step": 70578, "epoch": 583} {"train_loss": -37.07475662231445, "global_step": 70579, "epoch": 583} {"train_loss": -36.833839416503906, "global_step": 70580, "epoch": 583} {"train_loss": -36.88471603393555, "global_step": 70581, "epoch": 583} {"train_loss": -36.90315628051758, "global_step": 70582, "epoch": 583} {"train_loss": -37.319732666015625, "global_step": 70583, "epoch": 583} {"train_loss": -37.366188049316406, "global_step": 70584, "epoch": 583} {"train_loss": -35.190608978271484, "global_step": 70585, "epoch": 583} {"train_loss": -35.33770751953125, "global_step": 70586, "epoch": 583} {"train_loss": -36.40451431274414, "global_step": 70587, "epoch": 583} {"train_loss": -37.05957794189453, "global_step": 70588, "epoch": 583} {"train_loss": -37.05827713012695, "global_step": 70589, "epoch": 583} {"train_loss": -37.683712005615234, "global_step": 70590, "epoch": 583} {"train_loss": -37.07990264892578, "global_step": 70591, "epoch": 583} {"train_loss": -36.66392135620117, "global_step": 70592, "epoch": 583} {"train_loss": -37.2514533996582, "global_step": 70593, "epoch": 583} {"train_loss": -37.23703384399414, "global_step": 70594, "epoch": 583} {"train_loss": -33.20734786987305, "global_step": 70595, "epoch": 583} {"train_loss": -37.613250732421875, "global_step": 70596, "epoch": 583} {"train_loss": -37.553951263427734, "global_step": 70597, "epoch": 583} {"train_loss": -36.05316162109375, "global_step": 70598, "epoch": 583} {"train_loss": -34.832359313964844, "global_step": 70599, "epoch": 583} {"train_loss": -36.40110397338867, "global_step": 70600, "epoch": 583} {"train_loss": -35.44242858886719, "global_step": 70601, "epoch": 583} {"train_loss": -36.03834915161133, "global_step": 70602, "epoch": 583} {"train_loss": -36.6573486328125, "global_step": 70603, "epoch": 583} {"train_loss": -36.84934616088867, "global_step": 70604, "epoch": 583} {"train_loss": -36.99365234375, "global_step": 70605, "epoch": 583} {"train_loss": -35.76851272583008, "global_step": 70606, "epoch": 583} {"train_loss": -36.23817825317383, "global_step": 70607, "epoch": 583} {"train_loss": -36.677040100097656, "global_step": 70608, "epoch": 583} {"train_loss": -37.07307815551758, "global_step": 70609, "epoch": 583} {"train_loss": -36.189449310302734, "global_step": 70610, "epoch": 583} {"train_loss": -33.870079040527344, "global_step": 70611, "epoch": 583} {"train_loss": -35.23054885864258, "global_step": 70612, "epoch": 583} {"train_loss": -35.5352668762207, "global_step": 70613, "epoch": 583} {"train_loss": -24.150007247924805, "global_step": 70614, "epoch": 583} {"train_loss": -33.599369049072266, "global_step": 70615, "epoch": 583} {"train_loss": -34.81952667236328, "global_step": 70616, "epoch": 583} {"train_loss": -22.446352005004883, "global_step": 70617, "epoch": 583} {"train_loss": -33.42830276489258, "global_step": 70618, "epoch": 583} {"train_loss": -34.23246765136719, "global_step": 70619, "epoch": 583} {"train_loss": -34.192596435546875, "global_step": 70620, "epoch": 583} {"train_loss": -29.975616455078125, "global_step": 70621, "epoch": 583} {"train_loss": -16.792606353759766, "global_step": 70622, "epoch": 583} {"train_loss": -33.21327590942383, "global_step": 70623, "epoch": 583} {"train_loss": -33.378116607666016, "global_step": 70624, "epoch": 583} {"train_loss": -33.264312744140625, "global_step": 70625, "epoch": 583} {"train_loss": -32.79325866699219, "global_step": 70626, "epoch": 583} {"train_loss": -30.181121826171875, "global_step": 70627, "epoch": 583} {"train_loss": -31.3251895904541, "global_step": 70628, "epoch": 583} {"train_loss": -32.904136657714844, "global_step": 70629, "epoch": 583} {"train_loss": -34.04448318481445, "global_step": 70630, "epoch": 583} {"train_loss": -33.14131164550781, "global_step": 70631, "epoch": 583} {"train_loss": -33.593868255615234, "global_step": 70632, "epoch": 583} {"train_loss": -33.90995407104492, "global_step": 70633, "epoch": 583} {"train_loss": -33.28409957885742, "global_step": 70634, "epoch": 583} {"train_loss": -33.85908126831055, "global_step": 70635, "epoch": 583} {"train_loss": -33.60275650024414, "global_step": 70636, "epoch": 583} {"train_loss": -34.72757339477539, "global_step": 70637, "epoch": 583} {"train_loss": -32.853851318359375, "global_step": 70638, "epoch": 583} {"train_loss": -34.51005554199219, "global_step": 70639, "epoch": 583} {"train_loss": -34.51577377319336, "global_step": 70640, "epoch": 583} {"train_loss": -33.78890609741211, "global_step": 70641, "epoch": 583} {"train_loss": -34.488948822021484, "global_step": 70642, "epoch": 583} {"train_loss": -35.34332275390625, "global_step": 70643, "epoch": 583} {"train_loss": -34.33302307128906, "global_step": 70644, "epoch": 583} {"train_loss": -34.31197738647461, "global_step": 70645, "epoch": 583} {"train_loss": -33.84684371948242, "global_step": 70646, "epoch": 583} {"train_loss": -35.04932403564453, "global_step": 70647, "epoch": 583} {"train_loss": -34.8245964050293, "global_step": 70648, "epoch": 583} {"train_loss": -34.961761474609375, "global_step": 70649, "epoch": 583} {"train_loss": -34.843013763427734, "global_step": 70650, "epoch": 583} {"train_loss": -35.77197265625, "global_step": 70651, "epoch": 583} {"train_loss": -35.13333511352539, "global_step": 70652, "epoch": 583} {"train_loss": -35.49958038330078, "global_step": 70653, "epoch": 583} {"train_loss": -35.018367767333984, "global_step": 70654, "epoch": 583} {"train_loss": -36.130706787109375, "global_step": 70655, "epoch": 583} {"train_loss": -35.40625762939453, "global_step": 70656, "epoch": 583} {"train_loss": -35.894466400146484, "global_step": 70657, "epoch": 583} {"train_loss": -35.98053741455078, "global_step": 70658, "epoch": 583} {"train_loss": -35.6676139831543, "global_step": 70659, "epoch": 583} {"train_loss": -36.08698654174805, "global_step": 70660, "epoch": 583} {"train_loss": -35.488800048828125, "global_step": 70661, "epoch": 583} {"train_loss": -35.57279586791992, "global_step": 70662, "epoch": 583} {"train_loss": -35.23096644188747, "global_step": 70663, "epoch": 583, "val_loss": 2711348.25} {"train_loss": -35.712249755859375, "global_step": 70664, "epoch": 584} {"train_loss": -36.2281379699707, "global_step": 70665, "epoch": 584} {"train_loss": -35.997039794921875, "global_step": 70666, "epoch": 584} {"train_loss": -36.517032623291016, "global_step": 70667, "epoch": 584} {"train_loss": -36.89163589477539, "global_step": 70668, "epoch": 584} {"train_loss": -36.27657699584961, "global_step": 70669, "epoch": 584} {"train_loss": -36.674312591552734, "global_step": 70670, "epoch": 584} {"train_loss": -36.57120895385742, "global_step": 70671, "epoch": 584} {"train_loss": -36.89377975463867, "global_step": 70672, "epoch": 584} {"train_loss": -36.40651321411133, "global_step": 70673, "epoch": 584} {"train_loss": -37.341556549072266, "global_step": 70674, "epoch": 584} {"train_loss": -36.989498138427734, "global_step": 70675, "epoch": 584} {"train_loss": -37.08420944213867, "global_step": 70676, "epoch": 584} {"train_loss": -36.515010833740234, "global_step": 70677, "epoch": 584} {"train_loss": -36.54575729370117, "global_step": 70678, "epoch": 584} {"train_loss": -36.653228759765625, "global_step": 70679, "epoch": 584} {"train_loss": -36.96987533569336, "global_step": 70680, "epoch": 584} {"train_loss": -37.35587692260742, "global_step": 70681, "epoch": 584} {"train_loss": -37.198097229003906, "global_step": 70682, "epoch": 584} {"train_loss": -37.46014404296875, "global_step": 70683, "epoch": 584} {"train_loss": -37.10952377319336, "global_step": 70684, "epoch": 584} {"train_loss": -37.46431350708008, "global_step": 70685, "epoch": 584} {"train_loss": -37.4349479675293, "global_step": 70686, "epoch": 584} {"train_loss": -37.52706527709961, "global_step": 70687, "epoch": 584} {"train_loss": -37.43465042114258, "global_step": 70688, "epoch": 584} {"train_loss": -37.502315521240234, "global_step": 70689, "epoch": 584} {"train_loss": -37.72771072387695, "global_step": 70690, "epoch": 584} {"train_loss": -37.476234436035156, "global_step": 70691, "epoch": 584} {"train_loss": -37.470970153808594, "global_step": 70692, "epoch": 584} {"train_loss": -37.59279251098633, "global_step": 70693, "epoch": 584} {"train_loss": -37.6877555847168, "global_step": 70694, "epoch": 584} {"train_loss": -37.718048095703125, "global_step": 70695, "epoch": 584} {"train_loss": -37.521114349365234, "global_step": 70696, "epoch": 584} {"train_loss": -37.657814025878906, "global_step": 70697, "epoch": 584} {"train_loss": -37.92512130737305, "global_step": 70698, "epoch": 584} {"train_loss": -37.825958251953125, "global_step": 70699, "epoch": 584} {"train_loss": -37.555294036865234, "global_step": 70700, "epoch": 584} {"train_loss": -37.88036346435547, "global_step": 70701, "epoch": 584} {"train_loss": -37.83148193359375, "global_step": 70702, "epoch": 584} {"train_loss": -37.824642181396484, "global_step": 70703, "epoch": 584} {"train_loss": -37.647857666015625, "global_step": 70704, "epoch": 584} {"train_loss": -37.507320404052734, "global_step": 70705, "epoch": 584} {"train_loss": -38.13482666015625, "global_step": 70706, "epoch": 584} {"train_loss": -37.673316955566406, "global_step": 70707, "epoch": 584} {"train_loss": -34.6596565246582, "global_step": 70708, "epoch": 584} {"train_loss": -33.94804763793945, "global_step": 70709, "epoch": 584} {"train_loss": -36.05207061767578, "global_step": 70710, "epoch": 584} {"train_loss": -35.065494537353516, "global_step": 70711, "epoch": 584} {"train_loss": -33.72929382324219, "global_step": 70712, "epoch": 584} {"train_loss": -36.880062103271484, "global_step": 70713, "epoch": 584} {"train_loss": -36.21220397949219, "global_step": 70714, "epoch": 584} {"train_loss": -35.55971145629883, "global_step": 70715, "epoch": 584} {"train_loss": -32.3942985534668, "global_step": 70716, "epoch": 584} {"train_loss": -33.42300033569336, "global_step": 70717, "epoch": 584} {"train_loss": -30.12900161743164, "global_step": 70718, "epoch": 584} {"train_loss": -30.699920654296875, "global_step": 70719, "epoch": 584} {"train_loss": -34.3392219543457, "global_step": 70720, "epoch": 584} {"train_loss": -32.96229934692383, "global_step": 70721, "epoch": 584} {"train_loss": -33.265663146972656, "global_step": 70722, "epoch": 584} {"train_loss": -29.8181209564209, "global_step": 70723, "epoch": 584} {"train_loss": -32.97050476074219, "global_step": 70724, "epoch": 584} {"train_loss": -28.4633846282959, "global_step": 70725, "epoch": 584} {"train_loss": -26.8769474029541, "global_step": 70726, "epoch": 584} {"train_loss": -26.193479537963867, "global_step": 70727, "epoch": 584} {"train_loss": -20.2011661529541, "global_step": 70728, "epoch": 584} {"train_loss": -23.406728744506836, "global_step": 70729, "epoch": 584} {"train_loss": -28.842376708984375, "global_step": 70730, "epoch": 584} {"train_loss": -25.13557243347168, "global_step": 70731, "epoch": 584} {"train_loss": -29.51413917541504, "global_step": 70732, "epoch": 584} {"train_loss": -27.598051071166992, "global_step": 70733, "epoch": 584} {"train_loss": -29.225830078125, "global_step": 70734, "epoch": 584} {"train_loss": -30.521142959594727, "global_step": 70735, "epoch": 584} {"train_loss": -29.047033309936523, "global_step": 70736, "epoch": 584} {"train_loss": -29.343427658081055, "global_step": 70737, "epoch": 584} {"train_loss": -30.119251251220703, "global_step": 70738, "epoch": 584} {"train_loss": -30.081649780273438, "global_step": 70739, "epoch": 584} {"train_loss": -29.74256706237793, "global_step": 70740, "epoch": 584} {"train_loss": -30.486364364624023, "global_step": 70741, "epoch": 584} {"train_loss": -31.40218162536621, "global_step": 70742, "epoch": 584} {"train_loss": -30.89387321472168, "global_step": 70743, "epoch": 584} {"train_loss": -31.0970458984375, "global_step": 70744, "epoch": 584} {"train_loss": -31.2972412109375, "global_step": 70745, "epoch": 584} {"train_loss": -31.965967178344727, "global_step": 70746, "epoch": 584} {"train_loss": -32.20286178588867, "global_step": 70747, "epoch": 584} {"train_loss": -32.20703887939453, "global_step": 70748, "epoch": 584} {"train_loss": -33.14602279663086, "global_step": 70749, "epoch": 584} {"train_loss": -32.84043884277344, "global_step": 70750, "epoch": 584} {"train_loss": -32.631065368652344, "global_step": 70751, "epoch": 584} {"train_loss": -32.12527084350586, "global_step": 70752, "epoch": 584} {"train_loss": -32.623695373535156, "global_step": 70753, "epoch": 584} {"train_loss": -33.93073272705078, "global_step": 70754, "epoch": 584} {"train_loss": -32.9564094543457, "global_step": 70755, "epoch": 584} {"train_loss": -32.96384811401367, "global_step": 70756, "epoch": 584} {"train_loss": -30.086105346679688, "global_step": 70757, "epoch": 584} {"train_loss": -26.568744659423828, "global_step": 70758, "epoch": 584} {"train_loss": -32.899085998535156, "global_step": 70759, "epoch": 584} {"train_loss": -29.810781478881836, "global_step": 70760, "epoch": 584} {"train_loss": -32.34943771362305, "global_step": 70761, "epoch": 584} {"train_loss": -31.491352081298828, "global_step": 70762, "epoch": 584} {"train_loss": -31.931354522705078, "global_step": 70763, "epoch": 584} {"train_loss": -31.935216903686523, "global_step": 70764, "epoch": 584} {"train_loss": -28.5080509185791, "global_step": 70765, "epoch": 584} {"train_loss": -27.7220458984375, "global_step": 70766, "epoch": 584} {"train_loss": -29.6196346282959, "global_step": 70767, "epoch": 584} {"train_loss": -31.201705932617188, "global_step": 70768, "epoch": 584} {"train_loss": -31.883529663085938, "global_step": 70769, "epoch": 584} {"train_loss": -30.797393798828125, "global_step": 70770, "epoch": 584} {"train_loss": -31.905502319335938, "global_step": 70771, "epoch": 584} {"train_loss": -27.80854606628418, "global_step": 70772, "epoch": 584} {"train_loss": -31.90665054321289, "global_step": 70773, "epoch": 584} {"train_loss": -32.338741302490234, "global_step": 70774, "epoch": 584} {"train_loss": -31.181421279907227, "global_step": 70775, "epoch": 584} {"train_loss": -33.28488540649414, "global_step": 70776, "epoch": 584} {"train_loss": -32.0930290222168, "global_step": 70777, "epoch": 584} {"train_loss": -33.400245666503906, "global_step": 70778, "epoch": 584} {"train_loss": -32.1971549987793, "global_step": 70779, "epoch": 584} {"train_loss": -33.57443618774414, "global_step": 70780, "epoch": 584} {"train_loss": -33.01048278808594, "global_step": 70781, "epoch": 584} {"train_loss": -33.78078842163086, "global_step": 70782, "epoch": 584} {"train_loss": -33.248077392578125, "global_step": 70783, "epoch": 584} {"train_loss": -33.457040282320385, "global_step": 70784, "epoch": 584, "val_loss": 2595916.25} {"train_loss": -33.685462951660156, "global_step": 70785, "epoch": 585} {"train_loss": -32.8629264831543, "global_step": 70786, "epoch": 585} {"train_loss": -32.768959045410156, "global_step": 70787, "epoch": 585} {"train_loss": -33.190032958984375, "global_step": 70788, "epoch": 585} {"train_loss": -34.07361602783203, "global_step": 70789, "epoch": 585} {"train_loss": -34.14463806152344, "global_step": 70790, "epoch": 585} {"train_loss": -34.34530258178711, "global_step": 70791, "epoch": 585} {"train_loss": -33.98237609863281, "global_step": 70792, "epoch": 585} {"train_loss": -34.19824981689453, "global_step": 70793, "epoch": 585} {"train_loss": -34.415443420410156, "global_step": 70794, "epoch": 585} {"train_loss": -34.64756393432617, "global_step": 70795, "epoch": 585} {"train_loss": -34.33781051635742, "global_step": 70796, "epoch": 585} {"train_loss": -34.487796783447266, "global_step": 70797, "epoch": 585} {"train_loss": -34.655853271484375, "global_step": 70798, "epoch": 585} {"train_loss": -34.73494338989258, "global_step": 70799, "epoch": 585} {"train_loss": -33.817501068115234, "global_step": 70800, "epoch": 585} {"train_loss": -35.13474655151367, "global_step": 70801, "epoch": 585} {"train_loss": -34.75063705444336, "global_step": 70802, "epoch": 585} {"train_loss": -35.36685562133789, "global_step": 70803, "epoch": 585} {"train_loss": -34.806480407714844, "global_step": 70804, "epoch": 585} {"train_loss": -35.2452392578125, "global_step": 70805, "epoch": 585} {"train_loss": -35.03261947631836, "global_step": 70806, "epoch": 585} {"train_loss": -35.3974609375, "global_step": 70807, "epoch": 585} {"train_loss": -34.885276794433594, "global_step": 70808, "epoch": 585} {"train_loss": -34.96776580810547, "global_step": 70809, "epoch": 585} {"train_loss": -35.19462203979492, "global_step": 70810, "epoch": 585} {"train_loss": -35.3736457824707, "global_step": 70811, "epoch": 585} {"train_loss": -35.490333557128906, "global_step": 70812, "epoch": 585} {"train_loss": -35.00411605834961, "global_step": 70813, "epoch": 585} {"train_loss": -35.61449432373047, "global_step": 70814, "epoch": 585} {"train_loss": -35.155357360839844, "global_step": 70815, "epoch": 585} {"train_loss": -34.988529205322266, "global_step": 70816, "epoch": 585} {"train_loss": -35.58789825439453, "global_step": 70817, "epoch": 585} {"train_loss": -35.46735763549805, "global_step": 70818, "epoch": 585} {"train_loss": -35.232418060302734, "global_step": 70819, "epoch": 585} {"train_loss": -34.965980529785156, "global_step": 70820, "epoch": 585} {"train_loss": -35.62893295288086, "global_step": 70821, "epoch": 585} {"train_loss": -34.681148529052734, "global_step": 70822, "epoch": 585} {"train_loss": -35.57278060913086, "global_step": 70823, "epoch": 585} {"train_loss": -36.07642364501953, "global_step": 70824, "epoch": 585} {"train_loss": -35.94074249267578, "global_step": 70825, "epoch": 585} {"train_loss": -35.85074996948242, "global_step": 70826, "epoch": 585} {"train_loss": -36.332576751708984, "global_step": 70827, "epoch": 585} {"train_loss": -35.81760787963867, "global_step": 70828, "epoch": 585} {"train_loss": -36.32378005981445, "global_step": 70829, "epoch": 585} {"train_loss": -35.477813720703125, "global_step": 70830, "epoch": 585} {"train_loss": -35.81423568725586, "global_step": 70831, "epoch": 585} {"train_loss": -34.85747146606445, "global_step": 70832, "epoch": 585} {"train_loss": -31.61994743347168, "global_step": 70833, "epoch": 585} {"train_loss": -20.711559295654297, "global_step": 70834, "epoch": 585} {"train_loss": -14.668556213378906, "global_step": 70835, "epoch": 585} {"train_loss": -24.891454696655273, "global_step": 70836, "epoch": 585} {"train_loss": -27.88545799255371, "global_step": 70837, "epoch": 585} {"train_loss": -28.549962997436523, "global_step": 70838, "epoch": 585} {"train_loss": -29.799335479736328, "global_step": 70839, "epoch": 585} {"train_loss": -30.3198299407959, "global_step": 70840, "epoch": 585} {"train_loss": -33.38944625854492, "global_step": 70841, "epoch": 585} {"train_loss": -29.165485382080078, "global_step": 70842, "epoch": 585} {"train_loss": -33.70478439331055, "global_step": 70843, "epoch": 585} {"train_loss": -33.23503875732422, "global_step": 70844, "epoch": 585} {"train_loss": -32.356014251708984, "global_step": 70845, "epoch": 585} {"train_loss": -34.31316375732422, "global_step": 70846, "epoch": 585} {"train_loss": -33.8878059387207, "global_step": 70847, "epoch": 585} {"train_loss": -33.6856575012207, "global_step": 70848, "epoch": 585} {"train_loss": -34.17466354370117, "global_step": 70849, "epoch": 585} {"train_loss": -34.783016204833984, "global_step": 70850, "epoch": 585} {"train_loss": -34.62860107421875, "global_step": 70851, "epoch": 585} {"train_loss": -34.86922836303711, "global_step": 70852, "epoch": 585} {"train_loss": -34.65497970581055, "global_step": 70853, "epoch": 585} {"train_loss": -34.12929916381836, "global_step": 70854, "epoch": 585} {"train_loss": -34.80354690551758, "global_step": 70855, "epoch": 585} {"train_loss": -34.9090461730957, "global_step": 70856, "epoch": 585} {"train_loss": -34.493221282958984, "global_step": 70857, "epoch": 585} {"train_loss": -35.08612060546875, "global_step": 70858, "epoch": 585} {"train_loss": -34.93264389038086, "global_step": 70859, "epoch": 585} {"train_loss": -35.150917053222656, "global_step": 70860, "epoch": 585} {"train_loss": -34.95021057128906, "global_step": 70861, "epoch": 585} {"train_loss": -35.0368766784668, "global_step": 70862, "epoch": 585} {"train_loss": -35.045082092285156, "global_step": 70863, "epoch": 585} {"train_loss": -35.32752227783203, "global_step": 70864, "epoch": 585} {"train_loss": -34.866275787353516, "global_step": 70865, "epoch": 585} {"train_loss": -35.0933952331543, "global_step": 70866, "epoch": 585} {"train_loss": -35.54729080200195, "global_step": 70867, "epoch": 585} {"train_loss": -35.381160736083984, "global_step": 70868, "epoch": 585} {"train_loss": -35.30007553100586, "global_step": 70869, "epoch": 585} {"train_loss": -35.49949264526367, "global_step": 70870, "epoch": 585} {"train_loss": -35.27984619140625, "global_step": 70871, "epoch": 585} {"train_loss": -35.47683334350586, "global_step": 70872, "epoch": 585} {"train_loss": -35.4633674621582, "global_step": 70873, "epoch": 585} {"train_loss": -35.58511734008789, "global_step": 70874, "epoch": 585} {"train_loss": -36.02569580078125, "global_step": 70875, "epoch": 585} {"train_loss": -35.420188903808594, "global_step": 70876, "epoch": 585} {"train_loss": -34.8155517578125, "global_step": 70877, "epoch": 585} {"train_loss": -35.6990966796875, "global_step": 70878, "epoch": 585} {"train_loss": -35.48783874511719, "global_step": 70879, "epoch": 585} {"train_loss": -36.19384765625, "global_step": 70880, "epoch": 585} {"train_loss": -35.8243522644043, "global_step": 70881, "epoch": 585} {"train_loss": -35.49443817138672, "global_step": 70882, "epoch": 585} {"train_loss": -33.50947189331055, "global_step": 70883, "epoch": 585} {"train_loss": -26.0581111907959, "global_step": 70884, "epoch": 585} {"train_loss": -14.972311973571777, "global_step": 70885, "epoch": 585} {"train_loss": -29.780261993408203, "global_step": 70886, "epoch": 585} {"train_loss": -30.118213653564453, "global_step": 70887, "epoch": 585} {"train_loss": -30.86419677734375, "global_step": 70888, "epoch": 585} {"train_loss": -29.986425399780273, "global_step": 70889, "epoch": 585} {"train_loss": -34.0764274597168, "global_step": 70890, "epoch": 585} {"train_loss": -28.946271896362305, "global_step": 70891, "epoch": 585} {"train_loss": -34.582637786865234, "global_step": 70892, "epoch": 585} {"train_loss": -32.42257308959961, "global_step": 70893, "epoch": 585} {"train_loss": -32.872562408447266, "global_step": 70894, "epoch": 585} {"train_loss": -34.60758590698242, "global_step": 70895, "epoch": 585} {"train_loss": -33.19411849975586, "global_step": 70896, "epoch": 585} {"train_loss": -33.041259765625, "global_step": 70897, "epoch": 585} {"train_loss": -34.7457275390625, "global_step": 70898, "epoch": 585} {"train_loss": -34.2758903503418, "global_step": 70899, "epoch": 585} {"train_loss": -33.727867126464844, "global_step": 70900, "epoch": 585} {"train_loss": -34.17652130126953, "global_step": 70901, "epoch": 585} {"train_loss": -34.546058654785156, "global_step": 70902, "epoch": 585} {"train_loss": -34.3917236328125, "global_step": 70903, "epoch": 585} {"train_loss": -33.982452392578125, "global_step": 70904, "epoch": 585} {"train_loss": -33.695746516393235, "global_step": 70905, "epoch": 585, "val_loss": 2546268.0} {"train_loss": -34.72944259643555, "global_step": 70906, "epoch": 586} {"train_loss": -34.89033889770508, "global_step": 70907, "epoch": 586} {"train_loss": -34.29592514038086, "global_step": 70908, "epoch": 586} {"train_loss": -34.73212814331055, "global_step": 70909, "epoch": 586} {"train_loss": -34.91038131713867, "global_step": 70910, "epoch": 586} {"train_loss": -34.12655258178711, "global_step": 70911, "epoch": 586} {"train_loss": -34.9496955871582, "global_step": 70912, "epoch": 586} {"train_loss": -34.81108856201172, "global_step": 70913, "epoch": 586} {"train_loss": -34.85830307006836, "global_step": 70914, "epoch": 586} {"train_loss": -34.73033905029297, "global_step": 70915, "epoch": 586} {"train_loss": -35.43402862548828, "global_step": 70916, "epoch": 586} {"train_loss": -35.10529327392578, "global_step": 70917, "epoch": 586} {"train_loss": -34.413429260253906, "global_step": 70918, "epoch": 586} {"train_loss": -34.67965316772461, "global_step": 70919, "epoch": 586} {"train_loss": -35.58240509033203, "global_step": 70920, "epoch": 586} {"train_loss": -35.59210205078125, "global_step": 70921, "epoch": 586} {"train_loss": -35.01155471801758, "global_step": 70922, "epoch": 586} {"train_loss": -35.78401565551758, "global_step": 70923, "epoch": 586} {"train_loss": -35.681678771972656, "global_step": 70924, "epoch": 586} {"train_loss": -35.071041107177734, "global_step": 70925, "epoch": 586} {"train_loss": -35.49158477783203, "global_step": 70926, "epoch": 586} {"train_loss": -36.12015151977539, "global_step": 70927, "epoch": 586} {"train_loss": -35.744625091552734, "global_step": 70928, "epoch": 586} {"train_loss": -35.4376106262207, "global_step": 70929, "epoch": 586} {"train_loss": -34.06641387939453, "global_step": 70930, "epoch": 586} {"train_loss": -36.02756881713867, "global_step": 70931, "epoch": 586} {"train_loss": -35.6272087097168, "global_step": 70932, "epoch": 586} {"train_loss": -35.64068603515625, "global_step": 70933, "epoch": 586} {"train_loss": -36.172645568847656, "global_step": 70934, "epoch": 586} {"train_loss": -35.604732513427734, "global_step": 70935, "epoch": 586} {"train_loss": -35.014991760253906, "global_step": 70936, "epoch": 586} {"train_loss": -35.9566650390625, "global_step": 70937, "epoch": 586} {"train_loss": -35.91920471191406, "global_step": 70938, "epoch": 586} {"train_loss": -35.031593322753906, "global_step": 70939, "epoch": 586} {"train_loss": -36.227657318115234, "global_step": 70940, "epoch": 586} {"train_loss": -35.99745559692383, "global_step": 70941, "epoch": 586} {"train_loss": -35.744239807128906, "global_step": 70942, "epoch": 586} {"train_loss": -35.60564041137695, "global_step": 70943, "epoch": 586} {"train_loss": -36.31332015991211, "global_step": 70944, "epoch": 586} {"train_loss": -35.83535385131836, "global_step": 70945, "epoch": 586} {"train_loss": -35.48994827270508, "global_step": 70946, "epoch": 586} {"train_loss": -36.20151138305664, "global_step": 70947, "epoch": 586} {"train_loss": -35.4093017578125, "global_step": 70948, "epoch": 586} {"train_loss": -36.02225875854492, "global_step": 70949, "epoch": 586} {"train_loss": -35.899044036865234, "global_step": 70950, "epoch": 586} {"train_loss": -35.56638717651367, "global_step": 70951, "epoch": 586} {"train_loss": -35.538204193115234, "global_step": 70952, "epoch": 586} {"train_loss": -34.2071418762207, "global_step": 70953, "epoch": 586} {"train_loss": -31.78572654724121, "global_step": 70954, "epoch": 586} {"train_loss": -29.159961700439453, "global_step": 70955, "epoch": 586} {"train_loss": -27.01862907409668, "global_step": 70956, "epoch": 586} {"train_loss": -32.13072204589844, "global_step": 70957, "epoch": 586} {"train_loss": -33.11299133300781, "global_step": 70958, "epoch": 586} {"train_loss": -30.089263916015625, "global_step": 70959, "epoch": 586} {"train_loss": -34.876644134521484, "global_step": 70960, "epoch": 586} {"train_loss": -32.545745849609375, "global_step": 70961, "epoch": 586} {"train_loss": -35.328468322753906, "global_step": 70962, "epoch": 586} {"train_loss": -33.912410736083984, "global_step": 70963, "epoch": 586} {"train_loss": -35.90481948852539, "global_step": 70964, "epoch": 586} {"train_loss": -35.09013366699219, "global_step": 70965, "epoch": 586} {"train_loss": -35.43563461303711, "global_step": 70966, "epoch": 586} {"train_loss": -35.66743087768555, "global_step": 70967, "epoch": 586} {"train_loss": -35.50868606567383, "global_step": 70968, "epoch": 586} {"train_loss": -34.81210708618164, "global_step": 70969, "epoch": 586} {"train_loss": -35.950653076171875, "global_step": 70970, "epoch": 586} {"train_loss": -35.061195373535156, "global_step": 70971, "epoch": 586} {"train_loss": -35.568477630615234, "global_step": 70972, "epoch": 586} {"train_loss": -35.82685089111328, "global_step": 70973, "epoch": 586} {"train_loss": -35.80253219604492, "global_step": 70974, "epoch": 586} {"train_loss": -35.188201904296875, "global_step": 70975, "epoch": 586} {"train_loss": -36.04569625854492, "global_step": 70976, "epoch": 586} {"train_loss": -36.222877502441406, "global_step": 70977, "epoch": 586} {"train_loss": -35.543006896972656, "global_step": 70978, "epoch": 586} {"train_loss": -35.38888168334961, "global_step": 70979, "epoch": 586} {"train_loss": -36.159358978271484, "global_step": 70980, "epoch": 586} {"train_loss": -35.633174896240234, "global_step": 70981, "epoch": 586} {"train_loss": -35.381797790527344, "global_step": 70982, "epoch": 586} {"train_loss": -36.06867218017578, "global_step": 70983, "epoch": 586} {"train_loss": -35.7138671875, "global_step": 70984, "epoch": 586} {"train_loss": -35.79887008666992, "global_step": 70985, "epoch": 586} {"train_loss": -35.57551956176758, "global_step": 70986, "epoch": 586} {"train_loss": -35.63020706176758, "global_step": 70987, "epoch": 586} {"train_loss": -35.765838623046875, "global_step": 70988, "epoch": 586} {"train_loss": -36.197017669677734, "global_step": 70989, "epoch": 586} {"train_loss": -36.17791748046875, "global_step": 70990, "epoch": 586} {"train_loss": -36.56318664550781, "global_step": 70991, "epoch": 586} {"train_loss": -36.35687255859375, "global_step": 70992, "epoch": 586} {"train_loss": -36.684410095214844, "global_step": 70993, "epoch": 586} {"train_loss": -35.79998779296875, "global_step": 70994, "epoch": 586} {"train_loss": -35.6307487487793, "global_step": 70995, "epoch": 586} {"train_loss": -33.426937103271484, "global_step": 70996, "epoch": 586} {"train_loss": -27.04819107055664, "global_step": 70997, "epoch": 586} {"train_loss": -25.031631469726562, "global_step": 70998, "epoch": 586} {"train_loss": -34.00224685668945, "global_step": 70999, "epoch": 586} {"train_loss": -30.13136100769043, "global_step": 71000, "epoch": 586} {"train_loss": -30.99298667907715, "global_step": 71001, "epoch": 586} {"train_loss": -32.77933120727539, "global_step": 71002, "epoch": 586} {"train_loss": -33.5460205078125, "global_step": 71003, "epoch": 586} {"train_loss": -32.21805953979492, "global_step": 71004, "epoch": 586} {"train_loss": -34.806087493896484, "global_step": 71005, "epoch": 586} {"train_loss": -34.215248107910156, "global_step": 71006, "epoch": 586} {"train_loss": -33.5307731628418, "global_step": 71007, "epoch": 586} {"train_loss": -33.98733139038086, "global_step": 71008, "epoch": 586} {"train_loss": -34.63386917114258, "global_step": 71009, "epoch": 586} {"train_loss": -34.38308334350586, "global_step": 71010, "epoch": 586} {"train_loss": -33.87405014038086, "global_step": 71011, "epoch": 586} {"train_loss": -34.835418701171875, "global_step": 71012, "epoch": 586} {"train_loss": -33.145294189453125, "global_step": 71013, "epoch": 586} {"train_loss": -34.98293685913086, "global_step": 71014, "epoch": 586} {"train_loss": -35.07143783569336, "global_step": 71015, "epoch": 586} {"train_loss": -33.60416793823242, "global_step": 71016, "epoch": 586} {"train_loss": -34.916160583496094, "global_step": 71017, "epoch": 586} {"train_loss": -35.241844177246094, "global_step": 71018, "epoch": 586} {"train_loss": -35.40045928955078, "global_step": 71019, "epoch": 586} {"train_loss": -35.04153060913086, "global_step": 71020, "epoch": 586} {"train_loss": -35.759239196777344, "global_step": 71021, "epoch": 586} {"train_loss": -35.054134368896484, "global_step": 71022, "epoch": 586} {"train_loss": -35.67778396606445, "global_step": 71023, "epoch": 586} {"train_loss": -35.2177734375, "global_step": 71024, "epoch": 586} {"train_loss": -35.5913200378418, "global_step": 71025, "epoch": 586} {"train_loss": -34.754370350483036, "global_step": 71026, "epoch": 586, "val_loss": 2565376.75} {"train_loss": -36.06437301635742, "global_step": 71027, "epoch": 587} {"train_loss": -35.69652557373047, "global_step": 71028, "epoch": 587} {"train_loss": -35.986385345458984, "global_step": 71029, "epoch": 587} {"train_loss": -36.151912689208984, "global_step": 71030, "epoch": 587} {"train_loss": -36.2567253112793, "global_step": 71031, "epoch": 587} {"train_loss": -35.7360954284668, "global_step": 71032, "epoch": 587} {"train_loss": -36.23945236206055, "global_step": 71033, "epoch": 587} {"train_loss": -36.10175323486328, "global_step": 71034, "epoch": 587} {"train_loss": -36.252662658691406, "global_step": 71035, "epoch": 587} {"train_loss": -35.501060485839844, "global_step": 71036, "epoch": 587} {"train_loss": -36.13758087158203, "global_step": 71037, "epoch": 587} {"train_loss": -36.405845642089844, "global_step": 71038, "epoch": 587} {"train_loss": -36.668983459472656, "global_step": 71039, "epoch": 587} {"train_loss": -36.18284606933594, "global_step": 71040, "epoch": 587} {"train_loss": -36.220645904541016, "global_step": 71041, "epoch": 587} {"train_loss": -36.44952392578125, "global_step": 71042, "epoch": 587} {"train_loss": -36.72099685668945, "global_step": 71043, "epoch": 587} {"train_loss": -36.6677360534668, "global_step": 71044, "epoch": 587} {"train_loss": -36.61123275756836, "global_step": 71045, "epoch": 587} {"train_loss": -36.55656051635742, "global_step": 71046, "epoch": 587} {"train_loss": -36.48045349121094, "global_step": 71047, "epoch": 587} {"train_loss": -37.00873565673828, "global_step": 71048, "epoch": 587} {"train_loss": -36.60783004760742, "global_step": 71049, "epoch": 587} {"train_loss": -35.17792892456055, "global_step": 71050, "epoch": 587} {"train_loss": -31.9228458404541, "global_step": 71051, "epoch": 587} {"train_loss": -31.424428939819336, "global_step": 71052, "epoch": 587} {"train_loss": -30.76063346862793, "global_step": 71053, "epoch": 587} {"train_loss": -28.00054359436035, "global_step": 71054, "epoch": 587} {"train_loss": -29.33954429626465, "global_step": 71055, "epoch": 587} {"train_loss": -35.94021224975586, "global_step": 71056, "epoch": 587} {"train_loss": -33.65412139892578, "global_step": 71057, "epoch": 587} {"train_loss": -34.09234619140625, "global_step": 71058, "epoch": 587} {"train_loss": -36.002288818359375, "global_step": 71059, "epoch": 587} {"train_loss": -33.63943099975586, "global_step": 71060, "epoch": 587} {"train_loss": -36.49593734741211, "global_step": 71061, "epoch": 587} {"train_loss": -34.769203186035156, "global_step": 71062, "epoch": 587} {"train_loss": -36.02180480957031, "global_step": 71063, "epoch": 587} {"train_loss": -35.66205978393555, "global_step": 71064, "epoch": 587} {"train_loss": -36.782142639160156, "global_step": 71065, "epoch": 587} {"train_loss": -35.908302307128906, "global_step": 71066, "epoch": 587} {"train_loss": -36.31678771972656, "global_step": 71067, "epoch": 587} {"train_loss": -36.46752166748047, "global_step": 71068, "epoch": 587} {"train_loss": -36.44411087036133, "global_step": 71069, "epoch": 587} {"train_loss": -36.688472747802734, "global_step": 71070, "epoch": 587} {"train_loss": -36.097286224365234, "global_step": 71071, "epoch": 587} {"train_loss": -36.948272705078125, "global_step": 71072, "epoch": 587} {"train_loss": -36.27924728393555, "global_step": 71073, "epoch": 587} {"train_loss": -36.84287643432617, "global_step": 71074, "epoch": 587} {"train_loss": -36.7843132019043, "global_step": 71075, "epoch": 587} {"train_loss": -36.53939437866211, "global_step": 71076, "epoch": 587} {"train_loss": -36.7956657409668, "global_step": 71077, "epoch": 587} {"train_loss": -36.39506912231445, "global_step": 71078, "epoch": 587} {"train_loss": -37.16984558105469, "global_step": 71079, "epoch": 587} {"train_loss": -37.04609298706055, "global_step": 71080, "epoch": 587} {"train_loss": -36.86802291870117, "global_step": 71081, "epoch": 587} {"train_loss": -36.64460754394531, "global_step": 71082, "epoch": 587} {"train_loss": -36.600074768066406, "global_step": 71083, "epoch": 587} {"train_loss": -36.45720291137695, "global_step": 71084, "epoch": 587} {"train_loss": -36.638641357421875, "global_step": 71085, "epoch": 587} {"train_loss": -36.484439849853516, "global_step": 71086, "epoch": 587} {"train_loss": -36.81867218017578, "global_step": 71087, "epoch": 587} {"train_loss": -36.73381423950195, "global_step": 71088, "epoch": 587} {"train_loss": -36.426883697509766, "global_step": 71089, "epoch": 587} {"train_loss": -35.9936637878418, "global_step": 71090, "epoch": 587} {"train_loss": -36.48330307006836, "global_step": 71091, "epoch": 587} {"train_loss": -36.45541763305664, "global_step": 71092, "epoch": 587} {"train_loss": -37.102813720703125, "global_step": 71093, "epoch": 587} {"train_loss": -36.22638702392578, "global_step": 71094, "epoch": 587} {"train_loss": -33.72682571411133, "global_step": 71095, "epoch": 587} {"train_loss": -28.21259117126465, "global_step": 71096, "epoch": 587} {"train_loss": -22.09077262878418, "global_step": 71097, "epoch": 587} {"train_loss": -24.361572265625, "global_step": 71098, "epoch": 587} {"train_loss": -35.34101486206055, "global_step": 71099, "epoch": 587} {"train_loss": -30.194717407226562, "global_step": 71100, "epoch": 587} {"train_loss": -32.35334014892578, "global_step": 71101, "epoch": 587} {"train_loss": -34.4113883972168, "global_step": 71102, "epoch": 587} {"train_loss": -34.02839660644531, "global_step": 71103, "epoch": 587} {"train_loss": -33.67144012451172, "global_step": 71104, "epoch": 587} {"train_loss": -35.04846954345703, "global_step": 71105, "epoch": 587} {"train_loss": -34.31342315673828, "global_step": 71106, "epoch": 587} {"train_loss": -36.75026321411133, "global_step": 71107, "epoch": 587} {"train_loss": -35.53348922729492, "global_step": 71108, "epoch": 587} {"train_loss": -34.89881134033203, "global_step": 71109, "epoch": 587} {"train_loss": -36.12848663330078, "global_step": 71110, "epoch": 587} {"train_loss": -35.382728576660156, "global_step": 71111, "epoch": 587} {"train_loss": -35.04583740234375, "global_step": 71112, "epoch": 587} {"train_loss": -36.66604995727539, "global_step": 71113, "epoch": 587} {"train_loss": -36.18095016479492, "global_step": 71114, "epoch": 587} {"train_loss": -35.706520080566406, "global_step": 71115, "epoch": 587} {"train_loss": -36.53847885131836, "global_step": 71116, "epoch": 587} {"train_loss": -36.658782958984375, "global_step": 71117, "epoch": 587} {"train_loss": -36.453941345214844, "global_step": 71118, "epoch": 587} {"train_loss": -36.38334274291992, "global_step": 71119, "epoch": 587} {"train_loss": -36.37044906616211, "global_step": 71120, "epoch": 587} {"train_loss": -36.586483001708984, "global_step": 71121, "epoch": 587} {"train_loss": -36.60957717895508, "global_step": 71122, "epoch": 587} {"train_loss": -36.13574981689453, "global_step": 71123, "epoch": 587} {"train_loss": -37.0384521484375, "global_step": 71124, "epoch": 587} {"train_loss": -36.501670837402344, "global_step": 71125, "epoch": 587} {"train_loss": -36.286190032958984, "global_step": 71126, "epoch": 587} {"train_loss": -36.6834602355957, "global_step": 71127, "epoch": 587} {"train_loss": -37.00334548950195, "global_step": 71128, "epoch": 587} {"train_loss": -37.155879974365234, "global_step": 71129, "epoch": 587} {"train_loss": -36.60007095336914, "global_step": 71130, "epoch": 587} {"train_loss": -36.93317794799805, "global_step": 71131, "epoch": 587} {"train_loss": -36.673160552978516, "global_step": 71132, "epoch": 587} {"train_loss": -36.9692497253418, "global_step": 71133, "epoch": 587} {"train_loss": -36.7116584777832, "global_step": 71134, "epoch": 587} {"train_loss": -37.085018157958984, "global_step": 71135, "epoch": 587} {"train_loss": -36.72956848144531, "global_step": 71136, "epoch": 587} {"train_loss": -36.724647521972656, "global_step": 71137, "epoch": 587} {"train_loss": -36.34658432006836, "global_step": 71138, "epoch": 587} {"train_loss": -37.16034698486328, "global_step": 71139, "epoch": 587} {"train_loss": -36.646827697753906, "global_step": 71140, "epoch": 587} {"train_loss": -37.07529830932617, "global_step": 71141, "epoch": 587} {"train_loss": -36.735328674316406, "global_step": 71142, "epoch": 587} {"train_loss": -37.06363296508789, "global_step": 71143, "epoch": 587} {"train_loss": -36.908782958984375, "global_step": 71144, "epoch": 587} {"train_loss": -37.001617431640625, "global_step": 71145, "epoch": 587} {"train_loss": -36.47886276245117, "global_step": 71146, "epoch": 587} {"train_loss": -35.6132210818204, "global_step": 71147, "epoch": 587, "val_loss": 2504234.0} {"train_loss": -35.423885345458984, "global_step": 71148, "epoch": 588} {"train_loss": -33.71553421020508, "global_step": 71149, "epoch": 588} {"train_loss": -25.775129318237305, "global_step": 71150, "epoch": 588} {"train_loss": -25.036672592163086, "global_step": 71151, "epoch": 588} {"train_loss": -36.015777587890625, "global_step": 71152, "epoch": 588} {"train_loss": -30.822336196899414, "global_step": 71153, "epoch": 588} {"train_loss": -29.729719161987305, "global_step": 71154, "epoch": 588} {"train_loss": -33.82064437866211, "global_step": 71155, "epoch": 588} {"train_loss": -33.63714599609375, "global_step": 71156, "epoch": 588} {"train_loss": -34.037654876708984, "global_step": 71157, "epoch": 588} {"train_loss": -34.63227462768555, "global_step": 71158, "epoch": 588} {"train_loss": -32.83966064453125, "global_step": 71159, "epoch": 588} {"train_loss": -34.714385986328125, "global_step": 71160, "epoch": 588} {"train_loss": -34.97150421142578, "global_step": 71161, "epoch": 588} {"train_loss": -32.76625442504883, "global_step": 71162, "epoch": 588} {"train_loss": -36.01146697998047, "global_step": 71163, "epoch": 588} {"train_loss": -32.93391418457031, "global_step": 71164, "epoch": 588} {"train_loss": -35.184810638427734, "global_step": 71165, "epoch": 588} {"train_loss": -35.593997955322266, "global_step": 71166, "epoch": 588} {"train_loss": -35.11393737792969, "global_step": 71167, "epoch": 588} {"train_loss": -35.11994171142578, "global_step": 71168, "epoch": 588} {"train_loss": -35.699562072753906, "global_step": 71169, "epoch": 588} {"train_loss": -34.57406234741211, "global_step": 71170, "epoch": 588} {"train_loss": -36.2701301574707, "global_step": 71171, "epoch": 588} {"train_loss": -34.327484130859375, "global_step": 71172, "epoch": 588} {"train_loss": -36.439422607421875, "global_step": 71173, "epoch": 588} {"train_loss": -36.07230758666992, "global_step": 71174, "epoch": 588} {"train_loss": -35.459983825683594, "global_step": 71175, "epoch": 588} {"train_loss": -35.656429290771484, "global_step": 71176, "epoch": 588} {"train_loss": -35.88922882080078, "global_step": 71177, "epoch": 588} {"train_loss": -35.63955307006836, "global_step": 71178, "epoch": 588} {"train_loss": -35.960018157958984, "global_step": 71179, "epoch": 588} {"train_loss": -36.12453842163086, "global_step": 71180, "epoch": 588} {"train_loss": -36.23857498168945, "global_step": 71181, "epoch": 588} {"train_loss": -36.605140686035156, "global_step": 71182, "epoch": 588} {"train_loss": -35.86062240600586, "global_step": 71183, "epoch": 588} {"train_loss": -36.77122116088867, "global_step": 71184, "epoch": 588} {"train_loss": -36.7719841003418, "global_step": 71185, "epoch": 588} {"train_loss": -36.42910385131836, "global_step": 71186, "epoch": 588} {"train_loss": -36.44404220581055, "global_step": 71187, "epoch": 588} {"train_loss": -35.95844650268555, "global_step": 71188, "epoch": 588} {"train_loss": -36.37723922729492, "global_step": 71189, "epoch": 588} {"train_loss": -36.4817008972168, "global_step": 71190, "epoch": 588} {"train_loss": -36.2972412109375, "global_step": 71191, "epoch": 588} {"train_loss": -36.542537689208984, "global_step": 71192, "epoch": 588} {"train_loss": -36.1262321472168, "global_step": 71193, "epoch": 588} {"train_loss": -36.51595687866211, "global_step": 71194, "epoch": 588} {"train_loss": -36.22536087036133, "global_step": 71195, "epoch": 588} {"train_loss": -36.18986892700195, "global_step": 71196, "epoch": 588} {"train_loss": -36.64743423461914, "global_step": 71197, "epoch": 588} {"train_loss": -35.86407470703125, "global_step": 71198, "epoch": 588} {"train_loss": -36.51191329956055, "global_step": 71199, "epoch": 588} {"train_loss": -37.253780364990234, "global_step": 71200, "epoch": 588} {"train_loss": -36.8489875793457, "global_step": 71201, "epoch": 588} {"train_loss": -36.565956115722656, "global_step": 71202, "epoch": 588} {"train_loss": -35.41849899291992, "global_step": 71203, "epoch": 588} {"train_loss": -34.726463317871094, "global_step": 71204, "epoch": 588} {"train_loss": -35.996368408203125, "global_step": 71205, "epoch": 588} {"train_loss": -36.9351921081543, "global_step": 71206, "epoch": 588} {"train_loss": -36.64480972290039, "global_step": 71207, "epoch": 588} {"train_loss": -36.78612518310547, "global_step": 71208, "epoch": 588} {"train_loss": -36.0876350402832, "global_step": 71209, "epoch": 588} {"train_loss": -32.150333404541016, "global_step": 71210, "epoch": 588} {"train_loss": -23.36224937438965, "global_step": 71211, "epoch": 588} {"train_loss": -14.45511531829834, "global_step": 71212, "epoch": 588} {"train_loss": -26.30487632751465, "global_step": 71213, "epoch": 588} {"train_loss": -32.6593132019043, "global_step": 71214, "epoch": 588} {"train_loss": -31.822772979736328, "global_step": 71215, "epoch": 588} {"train_loss": -34.197357177734375, "global_step": 71216, "epoch": 588} {"train_loss": -33.34259033203125, "global_step": 71217, "epoch": 588} {"train_loss": -31.64554214477539, "global_step": 71218, "epoch": 588} {"train_loss": -34.28773880004883, "global_step": 71219, "epoch": 588} {"train_loss": -35.1099967956543, "global_step": 71220, "epoch": 588} {"train_loss": -34.28866195678711, "global_step": 71221, "epoch": 588} {"train_loss": -35.047332763671875, "global_step": 71222, "epoch": 588} {"train_loss": -35.623783111572266, "global_step": 71223, "epoch": 588} {"train_loss": -34.961517333984375, "global_step": 71224, "epoch": 588} {"train_loss": -33.62128448486328, "global_step": 71225, "epoch": 588} {"train_loss": -35.87458038330078, "global_step": 71226, "epoch": 588} {"train_loss": -34.96148681640625, "global_step": 71227, "epoch": 588} {"train_loss": -35.17203903198242, "global_step": 71228, "epoch": 588} {"train_loss": -35.50056076049805, "global_step": 71229, "epoch": 588} {"train_loss": -36.015899658203125, "global_step": 71230, "epoch": 588} {"train_loss": -35.65363311767578, "global_step": 71231, "epoch": 588} {"train_loss": -35.73237991333008, "global_step": 71232, "epoch": 588} {"train_loss": -35.98386764526367, "global_step": 71233, "epoch": 588} {"train_loss": -35.99811553955078, "global_step": 71234, "epoch": 588} {"train_loss": -36.39039993286133, "global_step": 71235, "epoch": 588} {"train_loss": -35.96711349487305, "global_step": 71236, "epoch": 588} {"train_loss": -36.389156341552734, "global_step": 71237, "epoch": 588} {"train_loss": -35.68308639526367, "global_step": 71238, "epoch": 588} {"train_loss": -35.4499626159668, "global_step": 71239, "epoch": 588} {"train_loss": -36.1885871887207, "global_step": 71240, "epoch": 588} {"train_loss": -36.466861724853516, "global_step": 71241, "epoch": 588} {"train_loss": -35.40133285522461, "global_step": 71242, "epoch": 588} {"train_loss": -36.16585159301758, "global_step": 71243, "epoch": 588} {"train_loss": -36.19178771972656, "global_step": 71244, "epoch": 588} {"train_loss": -36.388816833496094, "global_step": 71245, "epoch": 588} {"train_loss": -36.478939056396484, "global_step": 71246, "epoch": 588} {"train_loss": -35.0712890625, "global_step": 71247, "epoch": 588} {"train_loss": -36.295772552490234, "global_step": 71248, "epoch": 588} {"train_loss": -35.982669830322266, "global_step": 71249, "epoch": 588} {"train_loss": -35.91813278198242, "global_step": 71250, "epoch": 588} {"train_loss": -36.416412353515625, "global_step": 71251, "epoch": 588} {"train_loss": -36.47688674926758, "global_step": 71252, "epoch": 588} {"train_loss": -36.39297103881836, "global_step": 71253, "epoch": 588} {"train_loss": -36.62021255493164, "global_step": 71254, "epoch": 588} {"train_loss": -36.82493209838867, "global_step": 71255, "epoch": 588} {"train_loss": -36.85139465332031, "global_step": 71256, "epoch": 588} {"train_loss": -35.66209411621094, "global_step": 71257, "epoch": 588} {"train_loss": -36.09511947631836, "global_step": 71258, "epoch": 588} {"train_loss": -35.849422454833984, "global_step": 71259, "epoch": 588} {"train_loss": -37.041988372802734, "global_step": 71260, "epoch": 588} {"train_loss": -36.48102569580078, "global_step": 71261, "epoch": 588} {"train_loss": -34.61921310424805, "global_step": 71262, "epoch": 588} {"train_loss": -34.304840087890625, "global_step": 71263, "epoch": 588} {"train_loss": -35.615543365478516, "global_step": 71264, "epoch": 588} {"train_loss": -37.054927825927734, "global_step": 71265, "epoch": 588} {"train_loss": -36.61310577392578, "global_step": 71266, "epoch": 588} {"train_loss": -35.254425048828125, "global_step": 71267, "epoch": 588} {"train_loss": -34.96295556155118, "global_step": 71268, "epoch": 588, "val_loss": 2522504.75} {"train_loss": -36.818660736083984, "global_step": 71269, "epoch": 589} {"train_loss": -36.385292053222656, "global_step": 71270, "epoch": 589} {"train_loss": -35.7603874206543, "global_step": 71271, "epoch": 589} {"train_loss": -36.77239990234375, "global_step": 71272, "epoch": 589} {"train_loss": -36.967891693115234, "global_step": 71273, "epoch": 589} {"train_loss": -35.751522064208984, "global_step": 71274, "epoch": 589} {"train_loss": -36.638343811035156, "global_step": 71275, "epoch": 589} {"train_loss": -36.76005935668945, "global_step": 71276, "epoch": 589} {"train_loss": -36.81950759887695, "global_step": 71277, "epoch": 589} {"train_loss": -35.06462097167969, "global_step": 71278, "epoch": 589} {"train_loss": -37.18027877807617, "global_step": 71279, "epoch": 589} {"train_loss": -37.40945816040039, "global_step": 71280, "epoch": 589} {"train_loss": -36.79010009765625, "global_step": 71281, "epoch": 589} {"train_loss": -37.1497688293457, "global_step": 71282, "epoch": 589} {"train_loss": -35.760597229003906, "global_step": 71283, "epoch": 589} {"train_loss": -37.330299377441406, "global_step": 71284, "epoch": 589} {"train_loss": -37.38694763183594, "global_step": 71285, "epoch": 589} {"train_loss": -36.924007415771484, "global_step": 71286, "epoch": 589} {"train_loss": -37.06800079345703, "global_step": 71287, "epoch": 589} {"train_loss": -36.88139343261719, "global_step": 71288, "epoch": 589} {"train_loss": -36.70388412475586, "global_step": 71289, "epoch": 589} {"train_loss": -37.43282699584961, "global_step": 71290, "epoch": 589} {"train_loss": -37.018829345703125, "global_step": 71291, "epoch": 589} {"train_loss": -36.770259857177734, "global_step": 71292, "epoch": 589} {"train_loss": -36.79011917114258, "global_step": 71293, "epoch": 589} {"train_loss": -36.7944221496582, "global_step": 71294, "epoch": 589} {"train_loss": -37.71666717529297, "global_step": 71295, "epoch": 589} {"train_loss": -36.947628021240234, "global_step": 71296, "epoch": 589} {"train_loss": -37.254058837890625, "global_step": 71297, "epoch": 589} {"train_loss": -37.18518829345703, "global_step": 71298, "epoch": 589} {"train_loss": -36.610443115234375, "global_step": 71299, "epoch": 589} {"train_loss": -37.178497314453125, "global_step": 71300, "epoch": 589} {"train_loss": -36.52955627441406, "global_step": 71301, "epoch": 589} {"train_loss": -36.196170806884766, "global_step": 71302, "epoch": 589} {"train_loss": -35.698570251464844, "global_step": 71303, "epoch": 589} {"train_loss": -37.107643127441406, "global_step": 71304, "epoch": 589} {"train_loss": -36.115943908691406, "global_step": 71305, "epoch": 589} {"train_loss": -37.22404479980469, "global_step": 71306, "epoch": 589} {"train_loss": -36.6235466003418, "global_step": 71307, "epoch": 589} {"train_loss": -35.45862579345703, "global_step": 71308, "epoch": 589} {"train_loss": -36.88849639892578, "global_step": 71309, "epoch": 589} {"train_loss": -36.44084167480469, "global_step": 71310, "epoch": 589} {"train_loss": -37.04249954223633, "global_step": 71311, "epoch": 589} {"train_loss": -35.205352783203125, "global_step": 71312, "epoch": 589} {"train_loss": -36.982234954833984, "global_step": 71313, "epoch": 589} {"train_loss": -36.181365966796875, "global_step": 71314, "epoch": 589} {"train_loss": -36.36042022705078, "global_step": 71315, "epoch": 589} {"train_loss": -35.91407775878906, "global_step": 71316, "epoch": 589} {"train_loss": -36.234676361083984, "global_step": 71317, "epoch": 589} {"train_loss": -35.93124008178711, "global_step": 71318, "epoch": 589} {"train_loss": -36.5164680480957, "global_step": 71319, "epoch": 589} {"train_loss": -36.13440704345703, "global_step": 71320, "epoch": 589} {"train_loss": -35.98516845703125, "global_step": 71321, "epoch": 589} {"train_loss": -32.0865592956543, "global_step": 71322, "epoch": 589} {"train_loss": -33.82832717895508, "global_step": 71323, "epoch": 589} {"train_loss": -34.217620849609375, "global_step": 71324, "epoch": 589} {"train_loss": -34.388526916503906, "global_step": 71325, "epoch": 589} {"train_loss": -35.193084716796875, "global_step": 71326, "epoch": 589} {"train_loss": -26.615009307861328, "global_step": 71327, "epoch": 589} {"train_loss": -34.86653518676758, "global_step": 71328, "epoch": 589} {"train_loss": -33.65555953979492, "global_step": 71329, "epoch": 589} {"train_loss": -32.46182632446289, "global_step": 71330, "epoch": 589} {"train_loss": -26.932226181030273, "global_step": 71331, "epoch": 589} {"train_loss": -30.122785568237305, "global_step": 71332, "epoch": 589} {"train_loss": -28.573505401611328, "global_step": 71333, "epoch": 589} {"train_loss": -26.036771774291992, "global_step": 71334, "epoch": 589} {"train_loss": -30.95875358581543, "global_step": 71335, "epoch": 589} {"train_loss": -31.738065719604492, "global_step": 71336, "epoch": 589} {"train_loss": -29.931203842163086, "global_step": 71337, "epoch": 589} {"train_loss": -31.438955307006836, "global_step": 71338, "epoch": 589} {"train_loss": -29.809370040893555, "global_step": 71339, "epoch": 589} {"train_loss": -31.162282943725586, "global_step": 71340, "epoch": 589} {"train_loss": -33.29622268676758, "global_step": 71341, "epoch": 589} {"train_loss": -34.14803695678711, "global_step": 71342, "epoch": 589} {"train_loss": -33.54066848754883, "global_step": 71343, "epoch": 589} {"train_loss": -32.05572509765625, "global_step": 71344, "epoch": 589} {"train_loss": -32.4495964050293, "global_step": 71345, "epoch": 589} {"train_loss": -31.70536231994629, "global_step": 71346, "epoch": 589} {"train_loss": -31.6052188873291, "global_step": 71347, "epoch": 589} {"train_loss": -32.53109359741211, "global_step": 71348, "epoch": 589} {"train_loss": -34.64896011352539, "global_step": 71349, "epoch": 589} {"train_loss": -32.85500717163086, "global_step": 71350, "epoch": 589} {"train_loss": -34.39469528198242, "global_step": 71351, "epoch": 589} {"train_loss": -33.43927764892578, "global_step": 71352, "epoch": 589} {"train_loss": -33.371307373046875, "global_step": 71353, "epoch": 589} {"train_loss": -32.708316802978516, "global_step": 71354, "epoch": 589} {"train_loss": -34.788551330566406, "global_step": 71355, "epoch": 589} {"train_loss": -33.43123245239258, "global_step": 71356, "epoch": 589} {"train_loss": -34.52212142944336, "global_step": 71357, "epoch": 589} {"train_loss": -34.45098114013672, "global_step": 71358, "epoch": 589} {"train_loss": -34.96928024291992, "global_step": 71359, "epoch": 589} {"train_loss": -33.914833068847656, "global_step": 71360, "epoch": 589} {"train_loss": -34.62832260131836, "global_step": 71361, "epoch": 589} {"train_loss": -34.241859436035156, "global_step": 71362, "epoch": 589} {"train_loss": -34.593910217285156, "global_step": 71363, "epoch": 589} {"train_loss": -34.778751373291016, "global_step": 71364, "epoch": 589} {"train_loss": -34.85896682739258, "global_step": 71365, "epoch": 589} {"train_loss": -34.755680084228516, "global_step": 71366, "epoch": 589} {"train_loss": -35.142940521240234, "global_step": 71367, "epoch": 589} {"train_loss": -35.319740295410156, "global_step": 71368, "epoch": 589} {"train_loss": -34.911495208740234, "global_step": 71369, "epoch": 589} {"train_loss": -34.9836311340332, "global_step": 71370, "epoch": 589} {"train_loss": -33.913917541503906, "global_step": 71371, "epoch": 589} {"train_loss": -33.9735221862793, "global_step": 71372, "epoch": 589} {"train_loss": -34.467342376708984, "global_step": 71373, "epoch": 589} {"train_loss": -34.84672927856445, "global_step": 71374, "epoch": 589} {"train_loss": -35.40963363647461, "global_step": 71375, "epoch": 589} {"train_loss": -34.658382415771484, "global_step": 71376, "epoch": 589} {"train_loss": -35.22829055786133, "global_step": 71377, "epoch": 589} {"train_loss": -35.60714340209961, "global_step": 71378, "epoch": 589} {"train_loss": -35.08454132080078, "global_step": 71379, "epoch": 589} {"train_loss": -34.778438568115234, "global_step": 71380, "epoch": 589} {"train_loss": -35.81636428833008, "global_step": 71381, "epoch": 589} {"train_loss": -35.91410446166992, "global_step": 71382, "epoch": 589} {"train_loss": -36.00478744506836, "global_step": 71383, "epoch": 589} {"train_loss": -35.390350341796875, "global_step": 71384, "epoch": 589} {"train_loss": -35.361236572265625, "global_step": 71385, "epoch": 589} {"train_loss": -36.318355560302734, "global_step": 71386, "epoch": 589} {"train_loss": -36.13248825073242, "global_step": 71387, "epoch": 589} {"train_loss": -36.18635177612305, "global_step": 71388, "epoch": 589} {"train_loss": -34.90278762628224, "global_step": 71389, "epoch": 589, "val_loss": 2516586.25} {"train_loss": -36.467403411865234, "global_step": 71390, "epoch": 590} {"train_loss": -35.54293441772461, "global_step": 71391, "epoch": 590} {"train_loss": -36.11697006225586, "global_step": 71392, "epoch": 590} {"train_loss": -35.65079879760742, "global_step": 71393, "epoch": 590} {"train_loss": -35.999874114990234, "global_step": 71394, "epoch": 590} {"train_loss": -36.276458740234375, "global_step": 71395, "epoch": 590} {"train_loss": -36.175350189208984, "global_step": 71396, "epoch": 590} {"train_loss": -36.872833251953125, "global_step": 71397, "epoch": 590} {"train_loss": -36.51649475097656, "global_step": 71398, "epoch": 590} {"train_loss": -36.19912338256836, "global_step": 71399, "epoch": 590} {"train_loss": -35.738948822021484, "global_step": 71400, "epoch": 590} {"train_loss": -34.83740997314453, "global_step": 71401, "epoch": 590} {"train_loss": -32.85091781616211, "global_step": 71402, "epoch": 590} {"train_loss": -32.15053939819336, "global_step": 71403, "epoch": 590} {"train_loss": -30.390104293823242, "global_step": 71404, "epoch": 590} {"train_loss": -26.79950523376465, "global_step": 71405, "epoch": 590} {"train_loss": -28.167882919311523, "global_step": 71406, "epoch": 590} {"train_loss": -35.002037048339844, "global_step": 71407, "epoch": 590} {"train_loss": -35.647701263427734, "global_step": 71408, "epoch": 590} {"train_loss": -34.67945861816406, "global_step": 71409, "epoch": 590} {"train_loss": -35.781673431396484, "global_step": 71410, "epoch": 590} {"train_loss": -33.691551208496094, "global_step": 71411, "epoch": 590} {"train_loss": -36.356788635253906, "global_step": 71412, "epoch": 590} {"train_loss": -34.49564743041992, "global_step": 71413, "epoch": 590} {"train_loss": -36.42672348022461, "global_step": 71414, "epoch": 590} {"train_loss": -35.6929817199707, "global_step": 71415, "epoch": 590} {"train_loss": -36.266090393066406, "global_step": 71416, "epoch": 590} {"train_loss": -36.11719512939453, "global_step": 71417, "epoch": 590} {"train_loss": -36.547523498535156, "global_step": 71418, "epoch": 590} {"train_loss": -36.09229278564453, "global_step": 71419, "epoch": 590} {"train_loss": -35.1824836730957, "global_step": 71420, "epoch": 590} {"train_loss": -36.40280532836914, "global_step": 71421, "epoch": 590} {"train_loss": -35.8126220703125, "global_step": 71422, "epoch": 590} {"train_loss": -35.867774963378906, "global_step": 71423, "epoch": 590} {"train_loss": -36.383975982666016, "global_step": 71424, "epoch": 590} {"train_loss": -36.73455047607422, "global_step": 71425, "epoch": 590} {"train_loss": -36.208106994628906, "global_step": 71426, "epoch": 590} {"train_loss": -36.89044189453125, "global_step": 71427, "epoch": 590} {"train_loss": -36.89351272583008, "global_step": 71428, "epoch": 590} {"train_loss": -36.678741455078125, "global_step": 71429, "epoch": 590} {"train_loss": -36.7044563293457, "global_step": 71430, "epoch": 590} {"train_loss": -36.478515625, "global_step": 71431, "epoch": 590} {"train_loss": -36.60771179199219, "global_step": 71432, "epoch": 590} {"train_loss": -36.264801025390625, "global_step": 71433, "epoch": 590} {"train_loss": -35.449581146240234, "global_step": 71434, "epoch": 590} {"train_loss": -33.050010681152344, "global_step": 71435, "epoch": 590} {"train_loss": -28.613067626953125, "global_step": 71436, "epoch": 590} {"train_loss": -30.638538360595703, "global_step": 71437, "epoch": 590} {"train_loss": -34.899749755859375, "global_step": 71438, "epoch": 590} {"train_loss": -33.8101692199707, "global_step": 71439, "epoch": 590} {"train_loss": -32.954925537109375, "global_step": 71440, "epoch": 590} {"train_loss": -34.45223617553711, "global_step": 71441, "epoch": 590} {"train_loss": -33.349483489990234, "global_step": 71442, "epoch": 590} {"train_loss": -28.714801788330078, "global_step": 71443, "epoch": 590} {"train_loss": -24.803430557250977, "global_step": 71444, "epoch": 590} {"train_loss": -12.466879844665527, "global_step": 71445, "epoch": 590} {"train_loss": -24.542856216430664, "global_step": 71446, "epoch": 590} {"train_loss": -28.107755661010742, "global_step": 71447, "epoch": 590} {"train_loss": -17.445741653442383, "global_step": 71448, "epoch": 590} {"train_loss": -34.05677032470703, "global_step": 71449, "epoch": 590} {"train_loss": -25.1533260345459, "global_step": 71450, "epoch": 590} {"train_loss": -31.680896759033203, "global_step": 71451, "epoch": 590} {"train_loss": -30.80775260925293, "global_step": 71452, "epoch": 590} {"train_loss": -32.1078987121582, "global_step": 71453, "epoch": 590} {"train_loss": -34.32305908203125, "global_step": 71454, "epoch": 590} {"train_loss": -34.15277862548828, "global_step": 71455, "epoch": 590} {"train_loss": -33.03129196166992, "global_step": 71456, "epoch": 590} {"train_loss": -34.055728912353516, "global_step": 71457, "epoch": 590} {"train_loss": -35.0545768737793, "global_step": 71458, "epoch": 590} {"train_loss": -34.159908294677734, "global_step": 71459, "epoch": 590} {"train_loss": -33.739105224609375, "global_step": 71460, "epoch": 590} {"train_loss": -34.952266693115234, "global_step": 71461, "epoch": 590} {"train_loss": -35.11915969848633, "global_step": 71462, "epoch": 590} {"train_loss": -34.86492919921875, "global_step": 71463, "epoch": 590} {"train_loss": -34.526241302490234, "global_step": 71464, "epoch": 590} {"train_loss": -34.965885162353516, "global_step": 71465, "epoch": 590} {"train_loss": -35.116302490234375, "global_step": 71466, "epoch": 590} {"train_loss": -35.23775863647461, "global_step": 71467, "epoch": 590} {"train_loss": -35.29877471923828, "global_step": 71468, "epoch": 590} {"train_loss": -35.32501983642578, "global_step": 71469, "epoch": 590} {"train_loss": -35.24758529663086, "global_step": 71470, "epoch": 590} {"train_loss": -35.84868240356445, "global_step": 71471, "epoch": 590} {"train_loss": -35.440914154052734, "global_step": 71472, "epoch": 590} {"train_loss": -36.14161682128906, "global_step": 71473, "epoch": 590} {"train_loss": -35.82538604736328, "global_step": 71474, "epoch": 590} {"train_loss": -35.51675796508789, "global_step": 71475, "epoch": 590} {"train_loss": -35.98186111450195, "global_step": 71476, "epoch": 590} {"train_loss": -36.39072799682617, "global_step": 71477, "epoch": 590} {"train_loss": -36.0328483581543, "global_step": 71478, "epoch": 590} {"train_loss": -36.429969787597656, "global_step": 71479, "epoch": 590} {"train_loss": -36.24445724487305, "global_step": 71480, "epoch": 590} {"train_loss": -36.28585433959961, "global_step": 71481, "epoch": 590} {"train_loss": -36.32473373413086, "global_step": 71482, "epoch": 590} {"train_loss": -36.238487243652344, "global_step": 71483, "epoch": 590} {"train_loss": -36.33121871948242, "global_step": 71484, "epoch": 590} {"train_loss": -36.0776481628418, "global_step": 71485, "epoch": 590} {"train_loss": -36.25320053100586, "global_step": 71486, "epoch": 590} {"train_loss": -36.2603645324707, "global_step": 71487, "epoch": 590} {"train_loss": -36.75181198120117, "global_step": 71488, "epoch": 590} {"train_loss": -36.584381103515625, "global_step": 71489, "epoch": 590} {"train_loss": -36.10719299316406, "global_step": 71490, "epoch": 590} {"train_loss": -36.22443771362305, "global_step": 71491, "epoch": 590} {"train_loss": -36.45061111450195, "global_step": 71492, "epoch": 590} {"train_loss": -36.31856155395508, "global_step": 71493, "epoch": 590} {"train_loss": -35.2550163269043, "global_step": 71494, "epoch": 590} {"train_loss": -36.94664764404297, "global_step": 71495, "epoch": 590} {"train_loss": -36.59328079223633, "global_step": 71496, "epoch": 590} {"train_loss": -36.61962127685547, "global_step": 71497, "epoch": 590} {"train_loss": -36.36652755737305, "global_step": 71498, "epoch": 590} {"train_loss": -36.78513717651367, "global_step": 71499, "epoch": 590} {"train_loss": -36.582881927490234, "global_step": 71500, "epoch": 590} {"train_loss": -36.80314636230469, "global_step": 71501, "epoch": 590} {"train_loss": -36.6633415222168, "global_step": 71502, "epoch": 590} {"train_loss": -37.228633880615234, "global_step": 71503, "epoch": 590} {"train_loss": -35.8116455078125, "global_step": 71504, "epoch": 590} {"train_loss": -37.04977035522461, "global_step": 71505, "epoch": 590} {"train_loss": -37.22477340698242, "global_step": 71506, "epoch": 590} {"train_loss": -37.04079818725586, "global_step": 71507, "epoch": 590} {"train_loss": -36.987648010253906, "global_step": 71508, "epoch": 590} {"train_loss": -37.21427917480469, "global_step": 71509, "epoch": 590} {"train_loss": -34.59879035792075, "global_step": 71510, "epoch": 590, "val_loss": 2487966.0} {"train_loss": -37.66518783569336, "global_step": 71511, "epoch": 591} {"train_loss": -37.09333801269531, "global_step": 71512, "epoch": 591} {"train_loss": -37.2346076965332, "global_step": 71513, "epoch": 591} {"train_loss": -37.12565231323242, "global_step": 71514, "epoch": 591} {"train_loss": -36.751556396484375, "global_step": 71515, "epoch": 591} {"train_loss": -37.34775924682617, "global_step": 71516, "epoch": 591} {"train_loss": -36.41836929321289, "global_step": 71517, "epoch": 591} {"train_loss": -37.49834060668945, "global_step": 71518, "epoch": 591} {"train_loss": -37.37535858154297, "global_step": 71519, "epoch": 591} {"train_loss": -37.684295654296875, "global_step": 71520, "epoch": 591} {"train_loss": -36.762969970703125, "global_step": 71521, "epoch": 591} {"train_loss": -37.4415283203125, "global_step": 71522, "epoch": 591} {"train_loss": -37.341583251953125, "global_step": 71523, "epoch": 591} {"train_loss": -37.708641052246094, "global_step": 71524, "epoch": 591} {"train_loss": -36.36885070800781, "global_step": 71525, "epoch": 591} {"train_loss": -37.26937484741211, "global_step": 71526, "epoch": 591} {"train_loss": -37.21363067626953, "global_step": 71527, "epoch": 591} {"train_loss": -37.36482620239258, "global_step": 71528, "epoch": 591} {"train_loss": -37.59688949584961, "global_step": 71529, "epoch": 591} {"train_loss": -37.310585021972656, "global_step": 71530, "epoch": 591} {"train_loss": -37.40999984741211, "global_step": 71531, "epoch": 591} {"train_loss": -36.82256317138672, "global_step": 71532, "epoch": 591} {"train_loss": -37.53823471069336, "global_step": 71533, "epoch": 591} {"train_loss": -36.073238372802734, "global_step": 71534, "epoch": 591} {"train_loss": -37.658809661865234, "global_step": 71535, "epoch": 591} {"train_loss": -37.18941879272461, "global_step": 71536, "epoch": 591} {"train_loss": -36.01528549194336, "global_step": 71537, "epoch": 591} {"train_loss": -36.61279296875, "global_step": 71538, "epoch": 591} {"train_loss": -35.524566650390625, "global_step": 71539, "epoch": 591} {"train_loss": -36.91279983520508, "global_step": 71540, "epoch": 591} {"train_loss": -36.8488883972168, "global_step": 71541, "epoch": 591} {"train_loss": -33.49637985229492, "global_step": 71542, "epoch": 591} {"train_loss": -30.827285766601562, "global_step": 71543, "epoch": 591} {"train_loss": -34.12421417236328, "global_step": 71544, "epoch": 591} {"train_loss": -32.6209716796875, "global_step": 71545, "epoch": 591} {"train_loss": -35.4276237487793, "global_step": 71546, "epoch": 591} {"train_loss": -35.072654724121094, "global_step": 71547, "epoch": 591} {"train_loss": -31.6144962310791, "global_step": 71548, "epoch": 591} {"train_loss": -33.18967819213867, "global_step": 71549, "epoch": 591} {"train_loss": -34.0811767578125, "global_step": 71550, "epoch": 591} {"train_loss": -29.314451217651367, "global_step": 71551, "epoch": 591} {"train_loss": -25.936233520507812, "global_step": 71552, "epoch": 591} {"train_loss": -33.301509857177734, "global_step": 71553, "epoch": 591} {"train_loss": -30.0369930267334, "global_step": 71554, "epoch": 591} {"train_loss": -30.61372184753418, "global_step": 71555, "epoch": 591} {"train_loss": -32.95520782470703, "global_step": 71556, "epoch": 591} {"train_loss": -34.310909271240234, "global_step": 71557, "epoch": 591} {"train_loss": -31.78464698791504, "global_step": 71558, "epoch": 591} {"train_loss": -34.16866683959961, "global_step": 71559, "epoch": 591} {"train_loss": -31.978178024291992, "global_step": 71560, "epoch": 591} {"train_loss": -33.14957809448242, "global_step": 71561, "epoch": 591} {"train_loss": -33.05158615112305, "global_step": 71562, "epoch": 591} {"train_loss": -34.180416107177734, "global_step": 71563, "epoch": 591} {"train_loss": -34.4125862121582, "global_step": 71564, "epoch": 591} {"train_loss": -33.972816467285156, "global_step": 71565, "epoch": 591} {"train_loss": -34.75370407104492, "global_step": 71566, "epoch": 591} {"train_loss": -33.56610870361328, "global_step": 71567, "epoch": 591} {"train_loss": -33.5777473449707, "global_step": 71568, "epoch": 591} {"train_loss": -35.196529388427734, "global_step": 71569, "epoch": 591} {"train_loss": -34.6277961730957, "global_step": 71570, "epoch": 591} {"train_loss": -32.78499984741211, "global_step": 71571, "epoch": 591} {"train_loss": -32.0323371887207, "global_step": 71572, "epoch": 591} {"train_loss": -34.263954162597656, "global_step": 71573, "epoch": 591} {"train_loss": -34.963645935058594, "global_step": 71574, "epoch": 591} {"train_loss": -34.80855941772461, "global_step": 71575, "epoch": 591} {"train_loss": -33.504150390625, "global_step": 71576, "epoch": 591} {"train_loss": -34.3339958190918, "global_step": 71577, "epoch": 591} {"train_loss": -34.4039306640625, "global_step": 71578, "epoch": 591} {"train_loss": -34.921173095703125, "global_step": 71579, "epoch": 591} {"train_loss": -35.24068832397461, "global_step": 71580, "epoch": 591} {"train_loss": -33.95917510986328, "global_step": 71581, "epoch": 591} {"train_loss": -34.8617057800293, "global_step": 71582, "epoch": 591} {"train_loss": -34.870399475097656, "global_step": 71583, "epoch": 591} {"train_loss": -33.458709716796875, "global_step": 71584, "epoch": 591} {"train_loss": -34.67161178588867, "global_step": 71585, "epoch": 591} {"train_loss": -34.771785736083984, "global_step": 71586, "epoch": 591} {"train_loss": -33.32283401489258, "global_step": 71587, "epoch": 591} {"train_loss": -34.07801055908203, "global_step": 71588, "epoch": 591} {"train_loss": -34.35993576049805, "global_step": 71589, "epoch": 591} {"train_loss": -34.78925704956055, "global_step": 71590, "epoch": 591} {"train_loss": -35.33652877807617, "global_step": 71591, "epoch": 591} {"train_loss": -35.90818405151367, "global_step": 71592, "epoch": 591} {"train_loss": -33.65889358520508, "global_step": 71593, "epoch": 591} {"train_loss": -35.310768127441406, "global_step": 71594, "epoch": 591} {"train_loss": -35.317726135253906, "global_step": 71595, "epoch": 591} {"train_loss": -34.85372543334961, "global_step": 71596, "epoch": 591} {"train_loss": -34.26789093017578, "global_step": 71597, "epoch": 591} {"train_loss": -34.68752670288086, "global_step": 71598, "epoch": 591} {"train_loss": -34.5617561340332, "global_step": 71599, "epoch": 591} {"train_loss": -35.20724105834961, "global_step": 71600, "epoch": 591} {"train_loss": -34.517147064208984, "global_step": 71601, "epoch": 591} {"train_loss": -35.06031036376953, "global_step": 71602, "epoch": 591} {"train_loss": -35.23075485229492, "global_step": 71603, "epoch": 591} {"train_loss": -33.472412109375, "global_step": 71604, "epoch": 591} {"train_loss": -35.22983169555664, "global_step": 71605, "epoch": 591} {"train_loss": -33.38121795654297, "global_step": 71606, "epoch": 591} {"train_loss": -35.049468994140625, "global_step": 71607, "epoch": 591} {"train_loss": -34.336795806884766, "global_step": 71608, "epoch": 591} {"train_loss": -32.66535186767578, "global_step": 71609, "epoch": 591} {"train_loss": -32.538307189941406, "global_step": 71610, "epoch": 591} {"train_loss": -30.414636611938477, "global_step": 71611, "epoch": 591} {"train_loss": -31.631000518798828, "global_step": 71612, "epoch": 591} {"train_loss": -34.7175407409668, "global_step": 71613, "epoch": 591} {"train_loss": -35.200313568115234, "global_step": 71614, "epoch": 591} {"train_loss": -34.05501174926758, "global_step": 71615, "epoch": 591} {"train_loss": -35.22834396362305, "global_step": 71616, "epoch": 591} {"train_loss": -33.86711502075195, "global_step": 71617, "epoch": 591} {"train_loss": -35.09599685668945, "global_step": 71618, "epoch": 591} {"train_loss": -33.235233306884766, "global_step": 71619, "epoch": 591} {"train_loss": -35.5897102355957, "global_step": 71620, "epoch": 591} {"train_loss": -34.369903564453125, "global_step": 71621, "epoch": 591} {"train_loss": -34.443634033203125, "global_step": 71622, "epoch": 591} {"train_loss": -35.21699142456055, "global_step": 71623, "epoch": 591} {"train_loss": -34.1244010925293, "global_step": 71624, "epoch": 591} {"train_loss": -35.08736801147461, "global_step": 71625, "epoch": 591} {"train_loss": -35.14404296875, "global_step": 71626, "epoch": 591} {"train_loss": -35.24915313720703, "global_step": 71627, "epoch": 591} {"train_loss": -34.51319122314453, "global_step": 71628, "epoch": 591} {"train_loss": -34.30632400512695, "global_step": 71629, "epoch": 591} {"train_loss": -35.01123809814453, "global_step": 71630, "epoch": 591} {"train_loss": -34.72119312444009, "global_step": 71631, "epoch": 591, "val_loss": 2485339.0} {"train_loss": -34.151241302490234, "global_step": 71632, "epoch": 592} {"train_loss": -35.801483154296875, "global_step": 71633, "epoch": 592} {"train_loss": -34.85445785522461, "global_step": 71634, "epoch": 592} {"train_loss": -36.03402328491211, "global_step": 71635, "epoch": 592} {"train_loss": -35.45844650268555, "global_step": 71636, "epoch": 592} {"train_loss": -35.81413650512695, "global_step": 71637, "epoch": 592} {"train_loss": -36.0322151184082, "global_step": 71638, "epoch": 592} {"train_loss": -35.82489013671875, "global_step": 71639, "epoch": 592} {"train_loss": -36.16509246826172, "global_step": 71640, "epoch": 592} {"train_loss": -36.198158264160156, "global_step": 71641, "epoch": 592} {"train_loss": -36.0140266418457, "global_step": 71642, "epoch": 592} {"train_loss": -36.11958312988281, "global_step": 71643, "epoch": 592} {"train_loss": -36.24690628051758, "global_step": 71644, "epoch": 592} {"train_loss": -36.44857406616211, "global_step": 71645, "epoch": 592} {"train_loss": -35.72125244140625, "global_step": 71646, "epoch": 592} {"train_loss": -36.09018325805664, "global_step": 71647, "epoch": 592} {"train_loss": -36.506771087646484, "global_step": 71648, "epoch": 592} {"train_loss": -35.7384147644043, "global_step": 71649, "epoch": 592} {"train_loss": -36.57052230834961, "global_step": 71650, "epoch": 592} {"train_loss": -36.63844680786133, "global_step": 71651, "epoch": 592} {"train_loss": -36.31742477416992, "global_step": 71652, "epoch": 592} {"train_loss": -36.860530853271484, "global_step": 71653, "epoch": 592} {"train_loss": -36.332794189453125, "global_step": 71654, "epoch": 592} {"train_loss": -36.72441864013672, "global_step": 71655, "epoch": 592} {"train_loss": -36.24689483642578, "global_step": 71656, "epoch": 592} {"train_loss": -36.682289123535156, "global_step": 71657, "epoch": 592} {"train_loss": -36.96323776245117, "global_step": 71658, "epoch": 592} {"train_loss": -36.90708541870117, "global_step": 71659, "epoch": 592} {"train_loss": -36.88312530517578, "global_step": 71660, "epoch": 592} {"train_loss": -36.81501007080078, "global_step": 71661, "epoch": 592} {"train_loss": -36.74250793457031, "global_step": 71662, "epoch": 592} {"train_loss": -36.69719314575195, "global_step": 71663, "epoch": 592} {"train_loss": -36.557228088378906, "global_step": 71664, "epoch": 592} {"train_loss": -37.36077880859375, "global_step": 71665, "epoch": 592} {"train_loss": -37.056880950927734, "global_step": 71666, "epoch": 592} {"train_loss": -37.34949493408203, "global_step": 71667, "epoch": 592} {"train_loss": -36.77654266357422, "global_step": 71668, "epoch": 592} {"train_loss": -36.411224365234375, "global_step": 71669, "epoch": 592} {"train_loss": -37.28116989135742, "global_step": 71670, "epoch": 592} {"train_loss": -37.138343811035156, "global_step": 71671, "epoch": 592} {"train_loss": -36.97602844238281, "global_step": 71672, "epoch": 592} {"train_loss": -37.323917388916016, "global_step": 71673, "epoch": 592} {"train_loss": -37.006813049316406, "global_step": 71674, "epoch": 592} {"train_loss": -37.4791259765625, "global_step": 71675, "epoch": 592} {"train_loss": -36.86138916015625, "global_step": 71676, "epoch": 592} {"train_loss": -37.34268569946289, "global_step": 71677, "epoch": 592} {"train_loss": -36.66892623901367, "global_step": 71678, "epoch": 592} {"train_loss": -37.44475173950195, "global_step": 71679, "epoch": 592} {"train_loss": -37.27830123901367, "global_step": 71680, "epoch": 592} {"train_loss": -37.451839447021484, "global_step": 71681, "epoch": 592} {"train_loss": -37.62252426147461, "global_step": 71682, "epoch": 592} {"train_loss": -36.77086639404297, "global_step": 71683, "epoch": 592} {"train_loss": -36.42653274536133, "global_step": 71684, "epoch": 592} {"train_loss": -37.464969635009766, "global_step": 71685, "epoch": 592} {"train_loss": -37.09987258911133, "global_step": 71686, "epoch": 592} {"train_loss": -37.19948196411133, "global_step": 71687, "epoch": 592} {"train_loss": -37.28019332885742, "global_step": 71688, "epoch": 592} {"train_loss": -37.11985397338867, "global_step": 71689, "epoch": 592} {"train_loss": -37.10372543334961, "global_step": 71690, "epoch": 592} {"train_loss": -37.0139045715332, "global_step": 71691, "epoch": 592} {"train_loss": -37.79182052612305, "global_step": 71692, "epoch": 592} {"train_loss": -37.2362174987793, "global_step": 71693, "epoch": 592} {"train_loss": -36.468101501464844, "global_step": 71694, "epoch": 592} {"train_loss": -37.42463302612305, "global_step": 71695, "epoch": 592} {"train_loss": -37.341129302978516, "global_step": 71696, "epoch": 592} {"train_loss": -36.318058013916016, "global_step": 71697, "epoch": 592} {"train_loss": -37.05910873413086, "global_step": 71698, "epoch": 592} {"train_loss": -37.4796257019043, "global_step": 71699, "epoch": 592} {"train_loss": -35.790340423583984, "global_step": 71700, "epoch": 592} {"train_loss": -35.452880859375, "global_step": 71701, "epoch": 592} {"train_loss": -35.233245849609375, "global_step": 71702, "epoch": 592} {"train_loss": -36.1984977722168, "global_step": 71703, "epoch": 592} {"train_loss": -37.2481803894043, "global_step": 71704, "epoch": 592} {"train_loss": -35.92228317260742, "global_step": 71705, "epoch": 592} {"train_loss": -36.79001998901367, "global_step": 71706, "epoch": 592} {"train_loss": -36.61457061767578, "global_step": 71707, "epoch": 592} {"train_loss": -36.58107376098633, "global_step": 71708, "epoch": 592} {"train_loss": -36.98480987548828, "global_step": 71709, "epoch": 592} {"train_loss": -35.777809143066406, "global_step": 71710, "epoch": 592} {"train_loss": -37.01397705078125, "global_step": 71711, "epoch": 592} {"train_loss": -34.95072937011719, "global_step": 71712, "epoch": 592} {"train_loss": -36.895965576171875, "global_step": 71713, "epoch": 592} {"train_loss": -35.9288444519043, "global_step": 71714, "epoch": 592} {"train_loss": -37.35572052001953, "global_step": 71715, "epoch": 592} {"train_loss": -36.33873748779297, "global_step": 71716, "epoch": 592} {"train_loss": -36.74837875366211, "global_step": 71717, "epoch": 592} {"train_loss": -33.81327438354492, "global_step": 71718, "epoch": 592} {"train_loss": -35.3453254699707, "global_step": 71719, "epoch": 592} {"train_loss": -36.180179595947266, "global_step": 71720, "epoch": 592} {"train_loss": -35.6488151550293, "global_step": 71721, "epoch": 592} {"train_loss": -34.676204681396484, "global_step": 71722, "epoch": 592} {"train_loss": -36.6841926574707, "global_step": 71723, "epoch": 592} {"train_loss": -36.39095687866211, "global_step": 71724, "epoch": 592} {"train_loss": -37.080074310302734, "global_step": 71725, "epoch": 592} {"train_loss": -35.0462760925293, "global_step": 71726, "epoch": 592} {"train_loss": -36.15629959106445, "global_step": 71727, "epoch": 592} {"train_loss": -36.74109649658203, "global_step": 71728, "epoch": 592} {"train_loss": -36.69844055175781, "global_step": 71729, "epoch": 592} {"train_loss": -36.21873092651367, "global_step": 71730, "epoch": 592} {"train_loss": -35.10533142089844, "global_step": 71731, "epoch": 592} {"train_loss": -35.809791564941406, "global_step": 71732, "epoch": 592} {"train_loss": -35.22317886352539, "global_step": 71733, "epoch": 592} {"train_loss": -36.28654861450195, "global_step": 71734, "epoch": 592} {"train_loss": -34.98762893676758, "global_step": 71735, "epoch": 592} {"train_loss": -35.9888801574707, "global_step": 71736, "epoch": 592} {"train_loss": -35.06166458129883, "global_step": 71737, "epoch": 592} {"train_loss": -36.223106384277344, "global_step": 71738, "epoch": 592} {"train_loss": -35.762630462646484, "global_step": 71739, "epoch": 592} {"train_loss": -36.68280792236328, "global_step": 71740, "epoch": 592} {"train_loss": -36.1663932800293, "global_step": 71741, "epoch": 592} {"train_loss": -36.41347885131836, "global_step": 71742, "epoch": 592} {"train_loss": -36.26448440551758, "global_step": 71743, "epoch": 592} {"train_loss": -36.3756217956543, "global_step": 71744, "epoch": 592} {"train_loss": -35.107173919677734, "global_step": 71745, "epoch": 592} {"train_loss": -36.82113265991211, "global_step": 71746, "epoch": 592} {"train_loss": -36.24532699584961, "global_step": 71747, "epoch": 592} {"train_loss": -35.20380783081055, "global_step": 71748, "epoch": 592} {"train_loss": -35.652137756347656, "global_step": 71749, "epoch": 592} {"train_loss": -35.69169235229492, "global_step": 71750, "epoch": 592} {"train_loss": -34.28998565673828, "global_step": 71751, "epoch": 592} {"train_loss": -36.387821197509766, "global_step": 71752, "epoch": 592, "val_loss": 2413557.75} {"train_loss": -35.974788665771484, "global_step": 71753, "epoch": 593} {"train_loss": -35.618621826171875, "global_step": 71754, "epoch": 593} {"train_loss": -34.81473922729492, "global_step": 71755, "epoch": 593} {"train_loss": -36.26551055908203, "global_step": 71756, "epoch": 593} {"train_loss": -36.12715148925781, "global_step": 71757, "epoch": 593} {"train_loss": -35.849090576171875, "global_step": 71758, "epoch": 593} {"train_loss": -36.08989334106445, "global_step": 71759, "epoch": 593} {"train_loss": -33.87458419799805, "global_step": 71760, "epoch": 593} {"train_loss": -36.55978775024414, "global_step": 71761, "epoch": 593} {"train_loss": -36.32101058959961, "global_step": 71762, "epoch": 593} {"train_loss": -34.5345344543457, "global_step": 71763, "epoch": 593} {"train_loss": -36.25926971435547, "global_step": 71764, "epoch": 593} {"train_loss": -35.79085922241211, "global_step": 71765, "epoch": 593} {"train_loss": -34.13715362548828, "global_step": 71766, "epoch": 593} {"train_loss": -35.745826721191406, "global_step": 71767, "epoch": 593} {"train_loss": -35.79237747192383, "global_step": 71768, "epoch": 593} {"train_loss": -35.1358642578125, "global_step": 71769, "epoch": 593} {"train_loss": -35.35295867919922, "global_step": 71770, "epoch": 593} {"train_loss": -31.760028839111328, "global_step": 71771, "epoch": 593} {"train_loss": -34.700435638427734, "global_step": 71772, "epoch": 593} {"train_loss": -32.614013671875, "global_step": 71773, "epoch": 593} {"train_loss": -33.2567138671875, "global_step": 71774, "epoch": 593} {"train_loss": -34.25777816772461, "global_step": 71775, "epoch": 593} {"train_loss": -34.25086975097656, "global_step": 71776, "epoch": 593} {"train_loss": -34.38446807861328, "global_step": 71777, "epoch": 593} {"train_loss": -34.22614669799805, "global_step": 71778, "epoch": 593} {"train_loss": -33.84519958496094, "global_step": 71779, "epoch": 593} {"train_loss": -34.816280364990234, "global_step": 71780, "epoch": 593} {"train_loss": -34.74296188354492, "global_step": 71781, "epoch": 593} {"train_loss": -32.83941650390625, "global_step": 71782, "epoch": 593} {"train_loss": -33.07083511352539, "global_step": 71783, "epoch": 593} {"train_loss": -32.61175537109375, "global_step": 71784, "epoch": 593} {"train_loss": -34.675750732421875, "global_step": 71785, "epoch": 593} {"train_loss": -33.934932708740234, "global_step": 71786, "epoch": 593} {"train_loss": -33.961212158203125, "global_step": 71787, "epoch": 593} {"train_loss": -33.9235725402832, "global_step": 71788, "epoch": 593} {"train_loss": -33.87344741821289, "global_step": 71789, "epoch": 593} {"train_loss": -34.5209846496582, "global_step": 71790, "epoch": 593} {"train_loss": -35.587345123291016, "global_step": 71791, "epoch": 593} {"train_loss": -35.75703048706055, "global_step": 71792, "epoch": 593} {"train_loss": -34.221614837646484, "global_step": 71793, "epoch": 593} {"train_loss": -35.03743362426758, "global_step": 71794, "epoch": 593} {"train_loss": -34.902652740478516, "global_step": 71795, "epoch": 593} {"train_loss": -33.03879928588867, "global_step": 71796, "epoch": 593} {"train_loss": -35.44301986694336, "global_step": 71797, "epoch": 593} {"train_loss": -35.97336196899414, "global_step": 71798, "epoch": 593} {"train_loss": -35.219661712646484, "global_step": 71799, "epoch": 593} {"train_loss": -35.372642517089844, "global_step": 71800, "epoch": 593} {"train_loss": -35.65603256225586, "global_step": 71801, "epoch": 593} {"train_loss": -36.09648132324219, "global_step": 71802, "epoch": 593} {"train_loss": -35.876380920410156, "global_step": 71803, "epoch": 593} {"train_loss": -34.37649154663086, "global_step": 71804, "epoch": 593} {"train_loss": -34.955318450927734, "global_step": 71805, "epoch": 593} {"train_loss": -35.31632614135742, "global_step": 71806, "epoch": 593} {"train_loss": -35.51811599731445, "global_step": 71807, "epoch": 593} {"train_loss": -34.546913146972656, "global_step": 71808, "epoch": 593} {"train_loss": -35.16773223876953, "global_step": 71809, "epoch": 593} {"train_loss": -35.732845306396484, "global_step": 71810, "epoch": 593} {"train_loss": -35.48592758178711, "global_step": 71811, "epoch": 593} {"train_loss": -36.23426055908203, "global_step": 71812, "epoch": 593} {"train_loss": -35.94914627075195, "global_step": 71813, "epoch": 593} {"train_loss": -35.89243698120117, "global_step": 71814, "epoch": 593} {"train_loss": -36.31916046142578, "global_step": 71815, "epoch": 593} {"train_loss": -35.64152908325195, "global_step": 71816, "epoch": 593} {"train_loss": -36.13291549682617, "global_step": 71817, "epoch": 593} {"train_loss": -35.92322540283203, "global_step": 71818, "epoch": 593} {"train_loss": -35.62516784667969, "global_step": 71819, "epoch": 593} {"train_loss": -36.618961334228516, "global_step": 71820, "epoch": 593} {"train_loss": -36.38762283325195, "global_step": 71821, "epoch": 593} {"train_loss": -36.200889587402344, "global_step": 71822, "epoch": 593} {"train_loss": -36.2739143371582, "global_step": 71823, "epoch": 593} {"train_loss": -36.26467514038086, "global_step": 71824, "epoch": 593} {"train_loss": -36.2181510925293, "global_step": 71825, "epoch": 593} {"train_loss": -36.404727935791016, "global_step": 71826, "epoch": 593} {"train_loss": -35.79590606689453, "global_step": 71827, "epoch": 593} {"train_loss": -37.04202651977539, "global_step": 71828, "epoch": 593} {"train_loss": -36.65199661254883, "global_step": 71829, "epoch": 593} {"train_loss": -36.59238052368164, "global_step": 71830, "epoch": 593} {"train_loss": -35.22072982788086, "global_step": 71831, "epoch": 593} {"train_loss": -35.913997650146484, "global_step": 71832, "epoch": 593} {"train_loss": -36.26611328125, "global_step": 71833, "epoch": 593} {"train_loss": -36.466365814208984, "global_step": 71834, "epoch": 593} {"train_loss": -36.174949645996094, "global_step": 71835, "epoch": 593} {"train_loss": -35.90285873413086, "global_step": 71836, "epoch": 593} {"train_loss": -35.06647491455078, "global_step": 71837, "epoch": 593} {"train_loss": -35.140411376953125, "global_step": 71838, "epoch": 593} {"train_loss": -33.1922721862793, "global_step": 71839, "epoch": 593} {"train_loss": -33.78591537475586, "global_step": 71840, "epoch": 593} {"train_loss": -35.688228607177734, "global_step": 71841, "epoch": 593} {"train_loss": -36.33097839355469, "global_step": 71842, "epoch": 593} {"train_loss": -32.96760940551758, "global_step": 71843, "epoch": 593} {"train_loss": -30.913192749023438, "global_step": 71844, "epoch": 593} {"train_loss": -35.5126953125, "global_step": 71845, "epoch": 593} {"train_loss": -34.688026428222656, "global_step": 71846, "epoch": 593} {"train_loss": -32.46641540527344, "global_step": 71847, "epoch": 593} {"train_loss": -35.049312591552734, "global_step": 71848, "epoch": 593} {"train_loss": -33.26357650756836, "global_step": 71849, "epoch": 593} {"train_loss": -35.29594039916992, "global_step": 71850, "epoch": 593} {"train_loss": -34.59257888793945, "global_step": 71851, "epoch": 593} {"train_loss": -36.7747917175293, "global_step": 71852, "epoch": 593} {"train_loss": -33.92890548706055, "global_step": 71853, "epoch": 593} {"train_loss": -36.693946838378906, "global_step": 71854, "epoch": 593} {"train_loss": -33.64020538330078, "global_step": 71855, "epoch": 593} {"train_loss": -36.32736587524414, "global_step": 71856, "epoch": 593} {"train_loss": -34.988468170166016, "global_step": 71857, "epoch": 593} {"train_loss": -34.905975341796875, "global_step": 71858, "epoch": 593} {"train_loss": -36.684200286865234, "global_step": 71859, "epoch": 593} {"train_loss": -33.8768424987793, "global_step": 71860, "epoch": 593} {"train_loss": -36.279903411865234, "global_step": 71861, "epoch": 593} {"train_loss": -34.983863830566406, "global_step": 71862, "epoch": 593} {"train_loss": -34.724056243896484, "global_step": 71863, "epoch": 593} {"train_loss": -34.50269317626953, "global_step": 71864, "epoch": 593} {"train_loss": -34.32188415527344, "global_step": 71865, "epoch": 593} {"train_loss": -35.93581771850586, "global_step": 71866, "epoch": 593} {"train_loss": -34.2696647644043, "global_step": 71867, "epoch": 593} {"train_loss": -34.85602951049805, "global_step": 71868, "epoch": 593} {"train_loss": -36.5387077331543, "global_step": 71869, "epoch": 593} {"train_loss": -34.15475082397461, "global_step": 71870, "epoch": 593} {"train_loss": -35.63393783569336, "global_step": 71871, "epoch": 593} {"train_loss": -35.59843063354492, "global_step": 71872, "epoch": 593} {"train_loss": -35.10730598386654, "global_step": 71873, "epoch": 593, "val_loss": 2496089.25} {"train_loss": -35.08380889892578, "global_step": 71874, "epoch": 594} {"train_loss": -35.47340774536133, "global_step": 71875, "epoch": 594} {"train_loss": -36.09006881713867, "global_step": 71876, "epoch": 594} {"train_loss": -36.38167190551758, "global_step": 71877, "epoch": 594} {"train_loss": -36.365196228027344, "global_step": 71878, "epoch": 594} {"train_loss": -36.21061325073242, "global_step": 71879, "epoch": 594} {"train_loss": -36.80366134643555, "global_step": 71880, "epoch": 594} {"train_loss": -36.55583572387695, "global_step": 71881, "epoch": 594} {"train_loss": -36.65975570678711, "global_step": 71882, "epoch": 594} {"train_loss": -37.112056732177734, "global_step": 71883, "epoch": 594} {"train_loss": -36.68589401245117, "global_step": 71884, "epoch": 594} {"train_loss": -36.69401168823242, "global_step": 71885, "epoch": 594} {"train_loss": -36.0478515625, "global_step": 71886, "epoch": 594} {"train_loss": -35.89216232299805, "global_step": 71887, "epoch": 594} {"train_loss": -35.864776611328125, "global_step": 71888, "epoch": 594} {"train_loss": -35.8492317199707, "global_step": 71889, "epoch": 594} {"train_loss": -35.391754150390625, "global_step": 71890, "epoch": 594} {"train_loss": -34.2621955871582, "global_step": 71891, "epoch": 594} {"train_loss": -32.644683837890625, "global_step": 71892, "epoch": 594} {"train_loss": -33.632118225097656, "global_step": 71893, "epoch": 594} {"train_loss": -36.099002838134766, "global_step": 71894, "epoch": 594} {"train_loss": -36.87948226928711, "global_step": 71895, "epoch": 594} {"train_loss": -36.21622848510742, "global_step": 71896, "epoch": 594} {"train_loss": -36.053627014160156, "global_step": 71897, "epoch": 594} {"train_loss": -36.38083267211914, "global_step": 71898, "epoch": 594} {"train_loss": -36.71982955932617, "global_step": 71899, "epoch": 594} {"train_loss": -36.66193771362305, "global_step": 71900, "epoch": 594} {"train_loss": -36.892852783203125, "global_step": 71901, "epoch": 594} {"train_loss": -36.73444747924805, "global_step": 71902, "epoch": 594} {"train_loss": -36.45728302001953, "global_step": 71903, "epoch": 594} {"train_loss": -36.229671478271484, "global_step": 71904, "epoch": 594} {"train_loss": -36.421783447265625, "global_step": 71905, "epoch": 594} {"train_loss": -37.221065521240234, "global_step": 71906, "epoch": 594} {"train_loss": -36.451416015625, "global_step": 71907, "epoch": 594} {"train_loss": -36.20277404785156, "global_step": 71908, "epoch": 594} {"train_loss": -35.93790817260742, "global_step": 71909, "epoch": 594} {"train_loss": -36.269744873046875, "global_step": 71910, "epoch": 594} {"train_loss": -35.23653030395508, "global_step": 71911, "epoch": 594} {"train_loss": -35.4005012512207, "global_step": 71912, "epoch": 594} {"train_loss": -36.021400451660156, "global_step": 71913, "epoch": 594} {"train_loss": -35.9218635559082, "global_step": 71914, "epoch": 594} {"train_loss": -36.20310592651367, "global_step": 71915, "epoch": 594} {"train_loss": -36.904109954833984, "global_step": 71916, "epoch": 594} {"train_loss": -36.067359924316406, "global_step": 71917, "epoch": 594} {"train_loss": -36.474884033203125, "global_step": 71918, "epoch": 594} {"train_loss": -35.39884567260742, "global_step": 71919, "epoch": 594} {"train_loss": -36.66537094116211, "global_step": 71920, "epoch": 594} {"train_loss": -35.984127044677734, "global_step": 71921, "epoch": 594} {"train_loss": -36.92158126831055, "global_step": 71922, "epoch": 594} {"train_loss": -36.05012130737305, "global_step": 71923, "epoch": 594} {"train_loss": -36.552284240722656, "global_step": 71924, "epoch": 594} {"train_loss": -36.66714859008789, "global_step": 71925, "epoch": 594} {"train_loss": -36.226829528808594, "global_step": 71926, "epoch": 594} {"train_loss": -36.3373908996582, "global_step": 71927, "epoch": 594} {"train_loss": -37.083499908447266, "global_step": 71928, "epoch": 594} {"train_loss": -36.767948150634766, "global_step": 71929, "epoch": 594} {"train_loss": -36.62765884399414, "global_step": 71930, "epoch": 594} {"train_loss": -36.492733001708984, "global_step": 71931, "epoch": 594} {"train_loss": -35.84122848510742, "global_step": 71932, "epoch": 594} {"train_loss": -35.80318832397461, "global_step": 71933, "epoch": 594} {"train_loss": -36.40689468383789, "global_step": 71934, "epoch": 594} {"train_loss": -36.90822982788086, "global_step": 71935, "epoch": 594} {"train_loss": -36.15841293334961, "global_step": 71936, "epoch": 594} {"train_loss": -36.353363037109375, "global_step": 71937, "epoch": 594} {"train_loss": -36.21513748168945, "global_step": 71938, "epoch": 594} {"train_loss": -35.489742279052734, "global_step": 71939, "epoch": 594} {"train_loss": -36.24217987060547, "global_step": 71940, "epoch": 594} {"train_loss": -36.110687255859375, "global_step": 71941, "epoch": 594} {"train_loss": -36.39516067504883, "global_step": 71942, "epoch": 594} {"train_loss": -36.587257385253906, "global_step": 71943, "epoch": 594} {"train_loss": -35.21010971069336, "global_step": 71944, "epoch": 594} {"train_loss": -35.41694259643555, "global_step": 71945, "epoch": 594} {"train_loss": -34.86255645751953, "global_step": 71946, "epoch": 594} {"train_loss": -35.03579330444336, "global_step": 71947, "epoch": 594} {"train_loss": -35.691158294677734, "global_step": 71948, "epoch": 594} {"train_loss": -35.3675537109375, "global_step": 71949, "epoch": 594} {"train_loss": -34.66996383666992, "global_step": 71950, "epoch": 594} {"train_loss": -35.96779251098633, "global_step": 71951, "epoch": 594} {"train_loss": -34.818763732910156, "global_step": 71952, "epoch": 594} {"train_loss": -34.81167221069336, "global_step": 71953, "epoch": 594} {"train_loss": -36.065574645996094, "global_step": 71954, "epoch": 594} {"train_loss": -35.234130859375, "global_step": 71955, "epoch": 594} {"train_loss": -34.8673210144043, "global_step": 71956, "epoch": 594} {"train_loss": -35.507347106933594, "global_step": 71957, "epoch": 594} {"train_loss": -35.12983703613281, "global_step": 71958, "epoch": 594} {"train_loss": -35.685333251953125, "global_step": 71959, "epoch": 594} {"train_loss": -36.099464416503906, "global_step": 71960, "epoch": 594} {"train_loss": -35.54169464111328, "global_step": 71961, "epoch": 594} {"train_loss": -34.874916076660156, "global_step": 71962, "epoch": 594} {"train_loss": -36.01237869262695, "global_step": 71963, "epoch": 594} {"train_loss": -36.318233489990234, "global_step": 71964, "epoch": 594} {"train_loss": -36.16927719116211, "global_step": 71965, "epoch": 594} {"train_loss": -36.326290130615234, "global_step": 71966, "epoch": 594} {"train_loss": -36.447425842285156, "global_step": 71967, "epoch": 594} {"train_loss": -35.416595458984375, "global_step": 71968, "epoch": 594} {"train_loss": -35.9008674621582, "global_step": 71969, "epoch": 594} {"train_loss": -35.98286056518555, "global_step": 71970, "epoch": 594} {"train_loss": -36.017887115478516, "global_step": 71971, "epoch": 594} {"train_loss": -35.41708755493164, "global_step": 71972, "epoch": 594} {"train_loss": -33.91995620727539, "global_step": 71973, "epoch": 594} {"train_loss": -35.93402862548828, "global_step": 71974, "epoch": 594} {"train_loss": -36.43383026123047, "global_step": 71975, "epoch": 594} {"train_loss": -36.889747619628906, "global_step": 71976, "epoch": 594} {"train_loss": -36.13961410522461, "global_step": 71977, "epoch": 594} {"train_loss": -34.70575714111328, "global_step": 71978, "epoch": 594} {"train_loss": -35.88977813720703, "global_step": 71979, "epoch": 594} {"train_loss": -35.50828170776367, "global_step": 71980, "epoch": 594} {"train_loss": -36.70410919189453, "global_step": 71981, "epoch": 594} {"train_loss": -35.62837219238281, "global_step": 71982, "epoch": 594} {"train_loss": -36.14621353149414, "global_step": 71983, "epoch": 594} {"train_loss": -36.171966552734375, "global_step": 71984, "epoch": 594} {"train_loss": -35.86376953125, "global_step": 71985, "epoch": 594} {"train_loss": -35.55198287963867, "global_step": 71986, "epoch": 594} {"train_loss": -35.368263244628906, "global_step": 71987, "epoch": 594} {"train_loss": -33.88938522338867, "global_step": 71988, "epoch": 594} {"train_loss": -33.87278366088867, "global_step": 71989, "epoch": 594} {"train_loss": -35.55492401123047, "global_step": 71990, "epoch": 594} {"train_loss": -34.7425422668457, "global_step": 71991, "epoch": 594} {"train_loss": -35.87080764770508, "global_step": 71992, "epoch": 594} {"train_loss": -34.645484924316406, "global_step": 71993, "epoch": 594} {"train_loss": -35.88390968259701, "global_step": 71994, "epoch": 594, "val_loss": 2514889.25} {"train_loss": -36.48553466796875, "global_step": 71995, "epoch": 595} {"train_loss": -35.69574737548828, "global_step": 71996, "epoch": 595} {"train_loss": -36.178428649902344, "global_step": 71997, "epoch": 595} {"train_loss": -36.28229522705078, "global_step": 71998, "epoch": 595} {"train_loss": -35.340267181396484, "global_step": 71999, "epoch": 595} {"train_loss": -36.61224365234375, "global_step": 72000, "epoch": 595} {"train_loss": -36.72610092163086, "global_step": 72001, "epoch": 595} {"train_loss": -34.471073150634766, "global_step": 72002, "epoch": 595} {"train_loss": -33.009002685546875, "global_step": 72003, "epoch": 595} {"train_loss": -36.6544189453125, "global_step": 72004, "epoch": 595} {"train_loss": -36.9796142578125, "global_step": 72005, "epoch": 595} {"train_loss": -36.61103820800781, "global_step": 72006, "epoch": 595} {"train_loss": -36.493648529052734, "global_step": 72007, "epoch": 595} {"train_loss": -35.78072738647461, "global_step": 72008, "epoch": 595} {"train_loss": -36.3804817199707, "global_step": 72009, "epoch": 595} {"train_loss": -36.5318489074707, "global_step": 72010, "epoch": 595} {"train_loss": -36.55202102661133, "global_step": 72011, "epoch": 595} {"train_loss": -34.744171142578125, "global_step": 72012, "epoch": 595} {"train_loss": -35.9400520324707, "global_step": 72013, "epoch": 595} {"train_loss": -36.45063781738281, "global_step": 72014, "epoch": 595} {"train_loss": -36.74508285522461, "global_step": 72015, "epoch": 595} {"train_loss": -36.76829147338867, "global_step": 72016, "epoch": 595} {"train_loss": -35.48609924316406, "global_step": 72017, "epoch": 595} {"train_loss": -36.65858459472656, "global_step": 72018, "epoch": 595} {"train_loss": -35.84619140625, "global_step": 72019, "epoch": 595} {"train_loss": -34.222999572753906, "global_step": 72020, "epoch": 595} {"train_loss": -32.043880462646484, "global_step": 72021, "epoch": 595} {"train_loss": -31.225677490234375, "global_step": 72022, "epoch": 595} {"train_loss": -24.890073776245117, "global_step": 72023, "epoch": 595} {"train_loss": -24.902236938476562, "global_step": 72024, "epoch": 595} {"train_loss": -27.606922149658203, "global_step": 72025, "epoch": 595} {"train_loss": -28.670873641967773, "global_step": 72026, "epoch": 595} {"train_loss": -30.644855499267578, "global_step": 72027, "epoch": 595} {"train_loss": -34.02992630004883, "global_step": 72028, "epoch": 595} {"train_loss": -31.0743408203125, "global_step": 72029, "epoch": 595} {"train_loss": -34.65956497192383, "global_step": 72030, "epoch": 595} {"train_loss": -32.7368049621582, "global_step": 72031, "epoch": 595} {"train_loss": -34.32395553588867, "global_step": 72032, "epoch": 595} {"train_loss": -31.252582550048828, "global_step": 72033, "epoch": 595} {"train_loss": -34.24591064453125, "global_step": 72034, "epoch": 595} {"train_loss": -34.040016174316406, "global_step": 72035, "epoch": 595} {"train_loss": -35.22457504272461, "global_step": 72036, "epoch": 595} {"train_loss": -33.92356491088867, "global_step": 72037, "epoch": 595} {"train_loss": -35.67633056640625, "global_step": 72038, "epoch": 595} {"train_loss": -35.01762008666992, "global_step": 72039, "epoch": 595} {"train_loss": -34.812843322753906, "global_step": 72040, "epoch": 595} {"train_loss": -35.341190338134766, "global_step": 72041, "epoch": 595} {"train_loss": -33.78154373168945, "global_step": 72042, "epoch": 595} {"train_loss": -35.49717330932617, "global_step": 72043, "epoch": 595} {"train_loss": -35.7177619934082, "global_step": 72044, "epoch": 595} {"train_loss": -34.216068267822266, "global_step": 72045, "epoch": 595} {"train_loss": -36.3870735168457, "global_step": 72046, "epoch": 595} {"train_loss": -36.00015640258789, "global_step": 72047, "epoch": 595} {"train_loss": -35.21760559082031, "global_step": 72048, "epoch": 595} {"train_loss": -36.19498062133789, "global_step": 72049, "epoch": 595} {"train_loss": -35.995521545410156, "global_step": 72050, "epoch": 595} {"train_loss": -36.27808380126953, "global_step": 72051, "epoch": 595} {"train_loss": -35.494773864746094, "global_step": 72052, "epoch": 595} {"train_loss": -36.0832633972168, "global_step": 72053, "epoch": 595} {"train_loss": -35.90446853637695, "global_step": 72054, "epoch": 595} {"train_loss": -35.73735427856445, "global_step": 72055, "epoch": 595} {"train_loss": -36.71503448486328, "global_step": 72056, "epoch": 595} {"train_loss": -36.240272521972656, "global_step": 72057, "epoch": 595} {"train_loss": -36.599761962890625, "global_step": 72058, "epoch": 595} {"train_loss": -36.5996208190918, "global_step": 72059, "epoch": 595} {"train_loss": -36.669677734375, "global_step": 72060, "epoch": 595} {"train_loss": -36.78155517578125, "global_step": 72061, "epoch": 595} {"train_loss": -36.773380279541016, "global_step": 72062, "epoch": 595} {"train_loss": -36.4830436706543, "global_step": 72063, "epoch": 595} {"train_loss": -36.4211311340332, "global_step": 72064, "epoch": 595} {"train_loss": -36.8543701171875, "global_step": 72065, "epoch": 595} {"train_loss": -37.20616912841797, "global_step": 72066, "epoch": 595} {"train_loss": -36.83982467651367, "global_step": 72067, "epoch": 595} {"train_loss": -35.71083450317383, "global_step": 72068, "epoch": 595} {"train_loss": -36.79267501831055, "global_step": 72069, "epoch": 595} {"train_loss": -36.2155876159668, "global_step": 72070, "epoch": 595} {"train_loss": -37.15834045410156, "global_step": 72071, "epoch": 595} {"train_loss": -37.242950439453125, "global_step": 72072, "epoch": 595} {"train_loss": -37.467952728271484, "global_step": 72073, "epoch": 595} {"train_loss": -37.21799850463867, "global_step": 72074, "epoch": 595} {"train_loss": -36.77116012573242, "global_step": 72075, "epoch": 595} {"train_loss": -37.08477783203125, "global_step": 72076, "epoch": 595} {"train_loss": -37.079498291015625, "global_step": 72077, "epoch": 595} {"train_loss": -36.8027229309082, "global_step": 72078, "epoch": 595} {"train_loss": -35.929500579833984, "global_step": 72079, "epoch": 595} {"train_loss": -29.664148330688477, "global_step": 72080, "epoch": 595} {"train_loss": -4.902471542358398, "global_step": 72081, "epoch": 595} {"train_loss": 21.453842163085938, "global_step": 72082, "epoch": 595} {"train_loss": -4.599002361297607, "global_step": 72083, "epoch": 595} {"train_loss": -33.44533920288086, "global_step": 72084, "epoch": 595} {"train_loss": -16.77262306213379, "global_step": 72085, "epoch": 595} {"train_loss": -32.502864837646484, "global_step": 72086, "epoch": 595} {"train_loss": -25.542348861694336, "global_step": 72087, "epoch": 595} {"train_loss": -28.219039916992188, "global_step": 72088, "epoch": 595} {"train_loss": -32.830440521240234, "global_step": 72089, "epoch": 595} {"train_loss": -27.76681900024414, "global_step": 72090, "epoch": 595} {"train_loss": -32.74381637573242, "global_step": 72091, "epoch": 595} {"train_loss": -34.06669998168945, "global_step": 72092, "epoch": 595} {"train_loss": -32.81660079956055, "global_step": 72093, "epoch": 595} {"train_loss": -33.262142181396484, "global_step": 72094, "epoch": 595} {"train_loss": -34.11505889892578, "global_step": 72095, "epoch": 595} {"train_loss": -34.51743698120117, "global_step": 72096, "epoch": 595} {"train_loss": -33.37482833862305, "global_step": 72097, "epoch": 595} {"train_loss": -33.8263053894043, "global_step": 72098, "epoch": 595} {"train_loss": -34.48675537109375, "global_step": 72099, "epoch": 595} {"train_loss": -34.7326774597168, "global_step": 72100, "epoch": 595} {"train_loss": -35.165706634521484, "global_step": 72101, "epoch": 595} {"train_loss": -34.24030685424805, "global_step": 72102, "epoch": 595} {"train_loss": -34.06807327270508, "global_step": 72103, "epoch": 595} {"train_loss": -34.47394943237305, "global_step": 72104, "epoch": 595} {"train_loss": -35.321502685546875, "global_step": 72105, "epoch": 595} {"train_loss": -35.109554290771484, "global_step": 72106, "epoch": 595} {"train_loss": -34.801021575927734, "global_step": 72107, "epoch": 595} {"train_loss": -34.997047424316406, "global_step": 72108, "epoch": 595} {"train_loss": -35.265594482421875, "global_step": 72109, "epoch": 595} {"train_loss": -35.395328521728516, "global_step": 72110, "epoch": 595} {"train_loss": -35.606201171875, "global_step": 72111, "epoch": 595} {"train_loss": -35.394012451171875, "global_step": 72112, "epoch": 595} {"train_loss": -35.6351432800293, "global_step": 72113, "epoch": 595} {"train_loss": -35.655189514160156, "global_step": 72114, "epoch": 595} {"train_loss": -33.651062701359265, "global_step": 72115, "epoch": 595, "val_loss": 2450165.75} {"train_loss": -35.697296142578125, "global_step": 72116, "epoch": 596} {"train_loss": -35.8794059753418, "global_step": 72117, "epoch": 596} {"train_loss": -35.603248596191406, "global_step": 72118, "epoch": 596} {"train_loss": -35.86332321166992, "global_step": 72119, "epoch": 596} {"train_loss": -35.918495178222656, "global_step": 72120, "epoch": 596} {"train_loss": -36.12574005126953, "global_step": 72121, "epoch": 596} {"train_loss": -35.920204162597656, "global_step": 72122, "epoch": 596} {"train_loss": -36.29642868041992, "global_step": 72123, "epoch": 596} {"train_loss": -36.213809967041016, "global_step": 72124, "epoch": 596} {"train_loss": -36.322235107421875, "global_step": 72125, "epoch": 596} {"train_loss": -36.36714553833008, "global_step": 72126, "epoch": 596} {"train_loss": -36.41432571411133, "global_step": 72127, "epoch": 596} {"train_loss": -36.36239242553711, "global_step": 72128, "epoch": 596} {"train_loss": -36.6103630065918, "global_step": 72129, "epoch": 596} {"train_loss": -36.26310348510742, "global_step": 72130, "epoch": 596} {"train_loss": -36.59771728515625, "global_step": 72131, "epoch": 596} {"train_loss": -36.59980392456055, "global_step": 72132, "epoch": 596} {"train_loss": -36.5107307434082, "global_step": 72133, "epoch": 596} {"train_loss": -36.58278274536133, "global_step": 72134, "epoch": 596} {"train_loss": -36.481239318847656, "global_step": 72135, "epoch": 596} {"train_loss": -36.9579963684082, "global_step": 72136, "epoch": 596} {"train_loss": -36.636531829833984, "global_step": 72137, "epoch": 596} {"train_loss": -36.63283157348633, "global_step": 72138, "epoch": 596} {"train_loss": -36.99813461303711, "global_step": 72139, "epoch": 596} {"train_loss": -37.006629943847656, "global_step": 72140, "epoch": 596} {"train_loss": -37.10474395751953, "global_step": 72141, "epoch": 596} {"train_loss": -36.40073013305664, "global_step": 72142, "epoch": 596} {"train_loss": -36.81197738647461, "global_step": 72143, "epoch": 596} {"train_loss": -36.9730224609375, "global_step": 72144, "epoch": 596} {"train_loss": -36.649024963378906, "global_step": 72145, "epoch": 596} {"train_loss": -36.31533432006836, "global_step": 72146, "epoch": 596} {"train_loss": -34.87877655029297, "global_step": 72147, "epoch": 596} {"train_loss": -37.08766555786133, "global_step": 72148, "epoch": 596} {"train_loss": -37.161170959472656, "global_step": 72149, "epoch": 596} {"train_loss": -36.14971160888672, "global_step": 72150, "epoch": 596} {"train_loss": -37.04225540161133, "global_step": 72151, "epoch": 596} {"train_loss": -36.47329330444336, "global_step": 72152, "epoch": 596} {"train_loss": -37.05314254760742, "global_step": 72153, "epoch": 596} {"train_loss": -37.02265167236328, "global_step": 72154, "epoch": 596} {"train_loss": -35.727996826171875, "global_step": 72155, "epoch": 596} {"train_loss": -36.855804443359375, "global_step": 72156, "epoch": 596} {"train_loss": -37.28718185424805, "global_step": 72157, "epoch": 596} {"train_loss": -36.523719787597656, "global_step": 72158, "epoch": 596} {"train_loss": -36.53770065307617, "global_step": 72159, "epoch": 596} {"train_loss": -35.39900588989258, "global_step": 72160, "epoch": 596} {"train_loss": -37.24107360839844, "global_step": 72161, "epoch": 596} {"train_loss": -35.601768493652344, "global_step": 72162, "epoch": 596} {"train_loss": -34.49442672729492, "global_step": 72163, "epoch": 596} {"train_loss": -34.086727142333984, "global_step": 72164, "epoch": 596} {"train_loss": -37.03890609741211, "global_step": 72165, "epoch": 596} {"train_loss": -35.87678146362305, "global_step": 72166, "epoch": 596} {"train_loss": -36.26296615600586, "global_step": 72167, "epoch": 596} {"train_loss": -36.611549377441406, "global_step": 72168, "epoch": 596} {"train_loss": -36.28341293334961, "global_step": 72169, "epoch": 596} {"train_loss": -36.12303924560547, "global_step": 72170, "epoch": 596} {"train_loss": -34.5289192199707, "global_step": 72171, "epoch": 596} {"train_loss": -34.80759811401367, "global_step": 72172, "epoch": 596} {"train_loss": -33.8508186340332, "global_step": 72173, "epoch": 596} {"train_loss": -33.39775466918945, "global_step": 72174, "epoch": 596} {"train_loss": -36.22749710083008, "global_step": 72175, "epoch": 596} {"train_loss": -33.344757080078125, "global_step": 72176, "epoch": 596} {"train_loss": -31.501632690429688, "global_step": 72177, "epoch": 596} {"train_loss": -35.57017135620117, "global_step": 72178, "epoch": 596} {"train_loss": -28.9678955078125, "global_step": 72179, "epoch": 596} {"train_loss": -34.94629669189453, "global_step": 72180, "epoch": 596} {"train_loss": -33.079261779785156, "global_step": 72181, "epoch": 596} {"train_loss": -32.73111343383789, "global_step": 72182, "epoch": 596} {"train_loss": -35.80720901489258, "global_step": 72183, "epoch": 596} {"train_loss": -32.31634521484375, "global_step": 72184, "epoch": 596} {"train_loss": -34.93329620361328, "global_step": 72185, "epoch": 596} {"train_loss": -35.5523567199707, "global_step": 72186, "epoch": 596} {"train_loss": -34.37139129638672, "global_step": 72187, "epoch": 596} {"train_loss": -35.62348556518555, "global_step": 72188, "epoch": 596} {"train_loss": -35.50883865356445, "global_step": 72189, "epoch": 596} {"train_loss": -34.53867721557617, "global_step": 72190, "epoch": 596} {"train_loss": -34.71415710449219, "global_step": 72191, "epoch": 596} {"train_loss": -35.509944915771484, "global_step": 72192, "epoch": 596} {"train_loss": -35.65906524658203, "global_step": 72193, "epoch": 596} {"train_loss": -35.959659576416016, "global_step": 72194, "epoch": 596} {"train_loss": -35.02022933959961, "global_step": 72195, "epoch": 596} {"train_loss": -35.46867752075195, "global_step": 72196, "epoch": 596} {"train_loss": -34.31092071533203, "global_step": 72197, "epoch": 596} {"train_loss": -35.977516174316406, "global_step": 72198, "epoch": 596} {"train_loss": -35.50270462036133, "global_step": 72199, "epoch": 596} {"train_loss": -35.94175338745117, "global_step": 72200, "epoch": 596} {"train_loss": -35.3720588684082, "global_step": 72201, "epoch": 596} {"train_loss": -35.52234649658203, "global_step": 72202, "epoch": 596} {"train_loss": -35.6229362487793, "global_step": 72203, "epoch": 596} {"train_loss": -36.37017822265625, "global_step": 72204, "epoch": 596} {"train_loss": -36.52040100097656, "global_step": 72205, "epoch": 596} {"train_loss": -35.917015075683594, "global_step": 72206, "epoch": 596} {"train_loss": -36.18159866333008, "global_step": 72207, "epoch": 596} {"train_loss": -36.243099212646484, "global_step": 72208, "epoch": 596} {"train_loss": -36.609107971191406, "global_step": 72209, "epoch": 596} {"train_loss": -36.27083969116211, "global_step": 72210, "epoch": 596} {"train_loss": -35.99201965332031, "global_step": 72211, "epoch": 596} {"train_loss": -36.5329475402832, "global_step": 72212, "epoch": 596} {"train_loss": -35.72257995605469, "global_step": 72213, "epoch": 596} {"train_loss": -35.67245101928711, "global_step": 72214, "epoch": 596} {"train_loss": -35.070037841796875, "global_step": 72215, "epoch": 596} {"train_loss": -36.33424758911133, "global_step": 72216, "epoch": 596} {"train_loss": -36.05965042114258, "global_step": 72217, "epoch": 596} {"train_loss": -35.22993850708008, "global_step": 72218, "epoch": 596} {"train_loss": -34.711769104003906, "global_step": 72219, "epoch": 596} {"train_loss": -35.03902053833008, "global_step": 72220, "epoch": 596} {"train_loss": -36.12886428833008, "global_step": 72221, "epoch": 596} {"train_loss": -36.955020904541016, "global_step": 72222, "epoch": 596} {"train_loss": -36.35343551635742, "global_step": 72223, "epoch": 596} {"train_loss": -36.19047164916992, "global_step": 72224, "epoch": 596} {"train_loss": -36.18621063232422, "global_step": 72225, "epoch": 596} {"train_loss": -36.356624603271484, "global_step": 72226, "epoch": 596} {"train_loss": -35.45758056640625, "global_step": 72227, "epoch": 596} {"train_loss": -35.91622543334961, "global_step": 72228, "epoch": 596} {"train_loss": -36.53790283203125, "global_step": 72229, "epoch": 596} {"train_loss": -36.218074798583984, "global_step": 72230, "epoch": 596} {"train_loss": -35.74056625366211, "global_step": 72231, "epoch": 596} {"train_loss": -36.228614807128906, "global_step": 72232, "epoch": 596} {"train_loss": -36.56760787963867, "global_step": 72233, "epoch": 596} {"train_loss": -36.1835823059082, "global_step": 72234, "epoch": 596} {"train_loss": -36.218177795410156, "global_step": 72235, "epoch": 596} {"train_loss": -35.80098352353435, "global_step": 72236, "epoch": 596, "val_loss": 2499242.0} {"train_loss": -36.32807159423828, "global_step": 72237, "epoch": 597} {"train_loss": -36.96462631225586, "global_step": 72238, "epoch": 597} {"train_loss": -36.375038146972656, "global_step": 72239, "epoch": 597} {"train_loss": -35.700927734375, "global_step": 72240, "epoch": 597} {"train_loss": -35.45864486694336, "global_step": 72241, "epoch": 597} {"train_loss": -36.564064025878906, "global_step": 72242, "epoch": 597} {"train_loss": -36.320106506347656, "global_step": 72243, "epoch": 597} {"train_loss": -36.39116668701172, "global_step": 72244, "epoch": 597} {"train_loss": -36.17877960205078, "global_step": 72245, "epoch": 597} {"train_loss": -36.21017837524414, "global_step": 72246, "epoch": 597} {"train_loss": -37.209232330322266, "global_step": 72247, "epoch": 597} {"train_loss": -35.73857879638672, "global_step": 72248, "epoch": 597} {"train_loss": -36.64732360839844, "global_step": 72249, "epoch": 597} {"train_loss": -36.373348236083984, "global_step": 72250, "epoch": 597} {"train_loss": -36.03257369995117, "global_step": 72251, "epoch": 597} {"train_loss": -37.23970413208008, "global_step": 72252, "epoch": 597} {"train_loss": -36.287261962890625, "global_step": 72253, "epoch": 597} {"train_loss": -36.70172882080078, "global_step": 72254, "epoch": 597} {"train_loss": -36.890464782714844, "global_step": 72255, "epoch": 597} {"train_loss": -36.406795501708984, "global_step": 72256, "epoch": 597} {"train_loss": -36.7888298034668, "global_step": 72257, "epoch": 597} {"train_loss": -36.743316650390625, "global_step": 72258, "epoch": 597} {"train_loss": -35.71458053588867, "global_step": 72259, "epoch": 597} {"train_loss": -36.03407669067383, "global_step": 72260, "epoch": 597} {"train_loss": -36.80076217651367, "global_step": 72261, "epoch": 597} {"train_loss": -37.32633590698242, "global_step": 72262, "epoch": 597} {"train_loss": -37.028358459472656, "global_step": 72263, "epoch": 597} {"train_loss": -36.93682861328125, "global_step": 72264, "epoch": 597} {"train_loss": -36.70956039428711, "global_step": 72265, "epoch": 597} {"train_loss": -37.37635803222656, "global_step": 72266, "epoch": 597} {"train_loss": -37.60704040527344, "global_step": 72267, "epoch": 597} {"train_loss": -36.948516845703125, "global_step": 72268, "epoch": 597} {"train_loss": -36.80533981323242, "global_step": 72269, "epoch": 597} {"train_loss": -37.354888916015625, "global_step": 72270, "epoch": 597} {"train_loss": -37.39063262939453, "global_step": 72271, "epoch": 597} {"train_loss": -36.39252853393555, "global_step": 72272, "epoch": 597} {"train_loss": -37.124061584472656, "global_step": 72273, "epoch": 597} {"train_loss": -37.02109146118164, "global_step": 72274, "epoch": 597} {"train_loss": -37.40120315551758, "global_step": 72275, "epoch": 597} {"train_loss": -37.5670280456543, "global_step": 72276, "epoch": 597} {"train_loss": -37.48115158081055, "global_step": 72277, "epoch": 597} {"train_loss": -36.63595199584961, "global_step": 72278, "epoch": 597} {"train_loss": -36.99292755126953, "global_step": 72279, "epoch": 597} {"train_loss": -37.773231506347656, "global_step": 72280, "epoch": 597} {"train_loss": -36.966060638427734, "global_step": 72281, "epoch": 597} {"train_loss": -37.07001876831055, "global_step": 72282, "epoch": 597} {"train_loss": -35.762794494628906, "global_step": 72283, "epoch": 597} {"train_loss": -36.72368621826172, "global_step": 72284, "epoch": 597} {"train_loss": -37.196128845214844, "global_step": 72285, "epoch": 597} {"train_loss": -36.34705352783203, "global_step": 72286, "epoch": 597} {"train_loss": -35.80364990234375, "global_step": 72287, "epoch": 597} {"train_loss": -34.65806198120117, "global_step": 72288, "epoch": 597} {"train_loss": -34.46059036254883, "global_step": 72289, "epoch": 597} {"train_loss": -35.42070388793945, "global_step": 72290, "epoch": 597} {"train_loss": -36.594234466552734, "global_step": 72291, "epoch": 597} {"train_loss": -33.83419418334961, "global_step": 72292, "epoch": 597} {"train_loss": -35.024078369140625, "global_step": 72293, "epoch": 597} {"train_loss": -32.9472770690918, "global_step": 72294, "epoch": 597} {"train_loss": -33.96294021606445, "global_step": 72295, "epoch": 597} {"train_loss": -35.30440139770508, "global_step": 72296, "epoch": 597} {"train_loss": -35.320526123046875, "global_step": 72297, "epoch": 597} {"train_loss": -34.25935745239258, "global_step": 72298, "epoch": 597} {"train_loss": -33.22090530395508, "global_step": 72299, "epoch": 597} {"train_loss": -31.567724227905273, "global_step": 72300, "epoch": 597} {"train_loss": -35.92522048950195, "global_step": 72301, "epoch": 597} {"train_loss": -32.61613082885742, "global_step": 72302, "epoch": 597} {"train_loss": -35.963134765625, "global_step": 72303, "epoch": 597} {"train_loss": -34.74076461791992, "global_step": 72304, "epoch": 597} {"train_loss": -34.756629943847656, "global_step": 72305, "epoch": 597} {"train_loss": -36.22922897338867, "global_step": 72306, "epoch": 597} {"train_loss": -35.450130462646484, "global_step": 72307, "epoch": 597} {"train_loss": -34.68842697143555, "global_step": 72308, "epoch": 597} {"train_loss": -36.46328353881836, "global_step": 72309, "epoch": 597} {"train_loss": -35.23768997192383, "global_step": 72310, "epoch": 597} {"train_loss": -35.37501907348633, "global_step": 72311, "epoch": 597} {"train_loss": -36.49103927612305, "global_step": 72312, "epoch": 597} {"train_loss": -33.88992691040039, "global_step": 72313, "epoch": 597} {"train_loss": -35.06760787963867, "global_step": 72314, "epoch": 597} {"train_loss": -36.10944366455078, "global_step": 72315, "epoch": 597} {"train_loss": -35.599693298339844, "global_step": 72316, "epoch": 597} {"train_loss": -36.252235412597656, "global_step": 72317, "epoch": 597} {"train_loss": -35.759151458740234, "global_step": 72318, "epoch": 597} {"train_loss": -36.33636474609375, "global_step": 72319, "epoch": 597} {"train_loss": -36.3309211730957, "global_step": 72320, "epoch": 597} {"train_loss": -36.49005126953125, "global_step": 72321, "epoch": 597} {"train_loss": -36.65098571777344, "global_step": 72322, "epoch": 597} {"train_loss": -35.93159484863281, "global_step": 72323, "epoch": 597} {"train_loss": -36.87551498413086, "global_step": 72324, "epoch": 597} {"train_loss": -36.65058135986328, "global_step": 72325, "epoch": 597} {"train_loss": -36.215789794921875, "global_step": 72326, "epoch": 597} {"train_loss": -35.27845001220703, "global_step": 72327, "epoch": 597} {"train_loss": -36.26747131347656, "global_step": 72328, "epoch": 597} {"train_loss": -35.90918731689453, "global_step": 72329, "epoch": 597} {"train_loss": -35.704097747802734, "global_step": 72330, "epoch": 597} {"train_loss": -34.8393669128418, "global_step": 72331, "epoch": 597} {"train_loss": -33.751644134521484, "global_step": 72332, "epoch": 597} {"train_loss": -34.046260833740234, "global_step": 72333, "epoch": 597} {"train_loss": -34.38075256347656, "global_step": 72334, "epoch": 597} {"train_loss": -36.29267501831055, "global_step": 72335, "epoch": 597} {"train_loss": -36.43500518798828, "global_step": 72336, "epoch": 597} {"train_loss": -36.53102493286133, "global_step": 72337, "epoch": 597} {"train_loss": -35.51230239868164, "global_step": 72338, "epoch": 597} {"train_loss": -35.3975830078125, "global_step": 72339, "epoch": 597} {"train_loss": -36.625877380371094, "global_step": 72340, "epoch": 597} {"train_loss": -34.8177490234375, "global_step": 72341, "epoch": 597} {"train_loss": -36.43048095703125, "global_step": 72342, "epoch": 597} {"train_loss": -36.062713623046875, "global_step": 72343, "epoch": 597} {"train_loss": -36.15073013305664, "global_step": 72344, "epoch": 597} {"train_loss": -35.35791015625, "global_step": 72345, "epoch": 597} {"train_loss": -35.758544921875, "global_step": 72346, "epoch": 597} {"train_loss": -35.95163345336914, "global_step": 72347, "epoch": 597} {"train_loss": -36.39453887939453, "global_step": 72348, "epoch": 597} {"train_loss": -35.90998458862305, "global_step": 72349, "epoch": 597} {"train_loss": -36.05593490600586, "global_step": 72350, "epoch": 597} {"train_loss": -35.58790969848633, "global_step": 72351, "epoch": 597} {"train_loss": -36.7096061706543, "global_step": 72352, "epoch": 597} {"train_loss": -36.0080451965332, "global_step": 72353, "epoch": 597} {"train_loss": -34.59588623046875, "global_step": 72354, "epoch": 597} {"train_loss": -33.30254364013672, "global_step": 72355, "epoch": 597} {"train_loss": -33.53196716308594, "global_step": 72356, "epoch": 597} {"train_loss": -35.920438356635984, "global_step": 72357, "epoch": 597, "val_loss": 2555959.0} {"train_loss": -35.3495979309082, "global_step": 72358, "epoch": 598} {"train_loss": -35.70621109008789, "global_step": 72359, "epoch": 598} {"train_loss": -35.89439010620117, "global_step": 72360, "epoch": 598} {"train_loss": -34.8648567199707, "global_step": 72361, "epoch": 598} {"train_loss": -35.2255744934082, "global_step": 72362, "epoch": 598} {"train_loss": -35.85097122192383, "global_step": 72363, "epoch": 598} {"train_loss": -34.82731246948242, "global_step": 72364, "epoch": 598} {"train_loss": -35.6787109375, "global_step": 72365, "epoch": 598} {"train_loss": -34.14217758178711, "global_step": 72366, "epoch": 598} {"train_loss": -33.82853317260742, "global_step": 72367, "epoch": 598} {"train_loss": -35.546993255615234, "global_step": 72368, "epoch": 598} {"train_loss": -36.3034782409668, "global_step": 72369, "epoch": 598} {"train_loss": -35.42470932006836, "global_step": 72370, "epoch": 598} {"train_loss": -36.20524597167969, "global_step": 72371, "epoch": 598} {"train_loss": -32.11560821533203, "global_step": 72372, "epoch": 598} {"train_loss": -35.40536117553711, "global_step": 72373, "epoch": 598} {"train_loss": -35.973716735839844, "global_step": 72374, "epoch": 598} {"train_loss": -34.66075897216797, "global_step": 72375, "epoch": 598} {"train_loss": -36.33559799194336, "global_step": 72376, "epoch": 598} {"train_loss": -35.622798919677734, "global_step": 72377, "epoch": 598} {"train_loss": -34.73317337036133, "global_step": 72378, "epoch": 598} {"train_loss": -31.213300704956055, "global_step": 72379, "epoch": 598} {"train_loss": -35.35258865356445, "global_step": 72380, "epoch": 598} {"train_loss": -36.800045013427734, "global_step": 72381, "epoch": 598} {"train_loss": -34.41679763793945, "global_step": 72382, "epoch": 598} {"train_loss": -33.44834518432617, "global_step": 72383, "epoch": 598} {"train_loss": -35.513057708740234, "global_step": 72384, "epoch": 598} {"train_loss": -35.95386505126953, "global_step": 72385, "epoch": 598} {"train_loss": -35.31061553955078, "global_step": 72386, "epoch": 598} {"train_loss": -35.64352035522461, "global_step": 72387, "epoch": 598} {"train_loss": -36.003597259521484, "global_step": 72388, "epoch": 598} {"train_loss": -35.49813461303711, "global_step": 72389, "epoch": 598} {"train_loss": -32.58935546875, "global_step": 72390, "epoch": 598} {"train_loss": -35.52511215209961, "global_step": 72391, "epoch": 598} {"train_loss": -36.02909469604492, "global_step": 72392, "epoch": 598} {"train_loss": -35.11967849731445, "global_step": 72393, "epoch": 598} {"train_loss": -36.14085006713867, "global_step": 72394, "epoch": 598} {"train_loss": -35.85235595703125, "global_step": 72395, "epoch": 598} {"train_loss": -35.6069450378418, "global_step": 72396, "epoch": 598} {"train_loss": -35.94684982299805, "global_step": 72397, "epoch": 598} {"train_loss": -36.03776168823242, "global_step": 72398, "epoch": 598} {"train_loss": -34.48212432861328, "global_step": 72399, "epoch": 598} {"train_loss": -34.16024398803711, "global_step": 72400, "epoch": 598} {"train_loss": -36.11591720581055, "global_step": 72401, "epoch": 598} {"train_loss": -36.0122184753418, "global_step": 72402, "epoch": 598} {"train_loss": -36.06657791137695, "global_step": 72403, "epoch": 598} {"train_loss": -35.270233154296875, "global_step": 72404, "epoch": 598} {"train_loss": -35.91987228393555, "global_step": 72405, "epoch": 598} {"train_loss": -30.521162033081055, "global_step": 72406, "epoch": 598} {"train_loss": -36.234798431396484, "global_step": 72407, "epoch": 598} {"train_loss": -35.570960998535156, "global_step": 72408, "epoch": 598} {"train_loss": -35.73237228393555, "global_step": 72409, "epoch": 598} {"train_loss": -36.017967224121094, "global_step": 72410, "epoch": 598} {"train_loss": -34.913734436035156, "global_step": 72411, "epoch": 598} {"train_loss": -36.25252151489258, "global_step": 72412, "epoch": 598} {"train_loss": -36.68970489501953, "global_step": 72413, "epoch": 598} {"train_loss": -36.1188850402832, "global_step": 72414, "epoch": 598} {"train_loss": -36.20246124267578, "global_step": 72415, "epoch": 598} {"train_loss": -36.289669036865234, "global_step": 72416, "epoch": 598} {"train_loss": -36.1539421081543, "global_step": 72417, "epoch": 598} {"train_loss": -36.62727737426758, "global_step": 72418, "epoch": 598} {"train_loss": -35.9713249206543, "global_step": 72419, "epoch": 598} {"train_loss": -36.408050537109375, "global_step": 72420, "epoch": 598} {"train_loss": -36.67330551147461, "global_step": 72421, "epoch": 598} {"train_loss": -36.17981719970703, "global_step": 72422, "epoch": 598} {"train_loss": -35.4089241027832, "global_step": 72423, "epoch": 598} {"train_loss": -36.44747543334961, "global_step": 72424, "epoch": 598} {"train_loss": -36.36893081665039, "global_step": 72425, "epoch": 598} {"train_loss": -36.03535079956055, "global_step": 72426, "epoch": 598} {"train_loss": -35.94022750854492, "global_step": 72427, "epoch": 598} {"train_loss": -35.924598693847656, "global_step": 72428, "epoch": 598} {"train_loss": -35.85313034057617, "global_step": 72429, "epoch": 598} {"train_loss": -36.26784133911133, "global_step": 72430, "epoch": 598} {"train_loss": -36.02635955810547, "global_step": 72431, "epoch": 598} {"train_loss": -36.0728874206543, "global_step": 72432, "epoch": 598} {"train_loss": -36.21363067626953, "global_step": 72433, "epoch": 598} {"train_loss": -35.27528762817383, "global_step": 72434, "epoch": 598} {"train_loss": -35.591121673583984, "global_step": 72435, "epoch": 598} {"train_loss": -35.93231964111328, "global_step": 72436, "epoch": 598} {"train_loss": -34.580078125, "global_step": 72437, "epoch": 598} {"train_loss": -36.31744384765625, "global_step": 72438, "epoch": 598} {"train_loss": -33.42454147338867, "global_step": 72439, "epoch": 598} {"train_loss": -29.791324615478516, "global_step": 72440, "epoch": 598} {"train_loss": -26.641202926635742, "global_step": 72441, "epoch": 598} {"train_loss": -29.498823165893555, "global_step": 72442, "epoch": 598} {"train_loss": -33.018157958984375, "global_step": 72443, "epoch": 598} {"train_loss": -27.891767501831055, "global_step": 72444, "epoch": 598} {"train_loss": -32.01922607421875, "global_step": 72445, "epoch": 598} {"train_loss": -33.12578582763672, "global_step": 72446, "epoch": 598} {"train_loss": -31.62590980529785, "global_step": 72447, "epoch": 598} {"train_loss": -34.20522689819336, "global_step": 72448, "epoch": 598} {"train_loss": -34.24951171875, "global_step": 72449, "epoch": 598} {"train_loss": -34.348663330078125, "global_step": 72450, "epoch": 598} {"train_loss": -34.56290817260742, "global_step": 72451, "epoch": 598} {"train_loss": -35.96419143676758, "global_step": 72452, "epoch": 598} {"train_loss": -34.71639633178711, "global_step": 72453, "epoch": 598} {"train_loss": -33.91141891479492, "global_step": 72454, "epoch": 598} {"train_loss": -35.015621185302734, "global_step": 72455, "epoch": 598} {"train_loss": -35.31422805786133, "global_step": 72456, "epoch": 598} {"train_loss": -34.203346252441406, "global_step": 72457, "epoch": 598} {"train_loss": -35.423805236816406, "global_step": 72458, "epoch": 598} {"train_loss": -35.10602569580078, "global_step": 72459, "epoch": 598} {"train_loss": -35.241004943847656, "global_step": 72460, "epoch": 598} {"train_loss": -35.31437683105469, "global_step": 72461, "epoch": 598} {"train_loss": -36.067237854003906, "global_step": 72462, "epoch": 598} {"train_loss": -35.689876556396484, "global_step": 72463, "epoch": 598} {"train_loss": -35.93522262573242, "global_step": 72464, "epoch": 598} {"train_loss": -36.02082061767578, "global_step": 72465, "epoch": 598} {"train_loss": -35.93069076538086, "global_step": 72466, "epoch": 598} {"train_loss": -35.653560638427734, "global_step": 72467, "epoch": 598} {"train_loss": -35.41543197631836, "global_step": 72468, "epoch": 598} {"train_loss": -35.90147018432617, "global_step": 72469, "epoch": 598} {"train_loss": -36.3358039855957, "global_step": 72470, "epoch": 598} {"train_loss": -36.09036636352539, "global_step": 72471, "epoch": 598} {"train_loss": -35.9857063293457, "global_step": 72472, "epoch": 598} {"train_loss": -36.27396011352539, "global_step": 72473, "epoch": 598} {"train_loss": -35.729488372802734, "global_step": 72474, "epoch": 598} {"train_loss": -36.318626403808594, "global_step": 72475, "epoch": 598} {"train_loss": -35.80672836303711, "global_step": 72476, "epoch": 598} {"train_loss": -36.214111328125, "global_step": 72477, "epoch": 598} {"train_loss": -35.128514691817855, "global_step": 72478, "epoch": 598, "val_loss": 2570953.75} {"train_loss": -36.28089141845703, "global_step": 72479, "epoch": 599} {"train_loss": -36.29343795776367, "global_step": 72480, "epoch": 599} {"train_loss": -34.7667350769043, "global_step": 72481, "epoch": 599} {"train_loss": -36.7501335144043, "global_step": 72482, "epoch": 599} {"train_loss": -36.449493408203125, "global_step": 72483, "epoch": 599} {"train_loss": -37.003719329833984, "global_step": 72484, "epoch": 599} {"train_loss": -37.16386413574219, "global_step": 72485, "epoch": 599} {"train_loss": -36.77180099487305, "global_step": 72486, "epoch": 599} {"train_loss": -35.67226791381836, "global_step": 72487, "epoch": 599} {"train_loss": -36.8237419128418, "global_step": 72488, "epoch": 599} {"train_loss": -36.70490646362305, "global_step": 72489, "epoch": 599} {"train_loss": -37.13616943359375, "global_step": 72490, "epoch": 599} {"train_loss": -37.03867721557617, "global_step": 72491, "epoch": 599} {"train_loss": -36.18896484375, "global_step": 72492, "epoch": 599} {"train_loss": -36.960426330566406, "global_step": 72493, "epoch": 599} {"train_loss": -36.3847541809082, "global_step": 72494, "epoch": 599} {"train_loss": -37.11452865600586, "global_step": 72495, "epoch": 599} {"train_loss": -35.43960952758789, "global_step": 72496, "epoch": 599} {"train_loss": -37.16620635986328, "global_step": 72497, "epoch": 599} {"train_loss": -36.83504104614258, "global_step": 72498, "epoch": 599} {"train_loss": -37.0747184753418, "global_step": 72499, "epoch": 599} {"train_loss": -36.74650955200195, "global_step": 72500, "epoch": 599} {"train_loss": -37.23289108276367, "global_step": 72501, "epoch": 599} {"train_loss": -36.820796966552734, "global_step": 72502, "epoch": 599} {"train_loss": -37.183013916015625, "global_step": 72503, "epoch": 599} {"train_loss": -36.7776985168457, "global_step": 72504, "epoch": 599} {"train_loss": -36.97587966918945, "global_step": 72505, "epoch": 599} {"train_loss": -36.85183334350586, "global_step": 72506, "epoch": 599} {"train_loss": -35.95519256591797, "global_step": 72507, "epoch": 599} {"train_loss": -36.07640838623047, "global_step": 72508, "epoch": 599} {"train_loss": -36.532527923583984, "global_step": 72509, "epoch": 599} {"train_loss": -37.121768951416016, "global_step": 72510, "epoch": 599} {"train_loss": -36.5006103515625, "global_step": 72511, "epoch": 599} {"train_loss": -35.002010345458984, "global_step": 72512, "epoch": 599} {"train_loss": -31.161773681640625, "global_step": 72513, "epoch": 599} {"train_loss": -27.514307022094727, "global_step": 72514, "epoch": 599} {"train_loss": -33.51900100708008, "global_step": 72515, "epoch": 599} {"train_loss": -35.628265380859375, "global_step": 72516, "epoch": 599} {"train_loss": -32.66752243041992, "global_step": 72517, "epoch": 599} {"train_loss": -32.818336486816406, "global_step": 72518, "epoch": 599} {"train_loss": -35.901153564453125, "global_step": 72519, "epoch": 599} {"train_loss": -32.72290802001953, "global_step": 72520, "epoch": 599} {"train_loss": -32.79295349121094, "global_step": 72521, "epoch": 599} {"train_loss": -36.54153060913086, "global_step": 72522, "epoch": 599} {"train_loss": -33.07120895385742, "global_step": 72523, "epoch": 599} {"train_loss": -36.31867599487305, "global_step": 72524, "epoch": 599} {"train_loss": -35.8216667175293, "global_step": 72525, "epoch": 599} {"train_loss": -36.13616943359375, "global_step": 72526, "epoch": 599} {"train_loss": -34.94111633300781, "global_step": 72527, "epoch": 599} {"train_loss": -35.510223388671875, "global_step": 72528, "epoch": 599} {"train_loss": -36.59339141845703, "global_step": 72529, "epoch": 599} {"train_loss": -36.05227279663086, "global_step": 72530, "epoch": 599} {"train_loss": -36.28968048095703, "global_step": 72531, "epoch": 599} {"train_loss": -35.5010986328125, "global_step": 72532, "epoch": 599} {"train_loss": -35.81489944458008, "global_step": 72533, "epoch": 599} {"train_loss": -36.31515121459961, "global_step": 72534, "epoch": 599} {"train_loss": -35.87355041503906, "global_step": 72535, "epoch": 599} {"train_loss": -36.82015609741211, "global_step": 72536, "epoch": 599} {"train_loss": -36.190773010253906, "global_step": 72537, "epoch": 599} {"train_loss": -36.20654296875, "global_step": 72538, "epoch": 599} {"train_loss": -35.88481521606445, "global_step": 72539, "epoch": 599} {"train_loss": -35.99721145629883, "global_step": 72540, "epoch": 599} {"train_loss": -36.49774169921875, "global_step": 72541, "epoch": 599} {"train_loss": -36.49321746826172, "global_step": 72542, "epoch": 599} {"train_loss": -35.73247146606445, "global_step": 72543, "epoch": 599} {"train_loss": -36.63370895385742, "global_step": 72544, "epoch": 599} {"train_loss": -36.26475143432617, "global_step": 72545, "epoch": 599} {"train_loss": -36.959678649902344, "global_step": 72546, "epoch": 599} {"train_loss": -36.948482513427734, "global_step": 72547, "epoch": 599} {"train_loss": -36.52959060668945, "global_step": 72548, "epoch": 599} {"train_loss": -36.99533462524414, "global_step": 72549, "epoch": 599} {"train_loss": -36.80522918701172, "global_step": 72550, "epoch": 599} {"train_loss": -36.240020751953125, "global_step": 72551, "epoch": 599} {"train_loss": -36.860679626464844, "global_step": 72552, "epoch": 599} {"train_loss": -36.91516876220703, "global_step": 72553, "epoch": 599} {"train_loss": -36.999664306640625, "global_step": 72554, "epoch": 599} {"train_loss": -36.42095947265625, "global_step": 72555, "epoch": 599} {"train_loss": -37.37961959838867, "global_step": 72556, "epoch": 599} {"train_loss": -36.800872802734375, "global_step": 72557, "epoch": 599} {"train_loss": -36.70647048950195, "global_step": 72558, "epoch": 599} {"train_loss": -37.26713180541992, "global_step": 72559, "epoch": 599} {"train_loss": -37.27952575683594, "global_step": 72560, "epoch": 599} {"train_loss": -36.644954681396484, "global_step": 72561, "epoch": 599} {"train_loss": -36.509246826171875, "global_step": 72562, "epoch": 599} {"train_loss": -37.001583099365234, "global_step": 72563, "epoch": 599} {"train_loss": -37.20229721069336, "global_step": 72564, "epoch": 599} {"train_loss": -37.2218132019043, "global_step": 72565, "epoch": 599} {"train_loss": -36.97163009643555, "global_step": 72566, "epoch": 599} {"train_loss": -37.02396774291992, "global_step": 72567, "epoch": 599} {"train_loss": -36.90030288696289, "global_step": 72568, "epoch": 599} {"train_loss": -36.07331466674805, "global_step": 72569, "epoch": 599} {"train_loss": -36.98146438598633, "global_step": 72570, "epoch": 599} {"train_loss": -36.45400619506836, "global_step": 72571, "epoch": 599} {"train_loss": -37.22140884399414, "global_step": 72572, "epoch": 599} {"train_loss": -36.56874465942383, "global_step": 72573, "epoch": 599} {"train_loss": -36.865211486816406, "global_step": 72574, "epoch": 599} {"train_loss": -36.68687057495117, "global_step": 72575, "epoch": 599} {"train_loss": -36.33296585083008, "global_step": 72576, "epoch": 599} {"train_loss": -34.8192138671875, "global_step": 72577, "epoch": 599} {"train_loss": -36.45356369018555, "global_step": 72578, "epoch": 599} {"train_loss": -37.24357986450195, "global_step": 72579, "epoch": 599} {"train_loss": -35.46358871459961, "global_step": 72580, "epoch": 599} {"train_loss": -36.44771957397461, "global_step": 72581, "epoch": 599} {"train_loss": -35.43415451049805, "global_step": 72582, "epoch": 599} {"train_loss": -36.78120422363281, "global_step": 72583, "epoch": 599} {"train_loss": -37.142494201660156, "global_step": 72584, "epoch": 599} {"train_loss": -34.84071731567383, "global_step": 72585, "epoch": 599} {"train_loss": -35.89994430541992, "global_step": 72586, "epoch": 599} {"train_loss": -36.768707275390625, "global_step": 72587, "epoch": 599} {"train_loss": -34.77012252807617, "global_step": 72588, "epoch": 599} {"train_loss": -35.50272750854492, "global_step": 72589, "epoch": 599} {"train_loss": -36.1780891418457, "global_step": 72590, "epoch": 599} {"train_loss": -33.55725860595703, "global_step": 72591, "epoch": 599} {"train_loss": -35.86376953125, "global_step": 72592, "epoch": 599} {"train_loss": -35.78948211669922, "global_step": 72593, "epoch": 599} {"train_loss": -35.88405990600586, "global_step": 72594, "epoch": 599} {"train_loss": -36.18024826049805, "global_step": 72595, "epoch": 599} {"train_loss": -35.64875411987305, "global_step": 72596, "epoch": 599} {"train_loss": -35.42845916748047, "global_step": 72597, "epoch": 599} {"train_loss": -36.09162521362305, "global_step": 72598, "epoch": 599} {"train_loss": -36.09636576313618, "global_step": 72599, "epoch": 599, "val_loss": 2638559.25} {"train_loss": -36.86677932739258, "global_step": 72600, "epoch": 600} {"train_loss": -36.28181457519531, "global_step": 72601, "epoch": 600} {"train_loss": -35.98189926147461, "global_step": 72602, "epoch": 600} {"train_loss": -37.08236312866211, "global_step": 72603, "epoch": 600} {"train_loss": -35.56855392456055, "global_step": 72604, "epoch": 600} {"train_loss": -35.883182525634766, "global_step": 72605, "epoch": 600} {"train_loss": -34.53434371948242, "global_step": 72606, "epoch": 600} {"train_loss": -36.36392593383789, "global_step": 72607, "epoch": 600} {"train_loss": -36.5588264465332, "global_step": 72608, "epoch": 600} {"train_loss": -36.20245361328125, "global_step": 72609, "epoch": 600} {"train_loss": -35.806461334228516, "global_step": 72610, "epoch": 600} {"train_loss": -35.4659423828125, "global_step": 72611, "epoch": 600} {"train_loss": -36.553688049316406, "global_step": 72612, "epoch": 600} {"train_loss": -35.28487777709961, "global_step": 72613, "epoch": 600} {"train_loss": -34.1986083984375, "global_step": 72614, "epoch": 600} {"train_loss": -35.2671012878418, "global_step": 72615, "epoch": 600} {"train_loss": -36.227718353271484, "global_step": 72616, "epoch": 600} {"train_loss": -36.87266159057617, "global_step": 72617, "epoch": 600} {"train_loss": -36.087345123291016, "global_step": 72618, "epoch": 600} {"train_loss": -32.917354583740234, "global_step": 72619, "epoch": 600} {"train_loss": -30.283950805664062, "global_step": 72620, "epoch": 600} {"train_loss": -29.188138961791992, "global_step": 72621, "epoch": 600} {"train_loss": -31.95233726501465, "global_step": 72622, "epoch": 600} {"train_loss": -36.78007888793945, "global_step": 72623, "epoch": 600} {"train_loss": -33.46744918823242, "global_step": 72624, "epoch": 600} {"train_loss": -35.283870697021484, "global_step": 72625, "epoch": 600} {"train_loss": -35.81378936767578, "global_step": 72626, "epoch": 600} {"train_loss": -33.660343170166016, "global_step": 72627, "epoch": 600} {"train_loss": -35.596370697021484, "global_step": 72628, "epoch": 600} {"train_loss": -33.817909240722656, "global_step": 72629, "epoch": 600} {"train_loss": -33.95230484008789, "global_step": 72630, "epoch": 600} {"train_loss": -35.898658752441406, "global_step": 72631, "epoch": 600} {"train_loss": -36.67221450805664, "global_step": 72632, "epoch": 600} {"train_loss": -36.01578903198242, "global_step": 72633, "epoch": 600} {"train_loss": -34.34678649902344, "global_step": 72634, "epoch": 600} {"train_loss": -36.04175567626953, "global_step": 72635, "epoch": 600} {"train_loss": -35.67155075073242, "global_step": 72636, "epoch": 600} {"train_loss": -36.63410568237305, "global_step": 72637, "epoch": 600} {"train_loss": -35.95243453979492, "global_step": 72638, "epoch": 600} {"train_loss": -36.717613220214844, "global_step": 72639, "epoch": 600} {"train_loss": -35.417335510253906, "global_step": 72640, "epoch": 600} {"train_loss": -36.69911575317383, "global_step": 72641, "epoch": 600} {"train_loss": -36.581016540527344, "global_step": 72642, "epoch": 600} {"train_loss": -36.311275482177734, "global_step": 72643, "epoch": 600} {"train_loss": -36.3395881652832, "global_step": 72644, "epoch": 600} {"train_loss": -36.234527587890625, "global_step": 72645, "epoch": 600} {"train_loss": -36.4495735168457, "global_step": 72646, "epoch": 600} {"train_loss": -36.9905891418457, "global_step": 72647, "epoch": 600} {"train_loss": -35.26819610595703, "global_step": 72648, "epoch": 600} {"train_loss": -36.59214782714844, "global_step": 72649, "epoch": 600} {"train_loss": -36.57242965698242, "global_step": 72650, "epoch": 600} {"train_loss": -37.13547134399414, "global_step": 72651, "epoch": 600} {"train_loss": -36.53459548950195, "global_step": 72652, "epoch": 600} {"train_loss": -37.0014533996582, "global_step": 72653, "epoch": 600} {"train_loss": -36.22353744506836, "global_step": 72654, "epoch": 600} {"train_loss": -36.279884338378906, "global_step": 72655, "epoch": 600} {"train_loss": -36.27633285522461, "global_step": 72656, "epoch": 600} {"train_loss": -37.02726364135742, "global_step": 72657, "epoch": 600} {"train_loss": -36.85625076293945, "global_step": 72658, "epoch": 600} {"train_loss": -36.47439193725586, "global_step": 72659, "epoch": 600} {"train_loss": -36.883113861083984, "global_step": 72660, "epoch": 600} {"train_loss": -37.10246658325195, "global_step": 72661, "epoch": 600} {"train_loss": -37.1599006652832, "global_step": 72662, "epoch": 600} {"train_loss": -36.31893539428711, "global_step": 72663, "epoch": 600} {"train_loss": -37.064876556396484, "global_step": 72664, "epoch": 600} {"train_loss": -37.188777923583984, "global_step": 72665, "epoch": 600} {"train_loss": -36.94524002075195, "global_step": 72666, "epoch": 600} {"train_loss": -37.123435974121094, "global_step": 72667, "epoch": 600} {"train_loss": -37.10720443725586, "global_step": 72668, "epoch": 600} {"train_loss": -37.29316329956055, "global_step": 72669, "epoch": 600} {"train_loss": -37.151424407958984, "global_step": 72670, "epoch": 600} {"train_loss": -37.06884002685547, "global_step": 72671, "epoch": 600} {"train_loss": -37.007667541503906, "global_step": 72672, "epoch": 600} {"train_loss": -37.2001953125, "global_step": 72673, "epoch": 600} {"train_loss": -37.145938873291016, "global_step": 72674, "epoch": 600} {"train_loss": -37.417171478271484, "global_step": 72675, "epoch": 600} {"train_loss": -37.48674392700195, "global_step": 72676, "epoch": 600} {"train_loss": -37.27532958984375, "global_step": 72677, "epoch": 600} {"train_loss": -37.485137939453125, "global_step": 72678, "epoch": 600} {"train_loss": -37.06864547729492, "global_step": 72679, "epoch": 600} {"train_loss": -37.51015090942383, "global_step": 72680, "epoch": 600} {"train_loss": -37.108585357666016, "global_step": 72681, "epoch": 600} {"train_loss": -37.04462814331055, "global_step": 72682, "epoch": 600} {"train_loss": -37.7583122253418, "global_step": 72683, "epoch": 600} {"train_loss": -36.72098922729492, "global_step": 72684, "epoch": 600} {"train_loss": -37.70915603637695, "global_step": 72685, "epoch": 600} {"train_loss": -36.7652587890625, "global_step": 72686, "epoch": 600} {"train_loss": -37.80950927734375, "global_step": 72687, "epoch": 600} {"train_loss": -37.847572326660156, "global_step": 72688, "epoch": 600} {"train_loss": -37.388607025146484, "global_step": 72689, "epoch": 600} {"train_loss": -36.94927215576172, "global_step": 72690, "epoch": 600} {"train_loss": -37.5295524597168, "global_step": 72691, "epoch": 600} {"train_loss": -37.91341781616211, "global_step": 72692, "epoch": 600} {"train_loss": -37.4839973449707, "global_step": 72693, "epoch": 600} {"train_loss": -37.09983825683594, "global_step": 72694, "epoch": 600} {"train_loss": -37.693603515625, "global_step": 72695, "epoch": 600} {"train_loss": -36.789546966552734, "global_step": 72696, "epoch": 600} {"train_loss": -37.5894660949707, "global_step": 72697, "epoch": 600} {"train_loss": -38.0455322265625, "global_step": 72698, "epoch": 600} {"train_loss": -37.139862060546875, "global_step": 72699, "epoch": 600} {"train_loss": -37.0750732421875, "global_step": 72700, "epoch": 600} {"train_loss": -35.70140075683594, "global_step": 72701, "epoch": 600} {"train_loss": -30.23771095275879, "global_step": 72702, "epoch": 600} {"train_loss": -18.588397979736328, "global_step": 72703, "epoch": 600} {"train_loss": -19.102537155151367, "global_step": 72704, "epoch": 600} {"train_loss": -30.936203002929688, "global_step": 72705, "epoch": 600} {"train_loss": -31.623682022094727, "global_step": 72706, "epoch": 600} {"train_loss": -30.650257110595703, "global_step": 72707, "epoch": 600} {"train_loss": -33.17173767089844, "global_step": 72708, "epoch": 600} {"train_loss": -26.3994197845459, "global_step": 72709, "epoch": 600} {"train_loss": -34.61479568481445, "global_step": 72710, "epoch": 600} {"train_loss": -32.6215705871582, "global_step": 72711, "epoch": 600} {"train_loss": -33.61454391479492, "global_step": 72712, "epoch": 600} {"train_loss": -34.40666580200195, "global_step": 72713, "epoch": 600} {"train_loss": -34.026275634765625, "global_step": 72714, "epoch": 600} {"train_loss": -35.33665466308594, "global_step": 72715, "epoch": 600} {"train_loss": -35.44308090209961, "global_step": 72716, "epoch": 600} {"train_loss": -34.78792953491211, "global_step": 72717, "epoch": 600} {"train_loss": -36.001708984375, "global_step": 72718, "epoch": 600} {"train_loss": -35.555416107177734, "global_step": 72719, "epoch": 600} {"train_loss": -35.57723604943141, "global_step": 72720, "epoch": 600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2597434.0} {"train_loss": -36.151763916015625, "global_step": 72721, "epoch": 601} {"train_loss": -35.90706253051758, "global_step": 72722, "epoch": 601} {"train_loss": -36.036983489990234, "global_step": 72723, "epoch": 601} {"train_loss": -36.158016204833984, "global_step": 72724, "epoch": 601} {"train_loss": -35.65386962890625, "global_step": 72725, "epoch": 601} {"train_loss": -35.68901443481445, "global_step": 72726, "epoch": 601} {"train_loss": -35.716976165771484, "global_step": 72727, "epoch": 601} {"train_loss": -36.33591842651367, "global_step": 72728, "epoch": 601} {"train_loss": -35.08440017700195, "global_step": 72729, "epoch": 601} {"train_loss": -36.32328414916992, "global_step": 72730, "epoch": 601} {"train_loss": -35.983131408691406, "global_step": 72731, "epoch": 601} {"train_loss": -36.53474426269531, "global_step": 72732, "epoch": 601} {"train_loss": -36.05056381225586, "global_step": 72733, "epoch": 601} {"train_loss": -36.27717971801758, "global_step": 72734, "epoch": 601} {"train_loss": -36.7613639831543, "global_step": 72735, "epoch": 601} {"train_loss": -36.602081298828125, "global_step": 72736, "epoch": 601} {"train_loss": -36.398738861083984, "global_step": 72737, "epoch": 601} {"train_loss": -36.12457275390625, "global_step": 72738, "epoch": 601} {"train_loss": -37.22068786621094, "global_step": 72739, "epoch": 601} {"train_loss": -36.798160552978516, "global_step": 72740, "epoch": 601} {"train_loss": -36.929481506347656, "global_step": 72741, "epoch": 601} {"train_loss": -37.04806900024414, "global_step": 72742, "epoch": 601} {"train_loss": -36.80532455444336, "global_step": 72743, "epoch": 601} {"train_loss": -36.9484977722168, "global_step": 72744, "epoch": 601} {"train_loss": -36.84273910522461, "global_step": 72745, "epoch": 601} {"train_loss": -36.807682037353516, "global_step": 72746, "epoch": 601} {"train_loss": -37.36287307739258, "global_step": 72747, "epoch": 601} {"train_loss": -37.17906188964844, "global_step": 72748, "epoch": 601} {"train_loss": -36.80723190307617, "global_step": 72749, "epoch": 601} {"train_loss": -37.5106086730957, "global_step": 72750, "epoch": 601} {"train_loss": -37.58280563354492, "global_step": 72751, "epoch": 601} {"train_loss": -37.37654495239258, "global_step": 72752, "epoch": 601} {"train_loss": -36.90267562866211, "global_step": 72753, "epoch": 601} {"train_loss": -37.1339225769043, "global_step": 72754, "epoch": 601} {"train_loss": -37.761634826660156, "global_step": 72755, "epoch": 601} {"train_loss": -37.78701400756836, "global_step": 72756, "epoch": 601} {"train_loss": -36.697444915771484, "global_step": 72757, "epoch": 601} {"train_loss": -37.48862838745117, "global_step": 72758, "epoch": 601} {"train_loss": -37.68394470214844, "global_step": 72759, "epoch": 601} {"train_loss": -37.44547653198242, "global_step": 72760, "epoch": 601} {"train_loss": -37.804115295410156, "global_step": 72761, "epoch": 601} {"train_loss": -38.02113342285156, "global_step": 72762, "epoch": 601} {"train_loss": -37.111419677734375, "global_step": 72763, "epoch": 601} {"train_loss": -37.11137008666992, "global_step": 72764, "epoch": 601} {"train_loss": -37.25273513793945, "global_step": 72765, "epoch": 601} {"train_loss": -36.733055114746094, "global_step": 72766, "epoch": 601} {"train_loss": -37.189849853515625, "global_step": 72767, "epoch": 601} {"train_loss": -37.06508255004883, "global_step": 72768, "epoch": 601} {"train_loss": -36.894046783447266, "global_step": 72769, "epoch": 601} {"train_loss": -37.29080581665039, "global_step": 72770, "epoch": 601} {"train_loss": -36.97787094116211, "global_step": 72771, "epoch": 601} {"train_loss": -37.691650390625, "global_step": 72772, "epoch": 601} {"train_loss": -37.083473205566406, "global_step": 72773, "epoch": 601} {"train_loss": -36.82073974609375, "global_step": 72774, "epoch": 601} {"train_loss": -36.04423522949219, "global_step": 72775, "epoch": 601} {"train_loss": -36.776824951171875, "global_step": 72776, "epoch": 601} {"train_loss": -37.52117919921875, "global_step": 72777, "epoch": 601} {"train_loss": -37.064998626708984, "global_step": 72778, "epoch": 601} {"train_loss": -37.02779006958008, "global_step": 72779, "epoch": 601} {"train_loss": -37.11846923828125, "global_step": 72780, "epoch": 601} {"train_loss": -36.63496017456055, "global_step": 72781, "epoch": 601} {"train_loss": -34.29851150512695, "global_step": 72782, "epoch": 601} {"train_loss": -29.950605392456055, "global_step": 72783, "epoch": 601} {"train_loss": -23.035009384155273, "global_step": 72784, "epoch": 601} {"train_loss": -25.563974380493164, "global_step": 72785, "epoch": 601} {"train_loss": -31.297470092773438, "global_step": 72786, "epoch": 601} {"train_loss": -36.44110107421875, "global_step": 72787, "epoch": 601} {"train_loss": -31.855056762695312, "global_step": 72788, "epoch": 601} {"train_loss": -34.97161865234375, "global_step": 72789, "epoch": 601} {"train_loss": -33.64241409301758, "global_step": 72790, "epoch": 601} {"train_loss": -35.60068893432617, "global_step": 72791, "epoch": 601} {"train_loss": -34.30878829956055, "global_step": 72792, "epoch": 601} {"train_loss": -36.306068420410156, "global_step": 72793, "epoch": 601} {"train_loss": -34.364906311035156, "global_step": 72794, "epoch": 601} {"train_loss": -35.03081130981445, "global_step": 72795, "epoch": 601} {"train_loss": -35.08230209350586, "global_step": 72796, "epoch": 601} {"train_loss": -34.68337631225586, "global_step": 72797, "epoch": 601} {"train_loss": -36.284908294677734, "global_step": 72798, "epoch": 601} {"train_loss": -34.985511779785156, "global_step": 72799, "epoch": 601} {"train_loss": -36.292091369628906, "global_step": 72800, "epoch": 601} {"train_loss": -36.296077728271484, "global_step": 72801, "epoch": 601} {"train_loss": -35.35897445678711, "global_step": 72802, "epoch": 601} {"train_loss": -36.58127212524414, "global_step": 72803, "epoch": 601} {"train_loss": -36.4688720703125, "global_step": 72804, "epoch": 601} {"train_loss": -36.37498092651367, "global_step": 72805, "epoch": 601} {"train_loss": -36.75069808959961, "global_step": 72806, "epoch": 601} {"train_loss": -36.637420654296875, "global_step": 72807, "epoch": 601} {"train_loss": -36.636138916015625, "global_step": 72808, "epoch": 601} {"train_loss": -36.777801513671875, "global_step": 72809, "epoch": 601} {"train_loss": -36.83213806152344, "global_step": 72810, "epoch": 601} {"train_loss": -36.656829833984375, "global_step": 72811, "epoch": 601} {"train_loss": -37.19552230834961, "global_step": 72812, "epoch": 601} {"train_loss": -36.02040100097656, "global_step": 72813, "epoch": 601} {"train_loss": -36.891963958740234, "global_step": 72814, "epoch": 601} {"train_loss": -36.835426330566406, "global_step": 72815, "epoch": 601} {"train_loss": -37.0421257019043, "global_step": 72816, "epoch": 601} {"train_loss": -37.05363845825195, "global_step": 72817, "epoch": 601} {"train_loss": -36.69150924682617, "global_step": 72818, "epoch": 601} {"train_loss": -37.548065185546875, "global_step": 72819, "epoch": 601} {"train_loss": -37.05183029174805, "global_step": 72820, "epoch": 601} {"train_loss": -36.87973403930664, "global_step": 72821, "epoch": 601} {"train_loss": -36.94315719604492, "global_step": 72822, "epoch": 601} {"train_loss": -36.67236328125, "global_step": 72823, "epoch": 601} {"train_loss": -36.99668502807617, "global_step": 72824, "epoch": 601} {"train_loss": -36.954071044921875, "global_step": 72825, "epoch": 601} {"train_loss": -37.384761810302734, "global_step": 72826, "epoch": 601} {"train_loss": -37.16484451293945, "global_step": 72827, "epoch": 601} {"train_loss": -37.420196533203125, "global_step": 72828, "epoch": 601} {"train_loss": -36.78946304321289, "global_step": 72829, "epoch": 601} {"train_loss": -37.32121276855469, "global_step": 72830, "epoch": 601} {"train_loss": -37.2590446472168, "global_step": 72831, "epoch": 601} {"train_loss": -37.12384033203125, "global_step": 72832, "epoch": 601} {"train_loss": -37.04470443725586, "global_step": 72833, "epoch": 601} {"train_loss": -37.07768249511719, "global_step": 72834, "epoch": 601} {"train_loss": -37.62080383300781, "global_step": 72835, "epoch": 601} {"train_loss": -37.70882797241211, "global_step": 72836, "epoch": 601} {"train_loss": -36.73712158203125, "global_step": 72837, "epoch": 601} {"train_loss": -37.00991439819336, "global_step": 72838, "epoch": 601} {"train_loss": -37.78310775756836, "global_step": 72839, "epoch": 601} {"train_loss": -36.59666061401367, "global_step": 72840, "epoch": 601} {"train_loss": -36.32241721980828, "global_step": 72841, "epoch": 601, "val_loss": 2728715.0} {"train_loss": -37.687198638916016, "global_step": 72842, "epoch": 602} {"train_loss": -37.092342376708984, "global_step": 72843, "epoch": 602} {"train_loss": -36.70612335205078, "global_step": 72844, "epoch": 602} {"train_loss": -37.65174102783203, "global_step": 72845, "epoch": 602} {"train_loss": -37.56356430053711, "global_step": 72846, "epoch": 602} {"train_loss": -37.743587493896484, "global_step": 72847, "epoch": 602} {"train_loss": -37.39473342895508, "global_step": 72848, "epoch": 602} {"train_loss": -36.93130874633789, "global_step": 72849, "epoch": 602} {"train_loss": -37.96731185913086, "global_step": 72850, "epoch": 602} {"train_loss": -37.34004592895508, "global_step": 72851, "epoch": 602} {"train_loss": -37.79363250732422, "global_step": 72852, "epoch": 602} {"train_loss": -37.39604187011719, "global_step": 72853, "epoch": 602} {"train_loss": -36.8031005859375, "global_step": 72854, "epoch": 602} {"train_loss": -34.4478759765625, "global_step": 72855, "epoch": 602} {"train_loss": -36.648799896240234, "global_step": 72856, "epoch": 602} {"train_loss": -37.412818908691406, "global_step": 72857, "epoch": 602} {"train_loss": -36.592411041259766, "global_step": 72858, "epoch": 602} {"train_loss": -36.2701530456543, "global_step": 72859, "epoch": 602} {"train_loss": -35.9841423034668, "global_step": 72860, "epoch": 602} {"train_loss": -36.74860763549805, "global_step": 72861, "epoch": 602} {"train_loss": -36.621803283691406, "global_step": 72862, "epoch": 602} {"train_loss": -37.005794525146484, "global_step": 72863, "epoch": 602} {"train_loss": -37.06718826293945, "global_step": 72864, "epoch": 602} {"train_loss": -35.543861389160156, "global_step": 72865, "epoch": 602} {"train_loss": -36.06888961791992, "global_step": 72866, "epoch": 602} {"train_loss": -35.999969482421875, "global_step": 72867, "epoch": 602} {"train_loss": -36.32168197631836, "global_step": 72868, "epoch": 602} {"train_loss": -37.24228286743164, "global_step": 72869, "epoch": 602} {"train_loss": -36.533077239990234, "global_step": 72870, "epoch": 602} {"train_loss": -37.17338943481445, "global_step": 72871, "epoch": 602} {"train_loss": -37.08248519897461, "global_step": 72872, "epoch": 602} {"train_loss": -37.13149642944336, "global_step": 72873, "epoch": 602} {"train_loss": -36.12398910522461, "global_step": 72874, "epoch": 602} {"train_loss": -36.381614685058594, "global_step": 72875, "epoch": 602} {"train_loss": -36.21328353881836, "global_step": 72876, "epoch": 602} {"train_loss": -37.421966552734375, "global_step": 72877, "epoch": 602} {"train_loss": -36.86516189575195, "global_step": 72878, "epoch": 602} {"train_loss": -36.54014205932617, "global_step": 72879, "epoch": 602} {"train_loss": -35.81403350830078, "global_step": 72880, "epoch": 602} {"train_loss": -36.83134078979492, "global_step": 72881, "epoch": 602} {"train_loss": -35.97564697265625, "global_step": 72882, "epoch": 602} {"train_loss": -36.39948272705078, "global_step": 72883, "epoch": 602} {"train_loss": -37.733184814453125, "global_step": 72884, "epoch": 602} {"train_loss": -36.27265548706055, "global_step": 72885, "epoch": 602} {"train_loss": -36.40153884887695, "global_step": 72886, "epoch": 602} {"train_loss": -35.31201171875, "global_step": 72887, "epoch": 602} {"train_loss": -35.90958786010742, "global_step": 72888, "epoch": 602} {"train_loss": -37.126827239990234, "global_step": 72889, "epoch": 602} {"train_loss": -37.002017974853516, "global_step": 72890, "epoch": 602} {"train_loss": -35.72901153564453, "global_step": 72891, "epoch": 602} {"train_loss": -34.90256881713867, "global_step": 72892, "epoch": 602} {"train_loss": -34.62437057495117, "global_step": 72893, "epoch": 602} {"train_loss": -35.868492126464844, "global_step": 72894, "epoch": 602} {"train_loss": -37.04072189331055, "global_step": 72895, "epoch": 602} {"train_loss": -37.097206115722656, "global_step": 72896, "epoch": 602} {"train_loss": -35.72483444213867, "global_step": 72897, "epoch": 602} {"train_loss": -35.854610443115234, "global_step": 72898, "epoch": 602} {"train_loss": -36.978450775146484, "global_step": 72899, "epoch": 602} {"train_loss": -37.342044830322266, "global_step": 72900, "epoch": 602} {"train_loss": -36.917457580566406, "global_step": 72901, "epoch": 602} {"train_loss": -37.07870101928711, "global_step": 72902, "epoch": 602} {"train_loss": -37.329830169677734, "global_step": 72903, "epoch": 602} {"train_loss": -37.55572509765625, "global_step": 72904, "epoch": 602} {"train_loss": -37.340301513671875, "global_step": 72905, "epoch": 602} {"train_loss": -37.14059066772461, "global_step": 72906, "epoch": 602} {"train_loss": -37.75490188598633, "global_step": 72907, "epoch": 602} {"train_loss": -37.582881927490234, "global_step": 72908, "epoch": 602} {"train_loss": -37.55433654785156, "global_step": 72909, "epoch": 602} {"train_loss": -37.529842376708984, "global_step": 72910, "epoch": 602} {"train_loss": -37.627227783203125, "global_step": 72911, "epoch": 602} {"train_loss": -37.43899154663086, "global_step": 72912, "epoch": 602} {"train_loss": -37.68992233276367, "global_step": 72913, "epoch": 602} {"train_loss": -37.815643310546875, "global_step": 72914, "epoch": 602} {"train_loss": -37.07339096069336, "global_step": 72915, "epoch": 602} {"train_loss": -37.694889068603516, "global_step": 72916, "epoch": 602} {"train_loss": -37.639495849609375, "global_step": 72917, "epoch": 602} {"train_loss": -38.15576934814453, "global_step": 72918, "epoch": 602} {"train_loss": -37.27402877807617, "global_step": 72919, "epoch": 602} {"train_loss": -36.828887939453125, "global_step": 72920, "epoch": 602} {"train_loss": -36.9144172668457, "global_step": 72921, "epoch": 602} {"train_loss": -37.571224212646484, "global_step": 72922, "epoch": 602} {"train_loss": -37.36286544799805, "global_step": 72923, "epoch": 602} {"train_loss": -36.91109085083008, "global_step": 72924, "epoch": 602} {"train_loss": -37.841243743896484, "global_step": 72925, "epoch": 602} {"train_loss": -36.102027893066406, "global_step": 72926, "epoch": 602} {"train_loss": -35.21436309814453, "global_step": 72927, "epoch": 602} {"train_loss": -36.5695686340332, "global_step": 72928, "epoch": 602} {"train_loss": -35.022308349609375, "global_step": 72929, "epoch": 602} {"train_loss": -35.56618881225586, "global_step": 72930, "epoch": 602} {"train_loss": -37.338680267333984, "global_step": 72931, "epoch": 602} {"train_loss": -38.101234436035156, "global_step": 72932, "epoch": 602} {"train_loss": -37.135311126708984, "global_step": 72933, "epoch": 602} {"train_loss": -36.92086410522461, "global_step": 72934, "epoch": 602} {"train_loss": -37.38579177856445, "global_step": 72935, "epoch": 602} {"train_loss": -37.4623908996582, "global_step": 72936, "epoch": 602} {"train_loss": -37.686927795410156, "global_step": 72937, "epoch": 602} {"train_loss": -37.96124267578125, "global_step": 72938, "epoch": 602} {"train_loss": -37.54764938354492, "global_step": 72939, "epoch": 602} {"train_loss": -37.8049201965332, "global_step": 72940, "epoch": 602} {"train_loss": -37.24085998535156, "global_step": 72941, "epoch": 602} {"train_loss": -37.21340560913086, "global_step": 72942, "epoch": 602} {"train_loss": -37.52667236328125, "global_step": 72943, "epoch": 602} {"train_loss": -37.8955192565918, "global_step": 72944, "epoch": 602} {"train_loss": -37.72483444213867, "global_step": 72945, "epoch": 602} {"train_loss": -37.36289978027344, "global_step": 72946, "epoch": 602} {"train_loss": -37.74264144897461, "global_step": 72947, "epoch": 602} {"train_loss": -37.858177185058594, "global_step": 72948, "epoch": 602} {"train_loss": -38.210227966308594, "global_step": 72949, "epoch": 602} {"train_loss": -38.159034729003906, "global_step": 72950, "epoch": 602} {"train_loss": -38.1097412109375, "global_step": 72951, "epoch": 602} {"train_loss": -37.8763427734375, "global_step": 72952, "epoch": 602} {"train_loss": -38.157100677490234, "global_step": 72953, "epoch": 602} {"train_loss": -38.126529693603516, "global_step": 72954, "epoch": 602} {"train_loss": -37.5102653503418, "global_step": 72955, "epoch": 602} {"train_loss": -37.19594192504883, "global_step": 72956, "epoch": 602} {"train_loss": -36.454833984375, "global_step": 72957, "epoch": 602} {"train_loss": -34.01893615722656, "global_step": 72958, "epoch": 602} {"train_loss": -33.9458122253418, "global_step": 72959, "epoch": 602} {"train_loss": -35.87237548828125, "global_step": 72960, "epoch": 602} {"train_loss": -35.553550720214844, "global_step": 72961, "epoch": 602} {"train_loss": -36.90603861532921, "global_step": 72962, "epoch": 602, "val_loss": 2544909.75} {"train_loss": -36.25238800048828, "global_step": 72963, "epoch": 603} {"train_loss": -36.57158660888672, "global_step": 72964, "epoch": 603} {"train_loss": -35.6851921081543, "global_step": 72965, "epoch": 603} {"train_loss": -37.2829704284668, "global_step": 72966, "epoch": 603} {"train_loss": -36.61283493041992, "global_step": 72967, "epoch": 603} {"train_loss": -37.209205627441406, "global_step": 72968, "epoch": 603} {"train_loss": -36.68464279174805, "global_step": 72969, "epoch": 603} {"train_loss": -37.33925247192383, "global_step": 72970, "epoch": 603} {"train_loss": -36.31984329223633, "global_step": 72971, "epoch": 603} {"train_loss": -36.440887451171875, "global_step": 72972, "epoch": 603} {"train_loss": -37.08367919921875, "global_step": 72973, "epoch": 603} {"train_loss": -36.87630844116211, "global_step": 72974, "epoch": 603} {"train_loss": -37.7152099609375, "global_step": 72975, "epoch": 603} {"train_loss": -36.918025970458984, "global_step": 72976, "epoch": 603} {"train_loss": -37.38218307495117, "global_step": 72977, "epoch": 603} {"train_loss": -37.89994430541992, "global_step": 72978, "epoch": 603} {"train_loss": -37.04521560668945, "global_step": 72979, "epoch": 603} {"train_loss": -37.21165084838867, "global_step": 72980, "epoch": 603} {"train_loss": -37.20827865600586, "global_step": 72981, "epoch": 603} {"train_loss": -37.37486267089844, "global_step": 72982, "epoch": 603} {"train_loss": -36.70857620239258, "global_step": 72983, "epoch": 603} {"train_loss": -34.85040283203125, "global_step": 72984, "epoch": 603} {"train_loss": -34.800167083740234, "global_step": 72985, "epoch": 603} {"train_loss": -36.52692413330078, "global_step": 72986, "epoch": 603} {"train_loss": -37.309539794921875, "global_step": 72987, "epoch": 603} {"train_loss": -37.367340087890625, "global_step": 72988, "epoch": 603} {"train_loss": -36.310768127441406, "global_step": 72989, "epoch": 603} {"train_loss": -36.54661178588867, "global_step": 72990, "epoch": 603} {"train_loss": -37.77383804321289, "global_step": 72991, "epoch": 603} {"train_loss": -37.41242218017578, "global_step": 72992, "epoch": 603} {"train_loss": -36.28581619262695, "global_step": 72993, "epoch": 603} {"train_loss": -37.32098388671875, "global_step": 72994, "epoch": 603} {"train_loss": -37.8092041015625, "global_step": 72995, "epoch": 603} {"train_loss": -37.26997756958008, "global_step": 72996, "epoch": 603} {"train_loss": -37.577510833740234, "global_step": 72997, "epoch": 603} {"train_loss": -37.377349853515625, "global_step": 72998, "epoch": 603} {"train_loss": -37.259246826171875, "global_step": 72999, "epoch": 603} {"train_loss": -37.63358688354492, "global_step": 73000, "epoch": 603} {"train_loss": -36.523895263671875, "global_step": 73001, "epoch": 603} {"train_loss": -36.846065521240234, "global_step": 73002, "epoch": 603} {"train_loss": -37.091732025146484, "global_step": 73003, "epoch": 603} {"train_loss": -36.95015335083008, "global_step": 73004, "epoch": 603} {"train_loss": -37.79330825805664, "global_step": 73005, "epoch": 603} {"train_loss": -38.44157791137695, "global_step": 73006, "epoch": 603} {"train_loss": -36.49158477783203, "global_step": 73007, "epoch": 603} {"train_loss": -37.46233367919922, "global_step": 73008, "epoch": 603} {"train_loss": -37.934486389160156, "global_step": 73009, "epoch": 603} {"train_loss": -37.356910705566406, "global_step": 73010, "epoch": 603} {"train_loss": -38.15970993041992, "global_step": 73011, "epoch": 603} {"train_loss": -37.93102264404297, "global_step": 73012, "epoch": 603} {"train_loss": -37.76530838012695, "global_step": 73013, "epoch": 603} {"train_loss": -38.062583923339844, "global_step": 73014, "epoch": 603} {"train_loss": -37.037200927734375, "global_step": 73015, "epoch": 603} {"train_loss": -37.336116790771484, "global_step": 73016, "epoch": 603} {"train_loss": -36.22341537475586, "global_step": 73017, "epoch": 603} {"train_loss": -36.51200866699219, "global_step": 73018, "epoch": 603} {"train_loss": -36.1557731628418, "global_step": 73019, "epoch": 603} {"train_loss": -36.8966178894043, "global_step": 73020, "epoch": 603} {"train_loss": -35.126800537109375, "global_step": 73021, "epoch": 603} {"train_loss": -33.50873947143555, "global_step": 73022, "epoch": 603} {"train_loss": -33.08938217163086, "global_step": 73023, "epoch": 603} {"train_loss": -29.55689811706543, "global_step": 73024, "epoch": 603} {"train_loss": -27.991107940673828, "global_step": 73025, "epoch": 603} {"train_loss": -33.90451431274414, "global_step": 73026, "epoch": 603} {"train_loss": -35.80010986328125, "global_step": 73027, "epoch": 603} {"train_loss": -30.452381134033203, "global_step": 73028, "epoch": 603} {"train_loss": -36.91636276245117, "global_step": 73029, "epoch": 603} {"train_loss": -34.8970832824707, "global_step": 73030, "epoch": 603} {"train_loss": -33.003875732421875, "global_step": 73031, "epoch": 603} {"train_loss": -36.54608917236328, "global_step": 73032, "epoch": 603} {"train_loss": -35.307247161865234, "global_step": 73033, "epoch": 603} {"train_loss": -36.24139404296875, "global_step": 73034, "epoch": 603} {"train_loss": -35.809688568115234, "global_step": 73035, "epoch": 603} {"train_loss": -36.26955795288086, "global_step": 73036, "epoch": 603} {"train_loss": -36.875205993652344, "global_step": 73037, "epoch": 603} {"train_loss": -36.92416763305664, "global_step": 73038, "epoch": 603} {"train_loss": -36.66805648803711, "global_step": 73039, "epoch": 603} {"train_loss": -35.78722381591797, "global_step": 73040, "epoch": 603} {"train_loss": -36.82610321044922, "global_step": 73041, "epoch": 603} {"train_loss": -37.21626663208008, "global_step": 73042, "epoch": 603} {"train_loss": -36.92832565307617, "global_step": 73043, "epoch": 603} {"train_loss": -37.26866912841797, "global_step": 73044, "epoch": 603} {"train_loss": -37.166748046875, "global_step": 73045, "epoch": 603} {"train_loss": -36.9755859375, "global_step": 73046, "epoch": 603} {"train_loss": -37.40568161010742, "global_step": 73047, "epoch": 603} {"train_loss": -37.07448959350586, "global_step": 73048, "epoch": 603} {"train_loss": -37.52949523925781, "global_step": 73049, "epoch": 603} {"train_loss": -37.279605865478516, "global_step": 73050, "epoch": 603} {"train_loss": -37.6917839050293, "global_step": 73051, "epoch": 603} {"train_loss": -37.50740432739258, "global_step": 73052, "epoch": 603} {"train_loss": -37.7352294921875, "global_step": 73053, "epoch": 603} {"train_loss": -37.54854965209961, "global_step": 73054, "epoch": 603} {"train_loss": -37.775447845458984, "global_step": 73055, "epoch": 603} {"train_loss": -37.5555419921875, "global_step": 73056, "epoch": 603} {"train_loss": -38.065216064453125, "global_step": 73057, "epoch": 603} {"train_loss": -37.63416290283203, "global_step": 73058, "epoch": 603} {"train_loss": -37.8710823059082, "global_step": 73059, "epoch": 603} {"train_loss": -37.88327407836914, "global_step": 73060, "epoch": 603} {"train_loss": -38.096771240234375, "global_step": 73061, "epoch": 603} {"train_loss": -37.87347412109375, "global_step": 73062, "epoch": 603} {"train_loss": -37.49720001220703, "global_step": 73063, "epoch": 603} {"train_loss": -37.60980987548828, "global_step": 73064, "epoch": 603} {"train_loss": -37.98276901245117, "global_step": 73065, "epoch": 603} {"train_loss": -38.210662841796875, "global_step": 73066, "epoch": 603} {"train_loss": -38.00684356689453, "global_step": 73067, "epoch": 603} {"train_loss": -37.75838088989258, "global_step": 73068, "epoch": 603} {"train_loss": -37.740901947021484, "global_step": 73069, "epoch": 603} {"train_loss": -37.612396240234375, "global_step": 73070, "epoch": 603} {"train_loss": -37.55178451538086, "global_step": 73071, "epoch": 603} {"train_loss": -36.95451736450195, "global_step": 73072, "epoch": 603} {"train_loss": -37.59661102294922, "global_step": 73073, "epoch": 603} {"train_loss": -38.28487014770508, "global_step": 73074, "epoch": 603} {"train_loss": -37.8769416809082, "global_step": 73075, "epoch": 603} {"train_loss": -37.12437057495117, "global_step": 73076, "epoch": 603} {"train_loss": -37.613250732421875, "global_step": 73077, "epoch": 603} {"train_loss": -38.39222717285156, "global_step": 73078, "epoch": 603} {"train_loss": -37.92086410522461, "global_step": 73079, "epoch": 603} {"train_loss": -37.065032958984375, "global_step": 73080, "epoch": 603} {"train_loss": -37.36455535888672, "global_step": 73081, "epoch": 603} {"train_loss": -36.79539108276367, "global_step": 73082, "epoch": 603} {"train_loss": -36.80296718187569, "global_step": 73083, "epoch": 603, "val_loss": 2582095.25} {"train_loss": -37.775550842285156, "global_step": 73084, "epoch": 604} {"train_loss": -37.41101837158203, "global_step": 73085, "epoch": 604} {"train_loss": -35.2628059387207, "global_step": 73086, "epoch": 604} {"train_loss": -36.578468322753906, "global_step": 73087, "epoch": 604} {"train_loss": -34.805171966552734, "global_step": 73088, "epoch": 604} {"train_loss": -34.18061828613281, "global_step": 73089, "epoch": 604} {"train_loss": -36.12765121459961, "global_step": 73090, "epoch": 604} {"train_loss": -37.044185638427734, "global_step": 73091, "epoch": 604} {"train_loss": -32.8722038269043, "global_step": 73092, "epoch": 604} {"train_loss": -36.43792724609375, "global_step": 73093, "epoch": 604} {"train_loss": -34.18706130981445, "global_step": 73094, "epoch": 604} {"train_loss": -36.587066650390625, "global_step": 73095, "epoch": 604} {"train_loss": -32.12459945678711, "global_step": 73096, "epoch": 604} {"train_loss": -34.98861312866211, "global_step": 73097, "epoch": 604} {"train_loss": -28.09286880493164, "global_step": 73098, "epoch": 604} {"train_loss": -35.908958435058594, "global_step": 73099, "epoch": 604} {"train_loss": -32.88385772705078, "global_step": 73100, "epoch": 604} {"train_loss": -34.3569221496582, "global_step": 73101, "epoch": 604} {"train_loss": -37.33543014526367, "global_step": 73102, "epoch": 604} {"train_loss": -35.736873626708984, "global_step": 73103, "epoch": 604} {"train_loss": -34.09859085083008, "global_step": 73104, "epoch": 604} {"train_loss": -36.63788986206055, "global_step": 73105, "epoch": 604} {"train_loss": -37.39430618286133, "global_step": 73106, "epoch": 604} {"train_loss": -36.4984016418457, "global_step": 73107, "epoch": 604} {"train_loss": -35.782840728759766, "global_step": 73108, "epoch": 604} {"train_loss": -37.02971267700195, "global_step": 73109, "epoch": 604} {"train_loss": -36.93666458129883, "global_step": 73110, "epoch": 604} {"train_loss": -37.68720626831055, "global_step": 73111, "epoch": 604} {"train_loss": -36.97597122192383, "global_step": 73112, "epoch": 604} {"train_loss": -37.277427673339844, "global_step": 73113, "epoch": 604} {"train_loss": -36.7503662109375, "global_step": 73114, "epoch": 604} {"train_loss": -36.95207977294922, "global_step": 73115, "epoch": 604} {"train_loss": -37.72831726074219, "global_step": 73116, "epoch": 604} {"train_loss": -38.19806671142578, "global_step": 73117, "epoch": 604} {"train_loss": -36.55475997924805, "global_step": 73118, "epoch": 604} {"train_loss": -36.07162094116211, "global_step": 73119, "epoch": 604} {"train_loss": -37.614131927490234, "global_step": 73120, "epoch": 604} {"train_loss": -36.424739837646484, "global_step": 73121, "epoch": 604} {"train_loss": -36.53141784667969, "global_step": 73122, "epoch": 604} {"train_loss": -36.7457275390625, "global_step": 73123, "epoch": 604} {"train_loss": -37.47719955444336, "global_step": 73124, "epoch": 604} {"train_loss": -37.10187530517578, "global_step": 73125, "epoch": 604} {"train_loss": -36.88685989379883, "global_step": 73126, "epoch": 604} {"train_loss": -37.36281967163086, "global_step": 73127, "epoch": 604} {"train_loss": -37.000946044921875, "global_step": 73128, "epoch": 604} {"train_loss": -37.598323822021484, "global_step": 73129, "epoch": 604} {"train_loss": -37.87275314331055, "global_step": 73130, "epoch": 604} {"train_loss": -37.90778350830078, "global_step": 73131, "epoch": 604} {"train_loss": -37.90515899658203, "global_step": 73132, "epoch": 604} {"train_loss": -37.89948654174805, "global_step": 73133, "epoch": 604} {"train_loss": -37.90286636352539, "global_step": 73134, "epoch": 604} {"train_loss": -37.635658264160156, "global_step": 73135, "epoch": 604} {"train_loss": -38.04412841796875, "global_step": 73136, "epoch": 604} {"train_loss": -37.53129196166992, "global_step": 73137, "epoch": 604} {"train_loss": -38.11915969848633, "global_step": 73138, "epoch": 604} {"train_loss": -37.28190612792969, "global_step": 73139, "epoch": 604} {"train_loss": -37.74567794799805, "global_step": 73140, "epoch": 604} {"train_loss": -37.37959671020508, "global_step": 73141, "epoch": 604} {"train_loss": -37.846309661865234, "global_step": 73142, "epoch": 604} {"train_loss": -37.33820343017578, "global_step": 73143, "epoch": 604} {"train_loss": -37.92271041870117, "global_step": 73144, "epoch": 604} {"train_loss": -37.80096435546875, "global_step": 73145, "epoch": 604} {"train_loss": -37.7733039855957, "global_step": 73146, "epoch": 604} {"train_loss": -37.976680755615234, "global_step": 73147, "epoch": 604} {"train_loss": -37.667598724365234, "global_step": 73148, "epoch": 604} {"train_loss": -36.99055099487305, "global_step": 73149, "epoch": 604} {"train_loss": -34.635799407958984, "global_step": 73150, "epoch": 604} {"train_loss": -30.214765548706055, "global_step": 73151, "epoch": 604} {"train_loss": -28.43903923034668, "global_step": 73152, "epoch": 604} {"train_loss": -25.889310836791992, "global_step": 73153, "epoch": 604} {"train_loss": -32.01034164428711, "global_step": 73154, "epoch": 604} {"train_loss": -36.94050979614258, "global_step": 73155, "epoch": 604} {"train_loss": -34.63002395629883, "global_step": 73156, "epoch": 604} {"train_loss": -35.978519439697266, "global_step": 73157, "epoch": 604} {"train_loss": -35.69999313354492, "global_step": 73158, "epoch": 604} {"train_loss": -35.22774124145508, "global_step": 73159, "epoch": 604} {"train_loss": -35.7867431640625, "global_step": 73160, "epoch": 604} {"train_loss": -35.81915283203125, "global_step": 73161, "epoch": 604} {"train_loss": -35.66948318481445, "global_step": 73162, "epoch": 604} {"train_loss": -37.15808868408203, "global_step": 73163, "epoch": 604} {"train_loss": -36.3603515625, "global_step": 73164, "epoch": 604} {"train_loss": -36.49293899536133, "global_step": 73165, "epoch": 604} {"train_loss": -36.95840072631836, "global_step": 73166, "epoch": 604} {"train_loss": -37.450538635253906, "global_step": 73167, "epoch": 604} {"train_loss": -36.488677978515625, "global_step": 73168, "epoch": 604} {"train_loss": -37.21737289428711, "global_step": 73169, "epoch": 604} {"train_loss": -36.62028121948242, "global_step": 73170, "epoch": 604} {"train_loss": -36.88269805908203, "global_step": 73171, "epoch": 604} {"train_loss": -36.85334014892578, "global_step": 73172, "epoch": 604} {"train_loss": -36.56232452392578, "global_step": 73173, "epoch": 604} {"train_loss": -37.41474151611328, "global_step": 73174, "epoch": 604} {"train_loss": -36.730587005615234, "global_step": 73175, "epoch": 604} {"train_loss": -36.32249069213867, "global_step": 73176, "epoch": 604} {"train_loss": -36.751033782958984, "global_step": 73177, "epoch": 604} {"train_loss": -35.482765197753906, "global_step": 73178, "epoch": 604} {"train_loss": -36.81025314331055, "global_step": 73179, "epoch": 604} {"train_loss": -36.66541290283203, "global_step": 73180, "epoch": 604} {"train_loss": -37.0037841796875, "global_step": 73181, "epoch": 604} {"train_loss": -36.60341262817383, "global_step": 73182, "epoch": 604} {"train_loss": -37.0499382019043, "global_step": 73183, "epoch": 604} {"train_loss": -37.328365325927734, "global_step": 73184, "epoch": 604} {"train_loss": -36.85762023925781, "global_step": 73185, "epoch": 604} {"train_loss": -37.86112594604492, "global_step": 73186, "epoch": 604} {"train_loss": -36.88556671142578, "global_step": 73187, "epoch": 604} {"train_loss": -37.602996826171875, "global_step": 73188, "epoch": 604} {"train_loss": -37.32099533081055, "global_step": 73189, "epoch": 604} {"train_loss": -37.15019989013672, "global_step": 73190, "epoch": 604} {"train_loss": -37.29545211791992, "global_step": 73191, "epoch": 604} {"train_loss": -37.6291618347168, "global_step": 73192, "epoch": 604} {"train_loss": -36.957027435302734, "global_step": 73193, "epoch": 604} {"train_loss": -37.445556640625, "global_step": 73194, "epoch": 604} {"train_loss": -37.1761589050293, "global_step": 73195, "epoch": 604} {"train_loss": -37.52064895629883, "global_step": 73196, "epoch": 604} {"train_loss": -37.33967208862305, "global_step": 73197, "epoch": 604} {"train_loss": -36.910118103027344, "global_step": 73198, "epoch": 604} {"train_loss": -36.961090087890625, "global_step": 73199, "epoch": 604} {"train_loss": -35.98268127441406, "global_step": 73200, "epoch": 604} {"train_loss": -36.39081954956055, "global_step": 73201, "epoch": 604} {"train_loss": -37.1485710144043, "global_step": 73202, "epoch": 604} {"train_loss": -37.8385009765625, "global_step": 73203, "epoch": 604} {"train_loss": -36.38711669228294, "global_step": 73204, "epoch": 604, "val_loss": 2581330.5} {"train_loss": -36.3043212890625, "global_step": 73205, "epoch": 605} {"train_loss": -36.39865493774414, "global_step": 73206, "epoch": 605} {"train_loss": -37.9092903137207, "global_step": 73207, "epoch": 605} {"train_loss": -37.33781814575195, "global_step": 73208, "epoch": 605} {"train_loss": -37.838191986083984, "global_step": 73209, "epoch": 605} {"train_loss": -38.02803421020508, "global_step": 73210, "epoch": 605} {"train_loss": -38.254127502441406, "global_step": 73211, "epoch": 605} {"train_loss": -38.16291046142578, "global_step": 73212, "epoch": 605} {"train_loss": -37.5075798034668, "global_step": 73213, "epoch": 605} {"train_loss": -37.526851654052734, "global_step": 73214, "epoch": 605} {"train_loss": -37.66459655761719, "global_step": 73215, "epoch": 605} {"train_loss": -38.14397048950195, "global_step": 73216, "epoch": 605} {"train_loss": -37.91558837890625, "global_step": 73217, "epoch": 605} {"train_loss": -37.71781539916992, "global_step": 73218, "epoch": 605} {"train_loss": -37.682533264160156, "global_step": 73219, "epoch": 605} {"train_loss": -37.95076370239258, "global_step": 73220, "epoch": 605} {"train_loss": -37.505611419677734, "global_step": 73221, "epoch": 605} {"train_loss": -38.178428649902344, "global_step": 73222, "epoch": 605} {"train_loss": -38.41355514526367, "global_step": 73223, "epoch": 605} {"train_loss": -37.76719284057617, "global_step": 73224, "epoch": 605} {"train_loss": -38.026214599609375, "global_step": 73225, "epoch": 605} {"train_loss": -38.11334228515625, "global_step": 73226, "epoch": 605} {"train_loss": -38.37849807739258, "global_step": 73227, "epoch": 605} {"train_loss": -37.54115676879883, "global_step": 73228, "epoch": 605} {"train_loss": -37.968414306640625, "global_step": 73229, "epoch": 605} {"train_loss": -37.796241760253906, "global_step": 73230, "epoch": 605} {"train_loss": -38.46004104614258, "global_step": 73231, "epoch": 605} {"train_loss": -37.36461639404297, "global_step": 73232, "epoch": 605} {"train_loss": -37.760746002197266, "global_step": 73233, "epoch": 605} {"train_loss": -36.581214904785156, "global_step": 73234, "epoch": 605} {"train_loss": -36.59794616699219, "global_step": 73235, "epoch": 605} {"train_loss": -34.42338180541992, "global_step": 73236, "epoch": 605} {"train_loss": -33.830238342285156, "global_step": 73237, "epoch": 605} {"train_loss": -35.947566986083984, "global_step": 73238, "epoch": 605} {"train_loss": -37.201541900634766, "global_step": 73239, "epoch": 605} {"train_loss": -35.82304763793945, "global_step": 73240, "epoch": 605} {"train_loss": -35.297603607177734, "global_step": 73241, "epoch": 605} {"train_loss": -36.85636520385742, "global_step": 73242, "epoch": 605} {"train_loss": -36.12031173706055, "global_step": 73243, "epoch": 605} {"train_loss": -35.5806770324707, "global_step": 73244, "epoch": 605} {"train_loss": -36.9980354309082, "global_step": 73245, "epoch": 605} {"train_loss": -36.614723205566406, "global_step": 73246, "epoch": 605} {"train_loss": -37.13167953491211, "global_step": 73247, "epoch": 605} {"train_loss": -35.97987365722656, "global_step": 73248, "epoch": 605} {"train_loss": -36.51113510131836, "global_step": 73249, "epoch": 605} {"train_loss": -37.39453887939453, "global_step": 73250, "epoch": 605} {"train_loss": -35.16048049926758, "global_step": 73251, "epoch": 605} {"train_loss": -33.1379280090332, "global_step": 73252, "epoch": 605} {"train_loss": -34.51796340942383, "global_step": 73253, "epoch": 605} {"train_loss": -37.0421257019043, "global_step": 73254, "epoch": 605} {"train_loss": -35.76265335083008, "global_step": 73255, "epoch": 605} {"train_loss": -35.82978439331055, "global_step": 73256, "epoch": 605} {"train_loss": -36.437782287597656, "global_step": 73257, "epoch": 605} {"train_loss": -36.342830657958984, "global_step": 73258, "epoch": 605} {"train_loss": -36.928096771240234, "global_step": 73259, "epoch": 605} {"train_loss": -36.29034423828125, "global_step": 73260, "epoch": 605} {"train_loss": -36.58256912231445, "global_step": 73261, "epoch": 605} {"train_loss": -37.48674392700195, "global_step": 73262, "epoch": 605} {"train_loss": -36.61326217651367, "global_step": 73263, "epoch": 605} {"train_loss": -37.23550033569336, "global_step": 73264, "epoch": 605} {"train_loss": -36.82954025268555, "global_step": 73265, "epoch": 605} {"train_loss": -36.113037109375, "global_step": 73266, "epoch": 605} {"train_loss": -35.53885269165039, "global_step": 73267, "epoch": 605} {"train_loss": -36.030860900878906, "global_step": 73268, "epoch": 605} {"train_loss": -36.59078598022461, "global_step": 73269, "epoch": 605} {"train_loss": -37.03070831298828, "global_step": 73270, "epoch": 605} {"train_loss": -36.644195556640625, "global_step": 73271, "epoch": 605} {"train_loss": -36.781898498535156, "global_step": 73272, "epoch": 605} {"train_loss": -36.488616943359375, "global_step": 73273, "epoch": 605} {"train_loss": -35.36292266845703, "global_step": 73274, "epoch": 605} {"train_loss": -36.1132698059082, "global_step": 73275, "epoch": 605} {"train_loss": -36.530189514160156, "global_step": 73276, "epoch": 605} {"train_loss": -36.46461868286133, "global_step": 73277, "epoch": 605} {"train_loss": -36.97212600708008, "global_step": 73278, "epoch": 605} {"train_loss": -36.64418411254883, "global_step": 73279, "epoch": 605} {"train_loss": -36.86515426635742, "global_step": 73280, "epoch": 605} {"train_loss": -37.5035514831543, "global_step": 73281, "epoch": 605} {"train_loss": -36.03713607788086, "global_step": 73282, "epoch": 605} {"train_loss": -36.82695388793945, "global_step": 73283, "epoch": 605} {"train_loss": -37.2501220703125, "global_step": 73284, "epoch": 605} {"train_loss": -37.60438919067383, "global_step": 73285, "epoch": 605} {"train_loss": -36.94179153442383, "global_step": 73286, "epoch": 605} {"train_loss": -37.11186218261719, "global_step": 73287, "epoch": 605} {"train_loss": -37.89724349975586, "global_step": 73288, "epoch": 605} {"train_loss": -37.285587310791016, "global_step": 73289, "epoch": 605} {"train_loss": -36.905738830566406, "global_step": 73290, "epoch": 605} {"train_loss": -37.9139289855957, "global_step": 73291, "epoch": 605} {"train_loss": -37.2678108215332, "global_step": 73292, "epoch": 605} {"train_loss": -37.57748031616211, "global_step": 73293, "epoch": 605} {"train_loss": -37.96738815307617, "global_step": 73294, "epoch": 605} {"train_loss": -36.73020553588867, "global_step": 73295, "epoch": 605} {"train_loss": -36.74259567260742, "global_step": 73296, "epoch": 605} {"train_loss": -37.67584991455078, "global_step": 73297, "epoch": 605} {"train_loss": -37.455684661865234, "global_step": 73298, "epoch": 605} {"train_loss": -37.72083282470703, "global_step": 73299, "epoch": 605} {"train_loss": -37.72459411621094, "global_step": 73300, "epoch": 605} {"train_loss": -37.64393615722656, "global_step": 73301, "epoch": 605} {"train_loss": -37.835105895996094, "global_step": 73302, "epoch": 605} {"train_loss": -37.8529052734375, "global_step": 73303, "epoch": 605} {"train_loss": -37.62842559814453, "global_step": 73304, "epoch": 605} {"train_loss": -38.249752044677734, "global_step": 73305, "epoch": 605} {"train_loss": -36.873077392578125, "global_step": 73306, "epoch": 605} {"train_loss": -37.898433685302734, "global_step": 73307, "epoch": 605} {"train_loss": -38.09440231323242, "global_step": 73308, "epoch": 605} {"train_loss": -37.67378616333008, "global_step": 73309, "epoch": 605} {"train_loss": -37.40237045288086, "global_step": 73310, "epoch": 605} {"train_loss": -38.112701416015625, "global_step": 73311, "epoch": 605} {"train_loss": -37.441802978515625, "global_step": 73312, "epoch": 605} {"train_loss": -36.57893753051758, "global_step": 73313, "epoch": 605} {"train_loss": -37.662628173828125, "global_step": 73314, "epoch": 605} {"train_loss": -36.784183502197266, "global_step": 73315, "epoch": 605} {"train_loss": -37.88224411010742, "global_step": 73316, "epoch": 605} {"train_loss": -36.596824645996094, "global_step": 73317, "epoch": 605} {"train_loss": -35.23566818237305, "global_step": 73318, "epoch": 605} {"train_loss": -31.707700729370117, "global_step": 73319, "epoch": 605} {"train_loss": -35.970001220703125, "global_step": 73320, "epoch": 605} {"train_loss": -35.655792236328125, "global_step": 73321, "epoch": 605} {"train_loss": -35.83715057373047, "global_step": 73322, "epoch": 605} {"train_loss": -35.830684661865234, "global_step": 73323, "epoch": 605} {"train_loss": -36.40098571777344, "global_step": 73324, "epoch": 605} {"train_loss": -36.912368695598005, "global_step": 73325, "epoch": 605, "val_loss": 2658993.75} {"train_loss": -36.820709228515625, "global_step": 73326, "epoch": 606} {"train_loss": -35.8303108215332, "global_step": 73327, "epoch": 606} {"train_loss": -36.402523040771484, "global_step": 73328, "epoch": 606} {"train_loss": -36.67110824584961, "global_step": 73329, "epoch": 606} {"train_loss": -37.928245544433594, "global_step": 73330, "epoch": 606} {"train_loss": -37.331695556640625, "global_step": 73331, "epoch": 606} {"train_loss": -37.710235595703125, "global_step": 73332, "epoch": 606} {"train_loss": -37.74338912963867, "global_step": 73333, "epoch": 606} {"train_loss": -37.09132766723633, "global_step": 73334, "epoch": 606} {"train_loss": -37.46309280395508, "global_step": 73335, "epoch": 606} {"train_loss": -37.9246711730957, "global_step": 73336, "epoch": 606} {"train_loss": -37.7358512878418, "global_step": 73337, "epoch": 606} {"train_loss": -37.84867477416992, "global_step": 73338, "epoch": 606} {"train_loss": -38.05845260620117, "global_step": 73339, "epoch": 606} {"train_loss": -37.30360794067383, "global_step": 73340, "epoch": 606} {"train_loss": -37.82893753051758, "global_step": 73341, "epoch": 606} {"train_loss": -37.827117919921875, "global_step": 73342, "epoch": 606} {"train_loss": -37.86666488647461, "global_step": 73343, "epoch": 606} {"train_loss": -37.410865783691406, "global_step": 73344, "epoch": 606} {"train_loss": -37.95207977294922, "global_step": 73345, "epoch": 606} {"train_loss": -37.47123336791992, "global_step": 73346, "epoch": 606} {"train_loss": -36.984798431396484, "global_step": 73347, "epoch": 606} {"train_loss": -37.23818588256836, "global_step": 73348, "epoch": 606} {"train_loss": -37.93136978149414, "global_step": 73349, "epoch": 606} {"train_loss": -37.98345947265625, "global_step": 73350, "epoch": 606} {"train_loss": -37.800899505615234, "global_step": 73351, "epoch": 606} {"train_loss": -37.331825256347656, "global_step": 73352, "epoch": 606} {"train_loss": -36.911903381347656, "global_step": 73353, "epoch": 606} {"train_loss": -38.03728485107422, "global_step": 73354, "epoch": 606} {"train_loss": -37.929317474365234, "global_step": 73355, "epoch": 606} {"train_loss": -37.557159423828125, "global_step": 73356, "epoch": 606} {"train_loss": -37.54228973388672, "global_step": 73357, "epoch": 606} {"train_loss": -38.13527297973633, "global_step": 73358, "epoch": 606} {"train_loss": -37.479164123535156, "global_step": 73359, "epoch": 606} {"train_loss": -37.281593322753906, "global_step": 73360, "epoch": 606} {"train_loss": -36.75932693481445, "global_step": 73361, "epoch": 606} {"train_loss": -37.890079498291016, "global_step": 73362, "epoch": 606} {"train_loss": -37.28713607788086, "global_step": 73363, "epoch": 606} {"train_loss": -37.0965461730957, "global_step": 73364, "epoch": 606} {"train_loss": -38.09431838989258, "global_step": 73365, "epoch": 606} {"train_loss": -37.92347717285156, "global_step": 73366, "epoch": 606} {"train_loss": -37.492919921875, "global_step": 73367, "epoch": 606} {"train_loss": -37.66798400878906, "global_step": 73368, "epoch": 606} {"train_loss": -38.19023513793945, "global_step": 73369, "epoch": 606} {"train_loss": -37.26224899291992, "global_step": 73370, "epoch": 606} {"train_loss": -37.65346908569336, "global_step": 73371, "epoch": 606} {"train_loss": -36.8575439453125, "global_step": 73372, "epoch": 606} {"train_loss": -37.02128219604492, "global_step": 73373, "epoch": 606} {"train_loss": -37.34165573120117, "global_step": 73374, "epoch": 606} {"train_loss": -38.09961700439453, "global_step": 73375, "epoch": 606} {"train_loss": -37.96617126464844, "global_step": 73376, "epoch": 606} {"train_loss": -37.17053985595703, "global_step": 73377, "epoch": 606} {"train_loss": -37.83797073364258, "global_step": 73378, "epoch": 606} {"train_loss": -38.383243560791016, "global_step": 73379, "epoch": 606} {"train_loss": -37.249908447265625, "global_step": 73380, "epoch": 606} {"train_loss": -37.41484451293945, "global_step": 73381, "epoch": 606} {"train_loss": -36.634376525878906, "global_step": 73382, "epoch": 606} {"train_loss": -36.7653694152832, "global_step": 73383, "epoch": 606} {"train_loss": -36.841365814208984, "global_step": 73384, "epoch": 606} {"train_loss": -37.69114303588867, "global_step": 73385, "epoch": 606} {"train_loss": -37.54413604736328, "global_step": 73386, "epoch": 606} {"train_loss": -36.80836868286133, "global_step": 73387, "epoch": 606} {"train_loss": -37.58543014526367, "global_step": 73388, "epoch": 606} {"train_loss": -37.31879806518555, "global_step": 73389, "epoch": 606} {"train_loss": -36.79225540161133, "global_step": 73390, "epoch": 606} {"train_loss": -37.36684036254883, "global_step": 73391, "epoch": 606} {"train_loss": -38.52891159057617, "global_step": 73392, "epoch": 606} {"train_loss": -37.79544448852539, "global_step": 73393, "epoch": 606} {"train_loss": -36.692352294921875, "global_step": 73394, "epoch": 606} {"train_loss": -36.27458190917969, "global_step": 73395, "epoch": 606} {"train_loss": -37.7242546081543, "global_step": 73396, "epoch": 606} {"train_loss": -37.540122985839844, "global_step": 73397, "epoch": 606} {"train_loss": -37.13119888305664, "global_step": 73398, "epoch": 606} {"train_loss": -37.255523681640625, "global_step": 73399, "epoch": 606} {"train_loss": -37.2336540222168, "global_step": 73400, "epoch": 606} {"train_loss": -36.874935150146484, "global_step": 73401, "epoch": 606} {"train_loss": -37.00688934326172, "global_step": 73402, "epoch": 606} {"train_loss": -36.70863723754883, "global_step": 73403, "epoch": 606} {"train_loss": -37.069976806640625, "global_step": 73404, "epoch": 606} {"train_loss": -37.00979232788086, "global_step": 73405, "epoch": 606} {"train_loss": -37.36419677734375, "global_step": 73406, "epoch": 606} {"train_loss": -37.36403274536133, "global_step": 73407, "epoch": 606} {"train_loss": -36.43175506591797, "global_step": 73408, "epoch": 606} {"train_loss": -37.139591217041016, "global_step": 73409, "epoch": 606} {"train_loss": -37.224586486816406, "global_step": 73410, "epoch": 606} {"train_loss": -37.19330978393555, "global_step": 73411, "epoch": 606} {"train_loss": -38.10331726074219, "global_step": 73412, "epoch": 606} {"train_loss": -36.98685836791992, "global_step": 73413, "epoch": 606} {"train_loss": -37.565528869628906, "global_step": 73414, "epoch": 606} {"train_loss": -37.25687789916992, "global_step": 73415, "epoch": 606} {"train_loss": -36.08925247192383, "global_step": 73416, "epoch": 606} {"train_loss": -35.35760498046875, "global_step": 73417, "epoch": 606} {"train_loss": -34.62537384033203, "global_step": 73418, "epoch": 606} {"train_loss": -35.384700775146484, "global_step": 73419, "epoch": 606} {"train_loss": -36.414920806884766, "global_step": 73420, "epoch": 606} {"train_loss": -37.41767501831055, "global_step": 73421, "epoch": 606} {"train_loss": -37.5114860534668, "global_step": 73422, "epoch": 606} {"train_loss": -37.23480987548828, "global_step": 73423, "epoch": 606} {"train_loss": -37.769447326660156, "global_step": 73424, "epoch": 606} {"train_loss": -37.45497512817383, "global_step": 73425, "epoch": 606} {"train_loss": -37.517879486083984, "global_step": 73426, "epoch": 606} {"train_loss": -36.3201789855957, "global_step": 73427, "epoch": 606} {"train_loss": -34.36469650268555, "global_step": 73428, "epoch": 606} {"train_loss": -32.786346435546875, "global_step": 73429, "epoch": 606} {"train_loss": -36.746578216552734, "global_step": 73430, "epoch": 606} {"train_loss": -36.797054290771484, "global_step": 73431, "epoch": 606} {"train_loss": -34.420719146728516, "global_step": 73432, "epoch": 606} {"train_loss": -36.3900032043457, "global_step": 73433, "epoch": 606} {"train_loss": -36.3467903137207, "global_step": 73434, "epoch": 606} {"train_loss": -33.380027770996094, "global_step": 73435, "epoch": 606} {"train_loss": -32.508026123046875, "global_step": 73436, "epoch": 606} {"train_loss": -34.584842681884766, "global_step": 73437, "epoch": 606} {"train_loss": -37.18427658081055, "global_step": 73438, "epoch": 606} {"train_loss": -33.282997131347656, "global_step": 73439, "epoch": 606} {"train_loss": -34.378929138183594, "global_step": 73440, "epoch": 606} {"train_loss": -37.09170150756836, "global_step": 73441, "epoch": 606} {"train_loss": -35.859046936035156, "global_step": 73442, "epoch": 606} {"train_loss": -35.94043731689453, "global_step": 73443, "epoch": 606} {"train_loss": -37.57080078125, "global_step": 73444, "epoch": 606} {"train_loss": -36.006500244140625, "global_step": 73445, "epoch": 606} {"train_loss": -37.00590452083871, "global_step": 73446, "epoch": 606, "val_loss": 2538140.25} {"train_loss": -37.00306701660156, "global_step": 73447, "epoch": 607} {"train_loss": -36.51533889770508, "global_step": 73448, "epoch": 607} {"train_loss": -37.377742767333984, "global_step": 73449, "epoch": 607} {"train_loss": -37.13827896118164, "global_step": 73450, "epoch": 607} {"train_loss": -36.972225189208984, "global_step": 73451, "epoch": 607} {"train_loss": -37.65184783935547, "global_step": 73452, "epoch": 607} {"train_loss": -37.00293731689453, "global_step": 73453, "epoch": 607} {"train_loss": -37.762062072753906, "global_step": 73454, "epoch": 607} {"train_loss": -37.23725891113281, "global_step": 73455, "epoch": 607} {"train_loss": -37.42782211303711, "global_step": 73456, "epoch": 607} {"train_loss": -37.18581771850586, "global_step": 73457, "epoch": 607} {"train_loss": -36.977962493896484, "global_step": 73458, "epoch": 607} {"train_loss": -37.33051681518555, "global_step": 73459, "epoch": 607} {"train_loss": -37.426761627197266, "global_step": 73460, "epoch": 607} {"train_loss": -37.56547164916992, "global_step": 73461, "epoch": 607} {"train_loss": -37.00432205200195, "global_step": 73462, "epoch": 607} {"train_loss": -37.56522750854492, "global_step": 73463, "epoch": 607} {"train_loss": -37.1027717590332, "global_step": 73464, "epoch": 607} {"train_loss": -36.30437088012695, "global_step": 73465, "epoch": 607} {"train_loss": -36.604976654052734, "global_step": 73466, "epoch": 607} {"train_loss": -37.809444427490234, "global_step": 73467, "epoch": 607} {"train_loss": -36.022274017333984, "global_step": 73468, "epoch": 607} {"train_loss": -37.03652572631836, "global_step": 73469, "epoch": 607} {"train_loss": -36.200477600097656, "global_step": 73470, "epoch": 607} {"train_loss": -33.793148040771484, "global_step": 73471, "epoch": 607} {"train_loss": -37.5069694519043, "global_step": 73472, "epoch": 607} {"train_loss": -34.42416000366211, "global_step": 73473, "epoch": 607} {"train_loss": -37.23336410522461, "global_step": 73474, "epoch": 607} {"train_loss": -36.215919494628906, "global_step": 73475, "epoch": 607} {"train_loss": -38.16212844848633, "global_step": 73476, "epoch": 607} {"train_loss": -36.7349739074707, "global_step": 73477, "epoch": 607} {"train_loss": -37.621246337890625, "global_step": 73478, "epoch": 607} {"train_loss": -37.316810607910156, "global_step": 73479, "epoch": 607} {"train_loss": -37.64080810546875, "global_step": 73480, "epoch": 607} {"train_loss": -37.941646575927734, "global_step": 73481, "epoch": 607} {"train_loss": -38.30201721191406, "global_step": 73482, "epoch": 607} {"train_loss": -37.49382019042969, "global_step": 73483, "epoch": 607} {"train_loss": -37.642486572265625, "global_step": 73484, "epoch": 607} {"train_loss": -37.92058181762695, "global_step": 73485, "epoch": 607} {"train_loss": -37.07635498046875, "global_step": 73486, "epoch": 607} {"train_loss": -37.41259002685547, "global_step": 73487, "epoch": 607} {"train_loss": -37.988224029541016, "global_step": 73488, "epoch": 607} {"train_loss": -37.024940490722656, "global_step": 73489, "epoch": 607} {"train_loss": -37.445343017578125, "global_step": 73490, "epoch": 607} {"train_loss": -38.2095832824707, "global_step": 73491, "epoch": 607} {"train_loss": -36.268165588378906, "global_step": 73492, "epoch": 607} {"train_loss": -36.90237045288086, "global_step": 73493, "epoch": 607} {"train_loss": -37.57036590576172, "global_step": 73494, "epoch": 607} {"train_loss": -37.622779846191406, "global_step": 73495, "epoch": 607} {"train_loss": -37.25995635986328, "global_step": 73496, "epoch": 607} {"train_loss": -37.678707122802734, "global_step": 73497, "epoch": 607} {"train_loss": -36.85945129394531, "global_step": 73498, "epoch": 607} {"train_loss": -37.99467849731445, "global_step": 73499, "epoch": 607} {"train_loss": -37.34516525268555, "global_step": 73500, "epoch": 607} {"train_loss": -36.85560989379883, "global_step": 73501, "epoch": 607} {"train_loss": -37.79905319213867, "global_step": 73502, "epoch": 607} {"train_loss": -37.86721420288086, "global_step": 73503, "epoch": 607} {"train_loss": -38.06959915161133, "global_step": 73504, "epoch": 607} {"train_loss": -37.93806076049805, "global_step": 73505, "epoch": 607} {"train_loss": -38.06721115112305, "global_step": 73506, "epoch": 607} {"train_loss": -37.130859375, "global_step": 73507, "epoch": 607} {"train_loss": -37.84981918334961, "global_step": 73508, "epoch": 607} {"train_loss": -38.36285400390625, "global_step": 73509, "epoch": 607} {"train_loss": -37.53361129760742, "global_step": 73510, "epoch": 607} {"train_loss": -38.040130615234375, "global_step": 73511, "epoch": 607} {"train_loss": -37.853782653808594, "global_step": 73512, "epoch": 607} {"train_loss": -37.6492919921875, "global_step": 73513, "epoch": 607} {"train_loss": -37.63374710083008, "global_step": 73514, "epoch": 607} {"train_loss": -37.738826751708984, "global_step": 73515, "epoch": 607} {"train_loss": -37.325618743896484, "global_step": 73516, "epoch": 607} {"train_loss": -37.7593994140625, "global_step": 73517, "epoch": 607} {"train_loss": -37.1473503112793, "global_step": 73518, "epoch": 607} {"train_loss": -37.57908248901367, "global_step": 73519, "epoch": 607} {"train_loss": -38.11417770385742, "global_step": 73520, "epoch": 607} {"train_loss": -36.84626388549805, "global_step": 73521, "epoch": 607} {"train_loss": -36.358123779296875, "global_step": 73522, "epoch": 607} {"train_loss": -34.58773422241211, "global_step": 73523, "epoch": 607} {"train_loss": -32.432029724121094, "global_step": 73524, "epoch": 607} {"train_loss": -31.30632972717285, "global_step": 73525, "epoch": 607} {"train_loss": -34.30757522583008, "global_step": 73526, "epoch": 607} {"train_loss": -36.236236572265625, "global_step": 73527, "epoch": 607} {"train_loss": -34.180233001708984, "global_step": 73528, "epoch": 607} {"train_loss": -35.938865661621094, "global_step": 73529, "epoch": 607} {"train_loss": -36.106014251708984, "global_step": 73530, "epoch": 607} {"train_loss": -35.675697326660156, "global_step": 73531, "epoch": 607} {"train_loss": -35.27276611328125, "global_step": 73532, "epoch": 607} {"train_loss": -35.64951705932617, "global_step": 73533, "epoch": 607} {"train_loss": -35.74650955200195, "global_step": 73534, "epoch": 607} {"train_loss": -36.0919189453125, "global_step": 73535, "epoch": 607} {"train_loss": -36.560218811035156, "global_step": 73536, "epoch": 607} {"train_loss": -36.273677825927734, "global_step": 73537, "epoch": 607} {"train_loss": -35.973358154296875, "global_step": 73538, "epoch": 607} {"train_loss": -37.58628845214844, "global_step": 73539, "epoch": 607} {"train_loss": -36.97467803955078, "global_step": 73540, "epoch": 607} {"train_loss": -36.66276931762695, "global_step": 73541, "epoch": 607} {"train_loss": -36.636409759521484, "global_step": 73542, "epoch": 607} {"train_loss": -37.35487747192383, "global_step": 73543, "epoch": 607} {"train_loss": -37.19942855834961, "global_step": 73544, "epoch": 607} {"train_loss": -36.46778106689453, "global_step": 73545, "epoch": 607} {"train_loss": -36.899288177490234, "global_step": 73546, "epoch": 607} {"train_loss": -37.96346664428711, "global_step": 73547, "epoch": 607} {"train_loss": -37.45509338378906, "global_step": 73548, "epoch": 607} {"train_loss": -37.24215316772461, "global_step": 73549, "epoch": 607} {"train_loss": -37.49750900268555, "global_step": 73550, "epoch": 607} {"train_loss": -37.57694625854492, "global_step": 73551, "epoch": 607} {"train_loss": -37.20891189575195, "global_step": 73552, "epoch": 607} {"train_loss": -37.41085433959961, "global_step": 73553, "epoch": 607} {"train_loss": -37.364505767822266, "global_step": 73554, "epoch": 607} {"train_loss": -37.862091064453125, "global_step": 73555, "epoch": 607} {"train_loss": -37.16685104370117, "global_step": 73556, "epoch": 607} {"train_loss": -36.85567092895508, "global_step": 73557, "epoch": 607} {"train_loss": -38.0550651550293, "global_step": 73558, "epoch": 607} {"train_loss": -37.55883026123047, "global_step": 73559, "epoch": 607} {"train_loss": -37.07853317260742, "global_step": 73560, "epoch": 607} {"train_loss": -37.49989700317383, "global_step": 73561, "epoch": 607} {"train_loss": -37.92702865600586, "global_step": 73562, "epoch": 607} {"train_loss": -37.856544494628906, "global_step": 73563, "epoch": 607} {"train_loss": -37.92568588256836, "global_step": 73564, "epoch": 607} {"train_loss": -37.83123779296875, "global_step": 73565, "epoch": 607} {"train_loss": -37.99386978149414, "global_step": 73566, "epoch": 607} {"train_loss": -37.034533492789784, "global_step": 73567, "epoch": 607, "val_loss": 2581586.25} {"train_loss": -37.83222579956055, "global_step": 73568, "epoch": 608} {"train_loss": -38.27390670776367, "global_step": 73569, "epoch": 608} {"train_loss": -37.878719329833984, "global_step": 73570, "epoch": 608} {"train_loss": -37.0844841003418, "global_step": 73571, "epoch": 608} {"train_loss": -38.028846740722656, "global_step": 73572, "epoch": 608} {"train_loss": -37.93172836303711, "global_step": 73573, "epoch": 608} {"train_loss": -37.5352668762207, "global_step": 73574, "epoch": 608} {"train_loss": -37.61880874633789, "global_step": 73575, "epoch": 608} {"train_loss": -37.851844787597656, "global_step": 73576, "epoch": 608} {"train_loss": -37.946319580078125, "global_step": 73577, "epoch": 608} {"train_loss": -38.024017333984375, "global_step": 73578, "epoch": 608} {"train_loss": -37.50556182861328, "global_step": 73579, "epoch": 608} {"train_loss": -37.606658935546875, "global_step": 73580, "epoch": 608} {"train_loss": -37.17856979370117, "global_step": 73581, "epoch": 608} {"train_loss": -38.0788688659668, "global_step": 73582, "epoch": 608} {"train_loss": -36.105892181396484, "global_step": 73583, "epoch": 608} {"train_loss": -34.54338455200195, "global_step": 73584, "epoch": 608} {"train_loss": -33.35886764526367, "global_step": 73585, "epoch": 608} {"train_loss": -28.824445724487305, "global_step": 73586, "epoch": 608} {"train_loss": -29.644941329956055, "global_step": 73587, "epoch": 608} {"train_loss": -31.579315185546875, "global_step": 73588, "epoch": 608} {"train_loss": -34.0322380065918, "global_step": 73589, "epoch": 608} {"train_loss": -31.582183837890625, "global_step": 73590, "epoch": 608} {"train_loss": -32.98527145385742, "global_step": 73591, "epoch": 608} {"train_loss": -32.70725631713867, "global_step": 73592, "epoch": 608} {"train_loss": -32.59498977661133, "global_step": 73593, "epoch": 608} {"train_loss": -32.509395599365234, "global_step": 73594, "epoch": 608} {"train_loss": -34.73159408569336, "global_step": 73595, "epoch": 608} {"train_loss": -35.746646881103516, "global_step": 73596, "epoch": 608} {"train_loss": -36.033287048339844, "global_step": 73597, "epoch": 608} {"train_loss": -36.35297393798828, "global_step": 73598, "epoch": 608} {"train_loss": -36.26062774658203, "global_step": 73599, "epoch": 608} {"train_loss": -36.280574798583984, "global_step": 73600, "epoch": 608} {"train_loss": -35.60580062866211, "global_step": 73601, "epoch": 608} {"train_loss": -35.9849967956543, "global_step": 73602, "epoch": 608} {"train_loss": -35.63075637817383, "global_step": 73603, "epoch": 608} {"train_loss": -36.42280197143555, "global_step": 73604, "epoch": 608} {"train_loss": -36.320186614990234, "global_step": 73605, "epoch": 608} {"train_loss": -37.44099044799805, "global_step": 73606, "epoch": 608} {"train_loss": -36.57505416870117, "global_step": 73607, "epoch": 608} {"train_loss": -35.6268310546875, "global_step": 73608, "epoch": 608} {"train_loss": -37.16206741333008, "global_step": 73609, "epoch": 608} {"train_loss": -35.78491973876953, "global_step": 73610, "epoch": 608} {"train_loss": -34.647926330566406, "global_step": 73611, "epoch": 608} {"train_loss": -34.96337890625, "global_step": 73612, "epoch": 608} {"train_loss": -32.50897979736328, "global_step": 73613, "epoch": 608} {"train_loss": -31.86273193359375, "global_step": 73614, "epoch": 608} {"train_loss": -33.39769744873047, "global_step": 73615, "epoch": 608} {"train_loss": -37.16864776611328, "global_step": 73616, "epoch": 608} {"train_loss": -34.85780715942383, "global_step": 73617, "epoch": 608} {"train_loss": -35.49994659423828, "global_step": 73618, "epoch": 608} {"train_loss": -37.26472091674805, "global_step": 73619, "epoch": 608} {"train_loss": -36.35164260864258, "global_step": 73620, "epoch": 608} {"train_loss": -36.97233963012695, "global_step": 73621, "epoch": 608} {"train_loss": -36.8596076965332, "global_step": 73622, "epoch": 608} {"train_loss": -36.79726028442383, "global_step": 73623, "epoch": 608} {"train_loss": -37.00928497314453, "global_step": 73624, "epoch": 608} {"train_loss": -36.826812744140625, "global_step": 73625, "epoch": 608} {"train_loss": -37.586666107177734, "global_step": 73626, "epoch": 608} {"train_loss": -36.61408615112305, "global_step": 73627, "epoch": 608} {"train_loss": -37.41035461425781, "global_step": 73628, "epoch": 608} {"train_loss": -37.384090423583984, "global_step": 73629, "epoch": 608} {"train_loss": -36.99221420288086, "global_step": 73630, "epoch": 608} {"train_loss": -37.31779098510742, "global_step": 73631, "epoch": 608} {"train_loss": -36.725318908691406, "global_step": 73632, "epoch": 608} {"train_loss": -37.861083984375, "global_step": 73633, "epoch": 608} {"train_loss": -37.49198532104492, "global_step": 73634, "epoch": 608} {"train_loss": -37.764930725097656, "global_step": 73635, "epoch": 608} {"train_loss": -37.61227798461914, "global_step": 73636, "epoch": 608} {"train_loss": -37.47981643676758, "global_step": 73637, "epoch": 608} {"train_loss": -37.33376693725586, "global_step": 73638, "epoch": 608} {"train_loss": -37.99876022338867, "global_step": 73639, "epoch": 608} {"train_loss": -37.80288314819336, "global_step": 73640, "epoch": 608} {"train_loss": -37.346866607666016, "global_step": 73641, "epoch": 608} {"train_loss": -37.75474166870117, "global_step": 73642, "epoch": 608} {"train_loss": -37.24132537841797, "global_step": 73643, "epoch": 608} {"train_loss": -37.89889144897461, "global_step": 73644, "epoch": 608} {"train_loss": -37.35627365112305, "global_step": 73645, "epoch": 608} {"train_loss": -38.197322845458984, "global_step": 73646, "epoch": 608} {"train_loss": -38.171451568603516, "global_step": 73647, "epoch": 608} {"train_loss": -37.539485931396484, "global_step": 73648, "epoch": 608} {"train_loss": -37.04241943359375, "global_step": 73649, "epoch": 608} {"train_loss": -37.085777282714844, "global_step": 73650, "epoch": 608} {"train_loss": -37.875709533691406, "global_step": 73651, "epoch": 608} {"train_loss": -37.62691879272461, "global_step": 73652, "epoch": 608} {"train_loss": -36.3927116394043, "global_step": 73653, "epoch": 608} {"train_loss": -37.040924072265625, "global_step": 73654, "epoch": 608} {"train_loss": -37.8219108581543, "global_step": 73655, "epoch": 608} {"train_loss": -36.784210205078125, "global_step": 73656, "epoch": 608} {"train_loss": -37.47148513793945, "global_step": 73657, "epoch": 608} {"train_loss": -37.9691276550293, "global_step": 73658, "epoch": 608} {"train_loss": -37.37901306152344, "global_step": 73659, "epoch": 608} {"train_loss": -37.45453643798828, "global_step": 73660, "epoch": 608} {"train_loss": -38.33530807495117, "global_step": 73661, "epoch": 608} {"train_loss": -37.63505935668945, "global_step": 73662, "epoch": 608} {"train_loss": -38.08083724975586, "global_step": 73663, "epoch": 608} {"train_loss": -37.64913558959961, "global_step": 73664, "epoch": 608} {"train_loss": -38.14215087890625, "global_step": 73665, "epoch": 608} {"train_loss": -38.21504592895508, "global_step": 73666, "epoch": 608} {"train_loss": -37.95170211791992, "global_step": 73667, "epoch": 608} {"train_loss": -37.84342575073242, "global_step": 73668, "epoch": 608} {"train_loss": -37.64666748046875, "global_step": 73669, "epoch": 608} {"train_loss": -37.433815002441406, "global_step": 73670, "epoch": 608} {"train_loss": -38.05569839477539, "global_step": 73671, "epoch": 608} {"train_loss": -37.952877044677734, "global_step": 73672, "epoch": 608} {"train_loss": -38.033111572265625, "global_step": 73673, "epoch": 608} {"train_loss": -38.16758346557617, "global_step": 73674, "epoch": 608} {"train_loss": -37.864524841308594, "global_step": 73675, "epoch": 608} {"train_loss": -36.60503387451172, "global_step": 73676, "epoch": 608} {"train_loss": -34.20394515991211, "global_step": 73677, "epoch": 608} {"train_loss": -29.491046905517578, "global_step": 73678, "epoch": 608} {"train_loss": -19.802892684936523, "global_step": 73679, "epoch": 608} {"train_loss": -29.252622604370117, "global_step": 73680, "epoch": 608} {"train_loss": -25.821699142456055, "global_step": 73681, "epoch": 608} {"train_loss": -27.340442657470703, "global_step": 73682, "epoch": 608} {"train_loss": -29.832143783569336, "global_step": 73683, "epoch": 608} {"train_loss": -31.714263916015625, "global_step": 73684, "epoch": 608} {"train_loss": -31.46209716796875, "global_step": 73685, "epoch": 608} {"train_loss": -32.154598236083984, "global_step": 73686, "epoch": 608} {"train_loss": -32.63916015625, "global_step": 73687, "epoch": 608} {"train_loss": -35.870951975672696, "global_step": 73688, "epoch": 608, "val_loss": 2612446.75} {"train_loss": -32.05937194824219, "global_step": 73689, "epoch": 609} {"train_loss": -32.6046028137207, "global_step": 73690, "epoch": 609} {"train_loss": -32.47904968261719, "global_step": 73691, "epoch": 609} {"train_loss": -33.7437858581543, "global_step": 73692, "epoch": 609} {"train_loss": -33.58354568481445, "global_step": 73693, "epoch": 609} {"train_loss": -33.685333251953125, "global_step": 73694, "epoch": 609} {"train_loss": -33.96149826049805, "global_step": 73695, "epoch": 609} {"train_loss": -34.5106201171875, "global_step": 73696, "epoch": 609} {"train_loss": -34.860050201416016, "global_step": 73697, "epoch": 609} {"train_loss": -35.319576263427734, "global_step": 73698, "epoch": 609} {"train_loss": -35.1842155456543, "global_step": 73699, "epoch": 609} {"train_loss": -35.380855560302734, "global_step": 73700, "epoch": 609} {"train_loss": -35.562110900878906, "global_step": 73701, "epoch": 609} {"train_loss": -36.56744384765625, "global_step": 73702, "epoch": 609} {"train_loss": -35.98958969116211, "global_step": 73703, "epoch": 609} {"train_loss": -36.564815521240234, "global_step": 73704, "epoch": 609} {"train_loss": -36.9879264831543, "global_step": 73705, "epoch": 609} {"train_loss": -37.286922454833984, "global_step": 73706, "epoch": 609} {"train_loss": -37.05723190307617, "global_step": 73707, "epoch": 609} {"train_loss": -37.19916534423828, "global_step": 73708, "epoch": 609} {"train_loss": -36.98700714111328, "global_step": 73709, "epoch": 609} {"train_loss": -37.09890365600586, "global_step": 73710, "epoch": 609} {"train_loss": -37.108402252197266, "global_step": 73711, "epoch": 609} {"train_loss": -37.36930465698242, "global_step": 73712, "epoch": 609} {"train_loss": -37.034297943115234, "global_step": 73713, "epoch": 609} {"train_loss": -37.2074089050293, "global_step": 73714, "epoch": 609} {"train_loss": -37.17523193359375, "global_step": 73715, "epoch": 609} {"train_loss": -37.28074264526367, "global_step": 73716, "epoch": 609} {"train_loss": -37.49614334106445, "global_step": 73717, "epoch": 609} {"train_loss": -37.2506103515625, "global_step": 73718, "epoch": 609} {"train_loss": -37.14945983886719, "global_step": 73719, "epoch": 609} {"train_loss": -37.57295608520508, "global_step": 73720, "epoch": 609} {"train_loss": -37.38978958129883, "global_step": 73721, "epoch": 609} {"train_loss": -37.652076721191406, "global_step": 73722, "epoch": 609} {"train_loss": -37.28231430053711, "global_step": 73723, "epoch": 609} {"train_loss": -37.76853561401367, "global_step": 73724, "epoch": 609} {"train_loss": -37.71100616455078, "global_step": 73725, "epoch": 609} {"train_loss": -38.2782096862793, "global_step": 73726, "epoch": 609} {"train_loss": -38.0887565612793, "global_step": 73727, "epoch": 609} {"train_loss": -37.801570892333984, "global_step": 73728, "epoch": 609} {"train_loss": -37.82941818237305, "global_step": 73729, "epoch": 609} {"train_loss": -37.906227111816406, "global_step": 73730, "epoch": 609} {"train_loss": -38.45768356323242, "global_step": 73731, "epoch": 609} {"train_loss": -38.11750411987305, "global_step": 73732, "epoch": 609} {"train_loss": -38.2835807800293, "global_step": 73733, "epoch": 609} {"train_loss": -38.15106201171875, "global_step": 73734, "epoch": 609} {"train_loss": -37.54096603393555, "global_step": 73735, "epoch": 609} {"train_loss": -37.125579833984375, "global_step": 73736, "epoch": 609} {"train_loss": -36.644039154052734, "global_step": 73737, "epoch": 609} {"train_loss": -38.1941032409668, "global_step": 73738, "epoch": 609} {"train_loss": -37.819732666015625, "global_step": 73739, "epoch": 609} {"train_loss": -37.212249755859375, "global_step": 73740, "epoch": 609} {"train_loss": -37.17243576049805, "global_step": 73741, "epoch": 609} {"train_loss": -37.75800704956055, "global_step": 73742, "epoch": 609} {"train_loss": -37.293731689453125, "global_step": 73743, "epoch": 609} {"train_loss": -37.168941497802734, "global_step": 73744, "epoch": 609} {"train_loss": -37.51823043823242, "global_step": 73745, "epoch": 609} {"train_loss": -38.10317611694336, "global_step": 73746, "epoch": 609} {"train_loss": -37.31641387939453, "global_step": 73747, "epoch": 609} {"train_loss": -37.386688232421875, "global_step": 73748, "epoch": 609} {"train_loss": -37.434749603271484, "global_step": 73749, "epoch": 609} {"train_loss": -38.28663635253906, "global_step": 73750, "epoch": 609} {"train_loss": -37.70648193359375, "global_step": 73751, "epoch": 609} {"train_loss": -37.7547721862793, "global_step": 73752, "epoch": 609} {"train_loss": -38.4952278137207, "global_step": 73753, "epoch": 609} {"train_loss": -37.65438461303711, "global_step": 73754, "epoch": 609} {"train_loss": -37.65221405029297, "global_step": 73755, "epoch": 609} {"train_loss": -37.929561614990234, "global_step": 73756, "epoch": 609} {"train_loss": -37.527523040771484, "global_step": 73757, "epoch": 609} {"train_loss": -37.52421188354492, "global_step": 73758, "epoch": 609} {"train_loss": -37.9714469909668, "global_step": 73759, "epoch": 609} {"train_loss": -37.75993347167969, "global_step": 73760, "epoch": 609} {"train_loss": -37.59882354736328, "global_step": 73761, "epoch": 609} {"train_loss": -38.17306137084961, "global_step": 73762, "epoch": 609} {"train_loss": -37.07231521606445, "global_step": 73763, "epoch": 609} {"train_loss": -36.613739013671875, "global_step": 73764, "epoch": 609} {"train_loss": -37.010066986083984, "global_step": 73765, "epoch": 609} {"train_loss": -37.8677978515625, "global_step": 73766, "epoch": 609} {"train_loss": -37.065765380859375, "global_step": 73767, "epoch": 609} {"train_loss": -35.465423583984375, "global_step": 73768, "epoch": 609} {"train_loss": -32.54038619995117, "global_step": 73769, "epoch": 609} {"train_loss": -32.98044967651367, "global_step": 73770, "epoch": 609} {"train_loss": -33.22047805786133, "global_step": 73771, "epoch": 609} {"train_loss": -23.290864944458008, "global_step": 73772, "epoch": 609} {"train_loss": -27.2525634765625, "global_step": 73773, "epoch": 609} {"train_loss": -30.7122745513916, "global_step": 73774, "epoch": 609} {"train_loss": -15.991891860961914, "global_step": 73775, "epoch": 609} {"train_loss": -34.714569091796875, "global_step": 73776, "epoch": 609} {"train_loss": -24.536518096923828, "global_step": 73777, "epoch": 609} {"train_loss": -34.06510543823242, "global_step": 73778, "epoch": 609} {"train_loss": -31.1240234375, "global_step": 73779, "epoch": 609} {"train_loss": -29.926666259765625, "global_step": 73780, "epoch": 609} {"train_loss": -34.6199836730957, "global_step": 73781, "epoch": 609} {"train_loss": -32.89345932006836, "global_step": 73782, "epoch": 609} {"train_loss": -34.032264709472656, "global_step": 73783, "epoch": 609} {"train_loss": -35.053382873535156, "global_step": 73784, "epoch": 609} {"train_loss": -36.24125289916992, "global_step": 73785, "epoch": 609} {"train_loss": -35.106536865234375, "global_step": 73786, "epoch": 609} {"train_loss": -35.78260803222656, "global_step": 73787, "epoch": 609} {"train_loss": -36.17986297607422, "global_step": 73788, "epoch": 609} {"train_loss": -36.45573043823242, "global_step": 73789, "epoch": 609} {"train_loss": -35.623390197753906, "global_step": 73790, "epoch": 609} {"train_loss": -36.8133544921875, "global_step": 73791, "epoch": 609} {"train_loss": -36.01543045043945, "global_step": 73792, "epoch": 609} {"train_loss": -36.92121505737305, "global_step": 73793, "epoch": 609} {"train_loss": -36.60477828979492, "global_step": 73794, "epoch": 609} {"train_loss": -36.61067581176758, "global_step": 73795, "epoch": 609} {"train_loss": -36.505802154541016, "global_step": 73796, "epoch": 609} {"train_loss": -36.966304779052734, "global_step": 73797, "epoch": 609} {"train_loss": -36.933799743652344, "global_step": 73798, "epoch": 609} {"train_loss": -37.167659759521484, "global_step": 73799, "epoch": 609} {"train_loss": -37.05656051635742, "global_step": 73800, "epoch": 609} {"train_loss": -36.957576751708984, "global_step": 73801, "epoch": 609} {"train_loss": -36.82487869262695, "global_step": 73802, "epoch": 609} {"train_loss": -37.3758544921875, "global_step": 73803, "epoch": 609} {"train_loss": -37.54646682739258, "global_step": 73804, "epoch": 609} {"train_loss": -37.16921615600586, "global_step": 73805, "epoch": 609} {"train_loss": -37.20149230957031, "global_step": 73806, "epoch": 609} {"train_loss": -37.56745529174805, "global_step": 73807, "epoch": 609} {"train_loss": -37.56528854370117, "global_step": 73808, "epoch": 609} {"train_loss": -36.021687137193915, "global_step": 73809, "epoch": 609, "val_loss": 2502462.75} {"train_loss": -37.32650375366211, "global_step": 73810, "epoch": 610} {"train_loss": -38.018035888671875, "global_step": 73811, "epoch": 610} {"train_loss": -37.69685745239258, "global_step": 73812, "epoch": 610} {"train_loss": -37.50001907348633, "global_step": 73813, "epoch": 610} {"train_loss": -37.59748458862305, "global_step": 73814, "epoch": 610} {"train_loss": -37.75876998901367, "global_step": 73815, "epoch": 610} {"train_loss": -38.084938049316406, "global_step": 73816, "epoch": 610} {"train_loss": -37.99912643432617, "global_step": 73817, "epoch": 610} {"train_loss": -37.998348236083984, "global_step": 73818, "epoch": 610} {"train_loss": -36.9652099609375, "global_step": 73819, "epoch": 610} {"train_loss": -37.31534957885742, "global_step": 73820, "epoch": 610} {"train_loss": -37.77914047241211, "global_step": 73821, "epoch": 610} {"train_loss": -38.24199295043945, "global_step": 73822, "epoch": 610} {"train_loss": -38.14511489868164, "global_step": 73823, "epoch": 610} {"train_loss": -38.178157806396484, "global_step": 73824, "epoch": 610} {"train_loss": -38.33810043334961, "global_step": 73825, "epoch": 610} {"train_loss": -37.01889419555664, "global_step": 73826, "epoch": 610} {"train_loss": -36.97624969482422, "global_step": 73827, "epoch": 610} {"train_loss": -37.021541595458984, "global_step": 73828, "epoch": 610} {"train_loss": -36.933834075927734, "global_step": 73829, "epoch": 610} {"train_loss": -38.356014251708984, "global_step": 73830, "epoch": 610} {"train_loss": -37.903717041015625, "global_step": 73831, "epoch": 610} {"train_loss": -36.37461471557617, "global_step": 73832, "epoch": 610} {"train_loss": -36.1801872253418, "global_step": 73833, "epoch": 610} {"train_loss": -38.0177001953125, "global_step": 73834, "epoch": 610} {"train_loss": -37.01211166381836, "global_step": 73835, "epoch": 610} {"train_loss": -36.171260833740234, "global_step": 73836, "epoch": 610} {"train_loss": -37.53489303588867, "global_step": 73837, "epoch": 610} {"train_loss": -37.756866455078125, "global_step": 73838, "epoch": 610} {"train_loss": -35.635963439941406, "global_step": 73839, "epoch": 610} {"train_loss": -36.47771072387695, "global_step": 73840, "epoch": 610} {"train_loss": -37.84811782836914, "global_step": 73841, "epoch": 610} {"train_loss": -36.26983642578125, "global_step": 73842, "epoch": 610} {"train_loss": -37.96548843383789, "global_step": 73843, "epoch": 610} {"train_loss": -36.70856475830078, "global_step": 73844, "epoch": 610} {"train_loss": -36.846920013427734, "global_step": 73845, "epoch": 610} {"train_loss": -38.2740364074707, "global_step": 73846, "epoch": 610} {"train_loss": -37.43215560913086, "global_step": 73847, "epoch": 610} {"train_loss": -37.55044174194336, "global_step": 73848, "epoch": 610} {"train_loss": -38.14403533935547, "global_step": 73849, "epoch": 610} {"train_loss": -37.36188507080078, "global_step": 73850, "epoch": 610} {"train_loss": -37.060455322265625, "global_step": 73851, "epoch": 610} {"train_loss": -37.397396087646484, "global_step": 73852, "epoch": 610} {"train_loss": -36.87296676635742, "global_step": 73853, "epoch": 610} {"train_loss": -37.625396728515625, "global_step": 73854, "epoch": 610} {"train_loss": -37.60646438598633, "global_step": 73855, "epoch": 610} {"train_loss": -37.80377960205078, "global_step": 73856, "epoch": 610} {"train_loss": -37.70614242553711, "global_step": 73857, "epoch": 610} {"train_loss": -37.5562858581543, "global_step": 73858, "epoch": 610} {"train_loss": -37.384437561035156, "global_step": 73859, "epoch": 610} {"train_loss": -36.865474700927734, "global_step": 73860, "epoch": 610} {"train_loss": -37.71175765991211, "global_step": 73861, "epoch": 610} {"train_loss": -35.157283782958984, "global_step": 73862, "epoch": 610} {"train_loss": -36.70456314086914, "global_step": 73863, "epoch": 610} {"train_loss": -37.186744689941406, "global_step": 73864, "epoch": 610} {"train_loss": -36.21137237548828, "global_step": 73865, "epoch": 610} {"train_loss": -36.724666595458984, "global_step": 73866, "epoch": 610} {"train_loss": -36.70404052734375, "global_step": 73867, "epoch": 610} {"train_loss": -35.3917121887207, "global_step": 73868, "epoch": 610} {"train_loss": -35.68526077270508, "global_step": 73869, "epoch": 610} {"train_loss": -37.30170440673828, "global_step": 73870, "epoch": 610} {"train_loss": -36.49808883666992, "global_step": 73871, "epoch": 610} {"train_loss": -34.906288146972656, "global_step": 73872, "epoch": 610} {"train_loss": -36.331703186035156, "global_step": 73873, "epoch": 610} {"train_loss": -34.22532272338867, "global_step": 73874, "epoch": 610} {"train_loss": -37.522064208984375, "global_step": 73875, "epoch": 610} {"train_loss": -34.6809196472168, "global_step": 73876, "epoch": 610} {"train_loss": -36.70266342163086, "global_step": 73877, "epoch": 610} {"train_loss": -35.100013732910156, "global_step": 73878, "epoch": 610} {"train_loss": -37.62677001953125, "global_step": 73879, "epoch": 610} {"train_loss": -34.7774772644043, "global_step": 73880, "epoch": 610} {"train_loss": -37.346527099609375, "global_step": 73881, "epoch": 610} {"train_loss": -34.921783447265625, "global_step": 73882, "epoch": 610} {"train_loss": -36.9217643737793, "global_step": 73883, "epoch": 610} {"train_loss": -35.73674774169922, "global_step": 73884, "epoch": 610} {"train_loss": -35.002418518066406, "global_step": 73885, "epoch": 610} {"train_loss": -35.853458404541016, "global_step": 73886, "epoch": 610} {"train_loss": -37.489315032958984, "global_step": 73887, "epoch": 610} {"train_loss": -36.38932418823242, "global_step": 73888, "epoch": 610} {"train_loss": -37.642696380615234, "global_step": 73889, "epoch": 610} {"train_loss": -36.810997009277344, "global_step": 73890, "epoch": 610} {"train_loss": -36.86898422241211, "global_step": 73891, "epoch": 610} {"train_loss": -36.949337005615234, "global_step": 73892, "epoch": 610} {"train_loss": -37.26249313354492, "global_step": 73893, "epoch": 610} {"train_loss": -36.9653434753418, "global_step": 73894, "epoch": 610} {"train_loss": -37.094478607177734, "global_step": 73895, "epoch": 610} {"train_loss": -36.416015625, "global_step": 73896, "epoch": 610} {"train_loss": -37.084171295166016, "global_step": 73897, "epoch": 610} {"train_loss": -36.52207565307617, "global_step": 73898, "epoch": 610} {"train_loss": -37.14643478393555, "global_step": 73899, "epoch": 610} {"train_loss": -37.19965362548828, "global_step": 73900, "epoch": 610} {"train_loss": -36.553314208984375, "global_step": 73901, "epoch": 610} {"train_loss": -35.939754486083984, "global_step": 73902, "epoch": 610} {"train_loss": -36.539852142333984, "global_step": 73903, "epoch": 610} {"train_loss": -37.27759552001953, "global_step": 73904, "epoch": 610} {"train_loss": -36.91353225708008, "global_step": 73905, "epoch": 610} {"train_loss": -37.30690383911133, "global_step": 73906, "epoch": 610} {"train_loss": -37.131134033203125, "global_step": 73907, "epoch": 610} {"train_loss": -37.59474563598633, "global_step": 73908, "epoch": 610} {"train_loss": -37.60423278808594, "global_step": 73909, "epoch": 610} {"train_loss": -37.16597366333008, "global_step": 73910, "epoch": 610} {"train_loss": -37.86289596557617, "global_step": 73911, "epoch": 610} {"train_loss": -37.53817367553711, "global_step": 73912, "epoch": 610} {"train_loss": -37.64248275756836, "global_step": 73913, "epoch": 610} {"train_loss": -37.10957717895508, "global_step": 73914, "epoch": 610} {"train_loss": -38.028175354003906, "global_step": 73915, "epoch": 610} {"train_loss": -37.782222747802734, "global_step": 73916, "epoch": 610} {"train_loss": -36.916648864746094, "global_step": 73917, "epoch": 610} {"train_loss": -37.98861312866211, "global_step": 73918, "epoch": 610} {"train_loss": -37.78646469116211, "global_step": 73919, "epoch": 610} {"train_loss": -37.87791442871094, "global_step": 73920, "epoch": 610} {"train_loss": -37.415382385253906, "global_step": 73921, "epoch": 610} {"train_loss": -37.431034088134766, "global_step": 73922, "epoch": 610} {"train_loss": -37.52368927001953, "global_step": 73923, "epoch": 610} {"train_loss": -37.849605560302734, "global_step": 73924, "epoch": 610} {"train_loss": -37.962066650390625, "global_step": 73925, "epoch": 610} {"train_loss": -37.83451461791992, "global_step": 73926, "epoch": 610} {"train_loss": -37.4692268371582, "global_step": 73927, "epoch": 610} {"train_loss": -36.00410079956055, "global_step": 73928, "epoch": 610} {"train_loss": -36.921173095703125, "global_step": 73929, "epoch": 610} {"train_loss": -37.06185512700357, "global_step": 73930, "epoch": 610, "val_loss": 2645444.0} {"train_loss": -36.54453659057617, "global_step": 73931, "epoch": 611} {"train_loss": -35.12295150756836, "global_step": 73932, "epoch": 611} {"train_loss": -34.54108428955078, "global_step": 73933, "epoch": 611} {"train_loss": -34.15508270263672, "global_step": 73934, "epoch": 611} {"train_loss": -37.157955169677734, "global_step": 73935, "epoch": 611} {"train_loss": -35.426673889160156, "global_step": 73936, "epoch": 611} {"train_loss": -34.48659133911133, "global_step": 73937, "epoch": 611} {"train_loss": -35.15857696533203, "global_step": 73938, "epoch": 611} {"train_loss": -37.00017166137695, "global_step": 73939, "epoch": 611} {"train_loss": -36.64085006713867, "global_step": 73940, "epoch": 611} {"train_loss": -2.1580581665039062, "global_step": 73941, "epoch": 611} {"train_loss": -32.88254928588867, "global_step": 73942, "epoch": 611} {"train_loss": -14.206244468688965, "global_step": 73943, "epoch": 611} {"train_loss": -19.40765380859375, "global_step": 73944, "epoch": 611} {"train_loss": -19.42633628845215, "global_step": 73945, "epoch": 611} {"train_loss": -17.00115394592285, "global_step": 73946, "epoch": 611} {"train_loss": -20.38086700439453, "global_step": 73947, "epoch": 611} {"train_loss": -24.625547409057617, "global_step": 73948, "epoch": 611} {"train_loss": -21.209800720214844, "global_step": 73949, "epoch": 611} {"train_loss": -24.7834529876709, "global_step": 73950, "epoch": 611} {"train_loss": -26.491323471069336, "global_step": 73951, "epoch": 611} {"train_loss": -27.457965850830078, "global_step": 73952, "epoch": 611} {"train_loss": -27.89241600036621, "global_step": 73953, "epoch": 611} {"train_loss": -28.453290939331055, "global_step": 73954, "epoch": 611} {"train_loss": -28.139862060546875, "global_step": 73955, "epoch": 611} {"train_loss": -28.339065551757812, "global_step": 73956, "epoch": 611} {"train_loss": -29.137420654296875, "global_step": 73957, "epoch": 611} {"train_loss": -28.76350975036621, "global_step": 73958, "epoch": 611} {"train_loss": -29.716766357421875, "global_step": 73959, "epoch": 611} {"train_loss": -29.17889404296875, "global_step": 73960, "epoch": 611} {"train_loss": -30.80105972290039, "global_step": 73961, "epoch": 611} {"train_loss": -29.997821807861328, "global_step": 73962, "epoch": 611} {"train_loss": -30.8001766204834, "global_step": 73963, "epoch": 611} {"train_loss": -30.5406494140625, "global_step": 73964, "epoch": 611} {"train_loss": -31.335010528564453, "global_step": 73965, "epoch": 611} {"train_loss": -31.151874542236328, "global_step": 73966, "epoch": 611} {"train_loss": -31.305383682250977, "global_step": 73967, "epoch": 611} {"train_loss": -32.66892623901367, "global_step": 73968, "epoch": 611} {"train_loss": -32.30110168457031, "global_step": 73969, "epoch": 611} {"train_loss": -30.831037521362305, "global_step": 73970, "epoch": 611} {"train_loss": -31.656713485717773, "global_step": 73971, "epoch": 611} {"train_loss": -32.528141021728516, "global_step": 73972, "epoch": 611} {"train_loss": -32.799381256103516, "global_step": 73973, "epoch": 611} {"train_loss": -31.839231491088867, "global_step": 73974, "epoch": 611} {"train_loss": -32.795501708984375, "global_step": 73975, "epoch": 611} {"train_loss": -33.11235427856445, "global_step": 73976, "epoch": 611} {"train_loss": -33.09214401245117, "global_step": 73977, "epoch": 611} {"train_loss": -32.562225341796875, "global_step": 73978, "epoch": 611} {"train_loss": -33.21167755126953, "global_step": 73979, "epoch": 611} {"train_loss": -33.7092399597168, "global_step": 73980, "epoch": 611} {"train_loss": -32.62541198730469, "global_step": 73981, "epoch": 611} {"train_loss": -33.26534652709961, "global_step": 73982, "epoch": 611} {"train_loss": -32.21749496459961, "global_step": 73983, "epoch": 611} {"train_loss": -32.24898910522461, "global_step": 73984, "epoch": 611} {"train_loss": -33.62014389038086, "global_step": 73985, "epoch": 611} {"train_loss": -33.976051330566406, "global_step": 73986, "epoch": 611} {"train_loss": -34.53214645385742, "global_step": 73987, "epoch": 611} {"train_loss": -33.569618225097656, "global_step": 73988, "epoch": 611} {"train_loss": -33.55419158935547, "global_step": 73989, "epoch": 611} {"train_loss": -34.5369987487793, "global_step": 73990, "epoch": 611} {"train_loss": -34.332393646240234, "global_step": 73991, "epoch": 611} {"train_loss": -34.58925247192383, "global_step": 73992, "epoch": 611} {"train_loss": -34.50654983520508, "global_step": 73993, "epoch": 611} {"train_loss": -34.8170280456543, "global_step": 73994, "epoch": 611} {"train_loss": -34.627315521240234, "global_step": 73995, "epoch": 611} {"train_loss": -33.80579376220703, "global_step": 73996, "epoch": 611} {"train_loss": -34.52701187133789, "global_step": 73997, "epoch": 611} {"train_loss": -34.848690032958984, "global_step": 73998, "epoch": 611} {"train_loss": -33.85624313354492, "global_step": 73999, "epoch": 611} {"train_loss": -34.09312057495117, "global_step": 74000, "epoch": 611} {"train_loss": -34.56031799316406, "global_step": 74001, "epoch": 611} {"train_loss": -34.98951721191406, "global_step": 74002, "epoch": 611} {"train_loss": -34.315040588378906, "global_step": 74003, "epoch": 611} {"train_loss": -34.74058151245117, "global_step": 74004, "epoch": 611} {"train_loss": -34.779361724853516, "global_step": 74005, "epoch": 611} {"train_loss": -35.74802780151367, "global_step": 74006, "epoch": 611} {"train_loss": -35.18149948120117, "global_step": 74007, "epoch": 611} {"train_loss": -34.406005859375, "global_step": 74008, "epoch": 611} {"train_loss": -35.867645263671875, "global_step": 74009, "epoch": 611} {"train_loss": -35.693153381347656, "global_step": 74010, "epoch": 611} {"train_loss": -35.22703552246094, "global_step": 74011, "epoch": 611} {"train_loss": -35.11007308959961, "global_step": 74012, "epoch": 611} {"train_loss": -34.769195556640625, "global_step": 74013, "epoch": 611} {"train_loss": -35.71175765991211, "global_step": 74014, "epoch": 611} {"train_loss": -35.044742584228516, "global_step": 74015, "epoch": 611} {"train_loss": -35.197505950927734, "global_step": 74016, "epoch": 611} {"train_loss": -35.707881927490234, "global_step": 74017, "epoch": 611} {"train_loss": -35.27219772338867, "global_step": 74018, "epoch": 611} {"train_loss": -35.68647384643555, "global_step": 74019, "epoch": 611} {"train_loss": -33.91212463378906, "global_step": 74020, "epoch": 611} {"train_loss": -35.77347946166992, "global_step": 74021, "epoch": 611} {"train_loss": -36.11249923706055, "global_step": 74022, "epoch": 611} {"train_loss": -36.44841003417969, "global_step": 74023, "epoch": 611} {"train_loss": -35.62592315673828, "global_step": 74024, "epoch": 611} {"train_loss": -35.248443603515625, "global_step": 74025, "epoch": 611} {"train_loss": -35.32967758178711, "global_step": 74026, "epoch": 611} {"train_loss": -35.36811447143555, "global_step": 74027, "epoch": 611} {"train_loss": -34.5404052734375, "global_step": 74028, "epoch": 611} {"train_loss": -36.12354278564453, "global_step": 74029, "epoch": 611} {"train_loss": -35.04044723510742, "global_step": 74030, "epoch": 611} {"train_loss": -31.40899085998535, "global_step": 74031, "epoch": 611} {"train_loss": -35.58903884887695, "global_step": 74032, "epoch": 611} {"train_loss": -36.30245590209961, "global_step": 74033, "epoch": 611} {"train_loss": -34.09403610229492, "global_step": 74034, "epoch": 611} {"train_loss": -29.807727813720703, "global_step": 74035, "epoch": 611} {"train_loss": -29.976301193237305, "global_step": 74036, "epoch": 611} {"train_loss": -29.593921661376953, "global_step": 74037, "epoch": 611} {"train_loss": -29.5667724609375, "global_step": 74038, "epoch": 611} {"train_loss": -29.684051513671875, "global_step": 74039, "epoch": 611} {"train_loss": -30.537235260009766, "global_step": 74040, "epoch": 611} {"train_loss": -30.193567276000977, "global_step": 74041, "epoch": 611} {"train_loss": -30.652311325073242, "global_step": 74042, "epoch": 611} {"train_loss": -30.7311954498291, "global_step": 74043, "epoch": 611} {"train_loss": -30.79279136657715, "global_step": 74044, "epoch": 611} {"train_loss": -30.3768310546875, "global_step": 74045, "epoch": 611} {"train_loss": -30.80466079711914, "global_step": 74046, "epoch": 611} {"train_loss": -31.076995849609375, "global_step": 74047, "epoch": 611} {"train_loss": -31.08039665222168, "global_step": 74048, "epoch": 611} {"train_loss": -31.22283935546875, "global_step": 74049, "epoch": 611} {"train_loss": -31.59112548828125, "global_step": 74050, "epoch": 611} {"train_loss": -31.960286487232555, "global_step": 74051, "epoch": 611, "val_loss": 2641047.0} {"train_loss": -31.811786651611328, "global_step": 74052, "epoch": 612} {"train_loss": -31.725950241088867, "global_step": 74053, "epoch": 612} {"train_loss": -32.15804672241211, "global_step": 74054, "epoch": 612} {"train_loss": -32.00749588012695, "global_step": 74055, "epoch": 612} {"train_loss": -32.3951416015625, "global_step": 74056, "epoch": 612} {"train_loss": -32.600799560546875, "global_step": 74057, "epoch": 612} {"train_loss": -32.478694915771484, "global_step": 74058, "epoch": 612} {"train_loss": -32.70819091796875, "global_step": 74059, "epoch": 612} {"train_loss": -33.46466064453125, "global_step": 74060, "epoch": 612} {"train_loss": -33.14780044555664, "global_step": 74061, "epoch": 612} {"train_loss": -33.5346794128418, "global_step": 74062, "epoch": 612} {"train_loss": -33.0718879699707, "global_step": 74063, "epoch": 612} {"train_loss": -32.649593353271484, "global_step": 74064, "epoch": 612} {"train_loss": -30.755817413330078, "global_step": 74065, "epoch": 612} {"train_loss": -28.245319366455078, "global_step": 74066, "epoch": 612} {"train_loss": -28.940465927124023, "global_step": 74067, "epoch": 612} {"train_loss": -34.30833053588867, "global_step": 74068, "epoch": 612} {"train_loss": -29.809961318969727, "global_step": 74069, "epoch": 612} {"train_loss": -33.651123046875, "global_step": 74070, "epoch": 612} {"train_loss": -32.4248161315918, "global_step": 74071, "epoch": 612} {"train_loss": -33.03957748413086, "global_step": 74072, "epoch": 612} {"train_loss": -33.07715606689453, "global_step": 74073, "epoch": 612} {"train_loss": -33.75476837158203, "global_step": 74074, "epoch": 612} {"train_loss": -33.0688362121582, "global_step": 74075, "epoch": 612} {"train_loss": -34.63126754760742, "global_step": 74076, "epoch": 612} {"train_loss": -33.536373138427734, "global_step": 74077, "epoch": 612} {"train_loss": -33.37415313720703, "global_step": 74078, "epoch": 612} {"train_loss": -33.589385986328125, "global_step": 74079, "epoch": 612} {"train_loss": -33.383235931396484, "global_step": 74080, "epoch": 612} {"train_loss": -34.141178131103516, "global_step": 74081, "epoch": 612} {"train_loss": -33.17863845825195, "global_step": 74082, "epoch": 612} {"train_loss": -25.154354095458984, "global_step": 74083, "epoch": 612} {"train_loss": -13.116004943847656, "global_step": 74084, "epoch": 612} {"train_loss": -24.181447982788086, "global_step": 74085, "epoch": 612} {"train_loss": -31.865942001342773, "global_step": 74086, "epoch": 612} {"train_loss": -23.886375427246094, "global_step": 74087, "epoch": 612} {"train_loss": -33.92714309692383, "global_step": 74088, "epoch": 612} {"train_loss": -28.52138328552246, "global_step": 74089, "epoch": 612} {"train_loss": -32.762969970703125, "global_step": 74090, "epoch": 612} {"train_loss": -33.15031051635742, "global_step": 74091, "epoch": 612} {"train_loss": -31.743942260742188, "global_step": 74092, "epoch": 612} {"train_loss": -33.922481536865234, "global_step": 74093, "epoch": 612} {"train_loss": -33.35393524169922, "global_step": 74094, "epoch": 612} {"train_loss": -32.13593673706055, "global_step": 74095, "epoch": 612} {"train_loss": -33.782493591308594, "global_step": 74096, "epoch": 612} {"train_loss": -34.01089096069336, "global_step": 74097, "epoch": 612} {"train_loss": -32.99154281616211, "global_step": 74098, "epoch": 612} {"train_loss": -33.244384765625, "global_step": 74099, "epoch": 612} {"train_loss": -34.2382698059082, "global_step": 74100, "epoch": 612} {"train_loss": -34.23421096801758, "global_step": 74101, "epoch": 612} {"train_loss": -33.95856857299805, "global_step": 74102, "epoch": 612} {"train_loss": -32.872310638427734, "global_step": 74103, "epoch": 612} {"train_loss": -33.71657943725586, "global_step": 74104, "epoch": 612} {"train_loss": -34.0838623046875, "global_step": 74105, "epoch": 612} {"train_loss": -34.28947067260742, "global_step": 74106, "epoch": 612} {"train_loss": -33.50434494018555, "global_step": 74107, "epoch": 612} {"train_loss": -33.440269470214844, "global_step": 74108, "epoch": 612} {"train_loss": -33.81734848022461, "global_step": 74109, "epoch": 612} {"train_loss": -33.19646453857422, "global_step": 74110, "epoch": 612} {"train_loss": -32.36153793334961, "global_step": 74111, "epoch": 612} {"train_loss": -34.47737121582031, "global_step": 74112, "epoch": 612} {"train_loss": -33.7543830871582, "global_step": 74113, "epoch": 612} {"train_loss": -33.45168685913086, "global_step": 74114, "epoch": 612} {"train_loss": -34.12622833251953, "global_step": 74115, "epoch": 612} {"train_loss": -34.42014694213867, "global_step": 74116, "epoch": 612} {"train_loss": -33.745853424072266, "global_step": 74117, "epoch": 612} {"train_loss": -34.30499267578125, "global_step": 74118, "epoch": 612} {"train_loss": -34.949031829833984, "global_step": 74119, "epoch": 612} {"train_loss": -33.08943557739258, "global_step": 74120, "epoch": 612} {"train_loss": -31.35428237915039, "global_step": 74121, "epoch": 612} {"train_loss": -18.943328857421875, "global_step": 74122, "epoch": 612} {"train_loss": 2.525717258453369, "global_step": 74123, "epoch": 612} {"train_loss": -25.03617286682129, "global_step": 74124, "epoch": 612} {"train_loss": -23.11379051208496, "global_step": 74125, "epoch": 612} {"train_loss": -32.208534240722656, "global_step": 74126, "epoch": 612} {"train_loss": -23.452077865600586, "global_step": 74127, "epoch": 612} {"train_loss": -33.4785041809082, "global_step": 74128, "epoch": 612} {"train_loss": -29.167438507080078, "global_step": 74129, "epoch": 612} {"train_loss": -29.532629013061523, "global_step": 74130, "epoch": 612} {"train_loss": -33.704097747802734, "global_step": 74131, "epoch": 612} {"train_loss": -30.8475399017334, "global_step": 74132, "epoch": 612} {"train_loss": -31.06673240661621, "global_step": 74133, "epoch": 612} {"train_loss": -33.64095687866211, "global_step": 74134, "epoch": 612} {"train_loss": -32.738319396972656, "global_step": 74135, "epoch": 612} {"train_loss": -31.034778594970703, "global_step": 74136, "epoch": 612} {"train_loss": -32.672977447509766, "global_step": 74137, "epoch": 612} {"train_loss": -33.986995697021484, "global_step": 74138, "epoch": 612} {"train_loss": -32.98521041870117, "global_step": 74139, "epoch": 612} {"train_loss": -32.629695892333984, "global_step": 74140, "epoch": 612} {"train_loss": -33.204620361328125, "global_step": 74141, "epoch": 612} {"train_loss": -33.5339469909668, "global_step": 74142, "epoch": 612} {"train_loss": -33.38102722167969, "global_step": 74143, "epoch": 612} {"train_loss": -33.540992736816406, "global_step": 74144, "epoch": 612} {"train_loss": -32.88303756713867, "global_step": 74145, "epoch": 612} {"train_loss": -32.83161544799805, "global_step": 74146, "epoch": 612} {"train_loss": -33.94892120361328, "global_step": 74147, "epoch": 612} {"train_loss": -34.35195541381836, "global_step": 74148, "epoch": 612} {"train_loss": -33.63767623901367, "global_step": 74149, "epoch": 612} {"train_loss": -33.5335693359375, "global_step": 74150, "epoch": 612} {"train_loss": -33.847808837890625, "global_step": 74151, "epoch": 612} {"train_loss": -33.978248596191406, "global_step": 74152, "epoch": 612} {"train_loss": -33.743125915527344, "global_step": 74153, "epoch": 612} {"train_loss": -34.1887092590332, "global_step": 74154, "epoch": 612} {"train_loss": -34.37749481201172, "global_step": 74155, "epoch": 612} {"train_loss": -34.03410720825195, "global_step": 74156, "epoch": 612} {"train_loss": -33.610042572021484, "global_step": 74157, "epoch": 612} {"train_loss": -34.55247116088867, "global_step": 74158, "epoch": 612} {"train_loss": -34.267391204833984, "global_step": 74159, "epoch": 612} {"train_loss": -33.59835433959961, "global_step": 74160, "epoch": 612} {"train_loss": -34.749263763427734, "global_step": 74161, "epoch": 612} {"train_loss": -34.20862579345703, "global_step": 74162, "epoch": 612} {"train_loss": -34.48262405395508, "global_step": 74163, "epoch": 612} {"train_loss": -34.6173095703125, "global_step": 74164, "epoch": 612} {"train_loss": -34.05046081542969, "global_step": 74165, "epoch": 612} {"train_loss": -34.3867301940918, "global_step": 74166, "epoch": 612} {"train_loss": -31.69099998474121, "global_step": 74167, "epoch": 612} {"train_loss": -28.4580135345459, "global_step": 74168, "epoch": 612} {"train_loss": -28.927099227905273, "global_step": 74169, "epoch": 612} {"train_loss": -34.058509826660156, "global_step": 74170, "epoch": 612} {"train_loss": -31.998035430908203, "global_step": 74171, "epoch": 612} {"train_loss": -31.99832458732542, "global_step": 74172, "epoch": 612, "val_loss": 2656456.25} {"train_loss": -33.77381134033203, "global_step": 74173, "epoch": 613} {"train_loss": -34.2032585144043, "global_step": 74174, "epoch": 613} {"train_loss": -34.155033111572266, "global_step": 74175, "epoch": 613} {"train_loss": -34.62321853637695, "global_step": 74176, "epoch": 613} {"train_loss": -34.378108978271484, "global_step": 74177, "epoch": 613} {"train_loss": -34.761043548583984, "global_step": 74178, "epoch": 613} {"train_loss": -33.730140686035156, "global_step": 74179, "epoch": 613} {"train_loss": -34.21625900268555, "global_step": 74180, "epoch": 613} {"train_loss": -35.0238037109375, "global_step": 74181, "epoch": 613} {"train_loss": -34.61473083496094, "global_step": 74182, "epoch": 613} {"train_loss": -34.69493103027344, "global_step": 74183, "epoch": 613} {"train_loss": -35.172237396240234, "global_step": 74184, "epoch": 613} {"train_loss": -34.59909439086914, "global_step": 74185, "epoch": 613} {"train_loss": -34.71779251098633, "global_step": 74186, "epoch": 613} {"train_loss": -34.9987678527832, "global_step": 74187, "epoch": 613} {"train_loss": -33.77964782714844, "global_step": 74188, "epoch": 613} {"train_loss": -34.76716232299805, "global_step": 74189, "epoch": 613} {"train_loss": -34.75474548339844, "global_step": 74190, "epoch": 613} {"train_loss": -34.74226760864258, "global_step": 74191, "epoch": 613} {"train_loss": -34.46537399291992, "global_step": 74192, "epoch": 613} {"train_loss": -34.614681243896484, "global_step": 74193, "epoch": 613} {"train_loss": -34.798439025878906, "global_step": 74194, "epoch": 613} {"train_loss": -34.315826416015625, "global_step": 74195, "epoch": 613} {"train_loss": -34.141963958740234, "global_step": 74196, "epoch": 613} {"train_loss": -34.2619743347168, "global_step": 74197, "epoch": 613} {"train_loss": -35.56130599975586, "global_step": 74198, "epoch": 613} {"train_loss": -35.1318359375, "global_step": 74199, "epoch": 613} {"train_loss": -34.365596771240234, "global_step": 74200, "epoch": 613} {"train_loss": -35.29353332519531, "global_step": 74201, "epoch": 613} {"train_loss": -35.192962646484375, "global_step": 74202, "epoch": 613} {"train_loss": -34.50971221923828, "global_step": 74203, "epoch": 613} {"train_loss": -34.110416412353516, "global_step": 74204, "epoch": 613} {"train_loss": -35.6978874206543, "global_step": 74205, "epoch": 613} {"train_loss": -34.8492546081543, "global_step": 74206, "epoch": 613} {"train_loss": -34.931636810302734, "global_step": 74207, "epoch": 613} {"train_loss": -34.91786575317383, "global_step": 74208, "epoch": 613} {"train_loss": -33.680328369140625, "global_step": 74209, "epoch": 613} {"train_loss": -30.33699607849121, "global_step": 74210, "epoch": 613} {"train_loss": -18.27042007446289, "global_step": 74211, "epoch": 613} {"train_loss": -6.20632266998291, "global_step": 74212, "epoch": 613} {"train_loss": -28.162805557250977, "global_step": 74213, "epoch": 613} {"train_loss": -28.90987205505371, "global_step": 74214, "epoch": 613} {"train_loss": -29.573368072509766, "global_step": 74215, "epoch": 613} {"train_loss": -27.299957275390625, "global_step": 74216, "epoch": 613} {"train_loss": -33.70479965209961, "global_step": 74217, "epoch": 613} {"train_loss": -27.8999080657959, "global_step": 74218, "epoch": 613} {"train_loss": -33.23844528198242, "global_step": 74219, "epoch": 613} {"train_loss": -32.72598648071289, "global_step": 74220, "epoch": 613} {"train_loss": -30.121984481811523, "global_step": 74221, "epoch": 613} {"train_loss": -34.461509704589844, "global_step": 74222, "epoch": 613} {"train_loss": -32.54582595825195, "global_step": 74223, "epoch": 613} {"train_loss": -31.94217300415039, "global_step": 74224, "epoch": 613} {"train_loss": -32.891334533691406, "global_step": 74225, "epoch": 613} {"train_loss": -33.780391693115234, "global_step": 74226, "epoch": 613} {"train_loss": -33.19377517700195, "global_step": 74227, "epoch": 613} {"train_loss": -32.556495666503906, "global_step": 74228, "epoch": 613} {"train_loss": -34.129608154296875, "global_step": 74229, "epoch": 613} {"train_loss": -34.57949447631836, "global_step": 74230, "epoch": 613} {"train_loss": -33.6320915222168, "global_step": 74231, "epoch": 613} {"train_loss": -32.97574996948242, "global_step": 74232, "epoch": 613} {"train_loss": -34.152442932128906, "global_step": 74233, "epoch": 613} {"train_loss": -34.37069320678711, "global_step": 74234, "epoch": 613} {"train_loss": -34.58176803588867, "global_step": 74235, "epoch": 613} {"train_loss": -34.196617126464844, "global_step": 74236, "epoch": 613} {"train_loss": -33.88888168334961, "global_step": 74237, "epoch": 613} {"train_loss": -34.20927047729492, "global_step": 74238, "epoch": 613} {"train_loss": -34.464759826660156, "global_step": 74239, "epoch": 613} {"train_loss": -34.74507522583008, "global_step": 74240, "epoch": 613} {"train_loss": -34.69189453125, "global_step": 74241, "epoch": 613} {"train_loss": -34.39876937866211, "global_step": 74242, "epoch": 613} {"train_loss": -34.62049865722656, "global_step": 74243, "epoch": 613} {"train_loss": -34.90920639038086, "global_step": 74244, "epoch": 613} {"train_loss": -34.428524017333984, "global_step": 74245, "epoch": 613} {"train_loss": -34.8233642578125, "global_step": 74246, "epoch": 613} {"train_loss": -34.773048400878906, "global_step": 74247, "epoch": 613} {"train_loss": -34.73109817504883, "global_step": 74248, "epoch": 613} {"train_loss": -35.156211853027344, "global_step": 74249, "epoch": 613} {"train_loss": -34.91486358642578, "global_step": 74250, "epoch": 613} {"train_loss": -35.34153366088867, "global_step": 74251, "epoch": 613} {"train_loss": -34.39449691772461, "global_step": 74252, "epoch": 613} {"train_loss": -35.300811767578125, "global_step": 74253, "epoch": 613} {"train_loss": -35.11591339111328, "global_step": 74254, "epoch": 613} {"train_loss": -34.89829635620117, "global_step": 74255, "epoch": 613} {"train_loss": -35.057594299316406, "global_step": 74256, "epoch": 613} {"train_loss": -35.43851089477539, "global_step": 74257, "epoch": 613} {"train_loss": -35.35407638549805, "global_step": 74258, "epoch": 613} {"train_loss": -33.70526123046875, "global_step": 74259, "epoch": 613} {"train_loss": -35.641292572021484, "global_step": 74260, "epoch": 613} {"train_loss": -35.302738189697266, "global_step": 74261, "epoch": 613} {"train_loss": -35.24956130981445, "global_step": 74262, "epoch": 613} {"train_loss": -35.59895706176758, "global_step": 74263, "epoch": 613} {"train_loss": -35.72366714477539, "global_step": 74264, "epoch": 613} {"train_loss": -35.7760009765625, "global_step": 74265, "epoch": 613} {"train_loss": -35.95797348022461, "global_step": 74266, "epoch": 613} {"train_loss": -35.8708610534668, "global_step": 74267, "epoch": 613} {"train_loss": -35.494873046875, "global_step": 74268, "epoch": 613} {"train_loss": -35.69572830200195, "global_step": 74269, "epoch": 613} {"train_loss": -35.53702163696289, "global_step": 74270, "epoch": 613} {"train_loss": -34.028228759765625, "global_step": 74271, "epoch": 613} {"train_loss": -36.00559997558594, "global_step": 74272, "epoch": 613} {"train_loss": -36.3790397644043, "global_step": 74273, "epoch": 613} {"train_loss": -35.658203125, "global_step": 74274, "epoch": 613} {"train_loss": -36.25123596191406, "global_step": 74275, "epoch": 613} {"train_loss": -35.37101745605469, "global_step": 74276, "epoch": 613} {"train_loss": -35.002586364746094, "global_step": 74277, "epoch": 613} {"train_loss": -35.49286651611328, "global_step": 74278, "epoch": 613} {"train_loss": -35.578853607177734, "global_step": 74279, "epoch": 613} {"train_loss": -35.894073486328125, "global_step": 74280, "epoch": 613} {"train_loss": -35.8052864074707, "global_step": 74281, "epoch": 613} {"train_loss": -35.70510482788086, "global_step": 74282, "epoch": 613} {"train_loss": -36.17653274536133, "global_step": 74283, "epoch": 613} {"train_loss": -35.89256286621094, "global_step": 74284, "epoch": 613} {"train_loss": -35.140018463134766, "global_step": 74285, "epoch": 613} {"train_loss": -35.875953674316406, "global_step": 74286, "epoch": 613} {"train_loss": -35.637203216552734, "global_step": 74287, "epoch": 613} {"train_loss": -35.84496307373047, "global_step": 74288, "epoch": 613} {"train_loss": -35.973388671875, "global_step": 74289, "epoch": 613} {"train_loss": -32.75385665893555, "global_step": 74290, "epoch": 613} {"train_loss": -36.024681091308594, "global_step": 74291, "epoch": 613} {"train_loss": -35.0263557434082, "global_step": 74292, "epoch": 613} {"train_loss": -34.041065460394236, "global_step": 74293, "epoch": 613, "val_loss": 2646214.25} {"train_loss": -36.43905258178711, "global_step": 74294, "epoch": 614} {"train_loss": -36.2819938659668, "global_step": 74295, "epoch": 614} {"train_loss": -35.92151641845703, "global_step": 74296, "epoch": 614} {"train_loss": -35.895565032958984, "global_step": 74297, "epoch": 614} {"train_loss": -35.67348861694336, "global_step": 74298, "epoch": 614} {"train_loss": -34.81653594970703, "global_step": 74299, "epoch": 614} {"train_loss": -35.51652145385742, "global_step": 74300, "epoch": 614} {"train_loss": -35.915279388427734, "global_step": 74301, "epoch": 614} {"train_loss": -35.855133056640625, "global_step": 74302, "epoch": 614} {"train_loss": -35.41781234741211, "global_step": 74303, "epoch": 614} {"train_loss": -35.494564056396484, "global_step": 74304, "epoch": 614} {"train_loss": -36.13538360595703, "global_step": 74305, "epoch": 614} {"train_loss": -35.544944763183594, "global_step": 74306, "epoch": 614} {"train_loss": -35.86311721801758, "global_step": 74307, "epoch": 614} {"train_loss": -36.51459884643555, "global_step": 74308, "epoch": 614} {"train_loss": -35.92263412475586, "global_step": 74309, "epoch": 614} {"train_loss": -35.672115325927734, "global_step": 74310, "epoch": 614} {"train_loss": -35.66904830932617, "global_step": 74311, "epoch": 614} {"train_loss": -36.69155502319336, "global_step": 74312, "epoch": 614} {"train_loss": -34.943477630615234, "global_step": 74313, "epoch": 614} {"train_loss": -36.010433197021484, "global_step": 74314, "epoch": 614} {"train_loss": -36.089942932128906, "global_step": 74315, "epoch": 614} {"train_loss": -36.2450065612793, "global_step": 74316, "epoch": 614} {"train_loss": -36.246761322021484, "global_step": 74317, "epoch": 614} {"train_loss": -36.64509963989258, "global_step": 74318, "epoch": 614} {"train_loss": -36.5932502746582, "global_step": 74319, "epoch": 614} {"train_loss": -35.59138107299805, "global_step": 74320, "epoch": 614} {"train_loss": -36.555213928222656, "global_step": 74321, "epoch": 614} {"train_loss": -36.312679290771484, "global_step": 74322, "epoch": 614} {"train_loss": -36.47005844116211, "global_step": 74323, "epoch": 614} {"train_loss": -36.30988311767578, "global_step": 74324, "epoch": 614} {"train_loss": -36.783302307128906, "global_step": 74325, "epoch": 614} {"train_loss": -36.872215270996094, "global_step": 74326, "epoch": 614} {"train_loss": -36.74869918823242, "global_step": 74327, "epoch": 614} {"train_loss": -36.357330322265625, "global_step": 74328, "epoch": 614} {"train_loss": -34.70650863647461, "global_step": 74329, "epoch": 614} {"train_loss": -34.900245666503906, "global_step": 74330, "epoch": 614} {"train_loss": -35.753387451171875, "global_step": 74331, "epoch": 614} {"train_loss": -35.54047775268555, "global_step": 74332, "epoch": 614} {"train_loss": -36.088348388671875, "global_step": 74333, "epoch": 614} {"train_loss": -36.73785400390625, "global_step": 74334, "epoch": 614} {"train_loss": -36.65656661987305, "global_step": 74335, "epoch": 614} {"train_loss": -36.38474655151367, "global_step": 74336, "epoch": 614} {"train_loss": -36.872222900390625, "global_step": 74337, "epoch": 614} {"train_loss": -36.33588409423828, "global_step": 74338, "epoch": 614} {"train_loss": -37.09879684448242, "global_step": 74339, "epoch": 614} {"train_loss": -37.06846618652344, "global_step": 74340, "epoch": 614} {"train_loss": -35.91915512084961, "global_step": 74341, "epoch": 614} {"train_loss": -36.424102783203125, "global_step": 74342, "epoch": 614} {"train_loss": -36.29560852050781, "global_step": 74343, "epoch": 614} {"train_loss": -36.268348693847656, "global_step": 74344, "epoch": 614} {"train_loss": -36.88147735595703, "global_step": 74345, "epoch": 614} {"train_loss": -35.28081130981445, "global_step": 74346, "epoch": 614} {"train_loss": -35.23842239379883, "global_step": 74347, "epoch": 614} {"train_loss": -35.55717849731445, "global_step": 74348, "epoch": 614} {"train_loss": -35.811405181884766, "global_step": 74349, "epoch": 614} {"train_loss": -35.07761764526367, "global_step": 74350, "epoch": 614} {"train_loss": -34.803871154785156, "global_step": 74351, "epoch": 614} {"train_loss": -35.16885757446289, "global_step": 74352, "epoch": 614} {"train_loss": -34.90032958984375, "global_step": 74353, "epoch": 614} {"train_loss": -33.667633056640625, "global_step": 74354, "epoch": 614} {"train_loss": -35.83271408081055, "global_step": 74355, "epoch": 614} {"train_loss": -35.857704162597656, "global_step": 74356, "epoch": 614} {"train_loss": -36.50373458862305, "global_step": 74357, "epoch": 614} {"train_loss": -36.16303253173828, "global_step": 74358, "epoch": 614} {"train_loss": -34.16202926635742, "global_step": 74359, "epoch": 614} {"train_loss": -36.20383834838867, "global_step": 74360, "epoch": 614} {"train_loss": -35.603729248046875, "global_step": 74361, "epoch": 614} {"train_loss": -36.2803955078125, "global_step": 74362, "epoch": 614} {"train_loss": -35.88736343383789, "global_step": 74363, "epoch": 614} {"train_loss": -36.10825729370117, "global_step": 74364, "epoch": 614} {"train_loss": -36.715858459472656, "global_step": 74365, "epoch": 614} {"train_loss": -36.41425323486328, "global_step": 74366, "epoch": 614} {"train_loss": -35.92619705200195, "global_step": 74367, "epoch": 614} {"train_loss": -36.37490463256836, "global_step": 74368, "epoch": 614} {"train_loss": -36.49509811401367, "global_step": 74369, "epoch": 614} {"train_loss": -36.158329010009766, "global_step": 74370, "epoch": 614} {"train_loss": -35.989933013916016, "global_step": 74371, "epoch": 614} {"train_loss": -36.173011779785156, "global_step": 74372, "epoch": 614} {"train_loss": -35.94181442260742, "global_step": 74373, "epoch": 614} {"train_loss": -36.86658477783203, "global_step": 74374, "epoch": 614} {"train_loss": -36.155738830566406, "global_step": 74375, "epoch": 614} {"train_loss": -36.106563568115234, "global_step": 74376, "epoch": 614} {"train_loss": -36.51548385620117, "global_step": 74377, "epoch": 614} {"train_loss": -36.8744010925293, "global_step": 74378, "epoch": 614} {"train_loss": -36.58392333984375, "global_step": 74379, "epoch": 614} {"train_loss": -36.3294563293457, "global_step": 74380, "epoch": 614} {"train_loss": -36.783355712890625, "global_step": 74381, "epoch": 614} {"train_loss": -36.19218826293945, "global_step": 74382, "epoch": 614} {"train_loss": -35.11042404174805, "global_step": 74383, "epoch": 614} {"train_loss": -35.34174728393555, "global_step": 74384, "epoch": 614} {"train_loss": -35.39287567138672, "global_step": 74385, "epoch": 614} {"train_loss": -36.111289978027344, "global_step": 74386, "epoch": 614} {"train_loss": -35.40885543823242, "global_step": 74387, "epoch": 614} {"train_loss": -36.83535385131836, "global_step": 74388, "epoch": 614} {"train_loss": -35.282711029052734, "global_step": 74389, "epoch": 614} {"train_loss": -35.677711486816406, "global_step": 74390, "epoch": 614} {"train_loss": -35.41706466674805, "global_step": 74391, "epoch": 614} {"train_loss": -36.04257583618164, "global_step": 74392, "epoch": 614} {"train_loss": -35.789154052734375, "global_step": 74393, "epoch": 614} {"train_loss": -35.55986785888672, "global_step": 74394, "epoch": 614} {"train_loss": -36.22170639038086, "global_step": 74395, "epoch": 614} {"train_loss": -35.38433837890625, "global_step": 74396, "epoch": 614} {"train_loss": -35.695858001708984, "global_step": 74397, "epoch": 614} {"train_loss": -36.024696350097656, "global_step": 74398, "epoch": 614} {"train_loss": -34.15705490112305, "global_step": 74399, "epoch": 614} {"train_loss": -35.9548454284668, "global_step": 74400, "epoch": 614} {"train_loss": -35.861541748046875, "global_step": 74401, "epoch": 614} {"train_loss": -33.79974365234375, "global_step": 74402, "epoch": 614} {"train_loss": -35.80263900756836, "global_step": 74403, "epoch": 614} {"train_loss": -36.32332992553711, "global_step": 74404, "epoch": 614} {"train_loss": -35.3452033996582, "global_step": 74405, "epoch": 614} {"train_loss": -35.33943557739258, "global_step": 74406, "epoch": 614} {"train_loss": -35.11646270751953, "global_step": 74407, "epoch": 614} {"train_loss": -35.589046478271484, "global_step": 74408, "epoch": 614} {"train_loss": -35.763301849365234, "global_step": 74409, "epoch": 614} {"train_loss": -36.5682258605957, "global_step": 74410, "epoch": 614} {"train_loss": -35.0971565246582, "global_step": 74411, "epoch": 614} {"train_loss": -34.281822204589844, "global_step": 74412, "epoch": 614} {"train_loss": -33.99225997924805, "global_step": 74413, "epoch": 614} {"train_loss": -35.88639781100691, "global_step": 74414, "epoch": 614, "val_loss": 2716326.25} {"train_loss": -35.5296630859375, "global_step": 74415, "epoch": 615} {"train_loss": -35.0427131652832, "global_step": 74416, "epoch": 615} {"train_loss": -36.79309844970703, "global_step": 74417, "epoch": 615} {"train_loss": -36.725250244140625, "global_step": 74418, "epoch": 615} {"train_loss": -34.76154708862305, "global_step": 74419, "epoch": 615} {"train_loss": -36.00553894042969, "global_step": 74420, "epoch": 615} {"train_loss": -35.723365783691406, "global_step": 74421, "epoch": 615} {"train_loss": -35.99028396606445, "global_step": 74422, "epoch": 615} {"train_loss": -35.49142074584961, "global_step": 74423, "epoch": 615} {"train_loss": -36.22431945800781, "global_step": 74424, "epoch": 615} {"train_loss": -37.154876708984375, "global_step": 74425, "epoch": 615} {"train_loss": -36.4629020690918, "global_step": 74426, "epoch": 615} {"train_loss": -35.50685501098633, "global_step": 74427, "epoch": 615} {"train_loss": -36.28982162475586, "global_step": 74428, "epoch": 615} {"train_loss": -35.6761589050293, "global_step": 74429, "epoch": 615} {"train_loss": -36.49870681762695, "global_step": 74430, "epoch": 615} {"train_loss": -36.52962875366211, "global_step": 74431, "epoch": 615} {"train_loss": -36.61007308959961, "global_step": 74432, "epoch": 615} {"train_loss": -36.458251953125, "global_step": 74433, "epoch": 615} {"train_loss": -36.67928695678711, "global_step": 74434, "epoch": 615} {"train_loss": -35.89341735839844, "global_step": 74435, "epoch": 615} {"train_loss": -36.65132141113281, "global_step": 74436, "epoch": 615} {"train_loss": -36.77097702026367, "global_step": 74437, "epoch": 615} {"train_loss": -35.783843994140625, "global_step": 74438, "epoch": 615} {"train_loss": -36.396995544433594, "global_step": 74439, "epoch": 615} {"train_loss": -36.3138542175293, "global_step": 74440, "epoch": 615} {"train_loss": -35.444618225097656, "global_step": 74441, "epoch": 615} {"train_loss": -36.7409782409668, "global_step": 74442, "epoch": 615} {"train_loss": -36.13434600830078, "global_step": 74443, "epoch": 615} {"train_loss": -36.33241653442383, "global_step": 74444, "epoch": 615} {"train_loss": -36.96399688720703, "global_step": 74445, "epoch": 615} {"train_loss": -35.8087272644043, "global_step": 74446, "epoch": 615} {"train_loss": -36.37716293334961, "global_step": 74447, "epoch": 615} {"train_loss": -36.2893180847168, "global_step": 74448, "epoch": 615} {"train_loss": -35.831886291503906, "global_step": 74449, "epoch": 615} {"train_loss": -35.821041107177734, "global_step": 74450, "epoch": 615} {"train_loss": -36.5023078918457, "global_step": 74451, "epoch": 615} {"train_loss": -36.41303634643555, "global_step": 74452, "epoch": 615} {"train_loss": -36.78178787231445, "global_step": 74453, "epoch": 615} {"train_loss": -36.703392028808594, "global_step": 74454, "epoch": 615} {"train_loss": -36.0844841003418, "global_step": 74455, "epoch": 615} {"train_loss": -36.4739875793457, "global_step": 74456, "epoch": 615} {"train_loss": -35.4621467590332, "global_step": 74457, "epoch": 615} {"train_loss": -35.08451843261719, "global_step": 74458, "epoch": 615} {"train_loss": -35.549259185791016, "global_step": 74459, "epoch": 615} {"train_loss": -36.0621337890625, "global_step": 74460, "epoch": 615} {"train_loss": -35.035308837890625, "global_step": 74461, "epoch": 615} {"train_loss": -36.21357345581055, "global_step": 74462, "epoch": 615} {"train_loss": -36.94279098510742, "global_step": 74463, "epoch": 615} {"train_loss": -35.5232048034668, "global_step": 74464, "epoch": 615} {"train_loss": -36.155784606933594, "global_step": 74465, "epoch": 615} {"train_loss": -36.14570617675781, "global_step": 74466, "epoch": 615} {"train_loss": -35.65289306640625, "global_step": 74467, "epoch": 615} {"train_loss": -37.081336975097656, "global_step": 74468, "epoch": 615} {"train_loss": -35.8617057800293, "global_step": 74469, "epoch": 615} {"train_loss": -34.87458419799805, "global_step": 74470, "epoch": 615} {"train_loss": -36.74686813354492, "global_step": 74471, "epoch": 615} {"train_loss": -36.282405853271484, "global_step": 74472, "epoch": 615} {"train_loss": -36.853267669677734, "global_step": 74473, "epoch": 615} {"train_loss": -36.60886764526367, "global_step": 74474, "epoch": 615} {"train_loss": -36.29378890991211, "global_step": 74475, "epoch": 615} {"train_loss": -36.215919494628906, "global_step": 74476, "epoch": 615} {"train_loss": -35.79212951660156, "global_step": 74477, "epoch": 615} {"train_loss": -36.50907516479492, "global_step": 74478, "epoch": 615} {"train_loss": -36.48698806762695, "global_step": 74479, "epoch": 615} {"train_loss": -36.525875091552734, "global_step": 74480, "epoch": 615} {"train_loss": -36.16737747192383, "global_step": 74481, "epoch": 615} {"train_loss": -36.306678771972656, "global_step": 74482, "epoch": 615} {"train_loss": -36.30265426635742, "global_step": 74483, "epoch": 615} {"train_loss": -36.462005615234375, "global_step": 74484, "epoch": 615} {"train_loss": -35.8879508972168, "global_step": 74485, "epoch": 615} {"train_loss": -36.664302825927734, "global_step": 74486, "epoch": 615} {"train_loss": -37.18593978881836, "global_step": 74487, "epoch": 615} {"train_loss": -37.0877685546875, "global_step": 74488, "epoch": 615} {"train_loss": -36.47166442871094, "global_step": 74489, "epoch": 615} {"train_loss": -37.17271041870117, "global_step": 74490, "epoch": 615} {"train_loss": -36.063636779785156, "global_step": 74491, "epoch": 615} {"train_loss": -35.31074905395508, "global_step": 74492, "epoch": 615} {"train_loss": -35.38701248168945, "global_step": 74493, "epoch": 615} {"train_loss": -33.924163818359375, "global_step": 74494, "epoch": 615} {"train_loss": -35.39490509033203, "global_step": 74495, "epoch": 615} {"train_loss": -35.95650863647461, "global_step": 74496, "epoch": 615} {"train_loss": -35.49147415161133, "global_step": 74497, "epoch": 615} {"train_loss": -34.997127532958984, "global_step": 74498, "epoch": 615} {"train_loss": -35.79144287109375, "global_step": 74499, "epoch": 615} {"train_loss": -36.05498504638672, "global_step": 74500, "epoch": 615} {"train_loss": -36.752960205078125, "global_step": 74501, "epoch": 615} {"train_loss": -34.62849807739258, "global_step": 74502, "epoch": 615} {"train_loss": -35.37986373901367, "global_step": 74503, "epoch": 615} {"train_loss": -36.68729782104492, "global_step": 74504, "epoch": 615} {"train_loss": -35.8164176940918, "global_step": 74505, "epoch": 615} {"train_loss": -35.71213912963867, "global_step": 74506, "epoch": 615} {"train_loss": -34.66157913208008, "global_step": 74507, "epoch": 615} {"train_loss": -35.35542678833008, "global_step": 74508, "epoch": 615} {"train_loss": -35.91982650756836, "global_step": 74509, "epoch": 615} {"train_loss": -35.87757110595703, "global_step": 74510, "epoch": 615} {"train_loss": -36.442420959472656, "global_step": 74511, "epoch": 615} {"train_loss": -36.080745697021484, "global_step": 74512, "epoch": 615} {"train_loss": -36.99264144897461, "global_step": 74513, "epoch": 615} {"train_loss": -36.279483795166016, "global_step": 74514, "epoch": 615} {"train_loss": -36.8097038269043, "global_step": 74515, "epoch": 615} {"train_loss": -36.73360824584961, "global_step": 74516, "epoch": 615} {"train_loss": -37.2673454284668, "global_step": 74517, "epoch": 615} {"train_loss": -36.66455841064453, "global_step": 74518, "epoch": 615} {"train_loss": -37.513763427734375, "global_step": 74519, "epoch": 615} {"train_loss": -36.45209884643555, "global_step": 74520, "epoch": 615} {"train_loss": -37.34299850463867, "global_step": 74521, "epoch": 615} {"train_loss": -35.79731369018555, "global_step": 74522, "epoch": 615} {"train_loss": -37.05935287475586, "global_step": 74523, "epoch": 615} {"train_loss": -36.653499603271484, "global_step": 74524, "epoch": 615} {"train_loss": -37.018733978271484, "global_step": 74525, "epoch": 615} {"train_loss": -36.15513229370117, "global_step": 74526, "epoch": 615} {"train_loss": -37.89019775390625, "global_step": 74527, "epoch": 615} {"train_loss": -37.45408248901367, "global_step": 74528, "epoch": 615} {"train_loss": -37.38206100463867, "global_step": 74529, "epoch": 615} {"train_loss": -36.03767395019531, "global_step": 74530, "epoch": 615} {"train_loss": -36.71772384643555, "global_step": 74531, "epoch": 615} {"train_loss": -36.5307731628418, "global_step": 74532, "epoch": 615} {"train_loss": -37.45479202270508, "global_step": 74533, "epoch": 615} {"train_loss": -37.559932708740234, "global_step": 74534, "epoch": 615} {"train_loss": -36.23839480817811, "global_step": 74535, "epoch": 615, "val_loss": 2608008.0} {"train_loss": -36.107330322265625, "global_step": 74536, "epoch": 616} {"train_loss": -37.589508056640625, "global_step": 74537, "epoch": 616} {"train_loss": -37.877254486083984, "global_step": 74538, "epoch": 616} {"train_loss": -37.188514709472656, "global_step": 74539, "epoch": 616} {"train_loss": -36.4898567199707, "global_step": 74540, "epoch": 616} {"train_loss": -37.186279296875, "global_step": 74541, "epoch": 616} {"train_loss": -36.81134033203125, "global_step": 74542, "epoch": 616} {"train_loss": -37.479156494140625, "global_step": 74543, "epoch": 616} {"train_loss": -37.15581512451172, "global_step": 74544, "epoch": 616} {"train_loss": -36.99617385864258, "global_step": 74545, "epoch": 616} {"train_loss": -36.11412048339844, "global_step": 74546, "epoch": 616} {"train_loss": -33.77627182006836, "global_step": 74547, "epoch": 616} {"train_loss": -33.95796585083008, "global_step": 74548, "epoch": 616} {"train_loss": -36.356910705566406, "global_step": 74549, "epoch": 616} {"train_loss": -36.48575210571289, "global_step": 74550, "epoch": 616} {"train_loss": -34.03257369995117, "global_step": 74551, "epoch": 616} {"train_loss": -32.36727523803711, "global_step": 74552, "epoch": 616} {"train_loss": -35.197410583496094, "global_step": 74553, "epoch": 616} {"train_loss": -35.72661209106445, "global_step": 74554, "epoch": 616} {"train_loss": -34.608821868896484, "global_step": 74555, "epoch": 616} {"train_loss": -35.635047912597656, "global_step": 74556, "epoch": 616} {"train_loss": -36.45119094848633, "global_step": 74557, "epoch": 616} {"train_loss": -35.8222770690918, "global_step": 74558, "epoch": 616} {"train_loss": -37.517024993896484, "global_step": 74559, "epoch": 616} {"train_loss": -36.6622428894043, "global_step": 74560, "epoch": 616} {"train_loss": -37.333621978759766, "global_step": 74561, "epoch": 616} {"train_loss": -36.34498977661133, "global_step": 74562, "epoch": 616} {"train_loss": -36.99076461791992, "global_step": 74563, "epoch": 616} {"train_loss": -36.275760650634766, "global_step": 74564, "epoch": 616} {"train_loss": -37.167354583740234, "global_step": 74565, "epoch": 616} {"train_loss": -36.81241226196289, "global_step": 74566, "epoch": 616} {"train_loss": -35.50509262084961, "global_step": 74567, "epoch": 616} {"train_loss": -35.852294921875, "global_step": 74568, "epoch": 616} {"train_loss": -36.68347930908203, "global_step": 74569, "epoch": 616} {"train_loss": -36.51497268676758, "global_step": 74570, "epoch": 616} {"train_loss": -36.661800384521484, "global_step": 74571, "epoch": 616} {"train_loss": -36.14095687866211, "global_step": 74572, "epoch": 616} {"train_loss": -35.95428466796875, "global_step": 74573, "epoch": 616} {"train_loss": -35.97991180419922, "global_step": 74574, "epoch": 616} {"train_loss": -35.40190505981445, "global_step": 74575, "epoch": 616} {"train_loss": -35.9010009765625, "global_step": 74576, "epoch": 616} {"train_loss": -36.075584411621094, "global_step": 74577, "epoch": 616} {"train_loss": -35.3967170715332, "global_step": 74578, "epoch": 616} {"train_loss": -36.16889190673828, "global_step": 74579, "epoch": 616} {"train_loss": -36.38739013671875, "global_step": 74580, "epoch": 616} {"train_loss": -37.06117630004883, "global_step": 74581, "epoch": 616} {"train_loss": -36.13203048706055, "global_step": 74582, "epoch": 616} {"train_loss": -35.284942626953125, "global_step": 74583, "epoch": 616} {"train_loss": -36.0791130065918, "global_step": 74584, "epoch": 616} {"train_loss": -35.7512092590332, "global_step": 74585, "epoch": 616} {"train_loss": -36.926673889160156, "global_step": 74586, "epoch": 616} {"train_loss": -36.495296478271484, "global_step": 74587, "epoch": 616} {"train_loss": -34.314422607421875, "global_step": 74588, "epoch": 616} {"train_loss": -35.80464172363281, "global_step": 74589, "epoch": 616} {"train_loss": -35.89326095581055, "global_step": 74590, "epoch": 616} {"train_loss": -36.53310775756836, "global_step": 74591, "epoch": 616} {"train_loss": -36.38918685913086, "global_step": 74592, "epoch": 616} {"train_loss": -35.18776321411133, "global_step": 74593, "epoch": 616} {"train_loss": -35.3160400390625, "global_step": 74594, "epoch": 616} {"train_loss": -35.02443313598633, "global_step": 74595, "epoch": 616} {"train_loss": -35.6678581237793, "global_step": 74596, "epoch": 616} {"train_loss": -36.12000274658203, "global_step": 74597, "epoch": 616} {"train_loss": -36.326988220214844, "global_step": 74598, "epoch": 616} {"train_loss": -35.102535247802734, "global_step": 74599, "epoch": 616} {"train_loss": -35.0826530456543, "global_step": 74600, "epoch": 616} {"train_loss": -35.19399642944336, "global_step": 74601, "epoch": 616} {"train_loss": -33.74806213378906, "global_step": 74602, "epoch": 616} {"train_loss": -34.95269775390625, "global_step": 74603, "epoch": 616} {"train_loss": -35.17205810546875, "global_step": 74604, "epoch": 616} {"train_loss": -33.104835510253906, "global_step": 74605, "epoch": 616} {"train_loss": -34.635860443115234, "global_step": 74606, "epoch": 616} {"train_loss": -35.41868209838867, "global_step": 74607, "epoch": 616} {"train_loss": -34.82509231567383, "global_step": 74608, "epoch": 616} {"train_loss": -31.832311630249023, "global_step": 74609, "epoch": 616} {"train_loss": -33.94070053100586, "global_step": 74610, "epoch": 616} {"train_loss": -36.58415603637695, "global_step": 74611, "epoch": 616} {"train_loss": -35.01926803588867, "global_step": 74612, "epoch": 616} {"train_loss": -35.15607452392578, "global_step": 74613, "epoch": 616} {"train_loss": -35.77748489379883, "global_step": 74614, "epoch": 616} {"train_loss": -36.29602813720703, "global_step": 74615, "epoch": 616} {"train_loss": -33.77552032470703, "global_step": 74616, "epoch": 616} {"train_loss": -35.55723190307617, "global_step": 74617, "epoch": 616} {"train_loss": -36.2753791809082, "global_step": 74618, "epoch": 616} {"train_loss": -36.6112174987793, "global_step": 74619, "epoch": 616} {"train_loss": -35.18410873413086, "global_step": 74620, "epoch": 616} {"train_loss": -35.62350082397461, "global_step": 74621, "epoch": 616} {"train_loss": -35.234474182128906, "global_step": 74622, "epoch": 616} {"train_loss": -35.19742965698242, "global_step": 74623, "epoch": 616} {"train_loss": -36.14547348022461, "global_step": 74624, "epoch": 616} {"train_loss": -36.369354248046875, "global_step": 74625, "epoch": 616} {"train_loss": -36.29313278198242, "global_step": 74626, "epoch": 616} {"train_loss": -36.32453918457031, "global_step": 74627, "epoch": 616} {"train_loss": -36.78733444213867, "global_step": 74628, "epoch": 616} {"train_loss": -36.94013214111328, "global_step": 74629, "epoch": 616} {"train_loss": -36.33628463745117, "global_step": 74630, "epoch": 616} {"train_loss": -35.58955001831055, "global_step": 74631, "epoch": 616} {"train_loss": -36.710514068603516, "global_step": 74632, "epoch": 616} {"train_loss": -36.25366973876953, "global_step": 74633, "epoch": 616} {"train_loss": -36.62412643432617, "global_step": 74634, "epoch": 616} {"train_loss": -36.831764221191406, "global_step": 74635, "epoch": 616} {"train_loss": -36.70375442504883, "global_step": 74636, "epoch": 616} {"train_loss": -36.85913848876953, "global_step": 74637, "epoch": 616} {"train_loss": -36.67340850830078, "global_step": 74638, "epoch": 616} {"train_loss": -37.35685729980469, "global_step": 74639, "epoch": 616} {"train_loss": -36.672119140625, "global_step": 74640, "epoch": 616} {"train_loss": -36.901512145996094, "global_step": 74641, "epoch": 616} {"train_loss": -36.84578323364258, "global_step": 74642, "epoch": 616} {"train_loss": -36.818538665771484, "global_step": 74643, "epoch": 616} {"train_loss": -36.30408477783203, "global_step": 74644, "epoch": 616} {"train_loss": -37.13488006591797, "global_step": 74645, "epoch": 616} {"train_loss": -35.61335372924805, "global_step": 74646, "epoch": 616} {"train_loss": -37.54702377319336, "global_step": 74647, "epoch": 616} {"train_loss": -36.552589416503906, "global_step": 74648, "epoch": 616} {"train_loss": -36.410072326660156, "global_step": 74649, "epoch": 616} {"train_loss": -36.92869186401367, "global_step": 74650, "epoch": 616} {"train_loss": -36.053680419921875, "global_step": 74651, "epoch": 616} {"train_loss": -36.99409866333008, "global_step": 74652, "epoch": 616} {"train_loss": -37.03340530395508, "global_step": 74653, "epoch": 616} {"train_loss": -36.76996612548828, "global_step": 74654, "epoch": 616} {"train_loss": -36.84465408325195, "global_step": 74655, "epoch": 616} {"train_loss": -36.01897977403373, "global_step": 74656, "epoch": 616, "val_loss": 2767874.25} {"train_loss": -37.61299133300781, "global_step": 74657, "epoch": 617} {"train_loss": -36.473121643066406, "global_step": 74658, "epoch": 617} {"train_loss": -37.21793746948242, "global_step": 74659, "epoch": 617} {"train_loss": -37.02997970581055, "global_step": 74660, "epoch": 617} {"train_loss": -36.552513122558594, "global_step": 74661, "epoch": 617} {"train_loss": -37.63554763793945, "global_step": 74662, "epoch": 617} {"train_loss": -36.1700553894043, "global_step": 74663, "epoch": 617} {"train_loss": -37.4703254699707, "global_step": 74664, "epoch": 617} {"train_loss": -36.70426559448242, "global_step": 74665, "epoch": 617} {"train_loss": -37.751827239990234, "global_step": 74666, "epoch": 617} {"train_loss": -37.401611328125, "global_step": 74667, "epoch": 617} {"train_loss": -36.563575744628906, "global_step": 74668, "epoch": 617} {"train_loss": -37.61952590942383, "global_step": 74669, "epoch": 617} {"train_loss": -36.48418045043945, "global_step": 74670, "epoch": 617} {"train_loss": -35.506591796875, "global_step": 74671, "epoch": 617} {"train_loss": -36.543983459472656, "global_step": 74672, "epoch": 617} {"train_loss": -37.75515365600586, "global_step": 74673, "epoch": 617} {"train_loss": -37.2830696105957, "global_step": 74674, "epoch": 617} {"train_loss": -36.04011917114258, "global_step": 74675, "epoch": 617} {"train_loss": -37.78538131713867, "global_step": 74676, "epoch": 617} {"train_loss": -37.37360763549805, "global_step": 74677, "epoch": 617} {"train_loss": -37.23384475708008, "global_step": 74678, "epoch": 617} {"train_loss": -36.181983947753906, "global_step": 74679, "epoch": 617} {"train_loss": -34.82249069213867, "global_step": 74680, "epoch": 617} {"train_loss": -31.575300216674805, "global_step": 74681, "epoch": 617} {"train_loss": -33.25775146484375, "global_step": 74682, "epoch": 617} {"train_loss": -32.43056869506836, "global_step": 74683, "epoch": 617} {"train_loss": -33.447235107421875, "global_step": 74684, "epoch": 617} {"train_loss": -36.24347686767578, "global_step": 74685, "epoch": 617} {"train_loss": -34.581390380859375, "global_step": 74686, "epoch": 617} {"train_loss": -36.877376556396484, "global_step": 74687, "epoch": 617} {"train_loss": -34.95905685424805, "global_step": 74688, "epoch": 617} {"train_loss": -35.67182159423828, "global_step": 74689, "epoch": 617} {"train_loss": -33.48445510864258, "global_step": 74690, "epoch": 617} {"train_loss": -31.316608428955078, "global_step": 74691, "epoch": 617} {"train_loss": -28.35009765625, "global_step": 74692, "epoch": 617} {"train_loss": -20.189767837524414, "global_step": 74693, "epoch": 617} {"train_loss": -29.305139541625977, "global_step": 74694, "epoch": 617} {"train_loss": -33.73799133300781, "global_step": 74695, "epoch": 617} {"train_loss": -27.425756454467773, "global_step": 74696, "epoch": 617} {"train_loss": -35.77274703979492, "global_step": 74697, "epoch": 617} {"train_loss": -31.21329116821289, "global_step": 74698, "epoch": 617} {"train_loss": -36.60346984863281, "global_step": 74699, "epoch": 617} {"train_loss": -32.0273551940918, "global_step": 74700, "epoch": 617} {"train_loss": -34.03600311279297, "global_step": 74701, "epoch": 617} {"train_loss": -35.82705307006836, "global_step": 74702, "epoch": 617} {"train_loss": -33.41720962524414, "global_step": 74703, "epoch": 617} {"train_loss": -35.91376495361328, "global_step": 74704, "epoch": 617} {"train_loss": -34.61332702636719, "global_step": 74705, "epoch": 617} {"train_loss": -34.884334564208984, "global_step": 74706, "epoch": 617} {"train_loss": -36.48688507080078, "global_step": 74707, "epoch": 617} {"train_loss": -33.3060302734375, "global_step": 74708, "epoch": 617} {"train_loss": -32.732421875, "global_step": 74709, "epoch": 617} {"train_loss": -32.49390411376953, "global_step": 74710, "epoch": 617} {"train_loss": -34.173736572265625, "global_step": 74711, "epoch": 617} {"train_loss": -35.82204818725586, "global_step": 74712, "epoch": 617} {"train_loss": -35.74513626098633, "global_step": 74713, "epoch": 617} {"train_loss": -35.93610763549805, "global_step": 74714, "epoch": 617} {"train_loss": -33.6829719543457, "global_step": 74715, "epoch": 617} {"train_loss": -35.46296691894531, "global_step": 74716, "epoch": 617} {"train_loss": -35.87660598754883, "global_step": 74717, "epoch": 617} {"train_loss": -33.62746047973633, "global_step": 74718, "epoch": 617} {"train_loss": -28.857196807861328, "global_step": 74719, "epoch": 617} {"train_loss": -34.56711959838867, "global_step": 74720, "epoch": 617} {"train_loss": -35.693031311035156, "global_step": 74721, "epoch": 617} {"train_loss": -35.1756477355957, "global_step": 74722, "epoch": 617} {"train_loss": -34.23097610473633, "global_step": 74723, "epoch": 617} {"train_loss": -34.66825485229492, "global_step": 74724, "epoch": 617} {"train_loss": -33.7585563659668, "global_step": 74725, "epoch": 617} {"train_loss": -33.407161712646484, "global_step": 74726, "epoch": 617} {"train_loss": -34.69287872314453, "global_step": 74727, "epoch": 617} {"train_loss": -34.678558349609375, "global_step": 74728, "epoch": 617} {"train_loss": -35.01124572753906, "global_step": 74729, "epoch": 617} {"train_loss": -33.90571212768555, "global_step": 74730, "epoch": 617} {"train_loss": -34.20960998535156, "global_step": 74731, "epoch": 617} {"train_loss": -35.743682861328125, "global_step": 74732, "epoch": 617} {"train_loss": -34.98796081542969, "global_step": 74733, "epoch": 617} {"train_loss": -35.7846794128418, "global_step": 74734, "epoch": 617} {"train_loss": -35.09014892578125, "global_step": 74735, "epoch": 617} {"train_loss": -34.98211669921875, "global_step": 74736, "epoch": 617} {"train_loss": -32.6201171875, "global_step": 74737, "epoch": 617} {"train_loss": -35.51945877075195, "global_step": 74738, "epoch": 617} {"train_loss": -34.59475326538086, "global_step": 74739, "epoch": 617} {"train_loss": -35.270931243896484, "global_step": 74740, "epoch": 617} {"train_loss": -33.94303512573242, "global_step": 74741, "epoch": 617} {"train_loss": -35.622596740722656, "global_step": 74742, "epoch": 617} {"train_loss": -36.25930404663086, "global_step": 74743, "epoch": 617} {"train_loss": -31.268735885620117, "global_step": 74744, "epoch": 617} {"train_loss": -35.57528305053711, "global_step": 74745, "epoch": 617} {"train_loss": -35.7155876159668, "global_step": 74746, "epoch": 617} {"train_loss": -35.906341552734375, "global_step": 74747, "epoch": 617} {"train_loss": -35.512672424316406, "global_step": 74748, "epoch": 617} {"train_loss": -35.65230178833008, "global_step": 74749, "epoch": 617} {"train_loss": -35.98167037963867, "global_step": 74750, "epoch": 617} {"train_loss": -35.599159240722656, "global_step": 74751, "epoch": 617} {"train_loss": -35.518001556396484, "global_step": 74752, "epoch": 617} {"train_loss": -35.783180236816406, "global_step": 74753, "epoch": 617} {"train_loss": -35.690467834472656, "global_step": 74754, "epoch": 617} {"train_loss": -35.71542739868164, "global_step": 74755, "epoch": 617} {"train_loss": -35.613372802734375, "global_step": 74756, "epoch": 617} {"train_loss": -36.263038635253906, "global_step": 74757, "epoch": 617} {"train_loss": -36.141273498535156, "global_step": 74758, "epoch": 617} {"train_loss": -35.486507415771484, "global_step": 74759, "epoch": 617} {"train_loss": -35.51436233520508, "global_step": 74760, "epoch": 617} {"train_loss": -36.078060150146484, "global_step": 74761, "epoch": 617} {"train_loss": -34.805660247802734, "global_step": 74762, "epoch": 617} {"train_loss": -35.26569747924805, "global_step": 74763, "epoch": 617} {"train_loss": -34.57135009765625, "global_step": 74764, "epoch": 617} {"train_loss": -36.19610595703125, "global_step": 74765, "epoch": 617} {"train_loss": -35.73221206665039, "global_step": 74766, "epoch": 617} {"train_loss": -36.28702926635742, "global_step": 74767, "epoch": 617} {"train_loss": -36.183475494384766, "global_step": 74768, "epoch": 617} {"train_loss": -35.87873458862305, "global_step": 74769, "epoch": 617} {"train_loss": -35.97703170776367, "global_step": 74770, "epoch": 617} {"train_loss": -36.20174026489258, "global_step": 74771, "epoch": 617} {"train_loss": -36.824623107910156, "global_step": 74772, "epoch": 617} {"train_loss": -36.34474563598633, "global_step": 74773, "epoch": 617} {"train_loss": -36.0743293762207, "global_step": 74774, "epoch": 617} {"train_loss": -36.55567932128906, "global_step": 74775, "epoch": 617} {"train_loss": -36.751399993896484, "global_step": 74776, "epoch": 617} {"train_loss": -35.00346231066491, "global_step": 74777, "epoch": 617, "val_loss": 2774235.25} {"train_loss": -36.29395294189453, "global_step": 74778, "epoch": 618} {"train_loss": -36.5548210144043, "global_step": 74779, "epoch": 618} {"train_loss": -36.59672164916992, "global_step": 74780, "epoch": 618} {"train_loss": -36.87852096557617, "global_step": 74781, "epoch": 618} {"train_loss": -36.70844650268555, "global_step": 74782, "epoch": 618} {"train_loss": -36.949180603027344, "global_step": 74783, "epoch": 618} {"train_loss": -37.29741668701172, "global_step": 74784, "epoch": 618} {"train_loss": -36.60566329956055, "global_step": 74785, "epoch": 618} {"train_loss": -36.177127838134766, "global_step": 74786, "epoch": 618} {"train_loss": -37.01142120361328, "global_step": 74787, "epoch": 618} {"train_loss": -37.06717300415039, "global_step": 74788, "epoch": 618} {"train_loss": -37.2052001953125, "global_step": 74789, "epoch": 618} {"train_loss": -36.94150924682617, "global_step": 74790, "epoch": 618} {"train_loss": -37.23920440673828, "global_step": 74791, "epoch": 618} {"train_loss": -36.97511672973633, "global_step": 74792, "epoch": 618} {"train_loss": -36.543453216552734, "global_step": 74793, "epoch": 618} {"train_loss": -36.78121566772461, "global_step": 74794, "epoch": 618} {"train_loss": -37.19269561767578, "global_step": 74795, "epoch": 618} {"train_loss": -36.90827178955078, "global_step": 74796, "epoch": 618} {"train_loss": -36.74162673950195, "global_step": 74797, "epoch": 618} {"train_loss": -37.43239212036133, "global_step": 74798, "epoch": 618} {"train_loss": -37.16384506225586, "global_step": 74799, "epoch": 618} {"train_loss": -37.0210075378418, "global_step": 74800, "epoch": 618} {"train_loss": -36.55786895751953, "global_step": 74801, "epoch": 618} {"train_loss": -34.403987884521484, "global_step": 74802, "epoch": 618} {"train_loss": -35.93735885620117, "global_step": 74803, "epoch": 618} {"train_loss": -35.72829818725586, "global_step": 74804, "epoch": 618} {"train_loss": -34.60771560668945, "global_step": 74805, "epoch": 618} {"train_loss": -35.34363555908203, "global_step": 74806, "epoch": 618} {"train_loss": -33.87142562866211, "global_step": 74807, "epoch": 618} {"train_loss": -26.316137313842773, "global_step": 74808, "epoch": 618} {"train_loss": -14.228802680969238, "global_step": 74809, "epoch": 618} {"train_loss": -18.794248580932617, "global_step": 74810, "epoch": 618} {"train_loss": -34.48066329956055, "global_step": 74811, "epoch": 618} {"train_loss": -21.277318954467773, "global_step": 74812, "epoch": 618} {"train_loss": -28.39947509765625, "global_step": 74813, "epoch": 618} {"train_loss": -30.786834716796875, "global_step": 74814, "epoch": 618} {"train_loss": -32.38621520996094, "global_step": 74815, "epoch": 618} {"train_loss": -31.714075088500977, "global_step": 74816, "epoch": 618} {"train_loss": -36.17888641357422, "global_step": 74817, "epoch": 618} {"train_loss": -33.130638122558594, "global_step": 74818, "epoch": 618} {"train_loss": -34.011722564697266, "global_step": 74819, "epoch": 618} {"train_loss": -35.58287811279297, "global_step": 74820, "epoch": 618} {"train_loss": -34.30263900756836, "global_step": 74821, "epoch": 618} {"train_loss": -35.06544494628906, "global_step": 74822, "epoch": 618} {"train_loss": -35.57417678833008, "global_step": 74823, "epoch": 618} {"train_loss": -34.799659729003906, "global_step": 74824, "epoch": 618} {"train_loss": -34.85091781616211, "global_step": 74825, "epoch": 618} {"train_loss": -35.910560607910156, "global_step": 74826, "epoch": 618} {"train_loss": -35.85143280029297, "global_step": 74827, "epoch": 618} {"train_loss": -35.069393157958984, "global_step": 74828, "epoch": 618} {"train_loss": -35.39680099487305, "global_step": 74829, "epoch": 618} {"train_loss": -36.3619384765625, "global_step": 74830, "epoch": 618} {"train_loss": -35.322635650634766, "global_step": 74831, "epoch": 618} {"train_loss": -35.265804290771484, "global_step": 74832, "epoch": 618} {"train_loss": -36.05633544921875, "global_step": 74833, "epoch": 618} {"train_loss": -36.801849365234375, "global_step": 74834, "epoch": 618} {"train_loss": -36.301692962646484, "global_step": 74835, "epoch": 618} {"train_loss": -35.95174789428711, "global_step": 74836, "epoch": 618} {"train_loss": -36.750892639160156, "global_step": 74837, "epoch": 618} {"train_loss": -36.35707473754883, "global_step": 74838, "epoch": 618} {"train_loss": -36.42728042602539, "global_step": 74839, "epoch": 618} {"train_loss": -36.5516242980957, "global_step": 74840, "epoch": 618} {"train_loss": -36.563636779785156, "global_step": 74841, "epoch": 618} {"train_loss": -36.35759353637695, "global_step": 74842, "epoch": 618} {"train_loss": -36.71346664428711, "global_step": 74843, "epoch": 618} {"train_loss": -36.37550735473633, "global_step": 74844, "epoch": 618} {"train_loss": -36.513858795166016, "global_step": 74845, "epoch": 618} {"train_loss": -36.89929962158203, "global_step": 74846, "epoch": 618} {"train_loss": -35.950740814208984, "global_step": 74847, "epoch": 618} {"train_loss": -37.02021408081055, "global_step": 74848, "epoch": 618} {"train_loss": -37.16392517089844, "global_step": 74849, "epoch": 618} {"train_loss": -36.042823791503906, "global_step": 74850, "epoch": 618} {"train_loss": -37.19879913330078, "global_step": 74851, "epoch": 618} {"train_loss": -37.17866134643555, "global_step": 74852, "epoch": 618} {"train_loss": -36.7119140625, "global_step": 74853, "epoch": 618} {"train_loss": -37.0385627746582, "global_step": 74854, "epoch": 618} {"train_loss": -37.18335723876953, "global_step": 74855, "epoch": 618} {"train_loss": -37.37075424194336, "global_step": 74856, "epoch": 618} {"train_loss": -36.745906829833984, "global_step": 74857, "epoch": 618} {"train_loss": -37.321197509765625, "global_step": 74858, "epoch": 618} {"train_loss": -37.17832565307617, "global_step": 74859, "epoch": 618} {"train_loss": -37.34602737426758, "global_step": 74860, "epoch": 618} {"train_loss": -37.3390007019043, "global_step": 74861, "epoch": 618} {"train_loss": -37.058719635009766, "global_step": 74862, "epoch": 618} {"train_loss": -36.431304931640625, "global_step": 74863, "epoch": 618} {"train_loss": -34.92277908325195, "global_step": 74864, "epoch": 618} {"train_loss": -31.377622604370117, "global_step": 74865, "epoch": 618} {"train_loss": -26.374088287353516, "global_step": 74866, "epoch": 618} {"train_loss": -24.289575576782227, "global_step": 74867, "epoch": 618} {"train_loss": -33.369781494140625, "global_step": 74868, "epoch": 618} {"train_loss": -35.12250900268555, "global_step": 74869, "epoch": 618} {"train_loss": -27.60346031188965, "global_step": 74870, "epoch": 618} {"train_loss": -32.3567008972168, "global_step": 74871, "epoch": 618} {"train_loss": -30.872419357299805, "global_step": 74872, "epoch": 618} {"train_loss": -35.68308639526367, "global_step": 74873, "epoch": 618} {"train_loss": -30.591812133789062, "global_step": 74874, "epoch": 618} {"train_loss": -33.42860794067383, "global_step": 74875, "epoch": 618} {"train_loss": -32.877506256103516, "global_step": 74876, "epoch": 618} {"train_loss": -33.78868103027344, "global_step": 74877, "epoch": 618} {"train_loss": -31.409076690673828, "global_step": 74878, "epoch": 618} {"train_loss": -34.631038665771484, "global_step": 74879, "epoch": 618} {"train_loss": -34.13882064819336, "global_step": 74880, "epoch": 618} {"train_loss": -30.737661361694336, "global_step": 74881, "epoch": 618} {"train_loss": -35.28107833862305, "global_step": 74882, "epoch": 618} {"train_loss": -33.3632926940918, "global_step": 74883, "epoch": 618} {"train_loss": -34.95296096801758, "global_step": 74884, "epoch": 618} {"train_loss": -34.1313591003418, "global_step": 74885, "epoch": 618} {"train_loss": -35.782318115234375, "global_step": 74886, "epoch": 618} {"train_loss": -34.10899353027344, "global_step": 74887, "epoch": 618} {"train_loss": -35.295169830322266, "global_step": 74888, "epoch": 618} {"train_loss": -35.13938903808594, "global_step": 74889, "epoch": 618} {"train_loss": -35.606258392333984, "global_step": 74890, "epoch": 618} {"train_loss": -34.83512878417969, "global_step": 74891, "epoch": 618} {"train_loss": -35.88320541381836, "global_step": 74892, "epoch": 618} {"train_loss": -35.7548828125, "global_step": 74893, "epoch": 618} {"train_loss": -36.128902435302734, "global_step": 74894, "epoch": 618} {"train_loss": -35.52447509765625, "global_step": 74895, "epoch": 618} {"train_loss": -35.80682373046875, "global_step": 74896, "epoch": 618} {"train_loss": -35.43772506713867, "global_step": 74897, "epoch": 618} {"train_loss": -34.76794688169621, "global_step": 74898, "epoch": 618, "val_loss": 2632622.0} {"train_loss": -35.574649810791016, "global_step": 74899, "epoch": 619} {"train_loss": -36.1326789855957, "global_step": 74900, "epoch": 619} {"train_loss": -35.27656936645508, "global_step": 74901, "epoch": 619} {"train_loss": -36.066497802734375, "global_step": 74902, "epoch": 619} {"train_loss": -36.134029388427734, "global_step": 74903, "epoch": 619} {"train_loss": -36.29917526245117, "global_step": 74904, "epoch": 619} {"train_loss": -36.30040740966797, "global_step": 74905, "epoch": 619} {"train_loss": -36.34865951538086, "global_step": 74906, "epoch": 619} {"train_loss": -36.33256912231445, "global_step": 74907, "epoch": 619} {"train_loss": -36.39842224121094, "global_step": 74908, "epoch": 619} {"train_loss": -35.86823272705078, "global_step": 74909, "epoch": 619} {"train_loss": -36.78098678588867, "global_step": 74910, "epoch": 619} {"train_loss": -36.13188171386719, "global_step": 74911, "epoch": 619} {"train_loss": -36.33241653442383, "global_step": 74912, "epoch": 619} {"train_loss": -36.58341979980469, "global_step": 74913, "epoch": 619} {"train_loss": -36.46551513671875, "global_step": 74914, "epoch": 619} {"train_loss": -36.72758483886719, "global_step": 74915, "epoch": 619} {"train_loss": -36.80648422241211, "global_step": 74916, "epoch": 619} {"train_loss": -36.83256149291992, "global_step": 74917, "epoch": 619} {"train_loss": -36.84660720825195, "global_step": 74918, "epoch": 619} {"train_loss": -36.88691329956055, "global_step": 74919, "epoch": 619} {"train_loss": -36.4794807434082, "global_step": 74920, "epoch": 619} {"train_loss": -36.85211944580078, "global_step": 74921, "epoch": 619} {"train_loss": -36.6590690612793, "global_step": 74922, "epoch": 619} {"train_loss": -36.940120697021484, "global_step": 74923, "epoch": 619} {"train_loss": -36.87049102783203, "global_step": 74924, "epoch": 619} {"train_loss": -36.913082122802734, "global_step": 74925, "epoch": 619} {"train_loss": -36.94647979736328, "global_step": 74926, "epoch": 619} {"train_loss": -37.370452880859375, "global_step": 74927, "epoch": 619} {"train_loss": -36.705589294433594, "global_step": 74928, "epoch": 619} {"train_loss": -36.53310012817383, "global_step": 74929, "epoch": 619} {"train_loss": -36.46104049682617, "global_step": 74930, "epoch": 619} {"train_loss": -36.73716354370117, "global_step": 74931, "epoch": 619} {"train_loss": -36.374000549316406, "global_step": 74932, "epoch": 619} {"train_loss": -35.03440475463867, "global_step": 74933, "epoch": 619} {"train_loss": -36.995601654052734, "global_step": 74934, "epoch": 619} {"train_loss": -37.1940803527832, "global_step": 74935, "epoch": 619} {"train_loss": -37.43937301635742, "global_step": 74936, "epoch": 619} {"train_loss": -36.96345901489258, "global_step": 74937, "epoch": 619} {"train_loss": -36.51936721801758, "global_step": 74938, "epoch": 619} {"train_loss": -36.67741012573242, "global_step": 74939, "epoch": 619} {"train_loss": -37.184513092041016, "global_step": 74940, "epoch": 619} {"train_loss": -37.012638092041016, "global_step": 74941, "epoch": 619} {"train_loss": -37.260902404785156, "global_step": 74942, "epoch": 619} {"train_loss": -35.26095199584961, "global_step": 74943, "epoch": 619} {"train_loss": -36.657833099365234, "global_step": 74944, "epoch": 619} {"train_loss": -37.189876556396484, "global_step": 74945, "epoch": 619} {"train_loss": -37.3394660949707, "global_step": 74946, "epoch": 619} {"train_loss": -35.39876937866211, "global_step": 74947, "epoch": 619} {"train_loss": -36.87421798706055, "global_step": 74948, "epoch": 619} {"train_loss": -36.762325286865234, "global_step": 74949, "epoch": 619} {"train_loss": -37.07108688354492, "global_step": 74950, "epoch": 619} {"train_loss": -37.28794479370117, "global_step": 74951, "epoch": 619} {"train_loss": -36.753028869628906, "global_step": 74952, "epoch": 619} {"train_loss": -37.31710433959961, "global_step": 74953, "epoch": 619} {"train_loss": -37.0263557434082, "global_step": 74954, "epoch": 619} {"train_loss": -37.205421447753906, "global_step": 74955, "epoch": 619} {"train_loss": -36.93953323364258, "global_step": 74956, "epoch": 619} {"train_loss": -37.07402801513672, "global_step": 74957, "epoch": 619} {"train_loss": -36.376243591308594, "global_step": 74958, "epoch": 619} {"train_loss": -36.72816467285156, "global_step": 74959, "epoch": 619} {"train_loss": -36.93962097167969, "global_step": 74960, "epoch": 619} {"train_loss": -37.08320617675781, "global_step": 74961, "epoch": 619} {"train_loss": -37.04344940185547, "global_step": 74962, "epoch": 619} {"train_loss": -37.053524017333984, "global_step": 74963, "epoch": 619} {"train_loss": -37.066036224365234, "global_step": 74964, "epoch": 619} {"train_loss": -37.6518440246582, "global_step": 74965, "epoch": 619} {"train_loss": -37.16463088989258, "global_step": 74966, "epoch": 619} {"train_loss": -37.2518310546875, "global_step": 74967, "epoch": 619} {"train_loss": -37.20161819458008, "global_step": 74968, "epoch": 619} {"train_loss": -37.60825729370117, "global_step": 74969, "epoch": 619} {"train_loss": -37.669830322265625, "global_step": 74970, "epoch": 619} {"train_loss": -37.33533477783203, "global_step": 74971, "epoch": 619} {"train_loss": -37.28367233276367, "global_step": 74972, "epoch": 619} {"train_loss": -37.69462966918945, "global_step": 74973, "epoch": 619} {"train_loss": -37.04195785522461, "global_step": 74974, "epoch": 619} {"train_loss": -37.09776306152344, "global_step": 74975, "epoch": 619} {"train_loss": -37.11293411254883, "global_step": 74976, "epoch": 619} {"train_loss": -35.00478744506836, "global_step": 74977, "epoch": 619} {"train_loss": -34.31690216064453, "global_step": 74978, "epoch": 619} {"train_loss": -32.39966583251953, "global_step": 74979, "epoch": 619} {"train_loss": -28.15896987915039, "global_step": 74980, "epoch": 619} {"train_loss": -24.453044891357422, "global_step": 74981, "epoch": 619} {"train_loss": -28.782392501831055, "global_step": 74982, "epoch": 619} {"train_loss": -37.028255462646484, "global_step": 74983, "epoch": 619} {"train_loss": -31.301544189453125, "global_step": 74984, "epoch": 619} {"train_loss": -32.56454849243164, "global_step": 74985, "epoch": 619} {"train_loss": -36.4500732421875, "global_step": 74986, "epoch": 619} {"train_loss": -34.33143615722656, "global_step": 74987, "epoch": 619} {"train_loss": -36.07692337036133, "global_step": 74988, "epoch": 619} {"train_loss": -34.03834915161133, "global_step": 74989, "epoch": 619} {"train_loss": -36.77315902709961, "global_step": 74990, "epoch": 619} {"train_loss": -35.693580627441406, "global_step": 74991, "epoch": 619} {"train_loss": -35.80084228515625, "global_step": 74992, "epoch": 619} {"train_loss": -36.620540618896484, "global_step": 74993, "epoch": 619} {"train_loss": -35.974491119384766, "global_step": 74994, "epoch": 619} {"train_loss": -36.9241828918457, "global_step": 74995, "epoch": 619} {"train_loss": -35.7025146484375, "global_step": 74996, "epoch": 619} {"train_loss": -36.595149993896484, "global_step": 74997, "epoch": 619} {"train_loss": -36.58758544921875, "global_step": 74998, "epoch": 619} {"train_loss": -36.4815559387207, "global_step": 74999, "epoch": 619} {"train_loss": -37.154842376708984, "global_step": 75000, "epoch": 619} {"train_loss": -36.99136734008789, "global_step": 75001, "epoch": 619} {"train_loss": -36.31604766845703, "global_step": 75002, "epoch": 619} {"train_loss": -36.870784759521484, "global_step": 75003, "epoch": 619} {"train_loss": -37.16120529174805, "global_step": 75004, "epoch": 619} {"train_loss": -36.38486099243164, "global_step": 75005, "epoch": 619} {"train_loss": -37.367454528808594, "global_step": 75006, "epoch": 619} {"train_loss": -36.67381286621094, "global_step": 75007, "epoch": 619} {"train_loss": -37.22442626953125, "global_step": 75008, "epoch": 619} {"train_loss": -37.17818832397461, "global_step": 75009, "epoch": 619} {"train_loss": -37.4793586730957, "global_step": 75010, "epoch": 619} {"train_loss": -37.31376266479492, "global_step": 75011, "epoch": 619} {"train_loss": -37.570674896240234, "global_step": 75012, "epoch": 619} {"train_loss": -37.33042907714844, "global_step": 75013, "epoch": 619} {"train_loss": -37.09778594970703, "global_step": 75014, "epoch": 619} {"train_loss": -37.350563049316406, "global_step": 75015, "epoch": 619} {"train_loss": -37.00782012939453, "global_step": 75016, "epoch": 619} {"train_loss": -36.99978256225586, "global_step": 75017, "epoch": 619} {"train_loss": -37.432395935058594, "global_step": 75018, "epoch": 619} {"train_loss": -36.350921961886826, "global_step": 75019, "epoch": 619, "val_loss": 2733965.75} {"train_loss": -37.335792541503906, "global_step": 75020, "epoch": 620} {"train_loss": -36.894405364990234, "global_step": 75021, "epoch": 620} {"train_loss": -37.31460189819336, "global_step": 75022, "epoch": 620} {"train_loss": -36.05891799926758, "global_step": 75023, "epoch": 620} {"train_loss": -35.4756965637207, "global_step": 75024, "epoch": 620} {"train_loss": -35.04774475097656, "global_step": 75025, "epoch": 620} {"train_loss": -34.06461715698242, "global_step": 75026, "epoch": 620} {"train_loss": -26.69742202758789, "global_step": 75027, "epoch": 620} {"train_loss": -34.27967071533203, "global_step": 75028, "epoch": 620} {"train_loss": -35.243282318115234, "global_step": 75029, "epoch": 620} {"train_loss": -36.550132751464844, "global_step": 75030, "epoch": 620} {"train_loss": -34.06622314453125, "global_step": 75031, "epoch": 620} {"train_loss": -29.947418212890625, "global_step": 75032, "epoch": 620} {"train_loss": -35.99991989135742, "global_step": 75033, "epoch": 620} {"train_loss": -35.566646575927734, "global_step": 75034, "epoch": 620} {"train_loss": -36.01819610595703, "global_step": 75035, "epoch": 620} {"train_loss": -33.494361877441406, "global_step": 75036, "epoch": 620} {"train_loss": -29.726388931274414, "global_step": 75037, "epoch": 620} {"train_loss": -33.28609085083008, "global_step": 75038, "epoch": 620} {"train_loss": -35.9287223815918, "global_step": 75039, "epoch": 620} {"train_loss": -32.08739471435547, "global_step": 75040, "epoch": 620} {"train_loss": -33.71568298339844, "global_step": 75041, "epoch": 620} {"train_loss": -35.217708587646484, "global_step": 75042, "epoch": 620} {"train_loss": -34.34197998046875, "global_step": 75043, "epoch": 620} {"train_loss": -34.14162063598633, "global_step": 75044, "epoch": 620} {"train_loss": -32.4345588684082, "global_step": 75045, "epoch": 620} {"train_loss": -34.25254440307617, "global_step": 75046, "epoch": 620} {"train_loss": -34.03092956542969, "global_step": 75047, "epoch": 620} {"train_loss": -34.6993293762207, "global_step": 75048, "epoch": 620} {"train_loss": -31.873249053955078, "global_step": 75049, "epoch": 620} {"train_loss": -32.65266799926758, "global_step": 75050, "epoch": 620} {"train_loss": -33.91737747192383, "global_step": 75051, "epoch": 620} {"train_loss": -31.801969528198242, "global_step": 75052, "epoch": 620} {"train_loss": -34.63326644897461, "global_step": 75053, "epoch": 620} {"train_loss": -32.96946334838867, "global_step": 75054, "epoch": 620} {"train_loss": -35.19100570678711, "global_step": 75055, "epoch": 620} {"train_loss": -35.26890182495117, "global_step": 75056, "epoch": 620} {"train_loss": -34.21875, "global_step": 75057, "epoch": 620} {"train_loss": -33.930335998535156, "global_step": 75058, "epoch": 620} {"train_loss": -35.1784553527832, "global_step": 75059, "epoch": 620} {"train_loss": -33.6064567565918, "global_step": 75060, "epoch": 620} {"train_loss": -33.95539474487305, "global_step": 75061, "epoch": 620} {"train_loss": -34.072669982910156, "global_step": 75062, "epoch": 620} {"train_loss": -33.47494125366211, "global_step": 75063, "epoch": 620} {"train_loss": -34.46989822387695, "global_step": 75064, "epoch": 620} {"train_loss": -34.34233474731445, "global_step": 75065, "epoch": 620} {"train_loss": -34.86886978149414, "global_step": 75066, "epoch": 620} {"train_loss": -34.911102294921875, "global_step": 75067, "epoch": 620} {"train_loss": -35.58516311645508, "global_step": 75068, "epoch": 620} {"train_loss": -35.21516036987305, "global_step": 75069, "epoch": 620} {"train_loss": -35.93398666381836, "global_step": 75070, "epoch": 620} {"train_loss": -35.73713684082031, "global_step": 75071, "epoch": 620} {"train_loss": -34.48602294921875, "global_step": 75072, "epoch": 620} {"train_loss": -34.465301513671875, "global_step": 75073, "epoch": 620} {"train_loss": -35.02199172973633, "global_step": 75074, "epoch": 620} {"train_loss": -35.16557693481445, "global_step": 75075, "epoch": 620} {"train_loss": -35.542144775390625, "global_step": 75076, "epoch": 620} {"train_loss": -35.833187103271484, "global_step": 75077, "epoch": 620} {"train_loss": -35.53529739379883, "global_step": 75078, "epoch": 620} {"train_loss": -35.95107650756836, "global_step": 75079, "epoch": 620} {"train_loss": -35.78936767578125, "global_step": 75080, "epoch": 620} {"train_loss": -35.56711959838867, "global_step": 75081, "epoch": 620} {"train_loss": -35.46424102783203, "global_step": 75082, "epoch": 620} {"train_loss": -35.55775833129883, "global_step": 75083, "epoch": 620} {"train_loss": -36.528778076171875, "global_step": 75084, "epoch": 620} {"train_loss": -35.71001052856445, "global_step": 75085, "epoch": 620} {"train_loss": -36.40394592285156, "global_step": 75086, "epoch": 620} {"train_loss": -35.222713470458984, "global_step": 75087, "epoch": 620} {"train_loss": -35.24961853027344, "global_step": 75088, "epoch": 620} {"train_loss": -36.79487228393555, "global_step": 75089, "epoch": 620} {"train_loss": -36.07935333251953, "global_step": 75090, "epoch": 620} {"train_loss": -36.1616325378418, "global_step": 75091, "epoch": 620} {"train_loss": -35.40165328979492, "global_step": 75092, "epoch": 620} {"train_loss": -36.42327880859375, "global_step": 75093, "epoch": 620} {"train_loss": -36.35757064819336, "global_step": 75094, "epoch": 620} {"train_loss": -36.26792526245117, "global_step": 75095, "epoch": 620} {"train_loss": -36.29047775268555, "global_step": 75096, "epoch": 620} {"train_loss": -36.52476119995117, "global_step": 75097, "epoch": 620} {"train_loss": -36.40781784057617, "global_step": 75098, "epoch": 620} {"train_loss": -36.92702865600586, "global_step": 75099, "epoch": 620} {"train_loss": -36.995269775390625, "global_step": 75100, "epoch": 620} {"train_loss": -36.38215637207031, "global_step": 75101, "epoch": 620} {"train_loss": -36.1588249206543, "global_step": 75102, "epoch": 620} {"train_loss": -37.1358528137207, "global_step": 75103, "epoch": 620} {"train_loss": -36.84627151489258, "global_step": 75104, "epoch": 620} {"train_loss": -36.61904525756836, "global_step": 75105, "epoch": 620} {"train_loss": -36.70649337768555, "global_step": 75106, "epoch": 620} {"train_loss": -37.05935287475586, "global_step": 75107, "epoch": 620} {"train_loss": -35.32833480834961, "global_step": 75108, "epoch": 620} {"train_loss": -35.212703704833984, "global_step": 75109, "epoch": 620} {"train_loss": -36.803524017333984, "global_step": 75110, "epoch": 620} {"train_loss": -34.221675872802734, "global_step": 75111, "epoch": 620} {"train_loss": -37.2083625793457, "global_step": 75112, "epoch": 620} {"train_loss": -34.94304275512695, "global_step": 75113, "epoch": 620} {"train_loss": -36.96078109741211, "global_step": 75114, "epoch": 620} {"train_loss": -35.21416473388672, "global_step": 75115, "epoch": 620} {"train_loss": -37.01144027709961, "global_step": 75116, "epoch": 620} {"train_loss": -35.989139556884766, "global_step": 75117, "epoch": 620} {"train_loss": -36.26621627807617, "global_step": 75118, "epoch": 620} {"train_loss": -36.19404220581055, "global_step": 75119, "epoch": 620} {"train_loss": -36.70228958129883, "global_step": 75120, "epoch": 620} {"train_loss": -35.40252685546875, "global_step": 75121, "epoch": 620} {"train_loss": -36.83662796020508, "global_step": 75122, "epoch": 620} {"train_loss": -36.013214111328125, "global_step": 75123, "epoch": 620} {"train_loss": -36.736663818359375, "global_step": 75124, "epoch": 620} {"train_loss": -37.05269241333008, "global_step": 75125, "epoch": 620} {"train_loss": -35.59242248535156, "global_step": 75126, "epoch": 620} {"train_loss": -36.29877853393555, "global_step": 75127, "epoch": 620} {"train_loss": -35.929481506347656, "global_step": 75128, "epoch": 620} {"train_loss": -37.16530990600586, "global_step": 75129, "epoch": 620} {"train_loss": -35.429622650146484, "global_step": 75130, "epoch": 620} {"train_loss": -36.58293151855469, "global_step": 75131, "epoch": 620} {"train_loss": -34.91575241088867, "global_step": 75132, "epoch": 620} {"train_loss": -35.0942268371582, "global_step": 75133, "epoch": 620} {"train_loss": -35.9799690246582, "global_step": 75134, "epoch": 620} {"train_loss": -34.6490364074707, "global_step": 75135, "epoch": 620} {"train_loss": -36.94355010986328, "global_step": 75136, "epoch": 620} {"train_loss": -36.210018157958984, "global_step": 75137, "epoch": 620} {"train_loss": -36.99393844604492, "global_step": 75138, "epoch": 620} {"train_loss": -36.62876510620117, "global_step": 75139, "epoch": 620} {"train_loss": -35.279162351750145, "global_step": 75140, "epoch": 620, "val_loss": 2680068.25} {"train_loss": -36.51139450073242, "global_step": 75141, "epoch": 621} {"train_loss": -35.662261962890625, "global_step": 75142, "epoch": 621} {"train_loss": -36.847347259521484, "global_step": 75143, "epoch": 621} {"train_loss": -35.451019287109375, "global_step": 75144, "epoch": 621} {"train_loss": -36.361175537109375, "global_step": 75145, "epoch": 621} {"train_loss": -36.716796875, "global_step": 75146, "epoch": 621} {"train_loss": -36.92439270019531, "global_step": 75147, "epoch": 621} {"train_loss": -35.58077621459961, "global_step": 75148, "epoch": 621} {"train_loss": -37.3986701965332, "global_step": 75149, "epoch": 621} {"train_loss": -36.941436767578125, "global_step": 75150, "epoch": 621} {"train_loss": -36.98735427856445, "global_step": 75151, "epoch": 621} {"train_loss": -37.38138961791992, "global_step": 75152, "epoch": 621} {"train_loss": -37.519813537597656, "global_step": 75153, "epoch": 621} {"train_loss": -36.95531463623047, "global_step": 75154, "epoch": 621} {"train_loss": -37.12865447998047, "global_step": 75155, "epoch": 621} {"train_loss": -37.551265716552734, "global_step": 75156, "epoch": 621} {"train_loss": -37.51325607299805, "global_step": 75157, "epoch": 621} {"train_loss": -37.20170211791992, "global_step": 75158, "epoch": 621} {"train_loss": -37.354103088378906, "global_step": 75159, "epoch": 621} {"train_loss": -37.4119987487793, "global_step": 75160, "epoch": 621} {"train_loss": -37.20448684692383, "global_step": 75161, "epoch": 621} {"train_loss": -36.99443435668945, "global_step": 75162, "epoch": 621} {"train_loss": -37.00718688964844, "global_step": 75163, "epoch": 621} {"train_loss": -36.86879348754883, "global_step": 75164, "epoch": 621} {"train_loss": -37.524993896484375, "global_step": 75165, "epoch": 621} {"train_loss": -37.4911994934082, "global_step": 75166, "epoch": 621} {"train_loss": -36.97481155395508, "global_step": 75167, "epoch": 621} {"train_loss": -36.800384521484375, "global_step": 75168, "epoch": 621} {"train_loss": -37.51787567138672, "global_step": 75169, "epoch": 621} {"train_loss": -36.72256088256836, "global_step": 75170, "epoch": 621} {"train_loss": -36.0247802734375, "global_step": 75171, "epoch": 621} {"train_loss": -36.15385818481445, "global_step": 75172, "epoch": 621} {"train_loss": -37.53831100463867, "global_step": 75173, "epoch": 621} {"train_loss": -36.35453414916992, "global_step": 75174, "epoch": 621} {"train_loss": -36.60899353027344, "global_step": 75175, "epoch": 621} {"train_loss": -36.91593551635742, "global_step": 75176, "epoch": 621} {"train_loss": -36.92034912109375, "global_step": 75177, "epoch": 621} {"train_loss": -37.382232666015625, "global_step": 75178, "epoch": 621} {"train_loss": -37.39970016479492, "global_step": 75179, "epoch": 621} {"train_loss": -36.46711349487305, "global_step": 75180, "epoch": 621} {"train_loss": -37.20603942871094, "global_step": 75181, "epoch": 621} {"train_loss": -36.80807113647461, "global_step": 75182, "epoch": 621} {"train_loss": -36.3668212890625, "global_step": 75183, "epoch": 621} {"train_loss": -37.09785079956055, "global_step": 75184, "epoch": 621} {"train_loss": -36.631778717041016, "global_step": 75185, "epoch": 621} {"train_loss": -35.8921012878418, "global_step": 75186, "epoch": 621} {"train_loss": -37.16492462158203, "global_step": 75187, "epoch": 621} {"train_loss": -37.78705596923828, "global_step": 75188, "epoch": 621} {"train_loss": -36.19985580444336, "global_step": 75189, "epoch": 621} {"train_loss": -35.07344436645508, "global_step": 75190, "epoch": 621} {"train_loss": -36.471073150634766, "global_step": 75191, "epoch": 621} {"train_loss": -37.21511459350586, "global_step": 75192, "epoch": 621} {"train_loss": -36.4006462097168, "global_step": 75193, "epoch": 621} {"train_loss": -36.29537582397461, "global_step": 75194, "epoch": 621} {"train_loss": -36.30221176147461, "global_step": 75195, "epoch": 621} {"train_loss": -36.198734283447266, "global_step": 75196, "epoch": 621} {"train_loss": -36.88070297241211, "global_step": 75197, "epoch": 621} {"train_loss": -36.106746673583984, "global_step": 75198, "epoch": 621} {"train_loss": -32.52653884887695, "global_step": 75199, "epoch": 621} {"train_loss": -21.30368423461914, "global_step": 75200, "epoch": 621} {"train_loss": -29.283735275268555, "global_step": 75201, "epoch": 621} {"train_loss": -31.79960060119629, "global_step": 75202, "epoch": 621} {"train_loss": -29.5465030670166, "global_step": 75203, "epoch": 621} {"train_loss": -27.817670822143555, "global_step": 75204, "epoch": 621} {"train_loss": -31.102643966674805, "global_step": 75205, "epoch": 621} {"train_loss": -29.753604888916016, "global_step": 75206, "epoch": 621} {"train_loss": -28.877384185791016, "global_step": 75207, "epoch": 621} {"train_loss": -30.80646324157715, "global_step": 75208, "epoch": 621} {"train_loss": -29.21317481994629, "global_step": 75209, "epoch": 621} {"train_loss": -27.083698272705078, "global_step": 75210, "epoch": 621} {"train_loss": -30.344282150268555, "global_step": 75211, "epoch": 621} {"train_loss": -32.10530471801758, "global_step": 75212, "epoch": 621} {"train_loss": -31.651615142822266, "global_step": 75213, "epoch": 621} {"train_loss": -31.84846305847168, "global_step": 75214, "epoch": 621} {"train_loss": -28.14501953125, "global_step": 75215, "epoch": 621} {"train_loss": -32.444332122802734, "global_step": 75216, "epoch": 621} {"train_loss": -31.1884822845459, "global_step": 75217, "epoch": 621} {"train_loss": -30.050031661987305, "global_step": 75218, "epoch": 621} {"train_loss": -31.55862808227539, "global_step": 75219, "epoch": 621} {"train_loss": -30.838638305664062, "global_step": 75220, "epoch": 621} {"train_loss": -31.4974422454834, "global_step": 75221, "epoch": 621} {"train_loss": -32.97440719604492, "global_step": 75222, "epoch": 621} {"train_loss": -32.522377014160156, "global_step": 75223, "epoch": 621} {"train_loss": -31.3185977935791, "global_step": 75224, "epoch": 621} {"train_loss": -32.214691162109375, "global_step": 75225, "epoch": 621} {"train_loss": -33.05786895751953, "global_step": 75226, "epoch": 621} {"train_loss": -33.137855529785156, "global_step": 75227, "epoch": 621} {"train_loss": -31.189916610717773, "global_step": 75228, "epoch": 621} {"train_loss": -32.934505462646484, "global_step": 75229, "epoch": 621} {"train_loss": -33.48178482055664, "global_step": 75230, "epoch": 621} {"train_loss": -32.487335205078125, "global_step": 75231, "epoch": 621} {"train_loss": -32.9443244934082, "global_step": 75232, "epoch": 621} {"train_loss": -33.12880325317383, "global_step": 75233, "epoch": 621} {"train_loss": -33.77909469604492, "global_step": 75234, "epoch": 621} {"train_loss": -33.404109954833984, "global_step": 75235, "epoch": 621} {"train_loss": -33.53278732299805, "global_step": 75236, "epoch": 621} {"train_loss": -33.03451919555664, "global_step": 75237, "epoch": 621} {"train_loss": -33.73133087158203, "global_step": 75238, "epoch": 621} {"train_loss": -33.59785842895508, "global_step": 75239, "epoch": 621} {"train_loss": -34.07447052001953, "global_step": 75240, "epoch": 621} {"train_loss": -34.279876708984375, "global_step": 75241, "epoch": 621} {"train_loss": -33.803707122802734, "global_step": 75242, "epoch": 621} {"train_loss": -34.04012680053711, "global_step": 75243, "epoch": 621} {"train_loss": -34.31434631347656, "global_step": 75244, "epoch": 621} {"train_loss": -34.921566009521484, "global_step": 75245, "epoch": 621} {"train_loss": -34.28245162963867, "global_step": 75246, "epoch": 621} {"train_loss": -34.42403030395508, "global_step": 75247, "epoch": 621} {"train_loss": -33.94987106323242, "global_step": 75248, "epoch": 621} {"train_loss": -34.87175369262695, "global_step": 75249, "epoch": 621} {"train_loss": -34.802791595458984, "global_step": 75250, "epoch": 621} {"train_loss": -34.64994812011719, "global_step": 75251, "epoch": 621} {"train_loss": -34.83964538574219, "global_step": 75252, "epoch": 621} {"train_loss": -34.56373977661133, "global_step": 75253, "epoch": 621} {"train_loss": -35.14656448364258, "global_step": 75254, "epoch": 621} {"train_loss": -34.8763313293457, "global_step": 75255, "epoch": 621} {"train_loss": -35.10634994506836, "global_step": 75256, "epoch": 621} {"train_loss": -34.46370315551758, "global_step": 75257, "epoch": 621} {"train_loss": -35.46086120605469, "global_step": 75258, "epoch": 621} {"train_loss": -35.1866340637207, "global_step": 75259, "epoch": 621} {"train_loss": -35.172115325927734, "global_step": 75260, "epoch": 621} {"train_loss": -34.54751561692924, "global_step": 75261, "epoch": 621, "val_loss": 2739987.25} {"train_loss": -35.3073844909668, "global_step": 75262, "epoch": 622} {"train_loss": -35.64949417114258, "global_step": 75263, "epoch": 622} {"train_loss": -35.11909103393555, "global_step": 75264, "epoch": 622} {"train_loss": -35.71173858642578, "global_step": 75265, "epoch": 622} {"train_loss": -35.52810287475586, "global_step": 75266, "epoch": 622} {"train_loss": -35.786685943603516, "global_step": 75267, "epoch": 622} {"train_loss": -35.86054611206055, "global_step": 75268, "epoch": 622} {"train_loss": -35.92637252807617, "global_step": 75269, "epoch": 622} {"train_loss": -35.81070327758789, "global_step": 75270, "epoch": 622} {"train_loss": -36.0327033996582, "global_step": 75271, "epoch": 622} {"train_loss": -35.622406005859375, "global_step": 75272, "epoch": 622} {"train_loss": -35.825462341308594, "global_step": 75273, "epoch": 622} {"train_loss": -36.385677337646484, "global_step": 75274, "epoch": 622} {"train_loss": -35.90031051635742, "global_step": 75275, "epoch": 622} {"train_loss": -36.015933990478516, "global_step": 75276, "epoch": 622} {"train_loss": -35.88008499145508, "global_step": 75277, "epoch": 622} {"train_loss": -35.9133415222168, "global_step": 75278, "epoch": 622} {"train_loss": -36.092620849609375, "global_step": 75279, "epoch": 622} {"train_loss": -36.21208572387695, "global_step": 75280, "epoch": 622} {"train_loss": -36.120567321777344, "global_step": 75281, "epoch": 622} {"train_loss": -36.105464935302734, "global_step": 75282, "epoch": 622} {"train_loss": -35.5033073425293, "global_step": 75283, "epoch": 622} {"train_loss": -35.6883659362793, "global_step": 75284, "epoch": 622} {"train_loss": -36.06076431274414, "global_step": 75285, "epoch": 622} {"train_loss": -36.21284103393555, "global_step": 75286, "epoch": 622} {"train_loss": -36.162410736083984, "global_step": 75287, "epoch": 622} {"train_loss": -36.48136520385742, "global_step": 75288, "epoch": 622} {"train_loss": -36.373931884765625, "global_step": 75289, "epoch": 622} {"train_loss": -36.10013198852539, "global_step": 75290, "epoch": 622} {"train_loss": -36.3980712890625, "global_step": 75291, "epoch": 622} {"train_loss": -37.05022048950195, "global_step": 75292, "epoch": 622} {"train_loss": -36.38044357299805, "global_step": 75293, "epoch": 622} {"train_loss": -36.37656784057617, "global_step": 75294, "epoch": 622} {"train_loss": -36.44034957885742, "global_step": 75295, "epoch": 622} {"train_loss": -36.58888244628906, "global_step": 75296, "epoch": 622} {"train_loss": -36.981815338134766, "global_step": 75297, "epoch": 622} {"train_loss": -36.7896842956543, "global_step": 75298, "epoch": 622} {"train_loss": -36.364463806152344, "global_step": 75299, "epoch": 622} {"train_loss": -36.28768539428711, "global_step": 75300, "epoch": 622} {"train_loss": -36.261505126953125, "global_step": 75301, "epoch": 622} {"train_loss": -33.575523376464844, "global_step": 75302, "epoch": 622} {"train_loss": -30.993335723876953, "global_step": 75303, "epoch": 622} {"train_loss": -25.03154182434082, "global_step": 75304, "epoch": 622} {"train_loss": -13.346919059753418, "global_step": 75305, "epoch": 622} {"train_loss": 11.795479774475098, "global_step": 75306, "epoch": 622} {"train_loss": -15.116194725036621, "global_step": 75307, "epoch": 622} {"train_loss": -28.142255783081055, "global_step": 75308, "epoch": 622} {"train_loss": -22.033119201660156, "global_step": 75309, "epoch": 622} {"train_loss": -26.208417892456055, "global_step": 75310, "epoch": 622} {"train_loss": -28.689727783203125, "global_step": 75311, "epoch": 622} {"train_loss": -24.246173858642578, "global_step": 75312, "epoch": 622} {"train_loss": -34.14213180541992, "global_step": 75313, "epoch": 622} {"train_loss": -30.01032066345215, "global_step": 75314, "epoch": 622} {"train_loss": -29.297082901000977, "global_step": 75315, "epoch": 622} {"train_loss": -34.16748809814453, "global_step": 75316, "epoch": 622} {"train_loss": -33.885860443115234, "global_step": 75317, "epoch": 622} {"train_loss": -30.987424850463867, "global_step": 75318, "epoch": 622} {"train_loss": -32.187374114990234, "global_step": 75319, "epoch": 622} {"train_loss": -34.24211502075195, "global_step": 75320, "epoch": 622} {"train_loss": -34.76510238647461, "global_step": 75321, "epoch": 622} {"train_loss": -33.401973724365234, "global_step": 75322, "epoch": 622} {"train_loss": -32.90534210205078, "global_step": 75323, "epoch": 622} {"train_loss": -34.20868682861328, "global_step": 75324, "epoch": 622} {"train_loss": -34.966609954833984, "global_step": 75325, "epoch": 622} {"train_loss": -34.565303802490234, "global_step": 75326, "epoch": 622} {"train_loss": -34.165245056152344, "global_step": 75327, "epoch": 622} {"train_loss": -34.62477111816406, "global_step": 75328, "epoch": 622} {"train_loss": -34.89388656616211, "global_step": 75329, "epoch": 622} {"train_loss": -34.89681625366211, "global_step": 75330, "epoch": 622} {"train_loss": -35.4368782043457, "global_step": 75331, "epoch": 622} {"train_loss": -34.98775100708008, "global_step": 75332, "epoch": 622} {"train_loss": -35.47088623046875, "global_step": 75333, "epoch": 622} {"train_loss": -35.09537124633789, "global_step": 75334, "epoch": 622} {"train_loss": -35.36127471923828, "global_step": 75335, "epoch": 622} {"train_loss": -35.394771575927734, "global_step": 75336, "epoch": 622} {"train_loss": -35.343318939208984, "global_step": 75337, "epoch": 622} {"train_loss": -35.19883346557617, "global_step": 75338, "epoch": 622} {"train_loss": -35.52638626098633, "global_step": 75339, "epoch": 622} {"train_loss": -35.469783782958984, "global_step": 75340, "epoch": 622} {"train_loss": -35.44231033325195, "global_step": 75341, "epoch": 622} {"train_loss": -35.967864990234375, "global_step": 75342, "epoch": 622} {"train_loss": -35.8620719909668, "global_step": 75343, "epoch": 622} {"train_loss": -35.66978073120117, "global_step": 75344, "epoch": 622} {"train_loss": -35.755680084228516, "global_step": 75345, "epoch": 622} {"train_loss": -36.4302978515625, "global_step": 75346, "epoch": 622} {"train_loss": -35.866249084472656, "global_step": 75347, "epoch": 622} {"train_loss": -36.07487106323242, "global_step": 75348, "epoch": 622} {"train_loss": -36.266658782958984, "global_step": 75349, "epoch": 622} {"train_loss": -36.06159591674805, "global_step": 75350, "epoch": 622} {"train_loss": -36.39870834350586, "global_step": 75351, "epoch": 622} {"train_loss": -36.50804138183594, "global_step": 75352, "epoch": 622} {"train_loss": -36.32066345214844, "global_step": 75353, "epoch": 622} {"train_loss": -36.35652160644531, "global_step": 75354, "epoch": 622} {"train_loss": -36.07939529418945, "global_step": 75355, "epoch": 622} {"train_loss": -36.48604965209961, "global_step": 75356, "epoch": 622} {"train_loss": -36.603023529052734, "global_step": 75357, "epoch": 622} {"train_loss": -36.31455612182617, "global_step": 75358, "epoch": 622} {"train_loss": -36.991695404052734, "global_step": 75359, "epoch": 622} {"train_loss": -36.65912628173828, "global_step": 75360, "epoch": 622} {"train_loss": -36.611663818359375, "global_step": 75361, "epoch": 622} {"train_loss": -36.951812744140625, "global_step": 75362, "epoch": 622} {"train_loss": -36.379024505615234, "global_step": 75363, "epoch": 622} {"train_loss": -36.216854095458984, "global_step": 75364, "epoch": 622} {"train_loss": -36.695648193359375, "global_step": 75365, "epoch": 622} {"train_loss": -36.7985954284668, "global_step": 75366, "epoch": 622} {"train_loss": -37.25442886352539, "global_step": 75367, "epoch": 622} {"train_loss": -36.74717330932617, "global_step": 75368, "epoch": 622} {"train_loss": -36.854427337646484, "global_step": 75369, "epoch": 622} {"train_loss": -36.662288665771484, "global_step": 75370, "epoch": 622} {"train_loss": -37.06481170654297, "global_step": 75371, "epoch": 622} {"train_loss": -36.76061248779297, "global_step": 75372, "epoch": 622} {"train_loss": -37.22174835205078, "global_step": 75373, "epoch": 622} {"train_loss": -36.87472152709961, "global_step": 75374, "epoch": 622} {"train_loss": -36.86026382446289, "global_step": 75375, "epoch": 622} {"train_loss": -37.033477783203125, "global_step": 75376, "epoch": 622} {"train_loss": -36.98788070678711, "global_step": 75377, "epoch": 622} {"train_loss": -37.07659912109375, "global_step": 75378, "epoch": 622} {"train_loss": -36.911067962646484, "global_step": 75379, "epoch": 622} {"train_loss": -37.31987762451172, "global_step": 75380, "epoch": 622} {"train_loss": -36.85786056518555, "global_step": 75381, "epoch": 622} {"train_loss": -34.46149139561929, "global_step": 75382, "epoch": 622, "val_loss": 2741505.0} {"train_loss": -36.962406158447266, "global_step": 75383, "epoch": 623} {"train_loss": -37.14876937866211, "global_step": 75384, "epoch": 623} {"train_loss": -37.251224517822266, "global_step": 75385, "epoch": 623} {"train_loss": -36.95327377319336, "global_step": 75386, "epoch": 623} {"train_loss": -37.43920135498047, "global_step": 75387, "epoch": 623} {"train_loss": -37.3272705078125, "global_step": 75388, "epoch": 623} {"train_loss": -37.383880615234375, "global_step": 75389, "epoch": 623} {"train_loss": -37.08486557006836, "global_step": 75390, "epoch": 623} {"train_loss": -37.212955474853516, "global_step": 75391, "epoch": 623} {"train_loss": -35.92902755737305, "global_step": 75392, "epoch": 623} {"train_loss": -37.805904388427734, "global_step": 75393, "epoch": 623} {"train_loss": -37.57230758666992, "global_step": 75394, "epoch": 623} {"train_loss": -37.31303024291992, "global_step": 75395, "epoch": 623} {"train_loss": -36.68740463256836, "global_step": 75396, "epoch": 623} {"train_loss": -36.385154724121094, "global_step": 75397, "epoch": 623} {"train_loss": -36.04289245605469, "global_step": 75398, "epoch": 623} {"train_loss": -37.416561126708984, "global_step": 75399, "epoch": 623} {"train_loss": -37.351722717285156, "global_step": 75400, "epoch": 623} {"train_loss": -36.49027633666992, "global_step": 75401, "epoch": 623} {"train_loss": -36.15255355834961, "global_step": 75402, "epoch": 623} {"train_loss": -36.0294189453125, "global_step": 75403, "epoch": 623} {"train_loss": -36.700599670410156, "global_step": 75404, "epoch": 623} {"train_loss": -35.50259017944336, "global_step": 75405, "epoch": 623} {"train_loss": -36.405723571777344, "global_step": 75406, "epoch": 623} {"train_loss": -35.47433853149414, "global_step": 75407, "epoch": 623} {"train_loss": -34.677520751953125, "global_step": 75408, "epoch": 623} {"train_loss": -36.21339416503906, "global_step": 75409, "epoch": 623} {"train_loss": -36.83242416381836, "global_step": 75410, "epoch": 623} {"train_loss": -34.92265701293945, "global_step": 75411, "epoch": 623} {"train_loss": -34.98048782348633, "global_step": 75412, "epoch": 623} {"train_loss": -32.89023971557617, "global_step": 75413, "epoch": 623} {"train_loss": -32.13343811035156, "global_step": 75414, "epoch": 623} {"train_loss": -33.57985305786133, "global_step": 75415, "epoch": 623} {"train_loss": -36.957584381103516, "global_step": 75416, "epoch": 623} {"train_loss": -36.97422409057617, "global_step": 75417, "epoch": 623} {"train_loss": -34.882625579833984, "global_step": 75418, "epoch": 623} {"train_loss": -34.66758728027344, "global_step": 75419, "epoch": 623} {"train_loss": -35.8088264465332, "global_step": 75420, "epoch": 623} {"train_loss": -35.555572509765625, "global_step": 75421, "epoch": 623} {"train_loss": -36.00886154174805, "global_step": 75422, "epoch": 623} {"train_loss": -36.7376594543457, "global_step": 75423, "epoch": 623} {"train_loss": -35.510738372802734, "global_step": 75424, "epoch": 623} {"train_loss": -35.51357650756836, "global_step": 75425, "epoch": 623} {"train_loss": -36.86323928833008, "global_step": 75426, "epoch": 623} {"train_loss": -35.434696197509766, "global_step": 75427, "epoch": 623} {"train_loss": -35.180999755859375, "global_step": 75428, "epoch": 623} {"train_loss": -36.37929153442383, "global_step": 75429, "epoch": 623} {"train_loss": -36.49785232543945, "global_step": 75430, "epoch": 623} {"train_loss": -34.328102111816406, "global_step": 75431, "epoch": 623} {"train_loss": -34.82271194458008, "global_step": 75432, "epoch": 623} {"train_loss": -36.44658279418945, "global_step": 75433, "epoch": 623} {"train_loss": -34.100738525390625, "global_step": 75434, "epoch": 623} {"train_loss": -34.215423583984375, "global_step": 75435, "epoch": 623} {"train_loss": -36.280643463134766, "global_step": 75436, "epoch": 623} {"train_loss": -35.57874298095703, "global_step": 75437, "epoch": 623} {"train_loss": -35.9786491394043, "global_step": 75438, "epoch": 623} {"train_loss": -36.81355285644531, "global_step": 75439, "epoch": 623} {"train_loss": -36.637115478515625, "global_step": 75440, "epoch": 623} {"train_loss": -35.63939666748047, "global_step": 75441, "epoch": 623} {"train_loss": -31.724206924438477, "global_step": 75442, "epoch": 623} {"train_loss": -36.00950241088867, "global_step": 75443, "epoch": 623} {"train_loss": -36.00614547729492, "global_step": 75444, "epoch": 623} {"train_loss": -36.08445358276367, "global_step": 75445, "epoch": 623} {"train_loss": -36.260826110839844, "global_step": 75446, "epoch": 623} {"train_loss": -35.404083251953125, "global_step": 75447, "epoch": 623} {"train_loss": -35.5102653503418, "global_step": 75448, "epoch": 623} {"train_loss": -35.62807846069336, "global_step": 75449, "epoch": 623} {"train_loss": -35.61444854736328, "global_step": 75450, "epoch": 623} {"train_loss": -35.431243896484375, "global_step": 75451, "epoch": 623} {"train_loss": -34.67551803588867, "global_step": 75452, "epoch": 623} {"train_loss": -35.80210876464844, "global_step": 75453, "epoch": 623} {"train_loss": -35.61497116088867, "global_step": 75454, "epoch": 623} {"train_loss": -35.756526947021484, "global_step": 75455, "epoch": 623} {"train_loss": -35.69919967651367, "global_step": 75456, "epoch": 623} {"train_loss": -35.78341293334961, "global_step": 75457, "epoch": 623} {"train_loss": -36.795074462890625, "global_step": 75458, "epoch": 623} {"train_loss": -35.34938430786133, "global_step": 75459, "epoch": 623} {"train_loss": -36.409664154052734, "global_step": 75460, "epoch": 623} {"train_loss": -36.04853439331055, "global_step": 75461, "epoch": 623} {"train_loss": -36.920658111572266, "global_step": 75462, "epoch": 623} {"train_loss": -36.732234954833984, "global_step": 75463, "epoch": 623} {"train_loss": -36.743038177490234, "global_step": 75464, "epoch": 623} {"train_loss": -36.52427673339844, "global_step": 75465, "epoch": 623} {"train_loss": -35.56365966796875, "global_step": 75466, "epoch": 623} {"train_loss": -36.273841857910156, "global_step": 75467, "epoch": 623} {"train_loss": -36.68561553955078, "global_step": 75468, "epoch": 623} {"train_loss": -36.539730072021484, "global_step": 75469, "epoch": 623} {"train_loss": -37.29502487182617, "global_step": 75470, "epoch": 623} {"train_loss": -36.55086135864258, "global_step": 75471, "epoch": 623} {"train_loss": -36.74210739135742, "global_step": 75472, "epoch": 623} {"train_loss": -36.955780029296875, "global_step": 75473, "epoch": 623} {"train_loss": -36.936824798583984, "global_step": 75474, "epoch": 623} {"train_loss": -36.79413986206055, "global_step": 75475, "epoch": 623} {"train_loss": -36.739559173583984, "global_step": 75476, "epoch": 623} {"train_loss": -37.30835723876953, "global_step": 75477, "epoch": 623} {"train_loss": -36.7614860534668, "global_step": 75478, "epoch": 623} {"train_loss": -36.83246994018555, "global_step": 75479, "epoch": 623} {"train_loss": -37.03566360473633, "global_step": 75480, "epoch": 623} {"train_loss": -36.294189453125, "global_step": 75481, "epoch": 623} {"train_loss": -36.81471633911133, "global_step": 75482, "epoch": 623} {"train_loss": -36.58549118041992, "global_step": 75483, "epoch": 623} {"train_loss": -35.55382537841797, "global_step": 75484, "epoch": 623} {"train_loss": -36.64116287231445, "global_step": 75485, "epoch": 623} {"train_loss": -36.820796966552734, "global_step": 75486, "epoch": 623} {"train_loss": -36.034053802490234, "global_step": 75487, "epoch": 623} {"train_loss": -34.3379020690918, "global_step": 75488, "epoch": 623} {"train_loss": -36.856842041015625, "global_step": 75489, "epoch": 623} {"train_loss": -36.09278106689453, "global_step": 75490, "epoch": 623} {"train_loss": -36.638004302978516, "global_step": 75491, "epoch": 623} {"train_loss": -34.2287712097168, "global_step": 75492, "epoch": 623} {"train_loss": -36.72703170776367, "global_step": 75493, "epoch": 623} {"train_loss": -36.8154411315918, "global_step": 75494, "epoch": 623} {"train_loss": -35.87701416015625, "global_step": 75495, "epoch": 623} {"train_loss": -33.95402145385742, "global_step": 75496, "epoch": 623} {"train_loss": -36.45641326904297, "global_step": 75497, "epoch": 623} {"train_loss": -35.95376205444336, "global_step": 75498, "epoch": 623} {"train_loss": -35.4914436340332, "global_step": 75499, "epoch": 623} {"train_loss": -35.9162483215332, "global_step": 75500, "epoch": 623} {"train_loss": -36.598812103271484, "global_step": 75501, "epoch": 623} {"train_loss": -35.820648193359375, "global_step": 75502, "epoch": 623} {"train_loss": -36.06328555966212, "global_step": 75503, "epoch": 623, "val_loss": 2716070.0} {"train_loss": -35.882747650146484, "global_step": 75504, "epoch": 624} {"train_loss": -36.54079818725586, "global_step": 75505, "epoch": 624} {"train_loss": -36.791255950927734, "global_step": 75506, "epoch": 624} {"train_loss": -36.871185302734375, "global_step": 75507, "epoch": 624} {"train_loss": -36.95661926269531, "global_step": 75508, "epoch": 624} {"train_loss": -36.55644607543945, "global_step": 75509, "epoch": 624} {"train_loss": -36.98016357421875, "global_step": 75510, "epoch": 624} {"train_loss": -36.0411262512207, "global_step": 75511, "epoch": 624} {"train_loss": -36.917781829833984, "global_step": 75512, "epoch": 624} {"train_loss": -35.979095458984375, "global_step": 75513, "epoch": 624} {"train_loss": -36.60475158691406, "global_step": 75514, "epoch": 624} {"train_loss": -36.985565185546875, "global_step": 75515, "epoch": 624} {"train_loss": -36.43037033081055, "global_step": 75516, "epoch": 624} {"train_loss": -36.999874114990234, "global_step": 75517, "epoch": 624} {"train_loss": -36.967403411865234, "global_step": 75518, "epoch": 624} {"train_loss": -36.750946044921875, "global_step": 75519, "epoch": 624} {"train_loss": -36.32858657836914, "global_step": 75520, "epoch": 624} {"train_loss": -36.393768310546875, "global_step": 75521, "epoch": 624} {"train_loss": -35.70447540283203, "global_step": 75522, "epoch": 624} {"train_loss": -36.854854583740234, "global_step": 75523, "epoch": 624} {"train_loss": -35.79719161987305, "global_step": 75524, "epoch": 624} {"train_loss": -34.51800537109375, "global_step": 75525, "epoch": 624} {"train_loss": -35.8123893737793, "global_step": 75526, "epoch": 624} {"train_loss": -35.65509796142578, "global_step": 75527, "epoch": 624} {"train_loss": -36.615501403808594, "global_step": 75528, "epoch": 624} {"train_loss": -36.72529220581055, "global_step": 75529, "epoch": 624} {"train_loss": -35.09945297241211, "global_step": 75530, "epoch": 624} {"train_loss": -36.11469650268555, "global_step": 75531, "epoch": 624} {"train_loss": -34.49231719970703, "global_step": 75532, "epoch": 624} {"train_loss": -34.11741256713867, "global_step": 75533, "epoch": 624} {"train_loss": -33.858943939208984, "global_step": 75534, "epoch": 624} {"train_loss": -34.6563720703125, "global_step": 75535, "epoch": 624} {"train_loss": -30.771818161010742, "global_step": 75536, "epoch": 624} {"train_loss": -27.83154296875, "global_step": 75537, "epoch": 624} {"train_loss": -30.809030532836914, "global_step": 75538, "epoch": 624} {"train_loss": -35.59125518798828, "global_step": 75539, "epoch": 624} {"train_loss": -34.190181732177734, "global_step": 75540, "epoch": 624} {"train_loss": -33.54972457885742, "global_step": 75541, "epoch": 624} {"train_loss": -34.79655075073242, "global_step": 75542, "epoch": 624} {"train_loss": -35.0158805847168, "global_step": 75543, "epoch": 624} {"train_loss": -35.90974044799805, "global_step": 75544, "epoch": 624} {"train_loss": -35.65768051147461, "global_step": 75545, "epoch": 624} {"train_loss": -34.74796676635742, "global_step": 75546, "epoch": 624} {"train_loss": -33.85919952392578, "global_step": 75547, "epoch": 624} {"train_loss": -35.634830474853516, "global_step": 75548, "epoch": 624} {"train_loss": -35.3723030090332, "global_step": 75549, "epoch": 624} {"train_loss": -35.99430465698242, "global_step": 75550, "epoch": 624} {"train_loss": -35.47201156616211, "global_step": 75551, "epoch": 624} {"train_loss": -36.3171501159668, "global_step": 75552, "epoch": 624} {"train_loss": -35.79753112792969, "global_step": 75553, "epoch": 624} {"train_loss": -36.30868911743164, "global_step": 75554, "epoch": 624} {"train_loss": -35.0439567565918, "global_step": 75555, "epoch": 624} {"train_loss": -35.27268600463867, "global_step": 75556, "epoch": 624} {"train_loss": -36.19753646850586, "global_step": 75557, "epoch": 624} {"train_loss": -36.29439926147461, "global_step": 75558, "epoch": 624} {"train_loss": -36.11909103393555, "global_step": 75559, "epoch": 624} {"train_loss": -35.79572677612305, "global_step": 75560, "epoch": 624} {"train_loss": -36.01686477661133, "global_step": 75561, "epoch": 624} {"train_loss": -35.71677780151367, "global_step": 75562, "epoch": 624} {"train_loss": -35.99922561645508, "global_step": 75563, "epoch": 624} {"train_loss": -36.206085205078125, "global_step": 75564, "epoch": 624} {"train_loss": -34.848182678222656, "global_step": 75565, "epoch": 624} {"train_loss": -36.02223205566406, "global_step": 75566, "epoch": 624} {"train_loss": -36.89609909057617, "global_step": 75567, "epoch": 624} {"train_loss": -35.9782829284668, "global_step": 75568, "epoch": 624} {"train_loss": -36.20976638793945, "global_step": 75569, "epoch": 624} {"train_loss": -36.217002868652344, "global_step": 75570, "epoch": 624} {"train_loss": -35.98826217651367, "global_step": 75571, "epoch": 624} {"train_loss": -36.43613815307617, "global_step": 75572, "epoch": 624} {"train_loss": -36.64250183105469, "global_step": 75573, "epoch": 624} {"train_loss": -36.72113800048828, "global_step": 75574, "epoch": 624} {"train_loss": -36.49943161010742, "global_step": 75575, "epoch": 624} {"train_loss": -36.73228073120117, "global_step": 75576, "epoch": 624} {"train_loss": -36.390281677246094, "global_step": 75577, "epoch": 624} {"train_loss": -36.940731048583984, "global_step": 75578, "epoch": 624} {"train_loss": -36.871063232421875, "global_step": 75579, "epoch": 624} {"train_loss": -36.722747802734375, "global_step": 75580, "epoch": 624} {"train_loss": -36.84880447387695, "global_step": 75581, "epoch": 624} {"train_loss": -37.14559555053711, "global_step": 75582, "epoch": 624} {"train_loss": -36.71540069580078, "global_step": 75583, "epoch": 624} {"train_loss": -37.554927825927734, "global_step": 75584, "epoch": 624} {"train_loss": -36.77008819580078, "global_step": 75585, "epoch": 624} {"train_loss": -35.99060821533203, "global_step": 75586, "epoch": 624} {"train_loss": -36.11772537231445, "global_step": 75587, "epoch": 624} {"train_loss": -36.477386474609375, "global_step": 75588, "epoch": 624} {"train_loss": -37.31273651123047, "global_step": 75589, "epoch": 624} {"train_loss": -37.199676513671875, "global_step": 75590, "epoch": 624} {"train_loss": -36.917572021484375, "global_step": 75591, "epoch": 624} {"train_loss": -36.8538703918457, "global_step": 75592, "epoch": 624} {"train_loss": -37.106346130371094, "global_step": 75593, "epoch": 624} {"train_loss": -36.999114990234375, "global_step": 75594, "epoch": 624} {"train_loss": -37.19082260131836, "global_step": 75595, "epoch": 624} {"train_loss": -37.387786865234375, "global_step": 75596, "epoch": 624} {"train_loss": -37.46638488769531, "global_step": 75597, "epoch": 624} {"train_loss": -36.97367858886719, "global_step": 75598, "epoch": 624} {"train_loss": -36.53547286987305, "global_step": 75599, "epoch": 624} {"train_loss": -37.42454147338867, "global_step": 75600, "epoch": 624} {"train_loss": -36.55214309692383, "global_step": 75601, "epoch": 624} {"train_loss": -37.83776092529297, "global_step": 75602, "epoch": 624} {"train_loss": -36.98495101928711, "global_step": 75603, "epoch": 624} {"train_loss": -37.11039352416992, "global_step": 75604, "epoch": 624} {"train_loss": -36.68941879272461, "global_step": 75605, "epoch": 624} {"train_loss": -37.044246673583984, "global_step": 75606, "epoch": 624} {"train_loss": -36.29429244995117, "global_step": 75607, "epoch": 624} {"train_loss": -37.470523834228516, "global_step": 75608, "epoch": 624} {"train_loss": -34.28407669067383, "global_step": 75609, "epoch": 624} {"train_loss": -36.95914840698242, "global_step": 75610, "epoch": 624} {"train_loss": -37.10163116455078, "global_step": 75611, "epoch": 624} {"train_loss": -36.86875534057617, "global_step": 75612, "epoch": 624} {"train_loss": -37.25727081298828, "global_step": 75613, "epoch": 624} {"train_loss": -36.38731002807617, "global_step": 75614, "epoch": 624} {"train_loss": -37.35612487792969, "global_step": 75615, "epoch": 624} {"train_loss": -36.84684371948242, "global_step": 75616, "epoch": 624} {"train_loss": -37.143917083740234, "global_step": 75617, "epoch": 624} {"train_loss": -36.07217025756836, "global_step": 75618, "epoch": 624} {"train_loss": -37.00088119506836, "global_step": 75619, "epoch": 624} {"train_loss": -37.2930908203125, "global_step": 75620, "epoch": 624} {"train_loss": -37.033905029296875, "global_step": 75621, "epoch": 624} {"train_loss": -37.648414611816406, "global_step": 75622, "epoch": 624} {"train_loss": -37.657039642333984, "global_step": 75623, "epoch": 624} {"train_loss": -36.11620589327221, "global_step": 75624, "epoch": 624, "val_loss": 2721547.25} {"train_loss": -37.82025909423828, "global_step": 75625, "epoch": 625} {"train_loss": -36.87651443481445, "global_step": 75626, "epoch": 625} {"train_loss": -37.193172454833984, "global_step": 75627, "epoch": 625} {"train_loss": -36.10210037231445, "global_step": 75628, "epoch": 625} {"train_loss": -35.128719329833984, "global_step": 75629, "epoch": 625} {"train_loss": -35.25619125366211, "global_step": 75630, "epoch": 625} {"train_loss": -35.683815002441406, "global_step": 75631, "epoch": 625} {"train_loss": -35.94121551513672, "global_step": 75632, "epoch": 625} {"train_loss": -36.58960723876953, "global_step": 75633, "epoch": 625} {"train_loss": -36.80561447143555, "global_step": 75634, "epoch": 625} {"train_loss": -36.449893951416016, "global_step": 75635, "epoch": 625} {"train_loss": -35.76152801513672, "global_step": 75636, "epoch": 625} {"train_loss": -36.83511734008789, "global_step": 75637, "epoch": 625} {"train_loss": -36.614990234375, "global_step": 75638, "epoch": 625} {"train_loss": -35.56936264038086, "global_step": 75639, "epoch": 625} {"train_loss": -35.29269027709961, "global_step": 75640, "epoch": 625} {"train_loss": -35.24477767944336, "global_step": 75641, "epoch": 625} {"train_loss": -35.56592559814453, "global_step": 75642, "epoch": 625} {"train_loss": -36.47432327270508, "global_step": 75643, "epoch": 625} {"train_loss": -35.43912887573242, "global_step": 75644, "epoch": 625} {"train_loss": -36.39456558227539, "global_step": 75645, "epoch": 625} {"train_loss": -36.34470748901367, "global_step": 75646, "epoch": 625} {"train_loss": -36.21743392944336, "global_step": 75647, "epoch": 625} {"train_loss": -37.081146240234375, "global_step": 75648, "epoch": 625} {"train_loss": -35.62897872924805, "global_step": 75649, "epoch": 625} {"train_loss": -36.74581527709961, "global_step": 75650, "epoch": 625} {"train_loss": -36.74055099487305, "global_step": 75651, "epoch": 625} {"train_loss": -35.26314926147461, "global_step": 75652, "epoch": 625} {"train_loss": -35.46873092651367, "global_step": 75653, "epoch": 625} {"train_loss": -35.979103088378906, "global_step": 75654, "epoch": 625} {"train_loss": -36.11216354370117, "global_step": 75655, "epoch": 625} {"train_loss": -36.53175735473633, "global_step": 75656, "epoch": 625} {"train_loss": -36.2889404296875, "global_step": 75657, "epoch": 625} {"train_loss": -36.83958053588867, "global_step": 75658, "epoch": 625} {"train_loss": -36.78493118286133, "global_step": 75659, "epoch": 625} {"train_loss": -36.741912841796875, "global_step": 75660, "epoch": 625} {"train_loss": -36.855628967285156, "global_step": 75661, "epoch": 625} {"train_loss": -35.862892150878906, "global_step": 75662, "epoch": 625} {"train_loss": -37.06650924682617, "global_step": 75663, "epoch": 625} {"train_loss": -36.67898178100586, "global_step": 75664, "epoch": 625} {"train_loss": -35.86689376831055, "global_step": 75665, "epoch": 625} {"train_loss": -35.951961517333984, "global_step": 75666, "epoch": 625} {"train_loss": -34.94596862792969, "global_step": 75667, "epoch": 625} {"train_loss": -35.9718017578125, "global_step": 75668, "epoch": 625} {"train_loss": -36.30739212036133, "global_step": 75669, "epoch": 625} {"train_loss": -37.3807487487793, "global_step": 75670, "epoch": 625} {"train_loss": -37.324928283691406, "global_step": 75671, "epoch": 625} {"train_loss": -36.233821868896484, "global_step": 75672, "epoch": 625} {"train_loss": -36.92326736450195, "global_step": 75673, "epoch": 625} {"train_loss": -37.05896759033203, "global_step": 75674, "epoch": 625} {"train_loss": -35.715423583984375, "global_step": 75675, "epoch": 625} {"train_loss": -37.489410400390625, "global_step": 75676, "epoch": 625} {"train_loss": -36.070674896240234, "global_step": 75677, "epoch": 625} {"train_loss": -35.483150482177734, "global_step": 75678, "epoch": 625} {"train_loss": -37.117916107177734, "global_step": 75679, "epoch": 625} {"train_loss": -35.931915283203125, "global_step": 75680, "epoch": 625} {"train_loss": -35.3695182800293, "global_step": 75681, "epoch": 625} {"train_loss": -35.095741271972656, "global_step": 75682, "epoch": 625} {"train_loss": -34.35425567626953, "global_step": 75683, "epoch": 625} {"train_loss": -36.01447296142578, "global_step": 75684, "epoch": 625} {"train_loss": -34.46998977661133, "global_step": 75685, "epoch": 625} {"train_loss": -34.91265106201172, "global_step": 75686, "epoch": 625} {"train_loss": -34.24045181274414, "global_step": 75687, "epoch": 625} {"train_loss": -34.67325973510742, "global_step": 75688, "epoch": 625} {"train_loss": -34.759117126464844, "global_step": 75689, "epoch": 625} {"train_loss": -36.11137008666992, "global_step": 75690, "epoch": 625} {"train_loss": -35.544960021972656, "global_step": 75691, "epoch": 625} {"train_loss": -35.75284957885742, "global_step": 75692, "epoch": 625} {"train_loss": -36.06612777709961, "global_step": 75693, "epoch": 625} {"train_loss": -33.69465255737305, "global_step": 75694, "epoch": 625} {"train_loss": -33.971920013427734, "global_step": 75695, "epoch": 625} {"train_loss": -35.3895378112793, "global_step": 75696, "epoch": 625} {"train_loss": -33.4879150390625, "global_step": 75697, "epoch": 625} {"train_loss": -33.93901443481445, "global_step": 75698, "epoch": 625} {"train_loss": -33.22568130493164, "global_step": 75699, "epoch": 625} {"train_loss": -35.954654693603516, "global_step": 75700, "epoch": 625} {"train_loss": -35.0697135925293, "global_step": 75701, "epoch": 625} {"train_loss": -35.1766242980957, "global_step": 75702, "epoch": 625} {"train_loss": -35.64044189453125, "global_step": 75703, "epoch": 625} {"train_loss": -35.590118408203125, "global_step": 75704, "epoch": 625} {"train_loss": -36.334896087646484, "global_step": 75705, "epoch": 625} {"train_loss": -35.55570983886719, "global_step": 75706, "epoch": 625} {"train_loss": -36.72756576538086, "global_step": 75707, "epoch": 625} {"train_loss": -36.00238800048828, "global_step": 75708, "epoch": 625} {"train_loss": -36.3884162902832, "global_step": 75709, "epoch": 625} {"train_loss": -36.262603759765625, "global_step": 75710, "epoch": 625} {"train_loss": -36.90569305419922, "global_step": 75711, "epoch": 625} {"train_loss": -35.663002014160156, "global_step": 75712, "epoch": 625} {"train_loss": -37.03890609741211, "global_step": 75713, "epoch": 625} {"train_loss": -36.47975540161133, "global_step": 75714, "epoch": 625} {"train_loss": -37.121620178222656, "global_step": 75715, "epoch": 625} {"train_loss": -36.60768127441406, "global_step": 75716, "epoch": 625} {"train_loss": -36.678218841552734, "global_step": 75717, "epoch": 625} {"train_loss": -37.38855743408203, "global_step": 75718, "epoch": 625} {"train_loss": -37.09735870361328, "global_step": 75719, "epoch": 625} {"train_loss": -37.231483459472656, "global_step": 75720, "epoch": 625} {"train_loss": -36.20893096923828, "global_step": 75721, "epoch": 625} {"train_loss": -36.75229263305664, "global_step": 75722, "epoch": 625} {"train_loss": -37.10176467895508, "global_step": 75723, "epoch": 625} {"train_loss": -36.605648040771484, "global_step": 75724, "epoch": 625} {"train_loss": -37.51940155029297, "global_step": 75725, "epoch": 625} {"train_loss": -36.91085433959961, "global_step": 75726, "epoch": 625} {"train_loss": -37.07243728637695, "global_step": 75727, "epoch": 625} {"train_loss": -37.01715087890625, "global_step": 75728, "epoch": 625} {"train_loss": -37.67011260986328, "global_step": 75729, "epoch": 625} {"train_loss": -37.18888473510742, "global_step": 75730, "epoch": 625} {"train_loss": -37.17030715942383, "global_step": 75731, "epoch": 625} {"train_loss": -37.252784729003906, "global_step": 75732, "epoch": 625} {"train_loss": -37.86562728881836, "global_step": 75733, "epoch": 625} {"train_loss": -37.315067291259766, "global_step": 75734, "epoch": 625} {"train_loss": -37.70967102050781, "global_step": 75735, "epoch": 625} {"train_loss": -37.65825653076172, "global_step": 75736, "epoch": 625} {"train_loss": -37.4772834777832, "global_step": 75737, "epoch": 625} {"train_loss": -37.8994026184082, "global_step": 75738, "epoch": 625} {"train_loss": -38.03376770019531, "global_step": 75739, "epoch": 625} {"train_loss": -37.640830993652344, "global_step": 75740, "epoch": 625} {"train_loss": -37.81135940551758, "global_step": 75741, "epoch": 625} {"train_loss": -38.06193923950195, "global_step": 75742, "epoch": 625} {"train_loss": -37.85313415527344, "global_step": 75743, "epoch": 625} {"train_loss": -37.694091796875, "global_step": 75744, "epoch": 625} {"train_loss": -36.2911681813642, "global_step": 75745, "epoch": 625, "val_loss": 2686130.0} {"train_loss": -37.69630813598633, "global_step": 75746, "epoch": 626} {"train_loss": -38.15023422241211, "global_step": 75747, "epoch": 626} {"train_loss": -38.111358642578125, "global_step": 75748, "epoch": 626} {"train_loss": -38.00107955932617, "global_step": 75749, "epoch": 626} {"train_loss": -38.27401351928711, "global_step": 75750, "epoch": 626} {"train_loss": -38.21439743041992, "global_step": 75751, "epoch": 626} {"train_loss": -38.08272933959961, "global_step": 75752, "epoch": 626} {"train_loss": -38.173282623291016, "global_step": 75753, "epoch": 626} {"train_loss": -38.0748291015625, "global_step": 75754, "epoch": 626} {"train_loss": -38.106468200683594, "global_step": 75755, "epoch": 626} {"train_loss": -38.067073822021484, "global_step": 75756, "epoch": 626} {"train_loss": -38.40032196044922, "global_step": 75757, "epoch": 626} {"train_loss": -38.17449951171875, "global_step": 75758, "epoch": 626} {"train_loss": -38.05979537963867, "global_step": 75759, "epoch": 626} {"train_loss": -37.94350051879883, "global_step": 75760, "epoch": 626} {"train_loss": -38.317832946777344, "global_step": 75761, "epoch": 626} {"train_loss": -37.45441818237305, "global_step": 75762, "epoch": 626} {"train_loss": -36.45284652709961, "global_step": 75763, "epoch": 626} {"train_loss": -33.90555953979492, "global_step": 75764, "epoch": 626} {"train_loss": -32.038002014160156, "global_step": 75765, "epoch": 626} {"train_loss": -31.100744247436523, "global_step": 75766, "epoch": 626} {"train_loss": -31.593332290649414, "global_step": 75767, "epoch": 626} {"train_loss": -33.103302001953125, "global_step": 75768, "epoch": 626} {"train_loss": -35.51210403442383, "global_step": 75769, "epoch": 626} {"train_loss": -35.8040771484375, "global_step": 75770, "epoch": 626} {"train_loss": -35.36244201660156, "global_step": 75771, "epoch": 626} {"train_loss": -35.57963943481445, "global_step": 75772, "epoch": 626} {"train_loss": -36.032562255859375, "global_step": 75773, "epoch": 626} {"train_loss": -34.547767639160156, "global_step": 75774, "epoch": 626} {"train_loss": -36.35921859741211, "global_step": 75775, "epoch": 626} {"train_loss": -34.42153549194336, "global_step": 75776, "epoch": 626} {"train_loss": -34.27944564819336, "global_step": 75777, "epoch": 626} {"train_loss": -35.787506103515625, "global_step": 75778, "epoch": 626} {"train_loss": -35.65095138549805, "global_step": 75779, "epoch": 626} {"train_loss": -35.533599853515625, "global_step": 75780, "epoch": 626} {"train_loss": -35.51826095581055, "global_step": 75781, "epoch": 626} {"train_loss": -35.829505920410156, "global_step": 75782, "epoch": 626} {"train_loss": -35.96607208251953, "global_step": 75783, "epoch": 626} {"train_loss": -36.793060302734375, "global_step": 75784, "epoch": 626} {"train_loss": -35.73745346069336, "global_step": 75785, "epoch": 626} {"train_loss": -35.447105407714844, "global_step": 75786, "epoch": 626} {"train_loss": -37.45484161376953, "global_step": 75787, "epoch": 626} {"train_loss": -33.09090805053711, "global_step": 75788, "epoch": 626} {"train_loss": -36.09832763671875, "global_step": 75789, "epoch": 626} {"train_loss": -34.310760498046875, "global_step": 75790, "epoch": 626} {"train_loss": -35.60508346557617, "global_step": 75791, "epoch": 626} {"train_loss": -35.80012130737305, "global_step": 75792, "epoch": 626} {"train_loss": -35.0897216796875, "global_step": 75793, "epoch": 626} {"train_loss": -36.40431594848633, "global_step": 75794, "epoch": 626} {"train_loss": -35.737056732177734, "global_step": 75795, "epoch": 626} {"train_loss": -35.59867477416992, "global_step": 75796, "epoch": 626} {"train_loss": -34.08518981933594, "global_step": 75797, "epoch": 626} {"train_loss": -35.98286819458008, "global_step": 75798, "epoch": 626} {"train_loss": -36.20577621459961, "global_step": 75799, "epoch": 626} {"train_loss": -35.87412643432617, "global_step": 75800, "epoch": 626} {"train_loss": -36.33161544799805, "global_step": 75801, "epoch": 626} {"train_loss": -35.6103515625, "global_step": 75802, "epoch": 626} {"train_loss": -35.9289665222168, "global_step": 75803, "epoch": 626} {"train_loss": -35.80503463745117, "global_step": 75804, "epoch": 626} {"train_loss": -35.1903190612793, "global_step": 75805, "epoch": 626} {"train_loss": -36.42258834838867, "global_step": 75806, "epoch": 626} {"train_loss": -36.3470344543457, "global_step": 75807, "epoch": 626} {"train_loss": -36.222660064697266, "global_step": 75808, "epoch": 626} {"train_loss": -35.46466827392578, "global_step": 75809, "epoch": 626} {"train_loss": -34.67848587036133, "global_step": 75810, "epoch": 626} {"train_loss": -36.025482177734375, "global_step": 75811, "epoch": 626} {"train_loss": -35.25753402709961, "global_step": 75812, "epoch": 626} {"train_loss": -36.70867919921875, "global_step": 75813, "epoch": 626} {"train_loss": -35.6840705871582, "global_step": 75814, "epoch": 626} {"train_loss": -35.955787658691406, "global_step": 75815, "epoch": 626} {"train_loss": -36.094478607177734, "global_step": 75816, "epoch": 626} {"train_loss": -35.97515106201172, "global_step": 75817, "epoch": 626} {"train_loss": -35.28565216064453, "global_step": 75818, "epoch": 626} {"train_loss": -36.5505256652832, "global_step": 75819, "epoch": 626} {"train_loss": -37.09220886230469, "global_step": 75820, "epoch": 626} {"train_loss": -35.28723907470703, "global_step": 75821, "epoch": 626} {"train_loss": -34.564125061035156, "global_step": 75822, "epoch": 626} {"train_loss": -35.64093017578125, "global_step": 75823, "epoch": 626} {"train_loss": -35.38633346557617, "global_step": 75824, "epoch": 626} {"train_loss": -35.60918045043945, "global_step": 75825, "epoch": 626} {"train_loss": -36.5587272644043, "global_step": 75826, "epoch": 626} {"train_loss": -36.883644104003906, "global_step": 75827, "epoch": 626} {"train_loss": -36.35740280151367, "global_step": 75828, "epoch": 626} {"train_loss": -36.89284896850586, "global_step": 75829, "epoch": 626} {"train_loss": -36.792640686035156, "global_step": 75830, "epoch": 626} {"train_loss": -36.70366668701172, "global_step": 75831, "epoch": 626} {"train_loss": -37.162235260009766, "global_step": 75832, "epoch": 626} {"train_loss": -37.014705657958984, "global_step": 75833, "epoch": 626} {"train_loss": -36.73611068725586, "global_step": 75834, "epoch": 626} {"train_loss": -37.20518112182617, "global_step": 75835, "epoch": 626} {"train_loss": -36.58539962768555, "global_step": 75836, "epoch": 626} {"train_loss": -36.86200714111328, "global_step": 75837, "epoch": 626} {"train_loss": -37.51314926147461, "global_step": 75838, "epoch": 626} {"train_loss": -36.674983978271484, "global_step": 75839, "epoch": 626} {"train_loss": -37.33928298950195, "global_step": 75840, "epoch": 626} {"train_loss": -36.88908767700195, "global_step": 75841, "epoch": 626} {"train_loss": -36.788387298583984, "global_step": 75842, "epoch": 626} {"train_loss": -37.25393295288086, "global_step": 75843, "epoch": 626} {"train_loss": -36.70820617675781, "global_step": 75844, "epoch": 626} {"train_loss": -34.84765625, "global_step": 75845, "epoch": 626} {"train_loss": -36.89777755737305, "global_step": 75846, "epoch": 626} {"train_loss": -37.13772964477539, "global_step": 75847, "epoch": 626} {"train_loss": -37.02626419067383, "global_step": 75848, "epoch": 626} {"train_loss": -35.63468551635742, "global_step": 75849, "epoch": 626} {"train_loss": -34.331817626953125, "global_step": 75850, "epoch": 626} {"train_loss": -36.435516357421875, "global_step": 75851, "epoch": 626} {"train_loss": -37.01286697387695, "global_step": 75852, "epoch": 626} {"train_loss": -37.18745803833008, "global_step": 75853, "epoch": 626} {"train_loss": -31.2778377532959, "global_step": 75854, "epoch": 626} {"train_loss": -36.36344528198242, "global_step": 75855, "epoch": 626} {"train_loss": -32.60427474975586, "global_step": 75856, "epoch": 626} {"train_loss": -30.5216007232666, "global_step": 75857, "epoch": 626} {"train_loss": -35.23884201049805, "global_step": 75858, "epoch": 626} {"train_loss": -36.520484924316406, "global_step": 75859, "epoch": 626} {"train_loss": -34.546695709228516, "global_step": 75860, "epoch": 626} {"train_loss": -33.661930084228516, "global_step": 75861, "epoch": 626} {"train_loss": -35.92106246948242, "global_step": 75862, "epoch": 626} {"train_loss": -36.1356315612793, "global_step": 75863, "epoch": 626} {"train_loss": -35.077247619628906, "global_step": 75864, "epoch": 626} {"train_loss": -36.46099853515625, "global_step": 75865, "epoch": 626} {"train_loss": -35.999595925827656, "global_step": 75866, "epoch": 626, "val_loss": 2469773.75} {"train_loss": -34.54905319213867, "global_step": 75867, "epoch": 627} {"train_loss": -36.10470199584961, "global_step": 75868, "epoch": 627} {"train_loss": -35.44309616088867, "global_step": 75869, "epoch": 627} {"train_loss": -35.54347610473633, "global_step": 75870, "epoch": 627} {"train_loss": -36.48318099975586, "global_step": 75871, "epoch": 627} {"train_loss": -34.32160568237305, "global_step": 75872, "epoch": 627} {"train_loss": -36.652740478515625, "global_step": 75873, "epoch": 627} {"train_loss": -35.98511505126953, "global_step": 75874, "epoch": 627} {"train_loss": -36.4002571105957, "global_step": 75875, "epoch": 627} {"train_loss": -36.090423583984375, "global_step": 75876, "epoch": 627} {"train_loss": -34.86261749267578, "global_step": 75877, "epoch": 627} {"train_loss": -35.97739791870117, "global_step": 75878, "epoch": 627} {"train_loss": -36.27687454223633, "global_step": 75879, "epoch": 627} {"train_loss": -35.579246520996094, "global_step": 75880, "epoch": 627} {"train_loss": -36.209835052490234, "global_step": 75881, "epoch": 627} {"train_loss": -36.25012969970703, "global_step": 75882, "epoch": 627} {"train_loss": -36.45662307739258, "global_step": 75883, "epoch": 627} {"train_loss": -34.7587776184082, "global_step": 75884, "epoch": 627} {"train_loss": -35.15339279174805, "global_step": 75885, "epoch": 627} {"train_loss": -35.841773986816406, "global_step": 75886, "epoch": 627} {"train_loss": -34.9766960144043, "global_step": 75887, "epoch": 627} {"train_loss": -34.4975700378418, "global_step": 75888, "epoch": 627} {"train_loss": -36.27144241333008, "global_step": 75889, "epoch": 627} {"train_loss": -35.5424690246582, "global_step": 75890, "epoch": 627} {"train_loss": -36.27727127075195, "global_step": 75891, "epoch": 627} {"train_loss": -36.801509857177734, "global_step": 75892, "epoch": 627} {"train_loss": -35.93206787109375, "global_step": 75893, "epoch": 627} {"train_loss": -35.944637298583984, "global_step": 75894, "epoch": 627} {"train_loss": -35.5162467956543, "global_step": 75895, "epoch": 627} {"train_loss": -36.600704193115234, "global_step": 75896, "epoch": 627} {"train_loss": -35.9520378112793, "global_step": 75897, "epoch": 627} {"train_loss": -36.088966369628906, "global_step": 75898, "epoch": 627} {"train_loss": -35.68455123901367, "global_step": 75899, "epoch": 627} {"train_loss": -36.969024658203125, "global_step": 75900, "epoch": 627} {"train_loss": -36.32560729980469, "global_step": 75901, "epoch": 627} {"train_loss": -36.1496467590332, "global_step": 75902, "epoch": 627} {"train_loss": -36.11081314086914, "global_step": 75903, "epoch": 627} {"train_loss": -37.04989242553711, "global_step": 75904, "epoch": 627} {"train_loss": -37.13175582885742, "global_step": 75905, "epoch": 627} {"train_loss": -36.20332717895508, "global_step": 75906, "epoch": 627} {"train_loss": -36.21259307861328, "global_step": 75907, "epoch": 627} {"train_loss": -36.147071838378906, "global_step": 75908, "epoch": 627} {"train_loss": -36.868438720703125, "global_step": 75909, "epoch": 627} {"train_loss": -36.634246826171875, "global_step": 75910, "epoch": 627} {"train_loss": -36.69251251220703, "global_step": 75911, "epoch": 627} {"train_loss": -36.59385299682617, "global_step": 75912, "epoch": 627} {"train_loss": -37.029598236083984, "global_step": 75913, "epoch": 627} {"train_loss": -37.3851318359375, "global_step": 75914, "epoch": 627} {"train_loss": -36.83906173706055, "global_step": 75915, "epoch": 627} {"train_loss": -36.997249603271484, "global_step": 75916, "epoch": 627} {"train_loss": -36.70161437988281, "global_step": 75917, "epoch": 627} {"train_loss": -37.24578857421875, "global_step": 75918, "epoch": 627} {"train_loss": -37.16413497924805, "global_step": 75919, "epoch": 627} {"train_loss": -37.05709457397461, "global_step": 75920, "epoch": 627} {"train_loss": -36.91682815551758, "global_step": 75921, "epoch": 627} {"train_loss": -36.8552360534668, "global_step": 75922, "epoch": 627} {"train_loss": -36.6055793762207, "global_step": 75923, "epoch": 627} {"train_loss": -37.06981658935547, "global_step": 75924, "epoch": 627} {"train_loss": -37.3886833190918, "global_step": 75925, "epoch": 627} {"train_loss": -36.581966400146484, "global_step": 75926, "epoch": 627} {"train_loss": -36.895381927490234, "global_step": 75927, "epoch": 627} {"train_loss": -36.51786422729492, "global_step": 75928, "epoch": 627} {"train_loss": -35.70130920410156, "global_step": 75929, "epoch": 627} {"train_loss": -35.74833297729492, "global_step": 75930, "epoch": 627} {"train_loss": -36.07891845703125, "global_step": 75931, "epoch": 627} {"train_loss": -36.917171478271484, "global_step": 75932, "epoch": 627} {"train_loss": -36.37545394897461, "global_step": 75933, "epoch": 627} {"train_loss": -37.576820373535156, "global_step": 75934, "epoch": 627} {"train_loss": -36.905494689941406, "global_step": 75935, "epoch": 627} {"train_loss": -36.2546272277832, "global_step": 75936, "epoch": 627} {"train_loss": -34.47450637817383, "global_step": 75937, "epoch": 627} {"train_loss": -35.579627990722656, "global_step": 75938, "epoch": 627} {"train_loss": -37.012718200683594, "global_step": 75939, "epoch": 627} {"train_loss": -37.47274398803711, "global_step": 75940, "epoch": 627} {"train_loss": -35.17523193359375, "global_step": 75941, "epoch": 627} {"train_loss": -35.44338607788086, "global_step": 75942, "epoch": 627} {"train_loss": -36.657222747802734, "global_step": 75943, "epoch": 627} {"train_loss": -37.45200729370117, "global_step": 75944, "epoch": 627} {"train_loss": -35.96468734741211, "global_step": 75945, "epoch": 627} {"train_loss": -34.352535247802734, "global_step": 75946, "epoch": 627} {"train_loss": -37.30862808227539, "global_step": 75947, "epoch": 627} {"train_loss": -35.74430465698242, "global_step": 75948, "epoch": 627} {"train_loss": -35.380592346191406, "global_step": 75949, "epoch": 627} {"train_loss": -36.36157989501953, "global_step": 75950, "epoch": 627} {"train_loss": -36.10900115966797, "global_step": 75951, "epoch": 627} {"train_loss": -34.72578048706055, "global_step": 75952, "epoch": 627} {"train_loss": -37.89543533325195, "global_step": 75953, "epoch": 627} {"train_loss": -36.91188430786133, "global_step": 75954, "epoch": 627} {"train_loss": -36.862789154052734, "global_step": 75955, "epoch": 627} {"train_loss": -37.124046325683594, "global_step": 75956, "epoch": 627} {"train_loss": -35.6256217956543, "global_step": 75957, "epoch": 627} {"train_loss": -36.8927001953125, "global_step": 75958, "epoch": 627} {"train_loss": -37.38888168334961, "global_step": 75959, "epoch": 627} {"train_loss": -35.51654815673828, "global_step": 75960, "epoch": 627} {"train_loss": -36.80910110473633, "global_step": 75961, "epoch": 627} {"train_loss": -36.851497650146484, "global_step": 75962, "epoch": 627} {"train_loss": -37.83027267456055, "global_step": 75963, "epoch": 627} {"train_loss": -35.96745681762695, "global_step": 75964, "epoch": 627} {"train_loss": -34.57747268676758, "global_step": 75965, "epoch": 627} {"train_loss": -34.777503967285156, "global_step": 75966, "epoch": 627} {"train_loss": -36.577754974365234, "global_step": 75967, "epoch": 627} {"train_loss": -37.06599044799805, "global_step": 75968, "epoch": 627} {"train_loss": -35.21229934692383, "global_step": 75969, "epoch": 627} {"train_loss": -34.37986373901367, "global_step": 75970, "epoch": 627} {"train_loss": -35.00389862060547, "global_step": 75971, "epoch": 627} {"train_loss": -37.19865798950195, "global_step": 75972, "epoch": 627} {"train_loss": -36.991172790527344, "global_step": 75973, "epoch": 627} {"train_loss": -36.2522087097168, "global_step": 75974, "epoch": 627} {"train_loss": -37.334598541259766, "global_step": 75975, "epoch": 627} {"train_loss": -36.34174346923828, "global_step": 75976, "epoch": 627} {"train_loss": -36.70943832397461, "global_step": 75977, "epoch": 627} {"train_loss": -36.83353805541992, "global_step": 75978, "epoch": 627} {"train_loss": -35.874732971191406, "global_step": 75979, "epoch": 627} {"train_loss": -35.709285736083984, "global_step": 75980, "epoch": 627} {"train_loss": -35.99939727783203, "global_step": 75981, "epoch": 627} {"train_loss": -35.93465805053711, "global_step": 75982, "epoch": 627} {"train_loss": -36.126956939697266, "global_step": 75983, "epoch": 627} {"train_loss": -35.72367477416992, "global_step": 75984, "epoch": 627} {"train_loss": -36.53285598754883, "global_step": 75985, "epoch": 627} {"train_loss": -34.98922348022461, "global_step": 75986, "epoch": 627} {"train_loss": -36.21121228430882, "global_step": 75987, "epoch": 627, "val_loss": 2586666.75} {"train_loss": -34.24718475341797, "global_step": 75988, "epoch": 628} {"train_loss": -34.804988861083984, "global_step": 75989, "epoch": 628} {"train_loss": -34.41850280761719, "global_step": 75990, "epoch": 628} {"train_loss": -34.05619430541992, "global_step": 75991, "epoch": 628} {"train_loss": -35.30949020385742, "global_step": 75992, "epoch": 628} {"train_loss": -32.471920013427734, "global_step": 75993, "epoch": 628} {"train_loss": -36.13734817504883, "global_step": 75994, "epoch": 628} {"train_loss": -36.19745635986328, "global_step": 75995, "epoch": 628} {"train_loss": -35.665283203125, "global_step": 75996, "epoch": 628} {"train_loss": -35.73680114746094, "global_step": 75997, "epoch": 628} {"train_loss": -36.31731033325195, "global_step": 75998, "epoch": 628} {"train_loss": -31.20049476623535, "global_step": 75999, "epoch": 628} {"train_loss": -36.511470794677734, "global_step": 76000, "epoch": 628} {"train_loss": -33.725643157958984, "global_step": 76001, "epoch": 628} {"train_loss": -30.839588165283203, "global_step": 76002, "epoch": 628} {"train_loss": -33.97878646850586, "global_step": 76003, "epoch": 628} {"train_loss": -33.21810531616211, "global_step": 76004, "epoch": 628} {"train_loss": -34.57345199584961, "global_step": 76005, "epoch": 628} {"train_loss": -34.64692306518555, "global_step": 76006, "epoch": 628} {"train_loss": -35.10485076904297, "global_step": 76007, "epoch": 628} {"train_loss": -33.84540557861328, "global_step": 76008, "epoch": 628} {"train_loss": -35.21620559692383, "global_step": 76009, "epoch": 628} {"train_loss": -34.743385314941406, "global_step": 76010, "epoch": 628} {"train_loss": -35.1613883972168, "global_step": 76011, "epoch": 628} {"train_loss": -35.023353576660156, "global_step": 76012, "epoch": 628} {"train_loss": -33.531158447265625, "global_step": 76013, "epoch": 628} {"train_loss": -35.870460510253906, "global_step": 76014, "epoch": 628} {"train_loss": -34.8603401184082, "global_step": 76015, "epoch": 628} {"train_loss": -33.21700668334961, "global_step": 76016, "epoch": 628} {"train_loss": -35.175533294677734, "global_step": 76017, "epoch": 628} {"train_loss": -35.68976974487305, "global_step": 76018, "epoch": 628} {"train_loss": -36.45911407470703, "global_step": 76019, "epoch": 628} {"train_loss": -36.21561813354492, "global_step": 76020, "epoch": 628} {"train_loss": -35.19304275512695, "global_step": 76021, "epoch": 628} {"train_loss": -36.37199401855469, "global_step": 76022, "epoch": 628} {"train_loss": -35.41984558105469, "global_step": 76023, "epoch": 628} {"train_loss": -35.699710845947266, "global_step": 76024, "epoch": 628} {"train_loss": -36.192649841308594, "global_step": 76025, "epoch": 628} {"train_loss": -36.095863342285156, "global_step": 76026, "epoch": 628} {"train_loss": -36.25537109375, "global_step": 76027, "epoch": 628} {"train_loss": -36.65485382080078, "global_step": 76028, "epoch": 628} {"train_loss": -35.56056594848633, "global_step": 76029, "epoch": 628} {"train_loss": -36.642677307128906, "global_step": 76030, "epoch": 628} {"train_loss": -36.032962799072266, "global_step": 76031, "epoch": 628} {"train_loss": -35.79102325439453, "global_step": 76032, "epoch": 628} {"train_loss": -36.6187629699707, "global_step": 76033, "epoch": 628} {"train_loss": -36.78480529785156, "global_step": 76034, "epoch": 628} {"train_loss": -35.73368835449219, "global_step": 76035, "epoch": 628} {"train_loss": -35.29096221923828, "global_step": 76036, "epoch": 628} {"train_loss": -36.72932434082031, "global_step": 76037, "epoch": 628} {"train_loss": -36.70028305053711, "global_step": 76038, "epoch": 628} {"train_loss": -36.964454650878906, "global_step": 76039, "epoch": 628} {"train_loss": -36.525306701660156, "global_step": 76040, "epoch": 628} {"train_loss": -36.19390869140625, "global_step": 76041, "epoch": 628} {"train_loss": -35.33429718017578, "global_step": 76042, "epoch": 628} {"train_loss": -37.05898666381836, "global_step": 76043, "epoch": 628} {"train_loss": -37.18376159667969, "global_step": 76044, "epoch": 628} {"train_loss": -36.06817626953125, "global_step": 76045, "epoch": 628} {"train_loss": -36.93963623046875, "global_step": 76046, "epoch": 628} {"train_loss": -36.50254440307617, "global_step": 76047, "epoch": 628} {"train_loss": -36.84458923339844, "global_step": 76048, "epoch": 628} {"train_loss": -36.576499938964844, "global_step": 76049, "epoch": 628} {"train_loss": -36.46484375, "global_step": 76050, "epoch": 628} {"train_loss": -35.6315803527832, "global_step": 76051, "epoch": 628} {"train_loss": -36.84747314453125, "global_step": 76052, "epoch": 628} {"train_loss": -35.32154083251953, "global_step": 76053, "epoch": 628} {"train_loss": -36.749244689941406, "global_step": 76054, "epoch": 628} {"train_loss": -36.48200225830078, "global_step": 76055, "epoch": 628} {"train_loss": -36.7224006652832, "global_step": 76056, "epoch": 628} {"train_loss": -36.35576248168945, "global_step": 76057, "epoch": 628} {"train_loss": -36.52061080932617, "global_step": 76058, "epoch": 628} {"train_loss": -36.551631927490234, "global_step": 76059, "epoch": 628} {"train_loss": -35.780982971191406, "global_step": 76060, "epoch": 628} {"train_loss": -35.64834976196289, "global_step": 76061, "epoch": 628} {"train_loss": -34.69736099243164, "global_step": 76062, "epoch": 628} {"train_loss": -34.3123893737793, "global_step": 76063, "epoch": 628} {"train_loss": -32.34182357788086, "global_step": 76064, "epoch": 628} {"train_loss": -27.159015655517578, "global_step": 76065, "epoch": 628} {"train_loss": -25.384098052978516, "global_step": 76066, "epoch": 628} {"train_loss": -32.979705810546875, "global_step": 76067, "epoch": 628} {"train_loss": -36.0311279296875, "global_step": 76068, "epoch": 628} {"train_loss": -29.579023361206055, "global_step": 76069, "epoch": 628} {"train_loss": -36.2617301940918, "global_step": 76070, "epoch": 628} {"train_loss": -31.882925033569336, "global_step": 76071, "epoch": 628} {"train_loss": -32.68825912475586, "global_step": 76072, "epoch": 628} {"train_loss": -35.39533615112305, "global_step": 76073, "epoch": 628} {"train_loss": -33.18246078491211, "global_step": 76074, "epoch": 628} {"train_loss": -36.63582992553711, "global_step": 76075, "epoch": 628} {"train_loss": -34.162288665771484, "global_step": 76076, "epoch": 628} {"train_loss": -36.455299377441406, "global_step": 76077, "epoch": 628} {"train_loss": -35.395355224609375, "global_step": 76078, "epoch": 628} {"train_loss": -36.390235900878906, "global_step": 76079, "epoch": 628} {"train_loss": -34.77042770385742, "global_step": 76080, "epoch": 628} {"train_loss": -36.73955535888672, "global_step": 76081, "epoch": 628} {"train_loss": -36.18368148803711, "global_step": 76082, "epoch": 628} {"train_loss": -35.757423400878906, "global_step": 76083, "epoch": 628} {"train_loss": -36.20602035522461, "global_step": 76084, "epoch": 628} {"train_loss": -36.68703079223633, "global_step": 76085, "epoch": 628} {"train_loss": -36.90267562866211, "global_step": 76086, "epoch": 628} {"train_loss": -36.75698471069336, "global_step": 76087, "epoch": 628} {"train_loss": -36.763484954833984, "global_step": 76088, "epoch": 628} {"train_loss": -36.904052734375, "global_step": 76089, "epoch": 628} {"train_loss": -36.632205963134766, "global_step": 76090, "epoch": 628} {"train_loss": -36.87688446044922, "global_step": 76091, "epoch": 628} {"train_loss": -36.8211784362793, "global_step": 76092, "epoch": 628} {"train_loss": -37.10209274291992, "global_step": 76093, "epoch": 628} {"train_loss": -37.36243438720703, "global_step": 76094, "epoch": 628} {"train_loss": -37.3253288269043, "global_step": 76095, "epoch": 628} {"train_loss": -37.32877731323242, "global_step": 76096, "epoch": 628} {"train_loss": -37.28902816772461, "global_step": 76097, "epoch": 628} {"train_loss": -37.612667083740234, "global_step": 76098, "epoch": 628} {"train_loss": -37.013328552246094, "global_step": 76099, "epoch": 628} {"train_loss": -37.17863845825195, "global_step": 76100, "epoch": 628} {"train_loss": -37.51483917236328, "global_step": 76101, "epoch": 628} {"train_loss": -36.9779052734375, "global_step": 76102, "epoch": 628} {"train_loss": -37.728485107421875, "global_step": 76103, "epoch": 628} {"train_loss": -37.03733444213867, "global_step": 76104, "epoch": 628} {"train_loss": -37.03645706176758, "global_step": 76105, "epoch": 628} {"train_loss": -36.72358322143555, "global_step": 76106, "epoch": 628} {"train_loss": -37.6328239440918, "global_step": 76107, "epoch": 628} {"train_loss": -35.55941565962863, "global_step": 76108, "epoch": 628, "val_loss": 2601884.0} {"train_loss": -37.15061569213867, "global_step": 76109, "epoch": 629} {"train_loss": -37.21648025512695, "global_step": 76110, "epoch": 629} {"train_loss": -37.14754104614258, "global_step": 76111, "epoch": 629} {"train_loss": -36.95452117919922, "global_step": 76112, "epoch": 629} {"train_loss": -36.192440032958984, "global_step": 76113, "epoch": 629} {"train_loss": -35.3032341003418, "global_step": 76114, "epoch": 629} {"train_loss": -34.84141159057617, "global_step": 76115, "epoch": 629} {"train_loss": -34.866939544677734, "global_step": 76116, "epoch": 629} {"train_loss": -36.735595703125, "global_step": 76117, "epoch": 629} {"train_loss": -36.3524055480957, "global_step": 76118, "epoch": 629} {"train_loss": -37.28504180908203, "global_step": 76119, "epoch": 629} {"train_loss": -36.46513748168945, "global_step": 76120, "epoch": 629} {"train_loss": -37.1959342956543, "global_step": 76121, "epoch": 629} {"train_loss": -37.234371185302734, "global_step": 76122, "epoch": 629} {"train_loss": -35.03137969970703, "global_step": 76123, "epoch": 629} {"train_loss": -36.92145538330078, "global_step": 76124, "epoch": 629} {"train_loss": -36.13102722167969, "global_step": 76125, "epoch": 629} {"train_loss": -37.02984619140625, "global_step": 76126, "epoch": 629} {"train_loss": -36.43014144897461, "global_step": 76127, "epoch": 629} {"train_loss": -36.31752395629883, "global_step": 76128, "epoch": 629} {"train_loss": -36.80795669555664, "global_step": 76129, "epoch": 629} {"train_loss": -36.776004791259766, "global_step": 76130, "epoch": 629} {"train_loss": -36.19794845581055, "global_step": 76131, "epoch": 629} {"train_loss": -37.544612884521484, "global_step": 76132, "epoch": 629} {"train_loss": -36.856929779052734, "global_step": 76133, "epoch": 629} {"train_loss": -37.53736114501953, "global_step": 76134, "epoch": 629} {"train_loss": -37.107887268066406, "global_step": 76135, "epoch": 629} {"train_loss": -36.76984786987305, "global_step": 76136, "epoch": 629} {"train_loss": -36.867427825927734, "global_step": 76137, "epoch": 629} {"train_loss": -37.079010009765625, "global_step": 76138, "epoch": 629} {"train_loss": -37.02408981323242, "global_step": 76139, "epoch": 629} {"train_loss": -36.70094299316406, "global_step": 76140, "epoch": 629} {"train_loss": -36.789588928222656, "global_step": 76141, "epoch": 629} {"train_loss": -36.194271087646484, "global_step": 76142, "epoch": 629} {"train_loss": -36.25415802001953, "global_step": 76143, "epoch": 629} {"train_loss": -36.85236358642578, "global_step": 76144, "epoch": 629} {"train_loss": -36.99577713012695, "global_step": 76145, "epoch": 629} {"train_loss": -37.11724853515625, "global_step": 76146, "epoch": 629} {"train_loss": -35.808773040771484, "global_step": 76147, "epoch": 629} {"train_loss": -36.651729583740234, "global_step": 76148, "epoch": 629} {"train_loss": -36.243350982666016, "global_step": 76149, "epoch": 629} {"train_loss": -36.817378997802734, "global_step": 76150, "epoch": 629} {"train_loss": -36.937477111816406, "global_step": 76151, "epoch": 629} {"train_loss": -37.333248138427734, "global_step": 76152, "epoch": 629} {"train_loss": -36.361358642578125, "global_step": 76153, "epoch": 629} {"train_loss": -36.599517822265625, "global_step": 76154, "epoch": 629} {"train_loss": -37.39999771118164, "global_step": 76155, "epoch": 629} {"train_loss": -36.49528121948242, "global_step": 76156, "epoch": 629} {"train_loss": -36.29323959350586, "global_step": 76157, "epoch": 629} {"train_loss": -35.917144775390625, "global_step": 76158, "epoch": 629} {"train_loss": -36.56257629394531, "global_step": 76159, "epoch": 629} {"train_loss": -37.38047409057617, "global_step": 76160, "epoch": 629} {"train_loss": -36.717159271240234, "global_step": 76161, "epoch": 629} {"train_loss": -36.50383377075195, "global_step": 76162, "epoch": 629} {"train_loss": -35.63935470581055, "global_step": 76163, "epoch": 629} {"train_loss": -35.64750289916992, "global_step": 76164, "epoch": 629} {"train_loss": -37.023170471191406, "global_step": 76165, "epoch": 629} {"train_loss": -35.47251510620117, "global_step": 76166, "epoch": 629} {"train_loss": -37.583595275878906, "global_step": 76167, "epoch": 629} {"train_loss": -36.8305778503418, "global_step": 76168, "epoch": 629} {"train_loss": -36.54629898071289, "global_step": 76169, "epoch": 629} {"train_loss": -37.093414306640625, "global_step": 76170, "epoch": 629} {"train_loss": -36.95380783081055, "global_step": 76171, "epoch": 629} {"train_loss": -36.942054748535156, "global_step": 76172, "epoch": 629} {"train_loss": -37.127044677734375, "global_step": 76173, "epoch": 629} {"train_loss": -37.57381057739258, "global_step": 76174, "epoch": 629} {"train_loss": -37.639076232910156, "global_step": 76175, "epoch": 629} {"train_loss": -37.516178131103516, "global_step": 76176, "epoch": 629} {"train_loss": -37.206886291503906, "global_step": 76177, "epoch": 629} {"train_loss": -37.85736083984375, "global_step": 76178, "epoch": 629} {"train_loss": -36.737060546875, "global_step": 76179, "epoch": 629} {"train_loss": -37.760040283203125, "global_step": 76180, "epoch": 629} {"train_loss": -36.986934661865234, "global_step": 76181, "epoch": 629} {"train_loss": -35.81541442871094, "global_step": 76182, "epoch": 629} {"train_loss": -36.081241607666016, "global_step": 76183, "epoch": 629} {"train_loss": -35.18642044067383, "global_step": 76184, "epoch": 629} {"train_loss": -37.2016716003418, "global_step": 76185, "epoch": 629} {"train_loss": -37.4121208190918, "global_step": 76186, "epoch": 629} {"train_loss": -37.3661994934082, "global_step": 76187, "epoch": 629} {"train_loss": -37.24174118041992, "global_step": 76188, "epoch": 629} {"train_loss": -36.70065689086914, "global_step": 76189, "epoch": 629} {"train_loss": -37.1019287109375, "global_step": 76190, "epoch": 629} {"train_loss": -37.610958099365234, "global_step": 76191, "epoch": 629} {"train_loss": -36.60633087158203, "global_step": 76192, "epoch": 629} {"train_loss": -36.860965728759766, "global_step": 76193, "epoch": 629} {"train_loss": -36.52420425415039, "global_step": 76194, "epoch": 629} {"train_loss": -36.45545196533203, "global_step": 76195, "epoch": 629} {"train_loss": -37.201690673828125, "global_step": 76196, "epoch": 629} {"train_loss": -37.610145568847656, "global_step": 76197, "epoch": 629} {"train_loss": -37.121795654296875, "global_step": 76198, "epoch": 629} {"train_loss": -37.52894592285156, "global_step": 76199, "epoch": 629} {"train_loss": -36.8978385925293, "global_step": 76200, "epoch": 629} {"train_loss": -37.45011520385742, "global_step": 76201, "epoch": 629} {"train_loss": -37.7385139465332, "global_step": 76202, "epoch": 629} {"train_loss": -37.687255859375, "global_step": 76203, "epoch": 629} {"train_loss": -37.07209014892578, "global_step": 76204, "epoch": 629} {"train_loss": -38.09248733520508, "global_step": 76205, "epoch": 629} {"train_loss": -37.46260070800781, "global_step": 76206, "epoch": 629} {"train_loss": -37.203460693359375, "global_step": 76207, "epoch": 629} {"train_loss": -37.43571853637695, "global_step": 76208, "epoch": 629} {"train_loss": -38.0638542175293, "global_step": 76209, "epoch": 629} {"train_loss": -37.30836868286133, "global_step": 76210, "epoch": 629} {"train_loss": -37.02479934692383, "global_step": 76211, "epoch": 629} {"train_loss": -37.99976348876953, "global_step": 76212, "epoch": 629} {"train_loss": -34.61219787597656, "global_step": 76213, "epoch": 629} {"train_loss": -38.0177116394043, "global_step": 76214, "epoch": 629} {"train_loss": -37.3493766784668, "global_step": 76215, "epoch": 629} {"train_loss": -37.369537353515625, "global_step": 76216, "epoch": 629} {"train_loss": -38.338436126708984, "global_step": 76217, "epoch": 629} {"train_loss": -36.98458480834961, "global_step": 76218, "epoch": 629} {"train_loss": -36.78989791870117, "global_step": 76219, "epoch": 629} {"train_loss": -37.784732818603516, "global_step": 76220, "epoch": 629} {"train_loss": -36.573280334472656, "global_step": 76221, "epoch": 629} {"train_loss": -37.748538970947266, "global_step": 76222, "epoch": 629} {"train_loss": -38.10199737548828, "global_step": 76223, "epoch": 629} {"train_loss": -34.98902893066406, "global_step": 76224, "epoch": 629} {"train_loss": -36.80376052856445, "global_step": 76225, "epoch": 629} {"train_loss": -36.78928756713867, "global_step": 76226, "epoch": 629} {"train_loss": -35.23222732543945, "global_step": 76227, "epoch": 629} {"train_loss": -36.590023040771484, "global_step": 76228, "epoch": 629} {"train_loss": -36.852113676465244, "global_step": 76229, "epoch": 629, "val_loss": 2714026.25} {"train_loss": -37.55910873413086, "global_step": 76230, "epoch": 630} {"train_loss": -35.60837936401367, "global_step": 76231, "epoch": 630} {"train_loss": -35.814186096191406, "global_step": 76232, "epoch": 630} {"train_loss": -35.22105026245117, "global_step": 76233, "epoch": 630} {"train_loss": -35.811622619628906, "global_step": 76234, "epoch": 630} {"train_loss": -36.87495040893555, "global_step": 76235, "epoch": 630} {"train_loss": -37.10834884643555, "global_step": 76236, "epoch": 630} {"train_loss": -36.83077621459961, "global_step": 76237, "epoch": 630} {"train_loss": -37.76174545288086, "global_step": 76238, "epoch": 630} {"train_loss": -35.391395568847656, "global_step": 76239, "epoch": 630} {"train_loss": -35.55357360839844, "global_step": 76240, "epoch": 630} {"train_loss": -34.8723258972168, "global_step": 76241, "epoch": 630} {"train_loss": -35.817787170410156, "global_step": 76242, "epoch": 630} {"train_loss": -38.3187255859375, "global_step": 76243, "epoch": 630} {"train_loss": -36.27033615112305, "global_step": 76244, "epoch": 630} {"train_loss": -36.873592376708984, "global_step": 76245, "epoch": 630} {"train_loss": -36.29502487182617, "global_step": 76246, "epoch": 630} {"train_loss": -36.125362396240234, "global_step": 76247, "epoch": 630} {"train_loss": -36.73666000366211, "global_step": 76248, "epoch": 630} {"train_loss": -35.02129364013672, "global_step": 76249, "epoch": 630} {"train_loss": -34.57670211791992, "global_step": 76250, "epoch": 630} {"train_loss": -35.38223648071289, "global_step": 76251, "epoch": 630} {"train_loss": -33.326942443847656, "global_step": 76252, "epoch": 630} {"train_loss": -34.689918518066406, "global_step": 76253, "epoch": 630} {"train_loss": -35.66193389892578, "global_step": 76254, "epoch": 630} {"train_loss": -36.72774124145508, "global_step": 76255, "epoch": 630} {"train_loss": -34.713871002197266, "global_step": 76256, "epoch": 630} {"train_loss": -36.88802719116211, "global_step": 76257, "epoch": 630} {"train_loss": -36.2060432434082, "global_step": 76258, "epoch": 630} {"train_loss": -36.64072036743164, "global_step": 76259, "epoch": 630} {"train_loss": -36.53043746948242, "global_step": 76260, "epoch": 630} {"train_loss": -36.28588104248047, "global_step": 76261, "epoch": 630} {"train_loss": -35.96670150756836, "global_step": 76262, "epoch": 630} {"train_loss": -37.130855560302734, "global_step": 76263, "epoch": 630} {"train_loss": -37.059547424316406, "global_step": 76264, "epoch": 630} {"train_loss": -37.27621841430664, "global_step": 76265, "epoch": 630} {"train_loss": -36.84109115600586, "global_step": 76266, "epoch": 630} {"train_loss": -37.052181243896484, "global_step": 76267, "epoch": 630} {"train_loss": -37.56140899658203, "global_step": 76268, "epoch": 630} {"train_loss": -37.1019287109375, "global_step": 76269, "epoch": 630} {"train_loss": -37.1623649597168, "global_step": 76270, "epoch": 630} {"train_loss": -37.45601272583008, "global_step": 76271, "epoch": 630} {"train_loss": -37.12596130371094, "global_step": 76272, "epoch": 630} {"train_loss": -37.5020751953125, "global_step": 76273, "epoch": 630} {"train_loss": -37.71824645996094, "global_step": 76274, "epoch": 630} {"train_loss": -37.67509078979492, "global_step": 76275, "epoch": 630} {"train_loss": -36.50777053833008, "global_step": 76276, "epoch": 630} {"train_loss": -37.70206069946289, "global_step": 76277, "epoch": 630} {"train_loss": -37.87126922607422, "global_step": 76278, "epoch": 630} {"train_loss": -37.624000549316406, "global_step": 76279, "epoch": 630} {"train_loss": -37.01774978637695, "global_step": 76280, "epoch": 630} {"train_loss": -37.86305618286133, "global_step": 76281, "epoch": 630} {"train_loss": -37.35763168334961, "global_step": 76282, "epoch": 630} {"train_loss": -37.42682647705078, "global_step": 76283, "epoch": 630} {"train_loss": -37.818111419677734, "global_step": 76284, "epoch": 630} {"train_loss": -37.64430618286133, "global_step": 76285, "epoch": 630} {"train_loss": -36.03168869018555, "global_step": 76286, "epoch": 630} {"train_loss": -36.25301742553711, "global_step": 76287, "epoch": 630} {"train_loss": -37.517696380615234, "global_step": 76288, "epoch": 630} {"train_loss": -37.73575973510742, "global_step": 76289, "epoch": 630} {"train_loss": -37.68556594848633, "global_step": 76290, "epoch": 630} {"train_loss": -37.10482406616211, "global_step": 76291, "epoch": 630} {"train_loss": -37.641963958740234, "global_step": 76292, "epoch": 630} {"train_loss": -37.967552185058594, "global_step": 76293, "epoch": 630} {"train_loss": -38.21201705932617, "global_step": 76294, "epoch": 630} {"train_loss": -36.9332389831543, "global_step": 76295, "epoch": 630} {"train_loss": -37.08534240722656, "global_step": 76296, "epoch": 630} {"train_loss": -37.98110580444336, "global_step": 76297, "epoch": 630} {"train_loss": -37.088008880615234, "global_step": 76298, "epoch": 630} {"train_loss": -35.696693420410156, "global_step": 76299, "epoch": 630} {"train_loss": -37.0263786315918, "global_step": 76300, "epoch": 630} {"train_loss": -37.76279067993164, "global_step": 76301, "epoch": 630} {"train_loss": -36.786155700683594, "global_step": 76302, "epoch": 630} {"train_loss": -36.53562545776367, "global_step": 76303, "epoch": 630} {"train_loss": -36.894989013671875, "global_step": 76304, "epoch": 630} {"train_loss": -37.59906005859375, "global_step": 76305, "epoch": 630} {"train_loss": -36.29261779785156, "global_step": 76306, "epoch": 630} {"train_loss": -36.17823028564453, "global_step": 76307, "epoch": 630} {"train_loss": -36.680599212646484, "global_step": 76308, "epoch": 630} {"train_loss": -36.93374252319336, "global_step": 76309, "epoch": 630} {"train_loss": -31.928476333618164, "global_step": 76310, "epoch": 630} {"train_loss": -37.81706619262695, "global_step": 76311, "epoch": 630} {"train_loss": -35.93904495239258, "global_step": 76312, "epoch": 630} {"train_loss": -36.794246673583984, "global_step": 76313, "epoch": 630} {"train_loss": -37.474159240722656, "global_step": 76314, "epoch": 630} {"train_loss": -36.67827224731445, "global_step": 76315, "epoch": 630} {"train_loss": -36.84944534301758, "global_step": 76316, "epoch": 630} {"train_loss": -37.303653717041016, "global_step": 76317, "epoch": 630} {"train_loss": -36.60014724731445, "global_step": 76318, "epoch": 630} {"train_loss": -36.47275924682617, "global_step": 76319, "epoch": 630} {"train_loss": -35.1507682800293, "global_step": 76320, "epoch": 630} {"train_loss": -36.70709991455078, "global_step": 76321, "epoch": 630} {"train_loss": -36.76069641113281, "global_step": 76322, "epoch": 630} {"train_loss": -36.61077880859375, "global_step": 76323, "epoch": 630} {"train_loss": -35.8875732421875, "global_step": 76324, "epoch": 630} {"train_loss": -36.91986083984375, "global_step": 76325, "epoch": 630} {"train_loss": -37.213897705078125, "global_step": 76326, "epoch": 630} {"train_loss": -36.38795471191406, "global_step": 76327, "epoch": 630} {"train_loss": -36.39680099487305, "global_step": 76328, "epoch": 630} {"train_loss": -37.34629440307617, "global_step": 76329, "epoch": 630} {"train_loss": -37.6341552734375, "global_step": 76330, "epoch": 630} {"train_loss": -37.35508346557617, "global_step": 76331, "epoch": 630} {"train_loss": -36.28591537475586, "global_step": 76332, "epoch": 630} {"train_loss": -36.39725875854492, "global_step": 76333, "epoch": 630} {"train_loss": -35.38650131225586, "global_step": 76334, "epoch": 630} {"train_loss": -37.030189514160156, "global_step": 76335, "epoch": 630} {"train_loss": -36.782188415527344, "global_step": 76336, "epoch": 630} {"train_loss": -37.0256233215332, "global_step": 76337, "epoch": 630} {"train_loss": -35.417110443115234, "global_step": 76338, "epoch": 630} {"train_loss": -35.679439544677734, "global_step": 76339, "epoch": 630} {"train_loss": -36.44917678833008, "global_step": 76340, "epoch": 630} {"train_loss": -37.170772552490234, "global_step": 76341, "epoch": 630} {"train_loss": -37.10765838623047, "global_step": 76342, "epoch": 630} {"train_loss": -36.03449249267578, "global_step": 76343, "epoch": 630} {"train_loss": -37.44942855834961, "global_step": 76344, "epoch": 630} {"train_loss": -36.598514556884766, "global_step": 76345, "epoch": 630} {"train_loss": -35.67079544067383, "global_step": 76346, "epoch": 630} {"train_loss": -36.565155029296875, "global_step": 76347, "epoch": 630} {"train_loss": -36.99431228637695, "global_step": 76348, "epoch": 630} {"train_loss": -37.918373107910156, "global_step": 76349, "epoch": 630} {"train_loss": -36.67302292437593, "global_step": 76350, "epoch": 630, "val_loss": 2701305.0} {"train_loss": -37.563751220703125, "global_step": 76351, "epoch": 631} {"train_loss": -36.74104309082031, "global_step": 76352, "epoch": 631} {"train_loss": -37.31431579589844, "global_step": 76353, "epoch": 631} {"train_loss": -37.35404586791992, "global_step": 76354, "epoch": 631} {"train_loss": -37.3327751159668, "global_step": 76355, "epoch": 631} {"train_loss": -37.506622314453125, "global_step": 76356, "epoch": 631} {"train_loss": -36.69270706176758, "global_step": 76357, "epoch": 631} {"train_loss": -36.90579605102539, "global_step": 76358, "epoch": 631} {"train_loss": -34.81571960449219, "global_step": 76359, "epoch": 631} {"train_loss": -35.39857482910156, "global_step": 76360, "epoch": 631} {"train_loss": -34.781375885009766, "global_step": 76361, "epoch": 631} {"train_loss": -34.05451202392578, "global_step": 76362, "epoch": 631} {"train_loss": -35.00118637084961, "global_step": 76363, "epoch": 631} {"train_loss": -36.961944580078125, "global_step": 76364, "epoch": 631} {"train_loss": -37.06549835205078, "global_step": 76365, "epoch": 631} {"train_loss": -36.61560821533203, "global_step": 76366, "epoch": 631} {"train_loss": -36.99933624267578, "global_step": 76367, "epoch": 631} {"train_loss": -37.548492431640625, "global_step": 76368, "epoch": 631} {"train_loss": -37.7473258972168, "global_step": 76369, "epoch": 631} {"train_loss": -35.81972122192383, "global_step": 76370, "epoch": 631} {"train_loss": -35.72361373901367, "global_step": 76371, "epoch": 631} {"train_loss": -36.71834945678711, "global_step": 76372, "epoch": 631} {"train_loss": -35.15003204345703, "global_step": 76373, "epoch": 631} {"train_loss": -32.13300704956055, "global_step": 76374, "epoch": 631} {"train_loss": -32.47915267944336, "global_step": 76375, "epoch": 631} {"train_loss": -36.329071044921875, "global_step": 76376, "epoch": 631} {"train_loss": -34.92316436767578, "global_step": 76377, "epoch": 631} {"train_loss": -33.0713996887207, "global_step": 76378, "epoch": 631} {"train_loss": -36.462093353271484, "global_step": 76379, "epoch": 631} {"train_loss": -36.35673141479492, "global_step": 76380, "epoch": 631} {"train_loss": -34.75034713745117, "global_step": 76381, "epoch": 631} {"train_loss": -37.15827178955078, "global_step": 76382, "epoch": 631} {"train_loss": -36.06250762939453, "global_step": 76383, "epoch": 631} {"train_loss": -36.33637237548828, "global_step": 76384, "epoch": 631} {"train_loss": -35.21897506713867, "global_step": 76385, "epoch": 631} {"train_loss": -35.06380844116211, "global_step": 76386, "epoch": 631} {"train_loss": -36.14154052734375, "global_step": 76387, "epoch": 631} {"train_loss": -35.75246047973633, "global_step": 76388, "epoch": 631} {"train_loss": -36.17145538330078, "global_step": 76389, "epoch": 631} {"train_loss": -35.08768081665039, "global_step": 76390, "epoch": 631} {"train_loss": -37.1233024597168, "global_step": 76391, "epoch": 631} {"train_loss": -35.56772994995117, "global_step": 76392, "epoch": 631} {"train_loss": -36.068946838378906, "global_step": 76393, "epoch": 631} {"train_loss": -36.042293548583984, "global_step": 76394, "epoch": 631} {"train_loss": -36.74859619140625, "global_step": 76395, "epoch": 631} {"train_loss": -36.362247467041016, "global_step": 76396, "epoch": 631} {"train_loss": -36.13397979736328, "global_step": 76397, "epoch": 631} {"train_loss": -37.14897155761719, "global_step": 76398, "epoch": 631} {"train_loss": -36.479408264160156, "global_step": 76399, "epoch": 631} {"train_loss": -36.297977447509766, "global_step": 76400, "epoch": 631} {"train_loss": -36.91501998901367, "global_step": 76401, "epoch": 631} {"train_loss": -36.549983978271484, "global_step": 76402, "epoch": 631} {"train_loss": -37.17993927001953, "global_step": 76403, "epoch": 631} {"train_loss": -36.94279861450195, "global_step": 76404, "epoch": 631} {"train_loss": -37.19321060180664, "global_step": 76405, "epoch": 631} {"train_loss": -36.90940475463867, "global_step": 76406, "epoch": 631} {"train_loss": -37.02186584472656, "global_step": 76407, "epoch": 631} {"train_loss": -36.964500427246094, "global_step": 76408, "epoch": 631} {"train_loss": -36.51960372924805, "global_step": 76409, "epoch": 631} {"train_loss": -36.86286163330078, "global_step": 76410, "epoch": 631} {"train_loss": -37.1222038269043, "global_step": 76411, "epoch": 631} {"train_loss": -36.91303253173828, "global_step": 76412, "epoch": 631} {"train_loss": -35.968563079833984, "global_step": 76413, "epoch": 631} {"train_loss": -36.67464065551758, "global_step": 76414, "epoch": 631} {"train_loss": -37.264278411865234, "global_step": 76415, "epoch": 631} {"train_loss": -37.128448486328125, "global_step": 76416, "epoch": 631} {"train_loss": -37.45246124267578, "global_step": 76417, "epoch": 631} {"train_loss": -37.07514572143555, "global_step": 76418, "epoch": 631} {"train_loss": -37.158077239990234, "global_step": 76419, "epoch": 631} {"train_loss": -37.17977523803711, "global_step": 76420, "epoch": 631} {"train_loss": -37.24452590942383, "global_step": 76421, "epoch": 631} {"train_loss": -37.916316986083984, "global_step": 76422, "epoch": 631} {"train_loss": -37.244728088378906, "global_step": 76423, "epoch": 631} {"train_loss": -37.625946044921875, "global_step": 76424, "epoch": 631} {"train_loss": -37.85087585449219, "global_step": 76425, "epoch": 631} {"train_loss": -37.852027893066406, "global_step": 76426, "epoch": 631} {"train_loss": -37.69287109375, "global_step": 76427, "epoch": 631} {"train_loss": -36.69257736206055, "global_step": 76428, "epoch": 631} {"train_loss": -36.503692626953125, "global_step": 76429, "epoch": 631} {"train_loss": -36.49029541015625, "global_step": 76430, "epoch": 631} {"train_loss": -37.84575653076172, "global_step": 76431, "epoch": 631} {"train_loss": -37.42271041870117, "global_step": 76432, "epoch": 631} {"train_loss": -36.97262191772461, "global_step": 76433, "epoch": 631} {"train_loss": -37.351036071777344, "global_step": 76434, "epoch": 631} {"train_loss": -36.67629623413086, "global_step": 76435, "epoch": 631} {"train_loss": -37.30474853515625, "global_step": 76436, "epoch": 631} {"train_loss": -37.63725280761719, "global_step": 76437, "epoch": 631} {"train_loss": -37.92753982543945, "global_step": 76438, "epoch": 631} {"train_loss": -37.69814682006836, "global_step": 76439, "epoch": 631} {"train_loss": -37.47037887573242, "global_step": 76440, "epoch": 631} {"train_loss": -37.41043472290039, "global_step": 76441, "epoch": 631} {"train_loss": -37.08701705932617, "global_step": 76442, "epoch": 631} {"train_loss": -37.698787689208984, "global_step": 76443, "epoch": 631} {"train_loss": -37.21381759643555, "global_step": 76444, "epoch": 631} {"train_loss": -37.63556671142578, "global_step": 76445, "epoch": 631} {"train_loss": -37.61128234863281, "global_step": 76446, "epoch": 631} {"train_loss": -37.878448486328125, "global_step": 76447, "epoch": 631} {"train_loss": -37.83544158935547, "global_step": 76448, "epoch": 631} {"train_loss": -37.357635498046875, "global_step": 76449, "epoch": 631} {"train_loss": -37.8264045715332, "global_step": 76450, "epoch": 631} {"train_loss": -37.62788009643555, "global_step": 76451, "epoch": 631} {"train_loss": -37.87076950073242, "global_step": 76452, "epoch": 631} {"train_loss": -36.23203659057617, "global_step": 76453, "epoch": 631} {"train_loss": -36.21561813354492, "global_step": 76454, "epoch": 631} {"train_loss": -37.062015533447266, "global_step": 76455, "epoch": 631} {"train_loss": -37.20075607299805, "global_step": 76456, "epoch": 631} {"train_loss": -37.83274459838867, "global_step": 76457, "epoch": 631} {"train_loss": -36.47938919067383, "global_step": 76458, "epoch": 631} {"train_loss": -37.042869567871094, "global_step": 76459, "epoch": 631} {"train_loss": -37.2955207824707, "global_step": 76460, "epoch": 631} {"train_loss": -37.617740631103516, "global_step": 76461, "epoch": 631} {"train_loss": -38.16347122192383, "global_step": 76462, "epoch": 631} {"train_loss": -36.415565490722656, "global_step": 76463, "epoch": 631} {"train_loss": -36.3863639831543, "global_step": 76464, "epoch": 631} {"train_loss": -35.69999694824219, "global_step": 76465, "epoch": 631} {"train_loss": -37.57399368286133, "global_step": 76466, "epoch": 631} {"train_loss": -36.659908294677734, "global_step": 76467, "epoch": 631} {"train_loss": -36.088661193847656, "global_step": 76468, "epoch": 631} {"train_loss": -35.62274932861328, "global_step": 76469, "epoch": 631} {"train_loss": -37.908870697021484, "global_step": 76470, "epoch": 631} {"train_loss": -36.68829733478136, "global_step": 76471, "epoch": 631, "val_loss": 2566305.25} {"train_loss": -34.3616943359375, "global_step": 76472, "epoch": 632} {"train_loss": -35.6419792175293, "global_step": 76473, "epoch": 632} {"train_loss": -38.05550765991211, "global_step": 76474, "epoch": 632} {"train_loss": -35.4707145690918, "global_step": 76475, "epoch": 632} {"train_loss": -35.500885009765625, "global_step": 76476, "epoch": 632} {"train_loss": -35.38819122314453, "global_step": 76477, "epoch": 632} {"train_loss": -36.13117599487305, "global_step": 76478, "epoch": 632} {"train_loss": -36.67811584472656, "global_step": 76479, "epoch": 632} {"train_loss": -36.63490676879883, "global_step": 76480, "epoch": 632} {"train_loss": -36.19729232788086, "global_step": 76481, "epoch": 632} {"train_loss": -33.81211471557617, "global_step": 76482, "epoch": 632} {"train_loss": -32.295570373535156, "global_step": 76483, "epoch": 632} {"train_loss": -35.186004638671875, "global_step": 76484, "epoch": 632} {"train_loss": -37.201942443847656, "global_step": 76485, "epoch": 632} {"train_loss": -36.55926513671875, "global_step": 76486, "epoch": 632} {"train_loss": -36.90314483642578, "global_step": 76487, "epoch": 632} {"train_loss": -36.7286491394043, "global_step": 76488, "epoch": 632} {"train_loss": -36.76129150390625, "global_step": 76489, "epoch": 632} {"train_loss": -35.3627815246582, "global_step": 76490, "epoch": 632} {"train_loss": -37.427486419677734, "global_step": 76491, "epoch": 632} {"train_loss": -37.60480499267578, "global_step": 76492, "epoch": 632} {"train_loss": -37.41946029663086, "global_step": 76493, "epoch": 632} {"train_loss": -37.60187530517578, "global_step": 76494, "epoch": 632} {"train_loss": -36.99893569946289, "global_step": 76495, "epoch": 632} {"train_loss": -37.70027542114258, "global_step": 76496, "epoch": 632} {"train_loss": -37.73365020751953, "global_step": 76497, "epoch": 632} {"train_loss": -38.156646728515625, "global_step": 76498, "epoch": 632} {"train_loss": -36.98134231567383, "global_step": 76499, "epoch": 632} {"train_loss": -37.76231002807617, "global_step": 76500, "epoch": 632} {"train_loss": -37.674888610839844, "global_step": 76501, "epoch": 632} {"train_loss": -37.87451171875, "global_step": 76502, "epoch": 632} {"train_loss": -37.651405334472656, "global_step": 76503, "epoch": 632} {"train_loss": -37.87257766723633, "global_step": 76504, "epoch": 632} {"train_loss": -37.341278076171875, "global_step": 76505, "epoch": 632} {"train_loss": -36.828819274902344, "global_step": 76506, "epoch": 632} {"train_loss": -38.22755813598633, "global_step": 76507, "epoch": 632} {"train_loss": -37.132301330566406, "global_step": 76508, "epoch": 632} {"train_loss": -37.730831146240234, "global_step": 76509, "epoch": 632} {"train_loss": -36.95441818237305, "global_step": 76510, "epoch": 632} {"train_loss": -37.788848876953125, "global_step": 76511, "epoch": 632} {"train_loss": -36.71908187866211, "global_step": 76512, "epoch": 632} {"train_loss": -37.83618927001953, "global_step": 76513, "epoch": 632} {"train_loss": -37.42231369018555, "global_step": 76514, "epoch": 632} {"train_loss": -37.802703857421875, "global_step": 76515, "epoch": 632} {"train_loss": -35.89682388305664, "global_step": 76516, "epoch": 632} {"train_loss": -37.18180465698242, "global_step": 76517, "epoch": 632} {"train_loss": -37.48768997192383, "global_step": 76518, "epoch": 632} {"train_loss": -37.879127502441406, "global_step": 76519, "epoch": 632} {"train_loss": -36.27871322631836, "global_step": 76520, "epoch": 632} {"train_loss": -37.4600944519043, "global_step": 76521, "epoch": 632} {"train_loss": -33.4642219543457, "global_step": 76522, "epoch": 632} {"train_loss": -33.511024475097656, "global_step": 76523, "epoch": 632} {"train_loss": -36.979225158691406, "global_step": 76524, "epoch": 632} {"train_loss": -35.799251556396484, "global_step": 76525, "epoch": 632} {"train_loss": -35.26941680908203, "global_step": 76526, "epoch": 632} {"train_loss": -34.118080139160156, "global_step": 76527, "epoch": 632} {"train_loss": -36.21686935424805, "global_step": 76528, "epoch": 632} {"train_loss": -37.03266525268555, "global_step": 76529, "epoch": 632} {"train_loss": -35.11355972290039, "global_step": 76530, "epoch": 632} {"train_loss": -35.94778060913086, "global_step": 76531, "epoch": 632} {"train_loss": -34.246585845947266, "global_step": 76532, "epoch": 632} {"train_loss": -35.171546936035156, "global_step": 76533, "epoch": 632} {"train_loss": -35.50057601928711, "global_step": 76534, "epoch": 632} {"train_loss": -35.75081253051758, "global_step": 76535, "epoch": 632} {"train_loss": -36.464332580566406, "global_step": 76536, "epoch": 632} {"train_loss": -36.4620475769043, "global_step": 76537, "epoch": 632} {"train_loss": -35.51459884643555, "global_step": 76538, "epoch": 632} {"train_loss": -35.714298248291016, "global_step": 76539, "epoch": 632} {"train_loss": -36.52202224731445, "global_step": 76540, "epoch": 632} {"train_loss": -35.70888137817383, "global_step": 76541, "epoch": 632} {"train_loss": -36.768638610839844, "global_step": 76542, "epoch": 632} {"train_loss": -35.28973388671875, "global_step": 76543, "epoch": 632} {"train_loss": -37.09304428100586, "global_step": 76544, "epoch": 632} {"train_loss": -36.40756607055664, "global_step": 76545, "epoch": 632} {"train_loss": -36.454986572265625, "global_step": 76546, "epoch": 632} {"train_loss": -36.454864501953125, "global_step": 76547, "epoch": 632} {"train_loss": -37.31809997558594, "global_step": 76548, "epoch": 632} {"train_loss": -36.6629753112793, "global_step": 76549, "epoch": 632} {"train_loss": -35.81895065307617, "global_step": 76550, "epoch": 632} {"train_loss": -36.3049430847168, "global_step": 76551, "epoch": 632} {"train_loss": -36.8816032409668, "global_step": 76552, "epoch": 632} {"train_loss": -37.16779708862305, "global_step": 76553, "epoch": 632} {"train_loss": -37.26003646850586, "global_step": 76554, "epoch": 632} {"train_loss": -36.442325592041016, "global_step": 76555, "epoch": 632} {"train_loss": -37.196285247802734, "global_step": 76556, "epoch": 632} {"train_loss": -36.819271087646484, "global_step": 76557, "epoch": 632} {"train_loss": -37.32064437866211, "global_step": 76558, "epoch": 632} {"train_loss": -36.102439880371094, "global_step": 76559, "epoch": 632} {"train_loss": -37.276336669921875, "global_step": 76560, "epoch": 632} {"train_loss": -34.98451614379883, "global_step": 76561, "epoch": 632} {"train_loss": -34.39305114746094, "global_step": 76562, "epoch": 632} {"train_loss": -34.45553970336914, "global_step": 76563, "epoch": 632} {"train_loss": -35.55979919433594, "global_step": 76564, "epoch": 632} {"train_loss": -34.041412353515625, "global_step": 76565, "epoch": 632} {"train_loss": -33.87746810913086, "global_step": 76566, "epoch": 632} {"train_loss": -35.88395309448242, "global_step": 76567, "epoch": 632} {"train_loss": -36.981590270996094, "global_step": 76568, "epoch": 632} {"train_loss": -34.53581619262695, "global_step": 76569, "epoch": 632} {"train_loss": -34.434146881103516, "global_step": 76570, "epoch": 632} {"train_loss": -34.790950775146484, "global_step": 76571, "epoch": 632} {"train_loss": -36.847434997558594, "global_step": 76572, "epoch": 632} {"train_loss": -36.244964599609375, "global_step": 76573, "epoch": 632} {"train_loss": -36.72445297241211, "global_step": 76574, "epoch": 632} {"train_loss": -36.48943328857422, "global_step": 76575, "epoch": 632} {"train_loss": -37.53729248046875, "global_step": 76576, "epoch": 632} {"train_loss": -36.805335998535156, "global_step": 76577, "epoch": 632} {"train_loss": -37.477996826171875, "global_step": 76578, "epoch": 632} {"train_loss": -37.410762786865234, "global_step": 76579, "epoch": 632} {"train_loss": -37.199947357177734, "global_step": 76580, "epoch": 632} {"train_loss": -37.66469192504883, "global_step": 76581, "epoch": 632} {"train_loss": -37.51372528076172, "global_step": 76582, "epoch": 632} {"train_loss": -37.63877487182617, "global_step": 76583, "epoch": 632} {"train_loss": -37.465450286865234, "global_step": 76584, "epoch": 632} {"train_loss": -36.576351165771484, "global_step": 76585, "epoch": 632} {"train_loss": -37.65061950683594, "global_step": 76586, "epoch": 632} {"train_loss": -37.28902816772461, "global_step": 76587, "epoch": 632} {"train_loss": -37.177001953125, "global_step": 76588, "epoch": 632} {"train_loss": -37.19603729248047, "global_step": 76589, "epoch": 632} {"train_loss": -36.383602142333984, "global_step": 76590, "epoch": 632} {"train_loss": -37.49567794799805, "global_step": 76591, "epoch": 632} {"train_loss": -36.47428427451898, "global_step": 76592, "epoch": 632, "val_loss": 2658778.5} {"train_loss": -36.61130905151367, "global_step": 76593, "epoch": 633} {"train_loss": -37.0970458984375, "global_step": 76594, "epoch": 633} {"train_loss": -36.895565032958984, "global_step": 76595, "epoch": 633} {"train_loss": -37.026851654052734, "global_step": 76596, "epoch": 633} {"train_loss": -37.14743423461914, "global_step": 76597, "epoch": 633} {"train_loss": -37.593421936035156, "global_step": 76598, "epoch": 633} {"train_loss": -37.59129333496094, "global_step": 76599, "epoch": 633} {"train_loss": -37.67534637451172, "global_step": 76600, "epoch": 633} {"train_loss": -37.845455169677734, "global_step": 76601, "epoch": 633} {"train_loss": -37.58937072753906, "global_step": 76602, "epoch": 633} {"train_loss": -37.71316146850586, "global_step": 76603, "epoch": 633} {"train_loss": -37.80710983276367, "global_step": 76604, "epoch": 633} {"train_loss": -37.117244720458984, "global_step": 76605, "epoch": 633} {"train_loss": -37.52919387817383, "global_step": 76606, "epoch": 633} {"train_loss": -37.54777145385742, "global_step": 76607, "epoch": 633} {"train_loss": -37.33897018432617, "global_step": 76608, "epoch": 633} {"train_loss": -38.0382080078125, "global_step": 76609, "epoch": 633} {"train_loss": -37.58856964111328, "global_step": 76610, "epoch": 633} {"train_loss": -37.768646240234375, "global_step": 76611, "epoch": 633} {"train_loss": -37.70392608642578, "global_step": 76612, "epoch": 633} {"train_loss": -37.636871337890625, "global_step": 76613, "epoch": 633} {"train_loss": -36.9137077331543, "global_step": 76614, "epoch": 633} {"train_loss": -37.248016357421875, "global_step": 76615, "epoch": 633} {"train_loss": -36.98072052001953, "global_step": 76616, "epoch": 633} {"train_loss": -36.426177978515625, "global_step": 76617, "epoch": 633} {"train_loss": -36.27043533325195, "global_step": 76618, "epoch": 633} {"train_loss": -33.7631721496582, "global_step": 76619, "epoch": 633} {"train_loss": -31.686750411987305, "global_step": 76620, "epoch": 633} {"train_loss": -31.019092559814453, "global_step": 76621, "epoch": 633} {"train_loss": -33.47099685668945, "global_step": 76622, "epoch": 633} {"train_loss": -36.176177978515625, "global_step": 76623, "epoch": 633} {"train_loss": -36.290260314941406, "global_step": 76624, "epoch": 633} {"train_loss": -35.73299026489258, "global_step": 76625, "epoch": 633} {"train_loss": -35.95586013793945, "global_step": 76626, "epoch": 633} {"train_loss": -35.5837516784668, "global_step": 76627, "epoch": 633} {"train_loss": -34.55231475830078, "global_step": 76628, "epoch": 633} {"train_loss": -35.66047286987305, "global_step": 76629, "epoch": 633} {"train_loss": -36.562313079833984, "global_step": 76630, "epoch": 633} {"train_loss": -36.87508773803711, "global_step": 76631, "epoch": 633} {"train_loss": -36.95829391479492, "global_step": 76632, "epoch": 633} {"train_loss": -36.379493713378906, "global_step": 76633, "epoch": 633} {"train_loss": -34.71458053588867, "global_step": 76634, "epoch": 633} {"train_loss": -36.24240493774414, "global_step": 76635, "epoch": 633} {"train_loss": -36.98974609375, "global_step": 76636, "epoch": 633} {"train_loss": -35.23338317871094, "global_step": 76637, "epoch": 633} {"train_loss": -35.96620559692383, "global_step": 76638, "epoch": 633} {"train_loss": -36.75803756713867, "global_step": 76639, "epoch": 633} {"train_loss": -36.50319290161133, "global_step": 76640, "epoch": 633} {"train_loss": -36.85756301879883, "global_step": 76641, "epoch": 633} {"train_loss": -36.89423370361328, "global_step": 76642, "epoch": 633} {"train_loss": -36.22838592529297, "global_step": 76643, "epoch": 633} {"train_loss": -37.188716888427734, "global_step": 76644, "epoch": 633} {"train_loss": -37.466976165771484, "global_step": 76645, "epoch": 633} {"train_loss": -37.60850524902344, "global_step": 76646, "epoch": 633} {"train_loss": -36.781002044677734, "global_step": 76647, "epoch": 633} {"train_loss": -37.699615478515625, "global_step": 76648, "epoch": 633} {"train_loss": -37.24991989135742, "global_step": 76649, "epoch": 633} {"train_loss": -37.43259048461914, "global_step": 76650, "epoch": 633} {"train_loss": -35.39715576171875, "global_step": 76651, "epoch": 633} {"train_loss": -37.03885269165039, "global_step": 76652, "epoch": 633} {"train_loss": -37.25297164916992, "global_step": 76653, "epoch": 633} {"train_loss": -36.187313079833984, "global_step": 76654, "epoch": 633} {"train_loss": -37.316925048828125, "global_step": 76655, "epoch": 633} {"train_loss": -36.91019821166992, "global_step": 76656, "epoch": 633} {"train_loss": -37.62675094604492, "global_step": 76657, "epoch": 633} {"train_loss": -37.29598617553711, "global_step": 76658, "epoch": 633} {"train_loss": -37.52147674560547, "global_step": 76659, "epoch": 633} {"train_loss": -37.009437561035156, "global_step": 76660, "epoch": 633} {"train_loss": -37.50479507446289, "global_step": 76661, "epoch": 633} {"train_loss": -37.6057014465332, "global_step": 76662, "epoch": 633} {"train_loss": -36.8553466796875, "global_step": 76663, "epoch": 633} {"train_loss": -37.72222900390625, "global_step": 76664, "epoch": 633} {"train_loss": -37.01887130737305, "global_step": 76665, "epoch": 633} {"train_loss": -38.055023193359375, "global_step": 76666, "epoch": 633} {"train_loss": -37.30949020385742, "global_step": 76667, "epoch": 633} {"train_loss": -37.30409240722656, "global_step": 76668, "epoch": 633} {"train_loss": -37.210628509521484, "global_step": 76669, "epoch": 633} {"train_loss": -36.84458541870117, "global_step": 76670, "epoch": 633} {"train_loss": -36.431617736816406, "global_step": 76671, "epoch": 633} {"train_loss": -35.735347747802734, "global_step": 76672, "epoch": 633} {"train_loss": -37.553348541259766, "global_step": 76673, "epoch": 633} {"train_loss": -37.484519958496094, "global_step": 76674, "epoch": 633} {"train_loss": -36.901145935058594, "global_step": 76675, "epoch": 633} {"train_loss": -35.568328857421875, "global_step": 76676, "epoch": 633} {"train_loss": -37.65024948120117, "global_step": 76677, "epoch": 633} {"train_loss": -37.19105911254883, "global_step": 76678, "epoch": 633} {"train_loss": -37.47848129272461, "global_step": 76679, "epoch": 633} {"train_loss": -36.453956604003906, "global_step": 76680, "epoch": 633} {"train_loss": -37.32149124145508, "global_step": 76681, "epoch": 633} {"train_loss": -36.49564743041992, "global_step": 76682, "epoch": 633} {"train_loss": -37.376548767089844, "global_step": 76683, "epoch": 633} {"train_loss": -37.26310348510742, "global_step": 76684, "epoch": 633} {"train_loss": -37.39289093017578, "global_step": 76685, "epoch": 633} {"train_loss": -37.33234405517578, "global_step": 76686, "epoch": 633} {"train_loss": -37.78540802001953, "global_step": 76687, "epoch": 633} {"train_loss": -37.524322509765625, "global_step": 76688, "epoch": 633} {"train_loss": -37.0446662902832, "global_step": 76689, "epoch": 633} {"train_loss": -37.487464904785156, "global_step": 76690, "epoch": 633} {"train_loss": -37.23214340209961, "global_step": 76691, "epoch": 633} {"train_loss": -37.822113037109375, "global_step": 76692, "epoch": 633} {"train_loss": -36.530914306640625, "global_step": 76693, "epoch": 633} {"train_loss": -37.588985443115234, "global_step": 76694, "epoch": 633} {"train_loss": -36.804595947265625, "global_step": 76695, "epoch": 633} {"train_loss": -37.68905258178711, "global_step": 76696, "epoch": 633} {"train_loss": -37.24226760864258, "global_step": 76697, "epoch": 633} {"train_loss": -37.49653244018555, "global_step": 76698, "epoch": 633} {"train_loss": -37.391845703125, "global_step": 76699, "epoch": 633} {"train_loss": -37.41744613647461, "global_step": 76700, "epoch": 633} {"train_loss": -37.12845993041992, "global_step": 76701, "epoch": 633} {"train_loss": -36.74281692504883, "global_step": 76702, "epoch": 633} {"train_loss": -36.86520004272461, "global_step": 76703, "epoch": 633} {"train_loss": -37.05654525756836, "global_step": 76704, "epoch": 633} {"train_loss": -35.13084030151367, "global_step": 76705, "epoch": 633} {"train_loss": -32.61823654174805, "global_step": 76706, "epoch": 633} {"train_loss": -30.719900131225586, "global_step": 76707, "epoch": 633} {"train_loss": -30.355512619018555, "global_step": 76708, "epoch": 633} {"train_loss": -28.84303855895996, "global_step": 76709, "epoch": 633} {"train_loss": -35.992069244384766, "global_step": 76710, "epoch": 633} {"train_loss": -34.9714241027832, "global_step": 76711, "epoch": 633} {"train_loss": -32.62439727783203, "global_step": 76712, "epoch": 633} {"train_loss": -36.56815432714037, "global_step": 76713, "epoch": 633, "val_loss": 2627440.75} {"train_loss": -33.3964729309082, "global_step": 76714, "epoch": 634} {"train_loss": -36.12180709838867, "global_step": 76715, "epoch": 634} {"train_loss": -35.589962005615234, "global_step": 76716, "epoch": 634} {"train_loss": -37.27997589111328, "global_step": 76717, "epoch": 634} {"train_loss": -35.579463958740234, "global_step": 76718, "epoch": 634} {"train_loss": -37.1245231628418, "global_step": 76719, "epoch": 634} {"train_loss": -35.60309982299805, "global_step": 76720, "epoch": 634} {"train_loss": -37.320064544677734, "global_step": 76721, "epoch": 634} {"train_loss": -36.45740509033203, "global_step": 76722, "epoch": 634} {"train_loss": -35.28506851196289, "global_step": 76723, "epoch": 634} {"train_loss": -36.915191650390625, "global_step": 76724, "epoch": 634} {"train_loss": -35.80103302001953, "global_step": 76725, "epoch": 634} {"train_loss": -37.42930603027344, "global_step": 76726, "epoch": 634} {"train_loss": -36.95094680786133, "global_step": 76727, "epoch": 634} {"train_loss": -37.1098518371582, "global_step": 76728, "epoch": 634} {"train_loss": -37.18537521362305, "global_step": 76729, "epoch": 634} {"train_loss": -36.35621643066406, "global_step": 76730, "epoch": 634} {"train_loss": -37.01068878173828, "global_step": 76731, "epoch": 634} {"train_loss": -36.88241195678711, "global_step": 76732, "epoch": 634} {"train_loss": -37.4422492980957, "global_step": 76733, "epoch": 634} {"train_loss": -37.45758056640625, "global_step": 76734, "epoch": 634} {"train_loss": -37.2942008972168, "global_step": 76735, "epoch": 634} {"train_loss": -37.58053207397461, "global_step": 76736, "epoch": 634} {"train_loss": -38.144859313964844, "global_step": 76737, "epoch": 634} {"train_loss": -37.13011932373047, "global_step": 76738, "epoch": 634} {"train_loss": -37.73096466064453, "global_step": 76739, "epoch": 634} {"train_loss": -37.81216049194336, "global_step": 76740, "epoch": 634} {"train_loss": -28.007862091064453, "global_step": 76741, "epoch": 634} {"train_loss": -36.10004806518555, "global_step": 76742, "epoch": 634} {"train_loss": -34.88758850097656, "global_step": 76743, "epoch": 634} {"train_loss": -35.02337646484375, "global_step": 76744, "epoch": 634} {"train_loss": -20.86288070678711, "global_step": 76745, "epoch": 634} {"train_loss": -30.299243927001953, "global_step": 76746, "epoch": 634} {"train_loss": -21.299291610717773, "global_step": 76747, "epoch": 634} {"train_loss": -25.033571243286133, "global_step": 76748, "epoch": 634} {"train_loss": -23.33770179748535, "global_step": 76749, "epoch": 634} {"train_loss": -29.543033599853516, "global_step": 76750, "epoch": 634} {"train_loss": -27.12799644470215, "global_step": 76751, "epoch": 634} {"train_loss": -19.57160758972168, "global_step": 76752, "epoch": 634} {"train_loss": -18.722890853881836, "global_step": 76753, "epoch": 634} {"train_loss": -25.511274337768555, "global_step": 76754, "epoch": 634} {"train_loss": -23.171585083007812, "global_step": 76755, "epoch": 634} {"train_loss": -23.93231201171875, "global_step": 76756, "epoch": 634} {"train_loss": -6.296564102172852, "global_step": 76757, "epoch": 634} {"train_loss": -29.7818603515625, "global_step": 76758, "epoch": 634} {"train_loss": -30.298507690429688, "global_step": 76759, "epoch": 634} {"train_loss": -31.33441162109375, "global_step": 76760, "epoch": 634} {"train_loss": -30.17433738708496, "global_step": 76761, "epoch": 634} {"train_loss": -29.556522369384766, "global_step": 76762, "epoch": 634} {"train_loss": -28.121768951416016, "global_step": 76763, "epoch": 634} {"train_loss": -29.33757972717285, "global_step": 76764, "epoch": 634} {"train_loss": -28.3566837310791, "global_step": 76765, "epoch": 634} {"train_loss": -29.28193473815918, "global_step": 76766, "epoch": 634} {"train_loss": -28.881702423095703, "global_step": 76767, "epoch": 634} {"train_loss": -30.634571075439453, "global_step": 76768, "epoch": 634} {"train_loss": -30.585845947265625, "global_step": 76769, "epoch": 634} {"train_loss": -30.523700714111328, "global_step": 76770, "epoch": 634} {"train_loss": -31.014326095581055, "global_step": 76771, "epoch": 634} {"train_loss": -31.60296630859375, "global_step": 76772, "epoch": 634} {"train_loss": -31.074804306030273, "global_step": 76773, "epoch": 634} {"train_loss": -30.73809242248535, "global_step": 76774, "epoch": 634} {"train_loss": -31.03504753112793, "global_step": 76775, "epoch": 634} {"train_loss": -31.20821189880371, "global_step": 76776, "epoch": 634} {"train_loss": -30.672592163085938, "global_step": 76777, "epoch": 634} {"train_loss": -31.281457901000977, "global_step": 76778, "epoch": 634} {"train_loss": -31.401708602905273, "global_step": 76779, "epoch": 634} {"train_loss": -31.303974151611328, "global_step": 76780, "epoch": 634} {"train_loss": -31.569049835205078, "global_step": 76781, "epoch": 634} {"train_loss": -30.698135375976562, "global_step": 76782, "epoch": 634} {"train_loss": -31.385400772094727, "global_step": 76783, "epoch": 634} {"train_loss": -31.814193725585938, "global_step": 76784, "epoch": 634} {"train_loss": -31.304059982299805, "global_step": 76785, "epoch": 634} {"train_loss": -31.958984375, "global_step": 76786, "epoch": 634} {"train_loss": -31.949371337890625, "global_step": 76787, "epoch": 634} {"train_loss": -31.754114151000977, "global_step": 76788, "epoch": 634} {"train_loss": -31.509008407592773, "global_step": 76789, "epoch": 634} {"train_loss": -31.5900936126709, "global_step": 76790, "epoch": 634} {"train_loss": -32.14476013183594, "global_step": 76791, "epoch": 634} {"train_loss": -32.353694915771484, "global_step": 76792, "epoch": 634} {"train_loss": -32.3115234375, "global_step": 76793, "epoch": 634} {"train_loss": -32.1845703125, "global_step": 76794, "epoch": 634} {"train_loss": -32.21084213256836, "global_step": 76795, "epoch": 634} {"train_loss": -32.8125, "global_step": 76796, "epoch": 634} {"train_loss": -33.77079772949219, "global_step": 76797, "epoch": 634} {"train_loss": -32.606319427490234, "global_step": 76798, "epoch": 634} {"train_loss": -32.01951217651367, "global_step": 76799, "epoch": 634} {"train_loss": -32.71749496459961, "global_step": 76800, "epoch": 634} {"train_loss": -33.55482864379883, "global_step": 76801, "epoch": 634} {"train_loss": -33.22071075439453, "global_step": 76802, "epoch": 634} {"train_loss": -32.369720458984375, "global_step": 76803, "epoch": 634} {"train_loss": -32.790557861328125, "global_step": 76804, "epoch": 634} {"train_loss": -32.73756408691406, "global_step": 76805, "epoch": 634} {"train_loss": -33.354061126708984, "global_step": 76806, "epoch": 634} {"train_loss": -33.034488677978516, "global_step": 76807, "epoch": 634} {"train_loss": -32.78056716918945, "global_step": 76808, "epoch": 634} {"train_loss": -34.00278854370117, "global_step": 76809, "epoch": 634} {"train_loss": -33.15053176879883, "global_step": 76810, "epoch": 634} {"train_loss": -33.47617721557617, "global_step": 76811, "epoch": 634} {"train_loss": -33.55404281616211, "global_step": 76812, "epoch": 634} {"train_loss": -33.05229187011719, "global_step": 76813, "epoch": 634} {"train_loss": -32.86256790161133, "global_step": 76814, "epoch": 634} {"train_loss": -33.41093063354492, "global_step": 76815, "epoch": 634} {"train_loss": -34.048641204833984, "global_step": 76816, "epoch": 634} {"train_loss": -33.11797332763672, "global_step": 76817, "epoch": 634} {"train_loss": -34.50936508178711, "global_step": 76818, "epoch": 634} {"train_loss": -34.782833099365234, "global_step": 76819, "epoch": 634} {"train_loss": -34.292640686035156, "global_step": 76820, "epoch": 634} {"train_loss": -33.872100830078125, "global_step": 76821, "epoch": 634} {"train_loss": -34.631622314453125, "global_step": 76822, "epoch": 634} {"train_loss": -33.940948486328125, "global_step": 76823, "epoch": 634} {"train_loss": -33.9547233581543, "global_step": 76824, "epoch": 634} {"train_loss": -35.00129699707031, "global_step": 76825, "epoch": 634} {"train_loss": -33.95729446411133, "global_step": 76826, "epoch": 634} {"train_loss": -34.34614181518555, "global_step": 76827, "epoch": 634} {"train_loss": -34.630062103271484, "global_step": 76828, "epoch": 634} {"train_loss": -34.42887496948242, "global_step": 76829, "epoch": 634} {"train_loss": -35.14963912963867, "global_step": 76830, "epoch": 634} {"train_loss": -33.8118896484375, "global_step": 76831, "epoch": 634} {"train_loss": -33.2730827331543, "global_step": 76832, "epoch": 634} {"train_loss": -33.941322326660156, "global_step": 76833, "epoch": 634} {"train_loss": -32.26844734002736, "global_step": 76834, "epoch": 634, "val_loss": 2689044.25} {"train_loss": -34.47732925415039, "global_step": 76835, "epoch": 635} {"train_loss": -34.291534423828125, "global_step": 76836, "epoch": 635} {"train_loss": -33.600887298583984, "global_step": 76837, "epoch": 635} {"train_loss": -32.64510726928711, "global_step": 76838, "epoch": 635} {"train_loss": -32.74164581298828, "global_step": 76839, "epoch": 635} {"train_loss": -34.24953079223633, "global_step": 76840, "epoch": 635} {"train_loss": -32.57546615600586, "global_step": 76841, "epoch": 635} {"train_loss": -34.30730056762695, "global_step": 76842, "epoch": 635} {"train_loss": -33.0566291809082, "global_step": 76843, "epoch": 635} {"train_loss": -34.93366241455078, "global_step": 76844, "epoch": 635} {"train_loss": -34.28620147705078, "global_step": 76845, "epoch": 635} {"train_loss": -34.783058166503906, "global_step": 76846, "epoch": 635} {"train_loss": -34.6202392578125, "global_step": 76847, "epoch": 635} {"train_loss": -35.128963470458984, "global_step": 76848, "epoch": 635} {"train_loss": -34.90638732910156, "global_step": 76849, "epoch": 635} {"train_loss": -34.86654281616211, "global_step": 76850, "epoch": 635} {"train_loss": -35.01668930053711, "global_step": 76851, "epoch": 635} {"train_loss": -34.73978805541992, "global_step": 76852, "epoch": 635} {"train_loss": -34.74598693847656, "global_step": 76853, "epoch": 635} {"train_loss": -35.44477462768555, "global_step": 76854, "epoch": 635} {"train_loss": -35.43363571166992, "global_step": 76855, "epoch": 635} {"train_loss": -35.22806930541992, "global_step": 76856, "epoch": 635} {"train_loss": -35.27126693725586, "global_step": 76857, "epoch": 635} {"train_loss": -35.02956008911133, "global_step": 76858, "epoch": 635} {"train_loss": -35.469268798828125, "global_step": 76859, "epoch": 635} {"train_loss": -35.50017547607422, "global_step": 76860, "epoch": 635} {"train_loss": -35.16721725463867, "global_step": 76861, "epoch": 635} {"train_loss": -34.961219787597656, "global_step": 76862, "epoch": 635} {"train_loss": -35.12077713012695, "global_step": 76863, "epoch": 635} {"train_loss": -36.00752639770508, "global_step": 76864, "epoch": 635} {"train_loss": -35.62348556518555, "global_step": 76865, "epoch": 635} {"train_loss": -35.50157928466797, "global_step": 76866, "epoch": 635} {"train_loss": -36.56690216064453, "global_step": 76867, "epoch": 635} {"train_loss": -36.14155960083008, "global_step": 76868, "epoch": 635} {"train_loss": -35.777015686035156, "global_step": 76869, "epoch": 635} {"train_loss": -35.569313049316406, "global_step": 76870, "epoch": 635} {"train_loss": -36.3101921081543, "global_step": 76871, "epoch": 635} {"train_loss": -35.083499908447266, "global_step": 76872, "epoch": 635} {"train_loss": -36.09111404418945, "global_step": 76873, "epoch": 635} {"train_loss": -35.717132568359375, "global_step": 76874, "epoch": 635} {"train_loss": -36.6949348449707, "global_step": 76875, "epoch": 635} {"train_loss": -35.6790885925293, "global_step": 76876, "epoch": 635} {"train_loss": -36.32841110229492, "global_step": 76877, "epoch": 635} {"train_loss": -36.05744552612305, "global_step": 76878, "epoch": 635} {"train_loss": -35.918941497802734, "global_step": 76879, "epoch": 635} {"train_loss": -35.793174743652344, "global_step": 76880, "epoch": 635} {"train_loss": -36.40876388549805, "global_step": 76881, "epoch": 635} {"train_loss": -36.12911605834961, "global_step": 76882, "epoch": 635} {"train_loss": -36.22475814819336, "global_step": 76883, "epoch": 635} {"train_loss": -35.5706901550293, "global_step": 76884, "epoch": 635} {"train_loss": -36.777862548828125, "global_step": 76885, "epoch": 635} {"train_loss": -35.489952087402344, "global_step": 76886, "epoch": 635} {"train_loss": -36.144195556640625, "global_step": 76887, "epoch": 635} {"train_loss": -37.01763916015625, "global_step": 76888, "epoch": 635} {"train_loss": -35.33229064941406, "global_step": 76889, "epoch": 635} {"train_loss": -36.3607292175293, "global_step": 76890, "epoch": 635} {"train_loss": -35.79920196533203, "global_step": 76891, "epoch": 635} {"train_loss": -35.6076545715332, "global_step": 76892, "epoch": 635} {"train_loss": -36.51963806152344, "global_step": 76893, "epoch": 635} {"train_loss": -36.057918548583984, "global_step": 76894, "epoch": 635} {"train_loss": -36.38644027709961, "global_step": 76895, "epoch": 635} {"train_loss": -36.30569076538086, "global_step": 76896, "epoch": 635} {"train_loss": -36.1737060546875, "global_step": 76897, "epoch": 635} {"train_loss": -35.978607177734375, "global_step": 76898, "epoch": 635} {"train_loss": -34.40313720703125, "global_step": 76899, "epoch": 635} {"train_loss": -32.55643844604492, "global_step": 76900, "epoch": 635} {"train_loss": -19.0915584564209, "global_step": 76901, "epoch": 635} {"train_loss": 33.53312301635742, "global_step": 76902, "epoch": 635} {"train_loss": 25.464431762695312, "global_step": 76903, "epoch": 635} {"train_loss": -28.106494903564453, "global_step": 76904, "epoch": 635} {"train_loss": 6.754950046539307, "global_step": 76905, "epoch": 635} {"train_loss": -20.374128341674805, "global_step": 76906, "epoch": 635} {"train_loss": -19.44925880432129, "global_step": 76907, "epoch": 635} {"train_loss": -13.271140098571777, "global_step": 76908, "epoch": 635} {"train_loss": -32.627437591552734, "global_step": 76909, "epoch": 635} {"train_loss": -19.461578369140625, "global_step": 76910, "epoch": 635} {"train_loss": -25.015056610107422, "global_step": 76911, "epoch": 635} {"train_loss": -32.72556686401367, "global_step": 76912, "epoch": 635} {"train_loss": -31.399206161499023, "global_step": 76913, "epoch": 635} {"train_loss": -25.237041473388672, "global_step": 76914, "epoch": 635} {"train_loss": -27.70576286315918, "global_step": 76915, "epoch": 635} {"train_loss": -32.34668731689453, "global_step": 76916, "epoch": 635} {"train_loss": -33.221004486083984, "global_step": 76917, "epoch": 635} {"train_loss": -30.611469268798828, "global_step": 76918, "epoch": 635} {"train_loss": -30.499975204467773, "global_step": 76919, "epoch": 635} {"train_loss": -31.0194034576416, "global_step": 76920, "epoch": 635} {"train_loss": -32.21134567260742, "global_step": 76921, "epoch": 635} {"train_loss": -33.2715950012207, "global_step": 76922, "epoch": 635} {"train_loss": -33.211090087890625, "global_step": 76923, "epoch": 635} {"train_loss": -32.83114242553711, "global_step": 76924, "epoch": 635} {"train_loss": -32.79684066772461, "global_step": 76925, "epoch": 635} {"train_loss": -32.789894104003906, "global_step": 76926, "epoch": 635} {"train_loss": -32.647647857666016, "global_step": 76927, "epoch": 635} {"train_loss": -33.56235885620117, "global_step": 76928, "epoch": 635} {"train_loss": -33.048614501953125, "global_step": 76929, "epoch": 635} {"train_loss": -33.57973098754883, "global_step": 76930, "epoch": 635} {"train_loss": -33.616943359375, "global_step": 76931, "epoch": 635} {"train_loss": -33.3037223815918, "global_step": 76932, "epoch": 635} {"train_loss": -32.975120544433594, "global_step": 76933, "epoch": 635} {"train_loss": -33.35231399536133, "global_step": 76934, "epoch": 635} {"train_loss": -34.19799041748047, "global_step": 76935, "epoch": 635} {"train_loss": -33.93018341064453, "global_step": 76936, "epoch": 635} {"train_loss": -33.950950622558594, "global_step": 76937, "epoch": 635} {"train_loss": -33.935203552246094, "global_step": 76938, "epoch": 635} {"train_loss": -33.855587005615234, "global_step": 76939, "epoch": 635} {"train_loss": -33.97997283935547, "global_step": 76940, "epoch": 635} {"train_loss": -34.21879959106445, "global_step": 76941, "epoch": 635} {"train_loss": -34.52081298828125, "global_step": 76942, "epoch": 635} {"train_loss": -34.45737838745117, "global_step": 76943, "epoch": 635} {"train_loss": -34.66469955444336, "global_step": 76944, "epoch": 635} {"train_loss": -34.162879943847656, "global_step": 76945, "epoch": 635} {"train_loss": -34.56827163696289, "global_step": 76946, "epoch": 635} {"train_loss": -34.89010238647461, "global_step": 76947, "epoch": 635} {"train_loss": -34.74338150024414, "global_step": 76948, "epoch": 635} {"train_loss": -34.86720657348633, "global_step": 76949, "epoch": 635} {"train_loss": -34.95862579345703, "global_step": 76950, "epoch": 635} {"train_loss": -35.28147506713867, "global_step": 76951, "epoch": 635} {"train_loss": -35.39875411987305, "global_step": 76952, "epoch": 635} {"train_loss": -35.16765213012695, "global_step": 76953, "epoch": 635} {"train_loss": -35.727020263671875, "global_step": 76954, "epoch": 635} {"train_loss": -32.287454293779106, "global_step": 76955, "epoch": 635, "val_loss": 2674769.25} {"train_loss": -35.56644821166992, "global_step": 76956, "epoch": 636} {"train_loss": -35.40528106689453, "global_step": 76957, "epoch": 636} {"train_loss": -35.36809158325195, "global_step": 76958, "epoch": 636} {"train_loss": -35.8031005859375, "global_step": 76959, "epoch": 636} {"train_loss": -35.44456100463867, "global_step": 76960, "epoch": 636} {"train_loss": -35.38264083862305, "global_step": 76961, "epoch": 636} {"train_loss": -35.8848991394043, "global_step": 76962, "epoch": 636} {"train_loss": -35.372737884521484, "global_step": 76963, "epoch": 636} {"train_loss": -35.94118881225586, "global_step": 76964, "epoch": 636} {"train_loss": -35.95235061645508, "global_step": 76965, "epoch": 636} {"train_loss": -35.71195602416992, "global_step": 76966, "epoch": 636} {"train_loss": -35.974464416503906, "global_step": 76967, "epoch": 636} {"train_loss": -35.49835968017578, "global_step": 76968, "epoch": 636} {"train_loss": -35.23172378540039, "global_step": 76969, "epoch": 636} {"train_loss": -36.102569580078125, "global_step": 76970, "epoch": 636} {"train_loss": -36.15036392211914, "global_step": 76971, "epoch": 636} {"train_loss": -36.3555908203125, "global_step": 76972, "epoch": 636} {"train_loss": -35.89619827270508, "global_step": 76973, "epoch": 636} {"train_loss": -35.984405517578125, "global_step": 76974, "epoch": 636} {"train_loss": -36.54219436645508, "global_step": 76975, "epoch": 636} {"train_loss": -35.89005661010742, "global_step": 76976, "epoch": 636} {"train_loss": -36.1901741027832, "global_step": 76977, "epoch": 636} {"train_loss": -36.170196533203125, "global_step": 76978, "epoch": 636} {"train_loss": -36.273372650146484, "global_step": 76979, "epoch": 636} {"train_loss": -36.40729904174805, "global_step": 76980, "epoch": 636} {"train_loss": -36.64067459106445, "global_step": 76981, "epoch": 636} {"train_loss": -36.88190460205078, "global_step": 76982, "epoch": 636} {"train_loss": -36.0467414855957, "global_step": 76983, "epoch": 636} {"train_loss": -36.453956604003906, "global_step": 76984, "epoch": 636} {"train_loss": -37.001258850097656, "global_step": 76985, "epoch": 636} {"train_loss": -36.484676361083984, "global_step": 76986, "epoch": 636} {"train_loss": -36.10056686401367, "global_step": 76987, "epoch": 636} {"train_loss": -36.78566360473633, "global_step": 76988, "epoch": 636} {"train_loss": -36.3612060546875, "global_step": 76989, "epoch": 636} {"train_loss": -36.7479248046875, "global_step": 76990, "epoch": 636} {"train_loss": -36.781654357910156, "global_step": 76991, "epoch": 636} {"train_loss": -36.73165512084961, "global_step": 76992, "epoch": 636} {"train_loss": -36.8277702331543, "global_step": 76993, "epoch": 636} {"train_loss": -36.441951751708984, "global_step": 76994, "epoch": 636} {"train_loss": -36.29585647583008, "global_step": 76995, "epoch": 636} {"train_loss": -36.61141586303711, "global_step": 76996, "epoch": 636} {"train_loss": -37.01983642578125, "global_step": 76997, "epoch": 636} {"train_loss": -36.13947677612305, "global_step": 76998, "epoch": 636} {"train_loss": -36.57770919799805, "global_step": 76999, "epoch": 636} {"train_loss": -36.448204040527344, "global_step": 77000, "epoch": 636} {"train_loss": -36.39908981323242, "global_step": 77001, "epoch": 636} {"train_loss": -37.153709411621094, "global_step": 77002, "epoch": 636} {"train_loss": -36.26420211791992, "global_step": 77003, "epoch": 636} {"train_loss": -36.42000961303711, "global_step": 77004, "epoch": 636} {"train_loss": -36.795616149902344, "global_step": 77005, "epoch": 636} {"train_loss": -36.93497848510742, "global_step": 77006, "epoch": 636} {"train_loss": -36.621429443359375, "global_step": 77007, "epoch": 636} {"train_loss": -36.928436279296875, "global_step": 77008, "epoch": 636} {"train_loss": -36.515594482421875, "global_step": 77009, "epoch": 636} {"train_loss": -36.75861740112305, "global_step": 77010, "epoch": 636} {"train_loss": -36.55916976928711, "global_step": 77011, "epoch": 636} {"train_loss": -36.96326446533203, "global_step": 77012, "epoch": 636} {"train_loss": -37.38681411743164, "global_step": 77013, "epoch": 636} {"train_loss": -36.836605072021484, "global_step": 77014, "epoch": 636} {"train_loss": -36.81541061401367, "global_step": 77015, "epoch": 636} {"train_loss": -36.49811553955078, "global_step": 77016, "epoch": 636} {"train_loss": -36.35377502441406, "global_step": 77017, "epoch": 636} {"train_loss": -35.2424430847168, "global_step": 77018, "epoch": 636} {"train_loss": -31.191883087158203, "global_step": 77019, "epoch": 636} {"train_loss": -20.549203872680664, "global_step": 77020, "epoch": 636} {"train_loss": -12.528830528259277, "global_step": 77021, "epoch": 636} {"train_loss": -19.73316764831543, "global_step": 77022, "epoch": 636} {"train_loss": -29.728687286376953, "global_step": 77023, "epoch": 636} {"train_loss": -29.47393226623535, "global_step": 77024, "epoch": 636} {"train_loss": -30.598388671875, "global_step": 77025, "epoch": 636} {"train_loss": -30.40532875061035, "global_step": 77026, "epoch": 636} {"train_loss": -32.94358825683594, "global_step": 77027, "epoch": 636} {"train_loss": -32.6153678894043, "global_step": 77028, "epoch": 636} {"train_loss": -33.42924118041992, "global_step": 77029, "epoch": 636} {"train_loss": -33.309566497802734, "global_step": 77030, "epoch": 636} {"train_loss": -33.95195770263672, "global_step": 77031, "epoch": 636} {"train_loss": -33.31724548339844, "global_step": 77032, "epoch": 636} {"train_loss": -34.35778045654297, "global_step": 77033, "epoch": 636} {"train_loss": -33.75301742553711, "global_step": 77034, "epoch": 636} {"train_loss": -34.28473663330078, "global_step": 77035, "epoch": 636} {"train_loss": -34.996726989746094, "global_step": 77036, "epoch": 636} {"train_loss": -34.13546371459961, "global_step": 77037, "epoch": 636} {"train_loss": -34.88608932495117, "global_step": 77038, "epoch": 636} {"train_loss": -34.44851303100586, "global_step": 77039, "epoch": 636} {"train_loss": -34.79297637939453, "global_step": 77040, "epoch": 636} {"train_loss": -35.15116500854492, "global_step": 77041, "epoch": 636} {"train_loss": -35.183837890625, "global_step": 77042, "epoch": 636} {"train_loss": -35.30087661743164, "global_step": 77043, "epoch": 636} {"train_loss": -35.32122039794922, "global_step": 77044, "epoch": 636} {"train_loss": -35.313819885253906, "global_step": 77045, "epoch": 636} {"train_loss": -34.89299392700195, "global_step": 77046, "epoch": 636} {"train_loss": -35.442054748535156, "global_step": 77047, "epoch": 636} {"train_loss": -35.62201690673828, "global_step": 77048, "epoch": 636} {"train_loss": -35.718082427978516, "global_step": 77049, "epoch": 636} {"train_loss": -35.527809143066406, "global_step": 77050, "epoch": 636} {"train_loss": -35.299285888671875, "global_step": 77051, "epoch": 636} {"train_loss": -35.74063491821289, "global_step": 77052, "epoch": 636} {"train_loss": -35.834075927734375, "global_step": 77053, "epoch": 636} {"train_loss": -35.98344421386719, "global_step": 77054, "epoch": 636} {"train_loss": -35.231834411621094, "global_step": 77055, "epoch": 636} {"train_loss": -36.09270477294922, "global_step": 77056, "epoch": 636} {"train_loss": -35.27743148803711, "global_step": 77057, "epoch": 636} {"train_loss": -36.194793701171875, "global_step": 77058, "epoch": 636} {"train_loss": -35.43855667114258, "global_step": 77059, "epoch": 636} {"train_loss": -35.741607666015625, "global_step": 77060, "epoch": 636} {"train_loss": -35.69377899169922, "global_step": 77061, "epoch": 636} {"train_loss": -36.00254440307617, "global_step": 77062, "epoch": 636} {"train_loss": -36.19533157348633, "global_step": 77063, "epoch": 636} {"train_loss": -36.22481918334961, "global_step": 77064, "epoch": 636} {"train_loss": -36.25501251220703, "global_step": 77065, "epoch": 636} {"train_loss": -36.29111099243164, "global_step": 77066, "epoch": 636} {"train_loss": -36.04641342163086, "global_step": 77067, "epoch": 636} {"train_loss": -35.9813117980957, "global_step": 77068, "epoch": 636} {"train_loss": -35.85077667236328, "global_step": 77069, "epoch": 636} {"train_loss": -36.138912200927734, "global_step": 77070, "epoch": 636} {"train_loss": -36.15890884399414, "global_step": 77071, "epoch": 636} {"train_loss": -36.374874114990234, "global_step": 77072, "epoch": 636} {"train_loss": -36.5308723449707, "global_step": 77073, "epoch": 636} {"train_loss": -36.34220504760742, "global_step": 77074, "epoch": 636} {"train_loss": -35.888580322265625, "global_step": 77075, "epoch": 636} {"train_loss": -35.17302186035913, "global_step": 77076, "epoch": 636, "val_loss": 2670395.25} {"train_loss": -36.53898239135742, "global_step": 77077, "epoch": 637} {"train_loss": -36.66191864013672, "global_step": 77078, "epoch": 637} {"train_loss": -36.758907318115234, "global_step": 77079, "epoch": 637} {"train_loss": -36.58683395385742, "global_step": 77080, "epoch": 637} {"train_loss": -36.8293571472168, "global_step": 77081, "epoch": 637} {"train_loss": -36.80530548095703, "global_step": 77082, "epoch": 637} {"train_loss": -36.993804931640625, "global_step": 77083, "epoch": 637} {"train_loss": -36.42184066772461, "global_step": 77084, "epoch": 637} {"train_loss": -36.874176025390625, "global_step": 77085, "epoch": 637} {"train_loss": -36.746986389160156, "global_step": 77086, "epoch": 637} {"train_loss": -37.08544921875, "global_step": 77087, "epoch": 637} {"train_loss": -37.08881759643555, "global_step": 77088, "epoch": 637} {"train_loss": -37.10200500488281, "global_step": 77089, "epoch": 637} {"train_loss": -37.13087463378906, "global_step": 77090, "epoch": 637} {"train_loss": -37.08506393432617, "global_step": 77091, "epoch": 637} {"train_loss": -37.46470260620117, "global_step": 77092, "epoch": 637} {"train_loss": -36.57035446166992, "global_step": 77093, "epoch": 637} {"train_loss": -36.1727409362793, "global_step": 77094, "epoch": 637} {"train_loss": -36.610721588134766, "global_step": 77095, "epoch": 637} {"train_loss": -36.93435287475586, "global_step": 77096, "epoch": 637} {"train_loss": -36.30327224731445, "global_step": 77097, "epoch": 637} {"train_loss": -35.743553161621094, "global_step": 77098, "epoch": 637} {"train_loss": -30.663625717163086, "global_step": 77099, "epoch": 637} {"train_loss": -25.793060302734375, "global_step": 77100, "epoch": 637} {"train_loss": -27.621875762939453, "global_step": 77101, "epoch": 637} {"train_loss": -36.352054595947266, "global_step": 77102, "epoch": 637} {"train_loss": -30.00217056274414, "global_step": 77103, "epoch": 637} {"train_loss": -33.58260726928711, "global_step": 77104, "epoch": 637} {"train_loss": -34.459529876708984, "global_step": 77105, "epoch": 637} {"train_loss": -34.525489807128906, "global_step": 77106, "epoch": 637} {"train_loss": -35.11642074584961, "global_step": 77107, "epoch": 637} {"train_loss": -35.30998611450195, "global_step": 77108, "epoch": 637} {"train_loss": -34.97295379638672, "global_step": 77109, "epoch": 637} {"train_loss": -35.31162643432617, "global_step": 77110, "epoch": 637} {"train_loss": -35.4488639831543, "global_step": 77111, "epoch": 637} {"train_loss": -36.4581413269043, "global_step": 77112, "epoch": 637} {"train_loss": -35.42714309692383, "global_step": 77113, "epoch": 637} {"train_loss": -36.391357421875, "global_step": 77114, "epoch": 637} {"train_loss": -35.93245315551758, "global_step": 77115, "epoch": 637} {"train_loss": -35.9893798828125, "global_step": 77116, "epoch": 637} {"train_loss": -36.47225570678711, "global_step": 77117, "epoch": 637} {"train_loss": -36.27958679199219, "global_step": 77118, "epoch": 637} {"train_loss": -36.218406677246094, "global_step": 77119, "epoch": 637} {"train_loss": -36.63932800292969, "global_step": 77120, "epoch": 637} {"train_loss": -36.290679931640625, "global_step": 77121, "epoch": 637} {"train_loss": -36.561580657958984, "global_step": 77122, "epoch": 637} {"train_loss": -36.98088455200195, "global_step": 77123, "epoch": 637} {"train_loss": -36.39223098754883, "global_step": 77124, "epoch": 637} {"train_loss": -35.843563079833984, "global_step": 77125, "epoch": 637} {"train_loss": -36.91484451293945, "global_step": 77126, "epoch": 637} {"train_loss": -35.7563591003418, "global_step": 77127, "epoch": 637} {"train_loss": -36.40340042114258, "global_step": 77128, "epoch": 637} {"train_loss": -36.42384719848633, "global_step": 77129, "epoch": 637} {"train_loss": -36.5196647644043, "global_step": 77130, "epoch": 637} {"train_loss": -36.641326904296875, "global_step": 77131, "epoch": 637} {"train_loss": -36.45246124267578, "global_step": 77132, "epoch": 637} {"train_loss": -36.94704818725586, "global_step": 77133, "epoch": 637} {"train_loss": -36.809940338134766, "global_step": 77134, "epoch": 637} {"train_loss": -36.175662994384766, "global_step": 77135, "epoch": 637} {"train_loss": -37.05735397338867, "global_step": 77136, "epoch": 637} {"train_loss": -36.54526901245117, "global_step": 77137, "epoch": 637} {"train_loss": -37.0288200378418, "global_step": 77138, "epoch": 637} {"train_loss": -36.94757080078125, "global_step": 77139, "epoch": 637} {"train_loss": -37.12085723876953, "global_step": 77140, "epoch": 637} {"train_loss": -36.97584533691406, "global_step": 77141, "epoch": 637} {"train_loss": -36.9373893737793, "global_step": 77142, "epoch": 637} {"train_loss": -36.869972229003906, "global_step": 77143, "epoch": 637} {"train_loss": -36.94187927246094, "global_step": 77144, "epoch": 637} {"train_loss": -37.03548049926758, "global_step": 77145, "epoch": 637} {"train_loss": -36.45194625854492, "global_step": 77146, "epoch": 637} {"train_loss": -36.456390380859375, "global_step": 77147, "epoch": 637} {"train_loss": -36.415863037109375, "global_step": 77148, "epoch": 637} {"train_loss": -37.29523468017578, "global_step": 77149, "epoch": 637} {"train_loss": -36.99005889892578, "global_step": 77150, "epoch": 637} {"train_loss": -35.614715576171875, "global_step": 77151, "epoch": 637} {"train_loss": -37.154396057128906, "global_step": 77152, "epoch": 637} {"train_loss": -36.54258346557617, "global_step": 77153, "epoch": 637} {"train_loss": -36.77840805053711, "global_step": 77154, "epoch": 637} {"train_loss": -36.19663619995117, "global_step": 77155, "epoch": 637} {"train_loss": -36.011653900146484, "global_step": 77156, "epoch": 637} {"train_loss": -37.10032272338867, "global_step": 77157, "epoch": 637} {"train_loss": -35.9510498046875, "global_step": 77158, "epoch": 637} {"train_loss": -37.119659423828125, "global_step": 77159, "epoch": 637} {"train_loss": -36.70682907104492, "global_step": 77160, "epoch": 637} {"train_loss": -36.92843246459961, "global_step": 77161, "epoch": 637} {"train_loss": -37.346397399902344, "global_step": 77162, "epoch": 637} {"train_loss": -36.592552185058594, "global_step": 77163, "epoch": 637} {"train_loss": -36.606910705566406, "global_step": 77164, "epoch": 637} {"train_loss": -36.37336730957031, "global_step": 77165, "epoch": 637} {"train_loss": -37.388545989990234, "global_step": 77166, "epoch": 637} {"train_loss": -37.60459518432617, "global_step": 77167, "epoch": 637} {"train_loss": -37.385711669921875, "global_step": 77168, "epoch": 637} {"train_loss": -37.2285270690918, "global_step": 77169, "epoch": 637} {"train_loss": -36.9972038269043, "global_step": 77170, "epoch": 637} {"train_loss": -36.80686569213867, "global_step": 77171, "epoch": 637} {"train_loss": -36.7381477355957, "global_step": 77172, "epoch": 637} {"train_loss": -37.23724365234375, "global_step": 77173, "epoch": 637} {"train_loss": -37.28474044799805, "global_step": 77174, "epoch": 637} {"train_loss": -37.51596450805664, "global_step": 77175, "epoch": 637} {"train_loss": -37.1553840637207, "global_step": 77176, "epoch": 637} {"train_loss": -36.44171905517578, "global_step": 77177, "epoch": 637} {"train_loss": -36.46368408203125, "global_step": 77178, "epoch": 637} {"train_loss": -35.22576904296875, "global_step": 77179, "epoch": 637} {"train_loss": -33.20143508911133, "global_step": 77180, "epoch": 637} {"train_loss": -31.741430282592773, "global_step": 77181, "epoch": 637} {"train_loss": -24.766855239868164, "global_step": 77182, "epoch": 637} {"train_loss": -30.238880157470703, "global_step": 77183, "epoch": 637} {"train_loss": -34.98716735839844, "global_step": 77184, "epoch": 637} {"train_loss": -30.950056076049805, "global_step": 77185, "epoch": 637} {"train_loss": -26.784326553344727, "global_step": 77186, "epoch": 637} {"train_loss": -29.794599533081055, "global_step": 77187, "epoch": 637} {"train_loss": -30.25282096862793, "global_step": 77188, "epoch": 637} {"train_loss": -32.86658477783203, "global_step": 77189, "epoch": 637} {"train_loss": -28.121442794799805, "global_step": 77190, "epoch": 637} {"train_loss": -32.04279708862305, "global_step": 77191, "epoch": 637} {"train_loss": -30.810943603515625, "global_step": 77192, "epoch": 637} {"train_loss": -32.487064361572266, "global_step": 77193, "epoch": 637} {"train_loss": -31.950620651245117, "global_step": 77194, "epoch": 637} {"train_loss": -32.435359954833984, "global_step": 77195, "epoch": 637} {"train_loss": -33.94605255126953, "global_step": 77196, "epoch": 637} {"train_loss": -35.462836825157986, "global_step": 77197, "epoch": 637, "val_loss": 2714820.25} {"train_loss": -32.881771087646484, "global_step": 77198, "epoch": 638} {"train_loss": -34.94318771362305, "global_step": 77199, "epoch": 638} {"train_loss": -34.7945556640625, "global_step": 77200, "epoch": 638} {"train_loss": -34.73579788208008, "global_step": 77201, "epoch": 638} {"train_loss": -35.22792053222656, "global_step": 77202, "epoch": 638} {"train_loss": -34.094852447509766, "global_step": 77203, "epoch": 638} {"train_loss": -35.63778305053711, "global_step": 77204, "epoch": 638} {"train_loss": -34.41581344604492, "global_step": 77205, "epoch": 638} {"train_loss": -35.791770935058594, "global_step": 77206, "epoch": 638} {"train_loss": -35.082359313964844, "global_step": 77207, "epoch": 638} {"train_loss": -35.80607223510742, "global_step": 77208, "epoch": 638} {"train_loss": -35.5034294128418, "global_step": 77209, "epoch": 638} {"train_loss": -35.972137451171875, "global_step": 77210, "epoch": 638} {"train_loss": -34.812984466552734, "global_step": 77211, "epoch": 638} {"train_loss": -36.35648727416992, "global_step": 77212, "epoch": 638} {"train_loss": -35.70820236206055, "global_step": 77213, "epoch": 638} {"train_loss": -35.91415786743164, "global_step": 77214, "epoch": 638} {"train_loss": -36.186222076416016, "global_step": 77215, "epoch": 638} {"train_loss": -36.14823532104492, "global_step": 77216, "epoch": 638} {"train_loss": -36.084842681884766, "global_step": 77217, "epoch": 638} {"train_loss": -36.5368766784668, "global_step": 77218, "epoch": 638} {"train_loss": -36.24221420288086, "global_step": 77219, "epoch": 638} {"train_loss": -36.4299201965332, "global_step": 77220, "epoch": 638} {"train_loss": -34.51161193847656, "global_step": 77221, "epoch": 638} {"train_loss": -36.422454833984375, "global_step": 77222, "epoch": 638} {"train_loss": -36.54671859741211, "global_step": 77223, "epoch": 638} {"train_loss": -36.92894744873047, "global_step": 77224, "epoch": 638} {"train_loss": -36.47587966918945, "global_step": 77225, "epoch": 638} {"train_loss": -37.15419387817383, "global_step": 77226, "epoch": 638} {"train_loss": -36.97459030151367, "global_step": 77227, "epoch": 638} {"train_loss": -35.36957550048828, "global_step": 77228, "epoch": 638} {"train_loss": -36.28297805786133, "global_step": 77229, "epoch": 638} {"train_loss": -36.05453109741211, "global_step": 77230, "epoch": 638} {"train_loss": -37.048824310302734, "global_step": 77231, "epoch": 638} {"train_loss": -37.056312561035156, "global_step": 77232, "epoch": 638} {"train_loss": -37.07645034790039, "global_step": 77233, "epoch": 638} {"train_loss": -36.4822998046875, "global_step": 77234, "epoch": 638} {"train_loss": -35.957008361816406, "global_step": 77235, "epoch": 638} {"train_loss": -36.9021110534668, "global_step": 77236, "epoch": 638} {"train_loss": -37.165714263916016, "global_step": 77237, "epoch": 638} {"train_loss": -37.3317756652832, "global_step": 77238, "epoch": 638} {"train_loss": -36.83321762084961, "global_step": 77239, "epoch": 638} {"train_loss": -36.56280517578125, "global_step": 77240, "epoch": 638} {"train_loss": -36.875030517578125, "global_step": 77241, "epoch": 638} {"train_loss": -37.21011734008789, "global_step": 77242, "epoch": 638} {"train_loss": -37.01300048828125, "global_step": 77243, "epoch": 638} {"train_loss": -36.98798370361328, "global_step": 77244, "epoch": 638} {"train_loss": -36.95381546020508, "global_step": 77245, "epoch": 638} {"train_loss": -37.66411209106445, "global_step": 77246, "epoch": 638} {"train_loss": -36.78556442260742, "global_step": 77247, "epoch": 638} {"train_loss": -37.4295768737793, "global_step": 77248, "epoch": 638} {"train_loss": -37.41229248046875, "global_step": 77249, "epoch": 638} {"train_loss": -36.96287155151367, "global_step": 77250, "epoch": 638} {"train_loss": -37.453834533691406, "global_step": 77251, "epoch": 638} {"train_loss": -37.19881057739258, "global_step": 77252, "epoch": 638} {"train_loss": -37.39887619018555, "global_step": 77253, "epoch": 638} {"train_loss": -37.35271072387695, "global_step": 77254, "epoch": 638} {"train_loss": -37.00448226928711, "global_step": 77255, "epoch": 638} {"train_loss": -37.56214141845703, "global_step": 77256, "epoch": 638} {"train_loss": -37.35893249511719, "global_step": 77257, "epoch": 638} {"train_loss": -37.565547943115234, "global_step": 77258, "epoch": 638} {"train_loss": -37.14296340942383, "global_step": 77259, "epoch": 638} {"train_loss": -37.52522277832031, "global_step": 77260, "epoch": 638} {"train_loss": -37.15039825439453, "global_step": 77261, "epoch": 638} {"train_loss": -37.56601333618164, "global_step": 77262, "epoch": 638} {"train_loss": -36.986629486083984, "global_step": 77263, "epoch": 638} {"train_loss": -37.056854248046875, "global_step": 77264, "epoch": 638} {"train_loss": -37.34640121459961, "global_step": 77265, "epoch": 638} {"train_loss": -37.6338996887207, "global_step": 77266, "epoch": 638} {"train_loss": -38.086280822753906, "global_step": 77267, "epoch": 638} {"train_loss": -37.367393493652344, "global_step": 77268, "epoch": 638} {"train_loss": -37.5184440612793, "global_step": 77269, "epoch": 638} {"train_loss": -37.4793701171875, "global_step": 77270, "epoch": 638} {"train_loss": -37.386112213134766, "global_step": 77271, "epoch": 638} {"train_loss": -37.34599685668945, "global_step": 77272, "epoch": 638} {"train_loss": -37.779354095458984, "global_step": 77273, "epoch": 638} {"train_loss": -37.9625129699707, "global_step": 77274, "epoch": 638} {"train_loss": -36.55424118041992, "global_step": 77275, "epoch": 638} {"train_loss": -36.44147872924805, "global_step": 77276, "epoch": 638} {"train_loss": -38.21165084838867, "global_step": 77277, "epoch": 638} {"train_loss": -37.664398193359375, "global_step": 77278, "epoch": 638} {"train_loss": -37.773040771484375, "global_step": 77279, "epoch": 638} {"train_loss": -37.685089111328125, "global_step": 77280, "epoch": 638} {"train_loss": -37.82220458984375, "global_step": 77281, "epoch": 638} {"train_loss": -37.54853439331055, "global_step": 77282, "epoch": 638} {"train_loss": -37.56589889526367, "global_step": 77283, "epoch": 638} {"train_loss": -37.57994842529297, "global_step": 77284, "epoch": 638} {"train_loss": -37.74519348144531, "global_step": 77285, "epoch": 638} {"train_loss": -38.07521057128906, "global_step": 77286, "epoch": 638} {"train_loss": -37.4667854309082, "global_step": 77287, "epoch": 638} {"train_loss": -38.245059967041016, "global_step": 77288, "epoch": 638} {"train_loss": -37.612552642822266, "global_step": 77289, "epoch": 638} {"train_loss": -37.23424530029297, "global_step": 77290, "epoch": 638} {"train_loss": -38.1577262878418, "global_step": 77291, "epoch": 638} {"train_loss": -37.03409957885742, "global_step": 77292, "epoch": 638} {"train_loss": -37.29322052001953, "global_step": 77293, "epoch": 638} {"train_loss": -37.66289138793945, "global_step": 77294, "epoch": 638} {"train_loss": -37.50672149658203, "global_step": 77295, "epoch": 638} {"train_loss": -37.19746017456055, "global_step": 77296, "epoch": 638} {"train_loss": -37.213191986083984, "global_step": 77297, "epoch": 638} {"train_loss": -37.79183578491211, "global_step": 77298, "epoch": 638} {"train_loss": -36.573360443115234, "global_step": 77299, "epoch": 638} {"train_loss": -37.45649337768555, "global_step": 77300, "epoch": 638} {"train_loss": -37.89670944213867, "global_step": 77301, "epoch": 638} {"train_loss": -34.90082931518555, "global_step": 77302, "epoch": 638} {"train_loss": -37.29669952392578, "global_step": 77303, "epoch": 638} {"train_loss": -37.1396369934082, "global_step": 77304, "epoch": 638} {"train_loss": -35.91963577270508, "global_step": 77305, "epoch": 638} {"train_loss": -29.854598999023438, "global_step": 77306, "epoch": 638} {"train_loss": -37.31991195678711, "global_step": 77307, "epoch": 638} {"train_loss": -36.89323806762695, "global_step": 77308, "epoch": 638} {"train_loss": -36.61783981323242, "global_step": 77309, "epoch": 638} {"train_loss": -33.26483154296875, "global_step": 77310, "epoch": 638} {"train_loss": -36.700897216796875, "global_step": 77311, "epoch": 638} {"train_loss": -35.79705047607422, "global_step": 77312, "epoch": 638} {"train_loss": -34.9936408996582, "global_step": 77313, "epoch": 638} {"train_loss": -35.59693145751953, "global_step": 77314, "epoch": 638} {"train_loss": -36.24266052246094, "global_step": 77315, "epoch": 638} {"train_loss": -34.05110168457031, "global_step": 77316, "epoch": 638} {"train_loss": -34.602081298828125, "global_step": 77317, "epoch": 638} {"train_loss": -36.62583488275197, "global_step": 77318, "epoch": 638, "val_loss": 3642390.0} {"train_loss": -34.05009078979492, "global_step": 77319, "epoch": 639} {"train_loss": -35.029476165771484, "global_step": 77320, "epoch": 639} {"train_loss": -35.7745475769043, "global_step": 77321, "epoch": 639} {"train_loss": -34.798091888427734, "global_step": 77322, "epoch": 639} {"train_loss": -34.8533821105957, "global_step": 77323, "epoch": 639} {"train_loss": -34.343467712402344, "global_step": 77324, "epoch": 639} {"train_loss": -36.5208625793457, "global_step": 77325, "epoch": 639} {"train_loss": -34.70866775512695, "global_step": 77326, "epoch": 639} {"train_loss": -35.66279983520508, "global_step": 77327, "epoch": 639} {"train_loss": -36.079002380371094, "global_step": 77328, "epoch": 639} {"train_loss": -35.0463981628418, "global_step": 77329, "epoch": 639} {"train_loss": -36.35645294189453, "global_step": 77330, "epoch": 639} {"train_loss": -31.64149284362793, "global_step": 77331, "epoch": 639} {"train_loss": -19.236923217773438, "global_step": 77332, "epoch": 639} {"train_loss": -36.359046936035156, "global_step": 77333, "epoch": 639} {"train_loss": -35.58069610595703, "global_step": 77334, "epoch": 639} {"train_loss": -21.55923843383789, "global_step": 77335, "epoch": 639} {"train_loss": -35.1005973815918, "global_step": 77336, "epoch": 639} {"train_loss": -23.70275115966797, "global_step": 77337, "epoch": 639} {"train_loss": -32.231563568115234, "global_step": 77338, "epoch": 639} {"train_loss": -14.33531665802002, "global_step": 77339, "epoch": 639} {"train_loss": -32.65670394897461, "global_step": 77340, "epoch": 639} {"train_loss": -32.40340805053711, "global_step": 77341, "epoch": 639} {"train_loss": -32.2412109375, "global_step": 77342, "epoch": 639} {"train_loss": -28.73179054260254, "global_step": 77343, "epoch": 639} {"train_loss": -27.2818603515625, "global_step": 77344, "epoch": 639} {"train_loss": -31.21624755859375, "global_step": 77345, "epoch": 639} {"train_loss": -30.964466094970703, "global_step": 77346, "epoch": 639} {"train_loss": -31.860034942626953, "global_step": 77347, "epoch": 639} {"train_loss": -31.529855728149414, "global_step": 77348, "epoch": 639} {"train_loss": -33.06538009643555, "global_step": 77349, "epoch": 639} {"train_loss": -31.506677627563477, "global_step": 77350, "epoch": 639} {"train_loss": -30.7030086517334, "global_step": 77351, "epoch": 639} {"train_loss": -32.788490295410156, "global_step": 77352, "epoch": 639} {"train_loss": -32.49205017089844, "global_step": 77353, "epoch": 639} {"train_loss": -33.7713737487793, "global_step": 77354, "epoch": 639} {"train_loss": -31.813756942749023, "global_step": 77355, "epoch": 639} {"train_loss": -33.96273422241211, "global_step": 77356, "epoch": 639} {"train_loss": -32.85830307006836, "global_step": 77357, "epoch": 639} {"train_loss": -33.61201858520508, "global_step": 77358, "epoch": 639} {"train_loss": -32.388084411621094, "global_step": 77359, "epoch": 639} {"train_loss": -33.16278076171875, "global_step": 77360, "epoch": 639} {"train_loss": -33.83623123168945, "global_step": 77361, "epoch": 639} {"train_loss": -33.20811080932617, "global_step": 77362, "epoch": 639} {"train_loss": -33.51437759399414, "global_step": 77363, "epoch": 639} {"train_loss": -32.126827239990234, "global_step": 77364, "epoch": 639} {"train_loss": -31.67340087890625, "global_step": 77365, "epoch": 639} {"train_loss": -33.99946975708008, "global_step": 77366, "epoch": 639} {"train_loss": -33.77022171020508, "global_step": 77367, "epoch": 639} {"train_loss": -34.36044692993164, "global_step": 77368, "epoch": 639} {"train_loss": -33.942989349365234, "global_step": 77369, "epoch": 639} {"train_loss": -34.29398727416992, "global_step": 77370, "epoch": 639} {"train_loss": -34.365447998046875, "global_step": 77371, "epoch": 639} {"train_loss": -34.14596176147461, "global_step": 77372, "epoch": 639} {"train_loss": -33.50405502319336, "global_step": 77373, "epoch": 639} {"train_loss": -33.51415252685547, "global_step": 77374, "epoch": 639} {"train_loss": -33.353336334228516, "global_step": 77375, "epoch": 639} {"train_loss": -34.294551849365234, "global_step": 77376, "epoch": 639} {"train_loss": -34.44399642944336, "global_step": 77377, "epoch": 639} {"train_loss": -34.38465118408203, "global_step": 77378, "epoch": 639} {"train_loss": -34.73162841796875, "global_step": 77379, "epoch": 639} {"train_loss": -34.26620101928711, "global_step": 77380, "epoch": 639} {"train_loss": -34.12755584716797, "global_step": 77381, "epoch": 639} {"train_loss": -34.644290924072266, "global_step": 77382, "epoch": 639} {"train_loss": -34.9019775390625, "global_step": 77383, "epoch": 639} {"train_loss": -35.142433166503906, "global_step": 77384, "epoch": 639} {"train_loss": -35.29120635986328, "global_step": 77385, "epoch": 639} {"train_loss": -34.671504974365234, "global_step": 77386, "epoch": 639} {"train_loss": -35.398250579833984, "global_step": 77387, "epoch": 639} {"train_loss": -34.07809066772461, "global_step": 77388, "epoch": 639} {"train_loss": -35.28152084350586, "global_step": 77389, "epoch": 639} {"train_loss": -35.257076263427734, "global_step": 77390, "epoch": 639} {"train_loss": -35.35470199584961, "global_step": 77391, "epoch": 639} {"train_loss": -35.77634811401367, "global_step": 77392, "epoch": 639} {"train_loss": -34.27834701538086, "global_step": 77393, "epoch": 639} {"train_loss": -35.49570846557617, "global_step": 77394, "epoch": 639} {"train_loss": -35.3726921081543, "global_step": 77395, "epoch": 639} {"train_loss": -35.737335205078125, "global_step": 77396, "epoch": 639} {"train_loss": -35.32085418701172, "global_step": 77397, "epoch": 639} {"train_loss": -35.76046371459961, "global_step": 77398, "epoch": 639} {"train_loss": -36.21672439575195, "global_step": 77399, "epoch": 639} {"train_loss": -35.69856262207031, "global_step": 77400, "epoch": 639} {"train_loss": -35.746429443359375, "global_step": 77401, "epoch": 639} {"train_loss": -35.56983184814453, "global_step": 77402, "epoch": 639} {"train_loss": -35.625789642333984, "global_step": 77403, "epoch": 639} {"train_loss": -35.68415451049805, "global_step": 77404, "epoch": 639} {"train_loss": -35.37346649169922, "global_step": 77405, "epoch": 639} {"train_loss": -35.46308517456055, "global_step": 77406, "epoch": 639} {"train_loss": -35.79819107055664, "global_step": 77407, "epoch": 639} {"train_loss": -36.51961898803711, "global_step": 77408, "epoch": 639} {"train_loss": -36.26906967163086, "global_step": 77409, "epoch": 639} {"train_loss": -35.95670700073242, "global_step": 77410, "epoch": 639} {"train_loss": -35.729793548583984, "global_step": 77411, "epoch": 639} {"train_loss": -36.45012664794922, "global_step": 77412, "epoch": 639} {"train_loss": -35.8060188293457, "global_step": 77413, "epoch": 639} {"train_loss": -36.00570297241211, "global_step": 77414, "epoch": 639} {"train_loss": -36.129371643066406, "global_step": 77415, "epoch": 639} {"train_loss": -35.44150161743164, "global_step": 77416, "epoch": 639} {"train_loss": -36.34403610229492, "global_step": 77417, "epoch": 639} {"train_loss": -36.365901947021484, "global_step": 77418, "epoch": 639} {"train_loss": -36.478599548339844, "global_step": 77419, "epoch": 639} {"train_loss": -36.656063079833984, "global_step": 77420, "epoch": 639} {"train_loss": -36.58681106567383, "global_step": 77421, "epoch": 639} {"train_loss": -36.4901237487793, "global_step": 77422, "epoch": 639} {"train_loss": -35.51527404785156, "global_step": 77423, "epoch": 639} {"train_loss": -36.83871841430664, "global_step": 77424, "epoch": 639} {"train_loss": -35.70598220825195, "global_step": 77425, "epoch": 639} {"train_loss": -35.811424255371094, "global_step": 77426, "epoch": 639} {"train_loss": -36.287818908691406, "global_step": 77427, "epoch": 639} {"train_loss": -35.81218338012695, "global_step": 77428, "epoch": 639} {"train_loss": -35.428401947021484, "global_step": 77429, "epoch": 639} {"train_loss": -35.73585510253906, "global_step": 77430, "epoch": 639} {"train_loss": -35.609004974365234, "global_step": 77431, "epoch": 639} {"train_loss": -35.81692123413086, "global_step": 77432, "epoch": 639} {"train_loss": -36.292396545410156, "global_step": 77433, "epoch": 639} {"train_loss": -35.68800735473633, "global_step": 77434, "epoch": 639} {"train_loss": -35.35860061645508, "global_step": 77435, "epoch": 639} {"train_loss": -36.3592414855957, "global_step": 77436, "epoch": 639} {"train_loss": -34.92509078979492, "global_step": 77437, "epoch": 639} {"train_loss": -36.592872619628906, "global_step": 77438, "epoch": 639} {"train_loss": -34.10447895428366, "global_step": 77439, "epoch": 639, "val_loss": 2685046.75} {"train_loss": -37.000091552734375, "global_step": 77440, "epoch": 640} {"train_loss": -36.57517623901367, "global_step": 77441, "epoch": 640} {"train_loss": -37.021907806396484, "global_step": 77442, "epoch": 640} {"train_loss": -36.6295280456543, "global_step": 77443, "epoch": 640} {"train_loss": -36.538291931152344, "global_step": 77444, "epoch": 640} {"train_loss": -35.0258903503418, "global_step": 77445, "epoch": 640} {"train_loss": -34.80245590209961, "global_step": 77446, "epoch": 640} {"train_loss": -36.50791549682617, "global_step": 77447, "epoch": 640} {"train_loss": -35.95804214477539, "global_step": 77448, "epoch": 640} {"train_loss": -35.960994720458984, "global_step": 77449, "epoch": 640} {"train_loss": -36.177650451660156, "global_step": 77450, "epoch": 640} {"train_loss": -37.22249984741211, "global_step": 77451, "epoch": 640} {"train_loss": -35.65437698364258, "global_step": 77452, "epoch": 640} {"train_loss": -36.94404983520508, "global_step": 77453, "epoch": 640} {"train_loss": -36.31294631958008, "global_step": 77454, "epoch": 640} {"train_loss": -35.78321075439453, "global_step": 77455, "epoch": 640} {"train_loss": -37.36757278442383, "global_step": 77456, "epoch": 640} {"train_loss": -36.29209518432617, "global_step": 77457, "epoch": 640} {"train_loss": -37.23060989379883, "global_step": 77458, "epoch": 640} {"train_loss": -37.15910720825195, "global_step": 77459, "epoch": 640} {"train_loss": -37.13656234741211, "global_step": 77460, "epoch": 640} {"train_loss": -36.77499008178711, "global_step": 77461, "epoch": 640} {"train_loss": -36.91199493408203, "global_step": 77462, "epoch": 640} {"train_loss": -37.10198974609375, "global_step": 77463, "epoch": 640} {"train_loss": -36.73439407348633, "global_step": 77464, "epoch": 640} {"train_loss": -37.24586486816406, "global_step": 77465, "epoch": 640} {"train_loss": -37.07558822631836, "global_step": 77466, "epoch": 640} {"train_loss": -37.204994201660156, "global_step": 77467, "epoch": 640} {"train_loss": -36.9705696105957, "global_step": 77468, "epoch": 640} {"train_loss": -36.312007904052734, "global_step": 77469, "epoch": 640} {"train_loss": -35.783382415771484, "global_step": 77470, "epoch": 640} {"train_loss": -32.44019317626953, "global_step": 77471, "epoch": 640} {"train_loss": -33.44173049926758, "global_step": 77472, "epoch": 640} {"train_loss": -35.951385498046875, "global_step": 77473, "epoch": 640} {"train_loss": -31.116384506225586, "global_step": 77474, "epoch": 640} {"train_loss": -33.654510498046875, "global_step": 77475, "epoch": 640} {"train_loss": -36.99869918823242, "global_step": 77476, "epoch": 640} {"train_loss": -34.520870208740234, "global_step": 77477, "epoch": 640} {"train_loss": -35.82417297363281, "global_step": 77478, "epoch": 640} {"train_loss": -34.43300247192383, "global_step": 77479, "epoch": 640} {"train_loss": -36.091453552246094, "global_step": 77480, "epoch": 640} {"train_loss": -37.12064743041992, "global_step": 77481, "epoch": 640} {"train_loss": -36.047122955322266, "global_step": 77482, "epoch": 640} {"train_loss": -35.93950271606445, "global_step": 77483, "epoch": 640} {"train_loss": -37.068145751953125, "global_step": 77484, "epoch": 640} {"train_loss": -36.74448776245117, "global_step": 77485, "epoch": 640} {"train_loss": -36.968955993652344, "global_step": 77486, "epoch": 640} {"train_loss": -36.427764892578125, "global_step": 77487, "epoch": 640} {"train_loss": -37.15553665161133, "global_step": 77488, "epoch": 640} {"train_loss": -37.432647705078125, "global_step": 77489, "epoch": 640} {"train_loss": -36.97573471069336, "global_step": 77490, "epoch": 640} {"train_loss": -36.65431213378906, "global_step": 77491, "epoch": 640} {"train_loss": -37.107295989990234, "global_step": 77492, "epoch": 640} {"train_loss": -36.86439514160156, "global_step": 77493, "epoch": 640} {"train_loss": -36.79506301879883, "global_step": 77494, "epoch": 640} {"train_loss": -36.46847152709961, "global_step": 77495, "epoch": 640} {"train_loss": -37.09757614135742, "global_step": 77496, "epoch": 640} {"train_loss": -36.94163513183594, "global_step": 77497, "epoch": 640} {"train_loss": -36.94404983520508, "global_step": 77498, "epoch": 640} {"train_loss": -37.62874221801758, "global_step": 77499, "epoch": 640} {"train_loss": -37.65684127807617, "global_step": 77500, "epoch": 640} {"train_loss": -37.488887786865234, "global_step": 77501, "epoch": 640} {"train_loss": -36.98628616333008, "global_step": 77502, "epoch": 640} {"train_loss": -37.494895935058594, "global_step": 77503, "epoch": 640} {"train_loss": -37.52598190307617, "global_step": 77504, "epoch": 640} {"train_loss": -37.333370208740234, "global_step": 77505, "epoch": 640} {"train_loss": -37.83771896362305, "global_step": 77506, "epoch": 640} {"train_loss": -36.93392562866211, "global_step": 77507, "epoch": 640} {"train_loss": -37.29038619995117, "global_step": 77508, "epoch": 640} {"train_loss": -37.184139251708984, "global_step": 77509, "epoch": 640} {"train_loss": -37.554115295410156, "global_step": 77510, "epoch": 640} {"train_loss": -36.9708251953125, "global_step": 77511, "epoch": 640} {"train_loss": -37.5026741027832, "global_step": 77512, "epoch": 640} {"train_loss": -37.46688461303711, "global_step": 77513, "epoch": 640} {"train_loss": -37.51523971557617, "global_step": 77514, "epoch": 640} {"train_loss": -37.328224182128906, "global_step": 77515, "epoch": 640} {"train_loss": -38.10736846923828, "global_step": 77516, "epoch": 640} {"train_loss": -38.239418029785156, "global_step": 77517, "epoch": 640} {"train_loss": -37.20048141479492, "global_step": 77518, "epoch": 640} {"train_loss": -37.201873779296875, "global_step": 77519, "epoch": 640} {"train_loss": -37.613094329833984, "global_step": 77520, "epoch": 640} {"train_loss": -37.49225997924805, "global_step": 77521, "epoch": 640} {"train_loss": -37.2308349609375, "global_step": 77522, "epoch": 640} {"train_loss": -36.52650833129883, "global_step": 77523, "epoch": 640} {"train_loss": -37.581886291503906, "global_step": 77524, "epoch": 640} {"train_loss": -37.93853759765625, "global_step": 77525, "epoch": 640} {"train_loss": -37.172481536865234, "global_step": 77526, "epoch": 640} {"train_loss": -37.45436096191406, "global_step": 77527, "epoch": 640} {"train_loss": -37.37385940551758, "global_step": 77528, "epoch": 640} {"train_loss": -36.466121673583984, "global_step": 77529, "epoch": 640} {"train_loss": -35.97623825073242, "global_step": 77530, "epoch": 640} {"train_loss": -36.19770812988281, "global_step": 77531, "epoch": 640} {"train_loss": -35.42352294921875, "global_step": 77532, "epoch": 640} {"train_loss": -36.4312629699707, "global_step": 77533, "epoch": 640} {"train_loss": -36.89631652832031, "global_step": 77534, "epoch": 640} {"train_loss": -37.61818313598633, "global_step": 77535, "epoch": 640} {"train_loss": -35.059539794921875, "global_step": 77536, "epoch": 640} {"train_loss": -32.66445541381836, "global_step": 77537, "epoch": 640} {"train_loss": -36.61615753173828, "global_step": 77538, "epoch": 640} {"train_loss": -35.840484619140625, "global_step": 77539, "epoch": 640} {"train_loss": -31.094308853149414, "global_step": 77540, "epoch": 640} {"train_loss": -32.56022262573242, "global_step": 77541, "epoch": 640} {"train_loss": -34.08186721801758, "global_step": 77542, "epoch": 640} {"train_loss": -35.17183303833008, "global_step": 77543, "epoch": 640} {"train_loss": -31.917316436767578, "global_step": 77544, "epoch": 640} {"train_loss": -35.233978271484375, "global_step": 77545, "epoch": 640} {"train_loss": -34.84382247924805, "global_step": 77546, "epoch": 640} {"train_loss": -34.08846664428711, "global_step": 77547, "epoch": 640} {"train_loss": -34.920284271240234, "global_step": 77548, "epoch": 640} {"train_loss": -33.82273483276367, "global_step": 77549, "epoch": 640} {"train_loss": -36.682701110839844, "global_step": 77550, "epoch": 640} {"train_loss": -35.257789611816406, "global_step": 77551, "epoch": 640} {"train_loss": -35.43839645385742, "global_step": 77552, "epoch": 640} {"train_loss": -34.88677215576172, "global_step": 77553, "epoch": 640} {"train_loss": -35.994728088378906, "global_step": 77554, "epoch": 640} {"train_loss": -35.398189544677734, "global_step": 77555, "epoch": 640} {"train_loss": -36.083106994628906, "global_step": 77556, "epoch": 640} {"train_loss": -34.73836135864258, "global_step": 77557, "epoch": 640} {"train_loss": -35.1145133972168, "global_step": 77558, "epoch": 640} {"train_loss": -36.17898178100586, "global_step": 77559, "epoch": 640} {"train_loss": -36.253633294223754, "global_step": 77560, "epoch": 640, "val_loss": 2714312.75} {"train_loss": -30.18695640563965, "global_step": 77561, "epoch": 641} {"train_loss": -33.466156005859375, "global_step": 77562, "epoch": 641} {"train_loss": -34.63761520385742, "global_step": 77563, "epoch": 641} {"train_loss": -34.26291275024414, "global_step": 77564, "epoch": 641} {"train_loss": -33.31074142456055, "global_step": 77565, "epoch": 641} {"train_loss": -32.93052291870117, "global_step": 77566, "epoch": 641} {"train_loss": -35.11444854736328, "global_step": 77567, "epoch": 641} {"train_loss": -33.62348175048828, "global_step": 77568, "epoch": 641} {"train_loss": -33.36415481567383, "global_step": 77569, "epoch": 641} {"train_loss": -33.40587615966797, "global_step": 77570, "epoch": 641} {"train_loss": -34.312137603759766, "global_step": 77571, "epoch": 641} {"train_loss": -34.04561996459961, "global_step": 77572, "epoch": 641} {"train_loss": -34.889156341552734, "global_step": 77573, "epoch": 641} {"train_loss": -34.18989181518555, "global_step": 77574, "epoch": 641} {"train_loss": -33.71921920776367, "global_step": 77575, "epoch": 641} {"train_loss": -35.677066802978516, "global_step": 77576, "epoch": 641} {"train_loss": -33.163795471191406, "global_step": 77577, "epoch": 641} {"train_loss": -35.35995101928711, "global_step": 77578, "epoch": 641} {"train_loss": -35.6182975769043, "global_step": 77579, "epoch": 641} {"train_loss": -33.30805587768555, "global_step": 77580, "epoch": 641} {"train_loss": -34.162052154541016, "global_step": 77581, "epoch": 641} {"train_loss": -35.16529846191406, "global_step": 77582, "epoch": 641} {"train_loss": -35.5954475402832, "global_step": 77583, "epoch": 641} {"train_loss": -35.143402099609375, "global_step": 77584, "epoch": 641} {"train_loss": -35.16943359375, "global_step": 77585, "epoch": 641} {"train_loss": -35.443477630615234, "global_step": 77586, "epoch": 641} {"train_loss": -34.796173095703125, "global_step": 77587, "epoch": 641} {"train_loss": -35.26734924316406, "global_step": 77588, "epoch": 641} {"train_loss": -35.64223861694336, "global_step": 77589, "epoch": 641} {"train_loss": -35.48286056518555, "global_step": 77590, "epoch": 641} {"train_loss": -35.73263931274414, "global_step": 77591, "epoch": 641} {"train_loss": -33.70090866088867, "global_step": 77592, "epoch": 641} {"train_loss": -35.69704818725586, "global_step": 77593, "epoch": 641} {"train_loss": -35.551025390625, "global_step": 77594, "epoch": 641} {"train_loss": -35.839290618896484, "global_step": 77595, "epoch": 641} {"train_loss": -36.132293701171875, "global_step": 77596, "epoch": 641} {"train_loss": -36.16666793823242, "global_step": 77597, "epoch": 641} {"train_loss": -35.43513488769531, "global_step": 77598, "epoch": 641} {"train_loss": -35.53861618041992, "global_step": 77599, "epoch": 641} {"train_loss": -36.037017822265625, "global_step": 77600, "epoch": 641} {"train_loss": -35.6342658996582, "global_step": 77601, "epoch": 641} {"train_loss": -36.07682418823242, "global_step": 77602, "epoch": 641} {"train_loss": -36.45052719116211, "global_step": 77603, "epoch": 641} {"train_loss": -36.35052490234375, "global_step": 77604, "epoch": 641} {"train_loss": -35.95906448364258, "global_step": 77605, "epoch": 641} {"train_loss": -36.5427131652832, "global_step": 77606, "epoch": 641} {"train_loss": -36.29363250732422, "global_step": 77607, "epoch": 641} {"train_loss": -36.439727783203125, "global_step": 77608, "epoch": 641} {"train_loss": -36.564605712890625, "global_step": 77609, "epoch": 641} {"train_loss": -35.94140625, "global_step": 77610, "epoch": 641} {"train_loss": -36.58315658569336, "global_step": 77611, "epoch": 641} {"train_loss": -36.51959991455078, "global_step": 77612, "epoch": 641} {"train_loss": -36.35537338256836, "global_step": 77613, "epoch": 641} {"train_loss": -36.50532150268555, "global_step": 77614, "epoch": 641} {"train_loss": -36.34040451049805, "global_step": 77615, "epoch": 641} {"train_loss": -36.61509704589844, "global_step": 77616, "epoch": 641} {"train_loss": -36.87966537475586, "global_step": 77617, "epoch": 641} {"train_loss": -36.817989349365234, "global_step": 77618, "epoch": 641} {"train_loss": -36.88369369506836, "global_step": 77619, "epoch": 641} {"train_loss": -36.25242614746094, "global_step": 77620, "epoch": 641} {"train_loss": -36.42635726928711, "global_step": 77621, "epoch": 641} {"train_loss": -36.94655990600586, "global_step": 77622, "epoch": 641} {"train_loss": -36.553558349609375, "global_step": 77623, "epoch": 641} {"train_loss": -36.290130615234375, "global_step": 77624, "epoch": 641} {"train_loss": -37.02512741088867, "global_step": 77625, "epoch": 641} {"train_loss": -36.495357513427734, "global_step": 77626, "epoch": 641} {"train_loss": -36.369873046875, "global_step": 77627, "epoch": 641} {"train_loss": -35.76776123046875, "global_step": 77628, "epoch": 641} {"train_loss": -36.54351806640625, "global_step": 77629, "epoch": 641} {"train_loss": -37.1458740234375, "global_step": 77630, "epoch": 641} {"train_loss": -36.013668060302734, "global_step": 77631, "epoch": 641} {"train_loss": -36.590763092041016, "global_step": 77632, "epoch": 641} {"train_loss": -37.09552764892578, "global_step": 77633, "epoch": 641} {"train_loss": -37.125144958496094, "global_step": 77634, "epoch": 641} {"train_loss": -36.68830108642578, "global_step": 77635, "epoch": 641} {"train_loss": -37.09584426879883, "global_step": 77636, "epoch": 641} {"train_loss": -37.394630432128906, "global_step": 77637, "epoch": 641} {"train_loss": -36.46050262451172, "global_step": 77638, "epoch": 641} {"train_loss": -36.99421310424805, "global_step": 77639, "epoch": 641} {"train_loss": -36.519309997558594, "global_step": 77640, "epoch": 641} {"train_loss": -35.981605529785156, "global_step": 77641, "epoch": 641} {"train_loss": -36.52254867553711, "global_step": 77642, "epoch": 641} {"train_loss": -36.742919921875, "global_step": 77643, "epoch": 641} {"train_loss": -37.125587463378906, "global_step": 77644, "epoch": 641} {"train_loss": -36.65198516845703, "global_step": 77645, "epoch": 641} {"train_loss": -36.816280364990234, "global_step": 77646, "epoch": 641} {"train_loss": -37.78083419799805, "global_step": 77647, "epoch": 641} {"train_loss": -37.485076904296875, "global_step": 77648, "epoch": 641} {"train_loss": -37.04008865356445, "global_step": 77649, "epoch": 641} {"train_loss": -35.63441848754883, "global_step": 77650, "epoch": 641} {"train_loss": -29.003570556640625, "global_step": 77651, "epoch": 641} {"train_loss": -20.97761344909668, "global_step": 77652, "epoch": 641} {"train_loss": -19.58493423461914, "global_step": 77653, "epoch": 641} {"train_loss": -31.516752243041992, "global_step": 77654, "epoch": 641} {"train_loss": -33.25343704223633, "global_step": 77655, "epoch": 641} {"train_loss": -26.561079025268555, "global_step": 77656, "epoch": 641} {"train_loss": -36.23152542114258, "global_step": 77657, "epoch": 641} {"train_loss": -29.292516708374023, "global_step": 77658, "epoch": 641} {"train_loss": -35.65174102783203, "global_step": 77659, "epoch": 641} {"train_loss": -31.183761596679688, "global_step": 77660, "epoch": 641} {"train_loss": -35.374542236328125, "global_step": 77661, "epoch": 641} {"train_loss": -34.58909606933594, "global_step": 77662, "epoch": 641} {"train_loss": -33.1562614440918, "global_step": 77663, "epoch": 641} {"train_loss": -36.5472412109375, "global_step": 77664, "epoch": 641} {"train_loss": -35.592567443847656, "global_step": 77665, "epoch": 641} {"train_loss": -34.03614807128906, "global_step": 77666, "epoch": 641} {"train_loss": -36.535423278808594, "global_step": 77667, "epoch": 641} {"train_loss": -35.911190032958984, "global_step": 77668, "epoch": 641} {"train_loss": -34.6793327331543, "global_step": 77669, "epoch": 641} {"train_loss": -35.826622009277344, "global_step": 77670, "epoch": 641} {"train_loss": -36.20545196533203, "global_step": 77671, "epoch": 641} {"train_loss": -35.99306869506836, "global_step": 77672, "epoch": 641} {"train_loss": -35.823238372802734, "global_step": 77673, "epoch": 641} {"train_loss": -36.56112289428711, "global_step": 77674, "epoch": 641} {"train_loss": -37.41497802734375, "global_step": 77675, "epoch": 641} {"train_loss": -36.197505950927734, "global_step": 77676, "epoch": 641} {"train_loss": -36.86077880859375, "global_step": 77677, "epoch": 641} {"train_loss": -36.54510498046875, "global_step": 77678, "epoch": 641} {"train_loss": -36.570430755615234, "global_step": 77679, "epoch": 641} {"train_loss": -36.83064651489258, "global_step": 77680, "epoch": 641} {"train_loss": -35.22954485239076, "global_step": 77681, "epoch": 641, "val_loss": 2631089.75} {"train_loss": -36.875389099121094, "global_step": 77682, "epoch": 642} {"train_loss": -36.60700225830078, "global_step": 77683, "epoch": 642} {"train_loss": -36.99440002441406, "global_step": 77684, "epoch": 642} {"train_loss": -36.75056076049805, "global_step": 77685, "epoch": 642} {"train_loss": -37.05078887939453, "global_step": 77686, "epoch": 642} {"train_loss": -37.11857604980469, "global_step": 77687, "epoch": 642} {"train_loss": -37.211761474609375, "global_step": 77688, "epoch": 642} {"train_loss": -36.8803596496582, "global_step": 77689, "epoch": 642} {"train_loss": -37.362586975097656, "global_step": 77690, "epoch": 642} {"train_loss": -37.342681884765625, "global_step": 77691, "epoch": 642} {"train_loss": -37.39748001098633, "global_step": 77692, "epoch": 642} {"train_loss": -36.81654739379883, "global_step": 77693, "epoch": 642} {"train_loss": -37.64653396606445, "global_step": 77694, "epoch": 642} {"train_loss": -36.82039260864258, "global_step": 77695, "epoch": 642} {"train_loss": -37.40428161621094, "global_step": 77696, "epoch": 642} {"train_loss": -37.26284408569336, "global_step": 77697, "epoch": 642} {"train_loss": -37.484615325927734, "global_step": 77698, "epoch": 642} {"train_loss": -37.616363525390625, "global_step": 77699, "epoch": 642} {"train_loss": -37.8511962890625, "global_step": 77700, "epoch": 642} {"train_loss": -37.7932014465332, "global_step": 77701, "epoch": 642} {"train_loss": -37.6359977722168, "global_step": 77702, "epoch": 642} {"train_loss": -37.69106674194336, "global_step": 77703, "epoch": 642} {"train_loss": -37.54767608642578, "global_step": 77704, "epoch": 642} {"train_loss": -37.876930236816406, "global_step": 77705, "epoch": 642} {"train_loss": -37.82645797729492, "global_step": 77706, "epoch": 642} {"train_loss": -37.61077880859375, "global_step": 77707, "epoch": 642} {"train_loss": -37.834312438964844, "global_step": 77708, "epoch": 642} {"train_loss": -37.89017105102539, "global_step": 77709, "epoch": 642} {"train_loss": -37.23260498046875, "global_step": 77710, "epoch": 642} {"train_loss": -37.809078216552734, "global_step": 77711, "epoch": 642} {"train_loss": -37.747657775878906, "global_step": 77712, "epoch": 642} {"train_loss": -37.428077697753906, "global_step": 77713, "epoch": 642} {"train_loss": -37.66718673706055, "global_step": 77714, "epoch": 642} {"train_loss": -37.8775749206543, "global_step": 77715, "epoch": 642} {"train_loss": -37.721492767333984, "global_step": 77716, "epoch": 642} {"train_loss": -37.68017578125, "global_step": 77717, "epoch": 642} {"train_loss": -37.938289642333984, "global_step": 77718, "epoch": 642} {"train_loss": -38.08641815185547, "global_step": 77719, "epoch": 642} {"train_loss": -37.92246627807617, "global_step": 77720, "epoch": 642} {"train_loss": -37.351173400878906, "global_step": 77721, "epoch": 642} {"train_loss": -37.92790603637695, "global_step": 77722, "epoch": 642} {"train_loss": -36.862884521484375, "global_step": 77723, "epoch": 642} {"train_loss": -36.4212646484375, "global_step": 77724, "epoch": 642} {"train_loss": -35.36880111694336, "global_step": 77725, "epoch": 642} {"train_loss": -34.61985778808594, "global_step": 77726, "epoch": 642} {"train_loss": -31.558216094970703, "global_step": 77727, "epoch": 642} {"train_loss": -27.142385482788086, "global_step": 77728, "epoch": 642} {"train_loss": -25.061100006103516, "global_step": 77729, "epoch": 642} {"train_loss": -29.431232452392578, "global_step": 77730, "epoch": 642} {"train_loss": -33.842613220214844, "global_step": 77731, "epoch": 642} {"train_loss": -34.57575225830078, "global_step": 77732, "epoch": 642} {"train_loss": -34.2114143371582, "global_step": 77733, "epoch": 642} {"train_loss": -34.80694580078125, "global_step": 77734, "epoch": 642} {"train_loss": -31.516357421875, "global_step": 77735, "epoch": 642} {"train_loss": -36.265132904052734, "global_step": 77736, "epoch": 642} {"train_loss": -34.45562744140625, "global_step": 77737, "epoch": 642} {"train_loss": -36.00535202026367, "global_step": 77738, "epoch": 642} {"train_loss": -34.81284713745117, "global_step": 77739, "epoch": 642} {"train_loss": -36.249961853027344, "global_step": 77740, "epoch": 642} {"train_loss": -34.69272994995117, "global_step": 77741, "epoch": 642} {"train_loss": -36.388362884521484, "global_step": 77742, "epoch": 642} {"train_loss": -35.94804000854492, "global_step": 77743, "epoch": 642} {"train_loss": -36.872920989990234, "global_step": 77744, "epoch": 642} {"train_loss": -36.89864730834961, "global_step": 77745, "epoch": 642} {"train_loss": -36.67699432373047, "global_step": 77746, "epoch": 642} {"train_loss": -36.752586364746094, "global_step": 77747, "epoch": 642} {"train_loss": -37.25887680053711, "global_step": 77748, "epoch": 642} {"train_loss": -36.75447463989258, "global_step": 77749, "epoch": 642} {"train_loss": -36.630165100097656, "global_step": 77750, "epoch": 642} {"train_loss": -36.91426467895508, "global_step": 77751, "epoch": 642} {"train_loss": -36.793094635009766, "global_step": 77752, "epoch": 642} {"train_loss": -37.418296813964844, "global_step": 77753, "epoch": 642} {"train_loss": -37.128299713134766, "global_step": 77754, "epoch": 642} {"train_loss": -37.40473175048828, "global_step": 77755, "epoch": 642} {"train_loss": -37.2254524230957, "global_step": 77756, "epoch": 642} {"train_loss": -36.93752670288086, "global_step": 77757, "epoch": 642} {"train_loss": -37.024993896484375, "global_step": 77758, "epoch": 642} {"train_loss": -37.35950469970703, "global_step": 77759, "epoch": 642} {"train_loss": -37.13602066040039, "global_step": 77760, "epoch": 642} {"train_loss": -37.250972747802734, "global_step": 77761, "epoch": 642} {"train_loss": -37.65784454345703, "global_step": 77762, "epoch": 642} {"train_loss": -37.23148727416992, "global_step": 77763, "epoch": 642} {"train_loss": -37.22321701049805, "global_step": 77764, "epoch": 642} {"train_loss": -37.215179443359375, "global_step": 77765, "epoch": 642} {"train_loss": -37.01559066772461, "global_step": 77766, "epoch": 642} {"train_loss": -37.63591384887695, "global_step": 77767, "epoch": 642} {"train_loss": -37.266841888427734, "global_step": 77768, "epoch": 642} {"train_loss": -37.75967025756836, "global_step": 77769, "epoch": 642} {"train_loss": -37.65740966796875, "global_step": 77770, "epoch": 642} {"train_loss": -37.39519119262695, "global_step": 77771, "epoch": 642} {"train_loss": -37.57437515258789, "global_step": 77772, "epoch": 642} {"train_loss": -37.88772964477539, "global_step": 77773, "epoch": 642} {"train_loss": -37.73248291015625, "global_step": 77774, "epoch": 642} {"train_loss": -37.86395263671875, "global_step": 77775, "epoch": 642} {"train_loss": -37.615596771240234, "global_step": 77776, "epoch": 642} {"train_loss": -37.79436111450195, "global_step": 77777, "epoch": 642} {"train_loss": -38.20060348510742, "global_step": 77778, "epoch": 642} {"train_loss": -37.74415588378906, "global_step": 77779, "epoch": 642} {"train_loss": -37.2821044921875, "global_step": 77780, "epoch": 642} {"train_loss": -37.800376892089844, "global_step": 77781, "epoch": 642} {"train_loss": -37.76898193359375, "global_step": 77782, "epoch": 642} {"train_loss": -37.819313049316406, "global_step": 77783, "epoch": 642} {"train_loss": -37.0085563659668, "global_step": 77784, "epoch": 642} {"train_loss": -36.49758529663086, "global_step": 77785, "epoch": 642} {"train_loss": -32.52924728393555, "global_step": 77786, "epoch": 642} {"train_loss": -26.95395278930664, "global_step": 77787, "epoch": 642} {"train_loss": -30.641874313354492, "global_step": 77788, "epoch": 642} {"train_loss": -35.35042953491211, "global_step": 77789, "epoch": 642} {"train_loss": -32.6805305480957, "global_step": 77790, "epoch": 642} {"train_loss": -33.297210693359375, "global_step": 77791, "epoch": 642} {"train_loss": -34.840728759765625, "global_step": 77792, "epoch": 642} {"train_loss": -35.27668380737305, "global_step": 77793, "epoch": 642} {"train_loss": -35.3928108215332, "global_step": 77794, "epoch": 642} {"train_loss": -35.87311935424805, "global_step": 77795, "epoch": 642} {"train_loss": -36.03590774536133, "global_step": 77796, "epoch": 642} {"train_loss": -35.462337493896484, "global_step": 77797, "epoch": 642} {"train_loss": -36.2885627746582, "global_step": 77798, "epoch": 642} {"train_loss": -36.348323822021484, "global_step": 77799, "epoch": 642} {"train_loss": -36.51133728027344, "global_step": 77800, "epoch": 642} {"train_loss": -36.29020309448242, "global_step": 77801, "epoch": 642} {"train_loss": -36.36285015768256, "global_step": 77802, "epoch": 642, "val_loss": 2706627.75} {"train_loss": -36.345001220703125, "global_step": 77803, "epoch": 643} {"train_loss": -36.080810546875, "global_step": 77804, "epoch": 643} {"train_loss": -36.682762145996094, "global_step": 77805, "epoch": 643} {"train_loss": -36.38086700439453, "global_step": 77806, "epoch": 643} {"train_loss": -37.09407424926758, "global_step": 77807, "epoch": 643} {"train_loss": -36.737178802490234, "global_step": 77808, "epoch": 643} {"train_loss": -36.265419006347656, "global_step": 77809, "epoch": 643} {"train_loss": -37.10477828979492, "global_step": 77810, "epoch": 643} {"train_loss": -37.04174041748047, "global_step": 77811, "epoch": 643} {"train_loss": -36.95901107788086, "global_step": 77812, "epoch": 643} {"train_loss": -36.73395919799805, "global_step": 77813, "epoch": 643} {"train_loss": -36.57514953613281, "global_step": 77814, "epoch": 643} {"train_loss": -37.401123046875, "global_step": 77815, "epoch": 643} {"train_loss": -37.37685012817383, "global_step": 77816, "epoch": 643} {"train_loss": -37.11329650878906, "global_step": 77817, "epoch": 643} {"train_loss": -37.34523391723633, "global_step": 77818, "epoch": 643} {"train_loss": -37.439056396484375, "global_step": 77819, "epoch": 643} {"train_loss": -37.0000114440918, "global_step": 77820, "epoch": 643} {"train_loss": -37.29608154296875, "global_step": 77821, "epoch": 643} {"train_loss": -37.69951248168945, "global_step": 77822, "epoch": 643} {"train_loss": -37.691219329833984, "global_step": 77823, "epoch": 643} {"train_loss": -37.526092529296875, "global_step": 77824, "epoch": 643} {"train_loss": -37.02122116088867, "global_step": 77825, "epoch": 643} {"train_loss": -37.31449508666992, "global_step": 77826, "epoch": 643} {"train_loss": -37.89536666870117, "global_step": 77827, "epoch": 643} {"train_loss": -37.7663459777832, "global_step": 77828, "epoch": 643} {"train_loss": -37.484527587890625, "global_step": 77829, "epoch": 643} {"train_loss": -37.22705078125, "global_step": 77830, "epoch": 643} {"train_loss": -36.90620040893555, "global_step": 77831, "epoch": 643} {"train_loss": -36.48191452026367, "global_step": 77832, "epoch": 643} {"train_loss": -36.69635772705078, "global_step": 77833, "epoch": 643} {"train_loss": -37.711883544921875, "global_step": 77834, "epoch": 643} {"train_loss": -37.217689514160156, "global_step": 77835, "epoch": 643} {"train_loss": -37.284488677978516, "global_step": 77836, "epoch": 643} {"train_loss": -37.02903366088867, "global_step": 77837, "epoch": 643} {"train_loss": -35.32851028442383, "global_step": 77838, "epoch": 643} {"train_loss": -37.10593032836914, "global_step": 77839, "epoch": 643} {"train_loss": -37.73164749145508, "global_step": 77840, "epoch": 643} {"train_loss": -37.14310836791992, "global_step": 77841, "epoch": 643} {"train_loss": -37.3411750793457, "global_step": 77842, "epoch": 643} {"train_loss": -36.54934310913086, "global_step": 77843, "epoch": 643} {"train_loss": -36.16587448120117, "global_step": 77844, "epoch": 643} {"train_loss": -37.20634460449219, "global_step": 77845, "epoch": 643} {"train_loss": -37.261077880859375, "global_step": 77846, "epoch": 643} {"train_loss": -38.02272415161133, "global_step": 77847, "epoch": 643} {"train_loss": -37.56270217895508, "global_step": 77848, "epoch": 643} {"train_loss": -36.604087829589844, "global_step": 77849, "epoch": 643} {"train_loss": -37.35136032104492, "global_step": 77850, "epoch": 643} {"train_loss": -38.28971481323242, "global_step": 77851, "epoch": 643} {"train_loss": -37.46599578857422, "global_step": 77852, "epoch": 643} {"train_loss": -37.125038146972656, "global_step": 77853, "epoch": 643} {"train_loss": -36.32558822631836, "global_step": 77854, "epoch": 643} {"train_loss": -37.55355453491211, "global_step": 77855, "epoch": 643} {"train_loss": -37.49069595336914, "global_step": 77856, "epoch": 643} {"train_loss": -37.439510345458984, "global_step": 77857, "epoch": 643} {"train_loss": -37.65616989135742, "global_step": 77858, "epoch": 643} {"train_loss": -37.22710037231445, "global_step": 77859, "epoch": 643} {"train_loss": -37.058807373046875, "global_step": 77860, "epoch": 643} {"train_loss": -35.51632308959961, "global_step": 77861, "epoch": 643} {"train_loss": -35.3178825378418, "global_step": 77862, "epoch": 643} {"train_loss": -36.6191291809082, "global_step": 77863, "epoch": 643} {"train_loss": -37.89968490600586, "global_step": 77864, "epoch": 643} {"train_loss": -37.01882553100586, "global_step": 77865, "epoch": 643} {"train_loss": -37.78334426879883, "global_step": 77866, "epoch": 643} {"train_loss": -38.078582763671875, "global_step": 77867, "epoch": 643} {"train_loss": -38.197669982910156, "global_step": 77868, "epoch": 643} {"train_loss": -38.208045959472656, "global_step": 77869, "epoch": 643} {"train_loss": -37.72446823120117, "global_step": 77870, "epoch": 643} {"train_loss": -37.79854965209961, "global_step": 77871, "epoch": 643} {"train_loss": -37.97321701049805, "global_step": 77872, "epoch": 643} {"train_loss": -38.09000778198242, "global_step": 77873, "epoch": 643} {"train_loss": -38.37083053588867, "global_step": 77874, "epoch": 643} {"train_loss": -38.3173942565918, "global_step": 77875, "epoch": 643} {"train_loss": -37.864463806152344, "global_step": 77876, "epoch": 643} {"train_loss": -37.853736877441406, "global_step": 77877, "epoch": 643} {"train_loss": -37.76902389526367, "global_step": 77878, "epoch": 643} {"train_loss": -37.88115310668945, "global_step": 77879, "epoch": 643} {"train_loss": -36.68166732788086, "global_step": 77880, "epoch": 643} {"train_loss": -36.977108001708984, "global_step": 77881, "epoch": 643} {"train_loss": -37.53560256958008, "global_step": 77882, "epoch": 643} {"train_loss": -37.758384704589844, "global_step": 77883, "epoch": 643} {"train_loss": -37.64080810546875, "global_step": 77884, "epoch": 643} {"train_loss": -37.348472595214844, "global_step": 77885, "epoch": 643} {"train_loss": -36.398677825927734, "global_step": 77886, "epoch": 643} {"train_loss": -35.724483489990234, "global_step": 77887, "epoch": 643} {"train_loss": -35.87541580200195, "global_step": 77888, "epoch": 643} {"train_loss": -33.669105529785156, "global_step": 77889, "epoch": 643} {"train_loss": -23.700092315673828, "global_step": 77890, "epoch": 643} {"train_loss": -7.609592437744141, "global_step": 77891, "epoch": 643} {"train_loss": -5.867105484008789, "global_step": 77892, "epoch": 643} {"train_loss": -36.032806396484375, "global_step": 77893, "epoch": 643} {"train_loss": -23.79931640625, "global_step": 77894, "epoch": 643} {"train_loss": -29.688329696655273, "global_step": 77895, "epoch": 643} {"train_loss": -29.72812843322754, "global_step": 77896, "epoch": 643} {"train_loss": -33.65166091918945, "global_step": 77897, "epoch": 643} {"train_loss": -28.87054443359375, "global_step": 77898, "epoch": 643} {"train_loss": -36.50161361694336, "global_step": 77899, "epoch": 643} {"train_loss": -31.079450607299805, "global_step": 77900, "epoch": 643} {"train_loss": -34.58477020263672, "global_step": 77901, "epoch": 643} {"train_loss": -35.005062103271484, "global_step": 77902, "epoch": 643} {"train_loss": -34.17993927001953, "global_step": 77903, "epoch": 643} {"train_loss": -34.31161117553711, "global_step": 77904, "epoch": 643} {"train_loss": -36.25935745239258, "global_step": 77905, "epoch": 643} {"train_loss": -34.832923889160156, "global_step": 77906, "epoch": 643} {"train_loss": -35.126949310302734, "global_step": 77907, "epoch": 643} {"train_loss": -36.109188079833984, "global_step": 77908, "epoch": 643} {"train_loss": -35.80186080932617, "global_step": 77909, "epoch": 643} {"train_loss": -36.00252914428711, "global_step": 77910, "epoch": 643} {"train_loss": -36.09817886352539, "global_step": 77911, "epoch": 643} {"train_loss": -36.44662094116211, "global_step": 77912, "epoch": 643} {"train_loss": -36.70579147338867, "global_step": 77913, "epoch": 643} {"train_loss": -36.258392333984375, "global_step": 77914, "epoch": 643} {"train_loss": -36.37373733520508, "global_step": 77915, "epoch": 643} {"train_loss": -36.33088302612305, "global_step": 77916, "epoch": 643} {"train_loss": -36.848976135253906, "global_step": 77917, "epoch": 643} {"train_loss": -37.02018356323242, "global_step": 77918, "epoch": 643} {"train_loss": -36.9013786315918, "global_step": 77919, "epoch": 643} {"train_loss": -37.163299560546875, "global_step": 77920, "epoch": 643} {"train_loss": -37.15930938720703, "global_step": 77921, "epoch": 643} {"train_loss": -36.983455657958984, "global_step": 77922, "epoch": 643} {"train_loss": -35.94272938247555, "global_step": 77923, "epoch": 643, "val_loss": 2646594.75} {"train_loss": -37.3603515625, "global_step": 77924, "epoch": 644} {"train_loss": -37.65383529663086, "global_step": 77925, "epoch": 644} {"train_loss": -37.45864486694336, "global_step": 77926, "epoch": 644} {"train_loss": -37.14411163330078, "global_step": 77927, "epoch": 644} {"train_loss": -37.42252731323242, "global_step": 77928, "epoch": 644} {"train_loss": -37.43327713012695, "global_step": 77929, "epoch": 644} {"train_loss": -37.63761901855469, "global_step": 77930, "epoch": 644} {"train_loss": -37.5889892578125, "global_step": 77931, "epoch": 644} {"train_loss": -37.78779220581055, "global_step": 77932, "epoch": 644} {"train_loss": -37.107032775878906, "global_step": 77933, "epoch": 644} {"train_loss": -37.423458099365234, "global_step": 77934, "epoch": 644} {"train_loss": -37.5333366394043, "global_step": 77935, "epoch": 644} {"train_loss": -37.48871994018555, "global_step": 77936, "epoch": 644} {"train_loss": -38.01289749145508, "global_step": 77937, "epoch": 644} {"train_loss": -37.44601058959961, "global_step": 77938, "epoch": 644} {"train_loss": -37.93516159057617, "global_step": 77939, "epoch": 644} {"train_loss": -38.08718490600586, "global_step": 77940, "epoch": 644} {"train_loss": -37.48754119873047, "global_step": 77941, "epoch": 644} {"train_loss": -37.62400817871094, "global_step": 77942, "epoch": 644} {"train_loss": -37.427215576171875, "global_step": 77943, "epoch": 644} {"train_loss": -37.5254020690918, "global_step": 77944, "epoch": 644} {"train_loss": -37.595802307128906, "global_step": 77945, "epoch": 644} {"train_loss": -37.82207107543945, "global_step": 77946, "epoch": 644} {"train_loss": -38.153602600097656, "global_step": 77947, "epoch": 644} {"train_loss": -37.33238983154297, "global_step": 77948, "epoch": 644} {"train_loss": -37.95856475830078, "global_step": 77949, "epoch": 644} {"train_loss": -38.0943489074707, "global_step": 77950, "epoch": 644} {"train_loss": -38.069366455078125, "global_step": 77951, "epoch": 644} {"train_loss": -37.89089584350586, "global_step": 77952, "epoch": 644} {"train_loss": -37.73748016357422, "global_step": 77953, "epoch": 644} {"train_loss": -38.19285202026367, "global_step": 77954, "epoch": 644} {"train_loss": -37.91962432861328, "global_step": 77955, "epoch": 644} {"train_loss": -38.08881378173828, "global_step": 77956, "epoch": 644} {"train_loss": -38.12821960449219, "global_step": 77957, "epoch": 644} {"train_loss": -37.937191009521484, "global_step": 77958, "epoch": 644} {"train_loss": -37.65411376953125, "global_step": 77959, "epoch": 644} {"train_loss": -37.268856048583984, "global_step": 77960, "epoch": 644} {"train_loss": -36.61260986328125, "global_step": 77961, "epoch": 644} {"train_loss": -36.426246643066406, "global_step": 77962, "epoch": 644} {"train_loss": -36.26264572143555, "global_step": 77963, "epoch": 644} {"train_loss": -35.43283462524414, "global_step": 77964, "epoch": 644} {"train_loss": -36.50233840942383, "global_step": 77965, "epoch": 644} {"train_loss": -37.42401123046875, "global_step": 77966, "epoch": 644} {"train_loss": -37.98737335205078, "global_step": 77967, "epoch": 644} {"train_loss": -36.27252960205078, "global_step": 77968, "epoch": 644} {"train_loss": -37.037696838378906, "global_step": 77969, "epoch": 644} {"train_loss": -37.75130844116211, "global_step": 77970, "epoch": 644} {"train_loss": -37.255279541015625, "global_step": 77971, "epoch": 644} {"train_loss": -37.52231216430664, "global_step": 77972, "epoch": 644} {"train_loss": -36.214080810546875, "global_step": 77973, "epoch": 644} {"train_loss": -36.12447738647461, "global_step": 77974, "epoch": 644} {"train_loss": -36.872318267822266, "global_step": 77975, "epoch": 644} {"train_loss": -37.539005279541016, "global_step": 77976, "epoch": 644} {"train_loss": -37.519039154052734, "global_step": 77977, "epoch": 644} {"train_loss": -36.87294387817383, "global_step": 77978, "epoch": 644} {"train_loss": -36.93844223022461, "global_step": 77979, "epoch": 644} {"train_loss": -37.01118087768555, "global_step": 77980, "epoch": 644} {"train_loss": -37.07691955566406, "global_step": 77981, "epoch": 644} {"train_loss": -35.54049301147461, "global_step": 77982, "epoch": 644} {"train_loss": -37.3338623046875, "global_step": 77983, "epoch": 644} {"train_loss": -37.23324966430664, "global_step": 77984, "epoch": 644} {"train_loss": -36.77604293823242, "global_step": 77985, "epoch": 644} {"train_loss": -35.122406005859375, "global_step": 77986, "epoch": 644} {"train_loss": -36.60565185546875, "global_step": 77987, "epoch": 644} {"train_loss": -36.1314811706543, "global_step": 77988, "epoch": 644} {"train_loss": -36.45663070678711, "global_step": 77989, "epoch": 644} {"train_loss": -35.59220504760742, "global_step": 77990, "epoch": 644} {"train_loss": -36.34967041015625, "global_step": 77991, "epoch": 644} {"train_loss": -34.005775451660156, "global_step": 77992, "epoch": 644} {"train_loss": -37.179115295410156, "global_step": 77993, "epoch": 644} {"train_loss": -36.456764221191406, "global_step": 77994, "epoch": 644} {"train_loss": -36.96343994140625, "global_step": 77995, "epoch": 644} {"train_loss": -36.34796142578125, "global_step": 77996, "epoch": 644} {"train_loss": -35.738006591796875, "global_step": 77997, "epoch": 644} {"train_loss": -36.329219818115234, "global_step": 77998, "epoch": 644} {"train_loss": -34.659019470214844, "global_step": 77999, "epoch": 644} {"train_loss": -35.220088958740234, "global_step": 78000, "epoch": 644} {"train_loss": -34.053314208984375, "global_step": 78001, "epoch": 644} {"train_loss": -35.88897705078125, "global_step": 78002, "epoch": 644} {"train_loss": -35.2374267578125, "global_step": 78003, "epoch": 644} {"train_loss": -35.82145690917969, "global_step": 78004, "epoch": 644} {"train_loss": -36.630001068115234, "global_step": 78005, "epoch": 644} {"train_loss": -33.46958541870117, "global_step": 78006, "epoch": 644} {"train_loss": -35.36818313598633, "global_step": 78007, "epoch": 644} {"train_loss": -35.611846923828125, "global_step": 78008, "epoch": 644} {"train_loss": -33.63582229614258, "global_step": 78009, "epoch": 644} {"train_loss": -34.71955490112305, "global_step": 78010, "epoch": 644} {"train_loss": -35.75649642944336, "global_step": 78011, "epoch": 644} {"train_loss": -36.38226318359375, "global_step": 78012, "epoch": 644} {"train_loss": -35.366207122802734, "global_step": 78013, "epoch": 644} {"train_loss": -35.39970016479492, "global_step": 78014, "epoch": 644} {"train_loss": -35.60450744628906, "global_step": 78015, "epoch": 644} {"train_loss": -33.2425422668457, "global_step": 78016, "epoch": 644} {"train_loss": -35.37034225463867, "global_step": 78017, "epoch": 644} {"train_loss": -35.572444915771484, "global_step": 78018, "epoch": 644} {"train_loss": -35.79400634765625, "global_step": 78019, "epoch": 644} {"train_loss": -34.94623565673828, "global_step": 78020, "epoch": 644} {"train_loss": -35.316402435302734, "global_step": 78021, "epoch": 644} {"train_loss": -35.15359115600586, "global_step": 78022, "epoch": 644} {"train_loss": -36.518287658691406, "global_step": 78023, "epoch": 644} {"train_loss": -36.60308837890625, "global_step": 78024, "epoch": 644} {"train_loss": -36.204010009765625, "global_step": 78025, "epoch": 644} {"train_loss": -35.090328216552734, "global_step": 78026, "epoch": 644} {"train_loss": -36.04939270019531, "global_step": 78027, "epoch": 644} {"train_loss": -34.23042297363281, "global_step": 78028, "epoch": 644} {"train_loss": -36.3272819519043, "global_step": 78029, "epoch": 644} {"train_loss": -35.61152267456055, "global_step": 78030, "epoch": 644} {"train_loss": -36.2226676940918, "global_step": 78031, "epoch": 644} {"train_loss": -36.62592315673828, "global_step": 78032, "epoch": 644} {"train_loss": -36.85784149169922, "global_step": 78033, "epoch": 644} {"train_loss": -35.58201599121094, "global_step": 78034, "epoch": 644} {"train_loss": -35.45924377441406, "global_step": 78035, "epoch": 644} {"train_loss": -35.503265380859375, "global_step": 78036, "epoch": 644} {"train_loss": -36.96124267578125, "global_step": 78037, "epoch": 644} {"train_loss": -35.462196350097656, "global_step": 78038, "epoch": 644} {"train_loss": -35.7281608581543, "global_step": 78039, "epoch": 644} {"train_loss": -35.01711654663086, "global_step": 78040, "epoch": 644} {"train_loss": -35.50703048706055, "global_step": 78041, "epoch": 644} {"train_loss": -36.712554931640625, "global_step": 78042, "epoch": 644} {"train_loss": -36.372188568115234, "global_step": 78043, "epoch": 644} {"train_loss": -36.53191873849916, "global_step": 78044, "epoch": 644, "val_loss": 2698889.25} {"train_loss": -36.4449577331543, "global_step": 78045, "epoch": 645} {"train_loss": -36.73747634887695, "global_step": 78046, "epoch": 645} {"train_loss": -35.91239929199219, "global_step": 78047, "epoch": 645} {"train_loss": -36.69104766845703, "global_step": 78048, "epoch": 645} {"train_loss": -36.63960647583008, "global_step": 78049, "epoch": 645} {"train_loss": -36.889808654785156, "global_step": 78050, "epoch": 645} {"train_loss": -36.65772247314453, "global_step": 78051, "epoch": 645} {"train_loss": -36.5223503112793, "global_step": 78052, "epoch": 645} {"train_loss": -36.78768539428711, "global_step": 78053, "epoch": 645} {"train_loss": -36.41358947753906, "global_step": 78054, "epoch": 645} {"train_loss": -36.49341583251953, "global_step": 78055, "epoch": 645} {"train_loss": -37.08491516113281, "global_step": 78056, "epoch": 645} {"train_loss": -37.020381927490234, "global_step": 78057, "epoch": 645} {"train_loss": -37.432289123535156, "global_step": 78058, "epoch": 645} {"train_loss": -36.87911605834961, "global_step": 78059, "epoch": 645} {"train_loss": -36.36947250366211, "global_step": 78060, "epoch": 645} {"train_loss": -36.3460807800293, "global_step": 78061, "epoch": 645} {"train_loss": -37.36991500854492, "global_step": 78062, "epoch": 645} {"train_loss": -35.999324798583984, "global_step": 78063, "epoch": 645} {"train_loss": -36.18973922729492, "global_step": 78064, "epoch": 645} {"train_loss": -36.27656173706055, "global_step": 78065, "epoch": 645} {"train_loss": -36.405799865722656, "global_step": 78066, "epoch": 645} {"train_loss": -36.692134857177734, "global_step": 78067, "epoch": 645} {"train_loss": -35.955570220947266, "global_step": 78068, "epoch": 645} {"train_loss": -35.583744049072266, "global_step": 78069, "epoch": 645} {"train_loss": -36.706703186035156, "global_step": 78070, "epoch": 645} {"train_loss": -36.70383834838867, "global_step": 78071, "epoch": 645} {"train_loss": -35.14040756225586, "global_step": 78072, "epoch": 645} {"train_loss": -36.414093017578125, "global_step": 78073, "epoch": 645} {"train_loss": -36.36130142211914, "global_step": 78074, "epoch": 645} {"train_loss": -36.25056457519531, "global_step": 78075, "epoch": 645} {"train_loss": -37.57448196411133, "global_step": 78076, "epoch": 645} {"train_loss": -36.628623962402344, "global_step": 78077, "epoch": 645} {"train_loss": -37.26339340209961, "global_step": 78078, "epoch": 645} {"train_loss": -35.91323471069336, "global_step": 78079, "epoch": 645} {"train_loss": -36.70722579956055, "global_step": 78080, "epoch": 645} {"train_loss": -36.92788314819336, "global_step": 78081, "epoch": 645} {"train_loss": -36.29151153564453, "global_step": 78082, "epoch": 645} {"train_loss": -36.13119888305664, "global_step": 78083, "epoch": 645} {"train_loss": -35.635040283203125, "global_step": 78084, "epoch": 645} {"train_loss": -35.499752044677734, "global_step": 78085, "epoch": 645} {"train_loss": -35.747676849365234, "global_step": 78086, "epoch": 645} {"train_loss": -36.80149459838867, "global_step": 78087, "epoch": 645} {"train_loss": -34.884883880615234, "global_step": 78088, "epoch": 645} {"train_loss": -34.109779357910156, "global_step": 78089, "epoch": 645} {"train_loss": -35.880279541015625, "global_step": 78090, "epoch": 645} {"train_loss": -36.875919342041016, "global_step": 78091, "epoch": 645} {"train_loss": -34.26052474975586, "global_step": 78092, "epoch": 645} {"train_loss": -31.821008682250977, "global_step": 78093, "epoch": 645} {"train_loss": -36.687923431396484, "global_step": 78094, "epoch": 645} {"train_loss": -35.185115814208984, "global_step": 78095, "epoch": 645} {"train_loss": -34.062294006347656, "global_step": 78096, "epoch": 645} {"train_loss": -32.97846603393555, "global_step": 78097, "epoch": 645} {"train_loss": -36.9015998840332, "global_step": 78098, "epoch": 645} {"train_loss": -33.81753158569336, "global_step": 78099, "epoch": 645} {"train_loss": -36.31808090209961, "global_step": 78100, "epoch": 645} {"train_loss": -35.66036605834961, "global_step": 78101, "epoch": 645} {"train_loss": -36.13676071166992, "global_step": 78102, "epoch": 645} {"train_loss": -36.98942947387695, "global_step": 78103, "epoch": 645} {"train_loss": -35.646148681640625, "global_step": 78104, "epoch": 645} {"train_loss": -36.69900131225586, "global_step": 78105, "epoch": 645} {"train_loss": -36.957767486572266, "global_step": 78106, "epoch": 645} {"train_loss": -35.27549743652344, "global_step": 78107, "epoch": 645} {"train_loss": -37.074928283691406, "global_step": 78108, "epoch": 645} {"train_loss": -35.72215270996094, "global_step": 78109, "epoch": 645} {"train_loss": -36.640472412109375, "global_step": 78110, "epoch": 645} {"train_loss": -36.98314666748047, "global_step": 78111, "epoch": 645} {"train_loss": -36.8908576965332, "global_step": 78112, "epoch": 645} {"train_loss": -37.22673416137695, "global_step": 78113, "epoch": 645} {"train_loss": -36.738338470458984, "global_step": 78114, "epoch": 645} {"train_loss": -37.1820068359375, "global_step": 78115, "epoch": 645} {"train_loss": -36.58657455444336, "global_step": 78116, "epoch": 645} {"train_loss": -37.38906478881836, "global_step": 78117, "epoch": 645} {"train_loss": -36.6470832824707, "global_step": 78118, "epoch": 645} {"train_loss": -36.29779052734375, "global_step": 78119, "epoch": 645} {"train_loss": -35.26204299926758, "global_step": 78120, "epoch": 645} {"train_loss": -36.619808197021484, "global_step": 78121, "epoch": 645} {"train_loss": -36.44328308105469, "global_step": 78122, "epoch": 645} {"train_loss": -36.727088928222656, "global_step": 78123, "epoch": 645} {"train_loss": -37.40629959106445, "global_step": 78124, "epoch": 645} {"train_loss": -37.12007522583008, "global_step": 78125, "epoch": 645} {"train_loss": -37.195491790771484, "global_step": 78126, "epoch": 645} {"train_loss": -37.2735595703125, "global_step": 78127, "epoch": 645} {"train_loss": -37.58311080932617, "global_step": 78128, "epoch": 645} {"train_loss": -37.69378662109375, "global_step": 78129, "epoch": 645} {"train_loss": -37.28694152832031, "global_step": 78130, "epoch": 645} {"train_loss": -37.224952697753906, "global_step": 78131, "epoch": 645} {"train_loss": -37.89921188354492, "global_step": 78132, "epoch": 645} {"train_loss": -37.574893951416016, "global_step": 78133, "epoch": 645} {"train_loss": -37.946624755859375, "global_step": 78134, "epoch": 645} {"train_loss": -37.80863571166992, "global_step": 78135, "epoch": 645} {"train_loss": -37.918190002441406, "global_step": 78136, "epoch": 645} {"train_loss": -37.649593353271484, "global_step": 78137, "epoch": 645} {"train_loss": -38.09980392456055, "global_step": 78138, "epoch": 645} {"train_loss": -38.23345947265625, "global_step": 78139, "epoch": 645} {"train_loss": -38.492488861083984, "global_step": 78140, "epoch": 645} {"train_loss": -37.699371337890625, "global_step": 78141, "epoch": 645} {"train_loss": -38.035640716552734, "global_step": 78142, "epoch": 645} {"train_loss": -38.153560638427734, "global_step": 78143, "epoch": 645} {"train_loss": -38.26148986816406, "global_step": 78144, "epoch": 645} {"train_loss": -37.97857666015625, "global_step": 78145, "epoch": 645} {"train_loss": -38.31433868408203, "global_step": 78146, "epoch": 645} {"train_loss": -38.08805465698242, "global_step": 78147, "epoch": 645} {"train_loss": -37.8205680847168, "global_step": 78148, "epoch": 645} {"train_loss": -38.071590423583984, "global_step": 78149, "epoch": 645} {"train_loss": -37.72182846069336, "global_step": 78150, "epoch": 645} {"train_loss": -38.000247955322266, "global_step": 78151, "epoch": 645} {"train_loss": -38.515071868896484, "global_step": 78152, "epoch": 645} {"train_loss": -38.358802795410156, "global_step": 78153, "epoch": 645} {"train_loss": -37.67197799682617, "global_step": 78154, "epoch": 645} {"train_loss": -37.71449279785156, "global_step": 78155, "epoch": 645} {"train_loss": -38.43973922729492, "global_step": 78156, "epoch": 645} {"train_loss": -38.111549377441406, "global_step": 78157, "epoch": 645} {"train_loss": -38.18564987182617, "global_step": 78158, "epoch": 645} {"train_loss": -37.85067367553711, "global_step": 78159, "epoch": 645} {"train_loss": -37.86457443237305, "global_step": 78160, "epoch": 645} {"train_loss": -38.21186447143555, "global_step": 78161, "epoch": 645} {"train_loss": -38.04756546020508, "global_step": 78162, "epoch": 645} {"train_loss": -37.470855712890625, "global_step": 78163, "epoch": 645} {"train_loss": -36.09255599975586, "global_step": 78164, "epoch": 645} {"train_loss": -36.75380585410378, "global_step": 78165, "epoch": 645, "val_loss": 2661884.25} {"train_loss": -23.44565773010254, "global_step": 78166, "epoch": 646} {"train_loss": -9.265449523925781, "global_step": 78167, "epoch": 646} {"train_loss": -8.487711906433105, "global_step": 78168, "epoch": 646} {"train_loss": -34.227779388427734, "global_step": 78169, "epoch": 646} {"train_loss": -30.026721954345703, "global_step": 78170, "epoch": 646} {"train_loss": -18.708242416381836, "global_step": 78171, "epoch": 646} {"train_loss": -34.6732177734375, "global_step": 78172, "epoch": 646} {"train_loss": -21.736331939697266, "global_step": 78173, "epoch": 646} {"train_loss": -36.01411056518555, "global_step": 78174, "epoch": 646} {"train_loss": -30.407392501831055, "global_step": 78175, "epoch": 646} {"train_loss": -33.43026351928711, "global_step": 78176, "epoch": 646} {"train_loss": -34.69381332397461, "global_step": 78177, "epoch": 646} {"train_loss": -31.844419479370117, "global_step": 78178, "epoch": 646} {"train_loss": -36.9398078918457, "global_step": 78179, "epoch": 646} {"train_loss": -34.1076545715332, "global_step": 78180, "epoch": 646} {"train_loss": -34.332672119140625, "global_step": 78181, "epoch": 646} {"train_loss": -36.73950958251953, "global_step": 78182, "epoch": 646} {"train_loss": -35.525848388671875, "global_step": 78183, "epoch": 646} {"train_loss": -34.12479019165039, "global_step": 78184, "epoch": 646} {"train_loss": -36.07569122314453, "global_step": 78185, "epoch": 646} {"train_loss": -36.27906036376953, "global_step": 78186, "epoch": 646} {"train_loss": -35.24067687988281, "global_step": 78187, "epoch": 646} {"train_loss": -36.3298454284668, "global_step": 78188, "epoch": 646} {"train_loss": -36.674285888671875, "global_step": 78189, "epoch": 646} {"train_loss": -36.970298767089844, "global_step": 78190, "epoch": 646} {"train_loss": -36.41126251220703, "global_step": 78191, "epoch": 646} {"train_loss": -36.63031005859375, "global_step": 78192, "epoch": 646} {"train_loss": -36.621456146240234, "global_step": 78193, "epoch": 646} {"train_loss": -36.78186798095703, "global_step": 78194, "epoch": 646} {"train_loss": -36.616241455078125, "global_step": 78195, "epoch": 646} {"train_loss": -37.128475189208984, "global_step": 78196, "epoch": 646} {"train_loss": -37.11068344116211, "global_step": 78197, "epoch": 646} {"train_loss": -37.002777099609375, "global_step": 78198, "epoch": 646} {"train_loss": -37.10254669189453, "global_step": 78199, "epoch": 646} {"train_loss": -37.30900955200195, "global_step": 78200, "epoch": 646} {"train_loss": -37.15182876586914, "global_step": 78201, "epoch": 646} {"train_loss": -37.516971588134766, "global_step": 78202, "epoch": 646} {"train_loss": -37.555946350097656, "global_step": 78203, "epoch": 646} {"train_loss": -37.557342529296875, "global_step": 78204, "epoch": 646} {"train_loss": -37.66571044921875, "global_step": 78205, "epoch": 646} {"train_loss": -37.34548568725586, "global_step": 78206, "epoch": 646} {"train_loss": -37.584449768066406, "global_step": 78207, "epoch": 646} {"train_loss": -37.44324493408203, "global_step": 78208, "epoch": 646} {"train_loss": -37.60195541381836, "global_step": 78209, "epoch": 646} {"train_loss": -37.659786224365234, "global_step": 78210, "epoch": 646} {"train_loss": -38.00054168701172, "global_step": 78211, "epoch": 646} {"train_loss": -37.96718978881836, "global_step": 78212, "epoch": 646} {"train_loss": -38.273536682128906, "global_step": 78213, "epoch": 646} {"train_loss": -37.592201232910156, "global_step": 78214, "epoch": 646} {"train_loss": -37.77424621582031, "global_step": 78215, "epoch": 646} {"train_loss": -38.19056701660156, "global_step": 78216, "epoch": 646} {"train_loss": -38.0406379699707, "global_step": 78217, "epoch": 646} {"train_loss": -37.56047439575195, "global_step": 78218, "epoch": 646} {"train_loss": -37.76420211791992, "global_step": 78219, "epoch": 646} {"train_loss": -37.96499252319336, "global_step": 78220, "epoch": 646} {"train_loss": -38.015869140625, "global_step": 78221, "epoch": 646} {"train_loss": -38.06688690185547, "global_step": 78222, "epoch": 646} {"train_loss": -37.92897415161133, "global_step": 78223, "epoch": 646} {"train_loss": -37.29734420776367, "global_step": 78224, "epoch": 646} {"train_loss": -38.06439208984375, "global_step": 78225, "epoch": 646} {"train_loss": -38.04780960083008, "global_step": 78226, "epoch": 646} {"train_loss": -38.11868667602539, "global_step": 78227, "epoch": 646} {"train_loss": -37.99906539916992, "global_step": 78228, "epoch": 646} {"train_loss": -37.705360412597656, "global_step": 78229, "epoch": 646} {"train_loss": -38.27539825439453, "global_step": 78230, "epoch": 646} {"train_loss": -37.93556594848633, "global_step": 78231, "epoch": 646} {"train_loss": -37.926944732666016, "global_step": 78232, "epoch": 646} {"train_loss": -36.643768310546875, "global_step": 78233, "epoch": 646} {"train_loss": -37.05208969116211, "global_step": 78234, "epoch": 646} {"train_loss": -38.10773468017578, "global_step": 78235, "epoch": 646} {"train_loss": -37.785335540771484, "global_step": 78236, "epoch": 646} {"train_loss": -37.80251693725586, "global_step": 78237, "epoch": 646} {"train_loss": -36.77790451049805, "global_step": 78238, "epoch": 646} {"train_loss": -37.66217041015625, "global_step": 78239, "epoch": 646} {"train_loss": -36.907928466796875, "global_step": 78240, "epoch": 646} {"train_loss": -36.796661376953125, "global_step": 78241, "epoch": 646} {"train_loss": -37.030601501464844, "global_step": 78242, "epoch": 646} {"train_loss": -36.816673278808594, "global_step": 78243, "epoch": 646} {"train_loss": -37.26063919067383, "global_step": 78244, "epoch": 646} {"train_loss": -36.98243713378906, "global_step": 78245, "epoch": 646} {"train_loss": -35.969608306884766, "global_step": 78246, "epoch": 646} {"train_loss": -35.767642974853516, "global_step": 78247, "epoch": 646} {"train_loss": -35.073116302490234, "global_step": 78248, "epoch": 646} {"train_loss": -35.610984802246094, "global_step": 78249, "epoch": 646} {"train_loss": -34.51966857910156, "global_step": 78250, "epoch": 646} {"train_loss": -35.81120681762695, "global_step": 78251, "epoch": 646} {"train_loss": -34.383174896240234, "global_step": 78252, "epoch": 646} {"train_loss": -36.088348388671875, "global_step": 78253, "epoch": 646} {"train_loss": -31.16346549987793, "global_step": 78254, "epoch": 646} {"train_loss": -37.3722038269043, "global_step": 78255, "epoch": 646} {"train_loss": -35.57238006591797, "global_step": 78256, "epoch": 646} {"train_loss": -30.24886131286621, "global_step": 78257, "epoch": 646} {"train_loss": -34.126136779785156, "global_step": 78258, "epoch": 646} {"train_loss": -33.33047103881836, "global_step": 78259, "epoch": 646} {"train_loss": -34.44892120361328, "global_step": 78260, "epoch": 646} {"train_loss": -32.041259765625, "global_step": 78261, "epoch": 646} {"train_loss": -34.19508361816406, "global_step": 78262, "epoch": 646} {"train_loss": -35.89325714111328, "global_step": 78263, "epoch": 646} {"train_loss": -33.03253173828125, "global_step": 78264, "epoch": 646} {"train_loss": -29.41701316833496, "global_step": 78265, "epoch": 646} {"train_loss": -26.29193115234375, "global_step": 78266, "epoch": 646} {"train_loss": -32.12803268432617, "global_step": 78267, "epoch": 646} {"train_loss": -29.196531295776367, "global_step": 78268, "epoch": 646} {"train_loss": -6.220696926116943, "global_step": 78269, "epoch": 646} {"train_loss": -28.32404136657715, "global_step": 78270, "epoch": 646} {"train_loss": -32.49406051635742, "global_step": 78271, "epoch": 646} {"train_loss": -25.73224449157715, "global_step": 78272, "epoch": 646} {"train_loss": -27.685443878173828, "global_step": 78273, "epoch": 646} {"train_loss": -27.773889541625977, "global_step": 78274, "epoch": 646} {"train_loss": -28.897855758666992, "global_step": 78275, "epoch": 646} {"train_loss": -28.99554443359375, "global_step": 78276, "epoch": 646} {"train_loss": -27.789968490600586, "global_step": 78277, "epoch": 646} {"train_loss": -27.166715621948242, "global_step": 78278, "epoch": 646} {"train_loss": -28.399877548217773, "global_step": 78279, "epoch": 646} {"train_loss": -30.514062881469727, "global_step": 78280, "epoch": 646} {"train_loss": -30.46561050415039, "global_step": 78281, "epoch": 646} {"train_loss": -32.10178756713867, "global_step": 78282, "epoch": 646} {"train_loss": -30.535017013549805, "global_step": 78283, "epoch": 646} {"train_loss": -31.43189811706543, "global_step": 78284, "epoch": 646} {"train_loss": -30.66973876953125, "global_step": 78285, "epoch": 646} {"train_loss": -34.02691726448122, "global_step": 78286, "epoch": 646, "val_loss": 2876430.0} {"train_loss": -30.97788429260254, "global_step": 78287, "epoch": 647} {"train_loss": -32.244937896728516, "global_step": 78288, "epoch": 647} {"train_loss": -32.131813049316406, "global_step": 78289, "epoch": 647} {"train_loss": -32.57986068725586, "global_step": 78290, "epoch": 647} {"train_loss": -32.644004821777344, "global_step": 78291, "epoch": 647} {"train_loss": -33.0120735168457, "global_step": 78292, "epoch": 647} {"train_loss": -33.43614959716797, "global_step": 78293, "epoch": 647} {"train_loss": -33.436790466308594, "global_step": 78294, "epoch": 647} {"train_loss": -33.410850524902344, "global_step": 78295, "epoch": 647} {"train_loss": -32.25709533691406, "global_step": 78296, "epoch": 647} {"train_loss": -33.150390625, "global_step": 78297, "epoch": 647} {"train_loss": -33.564247131347656, "global_step": 78298, "epoch": 647} {"train_loss": -33.29435348510742, "global_step": 78299, "epoch": 647} {"train_loss": -33.6488151550293, "global_step": 78300, "epoch": 647} {"train_loss": -33.719051361083984, "global_step": 78301, "epoch": 647} {"train_loss": -33.69655990600586, "global_step": 78302, "epoch": 647} {"train_loss": -33.9637451171875, "global_step": 78303, "epoch": 647} {"train_loss": -33.59187698364258, "global_step": 78304, "epoch": 647} {"train_loss": -34.24345016479492, "global_step": 78305, "epoch": 647} {"train_loss": -34.257537841796875, "global_step": 78306, "epoch": 647} {"train_loss": -34.11159896850586, "global_step": 78307, "epoch": 647} {"train_loss": -34.36407470703125, "global_step": 78308, "epoch": 647} {"train_loss": -33.7698860168457, "global_step": 78309, "epoch": 647} {"train_loss": -33.99420166015625, "global_step": 78310, "epoch": 647} {"train_loss": -34.28169250488281, "global_step": 78311, "epoch": 647} {"train_loss": -34.4219856262207, "global_step": 78312, "epoch": 647} {"train_loss": -34.70295333862305, "global_step": 78313, "epoch": 647} {"train_loss": -34.35517120361328, "global_step": 78314, "epoch": 647} {"train_loss": -34.580657958984375, "global_step": 78315, "epoch": 647} {"train_loss": -34.86920928955078, "global_step": 78316, "epoch": 647} {"train_loss": -34.38181686401367, "global_step": 78317, "epoch": 647} {"train_loss": -34.18267822265625, "global_step": 78318, "epoch": 647} {"train_loss": -34.55854415893555, "global_step": 78319, "epoch": 647} {"train_loss": -34.90899658203125, "global_step": 78320, "epoch": 647} {"train_loss": -34.79688262939453, "global_step": 78321, "epoch": 647} {"train_loss": -35.120357513427734, "global_step": 78322, "epoch": 647} {"train_loss": -34.815818786621094, "global_step": 78323, "epoch": 647} {"train_loss": -35.06757736206055, "global_step": 78324, "epoch": 647} {"train_loss": -35.169219970703125, "global_step": 78325, "epoch": 647} {"train_loss": -35.134456634521484, "global_step": 78326, "epoch": 647} {"train_loss": -35.42848587036133, "global_step": 78327, "epoch": 647} {"train_loss": -35.42961120605469, "global_step": 78328, "epoch": 647} {"train_loss": -35.41762161254883, "global_step": 78329, "epoch": 647} {"train_loss": -35.309043884277344, "global_step": 78330, "epoch": 647} {"train_loss": -35.1751708984375, "global_step": 78331, "epoch": 647} {"train_loss": -35.3768310546875, "global_step": 78332, "epoch": 647} {"train_loss": -34.95424270629883, "global_step": 78333, "epoch": 647} {"train_loss": -35.55828857421875, "global_step": 78334, "epoch": 647} {"train_loss": -35.74468231201172, "global_step": 78335, "epoch": 647} {"train_loss": -35.31412887573242, "global_step": 78336, "epoch": 647} {"train_loss": -35.907310485839844, "global_step": 78337, "epoch": 647} {"train_loss": -35.6387825012207, "global_step": 78338, "epoch": 647} {"train_loss": -36.157588958740234, "global_step": 78339, "epoch": 647} {"train_loss": -35.646907806396484, "global_step": 78340, "epoch": 647} {"train_loss": -36.14735794067383, "global_step": 78341, "epoch": 647} {"train_loss": -36.166194915771484, "global_step": 78342, "epoch": 647} {"train_loss": -35.933929443359375, "global_step": 78343, "epoch": 647} {"train_loss": -36.02470779418945, "global_step": 78344, "epoch": 647} {"train_loss": -36.207916259765625, "global_step": 78345, "epoch": 647} {"train_loss": -36.09510803222656, "global_step": 78346, "epoch": 647} {"train_loss": -35.69605255126953, "global_step": 78347, "epoch": 647} {"train_loss": -35.9757194519043, "global_step": 78348, "epoch": 647} {"train_loss": -36.3715934753418, "global_step": 78349, "epoch": 647} {"train_loss": -36.2602653503418, "global_step": 78350, "epoch": 647} {"train_loss": -36.21784210205078, "global_step": 78351, "epoch": 647} {"train_loss": -36.65932846069336, "global_step": 78352, "epoch": 647} {"train_loss": -36.387630462646484, "global_step": 78353, "epoch": 647} {"train_loss": -36.613338470458984, "global_step": 78354, "epoch": 647} {"train_loss": -36.05447769165039, "global_step": 78355, "epoch": 647} {"train_loss": -36.57141876220703, "global_step": 78356, "epoch": 647} {"train_loss": -36.50934600830078, "global_step": 78357, "epoch": 647} {"train_loss": -36.66591262817383, "global_step": 78358, "epoch": 647} {"train_loss": -36.596717834472656, "global_step": 78359, "epoch": 647} {"train_loss": -36.67501449584961, "global_step": 78360, "epoch": 647} {"train_loss": -36.16621017456055, "global_step": 78361, "epoch": 647} {"train_loss": -36.625160217285156, "global_step": 78362, "epoch": 647} {"train_loss": -36.74807357788086, "global_step": 78363, "epoch": 647} {"train_loss": -36.41530990600586, "global_step": 78364, "epoch": 647} {"train_loss": -36.41527557373047, "global_step": 78365, "epoch": 647} {"train_loss": -36.61735153198242, "global_step": 78366, "epoch": 647} {"train_loss": -36.189537048339844, "global_step": 78367, "epoch": 647} {"train_loss": -34.74560546875, "global_step": 78368, "epoch": 647} {"train_loss": -34.63885498046875, "global_step": 78369, "epoch": 647} {"train_loss": -36.460567474365234, "global_step": 78370, "epoch": 647} {"train_loss": -36.59664535522461, "global_step": 78371, "epoch": 647} {"train_loss": -35.336299896240234, "global_step": 78372, "epoch": 647} {"train_loss": -35.603206634521484, "global_step": 78373, "epoch": 647} {"train_loss": -36.27260971069336, "global_step": 78374, "epoch": 647} {"train_loss": -37.24088668823242, "global_step": 78375, "epoch": 647} {"train_loss": -36.029754638671875, "global_step": 78376, "epoch": 647} {"train_loss": -35.51351547241211, "global_step": 78377, "epoch": 647} {"train_loss": -37.13572311401367, "global_step": 78378, "epoch": 647} {"train_loss": -36.12307357788086, "global_step": 78379, "epoch": 647} {"train_loss": -35.71232986450195, "global_step": 78380, "epoch": 647} {"train_loss": -35.68425750732422, "global_step": 78381, "epoch": 647} {"train_loss": -36.83614730834961, "global_step": 78382, "epoch": 647} {"train_loss": -36.50895309448242, "global_step": 78383, "epoch": 647} {"train_loss": -36.484066009521484, "global_step": 78384, "epoch": 647} {"train_loss": -36.951351165771484, "global_step": 78385, "epoch": 647} {"train_loss": -36.2896614074707, "global_step": 78386, "epoch": 647} {"train_loss": -36.132957458496094, "global_step": 78387, "epoch": 647} {"train_loss": -36.400123596191406, "global_step": 78388, "epoch": 647} {"train_loss": -37.22613525390625, "global_step": 78389, "epoch": 647} {"train_loss": -36.36674118041992, "global_step": 78390, "epoch": 647} {"train_loss": -36.419673919677734, "global_step": 78391, "epoch": 647} {"train_loss": -37.03364562988281, "global_step": 78392, "epoch": 647} {"train_loss": -36.89311599731445, "global_step": 78393, "epoch": 647} {"train_loss": -36.210479736328125, "global_step": 78394, "epoch": 647} {"train_loss": -37.01703643798828, "global_step": 78395, "epoch": 647} {"train_loss": -36.905941009521484, "global_step": 78396, "epoch": 647} {"train_loss": -36.35983657836914, "global_step": 78397, "epoch": 647} {"train_loss": -36.88077926635742, "global_step": 78398, "epoch": 647} {"train_loss": -37.375911712646484, "global_step": 78399, "epoch": 647} {"train_loss": -36.816139221191406, "global_step": 78400, "epoch": 647} {"train_loss": -37.173255920410156, "global_step": 78401, "epoch": 647} {"train_loss": -37.25461959838867, "global_step": 78402, "epoch": 647} {"train_loss": -36.458248138427734, "global_step": 78403, "epoch": 647} {"train_loss": -37.159244537353516, "global_step": 78404, "epoch": 647} {"train_loss": -37.305999755859375, "global_step": 78405, "epoch": 647} {"train_loss": -37.252784729003906, "global_step": 78406, "epoch": 647} {"train_loss": -35.47813000954872, "global_step": 78407, "epoch": 647, "val_loss": 2618934.0} {"train_loss": -37.095027923583984, "global_step": 78408, "epoch": 648} {"train_loss": -37.06414794921875, "global_step": 78409, "epoch": 648} {"train_loss": -35.011077880859375, "global_step": 78410, "epoch": 648} {"train_loss": -37.545040130615234, "global_step": 78411, "epoch": 648} {"train_loss": -33.99583053588867, "global_step": 78412, "epoch": 648} {"train_loss": -37.74204635620117, "global_step": 78413, "epoch": 648} {"train_loss": -35.46417236328125, "global_step": 78414, "epoch": 648} {"train_loss": -37.06629943847656, "global_step": 78415, "epoch": 648} {"train_loss": -35.7843017578125, "global_step": 78416, "epoch": 648} {"train_loss": -37.1483154296875, "global_step": 78417, "epoch": 648} {"train_loss": -36.23101806640625, "global_step": 78418, "epoch": 648} {"train_loss": -37.0320930480957, "global_step": 78419, "epoch": 648} {"train_loss": -37.4390983581543, "global_step": 78420, "epoch": 648} {"train_loss": -36.533748626708984, "global_step": 78421, "epoch": 648} {"train_loss": -37.57271957397461, "global_step": 78422, "epoch": 648} {"train_loss": -37.001895904541016, "global_step": 78423, "epoch": 648} {"train_loss": -37.9502067565918, "global_step": 78424, "epoch": 648} {"train_loss": -37.37432861328125, "global_step": 78425, "epoch": 648} {"train_loss": -36.12800216674805, "global_step": 78426, "epoch": 648} {"train_loss": -34.058937072753906, "global_step": 78427, "epoch": 648} {"train_loss": -33.29692077636719, "global_step": 78428, "epoch": 648} {"train_loss": -32.78383255004883, "global_step": 78429, "epoch": 648} {"train_loss": -33.43789291381836, "global_step": 78430, "epoch": 648} {"train_loss": -37.220272064208984, "global_step": 78431, "epoch": 648} {"train_loss": -35.553585052490234, "global_step": 78432, "epoch": 648} {"train_loss": -31.942718505859375, "global_step": 78433, "epoch": 648} {"train_loss": -35.41497802734375, "global_step": 78434, "epoch": 648} {"train_loss": -36.56254196166992, "global_step": 78435, "epoch": 648} {"train_loss": -35.60429763793945, "global_step": 78436, "epoch": 648} {"train_loss": -35.231224060058594, "global_step": 78437, "epoch": 648} {"train_loss": -34.14207077026367, "global_step": 78438, "epoch": 648} {"train_loss": -35.94829177856445, "global_step": 78439, "epoch": 648} {"train_loss": -36.834075927734375, "global_step": 78440, "epoch": 648} {"train_loss": -36.33015060424805, "global_step": 78441, "epoch": 648} {"train_loss": -36.350276947021484, "global_step": 78442, "epoch": 648} {"train_loss": -36.51999282836914, "global_step": 78443, "epoch": 648} {"train_loss": -36.6430549621582, "global_step": 78444, "epoch": 648} {"train_loss": -36.975830078125, "global_step": 78445, "epoch": 648} {"train_loss": -36.673458099365234, "global_step": 78446, "epoch": 648} {"train_loss": -36.70531463623047, "global_step": 78447, "epoch": 648} {"train_loss": -37.03707504272461, "global_step": 78448, "epoch": 648} {"train_loss": -37.29951095581055, "global_step": 78449, "epoch": 648} {"train_loss": -37.36393356323242, "global_step": 78450, "epoch": 648} {"train_loss": -36.97978591918945, "global_step": 78451, "epoch": 648} {"train_loss": -37.47808074951172, "global_step": 78452, "epoch": 648} {"train_loss": -37.368507385253906, "global_step": 78453, "epoch": 648} {"train_loss": -36.68330001831055, "global_step": 78454, "epoch": 648} {"train_loss": -37.77056121826172, "global_step": 78455, "epoch": 648} {"train_loss": -37.33854675292969, "global_step": 78456, "epoch": 648} {"train_loss": -37.43141555786133, "global_step": 78457, "epoch": 648} {"train_loss": -37.74633026123047, "global_step": 78458, "epoch": 648} {"train_loss": -36.373416900634766, "global_step": 78459, "epoch": 648} {"train_loss": -37.459938049316406, "global_step": 78460, "epoch": 648} {"train_loss": -37.9136962890625, "global_step": 78461, "epoch": 648} {"train_loss": -37.755210876464844, "global_step": 78462, "epoch": 648} {"train_loss": -37.287567138671875, "global_step": 78463, "epoch": 648} {"train_loss": -37.29632568359375, "global_step": 78464, "epoch": 648} {"train_loss": -38.03705978393555, "global_step": 78465, "epoch": 648} {"train_loss": -37.70965576171875, "global_step": 78466, "epoch": 648} {"train_loss": -37.247310638427734, "global_step": 78467, "epoch": 648} {"train_loss": -37.98554611206055, "global_step": 78468, "epoch": 648} {"train_loss": -37.45461654663086, "global_step": 78469, "epoch": 648} {"train_loss": -37.22805404663086, "global_step": 78470, "epoch": 648} {"train_loss": -37.665435791015625, "global_step": 78471, "epoch": 648} {"train_loss": -37.78989791870117, "global_step": 78472, "epoch": 648} {"train_loss": -36.40549850463867, "global_step": 78473, "epoch": 648} {"train_loss": -37.3809700012207, "global_step": 78474, "epoch": 648} {"train_loss": -37.74908447265625, "global_step": 78475, "epoch": 648} {"train_loss": -37.35150146484375, "global_step": 78476, "epoch": 648} {"train_loss": -36.44855880737305, "global_step": 78477, "epoch": 648} {"train_loss": -37.891395568847656, "global_step": 78478, "epoch": 648} {"train_loss": -37.74592971801758, "global_step": 78479, "epoch": 648} {"train_loss": -37.19928741455078, "global_step": 78480, "epoch": 648} {"train_loss": -37.93214416503906, "global_step": 78481, "epoch": 648} {"train_loss": -38.05709457397461, "global_step": 78482, "epoch": 648} {"train_loss": -37.850215911865234, "global_step": 78483, "epoch": 648} {"train_loss": -37.12432861328125, "global_step": 78484, "epoch": 648} {"train_loss": -37.791316986083984, "global_step": 78485, "epoch": 648} {"train_loss": -37.90460205078125, "global_step": 78486, "epoch": 648} {"train_loss": -37.143211364746094, "global_step": 78487, "epoch": 648} {"train_loss": -37.86542892456055, "global_step": 78488, "epoch": 648} {"train_loss": -36.205020904541016, "global_step": 78489, "epoch": 648} {"train_loss": -36.9759635925293, "global_step": 78490, "epoch": 648} {"train_loss": -37.49867630004883, "global_step": 78491, "epoch": 648} {"train_loss": -37.38792037963867, "global_step": 78492, "epoch": 648} {"train_loss": -37.33317947387695, "global_step": 78493, "epoch": 648} {"train_loss": -36.045841217041016, "global_step": 78494, "epoch": 648} {"train_loss": -37.48945999145508, "global_step": 78495, "epoch": 648} {"train_loss": -37.35386276245117, "global_step": 78496, "epoch": 648} {"train_loss": -35.80276870727539, "global_step": 78497, "epoch": 648} {"train_loss": -37.643165588378906, "global_step": 78498, "epoch": 648} {"train_loss": -37.15675735473633, "global_step": 78499, "epoch": 648} {"train_loss": -35.56098175048828, "global_step": 78500, "epoch": 648} {"train_loss": -37.489593505859375, "global_step": 78501, "epoch": 648} {"train_loss": -37.60748291015625, "global_step": 78502, "epoch": 648} {"train_loss": -35.23762130737305, "global_step": 78503, "epoch": 648} {"train_loss": -36.819061279296875, "global_step": 78504, "epoch": 648} {"train_loss": -35.023040771484375, "global_step": 78505, "epoch": 648} {"train_loss": -35.353179931640625, "global_step": 78506, "epoch": 648} {"train_loss": -36.92805862426758, "global_step": 78507, "epoch": 648} {"train_loss": -37.323299407958984, "global_step": 78508, "epoch": 648} {"train_loss": -35.16428756713867, "global_step": 78509, "epoch": 648} {"train_loss": -37.22929000854492, "global_step": 78510, "epoch": 648} {"train_loss": -37.23786544799805, "global_step": 78511, "epoch": 648} {"train_loss": -36.41316604614258, "global_step": 78512, "epoch": 648} {"train_loss": -36.12616729736328, "global_step": 78513, "epoch": 648} {"train_loss": -36.891502380371094, "global_step": 78514, "epoch": 648} {"train_loss": -35.626102447509766, "global_step": 78515, "epoch": 648} {"train_loss": -36.710418701171875, "global_step": 78516, "epoch": 648} {"train_loss": -36.67408752441406, "global_step": 78517, "epoch": 648} {"train_loss": -36.445159912109375, "global_step": 78518, "epoch": 648} {"train_loss": -35.240623474121094, "global_step": 78519, "epoch": 648} {"train_loss": -36.46562576293945, "global_step": 78520, "epoch": 648} {"train_loss": -37.199134826660156, "global_step": 78521, "epoch": 648} {"train_loss": -36.389808654785156, "global_step": 78522, "epoch": 648} {"train_loss": -37.063392639160156, "global_step": 78523, "epoch": 648} {"train_loss": -36.28120040893555, "global_step": 78524, "epoch": 648} {"train_loss": -37.016876220703125, "global_step": 78525, "epoch": 648} {"train_loss": -37.23116683959961, "global_step": 78526, "epoch": 648} {"train_loss": -37.22740173339844, "global_step": 78527, "epoch": 648} {"train_loss": -36.72329024638026, "global_step": 78528, "epoch": 648, "val_loss": 2649855.0} {"train_loss": -37.25344467163086, "global_step": 78529, "epoch": 649} {"train_loss": -37.68320846557617, "global_step": 78530, "epoch": 649} {"train_loss": -36.98899459838867, "global_step": 78531, "epoch": 649} {"train_loss": -37.359493255615234, "global_step": 78532, "epoch": 649} {"train_loss": -37.723995208740234, "global_step": 78533, "epoch": 649} {"train_loss": -37.43174362182617, "global_step": 78534, "epoch": 649} {"train_loss": -37.68252182006836, "global_step": 78535, "epoch": 649} {"train_loss": -30.233158111572266, "global_step": 78536, "epoch": 649} {"train_loss": -36.58573532104492, "global_step": 78537, "epoch": 649} {"train_loss": -37.1518669128418, "global_step": 78538, "epoch": 649} {"train_loss": -36.72034454345703, "global_step": 78539, "epoch": 649} {"train_loss": -32.90763854980469, "global_step": 78540, "epoch": 649} {"train_loss": -33.17245864868164, "global_step": 78541, "epoch": 649} {"train_loss": -35.29105758666992, "global_step": 78542, "epoch": 649} {"train_loss": -36.35568618774414, "global_step": 78543, "epoch": 649} {"train_loss": -34.90626907348633, "global_step": 78544, "epoch": 649} {"train_loss": -32.69697189331055, "global_step": 78545, "epoch": 649} {"train_loss": -26.776403427124023, "global_step": 78546, "epoch": 649} {"train_loss": -32.155548095703125, "global_step": 78547, "epoch": 649} {"train_loss": -31.699995040893555, "global_step": 78548, "epoch": 649} {"train_loss": -19.51494026184082, "global_step": 78549, "epoch": 649} {"train_loss": -26.293806076049805, "global_step": 78550, "epoch": 649} {"train_loss": -28.1182861328125, "global_step": 78551, "epoch": 649} {"train_loss": -28.055866241455078, "global_step": 78552, "epoch": 649} {"train_loss": -29.313379287719727, "global_step": 78553, "epoch": 649} {"train_loss": -29.2825984954834, "global_step": 78554, "epoch": 649} {"train_loss": -30.736608505249023, "global_step": 78555, "epoch": 649} {"train_loss": -30.1083927154541, "global_step": 78556, "epoch": 649} {"train_loss": -28.263219833374023, "global_step": 78557, "epoch": 649} {"train_loss": -30.807056427001953, "global_step": 78558, "epoch": 649} {"train_loss": -30.39313316345215, "global_step": 78559, "epoch": 649} {"train_loss": -31.243574142456055, "global_step": 78560, "epoch": 649} {"train_loss": -30.0878963470459, "global_step": 78561, "epoch": 649} {"train_loss": -30.965377807617188, "global_step": 78562, "epoch": 649} {"train_loss": -31.91926383972168, "global_step": 78563, "epoch": 649} {"train_loss": -30.357141494750977, "global_step": 78564, "epoch": 649} {"train_loss": -32.25881576538086, "global_step": 78565, "epoch": 649} {"train_loss": -32.36085891723633, "global_step": 78566, "epoch": 649} {"train_loss": -31.286334991455078, "global_step": 78567, "epoch": 649} {"train_loss": -33.21957015991211, "global_step": 78568, "epoch": 649} {"train_loss": -32.075958251953125, "global_step": 78569, "epoch": 649} {"train_loss": -32.37786102294922, "global_step": 78570, "epoch": 649} {"train_loss": -32.85801315307617, "global_step": 78571, "epoch": 649} {"train_loss": -33.0714225769043, "global_step": 78572, "epoch": 649} {"train_loss": -33.46950912475586, "global_step": 78573, "epoch": 649} {"train_loss": -33.23596954345703, "global_step": 78574, "epoch": 649} {"train_loss": -33.931880950927734, "global_step": 78575, "epoch": 649} {"train_loss": -33.84979248046875, "global_step": 78576, "epoch": 649} {"train_loss": -32.8914680480957, "global_step": 78577, "epoch": 649} {"train_loss": -34.640663146972656, "global_step": 78578, "epoch": 649} {"train_loss": -33.93085861206055, "global_step": 78579, "epoch": 649} {"train_loss": -33.650630950927734, "global_step": 78580, "epoch": 649} {"train_loss": -34.36524200439453, "global_step": 78581, "epoch": 649} {"train_loss": -34.032711029052734, "global_step": 78582, "epoch": 649} {"train_loss": -34.08939743041992, "global_step": 78583, "epoch": 649} {"train_loss": -34.68545150756836, "global_step": 78584, "epoch": 649} {"train_loss": -34.449195861816406, "global_step": 78585, "epoch": 649} {"train_loss": -34.57619857788086, "global_step": 78586, "epoch": 649} {"train_loss": -34.63644027709961, "global_step": 78587, "epoch": 649} {"train_loss": -35.010345458984375, "global_step": 78588, "epoch": 649} {"train_loss": -34.89726638793945, "global_step": 78589, "epoch": 649} {"train_loss": -34.74074172973633, "global_step": 78590, "epoch": 649} {"train_loss": -34.60814666748047, "global_step": 78591, "epoch": 649} {"train_loss": -35.34560012817383, "global_step": 78592, "epoch": 649} {"train_loss": -34.79938507080078, "global_step": 78593, "epoch": 649} {"train_loss": -34.90609359741211, "global_step": 78594, "epoch": 649} {"train_loss": -34.86239242553711, "global_step": 78595, "epoch": 649} {"train_loss": -34.7645263671875, "global_step": 78596, "epoch": 649} {"train_loss": -35.385292053222656, "global_step": 78597, "epoch": 649} {"train_loss": -35.181148529052734, "global_step": 78598, "epoch": 649} {"train_loss": -34.69012451171875, "global_step": 78599, "epoch": 649} {"train_loss": -35.293907165527344, "global_step": 78600, "epoch": 649} {"train_loss": -35.60816955566406, "global_step": 78601, "epoch": 649} {"train_loss": -35.631587982177734, "global_step": 78602, "epoch": 649} {"train_loss": -34.841522216796875, "global_step": 78603, "epoch": 649} {"train_loss": -35.8150520324707, "global_step": 78604, "epoch": 649} {"train_loss": -35.33750534057617, "global_step": 78605, "epoch": 649} {"train_loss": -35.60038375854492, "global_step": 78606, "epoch": 649} {"train_loss": -35.7580451965332, "global_step": 78607, "epoch": 649} {"train_loss": -35.89238357543945, "global_step": 78608, "epoch": 649} {"train_loss": -35.956180572509766, "global_step": 78609, "epoch": 649} {"train_loss": -36.16958236694336, "global_step": 78610, "epoch": 649} {"train_loss": -35.657325744628906, "global_step": 78611, "epoch": 649} {"train_loss": -35.69233322143555, "global_step": 78612, "epoch": 649} {"train_loss": -35.905696868896484, "global_step": 78613, "epoch": 649} {"train_loss": -36.08986282348633, "global_step": 78614, "epoch": 649} {"train_loss": -36.22809982299805, "global_step": 78615, "epoch": 649} {"train_loss": -36.0067253112793, "global_step": 78616, "epoch": 649} {"train_loss": -36.320472717285156, "global_step": 78617, "epoch": 649} {"train_loss": -35.91677474975586, "global_step": 78618, "epoch": 649} {"train_loss": -36.29690170288086, "global_step": 78619, "epoch": 649} {"train_loss": -35.760066986083984, "global_step": 78620, "epoch": 649} {"train_loss": -36.3017578125, "global_step": 78621, "epoch": 649} {"train_loss": -36.17249298095703, "global_step": 78622, "epoch": 649} {"train_loss": -36.17280197143555, "global_step": 78623, "epoch": 649} {"train_loss": -35.9442253112793, "global_step": 78624, "epoch": 649} {"train_loss": -36.06928253173828, "global_step": 78625, "epoch": 649} {"train_loss": -35.78635025024414, "global_step": 78626, "epoch": 649} {"train_loss": -36.1630973815918, "global_step": 78627, "epoch": 649} {"train_loss": -36.2026252746582, "global_step": 78628, "epoch": 649} {"train_loss": -37.071022033691406, "global_step": 78629, "epoch": 649} {"train_loss": -36.788021087646484, "global_step": 78630, "epoch": 649} {"train_loss": -36.58225631713867, "global_step": 78631, "epoch": 649} {"train_loss": -36.580745697021484, "global_step": 78632, "epoch": 649} {"train_loss": -36.614418029785156, "global_step": 78633, "epoch": 649} {"train_loss": -36.71894073486328, "global_step": 78634, "epoch": 649} {"train_loss": -36.661041259765625, "global_step": 78635, "epoch": 649} {"train_loss": -37.12471389770508, "global_step": 78636, "epoch": 649} {"train_loss": -36.75973129272461, "global_step": 78637, "epoch": 649} {"train_loss": -36.572509765625, "global_step": 78638, "epoch": 649} {"train_loss": -37.0179328918457, "global_step": 78639, "epoch": 649} {"train_loss": -37.02817916870117, "global_step": 78640, "epoch": 649} {"train_loss": -37.12638473510742, "global_step": 78641, "epoch": 649} {"train_loss": -36.992488861083984, "global_step": 78642, "epoch": 649} {"train_loss": -36.64723587036133, "global_step": 78643, "epoch": 649} {"train_loss": -36.68215560913086, "global_step": 78644, "epoch": 649} {"train_loss": -36.81072998046875, "global_step": 78645, "epoch": 649} {"train_loss": -36.74820327758789, "global_step": 78646, "epoch": 649} {"train_loss": -36.511253356933594, "global_step": 78647, "epoch": 649} {"train_loss": -36.98069381713867, "global_step": 78648, "epoch": 649} {"train_loss": -34.43437005665677, "global_step": 78649, "epoch": 649, "val_loss": 2630905.75} {"train_loss": -35.79348373413086, "global_step": 78650, "epoch": 650} {"train_loss": -35.57625961303711, "global_step": 78651, "epoch": 650} {"train_loss": -36.4055290222168, "global_step": 78652, "epoch": 650} {"train_loss": -36.99262619018555, "global_step": 78653, "epoch": 650} {"train_loss": -35.34513854980469, "global_step": 78654, "epoch": 650} {"train_loss": -36.022377014160156, "global_step": 78655, "epoch": 650} {"train_loss": -36.717220306396484, "global_step": 78656, "epoch": 650} {"train_loss": -36.07625198364258, "global_step": 78657, "epoch": 650} {"train_loss": -36.540489196777344, "global_step": 78658, "epoch": 650} {"train_loss": -36.787593841552734, "global_step": 78659, "epoch": 650} {"train_loss": -36.7424430847168, "global_step": 78660, "epoch": 650} {"train_loss": -35.671443939208984, "global_step": 78661, "epoch": 650} {"train_loss": -32.83412551879883, "global_step": 78662, "epoch": 650} {"train_loss": -32.89278793334961, "global_step": 78663, "epoch": 650} {"train_loss": -33.12180709838867, "global_step": 78664, "epoch": 650} {"train_loss": -26.04976463317871, "global_step": 78665, "epoch": 650} {"train_loss": -37.2419548034668, "global_step": 78666, "epoch": 650} {"train_loss": -27.4382381439209, "global_step": 78667, "epoch": 650} {"train_loss": -36.95984649658203, "global_step": 78668, "epoch": 650} {"train_loss": -29.017562866210938, "global_step": 78669, "epoch": 650} {"train_loss": -36.494773864746094, "global_step": 78670, "epoch": 650} {"train_loss": -32.14545822143555, "global_step": 78671, "epoch": 650} {"train_loss": -34.02519226074219, "global_step": 78672, "epoch": 650} {"train_loss": -36.668373107910156, "global_step": 78673, "epoch": 650} {"train_loss": -35.39010238647461, "global_step": 78674, "epoch": 650} {"train_loss": -35.370304107666016, "global_step": 78675, "epoch": 650} {"train_loss": -36.02592849731445, "global_step": 78676, "epoch": 650} {"train_loss": -36.26992416381836, "global_step": 78677, "epoch": 650} {"train_loss": -35.4218864440918, "global_step": 78678, "epoch": 650} {"train_loss": -36.54742431640625, "global_step": 78679, "epoch": 650} {"train_loss": -35.762508392333984, "global_step": 78680, "epoch": 650} {"train_loss": -36.65763473510742, "global_step": 78681, "epoch": 650} {"train_loss": -35.78952407836914, "global_step": 78682, "epoch": 650} {"train_loss": -36.79216384887695, "global_step": 78683, "epoch": 650} {"train_loss": -35.948638916015625, "global_step": 78684, "epoch": 650} {"train_loss": -35.7425651550293, "global_step": 78685, "epoch": 650} {"train_loss": -36.63758087158203, "global_step": 78686, "epoch": 650} {"train_loss": -36.24216842651367, "global_step": 78687, "epoch": 650} {"train_loss": -36.24251174926758, "global_step": 78688, "epoch": 650} {"train_loss": -36.21405792236328, "global_step": 78689, "epoch": 650} {"train_loss": -36.630008697509766, "global_step": 78690, "epoch": 650} {"train_loss": -36.86249923706055, "global_step": 78691, "epoch": 650} {"train_loss": -37.36517333984375, "global_step": 78692, "epoch": 650} {"train_loss": -36.294219970703125, "global_step": 78693, "epoch": 650} {"train_loss": -36.39873123168945, "global_step": 78694, "epoch": 650} {"train_loss": -36.77125930786133, "global_step": 78695, "epoch": 650} {"train_loss": -36.032161712646484, "global_step": 78696, "epoch": 650} {"train_loss": -36.80393981933594, "global_step": 78697, "epoch": 650} {"train_loss": -36.49733352661133, "global_step": 78698, "epoch": 650} {"train_loss": -37.091129302978516, "global_step": 78699, "epoch": 650} {"train_loss": -36.788665771484375, "global_step": 78700, "epoch": 650} {"train_loss": -36.808448791503906, "global_step": 78701, "epoch": 650} {"train_loss": -36.845394134521484, "global_step": 78702, "epoch": 650} {"train_loss": -37.057220458984375, "global_step": 78703, "epoch": 650} {"train_loss": -37.501678466796875, "global_step": 78704, "epoch": 650} {"train_loss": -37.28853225708008, "global_step": 78705, "epoch": 650} {"train_loss": -37.47255325317383, "global_step": 78706, "epoch": 650} {"train_loss": -37.838558197021484, "global_step": 78707, "epoch": 650} {"train_loss": -37.472259521484375, "global_step": 78708, "epoch": 650} {"train_loss": -36.9323844909668, "global_step": 78709, "epoch": 650} {"train_loss": -37.984256744384766, "global_step": 78710, "epoch": 650} {"train_loss": -37.53955841064453, "global_step": 78711, "epoch": 650} {"train_loss": -37.465267181396484, "global_step": 78712, "epoch": 650} {"train_loss": -37.61678695678711, "global_step": 78713, "epoch": 650} {"train_loss": -37.16804122924805, "global_step": 78714, "epoch": 650} {"train_loss": -37.48042678833008, "global_step": 78715, "epoch": 650} {"train_loss": -37.34143829345703, "global_step": 78716, "epoch": 650} {"train_loss": -36.81461715698242, "global_step": 78717, "epoch": 650} {"train_loss": -36.504756927490234, "global_step": 78718, "epoch": 650} {"train_loss": -36.67964172363281, "global_step": 78719, "epoch": 650} {"train_loss": -36.291236877441406, "global_step": 78720, "epoch": 650} {"train_loss": -36.96530532836914, "global_step": 78721, "epoch": 650} {"train_loss": -37.188636779785156, "global_step": 78722, "epoch": 650} {"train_loss": -37.400325775146484, "global_step": 78723, "epoch": 650} {"train_loss": -36.476810455322266, "global_step": 78724, "epoch": 650} {"train_loss": -37.607181549072266, "global_step": 78725, "epoch": 650} {"train_loss": -38.10313034057617, "global_step": 78726, "epoch": 650} {"train_loss": -37.39667510986328, "global_step": 78727, "epoch": 650} {"train_loss": -37.54555130004883, "global_step": 78728, "epoch": 650} {"train_loss": -37.79898452758789, "global_step": 78729, "epoch": 650} {"train_loss": -37.94326400756836, "global_step": 78730, "epoch": 650} {"train_loss": -37.1427116394043, "global_step": 78731, "epoch": 650} {"train_loss": -38.09358215332031, "global_step": 78732, "epoch": 650} {"train_loss": -37.67074203491211, "global_step": 78733, "epoch": 650} {"train_loss": -36.664180755615234, "global_step": 78734, "epoch": 650} {"train_loss": -34.69097900390625, "global_step": 78735, "epoch": 650} {"train_loss": -33.09572982788086, "global_step": 78736, "epoch": 650} {"train_loss": -36.83414840698242, "global_step": 78737, "epoch": 650} {"train_loss": -37.289825439453125, "global_step": 78738, "epoch": 650} {"train_loss": -37.29890823364258, "global_step": 78739, "epoch": 650} {"train_loss": -36.3400993347168, "global_step": 78740, "epoch": 650} {"train_loss": -35.45412063598633, "global_step": 78741, "epoch": 650} {"train_loss": -37.0576286315918, "global_step": 78742, "epoch": 650} {"train_loss": -37.827327728271484, "global_step": 78743, "epoch": 650} {"train_loss": -36.9268913269043, "global_step": 78744, "epoch": 650} {"train_loss": -37.2084846496582, "global_step": 78745, "epoch": 650} {"train_loss": -34.31062316894531, "global_step": 78746, "epoch": 650} {"train_loss": -37.28373336791992, "global_step": 78747, "epoch": 650} {"train_loss": -38.136837005615234, "global_step": 78748, "epoch": 650} {"train_loss": -36.24176025390625, "global_step": 78749, "epoch": 650} {"train_loss": -36.8157958984375, "global_step": 78750, "epoch": 650} {"train_loss": -37.140625, "global_step": 78751, "epoch": 650} {"train_loss": -35.430519104003906, "global_step": 78752, "epoch": 650} {"train_loss": -35.77337646484375, "global_step": 78753, "epoch": 650} {"train_loss": -34.871376037597656, "global_step": 78754, "epoch": 650} {"train_loss": -33.80313491821289, "global_step": 78755, "epoch": 650} {"train_loss": -35.79240036010742, "global_step": 78756, "epoch": 650} {"train_loss": -36.6725959777832, "global_step": 78757, "epoch": 650} {"train_loss": -36.72460174560547, "global_step": 78758, "epoch": 650} {"train_loss": -36.55400085449219, "global_step": 78759, "epoch": 650} {"train_loss": -36.727840423583984, "global_step": 78760, "epoch": 650} {"train_loss": -36.00376510620117, "global_step": 78761, "epoch": 650} {"train_loss": -36.96588897705078, "global_step": 78762, "epoch": 650} {"train_loss": -37.373756408691406, "global_step": 78763, "epoch": 650} {"train_loss": -36.47265625, "global_step": 78764, "epoch": 650} {"train_loss": -36.810302734375, "global_step": 78765, "epoch": 650} {"train_loss": -36.9839973449707, "global_step": 78766, "epoch": 650} {"train_loss": -37.190975189208984, "global_step": 78767, "epoch": 650} {"train_loss": -36.163299560546875, "global_step": 78768, "epoch": 650} {"train_loss": -37.510005950927734, "global_step": 78769, "epoch": 650} {"train_loss": -36.27181950088375, "global_step": 78770, "epoch": 650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2764560.5} {"train_loss": -37.4161376953125, "global_step": 78771, "epoch": 651} {"train_loss": -36.926185607910156, "global_step": 78772, "epoch": 651} {"train_loss": -37.04779052734375, "global_step": 78773, "epoch": 651} {"train_loss": -35.472084045410156, "global_step": 78774, "epoch": 651} {"train_loss": -37.09001159667969, "global_step": 78775, "epoch": 651} {"train_loss": -35.75859451293945, "global_step": 78776, "epoch": 651} {"train_loss": -37.29729080200195, "global_step": 78777, "epoch": 651} {"train_loss": -37.30884552001953, "global_step": 78778, "epoch": 651} {"train_loss": -37.63063430786133, "global_step": 78779, "epoch": 651} {"train_loss": -34.7137451171875, "global_step": 78780, "epoch": 651} {"train_loss": -37.30202865600586, "global_step": 78781, "epoch": 651} {"train_loss": -36.80324935913086, "global_step": 78782, "epoch": 651} {"train_loss": -37.97992706298828, "global_step": 78783, "epoch": 651} {"train_loss": -36.16975021362305, "global_step": 78784, "epoch": 651} {"train_loss": -36.5699462890625, "global_step": 78785, "epoch": 651} {"train_loss": -37.1191520690918, "global_step": 78786, "epoch": 651} {"train_loss": -36.7107048034668, "global_step": 78787, "epoch": 651} {"train_loss": -36.20976638793945, "global_step": 78788, "epoch": 651} {"train_loss": -35.9939079284668, "global_step": 78789, "epoch": 651} {"train_loss": -34.745391845703125, "global_step": 78790, "epoch": 651} {"train_loss": -36.10600662231445, "global_step": 78791, "epoch": 651} {"train_loss": -34.87070846557617, "global_step": 78792, "epoch": 651} {"train_loss": -36.237091064453125, "global_step": 78793, "epoch": 651} {"train_loss": -36.58295822143555, "global_step": 78794, "epoch": 651} {"train_loss": -35.0305061340332, "global_step": 78795, "epoch": 651} {"train_loss": -35.829097747802734, "global_step": 78796, "epoch": 651} {"train_loss": -34.8841438293457, "global_step": 78797, "epoch": 651} {"train_loss": -37.39790725708008, "global_step": 78798, "epoch": 651} {"train_loss": -36.22553634643555, "global_step": 78799, "epoch": 651} {"train_loss": -34.51713943481445, "global_step": 78800, "epoch": 651} {"train_loss": -34.44844436645508, "global_step": 78801, "epoch": 651} {"train_loss": -34.47817611694336, "global_step": 78802, "epoch": 651} {"train_loss": -35.96524429321289, "global_step": 78803, "epoch": 651} {"train_loss": -33.7471923828125, "global_step": 78804, "epoch": 651} {"train_loss": -32.70921325683594, "global_step": 78805, "epoch": 651} {"train_loss": -34.104248046875, "global_step": 78806, "epoch": 651} {"train_loss": -35.67140197753906, "global_step": 78807, "epoch": 651} {"train_loss": -32.827720642089844, "global_step": 78808, "epoch": 651} {"train_loss": -34.87559509277344, "global_step": 78809, "epoch": 651} {"train_loss": -35.84709548950195, "global_step": 78810, "epoch": 651} {"train_loss": -33.68117904663086, "global_step": 78811, "epoch": 651} {"train_loss": -35.97993087768555, "global_step": 78812, "epoch": 651} {"train_loss": -34.188777923583984, "global_step": 78813, "epoch": 651} {"train_loss": -34.808292388916016, "global_step": 78814, "epoch": 651} {"train_loss": -35.177696228027344, "global_step": 78815, "epoch": 651} {"train_loss": -35.722469329833984, "global_step": 78816, "epoch": 651} {"train_loss": -35.7757568359375, "global_step": 78817, "epoch": 651} {"train_loss": -36.16071319580078, "global_step": 78818, "epoch": 651} {"train_loss": -36.672889709472656, "global_step": 78819, "epoch": 651} {"train_loss": -35.62575912475586, "global_step": 78820, "epoch": 651} {"train_loss": -35.95808410644531, "global_step": 78821, "epoch": 651} {"train_loss": -36.61307907104492, "global_step": 78822, "epoch": 651} {"train_loss": -35.89445114135742, "global_step": 78823, "epoch": 651} {"train_loss": -36.911006927490234, "global_step": 78824, "epoch": 651} {"train_loss": -36.240291595458984, "global_step": 78825, "epoch": 651} {"train_loss": -36.38203048706055, "global_step": 78826, "epoch": 651} {"train_loss": -36.88916015625, "global_step": 78827, "epoch": 651} {"train_loss": -36.8043098449707, "global_step": 78828, "epoch": 651} {"train_loss": -36.80316162109375, "global_step": 78829, "epoch": 651} {"train_loss": -37.12544631958008, "global_step": 78830, "epoch": 651} {"train_loss": -37.33172607421875, "global_step": 78831, "epoch": 651} {"train_loss": -37.24392318725586, "global_step": 78832, "epoch": 651} {"train_loss": -36.76667022705078, "global_step": 78833, "epoch": 651} {"train_loss": -36.12516403198242, "global_step": 78834, "epoch": 651} {"train_loss": -35.948787689208984, "global_step": 78835, "epoch": 651} {"train_loss": -36.585689544677734, "global_step": 78836, "epoch": 651} {"train_loss": -36.98558807373047, "global_step": 78837, "epoch": 651} {"train_loss": -37.455142974853516, "global_step": 78838, "epoch": 651} {"train_loss": -36.69222640991211, "global_step": 78839, "epoch": 651} {"train_loss": -37.23006820678711, "global_step": 78840, "epoch": 651} {"train_loss": -36.75521469116211, "global_step": 78841, "epoch": 651} {"train_loss": -37.15553283691406, "global_step": 78842, "epoch": 651} {"train_loss": -37.09033203125, "global_step": 78843, "epoch": 651} {"train_loss": -37.081356048583984, "global_step": 78844, "epoch": 651} {"train_loss": -37.72426223754883, "global_step": 78845, "epoch": 651} {"train_loss": -37.545135498046875, "global_step": 78846, "epoch": 651} {"train_loss": -37.42327117919922, "global_step": 78847, "epoch": 651} {"train_loss": -37.54073715209961, "global_step": 78848, "epoch": 651} {"train_loss": -37.08926773071289, "global_step": 78849, "epoch": 651} {"train_loss": -36.748470306396484, "global_step": 78850, "epoch": 651} {"train_loss": -37.25014877319336, "global_step": 78851, "epoch": 651} {"train_loss": -37.80192184448242, "global_step": 78852, "epoch": 651} {"train_loss": -37.50104904174805, "global_step": 78853, "epoch": 651} {"train_loss": -37.42281723022461, "global_step": 78854, "epoch": 651} {"train_loss": -37.949798583984375, "global_step": 78855, "epoch": 651} {"train_loss": -37.57827377319336, "global_step": 78856, "epoch": 651} {"train_loss": -37.204689025878906, "global_step": 78857, "epoch": 651} {"train_loss": -37.0782356262207, "global_step": 78858, "epoch": 651} {"train_loss": -38.22478103637695, "global_step": 78859, "epoch": 651} {"train_loss": -36.821468353271484, "global_step": 78860, "epoch": 651} {"train_loss": -37.180885314941406, "global_step": 78861, "epoch": 651} {"train_loss": -37.53679275512695, "global_step": 78862, "epoch": 651} {"train_loss": -37.264808654785156, "global_step": 78863, "epoch": 651} {"train_loss": -38.0426025390625, "global_step": 78864, "epoch": 651} {"train_loss": -37.9698600769043, "global_step": 78865, "epoch": 651} {"train_loss": -38.17609786987305, "global_step": 78866, "epoch": 651} {"train_loss": -38.15376663208008, "global_step": 78867, "epoch": 651} {"train_loss": -38.40578079223633, "global_step": 78868, "epoch": 651} {"train_loss": -37.55097579956055, "global_step": 78869, "epoch": 651} {"train_loss": -37.9806022644043, "global_step": 78870, "epoch": 651} {"train_loss": -38.315399169921875, "global_step": 78871, "epoch": 651} {"train_loss": -37.92509078979492, "global_step": 78872, "epoch": 651} {"train_loss": -37.950008392333984, "global_step": 78873, "epoch": 651} {"train_loss": -37.57713317871094, "global_step": 78874, "epoch": 651} {"train_loss": -37.339717864990234, "global_step": 78875, "epoch": 651} {"train_loss": -36.074859619140625, "global_step": 78876, "epoch": 651} {"train_loss": -38.43666458129883, "global_step": 78877, "epoch": 651} {"train_loss": -38.182167053222656, "global_step": 78878, "epoch": 651} {"train_loss": -37.53353500366211, "global_step": 78879, "epoch": 651} {"train_loss": -37.27322006225586, "global_step": 78880, "epoch": 651} {"train_loss": -37.61411666870117, "global_step": 78881, "epoch": 651} {"train_loss": -37.75922775268555, "global_step": 78882, "epoch": 651} {"train_loss": -36.64410400390625, "global_step": 78883, "epoch": 651} {"train_loss": -36.304256439208984, "global_step": 78884, "epoch": 651} {"train_loss": -36.57082748413086, "global_step": 78885, "epoch": 651} {"train_loss": -37.5626335144043, "global_step": 78886, "epoch": 651} {"train_loss": -35.546932220458984, "global_step": 78887, "epoch": 651} {"train_loss": -36.05732345581055, "global_step": 78888, "epoch": 651} {"train_loss": -37.42046356201172, "global_step": 78889, "epoch": 651} {"train_loss": -37.136077880859375, "global_step": 78890, "epoch": 651} {"train_loss": -36.587951092680626, "global_step": 78891, "epoch": 651, "val_loss": 2547380.0} {"train_loss": -31.665725708007812, "global_step": 78892, "epoch": 652} {"train_loss": -28.723758697509766, "global_step": 78893, "epoch": 652} {"train_loss": -32.869625091552734, "global_step": 78894, "epoch": 652} {"train_loss": -36.5282096862793, "global_step": 78895, "epoch": 652} {"train_loss": -33.82903289794922, "global_step": 78896, "epoch": 652} {"train_loss": -34.451011657714844, "global_step": 78897, "epoch": 652} {"train_loss": -37.0594596862793, "global_step": 78898, "epoch": 652} {"train_loss": -35.840179443359375, "global_step": 78899, "epoch": 652} {"train_loss": -34.42670822143555, "global_step": 78900, "epoch": 652} {"train_loss": -36.85456466674805, "global_step": 78901, "epoch": 652} {"train_loss": -36.38428497314453, "global_step": 78902, "epoch": 652} {"train_loss": -35.9171142578125, "global_step": 78903, "epoch": 652} {"train_loss": -37.207977294921875, "global_step": 78904, "epoch": 652} {"train_loss": -35.42610549926758, "global_step": 78905, "epoch": 652} {"train_loss": -36.750606536865234, "global_step": 78906, "epoch": 652} {"train_loss": -35.8135871887207, "global_step": 78907, "epoch": 652} {"train_loss": -35.26710891723633, "global_step": 78908, "epoch": 652} {"train_loss": -36.01235580444336, "global_step": 78909, "epoch": 652} {"train_loss": -35.9416389465332, "global_step": 78910, "epoch": 652} {"train_loss": -36.745513916015625, "global_step": 78911, "epoch": 652} {"train_loss": -35.81044387817383, "global_step": 78912, "epoch": 652} {"train_loss": -37.584442138671875, "global_step": 78913, "epoch": 652} {"train_loss": -34.35906982421875, "global_step": 78914, "epoch": 652} {"train_loss": -37.12946319580078, "global_step": 78915, "epoch": 652} {"train_loss": -36.11080551147461, "global_step": 78916, "epoch": 652} {"train_loss": -36.98421859741211, "global_step": 78917, "epoch": 652} {"train_loss": -36.55126953125, "global_step": 78918, "epoch": 652} {"train_loss": -37.4342041015625, "global_step": 78919, "epoch": 652} {"train_loss": -37.07685470581055, "global_step": 78920, "epoch": 652} {"train_loss": -37.113037109375, "global_step": 78921, "epoch": 652} {"train_loss": -36.42635726928711, "global_step": 78922, "epoch": 652} {"train_loss": -37.6493034362793, "global_step": 78923, "epoch": 652} {"train_loss": -36.766578674316406, "global_step": 78924, "epoch": 652} {"train_loss": -37.4459342956543, "global_step": 78925, "epoch": 652} {"train_loss": -37.28718948364258, "global_step": 78926, "epoch": 652} {"train_loss": -37.82843017578125, "global_step": 78927, "epoch": 652} {"train_loss": -37.27753448486328, "global_step": 78928, "epoch": 652} {"train_loss": -37.59064483642578, "global_step": 78929, "epoch": 652} {"train_loss": -37.550689697265625, "global_step": 78930, "epoch": 652} {"train_loss": -37.60923767089844, "global_step": 78931, "epoch": 652} {"train_loss": -38.00418472290039, "global_step": 78932, "epoch": 652} {"train_loss": -37.892616271972656, "global_step": 78933, "epoch": 652} {"train_loss": -36.882362365722656, "global_step": 78934, "epoch": 652} {"train_loss": -37.794551849365234, "global_step": 78935, "epoch": 652} {"train_loss": -37.23011779785156, "global_step": 78936, "epoch": 652} {"train_loss": -37.714378356933594, "global_step": 78937, "epoch": 652} {"train_loss": -38.026710510253906, "global_step": 78938, "epoch": 652} {"train_loss": -37.46670913696289, "global_step": 78939, "epoch": 652} {"train_loss": -38.19144821166992, "global_step": 78940, "epoch": 652} {"train_loss": -38.232421875, "global_step": 78941, "epoch": 652} {"train_loss": -37.92873001098633, "global_step": 78942, "epoch": 652} {"train_loss": -38.03731918334961, "global_step": 78943, "epoch": 652} {"train_loss": -38.12526321411133, "global_step": 78944, "epoch": 652} {"train_loss": -37.773372650146484, "global_step": 78945, "epoch": 652} {"train_loss": -37.51460266113281, "global_step": 78946, "epoch": 652} {"train_loss": -37.59485626220703, "global_step": 78947, "epoch": 652} {"train_loss": -38.27385330200195, "global_step": 78948, "epoch": 652} {"train_loss": -38.1351432800293, "global_step": 78949, "epoch": 652} {"train_loss": -38.21142578125, "global_step": 78950, "epoch": 652} {"train_loss": -37.81583786010742, "global_step": 78951, "epoch": 652} {"train_loss": -38.388465881347656, "global_step": 78952, "epoch": 652} {"train_loss": -38.115447998046875, "global_step": 78953, "epoch": 652} {"train_loss": -38.045806884765625, "global_step": 78954, "epoch": 652} {"train_loss": -37.5877799987793, "global_step": 78955, "epoch": 652} {"train_loss": -37.661041259765625, "global_step": 78956, "epoch": 652} {"train_loss": -38.211029052734375, "global_step": 78957, "epoch": 652} {"train_loss": -37.93872833251953, "global_step": 78958, "epoch": 652} {"train_loss": -37.7859001159668, "global_step": 78959, "epoch": 652} {"train_loss": -37.8531494140625, "global_step": 78960, "epoch": 652} {"train_loss": -37.762123107910156, "global_step": 78961, "epoch": 652} {"train_loss": -37.69136047363281, "global_step": 78962, "epoch": 652} {"train_loss": -37.10602951049805, "global_step": 78963, "epoch": 652} {"train_loss": -38.33430099487305, "global_step": 78964, "epoch": 652} {"train_loss": -37.03527069091797, "global_step": 78965, "epoch": 652} {"train_loss": -36.460750579833984, "global_step": 78966, "epoch": 652} {"train_loss": -36.45743942260742, "global_step": 78967, "epoch": 652} {"train_loss": -37.318565368652344, "global_step": 78968, "epoch": 652} {"train_loss": -37.48143768310547, "global_step": 78969, "epoch": 652} {"train_loss": -38.00721740722656, "global_step": 78970, "epoch": 652} {"train_loss": -38.01753234863281, "global_step": 78971, "epoch": 652} {"train_loss": -37.90592575073242, "global_step": 78972, "epoch": 652} {"train_loss": -37.68654251098633, "global_step": 78973, "epoch": 652} {"train_loss": -37.06986618041992, "global_step": 78974, "epoch": 652} {"train_loss": -38.157875061035156, "global_step": 78975, "epoch": 652} {"train_loss": -37.67075729370117, "global_step": 78976, "epoch": 652} {"train_loss": -36.29082107543945, "global_step": 78977, "epoch": 652} {"train_loss": -37.389915466308594, "global_step": 78978, "epoch": 652} {"train_loss": -38.22544479370117, "global_step": 78979, "epoch": 652} {"train_loss": -36.61921310424805, "global_step": 78980, "epoch": 652} {"train_loss": -37.4171257019043, "global_step": 78981, "epoch": 652} {"train_loss": -38.3463249206543, "global_step": 78982, "epoch": 652} {"train_loss": -38.29146957397461, "global_step": 78983, "epoch": 652} {"train_loss": -36.85825729370117, "global_step": 78984, "epoch": 652} {"train_loss": -37.14430618286133, "global_step": 78985, "epoch": 652} {"train_loss": -37.57245635986328, "global_step": 78986, "epoch": 652} {"train_loss": -37.48401641845703, "global_step": 78987, "epoch": 652} {"train_loss": -37.55835723876953, "global_step": 78988, "epoch": 652} {"train_loss": -37.010982513427734, "global_step": 78989, "epoch": 652} {"train_loss": -34.783504486083984, "global_step": 78990, "epoch": 652} {"train_loss": -35.319618225097656, "global_step": 78991, "epoch": 652} {"train_loss": -35.68764877319336, "global_step": 78992, "epoch": 652} {"train_loss": -36.06813430786133, "global_step": 78993, "epoch": 652} {"train_loss": -37.10957717895508, "global_step": 78994, "epoch": 652} {"train_loss": -37.277320861816406, "global_step": 78995, "epoch": 652} {"train_loss": -36.66067123413086, "global_step": 78996, "epoch": 652} {"train_loss": -37.420127868652344, "global_step": 78997, "epoch": 652} {"train_loss": -37.17923355102539, "global_step": 78998, "epoch": 652} {"train_loss": -37.18060302734375, "global_step": 78999, "epoch": 652} {"train_loss": -36.55066680908203, "global_step": 79000, "epoch": 652} {"train_loss": -37.110328674316406, "global_step": 79001, "epoch": 652} {"train_loss": -37.720760345458984, "global_step": 79002, "epoch": 652} {"train_loss": -37.0751838684082, "global_step": 79003, "epoch": 652} {"train_loss": -38.125709533691406, "global_step": 79004, "epoch": 652} {"train_loss": -36.892391204833984, "global_step": 79005, "epoch": 652} {"train_loss": -37.23102951049805, "global_step": 79006, "epoch": 652} {"train_loss": -36.42932891845703, "global_step": 79007, "epoch": 652} {"train_loss": -37.655357360839844, "global_step": 79008, "epoch": 652} {"train_loss": -36.371360778808594, "global_step": 79009, "epoch": 652} {"train_loss": -37.58564376831055, "global_step": 79010, "epoch": 652} {"train_loss": -36.76473617553711, "global_step": 79011, "epoch": 652} {"train_loss": -36.98472343003454, "global_step": 79012, "epoch": 652, "val_loss": 2532014.75} {"train_loss": -37.311771392822266, "global_step": 79013, "epoch": 653} {"train_loss": -37.58154296875, "global_step": 79014, "epoch": 653} {"train_loss": -37.138858795166016, "global_step": 79015, "epoch": 653} {"train_loss": -37.72504806518555, "global_step": 79016, "epoch": 653} {"train_loss": -36.11127471923828, "global_step": 79017, "epoch": 653} {"train_loss": -36.20531463623047, "global_step": 79018, "epoch": 653} {"train_loss": -37.13611602783203, "global_step": 79019, "epoch": 653} {"train_loss": -36.763729095458984, "global_step": 79020, "epoch": 653} {"train_loss": -36.486629486083984, "global_step": 79021, "epoch": 653} {"train_loss": -36.92794418334961, "global_step": 79022, "epoch": 653} {"train_loss": -37.131591796875, "global_step": 79023, "epoch": 653} {"train_loss": -37.992427825927734, "global_step": 79024, "epoch": 653} {"train_loss": -37.04834747314453, "global_step": 79025, "epoch": 653} {"train_loss": -36.13666915893555, "global_step": 79026, "epoch": 653} {"train_loss": -38.270835876464844, "global_step": 79027, "epoch": 653} {"train_loss": -36.313575744628906, "global_step": 79028, "epoch": 653} {"train_loss": -35.606685638427734, "global_step": 79029, "epoch": 653} {"train_loss": -37.65963363647461, "global_step": 79030, "epoch": 653} {"train_loss": -37.4729118347168, "global_step": 79031, "epoch": 653} {"train_loss": -36.388816833496094, "global_step": 79032, "epoch": 653} {"train_loss": -36.84565353393555, "global_step": 79033, "epoch": 653} {"train_loss": -37.33246612548828, "global_step": 79034, "epoch": 653} {"train_loss": -36.48829650878906, "global_step": 79035, "epoch": 653} {"train_loss": -37.27314758300781, "global_step": 79036, "epoch": 653} {"train_loss": -37.51781463623047, "global_step": 79037, "epoch": 653} {"train_loss": -36.40471267700195, "global_step": 79038, "epoch": 653} {"train_loss": -37.202178955078125, "global_step": 79039, "epoch": 653} {"train_loss": -37.78948974609375, "global_step": 79040, "epoch": 653} {"train_loss": -38.36130905151367, "global_step": 79041, "epoch": 653} {"train_loss": -37.47557830810547, "global_step": 79042, "epoch": 653} {"train_loss": -38.0055046081543, "global_step": 79043, "epoch": 653} {"train_loss": -37.92592239379883, "global_step": 79044, "epoch": 653} {"train_loss": -38.146976470947266, "global_step": 79045, "epoch": 653} {"train_loss": -38.366981506347656, "global_step": 79046, "epoch": 653} {"train_loss": -37.787349700927734, "global_step": 79047, "epoch": 653} {"train_loss": -38.498836517333984, "global_step": 79048, "epoch": 653} {"train_loss": -37.32375717163086, "global_step": 79049, "epoch": 653} {"train_loss": -37.96769332885742, "global_step": 79050, "epoch": 653} {"train_loss": -37.62119674682617, "global_step": 79051, "epoch": 653} {"train_loss": -38.113441467285156, "global_step": 79052, "epoch": 653} {"train_loss": -37.392059326171875, "global_step": 79053, "epoch": 653} {"train_loss": -37.97303771972656, "global_step": 79054, "epoch": 653} {"train_loss": -38.03646469116211, "global_step": 79055, "epoch": 653} {"train_loss": -38.16788864135742, "global_step": 79056, "epoch": 653} {"train_loss": -37.24278259277344, "global_step": 79057, "epoch": 653} {"train_loss": -36.25956344604492, "global_step": 79058, "epoch": 653} {"train_loss": -34.42102813720703, "global_step": 79059, "epoch": 653} {"train_loss": -32.816463470458984, "global_step": 79060, "epoch": 653} {"train_loss": -31.78205680847168, "global_step": 79061, "epoch": 653} {"train_loss": -32.86213302612305, "global_step": 79062, "epoch": 653} {"train_loss": -37.22733688354492, "global_step": 79063, "epoch": 653} {"train_loss": -34.97993850708008, "global_step": 79064, "epoch": 653} {"train_loss": -34.877349853515625, "global_step": 79065, "epoch": 653} {"train_loss": -30.463886260986328, "global_step": 79066, "epoch": 653} {"train_loss": -29.762821197509766, "global_step": 79067, "epoch": 653} {"train_loss": -35.68413162231445, "global_step": 79068, "epoch": 653} {"train_loss": -29.804468154907227, "global_step": 79069, "epoch": 653} {"train_loss": -34.36372756958008, "global_step": 79070, "epoch": 653} {"train_loss": -34.93571090698242, "global_step": 79071, "epoch": 653} {"train_loss": -33.913883209228516, "global_step": 79072, "epoch": 653} {"train_loss": -37.33002853393555, "global_step": 79073, "epoch": 653} {"train_loss": -35.1805534362793, "global_step": 79074, "epoch": 653} {"train_loss": -37.07167053222656, "global_step": 79075, "epoch": 653} {"train_loss": -36.17754364013672, "global_step": 79076, "epoch": 653} {"train_loss": -36.8256721496582, "global_step": 79077, "epoch": 653} {"train_loss": -36.353450775146484, "global_step": 79078, "epoch": 653} {"train_loss": -36.9124870300293, "global_step": 79079, "epoch": 653} {"train_loss": -36.24256134033203, "global_step": 79080, "epoch": 653} {"train_loss": -37.30410385131836, "global_step": 79081, "epoch": 653} {"train_loss": -36.36396408081055, "global_step": 79082, "epoch": 653} {"train_loss": -37.156490325927734, "global_step": 79083, "epoch": 653} {"train_loss": -36.887020111083984, "global_step": 79084, "epoch": 653} {"train_loss": -37.327545166015625, "global_step": 79085, "epoch": 653} {"train_loss": -37.55149459838867, "global_step": 79086, "epoch": 653} {"train_loss": -37.2431755065918, "global_step": 79087, "epoch": 653} {"train_loss": -37.30867004394531, "global_step": 79088, "epoch": 653} {"train_loss": -37.288330078125, "global_step": 79089, "epoch": 653} {"train_loss": -37.71236801147461, "global_step": 79090, "epoch": 653} {"train_loss": -37.758296966552734, "global_step": 79091, "epoch": 653} {"train_loss": -37.267372131347656, "global_step": 79092, "epoch": 653} {"train_loss": -38.19228744506836, "global_step": 79093, "epoch": 653} {"train_loss": -37.69070053100586, "global_step": 79094, "epoch": 653} {"train_loss": -38.05245590209961, "global_step": 79095, "epoch": 653} {"train_loss": -38.004154205322266, "global_step": 79096, "epoch": 653} {"train_loss": -38.17214584350586, "global_step": 79097, "epoch": 653} {"train_loss": -38.568294525146484, "global_step": 79098, "epoch": 653} {"train_loss": -37.84545135498047, "global_step": 79099, "epoch": 653} {"train_loss": -37.8634033203125, "global_step": 79100, "epoch": 653} {"train_loss": -36.10201644897461, "global_step": 79101, "epoch": 653} {"train_loss": -37.842987060546875, "global_step": 79102, "epoch": 653} {"train_loss": -37.6152229309082, "global_step": 79103, "epoch": 653} {"train_loss": -38.20697784423828, "global_step": 79104, "epoch": 653} {"train_loss": -38.29603958129883, "global_step": 79105, "epoch": 653} {"train_loss": -37.929508209228516, "global_step": 79106, "epoch": 653} {"train_loss": -37.41792297363281, "global_step": 79107, "epoch": 653} {"train_loss": -37.14348220825195, "global_step": 79108, "epoch": 653} {"train_loss": -37.9648551940918, "global_step": 79109, "epoch": 653} {"train_loss": -38.51435470581055, "global_step": 79110, "epoch": 653} {"train_loss": -38.17983627319336, "global_step": 79111, "epoch": 653} {"train_loss": -38.1520881652832, "global_step": 79112, "epoch": 653} {"train_loss": -38.274269104003906, "global_step": 79113, "epoch": 653} {"train_loss": -37.94175338745117, "global_step": 79114, "epoch": 653} {"train_loss": -38.21407699584961, "global_step": 79115, "epoch": 653} {"train_loss": -38.42285919189453, "global_step": 79116, "epoch": 653} {"train_loss": -37.657508850097656, "global_step": 79117, "epoch": 653} {"train_loss": -37.945404052734375, "global_step": 79118, "epoch": 653} {"train_loss": -38.03424835205078, "global_step": 79119, "epoch": 653} {"train_loss": -38.39864730834961, "global_step": 79120, "epoch": 653} {"train_loss": -37.7728385925293, "global_step": 79121, "epoch": 653} {"train_loss": -37.932308197021484, "global_step": 79122, "epoch": 653} {"train_loss": -37.15602111816406, "global_step": 79123, "epoch": 653} {"train_loss": -35.916259765625, "global_step": 79124, "epoch": 653} {"train_loss": -32.60834884643555, "global_step": 79125, "epoch": 653} {"train_loss": -22.59377098083496, "global_step": 79126, "epoch": 653} {"train_loss": -29.731164932250977, "global_step": 79127, "epoch": 653} {"train_loss": -33.65973663330078, "global_step": 79128, "epoch": 653} {"train_loss": -36.550758361816406, "global_step": 79129, "epoch": 653} {"train_loss": -33.389678955078125, "global_step": 79130, "epoch": 653} {"train_loss": -35.069087982177734, "global_step": 79131, "epoch": 653} {"train_loss": -35.76414108276367, "global_step": 79132, "epoch": 653} {"train_loss": -36.61761729973407, "global_step": 79133, "epoch": 653, "val_loss": 2698582.0} {"train_loss": -34.98512268066406, "global_step": 79134, "epoch": 654} {"train_loss": -34.77206802368164, "global_step": 79135, "epoch": 654} {"train_loss": -36.530517578125, "global_step": 79136, "epoch": 654} {"train_loss": -35.35732650756836, "global_step": 79137, "epoch": 654} {"train_loss": -36.069854736328125, "global_step": 79138, "epoch": 654} {"train_loss": -36.87102127075195, "global_step": 79139, "epoch": 654} {"train_loss": -32.010894775390625, "global_step": 79140, "epoch": 654} {"train_loss": -36.98508834838867, "global_step": 79141, "epoch": 654} {"train_loss": -36.53791427612305, "global_step": 79142, "epoch": 654} {"train_loss": -36.48130416870117, "global_step": 79143, "epoch": 654} {"train_loss": -36.64446258544922, "global_step": 79144, "epoch": 654} {"train_loss": -36.24260711669922, "global_step": 79145, "epoch": 654} {"train_loss": -37.10798263549805, "global_step": 79146, "epoch": 654} {"train_loss": -36.33646774291992, "global_step": 79147, "epoch": 654} {"train_loss": -37.11921691894531, "global_step": 79148, "epoch": 654} {"train_loss": -37.26994705200195, "global_step": 79149, "epoch": 654} {"train_loss": -37.154998779296875, "global_step": 79150, "epoch": 654} {"train_loss": -37.00992202758789, "global_step": 79151, "epoch": 654} {"train_loss": -37.473915100097656, "global_step": 79152, "epoch": 654} {"train_loss": -36.9547119140625, "global_step": 79153, "epoch": 654} {"train_loss": -36.38886642456055, "global_step": 79154, "epoch": 654} {"train_loss": -37.1262092590332, "global_step": 79155, "epoch": 654} {"train_loss": -36.47426986694336, "global_step": 79156, "epoch": 654} {"train_loss": -37.431556701660156, "global_step": 79157, "epoch": 654} {"train_loss": -37.05768966674805, "global_step": 79158, "epoch": 654} {"train_loss": -36.954891204833984, "global_step": 79159, "epoch": 654} {"train_loss": -35.33168411254883, "global_step": 79160, "epoch": 654} {"train_loss": -37.22689437866211, "global_step": 79161, "epoch": 654} {"train_loss": -36.6522102355957, "global_step": 79162, "epoch": 654} {"train_loss": -37.50376510620117, "global_step": 79163, "epoch": 654} {"train_loss": -37.5443000793457, "global_step": 79164, "epoch": 654} {"train_loss": -37.279632568359375, "global_step": 79165, "epoch": 654} {"train_loss": -37.46030807495117, "global_step": 79166, "epoch": 654} {"train_loss": -37.353538513183594, "global_step": 79167, "epoch": 654} {"train_loss": -37.029808044433594, "global_step": 79168, "epoch": 654} {"train_loss": -36.94570541381836, "global_step": 79169, "epoch": 654} {"train_loss": -37.605770111083984, "global_step": 79170, "epoch": 654} {"train_loss": -36.909034729003906, "global_step": 79171, "epoch": 654} {"train_loss": -37.3643913269043, "global_step": 79172, "epoch": 654} {"train_loss": -37.579559326171875, "global_step": 79173, "epoch": 654} {"train_loss": -37.08430099487305, "global_step": 79174, "epoch": 654} {"train_loss": -37.385406494140625, "global_step": 79175, "epoch": 654} {"train_loss": -36.71050262451172, "global_step": 79176, "epoch": 654} {"train_loss": -37.93342208862305, "global_step": 79177, "epoch": 654} {"train_loss": -36.92818832397461, "global_step": 79178, "epoch": 654} {"train_loss": -36.8780632019043, "global_step": 79179, "epoch": 654} {"train_loss": -37.75808334350586, "global_step": 79180, "epoch": 654} {"train_loss": -36.04108810424805, "global_step": 79181, "epoch": 654} {"train_loss": -37.80830764770508, "global_step": 79182, "epoch": 654} {"train_loss": -37.65117645263672, "global_step": 79183, "epoch": 654} {"train_loss": -37.8363151550293, "global_step": 79184, "epoch": 654} {"train_loss": -37.67194747924805, "global_step": 79185, "epoch": 654} {"train_loss": -38.035926818847656, "global_step": 79186, "epoch": 654} {"train_loss": -37.855308532714844, "global_step": 79187, "epoch": 654} {"train_loss": -38.21065902709961, "global_step": 79188, "epoch": 654} {"train_loss": -38.23395538330078, "global_step": 79189, "epoch": 654} {"train_loss": -37.98273849487305, "global_step": 79190, "epoch": 654} {"train_loss": -38.192508697509766, "global_step": 79191, "epoch": 654} {"train_loss": -38.015045166015625, "global_step": 79192, "epoch": 654} {"train_loss": -38.39801025390625, "global_step": 79193, "epoch": 654} {"train_loss": -38.22024154663086, "global_step": 79194, "epoch": 654} {"train_loss": -38.379249572753906, "global_step": 79195, "epoch": 654} {"train_loss": -38.14665603637695, "global_step": 79196, "epoch": 654} {"train_loss": -37.99111557006836, "global_step": 79197, "epoch": 654} {"train_loss": -36.15864944458008, "global_step": 79198, "epoch": 654} {"train_loss": -38.15679931640625, "global_step": 79199, "epoch": 654} {"train_loss": -37.37366485595703, "global_step": 79200, "epoch": 654} {"train_loss": -37.15752029418945, "global_step": 79201, "epoch": 654} {"train_loss": -37.288814544677734, "global_step": 79202, "epoch": 654} {"train_loss": -37.833595275878906, "global_step": 79203, "epoch": 654} {"train_loss": -37.8680305480957, "global_step": 79204, "epoch": 654} {"train_loss": -37.12856674194336, "global_step": 79205, "epoch": 654} {"train_loss": -36.842098236083984, "global_step": 79206, "epoch": 654} {"train_loss": -37.5483283996582, "global_step": 79207, "epoch": 654} {"train_loss": -38.164512634277344, "global_step": 79208, "epoch": 654} {"train_loss": -37.89463806152344, "global_step": 79209, "epoch": 654} {"train_loss": -38.32160568237305, "global_step": 79210, "epoch": 654} {"train_loss": -37.608272552490234, "global_step": 79211, "epoch": 654} {"train_loss": -37.0338249206543, "global_step": 79212, "epoch": 654} {"train_loss": -36.17272186279297, "global_step": 79213, "epoch": 654} {"train_loss": -36.148475646972656, "global_step": 79214, "epoch": 654} {"train_loss": -35.40785598754883, "global_step": 79215, "epoch": 654} {"train_loss": -36.88613510131836, "global_step": 79216, "epoch": 654} {"train_loss": -38.162235260009766, "global_step": 79217, "epoch": 654} {"train_loss": -37.72894287109375, "global_step": 79218, "epoch": 654} {"train_loss": -37.24711990356445, "global_step": 79219, "epoch": 654} {"train_loss": -36.87152862548828, "global_step": 79220, "epoch": 654} {"train_loss": -36.61973190307617, "global_step": 79221, "epoch": 654} {"train_loss": -36.284881591796875, "global_step": 79222, "epoch": 654} {"train_loss": -35.83494186401367, "global_step": 79223, "epoch": 654} {"train_loss": -37.0590705871582, "global_step": 79224, "epoch": 654} {"train_loss": -37.28551483154297, "global_step": 79225, "epoch": 654} {"train_loss": -37.59645462036133, "global_step": 79226, "epoch": 654} {"train_loss": -38.276390075683594, "global_step": 79227, "epoch": 654} {"train_loss": -37.65391159057617, "global_step": 79228, "epoch": 654} {"train_loss": -37.98445510864258, "global_step": 79229, "epoch": 654} {"train_loss": -37.494354248046875, "global_step": 79230, "epoch": 654} {"train_loss": -38.11572265625, "global_step": 79231, "epoch": 654} {"train_loss": -37.735755920410156, "global_step": 79232, "epoch": 654} {"train_loss": -37.99056625366211, "global_step": 79233, "epoch": 654} {"train_loss": -37.67377471923828, "global_step": 79234, "epoch": 654} {"train_loss": -37.7718620300293, "global_step": 79235, "epoch": 654} {"train_loss": -38.44088363647461, "global_step": 79236, "epoch": 654} {"train_loss": -35.815406799316406, "global_step": 79237, "epoch": 654} {"train_loss": -38.24239730834961, "global_step": 79238, "epoch": 654} {"train_loss": -38.22467803955078, "global_step": 79239, "epoch": 654} {"train_loss": -37.16555404663086, "global_step": 79240, "epoch": 654} {"train_loss": -36.38753890991211, "global_step": 79241, "epoch": 654} {"train_loss": -36.65202713012695, "global_step": 79242, "epoch": 654} {"train_loss": -37.740753173828125, "global_step": 79243, "epoch": 654} {"train_loss": -38.16682052612305, "global_step": 79244, "epoch": 654} {"train_loss": -37.25563430786133, "global_step": 79245, "epoch": 654} {"train_loss": -37.006099700927734, "global_step": 79246, "epoch": 654} {"train_loss": -37.1409797668457, "global_step": 79247, "epoch": 654} {"train_loss": -38.05911636352539, "global_step": 79248, "epoch": 654} {"train_loss": -37.587745666503906, "global_step": 79249, "epoch": 654} {"train_loss": -38.14476776123047, "global_step": 79250, "epoch": 654} {"train_loss": -37.54798889160156, "global_step": 79251, "epoch": 654} {"train_loss": -38.05648422241211, "global_step": 79252, "epoch": 654} {"train_loss": -38.36175537109375, "global_step": 79253, "epoch": 654} {"train_loss": -37.2303603936818, "global_step": 79254, "epoch": 654, "val_loss": 2576264.75} {"train_loss": -38.24629592895508, "global_step": 79255, "epoch": 655} {"train_loss": -38.38572311401367, "global_step": 79256, "epoch": 655} {"train_loss": -38.28220748901367, "global_step": 79257, "epoch": 655} {"train_loss": -37.89192199707031, "global_step": 79258, "epoch": 655} {"train_loss": -37.755645751953125, "global_step": 79259, "epoch": 655} {"train_loss": -38.149532318115234, "global_step": 79260, "epoch": 655} {"train_loss": -37.76332473754883, "global_step": 79261, "epoch": 655} {"train_loss": -38.851112365722656, "global_step": 79262, "epoch": 655} {"train_loss": -38.264156341552734, "global_step": 79263, "epoch": 655} {"train_loss": -38.2070198059082, "global_step": 79264, "epoch": 655} {"train_loss": -38.428218841552734, "global_step": 79265, "epoch": 655} {"train_loss": -37.41730499267578, "global_step": 79266, "epoch": 655} {"train_loss": -36.40166091918945, "global_step": 79267, "epoch": 655} {"train_loss": -36.132362365722656, "global_step": 79268, "epoch": 655} {"train_loss": -36.08530044555664, "global_step": 79269, "epoch": 655} {"train_loss": -36.69856643676758, "global_step": 79270, "epoch": 655} {"train_loss": -35.96161651611328, "global_step": 79271, "epoch": 655} {"train_loss": -37.26076889038086, "global_step": 79272, "epoch": 655} {"train_loss": -35.64103698730469, "global_step": 79273, "epoch": 655} {"train_loss": -32.59103012084961, "global_step": 79274, "epoch": 655} {"train_loss": -34.85382080078125, "global_step": 79275, "epoch": 655} {"train_loss": -31.787460327148438, "global_step": 79276, "epoch": 655} {"train_loss": -31.10909080505371, "global_step": 79277, "epoch": 655} {"train_loss": -35.045562744140625, "global_step": 79278, "epoch": 655} {"train_loss": -33.21393585205078, "global_step": 79279, "epoch": 655} {"train_loss": -34.57244873046875, "global_step": 79280, "epoch": 655} {"train_loss": -35.325984954833984, "global_step": 79281, "epoch": 655} {"train_loss": -32.02794647216797, "global_step": 79282, "epoch": 655} {"train_loss": -36.93931198120117, "global_step": 79283, "epoch": 655} {"train_loss": -36.6550178527832, "global_step": 79284, "epoch": 655} {"train_loss": -31.155094146728516, "global_step": 79285, "epoch": 655} {"train_loss": -34.364559173583984, "global_step": 79286, "epoch": 655} {"train_loss": -35.307159423828125, "global_step": 79287, "epoch": 655} {"train_loss": -34.97141647338867, "global_step": 79288, "epoch": 655} {"train_loss": -35.650352478027344, "global_step": 79289, "epoch": 655} {"train_loss": -37.26752471923828, "global_step": 79290, "epoch": 655} {"train_loss": -35.56753158569336, "global_step": 79291, "epoch": 655} {"train_loss": -35.29798126220703, "global_step": 79292, "epoch": 655} {"train_loss": -36.455780029296875, "global_step": 79293, "epoch": 655} {"train_loss": -36.676753997802734, "global_step": 79294, "epoch": 655} {"train_loss": -33.38473129272461, "global_step": 79295, "epoch": 655} {"train_loss": -36.979644775390625, "global_step": 79296, "epoch": 655} {"train_loss": -36.027801513671875, "global_step": 79297, "epoch": 655} {"train_loss": -36.672515869140625, "global_step": 79298, "epoch": 655} {"train_loss": -37.00545883178711, "global_step": 79299, "epoch": 655} {"train_loss": -37.08243942260742, "global_step": 79300, "epoch": 655} {"train_loss": -37.47032928466797, "global_step": 79301, "epoch": 655} {"train_loss": -37.163936614990234, "global_step": 79302, "epoch": 655} {"train_loss": -36.82304000854492, "global_step": 79303, "epoch": 655} {"train_loss": -36.7863883972168, "global_step": 79304, "epoch": 655} {"train_loss": -37.43036651611328, "global_step": 79305, "epoch": 655} {"train_loss": -37.332489013671875, "global_step": 79306, "epoch": 655} {"train_loss": -37.58086395263672, "global_step": 79307, "epoch": 655} {"train_loss": -37.00554656982422, "global_step": 79308, "epoch": 655} {"train_loss": -37.69307327270508, "global_step": 79309, "epoch": 655} {"train_loss": -37.179752349853516, "global_step": 79310, "epoch": 655} {"train_loss": -36.90338134765625, "global_step": 79311, "epoch": 655} {"train_loss": -37.83656692504883, "global_step": 79312, "epoch": 655} {"train_loss": -37.13315963745117, "global_step": 79313, "epoch": 655} {"train_loss": -37.50296401977539, "global_step": 79314, "epoch": 655} {"train_loss": -37.52004623413086, "global_step": 79315, "epoch": 655} {"train_loss": -37.33115768432617, "global_step": 79316, "epoch": 655} {"train_loss": -38.12226486206055, "global_step": 79317, "epoch": 655} {"train_loss": -37.18073272705078, "global_step": 79318, "epoch": 655} {"train_loss": -37.604286193847656, "global_step": 79319, "epoch": 655} {"train_loss": -37.59174728393555, "global_step": 79320, "epoch": 655} {"train_loss": -37.98090362548828, "global_step": 79321, "epoch": 655} {"train_loss": -37.82419204711914, "global_step": 79322, "epoch": 655} {"train_loss": -37.71246337890625, "global_step": 79323, "epoch": 655} {"train_loss": -37.55542755126953, "global_step": 79324, "epoch": 655} {"train_loss": -37.93313217163086, "global_step": 79325, "epoch": 655} {"train_loss": -38.39943313598633, "global_step": 79326, "epoch": 655} {"train_loss": -38.25777816772461, "global_step": 79327, "epoch": 655} {"train_loss": -37.92560958862305, "global_step": 79328, "epoch": 655} {"train_loss": -38.30788040161133, "global_step": 79329, "epoch": 655} {"train_loss": -37.98728942871094, "global_step": 79330, "epoch": 655} {"train_loss": -38.03152084350586, "global_step": 79331, "epoch": 655} {"train_loss": -37.74360275268555, "global_step": 79332, "epoch": 655} {"train_loss": -37.83406448364258, "global_step": 79333, "epoch": 655} {"train_loss": -37.73061752319336, "global_step": 79334, "epoch": 655} {"train_loss": -37.663124084472656, "global_step": 79335, "epoch": 655} {"train_loss": -38.628021240234375, "global_step": 79336, "epoch": 655} {"train_loss": -37.640663146972656, "global_step": 79337, "epoch": 655} {"train_loss": -38.23722457885742, "global_step": 79338, "epoch": 655} {"train_loss": -38.137020111083984, "global_step": 79339, "epoch": 655} {"train_loss": -38.0450439453125, "global_step": 79340, "epoch": 655} {"train_loss": -38.5652961730957, "global_step": 79341, "epoch": 655} {"train_loss": -38.12046432495117, "global_step": 79342, "epoch": 655} {"train_loss": -38.237369537353516, "global_step": 79343, "epoch": 655} {"train_loss": -38.55023193359375, "global_step": 79344, "epoch": 655} {"train_loss": -37.88802719116211, "global_step": 79345, "epoch": 655} {"train_loss": -37.3722038269043, "global_step": 79346, "epoch": 655} {"train_loss": -36.21821212768555, "global_step": 79347, "epoch": 655} {"train_loss": -36.11064147949219, "global_step": 79348, "epoch": 655} {"train_loss": -37.88236618041992, "global_step": 79349, "epoch": 655} {"train_loss": -38.087890625, "global_step": 79350, "epoch": 655} {"train_loss": -38.571075439453125, "global_step": 79351, "epoch": 655} {"train_loss": -37.45492172241211, "global_step": 79352, "epoch": 655} {"train_loss": -37.186370849609375, "global_step": 79353, "epoch": 655} {"train_loss": -37.67069625854492, "global_step": 79354, "epoch": 655} {"train_loss": -38.219173431396484, "global_step": 79355, "epoch": 655} {"train_loss": -38.4698600769043, "global_step": 79356, "epoch": 655} {"train_loss": -37.25006103515625, "global_step": 79357, "epoch": 655} {"train_loss": -37.75940704345703, "global_step": 79358, "epoch": 655} {"train_loss": -38.25484848022461, "global_step": 79359, "epoch": 655} {"train_loss": -36.57240676879883, "global_step": 79360, "epoch": 655} {"train_loss": -37.1151237487793, "global_step": 79361, "epoch": 655} {"train_loss": -37.39325714111328, "global_step": 79362, "epoch": 655} {"train_loss": -37.92432403564453, "global_step": 79363, "epoch": 655} {"train_loss": -38.04109573364258, "global_step": 79364, "epoch": 655} {"train_loss": -36.29572677612305, "global_step": 79365, "epoch": 655} {"train_loss": -33.21169662475586, "global_step": 79366, "epoch": 655} {"train_loss": -30.57037925720215, "global_step": 79367, "epoch": 655} {"train_loss": -31.843854904174805, "global_step": 79368, "epoch": 655} {"train_loss": -34.438621520996094, "global_step": 79369, "epoch": 655} {"train_loss": -36.79519271850586, "global_step": 79370, "epoch": 655} {"train_loss": -33.938262939453125, "global_step": 79371, "epoch": 655} {"train_loss": -37.35258102416992, "global_step": 79372, "epoch": 655} {"train_loss": -35.14182662963867, "global_step": 79373, "epoch": 655} {"train_loss": -37.015377044677734, "global_step": 79374, "epoch": 655} {"train_loss": -36.78838280606861, "global_step": 79375, "epoch": 655, "val_loss": 2522745.0} {"train_loss": -35.2681999206543, "global_step": 79376, "epoch": 656} {"train_loss": -37.36345672607422, "global_step": 79377, "epoch": 656} {"train_loss": -37.371944427490234, "global_step": 79378, "epoch": 656} {"train_loss": -36.65094757080078, "global_step": 79379, "epoch": 656} {"train_loss": -37.87382125854492, "global_step": 79380, "epoch": 656} {"train_loss": -36.986942291259766, "global_step": 79381, "epoch": 656} {"train_loss": -36.9754524230957, "global_step": 79382, "epoch": 656} {"train_loss": -36.792728424072266, "global_step": 79383, "epoch": 656} {"train_loss": -37.76288986206055, "global_step": 79384, "epoch": 656} {"train_loss": -37.084022521972656, "global_step": 79385, "epoch": 656} {"train_loss": -36.88660430908203, "global_step": 79386, "epoch": 656} {"train_loss": -38.06972885131836, "global_step": 79387, "epoch": 656} {"train_loss": -37.12714385986328, "global_step": 79388, "epoch": 656} {"train_loss": -36.7817268371582, "global_step": 79389, "epoch": 656} {"train_loss": -37.76219940185547, "global_step": 79390, "epoch": 656} {"train_loss": -37.6771240234375, "global_step": 79391, "epoch": 656} {"train_loss": -37.244625091552734, "global_step": 79392, "epoch": 656} {"train_loss": -37.693199157714844, "global_step": 79393, "epoch": 656} {"train_loss": -37.98077392578125, "global_step": 79394, "epoch": 656} {"train_loss": -38.20148468017578, "global_step": 79395, "epoch": 656} {"train_loss": -38.00957107543945, "global_step": 79396, "epoch": 656} {"train_loss": -37.945465087890625, "global_step": 79397, "epoch": 656} {"train_loss": -38.21744918823242, "global_step": 79398, "epoch": 656} {"train_loss": -37.51654052734375, "global_step": 79399, "epoch": 656} {"train_loss": -38.00803756713867, "global_step": 79400, "epoch": 656} {"train_loss": -38.29562759399414, "global_step": 79401, "epoch": 656} {"train_loss": -38.01571273803711, "global_step": 79402, "epoch": 656} {"train_loss": -37.914573669433594, "global_step": 79403, "epoch": 656} {"train_loss": -38.17013168334961, "global_step": 79404, "epoch": 656} {"train_loss": -38.20999526977539, "global_step": 79405, "epoch": 656} {"train_loss": -37.93259811401367, "global_step": 79406, "epoch": 656} {"train_loss": -38.21921920776367, "global_step": 79407, "epoch": 656} {"train_loss": -37.7678108215332, "global_step": 79408, "epoch": 656} {"train_loss": -37.65139389038086, "global_step": 79409, "epoch": 656} {"train_loss": -35.6672248840332, "global_step": 79410, "epoch": 656} {"train_loss": -33.2193717956543, "global_step": 79411, "epoch": 656} {"train_loss": -31.7226505279541, "global_step": 79412, "epoch": 656} {"train_loss": -26.293048858642578, "global_step": 79413, "epoch": 656} {"train_loss": -18.034299850463867, "global_step": 79414, "epoch": 656} {"train_loss": -13.710049629211426, "global_step": 79415, "epoch": 656} {"train_loss": -37.8452033996582, "global_step": 79416, "epoch": 656} {"train_loss": -21.756671905517578, "global_step": 79417, "epoch": 656} {"train_loss": -26.64691734313965, "global_step": 79418, "epoch": 656} {"train_loss": -33.57589340209961, "global_step": 79419, "epoch": 656} {"train_loss": -28.884424209594727, "global_step": 79420, "epoch": 656} {"train_loss": -33.656246185302734, "global_step": 79421, "epoch": 656} {"train_loss": -33.49384689331055, "global_step": 79422, "epoch": 656} {"train_loss": -33.01838302612305, "global_step": 79423, "epoch": 656} {"train_loss": -36.7711067199707, "global_step": 79424, "epoch": 656} {"train_loss": -34.321441650390625, "global_step": 79425, "epoch": 656} {"train_loss": -35.009918212890625, "global_step": 79426, "epoch": 656} {"train_loss": -37.431556701660156, "global_step": 79427, "epoch": 656} {"train_loss": -35.42670822143555, "global_step": 79428, "epoch": 656} {"train_loss": -35.12710189819336, "global_step": 79429, "epoch": 656} {"train_loss": -37.39091110229492, "global_step": 79430, "epoch": 656} {"train_loss": -36.33669662475586, "global_step": 79431, "epoch": 656} {"train_loss": -35.28300094604492, "global_step": 79432, "epoch": 656} {"train_loss": -36.294673919677734, "global_step": 79433, "epoch": 656} {"train_loss": -37.07841110229492, "global_step": 79434, "epoch": 656} {"train_loss": -36.154022216796875, "global_step": 79435, "epoch": 656} {"train_loss": -36.32352828979492, "global_step": 79436, "epoch": 656} {"train_loss": -37.41514205932617, "global_step": 79437, "epoch": 656} {"train_loss": -37.32435989379883, "global_step": 79438, "epoch": 656} {"train_loss": -36.6505126953125, "global_step": 79439, "epoch": 656} {"train_loss": -36.74624252319336, "global_step": 79440, "epoch": 656} {"train_loss": -37.26462173461914, "global_step": 79441, "epoch": 656} {"train_loss": -37.6240348815918, "global_step": 79442, "epoch": 656} {"train_loss": -37.1292839050293, "global_step": 79443, "epoch": 656} {"train_loss": -37.08152389526367, "global_step": 79444, "epoch": 656} {"train_loss": -37.9499397277832, "global_step": 79445, "epoch": 656} {"train_loss": -37.829586029052734, "global_step": 79446, "epoch": 656} {"train_loss": -37.390380859375, "global_step": 79447, "epoch": 656} {"train_loss": -37.624061584472656, "global_step": 79448, "epoch": 656} {"train_loss": -38.007835388183594, "global_step": 79449, "epoch": 656} {"train_loss": -37.36699295043945, "global_step": 79450, "epoch": 656} {"train_loss": -38.039772033691406, "global_step": 79451, "epoch": 656} {"train_loss": -37.34385299682617, "global_step": 79452, "epoch": 656} {"train_loss": -37.48902130126953, "global_step": 79453, "epoch": 656} {"train_loss": -37.72119903564453, "global_step": 79454, "epoch": 656} {"train_loss": -37.96842575073242, "global_step": 79455, "epoch": 656} {"train_loss": -37.84278106689453, "global_step": 79456, "epoch": 656} {"train_loss": -37.47087478637695, "global_step": 79457, "epoch": 656} {"train_loss": -38.05708312988281, "global_step": 79458, "epoch": 656} {"train_loss": -37.931758880615234, "global_step": 79459, "epoch": 656} {"train_loss": -37.97535705566406, "global_step": 79460, "epoch": 656} {"train_loss": -38.14756774902344, "global_step": 79461, "epoch": 656} {"train_loss": -37.716922760009766, "global_step": 79462, "epoch": 656} {"train_loss": -37.665035247802734, "global_step": 79463, "epoch": 656} {"train_loss": -38.192169189453125, "global_step": 79464, "epoch": 656} {"train_loss": -37.620723724365234, "global_step": 79465, "epoch": 656} {"train_loss": -38.067989349365234, "global_step": 79466, "epoch": 656} {"train_loss": -38.04067611694336, "global_step": 79467, "epoch": 656} {"train_loss": -37.70025634765625, "global_step": 79468, "epoch": 656} {"train_loss": -37.85872268676758, "global_step": 79469, "epoch": 656} {"train_loss": -37.776222229003906, "global_step": 79470, "epoch": 656} {"train_loss": -37.35641098022461, "global_step": 79471, "epoch": 656} {"train_loss": -38.188934326171875, "global_step": 79472, "epoch": 656} {"train_loss": -37.444515228271484, "global_step": 79473, "epoch": 656} {"train_loss": -37.38844680786133, "global_step": 79474, "epoch": 656} {"train_loss": -37.70243453979492, "global_step": 79475, "epoch": 656} {"train_loss": -38.09745788574219, "global_step": 79476, "epoch": 656} {"train_loss": -37.412113189697266, "global_step": 79477, "epoch": 656} {"train_loss": -37.13137435913086, "global_step": 79478, "epoch": 656} {"train_loss": -36.40808868408203, "global_step": 79479, "epoch": 656} {"train_loss": -34.29006576538086, "global_step": 79480, "epoch": 656} {"train_loss": -35.585609436035156, "global_step": 79481, "epoch": 656} {"train_loss": -36.632022857666016, "global_step": 79482, "epoch": 656} {"train_loss": -35.441314697265625, "global_step": 79483, "epoch": 656} {"train_loss": -34.69136428833008, "global_step": 79484, "epoch": 656} {"train_loss": -35.65641784667969, "global_step": 79485, "epoch": 656} {"train_loss": -33.77052307128906, "global_step": 79486, "epoch": 656} {"train_loss": -35.61575698852539, "global_step": 79487, "epoch": 656} {"train_loss": -28.739377975463867, "global_step": 79488, "epoch": 656} {"train_loss": -32.904335021972656, "global_step": 79489, "epoch": 656} {"train_loss": -32.83287048339844, "global_step": 79490, "epoch": 656} {"train_loss": -34.426029205322266, "global_step": 79491, "epoch": 656} {"train_loss": -31.56501579284668, "global_step": 79492, "epoch": 656} {"train_loss": -36.19193649291992, "global_step": 79493, "epoch": 656} {"train_loss": -34.201568603515625, "global_step": 79494, "epoch": 656} {"train_loss": -34.62054443359375, "global_step": 79495, "epoch": 656} {"train_loss": -35.97710343825916, "global_step": 79496, "epoch": 656, "val_loss": 2524474.25} {"train_loss": -34.79301071166992, "global_step": 79497, "epoch": 657} {"train_loss": -36.363033294677734, "global_step": 79498, "epoch": 657} {"train_loss": -34.27735137939453, "global_step": 79499, "epoch": 657} {"train_loss": -35.46732711791992, "global_step": 79500, "epoch": 657} {"train_loss": -34.53670883178711, "global_step": 79501, "epoch": 657} {"train_loss": -35.26493453979492, "global_step": 79502, "epoch": 657} {"train_loss": -35.25687789916992, "global_step": 79503, "epoch": 657} {"train_loss": -35.752845764160156, "global_step": 79504, "epoch": 657} {"train_loss": -36.08651351928711, "global_step": 79505, "epoch": 657} {"train_loss": -34.98322296142578, "global_step": 79506, "epoch": 657} {"train_loss": -35.600276947021484, "global_step": 79507, "epoch": 657} {"train_loss": -35.42116928100586, "global_step": 79508, "epoch": 657} {"train_loss": -36.715431213378906, "global_step": 79509, "epoch": 657} {"train_loss": -36.1912956237793, "global_step": 79510, "epoch": 657} {"train_loss": -35.96576690673828, "global_step": 79511, "epoch": 657} {"train_loss": -37.185546875, "global_step": 79512, "epoch": 657} {"train_loss": -36.93813705444336, "global_step": 79513, "epoch": 657} {"train_loss": -36.782562255859375, "global_step": 79514, "epoch": 657} {"train_loss": -37.22450637817383, "global_step": 79515, "epoch": 657} {"train_loss": -36.695125579833984, "global_step": 79516, "epoch": 657} {"train_loss": -37.299346923828125, "global_step": 79517, "epoch": 657} {"train_loss": -37.474544525146484, "global_step": 79518, "epoch": 657} {"train_loss": -37.26593780517578, "global_step": 79519, "epoch": 657} {"train_loss": -37.55852127075195, "global_step": 79520, "epoch": 657} {"train_loss": -37.11445999145508, "global_step": 79521, "epoch": 657} {"train_loss": -37.225067138671875, "global_step": 79522, "epoch": 657} {"train_loss": -37.239166259765625, "global_step": 79523, "epoch": 657} {"train_loss": -37.450660705566406, "global_step": 79524, "epoch": 657} {"train_loss": -37.2735710144043, "global_step": 79525, "epoch": 657} {"train_loss": -37.42396926879883, "global_step": 79526, "epoch": 657} {"train_loss": -37.4945182800293, "global_step": 79527, "epoch": 657} {"train_loss": -37.5833740234375, "global_step": 79528, "epoch": 657} {"train_loss": -37.47620391845703, "global_step": 79529, "epoch": 657} {"train_loss": -37.01074981689453, "global_step": 79530, "epoch": 657} {"train_loss": -37.70608139038086, "global_step": 79531, "epoch": 657} {"train_loss": -37.57993698120117, "global_step": 79532, "epoch": 657} {"train_loss": -37.3248405456543, "global_step": 79533, "epoch": 657} {"train_loss": -37.66596221923828, "global_step": 79534, "epoch": 657} {"train_loss": -37.62055206298828, "global_step": 79535, "epoch": 657} {"train_loss": -37.246761322021484, "global_step": 79536, "epoch": 657} {"train_loss": -37.53203201293945, "global_step": 79537, "epoch": 657} {"train_loss": -37.9255256652832, "global_step": 79538, "epoch": 657} {"train_loss": -37.379005432128906, "global_step": 79539, "epoch": 657} {"train_loss": -37.36451721191406, "global_step": 79540, "epoch": 657} {"train_loss": -37.77798080444336, "global_step": 79541, "epoch": 657} {"train_loss": -37.75537109375, "global_step": 79542, "epoch": 657} {"train_loss": -37.67310333251953, "global_step": 79543, "epoch": 657} {"train_loss": -38.143795013427734, "global_step": 79544, "epoch": 657} {"train_loss": -37.83979034423828, "global_step": 79545, "epoch": 657} {"train_loss": -37.95550537109375, "global_step": 79546, "epoch": 657} {"train_loss": -37.7965202331543, "global_step": 79547, "epoch": 657} {"train_loss": -38.09476852416992, "global_step": 79548, "epoch": 657} {"train_loss": -38.18928909301758, "global_step": 79549, "epoch": 657} {"train_loss": -37.275146484375, "global_step": 79550, "epoch": 657} {"train_loss": -36.663944244384766, "global_step": 79551, "epoch": 657} {"train_loss": -36.58814239501953, "global_step": 79552, "epoch": 657} {"train_loss": -37.870452880859375, "global_step": 79553, "epoch": 657} {"train_loss": -38.14991760253906, "global_step": 79554, "epoch": 657} {"train_loss": -37.91427230834961, "global_step": 79555, "epoch": 657} {"train_loss": -37.17399978637695, "global_step": 79556, "epoch": 657} {"train_loss": -38.10516357421875, "global_step": 79557, "epoch": 657} {"train_loss": -38.0021858215332, "global_step": 79558, "epoch": 657} {"train_loss": -38.28185272216797, "global_step": 79559, "epoch": 657} {"train_loss": -37.96369552612305, "global_step": 79560, "epoch": 657} {"train_loss": -38.06440353393555, "global_step": 79561, "epoch": 657} {"train_loss": -38.301177978515625, "global_step": 79562, "epoch": 657} {"train_loss": -37.26835250854492, "global_step": 79563, "epoch": 657} {"train_loss": -35.81660079956055, "global_step": 79564, "epoch": 657} {"train_loss": -31.543928146362305, "global_step": 79565, "epoch": 657} {"train_loss": -26.004331588745117, "global_step": 79566, "epoch": 657} {"train_loss": -27.382638931274414, "global_step": 79567, "epoch": 657} {"train_loss": -29.59440040588379, "global_step": 79568, "epoch": 657} {"train_loss": -26.90119743347168, "global_step": 79569, "epoch": 657} {"train_loss": -35.4793701171875, "global_step": 79570, "epoch": 657} {"train_loss": -32.446266174316406, "global_step": 79571, "epoch": 657} {"train_loss": -29.921070098876953, "global_step": 79572, "epoch": 657} {"train_loss": -33.3987922668457, "global_step": 79573, "epoch": 657} {"train_loss": -35.8161735534668, "global_step": 79574, "epoch": 657} {"train_loss": -34.56930923461914, "global_step": 79575, "epoch": 657} {"train_loss": -36.419437408447266, "global_step": 79576, "epoch": 657} {"train_loss": -35.70541000366211, "global_step": 79577, "epoch": 657} {"train_loss": -36.405242919921875, "global_step": 79578, "epoch": 657} {"train_loss": -36.128562927246094, "global_step": 79579, "epoch": 657} {"train_loss": -35.59738540649414, "global_step": 79580, "epoch": 657} {"train_loss": -36.87811279296875, "global_step": 79581, "epoch": 657} {"train_loss": -35.76140213012695, "global_step": 79582, "epoch": 657} {"train_loss": -36.4940299987793, "global_step": 79583, "epoch": 657} {"train_loss": -36.313846588134766, "global_step": 79584, "epoch": 657} {"train_loss": -36.741092681884766, "global_step": 79585, "epoch": 657} {"train_loss": -36.403099060058594, "global_step": 79586, "epoch": 657} {"train_loss": -36.89392852783203, "global_step": 79587, "epoch": 657} {"train_loss": -37.077632904052734, "global_step": 79588, "epoch": 657} {"train_loss": -36.87158966064453, "global_step": 79589, "epoch": 657} {"train_loss": -37.300411224365234, "global_step": 79590, "epoch": 657} {"train_loss": -37.34376907348633, "global_step": 79591, "epoch": 657} {"train_loss": -37.26975631713867, "global_step": 79592, "epoch": 657} {"train_loss": -36.934837341308594, "global_step": 79593, "epoch": 657} {"train_loss": -37.58390426635742, "global_step": 79594, "epoch": 657} {"train_loss": -36.95416259765625, "global_step": 79595, "epoch": 657} {"train_loss": -37.738861083984375, "global_step": 79596, "epoch": 657} {"train_loss": -37.60045623779297, "global_step": 79597, "epoch": 657} {"train_loss": -37.3671989440918, "global_step": 79598, "epoch": 657} {"train_loss": -37.02033996582031, "global_step": 79599, "epoch": 657} {"train_loss": -37.49128341674805, "global_step": 79600, "epoch": 657} {"train_loss": -37.202125549316406, "global_step": 79601, "epoch": 657} {"train_loss": -37.54640579223633, "global_step": 79602, "epoch": 657} {"train_loss": -37.85710525512695, "global_step": 79603, "epoch": 657} {"train_loss": -37.55290222167969, "global_step": 79604, "epoch": 657} {"train_loss": -38.06538772583008, "global_step": 79605, "epoch": 657} {"train_loss": -37.998992919921875, "global_step": 79606, "epoch": 657} {"train_loss": -37.90019607543945, "global_step": 79607, "epoch": 657} {"train_loss": -37.8746452331543, "global_step": 79608, "epoch": 657} {"train_loss": -38.08250045776367, "global_step": 79609, "epoch": 657} {"train_loss": -38.01182174682617, "global_step": 79610, "epoch": 657} {"train_loss": -38.0018196105957, "global_step": 79611, "epoch": 657} {"train_loss": -38.0451545715332, "global_step": 79612, "epoch": 657} {"train_loss": -37.92815399169922, "global_step": 79613, "epoch": 657} {"train_loss": -38.12136459350586, "global_step": 79614, "epoch": 657} {"train_loss": -38.263458251953125, "global_step": 79615, "epoch": 657} {"train_loss": -37.90969467163086, "global_step": 79616, "epoch": 657} {"train_loss": -36.59627748914986, "global_step": 79617, "epoch": 657, "val_loss": 2574158.25} {"train_loss": -38.26025390625, "global_step": 79618, "epoch": 658} {"train_loss": -38.60199737548828, "global_step": 79619, "epoch": 658} {"train_loss": -38.12191390991211, "global_step": 79620, "epoch": 658} {"train_loss": -38.311588287353516, "global_step": 79621, "epoch": 658} {"train_loss": -37.7576789855957, "global_step": 79622, "epoch": 658} {"train_loss": -38.580833435058594, "global_step": 79623, "epoch": 658} {"train_loss": -38.30793380737305, "global_step": 79624, "epoch": 658} {"train_loss": -38.169979095458984, "global_step": 79625, "epoch": 658} {"train_loss": -37.944427490234375, "global_step": 79626, "epoch": 658} {"train_loss": -37.81441116333008, "global_step": 79627, "epoch": 658} {"train_loss": -36.502689361572266, "global_step": 79628, "epoch": 658} {"train_loss": -36.19048309326172, "global_step": 79629, "epoch": 658} {"train_loss": -32.84041213989258, "global_step": 79630, "epoch": 658} {"train_loss": -26.200469970703125, "global_step": 79631, "epoch": 658} {"train_loss": -32.49025344848633, "global_step": 79632, "epoch": 658} {"train_loss": -37.761478424072266, "global_step": 79633, "epoch": 658} {"train_loss": -33.58180618286133, "global_step": 79634, "epoch": 658} {"train_loss": -36.77700424194336, "global_step": 79635, "epoch": 658} {"train_loss": -35.498531341552734, "global_step": 79636, "epoch": 658} {"train_loss": -33.39358139038086, "global_step": 79637, "epoch": 658} {"train_loss": -37.86674880981445, "global_step": 79638, "epoch": 658} {"train_loss": -34.86934280395508, "global_step": 79639, "epoch": 658} {"train_loss": -36.88442611694336, "global_step": 79640, "epoch": 658} {"train_loss": -34.47309494018555, "global_step": 79641, "epoch": 658} {"train_loss": -37.513553619384766, "global_step": 79642, "epoch": 658} {"train_loss": -33.570377349853516, "global_step": 79643, "epoch": 658} {"train_loss": -34.899383544921875, "global_step": 79644, "epoch": 658} {"train_loss": -36.61989974975586, "global_step": 79645, "epoch": 658} {"train_loss": -36.33610153198242, "global_step": 79646, "epoch": 658} {"train_loss": -34.803646087646484, "global_step": 79647, "epoch": 658} {"train_loss": -34.74950408935547, "global_step": 79648, "epoch": 658} {"train_loss": -36.78115463256836, "global_step": 79649, "epoch": 658} {"train_loss": -36.60505294799805, "global_step": 79650, "epoch": 658} {"train_loss": -36.7197380065918, "global_step": 79651, "epoch": 658} {"train_loss": -36.63553237915039, "global_step": 79652, "epoch": 658} {"train_loss": -36.71663284301758, "global_step": 79653, "epoch": 658} {"train_loss": -37.45540237426758, "global_step": 79654, "epoch": 658} {"train_loss": -36.82894515991211, "global_step": 79655, "epoch": 658} {"train_loss": -37.4033317565918, "global_step": 79656, "epoch": 658} {"train_loss": -37.47941207885742, "global_step": 79657, "epoch": 658} {"train_loss": -36.82149124145508, "global_step": 79658, "epoch": 658} {"train_loss": -37.1899299621582, "global_step": 79659, "epoch": 658} {"train_loss": -37.352088928222656, "global_step": 79660, "epoch": 658} {"train_loss": -37.39141845703125, "global_step": 79661, "epoch": 658} {"train_loss": -37.54890060424805, "global_step": 79662, "epoch": 658} {"train_loss": -37.264583587646484, "global_step": 79663, "epoch": 658} {"train_loss": -37.618404388427734, "global_step": 79664, "epoch": 658} {"train_loss": -37.524131774902344, "global_step": 79665, "epoch": 658} {"train_loss": -37.8197135925293, "global_step": 79666, "epoch": 658} {"train_loss": -37.933162689208984, "global_step": 79667, "epoch": 658} {"train_loss": -37.88295364379883, "global_step": 79668, "epoch": 658} {"train_loss": -37.87991714477539, "global_step": 79669, "epoch": 658} {"train_loss": -37.9332389831543, "global_step": 79670, "epoch": 658} {"train_loss": -37.90468215942383, "global_step": 79671, "epoch": 658} {"train_loss": -38.01176071166992, "global_step": 79672, "epoch": 658} {"train_loss": -37.31146240234375, "global_step": 79673, "epoch": 658} {"train_loss": -38.09273910522461, "global_step": 79674, "epoch": 658} {"train_loss": -38.00686264038086, "global_step": 79675, "epoch": 658} {"train_loss": -38.280826568603516, "global_step": 79676, "epoch": 658} {"train_loss": -37.89198303222656, "global_step": 79677, "epoch": 658} {"train_loss": -38.217681884765625, "global_step": 79678, "epoch": 658} {"train_loss": -38.34409713745117, "global_step": 79679, "epoch": 658} {"train_loss": -38.241207122802734, "global_step": 79680, "epoch": 658} {"train_loss": -37.9917106628418, "global_step": 79681, "epoch": 658} {"train_loss": -38.29579544067383, "global_step": 79682, "epoch": 658} {"train_loss": -38.0765495300293, "global_step": 79683, "epoch": 658} {"train_loss": -38.2585563659668, "global_step": 79684, "epoch": 658} {"train_loss": -38.09465026855469, "global_step": 79685, "epoch": 658} {"train_loss": -38.51976776123047, "global_step": 79686, "epoch": 658} {"train_loss": -38.147857666015625, "global_step": 79687, "epoch": 658} {"train_loss": -38.28963851928711, "global_step": 79688, "epoch": 658} {"train_loss": -38.707794189453125, "global_step": 79689, "epoch": 658} {"train_loss": -38.4592170715332, "global_step": 79690, "epoch": 658} {"train_loss": -37.87413787841797, "global_step": 79691, "epoch": 658} {"train_loss": -38.6323356628418, "global_step": 79692, "epoch": 658} {"train_loss": -38.392154693603516, "global_step": 79693, "epoch": 658} {"train_loss": -38.32621383666992, "global_step": 79694, "epoch": 658} {"train_loss": -38.28864669799805, "global_step": 79695, "epoch": 658} {"train_loss": -38.313961029052734, "global_step": 79696, "epoch": 658} {"train_loss": -38.741031646728516, "global_step": 79697, "epoch": 658} {"train_loss": -38.13705062866211, "global_step": 79698, "epoch": 658} {"train_loss": -38.5905876159668, "global_step": 79699, "epoch": 658} {"train_loss": -38.65668869018555, "global_step": 79700, "epoch": 658} {"train_loss": -38.423152923583984, "global_step": 79701, "epoch": 658} {"train_loss": -38.81538009643555, "global_step": 79702, "epoch": 658} {"train_loss": -38.76392364501953, "global_step": 79703, "epoch": 658} {"train_loss": -37.962249755859375, "global_step": 79704, "epoch": 658} {"train_loss": -38.36016845703125, "global_step": 79705, "epoch": 658} {"train_loss": -37.38391876220703, "global_step": 79706, "epoch": 658} {"train_loss": -36.630340576171875, "global_step": 79707, "epoch": 658} {"train_loss": -38.421566009521484, "global_step": 79708, "epoch": 658} {"train_loss": -37.59188461303711, "global_step": 79709, "epoch": 658} {"train_loss": -34.76679611206055, "global_step": 79710, "epoch": 658} {"train_loss": -37.215240478515625, "global_step": 79711, "epoch": 658} {"train_loss": -35.83754348754883, "global_step": 79712, "epoch": 658} {"train_loss": -36.47813415527344, "global_step": 79713, "epoch": 658} {"train_loss": -31.820892333984375, "global_step": 79714, "epoch": 658} {"train_loss": -35.81769943237305, "global_step": 79715, "epoch": 658} {"train_loss": -37.052337646484375, "global_step": 79716, "epoch": 658} {"train_loss": -37.30934143066406, "global_step": 79717, "epoch": 658} {"train_loss": -35.7962646484375, "global_step": 79718, "epoch": 658} {"train_loss": -32.95991897583008, "global_step": 79719, "epoch": 658} {"train_loss": -33.9645881652832, "global_step": 79720, "epoch": 658} {"train_loss": -34.0556640625, "global_step": 79721, "epoch": 658} {"train_loss": -32.15690994262695, "global_step": 79722, "epoch": 658} {"train_loss": -20.7720890045166, "global_step": 79723, "epoch": 658} {"train_loss": -32.7746467590332, "global_step": 79724, "epoch": 658} {"train_loss": -35.899574279785156, "global_step": 79725, "epoch": 658} {"train_loss": -27.794958114624023, "global_step": 79726, "epoch": 658} {"train_loss": -32.674896240234375, "global_step": 79727, "epoch": 658} {"train_loss": -25.37603187561035, "global_step": 79728, "epoch": 658} {"train_loss": -31.566938400268555, "global_step": 79729, "epoch": 658} {"train_loss": -32.407745361328125, "global_step": 79730, "epoch": 658} {"train_loss": -33.2440071105957, "global_step": 79731, "epoch": 658} {"train_loss": -33.89724349975586, "global_step": 79732, "epoch": 658} {"train_loss": -33.68743896484375, "global_step": 79733, "epoch": 658} {"train_loss": -33.593666076660156, "global_step": 79734, "epoch": 658} {"train_loss": -34.541847229003906, "global_step": 79735, "epoch": 658} {"train_loss": -31.558385848999023, "global_step": 79736, "epoch": 658} {"train_loss": -33.89155960083008, "global_step": 79737, "epoch": 658} {"train_loss": -36.266197157300205, "global_step": 79738, "epoch": 658, "val_loss": 2469840.25} {"train_loss": -33.7247428894043, "global_step": 79739, "epoch": 659} {"train_loss": -33.415069580078125, "global_step": 79740, "epoch": 659} {"train_loss": -32.87784957885742, "global_step": 79741, "epoch": 659} {"train_loss": -34.378108978271484, "global_step": 79742, "epoch": 659} {"train_loss": -33.226131439208984, "global_step": 79743, "epoch": 659} {"train_loss": -33.73588180541992, "global_step": 79744, "epoch": 659} {"train_loss": -33.569786071777344, "global_step": 79745, "epoch": 659} {"train_loss": -33.953521728515625, "global_step": 79746, "epoch": 659} {"train_loss": -32.95808792114258, "global_step": 79747, "epoch": 659} {"train_loss": -35.49589920043945, "global_step": 79748, "epoch": 659} {"train_loss": -35.40497970581055, "global_step": 79749, "epoch": 659} {"train_loss": -34.93659973144531, "global_step": 79750, "epoch": 659} {"train_loss": -35.2000846862793, "global_step": 79751, "epoch": 659} {"train_loss": -34.66682052612305, "global_step": 79752, "epoch": 659} {"train_loss": -34.79315948486328, "global_step": 79753, "epoch": 659} {"train_loss": -34.436065673828125, "global_step": 79754, "epoch": 659} {"train_loss": -35.16157150268555, "global_step": 79755, "epoch": 659} {"train_loss": -36.2503776550293, "global_step": 79756, "epoch": 659} {"train_loss": -35.836490631103516, "global_step": 79757, "epoch": 659} {"train_loss": -35.9278564453125, "global_step": 79758, "epoch": 659} {"train_loss": -35.67403793334961, "global_step": 79759, "epoch": 659} {"train_loss": -36.312278747558594, "global_step": 79760, "epoch": 659} {"train_loss": -35.74905776977539, "global_step": 79761, "epoch": 659} {"train_loss": -35.68419647216797, "global_step": 79762, "epoch": 659} {"train_loss": -36.442970275878906, "global_step": 79763, "epoch": 659} {"train_loss": -36.31039810180664, "global_step": 79764, "epoch": 659} {"train_loss": -36.25365447998047, "global_step": 79765, "epoch": 659} {"train_loss": -35.816768646240234, "global_step": 79766, "epoch": 659} {"train_loss": -36.122283935546875, "global_step": 79767, "epoch": 659} {"train_loss": -36.734466552734375, "global_step": 79768, "epoch": 659} {"train_loss": -36.534339904785156, "global_step": 79769, "epoch": 659} {"train_loss": -35.484832763671875, "global_step": 79770, "epoch": 659} {"train_loss": -36.76601791381836, "global_step": 79771, "epoch": 659} {"train_loss": -36.25238037109375, "global_step": 79772, "epoch": 659} {"train_loss": -36.744117736816406, "global_step": 79773, "epoch": 659} {"train_loss": -37.03718948364258, "global_step": 79774, "epoch": 659} {"train_loss": -36.09907150268555, "global_step": 79775, "epoch": 659} {"train_loss": -36.74818801879883, "global_step": 79776, "epoch": 659} {"train_loss": -37.48442459106445, "global_step": 79777, "epoch": 659} {"train_loss": -36.49485397338867, "global_step": 79778, "epoch": 659} {"train_loss": -36.620338439941406, "global_step": 79779, "epoch": 659} {"train_loss": -36.911720275878906, "global_step": 79780, "epoch": 659} {"train_loss": -36.62852096557617, "global_step": 79781, "epoch": 659} {"train_loss": -36.53241729736328, "global_step": 79782, "epoch": 659} {"train_loss": -36.5963020324707, "global_step": 79783, "epoch": 659} {"train_loss": -37.406246185302734, "global_step": 79784, "epoch": 659} {"train_loss": -37.33008575439453, "global_step": 79785, "epoch": 659} {"train_loss": -37.31732940673828, "global_step": 79786, "epoch": 659} {"train_loss": -37.6096076965332, "global_step": 79787, "epoch": 659} {"train_loss": -37.287147521972656, "global_step": 79788, "epoch": 659} {"train_loss": -37.00602340698242, "global_step": 79789, "epoch": 659} {"train_loss": -37.489383697509766, "global_step": 79790, "epoch": 659} {"train_loss": -37.95029830932617, "global_step": 79791, "epoch": 659} {"train_loss": -37.57769775390625, "global_step": 79792, "epoch": 659} {"train_loss": -37.60408401489258, "global_step": 79793, "epoch": 659} {"train_loss": -37.77277755737305, "global_step": 79794, "epoch": 659} {"train_loss": -37.56696319580078, "global_step": 79795, "epoch": 659} {"train_loss": -37.232208251953125, "global_step": 79796, "epoch": 659} {"train_loss": -37.81776809692383, "global_step": 79797, "epoch": 659} {"train_loss": -37.393497467041016, "global_step": 79798, "epoch": 659} {"train_loss": -38.17937088012695, "global_step": 79799, "epoch": 659} {"train_loss": -37.90046691894531, "global_step": 79800, "epoch": 659} {"train_loss": -37.7595329284668, "global_step": 79801, "epoch": 659} {"train_loss": -37.24367904663086, "global_step": 79802, "epoch": 659} {"train_loss": -35.9094352722168, "global_step": 79803, "epoch": 659} {"train_loss": -34.028717041015625, "global_step": 79804, "epoch": 659} {"train_loss": -32.11406326293945, "global_step": 79805, "epoch": 659} {"train_loss": -37.41071701049805, "global_step": 79806, "epoch": 659} {"train_loss": -22.612295150756836, "global_step": 79807, "epoch": 659} {"train_loss": -10.991472244262695, "global_step": 79808, "epoch": 659} {"train_loss": 103.82173919677734, "global_step": 79809, "epoch": 659} {"train_loss": 59.92257308959961, "global_step": 79810, "epoch": 659} {"train_loss": -16.41388511657715, "global_step": 79811, "epoch": 659} {"train_loss": 6.199697494506836, "global_step": 79812, "epoch": 659} {"train_loss": -2.497130870819092, "global_step": 79813, "epoch": 659} {"train_loss": -30.160531997680664, "global_step": 79814, "epoch": 659} {"train_loss": -11.00623893737793, "global_step": 79815, "epoch": 659} {"train_loss": -11.610602378845215, "global_step": 79816, "epoch": 659} {"train_loss": -28.093372344970703, "global_step": 79817, "epoch": 659} {"train_loss": -28.554101943969727, "global_step": 79818, "epoch": 659} {"train_loss": -21.787738800048828, "global_step": 79819, "epoch": 659} {"train_loss": -20.628910064697266, "global_step": 79820, "epoch": 659} {"train_loss": -26.251480102539062, "global_step": 79821, "epoch": 659} {"train_loss": -31.990888595581055, "global_step": 79822, "epoch": 659} {"train_loss": -32.54520034790039, "global_step": 79823, "epoch": 659} {"train_loss": -28.942523956298828, "global_step": 79824, "epoch": 659} {"train_loss": -26.96345329284668, "global_step": 79825, "epoch": 659} {"train_loss": -28.1019344329834, "global_step": 79826, "epoch": 659} {"train_loss": -30.428327560424805, "global_step": 79827, "epoch": 659} {"train_loss": -31.94964027404785, "global_step": 79828, "epoch": 659} {"train_loss": -33.31402587890625, "global_step": 79829, "epoch": 659} {"train_loss": -32.742156982421875, "global_step": 79830, "epoch": 659} {"train_loss": -31.594778060913086, "global_step": 79831, "epoch": 659} {"train_loss": -31.081119537353516, "global_step": 79832, "epoch": 659} {"train_loss": -31.019195556640625, "global_step": 79833, "epoch": 659} {"train_loss": -31.945484161376953, "global_step": 79834, "epoch": 659} {"train_loss": -32.25234603881836, "global_step": 79835, "epoch": 659} {"train_loss": -32.62241744995117, "global_step": 79836, "epoch": 659} {"train_loss": -33.46506881713867, "global_step": 79837, "epoch": 659} {"train_loss": -33.4697151184082, "global_step": 79838, "epoch": 659} {"train_loss": -32.98616409301758, "global_step": 79839, "epoch": 659} {"train_loss": -32.85211181640625, "global_step": 79840, "epoch": 659} {"train_loss": -33.018775939941406, "global_step": 79841, "epoch": 659} {"train_loss": -32.84611129760742, "global_step": 79842, "epoch": 659} {"train_loss": -33.13985061645508, "global_step": 79843, "epoch": 659} {"train_loss": -33.51807403564453, "global_step": 79844, "epoch": 659} {"train_loss": -33.86396026611328, "global_step": 79845, "epoch": 659} {"train_loss": -33.66461944580078, "global_step": 79846, "epoch": 659} {"train_loss": -33.806236267089844, "global_step": 79847, "epoch": 659} {"train_loss": -33.53971862792969, "global_step": 79848, "epoch": 659} {"train_loss": -33.87917709350586, "global_step": 79849, "epoch": 659} {"train_loss": -33.391780853271484, "global_step": 79850, "epoch": 659} {"train_loss": -33.970191955566406, "global_step": 79851, "epoch": 659} {"train_loss": -34.133541107177734, "global_step": 79852, "epoch": 659} {"train_loss": -34.077816009521484, "global_step": 79853, "epoch": 659} {"train_loss": -33.81303405761719, "global_step": 79854, "epoch": 659} {"train_loss": -34.31168746948242, "global_step": 79855, "epoch": 659} {"train_loss": -34.67025375366211, "global_step": 79856, "epoch": 659} {"train_loss": -34.30828857421875, "global_step": 79857, "epoch": 659} {"train_loss": -34.58717727661133, "global_step": 79858, "epoch": 659} {"train_loss": -31.04814867145759, "global_step": 79859, "epoch": 659, "val_loss": 2635754.75} {"train_loss": -34.72664260864258, "global_step": 79860, "epoch": 660} {"train_loss": -34.5375862121582, "global_step": 79861, "epoch": 660} {"train_loss": -34.767547607421875, "global_step": 79862, "epoch": 660} {"train_loss": -35.09140396118164, "global_step": 79863, "epoch": 660} {"train_loss": -34.657806396484375, "global_step": 79864, "epoch": 660} {"train_loss": -35.02461624145508, "global_step": 79865, "epoch": 660} {"train_loss": -34.863311767578125, "global_step": 79866, "epoch": 660} {"train_loss": -34.705787658691406, "global_step": 79867, "epoch": 660} {"train_loss": -35.18343734741211, "global_step": 79868, "epoch": 660} {"train_loss": -34.98335647583008, "global_step": 79869, "epoch": 660} {"train_loss": -35.38755416870117, "global_step": 79870, "epoch": 660} {"train_loss": -35.40403366088867, "global_step": 79871, "epoch": 660} {"train_loss": -34.970741271972656, "global_step": 79872, "epoch": 660} {"train_loss": -35.1304817199707, "global_step": 79873, "epoch": 660} {"train_loss": -35.55479049682617, "global_step": 79874, "epoch": 660} {"train_loss": -35.627357482910156, "global_step": 79875, "epoch": 660} {"train_loss": -35.10820388793945, "global_step": 79876, "epoch": 660} {"train_loss": -35.72286605834961, "global_step": 79877, "epoch": 660} {"train_loss": -35.4150505065918, "global_step": 79878, "epoch": 660} {"train_loss": -35.23066329956055, "global_step": 79879, "epoch": 660} {"train_loss": -35.81660079956055, "global_step": 79880, "epoch": 660} {"train_loss": -35.715660095214844, "global_step": 79881, "epoch": 660} {"train_loss": -35.471221923828125, "global_step": 79882, "epoch": 660} {"train_loss": -35.5614128112793, "global_step": 79883, "epoch": 660} {"train_loss": -35.71926498413086, "global_step": 79884, "epoch": 660} {"train_loss": -36.21211624145508, "global_step": 79885, "epoch": 660} {"train_loss": -35.957061767578125, "global_step": 79886, "epoch": 660} {"train_loss": -36.449954986572266, "global_step": 79887, "epoch": 660} {"train_loss": -35.888126373291016, "global_step": 79888, "epoch": 660} {"train_loss": -36.43769073486328, "global_step": 79889, "epoch": 660} {"train_loss": -35.98395538330078, "global_step": 79890, "epoch": 660} {"train_loss": -36.04133224487305, "global_step": 79891, "epoch": 660} {"train_loss": -36.236480712890625, "global_step": 79892, "epoch": 660} {"train_loss": -36.29112243652344, "global_step": 79893, "epoch": 660} {"train_loss": -36.01935958862305, "global_step": 79894, "epoch": 660} {"train_loss": -36.316741943359375, "global_step": 79895, "epoch": 660} {"train_loss": -36.609771728515625, "global_step": 79896, "epoch": 660} {"train_loss": -36.575775146484375, "global_step": 79897, "epoch": 660} {"train_loss": -36.22217559814453, "global_step": 79898, "epoch": 660} {"train_loss": -36.61022186279297, "global_step": 79899, "epoch": 660} {"train_loss": -36.52565002441406, "global_step": 79900, "epoch": 660} {"train_loss": -36.437862396240234, "global_step": 79901, "epoch": 660} {"train_loss": -36.4768180847168, "global_step": 79902, "epoch": 660} {"train_loss": -36.47542953491211, "global_step": 79903, "epoch": 660} {"train_loss": -36.65524673461914, "global_step": 79904, "epoch": 660} {"train_loss": -36.54727554321289, "global_step": 79905, "epoch": 660} {"train_loss": -36.85933303833008, "global_step": 79906, "epoch": 660} {"train_loss": -37.048255920410156, "global_step": 79907, "epoch": 660} {"train_loss": -36.851539611816406, "global_step": 79908, "epoch": 660} {"train_loss": -37.093231201171875, "global_step": 79909, "epoch": 660} {"train_loss": -36.597747802734375, "global_step": 79910, "epoch": 660} {"train_loss": -36.45209503173828, "global_step": 79911, "epoch": 660} {"train_loss": -36.945899963378906, "global_step": 79912, "epoch": 660} {"train_loss": -36.57072067260742, "global_step": 79913, "epoch": 660} {"train_loss": -37.140167236328125, "global_step": 79914, "epoch": 660} {"train_loss": -37.26606369018555, "global_step": 79915, "epoch": 660} {"train_loss": -37.12337112426758, "global_step": 79916, "epoch": 660} {"train_loss": -36.76353073120117, "global_step": 79917, "epoch": 660} {"train_loss": -36.772857666015625, "global_step": 79918, "epoch": 660} {"train_loss": -36.76375198364258, "global_step": 79919, "epoch": 660} {"train_loss": -37.36270523071289, "global_step": 79920, "epoch": 660} {"train_loss": -37.38976287841797, "global_step": 79921, "epoch": 660} {"train_loss": -37.263916015625, "global_step": 79922, "epoch": 660} {"train_loss": -37.2928466796875, "global_step": 79923, "epoch": 660} {"train_loss": -37.133819580078125, "global_step": 79924, "epoch": 660} {"train_loss": -37.30059814453125, "global_step": 79925, "epoch": 660} {"train_loss": -37.369869232177734, "global_step": 79926, "epoch": 660} {"train_loss": -37.193016052246094, "global_step": 79927, "epoch": 660} {"train_loss": -37.404083251953125, "global_step": 79928, "epoch": 660} {"train_loss": -37.16176986694336, "global_step": 79929, "epoch": 660} {"train_loss": -37.64132308959961, "global_step": 79930, "epoch": 660} {"train_loss": -37.115230560302734, "global_step": 79931, "epoch": 660} {"train_loss": -37.24488067626953, "global_step": 79932, "epoch": 660} {"train_loss": -37.726104736328125, "global_step": 79933, "epoch": 660} {"train_loss": -37.411128997802734, "global_step": 79934, "epoch": 660} {"train_loss": -37.58171081542969, "global_step": 79935, "epoch": 660} {"train_loss": -37.613380432128906, "global_step": 79936, "epoch": 660} {"train_loss": -37.21073913574219, "global_step": 79937, "epoch": 660} {"train_loss": -37.4877815246582, "global_step": 79938, "epoch": 660} {"train_loss": -37.02346420288086, "global_step": 79939, "epoch": 660} {"train_loss": -37.32544708251953, "global_step": 79940, "epoch": 660} {"train_loss": -37.272552490234375, "global_step": 79941, "epoch": 660} {"train_loss": -37.1036491394043, "global_step": 79942, "epoch": 660} {"train_loss": -37.92247772216797, "global_step": 79943, "epoch": 660} {"train_loss": -37.923500061035156, "global_step": 79944, "epoch": 660} {"train_loss": -36.679779052734375, "global_step": 79945, "epoch": 660} {"train_loss": -37.1024169921875, "global_step": 79946, "epoch": 660} {"train_loss": -36.99385452270508, "global_step": 79947, "epoch": 660} {"train_loss": -37.48621368408203, "global_step": 79948, "epoch": 660} {"train_loss": -35.49848556518555, "global_step": 79949, "epoch": 660} {"train_loss": -36.41718673706055, "global_step": 79950, "epoch": 660} {"train_loss": -37.2982292175293, "global_step": 79951, "epoch": 660} {"train_loss": -37.209556579589844, "global_step": 79952, "epoch": 660} {"train_loss": -37.1486930847168, "global_step": 79953, "epoch": 660} {"train_loss": -36.54030990600586, "global_step": 79954, "epoch": 660} {"train_loss": -37.1847038269043, "global_step": 79955, "epoch": 660} {"train_loss": -36.98469161987305, "global_step": 79956, "epoch": 660} {"train_loss": -36.4913444519043, "global_step": 79957, "epoch": 660} {"train_loss": -36.455291748046875, "global_step": 79958, "epoch": 660} {"train_loss": -37.08399200439453, "global_step": 79959, "epoch": 660} {"train_loss": -36.53932189941406, "global_step": 79960, "epoch": 660} {"train_loss": -35.842220306396484, "global_step": 79961, "epoch": 660} {"train_loss": -36.93241500854492, "global_step": 79962, "epoch": 660} {"train_loss": -35.13618087768555, "global_step": 79963, "epoch": 660} {"train_loss": -34.48611831665039, "global_step": 79964, "epoch": 660} {"train_loss": -36.341854095458984, "global_step": 79965, "epoch": 660} {"train_loss": -35.65668869018555, "global_step": 79966, "epoch": 660} {"train_loss": -34.7252082824707, "global_step": 79967, "epoch": 660} {"train_loss": -36.23250961303711, "global_step": 79968, "epoch": 660} {"train_loss": -35.462074279785156, "global_step": 79969, "epoch": 660} {"train_loss": -36.27093505859375, "global_step": 79970, "epoch": 660} {"train_loss": -36.53336715698242, "global_step": 79971, "epoch": 660} {"train_loss": -35.59117889404297, "global_step": 79972, "epoch": 660} {"train_loss": -35.2909049987793, "global_step": 79973, "epoch": 660} {"train_loss": -36.956966400146484, "global_step": 79974, "epoch": 660} {"train_loss": -35.96995162963867, "global_step": 79975, "epoch": 660} {"train_loss": -36.93224334716797, "global_step": 79976, "epoch": 660} {"train_loss": -35.62511444091797, "global_step": 79977, "epoch": 660} {"train_loss": -36.87289810180664, "global_step": 79978, "epoch": 660} {"train_loss": -32.90684127807617, "global_step": 79979, "epoch": 660} {"train_loss": -36.35424959166976, "global_step": 79980, "epoch": 660, "val_loss": 2623352.75} {"train_loss": -35.651790618896484, "global_step": 79981, "epoch": 661} {"train_loss": -35.9521598815918, "global_step": 79982, "epoch": 661} {"train_loss": -36.39170455932617, "global_step": 79983, "epoch": 661} {"train_loss": -34.94480895996094, "global_step": 79984, "epoch": 661} {"train_loss": -35.09774398803711, "global_step": 79985, "epoch": 661} {"train_loss": -34.61114501953125, "global_step": 79986, "epoch": 661} {"train_loss": -31.081836700439453, "global_step": 79987, "epoch": 661} {"train_loss": -35.201629638671875, "global_step": 79988, "epoch": 661} {"train_loss": -36.671051025390625, "global_step": 79989, "epoch": 661} {"train_loss": -33.77555465698242, "global_step": 79990, "epoch": 661} {"train_loss": -36.572479248046875, "global_step": 79991, "epoch": 661} {"train_loss": -33.485713958740234, "global_step": 79992, "epoch": 661} {"train_loss": -33.458858489990234, "global_step": 79993, "epoch": 661} {"train_loss": -35.83158493041992, "global_step": 79994, "epoch": 661} {"train_loss": -35.35321044921875, "global_step": 79995, "epoch": 661} {"train_loss": -32.49393844604492, "global_step": 79996, "epoch": 661} {"train_loss": -34.443416595458984, "global_step": 79997, "epoch": 661} {"train_loss": -35.629451751708984, "global_step": 79998, "epoch": 661} {"train_loss": -34.196773529052734, "global_step": 79999, "epoch": 661} {"train_loss": -35.27061080932617, "global_step": 80000, "epoch": 661} {"train_loss": -35.07615280151367, "global_step": 80001, "epoch": 661} {"train_loss": -35.37690353393555, "global_step": 80002, "epoch": 661} {"train_loss": -34.5684814453125, "global_step": 80003, "epoch": 661} {"train_loss": -35.42219924926758, "global_step": 80004, "epoch": 661} {"train_loss": -35.60957717895508, "global_step": 80005, "epoch": 661} {"train_loss": -35.87306594848633, "global_step": 80006, "epoch": 661} {"train_loss": -35.4431266784668, "global_step": 80007, "epoch": 661} {"train_loss": -34.86983871459961, "global_step": 80008, "epoch": 661} {"train_loss": -33.8544921875, "global_step": 80009, "epoch": 661} {"train_loss": -36.533714294433594, "global_step": 80010, "epoch": 661} {"train_loss": -35.898658752441406, "global_step": 80011, "epoch": 661} {"train_loss": -34.940547943115234, "global_step": 80012, "epoch": 661} {"train_loss": -36.078433990478516, "global_step": 80013, "epoch": 661} {"train_loss": -36.13694763183594, "global_step": 80014, "epoch": 661} {"train_loss": -35.14249038696289, "global_step": 80015, "epoch": 661} {"train_loss": -35.86975860595703, "global_step": 80016, "epoch": 661} {"train_loss": -35.30382537841797, "global_step": 80017, "epoch": 661} {"train_loss": -35.22481918334961, "global_step": 80018, "epoch": 661} {"train_loss": -36.25468063354492, "global_step": 80019, "epoch": 661} {"train_loss": -35.54634094238281, "global_step": 80020, "epoch": 661} {"train_loss": -35.297760009765625, "global_step": 80021, "epoch": 661} {"train_loss": -36.40986251831055, "global_step": 80022, "epoch": 661} {"train_loss": -35.26215744018555, "global_step": 80023, "epoch": 661} {"train_loss": -34.43854904174805, "global_step": 80024, "epoch": 661} {"train_loss": -36.00984191894531, "global_step": 80025, "epoch": 661} {"train_loss": -36.0963249206543, "global_step": 80026, "epoch": 661} {"train_loss": -36.20931625366211, "global_step": 80027, "epoch": 661} {"train_loss": -34.225101470947266, "global_step": 80028, "epoch": 661} {"train_loss": -33.61214828491211, "global_step": 80029, "epoch": 661} {"train_loss": -36.37775802612305, "global_step": 80030, "epoch": 661} {"train_loss": -36.61174392700195, "global_step": 80031, "epoch": 661} {"train_loss": -36.00191879272461, "global_step": 80032, "epoch": 661} {"train_loss": -34.91764450073242, "global_step": 80033, "epoch": 661} {"train_loss": -36.08721923828125, "global_step": 80034, "epoch": 661} {"train_loss": -35.90842819213867, "global_step": 80035, "epoch": 661} {"train_loss": -36.14081573486328, "global_step": 80036, "epoch": 661} {"train_loss": -36.832984924316406, "global_step": 80037, "epoch": 661} {"train_loss": -36.15617752075195, "global_step": 80038, "epoch": 661} {"train_loss": -36.1400032043457, "global_step": 80039, "epoch": 661} {"train_loss": -36.23552322387695, "global_step": 80040, "epoch": 661} {"train_loss": -36.178707122802734, "global_step": 80041, "epoch": 661} {"train_loss": -35.38161849975586, "global_step": 80042, "epoch": 661} {"train_loss": -36.10011672973633, "global_step": 80043, "epoch": 661} {"train_loss": -36.27278518676758, "global_step": 80044, "epoch": 661} {"train_loss": -36.589359283447266, "global_step": 80045, "epoch": 661} {"train_loss": -36.26027297973633, "global_step": 80046, "epoch": 661} {"train_loss": -35.62925720214844, "global_step": 80047, "epoch": 661} {"train_loss": -36.10385513305664, "global_step": 80048, "epoch": 661} {"train_loss": -36.18413162231445, "global_step": 80049, "epoch": 661} {"train_loss": -36.37356185913086, "global_step": 80050, "epoch": 661} {"train_loss": -36.795040130615234, "global_step": 80051, "epoch": 661} {"train_loss": -37.49435043334961, "global_step": 80052, "epoch": 661} {"train_loss": -36.53105545043945, "global_step": 80053, "epoch": 661} {"train_loss": -36.664642333984375, "global_step": 80054, "epoch": 661} {"train_loss": -36.995399475097656, "global_step": 80055, "epoch": 661} {"train_loss": -36.82762145996094, "global_step": 80056, "epoch": 661} {"train_loss": -36.826141357421875, "global_step": 80057, "epoch": 661} {"train_loss": -36.25578689575195, "global_step": 80058, "epoch": 661} {"train_loss": -37.19770431518555, "global_step": 80059, "epoch": 661} {"train_loss": -36.748477935791016, "global_step": 80060, "epoch": 661} {"train_loss": -37.70177459716797, "global_step": 80061, "epoch": 661} {"train_loss": -37.353248596191406, "global_step": 80062, "epoch": 661} {"train_loss": -37.14033126831055, "global_step": 80063, "epoch": 661} {"train_loss": -37.00484085083008, "global_step": 80064, "epoch": 661} {"train_loss": -36.81156539916992, "global_step": 80065, "epoch": 661} {"train_loss": -37.16632843017578, "global_step": 80066, "epoch": 661} {"train_loss": -37.04380416870117, "global_step": 80067, "epoch": 661} {"train_loss": -37.590431213378906, "global_step": 80068, "epoch": 661} {"train_loss": -37.900184631347656, "global_step": 80069, "epoch": 661} {"train_loss": -37.4586181640625, "global_step": 80070, "epoch": 661} {"train_loss": -37.51803970336914, "global_step": 80071, "epoch": 661} {"train_loss": -37.14990234375, "global_step": 80072, "epoch": 661} {"train_loss": -37.5097770690918, "global_step": 80073, "epoch": 661} {"train_loss": -37.315711975097656, "global_step": 80074, "epoch": 661} {"train_loss": -37.708858489990234, "global_step": 80075, "epoch": 661} {"train_loss": -37.086185455322266, "global_step": 80076, "epoch": 661} {"train_loss": -37.17916488647461, "global_step": 80077, "epoch": 661} {"train_loss": -37.777198791503906, "global_step": 80078, "epoch": 661} {"train_loss": -37.91523742675781, "global_step": 80079, "epoch": 661} {"train_loss": -37.82854080200195, "global_step": 80080, "epoch": 661} {"train_loss": -37.16579055786133, "global_step": 80081, "epoch": 661} {"train_loss": -37.38535690307617, "global_step": 80082, "epoch": 661} {"train_loss": -37.795326232910156, "global_step": 80083, "epoch": 661} {"train_loss": -37.683837890625, "global_step": 80084, "epoch": 661} {"train_loss": -37.05242156982422, "global_step": 80085, "epoch": 661} {"train_loss": -37.687374114990234, "global_step": 80086, "epoch": 661} {"train_loss": -37.46294021606445, "global_step": 80087, "epoch": 661} {"train_loss": -37.513431549072266, "global_step": 80088, "epoch": 661} {"train_loss": -37.6037712097168, "global_step": 80089, "epoch": 661} {"train_loss": -37.18868637084961, "global_step": 80090, "epoch": 661} {"train_loss": -36.3090705871582, "global_step": 80091, "epoch": 661} {"train_loss": -37.60625076293945, "global_step": 80092, "epoch": 661} {"train_loss": -36.47866439819336, "global_step": 80093, "epoch": 661} {"train_loss": -36.486934661865234, "global_step": 80094, "epoch": 661} {"train_loss": -34.41522216796875, "global_step": 80095, "epoch": 661} {"train_loss": -35.12162399291992, "global_step": 80096, "epoch": 661} {"train_loss": -33.734832763671875, "global_step": 80097, "epoch": 661} {"train_loss": -33.53123092651367, "global_step": 80098, "epoch": 661} {"train_loss": -31.072378158569336, "global_step": 80099, "epoch": 661} {"train_loss": -32.319942474365234, "global_step": 80100, "epoch": 661} {"train_loss": -35.992111190291475, "global_step": 80101, "epoch": 661, "val_loss": 2643712.25} {"train_loss": -36.99506759643555, "global_step": 80102, "epoch": 662} {"train_loss": -36.149288177490234, "global_step": 80103, "epoch": 662} {"train_loss": -34.2907829284668, "global_step": 80104, "epoch": 662} {"train_loss": -35.0075798034668, "global_step": 80105, "epoch": 662} {"train_loss": -36.23099899291992, "global_step": 80106, "epoch": 662} {"train_loss": -36.55794143676758, "global_step": 80107, "epoch": 662} {"train_loss": -36.333641052246094, "global_step": 80108, "epoch": 662} {"train_loss": -36.97563552856445, "global_step": 80109, "epoch": 662} {"train_loss": -36.47383499145508, "global_step": 80110, "epoch": 662} {"train_loss": -36.49983596801758, "global_step": 80111, "epoch": 662} {"train_loss": -36.70356750488281, "global_step": 80112, "epoch": 662} {"train_loss": -36.5222282409668, "global_step": 80113, "epoch": 662} {"train_loss": -35.67045211791992, "global_step": 80114, "epoch": 662} {"train_loss": -36.310340881347656, "global_step": 80115, "epoch": 662} {"train_loss": -36.96566390991211, "global_step": 80116, "epoch": 662} {"train_loss": -35.975032806396484, "global_step": 80117, "epoch": 662} {"train_loss": -35.982723236083984, "global_step": 80118, "epoch": 662} {"train_loss": -35.28203201293945, "global_step": 80119, "epoch": 662} {"train_loss": -36.212646484375, "global_step": 80120, "epoch": 662} {"train_loss": -36.91530990600586, "global_step": 80121, "epoch": 662} {"train_loss": -37.36933135986328, "global_step": 80122, "epoch": 662} {"train_loss": -36.43012619018555, "global_step": 80123, "epoch": 662} {"train_loss": -36.5783805847168, "global_step": 80124, "epoch": 662} {"train_loss": -36.32204055786133, "global_step": 80125, "epoch": 662} {"train_loss": -36.96926498413086, "global_step": 80126, "epoch": 662} {"train_loss": -36.39750671386719, "global_step": 80127, "epoch": 662} {"train_loss": -36.68769454956055, "global_step": 80128, "epoch": 662} {"train_loss": -37.49728012084961, "global_step": 80129, "epoch": 662} {"train_loss": -36.66927719116211, "global_step": 80130, "epoch": 662} {"train_loss": -36.64642333984375, "global_step": 80131, "epoch": 662} {"train_loss": -37.27240753173828, "global_step": 80132, "epoch": 662} {"train_loss": -37.15317916870117, "global_step": 80133, "epoch": 662} {"train_loss": -37.32041549682617, "global_step": 80134, "epoch": 662} {"train_loss": -37.013145446777344, "global_step": 80135, "epoch": 662} {"train_loss": -36.64534378051758, "global_step": 80136, "epoch": 662} {"train_loss": -37.68911361694336, "global_step": 80137, "epoch": 662} {"train_loss": -35.32686233520508, "global_step": 80138, "epoch": 662} {"train_loss": -37.29749298095703, "global_step": 80139, "epoch": 662} {"train_loss": -35.999900817871094, "global_step": 80140, "epoch": 662} {"train_loss": -36.947509765625, "global_step": 80141, "epoch": 662} {"train_loss": -37.273983001708984, "global_step": 80142, "epoch": 662} {"train_loss": -37.14973068237305, "global_step": 80143, "epoch": 662} {"train_loss": -36.93157958984375, "global_step": 80144, "epoch": 662} {"train_loss": -36.3945198059082, "global_step": 80145, "epoch": 662} {"train_loss": -36.6409797668457, "global_step": 80146, "epoch": 662} {"train_loss": -36.31208038330078, "global_step": 80147, "epoch": 662} {"train_loss": -37.04677963256836, "global_step": 80148, "epoch": 662} {"train_loss": -36.880645751953125, "global_step": 80149, "epoch": 662} {"train_loss": -37.36579895019531, "global_step": 80150, "epoch": 662} {"train_loss": -36.12138748168945, "global_step": 80151, "epoch": 662} {"train_loss": -37.129798889160156, "global_step": 80152, "epoch": 662} {"train_loss": -36.78388595581055, "global_step": 80153, "epoch": 662} {"train_loss": -37.767181396484375, "global_step": 80154, "epoch": 662} {"train_loss": -37.43989562988281, "global_step": 80155, "epoch": 662} {"train_loss": -37.29368209838867, "global_step": 80156, "epoch": 662} {"train_loss": -37.849239349365234, "global_step": 80157, "epoch": 662} {"train_loss": -37.342708587646484, "global_step": 80158, "epoch": 662} {"train_loss": -37.632606506347656, "global_step": 80159, "epoch": 662} {"train_loss": -37.68510055541992, "global_step": 80160, "epoch": 662} {"train_loss": -35.49924850463867, "global_step": 80161, "epoch": 662} {"train_loss": -36.9121208190918, "global_step": 80162, "epoch": 662} {"train_loss": -37.0334358215332, "global_step": 80163, "epoch": 662} {"train_loss": -37.542659759521484, "global_step": 80164, "epoch": 662} {"train_loss": -37.58951187133789, "global_step": 80165, "epoch": 662} {"train_loss": -36.693965911865234, "global_step": 80166, "epoch": 662} {"train_loss": -37.25772476196289, "global_step": 80167, "epoch": 662} {"train_loss": -36.1807861328125, "global_step": 80168, "epoch": 662} {"train_loss": -36.839454650878906, "global_step": 80169, "epoch": 662} {"train_loss": -37.52876663208008, "global_step": 80170, "epoch": 662} {"train_loss": -37.18000411987305, "global_step": 80171, "epoch": 662} {"train_loss": -37.07004928588867, "global_step": 80172, "epoch": 662} {"train_loss": -35.4166259765625, "global_step": 80173, "epoch": 662} {"train_loss": -33.58152389526367, "global_step": 80174, "epoch": 662} {"train_loss": -28.0575008392334, "global_step": 80175, "epoch": 662} {"train_loss": -25.07712745666504, "global_step": 80176, "epoch": 662} {"train_loss": -34.86153793334961, "global_step": 80177, "epoch": 662} {"train_loss": -36.70542526245117, "global_step": 80178, "epoch": 662} {"train_loss": -29.15459632873535, "global_step": 80179, "epoch": 662} {"train_loss": -31.070520401000977, "global_step": 80180, "epoch": 662} {"train_loss": -37.0662956237793, "global_step": 80181, "epoch": 662} {"train_loss": -30.91749382019043, "global_step": 80182, "epoch": 662} {"train_loss": -34.24270248413086, "global_step": 80183, "epoch": 662} {"train_loss": -31.676156997680664, "global_step": 80184, "epoch": 662} {"train_loss": -30.583023071289062, "global_step": 80185, "epoch": 662} {"train_loss": -34.72666931152344, "global_step": 80186, "epoch": 662} {"train_loss": -31.079818725585938, "global_step": 80187, "epoch": 662} {"train_loss": -35.947242736816406, "global_step": 80188, "epoch": 662} {"train_loss": -34.95292282104492, "global_step": 80189, "epoch": 662} {"train_loss": -35.80665969848633, "global_step": 80190, "epoch": 662} {"train_loss": -35.414459228515625, "global_step": 80191, "epoch": 662} {"train_loss": -35.05503463745117, "global_step": 80192, "epoch": 662} {"train_loss": -36.10292434692383, "global_step": 80193, "epoch": 662} {"train_loss": -35.611785888671875, "global_step": 80194, "epoch": 662} {"train_loss": -36.20115280151367, "global_step": 80195, "epoch": 662} {"train_loss": -35.74103927612305, "global_step": 80196, "epoch": 662} {"train_loss": -34.918975830078125, "global_step": 80197, "epoch": 662} {"train_loss": -36.20830535888672, "global_step": 80198, "epoch": 662} {"train_loss": -35.94521713256836, "global_step": 80199, "epoch": 662} {"train_loss": -36.136962890625, "global_step": 80200, "epoch": 662} {"train_loss": -35.748634338378906, "global_step": 80201, "epoch": 662} {"train_loss": -34.786956787109375, "global_step": 80202, "epoch": 662} {"train_loss": -36.39334487915039, "global_step": 80203, "epoch": 662} {"train_loss": -36.036216735839844, "global_step": 80204, "epoch": 662} {"train_loss": -36.51163864135742, "global_step": 80205, "epoch": 662} {"train_loss": -36.28109359741211, "global_step": 80206, "epoch": 662} {"train_loss": -36.29903030395508, "global_step": 80207, "epoch": 662} {"train_loss": -36.8719596862793, "global_step": 80208, "epoch": 662} {"train_loss": -36.493927001953125, "global_step": 80209, "epoch": 662} {"train_loss": -35.498538970947266, "global_step": 80210, "epoch": 662} {"train_loss": -37.0973014831543, "global_step": 80211, "epoch": 662} {"train_loss": -36.336849212646484, "global_step": 80212, "epoch": 662} {"train_loss": -35.52517318725586, "global_step": 80213, "epoch": 662} {"train_loss": -37.07233428955078, "global_step": 80214, "epoch": 662} {"train_loss": -35.74129104614258, "global_step": 80215, "epoch": 662} {"train_loss": -36.90517807006836, "global_step": 80216, "epoch": 662} {"train_loss": -36.73735809326172, "global_step": 80217, "epoch": 662} {"train_loss": -36.82814407348633, "global_step": 80218, "epoch": 662} {"train_loss": -36.16025924682617, "global_step": 80219, "epoch": 662} {"train_loss": -37.2816162109375, "global_step": 80220, "epoch": 662} {"train_loss": -36.371089935302734, "global_step": 80221, "epoch": 662} {"train_loss": -36.00874016501687, "global_step": 80222, "epoch": 662, "val_loss": 2699213.5} {"train_loss": -37.09805679321289, "global_step": 80223, "epoch": 663} {"train_loss": -37.281856536865234, "global_step": 80224, "epoch": 663} {"train_loss": -36.8427848815918, "global_step": 80225, "epoch": 663} {"train_loss": -37.46918869018555, "global_step": 80226, "epoch": 663} {"train_loss": -37.8731575012207, "global_step": 80227, "epoch": 663} {"train_loss": -37.31087875366211, "global_step": 80228, "epoch": 663} {"train_loss": -38.102291107177734, "global_step": 80229, "epoch": 663} {"train_loss": -37.59386444091797, "global_step": 80230, "epoch": 663} {"train_loss": -35.865631103515625, "global_step": 80231, "epoch": 663} {"train_loss": -36.57398223876953, "global_step": 80232, "epoch": 663} {"train_loss": -36.2639045715332, "global_step": 80233, "epoch": 663} {"train_loss": -36.08559799194336, "global_step": 80234, "epoch": 663} {"train_loss": -35.05691146850586, "global_step": 80235, "epoch": 663} {"train_loss": -36.92412567138672, "global_step": 80236, "epoch": 663} {"train_loss": -37.53700637817383, "global_step": 80237, "epoch": 663} {"train_loss": -36.22629928588867, "global_step": 80238, "epoch": 663} {"train_loss": -35.497291564941406, "global_step": 80239, "epoch": 663} {"train_loss": -34.5265007019043, "global_step": 80240, "epoch": 663} {"train_loss": -37.03768539428711, "global_step": 80241, "epoch": 663} {"train_loss": -36.25409698486328, "global_step": 80242, "epoch": 663} {"train_loss": -36.71971893310547, "global_step": 80243, "epoch": 663} {"train_loss": -35.843841552734375, "global_step": 80244, "epoch": 663} {"train_loss": -36.57038497924805, "global_step": 80245, "epoch": 663} {"train_loss": -37.358497619628906, "global_step": 80246, "epoch": 663} {"train_loss": -35.947261810302734, "global_step": 80247, "epoch": 663} {"train_loss": -37.301021575927734, "global_step": 80248, "epoch": 663} {"train_loss": -36.68290328979492, "global_step": 80249, "epoch": 663} {"train_loss": -36.973182678222656, "global_step": 80250, "epoch": 663} {"train_loss": -34.645137786865234, "global_step": 80251, "epoch": 663} {"train_loss": -36.469970703125, "global_step": 80252, "epoch": 663} {"train_loss": -36.56588363647461, "global_step": 80253, "epoch": 663} {"train_loss": -36.15821075439453, "global_step": 80254, "epoch": 663} {"train_loss": -35.168678283691406, "global_step": 80255, "epoch": 663} {"train_loss": -35.02436828613281, "global_step": 80256, "epoch": 663} {"train_loss": -33.75893783569336, "global_step": 80257, "epoch": 663} {"train_loss": -36.4815559387207, "global_step": 80258, "epoch": 663} {"train_loss": -35.83182907104492, "global_step": 80259, "epoch": 663} {"train_loss": -35.92808151245117, "global_step": 80260, "epoch": 663} {"train_loss": -34.439632415771484, "global_step": 80261, "epoch": 663} {"train_loss": -34.4630241394043, "global_step": 80262, "epoch": 663} {"train_loss": -34.372867584228516, "global_step": 80263, "epoch": 663} {"train_loss": -35.101314544677734, "global_step": 80264, "epoch": 663} {"train_loss": -35.80955505371094, "global_step": 80265, "epoch": 663} {"train_loss": -32.740089416503906, "global_step": 80266, "epoch": 663} {"train_loss": -35.0531120300293, "global_step": 80267, "epoch": 663} {"train_loss": -35.38767623901367, "global_step": 80268, "epoch": 663} {"train_loss": -35.040523529052734, "global_step": 80269, "epoch": 663} {"train_loss": -35.26219177246094, "global_step": 80270, "epoch": 663} {"train_loss": -35.07022476196289, "global_step": 80271, "epoch": 663} {"train_loss": -35.620750427246094, "global_step": 80272, "epoch": 663} {"train_loss": -33.867733001708984, "global_step": 80273, "epoch": 663} {"train_loss": -36.024234771728516, "global_step": 80274, "epoch": 663} {"train_loss": -35.98725509643555, "global_step": 80275, "epoch": 663} {"train_loss": -36.25408172607422, "global_step": 80276, "epoch": 663} {"train_loss": -36.37568283081055, "global_step": 80277, "epoch": 663} {"train_loss": -35.37548828125, "global_step": 80278, "epoch": 663} {"train_loss": -36.0648307800293, "global_step": 80279, "epoch": 663} {"train_loss": -36.04288101196289, "global_step": 80280, "epoch": 663} {"train_loss": -35.479393005371094, "global_step": 80281, "epoch": 663} {"train_loss": -35.535125732421875, "global_step": 80282, "epoch": 663} {"train_loss": -36.86804962158203, "global_step": 80283, "epoch": 663} {"train_loss": -35.77834701538086, "global_step": 80284, "epoch": 663} {"train_loss": -36.24860763549805, "global_step": 80285, "epoch": 663} {"train_loss": -36.24584197998047, "global_step": 80286, "epoch": 663} {"train_loss": -36.21608352661133, "global_step": 80287, "epoch": 663} {"train_loss": -36.48398971557617, "global_step": 80288, "epoch": 663} {"train_loss": -36.612701416015625, "global_step": 80289, "epoch": 663} {"train_loss": -36.14116287231445, "global_step": 80290, "epoch": 663} {"train_loss": -35.34543991088867, "global_step": 80291, "epoch": 663} {"train_loss": -36.3192138671875, "global_step": 80292, "epoch": 663} {"train_loss": -36.141746520996094, "global_step": 80293, "epoch": 663} {"train_loss": -35.8413200378418, "global_step": 80294, "epoch": 663} {"train_loss": -35.547340393066406, "global_step": 80295, "epoch": 663} {"train_loss": -36.68952178955078, "global_step": 80296, "epoch": 663} {"train_loss": -36.478271484375, "global_step": 80297, "epoch": 663} {"train_loss": -35.5953483581543, "global_step": 80298, "epoch": 663} {"train_loss": -36.577789306640625, "global_step": 80299, "epoch": 663} {"train_loss": -35.892887115478516, "global_step": 80300, "epoch": 663} {"train_loss": -36.943904876708984, "global_step": 80301, "epoch": 663} {"train_loss": -36.898475646972656, "global_step": 80302, "epoch": 663} {"train_loss": -36.87794876098633, "global_step": 80303, "epoch": 663} {"train_loss": -37.29066848754883, "global_step": 80304, "epoch": 663} {"train_loss": -36.21696090698242, "global_step": 80305, "epoch": 663} {"train_loss": -36.00924301147461, "global_step": 80306, "epoch": 663} {"train_loss": -36.90541076660156, "global_step": 80307, "epoch": 663} {"train_loss": -37.088539123535156, "global_step": 80308, "epoch": 663} {"train_loss": -36.22745895385742, "global_step": 80309, "epoch": 663} {"train_loss": -36.27451705932617, "global_step": 80310, "epoch": 663} {"train_loss": -36.3025016784668, "global_step": 80311, "epoch": 663} {"train_loss": -33.76622009277344, "global_step": 80312, "epoch": 663} {"train_loss": -36.241119384765625, "global_step": 80313, "epoch": 663} {"train_loss": -37.013206481933594, "global_step": 80314, "epoch": 663} {"train_loss": -36.36996078491211, "global_step": 80315, "epoch": 663} {"train_loss": -36.78351593017578, "global_step": 80316, "epoch": 663} {"train_loss": -37.2625732421875, "global_step": 80317, "epoch": 663} {"train_loss": -37.053035736083984, "global_step": 80318, "epoch": 663} {"train_loss": -36.8997917175293, "global_step": 80319, "epoch": 663} {"train_loss": -36.24770736694336, "global_step": 80320, "epoch": 663} {"train_loss": -37.32262420654297, "global_step": 80321, "epoch": 663} {"train_loss": -37.06155014038086, "global_step": 80322, "epoch": 663} {"train_loss": -36.918052673339844, "global_step": 80323, "epoch": 663} {"train_loss": -36.92523193359375, "global_step": 80324, "epoch": 663} {"train_loss": -36.77724838256836, "global_step": 80325, "epoch": 663} {"train_loss": -36.93130111694336, "global_step": 80326, "epoch": 663} {"train_loss": -36.834903717041016, "global_step": 80327, "epoch": 663} {"train_loss": -37.33346176147461, "global_step": 80328, "epoch": 663} {"train_loss": -37.40180587768555, "global_step": 80329, "epoch": 663} {"train_loss": -37.486000061035156, "global_step": 80330, "epoch": 663} {"train_loss": -36.86936569213867, "global_step": 80331, "epoch": 663} {"train_loss": -37.344932556152344, "global_step": 80332, "epoch": 663} {"train_loss": -36.89826202392578, "global_step": 80333, "epoch": 663} {"train_loss": -37.02994918823242, "global_step": 80334, "epoch": 663} {"train_loss": -36.9473876953125, "global_step": 80335, "epoch": 663} {"train_loss": -37.45333480834961, "global_step": 80336, "epoch": 663} {"train_loss": -37.66700744628906, "global_step": 80337, "epoch": 663} {"train_loss": -36.46977615356445, "global_step": 80338, "epoch": 663} {"train_loss": -36.692657470703125, "global_step": 80339, "epoch": 663} {"train_loss": -36.80348587036133, "global_step": 80340, "epoch": 663} {"train_loss": -36.747283935546875, "global_step": 80341, "epoch": 663} {"train_loss": -37.461952209472656, "global_step": 80342, "epoch": 663} {"train_loss": -36.30139535320692, "global_step": 80343, "epoch": 663, "val_loss": 2624327.75} {"train_loss": -37.426387786865234, "global_step": 80344, "epoch": 664} {"train_loss": -36.9138298034668, "global_step": 80345, "epoch": 664} {"train_loss": -37.0288200378418, "global_step": 80346, "epoch": 664} {"train_loss": -37.78414535522461, "global_step": 80347, "epoch": 664} {"train_loss": -37.629512786865234, "global_step": 80348, "epoch": 664} {"train_loss": -37.05941390991211, "global_step": 80349, "epoch": 664} {"train_loss": -36.52474594116211, "global_step": 80350, "epoch": 664} {"train_loss": -35.53840255737305, "global_step": 80351, "epoch": 664} {"train_loss": -35.980377197265625, "global_step": 80352, "epoch": 664} {"train_loss": -37.73600387573242, "global_step": 80353, "epoch": 664} {"train_loss": -37.37385940551758, "global_step": 80354, "epoch": 664} {"train_loss": -35.57699966430664, "global_step": 80355, "epoch": 664} {"train_loss": -33.61268997192383, "global_step": 80356, "epoch": 664} {"train_loss": -36.07033157348633, "global_step": 80357, "epoch": 664} {"train_loss": -37.08519744873047, "global_step": 80358, "epoch": 664} {"train_loss": -36.15885543823242, "global_step": 80359, "epoch": 664} {"train_loss": -35.37284469604492, "global_step": 80360, "epoch": 664} {"train_loss": -37.29229736328125, "global_step": 80361, "epoch": 664} {"train_loss": -36.75346755981445, "global_step": 80362, "epoch": 664} {"train_loss": -37.1353645324707, "global_step": 80363, "epoch": 664} {"train_loss": -37.042659759521484, "global_step": 80364, "epoch": 664} {"train_loss": -35.9622802734375, "global_step": 80365, "epoch": 664} {"train_loss": -37.55885696411133, "global_step": 80366, "epoch": 664} {"train_loss": -37.25373077392578, "global_step": 80367, "epoch": 664} {"train_loss": -35.56130599975586, "global_step": 80368, "epoch": 664} {"train_loss": -37.00690460205078, "global_step": 80369, "epoch": 664} {"train_loss": -37.13129806518555, "global_step": 80370, "epoch": 664} {"train_loss": -35.54500198364258, "global_step": 80371, "epoch": 664} {"train_loss": -36.61857986450195, "global_step": 80372, "epoch": 664} {"train_loss": -34.960018157958984, "global_step": 80373, "epoch": 664} {"train_loss": -36.301143646240234, "global_step": 80374, "epoch": 664} {"train_loss": -36.948333740234375, "global_step": 80375, "epoch": 664} {"train_loss": -35.35639572143555, "global_step": 80376, "epoch": 664} {"train_loss": -36.65316390991211, "global_step": 80377, "epoch": 664} {"train_loss": -34.799190521240234, "global_step": 80378, "epoch": 664} {"train_loss": -34.22428512573242, "global_step": 80379, "epoch": 664} {"train_loss": -36.379669189453125, "global_step": 80380, "epoch": 664} {"train_loss": -34.43124008178711, "global_step": 80381, "epoch": 664} {"train_loss": -35.295936584472656, "global_step": 80382, "epoch": 664} {"train_loss": -35.133392333984375, "global_step": 80383, "epoch": 664} {"train_loss": -35.81192398071289, "global_step": 80384, "epoch": 664} {"train_loss": -34.426902770996094, "global_step": 80385, "epoch": 664} {"train_loss": -35.83855056762695, "global_step": 80386, "epoch": 664} {"train_loss": -32.29793930053711, "global_step": 80387, "epoch": 664} {"train_loss": -35.89262771606445, "global_step": 80388, "epoch": 664} {"train_loss": -36.1971549987793, "global_step": 80389, "epoch": 664} {"train_loss": -34.693359375, "global_step": 80390, "epoch": 664} {"train_loss": -35.2187614440918, "global_step": 80391, "epoch": 664} {"train_loss": -33.25027084350586, "global_step": 80392, "epoch": 664} {"train_loss": -35.021026611328125, "global_step": 80393, "epoch": 664} {"train_loss": -35.95117950439453, "global_step": 80394, "epoch": 664} {"train_loss": -35.397579193115234, "global_step": 80395, "epoch": 664} {"train_loss": -35.526580810546875, "global_step": 80396, "epoch": 664} {"train_loss": -35.41786575317383, "global_step": 80397, "epoch": 664} {"train_loss": -36.14884567260742, "global_step": 80398, "epoch": 664} {"train_loss": -36.20317459106445, "global_step": 80399, "epoch": 664} {"train_loss": -34.70457077026367, "global_step": 80400, "epoch": 664} {"train_loss": -35.15507125854492, "global_step": 80401, "epoch": 664} {"train_loss": -36.03490447998047, "global_step": 80402, "epoch": 664} {"train_loss": -35.02070236206055, "global_step": 80403, "epoch": 664} {"train_loss": -36.17824935913086, "global_step": 80404, "epoch": 664} {"train_loss": -35.60283279418945, "global_step": 80405, "epoch": 664} {"train_loss": -35.778072357177734, "global_step": 80406, "epoch": 664} {"train_loss": -34.38346481323242, "global_step": 80407, "epoch": 664} {"train_loss": -36.23956298828125, "global_step": 80408, "epoch": 664} {"train_loss": -36.16152572631836, "global_step": 80409, "epoch": 664} {"train_loss": -34.582210540771484, "global_step": 80410, "epoch": 664} {"train_loss": -36.070594787597656, "global_step": 80411, "epoch": 664} {"train_loss": -34.3793830871582, "global_step": 80412, "epoch": 664} {"train_loss": -35.69365310668945, "global_step": 80413, "epoch": 664} {"train_loss": -36.43832015991211, "global_step": 80414, "epoch": 664} {"train_loss": -35.804500579833984, "global_step": 80415, "epoch": 664} {"train_loss": -35.40603256225586, "global_step": 80416, "epoch": 664} {"train_loss": -36.1572151184082, "global_step": 80417, "epoch": 664} {"train_loss": -35.5216064453125, "global_step": 80418, "epoch": 664} {"train_loss": -36.58858871459961, "global_step": 80419, "epoch": 664} {"train_loss": -36.1954460144043, "global_step": 80420, "epoch": 664} {"train_loss": -36.37236785888672, "global_step": 80421, "epoch": 664} {"train_loss": -35.61605453491211, "global_step": 80422, "epoch": 664} {"train_loss": -35.544525146484375, "global_step": 80423, "epoch": 664} {"train_loss": -35.867279052734375, "global_step": 80424, "epoch": 664} {"train_loss": -35.55339050292969, "global_step": 80425, "epoch": 664} {"train_loss": -35.77463912963867, "global_step": 80426, "epoch": 664} {"train_loss": -36.087886810302734, "global_step": 80427, "epoch": 664} {"train_loss": -36.32727813720703, "global_step": 80428, "epoch": 664} {"train_loss": -34.768253326416016, "global_step": 80429, "epoch": 664} {"train_loss": -36.18604278564453, "global_step": 80430, "epoch": 664} {"train_loss": -35.59394836425781, "global_step": 80431, "epoch": 664} {"train_loss": -36.412479400634766, "global_step": 80432, "epoch": 664} {"train_loss": -34.99277877807617, "global_step": 80433, "epoch": 664} {"train_loss": -36.0776481628418, "global_step": 80434, "epoch": 664} {"train_loss": -35.74904251098633, "global_step": 80435, "epoch": 664} {"train_loss": -35.84599685668945, "global_step": 80436, "epoch": 664} {"train_loss": -36.5853385925293, "global_step": 80437, "epoch": 664} {"train_loss": -36.176422119140625, "global_step": 80438, "epoch": 664} {"train_loss": -35.480560302734375, "global_step": 80439, "epoch": 664} {"train_loss": -36.846553802490234, "global_step": 80440, "epoch": 664} {"train_loss": -36.59031295776367, "global_step": 80441, "epoch": 664} {"train_loss": -37.18730163574219, "global_step": 80442, "epoch": 664} {"train_loss": -36.85821533203125, "global_step": 80443, "epoch": 664} {"train_loss": -36.93928146362305, "global_step": 80444, "epoch": 664} {"train_loss": -36.53550720214844, "global_step": 80445, "epoch": 664} {"train_loss": -37.036197662353516, "global_step": 80446, "epoch": 664} {"train_loss": -36.9331169128418, "global_step": 80447, "epoch": 664} {"train_loss": -37.108245849609375, "global_step": 80448, "epoch": 664} {"train_loss": -36.60978317260742, "global_step": 80449, "epoch": 664} {"train_loss": -37.06043243408203, "global_step": 80450, "epoch": 664} {"train_loss": -36.73601150512695, "global_step": 80451, "epoch": 664} {"train_loss": -37.19509506225586, "global_step": 80452, "epoch": 664} {"train_loss": -37.15790939331055, "global_step": 80453, "epoch": 664} {"train_loss": -36.44038772583008, "global_step": 80454, "epoch": 664} {"train_loss": -37.1092414855957, "global_step": 80455, "epoch": 664} {"train_loss": -36.87042999267578, "global_step": 80456, "epoch": 664} {"train_loss": -37.555152893066406, "global_step": 80457, "epoch": 664} {"train_loss": -37.00033187866211, "global_step": 80458, "epoch": 664} {"train_loss": -37.67094421386719, "global_step": 80459, "epoch": 664} {"train_loss": -37.12578582763672, "global_step": 80460, "epoch": 664} {"train_loss": -35.87240219116211, "global_step": 80461, "epoch": 664} {"train_loss": -37.58512496948242, "global_step": 80462, "epoch": 664} {"train_loss": -37.583290100097656, "global_step": 80463, "epoch": 664} {"train_loss": -36.10909945905701, "global_step": 80464, "epoch": 664, "val_loss": 2687722.75} {"train_loss": -35.80922317504883, "global_step": 80465, "epoch": 665} {"train_loss": -36.531097412109375, "global_step": 80466, "epoch": 665} {"train_loss": -36.44728469848633, "global_step": 80467, "epoch": 665} {"train_loss": -37.70888137817383, "global_step": 80468, "epoch": 665} {"train_loss": -37.49201965332031, "global_step": 80469, "epoch": 665} {"train_loss": -37.65362548828125, "global_step": 80470, "epoch": 665} {"train_loss": -37.30553436279297, "global_step": 80471, "epoch": 665} {"train_loss": -37.871917724609375, "global_step": 80472, "epoch": 665} {"train_loss": -36.94818878173828, "global_step": 80473, "epoch": 665} {"train_loss": -37.18577194213867, "global_step": 80474, "epoch": 665} {"train_loss": -37.9812126159668, "global_step": 80475, "epoch": 665} {"train_loss": -36.666072845458984, "global_step": 80476, "epoch": 665} {"train_loss": -37.123374938964844, "global_step": 80477, "epoch": 665} {"train_loss": -37.961097717285156, "global_step": 80478, "epoch": 665} {"train_loss": -37.74909210205078, "global_step": 80479, "epoch": 665} {"train_loss": -37.714569091796875, "global_step": 80480, "epoch": 665} {"train_loss": -37.443233489990234, "global_step": 80481, "epoch": 665} {"train_loss": -37.487274169921875, "global_step": 80482, "epoch": 665} {"train_loss": -37.59337615966797, "global_step": 80483, "epoch": 665} {"train_loss": -37.086910247802734, "global_step": 80484, "epoch": 665} {"train_loss": -37.49037551879883, "global_step": 80485, "epoch": 665} {"train_loss": -37.9537353515625, "global_step": 80486, "epoch": 665} {"train_loss": -37.3062629699707, "global_step": 80487, "epoch": 665} {"train_loss": -37.8578987121582, "global_step": 80488, "epoch": 665} {"train_loss": -37.381813049316406, "global_step": 80489, "epoch": 665} {"train_loss": -37.391021728515625, "global_step": 80490, "epoch": 665} {"train_loss": -37.41341781616211, "global_step": 80491, "epoch": 665} {"train_loss": -37.93000411987305, "global_step": 80492, "epoch": 665} {"train_loss": -37.718502044677734, "global_step": 80493, "epoch": 665} {"train_loss": -37.67253875732422, "global_step": 80494, "epoch": 665} {"train_loss": -37.58631896972656, "global_step": 80495, "epoch": 665} {"train_loss": -37.399986267089844, "global_step": 80496, "epoch": 665} {"train_loss": -37.18726348876953, "global_step": 80497, "epoch": 665} {"train_loss": -37.2892951965332, "global_step": 80498, "epoch": 665} {"train_loss": -37.69239044189453, "global_step": 80499, "epoch": 665} {"train_loss": -38.03278732299805, "global_step": 80500, "epoch": 665} {"train_loss": -38.527313232421875, "global_step": 80501, "epoch": 665} {"train_loss": -37.912906646728516, "global_step": 80502, "epoch": 665} {"train_loss": -38.29114532470703, "global_step": 80503, "epoch": 665} {"train_loss": -37.903053283691406, "global_step": 80504, "epoch": 665} {"train_loss": -38.15727996826172, "global_step": 80505, "epoch": 665} {"train_loss": -38.009403228759766, "global_step": 80506, "epoch": 665} {"train_loss": -38.14235305786133, "global_step": 80507, "epoch": 665} {"train_loss": -38.08154296875, "global_step": 80508, "epoch": 665} {"train_loss": -37.32290267944336, "global_step": 80509, "epoch": 665} {"train_loss": -37.80953598022461, "global_step": 80510, "epoch": 665} {"train_loss": -37.79523468017578, "global_step": 80511, "epoch": 665} {"train_loss": -36.73141098022461, "global_step": 80512, "epoch": 665} {"train_loss": -36.739295959472656, "global_step": 80513, "epoch": 665} {"train_loss": -37.76519775390625, "global_step": 80514, "epoch": 665} {"train_loss": -35.967952728271484, "global_step": 80515, "epoch": 665} {"train_loss": -36.00346755981445, "global_step": 80516, "epoch": 665} {"train_loss": -36.90656661987305, "global_step": 80517, "epoch": 665} {"train_loss": -35.055171966552734, "global_step": 80518, "epoch": 665} {"train_loss": -35.24798583984375, "global_step": 80519, "epoch": 665} {"train_loss": -32.94136428833008, "global_step": 80520, "epoch": 665} {"train_loss": -31.692157745361328, "global_step": 80521, "epoch": 665} {"train_loss": -32.81624221801758, "global_step": 80522, "epoch": 665} {"train_loss": -33.913700103759766, "global_step": 80523, "epoch": 665} {"train_loss": -35.18207931518555, "global_step": 80524, "epoch": 665} {"train_loss": -35.82323455810547, "global_step": 80525, "epoch": 665} {"train_loss": -35.24235916137695, "global_step": 80526, "epoch": 665} {"train_loss": -35.812904357910156, "global_step": 80527, "epoch": 665} {"train_loss": -34.98815155029297, "global_step": 80528, "epoch": 665} {"train_loss": -35.930397033691406, "global_step": 80529, "epoch": 665} {"train_loss": -34.83991622924805, "global_step": 80530, "epoch": 665} {"train_loss": -34.391143798828125, "global_step": 80531, "epoch": 665} {"train_loss": -36.811988830566406, "global_step": 80532, "epoch": 665} {"train_loss": -36.44013595581055, "global_step": 80533, "epoch": 665} {"train_loss": -35.34782028198242, "global_step": 80534, "epoch": 665} {"train_loss": -35.02018356323242, "global_step": 80535, "epoch": 665} {"train_loss": -36.57013702392578, "global_step": 80536, "epoch": 665} {"train_loss": -35.59959411621094, "global_step": 80537, "epoch": 665} {"train_loss": -36.27260971069336, "global_step": 80538, "epoch": 665} {"train_loss": -36.6320915222168, "global_step": 80539, "epoch": 665} {"train_loss": -36.06560516357422, "global_step": 80540, "epoch": 665} {"train_loss": -36.53679275512695, "global_step": 80541, "epoch": 665} {"train_loss": -36.55949020385742, "global_step": 80542, "epoch": 665} {"train_loss": -35.3883056640625, "global_step": 80543, "epoch": 665} {"train_loss": -36.11874008178711, "global_step": 80544, "epoch": 665} {"train_loss": -33.876373291015625, "global_step": 80545, "epoch": 665} {"train_loss": -36.42012405395508, "global_step": 80546, "epoch": 665} {"train_loss": -35.2105598449707, "global_step": 80547, "epoch": 665} {"train_loss": -36.37076950073242, "global_step": 80548, "epoch": 665} {"train_loss": -35.84781265258789, "global_step": 80549, "epoch": 665} {"train_loss": -35.77375030517578, "global_step": 80550, "epoch": 665} {"train_loss": -37.07835388183594, "global_step": 80551, "epoch": 665} {"train_loss": -36.054725646972656, "global_step": 80552, "epoch": 665} {"train_loss": -37.0214729309082, "global_step": 80553, "epoch": 665} {"train_loss": -36.07453918457031, "global_step": 80554, "epoch": 665} {"train_loss": -37.025146484375, "global_step": 80555, "epoch": 665} {"train_loss": -35.893943786621094, "global_step": 80556, "epoch": 665} {"train_loss": -36.60055923461914, "global_step": 80557, "epoch": 665} {"train_loss": -35.84701156616211, "global_step": 80558, "epoch": 665} {"train_loss": -36.827980041503906, "global_step": 80559, "epoch": 665} {"train_loss": -36.23386001586914, "global_step": 80560, "epoch": 665} {"train_loss": -36.731449127197266, "global_step": 80561, "epoch": 665} {"train_loss": -36.85892868041992, "global_step": 80562, "epoch": 665} {"train_loss": -35.634029388427734, "global_step": 80563, "epoch": 665} {"train_loss": -36.95659637451172, "global_step": 80564, "epoch": 665} {"train_loss": -37.2042121887207, "global_step": 80565, "epoch": 665} {"train_loss": -37.60774612426758, "global_step": 80566, "epoch": 665} {"train_loss": -37.18569564819336, "global_step": 80567, "epoch": 665} {"train_loss": -37.20916748046875, "global_step": 80568, "epoch": 665} {"train_loss": -37.683685302734375, "global_step": 80569, "epoch": 665} {"train_loss": -37.33822250366211, "global_step": 80570, "epoch": 665} {"train_loss": -37.34306716918945, "global_step": 80571, "epoch": 665} {"train_loss": -37.81500244140625, "global_step": 80572, "epoch": 665} {"train_loss": -36.58285903930664, "global_step": 80573, "epoch": 665} {"train_loss": -36.59130859375, "global_step": 80574, "epoch": 665} {"train_loss": -37.462703704833984, "global_step": 80575, "epoch": 665} {"train_loss": -37.67537307739258, "global_step": 80576, "epoch": 665} {"train_loss": -37.402381896972656, "global_step": 80577, "epoch": 665} {"train_loss": -36.963409423828125, "global_step": 80578, "epoch": 665} {"train_loss": -37.58240509033203, "global_step": 80579, "epoch": 665} {"train_loss": -37.3380126953125, "global_step": 80580, "epoch": 665} {"train_loss": -34.23413848876953, "global_step": 80581, "epoch": 665} {"train_loss": -37.39147186279297, "global_step": 80582, "epoch": 665} {"train_loss": -37.53282928466797, "global_step": 80583, "epoch": 665} {"train_loss": -37.01220703125, "global_step": 80584, "epoch": 665} {"train_loss": -36.72328126134951, "global_step": 80585, "epoch": 665, "val_loss": 2673402.0} {"train_loss": -37.449005126953125, "global_step": 80586, "epoch": 666} {"train_loss": -37.229610443115234, "global_step": 80587, "epoch": 666} {"train_loss": -34.9522590637207, "global_step": 80588, "epoch": 666} {"train_loss": -33.533199310302734, "global_step": 80589, "epoch": 666} {"train_loss": -36.003231048583984, "global_step": 80590, "epoch": 666} {"train_loss": -35.59408187866211, "global_step": 80591, "epoch": 666} {"train_loss": -37.10595703125, "global_step": 80592, "epoch": 666} {"train_loss": -35.11439895629883, "global_step": 80593, "epoch": 666} {"train_loss": -33.223262786865234, "global_step": 80594, "epoch": 666} {"train_loss": -31.850828170776367, "global_step": 80595, "epoch": 666} {"train_loss": -30.66347312927246, "global_step": 80596, "epoch": 666} {"train_loss": -31.395048141479492, "global_step": 80597, "epoch": 666} {"train_loss": -30.984411239624023, "global_step": 80598, "epoch": 666} {"train_loss": -28.209604263305664, "global_step": 80599, "epoch": 666} {"train_loss": -30.413190841674805, "global_step": 80600, "epoch": 666} {"train_loss": -31.407764434814453, "global_step": 80601, "epoch": 666} {"train_loss": -29.259485244750977, "global_step": 80602, "epoch": 666} {"train_loss": -30.390430450439453, "global_step": 80603, "epoch": 666} {"train_loss": -31.384103775024414, "global_step": 80604, "epoch": 666} {"train_loss": -29.942401885986328, "global_step": 80605, "epoch": 666} {"train_loss": -31.413589477539062, "global_step": 80606, "epoch": 666} {"train_loss": -31.369653701782227, "global_step": 80607, "epoch": 666} {"train_loss": -27.805994033813477, "global_step": 80608, "epoch": 666} {"train_loss": -32.707847595214844, "global_step": 80609, "epoch": 666} {"train_loss": -33.82988357543945, "global_step": 80610, "epoch": 666} {"train_loss": -31.72486686706543, "global_step": 80611, "epoch": 666} {"train_loss": -32.1971549987793, "global_step": 80612, "epoch": 666} {"train_loss": -32.09962844848633, "global_step": 80613, "epoch": 666} {"train_loss": -32.866065979003906, "global_step": 80614, "epoch": 666} {"train_loss": -32.922637939453125, "global_step": 80615, "epoch": 666} {"train_loss": -32.072021484375, "global_step": 80616, "epoch": 666} {"train_loss": -34.12308120727539, "global_step": 80617, "epoch": 666} {"train_loss": -34.632171630859375, "global_step": 80618, "epoch": 666} {"train_loss": -33.37090301513672, "global_step": 80619, "epoch": 666} {"train_loss": -33.659156799316406, "global_step": 80620, "epoch": 666} {"train_loss": -34.39424514770508, "global_step": 80621, "epoch": 666} {"train_loss": -33.52260208129883, "global_step": 80622, "epoch": 666} {"train_loss": -33.94400405883789, "global_step": 80623, "epoch": 666} {"train_loss": -34.27631759643555, "global_step": 80624, "epoch": 666} {"train_loss": -33.95072555541992, "global_step": 80625, "epoch": 666} {"train_loss": -34.24395751953125, "global_step": 80626, "epoch": 666} {"train_loss": -34.20023727416992, "global_step": 80627, "epoch": 666} {"train_loss": -34.13739776611328, "global_step": 80628, "epoch": 666} {"train_loss": -33.80668258666992, "global_step": 80629, "epoch": 666} {"train_loss": -33.82861328125, "global_step": 80630, "epoch": 666} {"train_loss": -34.558815002441406, "global_step": 80631, "epoch": 666} {"train_loss": -33.50402069091797, "global_step": 80632, "epoch": 666} {"train_loss": -35.326576232910156, "global_step": 80633, "epoch": 666} {"train_loss": -34.15203857421875, "global_step": 80634, "epoch": 666} {"train_loss": -35.19462585449219, "global_step": 80635, "epoch": 666} {"train_loss": -34.77179718017578, "global_step": 80636, "epoch": 666} {"train_loss": -34.804866790771484, "global_step": 80637, "epoch": 666} {"train_loss": -34.680755615234375, "global_step": 80638, "epoch": 666} {"train_loss": -34.869564056396484, "global_step": 80639, "epoch": 666} {"train_loss": -34.96406936645508, "global_step": 80640, "epoch": 666} {"train_loss": -35.485626220703125, "global_step": 80641, "epoch": 666} {"train_loss": -33.952919006347656, "global_step": 80642, "epoch": 666} {"train_loss": -35.602603912353516, "global_step": 80643, "epoch": 666} {"train_loss": -35.33216857910156, "global_step": 80644, "epoch": 666} {"train_loss": -35.46156692504883, "global_step": 80645, "epoch": 666} {"train_loss": -34.337562561035156, "global_step": 80646, "epoch": 666} {"train_loss": -35.25169372558594, "global_step": 80647, "epoch": 666} {"train_loss": -34.489986419677734, "global_step": 80648, "epoch": 666} {"train_loss": -34.604591369628906, "global_step": 80649, "epoch": 666} {"train_loss": -34.9578857421875, "global_step": 80650, "epoch": 666} {"train_loss": -35.8635139465332, "global_step": 80651, "epoch": 666} {"train_loss": -35.47654342651367, "global_step": 80652, "epoch": 666} {"train_loss": -35.66114044189453, "global_step": 80653, "epoch": 666} {"train_loss": -35.55086135864258, "global_step": 80654, "epoch": 666} {"train_loss": -36.19272232055664, "global_step": 80655, "epoch": 666} {"train_loss": -35.96952438354492, "global_step": 80656, "epoch": 666} {"train_loss": -35.883827209472656, "global_step": 80657, "epoch": 666} {"train_loss": -36.299339294433594, "global_step": 80658, "epoch": 666} {"train_loss": -35.97707748413086, "global_step": 80659, "epoch": 666} {"train_loss": -36.3142204284668, "global_step": 80660, "epoch": 666} {"train_loss": -36.550079345703125, "global_step": 80661, "epoch": 666} {"train_loss": -36.01963424682617, "global_step": 80662, "epoch": 666} {"train_loss": -35.313045501708984, "global_step": 80663, "epoch": 666} {"train_loss": -36.646522521972656, "global_step": 80664, "epoch": 666} {"train_loss": -35.785003662109375, "global_step": 80665, "epoch": 666} {"train_loss": -36.45351028442383, "global_step": 80666, "epoch": 666} {"train_loss": -36.541412353515625, "global_step": 80667, "epoch": 666} {"train_loss": -36.56023025512695, "global_step": 80668, "epoch": 666} {"train_loss": -36.64606475830078, "global_step": 80669, "epoch": 666} {"train_loss": -36.52921676635742, "global_step": 80670, "epoch": 666} {"train_loss": -36.78398513793945, "global_step": 80671, "epoch": 666} {"train_loss": -37.11283493041992, "global_step": 80672, "epoch": 666} {"train_loss": -36.8153076171875, "global_step": 80673, "epoch": 666} {"train_loss": -36.96341323852539, "global_step": 80674, "epoch": 666} {"train_loss": -36.981727600097656, "global_step": 80675, "epoch": 666} {"train_loss": -36.91494369506836, "global_step": 80676, "epoch": 666} {"train_loss": -36.76973342895508, "global_step": 80677, "epoch": 666} {"train_loss": -37.03706741333008, "global_step": 80678, "epoch": 666} {"train_loss": -37.4972038269043, "global_step": 80679, "epoch": 666} {"train_loss": -36.978397369384766, "global_step": 80680, "epoch": 666} {"train_loss": -37.155067443847656, "global_step": 80681, "epoch": 666} {"train_loss": -37.29597091674805, "global_step": 80682, "epoch": 666} {"train_loss": -37.15403366088867, "global_step": 80683, "epoch": 666} {"train_loss": -37.31038284301758, "global_step": 80684, "epoch": 666} {"train_loss": -37.28835678100586, "global_step": 80685, "epoch": 666} {"train_loss": -37.14522171020508, "global_step": 80686, "epoch": 666} {"train_loss": -37.09088134765625, "global_step": 80687, "epoch": 666} {"train_loss": -37.59473419189453, "global_step": 80688, "epoch": 666} {"train_loss": -37.56720733642578, "global_step": 80689, "epoch": 666} {"train_loss": -37.193782806396484, "global_step": 80690, "epoch": 666} {"train_loss": -37.205989837646484, "global_step": 80691, "epoch": 666} {"train_loss": -37.057857513427734, "global_step": 80692, "epoch": 666} {"train_loss": -37.172119140625, "global_step": 80693, "epoch": 666} {"train_loss": -37.050506591796875, "global_step": 80694, "epoch": 666} {"train_loss": -37.068782806396484, "global_step": 80695, "epoch": 666} {"train_loss": -36.524620056152344, "global_step": 80696, "epoch": 666} {"train_loss": -36.74668502807617, "global_step": 80697, "epoch": 666} {"train_loss": -35.8848991394043, "global_step": 80698, "epoch": 666} {"train_loss": -36.21967697143555, "global_step": 80699, "epoch": 666} {"train_loss": -35.77851867675781, "global_step": 80700, "epoch": 666} {"train_loss": -34.242103576660156, "global_step": 80701, "epoch": 666} {"train_loss": -33.729103088378906, "global_step": 80702, "epoch": 666} {"train_loss": -33.73631286621094, "global_step": 80703, "epoch": 666} {"train_loss": -34.76044845581055, "global_step": 80704, "epoch": 666} {"train_loss": -34.364349365234375, "global_step": 80705, "epoch": 666} {"train_loss": -34.84672273683154, "global_step": 80706, "epoch": 666, "val_loss": 2771074.75} {"train_loss": -37.306915283203125, "global_step": 80707, "epoch": 667} {"train_loss": -36.82929611206055, "global_step": 80708, "epoch": 667} {"train_loss": -35.05965805053711, "global_step": 80709, "epoch": 667} {"train_loss": -36.05825424194336, "global_step": 80710, "epoch": 667} {"train_loss": -35.90616989135742, "global_step": 80711, "epoch": 667} {"train_loss": -37.42822265625, "global_step": 80712, "epoch": 667} {"train_loss": -36.588783264160156, "global_step": 80713, "epoch": 667} {"train_loss": -36.60270309448242, "global_step": 80714, "epoch": 667} {"train_loss": -36.54311752319336, "global_step": 80715, "epoch": 667} {"train_loss": -36.422420501708984, "global_step": 80716, "epoch": 667} {"train_loss": -36.57948684692383, "global_step": 80717, "epoch": 667} {"train_loss": -36.086143493652344, "global_step": 80718, "epoch": 667} {"train_loss": -37.0318603515625, "global_step": 80719, "epoch": 667} {"train_loss": -36.96259689331055, "global_step": 80720, "epoch": 667} {"train_loss": -36.23693084716797, "global_step": 80721, "epoch": 667} {"train_loss": -37.36113357543945, "global_step": 80722, "epoch": 667} {"train_loss": -36.164669036865234, "global_step": 80723, "epoch": 667} {"train_loss": -36.77204513549805, "global_step": 80724, "epoch": 667} {"train_loss": -37.026302337646484, "global_step": 80725, "epoch": 667} {"train_loss": -37.343196868896484, "global_step": 80726, "epoch": 667} {"train_loss": -37.3865852355957, "global_step": 80727, "epoch": 667} {"train_loss": -36.75617599487305, "global_step": 80728, "epoch": 667} {"train_loss": -37.44546127319336, "global_step": 80729, "epoch": 667} {"train_loss": -36.64751434326172, "global_step": 80730, "epoch": 667} {"train_loss": -37.43794631958008, "global_step": 80731, "epoch": 667} {"train_loss": -36.92683029174805, "global_step": 80732, "epoch": 667} {"train_loss": -37.840187072753906, "global_step": 80733, "epoch": 667} {"train_loss": -37.57818603515625, "global_step": 80734, "epoch": 667} {"train_loss": -37.382537841796875, "global_step": 80735, "epoch": 667} {"train_loss": -37.229000091552734, "global_step": 80736, "epoch": 667} {"train_loss": -37.23654556274414, "global_step": 80737, "epoch": 667} {"train_loss": -36.14828872680664, "global_step": 80738, "epoch": 667} {"train_loss": -36.01443099975586, "global_step": 80739, "epoch": 667} {"train_loss": -35.6604118347168, "global_step": 80740, "epoch": 667} {"train_loss": -37.43645095825195, "global_step": 80741, "epoch": 667} {"train_loss": -37.893898010253906, "global_step": 80742, "epoch": 667} {"train_loss": -37.42346954345703, "global_step": 80743, "epoch": 667} {"train_loss": -37.68257522583008, "global_step": 80744, "epoch": 667} {"train_loss": -37.702720642089844, "global_step": 80745, "epoch": 667} {"train_loss": -37.79054641723633, "global_step": 80746, "epoch": 667} {"train_loss": -37.237762451171875, "global_step": 80747, "epoch": 667} {"train_loss": -35.30844497680664, "global_step": 80748, "epoch": 667} {"train_loss": -37.27079391479492, "global_step": 80749, "epoch": 667} {"train_loss": -37.440147399902344, "global_step": 80750, "epoch": 667} {"train_loss": -37.44599151611328, "global_step": 80751, "epoch": 667} {"train_loss": -37.26868438720703, "global_step": 80752, "epoch": 667} {"train_loss": -37.95173263549805, "global_step": 80753, "epoch": 667} {"train_loss": -37.00852966308594, "global_step": 80754, "epoch": 667} {"train_loss": -37.18874740600586, "global_step": 80755, "epoch": 667} {"train_loss": -37.061214447021484, "global_step": 80756, "epoch": 667} {"train_loss": -37.85761260986328, "global_step": 80757, "epoch": 667} {"train_loss": -35.96912384033203, "global_step": 80758, "epoch": 667} {"train_loss": -35.54587936401367, "global_step": 80759, "epoch": 667} {"train_loss": -33.102718353271484, "global_step": 80760, "epoch": 667} {"train_loss": -32.840675354003906, "global_step": 80761, "epoch": 667} {"train_loss": -32.76924514770508, "global_step": 80762, "epoch": 667} {"train_loss": -34.48189926147461, "global_step": 80763, "epoch": 667} {"train_loss": -37.775997161865234, "global_step": 80764, "epoch": 667} {"train_loss": -36.15998458862305, "global_step": 80765, "epoch": 667} {"train_loss": -36.07190704345703, "global_step": 80766, "epoch": 667} {"train_loss": -37.592586517333984, "global_step": 80767, "epoch": 667} {"train_loss": -37.35920333862305, "global_step": 80768, "epoch": 667} {"train_loss": -37.125648498535156, "global_step": 80769, "epoch": 667} {"train_loss": -37.322959899902344, "global_step": 80770, "epoch": 667} {"train_loss": -36.89360427856445, "global_step": 80771, "epoch": 667} {"train_loss": -36.76816940307617, "global_step": 80772, "epoch": 667} {"train_loss": -38.141212463378906, "global_step": 80773, "epoch": 667} {"train_loss": -37.568626403808594, "global_step": 80774, "epoch": 667} {"train_loss": -37.354896545410156, "global_step": 80775, "epoch": 667} {"train_loss": -37.30076217651367, "global_step": 80776, "epoch": 667} {"train_loss": -37.00989532470703, "global_step": 80777, "epoch": 667} {"train_loss": -37.73922348022461, "global_step": 80778, "epoch": 667} {"train_loss": -37.75065994262695, "global_step": 80779, "epoch": 667} {"train_loss": -37.90934753417969, "global_step": 80780, "epoch": 667} {"train_loss": -37.647193908691406, "global_step": 80781, "epoch": 667} {"train_loss": -37.18689727783203, "global_step": 80782, "epoch": 667} {"train_loss": -38.286399841308594, "global_step": 80783, "epoch": 667} {"train_loss": -37.968505859375, "global_step": 80784, "epoch": 667} {"train_loss": -37.97158432006836, "global_step": 80785, "epoch": 667} {"train_loss": -37.066951751708984, "global_step": 80786, "epoch": 667} {"train_loss": -37.02187728881836, "global_step": 80787, "epoch": 667} {"train_loss": -37.75043869018555, "global_step": 80788, "epoch": 667} {"train_loss": -36.7690544128418, "global_step": 80789, "epoch": 667} {"train_loss": -36.36006164550781, "global_step": 80790, "epoch": 667} {"train_loss": -36.76656723022461, "global_step": 80791, "epoch": 667} {"train_loss": -37.536651611328125, "global_step": 80792, "epoch": 667} {"train_loss": -36.666622161865234, "global_step": 80793, "epoch": 667} {"train_loss": -37.73855209350586, "global_step": 80794, "epoch": 667} {"train_loss": -36.51563262939453, "global_step": 80795, "epoch": 667} {"train_loss": -37.42310333251953, "global_step": 80796, "epoch": 667} {"train_loss": -34.428428649902344, "global_step": 80797, "epoch": 667} {"train_loss": -31.15594482421875, "global_step": 80798, "epoch": 667} {"train_loss": -37.29780960083008, "global_step": 80799, "epoch": 667} {"train_loss": -33.71746063232422, "global_step": 80800, "epoch": 667} {"train_loss": -37.25629806518555, "global_step": 80801, "epoch": 667} {"train_loss": -35.5452880859375, "global_step": 80802, "epoch": 667} {"train_loss": -37.02537155151367, "global_step": 80803, "epoch": 667} {"train_loss": -36.85124588012695, "global_step": 80804, "epoch": 667} {"train_loss": -35.892250061035156, "global_step": 80805, "epoch": 667} {"train_loss": -37.06980514526367, "global_step": 80806, "epoch": 667} {"train_loss": -36.47926712036133, "global_step": 80807, "epoch": 667} {"train_loss": -37.15277099609375, "global_step": 80808, "epoch": 667} {"train_loss": -35.621700286865234, "global_step": 80809, "epoch": 667} {"train_loss": -37.33014678955078, "global_step": 80810, "epoch": 667} {"train_loss": -37.29118728637695, "global_step": 80811, "epoch": 667} {"train_loss": -36.91034698486328, "global_step": 80812, "epoch": 667} {"train_loss": -37.41129684448242, "global_step": 80813, "epoch": 667} {"train_loss": -37.81736373901367, "global_step": 80814, "epoch": 667} {"train_loss": -35.897605895996094, "global_step": 80815, "epoch": 667} {"train_loss": -36.539302825927734, "global_step": 80816, "epoch": 667} {"train_loss": -36.59282684326172, "global_step": 80817, "epoch": 667} {"train_loss": -36.25804138183594, "global_step": 80818, "epoch": 667} {"train_loss": -37.34328842163086, "global_step": 80819, "epoch": 667} {"train_loss": -34.02053451538086, "global_step": 80820, "epoch": 667} {"train_loss": -36.61357116699219, "global_step": 80821, "epoch": 667} {"train_loss": -35.76042938232422, "global_step": 80822, "epoch": 667} {"train_loss": -37.20294952392578, "global_step": 80823, "epoch": 667} {"train_loss": -35.655025482177734, "global_step": 80824, "epoch": 667} {"train_loss": -36.9500846862793, "global_step": 80825, "epoch": 667} {"train_loss": -36.3577995300293, "global_step": 80826, "epoch": 667} {"train_loss": -36.727601926188825, "global_step": 80827, "epoch": 667, "val_loss": 2797706.75} {"train_loss": -36.31630325317383, "global_step": 80828, "epoch": 668} {"train_loss": -36.984127044677734, "global_step": 80829, "epoch": 668} {"train_loss": -36.14244079589844, "global_step": 80830, "epoch": 668} {"train_loss": -36.80904006958008, "global_step": 80831, "epoch": 668} {"train_loss": -36.85464859008789, "global_step": 80832, "epoch": 668} {"train_loss": -36.867671966552734, "global_step": 80833, "epoch": 668} {"train_loss": -37.12568664550781, "global_step": 80834, "epoch": 668} {"train_loss": -26.699209213256836, "global_step": 80835, "epoch": 668} {"train_loss": -36.71193313598633, "global_step": 80836, "epoch": 668} {"train_loss": -36.96489334106445, "global_step": 80837, "epoch": 668} {"train_loss": -37.4583854675293, "global_step": 80838, "epoch": 668} {"train_loss": -33.43073272705078, "global_step": 80839, "epoch": 668} {"train_loss": -36.91389083862305, "global_step": 80840, "epoch": 668} {"train_loss": -36.500732421875, "global_step": 80841, "epoch": 668} {"train_loss": -37.10077667236328, "global_step": 80842, "epoch": 668} {"train_loss": -37.08949661254883, "global_step": 80843, "epoch": 668} {"train_loss": -36.0023078918457, "global_step": 80844, "epoch": 668} {"train_loss": -36.2797737121582, "global_step": 80845, "epoch": 668} {"train_loss": -35.77288818359375, "global_step": 80846, "epoch": 668} {"train_loss": -36.07141876220703, "global_step": 80847, "epoch": 668} {"train_loss": -35.52297592163086, "global_step": 80848, "epoch": 668} {"train_loss": -33.908626556396484, "global_step": 80849, "epoch": 668} {"train_loss": -36.50944900512695, "global_step": 80850, "epoch": 668} {"train_loss": -36.02683639526367, "global_step": 80851, "epoch": 668} {"train_loss": -36.74921798706055, "global_step": 80852, "epoch": 668} {"train_loss": -34.62293243408203, "global_step": 80853, "epoch": 668} {"train_loss": -37.15019607543945, "global_step": 80854, "epoch": 668} {"train_loss": -37.16407012939453, "global_step": 80855, "epoch": 668} {"train_loss": -35.197021484375, "global_step": 80856, "epoch": 668} {"train_loss": -36.29215621948242, "global_step": 80857, "epoch": 668} {"train_loss": -37.19150924682617, "global_step": 80858, "epoch": 668} {"train_loss": -37.079368591308594, "global_step": 80859, "epoch": 668} {"train_loss": -37.1051139831543, "global_step": 80860, "epoch": 668} {"train_loss": -37.363033294677734, "global_step": 80861, "epoch": 668} {"train_loss": -36.761287689208984, "global_step": 80862, "epoch": 668} {"train_loss": -36.82346725463867, "global_step": 80863, "epoch": 668} {"train_loss": -36.64840316772461, "global_step": 80864, "epoch": 668} {"train_loss": -37.30253219604492, "global_step": 80865, "epoch": 668} {"train_loss": -36.152259826660156, "global_step": 80866, "epoch": 668} {"train_loss": -36.979644775390625, "global_step": 80867, "epoch": 668} {"train_loss": -37.168941497802734, "global_step": 80868, "epoch": 668} {"train_loss": -35.69741439819336, "global_step": 80869, "epoch": 668} {"train_loss": -37.38483810424805, "global_step": 80870, "epoch": 668} {"train_loss": -36.820526123046875, "global_step": 80871, "epoch": 668} {"train_loss": -37.526123046875, "global_step": 80872, "epoch": 668} {"train_loss": -37.40180587768555, "global_step": 80873, "epoch": 668} {"train_loss": -37.39176940917969, "global_step": 80874, "epoch": 668} {"train_loss": -36.204463958740234, "global_step": 80875, "epoch": 668} {"train_loss": -35.645137786865234, "global_step": 80876, "epoch": 668} {"train_loss": -37.21501541137695, "global_step": 80877, "epoch": 668} {"train_loss": -37.438751220703125, "global_step": 80878, "epoch": 668} {"train_loss": -37.341739654541016, "global_step": 80879, "epoch": 668} {"train_loss": -36.82880783081055, "global_step": 80880, "epoch": 668} {"train_loss": -36.20735549926758, "global_step": 80881, "epoch": 668} {"train_loss": -37.4674186706543, "global_step": 80882, "epoch": 668} {"train_loss": -37.366939544677734, "global_step": 80883, "epoch": 668} {"train_loss": -37.00358581542969, "global_step": 80884, "epoch": 668} {"train_loss": -37.29543685913086, "global_step": 80885, "epoch": 668} {"train_loss": -37.66366195678711, "global_step": 80886, "epoch": 668} {"train_loss": -36.8406982421875, "global_step": 80887, "epoch": 668} {"train_loss": -36.5592041015625, "global_step": 80888, "epoch": 668} {"train_loss": -37.07839584350586, "global_step": 80889, "epoch": 668} {"train_loss": -37.51007843017578, "global_step": 80890, "epoch": 668} {"train_loss": -37.07004928588867, "global_step": 80891, "epoch": 668} {"train_loss": -37.59720230102539, "global_step": 80892, "epoch": 668} {"train_loss": -37.4757194519043, "global_step": 80893, "epoch": 668} {"train_loss": -37.521881103515625, "global_step": 80894, "epoch": 668} {"train_loss": -36.5533561706543, "global_step": 80895, "epoch": 668} {"train_loss": -37.09103012084961, "global_step": 80896, "epoch": 668} {"train_loss": -37.490684509277344, "global_step": 80897, "epoch": 668} {"train_loss": -37.4442138671875, "global_step": 80898, "epoch": 668} {"train_loss": -34.166542053222656, "global_step": 80899, "epoch": 668} {"train_loss": -37.317237854003906, "global_step": 80900, "epoch": 668} {"train_loss": -37.070003509521484, "global_step": 80901, "epoch": 668} {"train_loss": -37.401222229003906, "global_step": 80902, "epoch": 668} {"train_loss": -36.50824737548828, "global_step": 80903, "epoch": 668} {"train_loss": -37.65326690673828, "global_step": 80904, "epoch": 668} {"train_loss": -36.14532470703125, "global_step": 80905, "epoch": 668} {"train_loss": -36.79470443725586, "global_step": 80906, "epoch": 668} {"train_loss": -37.30942916870117, "global_step": 80907, "epoch": 668} {"train_loss": -37.61870193481445, "global_step": 80908, "epoch": 668} {"train_loss": -37.449581146240234, "global_step": 80909, "epoch": 668} {"train_loss": -38.04768371582031, "global_step": 80910, "epoch": 668} {"train_loss": -37.434364318847656, "global_step": 80911, "epoch": 668} {"train_loss": -37.44211196899414, "global_step": 80912, "epoch": 668} {"train_loss": -37.891090393066406, "global_step": 80913, "epoch": 668} {"train_loss": -37.57038116455078, "global_step": 80914, "epoch": 668} {"train_loss": -36.18492126464844, "global_step": 80915, "epoch": 668} {"train_loss": -37.04336166381836, "global_step": 80916, "epoch": 668} {"train_loss": -37.80598068237305, "global_step": 80917, "epoch": 668} {"train_loss": -36.45719528198242, "global_step": 80918, "epoch": 668} {"train_loss": -36.51905059814453, "global_step": 80919, "epoch": 668} {"train_loss": -37.696163177490234, "global_step": 80920, "epoch": 668} {"train_loss": -36.101131439208984, "global_step": 80921, "epoch": 668} {"train_loss": -37.0451545715332, "global_step": 80922, "epoch": 668} {"train_loss": -37.579566955566406, "global_step": 80923, "epoch": 668} {"train_loss": -37.62846374511719, "global_step": 80924, "epoch": 668} {"train_loss": -37.477630615234375, "global_step": 80925, "epoch": 668} {"train_loss": -37.08468246459961, "global_step": 80926, "epoch": 668} {"train_loss": -37.669403076171875, "global_step": 80927, "epoch": 668} {"train_loss": -36.94355773925781, "global_step": 80928, "epoch": 668} {"train_loss": -36.43772506713867, "global_step": 80929, "epoch": 668} {"train_loss": -35.585845947265625, "global_step": 80930, "epoch": 668} {"train_loss": -36.458614349365234, "global_step": 80931, "epoch": 668} {"train_loss": -37.402095794677734, "global_step": 80932, "epoch": 668} {"train_loss": -37.415252685546875, "global_step": 80933, "epoch": 668} {"train_loss": -36.90327835083008, "global_step": 80934, "epoch": 668} {"train_loss": -36.18547439575195, "global_step": 80935, "epoch": 668} {"train_loss": -36.68817138671875, "global_step": 80936, "epoch": 668} {"train_loss": -37.042327880859375, "global_step": 80937, "epoch": 668} {"train_loss": -37.48202133178711, "global_step": 80938, "epoch": 668} {"train_loss": -36.71785354614258, "global_step": 80939, "epoch": 668} {"train_loss": -36.99982452392578, "global_step": 80940, "epoch": 668} {"train_loss": -36.636688232421875, "global_step": 80941, "epoch": 668} {"train_loss": -36.42010498046875, "global_step": 80942, "epoch": 668} {"train_loss": -37.04623031616211, "global_step": 80943, "epoch": 668} {"train_loss": -35.794063568115234, "global_step": 80944, "epoch": 668} {"train_loss": -32.397857666015625, "global_step": 80945, "epoch": 668} {"train_loss": -27.435810089111328, "global_step": 80946, "epoch": 668} {"train_loss": -15.350253105163574, "global_step": 80947, "epoch": 668} {"train_loss": -36.28338184041425, "global_step": 80948, "epoch": 668, "val_loss": 2688696.75} {"train_loss": -31.73920249938965, "global_step": 80949, "epoch": 669} {"train_loss": -13.287750244140625, "global_step": 80950, "epoch": 669} {"train_loss": -33.398502349853516, "global_step": 80951, "epoch": 669} {"train_loss": -21.577566146850586, "global_step": 80952, "epoch": 669} {"train_loss": -33.89540481567383, "global_step": 80953, "epoch": 669} {"train_loss": -22.962675094604492, "global_step": 80954, "epoch": 669} {"train_loss": -34.108402252197266, "global_step": 80955, "epoch": 669} {"train_loss": -29.828516006469727, "global_step": 80956, "epoch": 669} {"train_loss": -32.31887435913086, "global_step": 80957, "epoch": 669} {"train_loss": -32.973812103271484, "global_step": 80958, "epoch": 669} {"train_loss": -31.27638053894043, "global_step": 80959, "epoch": 669} {"train_loss": -34.47156524658203, "global_step": 80960, "epoch": 669} {"train_loss": -33.7553596496582, "global_step": 80961, "epoch": 669} {"train_loss": -33.16146469116211, "global_step": 80962, "epoch": 669} {"train_loss": -32.937801361083984, "global_step": 80963, "epoch": 669} {"train_loss": -35.1998405456543, "global_step": 80964, "epoch": 669} {"train_loss": -18.374094009399414, "global_step": 80965, "epoch": 669} {"train_loss": -33.8297004699707, "global_step": 80966, "epoch": 669} {"train_loss": -33.83384323120117, "global_step": 80967, "epoch": 669} {"train_loss": -32.97943878173828, "global_step": 80968, "epoch": 669} {"train_loss": -32.56874465942383, "global_step": 80969, "epoch": 669} {"train_loss": -33.94033432006836, "global_step": 80970, "epoch": 669} {"train_loss": -34.43156433105469, "global_step": 80971, "epoch": 669} {"train_loss": -33.24966049194336, "global_step": 80972, "epoch": 669} {"train_loss": -34.0617561340332, "global_step": 80973, "epoch": 669} {"train_loss": -31.021697998046875, "global_step": 80974, "epoch": 669} {"train_loss": -35.13811492919922, "global_step": 80975, "epoch": 669} {"train_loss": -35.58407211303711, "global_step": 80976, "epoch": 669} {"train_loss": -34.706336975097656, "global_step": 80977, "epoch": 669} {"train_loss": -34.5439567565918, "global_step": 80978, "epoch": 669} {"train_loss": -34.39704132080078, "global_step": 80979, "epoch": 669} {"train_loss": -34.97346878051758, "global_step": 80980, "epoch": 669} {"train_loss": -34.58442687988281, "global_step": 80981, "epoch": 669} {"train_loss": -34.42005157470703, "global_step": 80982, "epoch": 669} {"train_loss": -35.33466339111328, "global_step": 80983, "epoch": 669} {"train_loss": -35.439640045166016, "global_step": 80984, "epoch": 669} {"train_loss": -35.43948745727539, "global_step": 80985, "epoch": 669} {"train_loss": -35.49605178833008, "global_step": 80986, "epoch": 669} {"train_loss": -35.29226303100586, "global_step": 80987, "epoch": 669} {"train_loss": -35.34431838989258, "global_step": 80988, "epoch": 669} {"train_loss": -35.369140625, "global_step": 80989, "epoch": 669} {"train_loss": -34.96118927001953, "global_step": 80990, "epoch": 669} {"train_loss": -36.04097366333008, "global_step": 80991, "epoch": 669} {"train_loss": -35.23591232299805, "global_step": 80992, "epoch": 669} {"train_loss": -35.84326934814453, "global_step": 80993, "epoch": 669} {"train_loss": -35.63269805908203, "global_step": 80994, "epoch": 669} {"train_loss": -35.73380661010742, "global_step": 80995, "epoch": 669} {"train_loss": -35.93748092651367, "global_step": 80996, "epoch": 669} {"train_loss": -35.51626205444336, "global_step": 80997, "epoch": 669} {"train_loss": -35.81820297241211, "global_step": 80998, "epoch": 669} {"train_loss": -35.32578659057617, "global_step": 80999, "epoch": 669} {"train_loss": -35.97761917114258, "global_step": 81000, "epoch": 669} {"train_loss": -36.18378448486328, "global_step": 81001, "epoch": 669} {"train_loss": -35.805023193359375, "global_step": 81002, "epoch": 669} {"train_loss": -36.526119232177734, "global_step": 81003, "epoch": 669} {"train_loss": -36.298667907714844, "global_step": 81004, "epoch": 669} {"train_loss": -36.268985748291016, "global_step": 81005, "epoch": 669} {"train_loss": -36.66536331176758, "global_step": 81006, "epoch": 669} {"train_loss": -36.22617721557617, "global_step": 81007, "epoch": 669} {"train_loss": -36.552772521972656, "global_step": 81008, "epoch": 669} {"train_loss": -36.546539306640625, "global_step": 81009, "epoch": 669} {"train_loss": -36.77750778198242, "global_step": 81010, "epoch": 669} {"train_loss": -36.661895751953125, "global_step": 81011, "epoch": 669} {"train_loss": -36.317378997802734, "global_step": 81012, "epoch": 669} {"train_loss": -36.3741569519043, "global_step": 81013, "epoch": 669} {"train_loss": -36.70894241333008, "global_step": 81014, "epoch": 669} {"train_loss": -36.99370193481445, "global_step": 81015, "epoch": 669} {"train_loss": -36.97773742675781, "global_step": 81016, "epoch": 669} {"train_loss": -36.81204605102539, "global_step": 81017, "epoch": 669} {"train_loss": -37.18183135986328, "global_step": 81018, "epoch": 669} {"train_loss": -36.75758743286133, "global_step": 81019, "epoch": 669} {"train_loss": -37.02132797241211, "global_step": 81020, "epoch": 669} {"train_loss": -37.04339599609375, "global_step": 81021, "epoch": 669} {"train_loss": -36.99204635620117, "global_step": 81022, "epoch": 669} {"train_loss": -37.25904846191406, "global_step": 81023, "epoch": 669} {"train_loss": -36.98797607421875, "global_step": 81024, "epoch": 669} {"train_loss": -36.60531234741211, "global_step": 81025, "epoch": 669} {"train_loss": -37.51417541503906, "global_step": 81026, "epoch": 669} {"train_loss": -37.21761703491211, "global_step": 81027, "epoch": 669} {"train_loss": -37.35763168334961, "global_step": 81028, "epoch": 669} {"train_loss": -37.73575973510742, "global_step": 81029, "epoch": 669} {"train_loss": -37.4307861328125, "global_step": 81030, "epoch": 669} {"train_loss": -37.54549026489258, "global_step": 81031, "epoch": 669} {"train_loss": -37.81097412109375, "global_step": 81032, "epoch": 669} {"train_loss": -37.169471740722656, "global_step": 81033, "epoch": 669} {"train_loss": -37.49015426635742, "global_step": 81034, "epoch": 669} {"train_loss": -37.3834342956543, "global_step": 81035, "epoch": 669} {"train_loss": -37.4972038269043, "global_step": 81036, "epoch": 669} {"train_loss": -37.472450256347656, "global_step": 81037, "epoch": 669} {"train_loss": -37.5578498840332, "global_step": 81038, "epoch": 669} {"train_loss": -37.91611862182617, "global_step": 81039, "epoch": 669} {"train_loss": -37.92123031616211, "global_step": 81040, "epoch": 669} {"train_loss": -38.18717575073242, "global_step": 81041, "epoch": 669} {"train_loss": -37.64446258544922, "global_step": 81042, "epoch": 669} {"train_loss": -37.932247161865234, "global_step": 81043, "epoch": 669} {"train_loss": -37.67879867553711, "global_step": 81044, "epoch": 669} {"train_loss": -38.03666687011719, "global_step": 81045, "epoch": 669} {"train_loss": -38.08536911010742, "global_step": 81046, "epoch": 669} {"train_loss": -38.11518096923828, "global_step": 81047, "epoch": 669} {"train_loss": -37.7155647277832, "global_step": 81048, "epoch": 669} {"train_loss": -37.953731536865234, "global_step": 81049, "epoch": 669} {"train_loss": -37.831390380859375, "global_step": 81050, "epoch": 669} {"train_loss": -38.28204345703125, "global_step": 81051, "epoch": 669} {"train_loss": -37.90831756591797, "global_step": 81052, "epoch": 669} {"train_loss": -37.95686340332031, "global_step": 81053, "epoch": 669} {"train_loss": -37.81923294067383, "global_step": 81054, "epoch": 669} {"train_loss": -37.26729202270508, "global_step": 81055, "epoch": 669} {"train_loss": -35.573944091796875, "global_step": 81056, "epoch": 669} {"train_loss": -36.41764450073242, "global_step": 81057, "epoch": 669} {"train_loss": -36.8138427734375, "global_step": 81058, "epoch": 669} {"train_loss": -36.9934196472168, "global_step": 81059, "epoch": 669} {"train_loss": -37.608211517333984, "global_step": 81060, "epoch": 669} {"train_loss": -37.812408447265625, "global_step": 81061, "epoch": 669} {"train_loss": -38.25980758666992, "global_step": 81062, "epoch": 669} {"train_loss": -37.9067497253418, "global_step": 81063, "epoch": 669} {"train_loss": -37.87955856323242, "global_step": 81064, "epoch": 669} {"train_loss": -37.8873291015625, "global_step": 81065, "epoch": 669} {"train_loss": -37.98664093017578, "global_step": 81066, "epoch": 669} {"train_loss": -37.85707473754883, "global_step": 81067, "epoch": 669} {"train_loss": -38.193031311035156, "global_step": 81068, "epoch": 669} {"train_loss": -35.50858231221349, "global_step": 81069, "epoch": 669, "val_loss": 2804259.0} {"train_loss": -37.141143798828125, "global_step": 81070, "epoch": 670} {"train_loss": -37.1995964050293, "global_step": 81071, "epoch": 670} {"train_loss": -36.62822341918945, "global_step": 81072, "epoch": 670} {"train_loss": -35.49610137939453, "global_step": 81073, "epoch": 670} {"train_loss": -32.48653793334961, "global_step": 81074, "epoch": 670} {"train_loss": -20.135631561279297, "global_step": 81075, "epoch": 670} {"train_loss": -10.953155517578125, "global_step": 81076, "epoch": 670} {"train_loss": -17.484375, "global_step": 81077, "epoch": 670} {"train_loss": -35.8447380065918, "global_step": 81078, "epoch": 670} {"train_loss": -22.739261627197266, "global_step": 81079, "epoch": 670} {"train_loss": -33.23090362548828, "global_step": 81080, "epoch": 670} {"train_loss": -28.894590377807617, "global_step": 81081, "epoch": 670} {"train_loss": -35.14582061767578, "global_step": 81082, "epoch": 670} {"train_loss": -31.429346084594727, "global_step": 81083, "epoch": 670} {"train_loss": -30.082727432250977, "global_step": 81084, "epoch": 670} {"train_loss": -35.266632080078125, "global_step": 81085, "epoch": 670} {"train_loss": -31.11305809020996, "global_step": 81086, "epoch": 670} {"train_loss": -33.14202880859375, "global_step": 81087, "epoch": 670} {"train_loss": -35.04000473022461, "global_step": 81088, "epoch": 670} {"train_loss": -33.350830078125, "global_step": 81089, "epoch": 670} {"train_loss": -33.761741638183594, "global_step": 81090, "epoch": 670} {"train_loss": -34.6403923034668, "global_step": 81091, "epoch": 670} {"train_loss": -35.8132438659668, "global_step": 81092, "epoch": 670} {"train_loss": -34.7051887512207, "global_step": 81093, "epoch": 670} {"train_loss": -34.71786880493164, "global_step": 81094, "epoch": 670} {"train_loss": -35.0081901550293, "global_step": 81095, "epoch": 670} {"train_loss": -36.84669876098633, "global_step": 81096, "epoch": 670} {"train_loss": -35.51981735229492, "global_step": 81097, "epoch": 670} {"train_loss": -34.8856315612793, "global_step": 81098, "epoch": 670} {"train_loss": -33.242069244384766, "global_step": 81099, "epoch": 670} {"train_loss": -35.7485466003418, "global_step": 81100, "epoch": 670} {"train_loss": -36.072906494140625, "global_step": 81101, "epoch": 670} {"train_loss": -33.95426559448242, "global_step": 81102, "epoch": 670} {"train_loss": -36.03884506225586, "global_step": 81103, "epoch": 670} {"train_loss": -35.80121612548828, "global_step": 81104, "epoch": 670} {"train_loss": -35.825897216796875, "global_step": 81105, "epoch": 670} {"train_loss": -34.3030891418457, "global_step": 81106, "epoch": 670} {"train_loss": -35.87492752075195, "global_step": 81107, "epoch": 670} {"train_loss": -33.421844482421875, "global_step": 81108, "epoch": 670} {"train_loss": -35.47321701049805, "global_step": 81109, "epoch": 670} {"train_loss": -36.276222229003906, "global_step": 81110, "epoch": 670} {"train_loss": -35.945552825927734, "global_step": 81111, "epoch": 670} {"train_loss": -36.40640640258789, "global_step": 81112, "epoch": 670} {"train_loss": -35.7962646484375, "global_step": 81113, "epoch": 670} {"train_loss": -35.24396514892578, "global_step": 81114, "epoch": 670} {"train_loss": -36.45798873901367, "global_step": 81115, "epoch": 670} {"train_loss": -35.47529220581055, "global_step": 81116, "epoch": 670} {"train_loss": -36.72935104370117, "global_step": 81117, "epoch": 670} {"train_loss": -35.52948760986328, "global_step": 81118, "epoch": 670} {"train_loss": -35.448631286621094, "global_step": 81119, "epoch": 670} {"train_loss": -35.53010177612305, "global_step": 81120, "epoch": 670} {"train_loss": -36.18933868408203, "global_step": 81121, "epoch": 670} {"train_loss": -36.034523010253906, "global_step": 81122, "epoch": 670} {"train_loss": -35.966651916503906, "global_step": 81123, "epoch": 670} {"train_loss": -36.791725158691406, "global_step": 81124, "epoch": 670} {"train_loss": -36.53837585449219, "global_step": 81125, "epoch": 670} {"train_loss": -36.876922607421875, "global_step": 81126, "epoch": 670} {"train_loss": -36.84618377685547, "global_step": 81127, "epoch": 670} {"train_loss": -36.58216094970703, "global_step": 81128, "epoch": 670} {"train_loss": -36.2292594909668, "global_step": 81129, "epoch": 670} {"train_loss": -36.28379440307617, "global_step": 81130, "epoch": 670} {"train_loss": -36.79810333251953, "global_step": 81131, "epoch": 670} {"train_loss": -36.927494049072266, "global_step": 81132, "epoch": 670} {"train_loss": -36.725650787353516, "global_step": 81133, "epoch": 670} {"train_loss": -36.369529724121094, "global_step": 81134, "epoch": 670} {"train_loss": -36.18305206298828, "global_step": 81135, "epoch": 670} {"train_loss": -36.128395080566406, "global_step": 81136, "epoch": 670} {"train_loss": -37.0163459777832, "global_step": 81137, "epoch": 670} {"train_loss": -37.17513656616211, "global_step": 81138, "epoch": 670} {"train_loss": -37.11898422241211, "global_step": 81139, "epoch": 670} {"train_loss": -36.45542526245117, "global_step": 81140, "epoch": 670} {"train_loss": -37.18952178955078, "global_step": 81141, "epoch": 670} {"train_loss": -37.12220001220703, "global_step": 81142, "epoch": 670} {"train_loss": -37.19428634643555, "global_step": 81143, "epoch": 670} {"train_loss": -37.25966262817383, "global_step": 81144, "epoch": 670} {"train_loss": -37.77808380126953, "global_step": 81145, "epoch": 670} {"train_loss": -37.343605041503906, "global_step": 81146, "epoch": 670} {"train_loss": -37.13493347167969, "global_step": 81147, "epoch": 670} {"train_loss": -37.170162200927734, "global_step": 81148, "epoch": 670} {"train_loss": -36.777217864990234, "global_step": 81149, "epoch": 670} {"train_loss": -37.4629020690918, "global_step": 81150, "epoch": 670} {"train_loss": -37.8607292175293, "global_step": 81151, "epoch": 670} {"train_loss": -37.376834869384766, "global_step": 81152, "epoch": 670} {"train_loss": -37.16371154785156, "global_step": 81153, "epoch": 670} {"train_loss": -36.312007904052734, "global_step": 81154, "epoch": 670} {"train_loss": -37.38730239868164, "global_step": 81155, "epoch": 670} {"train_loss": -35.85602951049805, "global_step": 81156, "epoch": 670} {"train_loss": -33.23048782348633, "global_step": 81157, "epoch": 670} {"train_loss": -35.12386703491211, "global_step": 81158, "epoch": 670} {"train_loss": -37.11532211303711, "global_step": 81159, "epoch": 670} {"train_loss": -36.60049057006836, "global_step": 81160, "epoch": 670} {"train_loss": -37.005489349365234, "global_step": 81161, "epoch": 670} {"train_loss": -37.241424560546875, "global_step": 81162, "epoch": 670} {"train_loss": -35.444759368896484, "global_step": 81163, "epoch": 670} {"train_loss": -37.826595306396484, "global_step": 81164, "epoch": 670} {"train_loss": -36.89874267578125, "global_step": 81165, "epoch": 670} {"train_loss": -37.587646484375, "global_step": 81166, "epoch": 670} {"train_loss": -37.49026107788086, "global_step": 81167, "epoch": 670} {"train_loss": -37.56772994995117, "global_step": 81168, "epoch": 670} {"train_loss": -36.37527084350586, "global_step": 81169, "epoch": 670} {"train_loss": -37.45461654663086, "global_step": 81170, "epoch": 670} {"train_loss": -37.531959533691406, "global_step": 81171, "epoch": 670} {"train_loss": -37.63315963745117, "global_step": 81172, "epoch": 670} {"train_loss": -37.0217170715332, "global_step": 81173, "epoch": 670} {"train_loss": -37.816741943359375, "global_step": 81174, "epoch": 670} {"train_loss": -37.26031494140625, "global_step": 81175, "epoch": 670} {"train_loss": -37.6160774230957, "global_step": 81176, "epoch": 670} {"train_loss": -37.467159271240234, "global_step": 81177, "epoch": 670} {"train_loss": -37.70852279663086, "global_step": 81178, "epoch": 670} {"train_loss": -37.859230041503906, "global_step": 81179, "epoch": 670} {"train_loss": -38.01670837402344, "global_step": 81180, "epoch": 670} {"train_loss": -37.99262619018555, "global_step": 81181, "epoch": 670} {"train_loss": -37.78745651245117, "global_step": 81182, "epoch": 670} {"train_loss": -37.05462646484375, "global_step": 81183, "epoch": 670} {"train_loss": -37.794952392578125, "global_step": 81184, "epoch": 670} {"train_loss": -37.85284423828125, "global_step": 81185, "epoch": 670} {"train_loss": -38.043251037597656, "global_step": 81186, "epoch": 670} {"train_loss": -37.168922424316406, "global_step": 81187, "epoch": 670} {"train_loss": -37.81828308105469, "global_step": 81188, "epoch": 670} {"train_loss": -37.51085662841797, "global_step": 81189, "epoch": 670} {"train_loss": -35.53933920742067, "global_step": 81190, "epoch": 670, "val_loss": 2714558.5} {"train_loss": -37.84873962402344, "global_step": 81191, "epoch": 671} {"train_loss": -37.968727111816406, "global_step": 81192, "epoch": 671} {"train_loss": -37.8787956237793, "global_step": 81193, "epoch": 671} {"train_loss": -36.94147872924805, "global_step": 81194, "epoch": 671} {"train_loss": -37.9403190612793, "global_step": 81195, "epoch": 671} {"train_loss": -38.07424545288086, "global_step": 81196, "epoch": 671} {"train_loss": -37.99197006225586, "global_step": 81197, "epoch": 671} {"train_loss": -37.21010971069336, "global_step": 81198, "epoch": 671} {"train_loss": -38.045814514160156, "global_step": 81199, "epoch": 671} {"train_loss": -36.97544479370117, "global_step": 81200, "epoch": 671} {"train_loss": -37.91532516479492, "global_step": 81201, "epoch": 671} {"train_loss": -37.78664779663086, "global_step": 81202, "epoch": 671} {"train_loss": -37.78998947143555, "global_step": 81203, "epoch": 671} {"train_loss": -37.7069091796875, "global_step": 81204, "epoch": 671} {"train_loss": -37.5004997253418, "global_step": 81205, "epoch": 671} {"train_loss": -37.4820671081543, "global_step": 81206, "epoch": 671} {"train_loss": -37.55812454223633, "global_step": 81207, "epoch": 671} {"train_loss": -37.066749572753906, "global_step": 81208, "epoch": 671} {"train_loss": -37.25218200683594, "global_step": 81209, "epoch": 671} {"train_loss": -37.68337631225586, "global_step": 81210, "epoch": 671} {"train_loss": -37.24971389770508, "global_step": 81211, "epoch": 671} {"train_loss": -38.302940368652344, "global_step": 81212, "epoch": 671} {"train_loss": -37.88462829589844, "global_step": 81213, "epoch": 671} {"train_loss": -38.30445098876953, "global_step": 81214, "epoch": 671} {"train_loss": -38.31023025512695, "global_step": 81215, "epoch": 671} {"train_loss": -37.02511978149414, "global_step": 81216, "epoch": 671} {"train_loss": -36.0922966003418, "global_step": 81217, "epoch": 671} {"train_loss": -34.22817611694336, "global_step": 81218, "epoch": 671} {"train_loss": -37.8031120300293, "global_step": 81219, "epoch": 671} {"train_loss": -37.10700607299805, "global_step": 81220, "epoch": 671} {"train_loss": -36.5004768371582, "global_step": 81221, "epoch": 671} {"train_loss": -32.714115142822266, "global_step": 81222, "epoch": 671} {"train_loss": -29.521869659423828, "global_step": 81223, "epoch": 671} {"train_loss": -34.043006896972656, "global_step": 81224, "epoch": 671} {"train_loss": -34.74711608886719, "global_step": 81225, "epoch": 671} {"train_loss": -31.492033004760742, "global_step": 81226, "epoch": 671} {"train_loss": -31.689001083374023, "global_step": 81227, "epoch": 671} {"train_loss": -34.29469680786133, "global_step": 81228, "epoch": 671} {"train_loss": -33.96084213256836, "global_step": 81229, "epoch": 671} {"train_loss": -29.629535675048828, "global_step": 81230, "epoch": 671} {"train_loss": -30.339826583862305, "global_step": 81231, "epoch": 671} {"train_loss": -31.495136260986328, "global_step": 81232, "epoch": 671} {"train_loss": -34.867279052734375, "global_step": 81233, "epoch": 671} {"train_loss": -31.696125030517578, "global_step": 81234, "epoch": 671} {"train_loss": -30.873809814453125, "global_step": 81235, "epoch": 671} {"train_loss": -35.23066329956055, "global_step": 81236, "epoch": 671} {"train_loss": -33.97612380981445, "global_step": 81237, "epoch": 671} {"train_loss": -26.85886001586914, "global_step": 81238, "epoch": 671} {"train_loss": -34.416900634765625, "global_step": 81239, "epoch": 671} {"train_loss": -34.27244186401367, "global_step": 81240, "epoch": 671} {"train_loss": -33.31912612915039, "global_step": 81241, "epoch": 671} {"train_loss": -34.38835144042969, "global_step": 81242, "epoch": 671} {"train_loss": -29.26450538635254, "global_step": 81243, "epoch": 671} {"train_loss": -31.695077896118164, "global_step": 81244, "epoch": 671} {"train_loss": -34.1800651550293, "global_step": 81245, "epoch": 671} {"train_loss": -33.49465560913086, "global_step": 81246, "epoch": 671} {"train_loss": -33.36207580566406, "global_step": 81247, "epoch": 671} {"train_loss": -33.718868255615234, "global_step": 81248, "epoch": 671} {"train_loss": -32.49518966674805, "global_step": 81249, "epoch": 671} {"train_loss": -33.78709030151367, "global_step": 81250, "epoch": 671} {"train_loss": -33.95253372192383, "global_step": 81251, "epoch": 671} {"train_loss": -33.9086799621582, "global_step": 81252, "epoch": 671} {"train_loss": -35.172119140625, "global_step": 81253, "epoch": 671} {"train_loss": -34.03337097167969, "global_step": 81254, "epoch": 671} {"train_loss": -34.994930267333984, "global_step": 81255, "epoch": 671} {"train_loss": -34.153167724609375, "global_step": 81256, "epoch": 671} {"train_loss": -35.07451248168945, "global_step": 81257, "epoch": 671} {"train_loss": -34.599918365478516, "global_step": 81258, "epoch": 671} {"train_loss": -34.77198791503906, "global_step": 81259, "epoch": 671} {"train_loss": -34.05609130859375, "global_step": 81260, "epoch": 671} {"train_loss": -35.2409553527832, "global_step": 81261, "epoch": 671} {"train_loss": -35.92140579223633, "global_step": 81262, "epoch": 671} {"train_loss": -35.138282775878906, "global_step": 81263, "epoch": 671} {"train_loss": -36.142093658447266, "global_step": 81264, "epoch": 671} {"train_loss": -35.022491455078125, "global_step": 81265, "epoch": 671} {"train_loss": -36.254737854003906, "global_step": 81266, "epoch": 671} {"train_loss": -35.95145034790039, "global_step": 81267, "epoch": 671} {"train_loss": -36.12347412109375, "global_step": 81268, "epoch": 671} {"train_loss": -36.315284729003906, "global_step": 81269, "epoch": 671} {"train_loss": -35.45721435546875, "global_step": 81270, "epoch": 671} {"train_loss": -35.92692184448242, "global_step": 81271, "epoch": 671} {"train_loss": -36.335289001464844, "global_step": 81272, "epoch": 671} {"train_loss": -36.292823791503906, "global_step": 81273, "epoch": 671} {"train_loss": -35.37621307373047, "global_step": 81274, "epoch": 671} {"train_loss": -36.293941497802734, "global_step": 81275, "epoch": 671} {"train_loss": -35.95576858520508, "global_step": 81276, "epoch": 671} {"train_loss": -36.0083122253418, "global_step": 81277, "epoch": 671} {"train_loss": -36.6890754699707, "global_step": 81278, "epoch": 671} {"train_loss": -36.39451217651367, "global_step": 81279, "epoch": 671} {"train_loss": -36.3206901550293, "global_step": 81280, "epoch": 671} {"train_loss": -36.43874740600586, "global_step": 81281, "epoch": 671} {"train_loss": -36.67686080932617, "global_step": 81282, "epoch": 671} {"train_loss": -36.90372848510742, "global_step": 81283, "epoch": 671} {"train_loss": -36.452049255371094, "global_step": 81284, "epoch": 671} {"train_loss": -36.796112060546875, "global_step": 81285, "epoch": 671} {"train_loss": -36.78606414794922, "global_step": 81286, "epoch": 671} {"train_loss": -36.92222595214844, "global_step": 81287, "epoch": 671} {"train_loss": -37.1462516784668, "global_step": 81288, "epoch": 671} {"train_loss": -36.757022857666016, "global_step": 81289, "epoch": 671} {"train_loss": -36.93780517578125, "global_step": 81290, "epoch": 671} {"train_loss": -36.79008483886719, "global_step": 81291, "epoch": 671} {"train_loss": -36.998626708984375, "global_step": 81292, "epoch": 671} {"train_loss": -37.119232177734375, "global_step": 81293, "epoch": 671} {"train_loss": -37.00239181518555, "global_step": 81294, "epoch": 671} {"train_loss": -36.870147705078125, "global_step": 81295, "epoch": 671} {"train_loss": -36.51356887817383, "global_step": 81296, "epoch": 671} {"train_loss": -37.34803009033203, "global_step": 81297, "epoch": 671} {"train_loss": -37.139469146728516, "global_step": 81298, "epoch": 671} {"train_loss": -37.160377502441406, "global_step": 81299, "epoch": 671} {"train_loss": -37.6071662902832, "global_step": 81300, "epoch": 671} {"train_loss": -37.13176345825195, "global_step": 81301, "epoch": 671} {"train_loss": -37.798736572265625, "global_step": 81302, "epoch": 671} {"train_loss": -37.62008285522461, "global_step": 81303, "epoch": 671} {"train_loss": -37.89455795288086, "global_step": 81304, "epoch": 671} {"train_loss": -37.394012451171875, "global_step": 81305, "epoch": 671} {"train_loss": -37.55397415161133, "global_step": 81306, "epoch": 671} {"train_loss": -37.0587272644043, "global_step": 81307, "epoch": 671} {"train_loss": -37.424991607666016, "global_step": 81308, "epoch": 671} {"train_loss": -37.7359619140625, "global_step": 81309, "epoch": 671} {"train_loss": -37.62610626220703, "global_step": 81310, "epoch": 671} {"train_loss": -35.72238712468423, "global_step": 81311, "epoch": 671, "val_loss": 2659568.0} {"train_loss": -37.485511779785156, "global_step": 81312, "epoch": 672} {"train_loss": -37.588619232177734, "global_step": 81313, "epoch": 672} {"train_loss": -37.74506759643555, "global_step": 81314, "epoch": 672} {"train_loss": -37.71165084838867, "global_step": 81315, "epoch": 672} {"train_loss": -38.10610580444336, "global_step": 81316, "epoch": 672} {"train_loss": -36.81222152709961, "global_step": 81317, "epoch": 672} {"train_loss": -37.67132568359375, "global_step": 81318, "epoch": 672} {"train_loss": -37.292816162109375, "global_step": 81319, "epoch": 672} {"train_loss": -33.37068557739258, "global_step": 81320, "epoch": 672} {"train_loss": -22.894865036010742, "global_step": 81321, "epoch": 672} {"train_loss": -25.321985244750977, "global_step": 81322, "epoch": 672} {"train_loss": -35.899288177490234, "global_step": 81323, "epoch": 672} {"train_loss": -17.489599227905273, "global_step": 81324, "epoch": 672} {"train_loss": -35.12504196166992, "global_step": 81325, "epoch": 672} {"train_loss": -18.692371368408203, "global_step": 81326, "epoch": 672} {"train_loss": -34.307373046875, "global_step": 81327, "epoch": 672} {"train_loss": -23.62262535095215, "global_step": 81328, "epoch": 672} {"train_loss": -32.739959716796875, "global_step": 81329, "epoch": 672} {"train_loss": -35.9012451171875, "global_step": 81330, "epoch": 672} {"train_loss": -31.8377685546875, "global_step": 81331, "epoch": 672} {"train_loss": -31.584314346313477, "global_step": 81332, "epoch": 672} {"train_loss": -36.401283264160156, "global_step": 81333, "epoch": 672} {"train_loss": -35.469356536865234, "global_step": 81334, "epoch": 672} {"train_loss": -33.66233444213867, "global_step": 81335, "epoch": 672} {"train_loss": -33.86513137817383, "global_step": 81336, "epoch": 672} {"train_loss": -36.0435905456543, "global_step": 81337, "epoch": 672} {"train_loss": -36.07045364379883, "global_step": 81338, "epoch": 672} {"train_loss": -35.511619567871094, "global_step": 81339, "epoch": 672} {"train_loss": -35.8402214050293, "global_step": 81340, "epoch": 672} {"train_loss": -34.291748046875, "global_step": 81341, "epoch": 672} {"train_loss": -36.20048904418945, "global_step": 81342, "epoch": 672} {"train_loss": -36.68233871459961, "global_step": 81343, "epoch": 672} {"train_loss": -36.670658111572266, "global_step": 81344, "epoch": 672} {"train_loss": -36.282752990722656, "global_step": 81345, "epoch": 672} {"train_loss": -36.1581916809082, "global_step": 81346, "epoch": 672} {"train_loss": -36.64274215698242, "global_step": 81347, "epoch": 672} {"train_loss": -37.05524444580078, "global_step": 81348, "epoch": 672} {"train_loss": -37.25819396972656, "global_step": 81349, "epoch": 672} {"train_loss": -36.93193435668945, "global_step": 81350, "epoch": 672} {"train_loss": -37.676204681396484, "global_step": 81351, "epoch": 672} {"train_loss": -36.70393753051758, "global_step": 81352, "epoch": 672} {"train_loss": -37.13866424560547, "global_step": 81353, "epoch": 672} {"train_loss": -37.30863571166992, "global_step": 81354, "epoch": 672} {"train_loss": -36.76240539550781, "global_step": 81355, "epoch": 672} {"train_loss": -37.177982330322266, "global_step": 81356, "epoch": 672} {"train_loss": -37.26226043701172, "global_step": 81357, "epoch": 672} {"train_loss": -37.69846725463867, "global_step": 81358, "epoch": 672} {"train_loss": -36.869388580322266, "global_step": 81359, "epoch": 672} {"train_loss": -37.144439697265625, "global_step": 81360, "epoch": 672} {"train_loss": -37.3847770690918, "global_step": 81361, "epoch": 672} {"train_loss": -37.58620834350586, "global_step": 81362, "epoch": 672} {"train_loss": -36.97922897338867, "global_step": 81363, "epoch": 672} {"train_loss": -37.14326477050781, "global_step": 81364, "epoch": 672} {"train_loss": -37.180599212646484, "global_step": 81365, "epoch": 672} {"train_loss": -37.25273132324219, "global_step": 81366, "epoch": 672} {"train_loss": -37.114845275878906, "global_step": 81367, "epoch": 672} {"train_loss": -37.5167236328125, "global_step": 81368, "epoch": 672} {"train_loss": -38.03927993774414, "global_step": 81369, "epoch": 672} {"train_loss": -37.2765998840332, "global_step": 81370, "epoch": 672} {"train_loss": -37.814144134521484, "global_step": 81371, "epoch": 672} {"train_loss": -37.81727600097656, "global_step": 81372, "epoch": 672} {"train_loss": -37.1814079284668, "global_step": 81373, "epoch": 672} {"train_loss": -37.30288314819336, "global_step": 81374, "epoch": 672} {"train_loss": -37.84187698364258, "global_step": 81375, "epoch": 672} {"train_loss": -37.97066879272461, "global_step": 81376, "epoch": 672} {"train_loss": -37.4836540222168, "global_step": 81377, "epoch": 672} {"train_loss": -37.935787200927734, "global_step": 81378, "epoch": 672} {"train_loss": -37.74512481689453, "global_step": 81379, "epoch": 672} {"train_loss": -37.988197326660156, "global_step": 81380, "epoch": 672} {"train_loss": -38.12614059448242, "global_step": 81381, "epoch": 672} {"train_loss": -38.34653854370117, "global_step": 81382, "epoch": 672} {"train_loss": -37.30172348022461, "global_step": 81383, "epoch": 672} {"train_loss": -37.161556243896484, "global_step": 81384, "epoch": 672} {"train_loss": -37.86015701293945, "global_step": 81385, "epoch": 672} {"train_loss": -37.92836380004883, "global_step": 81386, "epoch": 672} {"train_loss": -37.018035888671875, "global_step": 81387, "epoch": 672} {"train_loss": -37.34748077392578, "global_step": 81388, "epoch": 672} {"train_loss": -35.6563606262207, "global_step": 81389, "epoch": 672} {"train_loss": -34.290950775146484, "global_step": 81390, "epoch": 672} {"train_loss": -31.3873348236084, "global_step": 81391, "epoch": 672} {"train_loss": -32.92190170288086, "global_step": 81392, "epoch": 672} {"train_loss": -37.07374572753906, "global_step": 81393, "epoch": 672} {"train_loss": -34.69792556762695, "global_step": 81394, "epoch": 672} {"train_loss": -35.1744270324707, "global_step": 81395, "epoch": 672} {"train_loss": -35.11737060546875, "global_step": 81396, "epoch": 672} {"train_loss": -35.056007385253906, "global_step": 81397, "epoch": 672} {"train_loss": -36.903472900390625, "global_step": 81398, "epoch": 672} {"train_loss": -34.7675895690918, "global_step": 81399, "epoch": 672} {"train_loss": -36.33320236206055, "global_step": 81400, "epoch": 672} {"train_loss": -36.50952911376953, "global_step": 81401, "epoch": 672} {"train_loss": -36.88254928588867, "global_step": 81402, "epoch": 672} {"train_loss": -35.1146125793457, "global_step": 81403, "epoch": 672} {"train_loss": -37.06100082397461, "global_step": 81404, "epoch": 672} {"train_loss": -35.53800582885742, "global_step": 81405, "epoch": 672} {"train_loss": -36.709320068359375, "global_step": 81406, "epoch": 672} {"train_loss": -34.7711181640625, "global_step": 81407, "epoch": 672} {"train_loss": -36.836669921875, "global_step": 81408, "epoch": 672} {"train_loss": -35.3116340637207, "global_step": 81409, "epoch": 672} {"train_loss": -35.59975051879883, "global_step": 81410, "epoch": 672} {"train_loss": -36.98736572265625, "global_step": 81411, "epoch": 672} {"train_loss": -36.6763801574707, "global_step": 81412, "epoch": 672} {"train_loss": -36.223480224609375, "global_step": 81413, "epoch": 672} {"train_loss": -36.179744720458984, "global_step": 81414, "epoch": 672} {"train_loss": -35.96289825439453, "global_step": 81415, "epoch": 672} {"train_loss": -35.91071701049805, "global_step": 81416, "epoch": 672} {"train_loss": -36.89736557006836, "global_step": 81417, "epoch": 672} {"train_loss": -36.72649383544922, "global_step": 81418, "epoch": 672} {"train_loss": -37.357147216796875, "global_step": 81419, "epoch": 672} {"train_loss": -36.59009552001953, "global_step": 81420, "epoch": 672} {"train_loss": -35.115577697753906, "global_step": 81421, "epoch": 672} {"train_loss": -36.786739349365234, "global_step": 81422, "epoch": 672} {"train_loss": -37.175933837890625, "global_step": 81423, "epoch": 672} {"train_loss": -36.77473068237305, "global_step": 81424, "epoch": 672} {"train_loss": -36.70402145385742, "global_step": 81425, "epoch": 672} {"train_loss": -37.19390106201172, "global_step": 81426, "epoch": 672} {"train_loss": -36.58790969848633, "global_step": 81427, "epoch": 672} {"train_loss": -37.53944778442383, "global_step": 81428, "epoch": 672} {"train_loss": -36.31185531616211, "global_step": 81429, "epoch": 672} {"train_loss": -36.27061080932617, "global_step": 81430, "epoch": 672} {"train_loss": -36.549922943115234, "global_step": 81431, "epoch": 672} {"train_loss": -35.82381524330329, "global_step": 81432, "epoch": 672, "val_loss": 2676017.0} {"train_loss": -35.5163688659668, "global_step": 81433, "epoch": 673} {"train_loss": -37.37157440185547, "global_step": 81434, "epoch": 673} {"train_loss": -37.257686614990234, "global_step": 81435, "epoch": 673} {"train_loss": -37.272090911865234, "global_step": 81436, "epoch": 673} {"train_loss": -37.2708625793457, "global_step": 81437, "epoch": 673} {"train_loss": -37.20015335083008, "global_step": 81438, "epoch": 673} {"train_loss": -37.176082611083984, "global_step": 81439, "epoch": 673} {"train_loss": -37.70602035522461, "global_step": 81440, "epoch": 673} {"train_loss": -33.25514602661133, "global_step": 81441, "epoch": 673} {"train_loss": -36.87746810913086, "global_step": 81442, "epoch": 673} {"train_loss": -37.02260971069336, "global_step": 81443, "epoch": 673} {"train_loss": -37.5352783203125, "global_step": 81444, "epoch": 673} {"train_loss": -36.69999313354492, "global_step": 81445, "epoch": 673} {"train_loss": -36.74911117553711, "global_step": 81446, "epoch": 673} {"train_loss": -36.215797424316406, "global_step": 81447, "epoch": 673} {"train_loss": -37.05127716064453, "global_step": 81448, "epoch": 673} {"train_loss": -37.3329963684082, "global_step": 81449, "epoch": 673} {"train_loss": -36.917091369628906, "global_step": 81450, "epoch": 673} {"train_loss": -34.71636962890625, "global_step": 81451, "epoch": 673} {"train_loss": -36.15183639526367, "global_step": 81452, "epoch": 673} {"train_loss": -37.33266067504883, "global_step": 81453, "epoch": 673} {"train_loss": -37.134029388427734, "global_step": 81454, "epoch": 673} {"train_loss": -36.05769348144531, "global_step": 81455, "epoch": 673} {"train_loss": -35.214385986328125, "global_step": 81456, "epoch": 673} {"train_loss": -36.49692153930664, "global_step": 81457, "epoch": 673} {"train_loss": -37.963096618652344, "global_step": 81458, "epoch": 673} {"train_loss": -34.00343322753906, "global_step": 81459, "epoch": 673} {"train_loss": -35.1319694519043, "global_step": 81460, "epoch": 673} {"train_loss": -36.605648040771484, "global_step": 81461, "epoch": 673} {"train_loss": -36.71305847167969, "global_step": 81462, "epoch": 673} {"train_loss": -37.52815628051758, "global_step": 81463, "epoch": 673} {"train_loss": -35.99951934814453, "global_step": 81464, "epoch": 673} {"train_loss": -34.98862838745117, "global_step": 81465, "epoch": 673} {"train_loss": -35.289772033691406, "global_step": 81466, "epoch": 673} {"train_loss": -36.894527435302734, "global_step": 81467, "epoch": 673} {"train_loss": -37.071136474609375, "global_step": 81468, "epoch": 673} {"train_loss": -35.115692138671875, "global_step": 81469, "epoch": 673} {"train_loss": -37.04610824584961, "global_step": 81470, "epoch": 673} {"train_loss": -37.01937484741211, "global_step": 81471, "epoch": 673} {"train_loss": -36.787044525146484, "global_step": 81472, "epoch": 673} {"train_loss": -37.10818099975586, "global_step": 81473, "epoch": 673} {"train_loss": -37.32373046875, "global_step": 81474, "epoch": 673} {"train_loss": -37.85783767700195, "global_step": 81475, "epoch": 673} {"train_loss": -36.25558090209961, "global_step": 81476, "epoch": 673} {"train_loss": -37.49370193481445, "global_step": 81477, "epoch": 673} {"train_loss": -37.546810150146484, "global_step": 81478, "epoch": 673} {"train_loss": -37.20966720581055, "global_step": 81479, "epoch": 673} {"train_loss": -37.795223236083984, "global_step": 81480, "epoch": 673} {"train_loss": -37.18508529663086, "global_step": 81481, "epoch": 673} {"train_loss": -37.1535530090332, "global_step": 81482, "epoch": 673} {"train_loss": -37.90442657470703, "global_step": 81483, "epoch": 673} {"train_loss": -37.6076774597168, "global_step": 81484, "epoch": 673} {"train_loss": -36.05047607421875, "global_step": 81485, "epoch": 673} {"train_loss": -37.10550308227539, "global_step": 81486, "epoch": 673} {"train_loss": -36.939002990722656, "global_step": 81487, "epoch": 673} {"train_loss": -37.606075286865234, "global_step": 81488, "epoch": 673} {"train_loss": -37.72220993041992, "global_step": 81489, "epoch": 673} {"train_loss": -37.6478157043457, "global_step": 81490, "epoch": 673} {"train_loss": -37.788482666015625, "global_step": 81491, "epoch": 673} {"train_loss": -37.42079544067383, "global_step": 81492, "epoch": 673} {"train_loss": -37.85854721069336, "global_step": 81493, "epoch": 673} {"train_loss": -37.10459518432617, "global_step": 81494, "epoch": 673} {"train_loss": -36.25479507446289, "global_step": 81495, "epoch": 673} {"train_loss": -37.22060012817383, "global_step": 81496, "epoch": 673} {"train_loss": -37.643409729003906, "global_step": 81497, "epoch": 673} {"train_loss": -37.17902755737305, "global_step": 81498, "epoch": 673} {"train_loss": -37.463253021240234, "global_step": 81499, "epoch": 673} {"train_loss": -37.51432418823242, "global_step": 81500, "epoch": 673} {"train_loss": -37.093448638916016, "global_step": 81501, "epoch": 673} {"train_loss": -37.2929573059082, "global_step": 81502, "epoch": 673} {"train_loss": -37.68291091918945, "global_step": 81503, "epoch": 673} {"train_loss": -37.383480072021484, "global_step": 81504, "epoch": 673} {"train_loss": -38.03900146484375, "global_step": 81505, "epoch": 673} {"train_loss": -37.01652145385742, "global_step": 81506, "epoch": 673} {"train_loss": -37.5187873840332, "global_step": 81507, "epoch": 673} {"train_loss": -36.65024185180664, "global_step": 81508, "epoch": 673} {"train_loss": -37.63106918334961, "global_step": 81509, "epoch": 673} {"train_loss": -37.78312301635742, "global_step": 81510, "epoch": 673} {"train_loss": -37.57716751098633, "global_step": 81511, "epoch": 673} {"train_loss": -37.56443405151367, "global_step": 81512, "epoch": 673} {"train_loss": -37.84267807006836, "global_step": 81513, "epoch": 673} {"train_loss": -36.633113861083984, "global_step": 81514, "epoch": 673} {"train_loss": -38.11882019042969, "global_step": 81515, "epoch": 673} {"train_loss": -37.4345817565918, "global_step": 81516, "epoch": 673} {"train_loss": -37.584693908691406, "global_step": 81517, "epoch": 673} {"train_loss": -38.1956901550293, "global_step": 81518, "epoch": 673} {"train_loss": -38.0548210144043, "global_step": 81519, "epoch": 673} {"train_loss": -37.66615676879883, "global_step": 81520, "epoch": 673} {"train_loss": -38.049015045166016, "global_step": 81521, "epoch": 673} {"train_loss": -37.80684280395508, "global_step": 81522, "epoch": 673} {"train_loss": -37.218936920166016, "global_step": 81523, "epoch": 673} {"train_loss": -37.580360412597656, "global_step": 81524, "epoch": 673} {"train_loss": -38.21657180786133, "global_step": 81525, "epoch": 673} {"train_loss": -37.80908203125, "global_step": 81526, "epoch": 673} {"train_loss": -34.83579635620117, "global_step": 81527, "epoch": 673} {"train_loss": -32.9620475769043, "global_step": 81528, "epoch": 673} {"train_loss": -31.560468673706055, "global_step": 81529, "epoch": 673} {"train_loss": -37.118629455566406, "global_step": 81530, "epoch": 673} {"train_loss": -35.48918533325195, "global_step": 81531, "epoch": 673} {"train_loss": -27.62554931640625, "global_step": 81532, "epoch": 673} {"train_loss": -21.627553939819336, "global_step": 81533, "epoch": 673} {"train_loss": -31.067636489868164, "global_step": 81534, "epoch": 673} {"train_loss": -36.60103988647461, "global_step": 81535, "epoch": 673} {"train_loss": -34.70322799682617, "global_step": 81536, "epoch": 673} {"train_loss": -34.80509567260742, "global_step": 81537, "epoch": 673} {"train_loss": -35.52094268798828, "global_step": 81538, "epoch": 673} {"train_loss": -33.9467887878418, "global_step": 81539, "epoch": 673} {"train_loss": -36.81196212768555, "global_step": 81540, "epoch": 673} {"train_loss": -37.15935516357422, "global_step": 81541, "epoch": 673} {"train_loss": -35.08942794799805, "global_step": 81542, "epoch": 673} {"train_loss": -36.954471588134766, "global_step": 81543, "epoch": 673} {"train_loss": -36.97214889526367, "global_step": 81544, "epoch": 673} {"train_loss": -37.1092414855957, "global_step": 81545, "epoch": 673} {"train_loss": -36.82918167114258, "global_step": 81546, "epoch": 673} {"train_loss": -37.00979232788086, "global_step": 81547, "epoch": 673} {"train_loss": -37.18192672729492, "global_step": 81548, "epoch": 673} {"train_loss": -37.325618743896484, "global_step": 81549, "epoch": 673} {"train_loss": -37.48405075073242, "global_step": 81550, "epoch": 673} {"train_loss": -37.445865631103516, "global_step": 81551, "epoch": 673} {"train_loss": -37.27195358276367, "global_step": 81552, "epoch": 673} {"train_loss": -36.5947466605951, "global_step": 81553, "epoch": 673, "val_loss": 2592870.25} {"train_loss": -37.54478073120117, "global_step": 81554, "epoch": 674} {"train_loss": -37.133705139160156, "global_step": 81555, "epoch": 674} {"train_loss": -37.77789306640625, "global_step": 81556, "epoch": 674} {"train_loss": -36.846431732177734, "global_step": 81557, "epoch": 674} {"train_loss": -37.22871017456055, "global_step": 81558, "epoch": 674} {"train_loss": -37.828182220458984, "global_step": 81559, "epoch": 674} {"train_loss": -37.044612884521484, "global_step": 81560, "epoch": 674} {"train_loss": -37.631656646728516, "global_step": 81561, "epoch": 674} {"train_loss": -37.984886169433594, "global_step": 81562, "epoch": 674} {"train_loss": -37.249507904052734, "global_step": 81563, "epoch": 674} {"train_loss": -37.802642822265625, "global_step": 81564, "epoch": 674} {"train_loss": -37.95933151245117, "global_step": 81565, "epoch": 674} {"train_loss": -37.32205581665039, "global_step": 81566, "epoch": 674} {"train_loss": -37.76041030883789, "global_step": 81567, "epoch": 674} {"train_loss": -37.88382339477539, "global_step": 81568, "epoch": 674} {"train_loss": -37.31344223022461, "global_step": 81569, "epoch": 674} {"train_loss": -37.889156341552734, "global_step": 81570, "epoch": 674} {"train_loss": -37.855690002441406, "global_step": 81571, "epoch": 674} {"train_loss": -38.12563705444336, "global_step": 81572, "epoch": 674} {"train_loss": -38.0152702331543, "global_step": 81573, "epoch": 674} {"train_loss": -37.50698471069336, "global_step": 81574, "epoch": 674} {"train_loss": -38.2287483215332, "global_step": 81575, "epoch": 674} {"train_loss": -38.040218353271484, "global_step": 81576, "epoch": 674} {"train_loss": -37.84511947631836, "global_step": 81577, "epoch": 674} {"train_loss": -38.399383544921875, "global_step": 81578, "epoch": 674} {"train_loss": -38.142513275146484, "global_step": 81579, "epoch": 674} {"train_loss": -38.238319396972656, "global_step": 81580, "epoch": 674} {"train_loss": -38.42844009399414, "global_step": 81581, "epoch": 674} {"train_loss": -38.61669158935547, "global_step": 81582, "epoch": 674} {"train_loss": -38.131404876708984, "global_step": 81583, "epoch": 674} {"train_loss": -38.32648468017578, "global_step": 81584, "epoch": 674} {"train_loss": -37.21779251098633, "global_step": 81585, "epoch": 674} {"train_loss": -37.97174072265625, "global_step": 81586, "epoch": 674} {"train_loss": -37.64406204223633, "global_step": 81587, "epoch": 674} {"train_loss": -38.30912780761719, "global_step": 81588, "epoch": 674} {"train_loss": -37.80593490600586, "global_step": 81589, "epoch": 674} {"train_loss": -37.1116828918457, "global_step": 81590, "epoch": 674} {"train_loss": -38.12164306640625, "global_step": 81591, "epoch": 674} {"train_loss": -37.118934631347656, "global_step": 81592, "epoch": 674} {"train_loss": -36.150489807128906, "global_step": 81593, "epoch": 674} {"train_loss": -34.5948600769043, "global_step": 81594, "epoch": 674} {"train_loss": -34.15000534057617, "global_step": 81595, "epoch": 674} {"train_loss": -34.77435302734375, "global_step": 81596, "epoch": 674} {"train_loss": -37.42531967163086, "global_step": 81597, "epoch": 674} {"train_loss": -36.6224250793457, "global_step": 81598, "epoch": 674} {"train_loss": -36.16246032714844, "global_step": 81599, "epoch": 674} {"train_loss": -36.3565559387207, "global_step": 81600, "epoch": 674} {"train_loss": -36.944705963134766, "global_step": 81601, "epoch": 674} {"train_loss": -37.113338470458984, "global_step": 81602, "epoch": 674} {"train_loss": -37.33304977416992, "global_step": 81603, "epoch": 674} {"train_loss": -37.478118896484375, "global_step": 81604, "epoch": 674} {"train_loss": -34.23823165893555, "global_step": 81605, "epoch": 674} {"train_loss": -36.94222640991211, "global_step": 81606, "epoch": 674} {"train_loss": -37.699615478515625, "global_step": 81607, "epoch": 674} {"train_loss": -37.32613754272461, "global_step": 81608, "epoch": 674} {"train_loss": -35.840938568115234, "global_step": 81609, "epoch": 674} {"train_loss": -38.150665283203125, "global_step": 81610, "epoch": 674} {"train_loss": -37.55719757080078, "global_step": 81611, "epoch": 674} {"train_loss": -31.768186569213867, "global_step": 81612, "epoch": 674} {"train_loss": -36.62788009643555, "global_step": 81613, "epoch": 674} {"train_loss": -37.22280502319336, "global_step": 81614, "epoch": 674} {"train_loss": -33.403045654296875, "global_step": 81615, "epoch": 674} {"train_loss": -33.545867919921875, "global_step": 81616, "epoch": 674} {"train_loss": -33.8040885925293, "global_step": 81617, "epoch": 674} {"train_loss": -36.685462951660156, "global_step": 81618, "epoch": 674} {"train_loss": -34.11541748046875, "global_step": 81619, "epoch": 674} {"train_loss": -36.38983154296875, "global_step": 81620, "epoch": 674} {"train_loss": -36.37958908081055, "global_step": 81621, "epoch": 674} {"train_loss": -36.4527587890625, "global_step": 81622, "epoch": 674} {"train_loss": -33.319271087646484, "global_step": 81623, "epoch": 674} {"train_loss": -33.05270004272461, "global_step": 81624, "epoch": 674} {"train_loss": -36.445465087890625, "global_step": 81625, "epoch": 674} {"train_loss": -36.198665618896484, "global_step": 81626, "epoch": 674} {"train_loss": -31.642608642578125, "global_step": 81627, "epoch": 674} {"train_loss": -36.178558349609375, "global_step": 81628, "epoch": 674} {"train_loss": -35.734249114990234, "global_step": 81629, "epoch": 674} {"train_loss": -35.42452621459961, "global_step": 81630, "epoch": 674} {"train_loss": -35.71950912475586, "global_step": 81631, "epoch": 674} {"train_loss": -32.53572082519531, "global_step": 81632, "epoch": 674} {"train_loss": -34.42536544799805, "global_step": 81633, "epoch": 674} {"train_loss": -35.75956726074219, "global_step": 81634, "epoch": 674} {"train_loss": -36.38682174682617, "global_step": 81635, "epoch": 674} {"train_loss": -35.113460540771484, "global_step": 81636, "epoch": 674} {"train_loss": -36.133724212646484, "global_step": 81637, "epoch": 674} {"train_loss": -35.509090423583984, "global_step": 81638, "epoch": 674} {"train_loss": -35.8006706237793, "global_step": 81639, "epoch": 674} {"train_loss": -36.14164352416992, "global_step": 81640, "epoch": 674} {"train_loss": -35.25338363647461, "global_step": 81641, "epoch": 674} {"train_loss": -35.99695587158203, "global_step": 81642, "epoch": 674} {"train_loss": -35.63912582397461, "global_step": 81643, "epoch": 674} {"train_loss": -36.09290313720703, "global_step": 81644, "epoch": 674} {"train_loss": -35.76621627807617, "global_step": 81645, "epoch": 674} {"train_loss": -36.64889144897461, "global_step": 81646, "epoch": 674} {"train_loss": -36.675628662109375, "global_step": 81647, "epoch": 674} {"train_loss": -36.33103561401367, "global_step": 81648, "epoch": 674} {"train_loss": -36.54024124145508, "global_step": 81649, "epoch": 674} {"train_loss": -36.263031005859375, "global_step": 81650, "epoch": 674} {"train_loss": -36.60953903198242, "global_step": 81651, "epoch": 674} {"train_loss": -35.747169494628906, "global_step": 81652, "epoch": 674} {"train_loss": -36.48521041870117, "global_step": 81653, "epoch": 674} {"train_loss": -34.91642379760742, "global_step": 81654, "epoch": 674} {"train_loss": -36.19232940673828, "global_step": 81655, "epoch": 674} {"train_loss": -36.78239059448242, "global_step": 81656, "epoch": 674} {"train_loss": -36.66537094116211, "global_step": 81657, "epoch": 674} {"train_loss": -37.047969818115234, "global_step": 81658, "epoch": 674} {"train_loss": -36.79730224609375, "global_step": 81659, "epoch": 674} {"train_loss": -37.142879486083984, "global_step": 81660, "epoch": 674} {"train_loss": -37.16469955444336, "global_step": 81661, "epoch": 674} {"train_loss": -37.119239807128906, "global_step": 81662, "epoch": 674} {"train_loss": -36.39466094970703, "global_step": 81663, "epoch": 674} {"train_loss": -37.15322494506836, "global_step": 81664, "epoch": 674} {"train_loss": -36.86629104614258, "global_step": 81665, "epoch": 674} {"train_loss": -37.00675582885742, "global_step": 81666, "epoch": 674} {"train_loss": -36.580684661865234, "global_step": 81667, "epoch": 674} {"train_loss": -37.384307861328125, "global_step": 81668, "epoch": 674} {"train_loss": -36.49164962768555, "global_step": 81669, "epoch": 674} {"train_loss": -35.743629455566406, "global_step": 81670, "epoch": 674} {"train_loss": -36.9334716796875, "global_step": 81671, "epoch": 674} {"train_loss": -36.54299545288086, "global_step": 81672, "epoch": 674} {"train_loss": -37.463260650634766, "global_step": 81673, "epoch": 674} {"train_loss": -36.57410990502223, "global_step": 81674, "epoch": 674, "val_loss": 2671719.75} {"train_loss": -37.412322998046875, "global_step": 81675, "epoch": 675} {"train_loss": -37.2044677734375, "global_step": 81676, "epoch": 675} {"train_loss": -36.37369918823242, "global_step": 81677, "epoch": 675} {"train_loss": -36.84225082397461, "global_step": 81678, "epoch": 675} {"train_loss": -37.205055236816406, "global_step": 81679, "epoch": 675} {"train_loss": -36.8829345703125, "global_step": 81680, "epoch": 675} {"train_loss": -37.34595489501953, "global_step": 81681, "epoch": 675} {"train_loss": -37.7577018737793, "global_step": 81682, "epoch": 675} {"train_loss": -37.142704010009766, "global_step": 81683, "epoch": 675} {"train_loss": -37.49515914916992, "global_step": 81684, "epoch": 675} {"train_loss": -37.53559112548828, "global_step": 81685, "epoch": 675} {"train_loss": -37.50937271118164, "global_step": 81686, "epoch": 675} {"train_loss": -36.90331268310547, "global_step": 81687, "epoch": 675} {"train_loss": -38.10356521606445, "global_step": 81688, "epoch": 675} {"train_loss": -36.29548645019531, "global_step": 81689, "epoch": 675} {"train_loss": -36.96433639526367, "global_step": 81690, "epoch": 675} {"train_loss": -37.6766471862793, "global_step": 81691, "epoch": 675} {"train_loss": -37.58143997192383, "global_step": 81692, "epoch": 675} {"train_loss": -36.97400665283203, "global_step": 81693, "epoch": 675} {"train_loss": -36.69926071166992, "global_step": 81694, "epoch": 675} {"train_loss": -37.0078125, "global_step": 81695, "epoch": 675} {"train_loss": -37.40922927856445, "global_step": 81696, "epoch": 675} {"train_loss": -37.523128509521484, "global_step": 81697, "epoch": 675} {"train_loss": -33.760433197021484, "global_step": 81698, "epoch": 675} {"train_loss": -30.236806869506836, "global_step": 81699, "epoch": 675} {"train_loss": -28.896215438842773, "global_step": 81700, "epoch": 675} {"train_loss": -30.396921157836914, "global_step": 81701, "epoch": 675} {"train_loss": -35.721282958984375, "global_step": 81702, "epoch": 675} {"train_loss": -35.47372055053711, "global_step": 81703, "epoch": 675} {"train_loss": -32.246578216552734, "global_step": 81704, "epoch": 675} {"train_loss": -34.9119758605957, "global_step": 81705, "epoch": 675} {"train_loss": -35.5106086730957, "global_step": 81706, "epoch": 675} {"train_loss": -35.38749313354492, "global_step": 81707, "epoch": 675} {"train_loss": -35.19386672973633, "global_step": 81708, "epoch": 675} {"train_loss": -36.85758590698242, "global_step": 81709, "epoch": 675} {"train_loss": -33.79052734375, "global_step": 81710, "epoch": 675} {"train_loss": -37.14547348022461, "global_step": 81711, "epoch": 675} {"train_loss": -36.38931655883789, "global_step": 81712, "epoch": 675} {"train_loss": -36.882137298583984, "global_step": 81713, "epoch": 675} {"train_loss": -36.90057373046875, "global_step": 81714, "epoch": 675} {"train_loss": -36.60036087036133, "global_step": 81715, "epoch": 675} {"train_loss": -37.3248405456543, "global_step": 81716, "epoch": 675} {"train_loss": -36.9959716796875, "global_step": 81717, "epoch": 675} {"train_loss": -37.59771728515625, "global_step": 81718, "epoch": 675} {"train_loss": -37.03473663330078, "global_step": 81719, "epoch": 675} {"train_loss": -37.65803909301758, "global_step": 81720, "epoch": 675} {"train_loss": -37.035133361816406, "global_step": 81721, "epoch": 675} {"train_loss": -37.645015716552734, "global_step": 81722, "epoch": 675} {"train_loss": -37.37093734741211, "global_step": 81723, "epoch": 675} {"train_loss": -37.052162170410156, "global_step": 81724, "epoch": 675} {"train_loss": -37.200923919677734, "global_step": 81725, "epoch": 675} {"train_loss": -38.408042907714844, "global_step": 81726, "epoch": 675} {"train_loss": -37.75246047973633, "global_step": 81727, "epoch": 675} {"train_loss": -38.14162826538086, "global_step": 81728, "epoch": 675} {"train_loss": -37.83677291870117, "global_step": 81729, "epoch": 675} {"train_loss": -37.961429595947266, "global_step": 81730, "epoch": 675} {"train_loss": -37.685970306396484, "global_step": 81731, "epoch": 675} {"train_loss": -37.93364334106445, "global_step": 81732, "epoch": 675} {"train_loss": -37.727447509765625, "global_step": 81733, "epoch": 675} {"train_loss": -37.5405387878418, "global_step": 81734, "epoch": 675} {"train_loss": -37.53505325317383, "global_step": 81735, "epoch": 675} {"train_loss": -38.148311614990234, "global_step": 81736, "epoch": 675} {"train_loss": -37.52200698852539, "global_step": 81737, "epoch": 675} {"train_loss": -38.0173225402832, "global_step": 81738, "epoch": 675} {"train_loss": -37.97148513793945, "global_step": 81739, "epoch": 675} {"train_loss": -37.61420440673828, "global_step": 81740, "epoch": 675} {"train_loss": -38.220455169677734, "global_step": 81741, "epoch": 675} {"train_loss": -38.17216873168945, "global_step": 81742, "epoch": 675} {"train_loss": -38.440059661865234, "global_step": 81743, "epoch": 675} {"train_loss": -38.63620376586914, "global_step": 81744, "epoch": 675} {"train_loss": -38.470603942871094, "global_step": 81745, "epoch": 675} {"train_loss": -38.537471771240234, "global_step": 81746, "epoch": 675} {"train_loss": -37.52170944213867, "global_step": 81747, "epoch": 675} {"train_loss": -38.270469665527344, "global_step": 81748, "epoch": 675} {"train_loss": -37.8194580078125, "global_step": 81749, "epoch": 675} {"train_loss": -37.66372299194336, "global_step": 81750, "epoch": 675} {"train_loss": -37.87335205078125, "global_step": 81751, "epoch": 675} {"train_loss": -38.23553466796875, "global_step": 81752, "epoch": 675} {"train_loss": -37.81877517700195, "global_step": 81753, "epoch": 675} {"train_loss": -38.48637771606445, "global_step": 81754, "epoch": 675} {"train_loss": -37.53955078125, "global_step": 81755, "epoch": 675} {"train_loss": -36.95929718017578, "global_step": 81756, "epoch": 675} {"train_loss": -37.586341857910156, "global_step": 81757, "epoch": 675} {"train_loss": -37.671058654785156, "global_step": 81758, "epoch": 675} {"train_loss": -38.307899475097656, "global_step": 81759, "epoch": 675} {"train_loss": -38.411659240722656, "global_step": 81760, "epoch": 675} {"train_loss": -37.85526657104492, "global_step": 81761, "epoch": 675} {"train_loss": -38.0010871887207, "global_step": 81762, "epoch": 675} {"train_loss": -37.6499137878418, "global_step": 81763, "epoch": 675} {"train_loss": -37.36591720581055, "global_step": 81764, "epoch": 675} {"train_loss": -37.935787200927734, "global_step": 81765, "epoch": 675} {"train_loss": -38.02796173095703, "global_step": 81766, "epoch": 675} {"train_loss": -37.883949279785156, "global_step": 81767, "epoch": 675} {"train_loss": -37.8760986328125, "global_step": 81768, "epoch": 675} {"train_loss": -38.15784454345703, "global_step": 81769, "epoch": 675} {"train_loss": -36.641292572021484, "global_step": 81770, "epoch": 675} {"train_loss": -36.747615814208984, "global_step": 81771, "epoch": 675} {"train_loss": -38.068809509277344, "global_step": 81772, "epoch": 675} {"train_loss": -38.14918899536133, "global_step": 81773, "epoch": 675} {"train_loss": -37.75104904174805, "global_step": 81774, "epoch": 675} {"train_loss": -37.9043083190918, "global_step": 81775, "epoch": 675} {"train_loss": -38.3947639465332, "global_step": 81776, "epoch": 675} {"train_loss": -37.26716232299805, "global_step": 81777, "epoch": 675} {"train_loss": -35.912776947021484, "global_step": 81778, "epoch": 675} {"train_loss": -35.59749221801758, "global_step": 81779, "epoch": 675} {"train_loss": -37.0173454284668, "global_step": 81780, "epoch": 675} {"train_loss": -37.747039794921875, "global_step": 81781, "epoch": 675} {"train_loss": -36.23247146606445, "global_step": 81782, "epoch": 675} {"train_loss": -36.41665267944336, "global_step": 81783, "epoch": 675} {"train_loss": -37.825477600097656, "global_step": 81784, "epoch": 675} {"train_loss": -37.05177307128906, "global_step": 81785, "epoch": 675} {"train_loss": -36.5125846862793, "global_step": 81786, "epoch": 675} {"train_loss": -37.95119857788086, "global_step": 81787, "epoch": 675} {"train_loss": -37.84125900268555, "global_step": 81788, "epoch": 675} {"train_loss": -35.52277755737305, "global_step": 81789, "epoch": 675} {"train_loss": -35.583492279052734, "global_step": 81790, "epoch": 675} {"train_loss": -36.355831146240234, "global_step": 81791, "epoch": 675} {"train_loss": -34.36602783203125, "global_step": 81792, "epoch": 675} {"train_loss": -36.13011169433594, "global_step": 81793, "epoch": 675} {"train_loss": -37.656166076660156, "global_step": 81794, "epoch": 675} {"train_loss": -37.01137708238334, "global_step": 81795, "epoch": 675, "val_loss": 2630549.25} {"train_loss": -37.48529052734375, "global_step": 81796, "epoch": 676} {"train_loss": -36.76551818847656, "global_step": 81797, "epoch": 676} {"train_loss": -37.69602584838867, "global_step": 81798, "epoch": 676} {"train_loss": -37.516422271728516, "global_step": 81799, "epoch": 676} {"train_loss": -37.62826156616211, "global_step": 81800, "epoch": 676} {"train_loss": -34.8693733215332, "global_step": 81801, "epoch": 676} {"train_loss": -36.64002990722656, "global_step": 81802, "epoch": 676} {"train_loss": -37.49415969848633, "global_step": 81803, "epoch": 676} {"train_loss": -36.579322814941406, "global_step": 81804, "epoch": 676} {"train_loss": -36.23500442504883, "global_step": 81805, "epoch": 676} {"train_loss": -37.517765045166016, "global_step": 81806, "epoch": 676} {"train_loss": -36.46678924560547, "global_step": 81807, "epoch": 676} {"train_loss": -36.97017288208008, "global_step": 81808, "epoch": 676} {"train_loss": -37.78207015991211, "global_step": 81809, "epoch": 676} {"train_loss": -36.12384033203125, "global_step": 81810, "epoch": 676} {"train_loss": -37.0308952331543, "global_step": 81811, "epoch": 676} {"train_loss": -37.63901901245117, "global_step": 81812, "epoch": 676} {"train_loss": -36.943973541259766, "global_step": 81813, "epoch": 676} {"train_loss": -37.93439865112305, "global_step": 81814, "epoch": 676} {"train_loss": -37.308624267578125, "global_step": 81815, "epoch": 676} {"train_loss": -36.717262268066406, "global_step": 81816, "epoch": 676} {"train_loss": -37.848876953125, "global_step": 81817, "epoch": 676} {"train_loss": -37.072322845458984, "global_step": 81818, "epoch": 676} {"train_loss": -37.99507522583008, "global_step": 81819, "epoch": 676} {"train_loss": -37.4999885559082, "global_step": 81820, "epoch": 676} {"train_loss": -37.46735382080078, "global_step": 81821, "epoch": 676} {"train_loss": -37.777565002441406, "global_step": 81822, "epoch": 676} {"train_loss": -37.74077224731445, "global_step": 81823, "epoch": 676} {"train_loss": -37.77041244506836, "global_step": 81824, "epoch": 676} {"train_loss": -37.325504302978516, "global_step": 81825, "epoch": 676} {"train_loss": -37.65511703491211, "global_step": 81826, "epoch": 676} {"train_loss": -38.106224060058594, "global_step": 81827, "epoch": 676} {"train_loss": -37.7723503112793, "global_step": 81828, "epoch": 676} {"train_loss": -37.55686569213867, "global_step": 81829, "epoch": 676} {"train_loss": -37.98482131958008, "global_step": 81830, "epoch": 676} {"train_loss": -37.65473175048828, "global_step": 81831, "epoch": 676} {"train_loss": -38.525543212890625, "global_step": 81832, "epoch": 676} {"train_loss": -37.80591583251953, "global_step": 81833, "epoch": 676} {"train_loss": -37.75423812866211, "global_step": 81834, "epoch": 676} {"train_loss": -38.334747314453125, "global_step": 81835, "epoch": 676} {"train_loss": -38.0160026550293, "global_step": 81836, "epoch": 676} {"train_loss": -38.20579147338867, "global_step": 81837, "epoch": 676} {"train_loss": -38.18886184692383, "global_step": 81838, "epoch": 676} {"train_loss": -38.08869934082031, "global_step": 81839, "epoch": 676} {"train_loss": -37.58026885986328, "global_step": 81840, "epoch": 676} {"train_loss": -37.247318267822266, "global_step": 81841, "epoch": 676} {"train_loss": -37.7929801940918, "global_step": 81842, "epoch": 676} {"train_loss": -38.178199768066406, "global_step": 81843, "epoch": 676} {"train_loss": -38.501304626464844, "global_step": 81844, "epoch": 676} {"train_loss": -38.513397216796875, "global_step": 81845, "epoch": 676} {"train_loss": -37.95855712890625, "global_step": 81846, "epoch": 676} {"train_loss": -37.863975524902344, "global_step": 81847, "epoch": 676} {"train_loss": -37.78385543823242, "global_step": 81848, "epoch": 676} {"train_loss": -38.39968490600586, "global_step": 81849, "epoch": 676} {"train_loss": -34.93544387817383, "global_step": 81850, "epoch": 676} {"train_loss": -38.24787521362305, "global_step": 81851, "epoch": 676} {"train_loss": -38.308956146240234, "global_step": 81852, "epoch": 676} {"train_loss": -37.747005462646484, "global_step": 81853, "epoch": 676} {"train_loss": -38.269805908203125, "global_step": 81854, "epoch": 676} {"train_loss": -37.82253646850586, "global_step": 81855, "epoch": 676} {"train_loss": -38.20077133178711, "global_step": 81856, "epoch": 676} {"train_loss": -38.330322265625, "global_step": 81857, "epoch": 676} {"train_loss": -37.2699089050293, "global_step": 81858, "epoch": 676} {"train_loss": -33.66572952270508, "global_step": 81859, "epoch": 676} {"train_loss": -36.82151412963867, "global_step": 81860, "epoch": 676} {"train_loss": -36.4807243347168, "global_step": 81861, "epoch": 676} {"train_loss": -35.999900817871094, "global_step": 81862, "epoch": 676} {"train_loss": -35.910396575927734, "global_step": 81863, "epoch": 676} {"train_loss": -36.77716064453125, "global_step": 81864, "epoch": 676} {"train_loss": -37.518375396728516, "global_step": 81865, "epoch": 676} {"train_loss": -36.04875564575195, "global_step": 81866, "epoch": 676} {"train_loss": -35.72146224975586, "global_step": 81867, "epoch": 676} {"train_loss": -36.85575866699219, "global_step": 81868, "epoch": 676} {"train_loss": -36.633548736572266, "global_step": 81869, "epoch": 676} {"train_loss": -36.944759368896484, "global_step": 81870, "epoch": 676} {"train_loss": -36.77557373046875, "global_step": 81871, "epoch": 676} {"train_loss": -35.55910873413086, "global_step": 81872, "epoch": 676} {"train_loss": -36.87204360961914, "global_step": 81873, "epoch": 676} {"train_loss": -36.7930908203125, "global_step": 81874, "epoch": 676} {"train_loss": -37.43024444580078, "global_step": 81875, "epoch": 676} {"train_loss": -38.156715393066406, "global_step": 81876, "epoch": 676} {"train_loss": -36.56281661987305, "global_step": 81877, "epoch": 676} {"train_loss": -36.77304458618164, "global_step": 81878, "epoch": 676} {"train_loss": -36.3931884765625, "global_step": 81879, "epoch": 676} {"train_loss": -35.699398040771484, "global_step": 81880, "epoch": 676} {"train_loss": -36.738521575927734, "global_step": 81881, "epoch": 676} {"train_loss": -32.179229736328125, "global_step": 81882, "epoch": 676} {"train_loss": -35.849754333496094, "global_step": 81883, "epoch": 676} {"train_loss": -36.073787689208984, "global_step": 81884, "epoch": 676} {"train_loss": -36.365936279296875, "global_step": 81885, "epoch": 676} {"train_loss": -36.621253967285156, "global_step": 81886, "epoch": 676} {"train_loss": -35.4102783203125, "global_step": 81887, "epoch": 676} {"train_loss": -35.63576126098633, "global_step": 81888, "epoch": 676} {"train_loss": -35.65031433105469, "global_step": 81889, "epoch": 676} {"train_loss": -35.64461898803711, "global_step": 81890, "epoch": 676} {"train_loss": -37.59095001220703, "global_step": 81891, "epoch": 676} {"train_loss": -35.87710952758789, "global_step": 81892, "epoch": 676} {"train_loss": -37.640079498291016, "global_step": 81893, "epoch": 676} {"train_loss": -36.892879486083984, "global_step": 81894, "epoch": 676} {"train_loss": -37.23723220825195, "global_step": 81895, "epoch": 676} {"train_loss": -37.99079895019531, "global_step": 81896, "epoch": 676} {"train_loss": -37.33940887451172, "global_step": 81897, "epoch": 676} {"train_loss": -36.88212203979492, "global_step": 81898, "epoch": 676} {"train_loss": -37.835628509521484, "global_step": 81899, "epoch": 676} {"train_loss": -37.361019134521484, "global_step": 81900, "epoch": 676} {"train_loss": -36.114837646484375, "global_step": 81901, "epoch": 676} {"train_loss": -37.34568405151367, "global_step": 81902, "epoch": 676} {"train_loss": -37.242855072021484, "global_step": 81903, "epoch": 676} {"train_loss": -37.227054595947266, "global_step": 81904, "epoch": 676} {"train_loss": -37.36284255981445, "global_step": 81905, "epoch": 676} {"train_loss": -36.44614791870117, "global_step": 81906, "epoch": 676} {"train_loss": -37.52224349975586, "global_step": 81907, "epoch": 676} {"train_loss": -36.57088851928711, "global_step": 81908, "epoch": 676} {"train_loss": -37.75382614135742, "global_step": 81909, "epoch": 676} {"train_loss": -37.72816848754883, "global_step": 81910, "epoch": 676} {"train_loss": -37.27521514892578, "global_step": 81911, "epoch": 676} {"train_loss": -37.66189193725586, "global_step": 81912, "epoch": 676} {"train_loss": -38.16710662841797, "global_step": 81913, "epoch": 676} {"train_loss": -37.06352615356445, "global_step": 81914, "epoch": 676} {"train_loss": -37.69831466674805, "global_step": 81915, "epoch": 676} {"train_loss": -37.14781381276028, "global_step": 81916, "epoch": 676, "val_loss": 2644768.0} {"train_loss": -38.23603439331055, "global_step": 81917, "epoch": 677} {"train_loss": -38.2400016784668, "global_step": 81918, "epoch": 677} {"train_loss": -38.10478591918945, "global_step": 81919, "epoch": 677} {"train_loss": -37.27387237548828, "global_step": 81920, "epoch": 677} {"train_loss": -37.04730224609375, "global_step": 81921, "epoch": 677} {"train_loss": -37.553279876708984, "global_step": 81922, "epoch": 677} {"train_loss": -37.78420639038086, "global_step": 81923, "epoch": 677} {"train_loss": -37.3433723449707, "global_step": 81924, "epoch": 677} {"train_loss": -37.967445373535156, "global_step": 81925, "epoch": 677} {"train_loss": -36.967586517333984, "global_step": 81926, "epoch": 677} {"train_loss": -37.087242126464844, "global_step": 81927, "epoch": 677} {"train_loss": -37.062744140625, "global_step": 81928, "epoch": 677} {"train_loss": -37.014766693115234, "global_step": 81929, "epoch": 677} {"train_loss": -37.79854965209961, "global_step": 81930, "epoch": 677} {"train_loss": -37.72793197631836, "global_step": 81931, "epoch": 677} {"train_loss": -35.614749908447266, "global_step": 81932, "epoch": 677} {"train_loss": -36.28101348876953, "global_step": 81933, "epoch": 677} {"train_loss": -35.81428527832031, "global_step": 81934, "epoch": 677} {"train_loss": -36.77887725830078, "global_step": 81935, "epoch": 677} {"train_loss": -36.597450256347656, "global_step": 81936, "epoch": 677} {"train_loss": -37.180572509765625, "global_step": 81937, "epoch": 677} {"train_loss": -35.52332305908203, "global_step": 81938, "epoch": 677} {"train_loss": -29.789642333984375, "global_step": 81939, "epoch": 677} {"train_loss": -27.1834774017334, "global_step": 81940, "epoch": 677} {"train_loss": -26.379199981689453, "global_step": 81941, "epoch": 677} {"train_loss": -33.807830810546875, "global_step": 81942, "epoch": 677} {"train_loss": -34.59604263305664, "global_step": 81943, "epoch": 677} {"train_loss": -33.89444351196289, "global_step": 81944, "epoch": 677} {"train_loss": -36.02052688598633, "global_step": 81945, "epoch": 677} {"train_loss": -35.55308532714844, "global_step": 81946, "epoch": 677} {"train_loss": -36.161521911621094, "global_step": 81947, "epoch": 677} {"train_loss": -36.67299270629883, "global_step": 81948, "epoch": 677} {"train_loss": -36.47449493408203, "global_step": 81949, "epoch": 677} {"train_loss": -36.639137268066406, "global_step": 81950, "epoch": 677} {"train_loss": -37.56718444824219, "global_step": 81951, "epoch": 677} {"train_loss": -36.35129928588867, "global_step": 81952, "epoch": 677} {"train_loss": -36.570430755615234, "global_step": 81953, "epoch": 677} {"train_loss": -36.389495849609375, "global_step": 81954, "epoch": 677} {"train_loss": -37.471248626708984, "global_step": 81955, "epoch": 677} {"train_loss": -36.79557418823242, "global_step": 81956, "epoch": 677} {"train_loss": -36.5316162109375, "global_step": 81957, "epoch": 677} {"train_loss": -37.33650588989258, "global_step": 81958, "epoch": 677} {"train_loss": -37.11208724975586, "global_step": 81959, "epoch": 677} {"train_loss": -36.79733657836914, "global_step": 81960, "epoch": 677} {"train_loss": -37.51278305053711, "global_step": 81961, "epoch": 677} {"train_loss": -36.74134826660156, "global_step": 81962, "epoch": 677} {"train_loss": -37.20500564575195, "global_step": 81963, "epoch": 677} {"train_loss": -37.21282958984375, "global_step": 81964, "epoch": 677} {"train_loss": -37.096534729003906, "global_step": 81965, "epoch": 677} {"train_loss": -37.869659423828125, "global_step": 81966, "epoch": 677} {"train_loss": -37.285499572753906, "global_step": 81967, "epoch": 677} {"train_loss": -37.072265625, "global_step": 81968, "epoch": 677} {"train_loss": -37.93268966674805, "global_step": 81969, "epoch": 677} {"train_loss": -37.106292724609375, "global_step": 81970, "epoch": 677} {"train_loss": -37.52528762817383, "global_step": 81971, "epoch": 677} {"train_loss": -37.82114791870117, "global_step": 81972, "epoch": 677} {"train_loss": -37.394771575927734, "global_step": 81973, "epoch": 677} {"train_loss": -37.46889114379883, "global_step": 81974, "epoch": 677} {"train_loss": -37.36006164550781, "global_step": 81975, "epoch": 677} {"train_loss": -37.1175422668457, "global_step": 81976, "epoch": 677} {"train_loss": -37.78446578979492, "global_step": 81977, "epoch": 677} {"train_loss": -37.41892623901367, "global_step": 81978, "epoch": 677} {"train_loss": -37.943275451660156, "global_step": 81979, "epoch": 677} {"train_loss": -37.66508865356445, "global_step": 81980, "epoch": 677} {"train_loss": -38.22197341918945, "global_step": 81981, "epoch": 677} {"train_loss": -37.22264099121094, "global_step": 81982, "epoch": 677} {"train_loss": -38.15590286254883, "global_step": 81983, "epoch": 677} {"train_loss": -37.9531364440918, "global_step": 81984, "epoch": 677} {"train_loss": -37.61592102050781, "global_step": 81985, "epoch": 677} {"train_loss": -37.65085983276367, "global_step": 81986, "epoch": 677} {"train_loss": -37.35342025756836, "global_step": 81987, "epoch": 677} {"train_loss": -36.9125862121582, "global_step": 81988, "epoch": 677} {"train_loss": -38.23891830444336, "global_step": 81989, "epoch": 677} {"train_loss": -38.02851104736328, "global_step": 81990, "epoch": 677} {"train_loss": -38.278194427490234, "global_step": 81991, "epoch": 677} {"train_loss": -37.945491790771484, "global_step": 81992, "epoch": 677} {"train_loss": -36.96657943725586, "global_step": 81993, "epoch": 677} {"train_loss": -37.239967346191406, "global_step": 81994, "epoch": 677} {"train_loss": -38.217559814453125, "global_step": 81995, "epoch": 677} {"train_loss": -36.47334289550781, "global_step": 81996, "epoch": 677} {"train_loss": -35.987239837646484, "global_step": 81997, "epoch": 677} {"train_loss": -36.96504592895508, "global_step": 81998, "epoch": 677} {"train_loss": -36.35980987548828, "global_step": 81999, "epoch": 677} {"train_loss": -35.94080352783203, "global_step": 82000, "epoch": 677} {"train_loss": -37.41079330444336, "global_step": 82001, "epoch": 677} {"train_loss": -37.27147674560547, "global_step": 82002, "epoch": 677} {"train_loss": -36.11990737915039, "global_step": 82003, "epoch": 677} {"train_loss": -36.4361457824707, "global_step": 82004, "epoch": 677} {"train_loss": -34.85573959350586, "global_step": 82005, "epoch": 677} {"train_loss": -36.45258712768555, "global_step": 82006, "epoch": 677} {"train_loss": -35.83169937133789, "global_step": 82007, "epoch": 677} {"train_loss": -37.11815643310547, "global_step": 82008, "epoch": 677} {"train_loss": -36.502689361572266, "global_step": 82009, "epoch": 677} {"train_loss": -36.690223693847656, "global_step": 82010, "epoch": 677} {"train_loss": -37.76930618286133, "global_step": 82011, "epoch": 677} {"train_loss": -37.46864318847656, "global_step": 82012, "epoch": 677} {"train_loss": -36.21963119506836, "global_step": 82013, "epoch": 677} {"train_loss": -37.50638961791992, "global_step": 82014, "epoch": 677} {"train_loss": -36.67606735229492, "global_step": 82015, "epoch": 677} {"train_loss": -36.7120475769043, "global_step": 82016, "epoch": 677} {"train_loss": -37.20156478881836, "global_step": 82017, "epoch": 677} {"train_loss": -36.2760009765625, "global_step": 82018, "epoch": 677} {"train_loss": -38.12660598754883, "global_step": 82019, "epoch": 677} {"train_loss": -36.36804962158203, "global_step": 82020, "epoch": 677} {"train_loss": -37.78116226196289, "global_step": 82021, "epoch": 677} {"train_loss": -37.99019241333008, "global_step": 82022, "epoch": 677} {"train_loss": -35.055294036865234, "global_step": 82023, "epoch": 677} {"train_loss": -37.944637298583984, "global_step": 82024, "epoch": 677} {"train_loss": -37.30976104736328, "global_step": 82025, "epoch": 677} {"train_loss": -38.06277084350586, "global_step": 82026, "epoch": 677} {"train_loss": -37.31200408935547, "global_step": 82027, "epoch": 677} {"train_loss": -38.087013244628906, "global_step": 82028, "epoch": 677} {"train_loss": -37.49648666381836, "global_step": 82029, "epoch": 677} {"train_loss": -37.90082550048828, "global_step": 82030, "epoch": 677} {"train_loss": -37.01056671142578, "global_step": 82031, "epoch": 677} {"train_loss": -37.92743682861328, "global_step": 82032, "epoch": 677} {"train_loss": -37.924461364746094, "global_step": 82033, "epoch": 677} {"train_loss": -36.40469741821289, "global_step": 82034, "epoch": 677} {"train_loss": -38.01045608520508, "global_step": 82035, "epoch": 677} {"train_loss": -37.60841751098633, "global_step": 82036, "epoch": 677} {"train_loss": -36.84746184230836, "global_step": 82037, "epoch": 677, "val_loss": 2583169.5} {"train_loss": -37.9518928527832, "global_step": 82038, "epoch": 678} {"train_loss": -38.05842971801758, "global_step": 82039, "epoch": 678} {"train_loss": -38.187347412109375, "global_step": 82040, "epoch": 678} {"train_loss": -37.762664794921875, "global_step": 82041, "epoch": 678} {"train_loss": -38.56521987915039, "global_step": 82042, "epoch": 678} {"train_loss": -38.40373611450195, "global_step": 82043, "epoch": 678} {"train_loss": -38.6392822265625, "global_step": 82044, "epoch": 678} {"train_loss": -38.18559646606445, "global_step": 82045, "epoch": 678} {"train_loss": -37.856388092041016, "global_step": 82046, "epoch": 678} {"train_loss": -37.25117874145508, "global_step": 82047, "epoch": 678} {"train_loss": -38.265968322753906, "global_step": 82048, "epoch": 678} {"train_loss": -38.47727584838867, "global_step": 82049, "epoch": 678} {"train_loss": -38.0838623046875, "global_step": 82050, "epoch": 678} {"train_loss": -37.97168731689453, "global_step": 82051, "epoch": 678} {"train_loss": -38.13814926147461, "global_step": 82052, "epoch": 678} {"train_loss": -38.649288177490234, "global_step": 82053, "epoch": 678} {"train_loss": -38.8123664855957, "global_step": 82054, "epoch": 678} {"train_loss": -38.250240325927734, "global_step": 82055, "epoch": 678} {"train_loss": -38.7806396484375, "global_step": 82056, "epoch": 678} {"train_loss": -38.57626724243164, "global_step": 82057, "epoch": 678} {"train_loss": -38.790061950683594, "global_step": 82058, "epoch": 678} {"train_loss": -38.496612548828125, "global_step": 82059, "epoch": 678} {"train_loss": -38.64617919921875, "global_step": 82060, "epoch": 678} {"train_loss": -38.20847702026367, "global_step": 82061, "epoch": 678} {"train_loss": -38.10486602783203, "global_step": 82062, "epoch": 678} {"train_loss": -37.562191009521484, "global_step": 82063, "epoch": 678} {"train_loss": -38.50149917602539, "global_step": 82064, "epoch": 678} {"train_loss": -38.247337341308594, "global_step": 82065, "epoch": 678} {"train_loss": -38.662574768066406, "global_step": 82066, "epoch": 678} {"train_loss": -39.05853271484375, "global_step": 82067, "epoch": 678} {"train_loss": -38.0186882019043, "global_step": 82068, "epoch": 678} {"train_loss": -37.4922981262207, "global_step": 82069, "epoch": 678} {"train_loss": -37.80220413208008, "global_step": 82070, "epoch": 678} {"train_loss": -37.07020950317383, "global_step": 82071, "epoch": 678} {"train_loss": -37.560028076171875, "global_step": 82072, "epoch": 678} {"train_loss": -37.92823028564453, "global_step": 82073, "epoch": 678} {"train_loss": -38.40125274658203, "global_step": 82074, "epoch": 678} {"train_loss": -38.75062561035156, "global_step": 82075, "epoch": 678} {"train_loss": -38.507667541503906, "global_step": 82076, "epoch": 678} {"train_loss": -38.57817077636719, "global_step": 82077, "epoch": 678} {"train_loss": -37.649837493896484, "global_step": 82078, "epoch": 678} {"train_loss": -36.685699462890625, "global_step": 82079, "epoch": 678} {"train_loss": -36.900848388671875, "global_step": 82080, "epoch": 678} {"train_loss": -36.918209075927734, "global_step": 82081, "epoch": 678} {"train_loss": -38.20972442626953, "global_step": 82082, "epoch": 678} {"train_loss": -36.897064208984375, "global_step": 82083, "epoch": 678} {"train_loss": -34.63288497924805, "global_step": 82084, "epoch": 678} {"train_loss": -32.67458724975586, "global_step": 82085, "epoch": 678} {"train_loss": -33.87336349487305, "global_step": 82086, "epoch": 678} {"train_loss": -34.48696517944336, "global_step": 82087, "epoch": 678} {"train_loss": -37.31626510620117, "global_step": 82088, "epoch": 678} {"train_loss": -36.6534309387207, "global_step": 82089, "epoch": 678} {"train_loss": -35.971187591552734, "global_step": 82090, "epoch": 678} {"train_loss": -36.39014434814453, "global_step": 82091, "epoch": 678} {"train_loss": -37.367069244384766, "global_step": 82092, "epoch": 678} {"train_loss": -38.01152038574219, "global_step": 82093, "epoch": 678} {"train_loss": -37.19204330444336, "global_step": 82094, "epoch": 678} {"train_loss": -34.60466384887695, "global_step": 82095, "epoch": 678} {"train_loss": -34.98099136352539, "global_step": 82096, "epoch": 678} {"train_loss": -37.532325744628906, "global_step": 82097, "epoch": 678} {"train_loss": -36.480010986328125, "global_step": 82098, "epoch": 678} {"train_loss": -35.68146896362305, "global_step": 82099, "epoch": 678} {"train_loss": -36.897823333740234, "global_step": 82100, "epoch": 678} {"train_loss": -36.68130111694336, "global_step": 82101, "epoch": 678} {"train_loss": -35.28596878051758, "global_step": 82102, "epoch": 678} {"train_loss": -36.99241256713867, "global_step": 82103, "epoch": 678} {"train_loss": -37.89772415161133, "global_step": 82104, "epoch": 678} {"train_loss": -35.72174835205078, "global_step": 82105, "epoch": 678} {"train_loss": -37.57560729980469, "global_step": 82106, "epoch": 678} {"train_loss": -37.55371856689453, "global_step": 82107, "epoch": 678} {"train_loss": -36.601436614990234, "global_step": 82108, "epoch": 678} {"train_loss": -36.87578201293945, "global_step": 82109, "epoch": 678} {"train_loss": -37.76082229614258, "global_step": 82110, "epoch": 678} {"train_loss": -35.818641662597656, "global_step": 82111, "epoch": 678} {"train_loss": -37.19454574584961, "global_step": 82112, "epoch": 678} {"train_loss": -34.884456634521484, "global_step": 82113, "epoch": 678} {"train_loss": -36.56713104248047, "global_step": 82114, "epoch": 678} {"train_loss": -37.526580810546875, "global_step": 82115, "epoch": 678} {"train_loss": -35.88632583618164, "global_step": 82116, "epoch": 678} {"train_loss": -37.63574981689453, "global_step": 82117, "epoch": 678} {"train_loss": -35.989051818847656, "global_step": 82118, "epoch": 678} {"train_loss": -37.574275970458984, "global_step": 82119, "epoch": 678} {"train_loss": -37.04033279418945, "global_step": 82120, "epoch": 678} {"train_loss": -36.593631744384766, "global_step": 82121, "epoch": 678} {"train_loss": -37.91929244995117, "global_step": 82122, "epoch": 678} {"train_loss": -37.72434616088867, "global_step": 82123, "epoch": 678} {"train_loss": -33.85908889770508, "global_step": 82124, "epoch": 678} {"train_loss": -38.020294189453125, "global_step": 82125, "epoch": 678} {"train_loss": -37.80703353881836, "global_step": 82126, "epoch": 678} {"train_loss": -37.419158935546875, "global_step": 82127, "epoch": 678} {"train_loss": -37.86623764038086, "global_step": 82128, "epoch": 678} {"train_loss": -37.52517318725586, "global_step": 82129, "epoch": 678} {"train_loss": -35.61874008178711, "global_step": 82130, "epoch": 678} {"train_loss": -37.78449249267578, "global_step": 82131, "epoch": 678} {"train_loss": -37.74325180053711, "global_step": 82132, "epoch": 678} {"train_loss": -37.31500244140625, "global_step": 82133, "epoch": 678} {"train_loss": -38.54623031616211, "global_step": 82134, "epoch": 678} {"train_loss": -37.46142578125, "global_step": 82135, "epoch": 678} {"train_loss": -37.96323013305664, "global_step": 82136, "epoch": 678} {"train_loss": -37.88404083251953, "global_step": 82137, "epoch": 678} {"train_loss": -38.44077682495117, "global_step": 82138, "epoch": 678} {"train_loss": -38.158687591552734, "global_step": 82139, "epoch": 678} {"train_loss": -38.20903015136719, "global_step": 82140, "epoch": 678} {"train_loss": -37.96372604370117, "global_step": 82141, "epoch": 678} {"train_loss": -38.201988220214844, "global_step": 82142, "epoch": 678} {"train_loss": -38.04043197631836, "global_step": 82143, "epoch": 678} {"train_loss": -37.960594177246094, "global_step": 82144, "epoch": 678} {"train_loss": -37.890602111816406, "global_step": 82145, "epoch": 678} {"train_loss": -37.96786117553711, "global_step": 82146, "epoch": 678} {"train_loss": -36.71904373168945, "global_step": 82147, "epoch": 678} {"train_loss": -37.518653869628906, "global_step": 82148, "epoch": 678} {"train_loss": -36.44355010986328, "global_step": 82149, "epoch": 678} {"train_loss": -35.32697296142578, "global_step": 82150, "epoch": 678} {"train_loss": -33.7742919921875, "global_step": 82151, "epoch": 678} {"train_loss": -34.96855163574219, "global_step": 82152, "epoch": 678} {"train_loss": -37.990386962890625, "global_step": 82153, "epoch": 678} {"train_loss": -37.22235870361328, "global_step": 82154, "epoch": 678} {"train_loss": -35.87240219116211, "global_step": 82155, "epoch": 678} {"train_loss": -36.10213088989258, "global_step": 82156, "epoch": 678} {"train_loss": -38.23826217651367, "global_step": 82157, "epoch": 678} {"train_loss": -37.302114565510394, "global_step": 82158, "epoch": 678, "val_loss": 2613147.75} {"train_loss": -36.88090896606445, "global_step": 82159, "epoch": 679} {"train_loss": -37.403926849365234, "global_step": 82160, "epoch": 679} {"train_loss": -37.92957305908203, "global_step": 82161, "epoch": 679} {"train_loss": -38.161556243896484, "global_step": 82162, "epoch": 679} {"train_loss": -37.089271545410156, "global_step": 82163, "epoch": 679} {"train_loss": -37.29104995727539, "global_step": 82164, "epoch": 679} {"train_loss": -37.0762825012207, "global_step": 82165, "epoch": 679} {"train_loss": -38.1740837097168, "global_step": 82166, "epoch": 679} {"train_loss": -37.780364990234375, "global_step": 82167, "epoch": 679} {"train_loss": -37.260162353515625, "global_step": 82168, "epoch": 679} {"train_loss": -38.276771545410156, "global_step": 82169, "epoch": 679} {"train_loss": -36.84587860107422, "global_step": 82170, "epoch": 679} {"train_loss": -37.24638748168945, "global_step": 82171, "epoch": 679} {"train_loss": -37.36971664428711, "global_step": 82172, "epoch": 679} {"train_loss": -37.78084945678711, "global_step": 82173, "epoch": 679} {"train_loss": -37.840816497802734, "global_step": 82174, "epoch": 679} {"train_loss": -37.695125579833984, "global_step": 82175, "epoch": 679} {"train_loss": -37.840728759765625, "global_step": 82176, "epoch": 679} {"train_loss": -36.85634231567383, "global_step": 82177, "epoch": 679} {"train_loss": -37.656063079833984, "global_step": 82178, "epoch": 679} {"train_loss": -36.795833587646484, "global_step": 82179, "epoch": 679} {"train_loss": -38.1296501159668, "global_step": 82180, "epoch": 679} {"train_loss": -38.008331298828125, "global_step": 82181, "epoch": 679} {"train_loss": -37.553157806396484, "global_step": 82182, "epoch": 679} {"train_loss": -37.46682357788086, "global_step": 82183, "epoch": 679} {"train_loss": -37.47361373901367, "global_step": 82184, "epoch": 679} {"train_loss": -38.396240234375, "global_step": 82185, "epoch": 679} {"train_loss": -37.3001823425293, "global_step": 82186, "epoch": 679} {"train_loss": -37.48956298828125, "global_step": 82187, "epoch": 679} {"train_loss": -36.54660415649414, "global_step": 82188, "epoch": 679} {"train_loss": -37.54249954223633, "global_step": 82189, "epoch": 679} {"train_loss": -36.895626068115234, "global_step": 82190, "epoch": 679} {"train_loss": -37.14309310913086, "global_step": 82191, "epoch": 679} {"train_loss": -38.58208465576172, "global_step": 82192, "epoch": 679} {"train_loss": -36.32017135620117, "global_step": 82193, "epoch": 679} {"train_loss": -37.51508331298828, "global_step": 82194, "epoch": 679} {"train_loss": -36.23991394042969, "global_step": 82195, "epoch": 679} {"train_loss": -36.7062873840332, "global_step": 82196, "epoch": 679} {"train_loss": -37.459144592285156, "global_step": 82197, "epoch": 679} {"train_loss": -36.401580810546875, "global_step": 82198, "epoch": 679} {"train_loss": -37.85344696044922, "global_step": 82199, "epoch": 679} {"train_loss": -37.1081657409668, "global_step": 82200, "epoch": 679} {"train_loss": -35.53181076049805, "global_step": 82201, "epoch": 679} {"train_loss": -36.24494552612305, "global_step": 82202, "epoch": 679} {"train_loss": -37.08925247192383, "global_step": 82203, "epoch": 679} {"train_loss": -33.14815902709961, "global_step": 82204, "epoch": 679} {"train_loss": -37.015804290771484, "global_step": 82205, "epoch": 679} {"train_loss": -37.0728645324707, "global_step": 82206, "epoch": 679} {"train_loss": -37.861148834228516, "global_step": 82207, "epoch": 679} {"train_loss": -35.60255813598633, "global_step": 82208, "epoch": 679} {"train_loss": -37.85349655151367, "global_step": 82209, "epoch": 679} {"train_loss": -36.49021530151367, "global_step": 82210, "epoch": 679} {"train_loss": -37.36711502075195, "global_step": 82211, "epoch": 679} {"train_loss": -36.8848991394043, "global_step": 82212, "epoch": 679} {"train_loss": -38.26797103881836, "global_step": 82213, "epoch": 679} {"train_loss": -36.75898361206055, "global_step": 82214, "epoch": 679} {"train_loss": -37.8016357421875, "global_step": 82215, "epoch": 679} {"train_loss": -37.04179000854492, "global_step": 82216, "epoch": 679} {"train_loss": -38.03554153442383, "global_step": 82217, "epoch": 679} {"train_loss": -37.80316925048828, "global_step": 82218, "epoch": 679} {"train_loss": -37.576515197753906, "global_step": 82219, "epoch": 679} {"train_loss": -38.06671142578125, "global_step": 82220, "epoch": 679} {"train_loss": -38.348079681396484, "global_step": 82221, "epoch": 679} {"train_loss": -37.63943099975586, "global_step": 82222, "epoch": 679} {"train_loss": -37.741127014160156, "global_step": 82223, "epoch": 679} {"train_loss": -37.2447509765625, "global_step": 82224, "epoch": 679} {"train_loss": -37.693233489990234, "global_step": 82225, "epoch": 679} {"train_loss": -37.518306732177734, "global_step": 82226, "epoch": 679} {"train_loss": -37.295562744140625, "global_step": 82227, "epoch": 679} {"train_loss": -37.11858367919922, "global_step": 82228, "epoch": 679} {"train_loss": -37.89175033569336, "global_step": 82229, "epoch": 679} {"train_loss": -37.554927825927734, "global_step": 82230, "epoch": 679} {"train_loss": -35.710140228271484, "global_step": 82231, "epoch": 679} {"train_loss": -36.7552375793457, "global_step": 82232, "epoch": 679} {"train_loss": -37.72607421875, "global_step": 82233, "epoch": 679} {"train_loss": -38.003875732421875, "global_step": 82234, "epoch": 679} {"train_loss": -36.63532638549805, "global_step": 82235, "epoch": 679} {"train_loss": -33.136837005615234, "global_step": 82236, "epoch": 679} {"train_loss": -38.367591857910156, "global_step": 82237, "epoch": 679} {"train_loss": -36.06952667236328, "global_step": 82238, "epoch": 679} {"train_loss": -34.261756896972656, "global_step": 82239, "epoch": 679} {"train_loss": -38.114192962646484, "global_step": 82240, "epoch": 679} {"train_loss": -36.621986389160156, "global_step": 82241, "epoch": 679} {"train_loss": -30.6505126953125, "global_step": 82242, "epoch": 679} {"train_loss": -35.873023986816406, "global_step": 82243, "epoch": 679} {"train_loss": -35.50886154174805, "global_step": 82244, "epoch": 679} {"train_loss": -32.630035400390625, "global_step": 82245, "epoch": 679} {"train_loss": -36.25714111328125, "global_step": 82246, "epoch": 679} {"train_loss": -33.84012985229492, "global_step": 82247, "epoch": 679} {"train_loss": -33.154640197753906, "global_step": 82248, "epoch": 679} {"train_loss": -34.51993942260742, "global_step": 82249, "epoch": 679} {"train_loss": -36.08000183105469, "global_step": 82250, "epoch": 679} {"train_loss": -35.41884994506836, "global_step": 82251, "epoch": 679} {"train_loss": -34.05323028564453, "global_step": 82252, "epoch": 679} {"train_loss": -36.16103744506836, "global_step": 82253, "epoch": 679} {"train_loss": -35.17822265625, "global_step": 82254, "epoch": 679} {"train_loss": -36.939022064208984, "global_step": 82255, "epoch": 679} {"train_loss": -36.013343811035156, "global_step": 82256, "epoch": 679} {"train_loss": -35.88265609741211, "global_step": 82257, "epoch": 679} {"train_loss": -35.8667106628418, "global_step": 82258, "epoch": 679} {"train_loss": -37.308292388916016, "global_step": 82259, "epoch": 679} {"train_loss": -35.794185638427734, "global_step": 82260, "epoch": 679} {"train_loss": -36.80977249145508, "global_step": 82261, "epoch": 679} {"train_loss": -34.1125373840332, "global_step": 82262, "epoch": 679} {"train_loss": -35.22554397583008, "global_step": 82263, "epoch": 679} {"train_loss": -37.0746955871582, "global_step": 82264, "epoch": 679} {"train_loss": -35.833091735839844, "global_step": 82265, "epoch": 679} {"train_loss": -36.018531799316406, "global_step": 82266, "epoch": 679} {"train_loss": -36.162742614746094, "global_step": 82267, "epoch": 679} {"train_loss": -35.847686767578125, "global_step": 82268, "epoch": 679} {"train_loss": -36.896305084228516, "global_step": 82269, "epoch": 679} {"train_loss": -36.58747482299805, "global_step": 82270, "epoch": 679} {"train_loss": -37.22279739379883, "global_step": 82271, "epoch": 679} {"train_loss": -36.880218505859375, "global_step": 82272, "epoch": 679} {"train_loss": -36.75226593017578, "global_step": 82273, "epoch": 679} {"train_loss": -36.403621673583984, "global_step": 82274, "epoch": 679} {"train_loss": -37.09263229370117, "global_step": 82275, "epoch": 679} {"train_loss": -37.535308837890625, "global_step": 82276, "epoch": 679} {"train_loss": -36.190528869628906, "global_step": 82277, "epoch": 679} {"train_loss": -37.32190704345703, "global_step": 82278, "epoch": 679} {"train_loss": -36.74143436526464, "global_step": 82279, "epoch": 679, "val_loss": 2864630.75} {"train_loss": -37.404911041259766, "global_step": 82280, "epoch": 680} {"train_loss": -37.819435119628906, "global_step": 82281, "epoch": 680} {"train_loss": -37.078407287597656, "global_step": 82282, "epoch": 680} {"train_loss": -37.61063003540039, "global_step": 82283, "epoch": 680} {"train_loss": -36.18706130981445, "global_step": 82284, "epoch": 680} {"train_loss": -34.792083740234375, "global_step": 82285, "epoch": 680} {"train_loss": -37.026283264160156, "global_step": 82286, "epoch": 680} {"train_loss": -36.719520568847656, "global_step": 82287, "epoch": 680} {"train_loss": -36.72944641113281, "global_step": 82288, "epoch": 680} {"train_loss": -35.699214935302734, "global_step": 82289, "epoch": 680} {"train_loss": -36.958351135253906, "global_step": 82290, "epoch": 680} {"train_loss": -36.5166130065918, "global_step": 82291, "epoch": 680} {"train_loss": -37.322628021240234, "global_step": 82292, "epoch": 680} {"train_loss": -36.57257080078125, "global_step": 82293, "epoch": 680} {"train_loss": -36.52283477783203, "global_step": 82294, "epoch": 680} {"train_loss": -36.62089920043945, "global_step": 82295, "epoch": 680} {"train_loss": -36.64797592163086, "global_step": 82296, "epoch": 680} {"train_loss": -36.309173583984375, "global_step": 82297, "epoch": 680} {"train_loss": -37.16178894042969, "global_step": 82298, "epoch": 680} {"train_loss": -37.12584686279297, "global_step": 82299, "epoch": 680} {"train_loss": -37.80140686035156, "global_step": 82300, "epoch": 680} {"train_loss": -37.057071685791016, "global_step": 82301, "epoch": 680} {"train_loss": -37.65298080444336, "global_step": 82302, "epoch": 680} {"train_loss": -36.0357551574707, "global_step": 82303, "epoch": 680} {"train_loss": -37.16866683959961, "global_step": 82304, "epoch": 680} {"train_loss": -37.84828567504883, "global_step": 82305, "epoch": 680} {"train_loss": -37.601478576660156, "global_step": 82306, "epoch": 680} {"train_loss": -36.317928314208984, "global_step": 82307, "epoch": 680} {"train_loss": -37.197059631347656, "global_step": 82308, "epoch": 680} {"train_loss": -37.69670486450195, "global_step": 82309, "epoch": 680} {"train_loss": -37.79597091674805, "global_step": 82310, "epoch": 680} {"train_loss": -37.96273422241211, "global_step": 82311, "epoch": 680} {"train_loss": -37.795257568359375, "global_step": 82312, "epoch": 680} {"train_loss": -37.27425765991211, "global_step": 82313, "epoch": 680} {"train_loss": -36.91859817504883, "global_step": 82314, "epoch": 680} {"train_loss": -37.946205139160156, "global_step": 82315, "epoch": 680} {"train_loss": -37.86749267578125, "global_step": 82316, "epoch": 680} {"train_loss": -37.9374885559082, "global_step": 82317, "epoch": 680} {"train_loss": -37.562049865722656, "global_step": 82318, "epoch": 680} {"train_loss": -37.7867431640625, "global_step": 82319, "epoch": 680} {"train_loss": -38.04213333129883, "global_step": 82320, "epoch": 680} {"train_loss": -37.81080627441406, "global_step": 82321, "epoch": 680} {"train_loss": -38.27935791015625, "global_step": 82322, "epoch": 680} {"train_loss": -37.2087287902832, "global_step": 82323, "epoch": 680} {"train_loss": -37.75059127807617, "global_step": 82324, "epoch": 680} {"train_loss": -37.56992721557617, "global_step": 82325, "epoch": 680} {"train_loss": -35.91964340209961, "global_step": 82326, "epoch": 680} {"train_loss": -35.22886276245117, "global_step": 82327, "epoch": 680} {"train_loss": -37.05121994018555, "global_step": 82328, "epoch": 680} {"train_loss": -38.017024993896484, "global_step": 82329, "epoch": 680} {"train_loss": -38.5108757019043, "global_step": 82330, "epoch": 680} {"train_loss": -38.146331787109375, "global_step": 82331, "epoch": 680} {"train_loss": -37.549530029296875, "global_step": 82332, "epoch": 680} {"train_loss": -36.467010498046875, "global_step": 82333, "epoch": 680} {"train_loss": -35.5006217956543, "global_step": 82334, "epoch": 680} {"train_loss": -37.43461227416992, "global_step": 82335, "epoch": 680} {"train_loss": -37.1209831237793, "global_step": 82336, "epoch": 680} {"train_loss": -38.42572784423828, "global_step": 82337, "epoch": 680} {"train_loss": -38.325130462646484, "global_step": 82338, "epoch": 680} {"train_loss": -37.47035217285156, "global_step": 82339, "epoch": 680} {"train_loss": -37.413734436035156, "global_step": 82340, "epoch": 680} {"train_loss": -38.107826232910156, "global_step": 82341, "epoch": 680} {"train_loss": -38.3093376159668, "global_step": 82342, "epoch": 680} {"train_loss": -35.3165168762207, "global_step": 82343, "epoch": 680} {"train_loss": -36.64107131958008, "global_step": 82344, "epoch": 680} {"train_loss": -37.636138916015625, "global_step": 82345, "epoch": 680} {"train_loss": -37.568580627441406, "global_step": 82346, "epoch": 680} {"train_loss": -37.21479034423828, "global_step": 82347, "epoch": 680} {"train_loss": -37.49662399291992, "global_step": 82348, "epoch": 680} {"train_loss": -37.583595275878906, "global_step": 82349, "epoch": 680} {"train_loss": -36.83449935913086, "global_step": 82350, "epoch": 680} {"train_loss": -32.282955169677734, "global_step": 82351, "epoch": 680} {"train_loss": -29.43204116821289, "global_step": 82352, "epoch": 680} {"train_loss": -36.910911560058594, "global_step": 82353, "epoch": 680} {"train_loss": -34.44797897338867, "global_step": 82354, "epoch": 680} {"train_loss": -37.57235336303711, "global_step": 82355, "epoch": 680} {"train_loss": -34.01604080200195, "global_step": 82356, "epoch": 680} {"train_loss": -38.22180938720703, "global_step": 82357, "epoch": 680} {"train_loss": -36.20241928100586, "global_step": 82358, "epoch": 680} {"train_loss": -37.045875549316406, "global_step": 82359, "epoch": 680} {"train_loss": -37.384700775146484, "global_step": 82360, "epoch": 680} {"train_loss": -37.047725677490234, "global_step": 82361, "epoch": 680} {"train_loss": -37.6615104675293, "global_step": 82362, "epoch": 680} {"train_loss": -36.77108383178711, "global_step": 82363, "epoch": 680} {"train_loss": -37.16422653198242, "global_step": 82364, "epoch": 680} {"train_loss": -37.98003005981445, "global_step": 82365, "epoch": 680} {"train_loss": -37.60134506225586, "global_step": 82366, "epoch": 680} {"train_loss": -36.42770004272461, "global_step": 82367, "epoch": 680} {"train_loss": -37.48064041137695, "global_step": 82368, "epoch": 680} {"train_loss": -37.83650588989258, "global_step": 82369, "epoch": 680} {"train_loss": -36.6363410949707, "global_step": 82370, "epoch": 680} {"train_loss": -37.828243255615234, "global_step": 82371, "epoch": 680} {"train_loss": -37.74447250366211, "global_step": 82372, "epoch": 680} {"train_loss": -37.910274505615234, "global_step": 82373, "epoch": 680} {"train_loss": -38.63054275512695, "global_step": 82374, "epoch": 680} {"train_loss": -38.40220260620117, "global_step": 82375, "epoch": 680} {"train_loss": -37.50197982788086, "global_step": 82376, "epoch": 680} {"train_loss": -36.64577865600586, "global_step": 82377, "epoch": 680} {"train_loss": -37.81264114379883, "global_step": 82378, "epoch": 680} {"train_loss": -36.75146484375, "global_step": 82379, "epoch": 680} {"train_loss": -37.83375930786133, "global_step": 82380, "epoch": 680} {"train_loss": -37.569095611572266, "global_step": 82381, "epoch": 680} {"train_loss": -37.20625686645508, "global_step": 82382, "epoch": 680} {"train_loss": -37.0407600402832, "global_step": 82383, "epoch": 680} {"train_loss": -37.815185546875, "global_step": 82384, "epoch": 680} {"train_loss": -37.39381408691406, "global_step": 82385, "epoch": 680} {"train_loss": -38.17902755737305, "global_step": 82386, "epoch": 680} {"train_loss": -37.60596466064453, "global_step": 82387, "epoch": 680} {"train_loss": -37.6026496887207, "global_step": 82388, "epoch": 680} {"train_loss": -38.324790954589844, "global_step": 82389, "epoch": 680} {"train_loss": -35.916481018066406, "global_step": 82390, "epoch": 680} {"train_loss": -37.26905059814453, "global_step": 82391, "epoch": 680} {"train_loss": -37.00277328491211, "global_step": 82392, "epoch": 680} {"train_loss": -37.63627624511719, "global_step": 82393, "epoch": 680} {"train_loss": -36.53879928588867, "global_step": 82394, "epoch": 680} {"train_loss": -37.626102447509766, "global_step": 82395, "epoch": 680} {"train_loss": -37.844573974609375, "global_step": 82396, "epoch": 680} {"train_loss": -36.64366912841797, "global_step": 82397, "epoch": 680} {"train_loss": -36.93525314331055, "global_step": 82398, "epoch": 680} {"train_loss": -35.77688217163086, "global_step": 82399, "epoch": 680} {"train_loss": -37.1209937797105, "global_step": 82400, "epoch": 680, "val_loss": 2693364.25} {"train_loss": -36.5355339050293, "global_step": 82401, "epoch": 681} {"train_loss": -37.421897888183594, "global_step": 82402, "epoch": 681} {"train_loss": -37.987667083740234, "global_step": 82403, "epoch": 681} {"train_loss": -36.786354064941406, "global_step": 82404, "epoch": 681} {"train_loss": -35.00651931762695, "global_step": 82405, "epoch": 681} {"train_loss": -35.619781494140625, "global_step": 82406, "epoch": 681} {"train_loss": -37.46266555786133, "global_step": 82407, "epoch": 681} {"train_loss": -36.01727294921875, "global_step": 82408, "epoch": 681} {"train_loss": -37.27449035644531, "global_step": 82409, "epoch": 681} {"train_loss": -38.3325309753418, "global_step": 82410, "epoch": 681} {"train_loss": -37.54123306274414, "global_step": 82411, "epoch": 681} {"train_loss": -36.5648193359375, "global_step": 82412, "epoch": 681} {"train_loss": -36.5223388671875, "global_step": 82413, "epoch": 681} {"train_loss": -37.07709503173828, "global_step": 82414, "epoch": 681} {"train_loss": -37.018714904785156, "global_step": 82415, "epoch": 681} {"train_loss": -36.050804138183594, "global_step": 82416, "epoch": 681} {"train_loss": -36.5856819152832, "global_step": 82417, "epoch": 681} {"train_loss": -35.902774810791016, "global_step": 82418, "epoch": 681} {"train_loss": -36.57316589355469, "global_step": 82419, "epoch": 681} {"train_loss": -36.920692443847656, "global_step": 82420, "epoch": 681} {"train_loss": -38.305599212646484, "global_step": 82421, "epoch": 681} {"train_loss": -36.34446334838867, "global_step": 82422, "epoch": 681} {"train_loss": -35.738399505615234, "global_step": 82423, "epoch": 681} {"train_loss": -30.82638931274414, "global_step": 82424, "epoch": 681} {"train_loss": -37.48225021362305, "global_step": 82425, "epoch": 681} {"train_loss": -33.9837532043457, "global_step": 82426, "epoch": 681} {"train_loss": -17.225120544433594, "global_step": 82427, "epoch": 681} {"train_loss": -33.54664993286133, "global_step": 82428, "epoch": 681} {"train_loss": -33.5732307434082, "global_step": 82429, "epoch": 681} {"train_loss": -27.771448135375977, "global_step": 82430, "epoch": 681} {"train_loss": -36.04591369628906, "global_step": 82431, "epoch": 681} {"train_loss": -31.9389705657959, "global_step": 82432, "epoch": 681} {"train_loss": -28.257596969604492, "global_step": 82433, "epoch": 681} {"train_loss": -33.97739791870117, "global_step": 82434, "epoch": 681} {"train_loss": -31.952590942382812, "global_step": 82435, "epoch": 681} {"train_loss": -33.181793212890625, "global_step": 82436, "epoch": 681} {"train_loss": -31.535436630249023, "global_step": 82437, "epoch": 681} {"train_loss": -26.977643966674805, "global_step": 82438, "epoch": 681} {"train_loss": -29.008697509765625, "global_step": 82439, "epoch": 681} {"train_loss": -28.370840072631836, "global_step": 82440, "epoch": 681} {"train_loss": -34.12290573120117, "global_step": 82441, "epoch": 681} {"train_loss": -33.73253631591797, "global_step": 82442, "epoch": 681} {"train_loss": -33.82027816772461, "global_step": 82443, "epoch": 681} {"train_loss": -30.850250244140625, "global_step": 82444, "epoch": 681} {"train_loss": -27.81525230407715, "global_step": 82445, "epoch": 681} {"train_loss": -32.6147575378418, "global_step": 82446, "epoch": 681} {"train_loss": -33.11152267456055, "global_step": 82447, "epoch": 681} {"train_loss": -32.33349609375, "global_step": 82448, "epoch": 681} {"train_loss": -33.9730224609375, "global_step": 82449, "epoch": 681} {"train_loss": -33.85457992553711, "global_step": 82450, "epoch": 681} {"train_loss": -33.96003341674805, "global_step": 82451, "epoch": 681} {"train_loss": -33.938232421875, "global_step": 82452, "epoch": 681} {"train_loss": -33.84775924682617, "global_step": 82453, "epoch": 681} {"train_loss": -34.17653274536133, "global_step": 82454, "epoch": 681} {"train_loss": -33.57830810546875, "global_step": 82455, "epoch": 681} {"train_loss": -34.845027923583984, "global_step": 82456, "epoch": 681} {"train_loss": -33.99787521362305, "global_step": 82457, "epoch": 681} {"train_loss": -34.19839096069336, "global_step": 82458, "epoch": 681} {"train_loss": -34.91657638549805, "global_step": 82459, "epoch": 681} {"train_loss": -34.23157501220703, "global_step": 82460, "epoch": 681} {"train_loss": -34.89150619506836, "global_step": 82461, "epoch": 681} {"train_loss": -33.6258659362793, "global_step": 82462, "epoch": 681} {"train_loss": -34.430442810058594, "global_step": 82463, "epoch": 681} {"train_loss": -34.164241790771484, "global_step": 82464, "epoch": 681} {"train_loss": -33.365108489990234, "global_step": 82465, "epoch": 681} {"train_loss": -35.01839828491211, "global_step": 82466, "epoch": 681} {"train_loss": -34.6414794921875, "global_step": 82467, "epoch": 681} {"train_loss": -34.56452560424805, "global_step": 82468, "epoch": 681} {"train_loss": -35.222652435302734, "global_step": 82469, "epoch": 681} {"train_loss": -35.49677658081055, "global_step": 82470, "epoch": 681} {"train_loss": -34.53340530395508, "global_step": 82471, "epoch": 681} {"train_loss": -35.285491943359375, "global_step": 82472, "epoch": 681} {"train_loss": -35.79423141479492, "global_step": 82473, "epoch": 681} {"train_loss": -35.15060043334961, "global_step": 82474, "epoch": 681} {"train_loss": -34.7913703918457, "global_step": 82475, "epoch": 681} {"train_loss": -35.86312484741211, "global_step": 82476, "epoch": 681} {"train_loss": -35.705902099609375, "global_step": 82477, "epoch": 681} {"train_loss": -35.03841781616211, "global_step": 82478, "epoch": 681} {"train_loss": -35.484840393066406, "global_step": 82479, "epoch": 681} {"train_loss": -35.340816497802734, "global_step": 82480, "epoch": 681} {"train_loss": -36.1310920715332, "global_step": 82481, "epoch": 681} {"train_loss": -36.077247619628906, "global_step": 82482, "epoch": 681} {"train_loss": -36.25139236450195, "global_step": 82483, "epoch": 681} {"train_loss": -35.90552520751953, "global_step": 82484, "epoch": 681} {"train_loss": -35.89522933959961, "global_step": 82485, "epoch": 681} {"train_loss": -35.67372512817383, "global_step": 82486, "epoch": 681} {"train_loss": -36.233665466308594, "global_step": 82487, "epoch": 681} {"train_loss": -36.544334411621094, "global_step": 82488, "epoch": 681} {"train_loss": -35.847408294677734, "global_step": 82489, "epoch": 681} {"train_loss": -36.54172134399414, "global_step": 82490, "epoch": 681} {"train_loss": -36.335697174072266, "global_step": 82491, "epoch": 681} {"train_loss": -36.470855712890625, "global_step": 82492, "epoch": 681} {"train_loss": -36.448970794677734, "global_step": 82493, "epoch": 681} {"train_loss": -36.53652572631836, "global_step": 82494, "epoch": 681} {"train_loss": -36.790496826171875, "global_step": 82495, "epoch": 681} {"train_loss": -36.92093276977539, "global_step": 82496, "epoch": 681} {"train_loss": -36.289207458496094, "global_step": 82497, "epoch": 681} {"train_loss": -36.32769012451172, "global_step": 82498, "epoch": 681} {"train_loss": -36.56654739379883, "global_step": 82499, "epoch": 681} {"train_loss": -36.58826446533203, "global_step": 82500, "epoch": 681} {"train_loss": -36.63291931152344, "global_step": 82501, "epoch": 681} {"train_loss": -36.49298095703125, "global_step": 82502, "epoch": 681} {"train_loss": -36.90595245361328, "global_step": 82503, "epoch": 681} {"train_loss": -36.94532775878906, "global_step": 82504, "epoch": 681} {"train_loss": -37.16836166381836, "global_step": 82505, "epoch": 681} {"train_loss": -37.2747917175293, "global_step": 82506, "epoch": 681} {"train_loss": -37.10337829589844, "global_step": 82507, "epoch": 681} {"train_loss": -37.00736999511719, "global_step": 82508, "epoch": 681} {"train_loss": -37.35368347167969, "global_step": 82509, "epoch": 681} {"train_loss": -36.92144775390625, "global_step": 82510, "epoch": 681} {"train_loss": -37.575660705566406, "global_step": 82511, "epoch": 681} {"train_loss": -37.51646041870117, "global_step": 82512, "epoch": 681} {"train_loss": -37.595279693603516, "global_step": 82513, "epoch": 681} {"train_loss": -37.3360710144043, "global_step": 82514, "epoch": 681} {"train_loss": -37.192909240722656, "global_step": 82515, "epoch": 681} {"train_loss": -38.006622314453125, "global_step": 82516, "epoch": 681} {"train_loss": -38.18655014038086, "global_step": 82517, "epoch": 681} {"train_loss": -37.36176681518555, "global_step": 82518, "epoch": 681} {"train_loss": -37.56863021850586, "global_step": 82519, "epoch": 681} {"train_loss": -37.463645935058594, "global_step": 82520, "epoch": 681} {"train_loss": -35.10267892947867, "global_step": 82521, "epoch": 681, "val_loss": 2589715.25} {"train_loss": -37.43263626098633, "global_step": 82522, "epoch": 682} {"train_loss": -37.276763916015625, "global_step": 82523, "epoch": 682} {"train_loss": -36.65333938598633, "global_step": 82524, "epoch": 682} {"train_loss": -37.7702522277832, "global_step": 82525, "epoch": 682} {"train_loss": -37.17746353149414, "global_step": 82526, "epoch": 682} {"train_loss": -36.860836029052734, "global_step": 82527, "epoch": 682} {"train_loss": -37.775535583496094, "global_step": 82528, "epoch": 682} {"train_loss": -37.16792678833008, "global_step": 82529, "epoch": 682} {"train_loss": -36.72927474975586, "global_step": 82530, "epoch": 682} {"train_loss": -37.564369201660156, "global_step": 82531, "epoch": 682} {"train_loss": -37.052459716796875, "global_step": 82532, "epoch": 682} {"train_loss": -37.52970504760742, "global_step": 82533, "epoch": 682} {"train_loss": -37.72916793823242, "global_step": 82534, "epoch": 682} {"train_loss": -37.77799606323242, "global_step": 82535, "epoch": 682} {"train_loss": -37.60400390625, "global_step": 82536, "epoch": 682} {"train_loss": -37.42445373535156, "global_step": 82537, "epoch": 682} {"train_loss": -37.46969223022461, "global_step": 82538, "epoch": 682} {"train_loss": -37.59560775756836, "global_step": 82539, "epoch": 682} {"train_loss": -37.26372146606445, "global_step": 82540, "epoch": 682} {"train_loss": -36.3289680480957, "global_step": 82541, "epoch": 682} {"train_loss": -34.7005615234375, "global_step": 82542, "epoch": 682} {"train_loss": -35.66767120361328, "global_step": 82543, "epoch": 682} {"train_loss": -37.44066619873047, "global_step": 82544, "epoch": 682} {"train_loss": -37.437904357910156, "global_step": 82545, "epoch": 682} {"train_loss": -36.60920333862305, "global_step": 82546, "epoch": 682} {"train_loss": -37.4698600769043, "global_step": 82547, "epoch": 682} {"train_loss": -37.26271057128906, "global_step": 82548, "epoch": 682} {"train_loss": -37.17594909667969, "global_step": 82549, "epoch": 682} {"train_loss": -37.55760955810547, "global_step": 82550, "epoch": 682} {"train_loss": -36.34279251098633, "global_step": 82551, "epoch": 682} {"train_loss": -37.203025817871094, "global_step": 82552, "epoch": 682} {"train_loss": -38.26473617553711, "global_step": 82553, "epoch": 682} {"train_loss": -37.374759674072266, "global_step": 82554, "epoch": 682} {"train_loss": -36.19246292114258, "global_step": 82555, "epoch": 682} {"train_loss": -36.58796310424805, "global_step": 82556, "epoch": 682} {"train_loss": -37.65446090698242, "global_step": 82557, "epoch": 682} {"train_loss": -35.46897506713867, "global_step": 82558, "epoch": 682} {"train_loss": -34.327091217041016, "global_step": 82559, "epoch": 682} {"train_loss": -36.57136154174805, "global_step": 82560, "epoch": 682} {"train_loss": -37.08376693725586, "global_step": 82561, "epoch": 682} {"train_loss": -34.309391021728516, "global_step": 82562, "epoch": 682} {"train_loss": -28.083948135375977, "global_step": 82563, "epoch": 682} {"train_loss": -33.63126754760742, "global_step": 82564, "epoch": 682} {"train_loss": -36.698490142822266, "global_step": 82565, "epoch": 682} {"train_loss": -34.09150314331055, "global_step": 82566, "epoch": 682} {"train_loss": -35.893310546875, "global_step": 82567, "epoch": 682} {"train_loss": -37.2780876159668, "global_step": 82568, "epoch": 682} {"train_loss": -33.86184310913086, "global_step": 82569, "epoch": 682} {"train_loss": -35.312461853027344, "global_step": 82570, "epoch": 682} {"train_loss": -37.7093391418457, "global_step": 82571, "epoch": 682} {"train_loss": -36.676002502441406, "global_step": 82572, "epoch": 682} {"train_loss": -37.616451263427734, "global_step": 82573, "epoch": 682} {"train_loss": -37.28750991821289, "global_step": 82574, "epoch": 682} {"train_loss": -37.175575256347656, "global_step": 82575, "epoch": 682} {"train_loss": -37.26675033569336, "global_step": 82576, "epoch": 682} {"train_loss": -37.2055778503418, "global_step": 82577, "epoch": 682} {"train_loss": -37.235191345214844, "global_step": 82578, "epoch": 682} {"train_loss": -37.26678466796875, "global_step": 82579, "epoch": 682} {"train_loss": -37.407108306884766, "global_step": 82580, "epoch": 682} {"train_loss": -37.46443557739258, "global_step": 82581, "epoch": 682} {"train_loss": -37.59440612792969, "global_step": 82582, "epoch": 682} {"train_loss": -37.39204788208008, "global_step": 82583, "epoch": 682} {"train_loss": -37.25321578979492, "global_step": 82584, "epoch": 682} {"train_loss": -37.8531608581543, "global_step": 82585, "epoch": 682} {"train_loss": -38.14033126831055, "global_step": 82586, "epoch": 682} {"train_loss": -37.90559005737305, "global_step": 82587, "epoch": 682} {"train_loss": -38.130367279052734, "global_step": 82588, "epoch": 682} {"train_loss": -37.834320068359375, "global_step": 82589, "epoch": 682} {"train_loss": -37.31697463989258, "global_step": 82590, "epoch": 682} {"train_loss": -38.081512451171875, "global_step": 82591, "epoch": 682} {"train_loss": -37.54104995727539, "global_step": 82592, "epoch": 682} {"train_loss": -37.80915451049805, "global_step": 82593, "epoch": 682} {"train_loss": -37.24326705932617, "global_step": 82594, "epoch": 682} {"train_loss": -38.21044921875, "global_step": 82595, "epoch": 682} {"train_loss": -38.27103805541992, "global_step": 82596, "epoch": 682} {"train_loss": -37.68998718261719, "global_step": 82597, "epoch": 682} {"train_loss": -37.605857849121094, "global_step": 82598, "epoch": 682} {"train_loss": -37.69834518432617, "global_step": 82599, "epoch": 682} {"train_loss": -37.89356231689453, "global_step": 82600, "epoch": 682} {"train_loss": -38.15580368041992, "global_step": 82601, "epoch": 682} {"train_loss": -38.272762298583984, "global_step": 82602, "epoch": 682} {"train_loss": -38.147518157958984, "global_step": 82603, "epoch": 682} {"train_loss": -37.98039245605469, "global_step": 82604, "epoch": 682} {"train_loss": -38.346988677978516, "global_step": 82605, "epoch": 682} {"train_loss": -37.95687484741211, "global_step": 82606, "epoch": 682} {"train_loss": -38.04533004760742, "global_step": 82607, "epoch": 682} {"train_loss": -38.06771469116211, "global_step": 82608, "epoch": 682} {"train_loss": -37.77981185913086, "global_step": 82609, "epoch": 682} {"train_loss": -37.910987854003906, "global_step": 82610, "epoch": 682} {"train_loss": -38.1709098815918, "global_step": 82611, "epoch": 682} {"train_loss": -38.4645881652832, "global_step": 82612, "epoch": 682} {"train_loss": -37.912330627441406, "global_step": 82613, "epoch": 682} {"train_loss": -38.2459602355957, "global_step": 82614, "epoch": 682} {"train_loss": -38.2890625, "global_step": 82615, "epoch": 682} {"train_loss": -39.050350189208984, "global_step": 82616, "epoch": 682} {"train_loss": -38.31556701660156, "global_step": 82617, "epoch": 682} {"train_loss": -38.6043586730957, "global_step": 82618, "epoch": 682} {"train_loss": -38.467506408691406, "global_step": 82619, "epoch": 682} {"train_loss": -37.963233947753906, "global_step": 82620, "epoch": 682} {"train_loss": -38.773338317871094, "global_step": 82621, "epoch": 682} {"train_loss": -37.466854095458984, "global_step": 82622, "epoch": 682} {"train_loss": -38.31837844848633, "global_step": 82623, "epoch": 682} {"train_loss": -37.9776611328125, "global_step": 82624, "epoch": 682} {"train_loss": -37.62964630126953, "global_step": 82625, "epoch": 682} {"train_loss": -37.264862060546875, "global_step": 82626, "epoch": 682} {"train_loss": -38.5821647644043, "global_step": 82627, "epoch": 682} {"train_loss": -38.72682571411133, "global_step": 82628, "epoch": 682} {"train_loss": -37.77376174926758, "global_step": 82629, "epoch": 682} {"train_loss": -38.56127166748047, "global_step": 82630, "epoch": 682} {"train_loss": -37.558319091796875, "global_step": 82631, "epoch": 682} {"train_loss": -36.06069564819336, "global_step": 82632, "epoch": 682} {"train_loss": -34.91915512084961, "global_step": 82633, "epoch": 682} {"train_loss": -33.28392791748047, "global_step": 82634, "epoch": 682} {"train_loss": -34.36769485473633, "global_step": 82635, "epoch": 682} {"train_loss": -36.76068878173828, "global_step": 82636, "epoch": 682} {"train_loss": -37.85688400268555, "global_step": 82637, "epoch": 682} {"train_loss": -35.485469818115234, "global_step": 82638, "epoch": 682} {"train_loss": -33.02445602416992, "global_step": 82639, "epoch": 682} {"train_loss": -31.00416374206543, "global_step": 82640, "epoch": 682} {"train_loss": -36.61140823364258, "global_step": 82641, "epoch": 682} {"train_loss": -37.02508382560793, "global_step": 82642, "epoch": 682, "val_loss": 2670141.0} {"train_loss": -24.83035659790039, "global_step": 82643, "epoch": 683} {"train_loss": -31.250268936157227, "global_step": 82644, "epoch": 683} {"train_loss": -31.8409366607666, "global_step": 82645, "epoch": 683} {"train_loss": -33.04433059692383, "global_step": 82646, "epoch": 683} {"train_loss": -34.331932067871094, "global_step": 82647, "epoch": 683} {"train_loss": -30.955854415893555, "global_step": 82648, "epoch": 683} {"train_loss": -34.350643157958984, "global_step": 82649, "epoch": 683} {"train_loss": -33.323951721191406, "global_step": 82650, "epoch": 683} {"train_loss": -35.29561996459961, "global_step": 82651, "epoch": 683} {"train_loss": -35.84832763671875, "global_step": 82652, "epoch": 683} {"train_loss": -35.12190628051758, "global_step": 82653, "epoch": 683} {"train_loss": -36.855281829833984, "global_step": 82654, "epoch": 683} {"train_loss": -35.1446647644043, "global_step": 82655, "epoch": 683} {"train_loss": -36.533607482910156, "global_step": 82656, "epoch": 683} {"train_loss": -36.4532585144043, "global_step": 82657, "epoch": 683} {"train_loss": -36.72074508666992, "global_step": 82658, "epoch": 683} {"train_loss": -36.34890365600586, "global_step": 82659, "epoch": 683} {"train_loss": -36.8929557800293, "global_step": 82660, "epoch": 683} {"train_loss": -35.9810905456543, "global_step": 82661, "epoch": 683} {"train_loss": -37.23247146606445, "global_step": 82662, "epoch": 683} {"train_loss": -36.91622543334961, "global_step": 82663, "epoch": 683} {"train_loss": -37.09479904174805, "global_step": 82664, "epoch": 683} {"train_loss": -36.91072463989258, "global_step": 82665, "epoch": 683} {"train_loss": -37.080257415771484, "global_step": 82666, "epoch": 683} {"train_loss": -37.27574920654297, "global_step": 82667, "epoch": 683} {"train_loss": -37.50027084350586, "global_step": 82668, "epoch": 683} {"train_loss": -37.207271575927734, "global_step": 82669, "epoch": 683} {"train_loss": -37.53493881225586, "global_step": 82670, "epoch": 683} {"train_loss": -37.69011306762695, "global_step": 82671, "epoch": 683} {"train_loss": -37.49882125854492, "global_step": 82672, "epoch": 683} {"train_loss": -37.0177001953125, "global_step": 82673, "epoch": 683} {"train_loss": -36.1541862487793, "global_step": 82674, "epoch": 683} {"train_loss": -35.24799728393555, "global_step": 82675, "epoch": 683} {"train_loss": -37.30868148803711, "global_step": 82676, "epoch": 683} {"train_loss": -37.47736740112305, "global_step": 82677, "epoch": 683} {"train_loss": -37.55214309692383, "global_step": 82678, "epoch": 683} {"train_loss": -37.490596771240234, "global_step": 82679, "epoch": 683} {"train_loss": -37.461952209472656, "global_step": 82680, "epoch": 683} {"train_loss": -35.78046798706055, "global_step": 82681, "epoch": 683} {"train_loss": -37.483734130859375, "global_step": 82682, "epoch": 683} {"train_loss": -37.69379425048828, "global_step": 82683, "epoch": 683} {"train_loss": -37.76643371582031, "global_step": 82684, "epoch": 683} {"train_loss": -36.80542755126953, "global_step": 82685, "epoch": 683} {"train_loss": -37.78594970703125, "global_step": 82686, "epoch": 683} {"train_loss": -36.150718688964844, "global_step": 82687, "epoch": 683} {"train_loss": -37.991661071777344, "global_step": 82688, "epoch": 683} {"train_loss": -37.68104553222656, "global_step": 82689, "epoch": 683} {"train_loss": -37.7724609375, "global_step": 82690, "epoch": 683} {"train_loss": -37.17426300048828, "global_step": 82691, "epoch": 683} {"train_loss": -36.7316780090332, "global_step": 82692, "epoch": 683} {"train_loss": -37.59627914428711, "global_step": 82693, "epoch": 683} {"train_loss": -37.80869674682617, "global_step": 82694, "epoch": 683} {"train_loss": -37.07383728027344, "global_step": 82695, "epoch": 683} {"train_loss": -37.25191116333008, "global_step": 82696, "epoch": 683} {"train_loss": -37.474754333496094, "global_step": 82697, "epoch": 683} {"train_loss": -37.27713394165039, "global_step": 82698, "epoch": 683} {"train_loss": -36.81238555908203, "global_step": 82699, "epoch": 683} {"train_loss": -37.51194381713867, "global_step": 82700, "epoch": 683} {"train_loss": -37.80234909057617, "global_step": 82701, "epoch": 683} {"train_loss": -36.45943832397461, "global_step": 82702, "epoch": 683} {"train_loss": -35.68735122680664, "global_step": 82703, "epoch": 683} {"train_loss": -37.455535888671875, "global_step": 82704, "epoch": 683} {"train_loss": -37.99772262573242, "global_step": 82705, "epoch": 683} {"train_loss": -37.3565788269043, "global_step": 82706, "epoch": 683} {"train_loss": -36.05717468261719, "global_step": 82707, "epoch": 683} {"train_loss": -37.59841537475586, "global_step": 82708, "epoch": 683} {"train_loss": -38.14778518676758, "global_step": 82709, "epoch": 683} {"train_loss": -37.60451889038086, "global_step": 82710, "epoch": 683} {"train_loss": -37.06881332397461, "global_step": 82711, "epoch": 683} {"train_loss": -37.14486312866211, "global_step": 82712, "epoch": 683} {"train_loss": -36.87614440917969, "global_step": 82713, "epoch": 683} {"train_loss": -37.71894836425781, "global_step": 82714, "epoch": 683} {"train_loss": -37.079708099365234, "global_step": 82715, "epoch": 683} {"train_loss": -36.06874465942383, "global_step": 82716, "epoch": 683} {"train_loss": -33.58611297607422, "global_step": 82717, "epoch": 683} {"train_loss": -36.63048553466797, "global_step": 82718, "epoch": 683} {"train_loss": -37.458396911621094, "global_step": 82719, "epoch": 683} {"train_loss": -34.2297248840332, "global_step": 82720, "epoch": 683} {"train_loss": -36.24241256713867, "global_step": 82721, "epoch": 683} {"train_loss": -37.69416427612305, "global_step": 82722, "epoch": 683} {"train_loss": -37.156646728515625, "global_step": 82723, "epoch": 683} {"train_loss": -36.18996810913086, "global_step": 82724, "epoch": 683} {"train_loss": -37.20705795288086, "global_step": 82725, "epoch": 683} {"train_loss": -37.164390563964844, "global_step": 82726, "epoch": 683} {"train_loss": -35.33980941772461, "global_step": 82727, "epoch": 683} {"train_loss": -37.384735107421875, "global_step": 82728, "epoch": 683} {"train_loss": -36.73544692993164, "global_step": 82729, "epoch": 683} {"train_loss": -36.798397064208984, "global_step": 82730, "epoch": 683} {"train_loss": -37.021026611328125, "global_step": 82731, "epoch": 683} {"train_loss": -37.791282653808594, "global_step": 82732, "epoch": 683} {"train_loss": -36.433414459228516, "global_step": 82733, "epoch": 683} {"train_loss": -36.654884338378906, "global_step": 82734, "epoch": 683} {"train_loss": -36.36300277709961, "global_step": 82735, "epoch": 683} {"train_loss": -36.48069381713867, "global_step": 82736, "epoch": 683} {"train_loss": -34.679866790771484, "global_step": 82737, "epoch": 683} {"train_loss": -35.12681579589844, "global_step": 82738, "epoch": 683} {"train_loss": -35.45359420776367, "global_step": 82739, "epoch": 683} {"train_loss": -33.735530853271484, "global_step": 82740, "epoch": 683} {"train_loss": -35.81169128417969, "global_step": 82741, "epoch": 683} {"train_loss": -35.605567932128906, "global_step": 82742, "epoch": 683} {"train_loss": -36.40450668334961, "global_step": 82743, "epoch": 683} {"train_loss": -37.05828857421875, "global_step": 82744, "epoch": 683} {"train_loss": -35.89236068725586, "global_step": 82745, "epoch": 683} {"train_loss": -37.25225830078125, "global_step": 82746, "epoch": 683} {"train_loss": -35.59611892700195, "global_step": 82747, "epoch": 683} {"train_loss": -36.99266815185547, "global_step": 82748, "epoch": 683} {"train_loss": -36.5157470703125, "global_step": 82749, "epoch": 683} {"train_loss": -36.49489212036133, "global_step": 82750, "epoch": 683} {"train_loss": -37.443603515625, "global_step": 82751, "epoch": 683} {"train_loss": -36.67013168334961, "global_step": 82752, "epoch": 683} {"train_loss": -37.84849166870117, "global_step": 82753, "epoch": 683} {"train_loss": -37.98384475708008, "global_step": 82754, "epoch": 683} {"train_loss": -37.48087692260742, "global_step": 82755, "epoch": 683} {"train_loss": -37.43572235107422, "global_step": 82756, "epoch": 683} {"train_loss": -37.67597198486328, "global_step": 82757, "epoch": 683} {"train_loss": -38.05802536010742, "global_step": 82758, "epoch": 683} {"train_loss": -38.12569046020508, "global_step": 82759, "epoch": 683} {"train_loss": -38.146095275878906, "global_step": 82760, "epoch": 683} {"train_loss": -38.11328887939453, "global_step": 82761, "epoch": 683} {"train_loss": -38.33216094970703, "global_step": 82762, "epoch": 683} {"train_loss": -36.54238401365674, "global_step": 82763, "epoch": 683, "val_loss": 2598803.25} {"train_loss": -37.720149993896484, "global_step": 82764, "epoch": 684} {"train_loss": -37.93219757080078, "global_step": 82765, "epoch": 684} {"train_loss": -37.63727569580078, "global_step": 82766, "epoch": 684} {"train_loss": -37.925743103027344, "global_step": 82767, "epoch": 684} {"train_loss": -38.29281234741211, "global_step": 82768, "epoch": 684} {"train_loss": -37.591400146484375, "global_step": 82769, "epoch": 684} {"train_loss": -38.61147689819336, "global_step": 82770, "epoch": 684} {"train_loss": -37.95709228515625, "global_step": 82771, "epoch": 684} {"train_loss": -38.44075012207031, "global_step": 82772, "epoch": 684} {"train_loss": -38.500240325927734, "global_step": 82773, "epoch": 684} {"train_loss": -38.787506103515625, "global_step": 82774, "epoch": 684} {"train_loss": -37.8075065612793, "global_step": 82775, "epoch": 684} {"train_loss": -38.174617767333984, "global_step": 82776, "epoch": 684} {"train_loss": -38.656959533691406, "global_step": 82777, "epoch": 684} {"train_loss": -37.916378021240234, "global_step": 82778, "epoch": 684} {"train_loss": -36.50164794921875, "global_step": 82779, "epoch": 684} {"train_loss": -38.712066650390625, "global_step": 82780, "epoch": 684} {"train_loss": -34.495540618896484, "global_step": 82781, "epoch": 684} {"train_loss": -37.001708984375, "global_step": 82782, "epoch": 684} {"train_loss": -35.30984115600586, "global_step": 82783, "epoch": 684} {"train_loss": -36.0831184387207, "global_step": 82784, "epoch": 684} {"train_loss": -37.06391525268555, "global_step": 82785, "epoch": 684} {"train_loss": -34.15068435668945, "global_step": 82786, "epoch": 684} {"train_loss": -33.62410354614258, "global_step": 82787, "epoch": 684} {"train_loss": -33.61271286010742, "global_step": 82788, "epoch": 684} {"train_loss": -34.906585693359375, "global_step": 82789, "epoch": 684} {"train_loss": -34.895790100097656, "global_step": 82790, "epoch": 684} {"train_loss": -33.264556884765625, "global_step": 82791, "epoch": 684} {"train_loss": -34.94783401489258, "global_step": 82792, "epoch": 684} {"train_loss": -33.40949630737305, "global_step": 82793, "epoch": 684} {"train_loss": -33.07254409790039, "global_step": 82794, "epoch": 684} {"train_loss": -34.91108322143555, "global_step": 82795, "epoch": 684} {"train_loss": -34.04500961303711, "global_step": 82796, "epoch": 684} {"train_loss": -35.05867385864258, "global_step": 82797, "epoch": 684} {"train_loss": -34.52634048461914, "global_step": 82798, "epoch": 684} {"train_loss": -36.21645736694336, "global_step": 82799, "epoch": 684} {"train_loss": -36.09048843383789, "global_step": 82800, "epoch": 684} {"train_loss": -36.294883728027344, "global_step": 82801, "epoch": 684} {"train_loss": -36.5404052734375, "global_step": 82802, "epoch": 684} {"train_loss": -35.46535873413086, "global_step": 82803, "epoch": 684} {"train_loss": -36.31162643432617, "global_step": 82804, "epoch": 684} {"train_loss": -36.29241180419922, "global_step": 82805, "epoch": 684} {"train_loss": -36.34965515136719, "global_step": 82806, "epoch": 684} {"train_loss": -36.47538375854492, "global_step": 82807, "epoch": 684} {"train_loss": -36.95765686035156, "global_step": 82808, "epoch": 684} {"train_loss": -36.97856903076172, "global_step": 82809, "epoch": 684} {"train_loss": -36.326202392578125, "global_step": 82810, "epoch": 684} {"train_loss": -37.39548873901367, "global_step": 82811, "epoch": 684} {"train_loss": -36.64323043823242, "global_step": 82812, "epoch": 684} {"train_loss": -36.76496505737305, "global_step": 82813, "epoch": 684} {"train_loss": -36.09248352050781, "global_step": 82814, "epoch": 684} {"train_loss": -37.68775177001953, "global_step": 82815, "epoch": 684} {"train_loss": -37.33939743041992, "global_step": 82816, "epoch": 684} {"train_loss": -37.599708557128906, "global_step": 82817, "epoch": 684} {"train_loss": -36.76444625854492, "global_step": 82818, "epoch": 684} {"train_loss": -37.314971923828125, "global_step": 82819, "epoch": 684} {"train_loss": -36.80165481567383, "global_step": 82820, "epoch": 684} {"train_loss": -37.24848556518555, "global_step": 82821, "epoch": 684} {"train_loss": -38.21284103393555, "global_step": 82822, "epoch": 684} {"train_loss": -36.84467697143555, "global_step": 82823, "epoch": 684} {"train_loss": -37.355682373046875, "global_step": 82824, "epoch": 684} {"train_loss": -37.5484733581543, "global_step": 82825, "epoch": 684} {"train_loss": -37.76776885986328, "global_step": 82826, "epoch": 684} {"train_loss": -38.393409729003906, "global_step": 82827, "epoch": 684} {"train_loss": -37.53004837036133, "global_step": 82828, "epoch": 684} {"train_loss": -37.578216552734375, "global_step": 82829, "epoch": 684} {"train_loss": -37.48479080200195, "global_step": 82830, "epoch": 684} {"train_loss": -37.6258659362793, "global_step": 82831, "epoch": 684} {"train_loss": -38.15802764892578, "global_step": 82832, "epoch": 684} {"train_loss": -37.695159912109375, "global_step": 82833, "epoch": 684} {"train_loss": -37.70086669921875, "global_step": 82834, "epoch": 684} {"train_loss": -37.69674301147461, "global_step": 82835, "epoch": 684} {"train_loss": -37.846858978271484, "global_step": 82836, "epoch": 684} {"train_loss": -37.5914421081543, "global_step": 82837, "epoch": 684} {"train_loss": -37.139427185058594, "global_step": 82838, "epoch": 684} {"train_loss": -38.042327880859375, "global_step": 82839, "epoch": 684} {"train_loss": -38.035884857177734, "global_step": 82840, "epoch": 684} {"train_loss": -37.190895080566406, "global_step": 82841, "epoch": 684} {"train_loss": -38.31793212890625, "global_step": 82842, "epoch": 684} {"train_loss": -38.26478958129883, "global_step": 82843, "epoch": 684} {"train_loss": -38.06574249267578, "global_step": 82844, "epoch": 684} {"train_loss": -38.12580871582031, "global_step": 82845, "epoch": 684} {"train_loss": -37.838157653808594, "global_step": 82846, "epoch": 684} {"train_loss": -38.09046173095703, "global_step": 82847, "epoch": 684} {"train_loss": -38.09321975708008, "global_step": 82848, "epoch": 684} {"train_loss": -38.22998809814453, "global_step": 82849, "epoch": 684} {"train_loss": -38.66497802734375, "global_step": 82850, "epoch": 684} {"train_loss": -38.80286407470703, "global_step": 82851, "epoch": 684} {"train_loss": -38.066810607910156, "global_step": 82852, "epoch": 684} {"train_loss": -38.302085876464844, "global_step": 82853, "epoch": 684} {"train_loss": -38.34699249267578, "global_step": 82854, "epoch": 684} {"train_loss": -37.93486785888672, "global_step": 82855, "epoch": 684} {"train_loss": -37.85588073730469, "global_step": 82856, "epoch": 684} {"train_loss": -37.988197326660156, "global_step": 82857, "epoch": 684} {"train_loss": -38.457305908203125, "global_step": 82858, "epoch": 684} {"train_loss": -37.04636764526367, "global_step": 82859, "epoch": 684} {"train_loss": -37.56405258178711, "global_step": 82860, "epoch": 684} {"train_loss": -37.46116256713867, "global_step": 82861, "epoch": 684} {"train_loss": -37.74100875854492, "global_step": 82862, "epoch": 684} {"train_loss": -34.83766555786133, "global_step": 82863, "epoch": 684} {"train_loss": -31.913864135742188, "global_step": 82864, "epoch": 684} {"train_loss": -29.9549560546875, "global_step": 82865, "epoch": 684} {"train_loss": -32.764469146728516, "global_step": 82866, "epoch": 684} {"train_loss": -26.561307907104492, "global_step": 82867, "epoch": 684} {"train_loss": -13.63519287109375, "global_step": 82868, "epoch": 684} {"train_loss": -23.861913681030273, "global_step": 82869, "epoch": 684} {"train_loss": -19.22953224182129, "global_step": 82870, "epoch": 684} {"train_loss": -29.17917251586914, "global_step": 82871, "epoch": 684} {"train_loss": -23.158401489257812, "global_step": 82872, "epoch": 684} {"train_loss": -23.844274520874023, "global_step": 82873, "epoch": 684} {"train_loss": -27.42696189880371, "global_step": 82874, "epoch": 684} {"train_loss": -27.942977905273438, "global_step": 82875, "epoch": 684} {"train_loss": -25.29611587524414, "global_step": 82876, "epoch": 684} {"train_loss": -26.772672653198242, "global_step": 82877, "epoch": 684} {"train_loss": -29.200927734375, "global_step": 82878, "epoch": 684} {"train_loss": -28.928680419921875, "global_step": 82879, "epoch": 684} {"train_loss": -28.275991439819336, "global_step": 82880, "epoch": 684} {"train_loss": -28.920225143432617, "global_step": 82881, "epoch": 684} {"train_loss": -28.7249698638916, "global_step": 82882, "epoch": 684} {"train_loss": -29.537168502807617, "global_step": 82883, "epoch": 684} {"train_loss": -35.243152539592145, "global_step": 82884, "epoch": 684, "val_loss": 2551765.75} {"train_loss": -29.490478515625, "global_step": 82885, "epoch": 685} {"train_loss": -28.673908233642578, "global_step": 82886, "epoch": 685} {"train_loss": -29.9180908203125, "global_step": 82887, "epoch": 685} {"train_loss": -30.460926055908203, "global_step": 82888, "epoch": 685} {"train_loss": -29.63228416442871, "global_step": 82889, "epoch": 685} {"train_loss": -28.777820587158203, "global_step": 82890, "epoch": 685} {"train_loss": -30.2680606842041, "global_step": 82891, "epoch": 685} {"train_loss": -30.1564884185791, "global_step": 82892, "epoch": 685} {"train_loss": -31.205402374267578, "global_step": 82893, "epoch": 685} {"train_loss": -30.745370864868164, "global_step": 82894, "epoch": 685} {"train_loss": -31.1138916015625, "global_step": 82895, "epoch": 685} {"train_loss": -31.697250366210938, "global_step": 82896, "epoch": 685} {"train_loss": -29.572437286376953, "global_step": 82897, "epoch": 685} {"train_loss": -32.78845977783203, "global_step": 82898, "epoch": 685} {"train_loss": -31.51755142211914, "global_step": 82899, "epoch": 685} {"train_loss": -32.250308990478516, "global_step": 82900, "epoch": 685} {"train_loss": -32.62934112548828, "global_step": 82901, "epoch": 685} {"train_loss": -31.965848922729492, "global_step": 82902, "epoch": 685} {"train_loss": -32.2570915222168, "global_step": 82903, "epoch": 685} {"train_loss": -32.249794006347656, "global_step": 82904, "epoch": 685} {"train_loss": -32.98272705078125, "global_step": 82905, "epoch": 685} {"train_loss": -32.263641357421875, "global_step": 82906, "epoch": 685} {"train_loss": -32.21154022216797, "global_step": 82907, "epoch": 685} {"train_loss": -32.57982635498047, "global_step": 82908, "epoch": 685} {"train_loss": -32.96199417114258, "global_step": 82909, "epoch": 685} {"train_loss": -33.195037841796875, "global_step": 82910, "epoch": 685} {"train_loss": -32.48193359375, "global_step": 82911, "epoch": 685} {"train_loss": -33.166542053222656, "global_step": 82912, "epoch": 685} {"train_loss": -32.848934173583984, "global_step": 82913, "epoch": 685} {"train_loss": -33.246700286865234, "global_step": 82914, "epoch": 685} {"train_loss": -33.54651641845703, "global_step": 82915, "epoch": 685} {"train_loss": -33.5257682800293, "global_step": 82916, "epoch": 685} {"train_loss": -33.701412200927734, "global_step": 82917, "epoch": 685} {"train_loss": -34.36163330078125, "global_step": 82918, "epoch": 685} {"train_loss": -34.182308197021484, "global_step": 82919, "epoch": 685} {"train_loss": -33.64435577392578, "global_step": 82920, "epoch": 685} {"train_loss": -34.39640426635742, "global_step": 82921, "epoch": 685} {"train_loss": -34.38332748413086, "global_step": 82922, "epoch": 685} {"train_loss": -34.45884323120117, "global_step": 82923, "epoch": 685} {"train_loss": -34.47594451904297, "global_step": 82924, "epoch": 685} {"train_loss": -34.29122543334961, "global_step": 82925, "epoch": 685} {"train_loss": -33.547813415527344, "global_step": 82926, "epoch": 685} {"train_loss": -32.75496292114258, "global_step": 82927, "epoch": 685} {"train_loss": -31.261890411376953, "global_step": 82928, "epoch": 685} {"train_loss": -28.106473922729492, "global_step": 82929, "epoch": 685} {"train_loss": -32.7892951965332, "global_step": 82930, "epoch": 685} {"train_loss": -32.63991165161133, "global_step": 82931, "epoch": 685} {"train_loss": -32.192081451416016, "global_step": 82932, "epoch": 685} {"train_loss": -33.12223815917969, "global_step": 82933, "epoch": 685} {"train_loss": -32.26968002319336, "global_step": 82934, "epoch": 685} {"train_loss": -34.2713508605957, "global_step": 82935, "epoch": 685} {"train_loss": -32.98941421508789, "global_step": 82936, "epoch": 685} {"train_loss": -34.0555419921875, "global_step": 82937, "epoch": 685} {"train_loss": -33.4871940612793, "global_step": 82938, "epoch": 685} {"train_loss": -32.09646224975586, "global_step": 82939, "epoch": 685} {"train_loss": -34.18101119995117, "global_step": 82940, "epoch": 685} {"train_loss": -33.40079879760742, "global_step": 82941, "epoch": 685} {"train_loss": -33.62542724609375, "global_step": 82942, "epoch": 685} {"train_loss": -34.6745719909668, "global_step": 82943, "epoch": 685} {"train_loss": -34.45100402832031, "global_step": 82944, "epoch": 685} {"train_loss": -34.86642074584961, "global_step": 82945, "epoch": 685} {"train_loss": -34.56574249267578, "global_step": 82946, "epoch": 685} {"train_loss": -34.28550338745117, "global_step": 82947, "epoch": 685} {"train_loss": -34.77251052856445, "global_step": 82948, "epoch": 685} {"train_loss": -34.54539489746094, "global_step": 82949, "epoch": 685} {"train_loss": -35.479000091552734, "global_step": 82950, "epoch": 685} {"train_loss": -34.9659423828125, "global_step": 82951, "epoch": 685} {"train_loss": -34.36505889892578, "global_step": 82952, "epoch": 685} {"train_loss": -34.93667984008789, "global_step": 82953, "epoch": 685} {"train_loss": -35.458030700683594, "global_step": 82954, "epoch": 685} {"train_loss": -35.5162239074707, "global_step": 82955, "epoch": 685} {"train_loss": -35.300086975097656, "global_step": 82956, "epoch": 685} {"train_loss": -34.901424407958984, "global_step": 82957, "epoch": 685} {"train_loss": -35.04937744140625, "global_step": 82958, "epoch": 685} {"train_loss": -35.63156509399414, "global_step": 82959, "epoch": 685} {"train_loss": -35.78152847290039, "global_step": 82960, "epoch": 685} {"train_loss": -35.63816452026367, "global_step": 82961, "epoch": 685} {"train_loss": -34.77980422973633, "global_step": 82962, "epoch": 685} {"train_loss": -32.43941116333008, "global_step": 82963, "epoch": 685} {"train_loss": -31.37555503845215, "global_step": 82964, "epoch": 685} {"train_loss": -35.33543014526367, "global_step": 82965, "epoch": 685} {"train_loss": -32.18144607543945, "global_step": 82966, "epoch": 685} {"train_loss": -35.68532943725586, "global_step": 82967, "epoch": 685} {"train_loss": -34.25382995605469, "global_step": 82968, "epoch": 685} {"train_loss": -35.8380241394043, "global_step": 82969, "epoch": 685} {"train_loss": -34.19766616821289, "global_step": 82970, "epoch": 685} {"train_loss": -34.9249267578125, "global_step": 82971, "epoch": 685} {"train_loss": -34.154720306396484, "global_step": 82972, "epoch": 685} {"train_loss": -35.40605163574219, "global_step": 82973, "epoch": 685} {"train_loss": -34.87410354614258, "global_step": 82974, "epoch": 685} {"train_loss": -35.105674743652344, "global_step": 82975, "epoch": 685} {"train_loss": -33.53369140625, "global_step": 82976, "epoch": 685} {"train_loss": -33.02153015136719, "global_step": 82977, "epoch": 685} {"train_loss": -36.128170013427734, "global_step": 82978, "epoch": 685} {"train_loss": -35.556758880615234, "global_step": 82979, "epoch": 685} {"train_loss": -34.19858932495117, "global_step": 82980, "epoch": 685} {"train_loss": -34.31550216674805, "global_step": 82981, "epoch": 685} {"train_loss": -33.07295608520508, "global_step": 82982, "epoch": 685} {"train_loss": -35.59018325805664, "global_step": 82983, "epoch": 685} {"train_loss": -34.75382995605469, "global_step": 82984, "epoch": 685} {"train_loss": -34.818477630615234, "global_step": 82985, "epoch": 685} {"train_loss": -34.73160934448242, "global_step": 82986, "epoch": 685} {"train_loss": -34.381126403808594, "global_step": 82987, "epoch": 685} {"train_loss": -34.1927490234375, "global_step": 82988, "epoch": 685} {"train_loss": -35.560943603515625, "global_step": 82989, "epoch": 685} {"train_loss": -33.59622573852539, "global_step": 82990, "epoch": 685} {"train_loss": -35.212406158447266, "global_step": 82991, "epoch": 685} {"train_loss": -35.22063064575195, "global_step": 82992, "epoch": 685} {"train_loss": -35.33867645263672, "global_step": 82993, "epoch": 685} {"train_loss": -35.067806243896484, "global_step": 82994, "epoch": 685} {"train_loss": -35.02738571166992, "global_step": 82995, "epoch": 685} {"train_loss": -36.00904083251953, "global_step": 82996, "epoch": 685} {"train_loss": -35.61211395263672, "global_step": 82997, "epoch": 685} {"train_loss": -35.936458587646484, "global_step": 82998, "epoch": 685} {"train_loss": -35.50852584838867, "global_step": 82999, "epoch": 685} {"train_loss": -35.11252975463867, "global_step": 83000, "epoch": 685} {"train_loss": -35.607521057128906, "global_step": 83001, "epoch": 685} {"train_loss": -35.84049606323242, "global_step": 83002, "epoch": 685} {"train_loss": -36.091609954833984, "global_step": 83003, "epoch": 685} {"train_loss": -36.47184753417969, "global_step": 83004, "epoch": 685} {"train_loss": -33.669329477735786, "global_step": 83005, "epoch": 685, "val_loss": 2652064.75} {"train_loss": -35.573909759521484, "global_step": 83006, "epoch": 686} {"train_loss": -35.86357498168945, "global_step": 83007, "epoch": 686} {"train_loss": -36.166542053222656, "global_step": 83008, "epoch": 686} {"train_loss": -36.15504837036133, "global_step": 83009, "epoch": 686} {"train_loss": -35.5263557434082, "global_step": 83010, "epoch": 686} {"train_loss": -35.73093795776367, "global_step": 83011, "epoch": 686} {"train_loss": -35.33584213256836, "global_step": 83012, "epoch": 686} {"train_loss": -35.6768913269043, "global_step": 83013, "epoch": 686} {"train_loss": -35.505855560302734, "global_step": 83014, "epoch": 686} {"train_loss": -36.38349151611328, "global_step": 83015, "epoch": 686} {"train_loss": -36.73574447631836, "global_step": 83016, "epoch": 686} {"train_loss": -36.08555603027344, "global_step": 83017, "epoch": 686} {"train_loss": -36.03078842163086, "global_step": 83018, "epoch": 686} {"train_loss": -36.39939880371094, "global_step": 83019, "epoch": 686} {"train_loss": -36.99152374267578, "global_step": 83020, "epoch": 686} {"train_loss": -36.783416748046875, "global_step": 83021, "epoch": 686} {"train_loss": -36.841121673583984, "global_step": 83022, "epoch": 686} {"train_loss": -36.36897659301758, "global_step": 83023, "epoch": 686} {"train_loss": -36.46812057495117, "global_step": 83024, "epoch": 686} {"train_loss": -35.3587532043457, "global_step": 83025, "epoch": 686} {"train_loss": -34.708919525146484, "global_step": 83026, "epoch": 686} {"train_loss": -32.494171142578125, "global_step": 83027, "epoch": 686} {"train_loss": -30.479726791381836, "global_step": 83028, "epoch": 686} {"train_loss": -33.83088302612305, "global_step": 83029, "epoch": 686} {"train_loss": -34.376258850097656, "global_step": 83030, "epoch": 686} {"train_loss": -31.699390411376953, "global_step": 83031, "epoch": 686} {"train_loss": -35.75950241088867, "global_step": 83032, "epoch": 686} {"train_loss": -34.257930755615234, "global_step": 83033, "epoch": 686} {"train_loss": -35.87946701049805, "global_step": 83034, "epoch": 686} {"train_loss": -34.1318473815918, "global_step": 83035, "epoch": 686} {"train_loss": -35.656856536865234, "global_step": 83036, "epoch": 686} {"train_loss": -33.41366195678711, "global_step": 83037, "epoch": 686} {"train_loss": -35.71482467651367, "global_step": 83038, "epoch": 686} {"train_loss": -35.55632781982422, "global_step": 83039, "epoch": 686} {"train_loss": -34.99905776977539, "global_step": 83040, "epoch": 686} {"train_loss": -35.63500213623047, "global_step": 83041, "epoch": 686} {"train_loss": -35.63288879394531, "global_step": 83042, "epoch": 686} {"train_loss": -34.53196334838867, "global_step": 83043, "epoch": 686} {"train_loss": -34.75532150268555, "global_step": 83044, "epoch": 686} {"train_loss": -36.026947021484375, "global_step": 83045, "epoch": 686} {"train_loss": -34.5224609375, "global_step": 83046, "epoch": 686} {"train_loss": -35.7133903503418, "global_step": 83047, "epoch": 686} {"train_loss": -35.33030319213867, "global_step": 83048, "epoch": 686} {"train_loss": -35.37677001953125, "global_step": 83049, "epoch": 686} {"train_loss": -35.35118865966797, "global_step": 83050, "epoch": 686} {"train_loss": -35.37494659423828, "global_step": 83051, "epoch": 686} {"train_loss": -33.69500732421875, "global_step": 83052, "epoch": 686} {"train_loss": -36.05549621582031, "global_step": 83053, "epoch": 686} {"train_loss": -34.18466567993164, "global_step": 83054, "epoch": 686} {"train_loss": -36.061866760253906, "global_step": 83055, "epoch": 686} {"train_loss": -33.47713088989258, "global_step": 83056, "epoch": 686} {"train_loss": -35.09111785888672, "global_step": 83057, "epoch": 686} {"train_loss": -34.9744873046875, "global_step": 83058, "epoch": 686} {"train_loss": -36.11776351928711, "global_step": 83059, "epoch": 686} {"train_loss": -34.41465377807617, "global_step": 83060, "epoch": 686} {"train_loss": -34.17466354370117, "global_step": 83061, "epoch": 686} {"train_loss": -33.78676223754883, "global_step": 83062, "epoch": 686} {"train_loss": -33.34028625488281, "global_step": 83063, "epoch": 686} {"train_loss": -28.924671173095703, "global_step": 83064, "epoch": 686} {"train_loss": -28.777332305908203, "global_step": 83065, "epoch": 686} {"train_loss": -34.5450439453125, "global_step": 83066, "epoch": 686} {"train_loss": -34.90395736694336, "global_step": 83067, "epoch": 686} {"train_loss": -34.18143844604492, "global_step": 83068, "epoch": 686} {"train_loss": -35.33504104614258, "global_step": 83069, "epoch": 686} {"train_loss": -34.967403411865234, "global_step": 83070, "epoch": 686} {"train_loss": -35.79323196411133, "global_step": 83071, "epoch": 686} {"train_loss": -34.80364990234375, "global_step": 83072, "epoch": 686} {"train_loss": -35.54462814331055, "global_step": 83073, "epoch": 686} {"train_loss": -35.07011795043945, "global_step": 83074, "epoch": 686} {"train_loss": -35.72903060913086, "global_step": 83075, "epoch": 686} {"train_loss": -35.35609436035156, "global_step": 83076, "epoch": 686} {"train_loss": -35.16620635986328, "global_step": 83077, "epoch": 686} {"train_loss": -36.3299560546875, "global_step": 83078, "epoch": 686} {"train_loss": -35.88886260986328, "global_step": 83079, "epoch": 686} {"train_loss": -36.187660217285156, "global_step": 83080, "epoch": 686} {"train_loss": -35.61648941040039, "global_step": 83081, "epoch": 686} {"train_loss": -36.25680160522461, "global_step": 83082, "epoch": 686} {"train_loss": -36.165008544921875, "global_step": 83083, "epoch": 686} {"train_loss": -36.1920051574707, "global_step": 83084, "epoch": 686} {"train_loss": -36.07487106323242, "global_step": 83085, "epoch": 686} {"train_loss": -36.55561447143555, "global_step": 83086, "epoch": 686} {"train_loss": -36.78961944580078, "global_step": 83087, "epoch": 686} {"train_loss": -36.373416900634766, "global_step": 83088, "epoch": 686} {"train_loss": -36.55329132080078, "global_step": 83089, "epoch": 686} {"train_loss": -36.41811752319336, "global_step": 83090, "epoch": 686} {"train_loss": -36.75452423095703, "global_step": 83091, "epoch": 686} {"train_loss": -36.312232971191406, "global_step": 83092, "epoch": 686} {"train_loss": -37.00178909301758, "global_step": 83093, "epoch": 686} {"train_loss": -37.08236312866211, "global_step": 83094, "epoch": 686} {"train_loss": -37.2402458190918, "global_step": 83095, "epoch": 686} {"train_loss": -36.937713623046875, "global_step": 83096, "epoch": 686} {"train_loss": -37.214881896972656, "global_step": 83097, "epoch": 686} {"train_loss": -36.019039154052734, "global_step": 83098, "epoch": 686} {"train_loss": -36.881771087646484, "global_step": 83099, "epoch": 686} {"train_loss": -37.293575286865234, "global_step": 83100, "epoch": 686} {"train_loss": -36.951560974121094, "global_step": 83101, "epoch": 686} {"train_loss": -36.58760452270508, "global_step": 83102, "epoch": 686} {"train_loss": -36.73647689819336, "global_step": 83103, "epoch": 686} {"train_loss": -36.70511245727539, "global_step": 83104, "epoch": 686} {"train_loss": -36.01454162597656, "global_step": 83105, "epoch": 686} {"train_loss": -36.61818313598633, "global_step": 83106, "epoch": 686} {"train_loss": -36.937103271484375, "global_step": 83107, "epoch": 686} {"train_loss": -36.1343994140625, "global_step": 83108, "epoch": 686} {"train_loss": -34.619754791259766, "global_step": 83109, "epoch": 686} {"train_loss": -33.43552780151367, "global_step": 83110, "epoch": 686} {"train_loss": -33.53877639770508, "global_step": 83111, "epoch": 686} {"train_loss": -36.9048957824707, "global_step": 83112, "epoch": 686} {"train_loss": -33.73856735229492, "global_step": 83113, "epoch": 686} {"train_loss": -34.51222229003906, "global_step": 83114, "epoch": 686} {"train_loss": -37.210594177246094, "global_step": 83115, "epoch": 686} {"train_loss": -34.96921920776367, "global_step": 83116, "epoch": 686} {"train_loss": -36.64460372924805, "global_step": 83117, "epoch": 686} {"train_loss": -35.670379638671875, "global_step": 83118, "epoch": 686} {"train_loss": -36.78975296020508, "global_step": 83119, "epoch": 686} {"train_loss": -35.7971076965332, "global_step": 83120, "epoch": 686} {"train_loss": -36.669212341308594, "global_step": 83121, "epoch": 686} {"train_loss": -33.714664459228516, "global_step": 83122, "epoch": 686} {"train_loss": -33.86661911010742, "global_step": 83123, "epoch": 686} {"train_loss": -34.55488204956055, "global_step": 83124, "epoch": 686} {"train_loss": -35.0072135925293, "global_step": 83125, "epoch": 686} {"train_loss": -35.409151896957525, "global_step": 83126, "epoch": 686, "val_loss": 2546506.75} {"train_loss": -36.29853057861328, "global_step": 83127, "epoch": 687} {"train_loss": -35.04338455200195, "global_step": 83128, "epoch": 687} {"train_loss": -35.56397247314453, "global_step": 83129, "epoch": 687} {"train_loss": -37.02521514892578, "global_step": 83130, "epoch": 687} {"train_loss": -35.51783752441406, "global_step": 83131, "epoch": 687} {"train_loss": -36.23175811767578, "global_step": 83132, "epoch": 687} {"train_loss": -35.75753402709961, "global_step": 83133, "epoch": 687} {"train_loss": -36.17570114135742, "global_step": 83134, "epoch": 687} {"train_loss": -36.609004974365234, "global_step": 83135, "epoch": 687} {"train_loss": -36.421730041503906, "global_step": 83136, "epoch": 687} {"train_loss": -37.121726989746094, "global_step": 83137, "epoch": 687} {"train_loss": -34.98979568481445, "global_step": 83138, "epoch": 687} {"train_loss": -36.67759704589844, "global_step": 83139, "epoch": 687} {"train_loss": -36.50022888183594, "global_step": 83140, "epoch": 687} {"train_loss": -35.22805404663086, "global_step": 83141, "epoch": 687} {"train_loss": -36.70014572143555, "global_step": 83142, "epoch": 687} {"train_loss": -36.349605560302734, "global_step": 83143, "epoch": 687} {"train_loss": -35.2140998840332, "global_step": 83144, "epoch": 687} {"train_loss": -35.15460205078125, "global_step": 83145, "epoch": 687} {"train_loss": -36.30215072631836, "global_step": 83146, "epoch": 687} {"train_loss": -35.814369201660156, "global_step": 83147, "epoch": 687} {"train_loss": -37.0728759765625, "global_step": 83148, "epoch": 687} {"train_loss": -36.03275680541992, "global_step": 83149, "epoch": 687} {"train_loss": -36.006858825683594, "global_step": 83150, "epoch": 687} {"train_loss": -36.746280670166016, "global_step": 83151, "epoch": 687} {"train_loss": -36.05131149291992, "global_step": 83152, "epoch": 687} {"train_loss": -35.63839340209961, "global_step": 83153, "epoch": 687} {"train_loss": -35.53042221069336, "global_step": 83154, "epoch": 687} {"train_loss": -36.344669342041016, "global_step": 83155, "epoch": 687} {"train_loss": -36.21458053588867, "global_step": 83156, "epoch": 687} {"train_loss": -36.348609924316406, "global_step": 83157, "epoch": 687} {"train_loss": -36.73799514770508, "global_step": 83158, "epoch": 687} {"train_loss": -35.421661376953125, "global_step": 83159, "epoch": 687} {"train_loss": -36.29120635986328, "global_step": 83160, "epoch": 687} {"train_loss": -36.3537712097168, "global_step": 83161, "epoch": 687} {"train_loss": -36.0061149597168, "global_step": 83162, "epoch": 687} {"train_loss": -35.66852951049805, "global_step": 83163, "epoch": 687} {"train_loss": -36.09334945678711, "global_step": 83164, "epoch": 687} {"train_loss": -34.78927230834961, "global_step": 83165, "epoch": 687} {"train_loss": -36.00118637084961, "global_step": 83166, "epoch": 687} {"train_loss": -34.55984115600586, "global_step": 83167, "epoch": 687} {"train_loss": -33.45711898803711, "global_step": 83168, "epoch": 687} {"train_loss": -23.20857810974121, "global_step": 83169, "epoch": 687} {"train_loss": -23.237279891967773, "global_step": 83170, "epoch": 687} {"train_loss": -35.62896728515625, "global_step": 83171, "epoch": 687} {"train_loss": -30.72478675842285, "global_step": 83172, "epoch": 687} {"train_loss": -33.94261932373047, "global_step": 83173, "epoch": 687} {"train_loss": -34.48356628417969, "global_step": 83174, "epoch": 687} {"train_loss": -35.09025955200195, "global_step": 83175, "epoch": 687} {"train_loss": -35.339027404785156, "global_step": 83176, "epoch": 687} {"train_loss": -36.009315490722656, "global_step": 83177, "epoch": 687} {"train_loss": -35.081172943115234, "global_step": 83178, "epoch": 687} {"train_loss": -36.05596923828125, "global_step": 83179, "epoch": 687} {"train_loss": -34.94710922241211, "global_step": 83180, "epoch": 687} {"train_loss": -34.115203857421875, "global_step": 83181, "epoch": 687} {"train_loss": -36.54062271118164, "global_step": 83182, "epoch": 687} {"train_loss": -35.93962478637695, "global_step": 83183, "epoch": 687} {"train_loss": -36.26671600341797, "global_step": 83184, "epoch": 687} {"train_loss": -36.41135025024414, "global_step": 83185, "epoch": 687} {"train_loss": -36.169837951660156, "global_step": 83186, "epoch": 687} {"train_loss": -35.1309814453125, "global_step": 83187, "epoch": 687} {"train_loss": -34.89034652709961, "global_step": 83188, "epoch": 687} {"train_loss": -36.2275505065918, "global_step": 83189, "epoch": 687} {"train_loss": -36.010066986083984, "global_step": 83190, "epoch": 687} {"train_loss": -36.763519287109375, "global_step": 83191, "epoch": 687} {"train_loss": -36.3975944519043, "global_step": 83192, "epoch": 687} {"train_loss": -36.49814987182617, "global_step": 83193, "epoch": 687} {"train_loss": -36.799800872802734, "global_step": 83194, "epoch": 687} {"train_loss": -35.816768646240234, "global_step": 83195, "epoch": 687} {"train_loss": -35.995723724365234, "global_step": 83196, "epoch": 687} {"train_loss": -36.1536750793457, "global_step": 83197, "epoch": 687} {"train_loss": -36.17478561401367, "global_step": 83198, "epoch": 687} {"train_loss": -33.67206954956055, "global_step": 83199, "epoch": 687} {"train_loss": -36.53788375854492, "global_step": 83200, "epoch": 687} {"train_loss": -36.386470794677734, "global_step": 83201, "epoch": 687} {"train_loss": -37.018856048583984, "global_step": 83202, "epoch": 687} {"train_loss": -36.205421447753906, "global_step": 83203, "epoch": 687} {"train_loss": -35.808509826660156, "global_step": 83204, "epoch": 687} {"train_loss": -35.41109848022461, "global_step": 83205, "epoch": 687} {"train_loss": -33.95888137817383, "global_step": 83206, "epoch": 687} {"train_loss": -30.74490737915039, "global_step": 83207, "epoch": 687} {"train_loss": -30.026123046875, "global_step": 83208, "epoch": 687} {"train_loss": -35.91391372680664, "global_step": 83209, "epoch": 687} {"train_loss": -33.953792572021484, "global_step": 83210, "epoch": 687} {"train_loss": -32.448883056640625, "global_step": 83211, "epoch": 687} {"train_loss": -35.201873779296875, "global_step": 83212, "epoch": 687} {"train_loss": -31.14643669128418, "global_step": 83213, "epoch": 687} {"train_loss": -35.919429779052734, "global_step": 83214, "epoch": 687} {"train_loss": -33.37782669067383, "global_step": 83215, "epoch": 687} {"train_loss": -35.39228439331055, "global_step": 83216, "epoch": 687} {"train_loss": -34.93159866333008, "global_step": 83217, "epoch": 687} {"train_loss": -34.72564697265625, "global_step": 83218, "epoch": 687} {"train_loss": -36.61497497558594, "global_step": 83219, "epoch": 687} {"train_loss": -35.33403396606445, "global_step": 83220, "epoch": 687} {"train_loss": -35.466331481933594, "global_step": 83221, "epoch": 687} {"train_loss": -36.28359603881836, "global_step": 83222, "epoch": 687} {"train_loss": -34.58460235595703, "global_step": 83223, "epoch": 687} {"train_loss": -36.069698333740234, "global_step": 83224, "epoch": 687} {"train_loss": -35.60624313354492, "global_step": 83225, "epoch": 687} {"train_loss": -36.234230041503906, "global_step": 83226, "epoch": 687} {"train_loss": -35.70779037475586, "global_step": 83227, "epoch": 687} {"train_loss": -35.87688064575195, "global_step": 83228, "epoch": 687} {"train_loss": -35.95681381225586, "global_step": 83229, "epoch": 687} {"train_loss": -36.1444091796875, "global_step": 83230, "epoch": 687} {"train_loss": -34.73682403564453, "global_step": 83231, "epoch": 687} {"train_loss": -36.12238693237305, "global_step": 83232, "epoch": 687} {"train_loss": -36.20975112915039, "global_step": 83233, "epoch": 687} {"train_loss": -36.4033317565918, "global_step": 83234, "epoch": 687} {"train_loss": -36.49945831298828, "global_step": 83235, "epoch": 687} {"train_loss": -35.80669021606445, "global_step": 83236, "epoch": 687} {"train_loss": -34.820770263671875, "global_step": 83237, "epoch": 687} {"train_loss": -35.88541793823242, "global_step": 83238, "epoch": 687} {"train_loss": -36.269466400146484, "global_step": 83239, "epoch": 687} {"train_loss": -36.056007385253906, "global_step": 83240, "epoch": 687} {"train_loss": -36.250396728515625, "global_step": 83241, "epoch": 687} {"train_loss": -36.4119987487793, "global_step": 83242, "epoch": 687} {"train_loss": -35.975406646728516, "global_step": 83243, "epoch": 687} {"train_loss": -36.379730224609375, "global_step": 83244, "epoch": 687} {"train_loss": -36.32229232788086, "global_step": 83245, "epoch": 687} {"train_loss": -35.97401428222656, "global_step": 83246, "epoch": 687} {"train_loss": -35.393843438014514, "global_step": 83247, "epoch": 687, "val_loss": 2597700.25} {"train_loss": -32.587825775146484, "global_step": 83248, "epoch": 688} {"train_loss": -31.98101234436035, "global_step": 83249, "epoch": 688} {"train_loss": -33.9796257019043, "global_step": 83250, "epoch": 688} {"train_loss": -35.943115234375, "global_step": 83251, "epoch": 688} {"train_loss": -35.94807052612305, "global_step": 83252, "epoch": 688} {"train_loss": -35.299983978271484, "global_step": 83253, "epoch": 688} {"train_loss": -36.19437026977539, "global_step": 83254, "epoch": 688} {"train_loss": -36.039730072021484, "global_step": 83255, "epoch": 688} {"train_loss": -35.4865837097168, "global_step": 83256, "epoch": 688} {"train_loss": -36.65074157714844, "global_step": 83257, "epoch": 688} {"train_loss": -36.0714225769043, "global_step": 83258, "epoch": 688} {"train_loss": -36.99244689941406, "global_step": 83259, "epoch": 688} {"train_loss": -36.4214973449707, "global_step": 83260, "epoch": 688} {"train_loss": -36.303157806396484, "global_step": 83261, "epoch": 688} {"train_loss": -36.302730560302734, "global_step": 83262, "epoch": 688} {"train_loss": -35.750301361083984, "global_step": 83263, "epoch": 688} {"train_loss": -35.77164840698242, "global_step": 83264, "epoch": 688} {"train_loss": -36.610877990722656, "global_step": 83265, "epoch": 688} {"train_loss": -36.78650665283203, "global_step": 83266, "epoch": 688} {"train_loss": -36.272335052490234, "global_step": 83267, "epoch": 688} {"train_loss": -37.40797805786133, "global_step": 83268, "epoch": 688} {"train_loss": -37.16436767578125, "global_step": 83269, "epoch": 688} {"train_loss": -36.833736419677734, "global_step": 83270, "epoch": 688} {"train_loss": -36.51278305053711, "global_step": 83271, "epoch": 688} {"train_loss": -37.66483688354492, "global_step": 83272, "epoch": 688} {"train_loss": -37.3558464050293, "global_step": 83273, "epoch": 688} {"train_loss": -36.849525451660156, "global_step": 83274, "epoch": 688} {"train_loss": -37.42281723022461, "global_step": 83275, "epoch": 688} {"train_loss": -36.972023010253906, "global_step": 83276, "epoch": 688} {"train_loss": -36.96623611450195, "global_step": 83277, "epoch": 688} {"train_loss": -36.732017517089844, "global_step": 83278, "epoch": 688} {"train_loss": -36.581424713134766, "global_step": 83279, "epoch": 688} {"train_loss": -37.60126876831055, "global_step": 83280, "epoch": 688} {"train_loss": -37.539573669433594, "global_step": 83281, "epoch": 688} {"train_loss": -37.41860580444336, "global_step": 83282, "epoch": 688} {"train_loss": -37.18537521362305, "global_step": 83283, "epoch": 688} {"train_loss": -37.62376403808594, "global_step": 83284, "epoch": 688} {"train_loss": -37.20261001586914, "global_step": 83285, "epoch": 688} {"train_loss": -36.65481948852539, "global_step": 83286, "epoch": 688} {"train_loss": -37.162471771240234, "global_step": 83287, "epoch": 688} {"train_loss": -37.42368698120117, "global_step": 83288, "epoch": 688} {"train_loss": -36.67685317993164, "global_step": 83289, "epoch": 688} {"train_loss": -37.68095779418945, "global_step": 83290, "epoch": 688} {"train_loss": -37.08042526245117, "global_step": 83291, "epoch": 688} {"train_loss": -37.21295166015625, "global_step": 83292, "epoch": 688} {"train_loss": -35.316078186035156, "global_step": 83293, "epoch": 688} {"train_loss": -36.613277435302734, "global_step": 83294, "epoch": 688} {"train_loss": -37.009395599365234, "global_step": 83295, "epoch": 688} {"train_loss": -36.85496139526367, "global_step": 83296, "epoch": 688} {"train_loss": -37.683837890625, "global_step": 83297, "epoch": 688} {"train_loss": -37.439510345458984, "global_step": 83298, "epoch": 688} {"train_loss": -37.3489875793457, "global_step": 83299, "epoch": 688} {"train_loss": -37.256656646728516, "global_step": 83300, "epoch": 688} {"train_loss": -37.32693099975586, "global_step": 83301, "epoch": 688} {"train_loss": -37.3354606628418, "global_step": 83302, "epoch": 688} {"train_loss": -37.33469772338867, "global_step": 83303, "epoch": 688} {"train_loss": -36.59049606323242, "global_step": 83304, "epoch": 688} {"train_loss": -36.30938720703125, "global_step": 83305, "epoch": 688} {"train_loss": -36.43718338012695, "global_step": 83306, "epoch": 688} {"train_loss": -36.4477653503418, "global_step": 83307, "epoch": 688} {"train_loss": -35.87599563598633, "global_step": 83308, "epoch": 688} {"train_loss": -33.93375778198242, "global_step": 83309, "epoch": 688} {"train_loss": -35.74584197998047, "global_step": 83310, "epoch": 688} {"train_loss": -36.16400146484375, "global_step": 83311, "epoch": 688} {"train_loss": -35.3564453125, "global_step": 83312, "epoch": 688} {"train_loss": -36.50092315673828, "global_step": 83313, "epoch": 688} {"train_loss": -36.819862365722656, "global_step": 83314, "epoch": 688} {"train_loss": -33.87004852294922, "global_step": 83315, "epoch": 688} {"train_loss": -34.91899871826172, "global_step": 83316, "epoch": 688} {"train_loss": -35.68949508666992, "global_step": 83317, "epoch": 688} {"train_loss": -35.97612762451172, "global_step": 83318, "epoch": 688} {"train_loss": -35.18293380737305, "global_step": 83319, "epoch": 688} {"train_loss": -36.13339614868164, "global_step": 83320, "epoch": 688} {"train_loss": -35.74644470214844, "global_step": 83321, "epoch": 688} {"train_loss": -36.23238754272461, "global_step": 83322, "epoch": 688} {"train_loss": -36.30986404418945, "global_step": 83323, "epoch": 688} {"train_loss": -36.23627471923828, "global_step": 83324, "epoch": 688} {"train_loss": -36.66872787475586, "global_step": 83325, "epoch": 688} {"train_loss": -35.101776123046875, "global_step": 83326, "epoch": 688} {"train_loss": -36.29077911376953, "global_step": 83327, "epoch": 688} {"train_loss": -35.94748306274414, "global_step": 83328, "epoch": 688} {"train_loss": -36.7692985534668, "global_step": 83329, "epoch": 688} {"train_loss": -36.25288009643555, "global_step": 83330, "epoch": 688} {"train_loss": -35.44947052001953, "global_step": 83331, "epoch": 688} {"train_loss": -36.371376037597656, "global_step": 83332, "epoch": 688} {"train_loss": -35.99532699584961, "global_step": 83333, "epoch": 688} {"train_loss": -35.48270797729492, "global_step": 83334, "epoch": 688} {"train_loss": -35.9569206237793, "global_step": 83335, "epoch": 688} {"train_loss": -34.795570373535156, "global_step": 83336, "epoch": 688} {"train_loss": -37.30855941772461, "global_step": 83337, "epoch": 688} {"train_loss": -36.672054290771484, "global_step": 83338, "epoch": 688} {"train_loss": -36.111087799072266, "global_step": 83339, "epoch": 688} {"train_loss": -35.95888900756836, "global_step": 83340, "epoch": 688} {"train_loss": -36.22380447387695, "global_step": 83341, "epoch": 688} {"train_loss": -36.4708137512207, "global_step": 83342, "epoch": 688} {"train_loss": -36.80149841308594, "global_step": 83343, "epoch": 688} {"train_loss": -36.14842987060547, "global_step": 83344, "epoch": 688} {"train_loss": -36.95661544799805, "global_step": 83345, "epoch": 688} {"train_loss": -37.71352767944336, "global_step": 83346, "epoch": 688} {"train_loss": -36.22455978393555, "global_step": 83347, "epoch": 688} {"train_loss": -37.027462005615234, "global_step": 83348, "epoch": 688} {"train_loss": -37.04457092285156, "global_step": 83349, "epoch": 688} {"train_loss": -36.9913444519043, "global_step": 83350, "epoch": 688} {"train_loss": -37.30786895751953, "global_step": 83351, "epoch": 688} {"train_loss": -36.60506057739258, "global_step": 83352, "epoch": 688} {"train_loss": -37.09039306640625, "global_step": 83353, "epoch": 688} {"train_loss": -37.38715362548828, "global_step": 83354, "epoch": 688} {"train_loss": -37.536476135253906, "global_step": 83355, "epoch": 688} {"train_loss": -37.17474365234375, "global_step": 83356, "epoch": 688} {"train_loss": -36.54524612426758, "global_step": 83357, "epoch": 688} {"train_loss": -37.581180572509766, "global_step": 83358, "epoch": 688} {"train_loss": -37.806373596191406, "global_step": 83359, "epoch": 688} {"train_loss": -37.152278900146484, "global_step": 83360, "epoch": 688} {"train_loss": -36.9351921081543, "global_step": 83361, "epoch": 688} {"train_loss": -37.27630615234375, "global_step": 83362, "epoch": 688} {"train_loss": -37.34029769897461, "global_step": 83363, "epoch": 688} {"train_loss": -37.918819427490234, "global_step": 83364, "epoch": 688} {"train_loss": -37.19491958618164, "global_step": 83365, "epoch": 688} {"train_loss": -37.47663497924805, "global_step": 83366, "epoch": 688} {"train_loss": -37.182918548583984, "global_step": 83367, "epoch": 688} {"train_loss": -36.51738507294458, "global_step": 83368, "epoch": 688, "val_loss": 2655032.25} {"train_loss": -37.3709602355957, "global_step": 83369, "epoch": 689} {"train_loss": -37.54075622558594, "global_step": 83370, "epoch": 689} {"train_loss": -37.44804763793945, "global_step": 83371, "epoch": 689} {"train_loss": -37.475894927978516, "global_step": 83372, "epoch": 689} {"train_loss": -37.077274322509766, "global_step": 83373, "epoch": 689} {"train_loss": -35.98180389404297, "global_step": 83374, "epoch": 689} {"train_loss": -36.122718811035156, "global_step": 83375, "epoch": 689} {"train_loss": -34.870521545410156, "global_step": 83376, "epoch": 689} {"train_loss": -32.20016860961914, "global_step": 83377, "epoch": 689} {"train_loss": -33.916236877441406, "global_step": 83378, "epoch": 689} {"train_loss": -35.23677062988281, "global_step": 83379, "epoch": 689} {"train_loss": -37.59811019897461, "global_step": 83380, "epoch": 689} {"train_loss": -33.199031829833984, "global_step": 83381, "epoch": 689} {"train_loss": -32.08759689331055, "global_step": 83382, "epoch": 689} {"train_loss": -34.1111946105957, "global_step": 83383, "epoch": 689} {"train_loss": -30.553442001342773, "global_step": 83384, "epoch": 689} {"train_loss": -34.743343353271484, "global_step": 83385, "epoch": 689} {"train_loss": -33.706729888916016, "global_step": 83386, "epoch": 689} {"train_loss": -32.408836364746094, "global_step": 83387, "epoch": 689} {"train_loss": -34.040184020996094, "global_step": 83388, "epoch": 689} {"train_loss": -36.1916618347168, "global_step": 83389, "epoch": 689} {"train_loss": -34.45561599731445, "global_step": 83390, "epoch": 689} {"train_loss": -36.8531379699707, "global_step": 83391, "epoch": 689} {"train_loss": -36.52012252807617, "global_step": 83392, "epoch": 689} {"train_loss": -35.46025848388672, "global_step": 83393, "epoch": 689} {"train_loss": -35.66719436645508, "global_step": 83394, "epoch": 689} {"train_loss": -36.559974670410156, "global_step": 83395, "epoch": 689} {"train_loss": -36.882442474365234, "global_step": 83396, "epoch": 689} {"train_loss": -35.80685043334961, "global_step": 83397, "epoch": 689} {"train_loss": -36.45764923095703, "global_step": 83398, "epoch": 689} {"train_loss": -35.82078170776367, "global_step": 83399, "epoch": 689} {"train_loss": -36.65520095825195, "global_step": 83400, "epoch": 689} {"train_loss": -35.719512939453125, "global_step": 83401, "epoch": 689} {"train_loss": -36.59406280517578, "global_step": 83402, "epoch": 689} {"train_loss": -37.48910140991211, "global_step": 83403, "epoch": 689} {"train_loss": -36.72949981689453, "global_step": 83404, "epoch": 689} {"train_loss": -37.38146209716797, "global_step": 83405, "epoch": 689} {"train_loss": -37.07768630981445, "global_step": 83406, "epoch": 689} {"train_loss": -37.34344482421875, "global_step": 83407, "epoch": 689} {"train_loss": -37.24697494506836, "global_step": 83408, "epoch": 689} {"train_loss": -36.64509201049805, "global_step": 83409, "epoch": 689} {"train_loss": -37.09416580200195, "global_step": 83410, "epoch": 689} {"train_loss": -36.780208587646484, "global_step": 83411, "epoch": 689} {"train_loss": -37.43272399902344, "global_step": 83412, "epoch": 689} {"train_loss": -37.095130920410156, "global_step": 83413, "epoch": 689} {"train_loss": -37.05453109741211, "global_step": 83414, "epoch": 689} {"train_loss": -37.43616485595703, "global_step": 83415, "epoch": 689} {"train_loss": -36.928955078125, "global_step": 83416, "epoch": 689} {"train_loss": -37.039608001708984, "global_step": 83417, "epoch": 689} {"train_loss": -37.71952438354492, "global_step": 83418, "epoch": 689} {"train_loss": -37.34159469604492, "global_step": 83419, "epoch": 689} {"train_loss": -37.177127838134766, "global_step": 83420, "epoch": 689} {"train_loss": -35.37321090698242, "global_step": 83421, "epoch": 689} {"train_loss": -36.9504280090332, "global_step": 83422, "epoch": 689} {"train_loss": -37.094459533691406, "global_step": 83423, "epoch": 689} {"train_loss": -37.49467468261719, "global_step": 83424, "epoch": 689} {"train_loss": -36.82038497924805, "global_step": 83425, "epoch": 689} {"train_loss": -35.712825775146484, "global_step": 83426, "epoch": 689} {"train_loss": -36.173519134521484, "global_step": 83427, "epoch": 689} {"train_loss": -36.200008392333984, "global_step": 83428, "epoch": 689} {"train_loss": -36.06446838378906, "global_step": 83429, "epoch": 689} {"train_loss": -37.59747314453125, "global_step": 83430, "epoch": 689} {"train_loss": -36.91889572143555, "global_step": 83431, "epoch": 689} {"train_loss": -37.61350631713867, "global_step": 83432, "epoch": 689} {"train_loss": -36.90193557739258, "global_step": 83433, "epoch": 689} {"train_loss": -37.22516632080078, "global_step": 83434, "epoch": 689} {"train_loss": -37.05461502075195, "global_step": 83435, "epoch": 689} {"train_loss": -35.24674606323242, "global_step": 83436, "epoch": 689} {"train_loss": -36.049129486083984, "global_step": 83437, "epoch": 689} {"train_loss": -36.190948486328125, "global_step": 83438, "epoch": 689} {"train_loss": -37.805747985839844, "global_step": 83439, "epoch": 689} {"train_loss": -36.54527282714844, "global_step": 83440, "epoch": 689} {"train_loss": -37.513912200927734, "global_step": 83441, "epoch": 689} {"train_loss": -35.767425537109375, "global_step": 83442, "epoch": 689} {"train_loss": -36.25651931762695, "global_step": 83443, "epoch": 689} {"train_loss": -36.896846771240234, "global_step": 83444, "epoch": 689} {"train_loss": -37.58930587768555, "global_step": 83445, "epoch": 689} {"train_loss": -37.421878814697266, "global_step": 83446, "epoch": 689} {"train_loss": -35.820987701416016, "global_step": 83447, "epoch": 689} {"train_loss": -36.11444091796875, "global_step": 83448, "epoch": 689} {"train_loss": -36.929439544677734, "global_step": 83449, "epoch": 689} {"train_loss": -33.306331634521484, "global_step": 83450, "epoch": 689} {"train_loss": -36.44305419921875, "global_step": 83451, "epoch": 689} {"train_loss": -33.2296257019043, "global_step": 83452, "epoch": 689} {"train_loss": -37.21632385253906, "global_step": 83453, "epoch": 689} {"train_loss": -36.842559814453125, "global_step": 83454, "epoch": 689} {"train_loss": -33.9410400390625, "global_step": 83455, "epoch": 689} {"train_loss": -37.37038040161133, "global_step": 83456, "epoch": 689} {"train_loss": -32.40791702270508, "global_step": 83457, "epoch": 689} {"train_loss": -31.36104393005371, "global_step": 83458, "epoch": 689} {"train_loss": -35.9326286315918, "global_step": 83459, "epoch": 689} {"train_loss": -35.29671096801758, "global_step": 83460, "epoch": 689} {"train_loss": -35.48757553100586, "global_step": 83461, "epoch": 689} {"train_loss": -34.43561553955078, "global_step": 83462, "epoch": 689} {"train_loss": -31.714862823486328, "global_step": 83463, "epoch": 689} {"train_loss": -36.4039192199707, "global_step": 83464, "epoch": 689} {"train_loss": -34.59807205200195, "global_step": 83465, "epoch": 689} {"train_loss": -35.717689514160156, "global_step": 83466, "epoch": 689} {"train_loss": -35.02872848510742, "global_step": 83467, "epoch": 689} {"train_loss": -33.06643295288086, "global_step": 83468, "epoch": 689} {"train_loss": -34.60774612426758, "global_step": 83469, "epoch": 689} {"train_loss": -35.247535705566406, "global_step": 83470, "epoch": 689} {"train_loss": -36.478424072265625, "global_step": 83471, "epoch": 689} {"train_loss": -35.80316162109375, "global_step": 83472, "epoch": 689} {"train_loss": -36.11577224731445, "global_step": 83473, "epoch": 689} {"train_loss": -35.74784469604492, "global_step": 83474, "epoch": 689} {"train_loss": -36.08744812011719, "global_step": 83475, "epoch": 689} {"train_loss": -35.93624496459961, "global_step": 83476, "epoch": 689} {"train_loss": -35.81982421875, "global_step": 83477, "epoch": 689} {"train_loss": -35.27640914916992, "global_step": 83478, "epoch": 689} {"train_loss": -35.93474197387695, "global_step": 83479, "epoch": 689} {"train_loss": -35.85203552246094, "global_step": 83480, "epoch": 689} {"train_loss": -35.41238021850586, "global_step": 83481, "epoch": 689} {"train_loss": -37.03495788574219, "global_step": 83482, "epoch": 689} {"train_loss": -36.417991638183594, "global_step": 83483, "epoch": 689} {"train_loss": -36.032684326171875, "global_step": 83484, "epoch": 689} {"train_loss": -36.634178161621094, "global_step": 83485, "epoch": 689} {"train_loss": -36.74873733520508, "global_step": 83486, "epoch": 689} {"train_loss": -34.97163772583008, "global_step": 83487, "epoch": 689} {"train_loss": -36.3409538269043, "global_step": 83488, "epoch": 689} {"train_loss": -35.95190886820643, "global_step": 83489, "epoch": 689, "val_loss": 2612289.25} {"train_loss": -34.22185134887695, "global_step": 83490, "epoch": 690} {"train_loss": -35.90618133544922, "global_step": 83491, "epoch": 690} {"train_loss": -35.444759368896484, "global_step": 83492, "epoch": 690} {"train_loss": -34.037662506103516, "global_step": 83493, "epoch": 690} {"train_loss": -30.119348526000977, "global_step": 83494, "epoch": 690} {"train_loss": -19.13456153869629, "global_step": 83495, "epoch": 690} {"train_loss": -6.592774868011475, "global_step": 83496, "epoch": 690} {"train_loss": -16.393728256225586, "global_step": 83497, "epoch": 690} {"train_loss": -33.95417404174805, "global_step": 83498, "epoch": 690} {"train_loss": -23.604524612426758, "global_step": 83499, "epoch": 690} {"train_loss": -34.60825729370117, "global_step": 83500, "epoch": 690} {"train_loss": -28.724781036376953, "global_step": 83501, "epoch": 690} {"train_loss": -32.050411224365234, "global_step": 83502, "epoch": 690} {"train_loss": -33.698490142822266, "global_step": 83503, "epoch": 690} {"train_loss": -28.262739181518555, "global_step": 83504, "epoch": 690} {"train_loss": -35.5217399597168, "global_step": 83505, "epoch": 690} {"train_loss": -33.620811462402344, "global_step": 83506, "epoch": 690} {"train_loss": -32.090179443359375, "global_step": 83507, "epoch": 690} {"train_loss": -35.11509323120117, "global_step": 83508, "epoch": 690} {"train_loss": -34.89521026611328, "global_step": 83509, "epoch": 690} {"train_loss": -33.37921142578125, "global_step": 83510, "epoch": 690} {"train_loss": -35.15919876098633, "global_step": 83511, "epoch": 690} {"train_loss": -35.29050827026367, "global_step": 83512, "epoch": 690} {"train_loss": -35.404205322265625, "global_step": 83513, "epoch": 690} {"train_loss": -35.372676849365234, "global_step": 83514, "epoch": 690} {"train_loss": -35.106746673583984, "global_step": 83515, "epoch": 690} {"train_loss": -35.735206604003906, "global_step": 83516, "epoch": 690} {"train_loss": -35.55905532836914, "global_step": 83517, "epoch": 690} {"train_loss": -35.98161697387695, "global_step": 83518, "epoch": 690} {"train_loss": -35.905216217041016, "global_step": 83519, "epoch": 690} {"train_loss": -36.25826644897461, "global_step": 83520, "epoch": 690} {"train_loss": -34.74766159057617, "global_step": 83521, "epoch": 690} {"train_loss": -35.90763473510742, "global_step": 83522, "epoch": 690} {"train_loss": -36.06540298461914, "global_step": 83523, "epoch": 690} {"train_loss": -36.09748458862305, "global_step": 83524, "epoch": 690} {"train_loss": -34.50181198120117, "global_step": 83525, "epoch": 690} {"train_loss": -36.09878158569336, "global_step": 83526, "epoch": 690} {"train_loss": -36.305294036865234, "global_step": 83527, "epoch": 690} {"train_loss": -35.92529296875, "global_step": 83528, "epoch": 690} {"train_loss": -36.10868453979492, "global_step": 83529, "epoch": 690} {"train_loss": -36.13035202026367, "global_step": 83530, "epoch": 690} {"train_loss": -36.50914001464844, "global_step": 83531, "epoch": 690} {"train_loss": -36.53847885131836, "global_step": 83532, "epoch": 690} {"train_loss": -36.11286544799805, "global_step": 83533, "epoch": 690} {"train_loss": -35.80448532104492, "global_step": 83534, "epoch": 690} {"train_loss": -36.75123977661133, "global_step": 83535, "epoch": 690} {"train_loss": -37.100067138671875, "global_step": 83536, "epoch": 690} {"train_loss": -36.59458541870117, "global_step": 83537, "epoch": 690} {"train_loss": -36.76652526855469, "global_step": 83538, "epoch": 690} {"train_loss": -36.6720085144043, "global_step": 83539, "epoch": 690} {"train_loss": -36.93538284301758, "global_step": 83540, "epoch": 690} {"train_loss": -37.34342575073242, "global_step": 83541, "epoch": 690} {"train_loss": -36.99685287475586, "global_step": 83542, "epoch": 690} {"train_loss": -36.96514892578125, "global_step": 83543, "epoch": 690} {"train_loss": -36.96592330932617, "global_step": 83544, "epoch": 690} {"train_loss": -37.514522552490234, "global_step": 83545, "epoch": 690} {"train_loss": -36.59633255004883, "global_step": 83546, "epoch": 690} {"train_loss": -37.329689025878906, "global_step": 83547, "epoch": 690} {"train_loss": -37.181461334228516, "global_step": 83548, "epoch": 690} {"train_loss": -37.49782943725586, "global_step": 83549, "epoch": 690} {"train_loss": -36.81303405761719, "global_step": 83550, "epoch": 690} {"train_loss": -37.16389083862305, "global_step": 83551, "epoch": 690} {"train_loss": -36.6994743347168, "global_step": 83552, "epoch": 690} {"train_loss": -35.71660614013672, "global_step": 83553, "epoch": 690} {"train_loss": -34.782203674316406, "global_step": 83554, "epoch": 690} {"train_loss": -33.3719596862793, "global_step": 83555, "epoch": 690} {"train_loss": -31.16006851196289, "global_step": 83556, "epoch": 690} {"train_loss": -29.6057186126709, "global_step": 83557, "epoch": 690} {"train_loss": -31.276264190673828, "global_step": 83558, "epoch": 690} {"train_loss": -35.17298126220703, "global_step": 83559, "epoch": 690} {"train_loss": -35.88822555541992, "global_step": 83560, "epoch": 690} {"train_loss": -35.87117385864258, "global_step": 83561, "epoch": 690} {"train_loss": -36.494686126708984, "global_step": 83562, "epoch": 690} {"train_loss": -36.62443161010742, "global_step": 83563, "epoch": 690} {"train_loss": -36.18417739868164, "global_step": 83564, "epoch": 690} {"train_loss": -37.20670700073242, "global_step": 83565, "epoch": 690} {"train_loss": -36.59784698486328, "global_step": 83566, "epoch": 690} {"train_loss": -36.215084075927734, "global_step": 83567, "epoch": 690} {"train_loss": -36.303340911865234, "global_step": 83568, "epoch": 690} {"train_loss": -37.199462890625, "global_step": 83569, "epoch": 690} {"train_loss": -36.72639465332031, "global_step": 83570, "epoch": 690} {"train_loss": -36.77740478515625, "global_step": 83571, "epoch": 690} {"train_loss": -36.59268569946289, "global_step": 83572, "epoch": 690} {"train_loss": -35.94920349121094, "global_step": 83573, "epoch": 690} {"train_loss": -35.05005645751953, "global_step": 83574, "epoch": 690} {"train_loss": -37.56562423706055, "global_step": 83575, "epoch": 690} {"train_loss": -34.961585998535156, "global_step": 83576, "epoch": 690} {"train_loss": -35.168067932128906, "global_step": 83577, "epoch": 690} {"train_loss": -36.1009635925293, "global_step": 83578, "epoch": 690} {"train_loss": -36.89358139038086, "global_step": 83579, "epoch": 690} {"train_loss": -36.283931732177734, "global_step": 83580, "epoch": 690} {"train_loss": -37.159645080566406, "global_step": 83581, "epoch": 690} {"train_loss": -36.8988151550293, "global_step": 83582, "epoch": 690} {"train_loss": -35.08992385864258, "global_step": 83583, "epoch": 690} {"train_loss": -37.775447845458984, "global_step": 83584, "epoch": 690} {"train_loss": -36.293212890625, "global_step": 83585, "epoch": 690} {"train_loss": -37.53157043457031, "global_step": 83586, "epoch": 690} {"train_loss": -37.410377502441406, "global_step": 83587, "epoch": 690} {"train_loss": -37.48014450073242, "global_step": 83588, "epoch": 690} {"train_loss": -37.35042953491211, "global_step": 83589, "epoch": 690} {"train_loss": -37.059547424316406, "global_step": 83590, "epoch": 690} {"train_loss": -37.53823471069336, "global_step": 83591, "epoch": 690} {"train_loss": -37.10503005981445, "global_step": 83592, "epoch": 690} {"train_loss": -36.91754150390625, "global_step": 83593, "epoch": 690} {"train_loss": -36.925872802734375, "global_step": 83594, "epoch": 690} {"train_loss": -36.91929244995117, "global_step": 83595, "epoch": 690} {"train_loss": -37.01057052612305, "global_step": 83596, "epoch": 690} {"train_loss": -37.5738525390625, "global_step": 83597, "epoch": 690} {"train_loss": -37.571998596191406, "global_step": 83598, "epoch": 690} {"train_loss": -36.68985366821289, "global_step": 83599, "epoch": 690} {"train_loss": -37.5545768737793, "global_step": 83600, "epoch": 690} {"train_loss": -36.702056884765625, "global_step": 83601, "epoch": 690} {"train_loss": -37.08903884887695, "global_step": 83602, "epoch": 690} {"train_loss": -37.95821762084961, "global_step": 83603, "epoch": 690} {"train_loss": -37.36660385131836, "global_step": 83604, "epoch": 690} {"train_loss": -37.11332321166992, "global_step": 83605, "epoch": 690} {"train_loss": -37.27167510986328, "global_step": 83606, "epoch": 690} {"train_loss": -37.24693298339844, "global_step": 83607, "epoch": 690} {"train_loss": -35.80265808105469, "global_step": 83608, "epoch": 690} {"train_loss": -35.236202239990234, "global_step": 83609, "epoch": 690} {"train_loss": -35.211021781952915, "global_step": 83610, "epoch": 690, "val_loss": 2594035.0} {"train_loss": -36.16458511352539, "global_step": 83611, "epoch": 691} {"train_loss": -34.33935546875, "global_step": 83612, "epoch": 691} {"train_loss": -35.72356414794922, "global_step": 83613, "epoch": 691} {"train_loss": -37.25980758666992, "global_step": 83614, "epoch": 691} {"train_loss": -35.17351150512695, "global_step": 83615, "epoch": 691} {"train_loss": -35.94609451293945, "global_step": 83616, "epoch": 691} {"train_loss": -36.0373420715332, "global_step": 83617, "epoch": 691} {"train_loss": -36.057376861572266, "global_step": 83618, "epoch": 691} {"train_loss": -37.506134033203125, "global_step": 83619, "epoch": 691} {"train_loss": -35.43855667114258, "global_step": 83620, "epoch": 691} {"train_loss": -36.649105072021484, "global_step": 83621, "epoch": 691} {"train_loss": -35.27010726928711, "global_step": 83622, "epoch": 691} {"train_loss": -36.616024017333984, "global_step": 83623, "epoch": 691} {"train_loss": -36.25002670288086, "global_step": 83624, "epoch": 691} {"train_loss": -35.86714172363281, "global_step": 83625, "epoch": 691} {"train_loss": -34.74357604980469, "global_step": 83626, "epoch": 691} {"train_loss": -36.41242218017578, "global_step": 83627, "epoch": 691} {"train_loss": -35.54293441772461, "global_step": 83628, "epoch": 691} {"train_loss": -37.013362884521484, "global_step": 83629, "epoch": 691} {"train_loss": -34.9001579284668, "global_step": 83630, "epoch": 691} {"train_loss": -36.60190963745117, "global_step": 83631, "epoch": 691} {"train_loss": -36.07898712158203, "global_step": 83632, "epoch": 691} {"train_loss": -37.36045455932617, "global_step": 83633, "epoch": 691} {"train_loss": -35.87154006958008, "global_step": 83634, "epoch": 691} {"train_loss": -36.74348831176758, "global_step": 83635, "epoch": 691} {"train_loss": -36.433860778808594, "global_step": 83636, "epoch": 691} {"train_loss": -36.66420364379883, "global_step": 83637, "epoch": 691} {"train_loss": -36.651222229003906, "global_step": 83638, "epoch": 691} {"train_loss": -37.088836669921875, "global_step": 83639, "epoch": 691} {"train_loss": -36.8187370300293, "global_step": 83640, "epoch": 691} {"train_loss": -36.85884475708008, "global_step": 83641, "epoch": 691} {"train_loss": -36.143123626708984, "global_step": 83642, "epoch": 691} {"train_loss": -35.61385726928711, "global_step": 83643, "epoch": 691} {"train_loss": -35.86626052856445, "global_step": 83644, "epoch": 691} {"train_loss": -35.10645294189453, "global_step": 83645, "epoch": 691} {"train_loss": -36.52861785888672, "global_step": 83646, "epoch": 691} {"train_loss": -35.436702728271484, "global_step": 83647, "epoch": 691} {"train_loss": -36.181209564208984, "global_step": 83648, "epoch": 691} {"train_loss": -36.502193450927734, "global_step": 83649, "epoch": 691} {"train_loss": -36.67019271850586, "global_step": 83650, "epoch": 691} {"train_loss": -36.297664642333984, "global_step": 83651, "epoch": 691} {"train_loss": -36.23582077026367, "global_step": 83652, "epoch": 691} {"train_loss": -36.07808303833008, "global_step": 83653, "epoch": 691} {"train_loss": -36.73882293701172, "global_step": 83654, "epoch": 691} {"train_loss": -35.83723068237305, "global_step": 83655, "epoch": 691} {"train_loss": -36.37560272216797, "global_step": 83656, "epoch": 691} {"train_loss": -36.54069137573242, "global_step": 83657, "epoch": 691} {"train_loss": -36.725929260253906, "global_step": 83658, "epoch": 691} {"train_loss": -36.3950080871582, "global_step": 83659, "epoch": 691} {"train_loss": -35.659236907958984, "global_step": 83660, "epoch": 691} {"train_loss": -35.191226959228516, "global_step": 83661, "epoch": 691} {"train_loss": -34.37014389038086, "global_step": 83662, "epoch": 691} {"train_loss": -33.43268585205078, "global_step": 83663, "epoch": 691} {"train_loss": -34.79694747924805, "global_step": 83664, "epoch": 691} {"train_loss": -33.8580436706543, "global_step": 83665, "epoch": 691} {"train_loss": -35.18684005737305, "global_step": 83666, "epoch": 691} {"train_loss": -35.9056510925293, "global_step": 83667, "epoch": 691} {"train_loss": -34.0961799621582, "global_step": 83668, "epoch": 691} {"train_loss": -36.17280197143555, "global_step": 83669, "epoch": 691} {"train_loss": -35.56789016723633, "global_step": 83670, "epoch": 691} {"train_loss": -35.76375961303711, "global_step": 83671, "epoch": 691} {"train_loss": -35.64605712890625, "global_step": 83672, "epoch": 691} {"train_loss": -35.40313720703125, "global_step": 83673, "epoch": 691} {"train_loss": -35.623252868652344, "global_step": 83674, "epoch": 691} {"train_loss": -35.6524543762207, "global_step": 83675, "epoch": 691} {"train_loss": -36.41266632080078, "global_step": 83676, "epoch": 691} {"train_loss": -35.291988372802734, "global_step": 83677, "epoch": 691} {"train_loss": -35.65193557739258, "global_step": 83678, "epoch": 691} {"train_loss": -36.98195266723633, "global_step": 83679, "epoch": 691} {"train_loss": -36.36824417114258, "global_step": 83680, "epoch": 691} {"train_loss": -36.6778678894043, "global_step": 83681, "epoch": 691} {"train_loss": -36.72615051269531, "global_step": 83682, "epoch": 691} {"train_loss": -36.85813522338867, "global_step": 83683, "epoch": 691} {"train_loss": -36.82851791381836, "global_step": 83684, "epoch": 691} {"train_loss": -36.659908294677734, "global_step": 83685, "epoch": 691} {"train_loss": -36.00275802612305, "global_step": 83686, "epoch": 691} {"train_loss": -35.48603057861328, "global_step": 83687, "epoch": 691} {"train_loss": -36.537086486816406, "global_step": 83688, "epoch": 691} {"train_loss": -36.59452438354492, "global_step": 83689, "epoch": 691} {"train_loss": -35.35908126831055, "global_step": 83690, "epoch": 691} {"train_loss": -34.5282096862793, "global_step": 83691, "epoch": 691} {"train_loss": -35.50828170776367, "global_step": 83692, "epoch": 691} {"train_loss": -36.771751403808594, "global_step": 83693, "epoch": 691} {"train_loss": -34.36249923706055, "global_step": 83694, "epoch": 691} {"train_loss": -34.63630294799805, "global_step": 83695, "epoch": 691} {"train_loss": -36.772178649902344, "global_step": 83696, "epoch": 691} {"train_loss": -35.171974182128906, "global_step": 83697, "epoch": 691} {"train_loss": -36.933162689208984, "global_step": 83698, "epoch": 691} {"train_loss": -35.95417404174805, "global_step": 83699, "epoch": 691} {"train_loss": -35.251068115234375, "global_step": 83700, "epoch": 691} {"train_loss": -36.81989669799805, "global_step": 83701, "epoch": 691} {"train_loss": -36.16944122314453, "global_step": 83702, "epoch": 691} {"train_loss": -36.57568359375, "global_step": 83703, "epoch": 691} {"train_loss": -36.672271728515625, "global_step": 83704, "epoch": 691} {"train_loss": -36.746402740478516, "global_step": 83705, "epoch": 691} {"train_loss": -36.53559494018555, "global_step": 83706, "epoch": 691} {"train_loss": -37.05315017700195, "global_step": 83707, "epoch": 691} {"train_loss": -35.77071762084961, "global_step": 83708, "epoch": 691} {"train_loss": -36.150665283203125, "global_step": 83709, "epoch": 691} {"train_loss": -35.232540130615234, "global_step": 83710, "epoch": 691} {"train_loss": -32.433349609375, "global_step": 83711, "epoch": 691} {"train_loss": -30.67865562438965, "global_step": 83712, "epoch": 691} {"train_loss": -31.101980209350586, "global_step": 83713, "epoch": 691} {"train_loss": -34.641910552978516, "global_step": 83714, "epoch": 691} {"train_loss": -36.828460693359375, "global_step": 83715, "epoch": 691} {"train_loss": -34.61282730102539, "global_step": 83716, "epoch": 691} {"train_loss": -36.160587310791016, "global_step": 83717, "epoch": 691} {"train_loss": -35.974037170410156, "global_step": 83718, "epoch": 691} {"train_loss": -35.61407470703125, "global_step": 83719, "epoch": 691} {"train_loss": -37.24858093261719, "global_step": 83720, "epoch": 691} {"train_loss": -34.19014358520508, "global_step": 83721, "epoch": 691} {"train_loss": -37.27337646484375, "global_step": 83722, "epoch": 691} {"train_loss": -36.68862533569336, "global_step": 83723, "epoch": 691} {"train_loss": -36.94204330444336, "global_step": 83724, "epoch": 691} {"train_loss": -36.8582878112793, "global_step": 83725, "epoch": 691} {"train_loss": -36.68098068237305, "global_step": 83726, "epoch": 691} {"train_loss": -36.997100830078125, "global_step": 83727, "epoch": 691} {"train_loss": -36.33281326293945, "global_step": 83728, "epoch": 691} {"train_loss": -36.413238525390625, "global_step": 83729, "epoch": 691} {"train_loss": -36.92978286743164, "global_step": 83730, "epoch": 691} {"train_loss": -35.92443463033881, "global_step": 83731, "epoch": 691, "val_loss": 2616344.75} {"train_loss": -37.53782272338867, "global_step": 83732, "epoch": 692} {"train_loss": -37.0172233581543, "global_step": 83733, "epoch": 692} {"train_loss": -37.226863861083984, "global_step": 83734, "epoch": 692} {"train_loss": -37.52833557128906, "global_step": 83735, "epoch": 692} {"train_loss": -37.64348220825195, "global_step": 83736, "epoch": 692} {"train_loss": -37.42877197265625, "global_step": 83737, "epoch": 692} {"train_loss": -37.77645492553711, "global_step": 83738, "epoch": 692} {"train_loss": -37.277767181396484, "global_step": 83739, "epoch": 692} {"train_loss": -37.96234893798828, "global_step": 83740, "epoch": 692} {"train_loss": -37.94990158081055, "global_step": 83741, "epoch": 692} {"train_loss": -37.509822845458984, "global_step": 83742, "epoch": 692} {"train_loss": -37.393226623535156, "global_step": 83743, "epoch": 692} {"train_loss": -37.81885528564453, "global_step": 83744, "epoch": 692} {"train_loss": -37.62945556640625, "global_step": 83745, "epoch": 692} {"train_loss": -37.60478973388672, "global_step": 83746, "epoch": 692} {"train_loss": -37.846229553222656, "global_step": 83747, "epoch": 692} {"train_loss": -37.560516357421875, "global_step": 83748, "epoch": 692} {"train_loss": -38.24535369873047, "global_step": 83749, "epoch": 692} {"train_loss": -38.1051025390625, "global_step": 83750, "epoch": 692} {"train_loss": -37.40937423706055, "global_step": 83751, "epoch": 692} {"train_loss": -37.80549240112305, "global_step": 83752, "epoch": 692} {"train_loss": -38.061031341552734, "global_step": 83753, "epoch": 692} {"train_loss": -38.1956901550293, "global_step": 83754, "epoch": 692} {"train_loss": -38.3453483581543, "global_step": 83755, "epoch": 692} {"train_loss": -38.14430618286133, "global_step": 83756, "epoch": 692} {"train_loss": -37.98084259033203, "global_step": 83757, "epoch": 692} {"train_loss": -38.12091827392578, "global_step": 83758, "epoch": 692} {"train_loss": -38.622554779052734, "global_step": 83759, "epoch": 692} {"train_loss": -38.116451263427734, "global_step": 83760, "epoch": 692} {"train_loss": -37.70084762573242, "global_step": 83761, "epoch": 692} {"train_loss": -38.32242965698242, "global_step": 83762, "epoch": 692} {"train_loss": -38.36793899536133, "global_step": 83763, "epoch": 692} {"train_loss": -38.50251388549805, "global_step": 83764, "epoch": 692} {"train_loss": -38.116546630859375, "global_step": 83765, "epoch": 692} {"train_loss": -38.27540969848633, "global_step": 83766, "epoch": 692} {"train_loss": -38.36043167114258, "global_step": 83767, "epoch": 692} {"train_loss": -38.14094924926758, "global_step": 83768, "epoch": 692} {"train_loss": -37.682613372802734, "global_step": 83769, "epoch": 692} {"train_loss": -37.200225830078125, "global_step": 83770, "epoch": 692} {"train_loss": -35.63370132446289, "global_step": 83771, "epoch": 692} {"train_loss": -35.304805755615234, "global_step": 83772, "epoch": 692} {"train_loss": -34.810279846191406, "global_step": 83773, "epoch": 692} {"train_loss": -35.2843132019043, "global_step": 83774, "epoch": 692} {"train_loss": -36.25019454956055, "global_step": 83775, "epoch": 692} {"train_loss": -35.09400177001953, "global_step": 83776, "epoch": 692} {"train_loss": -37.09763717651367, "global_step": 83777, "epoch": 692} {"train_loss": -36.0388069152832, "global_step": 83778, "epoch": 692} {"train_loss": -35.56816864013672, "global_step": 83779, "epoch": 692} {"train_loss": -36.305755615234375, "global_step": 83780, "epoch": 692} {"train_loss": -37.58553695678711, "global_step": 83781, "epoch": 692} {"train_loss": -36.62530517578125, "global_step": 83782, "epoch": 692} {"train_loss": -36.9715576171875, "global_step": 83783, "epoch": 692} {"train_loss": -37.67469024658203, "global_step": 83784, "epoch": 692} {"train_loss": -37.10707473754883, "global_step": 83785, "epoch": 692} {"train_loss": -37.88629913330078, "global_step": 83786, "epoch": 692} {"train_loss": -37.35456466674805, "global_step": 83787, "epoch": 692} {"train_loss": -37.91363525390625, "global_step": 83788, "epoch": 692} {"train_loss": -37.70329666137695, "global_step": 83789, "epoch": 692} {"train_loss": -38.29911804199219, "global_step": 83790, "epoch": 692} {"train_loss": -37.07514190673828, "global_step": 83791, "epoch": 692} {"train_loss": -37.683834075927734, "global_step": 83792, "epoch": 692} {"train_loss": -37.699520111083984, "global_step": 83793, "epoch": 692} {"train_loss": -38.101497650146484, "global_step": 83794, "epoch": 692} {"train_loss": -37.84434127807617, "global_step": 83795, "epoch": 692} {"train_loss": -36.85067367553711, "global_step": 83796, "epoch": 692} {"train_loss": -37.6466064453125, "global_step": 83797, "epoch": 692} {"train_loss": -38.139434814453125, "global_step": 83798, "epoch": 692} {"train_loss": -38.08427047729492, "global_step": 83799, "epoch": 692} {"train_loss": -36.190467834472656, "global_step": 83800, "epoch": 692} {"train_loss": -38.006591796875, "global_step": 83801, "epoch": 692} {"train_loss": -36.69675827026367, "global_step": 83802, "epoch": 692} {"train_loss": -37.724143981933594, "global_step": 83803, "epoch": 692} {"train_loss": -37.829071044921875, "global_step": 83804, "epoch": 692} {"train_loss": -36.91670608520508, "global_step": 83805, "epoch": 692} {"train_loss": -37.14327621459961, "global_step": 83806, "epoch": 692} {"train_loss": -37.524837493896484, "global_step": 83807, "epoch": 692} {"train_loss": -37.71879196166992, "global_step": 83808, "epoch": 692} {"train_loss": -37.552425384521484, "global_step": 83809, "epoch": 692} {"train_loss": -37.5898551940918, "global_step": 83810, "epoch": 692} {"train_loss": -36.77199172973633, "global_step": 83811, "epoch": 692} {"train_loss": -37.07386016845703, "global_step": 83812, "epoch": 692} {"train_loss": -37.60332107543945, "global_step": 83813, "epoch": 692} {"train_loss": -37.704830169677734, "global_step": 83814, "epoch": 692} {"train_loss": -32.82184982299805, "global_step": 83815, "epoch": 692} {"train_loss": -31.385522842407227, "global_step": 83816, "epoch": 692} {"train_loss": -37.7222785949707, "global_step": 83817, "epoch": 692} {"train_loss": -37.33921432495117, "global_step": 83818, "epoch": 692} {"train_loss": -37.77581787109375, "global_step": 83819, "epoch": 692} {"train_loss": -37.65233612060547, "global_step": 83820, "epoch": 692} {"train_loss": -37.894588470458984, "global_step": 83821, "epoch": 692} {"train_loss": -37.15470504760742, "global_step": 83822, "epoch": 692} {"train_loss": -37.78892135620117, "global_step": 83823, "epoch": 692} {"train_loss": -37.69818878173828, "global_step": 83824, "epoch": 692} {"train_loss": -37.882686614990234, "global_step": 83825, "epoch": 692} {"train_loss": -37.39228820800781, "global_step": 83826, "epoch": 692} {"train_loss": -36.656219482421875, "global_step": 83827, "epoch": 692} {"train_loss": -35.99856185913086, "global_step": 83828, "epoch": 692} {"train_loss": -37.0849723815918, "global_step": 83829, "epoch": 692} {"train_loss": -35.445762634277344, "global_step": 83830, "epoch": 692} {"train_loss": -37.4228630065918, "global_step": 83831, "epoch": 692} {"train_loss": -37.33327865600586, "global_step": 83832, "epoch": 692} {"train_loss": -37.67169189453125, "global_step": 83833, "epoch": 692} {"train_loss": -36.44351577758789, "global_step": 83834, "epoch": 692} {"train_loss": -37.396018981933594, "global_step": 83835, "epoch": 692} {"train_loss": -35.42124557495117, "global_step": 83836, "epoch": 692} {"train_loss": -36.81730270385742, "global_step": 83837, "epoch": 692} {"train_loss": -35.97793197631836, "global_step": 83838, "epoch": 692} {"train_loss": -35.830596923828125, "global_step": 83839, "epoch": 692} {"train_loss": -34.623619079589844, "global_step": 83840, "epoch": 692} {"train_loss": -32.142269134521484, "global_step": 83841, "epoch": 692} {"train_loss": -33.34284210205078, "global_step": 83842, "epoch": 692} {"train_loss": -36.04139709472656, "global_step": 83843, "epoch": 692} {"train_loss": -37.30092239379883, "global_step": 83844, "epoch": 692} {"train_loss": -36.828365325927734, "global_step": 83845, "epoch": 692} {"train_loss": -37.12470245361328, "global_step": 83846, "epoch": 692} {"train_loss": -37.71921920776367, "global_step": 83847, "epoch": 692} {"train_loss": -36.58216857910156, "global_step": 83848, "epoch": 692} {"train_loss": -37.219783782958984, "global_step": 83849, "epoch": 692} {"train_loss": -36.7341194152832, "global_step": 83850, "epoch": 692} {"train_loss": -36.78495407104492, "global_step": 83851, "epoch": 692} {"train_loss": -37.140253729071496, "global_step": 83852, "epoch": 692, "val_loss": 2592062.25} {"train_loss": -37.668479919433594, "global_step": 83853, "epoch": 693} {"train_loss": -37.174007415771484, "global_step": 83854, "epoch": 693} {"train_loss": -38.1887321472168, "global_step": 83855, "epoch": 693} {"train_loss": -37.1566047668457, "global_step": 83856, "epoch": 693} {"train_loss": -37.67068862915039, "global_step": 83857, "epoch": 693} {"train_loss": -38.28562927246094, "global_step": 83858, "epoch": 693} {"train_loss": -37.3661003112793, "global_step": 83859, "epoch": 693} {"train_loss": -37.45112991333008, "global_step": 83860, "epoch": 693} {"train_loss": -36.17387771606445, "global_step": 83861, "epoch": 693} {"train_loss": -36.712196350097656, "global_step": 83862, "epoch": 693} {"train_loss": -37.821224212646484, "global_step": 83863, "epoch": 693} {"train_loss": -37.57969284057617, "global_step": 83864, "epoch": 693} {"train_loss": -37.996612548828125, "global_step": 83865, "epoch": 693} {"train_loss": -38.41652297973633, "global_step": 83866, "epoch": 693} {"train_loss": -37.817935943603516, "global_step": 83867, "epoch": 693} {"train_loss": -38.0620231628418, "global_step": 83868, "epoch": 693} {"train_loss": -37.12830352783203, "global_step": 83869, "epoch": 693} {"train_loss": -37.43185806274414, "global_step": 83870, "epoch": 693} {"train_loss": -38.3155517578125, "global_step": 83871, "epoch": 693} {"train_loss": -37.67499923706055, "global_step": 83872, "epoch": 693} {"train_loss": -38.256919860839844, "global_step": 83873, "epoch": 693} {"train_loss": -38.12020492553711, "global_step": 83874, "epoch": 693} {"train_loss": -38.13689422607422, "global_step": 83875, "epoch": 693} {"train_loss": -37.31069564819336, "global_step": 83876, "epoch": 693} {"train_loss": -37.98606491088867, "global_step": 83877, "epoch": 693} {"train_loss": -37.69758987426758, "global_step": 83878, "epoch": 693} {"train_loss": -37.1903190612793, "global_step": 83879, "epoch": 693} {"train_loss": -37.19269943237305, "global_step": 83880, "epoch": 693} {"train_loss": -37.49790954589844, "global_step": 83881, "epoch": 693} {"train_loss": -37.01381301879883, "global_step": 83882, "epoch": 693} {"train_loss": -36.95180892944336, "global_step": 83883, "epoch": 693} {"train_loss": -36.1170654296875, "global_step": 83884, "epoch": 693} {"train_loss": -35.57516098022461, "global_step": 83885, "epoch": 693} {"train_loss": -37.7097282409668, "global_step": 83886, "epoch": 693} {"train_loss": -36.03556442260742, "global_step": 83887, "epoch": 693} {"train_loss": -36.78059768676758, "global_step": 83888, "epoch": 693} {"train_loss": -36.08590316772461, "global_step": 83889, "epoch": 693} {"train_loss": -35.39063262939453, "global_step": 83890, "epoch": 693} {"train_loss": -36.412776947021484, "global_step": 83891, "epoch": 693} {"train_loss": -36.7762336730957, "global_step": 83892, "epoch": 693} {"train_loss": -36.74710464477539, "global_step": 83893, "epoch": 693} {"train_loss": -37.73186111450195, "global_step": 83894, "epoch": 693} {"train_loss": -37.62514877319336, "global_step": 83895, "epoch": 693} {"train_loss": -37.308746337890625, "global_step": 83896, "epoch": 693} {"train_loss": -37.43734359741211, "global_step": 83897, "epoch": 693} {"train_loss": -37.566986083984375, "global_step": 83898, "epoch": 693} {"train_loss": -36.12191390991211, "global_step": 83899, "epoch": 693} {"train_loss": -36.82954406738281, "global_step": 83900, "epoch": 693} {"train_loss": -37.385189056396484, "global_step": 83901, "epoch": 693} {"train_loss": -37.382667541503906, "global_step": 83902, "epoch": 693} {"train_loss": -37.7662467956543, "global_step": 83903, "epoch": 693} {"train_loss": -37.70878219604492, "global_step": 83904, "epoch": 693} {"train_loss": -37.1561164855957, "global_step": 83905, "epoch": 693} {"train_loss": -37.95125961303711, "global_step": 83906, "epoch": 693} {"train_loss": -36.6457405090332, "global_step": 83907, "epoch": 693} {"train_loss": -36.87811279296875, "global_step": 83908, "epoch": 693} {"train_loss": -36.52092361450195, "global_step": 83909, "epoch": 693} {"train_loss": -35.13827133178711, "global_step": 83910, "epoch": 693} {"train_loss": -35.80270004272461, "global_step": 83911, "epoch": 693} {"train_loss": -33.53724670410156, "global_step": 83912, "epoch": 693} {"train_loss": -36.5167236328125, "global_step": 83913, "epoch": 693} {"train_loss": -35.750267028808594, "global_step": 83914, "epoch": 693} {"train_loss": -37.03010940551758, "global_step": 83915, "epoch": 693} {"train_loss": -34.38232421875, "global_step": 83916, "epoch": 693} {"train_loss": -31.189208984375, "global_step": 83917, "epoch": 693} {"train_loss": -29.95464515686035, "global_step": 83918, "epoch": 693} {"train_loss": -32.54887771606445, "global_step": 83919, "epoch": 693} {"train_loss": -36.14033889770508, "global_step": 83920, "epoch": 693} {"train_loss": -33.279109954833984, "global_step": 83921, "epoch": 693} {"train_loss": -33.16278839111328, "global_step": 83922, "epoch": 693} {"train_loss": -36.58696365356445, "global_step": 83923, "epoch": 693} {"train_loss": -32.04707336425781, "global_step": 83924, "epoch": 693} {"train_loss": -35.719329833984375, "global_step": 83925, "epoch": 693} {"train_loss": -35.50302505493164, "global_step": 83926, "epoch": 693} {"train_loss": -35.650909423828125, "global_step": 83927, "epoch": 693} {"train_loss": -36.130496978759766, "global_step": 83928, "epoch": 693} {"train_loss": -37.13256072998047, "global_step": 83929, "epoch": 693} {"train_loss": -36.551658630371094, "global_step": 83930, "epoch": 693} {"train_loss": -36.34577560424805, "global_step": 83931, "epoch": 693} {"train_loss": -36.5111083984375, "global_step": 83932, "epoch": 693} {"train_loss": -36.829891204833984, "global_step": 83933, "epoch": 693} {"train_loss": -36.825164794921875, "global_step": 83934, "epoch": 693} {"train_loss": -37.09487533569336, "global_step": 83935, "epoch": 693} {"train_loss": -37.341590881347656, "global_step": 83936, "epoch": 693} {"train_loss": -36.243072509765625, "global_step": 83937, "epoch": 693} {"train_loss": -36.18155288696289, "global_step": 83938, "epoch": 693} {"train_loss": -37.170772552490234, "global_step": 83939, "epoch": 693} {"train_loss": -37.49856185913086, "global_step": 83940, "epoch": 693} {"train_loss": -37.30720520019531, "global_step": 83941, "epoch": 693} {"train_loss": -36.70261001586914, "global_step": 83942, "epoch": 693} {"train_loss": -37.544002532958984, "global_step": 83943, "epoch": 693} {"train_loss": -37.68405532836914, "global_step": 83944, "epoch": 693} {"train_loss": -36.84698486328125, "global_step": 83945, "epoch": 693} {"train_loss": -37.09030532836914, "global_step": 83946, "epoch": 693} {"train_loss": -37.98450469970703, "global_step": 83947, "epoch": 693} {"train_loss": -37.59144973754883, "global_step": 83948, "epoch": 693} {"train_loss": -37.354393005371094, "global_step": 83949, "epoch": 693} {"train_loss": -37.34954833984375, "global_step": 83950, "epoch": 693} {"train_loss": -37.14870071411133, "global_step": 83951, "epoch": 693} {"train_loss": -37.585418701171875, "global_step": 83952, "epoch": 693} {"train_loss": -38.08041763305664, "global_step": 83953, "epoch": 693} {"train_loss": -37.71533966064453, "global_step": 83954, "epoch": 693} {"train_loss": -36.8835334777832, "global_step": 83955, "epoch": 693} {"train_loss": -36.365108489990234, "global_step": 83956, "epoch": 693} {"train_loss": -36.83285140991211, "global_step": 83957, "epoch": 693} {"train_loss": -36.897865295410156, "global_step": 83958, "epoch": 693} {"train_loss": -37.316097259521484, "global_step": 83959, "epoch": 693} {"train_loss": -34.87477493286133, "global_step": 83960, "epoch": 693} {"train_loss": -27.42596435546875, "global_step": 83961, "epoch": 693} {"train_loss": -24.224611282348633, "global_step": 83962, "epoch": 693} {"train_loss": -32.95162582397461, "global_step": 83963, "epoch": 693} {"train_loss": -36.64079666137695, "global_step": 83964, "epoch": 693} {"train_loss": -32.31268310546875, "global_step": 83965, "epoch": 693} {"train_loss": -30.361242294311523, "global_step": 83966, "epoch": 693} {"train_loss": -36.49161911010742, "global_step": 83967, "epoch": 693} {"train_loss": -34.42176055908203, "global_step": 83968, "epoch": 693} {"train_loss": -35.004066467285156, "global_step": 83969, "epoch": 693} {"train_loss": -36.920223236083984, "global_step": 83970, "epoch": 693} {"train_loss": -34.93247604370117, "global_step": 83971, "epoch": 693} {"train_loss": -37.17281723022461, "global_step": 83972, "epoch": 693} {"train_loss": -36.35523137179288, "global_step": 83973, "epoch": 693, "val_loss": 2791173.25} {"train_loss": -37.4965934753418, "global_step": 83974, "epoch": 694} {"train_loss": -35.2602424621582, "global_step": 83975, "epoch": 694} {"train_loss": -36.66402816772461, "global_step": 83976, "epoch": 694} {"train_loss": -35.55225372314453, "global_step": 83977, "epoch": 694} {"train_loss": -36.07761764526367, "global_step": 83978, "epoch": 694} {"train_loss": -37.132049560546875, "global_step": 83979, "epoch": 694} {"train_loss": -36.61568832397461, "global_step": 83980, "epoch": 694} {"train_loss": -36.69050979614258, "global_step": 83981, "epoch": 694} {"train_loss": -36.194698333740234, "global_step": 83982, "epoch": 694} {"train_loss": -36.843544006347656, "global_step": 83983, "epoch": 694} {"train_loss": -37.45209503173828, "global_step": 83984, "epoch": 694} {"train_loss": -36.16794967651367, "global_step": 83985, "epoch": 694} {"train_loss": -37.86410140991211, "global_step": 83986, "epoch": 694} {"train_loss": -36.16437530517578, "global_step": 83987, "epoch": 694} {"train_loss": -37.238243103027344, "global_step": 83988, "epoch": 694} {"train_loss": -37.60211944580078, "global_step": 83989, "epoch": 694} {"train_loss": -37.39019775390625, "global_step": 83990, "epoch": 694} {"train_loss": -37.2793083190918, "global_step": 83991, "epoch": 694} {"train_loss": -37.57752227783203, "global_step": 83992, "epoch": 694} {"train_loss": -37.97938919067383, "global_step": 83993, "epoch": 694} {"train_loss": -37.45314407348633, "global_step": 83994, "epoch": 694} {"train_loss": -37.6224479675293, "global_step": 83995, "epoch": 694} {"train_loss": -36.62300109863281, "global_step": 83996, "epoch": 694} {"train_loss": -37.57265853881836, "global_step": 83997, "epoch": 694} {"train_loss": -38.063167572021484, "global_step": 83998, "epoch": 694} {"train_loss": -37.79749298095703, "global_step": 83999, "epoch": 694} {"train_loss": -38.1958122253418, "global_step": 84000, "epoch": 694} {"train_loss": -37.19102096557617, "global_step": 84001, "epoch": 694} {"train_loss": -38.12521743774414, "global_step": 84002, "epoch": 694} {"train_loss": -36.5444221496582, "global_step": 84003, "epoch": 694} {"train_loss": -38.10737228393555, "global_step": 84004, "epoch": 694} {"train_loss": -37.9449462890625, "global_step": 84005, "epoch": 694} {"train_loss": -37.019039154052734, "global_step": 84006, "epoch": 694} {"train_loss": -37.59064865112305, "global_step": 84007, "epoch": 694} {"train_loss": -37.68946075439453, "global_step": 84008, "epoch": 694} {"train_loss": -37.446563720703125, "global_step": 84009, "epoch": 694} {"train_loss": -35.68281173706055, "global_step": 84010, "epoch": 694} {"train_loss": -36.763519287109375, "global_step": 84011, "epoch": 694} {"train_loss": -36.8044548034668, "global_step": 84012, "epoch": 694} {"train_loss": -36.55854034423828, "global_step": 84013, "epoch": 694} {"train_loss": -37.354347229003906, "global_step": 84014, "epoch": 694} {"train_loss": -37.688507080078125, "global_step": 84015, "epoch": 694} {"train_loss": -36.562767028808594, "global_step": 84016, "epoch": 694} {"train_loss": -36.05134201049805, "global_step": 84017, "epoch": 694} {"train_loss": -35.30107498168945, "global_step": 84018, "epoch": 694} {"train_loss": -35.558021545410156, "global_step": 84019, "epoch": 694} {"train_loss": -36.30221176147461, "global_step": 84020, "epoch": 694} {"train_loss": -37.11212158203125, "global_step": 84021, "epoch": 694} {"train_loss": -35.7574348449707, "global_step": 84022, "epoch": 694} {"train_loss": -37.68916702270508, "global_step": 84023, "epoch": 694} {"train_loss": -36.888484954833984, "global_step": 84024, "epoch": 694} {"train_loss": -36.275245666503906, "global_step": 84025, "epoch": 694} {"train_loss": -36.87686538696289, "global_step": 84026, "epoch": 694} {"train_loss": -35.922000885009766, "global_step": 84027, "epoch": 694} {"train_loss": -36.53094482421875, "global_step": 84028, "epoch": 694} {"train_loss": -37.113643646240234, "global_step": 84029, "epoch": 694} {"train_loss": -36.72732162475586, "global_step": 84030, "epoch": 694} {"train_loss": -36.74931716918945, "global_step": 84031, "epoch": 694} {"train_loss": -36.3016242980957, "global_step": 84032, "epoch": 694} {"train_loss": -36.987953186035156, "global_step": 84033, "epoch": 694} {"train_loss": -35.76862716674805, "global_step": 84034, "epoch": 694} {"train_loss": -36.445430755615234, "global_step": 84035, "epoch": 694} {"train_loss": -34.76530075073242, "global_step": 84036, "epoch": 694} {"train_loss": -34.83992385864258, "global_step": 84037, "epoch": 694} {"train_loss": -36.63013458251953, "global_step": 84038, "epoch": 694} {"train_loss": -36.03412628173828, "global_step": 84039, "epoch": 694} {"train_loss": -36.992431640625, "global_step": 84040, "epoch": 694} {"train_loss": -37.11773681640625, "global_step": 84041, "epoch": 694} {"train_loss": -37.022621154785156, "global_step": 84042, "epoch": 694} {"train_loss": -36.699745178222656, "global_step": 84043, "epoch": 694} {"train_loss": -37.20377731323242, "global_step": 84044, "epoch": 694} {"train_loss": -36.396881103515625, "global_step": 84045, "epoch": 694} {"train_loss": -34.522315979003906, "global_step": 84046, "epoch": 694} {"train_loss": -36.707950592041016, "global_step": 84047, "epoch": 694} {"train_loss": -37.312435150146484, "global_step": 84048, "epoch": 694} {"train_loss": -36.8646354675293, "global_step": 84049, "epoch": 694} {"train_loss": -36.96519088745117, "global_step": 84050, "epoch": 694} {"train_loss": -36.12213134765625, "global_step": 84051, "epoch": 694} {"train_loss": -36.810394287109375, "global_step": 84052, "epoch": 694} {"train_loss": -36.40158462524414, "global_step": 84053, "epoch": 694} {"train_loss": -36.491390228271484, "global_step": 84054, "epoch": 694} {"train_loss": -35.51887893676758, "global_step": 84055, "epoch": 694} {"train_loss": -36.509796142578125, "global_step": 84056, "epoch": 694} {"train_loss": -37.16971969604492, "global_step": 84057, "epoch": 694} {"train_loss": -36.3460807800293, "global_step": 84058, "epoch": 694} {"train_loss": -37.61953353881836, "global_step": 84059, "epoch": 694} {"train_loss": -37.19346618652344, "global_step": 84060, "epoch": 694} {"train_loss": -37.03994369506836, "global_step": 84061, "epoch": 694} {"train_loss": -36.71786880493164, "global_step": 84062, "epoch": 694} {"train_loss": -36.466651916503906, "global_step": 84063, "epoch": 694} {"train_loss": -35.58478546142578, "global_step": 84064, "epoch": 694} {"train_loss": -36.68742752075195, "global_step": 84065, "epoch": 694} {"train_loss": -36.75950241088867, "global_step": 84066, "epoch": 694} {"train_loss": -36.175567626953125, "global_step": 84067, "epoch": 694} {"train_loss": -36.96649169921875, "global_step": 84068, "epoch": 694} {"train_loss": -36.4636344909668, "global_step": 84069, "epoch": 694} {"train_loss": -35.72998809814453, "global_step": 84070, "epoch": 694} {"train_loss": -34.9269905090332, "global_step": 84071, "epoch": 694} {"train_loss": -36.90733337402344, "global_step": 84072, "epoch": 694} {"train_loss": -35.041072845458984, "global_step": 84073, "epoch": 694} {"train_loss": -36.22079086303711, "global_step": 84074, "epoch": 694} {"train_loss": -35.894744873046875, "global_step": 84075, "epoch": 694} {"train_loss": -37.15000915527344, "global_step": 84076, "epoch": 694} {"train_loss": -36.663185119628906, "global_step": 84077, "epoch": 694} {"train_loss": -36.19328689575195, "global_step": 84078, "epoch": 694} {"train_loss": -36.72517013549805, "global_step": 84079, "epoch": 694} {"train_loss": -36.80302810668945, "global_step": 84080, "epoch": 694} {"train_loss": -36.79461669921875, "global_step": 84081, "epoch": 694} {"train_loss": -37.46149826049805, "global_step": 84082, "epoch": 694} {"train_loss": -36.961055755615234, "global_step": 84083, "epoch": 694} {"train_loss": -36.97132873535156, "global_step": 84084, "epoch": 694} {"train_loss": -34.2928352355957, "global_step": 84085, "epoch": 694} {"train_loss": -36.099124908447266, "global_step": 84086, "epoch": 694} {"train_loss": -37.017547607421875, "global_step": 84087, "epoch": 694} {"train_loss": -37.415374755859375, "global_step": 84088, "epoch": 694} {"train_loss": -36.21537399291992, "global_step": 84089, "epoch": 694} {"train_loss": -37.04752731323242, "global_step": 84090, "epoch": 694} {"train_loss": -36.87222671508789, "global_step": 84091, "epoch": 694} {"train_loss": -37.021827697753906, "global_step": 84092, "epoch": 694} {"train_loss": -36.83015060424805, "global_step": 84093, "epoch": 694} {"train_loss": -36.70802846230751, "global_step": 84094, "epoch": 694, "val_loss": 2625317.75} {"train_loss": -36.696128845214844, "global_step": 84095, "epoch": 695} {"train_loss": -36.904090881347656, "global_step": 84096, "epoch": 695} {"train_loss": -37.68851852416992, "global_step": 84097, "epoch": 695} {"train_loss": -36.39265060424805, "global_step": 84098, "epoch": 695} {"train_loss": -36.94841384887695, "global_step": 84099, "epoch": 695} {"train_loss": -36.99745178222656, "global_step": 84100, "epoch": 695} {"train_loss": -36.29439163208008, "global_step": 84101, "epoch": 695} {"train_loss": -37.26552963256836, "global_step": 84102, "epoch": 695} {"train_loss": -37.41592788696289, "global_step": 84103, "epoch": 695} {"train_loss": -37.64876937866211, "global_step": 84104, "epoch": 695} {"train_loss": -36.0040168762207, "global_step": 84105, "epoch": 695} {"train_loss": -37.48796463012695, "global_step": 84106, "epoch": 695} {"train_loss": -37.809696197509766, "global_step": 84107, "epoch": 695} {"train_loss": -37.4356689453125, "global_step": 84108, "epoch": 695} {"train_loss": -37.3063850402832, "global_step": 84109, "epoch": 695} {"train_loss": -37.24126052856445, "global_step": 84110, "epoch": 695} {"train_loss": -37.28239059448242, "global_step": 84111, "epoch": 695} {"train_loss": -37.79460906982422, "global_step": 84112, "epoch": 695} {"train_loss": -37.516746520996094, "global_step": 84113, "epoch": 695} {"train_loss": -37.5783576965332, "global_step": 84114, "epoch": 695} {"train_loss": -37.39335632324219, "global_step": 84115, "epoch": 695} {"train_loss": -38.3056755065918, "global_step": 84116, "epoch": 695} {"train_loss": -37.998146057128906, "global_step": 84117, "epoch": 695} {"train_loss": -37.1422004699707, "global_step": 84118, "epoch": 695} {"train_loss": -37.781185150146484, "global_step": 84119, "epoch": 695} {"train_loss": -37.97654724121094, "global_step": 84120, "epoch": 695} {"train_loss": -37.737728118896484, "global_step": 84121, "epoch": 695} {"train_loss": -36.458492279052734, "global_step": 84122, "epoch": 695} {"train_loss": -37.37429428100586, "global_step": 84123, "epoch": 695} {"train_loss": -37.417659759521484, "global_step": 84124, "epoch": 695} {"train_loss": -37.662864685058594, "global_step": 84125, "epoch": 695} {"train_loss": -36.292842864990234, "global_step": 84126, "epoch": 695} {"train_loss": -36.79032516479492, "global_step": 84127, "epoch": 695} {"train_loss": -37.14094543457031, "global_step": 84128, "epoch": 695} {"train_loss": -37.51144027709961, "global_step": 84129, "epoch": 695} {"train_loss": -36.435665130615234, "global_step": 84130, "epoch": 695} {"train_loss": -34.147560119628906, "global_step": 84131, "epoch": 695} {"train_loss": -30.877710342407227, "global_step": 84132, "epoch": 695} {"train_loss": -17.937673568725586, "global_step": 84133, "epoch": 695} {"train_loss": -0.9497591257095337, "global_step": 84134, "epoch": 695} {"train_loss": -14.231986045837402, "global_step": 84135, "epoch": 695} {"train_loss": -34.2815055847168, "global_step": 84136, "epoch": 695} {"train_loss": -23.108234405517578, "global_step": 84137, "epoch": 695} {"train_loss": -35.67804718017578, "global_step": 84138, "epoch": 695} {"train_loss": -27.636310577392578, "global_step": 84139, "epoch": 695} {"train_loss": -34.676822662353516, "global_step": 84140, "epoch": 695} {"train_loss": -32.36725616455078, "global_step": 84141, "epoch": 695} {"train_loss": -31.898344039916992, "global_step": 84142, "epoch": 695} {"train_loss": -34.42194747924805, "global_step": 84143, "epoch": 695} {"train_loss": -31.435474395751953, "global_step": 84144, "epoch": 695} {"train_loss": -33.0317497253418, "global_step": 84145, "epoch": 695} {"train_loss": -33.9478874206543, "global_step": 84146, "epoch": 695} {"train_loss": -33.247596740722656, "global_step": 84147, "epoch": 695} {"train_loss": -32.11800003051758, "global_step": 84148, "epoch": 695} {"train_loss": -36.38452911376953, "global_step": 84149, "epoch": 695} {"train_loss": -35.10342025756836, "global_step": 84150, "epoch": 695} {"train_loss": -33.36561965942383, "global_step": 84151, "epoch": 695} {"train_loss": -34.356597900390625, "global_step": 84152, "epoch": 695} {"train_loss": -35.77102279663086, "global_step": 84153, "epoch": 695} {"train_loss": -35.0070915222168, "global_step": 84154, "epoch": 695} {"train_loss": -33.762237548828125, "global_step": 84155, "epoch": 695} {"train_loss": -35.137733459472656, "global_step": 84156, "epoch": 695} {"train_loss": -35.920310974121094, "global_step": 84157, "epoch": 695} {"train_loss": -34.4769172668457, "global_step": 84158, "epoch": 695} {"train_loss": -35.80854034423828, "global_step": 84159, "epoch": 695} {"train_loss": -34.15310287475586, "global_step": 84160, "epoch": 695} {"train_loss": -35.24434280395508, "global_step": 84161, "epoch": 695} {"train_loss": -36.021484375, "global_step": 84162, "epoch": 695} {"train_loss": -36.027130126953125, "global_step": 84163, "epoch": 695} {"train_loss": -34.63479232788086, "global_step": 84164, "epoch": 695} {"train_loss": -35.36798095703125, "global_step": 84165, "epoch": 695} {"train_loss": -36.42847442626953, "global_step": 84166, "epoch": 695} {"train_loss": -36.390525817871094, "global_step": 84167, "epoch": 695} {"train_loss": -35.8841667175293, "global_step": 84168, "epoch": 695} {"train_loss": -35.91494369506836, "global_step": 84169, "epoch": 695} {"train_loss": -36.229244232177734, "global_step": 84170, "epoch": 695} {"train_loss": -35.139686584472656, "global_step": 84171, "epoch": 695} {"train_loss": -36.65861129760742, "global_step": 84172, "epoch": 695} {"train_loss": -36.2481575012207, "global_step": 84173, "epoch": 695} {"train_loss": -35.838558197021484, "global_step": 84174, "epoch": 695} {"train_loss": -35.20198440551758, "global_step": 84175, "epoch": 695} {"train_loss": -36.63731002807617, "global_step": 84176, "epoch": 695} {"train_loss": -36.21891403198242, "global_step": 84177, "epoch": 695} {"train_loss": -36.57060623168945, "global_step": 84178, "epoch": 695} {"train_loss": -36.39112091064453, "global_step": 84179, "epoch": 695} {"train_loss": -35.54206466674805, "global_step": 84180, "epoch": 695} {"train_loss": -36.97964859008789, "global_step": 84181, "epoch": 695} {"train_loss": -36.945316314697266, "global_step": 84182, "epoch": 695} {"train_loss": -36.9429931640625, "global_step": 84183, "epoch": 695} {"train_loss": -36.40513229370117, "global_step": 84184, "epoch": 695} {"train_loss": -36.42332458496094, "global_step": 84185, "epoch": 695} {"train_loss": -37.314762115478516, "global_step": 84186, "epoch": 695} {"train_loss": -36.215972900390625, "global_step": 84187, "epoch": 695} {"train_loss": -36.88955307006836, "global_step": 84188, "epoch": 695} {"train_loss": -36.990535736083984, "global_step": 84189, "epoch": 695} {"train_loss": -36.67413330078125, "global_step": 84190, "epoch": 695} {"train_loss": -36.475791931152344, "global_step": 84191, "epoch": 695} {"train_loss": -36.35797882080078, "global_step": 84192, "epoch": 695} {"train_loss": -37.357608795166016, "global_step": 84193, "epoch": 695} {"train_loss": -37.51462936401367, "global_step": 84194, "epoch": 695} {"train_loss": -37.48202896118164, "global_step": 84195, "epoch": 695} {"train_loss": -36.35823059082031, "global_step": 84196, "epoch": 695} {"train_loss": -37.69698715209961, "global_step": 84197, "epoch": 695} {"train_loss": -36.96390914916992, "global_step": 84198, "epoch": 695} {"train_loss": -37.79829788208008, "global_step": 84199, "epoch": 695} {"train_loss": -37.291805267333984, "global_step": 84200, "epoch": 695} {"train_loss": -37.29888916015625, "global_step": 84201, "epoch": 695} {"train_loss": -37.41191482543945, "global_step": 84202, "epoch": 695} {"train_loss": -37.329566955566406, "global_step": 84203, "epoch": 695} {"train_loss": -37.64484786987305, "global_step": 84204, "epoch": 695} {"train_loss": -37.7235221862793, "global_step": 84205, "epoch": 695} {"train_loss": -37.26246643066406, "global_step": 84206, "epoch": 695} {"train_loss": -37.84083938598633, "global_step": 84207, "epoch": 695} {"train_loss": -37.74953079223633, "global_step": 84208, "epoch": 695} {"train_loss": -37.95246505737305, "global_step": 84209, "epoch": 695} {"train_loss": -37.60602569580078, "global_step": 84210, "epoch": 695} {"train_loss": -37.548179626464844, "global_step": 84211, "epoch": 695} {"train_loss": -37.7540397644043, "global_step": 84212, "epoch": 695} {"train_loss": -37.28712463378906, "global_step": 84213, "epoch": 695} {"train_loss": -37.73736572265625, "global_step": 84214, "epoch": 695} {"train_loss": -35.52208548636476, "global_step": 84215, "epoch": 695, "val_loss": 2716623.25} {"train_loss": -37.59406661987305, "global_step": 84216, "epoch": 696} {"train_loss": -37.38071823120117, "global_step": 84217, "epoch": 696} {"train_loss": -37.58854293823242, "global_step": 84218, "epoch": 696} {"train_loss": -37.11119079589844, "global_step": 84219, "epoch": 696} {"train_loss": -36.59899139404297, "global_step": 84220, "epoch": 696} {"train_loss": -37.580135345458984, "global_step": 84221, "epoch": 696} {"train_loss": -36.761138916015625, "global_step": 84222, "epoch": 696} {"train_loss": -36.67156219482422, "global_step": 84223, "epoch": 696} {"train_loss": -37.0432243347168, "global_step": 84224, "epoch": 696} {"train_loss": -36.32615280151367, "global_step": 84225, "epoch": 696} {"train_loss": -37.58579635620117, "global_step": 84226, "epoch": 696} {"train_loss": -36.209495544433594, "global_step": 84227, "epoch": 696} {"train_loss": -37.88349533081055, "global_step": 84228, "epoch": 696} {"train_loss": -36.878902435302734, "global_step": 84229, "epoch": 696} {"train_loss": -34.03744125366211, "global_step": 84230, "epoch": 696} {"train_loss": -37.3114128112793, "global_step": 84231, "epoch": 696} {"train_loss": -36.30500030517578, "global_step": 84232, "epoch": 696} {"train_loss": -37.01301193237305, "global_step": 84233, "epoch": 696} {"train_loss": -36.52886199951172, "global_step": 84234, "epoch": 696} {"train_loss": -36.23134994506836, "global_step": 84235, "epoch": 696} {"train_loss": -37.145931243896484, "global_step": 84236, "epoch": 696} {"train_loss": -35.327213287353516, "global_step": 84237, "epoch": 696} {"train_loss": -37.20751953125, "global_step": 84238, "epoch": 696} {"train_loss": -37.228816986083984, "global_step": 84239, "epoch": 696} {"train_loss": -35.88655471801758, "global_step": 84240, "epoch": 696} {"train_loss": -36.454132080078125, "global_step": 84241, "epoch": 696} {"train_loss": -33.73875045776367, "global_step": 84242, "epoch": 696} {"train_loss": -37.034297943115234, "global_step": 84243, "epoch": 696} {"train_loss": -35.64067077636719, "global_step": 84244, "epoch": 696} {"train_loss": -37.44778823852539, "global_step": 84245, "epoch": 696} {"train_loss": -36.115909576416016, "global_step": 84246, "epoch": 696} {"train_loss": -36.97445297241211, "global_step": 84247, "epoch": 696} {"train_loss": -36.12382125854492, "global_step": 84248, "epoch": 696} {"train_loss": -34.957733154296875, "global_step": 84249, "epoch": 696} {"train_loss": -36.65474319458008, "global_step": 84250, "epoch": 696} {"train_loss": -36.77326965332031, "global_step": 84251, "epoch": 696} {"train_loss": -33.92990493774414, "global_step": 84252, "epoch": 696} {"train_loss": -35.56513214111328, "global_step": 84253, "epoch": 696} {"train_loss": -35.821590423583984, "global_step": 84254, "epoch": 696} {"train_loss": -37.489437103271484, "global_step": 84255, "epoch": 696} {"train_loss": -35.90015411376953, "global_step": 84256, "epoch": 696} {"train_loss": -35.9195556640625, "global_step": 84257, "epoch": 696} {"train_loss": -36.560646057128906, "global_step": 84258, "epoch": 696} {"train_loss": -37.13125228881836, "global_step": 84259, "epoch": 696} {"train_loss": -36.75403594970703, "global_step": 84260, "epoch": 696} {"train_loss": -36.451412200927734, "global_step": 84261, "epoch": 696} {"train_loss": -35.51705551147461, "global_step": 84262, "epoch": 696} {"train_loss": -36.849273681640625, "global_step": 84263, "epoch": 696} {"train_loss": -35.351383209228516, "global_step": 84264, "epoch": 696} {"train_loss": -35.37590026855469, "global_step": 84265, "epoch": 696} {"train_loss": -36.1065788269043, "global_step": 84266, "epoch": 696} {"train_loss": -36.356746673583984, "global_step": 84267, "epoch": 696} {"train_loss": -36.18600845336914, "global_step": 84268, "epoch": 696} {"train_loss": -35.61623764038086, "global_step": 84269, "epoch": 696} {"train_loss": -34.856990814208984, "global_step": 84270, "epoch": 696} {"train_loss": -35.20005416870117, "global_step": 84271, "epoch": 696} {"train_loss": -35.2883186340332, "global_step": 84272, "epoch": 696} {"train_loss": -35.93288040161133, "global_step": 84273, "epoch": 696} {"train_loss": -36.26824188232422, "global_step": 84274, "epoch": 696} {"train_loss": -36.4847412109375, "global_step": 84275, "epoch": 696} {"train_loss": -36.94175720214844, "global_step": 84276, "epoch": 696} {"train_loss": -36.7612419128418, "global_step": 84277, "epoch": 696} {"train_loss": -36.805694580078125, "global_step": 84278, "epoch": 696} {"train_loss": -35.95740509033203, "global_step": 84279, "epoch": 696} {"train_loss": -36.74391555786133, "global_step": 84280, "epoch": 696} {"train_loss": -37.2587776184082, "global_step": 84281, "epoch": 696} {"train_loss": -36.613014221191406, "global_step": 84282, "epoch": 696} {"train_loss": -37.41740417480469, "global_step": 84283, "epoch": 696} {"train_loss": -36.873291015625, "global_step": 84284, "epoch": 696} {"train_loss": -36.57879638671875, "global_step": 84285, "epoch": 696} {"train_loss": -36.64241409301758, "global_step": 84286, "epoch": 696} {"train_loss": -37.102516174316406, "global_step": 84287, "epoch": 696} {"train_loss": -36.79927444458008, "global_step": 84288, "epoch": 696} {"train_loss": -36.6212272644043, "global_step": 84289, "epoch": 696} {"train_loss": -36.85087203979492, "global_step": 84290, "epoch": 696} {"train_loss": -37.36143493652344, "global_step": 84291, "epoch": 696} {"train_loss": -36.501914978027344, "global_step": 84292, "epoch": 696} {"train_loss": -37.41981887817383, "global_step": 84293, "epoch": 696} {"train_loss": -37.015167236328125, "global_step": 84294, "epoch": 696} {"train_loss": -37.42366027832031, "global_step": 84295, "epoch": 696} {"train_loss": -37.40970993041992, "global_step": 84296, "epoch": 696} {"train_loss": -36.739593505859375, "global_step": 84297, "epoch": 696} {"train_loss": -36.770843505859375, "global_step": 84298, "epoch": 696} {"train_loss": -37.53277587890625, "global_step": 84299, "epoch": 696} {"train_loss": -37.778682708740234, "global_step": 84300, "epoch": 696} {"train_loss": -37.6816291809082, "global_step": 84301, "epoch": 696} {"train_loss": -37.272560119628906, "global_step": 84302, "epoch": 696} {"train_loss": -37.63991165161133, "global_step": 84303, "epoch": 696} {"train_loss": -36.74851608276367, "global_step": 84304, "epoch": 696} {"train_loss": -37.6151237487793, "global_step": 84305, "epoch": 696} {"train_loss": -38.161991119384766, "global_step": 84306, "epoch": 696} {"train_loss": -36.780059814453125, "global_step": 84307, "epoch": 696} {"train_loss": -37.229183197021484, "global_step": 84308, "epoch": 696} {"train_loss": -37.840660095214844, "global_step": 84309, "epoch": 696} {"train_loss": -38.17426300048828, "global_step": 84310, "epoch": 696} {"train_loss": -37.26447677612305, "global_step": 84311, "epoch": 696} {"train_loss": -37.48057174682617, "global_step": 84312, "epoch": 696} {"train_loss": -38.06404495239258, "global_step": 84313, "epoch": 696} {"train_loss": -38.33527755737305, "global_step": 84314, "epoch": 696} {"train_loss": -37.46894454956055, "global_step": 84315, "epoch": 696} {"train_loss": -35.76862716674805, "global_step": 84316, "epoch": 696} {"train_loss": -35.872406005859375, "global_step": 84317, "epoch": 696} {"train_loss": -32.714942932128906, "global_step": 84318, "epoch": 696} {"train_loss": -28.613061904907227, "global_step": 84319, "epoch": 696} {"train_loss": -28.958784103393555, "global_step": 84320, "epoch": 696} {"train_loss": -34.611202239990234, "global_step": 84321, "epoch": 696} {"train_loss": -37.083553314208984, "global_step": 84322, "epoch": 696} {"train_loss": -35.68539047241211, "global_step": 84323, "epoch": 696} {"train_loss": -35.51250076293945, "global_step": 84324, "epoch": 696} {"train_loss": -37.640316009521484, "global_step": 84325, "epoch": 696} {"train_loss": -36.2059211730957, "global_step": 84326, "epoch": 696} {"train_loss": -36.39875411987305, "global_step": 84327, "epoch": 696} {"train_loss": -36.30277633666992, "global_step": 84328, "epoch": 696} {"train_loss": -35.66127395629883, "global_step": 84329, "epoch": 696} {"train_loss": -35.86311340332031, "global_step": 84330, "epoch": 696} {"train_loss": -35.61345291137695, "global_step": 84331, "epoch": 696} {"train_loss": -37.451820373535156, "global_step": 84332, "epoch": 696} {"train_loss": -36.904170989990234, "global_step": 84333, "epoch": 696} {"train_loss": -36.265052795410156, "global_step": 84334, "epoch": 696} {"train_loss": -36.54414749145508, "global_step": 84335, "epoch": 696} {"train_loss": -36.45379323407638, "global_step": 84336, "epoch": 696, "val_loss": 2673990.75} {"train_loss": -36.449546813964844, "global_step": 84337, "epoch": 697} {"train_loss": -37.58102035522461, "global_step": 84338, "epoch": 697} {"train_loss": -36.02742004394531, "global_step": 84339, "epoch": 697} {"train_loss": -37.108184814453125, "global_step": 84340, "epoch": 697} {"train_loss": -35.85825729370117, "global_step": 84341, "epoch": 697} {"train_loss": -35.0050048828125, "global_step": 84342, "epoch": 697} {"train_loss": -37.421791076660156, "global_step": 84343, "epoch": 697} {"train_loss": -35.47018051147461, "global_step": 84344, "epoch": 697} {"train_loss": -35.68743133544922, "global_step": 84345, "epoch": 697} {"train_loss": -35.957427978515625, "global_step": 84346, "epoch": 697} {"train_loss": -36.54120635986328, "global_step": 84347, "epoch": 697} {"train_loss": -37.3548583984375, "global_step": 84348, "epoch": 697} {"train_loss": -36.90459060668945, "global_step": 84349, "epoch": 697} {"train_loss": -36.13801956176758, "global_step": 84350, "epoch": 697} {"train_loss": -35.88742446899414, "global_step": 84351, "epoch": 697} {"train_loss": -37.008174896240234, "global_step": 84352, "epoch": 697} {"train_loss": -36.97743606567383, "global_step": 84353, "epoch": 697} {"train_loss": -35.45205307006836, "global_step": 84354, "epoch": 697} {"train_loss": -36.57047653198242, "global_step": 84355, "epoch": 697} {"train_loss": -36.73497009277344, "global_step": 84356, "epoch": 697} {"train_loss": -36.5690803527832, "global_step": 84357, "epoch": 697} {"train_loss": -36.24489212036133, "global_step": 84358, "epoch": 697} {"train_loss": -36.22176742553711, "global_step": 84359, "epoch": 697} {"train_loss": -36.591365814208984, "global_step": 84360, "epoch": 697} {"train_loss": -37.02045822143555, "global_step": 84361, "epoch": 697} {"train_loss": -35.791500091552734, "global_step": 84362, "epoch": 697} {"train_loss": -36.75695037841797, "global_step": 84363, "epoch": 697} {"train_loss": -36.88651657104492, "global_step": 84364, "epoch": 697} {"train_loss": -36.65611267089844, "global_step": 84365, "epoch": 697} {"train_loss": -37.10192108154297, "global_step": 84366, "epoch": 697} {"train_loss": -36.39054489135742, "global_step": 84367, "epoch": 697} {"train_loss": -36.49396896362305, "global_step": 84368, "epoch": 697} {"train_loss": -35.72755432128906, "global_step": 84369, "epoch": 697} {"train_loss": -36.98828125, "global_step": 84370, "epoch": 697} {"train_loss": -37.256221771240234, "global_step": 84371, "epoch": 697} {"train_loss": -37.28415298461914, "global_step": 84372, "epoch": 697} {"train_loss": -37.076934814453125, "global_step": 84373, "epoch": 697} {"train_loss": -37.21744918823242, "global_step": 84374, "epoch": 697} {"train_loss": -36.03316879272461, "global_step": 84375, "epoch": 697} {"train_loss": -36.02016067504883, "global_step": 84376, "epoch": 697} {"train_loss": -35.66478729248047, "global_step": 84377, "epoch": 697} {"train_loss": -36.98865509033203, "global_step": 84378, "epoch": 697} {"train_loss": -36.81371307373047, "global_step": 84379, "epoch": 697} {"train_loss": -36.3398551940918, "global_step": 84380, "epoch": 697} {"train_loss": -35.657554626464844, "global_step": 84381, "epoch": 697} {"train_loss": -36.11369323730469, "global_step": 84382, "epoch": 697} {"train_loss": -37.059608459472656, "global_step": 84383, "epoch": 697} {"train_loss": -36.79882049560547, "global_step": 84384, "epoch": 697} {"train_loss": -37.36806869506836, "global_step": 84385, "epoch": 697} {"train_loss": -37.401344299316406, "global_step": 84386, "epoch": 697} {"train_loss": -37.51375198364258, "global_step": 84387, "epoch": 697} {"train_loss": -36.765132904052734, "global_step": 84388, "epoch": 697} {"train_loss": -37.0844841003418, "global_step": 84389, "epoch": 697} {"train_loss": -37.05802536010742, "global_step": 84390, "epoch": 697} {"train_loss": -37.01700973510742, "global_step": 84391, "epoch": 697} {"train_loss": -36.737648010253906, "global_step": 84392, "epoch": 697} {"train_loss": -37.04909896850586, "global_step": 84393, "epoch": 697} {"train_loss": -37.6024169921875, "global_step": 84394, "epoch": 697} {"train_loss": -36.47389602661133, "global_step": 84395, "epoch": 697} {"train_loss": -36.889190673828125, "global_step": 84396, "epoch": 697} {"train_loss": -37.64418411254883, "global_step": 84397, "epoch": 697} {"train_loss": -37.6082649230957, "global_step": 84398, "epoch": 697} {"train_loss": -33.8855094909668, "global_step": 84399, "epoch": 697} {"train_loss": -36.53202438354492, "global_step": 84400, "epoch": 697} {"train_loss": -34.505653381347656, "global_step": 84401, "epoch": 697} {"train_loss": -36.3367919921875, "global_step": 84402, "epoch": 697} {"train_loss": -37.360408782958984, "global_step": 84403, "epoch": 697} {"train_loss": -35.829139709472656, "global_step": 84404, "epoch": 697} {"train_loss": -36.10280990600586, "global_step": 84405, "epoch": 697} {"train_loss": -37.16912841796875, "global_step": 84406, "epoch": 697} {"train_loss": -36.63225173950195, "global_step": 84407, "epoch": 697} {"train_loss": -36.08512496948242, "global_step": 84408, "epoch": 697} {"train_loss": -37.02376937866211, "global_step": 84409, "epoch": 697} {"train_loss": -37.094661712646484, "global_step": 84410, "epoch": 697} {"train_loss": -36.50142288208008, "global_step": 84411, "epoch": 697} {"train_loss": -37.09143829345703, "global_step": 84412, "epoch": 697} {"train_loss": -36.33839797973633, "global_step": 84413, "epoch": 697} {"train_loss": -36.74003219604492, "global_step": 84414, "epoch": 697} {"train_loss": -36.047481536865234, "global_step": 84415, "epoch": 697} {"train_loss": -37.198280334472656, "global_step": 84416, "epoch": 697} {"train_loss": -37.05984115600586, "global_step": 84417, "epoch": 697} {"train_loss": -36.92887496948242, "global_step": 84418, "epoch": 697} {"train_loss": -37.05766296386719, "global_step": 84419, "epoch": 697} {"train_loss": -36.492488861083984, "global_step": 84420, "epoch": 697} {"train_loss": -37.20499038696289, "global_step": 84421, "epoch": 697} {"train_loss": -36.0733528137207, "global_step": 84422, "epoch": 697} {"train_loss": -37.528194427490234, "global_step": 84423, "epoch": 697} {"train_loss": -36.7251091003418, "global_step": 84424, "epoch": 697} {"train_loss": -36.202327728271484, "global_step": 84425, "epoch": 697} {"train_loss": -37.75102996826172, "global_step": 84426, "epoch": 697} {"train_loss": -36.489356994628906, "global_step": 84427, "epoch": 697} {"train_loss": -36.777076721191406, "global_step": 84428, "epoch": 697} {"train_loss": -36.34373092651367, "global_step": 84429, "epoch": 697} {"train_loss": -36.948143005371094, "global_step": 84430, "epoch": 697} {"train_loss": -36.68147659301758, "global_step": 84431, "epoch": 697} {"train_loss": -37.2386589050293, "global_step": 84432, "epoch": 697} {"train_loss": -36.68684768676758, "global_step": 84433, "epoch": 697} {"train_loss": -37.309226989746094, "global_step": 84434, "epoch": 697} {"train_loss": -36.70820236206055, "global_step": 84435, "epoch": 697} {"train_loss": -36.33303451538086, "global_step": 84436, "epoch": 697} {"train_loss": -37.12491989135742, "global_step": 84437, "epoch": 697} {"train_loss": -36.7794189453125, "global_step": 84438, "epoch": 697} {"train_loss": -37.3819694519043, "global_step": 84439, "epoch": 697} {"train_loss": -36.4448356628418, "global_step": 84440, "epoch": 697} {"train_loss": -37.41264724731445, "global_step": 84441, "epoch": 697} {"train_loss": -35.70675277709961, "global_step": 84442, "epoch": 697} {"train_loss": -36.07606887817383, "global_step": 84443, "epoch": 697} {"train_loss": -36.22736740112305, "global_step": 84444, "epoch": 697} {"train_loss": -37.580055236816406, "global_step": 84445, "epoch": 697} {"train_loss": -35.53620529174805, "global_step": 84446, "epoch": 697} {"train_loss": -35.7902946472168, "global_step": 84447, "epoch": 697} {"train_loss": -36.692543029785156, "global_step": 84448, "epoch": 697} {"train_loss": -36.07838821411133, "global_step": 84449, "epoch": 697} {"train_loss": -36.915382385253906, "global_step": 84450, "epoch": 697} {"train_loss": -36.12473678588867, "global_step": 84451, "epoch": 697} {"train_loss": -35.8408088684082, "global_step": 84452, "epoch": 697} {"train_loss": -37.4681282043457, "global_step": 84453, "epoch": 697} {"train_loss": -37.06724166870117, "global_step": 84454, "epoch": 697} {"train_loss": -36.66884994506836, "global_step": 84455, "epoch": 697} {"train_loss": -37.13376998901367, "global_step": 84456, "epoch": 697} {"train_loss": -36.62865974489323, "global_step": 84457, "epoch": 697, "val_loss": 2675655.5} {"train_loss": -37.012725830078125, "global_step": 84458, "epoch": 698} {"train_loss": -37.19987869262695, "global_step": 84459, "epoch": 698} {"train_loss": -37.122859954833984, "global_step": 84460, "epoch": 698} {"train_loss": -37.01823043823242, "global_step": 84461, "epoch": 698} {"train_loss": -37.500213623046875, "global_step": 84462, "epoch": 698} {"train_loss": -37.25209045410156, "global_step": 84463, "epoch": 698} {"train_loss": -36.781795501708984, "global_step": 84464, "epoch": 698} {"train_loss": -37.5482177734375, "global_step": 84465, "epoch": 698} {"train_loss": -37.578033447265625, "global_step": 84466, "epoch": 698} {"train_loss": -37.27412033081055, "global_step": 84467, "epoch": 698} {"train_loss": -37.36598587036133, "global_step": 84468, "epoch": 698} {"train_loss": -37.34980010986328, "global_step": 84469, "epoch": 698} {"train_loss": -36.321372985839844, "global_step": 84470, "epoch": 698} {"train_loss": -37.40403747558594, "global_step": 84471, "epoch": 698} {"train_loss": -37.37653732299805, "global_step": 84472, "epoch": 698} {"train_loss": -37.305538177490234, "global_step": 84473, "epoch": 698} {"train_loss": -36.94733810424805, "global_step": 84474, "epoch": 698} {"train_loss": -37.231719970703125, "global_step": 84475, "epoch": 698} {"train_loss": -35.9294548034668, "global_step": 84476, "epoch": 698} {"train_loss": -36.8744010925293, "global_step": 84477, "epoch": 698} {"train_loss": -37.095924377441406, "global_step": 84478, "epoch": 698} {"train_loss": -36.80229949951172, "global_step": 84479, "epoch": 698} {"train_loss": -35.65761947631836, "global_step": 84480, "epoch": 698} {"train_loss": -37.72663879394531, "global_step": 84481, "epoch": 698} {"train_loss": -36.62567901611328, "global_step": 84482, "epoch": 698} {"train_loss": -36.923728942871094, "global_step": 84483, "epoch": 698} {"train_loss": -37.50568389892578, "global_step": 84484, "epoch": 698} {"train_loss": -36.63253402709961, "global_step": 84485, "epoch": 698} {"train_loss": -35.468536376953125, "global_step": 84486, "epoch": 698} {"train_loss": -36.91862869262695, "global_step": 84487, "epoch": 698} {"train_loss": -37.635616302490234, "global_step": 84488, "epoch": 698} {"train_loss": -37.020992279052734, "global_step": 84489, "epoch": 698} {"train_loss": -37.40255355834961, "global_step": 84490, "epoch": 698} {"train_loss": -37.4613037109375, "global_step": 84491, "epoch": 698} {"train_loss": -36.879737854003906, "global_step": 84492, "epoch": 698} {"train_loss": -37.10006332397461, "global_step": 84493, "epoch": 698} {"train_loss": -37.874610900878906, "global_step": 84494, "epoch": 698} {"train_loss": -37.79835510253906, "global_step": 84495, "epoch": 698} {"train_loss": -37.26847457885742, "global_step": 84496, "epoch": 698} {"train_loss": -36.59294509887695, "global_step": 84497, "epoch": 698} {"train_loss": -37.35017776489258, "global_step": 84498, "epoch": 698} {"train_loss": -37.195247650146484, "global_step": 84499, "epoch": 698} {"train_loss": -37.188716888427734, "global_step": 84500, "epoch": 698} {"train_loss": -37.648433685302734, "global_step": 84501, "epoch": 698} {"train_loss": -36.67715072631836, "global_step": 84502, "epoch": 698} {"train_loss": -37.54594802856445, "global_step": 84503, "epoch": 698} {"train_loss": -37.09757614135742, "global_step": 84504, "epoch": 698} {"train_loss": -37.01177215576172, "global_step": 84505, "epoch": 698} {"train_loss": -36.08317947387695, "global_step": 84506, "epoch": 698} {"train_loss": -35.91926574707031, "global_step": 84507, "epoch": 698} {"train_loss": -37.30177688598633, "global_step": 84508, "epoch": 698} {"train_loss": -37.86686325073242, "global_step": 84509, "epoch": 698} {"train_loss": -36.812496185302734, "global_step": 84510, "epoch": 698} {"train_loss": -37.24288558959961, "global_step": 84511, "epoch": 698} {"train_loss": -36.54305648803711, "global_step": 84512, "epoch": 698} {"train_loss": -35.96434020996094, "global_step": 84513, "epoch": 698} {"train_loss": -36.9726448059082, "global_step": 84514, "epoch": 698} {"train_loss": -36.8605842590332, "global_step": 84515, "epoch": 698} {"train_loss": -37.18488311767578, "global_step": 84516, "epoch": 698} {"train_loss": -36.57875442504883, "global_step": 84517, "epoch": 698} {"train_loss": -36.995792388916016, "global_step": 84518, "epoch": 698} {"train_loss": -37.23369216918945, "global_step": 84519, "epoch": 698} {"train_loss": -36.82758712768555, "global_step": 84520, "epoch": 698} {"train_loss": -36.9537467956543, "global_step": 84521, "epoch": 698} {"train_loss": -37.32332229614258, "global_step": 84522, "epoch": 698} {"train_loss": -37.29313278198242, "global_step": 84523, "epoch": 698} {"train_loss": -36.138702392578125, "global_step": 84524, "epoch": 698} {"train_loss": -36.93738555908203, "global_step": 84525, "epoch": 698} {"train_loss": -36.77126693725586, "global_step": 84526, "epoch": 698} {"train_loss": -34.91975784301758, "global_step": 84527, "epoch": 698} {"train_loss": -34.243038177490234, "global_step": 84528, "epoch": 698} {"train_loss": -33.46541213989258, "global_step": 84529, "epoch": 698} {"train_loss": -31.851303100585938, "global_step": 84530, "epoch": 698} {"train_loss": -31.396759033203125, "global_step": 84531, "epoch": 698} {"train_loss": -34.24374008178711, "global_step": 84532, "epoch": 698} {"train_loss": -35.359107971191406, "global_step": 84533, "epoch": 698} {"train_loss": -35.55121994018555, "global_step": 84534, "epoch": 698} {"train_loss": -34.58159637451172, "global_step": 84535, "epoch": 698} {"train_loss": -34.6967887878418, "global_step": 84536, "epoch": 698} {"train_loss": -37.47627258300781, "global_step": 84537, "epoch": 698} {"train_loss": -35.65119552612305, "global_step": 84538, "epoch": 698} {"train_loss": -36.28566360473633, "global_step": 84539, "epoch": 698} {"train_loss": -36.565128326416016, "global_step": 84540, "epoch": 698} {"train_loss": -36.321895599365234, "global_step": 84541, "epoch": 698} {"train_loss": -36.49269485473633, "global_step": 84542, "epoch": 698} {"train_loss": -36.59653854370117, "global_step": 84543, "epoch": 698} {"train_loss": -36.34458541870117, "global_step": 84544, "epoch": 698} {"train_loss": -37.74570083618164, "global_step": 84545, "epoch": 698} {"train_loss": -36.556053161621094, "global_step": 84546, "epoch": 698} {"train_loss": -37.52714920043945, "global_step": 84547, "epoch": 698} {"train_loss": -37.31721878051758, "global_step": 84548, "epoch": 698} {"train_loss": -36.38343048095703, "global_step": 84549, "epoch": 698} {"train_loss": -37.56716537475586, "global_step": 84550, "epoch": 698} {"train_loss": -37.03641891479492, "global_step": 84551, "epoch": 698} {"train_loss": -36.69059371948242, "global_step": 84552, "epoch": 698} {"train_loss": -37.726776123046875, "global_step": 84553, "epoch": 698} {"train_loss": -37.114845275878906, "global_step": 84554, "epoch": 698} {"train_loss": -37.2254753112793, "global_step": 84555, "epoch": 698} {"train_loss": -37.05251693725586, "global_step": 84556, "epoch": 698} {"train_loss": -37.876991271972656, "global_step": 84557, "epoch": 698} {"train_loss": -37.32100296020508, "global_step": 84558, "epoch": 698} {"train_loss": -37.98359298706055, "global_step": 84559, "epoch": 698} {"train_loss": -37.85927963256836, "global_step": 84560, "epoch": 698} {"train_loss": -37.80668258666992, "global_step": 84561, "epoch": 698} {"train_loss": -37.70002365112305, "global_step": 84562, "epoch": 698} {"train_loss": -37.46943283081055, "global_step": 84563, "epoch": 698} {"train_loss": -37.56256866455078, "global_step": 84564, "epoch": 698} {"train_loss": -37.29753875732422, "global_step": 84565, "epoch": 698} {"train_loss": -37.85696029663086, "global_step": 84566, "epoch": 698} {"train_loss": -36.92763137817383, "global_step": 84567, "epoch": 698} {"train_loss": -38.31315612792969, "global_step": 84568, "epoch": 698} {"train_loss": -37.71010971069336, "global_step": 84569, "epoch": 698} {"train_loss": -37.25664138793945, "global_step": 84570, "epoch": 698} {"train_loss": -38.21912384033203, "global_step": 84571, "epoch": 698} {"train_loss": -37.382896423339844, "global_step": 84572, "epoch": 698} {"train_loss": -37.60456085205078, "global_step": 84573, "epoch": 698} {"train_loss": -37.5139045715332, "global_step": 84574, "epoch": 698} {"train_loss": -38.098915100097656, "global_step": 84575, "epoch": 698} {"train_loss": -37.90170669555664, "global_step": 84576, "epoch": 698} {"train_loss": -37.7645149230957, "global_step": 84577, "epoch": 698} {"train_loss": -36.87749140715796, "global_step": 84578, "epoch": 698, "val_loss": 2637689.75} {"train_loss": -37.80819320678711, "global_step": 84579, "epoch": 699} {"train_loss": -36.56702423095703, "global_step": 84580, "epoch": 699} {"train_loss": -37.759498596191406, "global_step": 84581, "epoch": 699} {"train_loss": -37.0284423828125, "global_step": 84582, "epoch": 699} {"train_loss": -37.707515716552734, "global_step": 84583, "epoch": 699} {"train_loss": -37.85520553588867, "global_step": 84584, "epoch": 699} {"train_loss": -36.72616195678711, "global_step": 84585, "epoch": 699} {"train_loss": -37.433719635009766, "global_step": 84586, "epoch": 699} {"train_loss": -38.07481384277344, "global_step": 84587, "epoch": 699} {"train_loss": -37.975399017333984, "global_step": 84588, "epoch": 699} {"train_loss": -36.068931579589844, "global_step": 84589, "epoch": 699} {"train_loss": -37.247337341308594, "global_step": 84590, "epoch": 699} {"train_loss": -37.272926330566406, "global_step": 84591, "epoch": 699} {"train_loss": -37.46303939819336, "global_step": 84592, "epoch": 699} {"train_loss": -35.19403076171875, "global_step": 84593, "epoch": 699} {"train_loss": -35.73365020751953, "global_step": 84594, "epoch": 699} {"train_loss": -37.48333740234375, "global_step": 84595, "epoch": 699} {"train_loss": -36.59251403808594, "global_step": 84596, "epoch": 699} {"train_loss": -35.84368896484375, "global_step": 84597, "epoch": 699} {"train_loss": -36.2663688659668, "global_step": 84598, "epoch": 699} {"train_loss": -37.43107223510742, "global_step": 84599, "epoch": 699} {"train_loss": -36.41938400268555, "global_step": 84600, "epoch": 699} {"train_loss": -37.13237380981445, "global_step": 84601, "epoch": 699} {"train_loss": -36.81974411010742, "global_step": 84602, "epoch": 699} {"train_loss": -37.0256462097168, "global_step": 84603, "epoch": 699} {"train_loss": -37.08022689819336, "global_step": 84604, "epoch": 699} {"train_loss": -36.999488830566406, "global_step": 84605, "epoch": 699} {"train_loss": -37.684959411621094, "global_step": 84606, "epoch": 699} {"train_loss": -37.79217529296875, "global_step": 84607, "epoch": 699} {"train_loss": -37.47386932373047, "global_step": 84608, "epoch": 699} {"train_loss": -38.2139892578125, "global_step": 84609, "epoch": 699} {"train_loss": -37.63722610473633, "global_step": 84610, "epoch": 699} {"train_loss": -37.70858383178711, "global_step": 84611, "epoch": 699} {"train_loss": -38.051124572753906, "global_step": 84612, "epoch": 699} {"train_loss": -37.37627410888672, "global_step": 84613, "epoch": 699} {"train_loss": -38.17098617553711, "global_step": 84614, "epoch": 699} {"train_loss": -37.30131912231445, "global_step": 84615, "epoch": 699} {"train_loss": -37.14329147338867, "global_step": 84616, "epoch": 699} {"train_loss": -37.245052337646484, "global_step": 84617, "epoch": 699} {"train_loss": -37.7188606262207, "global_step": 84618, "epoch": 699} {"train_loss": -37.65053939819336, "global_step": 84619, "epoch": 699} {"train_loss": -37.48476791381836, "global_step": 84620, "epoch": 699} {"train_loss": -37.14352798461914, "global_step": 84621, "epoch": 699} {"train_loss": -38.008026123046875, "global_step": 84622, "epoch": 699} {"train_loss": -38.34035873413086, "global_step": 84623, "epoch": 699} {"train_loss": -38.20582580566406, "global_step": 84624, "epoch": 699} {"train_loss": -37.30971908569336, "global_step": 84625, "epoch": 699} {"train_loss": -36.295101165771484, "global_step": 84626, "epoch": 699} {"train_loss": -36.24937057495117, "global_step": 84627, "epoch": 699} {"train_loss": -36.61872482299805, "global_step": 84628, "epoch": 699} {"train_loss": -36.38875961303711, "global_step": 84629, "epoch": 699} {"train_loss": -38.47837448120117, "global_step": 84630, "epoch": 699} {"train_loss": -36.88887405395508, "global_step": 84631, "epoch": 699} {"train_loss": -34.648921966552734, "global_step": 84632, "epoch": 699} {"train_loss": -36.19990921020508, "global_step": 84633, "epoch": 699} {"train_loss": -36.97981643676758, "global_step": 84634, "epoch": 699} {"train_loss": -35.27009963989258, "global_step": 84635, "epoch": 699} {"train_loss": -36.79072952270508, "global_step": 84636, "epoch": 699} {"train_loss": -36.69913864135742, "global_step": 84637, "epoch": 699} {"train_loss": -36.095821380615234, "global_step": 84638, "epoch": 699} {"train_loss": -36.6395149230957, "global_step": 84639, "epoch": 699} {"train_loss": -36.71263122558594, "global_step": 84640, "epoch": 699} {"train_loss": -35.55241394042969, "global_step": 84641, "epoch": 699} {"train_loss": -35.90343475341797, "global_step": 84642, "epoch": 699} {"train_loss": -35.6067008972168, "global_step": 84643, "epoch": 699} {"train_loss": -34.8724365234375, "global_step": 84644, "epoch": 699} {"train_loss": -36.59870910644531, "global_step": 84645, "epoch": 699} {"train_loss": -35.54484176635742, "global_step": 84646, "epoch": 699} {"train_loss": -36.83347702026367, "global_step": 84647, "epoch": 699} {"train_loss": -35.54475784301758, "global_step": 84648, "epoch": 699} {"train_loss": -37.26517105102539, "global_step": 84649, "epoch": 699} {"train_loss": -37.215057373046875, "global_step": 84650, "epoch": 699} {"train_loss": -36.99320602416992, "global_step": 84651, "epoch": 699} {"train_loss": -38.09548568725586, "global_step": 84652, "epoch": 699} {"train_loss": -37.5612907409668, "global_step": 84653, "epoch": 699} {"train_loss": -38.10905838012695, "global_step": 84654, "epoch": 699} {"train_loss": -38.21037292480469, "global_step": 84655, "epoch": 699} {"train_loss": -37.41054916381836, "global_step": 84656, "epoch": 699} {"train_loss": -38.132057189941406, "global_step": 84657, "epoch": 699} {"train_loss": -37.97526168823242, "global_step": 84658, "epoch": 699} {"train_loss": -36.8404426574707, "global_step": 84659, "epoch": 699} {"train_loss": -37.99018096923828, "global_step": 84660, "epoch": 699} {"train_loss": -37.427894592285156, "global_step": 84661, "epoch": 699} {"train_loss": -37.627845764160156, "global_step": 84662, "epoch": 699} {"train_loss": -36.87247085571289, "global_step": 84663, "epoch": 699} {"train_loss": -36.65894317626953, "global_step": 84664, "epoch": 699} {"train_loss": -37.39896774291992, "global_step": 84665, "epoch": 699} {"train_loss": -37.44365310668945, "global_step": 84666, "epoch": 699} {"train_loss": -38.38101577758789, "global_step": 84667, "epoch": 699} {"train_loss": -37.37431716918945, "global_step": 84668, "epoch": 699} {"train_loss": -37.22995376586914, "global_step": 84669, "epoch": 699} {"train_loss": -37.81361770629883, "global_step": 84670, "epoch": 699} {"train_loss": -37.899044036865234, "global_step": 84671, "epoch": 699} {"train_loss": -37.27943801879883, "global_step": 84672, "epoch": 699} {"train_loss": -36.697139739990234, "global_step": 84673, "epoch": 699} {"train_loss": -37.93730163574219, "global_step": 84674, "epoch": 699} {"train_loss": -38.3093147277832, "global_step": 84675, "epoch": 699} {"train_loss": -38.0698356628418, "global_step": 84676, "epoch": 699} {"train_loss": -37.35834884643555, "global_step": 84677, "epoch": 699} {"train_loss": -35.81462478637695, "global_step": 84678, "epoch": 699} {"train_loss": -37.41019821166992, "global_step": 84679, "epoch": 699} {"train_loss": -37.24163818359375, "global_step": 84680, "epoch": 699} {"train_loss": -37.429969787597656, "global_step": 84681, "epoch": 699} {"train_loss": -37.053955078125, "global_step": 84682, "epoch": 699} {"train_loss": -36.816009521484375, "global_step": 84683, "epoch": 699} {"train_loss": -35.97488021850586, "global_step": 84684, "epoch": 699} {"train_loss": -35.25718688964844, "global_step": 84685, "epoch": 699} {"train_loss": -34.1245002746582, "global_step": 84686, "epoch": 699} {"train_loss": -36.645225524902344, "global_step": 84687, "epoch": 699} {"train_loss": -33.75654220581055, "global_step": 84688, "epoch": 699} {"train_loss": -35.097286224365234, "global_step": 84689, "epoch": 699} {"train_loss": -34.20184326171875, "global_step": 84690, "epoch": 699} {"train_loss": -36.25251770019531, "global_step": 84691, "epoch": 699} {"train_loss": -36.438411712646484, "global_step": 84692, "epoch": 699} {"train_loss": -34.23479080200195, "global_step": 84693, "epoch": 699} {"train_loss": -35.75430679321289, "global_step": 84694, "epoch": 699} {"train_loss": -35.858917236328125, "global_step": 84695, "epoch": 699} {"train_loss": -35.270511627197266, "global_step": 84696, "epoch": 699} {"train_loss": -35.164772033691406, "global_step": 84697, "epoch": 699} {"train_loss": -33.989742279052734, "global_step": 84698, "epoch": 699} {"train_loss": -36.85209179712721, "global_step": 84699, "epoch": 699, "val_loss": 2635170.0} {"train_loss": -34.24552536010742, "global_step": 84700, "epoch": 700} {"train_loss": -36.4780158996582, "global_step": 84701, "epoch": 700} {"train_loss": -36.04829025268555, "global_step": 84702, "epoch": 700} {"train_loss": -33.09143829345703, "global_step": 84703, "epoch": 700} {"train_loss": -35.433990478515625, "global_step": 84704, "epoch": 700} {"train_loss": -35.44385528564453, "global_step": 84705, "epoch": 700} {"train_loss": -35.17040252685547, "global_step": 84706, "epoch": 700} {"train_loss": -35.210060119628906, "global_step": 84707, "epoch": 700} {"train_loss": -35.87422180175781, "global_step": 84708, "epoch": 700} {"train_loss": -35.519493103027344, "global_step": 84709, "epoch": 700} {"train_loss": -35.64093780517578, "global_step": 84710, "epoch": 700} {"train_loss": -35.20964431762695, "global_step": 84711, "epoch": 700} {"train_loss": -35.7719841003418, "global_step": 84712, "epoch": 700} {"train_loss": -35.00102615356445, "global_step": 84713, "epoch": 700} {"train_loss": -34.888057708740234, "global_step": 84714, "epoch": 700} {"train_loss": -34.98040771484375, "global_step": 84715, "epoch": 700} {"train_loss": -35.699615478515625, "global_step": 84716, "epoch": 700} {"train_loss": -35.41130447387695, "global_step": 84717, "epoch": 700} {"train_loss": -36.44834518432617, "global_step": 84718, "epoch": 700} {"train_loss": -36.2092170715332, "global_step": 84719, "epoch": 700} {"train_loss": -36.190853118896484, "global_step": 84720, "epoch": 700} {"train_loss": -35.92984390258789, "global_step": 84721, "epoch": 700} {"train_loss": -36.67083740234375, "global_step": 84722, "epoch": 700} {"train_loss": -36.9664306640625, "global_step": 84723, "epoch": 700} {"train_loss": -37.07274627685547, "global_step": 84724, "epoch": 700} {"train_loss": -36.47107696533203, "global_step": 84725, "epoch": 700} {"train_loss": -36.5481071472168, "global_step": 84726, "epoch": 700} {"train_loss": -36.246795654296875, "global_step": 84727, "epoch": 700} {"train_loss": -36.73037338256836, "global_step": 84728, "epoch": 700} {"train_loss": -37.096588134765625, "global_step": 84729, "epoch": 700} {"train_loss": -36.99555587768555, "global_step": 84730, "epoch": 700} {"train_loss": -37.16088104248047, "global_step": 84731, "epoch": 700} {"train_loss": -36.62411117553711, "global_step": 84732, "epoch": 700} {"train_loss": -36.856502532958984, "global_step": 84733, "epoch": 700} {"train_loss": -36.912269592285156, "global_step": 84734, "epoch": 700} {"train_loss": -36.218666076660156, "global_step": 84735, "epoch": 700} {"train_loss": -37.3519287109375, "global_step": 84736, "epoch": 700} {"train_loss": -37.310489654541016, "global_step": 84737, "epoch": 700} {"train_loss": -37.31804656982422, "global_step": 84738, "epoch": 700} {"train_loss": -36.9206657409668, "global_step": 84739, "epoch": 700} {"train_loss": -37.446449279785156, "global_step": 84740, "epoch": 700} {"train_loss": -36.30588912963867, "global_step": 84741, "epoch": 700} {"train_loss": -37.56519317626953, "global_step": 84742, "epoch": 700} {"train_loss": -36.46714782714844, "global_step": 84743, "epoch": 700} {"train_loss": -38.10016632080078, "global_step": 84744, "epoch": 700} {"train_loss": -37.6771125793457, "global_step": 84745, "epoch": 700} {"train_loss": -37.56498336791992, "global_step": 84746, "epoch": 700} {"train_loss": -37.89907455444336, "global_step": 84747, "epoch": 700} {"train_loss": -35.31140899658203, "global_step": 84748, "epoch": 700} {"train_loss": -37.677284240722656, "global_step": 84749, "epoch": 700} {"train_loss": -37.51353073120117, "global_step": 84750, "epoch": 700} {"train_loss": -36.866905212402344, "global_step": 84751, "epoch": 700} {"train_loss": -37.2823486328125, "global_step": 84752, "epoch": 700} {"train_loss": -34.763851165771484, "global_step": 84753, "epoch": 700} {"train_loss": -37.107383728027344, "global_step": 84754, "epoch": 700} {"train_loss": -35.188751220703125, "global_step": 84755, "epoch": 700} {"train_loss": -36.42876434326172, "global_step": 84756, "epoch": 700} {"train_loss": -37.050716400146484, "global_step": 84757, "epoch": 700} {"train_loss": -34.525535583496094, "global_step": 84758, "epoch": 700} {"train_loss": -36.77077102661133, "global_step": 84759, "epoch": 700} {"train_loss": -37.44129180908203, "global_step": 84760, "epoch": 700} {"train_loss": -35.939369201660156, "global_step": 84761, "epoch": 700} {"train_loss": -37.252662658691406, "global_step": 84762, "epoch": 700} {"train_loss": -36.08271026611328, "global_step": 84763, "epoch": 700} {"train_loss": -37.78269577026367, "global_step": 84764, "epoch": 700} {"train_loss": -36.879119873046875, "global_step": 84765, "epoch": 700} {"train_loss": -37.31669998168945, "global_step": 84766, "epoch": 700} {"train_loss": -36.30630111694336, "global_step": 84767, "epoch": 700} {"train_loss": -37.24550247192383, "global_step": 84768, "epoch": 700} {"train_loss": -36.88485336303711, "global_step": 84769, "epoch": 700} {"train_loss": -37.48012924194336, "global_step": 84770, "epoch": 700} {"train_loss": -37.389190673828125, "global_step": 84771, "epoch": 700} {"train_loss": -37.39980697631836, "global_step": 84772, "epoch": 700} {"train_loss": -37.681209564208984, "global_step": 84773, "epoch": 700} {"train_loss": -37.223262786865234, "global_step": 84774, "epoch": 700} {"train_loss": -37.466094970703125, "global_step": 84775, "epoch": 700} {"train_loss": -37.51107406616211, "global_step": 84776, "epoch": 700} {"train_loss": -36.21847152709961, "global_step": 84777, "epoch": 700} {"train_loss": -37.60852813720703, "global_step": 84778, "epoch": 700} {"train_loss": -37.31605911254883, "global_step": 84779, "epoch": 700} {"train_loss": -37.68012619018555, "global_step": 84780, "epoch": 700} {"train_loss": -36.63822937011719, "global_step": 84781, "epoch": 700} {"train_loss": -37.06755447387695, "global_step": 84782, "epoch": 700} {"train_loss": -37.16908264160156, "global_step": 84783, "epoch": 700} {"train_loss": -37.0734977722168, "global_step": 84784, "epoch": 700} {"train_loss": -35.964698791503906, "global_step": 84785, "epoch": 700} {"train_loss": -37.42620086669922, "global_step": 84786, "epoch": 700} {"train_loss": -37.278316497802734, "global_step": 84787, "epoch": 700} {"train_loss": -37.846065521240234, "global_step": 84788, "epoch": 700} {"train_loss": -37.02790451049805, "global_step": 84789, "epoch": 700} {"train_loss": -35.47621154785156, "global_step": 84790, "epoch": 700} {"train_loss": -37.2382698059082, "global_step": 84791, "epoch": 700} {"train_loss": -35.90975570678711, "global_step": 84792, "epoch": 700} {"train_loss": -34.74493408203125, "global_step": 84793, "epoch": 700} {"train_loss": -36.72111511230469, "global_step": 84794, "epoch": 700} {"train_loss": -35.63193893432617, "global_step": 84795, "epoch": 700} {"train_loss": -33.73098373413086, "global_step": 84796, "epoch": 700} {"train_loss": -33.74764633178711, "global_step": 84797, "epoch": 700} {"train_loss": -31.7944278717041, "global_step": 84798, "epoch": 700} {"train_loss": -31.415014266967773, "global_step": 84799, "epoch": 700} {"train_loss": -36.85763931274414, "global_step": 84800, "epoch": 700} {"train_loss": -37.281700134277344, "global_step": 84801, "epoch": 700} {"train_loss": -35.844669342041016, "global_step": 84802, "epoch": 700} {"train_loss": -37.00992965698242, "global_step": 84803, "epoch": 700} {"train_loss": -36.140541076660156, "global_step": 84804, "epoch": 700} {"train_loss": -36.179176330566406, "global_step": 84805, "epoch": 700} {"train_loss": -37.293148040771484, "global_step": 84806, "epoch": 700} {"train_loss": -35.60945510864258, "global_step": 84807, "epoch": 700} {"train_loss": -36.439815521240234, "global_step": 84808, "epoch": 700} {"train_loss": -36.785884857177734, "global_step": 84809, "epoch": 700} {"train_loss": -36.616943359375, "global_step": 84810, "epoch": 700} {"train_loss": -37.229862213134766, "global_step": 84811, "epoch": 700} {"train_loss": -37.08221435546875, "global_step": 84812, "epoch": 700} {"train_loss": -37.004825592041016, "global_step": 84813, "epoch": 700} {"train_loss": -36.912200927734375, "global_step": 84814, "epoch": 700} {"train_loss": -37.12124252319336, "global_step": 84815, "epoch": 700} {"train_loss": -36.9742317199707, "global_step": 84816, "epoch": 700} {"train_loss": -37.40473556518555, "global_step": 84817, "epoch": 700} {"train_loss": -37.319068908691406, "global_step": 84818, "epoch": 700} {"train_loss": -37.452510833740234, "global_step": 84819, "epoch": 700} {"train_loss": -36.46632807707984, "global_step": 84820, "epoch": 700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2641864.75} {"train_loss": -37.513248443603516, "global_step": 84821, "epoch": 701} {"train_loss": -37.22475051879883, "global_step": 84822, "epoch": 701} {"train_loss": -37.63701629638672, "global_step": 84823, "epoch": 701} {"train_loss": -37.252132415771484, "global_step": 84824, "epoch": 701} {"train_loss": -37.30492401123047, "global_step": 84825, "epoch": 701} {"train_loss": -36.74462890625, "global_step": 84826, "epoch": 701} {"train_loss": -37.68913269042969, "global_step": 84827, "epoch": 701} {"train_loss": -36.94955062866211, "global_step": 84828, "epoch": 701} {"train_loss": -36.324623107910156, "global_step": 84829, "epoch": 701} {"train_loss": -36.93644332885742, "global_step": 84830, "epoch": 701} {"train_loss": -37.47463607788086, "global_step": 84831, "epoch": 701} {"train_loss": -37.23344802856445, "global_step": 84832, "epoch": 701} {"train_loss": -37.21042251586914, "global_step": 84833, "epoch": 701} {"train_loss": -37.092559814453125, "global_step": 84834, "epoch": 701} {"train_loss": -37.38064956665039, "global_step": 84835, "epoch": 701} {"train_loss": -37.16126251220703, "global_step": 84836, "epoch": 701} {"train_loss": -36.852447509765625, "global_step": 84837, "epoch": 701} {"train_loss": -37.85566711425781, "global_step": 84838, "epoch": 701} {"train_loss": -37.58039093017578, "global_step": 84839, "epoch": 701} {"train_loss": -37.423763275146484, "global_step": 84840, "epoch": 701} {"train_loss": -36.3940315246582, "global_step": 84841, "epoch": 701} {"train_loss": -36.5624885559082, "global_step": 84842, "epoch": 701} {"train_loss": -37.475257873535156, "global_step": 84843, "epoch": 701} {"train_loss": -34.90334701538086, "global_step": 84844, "epoch": 701} {"train_loss": -33.93116760253906, "global_step": 84845, "epoch": 701} {"train_loss": -36.385719299316406, "global_step": 84846, "epoch": 701} {"train_loss": -36.822750091552734, "global_step": 84847, "epoch": 701} {"train_loss": -36.19464111328125, "global_step": 84848, "epoch": 701} {"train_loss": -34.8440055847168, "global_step": 84849, "epoch": 701} {"train_loss": -37.367156982421875, "global_step": 84850, "epoch": 701} {"train_loss": -36.11334991455078, "global_step": 84851, "epoch": 701} {"train_loss": -33.163116455078125, "global_step": 84852, "epoch": 701} {"train_loss": -36.05939483642578, "global_step": 84853, "epoch": 701} {"train_loss": -36.83024978637695, "global_step": 84854, "epoch": 701} {"train_loss": -35.096214294433594, "global_step": 84855, "epoch": 701} {"train_loss": -34.11062240600586, "global_step": 84856, "epoch": 701} {"train_loss": -37.22932815551758, "global_step": 84857, "epoch": 701} {"train_loss": -35.79030227661133, "global_step": 84858, "epoch": 701} {"train_loss": -34.927303314208984, "global_step": 84859, "epoch": 701} {"train_loss": -34.72723388671875, "global_step": 84860, "epoch": 701} {"train_loss": -36.43513107299805, "global_step": 84861, "epoch": 701} {"train_loss": -35.99085235595703, "global_step": 84862, "epoch": 701} {"train_loss": -36.854736328125, "global_step": 84863, "epoch": 701} {"train_loss": -35.78448486328125, "global_step": 84864, "epoch": 701} {"train_loss": -36.868629455566406, "global_step": 84865, "epoch": 701} {"train_loss": -23.864686965942383, "global_step": 84866, "epoch": 701} {"train_loss": -34.42036056518555, "global_step": 84867, "epoch": 701} {"train_loss": -36.356571197509766, "global_step": 84868, "epoch": 701} {"train_loss": -30.31658363342285, "global_step": 84869, "epoch": 701} {"train_loss": -34.620399475097656, "global_step": 84870, "epoch": 701} {"train_loss": -35.657745361328125, "global_step": 84871, "epoch": 701} {"train_loss": -31.89607048034668, "global_step": 84872, "epoch": 701} {"train_loss": -33.15975570678711, "global_step": 84873, "epoch": 701} {"train_loss": -33.47649002075195, "global_step": 84874, "epoch": 701} {"train_loss": -33.819000244140625, "global_step": 84875, "epoch": 701} {"train_loss": -34.65300369262695, "global_step": 84876, "epoch": 701} {"train_loss": -29.264469146728516, "global_step": 84877, "epoch": 701} {"train_loss": -33.53318405151367, "global_step": 84878, "epoch": 701} {"train_loss": -33.57939529418945, "global_step": 84879, "epoch": 701} {"train_loss": -33.1922607421875, "global_step": 84880, "epoch": 701} {"train_loss": -34.1342658996582, "global_step": 84881, "epoch": 701} {"train_loss": -33.74550247192383, "global_step": 84882, "epoch": 701} {"train_loss": -32.18683624267578, "global_step": 84883, "epoch": 701} {"train_loss": -32.853092193603516, "global_step": 84884, "epoch": 701} {"train_loss": -34.303016662597656, "global_step": 84885, "epoch": 701} {"train_loss": -32.6662712097168, "global_step": 84886, "epoch": 701} {"train_loss": -33.828975677490234, "global_step": 84887, "epoch": 701} {"train_loss": -33.418968200683594, "global_step": 84888, "epoch": 701} {"train_loss": -34.567710876464844, "global_step": 84889, "epoch": 701} {"train_loss": -35.43852615356445, "global_step": 84890, "epoch": 701} {"train_loss": -35.19609451293945, "global_step": 84891, "epoch": 701} {"train_loss": -34.93972396850586, "global_step": 84892, "epoch": 701} {"train_loss": -34.937984466552734, "global_step": 84893, "epoch": 701} {"train_loss": -34.682220458984375, "global_step": 84894, "epoch": 701} {"train_loss": -34.85731506347656, "global_step": 84895, "epoch": 701} {"train_loss": -35.85334396362305, "global_step": 84896, "epoch": 701} {"train_loss": -35.574974060058594, "global_step": 84897, "epoch": 701} {"train_loss": -34.22180938720703, "global_step": 84898, "epoch": 701} {"train_loss": -35.60808563232422, "global_step": 84899, "epoch": 701} {"train_loss": -35.992191314697266, "global_step": 84900, "epoch": 701} {"train_loss": -35.91691207885742, "global_step": 84901, "epoch": 701} {"train_loss": -35.72248840332031, "global_step": 84902, "epoch": 701} {"train_loss": -35.91866683959961, "global_step": 84903, "epoch": 701} {"train_loss": -35.3125, "global_step": 84904, "epoch": 701} {"train_loss": -36.0139045715332, "global_step": 84905, "epoch": 701} {"train_loss": -36.2689323425293, "global_step": 84906, "epoch": 701} {"train_loss": -34.106483459472656, "global_step": 84907, "epoch": 701} {"train_loss": -35.625701904296875, "global_step": 84908, "epoch": 701} {"train_loss": -35.553550720214844, "global_step": 84909, "epoch": 701} {"train_loss": -35.73373031616211, "global_step": 84910, "epoch": 701} {"train_loss": -36.4884147644043, "global_step": 84911, "epoch": 701} {"train_loss": -35.92519760131836, "global_step": 84912, "epoch": 701} {"train_loss": -35.10807418823242, "global_step": 84913, "epoch": 701} {"train_loss": -35.28286361694336, "global_step": 84914, "epoch": 701} {"train_loss": -36.48370361328125, "global_step": 84915, "epoch": 701} {"train_loss": -36.42810821533203, "global_step": 84916, "epoch": 701} {"train_loss": -36.63472366333008, "global_step": 84917, "epoch": 701} {"train_loss": -36.14785385131836, "global_step": 84918, "epoch": 701} {"train_loss": -35.69690704345703, "global_step": 84919, "epoch": 701} {"train_loss": -36.4376106262207, "global_step": 84920, "epoch": 701} {"train_loss": -36.555328369140625, "global_step": 84921, "epoch": 701} {"train_loss": -36.523983001708984, "global_step": 84922, "epoch": 701} {"train_loss": -36.44477844238281, "global_step": 84923, "epoch": 701} {"train_loss": -36.9730339050293, "global_step": 84924, "epoch": 701} {"train_loss": -36.85518264770508, "global_step": 84925, "epoch": 701} {"train_loss": -37.0360107421875, "global_step": 84926, "epoch": 701} {"train_loss": -36.92314147949219, "global_step": 84927, "epoch": 701} {"train_loss": -37.03038024902344, "global_step": 84928, "epoch": 701} {"train_loss": -36.816139221191406, "global_step": 84929, "epoch": 701} {"train_loss": -36.58269119262695, "global_step": 84930, "epoch": 701} {"train_loss": -36.953495025634766, "global_step": 84931, "epoch": 701} {"train_loss": -36.51217269897461, "global_step": 84932, "epoch": 701} {"train_loss": -36.92881393432617, "global_step": 84933, "epoch": 701} {"train_loss": -37.52973556518555, "global_step": 84934, "epoch": 701} {"train_loss": -37.21039962768555, "global_step": 84935, "epoch": 701} {"train_loss": -37.319549560546875, "global_step": 84936, "epoch": 701} {"train_loss": -36.9089241027832, "global_step": 84937, "epoch": 701} {"train_loss": -37.33631134033203, "global_step": 84938, "epoch": 701} {"train_loss": -36.86185836791992, "global_step": 84939, "epoch": 701} {"train_loss": -37.15924072265625, "global_step": 84940, "epoch": 701} {"train_loss": -35.66225888906432, "global_step": 84941, "epoch": 701, "val_loss": 2656618.0} {"train_loss": -37.338584899902344, "global_step": 84942, "epoch": 702} {"train_loss": -37.87079620361328, "global_step": 84943, "epoch": 702} {"train_loss": -37.40156555175781, "global_step": 84944, "epoch": 702} {"train_loss": -37.36018371582031, "global_step": 84945, "epoch": 702} {"train_loss": -37.57938003540039, "global_step": 84946, "epoch": 702} {"train_loss": -37.83400344848633, "global_step": 84947, "epoch": 702} {"train_loss": -38.069671630859375, "global_step": 84948, "epoch": 702} {"train_loss": -37.8784294128418, "global_step": 84949, "epoch": 702} {"train_loss": -37.568511962890625, "global_step": 84950, "epoch": 702} {"train_loss": -37.18441390991211, "global_step": 84951, "epoch": 702} {"train_loss": -37.62529754638672, "global_step": 84952, "epoch": 702} {"train_loss": -37.87912368774414, "global_step": 84953, "epoch": 702} {"train_loss": -38.07197570800781, "global_step": 84954, "epoch": 702} {"train_loss": -37.99562072753906, "global_step": 84955, "epoch": 702} {"train_loss": -37.265716552734375, "global_step": 84956, "epoch": 702} {"train_loss": -37.85201644897461, "global_step": 84957, "epoch": 702} {"train_loss": -37.957435607910156, "global_step": 84958, "epoch": 702} {"train_loss": -37.714229583740234, "global_step": 84959, "epoch": 702} {"train_loss": -37.966041564941406, "global_step": 84960, "epoch": 702} {"train_loss": -37.419166564941406, "global_step": 84961, "epoch": 702} {"train_loss": -37.503658294677734, "global_step": 84962, "epoch": 702} {"train_loss": -36.51710891723633, "global_step": 84963, "epoch": 702} {"train_loss": -35.75322341918945, "global_step": 84964, "epoch": 702} {"train_loss": -35.57190704345703, "global_step": 84965, "epoch": 702} {"train_loss": -35.293304443359375, "global_step": 84966, "epoch": 702} {"train_loss": -34.0975341796875, "global_step": 84967, "epoch": 702} {"train_loss": -36.45991134643555, "global_step": 84968, "epoch": 702} {"train_loss": -36.18747329711914, "global_step": 84969, "epoch": 702} {"train_loss": -33.99235534667969, "global_step": 84970, "epoch": 702} {"train_loss": -34.23967361450195, "global_step": 84971, "epoch": 702} {"train_loss": -31.829614639282227, "global_step": 84972, "epoch": 702} {"train_loss": -26.764551162719727, "global_step": 84973, "epoch": 702} {"train_loss": -22.748281478881836, "global_step": 84974, "epoch": 702} {"train_loss": -31.1318359375, "global_step": 84975, "epoch": 702} {"train_loss": -30.90109634399414, "global_step": 84976, "epoch": 702} {"train_loss": -28.569671630859375, "global_step": 84977, "epoch": 702} {"train_loss": -33.13212203979492, "global_step": 84978, "epoch": 702} {"train_loss": -32.68851852416992, "global_step": 84979, "epoch": 702} {"train_loss": -34.3766975402832, "global_step": 84980, "epoch": 702} {"train_loss": -32.30341720581055, "global_step": 84981, "epoch": 702} {"train_loss": -34.03943634033203, "global_step": 84982, "epoch": 702} {"train_loss": -34.90327072143555, "global_step": 84983, "epoch": 702} {"train_loss": -33.08545684814453, "global_step": 84984, "epoch": 702} {"train_loss": -35.037330627441406, "global_step": 84985, "epoch": 702} {"train_loss": -35.31821060180664, "global_step": 84986, "epoch": 702} {"train_loss": -35.96462631225586, "global_step": 84987, "epoch": 702} {"train_loss": -35.52079772949219, "global_step": 84988, "epoch": 702} {"train_loss": -35.9102668762207, "global_step": 84989, "epoch": 702} {"train_loss": -37.08083724975586, "global_step": 84990, "epoch": 702} {"train_loss": -36.551300048828125, "global_step": 84991, "epoch": 702} {"train_loss": -35.495052337646484, "global_step": 84992, "epoch": 702} {"train_loss": -36.92643356323242, "global_step": 84993, "epoch": 702} {"train_loss": -37.0816650390625, "global_step": 84994, "epoch": 702} {"train_loss": -37.05753707885742, "global_step": 84995, "epoch": 702} {"train_loss": -36.49776840209961, "global_step": 84996, "epoch": 702} {"train_loss": -36.407161712646484, "global_step": 84997, "epoch": 702} {"train_loss": -37.14693832397461, "global_step": 84998, "epoch": 702} {"train_loss": -37.19517135620117, "global_step": 84999, "epoch": 702} {"train_loss": -37.210018157958984, "global_step": 85000, "epoch": 702} {"train_loss": -37.50046920776367, "global_step": 85001, "epoch": 702} {"train_loss": -37.61391830444336, "global_step": 85002, "epoch": 702} {"train_loss": -37.257686614990234, "global_step": 85003, "epoch": 702} {"train_loss": -37.02315139770508, "global_step": 85004, "epoch": 702} {"train_loss": -37.208011627197266, "global_step": 85005, "epoch": 702} {"train_loss": -37.50585174560547, "global_step": 85006, "epoch": 702} {"train_loss": -37.490028381347656, "global_step": 85007, "epoch": 702} {"train_loss": -37.82819366455078, "global_step": 85008, "epoch": 702} {"train_loss": -37.21006393432617, "global_step": 85009, "epoch": 702} {"train_loss": -38.03763961791992, "global_step": 85010, "epoch": 702} {"train_loss": -37.608150482177734, "global_step": 85011, "epoch": 702} {"train_loss": -37.38530731201172, "global_step": 85012, "epoch": 702} {"train_loss": -37.79602813720703, "global_step": 85013, "epoch": 702} {"train_loss": -37.817440032958984, "global_step": 85014, "epoch": 702} {"train_loss": -38.070465087890625, "global_step": 85015, "epoch": 702} {"train_loss": -38.321044921875, "global_step": 85016, "epoch": 702} {"train_loss": -38.18961715698242, "global_step": 85017, "epoch": 702} {"train_loss": -37.33063888549805, "global_step": 85018, "epoch": 702} {"train_loss": -37.54559326171875, "global_step": 85019, "epoch": 702} {"train_loss": -38.026885986328125, "global_step": 85020, "epoch": 702} {"train_loss": -38.10268020629883, "global_step": 85021, "epoch": 702} {"train_loss": -37.43363571166992, "global_step": 85022, "epoch": 702} {"train_loss": -38.097347259521484, "global_step": 85023, "epoch": 702} {"train_loss": -37.84951400756836, "global_step": 85024, "epoch": 702} {"train_loss": -38.181453704833984, "global_step": 85025, "epoch": 702} {"train_loss": -37.15896224975586, "global_step": 85026, "epoch": 702} {"train_loss": -37.415279388427734, "global_step": 85027, "epoch": 702} {"train_loss": -38.228755950927734, "global_step": 85028, "epoch": 702} {"train_loss": -37.71533966064453, "global_step": 85029, "epoch": 702} {"train_loss": -36.950679779052734, "global_step": 85030, "epoch": 702} {"train_loss": -37.618690490722656, "global_step": 85031, "epoch": 702} {"train_loss": -38.037471771240234, "global_step": 85032, "epoch": 702} {"train_loss": -37.92837142944336, "global_step": 85033, "epoch": 702} {"train_loss": -37.296417236328125, "global_step": 85034, "epoch": 702} {"train_loss": -36.96579360961914, "global_step": 85035, "epoch": 702} {"train_loss": -37.703399658203125, "global_step": 85036, "epoch": 702} {"train_loss": -38.28214645385742, "global_step": 85037, "epoch": 702} {"train_loss": -37.65627670288086, "global_step": 85038, "epoch": 702} {"train_loss": -36.99997329711914, "global_step": 85039, "epoch": 702} {"train_loss": -36.67539596557617, "global_step": 85040, "epoch": 702} {"train_loss": -37.42619705200195, "global_step": 85041, "epoch": 702} {"train_loss": -37.367530822753906, "global_step": 85042, "epoch": 702} {"train_loss": -36.98214340209961, "global_step": 85043, "epoch": 702} {"train_loss": -36.76321792602539, "global_step": 85044, "epoch": 702} {"train_loss": -36.17732620239258, "global_step": 85045, "epoch": 702} {"train_loss": -31.4069881439209, "global_step": 85046, "epoch": 702} {"train_loss": -16.534921646118164, "global_step": 85047, "epoch": 702} {"train_loss": -8.927977561950684, "global_step": 85048, "epoch": 702} {"train_loss": -28.01454734802246, "global_step": 85049, "epoch": 702} {"train_loss": -33.87522506713867, "global_step": 85050, "epoch": 702} {"train_loss": -22.68474006652832, "global_step": 85051, "epoch": 702} {"train_loss": -36.572505950927734, "global_step": 85052, "epoch": 702} {"train_loss": -26.574670791625977, "global_step": 85053, "epoch": 702} {"train_loss": -36.73627471923828, "global_step": 85054, "epoch": 702} {"train_loss": -29.671106338500977, "global_step": 85055, "epoch": 702} {"train_loss": -36.52755355834961, "global_step": 85056, "epoch": 702} {"train_loss": -33.078636169433594, "global_step": 85057, "epoch": 702} {"train_loss": -35.000247955322266, "global_step": 85058, "epoch": 702} {"train_loss": -35.62993240356445, "global_step": 85059, "epoch": 702} {"train_loss": -34.54970169067383, "global_step": 85060, "epoch": 702} {"train_loss": -35.45554733276367, "global_step": 85061, "epoch": 702} {"train_loss": -35.58688910145405, "global_step": 85062, "epoch": 702, "val_loss": 2587127.25} {"train_loss": -35.03009796142578, "global_step": 85063, "epoch": 703} {"train_loss": -36.62411117553711, "global_step": 85064, "epoch": 703} {"train_loss": -36.45227813720703, "global_step": 85065, "epoch": 703} {"train_loss": -36.048011779785156, "global_step": 85066, "epoch": 703} {"train_loss": -36.50443649291992, "global_step": 85067, "epoch": 703} {"train_loss": -36.675384521484375, "global_step": 85068, "epoch": 703} {"train_loss": -36.17205810546875, "global_step": 85069, "epoch": 703} {"train_loss": -36.5783576965332, "global_step": 85070, "epoch": 703} {"train_loss": -36.68706130981445, "global_step": 85071, "epoch": 703} {"train_loss": -36.988162994384766, "global_step": 85072, "epoch": 703} {"train_loss": -36.86488723754883, "global_step": 85073, "epoch": 703} {"train_loss": -36.44027328491211, "global_step": 85074, "epoch": 703} {"train_loss": -36.85076904296875, "global_step": 85075, "epoch": 703} {"train_loss": -37.23030471801758, "global_step": 85076, "epoch": 703} {"train_loss": -36.02288818359375, "global_step": 85077, "epoch": 703} {"train_loss": -36.589454650878906, "global_step": 85078, "epoch": 703} {"train_loss": -37.21018600463867, "global_step": 85079, "epoch": 703} {"train_loss": -37.42432403564453, "global_step": 85080, "epoch": 703} {"train_loss": -37.21769332885742, "global_step": 85081, "epoch": 703} {"train_loss": -36.9879150390625, "global_step": 85082, "epoch": 703} {"train_loss": -37.23696517944336, "global_step": 85083, "epoch": 703} {"train_loss": -37.01253890991211, "global_step": 85084, "epoch": 703} {"train_loss": -35.93284225463867, "global_step": 85085, "epoch": 703} {"train_loss": -37.23019027709961, "global_step": 85086, "epoch": 703} {"train_loss": -37.46729278564453, "global_step": 85087, "epoch": 703} {"train_loss": -37.39811325073242, "global_step": 85088, "epoch": 703} {"train_loss": -36.92792892456055, "global_step": 85089, "epoch": 703} {"train_loss": -37.681358337402344, "global_step": 85090, "epoch": 703} {"train_loss": -37.726905822753906, "global_step": 85091, "epoch": 703} {"train_loss": -34.83816146850586, "global_step": 85092, "epoch": 703} {"train_loss": -38.0272331237793, "global_step": 85093, "epoch": 703} {"train_loss": -37.27082061767578, "global_step": 85094, "epoch": 703} {"train_loss": -35.7269172668457, "global_step": 85095, "epoch": 703} {"train_loss": -37.5175895690918, "global_step": 85096, "epoch": 703} {"train_loss": -37.905025482177734, "global_step": 85097, "epoch": 703} {"train_loss": -37.66004943847656, "global_step": 85098, "epoch": 703} {"train_loss": -35.31624984741211, "global_step": 85099, "epoch": 703} {"train_loss": -37.57698440551758, "global_step": 85100, "epoch": 703} {"train_loss": -37.3881950378418, "global_step": 85101, "epoch": 703} {"train_loss": -37.721553802490234, "global_step": 85102, "epoch": 703} {"train_loss": -38.068153381347656, "global_step": 85103, "epoch": 703} {"train_loss": -37.90181350708008, "global_step": 85104, "epoch": 703} {"train_loss": -38.016170501708984, "global_step": 85105, "epoch": 703} {"train_loss": -37.642879486083984, "global_step": 85106, "epoch": 703} {"train_loss": -37.91453552246094, "global_step": 85107, "epoch": 703} {"train_loss": -37.74787521362305, "global_step": 85108, "epoch": 703} {"train_loss": -38.25239944458008, "global_step": 85109, "epoch": 703} {"train_loss": -36.04685592651367, "global_step": 85110, "epoch": 703} {"train_loss": -37.946022033691406, "global_step": 85111, "epoch": 703} {"train_loss": -37.91849899291992, "global_step": 85112, "epoch": 703} {"train_loss": -37.9111213684082, "global_step": 85113, "epoch": 703} {"train_loss": -35.60676574707031, "global_step": 85114, "epoch": 703} {"train_loss": -36.46608352661133, "global_step": 85115, "epoch": 703} {"train_loss": -33.45867156982422, "global_step": 85116, "epoch": 703} {"train_loss": -36.43903732299805, "global_step": 85117, "epoch": 703} {"train_loss": -37.13138961791992, "global_step": 85118, "epoch": 703} {"train_loss": -36.67195510864258, "global_step": 85119, "epoch": 703} {"train_loss": -37.27054977416992, "global_step": 85120, "epoch": 703} {"train_loss": -33.86845779418945, "global_step": 85121, "epoch": 703} {"train_loss": -37.061187744140625, "global_step": 85122, "epoch": 703} {"train_loss": -37.26392364501953, "global_step": 85123, "epoch": 703} {"train_loss": -37.44828414916992, "global_step": 85124, "epoch": 703} {"train_loss": -36.731903076171875, "global_step": 85125, "epoch": 703} {"train_loss": -37.13459396362305, "global_step": 85126, "epoch": 703} {"train_loss": -35.80867004394531, "global_step": 85127, "epoch": 703} {"train_loss": -36.006317138671875, "global_step": 85128, "epoch": 703} {"train_loss": -35.70833969116211, "global_step": 85129, "epoch": 703} {"train_loss": -37.045570373535156, "global_step": 85130, "epoch": 703} {"train_loss": -35.99348068237305, "global_step": 85131, "epoch": 703} {"train_loss": -36.69187927246094, "global_step": 85132, "epoch": 703} {"train_loss": -36.30970001220703, "global_step": 85133, "epoch": 703} {"train_loss": -34.904510498046875, "global_step": 85134, "epoch": 703} {"train_loss": -35.868465423583984, "global_step": 85135, "epoch": 703} {"train_loss": -33.922828674316406, "global_step": 85136, "epoch": 703} {"train_loss": -35.5149040222168, "global_step": 85137, "epoch": 703} {"train_loss": -36.82244110107422, "global_step": 85138, "epoch": 703} {"train_loss": -35.860652923583984, "global_step": 85139, "epoch": 703} {"train_loss": -35.293739318847656, "global_step": 85140, "epoch": 703} {"train_loss": -35.914390563964844, "global_step": 85141, "epoch": 703} {"train_loss": -34.031551361083984, "global_step": 85142, "epoch": 703} {"train_loss": -36.296260833740234, "global_step": 85143, "epoch": 703} {"train_loss": -34.582889556884766, "global_step": 85144, "epoch": 703} {"train_loss": -35.42916488647461, "global_step": 85145, "epoch": 703} {"train_loss": -36.10441207885742, "global_step": 85146, "epoch": 703} {"train_loss": -35.98963165283203, "global_step": 85147, "epoch": 703} {"train_loss": -37.130619049072266, "global_step": 85148, "epoch": 703} {"train_loss": -36.73609924316406, "global_step": 85149, "epoch": 703} {"train_loss": -34.998905181884766, "global_step": 85150, "epoch": 703} {"train_loss": -35.025390625, "global_step": 85151, "epoch": 703} {"train_loss": -36.81342697143555, "global_step": 85152, "epoch": 703} {"train_loss": -36.18312454223633, "global_step": 85153, "epoch": 703} {"train_loss": -37.37149429321289, "global_step": 85154, "epoch": 703} {"train_loss": -35.28644561767578, "global_step": 85155, "epoch": 703} {"train_loss": -37.49406433105469, "global_step": 85156, "epoch": 703} {"train_loss": -36.33125686645508, "global_step": 85157, "epoch": 703} {"train_loss": -36.63340377807617, "global_step": 85158, "epoch": 703} {"train_loss": -37.13789749145508, "global_step": 85159, "epoch": 703} {"train_loss": -36.42749786376953, "global_step": 85160, "epoch": 703} {"train_loss": -37.046199798583984, "global_step": 85161, "epoch": 703} {"train_loss": -37.4115104675293, "global_step": 85162, "epoch": 703} {"train_loss": -37.589080810546875, "global_step": 85163, "epoch": 703} {"train_loss": -36.81322479248047, "global_step": 85164, "epoch": 703} {"train_loss": -37.070465087890625, "global_step": 85165, "epoch": 703} {"train_loss": -37.06992721557617, "global_step": 85166, "epoch": 703} {"train_loss": -37.324485778808594, "global_step": 85167, "epoch": 703} {"train_loss": -37.4149169921875, "global_step": 85168, "epoch": 703} {"train_loss": -37.17393493652344, "global_step": 85169, "epoch": 703} {"train_loss": -37.43351745605469, "global_step": 85170, "epoch": 703} {"train_loss": -37.619667053222656, "global_step": 85171, "epoch": 703} {"train_loss": -37.5787239074707, "global_step": 85172, "epoch": 703} {"train_loss": -37.97224807739258, "global_step": 85173, "epoch": 703} {"train_loss": -38.0330810546875, "global_step": 85174, "epoch": 703} {"train_loss": -37.508548736572266, "global_step": 85175, "epoch": 703} {"train_loss": -37.205692291259766, "global_step": 85176, "epoch": 703} {"train_loss": -37.791664123535156, "global_step": 85177, "epoch": 703} {"train_loss": -37.37856674194336, "global_step": 85178, "epoch": 703} {"train_loss": -37.214744567871094, "global_step": 85179, "epoch": 703} {"train_loss": -37.9794807434082, "global_step": 85180, "epoch": 703} {"train_loss": -37.404327392578125, "global_step": 85181, "epoch": 703} {"train_loss": -37.53325271606445, "global_step": 85182, "epoch": 703} {"train_loss": -36.748717126767495, "global_step": 85183, "epoch": 703, "val_loss": 2624743.75} {"train_loss": -37.77733612060547, "global_step": 85184, "epoch": 704} {"train_loss": -38.235469818115234, "global_step": 85185, "epoch": 704} {"train_loss": -37.70283126831055, "global_step": 85186, "epoch": 704} {"train_loss": -37.73077392578125, "global_step": 85187, "epoch": 704} {"train_loss": -37.28640365600586, "global_step": 85188, "epoch": 704} {"train_loss": -37.42554473876953, "global_step": 85189, "epoch": 704} {"train_loss": -37.7763786315918, "global_step": 85190, "epoch": 704} {"train_loss": -37.31792068481445, "global_step": 85191, "epoch": 704} {"train_loss": -37.44194030761719, "global_step": 85192, "epoch": 704} {"train_loss": -37.41622543334961, "global_step": 85193, "epoch": 704} {"train_loss": -37.45630645751953, "global_step": 85194, "epoch": 704} {"train_loss": -37.34698486328125, "global_step": 85195, "epoch": 704} {"train_loss": -37.8441047668457, "global_step": 85196, "epoch": 704} {"train_loss": -37.213661193847656, "global_step": 85197, "epoch": 704} {"train_loss": -37.412086486816406, "global_step": 85198, "epoch": 704} {"train_loss": -37.196590423583984, "global_step": 85199, "epoch": 704} {"train_loss": -37.47502517700195, "global_step": 85200, "epoch": 704} {"train_loss": -37.52961349487305, "global_step": 85201, "epoch": 704} {"train_loss": -37.90067672729492, "global_step": 85202, "epoch": 704} {"train_loss": -36.968421936035156, "global_step": 85203, "epoch": 704} {"train_loss": -36.90516662597656, "global_step": 85204, "epoch": 704} {"train_loss": -37.478248596191406, "global_step": 85205, "epoch": 704} {"train_loss": -37.36903762817383, "global_step": 85206, "epoch": 704} {"train_loss": -37.38804244995117, "global_step": 85207, "epoch": 704} {"train_loss": -36.37990188598633, "global_step": 85208, "epoch": 704} {"train_loss": -37.15793991088867, "global_step": 85209, "epoch": 704} {"train_loss": -35.89439010620117, "global_step": 85210, "epoch": 704} {"train_loss": -37.10883712768555, "global_step": 85211, "epoch": 704} {"train_loss": -36.6772575378418, "global_step": 85212, "epoch": 704} {"train_loss": -34.6845703125, "global_step": 85213, "epoch": 704} {"train_loss": -34.133056640625, "global_step": 85214, "epoch": 704} {"train_loss": -37.407188415527344, "global_step": 85215, "epoch": 704} {"train_loss": -37.50868225097656, "global_step": 85216, "epoch": 704} {"train_loss": -36.36622619628906, "global_step": 85217, "epoch": 704} {"train_loss": -36.75962448120117, "global_step": 85218, "epoch": 704} {"train_loss": -37.17726516723633, "global_step": 85219, "epoch": 704} {"train_loss": -37.28938674926758, "global_step": 85220, "epoch": 704} {"train_loss": -36.10897445678711, "global_step": 85221, "epoch": 704} {"train_loss": -37.309051513671875, "global_step": 85222, "epoch": 704} {"train_loss": -37.4432258605957, "global_step": 85223, "epoch": 704} {"train_loss": -37.48278045654297, "global_step": 85224, "epoch": 704} {"train_loss": -37.650691986083984, "global_step": 85225, "epoch": 704} {"train_loss": -37.22279739379883, "global_step": 85226, "epoch": 704} {"train_loss": -35.45417404174805, "global_step": 85227, "epoch": 704} {"train_loss": -36.28125762939453, "global_step": 85228, "epoch": 704} {"train_loss": -37.34676742553711, "global_step": 85229, "epoch": 704} {"train_loss": -38.064781188964844, "global_step": 85230, "epoch": 704} {"train_loss": -37.341896057128906, "global_step": 85231, "epoch": 704} {"train_loss": -37.32522201538086, "global_step": 85232, "epoch": 704} {"train_loss": -37.20857238769531, "global_step": 85233, "epoch": 704} {"train_loss": -37.414485931396484, "global_step": 85234, "epoch": 704} {"train_loss": -36.94368362426758, "global_step": 85235, "epoch": 704} {"train_loss": -37.58243942260742, "global_step": 85236, "epoch": 704} {"train_loss": -37.36909103393555, "global_step": 85237, "epoch": 704} {"train_loss": -37.982601165771484, "global_step": 85238, "epoch": 704} {"train_loss": -37.13977813720703, "global_step": 85239, "epoch": 704} {"train_loss": -37.70917892456055, "global_step": 85240, "epoch": 704} {"train_loss": -37.28321838378906, "global_step": 85241, "epoch": 704} {"train_loss": -33.25050354003906, "global_step": 85242, "epoch": 704} {"train_loss": -33.32832717895508, "global_step": 85243, "epoch": 704} {"train_loss": -34.9369010925293, "global_step": 85244, "epoch": 704} {"train_loss": -37.12199783325195, "global_step": 85245, "epoch": 704} {"train_loss": -36.8468132019043, "global_step": 85246, "epoch": 704} {"train_loss": -33.84565353393555, "global_step": 85247, "epoch": 704} {"train_loss": -35.937374114990234, "global_step": 85248, "epoch": 704} {"train_loss": -35.303707122802734, "global_step": 85249, "epoch": 704} {"train_loss": -34.6599006652832, "global_step": 85250, "epoch": 704} {"train_loss": -32.234012603759766, "global_step": 85251, "epoch": 704} {"train_loss": -35.509830474853516, "global_step": 85252, "epoch": 704} {"train_loss": -36.49189758300781, "global_step": 85253, "epoch": 704} {"train_loss": -35.213897705078125, "global_step": 85254, "epoch": 704} {"train_loss": -34.46796417236328, "global_step": 85255, "epoch": 704} {"train_loss": -35.1660041809082, "global_step": 85256, "epoch": 704} {"train_loss": -33.524627685546875, "global_step": 85257, "epoch": 704} {"train_loss": -35.157772064208984, "global_step": 85258, "epoch": 704} {"train_loss": -35.43498229980469, "global_step": 85259, "epoch": 704} {"train_loss": -35.268463134765625, "global_step": 85260, "epoch": 704} {"train_loss": -36.274871826171875, "global_step": 85261, "epoch": 704} {"train_loss": -34.68479537963867, "global_step": 85262, "epoch": 704} {"train_loss": -35.52389144897461, "global_step": 85263, "epoch": 704} {"train_loss": -34.8112678527832, "global_step": 85264, "epoch": 704} {"train_loss": -35.51340866088867, "global_step": 85265, "epoch": 704} {"train_loss": -36.251251220703125, "global_step": 85266, "epoch": 704} {"train_loss": -36.29058837890625, "global_step": 85267, "epoch": 704} {"train_loss": -35.65475082397461, "global_step": 85268, "epoch": 704} {"train_loss": -34.8248405456543, "global_step": 85269, "epoch": 704} {"train_loss": -35.36562728881836, "global_step": 85270, "epoch": 704} {"train_loss": -35.06474685668945, "global_step": 85271, "epoch": 704} {"train_loss": -33.62528610229492, "global_step": 85272, "epoch": 704} {"train_loss": -35.49992752075195, "global_step": 85273, "epoch": 704} {"train_loss": -35.94082260131836, "global_step": 85274, "epoch": 704} {"train_loss": -35.33644485473633, "global_step": 85275, "epoch": 704} {"train_loss": -35.33394241333008, "global_step": 85276, "epoch": 704} {"train_loss": -35.50025177001953, "global_step": 85277, "epoch": 704} {"train_loss": -35.9329948425293, "global_step": 85278, "epoch": 704} {"train_loss": -36.574310302734375, "global_step": 85279, "epoch": 704} {"train_loss": -36.53277587890625, "global_step": 85280, "epoch": 704} {"train_loss": -34.13127517700195, "global_step": 85281, "epoch": 704} {"train_loss": -35.578399658203125, "global_step": 85282, "epoch": 704} {"train_loss": -36.12127685546875, "global_step": 85283, "epoch": 704} {"train_loss": -35.88369369506836, "global_step": 85284, "epoch": 704} {"train_loss": -36.38644027709961, "global_step": 85285, "epoch": 704} {"train_loss": -36.444271087646484, "global_step": 85286, "epoch": 704} {"train_loss": -36.76152038574219, "global_step": 85287, "epoch": 704} {"train_loss": -35.04752731323242, "global_step": 85288, "epoch": 704} {"train_loss": -35.64628219604492, "global_step": 85289, "epoch": 704} {"train_loss": -36.63875198364258, "global_step": 85290, "epoch": 704} {"train_loss": -37.12784957885742, "global_step": 85291, "epoch": 704} {"train_loss": -36.95546340942383, "global_step": 85292, "epoch": 704} {"train_loss": -36.624691009521484, "global_step": 85293, "epoch": 704} {"train_loss": -36.80864334106445, "global_step": 85294, "epoch": 704} {"train_loss": -37.07952880859375, "global_step": 85295, "epoch": 704} {"train_loss": -37.01163864135742, "global_step": 85296, "epoch": 704} {"train_loss": -37.39097595214844, "global_step": 85297, "epoch": 704} {"train_loss": -36.53752517700195, "global_step": 85298, "epoch": 704} {"train_loss": -36.460880279541016, "global_step": 85299, "epoch": 704} {"train_loss": -36.70780944824219, "global_step": 85300, "epoch": 704} {"train_loss": -36.52042007446289, "global_step": 85301, "epoch": 704} {"train_loss": -37.421356201171875, "global_step": 85302, "epoch": 704} {"train_loss": -36.954498291015625, "global_step": 85303, "epoch": 704} {"train_loss": -36.40629817237539, "global_step": 85304, "epoch": 704, "val_loss": 2693316.0} {"train_loss": -37.271995544433594, "global_step": 85305, "epoch": 705} {"train_loss": -37.27570343017578, "global_step": 85306, "epoch": 705} {"train_loss": -37.045692443847656, "global_step": 85307, "epoch": 705} {"train_loss": -36.485633850097656, "global_step": 85308, "epoch": 705} {"train_loss": -34.99496841430664, "global_step": 85309, "epoch": 705} {"train_loss": -31.840932846069336, "global_step": 85310, "epoch": 705} {"train_loss": -23.1334171295166, "global_step": 85311, "epoch": 705} {"train_loss": -4.7559919357299805, "global_step": 85312, "epoch": 705} {"train_loss": -15.684218406677246, "global_step": 85313, "epoch": 705} {"train_loss": -35.88645553588867, "global_step": 85314, "epoch": 705} {"train_loss": -21.282724380493164, "global_step": 85315, "epoch": 705} {"train_loss": -33.631874084472656, "global_step": 85316, "epoch": 705} {"train_loss": -26.501264572143555, "global_step": 85317, "epoch": 705} {"train_loss": -33.451324462890625, "global_step": 85318, "epoch": 705} {"train_loss": -29.393524169921875, "global_step": 85319, "epoch": 705} {"train_loss": -35.53229522705078, "global_step": 85320, "epoch": 705} {"train_loss": -31.818723678588867, "global_step": 85321, "epoch": 705} {"train_loss": -35.029754638671875, "global_step": 85322, "epoch": 705} {"train_loss": -35.02725601196289, "global_step": 85323, "epoch": 705} {"train_loss": -33.796817779541016, "global_step": 85324, "epoch": 705} {"train_loss": -35.53364944458008, "global_step": 85325, "epoch": 705} {"train_loss": -34.644622802734375, "global_step": 85326, "epoch": 705} {"train_loss": -35.04694747924805, "global_step": 85327, "epoch": 705} {"train_loss": -36.0662841796875, "global_step": 85328, "epoch": 705} {"train_loss": -35.31850814819336, "global_step": 85329, "epoch": 705} {"train_loss": -35.43768310546875, "global_step": 85330, "epoch": 705} {"train_loss": -35.578060150146484, "global_step": 85331, "epoch": 705} {"train_loss": -36.05601119995117, "global_step": 85332, "epoch": 705} {"train_loss": -36.07613754272461, "global_step": 85333, "epoch": 705} {"train_loss": -35.808162689208984, "global_step": 85334, "epoch": 705} {"train_loss": -36.07597351074219, "global_step": 85335, "epoch": 705} {"train_loss": -36.13275146484375, "global_step": 85336, "epoch": 705} {"train_loss": -36.195064544677734, "global_step": 85337, "epoch": 705} {"train_loss": -35.997718811035156, "global_step": 85338, "epoch": 705} {"train_loss": -36.007747650146484, "global_step": 85339, "epoch": 705} {"train_loss": -36.48408508300781, "global_step": 85340, "epoch": 705} {"train_loss": -36.344207763671875, "global_step": 85341, "epoch": 705} {"train_loss": -36.7969856262207, "global_step": 85342, "epoch": 705} {"train_loss": -36.5539665222168, "global_step": 85343, "epoch": 705} {"train_loss": -36.55841827392578, "global_step": 85344, "epoch": 705} {"train_loss": -36.299896240234375, "global_step": 85345, "epoch": 705} {"train_loss": -37.03728103637695, "global_step": 85346, "epoch": 705} {"train_loss": -36.73385238647461, "global_step": 85347, "epoch": 705} {"train_loss": -36.937530517578125, "global_step": 85348, "epoch": 705} {"train_loss": -36.66730499267578, "global_step": 85349, "epoch": 705} {"train_loss": -36.81318283081055, "global_step": 85350, "epoch": 705} {"train_loss": -36.5380973815918, "global_step": 85351, "epoch": 705} {"train_loss": -36.983238220214844, "global_step": 85352, "epoch": 705} {"train_loss": -37.35200119018555, "global_step": 85353, "epoch": 705} {"train_loss": -37.05506134033203, "global_step": 85354, "epoch": 705} {"train_loss": -37.07032012939453, "global_step": 85355, "epoch": 705} {"train_loss": -37.13434600830078, "global_step": 85356, "epoch": 705} {"train_loss": -36.97065734863281, "global_step": 85357, "epoch": 705} {"train_loss": -36.900672912597656, "global_step": 85358, "epoch": 705} {"train_loss": -37.21403503417969, "global_step": 85359, "epoch": 705} {"train_loss": -37.46730422973633, "global_step": 85360, "epoch": 705} {"train_loss": -37.30153274536133, "global_step": 85361, "epoch": 705} {"train_loss": -37.389644622802734, "global_step": 85362, "epoch": 705} {"train_loss": -37.34454345703125, "global_step": 85363, "epoch": 705} {"train_loss": -37.48638916015625, "global_step": 85364, "epoch": 705} {"train_loss": -37.446903228759766, "global_step": 85365, "epoch": 705} {"train_loss": -37.81205368041992, "global_step": 85366, "epoch": 705} {"train_loss": -37.99412155151367, "global_step": 85367, "epoch": 705} {"train_loss": -37.82865524291992, "global_step": 85368, "epoch": 705} {"train_loss": -37.739131927490234, "global_step": 85369, "epoch": 705} {"train_loss": -37.777462005615234, "global_step": 85370, "epoch": 705} {"train_loss": -37.83047103881836, "global_step": 85371, "epoch": 705} {"train_loss": -37.99396896362305, "global_step": 85372, "epoch": 705} {"train_loss": -37.75094223022461, "global_step": 85373, "epoch": 705} {"train_loss": -37.61464309692383, "global_step": 85374, "epoch": 705} {"train_loss": -37.8140983581543, "global_step": 85375, "epoch": 705} {"train_loss": -38.002925872802734, "global_step": 85376, "epoch": 705} {"train_loss": -38.233314514160156, "global_step": 85377, "epoch": 705} {"train_loss": -37.67545700073242, "global_step": 85378, "epoch": 705} {"train_loss": -37.883575439453125, "global_step": 85379, "epoch": 705} {"train_loss": -37.99703598022461, "global_step": 85380, "epoch": 705} {"train_loss": -38.01974105834961, "global_step": 85381, "epoch": 705} {"train_loss": -38.17251205444336, "global_step": 85382, "epoch": 705} {"train_loss": -38.366432189941406, "global_step": 85383, "epoch": 705} {"train_loss": -38.041961669921875, "global_step": 85384, "epoch": 705} {"train_loss": -38.1683464050293, "global_step": 85385, "epoch": 705} {"train_loss": -38.213069915771484, "global_step": 85386, "epoch": 705} {"train_loss": -38.19257736206055, "global_step": 85387, "epoch": 705} {"train_loss": -37.266170501708984, "global_step": 85388, "epoch": 705} {"train_loss": -37.07770919799805, "global_step": 85389, "epoch": 705} {"train_loss": -37.35496139526367, "global_step": 85390, "epoch": 705} {"train_loss": -37.891639709472656, "global_step": 85391, "epoch": 705} {"train_loss": -30.434024810791016, "global_step": 85392, "epoch": 705} {"train_loss": -14.922225952148438, "global_step": 85393, "epoch": 705} {"train_loss": -24.78724479675293, "global_step": 85394, "epoch": 705} {"train_loss": -33.81045150756836, "global_step": 85395, "epoch": 705} {"train_loss": -31.600357055664062, "global_step": 85396, "epoch": 705} {"train_loss": -34.632808685302734, "global_step": 85397, "epoch": 705} {"train_loss": -35.22230529785156, "global_step": 85398, "epoch": 705} {"train_loss": -35.526180267333984, "global_step": 85399, "epoch": 705} {"train_loss": -37.02045822143555, "global_step": 85400, "epoch": 705} {"train_loss": -36.46830368041992, "global_step": 85401, "epoch": 705} {"train_loss": -34.54793167114258, "global_step": 85402, "epoch": 705} {"train_loss": -37.021942138671875, "global_step": 85403, "epoch": 705} {"train_loss": -34.139888763427734, "global_step": 85404, "epoch": 705} {"train_loss": -37.3406982421875, "global_step": 85405, "epoch": 705} {"train_loss": -36.63629913330078, "global_step": 85406, "epoch": 705} {"train_loss": -37.232112884521484, "global_step": 85407, "epoch": 705} {"train_loss": -36.0245361328125, "global_step": 85408, "epoch": 705} {"train_loss": -37.02277374267578, "global_step": 85409, "epoch": 705} {"train_loss": -36.22154998779297, "global_step": 85410, "epoch": 705} {"train_loss": -37.15011978149414, "global_step": 85411, "epoch": 705} {"train_loss": -35.40279006958008, "global_step": 85412, "epoch": 705} {"train_loss": -36.6695671081543, "global_step": 85413, "epoch": 705} {"train_loss": -37.232704162597656, "global_step": 85414, "epoch": 705} {"train_loss": -37.35305404663086, "global_step": 85415, "epoch": 705} {"train_loss": -37.12809371948242, "global_step": 85416, "epoch": 705} {"train_loss": -35.59269714355469, "global_step": 85417, "epoch": 705} {"train_loss": -37.55215835571289, "global_step": 85418, "epoch": 705} {"train_loss": -37.005409240722656, "global_step": 85419, "epoch": 705} {"train_loss": -36.71405029296875, "global_step": 85420, "epoch": 705} {"train_loss": -36.56412887573242, "global_step": 85421, "epoch": 705} {"train_loss": -37.77634811401367, "global_step": 85422, "epoch": 705} {"train_loss": -37.06605911254883, "global_step": 85423, "epoch": 705} {"train_loss": -36.861236572265625, "global_step": 85424, "epoch": 705} {"train_loss": -35.41662870359815, "global_step": 85425, "epoch": 705, "val_loss": 2598404.25} {"train_loss": -37.408329010009766, "global_step": 85426, "epoch": 706} {"train_loss": -35.70393371582031, "global_step": 85427, "epoch": 706} {"train_loss": -37.1031494140625, "global_step": 85428, "epoch": 706} {"train_loss": -37.53742980957031, "global_step": 85429, "epoch": 706} {"train_loss": -37.09323501586914, "global_step": 85430, "epoch": 706} {"train_loss": -36.82963180541992, "global_step": 85431, "epoch": 706} {"train_loss": -37.5943717956543, "global_step": 85432, "epoch": 706} {"train_loss": -37.74311447143555, "global_step": 85433, "epoch": 706} {"train_loss": -37.70159912109375, "global_step": 85434, "epoch": 706} {"train_loss": -37.77351760864258, "global_step": 85435, "epoch": 706} {"train_loss": -37.212623596191406, "global_step": 85436, "epoch": 706} {"train_loss": -37.94330978393555, "global_step": 85437, "epoch": 706} {"train_loss": -37.37468719482422, "global_step": 85438, "epoch": 706} {"train_loss": -37.97392654418945, "global_step": 85439, "epoch": 706} {"train_loss": -37.687591552734375, "global_step": 85440, "epoch": 706} {"train_loss": -38.040767669677734, "global_step": 85441, "epoch": 706} {"train_loss": -37.66596984863281, "global_step": 85442, "epoch": 706} {"train_loss": -37.71919631958008, "global_step": 85443, "epoch": 706} {"train_loss": -37.76232147216797, "global_step": 85444, "epoch": 706} {"train_loss": -38.304744720458984, "global_step": 85445, "epoch": 706} {"train_loss": -37.942413330078125, "global_step": 85446, "epoch": 706} {"train_loss": -37.52429962158203, "global_step": 85447, "epoch": 706} {"train_loss": -37.87492752075195, "global_step": 85448, "epoch": 706} {"train_loss": -37.81388473510742, "global_step": 85449, "epoch": 706} {"train_loss": -37.83573913574219, "global_step": 85450, "epoch": 706} {"train_loss": -37.96979904174805, "global_step": 85451, "epoch": 706} {"train_loss": -38.426177978515625, "global_step": 85452, "epoch": 706} {"train_loss": -38.143489837646484, "global_step": 85453, "epoch": 706} {"train_loss": -37.72395706176758, "global_step": 85454, "epoch": 706} {"train_loss": -37.79621505737305, "global_step": 85455, "epoch": 706} {"train_loss": -37.3570671081543, "global_step": 85456, "epoch": 706} {"train_loss": -36.14522933959961, "global_step": 85457, "epoch": 706} {"train_loss": -35.439754486083984, "global_step": 85458, "epoch": 706} {"train_loss": -30.91193962097168, "global_step": 85459, "epoch": 706} {"train_loss": -33.2596321105957, "global_step": 85460, "epoch": 706} {"train_loss": -36.31596755981445, "global_step": 85461, "epoch": 706} {"train_loss": -35.432552337646484, "global_step": 85462, "epoch": 706} {"train_loss": -36.68973159790039, "global_step": 85463, "epoch": 706} {"train_loss": -36.13554000854492, "global_step": 85464, "epoch": 706} {"train_loss": -36.725494384765625, "global_step": 85465, "epoch": 706} {"train_loss": -37.171043395996094, "global_step": 85466, "epoch": 706} {"train_loss": -36.410667419433594, "global_step": 85467, "epoch": 706} {"train_loss": -37.952789306640625, "global_step": 85468, "epoch": 706} {"train_loss": -35.8796272277832, "global_step": 85469, "epoch": 706} {"train_loss": -37.4642333984375, "global_step": 85470, "epoch": 706} {"train_loss": -36.93436813354492, "global_step": 85471, "epoch": 706} {"train_loss": -37.572357177734375, "global_step": 85472, "epoch": 706} {"train_loss": -37.24641036987305, "global_step": 85473, "epoch": 706} {"train_loss": -37.330745697021484, "global_step": 85474, "epoch": 706} {"train_loss": -37.87466812133789, "global_step": 85475, "epoch": 706} {"train_loss": -37.839378356933594, "global_step": 85476, "epoch": 706} {"train_loss": -37.899169921875, "global_step": 85477, "epoch": 706} {"train_loss": -36.94673538208008, "global_step": 85478, "epoch": 706} {"train_loss": -37.847991943359375, "global_step": 85479, "epoch": 706} {"train_loss": -37.801448822021484, "global_step": 85480, "epoch": 706} {"train_loss": -37.289546966552734, "global_step": 85481, "epoch": 706} {"train_loss": -37.396217346191406, "global_step": 85482, "epoch": 706} {"train_loss": -37.9132194519043, "global_step": 85483, "epoch": 706} {"train_loss": -38.092498779296875, "global_step": 85484, "epoch": 706} {"train_loss": -37.465511322021484, "global_step": 85485, "epoch": 706} {"train_loss": -37.99917984008789, "global_step": 85486, "epoch": 706} {"train_loss": -38.003639221191406, "global_step": 85487, "epoch": 706} {"train_loss": -37.86089324951172, "global_step": 85488, "epoch": 706} {"train_loss": -37.569427490234375, "global_step": 85489, "epoch": 706} {"train_loss": -37.69918441772461, "global_step": 85490, "epoch": 706} {"train_loss": -37.86915969848633, "global_step": 85491, "epoch": 706} {"train_loss": -37.80630111694336, "global_step": 85492, "epoch": 706} {"train_loss": -38.58009719848633, "global_step": 85493, "epoch": 706} {"train_loss": -37.981685638427734, "global_step": 85494, "epoch": 706} {"train_loss": -37.98120880126953, "global_step": 85495, "epoch": 706} {"train_loss": -37.53124237060547, "global_step": 85496, "epoch": 706} {"train_loss": -37.400238037109375, "global_step": 85497, "epoch": 706} {"train_loss": -38.06401824951172, "global_step": 85498, "epoch": 706} {"train_loss": -38.16379928588867, "global_step": 85499, "epoch": 706} {"train_loss": -38.39473342895508, "global_step": 85500, "epoch": 706} {"train_loss": -38.5145149230957, "global_step": 85501, "epoch": 706} {"train_loss": -38.2364501953125, "global_step": 85502, "epoch": 706} {"train_loss": -38.08491897583008, "global_step": 85503, "epoch": 706} {"train_loss": -38.222232818603516, "global_step": 85504, "epoch": 706} {"train_loss": -37.538570404052734, "global_step": 85505, "epoch": 706} {"train_loss": -37.977752685546875, "global_step": 85506, "epoch": 706} {"train_loss": -36.61513900756836, "global_step": 85507, "epoch": 706} {"train_loss": -37.67857360839844, "global_step": 85508, "epoch": 706} {"train_loss": -35.555320739746094, "global_step": 85509, "epoch": 706} {"train_loss": -36.99750900268555, "global_step": 85510, "epoch": 706} {"train_loss": -34.23659896850586, "global_step": 85511, "epoch": 706} {"train_loss": -30.88498878479004, "global_step": 85512, "epoch": 706} {"train_loss": -34.999908447265625, "global_step": 85513, "epoch": 706} {"train_loss": -25.665313720703125, "global_step": 85514, "epoch": 706} {"train_loss": -36.44541549682617, "global_step": 85515, "epoch": 706} {"train_loss": -32.85608673095703, "global_step": 85516, "epoch": 706} {"train_loss": -30.66285514831543, "global_step": 85517, "epoch": 706} {"train_loss": -32.37417221069336, "global_step": 85518, "epoch": 706} {"train_loss": -32.964168548583984, "global_step": 85519, "epoch": 706} {"train_loss": -29.643056869506836, "global_step": 85520, "epoch": 706} {"train_loss": -25.571470260620117, "global_step": 85521, "epoch": 706} {"train_loss": -31.34132957458496, "global_step": 85522, "epoch": 706} {"train_loss": -28.01407241821289, "global_step": 85523, "epoch": 706} {"train_loss": -31.03167724609375, "global_step": 85524, "epoch": 706} {"train_loss": -33.46331024169922, "global_step": 85525, "epoch": 706} {"train_loss": -29.332311630249023, "global_step": 85526, "epoch": 706} {"train_loss": -26.56830406188965, "global_step": 85527, "epoch": 706} {"train_loss": -28.739789962768555, "global_step": 85528, "epoch": 706} {"train_loss": -31.691640853881836, "global_step": 85529, "epoch": 706} {"train_loss": -33.4997444152832, "global_step": 85530, "epoch": 706} {"train_loss": -32.22981643676758, "global_step": 85531, "epoch": 706} {"train_loss": -28.486616134643555, "global_step": 85532, "epoch": 706} {"train_loss": -32.79049301147461, "global_step": 85533, "epoch": 706} {"train_loss": -33.5527229309082, "global_step": 85534, "epoch": 706} {"train_loss": -33.73627853393555, "global_step": 85535, "epoch": 706} {"train_loss": -32.32330322265625, "global_step": 85536, "epoch": 706} {"train_loss": -33.048763275146484, "global_step": 85537, "epoch": 706} {"train_loss": -33.97561264038086, "global_step": 85538, "epoch": 706} {"train_loss": -34.2522087097168, "global_step": 85539, "epoch": 706} {"train_loss": -32.70119857788086, "global_step": 85540, "epoch": 706} {"train_loss": -33.029048919677734, "global_step": 85541, "epoch": 706} {"train_loss": -33.6270866394043, "global_step": 85542, "epoch": 706} {"train_loss": -34.61391830444336, "global_step": 85543, "epoch": 706} {"train_loss": -33.693904876708984, "global_step": 85544, "epoch": 706} {"train_loss": -34.943904876708984, "global_step": 85545, "epoch": 706} {"train_loss": -35.76634419654027, "global_step": 85546, "epoch": 706, "val_loss": 2640688.0} {"train_loss": -34.54981994628906, "global_step": 85547, "epoch": 707} {"train_loss": -34.5378532409668, "global_step": 85548, "epoch": 707} {"train_loss": -34.70855712890625, "global_step": 85549, "epoch": 707} {"train_loss": -34.4856071472168, "global_step": 85550, "epoch": 707} {"train_loss": -34.638755798339844, "global_step": 85551, "epoch": 707} {"train_loss": -34.413673400878906, "global_step": 85552, "epoch": 707} {"train_loss": -34.58729934692383, "global_step": 85553, "epoch": 707} {"train_loss": -34.86959457397461, "global_step": 85554, "epoch": 707} {"train_loss": -34.70713424682617, "global_step": 85555, "epoch": 707} {"train_loss": -34.36650466918945, "global_step": 85556, "epoch": 707} {"train_loss": -34.97685623168945, "global_step": 85557, "epoch": 707} {"train_loss": -34.97475814819336, "global_step": 85558, "epoch": 707} {"train_loss": -35.38385009765625, "global_step": 85559, "epoch": 707} {"train_loss": -35.01725387573242, "global_step": 85560, "epoch": 707} {"train_loss": -35.56394577026367, "global_step": 85561, "epoch": 707} {"train_loss": -35.710567474365234, "global_step": 85562, "epoch": 707} {"train_loss": -35.22943878173828, "global_step": 85563, "epoch": 707} {"train_loss": -35.660743713378906, "global_step": 85564, "epoch": 707} {"train_loss": -35.4163703918457, "global_step": 85565, "epoch": 707} {"train_loss": -35.660972595214844, "global_step": 85566, "epoch": 707} {"train_loss": -35.8656120300293, "global_step": 85567, "epoch": 707} {"train_loss": -35.471248626708984, "global_step": 85568, "epoch": 707} {"train_loss": -35.572959899902344, "global_step": 85569, "epoch": 707} {"train_loss": -35.598567962646484, "global_step": 85570, "epoch": 707} {"train_loss": -36.29041290283203, "global_step": 85571, "epoch": 707} {"train_loss": -36.07699203491211, "global_step": 85572, "epoch": 707} {"train_loss": -36.33881378173828, "global_step": 85573, "epoch": 707} {"train_loss": -36.24346160888672, "global_step": 85574, "epoch": 707} {"train_loss": -36.29365158081055, "global_step": 85575, "epoch": 707} {"train_loss": -36.43022918701172, "global_step": 85576, "epoch": 707} {"train_loss": -36.40336608886719, "global_step": 85577, "epoch": 707} {"train_loss": -36.509517669677734, "global_step": 85578, "epoch": 707} {"train_loss": -36.533233642578125, "global_step": 85579, "epoch": 707} {"train_loss": -36.90205001831055, "global_step": 85580, "epoch": 707} {"train_loss": -36.66255187988281, "global_step": 85581, "epoch": 707} {"train_loss": -36.287376403808594, "global_step": 85582, "epoch": 707} {"train_loss": -36.647403717041016, "global_step": 85583, "epoch": 707} {"train_loss": -36.009742736816406, "global_step": 85584, "epoch": 707} {"train_loss": -36.29252243041992, "global_step": 85585, "epoch": 707} {"train_loss": -36.79119873046875, "global_step": 85586, "epoch": 707} {"train_loss": -36.25566101074219, "global_step": 85587, "epoch": 707} {"train_loss": -37.37256622314453, "global_step": 85588, "epoch": 707} {"train_loss": -36.82273483276367, "global_step": 85589, "epoch": 707} {"train_loss": -36.826080322265625, "global_step": 85590, "epoch": 707} {"train_loss": -36.27714920043945, "global_step": 85591, "epoch": 707} {"train_loss": -35.89998245239258, "global_step": 85592, "epoch": 707} {"train_loss": -36.97890853881836, "global_step": 85593, "epoch": 707} {"train_loss": -36.157955169677734, "global_step": 85594, "epoch": 707} {"train_loss": -37.15144729614258, "global_step": 85595, "epoch": 707} {"train_loss": -36.450748443603516, "global_step": 85596, "epoch": 707} {"train_loss": -37.503353118896484, "global_step": 85597, "epoch": 707} {"train_loss": -36.584938049316406, "global_step": 85598, "epoch": 707} {"train_loss": -36.54035568237305, "global_step": 85599, "epoch": 707} {"train_loss": -36.97072982788086, "global_step": 85600, "epoch": 707} {"train_loss": -37.00773239135742, "global_step": 85601, "epoch": 707} {"train_loss": -37.00114440917969, "global_step": 85602, "epoch": 707} {"train_loss": -36.45429229736328, "global_step": 85603, "epoch": 707} {"train_loss": -37.01870346069336, "global_step": 85604, "epoch": 707} {"train_loss": -36.79804992675781, "global_step": 85605, "epoch": 707} {"train_loss": -36.9918212890625, "global_step": 85606, "epoch": 707} {"train_loss": -37.694488525390625, "global_step": 85607, "epoch": 707} {"train_loss": -37.13549041748047, "global_step": 85608, "epoch": 707} {"train_loss": -37.24515914916992, "global_step": 85609, "epoch": 707} {"train_loss": -37.59751510620117, "global_step": 85610, "epoch": 707} {"train_loss": -37.69602584838867, "global_step": 85611, "epoch": 707} {"train_loss": -37.22917556762695, "global_step": 85612, "epoch": 707} {"train_loss": -37.36843490600586, "global_step": 85613, "epoch": 707} {"train_loss": -37.19508361816406, "global_step": 85614, "epoch": 707} {"train_loss": -37.34251022338867, "global_step": 85615, "epoch": 707} {"train_loss": -37.64035415649414, "global_step": 85616, "epoch": 707} {"train_loss": -37.549163818359375, "global_step": 85617, "epoch": 707} {"train_loss": -37.378868103027344, "global_step": 85618, "epoch": 707} {"train_loss": -38.16814422607422, "global_step": 85619, "epoch": 707} {"train_loss": -37.724971771240234, "global_step": 85620, "epoch": 707} {"train_loss": -37.44717025756836, "global_step": 85621, "epoch": 707} {"train_loss": -35.95002365112305, "global_step": 85622, "epoch": 707} {"train_loss": -29.916217803955078, "global_step": 85623, "epoch": 707} {"train_loss": -16.27374839782715, "global_step": 85624, "epoch": 707} {"train_loss": -2.715773820877075, "global_step": 85625, "epoch": 707} {"train_loss": -8.386198997497559, "global_step": 85626, "epoch": 707} {"train_loss": -36.17881393432617, "global_step": 85627, "epoch": 707} {"train_loss": -11.387843132019043, "global_step": 85628, "epoch": 707} {"train_loss": -35.56669998168945, "global_step": 85629, "epoch": 707} {"train_loss": -15.230704307556152, "global_step": 85630, "epoch": 707} {"train_loss": -35.041259765625, "global_step": 85631, "epoch": 707} {"train_loss": -26.340778350830078, "global_step": 85632, "epoch": 707} {"train_loss": -27.0520076751709, "global_step": 85633, "epoch": 707} {"train_loss": -35.812156677246094, "global_step": 85634, "epoch": 707} {"train_loss": -29.84490394592285, "global_step": 85635, "epoch": 707} {"train_loss": -28.53383445739746, "global_step": 85636, "epoch": 707} {"train_loss": -36.069515228271484, "global_step": 85637, "epoch": 707} {"train_loss": -33.66202926635742, "global_step": 85638, "epoch": 707} {"train_loss": -31.95185661315918, "global_step": 85639, "epoch": 707} {"train_loss": -32.94837188720703, "global_step": 85640, "epoch": 707} {"train_loss": -36.24423599243164, "global_step": 85641, "epoch": 707} {"train_loss": -35.11019515991211, "global_step": 85642, "epoch": 707} {"train_loss": -32.45125198364258, "global_step": 85643, "epoch": 707} {"train_loss": -34.08516311645508, "global_step": 85644, "epoch": 707} {"train_loss": -35.46088409423828, "global_step": 85645, "epoch": 707} {"train_loss": -36.54241180419922, "global_step": 85646, "epoch": 707} {"train_loss": -35.46953201293945, "global_step": 85647, "epoch": 707} {"train_loss": -35.70466613769531, "global_step": 85648, "epoch": 707} {"train_loss": -35.25747299194336, "global_step": 85649, "epoch": 707} {"train_loss": -35.193363189697266, "global_step": 85650, "epoch": 707} {"train_loss": -35.9392204284668, "global_step": 85651, "epoch": 707} {"train_loss": -34.466129302978516, "global_step": 85652, "epoch": 707} {"train_loss": -35.78602600097656, "global_step": 85653, "epoch": 707} {"train_loss": -35.821075439453125, "global_step": 85654, "epoch": 707} {"train_loss": -36.11175537109375, "global_step": 85655, "epoch": 707} {"train_loss": -36.50883102416992, "global_step": 85656, "epoch": 707} {"train_loss": -36.260372161865234, "global_step": 85657, "epoch": 707} {"train_loss": -36.49648666381836, "global_step": 85658, "epoch": 707} {"train_loss": -36.67264175415039, "global_step": 85659, "epoch": 707} {"train_loss": -36.23167419433594, "global_step": 85660, "epoch": 707} {"train_loss": -36.254940032958984, "global_step": 85661, "epoch": 707} {"train_loss": -36.93501663208008, "global_step": 85662, "epoch": 707} {"train_loss": -36.48890686035156, "global_step": 85663, "epoch": 707} {"train_loss": -36.888587951660156, "global_step": 85664, "epoch": 707} {"train_loss": -36.96321487426758, "global_step": 85665, "epoch": 707} {"train_loss": -36.54133224487305, "global_step": 85666, "epoch": 707} {"train_loss": -34.70513583608895, "global_step": 85667, "epoch": 707, "val_loss": 2587262.25} {"train_loss": -36.780269622802734, "global_step": 85668, "epoch": 708} {"train_loss": -37.24295425415039, "global_step": 85669, "epoch": 708} {"train_loss": -37.289302825927734, "global_step": 85670, "epoch": 708} {"train_loss": -37.15522003173828, "global_step": 85671, "epoch": 708} {"train_loss": -36.335121154785156, "global_step": 85672, "epoch": 708} {"train_loss": -37.28246307373047, "global_step": 85673, "epoch": 708} {"train_loss": -37.392799377441406, "global_step": 85674, "epoch": 708} {"train_loss": -37.10477828979492, "global_step": 85675, "epoch": 708} {"train_loss": -37.15616989135742, "global_step": 85676, "epoch": 708} {"train_loss": -37.632049560546875, "global_step": 85677, "epoch": 708} {"train_loss": -37.178321838378906, "global_step": 85678, "epoch": 708} {"train_loss": -37.519832611083984, "global_step": 85679, "epoch": 708} {"train_loss": -37.50922775268555, "global_step": 85680, "epoch": 708} {"train_loss": -37.460548400878906, "global_step": 85681, "epoch": 708} {"train_loss": -37.30520248413086, "global_step": 85682, "epoch": 708} {"train_loss": -37.10801315307617, "global_step": 85683, "epoch": 708} {"train_loss": -37.34336471557617, "global_step": 85684, "epoch": 708} {"train_loss": -37.75178146362305, "global_step": 85685, "epoch": 708} {"train_loss": -37.45357131958008, "global_step": 85686, "epoch": 708} {"train_loss": -37.856407165527344, "global_step": 85687, "epoch": 708} {"train_loss": -37.215248107910156, "global_step": 85688, "epoch": 708} {"train_loss": -37.658973693847656, "global_step": 85689, "epoch": 708} {"train_loss": -37.597877502441406, "global_step": 85690, "epoch": 708} {"train_loss": -37.76448440551758, "global_step": 85691, "epoch": 708} {"train_loss": -37.58406448364258, "global_step": 85692, "epoch": 708} {"train_loss": -37.91499328613281, "global_step": 85693, "epoch": 708} {"train_loss": -38.46820831298828, "global_step": 85694, "epoch": 708} {"train_loss": -37.708412170410156, "global_step": 85695, "epoch": 708} {"train_loss": -37.71726989746094, "global_step": 85696, "epoch": 708} {"train_loss": -37.72296905517578, "global_step": 85697, "epoch": 708} {"train_loss": -37.98527908325195, "global_step": 85698, "epoch": 708} {"train_loss": -38.330257415771484, "global_step": 85699, "epoch": 708} {"train_loss": -38.1518440246582, "global_step": 85700, "epoch": 708} {"train_loss": -37.94570541381836, "global_step": 85701, "epoch": 708} {"train_loss": -38.20713424682617, "global_step": 85702, "epoch": 708} {"train_loss": -37.73541259765625, "global_step": 85703, "epoch": 708} {"train_loss": -37.8536376953125, "global_step": 85704, "epoch": 708} {"train_loss": -38.37446212768555, "global_step": 85705, "epoch": 708} {"train_loss": -37.3585319519043, "global_step": 85706, "epoch": 708} {"train_loss": -38.256534576416016, "global_step": 85707, "epoch": 708} {"train_loss": -38.4869499206543, "global_step": 85708, "epoch": 708} {"train_loss": -38.183837890625, "global_step": 85709, "epoch": 708} {"train_loss": -38.199737548828125, "global_step": 85710, "epoch": 708} {"train_loss": -38.08567428588867, "global_step": 85711, "epoch": 708} {"train_loss": -37.86646270751953, "global_step": 85712, "epoch": 708} {"train_loss": -38.00950241088867, "global_step": 85713, "epoch": 708} {"train_loss": -37.35844421386719, "global_step": 85714, "epoch": 708} {"train_loss": -37.75953674316406, "global_step": 85715, "epoch": 708} {"train_loss": -37.52168273925781, "global_step": 85716, "epoch": 708} {"train_loss": -37.48284912109375, "global_step": 85717, "epoch": 708} {"train_loss": -37.65553665161133, "global_step": 85718, "epoch": 708} {"train_loss": -37.890987396240234, "global_step": 85719, "epoch": 708} {"train_loss": -35.1935920715332, "global_step": 85720, "epoch": 708} {"train_loss": -33.53443145751953, "global_step": 85721, "epoch": 708} {"train_loss": -29.581281661987305, "global_step": 85722, "epoch": 708} {"train_loss": -28.321313858032227, "global_step": 85723, "epoch": 708} {"train_loss": -31.123126983642578, "global_step": 85724, "epoch": 708} {"train_loss": -31.844762802124023, "global_step": 85725, "epoch": 708} {"train_loss": -32.67622756958008, "global_step": 85726, "epoch": 708} {"train_loss": -37.13540267944336, "global_step": 85727, "epoch": 708} {"train_loss": -35.416744232177734, "global_step": 85728, "epoch": 708} {"train_loss": -35.63739776611328, "global_step": 85729, "epoch": 708} {"train_loss": -35.52898406982422, "global_step": 85730, "epoch": 708} {"train_loss": -36.3408088684082, "global_step": 85731, "epoch": 708} {"train_loss": -35.07847213745117, "global_step": 85732, "epoch": 708} {"train_loss": -35.97388458251953, "global_step": 85733, "epoch": 708} {"train_loss": -36.3652458190918, "global_step": 85734, "epoch": 708} {"train_loss": -36.216819763183594, "global_step": 85735, "epoch": 708} {"train_loss": -36.42203903198242, "global_step": 85736, "epoch": 708} {"train_loss": -36.335201263427734, "global_step": 85737, "epoch": 708} {"train_loss": -36.62942123413086, "global_step": 85738, "epoch": 708} {"train_loss": -36.29801940917969, "global_step": 85739, "epoch": 708} {"train_loss": -37.25594711303711, "global_step": 85740, "epoch": 708} {"train_loss": -36.5224723815918, "global_step": 85741, "epoch": 708} {"train_loss": -37.077308654785156, "global_step": 85742, "epoch": 708} {"train_loss": -36.098731994628906, "global_step": 85743, "epoch": 708} {"train_loss": -37.095436096191406, "global_step": 85744, "epoch": 708} {"train_loss": -36.72614288330078, "global_step": 85745, "epoch": 708} {"train_loss": -36.114253997802734, "global_step": 85746, "epoch": 708} {"train_loss": -37.054466247558594, "global_step": 85747, "epoch": 708} {"train_loss": -36.74631118774414, "global_step": 85748, "epoch": 708} {"train_loss": -36.939144134521484, "global_step": 85749, "epoch": 708} {"train_loss": -37.01177978515625, "global_step": 85750, "epoch": 708} {"train_loss": -36.67988204956055, "global_step": 85751, "epoch": 708} {"train_loss": -36.721885681152344, "global_step": 85752, "epoch": 708} {"train_loss": -37.26438522338867, "global_step": 85753, "epoch": 708} {"train_loss": -37.14246368408203, "global_step": 85754, "epoch": 708} {"train_loss": -37.92280578613281, "global_step": 85755, "epoch": 708} {"train_loss": -37.264774322509766, "global_step": 85756, "epoch": 708} {"train_loss": -36.777679443359375, "global_step": 85757, "epoch": 708} {"train_loss": -37.42076110839844, "global_step": 85758, "epoch": 708} {"train_loss": -36.668121337890625, "global_step": 85759, "epoch": 708} {"train_loss": -36.71516036987305, "global_step": 85760, "epoch": 708} {"train_loss": -36.71193313598633, "global_step": 85761, "epoch": 708} {"train_loss": -37.190032958984375, "global_step": 85762, "epoch": 708} {"train_loss": -36.608436584472656, "global_step": 85763, "epoch": 708} {"train_loss": -36.763057708740234, "global_step": 85764, "epoch": 708} {"train_loss": -36.704402923583984, "global_step": 85765, "epoch": 708} {"train_loss": -36.2862663269043, "global_step": 85766, "epoch": 708} {"train_loss": -36.39561462402344, "global_step": 85767, "epoch": 708} {"train_loss": -37.22956085205078, "global_step": 85768, "epoch": 708} {"train_loss": -37.54267501831055, "global_step": 85769, "epoch": 708} {"train_loss": -37.7280387878418, "global_step": 85770, "epoch": 708} {"train_loss": -37.49720001220703, "global_step": 85771, "epoch": 708} {"train_loss": -37.21160888671875, "global_step": 85772, "epoch": 708} {"train_loss": -36.32753372192383, "global_step": 85773, "epoch": 708} {"train_loss": -35.458370208740234, "global_step": 85774, "epoch": 708} {"train_loss": -36.691463470458984, "global_step": 85775, "epoch": 708} {"train_loss": -37.710506439208984, "global_step": 85776, "epoch": 708} {"train_loss": -37.60639190673828, "global_step": 85777, "epoch": 708} {"train_loss": -37.76301574707031, "global_step": 85778, "epoch": 708} {"train_loss": -38.31001663208008, "global_step": 85779, "epoch": 708} {"train_loss": -37.94887161254883, "global_step": 85780, "epoch": 708} {"train_loss": -37.722511291503906, "global_step": 85781, "epoch": 708} {"train_loss": -37.96538162231445, "global_step": 85782, "epoch": 708} {"train_loss": -38.066856384277344, "global_step": 85783, "epoch": 708} {"train_loss": -38.30784225463867, "global_step": 85784, "epoch": 708} {"train_loss": -38.03681182861328, "global_step": 85785, "epoch": 708} {"train_loss": -37.5415153503418, "global_step": 85786, "epoch": 708} {"train_loss": -37.896724700927734, "global_step": 85787, "epoch": 708} {"train_loss": -36.941421524552275, "global_step": 85788, "epoch": 708, "val_loss": 2619962.0} {"train_loss": -38.06307601928711, "global_step": 85789, "epoch": 709} {"train_loss": -37.31964111328125, "global_step": 85790, "epoch": 709} {"train_loss": -37.6226921081543, "global_step": 85791, "epoch": 709} {"train_loss": -37.4447135925293, "global_step": 85792, "epoch": 709} {"train_loss": -36.38740158081055, "global_step": 85793, "epoch": 709} {"train_loss": -37.70689010620117, "global_step": 85794, "epoch": 709} {"train_loss": -37.11420822143555, "global_step": 85795, "epoch": 709} {"train_loss": -37.6800537109375, "global_step": 85796, "epoch": 709} {"train_loss": -38.1918830871582, "global_step": 85797, "epoch": 709} {"train_loss": -37.888458251953125, "global_step": 85798, "epoch": 709} {"train_loss": -37.0210075378418, "global_step": 85799, "epoch": 709} {"train_loss": -35.2271728515625, "global_step": 85800, "epoch": 709} {"train_loss": -35.1312370300293, "global_step": 85801, "epoch": 709} {"train_loss": -34.7750129699707, "global_step": 85802, "epoch": 709} {"train_loss": -37.29922866821289, "global_step": 85803, "epoch": 709} {"train_loss": -35.80618667602539, "global_step": 85804, "epoch": 709} {"train_loss": -35.981868743896484, "global_step": 85805, "epoch": 709} {"train_loss": -36.22776412963867, "global_step": 85806, "epoch": 709} {"train_loss": -37.19167709350586, "global_step": 85807, "epoch": 709} {"train_loss": -37.361328125, "global_step": 85808, "epoch": 709} {"train_loss": -37.001094818115234, "global_step": 85809, "epoch": 709} {"train_loss": -37.43349838256836, "global_step": 85810, "epoch": 709} {"train_loss": -37.39863967895508, "global_step": 85811, "epoch": 709} {"train_loss": -37.40521240234375, "global_step": 85812, "epoch": 709} {"train_loss": -37.896392822265625, "global_step": 85813, "epoch": 709} {"train_loss": -37.875736236572266, "global_step": 85814, "epoch": 709} {"train_loss": -37.5906982421875, "global_step": 85815, "epoch": 709} {"train_loss": -38.124244689941406, "global_step": 85816, "epoch": 709} {"train_loss": -38.02663040161133, "global_step": 85817, "epoch": 709} {"train_loss": -37.33585739135742, "global_step": 85818, "epoch": 709} {"train_loss": -36.59816360473633, "global_step": 85819, "epoch": 709} {"train_loss": -37.671199798583984, "global_step": 85820, "epoch": 709} {"train_loss": -38.07032012939453, "global_step": 85821, "epoch": 709} {"train_loss": -37.28600311279297, "global_step": 85822, "epoch": 709} {"train_loss": -36.438209533691406, "global_step": 85823, "epoch": 709} {"train_loss": -37.195098876953125, "global_step": 85824, "epoch": 709} {"train_loss": -37.455116271972656, "global_step": 85825, "epoch": 709} {"train_loss": -38.16878890991211, "global_step": 85826, "epoch": 709} {"train_loss": -36.10369873046875, "global_step": 85827, "epoch": 709} {"train_loss": -37.404945373535156, "global_step": 85828, "epoch": 709} {"train_loss": -37.914710998535156, "global_step": 85829, "epoch": 709} {"train_loss": -35.2358512878418, "global_step": 85830, "epoch": 709} {"train_loss": -36.082679748535156, "global_step": 85831, "epoch": 709} {"train_loss": -37.221717834472656, "global_step": 85832, "epoch": 709} {"train_loss": -35.8745231628418, "global_step": 85833, "epoch": 709} {"train_loss": -37.835689544677734, "global_step": 85834, "epoch": 709} {"train_loss": -36.803932189941406, "global_step": 85835, "epoch": 709} {"train_loss": -35.8214111328125, "global_step": 85836, "epoch": 709} {"train_loss": -37.11276626586914, "global_step": 85837, "epoch": 709} {"train_loss": -35.887550354003906, "global_step": 85838, "epoch": 709} {"train_loss": -37.65141677856445, "global_step": 85839, "epoch": 709} {"train_loss": -36.854400634765625, "global_step": 85840, "epoch": 709} {"train_loss": -37.77348327636719, "global_step": 85841, "epoch": 709} {"train_loss": -34.764434814453125, "global_step": 85842, "epoch": 709} {"train_loss": -36.443275451660156, "global_step": 85843, "epoch": 709} {"train_loss": -36.8276481628418, "global_step": 85844, "epoch": 709} {"train_loss": -36.8801383972168, "global_step": 85845, "epoch": 709} {"train_loss": -35.53936004638672, "global_step": 85846, "epoch": 709} {"train_loss": -35.25609588623047, "global_step": 85847, "epoch": 709} {"train_loss": -34.04639434814453, "global_step": 85848, "epoch": 709} {"train_loss": -36.600215911865234, "global_step": 85849, "epoch": 709} {"train_loss": -35.38911819458008, "global_step": 85850, "epoch": 709} {"train_loss": -35.388038635253906, "global_step": 85851, "epoch": 709} {"train_loss": -36.74495315551758, "global_step": 85852, "epoch": 709} {"train_loss": -37.008384704589844, "global_step": 85853, "epoch": 709} {"train_loss": -36.41828536987305, "global_step": 85854, "epoch": 709} {"train_loss": -35.47216796875, "global_step": 85855, "epoch": 709} {"train_loss": -36.6987419128418, "global_step": 85856, "epoch": 709} {"train_loss": -36.37094497680664, "global_step": 85857, "epoch": 709} {"train_loss": -37.69023513793945, "global_step": 85858, "epoch": 709} {"train_loss": -36.108516693115234, "global_step": 85859, "epoch": 709} {"train_loss": -36.219688415527344, "global_step": 85860, "epoch": 709} {"train_loss": -36.644996643066406, "global_step": 85861, "epoch": 709} {"train_loss": -37.392242431640625, "global_step": 85862, "epoch": 709} {"train_loss": -36.12931442260742, "global_step": 85863, "epoch": 709} {"train_loss": -36.95305252075195, "global_step": 85864, "epoch": 709} {"train_loss": -37.087501525878906, "global_step": 85865, "epoch": 709} {"train_loss": -36.8524169921875, "global_step": 85866, "epoch": 709} {"train_loss": -37.1463737487793, "global_step": 85867, "epoch": 709} {"train_loss": -37.42995834350586, "global_step": 85868, "epoch": 709} {"train_loss": -37.260955810546875, "global_step": 85869, "epoch": 709} {"train_loss": -38.318580627441406, "global_step": 85870, "epoch": 709} {"train_loss": -37.73589324951172, "global_step": 85871, "epoch": 709} {"train_loss": -38.18052673339844, "global_step": 85872, "epoch": 709} {"train_loss": -37.92875289916992, "global_step": 85873, "epoch": 709} {"train_loss": -38.0857048034668, "global_step": 85874, "epoch": 709} {"train_loss": -38.1569709777832, "global_step": 85875, "epoch": 709} {"train_loss": -37.82379150390625, "global_step": 85876, "epoch": 709} {"train_loss": -38.016265869140625, "global_step": 85877, "epoch": 709} {"train_loss": -38.1152229309082, "global_step": 85878, "epoch": 709} {"train_loss": -37.85375213623047, "global_step": 85879, "epoch": 709} {"train_loss": -38.022979736328125, "global_step": 85880, "epoch": 709} {"train_loss": -37.9779167175293, "global_step": 85881, "epoch": 709} {"train_loss": -38.52413558959961, "global_step": 85882, "epoch": 709} {"train_loss": -38.17276382446289, "global_step": 85883, "epoch": 709} {"train_loss": -37.93674850463867, "global_step": 85884, "epoch": 709} {"train_loss": -38.011592864990234, "global_step": 85885, "epoch": 709} {"train_loss": -38.41415023803711, "global_step": 85886, "epoch": 709} {"train_loss": -38.25522994995117, "global_step": 85887, "epoch": 709} {"train_loss": -38.27628707885742, "global_step": 85888, "epoch": 709} {"train_loss": -38.66627502441406, "global_step": 85889, "epoch": 709} {"train_loss": -37.809356689453125, "global_step": 85890, "epoch": 709} {"train_loss": -37.31948471069336, "global_step": 85891, "epoch": 709} {"train_loss": -37.15501022338867, "global_step": 85892, "epoch": 709} {"train_loss": -36.913997650146484, "global_step": 85893, "epoch": 709} {"train_loss": -35.19135665893555, "global_step": 85894, "epoch": 709} {"train_loss": -33.95563507080078, "global_step": 85895, "epoch": 709} {"train_loss": -33.12948226928711, "global_step": 85896, "epoch": 709} {"train_loss": -34.431541442871094, "global_step": 85897, "epoch": 709} {"train_loss": -37.31106948852539, "global_step": 85898, "epoch": 709} {"train_loss": -37.8033447265625, "global_step": 85899, "epoch": 709} {"train_loss": -36.771724700927734, "global_step": 85900, "epoch": 709} {"train_loss": -37.36433029174805, "global_step": 85901, "epoch": 709} {"train_loss": -38.321319580078125, "global_step": 85902, "epoch": 709} {"train_loss": -37.470211029052734, "global_step": 85903, "epoch": 709} {"train_loss": -37.59532928466797, "global_step": 85904, "epoch": 709} {"train_loss": -35.20718002319336, "global_step": 85905, "epoch": 709} {"train_loss": -37.37285232543945, "global_step": 85906, "epoch": 709} {"train_loss": -37.24137496948242, "global_step": 85907, "epoch": 709} {"train_loss": -37.95402908325195, "global_step": 85908, "epoch": 709} {"train_loss": -37.018927109142965, "global_step": 85909, "epoch": 709, "val_loss": 2773820.0} {"train_loss": -36.20570755004883, "global_step": 85910, "epoch": 710} {"train_loss": -37.45888900756836, "global_step": 85911, "epoch": 710} {"train_loss": -36.56965255737305, "global_step": 85912, "epoch": 710} {"train_loss": -37.18717575073242, "global_step": 85913, "epoch": 710} {"train_loss": -38.01832962036133, "global_step": 85914, "epoch": 710} {"train_loss": -36.24646759033203, "global_step": 85915, "epoch": 710} {"train_loss": -37.38829040527344, "global_step": 85916, "epoch": 710} {"train_loss": -38.04749298095703, "global_step": 85917, "epoch": 710} {"train_loss": -37.96856689453125, "global_step": 85918, "epoch": 710} {"train_loss": -38.149696350097656, "global_step": 85919, "epoch": 710} {"train_loss": -37.94939422607422, "global_step": 85920, "epoch": 710} {"train_loss": -37.34638214111328, "global_step": 85921, "epoch": 710} {"train_loss": -37.74028396606445, "global_step": 85922, "epoch": 710} {"train_loss": -37.87482833862305, "global_step": 85923, "epoch": 710} {"train_loss": -38.47186279296875, "global_step": 85924, "epoch": 710} {"train_loss": -37.20965576171875, "global_step": 85925, "epoch": 710} {"train_loss": -37.980342864990234, "global_step": 85926, "epoch": 710} {"train_loss": -37.50614547729492, "global_step": 85927, "epoch": 710} {"train_loss": -37.45207977294922, "global_step": 85928, "epoch": 710} {"train_loss": -37.48794174194336, "global_step": 85929, "epoch": 710} {"train_loss": -38.041908264160156, "global_step": 85930, "epoch": 710} {"train_loss": -37.95416259765625, "global_step": 85931, "epoch": 710} {"train_loss": -38.4974479675293, "global_step": 85932, "epoch": 710} {"train_loss": -37.615516662597656, "global_step": 85933, "epoch": 710} {"train_loss": -36.98011016845703, "global_step": 85934, "epoch": 710} {"train_loss": -37.742431640625, "global_step": 85935, "epoch": 710} {"train_loss": -38.57796096801758, "global_step": 85936, "epoch": 710} {"train_loss": -37.71432113647461, "global_step": 85937, "epoch": 710} {"train_loss": -37.680416107177734, "global_step": 85938, "epoch": 710} {"train_loss": -37.78174591064453, "global_step": 85939, "epoch": 710} {"train_loss": -38.0684928894043, "global_step": 85940, "epoch": 710} {"train_loss": -37.49261474609375, "global_step": 85941, "epoch": 710} {"train_loss": -37.49939727783203, "global_step": 85942, "epoch": 710} {"train_loss": -37.32374572753906, "global_step": 85943, "epoch": 710} {"train_loss": -37.601165771484375, "global_step": 85944, "epoch": 710} {"train_loss": -36.89805221557617, "global_step": 85945, "epoch": 710} {"train_loss": -36.71682357788086, "global_step": 85946, "epoch": 710} {"train_loss": -38.12434768676758, "global_step": 85947, "epoch": 710} {"train_loss": -38.29879379272461, "global_step": 85948, "epoch": 710} {"train_loss": -37.764198303222656, "global_step": 85949, "epoch": 710} {"train_loss": -36.8581657409668, "global_step": 85950, "epoch": 710} {"train_loss": -35.141700744628906, "global_step": 85951, "epoch": 710} {"train_loss": -34.57430648803711, "global_step": 85952, "epoch": 710} {"train_loss": -33.33928298950195, "global_step": 85953, "epoch": 710} {"train_loss": -33.93975830078125, "global_step": 85954, "epoch": 710} {"train_loss": -35.34070587158203, "global_step": 85955, "epoch": 710} {"train_loss": -35.71759796142578, "global_step": 85956, "epoch": 710} {"train_loss": -37.57168197631836, "global_step": 85957, "epoch": 710} {"train_loss": -36.21828842163086, "global_step": 85958, "epoch": 710} {"train_loss": -37.19222640991211, "global_step": 85959, "epoch": 710} {"train_loss": -37.1221809387207, "global_step": 85960, "epoch": 710} {"train_loss": -36.93193054199219, "global_step": 85961, "epoch": 710} {"train_loss": -38.386566162109375, "global_step": 85962, "epoch": 710} {"train_loss": -37.38875198364258, "global_step": 85963, "epoch": 710} {"train_loss": -37.111244201660156, "global_step": 85964, "epoch": 710} {"train_loss": -37.73482131958008, "global_step": 85965, "epoch": 710} {"train_loss": -38.39922332763672, "global_step": 85966, "epoch": 710} {"train_loss": -38.273956298828125, "global_step": 85967, "epoch": 710} {"train_loss": -38.14617919921875, "global_step": 85968, "epoch": 710} {"train_loss": -37.48688507080078, "global_step": 85969, "epoch": 710} {"train_loss": -38.358726501464844, "global_step": 85970, "epoch": 710} {"train_loss": -38.05530548095703, "global_step": 85971, "epoch": 710} {"train_loss": -38.13092041015625, "global_step": 85972, "epoch": 710} {"train_loss": -38.2526969909668, "global_step": 85973, "epoch": 710} {"train_loss": -37.4656867980957, "global_step": 85974, "epoch": 710} {"train_loss": -38.1948127746582, "global_step": 85975, "epoch": 710} {"train_loss": -37.61661911010742, "global_step": 85976, "epoch": 710} {"train_loss": -38.324798583984375, "global_step": 85977, "epoch": 710} {"train_loss": -38.438690185546875, "global_step": 85978, "epoch": 710} {"train_loss": -34.409217834472656, "global_step": 85979, "epoch": 710} {"train_loss": -38.452674865722656, "global_step": 85980, "epoch": 710} {"train_loss": -38.35319137573242, "global_step": 85981, "epoch": 710} {"train_loss": -38.167720794677734, "global_step": 85982, "epoch": 710} {"train_loss": -37.83951950073242, "global_step": 85983, "epoch": 710} {"train_loss": -38.13154220581055, "global_step": 85984, "epoch": 710} {"train_loss": -38.16107940673828, "global_step": 85985, "epoch": 710} {"train_loss": -38.296600341796875, "global_step": 85986, "epoch": 710} {"train_loss": -38.0421257019043, "global_step": 85987, "epoch": 710} {"train_loss": -37.936195373535156, "global_step": 85988, "epoch": 710} {"train_loss": -38.102264404296875, "global_step": 85989, "epoch": 710} {"train_loss": -37.97649002075195, "global_step": 85990, "epoch": 710} {"train_loss": -38.33631896972656, "global_step": 85991, "epoch": 710} {"train_loss": -38.183876037597656, "global_step": 85992, "epoch": 710} {"train_loss": -38.1245231628418, "global_step": 85993, "epoch": 710} {"train_loss": -38.39665985107422, "global_step": 85994, "epoch": 710} {"train_loss": -36.71914291381836, "global_step": 85995, "epoch": 710} {"train_loss": -37.91799545288086, "global_step": 85996, "epoch": 710} {"train_loss": -37.84536361694336, "global_step": 85997, "epoch": 710} {"train_loss": -37.14738082885742, "global_step": 85998, "epoch": 710} {"train_loss": -37.6655387878418, "global_step": 85999, "epoch": 710} {"train_loss": -38.1341552734375, "global_step": 86000, "epoch": 710} {"train_loss": -38.39106369018555, "global_step": 86001, "epoch": 710} {"train_loss": -38.63763427734375, "global_step": 86002, "epoch": 710} {"train_loss": -38.090877532958984, "global_step": 86003, "epoch": 710} {"train_loss": -37.28607177734375, "global_step": 86004, "epoch": 710} {"train_loss": -36.658790588378906, "global_step": 86005, "epoch": 710} {"train_loss": -36.536014556884766, "global_step": 86006, "epoch": 710} {"train_loss": -38.82548904418945, "global_step": 86007, "epoch": 710} {"train_loss": -36.8615837097168, "global_step": 86008, "epoch": 710} {"train_loss": -38.219764709472656, "global_step": 86009, "epoch": 710} {"train_loss": -36.94069290161133, "global_step": 86010, "epoch": 710} {"train_loss": -37.21479034423828, "global_step": 86011, "epoch": 710} {"train_loss": -38.70492172241211, "global_step": 86012, "epoch": 710} {"train_loss": -38.67451095581055, "global_step": 86013, "epoch": 710} {"train_loss": -38.34096908569336, "global_step": 86014, "epoch": 710} {"train_loss": -38.71294021606445, "global_step": 86015, "epoch": 710} {"train_loss": -38.27473068237305, "global_step": 86016, "epoch": 710} {"train_loss": -38.15751647949219, "global_step": 86017, "epoch": 710} {"train_loss": -38.585426330566406, "global_step": 86018, "epoch": 710} {"train_loss": -38.5321044921875, "global_step": 86019, "epoch": 710} {"train_loss": -38.475833892822266, "global_step": 86020, "epoch": 710} {"train_loss": -38.71845626831055, "global_step": 86021, "epoch": 710} {"train_loss": -38.49605941772461, "global_step": 86022, "epoch": 710} {"train_loss": -38.69684982299805, "global_step": 86023, "epoch": 710} {"train_loss": -38.4134635925293, "global_step": 86024, "epoch": 710} {"train_loss": -38.561614990234375, "global_step": 86025, "epoch": 710} {"train_loss": -38.4559440612793, "global_step": 86026, "epoch": 710} {"train_loss": -38.02919006347656, "global_step": 86027, "epoch": 710} {"train_loss": -37.4022102355957, "global_step": 86028, "epoch": 710} {"train_loss": -35.716976165771484, "global_step": 86029, "epoch": 710} {"train_loss": -37.58143530601312, "global_step": 86030, "epoch": 710, "val_loss": 2698828.75} {"train_loss": -37.22064971923828, "global_step": 86031, "epoch": 711} {"train_loss": -37.21657180786133, "global_step": 86032, "epoch": 711} {"train_loss": -34.641090393066406, "global_step": 86033, "epoch": 711} {"train_loss": -33.73357009887695, "global_step": 86034, "epoch": 711} {"train_loss": -36.92267990112305, "global_step": 86035, "epoch": 711} {"train_loss": -37.01298141479492, "global_step": 86036, "epoch": 711} {"train_loss": -36.182796478271484, "global_step": 86037, "epoch": 711} {"train_loss": -36.17924499511719, "global_step": 86038, "epoch": 711} {"train_loss": -35.68729782104492, "global_step": 86039, "epoch": 711} {"train_loss": -36.78303527832031, "global_step": 86040, "epoch": 711} {"train_loss": -37.257102966308594, "global_step": 86041, "epoch": 711} {"train_loss": -37.04154586791992, "global_step": 86042, "epoch": 711} {"train_loss": -37.595977783203125, "global_step": 86043, "epoch": 711} {"train_loss": -37.954132080078125, "global_step": 86044, "epoch": 711} {"train_loss": -35.07255172729492, "global_step": 86045, "epoch": 711} {"train_loss": -37.51918029785156, "global_step": 86046, "epoch": 711} {"train_loss": -37.926998138427734, "global_step": 86047, "epoch": 711} {"train_loss": -36.82125473022461, "global_step": 86048, "epoch": 711} {"train_loss": -37.91617965698242, "global_step": 86049, "epoch": 711} {"train_loss": -36.34632873535156, "global_step": 86050, "epoch": 711} {"train_loss": -37.15778732299805, "global_step": 86051, "epoch": 711} {"train_loss": -35.53926467895508, "global_step": 86052, "epoch": 711} {"train_loss": -36.808536529541016, "global_step": 86053, "epoch": 711} {"train_loss": -38.104408264160156, "global_step": 86054, "epoch": 711} {"train_loss": -37.34491729736328, "global_step": 86055, "epoch": 711} {"train_loss": -37.648250579833984, "global_step": 86056, "epoch": 711} {"train_loss": -36.359718322753906, "global_step": 86057, "epoch": 711} {"train_loss": -37.2378044128418, "global_step": 86058, "epoch": 711} {"train_loss": -36.91292953491211, "global_step": 86059, "epoch": 711} {"train_loss": -36.7153205871582, "global_step": 86060, "epoch": 711} {"train_loss": -37.12086868286133, "global_step": 86061, "epoch": 711} {"train_loss": -37.637451171875, "global_step": 86062, "epoch": 711} {"train_loss": -37.03190994262695, "global_step": 86063, "epoch": 711} {"train_loss": -37.72043991088867, "global_step": 86064, "epoch": 711} {"train_loss": -37.41142272949219, "global_step": 86065, "epoch": 711} {"train_loss": -36.016658782958984, "global_step": 86066, "epoch": 711} {"train_loss": -35.83211898803711, "global_step": 86067, "epoch": 711} {"train_loss": -36.060211181640625, "global_step": 86068, "epoch": 711} {"train_loss": -37.03977584838867, "global_step": 86069, "epoch": 711} {"train_loss": -37.35927963256836, "global_step": 86070, "epoch": 711} {"train_loss": -36.59649658203125, "global_step": 86071, "epoch": 711} {"train_loss": -36.15553665161133, "global_step": 86072, "epoch": 711} {"train_loss": -36.164981842041016, "global_step": 86073, "epoch": 711} {"train_loss": -37.48454666137695, "global_step": 86074, "epoch": 711} {"train_loss": -37.07876968383789, "global_step": 86075, "epoch": 711} {"train_loss": -36.94999313354492, "global_step": 86076, "epoch": 711} {"train_loss": -36.89548873901367, "global_step": 86077, "epoch": 711} {"train_loss": -37.301185607910156, "global_step": 86078, "epoch": 711} {"train_loss": -37.656280517578125, "global_step": 86079, "epoch": 711} {"train_loss": -37.3862419128418, "global_step": 86080, "epoch": 711} {"train_loss": -37.419063568115234, "global_step": 86081, "epoch": 711} {"train_loss": -37.49673080444336, "global_step": 86082, "epoch": 711} {"train_loss": -38.14763641357422, "global_step": 86083, "epoch": 711} {"train_loss": -37.7305908203125, "global_step": 86084, "epoch": 711} {"train_loss": -37.43815231323242, "global_step": 86085, "epoch": 711} {"train_loss": -37.816070556640625, "global_step": 86086, "epoch": 711} {"train_loss": -37.68619155883789, "global_step": 86087, "epoch": 711} {"train_loss": -38.29341125488281, "global_step": 86088, "epoch": 711} {"train_loss": -37.7808952331543, "global_step": 86089, "epoch": 711} {"train_loss": -37.759666442871094, "global_step": 86090, "epoch": 711} {"train_loss": -37.82057571411133, "global_step": 86091, "epoch": 711} {"train_loss": -38.00621795654297, "global_step": 86092, "epoch": 711} {"train_loss": -36.75397872924805, "global_step": 86093, "epoch": 711} {"train_loss": -37.980228424072266, "global_step": 86094, "epoch": 711} {"train_loss": -38.165077209472656, "global_step": 86095, "epoch": 711} {"train_loss": -37.83793640136719, "global_step": 86096, "epoch": 711} {"train_loss": -38.334266662597656, "global_step": 86097, "epoch": 711} {"train_loss": -38.05836868286133, "global_step": 86098, "epoch": 711} {"train_loss": -38.146121978759766, "global_step": 86099, "epoch": 711} {"train_loss": -38.3918571472168, "global_step": 86100, "epoch": 711} {"train_loss": -37.89398193359375, "global_step": 86101, "epoch": 711} {"train_loss": -38.236629486083984, "global_step": 86102, "epoch": 711} {"train_loss": -38.492889404296875, "global_step": 86103, "epoch": 711} {"train_loss": -38.44765853881836, "global_step": 86104, "epoch": 711} {"train_loss": -38.030818939208984, "global_step": 86105, "epoch": 711} {"train_loss": -38.2550048828125, "global_step": 86106, "epoch": 711} {"train_loss": -38.68437194824219, "global_step": 86107, "epoch": 711} {"train_loss": -38.71572494506836, "global_step": 86108, "epoch": 711} {"train_loss": -37.586822509765625, "global_step": 86109, "epoch": 711} {"train_loss": -37.05442810058594, "global_step": 86110, "epoch": 711} {"train_loss": -34.45326614379883, "global_step": 86111, "epoch": 711} {"train_loss": -30.53687858581543, "global_step": 86112, "epoch": 711} {"train_loss": -33.81915283203125, "global_step": 86113, "epoch": 711} {"train_loss": -23.737960815429688, "global_step": 86114, "epoch": 711} {"train_loss": -23.44246482849121, "global_step": 86115, "epoch": 711} {"train_loss": -15.904440879821777, "global_step": 86116, "epoch": 711} {"train_loss": 11.496230125427246, "global_step": 86117, "epoch": 711} {"train_loss": 7.226409912109375, "global_step": 86118, "epoch": 711} {"train_loss": -25.80605125427246, "global_step": 86119, "epoch": 711} {"train_loss": -14.461708068847656, "global_step": 86120, "epoch": 711} {"train_loss": -21.405258178710938, "global_step": 86121, "epoch": 711} {"train_loss": -23.384628295898438, "global_step": 86122, "epoch": 711} {"train_loss": -19.770902633666992, "global_step": 86123, "epoch": 711} {"train_loss": -25.82246971130371, "global_step": 86124, "epoch": 711} {"train_loss": -27.797595977783203, "global_step": 86125, "epoch": 711} {"train_loss": -24.171829223632812, "global_step": 86126, "epoch": 711} {"train_loss": -28.277761459350586, "global_step": 86127, "epoch": 711} {"train_loss": -28.380569458007812, "global_step": 86128, "epoch": 711} {"train_loss": -28.800342559814453, "global_step": 86129, "epoch": 711} {"train_loss": -28.19589614868164, "global_step": 86130, "epoch": 711} {"train_loss": -27.9083309173584, "global_step": 86131, "epoch": 711} {"train_loss": -30.753406524658203, "global_step": 86132, "epoch": 711} {"train_loss": -29.869037628173828, "global_step": 86133, "epoch": 711} {"train_loss": -29.364797592163086, "global_step": 86134, "epoch": 711} {"train_loss": -29.701513290405273, "global_step": 86135, "epoch": 711} {"train_loss": -30.216222763061523, "global_step": 86136, "epoch": 711} {"train_loss": -31.1079158782959, "global_step": 86137, "epoch": 711} {"train_loss": -32.0855712890625, "global_step": 86138, "epoch": 711} {"train_loss": -31.113067626953125, "global_step": 86139, "epoch": 711} {"train_loss": -30.450775146484375, "global_step": 86140, "epoch": 711} {"train_loss": -31.73508071899414, "global_step": 86141, "epoch": 711} {"train_loss": -31.76871109008789, "global_step": 86142, "epoch": 711} {"train_loss": -32.40453338623047, "global_step": 86143, "epoch": 711} {"train_loss": -32.62232208251953, "global_step": 86144, "epoch": 711} {"train_loss": -32.40999221801758, "global_step": 86145, "epoch": 711} {"train_loss": -32.4983024597168, "global_step": 86146, "epoch": 711} {"train_loss": -32.98690414428711, "global_step": 86147, "epoch": 711} {"train_loss": -32.83000946044922, "global_step": 86148, "epoch": 711} {"train_loss": -32.87299728393555, "global_step": 86149, "epoch": 711} {"train_loss": -33.40974807739258, "global_step": 86150, "epoch": 711} {"train_loss": -33.730751400151526, "global_step": 86151, "epoch": 711, "val_loss": 2830132.0} {"train_loss": -33.80860137939453, "global_step": 86152, "epoch": 712} {"train_loss": -33.82624435424805, "global_step": 86153, "epoch": 712} {"train_loss": -33.46354293823242, "global_step": 86154, "epoch": 712} {"train_loss": -34.31071090698242, "global_step": 86155, "epoch": 712} {"train_loss": -34.69990921020508, "global_step": 86156, "epoch": 712} {"train_loss": -34.32434844970703, "global_step": 86157, "epoch": 712} {"train_loss": -34.28902053833008, "global_step": 86158, "epoch": 712} {"train_loss": -34.00834655761719, "global_step": 86159, "epoch": 712} {"train_loss": -33.83708190917969, "global_step": 86160, "epoch": 712} {"train_loss": -33.40318298339844, "global_step": 86161, "epoch": 712} {"train_loss": -33.858551025390625, "global_step": 86162, "epoch": 712} {"train_loss": -33.869346618652344, "global_step": 86163, "epoch": 712} {"train_loss": -33.66358947753906, "global_step": 86164, "epoch": 712} {"train_loss": -33.82133865356445, "global_step": 86165, "epoch": 712} {"train_loss": -34.39579391479492, "global_step": 86166, "epoch": 712} {"train_loss": -34.88644027709961, "global_step": 86167, "epoch": 712} {"train_loss": -34.75712585449219, "global_step": 86168, "epoch": 712} {"train_loss": -35.50224304199219, "global_step": 86169, "epoch": 712} {"train_loss": -34.53038024902344, "global_step": 86170, "epoch": 712} {"train_loss": -34.418174743652344, "global_step": 86171, "epoch": 712} {"train_loss": -34.33845138549805, "global_step": 86172, "epoch": 712} {"train_loss": -33.69978713989258, "global_step": 86173, "epoch": 712} {"train_loss": -34.42250442504883, "global_step": 86174, "epoch": 712} {"train_loss": -35.48432540893555, "global_step": 86175, "epoch": 712} {"train_loss": -35.338191986083984, "global_step": 86176, "epoch": 712} {"train_loss": -34.51131057739258, "global_step": 86177, "epoch": 712} {"train_loss": -34.56034469604492, "global_step": 86178, "epoch": 712} {"train_loss": -35.32821273803711, "global_step": 86179, "epoch": 712} {"train_loss": -35.86591720581055, "global_step": 86180, "epoch": 712} {"train_loss": -35.873722076416016, "global_step": 86181, "epoch": 712} {"train_loss": -35.15513229370117, "global_step": 86182, "epoch": 712} {"train_loss": -34.42861557006836, "global_step": 86183, "epoch": 712} {"train_loss": -35.52009201049805, "global_step": 86184, "epoch": 712} {"train_loss": -35.678829193115234, "global_step": 86185, "epoch": 712} {"train_loss": -35.45166015625, "global_step": 86186, "epoch": 712} {"train_loss": -35.8414421081543, "global_step": 86187, "epoch": 712} {"train_loss": -35.802547454833984, "global_step": 86188, "epoch": 712} {"train_loss": -35.49949264526367, "global_step": 86189, "epoch": 712} {"train_loss": -35.472347259521484, "global_step": 86190, "epoch": 712} {"train_loss": -35.93973922729492, "global_step": 86191, "epoch": 712} {"train_loss": -35.939823150634766, "global_step": 86192, "epoch": 712} {"train_loss": -35.9151725769043, "global_step": 86193, "epoch": 712} {"train_loss": -35.455528259277344, "global_step": 86194, "epoch": 712} {"train_loss": -35.47054672241211, "global_step": 86195, "epoch": 712} {"train_loss": -35.954002380371094, "global_step": 86196, "epoch": 712} {"train_loss": -34.72079086303711, "global_step": 86197, "epoch": 712} {"train_loss": -33.17529296875, "global_step": 86198, "epoch": 712} {"train_loss": -30.6810302734375, "global_step": 86199, "epoch": 712} {"train_loss": -31.852890014648438, "global_step": 86200, "epoch": 712} {"train_loss": -36.32207107543945, "global_step": 86201, "epoch": 712} {"train_loss": -32.969032287597656, "global_step": 86202, "epoch": 712} {"train_loss": -35.75516891479492, "global_step": 86203, "epoch": 712} {"train_loss": -33.46920394897461, "global_step": 86204, "epoch": 712} {"train_loss": -35.629634857177734, "global_step": 86205, "epoch": 712} {"train_loss": -34.71353530883789, "global_step": 86206, "epoch": 712} {"train_loss": -36.13837432861328, "global_step": 86207, "epoch": 712} {"train_loss": -35.61231231689453, "global_step": 86208, "epoch": 712} {"train_loss": -35.233856201171875, "global_step": 86209, "epoch": 712} {"train_loss": -35.75339889526367, "global_step": 86210, "epoch": 712} {"train_loss": -35.46579360961914, "global_step": 86211, "epoch": 712} {"train_loss": -35.295570373535156, "global_step": 86212, "epoch": 712} {"train_loss": -34.81660079956055, "global_step": 86213, "epoch": 712} {"train_loss": -35.62246322631836, "global_step": 86214, "epoch": 712} {"train_loss": -35.530452728271484, "global_step": 86215, "epoch": 712} {"train_loss": -34.75087356567383, "global_step": 86216, "epoch": 712} {"train_loss": -36.2899284362793, "global_step": 86217, "epoch": 712} {"train_loss": -35.32280349731445, "global_step": 86218, "epoch": 712} {"train_loss": -35.713768005371094, "global_step": 86219, "epoch": 712} {"train_loss": -35.703086853027344, "global_step": 86220, "epoch": 712} {"train_loss": -35.01298141479492, "global_step": 86221, "epoch": 712} {"train_loss": -36.3638801574707, "global_step": 86222, "epoch": 712} {"train_loss": -35.03778076171875, "global_step": 86223, "epoch": 712} {"train_loss": -35.80447006225586, "global_step": 86224, "epoch": 712} {"train_loss": -36.00055694580078, "global_step": 86225, "epoch": 712} {"train_loss": -35.46385955810547, "global_step": 86226, "epoch": 712} {"train_loss": -36.709712982177734, "global_step": 86227, "epoch": 712} {"train_loss": -35.97271728515625, "global_step": 86228, "epoch": 712} {"train_loss": -36.21553421020508, "global_step": 86229, "epoch": 712} {"train_loss": -35.922054290771484, "global_step": 86230, "epoch": 712} {"train_loss": -36.57902908325195, "global_step": 86231, "epoch": 712} {"train_loss": -36.398773193359375, "global_step": 86232, "epoch": 712} {"train_loss": -36.4780158996582, "global_step": 86233, "epoch": 712} {"train_loss": -36.761085510253906, "global_step": 86234, "epoch": 712} {"train_loss": -36.878631591796875, "global_step": 86235, "epoch": 712} {"train_loss": -36.877479553222656, "global_step": 86236, "epoch": 712} {"train_loss": -37.1785774230957, "global_step": 86237, "epoch": 712} {"train_loss": -36.400630950927734, "global_step": 86238, "epoch": 712} {"train_loss": -36.98515319824219, "global_step": 86239, "epoch": 712} {"train_loss": -36.90452194213867, "global_step": 86240, "epoch": 712} {"train_loss": -36.72352981567383, "global_step": 86241, "epoch": 712} {"train_loss": -36.80971908569336, "global_step": 86242, "epoch": 712} {"train_loss": -36.743011474609375, "global_step": 86243, "epoch": 712} {"train_loss": -35.9840202331543, "global_step": 86244, "epoch": 712} {"train_loss": -36.52009201049805, "global_step": 86245, "epoch": 712} {"train_loss": -36.826995849609375, "global_step": 86246, "epoch": 712} {"train_loss": -36.723976135253906, "global_step": 86247, "epoch": 712} {"train_loss": -36.850032806396484, "global_step": 86248, "epoch": 712} {"train_loss": -36.78727722167969, "global_step": 86249, "epoch": 712} {"train_loss": -36.62078857421875, "global_step": 86250, "epoch": 712} {"train_loss": -37.03880310058594, "global_step": 86251, "epoch": 712} {"train_loss": -36.980712890625, "global_step": 86252, "epoch": 712} {"train_loss": -37.37814712524414, "global_step": 86253, "epoch": 712} {"train_loss": -37.33246994018555, "global_step": 86254, "epoch": 712} {"train_loss": -36.973785400390625, "global_step": 86255, "epoch": 712} {"train_loss": -37.257293701171875, "global_step": 86256, "epoch": 712} {"train_loss": -37.183929443359375, "global_step": 86257, "epoch": 712} {"train_loss": -37.623023986816406, "global_step": 86258, "epoch": 712} {"train_loss": -37.124855041503906, "global_step": 86259, "epoch": 712} {"train_loss": -36.900089263916016, "global_step": 86260, "epoch": 712} {"train_loss": -36.49857711791992, "global_step": 86261, "epoch": 712} {"train_loss": -36.90635299682617, "global_step": 86262, "epoch": 712} {"train_loss": -36.93427276611328, "global_step": 86263, "epoch": 712} {"train_loss": -36.686485290527344, "global_step": 86264, "epoch": 712} {"train_loss": -36.934471130371094, "global_step": 86265, "epoch": 712} {"train_loss": -36.5557861328125, "global_step": 86266, "epoch": 712} {"train_loss": -36.065704345703125, "global_step": 86267, "epoch": 712} {"train_loss": -36.87484359741211, "global_step": 86268, "epoch": 712} {"train_loss": -36.655330657958984, "global_step": 86269, "epoch": 712} {"train_loss": -36.88413619995117, "global_step": 86270, "epoch": 712} {"train_loss": -35.932762145996094, "global_step": 86271, "epoch": 712} {"train_loss": -35.588998715739606, "global_step": 86272, "epoch": 712, "val_loss": 2721659.75} {"train_loss": -36.27446365356445, "global_step": 86273, "epoch": 713} {"train_loss": -36.91492462158203, "global_step": 86274, "epoch": 713} {"train_loss": -35.791725158691406, "global_step": 86275, "epoch": 713} {"train_loss": -36.69295120239258, "global_step": 86276, "epoch": 713} {"train_loss": -34.7529296875, "global_step": 86277, "epoch": 713} {"train_loss": -35.32118225097656, "global_step": 86278, "epoch": 713} {"train_loss": -35.4593505859375, "global_step": 86279, "epoch": 713} {"train_loss": -36.32823944091797, "global_step": 86280, "epoch": 713} {"train_loss": -37.167030334472656, "global_step": 86281, "epoch": 713} {"train_loss": -35.4849739074707, "global_step": 86282, "epoch": 713} {"train_loss": -37.098297119140625, "global_step": 86283, "epoch": 713} {"train_loss": -36.22364044189453, "global_step": 86284, "epoch": 713} {"train_loss": -37.024147033691406, "global_step": 86285, "epoch": 713} {"train_loss": -36.84939193725586, "global_step": 86286, "epoch": 713} {"train_loss": -35.18457794189453, "global_step": 86287, "epoch": 713} {"train_loss": -35.00775909423828, "global_step": 86288, "epoch": 713} {"train_loss": -37.143611907958984, "global_step": 86289, "epoch": 713} {"train_loss": -32.0544548034668, "global_step": 86290, "epoch": 713} {"train_loss": -33.81547927856445, "global_step": 86291, "epoch": 713} {"train_loss": -31.12543296813965, "global_step": 86292, "epoch": 713} {"train_loss": -30.179859161376953, "global_step": 86293, "epoch": 713} {"train_loss": -35.906700134277344, "global_step": 86294, "epoch": 713} {"train_loss": -35.1243896484375, "global_step": 86295, "epoch": 713} {"train_loss": -31.80959129333496, "global_step": 86296, "epoch": 713} {"train_loss": -36.46499252319336, "global_step": 86297, "epoch": 713} {"train_loss": -34.136409759521484, "global_step": 86298, "epoch": 713} {"train_loss": -34.126625061035156, "global_step": 86299, "epoch": 713} {"train_loss": -35.8204231262207, "global_step": 86300, "epoch": 713} {"train_loss": -30.27378273010254, "global_step": 86301, "epoch": 713} {"train_loss": -36.399078369140625, "global_step": 86302, "epoch": 713} {"train_loss": -36.9088134765625, "global_step": 86303, "epoch": 713} {"train_loss": -34.895687103271484, "global_step": 86304, "epoch": 713} {"train_loss": -33.65336608886719, "global_step": 86305, "epoch": 713} {"train_loss": -35.36771011352539, "global_step": 86306, "epoch": 713} {"train_loss": -36.52280807495117, "global_step": 86307, "epoch": 713} {"train_loss": -35.35415267944336, "global_step": 86308, "epoch": 713} {"train_loss": -36.5952262878418, "global_step": 86309, "epoch": 713} {"train_loss": -35.89814758300781, "global_step": 86310, "epoch": 713} {"train_loss": -36.94643783569336, "global_step": 86311, "epoch": 713} {"train_loss": -36.720149993896484, "global_step": 86312, "epoch": 713} {"train_loss": -37.311195373535156, "global_step": 86313, "epoch": 713} {"train_loss": -36.904014587402344, "global_step": 86314, "epoch": 713} {"train_loss": -36.499935150146484, "global_step": 86315, "epoch": 713} {"train_loss": -37.50007247924805, "global_step": 86316, "epoch": 713} {"train_loss": -36.928775787353516, "global_step": 86317, "epoch": 713} {"train_loss": -37.60390853881836, "global_step": 86318, "epoch": 713} {"train_loss": -37.12890625, "global_step": 86319, "epoch": 713} {"train_loss": -35.116546630859375, "global_step": 86320, "epoch": 713} {"train_loss": -35.72151565551758, "global_step": 86321, "epoch": 713} {"train_loss": -35.12266159057617, "global_step": 86322, "epoch": 713} {"train_loss": -36.249324798583984, "global_step": 86323, "epoch": 713} {"train_loss": -35.808258056640625, "global_step": 86324, "epoch": 713} {"train_loss": -36.46036911010742, "global_step": 86325, "epoch": 713} {"train_loss": -36.3544807434082, "global_step": 86326, "epoch": 713} {"train_loss": -33.943843841552734, "global_step": 86327, "epoch": 713} {"train_loss": -33.284786224365234, "global_step": 86328, "epoch": 713} {"train_loss": -34.81689453125, "global_step": 86329, "epoch": 713} {"train_loss": -35.95594024658203, "global_step": 86330, "epoch": 713} {"train_loss": -36.71083450317383, "global_step": 86331, "epoch": 713} {"train_loss": -33.68000030517578, "global_step": 86332, "epoch": 713} {"train_loss": -32.32642364501953, "global_step": 86333, "epoch": 713} {"train_loss": -31.32561683654785, "global_step": 86334, "epoch": 713} {"train_loss": -36.80206298828125, "global_step": 86335, "epoch": 713} {"train_loss": -35.58620834350586, "global_step": 86336, "epoch": 713} {"train_loss": -33.41038131713867, "global_step": 86337, "epoch": 713} {"train_loss": -35.52653121948242, "global_step": 86338, "epoch": 713} {"train_loss": -36.079036712646484, "global_step": 86339, "epoch": 713} {"train_loss": -33.80347442626953, "global_step": 86340, "epoch": 713} {"train_loss": -36.95246505737305, "global_step": 86341, "epoch": 713} {"train_loss": -35.75934600830078, "global_step": 86342, "epoch": 713} {"train_loss": -36.04934310913086, "global_step": 86343, "epoch": 713} {"train_loss": -36.68040084838867, "global_step": 86344, "epoch": 713} {"train_loss": -34.9834098815918, "global_step": 86345, "epoch": 713} {"train_loss": -36.73662185668945, "global_step": 86346, "epoch": 713} {"train_loss": -35.79170227050781, "global_step": 86347, "epoch": 713} {"train_loss": -36.14616775512695, "global_step": 86348, "epoch": 713} {"train_loss": -36.648536682128906, "global_step": 86349, "epoch": 713} {"train_loss": -36.33437728881836, "global_step": 86350, "epoch": 713} {"train_loss": -37.019710540771484, "global_step": 86351, "epoch": 713} {"train_loss": -36.64366912841797, "global_step": 86352, "epoch": 713} {"train_loss": -36.601531982421875, "global_step": 86353, "epoch": 713} {"train_loss": -34.37289047241211, "global_step": 86354, "epoch": 713} {"train_loss": -33.57189178466797, "global_step": 86355, "epoch": 713} {"train_loss": -34.7274284362793, "global_step": 86356, "epoch": 713} {"train_loss": -36.616294860839844, "global_step": 86357, "epoch": 713} {"train_loss": -36.5708122253418, "global_step": 86358, "epoch": 713} {"train_loss": -35.33448791503906, "global_step": 86359, "epoch": 713} {"train_loss": -36.40363311767578, "global_step": 86360, "epoch": 713} {"train_loss": -34.900596618652344, "global_step": 86361, "epoch": 713} {"train_loss": -36.634159088134766, "global_step": 86362, "epoch": 713} {"train_loss": -35.2749137878418, "global_step": 86363, "epoch": 713} {"train_loss": -37.00484085083008, "global_step": 86364, "epoch": 713} {"train_loss": -36.250301361083984, "global_step": 86365, "epoch": 713} {"train_loss": -37.02777862548828, "global_step": 86366, "epoch": 713} {"train_loss": -37.00404739379883, "global_step": 86367, "epoch": 713} {"train_loss": -37.1385498046875, "global_step": 86368, "epoch": 713} {"train_loss": -36.37549591064453, "global_step": 86369, "epoch": 713} {"train_loss": -36.99000930786133, "global_step": 86370, "epoch": 713} {"train_loss": -36.79890060424805, "global_step": 86371, "epoch": 713} {"train_loss": -37.067115783691406, "global_step": 86372, "epoch": 713} {"train_loss": -37.01841354370117, "global_step": 86373, "epoch": 713} {"train_loss": -37.33513259887695, "global_step": 86374, "epoch": 713} {"train_loss": -37.34725570678711, "global_step": 86375, "epoch": 713} {"train_loss": -36.5394172668457, "global_step": 86376, "epoch": 713} {"train_loss": -36.848384857177734, "global_step": 86377, "epoch": 713} {"train_loss": -37.321956634521484, "global_step": 86378, "epoch": 713} {"train_loss": -37.55072784423828, "global_step": 86379, "epoch": 713} {"train_loss": -36.57889938354492, "global_step": 86380, "epoch": 713} {"train_loss": -36.77762985229492, "global_step": 86381, "epoch": 713} {"train_loss": -37.3310432434082, "global_step": 86382, "epoch": 713} {"train_loss": -36.98699951171875, "global_step": 86383, "epoch": 713} {"train_loss": -37.180416107177734, "global_step": 86384, "epoch": 713} {"train_loss": -37.25592803955078, "global_step": 86385, "epoch": 713} {"train_loss": -37.20762634277344, "global_step": 86386, "epoch": 713} {"train_loss": -37.262386322021484, "global_step": 86387, "epoch": 713} {"train_loss": -37.391048431396484, "global_step": 86388, "epoch": 713} {"train_loss": -37.64231491088867, "global_step": 86389, "epoch": 713} {"train_loss": -36.46779251098633, "global_step": 86390, "epoch": 713} {"train_loss": -35.494384765625, "global_step": 86391, "epoch": 713} {"train_loss": -37.35247802734375, "global_step": 86392, "epoch": 713} {"train_loss": -35.87610541099359, "global_step": 86393, "epoch": 713, "val_loss": 2723551.25} {"train_loss": -36.91875076293945, "global_step": 86394, "epoch": 714} {"train_loss": -36.49694061279297, "global_step": 86395, "epoch": 714} {"train_loss": -36.94218444824219, "global_step": 86396, "epoch": 714} {"train_loss": -36.87892532348633, "global_step": 86397, "epoch": 714} {"train_loss": -33.99471664428711, "global_step": 86398, "epoch": 714} {"train_loss": -30.80096435546875, "global_step": 86399, "epoch": 714} {"train_loss": -28.693124771118164, "global_step": 86400, "epoch": 714} {"train_loss": -30.109472274780273, "global_step": 86401, "epoch": 714} {"train_loss": -36.29438400268555, "global_step": 86402, "epoch": 714} {"train_loss": -33.545166015625, "global_step": 86403, "epoch": 714} {"train_loss": -35.180843353271484, "global_step": 86404, "epoch": 714} {"train_loss": -33.577022552490234, "global_step": 86405, "epoch": 714} {"train_loss": -36.55052947998047, "global_step": 86406, "epoch": 714} {"train_loss": -33.95589828491211, "global_step": 86407, "epoch": 714} {"train_loss": -30.513601303100586, "global_step": 86408, "epoch": 714} {"train_loss": -33.810302734375, "global_step": 86409, "epoch": 714} {"train_loss": -34.12858200073242, "global_step": 86410, "epoch": 714} {"train_loss": -35.60398483276367, "global_step": 86411, "epoch": 714} {"train_loss": -33.58211135864258, "global_step": 86412, "epoch": 714} {"train_loss": -32.82594680786133, "global_step": 86413, "epoch": 714} {"train_loss": -35.2302360534668, "global_step": 86414, "epoch": 714} {"train_loss": -33.0045166015625, "global_step": 86415, "epoch": 714} {"train_loss": -34.6710319519043, "global_step": 86416, "epoch": 714} {"train_loss": -32.53664016723633, "global_step": 86417, "epoch": 714} {"train_loss": -33.25990676879883, "global_step": 86418, "epoch": 714} {"train_loss": -33.79367446899414, "global_step": 86419, "epoch": 714} {"train_loss": -34.07843780517578, "global_step": 86420, "epoch": 714} {"train_loss": -34.76625442504883, "global_step": 86421, "epoch": 714} {"train_loss": -34.7816047668457, "global_step": 86422, "epoch": 714} {"train_loss": -33.4478759765625, "global_step": 86423, "epoch": 714} {"train_loss": -34.91151809692383, "global_step": 86424, "epoch": 714} {"train_loss": -35.068389892578125, "global_step": 86425, "epoch": 714} {"train_loss": -34.397945404052734, "global_step": 86426, "epoch": 714} {"train_loss": -36.19414520263672, "global_step": 86427, "epoch": 714} {"train_loss": -34.252418518066406, "global_step": 86428, "epoch": 714} {"train_loss": -35.42704772949219, "global_step": 86429, "epoch": 714} {"train_loss": -34.991493225097656, "global_step": 86430, "epoch": 714} {"train_loss": -34.581233978271484, "global_step": 86431, "epoch": 714} {"train_loss": -34.60902404785156, "global_step": 86432, "epoch": 714} {"train_loss": -35.184566497802734, "global_step": 86433, "epoch": 714} {"train_loss": -35.295074462890625, "global_step": 86434, "epoch": 714} {"train_loss": -35.81244659423828, "global_step": 86435, "epoch": 714} {"train_loss": -35.88253402709961, "global_step": 86436, "epoch": 714} {"train_loss": -35.686927795410156, "global_step": 86437, "epoch": 714} {"train_loss": -36.421958923339844, "global_step": 86438, "epoch": 714} {"train_loss": -35.9069709777832, "global_step": 86439, "epoch": 714} {"train_loss": -35.99977493286133, "global_step": 86440, "epoch": 714} {"train_loss": -35.652503967285156, "global_step": 86441, "epoch": 714} {"train_loss": -36.23525619506836, "global_step": 86442, "epoch": 714} {"train_loss": -35.90314483642578, "global_step": 86443, "epoch": 714} {"train_loss": -35.81925582885742, "global_step": 86444, "epoch": 714} {"train_loss": -35.90468978881836, "global_step": 86445, "epoch": 714} {"train_loss": -36.118953704833984, "global_step": 86446, "epoch": 714} {"train_loss": -36.45001983642578, "global_step": 86447, "epoch": 714} {"train_loss": -36.390968322753906, "global_step": 86448, "epoch": 714} {"train_loss": -36.316131591796875, "global_step": 86449, "epoch": 714} {"train_loss": -36.262725830078125, "global_step": 86450, "epoch": 714} {"train_loss": -36.615970611572266, "global_step": 86451, "epoch": 714} {"train_loss": -36.9378547668457, "global_step": 86452, "epoch": 714} {"train_loss": -36.12604522705078, "global_step": 86453, "epoch": 714} {"train_loss": -36.993099212646484, "global_step": 86454, "epoch": 714} {"train_loss": -36.65210723876953, "global_step": 86455, "epoch": 714} {"train_loss": -36.47042465209961, "global_step": 86456, "epoch": 714} {"train_loss": -36.93894577026367, "global_step": 86457, "epoch": 714} {"train_loss": -36.94968795776367, "global_step": 86458, "epoch": 714} {"train_loss": -36.564083099365234, "global_step": 86459, "epoch": 714} {"train_loss": -36.827327728271484, "global_step": 86460, "epoch": 714} {"train_loss": -36.98762893676758, "global_step": 86461, "epoch": 714} {"train_loss": -36.48408126831055, "global_step": 86462, "epoch": 714} {"train_loss": -36.65623474121094, "global_step": 86463, "epoch": 714} {"train_loss": -37.03280258178711, "global_step": 86464, "epoch": 714} {"train_loss": -37.22239685058594, "global_step": 86465, "epoch": 714} {"train_loss": -37.0805778503418, "global_step": 86466, "epoch": 714} {"train_loss": -37.2906379699707, "global_step": 86467, "epoch": 714} {"train_loss": -37.02350616455078, "global_step": 86468, "epoch": 714} {"train_loss": -37.42702865600586, "global_step": 86469, "epoch": 714} {"train_loss": -37.42681884765625, "global_step": 86470, "epoch": 714} {"train_loss": -37.472957611083984, "global_step": 86471, "epoch": 714} {"train_loss": -37.322296142578125, "global_step": 86472, "epoch": 714} {"train_loss": -37.49974822998047, "global_step": 86473, "epoch": 714} {"train_loss": -36.66301345825195, "global_step": 86474, "epoch": 714} {"train_loss": -37.526161193847656, "global_step": 86475, "epoch": 714} {"train_loss": -37.370460510253906, "global_step": 86476, "epoch": 714} {"train_loss": -37.3674201965332, "global_step": 86477, "epoch": 714} {"train_loss": -37.62226486206055, "global_step": 86478, "epoch": 714} {"train_loss": -37.50832748413086, "global_step": 86479, "epoch": 714} {"train_loss": -37.2548942565918, "global_step": 86480, "epoch": 714} {"train_loss": -37.16412353515625, "global_step": 86481, "epoch": 714} {"train_loss": -37.54756546020508, "global_step": 86482, "epoch": 714} {"train_loss": -37.67191696166992, "global_step": 86483, "epoch": 714} {"train_loss": -37.64307403564453, "global_step": 86484, "epoch": 714} {"train_loss": -37.98341369628906, "global_step": 86485, "epoch": 714} {"train_loss": -38.07835388183594, "global_step": 86486, "epoch": 714} {"train_loss": -37.62900161743164, "global_step": 86487, "epoch": 714} {"train_loss": -37.80546951293945, "global_step": 86488, "epoch": 714} {"train_loss": -37.85011291503906, "global_step": 86489, "epoch": 714} {"train_loss": -37.94685363769531, "global_step": 86490, "epoch": 714} {"train_loss": -37.118629455566406, "global_step": 86491, "epoch": 714} {"train_loss": -34.76096725463867, "global_step": 86492, "epoch": 714} {"train_loss": -36.40034484863281, "global_step": 86493, "epoch": 714} {"train_loss": -36.69377517700195, "global_step": 86494, "epoch": 714} {"train_loss": -35.3325080871582, "global_step": 86495, "epoch": 714} {"train_loss": -36.0916633605957, "global_step": 86496, "epoch": 714} {"train_loss": -35.215240478515625, "global_step": 86497, "epoch": 714} {"train_loss": -36.26691436767578, "global_step": 86498, "epoch": 714} {"train_loss": -36.92462921142578, "global_step": 86499, "epoch": 714} {"train_loss": -36.822235107421875, "global_step": 86500, "epoch": 714} {"train_loss": -37.04341506958008, "global_step": 86501, "epoch": 714} {"train_loss": -36.67410659790039, "global_step": 86502, "epoch": 714} {"train_loss": -37.93917465209961, "global_step": 86503, "epoch": 714} {"train_loss": -37.25445556640625, "global_step": 86504, "epoch": 714} {"train_loss": -36.557857513427734, "global_step": 86505, "epoch": 714} {"train_loss": -34.122901916503906, "global_step": 86506, "epoch": 714} {"train_loss": -31.512130737304688, "global_step": 86507, "epoch": 714} {"train_loss": -31.117883682250977, "global_step": 86508, "epoch": 714} {"train_loss": -35.20145797729492, "global_step": 86509, "epoch": 714} {"train_loss": -36.7110481262207, "global_step": 86510, "epoch": 714} {"train_loss": -34.588863372802734, "global_step": 86511, "epoch": 714} {"train_loss": -37.091976165771484, "global_step": 86512, "epoch": 714} {"train_loss": -36.009334564208984, "global_step": 86513, "epoch": 714} {"train_loss": -35.79073258076818, "global_step": 86514, "epoch": 714, "val_loss": 2667925.0} {"train_loss": -36.6016960144043, "global_step": 86515, "epoch": 715} {"train_loss": -36.79934310913086, "global_step": 86516, "epoch": 715} {"train_loss": -37.06330108642578, "global_step": 86517, "epoch": 715} {"train_loss": -37.336360931396484, "global_step": 86518, "epoch": 715} {"train_loss": -37.402462005615234, "global_step": 86519, "epoch": 715} {"train_loss": -37.3857421875, "global_step": 86520, "epoch": 715} {"train_loss": -37.2157096862793, "global_step": 86521, "epoch": 715} {"train_loss": -37.48738479614258, "global_step": 86522, "epoch": 715} {"train_loss": -36.30788803100586, "global_step": 86523, "epoch": 715} {"train_loss": -37.62599563598633, "global_step": 86524, "epoch": 715} {"train_loss": -38.06505584716797, "global_step": 86525, "epoch": 715} {"train_loss": -37.83311080932617, "global_step": 86526, "epoch": 715} {"train_loss": -37.16378402709961, "global_step": 86527, "epoch": 715} {"train_loss": -37.90298080444336, "global_step": 86528, "epoch": 715} {"train_loss": -38.088680267333984, "global_step": 86529, "epoch": 715} {"train_loss": -37.70872116088867, "global_step": 86530, "epoch": 715} {"train_loss": -37.596431732177734, "global_step": 86531, "epoch": 715} {"train_loss": -37.831756591796875, "global_step": 86532, "epoch": 715} {"train_loss": -37.21826171875, "global_step": 86533, "epoch": 715} {"train_loss": -37.84854507446289, "global_step": 86534, "epoch": 715} {"train_loss": -37.91146469116211, "global_step": 86535, "epoch": 715} {"train_loss": -37.31602096557617, "global_step": 86536, "epoch": 715} {"train_loss": -38.297298431396484, "global_step": 86537, "epoch": 715} {"train_loss": -38.326080322265625, "global_step": 86538, "epoch": 715} {"train_loss": -37.69095993041992, "global_step": 86539, "epoch": 715} {"train_loss": -37.675533294677734, "global_step": 86540, "epoch": 715} {"train_loss": -38.44300079345703, "global_step": 86541, "epoch": 715} {"train_loss": -38.133052825927734, "global_step": 86542, "epoch": 715} {"train_loss": -37.39361572265625, "global_step": 86543, "epoch": 715} {"train_loss": -36.877708435058594, "global_step": 86544, "epoch": 715} {"train_loss": -36.68769073486328, "global_step": 86545, "epoch": 715} {"train_loss": -36.32957077026367, "global_step": 86546, "epoch": 715} {"train_loss": -37.014320373535156, "global_step": 86547, "epoch": 715} {"train_loss": -38.2266960144043, "global_step": 86548, "epoch": 715} {"train_loss": -37.02926254272461, "global_step": 86549, "epoch": 715} {"train_loss": -37.74213409423828, "global_step": 86550, "epoch": 715} {"train_loss": -37.58121109008789, "global_step": 86551, "epoch": 715} {"train_loss": -37.50715255737305, "global_step": 86552, "epoch": 715} {"train_loss": -36.800899505615234, "global_step": 86553, "epoch": 715} {"train_loss": -36.1763801574707, "global_step": 86554, "epoch": 715} {"train_loss": -35.93891525268555, "global_step": 86555, "epoch": 715} {"train_loss": -37.55164337158203, "global_step": 86556, "epoch": 715} {"train_loss": -37.76776123046875, "global_step": 86557, "epoch": 715} {"train_loss": -37.054840087890625, "global_step": 86558, "epoch": 715} {"train_loss": -37.38717269897461, "global_step": 86559, "epoch": 715} {"train_loss": -37.55215072631836, "global_step": 86560, "epoch": 715} {"train_loss": -36.750423431396484, "global_step": 86561, "epoch": 715} {"train_loss": -37.24103546142578, "global_step": 86562, "epoch": 715} {"train_loss": -37.17153549194336, "global_step": 86563, "epoch": 715} {"train_loss": -36.9959831237793, "global_step": 86564, "epoch": 715} {"train_loss": -37.74506759643555, "global_step": 86565, "epoch": 715} {"train_loss": -37.51150894165039, "global_step": 86566, "epoch": 715} {"train_loss": -37.55491256713867, "global_step": 86567, "epoch": 715} {"train_loss": -37.626258850097656, "global_step": 86568, "epoch": 715} {"train_loss": -37.895320892333984, "global_step": 86569, "epoch": 715} {"train_loss": -37.71743392944336, "global_step": 86570, "epoch": 715} {"train_loss": -37.608821868896484, "global_step": 86571, "epoch": 715} {"train_loss": -36.7189826965332, "global_step": 86572, "epoch": 715} {"train_loss": -37.41938018798828, "global_step": 86573, "epoch": 715} {"train_loss": -37.974273681640625, "global_step": 86574, "epoch": 715} {"train_loss": -37.80943298339844, "global_step": 86575, "epoch": 715} {"train_loss": -37.333702087402344, "global_step": 86576, "epoch": 715} {"train_loss": -37.446571350097656, "global_step": 86577, "epoch": 715} {"train_loss": -37.0505485534668, "global_step": 86578, "epoch": 715} {"train_loss": -37.40266799926758, "global_step": 86579, "epoch": 715} {"train_loss": -37.8046760559082, "global_step": 86580, "epoch": 715} {"train_loss": -37.2845573425293, "global_step": 86581, "epoch": 715} {"train_loss": -36.41127395629883, "global_step": 86582, "epoch": 715} {"train_loss": -36.99787521362305, "global_step": 86583, "epoch": 715} {"train_loss": -38.01976013183594, "global_step": 86584, "epoch": 715} {"train_loss": -37.77407455444336, "global_step": 86585, "epoch": 715} {"train_loss": -36.622703552246094, "global_step": 86586, "epoch": 715} {"train_loss": -37.787818908691406, "global_step": 86587, "epoch": 715} {"train_loss": -37.591087341308594, "global_step": 86588, "epoch": 715} {"train_loss": -37.49748611450195, "global_step": 86589, "epoch": 715} {"train_loss": -36.12495803833008, "global_step": 86590, "epoch": 715} {"train_loss": -37.66328811645508, "global_step": 86591, "epoch": 715} {"train_loss": -36.630367279052734, "global_step": 86592, "epoch": 715} {"train_loss": -38.44689178466797, "global_step": 86593, "epoch": 715} {"train_loss": -37.69193649291992, "global_step": 86594, "epoch": 715} {"train_loss": -38.02063751220703, "global_step": 86595, "epoch": 715} {"train_loss": -38.298683166503906, "global_step": 86596, "epoch": 715} {"train_loss": -37.396114349365234, "global_step": 86597, "epoch": 715} {"train_loss": -37.9331169128418, "global_step": 86598, "epoch": 715} {"train_loss": -36.84368896484375, "global_step": 86599, "epoch": 715} {"train_loss": -35.8157958984375, "global_step": 86600, "epoch": 715} {"train_loss": -35.47526168823242, "global_step": 86601, "epoch": 715} {"train_loss": -36.88282012939453, "global_step": 86602, "epoch": 715} {"train_loss": -37.20322799682617, "global_step": 86603, "epoch": 715} {"train_loss": -35.18954086303711, "global_step": 86604, "epoch": 715} {"train_loss": -36.07729721069336, "global_step": 86605, "epoch": 715} {"train_loss": -37.06291961669922, "global_step": 86606, "epoch": 715} {"train_loss": -35.712440490722656, "global_step": 86607, "epoch": 715} {"train_loss": -36.725460052490234, "global_step": 86608, "epoch": 715} {"train_loss": -35.204307556152344, "global_step": 86609, "epoch": 715} {"train_loss": -30.652435302734375, "global_step": 86610, "epoch": 715} {"train_loss": -29.474218368530273, "global_step": 86611, "epoch": 715} {"train_loss": -35.25020980834961, "global_step": 86612, "epoch": 715} {"train_loss": -32.42536544799805, "global_step": 86613, "epoch": 715} {"train_loss": -32.182735443115234, "global_step": 86614, "epoch": 715} {"train_loss": -34.900665283203125, "global_step": 86615, "epoch": 715} {"train_loss": -33.65948486328125, "global_step": 86616, "epoch": 715} {"train_loss": -34.17074203491211, "global_step": 86617, "epoch": 715} {"train_loss": -34.37551498413086, "global_step": 86618, "epoch": 715} {"train_loss": -35.625057220458984, "global_step": 86619, "epoch": 715} {"train_loss": -35.1241569519043, "global_step": 86620, "epoch": 715} {"train_loss": -31.853271484375, "global_step": 86621, "epoch": 715} {"train_loss": -34.49685287475586, "global_step": 86622, "epoch": 715} {"train_loss": -35.49911117553711, "global_step": 86623, "epoch": 715} {"train_loss": -32.745460510253906, "global_step": 86624, "epoch": 715} {"train_loss": -31.99190330505371, "global_step": 86625, "epoch": 715} {"train_loss": -33.503944396972656, "global_step": 86626, "epoch": 715} {"train_loss": -33.65391159057617, "global_step": 86627, "epoch": 715} {"train_loss": -35.183448791503906, "global_step": 86628, "epoch": 715} {"train_loss": -35.88467025756836, "global_step": 86629, "epoch": 715} {"train_loss": -35.152278900146484, "global_step": 86630, "epoch": 715} {"train_loss": -36.60591125488281, "global_step": 86631, "epoch": 715} {"train_loss": -35.069393157958984, "global_step": 86632, "epoch": 715} {"train_loss": -35.259151458740234, "global_step": 86633, "epoch": 715} {"train_loss": -35.7203254699707, "global_step": 86634, "epoch": 715} {"train_loss": -36.60362650343209, "global_step": 86635, "epoch": 715, "val_loss": 3093216.0} {"train_loss": -34.529945373535156, "global_step": 86636, "epoch": 716} {"train_loss": -35.24538803100586, "global_step": 86637, "epoch": 716} {"train_loss": -34.12592697143555, "global_step": 86638, "epoch": 716} {"train_loss": -35.40863037109375, "global_step": 86639, "epoch": 716} {"train_loss": -35.66146469116211, "global_step": 86640, "epoch": 716} {"train_loss": -35.62160873413086, "global_step": 86641, "epoch": 716} {"train_loss": -35.5412483215332, "global_step": 86642, "epoch": 716} {"train_loss": -36.016849517822266, "global_step": 86643, "epoch": 716} {"train_loss": -36.708736419677734, "global_step": 86644, "epoch": 716} {"train_loss": -36.48613357543945, "global_step": 86645, "epoch": 716} {"train_loss": -36.30229949951172, "global_step": 86646, "epoch": 716} {"train_loss": -36.334320068359375, "global_step": 86647, "epoch": 716} {"train_loss": -36.432979583740234, "global_step": 86648, "epoch": 716} {"train_loss": -35.3065299987793, "global_step": 86649, "epoch": 716} {"train_loss": -33.599586486816406, "global_step": 86650, "epoch": 716} {"train_loss": -34.23330307006836, "global_step": 86651, "epoch": 716} {"train_loss": -36.3741569519043, "global_step": 86652, "epoch": 716} {"train_loss": -36.8009147644043, "global_step": 86653, "epoch": 716} {"train_loss": -36.11763381958008, "global_step": 86654, "epoch": 716} {"train_loss": -36.07108688354492, "global_step": 86655, "epoch": 716} {"train_loss": -36.46925735473633, "global_step": 86656, "epoch": 716} {"train_loss": -37.262508392333984, "global_step": 86657, "epoch": 716} {"train_loss": -36.486732482910156, "global_step": 86658, "epoch": 716} {"train_loss": -36.557674407958984, "global_step": 86659, "epoch": 716} {"train_loss": -36.145931243896484, "global_step": 86660, "epoch": 716} {"train_loss": -36.228302001953125, "global_step": 86661, "epoch": 716} {"train_loss": -36.690914154052734, "global_step": 86662, "epoch": 716} {"train_loss": -37.17365646362305, "global_step": 86663, "epoch": 716} {"train_loss": -36.536781311035156, "global_step": 86664, "epoch": 716} {"train_loss": -36.46205520629883, "global_step": 86665, "epoch": 716} {"train_loss": -37.24232864379883, "global_step": 86666, "epoch": 716} {"train_loss": -37.595558166503906, "global_step": 86667, "epoch": 716} {"train_loss": -37.319271087646484, "global_step": 86668, "epoch": 716} {"train_loss": -37.08285903930664, "global_step": 86669, "epoch": 716} {"train_loss": -37.507259368896484, "global_step": 86670, "epoch": 716} {"train_loss": -37.13532257080078, "global_step": 86671, "epoch": 716} {"train_loss": -37.194149017333984, "global_step": 86672, "epoch": 716} {"train_loss": -37.6871223449707, "global_step": 86673, "epoch": 716} {"train_loss": -37.340492248535156, "global_step": 86674, "epoch": 716} {"train_loss": -37.59892654418945, "global_step": 86675, "epoch": 716} {"train_loss": -37.06844711303711, "global_step": 86676, "epoch": 716} {"train_loss": -37.069644927978516, "global_step": 86677, "epoch": 716} {"train_loss": -37.44717025756836, "global_step": 86678, "epoch": 716} {"train_loss": -37.06966018676758, "global_step": 86679, "epoch": 716} {"train_loss": -37.44289779663086, "global_step": 86680, "epoch": 716} {"train_loss": -37.47433853149414, "global_step": 86681, "epoch": 716} {"train_loss": -37.24198532104492, "global_step": 86682, "epoch": 716} {"train_loss": -38.3589973449707, "global_step": 86683, "epoch": 716} {"train_loss": -37.7737922668457, "global_step": 86684, "epoch": 716} {"train_loss": -37.98171615600586, "global_step": 86685, "epoch": 716} {"train_loss": -37.5239372253418, "global_step": 86686, "epoch": 716} {"train_loss": -37.4741325378418, "global_step": 86687, "epoch": 716} {"train_loss": -37.99473190307617, "global_step": 86688, "epoch": 716} {"train_loss": -38.11796188354492, "global_step": 86689, "epoch": 716} {"train_loss": -37.18345260620117, "global_step": 86690, "epoch": 716} {"train_loss": -33.79878234863281, "global_step": 86691, "epoch": 716} {"train_loss": -26.57110023498535, "global_step": 86692, "epoch": 716} {"train_loss": -9.085297584533691, "global_step": 86693, "epoch": 716} {"train_loss": 1.509227991104126, "global_step": 86694, "epoch": 716} {"train_loss": -28.643125534057617, "global_step": 86695, "epoch": 716} {"train_loss": -25.048044204711914, "global_step": 86696, "epoch": 716} {"train_loss": -29.517913818359375, "global_step": 86697, "epoch": 716} {"train_loss": -26.597814559936523, "global_step": 86698, "epoch": 716} {"train_loss": -35.781463623046875, "global_step": 86699, "epoch": 716} {"train_loss": -25.913053512573242, "global_step": 86700, "epoch": 716} {"train_loss": -35.686279296875, "global_step": 86701, "epoch": 716} {"train_loss": -31.897937774658203, "global_step": 86702, "epoch": 716} {"train_loss": -30.235095977783203, "global_step": 86703, "epoch": 716} {"train_loss": -37.161407470703125, "global_step": 86704, "epoch": 716} {"train_loss": -33.310157775878906, "global_step": 86705, "epoch": 716} {"train_loss": -32.90386199951172, "global_step": 86706, "epoch": 716} {"train_loss": -34.35126876831055, "global_step": 86707, "epoch": 716} {"train_loss": -34.59356689453125, "global_step": 86708, "epoch": 716} {"train_loss": -34.28520965576172, "global_step": 86709, "epoch": 716} {"train_loss": -31.891742706298828, "global_step": 86710, "epoch": 716} {"train_loss": -32.550758361816406, "global_step": 86711, "epoch": 716} {"train_loss": -35.05097579956055, "global_step": 86712, "epoch": 716} {"train_loss": -35.27573776245117, "global_step": 86713, "epoch": 716} {"train_loss": -33.69902801513672, "global_step": 86714, "epoch": 716} {"train_loss": -35.247798919677734, "global_step": 86715, "epoch": 716} {"train_loss": -34.78803634643555, "global_step": 86716, "epoch": 716} {"train_loss": -35.097869873046875, "global_step": 86717, "epoch": 716} {"train_loss": -35.909690856933594, "global_step": 86718, "epoch": 716} {"train_loss": -34.93490982055664, "global_step": 86719, "epoch": 716} {"train_loss": -35.22925567626953, "global_step": 86720, "epoch": 716} {"train_loss": -36.59006118774414, "global_step": 86721, "epoch": 716} {"train_loss": -33.65468978881836, "global_step": 86722, "epoch": 716} {"train_loss": -36.5434684753418, "global_step": 86723, "epoch": 716} {"train_loss": -35.32698440551758, "global_step": 86724, "epoch": 716} {"train_loss": -35.75966262817383, "global_step": 86725, "epoch": 716} {"train_loss": -36.53842544555664, "global_step": 86726, "epoch": 716} {"train_loss": -36.93534469604492, "global_step": 86727, "epoch": 716} {"train_loss": -35.964820861816406, "global_step": 86728, "epoch": 716} {"train_loss": -36.313026428222656, "global_step": 86729, "epoch": 716} {"train_loss": -36.137332916259766, "global_step": 86730, "epoch": 716} {"train_loss": -36.643157958984375, "global_step": 86731, "epoch": 716} {"train_loss": -36.943729400634766, "global_step": 86732, "epoch": 716} {"train_loss": -36.77713394165039, "global_step": 86733, "epoch": 716} {"train_loss": -36.55915451049805, "global_step": 86734, "epoch": 716} {"train_loss": -36.8665885925293, "global_step": 86735, "epoch": 716} {"train_loss": -36.68647384643555, "global_step": 86736, "epoch": 716} {"train_loss": -37.29047393798828, "global_step": 86737, "epoch": 716} {"train_loss": -37.03078079223633, "global_step": 86738, "epoch": 716} {"train_loss": -36.86228942871094, "global_step": 86739, "epoch": 716} {"train_loss": -37.43330001831055, "global_step": 86740, "epoch": 716} {"train_loss": -37.322574615478516, "global_step": 86741, "epoch": 716} {"train_loss": -37.74061965942383, "global_step": 86742, "epoch": 716} {"train_loss": -37.44765090942383, "global_step": 86743, "epoch": 716} {"train_loss": -37.715694427490234, "global_step": 86744, "epoch": 716} {"train_loss": -34.822059631347656, "global_step": 86745, "epoch": 716} {"train_loss": -37.45146942138672, "global_step": 86746, "epoch": 716} {"train_loss": -37.57416915893555, "global_step": 86747, "epoch": 716} {"train_loss": -36.94082260131836, "global_step": 86748, "epoch": 716} {"train_loss": -34.88044738769531, "global_step": 86749, "epoch": 716} {"train_loss": -35.95972442626953, "global_step": 86750, "epoch": 716} {"train_loss": -37.35679244995117, "global_step": 86751, "epoch": 716} {"train_loss": -37.5311393737793, "global_step": 86752, "epoch": 716} {"train_loss": -37.744781494140625, "global_step": 86753, "epoch": 716} {"train_loss": -36.778900146484375, "global_step": 86754, "epoch": 716} {"train_loss": -37.172183990478516, "global_step": 86755, "epoch": 716} {"train_loss": -35.210953442518374, "global_step": 86756, "epoch": 716, "val_loss": 2601439.75} {"train_loss": -37.835845947265625, "global_step": 86757, "epoch": 717} {"train_loss": -36.15155029296875, "global_step": 86758, "epoch": 717} {"train_loss": -37.2232780456543, "global_step": 86759, "epoch": 717} {"train_loss": -37.12543869018555, "global_step": 86760, "epoch": 717} {"train_loss": -37.153499603271484, "global_step": 86761, "epoch": 717} {"train_loss": -37.84391403198242, "global_step": 86762, "epoch": 717} {"train_loss": -37.12936019897461, "global_step": 86763, "epoch": 717} {"train_loss": -37.797237396240234, "global_step": 86764, "epoch": 717} {"train_loss": -37.40064239501953, "global_step": 86765, "epoch": 717} {"train_loss": -38.13397216796875, "global_step": 86766, "epoch": 717} {"train_loss": -37.77495193481445, "global_step": 86767, "epoch": 717} {"train_loss": -37.764686584472656, "global_step": 86768, "epoch": 717} {"train_loss": -37.053924560546875, "global_step": 86769, "epoch": 717} {"train_loss": -38.05312728881836, "global_step": 86770, "epoch": 717} {"train_loss": -37.915321350097656, "global_step": 86771, "epoch": 717} {"train_loss": -38.06100082397461, "global_step": 86772, "epoch": 717} {"train_loss": -37.30585479736328, "global_step": 86773, "epoch": 717} {"train_loss": -37.958404541015625, "global_step": 86774, "epoch": 717} {"train_loss": -36.71946334838867, "global_step": 86775, "epoch": 717} {"train_loss": -37.188026428222656, "global_step": 86776, "epoch": 717} {"train_loss": -37.17013168334961, "global_step": 86777, "epoch": 717} {"train_loss": -37.477394104003906, "global_step": 86778, "epoch": 717} {"train_loss": -35.120967864990234, "global_step": 86779, "epoch": 717} {"train_loss": -35.51355743408203, "global_step": 86780, "epoch": 717} {"train_loss": -34.787025451660156, "global_step": 86781, "epoch": 717} {"train_loss": -31.143096923828125, "global_step": 86782, "epoch": 717} {"train_loss": -32.97663497924805, "global_step": 86783, "epoch": 717} {"train_loss": -37.44424057006836, "global_step": 86784, "epoch": 717} {"train_loss": -36.4784049987793, "global_step": 86785, "epoch": 717} {"train_loss": -33.863040924072266, "global_step": 86786, "epoch": 717} {"train_loss": -37.30971145629883, "global_step": 86787, "epoch": 717} {"train_loss": -35.2389030456543, "global_step": 86788, "epoch": 717} {"train_loss": -34.127811431884766, "global_step": 86789, "epoch": 717} {"train_loss": -34.47494888305664, "global_step": 86790, "epoch": 717} {"train_loss": -31.816450119018555, "global_step": 86791, "epoch": 717} {"train_loss": -36.376930236816406, "global_step": 86792, "epoch": 717} {"train_loss": -34.883758544921875, "global_step": 86793, "epoch": 717} {"train_loss": -36.813880920410156, "global_step": 86794, "epoch": 717} {"train_loss": -34.49666976928711, "global_step": 86795, "epoch": 717} {"train_loss": -35.089935302734375, "global_step": 86796, "epoch": 717} {"train_loss": -34.0642204284668, "global_step": 86797, "epoch": 717} {"train_loss": -35.117313385009766, "global_step": 86798, "epoch": 717} {"train_loss": -32.80782699584961, "global_step": 86799, "epoch": 717} {"train_loss": -33.49340057373047, "global_step": 86800, "epoch": 717} {"train_loss": -36.045494079589844, "global_step": 86801, "epoch": 717} {"train_loss": -34.996559143066406, "global_step": 86802, "epoch": 717} {"train_loss": -33.80120849609375, "global_step": 86803, "epoch": 717} {"train_loss": -33.561458587646484, "global_step": 86804, "epoch": 717} {"train_loss": -35.20920944213867, "global_step": 86805, "epoch": 717} {"train_loss": -34.78470230102539, "global_step": 86806, "epoch": 717} {"train_loss": -35.760284423828125, "global_step": 86807, "epoch": 717} {"train_loss": -35.41840362548828, "global_step": 86808, "epoch": 717} {"train_loss": -36.447898864746094, "global_step": 86809, "epoch": 717} {"train_loss": -35.1103401184082, "global_step": 86810, "epoch": 717} {"train_loss": -36.45001983642578, "global_step": 86811, "epoch": 717} {"train_loss": -33.2833137512207, "global_step": 86812, "epoch": 717} {"train_loss": -34.809818267822266, "global_step": 86813, "epoch": 717} {"train_loss": -35.67021560668945, "global_step": 86814, "epoch": 717} {"train_loss": -34.61945724487305, "global_step": 86815, "epoch": 717} {"train_loss": -34.5350456237793, "global_step": 86816, "epoch": 717} {"train_loss": -35.99201965332031, "global_step": 86817, "epoch": 717} {"train_loss": -34.91390609741211, "global_step": 86818, "epoch": 717} {"train_loss": -35.44757843017578, "global_step": 86819, "epoch": 717} {"train_loss": -33.10185623168945, "global_step": 86820, "epoch": 717} {"train_loss": -34.25080490112305, "global_step": 86821, "epoch": 717} {"train_loss": -35.03146743774414, "global_step": 86822, "epoch": 717} {"train_loss": -35.7880859375, "global_step": 86823, "epoch": 717} {"train_loss": -33.91199493408203, "global_step": 86824, "epoch": 717} {"train_loss": -35.29237747192383, "global_step": 86825, "epoch": 717} {"train_loss": -36.02154541015625, "global_step": 86826, "epoch": 717} {"train_loss": -35.404747009277344, "global_step": 86827, "epoch": 717} {"train_loss": -35.81808090209961, "global_step": 86828, "epoch": 717} {"train_loss": -34.37912368774414, "global_step": 86829, "epoch": 717} {"train_loss": -35.72963333129883, "global_step": 86830, "epoch": 717} {"train_loss": -35.124568939208984, "global_step": 86831, "epoch": 717} {"train_loss": -34.38861083984375, "global_step": 86832, "epoch": 717} {"train_loss": -34.84806823730469, "global_step": 86833, "epoch": 717} {"train_loss": -35.533531188964844, "global_step": 86834, "epoch": 717} {"train_loss": -35.96356964111328, "global_step": 86835, "epoch": 717} {"train_loss": -35.58155059814453, "global_step": 86836, "epoch": 717} {"train_loss": -36.02295684814453, "global_step": 86837, "epoch": 717} {"train_loss": -35.11959457397461, "global_step": 86838, "epoch": 717} {"train_loss": -35.273860931396484, "global_step": 86839, "epoch": 717} {"train_loss": -36.015071868896484, "global_step": 86840, "epoch": 717} {"train_loss": -36.41781234741211, "global_step": 86841, "epoch": 717} {"train_loss": -36.33620071411133, "global_step": 86842, "epoch": 717} {"train_loss": -36.19049072265625, "global_step": 86843, "epoch": 717} {"train_loss": -35.394474029541016, "global_step": 86844, "epoch": 717} {"train_loss": -35.63433837890625, "global_step": 86845, "epoch": 717} {"train_loss": -36.59817886352539, "global_step": 86846, "epoch": 717} {"train_loss": -35.53900909423828, "global_step": 86847, "epoch": 717} {"train_loss": -36.55963134765625, "global_step": 86848, "epoch": 717} {"train_loss": -36.62305450439453, "global_step": 86849, "epoch": 717} {"train_loss": -36.54716110229492, "global_step": 86850, "epoch": 717} {"train_loss": -36.68490982055664, "global_step": 86851, "epoch": 717} {"train_loss": -35.884796142578125, "global_step": 86852, "epoch": 717} {"train_loss": -36.75969314575195, "global_step": 86853, "epoch": 717} {"train_loss": -37.052669525146484, "global_step": 86854, "epoch": 717} {"train_loss": -36.52971649169922, "global_step": 86855, "epoch": 717} {"train_loss": -36.70958709716797, "global_step": 86856, "epoch": 717} {"train_loss": -37.00690460205078, "global_step": 86857, "epoch": 717} {"train_loss": -36.95376968383789, "global_step": 86858, "epoch": 717} {"train_loss": -36.56718063354492, "global_step": 86859, "epoch": 717} {"train_loss": -36.5699577331543, "global_step": 86860, "epoch": 717} {"train_loss": -36.74391555786133, "global_step": 86861, "epoch": 717} {"train_loss": -36.657527923583984, "global_step": 86862, "epoch": 717} {"train_loss": -36.8516845703125, "global_step": 86863, "epoch": 717} {"train_loss": -36.94681930541992, "global_step": 86864, "epoch": 717} {"train_loss": -37.325679779052734, "global_step": 86865, "epoch": 717} {"train_loss": -36.89198303222656, "global_step": 86866, "epoch": 717} {"train_loss": -37.11990737915039, "global_step": 86867, "epoch": 717} {"train_loss": -36.83927536010742, "global_step": 86868, "epoch": 717} {"train_loss": -37.60221481323242, "global_step": 86869, "epoch": 717} {"train_loss": -37.24910354614258, "global_step": 86870, "epoch": 717} {"train_loss": -37.443153381347656, "global_step": 86871, "epoch": 717} {"train_loss": -36.647090911865234, "global_step": 86872, "epoch": 717} {"train_loss": -36.61933517456055, "global_step": 86873, "epoch": 717} {"train_loss": -35.86463165283203, "global_step": 86874, "epoch": 717} {"train_loss": -35.4979362487793, "global_step": 86875, "epoch": 717} {"train_loss": -35.08844757080078, "global_step": 86876, "epoch": 717} {"train_loss": -35.90191664577516, "global_step": 86877, "epoch": 717, "val_loss": 2599174.75} {"train_loss": -36.137229919433594, "global_step": 86878, "epoch": 718} {"train_loss": -36.7206916809082, "global_step": 86879, "epoch": 718} {"train_loss": -37.437374114990234, "global_step": 86880, "epoch": 718} {"train_loss": -36.52434539794922, "global_step": 86881, "epoch": 718} {"train_loss": -36.03245162963867, "global_step": 86882, "epoch": 718} {"train_loss": -34.496803283691406, "global_step": 86883, "epoch": 718} {"train_loss": -35.8195915222168, "global_step": 86884, "epoch": 718} {"train_loss": -36.770687103271484, "global_step": 86885, "epoch": 718} {"train_loss": -36.24964141845703, "global_step": 86886, "epoch": 718} {"train_loss": -36.421875, "global_step": 86887, "epoch": 718} {"train_loss": -37.920955657958984, "global_step": 86888, "epoch": 718} {"train_loss": -36.34934616088867, "global_step": 86889, "epoch": 718} {"train_loss": -35.55111312866211, "global_step": 86890, "epoch": 718} {"train_loss": -37.04984664916992, "global_step": 86891, "epoch": 718} {"train_loss": -36.16773223876953, "global_step": 86892, "epoch": 718} {"train_loss": -36.53745651245117, "global_step": 86893, "epoch": 718} {"train_loss": -36.86655044555664, "global_step": 86894, "epoch": 718} {"train_loss": -35.1763916015625, "global_step": 86895, "epoch": 718} {"train_loss": -35.94342041015625, "global_step": 86896, "epoch": 718} {"train_loss": -36.35819625854492, "global_step": 86897, "epoch": 718} {"train_loss": -34.3802490234375, "global_step": 86898, "epoch": 718} {"train_loss": -37.20682907104492, "global_step": 86899, "epoch": 718} {"train_loss": -34.95344924926758, "global_step": 86900, "epoch": 718} {"train_loss": -35.88335037231445, "global_step": 86901, "epoch": 718} {"train_loss": -34.41340255737305, "global_step": 86902, "epoch": 718} {"train_loss": -34.9464111328125, "global_step": 86903, "epoch": 718} {"train_loss": -36.670772552490234, "global_step": 86904, "epoch": 718} {"train_loss": -34.889278411865234, "global_step": 86905, "epoch": 718} {"train_loss": -35.44328308105469, "global_step": 86906, "epoch": 718} {"train_loss": -36.29193115234375, "global_step": 86907, "epoch": 718} {"train_loss": -36.610633850097656, "global_step": 86908, "epoch": 718} {"train_loss": -35.678218841552734, "global_step": 86909, "epoch": 718} {"train_loss": -34.99838638305664, "global_step": 86910, "epoch": 718} {"train_loss": -36.392635345458984, "global_step": 86911, "epoch": 718} {"train_loss": -35.29311752319336, "global_step": 86912, "epoch": 718} {"train_loss": -36.63569641113281, "global_step": 86913, "epoch": 718} {"train_loss": -34.77759552001953, "global_step": 86914, "epoch": 718} {"train_loss": -37.40793991088867, "global_step": 86915, "epoch": 718} {"train_loss": -35.397003173828125, "global_step": 86916, "epoch": 718} {"train_loss": -37.38508605957031, "global_step": 86917, "epoch": 718} {"train_loss": -35.85525131225586, "global_step": 86918, "epoch": 718} {"train_loss": -36.06887435913086, "global_step": 86919, "epoch": 718} {"train_loss": -36.973968505859375, "global_step": 86920, "epoch": 718} {"train_loss": -36.21535873413086, "global_step": 86921, "epoch": 718} {"train_loss": -36.807533264160156, "global_step": 86922, "epoch": 718} {"train_loss": -35.86014175415039, "global_step": 86923, "epoch": 718} {"train_loss": -37.14122009277344, "global_step": 86924, "epoch": 718} {"train_loss": -35.86757278442383, "global_step": 86925, "epoch": 718} {"train_loss": -36.01449203491211, "global_step": 86926, "epoch": 718} {"train_loss": -37.658424377441406, "global_step": 86927, "epoch": 718} {"train_loss": -36.15336227416992, "global_step": 86928, "epoch": 718} {"train_loss": -37.24062728881836, "global_step": 86929, "epoch": 718} {"train_loss": -37.00082015991211, "global_step": 86930, "epoch": 718} {"train_loss": -36.837547302246094, "global_step": 86931, "epoch": 718} {"train_loss": -36.98411178588867, "global_step": 86932, "epoch": 718} {"train_loss": -36.94007110595703, "global_step": 86933, "epoch": 718} {"train_loss": -37.21682357788086, "global_step": 86934, "epoch": 718} {"train_loss": -37.587650299072266, "global_step": 86935, "epoch": 718} {"train_loss": -37.29524612426758, "global_step": 86936, "epoch": 718} {"train_loss": -37.661041259765625, "global_step": 86937, "epoch": 718} {"train_loss": -37.970924377441406, "global_step": 86938, "epoch": 718} {"train_loss": -36.93929672241211, "global_step": 86939, "epoch": 718} {"train_loss": -37.658721923828125, "global_step": 86940, "epoch": 718} {"train_loss": -37.782142639160156, "global_step": 86941, "epoch": 718} {"train_loss": -38.05095291137695, "global_step": 86942, "epoch": 718} {"train_loss": -37.66253662109375, "global_step": 86943, "epoch": 718} {"train_loss": -37.58760070800781, "global_step": 86944, "epoch": 718} {"train_loss": -38.01296615600586, "global_step": 86945, "epoch": 718} {"train_loss": -37.328365325927734, "global_step": 86946, "epoch": 718} {"train_loss": -37.59417724609375, "global_step": 86947, "epoch": 718} {"train_loss": -38.162349700927734, "global_step": 86948, "epoch": 718} {"train_loss": -37.57155990600586, "global_step": 86949, "epoch": 718} {"train_loss": -37.482147216796875, "global_step": 86950, "epoch": 718} {"train_loss": -37.51876449584961, "global_step": 86951, "epoch": 718} {"train_loss": -37.20750427246094, "global_step": 86952, "epoch": 718} {"train_loss": -37.2748908996582, "global_step": 86953, "epoch": 718} {"train_loss": -37.39507293701172, "global_step": 86954, "epoch": 718} {"train_loss": -37.784645080566406, "global_step": 86955, "epoch": 718} {"train_loss": -37.416805267333984, "global_step": 86956, "epoch": 718} {"train_loss": -37.84648513793945, "global_step": 86957, "epoch": 718} {"train_loss": -37.68404769897461, "global_step": 86958, "epoch": 718} {"train_loss": -37.83478927612305, "global_step": 86959, "epoch": 718} {"train_loss": -37.766143798828125, "global_step": 86960, "epoch": 718} {"train_loss": -35.62415313720703, "global_step": 86961, "epoch": 718} {"train_loss": -38.16521072387695, "global_step": 86962, "epoch": 718} {"train_loss": -37.89298629760742, "global_step": 86963, "epoch": 718} {"train_loss": -36.7943229675293, "global_step": 86964, "epoch": 718} {"train_loss": -37.634517669677734, "global_step": 86965, "epoch": 718} {"train_loss": -37.41378402709961, "global_step": 86966, "epoch": 718} {"train_loss": -37.59299850463867, "global_step": 86967, "epoch": 718} {"train_loss": -37.21935272216797, "global_step": 86968, "epoch": 718} {"train_loss": -36.197410583496094, "global_step": 86969, "epoch": 718} {"train_loss": -37.49134063720703, "global_step": 86970, "epoch": 718} {"train_loss": -37.86695098876953, "global_step": 86971, "epoch": 718} {"train_loss": -38.00120162963867, "global_step": 86972, "epoch": 718} {"train_loss": -36.9716796875, "global_step": 86973, "epoch": 718} {"train_loss": -37.58732223510742, "global_step": 86974, "epoch": 718} {"train_loss": -37.64488983154297, "global_step": 86975, "epoch": 718} {"train_loss": -37.67098617553711, "global_step": 86976, "epoch": 718} {"train_loss": -37.86134719848633, "global_step": 86977, "epoch": 718} {"train_loss": -37.99540328979492, "global_step": 86978, "epoch": 718} {"train_loss": -38.333675384521484, "global_step": 86979, "epoch": 718} {"train_loss": -37.802223205566406, "global_step": 86980, "epoch": 718} {"train_loss": -37.30422592163086, "global_step": 86981, "epoch": 718} {"train_loss": -37.438655853271484, "global_step": 86982, "epoch": 718} {"train_loss": -37.775779724121094, "global_step": 86983, "epoch": 718} {"train_loss": -37.894161224365234, "global_step": 86984, "epoch": 718} {"train_loss": -38.237117767333984, "global_step": 86985, "epoch": 718} {"train_loss": -37.91437911987305, "global_step": 86986, "epoch": 718} {"train_loss": -37.795814514160156, "global_step": 86987, "epoch": 718} {"train_loss": -38.37015151977539, "global_step": 86988, "epoch": 718} {"train_loss": -38.50175094604492, "global_step": 86989, "epoch": 718} {"train_loss": -37.436744689941406, "global_step": 86990, "epoch": 718} {"train_loss": -38.59824752807617, "global_step": 86991, "epoch": 718} {"train_loss": -38.16817092895508, "global_step": 86992, "epoch": 718} {"train_loss": -37.76991271972656, "global_step": 86993, "epoch": 718} {"train_loss": -37.326751708984375, "global_step": 86994, "epoch": 718} {"train_loss": -36.54960250854492, "global_step": 86995, "epoch": 718} {"train_loss": -36.16415786743164, "global_step": 86996, "epoch": 718} {"train_loss": -33.53416061401367, "global_step": 86997, "epoch": 718} {"train_loss": -36.89690991866687, "global_step": 86998, "epoch": 718, "val_loss": 2719962.0} {"train_loss": -36.40745162963867, "global_step": 86999, "epoch": 719} {"train_loss": -36.409217834472656, "global_step": 87000, "epoch": 719} {"train_loss": -37.52410888671875, "global_step": 87001, "epoch": 719} {"train_loss": -36.699554443359375, "global_step": 87002, "epoch": 719} {"train_loss": -36.81024932861328, "global_step": 87003, "epoch": 719} {"train_loss": -37.67269515991211, "global_step": 87004, "epoch": 719} {"train_loss": -37.135982513427734, "global_step": 87005, "epoch": 719} {"train_loss": -36.96514129638672, "global_step": 87006, "epoch": 719} {"train_loss": -37.76227951049805, "global_step": 87007, "epoch": 719} {"train_loss": -37.49569320678711, "global_step": 87008, "epoch": 719} {"train_loss": -37.93408203125, "global_step": 87009, "epoch": 719} {"train_loss": -37.569061279296875, "global_step": 87010, "epoch": 719} {"train_loss": -37.956764221191406, "global_step": 87011, "epoch": 719} {"train_loss": -36.785377502441406, "global_step": 87012, "epoch": 719} {"train_loss": -37.498695373535156, "global_step": 87013, "epoch": 719} {"train_loss": -37.353065490722656, "global_step": 87014, "epoch": 719} {"train_loss": -37.84267807006836, "global_step": 87015, "epoch": 719} {"train_loss": -37.2092399597168, "global_step": 87016, "epoch": 719} {"train_loss": -36.63951873779297, "global_step": 87017, "epoch": 719} {"train_loss": -37.13893127441406, "global_step": 87018, "epoch": 719} {"train_loss": -37.98310470581055, "global_step": 87019, "epoch": 719} {"train_loss": -37.52632522583008, "global_step": 87020, "epoch": 719} {"train_loss": -37.532875061035156, "global_step": 87021, "epoch": 719} {"train_loss": -37.26189041137695, "global_step": 87022, "epoch": 719} {"train_loss": -36.434600830078125, "global_step": 87023, "epoch": 719} {"train_loss": -35.87502670288086, "global_step": 87024, "epoch": 719} {"train_loss": -37.03219223022461, "global_step": 87025, "epoch": 719} {"train_loss": -38.05217361450195, "global_step": 87026, "epoch": 719} {"train_loss": -37.17145919799805, "global_step": 87027, "epoch": 719} {"train_loss": -36.92804718017578, "global_step": 87028, "epoch": 719} {"train_loss": -38.50333786010742, "global_step": 87029, "epoch": 719} {"train_loss": -38.52065658569336, "global_step": 87030, "epoch": 719} {"train_loss": -37.911983489990234, "global_step": 87031, "epoch": 719} {"train_loss": -37.82807159423828, "global_step": 87032, "epoch": 719} {"train_loss": -37.7014274597168, "global_step": 87033, "epoch": 719} {"train_loss": -37.7619514465332, "global_step": 87034, "epoch": 719} {"train_loss": -38.52982711791992, "global_step": 87035, "epoch": 719} {"train_loss": -37.352230072021484, "global_step": 87036, "epoch": 719} {"train_loss": -37.55595779418945, "global_step": 87037, "epoch": 719} {"train_loss": -37.38259506225586, "global_step": 87038, "epoch": 719} {"train_loss": -37.457244873046875, "global_step": 87039, "epoch": 719} {"train_loss": -37.42201614379883, "global_step": 87040, "epoch": 719} {"train_loss": -37.8742790222168, "global_step": 87041, "epoch": 719} {"train_loss": -36.61909103393555, "global_step": 87042, "epoch": 719} {"train_loss": -36.93539047241211, "global_step": 87043, "epoch": 719} {"train_loss": -37.14032745361328, "global_step": 87044, "epoch": 719} {"train_loss": -37.20127868652344, "global_step": 87045, "epoch": 719} {"train_loss": -37.80870819091797, "global_step": 87046, "epoch": 719} {"train_loss": -36.03883743286133, "global_step": 87047, "epoch": 719} {"train_loss": -37.07316207885742, "global_step": 87048, "epoch": 719} {"train_loss": -36.26792526245117, "global_step": 87049, "epoch": 719} {"train_loss": -37.65388870239258, "global_step": 87050, "epoch": 719} {"train_loss": -37.753658294677734, "global_step": 87051, "epoch": 719} {"train_loss": -36.70952606201172, "global_step": 87052, "epoch": 719} {"train_loss": -37.8820915222168, "global_step": 87053, "epoch": 719} {"train_loss": -37.72694396972656, "global_step": 87054, "epoch": 719} {"train_loss": -37.89738845825195, "global_step": 87055, "epoch": 719} {"train_loss": -37.01216506958008, "global_step": 87056, "epoch": 719} {"train_loss": -37.78497314453125, "global_step": 87057, "epoch": 719} {"train_loss": -37.530704498291016, "global_step": 87058, "epoch": 719} {"train_loss": -37.951900482177734, "global_step": 87059, "epoch": 719} {"train_loss": -38.11257553100586, "global_step": 87060, "epoch": 719} {"train_loss": -37.290157318115234, "global_step": 87061, "epoch": 719} {"train_loss": -38.25933074951172, "global_step": 87062, "epoch": 719} {"train_loss": -38.21128463745117, "global_step": 87063, "epoch": 719} {"train_loss": -36.78314208984375, "global_step": 87064, "epoch": 719} {"train_loss": -37.42521286010742, "global_step": 87065, "epoch": 719} {"train_loss": -37.9198112487793, "global_step": 87066, "epoch": 719} {"train_loss": -37.96638107299805, "global_step": 87067, "epoch": 719} {"train_loss": -38.587928771972656, "global_step": 87068, "epoch": 719} {"train_loss": -37.63999557495117, "global_step": 87069, "epoch": 719} {"train_loss": -36.786399841308594, "global_step": 87070, "epoch": 719} {"train_loss": -35.79290771484375, "global_step": 87071, "epoch": 719} {"train_loss": -36.649105072021484, "global_step": 87072, "epoch": 719} {"train_loss": -37.705196380615234, "global_step": 87073, "epoch": 719} {"train_loss": -37.444671630859375, "global_step": 87074, "epoch": 719} {"train_loss": -37.36861038208008, "global_step": 87075, "epoch": 719} {"train_loss": -36.68077850341797, "global_step": 87076, "epoch": 719} {"train_loss": -36.79478073120117, "global_step": 87077, "epoch": 719} {"train_loss": -37.10477828979492, "global_step": 87078, "epoch": 719} {"train_loss": -35.048248291015625, "global_step": 87079, "epoch": 719} {"train_loss": -36.69816970825195, "global_step": 87080, "epoch": 719} {"train_loss": -37.23780822753906, "global_step": 87081, "epoch": 719} {"train_loss": -36.788291931152344, "global_step": 87082, "epoch": 719} {"train_loss": -37.33742904663086, "global_step": 87083, "epoch": 719} {"train_loss": -37.65936279296875, "global_step": 87084, "epoch": 719} {"train_loss": -37.53693389892578, "global_step": 87085, "epoch": 719} {"train_loss": -37.04298782348633, "global_step": 87086, "epoch": 719} {"train_loss": -38.10765838623047, "global_step": 87087, "epoch": 719} {"train_loss": -37.23736572265625, "global_step": 87088, "epoch": 719} {"train_loss": -38.2353630065918, "global_step": 87089, "epoch": 719} {"train_loss": -38.26617431640625, "global_step": 87090, "epoch": 719} {"train_loss": -38.25016403198242, "global_step": 87091, "epoch": 719} {"train_loss": -38.868568420410156, "global_step": 87092, "epoch": 719} {"train_loss": -38.37791061401367, "global_step": 87093, "epoch": 719} {"train_loss": -38.34492874145508, "global_step": 87094, "epoch": 719} {"train_loss": -37.64144515991211, "global_step": 87095, "epoch": 719} {"train_loss": -38.49910354614258, "global_step": 87096, "epoch": 719} {"train_loss": -37.60300064086914, "global_step": 87097, "epoch": 719} {"train_loss": -36.33097457885742, "global_step": 87098, "epoch": 719} {"train_loss": -36.04600143432617, "global_step": 87099, "epoch": 719} {"train_loss": -36.94441223144531, "global_step": 87100, "epoch": 719} {"train_loss": -37.5040283203125, "global_step": 87101, "epoch": 719} {"train_loss": -35.2312126159668, "global_step": 87102, "epoch": 719} {"train_loss": -36.5258903503418, "global_step": 87103, "epoch": 719} {"train_loss": -36.07085037231445, "global_step": 87104, "epoch": 719} {"train_loss": -36.515167236328125, "global_step": 87105, "epoch": 719} {"train_loss": -37.516212463378906, "global_step": 87106, "epoch": 719} {"train_loss": -36.81385803222656, "global_step": 87107, "epoch": 719} {"train_loss": -37.70058059692383, "global_step": 87108, "epoch": 719} {"train_loss": -37.32369613647461, "global_step": 87109, "epoch": 719} {"train_loss": -36.35120391845703, "global_step": 87110, "epoch": 719} {"train_loss": -35.34930419921875, "global_step": 87111, "epoch": 719} {"train_loss": -36.298866271972656, "global_step": 87112, "epoch": 719} {"train_loss": -37.24072265625, "global_step": 87113, "epoch": 719} {"train_loss": -35.75796127319336, "global_step": 87114, "epoch": 719} {"train_loss": -37.4716911315918, "global_step": 87115, "epoch": 719} {"train_loss": -37.168373107910156, "global_step": 87116, "epoch": 719} {"train_loss": -36.227638244628906, "global_step": 87117, "epoch": 719} {"train_loss": -37.24752426147461, "global_step": 87118, "epoch": 719} {"train_loss": -37.283875142247226, "global_step": 87119, "epoch": 719, "val_loss": 2801858.0} {"train_loss": -36.01478958129883, "global_step": 87120, "epoch": 720} {"train_loss": -34.004730224609375, "global_step": 87121, "epoch": 720} {"train_loss": -35.80732345581055, "global_step": 87122, "epoch": 720} {"train_loss": -34.38682174682617, "global_step": 87123, "epoch": 720} {"train_loss": -36.767738342285156, "global_step": 87124, "epoch": 720} {"train_loss": -36.66169357299805, "global_step": 87125, "epoch": 720} {"train_loss": -35.70294189453125, "global_step": 87126, "epoch": 720} {"train_loss": -33.70912551879883, "global_step": 87127, "epoch": 720} {"train_loss": -33.83534622192383, "global_step": 87128, "epoch": 720} {"train_loss": -32.27120590209961, "global_step": 87129, "epoch": 720} {"train_loss": -34.677059173583984, "global_step": 87130, "epoch": 720} {"train_loss": -35.7530632019043, "global_step": 87131, "epoch": 720} {"train_loss": -34.9580192565918, "global_step": 87132, "epoch": 720} {"train_loss": -34.8951301574707, "global_step": 87133, "epoch": 720} {"train_loss": -33.50021743774414, "global_step": 87134, "epoch": 720} {"train_loss": -34.85807800292969, "global_step": 87135, "epoch": 720} {"train_loss": -34.539058685302734, "global_step": 87136, "epoch": 720} {"train_loss": -36.15755081176758, "global_step": 87137, "epoch": 720} {"train_loss": -34.61144256591797, "global_step": 87138, "epoch": 720} {"train_loss": -36.478858947753906, "global_step": 87139, "epoch": 720} {"train_loss": -33.73630905151367, "global_step": 87140, "epoch": 720} {"train_loss": -35.92496871948242, "global_step": 87141, "epoch": 720} {"train_loss": -36.125423431396484, "global_step": 87142, "epoch": 720} {"train_loss": -35.4504508972168, "global_step": 87143, "epoch": 720} {"train_loss": -36.55833053588867, "global_step": 87144, "epoch": 720} {"train_loss": -36.51438522338867, "global_step": 87145, "epoch": 720} {"train_loss": -35.68391799926758, "global_step": 87146, "epoch": 720} {"train_loss": -36.0192985534668, "global_step": 87147, "epoch": 720} {"train_loss": -35.978694915771484, "global_step": 87148, "epoch": 720} {"train_loss": -34.812923431396484, "global_step": 87149, "epoch": 720} {"train_loss": -36.447139739990234, "global_step": 87150, "epoch": 720} {"train_loss": -36.556331634521484, "global_step": 87151, "epoch": 720} {"train_loss": -34.023292541503906, "global_step": 87152, "epoch": 720} {"train_loss": -36.64699935913086, "global_step": 87153, "epoch": 720} {"train_loss": -36.59812927246094, "global_step": 87154, "epoch": 720} {"train_loss": -36.35653305053711, "global_step": 87155, "epoch": 720} {"train_loss": -33.869842529296875, "global_step": 87156, "epoch": 720} {"train_loss": -36.330562591552734, "global_step": 87157, "epoch": 720} {"train_loss": -36.5740966796875, "global_step": 87158, "epoch": 720} {"train_loss": -36.589656829833984, "global_step": 87159, "epoch": 720} {"train_loss": -36.14490509033203, "global_step": 87160, "epoch": 720} {"train_loss": -35.7385368347168, "global_step": 87161, "epoch": 720} {"train_loss": -36.60511779785156, "global_step": 87162, "epoch": 720} {"train_loss": -37.03109359741211, "global_step": 87163, "epoch": 720} {"train_loss": -35.91627883911133, "global_step": 87164, "epoch": 720} {"train_loss": -35.96641159057617, "global_step": 87165, "epoch": 720} {"train_loss": -36.69738006591797, "global_step": 87166, "epoch": 720} {"train_loss": -34.2230339050293, "global_step": 87167, "epoch": 720} {"train_loss": -37.02887725830078, "global_step": 87168, "epoch": 720} {"train_loss": -36.3350715637207, "global_step": 87169, "epoch": 720} {"train_loss": -37.365638732910156, "global_step": 87170, "epoch": 720} {"train_loss": -36.794212341308594, "global_step": 87171, "epoch": 720} {"train_loss": -36.49009704589844, "global_step": 87172, "epoch": 720} {"train_loss": -36.510005950927734, "global_step": 87173, "epoch": 720} {"train_loss": -36.620399475097656, "global_step": 87174, "epoch": 720} {"train_loss": -36.69694519042969, "global_step": 87175, "epoch": 720} {"train_loss": -36.9421272277832, "global_step": 87176, "epoch": 720} {"train_loss": -37.33684158325195, "global_step": 87177, "epoch": 720} {"train_loss": -36.800052642822266, "global_step": 87178, "epoch": 720} {"train_loss": -37.40338897705078, "global_step": 87179, "epoch": 720} {"train_loss": -36.41034698486328, "global_step": 87180, "epoch": 720} {"train_loss": -36.465980529785156, "global_step": 87181, "epoch": 720} {"train_loss": -37.541439056396484, "global_step": 87182, "epoch": 720} {"train_loss": -36.95711898803711, "global_step": 87183, "epoch": 720} {"train_loss": -36.24404525756836, "global_step": 87184, "epoch": 720} {"train_loss": -37.05963897705078, "global_step": 87185, "epoch": 720} {"train_loss": -37.55859375, "global_step": 87186, "epoch": 720} {"train_loss": -37.60103225708008, "global_step": 87187, "epoch": 720} {"train_loss": -36.780025482177734, "global_step": 87188, "epoch": 720} {"train_loss": -37.401756286621094, "global_step": 87189, "epoch": 720} {"train_loss": -37.2662353515625, "global_step": 87190, "epoch": 720} {"train_loss": -36.64512634277344, "global_step": 87191, "epoch": 720} {"train_loss": -37.374427795410156, "global_step": 87192, "epoch": 720} {"train_loss": -36.961181640625, "global_step": 87193, "epoch": 720} {"train_loss": -32.17777633666992, "global_step": 87194, "epoch": 720} {"train_loss": -36.86780548095703, "global_step": 87195, "epoch": 720} {"train_loss": -32.14669418334961, "global_step": 87196, "epoch": 720} {"train_loss": -29.154794692993164, "global_step": 87197, "epoch": 720} {"train_loss": -32.87116241455078, "global_step": 87198, "epoch": 720} {"train_loss": -31.525720596313477, "global_step": 87199, "epoch": 720} {"train_loss": -26.0072078704834, "global_step": 87200, "epoch": 720} {"train_loss": -30.3394832611084, "global_step": 87201, "epoch": 720} {"train_loss": -33.37950897216797, "global_step": 87202, "epoch": 720} {"train_loss": -36.150386810302734, "global_step": 87203, "epoch": 720} {"train_loss": -31.032520294189453, "global_step": 87204, "epoch": 720} {"train_loss": -35.8575553894043, "global_step": 87205, "epoch": 720} {"train_loss": -35.35416030883789, "global_step": 87206, "epoch": 720} {"train_loss": -34.29688262939453, "global_step": 87207, "epoch": 720} {"train_loss": -35.78049087524414, "global_step": 87208, "epoch": 720} {"train_loss": -35.49344253540039, "global_step": 87209, "epoch": 720} {"train_loss": -36.27759552001953, "global_step": 87210, "epoch": 720} {"train_loss": -34.44865417480469, "global_step": 87211, "epoch": 720} {"train_loss": -35.978328704833984, "global_step": 87212, "epoch": 720} {"train_loss": -36.872962951660156, "global_step": 87213, "epoch": 720} {"train_loss": -35.509307861328125, "global_step": 87214, "epoch": 720} {"train_loss": -36.56344223022461, "global_step": 87215, "epoch": 720} {"train_loss": -36.982513427734375, "global_step": 87216, "epoch": 720} {"train_loss": -36.9470100402832, "global_step": 87217, "epoch": 720} {"train_loss": -37.19636154174805, "global_step": 87218, "epoch": 720} {"train_loss": -37.492637634277344, "global_step": 87219, "epoch": 720} {"train_loss": -37.350032806396484, "global_step": 87220, "epoch": 720} {"train_loss": -37.24723434448242, "global_step": 87221, "epoch": 720} {"train_loss": -37.212711334228516, "global_step": 87222, "epoch": 720} {"train_loss": -37.6003303527832, "global_step": 87223, "epoch": 720} {"train_loss": -37.972110748291016, "global_step": 87224, "epoch": 720} {"train_loss": -37.5788688659668, "global_step": 87225, "epoch": 720} {"train_loss": -37.82332229614258, "global_step": 87226, "epoch": 720} {"train_loss": -37.612056732177734, "global_step": 87227, "epoch": 720} {"train_loss": -37.54799270629883, "global_step": 87228, "epoch": 720} {"train_loss": -38.038818359375, "global_step": 87229, "epoch": 720} {"train_loss": -38.091590881347656, "global_step": 87230, "epoch": 720} {"train_loss": -38.102020263671875, "global_step": 87231, "epoch": 720} {"train_loss": -37.56766891479492, "global_step": 87232, "epoch": 720} {"train_loss": -38.034950256347656, "global_step": 87233, "epoch": 720} {"train_loss": -37.85579299926758, "global_step": 87234, "epoch": 720} {"train_loss": -37.98438262939453, "global_step": 87235, "epoch": 720} {"train_loss": -37.92586898803711, "global_step": 87236, "epoch": 720} {"train_loss": -38.18661117553711, "global_step": 87237, "epoch": 720} {"train_loss": -37.5502815246582, "global_step": 87238, "epoch": 720} {"train_loss": -37.22123718261719, "global_step": 87239, "epoch": 720} {"train_loss": -35.94846227346373, "global_step": 87240, "epoch": 720, "val_loss": 2564903.25} {"train_loss": -38.29902267456055, "global_step": 87241, "epoch": 721} {"train_loss": -38.02381134033203, "global_step": 87242, "epoch": 721} {"train_loss": -38.31927490234375, "global_step": 87243, "epoch": 721} {"train_loss": -38.34711837768555, "global_step": 87244, "epoch": 721} {"train_loss": -37.78513717651367, "global_step": 87245, "epoch": 721} {"train_loss": -37.034820556640625, "global_step": 87246, "epoch": 721} {"train_loss": -36.59218978881836, "global_step": 87247, "epoch": 721} {"train_loss": -36.593441009521484, "global_step": 87248, "epoch": 721} {"train_loss": -37.716854095458984, "global_step": 87249, "epoch": 721} {"train_loss": -38.169464111328125, "global_step": 87250, "epoch": 721} {"train_loss": -37.875648498535156, "global_step": 87251, "epoch": 721} {"train_loss": -36.70371627807617, "global_step": 87252, "epoch": 721} {"train_loss": -34.58473587036133, "global_step": 87253, "epoch": 721} {"train_loss": -33.32375717163086, "global_step": 87254, "epoch": 721} {"train_loss": -34.28041458129883, "global_step": 87255, "epoch": 721} {"train_loss": -34.84249496459961, "global_step": 87256, "epoch": 721} {"train_loss": -36.240291595458984, "global_step": 87257, "epoch": 721} {"train_loss": -37.00248336791992, "global_step": 87258, "epoch": 721} {"train_loss": -36.705474853515625, "global_step": 87259, "epoch": 721} {"train_loss": -37.0509147644043, "global_step": 87260, "epoch": 721} {"train_loss": -36.936153411865234, "global_step": 87261, "epoch": 721} {"train_loss": -34.043392181396484, "global_step": 87262, "epoch": 721} {"train_loss": -37.63383865356445, "global_step": 87263, "epoch": 721} {"train_loss": -37.80754089355469, "global_step": 87264, "epoch": 721} {"train_loss": -36.51681137084961, "global_step": 87265, "epoch": 721} {"train_loss": -37.092891693115234, "global_step": 87266, "epoch": 721} {"train_loss": -37.74278259277344, "global_step": 87267, "epoch": 721} {"train_loss": -35.77549362182617, "global_step": 87268, "epoch": 721} {"train_loss": -36.517234802246094, "global_step": 87269, "epoch": 721} {"train_loss": -36.333351135253906, "global_step": 87270, "epoch": 721} {"train_loss": -36.935821533203125, "global_step": 87271, "epoch": 721} {"train_loss": -37.870357513427734, "global_step": 87272, "epoch": 721} {"train_loss": -37.27863311767578, "global_step": 87273, "epoch": 721} {"train_loss": -37.13682174682617, "global_step": 87274, "epoch": 721} {"train_loss": -36.876197814941406, "global_step": 87275, "epoch": 721} {"train_loss": -38.11738586425781, "global_step": 87276, "epoch": 721} {"train_loss": -37.539276123046875, "global_step": 87277, "epoch": 721} {"train_loss": -37.61208724975586, "global_step": 87278, "epoch": 721} {"train_loss": -37.0424919128418, "global_step": 87279, "epoch": 721} {"train_loss": -37.196075439453125, "global_step": 87280, "epoch": 721} {"train_loss": -37.80147933959961, "global_step": 87281, "epoch": 721} {"train_loss": -37.461910247802734, "global_step": 87282, "epoch": 721} {"train_loss": -37.6732292175293, "global_step": 87283, "epoch": 721} {"train_loss": -37.834983825683594, "global_step": 87284, "epoch": 721} {"train_loss": -37.71907424926758, "global_step": 87285, "epoch": 721} {"train_loss": -37.96538543701172, "global_step": 87286, "epoch": 721} {"train_loss": -36.44534683227539, "global_step": 87287, "epoch": 721} {"train_loss": -35.09790802001953, "global_step": 87288, "epoch": 721} {"train_loss": -38.126380920410156, "global_step": 87289, "epoch": 721} {"train_loss": -37.909786224365234, "global_step": 87290, "epoch": 721} {"train_loss": -37.06101989746094, "global_step": 87291, "epoch": 721} {"train_loss": -36.46282196044922, "global_step": 87292, "epoch": 721} {"train_loss": -37.685462951660156, "global_step": 87293, "epoch": 721} {"train_loss": -36.47860336303711, "global_step": 87294, "epoch": 721} {"train_loss": -36.23273468017578, "global_step": 87295, "epoch": 721} {"train_loss": -37.3836669921875, "global_step": 87296, "epoch": 721} {"train_loss": -38.425106048583984, "global_step": 87297, "epoch": 721} {"train_loss": -37.42247009277344, "global_step": 87298, "epoch": 721} {"train_loss": -37.84339141845703, "global_step": 87299, "epoch": 721} {"train_loss": -37.355613708496094, "global_step": 87300, "epoch": 721} {"train_loss": -37.1082878112793, "global_step": 87301, "epoch": 721} {"train_loss": -38.03843307495117, "global_step": 87302, "epoch": 721} {"train_loss": -37.29580307006836, "global_step": 87303, "epoch": 721} {"train_loss": -37.5565299987793, "global_step": 87304, "epoch": 721} {"train_loss": -38.21968078613281, "global_step": 87305, "epoch": 721} {"train_loss": -38.206478118896484, "global_step": 87306, "epoch": 721} {"train_loss": -37.7056884765625, "global_step": 87307, "epoch": 721} {"train_loss": -36.44160079956055, "global_step": 87308, "epoch": 721} {"train_loss": -37.48073959350586, "global_step": 87309, "epoch": 721} {"train_loss": -37.90178298950195, "global_step": 87310, "epoch": 721} {"train_loss": -37.100643157958984, "global_step": 87311, "epoch": 721} {"train_loss": -36.4250373840332, "global_step": 87312, "epoch": 721} {"train_loss": -37.706825256347656, "global_step": 87313, "epoch": 721} {"train_loss": -36.72090530395508, "global_step": 87314, "epoch": 721} {"train_loss": -37.01637649536133, "global_step": 87315, "epoch": 721} {"train_loss": -38.295654296875, "global_step": 87316, "epoch": 721} {"train_loss": -36.46540451049805, "global_step": 87317, "epoch": 721} {"train_loss": -37.6243782043457, "global_step": 87318, "epoch": 721} {"train_loss": -38.13872528076172, "global_step": 87319, "epoch": 721} {"train_loss": -37.32806396484375, "global_step": 87320, "epoch": 721} {"train_loss": -38.05851364135742, "global_step": 87321, "epoch": 721} {"train_loss": -38.39064025878906, "global_step": 87322, "epoch": 721} {"train_loss": -37.41859817504883, "global_step": 87323, "epoch": 721} {"train_loss": -37.69855880737305, "global_step": 87324, "epoch": 721} {"train_loss": -37.6138801574707, "global_step": 87325, "epoch": 721} {"train_loss": -37.88068389892578, "global_step": 87326, "epoch": 721} {"train_loss": -36.70817947387695, "global_step": 87327, "epoch": 721} {"train_loss": -36.574771881103516, "global_step": 87328, "epoch": 721} {"train_loss": -37.416114807128906, "global_step": 87329, "epoch": 721} {"train_loss": -38.41020584106445, "global_step": 87330, "epoch": 721} {"train_loss": -38.306724548339844, "global_step": 87331, "epoch": 721} {"train_loss": -37.364044189453125, "global_step": 87332, "epoch": 721} {"train_loss": -37.00568389892578, "global_step": 87333, "epoch": 721} {"train_loss": -36.78089141845703, "global_step": 87334, "epoch": 721} {"train_loss": -38.04743194580078, "global_step": 87335, "epoch": 721} {"train_loss": -37.35496139526367, "global_step": 87336, "epoch": 721} {"train_loss": -38.15177536010742, "global_step": 87337, "epoch": 721} {"train_loss": -37.754634857177734, "global_step": 87338, "epoch": 721} {"train_loss": -37.93131637573242, "global_step": 87339, "epoch": 721} {"train_loss": -37.548187255859375, "global_step": 87340, "epoch": 721} {"train_loss": -37.28797912597656, "global_step": 87341, "epoch": 721} {"train_loss": -36.983917236328125, "global_step": 87342, "epoch": 721} {"train_loss": -37.343196868896484, "global_step": 87343, "epoch": 721} {"train_loss": -36.19954299926758, "global_step": 87344, "epoch": 721} {"train_loss": -37.413665771484375, "global_step": 87345, "epoch": 721} {"train_loss": -37.21200180053711, "global_step": 87346, "epoch": 721} {"train_loss": -37.093849182128906, "global_step": 87347, "epoch": 721} {"train_loss": -37.318885803222656, "global_step": 87348, "epoch": 721} {"train_loss": -36.63011932373047, "global_step": 87349, "epoch": 721} {"train_loss": -37.17536163330078, "global_step": 87350, "epoch": 721} {"train_loss": -37.5115966796875, "global_step": 87351, "epoch": 721} {"train_loss": -37.927249908447266, "global_step": 87352, "epoch": 721} {"train_loss": -37.63128662109375, "global_step": 87353, "epoch": 721} {"train_loss": -37.410335540771484, "global_step": 87354, "epoch": 721} {"train_loss": -37.95475387573242, "global_step": 87355, "epoch": 721} {"train_loss": -36.016963958740234, "global_step": 87356, "epoch": 721} {"train_loss": -37.07040786743164, "global_step": 87357, "epoch": 721} {"train_loss": -37.0826301574707, "global_step": 87358, "epoch": 721} {"train_loss": -37.41660690307617, "global_step": 87359, "epoch": 721} {"train_loss": -37.25593185424805, "global_step": 87360, "epoch": 721} {"train_loss": -37.229633362825254, "global_step": 87361, "epoch": 721, "val_loss": 2497127.0} {"train_loss": -36.82070541381836, "global_step": 87362, "epoch": 722} {"train_loss": -35.6158561706543, "global_step": 87363, "epoch": 722} {"train_loss": -34.0604362487793, "global_step": 87364, "epoch": 722} {"train_loss": -35.228492736816406, "global_step": 87365, "epoch": 722} {"train_loss": -37.186397552490234, "global_step": 87366, "epoch": 722} {"train_loss": -35.29136276245117, "global_step": 87367, "epoch": 722} {"train_loss": -36.358829498291016, "global_step": 87368, "epoch": 722} {"train_loss": -36.45365524291992, "global_step": 87369, "epoch": 722} {"train_loss": -36.49870681762695, "global_step": 87370, "epoch": 722} {"train_loss": -36.91309356689453, "global_step": 87371, "epoch": 722} {"train_loss": -35.60478973388672, "global_step": 87372, "epoch": 722} {"train_loss": -35.8974609375, "global_step": 87373, "epoch": 722} {"train_loss": -33.96608352661133, "global_step": 87374, "epoch": 722} {"train_loss": -37.57225799560547, "global_step": 87375, "epoch": 722} {"train_loss": -36.8808708190918, "global_step": 87376, "epoch": 722} {"train_loss": -37.29739761352539, "global_step": 87377, "epoch": 722} {"train_loss": -37.7788200378418, "global_step": 87378, "epoch": 722} {"train_loss": -34.82503890991211, "global_step": 87379, "epoch": 722} {"train_loss": -33.28609848022461, "global_step": 87380, "epoch": 722} {"train_loss": -35.66935348510742, "global_step": 87381, "epoch": 722} {"train_loss": -33.58489227294922, "global_step": 87382, "epoch": 722} {"train_loss": -36.1774787902832, "global_step": 87383, "epoch": 722} {"train_loss": -36.05330276489258, "global_step": 87384, "epoch": 722} {"train_loss": -36.48405456542969, "global_step": 87385, "epoch": 722} {"train_loss": -36.22394561767578, "global_step": 87386, "epoch": 722} {"train_loss": -35.461368560791016, "global_step": 87387, "epoch": 722} {"train_loss": -36.2075309753418, "global_step": 87388, "epoch": 722} {"train_loss": -36.03432083129883, "global_step": 87389, "epoch": 722} {"train_loss": -36.1557502746582, "global_step": 87390, "epoch": 722} {"train_loss": -35.32601547241211, "global_step": 87391, "epoch": 722} {"train_loss": -35.85982894897461, "global_step": 87392, "epoch": 722} {"train_loss": -36.43061065673828, "global_step": 87393, "epoch": 722} {"train_loss": -36.041072845458984, "global_step": 87394, "epoch": 722} {"train_loss": -36.5905876159668, "global_step": 87395, "epoch": 722} {"train_loss": -37.523738861083984, "global_step": 87396, "epoch": 722} {"train_loss": -36.788787841796875, "global_step": 87397, "epoch": 722} {"train_loss": -37.28190994262695, "global_step": 87398, "epoch": 722} {"train_loss": -37.49860382080078, "global_step": 87399, "epoch": 722} {"train_loss": -37.54743576049805, "global_step": 87400, "epoch": 722} {"train_loss": -37.63372802734375, "global_step": 87401, "epoch": 722} {"train_loss": -36.73332977294922, "global_step": 87402, "epoch": 722} {"train_loss": -36.86434555053711, "global_step": 87403, "epoch": 722} {"train_loss": -37.51634979248047, "global_step": 87404, "epoch": 722} {"train_loss": -37.4802360534668, "global_step": 87405, "epoch": 722} {"train_loss": -36.79821014404297, "global_step": 87406, "epoch": 722} {"train_loss": -36.82867431640625, "global_step": 87407, "epoch": 722} {"train_loss": -37.27973556518555, "global_step": 87408, "epoch": 722} {"train_loss": -36.79587936401367, "global_step": 87409, "epoch": 722} {"train_loss": -37.066688537597656, "global_step": 87410, "epoch": 722} {"train_loss": -36.1067008972168, "global_step": 87411, "epoch": 722} {"train_loss": -36.4701042175293, "global_step": 87412, "epoch": 722} {"train_loss": -37.6077766418457, "global_step": 87413, "epoch": 722} {"train_loss": -37.64008331298828, "global_step": 87414, "epoch": 722} {"train_loss": -36.476741790771484, "global_step": 87415, "epoch": 722} {"train_loss": -36.56068801879883, "global_step": 87416, "epoch": 722} {"train_loss": -37.292781829833984, "global_step": 87417, "epoch": 722} {"train_loss": -37.47705078125, "global_step": 87418, "epoch": 722} {"train_loss": -36.72150802612305, "global_step": 87419, "epoch": 722} {"train_loss": -35.89379119873047, "global_step": 87420, "epoch": 722} {"train_loss": -36.34916305541992, "global_step": 87421, "epoch": 722} {"train_loss": -37.56324768066406, "global_step": 87422, "epoch": 722} {"train_loss": -36.95644760131836, "global_step": 87423, "epoch": 722} {"train_loss": -36.89921569824219, "global_step": 87424, "epoch": 722} {"train_loss": -35.93742752075195, "global_step": 87425, "epoch": 722} {"train_loss": -37.379146575927734, "global_step": 87426, "epoch": 722} {"train_loss": -37.42911911010742, "global_step": 87427, "epoch": 722} {"train_loss": -37.942657470703125, "global_step": 87428, "epoch": 722} {"train_loss": -37.203208923339844, "global_step": 87429, "epoch": 722} {"train_loss": -37.7982063293457, "global_step": 87430, "epoch": 722} {"train_loss": -37.81861114501953, "global_step": 87431, "epoch": 722} {"train_loss": -37.57849884033203, "global_step": 87432, "epoch": 722} {"train_loss": -36.807106018066406, "global_step": 87433, "epoch": 722} {"train_loss": -37.89167404174805, "global_step": 87434, "epoch": 722} {"train_loss": -37.9770393371582, "global_step": 87435, "epoch": 722} {"train_loss": -37.804439544677734, "global_step": 87436, "epoch": 722} {"train_loss": -37.343162536621094, "global_step": 87437, "epoch": 722} {"train_loss": -37.4940299987793, "global_step": 87438, "epoch": 722} {"train_loss": -36.5593376159668, "global_step": 87439, "epoch": 722} {"train_loss": -36.45412063598633, "global_step": 87440, "epoch": 722} {"train_loss": -37.167816162109375, "global_step": 87441, "epoch": 722} {"train_loss": -38.38885498046875, "global_step": 87442, "epoch": 722} {"train_loss": -38.04280471801758, "global_step": 87443, "epoch": 722} {"train_loss": -37.93050765991211, "global_step": 87444, "epoch": 722} {"train_loss": -38.186092376708984, "global_step": 87445, "epoch": 722} {"train_loss": -38.031288146972656, "global_step": 87446, "epoch": 722} {"train_loss": -38.2645149230957, "global_step": 87447, "epoch": 722} {"train_loss": -37.601768493652344, "global_step": 87448, "epoch": 722} {"train_loss": -37.36284255981445, "global_step": 87449, "epoch": 722} {"train_loss": -38.08060836791992, "global_step": 87450, "epoch": 722} {"train_loss": -38.35560989379883, "global_step": 87451, "epoch": 722} {"train_loss": -37.91754913330078, "global_step": 87452, "epoch": 722} {"train_loss": -38.54829788208008, "global_step": 87453, "epoch": 722} {"train_loss": -37.69072341918945, "global_step": 87454, "epoch": 722} {"train_loss": -38.62733840942383, "global_step": 87455, "epoch": 722} {"train_loss": -37.63985061645508, "global_step": 87456, "epoch": 722} {"train_loss": -37.474578857421875, "global_step": 87457, "epoch": 722} {"train_loss": -36.26005172729492, "global_step": 87458, "epoch": 722} {"train_loss": -37.26884078979492, "global_step": 87459, "epoch": 722} {"train_loss": -38.286094665527344, "global_step": 87460, "epoch": 722} {"train_loss": -38.2209587097168, "global_step": 87461, "epoch": 722} {"train_loss": -37.52244186401367, "global_step": 87462, "epoch": 722} {"train_loss": -37.75754928588867, "global_step": 87463, "epoch": 722} {"train_loss": -38.07892990112305, "global_step": 87464, "epoch": 722} {"train_loss": -37.204689025878906, "global_step": 87465, "epoch": 722} {"train_loss": -37.219764709472656, "global_step": 87466, "epoch": 722} {"train_loss": -38.5677490234375, "global_step": 87467, "epoch": 722} {"train_loss": -37.98031997680664, "global_step": 87468, "epoch": 722} {"train_loss": -36.51087188720703, "global_step": 87469, "epoch": 722} {"train_loss": -36.01893615722656, "global_step": 87470, "epoch": 722} {"train_loss": -37.091487884521484, "global_step": 87471, "epoch": 722} {"train_loss": -38.441890716552734, "global_step": 87472, "epoch": 722} {"train_loss": -35.912139892578125, "global_step": 87473, "epoch": 722} {"train_loss": -34.869503021240234, "global_step": 87474, "epoch": 722} {"train_loss": -35.40607452392578, "global_step": 87475, "epoch": 722} {"train_loss": -37.9459228515625, "global_step": 87476, "epoch": 722} {"train_loss": -37.795440673828125, "global_step": 87477, "epoch": 722} {"train_loss": -35.50935745239258, "global_step": 87478, "epoch": 722} {"train_loss": -37.600772857666016, "global_step": 87479, "epoch": 722} {"train_loss": -38.12451934814453, "global_step": 87480, "epoch": 722} {"train_loss": -36.65129852294922, "global_step": 87481, "epoch": 722} {"train_loss": -36.92382374282711, "global_step": 87482, "epoch": 722, "val_loss": 2697767.0} {"train_loss": -38.472145080566406, "global_step": 87483, "epoch": 723} {"train_loss": -36.01411437988281, "global_step": 87484, "epoch": 723} {"train_loss": -37.94610595703125, "global_step": 87485, "epoch": 723} {"train_loss": -36.98234176635742, "global_step": 87486, "epoch": 723} {"train_loss": -37.47620391845703, "global_step": 87487, "epoch": 723} {"train_loss": -36.14716720581055, "global_step": 87488, "epoch": 723} {"train_loss": -36.78621292114258, "global_step": 87489, "epoch": 723} {"train_loss": -38.46376037597656, "global_step": 87490, "epoch": 723} {"train_loss": -36.724117279052734, "global_step": 87491, "epoch": 723} {"train_loss": -37.00000762939453, "global_step": 87492, "epoch": 723} {"train_loss": -35.91667556762695, "global_step": 87493, "epoch": 723} {"train_loss": -37.50814437866211, "global_step": 87494, "epoch": 723} {"train_loss": -36.46989059448242, "global_step": 87495, "epoch": 723} {"train_loss": -36.12221908569336, "global_step": 87496, "epoch": 723} {"train_loss": -36.509639739990234, "global_step": 87497, "epoch": 723} {"train_loss": -34.2975959777832, "global_step": 87498, "epoch": 723} {"train_loss": -34.570526123046875, "global_step": 87499, "epoch": 723} {"train_loss": -33.943294525146484, "global_step": 87500, "epoch": 723} {"train_loss": -36.39204788208008, "global_step": 87501, "epoch": 723} {"train_loss": -35.05084228515625, "global_step": 87502, "epoch": 723} {"train_loss": -35.8929328918457, "global_step": 87503, "epoch": 723} {"train_loss": -35.70927047729492, "global_step": 87504, "epoch": 723} {"train_loss": -35.265113830566406, "global_step": 87505, "epoch": 723} {"train_loss": -35.4569206237793, "global_step": 87506, "epoch": 723} {"train_loss": -35.89213180541992, "global_step": 87507, "epoch": 723} {"train_loss": -33.8033561706543, "global_step": 87508, "epoch": 723} {"train_loss": -31.5045108795166, "global_step": 87509, "epoch": 723} {"train_loss": -34.14741134643555, "global_step": 87510, "epoch": 723} {"train_loss": -34.18054962158203, "global_step": 87511, "epoch": 723} {"train_loss": -32.099822998046875, "global_step": 87512, "epoch": 723} {"train_loss": -35.834476470947266, "global_step": 87513, "epoch": 723} {"train_loss": -33.70722579956055, "global_step": 87514, "epoch": 723} {"train_loss": -34.92436599731445, "global_step": 87515, "epoch": 723} {"train_loss": -33.8361701965332, "global_step": 87516, "epoch": 723} {"train_loss": -32.564510345458984, "global_step": 87517, "epoch": 723} {"train_loss": -35.55078125, "global_step": 87518, "epoch": 723} {"train_loss": -35.29985427856445, "global_step": 87519, "epoch": 723} {"train_loss": -33.61489486694336, "global_step": 87520, "epoch": 723} {"train_loss": -36.46307373046875, "global_step": 87521, "epoch": 723} {"train_loss": -32.898311614990234, "global_step": 87522, "epoch": 723} {"train_loss": -35.58454895019531, "global_step": 87523, "epoch": 723} {"train_loss": -35.333030700683594, "global_step": 87524, "epoch": 723} {"train_loss": -36.60504913330078, "global_step": 87525, "epoch": 723} {"train_loss": -35.79055404663086, "global_step": 87526, "epoch": 723} {"train_loss": -36.333656311035156, "global_step": 87527, "epoch": 723} {"train_loss": -35.85687255859375, "global_step": 87528, "epoch": 723} {"train_loss": -35.82122802734375, "global_step": 87529, "epoch": 723} {"train_loss": -34.32912063598633, "global_step": 87530, "epoch": 723} {"train_loss": -35.58120346069336, "global_step": 87531, "epoch": 723} {"train_loss": -35.480167388916016, "global_step": 87532, "epoch": 723} {"train_loss": -36.5869026184082, "global_step": 87533, "epoch": 723} {"train_loss": -36.218868255615234, "global_step": 87534, "epoch": 723} {"train_loss": -36.52386474609375, "global_step": 87535, "epoch": 723} {"train_loss": -36.24885940551758, "global_step": 87536, "epoch": 723} {"train_loss": -35.97817611694336, "global_step": 87537, "epoch": 723} {"train_loss": -36.56048583984375, "global_step": 87538, "epoch": 723} {"train_loss": -36.0098991394043, "global_step": 87539, "epoch": 723} {"train_loss": -36.81409454345703, "global_step": 87540, "epoch": 723} {"train_loss": -36.54777908325195, "global_step": 87541, "epoch": 723} {"train_loss": -37.13288497924805, "global_step": 87542, "epoch": 723} {"train_loss": -36.523075103759766, "global_step": 87543, "epoch": 723} {"train_loss": -36.30757522583008, "global_step": 87544, "epoch": 723} {"train_loss": -36.70551300048828, "global_step": 87545, "epoch": 723} {"train_loss": -36.571041107177734, "global_step": 87546, "epoch": 723} {"train_loss": -36.67422103881836, "global_step": 87547, "epoch": 723} {"train_loss": -36.78407287597656, "global_step": 87548, "epoch": 723} {"train_loss": -37.07121658325195, "global_step": 87549, "epoch": 723} {"train_loss": -36.97930908203125, "global_step": 87550, "epoch": 723} {"train_loss": -36.91352081298828, "global_step": 87551, "epoch": 723} {"train_loss": -37.43593215942383, "global_step": 87552, "epoch": 723} {"train_loss": -37.56290817260742, "global_step": 87553, "epoch": 723} {"train_loss": -37.8349609375, "global_step": 87554, "epoch": 723} {"train_loss": -37.67293167114258, "global_step": 87555, "epoch": 723} {"train_loss": -37.83283615112305, "global_step": 87556, "epoch": 723} {"train_loss": -37.7984619140625, "global_step": 87557, "epoch": 723} {"train_loss": -37.19800567626953, "global_step": 87558, "epoch": 723} {"train_loss": -37.545135498046875, "global_step": 87559, "epoch": 723} {"train_loss": -37.8159294128418, "global_step": 87560, "epoch": 723} {"train_loss": -37.8431510925293, "global_step": 87561, "epoch": 723} {"train_loss": -37.14069747924805, "global_step": 87562, "epoch": 723} {"train_loss": -36.61146926879883, "global_step": 87563, "epoch": 723} {"train_loss": -36.8807487487793, "global_step": 87564, "epoch": 723} {"train_loss": -37.059295654296875, "global_step": 87565, "epoch": 723} {"train_loss": -37.827388763427734, "global_step": 87566, "epoch": 723} {"train_loss": -38.19434356689453, "global_step": 87567, "epoch": 723} {"train_loss": -38.17671585083008, "global_step": 87568, "epoch": 723} {"train_loss": -37.54227066040039, "global_step": 87569, "epoch": 723} {"train_loss": -36.58970260620117, "global_step": 87570, "epoch": 723} {"train_loss": -34.88664627075195, "global_step": 87571, "epoch": 723} {"train_loss": -35.169288635253906, "global_step": 87572, "epoch": 723} {"train_loss": -34.81843185424805, "global_step": 87573, "epoch": 723} {"train_loss": -35.605140686035156, "global_step": 87574, "epoch": 723} {"train_loss": -37.944400787353516, "global_step": 87575, "epoch": 723} {"train_loss": -37.542667388916016, "global_step": 87576, "epoch": 723} {"train_loss": -35.14491653442383, "global_step": 87577, "epoch": 723} {"train_loss": -37.16572189331055, "global_step": 87578, "epoch": 723} {"train_loss": -38.11209487915039, "global_step": 87579, "epoch": 723} {"train_loss": -37.69666290283203, "global_step": 87580, "epoch": 723} {"train_loss": -36.60354232788086, "global_step": 87581, "epoch": 723} {"train_loss": -37.66704559326172, "global_step": 87582, "epoch": 723} {"train_loss": -37.993343353271484, "global_step": 87583, "epoch": 723} {"train_loss": -37.33192825317383, "global_step": 87584, "epoch": 723} {"train_loss": -38.18730163574219, "global_step": 87585, "epoch": 723} {"train_loss": -38.44191360473633, "global_step": 87586, "epoch": 723} {"train_loss": -37.89173126220703, "global_step": 87587, "epoch": 723} {"train_loss": -38.18798065185547, "global_step": 87588, "epoch": 723} {"train_loss": -38.56974411010742, "global_step": 87589, "epoch": 723} {"train_loss": -38.368648529052734, "global_step": 87590, "epoch": 723} {"train_loss": -37.43447494506836, "global_step": 87591, "epoch": 723} {"train_loss": -38.64366149902344, "global_step": 87592, "epoch": 723} {"train_loss": -38.19610595703125, "global_step": 87593, "epoch": 723} {"train_loss": -38.162132263183594, "global_step": 87594, "epoch": 723} {"train_loss": -38.122833251953125, "global_step": 87595, "epoch": 723} {"train_loss": -36.37519073486328, "global_step": 87596, "epoch": 723} {"train_loss": -37.525909423828125, "global_step": 87597, "epoch": 723} {"train_loss": -37.94183349609375, "global_step": 87598, "epoch": 723} {"train_loss": -37.90947341918945, "global_step": 87599, "epoch": 723} {"train_loss": -37.876461029052734, "global_step": 87600, "epoch": 723} {"train_loss": -38.239906311035156, "global_step": 87601, "epoch": 723} {"train_loss": -37.6640625, "global_step": 87602, "epoch": 723} {"train_loss": -36.499430459392954, "global_step": 87603, "epoch": 723, "val_loss": 2646554.25} {"train_loss": -38.237545013427734, "global_step": 87604, "epoch": 724} {"train_loss": -38.23592758178711, "global_step": 87605, "epoch": 724} {"train_loss": -37.983253479003906, "global_step": 87606, "epoch": 724} {"train_loss": -38.3505859375, "global_step": 87607, "epoch": 724} {"train_loss": -37.749420166015625, "global_step": 87608, "epoch": 724} {"train_loss": -38.0926628112793, "global_step": 87609, "epoch": 724} {"train_loss": -38.612403869628906, "global_step": 87610, "epoch": 724} {"train_loss": -38.269081115722656, "global_step": 87611, "epoch": 724} {"train_loss": -38.41527557373047, "global_step": 87612, "epoch": 724} {"train_loss": -38.588409423828125, "global_step": 87613, "epoch": 724} {"train_loss": -37.84416198730469, "global_step": 87614, "epoch": 724} {"train_loss": -37.76093673706055, "global_step": 87615, "epoch": 724} {"train_loss": -37.763614654541016, "global_step": 87616, "epoch": 724} {"train_loss": -38.04254913330078, "global_step": 87617, "epoch": 724} {"train_loss": -38.328392028808594, "global_step": 87618, "epoch": 724} {"train_loss": -37.80604934692383, "global_step": 87619, "epoch": 724} {"train_loss": -37.7785530090332, "global_step": 87620, "epoch": 724} {"train_loss": -37.69493865966797, "global_step": 87621, "epoch": 724} {"train_loss": -36.40843200683594, "global_step": 87622, "epoch": 724} {"train_loss": -37.50612258911133, "global_step": 87623, "epoch": 724} {"train_loss": -38.655189514160156, "global_step": 87624, "epoch": 724} {"train_loss": -38.24819564819336, "global_step": 87625, "epoch": 724} {"train_loss": -37.23369216918945, "global_step": 87626, "epoch": 724} {"train_loss": -37.901283264160156, "global_step": 87627, "epoch": 724} {"train_loss": -38.0391845703125, "global_step": 87628, "epoch": 724} {"train_loss": -37.38822555541992, "global_step": 87629, "epoch": 724} {"train_loss": -37.81240463256836, "global_step": 87630, "epoch": 724} {"train_loss": -37.72611618041992, "global_step": 87631, "epoch": 724} {"train_loss": -37.468116760253906, "global_step": 87632, "epoch": 724} {"train_loss": -37.131988525390625, "global_step": 87633, "epoch": 724} {"train_loss": -38.07231903076172, "global_step": 87634, "epoch": 724} {"train_loss": -36.718345642089844, "global_step": 87635, "epoch": 724} {"train_loss": -38.1093635559082, "global_step": 87636, "epoch": 724} {"train_loss": -38.652008056640625, "global_step": 87637, "epoch": 724} {"train_loss": -37.9373779296875, "global_step": 87638, "epoch": 724} {"train_loss": -37.241268157958984, "global_step": 87639, "epoch": 724} {"train_loss": -34.627716064453125, "global_step": 87640, "epoch": 724} {"train_loss": -36.469146728515625, "global_step": 87641, "epoch": 724} {"train_loss": -37.33696746826172, "global_step": 87642, "epoch": 724} {"train_loss": -36.327301025390625, "global_step": 87643, "epoch": 724} {"train_loss": -36.721702575683594, "global_step": 87644, "epoch": 724} {"train_loss": -34.61825180053711, "global_step": 87645, "epoch": 724} {"train_loss": -37.33937454223633, "global_step": 87646, "epoch": 724} {"train_loss": -34.80952072143555, "global_step": 87647, "epoch": 724} {"train_loss": -34.86758041381836, "global_step": 87648, "epoch": 724} {"train_loss": -37.157196044921875, "global_step": 87649, "epoch": 724} {"train_loss": -35.355567932128906, "global_step": 87650, "epoch": 724} {"train_loss": -35.467647552490234, "global_step": 87651, "epoch": 724} {"train_loss": -34.28312683105469, "global_step": 87652, "epoch": 724} {"train_loss": -33.075965881347656, "global_step": 87653, "epoch": 724} {"train_loss": -35.021053314208984, "global_step": 87654, "epoch": 724} {"train_loss": -32.38552474975586, "global_step": 87655, "epoch": 724} {"train_loss": -32.66671371459961, "global_step": 87656, "epoch": 724} {"train_loss": -34.43178176879883, "global_step": 87657, "epoch": 724} {"train_loss": -32.35131072998047, "global_step": 87658, "epoch": 724} {"train_loss": -35.00654983520508, "global_step": 87659, "epoch": 724} {"train_loss": -30.395782470703125, "global_step": 87660, "epoch": 724} {"train_loss": -35.587623596191406, "global_step": 87661, "epoch": 724} {"train_loss": -33.91874313354492, "global_step": 87662, "epoch": 724} {"train_loss": -34.195858001708984, "global_step": 87663, "epoch": 724} {"train_loss": -35.54723358154297, "global_step": 87664, "epoch": 724} {"train_loss": -33.78202438354492, "global_step": 87665, "epoch": 724} {"train_loss": -32.65598678588867, "global_step": 87666, "epoch": 724} {"train_loss": -34.86872482299805, "global_step": 87667, "epoch": 724} {"train_loss": -34.376338958740234, "global_step": 87668, "epoch": 724} {"train_loss": -33.742610931396484, "global_step": 87669, "epoch": 724} {"train_loss": -35.06905746459961, "global_step": 87670, "epoch": 724} {"train_loss": -34.3759765625, "global_step": 87671, "epoch": 724} {"train_loss": -35.28304672241211, "global_step": 87672, "epoch": 724} {"train_loss": -35.049415588378906, "global_step": 87673, "epoch": 724} {"train_loss": -35.552642822265625, "global_step": 87674, "epoch": 724} {"train_loss": -36.3945198059082, "global_step": 87675, "epoch": 724} {"train_loss": -36.1732063293457, "global_step": 87676, "epoch": 724} {"train_loss": -35.114837646484375, "global_step": 87677, "epoch": 724} {"train_loss": -36.499149322509766, "global_step": 87678, "epoch": 724} {"train_loss": -35.90922927856445, "global_step": 87679, "epoch": 724} {"train_loss": -36.356109619140625, "global_step": 87680, "epoch": 724} {"train_loss": -35.79327392578125, "global_step": 87681, "epoch": 724} {"train_loss": -35.91954040527344, "global_step": 87682, "epoch": 724} {"train_loss": -35.72261428833008, "global_step": 87683, "epoch": 724} {"train_loss": -32.72927474975586, "global_step": 87684, "epoch": 724} {"train_loss": -35.96220016479492, "global_step": 87685, "epoch": 724} {"train_loss": -34.57986068725586, "global_step": 87686, "epoch": 724} {"train_loss": -31.6350040435791, "global_step": 87687, "epoch": 724} {"train_loss": -33.57601547241211, "global_step": 87688, "epoch": 724} {"train_loss": -34.990570068359375, "global_step": 87689, "epoch": 724} {"train_loss": -32.84908676147461, "global_step": 87690, "epoch": 724} {"train_loss": -28.300634384155273, "global_step": 87691, "epoch": 724} {"train_loss": -34.30609130859375, "global_step": 87692, "epoch": 724} {"train_loss": -31.86541175842285, "global_step": 87693, "epoch": 724} {"train_loss": -29.9053955078125, "global_step": 87694, "epoch": 724} {"train_loss": -31.395959854125977, "global_step": 87695, "epoch": 724} {"train_loss": -33.12438201904297, "global_step": 87696, "epoch": 724} {"train_loss": -34.896217346191406, "global_step": 87697, "epoch": 724} {"train_loss": -25.61188316345215, "global_step": 87698, "epoch": 724} {"train_loss": -31.4141902923584, "global_step": 87699, "epoch": 724} {"train_loss": -30.923114776611328, "global_step": 87700, "epoch": 724} {"train_loss": -27.529083251953125, "global_step": 87701, "epoch": 724} {"train_loss": -34.541748046875, "global_step": 87702, "epoch": 724} {"train_loss": -32.35230255126953, "global_step": 87703, "epoch": 724} {"train_loss": -34.219173431396484, "global_step": 87704, "epoch": 724} {"train_loss": -34.10714340209961, "global_step": 87705, "epoch": 724} {"train_loss": -34.053993225097656, "global_step": 87706, "epoch": 724} {"train_loss": -34.04227828979492, "global_step": 87707, "epoch": 724} {"train_loss": -33.65299606323242, "global_step": 87708, "epoch": 724} {"train_loss": -32.33795928955078, "global_step": 87709, "epoch": 724} {"train_loss": -34.73872756958008, "global_step": 87710, "epoch": 724} {"train_loss": -34.427886962890625, "global_step": 87711, "epoch": 724} {"train_loss": -34.46953201293945, "global_step": 87712, "epoch": 724} {"train_loss": -34.74066925048828, "global_step": 87713, "epoch": 724} {"train_loss": -34.14157485961914, "global_step": 87714, "epoch": 724} {"train_loss": -34.66388702392578, "global_step": 87715, "epoch": 724} {"train_loss": -35.04275131225586, "global_step": 87716, "epoch": 724} {"train_loss": -33.9150276184082, "global_step": 87717, "epoch": 724} {"train_loss": -35.166961669921875, "global_step": 87718, "epoch": 724} {"train_loss": -35.6138916015625, "global_step": 87719, "epoch": 724} {"train_loss": -35.485198974609375, "global_step": 87720, "epoch": 724} {"train_loss": -34.7717399597168, "global_step": 87721, "epoch": 724} {"train_loss": -35.2825927734375, "global_step": 87722, "epoch": 724} {"train_loss": -35.6087760925293, "global_step": 87723, "epoch": 724} {"train_loss": -35.29073157192262, "global_step": 87724, "epoch": 724, "val_loss": 2697868.75} {"train_loss": -35.67829513549805, "global_step": 87725, "epoch": 725} {"train_loss": -35.37736892700195, "global_step": 87726, "epoch": 725} {"train_loss": -35.7037467956543, "global_step": 87727, "epoch": 725} {"train_loss": -35.82497787475586, "global_step": 87728, "epoch": 725} {"train_loss": -35.65961837768555, "global_step": 87729, "epoch": 725} {"train_loss": -35.96974563598633, "global_step": 87730, "epoch": 725} {"train_loss": -35.55784225463867, "global_step": 87731, "epoch": 725} {"train_loss": -35.803260803222656, "global_step": 87732, "epoch": 725} {"train_loss": -36.39948272705078, "global_step": 87733, "epoch": 725} {"train_loss": -36.083045959472656, "global_step": 87734, "epoch": 725} {"train_loss": -36.62018966674805, "global_step": 87735, "epoch": 725} {"train_loss": -36.13955307006836, "global_step": 87736, "epoch": 725} {"train_loss": -36.32307434082031, "global_step": 87737, "epoch": 725} {"train_loss": -36.04819869995117, "global_step": 87738, "epoch": 725} {"train_loss": -36.250728607177734, "global_step": 87739, "epoch": 725} {"train_loss": -36.519405364990234, "global_step": 87740, "epoch": 725} {"train_loss": -36.374542236328125, "global_step": 87741, "epoch": 725} {"train_loss": -36.547000885009766, "global_step": 87742, "epoch": 725} {"train_loss": -36.89094924926758, "global_step": 87743, "epoch": 725} {"train_loss": -36.511356353759766, "global_step": 87744, "epoch": 725} {"train_loss": -36.51446533203125, "global_step": 87745, "epoch": 725} {"train_loss": -36.878055572509766, "global_step": 87746, "epoch": 725} {"train_loss": -36.946224212646484, "global_step": 87747, "epoch": 725} {"train_loss": -36.9324836730957, "global_step": 87748, "epoch": 725} {"train_loss": -36.99473190307617, "global_step": 87749, "epoch": 725} {"train_loss": -37.281673431396484, "global_step": 87750, "epoch": 725} {"train_loss": -37.059146881103516, "global_step": 87751, "epoch": 725} {"train_loss": -37.04096603393555, "global_step": 87752, "epoch": 725} {"train_loss": -37.16450119018555, "global_step": 87753, "epoch": 725} {"train_loss": -37.2681770324707, "global_step": 87754, "epoch": 725} {"train_loss": -37.21711349487305, "global_step": 87755, "epoch": 725} {"train_loss": -37.087947845458984, "global_step": 87756, "epoch": 725} {"train_loss": -37.398189544677734, "global_step": 87757, "epoch": 725} {"train_loss": -37.21027374267578, "global_step": 87758, "epoch": 725} {"train_loss": -37.78987121582031, "global_step": 87759, "epoch": 725} {"train_loss": -37.45917892456055, "global_step": 87760, "epoch": 725} {"train_loss": -37.48236083984375, "global_step": 87761, "epoch": 725} {"train_loss": -37.55973815917969, "global_step": 87762, "epoch": 725} {"train_loss": -37.18661117553711, "global_step": 87763, "epoch": 725} {"train_loss": -37.59176254272461, "global_step": 87764, "epoch": 725} {"train_loss": -37.63021469116211, "global_step": 87765, "epoch": 725} {"train_loss": -37.87771224975586, "global_step": 87766, "epoch": 725} {"train_loss": -38.05585479736328, "global_step": 87767, "epoch": 725} {"train_loss": -37.876136779785156, "global_step": 87768, "epoch": 725} {"train_loss": -38.102989196777344, "global_step": 87769, "epoch": 725} {"train_loss": -37.53379821777344, "global_step": 87770, "epoch": 725} {"train_loss": -37.94497299194336, "global_step": 87771, "epoch": 725} {"train_loss": -38.13746643066406, "global_step": 87772, "epoch": 725} {"train_loss": -37.9709358215332, "global_step": 87773, "epoch": 725} {"train_loss": -38.151824951171875, "global_step": 87774, "epoch": 725} {"train_loss": -37.72819519042969, "global_step": 87775, "epoch": 725} {"train_loss": -38.265132904052734, "global_step": 87776, "epoch": 725} {"train_loss": -38.135902404785156, "global_step": 87777, "epoch": 725} {"train_loss": -37.92740249633789, "global_step": 87778, "epoch": 725} {"train_loss": -38.03702926635742, "global_step": 87779, "epoch": 725} {"train_loss": -37.52456283569336, "global_step": 87780, "epoch": 725} {"train_loss": -37.989776611328125, "global_step": 87781, "epoch": 725} {"train_loss": -37.53778076171875, "global_step": 87782, "epoch": 725} {"train_loss": -37.3895263671875, "global_step": 87783, "epoch": 725} {"train_loss": -37.6025276184082, "global_step": 87784, "epoch": 725} {"train_loss": -37.14115524291992, "global_step": 87785, "epoch": 725} {"train_loss": -37.58810806274414, "global_step": 87786, "epoch": 725} {"train_loss": -37.61727523803711, "global_step": 87787, "epoch": 725} {"train_loss": -38.65824508666992, "global_step": 87788, "epoch": 725} {"train_loss": -38.59391403198242, "global_step": 87789, "epoch": 725} {"train_loss": -38.72125244140625, "global_step": 87790, "epoch": 725} {"train_loss": -38.48036193847656, "global_step": 87791, "epoch": 725} {"train_loss": -38.61524200439453, "global_step": 87792, "epoch": 725} {"train_loss": -38.19109344482422, "global_step": 87793, "epoch": 725} {"train_loss": -38.360626220703125, "global_step": 87794, "epoch": 725} {"train_loss": -38.10673522949219, "global_step": 87795, "epoch": 725} {"train_loss": -38.33327102661133, "global_step": 87796, "epoch": 725} {"train_loss": -37.60027313232422, "global_step": 87797, "epoch": 725} {"train_loss": -36.19260787963867, "global_step": 87798, "epoch": 725} {"train_loss": -37.381263732910156, "global_step": 87799, "epoch": 725} {"train_loss": -37.493953704833984, "global_step": 87800, "epoch": 725} {"train_loss": -35.98348617553711, "global_step": 87801, "epoch": 725} {"train_loss": -34.73454666137695, "global_step": 87802, "epoch": 725} {"train_loss": -32.18693923950195, "global_step": 87803, "epoch": 725} {"train_loss": -29.778120040893555, "global_step": 87804, "epoch": 725} {"train_loss": -28.083663940429688, "global_step": 87805, "epoch": 725} {"train_loss": -29.953474044799805, "global_step": 87806, "epoch": 725} {"train_loss": -33.62009811401367, "global_step": 87807, "epoch": 725} {"train_loss": -35.377105712890625, "global_step": 87808, "epoch": 725} {"train_loss": -34.48293685913086, "global_step": 87809, "epoch": 725} {"train_loss": -34.9058952331543, "global_step": 87810, "epoch": 725} {"train_loss": -35.720455169677734, "global_step": 87811, "epoch": 725} {"train_loss": -36.87551498413086, "global_step": 87812, "epoch": 725} {"train_loss": -35.7216682434082, "global_step": 87813, "epoch": 725} {"train_loss": -37.2080078125, "global_step": 87814, "epoch": 725} {"train_loss": -35.77970504760742, "global_step": 87815, "epoch": 725} {"train_loss": -37.04248046875, "global_step": 87816, "epoch": 725} {"train_loss": -36.55898666381836, "global_step": 87817, "epoch": 725} {"train_loss": -37.4957160949707, "global_step": 87818, "epoch": 725} {"train_loss": -35.862239837646484, "global_step": 87819, "epoch": 725} {"train_loss": -37.45046615600586, "global_step": 87820, "epoch": 725} {"train_loss": -35.70980453491211, "global_step": 87821, "epoch": 725} {"train_loss": -37.43312072753906, "global_step": 87822, "epoch": 725} {"train_loss": -36.2807731628418, "global_step": 87823, "epoch": 725} {"train_loss": -36.939735412597656, "global_step": 87824, "epoch": 725} {"train_loss": -37.359954833984375, "global_step": 87825, "epoch": 725} {"train_loss": -37.5097541809082, "global_step": 87826, "epoch": 725} {"train_loss": -37.7194709777832, "global_step": 87827, "epoch": 725} {"train_loss": -37.00318145751953, "global_step": 87828, "epoch": 725} {"train_loss": -37.66145706176758, "global_step": 87829, "epoch": 725} {"train_loss": -37.72478485107422, "global_step": 87830, "epoch": 725} {"train_loss": -37.80707931518555, "global_step": 87831, "epoch": 725} {"train_loss": -37.881629943847656, "global_step": 87832, "epoch": 725} {"train_loss": -37.76229476928711, "global_step": 87833, "epoch": 725} {"train_loss": -38.22913360595703, "global_step": 87834, "epoch": 725} {"train_loss": -37.65127944946289, "global_step": 87835, "epoch": 725} {"train_loss": -37.67163848876953, "global_step": 87836, "epoch": 725} {"train_loss": -37.923622131347656, "global_step": 87837, "epoch": 725} {"train_loss": -37.9752311706543, "global_step": 87838, "epoch": 725} {"train_loss": -37.53873062133789, "global_step": 87839, "epoch": 725} {"train_loss": -37.24650192260742, "global_step": 87840, "epoch": 725} {"train_loss": -38.4311637878418, "global_step": 87841, "epoch": 725} {"train_loss": -38.30768585205078, "global_step": 87842, "epoch": 725} {"train_loss": -38.1135368347168, "global_step": 87843, "epoch": 725} {"train_loss": -37.570919036865234, "global_step": 87844, "epoch": 725} {"train_loss": -36.904246306616415, "global_step": 87845, "epoch": 725, "val_loss": 2641008.75} {"train_loss": -38.73750686645508, "global_step": 87846, "epoch": 726} {"train_loss": -38.331966400146484, "global_step": 87847, "epoch": 726} {"train_loss": -38.23907470703125, "global_step": 87848, "epoch": 726} {"train_loss": -38.61450958251953, "global_step": 87849, "epoch": 726} {"train_loss": -38.37266159057617, "global_step": 87850, "epoch": 726} {"train_loss": -38.8404426574707, "global_step": 87851, "epoch": 726} {"train_loss": -38.53249740600586, "global_step": 87852, "epoch": 726} {"train_loss": -38.692256927490234, "global_step": 87853, "epoch": 726} {"train_loss": -38.40418243408203, "global_step": 87854, "epoch": 726} {"train_loss": -38.711421966552734, "global_step": 87855, "epoch": 726} {"train_loss": -38.770503997802734, "global_step": 87856, "epoch": 726} {"train_loss": -38.38759994506836, "global_step": 87857, "epoch": 726} {"train_loss": -38.34590530395508, "global_step": 87858, "epoch": 726} {"train_loss": -38.30718231201172, "global_step": 87859, "epoch": 726} {"train_loss": -38.69977569580078, "global_step": 87860, "epoch": 726} {"train_loss": -38.49409866333008, "global_step": 87861, "epoch": 726} {"train_loss": -38.984493255615234, "global_step": 87862, "epoch": 726} {"train_loss": -39.114959716796875, "global_step": 87863, "epoch": 726} {"train_loss": -38.42988967895508, "global_step": 87864, "epoch": 726} {"train_loss": -38.369754791259766, "global_step": 87865, "epoch": 726} {"train_loss": -37.81816482543945, "global_step": 87866, "epoch": 726} {"train_loss": -37.55086898803711, "global_step": 87867, "epoch": 726} {"train_loss": -34.29598617553711, "global_step": 87868, "epoch": 726} {"train_loss": -21.352697372436523, "global_step": 87869, "epoch": 726} {"train_loss": -5.7519001960754395, "global_step": 87870, "epoch": 726} {"train_loss": -4.13795280456543, "global_step": 87871, "epoch": 726} {"train_loss": -37.6843376159668, "global_step": 87872, "epoch": 726} {"train_loss": -16.261615753173828, "global_step": 87873, "epoch": 726} {"train_loss": -27.207910537719727, "global_step": 87874, "epoch": 726} {"train_loss": -28.99018669128418, "global_step": 87875, "epoch": 726} {"train_loss": -35.08723068237305, "global_step": 87876, "epoch": 726} {"train_loss": -27.367826461791992, "global_step": 87877, "epoch": 726} {"train_loss": -36.57701110839844, "global_step": 87878, "epoch": 726} {"train_loss": -30.772363662719727, "global_step": 87879, "epoch": 726} {"train_loss": -34.24752426147461, "global_step": 87880, "epoch": 726} {"train_loss": -35.12721633911133, "global_step": 87881, "epoch": 726} {"train_loss": -32.7265510559082, "global_step": 87882, "epoch": 726} {"train_loss": -33.85430908203125, "global_step": 87883, "epoch": 726} {"train_loss": -36.60780715942383, "global_step": 87884, "epoch": 726} {"train_loss": -33.61133575439453, "global_step": 87885, "epoch": 726} {"train_loss": -35.24032211303711, "global_step": 87886, "epoch": 726} {"train_loss": -36.4501953125, "global_step": 87887, "epoch": 726} {"train_loss": -35.854278564453125, "global_step": 87888, "epoch": 726} {"train_loss": -35.197811126708984, "global_step": 87889, "epoch": 726} {"train_loss": -36.16274642944336, "global_step": 87890, "epoch": 726} {"train_loss": -36.80677795410156, "global_step": 87891, "epoch": 726} {"train_loss": -35.69983673095703, "global_step": 87892, "epoch": 726} {"train_loss": -36.546146392822266, "global_step": 87893, "epoch": 726} {"train_loss": -36.293251037597656, "global_step": 87894, "epoch": 726} {"train_loss": -36.821510314941406, "global_step": 87895, "epoch": 726} {"train_loss": -36.98537063598633, "global_step": 87896, "epoch": 726} {"train_loss": -36.78148651123047, "global_step": 87897, "epoch": 726} {"train_loss": -36.84455108642578, "global_step": 87898, "epoch": 726} {"train_loss": -36.56834030151367, "global_step": 87899, "epoch": 726} {"train_loss": -37.334529876708984, "global_step": 87900, "epoch": 726} {"train_loss": -37.112422943115234, "global_step": 87901, "epoch": 726} {"train_loss": -37.127532958984375, "global_step": 87902, "epoch": 726} {"train_loss": -37.14849853515625, "global_step": 87903, "epoch": 726} {"train_loss": -37.50623321533203, "global_step": 87904, "epoch": 726} {"train_loss": -37.48818588256836, "global_step": 87905, "epoch": 726} {"train_loss": -37.38764572143555, "global_step": 87906, "epoch": 726} {"train_loss": -37.63764190673828, "global_step": 87907, "epoch": 726} {"train_loss": -37.35032272338867, "global_step": 87908, "epoch": 726} {"train_loss": -37.6811637878418, "global_step": 87909, "epoch": 726} {"train_loss": -37.5029182434082, "global_step": 87910, "epoch": 726} {"train_loss": -37.84553146362305, "global_step": 87911, "epoch": 726} {"train_loss": -37.33401107788086, "global_step": 87912, "epoch": 726} {"train_loss": -37.939937591552734, "global_step": 87913, "epoch": 726} {"train_loss": -37.69552230834961, "global_step": 87914, "epoch": 726} {"train_loss": -38.2353630065918, "global_step": 87915, "epoch": 726} {"train_loss": -37.708431243896484, "global_step": 87916, "epoch": 726} {"train_loss": -37.532840728759766, "global_step": 87917, "epoch": 726} {"train_loss": -38.2037353515625, "global_step": 87918, "epoch": 726} {"train_loss": -38.0885009765625, "global_step": 87919, "epoch": 726} {"train_loss": -37.88762283325195, "global_step": 87920, "epoch": 726} {"train_loss": -38.2717399597168, "global_step": 87921, "epoch": 726} {"train_loss": -37.626827239990234, "global_step": 87922, "epoch": 726} {"train_loss": -37.42823028564453, "global_step": 87923, "epoch": 726} {"train_loss": -37.36155700683594, "global_step": 87924, "epoch": 726} {"train_loss": -37.290740966796875, "global_step": 87925, "epoch": 726} {"train_loss": -37.98861312866211, "global_step": 87926, "epoch": 726} {"train_loss": -38.02987289428711, "global_step": 87927, "epoch": 726} {"train_loss": -37.93284225463867, "global_step": 87928, "epoch": 726} {"train_loss": -37.82536697387695, "global_step": 87929, "epoch": 726} {"train_loss": -37.31000518798828, "global_step": 87930, "epoch": 726} {"train_loss": -36.65312576293945, "global_step": 87931, "epoch": 726} {"train_loss": -38.33612060546875, "global_step": 87932, "epoch": 726} {"train_loss": -37.2992057800293, "global_step": 87933, "epoch": 726} {"train_loss": -35.0702018737793, "global_step": 87934, "epoch": 726} {"train_loss": -32.80713653564453, "global_step": 87935, "epoch": 726} {"train_loss": -29.676971435546875, "global_step": 87936, "epoch": 726} {"train_loss": -29.977401733398438, "global_step": 87937, "epoch": 726} {"train_loss": -36.16249465942383, "global_step": 87938, "epoch": 726} {"train_loss": -35.4896125793457, "global_step": 87939, "epoch": 726} {"train_loss": -35.64215850830078, "global_step": 87940, "epoch": 726} {"train_loss": -36.19218063354492, "global_step": 87941, "epoch": 726} {"train_loss": -34.587276458740234, "global_step": 87942, "epoch": 726} {"train_loss": -37.94045639038086, "global_step": 87943, "epoch": 726} {"train_loss": -35.569061279296875, "global_step": 87944, "epoch": 726} {"train_loss": -37.17033004760742, "global_step": 87945, "epoch": 726} {"train_loss": -36.68731689453125, "global_step": 87946, "epoch": 726} {"train_loss": -36.944488525390625, "global_step": 87947, "epoch": 726} {"train_loss": -36.485816955566406, "global_step": 87948, "epoch": 726} {"train_loss": -36.587318420410156, "global_step": 87949, "epoch": 726} {"train_loss": -36.762489318847656, "global_step": 87950, "epoch": 726} {"train_loss": -36.716094970703125, "global_step": 87951, "epoch": 726} {"train_loss": -36.787696838378906, "global_step": 87952, "epoch": 726} {"train_loss": -36.47113800048828, "global_step": 87953, "epoch": 726} {"train_loss": -36.676937103271484, "global_step": 87954, "epoch": 726} {"train_loss": -37.388851165771484, "global_step": 87955, "epoch": 726} {"train_loss": -36.815860748291016, "global_step": 87956, "epoch": 726} {"train_loss": -37.333248138427734, "global_step": 87957, "epoch": 726} {"train_loss": -37.4040412902832, "global_step": 87958, "epoch": 726} {"train_loss": -37.43741989135742, "global_step": 87959, "epoch": 726} {"train_loss": -37.30642318725586, "global_step": 87960, "epoch": 726} {"train_loss": -37.120819091796875, "global_step": 87961, "epoch": 726} {"train_loss": -37.57474899291992, "global_step": 87962, "epoch": 726} {"train_loss": -36.93687438964844, "global_step": 87963, "epoch": 726} {"train_loss": -37.503841400146484, "global_step": 87964, "epoch": 726} {"train_loss": -37.58443069458008, "global_step": 87965, "epoch": 726} {"train_loss": -35.869670682702186, "global_step": 87966, "epoch": 726, "val_loss": 2633664.0} {"train_loss": -37.20331954956055, "global_step": 87967, "epoch": 727} {"train_loss": -37.736244201660156, "global_step": 87968, "epoch": 727} {"train_loss": -37.68122100830078, "global_step": 87969, "epoch": 727} {"train_loss": -37.86790084838867, "global_step": 87970, "epoch": 727} {"train_loss": -38.27922058105469, "global_step": 87971, "epoch": 727} {"train_loss": -37.848182678222656, "global_step": 87972, "epoch": 727} {"train_loss": -38.06424331665039, "global_step": 87973, "epoch": 727} {"train_loss": -38.15803146362305, "global_step": 87974, "epoch": 727} {"train_loss": -37.64667510986328, "global_step": 87975, "epoch": 727} {"train_loss": -37.991844177246094, "global_step": 87976, "epoch": 727} {"train_loss": -37.345680236816406, "global_step": 87977, "epoch": 727} {"train_loss": -35.854156494140625, "global_step": 87978, "epoch": 727} {"train_loss": -29.766447067260742, "global_step": 87979, "epoch": 727} {"train_loss": -14.018816947937012, "global_step": 87980, "epoch": 727} {"train_loss": 16.001953125, "global_step": 87981, "epoch": 727} {"train_loss": -21.62729835510254, "global_step": 87982, "epoch": 727} {"train_loss": -31.784894943237305, "global_step": 87983, "epoch": 727} {"train_loss": -23.127939224243164, "global_step": 87984, "epoch": 727} {"train_loss": -33.30459976196289, "global_step": 87985, "epoch": 727} {"train_loss": -30.772024154663086, "global_step": 87986, "epoch": 727} {"train_loss": -29.424579620361328, "global_step": 87987, "epoch": 727} {"train_loss": -35.44355392456055, "global_step": 87988, "epoch": 727} {"train_loss": -31.128498077392578, "global_step": 87989, "epoch": 727} {"train_loss": -33.2811393737793, "global_step": 87990, "epoch": 727} {"train_loss": -36.321929931640625, "global_step": 87991, "epoch": 727} {"train_loss": -32.4464111328125, "global_step": 87992, "epoch": 727} {"train_loss": -34.454017639160156, "global_step": 87993, "epoch": 727} {"train_loss": -35.870697021484375, "global_step": 87994, "epoch": 727} {"train_loss": -35.7872200012207, "global_step": 87995, "epoch": 727} {"train_loss": -33.9813117980957, "global_step": 87996, "epoch": 727} {"train_loss": -35.59126663208008, "global_step": 87997, "epoch": 727} {"train_loss": -36.65066909790039, "global_step": 87998, "epoch": 727} {"train_loss": -35.180355072021484, "global_step": 87999, "epoch": 727} {"train_loss": -35.47092819213867, "global_step": 88000, "epoch": 727} {"train_loss": -35.910888671875, "global_step": 88001, "epoch": 727} {"train_loss": -36.40333938598633, "global_step": 88002, "epoch": 727} {"train_loss": -36.22297286987305, "global_step": 88003, "epoch": 727} {"train_loss": -36.457210540771484, "global_step": 88004, "epoch": 727} {"train_loss": -36.114192962646484, "global_step": 88005, "epoch": 727} {"train_loss": -36.44619369506836, "global_step": 88006, "epoch": 727} {"train_loss": -36.94989013671875, "global_step": 88007, "epoch": 727} {"train_loss": -36.310401916503906, "global_step": 88008, "epoch": 727} {"train_loss": -36.40797805786133, "global_step": 88009, "epoch": 727} {"train_loss": -36.89357376098633, "global_step": 88010, "epoch": 727} {"train_loss": -36.69124221801758, "global_step": 88011, "epoch": 727} {"train_loss": -36.82215118408203, "global_step": 88012, "epoch": 727} {"train_loss": -36.90998077392578, "global_step": 88013, "epoch": 727} {"train_loss": -37.17916488647461, "global_step": 88014, "epoch": 727} {"train_loss": -37.090084075927734, "global_step": 88015, "epoch": 727} {"train_loss": -37.36176300048828, "global_step": 88016, "epoch": 727} {"train_loss": -37.33584213256836, "global_step": 88017, "epoch": 727} {"train_loss": -37.67020034790039, "global_step": 88018, "epoch": 727} {"train_loss": -37.32089614868164, "global_step": 88019, "epoch": 727} {"train_loss": -37.360618591308594, "global_step": 88020, "epoch": 727} {"train_loss": -37.76015090942383, "global_step": 88021, "epoch": 727} {"train_loss": -37.423561096191406, "global_step": 88022, "epoch": 727} {"train_loss": -37.479522705078125, "global_step": 88023, "epoch": 727} {"train_loss": -37.75108337402344, "global_step": 88024, "epoch": 727} {"train_loss": -37.85446548461914, "global_step": 88025, "epoch": 727} {"train_loss": -37.37380599975586, "global_step": 88026, "epoch": 727} {"train_loss": -37.756446838378906, "global_step": 88027, "epoch": 727} {"train_loss": -37.393959045410156, "global_step": 88028, "epoch": 727} {"train_loss": -37.78102493286133, "global_step": 88029, "epoch": 727} {"train_loss": -37.41184616088867, "global_step": 88030, "epoch": 727} {"train_loss": -37.65314865112305, "global_step": 88031, "epoch": 727} {"train_loss": -37.9111442565918, "global_step": 88032, "epoch": 727} {"train_loss": -37.64289474487305, "global_step": 88033, "epoch": 727} {"train_loss": -37.82265090942383, "global_step": 88034, "epoch": 727} {"train_loss": -37.58051681518555, "global_step": 88035, "epoch": 727} {"train_loss": -38.25925827026367, "global_step": 88036, "epoch": 727} {"train_loss": -38.51400375366211, "global_step": 88037, "epoch": 727} {"train_loss": -37.895626068115234, "global_step": 88038, "epoch": 727} {"train_loss": -38.02771759033203, "global_step": 88039, "epoch": 727} {"train_loss": -38.3221549987793, "global_step": 88040, "epoch": 727} {"train_loss": -38.37190628051758, "global_step": 88041, "epoch": 727} {"train_loss": -37.623756408691406, "global_step": 88042, "epoch": 727} {"train_loss": -37.88566207885742, "global_step": 88043, "epoch": 727} {"train_loss": -37.58294677734375, "global_step": 88044, "epoch": 727} {"train_loss": -37.35667037963867, "global_step": 88045, "epoch": 727} {"train_loss": -37.714012145996094, "global_step": 88046, "epoch": 727} {"train_loss": -38.11140060424805, "global_step": 88047, "epoch": 727} {"train_loss": -37.96603775024414, "global_step": 88048, "epoch": 727} {"train_loss": -38.227386474609375, "global_step": 88049, "epoch": 727} {"train_loss": -38.0267219543457, "global_step": 88050, "epoch": 727} {"train_loss": -37.91437911987305, "global_step": 88051, "epoch": 727} {"train_loss": -37.462646484375, "global_step": 88052, "epoch": 727} {"train_loss": -37.30927276611328, "global_step": 88053, "epoch": 727} {"train_loss": -37.479061126708984, "global_step": 88054, "epoch": 727} {"train_loss": -36.25638961791992, "global_step": 88055, "epoch": 727} {"train_loss": -36.335872650146484, "global_step": 88056, "epoch": 727} {"train_loss": -36.13929748535156, "global_step": 88057, "epoch": 727} {"train_loss": -37.013771057128906, "global_step": 88058, "epoch": 727} {"train_loss": -36.765968322753906, "global_step": 88059, "epoch": 727} {"train_loss": -37.537479400634766, "global_step": 88060, "epoch": 727} {"train_loss": -37.5262565612793, "global_step": 88061, "epoch": 727} {"train_loss": -37.334877014160156, "global_step": 88062, "epoch": 727} {"train_loss": -37.44740676879883, "global_step": 88063, "epoch": 727} {"train_loss": -37.39201736450195, "global_step": 88064, "epoch": 727} {"train_loss": -37.443538665771484, "global_step": 88065, "epoch": 727} {"train_loss": -35.45010757446289, "global_step": 88066, "epoch": 727} {"train_loss": -34.11467361450195, "global_step": 88067, "epoch": 727} {"train_loss": -36.810401916503906, "global_step": 88068, "epoch": 727} {"train_loss": -36.48884582519531, "global_step": 88069, "epoch": 727} {"train_loss": -36.77042770385742, "global_step": 88070, "epoch": 727} {"train_loss": -37.447505950927734, "global_step": 88071, "epoch": 727} {"train_loss": -36.264530181884766, "global_step": 88072, "epoch": 727} {"train_loss": -35.472389221191406, "global_step": 88073, "epoch": 727} {"train_loss": -36.75033950805664, "global_step": 88074, "epoch": 727} {"train_loss": -37.360069274902344, "global_step": 88075, "epoch": 727} {"train_loss": -36.68648910522461, "global_step": 88076, "epoch": 727} {"train_loss": -37.32406997680664, "global_step": 88077, "epoch": 727} {"train_loss": -37.47053146362305, "global_step": 88078, "epoch": 727} {"train_loss": -36.97407150268555, "global_step": 88079, "epoch": 727} {"train_loss": -37.19585418701172, "global_step": 88080, "epoch": 727} {"train_loss": -38.19293212890625, "global_step": 88081, "epoch": 727} {"train_loss": -37.2578125, "global_step": 88082, "epoch": 727} {"train_loss": -38.16752624511719, "global_step": 88083, "epoch": 727} {"train_loss": -37.1949348449707, "global_step": 88084, "epoch": 727} {"train_loss": -36.964599609375, "global_step": 88085, "epoch": 727} {"train_loss": -37.58142852783203, "global_step": 88086, "epoch": 727} {"train_loss": -35.86660704336876, "global_step": 88087, "epoch": 727, "val_loss": 2642296.25} {"train_loss": -37.6496696472168, "global_step": 88088, "epoch": 728} {"train_loss": -37.58882141113281, "global_step": 88089, "epoch": 728} {"train_loss": -37.43430709838867, "global_step": 88090, "epoch": 728} {"train_loss": -37.60970687866211, "global_step": 88091, "epoch": 728} {"train_loss": -36.821231842041016, "global_step": 88092, "epoch": 728} {"train_loss": -37.8585090637207, "global_step": 88093, "epoch": 728} {"train_loss": -37.79500198364258, "global_step": 88094, "epoch": 728} {"train_loss": -37.91630935668945, "global_step": 88095, "epoch": 728} {"train_loss": -37.59157943725586, "global_step": 88096, "epoch": 728} {"train_loss": -37.176963806152344, "global_step": 88097, "epoch": 728} {"train_loss": -37.076210021972656, "global_step": 88098, "epoch": 728} {"train_loss": -37.43864440917969, "global_step": 88099, "epoch": 728} {"train_loss": -37.8239860534668, "global_step": 88100, "epoch": 728} {"train_loss": -38.080562591552734, "global_step": 88101, "epoch": 728} {"train_loss": -38.180755615234375, "global_step": 88102, "epoch": 728} {"train_loss": -37.080108642578125, "global_step": 88103, "epoch": 728} {"train_loss": -37.06576156616211, "global_step": 88104, "epoch": 728} {"train_loss": -37.46683120727539, "global_step": 88105, "epoch": 728} {"train_loss": -37.92905807495117, "global_step": 88106, "epoch": 728} {"train_loss": -37.856441497802734, "global_step": 88107, "epoch": 728} {"train_loss": -37.70041275024414, "global_step": 88108, "epoch": 728} {"train_loss": -37.095619201660156, "global_step": 88109, "epoch": 728} {"train_loss": -37.58170700073242, "global_step": 88110, "epoch": 728} {"train_loss": -37.55317687988281, "global_step": 88111, "epoch": 728} {"train_loss": -36.98134994506836, "global_step": 88112, "epoch": 728} {"train_loss": -37.942317962646484, "global_step": 88113, "epoch": 728} {"train_loss": -37.767486572265625, "global_step": 88114, "epoch": 728} {"train_loss": -38.374122619628906, "global_step": 88115, "epoch": 728} {"train_loss": -38.046539306640625, "global_step": 88116, "epoch": 728} {"train_loss": -38.04916000366211, "global_step": 88117, "epoch": 728} {"train_loss": -38.07408905029297, "global_step": 88118, "epoch": 728} {"train_loss": -38.24289321899414, "global_step": 88119, "epoch": 728} {"train_loss": -38.291934967041016, "global_step": 88120, "epoch": 728} {"train_loss": -38.24706268310547, "global_step": 88121, "epoch": 728} {"train_loss": -38.097755432128906, "global_step": 88122, "epoch": 728} {"train_loss": -38.00478744506836, "global_step": 88123, "epoch": 728} {"train_loss": -37.155513763427734, "global_step": 88124, "epoch": 728} {"train_loss": -38.31565475463867, "global_step": 88125, "epoch": 728} {"train_loss": -38.62012481689453, "global_step": 88126, "epoch": 728} {"train_loss": -38.62458038330078, "global_step": 88127, "epoch": 728} {"train_loss": -38.1202507019043, "global_step": 88128, "epoch": 728} {"train_loss": -38.17909622192383, "global_step": 88129, "epoch": 728} {"train_loss": -37.654727935791016, "global_step": 88130, "epoch": 728} {"train_loss": -37.06937026977539, "global_step": 88131, "epoch": 728} {"train_loss": -37.2400016784668, "global_step": 88132, "epoch": 728} {"train_loss": -36.539344787597656, "global_step": 88133, "epoch": 728} {"train_loss": -36.65071487426758, "global_step": 88134, "epoch": 728} {"train_loss": -34.86891555786133, "global_step": 88135, "epoch": 728} {"train_loss": -33.13668441772461, "global_step": 88136, "epoch": 728} {"train_loss": -34.433433532714844, "global_step": 88137, "epoch": 728} {"train_loss": -35.66489791870117, "global_step": 88138, "epoch": 728} {"train_loss": -36.80214309692383, "global_step": 88139, "epoch": 728} {"train_loss": -37.43500900268555, "global_step": 88140, "epoch": 728} {"train_loss": -35.34959411621094, "global_step": 88141, "epoch": 728} {"train_loss": -33.897483825683594, "global_step": 88142, "epoch": 728} {"train_loss": -34.92594909667969, "global_step": 88143, "epoch": 728} {"train_loss": -37.096073150634766, "global_step": 88144, "epoch": 728} {"train_loss": -35.953548431396484, "global_step": 88145, "epoch": 728} {"train_loss": -36.01415252685547, "global_step": 88146, "epoch": 728} {"train_loss": -37.257545471191406, "global_step": 88147, "epoch": 728} {"train_loss": -36.182186126708984, "global_step": 88148, "epoch": 728} {"train_loss": -36.00221633911133, "global_step": 88149, "epoch": 728} {"train_loss": -37.37263870239258, "global_step": 88150, "epoch": 728} {"train_loss": -37.15354537963867, "global_step": 88151, "epoch": 728} {"train_loss": -37.242774963378906, "global_step": 88152, "epoch": 728} {"train_loss": -36.84521484375, "global_step": 88153, "epoch": 728} {"train_loss": -36.687686920166016, "global_step": 88154, "epoch": 728} {"train_loss": -36.329524993896484, "global_step": 88155, "epoch": 728} {"train_loss": -36.1504020690918, "global_step": 88156, "epoch": 728} {"train_loss": -35.97842025756836, "global_step": 88157, "epoch": 728} {"train_loss": -36.6530876159668, "global_step": 88158, "epoch": 728} {"train_loss": -37.356788635253906, "global_step": 88159, "epoch": 728} {"train_loss": -37.21121597290039, "global_step": 88160, "epoch": 728} {"train_loss": -37.58533477783203, "global_step": 88161, "epoch": 728} {"train_loss": -36.55601119995117, "global_step": 88162, "epoch": 728} {"train_loss": -37.2025146484375, "global_step": 88163, "epoch": 728} {"train_loss": -37.01528549194336, "global_step": 88164, "epoch": 728} {"train_loss": -36.95598602294922, "global_step": 88165, "epoch": 728} {"train_loss": -37.71615982055664, "global_step": 88166, "epoch": 728} {"train_loss": -37.00516891479492, "global_step": 88167, "epoch": 728} {"train_loss": -38.009578704833984, "global_step": 88168, "epoch": 728} {"train_loss": -37.608306884765625, "global_step": 88169, "epoch": 728} {"train_loss": -37.86800765991211, "global_step": 88170, "epoch": 728} {"train_loss": -37.34150695800781, "global_step": 88171, "epoch": 728} {"train_loss": -32.163368225097656, "global_step": 88172, "epoch": 728} {"train_loss": -37.7177848815918, "global_step": 88173, "epoch": 728} {"train_loss": -37.348880767822266, "global_step": 88174, "epoch": 728} {"train_loss": -37.56709671020508, "global_step": 88175, "epoch": 728} {"train_loss": -37.56605911254883, "global_step": 88176, "epoch": 728} {"train_loss": -37.512908935546875, "global_step": 88177, "epoch": 728} {"train_loss": -37.4566650390625, "global_step": 88178, "epoch": 728} {"train_loss": -37.49284744262695, "global_step": 88179, "epoch": 728} {"train_loss": -37.488525390625, "global_step": 88180, "epoch": 728} {"train_loss": -37.68809127807617, "global_step": 88181, "epoch": 728} {"train_loss": -37.79214859008789, "global_step": 88182, "epoch": 728} {"train_loss": -37.1494255065918, "global_step": 88183, "epoch": 728} {"train_loss": -37.40553283691406, "global_step": 88184, "epoch": 728} {"train_loss": -37.33165740966797, "global_step": 88185, "epoch": 728} {"train_loss": -37.26974105834961, "global_step": 88186, "epoch": 728} {"train_loss": -37.2254753112793, "global_step": 88187, "epoch": 728} {"train_loss": -37.279537200927734, "global_step": 88188, "epoch": 728} {"train_loss": -38.061134338378906, "global_step": 88189, "epoch": 728} {"train_loss": -37.945472717285156, "global_step": 88190, "epoch": 728} {"train_loss": -34.89434814453125, "global_step": 88191, "epoch": 728} {"train_loss": -37.82008361816406, "global_step": 88192, "epoch": 728} {"train_loss": -37.89306640625, "global_step": 88193, "epoch": 728} {"train_loss": -38.26912307739258, "global_step": 88194, "epoch": 728} {"train_loss": -37.500328063964844, "global_step": 88195, "epoch": 728} {"train_loss": -37.93937301635742, "global_step": 88196, "epoch": 728} {"train_loss": -38.28347396850586, "global_step": 88197, "epoch": 728} {"train_loss": -37.9522590637207, "global_step": 88198, "epoch": 728} {"train_loss": -37.475128173828125, "global_step": 88199, "epoch": 728} {"train_loss": -38.04948043823242, "global_step": 88200, "epoch": 728} {"train_loss": -37.11552810668945, "global_step": 88201, "epoch": 728} {"train_loss": -37.94322204589844, "global_step": 88202, "epoch": 728} {"train_loss": -38.635684967041016, "global_step": 88203, "epoch": 728} {"train_loss": -37.9621696472168, "global_step": 88204, "epoch": 728} {"train_loss": -35.36564254760742, "global_step": 88205, "epoch": 728} {"train_loss": -37.0272102355957, "global_step": 88206, "epoch": 728} {"train_loss": -37.32072448730469, "global_step": 88207, "epoch": 728} {"train_loss": -37.23472787526028, "global_step": 88208, "epoch": 728, "val_loss": 2478735.0} {"train_loss": -36.22207260131836, "global_step": 88209, "epoch": 729} {"train_loss": -37.49418258666992, "global_step": 88210, "epoch": 729} {"train_loss": -37.73696517944336, "global_step": 88211, "epoch": 729} {"train_loss": -36.789058685302734, "global_step": 88212, "epoch": 729} {"train_loss": -37.54362487792969, "global_step": 88213, "epoch": 729} {"train_loss": -37.75450134277344, "global_step": 88214, "epoch": 729} {"train_loss": 1.1122779846191406, "global_step": 88215, "epoch": 729} {"train_loss": -16.449161529541016, "global_step": 88216, "epoch": 729} {"train_loss": -22.85892677307129, "global_step": 88217, "epoch": 729} {"train_loss": -26.15052604675293, "global_step": 88218, "epoch": 729} {"train_loss": -32.08218765258789, "global_step": 88219, "epoch": 729} {"train_loss": -28.062854766845703, "global_step": 88220, "epoch": 729} {"train_loss": -23.649717330932617, "global_step": 88221, "epoch": 729} {"train_loss": -26.891510009765625, "global_step": 88222, "epoch": 729} {"train_loss": -30.65399169921875, "global_step": 88223, "epoch": 729} {"train_loss": -24.886951446533203, "global_step": 88224, "epoch": 729} {"train_loss": -30.423994064331055, "global_step": 88225, "epoch": 729} {"train_loss": -32.17940902709961, "global_step": 88226, "epoch": 729} {"train_loss": -34.54310607910156, "global_step": 88227, "epoch": 729} {"train_loss": -31.354825973510742, "global_step": 88228, "epoch": 729} {"train_loss": -29.843433380126953, "global_step": 88229, "epoch": 729} {"train_loss": -31.377960205078125, "global_step": 88230, "epoch": 729} {"train_loss": -30.634695053100586, "global_step": 88231, "epoch": 729} {"train_loss": -31.8817195892334, "global_step": 88232, "epoch": 729} {"train_loss": -31.715417861938477, "global_step": 88233, "epoch": 729} {"train_loss": -33.91095733642578, "global_step": 88234, "epoch": 729} {"train_loss": -34.4293327331543, "global_step": 88235, "epoch": 729} {"train_loss": -33.12789535522461, "global_step": 88236, "epoch": 729} {"train_loss": -32.8160285949707, "global_step": 88237, "epoch": 729} {"train_loss": -30.697004318237305, "global_step": 88238, "epoch": 729} {"train_loss": -32.985984802246094, "global_step": 88239, "epoch": 729} {"train_loss": -34.64560317993164, "global_step": 88240, "epoch": 729} {"train_loss": -34.515987396240234, "global_step": 88241, "epoch": 729} {"train_loss": -33.31206512451172, "global_step": 88242, "epoch": 729} {"train_loss": -34.55439758300781, "global_step": 88243, "epoch": 729} {"train_loss": -35.03597640991211, "global_step": 88244, "epoch": 729} {"train_loss": -34.3186149597168, "global_step": 88245, "epoch": 729} {"train_loss": -34.94875717163086, "global_step": 88246, "epoch": 729} {"train_loss": -34.2016716003418, "global_step": 88247, "epoch": 729} {"train_loss": -35.43269729614258, "global_step": 88248, "epoch": 729} {"train_loss": -34.53941345214844, "global_step": 88249, "epoch": 729} {"train_loss": -34.87953567504883, "global_step": 88250, "epoch": 729} {"train_loss": -34.47579574584961, "global_step": 88251, "epoch": 729} {"train_loss": -35.18852615356445, "global_step": 88252, "epoch": 729} {"train_loss": -34.91315841674805, "global_step": 88253, "epoch": 729} {"train_loss": -35.333003997802734, "global_step": 88254, "epoch": 729} {"train_loss": -35.31390380859375, "global_step": 88255, "epoch": 729} {"train_loss": -34.99528121948242, "global_step": 88256, "epoch": 729} {"train_loss": -35.06663131713867, "global_step": 88257, "epoch": 729} {"train_loss": -35.43997573852539, "global_step": 88258, "epoch": 729} {"train_loss": -35.70698547363281, "global_step": 88259, "epoch": 729} {"train_loss": -35.59059143066406, "global_step": 88260, "epoch": 729} {"train_loss": -35.37459945678711, "global_step": 88261, "epoch": 729} {"train_loss": -36.1125602722168, "global_step": 88262, "epoch": 729} {"train_loss": -35.99073028564453, "global_step": 88263, "epoch": 729} {"train_loss": -35.981117248535156, "global_step": 88264, "epoch": 729} {"train_loss": -35.61970520019531, "global_step": 88265, "epoch": 729} {"train_loss": -35.75339889526367, "global_step": 88266, "epoch": 729} {"train_loss": -35.86030197143555, "global_step": 88267, "epoch": 729} {"train_loss": -35.76531982421875, "global_step": 88268, "epoch": 729} {"train_loss": -36.04691696166992, "global_step": 88269, "epoch": 729} {"train_loss": -35.69599151611328, "global_step": 88270, "epoch": 729} {"train_loss": -35.73481369018555, "global_step": 88271, "epoch": 729} {"train_loss": -36.076324462890625, "global_step": 88272, "epoch": 729} {"train_loss": -35.89414596557617, "global_step": 88273, "epoch": 729} {"train_loss": -36.22549819946289, "global_step": 88274, "epoch": 729} {"train_loss": -36.35688400268555, "global_step": 88275, "epoch": 729} {"train_loss": -36.3403205871582, "global_step": 88276, "epoch": 729} {"train_loss": -36.62705612182617, "global_step": 88277, "epoch": 729} {"train_loss": -36.2015495300293, "global_step": 88278, "epoch": 729} {"train_loss": -36.3559455871582, "global_step": 88279, "epoch": 729} {"train_loss": -36.79878616333008, "global_step": 88280, "epoch": 729} {"train_loss": -36.74473571777344, "global_step": 88281, "epoch": 729} {"train_loss": -36.90938186645508, "global_step": 88282, "epoch": 729} {"train_loss": -35.92997360229492, "global_step": 88283, "epoch": 729} {"train_loss": -36.60334014892578, "global_step": 88284, "epoch": 729} {"train_loss": -37.52251052856445, "global_step": 88285, "epoch": 729} {"train_loss": -36.844566345214844, "global_step": 88286, "epoch": 729} {"train_loss": -37.053218841552734, "global_step": 88287, "epoch": 729} {"train_loss": -36.93519973754883, "global_step": 88288, "epoch": 729} {"train_loss": -36.80940628051758, "global_step": 88289, "epoch": 729} {"train_loss": -36.982757568359375, "global_step": 88290, "epoch": 729} {"train_loss": -36.670860290527344, "global_step": 88291, "epoch": 729} {"train_loss": -37.16379165649414, "global_step": 88292, "epoch": 729} {"train_loss": -36.88301086425781, "global_step": 88293, "epoch": 729} {"train_loss": -37.50258255004883, "global_step": 88294, "epoch": 729} {"train_loss": -37.2524299621582, "global_step": 88295, "epoch": 729} {"train_loss": -36.30744552612305, "global_step": 88296, "epoch": 729} {"train_loss": -37.167781829833984, "global_step": 88297, "epoch": 729} {"train_loss": -37.233314514160156, "global_step": 88298, "epoch": 729} {"train_loss": -37.19121551513672, "global_step": 88299, "epoch": 729} {"train_loss": -36.128047943115234, "global_step": 88300, "epoch": 729} {"train_loss": -37.38332748413086, "global_step": 88301, "epoch": 729} {"train_loss": -37.284732818603516, "global_step": 88302, "epoch": 729} {"train_loss": -37.18198776245117, "global_step": 88303, "epoch": 729} {"train_loss": -36.5440788269043, "global_step": 88304, "epoch": 729} {"train_loss": -36.19132995605469, "global_step": 88305, "epoch": 729} {"train_loss": -35.71127700805664, "global_step": 88306, "epoch": 729} {"train_loss": -34.099708557128906, "global_step": 88307, "epoch": 729} {"train_loss": -27.905094146728516, "global_step": 88308, "epoch": 729} {"train_loss": -24.502389907836914, "global_step": 88309, "epoch": 729} {"train_loss": -33.26261520385742, "global_step": 88310, "epoch": 729} {"train_loss": -36.73586654663086, "global_step": 88311, "epoch": 729} {"train_loss": -32.02737045288086, "global_step": 88312, "epoch": 729} {"train_loss": -35.46726608276367, "global_step": 88313, "epoch": 729} {"train_loss": -36.20967483520508, "global_step": 88314, "epoch": 729} {"train_loss": -34.29741668701172, "global_step": 88315, "epoch": 729} {"train_loss": -36.560977935791016, "global_step": 88316, "epoch": 729} {"train_loss": -34.941162109375, "global_step": 88317, "epoch": 729} {"train_loss": -36.88896560668945, "global_step": 88318, "epoch": 729} {"train_loss": -36.1881217956543, "global_step": 88319, "epoch": 729} {"train_loss": -36.5802001953125, "global_step": 88320, "epoch": 729} {"train_loss": -35.917842864990234, "global_step": 88321, "epoch": 729} {"train_loss": -36.93150329589844, "global_step": 88322, "epoch": 729} {"train_loss": -35.59059143066406, "global_step": 88323, "epoch": 729} {"train_loss": -37.09687423706055, "global_step": 88324, "epoch": 729} {"train_loss": -36.39058303833008, "global_step": 88325, "epoch": 729} {"train_loss": -37.34574508666992, "global_step": 88326, "epoch": 729} {"train_loss": -36.40839385986328, "global_step": 88327, "epoch": 729} {"train_loss": -37.213478088378906, "global_step": 88328, "epoch": 729} {"train_loss": -34.31434766911278, "global_step": 88329, "epoch": 729, "val_loss": 2634157.0} {"train_loss": -37.430885314941406, "global_step": 88330, "epoch": 730} {"train_loss": -36.78847122192383, "global_step": 88331, "epoch": 730} {"train_loss": -37.33234405517578, "global_step": 88332, "epoch": 730} {"train_loss": -37.590763092041016, "global_step": 88333, "epoch": 730} {"train_loss": -37.14326095581055, "global_step": 88334, "epoch": 730} {"train_loss": -36.783119201660156, "global_step": 88335, "epoch": 730} {"train_loss": -37.06324005126953, "global_step": 88336, "epoch": 730} {"train_loss": -37.39714431762695, "global_step": 88337, "epoch": 730} {"train_loss": -37.15855026245117, "global_step": 88338, "epoch": 730} {"train_loss": -37.34467697143555, "global_step": 88339, "epoch": 730} {"train_loss": -37.198726654052734, "global_step": 88340, "epoch": 730} {"train_loss": -37.669429779052734, "global_step": 88341, "epoch": 730} {"train_loss": -37.08626937866211, "global_step": 88342, "epoch": 730} {"train_loss": -37.24938201904297, "global_step": 88343, "epoch": 730} {"train_loss": -37.36080551147461, "global_step": 88344, "epoch": 730} {"train_loss": -37.24602508544922, "global_step": 88345, "epoch": 730} {"train_loss": -37.89691925048828, "global_step": 88346, "epoch": 730} {"train_loss": -37.81834030151367, "global_step": 88347, "epoch": 730} {"train_loss": -37.704017639160156, "global_step": 88348, "epoch": 730} {"train_loss": -37.53937911987305, "global_step": 88349, "epoch": 730} {"train_loss": -37.79630661010742, "global_step": 88350, "epoch": 730} {"train_loss": -37.150054931640625, "global_step": 88351, "epoch": 730} {"train_loss": -37.91226577758789, "global_step": 88352, "epoch": 730} {"train_loss": -38.126548767089844, "global_step": 88353, "epoch": 730} {"train_loss": -37.9154167175293, "global_step": 88354, "epoch": 730} {"train_loss": -37.75410079956055, "global_step": 88355, "epoch": 730} {"train_loss": -37.998165130615234, "global_step": 88356, "epoch": 730} {"train_loss": -38.23405838012695, "global_step": 88357, "epoch": 730} {"train_loss": -38.12141799926758, "global_step": 88358, "epoch": 730} {"train_loss": -38.45051574707031, "global_step": 88359, "epoch": 730} {"train_loss": -38.209022521972656, "global_step": 88360, "epoch": 730} {"train_loss": -37.8074951171875, "global_step": 88361, "epoch": 730} {"train_loss": -37.86518478393555, "global_step": 88362, "epoch": 730} {"train_loss": -38.445533752441406, "global_step": 88363, "epoch": 730} {"train_loss": -37.966835021972656, "global_step": 88364, "epoch": 730} {"train_loss": -38.3258056640625, "global_step": 88365, "epoch": 730} {"train_loss": -37.8192253112793, "global_step": 88366, "epoch": 730} {"train_loss": -38.25617599487305, "global_step": 88367, "epoch": 730} {"train_loss": -37.20286560058594, "global_step": 88368, "epoch": 730} {"train_loss": -37.96638870239258, "global_step": 88369, "epoch": 730} {"train_loss": -37.64704513549805, "global_step": 88370, "epoch": 730} {"train_loss": -37.406349182128906, "global_step": 88371, "epoch": 730} {"train_loss": -37.349544525146484, "global_step": 88372, "epoch": 730} {"train_loss": -37.4129524230957, "global_step": 88373, "epoch": 730} {"train_loss": -36.965328216552734, "global_step": 88374, "epoch": 730} {"train_loss": -37.596717834472656, "global_step": 88375, "epoch": 730} {"train_loss": -37.80121994018555, "global_step": 88376, "epoch": 730} {"train_loss": -37.888851165771484, "global_step": 88377, "epoch": 730} {"train_loss": -37.11012649536133, "global_step": 88378, "epoch": 730} {"train_loss": -36.07948303222656, "global_step": 88379, "epoch": 730} {"train_loss": -37.19880294799805, "global_step": 88380, "epoch": 730} {"train_loss": -37.68349075317383, "global_step": 88381, "epoch": 730} {"train_loss": -37.1569938659668, "global_step": 88382, "epoch": 730} {"train_loss": -37.70980453491211, "global_step": 88383, "epoch": 730} {"train_loss": -37.09368896484375, "global_step": 88384, "epoch": 730} {"train_loss": -37.76206588745117, "global_step": 88385, "epoch": 730} {"train_loss": -36.91238021850586, "global_step": 88386, "epoch": 730} {"train_loss": -35.69132614135742, "global_step": 88387, "epoch": 730} {"train_loss": -36.2663688659668, "global_step": 88388, "epoch": 730} {"train_loss": -35.739044189453125, "global_step": 88389, "epoch": 730} {"train_loss": -37.92517852783203, "global_step": 88390, "epoch": 730} {"train_loss": -37.136390686035156, "global_step": 88391, "epoch": 730} {"train_loss": -37.03035354614258, "global_step": 88392, "epoch": 730} {"train_loss": -35.81295394897461, "global_step": 88393, "epoch": 730} {"train_loss": -37.55213165283203, "global_step": 88394, "epoch": 730} {"train_loss": -36.745880126953125, "global_step": 88395, "epoch": 730} {"train_loss": -36.88216781616211, "global_step": 88396, "epoch": 730} {"train_loss": -35.71591567993164, "global_step": 88397, "epoch": 730} {"train_loss": -37.871482849121094, "global_step": 88398, "epoch": 730} {"train_loss": -36.96647262573242, "global_step": 88399, "epoch": 730} {"train_loss": -37.341552734375, "global_step": 88400, "epoch": 730} {"train_loss": -37.22446823120117, "global_step": 88401, "epoch": 730} {"train_loss": -37.746070861816406, "global_step": 88402, "epoch": 730} {"train_loss": -37.51469802856445, "global_step": 88403, "epoch": 730} {"train_loss": -37.95680236816406, "global_step": 88404, "epoch": 730} {"train_loss": -37.411930084228516, "global_step": 88405, "epoch": 730} {"train_loss": -37.98152542114258, "global_step": 88406, "epoch": 730} {"train_loss": -37.82014083862305, "global_step": 88407, "epoch": 730} {"train_loss": -37.111366271972656, "global_step": 88408, "epoch": 730} {"train_loss": -37.5666618347168, "global_step": 88409, "epoch": 730} {"train_loss": -36.8542594909668, "global_step": 88410, "epoch": 730} {"train_loss": -37.66874694824219, "global_step": 88411, "epoch": 730} {"train_loss": -37.6949348449707, "global_step": 88412, "epoch": 730} {"train_loss": -37.850894927978516, "global_step": 88413, "epoch": 730} {"train_loss": -37.6185417175293, "global_step": 88414, "epoch": 730} {"train_loss": -38.426998138427734, "global_step": 88415, "epoch": 730} {"train_loss": -37.31227111816406, "global_step": 88416, "epoch": 730} {"train_loss": -37.7021369934082, "global_step": 88417, "epoch": 730} {"train_loss": -37.735076904296875, "global_step": 88418, "epoch": 730} {"train_loss": -37.8936882019043, "global_step": 88419, "epoch": 730} {"train_loss": -38.357704162597656, "global_step": 88420, "epoch": 730} {"train_loss": -38.24725341796875, "global_step": 88421, "epoch": 730} {"train_loss": -38.09818649291992, "global_step": 88422, "epoch": 730} {"train_loss": -38.07715606689453, "global_step": 88423, "epoch": 730} {"train_loss": -38.20472717285156, "global_step": 88424, "epoch": 730} {"train_loss": -38.122589111328125, "global_step": 88425, "epoch": 730} {"train_loss": -37.996822357177734, "global_step": 88426, "epoch": 730} {"train_loss": -38.05048370361328, "global_step": 88427, "epoch": 730} {"train_loss": -38.561336517333984, "global_step": 88428, "epoch": 730} {"train_loss": -38.53037643432617, "global_step": 88429, "epoch": 730} {"train_loss": -38.37131881713867, "global_step": 88430, "epoch": 730} {"train_loss": -38.31386947631836, "global_step": 88431, "epoch": 730} {"train_loss": -38.15216827392578, "global_step": 88432, "epoch": 730} {"train_loss": -38.03718948364258, "global_step": 88433, "epoch": 730} {"train_loss": -38.631107330322266, "global_step": 88434, "epoch": 730} {"train_loss": -38.42121124267578, "global_step": 88435, "epoch": 730} {"train_loss": -37.94057083129883, "global_step": 88436, "epoch": 730} {"train_loss": -38.60641098022461, "global_step": 88437, "epoch": 730} {"train_loss": -38.56193923950195, "global_step": 88438, "epoch": 730} {"train_loss": -37.752532958984375, "global_step": 88439, "epoch": 730} {"train_loss": -38.87357711791992, "global_step": 88440, "epoch": 730} {"train_loss": -38.502349853515625, "global_step": 88441, "epoch": 730} {"train_loss": -38.706459045410156, "global_step": 88442, "epoch": 730} {"train_loss": -38.15607452392578, "global_step": 88443, "epoch": 730} {"train_loss": -38.3300895690918, "global_step": 88444, "epoch": 730} {"train_loss": -38.79859161376953, "global_step": 88445, "epoch": 730} {"train_loss": -38.06257247924805, "global_step": 88446, "epoch": 730} {"train_loss": -38.186553955078125, "global_step": 88447, "epoch": 730} {"train_loss": -38.88601303100586, "global_step": 88448, "epoch": 730} {"train_loss": -38.59771728515625, "global_step": 88449, "epoch": 730} {"train_loss": -37.685425561321665, "global_step": 88450, "epoch": 730, "val_loss": 2612234.25} {"train_loss": -38.36851119995117, "global_step": 88451, "epoch": 731} {"train_loss": -38.544456481933594, "global_step": 88452, "epoch": 731} {"train_loss": -38.900508880615234, "global_step": 88453, "epoch": 731} {"train_loss": -38.381072998046875, "global_step": 88454, "epoch": 731} {"train_loss": -38.75385665893555, "global_step": 88455, "epoch": 731} {"train_loss": -38.35197830200195, "global_step": 88456, "epoch": 731} {"train_loss": -38.53528594970703, "global_step": 88457, "epoch": 731} {"train_loss": -37.751869201660156, "global_step": 88458, "epoch": 731} {"train_loss": -38.66577911376953, "global_step": 88459, "epoch": 731} {"train_loss": -38.234169006347656, "global_step": 88460, "epoch": 731} {"train_loss": -37.51131057739258, "global_step": 88461, "epoch": 731} {"train_loss": -35.44417190551758, "global_step": 88462, "epoch": 731} {"train_loss": -29.34610366821289, "global_step": 88463, "epoch": 731} {"train_loss": -32.168025970458984, "global_step": 88464, "epoch": 731} {"train_loss": -34.256229400634766, "global_step": 88465, "epoch": 731} {"train_loss": -32.908050537109375, "global_step": 88466, "epoch": 731} {"train_loss": -26.732013702392578, "global_step": 88467, "epoch": 731} {"train_loss": -26.52471923828125, "global_step": 88468, "epoch": 731} {"train_loss": -30.45411491394043, "global_step": 88469, "epoch": 731} {"train_loss": -35.099998474121094, "global_step": 88470, "epoch": 731} {"train_loss": -33.73848342895508, "global_step": 88471, "epoch": 731} {"train_loss": -35.528480529785156, "global_step": 88472, "epoch": 731} {"train_loss": -34.536685943603516, "global_step": 88473, "epoch": 731} {"train_loss": -34.017189025878906, "global_step": 88474, "epoch": 731} {"train_loss": -32.752906799316406, "global_step": 88475, "epoch": 731} {"train_loss": -35.634002685546875, "global_step": 88476, "epoch": 731} {"train_loss": -34.50907516479492, "global_step": 88477, "epoch": 731} {"train_loss": -35.70784378051758, "global_step": 88478, "epoch": 731} {"train_loss": -35.117427825927734, "global_step": 88479, "epoch": 731} {"train_loss": -34.6862678527832, "global_step": 88480, "epoch": 731} {"train_loss": -36.60102081298828, "global_step": 88481, "epoch": 731} {"train_loss": -34.55469512939453, "global_step": 88482, "epoch": 731} {"train_loss": -36.87778854370117, "global_step": 88483, "epoch": 731} {"train_loss": -36.133758544921875, "global_step": 88484, "epoch": 731} {"train_loss": -35.645809173583984, "global_step": 88485, "epoch": 731} {"train_loss": -37.24279022216797, "global_step": 88486, "epoch": 731} {"train_loss": -37.06360626220703, "global_step": 88487, "epoch": 731} {"train_loss": -37.28898239135742, "global_step": 88488, "epoch": 731} {"train_loss": -37.537532806396484, "global_step": 88489, "epoch": 731} {"train_loss": -36.815547943115234, "global_step": 88490, "epoch": 731} {"train_loss": -37.291629791259766, "global_step": 88491, "epoch": 731} {"train_loss": -37.23434066772461, "global_step": 88492, "epoch": 731} {"train_loss": -37.31055450439453, "global_step": 88493, "epoch": 731} {"train_loss": -37.38964080810547, "global_step": 88494, "epoch": 731} {"train_loss": -38.01821517944336, "global_step": 88495, "epoch": 731} {"train_loss": -37.25960922241211, "global_step": 88496, "epoch": 731} {"train_loss": -37.74666213989258, "global_step": 88497, "epoch": 731} {"train_loss": -37.77808380126953, "global_step": 88498, "epoch": 731} {"train_loss": -37.74250030517578, "global_step": 88499, "epoch": 731} {"train_loss": -37.99119186401367, "global_step": 88500, "epoch": 731} {"train_loss": -38.04349899291992, "global_step": 88501, "epoch": 731} {"train_loss": -37.798583984375, "global_step": 88502, "epoch": 731} {"train_loss": -37.72152328491211, "global_step": 88503, "epoch": 731} {"train_loss": -38.08512496948242, "global_step": 88504, "epoch": 731} {"train_loss": -38.37834930419922, "global_step": 88505, "epoch": 731} {"train_loss": -37.74725341796875, "global_step": 88506, "epoch": 731} {"train_loss": -38.34572982788086, "global_step": 88507, "epoch": 731} {"train_loss": -38.258480072021484, "global_step": 88508, "epoch": 731} {"train_loss": -38.00957107543945, "global_step": 88509, "epoch": 731} {"train_loss": -38.55735397338867, "global_step": 88510, "epoch": 731} {"train_loss": -38.42869186401367, "global_step": 88511, "epoch": 731} {"train_loss": -38.08152389526367, "global_step": 88512, "epoch": 731} {"train_loss": -37.94655227661133, "global_step": 88513, "epoch": 731} {"train_loss": -37.9152946472168, "global_step": 88514, "epoch": 731} {"train_loss": -37.44485855102539, "global_step": 88515, "epoch": 731} {"train_loss": -38.46305465698242, "global_step": 88516, "epoch": 731} {"train_loss": -38.45528793334961, "global_step": 88517, "epoch": 731} {"train_loss": -37.5345573425293, "global_step": 88518, "epoch": 731} {"train_loss": -38.10616683959961, "global_step": 88519, "epoch": 731} {"train_loss": -38.28513717651367, "global_step": 88520, "epoch": 731} {"train_loss": -38.04851531982422, "global_step": 88521, "epoch": 731} {"train_loss": -38.02289962768555, "global_step": 88522, "epoch": 731} {"train_loss": -38.50172805786133, "global_step": 88523, "epoch": 731} {"train_loss": -38.55022430419922, "global_step": 88524, "epoch": 731} {"train_loss": -38.675628662109375, "global_step": 88525, "epoch": 731} {"train_loss": -38.365882873535156, "global_step": 88526, "epoch": 731} {"train_loss": -38.46171569824219, "global_step": 88527, "epoch": 731} {"train_loss": -38.481876373291016, "global_step": 88528, "epoch": 731} {"train_loss": -38.10321044921875, "global_step": 88529, "epoch": 731} {"train_loss": -38.852943420410156, "global_step": 88530, "epoch": 731} {"train_loss": -38.3950309753418, "global_step": 88531, "epoch": 731} {"train_loss": -37.41108322143555, "global_step": 88532, "epoch": 731} {"train_loss": -38.18539047241211, "global_step": 88533, "epoch": 731} {"train_loss": -38.47978210449219, "global_step": 88534, "epoch": 731} {"train_loss": -37.27448654174805, "global_step": 88535, "epoch": 731} {"train_loss": -36.81087875366211, "global_step": 88536, "epoch": 731} {"train_loss": -37.68915557861328, "global_step": 88537, "epoch": 731} {"train_loss": -37.92477035522461, "global_step": 88538, "epoch": 731} {"train_loss": -37.61985778808594, "global_step": 88539, "epoch": 731} {"train_loss": -37.297115325927734, "global_step": 88540, "epoch": 731} {"train_loss": -37.87582015991211, "global_step": 88541, "epoch": 731} {"train_loss": -36.387630462646484, "global_step": 88542, "epoch": 731} {"train_loss": -37.18012619018555, "global_step": 88543, "epoch": 731} {"train_loss": -37.427947998046875, "global_step": 88544, "epoch": 731} {"train_loss": -38.03223419189453, "global_step": 88545, "epoch": 731} {"train_loss": -37.21393585205078, "global_step": 88546, "epoch": 731} {"train_loss": -35.72787094116211, "global_step": 88547, "epoch": 731} {"train_loss": -36.7468147277832, "global_step": 88548, "epoch": 731} {"train_loss": -37.01679611206055, "global_step": 88549, "epoch": 731} {"train_loss": -37.3033332824707, "global_step": 88550, "epoch": 731} {"train_loss": -35.191864013671875, "global_step": 88551, "epoch": 731} {"train_loss": -31.345075607299805, "global_step": 88552, "epoch": 731} {"train_loss": -36.12813949584961, "global_step": 88553, "epoch": 731} {"train_loss": -23.324560165405273, "global_step": 88554, "epoch": 731} {"train_loss": -38.00388717651367, "global_step": 88555, "epoch": 731} {"train_loss": -26.997602462768555, "global_step": 88556, "epoch": 731} {"train_loss": -36.908626556396484, "global_step": 88557, "epoch": 731} {"train_loss": -33.13031005859375, "global_step": 88558, "epoch": 731} {"train_loss": -32.51540756225586, "global_step": 88559, "epoch": 731} {"train_loss": -36.54569625854492, "global_step": 88560, "epoch": 731} {"train_loss": -32.323486328125, "global_step": 88561, "epoch": 731} {"train_loss": -34.590179443359375, "global_step": 88562, "epoch": 731} {"train_loss": -35.917266845703125, "global_step": 88563, "epoch": 731} {"train_loss": -36.069637298583984, "global_step": 88564, "epoch": 731} {"train_loss": -35.5833854675293, "global_step": 88565, "epoch": 731} {"train_loss": -35.263580322265625, "global_step": 88566, "epoch": 731} {"train_loss": -37.49009323120117, "global_step": 88567, "epoch": 731} {"train_loss": -36.982357025146484, "global_step": 88568, "epoch": 731} {"train_loss": -35.87941360473633, "global_step": 88569, "epoch": 731} {"train_loss": -35.68941116333008, "global_step": 88570, "epoch": 731} {"train_loss": -36.441530590215, "global_step": 88571, "epoch": 731, "val_loss": 2530199.75} {"train_loss": -37.17122268676758, "global_step": 88572, "epoch": 732} {"train_loss": -36.89075469970703, "global_step": 88573, "epoch": 732} {"train_loss": -36.40688705444336, "global_step": 88574, "epoch": 732} {"train_loss": -36.84507369995117, "global_step": 88575, "epoch": 732} {"train_loss": -37.80034255981445, "global_step": 88576, "epoch": 732} {"train_loss": -38.02840805053711, "global_step": 88577, "epoch": 732} {"train_loss": -37.33251953125, "global_step": 88578, "epoch": 732} {"train_loss": -37.486228942871094, "global_step": 88579, "epoch": 732} {"train_loss": -37.8117790222168, "global_step": 88580, "epoch": 732} {"train_loss": -38.031028747558594, "global_step": 88581, "epoch": 732} {"train_loss": -38.09049987792969, "global_step": 88582, "epoch": 732} {"train_loss": -38.03038787841797, "global_step": 88583, "epoch": 732} {"train_loss": -38.087154388427734, "global_step": 88584, "epoch": 732} {"train_loss": -37.6728401184082, "global_step": 88585, "epoch": 732} {"train_loss": -38.36042785644531, "global_step": 88586, "epoch": 732} {"train_loss": -38.0124397277832, "global_step": 88587, "epoch": 732} {"train_loss": -38.5156135559082, "global_step": 88588, "epoch": 732} {"train_loss": -38.11869430541992, "global_step": 88589, "epoch": 732} {"train_loss": -38.47455978393555, "global_step": 88590, "epoch": 732} {"train_loss": -38.4420166015625, "global_step": 88591, "epoch": 732} {"train_loss": -38.455352783203125, "global_step": 88592, "epoch": 732} {"train_loss": -38.445533752441406, "global_step": 88593, "epoch": 732} {"train_loss": -38.10382843017578, "global_step": 88594, "epoch": 732} {"train_loss": -38.35810089111328, "global_step": 88595, "epoch": 732} {"train_loss": -38.189849853515625, "global_step": 88596, "epoch": 732} {"train_loss": -38.45808410644531, "global_step": 88597, "epoch": 732} {"train_loss": -37.462547302246094, "global_step": 88598, "epoch": 732} {"train_loss": -37.45968246459961, "global_step": 88599, "epoch": 732} {"train_loss": -37.00436019897461, "global_step": 88600, "epoch": 732} {"train_loss": -37.57694625854492, "global_step": 88601, "epoch": 732} {"train_loss": -38.20844268798828, "global_step": 88602, "epoch": 732} {"train_loss": -37.36147689819336, "global_step": 88603, "epoch": 732} {"train_loss": -36.44560241699219, "global_step": 88604, "epoch": 732} {"train_loss": -36.29133987426758, "global_step": 88605, "epoch": 732} {"train_loss": -38.1954345703125, "global_step": 88606, "epoch": 732} {"train_loss": -38.803192138671875, "global_step": 88607, "epoch": 732} {"train_loss": -37.74199295043945, "global_step": 88608, "epoch": 732} {"train_loss": -37.516841888427734, "global_step": 88609, "epoch": 732} {"train_loss": -38.21305465698242, "global_step": 88610, "epoch": 732} {"train_loss": -38.004905700683594, "global_step": 88611, "epoch": 732} {"train_loss": -37.36623001098633, "global_step": 88612, "epoch": 732} {"train_loss": -37.92558288574219, "global_step": 88613, "epoch": 732} {"train_loss": -38.13234329223633, "global_step": 88614, "epoch": 732} {"train_loss": -38.2063102722168, "global_step": 88615, "epoch": 732} {"train_loss": -37.12477493286133, "global_step": 88616, "epoch": 732} {"train_loss": -37.958595275878906, "global_step": 88617, "epoch": 732} {"train_loss": -38.18572235107422, "global_step": 88618, "epoch": 732} {"train_loss": -38.23671340942383, "global_step": 88619, "epoch": 732} {"train_loss": -37.979549407958984, "global_step": 88620, "epoch": 732} {"train_loss": -37.7148551940918, "global_step": 88621, "epoch": 732} {"train_loss": -37.13771438598633, "global_step": 88622, "epoch": 732} {"train_loss": -37.41128158569336, "global_step": 88623, "epoch": 732} {"train_loss": -37.410804748535156, "global_step": 88624, "epoch": 732} {"train_loss": -37.3601188659668, "global_step": 88625, "epoch": 732} {"train_loss": -37.366844177246094, "global_step": 88626, "epoch": 732} {"train_loss": -37.562171936035156, "global_step": 88627, "epoch": 732} {"train_loss": -38.484249114990234, "global_step": 88628, "epoch": 732} {"train_loss": -37.84194564819336, "global_step": 88629, "epoch": 732} {"train_loss": -37.40963363647461, "global_step": 88630, "epoch": 732} {"train_loss": -36.04640579223633, "global_step": 88631, "epoch": 732} {"train_loss": -38.22019577026367, "global_step": 88632, "epoch": 732} {"train_loss": -38.0354118347168, "global_step": 88633, "epoch": 732} {"train_loss": -37.78730392456055, "global_step": 88634, "epoch": 732} {"train_loss": -36.4525260925293, "global_step": 88635, "epoch": 732} {"train_loss": -37.0567512512207, "global_step": 88636, "epoch": 732} {"train_loss": -37.85451889038086, "global_step": 88637, "epoch": 732} {"train_loss": -38.242122650146484, "global_step": 88638, "epoch": 732} {"train_loss": -38.02635192871094, "global_step": 88639, "epoch": 732} {"train_loss": -36.8851432800293, "global_step": 88640, "epoch": 732} {"train_loss": -37.74456024169922, "global_step": 88641, "epoch": 732} {"train_loss": -37.920475006103516, "global_step": 88642, "epoch": 732} {"train_loss": -37.69630813598633, "global_step": 88643, "epoch": 732} {"train_loss": -36.688255310058594, "global_step": 88644, "epoch": 732} {"train_loss": -34.957820892333984, "global_step": 88645, "epoch": 732} {"train_loss": -33.52577209472656, "global_step": 88646, "epoch": 732} {"train_loss": -35.33644104003906, "global_step": 88647, "epoch": 732} {"train_loss": -37.80716323852539, "global_step": 88648, "epoch": 732} {"train_loss": -35.70365905761719, "global_step": 88649, "epoch": 732} {"train_loss": -36.117774963378906, "global_step": 88650, "epoch": 732} {"train_loss": -35.34133529663086, "global_step": 88651, "epoch": 732} {"train_loss": -35.97061538696289, "global_step": 88652, "epoch": 732} {"train_loss": -36.123046875, "global_step": 88653, "epoch": 732} {"train_loss": -34.88644027709961, "global_step": 88654, "epoch": 732} {"train_loss": -36.6662483215332, "global_step": 88655, "epoch": 732} {"train_loss": -37.95440673828125, "global_step": 88656, "epoch": 732} {"train_loss": -37.23354721069336, "global_step": 88657, "epoch": 732} {"train_loss": -37.12394332885742, "global_step": 88658, "epoch": 732} {"train_loss": -37.971717834472656, "global_step": 88659, "epoch": 732} {"train_loss": -37.3333740234375, "global_step": 88660, "epoch": 732} {"train_loss": -38.18540573120117, "global_step": 88661, "epoch": 732} {"train_loss": -38.00361251831055, "global_step": 88662, "epoch": 732} {"train_loss": -38.0227165222168, "global_step": 88663, "epoch": 732} {"train_loss": -38.326263427734375, "global_step": 88664, "epoch": 732} {"train_loss": -38.20286560058594, "global_step": 88665, "epoch": 732} {"train_loss": -38.38532257080078, "global_step": 88666, "epoch": 732} {"train_loss": -38.52129364013672, "global_step": 88667, "epoch": 732} {"train_loss": -37.996517181396484, "global_step": 88668, "epoch": 732} {"train_loss": -38.01145553588867, "global_step": 88669, "epoch": 732} {"train_loss": -37.5023193359375, "global_step": 88670, "epoch": 732} {"train_loss": -37.8621940612793, "global_step": 88671, "epoch": 732} {"train_loss": -37.73160934448242, "global_step": 88672, "epoch": 732} {"train_loss": -38.42006301879883, "global_step": 88673, "epoch": 732} {"train_loss": -37.66250228881836, "global_step": 88674, "epoch": 732} {"train_loss": -37.882991790771484, "global_step": 88675, "epoch": 732} {"train_loss": -37.99370193481445, "global_step": 88676, "epoch": 732} {"train_loss": -37.70912170410156, "global_step": 88677, "epoch": 732} {"train_loss": -37.96513748168945, "global_step": 88678, "epoch": 732} {"train_loss": -38.054298400878906, "global_step": 88679, "epoch": 732} {"train_loss": -38.24628829956055, "global_step": 88680, "epoch": 732} {"train_loss": -38.124290466308594, "global_step": 88681, "epoch": 732} {"train_loss": -38.397216796875, "global_step": 88682, "epoch": 732} {"train_loss": -38.84910202026367, "global_step": 88683, "epoch": 732} {"train_loss": -37.976051330566406, "global_step": 88684, "epoch": 732} {"train_loss": -38.5228271484375, "global_step": 88685, "epoch": 732} {"train_loss": -37.740943908691406, "global_step": 88686, "epoch": 732} {"train_loss": -37.54286575317383, "global_step": 88687, "epoch": 732} {"train_loss": -38.813880920410156, "global_step": 88688, "epoch": 732} {"train_loss": -38.114280700683594, "global_step": 88689, "epoch": 732} {"train_loss": -38.86433410644531, "global_step": 88690, "epoch": 732} {"train_loss": -38.52989959716797, "global_step": 88691, "epoch": 732} {"train_loss": -37.64033256089392, "global_step": 88692, "epoch": 732, "val_loss": 2510315.75} {"train_loss": -38.433189392089844, "global_step": 88693, "epoch": 733} {"train_loss": -37.70025634765625, "global_step": 88694, "epoch": 733} {"train_loss": -38.57667922973633, "global_step": 88695, "epoch": 733} {"train_loss": -38.5074348449707, "global_step": 88696, "epoch": 733} {"train_loss": -37.12339782714844, "global_step": 88697, "epoch": 733} {"train_loss": -36.413448333740234, "global_step": 88698, "epoch": 733} {"train_loss": -36.6014289855957, "global_step": 88699, "epoch": 733} {"train_loss": -35.79747009277344, "global_step": 88700, "epoch": 733} {"train_loss": -35.24650955200195, "global_step": 88701, "epoch": 733} {"train_loss": -33.46433639526367, "global_step": 88702, "epoch": 733} {"train_loss": -34.261505126953125, "global_step": 88703, "epoch": 733} {"train_loss": -38.4229621887207, "global_step": 88704, "epoch": 733} {"train_loss": -36.07999801635742, "global_step": 88705, "epoch": 733} {"train_loss": -29.736343383789062, "global_step": 88706, "epoch": 733} {"train_loss": -29.5874080657959, "global_step": 88707, "epoch": 733} {"train_loss": -37.790313720703125, "global_step": 88708, "epoch": 733} {"train_loss": -34.58995819091797, "global_step": 88709, "epoch": 733} {"train_loss": -32.326778411865234, "global_step": 88710, "epoch": 733} {"train_loss": -37.34892272949219, "global_step": 88711, "epoch": 733} {"train_loss": -33.315425872802734, "global_step": 88712, "epoch": 733} {"train_loss": -37.57350540161133, "global_step": 88713, "epoch": 733} {"train_loss": -35.66558837890625, "global_step": 88714, "epoch": 733} {"train_loss": -37.46506881713867, "global_step": 88715, "epoch": 733} {"train_loss": -36.35922622680664, "global_step": 88716, "epoch": 733} {"train_loss": -37.89361572265625, "global_step": 88717, "epoch": 733} {"train_loss": -37.09233474731445, "global_step": 88718, "epoch": 733} {"train_loss": -38.04567337036133, "global_step": 88719, "epoch": 733} {"train_loss": -37.14958190917969, "global_step": 88720, "epoch": 733} {"train_loss": -37.74821090698242, "global_step": 88721, "epoch": 733} {"train_loss": -37.83721160888672, "global_step": 88722, "epoch": 733} {"train_loss": -37.43953323364258, "global_step": 88723, "epoch": 733} {"train_loss": -38.06653594970703, "global_step": 88724, "epoch": 733} {"train_loss": -37.86735916137695, "global_step": 88725, "epoch": 733} {"train_loss": -38.37752151489258, "global_step": 88726, "epoch": 733} {"train_loss": -37.4714241027832, "global_step": 88727, "epoch": 733} {"train_loss": -38.089073181152344, "global_step": 88728, "epoch": 733} {"train_loss": -37.956600189208984, "global_step": 88729, "epoch": 733} {"train_loss": -37.97053146362305, "global_step": 88730, "epoch": 733} {"train_loss": -38.34794998168945, "global_step": 88731, "epoch": 733} {"train_loss": -37.84186553955078, "global_step": 88732, "epoch": 733} {"train_loss": -38.43694305419922, "global_step": 88733, "epoch": 733} {"train_loss": -37.9337158203125, "global_step": 88734, "epoch": 733} {"train_loss": -38.701812744140625, "global_step": 88735, "epoch": 733} {"train_loss": -38.01304244995117, "global_step": 88736, "epoch": 733} {"train_loss": -38.10055160522461, "global_step": 88737, "epoch": 733} {"train_loss": -37.875732421875, "global_step": 88738, "epoch": 733} {"train_loss": -38.044612884521484, "global_step": 88739, "epoch": 733} {"train_loss": -38.18447494506836, "global_step": 88740, "epoch": 733} {"train_loss": -38.09946823120117, "global_step": 88741, "epoch": 733} {"train_loss": -37.67606735229492, "global_step": 88742, "epoch": 733} {"train_loss": -38.1170768737793, "global_step": 88743, "epoch": 733} {"train_loss": -38.373809814453125, "global_step": 88744, "epoch": 733} {"train_loss": -38.72256088256836, "global_step": 88745, "epoch": 733} {"train_loss": -38.69743728637695, "global_step": 88746, "epoch": 733} {"train_loss": -38.02421188354492, "global_step": 88747, "epoch": 733} {"train_loss": -38.56283187866211, "global_step": 88748, "epoch": 733} {"train_loss": -38.504756927490234, "global_step": 88749, "epoch": 733} {"train_loss": -38.60831069946289, "global_step": 88750, "epoch": 733} {"train_loss": -37.89712905883789, "global_step": 88751, "epoch": 733} {"train_loss": -38.27891159057617, "global_step": 88752, "epoch": 733} {"train_loss": -38.90198516845703, "global_step": 88753, "epoch": 733} {"train_loss": -38.83242416381836, "global_step": 88754, "epoch": 733} {"train_loss": -38.268489837646484, "global_step": 88755, "epoch": 733} {"train_loss": -38.58335494995117, "global_step": 88756, "epoch": 733} {"train_loss": -38.78569412231445, "global_step": 88757, "epoch": 733} {"train_loss": -37.95390701293945, "global_step": 88758, "epoch": 733} {"train_loss": -38.456722259521484, "global_step": 88759, "epoch": 733} {"train_loss": -37.15371322631836, "global_step": 88760, "epoch": 733} {"train_loss": -37.67953872680664, "global_step": 88761, "epoch": 733} {"train_loss": -38.6209716796875, "global_step": 88762, "epoch": 733} {"train_loss": -38.75164031982422, "global_step": 88763, "epoch": 733} {"train_loss": -38.75305938720703, "global_step": 88764, "epoch": 733} {"train_loss": -38.32261276245117, "global_step": 88765, "epoch": 733} {"train_loss": -38.07630920410156, "global_step": 88766, "epoch": 733} {"train_loss": -38.96710968017578, "global_step": 88767, "epoch": 733} {"train_loss": -38.44709777832031, "global_step": 88768, "epoch": 733} {"train_loss": -37.77366256713867, "global_step": 88769, "epoch": 733} {"train_loss": -37.3613395690918, "global_step": 88770, "epoch": 733} {"train_loss": -38.46150588989258, "global_step": 88771, "epoch": 733} {"train_loss": -37.82599639892578, "global_step": 88772, "epoch": 733} {"train_loss": -37.58610916137695, "global_step": 88773, "epoch": 733} {"train_loss": -37.98966598510742, "global_step": 88774, "epoch": 733} {"train_loss": -37.34487533569336, "global_step": 88775, "epoch": 733} {"train_loss": -38.855995178222656, "global_step": 88776, "epoch": 733} {"train_loss": -37.477882385253906, "global_step": 88777, "epoch": 733} {"train_loss": -36.709999084472656, "global_step": 88778, "epoch": 733} {"train_loss": -37.16804122924805, "global_step": 88779, "epoch": 733} {"train_loss": -38.35193634033203, "global_step": 88780, "epoch": 733} {"train_loss": -38.59196090698242, "global_step": 88781, "epoch": 733} {"train_loss": -36.3897705078125, "global_step": 88782, "epoch": 733} {"train_loss": -35.32822036743164, "global_step": 88783, "epoch": 733} {"train_loss": -34.55955505371094, "global_step": 88784, "epoch": 733} {"train_loss": -36.85801315307617, "global_step": 88785, "epoch": 733} {"train_loss": -37.98242950439453, "global_step": 88786, "epoch": 733} {"train_loss": -34.36601638793945, "global_step": 88787, "epoch": 733} {"train_loss": -37.385536193847656, "global_step": 88788, "epoch": 733} {"train_loss": -37.60274124145508, "global_step": 88789, "epoch": 733} {"train_loss": -34.370582580566406, "global_step": 88790, "epoch": 733} {"train_loss": -36.845829010009766, "global_step": 88791, "epoch": 733} {"train_loss": -37.55506134033203, "global_step": 88792, "epoch": 733} {"train_loss": -36.75733184814453, "global_step": 88793, "epoch": 733} {"train_loss": -38.043739318847656, "global_step": 88794, "epoch": 733} {"train_loss": -36.76467514038086, "global_step": 88795, "epoch": 733} {"train_loss": -36.157100677490234, "global_step": 88796, "epoch": 733} {"train_loss": -37.8229866027832, "global_step": 88797, "epoch": 733} {"train_loss": -37.980648040771484, "global_step": 88798, "epoch": 733} {"train_loss": -38.06509017944336, "global_step": 88799, "epoch": 733} {"train_loss": -36.76066207885742, "global_step": 88800, "epoch": 733} {"train_loss": -38.29401397705078, "global_step": 88801, "epoch": 733} {"train_loss": -37.58842086791992, "global_step": 88802, "epoch": 733} {"train_loss": -37.65970993041992, "global_step": 88803, "epoch": 733} {"train_loss": -36.64191818237305, "global_step": 88804, "epoch": 733} {"train_loss": -36.97477340698242, "global_step": 88805, "epoch": 733} {"train_loss": -37.89870071411133, "global_step": 88806, "epoch": 733} {"train_loss": -36.14098358154297, "global_step": 88807, "epoch": 733} {"train_loss": -38.14659118652344, "global_step": 88808, "epoch": 733} {"train_loss": -36.99345779418945, "global_step": 88809, "epoch": 733} {"train_loss": -38.08642578125, "global_step": 88810, "epoch": 733} {"train_loss": -36.84109878540039, "global_step": 88811, "epoch": 733} {"train_loss": -36.54716110229492, "global_step": 88812, "epoch": 733} {"train_loss": -37.32997095092269, "global_step": 88813, "epoch": 733, "val_loss": 2574726.0} {"train_loss": -36.80344772338867, "global_step": 88814, "epoch": 734} {"train_loss": -38.01445388793945, "global_step": 88815, "epoch": 734} {"train_loss": -36.958702087402344, "global_step": 88816, "epoch": 734} {"train_loss": -35.950538635253906, "global_step": 88817, "epoch": 734} {"train_loss": -34.0616455078125, "global_step": 88818, "epoch": 734} {"train_loss": -36.24475860595703, "global_step": 88819, "epoch": 734} {"train_loss": -38.234962463378906, "global_step": 88820, "epoch": 734} {"train_loss": -36.79327392578125, "global_step": 88821, "epoch": 734} {"train_loss": -35.3314208984375, "global_step": 88822, "epoch": 734} {"train_loss": -34.212158203125, "global_step": 88823, "epoch": 734} {"train_loss": -37.00954055786133, "global_step": 88824, "epoch": 734} {"train_loss": -37.31124496459961, "global_step": 88825, "epoch": 734} {"train_loss": -33.700191497802734, "global_step": 88826, "epoch": 734} {"train_loss": -36.801361083984375, "global_step": 88827, "epoch": 734} {"train_loss": -37.772708892822266, "global_step": 88828, "epoch": 734} {"train_loss": -34.82557678222656, "global_step": 88829, "epoch": 734} {"train_loss": -37.11140823364258, "global_step": 88830, "epoch": 734} {"train_loss": -37.48714828491211, "global_step": 88831, "epoch": 734} {"train_loss": -35.614723205566406, "global_step": 88832, "epoch": 734} {"train_loss": -37.18367385864258, "global_step": 88833, "epoch": 734} {"train_loss": -37.30662155151367, "global_step": 88834, "epoch": 734} {"train_loss": -36.43757247924805, "global_step": 88835, "epoch": 734} {"train_loss": -37.95321273803711, "global_step": 88836, "epoch": 734} {"train_loss": -36.761932373046875, "global_step": 88837, "epoch": 734} {"train_loss": -38.51507568359375, "global_step": 88838, "epoch": 734} {"train_loss": -37.3004035949707, "global_step": 88839, "epoch": 734} {"train_loss": -37.90350341796875, "global_step": 88840, "epoch": 734} {"train_loss": -38.214210510253906, "global_step": 88841, "epoch": 734} {"train_loss": -37.625213623046875, "global_step": 88842, "epoch": 734} {"train_loss": -38.46931838989258, "global_step": 88843, "epoch": 734} {"train_loss": -38.00541687011719, "global_step": 88844, "epoch": 734} {"train_loss": -38.86687088012695, "global_step": 88845, "epoch": 734} {"train_loss": -38.5504150390625, "global_step": 88846, "epoch": 734} {"train_loss": -39.01237487792969, "global_step": 88847, "epoch": 734} {"train_loss": -38.353660583496094, "global_step": 88848, "epoch": 734} {"train_loss": -39.084136962890625, "global_step": 88849, "epoch": 734} {"train_loss": -38.6592903137207, "global_step": 88850, "epoch": 734} {"train_loss": -38.724483489990234, "global_step": 88851, "epoch": 734} {"train_loss": -38.606842041015625, "global_step": 88852, "epoch": 734} {"train_loss": -38.54804611206055, "global_step": 88853, "epoch": 734} {"train_loss": -39.059200286865234, "global_step": 88854, "epoch": 734} {"train_loss": -38.511226654052734, "global_step": 88855, "epoch": 734} {"train_loss": -38.65629196166992, "global_step": 88856, "epoch": 734} {"train_loss": -39.04209518432617, "global_step": 88857, "epoch": 734} {"train_loss": -39.39419174194336, "global_step": 88858, "epoch": 734} {"train_loss": -37.340187072753906, "global_step": 88859, "epoch": 734} {"train_loss": -37.64582443237305, "global_step": 88860, "epoch": 734} {"train_loss": -37.0821418762207, "global_step": 88861, "epoch": 734} {"train_loss": -38.12661361694336, "global_step": 88862, "epoch": 734} {"train_loss": -38.13972091674805, "global_step": 88863, "epoch": 734} {"train_loss": -37.766658782958984, "global_step": 88864, "epoch": 734} {"train_loss": -37.017860412597656, "global_step": 88865, "epoch": 734} {"train_loss": -36.84138870239258, "global_step": 88866, "epoch": 734} {"train_loss": -35.92387008666992, "global_step": 88867, "epoch": 734} {"train_loss": -38.33234786987305, "global_step": 88868, "epoch": 734} {"train_loss": -37.643898010253906, "global_step": 88869, "epoch": 734} {"train_loss": -36.13888168334961, "global_step": 88870, "epoch": 734} {"train_loss": -35.0154914855957, "global_step": 88871, "epoch": 734} {"train_loss": -37.22772216796875, "global_step": 88872, "epoch": 734} {"train_loss": -38.452083587646484, "global_step": 88873, "epoch": 734} {"train_loss": -37.04731369018555, "global_step": 88874, "epoch": 734} {"train_loss": -37.91633224487305, "global_step": 88875, "epoch": 734} {"train_loss": -37.74578857421875, "global_step": 88876, "epoch": 734} {"train_loss": -37.693843841552734, "global_step": 88877, "epoch": 734} {"train_loss": -38.17239761352539, "global_step": 88878, "epoch": 734} {"train_loss": -36.9851188659668, "global_step": 88879, "epoch": 734} {"train_loss": -38.166587829589844, "global_step": 88880, "epoch": 734} {"train_loss": -37.57365036010742, "global_step": 88881, "epoch": 734} {"train_loss": -36.9991569519043, "global_step": 88882, "epoch": 734} {"train_loss": -37.36701965332031, "global_step": 88883, "epoch": 734} {"train_loss": -37.54930877685547, "global_step": 88884, "epoch": 734} {"train_loss": -35.95930099487305, "global_step": 88885, "epoch": 734} {"train_loss": -38.30077362060547, "global_step": 88886, "epoch": 734} {"train_loss": -36.92703628540039, "global_step": 88887, "epoch": 734} {"train_loss": -35.18031692504883, "global_step": 88888, "epoch": 734} {"train_loss": -34.896541595458984, "global_step": 88889, "epoch": 734} {"train_loss": -37.0078125, "global_step": 88890, "epoch": 734} {"train_loss": -35.33016586303711, "global_step": 88891, "epoch": 734} {"train_loss": -35.312042236328125, "global_step": 88892, "epoch": 734} {"train_loss": -36.99591064453125, "global_step": 88893, "epoch": 734} {"train_loss": -37.11298370361328, "global_step": 88894, "epoch": 734} {"train_loss": -37.566253662109375, "global_step": 88895, "epoch": 734} {"train_loss": -36.36713790893555, "global_step": 88896, "epoch": 734} {"train_loss": -35.5717658996582, "global_step": 88897, "epoch": 734} {"train_loss": -36.59687042236328, "global_step": 88898, "epoch": 734} {"train_loss": -37.44101333618164, "global_step": 88899, "epoch": 734} {"train_loss": -35.79942321777344, "global_step": 88900, "epoch": 734} {"train_loss": -37.09326171875, "global_step": 88901, "epoch": 734} {"train_loss": -37.18425369262695, "global_step": 88902, "epoch": 734} {"train_loss": -34.99310302734375, "global_step": 88903, "epoch": 734} {"train_loss": -37.648921966552734, "global_step": 88904, "epoch": 734} {"train_loss": -36.273738861083984, "global_step": 88905, "epoch": 734} {"train_loss": -37.76106643676758, "global_step": 88906, "epoch": 734} {"train_loss": -38.098384857177734, "global_step": 88907, "epoch": 734} {"train_loss": -36.79833984375, "global_step": 88908, "epoch": 734} {"train_loss": -36.97125244140625, "global_step": 88909, "epoch": 734} {"train_loss": -35.24795150756836, "global_step": 88910, "epoch": 734} {"train_loss": -35.85994338989258, "global_step": 88911, "epoch": 734} {"train_loss": -36.69711685180664, "global_step": 88912, "epoch": 734} {"train_loss": -35.04168701171875, "global_step": 88913, "epoch": 734} {"train_loss": -36.43622970581055, "global_step": 88914, "epoch": 734} {"train_loss": -37.52141189575195, "global_step": 88915, "epoch": 734} {"train_loss": -37.194393157958984, "global_step": 88916, "epoch": 734} {"train_loss": -36.054134368896484, "global_step": 88917, "epoch": 734} {"train_loss": -36.09236145019531, "global_step": 88918, "epoch": 734} {"train_loss": -36.6436653137207, "global_step": 88919, "epoch": 734} {"train_loss": -34.25139236450195, "global_step": 88920, "epoch": 734} {"train_loss": -36.8911018371582, "global_step": 88921, "epoch": 734} {"train_loss": -37.32384490966797, "global_step": 88922, "epoch": 734} {"train_loss": -37.13233947753906, "global_step": 88923, "epoch": 734} {"train_loss": -36.480690002441406, "global_step": 88924, "epoch": 734} {"train_loss": -36.26332473754883, "global_step": 88925, "epoch": 734} {"train_loss": -35.534725189208984, "global_step": 88926, "epoch": 734} {"train_loss": -36.03981399536133, "global_step": 88927, "epoch": 734} {"train_loss": -36.35270690917969, "global_step": 88928, "epoch": 734} {"train_loss": -34.232574462890625, "global_step": 88929, "epoch": 734} {"train_loss": -37.39474105834961, "global_step": 88930, "epoch": 734} {"train_loss": -37.30195617675781, "global_step": 88931, "epoch": 734} {"train_loss": -36.47426986694336, "global_step": 88932, "epoch": 734} {"train_loss": -37.09312057495117, "global_step": 88933, "epoch": 734} {"train_loss": -37.02780189198896, "global_step": 88934, "epoch": 734, "val_loss": 2740804.25} {"train_loss": -37.001895904541016, "global_step": 88935, "epoch": 735} {"train_loss": -37.03278350830078, "global_step": 88936, "epoch": 735} {"train_loss": -37.960506439208984, "global_step": 88937, "epoch": 735} {"train_loss": -35.60787582397461, "global_step": 88938, "epoch": 735} {"train_loss": -37.1392707824707, "global_step": 88939, "epoch": 735} {"train_loss": -36.50722122192383, "global_step": 88940, "epoch": 735} {"train_loss": -36.27002716064453, "global_step": 88941, "epoch": 735} {"train_loss": -37.26693344116211, "global_step": 88942, "epoch": 735} {"train_loss": -37.13846969604492, "global_step": 88943, "epoch": 735} {"train_loss": -36.271453857421875, "global_step": 88944, "epoch": 735} {"train_loss": -35.9326286315918, "global_step": 88945, "epoch": 735} {"train_loss": -37.21751022338867, "global_step": 88946, "epoch": 735} {"train_loss": -37.22197341918945, "global_step": 88947, "epoch": 735} {"train_loss": -36.0054817199707, "global_step": 88948, "epoch": 735} {"train_loss": -37.91659164428711, "global_step": 88949, "epoch": 735} {"train_loss": -36.79021453857422, "global_step": 88950, "epoch": 735} {"train_loss": -37.81356430053711, "global_step": 88951, "epoch": 735} {"train_loss": -36.846412658691406, "global_step": 88952, "epoch": 735} {"train_loss": -37.91585159301758, "global_step": 88953, "epoch": 735} {"train_loss": -37.98001480102539, "global_step": 88954, "epoch": 735} {"train_loss": -37.46027755737305, "global_step": 88955, "epoch": 735} {"train_loss": -36.945030212402344, "global_step": 88956, "epoch": 735} {"train_loss": -37.8724365234375, "global_step": 88957, "epoch": 735} {"train_loss": -37.23747634887695, "global_step": 88958, "epoch": 735} {"train_loss": -37.13872146606445, "global_step": 88959, "epoch": 735} {"train_loss": -37.92285919189453, "global_step": 88960, "epoch": 735} {"train_loss": -37.650753021240234, "global_step": 88961, "epoch": 735} {"train_loss": -37.763099670410156, "global_step": 88962, "epoch": 735} {"train_loss": -37.781429290771484, "global_step": 88963, "epoch": 735} {"train_loss": -37.71804428100586, "global_step": 88964, "epoch": 735} {"train_loss": -37.16571044921875, "global_step": 88965, "epoch": 735} {"train_loss": -36.89136505126953, "global_step": 88966, "epoch": 735} {"train_loss": -36.39577102661133, "global_step": 88967, "epoch": 735} {"train_loss": -38.284175872802734, "global_step": 88968, "epoch": 735} {"train_loss": -37.501914978027344, "global_step": 88969, "epoch": 735} {"train_loss": -38.25059127807617, "global_step": 88970, "epoch": 735} {"train_loss": -35.642539978027344, "global_step": 88971, "epoch": 735} {"train_loss": -37.72750473022461, "global_step": 88972, "epoch": 735} {"train_loss": -37.15479278564453, "global_step": 88973, "epoch": 735} {"train_loss": -36.428062438964844, "global_step": 88974, "epoch": 735} {"train_loss": -38.34347152709961, "global_step": 88975, "epoch": 735} {"train_loss": -37.91468048095703, "global_step": 88976, "epoch": 735} {"train_loss": -37.322967529296875, "global_step": 88977, "epoch": 735} {"train_loss": -37.37025833129883, "global_step": 88978, "epoch": 735} {"train_loss": -37.79802703857422, "global_step": 88979, "epoch": 735} {"train_loss": -37.383949279785156, "global_step": 88980, "epoch": 735} {"train_loss": -37.490447998046875, "global_step": 88981, "epoch": 735} {"train_loss": -37.50958251953125, "global_step": 88982, "epoch": 735} {"train_loss": -38.052486419677734, "global_step": 88983, "epoch": 735} {"train_loss": -37.762794494628906, "global_step": 88984, "epoch": 735} {"train_loss": -38.20241928100586, "global_step": 88985, "epoch": 735} {"train_loss": -37.5811653137207, "global_step": 88986, "epoch": 735} {"train_loss": -36.7639274597168, "global_step": 88987, "epoch": 735} {"train_loss": -37.926544189453125, "global_step": 88988, "epoch": 735} {"train_loss": -38.010414123535156, "global_step": 88989, "epoch": 735} {"train_loss": -38.50748825073242, "global_step": 88990, "epoch": 735} {"train_loss": -37.62192916870117, "global_step": 88991, "epoch": 735} {"train_loss": -37.766822814941406, "global_step": 88992, "epoch": 735} {"train_loss": -37.91717529296875, "global_step": 88993, "epoch": 735} {"train_loss": -37.39251708984375, "global_step": 88994, "epoch": 735} {"train_loss": -37.87362289428711, "global_step": 88995, "epoch": 735} {"train_loss": -37.59833526611328, "global_step": 88996, "epoch": 735} {"train_loss": -37.06394577026367, "global_step": 88997, "epoch": 735} {"train_loss": -36.9506950378418, "global_step": 88998, "epoch": 735} {"train_loss": -36.1611442565918, "global_step": 88999, "epoch": 735} {"train_loss": -36.2337532043457, "global_step": 89000, "epoch": 735} {"train_loss": -36.69293975830078, "global_step": 89001, "epoch": 735} {"train_loss": -34.45796585083008, "global_step": 89002, "epoch": 735} {"train_loss": -36.022987365722656, "global_step": 89003, "epoch": 735} {"train_loss": -37.81585693359375, "global_step": 89004, "epoch": 735} {"train_loss": -37.10960006713867, "global_step": 89005, "epoch": 735} {"train_loss": -35.42791748046875, "global_step": 89006, "epoch": 735} {"train_loss": -37.50397872924805, "global_step": 89007, "epoch": 735} {"train_loss": -37.28759765625, "global_step": 89008, "epoch": 735} {"train_loss": -35.32345199584961, "global_step": 89009, "epoch": 735} {"train_loss": -32.77238845825195, "global_step": 89010, "epoch": 735} {"train_loss": -34.22576904296875, "global_step": 89011, "epoch": 735} {"train_loss": -36.45545196533203, "global_step": 89012, "epoch": 735} {"train_loss": -35.89748764038086, "global_step": 89013, "epoch": 735} {"train_loss": -34.097835540771484, "global_step": 89014, "epoch": 735} {"train_loss": -36.26148986816406, "global_step": 89015, "epoch": 735} {"train_loss": -35.76678466796875, "global_step": 89016, "epoch": 735} {"train_loss": -34.32589340209961, "global_step": 89017, "epoch": 735} {"train_loss": -35.553466796875, "global_step": 89018, "epoch": 735} {"train_loss": -36.65678787231445, "global_step": 89019, "epoch": 735} {"train_loss": -34.774959564208984, "global_step": 89020, "epoch": 735} {"train_loss": -33.62117385864258, "global_step": 89021, "epoch": 735} {"train_loss": -35.83242416381836, "global_step": 89022, "epoch": 735} {"train_loss": -34.89448165893555, "global_step": 89023, "epoch": 735} {"train_loss": -35.96981430053711, "global_step": 89024, "epoch": 735} {"train_loss": -36.2832145690918, "global_step": 89025, "epoch": 735} {"train_loss": -35.10302734375, "global_step": 89026, "epoch": 735} {"train_loss": -37.512733459472656, "global_step": 89027, "epoch": 735} {"train_loss": -36.602272033691406, "global_step": 89028, "epoch": 735} {"train_loss": -36.02067947387695, "global_step": 89029, "epoch": 735} {"train_loss": -37.274322509765625, "global_step": 89030, "epoch": 735} {"train_loss": -36.13831329345703, "global_step": 89031, "epoch": 735} {"train_loss": -35.6198844909668, "global_step": 89032, "epoch": 735} {"train_loss": -36.92698287963867, "global_step": 89033, "epoch": 735} {"train_loss": -36.53774642944336, "global_step": 89034, "epoch": 735} {"train_loss": -37.302181243896484, "global_step": 89035, "epoch": 735} {"train_loss": -36.29579162597656, "global_step": 89036, "epoch": 735} {"train_loss": -35.9577751159668, "global_step": 89037, "epoch": 735} {"train_loss": -37.61125564575195, "global_step": 89038, "epoch": 735} {"train_loss": -35.8347053527832, "global_step": 89039, "epoch": 735} {"train_loss": -37.201717376708984, "global_step": 89040, "epoch": 735} {"train_loss": -35.61777114868164, "global_step": 89041, "epoch": 735} {"train_loss": -38.346153259277344, "global_step": 89042, "epoch": 735} {"train_loss": -36.31930160522461, "global_step": 89043, "epoch": 735} {"train_loss": -37.34820556640625, "global_step": 89044, "epoch": 735} {"train_loss": -36.78189468383789, "global_step": 89045, "epoch": 735} {"train_loss": -37.8951530456543, "global_step": 89046, "epoch": 735} {"train_loss": -36.770809173583984, "global_step": 89047, "epoch": 735} {"train_loss": -36.93358612060547, "global_step": 89048, "epoch": 735} {"train_loss": -36.938392639160156, "global_step": 89049, "epoch": 735} {"train_loss": -37.29537582397461, "global_step": 89050, "epoch": 735} {"train_loss": -37.89826965332031, "global_step": 89051, "epoch": 735} {"train_loss": -37.48354721069336, "global_step": 89052, "epoch": 735} {"train_loss": -38.145606994628906, "global_step": 89053, "epoch": 735} {"train_loss": -37.79334259033203, "global_step": 89054, "epoch": 735} {"train_loss": -36.86778435825316, "global_step": 89055, "epoch": 735, "val_loss": 2629767.25} {"train_loss": -37.673587799072266, "global_step": 89056, "epoch": 736} {"train_loss": -38.17898178100586, "global_step": 89057, "epoch": 736} {"train_loss": -38.060184478759766, "global_step": 89058, "epoch": 736} {"train_loss": -37.7822265625, "global_step": 89059, "epoch": 736} {"train_loss": -37.76894760131836, "global_step": 89060, "epoch": 736} {"train_loss": -38.145225524902344, "global_step": 89061, "epoch": 736} {"train_loss": -38.17305374145508, "global_step": 89062, "epoch": 736} {"train_loss": -37.59910202026367, "global_step": 89063, "epoch": 736} {"train_loss": -37.71320724487305, "global_step": 89064, "epoch": 736} {"train_loss": -37.851375579833984, "global_step": 89065, "epoch": 736} {"train_loss": -38.20866394042969, "global_step": 89066, "epoch": 736} {"train_loss": -38.090118408203125, "global_step": 89067, "epoch": 736} {"train_loss": -38.05739212036133, "global_step": 89068, "epoch": 736} {"train_loss": -37.889583587646484, "global_step": 89069, "epoch": 736} {"train_loss": -38.13051986694336, "global_step": 89070, "epoch": 736} {"train_loss": -36.54132843017578, "global_step": 89071, "epoch": 736} {"train_loss": -37.99187469482422, "global_step": 89072, "epoch": 736} {"train_loss": -38.774505615234375, "global_step": 89073, "epoch": 736} {"train_loss": -37.93537521362305, "global_step": 89074, "epoch": 736} {"train_loss": -38.16230010986328, "global_step": 89075, "epoch": 736} {"train_loss": -37.821624755859375, "global_step": 89076, "epoch": 736} {"train_loss": -37.4942741394043, "global_step": 89077, "epoch": 736} {"train_loss": -37.91524887084961, "global_step": 89078, "epoch": 736} {"train_loss": -38.109249114990234, "global_step": 89079, "epoch": 736} {"train_loss": -37.86201095581055, "global_step": 89080, "epoch": 736} {"train_loss": -38.083580017089844, "global_step": 89081, "epoch": 736} {"train_loss": -38.06425476074219, "global_step": 89082, "epoch": 736} {"train_loss": -38.555763244628906, "global_step": 89083, "epoch": 736} {"train_loss": -38.242000579833984, "global_step": 89084, "epoch": 736} {"train_loss": -38.353721618652344, "global_step": 89085, "epoch": 736} {"train_loss": -37.44987106323242, "global_step": 89086, "epoch": 736} {"train_loss": -37.68706512451172, "global_step": 89087, "epoch": 736} {"train_loss": -37.920589447021484, "global_step": 89088, "epoch": 736} {"train_loss": -38.299800872802734, "global_step": 89089, "epoch": 736} {"train_loss": -37.850990295410156, "global_step": 89090, "epoch": 736} {"train_loss": -37.26033401489258, "global_step": 89091, "epoch": 736} {"train_loss": -37.08447265625, "global_step": 89092, "epoch": 736} {"train_loss": -38.51638412475586, "global_step": 89093, "epoch": 736} {"train_loss": -37.960365295410156, "global_step": 89094, "epoch": 736} {"train_loss": -38.465843200683594, "global_step": 89095, "epoch": 736} {"train_loss": -38.08272933959961, "global_step": 89096, "epoch": 736} {"train_loss": -37.62736511230469, "global_step": 89097, "epoch": 736} {"train_loss": -37.167518615722656, "global_step": 89098, "epoch": 736} {"train_loss": -36.80704879760742, "global_step": 89099, "epoch": 736} {"train_loss": -37.450416564941406, "global_step": 89100, "epoch": 736} {"train_loss": -38.36915969848633, "global_step": 89101, "epoch": 736} {"train_loss": -37.5667724609375, "global_step": 89102, "epoch": 736} {"train_loss": -37.54730987548828, "global_step": 89103, "epoch": 736} {"train_loss": -36.462738037109375, "global_step": 89104, "epoch": 736} {"train_loss": -37.05875778198242, "global_step": 89105, "epoch": 736} {"train_loss": -37.95515060424805, "global_step": 89106, "epoch": 736} {"train_loss": -37.39344024658203, "global_step": 89107, "epoch": 736} {"train_loss": -38.088741302490234, "global_step": 89108, "epoch": 736} {"train_loss": -36.60869598388672, "global_step": 89109, "epoch": 736} {"train_loss": -37.27843475341797, "global_step": 89110, "epoch": 736} {"train_loss": -37.466705322265625, "global_step": 89111, "epoch": 736} {"train_loss": -34.862953186035156, "global_step": 89112, "epoch": 736} {"train_loss": -38.250885009765625, "global_step": 89113, "epoch": 736} {"train_loss": -37.781494140625, "global_step": 89114, "epoch": 736} {"train_loss": -38.33085250854492, "global_step": 89115, "epoch": 736} {"train_loss": -37.82101058959961, "global_step": 89116, "epoch": 736} {"train_loss": -38.61419677734375, "global_step": 89117, "epoch": 736} {"train_loss": -38.071868896484375, "global_step": 89118, "epoch": 736} {"train_loss": -37.54155349731445, "global_step": 89119, "epoch": 736} {"train_loss": -37.737770080566406, "global_step": 89120, "epoch": 736} {"train_loss": -38.25516128540039, "global_step": 89121, "epoch": 736} {"train_loss": -37.97976303100586, "global_step": 89122, "epoch": 736} {"train_loss": -38.216712951660156, "global_step": 89123, "epoch": 736} {"train_loss": -38.39368438720703, "global_step": 89124, "epoch": 736} {"train_loss": -38.752315521240234, "global_step": 89125, "epoch": 736} {"train_loss": -38.54413604736328, "global_step": 89126, "epoch": 736} {"train_loss": -38.42424011230469, "global_step": 89127, "epoch": 736} {"train_loss": -38.01493453979492, "global_step": 89128, "epoch": 736} {"train_loss": -38.82636260986328, "global_step": 89129, "epoch": 736} {"train_loss": -38.37946701049805, "global_step": 89130, "epoch": 736} {"train_loss": -38.71961975097656, "global_step": 89131, "epoch": 736} {"train_loss": -38.97496032714844, "global_step": 89132, "epoch": 736} {"train_loss": -38.48722457885742, "global_step": 89133, "epoch": 736} {"train_loss": -37.787384033203125, "global_step": 89134, "epoch": 736} {"train_loss": -37.63059616088867, "global_step": 89135, "epoch": 736} {"train_loss": -38.747283935546875, "global_step": 89136, "epoch": 736} {"train_loss": -38.89608383178711, "global_step": 89137, "epoch": 736} {"train_loss": -38.90151596069336, "global_step": 89138, "epoch": 736} {"train_loss": -38.5670166015625, "global_step": 89139, "epoch": 736} {"train_loss": -37.80601119995117, "global_step": 89140, "epoch": 736} {"train_loss": -38.435211181640625, "global_step": 89141, "epoch": 736} {"train_loss": -37.925209045410156, "global_step": 89142, "epoch": 736} {"train_loss": -38.94269943237305, "global_step": 89143, "epoch": 736} {"train_loss": -38.686439514160156, "global_step": 89144, "epoch": 736} {"train_loss": -38.17912673950195, "global_step": 89145, "epoch": 736} {"train_loss": -38.19552230834961, "global_step": 89146, "epoch": 736} {"train_loss": -38.824615478515625, "global_step": 89147, "epoch": 736} {"train_loss": -38.21818542480469, "global_step": 89148, "epoch": 736} {"train_loss": -39.016048431396484, "global_step": 89149, "epoch": 736} {"train_loss": -38.519561767578125, "global_step": 89150, "epoch": 736} {"train_loss": -38.1957893371582, "global_step": 89151, "epoch": 736} {"train_loss": -38.05720901489258, "global_step": 89152, "epoch": 736} {"train_loss": -37.22410202026367, "global_step": 89153, "epoch": 736} {"train_loss": -36.62763595581055, "global_step": 89154, "epoch": 736} {"train_loss": -35.54494857788086, "global_step": 89155, "epoch": 736} {"train_loss": -35.22853469848633, "global_step": 89156, "epoch": 736} {"train_loss": -34.13325500488281, "global_step": 89157, "epoch": 736} {"train_loss": -38.21384048461914, "global_step": 89158, "epoch": 736} {"train_loss": -36.95490646362305, "global_step": 89159, "epoch": 736} {"train_loss": -33.222618103027344, "global_step": 89160, "epoch": 736} {"train_loss": -37.026458740234375, "global_step": 89161, "epoch": 736} {"train_loss": -36.51820755004883, "global_step": 89162, "epoch": 736} {"train_loss": -35.39580154418945, "global_step": 89163, "epoch": 736} {"train_loss": -34.1929817199707, "global_step": 89164, "epoch": 736} {"train_loss": -38.02379608154297, "global_step": 89165, "epoch": 736} {"train_loss": -34.82985305786133, "global_step": 89166, "epoch": 736} {"train_loss": -35.56646728515625, "global_step": 89167, "epoch": 736} {"train_loss": -36.85203170776367, "global_step": 89168, "epoch": 736} {"train_loss": -32.478946685791016, "global_step": 89169, "epoch": 736} {"train_loss": -37.18575668334961, "global_step": 89170, "epoch": 736} {"train_loss": -35.75065612792969, "global_step": 89171, "epoch": 736} {"train_loss": -35.565120697021484, "global_step": 89172, "epoch": 736} {"train_loss": -36.67121887207031, "global_step": 89173, "epoch": 736} {"train_loss": -36.48433303833008, "global_step": 89174, "epoch": 736} {"train_loss": -37.24496078491211, "global_step": 89175, "epoch": 736} {"train_loss": -37.59195387658994, "global_step": 89176, "epoch": 736, "val_loss": 2552351.25} {"train_loss": -37.263092041015625, "global_step": 89177, "epoch": 737} {"train_loss": -36.3805046081543, "global_step": 89178, "epoch": 737} {"train_loss": -36.361202239990234, "global_step": 89179, "epoch": 737} {"train_loss": -36.22840118408203, "global_step": 89180, "epoch": 737} {"train_loss": -37.86273193359375, "global_step": 89181, "epoch": 737} {"train_loss": -36.54838180541992, "global_step": 89182, "epoch": 737} {"train_loss": -37.32478713989258, "global_step": 89183, "epoch": 737} {"train_loss": -37.22295379638672, "global_step": 89184, "epoch": 737} {"train_loss": -38.27021026611328, "global_step": 89185, "epoch": 737} {"train_loss": -37.673431396484375, "global_step": 89186, "epoch": 737} {"train_loss": -37.51256561279297, "global_step": 89187, "epoch": 737} {"train_loss": -37.448631286621094, "global_step": 89188, "epoch": 737} {"train_loss": -38.237831115722656, "global_step": 89189, "epoch": 737} {"train_loss": -37.841068267822266, "global_step": 89190, "epoch": 737} {"train_loss": -36.96339797973633, "global_step": 89191, "epoch": 737} {"train_loss": -38.15448760986328, "global_step": 89192, "epoch": 737} {"train_loss": -36.491363525390625, "global_step": 89193, "epoch": 737} {"train_loss": -38.06190872192383, "global_step": 89194, "epoch": 737} {"train_loss": -37.01790237426758, "global_step": 89195, "epoch": 737} {"train_loss": -32.154876708984375, "global_step": 89196, "epoch": 737} {"train_loss": -37.6646842956543, "global_step": 89197, "epoch": 737} {"train_loss": -38.10702133178711, "global_step": 89198, "epoch": 737} {"train_loss": -36.745609283447266, "global_step": 89199, "epoch": 737} {"train_loss": -36.925559997558594, "global_step": 89200, "epoch": 737} {"train_loss": -36.67106628417969, "global_step": 89201, "epoch": 737} {"train_loss": -36.745662689208984, "global_step": 89202, "epoch": 737} {"train_loss": -36.632869720458984, "global_step": 89203, "epoch": 737} {"train_loss": -37.541725158691406, "global_step": 89204, "epoch": 737} {"train_loss": -37.91443634033203, "global_step": 89205, "epoch": 737} {"train_loss": -35.739990234375, "global_step": 89206, "epoch": 737} {"train_loss": -37.894866943359375, "global_step": 89207, "epoch": 737} {"train_loss": -37.271995544433594, "global_step": 89208, "epoch": 737} {"train_loss": -36.91019821166992, "global_step": 89209, "epoch": 737} {"train_loss": -38.127384185791016, "global_step": 89210, "epoch": 737} {"train_loss": -38.09646224975586, "global_step": 89211, "epoch": 737} {"train_loss": -37.67313003540039, "global_step": 89212, "epoch": 737} {"train_loss": -37.18778610229492, "global_step": 89213, "epoch": 737} {"train_loss": -35.43124008178711, "global_step": 89214, "epoch": 737} {"train_loss": -34.825347900390625, "global_step": 89215, "epoch": 737} {"train_loss": -36.93301010131836, "global_step": 89216, "epoch": 737} {"train_loss": -35.30678939819336, "global_step": 89217, "epoch": 737} {"train_loss": -38.17961883544922, "global_step": 89218, "epoch": 737} {"train_loss": -37.6934700012207, "global_step": 89219, "epoch": 737} {"train_loss": -37.45733642578125, "global_step": 89220, "epoch": 737} {"train_loss": -37.854496002197266, "global_step": 89221, "epoch": 737} {"train_loss": -38.07845687866211, "global_step": 89222, "epoch": 737} {"train_loss": -38.28480911254883, "global_step": 89223, "epoch": 737} {"train_loss": -37.76981735229492, "global_step": 89224, "epoch": 737} {"train_loss": -37.74421691894531, "global_step": 89225, "epoch": 737} {"train_loss": -38.319210052490234, "global_step": 89226, "epoch": 737} {"train_loss": -37.651641845703125, "global_step": 89227, "epoch": 737} {"train_loss": -37.743465423583984, "global_step": 89228, "epoch": 737} {"train_loss": -38.8202018737793, "global_step": 89229, "epoch": 737} {"train_loss": -37.44232177734375, "global_step": 89230, "epoch": 737} {"train_loss": -37.2515869140625, "global_step": 89231, "epoch": 737} {"train_loss": -37.45847702026367, "global_step": 89232, "epoch": 737} {"train_loss": -38.14034652709961, "global_step": 89233, "epoch": 737} {"train_loss": -38.36386489868164, "global_step": 89234, "epoch": 737} {"train_loss": -37.456783294677734, "global_step": 89235, "epoch": 737} {"train_loss": -36.772666931152344, "global_step": 89236, "epoch": 737} {"train_loss": -36.53339385986328, "global_step": 89237, "epoch": 737} {"train_loss": -37.917728424072266, "global_step": 89238, "epoch": 737} {"train_loss": -38.94342803955078, "global_step": 89239, "epoch": 737} {"train_loss": -38.11422348022461, "global_step": 89240, "epoch": 737} {"train_loss": -36.813838958740234, "global_step": 89241, "epoch": 737} {"train_loss": -38.52980422973633, "global_step": 89242, "epoch": 737} {"train_loss": -37.98301696777344, "global_step": 89243, "epoch": 737} {"train_loss": -37.448970794677734, "global_step": 89244, "epoch": 737} {"train_loss": -37.536865234375, "global_step": 89245, "epoch": 737} {"train_loss": -38.3796272277832, "global_step": 89246, "epoch": 737} {"train_loss": -38.477821350097656, "global_step": 89247, "epoch": 737} {"train_loss": -38.054378509521484, "global_step": 89248, "epoch": 737} {"train_loss": -38.407196044921875, "global_step": 89249, "epoch": 737} {"train_loss": -38.9782829284668, "global_step": 89250, "epoch": 737} {"train_loss": -38.43050765991211, "global_step": 89251, "epoch": 737} {"train_loss": -38.66828155517578, "global_step": 89252, "epoch": 737} {"train_loss": -37.78031539916992, "global_step": 89253, "epoch": 737} {"train_loss": -37.58498001098633, "global_step": 89254, "epoch": 737} {"train_loss": -38.8019905090332, "global_step": 89255, "epoch": 737} {"train_loss": -38.329559326171875, "global_step": 89256, "epoch": 737} {"train_loss": -38.229148864746094, "global_step": 89257, "epoch": 737} {"train_loss": -38.280670166015625, "global_step": 89258, "epoch": 737} {"train_loss": -38.2144775390625, "global_step": 89259, "epoch": 737} {"train_loss": -37.97257614135742, "global_step": 89260, "epoch": 737} {"train_loss": -38.01054763793945, "global_step": 89261, "epoch": 737} {"train_loss": -38.83204650878906, "global_step": 89262, "epoch": 737} {"train_loss": -37.160701751708984, "global_step": 89263, "epoch": 737} {"train_loss": -38.04296875, "global_step": 89264, "epoch": 737} {"train_loss": -38.401458740234375, "global_step": 89265, "epoch": 737} {"train_loss": -38.3536262512207, "global_step": 89266, "epoch": 737} {"train_loss": -38.261653900146484, "global_step": 89267, "epoch": 737} {"train_loss": -37.56740951538086, "global_step": 89268, "epoch": 737} {"train_loss": -36.9195442199707, "global_step": 89269, "epoch": 737} {"train_loss": -37.585323333740234, "global_step": 89270, "epoch": 737} {"train_loss": -36.286922454833984, "global_step": 89271, "epoch": 737} {"train_loss": -37.66682815551758, "global_step": 89272, "epoch": 737} {"train_loss": -38.083953857421875, "global_step": 89273, "epoch": 737} {"train_loss": -37.04754638671875, "global_step": 89274, "epoch": 737} {"train_loss": -36.04241943359375, "global_step": 89275, "epoch": 737} {"train_loss": -37.383460998535156, "global_step": 89276, "epoch": 737} {"train_loss": -38.256099700927734, "global_step": 89277, "epoch": 737} {"train_loss": -37.5022087097168, "global_step": 89278, "epoch": 737} {"train_loss": -37.334442138671875, "global_step": 89279, "epoch": 737} {"train_loss": -37.9012565612793, "global_step": 89280, "epoch": 737} {"train_loss": -37.520172119140625, "global_step": 89281, "epoch": 737} {"train_loss": -36.95024871826172, "global_step": 89282, "epoch": 737} {"train_loss": -37.99729919433594, "global_step": 89283, "epoch": 737} {"train_loss": -37.63947677612305, "global_step": 89284, "epoch": 737} {"train_loss": -37.485721588134766, "global_step": 89285, "epoch": 737} {"train_loss": -38.56351089477539, "global_step": 89286, "epoch": 737} {"train_loss": -37.01513671875, "global_step": 89287, "epoch": 737} {"train_loss": -38.38460922241211, "global_step": 89288, "epoch": 737} {"train_loss": -37.81693649291992, "global_step": 89289, "epoch": 737} {"train_loss": -38.6146125793457, "global_step": 89290, "epoch": 737} {"train_loss": -38.23708724975586, "global_step": 89291, "epoch": 737} {"train_loss": -38.03682327270508, "global_step": 89292, "epoch": 737} {"train_loss": -37.70389938354492, "global_step": 89293, "epoch": 737} {"train_loss": -37.575984954833984, "global_step": 89294, "epoch": 737} {"train_loss": -37.87784957885742, "global_step": 89295, "epoch": 737} {"train_loss": -38.82857894897461, "global_step": 89296, "epoch": 737} {"train_loss": -37.575212336768786, "global_step": 89297, "epoch": 737, "val_loss": 2565433.25} {"train_loss": -38.04497146606445, "global_step": 89298, "epoch": 738} {"train_loss": -38.25931930541992, "global_step": 89299, "epoch": 738} {"train_loss": -38.23598861694336, "global_step": 89300, "epoch": 738} {"train_loss": -38.640480041503906, "global_step": 89301, "epoch": 738} {"train_loss": -38.3376579284668, "global_step": 89302, "epoch": 738} {"train_loss": -38.38237762451172, "global_step": 89303, "epoch": 738} {"train_loss": -38.72853088378906, "global_step": 89304, "epoch": 738} {"train_loss": -38.223907470703125, "global_step": 89305, "epoch": 738} {"train_loss": -39.25593185424805, "global_step": 89306, "epoch": 738} {"train_loss": -38.618988037109375, "global_step": 89307, "epoch": 738} {"train_loss": -38.4461784362793, "global_step": 89308, "epoch": 738} {"train_loss": -38.049434661865234, "global_step": 89309, "epoch": 738} {"train_loss": -38.17351150512695, "global_step": 89310, "epoch": 738} {"train_loss": -38.38888168334961, "global_step": 89311, "epoch": 738} {"train_loss": -38.5903434753418, "global_step": 89312, "epoch": 738} {"train_loss": -38.610816955566406, "global_step": 89313, "epoch": 738} {"train_loss": -38.7131462097168, "global_step": 89314, "epoch": 738} {"train_loss": -38.462738037109375, "global_step": 89315, "epoch": 738} {"train_loss": -38.62543487548828, "global_step": 89316, "epoch": 738} {"train_loss": -38.26166915893555, "global_step": 89317, "epoch": 738} {"train_loss": -37.41337585449219, "global_step": 89318, "epoch": 738} {"train_loss": -38.01805114746094, "global_step": 89319, "epoch": 738} {"train_loss": -38.585941314697266, "global_step": 89320, "epoch": 738} {"train_loss": -37.31610870361328, "global_step": 89321, "epoch": 738} {"train_loss": -38.342140197753906, "global_step": 89322, "epoch": 738} {"train_loss": -34.7745361328125, "global_step": 89323, "epoch": 738} {"train_loss": -27.408063888549805, "global_step": 89324, "epoch": 738} {"train_loss": -34.74712371826172, "global_step": 89325, "epoch": 738} {"train_loss": -32.439517974853516, "global_step": 89326, "epoch": 738} {"train_loss": -26.961822509765625, "global_step": 89327, "epoch": 738} {"train_loss": -37.267250061035156, "global_step": 89328, "epoch": 738} {"train_loss": -27.152740478515625, "global_step": 89329, "epoch": 738} {"train_loss": -37.71797180175781, "global_step": 89330, "epoch": 738} {"train_loss": -33.584468841552734, "global_step": 89331, "epoch": 738} {"train_loss": -34.770416259765625, "global_step": 89332, "epoch": 738} {"train_loss": -36.032806396484375, "global_step": 89333, "epoch": 738} {"train_loss": -36.501220703125, "global_step": 89334, "epoch": 738} {"train_loss": -34.651824951171875, "global_step": 89335, "epoch": 738} {"train_loss": -38.36629867553711, "global_step": 89336, "epoch": 738} {"train_loss": -36.3443603515625, "global_step": 89337, "epoch": 738} {"train_loss": -35.67474365234375, "global_step": 89338, "epoch": 738} {"train_loss": -38.41035461425781, "global_step": 89339, "epoch": 738} {"train_loss": -37.19182205200195, "global_step": 89340, "epoch": 738} {"train_loss": -37.1968994140625, "global_step": 89341, "epoch": 738} {"train_loss": -37.505123138427734, "global_step": 89342, "epoch": 738} {"train_loss": -37.65275955200195, "global_step": 89343, "epoch": 738} {"train_loss": -38.56573486328125, "global_step": 89344, "epoch": 738} {"train_loss": -38.48844528198242, "global_step": 89345, "epoch": 738} {"train_loss": -37.77016830444336, "global_step": 89346, "epoch": 738} {"train_loss": -37.775856018066406, "global_step": 89347, "epoch": 738} {"train_loss": -38.719425201416016, "global_step": 89348, "epoch": 738} {"train_loss": -38.334110260009766, "global_step": 89349, "epoch": 738} {"train_loss": -38.760467529296875, "global_step": 89350, "epoch": 738} {"train_loss": -38.56264877319336, "global_step": 89351, "epoch": 738} {"train_loss": -38.42677688598633, "global_step": 89352, "epoch": 738} {"train_loss": -38.90633773803711, "global_step": 89353, "epoch": 738} {"train_loss": -38.67374038696289, "global_step": 89354, "epoch": 738} {"train_loss": -38.899776458740234, "global_step": 89355, "epoch": 738} {"train_loss": -38.79928207397461, "global_step": 89356, "epoch": 738} {"train_loss": -38.890228271484375, "global_step": 89357, "epoch": 738} {"train_loss": -38.12744903564453, "global_step": 89358, "epoch": 738} {"train_loss": -38.49622344970703, "global_step": 89359, "epoch": 738} {"train_loss": -38.905364990234375, "global_step": 89360, "epoch": 738} {"train_loss": -38.65446853637695, "global_step": 89361, "epoch": 738} {"train_loss": -38.83708953857422, "global_step": 89362, "epoch": 738} {"train_loss": -38.59131622314453, "global_step": 89363, "epoch": 738} {"train_loss": -38.62282943725586, "global_step": 89364, "epoch": 738} {"train_loss": -38.58626937866211, "global_step": 89365, "epoch": 738} {"train_loss": -38.62153244018555, "global_step": 89366, "epoch": 738} {"train_loss": -38.656158447265625, "global_step": 89367, "epoch": 738} {"train_loss": -38.65082550048828, "global_step": 89368, "epoch": 738} {"train_loss": -39.13068771362305, "global_step": 89369, "epoch": 738} {"train_loss": -38.74052810668945, "global_step": 89370, "epoch": 738} {"train_loss": -38.04311752319336, "global_step": 89371, "epoch": 738} {"train_loss": -38.596675872802734, "global_step": 89372, "epoch": 738} {"train_loss": -38.53471755981445, "global_step": 89373, "epoch": 738} {"train_loss": -38.953407287597656, "global_step": 89374, "epoch": 738} {"train_loss": -38.018436431884766, "global_step": 89375, "epoch": 738} {"train_loss": -37.19028854370117, "global_step": 89376, "epoch": 738} {"train_loss": -37.99454879760742, "global_step": 89377, "epoch": 738} {"train_loss": -37.52327346801758, "global_step": 89378, "epoch": 738} {"train_loss": -36.50810241699219, "global_step": 89379, "epoch": 738} {"train_loss": -37.35551452636719, "global_step": 89380, "epoch": 738} {"train_loss": -38.321388244628906, "global_step": 89381, "epoch": 738} {"train_loss": -38.65989685058594, "global_step": 89382, "epoch": 738} {"train_loss": -37.81925964355469, "global_step": 89383, "epoch": 738} {"train_loss": -36.95756912231445, "global_step": 89384, "epoch": 738} {"train_loss": -37.42063522338867, "global_step": 89385, "epoch": 738} {"train_loss": -37.7868766784668, "global_step": 89386, "epoch": 738} {"train_loss": -37.678279876708984, "global_step": 89387, "epoch": 738} {"train_loss": -38.47475051879883, "global_step": 89388, "epoch": 738} {"train_loss": -37.5233154296875, "global_step": 89389, "epoch": 738} {"train_loss": -38.49176788330078, "global_step": 89390, "epoch": 738} {"train_loss": -38.506614685058594, "global_step": 89391, "epoch": 738} {"train_loss": -38.680355072021484, "global_step": 89392, "epoch": 738} {"train_loss": -38.759002685546875, "global_step": 89393, "epoch": 738} {"train_loss": -38.85855484008789, "global_step": 89394, "epoch": 738} {"train_loss": -37.28402328491211, "global_step": 89395, "epoch": 738} {"train_loss": -37.224849700927734, "global_step": 89396, "epoch": 738} {"train_loss": -37.43113327026367, "global_step": 89397, "epoch": 738} {"train_loss": -37.70148468017578, "global_step": 89398, "epoch": 738} {"train_loss": -37.06053161621094, "global_step": 89399, "epoch": 738} {"train_loss": -38.1403694152832, "global_step": 89400, "epoch": 738} {"train_loss": -38.94632339477539, "global_step": 89401, "epoch": 738} {"train_loss": -38.665775299072266, "global_step": 89402, "epoch": 738} {"train_loss": -36.24555206298828, "global_step": 89403, "epoch": 738} {"train_loss": -33.04939270019531, "global_step": 89404, "epoch": 738} {"train_loss": -33.50905227661133, "global_step": 89405, "epoch": 738} {"train_loss": -36.91815948486328, "global_step": 89406, "epoch": 738} {"train_loss": -35.57489013671875, "global_step": 89407, "epoch": 738} {"train_loss": -31.892230987548828, "global_step": 89408, "epoch": 738} {"train_loss": -30.72395896911621, "global_step": 89409, "epoch": 738} {"train_loss": -34.6339225769043, "global_step": 89410, "epoch": 738} {"train_loss": -34.58726119995117, "global_step": 89411, "epoch": 738} {"train_loss": -32.1676139831543, "global_step": 89412, "epoch": 738} {"train_loss": -36.59779357910156, "global_step": 89413, "epoch": 738} {"train_loss": -35.76478958129883, "global_step": 89414, "epoch": 738} {"train_loss": -34.437984466552734, "global_step": 89415, "epoch": 738} {"train_loss": -36.55877685546875, "global_step": 89416, "epoch": 738} {"train_loss": -37.02978515625, "global_step": 89417, "epoch": 738} {"train_loss": -37.21759805600505, "global_step": 89418, "epoch": 738, "val_loss": 2529028.5} {"train_loss": -36.576045989990234, "global_step": 89419, "epoch": 739} {"train_loss": -36.24116134643555, "global_step": 89420, "epoch": 739} {"train_loss": -36.133235931396484, "global_step": 89421, "epoch": 739} {"train_loss": -33.786109924316406, "global_step": 89422, "epoch": 739} {"train_loss": -34.8113899230957, "global_step": 89423, "epoch": 739} {"train_loss": -37.520023345947266, "global_step": 89424, "epoch": 739} {"train_loss": -37.352500915527344, "global_step": 89425, "epoch": 739} {"train_loss": -37.519859313964844, "global_step": 89426, "epoch": 739} {"train_loss": -37.55315399169922, "global_step": 89427, "epoch": 739} {"train_loss": -37.66279220581055, "global_step": 89428, "epoch": 739} {"train_loss": -38.01678466796875, "global_step": 89429, "epoch": 739} {"train_loss": -37.33855056762695, "global_step": 89430, "epoch": 739} {"train_loss": -37.63373565673828, "global_step": 89431, "epoch": 739} {"train_loss": -36.54250717163086, "global_step": 89432, "epoch": 739} {"train_loss": -38.10140609741211, "global_step": 89433, "epoch": 739} {"train_loss": -37.10178756713867, "global_step": 89434, "epoch": 739} {"train_loss": -37.943389892578125, "global_step": 89435, "epoch": 739} {"train_loss": -37.12055206298828, "global_step": 89436, "epoch": 739} {"train_loss": -38.17209243774414, "global_step": 89437, "epoch": 739} {"train_loss": -37.4495849609375, "global_step": 89438, "epoch": 739} {"train_loss": -38.28378677368164, "global_step": 89439, "epoch": 739} {"train_loss": -38.15288162231445, "global_step": 89440, "epoch": 739} {"train_loss": -37.56825637817383, "global_step": 89441, "epoch": 739} {"train_loss": -38.00680160522461, "global_step": 89442, "epoch": 739} {"train_loss": -38.07114791870117, "global_step": 89443, "epoch": 739} {"train_loss": -38.20708465576172, "global_step": 89444, "epoch": 739} {"train_loss": -37.9893913269043, "global_step": 89445, "epoch": 739} {"train_loss": -38.396820068359375, "global_step": 89446, "epoch": 739} {"train_loss": -38.1871452331543, "global_step": 89447, "epoch": 739} {"train_loss": -38.559303283691406, "global_step": 89448, "epoch": 739} {"train_loss": -37.608482360839844, "global_step": 89449, "epoch": 739} {"train_loss": -38.550472259521484, "global_step": 89450, "epoch": 739} {"train_loss": -38.597991943359375, "global_step": 89451, "epoch": 739} {"train_loss": -38.05721664428711, "global_step": 89452, "epoch": 739} {"train_loss": -38.692047119140625, "global_step": 89453, "epoch": 739} {"train_loss": -38.029762268066406, "global_step": 89454, "epoch": 739} {"train_loss": -37.98842239379883, "global_step": 89455, "epoch": 739} {"train_loss": -38.35505676269531, "global_step": 89456, "epoch": 739} {"train_loss": -37.50405502319336, "global_step": 89457, "epoch": 739} {"train_loss": -38.64350128173828, "global_step": 89458, "epoch": 739} {"train_loss": -38.19512939453125, "global_step": 89459, "epoch": 739} {"train_loss": -38.228187561035156, "global_step": 89460, "epoch": 739} {"train_loss": -36.996299743652344, "global_step": 89461, "epoch": 739} {"train_loss": -37.79619216918945, "global_step": 89462, "epoch": 739} {"train_loss": -37.895240783691406, "global_step": 89463, "epoch": 739} {"train_loss": -36.9366569519043, "global_step": 89464, "epoch": 739} {"train_loss": -37.301788330078125, "global_step": 89465, "epoch": 739} {"train_loss": -38.22561264038086, "global_step": 89466, "epoch": 739} {"train_loss": -37.7463493347168, "global_step": 89467, "epoch": 739} {"train_loss": -37.66421127319336, "global_step": 89468, "epoch": 739} {"train_loss": -38.5455207824707, "global_step": 89469, "epoch": 739} {"train_loss": -37.91908645629883, "global_step": 89470, "epoch": 739} {"train_loss": -38.51217269897461, "global_step": 89471, "epoch": 739} {"train_loss": -38.80040740966797, "global_step": 89472, "epoch": 739} {"train_loss": -38.41577911376953, "global_step": 89473, "epoch": 739} {"train_loss": -38.509212493896484, "global_step": 89474, "epoch": 739} {"train_loss": -38.76830291748047, "global_step": 89475, "epoch": 739} {"train_loss": -38.82527542114258, "global_step": 89476, "epoch": 739} {"train_loss": -38.6421012878418, "global_step": 89477, "epoch": 739} {"train_loss": -39.02187728881836, "global_step": 89478, "epoch": 739} {"train_loss": -38.94724655151367, "global_step": 89479, "epoch": 739} {"train_loss": -39.05915069580078, "global_step": 89480, "epoch": 739} {"train_loss": -38.7783203125, "global_step": 89481, "epoch": 739} {"train_loss": -39.20647430419922, "global_step": 89482, "epoch": 739} {"train_loss": -38.915496826171875, "global_step": 89483, "epoch": 739} {"train_loss": -38.64573287963867, "global_step": 89484, "epoch": 739} {"train_loss": -39.322322845458984, "global_step": 89485, "epoch": 739} {"train_loss": -38.45994186401367, "global_step": 89486, "epoch": 739} {"train_loss": -39.103755950927734, "global_step": 89487, "epoch": 739} {"train_loss": -38.9431037902832, "global_step": 89488, "epoch": 739} {"train_loss": -38.81833267211914, "global_step": 89489, "epoch": 739} {"train_loss": -39.2923698425293, "global_step": 89490, "epoch": 739} {"train_loss": -38.67173767089844, "global_step": 89491, "epoch": 739} {"train_loss": -39.37887191772461, "global_step": 89492, "epoch": 739} {"train_loss": -38.473995208740234, "global_step": 89493, "epoch": 739} {"train_loss": -38.66132354736328, "global_step": 89494, "epoch": 739} {"train_loss": -38.11564636230469, "global_step": 89495, "epoch": 739} {"train_loss": -38.637935638427734, "global_step": 89496, "epoch": 739} {"train_loss": -39.043670654296875, "global_step": 89497, "epoch": 739} {"train_loss": -38.80799102783203, "global_step": 89498, "epoch": 739} {"train_loss": -38.424076080322266, "global_step": 89499, "epoch": 739} {"train_loss": -39.02201461791992, "global_step": 89500, "epoch": 739} {"train_loss": -38.35462188720703, "global_step": 89501, "epoch": 739} {"train_loss": -38.73146057128906, "global_step": 89502, "epoch": 739} {"train_loss": -38.50954055786133, "global_step": 89503, "epoch": 739} {"train_loss": -39.360042572021484, "global_step": 89504, "epoch": 739} {"train_loss": -38.81865310668945, "global_step": 89505, "epoch": 739} {"train_loss": -39.0600471496582, "global_step": 89506, "epoch": 739} {"train_loss": -38.68406295776367, "global_step": 89507, "epoch": 739} {"train_loss": -38.94361114501953, "global_step": 89508, "epoch": 739} {"train_loss": -38.7555046081543, "global_step": 89509, "epoch": 739} {"train_loss": -38.88156509399414, "global_step": 89510, "epoch": 739} {"train_loss": -38.0026969909668, "global_step": 89511, "epoch": 739} {"train_loss": -38.77201461791992, "global_step": 89512, "epoch": 739} {"train_loss": -38.36623764038086, "global_step": 89513, "epoch": 739} {"train_loss": -38.860286712646484, "global_step": 89514, "epoch": 739} {"train_loss": -35.407135009765625, "global_step": 89515, "epoch": 739} {"train_loss": -33.561439514160156, "global_step": 89516, "epoch": 739} {"train_loss": -34.38129806518555, "global_step": 89517, "epoch": 739} {"train_loss": -36.98834991455078, "global_step": 89518, "epoch": 739} {"train_loss": -37.47367477416992, "global_step": 89519, "epoch": 739} {"train_loss": -36.3340950012207, "global_step": 89520, "epoch": 739} {"train_loss": -36.129051208496094, "global_step": 89521, "epoch": 739} {"train_loss": -38.13174057006836, "global_step": 89522, "epoch": 739} {"train_loss": -38.35481643676758, "global_step": 89523, "epoch": 739} {"train_loss": -36.87384796142578, "global_step": 89524, "epoch": 739} {"train_loss": -36.24430465698242, "global_step": 89525, "epoch": 739} {"train_loss": -37.43914794921875, "global_step": 89526, "epoch": 739} {"train_loss": -37.80263900756836, "global_step": 89527, "epoch": 739} {"train_loss": -37.52497100830078, "global_step": 89528, "epoch": 739} {"train_loss": -35.31795883178711, "global_step": 89529, "epoch": 739} {"train_loss": -37.94930648803711, "global_step": 89530, "epoch": 739} {"train_loss": -36.97096252441406, "global_step": 89531, "epoch": 739} {"train_loss": -37.326045989990234, "global_step": 89532, "epoch": 739} {"train_loss": -36.21148681640625, "global_step": 89533, "epoch": 739} {"train_loss": -37.59188461303711, "global_step": 89534, "epoch": 739} {"train_loss": -35.806827545166016, "global_step": 89535, "epoch": 739} {"train_loss": -37.2349967956543, "global_step": 89536, "epoch": 739} {"train_loss": -38.74287033081055, "global_step": 89537, "epoch": 739} {"train_loss": -37.763038635253906, "global_step": 89538, "epoch": 739} {"train_loss": -37.89020122181285, "global_step": 89539, "epoch": 739, "val_loss": 2590410.5} {"train_loss": -38.43149948120117, "global_step": 89540, "epoch": 740} {"train_loss": -37.626800537109375, "global_step": 89541, "epoch": 740} {"train_loss": -37.748016357421875, "global_step": 89542, "epoch": 740} {"train_loss": -37.683570861816406, "global_step": 89543, "epoch": 740} {"train_loss": -36.52854537963867, "global_step": 89544, "epoch": 740} {"train_loss": -36.37984848022461, "global_step": 89545, "epoch": 740} {"train_loss": -38.24819564819336, "global_step": 89546, "epoch": 740} {"train_loss": -37.266456604003906, "global_step": 89547, "epoch": 740} {"train_loss": -37.4376335144043, "global_step": 89548, "epoch": 740} {"train_loss": -38.026241302490234, "global_step": 89549, "epoch": 740} {"train_loss": -37.911285400390625, "global_step": 89550, "epoch": 740} {"train_loss": -38.2039680480957, "global_step": 89551, "epoch": 740} {"train_loss": -37.7274284362793, "global_step": 89552, "epoch": 740} {"train_loss": -38.01665496826172, "global_step": 89553, "epoch": 740} {"train_loss": -37.76070785522461, "global_step": 89554, "epoch": 740} {"train_loss": -38.00154495239258, "global_step": 89555, "epoch": 740} {"train_loss": -37.27143478393555, "global_step": 89556, "epoch": 740} {"train_loss": -38.3017463684082, "global_step": 89557, "epoch": 740} {"train_loss": -37.39897537231445, "global_step": 89558, "epoch": 740} {"train_loss": -38.00764083862305, "global_step": 89559, "epoch": 740} {"train_loss": -38.29010772705078, "global_step": 89560, "epoch": 740} {"train_loss": -37.46099853515625, "global_step": 89561, "epoch": 740} {"train_loss": -38.41813278198242, "global_step": 89562, "epoch": 740} {"train_loss": -37.86638259887695, "global_step": 89563, "epoch": 740} {"train_loss": -38.327392578125, "global_step": 89564, "epoch": 740} {"train_loss": -38.50955581665039, "global_step": 89565, "epoch": 740} {"train_loss": -38.3148307800293, "global_step": 89566, "epoch": 740} {"train_loss": -38.87514877319336, "global_step": 89567, "epoch": 740} {"train_loss": -38.65147018432617, "global_step": 89568, "epoch": 740} {"train_loss": -37.737239837646484, "global_step": 89569, "epoch": 740} {"train_loss": -38.24506378173828, "global_step": 89570, "epoch": 740} {"train_loss": -38.30009078979492, "global_step": 89571, "epoch": 740} {"train_loss": -38.794612884521484, "global_step": 89572, "epoch": 740} {"train_loss": -38.76651382446289, "global_step": 89573, "epoch": 740} {"train_loss": -37.939605712890625, "global_step": 89574, "epoch": 740} {"train_loss": -38.882171630859375, "global_step": 89575, "epoch": 740} {"train_loss": -39.0111083984375, "global_step": 89576, "epoch": 740} {"train_loss": -38.402862548828125, "global_step": 89577, "epoch": 740} {"train_loss": -38.35842514038086, "global_step": 89578, "epoch": 740} {"train_loss": -38.16669464111328, "global_step": 89579, "epoch": 740} {"train_loss": -37.722633361816406, "global_step": 89580, "epoch": 740} {"train_loss": -38.15717315673828, "global_step": 89581, "epoch": 740} {"train_loss": -39.312007904052734, "global_step": 89582, "epoch": 740} {"train_loss": -37.73536682128906, "global_step": 89583, "epoch": 740} {"train_loss": -37.83380889892578, "global_step": 89584, "epoch": 740} {"train_loss": -37.89340591430664, "global_step": 89585, "epoch": 740} {"train_loss": -38.91939926147461, "global_step": 89586, "epoch": 740} {"train_loss": -38.6185188293457, "global_step": 89587, "epoch": 740} {"train_loss": -37.036521911621094, "global_step": 89588, "epoch": 740} {"train_loss": -36.896785736083984, "global_step": 89589, "epoch": 740} {"train_loss": -39.04197311401367, "global_step": 89590, "epoch": 740} {"train_loss": -38.94348907470703, "global_step": 89591, "epoch": 740} {"train_loss": -37.565547943115234, "global_step": 89592, "epoch": 740} {"train_loss": -38.76217269897461, "global_step": 89593, "epoch": 740} {"train_loss": -38.91645431518555, "global_step": 89594, "epoch": 740} {"train_loss": -38.49092483520508, "global_step": 89595, "epoch": 740} {"train_loss": -37.94253921508789, "global_step": 89596, "epoch": 740} {"train_loss": -38.93061828613281, "global_step": 89597, "epoch": 740} {"train_loss": -39.420082092285156, "global_step": 89598, "epoch": 740} {"train_loss": -39.4615478515625, "global_step": 89599, "epoch": 740} {"train_loss": -38.9461555480957, "global_step": 89600, "epoch": 740} {"train_loss": -39.566131591796875, "global_step": 89601, "epoch": 740} {"train_loss": -39.022613525390625, "global_step": 89602, "epoch": 740} {"train_loss": -39.61316680908203, "global_step": 89603, "epoch": 740} {"train_loss": -39.038753509521484, "global_step": 89604, "epoch": 740} {"train_loss": -38.783050537109375, "global_step": 89605, "epoch": 740} {"train_loss": -39.32778549194336, "global_step": 89606, "epoch": 740} {"train_loss": -38.97687530517578, "global_step": 89607, "epoch": 740} {"train_loss": -39.27027893066406, "global_step": 89608, "epoch": 740} {"train_loss": -39.55882263183594, "global_step": 89609, "epoch": 740} {"train_loss": -38.723663330078125, "global_step": 89610, "epoch": 740} {"train_loss": -39.32045364379883, "global_step": 89611, "epoch": 740} {"train_loss": -39.80570983886719, "global_step": 89612, "epoch": 740} {"train_loss": -38.590179443359375, "global_step": 89613, "epoch": 740} {"train_loss": -38.138526916503906, "global_step": 89614, "epoch": 740} {"train_loss": -38.25386428833008, "global_step": 89615, "epoch": 740} {"train_loss": -38.373207092285156, "global_step": 89616, "epoch": 740} {"train_loss": -37.625701904296875, "global_step": 89617, "epoch": 740} {"train_loss": -37.69645309448242, "global_step": 89618, "epoch": 740} {"train_loss": -38.2233772277832, "global_step": 89619, "epoch": 740} {"train_loss": -37.76093673706055, "global_step": 89620, "epoch": 740} {"train_loss": -37.557350158691406, "global_step": 89621, "epoch": 740} {"train_loss": -38.17818832397461, "global_step": 89622, "epoch": 740} {"train_loss": -38.175838470458984, "global_step": 89623, "epoch": 740} {"train_loss": -37.8220100402832, "global_step": 89624, "epoch": 740} {"train_loss": -38.04654312133789, "global_step": 89625, "epoch": 740} {"train_loss": -39.28950881958008, "global_step": 89626, "epoch": 740} {"train_loss": -38.535316467285156, "global_step": 89627, "epoch": 740} {"train_loss": -37.036041259765625, "global_step": 89628, "epoch": 740} {"train_loss": -36.099979400634766, "global_step": 89629, "epoch": 740} {"train_loss": -38.35313034057617, "global_step": 89630, "epoch": 740} {"train_loss": -38.806182861328125, "global_step": 89631, "epoch": 740} {"train_loss": -37.14659881591797, "global_step": 89632, "epoch": 740} {"train_loss": -37.84791946411133, "global_step": 89633, "epoch": 740} {"train_loss": -37.467952728271484, "global_step": 89634, "epoch": 740} {"train_loss": -38.08864974975586, "global_step": 89635, "epoch": 740} {"train_loss": -38.79834747314453, "global_step": 89636, "epoch": 740} {"train_loss": -36.97848129272461, "global_step": 89637, "epoch": 740} {"train_loss": -37.32298278808594, "global_step": 89638, "epoch": 740} {"train_loss": -37.22182846069336, "global_step": 89639, "epoch": 740} {"train_loss": -38.63801193237305, "global_step": 89640, "epoch": 740} {"train_loss": -38.79586410522461, "global_step": 89641, "epoch": 740} {"train_loss": -37.22822189331055, "global_step": 89642, "epoch": 740} {"train_loss": -36.6461296081543, "global_step": 89643, "epoch": 740} {"train_loss": -36.476043701171875, "global_step": 89644, "epoch": 740} {"train_loss": -37.680545806884766, "global_step": 89645, "epoch": 740} {"train_loss": -36.92365646362305, "global_step": 89646, "epoch": 740} {"train_loss": -37.73554229736328, "global_step": 89647, "epoch": 740} {"train_loss": -38.071231842041016, "global_step": 89648, "epoch": 740} {"train_loss": -36.990577697753906, "global_step": 89649, "epoch": 740} {"train_loss": -36.39801788330078, "global_step": 89650, "epoch": 740} {"train_loss": -37.3948860168457, "global_step": 89651, "epoch": 740} {"train_loss": -38.4716682434082, "global_step": 89652, "epoch": 740} {"train_loss": -37.80842971801758, "global_step": 89653, "epoch": 740} {"train_loss": -37.054656982421875, "global_step": 89654, "epoch": 740} {"train_loss": -38.1945686340332, "global_step": 89655, "epoch": 740} {"train_loss": -38.83202362060547, "global_step": 89656, "epoch": 740} {"train_loss": -37.61271667480469, "global_step": 89657, "epoch": 740} {"train_loss": -38.556121826171875, "global_step": 89658, "epoch": 740} {"train_loss": -38.505775451660156, "global_step": 89659, "epoch": 740} {"train_loss": -38.14007902539466, "global_step": 89660, "epoch": 740, "val_loss": 2600785.75} {"train_loss": -39.127899169921875, "global_step": 89661, "epoch": 741} {"train_loss": -37.97683334350586, "global_step": 89662, "epoch": 741} {"train_loss": -38.36129379272461, "global_step": 89663, "epoch": 741} {"train_loss": -38.7691764831543, "global_step": 89664, "epoch": 741} {"train_loss": -39.00141525268555, "global_step": 89665, "epoch": 741} {"train_loss": -38.68349838256836, "global_step": 89666, "epoch": 741} {"train_loss": -38.04880905151367, "global_step": 89667, "epoch": 741} {"train_loss": -38.417259216308594, "global_step": 89668, "epoch": 741} {"train_loss": -39.170528411865234, "global_step": 89669, "epoch": 741} {"train_loss": -39.430625915527344, "global_step": 89670, "epoch": 741} {"train_loss": -38.94865798950195, "global_step": 89671, "epoch": 741} {"train_loss": -38.44780731201172, "global_step": 89672, "epoch": 741} {"train_loss": -38.25973129272461, "global_step": 89673, "epoch": 741} {"train_loss": -39.17354965209961, "global_step": 89674, "epoch": 741} {"train_loss": -38.51169967651367, "global_step": 89675, "epoch": 741} {"train_loss": -38.011077880859375, "global_step": 89676, "epoch": 741} {"train_loss": -38.281368255615234, "global_step": 89677, "epoch": 741} {"train_loss": -38.63854217529297, "global_step": 89678, "epoch": 741} {"train_loss": -38.746437072753906, "global_step": 89679, "epoch": 741} {"train_loss": -38.32957077026367, "global_step": 89680, "epoch": 741} {"train_loss": -37.607723236083984, "global_step": 89681, "epoch": 741} {"train_loss": -34.4113883972168, "global_step": 89682, "epoch": 741} {"train_loss": -33.36262893676758, "global_step": 89683, "epoch": 741} {"train_loss": -38.48474884033203, "global_step": 89684, "epoch": 741} {"train_loss": -38.4431266784668, "global_step": 89685, "epoch": 741} {"train_loss": -36.889923095703125, "global_step": 89686, "epoch": 741} {"train_loss": -36.44318389892578, "global_step": 89687, "epoch": 741} {"train_loss": -35.865413665771484, "global_step": 89688, "epoch": 741} {"train_loss": -37.62709045410156, "global_step": 89689, "epoch": 741} {"train_loss": -39.104347229003906, "global_step": 89690, "epoch": 741} {"train_loss": -35.95054244995117, "global_step": 89691, "epoch": 741} {"train_loss": -35.36347198486328, "global_step": 89692, "epoch": 741} {"train_loss": -37.3228874206543, "global_step": 89693, "epoch": 741} {"train_loss": -38.500423431396484, "global_step": 89694, "epoch": 741} {"train_loss": -36.17123031616211, "global_step": 89695, "epoch": 741} {"train_loss": -36.52982711791992, "global_step": 89696, "epoch": 741} {"train_loss": -38.968013763427734, "global_step": 89697, "epoch": 741} {"train_loss": -37.824344635009766, "global_step": 89698, "epoch": 741} {"train_loss": -38.94569778442383, "global_step": 89699, "epoch": 741} {"train_loss": -38.887672424316406, "global_step": 89700, "epoch": 741} {"train_loss": -38.62485122680664, "global_step": 89701, "epoch": 741} {"train_loss": -39.06775665283203, "global_step": 89702, "epoch": 741} {"train_loss": -38.434547424316406, "global_step": 89703, "epoch": 741} {"train_loss": -39.27368927001953, "global_step": 89704, "epoch": 741} {"train_loss": -39.01007843017578, "global_step": 89705, "epoch": 741} {"train_loss": -39.22874069213867, "global_step": 89706, "epoch": 741} {"train_loss": -38.7762451171875, "global_step": 89707, "epoch": 741} {"train_loss": -39.4550895690918, "global_step": 89708, "epoch": 741} {"train_loss": -39.595821380615234, "global_step": 89709, "epoch": 741} {"train_loss": -39.35312271118164, "global_step": 89710, "epoch": 741} {"train_loss": -39.34613800048828, "global_step": 89711, "epoch": 741} {"train_loss": -39.47257614135742, "global_step": 89712, "epoch": 741} {"train_loss": -39.315277099609375, "global_step": 89713, "epoch": 741} {"train_loss": -39.23119354248047, "global_step": 89714, "epoch": 741} {"train_loss": -39.3017578125, "global_step": 89715, "epoch": 741} {"train_loss": -38.6873664855957, "global_step": 89716, "epoch": 741} {"train_loss": -38.843204498291016, "global_step": 89717, "epoch": 741} {"train_loss": -38.95728302001953, "global_step": 89718, "epoch": 741} {"train_loss": -39.052154541015625, "global_step": 89719, "epoch": 741} {"train_loss": -39.06629943847656, "global_step": 89720, "epoch": 741} {"train_loss": -39.658355712890625, "global_step": 89721, "epoch": 741} {"train_loss": -39.44285202026367, "global_step": 89722, "epoch": 741} {"train_loss": -38.76166915893555, "global_step": 89723, "epoch": 741} {"train_loss": -38.26704025268555, "global_step": 89724, "epoch": 741} {"train_loss": -37.82804489135742, "global_step": 89725, "epoch": 741} {"train_loss": -38.38424301147461, "global_step": 89726, "epoch": 741} {"train_loss": -39.36840057373047, "global_step": 89727, "epoch": 741} {"train_loss": -39.58864212036133, "global_step": 89728, "epoch": 741} {"train_loss": -39.315467834472656, "global_step": 89729, "epoch": 741} {"train_loss": -39.1241340637207, "global_step": 89730, "epoch": 741} {"train_loss": -38.50346755981445, "global_step": 89731, "epoch": 741} {"train_loss": -38.248512268066406, "global_step": 89732, "epoch": 741} {"train_loss": -37.589656829833984, "global_step": 89733, "epoch": 741} {"train_loss": -38.68343734741211, "global_step": 89734, "epoch": 741} {"train_loss": -38.813018798828125, "global_step": 89735, "epoch": 741} {"train_loss": -39.396114349365234, "global_step": 89736, "epoch": 741} {"train_loss": -37.60883712768555, "global_step": 89737, "epoch": 741} {"train_loss": -36.49735641479492, "global_step": 89738, "epoch": 741} {"train_loss": -34.890350341796875, "global_step": 89739, "epoch": 741} {"train_loss": -36.85247039794922, "global_step": 89740, "epoch": 741} {"train_loss": -37.36439895629883, "global_step": 89741, "epoch": 741} {"train_loss": -37.31373977661133, "global_step": 89742, "epoch": 741} {"train_loss": -36.0571174621582, "global_step": 89743, "epoch": 741} {"train_loss": -36.77580642700195, "global_step": 89744, "epoch": 741} {"train_loss": -36.556522369384766, "global_step": 89745, "epoch": 741} {"train_loss": -36.82603073120117, "global_step": 89746, "epoch": 741} {"train_loss": -34.433753967285156, "global_step": 89747, "epoch": 741} {"train_loss": -33.45119857788086, "global_step": 89748, "epoch": 741} {"train_loss": -29.96722412109375, "global_step": 89749, "epoch": 741} {"train_loss": -32.167030334472656, "global_step": 89750, "epoch": 741} {"train_loss": -27.97711753845215, "global_step": 89751, "epoch": 741} {"train_loss": -34.3451042175293, "global_step": 89752, "epoch": 741} {"train_loss": -28.870635986328125, "global_step": 89753, "epoch": 741} {"train_loss": -33.0665397644043, "global_step": 89754, "epoch": 741} {"train_loss": -31.79266929626465, "global_step": 89755, "epoch": 741} {"train_loss": -33.584659576416016, "global_step": 89756, "epoch": 741} {"train_loss": -33.4510383605957, "global_step": 89757, "epoch": 741} {"train_loss": -35.17903137207031, "global_step": 89758, "epoch": 741} {"train_loss": -34.97845458984375, "global_step": 89759, "epoch": 741} {"train_loss": -34.400970458984375, "global_step": 89760, "epoch": 741} {"train_loss": -35.1683464050293, "global_step": 89761, "epoch": 741} {"train_loss": -33.62128448486328, "global_step": 89762, "epoch": 741} {"train_loss": -35.77669906616211, "global_step": 89763, "epoch": 741} {"train_loss": -33.77010726928711, "global_step": 89764, "epoch": 741} {"train_loss": -35.8870964050293, "global_step": 89765, "epoch": 741} {"train_loss": -33.69782257080078, "global_step": 89766, "epoch": 741} {"train_loss": -36.31929397583008, "global_step": 89767, "epoch": 741} {"train_loss": -35.59274673461914, "global_step": 89768, "epoch": 741} {"train_loss": -36.23991012573242, "global_step": 89769, "epoch": 741} {"train_loss": -36.32585525512695, "global_step": 89770, "epoch": 741} {"train_loss": -36.041908264160156, "global_step": 89771, "epoch": 741} {"train_loss": -37.91703414916992, "global_step": 89772, "epoch": 741} {"train_loss": -35.599849700927734, "global_step": 89773, "epoch": 741} {"train_loss": -36.76943588256836, "global_step": 89774, "epoch": 741} {"train_loss": -37.715938568115234, "global_step": 89775, "epoch": 741} {"train_loss": -35.815765380859375, "global_step": 89776, "epoch": 741} {"train_loss": -37.58354187011719, "global_step": 89777, "epoch": 741} {"train_loss": -38.115108489990234, "global_step": 89778, "epoch": 741} {"train_loss": -36.71245193481445, "global_step": 89779, "epoch": 741} {"train_loss": -37.67338180541992, "global_step": 89780, "epoch": 741} {"train_loss": -37.21220675381747, "global_step": 89781, "epoch": 741, "val_loss": 2599742.0} {"train_loss": -37.41874694824219, "global_step": 89782, "epoch": 742} {"train_loss": -37.24092102050781, "global_step": 89783, "epoch": 742} {"train_loss": -38.02019119262695, "global_step": 89784, "epoch": 742} {"train_loss": -38.04120635986328, "global_step": 89785, "epoch": 742} {"train_loss": -37.78287887573242, "global_step": 89786, "epoch": 742} {"train_loss": -38.25155258178711, "global_step": 89787, "epoch": 742} {"train_loss": -38.29238510131836, "global_step": 89788, "epoch": 742} {"train_loss": -38.35368728637695, "global_step": 89789, "epoch": 742} {"train_loss": -37.854591369628906, "global_step": 89790, "epoch": 742} {"train_loss": -38.1495361328125, "global_step": 89791, "epoch": 742} {"train_loss": -38.536319732666016, "global_step": 89792, "epoch": 742} {"train_loss": -38.29276657104492, "global_step": 89793, "epoch": 742} {"train_loss": -38.42971420288086, "global_step": 89794, "epoch": 742} {"train_loss": -38.332454681396484, "global_step": 89795, "epoch": 742} {"train_loss": -38.67512512207031, "global_step": 89796, "epoch": 742} {"train_loss": -38.54114532470703, "global_step": 89797, "epoch": 742} {"train_loss": -38.23738098144531, "global_step": 89798, "epoch": 742} {"train_loss": -38.44464111328125, "global_step": 89799, "epoch": 742} {"train_loss": -38.721656799316406, "global_step": 89800, "epoch": 742} {"train_loss": -38.64652633666992, "global_step": 89801, "epoch": 742} {"train_loss": -38.479976654052734, "global_step": 89802, "epoch": 742} {"train_loss": -38.664161682128906, "global_step": 89803, "epoch": 742} {"train_loss": -39.0197868347168, "global_step": 89804, "epoch": 742} {"train_loss": -38.47065353393555, "global_step": 89805, "epoch": 742} {"train_loss": -38.77375411987305, "global_step": 89806, "epoch": 742} {"train_loss": -38.51735305786133, "global_step": 89807, "epoch": 742} {"train_loss": -38.44100570678711, "global_step": 89808, "epoch": 742} {"train_loss": -39.30048751831055, "global_step": 89809, "epoch": 742} {"train_loss": -39.08961486816406, "global_step": 89810, "epoch": 742} {"train_loss": -39.291282653808594, "global_step": 89811, "epoch": 742} {"train_loss": -39.028717041015625, "global_step": 89812, "epoch": 742} {"train_loss": -39.604984283447266, "global_step": 89813, "epoch": 742} {"train_loss": -39.412628173828125, "global_step": 89814, "epoch": 742} {"train_loss": -39.31318664550781, "global_step": 89815, "epoch": 742} {"train_loss": -39.4857063293457, "global_step": 89816, "epoch": 742} {"train_loss": -39.22490310668945, "global_step": 89817, "epoch": 742} {"train_loss": -39.439796447753906, "global_step": 89818, "epoch": 742} {"train_loss": -39.62635040283203, "global_step": 89819, "epoch": 742} {"train_loss": -39.4157829284668, "global_step": 89820, "epoch": 742} {"train_loss": -39.124610900878906, "global_step": 89821, "epoch": 742} {"train_loss": -39.16342544555664, "global_step": 89822, "epoch": 742} {"train_loss": -39.65768814086914, "global_step": 89823, "epoch": 742} {"train_loss": -38.61712646484375, "global_step": 89824, "epoch": 742} {"train_loss": -39.07481002807617, "global_step": 89825, "epoch": 742} {"train_loss": -39.07888412475586, "global_step": 89826, "epoch": 742} {"train_loss": -39.477291107177734, "global_step": 89827, "epoch": 742} {"train_loss": -39.52093505859375, "global_step": 89828, "epoch": 742} {"train_loss": -39.17413330078125, "global_step": 89829, "epoch": 742} {"train_loss": -39.61017608642578, "global_step": 89830, "epoch": 742} {"train_loss": -39.58018112182617, "global_step": 89831, "epoch": 742} {"train_loss": -39.0498161315918, "global_step": 89832, "epoch": 742} {"train_loss": -39.72904968261719, "global_step": 89833, "epoch": 742} {"train_loss": -39.459266662597656, "global_step": 89834, "epoch": 742} {"train_loss": -39.026397705078125, "global_step": 89835, "epoch": 742} {"train_loss": -39.12972640991211, "global_step": 89836, "epoch": 742} {"train_loss": -39.042991638183594, "global_step": 89837, "epoch": 742} {"train_loss": -39.424373626708984, "global_step": 89838, "epoch": 742} {"train_loss": -39.41743087768555, "global_step": 89839, "epoch": 742} {"train_loss": -39.362178802490234, "global_step": 89840, "epoch": 742} {"train_loss": -38.67145919799805, "global_step": 89841, "epoch": 742} {"train_loss": -38.541908264160156, "global_step": 89842, "epoch": 742} {"train_loss": -37.395503997802734, "global_step": 89843, "epoch": 742} {"train_loss": -37.51618576049805, "global_step": 89844, "epoch": 742} {"train_loss": -36.311580657958984, "global_step": 89845, "epoch": 742} {"train_loss": -36.265235900878906, "global_step": 89846, "epoch": 742} {"train_loss": -36.98755645751953, "global_step": 89847, "epoch": 742} {"train_loss": -38.27490997314453, "global_step": 89848, "epoch": 742} {"train_loss": -35.316524505615234, "global_step": 89849, "epoch": 742} {"train_loss": -33.85512924194336, "global_step": 89850, "epoch": 742} {"train_loss": -37.42334747314453, "global_step": 89851, "epoch": 742} {"train_loss": -31.5773983001709, "global_step": 89852, "epoch": 742} {"train_loss": -35.52925491333008, "global_step": 89853, "epoch": 742} {"train_loss": -30.64862060546875, "global_step": 89854, "epoch": 742} {"train_loss": -32.264286041259766, "global_step": 89855, "epoch": 742} {"train_loss": -35.45622634887695, "global_step": 89856, "epoch": 742} {"train_loss": -33.84779739379883, "global_step": 89857, "epoch": 742} {"train_loss": -37.836158752441406, "global_step": 89858, "epoch": 742} {"train_loss": -34.25379180908203, "global_step": 89859, "epoch": 742} {"train_loss": -37.00405502319336, "global_step": 89860, "epoch": 742} {"train_loss": -34.920814514160156, "global_step": 89861, "epoch": 742} {"train_loss": -37.826881408691406, "global_step": 89862, "epoch": 742} {"train_loss": -37.049312591552734, "global_step": 89863, "epoch": 742} {"train_loss": -37.44169998168945, "global_step": 89864, "epoch": 742} {"train_loss": -38.3221321105957, "global_step": 89865, "epoch": 742} {"train_loss": -37.507789611816406, "global_step": 89866, "epoch": 742} {"train_loss": -37.91133499145508, "global_step": 89867, "epoch": 742} {"train_loss": -38.40293502807617, "global_step": 89868, "epoch": 742} {"train_loss": -37.85592269897461, "global_step": 89869, "epoch": 742} {"train_loss": -38.07978057861328, "global_step": 89870, "epoch": 742} {"train_loss": -38.54232406616211, "global_step": 89871, "epoch": 742} {"train_loss": -37.85988998413086, "global_step": 89872, "epoch": 742} {"train_loss": -38.2996940612793, "global_step": 89873, "epoch": 742} {"train_loss": -38.75637435913086, "global_step": 89874, "epoch": 742} {"train_loss": -38.16387939453125, "global_step": 89875, "epoch": 742} {"train_loss": -38.73780059814453, "global_step": 89876, "epoch": 742} {"train_loss": -38.85514450073242, "global_step": 89877, "epoch": 742} {"train_loss": -38.32636642456055, "global_step": 89878, "epoch": 742} {"train_loss": -38.548248291015625, "global_step": 89879, "epoch": 742} {"train_loss": -38.799041748046875, "global_step": 89880, "epoch": 742} {"train_loss": -38.40749740600586, "global_step": 89881, "epoch": 742} {"train_loss": -38.37655258178711, "global_step": 89882, "epoch": 742} {"train_loss": -38.603248596191406, "global_step": 89883, "epoch": 742} {"train_loss": -38.95742416381836, "global_step": 89884, "epoch": 742} {"train_loss": -38.59225082397461, "global_step": 89885, "epoch": 742} {"train_loss": -39.02365493774414, "global_step": 89886, "epoch": 742} {"train_loss": -38.72282028198242, "global_step": 89887, "epoch": 742} {"train_loss": -38.43058395385742, "global_step": 89888, "epoch": 742} {"train_loss": -38.82112503051758, "global_step": 89889, "epoch": 742} {"train_loss": -38.87456512451172, "global_step": 89890, "epoch": 742} {"train_loss": -38.77825164794922, "global_step": 89891, "epoch": 742} {"train_loss": -39.27546691894531, "global_step": 89892, "epoch": 742} {"train_loss": -39.011451721191406, "global_step": 89893, "epoch": 742} {"train_loss": -38.70521545410156, "global_step": 89894, "epoch": 742} {"train_loss": -38.89219284057617, "global_step": 89895, "epoch": 742} {"train_loss": -38.4578857421875, "global_step": 89896, "epoch": 742} {"train_loss": -38.578060150146484, "global_step": 89897, "epoch": 742} {"train_loss": -39.1082878112793, "global_step": 89898, "epoch": 742} {"train_loss": -39.011817932128906, "global_step": 89899, "epoch": 742} {"train_loss": -38.62623977661133, "global_step": 89900, "epoch": 742} {"train_loss": -38.58743667602539, "global_step": 89901, "epoch": 742} {"train_loss": -38.18098697189457, "global_step": 89902, "epoch": 742, "val_loss": 2595944.25} {"train_loss": -38.70864486694336, "global_step": 89903, "epoch": 743} {"train_loss": -38.91697692871094, "global_step": 89904, "epoch": 743} {"train_loss": -37.73934555053711, "global_step": 89905, "epoch": 743} {"train_loss": -36.08517074584961, "global_step": 89906, "epoch": 743} {"train_loss": -34.316375732421875, "global_step": 89907, "epoch": 743} {"train_loss": -37.89527130126953, "global_step": 89908, "epoch": 743} {"train_loss": -38.27405548095703, "global_step": 89909, "epoch": 743} {"train_loss": -35.011878967285156, "global_step": 89910, "epoch": 743} {"train_loss": -36.870784759521484, "global_step": 89911, "epoch": 743} {"train_loss": -38.22794723510742, "global_step": 89912, "epoch": 743} {"train_loss": -37.30168914794922, "global_step": 89913, "epoch": 743} {"train_loss": -37.63371658325195, "global_step": 89914, "epoch": 743} {"train_loss": -38.455291748046875, "global_step": 89915, "epoch": 743} {"train_loss": -38.86214065551758, "global_step": 89916, "epoch": 743} {"train_loss": -38.346900939941406, "global_step": 89917, "epoch": 743} {"train_loss": -37.09589385986328, "global_step": 89918, "epoch": 743} {"train_loss": -37.0251579284668, "global_step": 89919, "epoch": 743} {"train_loss": -37.71480178833008, "global_step": 89920, "epoch": 743} {"train_loss": -37.0010871887207, "global_step": 89921, "epoch": 743} {"train_loss": -37.07004928588867, "global_step": 89922, "epoch": 743} {"train_loss": -38.54920959472656, "global_step": 89923, "epoch": 743} {"train_loss": -38.749813079833984, "global_step": 89924, "epoch": 743} {"train_loss": -36.88614273071289, "global_step": 89925, "epoch": 743} {"train_loss": -36.21084213256836, "global_step": 89926, "epoch": 743} {"train_loss": -37.90325164794922, "global_step": 89927, "epoch": 743} {"train_loss": -38.51615524291992, "global_step": 89928, "epoch": 743} {"train_loss": -35.18484115600586, "global_step": 89929, "epoch": 743} {"train_loss": -37.01871871948242, "global_step": 89930, "epoch": 743} {"train_loss": -39.01459884643555, "global_step": 89931, "epoch": 743} {"train_loss": -36.101131439208984, "global_step": 89932, "epoch": 743} {"train_loss": -37.729454040527344, "global_step": 89933, "epoch": 743} {"train_loss": -39.17915725708008, "global_step": 89934, "epoch": 743} {"train_loss": -36.33036422729492, "global_step": 89935, "epoch": 743} {"train_loss": -39.255027770996094, "global_step": 89936, "epoch": 743} {"train_loss": -37.2296142578125, "global_step": 89937, "epoch": 743} {"train_loss": -38.73051834106445, "global_step": 89938, "epoch": 743} {"train_loss": -36.819305419921875, "global_step": 89939, "epoch": 743} {"train_loss": -37.7531852722168, "global_step": 89940, "epoch": 743} {"train_loss": -37.31582260131836, "global_step": 89941, "epoch": 743} {"train_loss": -38.01324462890625, "global_step": 89942, "epoch": 743} {"train_loss": -38.41743850708008, "global_step": 89943, "epoch": 743} {"train_loss": -38.263668060302734, "global_step": 89944, "epoch": 743} {"train_loss": -38.4715576171875, "global_step": 89945, "epoch": 743} {"train_loss": -38.31510543823242, "global_step": 89946, "epoch": 743} {"train_loss": -38.874996185302734, "global_step": 89947, "epoch": 743} {"train_loss": -39.02065658569336, "global_step": 89948, "epoch": 743} {"train_loss": -38.376861572265625, "global_step": 89949, "epoch": 743} {"train_loss": -38.28385543823242, "global_step": 89950, "epoch": 743} {"train_loss": -38.57210159301758, "global_step": 89951, "epoch": 743} {"train_loss": -38.17189407348633, "global_step": 89952, "epoch": 743} {"train_loss": -36.9114875793457, "global_step": 89953, "epoch": 743} {"train_loss": -38.2671012878418, "global_step": 89954, "epoch": 743} {"train_loss": -39.01209259033203, "global_step": 89955, "epoch": 743} {"train_loss": -37.765052795410156, "global_step": 89956, "epoch": 743} {"train_loss": -37.840484619140625, "global_step": 89957, "epoch": 743} {"train_loss": -39.00532150268555, "global_step": 89958, "epoch": 743} {"train_loss": -37.69137191772461, "global_step": 89959, "epoch": 743} {"train_loss": -37.564937591552734, "global_step": 89960, "epoch": 743} {"train_loss": -38.10915756225586, "global_step": 89961, "epoch": 743} {"train_loss": -37.82223129272461, "global_step": 89962, "epoch": 743} {"train_loss": -38.45863723754883, "global_step": 89963, "epoch": 743} {"train_loss": -37.70107650756836, "global_step": 89964, "epoch": 743} {"train_loss": -38.124839782714844, "global_step": 89965, "epoch": 743} {"train_loss": -38.90107345581055, "global_step": 89966, "epoch": 743} {"train_loss": -38.0670166015625, "global_step": 89967, "epoch": 743} {"train_loss": -38.6906623840332, "global_step": 89968, "epoch": 743} {"train_loss": -38.37912368774414, "global_step": 89969, "epoch": 743} {"train_loss": -38.97172164916992, "global_step": 89970, "epoch": 743} {"train_loss": -38.937347412109375, "global_step": 89971, "epoch": 743} {"train_loss": -38.46393966674805, "global_step": 89972, "epoch": 743} {"train_loss": -38.95302200317383, "global_step": 89973, "epoch": 743} {"train_loss": -37.6624755859375, "global_step": 89974, "epoch": 743} {"train_loss": -34.35184097290039, "global_step": 89975, "epoch": 743} {"train_loss": -37.82877731323242, "global_step": 89976, "epoch": 743} {"train_loss": -38.182350158691406, "global_step": 89977, "epoch": 743} {"train_loss": -35.83665084838867, "global_step": 89978, "epoch": 743} {"train_loss": -33.291255950927734, "global_step": 89979, "epoch": 743} {"train_loss": -35.239837646484375, "global_step": 89980, "epoch": 743} {"train_loss": -33.24318313598633, "global_step": 89981, "epoch": 743} {"train_loss": -36.83079147338867, "global_step": 89982, "epoch": 743} {"train_loss": -34.865989685058594, "global_step": 89983, "epoch": 743} {"train_loss": -36.10737228393555, "global_step": 89984, "epoch": 743} {"train_loss": -35.78959274291992, "global_step": 89985, "epoch": 743} {"train_loss": -37.23165512084961, "global_step": 89986, "epoch": 743} {"train_loss": -35.746273040771484, "global_step": 89987, "epoch": 743} {"train_loss": -35.893184661865234, "global_step": 89988, "epoch": 743} {"train_loss": -37.316009521484375, "global_step": 89989, "epoch": 743} {"train_loss": -37.14299392700195, "global_step": 89990, "epoch": 743} {"train_loss": -35.64580154418945, "global_step": 89991, "epoch": 743} {"train_loss": -37.56344223022461, "global_step": 89992, "epoch": 743} {"train_loss": -35.96561813354492, "global_step": 89993, "epoch": 743} {"train_loss": -38.1554069519043, "global_step": 89994, "epoch": 743} {"train_loss": -36.605369567871094, "global_step": 89995, "epoch": 743} {"train_loss": -37.440452575683594, "global_step": 89996, "epoch": 743} {"train_loss": -37.75636672973633, "global_step": 89997, "epoch": 743} {"train_loss": -38.35437774658203, "global_step": 89998, "epoch": 743} {"train_loss": -38.29010009765625, "global_step": 89999, "epoch": 743} {"train_loss": -38.1318473815918, "global_step": 90000, "epoch": 743} {"train_loss": -39.2348747253418, "global_step": 90001, "epoch": 743} {"train_loss": -38.20907211303711, "global_step": 90002, "epoch": 743} {"train_loss": -38.502254486083984, "global_step": 90003, "epoch": 743} {"train_loss": -38.956539154052734, "global_step": 90004, "epoch": 743} {"train_loss": -38.233306884765625, "global_step": 90005, "epoch": 743} {"train_loss": -38.629249572753906, "global_step": 90006, "epoch": 743} {"train_loss": -39.30333709716797, "global_step": 90007, "epoch": 743} {"train_loss": -38.52061080932617, "global_step": 90008, "epoch": 743} {"train_loss": -38.8202018737793, "global_step": 90009, "epoch": 743} {"train_loss": -38.4509391784668, "global_step": 90010, "epoch": 743} {"train_loss": -38.21401596069336, "global_step": 90011, "epoch": 743} {"train_loss": -38.84316635131836, "global_step": 90012, "epoch": 743} {"train_loss": -38.537574768066406, "global_step": 90013, "epoch": 743} {"train_loss": -38.54246139526367, "global_step": 90014, "epoch": 743} {"train_loss": -38.5625114440918, "global_step": 90015, "epoch": 743} {"train_loss": -38.48002624511719, "global_step": 90016, "epoch": 743} {"train_loss": -38.486602783203125, "global_step": 90017, "epoch": 743} {"train_loss": -39.0433349609375, "global_step": 90018, "epoch": 743} {"train_loss": -39.05055236816406, "global_step": 90019, "epoch": 743} {"train_loss": -38.819053649902344, "global_step": 90020, "epoch": 743} {"train_loss": -38.97509002685547, "global_step": 90021, "epoch": 743} {"train_loss": -38.309478759765625, "global_step": 90022, "epoch": 743} {"train_loss": -37.730396365331224, "global_step": 90023, "epoch": 743, "val_loss": 2616751.75} {"train_loss": -39.96138381958008, "global_step": 90024, "epoch": 744} {"train_loss": -39.34613800048828, "global_step": 90025, "epoch": 744} {"train_loss": -39.00492858886719, "global_step": 90026, "epoch": 744} {"train_loss": -39.279273986816406, "global_step": 90027, "epoch": 744} {"train_loss": -39.19951629638672, "global_step": 90028, "epoch": 744} {"train_loss": -38.83120346069336, "global_step": 90029, "epoch": 744} {"train_loss": -38.757869720458984, "global_step": 90030, "epoch": 744} {"train_loss": -38.155555725097656, "global_step": 90031, "epoch": 744} {"train_loss": -37.81016159057617, "global_step": 90032, "epoch": 744} {"train_loss": -38.3170051574707, "global_step": 90033, "epoch": 744} {"train_loss": -38.18802261352539, "global_step": 90034, "epoch": 744} {"train_loss": -38.46281051635742, "global_step": 90035, "epoch": 744} {"train_loss": -38.32456588745117, "global_step": 90036, "epoch": 744} {"train_loss": -38.96857452392578, "global_step": 90037, "epoch": 744} {"train_loss": -38.558387756347656, "global_step": 90038, "epoch": 744} {"train_loss": -38.38682556152344, "global_step": 90039, "epoch": 744} {"train_loss": -38.77219772338867, "global_step": 90040, "epoch": 744} {"train_loss": -38.80861282348633, "global_step": 90041, "epoch": 744} {"train_loss": -38.869380950927734, "global_step": 90042, "epoch": 744} {"train_loss": -38.75106430053711, "global_step": 90043, "epoch": 744} {"train_loss": -38.57855224609375, "global_step": 90044, "epoch": 744} {"train_loss": -39.34956741333008, "global_step": 90045, "epoch": 744} {"train_loss": -38.407772064208984, "global_step": 90046, "epoch": 744} {"train_loss": -38.111366271972656, "global_step": 90047, "epoch": 744} {"train_loss": -38.39496612548828, "global_step": 90048, "epoch": 744} {"train_loss": -39.447479248046875, "global_step": 90049, "epoch": 744} {"train_loss": -37.87549591064453, "global_step": 90050, "epoch": 744} {"train_loss": -38.625335693359375, "global_step": 90051, "epoch": 744} {"train_loss": -39.176815032958984, "global_step": 90052, "epoch": 744} {"train_loss": -37.05826950073242, "global_step": 90053, "epoch": 744} {"train_loss": -34.907073974609375, "global_step": 90054, "epoch": 744} {"train_loss": -37.634578704833984, "global_step": 90055, "epoch": 744} {"train_loss": -33.804622650146484, "global_step": 90056, "epoch": 744} {"train_loss": -35.78229904174805, "global_step": 90057, "epoch": 744} {"train_loss": -33.588619232177734, "global_step": 90058, "epoch": 744} {"train_loss": -35.5081901550293, "global_step": 90059, "epoch": 744} {"train_loss": -30.196186065673828, "global_step": 90060, "epoch": 744} {"train_loss": -31.858795166015625, "global_step": 90061, "epoch": 744} {"train_loss": -32.352020263671875, "global_step": 90062, "epoch": 744} {"train_loss": -33.46241760253906, "global_step": 90063, "epoch": 744} {"train_loss": -27.318246841430664, "global_step": 90064, "epoch": 744} {"train_loss": -29.735858917236328, "global_step": 90065, "epoch": 744} {"train_loss": -31.33709716796875, "global_step": 90066, "epoch": 744} {"train_loss": -33.32692337036133, "global_step": 90067, "epoch": 744} {"train_loss": -34.643898010253906, "global_step": 90068, "epoch": 744} {"train_loss": -33.24732208251953, "global_step": 90069, "epoch": 744} {"train_loss": -35.793701171875, "global_step": 90070, "epoch": 744} {"train_loss": -32.915374755859375, "global_step": 90071, "epoch": 744} {"train_loss": -35.693939208984375, "global_step": 90072, "epoch": 744} {"train_loss": -36.15790939331055, "global_step": 90073, "epoch": 744} {"train_loss": -32.17523193359375, "global_step": 90074, "epoch": 744} {"train_loss": -35.84343719482422, "global_step": 90075, "epoch": 744} {"train_loss": -35.48503494262695, "global_step": 90076, "epoch": 744} {"train_loss": -35.58949661254883, "global_step": 90077, "epoch": 744} {"train_loss": -35.28623962402344, "global_step": 90078, "epoch": 744} {"train_loss": -36.53298568725586, "global_step": 90079, "epoch": 744} {"train_loss": -34.383094787597656, "global_step": 90080, "epoch": 744} {"train_loss": -36.06678009033203, "global_step": 90081, "epoch": 744} {"train_loss": -36.66996383666992, "global_step": 90082, "epoch": 744} {"train_loss": -37.12765884399414, "global_step": 90083, "epoch": 744} {"train_loss": -36.85207748413086, "global_step": 90084, "epoch": 744} {"train_loss": -37.10758972167969, "global_step": 90085, "epoch": 744} {"train_loss": -36.005489349365234, "global_step": 90086, "epoch": 744} {"train_loss": -34.193504333496094, "global_step": 90087, "epoch": 744} {"train_loss": -35.355098724365234, "global_step": 90088, "epoch": 744} {"train_loss": -36.58802032470703, "global_step": 90089, "epoch": 744} {"train_loss": -36.94197463989258, "global_step": 90090, "epoch": 744} {"train_loss": -37.259681701660156, "global_step": 90091, "epoch": 744} {"train_loss": -37.33327102661133, "global_step": 90092, "epoch": 744} {"train_loss": -36.42847442626953, "global_step": 90093, "epoch": 744} {"train_loss": -36.829933166503906, "global_step": 90094, "epoch": 744} {"train_loss": -37.78384017944336, "global_step": 90095, "epoch": 744} {"train_loss": -37.31849670410156, "global_step": 90096, "epoch": 744} {"train_loss": -37.34027862548828, "global_step": 90097, "epoch": 744} {"train_loss": -37.012237548828125, "global_step": 90098, "epoch": 744} {"train_loss": -37.68951416015625, "global_step": 90099, "epoch": 744} {"train_loss": -36.55255126953125, "global_step": 90100, "epoch": 744} {"train_loss": -37.74951171875, "global_step": 90101, "epoch": 744} {"train_loss": -37.56476974487305, "global_step": 90102, "epoch": 744} {"train_loss": -37.17915344238281, "global_step": 90103, "epoch": 744} {"train_loss": -37.81816482543945, "global_step": 90104, "epoch": 744} {"train_loss": -37.705780029296875, "global_step": 90105, "epoch": 744} {"train_loss": -37.952816009521484, "global_step": 90106, "epoch": 744} {"train_loss": -38.00130844116211, "global_step": 90107, "epoch": 744} {"train_loss": -37.947052001953125, "global_step": 90108, "epoch": 744} {"train_loss": -37.78887939453125, "global_step": 90109, "epoch": 744} {"train_loss": -38.19373321533203, "global_step": 90110, "epoch": 744} {"train_loss": -37.895751953125, "global_step": 90111, "epoch": 744} {"train_loss": -38.2177848815918, "global_step": 90112, "epoch": 744} {"train_loss": -37.602272033691406, "global_step": 90113, "epoch": 744} {"train_loss": -38.69840621948242, "global_step": 90114, "epoch": 744} {"train_loss": -38.29319763183594, "global_step": 90115, "epoch": 744} {"train_loss": -38.375457763671875, "global_step": 90116, "epoch": 744} {"train_loss": -38.09092712402344, "global_step": 90117, "epoch": 744} {"train_loss": -38.253902435302734, "global_step": 90118, "epoch": 744} {"train_loss": -38.30463790893555, "global_step": 90119, "epoch": 744} {"train_loss": -38.30535125732422, "global_step": 90120, "epoch": 744} {"train_loss": -38.2799072265625, "global_step": 90121, "epoch": 744} {"train_loss": -38.333740234375, "global_step": 90122, "epoch": 744} {"train_loss": -37.94422149658203, "global_step": 90123, "epoch": 744} {"train_loss": -38.920265197753906, "global_step": 90124, "epoch": 744} {"train_loss": -38.393550872802734, "global_step": 90125, "epoch": 744} {"train_loss": -38.506561279296875, "global_step": 90126, "epoch": 744} {"train_loss": -38.70256423950195, "global_step": 90127, "epoch": 744} {"train_loss": -38.916439056396484, "global_step": 90128, "epoch": 744} {"train_loss": -38.9769401550293, "global_step": 90129, "epoch": 744} {"train_loss": -39.12795639038086, "global_step": 90130, "epoch": 744} {"train_loss": -38.908138275146484, "global_step": 90131, "epoch": 744} {"train_loss": -38.45842361450195, "global_step": 90132, "epoch": 744} {"train_loss": -37.98719024658203, "global_step": 90133, "epoch": 744} {"train_loss": -38.74857711791992, "global_step": 90134, "epoch": 744} {"train_loss": -37.67095947265625, "global_step": 90135, "epoch": 744} {"train_loss": -34.44656753540039, "global_step": 90136, "epoch": 744} {"train_loss": -38.191280364990234, "global_step": 90137, "epoch": 744} {"train_loss": -31.3796443939209, "global_step": 90138, "epoch": 744} {"train_loss": -30.877416610717773, "global_step": 90139, "epoch": 744} {"train_loss": -32.951602935791016, "global_step": 90140, "epoch": 744} {"train_loss": -31.89041519165039, "global_step": 90141, "epoch": 744} {"train_loss": -33.26432418823242, "global_step": 90142, "epoch": 744} {"train_loss": -31.648096084594727, "global_step": 90143, "epoch": 744} {"train_loss": -36.73044163727563, "global_step": 90144, "epoch": 744, "val_loss": 2583406.0} {"train_loss": -34.177345275878906, "global_step": 90145, "epoch": 745} {"train_loss": -33.70124053955078, "global_step": 90146, "epoch": 745} {"train_loss": -32.836978912353516, "global_step": 90147, "epoch": 745} {"train_loss": -33.14689254760742, "global_step": 90148, "epoch": 745} {"train_loss": -34.31309509277344, "global_step": 90149, "epoch": 745} {"train_loss": -34.24711990356445, "global_step": 90150, "epoch": 745} {"train_loss": -34.193355560302734, "global_step": 90151, "epoch": 745} {"train_loss": -34.33140182495117, "global_step": 90152, "epoch": 745} {"train_loss": -34.30171203613281, "global_step": 90153, "epoch": 745} {"train_loss": -34.93027877807617, "global_step": 90154, "epoch": 745} {"train_loss": -35.21098709106445, "global_step": 90155, "epoch": 745} {"train_loss": -35.579891204833984, "global_step": 90156, "epoch": 745} {"train_loss": -35.369258880615234, "global_step": 90157, "epoch": 745} {"train_loss": -35.778106689453125, "global_step": 90158, "epoch": 745} {"train_loss": -35.20478439331055, "global_step": 90159, "epoch": 745} {"train_loss": -36.04920959472656, "global_step": 90160, "epoch": 745} {"train_loss": -35.93980026245117, "global_step": 90161, "epoch": 745} {"train_loss": -36.498069763183594, "global_step": 90162, "epoch": 745} {"train_loss": -36.53302764892578, "global_step": 90163, "epoch": 745} {"train_loss": -36.354644775390625, "global_step": 90164, "epoch": 745} {"train_loss": -35.15497970581055, "global_step": 90165, "epoch": 745} {"train_loss": -32.99703598022461, "global_step": 90166, "epoch": 745} {"train_loss": -31.49823570251465, "global_step": 90167, "epoch": 745} {"train_loss": -34.3095817565918, "global_step": 90168, "epoch": 745} {"train_loss": -34.591339111328125, "global_step": 90169, "epoch": 745} {"train_loss": -35.46818161010742, "global_step": 90170, "epoch": 745} {"train_loss": -36.761940002441406, "global_step": 90171, "epoch": 745} {"train_loss": -35.19973373413086, "global_step": 90172, "epoch": 745} {"train_loss": -32.397804260253906, "global_step": 90173, "epoch": 745} {"train_loss": -24.296384811401367, "global_step": 90174, "epoch": 745} {"train_loss": -36.03532791137695, "global_step": 90175, "epoch": 745} {"train_loss": -30.010107040405273, "global_step": 90176, "epoch": 745} {"train_loss": -36.5472297668457, "global_step": 90177, "epoch": 745} {"train_loss": -31.805601119995117, "global_step": 90178, "epoch": 745} {"train_loss": -34.84110641479492, "global_step": 90179, "epoch": 745} {"train_loss": -34.932186126708984, "global_step": 90180, "epoch": 745} {"train_loss": -33.82137680053711, "global_step": 90181, "epoch": 745} {"train_loss": -35.66748809814453, "global_step": 90182, "epoch": 745} {"train_loss": -33.9174919128418, "global_step": 90183, "epoch": 745} {"train_loss": -35.15847396850586, "global_step": 90184, "epoch": 745} {"train_loss": -36.25345993041992, "global_step": 90185, "epoch": 745} {"train_loss": -35.24605941772461, "global_step": 90186, "epoch": 745} {"train_loss": -35.688026428222656, "global_step": 90187, "epoch": 745} {"train_loss": -36.82419967651367, "global_step": 90188, "epoch": 745} {"train_loss": -35.82754135131836, "global_step": 90189, "epoch": 745} {"train_loss": -35.66805648803711, "global_step": 90190, "epoch": 745} {"train_loss": -36.919395446777344, "global_step": 90191, "epoch": 745} {"train_loss": -36.795204162597656, "global_step": 90192, "epoch": 745} {"train_loss": -36.35702133178711, "global_step": 90193, "epoch": 745} {"train_loss": -36.76120376586914, "global_step": 90194, "epoch": 745} {"train_loss": -37.02239990234375, "global_step": 90195, "epoch": 745} {"train_loss": -35.9443473815918, "global_step": 90196, "epoch": 745} {"train_loss": -33.71853256225586, "global_step": 90197, "epoch": 745} {"train_loss": -29.99127769470215, "global_step": 90198, "epoch": 745} {"train_loss": -31.185338973999023, "global_step": 90199, "epoch": 745} {"train_loss": -36.751644134521484, "global_step": 90200, "epoch": 745} {"train_loss": -32.3634033203125, "global_step": 90201, "epoch": 745} {"train_loss": -36.926570892333984, "global_step": 90202, "epoch": 745} {"train_loss": -34.12912368774414, "global_step": 90203, "epoch": 745} {"train_loss": -36.60661697387695, "global_step": 90204, "epoch": 745} {"train_loss": -34.87355041503906, "global_step": 90205, "epoch": 745} {"train_loss": -37.06911849975586, "global_step": 90206, "epoch": 745} {"train_loss": -35.57520294189453, "global_step": 90207, "epoch": 745} {"train_loss": -35.91263961791992, "global_step": 90208, "epoch": 745} {"train_loss": -34.65406036376953, "global_step": 90209, "epoch": 745} {"train_loss": -28.782453536987305, "global_step": 90210, "epoch": 745} {"train_loss": -26.0717716217041, "global_step": 90211, "epoch": 745} {"train_loss": -30.961929321289062, "global_step": 90212, "epoch": 745} {"train_loss": -35.92841339111328, "global_step": 90213, "epoch": 745} {"train_loss": -30.984603881835938, "global_step": 90214, "epoch": 745} {"train_loss": -36.804195404052734, "global_step": 90215, "epoch": 745} {"train_loss": -33.010894775390625, "global_step": 90216, "epoch": 745} {"train_loss": -37.27409362792969, "global_step": 90217, "epoch": 745} {"train_loss": -34.15147018432617, "global_step": 90218, "epoch": 745} {"train_loss": -36.53731918334961, "global_step": 90219, "epoch": 745} {"train_loss": -35.870391845703125, "global_step": 90220, "epoch": 745} {"train_loss": -36.19907760620117, "global_step": 90221, "epoch": 745} {"train_loss": -36.40462875366211, "global_step": 90222, "epoch": 745} {"train_loss": -34.95185470581055, "global_step": 90223, "epoch": 745} {"train_loss": -33.172550201416016, "global_step": 90224, "epoch": 745} {"train_loss": -27.490741729736328, "global_step": 90225, "epoch": 745} {"train_loss": -30.879230499267578, "global_step": 90226, "epoch": 745} {"train_loss": -36.64137649536133, "global_step": 90227, "epoch": 745} {"train_loss": -33.26929473876953, "global_step": 90228, "epoch": 745} {"train_loss": -36.54523468017578, "global_step": 90229, "epoch": 745} {"train_loss": -35.28181838989258, "global_step": 90230, "epoch": 745} {"train_loss": -34.121822357177734, "global_step": 90231, "epoch": 745} {"train_loss": -36.013771057128906, "global_step": 90232, "epoch": 745} {"train_loss": -34.69340515136719, "global_step": 90233, "epoch": 745} {"train_loss": -36.0254020690918, "global_step": 90234, "epoch": 745} {"train_loss": -35.57368087768555, "global_step": 90235, "epoch": 745} {"train_loss": -35.18342208862305, "global_step": 90236, "epoch": 745} {"train_loss": -35.317562103271484, "global_step": 90237, "epoch": 745} {"train_loss": -33.9758186340332, "global_step": 90238, "epoch": 745} {"train_loss": -33.72110366821289, "global_step": 90239, "epoch": 745} {"train_loss": -35.88494873046875, "global_step": 90240, "epoch": 745} {"train_loss": -36.207401275634766, "global_step": 90241, "epoch": 745} {"train_loss": -35.020992279052734, "global_step": 90242, "epoch": 745} {"train_loss": -35.55720520019531, "global_step": 90243, "epoch": 745} {"train_loss": -36.65150833129883, "global_step": 90244, "epoch": 745} {"train_loss": -35.538997650146484, "global_step": 90245, "epoch": 745} {"train_loss": -36.06035614013672, "global_step": 90246, "epoch": 745} {"train_loss": -36.66960525512695, "global_step": 90247, "epoch": 745} {"train_loss": -36.099124908447266, "global_step": 90248, "epoch": 745} {"train_loss": -36.42378616333008, "global_step": 90249, "epoch": 745} {"train_loss": -37.06116485595703, "global_step": 90250, "epoch": 745} {"train_loss": -36.6547737121582, "global_step": 90251, "epoch": 745} {"train_loss": -36.8108024597168, "global_step": 90252, "epoch": 745} {"train_loss": -36.8082389831543, "global_step": 90253, "epoch": 745} {"train_loss": -36.9141845703125, "global_step": 90254, "epoch": 745} {"train_loss": -36.998844146728516, "global_step": 90255, "epoch": 745} {"train_loss": -36.853614807128906, "global_step": 90256, "epoch": 745} {"train_loss": -36.85750961303711, "global_step": 90257, "epoch": 745} {"train_loss": -36.75371551513672, "global_step": 90258, "epoch": 745} {"train_loss": -36.16215133666992, "global_step": 90259, "epoch": 745} {"train_loss": -36.35374069213867, "global_step": 90260, "epoch": 745} {"train_loss": -37.01078414916992, "global_step": 90261, "epoch": 745} {"train_loss": -36.92428970336914, "global_step": 90262, "epoch": 745} {"train_loss": -36.783599853515625, "global_step": 90263, "epoch": 745} {"train_loss": -36.63629913330078, "global_step": 90264, "epoch": 745} {"train_loss": -34.941088432122854, "global_step": 90265, "epoch": 745, "val_loss": 2562956.75} {"train_loss": -33.69636917114258, "global_step": 90266, "epoch": 746} {"train_loss": -34.681819915771484, "global_step": 90267, "epoch": 746} {"train_loss": -36.60469055175781, "global_step": 90268, "epoch": 746} {"train_loss": -35.325740814208984, "global_step": 90269, "epoch": 746} {"train_loss": -35.68635177612305, "global_step": 90270, "epoch": 746} {"train_loss": -37.15843200683594, "global_step": 90271, "epoch": 746} {"train_loss": -35.7589111328125, "global_step": 90272, "epoch": 746} {"train_loss": -37.39854049682617, "global_step": 90273, "epoch": 746} {"train_loss": -36.073421478271484, "global_step": 90274, "epoch": 746} {"train_loss": -36.78159713745117, "global_step": 90275, "epoch": 746} {"train_loss": -36.24314498901367, "global_step": 90276, "epoch": 746} {"train_loss": -37.37873077392578, "global_step": 90277, "epoch": 746} {"train_loss": -36.67332077026367, "global_step": 90278, "epoch": 746} {"train_loss": -37.357879638671875, "global_step": 90279, "epoch": 746} {"train_loss": -37.135128021240234, "global_step": 90280, "epoch": 746} {"train_loss": -36.963783264160156, "global_step": 90281, "epoch": 746} {"train_loss": -37.201873779296875, "global_step": 90282, "epoch": 746} {"train_loss": -37.58590316772461, "global_step": 90283, "epoch": 746} {"train_loss": -36.9343147277832, "global_step": 90284, "epoch": 746} {"train_loss": -37.541725158691406, "global_step": 90285, "epoch": 746} {"train_loss": -37.0308952331543, "global_step": 90286, "epoch": 746} {"train_loss": -37.34400177001953, "global_step": 90287, "epoch": 746} {"train_loss": -37.187530517578125, "global_step": 90288, "epoch": 746} {"train_loss": -37.42710494995117, "global_step": 90289, "epoch": 746} {"train_loss": -36.53091812133789, "global_step": 90290, "epoch": 746} {"train_loss": -37.40927505493164, "global_step": 90291, "epoch": 746} {"train_loss": -37.765113830566406, "global_step": 90292, "epoch": 746} {"train_loss": -37.670223236083984, "global_step": 90293, "epoch": 746} {"train_loss": -37.76018142700195, "global_step": 90294, "epoch": 746} {"train_loss": -37.503360748291016, "global_step": 90295, "epoch": 746} {"train_loss": -37.089073181152344, "global_step": 90296, "epoch": 746} {"train_loss": -35.85829544067383, "global_step": 90297, "epoch": 746} {"train_loss": -37.25765609741211, "global_step": 90298, "epoch": 746} {"train_loss": -37.845001220703125, "global_step": 90299, "epoch": 746} {"train_loss": -37.25057601928711, "global_step": 90300, "epoch": 746} {"train_loss": -36.844539642333984, "global_step": 90301, "epoch": 746} {"train_loss": -36.47548294067383, "global_step": 90302, "epoch": 746} {"train_loss": -37.80225372314453, "global_step": 90303, "epoch": 746} {"train_loss": -37.829891204833984, "global_step": 90304, "epoch": 746} {"train_loss": -37.69504928588867, "global_step": 90305, "epoch": 746} {"train_loss": -36.80430603027344, "global_step": 90306, "epoch": 746} {"train_loss": -37.4788932800293, "global_step": 90307, "epoch": 746} {"train_loss": -38.07461166381836, "global_step": 90308, "epoch": 746} {"train_loss": -37.48651123046875, "global_step": 90309, "epoch": 746} {"train_loss": -37.9862060546875, "global_step": 90310, "epoch": 746} {"train_loss": -38.27467727661133, "global_step": 90311, "epoch": 746} {"train_loss": -37.84320068359375, "global_step": 90312, "epoch": 746} {"train_loss": -38.13519287109375, "global_step": 90313, "epoch": 746} {"train_loss": -37.874114990234375, "global_step": 90314, "epoch": 746} {"train_loss": -37.903018951416016, "global_step": 90315, "epoch": 746} {"train_loss": -38.2087287902832, "global_step": 90316, "epoch": 746} {"train_loss": -38.30188751220703, "global_step": 90317, "epoch": 746} {"train_loss": -37.96889877319336, "global_step": 90318, "epoch": 746} {"train_loss": -38.43935775756836, "global_step": 90319, "epoch": 746} {"train_loss": -38.218116760253906, "global_step": 90320, "epoch": 746} {"train_loss": -37.79902267456055, "global_step": 90321, "epoch": 746} {"train_loss": -37.89496994018555, "global_step": 90322, "epoch": 746} {"train_loss": -38.48685073852539, "global_step": 90323, "epoch": 746} {"train_loss": -38.2796745300293, "global_step": 90324, "epoch": 746} {"train_loss": -36.73579025268555, "global_step": 90325, "epoch": 746} {"train_loss": -37.941864013671875, "global_step": 90326, "epoch": 746} {"train_loss": -37.538360595703125, "global_step": 90327, "epoch": 746} {"train_loss": -34.56992721557617, "global_step": 90328, "epoch": 746} {"train_loss": -34.12192153930664, "global_step": 90329, "epoch": 746} {"train_loss": -36.232845306396484, "global_step": 90330, "epoch": 746} {"train_loss": -32.2072639465332, "global_step": 90331, "epoch": 746} {"train_loss": -34.18706130981445, "global_step": 90332, "epoch": 746} {"train_loss": -35.7551155090332, "global_step": 90333, "epoch": 746} {"train_loss": -38.26780319213867, "global_step": 90334, "epoch": 746} {"train_loss": -36.898616790771484, "global_step": 90335, "epoch": 746} {"train_loss": -37.6095085144043, "global_step": 90336, "epoch": 746} {"train_loss": -35.717262268066406, "global_step": 90337, "epoch": 746} {"train_loss": -33.773155212402344, "global_step": 90338, "epoch": 746} {"train_loss": -32.84295654296875, "global_step": 90339, "epoch": 746} {"train_loss": -34.850215911865234, "global_step": 90340, "epoch": 746} {"train_loss": -36.88540267944336, "global_step": 90341, "epoch": 746} {"train_loss": -37.40478515625, "global_step": 90342, "epoch": 746} {"train_loss": -36.229061126708984, "global_step": 90343, "epoch": 746} {"train_loss": -36.45718002319336, "global_step": 90344, "epoch": 746} {"train_loss": -36.86513900756836, "global_step": 90345, "epoch": 746} {"train_loss": -35.07908248901367, "global_step": 90346, "epoch": 746} {"train_loss": -36.62983703613281, "global_step": 90347, "epoch": 746} {"train_loss": -36.135833740234375, "global_step": 90348, "epoch": 746} {"train_loss": -37.007198333740234, "global_step": 90349, "epoch": 746} {"train_loss": -37.1137580871582, "global_step": 90350, "epoch": 746} {"train_loss": -36.87302780151367, "global_step": 90351, "epoch": 746} {"train_loss": -37.64981460571289, "global_step": 90352, "epoch": 746} {"train_loss": -37.37305450439453, "global_step": 90353, "epoch": 746} {"train_loss": -37.490962982177734, "global_step": 90354, "epoch": 746} {"train_loss": -37.67625045776367, "global_step": 90355, "epoch": 746} {"train_loss": -37.88873291015625, "global_step": 90356, "epoch": 746} {"train_loss": -37.97024154663086, "global_step": 90357, "epoch": 746} {"train_loss": -38.01993942260742, "global_step": 90358, "epoch": 746} {"train_loss": -37.45357131958008, "global_step": 90359, "epoch": 746} {"train_loss": -37.19499588012695, "global_step": 90360, "epoch": 746} {"train_loss": -37.56254196166992, "global_step": 90361, "epoch": 746} {"train_loss": -37.170814514160156, "global_step": 90362, "epoch": 746} {"train_loss": -38.115333557128906, "global_step": 90363, "epoch": 746} {"train_loss": -37.2468147277832, "global_step": 90364, "epoch": 746} {"train_loss": -37.097557067871094, "global_step": 90365, "epoch": 746} {"train_loss": -37.9239387512207, "global_step": 90366, "epoch": 746} {"train_loss": -38.51818084716797, "global_step": 90367, "epoch": 746} {"train_loss": -38.10264205932617, "global_step": 90368, "epoch": 746} {"train_loss": -37.63443374633789, "global_step": 90369, "epoch": 746} {"train_loss": -36.909698486328125, "global_step": 90370, "epoch": 746} {"train_loss": -37.6121826171875, "global_step": 90371, "epoch": 746} {"train_loss": -38.70714569091797, "global_step": 90372, "epoch": 746} {"train_loss": -37.280452728271484, "global_step": 90373, "epoch": 746} {"train_loss": -37.115203857421875, "global_step": 90374, "epoch": 746} {"train_loss": -38.44749069213867, "global_step": 90375, "epoch": 746} {"train_loss": -37.121742248535156, "global_step": 90376, "epoch": 746} {"train_loss": -37.02378463745117, "global_step": 90377, "epoch": 746} {"train_loss": -38.18281555175781, "global_step": 90378, "epoch": 746} {"train_loss": -36.774986267089844, "global_step": 90379, "epoch": 746} {"train_loss": -38.213314056396484, "global_step": 90380, "epoch": 746} {"train_loss": -36.68878173828125, "global_step": 90381, "epoch": 746} {"train_loss": -37.70060729980469, "global_step": 90382, "epoch": 746} {"train_loss": -37.49005126953125, "global_step": 90383, "epoch": 746} {"train_loss": -37.419437408447266, "global_step": 90384, "epoch": 746} {"train_loss": -37.83265686035156, "global_step": 90385, "epoch": 746} {"train_loss": -37.06355011364645, "global_step": 90386, "epoch": 746, "val_loss": 2611981.75} {"train_loss": -38.739471435546875, "global_step": 90387, "epoch": 747} {"train_loss": -38.465274810791016, "global_step": 90388, "epoch": 747} {"train_loss": -37.76791763305664, "global_step": 90389, "epoch": 747} {"train_loss": -36.83248519897461, "global_step": 90390, "epoch": 747} {"train_loss": -37.787628173828125, "global_step": 90391, "epoch": 747} {"train_loss": -37.804176330566406, "global_step": 90392, "epoch": 747} {"train_loss": -36.4076042175293, "global_step": 90393, "epoch": 747} {"train_loss": -37.975074768066406, "global_step": 90394, "epoch": 747} {"train_loss": -32.81410598754883, "global_step": 90395, "epoch": 747} {"train_loss": -32.67814254760742, "global_step": 90396, "epoch": 747} {"train_loss": -33.45534133911133, "global_step": 90397, "epoch": 747} {"train_loss": -30.091690063476562, "global_step": 90398, "epoch": 747} {"train_loss": -24.795103073120117, "global_step": 90399, "epoch": 747} {"train_loss": -24.54324722290039, "global_step": 90400, "epoch": 747} {"train_loss": -28.7218074798584, "global_step": 90401, "epoch": 747} {"train_loss": -28.592554092407227, "global_step": 90402, "epoch": 747} {"train_loss": -28.988483428955078, "global_step": 90403, "epoch": 747} {"train_loss": -25.51289176940918, "global_step": 90404, "epoch": 747} {"train_loss": -30.264163970947266, "global_step": 90405, "epoch": 747} {"train_loss": -29.40138816833496, "global_step": 90406, "epoch": 747} {"train_loss": -28.029773712158203, "global_step": 90407, "epoch": 747} {"train_loss": -28.69684410095215, "global_step": 90408, "epoch": 747} {"train_loss": -30.7297420501709, "global_step": 90409, "epoch": 747} {"train_loss": -25.565095901489258, "global_step": 90410, "epoch": 747} {"train_loss": -30.642379760742188, "global_step": 90411, "epoch": 747} {"train_loss": -28.96847915649414, "global_step": 90412, "epoch": 747} {"train_loss": -27.769872665405273, "global_step": 90413, "epoch": 747} {"train_loss": -26.360610961914062, "global_step": 90414, "epoch": 747} {"train_loss": -28.563180923461914, "global_step": 90415, "epoch": 747} {"train_loss": -31.310989379882812, "global_step": 90416, "epoch": 747} {"train_loss": -30.501697540283203, "global_step": 90417, "epoch": 747} {"train_loss": -29.05409049987793, "global_step": 90418, "epoch": 747} {"train_loss": -31.26909828186035, "global_step": 90419, "epoch": 747} {"train_loss": -31.0289249420166, "global_step": 90420, "epoch": 747} {"train_loss": -29.066791534423828, "global_step": 90421, "epoch": 747} {"train_loss": -31.704376220703125, "global_step": 90422, "epoch": 747} {"train_loss": -30.575809478759766, "global_step": 90423, "epoch": 747} {"train_loss": -32.56706619262695, "global_step": 90424, "epoch": 747} {"train_loss": -32.62118148803711, "global_step": 90425, "epoch": 747} {"train_loss": -33.2979850769043, "global_step": 90426, "epoch": 747} {"train_loss": -31.454526901245117, "global_step": 90427, "epoch": 747} {"train_loss": -32.74166488647461, "global_step": 90428, "epoch": 747} {"train_loss": -31.872074127197266, "global_step": 90429, "epoch": 747} {"train_loss": -32.59872055053711, "global_step": 90430, "epoch": 747} {"train_loss": -33.090850830078125, "global_step": 90431, "epoch": 747} {"train_loss": -32.28471755981445, "global_step": 90432, "epoch": 747} {"train_loss": -33.87296676635742, "global_step": 90433, "epoch": 747} {"train_loss": -32.948848724365234, "global_step": 90434, "epoch": 747} {"train_loss": -32.783447265625, "global_step": 90435, "epoch": 747} {"train_loss": -33.06026840209961, "global_step": 90436, "epoch": 747} {"train_loss": -33.59855270385742, "global_step": 90437, "epoch": 747} {"train_loss": -33.84788131713867, "global_step": 90438, "epoch": 747} {"train_loss": -34.330806732177734, "global_step": 90439, "epoch": 747} {"train_loss": -34.03705978393555, "global_step": 90440, "epoch": 747} {"train_loss": -33.983924865722656, "global_step": 90441, "epoch": 747} {"train_loss": -32.823177337646484, "global_step": 90442, "epoch": 747} {"train_loss": -33.32210159301758, "global_step": 90443, "epoch": 747} {"train_loss": -34.15695571899414, "global_step": 90444, "epoch": 747} {"train_loss": -33.73018264770508, "global_step": 90445, "epoch": 747} {"train_loss": -34.2652702331543, "global_step": 90446, "epoch": 747} {"train_loss": -33.43891906738281, "global_step": 90447, "epoch": 747} {"train_loss": -34.366085052490234, "global_step": 90448, "epoch": 747} {"train_loss": -33.9908447265625, "global_step": 90449, "epoch": 747} {"train_loss": -34.36513900756836, "global_step": 90450, "epoch": 747} {"train_loss": -34.54913330078125, "global_step": 90451, "epoch": 747} {"train_loss": -33.99685287475586, "global_step": 90452, "epoch": 747} {"train_loss": -34.054351806640625, "global_step": 90453, "epoch": 747} {"train_loss": -35.130435943603516, "global_step": 90454, "epoch": 747} {"train_loss": -34.23646926879883, "global_step": 90455, "epoch": 747} {"train_loss": -34.737693786621094, "global_step": 90456, "epoch": 747} {"train_loss": -34.12540817260742, "global_step": 90457, "epoch": 747} {"train_loss": -34.94106674194336, "global_step": 90458, "epoch": 747} {"train_loss": -34.43190383911133, "global_step": 90459, "epoch": 747} {"train_loss": -34.93947982788086, "global_step": 90460, "epoch": 747} {"train_loss": -34.72000503540039, "global_step": 90461, "epoch": 747} {"train_loss": -34.75649642944336, "global_step": 90462, "epoch": 747} {"train_loss": -35.17551040649414, "global_step": 90463, "epoch": 747} {"train_loss": -35.49372482299805, "global_step": 90464, "epoch": 747} {"train_loss": -34.88289260864258, "global_step": 90465, "epoch": 747} {"train_loss": -34.7597541809082, "global_step": 90466, "epoch": 747} {"train_loss": -34.87980270385742, "global_step": 90467, "epoch": 747} {"train_loss": -34.60567855834961, "global_step": 90468, "epoch": 747} {"train_loss": -35.330177307128906, "global_step": 90469, "epoch": 747} {"train_loss": -35.969940185546875, "global_step": 90470, "epoch": 747} {"train_loss": -35.886959075927734, "global_step": 90471, "epoch": 747} {"train_loss": -35.564292907714844, "global_step": 90472, "epoch": 747} {"train_loss": -35.61578369140625, "global_step": 90473, "epoch": 747} {"train_loss": -35.554744720458984, "global_step": 90474, "epoch": 747} {"train_loss": -35.94668960571289, "global_step": 90475, "epoch": 747} {"train_loss": -36.18071746826172, "global_step": 90476, "epoch": 747} {"train_loss": -35.97321701049805, "global_step": 90477, "epoch": 747} {"train_loss": -36.341552734375, "global_step": 90478, "epoch": 747} {"train_loss": -36.141822814941406, "global_step": 90479, "epoch": 747} {"train_loss": -35.804744720458984, "global_step": 90480, "epoch": 747} {"train_loss": -36.199703216552734, "global_step": 90481, "epoch": 747} {"train_loss": -36.36738204956055, "global_step": 90482, "epoch": 747} {"train_loss": -35.96480178833008, "global_step": 90483, "epoch": 747} {"train_loss": -35.671363830566406, "global_step": 90484, "epoch": 747} {"train_loss": -36.383792877197266, "global_step": 90485, "epoch": 747} {"train_loss": -35.73583984375, "global_step": 90486, "epoch": 747} {"train_loss": -36.600738525390625, "global_step": 90487, "epoch": 747} {"train_loss": -36.68229293823242, "global_step": 90488, "epoch": 747} {"train_loss": -36.503326416015625, "global_step": 90489, "epoch": 747} {"train_loss": -36.06467819213867, "global_step": 90490, "epoch": 747} {"train_loss": -36.2502326965332, "global_step": 90491, "epoch": 747} {"train_loss": -36.661678314208984, "global_step": 90492, "epoch": 747} {"train_loss": -36.798500061035156, "global_step": 90493, "epoch": 747} {"train_loss": -36.61688995361328, "global_step": 90494, "epoch": 747} {"train_loss": -36.566898345947266, "global_step": 90495, "epoch": 747} {"train_loss": -36.92744827270508, "global_step": 90496, "epoch": 747} {"train_loss": -36.5887565612793, "global_step": 90497, "epoch": 747} {"train_loss": -36.784637451171875, "global_step": 90498, "epoch": 747} {"train_loss": -37.19732666015625, "global_step": 90499, "epoch": 747} {"train_loss": -37.02360534667969, "global_step": 90500, "epoch": 747} {"train_loss": -35.871334075927734, "global_step": 90501, "epoch": 747} {"train_loss": -33.17963790893555, "global_step": 90502, "epoch": 747} {"train_loss": -31.475555419921875, "global_step": 90503, "epoch": 747} {"train_loss": -34.05599594116211, "global_step": 90504, "epoch": 747} {"train_loss": -36.9388427734375, "global_step": 90505, "epoch": 747} {"train_loss": -35.51223373413086, "global_step": 90506, "epoch": 747} {"train_loss": -33.704653211861604, "global_step": 90507, "epoch": 747, "val_loss": 2646875.0} {"train_loss": -36.556819915771484, "global_step": 90508, "epoch": 748} {"train_loss": -35.93703842163086, "global_step": 90509, "epoch": 748} {"train_loss": -36.035438537597656, "global_step": 90510, "epoch": 748} {"train_loss": -36.411537170410156, "global_step": 90511, "epoch": 748} {"train_loss": -35.1654052734375, "global_step": 90512, "epoch": 748} {"train_loss": -36.9765739440918, "global_step": 90513, "epoch": 748} {"train_loss": -35.130226135253906, "global_step": 90514, "epoch": 748} {"train_loss": -36.362060546875, "global_step": 90515, "epoch": 748} {"train_loss": -35.79986572265625, "global_step": 90516, "epoch": 748} {"train_loss": -37.04349899291992, "global_step": 90517, "epoch": 748} {"train_loss": -36.14422607421875, "global_step": 90518, "epoch": 748} {"train_loss": -36.911495208740234, "global_step": 90519, "epoch": 748} {"train_loss": -35.92631530761719, "global_step": 90520, "epoch": 748} {"train_loss": -37.73604965209961, "global_step": 90521, "epoch": 748} {"train_loss": -36.639678955078125, "global_step": 90522, "epoch": 748} {"train_loss": -36.96416091918945, "global_step": 90523, "epoch": 748} {"train_loss": -36.664894104003906, "global_step": 90524, "epoch": 748} {"train_loss": -35.309871673583984, "global_step": 90525, "epoch": 748} {"train_loss": -36.68956756591797, "global_step": 90526, "epoch": 748} {"train_loss": -35.5640754699707, "global_step": 90527, "epoch": 748} {"train_loss": -35.40900802612305, "global_step": 90528, "epoch": 748} {"train_loss": -36.38444137573242, "global_step": 90529, "epoch": 748} {"train_loss": -37.0358772277832, "global_step": 90530, "epoch": 748} {"train_loss": -35.93931198120117, "global_step": 90531, "epoch": 748} {"train_loss": -34.43810272216797, "global_step": 90532, "epoch": 748} {"train_loss": -34.64363479614258, "global_step": 90533, "epoch": 748} {"train_loss": -35.1456413269043, "global_step": 90534, "epoch": 748} {"train_loss": -35.52809524536133, "global_step": 90535, "epoch": 748} {"train_loss": -36.78453826904297, "global_step": 90536, "epoch": 748} {"train_loss": -37.56452941894531, "global_step": 90537, "epoch": 748} {"train_loss": -36.13991928100586, "global_step": 90538, "epoch": 748} {"train_loss": -35.21895217895508, "global_step": 90539, "epoch": 748} {"train_loss": -36.295799255371094, "global_step": 90540, "epoch": 748} {"train_loss": -36.521175384521484, "global_step": 90541, "epoch": 748} {"train_loss": -36.72779083251953, "global_step": 90542, "epoch": 748} {"train_loss": -36.572628021240234, "global_step": 90543, "epoch": 748} {"train_loss": -36.30997848510742, "global_step": 90544, "epoch": 748} {"train_loss": -36.69154739379883, "global_step": 90545, "epoch": 748} {"train_loss": -37.33714294433594, "global_step": 90546, "epoch": 748} {"train_loss": -36.147186279296875, "global_step": 90547, "epoch": 748} {"train_loss": -36.686737060546875, "global_step": 90548, "epoch": 748} {"train_loss": -37.80977249145508, "global_step": 90549, "epoch": 748} {"train_loss": -36.848915100097656, "global_step": 90550, "epoch": 748} {"train_loss": -36.9364128112793, "global_step": 90551, "epoch": 748} {"train_loss": -37.517032623291016, "global_step": 90552, "epoch": 748} {"train_loss": -37.402244567871094, "global_step": 90553, "epoch": 748} {"train_loss": -37.932430267333984, "global_step": 90554, "epoch": 748} {"train_loss": -38.154937744140625, "global_step": 90555, "epoch": 748} {"train_loss": -37.7934455871582, "global_step": 90556, "epoch": 748} {"train_loss": -37.9780387878418, "global_step": 90557, "epoch": 748} {"train_loss": -37.44921112060547, "global_step": 90558, "epoch": 748} {"train_loss": -36.82923126220703, "global_step": 90559, "epoch": 748} {"train_loss": -37.148529052734375, "global_step": 90560, "epoch": 748} {"train_loss": -37.57572555541992, "global_step": 90561, "epoch": 748} {"train_loss": -37.47287368774414, "global_step": 90562, "epoch": 748} {"train_loss": -37.29157638549805, "global_step": 90563, "epoch": 748} {"train_loss": -37.13695526123047, "global_step": 90564, "epoch": 748} {"train_loss": -37.58134078979492, "global_step": 90565, "epoch": 748} {"train_loss": -38.19138717651367, "global_step": 90566, "epoch": 748} {"train_loss": -38.39915466308594, "global_step": 90567, "epoch": 748} {"train_loss": -37.42255783081055, "global_step": 90568, "epoch": 748} {"train_loss": -38.079647064208984, "global_step": 90569, "epoch": 748} {"train_loss": -36.09379196166992, "global_step": 90570, "epoch": 748} {"train_loss": -36.65238952636719, "global_step": 90571, "epoch": 748} {"train_loss": -36.42013931274414, "global_step": 90572, "epoch": 748} {"train_loss": -36.754127502441406, "global_step": 90573, "epoch": 748} {"train_loss": -37.41805648803711, "global_step": 90574, "epoch": 748} {"train_loss": -36.92252731323242, "global_step": 90575, "epoch": 748} {"train_loss": -34.87001419067383, "global_step": 90576, "epoch": 748} {"train_loss": -35.80938720703125, "global_step": 90577, "epoch": 748} {"train_loss": -37.1692008972168, "global_step": 90578, "epoch": 748} {"train_loss": -35.204673767089844, "global_step": 90579, "epoch": 748} {"train_loss": -37.128753662109375, "global_step": 90580, "epoch": 748} {"train_loss": -33.98876953125, "global_step": 90581, "epoch": 748} {"train_loss": -35.2972526550293, "global_step": 90582, "epoch": 748} {"train_loss": -30.862884521484375, "global_step": 90583, "epoch": 748} {"train_loss": -29.183385848999023, "global_step": 90584, "epoch": 748} {"train_loss": -33.415618896484375, "global_step": 90585, "epoch": 748} {"train_loss": -35.89207458496094, "global_step": 90586, "epoch": 748} {"train_loss": -30.638662338256836, "global_step": 90587, "epoch": 748} {"train_loss": -33.46523666381836, "global_step": 90588, "epoch": 748} {"train_loss": -36.0301628112793, "global_step": 90589, "epoch": 748} {"train_loss": -34.76009750366211, "global_step": 90590, "epoch": 748} {"train_loss": -34.6231689453125, "global_step": 90591, "epoch": 748} {"train_loss": -35.50000762939453, "global_step": 90592, "epoch": 748} {"train_loss": -34.49261474609375, "global_step": 90593, "epoch": 748} {"train_loss": -35.58857345581055, "global_step": 90594, "epoch": 748} {"train_loss": -36.443538665771484, "global_step": 90595, "epoch": 748} {"train_loss": -34.39535140991211, "global_step": 90596, "epoch": 748} {"train_loss": -36.7446403503418, "global_step": 90597, "epoch": 748} {"train_loss": -35.53593063354492, "global_step": 90598, "epoch": 748} {"train_loss": -37.61179733276367, "global_step": 90599, "epoch": 748} {"train_loss": -34.58751678466797, "global_step": 90600, "epoch": 748} {"train_loss": -37.033447265625, "global_step": 90601, "epoch": 748} {"train_loss": -36.22968292236328, "global_step": 90602, "epoch": 748} {"train_loss": -37.15918731689453, "global_step": 90603, "epoch": 748} {"train_loss": -35.83523941040039, "global_step": 90604, "epoch": 748} {"train_loss": -37.53872299194336, "global_step": 90605, "epoch": 748} {"train_loss": -36.33794021606445, "global_step": 90606, "epoch": 748} {"train_loss": -37.198734283447266, "global_step": 90607, "epoch": 748} {"train_loss": -37.532100677490234, "global_step": 90608, "epoch": 748} {"train_loss": -37.05421829223633, "global_step": 90609, "epoch": 748} {"train_loss": -37.29774475097656, "global_step": 90610, "epoch": 748} {"train_loss": -37.4528923034668, "global_step": 90611, "epoch": 748} {"train_loss": -37.09444808959961, "global_step": 90612, "epoch": 748} {"train_loss": -37.92372131347656, "global_step": 90613, "epoch": 748} {"train_loss": -36.86750411987305, "global_step": 90614, "epoch": 748} {"train_loss": -37.224483489990234, "global_step": 90615, "epoch": 748} {"train_loss": -37.06881332397461, "global_step": 90616, "epoch": 748} {"train_loss": -37.12966537475586, "global_step": 90617, "epoch": 748} {"train_loss": -36.70293045043945, "global_step": 90618, "epoch": 748} {"train_loss": -37.86726760864258, "global_step": 90619, "epoch": 748} {"train_loss": -37.426788330078125, "global_step": 90620, "epoch": 748} {"train_loss": -37.55264663696289, "global_step": 90621, "epoch": 748} {"train_loss": -37.291011810302734, "global_step": 90622, "epoch": 748} {"train_loss": -37.174278259277344, "global_step": 90623, "epoch": 748} {"train_loss": -36.703392028808594, "global_step": 90624, "epoch": 748} {"train_loss": -36.52421188354492, "global_step": 90625, "epoch": 748} {"train_loss": -37.34247589111328, "global_step": 90626, "epoch": 748} {"train_loss": -38.12473678588867, "global_step": 90627, "epoch": 748} {"train_loss": -36.40291428368939, "global_step": 90628, "epoch": 748, "val_loss": 2549444.25} {"train_loss": -37.0994987487793, "global_step": 90629, "epoch": 749} {"train_loss": -35.03306198120117, "global_step": 90630, "epoch": 749} {"train_loss": -35.65285873413086, "global_step": 90631, "epoch": 749} {"train_loss": -36.88739013671875, "global_step": 90632, "epoch": 749} {"train_loss": -35.840667724609375, "global_step": 90633, "epoch": 749} {"train_loss": -35.277034759521484, "global_step": 90634, "epoch": 749} {"train_loss": -36.06731414794922, "global_step": 90635, "epoch": 749} {"train_loss": -37.88296127319336, "global_step": 90636, "epoch": 749} {"train_loss": -37.29221725463867, "global_step": 90637, "epoch": 749} {"train_loss": -37.03483200073242, "global_step": 90638, "epoch": 749} {"train_loss": -37.65214920043945, "global_step": 90639, "epoch": 749} {"train_loss": -36.74308776855469, "global_step": 90640, "epoch": 749} {"train_loss": -36.818084716796875, "global_step": 90641, "epoch": 749} {"train_loss": -37.7529182434082, "global_step": 90642, "epoch": 749} {"train_loss": -37.46446228027344, "global_step": 90643, "epoch": 749} {"train_loss": -37.685707092285156, "global_step": 90644, "epoch": 749} {"train_loss": -37.06007766723633, "global_step": 90645, "epoch": 749} {"train_loss": -37.89656066894531, "global_step": 90646, "epoch": 749} {"train_loss": -37.581329345703125, "global_step": 90647, "epoch": 749} {"train_loss": -37.852779388427734, "global_step": 90648, "epoch": 749} {"train_loss": -37.073970794677734, "global_step": 90649, "epoch": 749} {"train_loss": -37.41286849975586, "global_step": 90650, "epoch": 749} {"train_loss": -37.26558303833008, "global_step": 90651, "epoch": 749} {"train_loss": -37.2314338684082, "global_step": 90652, "epoch": 749} {"train_loss": -37.24557113647461, "global_step": 90653, "epoch": 749} {"train_loss": -37.72285842895508, "global_step": 90654, "epoch": 749} {"train_loss": -37.26571273803711, "global_step": 90655, "epoch": 749} {"train_loss": -37.68491744995117, "global_step": 90656, "epoch": 749} {"train_loss": -37.23781204223633, "global_step": 90657, "epoch": 749} {"train_loss": -37.87158203125, "global_step": 90658, "epoch": 749} {"train_loss": -37.000118255615234, "global_step": 90659, "epoch": 749} {"train_loss": -37.85441970825195, "global_step": 90660, "epoch": 749} {"train_loss": -36.56974411010742, "global_step": 90661, "epoch": 749} {"train_loss": -37.2126579284668, "global_step": 90662, "epoch": 749} {"train_loss": -37.232147216796875, "global_step": 90663, "epoch": 749} {"train_loss": -37.16010284423828, "global_step": 90664, "epoch": 749} {"train_loss": -38.32236862182617, "global_step": 90665, "epoch": 749} {"train_loss": -38.05432891845703, "global_step": 90666, "epoch": 749} {"train_loss": -36.140480041503906, "global_step": 90667, "epoch": 749} {"train_loss": -37.10409164428711, "global_step": 90668, "epoch": 749} {"train_loss": -38.8548698425293, "global_step": 90669, "epoch": 749} {"train_loss": -36.994117736816406, "global_step": 90670, "epoch": 749} {"train_loss": -37.556365966796875, "global_step": 90671, "epoch": 749} {"train_loss": -38.5990104675293, "global_step": 90672, "epoch": 749} {"train_loss": -38.1761474609375, "global_step": 90673, "epoch": 749} {"train_loss": -38.32958984375, "global_step": 90674, "epoch": 749} {"train_loss": -38.46337890625, "global_step": 90675, "epoch": 749} {"train_loss": -37.935054779052734, "global_step": 90676, "epoch": 749} {"train_loss": -37.9057731628418, "global_step": 90677, "epoch": 749} {"train_loss": -38.241844177246094, "global_step": 90678, "epoch": 749} {"train_loss": -38.307373046875, "global_step": 90679, "epoch": 749} {"train_loss": -38.538177490234375, "global_step": 90680, "epoch": 749} {"train_loss": -38.438472747802734, "global_step": 90681, "epoch": 749} {"train_loss": -38.13015365600586, "global_step": 90682, "epoch": 749} {"train_loss": -38.214141845703125, "global_step": 90683, "epoch": 749} {"train_loss": -38.60996627807617, "global_step": 90684, "epoch": 749} {"train_loss": -38.80147171020508, "global_step": 90685, "epoch": 749} {"train_loss": -38.08903884887695, "global_step": 90686, "epoch": 749} {"train_loss": -38.68867111206055, "global_step": 90687, "epoch": 749} {"train_loss": -37.76243209838867, "global_step": 90688, "epoch": 749} {"train_loss": -36.3984489440918, "global_step": 90689, "epoch": 749} {"train_loss": -37.40156555175781, "global_step": 90690, "epoch": 749} {"train_loss": -32.826515197753906, "global_step": 90691, "epoch": 749} {"train_loss": -36.98529052734375, "global_step": 90692, "epoch": 749} {"train_loss": -37.06556701660156, "global_step": 90693, "epoch": 749} {"train_loss": -36.71755599975586, "global_step": 90694, "epoch": 749} {"train_loss": -36.18311309814453, "global_step": 90695, "epoch": 749} {"train_loss": -36.72156524658203, "global_step": 90696, "epoch": 749} {"train_loss": -33.12925338745117, "global_step": 90697, "epoch": 749} {"train_loss": -33.785682678222656, "global_step": 90698, "epoch": 749} {"train_loss": -34.74396896362305, "global_step": 90699, "epoch": 749} {"train_loss": -35.16095733642578, "global_step": 90700, "epoch": 749} {"train_loss": -35.609588623046875, "global_step": 90701, "epoch": 749} {"train_loss": -33.70813751220703, "global_step": 90702, "epoch": 749} {"train_loss": -32.73604202270508, "global_step": 90703, "epoch": 749} {"train_loss": -32.469215393066406, "global_step": 90704, "epoch": 749} {"train_loss": -30.2397518157959, "global_step": 90705, "epoch": 749} {"train_loss": -35.22756576538086, "global_step": 90706, "epoch": 749} {"train_loss": -33.379241943359375, "global_step": 90707, "epoch": 749} {"train_loss": -33.84741973876953, "global_step": 90708, "epoch": 749} {"train_loss": -28.33380699157715, "global_step": 90709, "epoch": 749} {"train_loss": -26.2563419342041, "global_step": 90710, "epoch": 749} {"train_loss": -29.776432037353516, "global_step": 90711, "epoch": 749} {"train_loss": -30.694366455078125, "global_step": 90712, "epoch": 749} {"train_loss": -31.871305465698242, "global_step": 90713, "epoch": 749} {"train_loss": -29.43401527404785, "global_step": 90714, "epoch": 749} {"train_loss": -33.34376525878906, "global_step": 90715, "epoch": 749} {"train_loss": -27.811567306518555, "global_step": 90716, "epoch": 749} {"train_loss": -30.949859619140625, "global_step": 90717, "epoch": 749} {"train_loss": -26.807632446289062, "global_step": 90718, "epoch": 749} {"train_loss": -29.77471351623535, "global_step": 90719, "epoch": 749} {"train_loss": -21.760122299194336, "global_step": 90720, "epoch": 749} {"train_loss": -31.41458511352539, "global_step": 90721, "epoch": 749} {"train_loss": -30.993045806884766, "global_step": 90722, "epoch": 749} {"train_loss": -31.9052791595459, "global_step": 90723, "epoch": 749} {"train_loss": -29.806900024414062, "global_step": 90724, "epoch": 749} {"train_loss": -27.288238525390625, "global_step": 90725, "epoch": 749} {"train_loss": -30.387842178344727, "global_step": 90726, "epoch": 749} {"train_loss": -32.3361701965332, "global_step": 90727, "epoch": 749} {"train_loss": -31.186254501342773, "global_step": 90728, "epoch": 749} {"train_loss": -31.826440811157227, "global_step": 90729, "epoch": 749} {"train_loss": -29.810516357421875, "global_step": 90730, "epoch": 749} {"train_loss": -31.439905166625977, "global_step": 90731, "epoch": 749} {"train_loss": -32.40554428100586, "global_step": 90732, "epoch": 749} {"train_loss": -32.36769485473633, "global_step": 90733, "epoch": 749} {"train_loss": -32.90151596069336, "global_step": 90734, "epoch": 749} {"train_loss": -32.85409927368164, "global_step": 90735, "epoch": 749} {"train_loss": -31.9095516204834, "global_step": 90736, "epoch": 749} {"train_loss": -33.214473724365234, "global_step": 90737, "epoch": 749} {"train_loss": -32.223567962646484, "global_step": 90738, "epoch": 749} {"train_loss": -33.349361419677734, "global_step": 90739, "epoch": 749} {"train_loss": -34.125667572021484, "global_step": 90740, "epoch": 749} {"train_loss": -33.52126693725586, "global_step": 90741, "epoch": 749} {"train_loss": -34.428016662597656, "global_step": 90742, "epoch": 749} {"train_loss": -33.279685974121094, "global_step": 90743, "epoch": 749} {"train_loss": -33.58663558959961, "global_step": 90744, "epoch": 749} {"train_loss": -33.94291687011719, "global_step": 90745, "epoch": 749} {"train_loss": -33.99604034423828, "global_step": 90746, "epoch": 749} {"train_loss": -34.1812858581543, "global_step": 90747, "epoch": 749} {"train_loss": -32.80791473388672, "global_step": 90748, "epoch": 749} {"train_loss": -34.95223718438267, "global_step": 90749, "epoch": 749, "val_loss": 2586999.25} {"train_loss": -34.18043518066406, "global_step": 90750, "epoch": 750} {"train_loss": -33.729915618896484, "global_step": 90751, "epoch": 750} {"train_loss": -34.19425582885742, "global_step": 90752, "epoch": 750} {"train_loss": -34.48857116699219, "global_step": 90753, "epoch": 750} {"train_loss": -34.42920684814453, "global_step": 90754, "epoch": 750} {"train_loss": -34.64956283569336, "global_step": 90755, "epoch": 750} {"train_loss": -34.44282913208008, "global_step": 90756, "epoch": 750} {"train_loss": -34.92222213745117, "global_step": 90757, "epoch": 750} {"train_loss": -34.70028305053711, "global_step": 90758, "epoch": 750} {"train_loss": -35.21187210083008, "global_step": 90759, "epoch": 750} {"train_loss": -34.8840217590332, "global_step": 90760, "epoch": 750} {"train_loss": -34.801483154296875, "global_step": 90761, "epoch": 750} {"train_loss": -35.5339241027832, "global_step": 90762, "epoch": 750} {"train_loss": -35.41141891479492, "global_step": 90763, "epoch": 750} {"train_loss": -35.421875, "global_step": 90764, "epoch": 750} {"train_loss": -35.3879508972168, "global_step": 90765, "epoch": 750} {"train_loss": -35.48447799682617, "global_step": 90766, "epoch": 750} {"train_loss": -33.68598556518555, "global_step": 90767, "epoch": 750} {"train_loss": -35.518890380859375, "global_step": 90768, "epoch": 750} {"train_loss": -35.50740432739258, "global_step": 90769, "epoch": 750} {"train_loss": -35.207454681396484, "global_step": 90770, "epoch": 750} {"train_loss": -35.85779571533203, "global_step": 90771, "epoch": 750} {"train_loss": -35.457584381103516, "global_step": 90772, "epoch": 750} {"train_loss": -35.86887741088867, "global_step": 90773, "epoch": 750} {"train_loss": -35.44633483886719, "global_step": 90774, "epoch": 750} {"train_loss": -35.8663444519043, "global_step": 90775, "epoch": 750} {"train_loss": -36.21025085449219, "global_step": 90776, "epoch": 750} {"train_loss": -35.37725830078125, "global_step": 90777, "epoch": 750} {"train_loss": -36.21453094482422, "global_step": 90778, "epoch": 750} {"train_loss": -36.105445861816406, "global_step": 90779, "epoch": 750} {"train_loss": -35.95404052734375, "global_step": 90780, "epoch": 750} {"train_loss": -35.929054260253906, "global_step": 90781, "epoch": 750} {"train_loss": -36.269229888916016, "global_step": 90782, "epoch": 750} {"train_loss": -35.925323486328125, "global_step": 90783, "epoch": 750} {"train_loss": -36.56605911254883, "global_step": 90784, "epoch": 750} {"train_loss": -36.4461555480957, "global_step": 90785, "epoch": 750} {"train_loss": -36.28955078125, "global_step": 90786, "epoch": 750} {"train_loss": -36.56689453125, "global_step": 90787, "epoch": 750} {"train_loss": -36.48484420776367, "global_step": 90788, "epoch": 750} {"train_loss": -35.94232940673828, "global_step": 90789, "epoch": 750} {"train_loss": -36.66549301147461, "global_step": 90790, "epoch": 750} {"train_loss": -36.0614128112793, "global_step": 90791, "epoch": 750} {"train_loss": -36.74076461791992, "global_step": 90792, "epoch": 750} {"train_loss": -36.36503219604492, "global_step": 90793, "epoch": 750} {"train_loss": -36.708580017089844, "global_step": 90794, "epoch": 750} {"train_loss": -36.67017364501953, "global_step": 90795, "epoch": 750} {"train_loss": -36.430458068847656, "global_step": 90796, "epoch": 750} {"train_loss": -36.12910461425781, "global_step": 90797, "epoch": 750} {"train_loss": -35.509403228759766, "global_step": 90798, "epoch": 750} {"train_loss": -35.338436126708984, "global_step": 90799, "epoch": 750} {"train_loss": -34.81181716918945, "global_step": 90800, "epoch": 750} {"train_loss": -35.38712692260742, "global_step": 90801, "epoch": 750} {"train_loss": -36.25688552856445, "global_step": 90802, "epoch": 750} {"train_loss": -36.851924896240234, "global_step": 90803, "epoch": 750} {"train_loss": -36.83913040161133, "global_step": 90804, "epoch": 750} {"train_loss": -36.48788070678711, "global_step": 90805, "epoch": 750} {"train_loss": -36.893898010253906, "global_step": 90806, "epoch": 750} {"train_loss": -36.05543518066406, "global_step": 90807, "epoch": 750} {"train_loss": -31.1020565032959, "global_step": 90808, "epoch": 750} {"train_loss": -14.511171340942383, "global_step": 90809, "epoch": 750} {"train_loss": 13.98241138458252, "global_step": 90810, "epoch": 750} {"train_loss": -31.43757438659668, "global_step": 90811, "epoch": 750} {"train_loss": -22.535907745361328, "global_step": 90812, "epoch": 750} {"train_loss": -22.933462142944336, "global_step": 90813, "epoch": 750} {"train_loss": -17.397390365600586, "global_step": 90814, "epoch": 750} {"train_loss": -32.2712516784668, "global_step": 90815, "epoch": 750} {"train_loss": -28.69732093811035, "global_step": 90816, "epoch": 750} {"train_loss": -29.576435089111328, "global_step": 90817, "epoch": 750} {"train_loss": -30.901147842407227, "global_step": 90818, "epoch": 750} {"train_loss": -29.025959014892578, "global_step": 90819, "epoch": 750} {"train_loss": -34.62785339355469, "global_step": 90820, "epoch": 750} {"train_loss": -33.03916931152344, "global_step": 90821, "epoch": 750} {"train_loss": -32.271785736083984, "global_step": 90822, "epoch": 750} {"train_loss": -34.72977828979492, "global_step": 90823, "epoch": 750} {"train_loss": -33.73634719848633, "global_step": 90824, "epoch": 750} {"train_loss": -32.82563400268555, "global_step": 90825, "epoch": 750} {"train_loss": -34.1331901550293, "global_step": 90826, "epoch": 750} {"train_loss": -34.24732208251953, "global_step": 90827, "epoch": 750} {"train_loss": -34.15835952758789, "global_step": 90828, "epoch": 750} {"train_loss": -33.98334503173828, "global_step": 90829, "epoch": 750} {"train_loss": -35.239715576171875, "global_step": 90830, "epoch": 750} {"train_loss": -34.89814376831055, "global_step": 90831, "epoch": 750} {"train_loss": -34.78086471557617, "global_step": 90832, "epoch": 750} {"train_loss": -34.97431564331055, "global_step": 90833, "epoch": 750} {"train_loss": -35.67670440673828, "global_step": 90834, "epoch": 750} {"train_loss": -35.2878303527832, "global_step": 90835, "epoch": 750} {"train_loss": -35.043399810791016, "global_step": 90836, "epoch": 750} {"train_loss": -35.27826690673828, "global_step": 90837, "epoch": 750} {"train_loss": -35.4834098815918, "global_step": 90838, "epoch": 750} {"train_loss": -35.728641510009766, "global_step": 90839, "epoch": 750} {"train_loss": -35.3608283996582, "global_step": 90840, "epoch": 750} {"train_loss": -35.68571090698242, "global_step": 90841, "epoch": 750} {"train_loss": -35.72736358642578, "global_step": 90842, "epoch": 750} {"train_loss": -36.0242805480957, "global_step": 90843, "epoch": 750} {"train_loss": -36.0599250793457, "global_step": 90844, "epoch": 750} {"train_loss": -35.859169006347656, "global_step": 90845, "epoch": 750} {"train_loss": -35.804054260253906, "global_step": 90846, "epoch": 750} {"train_loss": -36.46977615356445, "global_step": 90847, "epoch": 750} {"train_loss": -36.32562255859375, "global_step": 90848, "epoch": 750} {"train_loss": -36.14908218383789, "global_step": 90849, "epoch": 750} {"train_loss": -36.6343879699707, "global_step": 90850, "epoch": 750} {"train_loss": -36.1717529296875, "global_step": 90851, "epoch": 750} {"train_loss": -36.480072021484375, "global_step": 90852, "epoch": 750} {"train_loss": -36.496803283691406, "global_step": 90853, "epoch": 750} {"train_loss": -36.895809173583984, "global_step": 90854, "epoch": 750} {"train_loss": -36.62971878051758, "global_step": 90855, "epoch": 750} {"train_loss": -36.28327560424805, "global_step": 90856, "epoch": 750} {"train_loss": -36.517677307128906, "global_step": 90857, "epoch": 750} {"train_loss": -36.64889144897461, "global_step": 90858, "epoch": 750} {"train_loss": -36.59526443481445, "global_step": 90859, "epoch": 750} {"train_loss": -36.70946502685547, "global_step": 90860, "epoch": 750} {"train_loss": -36.36089324951172, "global_step": 90861, "epoch": 750} {"train_loss": -36.5291748046875, "global_step": 90862, "epoch": 750} {"train_loss": -36.43160629272461, "global_step": 90863, "epoch": 750} {"train_loss": -36.8990364074707, "global_step": 90864, "epoch": 750} {"train_loss": -37.049774169921875, "global_step": 90865, "epoch": 750} {"train_loss": -36.9371337890625, "global_step": 90866, "epoch": 750} {"train_loss": -37.101009368896484, "global_step": 90867, "epoch": 750} {"train_loss": -37.56919860839844, "global_step": 90868, "epoch": 750} {"train_loss": -37.17493438720703, "global_step": 90869, "epoch": 750} {"train_loss": -34.424930611917794, "global_step": 90870, "epoch": 750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2573712.75} {"train_loss": -36.38101577758789, "global_step": 90871, "epoch": 751} {"train_loss": -37.071044921875, "global_step": 90872, "epoch": 751} {"train_loss": -37.24805450439453, "global_step": 90873, "epoch": 751} {"train_loss": -37.19173049926758, "global_step": 90874, "epoch": 751} {"train_loss": -36.11130905151367, "global_step": 90875, "epoch": 751} {"train_loss": -33.49222946166992, "global_step": 90876, "epoch": 751} {"train_loss": -33.26668167114258, "global_step": 90877, "epoch": 751} {"train_loss": -36.42388153076172, "global_step": 90878, "epoch": 751} {"train_loss": -37.17995834350586, "global_step": 90879, "epoch": 751} {"train_loss": -35.168025970458984, "global_step": 90880, "epoch": 751} {"train_loss": -33.459999084472656, "global_step": 90881, "epoch": 751} {"train_loss": -37.01475143432617, "global_step": 90882, "epoch": 751} {"train_loss": -35.90090560913086, "global_step": 90883, "epoch": 751} {"train_loss": -34.29665756225586, "global_step": 90884, "epoch": 751} {"train_loss": -36.37324142456055, "global_step": 90885, "epoch": 751} {"train_loss": -35.853973388671875, "global_step": 90886, "epoch": 751} {"train_loss": -34.57383728027344, "global_step": 90887, "epoch": 751} {"train_loss": -32.594970703125, "global_step": 90888, "epoch": 751} {"train_loss": -29.97767448425293, "global_step": 90889, "epoch": 751} {"train_loss": -31.490453720092773, "global_step": 90890, "epoch": 751} {"train_loss": -34.805015563964844, "global_step": 90891, "epoch": 751} {"train_loss": -37.22223663330078, "global_step": 90892, "epoch": 751} {"train_loss": -34.97084426879883, "global_step": 90893, "epoch": 751} {"train_loss": -36.43452072143555, "global_step": 90894, "epoch": 751} {"train_loss": -36.8231201171875, "global_step": 90895, "epoch": 751} {"train_loss": -36.6961784362793, "global_step": 90896, "epoch": 751} {"train_loss": -37.07804489135742, "global_step": 90897, "epoch": 751} {"train_loss": -36.35585021972656, "global_step": 90898, "epoch": 751} {"train_loss": -37.04487991333008, "global_step": 90899, "epoch": 751} {"train_loss": -36.19301986694336, "global_step": 90900, "epoch": 751} {"train_loss": -36.965843200683594, "global_step": 90901, "epoch": 751} {"train_loss": -37.21198654174805, "global_step": 90902, "epoch": 751} {"train_loss": -36.85374069213867, "global_step": 90903, "epoch": 751} {"train_loss": -36.90401077270508, "global_step": 90904, "epoch": 751} {"train_loss": -36.741973876953125, "global_step": 90905, "epoch": 751} {"train_loss": -37.3471565246582, "global_step": 90906, "epoch": 751} {"train_loss": -36.94267272949219, "global_step": 90907, "epoch": 751} {"train_loss": -36.61135482788086, "global_step": 90908, "epoch": 751} {"train_loss": -36.764705657958984, "global_step": 90909, "epoch": 751} {"train_loss": -37.13516616821289, "global_step": 90910, "epoch": 751} {"train_loss": -37.244041442871094, "global_step": 90911, "epoch": 751} {"train_loss": -36.827667236328125, "global_step": 90912, "epoch": 751} {"train_loss": -37.22673416137695, "global_step": 90913, "epoch": 751} {"train_loss": -37.1970100402832, "global_step": 90914, "epoch": 751} {"train_loss": -37.24742126464844, "global_step": 90915, "epoch": 751} {"train_loss": -37.564247131347656, "global_step": 90916, "epoch": 751} {"train_loss": -37.795448303222656, "global_step": 90917, "epoch": 751} {"train_loss": -37.4267578125, "global_step": 90918, "epoch": 751} {"train_loss": -37.17533493041992, "global_step": 90919, "epoch": 751} {"train_loss": -37.823028564453125, "global_step": 90920, "epoch": 751} {"train_loss": -37.688777923583984, "global_step": 90921, "epoch": 751} {"train_loss": -37.7057991027832, "global_step": 90922, "epoch": 751} {"train_loss": -36.89612579345703, "global_step": 90923, "epoch": 751} {"train_loss": -36.5234375, "global_step": 90924, "epoch": 751} {"train_loss": -37.76604461669922, "global_step": 90925, "epoch": 751} {"train_loss": -37.55486297607422, "global_step": 90926, "epoch": 751} {"train_loss": -37.341121673583984, "global_step": 90927, "epoch": 751} {"train_loss": -37.83775329589844, "global_step": 90928, "epoch": 751} {"train_loss": -37.78828811645508, "global_step": 90929, "epoch": 751} {"train_loss": -37.87818145751953, "global_step": 90930, "epoch": 751} {"train_loss": -37.8490104675293, "global_step": 90931, "epoch": 751} {"train_loss": -34.901519775390625, "global_step": 90932, "epoch": 751} {"train_loss": -37.65238952636719, "global_step": 90933, "epoch": 751} {"train_loss": -37.729244232177734, "global_step": 90934, "epoch": 751} {"train_loss": -37.7977294921875, "global_step": 90935, "epoch": 751} {"train_loss": -37.75225830078125, "global_step": 90936, "epoch": 751} {"train_loss": -37.603824615478516, "global_step": 90937, "epoch": 751} {"train_loss": -37.223487854003906, "global_step": 90938, "epoch": 751} {"train_loss": -38.18218231201172, "global_step": 90939, "epoch": 751} {"train_loss": -37.61272048950195, "global_step": 90940, "epoch": 751} {"train_loss": -37.79243850708008, "global_step": 90941, "epoch": 751} {"train_loss": -37.458221435546875, "global_step": 90942, "epoch": 751} {"train_loss": -37.71673583984375, "global_step": 90943, "epoch": 751} {"train_loss": -37.314979553222656, "global_step": 90944, "epoch": 751} {"train_loss": -37.878761291503906, "global_step": 90945, "epoch": 751} {"train_loss": -36.8741455078125, "global_step": 90946, "epoch": 751} {"train_loss": -37.866737365722656, "global_step": 90947, "epoch": 751} {"train_loss": -38.12892532348633, "global_step": 90948, "epoch": 751} {"train_loss": -37.14380645751953, "global_step": 90949, "epoch": 751} {"train_loss": -36.66691970825195, "global_step": 90950, "epoch": 751} {"train_loss": -37.52536392211914, "global_step": 90951, "epoch": 751} {"train_loss": -38.15095138549805, "global_step": 90952, "epoch": 751} {"train_loss": -37.42112350463867, "global_step": 90953, "epoch": 751} {"train_loss": -36.922481536865234, "global_step": 90954, "epoch": 751} {"train_loss": -37.63603591918945, "global_step": 90955, "epoch": 751} {"train_loss": -37.77775192260742, "global_step": 90956, "epoch": 751} {"train_loss": -35.59032440185547, "global_step": 90957, "epoch": 751} {"train_loss": -36.23381805419922, "global_step": 90958, "epoch": 751} {"train_loss": -37.176361083984375, "global_step": 90959, "epoch": 751} {"train_loss": -37.1891975402832, "global_step": 90960, "epoch": 751} {"train_loss": -35.17771530151367, "global_step": 90961, "epoch": 751} {"train_loss": -38.52779769897461, "global_step": 90962, "epoch": 751} {"train_loss": -36.293495178222656, "global_step": 90963, "epoch": 751} {"train_loss": -37.235992431640625, "global_step": 90964, "epoch": 751} {"train_loss": -37.87660598754883, "global_step": 90965, "epoch": 751} {"train_loss": -37.478580474853516, "global_step": 90966, "epoch": 751} {"train_loss": -37.40690994262695, "global_step": 90967, "epoch": 751} {"train_loss": -36.74433517456055, "global_step": 90968, "epoch": 751} {"train_loss": -37.07261657714844, "global_step": 90969, "epoch": 751} {"train_loss": -37.02553939819336, "global_step": 90970, "epoch": 751} {"train_loss": -37.8187370300293, "global_step": 90971, "epoch": 751} {"train_loss": -37.60910415649414, "global_step": 90972, "epoch": 751} {"train_loss": -37.713966369628906, "global_step": 90973, "epoch": 751} {"train_loss": -36.069488525390625, "global_step": 90974, "epoch": 751} {"train_loss": -36.201995849609375, "global_step": 90975, "epoch": 751} {"train_loss": -37.48701858520508, "global_step": 90976, "epoch": 751} {"train_loss": -38.05006790161133, "global_step": 90977, "epoch": 751} {"train_loss": -35.677425384521484, "global_step": 90978, "epoch": 751} {"train_loss": -32.0455322265625, "global_step": 90979, "epoch": 751} {"train_loss": -31.198835372924805, "global_step": 90980, "epoch": 751} {"train_loss": -29.1400089263916, "global_step": 90981, "epoch": 751} {"train_loss": -33.17105484008789, "global_step": 90982, "epoch": 751} {"train_loss": -36.69890213012695, "global_step": 90983, "epoch": 751} {"train_loss": -31.397968292236328, "global_step": 90984, "epoch": 751} {"train_loss": -35.42363357543945, "global_step": 90985, "epoch": 751} {"train_loss": -35.269527435302734, "global_step": 90986, "epoch": 751} {"train_loss": -31.77260398864746, "global_step": 90987, "epoch": 751} {"train_loss": -34.00529098510742, "global_step": 90988, "epoch": 751} {"train_loss": -34.05338668823242, "global_step": 90989, "epoch": 751} {"train_loss": -33.999420166015625, "global_step": 90990, "epoch": 751} {"train_loss": -36.40466225048727, "global_step": 90991, "epoch": 751, "val_loss": 2640666.25} {"train_loss": -33.38794708251953, "global_step": 90992, "epoch": 752} {"train_loss": -34.909664154052734, "global_step": 90993, "epoch": 752} {"train_loss": -34.192138671875, "global_step": 90994, "epoch": 752} {"train_loss": -36.08921432495117, "global_step": 90995, "epoch": 752} {"train_loss": -34.83451461791992, "global_step": 90996, "epoch": 752} {"train_loss": -36.15230178833008, "global_step": 90997, "epoch": 752} {"train_loss": -33.61341094970703, "global_step": 90998, "epoch": 752} {"train_loss": -36.6917724609375, "global_step": 90999, "epoch": 752} {"train_loss": -34.858028411865234, "global_step": 91000, "epoch": 752} {"train_loss": -35.75843811035156, "global_step": 91001, "epoch": 752} {"train_loss": -36.012245178222656, "global_step": 91002, "epoch": 752} {"train_loss": -35.45346450805664, "global_step": 91003, "epoch": 752} {"train_loss": -37.17998123168945, "global_step": 91004, "epoch": 752} {"train_loss": -36.894508361816406, "global_step": 91005, "epoch": 752} {"train_loss": -36.264217376708984, "global_step": 91006, "epoch": 752} {"train_loss": -36.767417907714844, "global_step": 91007, "epoch": 752} {"train_loss": -36.66709518432617, "global_step": 91008, "epoch": 752} {"train_loss": -37.32638931274414, "global_step": 91009, "epoch": 752} {"train_loss": -36.891822814941406, "global_step": 91010, "epoch": 752} {"train_loss": -35.8857421875, "global_step": 91011, "epoch": 752} {"train_loss": -36.40620040893555, "global_step": 91012, "epoch": 752} {"train_loss": -33.64961624145508, "global_step": 91013, "epoch": 752} {"train_loss": -36.95024108886719, "global_step": 91014, "epoch": 752} {"train_loss": -36.968563079833984, "global_step": 91015, "epoch": 752} {"train_loss": -37.40017318725586, "global_step": 91016, "epoch": 752} {"train_loss": -37.178260803222656, "global_step": 91017, "epoch": 752} {"train_loss": -36.657535552978516, "global_step": 91018, "epoch": 752} {"train_loss": -37.098289489746094, "global_step": 91019, "epoch": 752} {"train_loss": -37.13871383666992, "global_step": 91020, "epoch": 752} {"train_loss": -36.72132110595703, "global_step": 91021, "epoch": 752} {"train_loss": -36.0101318359375, "global_step": 91022, "epoch": 752} {"train_loss": -37.422943115234375, "global_step": 91023, "epoch": 752} {"train_loss": -36.97251892089844, "global_step": 91024, "epoch": 752} {"train_loss": -37.21540451049805, "global_step": 91025, "epoch": 752} {"train_loss": -38.01119613647461, "global_step": 91026, "epoch": 752} {"train_loss": -36.68195343017578, "global_step": 91027, "epoch": 752} {"train_loss": -37.14260482788086, "global_step": 91028, "epoch": 752} {"train_loss": -37.37078857421875, "global_step": 91029, "epoch": 752} {"train_loss": -35.719825744628906, "global_step": 91030, "epoch": 752} {"train_loss": -37.2191162109375, "global_step": 91031, "epoch": 752} {"train_loss": -37.547645568847656, "global_step": 91032, "epoch": 752} {"train_loss": -37.49208450317383, "global_step": 91033, "epoch": 752} {"train_loss": -37.353240966796875, "global_step": 91034, "epoch": 752} {"train_loss": -37.392425537109375, "global_step": 91035, "epoch": 752} {"train_loss": -37.6866340637207, "global_step": 91036, "epoch": 752} {"train_loss": -36.913028717041016, "global_step": 91037, "epoch": 752} {"train_loss": -37.145503997802734, "global_step": 91038, "epoch": 752} {"train_loss": -37.3563117980957, "global_step": 91039, "epoch": 752} {"train_loss": -37.82034683227539, "global_step": 91040, "epoch": 752} {"train_loss": -37.87028121948242, "global_step": 91041, "epoch": 752} {"train_loss": -37.75825881958008, "global_step": 91042, "epoch": 752} {"train_loss": -37.61296463012695, "global_step": 91043, "epoch": 752} {"train_loss": -37.85847091674805, "global_step": 91044, "epoch": 752} {"train_loss": -37.65414047241211, "global_step": 91045, "epoch": 752} {"train_loss": -37.95588684082031, "global_step": 91046, "epoch": 752} {"train_loss": -36.86811447143555, "global_step": 91047, "epoch": 752} {"train_loss": -37.351478576660156, "global_step": 91048, "epoch": 752} {"train_loss": -37.374053955078125, "global_step": 91049, "epoch": 752} {"train_loss": -37.9842643737793, "global_step": 91050, "epoch": 752} {"train_loss": -37.7927131652832, "global_step": 91051, "epoch": 752} {"train_loss": -36.941749572753906, "global_step": 91052, "epoch": 752} {"train_loss": -36.96343994140625, "global_step": 91053, "epoch": 752} {"train_loss": -37.66008377075195, "global_step": 91054, "epoch": 752} {"train_loss": -38.01538848876953, "global_step": 91055, "epoch": 752} {"train_loss": -36.85141372680664, "global_step": 91056, "epoch": 752} {"train_loss": -36.48922348022461, "global_step": 91057, "epoch": 752} {"train_loss": -34.982940673828125, "global_step": 91058, "epoch": 752} {"train_loss": -38.152687072753906, "global_step": 91059, "epoch": 752} {"train_loss": -37.56730270385742, "global_step": 91060, "epoch": 752} {"train_loss": -37.1927375793457, "global_step": 91061, "epoch": 752} {"train_loss": -33.77814483642578, "global_step": 91062, "epoch": 752} {"train_loss": -35.267967224121094, "global_step": 91063, "epoch": 752} {"train_loss": -37.23443603515625, "global_step": 91064, "epoch": 752} {"train_loss": -37.59133529663086, "global_step": 91065, "epoch": 752} {"train_loss": -35.390445709228516, "global_step": 91066, "epoch": 752} {"train_loss": -35.33053207397461, "global_step": 91067, "epoch": 752} {"train_loss": -35.89048385620117, "global_step": 91068, "epoch": 752} {"train_loss": -37.20343780517578, "global_step": 91069, "epoch": 752} {"train_loss": -24.807910919189453, "global_step": 91070, "epoch": 752} {"train_loss": -37.548675537109375, "global_step": 91071, "epoch": 752} {"train_loss": -36.72129440307617, "global_step": 91072, "epoch": 752} {"train_loss": -35.49534225463867, "global_step": 91073, "epoch": 752} {"train_loss": -32.37364196777344, "global_step": 91074, "epoch": 752} {"train_loss": -31.104562759399414, "global_step": 91075, "epoch": 752} {"train_loss": -21.780406951904297, "global_step": 91076, "epoch": 752} {"train_loss": -15.519055366516113, "global_step": 91077, "epoch": 752} {"train_loss": -35.42390060424805, "global_step": 91078, "epoch": 752} {"train_loss": -23.352764129638672, "global_step": 91079, "epoch": 752} {"train_loss": -30.23617935180664, "global_step": 91080, "epoch": 752} {"train_loss": -30.993988037109375, "global_step": 91081, "epoch": 752} {"train_loss": -32.19282913208008, "global_step": 91082, "epoch": 752} {"train_loss": -31.85408592224121, "global_step": 91083, "epoch": 752} {"train_loss": -31.94783592224121, "global_step": 91084, "epoch": 752} {"train_loss": -32.18748474121094, "global_step": 91085, "epoch": 752} {"train_loss": -33.27090072631836, "global_step": 91086, "epoch": 752} {"train_loss": -31.937891006469727, "global_step": 91087, "epoch": 752} {"train_loss": -34.990692138671875, "global_step": 91088, "epoch": 752} {"train_loss": -33.00048828125, "global_step": 91089, "epoch": 752} {"train_loss": -33.20420455932617, "global_step": 91090, "epoch": 752} {"train_loss": -35.131561279296875, "global_step": 91091, "epoch": 752} {"train_loss": -32.63734817504883, "global_step": 91092, "epoch": 752} {"train_loss": -33.85188293457031, "global_step": 91093, "epoch": 752} {"train_loss": -33.0113639831543, "global_step": 91094, "epoch": 752} {"train_loss": -34.988956451416016, "global_step": 91095, "epoch": 752} {"train_loss": -35.83757400512695, "global_step": 91096, "epoch": 752} {"train_loss": -34.76597213745117, "global_step": 91097, "epoch": 752} {"train_loss": -34.81550598144531, "global_step": 91098, "epoch": 752} {"train_loss": -34.76549530029297, "global_step": 91099, "epoch": 752} {"train_loss": -34.94881057739258, "global_step": 91100, "epoch": 752} {"train_loss": -34.48768615722656, "global_step": 91101, "epoch": 752} {"train_loss": -34.8742561340332, "global_step": 91102, "epoch": 752} {"train_loss": -34.87491989135742, "global_step": 91103, "epoch": 752} {"train_loss": -34.64631271362305, "global_step": 91104, "epoch": 752} {"train_loss": -34.45957946777344, "global_step": 91105, "epoch": 752} {"train_loss": -35.655487060546875, "global_step": 91106, "epoch": 752} {"train_loss": -36.22743606567383, "global_step": 91107, "epoch": 752} {"train_loss": -35.42200469970703, "global_step": 91108, "epoch": 752} {"train_loss": -35.865657806396484, "global_step": 91109, "epoch": 752} {"train_loss": -36.06098937988281, "global_step": 91110, "epoch": 752} {"train_loss": -35.69173812866211, "global_step": 91111, "epoch": 752} {"train_loss": -35.36226374255724, "global_step": 91112, "epoch": 752, "val_loss": 2606931.25} {"train_loss": -35.355342864990234, "global_step": 91113, "epoch": 753} {"train_loss": -35.83184814453125, "global_step": 91114, "epoch": 753} {"train_loss": -36.45449447631836, "global_step": 91115, "epoch": 753} {"train_loss": -35.73527145385742, "global_step": 91116, "epoch": 753} {"train_loss": -35.46586227416992, "global_step": 91117, "epoch": 753} {"train_loss": -36.612281799316406, "global_step": 91118, "epoch": 753} {"train_loss": -35.85784912109375, "global_step": 91119, "epoch": 753} {"train_loss": -36.6231689453125, "global_step": 91120, "epoch": 753} {"train_loss": -36.41899871826172, "global_step": 91121, "epoch": 753} {"train_loss": -36.484375, "global_step": 91122, "epoch": 753} {"train_loss": -36.820186614990234, "global_step": 91123, "epoch": 753} {"train_loss": -36.688968658447266, "global_step": 91124, "epoch": 753} {"train_loss": -36.64136505126953, "global_step": 91125, "epoch": 753} {"train_loss": -36.96492385864258, "global_step": 91126, "epoch": 753} {"train_loss": -36.230587005615234, "global_step": 91127, "epoch": 753} {"train_loss": -36.80205535888672, "global_step": 91128, "epoch": 753} {"train_loss": -36.77271270751953, "global_step": 91129, "epoch": 753} {"train_loss": -36.208839416503906, "global_step": 91130, "epoch": 753} {"train_loss": -36.84818649291992, "global_step": 91131, "epoch": 753} {"train_loss": -36.75970458984375, "global_step": 91132, "epoch": 753} {"train_loss": -36.68142318725586, "global_step": 91133, "epoch": 753} {"train_loss": -37.11686325073242, "global_step": 91134, "epoch": 753} {"train_loss": -37.28480911254883, "global_step": 91135, "epoch": 753} {"train_loss": -37.3426513671875, "global_step": 91136, "epoch": 753} {"train_loss": -37.26095199584961, "global_step": 91137, "epoch": 753} {"train_loss": -36.67129135131836, "global_step": 91138, "epoch": 753} {"train_loss": -36.70981979370117, "global_step": 91139, "epoch": 753} {"train_loss": -37.13886260986328, "global_step": 91140, "epoch": 753} {"train_loss": -37.112213134765625, "global_step": 91141, "epoch": 753} {"train_loss": -36.694332122802734, "global_step": 91142, "epoch": 753} {"train_loss": -37.12922286987305, "global_step": 91143, "epoch": 753} {"train_loss": -36.99148178100586, "global_step": 91144, "epoch": 753} {"train_loss": -37.36577606201172, "global_step": 91145, "epoch": 753} {"train_loss": -37.05985641479492, "global_step": 91146, "epoch": 753} {"train_loss": -36.9979133605957, "global_step": 91147, "epoch": 753} {"train_loss": -37.520957946777344, "global_step": 91148, "epoch": 753} {"train_loss": -37.743038177490234, "global_step": 91149, "epoch": 753} {"train_loss": -37.550132751464844, "global_step": 91150, "epoch": 753} {"train_loss": -37.633296966552734, "global_step": 91151, "epoch": 753} {"train_loss": -37.708221435546875, "global_step": 91152, "epoch": 753} {"train_loss": -37.600467681884766, "global_step": 91153, "epoch": 753} {"train_loss": -37.84075927734375, "global_step": 91154, "epoch": 753} {"train_loss": -37.802093505859375, "global_step": 91155, "epoch": 753} {"train_loss": -37.691017150878906, "global_step": 91156, "epoch": 753} {"train_loss": -37.468589782714844, "global_step": 91157, "epoch": 753} {"train_loss": -37.67969512939453, "global_step": 91158, "epoch": 753} {"train_loss": -38.17866516113281, "global_step": 91159, "epoch": 753} {"train_loss": -37.898860931396484, "global_step": 91160, "epoch": 753} {"train_loss": -38.212162017822266, "global_step": 91161, "epoch": 753} {"train_loss": -37.90801239013672, "global_step": 91162, "epoch": 753} {"train_loss": -37.95878982543945, "global_step": 91163, "epoch": 753} {"train_loss": -38.15671920776367, "global_step": 91164, "epoch": 753} {"train_loss": -38.1602783203125, "global_step": 91165, "epoch": 753} {"train_loss": -37.37975311279297, "global_step": 91166, "epoch": 753} {"train_loss": -38.55434799194336, "global_step": 91167, "epoch": 753} {"train_loss": -38.116268157958984, "global_step": 91168, "epoch": 753} {"train_loss": -38.221187591552734, "global_step": 91169, "epoch": 753} {"train_loss": -37.75345993041992, "global_step": 91170, "epoch": 753} {"train_loss": -38.286659240722656, "global_step": 91171, "epoch": 753} {"train_loss": -38.085445404052734, "global_step": 91172, "epoch": 753} {"train_loss": -37.901466369628906, "global_step": 91173, "epoch": 753} {"train_loss": -38.21126174926758, "global_step": 91174, "epoch": 753} {"train_loss": -37.924556732177734, "global_step": 91175, "epoch": 753} {"train_loss": -37.577274322509766, "global_step": 91176, "epoch": 753} {"train_loss": -38.21548080444336, "global_step": 91177, "epoch": 753} {"train_loss": -37.633705139160156, "global_step": 91178, "epoch": 753} {"train_loss": -36.57834243774414, "global_step": 91179, "epoch": 753} {"train_loss": -34.23451614379883, "global_step": 91180, "epoch": 753} {"train_loss": -36.173133850097656, "global_step": 91181, "epoch": 753} {"train_loss": -32.957611083984375, "global_step": 91182, "epoch": 753} {"train_loss": -26.668872833251953, "global_step": 91183, "epoch": 753} {"train_loss": -21.361928939819336, "global_step": 91184, "epoch": 753} {"train_loss": -27.521392822265625, "global_step": 91185, "epoch": 753} {"train_loss": -35.3698844909668, "global_step": 91186, "epoch": 753} {"train_loss": -26.684492111206055, "global_step": 91187, "epoch": 753} {"train_loss": -33.62778091430664, "global_step": 91188, "epoch": 753} {"train_loss": -33.84888458251953, "global_step": 91189, "epoch": 753} {"train_loss": -32.7697639465332, "global_step": 91190, "epoch": 753} {"train_loss": -34.21382141113281, "global_step": 91191, "epoch": 753} {"train_loss": -33.62060546875, "global_step": 91192, "epoch": 753} {"train_loss": -34.39613723754883, "global_step": 91193, "epoch": 753} {"train_loss": -36.63712692260742, "global_step": 91194, "epoch": 753} {"train_loss": -34.751766204833984, "global_step": 91195, "epoch": 753} {"train_loss": -36.751163482666016, "global_step": 91196, "epoch": 753} {"train_loss": -35.33504867553711, "global_step": 91197, "epoch": 753} {"train_loss": -36.164527893066406, "global_step": 91198, "epoch": 753} {"train_loss": -36.66033935546875, "global_step": 91199, "epoch": 753} {"train_loss": -36.34568405151367, "global_step": 91200, "epoch": 753} {"train_loss": -36.36638641357422, "global_step": 91201, "epoch": 753} {"train_loss": -36.580806732177734, "global_step": 91202, "epoch": 753} {"train_loss": -36.21694564819336, "global_step": 91203, "epoch": 753} {"train_loss": -36.6967887878418, "global_step": 91204, "epoch": 753} {"train_loss": -37.13743209838867, "global_step": 91205, "epoch": 753} {"train_loss": -36.97495651245117, "global_step": 91206, "epoch": 753} {"train_loss": -36.285430908203125, "global_step": 91207, "epoch": 753} {"train_loss": -37.30826950073242, "global_step": 91208, "epoch": 753} {"train_loss": -36.29255294799805, "global_step": 91209, "epoch": 753} {"train_loss": -37.15229415893555, "global_step": 91210, "epoch": 753} {"train_loss": -37.14505386352539, "global_step": 91211, "epoch": 753} {"train_loss": -36.377532958984375, "global_step": 91212, "epoch": 753} {"train_loss": -37.230377197265625, "global_step": 91213, "epoch": 753} {"train_loss": -37.44401168823242, "global_step": 91214, "epoch": 753} {"train_loss": -36.997676849365234, "global_step": 91215, "epoch": 753} {"train_loss": -37.36875534057617, "global_step": 91216, "epoch": 753} {"train_loss": -37.310028076171875, "global_step": 91217, "epoch": 753} {"train_loss": -37.137977600097656, "global_step": 91218, "epoch": 753} {"train_loss": -37.5470085144043, "global_step": 91219, "epoch": 753} {"train_loss": -37.20711898803711, "global_step": 91220, "epoch": 753} {"train_loss": -37.49960708618164, "global_step": 91221, "epoch": 753} {"train_loss": -37.58940887451172, "global_step": 91222, "epoch": 753} {"train_loss": -37.61306381225586, "global_step": 91223, "epoch": 753} {"train_loss": -38.06429672241211, "global_step": 91224, "epoch": 753} {"train_loss": -37.77960205078125, "global_step": 91225, "epoch": 753} {"train_loss": -37.76870346069336, "global_step": 91226, "epoch": 753} {"train_loss": -38.007144927978516, "global_step": 91227, "epoch": 753} {"train_loss": -37.809852600097656, "global_step": 91228, "epoch": 753} {"train_loss": -37.7764892578125, "global_step": 91229, "epoch": 753} {"train_loss": -37.34040451049805, "global_step": 91230, "epoch": 753} {"train_loss": -37.67098617553711, "global_step": 91231, "epoch": 753} {"train_loss": -37.67439651489258, "global_step": 91232, "epoch": 753} {"train_loss": -36.52377133330038, "global_step": 91233, "epoch": 753, "val_loss": 2637258.75} {"train_loss": -37.91676712036133, "global_step": 91234, "epoch": 754} {"train_loss": -37.992218017578125, "global_step": 91235, "epoch": 754} {"train_loss": -38.019622802734375, "global_step": 91236, "epoch": 754} {"train_loss": -37.885223388671875, "global_step": 91237, "epoch": 754} {"train_loss": -38.27241897583008, "global_step": 91238, "epoch": 754} {"train_loss": -38.107269287109375, "global_step": 91239, "epoch": 754} {"train_loss": -38.27616500854492, "global_step": 91240, "epoch": 754} {"train_loss": -38.33705520629883, "global_step": 91241, "epoch": 754} {"train_loss": -38.402278900146484, "global_step": 91242, "epoch": 754} {"train_loss": -38.38159942626953, "global_step": 91243, "epoch": 754} {"train_loss": -38.34406661987305, "global_step": 91244, "epoch": 754} {"train_loss": -37.98139572143555, "global_step": 91245, "epoch": 754} {"train_loss": -38.46450424194336, "global_step": 91246, "epoch": 754} {"train_loss": -38.313926696777344, "global_step": 91247, "epoch": 754} {"train_loss": -38.50861358642578, "global_step": 91248, "epoch": 754} {"train_loss": -38.4189567565918, "global_step": 91249, "epoch": 754} {"train_loss": -38.18648910522461, "global_step": 91250, "epoch": 754} {"train_loss": -38.85893249511719, "global_step": 91251, "epoch": 754} {"train_loss": -37.08958053588867, "global_step": 91252, "epoch": 754} {"train_loss": -38.025962829589844, "global_step": 91253, "epoch": 754} {"train_loss": -38.624244689941406, "global_step": 91254, "epoch": 754} {"train_loss": -37.973121643066406, "global_step": 91255, "epoch": 754} {"train_loss": -37.77665710449219, "global_step": 91256, "epoch": 754} {"train_loss": -37.376853942871094, "global_step": 91257, "epoch": 754} {"train_loss": -38.062400817871094, "global_step": 91258, "epoch": 754} {"train_loss": -38.074764251708984, "global_step": 91259, "epoch": 754} {"train_loss": -38.48141098022461, "global_step": 91260, "epoch": 754} {"train_loss": -38.39695358276367, "global_step": 91261, "epoch": 754} {"train_loss": -38.03523635864258, "global_step": 91262, "epoch": 754} {"train_loss": -38.73708724975586, "global_step": 91263, "epoch": 754} {"train_loss": -36.599830627441406, "global_step": 91264, "epoch": 754} {"train_loss": -38.654563903808594, "global_step": 91265, "epoch": 754} {"train_loss": -37.8272590637207, "global_step": 91266, "epoch": 754} {"train_loss": -38.65788269042969, "global_step": 91267, "epoch": 754} {"train_loss": -38.111724853515625, "global_step": 91268, "epoch": 754} {"train_loss": -37.81782150268555, "global_step": 91269, "epoch": 754} {"train_loss": -38.19264602661133, "global_step": 91270, "epoch": 754} {"train_loss": -38.13528060913086, "global_step": 91271, "epoch": 754} {"train_loss": -37.099952697753906, "global_step": 91272, "epoch": 754} {"train_loss": -37.24980926513672, "global_step": 91273, "epoch": 754} {"train_loss": -34.480342864990234, "global_step": 91274, "epoch": 754} {"train_loss": -36.88264083862305, "global_step": 91275, "epoch": 754} {"train_loss": -28.915878295898438, "global_step": 91276, "epoch": 754} {"train_loss": -36.022335052490234, "global_step": 91277, "epoch": 754} {"train_loss": -33.89081954956055, "global_step": 91278, "epoch": 754} {"train_loss": -28.654865264892578, "global_step": 91279, "epoch": 754} {"train_loss": -25.936376571655273, "global_step": 91280, "epoch": 754} {"train_loss": -35.3718147277832, "global_step": 91281, "epoch": 754} {"train_loss": -29.54158592224121, "global_step": 91282, "epoch": 754} {"train_loss": -17.07408332824707, "global_step": 91283, "epoch": 754} {"train_loss": -20.16494369506836, "global_step": 91284, "epoch": 754} {"train_loss": -25.549110412597656, "global_step": 91285, "epoch": 754} {"train_loss": -30.927030563354492, "global_step": 91286, "epoch": 754} {"train_loss": -26.34797477722168, "global_step": 91287, "epoch": 754} {"train_loss": -24.86659812927246, "global_step": 91288, "epoch": 754} {"train_loss": -28.968128204345703, "global_step": 91289, "epoch": 754} {"train_loss": -25.07792854309082, "global_step": 91290, "epoch": 754} {"train_loss": -28.331317901611328, "global_step": 91291, "epoch": 754} {"train_loss": -26.828580856323242, "global_step": 91292, "epoch": 754} {"train_loss": -23.965343475341797, "global_step": 91293, "epoch": 754} {"train_loss": -30.198261260986328, "global_step": 91294, "epoch": 754} {"train_loss": -30.240636825561523, "global_step": 91295, "epoch": 754} {"train_loss": -31.96695327758789, "global_step": 91296, "epoch": 754} {"train_loss": -32.05103302001953, "global_step": 91297, "epoch": 754} {"train_loss": -29.174819946289062, "global_step": 91298, "epoch": 754} {"train_loss": -33.119110107421875, "global_step": 91299, "epoch": 754} {"train_loss": -31.440336227416992, "global_step": 91300, "epoch": 754} {"train_loss": -32.1267204284668, "global_step": 91301, "epoch": 754} {"train_loss": -33.7102165222168, "global_step": 91302, "epoch": 754} {"train_loss": -33.1251220703125, "global_step": 91303, "epoch": 754} {"train_loss": -33.652679443359375, "global_step": 91304, "epoch": 754} {"train_loss": -33.75264358520508, "global_step": 91305, "epoch": 754} {"train_loss": -33.679283142089844, "global_step": 91306, "epoch": 754} {"train_loss": -33.793941497802734, "global_step": 91307, "epoch": 754} {"train_loss": -34.48508834838867, "global_step": 91308, "epoch": 754} {"train_loss": -33.29032516479492, "global_step": 91309, "epoch": 754} {"train_loss": -34.617733001708984, "global_step": 91310, "epoch": 754} {"train_loss": -34.20317840576172, "global_step": 91311, "epoch": 754} {"train_loss": -33.7730598449707, "global_step": 91312, "epoch": 754} {"train_loss": -32.81337356567383, "global_step": 91313, "epoch": 754} {"train_loss": -34.680030822753906, "global_step": 91314, "epoch": 754} {"train_loss": -34.257659912109375, "global_step": 91315, "epoch": 754} {"train_loss": -33.783626556396484, "global_step": 91316, "epoch": 754} {"train_loss": -34.134220123291016, "global_step": 91317, "epoch": 754} {"train_loss": -34.8344841003418, "global_step": 91318, "epoch": 754} {"train_loss": -35.01362228393555, "global_step": 91319, "epoch": 754} {"train_loss": -33.83665084838867, "global_step": 91320, "epoch": 754} {"train_loss": -35.0949821472168, "global_step": 91321, "epoch": 754} {"train_loss": -35.06234359741211, "global_step": 91322, "epoch": 754} {"train_loss": -34.7698860168457, "global_step": 91323, "epoch": 754} {"train_loss": -34.98933792114258, "global_step": 91324, "epoch": 754} {"train_loss": -34.53580856323242, "global_step": 91325, "epoch": 754} {"train_loss": -34.57822036743164, "global_step": 91326, "epoch": 754} {"train_loss": -35.03225326538086, "global_step": 91327, "epoch": 754} {"train_loss": -34.9002799987793, "global_step": 91328, "epoch": 754} {"train_loss": -35.309722900390625, "global_step": 91329, "epoch": 754} {"train_loss": -35.380794525146484, "global_step": 91330, "epoch": 754} {"train_loss": -34.81865310668945, "global_step": 91331, "epoch": 754} {"train_loss": -35.62801742553711, "global_step": 91332, "epoch": 754} {"train_loss": -35.122955322265625, "global_step": 91333, "epoch": 754} {"train_loss": -35.236656188964844, "global_step": 91334, "epoch": 754} {"train_loss": -34.669010162353516, "global_step": 91335, "epoch": 754} {"train_loss": -35.787818908691406, "global_step": 91336, "epoch": 754} {"train_loss": -34.99417495727539, "global_step": 91337, "epoch": 754} {"train_loss": -35.797969818115234, "global_step": 91338, "epoch": 754} {"train_loss": -36.1299934387207, "global_step": 91339, "epoch": 754} {"train_loss": -35.44515609741211, "global_step": 91340, "epoch": 754} {"train_loss": -36.06572341918945, "global_step": 91341, "epoch": 754} {"train_loss": -36.00881576538086, "global_step": 91342, "epoch": 754} {"train_loss": -36.10167694091797, "global_step": 91343, "epoch": 754} {"train_loss": -36.10293197631836, "global_step": 91344, "epoch": 754} {"train_loss": -36.15733337402344, "global_step": 91345, "epoch": 754} {"train_loss": -36.3963737487793, "global_step": 91346, "epoch": 754} {"train_loss": -36.02892303466797, "global_step": 91347, "epoch": 754} {"train_loss": -36.04993438720703, "global_step": 91348, "epoch": 754} {"train_loss": -35.83207321166992, "global_step": 91349, "epoch": 754} {"train_loss": -36.13576126098633, "global_step": 91350, "epoch": 754} {"train_loss": -36.1645393371582, "global_step": 91351, "epoch": 754} {"train_loss": -36.50107955932617, "global_step": 91352, "epoch": 754} {"train_loss": -36.52852249145508, "global_step": 91353, "epoch": 754} {"train_loss": -34.68602522542654, "global_step": 91354, "epoch": 754, "val_loss": 2598688.0} {"train_loss": -36.44895553588867, "global_step": 91355, "epoch": 755} {"train_loss": -36.46158981323242, "global_step": 91356, "epoch": 755} {"train_loss": -36.656681060791016, "global_step": 91357, "epoch": 755} {"train_loss": -36.662227630615234, "global_step": 91358, "epoch": 755} {"train_loss": -36.570045471191406, "global_step": 91359, "epoch": 755} {"train_loss": -36.4509162902832, "global_step": 91360, "epoch": 755} {"train_loss": -36.56730270385742, "global_step": 91361, "epoch": 755} {"train_loss": -36.75611114501953, "global_step": 91362, "epoch": 755} {"train_loss": -37.135536193847656, "global_step": 91363, "epoch": 755} {"train_loss": -37.09880447387695, "global_step": 91364, "epoch": 755} {"train_loss": -36.650264739990234, "global_step": 91365, "epoch": 755} {"train_loss": -37.169952392578125, "global_step": 91366, "epoch": 755} {"train_loss": -37.10776138305664, "global_step": 91367, "epoch": 755} {"train_loss": -36.60500717163086, "global_step": 91368, "epoch": 755} {"train_loss": -37.1829833984375, "global_step": 91369, "epoch": 755} {"train_loss": -37.222862243652344, "global_step": 91370, "epoch": 755} {"train_loss": -37.10084533691406, "global_step": 91371, "epoch": 755} {"train_loss": -37.35158920288086, "global_step": 91372, "epoch": 755} {"train_loss": -37.09525680541992, "global_step": 91373, "epoch": 755} {"train_loss": -37.232513427734375, "global_step": 91374, "epoch": 755} {"train_loss": -37.108455657958984, "global_step": 91375, "epoch": 755} {"train_loss": -37.027099609375, "global_step": 91376, "epoch": 755} {"train_loss": -37.35433578491211, "global_step": 91377, "epoch": 755} {"train_loss": -37.034698486328125, "global_step": 91378, "epoch": 755} {"train_loss": -37.539451599121094, "global_step": 91379, "epoch": 755} {"train_loss": -37.36301040649414, "global_step": 91380, "epoch": 755} {"train_loss": -37.419185638427734, "global_step": 91381, "epoch": 755} {"train_loss": -37.2381706237793, "global_step": 91382, "epoch": 755} {"train_loss": -37.134124755859375, "global_step": 91383, "epoch": 755} {"train_loss": -37.743343353271484, "global_step": 91384, "epoch": 755} {"train_loss": -37.66062927246094, "global_step": 91385, "epoch": 755} {"train_loss": -37.5363883972168, "global_step": 91386, "epoch": 755} {"train_loss": -37.46995162963867, "global_step": 91387, "epoch": 755} {"train_loss": -37.83999252319336, "global_step": 91388, "epoch": 755} {"train_loss": -37.68779754638672, "global_step": 91389, "epoch": 755} {"train_loss": -37.70357131958008, "global_step": 91390, "epoch": 755} {"train_loss": -37.7677001953125, "global_step": 91391, "epoch": 755} {"train_loss": -37.23492431640625, "global_step": 91392, "epoch": 755} {"train_loss": -37.425453186035156, "global_step": 91393, "epoch": 755} {"train_loss": -37.027095794677734, "global_step": 91394, "epoch": 755} {"train_loss": -37.10125732421875, "global_step": 91395, "epoch": 755} {"train_loss": -36.699127197265625, "global_step": 91396, "epoch": 755} {"train_loss": -37.142478942871094, "global_step": 91397, "epoch": 755} {"train_loss": -37.66872024536133, "global_step": 91398, "epoch": 755} {"train_loss": -37.458740234375, "global_step": 91399, "epoch": 755} {"train_loss": -37.19805908203125, "global_step": 91400, "epoch": 755} {"train_loss": -36.97854995727539, "global_step": 91401, "epoch": 755} {"train_loss": -36.355892181396484, "global_step": 91402, "epoch": 755} {"train_loss": -36.51210403442383, "global_step": 91403, "epoch": 755} {"train_loss": -36.90949630737305, "global_step": 91404, "epoch": 755} {"train_loss": -37.67655563354492, "global_step": 91405, "epoch": 755} {"train_loss": -37.279693603515625, "global_step": 91406, "epoch": 755} {"train_loss": -36.37531280517578, "global_step": 91407, "epoch": 755} {"train_loss": -37.288570404052734, "global_step": 91408, "epoch": 755} {"train_loss": -37.53776168823242, "global_step": 91409, "epoch": 755} {"train_loss": -37.10568618774414, "global_step": 91410, "epoch": 755} {"train_loss": -36.27167510986328, "global_step": 91411, "epoch": 755} {"train_loss": -36.668731689453125, "global_step": 91412, "epoch": 755} {"train_loss": -35.567813873291016, "global_step": 91413, "epoch": 755} {"train_loss": -34.96183776855469, "global_step": 91414, "epoch": 755} {"train_loss": -33.62946319580078, "global_step": 91415, "epoch": 755} {"train_loss": -35.56985092163086, "global_step": 91416, "epoch": 755} {"train_loss": -36.71645736694336, "global_step": 91417, "epoch": 755} {"train_loss": -33.259803771972656, "global_step": 91418, "epoch": 755} {"train_loss": -28.68549156188965, "global_step": 91419, "epoch": 755} {"train_loss": -29.857757568359375, "global_step": 91420, "epoch": 755} {"train_loss": -34.59564208984375, "global_step": 91421, "epoch": 755} {"train_loss": -37.24302291870117, "global_step": 91422, "epoch": 755} {"train_loss": -34.01777267456055, "global_step": 91423, "epoch": 755} {"train_loss": -32.258392333984375, "global_step": 91424, "epoch": 755} {"train_loss": -37.34688949584961, "global_step": 91425, "epoch": 755} {"train_loss": -34.34902572631836, "global_step": 91426, "epoch": 755} {"train_loss": -35.74466323852539, "global_step": 91427, "epoch": 755} {"train_loss": -36.80186080932617, "global_step": 91428, "epoch": 755} {"train_loss": -35.11637496948242, "global_step": 91429, "epoch": 755} {"train_loss": -37.5203742980957, "global_step": 91430, "epoch": 755} {"train_loss": -35.26082992553711, "global_step": 91431, "epoch": 755} {"train_loss": -37.110652923583984, "global_step": 91432, "epoch": 755} {"train_loss": -35.751224517822266, "global_step": 91433, "epoch": 755} {"train_loss": -36.443084716796875, "global_step": 91434, "epoch": 755} {"train_loss": -35.82305908203125, "global_step": 91435, "epoch": 755} {"train_loss": -36.88529586791992, "global_step": 91436, "epoch": 755} {"train_loss": -35.9381103515625, "global_step": 91437, "epoch": 755} {"train_loss": -37.29560852050781, "global_step": 91438, "epoch": 755} {"train_loss": -35.9201545715332, "global_step": 91439, "epoch": 755} {"train_loss": -37.11189651489258, "global_step": 91440, "epoch": 755} {"train_loss": -36.5346565246582, "global_step": 91441, "epoch": 755} {"train_loss": -36.25849533081055, "global_step": 91442, "epoch": 755} {"train_loss": -37.310428619384766, "global_step": 91443, "epoch": 755} {"train_loss": -36.99888229370117, "global_step": 91444, "epoch": 755} {"train_loss": -36.083919525146484, "global_step": 91445, "epoch": 755} {"train_loss": -37.473907470703125, "global_step": 91446, "epoch": 755} {"train_loss": -36.716346740722656, "global_step": 91447, "epoch": 755} {"train_loss": -37.40880584716797, "global_step": 91448, "epoch": 755} {"train_loss": -37.601715087890625, "global_step": 91449, "epoch": 755} {"train_loss": -36.57754135131836, "global_step": 91450, "epoch": 755} {"train_loss": -37.47623825073242, "global_step": 91451, "epoch": 755} {"train_loss": -37.00082015991211, "global_step": 91452, "epoch": 755} {"train_loss": -37.63684844970703, "global_step": 91453, "epoch": 755} {"train_loss": -36.688575744628906, "global_step": 91454, "epoch": 755} {"train_loss": -37.08454513549805, "global_step": 91455, "epoch": 755} {"train_loss": -37.58238220214844, "global_step": 91456, "epoch": 755} {"train_loss": -37.938629150390625, "global_step": 91457, "epoch": 755} {"train_loss": -37.97330856323242, "global_step": 91458, "epoch": 755} {"train_loss": -37.65888977050781, "global_step": 91459, "epoch": 755} {"train_loss": -37.52534103393555, "global_step": 91460, "epoch": 755} {"train_loss": -37.45558547973633, "global_step": 91461, "epoch": 755} {"train_loss": -38.088871002197266, "global_step": 91462, "epoch": 755} {"train_loss": -37.91946792602539, "global_step": 91463, "epoch": 755} {"train_loss": -37.742252349853516, "global_step": 91464, "epoch": 755} {"train_loss": -37.43960189819336, "global_step": 91465, "epoch": 755} {"train_loss": -36.44502258300781, "global_step": 91466, "epoch": 755} {"train_loss": -37.980403900146484, "global_step": 91467, "epoch": 755} {"train_loss": -37.767696380615234, "global_step": 91468, "epoch": 755} {"train_loss": -37.81000518798828, "global_step": 91469, "epoch": 755} {"train_loss": -38.100704193115234, "global_step": 91470, "epoch": 755} {"train_loss": -38.21036911010742, "global_step": 91471, "epoch": 755} {"train_loss": -37.6578254699707, "global_step": 91472, "epoch": 755} {"train_loss": -37.20504379272461, "global_step": 91473, "epoch": 755} {"train_loss": -37.82266616821289, "global_step": 91474, "epoch": 755} {"train_loss": -36.75893696871671, "global_step": 91475, "epoch": 755, "val_loss": 2597959.75} {"train_loss": -37.317256927490234, "global_step": 91476, "epoch": 756} {"train_loss": -36.8930778503418, "global_step": 91477, "epoch": 756} {"train_loss": -37.03937911987305, "global_step": 91478, "epoch": 756} {"train_loss": -37.401920318603516, "global_step": 91479, "epoch": 756} {"train_loss": -37.55677795410156, "global_step": 91480, "epoch": 756} {"train_loss": -38.26701736450195, "global_step": 91481, "epoch": 756} {"train_loss": -37.84830856323242, "global_step": 91482, "epoch": 756} {"train_loss": -37.87964630126953, "global_step": 91483, "epoch": 756} {"train_loss": -36.96807861328125, "global_step": 91484, "epoch": 756} {"train_loss": -37.32209014892578, "global_step": 91485, "epoch": 756} {"train_loss": -37.49886703491211, "global_step": 91486, "epoch": 756} {"train_loss": -37.32855987548828, "global_step": 91487, "epoch": 756} {"train_loss": -38.006343841552734, "global_step": 91488, "epoch": 756} {"train_loss": -37.5606803894043, "global_step": 91489, "epoch": 756} {"train_loss": -37.69148635864258, "global_step": 91490, "epoch": 756} {"train_loss": -38.11599349975586, "global_step": 91491, "epoch": 756} {"train_loss": -38.74015808105469, "global_step": 91492, "epoch": 756} {"train_loss": -38.268577575683594, "global_step": 91493, "epoch": 756} {"train_loss": -37.86159896850586, "global_step": 91494, "epoch": 756} {"train_loss": -38.11931228637695, "global_step": 91495, "epoch": 756} {"train_loss": -38.50825119018555, "global_step": 91496, "epoch": 756} {"train_loss": -38.50242233276367, "global_step": 91497, "epoch": 756} {"train_loss": -37.349124908447266, "global_step": 91498, "epoch": 756} {"train_loss": -37.94340133666992, "global_step": 91499, "epoch": 756} {"train_loss": -37.991851806640625, "global_step": 91500, "epoch": 756} {"train_loss": -38.31084060668945, "global_step": 91501, "epoch": 756} {"train_loss": -38.14350128173828, "global_step": 91502, "epoch": 756} {"train_loss": -37.927120208740234, "global_step": 91503, "epoch": 756} {"train_loss": -37.74856948852539, "global_step": 91504, "epoch": 756} {"train_loss": -38.42454528808594, "global_step": 91505, "epoch": 756} {"train_loss": -37.7691764831543, "global_step": 91506, "epoch": 756} {"train_loss": -37.53249740600586, "global_step": 91507, "epoch": 756} {"train_loss": -36.80290603637695, "global_step": 91508, "epoch": 756} {"train_loss": -36.611061096191406, "global_step": 91509, "epoch": 756} {"train_loss": -35.31758499145508, "global_step": 91510, "epoch": 756} {"train_loss": -35.51869583129883, "global_step": 91511, "epoch": 756} {"train_loss": -37.55866241455078, "global_step": 91512, "epoch": 756} {"train_loss": -38.29914474487305, "global_step": 91513, "epoch": 756} {"train_loss": -36.39424514770508, "global_step": 91514, "epoch": 756} {"train_loss": -34.643733978271484, "global_step": 91515, "epoch": 756} {"train_loss": -33.4458122253418, "global_step": 91516, "epoch": 756} {"train_loss": -38.167945861816406, "global_step": 91517, "epoch": 756} {"train_loss": -36.36426544189453, "global_step": 91518, "epoch": 756} {"train_loss": -35.40681076049805, "global_step": 91519, "epoch": 756} {"train_loss": -37.234378814697266, "global_step": 91520, "epoch": 756} {"train_loss": -37.43336486816406, "global_step": 91521, "epoch": 756} {"train_loss": -36.42382049560547, "global_step": 91522, "epoch": 756} {"train_loss": -37.1696891784668, "global_step": 91523, "epoch": 756} {"train_loss": -36.613807678222656, "global_step": 91524, "epoch": 756} {"train_loss": -38.172237396240234, "global_step": 91525, "epoch": 756} {"train_loss": -37.488014221191406, "global_step": 91526, "epoch": 756} {"train_loss": -37.397335052490234, "global_step": 91527, "epoch": 756} {"train_loss": -37.85491180419922, "global_step": 91528, "epoch": 756} {"train_loss": -36.42216873168945, "global_step": 91529, "epoch": 756} {"train_loss": -37.74237823486328, "global_step": 91530, "epoch": 756} {"train_loss": -38.24117660522461, "global_step": 91531, "epoch": 756} {"train_loss": -37.0323486328125, "global_step": 91532, "epoch": 756} {"train_loss": -36.78789138793945, "global_step": 91533, "epoch": 756} {"train_loss": -36.810340881347656, "global_step": 91534, "epoch": 756} {"train_loss": -37.92118835449219, "global_step": 91535, "epoch": 756} {"train_loss": -38.469730377197266, "global_step": 91536, "epoch": 756} {"train_loss": -37.581214904785156, "global_step": 91537, "epoch": 756} {"train_loss": -37.4925422668457, "global_step": 91538, "epoch": 756} {"train_loss": -37.880836486816406, "global_step": 91539, "epoch": 756} {"train_loss": -36.447837829589844, "global_step": 91540, "epoch": 756} {"train_loss": -37.41415023803711, "global_step": 91541, "epoch": 756} {"train_loss": -37.56020736694336, "global_step": 91542, "epoch": 756} {"train_loss": -37.22426223754883, "global_step": 91543, "epoch": 756} {"train_loss": -37.0800895690918, "global_step": 91544, "epoch": 756} {"train_loss": -37.212459564208984, "global_step": 91545, "epoch": 756} {"train_loss": -38.207664489746094, "global_step": 91546, "epoch": 756} {"train_loss": -38.00701904296875, "global_step": 91547, "epoch": 756} {"train_loss": -37.37522506713867, "global_step": 91548, "epoch": 756} {"train_loss": -37.36821746826172, "global_step": 91549, "epoch": 756} {"train_loss": -37.85724639892578, "global_step": 91550, "epoch": 756} {"train_loss": -37.4197883605957, "global_step": 91551, "epoch": 756} {"train_loss": -38.11195755004883, "global_step": 91552, "epoch": 756} {"train_loss": -37.93076705932617, "global_step": 91553, "epoch": 756} {"train_loss": -37.40852737426758, "global_step": 91554, "epoch": 756} {"train_loss": -37.85787582397461, "global_step": 91555, "epoch": 756} {"train_loss": -37.642578125, "global_step": 91556, "epoch": 756} {"train_loss": -37.97673416137695, "global_step": 91557, "epoch": 756} {"train_loss": -38.28432846069336, "global_step": 91558, "epoch": 756} {"train_loss": -37.86329650878906, "global_step": 91559, "epoch": 756} {"train_loss": -37.54231643676758, "global_step": 91560, "epoch": 756} {"train_loss": -37.30533218383789, "global_step": 91561, "epoch": 756} {"train_loss": -38.51115798950195, "global_step": 91562, "epoch": 756} {"train_loss": -38.60934066772461, "global_step": 91563, "epoch": 756} {"train_loss": -37.74425506591797, "global_step": 91564, "epoch": 756} {"train_loss": -37.44677734375, "global_step": 91565, "epoch": 756} {"train_loss": -38.69148635864258, "global_step": 91566, "epoch": 756} {"train_loss": -38.530029296875, "global_step": 91567, "epoch": 756} {"train_loss": -38.50002670288086, "global_step": 91568, "epoch": 756} {"train_loss": -38.68655014038086, "global_step": 91569, "epoch": 756} {"train_loss": -38.815303802490234, "global_step": 91570, "epoch": 756} {"train_loss": -38.1242561340332, "global_step": 91571, "epoch": 756} {"train_loss": -38.85840606689453, "global_step": 91572, "epoch": 756} {"train_loss": -38.980125427246094, "global_step": 91573, "epoch": 756} {"train_loss": -38.68659591674805, "global_step": 91574, "epoch": 756} {"train_loss": -38.6788215637207, "global_step": 91575, "epoch": 756} {"train_loss": -38.568214416503906, "global_step": 91576, "epoch": 756} {"train_loss": -38.319217681884766, "global_step": 91577, "epoch": 756} {"train_loss": -38.59905242919922, "global_step": 91578, "epoch": 756} {"train_loss": -38.1529426574707, "global_step": 91579, "epoch": 756} {"train_loss": -38.790504455566406, "global_step": 91580, "epoch": 756} {"train_loss": -38.54507064819336, "global_step": 91581, "epoch": 756} {"train_loss": -38.50276565551758, "global_step": 91582, "epoch": 756} {"train_loss": -38.74897766113281, "global_step": 91583, "epoch": 756} {"train_loss": -38.480587005615234, "global_step": 91584, "epoch": 756} {"train_loss": -38.475074768066406, "global_step": 91585, "epoch": 756} {"train_loss": -38.4056396484375, "global_step": 91586, "epoch": 756} {"train_loss": -38.19947052001953, "global_step": 91587, "epoch": 756} {"train_loss": -37.62314987182617, "global_step": 91588, "epoch": 756} {"train_loss": -37.902992248535156, "global_step": 91589, "epoch": 756} {"train_loss": -34.09267807006836, "global_step": 91590, "epoch": 756} {"train_loss": -37.207008361816406, "global_step": 91591, "epoch": 756} {"train_loss": -38.22478103637695, "global_step": 91592, "epoch": 756} {"train_loss": -36.3526611328125, "global_step": 91593, "epoch": 756} {"train_loss": -35.8402099609375, "global_step": 91594, "epoch": 756} {"train_loss": -36.84112548828125, "global_step": 91595, "epoch": 756} {"train_loss": -37.61031382537085, "global_step": 91596, "epoch": 756, "val_loss": 2666552.75} {"train_loss": -35.385963439941406, "global_step": 91597, "epoch": 757} {"train_loss": -36.03336715698242, "global_step": 91598, "epoch": 757} {"train_loss": -34.7645263671875, "global_step": 91599, "epoch": 757} {"train_loss": -37.14198684692383, "global_step": 91600, "epoch": 757} {"train_loss": -36.494503021240234, "global_step": 91601, "epoch": 757} {"train_loss": -38.14095687866211, "global_step": 91602, "epoch": 757} {"train_loss": -37.59542465209961, "global_step": 91603, "epoch": 757} {"train_loss": -37.30810546875, "global_step": 91604, "epoch": 757} {"train_loss": -33.6548957824707, "global_step": 91605, "epoch": 757} {"train_loss": -37.27808380126953, "global_step": 91606, "epoch": 757} {"train_loss": -36.1478385925293, "global_step": 91607, "epoch": 757} {"train_loss": -35.86602783203125, "global_step": 91608, "epoch": 757} {"train_loss": -36.9728889465332, "global_step": 91609, "epoch": 757} {"train_loss": -37.37399673461914, "global_step": 91610, "epoch": 757} {"train_loss": -36.311500549316406, "global_step": 91611, "epoch": 757} {"train_loss": -37.075714111328125, "global_step": 91612, "epoch": 757} {"train_loss": -37.89448165893555, "global_step": 91613, "epoch": 757} {"train_loss": -36.04038619995117, "global_step": 91614, "epoch": 757} {"train_loss": -34.567623138427734, "global_step": 91615, "epoch": 757} {"train_loss": -36.09910202026367, "global_step": 91616, "epoch": 757} {"train_loss": -37.557098388671875, "global_step": 91617, "epoch": 757} {"train_loss": -37.27767562866211, "global_step": 91618, "epoch": 757} {"train_loss": -37.5890998840332, "global_step": 91619, "epoch": 757} {"train_loss": -37.09800338745117, "global_step": 91620, "epoch": 757} {"train_loss": -37.315338134765625, "global_step": 91621, "epoch": 757} {"train_loss": -35.30802917480469, "global_step": 91622, "epoch": 757} {"train_loss": -36.354217529296875, "global_step": 91623, "epoch": 757} {"train_loss": -37.18817138671875, "global_step": 91624, "epoch": 757} {"train_loss": -36.685577392578125, "global_step": 91625, "epoch": 757} {"train_loss": -37.350826263427734, "global_step": 91626, "epoch": 757} {"train_loss": -37.181861877441406, "global_step": 91627, "epoch": 757} {"train_loss": -37.542110443115234, "global_step": 91628, "epoch": 757} {"train_loss": -36.85147476196289, "global_step": 91629, "epoch": 757} {"train_loss": -37.82883834838867, "global_step": 91630, "epoch": 757} {"train_loss": -37.98899459838867, "global_step": 91631, "epoch": 757} {"train_loss": -37.29972457885742, "global_step": 91632, "epoch": 757} {"train_loss": -37.548038482666016, "global_step": 91633, "epoch": 757} {"train_loss": -37.3765869140625, "global_step": 91634, "epoch": 757} {"train_loss": -36.824302673339844, "global_step": 91635, "epoch": 757} {"train_loss": -37.77781295776367, "global_step": 91636, "epoch": 757} {"train_loss": -38.308494567871094, "global_step": 91637, "epoch": 757} {"train_loss": -37.53410720825195, "global_step": 91638, "epoch": 757} {"train_loss": -36.32609939575195, "global_step": 91639, "epoch": 757} {"train_loss": -37.36068344116211, "global_step": 91640, "epoch": 757} {"train_loss": -38.08069610595703, "global_step": 91641, "epoch": 757} {"train_loss": -37.23245620727539, "global_step": 91642, "epoch": 757} {"train_loss": -38.2305793762207, "global_step": 91643, "epoch": 757} {"train_loss": -37.31534957885742, "global_step": 91644, "epoch": 757} {"train_loss": -38.52902603149414, "global_step": 91645, "epoch": 757} {"train_loss": -37.57039260864258, "global_step": 91646, "epoch": 757} {"train_loss": -37.7945556640625, "global_step": 91647, "epoch": 757} {"train_loss": -37.51119613647461, "global_step": 91648, "epoch": 757} {"train_loss": -37.39094924926758, "global_step": 91649, "epoch": 757} {"train_loss": -38.112831115722656, "global_step": 91650, "epoch": 757} {"train_loss": -36.46833038330078, "global_step": 91651, "epoch": 757} {"train_loss": -37.490665435791016, "global_step": 91652, "epoch": 757} {"train_loss": -38.21462631225586, "global_step": 91653, "epoch": 757} {"train_loss": -36.35447311401367, "global_step": 91654, "epoch": 757} {"train_loss": -36.214534759521484, "global_step": 91655, "epoch": 757} {"train_loss": -37.31684494018555, "global_step": 91656, "epoch": 757} {"train_loss": -37.10382080078125, "global_step": 91657, "epoch": 757} {"train_loss": -37.48985290527344, "global_step": 91658, "epoch": 757} {"train_loss": -37.48569869995117, "global_step": 91659, "epoch": 757} {"train_loss": -37.6561393737793, "global_step": 91660, "epoch": 757} {"train_loss": -37.22805404663086, "global_step": 91661, "epoch": 757} {"train_loss": -36.772865295410156, "global_step": 91662, "epoch": 757} {"train_loss": -36.463714599609375, "global_step": 91663, "epoch": 757} {"train_loss": -38.015655517578125, "global_step": 91664, "epoch": 757} {"train_loss": -35.78157424926758, "global_step": 91665, "epoch": 757} {"train_loss": -35.48031234741211, "global_step": 91666, "epoch": 757} {"train_loss": -35.548343658447266, "global_step": 91667, "epoch": 757} {"train_loss": -35.73795700073242, "global_step": 91668, "epoch": 757} {"train_loss": -35.71152877807617, "global_step": 91669, "epoch": 757} {"train_loss": -36.339412689208984, "global_step": 91670, "epoch": 757} {"train_loss": -37.0257568359375, "global_step": 91671, "epoch": 757} {"train_loss": -36.652626037597656, "global_step": 91672, "epoch": 757} {"train_loss": -37.29396438598633, "global_step": 91673, "epoch": 757} {"train_loss": -36.78705978393555, "global_step": 91674, "epoch": 757} {"train_loss": -36.52466583251953, "global_step": 91675, "epoch": 757} {"train_loss": -35.64759063720703, "global_step": 91676, "epoch": 757} {"train_loss": -36.535675048828125, "global_step": 91677, "epoch": 757} {"train_loss": -38.01557159423828, "global_step": 91678, "epoch": 757} {"train_loss": -36.749141693115234, "global_step": 91679, "epoch": 757} {"train_loss": -35.24977493286133, "global_step": 91680, "epoch": 757} {"train_loss": -34.068267822265625, "global_step": 91681, "epoch": 757} {"train_loss": -37.12041091918945, "global_step": 91682, "epoch": 757} {"train_loss": -36.55171585083008, "global_step": 91683, "epoch": 757} {"train_loss": -32.68960189819336, "global_step": 91684, "epoch": 757} {"train_loss": -32.91265869140625, "global_step": 91685, "epoch": 757} {"train_loss": -37.04606246948242, "global_step": 91686, "epoch": 757} {"train_loss": -34.275794982910156, "global_step": 91687, "epoch": 757} {"train_loss": -33.5030632019043, "global_step": 91688, "epoch": 757} {"train_loss": -37.1069450378418, "global_step": 91689, "epoch": 757} {"train_loss": -35.08854293823242, "global_step": 91690, "epoch": 757} {"train_loss": -35.33721160888672, "global_step": 91691, "epoch": 757} {"train_loss": -37.53607940673828, "global_step": 91692, "epoch": 757} {"train_loss": -34.53788757324219, "global_step": 91693, "epoch": 757} {"train_loss": -37.005977630615234, "global_step": 91694, "epoch": 757} {"train_loss": -35.61581039428711, "global_step": 91695, "epoch": 757} {"train_loss": -36.592037200927734, "global_step": 91696, "epoch": 757} {"train_loss": -37.137210845947266, "global_step": 91697, "epoch": 757} {"train_loss": -36.30918502807617, "global_step": 91698, "epoch": 757} {"train_loss": -37.49427795410156, "global_step": 91699, "epoch": 757} {"train_loss": -35.99809265136719, "global_step": 91700, "epoch": 757} {"train_loss": -37.42201614379883, "global_step": 91701, "epoch": 757} {"train_loss": -36.40265655517578, "global_step": 91702, "epoch": 757} {"train_loss": -37.73992156982422, "global_step": 91703, "epoch": 757} {"train_loss": -37.0433464050293, "global_step": 91704, "epoch": 757} {"train_loss": -37.86766815185547, "global_step": 91705, "epoch": 757} {"train_loss": -37.81968307495117, "global_step": 91706, "epoch": 757} {"train_loss": -38.1048469543457, "global_step": 91707, "epoch": 757} {"train_loss": -38.03719711303711, "global_step": 91708, "epoch": 757} {"train_loss": -38.39353561401367, "global_step": 91709, "epoch": 757} {"train_loss": -37.441890716552734, "global_step": 91710, "epoch": 757} {"train_loss": -38.3907356262207, "global_step": 91711, "epoch": 757} {"train_loss": -37.72941970825195, "global_step": 91712, "epoch": 757} {"train_loss": -38.32809066772461, "global_step": 91713, "epoch": 757} {"train_loss": -37.72974395751953, "global_step": 91714, "epoch": 757} {"train_loss": -37.753173828125, "global_step": 91715, "epoch": 757} {"train_loss": -38.04694366455078, "global_step": 91716, "epoch": 757} {"train_loss": -36.83603021921205, "global_step": 91717, "epoch": 757, "val_loss": 2552900.0} {"train_loss": -38.31899642944336, "global_step": 91718, "epoch": 758} {"train_loss": -38.14411544799805, "global_step": 91719, "epoch": 758} {"train_loss": -38.007667541503906, "global_step": 91720, "epoch": 758} {"train_loss": -38.6359977722168, "global_step": 91721, "epoch": 758} {"train_loss": -38.01683807373047, "global_step": 91722, "epoch": 758} {"train_loss": -38.23886489868164, "global_step": 91723, "epoch": 758} {"train_loss": -38.57778549194336, "global_step": 91724, "epoch": 758} {"train_loss": -38.77171325683594, "global_step": 91725, "epoch": 758} {"train_loss": -38.2440071105957, "global_step": 91726, "epoch": 758} {"train_loss": -38.513946533203125, "global_step": 91727, "epoch": 758} {"train_loss": -38.30831527709961, "global_step": 91728, "epoch": 758} {"train_loss": -38.68745803833008, "global_step": 91729, "epoch": 758} {"train_loss": -38.69794845581055, "global_step": 91730, "epoch": 758} {"train_loss": -35.777587890625, "global_step": 91731, "epoch": 758} {"train_loss": -38.78739547729492, "global_step": 91732, "epoch": 758} {"train_loss": -37.6376838684082, "global_step": 91733, "epoch": 758} {"train_loss": -37.32137680053711, "global_step": 91734, "epoch": 758} {"train_loss": -38.26807403564453, "global_step": 91735, "epoch": 758} {"train_loss": -37.900726318359375, "global_step": 91736, "epoch": 758} {"train_loss": -38.4448356628418, "global_step": 91737, "epoch": 758} {"train_loss": -38.23207473754883, "global_step": 91738, "epoch": 758} {"train_loss": -37.113189697265625, "global_step": 91739, "epoch": 758} {"train_loss": -37.5687370300293, "global_step": 91740, "epoch": 758} {"train_loss": -36.63558578491211, "global_step": 91741, "epoch": 758} {"train_loss": -35.05729293823242, "global_step": 91742, "epoch": 758} {"train_loss": -37.91123580932617, "global_step": 91743, "epoch": 758} {"train_loss": -38.21041488647461, "global_step": 91744, "epoch": 758} {"train_loss": -38.801856994628906, "global_step": 91745, "epoch": 758} {"train_loss": -37.78933334350586, "global_step": 91746, "epoch": 758} {"train_loss": -37.10342025756836, "global_step": 91747, "epoch": 758} {"train_loss": -38.3972282409668, "global_step": 91748, "epoch": 758} {"train_loss": -38.09883117675781, "global_step": 91749, "epoch": 758} {"train_loss": -36.77104187011719, "global_step": 91750, "epoch": 758} {"train_loss": -38.176265716552734, "global_step": 91751, "epoch": 758} {"train_loss": -38.12739181518555, "global_step": 91752, "epoch": 758} {"train_loss": -37.499671936035156, "global_step": 91753, "epoch": 758} {"train_loss": -38.091365814208984, "global_step": 91754, "epoch": 758} {"train_loss": -37.98545455932617, "global_step": 91755, "epoch": 758} {"train_loss": -37.08819580078125, "global_step": 91756, "epoch": 758} {"train_loss": -36.5281867980957, "global_step": 91757, "epoch": 758} {"train_loss": -34.414756774902344, "global_step": 91758, "epoch": 758} {"train_loss": -37.72357177734375, "global_step": 91759, "epoch": 758} {"train_loss": -36.9987907409668, "global_step": 91760, "epoch": 758} {"train_loss": -38.143348693847656, "global_step": 91761, "epoch": 758} {"train_loss": -37.257991790771484, "global_step": 91762, "epoch": 758} {"train_loss": -34.81985855102539, "global_step": 91763, "epoch": 758} {"train_loss": -37.39530563354492, "global_step": 91764, "epoch": 758} {"train_loss": -36.88198471069336, "global_step": 91765, "epoch": 758} {"train_loss": -36.49110794067383, "global_step": 91766, "epoch": 758} {"train_loss": -37.02342224121094, "global_step": 91767, "epoch": 758} {"train_loss": -36.779335021972656, "global_step": 91768, "epoch": 758} {"train_loss": -36.705047607421875, "global_step": 91769, "epoch": 758} {"train_loss": -36.52960205078125, "global_step": 91770, "epoch": 758} {"train_loss": -36.834293365478516, "global_step": 91771, "epoch": 758} {"train_loss": -35.77402877807617, "global_step": 91772, "epoch": 758} {"train_loss": -37.47754669189453, "global_step": 91773, "epoch": 758} {"train_loss": -37.48041915893555, "global_step": 91774, "epoch": 758} {"train_loss": -38.09761428833008, "global_step": 91775, "epoch": 758} {"train_loss": -36.84109115600586, "global_step": 91776, "epoch": 758} {"train_loss": -37.842220306396484, "global_step": 91777, "epoch": 758} {"train_loss": -38.05021286010742, "global_step": 91778, "epoch": 758} {"train_loss": -37.42926788330078, "global_step": 91779, "epoch": 758} {"train_loss": -35.9854736328125, "global_step": 91780, "epoch": 758} {"train_loss": -37.34780502319336, "global_step": 91781, "epoch": 758} {"train_loss": -34.5197868347168, "global_step": 91782, "epoch": 758} {"train_loss": -36.39854431152344, "global_step": 91783, "epoch": 758} {"train_loss": -33.06563949584961, "global_step": 91784, "epoch": 758} {"train_loss": -33.64142990112305, "global_step": 91785, "epoch": 758} {"train_loss": -37.77690505981445, "global_step": 91786, "epoch": 758} {"train_loss": -34.88987350463867, "global_step": 91787, "epoch": 758} {"train_loss": -35.7515869140625, "global_step": 91788, "epoch": 758} {"train_loss": -34.01201248168945, "global_step": 91789, "epoch": 758} {"train_loss": -36.55005645751953, "global_step": 91790, "epoch": 758} {"train_loss": -37.22370529174805, "global_step": 91791, "epoch": 758} {"train_loss": -34.957611083984375, "global_step": 91792, "epoch": 758} {"train_loss": -36.86098098754883, "global_step": 91793, "epoch": 758} {"train_loss": -37.41575241088867, "global_step": 91794, "epoch": 758} {"train_loss": -36.62358474731445, "global_step": 91795, "epoch": 758} {"train_loss": -36.44968795776367, "global_step": 91796, "epoch": 758} {"train_loss": -36.70556640625, "global_step": 91797, "epoch": 758} {"train_loss": -37.36598205566406, "global_step": 91798, "epoch": 758} {"train_loss": -36.3974609375, "global_step": 91799, "epoch": 758} {"train_loss": -37.4988899230957, "global_step": 91800, "epoch": 758} {"train_loss": -37.64971923828125, "global_step": 91801, "epoch": 758} {"train_loss": -36.76300048828125, "global_step": 91802, "epoch": 758} {"train_loss": -38.06146240234375, "global_step": 91803, "epoch": 758} {"train_loss": -36.9874382019043, "global_step": 91804, "epoch": 758} {"train_loss": -36.90914535522461, "global_step": 91805, "epoch": 758} {"train_loss": -37.205570220947266, "global_step": 91806, "epoch": 758} {"train_loss": -37.087562561035156, "global_step": 91807, "epoch": 758} {"train_loss": -37.4742546081543, "global_step": 91808, "epoch": 758} {"train_loss": -37.926841735839844, "global_step": 91809, "epoch": 758} {"train_loss": -37.55110549926758, "global_step": 91810, "epoch": 758} {"train_loss": -38.27357864379883, "global_step": 91811, "epoch": 758} {"train_loss": -37.350929260253906, "global_step": 91812, "epoch": 758} {"train_loss": -37.56129837036133, "global_step": 91813, "epoch": 758} {"train_loss": -36.552669525146484, "global_step": 91814, "epoch": 758} {"train_loss": -37.7087516784668, "global_step": 91815, "epoch": 758} {"train_loss": -37.848873138427734, "global_step": 91816, "epoch": 758} {"train_loss": -37.76416015625, "global_step": 91817, "epoch": 758} {"train_loss": -37.81157684326172, "global_step": 91818, "epoch": 758} {"train_loss": -37.75313186645508, "global_step": 91819, "epoch": 758} {"train_loss": -37.95124435424805, "global_step": 91820, "epoch": 758} {"train_loss": -37.747371673583984, "global_step": 91821, "epoch": 758} {"train_loss": -37.33927536010742, "global_step": 91822, "epoch": 758} {"train_loss": -38.59412384033203, "global_step": 91823, "epoch": 758} {"train_loss": -37.85956954956055, "global_step": 91824, "epoch": 758} {"train_loss": -38.318111419677734, "global_step": 91825, "epoch": 758} {"train_loss": -38.03359603881836, "global_step": 91826, "epoch": 758} {"train_loss": -38.7633056640625, "global_step": 91827, "epoch": 758} {"train_loss": -38.35639953613281, "global_step": 91828, "epoch": 758} {"train_loss": -38.45858383178711, "global_step": 91829, "epoch": 758} {"train_loss": -38.138771057128906, "global_step": 91830, "epoch": 758} {"train_loss": -38.322505950927734, "global_step": 91831, "epoch": 758} {"train_loss": -38.92399215698242, "global_step": 91832, "epoch": 758} {"train_loss": -38.22629928588867, "global_step": 91833, "epoch": 758} {"train_loss": -37.85698318481445, "global_step": 91834, "epoch": 758} {"train_loss": -38.2551383972168, "global_step": 91835, "epoch": 758} {"train_loss": -37.19011306762695, "global_step": 91836, "epoch": 758} {"train_loss": -38.523860931396484, "global_step": 91837, "epoch": 758} {"train_loss": -37.377007350448736, "global_step": 91838, "epoch": 758, "val_loss": 2575116.0} {"train_loss": -38.20855712890625, "global_step": 91839, "epoch": 759} {"train_loss": -38.423763275146484, "global_step": 91840, "epoch": 759} {"train_loss": -37.949005126953125, "global_step": 91841, "epoch": 759} {"train_loss": -38.422080993652344, "global_step": 91842, "epoch": 759} {"train_loss": -38.77266311645508, "global_step": 91843, "epoch": 759} {"train_loss": -38.56718063354492, "global_step": 91844, "epoch": 759} {"train_loss": -37.16017532348633, "global_step": 91845, "epoch": 759} {"train_loss": -36.21692657470703, "global_step": 91846, "epoch": 759} {"train_loss": -36.33572006225586, "global_step": 91847, "epoch": 759} {"train_loss": -36.84482955932617, "global_step": 91848, "epoch": 759} {"train_loss": -38.84291458129883, "global_step": 91849, "epoch": 759} {"train_loss": -37.80428695678711, "global_step": 91850, "epoch": 759} {"train_loss": -36.959564208984375, "global_step": 91851, "epoch": 759} {"train_loss": -37.163978576660156, "global_step": 91852, "epoch": 759} {"train_loss": -38.002349853515625, "global_step": 91853, "epoch": 759} {"train_loss": -37.30104446411133, "global_step": 91854, "epoch": 759} {"train_loss": -37.610897064208984, "global_step": 91855, "epoch": 759} {"train_loss": -38.8043212890625, "global_step": 91856, "epoch": 759} {"train_loss": -37.8591194152832, "global_step": 91857, "epoch": 759} {"train_loss": -37.78296661376953, "global_step": 91858, "epoch": 759} {"train_loss": -38.611183166503906, "global_step": 91859, "epoch": 759} {"train_loss": -37.92780303955078, "global_step": 91860, "epoch": 759} {"train_loss": -38.38230514526367, "global_step": 91861, "epoch": 759} {"train_loss": -37.94784164428711, "global_step": 91862, "epoch": 759} {"train_loss": -38.65245056152344, "global_step": 91863, "epoch": 759} {"train_loss": -38.16194152832031, "global_step": 91864, "epoch": 759} {"train_loss": -37.85316848754883, "global_step": 91865, "epoch": 759} {"train_loss": -38.01853942871094, "global_step": 91866, "epoch": 759} {"train_loss": -38.062416076660156, "global_step": 91867, "epoch": 759} {"train_loss": -38.748348236083984, "global_step": 91868, "epoch": 759} {"train_loss": -38.03959655761719, "global_step": 91869, "epoch": 759} {"train_loss": -38.461944580078125, "global_step": 91870, "epoch": 759} {"train_loss": -38.586204528808594, "global_step": 91871, "epoch": 759} {"train_loss": -37.15156173706055, "global_step": 91872, "epoch": 759} {"train_loss": -38.72578430175781, "global_step": 91873, "epoch": 759} {"train_loss": -35.58720779418945, "global_step": 91874, "epoch": 759} {"train_loss": -37.36005783081055, "global_step": 91875, "epoch": 759} {"train_loss": -37.36527633666992, "global_step": 91876, "epoch": 759} {"train_loss": -38.013267517089844, "global_step": 91877, "epoch": 759} {"train_loss": -37.927215576171875, "global_step": 91878, "epoch": 759} {"train_loss": -37.99306106567383, "global_step": 91879, "epoch": 759} {"train_loss": -37.82535934448242, "global_step": 91880, "epoch": 759} {"train_loss": -38.08132553100586, "global_step": 91881, "epoch": 759} {"train_loss": -38.0271110534668, "global_step": 91882, "epoch": 759} {"train_loss": -38.14326095581055, "global_step": 91883, "epoch": 759} {"train_loss": -38.80109405517578, "global_step": 91884, "epoch": 759} {"train_loss": -37.335113525390625, "global_step": 91885, "epoch": 759} {"train_loss": -37.87898254394531, "global_step": 91886, "epoch": 759} {"train_loss": -38.315818786621094, "global_step": 91887, "epoch": 759} {"train_loss": -38.4200325012207, "global_step": 91888, "epoch": 759} {"train_loss": -38.66941452026367, "global_step": 91889, "epoch": 759} {"train_loss": -38.63197708129883, "global_step": 91890, "epoch": 759} {"train_loss": -36.809234619140625, "global_step": 91891, "epoch": 759} {"train_loss": -37.737613677978516, "global_step": 91892, "epoch": 759} {"train_loss": -36.84806823730469, "global_step": 91893, "epoch": 759} {"train_loss": -35.53383255004883, "global_step": 91894, "epoch": 759} {"train_loss": -35.99878692626953, "global_step": 91895, "epoch": 759} {"train_loss": -37.51924514770508, "global_step": 91896, "epoch": 759} {"train_loss": -38.68475341796875, "global_step": 91897, "epoch": 759} {"train_loss": -38.131866455078125, "global_step": 91898, "epoch": 759} {"train_loss": -37.38479232788086, "global_step": 91899, "epoch": 759} {"train_loss": -36.8015022277832, "global_step": 91900, "epoch": 759} {"train_loss": -37.236541748046875, "global_step": 91901, "epoch": 759} {"train_loss": -37.99409866333008, "global_step": 91902, "epoch": 759} {"train_loss": -36.342323303222656, "global_step": 91903, "epoch": 759} {"train_loss": -37.60137176513672, "global_step": 91904, "epoch": 759} {"train_loss": -37.79018020629883, "global_step": 91905, "epoch": 759} {"train_loss": -37.61062240600586, "global_step": 91906, "epoch": 759} {"train_loss": -36.854705810546875, "global_step": 91907, "epoch": 759} {"train_loss": -36.1827507019043, "global_step": 91908, "epoch": 759} {"train_loss": -37.95313262939453, "global_step": 91909, "epoch": 759} {"train_loss": -38.01613998413086, "global_step": 91910, "epoch": 759} {"train_loss": -38.26967239379883, "global_step": 91911, "epoch": 759} {"train_loss": -38.107337951660156, "global_step": 91912, "epoch": 759} {"train_loss": -38.18268966674805, "global_step": 91913, "epoch": 759} {"train_loss": -38.07809066772461, "global_step": 91914, "epoch": 759} {"train_loss": -38.21601486206055, "global_step": 91915, "epoch": 759} {"train_loss": -37.178279876708984, "global_step": 91916, "epoch": 759} {"train_loss": -38.264892578125, "global_step": 91917, "epoch": 759} {"train_loss": -38.34346389770508, "global_step": 91918, "epoch": 759} {"train_loss": -37.495399475097656, "global_step": 91919, "epoch": 759} {"train_loss": -38.59421920776367, "global_step": 91920, "epoch": 759} {"train_loss": -37.819210052490234, "global_step": 91921, "epoch": 759} {"train_loss": -35.67852783203125, "global_step": 91922, "epoch": 759} {"train_loss": -35.09425735473633, "global_step": 91923, "epoch": 759} {"train_loss": -35.32036209106445, "global_step": 91924, "epoch": 759} {"train_loss": -34.7196159362793, "global_step": 91925, "epoch": 759} {"train_loss": -36.43803787231445, "global_step": 91926, "epoch": 759} {"train_loss": -38.54014587402344, "global_step": 91927, "epoch": 759} {"train_loss": -37.39577102661133, "global_step": 91928, "epoch": 759} {"train_loss": -37.757179260253906, "global_step": 91929, "epoch": 759} {"train_loss": -37.866947174072266, "global_step": 91930, "epoch": 759} {"train_loss": -37.194183349609375, "global_step": 91931, "epoch": 759} {"train_loss": -34.776180267333984, "global_step": 91932, "epoch": 759} {"train_loss": -37.722686767578125, "global_step": 91933, "epoch": 759} {"train_loss": -36.906490325927734, "global_step": 91934, "epoch": 759} {"train_loss": -37.0838623046875, "global_step": 91935, "epoch": 759} {"train_loss": -36.75844955444336, "global_step": 91936, "epoch": 759} {"train_loss": -37.17048263549805, "global_step": 91937, "epoch": 759} {"train_loss": -36.190738677978516, "global_step": 91938, "epoch": 759} {"train_loss": -37.96451950073242, "global_step": 91939, "epoch": 759} {"train_loss": -37.0711784362793, "global_step": 91940, "epoch": 759} {"train_loss": -37.17743682861328, "global_step": 91941, "epoch": 759} {"train_loss": -37.91942596435547, "global_step": 91942, "epoch": 759} {"train_loss": -38.02225112915039, "global_step": 91943, "epoch": 759} {"train_loss": -38.144508361816406, "global_step": 91944, "epoch": 759} {"train_loss": -38.4922981262207, "global_step": 91945, "epoch": 759} {"train_loss": -37.8553581237793, "global_step": 91946, "epoch": 759} {"train_loss": -37.331398010253906, "global_step": 91947, "epoch": 759} {"train_loss": -38.02216339111328, "global_step": 91948, "epoch": 759} {"train_loss": -37.0414924621582, "global_step": 91949, "epoch": 759} {"train_loss": -37.1772575378418, "global_step": 91950, "epoch": 759} {"train_loss": -37.597225189208984, "global_step": 91951, "epoch": 759} {"train_loss": -37.92519760131836, "global_step": 91952, "epoch": 759} {"train_loss": -38.320152282714844, "global_step": 91953, "epoch": 759} {"train_loss": -36.86460876464844, "global_step": 91954, "epoch": 759} {"train_loss": -37.193580627441406, "global_step": 91955, "epoch": 759} {"train_loss": -37.13027572631836, "global_step": 91956, "epoch": 759} {"train_loss": -36.880149841308594, "global_step": 91957, "epoch": 759} {"train_loss": -35.949127197265625, "global_step": 91958, "epoch": 759} {"train_loss": -37.57058189329037, "global_step": 91959, "epoch": 759, "val_loss": 2593063.0} {"train_loss": -37.19099044799805, "global_step": 91960, "epoch": 760} {"train_loss": -35.87656784057617, "global_step": 91961, "epoch": 760} {"train_loss": -36.68817138671875, "global_step": 91962, "epoch": 760} {"train_loss": -37.5621452331543, "global_step": 91963, "epoch": 760} {"train_loss": -37.06394577026367, "global_step": 91964, "epoch": 760} {"train_loss": -36.69904708862305, "global_step": 91965, "epoch": 760} {"train_loss": -37.393463134765625, "global_step": 91966, "epoch": 760} {"train_loss": -37.28609085083008, "global_step": 91967, "epoch": 760} {"train_loss": -37.16179275512695, "global_step": 91968, "epoch": 760} {"train_loss": -37.45587921142578, "global_step": 91969, "epoch": 760} {"train_loss": -37.334537506103516, "global_step": 91970, "epoch": 760} {"train_loss": -37.99010467529297, "global_step": 91971, "epoch": 760} {"train_loss": -36.82902145385742, "global_step": 91972, "epoch": 760} {"train_loss": -35.844688415527344, "global_step": 91973, "epoch": 760} {"train_loss": -37.084930419921875, "global_step": 91974, "epoch": 760} {"train_loss": -36.61379623413086, "global_step": 91975, "epoch": 760} {"train_loss": -37.14214324951172, "global_step": 91976, "epoch": 760} {"train_loss": -38.1927604675293, "global_step": 91977, "epoch": 760} {"train_loss": -36.848567962646484, "global_step": 91978, "epoch": 760} {"train_loss": -36.97412872314453, "global_step": 91979, "epoch": 760} {"train_loss": -37.65815353393555, "global_step": 91980, "epoch": 760} {"train_loss": -37.99065017700195, "global_step": 91981, "epoch": 760} {"train_loss": -38.0738525390625, "global_step": 91982, "epoch": 760} {"train_loss": -38.06262969970703, "global_step": 91983, "epoch": 760} {"train_loss": -37.75856399536133, "global_step": 91984, "epoch": 760} {"train_loss": -38.41225814819336, "global_step": 91985, "epoch": 760} {"train_loss": -37.97100830078125, "global_step": 91986, "epoch": 760} {"train_loss": -38.231685638427734, "global_step": 91987, "epoch": 760} {"train_loss": -37.9677619934082, "global_step": 91988, "epoch": 760} {"train_loss": -38.466644287109375, "global_step": 91989, "epoch": 760} {"train_loss": -37.915771484375, "global_step": 91990, "epoch": 760} {"train_loss": -37.98881912231445, "global_step": 91991, "epoch": 760} {"train_loss": -37.42448043823242, "global_step": 91992, "epoch": 760} {"train_loss": -38.615692138671875, "global_step": 91993, "epoch": 760} {"train_loss": -38.2028923034668, "global_step": 91994, "epoch": 760} {"train_loss": -38.00209426879883, "global_step": 91995, "epoch": 760} {"train_loss": -37.913448333740234, "global_step": 91996, "epoch": 760} {"train_loss": -38.159034729003906, "global_step": 91997, "epoch": 760} {"train_loss": -38.25236129760742, "global_step": 91998, "epoch": 760} {"train_loss": -38.625301361083984, "global_step": 91999, "epoch": 760} {"train_loss": -38.26919174194336, "global_step": 92000, "epoch": 760} {"train_loss": -37.76296615600586, "global_step": 92001, "epoch": 760} {"train_loss": -38.5817985534668, "global_step": 92002, "epoch": 760} {"train_loss": -37.7892951965332, "global_step": 92003, "epoch": 760} {"train_loss": -38.30535125732422, "global_step": 92004, "epoch": 760} {"train_loss": -38.26947021484375, "global_step": 92005, "epoch": 760} {"train_loss": -38.39653396606445, "global_step": 92006, "epoch": 760} {"train_loss": -37.4452018737793, "global_step": 92007, "epoch": 760} {"train_loss": -38.19673156738281, "global_step": 92008, "epoch": 760} {"train_loss": -38.87913131713867, "global_step": 92009, "epoch": 760} {"train_loss": -38.2337760925293, "global_step": 92010, "epoch": 760} {"train_loss": -37.78487777709961, "global_step": 92011, "epoch": 760} {"train_loss": -37.933815002441406, "global_step": 92012, "epoch": 760} {"train_loss": -37.81330871582031, "global_step": 92013, "epoch": 760} {"train_loss": -38.72185134887695, "global_step": 92014, "epoch": 760} {"train_loss": -38.432369232177734, "global_step": 92015, "epoch": 760} {"train_loss": -38.05038070678711, "global_step": 92016, "epoch": 760} {"train_loss": -38.93515396118164, "global_step": 92017, "epoch": 760} {"train_loss": -38.39618682861328, "global_step": 92018, "epoch": 760} {"train_loss": -37.75684356689453, "global_step": 92019, "epoch": 760} {"train_loss": -37.764583587646484, "global_step": 92020, "epoch": 760} {"train_loss": -38.066585540771484, "global_step": 92021, "epoch": 760} {"train_loss": -35.81124496459961, "global_step": 92022, "epoch": 760} {"train_loss": -37.83020782470703, "global_step": 92023, "epoch": 760} {"train_loss": -38.2081413269043, "global_step": 92024, "epoch": 760} {"train_loss": -37.941314697265625, "global_step": 92025, "epoch": 760} {"train_loss": -38.307586669921875, "global_step": 92026, "epoch": 760} {"train_loss": -37.42295837402344, "global_step": 92027, "epoch": 760} {"train_loss": -37.92829513549805, "global_step": 92028, "epoch": 760} {"train_loss": -38.654571533203125, "global_step": 92029, "epoch": 760} {"train_loss": -38.39649200439453, "global_step": 92030, "epoch": 760} {"train_loss": -38.69635772705078, "global_step": 92031, "epoch": 760} {"train_loss": -37.20340347290039, "global_step": 92032, "epoch": 760} {"train_loss": -34.93393325805664, "global_step": 92033, "epoch": 760} {"train_loss": -38.73963165283203, "global_step": 92034, "epoch": 760} {"train_loss": -37.06920623779297, "global_step": 92035, "epoch": 760} {"train_loss": -36.88887405395508, "global_step": 92036, "epoch": 760} {"train_loss": -36.11486053466797, "global_step": 92037, "epoch": 760} {"train_loss": -36.40645980834961, "global_step": 92038, "epoch": 760} {"train_loss": -34.48655700683594, "global_step": 92039, "epoch": 760} {"train_loss": -32.60902404785156, "global_step": 92040, "epoch": 760} {"train_loss": -34.8029899597168, "global_step": 92041, "epoch": 760} {"train_loss": -33.88887405395508, "global_step": 92042, "epoch": 760} {"train_loss": -35.08246612548828, "global_step": 92043, "epoch": 760} {"train_loss": -35.45571517944336, "global_step": 92044, "epoch": 760} {"train_loss": -33.936092376708984, "global_step": 92045, "epoch": 760} {"train_loss": -35.4505615234375, "global_step": 92046, "epoch": 760} {"train_loss": -34.79624557495117, "global_step": 92047, "epoch": 760} {"train_loss": -34.6691780090332, "global_step": 92048, "epoch": 760} {"train_loss": -29.203983306884766, "global_step": 92049, "epoch": 760} {"train_loss": -33.922218322753906, "global_step": 92050, "epoch": 760} {"train_loss": -32.4788703918457, "global_step": 92051, "epoch": 760} {"train_loss": -32.321868896484375, "global_step": 92052, "epoch": 760} {"train_loss": -34.39016342163086, "global_step": 92053, "epoch": 760} {"train_loss": -32.66939926147461, "global_step": 92054, "epoch": 760} {"train_loss": -34.09465408325195, "global_step": 92055, "epoch": 760} {"train_loss": -32.02775192260742, "global_step": 92056, "epoch": 760} {"train_loss": -34.32783889770508, "global_step": 92057, "epoch": 760} {"train_loss": -34.742340087890625, "global_step": 92058, "epoch": 760} {"train_loss": -33.390380859375, "global_step": 92059, "epoch": 760} {"train_loss": -30.680011749267578, "global_step": 92060, "epoch": 760} {"train_loss": -33.20673751831055, "global_step": 92061, "epoch": 760} {"train_loss": -34.01747512817383, "global_step": 92062, "epoch": 760} {"train_loss": -35.531883239746094, "global_step": 92063, "epoch": 760} {"train_loss": -32.71034622192383, "global_step": 92064, "epoch": 760} {"train_loss": -35.28167724609375, "global_step": 92065, "epoch": 760} {"train_loss": -36.27170181274414, "global_step": 92066, "epoch": 760} {"train_loss": -35.69367218017578, "global_step": 92067, "epoch": 760} {"train_loss": -35.363826751708984, "global_step": 92068, "epoch": 760} {"train_loss": -34.26851272583008, "global_step": 92069, "epoch": 760} {"train_loss": -32.82404708862305, "global_step": 92070, "epoch": 760} {"train_loss": -34.11030197143555, "global_step": 92071, "epoch": 760} {"train_loss": -35.15938949584961, "global_step": 92072, "epoch": 760} {"train_loss": -35.23379135131836, "global_step": 92073, "epoch": 760} {"train_loss": -34.8862419128418, "global_step": 92074, "epoch": 760} {"train_loss": -35.54362106323242, "global_step": 92075, "epoch": 760} {"train_loss": -35.48463821411133, "global_step": 92076, "epoch": 760} {"train_loss": -35.79301834106445, "global_step": 92077, "epoch": 760} {"train_loss": -35.74544906616211, "global_step": 92078, "epoch": 760} {"train_loss": -34.58000564575195, "global_step": 92079, "epoch": 760} {"train_loss": -36.49601953679865, "global_step": 92080, "epoch": 760, "val_loss": 2585685.0} {"train_loss": -35.78058624267578, "global_step": 92081, "epoch": 761} {"train_loss": -36.57592010498047, "global_step": 92082, "epoch": 761} {"train_loss": -35.9734992980957, "global_step": 92083, "epoch": 761} {"train_loss": -36.10279846191406, "global_step": 92084, "epoch": 761} {"train_loss": -36.45344543457031, "global_step": 92085, "epoch": 761} {"train_loss": -35.7627067565918, "global_step": 92086, "epoch": 761} {"train_loss": -36.59543991088867, "global_step": 92087, "epoch": 761} {"train_loss": -36.04496383666992, "global_step": 92088, "epoch": 761} {"train_loss": -32.79278564453125, "global_step": 92089, "epoch": 761} {"train_loss": -34.608951568603516, "global_step": 92090, "epoch": 761} {"train_loss": -36.07990646362305, "global_step": 92091, "epoch": 761} {"train_loss": -36.260433197021484, "global_step": 92092, "epoch": 761} {"train_loss": -35.85567092895508, "global_step": 92093, "epoch": 761} {"train_loss": -34.457279205322266, "global_step": 92094, "epoch": 761} {"train_loss": -35.92715072631836, "global_step": 92095, "epoch": 761} {"train_loss": -36.112388610839844, "global_step": 92096, "epoch": 761} {"train_loss": -35.90955352783203, "global_step": 92097, "epoch": 761} {"train_loss": -36.20722198486328, "global_step": 92098, "epoch": 761} {"train_loss": -35.12894821166992, "global_step": 92099, "epoch": 761} {"train_loss": -36.190792083740234, "global_step": 92100, "epoch": 761} {"train_loss": -35.409725189208984, "global_step": 92101, "epoch": 761} {"train_loss": -36.27744674682617, "global_step": 92102, "epoch": 761} {"train_loss": -35.14005661010742, "global_step": 92103, "epoch": 761} {"train_loss": -35.755306243896484, "global_step": 92104, "epoch": 761} {"train_loss": -36.0639533996582, "global_step": 92105, "epoch": 761} {"train_loss": -36.74929428100586, "global_step": 92106, "epoch": 761} {"train_loss": -36.10133743286133, "global_step": 92107, "epoch": 761} {"train_loss": -36.327293395996094, "global_step": 92108, "epoch": 761} {"train_loss": -36.41652297973633, "global_step": 92109, "epoch": 761} {"train_loss": -34.99091339111328, "global_step": 92110, "epoch": 761} {"train_loss": -37.18073654174805, "global_step": 92111, "epoch": 761} {"train_loss": -36.838287353515625, "global_step": 92112, "epoch": 761} {"train_loss": -36.76398468017578, "global_step": 92113, "epoch": 761} {"train_loss": -36.97744369506836, "global_step": 92114, "epoch": 761} {"train_loss": -37.25088119506836, "global_step": 92115, "epoch": 761} {"train_loss": -37.03025436401367, "global_step": 92116, "epoch": 761} {"train_loss": -36.487281799316406, "global_step": 92117, "epoch": 761} {"train_loss": -37.34984588623047, "global_step": 92118, "epoch": 761} {"train_loss": -37.0935173034668, "global_step": 92119, "epoch": 761} {"train_loss": -37.152626037597656, "global_step": 92120, "epoch": 761} {"train_loss": -37.51175308227539, "global_step": 92121, "epoch": 761} {"train_loss": -37.24615478515625, "global_step": 92122, "epoch": 761} {"train_loss": -37.450897216796875, "global_step": 92123, "epoch": 761} {"train_loss": -37.21781539916992, "global_step": 92124, "epoch": 761} {"train_loss": -37.3795280456543, "global_step": 92125, "epoch": 761} {"train_loss": -36.886940002441406, "global_step": 92126, "epoch": 761} {"train_loss": -37.81826400756836, "global_step": 92127, "epoch": 761} {"train_loss": -37.0992431640625, "global_step": 92128, "epoch": 761} {"train_loss": -37.036834716796875, "global_step": 92129, "epoch": 761} {"train_loss": -36.63436508178711, "global_step": 92130, "epoch": 761} {"train_loss": -36.9920768737793, "global_step": 92131, "epoch": 761} {"train_loss": -37.648048400878906, "global_step": 92132, "epoch": 761} {"train_loss": -37.563297271728516, "global_step": 92133, "epoch": 761} {"train_loss": -36.68880081176758, "global_step": 92134, "epoch": 761} {"train_loss": -36.66064453125, "global_step": 92135, "epoch": 761} {"train_loss": -36.59554672241211, "global_step": 92136, "epoch": 761} {"train_loss": -37.58201217651367, "global_step": 92137, "epoch": 761} {"train_loss": -37.67251205444336, "global_step": 92138, "epoch": 761} {"train_loss": -37.728511810302734, "global_step": 92139, "epoch": 761} {"train_loss": -38.02912521362305, "global_step": 92140, "epoch": 761} {"train_loss": -37.92509841918945, "global_step": 92141, "epoch": 761} {"train_loss": -37.54175567626953, "global_step": 92142, "epoch": 761} {"train_loss": -36.65929412841797, "global_step": 92143, "epoch": 761} {"train_loss": -37.600521087646484, "global_step": 92144, "epoch": 761} {"train_loss": -37.6883430480957, "global_step": 92145, "epoch": 761} {"train_loss": -37.281532287597656, "global_step": 92146, "epoch": 761} {"train_loss": -38.41914749145508, "global_step": 92147, "epoch": 761} {"train_loss": -37.00539016723633, "global_step": 92148, "epoch": 761} {"train_loss": -35.22556686401367, "global_step": 92149, "epoch": 761} {"train_loss": -35.611724853515625, "global_step": 92150, "epoch": 761} {"train_loss": -37.65447235107422, "global_step": 92151, "epoch": 761} {"train_loss": -33.53676223754883, "global_step": 92152, "epoch": 761} {"train_loss": -35.2529296875, "global_step": 92153, "epoch": 761} {"train_loss": -33.09807205200195, "global_step": 92154, "epoch": 761} {"train_loss": -35.383155822753906, "global_step": 92155, "epoch": 761} {"train_loss": -37.6209831237793, "global_step": 92156, "epoch": 761} {"train_loss": -35.512996673583984, "global_step": 92157, "epoch": 761} {"train_loss": -34.74397659301758, "global_step": 92158, "epoch": 761} {"train_loss": -35.65519332885742, "global_step": 92159, "epoch": 761} {"train_loss": -35.914581298828125, "global_step": 92160, "epoch": 761} {"train_loss": -35.75175857543945, "global_step": 92161, "epoch": 761} {"train_loss": -37.14736557006836, "global_step": 92162, "epoch": 761} {"train_loss": -36.744140625, "global_step": 92163, "epoch": 761} {"train_loss": -34.29800796508789, "global_step": 92164, "epoch": 761} {"train_loss": -34.317779541015625, "global_step": 92165, "epoch": 761} {"train_loss": -34.28486251831055, "global_step": 92166, "epoch": 761} {"train_loss": -35.541927337646484, "global_step": 92167, "epoch": 761} {"train_loss": -38.19404220581055, "global_step": 92168, "epoch": 761} {"train_loss": -35.740604400634766, "global_step": 92169, "epoch": 761} {"train_loss": -34.496192932128906, "global_step": 92170, "epoch": 761} {"train_loss": -34.8421516418457, "global_step": 92171, "epoch": 761} {"train_loss": -36.86050033569336, "global_step": 92172, "epoch": 761} {"train_loss": -36.59939193725586, "global_step": 92173, "epoch": 761} {"train_loss": -36.109954833984375, "global_step": 92174, "epoch": 761} {"train_loss": -37.32499313354492, "global_step": 92175, "epoch": 761} {"train_loss": -35.927513122558594, "global_step": 92176, "epoch": 761} {"train_loss": -36.75107955932617, "global_step": 92177, "epoch": 761} {"train_loss": -37.601436614990234, "global_step": 92178, "epoch": 761} {"train_loss": -35.47551727294922, "global_step": 92179, "epoch": 761} {"train_loss": -37.042484283447266, "global_step": 92180, "epoch": 761} {"train_loss": -37.08328628540039, "global_step": 92181, "epoch": 761} {"train_loss": -37.170814514160156, "global_step": 92182, "epoch": 761} {"train_loss": -37.71049499511719, "global_step": 92183, "epoch": 761} {"train_loss": -37.11648178100586, "global_step": 92184, "epoch": 761} {"train_loss": -37.41667938232422, "global_step": 92185, "epoch": 761} {"train_loss": -37.539058685302734, "global_step": 92186, "epoch": 761} {"train_loss": -36.92715072631836, "global_step": 92187, "epoch": 761} {"train_loss": -37.6734619140625, "global_step": 92188, "epoch": 761} {"train_loss": -37.239784240722656, "global_step": 92189, "epoch": 761} {"train_loss": -38.0367546081543, "global_step": 92190, "epoch": 761} {"train_loss": -37.50056076049805, "global_step": 92191, "epoch": 761} {"train_loss": -37.62677001953125, "global_step": 92192, "epoch": 761} {"train_loss": -37.761165618896484, "global_step": 92193, "epoch": 761} {"train_loss": -37.60581588745117, "global_step": 92194, "epoch": 761} {"train_loss": -37.759212493896484, "global_step": 92195, "epoch": 761} {"train_loss": -37.887454986572266, "global_step": 92196, "epoch": 761} {"train_loss": -37.696083068847656, "global_step": 92197, "epoch": 761} {"train_loss": -38.11417770385742, "global_step": 92198, "epoch": 761} {"train_loss": -37.615779876708984, "global_step": 92199, "epoch": 761} {"train_loss": -37.82973861694336, "global_step": 92200, "epoch": 761} {"train_loss": -36.57240292257514, "global_step": 92201, "epoch": 761, "val_loss": 2585217.25} {"train_loss": -38.079627990722656, "global_step": 92202, "epoch": 762} {"train_loss": -37.918121337890625, "global_step": 92203, "epoch": 762} {"train_loss": -37.83811950683594, "global_step": 92204, "epoch": 762} {"train_loss": -38.37764358520508, "global_step": 92205, "epoch": 762} {"train_loss": -38.76627731323242, "global_step": 92206, "epoch": 762} {"train_loss": -37.872161865234375, "global_step": 92207, "epoch": 762} {"train_loss": -37.968849182128906, "global_step": 92208, "epoch": 762} {"train_loss": -37.73783493041992, "global_step": 92209, "epoch": 762} {"train_loss": -37.98128890991211, "global_step": 92210, "epoch": 762} {"train_loss": -38.605628967285156, "global_step": 92211, "epoch": 762} {"train_loss": -38.04781723022461, "global_step": 92212, "epoch": 762} {"train_loss": -37.56662368774414, "global_step": 92213, "epoch": 762} {"train_loss": -38.35356521606445, "global_step": 92214, "epoch": 762} {"train_loss": -38.482723236083984, "global_step": 92215, "epoch": 762} {"train_loss": -38.54725646972656, "global_step": 92216, "epoch": 762} {"train_loss": -38.76042175292969, "global_step": 92217, "epoch": 762} {"train_loss": -38.3111686706543, "global_step": 92218, "epoch": 762} {"train_loss": -38.66423416137695, "global_step": 92219, "epoch": 762} {"train_loss": -38.50736618041992, "global_step": 92220, "epoch": 762} {"train_loss": -38.692684173583984, "global_step": 92221, "epoch": 762} {"train_loss": -38.39042282104492, "global_step": 92222, "epoch": 762} {"train_loss": -38.758644104003906, "global_step": 92223, "epoch": 762} {"train_loss": -38.43826675415039, "global_step": 92224, "epoch": 762} {"train_loss": -38.44354248046875, "global_step": 92225, "epoch": 762} {"train_loss": -38.58258819580078, "global_step": 92226, "epoch": 762} {"train_loss": -38.66590881347656, "global_step": 92227, "epoch": 762} {"train_loss": -38.72523880004883, "global_step": 92228, "epoch": 762} {"train_loss": -38.44263458251953, "global_step": 92229, "epoch": 762} {"train_loss": -38.756866455078125, "global_step": 92230, "epoch": 762} {"train_loss": -38.45903778076172, "global_step": 92231, "epoch": 762} {"train_loss": -38.992488861083984, "global_step": 92232, "epoch": 762} {"train_loss": -38.2476806640625, "global_step": 92233, "epoch": 762} {"train_loss": -38.72792434692383, "global_step": 92234, "epoch": 762} {"train_loss": -39.10342025756836, "global_step": 92235, "epoch": 762} {"train_loss": -38.33694076538086, "global_step": 92236, "epoch": 762} {"train_loss": -37.90763854980469, "global_step": 92237, "epoch": 762} {"train_loss": -36.05227279663086, "global_step": 92238, "epoch": 762} {"train_loss": -34.09617233276367, "global_step": 92239, "epoch": 762} {"train_loss": -32.58677673339844, "global_step": 92240, "epoch": 762} {"train_loss": -34.21196365356445, "global_step": 92241, "epoch": 762} {"train_loss": -38.260833740234375, "global_step": 92242, "epoch": 762} {"train_loss": -37.88875961303711, "global_step": 92243, "epoch": 762} {"train_loss": -36.35612106323242, "global_step": 92244, "epoch": 762} {"train_loss": -37.381813049316406, "global_step": 92245, "epoch": 762} {"train_loss": -38.79763412475586, "global_step": 92246, "epoch": 762} {"train_loss": -38.30152893066406, "global_step": 92247, "epoch": 762} {"train_loss": -37.21753692626953, "global_step": 92248, "epoch": 762} {"train_loss": -38.5826530456543, "global_step": 92249, "epoch": 762} {"train_loss": -38.413265228271484, "global_step": 92250, "epoch": 762} {"train_loss": -37.32373809814453, "global_step": 92251, "epoch": 762} {"train_loss": -37.8624382019043, "global_step": 92252, "epoch": 762} {"train_loss": -37.7900390625, "global_step": 92253, "epoch": 762} {"train_loss": -37.97866439819336, "global_step": 92254, "epoch": 762} {"train_loss": -37.38172149658203, "global_step": 92255, "epoch": 762} {"train_loss": -36.32033157348633, "global_step": 92256, "epoch": 762} {"train_loss": -37.64493942260742, "global_step": 92257, "epoch": 762} {"train_loss": -37.5588493347168, "global_step": 92258, "epoch": 762} {"train_loss": -36.92136764526367, "global_step": 92259, "epoch": 762} {"train_loss": -38.60650634765625, "global_step": 92260, "epoch": 762} {"train_loss": -37.71118927001953, "global_step": 92261, "epoch": 762} {"train_loss": -37.605804443359375, "global_step": 92262, "epoch": 762} {"train_loss": -38.60346221923828, "global_step": 92263, "epoch": 762} {"train_loss": -38.27449417114258, "global_step": 92264, "epoch": 762} {"train_loss": -37.82978439331055, "global_step": 92265, "epoch": 762} {"train_loss": -38.66481399536133, "global_step": 92266, "epoch": 762} {"train_loss": -37.48668670654297, "global_step": 92267, "epoch": 762} {"train_loss": -38.3967399597168, "global_step": 92268, "epoch": 762} {"train_loss": -37.43408966064453, "global_step": 92269, "epoch": 762} {"train_loss": -38.72315216064453, "global_step": 92270, "epoch": 762} {"train_loss": -38.008705139160156, "global_step": 92271, "epoch": 762} {"train_loss": -38.126060485839844, "global_step": 92272, "epoch": 762} {"train_loss": -36.8892707824707, "global_step": 92273, "epoch": 762} {"train_loss": -38.35396194458008, "global_step": 92274, "epoch": 762} {"train_loss": -37.43595504760742, "global_step": 92275, "epoch": 762} {"train_loss": -36.694000244140625, "global_step": 92276, "epoch": 762} {"train_loss": -36.8032112121582, "global_step": 92277, "epoch": 762} {"train_loss": -38.10224533081055, "global_step": 92278, "epoch": 762} {"train_loss": -36.94084548950195, "global_step": 92279, "epoch": 762} {"train_loss": -36.43021774291992, "global_step": 92280, "epoch": 762} {"train_loss": -36.66288375854492, "global_step": 92281, "epoch": 762} {"train_loss": -37.392818450927734, "global_step": 92282, "epoch": 762} {"train_loss": -37.37311935424805, "global_step": 92283, "epoch": 762} {"train_loss": -38.11112594604492, "global_step": 92284, "epoch": 762} {"train_loss": -37.693458557128906, "global_step": 92285, "epoch": 762} {"train_loss": -37.18900680541992, "global_step": 92286, "epoch": 762} {"train_loss": -37.57038116455078, "global_step": 92287, "epoch": 762} {"train_loss": -37.52618408203125, "global_step": 92288, "epoch": 762} {"train_loss": -37.341835021972656, "global_step": 92289, "epoch": 762} {"train_loss": -35.09711837768555, "global_step": 92290, "epoch": 762} {"train_loss": -37.336944580078125, "global_step": 92291, "epoch": 762} {"train_loss": -36.80905532836914, "global_step": 92292, "epoch": 762} {"train_loss": -35.7525634765625, "global_step": 92293, "epoch": 762} {"train_loss": -38.17755889892578, "global_step": 92294, "epoch": 762} {"train_loss": -37.82355499267578, "global_step": 92295, "epoch": 762} {"train_loss": -37.73081588745117, "global_step": 92296, "epoch": 762} {"train_loss": -37.18861389160156, "global_step": 92297, "epoch": 762} {"train_loss": -35.655208587646484, "global_step": 92298, "epoch": 762} {"train_loss": -38.49213409423828, "global_step": 92299, "epoch": 762} {"train_loss": -37.17399978637695, "global_step": 92300, "epoch": 762} {"train_loss": -37.32882308959961, "global_step": 92301, "epoch": 762} {"train_loss": -36.99299621582031, "global_step": 92302, "epoch": 762} {"train_loss": -36.27177810668945, "global_step": 92303, "epoch": 762} {"train_loss": -37.66835403442383, "global_step": 92304, "epoch": 762} {"train_loss": -38.064754486083984, "global_step": 92305, "epoch": 762} {"train_loss": -37.873111724853516, "global_step": 92306, "epoch": 762} {"train_loss": -37.48561477661133, "global_step": 92307, "epoch": 762} {"train_loss": -37.97056579589844, "global_step": 92308, "epoch": 762} {"train_loss": -38.07246017456055, "global_step": 92309, "epoch": 762} {"train_loss": -38.598724365234375, "global_step": 92310, "epoch": 762} {"train_loss": -37.63778305053711, "global_step": 92311, "epoch": 762} {"train_loss": -38.140052795410156, "global_step": 92312, "epoch": 762} {"train_loss": -38.44826126098633, "global_step": 92313, "epoch": 762} {"train_loss": -38.43524932861328, "global_step": 92314, "epoch": 762} {"train_loss": -38.27937698364258, "global_step": 92315, "epoch": 762} {"train_loss": -38.2580680847168, "global_step": 92316, "epoch": 762} {"train_loss": -38.145389556884766, "global_step": 92317, "epoch": 762} {"train_loss": -38.01502227783203, "global_step": 92318, "epoch": 762} {"train_loss": -37.8791618347168, "global_step": 92319, "epoch": 762} {"train_loss": -37.83184814453125, "global_step": 92320, "epoch": 762} {"train_loss": -37.555049896240234, "global_step": 92321, "epoch": 762} {"train_loss": -37.747123655208874, "global_step": 92322, "epoch": 762, "val_loss": 2544691.75} {"train_loss": -37.69355773925781, "global_step": 92323, "epoch": 763} {"train_loss": -38.9338493347168, "global_step": 92324, "epoch": 763} {"train_loss": -37.57219314575195, "global_step": 92325, "epoch": 763} {"train_loss": -38.993770599365234, "global_step": 92326, "epoch": 763} {"train_loss": -38.190975189208984, "global_step": 92327, "epoch": 763} {"train_loss": -36.72896194458008, "global_step": 92328, "epoch": 763} {"train_loss": -37.27626419067383, "global_step": 92329, "epoch": 763} {"train_loss": -36.43893814086914, "global_step": 92330, "epoch": 763} {"train_loss": -34.460018157958984, "global_step": 92331, "epoch": 763} {"train_loss": -32.58820724487305, "global_step": 92332, "epoch": 763} {"train_loss": -28.38884925842285, "global_step": 92333, "epoch": 763} {"train_loss": -26.71784782409668, "global_step": 92334, "epoch": 763} {"train_loss": -32.030521392822266, "global_step": 92335, "epoch": 763} {"train_loss": -37.60221481323242, "global_step": 92336, "epoch": 763} {"train_loss": -33.71208572387695, "global_step": 92337, "epoch": 763} {"train_loss": -34.037109375, "global_step": 92338, "epoch": 763} {"train_loss": -38.380897521972656, "global_step": 92339, "epoch": 763} {"train_loss": -35.19546127319336, "global_step": 92340, "epoch": 763} {"train_loss": -34.57242965698242, "global_step": 92341, "epoch": 763} {"train_loss": -36.935211181640625, "global_step": 92342, "epoch": 763} {"train_loss": -35.7556037902832, "global_step": 92343, "epoch": 763} {"train_loss": -36.69482421875, "global_step": 92344, "epoch": 763} {"train_loss": -33.647029876708984, "global_step": 92345, "epoch": 763} {"train_loss": -37.51948547363281, "global_step": 92346, "epoch": 763} {"train_loss": -34.89557647705078, "global_step": 92347, "epoch": 763} {"train_loss": -35.38554763793945, "global_step": 92348, "epoch": 763} {"train_loss": -36.99478530883789, "global_step": 92349, "epoch": 763} {"train_loss": -36.188934326171875, "global_step": 92350, "epoch": 763} {"train_loss": -37.75045394897461, "global_step": 92351, "epoch": 763} {"train_loss": -32.68313217163086, "global_step": 92352, "epoch": 763} {"train_loss": -37.16621017456055, "global_step": 92353, "epoch": 763} {"train_loss": -35.89933395385742, "global_step": 92354, "epoch": 763} {"train_loss": -37.03935623168945, "global_step": 92355, "epoch": 763} {"train_loss": -36.883731842041016, "global_step": 92356, "epoch": 763} {"train_loss": -35.32516098022461, "global_step": 92357, "epoch": 763} {"train_loss": -36.273231506347656, "global_step": 92358, "epoch": 763} {"train_loss": -36.8533821105957, "global_step": 92359, "epoch": 763} {"train_loss": -36.1827278137207, "global_step": 92360, "epoch": 763} {"train_loss": -35.40530014038086, "global_step": 92361, "epoch": 763} {"train_loss": -37.060787200927734, "global_step": 92362, "epoch": 763} {"train_loss": -36.26871871948242, "global_step": 92363, "epoch": 763} {"train_loss": -36.8721923828125, "global_step": 92364, "epoch": 763} {"train_loss": -37.067047119140625, "global_step": 92365, "epoch": 763} {"train_loss": -37.1575813293457, "global_step": 92366, "epoch": 763} {"train_loss": -35.862300872802734, "global_step": 92367, "epoch": 763} {"train_loss": -35.74342346191406, "global_step": 92368, "epoch": 763} {"train_loss": -37.10693359375, "global_step": 92369, "epoch": 763} {"train_loss": -36.901432037353516, "global_step": 92370, "epoch": 763} {"train_loss": -35.47206115722656, "global_step": 92371, "epoch": 763} {"train_loss": -36.36771774291992, "global_step": 92372, "epoch": 763} {"train_loss": -37.33149337768555, "global_step": 92373, "epoch": 763} {"train_loss": -36.3441162109375, "global_step": 92374, "epoch": 763} {"train_loss": -36.78865432739258, "global_step": 92375, "epoch": 763} {"train_loss": -36.8447380065918, "global_step": 92376, "epoch": 763} {"train_loss": -36.57682418823242, "global_step": 92377, "epoch": 763} {"train_loss": -37.622589111328125, "global_step": 92378, "epoch": 763} {"train_loss": -36.79060363769531, "global_step": 92379, "epoch": 763} {"train_loss": -37.123619079589844, "global_step": 92380, "epoch": 763} {"train_loss": -37.8599967956543, "global_step": 92381, "epoch": 763} {"train_loss": -37.55035400390625, "global_step": 92382, "epoch": 763} {"train_loss": -37.11015701293945, "global_step": 92383, "epoch": 763} {"train_loss": -37.455928802490234, "global_step": 92384, "epoch": 763} {"train_loss": -37.353023529052734, "global_step": 92385, "epoch": 763} {"train_loss": -37.57563400268555, "global_step": 92386, "epoch": 763} {"train_loss": -36.605934143066406, "global_step": 92387, "epoch": 763} {"train_loss": -37.73148727416992, "global_step": 92388, "epoch": 763} {"train_loss": -38.02542495727539, "global_step": 92389, "epoch": 763} {"train_loss": -38.09950637817383, "global_step": 92390, "epoch": 763} {"train_loss": -37.889984130859375, "global_step": 92391, "epoch": 763} {"train_loss": -37.72651290893555, "global_step": 92392, "epoch": 763} {"train_loss": -36.725486755371094, "global_step": 92393, "epoch": 763} {"train_loss": -38.03811264038086, "global_step": 92394, "epoch": 763} {"train_loss": -37.92088317871094, "global_step": 92395, "epoch": 763} {"train_loss": -37.77594757080078, "global_step": 92396, "epoch": 763} {"train_loss": -38.340576171875, "global_step": 92397, "epoch": 763} {"train_loss": -38.56048583984375, "global_step": 92398, "epoch": 763} {"train_loss": -38.028076171875, "global_step": 92399, "epoch": 763} {"train_loss": -38.134883880615234, "global_step": 92400, "epoch": 763} {"train_loss": -37.645320892333984, "global_step": 92401, "epoch": 763} {"train_loss": -38.22013473510742, "global_step": 92402, "epoch": 763} {"train_loss": -37.97715759277344, "global_step": 92403, "epoch": 763} {"train_loss": -38.63995361328125, "global_step": 92404, "epoch": 763} {"train_loss": -38.5190544128418, "global_step": 92405, "epoch": 763} {"train_loss": -38.40610122680664, "global_step": 92406, "epoch": 763} {"train_loss": -38.1290283203125, "global_step": 92407, "epoch": 763} {"train_loss": -38.56423568725586, "global_step": 92408, "epoch": 763} {"train_loss": -38.19729232788086, "global_step": 92409, "epoch": 763} {"train_loss": -38.53365707397461, "global_step": 92410, "epoch": 763} {"train_loss": -38.18247604370117, "global_step": 92411, "epoch": 763} {"train_loss": -38.605220794677734, "global_step": 92412, "epoch": 763} {"train_loss": -38.19621276855469, "global_step": 92413, "epoch": 763} {"train_loss": -38.07017135620117, "global_step": 92414, "epoch": 763} {"train_loss": -38.25333786010742, "global_step": 92415, "epoch": 763} {"train_loss": -37.3524284362793, "global_step": 92416, "epoch": 763} {"train_loss": -37.029541015625, "global_step": 92417, "epoch": 763} {"train_loss": -36.2182502746582, "global_step": 92418, "epoch": 763} {"train_loss": -35.41943359375, "global_step": 92419, "epoch": 763} {"train_loss": -31.941564559936523, "global_step": 92420, "epoch": 763} {"train_loss": -28.423492431640625, "global_step": 92421, "epoch": 763} {"train_loss": -24.672775268554688, "global_step": 92422, "epoch": 763} {"train_loss": -28.861684799194336, "global_step": 92423, "epoch": 763} {"train_loss": -34.609840393066406, "global_step": 92424, "epoch": 763} {"train_loss": -26.89568519592285, "global_step": 92425, "epoch": 763} {"train_loss": -31.15765380859375, "global_step": 92426, "epoch": 763} {"train_loss": -30.7515926361084, "global_step": 92427, "epoch": 763} {"train_loss": -35.653438568115234, "global_step": 92428, "epoch": 763} {"train_loss": -30.472156524658203, "global_step": 92429, "epoch": 763} {"train_loss": -35.143592834472656, "global_step": 92430, "epoch": 763} {"train_loss": -33.68288803100586, "global_step": 92431, "epoch": 763} {"train_loss": -33.64622116088867, "global_step": 92432, "epoch": 763} {"train_loss": -34.43873977661133, "global_step": 92433, "epoch": 763} {"train_loss": -34.4473991394043, "global_step": 92434, "epoch": 763} {"train_loss": -36.10981369018555, "global_step": 92435, "epoch": 763} {"train_loss": -34.86943435668945, "global_step": 92436, "epoch": 763} {"train_loss": -35.55485534667969, "global_step": 92437, "epoch": 763} {"train_loss": -34.762516021728516, "global_step": 92438, "epoch": 763} {"train_loss": -35.387691497802734, "global_step": 92439, "epoch": 763} {"train_loss": -35.59293746948242, "global_step": 92440, "epoch": 763} {"train_loss": -36.924102783203125, "global_step": 92441, "epoch": 763} {"train_loss": -35.71258544921875, "global_step": 92442, "epoch": 763} {"train_loss": -36.024490545603854, "global_step": 92443, "epoch": 763, "val_loss": 2605636.75} {"train_loss": -36.93889617919922, "global_step": 92444, "epoch": 764} {"train_loss": -36.129207611083984, "global_step": 92445, "epoch": 764} {"train_loss": -36.88108444213867, "global_step": 92446, "epoch": 764} {"train_loss": -36.8798713684082, "global_step": 92447, "epoch": 764} {"train_loss": -36.826995849609375, "global_step": 92448, "epoch": 764} {"train_loss": -37.19819259643555, "global_step": 92449, "epoch": 764} {"train_loss": -37.15109634399414, "global_step": 92450, "epoch": 764} {"train_loss": -37.09554672241211, "global_step": 92451, "epoch": 764} {"train_loss": -37.716182708740234, "global_step": 92452, "epoch": 764} {"train_loss": -37.546630859375, "global_step": 92453, "epoch": 764} {"train_loss": -37.51929473876953, "global_step": 92454, "epoch": 764} {"train_loss": -38.08364486694336, "global_step": 92455, "epoch": 764} {"train_loss": -37.97196578979492, "global_step": 92456, "epoch": 764} {"train_loss": -37.234657287597656, "global_step": 92457, "epoch": 764} {"train_loss": -37.6328125, "global_step": 92458, "epoch": 764} {"train_loss": -37.586524963378906, "global_step": 92459, "epoch": 764} {"train_loss": -37.7830696105957, "global_step": 92460, "epoch": 764} {"train_loss": -38.22193145751953, "global_step": 92461, "epoch": 764} {"train_loss": -38.14103317260742, "global_step": 92462, "epoch": 764} {"train_loss": -38.33106231689453, "global_step": 92463, "epoch": 764} {"train_loss": -38.08418273925781, "global_step": 92464, "epoch": 764} {"train_loss": -37.98231887817383, "global_step": 92465, "epoch": 764} {"train_loss": -37.9403190612793, "global_step": 92466, "epoch": 764} {"train_loss": -38.199459075927734, "global_step": 92467, "epoch": 764} {"train_loss": -38.239383697509766, "global_step": 92468, "epoch": 764} {"train_loss": -38.06947708129883, "global_step": 92469, "epoch": 764} {"train_loss": -38.31848907470703, "global_step": 92470, "epoch": 764} {"train_loss": -38.52067947387695, "global_step": 92471, "epoch": 764} {"train_loss": -38.69989013671875, "global_step": 92472, "epoch": 764} {"train_loss": -38.0563850402832, "global_step": 92473, "epoch": 764} {"train_loss": -38.60286331176758, "global_step": 92474, "epoch": 764} {"train_loss": -38.21894454956055, "global_step": 92475, "epoch": 764} {"train_loss": -38.17681884765625, "global_step": 92476, "epoch": 764} {"train_loss": -38.10839080810547, "global_step": 92477, "epoch": 764} {"train_loss": -38.31467819213867, "global_step": 92478, "epoch": 764} {"train_loss": -37.51838302612305, "global_step": 92479, "epoch": 764} {"train_loss": -38.81513595581055, "global_step": 92480, "epoch": 764} {"train_loss": -37.9969596862793, "global_step": 92481, "epoch": 764} {"train_loss": -38.248504638671875, "global_step": 92482, "epoch": 764} {"train_loss": -38.41532516479492, "global_step": 92483, "epoch": 764} {"train_loss": -38.08359146118164, "global_step": 92484, "epoch": 764} {"train_loss": -38.60340118408203, "global_step": 92485, "epoch": 764} {"train_loss": -38.96736526489258, "global_step": 92486, "epoch": 764} {"train_loss": -38.45821762084961, "global_step": 92487, "epoch": 764} {"train_loss": -38.4583740234375, "global_step": 92488, "epoch": 764} {"train_loss": -38.67570114135742, "global_step": 92489, "epoch": 764} {"train_loss": -38.84283447265625, "global_step": 92490, "epoch": 764} {"train_loss": -38.66355514526367, "global_step": 92491, "epoch": 764} {"train_loss": -38.757286071777344, "global_step": 92492, "epoch": 764} {"train_loss": -38.28066635131836, "global_step": 92493, "epoch": 764} {"train_loss": -38.73927307128906, "global_step": 92494, "epoch": 764} {"train_loss": -38.755470275878906, "global_step": 92495, "epoch": 764} {"train_loss": -38.49021911621094, "global_step": 92496, "epoch": 764} {"train_loss": -38.946144104003906, "global_step": 92497, "epoch": 764} {"train_loss": -38.71906280517578, "global_step": 92498, "epoch": 764} {"train_loss": -38.84377670288086, "global_step": 92499, "epoch": 764} {"train_loss": -39.062068939208984, "global_step": 92500, "epoch": 764} {"train_loss": -38.500091552734375, "global_step": 92501, "epoch": 764} {"train_loss": -37.8836784362793, "global_step": 92502, "epoch": 764} {"train_loss": -37.917850494384766, "global_step": 92503, "epoch": 764} {"train_loss": -38.75365447998047, "global_step": 92504, "epoch": 764} {"train_loss": -38.84616470336914, "global_step": 92505, "epoch": 764} {"train_loss": -38.01085662841797, "global_step": 92506, "epoch": 764} {"train_loss": -37.445674896240234, "global_step": 92507, "epoch": 764} {"train_loss": -37.34748077392578, "global_step": 92508, "epoch": 764} {"train_loss": -38.241336822509766, "global_step": 92509, "epoch": 764} {"train_loss": -37.401641845703125, "global_step": 92510, "epoch": 764} {"train_loss": -37.46809768676758, "global_step": 92511, "epoch": 764} {"train_loss": -38.33806228637695, "global_step": 92512, "epoch": 764} {"train_loss": -38.14535140991211, "global_step": 92513, "epoch": 764} {"train_loss": -37.30245590209961, "global_step": 92514, "epoch": 764} {"train_loss": -36.41030502319336, "global_step": 92515, "epoch": 764} {"train_loss": -37.33402633666992, "global_step": 92516, "epoch": 764} {"train_loss": -37.42991256713867, "global_step": 92517, "epoch": 764} {"train_loss": -37.06180191040039, "global_step": 92518, "epoch": 764} {"train_loss": -37.609649658203125, "global_step": 92519, "epoch": 764} {"train_loss": -37.047420501708984, "global_step": 92520, "epoch": 764} {"train_loss": -36.304046630859375, "global_step": 92521, "epoch": 764} {"train_loss": -37.77127456665039, "global_step": 92522, "epoch": 764} {"train_loss": -36.41074752807617, "global_step": 92523, "epoch": 764} {"train_loss": -35.554134368896484, "global_step": 92524, "epoch": 764} {"train_loss": -35.56854248046875, "global_step": 92525, "epoch": 764} {"train_loss": -37.69314193725586, "global_step": 92526, "epoch": 764} {"train_loss": -35.09281539916992, "global_step": 92527, "epoch": 764} {"train_loss": -33.246822357177734, "global_step": 92528, "epoch": 764} {"train_loss": -37.89974594116211, "global_step": 92529, "epoch": 764} {"train_loss": -35.56011962890625, "global_step": 92530, "epoch": 764} {"train_loss": -35.950374603271484, "global_step": 92531, "epoch": 764} {"train_loss": -37.75390625, "global_step": 92532, "epoch": 764} {"train_loss": -36.07997512817383, "global_step": 92533, "epoch": 764} {"train_loss": -37.099449157714844, "global_step": 92534, "epoch": 764} {"train_loss": -36.84730911254883, "global_step": 92535, "epoch": 764} {"train_loss": -36.77193832397461, "global_step": 92536, "epoch": 764} {"train_loss": -37.350196838378906, "global_step": 92537, "epoch": 764} {"train_loss": -37.28001022338867, "global_step": 92538, "epoch": 764} {"train_loss": -37.52457046508789, "global_step": 92539, "epoch": 764} {"train_loss": -37.879920959472656, "global_step": 92540, "epoch": 764} {"train_loss": -37.78384017944336, "global_step": 92541, "epoch": 764} {"train_loss": -35.195106506347656, "global_step": 92542, "epoch": 764} {"train_loss": -38.05059814453125, "global_step": 92543, "epoch": 764} {"train_loss": -38.22187805175781, "global_step": 92544, "epoch": 764} {"train_loss": -37.49603271484375, "global_step": 92545, "epoch": 764} {"train_loss": -38.028724670410156, "global_step": 92546, "epoch": 764} {"train_loss": -37.93795394897461, "global_step": 92547, "epoch": 764} {"train_loss": -36.96733856201172, "global_step": 92548, "epoch": 764} {"train_loss": -38.03169631958008, "global_step": 92549, "epoch": 764} {"train_loss": -38.044593811035156, "global_step": 92550, "epoch": 764} {"train_loss": -37.64493179321289, "global_step": 92551, "epoch": 764} {"train_loss": -37.80153274536133, "global_step": 92552, "epoch": 764} {"train_loss": -38.25868606567383, "global_step": 92553, "epoch": 764} {"train_loss": -38.14182662963867, "global_step": 92554, "epoch": 764} {"train_loss": -38.115699768066406, "global_step": 92555, "epoch": 764} {"train_loss": -37.850337982177734, "global_step": 92556, "epoch": 764} {"train_loss": -37.899051666259766, "global_step": 92557, "epoch": 764} {"train_loss": -38.25972366333008, "global_step": 92558, "epoch": 764} {"train_loss": -38.17461013793945, "global_step": 92559, "epoch": 764} {"train_loss": -38.21219253540039, "global_step": 92560, "epoch": 764} {"train_loss": -37.83047866821289, "global_step": 92561, "epoch": 764} {"train_loss": -38.554664611816406, "global_step": 92562, "epoch": 764} {"train_loss": -38.300838470458984, "global_step": 92563, "epoch": 764} {"train_loss": -37.7345957164922, "global_step": 92564, "epoch": 764, "val_loss": 2518444.75} {"train_loss": -38.79830551147461, "global_step": 92565, "epoch": 765} {"train_loss": -38.54362106323242, "global_step": 92566, "epoch": 765} {"train_loss": -38.09592056274414, "global_step": 92567, "epoch": 765} {"train_loss": -38.430458068847656, "global_step": 92568, "epoch": 765} {"train_loss": -38.44545364379883, "global_step": 92569, "epoch": 765} {"train_loss": -38.18558883666992, "global_step": 92570, "epoch": 765} {"train_loss": -39.1010856628418, "global_step": 92571, "epoch": 765} {"train_loss": -39.02312469482422, "global_step": 92572, "epoch": 765} {"train_loss": -38.889312744140625, "global_step": 92573, "epoch": 765} {"train_loss": -38.64608383178711, "global_step": 92574, "epoch": 765} {"train_loss": -38.58449935913086, "global_step": 92575, "epoch": 765} {"train_loss": -38.80367660522461, "global_step": 92576, "epoch": 765} {"train_loss": -37.72672653198242, "global_step": 92577, "epoch": 765} {"train_loss": -38.07374954223633, "global_step": 92578, "epoch": 765} {"train_loss": -38.79895782470703, "global_step": 92579, "epoch": 765} {"train_loss": -38.40815353393555, "global_step": 92580, "epoch": 765} {"train_loss": -38.87042236328125, "global_step": 92581, "epoch": 765} {"train_loss": -38.97652053833008, "global_step": 92582, "epoch": 765} {"train_loss": -39.00989532470703, "global_step": 92583, "epoch": 765} {"train_loss": -38.745208740234375, "global_step": 92584, "epoch": 765} {"train_loss": -39.09052658081055, "global_step": 92585, "epoch": 765} {"train_loss": -38.92622375488281, "global_step": 92586, "epoch": 765} {"train_loss": -38.81761169433594, "global_step": 92587, "epoch": 765} {"train_loss": -38.53464889526367, "global_step": 92588, "epoch": 765} {"train_loss": -37.215240478515625, "global_step": 92589, "epoch": 765} {"train_loss": -36.1716194152832, "global_step": 92590, "epoch": 765} {"train_loss": -33.448577880859375, "global_step": 92591, "epoch": 765} {"train_loss": -28.185827255249023, "global_step": 92592, "epoch": 765} {"train_loss": -19.680809020996094, "global_step": 92593, "epoch": 765} {"train_loss": -25.16592025756836, "global_step": 92594, "epoch": 765} {"train_loss": -39.07089614868164, "global_step": 92595, "epoch": 765} {"train_loss": -27.414295196533203, "global_step": 92596, "epoch": 765} {"train_loss": -33.28083419799805, "global_step": 92597, "epoch": 765} {"train_loss": -35.87461471557617, "global_step": 92598, "epoch": 765} {"train_loss": -35.038326263427734, "global_step": 92599, "epoch": 765} {"train_loss": -36.856788635253906, "global_step": 92600, "epoch": 765} {"train_loss": -35.22357940673828, "global_step": 92601, "epoch": 765} {"train_loss": -35.9005126953125, "global_step": 92602, "epoch": 765} {"train_loss": -36.63796615600586, "global_step": 92603, "epoch": 765} {"train_loss": -35.763641357421875, "global_step": 92604, "epoch": 765} {"train_loss": -37.598548889160156, "global_step": 92605, "epoch": 765} {"train_loss": -36.335205078125, "global_step": 92606, "epoch": 765} {"train_loss": -38.36066818237305, "global_step": 92607, "epoch": 765} {"train_loss": -37.53646469116211, "global_step": 92608, "epoch": 765} {"train_loss": -36.88190841674805, "global_step": 92609, "epoch": 765} {"train_loss": -37.07966613769531, "global_step": 92610, "epoch": 765} {"train_loss": -36.211830139160156, "global_step": 92611, "epoch": 765} {"train_loss": -37.467952728271484, "global_step": 92612, "epoch": 765} {"train_loss": -38.44643020629883, "global_step": 92613, "epoch": 765} {"train_loss": -36.55636978149414, "global_step": 92614, "epoch": 765} {"train_loss": -38.13078689575195, "global_step": 92615, "epoch": 765} {"train_loss": -35.249053955078125, "global_step": 92616, "epoch": 765} {"train_loss": -36.78418731689453, "global_step": 92617, "epoch": 765} {"train_loss": -37.50710678100586, "global_step": 92618, "epoch": 765} {"train_loss": -38.0397834777832, "global_step": 92619, "epoch": 765} {"train_loss": -38.17302322387695, "global_step": 92620, "epoch": 765} {"train_loss": -37.12061309814453, "global_step": 92621, "epoch": 765} {"train_loss": -37.58162307739258, "global_step": 92622, "epoch": 765} {"train_loss": -37.10783004760742, "global_step": 92623, "epoch": 765} {"train_loss": -38.47871017456055, "global_step": 92624, "epoch": 765} {"train_loss": -38.402740478515625, "global_step": 92625, "epoch": 765} {"train_loss": -37.19892501831055, "global_step": 92626, "epoch": 765} {"train_loss": -37.91984939575195, "global_step": 92627, "epoch": 765} {"train_loss": -35.64498519897461, "global_step": 92628, "epoch": 765} {"train_loss": -37.58278274536133, "global_step": 92629, "epoch": 765} {"train_loss": -38.186988830566406, "global_step": 92630, "epoch": 765} {"train_loss": -38.32258224487305, "global_step": 92631, "epoch": 765} {"train_loss": -37.04929733276367, "global_step": 92632, "epoch": 765} {"train_loss": -38.018001556396484, "global_step": 92633, "epoch": 765} {"train_loss": -37.84150314331055, "global_step": 92634, "epoch": 765} {"train_loss": -38.11678695678711, "global_step": 92635, "epoch": 765} {"train_loss": -38.352210998535156, "global_step": 92636, "epoch": 765} {"train_loss": -38.19740676879883, "global_step": 92637, "epoch": 765} {"train_loss": -38.09540939331055, "global_step": 92638, "epoch": 765} {"train_loss": -38.07094192504883, "global_step": 92639, "epoch": 765} {"train_loss": -37.72788619995117, "global_step": 92640, "epoch": 765} {"train_loss": -37.03204345703125, "global_step": 92641, "epoch": 765} {"train_loss": -37.91730499267578, "global_step": 92642, "epoch": 765} {"train_loss": -37.6486930847168, "global_step": 92643, "epoch": 765} {"train_loss": -38.290374755859375, "global_step": 92644, "epoch": 765} {"train_loss": -37.69441604614258, "global_step": 92645, "epoch": 765} {"train_loss": -37.65789794921875, "global_step": 92646, "epoch": 765} {"train_loss": -37.481658935546875, "global_step": 92647, "epoch": 765} {"train_loss": -37.92462921142578, "global_step": 92648, "epoch": 765} {"train_loss": -38.195411682128906, "global_step": 92649, "epoch": 765} {"train_loss": -38.15167999267578, "global_step": 92650, "epoch": 765} {"train_loss": -38.33234786987305, "global_step": 92651, "epoch": 765} {"train_loss": -37.56260299682617, "global_step": 92652, "epoch": 765} {"train_loss": -37.66534423828125, "global_step": 92653, "epoch": 765} {"train_loss": -37.73420333862305, "global_step": 92654, "epoch": 765} {"train_loss": -38.211544036865234, "global_step": 92655, "epoch": 765} {"train_loss": -37.98244857788086, "global_step": 92656, "epoch": 765} {"train_loss": -36.565425872802734, "global_step": 92657, "epoch": 765} {"train_loss": -37.75933837890625, "global_step": 92658, "epoch": 765} {"train_loss": -38.33042526245117, "global_step": 92659, "epoch": 765} {"train_loss": -38.53978729248047, "global_step": 92660, "epoch": 765} {"train_loss": -38.54127502441406, "global_step": 92661, "epoch": 765} {"train_loss": -38.336570739746094, "global_step": 92662, "epoch": 765} {"train_loss": -38.75459671020508, "global_step": 92663, "epoch": 765} {"train_loss": -39.12205123901367, "global_step": 92664, "epoch": 765} {"train_loss": -38.51170349121094, "global_step": 92665, "epoch": 765} {"train_loss": -38.167701721191406, "global_step": 92666, "epoch": 765} {"train_loss": -38.321163177490234, "global_step": 92667, "epoch": 765} {"train_loss": -38.57735061645508, "global_step": 92668, "epoch": 765} {"train_loss": -38.79652786254883, "global_step": 92669, "epoch": 765} {"train_loss": -38.4333610534668, "global_step": 92670, "epoch": 765} {"train_loss": -37.96682357788086, "global_step": 92671, "epoch": 765} {"train_loss": -38.3267936706543, "global_step": 92672, "epoch": 765} {"train_loss": -38.305747985839844, "global_step": 92673, "epoch": 765} {"train_loss": -38.06911849975586, "global_step": 92674, "epoch": 765} {"train_loss": -37.71443557739258, "global_step": 92675, "epoch": 765} {"train_loss": -37.90948486328125, "global_step": 92676, "epoch": 765} {"train_loss": -38.83844757080078, "global_step": 92677, "epoch": 765} {"train_loss": -37.04033279418945, "global_step": 92678, "epoch": 765} {"train_loss": -37.953609466552734, "global_step": 92679, "epoch": 765} {"train_loss": -38.634334564208984, "global_step": 92680, "epoch": 765} {"train_loss": -37.79664993286133, "global_step": 92681, "epoch": 765} {"train_loss": -36.40570068359375, "global_step": 92682, "epoch": 765} {"train_loss": -37.54643630981445, "global_step": 92683, "epoch": 765} {"train_loss": -39.08806228637695, "global_step": 92684, "epoch": 765} {"train_loss": -37.36586857630201, "global_step": 92685, "epoch": 765, "val_loss": 2620678.25} {"train_loss": -38.1822395324707, "global_step": 92686, "epoch": 766} {"train_loss": -38.79548645019531, "global_step": 92687, "epoch": 766} {"train_loss": -37.924652099609375, "global_step": 92688, "epoch": 766} {"train_loss": -37.82455062866211, "global_step": 92689, "epoch": 766} {"train_loss": -38.81147384643555, "global_step": 92690, "epoch": 766} {"train_loss": -38.0850944519043, "global_step": 92691, "epoch": 766} {"train_loss": -38.37199020385742, "global_step": 92692, "epoch": 766} {"train_loss": -35.6653938293457, "global_step": 92693, "epoch": 766} {"train_loss": -34.2859001159668, "global_step": 92694, "epoch": 766} {"train_loss": -36.83883285522461, "global_step": 92695, "epoch": 766} {"train_loss": -36.61951446533203, "global_step": 92696, "epoch": 766} {"train_loss": -37.32931137084961, "global_step": 92697, "epoch": 766} {"train_loss": -37.01089096069336, "global_step": 92698, "epoch": 766} {"train_loss": -37.5604248046875, "global_step": 92699, "epoch": 766} {"train_loss": -36.068748474121094, "global_step": 92700, "epoch": 766} {"train_loss": -36.248878479003906, "global_step": 92701, "epoch": 766} {"train_loss": -35.431739807128906, "global_step": 92702, "epoch": 766} {"train_loss": -36.60334014892578, "global_step": 92703, "epoch": 766} {"train_loss": -36.22894287109375, "global_step": 92704, "epoch": 766} {"train_loss": -34.335330963134766, "global_step": 92705, "epoch": 766} {"train_loss": -35.128692626953125, "global_step": 92706, "epoch": 766} {"train_loss": -37.16872787475586, "global_step": 92707, "epoch": 766} {"train_loss": -36.888057708740234, "global_step": 92708, "epoch": 766} {"train_loss": -34.696746826171875, "global_step": 92709, "epoch": 766} {"train_loss": -33.52103805541992, "global_step": 92710, "epoch": 766} {"train_loss": -37.16102981567383, "global_step": 92711, "epoch": 766} {"train_loss": -36.259620666503906, "global_step": 92712, "epoch": 766} {"train_loss": -35.074623107910156, "global_step": 92713, "epoch": 766} {"train_loss": -35.27649688720703, "global_step": 92714, "epoch": 766} {"train_loss": -36.285396575927734, "global_step": 92715, "epoch": 766} {"train_loss": -18.332324981689453, "global_step": 92716, "epoch": 766} {"train_loss": -35.51887893676758, "global_step": 92717, "epoch": 766} {"train_loss": 6.561913967132568, "global_step": 92718, "epoch": 766} {"train_loss": 8.747206687927246, "global_step": 92719, "epoch": 766} {"train_loss": -15.150731086730957, "global_step": 92720, "epoch": 766} {"train_loss": -25.75491714477539, "global_step": 92721, "epoch": 766} {"train_loss": 13.70945930480957, "global_step": 92722, "epoch": 766} {"train_loss": -13.719192504882812, "global_step": 92723, "epoch": 766} {"train_loss": -26.2471981048584, "global_step": 92724, "epoch": 766} {"train_loss": -25.843053817749023, "global_step": 92725, "epoch": 766} {"train_loss": -25.147146224975586, "global_step": 92726, "epoch": 766} {"train_loss": -20.190673828125, "global_step": 92727, "epoch": 766} {"train_loss": -23.091955184936523, "global_step": 92728, "epoch": 766} {"train_loss": -26.328882217407227, "global_step": 92729, "epoch": 766} {"train_loss": -30.04756736755371, "global_step": 92730, "epoch": 766} {"train_loss": -28.996295928955078, "global_step": 92731, "epoch": 766} {"train_loss": -30.52351188659668, "global_step": 92732, "epoch": 766} {"train_loss": -29.8004093170166, "global_step": 92733, "epoch": 766} {"train_loss": -27.453678131103516, "global_step": 92734, "epoch": 766} {"train_loss": -28.832319259643555, "global_step": 92735, "epoch": 766} {"train_loss": -27.42939567565918, "global_step": 92736, "epoch": 766} {"train_loss": -29.991064071655273, "global_step": 92737, "epoch": 766} {"train_loss": -28.700366973876953, "global_step": 92738, "epoch": 766} {"train_loss": -30.57404136657715, "global_step": 92739, "epoch": 766} {"train_loss": -29.250415802001953, "global_step": 92740, "epoch": 766} {"train_loss": -29.825824737548828, "global_step": 92741, "epoch": 766} {"train_loss": -29.853857040405273, "global_step": 92742, "epoch": 766} {"train_loss": -30.261377334594727, "global_step": 92743, "epoch": 766} {"train_loss": -30.148283004760742, "global_step": 92744, "epoch": 766} {"train_loss": -30.50477409362793, "global_step": 92745, "epoch": 766} {"train_loss": -30.318267822265625, "global_step": 92746, "epoch": 766} {"train_loss": -30.90496253967285, "global_step": 92747, "epoch": 766} {"train_loss": -29.725507736206055, "global_step": 92748, "epoch": 766} {"train_loss": -31.4539852142334, "global_step": 92749, "epoch": 766} {"train_loss": -30.20053482055664, "global_step": 92750, "epoch": 766} {"train_loss": -30.127227783203125, "global_step": 92751, "epoch": 766} {"train_loss": -31.323659896850586, "global_step": 92752, "epoch": 766} {"train_loss": -30.966257095336914, "global_step": 92753, "epoch": 766} {"train_loss": -31.40730094909668, "global_step": 92754, "epoch": 766} {"train_loss": -31.01456069946289, "global_step": 92755, "epoch": 766} {"train_loss": -31.405160903930664, "global_step": 92756, "epoch": 766} {"train_loss": -31.764606475830078, "global_step": 92757, "epoch": 766} {"train_loss": -31.387622833251953, "global_step": 92758, "epoch": 766} {"train_loss": -32.223243713378906, "global_step": 92759, "epoch": 766} {"train_loss": -33.013877868652344, "global_step": 92760, "epoch": 766} {"train_loss": -30.750391006469727, "global_step": 92761, "epoch": 766} {"train_loss": -32.0495491027832, "global_step": 92762, "epoch": 766} {"train_loss": -31.7391414642334, "global_step": 92763, "epoch": 766} {"train_loss": -30.850141525268555, "global_step": 92764, "epoch": 766} {"train_loss": -31.483936309814453, "global_step": 92765, "epoch": 766} {"train_loss": -32.545204162597656, "global_step": 92766, "epoch": 766} {"train_loss": -32.88387680053711, "global_step": 92767, "epoch": 766} {"train_loss": -32.713504791259766, "global_step": 92768, "epoch": 766} {"train_loss": -32.12009811401367, "global_step": 92769, "epoch": 766} {"train_loss": -32.68210983276367, "global_step": 92770, "epoch": 766} {"train_loss": -32.53911209106445, "global_step": 92771, "epoch": 766} {"train_loss": -31.959064483642578, "global_step": 92772, "epoch": 766} {"train_loss": -32.68366241455078, "global_step": 92773, "epoch": 766} {"train_loss": -33.42843246459961, "global_step": 92774, "epoch": 766} {"train_loss": -33.073150634765625, "global_step": 92775, "epoch": 766} {"train_loss": -32.500083923339844, "global_step": 92776, "epoch": 766} {"train_loss": -33.16917419433594, "global_step": 92777, "epoch": 766} {"train_loss": -33.20736312866211, "global_step": 92778, "epoch": 766} {"train_loss": -31.4488468170166, "global_step": 92779, "epoch": 766} {"train_loss": -33.16994857788086, "global_step": 92780, "epoch": 766} {"train_loss": -33.85559844970703, "global_step": 92781, "epoch": 766} {"train_loss": -33.4713020324707, "global_step": 92782, "epoch": 766} {"train_loss": -32.758827209472656, "global_step": 92783, "epoch": 766} {"train_loss": -33.256019592285156, "global_step": 92784, "epoch": 766} {"train_loss": -32.68555450439453, "global_step": 92785, "epoch": 766} {"train_loss": -33.29999923706055, "global_step": 92786, "epoch": 766} {"train_loss": -32.813148498535156, "global_step": 92787, "epoch": 766} {"train_loss": -33.660770416259766, "global_step": 92788, "epoch": 766} {"train_loss": -33.102413177490234, "global_step": 92789, "epoch": 766} {"train_loss": -32.74445724487305, "global_step": 92790, "epoch": 766} {"train_loss": -33.28904342651367, "global_step": 92791, "epoch": 766} {"train_loss": -33.96236038208008, "global_step": 92792, "epoch": 766} {"train_loss": -33.54903030395508, "global_step": 92793, "epoch": 766} {"train_loss": -34.102508544921875, "global_step": 92794, "epoch": 766} {"train_loss": -33.88295364379883, "global_step": 92795, "epoch": 766} {"train_loss": -33.5118522644043, "global_step": 92796, "epoch": 766} {"train_loss": -34.362701416015625, "global_step": 92797, "epoch": 766} {"train_loss": -34.0751953125, "global_step": 92798, "epoch": 766} {"train_loss": -35.11646270751953, "global_step": 92799, "epoch": 766} {"train_loss": -34.22748947143555, "global_step": 92800, "epoch": 766} {"train_loss": -33.94314956665039, "global_step": 92801, "epoch": 766} {"train_loss": -34.499019622802734, "global_step": 92802, "epoch": 766} {"train_loss": -34.49873352050781, "global_step": 92803, "epoch": 766} {"train_loss": -34.6251335144043, "global_step": 92804, "epoch": 766} {"train_loss": -34.73187255859375, "global_step": 92805, "epoch": 766} {"train_loss": -31.29199953709752, "global_step": 92806, "epoch": 766, "val_loss": 2635221.0} {"train_loss": -34.386871337890625, "global_step": 92807, "epoch": 767} {"train_loss": -34.63286209106445, "global_step": 92808, "epoch": 767} {"train_loss": -34.48259353637695, "global_step": 92809, "epoch": 767} {"train_loss": -35.11197280883789, "global_step": 92810, "epoch": 767} {"train_loss": -34.29931640625, "global_step": 92811, "epoch": 767} {"train_loss": -34.834800720214844, "global_step": 92812, "epoch": 767} {"train_loss": -34.83781433105469, "global_step": 92813, "epoch": 767} {"train_loss": -35.19632339477539, "global_step": 92814, "epoch": 767} {"train_loss": -33.64052963256836, "global_step": 92815, "epoch": 767} {"train_loss": -34.85072708129883, "global_step": 92816, "epoch": 767} {"train_loss": -35.62464904785156, "global_step": 92817, "epoch": 767} {"train_loss": -34.52267837524414, "global_step": 92818, "epoch": 767} {"train_loss": -35.878902435302734, "global_step": 92819, "epoch": 767} {"train_loss": -34.88670349121094, "global_step": 92820, "epoch": 767} {"train_loss": -35.42598342895508, "global_step": 92821, "epoch": 767} {"train_loss": -34.97320556640625, "global_step": 92822, "epoch": 767} {"train_loss": -35.74276351928711, "global_step": 92823, "epoch": 767} {"train_loss": -35.06153869628906, "global_step": 92824, "epoch": 767} {"train_loss": -34.32341003417969, "global_step": 92825, "epoch": 767} {"train_loss": -34.98126983642578, "global_step": 92826, "epoch": 767} {"train_loss": -35.61783981323242, "global_step": 92827, "epoch": 767} {"train_loss": -34.951576232910156, "global_step": 92828, "epoch": 767} {"train_loss": -35.73508834838867, "global_step": 92829, "epoch": 767} {"train_loss": -35.4317626953125, "global_step": 92830, "epoch": 767} {"train_loss": -35.45142364501953, "global_step": 92831, "epoch": 767} {"train_loss": -35.761600494384766, "global_step": 92832, "epoch": 767} {"train_loss": -36.31735610961914, "global_step": 92833, "epoch": 767} {"train_loss": -35.104488372802734, "global_step": 92834, "epoch": 767} {"train_loss": -36.363807678222656, "global_step": 92835, "epoch": 767} {"train_loss": -35.2503776550293, "global_step": 92836, "epoch": 767} {"train_loss": -35.526851654052734, "global_step": 92837, "epoch": 767} {"train_loss": -34.866092681884766, "global_step": 92838, "epoch": 767} {"train_loss": -36.40082931518555, "global_step": 92839, "epoch": 767} {"train_loss": -35.181758880615234, "global_step": 92840, "epoch": 767} {"train_loss": -35.632972717285156, "global_step": 92841, "epoch": 767} {"train_loss": -35.938385009765625, "global_step": 92842, "epoch": 767} {"train_loss": -36.451412200927734, "global_step": 92843, "epoch": 767} {"train_loss": -34.904476165771484, "global_step": 92844, "epoch": 767} {"train_loss": -36.607398986816406, "global_step": 92845, "epoch": 767} {"train_loss": -35.60087966918945, "global_step": 92846, "epoch": 767} {"train_loss": -35.711849212646484, "global_step": 92847, "epoch": 767} {"train_loss": -36.649654388427734, "global_step": 92848, "epoch": 767} {"train_loss": -35.764808654785156, "global_step": 92849, "epoch": 767} {"train_loss": -35.73000717163086, "global_step": 92850, "epoch": 767} {"train_loss": -35.91961669921875, "global_step": 92851, "epoch": 767} {"train_loss": -36.16054916381836, "global_step": 92852, "epoch": 767} {"train_loss": -36.094154357910156, "global_step": 92853, "epoch": 767} {"train_loss": -35.315425872802734, "global_step": 92854, "epoch": 767} {"train_loss": -36.0659294128418, "global_step": 92855, "epoch": 767} {"train_loss": -36.00360870361328, "global_step": 92856, "epoch": 767} {"train_loss": -36.19607162475586, "global_step": 92857, "epoch": 767} {"train_loss": -35.770809173583984, "global_step": 92858, "epoch": 767} {"train_loss": -36.565372467041016, "global_step": 92859, "epoch": 767} {"train_loss": -36.497100830078125, "global_step": 92860, "epoch": 767} {"train_loss": -36.36023712158203, "global_step": 92861, "epoch": 767} {"train_loss": -36.3133544921875, "global_step": 92862, "epoch": 767} {"train_loss": -36.36512756347656, "global_step": 92863, "epoch": 767} {"train_loss": -35.7489013671875, "global_step": 92864, "epoch": 767} {"train_loss": -36.27825164794922, "global_step": 92865, "epoch": 767} {"train_loss": -36.6646842956543, "global_step": 92866, "epoch": 767} {"train_loss": -34.61896896362305, "global_step": 92867, "epoch": 767} {"train_loss": -36.354393005371094, "global_step": 92868, "epoch": 767} {"train_loss": -35.700904846191406, "global_step": 92869, "epoch": 767} {"train_loss": -35.26506805419922, "global_step": 92870, "epoch": 767} {"train_loss": -35.73942565917969, "global_step": 92871, "epoch": 767} {"train_loss": -36.21857833862305, "global_step": 92872, "epoch": 767} {"train_loss": -34.45907211303711, "global_step": 92873, "epoch": 767} {"train_loss": -34.997379302978516, "global_step": 92874, "epoch": 767} {"train_loss": -34.64164352416992, "global_step": 92875, "epoch": 767} {"train_loss": -35.7977409362793, "global_step": 92876, "epoch": 767} {"train_loss": -32.6879768371582, "global_step": 92877, "epoch": 767} {"train_loss": -35.26010513305664, "global_step": 92878, "epoch": 767} {"train_loss": -34.43233108520508, "global_step": 92879, "epoch": 767} {"train_loss": -33.12855911254883, "global_step": 92880, "epoch": 767} {"train_loss": -25.681577682495117, "global_step": 92881, "epoch": 767} {"train_loss": -31.32087516784668, "global_step": 92882, "epoch": 767} {"train_loss": -32.239070892333984, "global_step": 92883, "epoch": 767} {"train_loss": -26.23480224609375, "global_step": 92884, "epoch": 767} {"train_loss": -32.60700225830078, "global_step": 92885, "epoch": 767} {"train_loss": -31.033720016479492, "global_step": 92886, "epoch": 767} {"train_loss": -30.356595993041992, "global_step": 92887, "epoch": 767} {"train_loss": -35.472938537597656, "global_step": 92888, "epoch": 767} {"train_loss": -33.353515625, "global_step": 92889, "epoch": 767} {"train_loss": -30.014501571655273, "global_step": 92890, "epoch": 767} {"train_loss": -34.890010833740234, "global_step": 92891, "epoch": 767} {"train_loss": -34.8248405456543, "global_step": 92892, "epoch": 767} {"train_loss": -33.7232666015625, "global_step": 92893, "epoch": 767} {"train_loss": -33.23115539550781, "global_step": 92894, "epoch": 767} {"train_loss": -35.06916809082031, "global_step": 92895, "epoch": 767} {"train_loss": -36.07514190673828, "global_step": 92896, "epoch": 767} {"train_loss": -36.23427200317383, "global_step": 92897, "epoch": 767} {"train_loss": -34.78813552856445, "global_step": 92898, "epoch": 767} {"train_loss": -34.82112503051758, "global_step": 92899, "epoch": 767} {"train_loss": -35.24637985229492, "global_step": 92900, "epoch": 767} {"train_loss": -35.85175704956055, "global_step": 92901, "epoch": 767} {"train_loss": -36.669368743896484, "global_step": 92902, "epoch": 767} {"train_loss": -36.38810348510742, "global_step": 92903, "epoch": 767} {"train_loss": -35.905860900878906, "global_step": 92904, "epoch": 767} {"train_loss": -36.37605667114258, "global_step": 92905, "epoch": 767} {"train_loss": -35.83420944213867, "global_step": 92906, "epoch": 767} {"train_loss": -35.79157257080078, "global_step": 92907, "epoch": 767} {"train_loss": -36.17356491088867, "global_step": 92908, "epoch": 767} {"train_loss": -36.28314208984375, "global_step": 92909, "epoch": 767} {"train_loss": -35.64596176147461, "global_step": 92910, "epoch": 767} {"train_loss": -36.20314407348633, "global_step": 92911, "epoch": 767} {"train_loss": -36.44179916381836, "global_step": 92912, "epoch": 767} {"train_loss": -35.355384826660156, "global_step": 92913, "epoch": 767} {"train_loss": -36.41440963745117, "global_step": 92914, "epoch": 767} {"train_loss": -36.12063980102539, "global_step": 92915, "epoch": 767} {"train_loss": -36.49580001831055, "global_step": 92916, "epoch": 767} {"train_loss": -36.06803512573242, "global_step": 92917, "epoch": 767} {"train_loss": -36.025146484375, "global_step": 92918, "epoch": 767} {"train_loss": -36.27933120727539, "global_step": 92919, "epoch": 767} {"train_loss": -36.5329475402832, "global_step": 92920, "epoch": 767} {"train_loss": -36.639259338378906, "global_step": 92921, "epoch": 767} {"train_loss": -36.27561569213867, "global_step": 92922, "epoch": 767} {"train_loss": -36.3102912902832, "global_step": 92923, "epoch": 767} {"train_loss": -36.77442169189453, "global_step": 92924, "epoch": 767} {"train_loss": -37.027618408203125, "global_step": 92925, "epoch": 767} {"train_loss": -36.50056076049805, "global_step": 92926, "epoch": 767} {"train_loss": -35.19378565953783, "global_step": 92927, "epoch": 767, "val_loss": 2528382.75} {"train_loss": -36.90983581542969, "global_step": 92928, "epoch": 768} {"train_loss": -37.099037170410156, "global_step": 92929, "epoch": 768} {"train_loss": -36.7341423034668, "global_step": 92930, "epoch": 768} {"train_loss": -36.70809555053711, "global_step": 92931, "epoch": 768} {"train_loss": -36.342464447021484, "global_step": 92932, "epoch": 768} {"train_loss": -36.51857376098633, "global_step": 92933, "epoch": 768} {"train_loss": -36.18376541137695, "global_step": 92934, "epoch": 768} {"train_loss": -36.7270393371582, "global_step": 92935, "epoch": 768} {"train_loss": -36.822208404541016, "global_step": 92936, "epoch": 768} {"train_loss": -37.526756286621094, "global_step": 92937, "epoch": 768} {"train_loss": -36.76095962524414, "global_step": 92938, "epoch": 768} {"train_loss": -37.097408294677734, "global_step": 92939, "epoch": 768} {"train_loss": -37.978492736816406, "global_step": 92940, "epoch": 768} {"train_loss": -37.041866302490234, "global_step": 92941, "epoch": 768} {"train_loss": -36.842586517333984, "global_step": 92942, "epoch": 768} {"train_loss": -36.72727584838867, "global_step": 92943, "epoch": 768} {"train_loss": -36.24819564819336, "global_step": 92944, "epoch": 768} {"train_loss": -33.349273681640625, "global_step": 92945, "epoch": 768} {"train_loss": -24.69636344909668, "global_step": 92946, "epoch": 768} {"train_loss": -11.111807823181152, "global_step": 92947, "epoch": 768} {"train_loss": -22.97829246520996, "global_step": 92948, "epoch": 768} {"train_loss": -36.79389572143555, "global_step": 92949, "epoch": 768} {"train_loss": -26.312519073486328, "global_step": 92950, "epoch": 768} {"train_loss": -31.868927001953125, "global_step": 92951, "epoch": 768} {"train_loss": -35.280120849609375, "global_step": 92952, "epoch": 768} {"train_loss": -33.25112533569336, "global_step": 92953, "epoch": 768} {"train_loss": -34.374053955078125, "global_step": 92954, "epoch": 768} {"train_loss": -34.52845001220703, "global_step": 92955, "epoch": 768} {"train_loss": -34.85302734375, "global_step": 92956, "epoch": 768} {"train_loss": -34.99097442626953, "global_step": 92957, "epoch": 768} {"train_loss": -35.10108184814453, "global_step": 92958, "epoch": 768} {"train_loss": -36.3297004699707, "global_step": 92959, "epoch": 768} {"train_loss": -35.33895492553711, "global_step": 92960, "epoch": 768} {"train_loss": -36.258827209472656, "global_step": 92961, "epoch": 768} {"train_loss": -35.86422348022461, "global_step": 92962, "epoch": 768} {"train_loss": -35.120765686035156, "global_step": 92963, "epoch": 768} {"train_loss": -36.46982955932617, "global_step": 92964, "epoch": 768} {"train_loss": -36.57578659057617, "global_step": 92965, "epoch": 768} {"train_loss": -35.97244644165039, "global_step": 92966, "epoch": 768} {"train_loss": -36.383758544921875, "global_step": 92967, "epoch": 768} {"train_loss": -36.186676025390625, "global_step": 92968, "epoch": 768} {"train_loss": -36.346431732177734, "global_step": 92969, "epoch": 768} {"train_loss": -35.94255065917969, "global_step": 92970, "epoch": 768} {"train_loss": -36.73834991455078, "global_step": 92971, "epoch": 768} {"train_loss": -35.9031867980957, "global_step": 92972, "epoch": 768} {"train_loss": -36.92920684814453, "global_step": 92973, "epoch": 768} {"train_loss": -36.596946716308594, "global_step": 92974, "epoch": 768} {"train_loss": -36.5285758972168, "global_step": 92975, "epoch": 768} {"train_loss": -36.278297424316406, "global_step": 92976, "epoch": 768} {"train_loss": -37.25313186645508, "global_step": 92977, "epoch": 768} {"train_loss": -36.60418701171875, "global_step": 92978, "epoch": 768} {"train_loss": -36.850582122802734, "global_step": 92979, "epoch": 768} {"train_loss": -37.034584045410156, "global_step": 92980, "epoch": 768} {"train_loss": -37.247127532958984, "global_step": 92981, "epoch": 768} {"train_loss": -36.94516372680664, "global_step": 92982, "epoch": 768} {"train_loss": -36.833900451660156, "global_step": 92983, "epoch": 768} {"train_loss": -36.596309661865234, "global_step": 92984, "epoch": 768} {"train_loss": -36.61119842529297, "global_step": 92985, "epoch": 768} {"train_loss": -36.49225616455078, "global_step": 92986, "epoch": 768} {"train_loss": -36.77541732788086, "global_step": 92987, "epoch": 768} {"train_loss": -36.48106002807617, "global_step": 92988, "epoch": 768} {"train_loss": -37.3583984375, "global_step": 92989, "epoch": 768} {"train_loss": -35.736873626708984, "global_step": 92990, "epoch": 768} {"train_loss": -37.233070373535156, "global_step": 92991, "epoch": 768} {"train_loss": -36.7061767578125, "global_step": 92992, "epoch": 768} {"train_loss": -38.26569366455078, "global_step": 92993, "epoch": 768} {"train_loss": -36.846649169921875, "global_step": 92994, "epoch": 768} {"train_loss": -37.3700065612793, "global_step": 92995, "epoch": 768} {"train_loss": -37.32990264892578, "global_step": 92996, "epoch": 768} {"train_loss": -36.71049880981445, "global_step": 92997, "epoch": 768} {"train_loss": -37.67432403564453, "global_step": 92998, "epoch": 768} {"train_loss": -37.03797912597656, "global_step": 92999, "epoch": 768} {"train_loss": -37.18604278564453, "global_step": 93000, "epoch": 768} {"train_loss": -37.69647979736328, "global_step": 93001, "epoch": 768} {"train_loss": -37.165771484375, "global_step": 93002, "epoch": 768} {"train_loss": -37.645503997802734, "global_step": 93003, "epoch": 768} {"train_loss": -37.77811813354492, "global_step": 93004, "epoch": 768} {"train_loss": -37.82371139526367, "global_step": 93005, "epoch": 768} {"train_loss": -37.65643310546875, "global_step": 93006, "epoch": 768} {"train_loss": -37.29829788208008, "global_step": 93007, "epoch": 768} {"train_loss": -37.473873138427734, "global_step": 93008, "epoch": 768} {"train_loss": -37.70420455932617, "global_step": 93009, "epoch": 768} {"train_loss": -37.77955627441406, "global_step": 93010, "epoch": 768} {"train_loss": -38.17893600463867, "global_step": 93011, "epoch": 768} {"train_loss": -37.05040740966797, "global_step": 93012, "epoch": 768} {"train_loss": -37.39200973510742, "global_step": 93013, "epoch": 768} {"train_loss": -37.77711486816406, "global_step": 93014, "epoch": 768} {"train_loss": -37.44300079345703, "global_step": 93015, "epoch": 768} {"train_loss": -38.172950744628906, "global_step": 93016, "epoch": 768} {"train_loss": -37.387603759765625, "global_step": 93017, "epoch": 768} {"train_loss": -37.66986846923828, "global_step": 93018, "epoch": 768} {"train_loss": -37.85917282104492, "global_step": 93019, "epoch": 768} {"train_loss": -37.58427810668945, "global_step": 93020, "epoch": 768} {"train_loss": -37.5138053894043, "global_step": 93021, "epoch": 768} {"train_loss": -38.004459381103516, "global_step": 93022, "epoch": 768} {"train_loss": -37.720314025878906, "global_step": 93023, "epoch": 768} {"train_loss": -37.9992790222168, "global_step": 93024, "epoch": 768} {"train_loss": -37.67761993408203, "global_step": 93025, "epoch": 768} {"train_loss": -37.63222122192383, "global_step": 93026, "epoch": 768} {"train_loss": -38.32392120361328, "global_step": 93027, "epoch": 768} {"train_loss": -37.58259201049805, "global_step": 93028, "epoch": 768} {"train_loss": -37.610206604003906, "global_step": 93029, "epoch": 768} {"train_loss": -37.9728889465332, "global_step": 93030, "epoch": 768} {"train_loss": -37.49827194213867, "global_step": 93031, "epoch": 768} {"train_loss": -37.94470977783203, "global_step": 93032, "epoch": 768} {"train_loss": -36.62177658081055, "global_step": 93033, "epoch": 768} {"train_loss": -37.03566360473633, "global_step": 93034, "epoch": 768} {"train_loss": -37.539669036865234, "global_step": 93035, "epoch": 768} {"train_loss": -37.9454231262207, "global_step": 93036, "epoch": 768} {"train_loss": -36.772823333740234, "global_step": 93037, "epoch": 768} {"train_loss": -37.022796630859375, "global_step": 93038, "epoch": 768} {"train_loss": -37.04832077026367, "global_step": 93039, "epoch": 768} {"train_loss": -37.562904357910156, "global_step": 93040, "epoch": 768} {"train_loss": -36.542667388916016, "global_step": 93041, "epoch": 768} {"train_loss": -38.26638412475586, "global_step": 93042, "epoch": 768} {"train_loss": -36.84783935546875, "global_step": 93043, "epoch": 768} {"train_loss": -36.841365814208984, "global_step": 93044, "epoch": 768} {"train_loss": -36.08059310913086, "global_step": 93045, "epoch": 768} {"train_loss": -35.93589401245117, "global_step": 93046, "epoch": 768} {"train_loss": -37.311676025390625, "global_step": 93047, "epoch": 768} {"train_loss": -36.31686441563377, "global_step": 93048, "epoch": 768, "val_loss": 2534061.75} {"train_loss": -36.20718002319336, "global_step": 93049, "epoch": 769} {"train_loss": -34.98228073120117, "global_step": 93050, "epoch": 769} {"train_loss": -34.48055648803711, "global_step": 93051, "epoch": 769} {"train_loss": -34.24588394165039, "global_step": 93052, "epoch": 769} {"train_loss": -36.32904052734375, "global_step": 93053, "epoch": 769} {"train_loss": -37.18143844604492, "global_step": 93054, "epoch": 769} {"train_loss": -36.61705780029297, "global_step": 93055, "epoch": 769} {"train_loss": -37.179420471191406, "global_step": 93056, "epoch": 769} {"train_loss": -36.911800384521484, "global_step": 93057, "epoch": 769} {"train_loss": -36.290016174316406, "global_step": 93058, "epoch": 769} {"train_loss": -37.06141662597656, "global_step": 93059, "epoch": 769} {"train_loss": -35.97846221923828, "global_step": 93060, "epoch": 769} {"train_loss": -36.185523986816406, "global_step": 93061, "epoch": 769} {"train_loss": -37.6682243347168, "global_step": 93062, "epoch": 769} {"train_loss": -37.06254577636719, "global_step": 93063, "epoch": 769} {"train_loss": -37.1717643737793, "global_step": 93064, "epoch": 769} {"train_loss": -37.12965774536133, "global_step": 93065, "epoch": 769} {"train_loss": -37.71377182006836, "global_step": 93066, "epoch": 769} {"train_loss": -37.447139739990234, "global_step": 93067, "epoch": 769} {"train_loss": -37.27003860473633, "global_step": 93068, "epoch": 769} {"train_loss": -37.7269401550293, "global_step": 93069, "epoch": 769} {"train_loss": -37.849422454833984, "global_step": 93070, "epoch": 769} {"train_loss": -37.596839904785156, "global_step": 93071, "epoch": 769} {"train_loss": -38.2119026184082, "global_step": 93072, "epoch": 769} {"train_loss": -38.23573684692383, "global_step": 93073, "epoch": 769} {"train_loss": -37.88017272949219, "global_step": 93074, "epoch": 769} {"train_loss": -37.96828842163086, "global_step": 93075, "epoch": 769} {"train_loss": -38.013404846191406, "global_step": 93076, "epoch": 769} {"train_loss": -36.93257522583008, "global_step": 93077, "epoch": 769} {"train_loss": -37.91142654418945, "global_step": 93078, "epoch": 769} {"train_loss": -37.798526763916016, "global_step": 93079, "epoch": 769} {"train_loss": -37.54165267944336, "global_step": 93080, "epoch": 769} {"train_loss": -38.15705108642578, "global_step": 93081, "epoch": 769} {"train_loss": -38.20131301879883, "global_step": 93082, "epoch": 769} {"train_loss": -38.31549835205078, "global_step": 93083, "epoch": 769} {"train_loss": -37.462032318115234, "global_step": 93084, "epoch": 769} {"train_loss": -37.476009368896484, "global_step": 93085, "epoch": 769} {"train_loss": -38.68598175048828, "global_step": 93086, "epoch": 769} {"train_loss": -38.3557243347168, "global_step": 93087, "epoch": 769} {"train_loss": -38.32094955444336, "global_step": 93088, "epoch": 769} {"train_loss": -38.28315353393555, "global_step": 93089, "epoch": 769} {"train_loss": -38.390098571777344, "global_step": 93090, "epoch": 769} {"train_loss": -38.634521484375, "global_step": 93091, "epoch": 769} {"train_loss": -37.42035675048828, "global_step": 93092, "epoch": 769} {"train_loss": -38.0374755859375, "global_step": 93093, "epoch": 769} {"train_loss": -37.652801513671875, "global_step": 93094, "epoch": 769} {"train_loss": -37.806251525878906, "global_step": 93095, "epoch": 769} {"train_loss": -38.11267852783203, "global_step": 93096, "epoch": 769} {"train_loss": -38.60144805908203, "global_step": 93097, "epoch": 769} {"train_loss": -38.46046829223633, "global_step": 93098, "epoch": 769} {"train_loss": -38.89730453491211, "global_step": 93099, "epoch": 769} {"train_loss": -37.44851303100586, "global_step": 93100, "epoch": 769} {"train_loss": -38.4644889831543, "global_step": 93101, "epoch": 769} {"train_loss": -38.566802978515625, "global_step": 93102, "epoch": 769} {"train_loss": -37.379539489746094, "global_step": 93103, "epoch": 769} {"train_loss": -37.955291748046875, "global_step": 93104, "epoch": 769} {"train_loss": -37.140296936035156, "global_step": 93105, "epoch": 769} {"train_loss": -37.72384262084961, "global_step": 93106, "epoch": 769} {"train_loss": -35.126182556152344, "global_step": 93107, "epoch": 769} {"train_loss": -36.8873291015625, "global_step": 93108, "epoch": 769} {"train_loss": -36.69145965576172, "global_step": 93109, "epoch": 769} {"train_loss": -37.13715744018555, "global_step": 93110, "epoch": 769} {"train_loss": -38.973060607910156, "global_step": 93111, "epoch": 769} {"train_loss": -37.58899688720703, "global_step": 93112, "epoch": 769} {"train_loss": -37.9648551940918, "global_step": 93113, "epoch": 769} {"train_loss": -37.14002227783203, "global_step": 93114, "epoch": 769} {"train_loss": -36.28046798706055, "global_step": 93115, "epoch": 769} {"train_loss": -36.4619140625, "global_step": 93116, "epoch": 769} {"train_loss": -36.623756408691406, "global_step": 93117, "epoch": 769} {"train_loss": -37.192726135253906, "global_step": 93118, "epoch": 769} {"train_loss": -36.70050048828125, "global_step": 93119, "epoch": 769} {"train_loss": -37.66868209838867, "global_step": 93120, "epoch": 769} {"train_loss": -37.879127502441406, "global_step": 93121, "epoch": 769} {"train_loss": -37.578548431396484, "global_step": 93122, "epoch": 769} {"train_loss": -37.23997116088867, "global_step": 93123, "epoch": 769} {"train_loss": -38.66485595703125, "global_step": 93124, "epoch": 769} {"train_loss": -37.6245002746582, "global_step": 93125, "epoch": 769} {"train_loss": -37.052894592285156, "global_step": 93126, "epoch": 769} {"train_loss": -37.073055267333984, "global_step": 93127, "epoch": 769} {"train_loss": -37.78122329711914, "global_step": 93128, "epoch": 769} {"train_loss": -37.360286712646484, "global_step": 93129, "epoch": 769} {"train_loss": -37.84633255004883, "global_step": 93130, "epoch": 769} {"train_loss": -36.893272399902344, "global_step": 93131, "epoch": 769} {"train_loss": -37.411094665527344, "global_step": 93132, "epoch": 769} {"train_loss": -38.14488983154297, "global_step": 93133, "epoch": 769} {"train_loss": -37.60183334350586, "global_step": 93134, "epoch": 769} {"train_loss": -38.34088134765625, "global_step": 93135, "epoch": 769} {"train_loss": -37.66152572631836, "global_step": 93136, "epoch": 769} {"train_loss": -37.13177490234375, "global_step": 93137, "epoch": 769} {"train_loss": -37.95817184448242, "global_step": 93138, "epoch": 769} {"train_loss": -38.580841064453125, "global_step": 93139, "epoch": 769} {"train_loss": -37.33524703979492, "global_step": 93140, "epoch": 769} {"train_loss": -36.94720458984375, "global_step": 93141, "epoch": 769} {"train_loss": -37.98124313354492, "global_step": 93142, "epoch": 769} {"train_loss": -37.996315002441406, "global_step": 93143, "epoch": 769} {"train_loss": -38.4658203125, "global_step": 93144, "epoch": 769} {"train_loss": -38.07333755493164, "global_step": 93145, "epoch": 769} {"train_loss": -38.24662780761719, "global_step": 93146, "epoch": 769} {"train_loss": -38.61970901489258, "global_step": 93147, "epoch": 769} {"train_loss": -38.45756149291992, "global_step": 93148, "epoch": 769} {"train_loss": -38.06620407104492, "global_step": 93149, "epoch": 769} {"train_loss": -38.47207260131836, "global_step": 93150, "epoch": 769} {"train_loss": -37.9170036315918, "global_step": 93151, "epoch": 769} {"train_loss": -37.387508392333984, "global_step": 93152, "epoch": 769} {"train_loss": -37.666595458984375, "global_step": 93153, "epoch": 769} {"train_loss": -36.573219299316406, "global_step": 93154, "epoch": 769} {"train_loss": -37.493309020996094, "global_step": 93155, "epoch": 769} {"train_loss": -37.38553237915039, "global_step": 93156, "epoch": 769} {"train_loss": -37.621437072753906, "global_step": 93157, "epoch": 769} {"train_loss": -37.856929779052734, "global_step": 93158, "epoch": 769} {"train_loss": -37.18225860595703, "global_step": 93159, "epoch": 769} {"train_loss": -36.555301666259766, "global_step": 93160, "epoch": 769} {"train_loss": -37.799739837646484, "global_step": 93161, "epoch": 769} {"train_loss": -35.978172302246094, "global_step": 93162, "epoch": 769} {"train_loss": -36.331966400146484, "global_step": 93163, "epoch": 769} {"train_loss": -36.626312255859375, "global_step": 93164, "epoch": 769} {"train_loss": -37.37092208862305, "global_step": 93165, "epoch": 769} {"train_loss": -37.68452072143555, "global_step": 93166, "epoch": 769} {"train_loss": -36.10649108886719, "global_step": 93167, "epoch": 769} {"train_loss": -36.704017639160156, "global_step": 93168, "epoch": 769} {"train_loss": -37.46968828942165, "global_step": 93169, "epoch": 769, "val_loss": 2530122.25} {"train_loss": -37.393863677978516, "global_step": 93170, "epoch": 770} {"train_loss": -36.31856155395508, "global_step": 93171, "epoch": 770} {"train_loss": -34.36115646362305, "global_step": 93172, "epoch": 770} {"train_loss": -36.60715866088867, "global_step": 93173, "epoch": 770} {"train_loss": -37.049110412597656, "global_step": 93174, "epoch": 770} {"train_loss": -35.03675842285156, "global_step": 93175, "epoch": 770} {"train_loss": -36.64583969116211, "global_step": 93176, "epoch": 770} {"train_loss": -37.20692825317383, "global_step": 93177, "epoch": 770} {"train_loss": -37.5921516418457, "global_step": 93178, "epoch": 770} {"train_loss": -36.471923828125, "global_step": 93179, "epoch": 770} {"train_loss": -37.430511474609375, "global_step": 93180, "epoch": 770} {"train_loss": -37.52764892578125, "global_step": 93181, "epoch": 770} {"train_loss": -37.32805252075195, "global_step": 93182, "epoch": 770} {"train_loss": -37.19039535522461, "global_step": 93183, "epoch": 770} {"train_loss": -34.953739166259766, "global_step": 93184, "epoch": 770} {"train_loss": -34.42395782470703, "global_step": 93185, "epoch": 770} {"train_loss": -37.834197998046875, "global_step": 93186, "epoch": 770} {"train_loss": -34.55058288574219, "global_step": 93187, "epoch": 770} {"train_loss": -36.45977783203125, "global_step": 93188, "epoch": 770} {"train_loss": -37.729244232177734, "global_step": 93189, "epoch": 770} {"train_loss": -36.736541748046875, "global_step": 93190, "epoch": 770} {"train_loss": -36.38816452026367, "global_step": 93191, "epoch": 770} {"train_loss": -38.20512008666992, "global_step": 93192, "epoch": 770} {"train_loss": -35.72560119628906, "global_step": 93193, "epoch": 770} {"train_loss": -37.300655364990234, "global_step": 93194, "epoch": 770} {"train_loss": -37.0208854675293, "global_step": 93195, "epoch": 770} {"train_loss": -37.24858474731445, "global_step": 93196, "epoch": 770} {"train_loss": -37.87083435058594, "global_step": 93197, "epoch": 770} {"train_loss": -37.7118034362793, "global_step": 93198, "epoch": 770} {"train_loss": -37.58646774291992, "global_step": 93199, "epoch": 770} {"train_loss": -37.7382926940918, "global_step": 93200, "epoch": 770} {"train_loss": -37.38822555541992, "global_step": 93201, "epoch": 770} {"train_loss": -37.40898132324219, "global_step": 93202, "epoch": 770} {"train_loss": -37.05742263793945, "global_step": 93203, "epoch": 770} {"train_loss": -37.077430725097656, "global_step": 93204, "epoch": 770} {"train_loss": -37.746089935302734, "global_step": 93205, "epoch": 770} {"train_loss": -37.47634506225586, "global_step": 93206, "epoch": 770} {"train_loss": -37.95426559448242, "global_step": 93207, "epoch": 770} {"train_loss": -37.175811767578125, "global_step": 93208, "epoch": 770} {"train_loss": -35.079219818115234, "global_step": 93209, "epoch": 770} {"train_loss": -37.98044967651367, "global_step": 93210, "epoch": 770} {"train_loss": -37.180912017822266, "global_step": 93211, "epoch": 770} {"train_loss": -35.81376266479492, "global_step": 93212, "epoch": 770} {"train_loss": -36.29269027709961, "global_step": 93213, "epoch": 770} {"train_loss": -35.76074981689453, "global_step": 93214, "epoch": 770} {"train_loss": -32.022735595703125, "global_step": 93215, "epoch": 770} {"train_loss": -34.06858444213867, "global_step": 93216, "epoch": 770} {"train_loss": -34.22557830810547, "global_step": 93217, "epoch": 770} {"train_loss": -36.873992919921875, "global_step": 93218, "epoch": 770} {"train_loss": -34.18247604370117, "global_step": 93219, "epoch": 770} {"train_loss": -35.711158752441406, "global_step": 93220, "epoch": 770} {"train_loss": -33.66963195800781, "global_step": 93221, "epoch": 770} {"train_loss": -36.55739974975586, "global_step": 93222, "epoch": 770} {"train_loss": -36.4099235534668, "global_step": 93223, "epoch": 770} {"train_loss": -36.4096565246582, "global_step": 93224, "epoch": 770} {"train_loss": -35.45722579956055, "global_step": 93225, "epoch": 770} {"train_loss": -34.574737548828125, "global_step": 93226, "epoch": 770} {"train_loss": -35.5870361328125, "global_step": 93227, "epoch": 770} {"train_loss": -35.39925003051758, "global_step": 93228, "epoch": 770} {"train_loss": -36.63152313232422, "global_step": 93229, "epoch": 770} {"train_loss": -37.204742431640625, "global_step": 93230, "epoch": 770} {"train_loss": -37.03994369506836, "global_step": 93231, "epoch": 770} {"train_loss": -37.48097229003906, "global_step": 93232, "epoch": 770} {"train_loss": -35.80622482299805, "global_step": 93233, "epoch": 770} {"train_loss": -36.92753982543945, "global_step": 93234, "epoch": 770} {"train_loss": -37.08210372924805, "global_step": 93235, "epoch": 770} {"train_loss": -37.39278793334961, "global_step": 93236, "epoch": 770} {"train_loss": -36.96633529663086, "global_step": 93237, "epoch": 770} {"train_loss": -37.45919418334961, "global_step": 93238, "epoch": 770} {"train_loss": -35.38422775268555, "global_step": 93239, "epoch": 770} {"train_loss": -37.007911682128906, "global_step": 93240, "epoch": 770} {"train_loss": -36.870635986328125, "global_step": 93241, "epoch": 770} {"train_loss": -36.28330612182617, "global_step": 93242, "epoch": 770} {"train_loss": -36.37677001953125, "global_step": 93243, "epoch": 770} {"train_loss": -34.937599182128906, "global_step": 93244, "epoch": 770} {"train_loss": -35.82893753051758, "global_step": 93245, "epoch": 770} {"train_loss": -36.78791427612305, "global_step": 93246, "epoch": 770} {"train_loss": -36.313236236572266, "global_step": 93247, "epoch": 770} {"train_loss": -36.158809661865234, "global_step": 93248, "epoch": 770} {"train_loss": -36.16048812866211, "global_step": 93249, "epoch": 770} {"train_loss": -36.72221755981445, "global_step": 93250, "epoch": 770} {"train_loss": -36.79255294799805, "global_step": 93251, "epoch": 770} {"train_loss": -35.94645309448242, "global_step": 93252, "epoch": 770} {"train_loss": -36.532283782958984, "global_step": 93253, "epoch": 770} {"train_loss": -36.20182800292969, "global_step": 93254, "epoch": 770} {"train_loss": -36.146488189697266, "global_step": 93255, "epoch": 770} {"train_loss": -35.2716178894043, "global_step": 93256, "epoch": 770} {"train_loss": -36.99277877807617, "global_step": 93257, "epoch": 770} {"train_loss": -37.630859375, "global_step": 93258, "epoch": 770} {"train_loss": -37.119384765625, "global_step": 93259, "epoch": 770} {"train_loss": -35.992740631103516, "global_step": 93260, "epoch": 770} {"train_loss": -37.85441207885742, "global_step": 93261, "epoch": 770} {"train_loss": -37.47907638549805, "global_step": 93262, "epoch": 770} {"train_loss": -37.21828842163086, "global_step": 93263, "epoch": 770} {"train_loss": -37.44147491455078, "global_step": 93264, "epoch": 770} {"train_loss": -36.5321159362793, "global_step": 93265, "epoch": 770} {"train_loss": -37.10477066040039, "global_step": 93266, "epoch": 770} {"train_loss": -36.7340202331543, "global_step": 93267, "epoch": 770} {"train_loss": -34.98780822753906, "global_step": 93268, "epoch": 770} {"train_loss": -37.3221549987793, "global_step": 93269, "epoch": 770} {"train_loss": -37.3554801940918, "global_step": 93270, "epoch": 770} {"train_loss": -36.60618209838867, "global_step": 93271, "epoch": 770} {"train_loss": -34.878265380859375, "global_step": 93272, "epoch": 770} {"train_loss": -29.55118751525879, "global_step": 93273, "epoch": 770} {"train_loss": -35.58675003051758, "global_step": 93274, "epoch": 770} {"train_loss": -36.28063201904297, "global_step": 93275, "epoch": 770} {"train_loss": -34.084957122802734, "global_step": 93276, "epoch": 770} {"train_loss": -34.670204162597656, "global_step": 93277, "epoch": 770} {"train_loss": -34.165321350097656, "global_step": 93278, "epoch": 770} {"train_loss": -33.37097930908203, "global_step": 93279, "epoch": 770} {"train_loss": -36.42734909057617, "global_step": 93280, "epoch": 770} {"train_loss": -35.38660430908203, "global_step": 93281, "epoch": 770} {"train_loss": -36.75919723510742, "global_step": 93282, "epoch": 770} {"train_loss": -35.93930435180664, "global_step": 93283, "epoch": 770} {"train_loss": -36.30022430419922, "global_step": 93284, "epoch": 770} {"train_loss": -36.13243865966797, "global_step": 93285, "epoch": 770} {"train_loss": -35.816322326660156, "global_step": 93286, "epoch": 770} {"train_loss": -33.408748626708984, "global_step": 93287, "epoch": 770} {"train_loss": -36.3114013671875, "global_step": 93288, "epoch": 770} {"train_loss": -35.82914352416992, "global_step": 93289, "epoch": 770} {"train_loss": -36.29184377686051, "global_step": 93290, "epoch": 770, "val_loss": 2560310.0} {"train_loss": -36.5620002746582, "global_step": 93291, "epoch": 771} {"train_loss": -37.08198928833008, "global_step": 93292, "epoch": 771} {"train_loss": -35.09148025512695, "global_step": 93293, "epoch": 771} {"train_loss": -37.11151123046875, "global_step": 93294, "epoch": 771} {"train_loss": -37.27445602416992, "global_step": 93295, "epoch": 771} {"train_loss": -37.58173751831055, "global_step": 93296, "epoch": 771} {"train_loss": -37.56154251098633, "global_step": 93297, "epoch": 771} {"train_loss": -37.283260345458984, "global_step": 93298, "epoch": 771} {"train_loss": -36.338958740234375, "global_step": 93299, "epoch": 771} {"train_loss": -36.29442596435547, "global_step": 93300, "epoch": 771} {"train_loss": -36.410675048828125, "global_step": 93301, "epoch": 771} {"train_loss": -37.156246185302734, "global_step": 93302, "epoch": 771} {"train_loss": -37.28095626831055, "global_step": 93303, "epoch": 771} {"train_loss": -37.57183837890625, "global_step": 93304, "epoch": 771} {"train_loss": -37.44075393676758, "global_step": 93305, "epoch": 771} {"train_loss": -37.634246826171875, "global_step": 93306, "epoch": 771} {"train_loss": -37.84367752075195, "global_step": 93307, "epoch": 771} {"train_loss": -36.7921028137207, "global_step": 93308, "epoch": 771} {"train_loss": -37.55580139160156, "global_step": 93309, "epoch": 771} {"train_loss": -37.39600372314453, "global_step": 93310, "epoch": 771} {"train_loss": -37.86084747314453, "global_step": 93311, "epoch": 771} {"train_loss": -37.9123420715332, "global_step": 93312, "epoch": 771} {"train_loss": -37.3510856628418, "global_step": 93313, "epoch": 771} {"train_loss": -38.1453742980957, "global_step": 93314, "epoch": 771} {"train_loss": -36.74854278564453, "global_step": 93315, "epoch": 771} {"train_loss": -35.84334182739258, "global_step": 93316, "epoch": 771} {"train_loss": -30.648529052734375, "global_step": 93317, "epoch": 771} {"train_loss": -32.65813064575195, "global_step": 93318, "epoch": 771} {"train_loss": -33.12563705444336, "global_step": 93319, "epoch": 771} {"train_loss": -36.909908294677734, "global_step": 93320, "epoch": 771} {"train_loss": -38.046443939208984, "global_step": 93321, "epoch": 771} {"train_loss": -35.62445831298828, "global_step": 93322, "epoch": 771} {"train_loss": -35.82270431518555, "global_step": 93323, "epoch": 771} {"train_loss": -36.41150665283203, "global_step": 93324, "epoch": 771} {"train_loss": -37.75947952270508, "global_step": 93325, "epoch": 771} {"train_loss": -37.36354064941406, "global_step": 93326, "epoch": 771} {"train_loss": -37.23015213012695, "global_step": 93327, "epoch": 771} {"train_loss": -37.89347457885742, "global_step": 93328, "epoch": 771} {"train_loss": -38.033302307128906, "global_step": 93329, "epoch": 771} {"train_loss": -37.74390411376953, "global_step": 93330, "epoch": 771} {"train_loss": -37.275604248046875, "global_step": 93331, "epoch": 771} {"train_loss": -37.617427825927734, "global_step": 93332, "epoch": 771} {"train_loss": -37.85725021362305, "global_step": 93333, "epoch": 771} {"train_loss": -36.210960388183594, "global_step": 93334, "epoch": 771} {"train_loss": -38.35189437866211, "global_step": 93335, "epoch": 771} {"train_loss": -38.42826461791992, "global_step": 93336, "epoch": 771} {"train_loss": -37.60080337524414, "global_step": 93337, "epoch": 771} {"train_loss": -37.86620330810547, "global_step": 93338, "epoch": 771} {"train_loss": -37.85933303833008, "global_step": 93339, "epoch": 771} {"train_loss": -37.96464157104492, "global_step": 93340, "epoch": 771} {"train_loss": -38.043251037597656, "global_step": 93341, "epoch": 771} {"train_loss": -37.766048431396484, "global_step": 93342, "epoch": 771} {"train_loss": -38.24333953857422, "global_step": 93343, "epoch": 771} {"train_loss": -37.60134506225586, "global_step": 93344, "epoch": 771} {"train_loss": -37.36509704589844, "global_step": 93345, "epoch": 771} {"train_loss": -38.56382369995117, "global_step": 93346, "epoch": 771} {"train_loss": -37.16913604736328, "global_step": 93347, "epoch": 771} {"train_loss": -37.314735412597656, "global_step": 93348, "epoch": 771} {"train_loss": -38.144874572753906, "global_step": 93349, "epoch": 771} {"train_loss": -37.84005355834961, "global_step": 93350, "epoch": 771} {"train_loss": -38.18645477294922, "global_step": 93351, "epoch": 771} {"train_loss": -37.6505126953125, "global_step": 93352, "epoch": 771} {"train_loss": -38.79146194458008, "global_step": 93353, "epoch": 771} {"train_loss": -37.8289909362793, "global_step": 93354, "epoch": 771} {"train_loss": -38.58286666870117, "global_step": 93355, "epoch": 771} {"train_loss": -38.006431579589844, "global_step": 93356, "epoch": 771} {"train_loss": -38.4335823059082, "global_step": 93357, "epoch": 771} {"train_loss": -38.393898010253906, "global_step": 93358, "epoch": 771} {"train_loss": -38.7489013671875, "global_step": 93359, "epoch": 771} {"train_loss": -38.563663482666016, "global_step": 93360, "epoch": 771} {"train_loss": -38.3278694152832, "global_step": 93361, "epoch": 771} {"train_loss": -38.75791549682617, "global_step": 93362, "epoch": 771} {"train_loss": -38.84499740600586, "global_step": 93363, "epoch": 771} {"train_loss": -38.7645378112793, "global_step": 93364, "epoch": 771} {"train_loss": -38.694881439208984, "global_step": 93365, "epoch": 771} {"train_loss": -38.210811614990234, "global_step": 93366, "epoch": 771} {"train_loss": -38.154327392578125, "global_step": 93367, "epoch": 771} {"train_loss": -37.614356994628906, "global_step": 93368, "epoch": 771} {"train_loss": -38.32979965209961, "global_step": 93369, "epoch": 771} {"train_loss": -38.811866760253906, "global_step": 93370, "epoch": 771} {"train_loss": -38.25075149536133, "global_step": 93371, "epoch": 771} {"train_loss": -39.05788803100586, "global_step": 93372, "epoch": 771} {"train_loss": -38.8004264831543, "global_step": 93373, "epoch": 771} {"train_loss": -37.15365219116211, "global_step": 93374, "epoch": 771} {"train_loss": -38.052398681640625, "global_step": 93375, "epoch": 771} {"train_loss": -37.25712966918945, "global_step": 93376, "epoch": 771} {"train_loss": -36.31232833862305, "global_step": 93377, "epoch": 771} {"train_loss": -38.560760498046875, "global_step": 93378, "epoch": 771} {"train_loss": -37.12636947631836, "global_step": 93379, "epoch": 771} {"train_loss": -35.40043258666992, "global_step": 93380, "epoch": 771} {"train_loss": -33.29142379760742, "global_step": 93381, "epoch": 771} {"train_loss": -30.35040283203125, "global_step": 93382, "epoch": 771} {"train_loss": -33.5969123840332, "global_step": 93383, "epoch": 771} {"train_loss": -37.37725830078125, "global_step": 93384, "epoch": 771} {"train_loss": -36.68410873413086, "global_step": 93385, "epoch": 771} {"train_loss": -34.43880844116211, "global_step": 93386, "epoch": 771} {"train_loss": -33.72861862182617, "global_step": 93387, "epoch": 771} {"train_loss": -36.29362869262695, "global_step": 93388, "epoch": 771} {"train_loss": -35.38251876831055, "global_step": 93389, "epoch": 771} {"train_loss": -34.59323501586914, "global_step": 93390, "epoch": 771} {"train_loss": -35.76700210571289, "global_step": 93391, "epoch": 771} {"train_loss": -36.25606155395508, "global_step": 93392, "epoch": 771} {"train_loss": -37.73530197143555, "global_step": 93393, "epoch": 771} {"train_loss": -36.66559600830078, "global_step": 93394, "epoch": 771} {"train_loss": -36.75773239135742, "global_step": 93395, "epoch": 771} {"train_loss": -37.2142219543457, "global_step": 93396, "epoch": 771} {"train_loss": -37.636627197265625, "global_step": 93397, "epoch": 771} {"train_loss": -37.7533073425293, "global_step": 93398, "epoch": 771} {"train_loss": -37.320892333984375, "global_step": 93399, "epoch": 771} {"train_loss": -37.87549591064453, "global_step": 93400, "epoch": 771} {"train_loss": -37.560546875, "global_step": 93401, "epoch": 771} {"train_loss": -37.50278854370117, "global_step": 93402, "epoch": 771} {"train_loss": -38.39786911010742, "global_step": 93403, "epoch": 771} {"train_loss": -37.759517669677734, "global_step": 93404, "epoch": 771} {"train_loss": -37.914466857910156, "global_step": 93405, "epoch": 771} {"train_loss": -37.6701774597168, "global_step": 93406, "epoch": 771} {"train_loss": -38.14254379272461, "global_step": 93407, "epoch": 771} {"train_loss": -38.02151107788086, "global_step": 93408, "epoch": 771} {"train_loss": -38.0114860534668, "global_step": 93409, "epoch": 771} {"train_loss": -37.9249382019043, "global_step": 93410, "epoch": 771} {"train_loss": -37.20573939173675, "global_step": 93411, "epoch": 771, "val_loss": 2513579.75} {"train_loss": -38.277320861816406, "global_step": 93412, "epoch": 772} {"train_loss": -37.557716369628906, "global_step": 93413, "epoch": 772} {"train_loss": -36.60804748535156, "global_step": 93414, "epoch": 772} {"train_loss": -37.60787582397461, "global_step": 93415, "epoch": 772} {"train_loss": -37.28105545043945, "global_step": 93416, "epoch": 772} {"train_loss": -38.051971435546875, "global_step": 93417, "epoch": 772} {"train_loss": -38.048458099365234, "global_step": 93418, "epoch": 772} {"train_loss": -38.10512161254883, "global_step": 93419, "epoch": 772} {"train_loss": -36.37135696411133, "global_step": 93420, "epoch": 772} {"train_loss": -38.099796295166016, "global_step": 93421, "epoch": 772} {"train_loss": -37.19252395629883, "global_step": 93422, "epoch": 772} {"train_loss": -37.80001449584961, "global_step": 93423, "epoch": 772} {"train_loss": -37.5921745300293, "global_step": 93424, "epoch": 772} {"train_loss": -37.895267486572266, "global_step": 93425, "epoch": 772} {"train_loss": -38.0422248840332, "global_step": 93426, "epoch": 772} {"train_loss": -36.862545013427734, "global_step": 93427, "epoch": 772} {"train_loss": -37.9959831237793, "global_step": 93428, "epoch": 772} {"train_loss": -37.40519332885742, "global_step": 93429, "epoch": 772} {"train_loss": -36.423736572265625, "global_step": 93430, "epoch": 772} {"train_loss": -37.89739227294922, "global_step": 93431, "epoch": 772} {"train_loss": -37.93703079223633, "global_step": 93432, "epoch": 772} {"train_loss": -36.99794006347656, "global_step": 93433, "epoch": 772} {"train_loss": -38.13555145263672, "global_step": 93434, "epoch": 772} {"train_loss": -38.334022521972656, "global_step": 93435, "epoch": 772} {"train_loss": -37.78828048706055, "global_step": 93436, "epoch": 772} {"train_loss": -37.840240478515625, "global_step": 93437, "epoch": 772} {"train_loss": -38.13809585571289, "global_step": 93438, "epoch": 772} {"train_loss": -37.85176467895508, "global_step": 93439, "epoch": 772} {"train_loss": -38.712337493896484, "global_step": 93440, "epoch": 772} {"train_loss": -38.84013748168945, "global_step": 93441, "epoch": 772} {"train_loss": -37.61670684814453, "global_step": 93442, "epoch": 772} {"train_loss": -38.631710052490234, "global_step": 93443, "epoch": 772} {"train_loss": -38.36973190307617, "global_step": 93444, "epoch": 772} {"train_loss": -38.99443817138672, "global_step": 93445, "epoch": 772} {"train_loss": -38.13930892944336, "global_step": 93446, "epoch": 772} {"train_loss": -38.26878356933594, "global_step": 93447, "epoch": 772} {"train_loss": -38.7779655456543, "global_step": 93448, "epoch": 772} {"train_loss": -38.02655792236328, "global_step": 93449, "epoch": 772} {"train_loss": -38.29070281982422, "global_step": 93450, "epoch": 772} {"train_loss": -38.51469802856445, "global_step": 93451, "epoch": 772} {"train_loss": -38.44209289550781, "global_step": 93452, "epoch": 772} {"train_loss": -38.43002700805664, "global_step": 93453, "epoch": 772} {"train_loss": -38.48322296142578, "global_step": 93454, "epoch": 772} {"train_loss": -38.02256393432617, "global_step": 93455, "epoch": 772} {"train_loss": -38.63885498046875, "global_step": 93456, "epoch": 772} {"train_loss": -39.20351791381836, "global_step": 93457, "epoch": 772} {"train_loss": -38.78742599487305, "global_step": 93458, "epoch": 772} {"train_loss": -37.90836715698242, "global_step": 93459, "epoch": 772} {"train_loss": -36.769508361816406, "global_step": 93460, "epoch": 772} {"train_loss": -37.77003860473633, "global_step": 93461, "epoch": 772} {"train_loss": -37.38090133666992, "global_step": 93462, "epoch": 772} {"train_loss": -38.21142578125, "global_step": 93463, "epoch": 772} {"train_loss": -38.03615188598633, "global_step": 93464, "epoch": 772} {"train_loss": -37.7253303527832, "global_step": 93465, "epoch": 772} {"train_loss": -38.306941986083984, "global_step": 93466, "epoch": 772} {"train_loss": -35.427608489990234, "global_step": 93467, "epoch": 772} {"train_loss": -35.69350814819336, "global_step": 93468, "epoch": 772} {"train_loss": -37.820960998535156, "global_step": 93469, "epoch": 772} {"train_loss": -37.71147537231445, "global_step": 93470, "epoch": 772} {"train_loss": -36.926902770996094, "global_step": 93471, "epoch": 772} {"train_loss": -37.19974899291992, "global_step": 93472, "epoch": 772} {"train_loss": -37.50139236450195, "global_step": 93473, "epoch": 772} {"train_loss": -37.92341995239258, "global_step": 93474, "epoch": 772} {"train_loss": -36.9838981628418, "global_step": 93475, "epoch": 772} {"train_loss": -37.558258056640625, "global_step": 93476, "epoch": 772} {"train_loss": -36.58173751831055, "global_step": 93477, "epoch": 772} {"train_loss": -37.584468841552734, "global_step": 93478, "epoch": 772} {"train_loss": -37.81331253051758, "global_step": 93479, "epoch": 772} {"train_loss": -37.87382507324219, "global_step": 93480, "epoch": 772} {"train_loss": -38.15495681762695, "global_step": 93481, "epoch": 772} {"train_loss": -38.11478805541992, "global_step": 93482, "epoch": 772} {"train_loss": -38.03311538696289, "global_step": 93483, "epoch": 772} {"train_loss": -37.497406005859375, "global_step": 93484, "epoch": 772} {"train_loss": -37.80086898803711, "global_step": 93485, "epoch": 772} {"train_loss": -38.14421463012695, "global_step": 93486, "epoch": 772} {"train_loss": -37.7874755859375, "global_step": 93487, "epoch": 772} {"train_loss": -38.43741989135742, "global_step": 93488, "epoch": 772} {"train_loss": -37.65558624267578, "global_step": 93489, "epoch": 772} {"train_loss": -38.265560150146484, "global_step": 93490, "epoch": 772} {"train_loss": -37.775306701660156, "global_step": 93491, "epoch": 772} {"train_loss": -36.92285919189453, "global_step": 93492, "epoch": 772} {"train_loss": -38.05668258666992, "global_step": 93493, "epoch": 772} {"train_loss": -37.59858322143555, "global_step": 93494, "epoch": 772} {"train_loss": -37.9852409362793, "global_step": 93495, "epoch": 772} {"train_loss": -38.865196228027344, "global_step": 93496, "epoch": 772} {"train_loss": -38.00193786621094, "global_step": 93497, "epoch": 772} {"train_loss": -37.858455657958984, "global_step": 93498, "epoch": 772} {"train_loss": -38.65863800048828, "global_step": 93499, "epoch": 772} {"train_loss": -38.89193344116211, "global_step": 93500, "epoch": 772} {"train_loss": -38.458526611328125, "global_step": 93501, "epoch": 772} {"train_loss": -38.67713165283203, "global_step": 93502, "epoch": 772} {"train_loss": -38.33232498168945, "global_step": 93503, "epoch": 772} {"train_loss": -38.269683837890625, "global_step": 93504, "epoch": 772} {"train_loss": -38.520320892333984, "global_step": 93505, "epoch": 772} {"train_loss": -38.62702178955078, "global_step": 93506, "epoch": 772} {"train_loss": -39.12419891357422, "global_step": 93507, "epoch": 772} {"train_loss": -38.650978088378906, "global_step": 93508, "epoch": 772} {"train_loss": -38.39277267456055, "global_step": 93509, "epoch": 772} {"train_loss": -38.4874382019043, "global_step": 93510, "epoch": 772} {"train_loss": -37.99747848510742, "global_step": 93511, "epoch": 772} {"train_loss": -38.7077751159668, "global_step": 93512, "epoch": 772} {"train_loss": -37.66395568847656, "global_step": 93513, "epoch": 772} {"train_loss": -36.93425369262695, "global_step": 93514, "epoch": 772} {"train_loss": -36.000640869140625, "global_step": 93515, "epoch": 772} {"train_loss": -34.646278381347656, "global_step": 93516, "epoch": 772} {"train_loss": -32.628692626953125, "global_step": 93517, "epoch": 772} {"train_loss": -34.786903381347656, "global_step": 93518, "epoch": 772} {"train_loss": -36.23191833496094, "global_step": 93519, "epoch": 772} {"train_loss": -37.806358337402344, "global_step": 93520, "epoch": 772} {"train_loss": -37.70620346069336, "global_step": 93521, "epoch": 772} {"train_loss": -36.38444900512695, "global_step": 93522, "epoch": 772} {"train_loss": -37.969234466552734, "global_step": 93523, "epoch": 772} {"train_loss": -38.3758659362793, "global_step": 93524, "epoch": 772} {"train_loss": -37.75228500366211, "global_step": 93525, "epoch": 772} {"train_loss": -37.29224395751953, "global_step": 93526, "epoch": 772} {"train_loss": -38.07208251953125, "global_step": 93527, "epoch": 772} {"train_loss": -37.1884765625, "global_step": 93528, "epoch": 772} {"train_loss": -38.32143020629883, "global_step": 93529, "epoch": 772} {"train_loss": -37.75980758666992, "global_step": 93530, "epoch": 772} {"train_loss": -38.43330001831055, "global_step": 93531, "epoch": 772} {"train_loss": -37.75464207672876, "global_step": 93532, "epoch": 772, "val_loss": 2469735.25} {"train_loss": -38.038692474365234, "global_step": 93533, "epoch": 773} {"train_loss": -37.76514434814453, "global_step": 93534, "epoch": 773} {"train_loss": -38.0076789855957, "global_step": 93535, "epoch": 773} {"train_loss": -38.474037170410156, "global_step": 93536, "epoch": 773} {"train_loss": -37.89494705200195, "global_step": 93537, "epoch": 773} {"train_loss": -37.467403411865234, "global_step": 93538, "epoch": 773} {"train_loss": -38.45632553100586, "global_step": 93539, "epoch": 773} {"train_loss": -38.39345169067383, "global_step": 93540, "epoch": 773} {"train_loss": -38.52470016479492, "global_step": 93541, "epoch": 773} {"train_loss": -38.37357711791992, "global_step": 93542, "epoch": 773} {"train_loss": -38.468902587890625, "global_step": 93543, "epoch": 773} {"train_loss": -38.25080108642578, "global_step": 93544, "epoch": 773} {"train_loss": -38.364654541015625, "global_step": 93545, "epoch": 773} {"train_loss": -37.47237777709961, "global_step": 93546, "epoch": 773} {"train_loss": -38.67832565307617, "global_step": 93547, "epoch": 773} {"train_loss": -38.73930358886719, "global_step": 93548, "epoch": 773} {"train_loss": -38.27596664428711, "global_step": 93549, "epoch": 773} {"train_loss": -38.71017074584961, "global_step": 93550, "epoch": 773} {"train_loss": -36.3176155090332, "global_step": 93551, "epoch": 773} {"train_loss": -36.55289840698242, "global_step": 93552, "epoch": 773} {"train_loss": -39.0897331237793, "global_step": 93553, "epoch": 773} {"train_loss": -38.49357223510742, "global_step": 93554, "epoch": 773} {"train_loss": -37.339027404785156, "global_step": 93555, "epoch": 773} {"train_loss": -37.50927734375, "global_step": 93556, "epoch": 773} {"train_loss": -36.8729248046875, "global_step": 93557, "epoch": 773} {"train_loss": -38.12795639038086, "global_step": 93558, "epoch": 773} {"train_loss": -37.86524200439453, "global_step": 93559, "epoch": 773} {"train_loss": -37.15497589111328, "global_step": 93560, "epoch": 773} {"train_loss": -38.15092086791992, "global_step": 93561, "epoch": 773} {"train_loss": -37.974647521972656, "global_step": 93562, "epoch": 773} {"train_loss": -37.2236328125, "global_step": 93563, "epoch": 773} {"train_loss": -38.7166862487793, "global_step": 93564, "epoch": 773} {"train_loss": -38.074989318847656, "global_step": 93565, "epoch": 773} {"train_loss": -35.537269592285156, "global_step": 93566, "epoch": 773} {"train_loss": -30.369882583618164, "global_step": 93567, "epoch": 773} {"train_loss": -37.46119689941406, "global_step": 93568, "epoch": 773} {"train_loss": -35.3469123840332, "global_step": 93569, "epoch": 773} {"train_loss": -34.969791412353516, "global_step": 93570, "epoch": 773} {"train_loss": -35.132911682128906, "global_step": 93571, "epoch": 773} {"train_loss": -34.97545623779297, "global_step": 93572, "epoch": 773} {"train_loss": -33.68524932861328, "global_step": 93573, "epoch": 773} {"train_loss": -35.75469207763672, "global_step": 93574, "epoch": 773} {"train_loss": -35.84048080444336, "global_step": 93575, "epoch": 773} {"train_loss": -36.45742416381836, "global_step": 93576, "epoch": 773} {"train_loss": -35.14760208129883, "global_step": 93577, "epoch": 773} {"train_loss": -36.25125503540039, "global_step": 93578, "epoch": 773} {"train_loss": -35.2969970703125, "global_step": 93579, "epoch": 773} {"train_loss": -34.99502944946289, "global_step": 93580, "epoch": 773} {"train_loss": -36.5961799621582, "global_step": 93581, "epoch": 773} {"train_loss": -36.637691497802734, "global_step": 93582, "epoch": 773} {"train_loss": -36.0937385559082, "global_step": 93583, "epoch": 773} {"train_loss": -35.9705696105957, "global_step": 93584, "epoch": 773} {"train_loss": -35.9105339050293, "global_step": 93585, "epoch": 773} {"train_loss": -35.496185302734375, "global_step": 93586, "epoch": 773} {"train_loss": -37.263397216796875, "global_step": 93587, "epoch": 773} {"train_loss": -36.542057037353516, "global_step": 93588, "epoch": 773} {"train_loss": -36.59049987792969, "global_step": 93589, "epoch": 773} {"train_loss": -35.73466873168945, "global_step": 93590, "epoch": 773} {"train_loss": -37.19854736328125, "global_step": 93591, "epoch": 773} {"train_loss": -36.30802536010742, "global_step": 93592, "epoch": 773} {"train_loss": -36.60095977783203, "global_step": 93593, "epoch": 773} {"train_loss": -36.961124420166016, "global_step": 93594, "epoch": 773} {"train_loss": -38.323822021484375, "global_step": 93595, "epoch": 773} {"train_loss": -36.47405242919922, "global_step": 93596, "epoch": 773} {"train_loss": -36.465755462646484, "global_step": 93597, "epoch": 773} {"train_loss": -37.71132278442383, "global_step": 93598, "epoch": 773} {"train_loss": -37.41572952270508, "global_step": 93599, "epoch": 773} {"train_loss": -37.7606315612793, "global_step": 93600, "epoch": 773} {"train_loss": -37.75707244873047, "global_step": 93601, "epoch": 773} {"train_loss": -38.034751892089844, "global_step": 93602, "epoch": 773} {"train_loss": -37.92961502075195, "global_step": 93603, "epoch": 773} {"train_loss": -38.180091857910156, "global_step": 93604, "epoch": 773} {"train_loss": -36.96149444580078, "global_step": 93605, "epoch": 773} {"train_loss": -35.53794479370117, "global_step": 93606, "epoch": 773} {"train_loss": -37.264583587646484, "global_step": 93607, "epoch": 773} {"train_loss": -37.86285400390625, "global_step": 93608, "epoch": 773} {"train_loss": -37.848175048828125, "global_step": 93609, "epoch": 773} {"train_loss": -37.99208068847656, "global_step": 93610, "epoch": 773} {"train_loss": -37.751319885253906, "global_step": 93611, "epoch": 773} {"train_loss": -38.072757720947266, "global_step": 93612, "epoch": 773} {"train_loss": -38.671566009521484, "global_step": 93613, "epoch": 773} {"train_loss": -38.49142074584961, "global_step": 93614, "epoch": 773} {"train_loss": -36.86842727661133, "global_step": 93615, "epoch": 773} {"train_loss": -37.956722259521484, "global_step": 93616, "epoch": 773} {"train_loss": -37.48747253417969, "global_step": 93617, "epoch": 773} {"train_loss": -38.289058685302734, "global_step": 93618, "epoch": 773} {"train_loss": -37.83964157104492, "global_step": 93619, "epoch": 773} {"train_loss": -36.3253173828125, "global_step": 93620, "epoch": 773} {"train_loss": -38.30024719238281, "global_step": 93621, "epoch": 773} {"train_loss": -37.58414840698242, "global_step": 93622, "epoch": 773} {"train_loss": -38.517452239990234, "global_step": 93623, "epoch": 773} {"train_loss": -38.194725036621094, "global_step": 93624, "epoch": 773} {"train_loss": -37.5006103515625, "global_step": 93625, "epoch": 773} {"train_loss": -38.492130279541016, "global_step": 93626, "epoch": 773} {"train_loss": -38.24762725830078, "global_step": 93627, "epoch": 773} {"train_loss": -37.048675537109375, "global_step": 93628, "epoch": 773} {"train_loss": -38.98594665527344, "global_step": 93629, "epoch": 773} {"train_loss": -38.821537017822266, "global_step": 93630, "epoch": 773} {"train_loss": -37.98163986206055, "global_step": 93631, "epoch": 773} {"train_loss": -37.6523323059082, "global_step": 93632, "epoch": 773} {"train_loss": -36.60678482055664, "global_step": 93633, "epoch": 773} {"train_loss": -37.9405403137207, "global_step": 93634, "epoch": 773} {"train_loss": -38.22340393066406, "global_step": 93635, "epoch": 773} {"train_loss": -36.77983856201172, "global_step": 93636, "epoch": 773} {"train_loss": -38.0130615234375, "global_step": 93637, "epoch": 773} {"train_loss": -37.883480072021484, "global_step": 93638, "epoch": 773} {"train_loss": -38.413429260253906, "global_step": 93639, "epoch": 773} {"train_loss": -37.71335983276367, "global_step": 93640, "epoch": 773} {"train_loss": -37.37595748901367, "global_step": 93641, "epoch": 773} {"train_loss": -37.9744758605957, "global_step": 93642, "epoch": 773} {"train_loss": -37.494300842285156, "global_step": 93643, "epoch": 773} {"train_loss": -37.22772216796875, "global_step": 93644, "epoch": 773} {"train_loss": -37.64753341674805, "global_step": 93645, "epoch": 773} {"train_loss": -37.43491744995117, "global_step": 93646, "epoch": 773} {"train_loss": -38.18672561645508, "global_step": 93647, "epoch": 773} {"train_loss": -37.862911224365234, "global_step": 93648, "epoch": 773} {"train_loss": -38.38840866088867, "global_step": 93649, "epoch": 773} {"train_loss": -38.315059661865234, "global_step": 93650, "epoch": 773} {"train_loss": -38.24323272705078, "global_step": 93651, "epoch": 773} {"train_loss": -36.14955139160156, "global_step": 93652, "epoch": 773} {"train_loss": -37.335637983211804, "global_step": 93653, "epoch": 773, "val_loss": 2625758.25} {"train_loss": -38.0027961730957, "global_step": 93654, "epoch": 774} {"train_loss": -37.769046783447266, "global_step": 93655, "epoch": 774} {"train_loss": -38.54629135131836, "global_step": 93656, "epoch": 774} {"train_loss": -38.18890380859375, "global_step": 93657, "epoch": 774} {"train_loss": -37.85280227661133, "global_step": 93658, "epoch": 774} {"train_loss": -37.51728439331055, "global_step": 93659, "epoch": 774} {"train_loss": -38.49111557006836, "global_step": 93660, "epoch": 774} {"train_loss": -36.020687103271484, "global_step": 93661, "epoch": 774} {"train_loss": -36.915523529052734, "global_step": 93662, "epoch": 774} {"train_loss": -35.803157806396484, "global_step": 93663, "epoch": 774} {"train_loss": -34.559112548828125, "global_step": 93664, "epoch": 774} {"train_loss": -37.679237365722656, "global_step": 93665, "epoch": 774} {"train_loss": -34.39655303955078, "global_step": 93666, "epoch": 774} {"train_loss": -28.610876083374023, "global_step": 93667, "epoch": 774} {"train_loss": -19.53348731994629, "global_step": 93668, "epoch": 774} {"train_loss": -21.699716567993164, "global_step": 93669, "epoch": 774} {"train_loss": -35.926177978515625, "global_step": 93670, "epoch": 774} {"train_loss": -29.247238159179688, "global_step": 93671, "epoch": 774} {"train_loss": -32.000240325927734, "global_step": 93672, "epoch": 774} {"train_loss": -32.330501556396484, "global_step": 93673, "epoch": 774} {"train_loss": -31.055469512939453, "global_step": 93674, "epoch": 774} {"train_loss": -32.70994186401367, "global_step": 93675, "epoch": 774} {"train_loss": -33.1429443359375, "global_step": 93676, "epoch": 774} {"train_loss": -34.23623275756836, "global_step": 93677, "epoch": 774} {"train_loss": -33.61115646362305, "global_step": 93678, "epoch": 774} {"train_loss": -34.60384750366211, "global_step": 93679, "epoch": 774} {"train_loss": -36.90681838989258, "global_step": 93680, "epoch": 774} {"train_loss": -34.338905334472656, "global_step": 93681, "epoch": 774} {"train_loss": -36.570167541503906, "global_step": 93682, "epoch": 774} {"train_loss": -35.030799865722656, "global_step": 93683, "epoch": 774} {"train_loss": -34.235069274902344, "global_step": 93684, "epoch": 774} {"train_loss": -36.80574417114258, "global_step": 93685, "epoch": 774} {"train_loss": -35.70248794555664, "global_step": 93686, "epoch": 774} {"train_loss": -35.89720916748047, "global_step": 93687, "epoch": 774} {"train_loss": -37.121803283691406, "global_step": 93688, "epoch": 774} {"train_loss": -35.594417572021484, "global_step": 93689, "epoch": 774} {"train_loss": -36.720855712890625, "global_step": 93690, "epoch": 774} {"train_loss": -37.12666702270508, "global_step": 93691, "epoch": 774} {"train_loss": -36.393798828125, "global_step": 93692, "epoch": 774} {"train_loss": -37.653564453125, "global_step": 93693, "epoch": 774} {"train_loss": -37.85149383544922, "global_step": 93694, "epoch": 774} {"train_loss": -37.40682601928711, "global_step": 93695, "epoch": 774} {"train_loss": -37.73745346069336, "global_step": 93696, "epoch": 774} {"train_loss": -37.588897705078125, "global_step": 93697, "epoch": 774} {"train_loss": -37.45358657836914, "global_step": 93698, "epoch": 774} {"train_loss": -37.18220520019531, "global_step": 93699, "epoch": 774} {"train_loss": -37.38731002807617, "global_step": 93700, "epoch": 774} {"train_loss": -37.68727493286133, "global_step": 93701, "epoch": 774} {"train_loss": -37.38436508178711, "global_step": 93702, "epoch": 774} {"train_loss": -37.75065994262695, "global_step": 93703, "epoch": 774} {"train_loss": -37.26935958862305, "global_step": 93704, "epoch": 774} {"train_loss": -37.8125, "global_step": 93705, "epoch": 774} {"train_loss": -37.68254470825195, "global_step": 93706, "epoch": 774} {"train_loss": -37.89558792114258, "global_step": 93707, "epoch": 774} {"train_loss": -38.27384567260742, "global_step": 93708, "epoch": 774} {"train_loss": -38.05012893676758, "global_step": 93709, "epoch": 774} {"train_loss": -38.178096771240234, "global_step": 93710, "epoch": 774} {"train_loss": -38.49144744873047, "global_step": 93711, "epoch": 774} {"train_loss": -37.82434844970703, "global_step": 93712, "epoch": 774} {"train_loss": -38.224239349365234, "global_step": 93713, "epoch": 774} {"train_loss": -38.043609619140625, "global_step": 93714, "epoch": 774} {"train_loss": -38.03622055053711, "global_step": 93715, "epoch": 774} {"train_loss": -38.10752487182617, "global_step": 93716, "epoch": 774} {"train_loss": -38.13591384887695, "global_step": 93717, "epoch": 774} {"train_loss": -38.15376663208008, "global_step": 93718, "epoch": 774} {"train_loss": -38.416690826416016, "global_step": 93719, "epoch": 774} {"train_loss": -38.381160736083984, "global_step": 93720, "epoch": 774} {"train_loss": -38.450584411621094, "global_step": 93721, "epoch": 774} {"train_loss": -38.61042404174805, "global_step": 93722, "epoch": 774} {"train_loss": -38.16164779663086, "global_step": 93723, "epoch": 774} {"train_loss": -37.96379089355469, "global_step": 93724, "epoch": 774} {"train_loss": -38.64931106567383, "global_step": 93725, "epoch": 774} {"train_loss": -38.5791130065918, "global_step": 93726, "epoch": 774} {"train_loss": -38.61821365356445, "global_step": 93727, "epoch": 774} {"train_loss": -37.90462875366211, "global_step": 93728, "epoch": 774} {"train_loss": -38.94547653198242, "global_step": 93729, "epoch": 774} {"train_loss": -38.6539306640625, "global_step": 93730, "epoch": 774} {"train_loss": -38.975189208984375, "global_step": 93731, "epoch": 774} {"train_loss": -38.77341842651367, "global_step": 93732, "epoch": 774} {"train_loss": -38.70566177368164, "global_step": 93733, "epoch": 774} {"train_loss": -38.7055778503418, "global_step": 93734, "epoch": 774} {"train_loss": -38.54300308227539, "global_step": 93735, "epoch": 774} {"train_loss": -38.309059143066406, "global_step": 93736, "epoch": 774} {"train_loss": -38.19698715209961, "global_step": 93737, "epoch": 774} {"train_loss": -39.01166915893555, "global_step": 93738, "epoch": 774} {"train_loss": -38.61534118652344, "global_step": 93739, "epoch": 774} {"train_loss": -37.815086364746094, "global_step": 93740, "epoch": 774} {"train_loss": -37.715938568115234, "global_step": 93741, "epoch": 774} {"train_loss": -38.8155517578125, "global_step": 93742, "epoch": 774} {"train_loss": -38.352901458740234, "global_step": 93743, "epoch": 774} {"train_loss": -38.79367446899414, "global_step": 93744, "epoch": 774} {"train_loss": -38.483001708984375, "global_step": 93745, "epoch": 774} {"train_loss": -38.777034759521484, "global_step": 93746, "epoch": 774} {"train_loss": -38.165889739990234, "global_step": 93747, "epoch": 774} {"train_loss": -38.37288284301758, "global_step": 93748, "epoch": 774} {"train_loss": -38.3388786315918, "global_step": 93749, "epoch": 774} {"train_loss": -37.9553108215332, "global_step": 93750, "epoch": 774} {"train_loss": -37.54784393310547, "global_step": 93751, "epoch": 774} {"train_loss": -35.91695785522461, "global_step": 93752, "epoch": 774} {"train_loss": -38.53108596801758, "global_step": 93753, "epoch": 774} {"train_loss": -37.84367370605469, "global_step": 93754, "epoch": 774} {"train_loss": -38.3757438659668, "global_step": 93755, "epoch": 774} {"train_loss": -37.390071868896484, "global_step": 93756, "epoch": 774} {"train_loss": -38.28346633911133, "global_step": 93757, "epoch": 774} {"train_loss": -37.07951736450195, "global_step": 93758, "epoch": 774} {"train_loss": -36.61631393432617, "global_step": 93759, "epoch": 774} {"train_loss": -34.23466110229492, "global_step": 93760, "epoch": 774} {"train_loss": -36.82454299926758, "global_step": 93761, "epoch": 774} {"train_loss": -36.55970764160156, "global_step": 93762, "epoch": 774} {"train_loss": -31.66291618347168, "global_step": 93763, "epoch": 774} {"train_loss": -37.53036117553711, "global_step": 93764, "epoch": 774} {"train_loss": -37.490745544433594, "global_step": 93765, "epoch": 774} {"train_loss": -36.23085403442383, "global_step": 93766, "epoch": 774} {"train_loss": -36.26461410522461, "global_step": 93767, "epoch": 774} {"train_loss": -36.79525375366211, "global_step": 93768, "epoch": 774} {"train_loss": -27.88543701171875, "global_step": 93769, "epoch": 774} {"train_loss": -37.026580810546875, "global_step": 93770, "epoch": 774} {"train_loss": -34.86695098876953, "global_step": 93771, "epoch": 774} {"train_loss": -30.436920166015625, "global_step": 93772, "epoch": 774} {"train_loss": -28.63031578063965, "global_step": 93773, "epoch": 774} {"train_loss": -36.45487652928376, "global_step": 93774, "epoch": 774, "val_loss": 2878752.0} {"train_loss": -29.78525161743164, "global_step": 93775, "epoch": 775} {"train_loss": -33.70732879638672, "global_step": 93776, "epoch": 775} {"train_loss": -13.454184532165527, "global_step": 93777, "epoch": 775} {"train_loss": -22.21767234802246, "global_step": 93778, "epoch": 775} {"train_loss": -29.20903968811035, "global_step": 93779, "epoch": 775} {"train_loss": -29.50661277770996, "global_step": 93780, "epoch": 775} {"train_loss": -25.28265380859375, "global_step": 93781, "epoch": 775} {"train_loss": -30.70598793029785, "global_step": 93782, "epoch": 775} {"train_loss": -28.367172241210938, "global_step": 93783, "epoch": 775} {"train_loss": -28.480859756469727, "global_step": 93784, "epoch": 775} {"train_loss": -29.557971954345703, "global_step": 93785, "epoch": 775} {"train_loss": -27.71970558166504, "global_step": 93786, "epoch": 775} {"train_loss": -29.689136505126953, "global_step": 93787, "epoch": 775} {"train_loss": -31.87917137145996, "global_step": 93788, "epoch": 775} {"train_loss": -31.53900718688965, "global_step": 93789, "epoch": 775} {"train_loss": -32.504432678222656, "global_step": 93790, "epoch": 775} {"train_loss": -30.430301666259766, "global_step": 93791, "epoch": 775} {"train_loss": -33.5948600769043, "global_step": 93792, "epoch": 775} {"train_loss": -32.194435119628906, "global_step": 93793, "epoch": 775} {"train_loss": -32.29110336303711, "global_step": 93794, "epoch": 775} {"train_loss": -32.84730911254883, "global_step": 93795, "epoch": 775} {"train_loss": -34.54771041870117, "global_step": 93796, "epoch": 775} {"train_loss": -33.178192138671875, "global_step": 93797, "epoch": 775} {"train_loss": -33.73264694213867, "global_step": 93798, "epoch": 775} {"train_loss": -33.77511215209961, "global_step": 93799, "epoch": 775} {"train_loss": -33.692718505859375, "global_step": 93800, "epoch": 775} {"train_loss": -34.01686477661133, "global_step": 93801, "epoch": 775} {"train_loss": -33.75224304199219, "global_step": 93802, "epoch": 775} {"train_loss": -33.711029052734375, "global_step": 93803, "epoch": 775} {"train_loss": -34.78242111206055, "global_step": 93804, "epoch": 775} {"train_loss": -34.63433837890625, "global_step": 93805, "epoch": 775} {"train_loss": -34.42457580566406, "global_step": 93806, "epoch": 775} {"train_loss": -34.3829345703125, "global_step": 93807, "epoch": 775} {"train_loss": -35.0522575378418, "global_step": 93808, "epoch": 775} {"train_loss": -34.6748161315918, "global_step": 93809, "epoch": 775} {"train_loss": -34.73843765258789, "global_step": 93810, "epoch": 775} {"train_loss": -35.12580490112305, "global_step": 93811, "epoch": 775} {"train_loss": -34.93583297729492, "global_step": 93812, "epoch": 775} {"train_loss": -34.98184585571289, "global_step": 93813, "epoch": 775} {"train_loss": -35.0298957824707, "global_step": 93814, "epoch": 775} {"train_loss": -35.06285095214844, "global_step": 93815, "epoch": 775} {"train_loss": -35.167720794677734, "global_step": 93816, "epoch": 775} {"train_loss": -35.34403610229492, "global_step": 93817, "epoch": 775} {"train_loss": -35.30958938598633, "global_step": 93818, "epoch": 775} {"train_loss": -35.91339874267578, "global_step": 93819, "epoch": 775} {"train_loss": -35.36996078491211, "global_step": 93820, "epoch": 775} {"train_loss": -35.6049919128418, "global_step": 93821, "epoch": 775} {"train_loss": -35.604671478271484, "global_step": 93822, "epoch": 775} {"train_loss": -34.8895263671875, "global_step": 93823, "epoch": 775} {"train_loss": -35.884918212890625, "global_step": 93824, "epoch": 775} {"train_loss": -35.92353439331055, "global_step": 93825, "epoch": 775} {"train_loss": -36.083003997802734, "global_step": 93826, "epoch": 775} {"train_loss": -35.78730392456055, "global_step": 93827, "epoch": 775} {"train_loss": -36.062007904052734, "global_step": 93828, "epoch": 775} {"train_loss": -36.278846740722656, "global_step": 93829, "epoch": 775} {"train_loss": -36.498939514160156, "global_step": 93830, "epoch": 775} {"train_loss": -36.19890213012695, "global_step": 93831, "epoch": 775} {"train_loss": -36.2603645324707, "global_step": 93832, "epoch": 775} {"train_loss": -36.02372360229492, "global_step": 93833, "epoch": 775} {"train_loss": -36.09701156616211, "global_step": 93834, "epoch": 775} {"train_loss": -36.1928825378418, "global_step": 93835, "epoch": 775} {"train_loss": -36.60111999511719, "global_step": 93836, "epoch": 775} {"train_loss": -36.477046966552734, "global_step": 93837, "epoch": 775} {"train_loss": -36.68640899658203, "global_step": 93838, "epoch": 775} {"train_loss": -36.60732650756836, "global_step": 93839, "epoch": 775} {"train_loss": -36.338130950927734, "global_step": 93840, "epoch": 775} {"train_loss": -36.42881393432617, "global_step": 93841, "epoch": 775} {"train_loss": -36.46879577636719, "global_step": 93842, "epoch": 775} {"train_loss": -36.638702392578125, "global_step": 93843, "epoch": 775} {"train_loss": -36.669769287109375, "global_step": 93844, "epoch": 775} {"train_loss": -36.90745162963867, "global_step": 93845, "epoch": 775} {"train_loss": -36.96207809448242, "global_step": 93846, "epoch": 775} {"train_loss": -36.90143966674805, "global_step": 93847, "epoch": 775} {"train_loss": -37.144874572753906, "global_step": 93848, "epoch": 775} {"train_loss": -36.76348876953125, "global_step": 93849, "epoch": 775} {"train_loss": -37.19837188720703, "global_step": 93850, "epoch": 775} {"train_loss": -36.795101165771484, "global_step": 93851, "epoch": 775} {"train_loss": -36.40608596801758, "global_step": 93852, "epoch": 775} {"train_loss": -36.95647048950195, "global_step": 93853, "epoch": 775} {"train_loss": -37.44892120361328, "global_step": 93854, "epoch": 775} {"train_loss": -37.40121078491211, "global_step": 93855, "epoch": 775} {"train_loss": -37.52460861206055, "global_step": 93856, "epoch": 775} {"train_loss": -37.39505386352539, "global_step": 93857, "epoch": 775} {"train_loss": -37.7366943359375, "global_step": 93858, "epoch": 775} {"train_loss": -37.136348724365234, "global_step": 93859, "epoch": 775} {"train_loss": -37.382747650146484, "global_step": 93860, "epoch": 775} {"train_loss": -37.50388717651367, "global_step": 93861, "epoch": 775} {"train_loss": -37.53957748413086, "global_step": 93862, "epoch": 775} {"train_loss": -37.878173828125, "global_step": 93863, "epoch": 775} {"train_loss": -37.13089370727539, "global_step": 93864, "epoch": 775} {"train_loss": -36.02749252319336, "global_step": 93865, "epoch": 775} {"train_loss": -37.24407196044922, "global_step": 93866, "epoch": 775} {"train_loss": -37.367340087890625, "global_step": 93867, "epoch": 775} {"train_loss": -37.72966003417969, "global_step": 93868, "epoch": 775} {"train_loss": -37.98868942260742, "global_step": 93869, "epoch": 775} {"train_loss": -37.44853591918945, "global_step": 93870, "epoch": 775} {"train_loss": -37.91584014892578, "global_step": 93871, "epoch": 775} {"train_loss": -37.23843002319336, "global_step": 93872, "epoch": 775} {"train_loss": -38.11249542236328, "global_step": 93873, "epoch": 775} {"train_loss": -37.20183563232422, "global_step": 93874, "epoch": 775} {"train_loss": -37.50985336303711, "global_step": 93875, "epoch": 775} {"train_loss": -38.172237396240234, "global_step": 93876, "epoch": 775} {"train_loss": -36.991485595703125, "global_step": 93877, "epoch": 775} {"train_loss": -37.70886993408203, "global_step": 93878, "epoch": 775} {"train_loss": -36.77210235595703, "global_step": 93879, "epoch": 775} {"train_loss": -37.27710723876953, "global_step": 93880, "epoch": 775} {"train_loss": -37.891231536865234, "global_step": 93881, "epoch": 775} {"train_loss": -38.0084114074707, "global_step": 93882, "epoch": 775} {"train_loss": -37.29582595825195, "global_step": 93883, "epoch": 775} {"train_loss": -37.715171813964844, "global_step": 93884, "epoch": 775} {"train_loss": -37.774417877197266, "global_step": 93885, "epoch": 775} {"train_loss": -37.80671310424805, "global_step": 93886, "epoch": 775} {"train_loss": -37.272823333740234, "global_step": 93887, "epoch": 775} {"train_loss": -37.384891510009766, "global_step": 93888, "epoch": 775} {"train_loss": -36.65604782104492, "global_step": 93889, "epoch": 775} {"train_loss": -34.281219482421875, "global_step": 93890, "epoch": 775} {"train_loss": -33.2646598815918, "global_step": 93891, "epoch": 775} {"train_loss": -32.586158752441406, "global_step": 93892, "epoch": 775} {"train_loss": -34.720035552978516, "global_step": 93893, "epoch": 775} {"train_loss": -36.98945236206055, "global_step": 93894, "epoch": 775} {"train_loss": -35.02877315016818, "global_step": 93895, "epoch": 775, "val_loss": 2572297.25} {"train_loss": -36.670692443847656, "global_step": 93896, "epoch": 776} {"train_loss": -35.503662109375, "global_step": 93897, "epoch": 776} {"train_loss": -37.10834884643555, "global_step": 93898, "epoch": 776} {"train_loss": -36.736263275146484, "global_step": 93899, "epoch": 776} {"train_loss": -35.599605560302734, "global_step": 93900, "epoch": 776} {"train_loss": -36.59278106689453, "global_step": 93901, "epoch": 776} {"train_loss": -36.97495651245117, "global_step": 93902, "epoch": 776} {"train_loss": -35.859901428222656, "global_step": 93903, "epoch": 776} {"train_loss": -38.04706954956055, "global_step": 93904, "epoch": 776} {"train_loss": -36.511688232421875, "global_step": 93905, "epoch": 776} {"train_loss": -37.357784271240234, "global_step": 93906, "epoch": 776} {"train_loss": -37.83465576171875, "global_step": 93907, "epoch": 776} {"train_loss": -36.82538986206055, "global_step": 93908, "epoch": 776} {"train_loss": -37.065372467041016, "global_step": 93909, "epoch": 776} {"train_loss": -36.39926528930664, "global_step": 93910, "epoch": 776} {"train_loss": -38.022151947021484, "global_step": 93911, "epoch": 776} {"train_loss": -37.393924713134766, "global_step": 93912, "epoch": 776} {"train_loss": -36.66679763793945, "global_step": 93913, "epoch": 776} {"train_loss": -38.013153076171875, "global_step": 93914, "epoch": 776} {"train_loss": -37.05241775512695, "global_step": 93915, "epoch": 776} {"train_loss": -37.822750091552734, "global_step": 93916, "epoch": 776} {"train_loss": -37.43172073364258, "global_step": 93917, "epoch": 776} {"train_loss": -38.19498825073242, "global_step": 93918, "epoch": 776} {"train_loss": -37.62228775024414, "global_step": 93919, "epoch": 776} {"train_loss": -38.15861892700195, "global_step": 93920, "epoch": 776} {"train_loss": -38.078887939453125, "global_step": 93921, "epoch": 776} {"train_loss": -37.81146240234375, "global_step": 93922, "epoch": 776} {"train_loss": -38.00115203857422, "global_step": 93923, "epoch": 776} {"train_loss": -37.734371185302734, "global_step": 93924, "epoch": 776} {"train_loss": -37.89043426513672, "global_step": 93925, "epoch": 776} {"train_loss": -37.30996322631836, "global_step": 93926, "epoch": 776} {"train_loss": -37.364532470703125, "global_step": 93927, "epoch": 776} {"train_loss": -37.513362884521484, "global_step": 93928, "epoch": 776} {"train_loss": -37.750484466552734, "global_step": 93929, "epoch": 776} {"train_loss": -36.428619384765625, "global_step": 93930, "epoch": 776} {"train_loss": -32.481353759765625, "global_step": 93931, "epoch": 776} {"train_loss": -32.90177536010742, "global_step": 93932, "epoch": 776} {"train_loss": -36.02922058105469, "global_step": 93933, "epoch": 776} {"train_loss": -35.759151458740234, "global_step": 93934, "epoch": 776} {"train_loss": -36.547359466552734, "global_step": 93935, "epoch": 776} {"train_loss": -32.40925216674805, "global_step": 93936, "epoch": 776} {"train_loss": -34.0836067199707, "global_step": 93937, "epoch": 776} {"train_loss": -31.43837547302246, "global_step": 93938, "epoch": 776} {"train_loss": -35.32119369506836, "global_step": 93939, "epoch": 776} {"train_loss": -32.362709045410156, "global_step": 93940, "epoch": 776} {"train_loss": -36.12661361694336, "global_step": 93941, "epoch": 776} {"train_loss": -33.431278228759766, "global_step": 93942, "epoch": 776} {"train_loss": -35.4574089050293, "global_step": 93943, "epoch": 776} {"train_loss": -35.039756774902344, "global_step": 93944, "epoch": 776} {"train_loss": -35.225433349609375, "global_step": 93945, "epoch": 776} {"train_loss": -36.07732391357422, "global_step": 93946, "epoch": 776} {"train_loss": -36.365848541259766, "global_step": 93947, "epoch": 776} {"train_loss": -36.07192611694336, "global_step": 93948, "epoch": 776} {"train_loss": -34.192710876464844, "global_step": 93949, "epoch": 776} {"train_loss": -37.27199935913086, "global_step": 93950, "epoch": 776} {"train_loss": -36.82822799682617, "global_step": 93951, "epoch": 776} {"train_loss": -35.371437072753906, "global_step": 93952, "epoch": 776} {"train_loss": -35.79484176635742, "global_step": 93953, "epoch": 776} {"train_loss": -36.52027130126953, "global_step": 93954, "epoch": 776} {"train_loss": -36.893898010253906, "global_step": 93955, "epoch": 776} {"train_loss": -37.09313201904297, "global_step": 93956, "epoch": 776} {"train_loss": -36.0489501953125, "global_step": 93957, "epoch": 776} {"train_loss": -36.85292434692383, "global_step": 93958, "epoch": 776} {"train_loss": -37.02710723876953, "global_step": 93959, "epoch": 776} {"train_loss": -37.13485336303711, "global_step": 93960, "epoch": 776} {"train_loss": -37.618629455566406, "global_step": 93961, "epoch": 776} {"train_loss": -36.71855926513672, "global_step": 93962, "epoch": 776} {"train_loss": -37.23194122314453, "global_step": 93963, "epoch": 776} {"train_loss": -37.477935791015625, "global_step": 93964, "epoch": 776} {"train_loss": -37.71626663208008, "global_step": 93965, "epoch": 776} {"train_loss": -37.266082763671875, "global_step": 93966, "epoch": 776} {"train_loss": -38.08717346191406, "global_step": 93967, "epoch": 776} {"train_loss": -37.49155807495117, "global_step": 93968, "epoch": 776} {"train_loss": -37.80514144897461, "global_step": 93969, "epoch": 776} {"train_loss": -38.03261947631836, "global_step": 93970, "epoch": 776} {"train_loss": -37.518009185791016, "global_step": 93971, "epoch": 776} {"train_loss": -37.95295333862305, "global_step": 93972, "epoch": 776} {"train_loss": -38.06406021118164, "global_step": 93973, "epoch": 776} {"train_loss": -37.30323028564453, "global_step": 93974, "epoch": 776} {"train_loss": -37.90776443481445, "global_step": 93975, "epoch": 776} {"train_loss": -37.97652053833008, "global_step": 93976, "epoch": 776} {"train_loss": -37.55317306518555, "global_step": 93977, "epoch": 776} {"train_loss": -38.05825424194336, "global_step": 93978, "epoch": 776} {"train_loss": -38.29730224609375, "global_step": 93979, "epoch": 776} {"train_loss": -37.37588119506836, "global_step": 93980, "epoch": 776} {"train_loss": -38.11902618408203, "global_step": 93981, "epoch": 776} {"train_loss": -38.3370475769043, "global_step": 93982, "epoch": 776} {"train_loss": -38.26156234741211, "global_step": 93983, "epoch": 776} {"train_loss": -38.30535888671875, "global_step": 93984, "epoch": 776} {"train_loss": -38.45858383178711, "global_step": 93985, "epoch": 776} {"train_loss": -38.421878814697266, "global_step": 93986, "epoch": 776} {"train_loss": -38.50495529174805, "global_step": 93987, "epoch": 776} {"train_loss": -38.54059600830078, "global_step": 93988, "epoch": 776} {"train_loss": -38.46464920043945, "global_step": 93989, "epoch": 776} {"train_loss": -38.71330642700195, "global_step": 93990, "epoch": 776} {"train_loss": -38.63630294799805, "global_step": 93991, "epoch": 776} {"train_loss": -38.22286605834961, "global_step": 93992, "epoch": 776} {"train_loss": -38.721805572509766, "global_step": 93993, "epoch": 776} {"train_loss": -38.71519088745117, "global_step": 93994, "epoch": 776} {"train_loss": -38.5712890625, "global_step": 93995, "epoch": 776} {"train_loss": -38.77096176147461, "global_step": 93996, "epoch": 776} {"train_loss": -39.028255462646484, "global_step": 93997, "epoch": 776} {"train_loss": -38.721614837646484, "global_step": 93998, "epoch": 776} {"train_loss": -38.481178283691406, "global_step": 93999, "epoch": 776} {"train_loss": -38.8063850402832, "global_step": 94000, "epoch": 776} {"train_loss": -38.71223068237305, "global_step": 94001, "epoch": 776} {"train_loss": -38.54923629760742, "global_step": 94002, "epoch": 776} {"train_loss": -38.70539474487305, "global_step": 94003, "epoch": 776} {"train_loss": -37.65629959106445, "global_step": 94004, "epoch": 776} {"train_loss": -38.42396926879883, "global_step": 94005, "epoch": 776} {"train_loss": -38.76050567626953, "global_step": 94006, "epoch": 776} {"train_loss": -38.659454345703125, "global_step": 94007, "epoch": 776} {"train_loss": -37.550838470458984, "global_step": 94008, "epoch": 776} {"train_loss": -35.95454406738281, "global_step": 94009, "epoch": 776} {"train_loss": -30.4229793548584, "global_step": 94010, "epoch": 776} {"train_loss": -22.150190353393555, "global_step": 94011, "epoch": 776} {"train_loss": -24.47150230407715, "global_step": 94012, "epoch": 776} {"train_loss": -34.418174743652344, "global_step": 94013, "epoch": 776} {"train_loss": -35.544307708740234, "global_step": 94014, "epoch": 776} {"train_loss": -22.01335906982422, "global_step": 94015, "epoch": 776} {"train_loss": -36.580353208809846, "global_step": 94016, "epoch": 776, "val_loss": 2603543.25} {"train_loss": -31.206329345703125, "global_step": 94017, "epoch": 777} {"train_loss": -33.88485336303711, "global_step": 94018, "epoch": 777} {"train_loss": -32.37179183959961, "global_step": 94019, "epoch": 777} {"train_loss": -32.25812530517578, "global_step": 94020, "epoch": 777} {"train_loss": -35.68351745605469, "global_step": 94021, "epoch": 777} {"train_loss": -36.061737060546875, "global_step": 94022, "epoch": 777} {"train_loss": -35.16450881958008, "global_step": 94023, "epoch": 777} {"train_loss": -35.38319778442383, "global_step": 94024, "epoch": 777} {"train_loss": -37.072444915771484, "global_step": 94025, "epoch": 777} {"train_loss": -35.58098220825195, "global_step": 94026, "epoch": 777} {"train_loss": -37.26245880126953, "global_step": 94027, "epoch": 777} {"train_loss": -36.5644416809082, "global_step": 94028, "epoch": 777} {"train_loss": -36.930545806884766, "global_step": 94029, "epoch": 777} {"train_loss": -36.89234924316406, "global_step": 94030, "epoch": 777} {"train_loss": -36.67817306518555, "global_step": 94031, "epoch": 777} {"train_loss": -37.417640686035156, "global_step": 94032, "epoch": 777} {"train_loss": -36.810020446777344, "global_step": 94033, "epoch": 777} {"train_loss": -37.64139175415039, "global_step": 94034, "epoch": 777} {"train_loss": -37.47072219848633, "global_step": 94035, "epoch": 777} {"train_loss": -37.23112106323242, "global_step": 94036, "epoch": 777} {"train_loss": -37.638587951660156, "global_step": 94037, "epoch": 777} {"train_loss": -36.927513122558594, "global_step": 94038, "epoch": 777} {"train_loss": -37.62321472167969, "global_step": 94039, "epoch": 777} {"train_loss": -37.46484375, "global_step": 94040, "epoch": 777} {"train_loss": -37.7168083190918, "global_step": 94041, "epoch": 777} {"train_loss": -37.82809066772461, "global_step": 94042, "epoch": 777} {"train_loss": -38.237022399902344, "global_step": 94043, "epoch": 777} {"train_loss": -37.398597717285156, "global_step": 94044, "epoch": 777} {"train_loss": -38.067665100097656, "global_step": 94045, "epoch": 777} {"train_loss": -38.174747467041016, "global_step": 94046, "epoch": 777} {"train_loss": -37.787025451660156, "global_step": 94047, "epoch": 777} {"train_loss": -37.76534652709961, "global_step": 94048, "epoch": 777} {"train_loss": -37.83865737915039, "global_step": 94049, "epoch": 777} {"train_loss": -37.9139404296875, "global_step": 94050, "epoch": 777} {"train_loss": -38.060482025146484, "global_step": 94051, "epoch": 777} {"train_loss": -38.04086685180664, "global_step": 94052, "epoch": 777} {"train_loss": -37.90940475463867, "global_step": 94053, "epoch": 777} {"train_loss": -37.924644470214844, "global_step": 94054, "epoch": 777} {"train_loss": -38.46584701538086, "global_step": 94055, "epoch": 777} {"train_loss": -37.99738311767578, "global_step": 94056, "epoch": 777} {"train_loss": -38.260440826416016, "global_step": 94057, "epoch": 777} {"train_loss": -37.9332389831543, "global_step": 94058, "epoch": 777} {"train_loss": -38.2592887878418, "global_step": 94059, "epoch": 777} {"train_loss": -38.395355224609375, "global_step": 94060, "epoch": 777} {"train_loss": -38.4415168762207, "global_step": 94061, "epoch": 777} {"train_loss": -38.365047454833984, "global_step": 94062, "epoch": 777} {"train_loss": -38.83544921875, "global_step": 94063, "epoch": 777} {"train_loss": -38.4940071105957, "global_step": 94064, "epoch": 777} {"train_loss": -38.36181640625, "global_step": 94065, "epoch": 777} {"train_loss": -38.383541107177734, "global_step": 94066, "epoch": 777} {"train_loss": -38.36648178100586, "global_step": 94067, "epoch": 777} {"train_loss": -38.56167221069336, "global_step": 94068, "epoch": 777} {"train_loss": -38.674049377441406, "global_step": 94069, "epoch": 777} {"train_loss": -38.31557846069336, "global_step": 94070, "epoch": 777} {"train_loss": -37.96044921875, "global_step": 94071, "epoch": 777} {"train_loss": -38.64985656738281, "global_step": 94072, "epoch": 777} {"train_loss": -38.139198303222656, "global_step": 94073, "epoch": 777} {"train_loss": -38.21437454223633, "global_step": 94074, "epoch": 777} {"train_loss": -37.514984130859375, "global_step": 94075, "epoch": 777} {"train_loss": -37.088401794433594, "global_step": 94076, "epoch": 777} {"train_loss": -37.393428802490234, "global_step": 94077, "epoch": 777} {"train_loss": -37.16524124145508, "global_step": 94078, "epoch": 777} {"train_loss": -37.32481002807617, "global_step": 94079, "epoch": 777} {"train_loss": -36.374366760253906, "global_step": 94080, "epoch": 777} {"train_loss": -35.3309440612793, "global_step": 94081, "epoch": 777} {"train_loss": -35.72294998168945, "global_step": 94082, "epoch": 777} {"train_loss": -36.518104553222656, "global_step": 94083, "epoch": 777} {"train_loss": -38.185054779052734, "global_step": 94084, "epoch": 777} {"train_loss": -38.160804748535156, "global_step": 94085, "epoch": 777} {"train_loss": -37.24262619018555, "global_step": 94086, "epoch": 777} {"train_loss": -37.28468704223633, "global_step": 94087, "epoch": 777} {"train_loss": -37.90351104736328, "global_step": 94088, "epoch": 777} {"train_loss": -37.56611251831055, "global_step": 94089, "epoch": 777} {"train_loss": -38.199485778808594, "global_step": 94090, "epoch": 777} {"train_loss": -37.52334976196289, "global_step": 94091, "epoch": 777} {"train_loss": -38.34491729736328, "global_step": 94092, "epoch": 777} {"train_loss": -37.036922454833984, "global_step": 94093, "epoch": 777} {"train_loss": -37.35173034667969, "global_step": 94094, "epoch": 777} {"train_loss": -37.89335250854492, "global_step": 94095, "epoch": 777} {"train_loss": -38.19841384887695, "global_step": 94096, "epoch": 777} {"train_loss": -37.87092971801758, "global_step": 94097, "epoch": 777} {"train_loss": -36.99959945678711, "global_step": 94098, "epoch": 777} {"train_loss": -37.886539459228516, "global_step": 94099, "epoch": 777} {"train_loss": -37.66621398925781, "global_step": 94100, "epoch": 777} {"train_loss": -38.40644073486328, "global_step": 94101, "epoch": 777} {"train_loss": -38.46889114379883, "global_step": 94102, "epoch": 777} {"train_loss": -38.230552673339844, "global_step": 94103, "epoch": 777} {"train_loss": -38.17005157470703, "global_step": 94104, "epoch": 777} {"train_loss": -37.69328308105469, "global_step": 94105, "epoch": 777} {"train_loss": -38.131771087646484, "global_step": 94106, "epoch": 777} {"train_loss": -38.0400505065918, "global_step": 94107, "epoch": 777} {"train_loss": -37.44072723388672, "global_step": 94108, "epoch": 777} {"train_loss": -37.90904235839844, "global_step": 94109, "epoch": 777} {"train_loss": -36.85633087158203, "global_step": 94110, "epoch": 777} {"train_loss": -37.64105224609375, "global_step": 94111, "epoch": 777} {"train_loss": -37.483280181884766, "global_step": 94112, "epoch": 777} {"train_loss": -37.84406280517578, "global_step": 94113, "epoch": 777} {"train_loss": -38.06935501098633, "global_step": 94114, "epoch": 777} {"train_loss": -37.91455841064453, "global_step": 94115, "epoch": 777} {"train_loss": -38.164913177490234, "global_step": 94116, "epoch": 777} {"train_loss": -38.19076156616211, "global_step": 94117, "epoch": 777} {"train_loss": -37.42132568359375, "global_step": 94118, "epoch": 777} {"train_loss": -37.88187789916992, "global_step": 94119, "epoch": 777} {"train_loss": -38.00161361694336, "global_step": 94120, "epoch": 777} {"train_loss": -37.746429443359375, "global_step": 94121, "epoch": 777} {"train_loss": -37.054847717285156, "global_step": 94122, "epoch": 777} {"train_loss": -37.039833068847656, "global_step": 94123, "epoch": 777} {"train_loss": -37.3607063293457, "global_step": 94124, "epoch": 777} {"train_loss": -38.414493560791016, "global_step": 94125, "epoch": 777} {"train_loss": -38.097450256347656, "global_step": 94126, "epoch": 777} {"train_loss": -38.18873977661133, "global_step": 94127, "epoch": 777} {"train_loss": -38.52462387084961, "global_step": 94128, "epoch": 777} {"train_loss": -37.6963005065918, "global_step": 94129, "epoch": 777} {"train_loss": -37.245277404785156, "global_step": 94130, "epoch": 777} {"train_loss": -37.15119171142578, "global_step": 94131, "epoch": 777} {"train_loss": -38.308921813964844, "global_step": 94132, "epoch": 777} {"train_loss": -37.95034408569336, "global_step": 94133, "epoch": 777} {"train_loss": -38.359493255615234, "global_step": 94134, "epoch": 777} {"train_loss": -38.13321304321289, "global_step": 94135, "epoch": 777} {"train_loss": -36.8892707824707, "global_step": 94136, "epoch": 777} {"train_loss": -37.4633207399983, "global_step": 94137, "epoch": 777, "val_loss": 2646745.0} {"train_loss": -36.59386444091797, "global_step": 94138, "epoch": 778} {"train_loss": -38.44165802001953, "global_step": 94139, "epoch": 778} {"train_loss": -36.896602630615234, "global_step": 94140, "epoch": 778} {"train_loss": -35.75543212890625, "global_step": 94141, "epoch": 778} {"train_loss": -36.50748062133789, "global_step": 94142, "epoch": 778} {"train_loss": -35.91469955444336, "global_step": 94143, "epoch": 778} {"train_loss": -36.83071517944336, "global_step": 94144, "epoch": 778} {"train_loss": -38.043914794921875, "global_step": 94145, "epoch": 778} {"train_loss": -36.98524856567383, "global_step": 94146, "epoch": 778} {"train_loss": -36.891517639160156, "global_step": 94147, "epoch": 778} {"train_loss": -38.05119323730469, "global_step": 94148, "epoch": 778} {"train_loss": -37.4556999206543, "global_step": 94149, "epoch": 778} {"train_loss": -37.2398796081543, "global_step": 94150, "epoch": 778} {"train_loss": -37.531185150146484, "global_step": 94151, "epoch": 778} {"train_loss": -37.47652816772461, "global_step": 94152, "epoch": 778} {"train_loss": -35.85627746582031, "global_step": 94153, "epoch": 778} {"train_loss": -37.664058685302734, "global_step": 94154, "epoch": 778} {"train_loss": -38.084136962890625, "global_step": 94155, "epoch": 778} {"train_loss": -37.6908073425293, "global_step": 94156, "epoch": 778} {"train_loss": -37.79175567626953, "global_step": 94157, "epoch": 778} {"train_loss": -37.6221809387207, "global_step": 94158, "epoch": 778} {"train_loss": -37.46671676635742, "global_step": 94159, "epoch": 778} {"train_loss": -38.474945068359375, "global_step": 94160, "epoch": 778} {"train_loss": -37.66774368286133, "global_step": 94161, "epoch": 778} {"train_loss": -38.035789489746094, "global_step": 94162, "epoch": 778} {"train_loss": -37.166542053222656, "global_step": 94163, "epoch": 778} {"train_loss": -38.06753158569336, "global_step": 94164, "epoch": 778} {"train_loss": -36.96975326538086, "global_step": 94165, "epoch": 778} {"train_loss": -37.32015609741211, "global_step": 94166, "epoch": 778} {"train_loss": -37.35012435913086, "global_step": 94167, "epoch": 778} {"train_loss": -37.0542106628418, "global_step": 94168, "epoch": 778} {"train_loss": -37.63847351074219, "global_step": 94169, "epoch": 778} {"train_loss": -36.5045280456543, "global_step": 94170, "epoch": 778} {"train_loss": -38.645042419433594, "global_step": 94171, "epoch": 778} {"train_loss": -37.567745208740234, "global_step": 94172, "epoch": 778} {"train_loss": -37.23158645629883, "global_step": 94173, "epoch": 778} {"train_loss": -38.253334045410156, "global_step": 94174, "epoch": 778} {"train_loss": -37.484283447265625, "global_step": 94175, "epoch": 778} {"train_loss": -35.09479904174805, "global_step": 94176, "epoch": 778} {"train_loss": -38.3343505859375, "global_step": 94177, "epoch": 778} {"train_loss": -36.58700942993164, "global_step": 94178, "epoch": 778} {"train_loss": -37.734107971191406, "global_step": 94179, "epoch": 778} {"train_loss": -37.27325439453125, "global_step": 94180, "epoch": 778} {"train_loss": -36.911048889160156, "global_step": 94181, "epoch": 778} {"train_loss": -37.35200500488281, "global_step": 94182, "epoch": 778} {"train_loss": -37.05103302001953, "global_step": 94183, "epoch": 778} {"train_loss": -36.888912200927734, "global_step": 94184, "epoch": 778} {"train_loss": -37.6236686706543, "global_step": 94185, "epoch": 778} {"train_loss": -37.57265090942383, "global_step": 94186, "epoch": 778} {"train_loss": -38.013397216796875, "global_step": 94187, "epoch": 778} {"train_loss": -37.73404312133789, "global_step": 94188, "epoch": 778} {"train_loss": -37.001495361328125, "global_step": 94189, "epoch": 778} {"train_loss": -38.12160873413086, "global_step": 94190, "epoch": 778} {"train_loss": -36.811397552490234, "global_step": 94191, "epoch": 778} {"train_loss": -37.037696838378906, "global_step": 94192, "epoch": 778} {"train_loss": -34.5457878112793, "global_step": 94193, "epoch": 778} {"train_loss": -34.487525939941406, "global_step": 94194, "epoch": 778} {"train_loss": -31.49720573425293, "global_step": 94195, "epoch": 778} {"train_loss": -36.51332473754883, "global_step": 94196, "epoch": 778} {"train_loss": -36.7505989074707, "global_step": 94197, "epoch": 778} {"train_loss": -37.33246994018555, "global_step": 94198, "epoch": 778} {"train_loss": -36.344459533691406, "global_step": 94199, "epoch": 778} {"train_loss": -32.23380661010742, "global_step": 94200, "epoch": 778} {"train_loss": -36.388526916503906, "global_step": 94201, "epoch": 778} {"train_loss": -36.95766830444336, "global_step": 94202, "epoch": 778} {"train_loss": -35.73647689819336, "global_step": 94203, "epoch": 778} {"train_loss": -34.56113815307617, "global_step": 94204, "epoch": 778} {"train_loss": -35.5177001953125, "global_step": 94205, "epoch": 778} {"train_loss": -33.177799224853516, "global_step": 94206, "epoch": 778} {"train_loss": -32.934513092041016, "global_step": 94207, "epoch": 778} {"train_loss": -35.69134521484375, "global_step": 94208, "epoch": 778} {"train_loss": -34.0202751159668, "global_step": 94209, "epoch": 778} {"train_loss": -35.20811080932617, "global_step": 94210, "epoch": 778} {"train_loss": -32.6219596862793, "global_step": 94211, "epoch": 778} {"train_loss": -35.60837173461914, "global_step": 94212, "epoch": 778} {"train_loss": -37.10163116455078, "global_step": 94213, "epoch": 778} {"train_loss": -34.91994857788086, "global_step": 94214, "epoch": 778} {"train_loss": -34.9290885925293, "global_step": 94215, "epoch": 778} {"train_loss": -36.7147331237793, "global_step": 94216, "epoch": 778} {"train_loss": -35.63328170776367, "global_step": 94217, "epoch": 778} {"train_loss": -36.24940490722656, "global_step": 94218, "epoch": 778} {"train_loss": -36.87618637084961, "global_step": 94219, "epoch": 778} {"train_loss": -35.661590576171875, "global_step": 94220, "epoch": 778} {"train_loss": -36.9070930480957, "global_step": 94221, "epoch": 778} {"train_loss": -37.20418930053711, "global_step": 94222, "epoch": 778} {"train_loss": -37.07809066772461, "global_step": 94223, "epoch": 778} {"train_loss": -36.41034698486328, "global_step": 94224, "epoch": 778} {"train_loss": -36.58285140991211, "global_step": 94225, "epoch": 778} {"train_loss": -37.04503631591797, "global_step": 94226, "epoch": 778} {"train_loss": -36.67277145385742, "global_step": 94227, "epoch": 778} {"train_loss": -37.81929397583008, "global_step": 94228, "epoch": 778} {"train_loss": -36.67647933959961, "global_step": 94229, "epoch": 778} {"train_loss": -37.27008056640625, "global_step": 94230, "epoch": 778} {"train_loss": -37.201026916503906, "global_step": 94231, "epoch": 778} {"train_loss": -37.33187484741211, "global_step": 94232, "epoch": 778} {"train_loss": -37.301673889160156, "global_step": 94233, "epoch": 778} {"train_loss": -37.480743408203125, "global_step": 94234, "epoch": 778} {"train_loss": -37.9918327331543, "global_step": 94235, "epoch": 778} {"train_loss": -37.77738571166992, "global_step": 94236, "epoch": 778} {"train_loss": -37.9581413269043, "global_step": 94237, "epoch": 778} {"train_loss": -38.150054931640625, "global_step": 94238, "epoch": 778} {"train_loss": -38.10435104370117, "global_step": 94239, "epoch": 778} {"train_loss": -38.086055755615234, "global_step": 94240, "epoch": 778} {"train_loss": -38.48739242553711, "global_step": 94241, "epoch": 778} {"train_loss": -37.093963623046875, "global_step": 94242, "epoch": 778} {"train_loss": -37.712852478027344, "global_step": 94243, "epoch": 778} {"train_loss": -38.30370330810547, "global_step": 94244, "epoch": 778} {"train_loss": -38.362056732177734, "global_step": 94245, "epoch": 778} {"train_loss": -38.36379623413086, "global_step": 94246, "epoch": 778} {"train_loss": -37.82939147949219, "global_step": 94247, "epoch": 778} {"train_loss": -37.78290557861328, "global_step": 94248, "epoch": 778} {"train_loss": -37.98835372924805, "global_step": 94249, "epoch": 778} {"train_loss": -38.50167465209961, "global_step": 94250, "epoch": 778} {"train_loss": -38.29871368408203, "global_step": 94251, "epoch": 778} {"train_loss": -38.24770736694336, "global_step": 94252, "epoch": 778} {"train_loss": -38.167781829833984, "global_step": 94253, "epoch": 778} {"train_loss": -38.25370407104492, "global_step": 94254, "epoch": 778} {"train_loss": -38.73350143432617, "global_step": 94255, "epoch": 778} {"train_loss": -38.40695571899414, "global_step": 94256, "epoch": 778} {"train_loss": -38.90340805053711, "global_step": 94257, "epoch": 778} {"train_loss": -36.977394151293545, "global_step": 94258, "epoch": 778, "val_loss": 2613053.75} {"train_loss": -38.582942962646484, "global_step": 94259, "epoch": 779} {"train_loss": -39.09171676635742, "global_step": 94260, "epoch": 779} {"train_loss": -37.70064163208008, "global_step": 94261, "epoch": 779} {"train_loss": -37.623992919921875, "global_step": 94262, "epoch": 779} {"train_loss": -37.87152099609375, "global_step": 94263, "epoch": 779} {"train_loss": -38.834075927734375, "global_step": 94264, "epoch": 779} {"train_loss": -38.226722717285156, "global_step": 94265, "epoch": 779} {"train_loss": -38.36957550048828, "global_step": 94266, "epoch": 779} {"train_loss": -38.60869216918945, "global_step": 94267, "epoch": 779} {"train_loss": -37.46809768676758, "global_step": 94268, "epoch": 779} {"train_loss": -38.021392822265625, "global_step": 94269, "epoch": 779} {"train_loss": -35.920169830322266, "global_step": 94270, "epoch": 779} {"train_loss": -36.38694381713867, "global_step": 94271, "epoch": 779} {"train_loss": -36.05887985229492, "global_step": 94272, "epoch": 779} {"train_loss": -34.2022590637207, "global_step": 94273, "epoch": 779} {"train_loss": -37.360443115234375, "global_step": 94274, "epoch": 779} {"train_loss": -36.76428985595703, "global_step": 94275, "epoch": 779} {"train_loss": -38.3663444519043, "global_step": 94276, "epoch": 779} {"train_loss": -36.843875885009766, "global_step": 94277, "epoch": 779} {"train_loss": -38.26824951171875, "global_step": 94278, "epoch": 779} {"train_loss": -35.36499786376953, "global_step": 94279, "epoch": 779} {"train_loss": -37.88404083251953, "global_step": 94280, "epoch": 779} {"train_loss": -36.7921257019043, "global_step": 94281, "epoch": 779} {"train_loss": -37.249671936035156, "global_step": 94282, "epoch": 779} {"train_loss": -36.950286865234375, "global_step": 94283, "epoch": 779} {"train_loss": -35.463401794433594, "global_step": 94284, "epoch": 779} {"train_loss": -35.97977828979492, "global_step": 94285, "epoch": 779} {"train_loss": -37.29861068725586, "global_step": 94286, "epoch": 779} {"train_loss": -38.4583740234375, "global_step": 94287, "epoch": 779} {"train_loss": -36.8311882019043, "global_step": 94288, "epoch": 779} {"train_loss": -36.41840362548828, "global_step": 94289, "epoch": 779} {"train_loss": -35.55955505371094, "global_step": 94290, "epoch": 779} {"train_loss": -36.556312561035156, "global_step": 94291, "epoch": 779} {"train_loss": -37.70907211303711, "global_step": 94292, "epoch": 779} {"train_loss": -37.3724365234375, "global_step": 94293, "epoch": 779} {"train_loss": -35.955196380615234, "global_step": 94294, "epoch": 779} {"train_loss": -31.699316024780273, "global_step": 94295, "epoch": 779} {"train_loss": -34.42356491088867, "global_step": 94296, "epoch": 779} {"train_loss": -37.11184310913086, "global_step": 94297, "epoch": 779} {"train_loss": -35.03841781616211, "global_step": 94298, "epoch": 779} {"train_loss": -33.68111038208008, "global_step": 94299, "epoch": 779} {"train_loss": -36.99478530883789, "global_step": 94300, "epoch": 779} {"train_loss": -37.23704147338867, "global_step": 94301, "epoch": 779} {"train_loss": -36.549495697021484, "global_step": 94302, "epoch": 779} {"train_loss": -36.9788932800293, "global_step": 94303, "epoch": 779} {"train_loss": -36.92500305175781, "global_step": 94304, "epoch": 779} {"train_loss": -37.48535919189453, "global_step": 94305, "epoch": 779} {"train_loss": -37.60026168823242, "global_step": 94306, "epoch": 779} {"train_loss": -37.06233596801758, "global_step": 94307, "epoch": 779} {"train_loss": -36.64140701293945, "global_step": 94308, "epoch": 779} {"train_loss": -38.256988525390625, "global_step": 94309, "epoch": 779} {"train_loss": -37.753047943115234, "global_step": 94310, "epoch": 779} {"train_loss": -37.5368766784668, "global_step": 94311, "epoch": 779} {"train_loss": -37.97080612182617, "global_step": 94312, "epoch": 779} {"train_loss": -38.53461456298828, "global_step": 94313, "epoch": 779} {"train_loss": -38.08492660522461, "global_step": 94314, "epoch": 779} {"train_loss": -37.844512939453125, "global_step": 94315, "epoch": 779} {"train_loss": -37.30616760253906, "global_step": 94316, "epoch": 779} {"train_loss": -38.018463134765625, "global_step": 94317, "epoch": 779} {"train_loss": -38.30759811401367, "global_step": 94318, "epoch": 779} {"train_loss": -38.077720642089844, "global_step": 94319, "epoch": 779} {"train_loss": -37.89026641845703, "global_step": 94320, "epoch": 779} {"train_loss": -37.21156692504883, "global_step": 94321, "epoch": 779} {"train_loss": -38.199501037597656, "global_step": 94322, "epoch": 779} {"train_loss": -38.18718338012695, "global_step": 94323, "epoch": 779} {"train_loss": -37.79533004760742, "global_step": 94324, "epoch": 779} {"train_loss": -38.947322845458984, "global_step": 94325, "epoch": 779} {"train_loss": -38.14277267456055, "global_step": 94326, "epoch": 779} {"train_loss": -37.13985824584961, "global_step": 94327, "epoch": 779} {"train_loss": -37.955322265625, "global_step": 94328, "epoch": 779} {"train_loss": -38.4235725402832, "global_step": 94329, "epoch": 779} {"train_loss": -37.80745315551758, "global_step": 94330, "epoch": 779} {"train_loss": -37.55417251586914, "global_step": 94331, "epoch": 779} {"train_loss": -38.517906188964844, "global_step": 94332, "epoch": 779} {"train_loss": -39.091163635253906, "global_step": 94333, "epoch": 779} {"train_loss": -37.962799072265625, "global_step": 94334, "epoch": 779} {"train_loss": -37.713050842285156, "global_step": 94335, "epoch": 779} {"train_loss": -38.56315994262695, "global_step": 94336, "epoch": 779} {"train_loss": -38.31047439575195, "global_step": 94337, "epoch": 779} {"train_loss": -37.66607666015625, "global_step": 94338, "epoch": 779} {"train_loss": -39.0096321105957, "global_step": 94339, "epoch": 779} {"train_loss": -37.95232391357422, "global_step": 94340, "epoch": 779} {"train_loss": -36.627628326416016, "global_step": 94341, "epoch": 779} {"train_loss": -37.6562614440918, "global_step": 94342, "epoch": 779} {"train_loss": -38.79865646362305, "global_step": 94343, "epoch": 779} {"train_loss": -38.031890869140625, "global_step": 94344, "epoch": 779} {"train_loss": -36.33430480957031, "global_step": 94345, "epoch": 779} {"train_loss": -37.547359466552734, "global_step": 94346, "epoch": 779} {"train_loss": -38.904640197753906, "global_step": 94347, "epoch": 779} {"train_loss": -38.15462112426758, "global_step": 94348, "epoch": 779} {"train_loss": -38.1817626953125, "global_step": 94349, "epoch": 779} {"train_loss": -38.908363342285156, "global_step": 94350, "epoch": 779} {"train_loss": -38.914180755615234, "global_step": 94351, "epoch": 779} {"train_loss": -38.8779296875, "global_step": 94352, "epoch": 779} {"train_loss": -39.20569610595703, "global_step": 94353, "epoch": 779} {"train_loss": -39.45701599121094, "global_step": 94354, "epoch": 779} {"train_loss": -39.194305419921875, "global_step": 94355, "epoch": 779} {"train_loss": -38.80326461791992, "global_step": 94356, "epoch": 779} {"train_loss": -39.929683685302734, "global_step": 94357, "epoch": 779} {"train_loss": -39.27406692504883, "global_step": 94358, "epoch": 779} {"train_loss": -39.140541076660156, "global_step": 94359, "epoch": 779} {"train_loss": -38.904605865478516, "global_step": 94360, "epoch": 779} {"train_loss": -39.10695266723633, "global_step": 94361, "epoch": 779} {"train_loss": -39.413082122802734, "global_step": 94362, "epoch": 779} {"train_loss": -39.05007553100586, "global_step": 94363, "epoch": 779} {"train_loss": -38.70827102661133, "global_step": 94364, "epoch": 779} {"train_loss": -38.17676544189453, "global_step": 94365, "epoch": 779} {"train_loss": -39.23189926147461, "global_step": 94366, "epoch": 779} {"train_loss": -39.536643981933594, "global_step": 94367, "epoch": 779} {"train_loss": -39.333736419677734, "global_step": 94368, "epoch": 779} {"train_loss": -39.25587844848633, "global_step": 94369, "epoch": 779} {"train_loss": -38.39487838745117, "global_step": 94370, "epoch": 779} {"train_loss": -39.190155029296875, "global_step": 94371, "epoch": 779} {"train_loss": -39.32733154296875, "global_step": 94372, "epoch": 779} {"train_loss": -39.214508056640625, "global_step": 94373, "epoch": 779} {"train_loss": -38.950408935546875, "global_step": 94374, "epoch": 779} {"train_loss": -39.38628387451172, "global_step": 94375, "epoch": 779} {"train_loss": -38.904476165771484, "global_step": 94376, "epoch": 779} {"train_loss": -38.446102142333984, "global_step": 94377, "epoch": 779} {"train_loss": -38.59188461303711, "global_step": 94378, "epoch": 779} {"train_loss": -37.79027249990416, "global_step": 94379, "epoch": 779, "val_loss": 2588694.0} {"train_loss": -37.454925537109375, "global_step": 94380, "epoch": 780} {"train_loss": -38.30733871459961, "global_step": 94381, "epoch": 780} {"train_loss": -38.13176345825195, "global_step": 94382, "epoch": 780} {"train_loss": -38.15930938720703, "global_step": 94383, "epoch": 780} {"train_loss": -36.87183380126953, "global_step": 94384, "epoch": 780} {"train_loss": -35.59625244140625, "global_step": 94385, "epoch": 780} {"train_loss": -34.5062370300293, "global_step": 94386, "epoch": 780} {"train_loss": -36.69355010986328, "global_step": 94387, "epoch": 780} {"train_loss": -37.0263671875, "global_step": 94388, "epoch": 780} {"train_loss": -37.72462463378906, "global_step": 94389, "epoch": 780} {"train_loss": -36.09156036376953, "global_step": 94390, "epoch": 780} {"train_loss": -36.66081237792969, "global_step": 94391, "epoch": 780} {"train_loss": -38.801734924316406, "global_step": 94392, "epoch": 780} {"train_loss": -36.59983825683594, "global_step": 94393, "epoch": 780} {"train_loss": -36.462432861328125, "global_step": 94394, "epoch": 780} {"train_loss": -37.80037307739258, "global_step": 94395, "epoch": 780} {"train_loss": -38.602752685546875, "global_step": 94396, "epoch": 780} {"train_loss": -37.79048538208008, "global_step": 94397, "epoch": 780} {"train_loss": -37.87236785888672, "global_step": 94398, "epoch": 780} {"train_loss": -38.25086212158203, "global_step": 94399, "epoch": 780} {"train_loss": -38.14249038696289, "global_step": 94400, "epoch": 780} {"train_loss": -37.995941162109375, "global_step": 94401, "epoch": 780} {"train_loss": -38.27006149291992, "global_step": 94402, "epoch": 780} {"train_loss": -39.19024658203125, "global_step": 94403, "epoch": 780} {"train_loss": -38.101806640625, "global_step": 94404, "epoch": 780} {"train_loss": -38.51359176635742, "global_step": 94405, "epoch": 780} {"train_loss": -38.433135986328125, "global_step": 94406, "epoch": 780} {"train_loss": -38.128875732421875, "global_step": 94407, "epoch": 780} {"train_loss": -38.98286437988281, "global_step": 94408, "epoch": 780} {"train_loss": -38.07356643676758, "global_step": 94409, "epoch": 780} {"train_loss": -38.792205810546875, "global_step": 94410, "epoch": 780} {"train_loss": -38.2303466796875, "global_step": 94411, "epoch": 780} {"train_loss": -38.0015754699707, "global_step": 94412, "epoch": 780} {"train_loss": -38.18244171142578, "global_step": 94413, "epoch": 780} {"train_loss": -38.354793548583984, "global_step": 94414, "epoch": 780} {"train_loss": -38.37409973144531, "global_step": 94415, "epoch": 780} {"train_loss": -37.84285354614258, "global_step": 94416, "epoch": 780} {"train_loss": -38.3025016784668, "global_step": 94417, "epoch": 780} {"train_loss": -38.68601608276367, "global_step": 94418, "epoch": 780} {"train_loss": -38.236053466796875, "global_step": 94419, "epoch": 780} {"train_loss": -38.1481819152832, "global_step": 94420, "epoch": 780} {"train_loss": -38.56946563720703, "global_step": 94421, "epoch": 780} {"train_loss": -38.4271125793457, "global_step": 94422, "epoch": 780} {"train_loss": -38.80702590942383, "global_step": 94423, "epoch": 780} {"train_loss": -39.04683303833008, "global_step": 94424, "epoch": 780} {"train_loss": -35.41600036621094, "global_step": 94425, "epoch": 780} {"train_loss": -36.46378707885742, "global_step": 94426, "epoch": 780} {"train_loss": -36.5852165222168, "global_step": 94427, "epoch": 780} {"train_loss": -37.73335647583008, "global_step": 94428, "epoch": 780} {"train_loss": -38.23836898803711, "global_step": 94429, "epoch": 780} {"train_loss": -37.691078186035156, "global_step": 94430, "epoch": 780} {"train_loss": -37.189945220947266, "global_step": 94431, "epoch": 780} {"train_loss": -38.80416488647461, "global_step": 94432, "epoch": 780} {"train_loss": -36.990360260009766, "global_step": 94433, "epoch": 780} {"train_loss": -38.86775207519531, "global_step": 94434, "epoch": 780} {"train_loss": -37.589805603027344, "global_step": 94435, "epoch": 780} {"train_loss": -37.57784652709961, "global_step": 94436, "epoch": 780} {"train_loss": -37.478267669677734, "global_step": 94437, "epoch": 780} {"train_loss": -36.02655792236328, "global_step": 94438, "epoch": 780} {"train_loss": -35.59162521362305, "global_step": 94439, "epoch": 780} {"train_loss": -35.127471923828125, "global_step": 94440, "epoch": 780} {"train_loss": -35.58155059814453, "global_step": 94441, "epoch": 780} {"train_loss": -35.693275451660156, "global_step": 94442, "epoch": 780} {"train_loss": -35.349796295166016, "global_step": 94443, "epoch": 780} {"train_loss": -37.33891677856445, "global_step": 94444, "epoch": 780} {"train_loss": -37.956722259521484, "global_step": 94445, "epoch": 780} {"train_loss": -36.793548583984375, "global_step": 94446, "epoch": 780} {"train_loss": -37.09783935546875, "global_step": 94447, "epoch": 780} {"train_loss": -38.05099105834961, "global_step": 94448, "epoch": 780} {"train_loss": -37.96425247192383, "global_step": 94449, "epoch": 780} {"train_loss": -36.004127502441406, "global_step": 94450, "epoch": 780} {"train_loss": -37.22041702270508, "global_step": 94451, "epoch": 780} {"train_loss": -37.1277961730957, "global_step": 94452, "epoch": 780} {"train_loss": -32.1166877746582, "global_step": 94453, "epoch": 780} {"train_loss": -36.79937744140625, "global_step": 94454, "epoch": 780} {"train_loss": -36.68770980834961, "global_step": 94455, "epoch": 780} {"train_loss": -36.17829895019531, "global_step": 94456, "epoch": 780} {"train_loss": -37.413330078125, "global_step": 94457, "epoch": 780} {"train_loss": -37.46439743041992, "global_step": 94458, "epoch": 780} {"train_loss": -36.635684967041016, "global_step": 94459, "epoch": 780} {"train_loss": -38.64473342895508, "global_step": 94460, "epoch": 780} {"train_loss": -38.357181549072266, "global_step": 94461, "epoch": 780} {"train_loss": -38.02582931518555, "global_step": 94462, "epoch": 780} {"train_loss": -38.355587005615234, "global_step": 94463, "epoch": 780} {"train_loss": -38.1909294128418, "global_step": 94464, "epoch": 780} {"train_loss": -38.15118408203125, "global_step": 94465, "epoch": 780} {"train_loss": -38.22478485107422, "global_step": 94466, "epoch": 780} {"train_loss": -36.03368377685547, "global_step": 94467, "epoch": 780} {"train_loss": -35.999534606933594, "global_step": 94468, "epoch": 780} {"train_loss": -37.42466354370117, "global_step": 94469, "epoch": 780} {"train_loss": -37.44479751586914, "global_step": 94470, "epoch": 780} {"train_loss": -38.22706985473633, "global_step": 94471, "epoch": 780} {"train_loss": -38.500244140625, "global_step": 94472, "epoch": 780} {"train_loss": -37.49871826171875, "global_step": 94473, "epoch": 780} {"train_loss": -37.98218536376953, "global_step": 94474, "epoch": 780} {"train_loss": -38.596290588378906, "global_step": 94475, "epoch": 780} {"train_loss": -38.548282623291016, "global_step": 94476, "epoch": 780} {"train_loss": -37.987796783447266, "global_step": 94477, "epoch": 780} {"train_loss": -37.957637786865234, "global_step": 94478, "epoch": 780} {"train_loss": -37.9879264831543, "global_step": 94479, "epoch": 780} {"train_loss": -37.3646125793457, "global_step": 94480, "epoch": 780} {"train_loss": -38.926998138427734, "global_step": 94481, "epoch": 780} {"train_loss": -38.21942901611328, "global_step": 94482, "epoch": 780} {"train_loss": -37.59368896484375, "global_step": 94483, "epoch": 780} {"train_loss": -38.46575164794922, "global_step": 94484, "epoch": 780} {"train_loss": -38.54741287231445, "global_step": 94485, "epoch": 780} {"train_loss": -38.416683197021484, "global_step": 94486, "epoch": 780} {"train_loss": -38.43326950073242, "global_step": 94487, "epoch": 780} {"train_loss": -38.71163558959961, "global_step": 94488, "epoch": 780} {"train_loss": -38.84284210205078, "global_step": 94489, "epoch": 780} {"train_loss": -38.48822784423828, "global_step": 94490, "epoch": 780} {"train_loss": -38.31046676635742, "global_step": 94491, "epoch": 780} {"train_loss": -39.222023010253906, "global_step": 94492, "epoch": 780} {"train_loss": -38.482051849365234, "global_step": 94493, "epoch": 780} {"train_loss": -38.45338439941406, "global_step": 94494, "epoch": 780} {"train_loss": -38.78126525878906, "global_step": 94495, "epoch": 780} {"train_loss": -39.08281326293945, "global_step": 94496, "epoch": 780} {"train_loss": -38.87300491333008, "global_step": 94497, "epoch": 780} {"train_loss": -38.01276779174805, "global_step": 94498, "epoch": 780} {"train_loss": -39.06965637207031, "global_step": 94499, "epoch": 780} {"train_loss": -37.7005603254334, "global_step": 94500, "epoch": 780, "val_loss": 2515296.75} {"train_loss": -38.55131912231445, "global_step": 94501, "epoch": 781} {"train_loss": -38.620967864990234, "global_step": 94502, "epoch": 781} {"train_loss": -38.477088928222656, "global_step": 94503, "epoch": 781} {"train_loss": -38.96944808959961, "global_step": 94504, "epoch": 781} {"train_loss": -39.19317626953125, "global_step": 94505, "epoch": 781} {"train_loss": -38.20984649658203, "global_step": 94506, "epoch": 781} {"train_loss": -37.552459716796875, "global_step": 94507, "epoch": 781} {"train_loss": -37.6693000793457, "global_step": 94508, "epoch": 781} {"train_loss": -37.5485954284668, "global_step": 94509, "epoch": 781} {"train_loss": -37.42039489746094, "global_step": 94510, "epoch": 781} {"train_loss": -38.98826217651367, "global_step": 94511, "epoch": 781} {"train_loss": -37.0809440612793, "global_step": 94512, "epoch": 781} {"train_loss": -34.580745697021484, "global_step": 94513, "epoch": 781} {"train_loss": -34.83500289916992, "global_step": 94514, "epoch": 781} {"train_loss": -34.457942962646484, "global_step": 94515, "epoch": 781} {"train_loss": -35.1213493347168, "global_step": 94516, "epoch": 781} {"train_loss": -35.18886947631836, "global_step": 94517, "epoch": 781} {"train_loss": -34.93172836303711, "global_step": 94518, "epoch": 781} {"train_loss": -36.689754486083984, "global_step": 94519, "epoch": 781} {"train_loss": -37.529972076416016, "global_step": 94520, "epoch": 781} {"train_loss": -34.63236999511719, "global_step": 94521, "epoch": 781} {"train_loss": -35.23921203613281, "global_step": 94522, "epoch": 781} {"train_loss": -37.39278793334961, "global_step": 94523, "epoch": 781} {"train_loss": -37.51054000854492, "global_step": 94524, "epoch": 781} {"train_loss": -36.27211380004883, "global_step": 94525, "epoch": 781} {"train_loss": -38.026222229003906, "global_step": 94526, "epoch": 781} {"train_loss": -38.09187698364258, "global_step": 94527, "epoch": 781} {"train_loss": -37.46525192260742, "global_step": 94528, "epoch": 781} {"train_loss": -38.433406829833984, "global_step": 94529, "epoch": 781} {"train_loss": -38.149837493896484, "global_step": 94530, "epoch": 781} {"train_loss": -37.98440170288086, "global_step": 94531, "epoch": 781} {"train_loss": -38.4997444152832, "global_step": 94532, "epoch": 781} {"train_loss": -37.98923873901367, "global_step": 94533, "epoch": 781} {"train_loss": -37.908321380615234, "global_step": 94534, "epoch": 781} {"train_loss": -38.26663589477539, "global_step": 94535, "epoch": 781} {"train_loss": -38.156551361083984, "global_step": 94536, "epoch": 781} {"train_loss": -38.16758346557617, "global_step": 94537, "epoch": 781} {"train_loss": -38.67583084106445, "global_step": 94538, "epoch": 781} {"train_loss": -38.354305267333984, "global_step": 94539, "epoch": 781} {"train_loss": -37.95437240600586, "global_step": 94540, "epoch": 781} {"train_loss": -38.70918655395508, "global_step": 94541, "epoch": 781} {"train_loss": -38.33501052856445, "global_step": 94542, "epoch": 781} {"train_loss": -38.525978088378906, "global_step": 94543, "epoch": 781} {"train_loss": -38.785335540771484, "global_step": 94544, "epoch": 781} {"train_loss": -38.47782516479492, "global_step": 94545, "epoch": 781} {"train_loss": -38.70060348510742, "global_step": 94546, "epoch": 781} {"train_loss": -39.305179595947266, "global_step": 94547, "epoch": 781} {"train_loss": -38.8347282409668, "global_step": 94548, "epoch": 781} {"train_loss": -38.29897689819336, "global_step": 94549, "epoch": 781} {"train_loss": -39.30677032470703, "global_step": 94550, "epoch": 781} {"train_loss": -38.89977264404297, "global_step": 94551, "epoch": 781} {"train_loss": -38.59538650512695, "global_step": 94552, "epoch": 781} {"train_loss": -38.858768463134766, "global_step": 94553, "epoch": 781} {"train_loss": -37.77666091918945, "global_step": 94554, "epoch": 781} {"train_loss": -38.351722717285156, "global_step": 94555, "epoch": 781} {"train_loss": -39.20307540893555, "global_step": 94556, "epoch": 781} {"train_loss": -38.290260314941406, "global_step": 94557, "epoch": 781} {"train_loss": -37.87095642089844, "global_step": 94558, "epoch": 781} {"train_loss": -38.0980339050293, "global_step": 94559, "epoch": 781} {"train_loss": -39.05119323730469, "global_step": 94560, "epoch": 781} {"train_loss": -38.260040283203125, "global_step": 94561, "epoch": 781} {"train_loss": -38.43333053588867, "global_step": 94562, "epoch": 781} {"train_loss": -38.48418045043945, "global_step": 94563, "epoch": 781} {"train_loss": -38.899356842041016, "global_step": 94564, "epoch": 781} {"train_loss": -37.735774993896484, "global_step": 94565, "epoch": 781} {"train_loss": -38.261653900146484, "global_step": 94566, "epoch": 781} {"train_loss": -37.441951751708984, "global_step": 94567, "epoch": 781} {"train_loss": -37.063594818115234, "global_step": 94568, "epoch": 781} {"train_loss": -37.55940628051758, "global_step": 94569, "epoch": 781} {"train_loss": -37.18850326538086, "global_step": 94570, "epoch": 781} {"train_loss": -37.06203842163086, "global_step": 94571, "epoch": 781} {"train_loss": -37.42278289794922, "global_step": 94572, "epoch": 781} {"train_loss": -37.69561767578125, "global_step": 94573, "epoch": 781} {"train_loss": -37.56879425048828, "global_step": 94574, "epoch": 781} {"train_loss": -37.97987365722656, "global_step": 94575, "epoch": 781} {"train_loss": -37.01963424682617, "global_step": 94576, "epoch": 781} {"train_loss": -38.0389404296875, "global_step": 94577, "epoch": 781} {"train_loss": -38.82512283325195, "global_step": 94578, "epoch": 781} {"train_loss": -38.373268127441406, "global_step": 94579, "epoch": 781} {"train_loss": -38.124324798583984, "global_step": 94580, "epoch": 781} {"train_loss": -37.810272216796875, "global_step": 94581, "epoch": 781} {"train_loss": -38.777462005615234, "global_step": 94582, "epoch": 781} {"train_loss": -37.29257583618164, "global_step": 94583, "epoch": 781} {"train_loss": -38.7963981628418, "global_step": 94584, "epoch": 781} {"train_loss": -38.452850341796875, "global_step": 94585, "epoch": 781} {"train_loss": -37.084869384765625, "global_step": 94586, "epoch": 781} {"train_loss": -37.68769454956055, "global_step": 94587, "epoch": 781} {"train_loss": -38.81787872314453, "global_step": 94588, "epoch": 781} {"train_loss": -37.15607833862305, "global_step": 94589, "epoch": 781} {"train_loss": -38.68227005004883, "global_step": 94590, "epoch": 781} {"train_loss": -38.62587356567383, "global_step": 94591, "epoch": 781} {"train_loss": -36.209346771240234, "global_step": 94592, "epoch": 781} {"train_loss": -36.14550018310547, "global_step": 94593, "epoch": 781} {"train_loss": -38.37874984741211, "global_step": 94594, "epoch": 781} {"train_loss": -38.02262878417969, "global_step": 94595, "epoch": 781} {"train_loss": -37.20412826538086, "global_step": 94596, "epoch": 781} {"train_loss": -38.62977981567383, "global_step": 94597, "epoch": 781} {"train_loss": -37.947879791259766, "global_step": 94598, "epoch": 781} {"train_loss": -37.01133728027344, "global_step": 94599, "epoch": 781} {"train_loss": -38.53530502319336, "global_step": 94600, "epoch": 781} {"train_loss": -38.25060272216797, "global_step": 94601, "epoch": 781} {"train_loss": -38.234004974365234, "global_step": 94602, "epoch": 781} {"train_loss": -38.40898895263672, "global_step": 94603, "epoch": 781} {"train_loss": -36.93218994140625, "global_step": 94604, "epoch": 781} {"train_loss": -38.423377990722656, "global_step": 94605, "epoch": 781} {"train_loss": -38.399749755859375, "global_step": 94606, "epoch": 781} {"train_loss": -38.187862396240234, "global_step": 94607, "epoch": 781} {"train_loss": -38.48418045043945, "global_step": 94608, "epoch": 781} {"train_loss": -38.9429817199707, "global_step": 94609, "epoch": 781} {"train_loss": -39.16459274291992, "global_step": 94610, "epoch": 781} {"train_loss": -38.799442291259766, "global_step": 94611, "epoch": 781} {"train_loss": -39.123165130615234, "global_step": 94612, "epoch": 781} {"train_loss": -38.48905563354492, "global_step": 94613, "epoch": 781} {"train_loss": -38.974708557128906, "global_step": 94614, "epoch": 781} {"train_loss": -38.704830169677734, "global_step": 94615, "epoch": 781} {"train_loss": -39.07029724121094, "global_step": 94616, "epoch": 781} {"train_loss": -38.64728927612305, "global_step": 94617, "epoch": 781} {"train_loss": -39.201778411865234, "global_step": 94618, "epoch": 781} {"train_loss": -39.0532341003418, "global_step": 94619, "epoch": 781} {"train_loss": -38.862464904785156, "global_step": 94620, "epoch": 781} {"train_loss": -37.96130582320789, "global_step": 94621, "epoch": 781, "val_loss": 2543210.0} {"train_loss": -38.95560836791992, "global_step": 94622, "epoch": 782} {"train_loss": -38.73702621459961, "global_step": 94623, "epoch": 782} {"train_loss": -38.72663116455078, "global_step": 94624, "epoch": 782} {"train_loss": -39.29964828491211, "global_step": 94625, "epoch": 782} {"train_loss": -38.660884857177734, "global_step": 94626, "epoch": 782} {"train_loss": -38.95527267456055, "global_step": 94627, "epoch": 782} {"train_loss": -39.08811569213867, "global_step": 94628, "epoch": 782} {"train_loss": -37.70869827270508, "global_step": 94629, "epoch": 782} {"train_loss": -39.132572174072266, "global_step": 94630, "epoch": 782} {"train_loss": -38.946441650390625, "global_step": 94631, "epoch": 782} {"train_loss": -39.04203414916992, "global_step": 94632, "epoch": 782} {"train_loss": -38.832759857177734, "global_step": 94633, "epoch": 782} {"train_loss": -39.150455474853516, "global_step": 94634, "epoch": 782} {"train_loss": -38.74860382080078, "global_step": 94635, "epoch": 782} {"train_loss": -38.303565979003906, "global_step": 94636, "epoch": 782} {"train_loss": -38.98786926269531, "global_step": 94637, "epoch": 782} {"train_loss": -38.35498046875, "global_step": 94638, "epoch": 782} {"train_loss": -37.78765869140625, "global_step": 94639, "epoch": 782} {"train_loss": -36.22911071777344, "global_step": 94640, "epoch": 782} {"train_loss": -33.75597381591797, "global_step": 94641, "epoch": 782} {"train_loss": -32.83203125, "global_step": 94642, "epoch": 782} {"train_loss": -37.76361083984375, "global_step": 94643, "epoch": 782} {"train_loss": -35.94222640991211, "global_step": 94644, "epoch": 782} {"train_loss": -29.05250358581543, "global_step": 94645, "epoch": 782} {"train_loss": -27.2656307220459, "global_step": 94646, "epoch": 782} {"train_loss": -34.33195877075195, "global_step": 94647, "epoch": 782} {"train_loss": -27.998218536376953, "global_step": 94648, "epoch": 782} {"train_loss": -28.086105346679688, "global_step": 94649, "epoch": 782} {"train_loss": -28.6802921295166, "global_step": 94650, "epoch": 782} {"train_loss": -34.86281967163086, "global_step": 94651, "epoch": 782} {"train_loss": -33.93606948852539, "global_step": 94652, "epoch": 782} {"train_loss": -32.96452331542969, "global_step": 94653, "epoch": 782} {"train_loss": -33.974849700927734, "global_step": 94654, "epoch": 782} {"train_loss": -34.3560791015625, "global_step": 94655, "epoch": 782} {"train_loss": -35.70186233520508, "global_step": 94656, "epoch": 782} {"train_loss": -35.881492614746094, "global_step": 94657, "epoch": 782} {"train_loss": -37.029449462890625, "global_step": 94658, "epoch": 782} {"train_loss": -37.101375579833984, "global_step": 94659, "epoch": 782} {"train_loss": -35.70377731323242, "global_step": 94660, "epoch": 782} {"train_loss": -37.91899871826172, "global_step": 94661, "epoch": 782} {"train_loss": -35.86662673950195, "global_step": 94662, "epoch": 782} {"train_loss": -37.29793930053711, "global_step": 94663, "epoch": 782} {"train_loss": -37.10648727416992, "global_step": 94664, "epoch": 782} {"train_loss": -37.240047454833984, "global_step": 94665, "epoch": 782} {"train_loss": -37.4742317199707, "global_step": 94666, "epoch": 782} {"train_loss": -37.980709075927734, "global_step": 94667, "epoch": 782} {"train_loss": -37.60866165161133, "global_step": 94668, "epoch": 782} {"train_loss": -37.87357711791992, "global_step": 94669, "epoch": 782} {"train_loss": -37.64863204956055, "global_step": 94670, "epoch": 782} {"train_loss": -37.26325607299805, "global_step": 94671, "epoch": 782} {"train_loss": -38.2396240234375, "global_step": 94672, "epoch": 782} {"train_loss": -38.08270263671875, "global_step": 94673, "epoch": 782} {"train_loss": -38.136573791503906, "global_step": 94674, "epoch": 782} {"train_loss": -38.47494125366211, "global_step": 94675, "epoch": 782} {"train_loss": -37.70356369018555, "global_step": 94676, "epoch": 782} {"train_loss": -38.489112854003906, "global_step": 94677, "epoch": 782} {"train_loss": -38.193336486816406, "global_step": 94678, "epoch": 782} {"train_loss": -38.60807418823242, "global_step": 94679, "epoch": 782} {"train_loss": -38.11781692504883, "global_step": 94680, "epoch": 782} {"train_loss": -38.4266471862793, "global_step": 94681, "epoch": 782} {"train_loss": -38.3634033203125, "global_step": 94682, "epoch": 782} {"train_loss": -38.33082580566406, "global_step": 94683, "epoch": 782} {"train_loss": -38.28548049926758, "global_step": 94684, "epoch": 782} {"train_loss": -38.60978317260742, "global_step": 94685, "epoch": 782} {"train_loss": -38.26009750366211, "global_step": 94686, "epoch": 782} {"train_loss": -38.31304931640625, "global_step": 94687, "epoch": 782} {"train_loss": -38.292335510253906, "global_step": 94688, "epoch": 782} {"train_loss": -38.67060470581055, "global_step": 94689, "epoch": 782} {"train_loss": -38.42307662963867, "global_step": 94690, "epoch": 782} {"train_loss": -39.02753448486328, "global_step": 94691, "epoch": 782} {"train_loss": -38.600643157958984, "global_step": 94692, "epoch": 782} {"train_loss": -38.76692581176758, "global_step": 94693, "epoch": 782} {"train_loss": -38.82698440551758, "global_step": 94694, "epoch": 782} {"train_loss": -38.53731155395508, "global_step": 94695, "epoch": 782} {"train_loss": -39.21530532836914, "global_step": 94696, "epoch": 782} {"train_loss": -38.99325180053711, "global_step": 94697, "epoch": 782} {"train_loss": -39.227874755859375, "global_step": 94698, "epoch": 782} {"train_loss": -39.03921890258789, "global_step": 94699, "epoch": 782} {"train_loss": -38.99921798706055, "global_step": 94700, "epoch": 782} {"train_loss": -37.37324142456055, "global_step": 94701, "epoch": 782} {"train_loss": -39.0947380065918, "global_step": 94702, "epoch": 782} {"train_loss": -39.05293655395508, "global_step": 94703, "epoch": 782} {"train_loss": -38.62139892578125, "global_step": 94704, "epoch": 782} {"train_loss": -38.57025146484375, "global_step": 94705, "epoch": 782} {"train_loss": -39.62425994873047, "global_step": 94706, "epoch": 782} {"train_loss": -38.08481979370117, "global_step": 94707, "epoch": 782} {"train_loss": -39.30186080932617, "global_step": 94708, "epoch": 782} {"train_loss": -39.05747604370117, "global_step": 94709, "epoch": 782} {"train_loss": -37.997154235839844, "global_step": 94710, "epoch": 782} {"train_loss": -38.658653259277344, "global_step": 94711, "epoch": 782} {"train_loss": -39.062583923339844, "global_step": 94712, "epoch": 782} {"train_loss": -38.96566390991211, "global_step": 94713, "epoch": 782} {"train_loss": -39.23621368408203, "global_step": 94714, "epoch": 782} {"train_loss": -39.21199417114258, "global_step": 94715, "epoch": 782} {"train_loss": -39.20137405395508, "global_step": 94716, "epoch": 782} {"train_loss": -38.88389587402344, "global_step": 94717, "epoch": 782} {"train_loss": -38.957942962646484, "global_step": 94718, "epoch": 782} {"train_loss": -39.14652633666992, "global_step": 94719, "epoch": 782} {"train_loss": -38.083126068115234, "global_step": 94720, "epoch": 782} {"train_loss": -36.9267578125, "global_step": 94721, "epoch": 782} {"train_loss": -36.22845458984375, "global_step": 94722, "epoch": 782} {"train_loss": -36.163185119628906, "global_step": 94723, "epoch": 782} {"train_loss": -38.72981643676758, "global_step": 94724, "epoch": 782} {"train_loss": -38.224605560302734, "global_step": 94725, "epoch": 782} {"train_loss": -36.28468322753906, "global_step": 94726, "epoch": 782} {"train_loss": -36.8861198425293, "global_step": 94727, "epoch": 782} {"train_loss": -39.185646057128906, "global_step": 94728, "epoch": 782} {"train_loss": -37.682525634765625, "global_step": 94729, "epoch": 782} {"train_loss": -38.61211013793945, "global_step": 94730, "epoch": 782} {"train_loss": -37.82803726196289, "global_step": 94731, "epoch": 782} {"train_loss": -37.0039176940918, "global_step": 94732, "epoch": 782} {"train_loss": -35.52200698852539, "global_step": 94733, "epoch": 782} {"train_loss": -35.75513458251953, "global_step": 94734, "epoch": 782} {"train_loss": -35.64432907104492, "global_step": 94735, "epoch": 782} {"train_loss": -36.45072555541992, "global_step": 94736, "epoch": 782} {"train_loss": -33.008846282958984, "global_step": 94737, "epoch": 782} {"train_loss": -33.683414459228516, "global_step": 94738, "epoch": 782} {"train_loss": -35.74374008178711, "global_step": 94739, "epoch": 782} {"train_loss": -36.62189483642578, "global_step": 94740, "epoch": 782} {"train_loss": -32.01975631713867, "global_step": 94741, "epoch": 782} {"train_loss": -37.18578663345211, "global_step": 94742, "epoch": 782, "val_loss": 2525305.25} {"train_loss": -32.82304382324219, "global_step": 94743, "epoch": 783} {"train_loss": -35.036415100097656, "global_step": 94744, "epoch": 783} {"train_loss": -34.58576965332031, "global_step": 94745, "epoch": 783} {"train_loss": -36.40038299560547, "global_step": 94746, "epoch": 783} {"train_loss": -35.852691650390625, "global_step": 94747, "epoch": 783} {"train_loss": -37.37163543701172, "global_step": 94748, "epoch": 783} {"train_loss": -33.657161712646484, "global_step": 94749, "epoch": 783} {"train_loss": -37.17361068725586, "global_step": 94750, "epoch": 783} {"train_loss": -35.56507873535156, "global_step": 94751, "epoch": 783} {"train_loss": -37.64126205444336, "global_step": 94752, "epoch": 783} {"train_loss": -35.20002365112305, "global_step": 94753, "epoch": 783} {"train_loss": -36.454139709472656, "global_step": 94754, "epoch": 783} {"train_loss": -34.34986877441406, "global_step": 94755, "epoch": 783} {"train_loss": -36.74177932739258, "global_step": 94756, "epoch": 783} {"train_loss": -35.63501739501953, "global_step": 94757, "epoch": 783} {"train_loss": -36.46063995361328, "global_step": 94758, "epoch": 783} {"train_loss": -37.044830322265625, "global_step": 94759, "epoch": 783} {"train_loss": -36.88169479370117, "global_step": 94760, "epoch": 783} {"train_loss": -37.11777114868164, "global_step": 94761, "epoch": 783} {"train_loss": -36.33546829223633, "global_step": 94762, "epoch": 783} {"train_loss": -37.20940399169922, "global_step": 94763, "epoch": 783} {"train_loss": -37.87543869018555, "global_step": 94764, "epoch": 783} {"train_loss": -36.52083969116211, "global_step": 94765, "epoch": 783} {"train_loss": -37.0362548828125, "global_step": 94766, "epoch": 783} {"train_loss": -37.29935836791992, "global_step": 94767, "epoch": 783} {"train_loss": -37.30669403076172, "global_step": 94768, "epoch": 783} {"train_loss": -37.3676872253418, "global_step": 94769, "epoch": 783} {"train_loss": -36.54887008666992, "global_step": 94770, "epoch": 783} {"train_loss": -37.69121170043945, "global_step": 94771, "epoch": 783} {"train_loss": -37.276424407958984, "global_step": 94772, "epoch": 783} {"train_loss": -35.08852005004883, "global_step": 94773, "epoch": 783} {"train_loss": -37.850120544433594, "global_step": 94774, "epoch": 783} {"train_loss": -37.626800537109375, "global_step": 94775, "epoch": 783} {"train_loss": -37.741451263427734, "global_step": 94776, "epoch": 783} {"train_loss": -36.04258728027344, "global_step": 94777, "epoch": 783} {"train_loss": -36.524879455566406, "global_step": 94778, "epoch": 783} {"train_loss": -36.7869987487793, "global_step": 94779, "epoch": 783} {"train_loss": -36.25335693359375, "global_step": 94780, "epoch": 783} {"train_loss": -36.35221481323242, "global_step": 94781, "epoch": 783} {"train_loss": -37.12460708618164, "global_step": 94782, "epoch": 783} {"train_loss": -37.499080657958984, "global_step": 94783, "epoch": 783} {"train_loss": -37.91620635986328, "global_step": 94784, "epoch": 783} {"train_loss": -37.222084045410156, "global_step": 94785, "epoch": 783} {"train_loss": -36.88538360595703, "global_step": 94786, "epoch": 783} {"train_loss": -37.93258285522461, "global_step": 94787, "epoch": 783} {"train_loss": -37.147560119628906, "global_step": 94788, "epoch": 783} {"train_loss": -37.59498977661133, "global_step": 94789, "epoch": 783} {"train_loss": -38.23816680908203, "global_step": 94790, "epoch": 783} {"train_loss": -37.178279876708984, "global_step": 94791, "epoch": 783} {"train_loss": -37.64586639404297, "global_step": 94792, "epoch": 783} {"train_loss": -36.98130416870117, "global_step": 94793, "epoch": 783} {"train_loss": -36.8595085144043, "global_step": 94794, "epoch": 783} {"train_loss": -38.00519943237305, "global_step": 94795, "epoch": 783} {"train_loss": -37.6479377746582, "global_step": 94796, "epoch": 783} {"train_loss": -37.21281814575195, "global_step": 94797, "epoch": 783} {"train_loss": -37.42857360839844, "global_step": 94798, "epoch": 783} {"train_loss": -37.623775482177734, "global_step": 94799, "epoch": 783} {"train_loss": -37.66686248779297, "global_step": 94800, "epoch": 783} {"train_loss": -36.738826751708984, "global_step": 94801, "epoch": 783} {"train_loss": -37.50179672241211, "global_step": 94802, "epoch": 783} {"train_loss": -37.8071174621582, "global_step": 94803, "epoch": 783} {"train_loss": -33.563716888427734, "global_step": 94804, "epoch": 783} {"train_loss": -35.30086135864258, "global_step": 94805, "epoch": 783} {"train_loss": -34.74173355102539, "global_step": 94806, "epoch": 783} {"train_loss": -36.78945541381836, "global_step": 94807, "epoch": 783} {"train_loss": -34.572444915771484, "global_step": 94808, "epoch": 783} {"train_loss": -34.90104293823242, "global_step": 94809, "epoch": 783} {"train_loss": -36.734092712402344, "global_step": 94810, "epoch": 783} {"train_loss": -35.396942138671875, "global_step": 94811, "epoch": 783} {"train_loss": -33.39743423461914, "global_step": 94812, "epoch": 783} {"train_loss": -37.4673957824707, "global_step": 94813, "epoch": 783} {"train_loss": -34.390499114990234, "global_step": 94814, "epoch": 783} {"train_loss": -36.802398681640625, "global_step": 94815, "epoch": 783} {"train_loss": -34.65713119506836, "global_step": 94816, "epoch": 783} {"train_loss": -36.56005859375, "global_step": 94817, "epoch": 783} {"train_loss": -36.40580368041992, "global_step": 94818, "epoch": 783} {"train_loss": -35.35402297973633, "global_step": 94819, "epoch": 783} {"train_loss": -35.91473388671875, "global_step": 94820, "epoch": 783} {"train_loss": -37.03242874145508, "global_step": 94821, "epoch": 783} {"train_loss": -32.95745849609375, "global_step": 94822, "epoch": 783} {"train_loss": -36.0982551574707, "global_step": 94823, "epoch": 783} {"train_loss": -34.24532699584961, "global_step": 94824, "epoch": 783} {"train_loss": -36.643089294433594, "global_step": 94825, "epoch": 783} {"train_loss": -35.6861572265625, "global_step": 94826, "epoch": 783} {"train_loss": -35.84307861328125, "global_step": 94827, "epoch": 783} {"train_loss": -36.42841339111328, "global_step": 94828, "epoch": 783} {"train_loss": -36.69807052612305, "global_step": 94829, "epoch": 783} {"train_loss": -35.90230941772461, "global_step": 94830, "epoch": 783} {"train_loss": -35.757102966308594, "global_step": 94831, "epoch": 783} {"train_loss": -37.143062591552734, "global_step": 94832, "epoch": 783} {"train_loss": -35.84752655029297, "global_step": 94833, "epoch": 783} {"train_loss": -37.12246322631836, "global_step": 94834, "epoch": 783} {"train_loss": -36.45146560668945, "global_step": 94835, "epoch": 783} {"train_loss": -36.514923095703125, "global_step": 94836, "epoch": 783} {"train_loss": -37.173702239990234, "global_step": 94837, "epoch": 783} {"train_loss": -36.706703186035156, "global_step": 94838, "epoch": 783} {"train_loss": -37.231239318847656, "global_step": 94839, "epoch": 783} {"train_loss": -36.53581619262695, "global_step": 94840, "epoch": 783} {"train_loss": -34.67962646484375, "global_step": 94841, "epoch": 783} {"train_loss": -37.55121994018555, "global_step": 94842, "epoch": 783} {"train_loss": -36.58175277709961, "global_step": 94843, "epoch": 783} {"train_loss": -37.415950775146484, "global_step": 94844, "epoch": 783} {"train_loss": -37.46376419067383, "global_step": 94845, "epoch": 783} {"train_loss": -37.835269927978516, "global_step": 94846, "epoch": 783} {"train_loss": -36.385128021240234, "global_step": 94847, "epoch": 783} {"train_loss": -37.25999069213867, "global_step": 94848, "epoch": 783} {"train_loss": -37.23545455932617, "global_step": 94849, "epoch": 783} {"train_loss": -37.455909729003906, "global_step": 94850, "epoch": 783} {"train_loss": -37.823856353759766, "global_step": 94851, "epoch": 783} {"train_loss": -37.58439254760742, "global_step": 94852, "epoch": 783} {"train_loss": -37.014747619628906, "global_step": 94853, "epoch": 783} {"train_loss": -36.96345901489258, "global_step": 94854, "epoch": 783} {"train_loss": -37.102603912353516, "global_step": 94855, "epoch": 783} {"train_loss": -36.98847198486328, "global_step": 94856, "epoch": 783} {"train_loss": -38.08134841918945, "global_step": 94857, "epoch": 783} {"train_loss": -36.194053649902344, "global_step": 94858, "epoch": 783} {"train_loss": -37.56795883178711, "global_step": 94859, "epoch": 783} {"train_loss": -37.28948974609375, "global_step": 94860, "epoch": 783} {"train_loss": -37.08930587768555, "global_step": 94861, "epoch": 783} {"train_loss": -37.29874801635742, "global_step": 94862, "epoch": 783} {"train_loss": -36.57971421549143, "global_step": 94863, "epoch": 783, "val_loss": 2559224.0} {"train_loss": -37.13480758666992, "global_step": 94864, "epoch": 784} {"train_loss": -38.23673629760742, "global_step": 94865, "epoch": 784} {"train_loss": -37.428955078125, "global_step": 94866, "epoch": 784} {"train_loss": -37.149574279785156, "global_step": 94867, "epoch": 784} {"train_loss": -37.767696380615234, "global_step": 94868, "epoch": 784} {"train_loss": -37.413753509521484, "global_step": 94869, "epoch": 784} {"train_loss": -37.45454025268555, "global_step": 94870, "epoch": 784} {"train_loss": -37.64306640625, "global_step": 94871, "epoch": 784} {"train_loss": -37.395145416259766, "global_step": 94872, "epoch": 784} {"train_loss": -37.60731887817383, "global_step": 94873, "epoch": 784} {"train_loss": -38.14922332763672, "global_step": 94874, "epoch": 784} {"train_loss": -37.9761962890625, "global_step": 94875, "epoch": 784} {"train_loss": -36.423221588134766, "global_step": 94876, "epoch": 784} {"train_loss": -37.437355041503906, "global_step": 94877, "epoch": 784} {"train_loss": -37.801937103271484, "global_step": 94878, "epoch": 784} {"train_loss": -37.089683532714844, "global_step": 94879, "epoch": 784} {"train_loss": -37.44553756713867, "global_step": 94880, "epoch": 784} {"train_loss": -37.936092376708984, "global_step": 94881, "epoch": 784} {"train_loss": -37.57344436645508, "global_step": 94882, "epoch": 784} {"train_loss": -38.54365158081055, "global_step": 94883, "epoch": 784} {"train_loss": -37.0986442565918, "global_step": 94884, "epoch": 784} {"train_loss": -38.119239807128906, "global_step": 94885, "epoch": 784} {"train_loss": -37.42662811279297, "global_step": 94886, "epoch": 784} {"train_loss": -38.03106689453125, "global_step": 94887, "epoch": 784} {"train_loss": -37.855037689208984, "global_step": 94888, "epoch": 784} {"train_loss": -37.39921188354492, "global_step": 94889, "epoch": 784} {"train_loss": -36.928707122802734, "global_step": 94890, "epoch": 784} {"train_loss": -37.8560676574707, "global_step": 94891, "epoch": 784} {"train_loss": -37.9356803894043, "global_step": 94892, "epoch": 784} {"train_loss": -38.02960968017578, "global_step": 94893, "epoch": 784} {"train_loss": -38.21198272705078, "global_step": 94894, "epoch": 784} {"train_loss": -37.9901123046875, "global_step": 94895, "epoch": 784} {"train_loss": -38.42343521118164, "global_step": 94896, "epoch": 784} {"train_loss": -38.3167724609375, "global_step": 94897, "epoch": 784} {"train_loss": -38.01676559448242, "global_step": 94898, "epoch": 784} {"train_loss": -37.78251266479492, "global_step": 94899, "epoch": 784} {"train_loss": -38.537513732910156, "global_step": 94900, "epoch": 784} {"train_loss": -38.09282684326172, "global_step": 94901, "epoch": 784} {"train_loss": -38.27321243286133, "global_step": 94902, "epoch": 784} {"train_loss": -38.178218841552734, "global_step": 94903, "epoch": 784} {"train_loss": -38.296852111816406, "global_step": 94904, "epoch": 784} {"train_loss": -38.17307662963867, "global_step": 94905, "epoch": 784} {"train_loss": -38.17406463623047, "global_step": 94906, "epoch": 784} {"train_loss": -38.02863311767578, "global_step": 94907, "epoch": 784} {"train_loss": -38.275325775146484, "global_step": 94908, "epoch": 784} {"train_loss": -37.51728820800781, "global_step": 94909, "epoch": 784} {"train_loss": -36.73198699951172, "global_step": 94910, "epoch": 784} {"train_loss": -38.56112289428711, "global_step": 94911, "epoch": 784} {"train_loss": -38.321651458740234, "global_step": 94912, "epoch": 784} {"train_loss": -38.4942741394043, "global_step": 94913, "epoch": 784} {"train_loss": -38.43841552734375, "global_step": 94914, "epoch": 784} {"train_loss": -39.16245651245117, "global_step": 94915, "epoch": 784} {"train_loss": -38.74271011352539, "global_step": 94916, "epoch": 784} {"train_loss": -37.42768859863281, "global_step": 94917, "epoch": 784} {"train_loss": -38.36994552612305, "global_step": 94918, "epoch": 784} {"train_loss": -38.25959777832031, "global_step": 94919, "epoch": 784} {"train_loss": -37.64704132080078, "global_step": 94920, "epoch": 784} {"train_loss": -37.943763732910156, "global_step": 94921, "epoch": 784} {"train_loss": -37.18860626220703, "global_step": 94922, "epoch": 784} {"train_loss": -36.15378952026367, "global_step": 94923, "epoch": 784} {"train_loss": -35.123565673828125, "global_step": 94924, "epoch": 784} {"train_loss": -31.93648338317871, "global_step": 94925, "epoch": 784} {"train_loss": -32.08578109741211, "global_step": 94926, "epoch": 784} {"train_loss": -36.224464416503906, "global_step": 94927, "epoch": 784} {"train_loss": -37.50924301147461, "global_step": 94928, "epoch": 784} {"train_loss": -36.199127197265625, "global_step": 94929, "epoch": 784} {"train_loss": -35.51163864135742, "global_step": 94930, "epoch": 784} {"train_loss": -37.67985153198242, "global_step": 94931, "epoch": 784} {"train_loss": -37.22693634033203, "global_step": 94932, "epoch": 784} {"train_loss": -36.46219253540039, "global_step": 94933, "epoch": 784} {"train_loss": -37.38374710083008, "global_step": 94934, "epoch": 784} {"train_loss": -37.756465911865234, "global_step": 94935, "epoch": 784} {"train_loss": -37.405067443847656, "global_step": 94936, "epoch": 784} {"train_loss": -37.3436393737793, "global_step": 94937, "epoch": 784} {"train_loss": -37.316593170166016, "global_step": 94938, "epoch": 784} {"train_loss": -38.258541107177734, "global_step": 94939, "epoch": 784} {"train_loss": -36.58005142211914, "global_step": 94940, "epoch": 784} {"train_loss": -37.7103385925293, "global_step": 94941, "epoch": 784} {"train_loss": -37.87709426879883, "global_step": 94942, "epoch": 784} {"train_loss": -37.55517578125, "global_step": 94943, "epoch": 784} {"train_loss": -37.262630462646484, "global_step": 94944, "epoch": 784} {"train_loss": -37.71955108642578, "global_step": 94945, "epoch": 784} {"train_loss": -38.476844787597656, "global_step": 94946, "epoch": 784} {"train_loss": -37.82548141479492, "global_step": 94947, "epoch": 784} {"train_loss": -38.21863555908203, "global_step": 94948, "epoch": 784} {"train_loss": -38.31747055053711, "global_step": 94949, "epoch": 784} {"train_loss": -37.73843002319336, "global_step": 94950, "epoch": 784} {"train_loss": -38.3054313659668, "global_step": 94951, "epoch": 784} {"train_loss": -38.648475646972656, "global_step": 94952, "epoch": 784} {"train_loss": -38.28915023803711, "global_step": 94953, "epoch": 784} {"train_loss": -38.3748664855957, "global_step": 94954, "epoch": 784} {"train_loss": -38.28842544555664, "global_step": 94955, "epoch": 784} {"train_loss": -38.62143325805664, "global_step": 94956, "epoch": 784} {"train_loss": -38.72262191772461, "global_step": 94957, "epoch": 784} {"train_loss": -38.642147064208984, "global_step": 94958, "epoch": 784} {"train_loss": -38.4930534362793, "global_step": 94959, "epoch": 784} {"train_loss": -37.65774154663086, "global_step": 94960, "epoch": 784} {"train_loss": -37.67926025390625, "global_step": 94961, "epoch": 784} {"train_loss": -38.42649459838867, "global_step": 94962, "epoch": 784} {"train_loss": -37.91679763793945, "global_step": 94963, "epoch": 784} {"train_loss": -38.94839096069336, "global_step": 94964, "epoch": 784} {"train_loss": -36.878047943115234, "global_step": 94965, "epoch": 784} {"train_loss": -37.93606185913086, "global_step": 94966, "epoch": 784} {"train_loss": -37.000160217285156, "global_step": 94967, "epoch": 784} {"train_loss": -38.02168655395508, "global_step": 94968, "epoch": 784} {"train_loss": -37.928279876708984, "global_step": 94969, "epoch": 784} {"train_loss": -38.351829528808594, "global_step": 94970, "epoch": 784} {"train_loss": -38.72184753417969, "global_step": 94971, "epoch": 784} {"train_loss": -38.47882843017578, "global_step": 94972, "epoch": 784} {"train_loss": -36.47092819213867, "global_step": 94973, "epoch": 784} {"train_loss": -35.38665008544922, "global_step": 94974, "epoch": 784} {"train_loss": -35.60206985473633, "global_step": 94975, "epoch": 784} {"train_loss": -37.48784255981445, "global_step": 94976, "epoch": 784} {"train_loss": -38.4774055480957, "global_step": 94977, "epoch": 784} {"train_loss": -37.4256706237793, "global_step": 94978, "epoch": 784} {"train_loss": -36.3873176574707, "global_step": 94979, "epoch": 784} {"train_loss": -38.53997039794922, "global_step": 94980, "epoch": 784} {"train_loss": -38.60895919799805, "global_step": 94981, "epoch": 784} {"train_loss": -37.33687210083008, "global_step": 94982, "epoch": 784} {"train_loss": -37.94785690307617, "global_step": 94983, "epoch": 784} {"train_loss": -37.64003212983943, "global_step": 94984, "epoch": 784, "val_loss": 2602668.0} {"train_loss": -37.33125686645508, "global_step": 94985, "epoch": 785} {"train_loss": -37.490875244140625, "global_step": 94986, "epoch": 785} {"train_loss": -38.80788040161133, "global_step": 94987, "epoch": 785} {"train_loss": -38.086910247802734, "global_step": 94988, "epoch": 785} {"train_loss": -39.04536819458008, "global_step": 94989, "epoch": 785} {"train_loss": -37.51235580444336, "global_step": 94990, "epoch": 785} {"train_loss": -38.55546188354492, "global_step": 94991, "epoch": 785} {"train_loss": -39.045623779296875, "global_step": 94992, "epoch": 785} {"train_loss": -38.49406814575195, "global_step": 94993, "epoch": 785} {"train_loss": -38.88629150390625, "global_step": 94994, "epoch": 785} {"train_loss": -38.512020111083984, "global_step": 94995, "epoch": 785} {"train_loss": -38.55451583862305, "global_step": 94996, "epoch": 785} {"train_loss": -38.04358673095703, "global_step": 94997, "epoch": 785} {"train_loss": -38.643768310546875, "global_step": 94998, "epoch": 785} {"train_loss": -38.983436584472656, "global_step": 94999, "epoch": 785} {"train_loss": -38.44451904296875, "global_step": 95000, "epoch": 785} {"train_loss": -38.997798919677734, "global_step": 95001, "epoch": 785} {"train_loss": -38.97510528564453, "global_step": 95002, "epoch": 785} {"train_loss": -38.918575286865234, "global_step": 95003, "epoch": 785} {"train_loss": -39.05885696411133, "global_step": 95004, "epoch": 785} {"train_loss": -38.92620849609375, "global_step": 95005, "epoch": 785} {"train_loss": -38.63459396362305, "global_step": 95006, "epoch": 785} {"train_loss": -38.79872512817383, "global_step": 95007, "epoch": 785} {"train_loss": -38.883460998535156, "global_step": 95008, "epoch": 785} {"train_loss": -38.93947982788086, "global_step": 95009, "epoch": 785} {"train_loss": -38.47522735595703, "global_step": 95010, "epoch": 785} {"train_loss": -39.1190299987793, "global_step": 95011, "epoch": 785} {"train_loss": -39.143310546875, "global_step": 95012, "epoch": 785} {"train_loss": -38.821102142333984, "global_step": 95013, "epoch": 785} {"train_loss": -39.48295974731445, "global_step": 95014, "epoch": 785} {"train_loss": -39.43708038330078, "global_step": 95015, "epoch": 785} {"train_loss": -39.06773376464844, "global_step": 95016, "epoch": 785} {"train_loss": -38.56120300292969, "global_step": 95017, "epoch": 785} {"train_loss": -38.77766799926758, "global_step": 95018, "epoch": 785} {"train_loss": -38.684539794921875, "global_step": 95019, "epoch": 785} {"train_loss": -39.03731918334961, "global_step": 95020, "epoch": 785} {"train_loss": -39.490821838378906, "global_step": 95021, "epoch": 785} {"train_loss": -38.689815521240234, "global_step": 95022, "epoch": 785} {"train_loss": -37.34177780151367, "global_step": 95023, "epoch": 785} {"train_loss": -38.3745231628418, "global_step": 95024, "epoch": 785} {"train_loss": -38.786834716796875, "global_step": 95025, "epoch": 785} {"train_loss": -37.170860290527344, "global_step": 95026, "epoch": 785} {"train_loss": -37.41872787475586, "global_step": 95027, "epoch": 785} {"train_loss": -38.26164245605469, "global_step": 95028, "epoch": 785} {"train_loss": -37.439353942871094, "global_step": 95029, "epoch": 785} {"train_loss": -37.6989631652832, "global_step": 95030, "epoch": 785} {"train_loss": -36.29610061645508, "global_step": 95031, "epoch": 785} {"train_loss": -37.499752044677734, "global_step": 95032, "epoch": 785} {"train_loss": -37.260379791259766, "global_step": 95033, "epoch": 785} {"train_loss": -36.1870231628418, "global_step": 95034, "epoch": 785} {"train_loss": -32.772823333740234, "global_step": 95035, "epoch": 785} {"train_loss": -34.68610382080078, "global_step": 95036, "epoch": 785} {"train_loss": -35.649810791015625, "global_step": 95037, "epoch": 785} {"train_loss": -35.503753662109375, "global_step": 95038, "epoch": 785} {"train_loss": -36.198524475097656, "global_step": 95039, "epoch": 785} {"train_loss": -34.76442337036133, "global_step": 95040, "epoch": 785} {"train_loss": -37.61933517456055, "global_step": 95041, "epoch": 785} {"train_loss": -34.81284713745117, "global_step": 95042, "epoch": 785} {"train_loss": -36.85081100463867, "global_step": 95043, "epoch": 785} {"train_loss": -37.808101654052734, "global_step": 95044, "epoch": 785} {"train_loss": -34.55898666381836, "global_step": 95045, "epoch": 785} {"train_loss": -37.83648681640625, "global_step": 95046, "epoch": 785} {"train_loss": -37.86506271362305, "global_step": 95047, "epoch": 785} {"train_loss": -37.414798736572266, "global_step": 95048, "epoch": 785} {"train_loss": -38.473167419433594, "global_step": 95049, "epoch": 785} {"train_loss": -37.43056106567383, "global_step": 95050, "epoch": 785} {"train_loss": -37.48752212524414, "global_step": 95051, "epoch": 785} {"train_loss": -37.796627044677734, "global_step": 95052, "epoch": 785} {"train_loss": -38.23630905151367, "global_step": 95053, "epoch": 785} {"train_loss": -37.95576095581055, "global_step": 95054, "epoch": 785} {"train_loss": -36.86769485473633, "global_step": 95055, "epoch": 785} {"train_loss": -37.862667083740234, "global_step": 95056, "epoch": 785} {"train_loss": -37.98604965209961, "global_step": 95057, "epoch": 785} {"train_loss": -37.96279525756836, "global_step": 95058, "epoch": 785} {"train_loss": -38.052345275878906, "global_step": 95059, "epoch": 785} {"train_loss": -38.81437683105469, "global_step": 95060, "epoch": 785} {"train_loss": -37.86048126220703, "global_step": 95061, "epoch": 785} {"train_loss": -38.99045944213867, "global_step": 95062, "epoch": 785} {"train_loss": -37.7460823059082, "global_step": 95063, "epoch": 785} {"train_loss": -38.2106819152832, "global_step": 95064, "epoch": 785} {"train_loss": -38.314876556396484, "global_step": 95065, "epoch": 785} {"train_loss": -38.40084457397461, "global_step": 95066, "epoch": 785} {"train_loss": -38.317440032958984, "global_step": 95067, "epoch": 785} {"train_loss": -38.464019775390625, "global_step": 95068, "epoch": 785} {"train_loss": -39.098670959472656, "global_step": 95069, "epoch": 785} {"train_loss": -38.96451950073242, "global_step": 95070, "epoch": 785} {"train_loss": -38.136444091796875, "global_step": 95071, "epoch": 785} {"train_loss": -38.56919479370117, "global_step": 95072, "epoch": 785} {"train_loss": -38.92287063598633, "global_step": 95073, "epoch": 785} {"train_loss": -38.65974807739258, "global_step": 95074, "epoch": 785} {"train_loss": -38.54954147338867, "global_step": 95075, "epoch": 785} {"train_loss": -39.04488754272461, "global_step": 95076, "epoch": 785} {"train_loss": -38.329132080078125, "global_step": 95077, "epoch": 785} {"train_loss": -38.259307861328125, "global_step": 95078, "epoch": 785} {"train_loss": -38.695804595947266, "global_step": 95079, "epoch": 785} {"train_loss": -38.9660530090332, "global_step": 95080, "epoch": 785} {"train_loss": -38.82878494262695, "global_step": 95081, "epoch": 785} {"train_loss": -38.33700180053711, "global_step": 95082, "epoch": 785} {"train_loss": -37.734256744384766, "global_step": 95083, "epoch": 785} {"train_loss": -38.346046447753906, "global_step": 95084, "epoch": 785} {"train_loss": -38.56763458251953, "global_step": 95085, "epoch": 785} {"train_loss": -37.73653793334961, "global_step": 95086, "epoch": 785} {"train_loss": -37.9641227722168, "global_step": 95087, "epoch": 785} {"train_loss": -37.31411361694336, "global_step": 95088, "epoch": 785} {"train_loss": -38.573848724365234, "global_step": 95089, "epoch": 785} {"train_loss": -38.902530670166016, "global_step": 95090, "epoch": 785} {"train_loss": -37.35327911376953, "global_step": 95091, "epoch": 785} {"train_loss": -34.194068908691406, "global_step": 95092, "epoch": 785} {"train_loss": -35.325740814208984, "global_step": 95093, "epoch": 785} {"train_loss": -38.40847396850586, "global_step": 95094, "epoch": 785} {"train_loss": -37.77291488647461, "global_step": 95095, "epoch": 785} {"train_loss": -37.14412307739258, "global_step": 95096, "epoch": 785} {"train_loss": -35.51752471923828, "global_step": 95097, "epoch": 785} {"train_loss": -36.69260787963867, "global_step": 95098, "epoch": 785} {"train_loss": -37.18232345581055, "global_step": 95099, "epoch": 785} {"train_loss": -37.26946258544922, "global_step": 95100, "epoch": 785} {"train_loss": -38.318389892578125, "global_step": 95101, "epoch": 785} {"train_loss": -37.96877670288086, "global_step": 95102, "epoch": 785} {"train_loss": -35.469505310058594, "global_step": 95103, "epoch": 785} {"train_loss": -38.016414642333984, "global_step": 95104, "epoch": 785} {"train_loss": -37.91582028727886, "global_step": 95105, "epoch": 785, "val_loss": 2565686.25} {"train_loss": -36.916236877441406, "global_step": 95106, "epoch": 786} {"train_loss": -38.181766510009766, "global_step": 95107, "epoch": 786} {"train_loss": -38.29311752319336, "global_step": 95108, "epoch": 786} {"train_loss": -38.08112335205078, "global_step": 95109, "epoch": 786} {"train_loss": -38.9184455871582, "global_step": 95110, "epoch": 786} {"train_loss": -37.13248062133789, "global_step": 95111, "epoch": 786} {"train_loss": -37.0887565612793, "global_step": 95112, "epoch": 786} {"train_loss": -38.62181854248047, "global_step": 95113, "epoch": 786} {"train_loss": -37.51225662231445, "global_step": 95114, "epoch": 786} {"train_loss": -38.455142974853516, "global_step": 95115, "epoch": 786} {"train_loss": -38.11001205444336, "global_step": 95116, "epoch": 786} {"train_loss": -37.606788635253906, "global_step": 95117, "epoch": 786} {"train_loss": -38.36197280883789, "global_step": 95118, "epoch": 786} {"train_loss": -36.91703414916992, "global_step": 95119, "epoch": 786} {"train_loss": -37.81174087524414, "global_step": 95120, "epoch": 786} {"train_loss": -37.90430450439453, "global_step": 95121, "epoch": 786} {"train_loss": -37.85112380981445, "global_step": 95122, "epoch": 786} {"train_loss": -39.17578887939453, "global_step": 95123, "epoch": 786} {"train_loss": -38.14899826049805, "global_step": 95124, "epoch": 786} {"train_loss": -38.54945755004883, "global_step": 95125, "epoch": 786} {"train_loss": -38.82316589355469, "global_step": 95126, "epoch": 786} {"train_loss": -38.1629524230957, "global_step": 95127, "epoch": 786} {"train_loss": -38.40983200073242, "global_step": 95128, "epoch": 786} {"train_loss": -38.578399658203125, "global_step": 95129, "epoch": 786} {"train_loss": -36.829952239990234, "global_step": 95130, "epoch": 786} {"train_loss": -38.22066116333008, "global_step": 95131, "epoch": 786} {"train_loss": -38.25080490112305, "global_step": 95132, "epoch": 786} {"train_loss": -37.8361701965332, "global_step": 95133, "epoch": 786} {"train_loss": -39.185543060302734, "global_step": 95134, "epoch": 786} {"train_loss": -38.54375457763672, "global_step": 95135, "epoch": 786} {"train_loss": -39.1893310546875, "global_step": 95136, "epoch": 786} {"train_loss": -38.475337982177734, "global_step": 95137, "epoch": 786} {"train_loss": -38.123748779296875, "global_step": 95138, "epoch": 786} {"train_loss": -38.728755950927734, "global_step": 95139, "epoch": 786} {"train_loss": -39.26932907104492, "global_step": 95140, "epoch": 786} {"train_loss": -38.44789505004883, "global_step": 95141, "epoch": 786} {"train_loss": -38.516456604003906, "global_step": 95142, "epoch": 786} {"train_loss": -35.27590560913086, "global_step": 95143, "epoch": 786} {"train_loss": -37.336822509765625, "global_step": 95144, "epoch": 786} {"train_loss": -38.25490951538086, "global_step": 95145, "epoch": 786} {"train_loss": -38.28169631958008, "global_step": 95146, "epoch": 786} {"train_loss": -37.42646408081055, "global_step": 95147, "epoch": 786} {"train_loss": -38.4407844543457, "global_step": 95148, "epoch": 786} {"train_loss": -38.3848991394043, "global_step": 95149, "epoch": 786} {"train_loss": -38.73982620239258, "global_step": 95150, "epoch": 786} {"train_loss": -38.867549896240234, "global_step": 95151, "epoch": 786} {"train_loss": -38.047698974609375, "global_step": 95152, "epoch": 786} {"train_loss": -37.35667037963867, "global_step": 95153, "epoch": 786} {"train_loss": -38.277870178222656, "global_step": 95154, "epoch": 786} {"train_loss": -38.71467971801758, "global_step": 95155, "epoch": 786} {"train_loss": -38.47920608520508, "global_step": 95156, "epoch": 786} {"train_loss": -38.949649810791016, "global_step": 95157, "epoch": 786} {"train_loss": -38.76978302001953, "global_step": 95158, "epoch": 786} {"train_loss": -38.25797653198242, "global_step": 95159, "epoch": 786} {"train_loss": -38.220638275146484, "global_step": 95160, "epoch": 786} {"train_loss": -38.20600509643555, "global_step": 95161, "epoch": 786} {"train_loss": -37.64841842651367, "global_step": 95162, "epoch": 786} {"train_loss": -38.30392074584961, "global_step": 95163, "epoch": 786} {"train_loss": -38.373470306396484, "global_step": 95164, "epoch": 786} {"train_loss": -38.53456115722656, "global_step": 95165, "epoch": 786} {"train_loss": -37.580562591552734, "global_step": 95166, "epoch": 786} {"train_loss": -38.87946701049805, "global_step": 95167, "epoch": 786} {"train_loss": -38.40654754638672, "global_step": 95168, "epoch": 786} {"train_loss": -37.79726028442383, "global_step": 95169, "epoch": 786} {"train_loss": -37.35097885131836, "global_step": 95170, "epoch": 786} {"train_loss": -37.65635299682617, "global_step": 95171, "epoch": 786} {"train_loss": -38.60552215576172, "global_step": 95172, "epoch": 786} {"train_loss": -38.012115478515625, "global_step": 95173, "epoch": 786} {"train_loss": -38.5743522644043, "global_step": 95174, "epoch": 786} {"train_loss": -35.5761604309082, "global_step": 95175, "epoch": 786} {"train_loss": -38.35254669189453, "global_step": 95176, "epoch": 786} {"train_loss": -36.463905334472656, "global_step": 95177, "epoch": 786} {"train_loss": -36.266719818115234, "global_step": 95178, "epoch": 786} {"train_loss": -36.931549072265625, "global_step": 95179, "epoch": 786} {"train_loss": -37.75606155395508, "global_step": 95180, "epoch": 786} {"train_loss": -37.98774337768555, "global_step": 95181, "epoch": 786} {"train_loss": -35.27011489868164, "global_step": 95182, "epoch": 786} {"train_loss": -36.19932174682617, "global_step": 95183, "epoch": 786} {"train_loss": -35.17372131347656, "global_step": 95184, "epoch": 786} {"train_loss": -33.20485305786133, "global_step": 95185, "epoch": 786} {"train_loss": -34.64741134643555, "global_step": 95186, "epoch": 786} {"train_loss": -36.0447883605957, "global_step": 95187, "epoch": 786} {"train_loss": -36.99231719970703, "global_step": 95188, "epoch": 786} {"train_loss": -35.105979919433594, "global_step": 95189, "epoch": 786} {"train_loss": -37.3038444519043, "global_step": 95190, "epoch": 786} {"train_loss": -36.69173049926758, "global_step": 95191, "epoch": 786} {"train_loss": -37.00956344604492, "global_step": 95192, "epoch": 786} {"train_loss": -36.15407943725586, "global_step": 95193, "epoch": 786} {"train_loss": -37.079193115234375, "global_step": 95194, "epoch": 786} {"train_loss": -37.2642707824707, "global_step": 95195, "epoch": 786} {"train_loss": -37.69814682006836, "global_step": 95196, "epoch": 786} {"train_loss": -35.888607025146484, "global_step": 95197, "epoch": 786} {"train_loss": -35.628807067871094, "global_step": 95198, "epoch": 786} {"train_loss": -36.758460998535156, "global_step": 95199, "epoch": 786} {"train_loss": -37.06891632080078, "global_step": 95200, "epoch": 786} {"train_loss": -32.152889251708984, "global_step": 95201, "epoch": 786} {"train_loss": -35.14304733276367, "global_step": 95202, "epoch": 786} {"train_loss": -35.68067169189453, "global_step": 95203, "epoch": 786} {"train_loss": -36.74162292480469, "global_step": 95204, "epoch": 786} {"train_loss": -36.5804328918457, "global_step": 95205, "epoch": 786} {"train_loss": -36.20988464355469, "global_step": 95206, "epoch": 786} {"train_loss": -34.660560607910156, "global_step": 95207, "epoch": 786} {"train_loss": -37.40704345703125, "global_step": 95208, "epoch": 786} {"train_loss": -35.3977165222168, "global_step": 95209, "epoch": 786} {"train_loss": -35.3889274597168, "global_step": 95210, "epoch": 786} {"train_loss": -37.37452697753906, "global_step": 95211, "epoch": 786} {"train_loss": -36.98525619506836, "global_step": 95212, "epoch": 786} {"train_loss": -37.920345306396484, "global_step": 95213, "epoch": 786} {"train_loss": -36.97572326660156, "global_step": 95214, "epoch": 786} {"train_loss": -36.451961517333984, "global_step": 95215, "epoch": 786} {"train_loss": -36.48232650756836, "global_step": 95216, "epoch": 786} {"train_loss": -36.321712493896484, "global_step": 95217, "epoch": 786} {"train_loss": -35.504207611083984, "global_step": 95218, "epoch": 786} {"train_loss": -37.26753234863281, "global_step": 95219, "epoch": 786} {"train_loss": -35.580135345458984, "global_step": 95220, "epoch": 786} {"train_loss": -36.888816833496094, "global_step": 95221, "epoch": 786} {"train_loss": -36.49190902709961, "global_step": 95222, "epoch": 786} {"train_loss": -37.69855880737305, "global_step": 95223, "epoch": 786} {"train_loss": -36.14365768432617, "global_step": 95224, "epoch": 786} {"train_loss": -37.129737854003906, "global_step": 95225, "epoch": 786} {"train_loss": -37.38411545556439, "global_step": 95226, "epoch": 786, "val_loss": 2601972.25} {"train_loss": -37.18227005004883, "global_step": 95227, "epoch": 787} {"train_loss": -37.83769607543945, "global_step": 95228, "epoch": 787} {"train_loss": -36.87663650512695, "global_step": 95229, "epoch": 787} {"train_loss": -38.08746337890625, "global_step": 95230, "epoch": 787} {"train_loss": -36.27206039428711, "global_step": 95231, "epoch": 787} {"train_loss": -38.10498809814453, "global_step": 95232, "epoch": 787} {"train_loss": -37.74653244018555, "global_step": 95233, "epoch": 787} {"train_loss": -37.290771484375, "global_step": 95234, "epoch": 787} {"train_loss": -37.3056640625, "global_step": 95235, "epoch": 787} {"train_loss": -37.46284103393555, "global_step": 95236, "epoch": 787} {"train_loss": -37.89228057861328, "global_step": 95237, "epoch": 787} {"train_loss": -37.43476486206055, "global_step": 95238, "epoch": 787} {"train_loss": -37.68284225463867, "global_step": 95239, "epoch": 787} {"train_loss": -37.958839416503906, "global_step": 95240, "epoch": 787} {"train_loss": -38.084102630615234, "global_step": 95241, "epoch": 787} {"train_loss": -38.07322692871094, "global_step": 95242, "epoch": 787} {"train_loss": -37.95415115356445, "global_step": 95243, "epoch": 787} {"train_loss": -37.84052658081055, "global_step": 95244, "epoch": 787} {"train_loss": -38.00880813598633, "global_step": 95245, "epoch": 787} {"train_loss": -38.3687629699707, "global_step": 95246, "epoch": 787} {"train_loss": -38.55485153198242, "global_step": 95247, "epoch": 787} {"train_loss": -38.88904571533203, "global_step": 95248, "epoch": 787} {"train_loss": -38.07394027709961, "global_step": 95249, "epoch": 787} {"train_loss": -38.39447021484375, "global_step": 95250, "epoch": 787} {"train_loss": -38.51908493041992, "global_step": 95251, "epoch": 787} {"train_loss": -36.866878509521484, "global_step": 95252, "epoch": 787} {"train_loss": -38.039222717285156, "global_step": 95253, "epoch": 787} {"train_loss": -38.04618453979492, "global_step": 95254, "epoch": 787} {"train_loss": -37.32733917236328, "global_step": 95255, "epoch": 787} {"train_loss": -37.38650131225586, "global_step": 95256, "epoch": 787} {"train_loss": -37.998538970947266, "global_step": 95257, "epoch": 787} {"train_loss": -38.24591064453125, "global_step": 95258, "epoch": 787} {"train_loss": -38.58858108520508, "global_step": 95259, "epoch": 787} {"train_loss": -38.93152618408203, "global_step": 95260, "epoch": 787} {"train_loss": -38.62301254272461, "global_step": 95261, "epoch": 787} {"train_loss": -37.98214340209961, "global_step": 95262, "epoch": 787} {"train_loss": -38.375579833984375, "global_step": 95263, "epoch": 787} {"train_loss": -38.06974411010742, "global_step": 95264, "epoch": 787} {"train_loss": -38.7290153503418, "global_step": 95265, "epoch": 787} {"train_loss": -38.51369857788086, "global_step": 95266, "epoch": 787} {"train_loss": -37.72530746459961, "global_step": 95267, "epoch": 787} {"train_loss": -35.80385208129883, "global_step": 95268, "epoch": 787} {"train_loss": -38.8126335144043, "global_step": 95269, "epoch": 787} {"train_loss": -37.41209030151367, "global_step": 95270, "epoch": 787} {"train_loss": -38.32373046875, "global_step": 95271, "epoch": 787} {"train_loss": -38.309207916259766, "global_step": 95272, "epoch": 787} {"train_loss": -37.68000030517578, "global_step": 95273, "epoch": 787} {"train_loss": -37.14834213256836, "global_step": 95274, "epoch": 787} {"train_loss": -37.430477142333984, "global_step": 95275, "epoch": 787} {"train_loss": -38.185115814208984, "global_step": 95276, "epoch": 787} {"train_loss": -38.7235221862793, "global_step": 95277, "epoch": 787} {"train_loss": -38.43503952026367, "global_step": 95278, "epoch": 787} {"train_loss": -37.462886810302734, "global_step": 95279, "epoch": 787} {"train_loss": -37.85593795776367, "global_step": 95280, "epoch": 787} {"train_loss": -38.57013702392578, "global_step": 95281, "epoch": 787} {"train_loss": -38.8149299621582, "global_step": 95282, "epoch": 787} {"train_loss": -37.81340408325195, "global_step": 95283, "epoch": 787} {"train_loss": -37.980926513671875, "global_step": 95284, "epoch": 787} {"train_loss": -37.48383331298828, "global_step": 95285, "epoch": 787} {"train_loss": -38.35105514526367, "global_step": 95286, "epoch": 787} {"train_loss": -37.51520919799805, "global_step": 95287, "epoch": 787} {"train_loss": -37.35149002075195, "global_step": 95288, "epoch": 787} {"train_loss": -38.209877014160156, "global_step": 95289, "epoch": 787} {"train_loss": -38.48288345336914, "global_step": 95290, "epoch": 787} {"train_loss": -38.051361083984375, "global_step": 95291, "epoch": 787} {"train_loss": -38.014705657958984, "global_step": 95292, "epoch": 787} {"train_loss": -38.709197998046875, "global_step": 95293, "epoch": 787} {"train_loss": -39.12964630126953, "global_step": 95294, "epoch": 787} {"train_loss": -38.573692321777344, "global_step": 95295, "epoch": 787} {"train_loss": -37.64210891723633, "global_step": 95296, "epoch": 787} {"train_loss": -37.495941162109375, "global_step": 95297, "epoch": 787} {"train_loss": -38.02865219116211, "global_step": 95298, "epoch": 787} {"train_loss": -38.50617218017578, "global_step": 95299, "epoch": 787} {"train_loss": -38.1478271484375, "global_step": 95300, "epoch": 787} {"train_loss": -37.850624084472656, "global_step": 95301, "epoch": 787} {"train_loss": -36.19480514526367, "global_step": 95302, "epoch": 787} {"train_loss": -38.970733642578125, "global_step": 95303, "epoch": 787} {"train_loss": -38.4500617980957, "global_step": 95304, "epoch": 787} {"train_loss": -38.271976470947266, "global_step": 95305, "epoch": 787} {"train_loss": -35.77096176147461, "global_step": 95306, "epoch": 787} {"train_loss": -38.08395004272461, "global_step": 95307, "epoch": 787} {"train_loss": -38.69893264770508, "global_step": 95308, "epoch": 787} {"train_loss": -36.40328598022461, "global_step": 95309, "epoch": 787} {"train_loss": -36.82700729370117, "global_step": 95310, "epoch": 787} {"train_loss": -38.2454719543457, "global_step": 95311, "epoch": 787} {"train_loss": -38.78935623168945, "global_step": 95312, "epoch": 787} {"train_loss": -38.20121383666992, "global_step": 95313, "epoch": 787} {"train_loss": -36.310115814208984, "global_step": 95314, "epoch": 787} {"train_loss": -38.1982536315918, "global_step": 95315, "epoch": 787} {"train_loss": -36.03286361694336, "global_step": 95316, "epoch": 787} {"train_loss": -36.69612121582031, "global_step": 95317, "epoch": 787} {"train_loss": -26.32680320739746, "global_step": 95318, "epoch": 787} {"train_loss": -35.191585540771484, "global_step": 95319, "epoch": 787} {"train_loss": -36.04026412963867, "global_step": 95320, "epoch": 787} {"train_loss": -36.88711166381836, "global_step": 95321, "epoch": 787} {"train_loss": -35.715606689453125, "global_step": 95322, "epoch": 787} {"train_loss": -33.879112243652344, "global_step": 95323, "epoch": 787} {"train_loss": -35.26599884033203, "global_step": 95324, "epoch": 787} {"train_loss": -37.20488357543945, "global_step": 95325, "epoch": 787} {"train_loss": -31.981037139892578, "global_step": 95326, "epoch": 787} {"train_loss": -28.974573135375977, "global_step": 95327, "epoch": 787} {"train_loss": -35.24090576171875, "global_step": 95328, "epoch": 787} {"train_loss": -37.537166595458984, "global_step": 95329, "epoch": 787} {"train_loss": -35.57126998901367, "global_step": 95330, "epoch": 787} {"train_loss": -33.57865524291992, "global_step": 95331, "epoch": 787} {"train_loss": -33.499568939208984, "global_step": 95332, "epoch": 787} {"train_loss": -34.6136589050293, "global_step": 95333, "epoch": 787} {"train_loss": -33.98068618774414, "global_step": 95334, "epoch": 787} {"train_loss": -33.9915657043457, "global_step": 95335, "epoch": 787} {"train_loss": -35.98047637939453, "global_step": 95336, "epoch": 787} {"train_loss": -35.95332717895508, "global_step": 95337, "epoch": 787} {"train_loss": -32.34133529663086, "global_step": 95338, "epoch": 787} {"train_loss": -34.084529876708984, "global_step": 95339, "epoch": 787} {"train_loss": -33.06681442260742, "global_step": 95340, "epoch": 787} {"train_loss": -36.686031341552734, "global_step": 95341, "epoch": 787} {"train_loss": -35.79317855834961, "global_step": 95342, "epoch": 787} {"train_loss": -33.59756851196289, "global_step": 95343, "epoch": 787} {"train_loss": -37.22451400756836, "global_step": 95344, "epoch": 787} {"train_loss": -36.953243255615234, "global_step": 95345, "epoch": 787} {"train_loss": -34.63662338256836, "global_step": 95346, "epoch": 787} {"train_loss": -37.0666940547218, "global_step": 95347, "epoch": 787, "val_loss": 2432171.25} {"train_loss": -36.05552291870117, "global_step": 95348, "epoch": 788} {"train_loss": -36.86312484741211, "global_step": 95349, "epoch": 788} {"train_loss": -36.906341552734375, "global_step": 95350, "epoch": 788} {"train_loss": -35.74272537231445, "global_step": 95351, "epoch": 788} {"train_loss": -36.209022521972656, "global_step": 95352, "epoch": 788} {"train_loss": -35.50373840332031, "global_step": 95353, "epoch": 788} {"train_loss": -31.547582626342773, "global_step": 95354, "epoch": 788} {"train_loss": -34.889278411865234, "global_step": 95355, "epoch": 788} {"train_loss": -33.90113067626953, "global_step": 95356, "epoch": 788} {"train_loss": -35.19880294799805, "global_step": 95357, "epoch": 788} {"train_loss": -34.20182418823242, "global_step": 95358, "epoch": 788} {"train_loss": -36.11373519897461, "global_step": 95359, "epoch": 788} {"train_loss": -35.1970100402832, "global_step": 95360, "epoch": 788} {"train_loss": -36.8625602722168, "global_step": 95361, "epoch": 788} {"train_loss": -36.45041275024414, "global_step": 95362, "epoch": 788} {"train_loss": -36.95716094970703, "global_step": 95363, "epoch": 788} {"train_loss": -36.46562194824219, "global_step": 95364, "epoch": 788} {"train_loss": -36.26527786254883, "global_step": 95365, "epoch": 788} {"train_loss": -35.685115814208984, "global_step": 95366, "epoch": 788} {"train_loss": -35.35276794433594, "global_step": 95367, "epoch": 788} {"train_loss": -37.075252532958984, "global_step": 95368, "epoch": 788} {"train_loss": -37.33204650878906, "global_step": 95369, "epoch": 788} {"train_loss": -35.76820755004883, "global_step": 95370, "epoch": 788} {"train_loss": -37.22444152832031, "global_step": 95371, "epoch": 788} {"train_loss": -36.966278076171875, "global_step": 95372, "epoch": 788} {"train_loss": -36.239444732666016, "global_step": 95373, "epoch": 788} {"train_loss": -36.56193923950195, "global_step": 95374, "epoch": 788} {"train_loss": -37.5178337097168, "global_step": 95375, "epoch": 788} {"train_loss": -36.031227111816406, "global_step": 95376, "epoch": 788} {"train_loss": -36.184608459472656, "global_step": 95377, "epoch": 788} {"train_loss": -37.42644500732422, "global_step": 95378, "epoch": 788} {"train_loss": -37.14458084106445, "global_step": 95379, "epoch": 788} {"train_loss": -37.37044143676758, "global_step": 95380, "epoch": 788} {"train_loss": -36.89448928833008, "global_step": 95381, "epoch": 788} {"train_loss": -37.7831916809082, "global_step": 95382, "epoch": 788} {"train_loss": -37.84609603881836, "global_step": 95383, "epoch": 788} {"train_loss": -37.4256706237793, "global_step": 95384, "epoch": 788} {"train_loss": -37.75551986694336, "global_step": 95385, "epoch": 788} {"train_loss": -37.57908248901367, "global_step": 95386, "epoch": 788} {"train_loss": -37.456756591796875, "global_step": 95387, "epoch": 788} {"train_loss": -37.67753601074219, "global_step": 95388, "epoch": 788} {"train_loss": -37.91355895996094, "global_step": 95389, "epoch": 788} {"train_loss": -35.90023422241211, "global_step": 95390, "epoch": 788} {"train_loss": -38.156402587890625, "global_step": 95391, "epoch": 788} {"train_loss": -37.35454559326172, "global_step": 95392, "epoch": 788} {"train_loss": -37.928070068359375, "global_step": 95393, "epoch": 788} {"train_loss": -37.85642623901367, "global_step": 95394, "epoch": 788} {"train_loss": -37.5024528503418, "global_step": 95395, "epoch": 788} {"train_loss": -37.40824890136719, "global_step": 95396, "epoch": 788} {"train_loss": -38.0736083984375, "global_step": 95397, "epoch": 788} {"train_loss": -38.208900451660156, "global_step": 95398, "epoch": 788} {"train_loss": -37.731685638427734, "global_step": 95399, "epoch": 788} {"train_loss": -38.311580657958984, "global_step": 95400, "epoch": 788} {"train_loss": -37.703975677490234, "global_step": 95401, "epoch": 788} {"train_loss": -38.516212463378906, "global_step": 95402, "epoch": 788} {"train_loss": -37.95870590209961, "global_step": 95403, "epoch": 788} {"train_loss": -37.3193473815918, "global_step": 95404, "epoch": 788} {"train_loss": -38.05062484741211, "global_step": 95405, "epoch": 788} {"train_loss": -37.596405029296875, "global_step": 95406, "epoch": 788} {"train_loss": -38.630516052246094, "global_step": 95407, "epoch": 788} {"train_loss": -36.65327072143555, "global_step": 95408, "epoch": 788} {"train_loss": -36.76392364501953, "global_step": 95409, "epoch": 788} {"train_loss": -37.411800384521484, "global_step": 95410, "epoch": 788} {"train_loss": -38.22075271606445, "global_step": 95411, "epoch": 788} {"train_loss": -38.3903923034668, "global_step": 95412, "epoch": 788} {"train_loss": -38.25309371948242, "global_step": 95413, "epoch": 788} {"train_loss": -38.12723922729492, "global_step": 95414, "epoch": 788} {"train_loss": -38.27687454223633, "global_step": 95415, "epoch": 788} {"train_loss": -38.78325271606445, "global_step": 95416, "epoch": 788} {"train_loss": -38.661190032958984, "global_step": 95417, "epoch": 788} {"train_loss": -38.508235931396484, "global_step": 95418, "epoch": 788} {"train_loss": -38.915374755859375, "global_step": 95419, "epoch": 788} {"train_loss": -38.00440979003906, "global_step": 95420, "epoch": 788} {"train_loss": -38.95840072631836, "global_step": 95421, "epoch": 788} {"train_loss": -37.957740783691406, "global_step": 95422, "epoch": 788} {"train_loss": -38.89578628540039, "global_step": 95423, "epoch": 788} {"train_loss": -38.55374526977539, "global_step": 95424, "epoch": 788} {"train_loss": -39.05235290527344, "global_step": 95425, "epoch": 788} {"train_loss": -38.39023971557617, "global_step": 95426, "epoch": 788} {"train_loss": -39.0729866027832, "global_step": 95427, "epoch": 788} {"train_loss": -38.06795120239258, "global_step": 95428, "epoch": 788} {"train_loss": -37.98490524291992, "global_step": 95429, "epoch": 788} {"train_loss": -37.64448928833008, "global_step": 95430, "epoch": 788} {"train_loss": -38.8997917175293, "global_step": 95431, "epoch": 788} {"train_loss": -38.90694046020508, "global_step": 95432, "epoch": 788} {"train_loss": -38.61379623413086, "global_step": 95433, "epoch": 788} {"train_loss": -37.40082931518555, "global_step": 95434, "epoch": 788} {"train_loss": -33.69489288330078, "global_step": 95435, "epoch": 788} {"train_loss": -26.384958267211914, "global_step": 95436, "epoch": 788} {"train_loss": -20.783498764038086, "global_step": 95437, "epoch": 788} {"train_loss": -19.477811813354492, "global_step": 95438, "epoch": 788} {"train_loss": -33.1004638671875, "global_step": 95439, "epoch": 788} {"train_loss": -32.13554000854492, "global_step": 95440, "epoch": 788} {"train_loss": -30.3266544342041, "global_step": 95441, "epoch": 788} {"train_loss": -36.48530960083008, "global_step": 95442, "epoch": 788} {"train_loss": -33.08749771118164, "global_step": 95443, "epoch": 788} {"train_loss": -37.23084259033203, "global_step": 95444, "epoch": 788} {"train_loss": -32.331756591796875, "global_step": 95445, "epoch": 788} {"train_loss": -37.979225158691406, "global_step": 95446, "epoch": 788} {"train_loss": -35.31226348876953, "global_step": 95447, "epoch": 788} {"train_loss": -36.959144592285156, "global_step": 95448, "epoch": 788} {"train_loss": -35.878761291503906, "global_step": 95449, "epoch": 788} {"train_loss": -35.79229736328125, "global_step": 95450, "epoch": 788} {"train_loss": -37.507728576660156, "global_step": 95451, "epoch": 788} {"train_loss": -36.50948715209961, "global_step": 95452, "epoch": 788} {"train_loss": -36.562095642089844, "global_step": 95453, "epoch": 788} {"train_loss": -36.998470306396484, "global_step": 95454, "epoch": 788} {"train_loss": -36.981563568115234, "global_step": 95455, "epoch": 788} {"train_loss": -36.348907470703125, "global_step": 95456, "epoch": 788} {"train_loss": -37.90526580810547, "global_step": 95457, "epoch": 788} {"train_loss": -37.07533264160156, "global_step": 95458, "epoch": 788} {"train_loss": -38.3237419128418, "global_step": 95459, "epoch": 788} {"train_loss": -37.10907745361328, "global_step": 95460, "epoch": 788} {"train_loss": -37.62477493286133, "global_step": 95461, "epoch": 788} {"train_loss": -37.332672119140625, "global_step": 95462, "epoch": 788} {"train_loss": -38.27045440673828, "global_step": 95463, "epoch": 788} {"train_loss": -37.374019622802734, "global_step": 95464, "epoch": 788} {"train_loss": -37.502193450927734, "global_step": 95465, "epoch": 788} {"train_loss": -37.81159591674805, "global_step": 95466, "epoch": 788} {"train_loss": -38.02016067504883, "global_step": 95467, "epoch": 788} {"train_loss": -36.631526206150525, "global_step": 95468, "epoch": 788, "val_loss": 2558605.25} {"train_loss": -37.63314437866211, "global_step": 95469, "epoch": 789} {"train_loss": -35.59220504760742, "global_step": 95470, "epoch": 789} {"train_loss": -37.071109771728516, "global_step": 95471, "epoch": 789} {"train_loss": -37.517669677734375, "global_step": 95472, "epoch": 789} {"train_loss": -37.744529724121094, "global_step": 95473, "epoch": 789} {"train_loss": -38.237281799316406, "global_step": 95474, "epoch": 789} {"train_loss": -38.148616790771484, "global_step": 95475, "epoch": 789} {"train_loss": -38.056339263916016, "global_step": 95476, "epoch": 789} {"train_loss": -38.373291015625, "global_step": 95477, "epoch": 789} {"train_loss": -37.97162628173828, "global_step": 95478, "epoch": 789} {"train_loss": -37.8847541809082, "global_step": 95479, "epoch": 789} {"train_loss": -38.31509017944336, "global_step": 95480, "epoch": 789} {"train_loss": -38.223915100097656, "global_step": 95481, "epoch": 789} {"train_loss": -38.513179779052734, "global_step": 95482, "epoch": 789} {"train_loss": -38.58280563354492, "global_step": 95483, "epoch": 789} {"train_loss": -36.747798919677734, "global_step": 95484, "epoch": 789} {"train_loss": -38.68561553955078, "global_step": 95485, "epoch": 789} {"train_loss": -38.366485595703125, "global_step": 95486, "epoch": 789} {"train_loss": -38.32461929321289, "global_step": 95487, "epoch": 789} {"train_loss": -36.955257415771484, "global_step": 95488, "epoch": 789} {"train_loss": -38.392250061035156, "global_step": 95489, "epoch": 789} {"train_loss": -38.04337692260742, "global_step": 95490, "epoch": 789} {"train_loss": -38.3743896484375, "global_step": 95491, "epoch": 789} {"train_loss": -37.201717376708984, "global_step": 95492, "epoch": 789} {"train_loss": -31.442487716674805, "global_step": 95493, "epoch": 789} {"train_loss": -22.534337997436523, "global_step": 95494, "epoch": 789} {"train_loss": -19.423118591308594, "global_step": 95495, "epoch": 789} {"train_loss": -32.28912353515625, "global_step": 95496, "epoch": 789} {"train_loss": -32.96243667602539, "global_step": 95497, "epoch": 789} {"train_loss": -22.472890853881836, "global_step": 95498, "epoch": 789} {"train_loss": -33.08799362182617, "global_step": 95499, "epoch": 789} {"train_loss": -30.65627098083496, "global_step": 95500, "epoch": 789} {"train_loss": -33.963531494140625, "global_step": 95501, "epoch": 789} {"train_loss": -30.65337562561035, "global_step": 95502, "epoch": 789} {"train_loss": -35.254459381103516, "global_step": 95503, "epoch": 789} {"train_loss": -31.214658737182617, "global_step": 95504, "epoch": 789} {"train_loss": -36.54443359375, "global_step": 95505, "epoch": 789} {"train_loss": -32.62842559814453, "global_step": 95506, "epoch": 789} {"train_loss": -35.41175079345703, "global_step": 95507, "epoch": 789} {"train_loss": -33.59795379638672, "global_step": 95508, "epoch": 789} {"train_loss": -35.105411529541016, "global_step": 95509, "epoch": 789} {"train_loss": -35.2751579284668, "global_step": 95510, "epoch": 789} {"train_loss": -34.85669708251953, "global_step": 95511, "epoch": 789} {"train_loss": -35.7398567199707, "global_step": 95512, "epoch": 789} {"train_loss": -36.22807693481445, "global_step": 95513, "epoch": 789} {"train_loss": -34.792537689208984, "global_step": 95514, "epoch": 789} {"train_loss": -36.141597747802734, "global_step": 95515, "epoch": 789} {"train_loss": -36.79499053955078, "global_step": 95516, "epoch": 789} {"train_loss": -36.25996017456055, "global_step": 95517, "epoch": 789} {"train_loss": -36.183040618896484, "global_step": 95518, "epoch": 789} {"train_loss": -35.87641143798828, "global_step": 95519, "epoch": 789} {"train_loss": -36.68939208984375, "global_step": 95520, "epoch": 789} {"train_loss": -36.92979049682617, "global_step": 95521, "epoch": 789} {"train_loss": -36.62588119506836, "global_step": 95522, "epoch": 789} {"train_loss": -37.03968048095703, "global_step": 95523, "epoch": 789} {"train_loss": -37.080482482910156, "global_step": 95524, "epoch": 789} {"train_loss": -36.386619567871094, "global_step": 95525, "epoch": 789} {"train_loss": -37.50154495239258, "global_step": 95526, "epoch": 789} {"train_loss": -36.531654357910156, "global_step": 95527, "epoch": 789} {"train_loss": -36.29379653930664, "global_step": 95528, "epoch": 789} {"train_loss": -36.2443962097168, "global_step": 95529, "epoch": 789} {"train_loss": -37.52235794067383, "global_step": 95530, "epoch": 789} {"train_loss": -37.072139739990234, "global_step": 95531, "epoch": 789} {"train_loss": -37.8717155456543, "global_step": 95532, "epoch": 789} {"train_loss": -37.4140510559082, "global_step": 95533, "epoch": 789} {"train_loss": -34.57328796386719, "global_step": 95534, "epoch": 789} {"train_loss": -36.63154220581055, "global_step": 95535, "epoch": 789} {"train_loss": -36.70675277709961, "global_step": 95536, "epoch": 789} {"train_loss": -36.08164596557617, "global_step": 95537, "epoch": 789} {"train_loss": -36.992645263671875, "global_step": 95538, "epoch": 789} {"train_loss": -36.880889892578125, "global_step": 95539, "epoch": 789} {"train_loss": -37.489253997802734, "global_step": 95540, "epoch": 789} {"train_loss": -37.899017333984375, "global_step": 95541, "epoch": 789} {"train_loss": -36.91486740112305, "global_step": 95542, "epoch": 789} {"train_loss": -36.402626037597656, "global_step": 95543, "epoch": 789} {"train_loss": -36.275611877441406, "global_step": 95544, "epoch": 789} {"train_loss": -37.25092697143555, "global_step": 95545, "epoch": 789} {"train_loss": -35.83120346069336, "global_step": 95546, "epoch": 789} {"train_loss": -37.263824462890625, "global_step": 95547, "epoch": 789} {"train_loss": -37.50006103515625, "global_step": 95548, "epoch": 789} {"train_loss": -37.928218841552734, "global_step": 95549, "epoch": 789} {"train_loss": -37.60551071166992, "global_step": 95550, "epoch": 789} {"train_loss": -35.80507278442383, "global_step": 95551, "epoch": 789} {"train_loss": -36.24788284301758, "global_step": 95552, "epoch": 789} {"train_loss": -35.54594039916992, "global_step": 95553, "epoch": 789} {"train_loss": -35.83668899536133, "global_step": 95554, "epoch": 789} {"train_loss": -37.059967041015625, "global_step": 95555, "epoch": 789} {"train_loss": -36.7904167175293, "global_step": 95556, "epoch": 789} {"train_loss": -36.0803337097168, "global_step": 95557, "epoch": 789} {"train_loss": -37.160743713378906, "global_step": 95558, "epoch": 789} {"train_loss": -37.45671463012695, "global_step": 95559, "epoch": 789} {"train_loss": -37.347755432128906, "global_step": 95560, "epoch": 789} {"train_loss": -37.301143646240234, "global_step": 95561, "epoch": 789} {"train_loss": -37.15753173828125, "global_step": 95562, "epoch": 789} {"train_loss": -36.3220329284668, "global_step": 95563, "epoch": 789} {"train_loss": -36.556976318359375, "global_step": 95564, "epoch": 789} {"train_loss": -37.12123107910156, "global_step": 95565, "epoch": 789} {"train_loss": -36.54465866088867, "global_step": 95566, "epoch": 789} {"train_loss": -37.20676803588867, "global_step": 95567, "epoch": 789} {"train_loss": -37.252899169921875, "global_step": 95568, "epoch": 789} {"train_loss": -37.559051513671875, "global_step": 95569, "epoch": 789} {"train_loss": -37.54977798461914, "global_step": 95570, "epoch": 789} {"train_loss": -36.83187484741211, "global_step": 95571, "epoch": 789} {"train_loss": -37.715972900390625, "global_step": 95572, "epoch": 789} {"train_loss": -37.741512298583984, "global_step": 95573, "epoch": 789} {"train_loss": -36.409366607666016, "global_step": 95574, "epoch": 789} {"train_loss": -36.796443939208984, "global_step": 95575, "epoch": 789} {"train_loss": -37.28250503540039, "global_step": 95576, "epoch": 789} {"train_loss": -37.507102966308594, "global_step": 95577, "epoch": 789} {"train_loss": -37.46348190307617, "global_step": 95578, "epoch": 789} {"train_loss": -37.28469467163086, "global_step": 95579, "epoch": 789} {"train_loss": -37.78657913208008, "global_step": 95580, "epoch": 789} {"train_loss": -37.58932876586914, "global_step": 95581, "epoch": 789} {"train_loss": -37.80234909057617, "global_step": 95582, "epoch": 789} {"train_loss": -37.5678825378418, "global_step": 95583, "epoch": 789} {"train_loss": -37.7333984375, "global_step": 95584, "epoch": 789} {"train_loss": -37.54912185668945, "global_step": 95585, "epoch": 789} {"train_loss": -37.91172409057617, "global_step": 95586, "epoch": 789} {"train_loss": -38.24416732788086, "global_step": 95587, "epoch": 789} {"train_loss": -37.511417388916016, "global_step": 95588, "epoch": 789} {"train_loss": -36.27022851991259, "global_step": 95589, "epoch": 789, "val_loss": 2561934.5} {"train_loss": -38.25119400024414, "global_step": 95590, "epoch": 790} {"train_loss": -38.11418914794922, "global_step": 95591, "epoch": 790} {"train_loss": -38.07366943359375, "global_step": 95592, "epoch": 790} {"train_loss": -36.96728515625, "global_step": 95593, "epoch": 790} {"train_loss": -37.32536697387695, "global_step": 95594, "epoch": 790} {"train_loss": -38.00708770751953, "global_step": 95595, "epoch": 790} {"train_loss": -37.53159713745117, "global_step": 95596, "epoch": 790} {"train_loss": -36.73051071166992, "global_step": 95597, "epoch": 790} {"train_loss": -34.70354080200195, "global_step": 95598, "epoch": 790} {"train_loss": -30.39666175842285, "global_step": 95599, "epoch": 790} {"train_loss": -32.042720794677734, "global_step": 95600, "epoch": 790} {"train_loss": -37.50244903564453, "global_step": 95601, "epoch": 790} {"train_loss": -29.46514320373535, "global_step": 95602, "epoch": 790} {"train_loss": -34.99946975708008, "global_step": 95603, "epoch": 790} {"train_loss": -32.31732177734375, "global_step": 95604, "epoch": 790} {"train_loss": -33.63149642944336, "global_step": 95605, "epoch": 790} {"train_loss": -33.364707946777344, "global_step": 95606, "epoch": 790} {"train_loss": -33.475101470947266, "global_step": 95607, "epoch": 790} {"train_loss": -34.583641052246094, "global_step": 95608, "epoch": 790} {"train_loss": -24.992313385009766, "global_step": 95609, "epoch": 790} {"train_loss": -34.542659759521484, "global_step": 95610, "epoch": 790} {"train_loss": -34.95798873901367, "global_step": 95611, "epoch": 790} {"train_loss": -35.5393180847168, "global_step": 95612, "epoch": 790} {"train_loss": -34.1009407043457, "global_step": 95613, "epoch": 790} {"train_loss": -34.354610443115234, "global_step": 95614, "epoch": 790} {"train_loss": -33.126888275146484, "global_step": 95615, "epoch": 790} {"train_loss": -34.875308990478516, "global_step": 95616, "epoch": 790} {"train_loss": -33.66462326049805, "global_step": 95617, "epoch": 790} {"train_loss": -34.79608917236328, "global_step": 95618, "epoch": 790} {"train_loss": -32.91036605834961, "global_step": 95619, "epoch": 790} {"train_loss": -34.05343246459961, "global_step": 95620, "epoch": 790} {"train_loss": -34.391578674316406, "global_step": 95621, "epoch": 790} {"train_loss": -32.655391693115234, "global_step": 95622, "epoch": 790} {"train_loss": -34.276546478271484, "global_step": 95623, "epoch": 790} {"train_loss": -35.0139274597168, "global_step": 95624, "epoch": 790} {"train_loss": -35.62466812133789, "global_step": 95625, "epoch": 790} {"train_loss": -35.697509765625, "global_step": 95626, "epoch": 790} {"train_loss": -35.835506439208984, "global_step": 95627, "epoch": 790} {"train_loss": -35.339027404785156, "global_step": 95628, "epoch": 790} {"train_loss": -35.49747848510742, "global_step": 95629, "epoch": 790} {"train_loss": -36.236541748046875, "global_step": 95630, "epoch": 790} {"train_loss": -36.204010009765625, "global_step": 95631, "epoch": 790} {"train_loss": -35.46976852416992, "global_step": 95632, "epoch": 790} {"train_loss": -35.5609130859375, "global_step": 95633, "epoch": 790} {"train_loss": -35.77315902709961, "global_step": 95634, "epoch": 790} {"train_loss": -36.46815872192383, "global_step": 95635, "epoch": 790} {"train_loss": -36.63727569580078, "global_step": 95636, "epoch": 790} {"train_loss": -34.97151565551758, "global_step": 95637, "epoch": 790} {"train_loss": -37.22987747192383, "global_step": 95638, "epoch": 790} {"train_loss": -36.37703323364258, "global_step": 95639, "epoch": 790} {"train_loss": -36.0391845703125, "global_step": 95640, "epoch": 790} {"train_loss": -36.64204406738281, "global_step": 95641, "epoch": 790} {"train_loss": -36.513851165771484, "global_step": 95642, "epoch": 790} {"train_loss": -36.4944953918457, "global_step": 95643, "epoch": 790} {"train_loss": -37.180694580078125, "global_step": 95644, "epoch": 790} {"train_loss": -36.8956413269043, "global_step": 95645, "epoch": 790} {"train_loss": -37.35830307006836, "global_step": 95646, "epoch": 790} {"train_loss": -36.404720306396484, "global_step": 95647, "epoch": 790} {"train_loss": -36.890541076660156, "global_step": 95648, "epoch": 790} {"train_loss": -36.969642639160156, "global_step": 95649, "epoch": 790} {"train_loss": -36.98408126831055, "global_step": 95650, "epoch": 790} {"train_loss": -35.83993148803711, "global_step": 95651, "epoch": 790} {"train_loss": -37.08540725708008, "global_step": 95652, "epoch": 790} {"train_loss": -36.238521575927734, "global_step": 95653, "epoch": 790} {"train_loss": -36.90094757080078, "global_step": 95654, "epoch": 790} {"train_loss": -37.542816162109375, "global_step": 95655, "epoch": 790} {"train_loss": -37.44612503051758, "global_step": 95656, "epoch": 790} {"train_loss": -37.71149826049805, "global_step": 95657, "epoch": 790} {"train_loss": -37.30815505981445, "global_step": 95658, "epoch": 790} {"train_loss": -37.24953842163086, "global_step": 95659, "epoch": 790} {"train_loss": -37.73383712768555, "global_step": 95660, "epoch": 790} {"train_loss": -37.394901275634766, "global_step": 95661, "epoch": 790} {"train_loss": -37.62069320678711, "global_step": 95662, "epoch": 790} {"train_loss": -36.300716400146484, "global_step": 95663, "epoch": 790} {"train_loss": -37.655731201171875, "global_step": 95664, "epoch": 790} {"train_loss": -37.46094512939453, "global_step": 95665, "epoch": 790} {"train_loss": -37.0251350402832, "global_step": 95666, "epoch": 790} {"train_loss": -37.29560852050781, "global_step": 95667, "epoch": 790} {"train_loss": -37.41543197631836, "global_step": 95668, "epoch": 790} {"train_loss": -37.57551193237305, "global_step": 95669, "epoch": 790} {"train_loss": -37.59857940673828, "global_step": 95670, "epoch": 790} {"train_loss": -37.07759475708008, "global_step": 95671, "epoch": 790} {"train_loss": -37.81342697143555, "global_step": 95672, "epoch": 790} {"train_loss": -38.065120697021484, "global_step": 95673, "epoch": 790} {"train_loss": -37.6458854675293, "global_step": 95674, "epoch": 790} {"train_loss": -37.914215087890625, "global_step": 95675, "epoch": 790} {"train_loss": -37.243812561035156, "global_step": 95676, "epoch": 790} {"train_loss": -38.147369384765625, "global_step": 95677, "epoch": 790} {"train_loss": -37.683319091796875, "global_step": 95678, "epoch": 790} {"train_loss": -37.639461517333984, "global_step": 95679, "epoch": 790} {"train_loss": -37.59014892578125, "global_step": 95680, "epoch": 790} {"train_loss": -38.379676818847656, "global_step": 95681, "epoch": 790} {"train_loss": -38.1693115234375, "global_step": 95682, "epoch": 790} {"train_loss": -38.253021240234375, "global_step": 95683, "epoch": 790} {"train_loss": -37.86518478393555, "global_step": 95684, "epoch": 790} {"train_loss": -38.42275619506836, "global_step": 95685, "epoch": 790} {"train_loss": -38.151023864746094, "global_step": 95686, "epoch": 790} {"train_loss": -37.540138244628906, "global_step": 95687, "epoch": 790} {"train_loss": -38.54459762573242, "global_step": 95688, "epoch": 790} {"train_loss": -38.181819915771484, "global_step": 95689, "epoch": 790} {"train_loss": -38.146419525146484, "global_step": 95690, "epoch": 790} {"train_loss": -38.43604278564453, "global_step": 95691, "epoch": 790} {"train_loss": -38.5523567199707, "global_step": 95692, "epoch": 790} {"train_loss": -38.19698715209961, "global_step": 95693, "epoch": 790} {"train_loss": -38.5371208190918, "global_step": 95694, "epoch": 790} {"train_loss": -38.43025588989258, "global_step": 95695, "epoch": 790} {"train_loss": -38.215267181396484, "global_step": 95696, "epoch": 790} {"train_loss": -38.822265625, "global_step": 95697, "epoch": 790} {"train_loss": -37.359222412109375, "global_step": 95698, "epoch": 790} {"train_loss": -38.63348388671875, "global_step": 95699, "epoch": 790} {"train_loss": -39.010921478271484, "global_step": 95700, "epoch": 790} {"train_loss": -38.054840087890625, "global_step": 95701, "epoch": 790} {"train_loss": -38.9023551940918, "global_step": 95702, "epoch": 790} {"train_loss": -39.06118392944336, "global_step": 95703, "epoch": 790} {"train_loss": -38.77777099609375, "global_step": 95704, "epoch": 790} {"train_loss": -38.700416564941406, "global_step": 95705, "epoch": 790} {"train_loss": -38.52181625366211, "global_step": 95706, "epoch": 790} {"train_loss": -38.588985443115234, "global_step": 95707, "epoch": 790} {"train_loss": -38.484901428222656, "global_step": 95708, "epoch": 790} {"train_loss": -38.203155517578125, "global_step": 95709, "epoch": 790} {"train_loss": -36.533539322782154, "global_step": 95710, "epoch": 790, "val_loss": 2500267.25} {"train_loss": -38.84320831298828, "global_step": 95711, "epoch": 791} {"train_loss": -39.08818435668945, "global_step": 95712, "epoch": 791} {"train_loss": -38.14614486694336, "global_step": 95713, "epoch": 791} {"train_loss": -38.62395477294922, "global_step": 95714, "epoch": 791} {"train_loss": -37.1003532409668, "global_step": 95715, "epoch": 791} {"train_loss": -36.9866943359375, "global_step": 95716, "epoch": 791} {"train_loss": -36.897552490234375, "global_step": 95717, "epoch": 791} {"train_loss": -36.56126022338867, "global_step": 95718, "epoch": 791} {"train_loss": -35.98711013793945, "global_step": 95719, "epoch": 791} {"train_loss": -35.7933464050293, "global_step": 95720, "epoch": 791} {"train_loss": -37.4660758972168, "global_step": 95721, "epoch": 791} {"train_loss": -38.230873107910156, "global_step": 95722, "epoch": 791} {"train_loss": -37.611080169677734, "global_step": 95723, "epoch": 791} {"train_loss": -37.716949462890625, "global_step": 95724, "epoch": 791} {"train_loss": -37.37962341308594, "global_step": 95725, "epoch": 791} {"train_loss": -38.92341995239258, "global_step": 95726, "epoch": 791} {"train_loss": -36.160926818847656, "global_step": 95727, "epoch": 791} {"train_loss": -34.691471099853516, "global_step": 95728, "epoch": 791} {"train_loss": -37.22638702392578, "global_step": 95729, "epoch": 791} {"train_loss": -37.20688247680664, "global_step": 95730, "epoch": 791} {"train_loss": -36.307498931884766, "global_step": 95731, "epoch": 791} {"train_loss": -38.52070236206055, "global_step": 95732, "epoch": 791} {"train_loss": -37.63446044921875, "global_step": 95733, "epoch": 791} {"train_loss": -36.16268539428711, "global_step": 95734, "epoch": 791} {"train_loss": -37.059661865234375, "global_step": 95735, "epoch": 791} {"train_loss": -35.51849365234375, "global_step": 95736, "epoch": 791} {"train_loss": -37.44994354248047, "global_step": 95737, "epoch": 791} {"train_loss": -36.15192413330078, "global_step": 95738, "epoch": 791} {"train_loss": -37.28169631958008, "global_step": 95739, "epoch": 791} {"train_loss": -35.679927825927734, "global_step": 95740, "epoch": 791} {"train_loss": -37.46211624145508, "global_step": 95741, "epoch": 791} {"train_loss": -35.91476058959961, "global_step": 95742, "epoch": 791} {"train_loss": -37.1159782409668, "global_step": 95743, "epoch": 791} {"train_loss": -37.22256088256836, "global_step": 95744, "epoch": 791} {"train_loss": -37.5059928894043, "global_step": 95745, "epoch": 791} {"train_loss": -36.66301345825195, "global_step": 95746, "epoch": 791} {"train_loss": -37.527732849121094, "global_step": 95747, "epoch": 791} {"train_loss": -37.106258392333984, "global_step": 95748, "epoch": 791} {"train_loss": -37.14641189575195, "global_step": 95749, "epoch": 791} {"train_loss": -35.90964889526367, "global_step": 95750, "epoch": 791} {"train_loss": -37.00868606567383, "global_step": 95751, "epoch": 791} {"train_loss": -33.06719970703125, "global_step": 95752, "epoch": 791} {"train_loss": -37.096866607666016, "global_step": 95753, "epoch": 791} {"train_loss": -37.04904556274414, "global_step": 95754, "epoch": 791} {"train_loss": -36.04664611816406, "global_step": 95755, "epoch": 791} {"train_loss": -35.11550521850586, "global_step": 95756, "epoch": 791} {"train_loss": -33.624053955078125, "global_step": 95757, "epoch": 791} {"train_loss": -34.53462600708008, "global_step": 95758, "epoch": 791} {"train_loss": -32.63014602661133, "global_step": 95759, "epoch": 791} {"train_loss": -35.07986831665039, "global_step": 95760, "epoch": 791} {"train_loss": -31.89875602722168, "global_step": 95761, "epoch": 791} {"train_loss": -35.57295608520508, "global_step": 95762, "epoch": 791} {"train_loss": -33.1473274230957, "global_step": 95763, "epoch": 791} {"train_loss": -34.22256088256836, "global_step": 95764, "epoch": 791} {"train_loss": -32.38248825073242, "global_step": 95765, "epoch": 791} {"train_loss": -34.561336517333984, "global_step": 95766, "epoch": 791} {"train_loss": -34.30293655395508, "global_step": 95767, "epoch": 791} {"train_loss": -34.79750442504883, "global_step": 95768, "epoch": 791} {"train_loss": -35.6715202331543, "global_step": 95769, "epoch": 791} {"train_loss": -35.416446685791016, "global_step": 95770, "epoch": 791} {"train_loss": -35.7421875, "global_step": 95771, "epoch": 791} {"train_loss": -34.11663055419922, "global_step": 95772, "epoch": 791} {"train_loss": -35.5656852722168, "global_step": 95773, "epoch": 791} {"train_loss": -35.0062370300293, "global_step": 95774, "epoch": 791} {"train_loss": -35.545860290527344, "global_step": 95775, "epoch": 791} {"train_loss": -35.076683044433594, "global_step": 95776, "epoch": 791} {"train_loss": -32.32551956176758, "global_step": 95777, "epoch": 791} {"train_loss": -35.20781326293945, "global_step": 95778, "epoch": 791} {"train_loss": -36.61275100708008, "global_step": 95779, "epoch": 791} {"train_loss": -33.15055465698242, "global_step": 95780, "epoch": 791} {"train_loss": -34.59796905517578, "global_step": 95781, "epoch": 791} {"train_loss": -36.80691146850586, "global_step": 95782, "epoch": 791} {"train_loss": -34.3018913269043, "global_step": 95783, "epoch": 791} {"train_loss": -33.900733947753906, "global_step": 95784, "epoch": 791} {"train_loss": -35.36614990234375, "global_step": 95785, "epoch": 791} {"train_loss": -35.673221588134766, "global_step": 95786, "epoch": 791} {"train_loss": -36.47172927856445, "global_step": 95787, "epoch": 791} {"train_loss": -35.997371673583984, "global_step": 95788, "epoch": 791} {"train_loss": -36.10630416870117, "global_step": 95789, "epoch": 791} {"train_loss": -36.053279876708984, "global_step": 95790, "epoch": 791} {"train_loss": -35.7909049987793, "global_step": 95791, "epoch": 791} {"train_loss": -35.78671646118164, "global_step": 95792, "epoch": 791} {"train_loss": -35.12458038330078, "global_step": 95793, "epoch": 791} {"train_loss": -36.628231048583984, "global_step": 95794, "epoch": 791} {"train_loss": -35.846675872802734, "global_step": 95795, "epoch": 791} {"train_loss": -36.260292053222656, "global_step": 95796, "epoch": 791} {"train_loss": -37.1680908203125, "global_step": 95797, "epoch": 791} {"train_loss": -36.69540023803711, "global_step": 95798, "epoch": 791} {"train_loss": -35.76303482055664, "global_step": 95799, "epoch": 791} {"train_loss": -33.9689826965332, "global_step": 95800, "epoch": 791} {"train_loss": -36.58748245239258, "global_step": 95801, "epoch": 791} {"train_loss": -37.3465461730957, "global_step": 95802, "epoch": 791} {"train_loss": -37.101436614990234, "global_step": 95803, "epoch": 791} {"train_loss": -36.80418395996094, "global_step": 95804, "epoch": 791} {"train_loss": -36.49665451049805, "global_step": 95805, "epoch": 791} {"train_loss": -36.759918212890625, "global_step": 95806, "epoch": 791} {"train_loss": -36.27155685424805, "global_step": 95807, "epoch": 791} {"train_loss": -36.7749137878418, "global_step": 95808, "epoch": 791} {"train_loss": -37.68614959716797, "global_step": 95809, "epoch": 791} {"train_loss": -36.89730453491211, "global_step": 95810, "epoch": 791} {"train_loss": -36.59503936767578, "global_step": 95811, "epoch": 791} {"train_loss": -36.72719192504883, "global_step": 95812, "epoch": 791} {"train_loss": -37.22330856323242, "global_step": 95813, "epoch": 791} {"train_loss": -37.05873489379883, "global_step": 95814, "epoch": 791} {"train_loss": -36.99962615966797, "global_step": 95815, "epoch": 791} {"train_loss": -37.19524002075195, "global_step": 95816, "epoch": 791} {"train_loss": -36.873897552490234, "global_step": 95817, "epoch": 791} {"train_loss": -37.251346588134766, "global_step": 95818, "epoch": 791} {"train_loss": -37.594207763671875, "global_step": 95819, "epoch": 791} {"train_loss": -37.59741973876953, "global_step": 95820, "epoch": 791} {"train_loss": -37.525367736816406, "global_step": 95821, "epoch": 791} {"train_loss": -37.407474517822266, "global_step": 95822, "epoch": 791} {"train_loss": -37.93287658691406, "global_step": 95823, "epoch": 791} {"train_loss": -37.77180099487305, "global_step": 95824, "epoch": 791} {"train_loss": -37.57861328125, "global_step": 95825, "epoch": 791} {"train_loss": -36.9650993347168, "global_step": 95826, "epoch": 791} {"train_loss": -37.692047119140625, "global_step": 95827, "epoch": 791} {"train_loss": -37.46846008300781, "global_step": 95828, "epoch": 791} {"train_loss": -37.98495101928711, "global_step": 95829, "epoch": 791} {"train_loss": -37.702735900878906, "global_step": 95830, "epoch": 791} {"train_loss": -36.310597396093954, "global_step": 95831, "epoch": 791, "val_loss": 2614500.75} {"train_loss": -37.981597900390625, "global_step": 95832, "epoch": 792} {"train_loss": -38.16896438598633, "global_step": 95833, "epoch": 792} {"train_loss": -38.378936767578125, "global_step": 95834, "epoch": 792} {"train_loss": -37.5647087097168, "global_step": 95835, "epoch": 792} {"train_loss": -38.139156341552734, "global_step": 95836, "epoch": 792} {"train_loss": -38.33977127075195, "global_step": 95837, "epoch": 792} {"train_loss": -38.246253967285156, "global_step": 95838, "epoch": 792} {"train_loss": -37.80704879760742, "global_step": 95839, "epoch": 792} {"train_loss": -37.96406173706055, "global_step": 95840, "epoch": 792} {"train_loss": -38.21928405761719, "global_step": 95841, "epoch": 792} {"train_loss": -38.504371643066406, "global_step": 95842, "epoch": 792} {"train_loss": -37.53584671020508, "global_step": 95843, "epoch": 792} {"train_loss": -38.1646614074707, "global_step": 95844, "epoch": 792} {"train_loss": -38.1700439453125, "global_step": 95845, "epoch": 792} {"train_loss": -38.21302032470703, "global_step": 95846, "epoch": 792} {"train_loss": -38.699440002441406, "global_step": 95847, "epoch": 792} {"train_loss": -37.805580139160156, "global_step": 95848, "epoch": 792} {"train_loss": -37.280269622802734, "global_step": 95849, "epoch": 792} {"train_loss": -37.02212142944336, "global_step": 95850, "epoch": 792} {"train_loss": -36.4119873046875, "global_step": 95851, "epoch": 792} {"train_loss": -37.276123046875, "global_step": 95852, "epoch": 792} {"train_loss": -38.182899475097656, "global_step": 95853, "epoch": 792} {"train_loss": -38.560096740722656, "global_step": 95854, "epoch": 792} {"train_loss": -38.291282653808594, "global_step": 95855, "epoch": 792} {"train_loss": -37.30601501464844, "global_step": 95856, "epoch": 792} {"train_loss": -37.78214645385742, "global_step": 95857, "epoch": 792} {"train_loss": -35.758155822753906, "global_step": 95858, "epoch": 792} {"train_loss": -36.36012649536133, "global_step": 95859, "epoch": 792} {"train_loss": -36.414955139160156, "global_step": 95860, "epoch": 792} {"train_loss": -37.78898239135742, "global_step": 95861, "epoch": 792} {"train_loss": -37.19959259033203, "global_step": 95862, "epoch": 792} {"train_loss": -36.9664306640625, "global_step": 95863, "epoch": 792} {"train_loss": -35.66298294067383, "global_step": 95864, "epoch": 792} {"train_loss": -38.0938835144043, "global_step": 95865, "epoch": 792} {"train_loss": -35.88157272338867, "global_step": 95866, "epoch": 792} {"train_loss": -35.32374954223633, "global_step": 95867, "epoch": 792} {"train_loss": -34.876644134521484, "global_step": 95868, "epoch": 792} {"train_loss": -36.794471740722656, "global_step": 95869, "epoch": 792} {"train_loss": -37.73926544189453, "global_step": 95870, "epoch": 792} {"train_loss": -36.78575897216797, "global_step": 95871, "epoch": 792} {"train_loss": -35.976173400878906, "global_step": 95872, "epoch": 792} {"train_loss": -36.83479690551758, "global_step": 95873, "epoch": 792} {"train_loss": -37.738128662109375, "global_step": 95874, "epoch": 792} {"train_loss": -37.575660705566406, "global_step": 95875, "epoch": 792} {"train_loss": -38.26669692993164, "global_step": 95876, "epoch": 792} {"train_loss": -37.358890533447266, "global_step": 95877, "epoch": 792} {"train_loss": -37.648006439208984, "global_step": 95878, "epoch": 792} {"train_loss": -37.925254821777344, "global_step": 95879, "epoch": 792} {"train_loss": -38.295833587646484, "global_step": 95880, "epoch": 792} {"train_loss": -37.075923919677734, "global_step": 95881, "epoch": 792} {"train_loss": -37.425106048583984, "global_step": 95882, "epoch": 792} {"train_loss": -37.61079788208008, "global_step": 95883, "epoch": 792} {"train_loss": -37.9801025390625, "global_step": 95884, "epoch": 792} {"train_loss": -37.86851119995117, "global_step": 95885, "epoch": 792} {"train_loss": -38.053096771240234, "global_step": 95886, "epoch": 792} {"train_loss": -38.853118896484375, "global_step": 95887, "epoch": 792} {"train_loss": -36.95682907104492, "global_step": 95888, "epoch": 792} {"train_loss": -37.37526321411133, "global_step": 95889, "epoch": 792} {"train_loss": -38.40723419189453, "global_step": 95890, "epoch": 792} {"train_loss": -37.625240325927734, "global_step": 95891, "epoch": 792} {"train_loss": -37.76727294921875, "global_step": 95892, "epoch": 792} {"train_loss": -37.53614807128906, "global_step": 95893, "epoch": 792} {"train_loss": -37.12074279785156, "global_step": 95894, "epoch": 792} {"train_loss": -37.626708984375, "global_step": 95895, "epoch": 792} {"train_loss": -37.433868408203125, "global_step": 95896, "epoch": 792} {"train_loss": -36.291873931884766, "global_step": 95897, "epoch": 792} {"train_loss": -38.17743682861328, "global_step": 95898, "epoch": 792} {"train_loss": -36.0474967956543, "global_step": 95899, "epoch": 792} {"train_loss": -38.030914306640625, "global_step": 95900, "epoch": 792} {"train_loss": -37.5032844543457, "global_step": 95901, "epoch": 792} {"train_loss": -37.04038619995117, "global_step": 95902, "epoch": 792} {"train_loss": -36.5192985534668, "global_step": 95903, "epoch": 792} {"train_loss": -38.68362045288086, "global_step": 95904, "epoch": 792} {"train_loss": -38.147789001464844, "global_step": 95905, "epoch": 792} {"train_loss": -36.39461135864258, "global_step": 95906, "epoch": 792} {"train_loss": -34.94894027709961, "global_step": 95907, "epoch": 792} {"train_loss": -36.9488639831543, "global_step": 95908, "epoch": 792} {"train_loss": -38.6702880859375, "global_step": 95909, "epoch": 792} {"train_loss": -37.5629997253418, "global_step": 95910, "epoch": 792} {"train_loss": -37.00181198120117, "global_step": 95911, "epoch": 792} {"train_loss": -37.6880989074707, "global_step": 95912, "epoch": 792} {"train_loss": -37.68122482299805, "global_step": 95913, "epoch": 792} {"train_loss": -37.27485275268555, "global_step": 95914, "epoch": 792} {"train_loss": -37.669429779052734, "global_step": 95915, "epoch": 792} {"train_loss": -37.04206466674805, "global_step": 95916, "epoch": 792} {"train_loss": -37.646053314208984, "global_step": 95917, "epoch": 792} {"train_loss": -37.23012924194336, "global_step": 95918, "epoch": 792} {"train_loss": -38.06525802612305, "global_step": 95919, "epoch": 792} {"train_loss": -37.351783752441406, "global_step": 95920, "epoch": 792} {"train_loss": -37.98632049560547, "global_step": 95921, "epoch": 792} {"train_loss": -38.16925811767578, "global_step": 95922, "epoch": 792} {"train_loss": -38.51591873168945, "global_step": 95923, "epoch": 792} {"train_loss": -38.27350616455078, "global_step": 95924, "epoch": 792} {"train_loss": -37.064430236816406, "global_step": 95925, "epoch": 792} {"train_loss": -37.5778694152832, "global_step": 95926, "epoch": 792} {"train_loss": -38.25696563720703, "global_step": 95927, "epoch": 792} {"train_loss": -38.05388641357422, "global_step": 95928, "epoch": 792} {"train_loss": -37.98372268676758, "global_step": 95929, "epoch": 792} {"train_loss": -37.52205276489258, "global_step": 95930, "epoch": 792} {"train_loss": -36.87961196899414, "global_step": 95931, "epoch": 792} {"train_loss": -38.21323776245117, "global_step": 95932, "epoch": 792} {"train_loss": -36.59947204589844, "global_step": 95933, "epoch": 792} {"train_loss": -37.18251419067383, "global_step": 95934, "epoch": 792} {"train_loss": -38.25497055053711, "global_step": 95935, "epoch": 792} {"train_loss": -36.80721664428711, "global_step": 95936, "epoch": 792} {"train_loss": -37.25731658935547, "global_step": 95937, "epoch": 792} {"train_loss": -37.94696044921875, "global_step": 95938, "epoch": 792} {"train_loss": -37.64348220825195, "global_step": 95939, "epoch": 792} {"train_loss": -38.48335647583008, "global_step": 95940, "epoch": 792} {"train_loss": -35.476722717285156, "global_step": 95941, "epoch": 792} {"train_loss": -37.71739196777344, "global_step": 95942, "epoch": 792} {"train_loss": -36.37889862060547, "global_step": 95943, "epoch": 792} {"train_loss": -38.1241455078125, "global_step": 95944, "epoch": 792} {"train_loss": -37.57487869262695, "global_step": 95945, "epoch": 792} {"train_loss": -37.203773498535156, "global_step": 95946, "epoch": 792} {"train_loss": -37.19212341308594, "global_step": 95947, "epoch": 792} {"train_loss": -38.352352142333984, "global_step": 95948, "epoch": 792} {"train_loss": -37.20130920410156, "global_step": 95949, "epoch": 792} {"train_loss": -37.50619125366211, "global_step": 95950, "epoch": 792} {"train_loss": -37.21039581298828, "global_step": 95951, "epoch": 792} {"train_loss": -37.49354644649285, "global_step": 95952, "epoch": 792, "val_loss": 2542499.0} {"train_loss": -37.24250793457031, "global_step": 95953, "epoch": 793} {"train_loss": -36.4566650390625, "global_step": 95954, "epoch": 793} {"train_loss": -36.50497055053711, "global_step": 95955, "epoch": 793} {"train_loss": -38.61435317993164, "global_step": 95956, "epoch": 793} {"train_loss": -38.126949310302734, "global_step": 95957, "epoch": 793} {"train_loss": -37.37398910522461, "global_step": 95958, "epoch": 793} {"train_loss": -38.02289581298828, "global_step": 95959, "epoch": 793} {"train_loss": -37.888179779052734, "global_step": 95960, "epoch": 793} {"train_loss": -37.220497131347656, "global_step": 95961, "epoch": 793} {"train_loss": -38.14203643798828, "global_step": 95962, "epoch": 793} {"train_loss": -38.3911247253418, "global_step": 95963, "epoch": 793} {"train_loss": -38.20424270629883, "global_step": 95964, "epoch": 793} {"train_loss": -38.0626106262207, "global_step": 95965, "epoch": 793} {"train_loss": -38.441593170166016, "global_step": 95966, "epoch": 793} {"train_loss": -38.18796920776367, "global_step": 95967, "epoch": 793} {"train_loss": -38.59727096557617, "global_step": 95968, "epoch": 793} {"train_loss": -38.23235321044922, "global_step": 95969, "epoch": 793} {"train_loss": -36.27464294433594, "global_step": 95970, "epoch": 793} {"train_loss": -38.74542999267578, "global_step": 95971, "epoch": 793} {"train_loss": -38.11286926269531, "global_step": 95972, "epoch": 793} {"train_loss": -37.619873046875, "global_step": 95973, "epoch": 793} {"train_loss": -38.0130500793457, "global_step": 95974, "epoch": 793} {"train_loss": -36.79411697387695, "global_step": 95975, "epoch": 793} {"train_loss": -38.24079895019531, "global_step": 95976, "epoch": 793} {"train_loss": -37.611351013183594, "global_step": 95977, "epoch": 793} {"train_loss": -36.73564529418945, "global_step": 95978, "epoch": 793} {"train_loss": -38.39471435546875, "global_step": 95979, "epoch": 793} {"train_loss": -37.04647445678711, "global_step": 95980, "epoch": 793} {"train_loss": -36.79294967651367, "global_step": 95981, "epoch": 793} {"train_loss": -38.1279182434082, "global_step": 95982, "epoch": 793} {"train_loss": -37.98551559448242, "global_step": 95983, "epoch": 793} {"train_loss": -36.73686218261719, "global_step": 95984, "epoch": 793} {"train_loss": -38.373958587646484, "global_step": 95985, "epoch": 793} {"train_loss": -38.173404693603516, "global_step": 95986, "epoch": 793} {"train_loss": -38.81815719604492, "global_step": 95987, "epoch": 793} {"train_loss": -37.91154098510742, "global_step": 95988, "epoch": 793} {"train_loss": -38.21390914916992, "global_step": 95989, "epoch": 793} {"train_loss": -37.84235763549805, "global_step": 95990, "epoch": 793} {"train_loss": -37.82633972167969, "global_step": 95991, "epoch": 793} {"train_loss": -38.55257034301758, "global_step": 95992, "epoch": 793} {"train_loss": -38.75739288330078, "global_step": 95993, "epoch": 793} {"train_loss": -37.73322677612305, "global_step": 95994, "epoch": 793} {"train_loss": -38.31339645385742, "global_step": 95995, "epoch": 793} {"train_loss": -39.191768646240234, "global_step": 95996, "epoch": 793} {"train_loss": -38.596435546875, "global_step": 95997, "epoch": 793} {"train_loss": -38.98776626586914, "global_step": 95998, "epoch": 793} {"train_loss": -38.4329719543457, "global_step": 95999, "epoch": 793} {"train_loss": -38.82603073120117, "global_step": 96000, "epoch": 793} {"train_loss": -38.17951583862305, "global_step": 96001, "epoch": 793} {"train_loss": -39.39748764038086, "global_step": 96002, "epoch": 793} {"train_loss": -38.9599494934082, "global_step": 96003, "epoch": 793} {"train_loss": -38.94905471801758, "global_step": 96004, "epoch": 793} {"train_loss": -39.3421630859375, "global_step": 96005, "epoch": 793} {"train_loss": -38.51715850830078, "global_step": 96006, "epoch": 793} {"train_loss": -39.356849670410156, "global_step": 96007, "epoch": 793} {"train_loss": -38.68560791015625, "global_step": 96008, "epoch": 793} {"train_loss": -38.93546676635742, "global_step": 96009, "epoch": 793} {"train_loss": -38.38459777832031, "global_step": 96010, "epoch": 793} {"train_loss": -39.02802276611328, "global_step": 96011, "epoch": 793} {"train_loss": -37.61743927001953, "global_step": 96012, "epoch": 793} {"train_loss": -38.056941986083984, "global_step": 96013, "epoch": 793} {"train_loss": -38.001953125, "global_step": 96014, "epoch": 793} {"train_loss": -38.86520004272461, "global_step": 96015, "epoch": 793} {"train_loss": -38.5686149597168, "global_step": 96016, "epoch": 793} {"train_loss": -37.37137222290039, "global_step": 96017, "epoch": 793} {"train_loss": -37.12713623046875, "global_step": 96018, "epoch": 793} {"train_loss": -36.82935333251953, "global_step": 96019, "epoch": 793} {"train_loss": -37.55486297607422, "global_step": 96020, "epoch": 793} {"train_loss": -37.726741790771484, "global_step": 96021, "epoch": 793} {"train_loss": -36.352783203125, "global_step": 96022, "epoch": 793} {"train_loss": -36.399085998535156, "global_step": 96023, "epoch": 793} {"train_loss": -38.316036224365234, "global_step": 96024, "epoch": 793} {"train_loss": -39.1992301940918, "global_step": 96025, "epoch": 793} {"train_loss": -39.32038497924805, "global_step": 96026, "epoch": 793} {"train_loss": -37.727359771728516, "global_step": 96027, "epoch": 793} {"train_loss": -37.90519332885742, "global_step": 96028, "epoch": 793} {"train_loss": -38.03748321533203, "global_step": 96029, "epoch": 793} {"train_loss": -39.35185241699219, "global_step": 96030, "epoch": 793} {"train_loss": -37.430179595947266, "global_step": 96031, "epoch": 793} {"train_loss": -38.67361068725586, "global_step": 96032, "epoch": 793} {"train_loss": -37.02781295776367, "global_step": 96033, "epoch": 793} {"train_loss": -39.33327865600586, "global_step": 96034, "epoch": 793} {"train_loss": -36.795562744140625, "global_step": 96035, "epoch": 793} {"train_loss": -35.825435638427734, "global_step": 96036, "epoch": 793} {"train_loss": -34.68247604370117, "global_step": 96037, "epoch": 793} {"train_loss": -34.22161102294922, "global_step": 96038, "epoch": 793} {"train_loss": -36.86130905151367, "global_step": 96039, "epoch": 793} {"train_loss": -37.019203186035156, "global_step": 96040, "epoch": 793} {"train_loss": -33.57472229003906, "global_step": 96041, "epoch": 793} {"train_loss": -35.618709564208984, "global_step": 96042, "epoch": 793} {"train_loss": -37.619544982910156, "global_step": 96043, "epoch": 793} {"train_loss": -35.540321350097656, "global_step": 96044, "epoch": 793} {"train_loss": -37.881893157958984, "global_step": 96045, "epoch": 793} {"train_loss": -36.075496673583984, "global_step": 96046, "epoch": 793} {"train_loss": -37.24811553955078, "global_step": 96047, "epoch": 793} {"train_loss": -37.51768112182617, "global_step": 96048, "epoch": 793} {"train_loss": -37.905975341796875, "global_step": 96049, "epoch": 793} {"train_loss": -36.27009963989258, "global_step": 96050, "epoch": 793} {"train_loss": -37.346866607666016, "global_step": 96051, "epoch": 793} {"train_loss": -37.20408248901367, "global_step": 96052, "epoch": 793} {"train_loss": -38.623477935791016, "global_step": 96053, "epoch": 793} {"train_loss": -37.56168746948242, "global_step": 96054, "epoch": 793} {"train_loss": -37.12991714477539, "global_step": 96055, "epoch": 793} {"train_loss": -36.03611373901367, "global_step": 96056, "epoch": 793} {"train_loss": -37.041561126708984, "global_step": 96057, "epoch": 793} {"train_loss": -36.309967041015625, "global_step": 96058, "epoch": 793} {"train_loss": -36.84920883178711, "global_step": 96059, "epoch": 793} {"train_loss": -35.24580001831055, "global_step": 96060, "epoch": 793} {"train_loss": -36.29183578491211, "global_step": 96061, "epoch": 793} {"train_loss": -36.965267181396484, "global_step": 96062, "epoch": 793} {"train_loss": -37.16141128540039, "global_step": 96063, "epoch": 793} {"train_loss": -35.47821044921875, "global_step": 96064, "epoch": 793} {"train_loss": -35.88267135620117, "global_step": 96065, "epoch": 793} {"train_loss": -30.925067901611328, "global_step": 96066, "epoch": 793} {"train_loss": -24.5714168548584, "global_step": 96067, "epoch": 793} {"train_loss": -28.93670654296875, "global_step": 96068, "epoch": 793} {"train_loss": -34.890140533447266, "global_step": 96069, "epoch": 793} {"train_loss": -27.929718017578125, "global_step": 96070, "epoch": 793} {"train_loss": -33.57577133178711, "global_step": 96071, "epoch": 793} {"train_loss": -33.51087188720703, "global_step": 96072, "epoch": 793} {"train_loss": -37.169155940536626, "global_step": 96073, "epoch": 793, "val_loss": 2485222.25} {"train_loss": -34.69645690917969, "global_step": 96074, "epoch": 794} {"train_loss": -22.201269149780273, "global_step": 96075, "epoch": 794} {"train_loss": -33.69190216064453, "global_step": 96076, "epoch": 794} {"train_loss": -19.716955184936523, "global_step": 96077, "epoch": 794} {"train_loss": -32.9621696472168, "global_step": 96078, "epoch": 794} {"train_loss": -32.28458023071289, "global_step": 96079, "epoch": 794} {"train_loss": -29.497852325439453, "global_step": 96080, "epoch": 794} {"train_loss": -28.87244987487793, "global_step": 96081, "epoch": 794} {"train_loss": -31.19647216796875, "global_step": 96082, "epoch": 794} {"train_loss": -30.500202178955078, "global_step": 96083, "epoch": 794} {"train_loss": -31.1486759185791, "global_step": 96084, "epoch": 794} {"train_loss": -33.02492904663086, "global_step": 96085, "epoch": 794} {"train_loss": -34.67535400390625, "global_step": 96086, "epoch": 794} {"train_loss": -33.114505767822266, "global_step": 96087, "epoch": 794} {"train_loss": -33.285945892333984, "global_step": 96088, "epoch": 794} {"train_loss": -33.311790466308594, "global_step": 96089, "epoch": 794} {"train_loss": -33.67487716674805, "global_step": 96090, "epoch": 794} {"train_loss": -33.144378662109375, "global_step": 96091, "epoch": 794} {"train_loss": -34.03030014038086, "global_step": 96092, "epoch": 794} {"train_loss": -33.912960052490234, "global_step": 96093, "epoch": 794} {"train_loss": -34.5079345703125, "global_step": 96094, "epoch": 794} {"train_loss": -33.69004440307617, "global_step": 96095, "epoch": 794} {"train_loss": -34.755462646484375, "global_step": 96096, "epoch": 794} {"train_loss": -34.64875411987305, "global_step": 96097, "epoch": 794} {"train_loss": -34.49729537963867, "global_step": 96098, "epoch": 794} {"train_loss": -34.54474639892578, "global_step": 96099, "epoch": 794} {"train_loss": -34.86277389526367, "global_step": 96100, "epoch": 794} {"train_loss": -32.80267333984375, "global_step": 96101, "epoch": 794} {"train_loss": -34.69738006591797, "global_step": 96102, "epoch": 794} {"train_loss": -34.60628128051758, "global_step": 96103, "epoch": 794} {"train_loss": -35.300811767578125, "global_step": 96104, "epoch": 794} {"train_loss": -35.49333953857422, "global_step": 96105, "epoch": 794} {"train_loss": -33.90324020385742, "global_step": 96106, "epoch": 794} {"train_loss": -35.76211929321289, "global_step": 96107, "epoch": 794} {"train_loss": -35.331581115722656, "global_step": 96108, "epoch": 794} {"train_loss": -35.30598068237305, "global_step": 96109, "epoch": 794} {"train_loss": -35.318824768066406, "global_step": 96110, "epoch": 794} {"train_loss": -35.260860443115234, "global_step": 96111, "epoch": 794} {"train_loss": -35.0743522644043, "global_step": 96112, "epoch": 794} {"train_loss": -35.05091094970703, "global_step": 96113, "epoch": 794} {"train_loss": -36.01453399658203, "global_step": 96114, "epoch": 794} {"train_loss": -35.74238204956055, "global_step": 96115, "epoch": 794} {"train_loss": -35.51656723022461, "global_step": 96116, "epoch": 794} {"train_loss": -36.121124267578125, "global_step": 96117, "epoch": 794} {"train_loss": -35.90939712524414, "global_step": 96118, "epoch": 794} {"train_loss": -36.45698547363281, "global_step": 96119, "epoch": 794} {"train_loss": -35.51185989379883, "global_step": 96120, "epoch": 794} {"train_loss": -36.18009567260742, "global_step": 96121, "epoch": 794} {"train_loss": -36.587310791015625, "global_step": 96122, "epoch": 794} {"train_loss": -36.010658264160156, "global_step": 96123, "epoch": 794} {"train_loss": -36.034664154052734, "global_step": 96124, "epoch": 794} {"train_loss": -36.086402893066406, "global_step": 96125, "epoch": 794} {"train_loss": -35.92605209350586, "global_step": 96126, "epoch": 794} {"train_loss": -36.82225036621094, "global_step": 96127, "epoch": 794} {"train_loss": -36.01523971557617, "global_step": 96128, "epoch": 794} {"train_loss": -36.4400634765625, "global_step": 96129, "epoch": 794} {"train_loss": -36.45998764038086, "global_step": 96130, "epoch": 794} {"train_loss": -36.741455078125, "global_step": 96131, "epoch": 794} {"train_loss": -37.517242431640625, "global_step": 96132, "epoch": 794} {"train_loss": -36.02773666381836, "global_step": 96133, "epoch": 794} {"train_loss": -36.2138786315918, "global_step": 96134, "epoch": 794} {"train_loss": -36.7436408996582, "global_step": 96135, "epoch": 794} {"train_loss": -35.93511199951172, "global_step": 96136, "epoch": 794} {"train_loss": -36.56781005859375, "global_step": 96137, "epoch": 794} {"train_loss": -37.18937301635742, "global_step": 96138, "epoch": 794} {"train_loss": -36.984962463378906, "global_step": 96139, "epoch": 794} {"train_loss": -37.223052978515625, "global_step": 96140, "epoch": 794} {"train_loss": -37.253971099853516, "global_step": 96141, "epoch": 794} {"train_loss": -37.30133819580078, "global_step": 96142, "epoch": 794} {"train_loss": -36.93061065673828, "global_step": 96143, "epoch": 794} {"train_loss": -36.863365173339844, "global_step": 96144, "epoch": 794} {"train_loss": -36.76772689819336, "global_step": 96145, "epoch": 794} {"train_loss": -37.3038330078125, "global_step": 96146, "epoch": 794} {"train_loss": -37.215301513671875, "global_step": 96147, "epoch": 794} {"train_loss": -37.03662109375, "global_step": 96148, "epoch": 794} {"train_loss": -37.47404861450195, "global_step": 96149, "epoch": 794} {"train_loss": -37.26027297973633, "global_step": 96150, "epoch": 794} {"train_loss": -37.529212951660156, "global_step": 96151, "epoch": 794} {"train_loss": -37.3616828918457, "global_step": 96152, "epoch": 794} {"train_loss": -38.097930908203125, "global_step": 96153, "epoch": 794} {"train_loss": -37.764644622802734, "global_step": 96154, "epoch": 794} {"train_loss": -37.43391799926758, "global_step": 96155, "epoch": 794} {"train_loss": -37.63425827026367, "global_step": 96156, "epoch": 794} {"train_loss": -37.73176956176758, "global_step": 96157, "epoch": 794} {"train_loss": -36.83860397338867, "global_step": 96158, "epoch": 794} {"train_loss": -37.2314338684082, "global_step": 96159, "epoch": 794} {"train_loss": -37.76329040527344, "global_step": 96160, "epoch": 794} {"train_loss": -38.128108978271484, "global_step": 96161, "epoch": 794} {"train_loss": -37.83409118652344, "global_step": 96162, "epoch": 794} {"train_loss": -37.48563766479492, "global_step": 96163, "epoch": 794} {"train_loss": -37.43990707397461, "global_step": 96164, "epoch": 794} {"train_loss": -36.91386032104492, "global_step": 96165, "epoch": 794} {"train_loss": -38.18007278442383, "global_step": 96166, "epoch": 794} {"train_loss": -37.80464553833008, "global_step": 96167, "epoch": 794} {"train_loss": -37.076534271240234, "global_step": 96168, "epoch": 794} {"train_loss": -38.253517150878906, "global_step": 96169, "epoch": 794} {"train_loss": -38.06599426269531, "global_step": 96170, "epoch": 794} {"train_loss": -38.16617202758789, "global_step": 96171, "epoch": 794} {"train_loss": -38.71828079223633, "global_step": 96172, "epoch": 794} {"train_loss": -37.91569137573242, "global_step": 96173, "epoch": 794} {"train_loss": -38.65699005126953, "global_step": 96174, "epoch": 794} {"train_loss": -38.46975326538086, "global_step": 96175, "epoch": 794} {"train_loss": -38.38021469116211, "global_step": 96176, "epoch": 794} {"train_loss": -38.53987503051758, "global_step": 96177, "epoch": 794} {"train_loss": -38.46381378173828, "global_step": 96178, "epoch": 794} {"train_loss": -38.755584716796875, "global_step": 96179, "epoch": 794} {"train_loss": -38.17238998413086, "global_step": 96180, "epoch": 794} {"train_loss": -38.18758773803711, "global_step": 96181, "epoch": 794} {"train_loss": -38.594337463378906, "global_step": 96182, "epoch": 794} {"train_loss": -38.78969192504883, "global_step": 96183, "epoch": 794} {"train_loss": -38.287567138671875, "global_step": 96184, "epoch": 794} {"train_loss": -38.13015365600586, "global_step": 96185, "epoch": 794} {"train_loss": -38.624385833740234, "global_step": 96186, "epoch": 794} {"train_loss": -39.09401321411133, "global_step": 96187, "epoch": 794} {"train_loss": -38.83773422241211, "global_step": 96188, "epoch": 794} {"train_loss": -37.542884826660156, "global_step": 96189, "epoch": 794} {"train_loss": -36.47122573852539, "global_step": 96190, "epoch": 794} {"train_loss": -35.1986198425293, "global_step": 96191, "epoch": 794} {"train_loss": -38.47322463989258, "global_step": 96192, "epoch": 794} {"train_loss": -33.160186767578125, "global_step": 96193, "epoch": 794} {"train_loss": -35.85799411111627, "global_step": 96194, "epoch": 794, "val_loss": 2686921.0} {"train_loss": -37.889949798583984, "global_step": 96195, "epoch": 795} {"train_loss": -36.72386169433594, "global_step": 96196, "epoch": 795} {"train_loss": -37.90688705444336, "global_step": 96197, "epoch": 795} {"train_loss": -37.995361328125, "global_step": 96198, "epoch": 795} {"train_loss": -37.73968505859375, "global_step": 96199, "epoch": 795} {"train_loss": -36.30908966064453, "global_step": 96200, "epoch": 795} {"train_loss": -35.153194427490234, "global_step": 96201, "epoch": 795} {"train_loss": -31.488340377807617, "global_step": 96202, "epoch": 795} {"train_loss": -21.031635284423828, "global_step": 96203, "epoch": 795} {"train_loss": -8.170404434204102, "global_step": 96204, "epoch": 795} {"train_loss": -20.6309871673584, "global_step": 96205, "epoch": 795} {"train_loss": -38.0447883605957, "global_step": 96206, "epoch": 795} {"train_loss": -28.02044677734375, "global_step": 96207, "epoch": 795} {"train_loss": -32.868934631347656, "global_step": 96208, "epoch": 795} {"train_loss": -35.24153137207031, "global_step": 96209, "epoch": 795} {"train_loss": -35.90208053588867, "global_step": 96210, "epoch": 795} {"train_loss": -35.17570114135742, "global_step": 96211, "epoch": 795} {"train_loss": -35.930538177490234, "global_step": 96212, "epoch": 795} {"train_loss": -35.193580627441406, "global_step": 96213, "epoch": 795} {"train_loss": -37.43962097167969, "global_step": 96214, "epoch": 795} {"train_loss": -35.91836166381836, "global_step": 96215, "epoch": 795} {"train_loss": -36.298179626464844, "global_step": 96216, "epoch": 795} {"train_loss": -37.42072677612305, "global_step": 96217, "epoch": 795} {"train_loss": -35.76699447631836, "global_step": 96218, "epoch": 795} {"train_loss": -36.17050552368164, "global_step": 96219, "epoch": 795} {"train_loss": -36.955055236816406, "global_step": 96220, "epoch": 795} {"train_loss": -36.35942459106445, "global_step": 96221, "epoch": 795} {"train_loss": -37.56453323364258, "global_step": 96222, "epoch": 795} {"train_loss": -37.111087799072266, "global_step": 96223, "epoch": 795} {"train_loss": -37.22391891479492, "global_step": 96224, "epoch": 795} {"train_loss": -37.55073928833008, "global_step": 96225, "epoch": 795} {"train_loss": -37.61918640136719, "global_step": 96226, "epoch": 795} {"train_loss": -37.4376335144043, "global_step": 96227, "epoch": 795} {"train_loss": -37.52594757080078, "global_step": 96228, "epoch": 795} {"train_loss": -38.23155975341797, "global_step": 96229, "epoch": 795} {"train_loss": -38.2239875793457, "global_step": 96230, "epoch": 795} {"train_loss": -38.44807052612305, "global_step": 96231, "epoch": 795} {"train_loss": -37.915470123291016, "global_step": 96232, "epoch": 795} {"train_loss": -37.806434631347656, "global_step": 96233, "epoch": 795} {"train_loss": -37.888580322265625, "global_step": 96234, "epoch": 795} {"train_loss": -38.1840934753418, "global_step": 96235, "epoch": 795} {"train_loss": -38.02788162231445, "global_step": 96236, "epoch": 795} {"train_loss": -37.895076751708984, "global_step": 96237, "epoch": 795} {"train_loss": -38.134498596191406, "global_step": 96238, "epoch": 795} {"train_loss": -38.5383415222168, "global_step": 96239, "epoch": 795} {"train_loss": -38.19118118286133, "global_step": 96240, "epoch": 795} {"train_loss": -38.34029006958008, "global_step": 96241, "epoch": 795} {"train_loss": -38.16144561767578, "global_step": 96242, "epoch": 795} {"train_loss": -38.24467086791992, "global_step": 96243, "epoch": 795} {"train_loss": -37.70319747924805, "global_step": 96244, "epoch": 795} {"train_loss": -38.21012496948242, "global_step": 96245, "epoch": 795} {"train_loss": -38.99776840209961, "global_step": 96246, "epoch": 795} {"train_loss": -38.56740188598633, "global_step": 96247, "epoch": 795} {"train_loss": -37.7893180847168, "global_step": 96248, "epoch": 795} {"train_loss": -38.43634796142578, "global_step": 96249, "epoch": 795} {"train_loss": -38.196170806884766, "global_step": 96250, "epoch": 795} {"train_loss": -38.57770919799805, "global_step": 96251, "epoch": 795} {"train_loss": -38.7357063293457, "global_step": 96252, "epoch": 795} {"train_loss": -38.37369918823242, "global_step": 96253, "epoch": 795} {"train_loss": -38.92972946166992, "global_step": 96254, "epoch": 795} {"train_loss": -38.879146575927734, "global_step": 96255, "epoch": 795} {"train_loss": -38.270851135253906, "global_step": 96256, "epoch": 795} {"train_loss": -38.13074493408203, "global_step": 96257, "epoch": 795} {"train_loss": -38.86941146850586, "global_step": 96258, "epoch": 795} {"train_loss": -39.07475662231445, "global_step": 96259, "epoch": 795} {"train_loss": -38.7187385559082, "global_step": 96260, "epoch": 795} {"train_loss": -38.52199172973633, "global_step": 96261, "epoch": 795} {"train_loss": -38.1250114440918, "global_step": 96262, "epoch": 795} {"train_loss": -38.77553176879883, "global_step": 96263, "epoch": 795} {"train_loss": -39.003570556640625, "global_step": 96264, "epoch": 795} {"train_loss": -39.2993278503418, "global_step": 96265, "epoch": 795} {"train_loss": -38.47312927246094, "global_step": 96266, "epoch": 795} {"train_loss": -37.4669303894043, "global_step": 96267, "epoch": 795} {"train_loss": -38.854244232177734, "global_step": 96268, "epoch": 795} {"train_loss": -38.55862045288086, "global_step": 96269, "epoch": 795} {"train_loss": -37.82978439331055, "global_step": 96270, "epoch": 795} {"train_loss": -37.928314208984375, "global_step": 96271, "epoch": 795} {"train_loss": -38.06517791748047, "global_step": 96272, "epoch": 795} {"train_loss": -36.604576110839844, "global_step": 96273, "epoch": 795} {"train_loss": -36.86853790283203, "global_step": 96274, "epoch": 795} {"train_loss": -37.72391891479492, "global_step": 96275, "epoch": 795} {"train_loss": -38.66541290283203, "global_step": 96276, "epoch": 795} {"train_loss": -38.776729583740234, "global_step": 96277, "epoch": 795} {"train_loss": -38.131160736083984, "global_step": 96278, "epoch": 795} {"train_loss": -38.68255615234375, "global_step": 96279, "epoch": 795} {"train_loss": -37.38924026489258, "global_step": 96280, "epoch": 795} {"train_loss": -38.27192306518555, "global_step": 96281, "epoch": 795} {"train_loss": -37.69369125366211, "global_step": 96282, "epoch": 795} {"train_loss": -37.99970626831055, "global_step": 96283, "epoch": 795} {"train_loss": -39.04581832885742, "global_step": 96284, "epoch": 795} {"train_loss": -38.84945297241211, "global_step": 96285, "epoch": 795} {"train_loss": -37.45375442504883, "global_step": 96286, "epoch": 795} {"train_loss": -36.640113830566406, "global_step": 96287, "epoch": 795} {"train_loss": -37.954463958740234, "global_step": 96288, "epoch": 795} {"train_loss": -38.548458099365234, "global_step": 96289, "epoch": 795} {"train_loss": -38.44562911987305, "global_step": 96290, "epoch": 795} {"train_loss": -37.941139221191406, "global_step": 96291, "epoch": 795} {"train_loss": -38.880706787109375, "global_step": 96292, "epoch": 795} {"train_loss": -38.958396911621094, "global_step": 96293, "epoch": 795} {"train_loss": -37.74573516845703, "global_step": 96294, "epoch": 795} {"train_loss": -38.1910285949707, "global_step": 96295, "epoch": 795} {"train_loss": -39.21570587158203, "global_step": 96296, "epoch": 795} {"train_loss": -37.76397705078125, "global_step": 96297, "epoch": 795} {"train_loss": -37.82619857788086, "global_step": 96298, "epoch": 795} {"train_loss": -38.67875289916992, "global_step": 96299, "epoch": 795} {"train_loss": -38.03632354736328, "global_step": 96300, "epoch": 795} {"train_loss": -38.577335357666016, "global_step": 96301, "epoch": 795} {"train_loss": -38.83174514770508, "global_step": 96302, "epoch": 795} {"train_loss": -37.616188049316406, "global_step": 96303, "epoch": 795} {"train_loss": -35.82093811035156, "global_step": 96304, "epoch": 795} {"train_loss": -31.955402374267578, "global_step": 96305, "epoch": 795} {"train_loss": -26.537885665893555, "global_step": 96306, "epoch": 795} {"train_loss": -12.517356872558594, "global_step": 96307, "epoch": 795} {"train_loss": -22.4864444732666, "global_step": 96308, "epoch": 795} {"train_loss": -36.419898986816406, "global_step": 96309, "epoch": 795} {"train_loss": -22.924306869506836, "global_step": 96310, "epoch": 795} {"train_loss": -36.103878021240234, "global_step": 96311, "epoch": 795} {"train_loss": -29.127277374267578, "global_step": 96312, "epoch": 795} {"train_loss": -35.580596923828125, "global_step": 96313, "epoch": 795} {"train_loss": -30.094043731689453, "global_step": 96314, "epoch": 795} {"train_loss": -36.34521106057916, "global_step": 96315, "epoch": 795, "val_loss": 2659693.75} {"train_loss": -31.343271255493164, "global_step": 96316, "epoch": 796} {"train_loss": -35.72353744506836, "global_step": 96317, "epoch": 796} {"train_loss": -34.9731330871582, "global_step": 96318, "epoch": 796} {"train_loss": -33.45585250854492, "global_step": 96319, "epoch": 796} {"train_loss": -36.53158187866211, "global_step": 96320, "epoch": 796} {"train_loss": -35.88208770751953, "global_step": 96321, "epoch": 796} {"train_loss": -34.7196159362793, "global_step": 96322, "epoch": 796} {"train_loss": -36.850990295410156, "global_step": 96323, "epoch": 796} {"train_loss": -35.79166793823242, "global_step": 96324, "epoch": 796} {"train_loss": -35.051902770996094, "global_step": 96325, "epoch": 796} {"train_loss": -36.12043380737305, "global_step": 96326, "epoch": 796} {"train_loss": -36.62663269042969, "global_step": 96327, "epoch": 796} {"train_loss": -36.880367279052734, "global_step": 96328, "epoch": 796} {"train_loss": -36.75397872924805, "global_step": 96329, "epoch": 796} {"train_loss": -34.53899002075195, "global_step": 96330, "epoch": 796} {"train_loss": -36.56623077392578, "global_step": 96331, "epoch": 796} {"train_loss": -36.89458084106445, "global_step": 96332, "epoch": 796} {"train_loss": -37.1635627746582, "global_step": 96333, "epoch": 796} {"train_loss": -37.35493087768555, "global_step": 96334, "epoch": 796} {"train_loss": -37.21149826049805, "global_step": 96335, "epoch": 796} {"train_loss": -37.13096237182617, "global_step": 96336, "epoch": 796} {"train_loss": -37.56111526489258, "global_step": 96337, "epoch": 796} {"train_loss": -37.34627914428711, "global_step": 96338, "epoch": 796} {"train_loss": -36.651588439941406, "global_step": 96339, "epoch": 796} {"train_loss": -36.693538665771484, "global_step": 96340, "epoch": 796} {"train_loss": -37.286834716796875, "global_step": 96341, "epoch": 796} {"train_loss": -37.80939483642578, "global_step": 96342, "epoch": 796} {"train_loss": -37.069759368896484, "global_step": 96343, "epoch": 796} {"train_loss": -38.02494430541992, "global_step": 96344, "epoch": 796} {"train_loss": -38.06321334838867, "global_step": 96345, "epoch": 796} {"train_loss": -37.83970642089844, "global_step": 96346, "epoch": 796} {"train_loss": -37.085994720458984, "global_step": 96347, "epoch": 796} {"train_loss": -37.51701354980469, "global_step": 96348, "epoch": 796} {"train_loss": -35.160186767578125, "global_step": 96349, "epoch": 796} {"train_loss": -37.958404541015625, "global_step": 96350, "epoch": 796} {"train_loss": -38.16259765625, "global_step": 96351, "epoch": 796} {"train_loss": -38.39274978637695, "global_step": 96352, "epoch": 796} {"train_loss": -37.34212875366211, "global_step": 96353, "epoch": 796} {"train_loss": -38.43778610229492, "global_step": 96354, "epoch": 796} {"train_loss": -37.82851791381836, "global_step": 96355, "epoch": 796} {"train_loss": -37.85626983642578, "global_step": 96356, "epoch": 796} {"train_loss": -37.860084533691406, "global_step": 96357, "epoch": 796} {"train_loss": -38.44035720825195, "global_step": 96358, "epoch": 796} {"train_loss": -37.62346267700195, "global_step": 96359, "epoch": 796} {"train_loss": -37.63561248779297, "global_step": 96360, "epoch": 796} {"train_loss": -38.083187103271484, "global_step": 96361, "epoch": 796} {"train_loss": -36.13126754760742, "global_step": 96362, "epoch": 796} {"train_loss": -38.38821029663086, "global_step": 96363, "epoch": 796} {"train_loss": -37.536434173583984, "global_step": 96364, "epoch": 796} {"train_loss": -38.39740753173828, "global_step": 96365, "epoch": 796} {"train_loss": -38.633663177490234, "global_step": 96366, "epoch": 796} {"train_loss": -38.3919563293457, "global_step": 96367, "epoch": 796} {"train_loss": -38.360504150390625, "global_step": 96368, "epoch": 796} {"train_loss": -37.36366653442383, "global_step": 96369, "epoch": 796} {"train_loss": -38.427032470703125, "global_step": 96370, "epoch": 796} {"train_loss": -38.277801513671875, "global_step": 96371, "epoch": 796} {"train_loss": -38.67792892456055, "global_step": 96372, "epoch": 796} {"train_loss": -38.527801513671875, "global_step": 96373, "epoch": 796} {"train_loss": -38.8166618347168, "global_step": 96374, "epoch": 796} {"train_loss": -38.0228271484375, "global_step": 96375, "epoch": 796} {"train_loss": -39.06525421142578, "global_step": 96376, "epoch": 796} {"train_loss": -33.15863800048828, "global_step": 96377, "epoch": 796} {"train_loss": -38.077911376953125, "global_step": 96378, "epoch": 796} {"train_loss": -38.1479377746582, "global_step": 96379, "epoch": 796} {"train_loss": -38.477325439453125, "global_step": 96380, "epoch": 796} {"train_loss": -38.43269729614258, "global_step": 96381, "epoch": 796} {"train_loss": -38.7152099609375, "global_step": 96382, "epoch": 796} {"train_loss": -38.34255599975586, "global_step": 96383, "epoch": 796} {"train_loss": -37.88361358642578, "global_step": 96384, "epoch": 796} {"train_loss": -38.212013244628906, "global_step": 96385, "epoch": 796} {"train_loss": -37.51424789428711, "global_step": 96386, "epoch": 796} {"train_loss": -38.48408126831055, "global_step": 96387, "epoch": 796} {"train_loss": -38.258872985839844, "global_step": 96388, "epoch": 796} {"train_loss": -38.356109619140625, "global_step": 96389, "epoch": 796} {"train_loss": -38.36918258666992, "global_step": 96390, "epoch": 796} {"train_loss": -36.24906539916992, "global_step": 96391, "epoch": 796} {"train_loss": -38.39423751831055, "global_step": 96392, "epoch": 796} {"train_loss": -38.543060302734375, "global_step": 96393, "epoch": 796} {"train_loss": -37.05728530883789, "global_step": 96394, "epoch": 796} {"train_loss": -38.47504425048828, "global_step": 96395, "epoch": 796} {"train_loss": -38.281715393066406, "global_step": 96396, "epoch": 796} {"train_loss": -38.17387008666992, "global_step": 96397, "epoch": 796} {"train_loss": -37.4966926574707, "global_step": 96398, "epoch": 796} {"train_loss": -37.312862396240234, "global_step": 96399, "epoch": 796} {"train_loss": -37.29571533203125, "global_step": 96400, "epoch": 796} {"train_loss": -36.65971755981445, "global_step": 96401, "epoch": 796} {"train_loss": -35.79030227661133, "global_step": 96402, "epoch": 796} {"train_loss": -33.750057220458984, "global_step": 96403, "epoch": 796} {"train_loss": -27.04779052734375, "global_step": 96404, "epoch": 796} {"train_loss": -26.76480484008789, "global_step": 96405, "epoch": 796} {"train_loss": -30.926349639892578, "global_step": 96406, "epoch": 796} {"train_loss": -36.78591537475586, "global_step": 96407, "epoch": 796} {"train_loss": -31.792673110961914, "global_step": 96408, "epoch": 796} {"train_loss": -33.74677658081055, "global_step": 96409, "epoch": 796} {"train_loss": -36.019325256347656, "global_step": 96410, "epoch": 796} {"train_loss": -35.07706832885742, "global_step": 96411, "epoch": 796} {"train_loss": -36.627655029296875, "global_step": 96412, "epoch": 796} {"train_loss": -35.94214630126953, "global_step": 96413, "epoch": 796} {"train_loss": -37.6078987121582, "global_step": 96414, "epoch": 796} {"train_loss": -36.64701843261719, "global_step": 96415, "epoch": 796} {"train_loss": -37.332191467285156, "global_step": 96416, "epoch": 796} {"train_loss": -36.929927825927734, "global_step": 96417, "epoch": 796} {"train_loss": -37.04560089111328, "global_step": 96418, "epoch": 796} {"train_loss": -36.803932189941406, "global_step": 96419, "epoch": 796} {"train_loss": -36.45619583129883, "global_step": 96420, "epoch": 796} {"train_loss": -37.306983947753906, "global_step": 96421, "epoch": 796} {"train_loss": -37.65359115600586, "global_step": 96422, "epoch": 796} {"train_loss": -36.80963134765625, "global_step": 96423, "epoch": 796} {"train_loss": -36.684303283691406, "global_step": 96424, "epoch": 796} {"train_loss": -37.26088333129883, "global_step": 96425, "epoch": 796} {"train_loss": -36.60319519042969, "global_step": 96426, "epoch": 796} {"train_loss": -36.421199798583984, "global_step": 96427, "epoch": 796} {"train_loss": -37.72907257080078, "global_step": 96428, "epoch": 796} {"train_loss": -36.956398010253906, "global_step": 96429, "epoch": 796} {"train_loss": -37.3538818359375, "global_step": 96430, "epoch": 796} {"train_loss": -36.812286376953125, "global_step": 96431, "epoch": 796} {"train_loss": -37.7502326965332, "global_step": 96432, "epoch": 796} {"train_loss": -37.303375244140625, "global_step": 96433, "epoch": 796} {"train_loss": -37.7330436706543, "global_step": 96434, "epoch": 796} {"train_loss": -37.98431396484375, "global_step": 96435, "epoch": 796} {"train_loss": -36.905745009745445, "global_step": 96436, "epoch": 796, "val_loss": 2634675.25} {"train_loss": -38.15626907348633, "global_step": 96437, "epoch": 797} {"train_loss": -37.84624099731445, "global_step": 96438, "epoch": 797} {"train_loss": -38.007171630859375, "global_step": 96439, "epoch": 797} {"train_loss": -38.069908142089844, "global_step": 96440, "epoch": 797} {"train_loss": -38.51639938354492, "global_step": 96441, "epoch": 797} {"train_loss": -37.89884567260742, "global_step": 96442, "epoch": 797} {"train_loss": -38.61336898803711, "global_step": 96443, "epoch": 797} {"train_loss": -37.60956954956055, "global_step": 96444, "epoch": 797} {"train_loss": -38.8157958984375, "global_step": 96445, "epoch": 797} {"train_loss": -37.801910400390625, "global_step": 96446, "epoch": 797} {"train_loss": -37.583003997802734, "global_step": 96447, "epoch": 797} {"train_loss": -38.21390914916992, "global_step": 96448, "epoch": 797} {"train_loss": -38.4271125793457, "global_step": 96449, "epoch": 797} {"train_loss": -38.616451263427734, "global_step": 96450, "epoch": 797} {"train_loss": -38.50571823120117, "global_step": 96451, "epoch": 797} {"train_loss": -38.20590591430664, "global_step": 96452, "epoch": 797} {"train_loss": -38.14097595214844, "global_step": 96453, "epoch": 797} {"train_loss": -38.48322677612305, "global_step": 96454, "epoch": 797} {"train_loss": -38.28046417236328, "global_step": 96455, "epoch": 797} {"train_loss": -38.2098503112793, "global_step": 96456, "epoch": 797} {"train_loss": -38.44218444824219, "global_step": 96457, "epoch": 797} {"train_loss": -38.600032806396484, "global_step": 96458, "epoch": 797} {"train_loss": -38.27537155151367, "global_step": 96459, "epoch": 797} {"train_loss": -38.580116271972656, "global_step": 96460, "epoch": 797} {"train_loss": -38.27652359008789, "global_step": 96461, "epoch": 797} {"train_loss": -38.14508819580078, "global_step": 96462, "epoch": 797} {"train_loss": -38.453369140625, "global_step": 96463, "epoch": 797} {"train_loss": -38.54874801635742, "global_step": 96464, "epoch": 797} {"train_loss": -38.72064971923828, "global_step": 96465, "epoch": 797} {"train_loss": -38.448631286621094, "global_step": 96466, "epoch": 797} {"train_loss": -38.96416473388672, "global_step": 96467, "epoch": 797} {"train_loss": -37.92892074584961, "global_step": 96468, "epoch": 797} {"train_loss": -38.42597198486328, "global_step": 96469, "epoch": 797} {"train_loss": -38.03353500366211, "global_step": 96470, "epoch": 797} {"train_loss": -38.38051223754883, "global_step": 96471, "epoch": 797} {"train_loss": -38.0274772644043, "global_step": 96472, "epoch": 797} {"train_loss": -39.095733642578125, "global_step": 96473, "epoch": 797} {"train_loss": -37.368858337402344, "global_step": 96474, "epoch": 797} {"train_loss": -37.80414962768555, "global_step": 96475, "epoch": 797} {"train_loss": -38.46917724609375, "global_step": 96476, "epoch": 797} {"train_loss": -38.31867218017578, "global_step": 96477, "epoch": 797} {"train_loss": -38.6728401184082, "global_step": 96478, "epoch": 797} {"train_loss": -38.15822982788086, "global_step": 96479, "epoch": 797} {"train_loss": -36.4775390625, "global_step": 96480, "epoch": 797} {"train_loss": -33.70639419555664, "global_step": 96481, "epoch": 797} {"train_loss": -29.67596435546875, "global_step": 96482, "epoch": 797} {"train_loss": -34.440948486328125, "global_step": 96483, "epoch": 797} {"train_loss": -33.317771911621094, "global_step": 96484, "epoch": 797} {"train_loss": -34.18819808959961, "global_step": 96485, "epoch": 797} {"train_loss": -32.5842170715332, "global_step": 96486, "epoch": 797} {"train_loss": -33.76776885986328, "global_step": 96487, "epoch": 797} {"train_loss": -34.97709274291992, "global_step": 96488, "epoch": 797} {"train_loss": -35.632057189941406, "global_step": 96489, "epoch": 797} {"train_loss": -35.85462188720703, "global_step": 96490, "epoch": 797} {"train_loss": -35.85806655883789, "global_step": 96491, "epoch": 797} {"train_loss": -37.95137405395508, "global_step": 96492, "epoch": 797} {"train_loss": -36.4805793762207, "global_step": 96493, "epoch": 797} {"train_loss": -36.38508605957031, "global_step": 96494, "epoch": 797} {"train_loss": -37.810874938964844, "global_step": 96495, "epoch": 797} {"train_loss": -36.977386474609375, "global_step": 96496, "epoch": 797} {"train_loss": -37.19966506958008, "global_step": 96497, "epoch": 797} {"train_loss": -38.15352249145508, "global_step": 96498, "epoch": 797} {"train_loss": -36.740325927734375, "global_step": 96499, "epoch": 797} {"train_loss": -37.505550384521484, "global_step": 96500, "epoch": 797} {"train_loss": -38.03571701049805, "global_step": 96501, "epoch": 797} {"train_loss": -38.0052375793457, "global_step": 96502, "epoch": 797} {"train_loss": -38.07179641723633, "global_step": 96503, "epoch": 797} {"train_loss": -37.8005485534668, "global_step": 96504, "epoch": 797} {"train_loss": -38.55170440673828, "global_step": 96505, "epoch": 797} {"train_loss": -38.24000549316406, "global_step": 96506, "epoch": 797} {"train_loss": -37.779083251953125, "global_step": 96507, "epoch": 797} {"train_loss": -38.13434982299805, "global_step": 96508, "epoch": 797} {"train_loss": -38.05255889892578, "global_step": 96509, "epoch": 797} {"train_loss": -38.330535888671875, "global_step": 96510, "epoch": 797} {"train_loss": -37.87772750854492, "global_step": 96511, "epoch": 797} {"train_loss": -38.319976806640625, "global_step": 96512, "epoch": 797} {"train_loss": -38.1336784362793, "global_step": 96513, "epoch": 797} {"train_loss": -38.3901252746582, "global_step": 96514, "epoch": 797} {"train_loss": -38.53337478637695, "global_step": 96515, "epoch": 797} {"train_loss": -38.43839645385742, "global_step": 96516, "epoch": 797} {"train_loss": -38.10837936401367, "global_step": 96517, "epoch": 797} {"train_loss": -37.88541030883789, "global_step": 96518, "epoch": 797} {"train_loss": -38.7703742980957, "global_step": 96519, "epoch": 797} {"train_loss": -38.70778274536133, "global_step": 96520, "epoch": 797} {"train_loss": -38.137935638427734, "global_step": 96521, "epoch": 797} {"train_loss": -38.18351364135742, "global_step": 96522, "epoch": 797} {"train_loss": -38.250484466552734, "global_step": 96523, "epoch": 797} {"train_loss": -38.803245544433594, "global_step": 96524, "epoch": 797} {"train_loss": -38.77901077270508, "global_step": 96525, "epoch": 797} {"train_loss": -38.595176696777344, "global_step": 96526, "epoch": 797} {"train_loss": -38.88607406616211, "global_step": 96527, "epoch": 797} {"train_loss": -38.5670280456543, "global_step": 96528, "epoch": 797} {"train_loss": -39.02425003051758, "global_step": 96529, "epoch": 797} {"train_loss": -38.84815979003906, "global_step": 96530, "epoch": 797} {"train_loss": -38.0993766784668, "global_step": 96531, "epoch": 797} {"train_loss": -39.24641036987305, "global_step": 96532, "epoch": 797} {"train_loss": -39.12184143066406, "global_step": 96533, "epoch": 797} {"train_loss": -38.954463958740234, "global_step": 96534, "epoch": 797} {"train_loss": -39.23067855834961, "global_step": 96535, "epoch": 797} {"train_loss": -39.018798828125, "global_step": 96536, "epoch": 797} {"train_loss": -39.16158676147461, "global_step": 96537, "epoch": 797} {"train_loss": -39.14406967163086, "global_step": 96538, "epoch": 797} {"train_loss": -39.270999908447266, "global_step": 96539, "epoch": 797} {"train_loss": -39.0828971862793, "global_step": 96540, "epoch": 797} {"train_loss": -39.440364837646484, "global_step": 96541, "epoch": 797} {"train_loss": -38.40340805053711, "global_step": 96542, "epoch": 797} {"train_loss": -37.86721420288086, "global_step": 96543, "epoch": 797} {"train_loss": -38.601112365722656, "global_step": 96544, "epoch": 797} {"train_loss": -38.2167854309082, "global_step": 96545, "epoch": 797} {"train_loss": -39.11300277709961, "global_step": 96546, "epoch": 797} {"train_loss": -38.45649337768555, "global_step": 96547, "epoch": 797} {"train_loss": -38.64921951293945, "global_step": 96548, "epoch": 797} {"train_loss": -38.52570724487305, "global_step": 96549, "epoch": 797} {"train_loss": -38.62117004394531, "global_step": 96550, "epoch": 797} {"train_loss": -38.30491256713867, "global_step": 96551, "epoch": 797} {"train_loss": -38.62083053588867, "global_step": 96552, "epoch": 797} {"train_loss": -38.429718017578125, "global_step": 96553, "epoch": 797} {"train_loss": -38.57805633544922, "global_step": 96554, "epoch": 797} {"train_loss": -38.68514633178711, "global_step": 96555, "epoch": 797} {"train_loss": -38.981258392333984, "global_step": 96556, "epoch": 797} {"train_loss": -37.92707279299901, "global_step": 96557, "epoch": 797, "val_loss": 2627550.0} {"train_loss": -38.68471908569336, "global_step": 96558, "epoch": 798} {"train_loss": -39.07489776611328, "global_step": 96559, "epoch": 798} {"train_loss": -38.861812591552734, "global_step": 96560, "epoch": 798} {"train_loss": -39.05332946777344, "global_step": 96561, "epoch": 798} {"train_loss": -39.022987365722656, "global_step": 96562, "epoch": 798} {"train_loss": -39.23810577392578, "global_step": 96563, "epoch": 798} {"train_loss": -38.56283950805664, "global_step": 96564, "epoch": 798} {"train_loss": -37.899208068847656, "global_step": 96565, "epoch": 798} {"train_loss": -38.2110481262207, "global_step": 96566, "epoch": 798} {"train_loss": -39.15961837768555, "global_step": 96567, "epoch": 798} {"train_loss": -38.72194290161133, "global_step": 96568, "epoch": 798} {"train_loss": -38.686431884765625, "global_step": 96569, "epoch": 798} {"train_loss": -38.33082962036133, "global_step": 96570, "epoch": 798} {"train_loss": -37.86199951171875, "global_step": 96571, "epoch": 798} {"train_loss": -38.192962646484375, "global_step": 96572, "epoch": 798} {"train_loss": -38.719783782958984, "global_step": 96573, "epoch": 798} {"train_loss": -36.374305725097656, "global_step": 96574, "epoch": 798} {"train_loss": -34.002113342285156, "global_step": 96575, "epoch": 798} {"train_loss": -32.16801834106445, "global_step": 96576, "epoch": 798} {"train_loss": -34.77751922607422, "global_step": 96577, "epoch": 798} {"train_loss": -34.140045166015625, "global_step": 96578, "epoch": 798} {"train_loss": -34.22959518432617, "global_step": 96579, "epoch": 798} {"train_loss": -34.99485397338867, "global_step": 96580, "epoch": 798} {"train_loss": -32.442848205566406, "global_step": 96581, "epoch": 798} {"train_loss": -37.163909912109375, "global_step": 96582, "epoch": 798} {"train_loss": -36.24310302734375, "global_step": 96583, "epoch": 798} {"train_loss": -31.43684959411621, "global_step": 96584, "epoch": 798} {"train_loss": -33.321136474609375, "global_step": 96585, "epoch": 798} {"train_loss": -37.23610305786133, "global_step": 96586, "epoch": 798} {"train_loss": -34.56889724731445, "global_step": 96587, "epoch": 798} {"train_loss": -32.50529098510742, "global_step": 96588, "epoch": 798} {"train_loss": -37.08742904663086, "global_step": 96589, "epoch": 798} {"train_loss": -36.01780319213867, "global_step": 96590, "epoch": 798} {"train_loss": -36.32631301879883, "global_step": 96591, "epoch": 798} {"train_loss": -37.31275939941406, "global_step": 96592, "epoch": 798} {"train_loss": -36.54738998413086, "global_step": 96593, "epoch": 798} {"train_loss": -37.48154830932617, "global_step": 96594, "epoch": 798} {"train_loss": -36.583106994628906, "global_step": 96595, "epoch": 798} {"train_loss": -37.52473831176758, "global_step": 96596, "epoch": 798} {"train_loss": -36.688297271728516, "global_step": 96597, "epoch": 798} {"train_loss": -36.497135162353516, "global_step": 96598, "epoch": 798} {"train_loss": -37.915313720703125, "global_step": 96599, "epoch": 798} {"train_loss": -36.75788497924805, "global_step": 96600, "epoch": 798} {"train_loss": -36.62827682495117, "global_step": 96601, "epoch": 798} {"train_loss": -36.51715087890625, "global_step": 96602, "epoch": 798} {"train_loss": -37.72853088378906, "global_step": 96603, "epoch": 798} {"train_loss": -37.348777770996094, "global_step": 96604, "epoch": 798} {"train_loss": -37.21181106567383, "global_step": 96605, "epoch": 798} {"train_loss": -37.40387725830078, "global_step": 96606, "epoch": 798} {"train_loss": -37.6423454284668, "global_step": 96607, "epoch": 798} {"train_loss": -37.896942138671875, "global_step": 96608, "epoch": 798} {"train_loss": -36.74156188964844, "global_step": 96609, "epoch": 798} {"train_loss": -37.944190979003906, "global_step": 96610, "epoch": 798} {"train_loss": -36.99272537231445, "global_step": 96611, "epoch": 798} {"train_loss": -38.2010612487793, "global_step": 96612, "epoch": 798} {"train_loss": -38.03693771362305, "global_step": 96613, "epoch": 798} {"train_loss": -38.327850341796875, "global_step": 96614, "epoch": 798} {"train_loss": -37.660675048828125, "global_step": 96615, "epoch": 798} {"train_loss": -37.22308349609375, "global_step": 96616, "epoch": 798} {"train_loss": -38.167335510253906, "global_step": 96617, "epoch": 798} {"train_loss": -38.40639114379883, "global_step": 96618, "epoch": 798} {"train_loss": -37.799049377441406, "global_step": 96619, "epoch": 798} {"train_loss": -38.319210052490234, "global_step": 96620, "epoch": 798} {"train_loss": -37.859771728515625, "global_step": 96621, "epoch": 798} {"train_loss": -37.61265182495117, "global_step": 96622, "epoch": 798} {"train_loss": -37.54572296142578, "global_step": 96623, "epoch": 798} {"train_loss": -35.67498779296875, "global_step": 96624, "epoch": 798} {"train_loss": -36.76812744140625, "global_step": 96625, "epoch": 798} {"train_loss": -37.57273483276367, "global_step": 96626, "epoch": 798} {"train_loss": -38.63896560668945, "global_step": 96627, "epoch": 798} {"train_loss": -35.711978912353516, "global_step": 96628, "epoch": 798} {"train_loss": -37.57319259643555, "global_step": 96629, "epoch": 798} {"train_loss": -37.978729248046875, "global_step": 96630, "epoch": 798} {"train_loss": -37.5852165222168, "global_step": 96631, "epoch": 798} {"train_loss": -37.93018341064453, "global_step": 96632, "epoch": 798} {"train_loss": -36.59815979003906, "global_step": 96633, "epoch": 798} {"train_loss": -35.785484313964844, "global_step": 96634, "epoch": 798} {"train_loss": -34.244911193847656, "global_step": 96635, "epoch": 798} {"train_loss": -33.375648498535156, "global_step": 96636, "epoch": 798} {"train_loss": -37.08469772338867, "global_step": 96637, "epoch": 798} {"train_loss": -35.874595642089844, "global_step": 96638, "epoch": 798} {"train_loss": -31.349197387695312, "global_step": 96639, "epoch": 798} {"train_loss": -35.0650520324707, "global_step": 96640, "epoch": 798} {"train_loss": -28.665979385375977, "global_step": 96641, "epoch": 798} {"train_loss": -36.3358039855957, "global_step": 96642, "epoch": 798} {"train_loss": -29.987995147705078, "global_step": 96643, "epoch": 798} {"train_loss": -30.614124298095703, "global_step": 96644, "epoch": 798} {"train_loss": -28.407846450805664, "global_step": 96645, "epoch": 798} {"train_loss": -31.57867431640625, "global_step": 96646, "epoch": 798} {"train_loss": -34.30611038208008, "global_step": 96647, "epoch": 798} {"train_loss": -33.610076904296875, "global_step": 96648, "epoch": 798} {"train_loss": -34.42269515991211, "global_step": 96649, "epoch": 798} {"train_loss": -33.37886428833008, "global_step": 96650, "epoch": 798} {"train_loss": -33.84629440307617, "global_step": 96651, "epoch": 798} {"train_loss": -33.89124298095703, "global_step": 96652, "epoch": 798} {"train_loss": -33.07014083862305, "global_step": 96653, "epoch": 798} {"train_loss": -35.07845687866211, "global_step": 96654, "epoch": 798} {"train_loss": -32.4767951965332, "global_step": 96655, "epoch": 798} {"train_loss": -35.45085525512695, "global_step": 96656, "epoch": 798} {"train_loss": -33.93988037109375, "global_step": 96657, "epoch": 798} {"train_loss": -34.114410400390625, "global_step": 96658, "epoch": 798} {"train_loss": -34.94468307495117, "global_step": 96659, "epoch": 798} {"train_loss": -35.01960372924805, "global_step": 96660, "epoch": 798} {"train_loss": -33.524349212646484, "global_step": 96661, "epoch": 798} {"train_loss": -36.11233139038086, "global_step": 96662, "epoch": 798} {"train_loss": -34.53884506225586, "global_step": 96663, "epoch": 798} {"train_loss": -35.68572998046875, "global_step": 96664, "epoch": 798} {"train_loss": -36.52739715576172, "global_step": 96665, "epoch": 798} {"train_loss": -35.707088470458984, "global_step": 96666, "epoch": 798} {"train_loss": -35.72673034667969, "global_step": 96667, "epoch": 798} {"train_loss": -35.86328125, "global_step": 96668, "epoch": 798} {"train_loss": -35.66183090209961, "global_step": 96669, "epoch": 798} {"train_loss": -35.43201446533203, "global_step": 96670, "epoch": 798} {"train_loss": -35.261043548583984, "global_step": 96671, "epoch": 798} {"train_loss": -36.750335693359375, "global_step": 96672, "epoch": 798} {"train_loss": -36.373104095458984, "global_step": 96673, "epoch": 798} {"train_loss": -36.8459358215332, "global_step": 96674, "epoch": 798} {"train_loss": -35.989601135253906, "global_step": 96675, "epoch": 798} {"train_loss": -36.517913818359375, "global_step": 96676, "epoch": 798} {"train_loss": -35.44350814819336, "global_step": 96677, "epoch": 798} {"train_loss": -36.06785563003918, "global_step": 96678, "epoch": 798, "val_loss": 2681093.25} {"train_loss": -36.70200729370117, "global_step": 96679, "epoch": 799} {"train_loss": -36.14461135864258, "global_step": 96680, "epoch": 799} {"train_loss": -35.99293899536133, "global_step": 96681, "epoch": 799} {"train_loss": -36.51107406616211, "global_step": 96682, "epoch": 799} {"train_loss": -36.62778854370117, "global_step": 96683, "epoch": 799} {"train_loss": -36.962493896484375, "global_step": 96684, "epoch": 799} {"train_loss": -35.77322006225586, "global_step": 96685, "epoch": 799} {"train_loss": -36.3564567565918, "global_step": 96686, "epoch": 799} {"train_loss": -37.55778884887695, "global_step": 96687, "epoch": 799} {"train_loss": -37.188541412353516, "global_step": 96688, "epoch": 799} {"train_loss": -36.353694915771484, "global_step": 96689, "epoch": 799} {"train_loss": -36.544776916503906, "global_step": 96690, "epoch": 799} {"train_loss": -37.142757415771484, "global_step": 96691, "epoch": 799} {"train_loss": -37.3266716003418, "global_step": 96692, "epoch": 799} {"train_loss": -37.8138313293457, "global_step": 96693, "epoch": 799} {"train_loss": -37.30970001220703, "global_step": 96694, "epoch": 799} {"train_loss": -36.99638366699219, "global_step": 96695, "epoch": 799} {"train_loss": -37.56150436401367, "global_step": 96696, "epoch": 799} {"train_loss": -37.59282302856445, "global_step": 96697, "epoch": 799} {"train_loss": -37.15183639526367, "global_step": 96698, "epoch": 799} {"train_loss": -37.5556755065918, "global_step": 96699, "epoch": 799} {"train_loss": -37.42101287841797, "global_step": 96700, "epoch": 799} {"train_loss": -37.13817596435547, "global_step": 96701, "epoch": 799} {"train_loss": -37.668739318847656, "global_step": 96702, "epoch": 799} {"train_loss": -37.23601150512695, "global_step": 96703, "epoch": 799} {"train_loss": -37.76249313354492, "global_step": 96704, "epoch": 799} {"train_loss": -37.9970588684082, "global_step": 96705, "epoch": 799} {"train_loss": -37.59531021118164, "global_step": 96706, "epoch": 799} {"train_loss": -37.948272705078125, "global_step": 96707, "epoch": 799} {"train_loss": -37.39639663696289, "global_step": 96708, "epoch": 799} {"train_loss": -38.3240966796875, "global_step": 96709, "epoch": 799} {"train_loss": -37.89545440673828, "global_step": 96710, "epoch": 799} {"train_loss": -38.401336669921875, "global_step": 96711, "epoch": 799} {"train_loss": -38.25100326538086, "global_step": 96712, "epoch": 799} {"train_loss": -37.766048431396484, "global_step": 96713, "epoch": 799} {"train_loss": -37.9898567199707, "global_step": 96714, "epoch": 799} {"train_loss": -38.12411117553711, "global_step": 96715, "epoch": 799} {"train_loss": -37.79546356201172, "global_step": 96716, "epoch": 799} {"train_loss": -38.47174835205078, "global_step": 96717, "epoch": 799} {"train_loss": -37.71932601928711, "global_step": 96718, "epoch": 799} {"train_loss": -37.913238525390625, "global_step": 96719, "epoch": 799} {"train_loss": -38.028076171875, "global_step": 96720, "epoch": 799} {"train_loss": -38.331947326660156, "global_step": 96721, "epoch": 799} {"train_loss": -38.094112396240234, "global_step": 96722, "epoch": 799} {"train_loss": -37.95748519897461, "global_step": 96723, "epoch": 799} {"train_loss": -38.75988006591797, "global_step": 96724, "epoch": 799} {"train_loss": -38.5582389831543, "global_step": 96725, "epoch": 799} {"train_loss": -38.360530853271484, "global_step": 96726, "epoch": 799} {"train_loss": -38.295509338378906, "global_step": 96727, "epoch": 799} {"train_loss": -38.92293930053711, "global_step": 96728, "epoch": 799} {"train_loss": -38.02437973022461, "global_step": 96729, "epoch": 799} {"train_loss": -38.7501335144043, "global_step": 96730, "epoch": 799} {"train_loss": -38.54172897338867, "global_step": 96731, "epoch": 799} {"train_loss": -38.66609191894531, "global_step": 96732, "epoch": 799} {"train_loss": -38.7686653137207, "global_step": 96733, "epoch": 799} {"train_loss": -38.298439025878906, "global_step": 96734, "epoch": 799} {"train_loss": -38.327552795410156, "global_step": 96735, "epoch": 799} {"train_loss": -38.0131721496582, "global_step": 96736, "epoch": 799} {"train_loss": -38.500823974609375, "global_step": 96737, "epoch": 799} {"train_loss": -38.96211624145508, "global_step": 96738, "epoch": 799} {"train_loss": -38.722007751464844, "global_step": 96739, "epoch": 799} {"train_loss": -39.063926696777344, "global_step": 96740, "epoch": 799} {"train_loss": -39.14738082885742, "global_step": 96741, "epoch": 799} {"train_loss": -38.539485931396484, "global_step": 96742, "epoch": 799} {"train_loss": -39.0500373840332, "global_step": 96743, "epoch": 799} {"train_loss": -39.30523681640625, "global_step": 96744, "epoch": 799} {"train_loss": -39.29354476928711, "global_step": 96745, "epoch": 799} {"train_loss": -39.1185417175293, "global_step": 96746, "epoch": 799} {"train_loss": -38.978878021240234, "global_step": 96747, "epoch": 799} {"train_loss": -38.725589752197266, "global_step": 96748, "epoch": 799} {"train_loss": -38.1489143371582, "global_step": 96749, "epoch": 799} {"train_loss": -39.28248977661133, "global_step": 96750, "epoch": 799} {"train_loss": -38.960079193115234, "global_step": 96751, "epoch": 799} {"train_loss": -38.1083984375, "global_step": 96752, "epoch": 799} {"train_loss": -38.92927169799805, "global_step": 96753, "epoch": 799} {"train_loss": -38.96664810180664, "global_step": 96754, "epoch": 799} {"train_loss": -38.65841293334961, "global_step": 96755, "epoch": 799} {"train_loss": -39.10508728027344, "global_step": 96756, "epoch": 799} {"train_loss": -38.937435150146484, "global_step": 96757, "epoch": 799} {"train_loss": -38.787471771240234, "global_step": 96758, "epoch": 799} {"train_loss": -37.16191482543945, "global_step": 96759, "epoch": 799} {"train_loss": -31.8336124420166, "global_step": 96760, "epoch": 799} {"train_loss": -19.88237953186035, "global_step": 96761, "epoch": 799} {"train_loss": -4.207876205444336, "global_step": 96762, "epoch": 799} {"train_loss": -25.403451919555664, "global_step": 96763, "epoch": 799} {"train_loss": -31.679182052612305, "global_step": 96764, "epoch": 799} {"train_loss": -0.4109003245830536, "global_step": 96765, "epoch": 799} {"train_loss": -17.065982818603516, "global_step": 96766, "epoch": 799} {"train_loss": -18.8992919921875, "global_step": 96767, "epoch": 799} {"train_loss": -19.95133399963379, "global_step": 96768, "epoch": 799} {"train_loss": -18.948583602905273, "global_step": 96769, "epoch": 799} {"train_loss": -31.8128662109375, "global_step": 96770, "epoch": 799} {"train_loss": -22.01496696472168, "global_step": 96771, "epoch": 799} {"train_loss": -28.445215225219727, "global_step": 96772, "epoch": 799} {"train_loss": -34.485382080078125, "global_step": 96773, "epoch": 799} {"train_loss": -28.683032989501953, "global_step": 96774, "epoch": 799} {"train_loss": -31.004819869995117, "global_step": 96775, "epoch": 799} {"train_loss": -36.0879020690918, "global_step": 96776, "epoch": 799} {"train_loss": -34.688114166259766, "global_step": 96777, "epoch": 799} {"train_loss": -31.954370498657227, "global_step": 96778, "epoch": 799} {"train_loss": -33.34437942504883, "global_step": 96779, "epoch": 799} {"train_loss": -36.42537307739258, "global_step": 96780, "epoch": 799} {"train_loss": -36.197383880615234, "global_step": 96781, "epoch": 799} {"train_loss": -34.692378997802734, "global_step": 96782, "epoch": 799} {"train_loss": -34.931785583496094, "global_step": 96783, "epoch": 799} {"train_loss": -35.758140563964844, "global_step": 96784, "epoch": 799} {"train_loss": -36.64956283569336, "global_step": 96785, "epoch": 799} {"train_loss": -36.46260452270508, "global_step": 96786, "epoch": 799} {"train_loss": -35.976051330566406, "global_step": 96787, "epoch": 799} {"train_loss": -35.061920166015625, "global_step": 96788, "epoch": 799} {"train_loss": -36.29875564575195, "global_step": 96789, "epoch": 799} {"train_loss": -36.81452178955078, "global_step": 96790, "epoch": 799} {"train_loss": -36.90877151489258, "global_step": 96791, "epoch": 799} {"train_loss": -36.58356857299805, "global_step": 96792, "epoch": 799} {"train_loss": -36.59116744995117, "global_step": 96793, "epoch": 799} {"train_loss": -36.745361328125, "global_step": 96794, "epoch": 799} {"train_loss": -36.658538818359375, "global_step": 96795, "epoch": 799} {"train_loss": -37.00653839111328, "global_step": 96796, "epoch": 799} {"train_loss": -37.443328857421875, "global_step": 96797, "epoch": 799} {"train_loss": -36.993526458740234, "global_step": 96798, "epoch": 799} {"train_loss": -35.57790739058463, "global_step": 96799, "epoch": 799, "val_loss": 2679142.75} {"train_loss": -37.23663330078125, "global_step": 96800, "epoch": 800} {"train_loss": -37.036842346191406, "global_step": 96801, "epoch": 800} {"train_loss": -37.08905029296875, "global_step": 96802, "epoch": 800} {"train_loss": -37.65332794189453, "global_step": 96803, "epoch": 800} {"train_loss": -37.55332565307617, "global_step": 96804, "epoch": 800} {"train_loss": -37.49935531616211, "global_step": 96805, "epoch": 800} {"train_loss": -37.34019088745117, "global_step": 96806, "epoch": 800} {"train_loss": -37.54453659057617, "global_step": 96807, "epoch": 800} {"train_loss": -37.453372955322266, "global_step": 96808, "epoch": 800} {"train_loss": -37.759193420410156, "global_step": 96809, "epoch": 800} {"train_loss": -37.698890686035156, "global_step": 96810, "epoch": 800} {"train_loss": -37.518558502197266, "global_step": 96811, "epoch": 800} {"train_loss": -37.73714065551758, "global_step": 96812, "epoch": 800} {"train_loss": -37.78314208984375, "global_step": 96813, "epoch": 800} {"train_loss": -37.93147659301758, "global_step": 96814, "epoch": 800} {"train_loss": -38.1700325012207, "global_step": 96815, "epoch": 800} {"train_loss": -38.282493591308594, "global_step": 96816, "epoch": 800} {"train_loss": -37.972625732421875, "global_step": 96817, "epoch": 800} {"train_loss": -38.09510040283203, "global_step": 96818, "epoch": 800} {"train_loss": -37.84721755981445, "global_step": 96819, "epoch": 800} {"train_loss": -38.25154495239258, "global_step": 96820, "epoch": 800} {"train_loss": -38.21936798095703, "global_step": 96821, "epoch": 800} {"train_loss": -38.17829132080078, "global_step": 96822, "epoch": 800} {"train_loss": -38.55532455444336, "global_step": 96823, "epoch": 800} {"train_loss": -38.48763656616211, "global_step": 96824, "epoch": 800} {"train_loss": -38.14765548706055, "global_step": 96825, "epoch": 800} {"train_loss": -37.069068908691406, "global_step": 96826, "epoch": 800} {"train_loss": -38.1427116394043, "global_step": 96827, "epoch": 800} {"train_loss": -38.3394889831543, "global_step": 96828, "epoch": 800} {"train_loss": -38.28323745727539, "global_step": 96829, "epoch": 800} {"train_loss": -37.893463134765625, "global_step": 96830, "epoch": 800} {"train_loss": -38.372230529785156, "global_step": 96831, "epoch": 800} {"train_loss": -38.55458450317383, "global_step": 96832, "epoch": 800} {"train_loss": -38.25518798828125, "global_step": 96833, "epoch": 800} {"train_loss": -38.74289321899414, "global_step": 96834, "epoch": 800} {"train_loss": -38.602657318115234, "global_step": 96835, "epoch": 800} {"train_loss": -38.397254943847656, "global_step": 96836, "epoch": 800} {"train_loss": -38.22895431518555, "global_step": 96837, "epoch": 800} {"train_loss": -38.70228958129883, "global_step": 96838, "epoch": 800} {"train_loss": -38.802696228027344, "global_step": 96839, "epoch": 800} {"train_loss": -38.852203369140625, "global_step": 96840, "epoch": 800} {"train_loss": -38.95679473876953, "global_step": 96841, "epoch": 800} {"train_loss": -38.66231155395508, "global_step": 96842, "epoch": 800} {"train_loss": -38.550987243652344, "global_step": 96843, "epoch": 800} {"train_loss": -38.52375411987305, "global_step": 96844, "epoch": 800} {"train_loss": -38.916622161865234, "global_step": 96845, "epoch": 800} {"train_loss": -38.81020736694336, "global_step": 96846, "epoch": 800} {"train_loss": -38.9207878112793, "global_step": 96847, "epoch": 800} {"train_loss": -38.56703186035156, "global_step": 96848, "epoch": 800} {"train_loss": -38.8685417175293, "global_step": 96849, "epoch": 800} {"train_loss": -39.111263275146484, "global_step": 96850, "epoch": 800} {"train_loss": -39.27262878417969, "global_step": 96851, "epoch": 800} {"train_loss": -39.1396484375, "global_step": 96852, "epoch": 800} {"train_loss": -38.75141143798828, "global_step": 96853, "epoch": 800} {"train_loss": -39.438323974609375, "global_step": 96854, "epoch": 800} {"train_loss": -38.933223724365234, "global_step": 96855, "epoch": 800} {"train_loss": -39.3625373840332, "global_step": 96856, "epoch": 800} {"train_loss": -39.07587432861328, "global_step": 96857, "epoch": 800} {"train_loss": -38.870948791503906, "global_step": 96858, "epoch": 800} {"train_loss": -38.839332580566406, "global_step": 96859, "epoch": 800} {"train_loss": -38.12300491333008, "global_step": 96860, "epoch": 800} {"train_loss": -35.82390594482422, "global_step": 96861, "epoch": 800} {"train_loss": -36.378936767578125, "global_step": 96862, "epoch": 800} {"train_loss": -33.806392669677734, "global_step": 96863, "epoch": 800} {"train_loss": -36.980159759521484, "global_step": 96864, "epoch": 800} {"train_loss": -37.75242233276367, "global_step": 96865, "epoch": 800} {"train_loss": -33.11382293701172, "global_step": 96866, "epoch": 800} {"train_loss": -34.96706008911133, "global_step": 96867, "epoch": 800} {"train_loss": -36.08640670776367, "global_step": 96868, "epoch": 800} {"train_loss": -30.90293312072754, "global_step": 96869, "epoch": 800} {"train_loss": -36.88885498046875, "global_step": 96870, "epoch": 800} {"train_loss": -36.39270782470703, "global_step": 96871, "epoch": 800} {"train_loss": -36.18024826049805, "global_step": 96872, "epoch": 800} {"train_loss": -36.41447067260742, "global_step": 96873, "epoch": 800} {"train_loss": -36.44947052001953, "global_step": 96874, "epoch": 800} {"train_loss": -33.09355545043945, "global_step": 96875, "epoch": 800} {"train_loss": -36.079158782958984, "global_step": 96876, "epoch": 800} {"train_loss": -32.941078186035156, "global_step": 96877, "epoch": 800} {"train_loss": -35.295570373535156, "global_step": 96878, "epoch": 800} {"train_loss": -35.67302322387695, "global_step": 96879, "epoch": 800} {"train_loss": -37.29499435424805, "global_step": 96880, "epoch": 800} {"train_loss": -35.946285247802734, "global_step": 96881, "epoch": 800} {"train_loss": -34.7894172668457, "global_step": 96882, "epoch": 800} {"train_loss": -37.69435501098633, "global_step": 96883, "epoch": 800} {"train_loss": -35.01630783081055, "global_step": 96884, "epoch": 800} {"train_loss": -35.396934509277344, "global_step": 96885, "epoch": 800} {"train_loss": -35.037879943847656, "global_step": 96886, "epoch": 800} {"train_loss": -35.81526565551758, "global_step": 96887, "epoch": 800} {"train_loss": -34.13440704345703, "global_step": 96888, "epoch": 800} {"train_loss": -35.49097442626953, "global_step": 96889, "epoch": 800} {"train_loss": -33.972530364990234, "global_step": 96890, "epoch": 800} {"train_loss": -34.89565658569336, "global_step": 96891, "epoch": 800} {"train_loss": -35.18152618408203, "global_step": 96892, "epoch": 800} {"train_loss": -36.68141555786133, "global_step": 96893, "epoch": 800} {"train_loss": -33.0588493347168, "global_step": 96894, "epoch": 800} {"train_loss": -36.73689270019531, "global_step": 96895, "epoch": 800} {"train_loss": -36.099822998046875, "global_step": 96896, "epoch": 800} {"train_loss": -35.6561393737793, "global_step": 96897, "epoch": 800} {"train_loss": -36.79861068725586, "global_step": 96898, "epoch": 800} {"train_loss": -35.56098175048828, "global_step": 96899, "epoch": 800} {"train_loss": -36.786529541015625, "global_step": 96900, "epoch": 800} {"train_loss": -36.240421295166016, "global_step": 96901, "epoch": 800} {"train_loss": -36.012298583984375, "global_step": 96902, "epoch": 800} {"train_loss": -36.086029052734375, "global_step": 96903, "epoch": 800} {"train_loss": -36.60438919067383, "global_step": 96904, "epoch": 800} {"train_loss": -37.51939010620117, "global_step": 96905, "epoch": 800} {"train_loss": -36.05112838745117, "global_step": 96906, "epoch": 800} {"train_loss": -37.18917465209961, "global_step": 96907, "epoch": 800} {"train_loss": -36.93589401245117, "global_step": 96908, "epoch": 800} {"train_loss": -37.5155143737793, "global_step": 96909, "epoch": 800} {"train_loss": -37.13654708862305, "global_step": 96910, "epoch": 800} {"train_loss": -37.24022674560547, "global_step": 96911, "epoch": 800} {"train_loss": -37.11259078979492, "global_step": 96912, "epoch": 800} {"train_loss": -37.53898239135742, "global_step": 96913, "epoch": 800} {"train_loss": -36.962646484375, "global_step": 96914, "epoch": 800} {"train_loss": -37.54368209838867, "global_step": 96915, "epoch": 800} {"train_loss": -37.542964935302734, "global_step": 96916, "epoch": 800} {"train_loss": -37.601078033447266, "global_step": 96917, "epoch": 800} {"train_loss": -37.963619232177734, "global_step": 96918, "epoch": 800} {"train_loss": -37.44969940185547, "global_step": 96919, "epoch": 800} {"train_loss": -37.16703832642106, "global_step": 96920, "epoch": 800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2772164.0} {"train_loss": -37.969024658203125, "global_step": 96921, "epoch": 801} {"train_loss": -37.57001876831055, "global_step": 96922, "epoch": 801} {"train_loss": -37.7470588684082, "global_step": 96923, "epoch": 801} {"train_loss": -37.757808685302734, "global_step": 96924, "epoch": 801} {"train_loss": -37.65359115600586, "global_step": 96925, "epoch": 801} {"train_loss": -36.92409133911133, "global_step": 96926, "epoch": 801} {"train_loss": -37.67070388793945, "global_step": 96927, "epoch": 801} {"train_loss": -38.26953125, "global_step": 96928, "epoch": 801} {"train_loss": -37.310951232910156, "global_step": 96929, "epoch": 801} {"train_loss": -38.113800048828125, "global_step": 96930, "epoch": 801} {"train_loss": -37.97280502319336, "global_step": 96931, "epoch": 801} {"train_loss": -38.1572265625, "global_step": 96932, "epoch": 801} {"train_loss": -37.73627471923828, "global_step": 96933, "epoch": 801} {"train_loss": -37.61041259765625, "global_step": 96934, "epoch": 801} {"train_loss": -38.22058868408203, "global_step": 96935, "epoch": 801} {"train_loss": -38.03516387939453, "global_step": 96936, "epoch": 801} {"train_loss": -38.161224365234375, "global_step": 96937, "epoch": 801} {"train_loss": -38.24294662475586, "global_step": 96938, "epoch": 801} {"train_loss": -38.0286865234375, "global_step": 96939, "epoch": 801} {"train_loss": -35.01750946044922, "global_step": 96940, "epoch": 801} {"train_loss": -38.394073486328125, "global_step": 96941, "epoch": 801} {"train_loss": -38.418853759765625, "global_step": 96942, "epoch": 801} {"train_loss": -38.47761154174805, "global_step": 96943, "epoch": 801} {"train_loss": -37.888763427734375, "global_step": 96944, "epoch": 801} {"train_loss": -38.63802719116211, "global_step": 96945, "epoch": 801} {"train_loss": -37.146846771240234, "global_step": 96946, "epoch": 801} {"train_loss": -38.390621185302734, "global_step": 96947, "epoch": 801} {"train_loss": -37.66818618774414, "global_step": 96948, "epoch": 801} {"train_loss": -38.46249008178711, "global_step": 96949, "epoch": 801} {"train_loss": -38.653316497802734, "global_step": 96950, "epoch": 801} {"train_loss": -37.63469314575195, "global_step": 96951, "epoch": 801} {"train_loss": -38.76748275756836, "global_step": 96952, "epoch": 801} {"train_loss": -38.21552658081055, "global_step": 96953, "epoch": 801} {"train_loss": -38.65077209472656, "global_step": 96954, "epoch": 801} {"train_loss": -37.06184005737305, "global_step": 96955, "epoch": 801} {"train_loss": -37.1832160949707, "global_step": 96956, "epoch": 801} {"train_loss": -37.69698715209961, "global_step": 96957, "epoch": 801} {"train_loss": -35.0859489440918, "global_step": 96958, "epoch": 801} {"train_loss": -37.045936584472656, "global_step": 96959, "epoch": 801} {"train_loss": -37.86330795288086, "global_step": 96960, "epoch": 801} {"train_loss": -37.308074951171875, "global_step": 96961, "epoch": 801} {"train_loss": -37.1291618347168, "global_step": 96962, "epoch": 801} {"train_loss": -35.646507263183594, "global_step": 96963, "epoch": 801} {"train_loss": -31.121694564819336, "global_step": 96964, "epoch": 801} {"train_loss": -35.43560791015625, "global_step": 96965, "epoch": 801} {"train_loss": -35.84324645996094, "global_step": 96966, "epoch": 801} {"train_loss": -36.43838882446289, "global_step": 96967, "epoch": 801} {"train_loss": -37.565670013427734, "global_step": 96968, "epoch": 801} {"train_loss": -36.25227737426758, "global_step": 96969, "epoch": 801} {"train_loss": -37.10848617553711, "global_step": 96970, "epoch": 801} {"train_loss": -36.4818000793457, "global_step": 96971, "epoch": 801} {"train_loss": -34.73513412475586, "global_step": 96972, "epoch": 801} {"train_loss": -36.74447250366211, "global_step": 96973, "epoch": 801} {"train_loss": -38.178829193115234, "global_step": 96974, "epoch": 801} {"train_loss": -36.96232986450195, "global_step": 96975, "epoch": 801} {"train_loss": -36.07205581665039, "global_step": 96976, "epoch": 801} {"train_loss": -34.96233367919922, "global_step": 96977, "epoch": 801} {"train_loss": -36.23066329956055, "global_step": 96978, "epoch": 801} {"train_loss": -37.6861457824707, "global_step": 96979, "epoch": 801} {"train_loss": -37.16715621948242, "global_step": 96980, "epoch": 801} {"train_loss": -36.09733963012695, "global_step": 96981, "epoch": 801} {"train_loss": -37.5328369140625, "global_step": 96982, "epoch": 801} {"train_loss": -37.68062973022461, "global_step": 96983, "epoch": 801} {"train_loss": -35.865516662597656, "global_step": 96984, "epoch": 801} {"train_loss": -36.91437911987305, "global_step": 96985, "epoch": 801} {"train_loss": -37.47385025024414, "global_step": 96986, "epoch": 801} {"train_loss": -36.70222473144531, "global_step": 96987, "epoch": 801} {"train_loss": -37.43268966674805, "global_step": 96988, "epoch": 801} {"train_loss": -35.065513610839844, "global_step": 96989, "epoch": 801} {"train_loss": -35.989013671875, "global_step": 96990, "epoch": 801} {"train_loss": -37.38381576538086, "global_step": 96991, "epoch": 801} {"train_loss": -37.893775939941406, "global_step": 96992, "epoch": 801} {"train_loss": -37.14534378051758, "global_step": 96993, "epoch": 801} {"train_loss": -37.585899353027344, "global_step": 96994, "epoch": 801} {"train_loss": -37.5810432434082, "global_step": 96995, "epoch": 801} {"train_loss": -36.502803802490234, "global_step": 96996, "epoch": 801} {"train_loss": -37.8969841003418, "global_step": 96997, "epoch": 801} {"train_loss": -37.82719039916992, "global_step": 96998, "epoch": 801} {"train_loss": -38.050907135009766, "global_step": 96999, "epoch": 801} {"train_loss": -37.702362060546875, "global_step": 97000, "epoch": 801} {"train_loss": -37.69407272338867, "global_step": 97001, "epoch": 801} {"train_loss": -38.26714324951172, "global_step": 97002, "epoch": 801} {"train_loss": -38.36152267456055, "global_step": 97003, "epoch": 801} {"train_loss": -36.557411193847656, "global_step": 97004, "epoch": 801} {"train_loss": -37.92139434814453, "global_step": 97005, "epoch": 801} {"train_loss": -37.5111083984375, "global_step": 97006, "epoch": 801} {"train_loss": -37.55549240112305, "global_step": 97007, "epoch": 801} {"train_loss": -37.9328727722168, "global_step": 97008, "epoch": 801} {"train_loss": -37.50630569458008, "global_step": 97009, "epoch": 801} {"train_loss": -38.042198181152344, "global_step": 97010, "epoch": 801} {"train_loss": -38.32239532470703, "global_step": 97011, "epoch": 801} {"train_loss": -37.62078094482422, "global_step": 97012, "epoch": 801} {"train_loss": -38.158809661865234, "global_step": 97013, "epoch": 801} {"train_loss": -38.68806838989258, "global_step": 97014, "epoch": 801} {"train_loss": -37.651756286621094, "global_step": 97015, "epoch": 801} {"train_loss": -36.77675247192383, "global_step": 97016, "epoch": 801} {"train_loss": -36.22317123413086, "global_step": 97017, "epoch": 801} {"train_loss": -38.42610549926758, "global_step": 97018, "epoch": 801} {"train_loss": -37.48198318481445, "global_step": 97019, "epoch": 801} {"train_loss": -36.04160690307617, "global_step": 97020, "epoch": 801} {"train_loss": -36.618587493896484, "global_step": 97021, "epoch": 801} {"train_loss": -38.511253356933594, "global_step": 97022, "epoch": 801} {"train_loss": -37.55694580078125, "global_step": 97023, "epoch": 801} {"train_loss": -35.612361907958984, "global_step": 97024, "epoch": 801} {"train_loss": -35.236019134521484, "global_step": 97025, "epoch": 801} {"train_loss": -37.81224060058594, "global_step": 97026, "epoch": 801} {"train_loss": -37.57788848876953, "global_step": 97027, "epoch": 801} {"train_loss": -36.54789352416992, "global_step": 97028, "epoch": 801} {"train_loss": -36.13323211669922, "global_step": 97029, "epoch": 801} {"train_loss": -37.2696647644043, "global_step": 97030, "epoch": 801} {"train_loss": -37.46569061279297, "global_step": 97031, "epoch": 801} {"train_loss": -37.12754821777344, "global_step": 97032, "epoch": 801} {"train_loss": -37.643638610839844, "global_step": 97033, "epoch": 801} {"train_loss": -36.9901237487793, "global_step": 97034, "epoch": 801} {"train_loss": -36.46088790893555, "global_step": 97035, "epoch": 801} {"train_loss": -37.54179000854492, "global_step": 97036, "epoch": 801} {"train_loss": -37.71132278442383, "global_step": 97037, "epoch": 801} {"train_loss": -36.895423889160156, "global_step": 97038, "epoch": 801} {"train_loss": -35.71633529663086, "global_step": 97039, "epoch": 801} {"train_loss": -37.78377914428711, "global_step": 97040, "epoch": 801} {"train_loss": -37.266871003080006, "global_step": 97041, "epoch": 801, "val_loss": 2656255.75} {"train_loss": -37.761409759521484, "global_step": 97042, "epoch": 802} {"train_loss": -37.314453125, "global_step": 97043, "epoch": 802} {"train_loss": -37.8050537109375, "global_step": 97044, "epoch": 802} {"train_loss": -34.21284103393555, "global_step": 97045, "epoch": 802} {"train_loss": -37.46840286254883, "global_step": 97046, "epoch": 802} {"train_loss": -36.893646240234375, "global_step": 97047, "epoch": 802} {"train_loss": -36.45024108886719, "global_step": 97048, "epoch": 802} {"train_loss": -37.143592834472656, "global_step": 97049, "epoch": 802} {"train_loss": -38.470428466796875, "global_step": 97050, "epoch": 802} {"train_loss": -37.097496032714844, "global_step": 97051, "epoch": 802} {"train_loss": -37.59998321533203, "global_step": 97052, "epoch": 802} {"train_loss": -37.28225326538086, "global_step": 97053, "epoch": 802} {"train_loss": -37.59785842895508, "global_step": 97054, "epoch": 802} {"train_loss": -37.44795227050781, "global_step": 97055, "epoch": 802} {"train_loss": -37.2906379699707, "global_step": 97056, "epoch": 802} {"train_loss": -37.424312591552734, "global_step": 97057, "epoch": 802} {"train_loss": -37.183319091796875, "global_step": 97058, "epoch": 802} {"train_loss": -37.91923141479492, "global_step": 97059, "epoch": 802} {"train_loss": -36.552818298339844, "global_step": 97060, "epoch": 802} {"train_loss": -36.69516372680664, "global_step": 97061, "epoch": 802} {"train_loss": -35.72367477416992, "global_step": 97062, "epoch": 802} {"train_loss": -37.42158508300781, "global_step": 97063, "epoch": 802} {"train_loss": -36.54555892944336, "global_step": 97064, "epoch": 802} {"train_loss": -36.4063720703125, "global_step": 97065, "epoch": 802} {"train_loss": -37.79111862182617, "global_step": 97066, "epoch": 802} {"train_loss": -36.905635833740234, "global_step": 97067, "epoch": 802} {"train_loss": -36.756622314453125, "global_step": 97068, "epoch": 802} {"train_loss": -37.512813568115234, "global_step": 97069, "epoch": 802} {"train_loss": -36.605255126953125, "global_step": 97070, "epoch": 802} {"train_loss": -37.39815902709961, "global_step": 97071, "epoch": 802} {"train_loss": -38.294368743896484, "global_step": 97072, "epoch": 802} {"train_loss": -36.55222702026367, "global_step": 97073, "epoch": 802} {"train_loss": -37.91826248168945, "global_step": 97074, "epoch": 802} {"train_loss": -37.54835891723633, "global_step": 97075, "epoch": 802} {"train_loss": -36.56989669799805, "global_step": 97076, "epoch": 802} {"train_loss": -36.65328598022461, "global_step": 97077, "epoch": 802} {"train_loss": -37.96512222290039, "global_step": 97078, "epoch": 802} {"train_loss": -37.2894401550293, "global_step": 97079, "epoch": 802} {"train_loss": -36.71794509887695, "global_step": 97080, "epoch": 802} {"train_loss": -36.733524322509766, "global_step": 97081, "epoch": 802} {"train_loss": -38.04971694946289, "global_step": 97082, "epoch": 802} {"train_loss": -36.79478073120117, "global_step": 97083, "epoch": 802} {"train_loss": -38.03664016723633, "global_step": 97084, "epoch": 802} {"train_loss": -36.1580696105957, "global_step": 97085, "epoch": 802} {"train_loss": -37.16413879394531, "global_step": 97086, "epoch": 802} {"train_loss": -36.606781005859375, "global_step": 97087, "epoch": 802} {"train_loss": -37.47652053833008, "global_step": 97088, "epoch": 802} {"train_loss": -37.95258712768555, "global_step": 97089, "epoch": 802} {"train_loss": -36.65049362182617, "global_step": 97090, "epoch": 802} {"train_loss": -38.089561462402344, "global_step": 97091, "epoch": 802} {"train_loss": -37.56623077392578, "global_step": 97092, "epoch": 802} {"train_loss": -37.73637390136719, "global_step": 97093, "epoch": 802} {"train_loss": -37.785396575927734, "global_step": 97094, "epoch": 802} {"train_loss": -37.656715393066406, "global_step": 97095, "epoch": 802} {"train_loss": -38.276275634765625, "global_step": 97096, "epoch": 802} {"train_loss": -37.82584762573242, "global_step": 97097, "epoch": 802} {"train_loss": -38.15968704223633, "global_step": 97098, "epoch": 802} {"train_loss": -38.664608001708984, "global_step": 97099, "epoch": 802} {"train_loss": -38.29413986206055, "global_step": 97100, "epoch": 802} {"train_loss": -38.444061279296875, "global_step": 97101, "epoch": 802} {"train_loss": -38.125247955322266, "global_step": 97102, "epoch": 802} {"train_loss": -38.19002914428711, "global_step": 97103, "epoch": 802} {"train_loss": -38.15944290161133, "global_step": 97104, "epoch": 802} {"train_loss": -38.55903625488281, "global_step": 97105, "epoch": 802} {"train_loss": -38.22063446044922, "global_step": 97106, "epoch": 802} {"train_loss": -38.466304779052734, "global_step": 97107, "epoch": 802} {"train_loss": -38.45390319824219, "global_step": 97108, "epoch": 802} {"train_loss": -38.95969772338867, "global_step": 97109, "epoch": 802} {"train_loss": -38.42742156982422, "global_step": 97110, "epoch": 802} {"train_loss": -38.52699279785156, "global_step": 97111, "epoch": 802} {"train_loss": -38.87939453125, "global_step": 97112, "epoch": 802} {"train_loss": -38.441078186035156, "global_step": 97113, "epoch": 802} {"train_loss": -38.593013763427734, "global_step": 97114, "epoch": 802} {"train_loss": -38.612213134765625, "global_step": 97115, "epoch": 802} {"train_loss": -38.64748764038086, "global_step": 97116, "epoch": 802} {"train_loss": -39.01372528076172, "global_step": 97117, "epoch": 802} {"train_loss": -38.70518493652344, "global_step": 97118, "epoch": 802} {"train_loss": -39.081722259521484, "global_step": 97119, "epoch": 802} {"train_loss": -39.22698974609375, "global_step": 97120, "epoch": 802} {"train_loss": -39.33797836303711, "global_step": 97121, "epoch": 802} {"train_loss": -38.34011459350586, "global_step": 97122, "epoch": 802} {"train_loss": -38.59560775756836, "global_step": 97123, "epoch": 802} {"train_loss": -38.222259521484375, "global_step": 97124, "epoch": 802} {"train_loss": -39.10984420776367, "global_step": 97125, "epoch": 802} {"train_loss": -38.981014251708984, "global_step": 97126, "epoch": 802} {"train_loss": -38.653133392333984, "global_step": 97127, "epoch": 802} {"train_loss": -38.41262435913086, "global_step": 97128, "epoch": 802} {"train_loss": -38.637569427490234, "global_step": 97129, "epoch": 802} {"train_loss": -37.68015670776367, "global_step": 97130, "epoch": 802} {"train_loss": -38.60490798950195, "global_step": 97131, "epoch": 802} {"train_loss": -37.87641143798828, "global_step": 97132, "epoch": 802} {"train_loss": -37.604061126708984, "global_step": 97133, "epoch": 802} {"train_loss": -38.7014045715332, "global_step": 97134, "epoch": 802} {"train_loss": -37.65249252319336, "global_step": 97135, "epoch": 802} {"train_loss": -37.978736877441406, "global_step": 97136, "epoch": 802} {"train_loss": -37.96998596191406, "global_step": 97137, "epoch": 802} {"train_loss": -38.184852600097656, "global_step": 97138, "epoch": 802} {"train_loss": -38.77101135253906, "global_step": 97139, "epoch": 802} {"train_loss": -38.29556655883789, "global_step": 97140, "epoch": 802} {"train_loss": -37.35795211791992, "global_step": 97141, "epoch": 802} {"train_loss": -37.803627014160156, "global_step": 97142, "epoch": 802} {"train_loss": -36.86748123168945, "global_step": 97143, "epoch": 802} {"train_loss": -36.8208122253418, "global_step": 97144, "epoch": 802} {"train_loss": -38.72152328491211, "global_step": 97145, "epoch": 802} {"train_loss": -37.699954986572266, "global_step": 97146, "epoch": 802} {"train_loss": -38.6150016784668, "global_step": 97147, "epoch": 802} {"train_loss": -38.328277587890625, "global_step": 97148, "epoch": 802} {"train_loss": -38.1973876953125, "global_step": 97149, "epoch": 802} {"train_loss": -38.12514114379883, "global_step": 97150, "epoch": 802} {"train_loss": -37.676513671875, "global_step": 97151, "epoch": 802} {"train_loss": -38.82959747314453, "global_step": 97152, "epoch": 802} {"train_loss": -38.39167022705078, "global_step": 97153, "epoch": 802} {"train_loss": -36.671958923339844, "global_step": 97154, "epoch": 802} {"train_loss": -35.760406494140625, "global_step": 97155, "epoch": 802} {"train_loss": -37.25504684448242, "global_step": 97156, "epoch": 802} {"train_loss": -38.365116119384766, "global_step": 97157, "epoch": 802} {"train_loss": -37.39020538330078, "global_step": 97158, "epoch": 802} {"train_loss": -36.52425003051758, "global_step": 97159, "epoch": 802} {"train_loss": -36.67963790893555, "global_step": 97160, "epoch": 802} {"train_loss": -38.041439056396484, "global_step": 97161, "epoch": 802} {"train_loss": -37.739785943149535, "global_step": 97162, "epoch": 802, "val_loss": 2591414.25} {"train_loss": -38.456764221191406, "global_step": 97163, "epoch": 803} {"train_loss": -38.62510299682617, "global_step": 97164, "epoch": 803} {"train_loss": -37.51816940307617, "global_step": 97165, "epoch": 803} {"train_loss": -36.50094223022461, "global_step": 97166, "epoch": 803} {"train_loss": -38.185298919677734, "global_step": 97167, "epoch": 803} {"train_loss": -37.53657150268555, "global_step": 97168, "epoch": 803} {"train_loss": -38.181331634521484, "global_step": 97169, "epoch": 803} {"train_loss": -38.68172836303711, "global_step": 97170, "epoch": 803} {"train_loss": -38.39414978027344, "global_step": 97171, "epoch": 803} {"train_loss": -38.60947799682617, "global_step": 97172, "epoch": 803} {"train_loss": -37.85695266723633, "global_step": 97173, "epoch": 803} {"train_loss": -35.18227005004883, "global_step": 97174, "epoch": 803} {"train_loss": -34.3940544128418, "global_step": 97175, "epoch": 803} {"train_loss": -31.660200119018555, "global_step": 97176, "epoch": 803} {"train_loss": -31.49188804626465, "global_step": 97177, "epoch": 803} {"train_loss": -36.268978118896484, "global_step": 97178, "epoch": 803} {"train_loss": -37.57194900512695, "global_step": 97179, "epoch": 803} {"train_loss": -34.447025299072266, "global_step": 97180, "epoch": 803} {"train_loss": -33.672969818115234, "global_step": 97181, "epoch": 803} {"train_loss": -37.96482467651367, "global_step": 97182, "epoch": 803} {"train_loss": -36.967063903808594, "global_step": 97183, "epoch": 803} {"train_loss": -36.55202865600586, "global_step": 97184, "epoch": 803} {"train_loss": -37.51467514038086, "global_step": 97185, "epoch": 803} {"train_loss": -36.35640335083008, "global_step": 97186, "epoch": 803} {"train_loss": -37.2997932434082, "global_step": 97187, "epoch": 803} {"train_loss": -37.809505462646484, "global_step": 97188, "epoch": 803} {"train_loss": -37.76103210449219, "global_step": 97189, "epoch": 803} {"train_loss": -37.53894805908203, "global_step": 97190, "epoch": 803} {"train_loss": -37.33243942260742, "global_step": 97191, "epoch": 803} {"train_loss": -37.467201232910156, "global_step": 97192, "epoch": 803} {"train_loss": -37.96165084838867, "global_step": 97193, "epoch": 803} {"train_loss": -37.4560661315918, "global_step": 97194, "epoch": 803} {"train_loss": -37.81348419189453, "global_step": 97195, "epoch": 803} {"train_loss": -36.09309005737305, "global_step": 97196, "epoch": 803} {"train_loss": -37.90742111206055, "global_step": 97197, "epoch": 803} {"train_loss": -36.93299102783203, "global_step": 97198, "epoch": 803} {"train_loss": -38.388671875, "global_step": 97199, "epoch": 803} {"train_loss": -36.93843460083008, "global_step": 97200, "epoch": 803} {"train_loss": -38.22335433959961, "global_step": 97201, "epoch": 803} {"train_loss": -36.954505920410156, "global_step": 97202, "epoch": 803} {"train_loss": -37.509796142578125, "global_step": 97203, "epoch": 803} {"train_loss": -37.27651596069336, "global_step": 97204, "epoch": 803} {"train_loss": -37.93610763549805, "global_step": 97205, "epoch": 803} {"train_loss": -36.59641647338867, "global_step": 97206, "epoch": 803} {"train_loss": -38.73787307739258, "global_step": 97207, "epoch": 803} {"train_loss": -36.98031234741211, "global_step": 97208, "epoch": 803} {"train_loss": -38.26723098754883, "global_step": 97209, "epoch": 803} {"train_loss": -37.12980651855469, "global_step": 97210, "epoch": 803} {"train_loss": -37.38605499267578, "global_step": 97211, "epoch": 803} {"train_loss": -37.07379913330078, "global_step": 97212, "epoch": 803} {"train_loss": -37.14246368408203, "global_step": 97213, "epoch": 803} {"train_loss": -38.035701751708984, "global_step": 97214, "epoch": 803} {"train_loss": -37.090389251708984, "global_step": 97215, "epoch": 803} {"train_loss": -38.18132781982422, "global_step": 97216, "epoch": 803} {"train_loss": -36.458824157714844, "global_step": 97217, "epoch": 803} {"train_loss": -37.67569351196289, "global_step": 97218, "epoch": 803} {"train_loss": -37.25173568725586, "global_step": 97219, "epoch": 803} {"train_loss": -36.9765510559082, "global_step": 97220, "epoch": 803} {"train_loss": -38.04449462890625, "global_step": 97221, "epoch": 803} {"train_loss": -38.328773498535156, "global_step": 97222, "epoch": 803} {"train_loss": -37.62610626220703, "global_step": 97223, "epoch": 803} {"train_loss": -37.72820281982422, "global_step": 97224, "epoch": 803} {"train_loss": -38.03986358642578, "global_step": 97225, "epoch": 803} {"train_loss": -37.806026458740234, "global_step": 97226, "epoch": 803} {"train_loss": -37.96152114868164, "global_step": 97227, "epoch": 803} {"train_loss": -38.073116302490234, "global_step": 97228, "epoch": 803} {"train_loss": -37.726131439208984, "global_step": 97229, "epoch": 803} {"train_loss": -38.07810592651367, "global_step": 97230, "epoch": 803} {"train_loss": -38.198787689208984, "global_step": 97231, "epoch": 803} {"train_loss": -38.25727462768555, "global_step": 97232, "epoch": 803} {"train_loss": -37.60844039916992, "global_step": 97233, "epoch": 803} {"train_loss": -38.54835891723633, "global_step": 97234, "epoch": 803} {"train_loss": -37.598636627197266, "global_step": 97235, "epoch": 803} {"train_loss": -38.077476501464844, "global_step": 97236, "epoch": 803} {"train_loss": -38.1668701171875, "global_step": 97237, "epoch": 803} {"train_loss": -37.194679260253906, "global_step": 97238, "epoch": 803} {"train_loss": -38.764408111572266, "global_step": 97239, "epoch": 803} {"train_loss": -38.70638656616211, "global_step": 97240, "epoch": 803} {"train_loss": -37.66705322265625, "global_step": 97241, "epoch": 803} {"train_loss": -38.41119384765625, "global_step": 97242, "epoch": 803} {"train_loss": -39.05086135864258, "global_step": 97243, "epoch": 803} {"train_loss": -38.598575592041016, "global_step": 97244, "epoch": 803} {"train_loss": -38.84951400756836, "global_step": 97245, "epoch": 803} {"train_loss": -38.64433288574219, "global_step": 97246, "epoch": 803} {"train_loss": -38.06992721557617, "global_step": 97247, "epoch": 803} {"train_loss": -38.42820739746094, "global_step": 97248, "epoch": 803} {"train_loss": -38.52930450439453, "global_step": 97249, "epoch": 803} {"train_loss": -39.170528411865234, "global_step": 97250, "epoch": 803} {"train_loss": -38.617889404296875, "global_step": 97251, "epoch": 803} {"train_loss": -38.701026916503906, "global_step": 97252, "epoch": 803} {"train_loss": -39.01879119873047, "global_step": 97253, "epoch": 803} {"train_loss": -38.752071380615234, "global_step": 97254, "epoch": 803} {"train_loss": -39.114891052246094, "global_step": 97255, "epoch": 803} {"train_loss": -39.286659240722656, "global_step": 97256, "epoch": 803} {"train_loss": -38.98440170288086, "global_step": 97257, "epoch": 803} {"train_loss": -39.04022216796875, "global_step": 97258, "epoch": 803} {"train_loss": -39.156227111816406, "global_step": 97259, "epoch": 803} {"train_loss": -38.53407669067383, "global_step": 97260, "epoch": 803} {"train_loss": -38.5247917175293, "global_step": 97261, "epoch": 803} {"train_loss": -38.316917419433594, "global_step": 97262, "epoch": 803} {"train_loss": -37.07493591308594, "global_step": 97263, "epoch": 803} {"train_loss": -36.74073028564453, "global_step": 97264, "epoch": 803} {"train_loss": -38.658565521240234, "global_step": 97265, "epoch": 803} {"train_loss": -38.39547348022461, "global_step": 97266, "epoch": 803} {"train_loss": -36.01105880737305, "global_step": 97267, "epoch": 803} {"train_loss": -36.90422439575195, "global_step": 97268, "epoch": 803} {"train_loss": -39.36243438720703, "global_step": 97269, "epoch": 803} {"train_loss": -37.357635498046875, "global_step": 97270, "epoch": 803} {"train_loss": -36.542015075683594, "global_step": 97271, "epoch": 803} {"train_loss": -39.638710021972656, "global_step": 97272, "epoch": 803} {"train_loss": -38.0006103515625, "global_step": 97273, "epoch": 803} {"train_loss": -37.937618255615234, "global_step": 97274, "epoch": 803} {"train_loss": -38.917884826660156, "global_step": 97275, "epoch": 803} {"train_loss": -37.813777923583984, "global_step": 97276, "epoch": 803} {"train_loss": -38.80029296875, "global_step": 97277, "epoch": 803} {"train_loss": -38.65220260620117, "global_step": 97278, "epoch": 803} {"train_loss": -38.74276351928711, "global_step": 97279, "epoch": 803} {"train_loss": -37.688961029052734, "global_step": 97280, "epoch": 803} {"train_loss": -39.045528411865234, "global_step": 97281, "epoch": 803} {"train_loss": -37.693416595458984, "global_step": 97282, "epoch": 803} {"train_loss": -37.70020953091708, "global_step": 97283, "epoch": 803, "val_loss": 2631139.0} {"train_loss": -38.7962760925293, "global_step": 97284, "epoch": 804} {"train_loss": -37.69072341918945, "global_step": 97285, "epoch": 804} {"train_loss": -38.10560989379883, "global_step": 97286, "epoch": 804} {"train_loss": -37.57525634765625, "global_step": 97287, "epoch": 804} {"train_loss": -37.22451400756836, "global_step": 97288, "epoch": 804} {"train_loss": -37.92756271362305, "global_step": 97289, "epoch": 804} {"train_loss": -35.91779327392578, "global_step": 97290, "epoch": 804} {"train_loss": -38.878658294677734, "global_step": 97291, "epoch": 804} {"train_loss": -37.31727981567383, "global_step": 97292, "epoch": 804} {"train_loss": -38.69438552856445, "global_step": 97293, "epoch": 804} {"train_loss": -37.22528839111328, "global_step": 97294, "epoch": 804} {"train_loss": -39.082157135009766, "global_step": 97295, "epoch": 804} {"train_loss": -37.179847717285156, "global_step": 97296, "epoch": 804} {"train_loss": -38.55164337158203, "global_step": 97297, "epoch": 804} {"train_loss": -37.655025482177734, "global_step": 97298, "epoch": 804} {"train_loss": -37.63507080078125, "global_step": 97299, "epoch": 804} {"train_loss": -37.24317932128906, "global_step": 97300, "epoch": 804} {"train_loss": -38.16251754760742, "global_step": 97301, "epoch": 804} {"train_loss": -39.07034683227539, "global_step": 97302, "epoch": 804} {"train_loss": -38.40302276611328, "global_step": 97303, "epoch": 804} {"train_loss": -38.57522201538086, "global_step": 97304, "epoch": 804} {"train_loss": -38.84542465209961, "global_step": 97305, "epoch": 804} {"train_loss": -38.53158187866211, "global_step": 97306, "epoch": 804} {"train_loss": -38.842952728271484, "global_step": 97307, "epoch": 804} {"train_loss": -38.56303024291992, "global_step": 97308, "epoch": 804} {"train_loss": -38.96009063720703, "global_step": 97309, "epoch": 804} {"train_loss": -39.082252502441406, "global_step": 97310, "epoch": 804} {"train_loss": -37.71928787231445, "global_step": 97311, "epoch": 804} {"train_loss": -38.2678108215332, "global_step": 97312, "epoch": 804} {"train_loss": -38.8499755859375, "global_step": 97313, "epoch": 804} {"train_loss": -38.61743927001953, "global_step": 97314, "epoch": 804} {"train_loss": -38.77809143066406, "global_step": 97315, "epoch": 804} {"train_loss": -38.7738151550293, "global_step": 97316, "epoch": 804} {"train_loss": -38.46409225463867, "global_step": 97317, "epoch": 804} {"train_loss": -37.85871124267578, "global_step": 97318, "epoch": 804} {"train_loss": -38.32485580444336, "global_step": 97319, "epoch": 804} {"train_loss": -38.440765380859375, "global_step": 97320, "epoch": 804} {"train_loss": -38.468074798583984, "global_step": 97321, "epoch": 804} {"train_loss": -37.81590270996094, "global_step": 97322, "epoch": 804} {"train_loss": -38.52452087402344, "global_step": 97323, "epoch": 804} {"train_loss": -37.87076950073242, "global_step": 97324, "epoch": 804} {"train_loss": -37.74479675292969, "global_step": 97325, "epoch": 804} {"train_loss": -39.00852584838867, "global_step": 97326, "epoch": 804} {"train_loss": -38.11087417602539, "global_step": 97327, "epoch": 804} {"train_loss": -38.512088775634766, "global_step": 97328, "epoch": 804} {"train_loss": -38.8311653137207, "global_step": 97329, "epoch": 804} {"train_loss": -38.222713470458984, "global_step": 97330, "epoch": 804} {"train_loss": -38.473480224609375, "global_step": 97331, "epoch": 804} {"train_loss": -38.62446212768555, "global_step": 97332, "epoch": 804} {"train_loss": -37.72062683105469, "global_step": 97333, "epoch": 804} {"train_loss": -39.047420501708984, "global_step": 97334, "epoch": 804} {"train_loss": -38.30391311645508, "global_step": 97335, "epoch": 804} {"train_loss": -38.39486312866211, "global_step": 97336, "epoch": 804} {"train_loss": -38.49628448486328, "global_step": 97337, "epoch": 804} {"train_loss": -39.061553955078125, "global_step": 97338, "epoch": 804} {"train_loss": -38.7498893737793, "global_step": 97339, "epoch": 804} {"train_loss": -38.4457893371582, "global_step": 97340, "epoch": 804} {"train_loss": -39.313568115234375, "global_step": 97341, "epoch": 804} {"train_loss": -38.61970901489258, "global_step": 97342, "epoch": 804} {"train_loss": -38.988914489746094, "global_step": 97343, "epoch": 804} {"train_loss": -38.72259521484375, "global_step": 97344, "epoch": 804} {"train_loss": -38.79895782470703, "global_step": 97345, "epoch": 804} {"train_loss": -37.62430953979492, "global_step": 97346, "epoch": 804} {"train_loss": -38.209537506103516, "global_step": 97347, "epoch": 804} {"train_loss": -38.60704040527344, "global_step": 97348, "epoch": 804} {"train_loss": -37.883636474609375, "global_step": 97349, "epoch": 804} {"train_loss": -38.38975524902344, "global_step": 97350, "epoch": 804} {"train_loss": -37.860877990722656, "global_step": 97351, "epoch": 804} {"train_loss": -39.124263763427734, "global_step": 97352, "epoch": 804} {"train_loss": -39.627811431884766, "global_step": 97353, "epoch": 804} {"train_loss": -38.77555465698242, "global_step": 97354, "epoch": 804} {"train_loss": -38.173980712890625, "global_step": 97355, "epoch": 804} {"train_loss": -36.94961166381836, "global_step": 97356, "epoch": 804} {"train_loss": -35.364803314208984, "global_step": 97357, "epoch": 804} {"train_loss": -34.1848030090332, "global_step": 97358, "epoch": 804} {"train_loss": -32.85830307006836, "global_step": 97359, "epoch": 804} {"train_loss": -37.039772033691406, "global_step": 97360, "epoch": 804} {"train_loss": -38.472442626953125, "global_step": 97361, "epoch": 804} {"train_loss": -38.43442153930664, "global_step": 97362, "epoch": 804} {"train_loss": -39.02826690673828, "global_step": 97363, "epoch": 804} {"train_loss": -38.49312973022461, "global_step": 97364, "epoch": 804} {"train_loss": -38.33005905151367, "global_step": 97365, "epoch": 804} {"train_loss": -37.9476203918457, "global_step": 97366, "epoch": 804} {"train_loss": -38.14408493041992, "global_step": 97367, "epoch": 804} {"train_loss": -38.02686309814453, "global_step": 97368, "epoch": 804} {"train_loss": -38.54098892211914, "global_step": 97369, "epoch": 804} {"train_loss": -39.356143951416016, "global_step": 97370, "epoch": 804} {"train_loss": -39.03791046142578, "global_step": 97371, "epoch": 804} {"train_loss": -38.747642517089844, "global_step": 97372, "epoch": 804} {"train_loss": -38.07135772705078, "global_step": 97373, "epoch": 804} {"train_loss": -38.10599899291992, "global_step": 97374, "epoch": 804} {"train_loss": -38.49315643310547, "global_step": 97375, "epoch": 804} {"train_loss": -38.498870849609375, "global_step": 97376, "epoch": 804} {"train_loss": -38.156890869140625, "global_step": 97377, "epoch": 804} {"train_loss": -38.11697006225586, "global_step": 97378, "epoch": 804} {"train_loss": -38.36602783203125, "global_step": 97379, "epoch": 804} {"train_loss": -38.26835250854492, "global_step": 97380, "epoch": 804} {"train_loss": -39.263423919677734, "global_step": 97381, "epoch": 804} {"train_loss": -38.723731994628906, "global_step": 97382, "epoch": 804} {"train_loss": -38.09865951538086, "global_step": 97383, "epoch": 804} {"train_loss": -38.31864547729492, "global_step": 97384, "epoch": 804} {"train_loss": -38.518741607666016, "global_step": 97385, "epoch": 804} {"train_loss": -38.58614730834961, "global_step": 97386, "epoch": 804} {"train_loss": -37.995521545410156, "global_step": 97387, "epoch": 804} {"train_loss": -38.65163040161133, "global_step": 97388, "epoch": 804} {"train_loss": -38.78206253051758, "global_step": 97389, "epoch": 804} {"train_loss": -37.51194763183594, "global_step": 97390, "epoch": 804} {"train_loss": -37.939239501953125, "global_step": 97391, "epoch": 804} {"train_loss": -38.00441360473633, "global_step": 97392, "epoch": 804} {"train_loss": -37.502933502197266, "global_step": 97393, "epoch": 804} {"train_loss": -38.03013229370117, "global_step": 97394, "epoch": 804} {"train_loss": -37.8567008972168, "global_step": 97395, "epoch": 804} {"train_loss": -35.97190475463867, "global_step": 97396, "epoch": 804} {"train_loss": -38.162506103515625, "global_step": 97397, "epoch": 804} {"train_loss": -39.19990158081055, "global_step": 97398, "epoch": 804} {"train_loss": -37.306556701660156, "global_step": 97399, "epoch": 804} {"train_loss": -38.355262756347656, "global_step": 97400, "epoch": 804} {"train_loss": -37.68206787109375, "global_step": 97401, "epoch": 804} {"train_loss": -39.068172454833984, "global_step": 97402, "epoch": 804} {"train_loss": -38.39338302612305, "global_step": 97403, "epoch": 804} {"train_loss": -38.20160457516505, "global_step": 97404, "epoch": 804, "val_loss": 2619022.25} {"train_loss": -38.679603576660156, "global_step": 97405, "epoch": 805} {"train_loss": -38.80501174926758, "global_step": 97406, "epoch": 805} {"train_loss": -38.499629974365234, "global_step": 97407, "epoch": 805} {"train_loss": -38.4232177734375, "global_step": 97408, "epoch": 805} {"train_loss": -38.66048812866211, "global_step": 97409, "epoch": 805} {"train_loss": -38.93501663208008, "global_step": 97410, "epoch": 805} {"train_loss": -38.61410140991211, "global_step": 97411, "epoch": 805} {"train_loss": -38.819053649902344, "global_step": 97412, "epoch": 805} {"train_loss": -39.17391586303711, "global_step": 97413, "epoch": 805} {"train_loss": -38.550453186035156, "global_step": 97414, "epoch": 805} {"train_loss": -39.009674072265625, "global_step": 97415, "epoch": 805} {"train_loss": -38.98610305786133, "global_step": 97416, "epoch": 805} {"train_loss": -38.88130187988281, "global_step": 97417, "epoch": 805} {"train_loss": -39.526058197021484, "global_step": 97418, "epoch": 805} {"train_loss": -38.845619201660156, "global_step": 97419, "epoch": 805} {"train_loss": -38.72575759887695, "global_step": 97420, "epoch": 805} {"train_loss": -38.936527252197266, "global_step": 97421, "epoch": 805} {"train_loss": -38.97782516479492, "global_step": 97422, "epoch": 805} {"train_loss": -39.504127502441406, "global_step": 97423, "epoch": 805} {"train_loss": -39.13207244873047, "global_step": 97424, "epoch": 805} {"train_loss": -39.16654586791992, "global_step": 97425, "epoch": 805} {"train_loss": -38.975624084472656, "global_step": 97426, "epoch": 805} {"train_loss": -39.33309555053711, "global_step": 97427, "epoch": 805} {"train_loss": -38.92865753173828, "global_step": 97428, "epoch": 805} {"train_loss": -39.18115997314453, "global_step": 97429, "epoch": 805} {"train_loss": -39.49567794799805, "global_step": 97430, "epoch": 805} {"train_loss": -38.36550521850586, "global_step": 97431, "epoch": 805} {"train_loss": -39.290157318115234, "global_step": 97432, "epoch": 805} {"train_loss": -39.14375305175781, "global_step": 97433, "epoch": 805} {"train_loss": -39.02866744995117, "global_step": 97434, "epoch": 805} {"train_loss": -39.377193450927734, "global_step": 97435, "epoch": 805} {"train_loss": -38.855281829833984, "global_step": 97436, "epoch": 805} {"train_loss": -39.11097717285156, "global_step": 97437, "epoch": 805} {"train_loss": -39.422279357910156, "global_step": 97438, "epoch": 805} {"train_loss": -39.30793380737305, "global_step": 97439, "epoch": 805} {"train_loss": -39.04218292236328, "global_step": 97440, "epoch": 805} {"train_loss": -39.248477935791016, "global_step": 97441, "epoch": 805} {"train_loss": -38.96432113647461, "global_step": 97442, "epoch": 805} {"train_loss": -38.547542572021484, "global_step": 97443, "epoch": 805} {"train_loss": -38.54091262817383, "global_step": 97444, "epoch": 805} {"train_loss": -38.729736328125, "global_step": 97445, "epoch": 805} {"train_loss": -37.503543853759766, "global_step": 97446, "epoch": 805} {"train_loss": -34.52219009399414, "global_step": 97447, "epoch": 805} {"train_loss": -27.733539581298828, "global_step": 97448, "epoch": 805} {"train_loss": -24.71330451965332, "global_step": 97449, "epoch": 805} {"train_loss": 41.4490966796875, "global_step": 97450, "epoch": 805} {"train_loss": -7.499520301818848, "global_step": 97451, "epoch": 805} {"train_loss": -29.749975204467773, "global_step": 97452, "epoch": 805} {"train_loss": -23.36475944519043, "global_step": 97453, "epoch": 805} {"train_loss": -32.71685791015625, "global_step": 97454, "epoch": 805} {"train_loss": -31.345123291015625, "global_step": 97455, "epoch": 805} {"train_loss": -33.81873321533203, "global_step": 97456, "epoch": 805} {"train_loss": -33.078956604003906, "global_step": 97457, "epoch": 805} {"train_loss": -33.57487869262695, "global_step": 97458, "epoch": 805} {"train_loss": -33.349117279052734, "global_step": 97459, "epoch": 805} {"train_loss": -34.06483840942383, "global_step": 97460, "epoch": 805} {"train_loss": -34.35456848144531, "global_step": 97461, "epoch": 805} {"train_loss": -37.05100631713867, "global_step": 97462, "epoch": 805} {"train_loss": -35.92457962036133, "global_step": 97463, "epoch": 805} {"train_loss": -35.35447311401367, "global_step": 97464, "epoch": 805} {"train_loss": -36.94460678100586, "global_step": 97465, "epoch": 805} {"train_loss": -35.108516693115234, "global_step": 97466, "epoch": 805} {"train_loss": -36.56337356567383, "global_step": 97467, "epoch": 805} {"train_loss": -36.403194427490234, "global_step": 97468, "epoch": 805} {"train_loss": -36.465606689453125, "global_step": 97469, "epoch": 805} {"train_loss": -36.60094451904297, "global_step": 97470, "epoch": 805} {"train_loss": -36.48933792114258, "global_step": 97471, "epoch": 805} {"train_loss": -36.307708740234375, "global_step": 97472, "epoch": 805} {"train_loss": -36.335453033447266, "global_step": 97473, "epoch": 805} {"train_loss": -37.24898910522461, "global_step": 97474, "epoch": 805} {"train_loss": -36.77687454223633, "global_step": 97475, "epoch": 805} {"train_loss": -37.23038864135742, "global_step": 97476, "epoch": 805} {"train_loss": -37.18377685546875, "global_step": 97477, "epoch": 805} {"train_loss": -36.79415512084961, "global_step": 97478, "epoch": 805} {"train_loss": -37.7707405090332, "global_step": 97479, "epoch": 805} {"train_loss": -37.41730499267578, "global_step": 97480, "epoch": 805} {"train_loss": -37.598506927490234, "global_step": 97481, "epoch": 805} {"train_loss": -37.56976318359375, "global_step": 97482, "epoch": 805} {"train_loss": -37.876625061035156, "global_step": 97483, "epoch": 805} {"train_loss": -37.93539810180664, "global_step": 97484, "epoch": 805} {"train_loss": -38.015506744384766, "global_step": 97485, "epoch": 805} {"train_loss": -37.913551330566406, "global_step": 97486, "epoch": 805} {"train_loss": -37.82122802734375, "global_step": 97487, "epoch": 805} {"train_loss": -38.028865814208984, "global_step": 97488, "epoch": 805} {"train_loss": -38.083866119384766, "global_step": 97489, "epoch": 805} {"train_loss": -37.61712646484375, "global_step": 97490, "epoch": 805} {"train_loss": -38.43014144897461, "global_step": 97491, "epoch": 805} {"train_loss": -37.654518127441406, "global_step": 97492, "epoch": 805} {"train_loss": -38.18345260620117, "global_step": 97493, "epoch": 805} {"train_loss": -38.428550720214844, "global_step": 97494, "epoch": 805} {"train_loss": -38.52286148071289, "global_step": 97495, "epoch": 805} {"train_loss": -38.27053451538086, "global_step": 97496, "epoch": 805} {"train_loss": -38.66844177246094, "global_step": 97497, "epoch": 805} {"train_loss": -38.39603805541992, "global_step": 97498, "epoch": 805} {"train_loss": -38.90798568725586, "global_step": 97499, "epoch": 805} {"train_loss": -38.73844528198242, "global_step": 97500, "epoch": 805} {"train_loss": -38.67877197265625, "global_step": 97501, "epoch": 805} {"train_loss": -38.81816864013672, "global_step": 97502, "epoch": 805} {"train_loss": -38.896854400634766, "global_step": 97503, "epoch": 805} {"train_loss": -38.68571853637695, "global_step": 97504, "epoch": 805} {"train_loss": -38.8980712890625, "global_step": 97505, "epoch": 805} {"train_loss": -38.79603958129883, "global_step": 97506, "epoch": 805} {"train_loss": -38.83396530151367, "global_step": 97507, "epoch": 805} {"train_loss": -39.158992767333984, "global_step": 97508, "epoch": 805} {"train_loss": -38.88667678833008, "global_step": 97509, "epoch": 805} {"train_loss": -38.996551513671875, "global_step": 97510, "epoch": 805} {"train_loss": -38.94338607788086, "global_step": 97511, "epoch": 805} {"train_loss": -39.167396545410156, "global_step": 97512, "epoch": 805} {"train_loss": -38.74787139892578, "global_step": 97513, "epoch": 805} {"train_loss": -39.312767028808594, "global_step": 97514, "epoch": 805} {"train_loss": -39.2282829284668, "global_step": 97515, "epoch": 805} {"train_loss": -39.227210998535156, "global_step": 97516, "epoch": 805} {"train_loss": -39.057464599609375, "global_step": 97517, "epoch": 805} {"train_loss": -39.34347152709961, "global_step": 97518, "epoch": 805} {"train_loss": -39.08791732788086, "global_step": 97519, "epoch": 805} {"train_loss": -39.2187385559082, "global_step": 97520, "epoch": 805} {"train_loss": -39.57912826538086, "global_step": 97521, "epoch": 805} {"train_loss": -39.32400131225586, "global_step": 97522, "epoch": 805} {"train_loss": -39.06058883666992, "global_step": 97523, "epoch": 805} {"train_loss": -39.27091598510742, "global_step": 97524, "epoch": 805} {"train_loss": -36.71472838693414, "global_step": 97525, "epoch": 805, "val_loss": 2673439.25} {"train_loss": -38.772705078125, "global_step": 97526, "epoch": 806} {"train_loss": -39.10662841796875, "global_step": 97527, "epoch": 806} {"train_loss": -39.37665557861328, "global_step": 97528, "epoch": 806} {"train_loss": -39.20978927612305, "global_step": 97529, "epoch": 806} {"train_loss": -39.083168029785156, "global_step": 97530, "epoch": 806} {"train_loss": -39.571632385253906, "global_step": 97531, "epoch": 806} {"train_loss": -39.648624420166016, "global_step": 97532, "epoch": 806} {"train_loss": -39.711029052734375, "global_step": 97533, "epoch": 806} {"train_loss": -39.311744689941406, "global_step": 97534, "epoch": 806} {"train_loss": -39.28562545776367, "global_step": 97535, "epoch": 806} {"train_loss": -38.893043518066406, "global_step": 97536, "epoch": 806} {"train_loss": -39.15977478027344, "global_step": 97537, "epoch": 806} {"train_loss": -38.81509017944336, "global_step": 97538, "epoch": 806} {"train_loss": -38.50391387939453, "global_step": 97539, "epoch": 806} {"train_loss": -38.657535552978516, "global_step": 97540, "epoch": 806} {"train_loss": -39.343528747558594, "global_step": 97541, "epoch": 806} {"train_loss": -38.54814529418945, "global_step": 97542, "epoch": 806} {"train_loss": -37.17085266113281, "global_step": 97543, "epoch": 806} {"train_loss": -36.37583541870117, "global_step": 97544, "epoch": 806} {"train_loss": -34.00684356689453, "global_step": 97545, "epoch": 806} {"train_loss": -33.581764221191406, "global_step": 97546, "epoch": 806} {"train_loss": -33.9465217590332, "global_step": 97547, "epoch": 806} {"train_loss": -35.46298599243164, "global_step": 97548, "epoch": 806} {"train_loss": -38.45136260986328, "global_step": 97549, "epoch": 806} {"train_loss": -35.31696319580078, "global_step": 97550, "epoch": 806} {"train_loss": -36.78447341918945, "global_step": 97551, "epoch": 806} {"train_loss": -36.0222282409668, "global_step": 97552, "epoch": 806} {"train_loss": -37.61845397949219, "global_step": 97553, "epoch": 806} {"train_loss": -35.89460372924805, "global_step": 97554, "epoch": 806} {"train_loss": -36.41866683959961, "global_step": 97555, "epoch": 806} {"train_loss": -38.19614028930664, "global_step": 97556, "epoch": 806} {"train_loss": -35.99900436401367, "global_step": 97557, "epoch": 806} {"train_loss": -35.38576126098633, "global_step": 97558, "epoch": 806} {"train_loss": -36.846309661865234, "global_step": 97559, "epoch": 806} {"train_loss": -35.979740142822266, "global_step": 97560, "epoch": 806} {"train_loss": -36.2508659362793, "global_step": 97561, "epoch": 806} {"train_loss": -36.258872985839844, "global_step": 97562, "epoch": 806} {"train_loss": -37.6180419921875, "global_step": 97563, "epoch": 806} {"train_loss": -34.41483688354492, "global_step": 97564, "epoch": 806} {"train_loss": -34.69902801513672, "global_step": 97565, "epoch": 806} {"train_loss": -36.93141174316406, "global_step": 97566, "epoch": 806} {"train_loss": -36.93704605102539, "global_step": 97567, "epoch": 806} {"train_loss": -35.775543212890625, "global_step": 97568, "epoch": 806} {"train_loss": -37.749080657958984, "global_step": 97569, "epoch": 806} {"train_loss": -36.60616683959961, "global_step": 97570, "epoch": 806} {"train_loss": -37.72979736328125, "global_step": 97571, "epoch": 806} {"train_loss": -37.6788444519043, "global_step": 97572, "epoch": 806} {"train_loss": -37.60752487182617, "global_step": 97573, "epoch": 806} {"train_loss": -37.88093948364258, "global_step": 97574, "epoch": 806} {"train_loss": -37.037532806396484, "global_step": 97575, "epoch": 806} {"train_loss": -38.2514762878418, "global_step": 97576, "epoch": 806} {"train_loss": -37.990753173828125, "global_step": 97577, "epoch": 806} {"train_loss": -37.764801025390625, "global_step": 97578, "epoch": 806} {"train_loss": -38.1242790222168, "global_step": 97579, "epoch": 806} {"train_loss": -37.97367858886719, "global_step": 97580, "epoch": 806} {"train_loss": -37.358131408691406, "global_step": 97581, "epoch": 806} {"train_loss": -38.464481353759766, "global_step": 97582, "epoch": 806} {"train_loss": -37.40675735473633, "global_step": 97583, "epoch": 806} {"train_loss": -38.35419464111328, "global_step": 97584, "epoch": 806} {"train_loss": -37.48457717895508, "global_step": 97585, "epoch": 806} {"train_loss": -38.051570892333984, "global_step": 97586, "epoch": 806} {"train_loss": -38.334102630615234, "global_step": 97587, "epoch": 806} {"train_loss": -37.66720199584961, "global_step": 97588, "epoch": 806} {"train_loss": -37.97404098510742, "global_step": 97589, "epoch": 806} {"train_loss": -37.95429229736328, "global_step": 97590, "epoch": 806} {"train_loss": -37.90232467651367, "global_step": 97591, "epoch": 806} {"train_loss": -38.6070442199707, "global_step": 97592, "epoch": 806} {"train_loss": -38.33882141113281, "global_step": 97593, "epoch": 806} {"train_loss": -38.99233627319336, "global_step": 97594, "epoch": 806} {"train_loss": -38.37016296386719, "global_step": 97595, "epoch": 806} {"train_loss": -38.78339385986328, "global_step": 97596, "epoch": 806} {"train_loss": -38.385799407958984, "global_step": 97597, "epoch": 806} {"train_loss": -38.761661529541016, "global_step": 97598, "epoch": 806} {"train_loss": -38.485511779785156, "global_step": 97599, "epoch": 806} {"train_loss": -38.56428909301758, "global_step": 97600, "epoch": 806} {"train_loss": -38.96942138671875, "global_step": 97601, "epoch": 806} {"train_loss": -38.24351119995117, "global_step": 97602, "epoch": 806} {"train_loss": -38.39347457885742, "global_step": 97603, "epoch": 806} {"train_loss": -39.07160568237305, "global_step": 97604, "epoch": 806} {"train_loss": -38.064266204833984, "global_step": 97605, "epoch": 806} {"train_loss": -39.2304573059082, "global_step": 97606, "epoch": 806} {"train_loss": -39.09275436401367, "global_step": 97607, "epoch": 806} {"train_loss": -38.58155822753906, "global_step": 97608, "epoch": 806} {"train_loss": -39.319393157958984, "global_step": 97609, "epoch": 806} {"train_loss": -38.07721710205078, "global_step": 97610, "epoch": 806} {"train_loss": -39.1517219543457, "global_step": 97611, "epoch": 806} {"train_loss": -38.45357131958008, "global_step": 97612, "epoch": 806} {"train_loss": -39.30356979370117, "global_step": 97613, "epoch": 806} {"train_loss": -38.56183624267578, "global_step": 97614, "epoch": 806} {"train_loss": -39.09284973144531, "global_step": 97615, "epoch": 806} {"train_loss": -38.92517852783203, "global_step": 97616, "epoch": 806} {"train_loss": -38.75291061401367, "global_step": 97617, "epoch": 806} {"train_loss": -39.65971374511719, "global_step": 97618, "epoch": 806} {"train_loss": -38.3602409362793, "global_step": 97619, "epoch": 806} {"train_loss": -38.78316116333008, "global_step": 97620, "epoch": 806} {"train_loss": -39.05985641479492, "global_step": 97621, "epoch": 806} {"train_loss": -38.970703125, "global_step": 97622, "epoch": 806} {"train_loss": -38.93740463256836, "global_step": 97623, "epoch": 806} {"train_loss": -39.261417388916016, "global_step": 97624, "epoch": 806} {"train_loss": -39.60001754760742, "global_step": 97625, "epoch": 806} {"train_loss": -38.41264343261719, "global_step": 97626, "epoch": 806} {"train_loss": -38.965999603271484, "global_step": 97627, "epoch": 806} {"train_loss": -38.26103591918945, "global_step": 97628, "epoch": 806} {"train_loss": -39.47835159301758, "global_step": 97629, "epoch": 806} {"train_loss": -38.8426513671875, "global_step": 97630, "epoch": 806} {"train_loss": -38.29719924926758, "global_step": 97631, "epoch": 806} {"train_loss": -39.0252571105957, "global_step": 97632, "epoch": 806} {"train_loss": -38.00686264038086, "global_step": 97633, "epoch": 806} {"train_loss": -38.74172592163086, "global_step": 97634, "epoch": 806} {"train_loss": -38.335689544677734, "global_step": 97635, "epoch": 806} {"train_loss": -37.92212677001953, "global_step": 97636, "epoch": 806} {"train_loss": -37.58870315551758, "global_step": 97637, "epoch": 806} {"train_loss": -37.43970489501953, "global_step": 97638, "epoch": 806} {"train_loss": -37.500640869140625, "global_step": 97639, "epoch": 806} {"train_loss": -37.157535552978516, "global_step": 97640, "epoch": 806} {"train_loss": -37.51294708251953, "global_step": 97641, "epoch": 806} {"train_loss": -36.26797103881836, "global_step": 97642, "epoch": 806} {"train_loss": -27.209720611572266, "global_step": 97643, "epoch": 806} {"train_loss": -31.605819702148438, "global_step": 97644, "epoch": 806} {"train_loss": -35.035430908203125, "global_step": 97645, "epoch": 806} {"train_loss": -37.763381232900066, "global_step": 97646, "epoch": 806, "val_loss": 2708926.75} {"train_loss": -35.44211959838867, "global_step": 97647, "epoch": 807} {"train_loss": -24.68406867980957, "global_step": 97648, "epoch": 807} {"train_loss": -35.71812438964844, "global_step": 97649, "epoch": 807} {"train_loss": -34.667537689208984, "global_step": 97650, "epoch": 807} {"train_loss": -26.985137939453125, "global_step": 97651, "epoch": 807} {"train_loss": -33.49729537963867, "global_step": 97652, "epoch": 807} {"train_loss": -32.8235969543457, "global_step": 97653, "epoch": 807} {"train_loss": -28.110105514526367, "global_step": 97654, "epoch": 807} {"train_loss": -34.230804443359375, "global_step": 97655, "epoch": 807} {"train_loss": -31.9168643951416, "global_step": 97656, "epoch": 807} {"train_loss": -32.870948791503906, "global_step": 97657, "epoch": 807} {"train_loss": -32.22385787963867, "global_step": 97658, "epoch": 807} {"train_loss": -32.755489349365234, "global_step": 97659, "epoch": 807} {"train_loss": -31.6810245513916, "global_step": 97660, "epoch": 807} {"train_loss": -30.040502548217773, "global_step": 97661, "epoch": 807} {"train_loss": -30.92134666442871, "global_step": 97662, "epoch": 807} {"train_loss": -13.080592155456543, "global_step": 97663, "epoch": 807} {"train_loss": -32.781890869140625, "global_step": 97664, "epoch": 807} {"train_loss": -29.574914932250977, "global_step": 97665, "epoch": 807} {"train_loss": -30.143335342407227, "global_step": 97666, "epoch": 807} {"train_loss": -28.96076011657715, "global_step": 97667, "epoch": 807} {"train_loss": -24.53521156311035, "global_step": 97668, "epoch": 807} {"train_loss": -29.233213424682617, "global_step": 97669, "epoch": 807} {"train_loss": -31.189802169799805, "global_step": 97670, "epoch": 807} {"train_loss": -33.46100616455078, "global_step": 97671, "epoch": 807} {"train_loss": -31.30568504333496, "global_step": 97672, "epoch": 807} {"train_loss": -34.40749740600586, "global_step": 97673, "epoch": 807} {"train_loss": -32.07476043701172, "global_step": 97674, "epoch": 807} {"train_loss": -32.426910400390625, "global_step": 97675, "epoch": 807} {"train_loss": -33.37279510498047, "global_step": 97676, "epoch": 807} {"train_loss": -33.80364990234375, "global_step": 97677, "epoch": 807} {"train_loss": -32.99287033081055, "global_step": 97678, "epoch": 807} {"train_loss": -32.598201751708984, "global_step": 97679, "epoch": 807} {"train_loss": -33.57339096069336, "global_step": 97680, "epoch": 807} {"train_loss": -34.380950927734375, "global_step": 97681, "epoch": 807} {"train_loss": -32.256160736083984, "global_step": 97682, "epoch": 807} {"train_loss": -32.885467529296875, "global_step": 97683, "epoch": 807} {"train_loss": -31.95822525024414, "global_step": 97684, "epoch": 807} {"train_loss": -34.34693908691406, "global_step": 97685, "epoch": 807} {"train_loss": -34.058860778808594, "global_step": 97686, "epoch": 807} {"train_loss": -34.373531341552734, "global_step": 97687, "epoch": 807} {"train_loss": -34.83792495727539, "global_step": 97688, "epoch": 807} {"train_loss": -34.79267883300781, "global_step": 97689, "epoch": 807} {"train_loss": -35.02655029296875, "global_step": 97690, "epoch": 807} {"train_loss": -35.15719223022461, "global_step": 97691, "epoch": 807} {"train_loss": -34.12363815307617, "global_step": 97692, "epoch": 807} {"train_loss": -34.88767623901367, "global_step": 97693, "epoch": 807} {"train_loss": -35.181392669677734, "global_step": 97694, "epoch": 807} {"train_loss": -35.2664794921875, "global_step": 97695, "epoch": 807} {"train_loss": -34.96516036987305, "global_step": 97696, "epoch": 807} {"train_loss": -35.16755294799805, "global_step": 97697, "epoch": 807} {"train_loss": -35.2379264831543, "global_step": 97698, "epoch": 807} {"train_loss": -35.63526916503906, "global_step": 97699, "epoch": 807} {"train_loss": -35.42667770385742, "global_step": 97700, "epoch": 807} {"train_loss": -35.48836898803711, "global_step": 97701, "epoch": 807} {"train_loss": -34.46651077270508, "global_step": 97702, "epoch": 807} {"train_loss": -34.59381103515625, "global_step": 97703, "epoch": 807} {"train_loss": -35.634033203125, "global_step": 97704, "epoch": 807} {"train_loss": -35.726287841796875, "global_step": 97705, "epoch": 807} {"train_loss": -35.79234313964844, "global_step": 97706, "epoch": 807} {"train_loss": -35.55498504638672, "global_step": 97707, "epoch": 807} {"train_loss": -35.802978515625, "global_step": 97708, "epoch": 807} {"train_loss": -36.19927978515625, "global_step": 97709, "epoch": 807} {"train_loss": -36.259735107421875, "global_step": 97710, "epoch": 807} {"train_loss": -35.07352828979492, "global_step": 97711, "epoch": 807} {"train_loss": -35.207977294921875, "global_step": 97712, "epoch": 807} {"train_loss": -35.88137435913086, "global_step": 97713, "epoch": 807} {"train_loss": -36.0145263671875, "global_step": 97714, "epoch": 807} {"train_loss": -35.610565185546875, "global_step": 97715, "epoch": 807} {"train_loss": -35.92792510986328, "global_step": 97716, "epoch": 807} {"train_loss": -36.38827133178711, "global_step": 97717, "epoch": 807} {"train_loss": -35.28978729248047, "global_step": 97718, "epoch": 807} {"train_loss": -35.88483810424805, "global_step": 97719, "epoch": 807} {"train_loss": -36.31378936767578, "global_step": 97720, "epoch": 807} {"train_loss": -36.366615295410156, "global_step": 97721, "epoch": 807} {"train_loss": -36.55585479736328, "global_step": 97722, "epoch": 807} {"train_loss": -34.8689079284668, "global_step": 97723, "epoch": 807} {"train_loss": -36.22428512573242, "global_step": 97724, "epoch": 807} {"train_loss": -36.26408004760742, "global_step": 97725, "epoch": 807} {"train_loss": -36.431392669677734, "global_step": 97726, "epoch": 807} {"train_loss": -35.42182922363281, "global_step": 97727, "epoch": 807} {"train_loss": -35.63853454589844, "global_step": 97728, "epoch": 807} {"train_loss": -36.169410705566406, "global_step": 97729, "epoch": 807} {"train_loss": -36.30766677856445, "global_step": 97730, "epoch": 807} {"train_loss": -36.766441345214844, "global_step": 97731, "epoch": 807} {"train_loss": -36.51894760131836, "global_step": 97732, "epoch": 807} {"train_loss": -37.08892822265625, "global_step": 97733, "epoch": 807} {"train_loss": -36.700469970703125, "global_step": 97734, "epoch": 807} {"train_loss": -36.908294677734375, "global_step": 97735, "epoch": 807} {"train_loss": -36.81062698364258, "global_step": 97736, "epoch": 807} {"train_loss": -37.02268600463867, "global_step": 97737, "epoch": 807} {"train_loss": -37.0504264831543, "global_step": 97738, "epoch": 807} {"train_loss": -36.62035369873047, "global_step": 97739, "epoch": 807} {"train_loss": -37.058998107910156, "global_step": 97740, "epoch": 807} {"train_loss": -37.0152473449707, "global_step": 97741, "epoch": 807} {"train_loss": -36.639827728271484, "global_step": 97742, "epoch": 807} {"train_loss": -37.057350158691406, "global_step": 97743, "epoch": 807} {"train_loss": -37.441646575927734, "global_step": 97744, "epoch": 807} {"train_loss": -36.62355422973633, "global_step": 97745, "epoch": 807} {"train_loss": -36.644142150878906, "global_step": 97746, "epoch": 807} {"train_loss": -37.278438568115234, "global_step": 97747, "epoch": 807} {"train_loss": -37.2523307800293, "global_step": 97748, "epoch": 807} {"train_loss": -37.193603515625, "global_step": 97749, "epoch": 807} {"train_loss": -36.361488342285156, "global_step": 97750, "epoch": 807} {"train_loss": -37.708953857421875, "global_step": 97751, "epoch": 807} {"train_loss": -37.62783432006836, "global_step": 97752, "epoch": 807} {"train_loss": -36.435333251953125, "global_step": 97753, "epoch": 807} {"train_loss": -37.617610931396484, "global_step": 97754, "epoch": 807} {"train_loss": -37.22005081176758, "global_step": 97755, "epoch": 807} {"train_loss": -36.890525817871094, "global_step": 97756, "epoch": 807} {"train_loss": -37.33164596557617, "global_step": 97757, "epoch": 807} {"train_loss": -36.882476806640625, "global_step": 97758, "epoch": 807} {"train_loss": -37.09403991699219, "global_step": 97759, "epoch": 807} {"train_loss": -37.18154525756836, "global_step": 97760, "epoch": 807} {"train_loss": -37.397117614746094, "global_step": 97761, "epoch": 807} {"train_loss": -37.518306732177734, "global_step": 97762, "epoch": 807} {"train_loss": -37.477901458740234, "global_step": 97763, "epoch": 807} {"train_loss": -37.546600341796875, "global_step": 97764, "epoch": 807} {"train_loss": -37.76826095581055, "global_step": 97765, "epoch": 807} {"train_loss": -37.24808883666992, "global_step": 97766, "epoch": 807} {"train_loss": -34.6575175592722, "global_step": 97767, "epoch": 807, "val_loss": 2616904.5} {"train_loss": -37.69623947143555, "global_step": 97768, "epoch": 808} {"train_loss": -37.79133224487305, "global_step": 97769, "epoch": 808} {"train_loss": -37.35966873168945, "global_step": 97770, "epoch": 808} {"train_loss": -37.779693603515625, "global_step": 97771, "epoch": 808} {"train_loss": -37.94096755981445, "global_step": 97772, "epoch": 808} {"train_loss": -37.58916091918945, "global_step": 97773, "epoch": 808} {"train_loss": -37.76530075073242, "global_step": 97774, "epoch": 808} {"train_loss": -37.8546142578125, "global_step": 97775, "epoch": 808} {"train_loss": -37.91460418701172, "global_step": 97776, "epoch": 808} {"train_loss": -38.25720977783203, "global_step": 97777, "epoch": 808} {"train_loss": -38.19157028198242, "global_step": 97778, "epoch": 808} {"train_loss": -38.17363357543945, "global_step": 97779, "epoch": 808} {"train_loss": -38.154903411865234, "global_step": 97780, "epoch": 808} {"train_loss": -38.44809341430664, "global_step": 97781, "epoch": 808} {"train_loss": -38.46725082397461, "global_step": 97782, "epoch": 808} {"train_loss": -38.00910568237305, "global_step": 97783, "epoch": 808} {"train_loss": -38.47121047973633, "global_step": 97784, "epoch": 808} {"train_loss": -38.04776382446289, "global_step": 97785, "epoch": 808} {"train_loss": -37.89342498779297, "global_step": 97786, "epoch": 808} {"train_loss": -38.7041130065918, "global_step": 97787, "epoch": 808} {"train_loss": -37.967132568359375, "global_step": 97788, "epoch": 808} {"train_loss": -38.23441696166992, "global_step": 97789, "epoch": 808} {"train_loss": -37.689815521240234, "global_step": 97790, "epoch": 808} {"train_loss": -38.38945007324219, "global_step": 97791, "epoch": 808} {"train_loss": -38.33210372924805, "global_step": 97792, "epoch": 808} {"train_loss": -38.62456130981445, "global_step": 97793, "epoch": 808} {"train_loss": -38.48602294921875, "global_step": 97794, "epoch": 808} {"train_loss": -38.19186019897461, "global_step": 97795, "epoch": 808} {"train_loss": -38.21263885498047, "global_step": 97796, "epoch": 808} {"train_loss": -37.411582946777344, "global_step": 97797, "epoch": 808} {"train_loss": -34.93168640136719, "global_step": 97798, "epoch": 808} {"train_loss": -34.29087448120117, "global_step": 97799, "epoch": 808} {"train_loss": -30.249088287353516, "global_step": 97800, "epoch": 808} {"train_loss": -27.277179718017578, "global_step": 97801, "epoch": 808} {"train_loss": -31.648181915283203, "global_step": 97802, "epoch": 808} {"train_loss": -36.71383285522461, "global_step": 97803, "epoch": 808} {"train_loss": -37.694908142089844, "global_step": 97804, "epoch": 808} {"train_loss": -36.4803466796875, "global_step": 97805, "epoch": 808} {"train_loss": -37.70924758911133, "global_step": 97806, "epoch": 808} {"train_loss": -38.375221252441406, "global_step": 97807, "epoch": 808} {"train_loss": -37.11256790161133, "global_step": 97808, "epoch": 808} {"train_loss": -38.5196533203125, "global_step": 97809, "epoch": 808} {"train_loss": -38.22292709350586, "global_step": 97810, "epoch": 808} {"train_loss": -38.46608352661133, "global_step": 97811, "epoch": 808} {"train_loss": -38.459285736083984, "global_step": 97812, "epoch": 808} {"train_loss": -38.07197189331055, "global_step": 97813, "epoch": 808} {"train_loss": -38.471370697021484, "global_step": 97814, "epoch": 808} {"train_loss": -38.512020111083984, "global_step": 97815, "epoch": 808} {"train_loss": -38.3639030456543, "global_step": 97816, "epoch": 808} {"train_loss": -38.49834060668945, "global_step": 97817, "epoch": 808} {"train_loss": -37.81366729736328, "global_step": 97818, "epoch": 808} {"train_loss": -38.53346633911133, "global_step": 97819, "epoch": 808} {"train_loss": -38.25617599487305, "global_step": 97820, "epoch": 808} {"train_loss": -38.623619079589844, "global_step": 97821, "epoch": 808} {"train_loss": -38.58538055419922, "global_step": 97822, "epoch": 808} {"train_loss": -38.23319625854492, "global_step": 97823, "epoch": 808} {"train_loss": -38.147865295410156, "global_step": 97824, "epoch": 808} {"train_loss": -38.75852584838867, "global_step": 97825, "epoch": 808} {"train_loss": -38.70074462890625, "global_step": 97826, "epoch": 808} {"train_loss": -38.823936462402344, "global_step": 97827, "epoch": 808} {"train_loss": -38.401546478271484, "global_step": 97828, "epoch": 808} {"train_loss": -38.50032424926758, "global_step": 97829, "epoch": 808} {"train_loss": -38.06379318237305, "global_step": 97830, "epoch": 808} {"train_loss": -36.75303268432617, "global_step": 97831, "epoch": 808} {"train_loss": -36.9680290222168, "global_step": 97832, "epoch": 808} {"train_loss": -35.72774124145508, "global_step": 97833, "epoch": 808} {"train_loss": -35.088375091552734, "global_step": 97834, "epoch": 808} {"train_loss": -38.38853454589844, "global_step": 97835, "epoch": 808} {"train_loss": -35.81312942504883, "global_step": 97836, "epoch": 808} {"train_loss": -34.572811126708984, "global_step": 97837, "epoch": 808} {"train_loss": -37.326778411865234, "global_step": 97838, "epoch": 808} {"train_loss": -27.761865615844727, "global_step": 97839, "epoch": 808} {"train_loss": -35.84386444091797, "global_step": 97840, "epoch": 808} {"train_loss": -32.603370666503906, "global_step": 97841, "epoch": 808} {"train_loss": -35.042022705078125, "global_step": 97842, "epoch": 808} {"train_loss": -35.8275146484375, "global_step": 97843, "epoch": 808} {"train_loss": -35.85490036010742, "global_step": 97844, "epoch": 808} {"train_loss": -36.92922592163086, "global_step": 97845, "epoch": 808} {"train_loss": -37.27891159057617, "global_step": 97846, "epoch": 808} {"train_loss": -36.76009750366211, "global_step": 97847, "epoch": 808} {"train_loss": -36.726234436035156, "global_step": 97848, "epoch": 808} {"train_loss": -37.27862548828125, "global_step": 97849, "epoch": 808} {"train_loss": -37.31903839111328, "global_step": 97850, "epoch": 808} {"train_loss": -37.4235725402832, "global_step": 97851, "epoch": 808} {"train_loss": -38.36066818237305, "global_step": 97852, "epoch": 808} {"train_loss": -37.33797836303711, "global_step": 97853, "epoch": 808} {"train_loss": -38.65694808959961, "global_step": 97854, "epoch": 808} {"train_loss": -36.97319030761719, "global_step": 97855, "epoch": 808} {"train_loss": -38.105106353759766, "global_step": 97856, "epoch": 808} {"train_loss": -37.915069580078125, "global_step": 97857, "epoch": 808} {"train_loss": -38.5733642578125, "global_step": 97858, "epoch": 808} {"train_loss": -37.30134201049805, "global_step": 97859, "epoch": 808} {"train_loss": -37.36649703979492, "global_step": 97860, "epoch": 808} {"train_loss": -38.708106994628906, "global_step": 97861, "epoch": 808} {"train_loss": -37.8441162109375, "global_step": 97862, "epoch": 808} {"train_loss": -38.514644622802734, "global_step": 97863, "epoch": 808} {"train_loss": -37.18935775756836, "global_step": 97864, "epoch": 808} {"train_loss": -38.667266845703125, "global_step": 97865, "epoch": 808} {"train_loss": -37.8433837890625, "global_step": 97866, "epoch": 808} {"train_loss": -38.33323287963867, "global_step": 97867, "epoch": 808} {"train_loss": -38.915748596191406, "global_step": 97868, "epoch": 808} {"train_loss": -38.59796905517578, "global_step": 97869, "epoch": 808} {"train_loss": -38.45789337158203, "global_step": 97870, "epoch": 808} {"train_loss": -38.951454162597656, "global_step": 97871, "epoch": 808} {"train_loss": -38.442230224609375, "global_step": 97872, "epoch": 808} {"train_loss": -38.44641876220703, "global_step": 97873, "epoch": 808} {"train_loss": -38.31483459472656, "global_step": 97874, "epoch": 808} {"train_loss": -38.81848907470703, "global_step": 97875, "epoch": 808} {"train_loss": -38.87040328979492, "global_step": 97876, "epoch": 808} {"train_loss": -38.55659866333008, "global_step": 97877, "epoch": 808} {"train_loss": -37.79743576049805, "global_step": 97878, "epoch": 808} {"train_loss": -39.24591827392578, "global_step": 97879, "epoch": 808} {"train_loss": -38.857967376708984, "global_step": 97880, "epoch": 808} {"train_loss": -38.24825668334961, "global_step": 97881, "epoch": 808} {"train_loss": -38.4974479675293, "global_step": 97882, "epoch": 808} {"train_loss": -38.30852127075195, "global_step": 97883, "epoch": 808} {"train_loss": -38.52399826049805, "global_step": 97884, "epoch": 808} {"train_loss": -38.1917724609375, "global_step": 97885, "epoch": 808} {"train_loss": -38.85530471801758, "global_step": 97886, "epoch": 808} {"train_loss": -38.61183547973633, "global_step": 97887, "epoch": 808} {"train_loss": -37.525823845351034, "global_step": 97888, "epoch": 808, "val_loss": 2660710.75} {"train_loss": -39.091094970703125, "global_step": 97889, "epoch": 809} {"train_loss": -38.835453033447266, "global_step": 97890, "epoch": 809} {"train_loss": -39.28627395629883, "global_step": 97891, "epoch": 809} {"train_loss": -39.31440734863281, "global_step": 97892, "epoch": 809} {"train_loss": -39.36267852783203, "global_step": 97893, "epoch": 809} {"train_loss": -37.99583435058594, "global_step": 97894, "epoch": 809} {"train_loss": -38.7391357421875, "global_step": 97895, "epoch": 809} {"train_loss": -38.69315719604492, "global_step": 97896, "epoch": 809} {"train_loss": -39.076663970947266, "global_step": 97897, "epoch": 809} {"train_loss": -38.725440979003906, "global_step": 97898, "epoch": 809} {"train_loss": -38.8071174621582, "global_step": 97899, "epoch": 809} {"train_loss": -39.43960189819336, "global_step": 97900, "epoch": 809} {"train_loss": -39.18770980834961, "global_step": 97901, "epoch": 809} {"train_loss": -38.57850646972656, "global_step": 97902, "epoch": 809} {"train_loss": -39.32265853881836, "global_step": 97903, "epoch": 809} {"train_loss": -39.04753494262695, "global_step": 97904, "epoch": 809} {"train_loss": -37.16013717651367, "global_step": 97905, "epoch": 809} {"train_loss": -37.261070251464844, "global_step": 97906, "epoch": 809} {"train_loss": -37.588802337646484, "global_step": 97907, "epoch": 809} {"train_loss": -36.63092041015625, "global_step": 97908, "epoch": 809} {"train_loss": -37.3581657409668, "global_step": 97909, "epoch": 809} {"train_loss": -37.01953887939453, "global_step": 97910, "epoch": 809} {"train_loss": -38.393245697021484, "global_step": 97911, "epoch": 809} {"train_loss": -36.360103607177734, "global_step": 97912, "epoch": 809} {"train_loss": -33.323150634765625, "global_step": 97913, "epoch": 809} {"train_loss": -33.06525421142578, "global_step": 97914, "epoch": 809} {"train_loss": -37.058624267578125, "global_step": 97915, "epoch": 809} {"train_loss": -36.487430572509766, "global_step": 97916, "epoch": 809} {"train_loss": -32.24076461791992, "global_step": 97917, "epoch": 809} {"train_loss": -34.92380905151367, "global_step": 97918, "epoch": 809} {"train_loss": -35.61061477661133, "global_step": 97919, "epoch": 809} {"train_loss": -35.288116455078125, "global_step": 97920, "epoch": 809} {"train_loss": -36.91511535644531, "global_step": 97921, "epoch": 809} {"train_loss": -35.3978271484375, "global_step": 97922, "epoch": 809} {"train_loss": -36.082008361816406, "global_step": 97923, "epoch": 809} {"train_loss": -29.478113174438477, "global_step": 97924, "epoch": 809} {"train_loss": -35.49851608276367, "global_step": 97925, "epoch": 809} {"train_loss": -36.30720138549805, "global_step": 97926, "epoch": 809} {"train_loss": -36.19576644897461, "global_step": 97927, "epoch": 809} {"train_loss": -36.70643615722656, "global_step": 97928, "epoch": 809} {"train_loss": -36.37679672241211, "global_step": 97929, "epoch": 809} {"train_loss": -35.53094482421875, "global_step": 97930, "epoch": 809} {"train_loss": -35.316383361816406, "global_step": 97931, "epoch": 809} {"train_loss": -35.96786880493164, "global_step": 97932, "epoch": 809} {"train_loss": -33.27815628051758, "global_step": 97933, "epoch": 809} {"train_loss": -34.6318244934082, "global_step": 97934, "epoch": 809} {"train_loss": -36.15570831298828, "global_step": 97935, "epoch": 809} {"train_loss": -37.373348236083984, "global_step": 97936, "epoch": 809} {"train_loss": -32.23053741455078, "global_step": 97937, "epoch": 809} {"train_loss": -31.02448081970215, "global_step": 97938, "epoch": 809} {"train_loss": -35.67580032348633, "global_step": 97939, "epoch": 809} {"train_loss": -34.6154899597168, "global_step": 97940, "epoch": 809} {"train_loss": -35.85968017578125, "global_step": 97941, "epoch": 809} {"train_loss": -35.767738342285156, "global_step": 97942, "epoch": 809} {"train_loss": -34.42805862426758, "global_step": 97943, "epoch": 809} {"train_loss": -31.28377342224121, "global_step": 97944, "epoch": 809} {"train_loss": -36.33234786987305, "global_step": 97945, "epoch": 809} {"train_loss": -37.06664276123047, "global_step": 97946, "epoch": 809} {"train_loss": -31.322650909423828, "global_step": 97947, "epoch": 809} {"train_loss": -35.79585647583008, "global_step": 97948, "epoch": 809} {"train_loss": -32.73234176635742, "global_step": 97949, "epoch": 809} {"train_loss": -34.848793029785156, "global_step": 97950, "epoch": 809} {"train_loss": -32.6186408996582, "global_step": 97951, "epoch": 809} {"train_loss": -35.88845443725586, "global_step": 97952, "epoch": 809} {"train_loss": -34.299285888671875, "global_step": 97953, "epoch": 809} {"train_loss": -36.04186248779297, "global_step": 97954, "epoch": 809} {"train_loss": -34.55479049682617, "global_step": 97955, "epoch": 809} {"train_loss": -35.45309829711914, "global_step": 97956, "epoch": 809} {"train_loss": -33.63798904418945, "global_step": 97957, "epoch": 809} {"train_loss": -34.29571533203125, "global_step": 97958, "epoch": 809} {"train_loss": -32.501617431640625, "global_step": 97959, "epoch": 809} {"train_loss": -35.05072021484375, "global_step": 97960, "epoch": 809} {"train_loss": -34.62095260620117, "global_step": 97961, "epoch": 809} {"train_loss": -35.282386779785156, "global_step": 97962, "epoch": 809} {"train_loss": -34.658363342285156, "global_step": 97963, "epoch": 809} {"train_loss": -34.85187530517578, "global_step": 97964, "epoch": 809} {"train_loss": -32.589107513427734, "global_step": 97965, "epoch": 809} {"train_loss": -34.88210678100586, "global_step": 97966, "epoch": 809} {"train_loss": -35.42926788330078, "global_step": 97967, "epoch": 809} {"train_loss": -35.34105682373047, "global_step": 97968, "epoch": 809} {"train_loss": -36.05992889404297, "global_step": 97969, "epoch": 809} {"train_loss": -35.5573844909668, "global_step": 97970, "epoch": 809} {"train_loss": -34.19763946533203, "global_step": 97971, "epoch": 809} {"train_loss": -36.14569854736328, "global_step": 97972, "epoch": 809} {"train_loss": -35.4776611328125, "global_step": 97973, "epoch": 809} {"train_loss": -35.514625549316406, "global_step": 97974, "epoch": 809} {"train_loss": -35.92892074584961, "global_step": 97975, "epoch": 809} {"train_loss": -36.014556884765625, "global_step": 97976, "epoch": 809} {"train_loss": -36.58297348022461, "global_step": 97977, "epoch": 809} {"train_loss": -36.80859375, "global_step": 97978, "epoch": 809} {"train_loss": -36.766624450683594, "global_step": 97979, "epoch": 809} {"train_loss": -37.04435348510742, "global_step": 97980, "epoch": 809} {"train_loss": -36.58358383178711, "global_step": 97981, "epoch": 809} {"train_loss": -37.30937957763672, "global_step": 97982, "epoch": 809} {"train_loss": -36.19148254394531, "global_step": 97983, "epoch": 809} {"train_loss": -36.58712387084961, "global_step": 97984, "epoch": 809} {"train_loss": -36.431522369384766, "global_step": 97985, "epoch": 809} {"train_loss": -37.247962951660156, "global_step": 97986, "epoch": 809} {"train_loss": -37.054012298583984, "global_step": 97987, "epoch": 809} {"train_loss": -37.2113151550293, "global_step": 97988, "epoch": 809} {"train_loss": -37.009765625, "global_step": 97989, "epoch": 809} {"train_loss": -36.60918426513672, "global_step": 97990, "epoch": 809} {"train_loss": -36.748268127441406, "global_step": 97991, "epoch": 809} {"train_loss": -36.54536437988281, "global_step": 97992, "epoch": 809} {"train_loss": -36.82803726196289, "global_step": 97993, "epoch": 809} {"train_loss": -37.957454681396484, "global_step": 97994, "epoch": 809} {"train_loss": -37.50503921508789, "global_step": 97995, "epoch": 809} {"train_loss": -37.50037384033203, "global_step": 97996, "epoch": 809} {"train_loss": -37.96137237548828, "global_step": 97997, "epoch": 809} {"train_loss": -37.310428619384766, "global_step": 97998, "epoch": 809} {"train_loss": -37.199119567871094, "global_step": 97999, "epoch": 809} {"train_loss": -37.369197845458984, "global_step": 98000, "epoch": 809} {"train_loss": -37.94096755981445, "global_step": 98001, "epoch": 809} {"train_loss": -37.9210319519043, "global_step": 98002, "epoch": 809} {"train_loss": -37.56280517578125, "global_step": 98003, "epoch": 809} {"train_loss": -37.861454010009766, "global_step": 98004, "epoch": 809} {"train_loss": -37.365352630615234, "global_step": 98005, "epoch": 809} {"train_loss": -37.46543502807617, "global_step": 98006, "epoch": 809} {"train_loss": -37.79678726196289, "global_step": 98007, "epoch": 809} {"train_loss": -37.81081008911133, "global_step": 98008, "epoch": 809} {"train_loss": -36.20063947252006, "global_step": 98009, "epoch": 809, "val_loss": 2627068.25} {"train_loss": -37.69706726074219, "global_step": 98010, "epoch": 810} {"train_loss": -38.143802642822266, "global_step": 98011, "epoch": 810} {"train_loss": -37.5443000793457, "global_step": 98012, "epoch": 810} {"train_loss": -38.57761764526367, "global_step": 98013, "epoch": 810} {"train_loss": -38.02695846557617, "global_step": 98014, "epoch": 810} {"train_loss": -38.05472946166992, "global_step": 98015, "epoch": 810} {"train_loss": -38.48618698120117, "global_step": 98016, "epoch": 810} {"train_loss": -37.930477142333984, "global_step": 98017, "epoch": 810} {"train_loss": -38.2955207824707, "global_step": 98018, "epoch": 810} {"train_loss": -38.05419921875, "global_step": 98019, "epoch": 810} {"train_loss": -38.3931999206543, "global_step": 98020, "epoch": 810} {"train_loss": -38.35294723510742, "global_step": 98021, "epoch": 810} {"train_loss": -38.26185989379883, "global_step": 98022, "epoch": 810} {"train_loss": -38.16116714477539, "global_step": 98023, "epoch": 810} {"train_loss": -38.47758102416992, "global_step": 98024, "epoch": 810} {"train_loss": -38.29216384887695, "global_step": 98025, "epoch": 810} {"train_loss": -38.79952621459961, "global_step": 98026, "epoch": 810} {"train_loss": -38.79318618774414, "global_step": 98027, "epoch": 810} {"train_loss": -38.745609283447266, "global_step": 98028, "epoch": 810} {"train_loss": -38.78062057495117, "global_step": 98029, "epoch": 810} {"train_loss": -38.58662033081055, "global_step": 98030, "epoch": 810} {"train_loss": -38.35841751098633, "global_step": 98031, "epoch": 810} {"train_loss": -38.62197494506836, "global_step": 98032, "epoch": 810} {"train_loss": -38.68130111694336, "global_step": 98033, "epoch": 810} {"train_loss": -38.88840866088867, "global_step": 98034, "epoch": 810} {"train_loss": -38.82740020751953, "global_step": 98035, "epoch": 810} {"train_loss": -38.6834602355957, "global_step": 98036, "epoch": 810} {"train_loss": -38.521095275878906, "global_step": 98037, "epoch": 810} {"train_loss": -38.81924057006836, "global_step": 98038, "epoch": 810} {"train_loss": -38.260101318359375, "global_step": 98039, "epoch": 810} {"train_loss": -38.55498123168945, "global_step": 98040, "epoch": 810} {"train_loss": -36.20648193359375, "global_step": 98041, "epoch": 810} {"train_loss": -36.288665771484375, "global_step": 98042, "epoch": 810} {"train_loss": -37.618770599365234, "global_step": 98043, "epoch": 810} {"train_loss": -36.70425796508789, "global_step": 98044, "epoch": 810} {"train_loss": -36.682289123535156, "global_step": 98045, "epoch": 810} {"train_loss": -37.41262435913086, "global_step": 98046, "epoch": 810} {"train_loss": -36.46580123901367, "global_step": 98047, "epoch": 810} {"train_loss": -36.991844177246094, "global_step": 98048, "epoch": 810} {"train_loss": -35.177425384521484, "global_step": 98049, "epoch": 810} {"train_loss": -32.040401458740234, "global_step": 98050, "epoch": 810} {"train_loss": -37.52939987182617, "global_step": 98051, "epoch": 810} {"train_loss": -30.62348747253418, "global_step": 98052, "epoch": 810} {"train_loss": -38.472835540771484, "global_step": 98053, "epoch": 810} {"train_loss": -33.95827102661133, "global_step": 98054, "epoch": 810} {"train_loss": -36.797874450683594, "global_step": 98055, "epoch": 810} {"train_loss": -36.45689010620117, "global_step": 98056, "epoch": 810} {"train_loss": -33.30978012084961, "global_step": 98057, "epoch": 810} {"train_loss": -37.55756378173828, "global_step": 98058, "epoch": 810} {"train_loss": -33.986244201660156, "global_step": 98059, "epoch": 810} {"train_loss": -37.20961380004883, "global_step": 98060, "epoch": 810} {"train_loss": -36.07761764526367, "global_step": 98061, "epoch": 810} {"train_loss": -36.204402923583984, "global_step": 98062, "epoch": 810} {"train_loss": -35.88032913208008, "global_step": 98063, "epoch": 810} {"train_loss": -36.945030212402344, "global_step": 98064, "epoch": 810} {"train_loss": -36.69069290161133, "global_step": 98065, "epoch": 810} {"train_loss": -35.80776596069336, "global_step": 98066, "epoch": 810} {"train_loss": -36.9898567199707, "global_step": 98067, "epoch": 810} {"train_loss": -37.471466064453125, "global_step": 98068, "epoch": 810} {"train_loss": -36.309608459472656, "global_step": 98069, "epoch": 810} {"train_loss": -36.72232437133789, "global_step": 98070, "epoch": 810} {"train_loss": -37.538631439208984, "global_step": 98071, "epoch": 810} {"train_loss": -36.558387756347656, "global_step": 98072, "epoch": 810} {"train_loss": -36.969783782958984, "global_step": 98073, "epoch": 810} {"train_loss": -37.1956672668457, "global_step": 98074, "epoch": 810} {"train_loss": -35.28272247314453, "global_step": 98075, "epoch": 810} {"train_loss": -35.00324630737305, "global_step": 98076, "epoch": 810} {"train_loss": -36.779232025146484, "global_step": 98077, "epoch": 810} {"train_loss": -37.934608459472656, "global_step": 98078, "epoch": 810} {"train_loss": -37.42837142944336, "global_step": 98079, "epoch": 810} {"train_loss": -37.271183013916016, "global_step": 98080, "epoch": 810} {"train_loss": -36.859375, "global_step": 98081, "epoch": 810} {"train_loss": -37.90055465698242, "global_step": 98082, "epoch": 810} {"train_loss": -37.58345031738281, "global_step": 98083, "epoch": 810} {"train_loss": -37.729286193847656, "global_step": 98084, "epoch": 810} {"train_loss": -38.127323150634766, "global_step": 98085, "epoch": 810} {"train_loss": -38.48801803588867, "global_step": 98086, "epoch": 810} {"train_loss": -38.251705169677734, "global_step": 98087, "epoch": 810} {"train_loss": -38.54470443725586, "global_step": 98088, "epoch": 810} {"train_loss": -38.50627899169922, "global_step": 98089, "epoch": 810} {"train_loss": -37.30569076538086, "global_step": 98090, "epoch": 810} {"train_loss": -38.67708206176758, "global_step": 98091, "epoch": 810} {"train_loss": -38.57997512817383, "global_step": 98092, "epoch": 810} {"train_loss": -38.45402908325195, "global_step": 98093, "epoch": 810} {"train_loss": -37.631996154785156, "global_step": 98094, "epoch": 810} {"train_loss": -38.91951370239258, "global_step": 98095, "epoch": 810} {"train_loss": -38.48200225830078, "global_step": 98096, "epoch": 810} {"train_loss": -39.025733947753906, "global_step": 98097, "epoch": 810} {"train_loss": -38.18696975708008, "global_step": 98098, "epoch": 810} {"train_loss": -38.3233642578125, "global_step": 98099, "epoch": 810} {"train_loss": -38.91050338745117, "global_step": 98100, "epoch": 810} {"train_loss": -38.50291442871094, "global_step": 98101, "epoch": 810} {"train_loss": -38.223812103271484, "global_step": 98102, "epoch": 810} {"train_loss": -38.8803596496582, "global_step": 98103, "epoch": 810} {"train_loss": -38.679054260253906, "global_step": 98104, "epoch": 810} {"train_loss": -39.06721115112305, "global_step": 98105, "epoch": 810} {"train_loss": -38.946083068847656, "global_step": 98106, "epoch": 810} {"train_loss": -38.376522064208984, "global_step": 98107, "epoch": 810} {"train_loss": -38.85260009765625, "global_step": 98108, "epoch": 810} {"train_loss": -38.99879837036133, "global_step": 98109, "epoch": 810} {"train_loss": -39.15228271484375, "global_step": 98110, "epoch": 810} {"train_loss": -38.23896408081055, "global_step": 98111, "epoch": 810} {"train_loss": -38.187808990478516, "global_step": 98112, "epoch": 810} {"train_loss": -37.69095993041992, "global_step": 98113, "epoch": 810} {"train_loss": -38.82984161376953, "global_step": 98114, "epoch": 810} {"train_loss": -39.1312370300293, "global_step": 98115, "epoch": 810} {"train_loss": -38.97152328491211, "global_step": 98116, "epoch": 810} {"train_loss": -38.85679244995117, "global_step": 98117, "epoch": 810} {"train_loss": -38.76896286010742, "global_step": 98118, "epoch": 810} {"train_loss": -38.985206604003906, "global_step": 98119, "epoch": 810} {"train_loss": -39.031307220458984, "global_step": 98120, "epoch": 810} {"train_loss": -38.88114547729492, "global_step": 98121, "epoch": 810} {"train_loss": -39.50365447998047, "global_step": 98122, "epoch": 810} {"train_loss": -38.92121505737305, "global_step": 98123, "epoch": 810} {"train_loss": -39.10709762573242, "global_step": 98124, "epoch": 810} {"train_loss": -39.16455078125, "global_step": 98125, "epoch": 810} {"train_loss": -39.07123565673828, "global_step": 98126, "epoch": 810} {"train_loss": -38.3349723815918, "global_step": 98127, "epoch": 810} {"train_loss": -37.52470397949219, "global_step": 98128, "epoch": 810} {"train_loss": -35.011810302734375, "global_step": 98129, "epoch": 810} {"train_loss": -37.701474292219174, "global_step": 98130, "epoch": 810, "val_loss": 2691454.25} {"train_loss": -35.10585403442383, "global_step": 98131, "epoch": 811} {"train_loss": -33.394012451171875, "global_step": 98132, "epoch": 811} {"train_loss": -34.94969940185547, "global_step": 98133, "epoch": 811} {"train_loss": -39.0963249206543, "global_step": 98134, "epoch": 811} {"train_loss": -38.771114349365234, "global_step": 98135, "epoch": 811} {"train_loss": -37.891571044921875, "global_step": 98136, "epoch": 811} {"train_loss": -39.373104095458984, "global_step": 98137, "epoch": 811} {"train_loss": -38.69932174682617, "global_step": 98138, "epoch": 811} {"train_loss": -37.90766906738281, "global_step": 98139, "epoch": 811} {"train_loss": -38.37092590332031, "global_step": 98140, "epoch": 811} {"train_loss": -38.54426574707031, "global_step": 98141, "epoch": 811} {"train_loss": -39.03597640991211, "global_step": 98142, "epoch": 811} {"train_loss": -39.19122314453125, "global_step": 98143, "epoch": 811} {"train_loss": -38.2400016784668, "global_step": 98144, "epoch": 811} {"train_loss": -39.3121452331543, "global_step": 98145, "epoch": 811} {"train_loss": -39.40204620361328, "global_step": 98146, "epoch": 811} {"train_loss": -38.35728454589844, "global_step": 98147, "epoch": 811} {"train_loss": -39.44118118286133, "global_step": 98148, "epoch": 811} {"train_loss": -39.972503662109375, "global_step": 98149, "epoch": 811} {"train_loss": -39.203304290771484, "global_step": 98150, "epoch": 811} {"train_loss": -38.641868591308594, "global_step": 98151, "epoch": 811} {"train_loss": -38.86609649658203, "global_step": 98152, "epoch": 811} {"train_loss": -39.332027435302734, "global_step": 98153, "epoch": 811} {"train_loss": -39.051795959472656, "global_step": 98154, "epoch": 811} {"train_loss": -38.76006317138672, "global_step": 98155, "epoch": 811} {"train_loss": -39.188480377197266, "global_step": 98156, "epoch": 811} {"train_loss": -38.65655517578125, "global_step": 98157, "epoch": 811} {"train_loss": -37.46920394897461, "global_step": 98158, "epoch": 811} {"train_loss": -37.59859085083008, "global_step": 98159, "epoch": 811} {"train_loss": -37.99162673950195, "global_step": 98160, "epoch": 811} {"train_loss": -38.22904968261719, "global_step": 98161, "epoch": 811} {"train_loss": -33.23417663574219, "global_step": 98162, "epoch": 811} {"train_loss": -34.061431884765625, "global_step": 98163, "epoch": 811} {"train_loss": -34.87687301635742, "global_step": 98164, "epoch": 811} {"train_loss": -36.52285385131836, "global_step": 98165, "epoch": 811} {"train_loss": -38.95734786987305, "global_step": 98166, "epoch": 811} {"train_loss": -38.56690216064453, "global_step": 98167, "epoch": 811} {"train_loss": -35.89455795288086, "global_step": 98168, "epoch": 811} {"train_loss": -34.82854080200195, "global_step": 98169, "epoch": 811} {"train_loss": -37.06017303466797, "global_step": 98170, "epoch": 811} {"train_loss": -38.32814407348633, "global_step": 98171, "epoch": 811} {"train_loss": -36.67472839355469, "global_step": 98172, "epoch": 811} {"train_loss": -36.141815185546875, "global_step": 98173, "epoch": 811} {"train_loss": -36.05646514892578, "global_step": 98174, "epoch": 811} {"train_loss": -37.801185607910156, "global_step": 98175, "epoch": 811} {"train_loss": -35.78351974487305, "global_step": 98176, "epoch": 811} {"train_loss": -36.2270622253418, "global_step": 98177, "epoch": 811} {"train_loss": -36.816375732421875, "global_step": 98178, "epoch": 811} {"train_loss": -37.32100296020508, "global_step": 98179, "epoch": 811} {"train_loss": -38.48090362548828, "global_step": 98180, "epoch": 811} {"train_loss": -37.822540283203125, "global_step": 98181, "epoch": 811} {"train_loss": -38.12555694580078, "global_step": 98182, "epoch": 811} {"train_loss": -39.1989631652832, "global_step": 98183, "epoch": 811} {"train_loss": -37.234703063964844, "global_step": 98184, "epoch": 811} {"train_loss": -37.49067306518555, "global_step": 98185, "epoch": 811} {"train_loss": -38.290889739990234, "global_step": 98186, "epoch": 811} {"train_loss": -35.18198013305664, "global_step": 98187, "epoch": 811} {"train_loss": -38.34720993041992, "global_step": 98188, "epoch": 811} {"train_loss": -37.55393600463867, "global_step": 98189, "epoch": 811} {"train_loss": -34.747013092041016, "global_step": 98190, "epoch": 811} {"train_loss": -37.67060089111328, "global_step": 98191, "epoch": 811} {"train_loss": -37.56010818481445, "global_step": 98192, "epoch": 811} {"train_loss": -37.55599594116211, "global_step": 98193, "epoch": 811} {"train_loss": -38.21246337890625, "global_step": 98194, "epoch": 811} {"train_loss": -38.00629425048828, "global_step": 98195, "epoch": 811} {"train_loss": -37.83378219604492, "global_step": 98196, "epoch": 811} {"train_loss": -38.05544662475586, "global_step": 98197, "epoch": 811} {"train_loss": -38.475128173828125, "global_step": 98198, "epoch": 811} {"train_loss": -37.930110931396484, "global_step": 98199, "epoch": 811} {"train_loss": -38.86434555053711, "global_step": 98200, "epoch": 811} {"train_loss": -38.23111343383789, "global_step": 98201, "epoch": 811} {"train_loss": -38.59881591796875, "global_step": 98202, "epoch": 811} {"train_loss": -38.137935638427734, "global_step": 98203, "epoch": 811} {"train_loss": -38.642364501953125, "global_step": 98204, "epoch": 811} {"train_loss": -38.330787658691406, "global_step": 98205, "epoch": 811} {"train_loss": -39.25067901611328, "global_step": 98206, "epoch": 811} {"train_loss": -38.42722702026367, "global_step": 98207, "epoch": 811} {"train_loss": -39.239463806152344, "global_step": 98208, "epoch": 811} {"train_loss": -38.28450393676758, "global_step": 98209, "epoch": 811} {"train_loss": -38.83424377441406, "global_step": 98210, "epoch": 811} {"train_loss": -38.07295608520508, "global_step": 98211, "epoch": 811} {"train_loss": -38.52020263671875, "global_step": 98212, "epoch": 811} {"train_loss": -38.71550750732422, "global_step": 98213, "epoch": 811} {"train_loss": -39.16067123413086, "global_step": 98214, "epoch": 811} {"train_loss": -37.897212982177734, "global_step": 98215, "epoch": 811} {"train_loss": -38.06311798095703, "global_step": 98216, "epoch": 811} {"train_loss": -39.116939544677734, "global_step": 98217, "epoch": 811} {"train_loss": -39.28827667236328, "global_step": 98218, "epoch": 811} {"train_loss": -38.81146240234375, "global_step": 98219, "epoch": 811} {"train_loss": -39.03748321533203, "global_step": 98220, "epoch": 811} {"train_loss": -37.773136138916016, "global_step": 98221, "epoch": 811} {"train_loss": -39.3638916015625, "global_step": 98222, "epoch": 811} {"train_loss": -39.22768020629883, "global_step": 98223, "epoch": 811} {"train_loss": -39.04380416870117, "global_step": 98224, "epoch": 811} {"train_loss": -39.467830657958984, "global_step": 98225, "epoch": 811} {"train_loss": -38.724998474121094, "global_step": 98226, "epoch": 811} {"train_loss": -38.492149353027344, "global_step": 98227, "epoch": 811} {"train_loss": -38.41437911987305, "global_step": 98228, "epoch": 811} {"train_loss": -38.432533264160156, "global_step": 98229, "epoch": 811} {"train_loss": -38.92021560668945, "global_step": 98230, "epoch": 811} {"train_loss": -38.7253532409668, "global_step": 98231, "epoch": 811} {"train_loss": -38.7422981262207, "global_step": 98232, "epoch": 811} {"train_loss": -38.348018646240234, "global_step": 98233, "epoch": 811} {"train_loss": -38.20844650268555, "global_step": 98234, "epoch": 811} {"train_loss": -39.3299674987793, "global_step": 98235, "epoch": 811} {"train_loss": -39.471248626708984, "global_step": 98236, "epoch": 811} {"train_loss": -38.53428649902344, "global_step": 98237, "epoch": 811} {"train_loss": -38.4323616027832, "global_step": 98238, "epoch": 811} {"train_loss": -38.6693229675293, "global_step": 98239, "epoch": 811} {"train_loss": -38.457862854003906, "global_step": 98240, "epoch": 811} {"train_loss": -39.14387512207031, "global_step": 98241, "epoch": 811} {"train_loss": -39.70195770263672, "global_step": 98242, "epoch": 811} {"train_loss": -38.77505111694336, "global_step": 98243, "epoch": 811} {"train_loss": -38.84383010864258, "global_step": 98244, "epoch": 811} {"train_loss": -38.9707145690918, "global_step": 98245, "epoch": 811} {"train_loss": -37.43111801147461, "global_step": 98246, "epoch": 811} {"train_loss": -38.18555450439453, "global_step": 98247, "epoch": 811} {"train_loss": -37.161434173583984, "global_step": 98248, "epoch": 811} {"train_loss": -39.145423889160156, "global_step": 98249, "epoch": 811} {"train_loss": -38.3500862121582, "global_step": 98250, "epoch": 811} {"train_loss": -38.06635643825058, "global_step": 98251, "epoch": 811, "val_loss": 2678046.75} {"train_loss": -37.54929733276367, "global_step": 98252, "epoch": 812} {"train_loss": -39.16078567504883, "global_step": 98253, "epoch": 812} {"train_loss": -38.0750846862793, "global_step": 98254, "epoch": 812} {"train_loss": -38.904964447021484, "global_step": 98255, "epoch": 812} {"train_loss": -38.542964935302734, "global_step": 98256, "epoch": 812} {"train_loss": -37.49265670776367, "global_step": 98257, "epoch": 812} {"train_loss": -37.99309158325195, "global_step": 98258, "epoch": 812} {"train_loss": -36.7300910949707, "global_step": 98259, "epoch": 812} {"train_loss": -36.08073806762695, "global_step": 98260, "epoch": 812} {"train_loss": -34.840858459472656, "global_step": 98261, "epoch": 812} {"train_loss": -36.5269660949707, "global_step": 98262, "epoch": 812} {"train_loss": -37.671730041503906, "global_step": 98263, "epoch": 812} {"train_loss": -37.3394889831543, "global_step": 98264, "epoch": 812} {"train_loss": -37.87592315673828, "global_step": 98265, "epoch": 812} {"train_loss": -37.07575607299805, "global_step": 98266, "epoch": 812} {"train_loss": -37.389034271240234, "global_step": 98267, "epoch": 812} {"train_loss": -38.003753662109375, "global_step": 98268, "epoch": 812} {"train_loss": -38.3702392578125, "global_step": 98269, "epoch": 812} {"train_loss": -38.47308349609375, "global_step": 98270, "epoch": 812} {"train_loss": -38.2796630859375, "global_step": 98271, "epoch": 812} {"train_loss": -38.39358139038086, "global_step": 98272, "epoch": 812} {"train_loss": -38.73906707763672, "global_step": 98273, "epoch": 812} {"train_loss": -38.30451202392578, "global_step": 98274, "epoch": 812} {"train_loss": -38.39115905761719, "global_step": 98275, "epoch": 812} {"train_loss": -38.407554626464844, "global_step": 98276, "epoch": 812} {"train_loss": -38.54037094116211, "global_step": 98277, "epoch": 812} {"train_loss": -38.79995346069336, "global_step": 98278, "epoch": 812} {"train_loss": -38.22172164916992, "global_step": 98279, "epoch": 812} {"train_loss": -38.718074798583984, "global_step": 98280, "epoch": 812} {"train_loss": -39.05021286010742, "global_step": 98281, "epoch": 812} {"train_loss": -38.31241989135742, "global_step": 98282, "epoch": 812} {"train_loss": -39.08503723144531, "global_step": 98283, "epoch": 812} {"train_loss": -39.13551712036133, "global_step": 98284, "epoch": 812} {"train_loss": -39.311771392822266, "global_step": 98285, "epoch": 812} {"train_loss": -38.338985443115234, "global_step": 98286, "epoch": 812} {"train_loss": -39.29442596435547, "global_step": 98287, "epoch": 812} {"train_loss": -38.92521286010742, "global_step": 98288, "epoch": 812} {"train_loss": -39.3726692199707, "global_step": 98289, "epoch": 812} {"train_loss": -38.82485580444336, "global_step": 98290, "epoch": 812} {"train_loss": -39.06298828125, "global_step": 98291, "epoch": 812} {"train_loss": -38.667049407958984, "global_step": 98292, "epoch": 812} {"train_loss": -38.45458984375, "global_step": 98293, "epoch": 812} {"train_loss": -39.043453216552734, "global_step": 98294, "epoch": 812} {"train_loss": -38.14838409423828, "global_step": 98295, "epoch": 812} {"train_loss": -37.51154708862305, "global_step": 98296, "epoch": 812} {"train_loss": -37.83390808105469, "global_step": 98297, "epoch": 812} {"train_loss": -39.18561553955078, "global_step": 98298, "epoch": 812} {"train_loss": -38.65153121948242, "global_step": 98299, "epoch": 812} {"train_loss": -37.751277923583984, "global_step": 98300, "epoch": 812} {"train_loss": -38.69899368286133, "global_step": 98301, "epoch": 812} {"train_loss": -38.84061813354492, "global_step": 98302, "epoch": 812} {"train_loss": -39.39561080932617, "global_step": 98303, "epoch": 812} {"train_loss": -39.01580810546875, "global_step": 98304, "epoch": 812} {"train_loss": -39.475242614746094, "global_step": 98305, "epoch": 812} {"train_loss": -39.472259521484375, "global_step": 98306, "epoch": 812} {"train_loss": -39.21681594848633, "global_step": 98307, "epoch": 812} {"train_loss": -38.953407287597656, "global_step": 98308, "epoch": 812} {"train_loss": -39.26826858520508, "global_step": 98309, "epoch": 812} {"train_loss": -39.31940460205078, "global_step": 98310, "epoch": 812} {"train_loss": -39.66756820678711, "global_step": 98311, "epoch": 812} {"train_loss": -39.02476119995117, "global_step": 98312, "epoch": 812} {"train_loss": -39.3376579284668, "global_step": 98313, "epoch": 812} {"train_loss": -39.02827835083008, "global_step": 98314, "epoch": 812} {"train_loss": -39.206695556640625, "global_step": 98315, "epoch": 812} {"train_loss": -39.64887619018555, "global_step": 98316, "epoch": 812} {"train_loss": -39.752098083496094, "global_step": 98317, "epoch": 812} {"train_loss": -39.451995849609375, "global_step": 98318, "epoch": 812} {"train_loss": -38.9802131652832, "global_step": 98319, "epoch": 812} {"train_loss": -39.49356460571289, "global_step": 98320, "epoch": 812} {"train_loss": -39.74882125854492, "global_step": 98321, "epoch": 812} {"train_loss": -39.767879486083984, "global_step": 98322, "epoch": 812} {"train_loss": -39.85355758666992, "global_step": 98323, "epoch": 812} {"train_loss": -39.89246368408203, "global_step": 98324, "epoch": 812} {"train_loss": -39.53471755981445, "global_step": 98325, "epoch": 812} {"train_loss": -38.64521408081055, "global_step": 98326, "epoch": 812} {"train_loss": -34.561824798583984, "global_step": 98327, "epoch": 812} {"train_loss": -31.481287002563477, "global_step": 98328, "epoch": 812} {"train_loss": -38.593116760253906, "global_step": 98329, "epoch": 812} {"train_loss": -38.165374755859375, "global_step": 98330, "epoch": 812} {"train_loss": -32.8579216003418, "global_step": 98331, "epoch": 812} {"train_loss": -35.56465530395508, "global_step": 98332, "epoch": 812} {"train_loss": -38.81570816040039, "global_step": 98333, "epoch": 812} {"train_loss": -37.12470626831055, "global_step": 98334, "epoch": 812} {"train_loss": -35.08544158935547, "global_step": 98335, "epoch": 812} {"train_loss": -32.43760681152344, "global_step": 98336, "epoch": 812} {"train_loss": -38.66742706298828, "global_step": 98337, "epoch": 812} {"train_loss": -32.5346794128418, "global_step": 98338, "epoch": 812} {"train_loss": -35.8416633605957, "global_step": 98339, "epoch": 812} {"train_loss": -35.90432357788086, "global_step": 98340, "epoch": 812} {"train_loss": -36.03733825683594, "global_step": 98341, "epoch": 812} {"train_loss": -35.75568389892578, "global_step": 98342, "epoch": 812} {"train_loss": -36.184017181396484, "global_step": 98343, "epoch": 812} {"train_loss": -36.168190002441406, "global_step": 98344, "epoch": 812} {"train_loss": -36.777992248535156, "global_step": 98345, "epoch": 812} {"train_loss": -36.00349044799805, "global_step": 98346, "epoch": 812} {"train_loss": -37.54410171508789, "global_step": 98347, "epoch": 812} {"train_loss": -35.33900833129883, "global_step": 98348, "epoch": 812} {"train_loss": -35.73179626464844, "global_step": 98349, "epoch": 812} {"train_loss": -38.115150451660156, "global_step": 98350, "epoch": 812} {"train_loss": -35.55579376220703, "global_step": 98351, "epoch": 812} {"train_loss": -38.83436584472656, "global_step": 98352, "epoch": 812} {"train_loss": -35.52507400512695, "global_step": 98353, "epoch": 812} {"train_loss": -38.51778793334961, "global_step": 98354, "epoch": 812} {"train_loss": -37.1050910949707, "global_step": 98355, "epoch": 812} {"train_loss": -38.50513458251953, "global_step": 98356, "epoch": 812} {"train_loss": -37.854530334472656, "global_step": 98357, "epoch": 812} {"train_loss": -38.04043960571289, "global_step": 98358, "epoch": 812} {"train_loss": -38.62965393066406, "global_step": 98359, "epoch": 812} {"train_loss": -38.38271713256836, "global_step": 98360, "epoch": 812} {"train_loss": -38.81922149658203, "global_step": 98361, "epoch": 812} {"train_loss": -38.6308708190918, "global_step": 98362, "epoch": 812} {"train_loss": -39.0188102722168, "global_step": 98363, "epoch": 812} {"train_loss": -38.896881103515625, "global_step": 98364, "epoch": 812} {"train_loss": -39.0090446472168, "global_step": 98365, "epoch": 812} {"train_loss": -38.747100830078125, "global_step": 98366, "epoch": 812} {"train_loss": -39.36719512939453, "global_step": 98367, "epoch": 812} {"train_loss": -38.669105529785156, "global_step": 98368, "epoch": 812} {"train_loss": -39.235511779785156, "global_step": 98369, "epoch": 812} {"train_loss": -38.827606201171875, "global_step": 98370, "epoch": 812} {"train_loss": -39.26548385620117, "global_step": 98371, "epoch": 812} {"train_loss": -38.02616842916189, "global_step": 98372, "epoch": 812, "val_loss": 2713475.5} {"train_loss": -39.34144973754883, "global_step": 98373, "epoch": 813} {"train_loss": -39.26525115966797, "global_step": 98374, "epoch": 813} {"train_loss": -39.73070526123047, "global_step": 98375, "epoch": 813} {"train_loss": -39.03311538696289, "global_step": 98376, "epoch": 813} {"train_loss": -39.11756134033203, "global_step": 98377, "epoch": 813} {"train_loss": -39.217159271240234, "global_step": 98378, "epoch": 813} {"train_loss": -38.844295501708984, "global_step": 98379, "epoch": 813} {"train_loss": -39.075443267822266, "global_step": 98380, "epoch": 813} {"train_loss": -37.61336898803711, "global_step": 98381, "epoch": 813} {"train_loss": -36.73147201538086, "global_step": 98382, "epoch": 813} {"train_loss": -38.33213424682617, "global_step": 98383, "epoch": 813} {"train_loss": -38.535064697265625, "global_step": 98384, "epoch": 813} {"train_loss": -37.53011703491211, "global_step": 98385, "epoch": 813} {"train_loss": -37.273223876953125, "global_step": 98386, "epoch": 813} {"train_loss": -38.96035385131836, "global_step": 98387, "epoch": 813} {"train_loss": -38.47502899169922, "global_step": 98388, "epoch": 813} {"train_loss": -37.51573944091797, "global_step": 98389, "epoch": 813} {"train_loss": -37.937843322753906, "global_step": 98390, "epoch": 813} {"train_loss": -39.11295700073242, "global_step": 98391, "epoch": 813} {"train_loss": -39.112220764160156, "global_step": 98392, "epoch": 813} {"train_loss": -38.134212493896484, "global_step": 98393, "epoch": 813} {"train_loss": -38.78084182739258, "global_step": 98394, "epoch": 813} {"train_loss": -39.14052963256836, "global_step": 98395, "epoch": 813} {"train_loss": -38.3509407043457, "global_step": 98396, "epoch": 813} {"train_loss": -38.462677001953125, "global_step": 98397, "epoch": 813} {"train_loss": -38.9429817199707, "global_step": 98398, "epoch": 813} {"train_loss": -37.19211959838867, "global_step": 98399, "epoch": 813} {"train_loss": -38.2568359375, "global_step": 98400, "epoch": 813} {"train_loss": -39.0044059753418, "global_step": 98401, "epoch": 813} {"train_loss": -38.46529769897461, "global_step": 98402, "epoch": 813} {"train_loss": -37.745994567871094, "global_step": 98403, "epoch": 813} {"train_loss": -39.260379791259766, "global_step": 98404, "epoch": 813} {"train_loss": -37.1913948059082, "global_step": 98405, "epoch": 813} {"train_loss": -38.131439208984375, "global_step": 98406, "epoch": 813} {"train_loss": -39.11460876464844, "global_step": 98407, "epoch": 813} {"train_loss": -37.40741729736328, "global_step": 98408, "epoch": 813} {"train_loss": -38.064453125, "global_step": 98409, "epoch": 813} {"train_loss": -38.218502044677734, "global_step": 98410, "epoch": 813} {"train_loss": -38.36167526245117, "global_step": 98411, "epoch": 813} {"train_loss": -37.29936981201172, "global_step": 98412, "epoch": 813} {"train_loss": -37.80720901489258, "global_step": 98413, "epoch": 813} {"train_loss": -38.75690841674805, "global_step": 98414, "epoch": 813} {"train_loss": -37.765777587890625, "global_step": 98415, "epoch": 813} {"train_loss": -38.01570129394531, "global_step": 98416, "epoch": 813} {"train_loss": -38.594764709472656, "global_step": 98417, "epoch": 813} {"train_loss": -38.674468994140625, "global_step": 98418, "epoch": 813} {"train_loss": -38.913719177246094, "global_step": 98419, "epoch": 813} {"train_loss": -38.49460983276367, "global_step": 98420, "epoch": 813} {"train_loss": -38.87214660644531, "global_step": 98421, "epoch": 813} {"train_loss": -39.18455123901367, "global_step": 98422, "epoch": 813} {"train_loss": -39.109107971191406, "global_step": 98423, "epoch": 813} {"train_loss": -38.370819091796875, "global_step": 98424, "epoch": 813} {"train_loss": -39.43807601928711, "global_step": 98425, "epoch": 813} {"train_loss": -38.91958236694336, "global_step": 98426, "epoch": 813} {"train_loss": -37.85151290893555, "global_step": 98427, "epoch": 813} {"train_loss": -38.844520568847656, "global_step": 98428, "epoch": 813} {"train_loss": -38.17090606689453, "global_step": 98429, "epoch": 813} {"train_loss": -38.97883224487305, "global_step": 98430, "epoch": 813} {"train_loss": -39.003353118896484, "global_step": 98431, "epoch": 813} {"train_loss": -38.73586654663086, "global_step": 98432, "epoch": 813} {"train_loss": -38.915565490722656, "global_step": 98433, "epoch": 813} {"train_loss": -37.89392852783203, "global_step": 98434, "epoch": 813} {"train_loss": -38.32503128051758, "global_step": 98435, "epoch": 813} {"train_loss": -38.70465850830078, "global_step": 98436, "epoch": 813} {"train_loss": -38.67920684814453, "global_step": 98437, "epoch": 813} {"train_loss": -38.598915100097656, "global_step": 98438, "epoch": 813} {"train_loss": -38.505043029785156, "global_step": 98439, "epoch": 813} {"train_loss": -37.99143600463867, "global_step": 98440, "epoch": 813} {"train_loss": -39.60907745361328, "global_step": 98441, "epoch": 813} {"train_loss": -39.048030853271484, "global_step": 98442, "epoch": 813} {"train_loss": -39.133541107177734, "global_step": 98443, "epoch": 813} {"train_loss": -39.40378952026367, "global_step": 98444, "epoch": 813} {"train_loss": -38.77683639526367, "global_step": 98445, "epoch": 813} {"train_loss": -38.955596923828125, "global_step": 98446, "epoch": 813} {"train_loss": -39.40061950683594, "global_step": 98447, "epoch": 813} {"train_loss": -39.490821838378906, "global_step": 98448, "epoch": 813} {"train_loss": -39.56000518798828, "global_step": 98449, "epoch": 813} {"train_loss": -39.493247985839844, "global_step": 98450, "epoch": 813} {"train_loss": -39.28485870361328, "global_step": 98451, "epoch": 813} {"train_loss": -39.121788024902344, "global_step": 98452, "epoch": 813} {"train_loss": -39.56331253051758, "global_step": 98453, "epoch": 813} {"train_loss": -39.25457763671875, "global_step": 98454, "epoch": 813} {"train_loss": -39.27310562133789, "global_step": 98455, "epoch": 813} {"train_loss": -39.94379806518555, "global_step": 98456, "epoch": 813} {"train_loss": -39.78339385986328, "global_step": 98457, "epoch": 813} {"train_loss": -39.201515197753906, "global_step": 98458, "epoch": 813} {"train_loss": -39.63922882080078, "global_step": 98459, "epoch": 813} {"train_loss": -38.90435028076172, "global_step": 98460, "epoch": 813} {"train_loss": -38.60786056518555, "global_step": 98461, "epoch": 813} {"train_loss": -38.36377716064453, "global_step": 98462, "epoch": 813} {"train_loss": -38.8074836730957, "global_step": 98463, "epoch": 813} {"train_loss": -39.351131439208984, "global_step": 98464, "epoch": 813} {"train_loss": -39.78779220581055, "global_step": 98465, "epoch": 813} {"train_loss": -38.33144760131836, "global_step": 98466, "epoch": 813} {"train_loss": -35.02338409423828, "global_step": 98467, "epoch": 813} {"train_loss": -34.81895065307617, "global_step": 98468, "epoch": 813} {"train_loss": -39.451908111572266, "global_step": 98469, "epoch": 813} {"train_loss": -35.66254806518555, "global_step": 98470, "epoch": 813} {"train_loss": -33.4223747253418, "global_step": 98471, "epoch": 813} {"train_loss": -38.31523132324219, "global_step": 98472, "epoch": 813} {"train_loss": -39.09497833251953, "global_step": 98473, "epoch": 813} {"train_loss": -36.66156768798828, "global_step": 98474, "epoch": 813} {"train_loss": -38.25222396850586, "global_step": 98475, "epoch": 813} {"train_loss": -39.07563018798828, "global_step": 98476, "epoch": 813} {"train_loss": -37.91408920288086, "global_step": 98477, "epoch": 813} {"train_loss": -39.04339599609375, "global_step": 98478, "epoch": 813} {"train_loss": -38.37483596801758, "global_step": 98479, "epoch": 813} {"train_loss": -37.66611099243164, "global_step": 98480, "epoch": 813} {"train_loss": -38.736785888671875, "global_step": 98481, "epoch": 813} {"train_loss": -38.8928337097168, "global_step": 98482, "epoch": 813} {"train_loss": -39.05870056152344, "global_step": 98483, "epoch": 813} {"train_loss": -38.17033004760742, "global_step": 98484, "epoch": 813} {"train_loss": -39.37907791137695, "global_step": 98485, "epoch": 813} {"train_loss": -38.264808654785156, "global_step": 98486, "epoch": 813} {"train_loss": -38.56534957885742, "global_step": 98487, "epoch": 813} {"train_loss": -39.17770004272461, "global_step": 98488, "epoch": 813} {"train_loss": -39.15615463256836, "global_step": 98489, "epoch": 813} {"train_loss": -38.945735931396484, "global_step": 98490, "epoch": 813} {"train_loss": -39.054256439208984, "global_step": 98491, "epoch": 813} {"train_loss": -39.02811813354492, "global_step": 98492, "epoch": 813} {"train_loss": -38.54667096098593, "global_step": 98493, "epoch": 813, "val_loss": 2600354.5} {"train_loss": -38.5037956237793, "global_step": 98494, "epoch": 814} {"train_loss": -38.728759765625, "global_step": 98495, "epoch": 814} {"train_loss": -39.401763916015625, "global_step": 98496, "epoch": 814} {"train_loss": -38.94757843017578, "global_step": 98497, "epoch": 814} {"train_loss": -39.133358001708984, "global_step": 98498, "epoch": 814} {"train_loss": -37.783447265625, "global_step": 98499, "epoch": 814} {"train_loss": -38.66318893432617, "global_step": 98500, "epoch": 814} {"train_loss": -38.63360595703125, "global_step": 98501, "epoch": 814} {"train_loss": -38.433929443359375, "global_step": 98502, "epoch": 814} {"train_loss": -37.51389694213867, "global_step": 98503, "epoch": 814} {"train_loss": -37.76116180419922, "global_step": 98504, "epoch": 814} {"train_loss": -39.07643508911133, "global_step": 98505, "epoch": 814} {"train_loss": -38.990726470947266, "global_step": 98506, "epoch": 814} {"train_loss": -36.6706428527832, "global_step": 98507, "epoch": 814} {"train_loss": -37.539588928222656, "global_step": 98508, "epoch": 814} {"train_loss": -38.72711181640625, "global_step": 98509, "epoch": 814} {"train_loss": -38.41679000854492, "global_step": 98510, "epoch": 814} {"train_loss": -38.60783767700195, "global_step": 98511, "epoch": 814} {"train_loss": -38.592071533203125, "global_step": 98512, "epoch": 814} {"train_loss": -38.61842727661133, "global_step": 98513, "epoch": 814} {"train_loss": -38.78230667114258, "global_step": 98514, "epoch": 814} {"train_loss": -39.272743225097656, "global_step": 98515, "epoch": 814} {"train_loss": -38.95908737182617, "global_step": 98516, "epoch": 814} {"train_loss": -39.06864929199219, "global_step": 98517, "epoch": 814} {"train_loss": -39.332862854003906, "global_step": 98518, "epoch": 814} {"train_loss": -39.24247360229492, "global_step": 98519, "epoch": 814} {"train_loss": -38.73746871948242, "global_step": 98520, "epoch": 814} {"train_loss": -38.89419174194336, "global_step": 98521, "epoch": 814} {"train_loss": -37.33231735229492, "global_step": 98522, "epoch": 814} {"train_loss": -39.04130172729492, "global_step": 98523, "epoch": 814} {"train_loss": -38.4930305480957, "global_step": 98524, "epoch": 814} {"train_loss": -37.04566192626953, "global_step": 98525, "epoch": 814} {"train_loss": -38.728973388671875, "global_step": 98526, "epoch": 814} {"train_loss": -37.476837158203125, "global_step": 98527, "epoch": 814} {"train_loss": -37.74955368041992, "global_step": 98528, "epoch": 814} {"train_loss": -38.43130874633789, "global_step": 98529, "epoch": 814} {"train_loss": -37.488990783691406, "global_step": 98530, "epoch": 814} {"train_loss": -39.62956619262695, "global_step": 98531, "epoch": 814} {"train_loss": -37.901180267333984, "global_step": 98532, "epoch": 814} {"train_loss": -36.134464263916016, "global_step": 98533, "epoch": 814} {"train_loss": -37.544193267822266, "global_step": 98534, "epoch": 814} {"train_loss": -38.461769104003906, "global_step": 98535, "epoch": 814} {"train_loss": -36.7963752746582, "global_step": 98536, "epoch": 814} {"train_loss": -36.279449462890625, "global_step": 98537, "epoch": 814} {"train_loss": -37.55562210083008, "global_step": 98538, "epoch": 814} {"train_loss": -33.80453109741211, "global_step": 98539, "epoch": 814} {"train_loss": -34.267189025878906, "global_step": 98540, "epoch": 814} {"train_loss": -36.71443557739258, "global_step": 98541, "epoch": 814} {"train_loss": -35.45685958862305, "global_step": 98542, "epoch": 814} {"train_loss": -36.76798629760742, "global_step": 98543, "epoch": 814} {"train_loss": -36.32374954223633, "global_step": 98544, "epoch": 814} {"train_loss": -37.20298385620117, "global_step": 98545, "epoch": 814} {"train_loss": -36.552860260009766, "global_step": 98546, "epoch": 814} {"train_loss": -37.80438995361328, "global_step": 98547, "epoch": 814} {"train_loss": -37.51569366455078, "global_step": 98548, "epoch": 814} {"train_loss": -36.997459411621094, "global_step": 98549, "epoch": 814} {"train_loss": -38.7773551940918, "global_step": 98550, "epoch": 814} {"train_loss": -37.08759689331055, "global_step": 98551, "epoch": 814} {"train_loss": -36.98889923095703, "global_step": 98552, "epoch": 814} {"train_loss": -36.12984085083008, "global_step": 98553, "epoch": 814} {"train_loss": -35.00554275512695, "global_step": 98554, "epoch": 814} {"train_loss": -36.37504577636719, "global_step": 98555, "epoch": 814} {"train_loss": -36.354740142822266, "global_step": 98556, "epoch": 814} {"train_loss": -34.01430892944336, "global_step": 98557, "epoch": 814} {"train_loss": -35.991249084472656, "global_step": 98558, "epoch": 814} {"train_loss": -35.86434555053711, "global_step": 98559, "epoch": 814} {"train_loss": -35.58521270751953, "global_step": 98560, "epoch": 814} {"train_loss": -34.276973724365234, "global_step": 98561, "epoch": 814} {"train_loss": -34.608795166015625, "global_step": 98562, "epoch": 814} {"train_loss": -35.89872360229492, "global_step": 98563, "epoch": 814} {"train_loss": -35.78221130371094, "global_step": 98564, "epoch": 814} {"train_loss": -35.86692810058594, "global_step": 98565, "epoch": 814} {"train_loss": -36.668025970458984, "global_step": 98566, "epoch": 814} {"train_loss": -36.16835021972656, "global_step": 98567, "epoch": 814} {"train_loss": -37.38443374633789, "global_step": 98568, "epoch": 814} {"train_loss": -35.730873107910156, "global_step": 98569, "epoch": 814} {"train_loss": -37.60772705078125, "global_step": 98570, "epoch": 814} {"train_loss": -36.36701202392578, "global_step": 98571, "epoch": 814} {"train_loss": -37.29623031616211, "global_step": 98572, "epoch": 814} {"train_loss": -37.38296890258789, "global_step": 98573, "epoch": 814} {"train_loss": -37.63193130493164, "global_step": 98574, "epoch": 814} {"train_loss": -37.71272659301758, "global_step": 98575, "epoch": 814} {"train_loss": -38.0337028503418, "global_step": 98576, "epoch": 814} {"train_loss": -37.5903434753418, "global_step": 98577, "epoch": 814} {"train_loss": -37.47650909423828, "global_step": 98578, "epoch": 814} {"train_loss": -37.46609115600586, "global_step": 98579, "epoch": 814} {"train_loss": -37.84090805053711, "global_step": 98580, "epoch": 814} {"train_loss": -37.952911376953125, "global_step": 98581, "epoch": 814} {"train_loss": -38.151832580566406, "global_step": 98582, "epoch": 814} {"train_loss": -37.93256759643555, "global_step": 98583, "epoch": 814} {"train_loss": -38.092681884765625, "global_step": 98584, "epoch": 814} {"train_loss": -38.7348518371582, "global_step": 98585, "epoch": 814} {"train_loss": -38.45600509643555, "global_step": 98586, "epoch": 814} {"train_loss": -38.588172912597656, "global_step": 98587, "epoch": 814} {"train_loss": -38.68134689331055, "global_step": 98588, "epoch": 814} {"train_loss": -38.83787536621094, "global_step": 98589, "epoch": 814} {"train_loss": -38.794673919677734, "global_step": 98590, "epoch": 814} {"train_loss": -38.999755859375, "global_step": 98591, "epoch": 814} {"train_loss": -38.623714447021484, "global_step": 98592, "epoch": 814} {"train_loss": -38.91669464111328, "global_step": 98593, "epoch": 814} {"train_loss": -38.799781799316406, "global_step": 98594, "epoch": 814} {"train_loss": -38.941009521484375, "global_step": 98595, "epoch": 814} {"train_loss": -38.779380798339844, "global_step": 98596, "epoch": 814} {"train_loss": -38.9154052734375, "global_step": 98597, "epoch": 814} {"train_loss": -38.92903518676758, "global_step": 98598, "epoch": 814} {"train_loss": -39.358154296875, "global_step": 98599, "epoch": 814} {"train_loss": -39.14154052734375, "global_step": 98600, "epoch": 814} {"train_loss": -40.06014633178711, "global_step": 98601, "epoch": 814} {"train_loss": -39.26441192626953, "global_step": 98602, "epoch": 814} {"train_loss": -39.629859924316406, "global_step": 98603, "epoch": 814} {"train_loss": -39.504425048828125, "global_step": 98604, "epoch": 814} {"train_loss": -39.591087341308594, "global_step": 98605, "epoch": 814} {"train_loss": -39.80495071411133, "global_step": 98606, "epoch": 814} {"train_loss": -39.3974609375, "global_step": 98607, "epoch": 814} {"train_loss": -39.7098503112793, "global_step": 98608, "epoch": 814} {"train_loss": -39.683876037597656, "global_step": 98609, "epoch": 814} {"train_loss": -39.618751525878906, "global_step": 98610, "epoch": 814} {"train_loss": -39.4653434753418, "global_step": 98611, "epoch": 814} {"train_loss": -39.962158203125, "global_step": 98612, "epoch": 814} {"train_loss": -40.06892013549805, "global_step": 98613, "epoch": 814} {"train_loss": -37.88874274640044, "global_step": 98614, "epoch": 814, "val_loss": 2679552.25} {"train_loss": -39.821590423583984, "global_step": 98615, "epoch": 815} {"train_loss": -39.43126678466797, "global_step": 98616, "epoch": 815} {"train_loss": -39.7429313659668, "global_step": 98617, "epoch": 815} {"train_loss": -39.94578170776367, "global_step": 98618, "epoch": 815} {"train_loss": -40.14278030395508, "global_step": 98619, "epoch": 815} {"train_loss": -39.50738525390625, "global_step": 98620, "epoch": 815} {"train_loss": -39.30781173706055, "global_step": 98621, "epoch": 815} {"train_loss": -39.5194091796875, "global_step": 98622, "epoch": 815} {"train_loss": -39.817832946777344, "global_step": 98623, "epoch": 815} {"train_loss": -40.00042724609375, "global_step": 98624, "epoch": 815} {"train_loss": -40.02180099487305, "global_step": 98625, "epoch": 815} {"train_loss": -40.365447998046875, "global_step": 98626, "epoch": 815} {"train_loss": -40.043373107910156, "global_step": 98627, "epoch": 815} {"train_loss": -40.305049896240234, "global_step": 98628, "epoch": 815} {"train_loss": -40.179866790771484, "global_step": 98629, "epoch": 815} {"train_loss": -39.79313659667969, "global_step": 98630, "epoch": 815} {"train_loss": -39.514251708984375, "global_step": 98631, "epoch": 815} {"train_loss": -39.4442138671875, "global_step": 98632, "epoch": 815} {"train_loss": -39.516578674316406, "global_step": 98633, "epoch": 815} {"train_loss": -39.42115020751953, "global_step": 98634, "epoch": 815} {"train_loss": -39.8082389831543, "global_step": 98635, "epoch": 815} {"train_loss": -39.83540725708008, "global_step": 98636, "epoch": 815} {"train_loss": -40.326595306396484, "global_step": 98637, "epoch": 815} {"train_loss": -39.891597747802734, "global_step": 98638, "epoch": 815} {"train_loss": -39.79560852050781, "global_step": 98639, "epoch": 815} {"train_loss": -38.56327438354492, "global_step": 98640, "epoch": 815} {"train_loss": -37.09577178955078, "global_step": 98641, "epoch": 815} {"train_loss": -32.1536865234375, "global_step": 98642, "epoch": 815} {"train_loss": -31.15919303894043, "global_step": 98643, "epoch": 815} {"train_loss": -33.82161331176758, "global_step": 98644, "epoch": 815} {"train_loss": -34.81354522705078, "global_step": 98645, "epoch": 815} {"train_loss": -34.02705001831055, "global_step": 98646, "epoch": 815} {"train_loss": -34.26096725463867, "global_step": 98647, "epoch": 815} {"train_loss": -33.42533493041992, "global_step": 98648, "epoch": 815} {"train_loss": -34.2453727722168, "global_step": 98649, "epoch": 815} {"train_loss": -34.64154815673828, "global_step": 98650, "epoch": 815} {"train_loss": -34.065711975097656, "global_step": 98651, "epoch": 815} {"train_loss": -35.774166107177734, "global_step": 98652, "epoch": 815} {"train_loss": -34.6887321472168, "global_step": 98653, "epoch": 815} {"train_loss": -35.55678176879883, "global_step": 98654, "epoch": 815} {"train_loss": -36.51607131958008, "global_step": 98655, "epoch": 815} {"train_loss": -36.26252365112305, "global_step": 98656, "epoch": 815} {"train_loss": -37.29121017456055, "global_step": 98657, "epoch": 815} {"train_loss": -38.1436653137207, "global_step": 98658, "epoch": 815} {"train_loss": -36.289424896240234, "global_step": 98659, "epoch": 815} {"train_loss": -37.14774703979492, "global_step": 98660, "epoch": 815} {"train_loss": -36.3004264831543, "global_step": 98661, "epoch": 815} {"train_loss": -37.082820892333984, "global_step": 98662, "epoch": 815} {"train_loss": -37.982872009277344, "global_step": 98663, "epoch": 815} {"train_loss": -36.953975677490234, "global_step": 98664, "epoch": 815} {"train_loss": -36.528709411621094, "global_step": 98665, "epoch": 815} {"train_loss": -37.35765075683594, "global_step": 98666, "epoch": 815} {"train_loss": -35.8012580871582, "global_step": 98667, "epoch": 815} {"train_loss": -37.93537139892578, "global_step": 98668, "epoch": 815} {"train_loss": -37.576698303222656, "global_step": 98669, "epoch": 815} {"train_loss": -35.13020706176758, "global_step": 98670, "epoch": 815} {"train_loss": -36.2985954284668, "global_step": 98671, "epoch": 815} {"train_loss": -36.24169921875, "global_step": 98672, "epoch": 815} {"train_loss": -36.22829818725586, "global_step": 98673, "epoch": 815} {"train_loss": -34.958343505859375, "global_step": 98674, "epoch": 815} {"train_loss": -35.92784881591797, "global_step": 98675, "epoch": 815} {"train_loss": -37.94959259033203, "global_step": 98676, "epoch": 815} {"train_loss": -37.36188507080078, "global_step": 98677, "epoch": 815} {"train_loss": -35.524105072021484, "global_step": 98678, "epoch": 815} {"train_loss": -37.09993362426758, "global_step": 98679, "epoch": 815} {"train_loss": -37.570159912109375, "global_step": 98680, "epoch": 815} {"train_loss": -38.300804138183594, "global_step": 98681, "epoch": 815} {"train_loss": -38.42401885986328, "global_step": 98682, "epoch": 815} {"train_loss": -38.28110885620117, "global_step": 98683, "epoch": 815} {"train_loss": -38.43307876586914, "global_step": 98684, "epoch": 815} {"train_loss": -38.40131759643555, "global_step": 98685, "epoch": 815} {"train_loss": -38.26287841796875, "global_step": 98686, "epoch": 815} {"train_loss": -37.41496658325195, "global_step": 98687, "epoch": 815} {"train_loss": -38.95024871826172, "global_step": 98688, "epoch": 815} {"train_loss": -38.64198684692383, "global_step": 98689, "epoch": 815} {"train_loss": -38.79911422729492, "global_step": 98690, "epoch": 815} {"train_loss": -38.92470169067383, "global_step": 98691, "epoch": 815} {"train_loss": -39.28715896606445, "global_step": 98692, "epoch": 815} {"train_loss": -38.34204864501953, "global_step": 98693, "epoch": 815} {"train_loss": -38.394561767578125, "global_step": 98694, "epoch": 815} {"train_loss": -38.4034309387207, "global_step": 98695, "epoch": 815} {"train_loss": -37.057037353515625, "global_step": 98696, "epoch": 815} {"train_loss": -38.44526290893555, "global_step": 98697, "epoch": 815} {"train_loss": -38.660926818847656, "global_step": 98698, "epoch": 815} {"train_loss": -39.2550163269043, "global_step": 98699, "epoch": 815} {"train_loss": -38.45344924926758, "global_step": 98700, "epoch": 815} {"train_loss": -38.23762893676758, "global_step": 98701, "epoch": 815} {"train_loss": -37.82916259765625, "global_step": 98702, "epoch": 815} {"train_loss": -38.6344108581543, "global_step": 98703, "epoch": 815} {"train_loss": -38.6519889831543, "global_step": 98704, "epoch": 815} {"train_loss": -37.10485076904297, "global_step": 98705, "epoch": 815} {"train_loss": -36.3387336730957, "global_step": 98706, "epoch": 815} {"train_loss": -36.66457748413086, "global_step": 98707, "epoch": 815} {"train_loss": -37.29867935180664, "global_step": 98708, "epoch": 815} {"train_loss": -39.00041961669922, "global_step": 98709, "epoch": 815} {"train_loss": -37.88737869262695, "global_step": 98710, "epoch": 815} {"train_loss": -37.73870086669922, "global_step": 98711, "epoch": 815} {"train_loss": -37.81573486328125, "global_step": 98712, "epoch": 815} {"train_loss": -37.66652297973633, "global_step": 98713, "epoch": 815} {"train_loss": -37.9332389831543, "global_step": 98714, "epoch": 815} {"train_loss": -37.832271575927734, "global_step": 98715, "epoch": 815} {"train_loss": -38.11503219604492, "global_step": 98716, "epoch": 815} {"train_loss": -38.310882568359375, "global_step": 98717, "epoch": 815} {"train_loss": -37.98368453979492, "global_step": 98718, "epoch": 815} {"train_loss": -38.1096076965332, "global_step": 98719, "epoch": 815} {"train_loss": -38.62405014038086, "global_step": 98720, "epoch": 815} {"train_loss": -38.23945236206055, "global_step": 98721, "epoch": 815} {"train_loss": -38.78179931640625, "global_step": 98722, "epoch": 815} {"train_loss": -38.796043395996094, "global_step": 98723, "epoch": 815} {"train_loss": -38.077857971191406, "global_step": 98724, "epoch": 815} {"train_loss": -39.16999435424805, "global_step": 98725, "epoch": 815} {"train_loss": -39.219722747802734, "global_step": 98726, "epoch": 815} {"train_loss": -38.41569900512695, "global_step": 98727, "epoch": 815} {"train_loss": -38.95573806762695, "global_step": 98728, "epoch": 815} {"train_loss": -38.76573944091797, "global_step": 98729, "epoch": 815} {"train_loss": -39.117347717285156, "global_step": 98730, "epoch": 815} {"train_loss": -38.6021842956543, "global_step": 98731, "epoch": 815} {"train_loss": -38.747467041015625, "global_step": 98732, "epoch": 815} {"train_loss": -38.8289794921875, "global_step": 98733, "epoch": 815} {"train_loss": -38.318233489990234, "global_step": 98734, "epoch": 815} {"train_loss": -37.823519005263144, "global_step": 98735, "epoch": 815, "val_loss": 2662010.0} {"train_loss": -37.64616012573242, "global_step": 98736, "epoch": 816} {"train_loss": -39.37238693237305, "global_step": 98737, "epoch": 816} {"train_loss": -38.23153305053711, "global_step": 98738, "epoch": 816} {"train_loss": -38.4953498840332, "global_step": 98739, "epoch": 816} {"train_loss": -39.234745025634766, "global_step": 98740, "epoch": 816} {"train_loss": -38.43928909301758, "global_step": 98741, "epoch": 816} {"train_loss": -38.811737060546875, "global_step": 98742, "epoch": 816} {"train_loss": -39.034881591796875, "global_step": 98743, "epoch": 816} {"train_loss": -38.681617736816406, "global_step": 98744, "epoch": 816} {"train_loss": -38.50944137573242, "global_step": 98745, "epoch": 816} {"train_loss": -39.32418441772461, "global_step": 98746, "epoch": 816} {"train_loss": -38.63772201538086, "global_step": 98747, "epoch": 816} {"train_loss": -39.05136489868164, "global_step": 98748, "epoch": 816} {"train_loss": -39.255126953125, "global_step": 98749, "epoch": 816} {"train_loss": -38.71999740600586, "global_step": 98750, "epoch": 816} {"train_loss": -39.20044708251953, "global_step": 98751, "epoch": 816} {"train_loss": -39.82666015625, "global_step": 98752, "epoch": 816} {"train_loss": -38.98667526245117, "global_step": 98753, "epoch": 816} {"train_loss": -39.26241683959961, "global_step": 98754, "epoch": 816} {"train_loss": -39.340145111083984, "global_step": 98755, "epoch": 816} {"train_loss": -39.29685592651367, "global_step": 98756, "epoch": 816} {"train_loss": -39.01040267944336, "global_step": 98757, "epoch": 816} {"train_loss": -39.59702682495117, "global_step": 98758, "epoch": 816} {"train_loss": -38.82912826538086, "global_step": 98759, "epoch": 816} {"train_loss": -38.96342086791992, "global_step": 98760, "epoch": 816} {"train_loss": -39.463802337646484, "global_step": 98761, "epoch": 816} {"train_loss": -39.30947494506836, "global_step": 98762, "epoch": 816} {"train_loss": -38.99518966674805, "global_step": 98763, "epoch": 816} {"train_loss": -39.55472946166992, "global_step": 98764, "epoch": 816} {"train_loss": -38.92512130737305, "global_step": 98765, "epoch": 816} {"train_loss": -38.93024826049805, "global_step": 98766, "epoch": 816} {"train_loss": -38.98373031616211, "global_step": 98767, "epoch": 816} {"train_loss": -38.605690002441406, "global_step": 98768, "epoch": 816} {"train_loss": -38.21059799194336, "global_step": 98769, "epoch": 816} {"train_loss": -37.69917297363281, "global_step": 98770, "epoch": 816} {"train_loss": -37.81760787963867, "global_step": 98771, "epoch": 816} {"train_loss": -37.51715850830078, "global_step": 98772, "epoch": 816} {"train_loss": -37.74998092651367, "global_step": 98773, "epoch": 816} {"train_loss": -39.5266227722168, "global_step": 98774, "epoch": 816} {"train_loss": -38.9472770690918, "global_step": 98775, "epoch": 816} {"train_loss": -38.80219650268555, "global_step": 98776, "epoch": 816} {"train_loss": -38.0303840637207, "global_step": 98777, "epoch": 816} {"train_loss": -38.881404876708984, "global_step": 98778, "epoch": 816} {"train_loss": -39.186153411865234, "global_step": 98779, "epoch": 816} {"train_loss": -39.47019577026367, "global_step": 98780, "epoch": 816} {"train_loss": -40.051475524902344, "global_step": 98781, "epoch": 816} {"train_loss": -39.65081024169922, "global_step": 98782, "epoch": 816} {"train_loss": -40.09236526489258, "global_step": 98783, "epoch": 816} {"train_loss": -39.90676498413086, "global_step": 98784, "epoch": 816} {"train_loss": -39.47457504272461, "global_step": 98785, "epoch": 816} {"train_loss": -39.520565032958984, "global_step": 98786, "epoch": 816} {"train_loss": -39.634403228759766, "global_step": 98787, "epoch": 816} {"train_loss": -39.63349151611328, "global_step": 98788, "epoch": 816} {"train_loss": -39.0428352355957, "global_step": 98789, "epoch": 816} {"train_loss": -39.5585823059082, "global_step": 98790, "epoch": 816} {"train_loss": -39.15074157714844, "global_step": 98791, "epoch": 816} {"train_loss": -38.36297607421875, "global_step": 98792, "epoch": 816} {"train_loss": -39.85065841674805, "global_step": 98793, "epoch": 816} {"train_loss": -39.26264953613281, "global_step": 98794, "epoch": 816} {"train_loss": -38.82510757446289, "global_step": 98795, "epoch": 816} {"train_loss": -37.95003128051758, "global_step": 98796, "epoch": 816} {"train_loss": -38.189430236816406, "global_step": 98797, "epoch": 816} {"train_loss": -38.955692291259766, "global_step": 98798, "epoch": 816} {"train_loss": -38.90789794921875, "global_step": 98799, "epoch": 816} {"train_loss": -37.912139892578125, "global_step": 98800, "epoch": 816} {"train_loss": -37.47805404663086, "global_step": 98801, "epoch": 816} {"train_loss": -40.042903900146484, "global_step": 98802, "epoch": 816} {"train_loss": -39.12496566772461, "global_step": 98803, "epoch": 816} {"train_loss": -37.98124694824219, "global_step": 98804, "epoch": 816} {"train_loss": -38.40772247314453, "global_step": 98805, "epoch": 816} {"train_loss": -38.30165481567383, "global_step": 98806, "epoch": 816} {"train_loss": -36.61508560180664, "global_step": 98807, "epoch": 816} {"train_loss": -38.895904541015625, "global_step": 98808, "epoch": 816} {"train_loss": -38.169464111328125, "global_step": 98809, "epoch": 816} {"train_loss": -37.7772216796875, "global_step": 98810, "epoch": 816} {"train_loss": -39.354766845703125, "global_step": 98811, "epoch": 816} {"train_loss": -37.66958999633789, "global_step": 98812, "epoch": 816} {"train_loss": -37.88362121582031, "global_step": 98813, "epoch": 816} {"train_loss": -38.96806716918945, "global_step": 98814, "epoch": 816} {"train_loss": -38.3939094543457, "global_step": 98815, "epoch": 816} {"train_loss": -39.09351348876953, "global_step": 98816, "epoch": 816} {"train_loss": -38.12848663330078, "global_step": 98817, "epoch": 816} {"train_loss": -38.530696868896484, "global_step": 98818, "epoch": 816} {"train_loss": -38.464271545410156, "global_step": 98819, "epoch": 816} {"train_loss": -39.49300765991211, "global_step": 98820, "epoch": 816} {"train_loss": -38.361934661865234, "global_step": 98821, "epoch": 816} {"train_loss": -39.16058349609375, "global_step": 98822, "epoch": 816} {"train_loss": -37.595272064208984, "global_step": 98823, "epoch": 816} {"train_loss": -39.209285736083984, "global_step": 98824, "epoch": 816} {"train_loss": -38.79106521606445, "global_step": 98825, "epoch": 816} {"train_loss": -37.87629318237305, "global_step": 98826, "epoch": 816} {"train_loss": -36.85525131225586, "global_step": 98827, "epoch": 816} {"train_loss": -37.09008026123047, "global_step": 98828, "epoch": 816} {"train_loss": -38.36265182495117, "global_step": 98829, "epoch": 816} {"train_loss": -39.21684265136719, "global_step": 98830, "epoch": 816} {"train_loss": -37.16676712036133, "global_step": 98831, "epoch": 816} {"train_loss": -37.7843017578125, "global_step": 98832, "epoch": 816} {"train_loss": -39.23671340942383, "global_step": 98833, "epoch": 816} {"train_loss": -38.30134201049805, "global_step": 98834, "epoch": 816} {"train_loss": -38.6898078918457, "global_step": 98835, "epoch": 816} {"train_loss": -39.18683624267578, "global_step": 98836, "epoch": 816} {"train_loss": -38.775753021240234, "global_step": 98837, "epoch": 816} {"train_loss": -39.09127426147461, "global_step": 98838, "epoch": 816} {"train_loss": -38.545772552490234, "global_step": 98839, "epoch": 816} {"train_loss": -38.094093322753906, "global_step": 98840, "epoch": 816} {"train_loss": -39.06706619262695, "global_step": 98841, "epoch": 816} {"train_loss": -37.80757522583008, "global_step": 98842, "epoch": 816} {"train_loss": -37.213661193847656, "global_step": 98843, "epoch": 816} {"train_loss": -38.74129867553711, "global_step": 98844, "epoch": 816} {"train_loss": -37.29926300048828, "global_step": 98845, "epoch": 816} {"train_loss": -37.47464370727539, "global_step": 98846, "epoch": 816} {"train_loss": -39.243614196777344, "global_step": 98847, "epoch": 816} {"train_loss": -37.014198303222656, "global_step": 98848, "epoch": 816} {"train_loss": -38.61380386352539, "global_step": 98849, "epoch": 816} {"train_loss": -38.69721603393555, "global_step": 98850, "epoch": 816} {"train_loss": -37.6448860168457, "global_step": 98851, "epoch": 816} {"train_loss": -39.547332763671875, "global_step": 98852, "epoch": 816} {"train_loss": -38.88806915283203, "global_step": 98853, "epoch": 816} {"train_loss": -38.92375946044922, "global_step": 98854, "epoch": 816} {"train_loss": -38.724830627441406, "global_step": 98855, "epoch": 816} {"train_loss": -38.691022037474575, "global_step": 98856, "epoch": 816, "val_loss": 2635215.25} {"train_loss": -38.27845001220703, "global_step": 98857, "epoch": 817} {"train_loss": -38.26939010620117, "global_step": 98858, "epoch": 817} {"train_loss": -38.93920135498047, "global_step": 98859, "epoch": 817} {"train_loss": -36.888545989990234, "global_step": 98860, "epoch": 817} {"train_loss": -37.692657470703125, "global_step": 98861, "epoch": 817} {"train_loss": -36.94123458862305, "global_step": 98862, "epoch": 817} {"train_loss": -38.057220458984375, "global_step": 98863, "epoch": 817} {"train_loss": -37.20125961303711, "global_step": 98864, "epoch": 817} {"train_loss": -38.61503219604492, "global_step": 98865, "epoch": 817} {"train_loss": -38.44526290893555, "global_step": 98866, "epoch": 817} {"train_loss": -38.07666015625, "global_step": 98867, "epoch": 817} {"train_loss": -39.09803009033203, "global_step": 98868, "epoch": 817} {"train_loss": -38.07390213012695, "global_step": 98869, "epoch": 817} {"train_loss": -37.37224197387695, "global_step": 98870, "epoch": 817} {"train_loss": -37.869930267333984, "global_step": 98871, "epoch": 817} {"train_loss": -39.23505401611328, "global_step": 98872, "epoch": 817} {"train_loss": -37.022823333740234, "global_step": 98873, "epoch": 817} {"train_loss": -36.38165283203125, "global_step": 98874, "epoch": 817} {"train_loss": -37.99177169799805, "global_step": 98875, "epoch": 817} {"train_loss": -39.14602279663086, "global_step": 98876, "epoch": 817} {"train_loss": -36.53965377807617, "global_step": 98877, "epoch": 817} {"train_loss": -38.029457092285156, "global_step": 98878, "epoch": 817} {"train_loss": -37.87757110595703, "global_step": 98879, "epoch": 817} {"train_loss": -38.28815841674805, "global_step": 98880, "epoch": 817} {"train_loss": -39.14387893676758, "global_step": 98881, "epoch": 817} {"train_loss": -37.422271728515625, "global_step": 98882, "epoch": 817} {"train_loss": -37.34491729736328, "global_step": 98883, "epoch": 817} {"train_loss": -39.04536819458008, "global_step": 98884, "epoch": 817} {"train_loss": -39.59623336791992, "global_step": 98885, "epoch": 817} {"train_loss": -39.00654220581055, "global_step": 98886, "epoch": 817} {"train_loss": -38.777217864990234, "global_step": 98887, "epoch": 817} {"train_loss": -38.57456588745117, "global_step": 98888, "epoch": 817} {"train_loss": -39.04850387573242, "global_step": 98889, "epoch": 817} {"train_loss": -39.61122512817383, "global_step": 98890, "epoch": 817} {"train_loss": -39.48121643066406, "global_step": 98891, "epoch": 817} {"train_loss": -39.710269927978516, "global_step": 98892, "epoch": 817} {"train_loss": -39.41865158081055, "global_step": 98893, "epoch": 817} {"train_loss": -39.920902252197266, "global_step": 98894, "epoch": 817} {"train_loss": -39.35358810424805, "global_step": 98895, "epoch": 817} {"train_loss": -39.04280090332031, "global_step": 98896, "epoch": 817} {"train_loss": -39.48665237426758, "global_step": 98897, "epoch": 817} {"train_loss": -38.738643646240234, "global_step": 98898, "epoch": 817} {"train_loss": -39.6683464050293, "global_step": 98899, "epoch": 817} {"train_loss": -39.71055221557617, "global_step": 98900, "epoch": 817} {"train_loss": -39.35938262939453, "global_step": 98901, "epoch": 817} {"train_loss": -38.83846664428711, "global_step": 98902, "epoch": 817} {"train_loss": -38.71793746948242, "global_step": 98903, "epoch": 817} {"train_loss": -39.68620681762695, "global_step": 98904, "epoch": 817} {"train_loss": -39.0800666809082, "global_step": 98905, "epoch": 817} {"train_loss": -39.7518424987793, "global_step": 98906, "epoch": 817} {"train_loss": -39.47066116333008, "global_step": 98907, "epoch": 817} {"train_loss": -39.17204284667969, "global_step": 98908, "epoch": 817} {"train_loss": -39.30300521850586, "global_step": 98909, "epoch": 817} {"train_loss": -39.19939041137695, "global_step": 98910, "epoch": 817} {"train_loss": -38.58707809448242, "global_step": 98911, "epoch": 817} {"train_loss": -38.26129913330078, "global_step": 98912, "epoch": 817} {"train_loss": -38.943729400634766, "global_step": 98913, "epoch": 817} {"train_loss": -39.95284652709961, "global_step": 98914, "epoch": 817} {"train_loss": -39.36298370361328, "global_step": 98915, "epoch": 817} {"train_loss": -39.37110900878906, "global_step": 98916, "epoch": 817} {"train_loss": -38.97811508178711, "global_step": 98917, "epoch": 817} {"train_loss": -38.757301330566406, "global_step": 98918, "epoch": 817} {"train_loss": -38.46150588989258, "global_step": 98919, "epoch": 817} {"train_loss": -39.3736457824707, "global_step": 98920, "epoch": 817} {"train_loss": -39.821319580078125, "global_step": 98921, "epoch": 817} {"train_loss": -39.65279769897461, "global_step": 98922, "epoch": 817} {"train_loss": -39.211021423339844, "global_step": 98923, "epoch": 817} {"train_loss": -39.62870407104492, "global_step": 98924, "epoch": 817} {"train_loss": -39.4997673034668, "global_step": 98925, "epoch": 817} {"train_loss": -40.15290069580078, "global_step": 98926, "epoch": 817} {"train_loss": -39.14577865600586, "global_step": 98927, "epoch": 817} {"train_loss": -37.83170700073242, "global_step": 98928, "epoch": 817} {"train_loss": -37.30938720703125, "global_step": 98929, "epoch": 817} {"train_loss": -37.53911209106445, "global_step": 98930, "epoch": 817} {"train_loss": -38.95048141479492, "global_step": 98931, "epoch": 817} {"train_loss": -39.85921096801758, "global_step": 98932, "epoch": 817} {"train_loss": -39.897979736328125, "global_step": 98933, "epoch": 817} {"train_loss": -39.119449615478516, "global_step": 98934, "epoch": 817} {"train_loss": -39.34980010986328, "global_step": 98935, "epoch": 817} {"train_loss": -39.29944610595703, "global_step": 98936, "epoch": 817} {"train_loss": -39.57953643798828, "global_step": 98937, "epoch": 817} {"train_loss": -38.964351654052734, "global_step": 98938, "epoch": 817} {"train_loss": -39.102142333984375, "global_step": 98939, "epoch": 817} {"train_loss": -39.12238693237305, "global_step": 98940, "epoch": 817} {"train_loss": -38.53290939331055, "global_step": 98941, "epoch": 817} {"train_loss": -37.879207611083984, "global_step": 98942, "epoch": 817} {"train_loss": -38.965328216552734, "global_step": 98943, "epoch": 817} {"train_loss": -38.0367546081543, "global_step": 98944, "epoch": 817} {"train_loss": -39.33557891845703, "global_step": 98945, "epoch": 817} {"train_loss": -39.56638717651367, "global_step": 98946, "epoch": 817} {"train_loss": -39.184722900390625, "global_step": 98947, "epoch": 817} {"train_loss": -38.09712219238281, "global_step": 98948, "epoch": 817} {"train_loss": -38.35099411010742, "global_step": 98949, "epoch": 817} {"train_loss": -38.38629150390625, "global_step": 98950, "epoch": 817} {"train_loss": -38.41441345214844, "global_step": 98951, "epoch": 817} {"train_loss": -36.109046936035156, "global_step": 98952, "epoch": 817} {"train_loss": -37.62398147583008, "global_step": 98953, "epoch": 817} {"train_loss": -38.56817626953125, "global_step": 98954, "epoch": 817} {"train_loss": -38.57452392578125, "global_step": 98955, "epoch": 817} {"train_loss": -39.32275390625, "global_step": 98956, "epoch": 817} {"train_loss": -38.7709846496582, "global_step": 98957, "epoch": 817} {"train_loss": -38.447811126708984, "global_step": 98958, "epoch": 817} {"train_loss": -38.76386260986328, "global_step": 98959, "epoch": 817} {"train_loss": -38.489356994628906, "global_step": 98960, "epoch": 817} {"train_loss": -37.438720703125, "global_step": 98961, "epoch": 817} {"train_loss": -38.540794372558594, "global_step": 98962, "epoch": 817} {"train_loss": -39.431575775146484, "global_step": 98963, "epoch": 817} {"train_loss": -39.42206954956055, "global_step": 98964, "epoch": 817} {"train_loss": -38.447547912597656, "global_step": 98965, "epoch": 817} {"train_loss": -38.6480827331543, "global_step": 98966, "epoch": 817} {"train_loss": -39.43021774291992, "global_step": 98967, "epoch": 817} {"train_loss": -38.95974349975586, "global_step": 98968, "epoch": 817} {"train_loss": -38.72408676147461, "global_step": 98969, "epoch": 817} {"train_loss": -38.88896560668945, "global_step": 98970, "epoch": 817} {"train_loss": -39.7022705078125, "global_step": 98971, "epoch": 817} {"train_loss": -39.58187484741211, "global_step": 98972, "epoch": 817} {"train_loss": -39.28300857543945, "global_step": 98973, "epoch": 817} {"train_loss": -38.803497314453125, "global_step": 98974, "epoch": 817} {"train_loss": -38.7109489440918, "global_step": 98975, "epoch": 817} {"train_loss": -39.763099670410156, "global_step": 98976, "epoch": 817} {"train_loss": -38.764819689033445, "global_step": 98977, "epoch": 817, "val_loss": 2652750.25} {"train_loss": -38.73866653442383, "global_step": 98978, "epoch": 818} {"train_loss": -39.745521545410156, "global_step": 98979, "epoch": 818} {"train_loss": -38.75522994995117, "global_step": 98980, "epoch": 818} {"train_loss": -39.36270523071289, "global_step": 98981, "epoch": 818} {"train_loss": -39.2328987121582, "global_step": 98982, "epoch": 818} {"train_loss": -39.12405014038086, "global_step": 98983, "epoch": 818} {"train_loss": -38.98393630981445, "global_step": 98984, "epoch": 818} {"train_loss": -38.67853927612305, "global_step": 98985, "epoch": 818} {"train_loss": -38.58272933959961, "global_step": 98986, "epoch": 818} {"train_loss": -39.01961135864258, "global_step": 98987, "epoch": 818} {"train_loss": -39.193382263183594, "global_step": 98988, "epoch": 818} {"train_loss": -39.10154342651367, "global_step": 98989, "epoch": 818} {"train_loss": -39.176265716552734, "global_step": 98990, "epoch": 818} {"train_loss": -38.108741760253906, "global_step": 98991, "epoch": 818} {"train_loss": -38.85908889770508, "global_step": 98992, "epoch": 818} {"train_loss": -39.0643424987793, "global_step": 98993, "epoch": 818} {"train_loss": -37.848899841308594, "global_step": 98994, "epoch": 818} {"train_loss": -37.5677375793457, "global_step": 98995, "epoch": 818} {"train_loss": -36.53702926635742, "global_step": 98996, "epoch": 818} {"train_loss": -39.032501220703125, "global_step": 98997, "epoch": 818} {"train_loss": -39.134212493896484, "global_step": 98998, "epoch": 818} {"train_loss": -36.23077392578125, "global_step": 98999, "epoch": 818} {"train_loss": -37.88106918334961, "global_step": 99000, "epoch": 818} {"train_loss": -39.27486038208008, "global_step": 99001, "epoch": 818} {"train_loss": -39.1499137878418, "global_step": 99002, "epoch": 818} {"train_loss": -38.017333984375, "global_step": 99003, "epoch": 818} {"train_loss": -39.446449279785156, "global_step": 99004, "epoch": 818} {"train_loss": -39.16846466064453, "global_step": 99005, "epoch": 818} {"train_loss": -37.53435516357422, "global_step": 99006, "epoch": 818} {"train_loss": -37.306095123291016, "global_step": 99007, "epoch": 818} {"train_loss": -37.90730667114258, "global_step": 99008, "epoch": 818} {"train_loss": -35.72634506225586, "global_step": 99009, "epoch": 818} {"train_loss": -38.15327072143555, "global_step": 99010, "epoch": 818} {"train_loss": -39.5689697265625, "global_step": 99011, "epoch": 818} {"train_loss": -38.15439987182617, "global_step": 99012, "epoch": 818} {"train_loss": -37.26699447631836, "global_step": 99013, "epoch": 818} {"train_loss": -37.66814422607422, "global_step": 99014, "epoch": 818} {"train_loss": -38.876312255859375, "global_step": 99015, "epoch": 818} {"train_loss": -38.35797882080078, "global_step": 99016, "epoch": 818} {"train_loss": -36.261871337890625, "global_step": 99017, "epoch": 818} {"train_loss": -38.14990234375, "global_step": 99018, "epoch": 818} {"train_loss": -39.0081901550293, "global_step": 99019, "epoch": 818} {"train_loss": -37.592041015625, "global_step": 99020, "epoch": 818} {"train_loss": -38.1604118347168, "global_step": 99021, "epoch": 818} {"train_loss": -38.60015869140625, "global_step": 99022, "epoch": 818} {"train_loss": -39.29783630371094, "global_step": 99023, "epoch": 818} {"train_loss": -38.9971809387207, "global_step": 99024, "epoch": 818} {"train_loss": -39.15239715576172, "global_step": 99025, "epoch": 818} {"train_loss": -39.2852783203125, "global_step": 99026, "epoch": 818} {"train_loss": -39.064788818359375, "global_step": 99027, "epoch": 818} {"train_loss": -39.75527572631836, "global_step": 99028, "epoch": 818} {"train_loss": -39.43559646606445, "global_step": 99029, "epoch": 818} {"train_loss": -39.512840270996094, "global_step": 99030, "epoch": 818} {"train_loss": -39.46467208862305, "global_step": 99031, "epoch": 818} {"train_loss": -39.86188888549805, "global_step": 99032, "epoch": 818} {"train_loss": -39.64044952392578, "global_step": 99033, "epoch": 818} {"train_loss": -39.50513458251953, "global_step": 99034, "epoch": 818} {"train_loss": -39.69110870361328, "global_step": 99035, "epoch": 818} {"train_loss": -39.54616928100586, "global_step": 99036, "epoch": 818} {"train_loss": -39.9720458984375, "global_step": 99037, "epoch": 818} {"train_loss": -39.56012725830078, "global_step": 99038, "epoch": 818} {"train_loss": -39.35355758666992, "global_step": 99039, "epoch": 818} {"train_loss": -38.933345794677734, "global_step": 99040, "epoch": 818} {"train_loss": -38.874969482421875, "global_step": 99041, "epoch": 818} {"train_loss": -39.049190521240234, "global_step": 99042, "epoch": 818} {"train_loss": -38.69894027709961, "global_step": 99043, "epoch": 818} {"train_loss": -39.625511169433594, "global_step": 99044, "epoch": 818} {"train_loss": -38.594417572021484, "global_step": 99045, "epoch": 818} {"train_loss": -38.482051849365234, "global_step": 99046, "epoch": 818} {"train_loss": -39.85227966308594, "global_step": 99047, "epoch": 818} {"train_loss": -38.7015266418457, "global_step": 99048, "epoch": 818} {"train_loss": -38.37343215942383, "global_step": 99049, "epoch": 818} {"train_loss": -40.04761505126953, "global_step": 99050, "epoch": 818} {"train_loss": -38.16572189331055, "global_step": 99051, "epoch": 818} {"train_loss": -39.134944915771484, "global_step": 99052, "epoch": 818} {"train_loss": -38.794918060302734, "global_step": 99053, "epoch": 818} {"train_loss": -39.629310607910156, "global_step": 99054, "epoch": 818} {"train_loss": -39.409263610839844, "global_step": 99055, "epoch": 818} {"train_loss": -38.67017364501953, "global_step": 99056, "epoch": 818} {"train_loss": -39.19258499145508, "global_step": 99057, "epoch": 818} {"train_loss": -39.16180419921875, "global_step": 99058, "epoch": 818} {"train_loss": -39.36967849731445, "global_step": 99059, "epoch": 818} {"train_loss": -39.27958297729492, "global_step": 99060, "epoch": 818} {"train_loss": -38.35375213623047, "global_step": 99061, "epoch": 818} {"train_loss": -37.4307975769043, "global_step": 99062, "epoch": 818} {"train_loss": -38.940547943115234, "global_step": 99063, "epoch": 818} {"train_loss": -37.76268005371094, "global_step": 99064, "epoch": 818} {"train_loss": -37.364593505859375, "global_step": 99065, "epoch": 818} {"train_loss": -36.4430046081543, "global_step": 99066, "epoch": 818} {"train_loss": -37.17979049682617, "global_step": 99067, "epoch": 818} {"train_loss": -36.74033737182617, "global_step": 99068, "epoch": 818} {"train_loss": -37.207275390625, "global_step": 99069, "epoch": 818} {"train_loss": -37.92311477661133, "global_step": 99070, "epoch": 818} {"train_loss": -36.58842086791992, "global_step": 99071, "epoch": 818} {"train_loss": -37.164466857910156, "global_step": 99072, "epoch": 818} {"train_loss": -37.68940353393555, "global_step": 99073, "epoch": 818} {"train_loss": -38.81281280517578, "global_step": 99074, "epoch": 818} {"train_loss": -38.312721252441406, "global_step": 99075, "epoch": 818} {"train_loss": -38.9992790222168, "global_step": 99076, "epoch": 818} {"train_loss": -38.39632797241211, "global_step": 99077, "epoch": 818} {"train_loss": -38.569183349609375, "global_step": 99078, "epoch": 818} {"train_loss": -38.44025421142578, "global_step": 99079, "epoch": 818} {"train_loss": -38.38600540161133, "global_step": 99080, "epoch": 818} {"train_loss": -38.97037124633789, "global_step": 99081, "epoch": 818} {"train_loss": -38.91178894042969, "global_step": 99082, "epoch": 818} {"train_loss": -39.56331253051758, "global_step": 99083, "epoch": 818} {"train_loss": -39.774967193603516, "global_step": 99084, "epoch": 818} {"train_loss": -39.42228698730469, "global_step": 99085, "epoch": 818} {"train_loss": -39.51599884033203, "global_step": 99086, "epoch": 818} {"train_loss": -39.43952560424805, "global_step": 99087, "epoch": 818} {"train_loss": -39.3068962097168, "global_step": 99088, "epoch": 818} {"train_loss": -39.06043243408203, "global_step": 99089, "epoch": 818} {"train_loss": -39.47886276245117, "global_step": 99090, "epoch": 818} {"train_loss": -39.724063873291016, "global_step": 99091, "epoch": 818} {"train_loss": -39.31929397583008, "global_step": 99092, "epoch": 818} {"train_loss": -39.913204193115234, "global_step": 99093, "epoch": 818} {"train_loss": -39.5035400390625, "global_step": 99094, "epoch": 818} {"train_loss": -38.52901840209961, "global_step": 99095, "epoch": 818} {"train_loss": -38.89406967163086, "global_step": 99096, "epoch": 818} {"train_loss": -39.682491302490234, "global_step": 99097, "epoch": 818} {"train_loss": -38.70644599347075, "global_step": 99098, "epoch": 818, "val_loss": 2667773.25} {"train_loss": -38.77317428588867, "global_step": 99099, "epoch": 819} {"train_loss": -39.54246520996094, "global_step": 99100, "epoch": 819} {"train_loss": -39.713340759277344, "global_step": 99101, "epoch": 819} {"train_loss": -38.603759765625, "global_step": 99102, "epoch": 819} {"train_loss": -39.930335998535156, "global_step": 99103, "epoch": 819} {"train_loss": -39.10915756225586, "global_step": 99104, "epoch": 819} {"train_loss": -39.38434982299805, "global_step": 99105, "epoch": 819} {"train_loss": -39.526763916015625, "global_step": 99106, "epoch": 819} {"train_loss": -39.5910758972168, "global_step": 99107, "epoch": 819} {"train_loss": -39.443843841552734, "global_step": 99108, "epoch": 819} {"train_loss": -39.838714599609375, "global_step": 99109, "epoch": 819} {"train_loss": -39.15814971923828, "global_step": 99110, "epoch": 819} {"train_loss": -39.05802536010742, "global_step": 99111, "epoch": 819} {"train_loss": -39.32442855834961, "global_step": 99112, "epoch": 819} {"train_loss": -39.241817474365234, "global_step": 99113, "epoch": 819} {"train_loss": -38.918697357177734, "global_step": 99114, "epoch": 819} {"train_loss": -38.69116973876953, "global_step": 99115, "epoch": 819} {"train_loss": -39.77022933959961, "global_step": 99116, "epoch": 819} {"train_loss": -39.3443717956543, "global_step": 99117, "epoch": 819} {"train_loss": -37.45943832397461, "global_step": 99118, "epoch": 819} {"train_loss": -36.92414474487305, "global_step": 99119, "epoch": 819} {"train_loss": -38.43323516845703, "global_step": 99120, "epoch": 819} {"train_loss": -38.94572067260742, "global_step": 99121, "epoch": 819} {"train_loss": -37.78529357910156, "global_step": 99122, "epoch": 819} {"train_loss": -38.870941162109375, "global_step": 99123, "epoch": 819} {"train_loss": -38.54145050048828, "global_step": 99124, "epoch": 819} {"train_loss": -36.2381591796875, "global_step": 99125, "epoch": 819} {"train_loss": -36.1993293762207, "global_step": 99126, "epoch": 819} {"train_loss": -38.314937591552734, "global_step": 99127, "epoch": 819} {"train_loss": -38.12211990356445, "global_step": 99128, "epoch": 819} {"train_loss": -38.58758544921875, "global_step": 99129, "epoch": 819} {"train_loss": -39.02658462524414, "global_step": 99130, "epoch": 819} {"train_loss": -38.867218017578125, "global_step": 99131, "epoch": 819} {"train_loss": -39.09900665283203, "global_step": 99132, "epoch": 819} {"train_loss": -38.275062561035156, "global_step": 99133, "epoch": 819} {"train_loss": -38.15767288208008, "global_step": 99134, "epoch": 819} {"train_loss": -37.97991943359375, "global_step": 99135, "epoch": 819} {"train_loss": -38.69086837768555, "global_step": 99136, "epoch": 819} {"train_loss": -38.7600212097168, "global_step": 99137, "epoch": 819} {"train_loss": -38.471927642822266, "global_step": 99138, "epoch": 819} {"train_loss": -38.27143096923828, "global_step": 99139, "epoch": 819} {"train_loss": -37.3418083190918, "global_step": 99140, "epoch": 819} {"train_loss": -38.43460464477539, "global_step": 99141, "epoch": 819} {"train_loss": -39.33943557739258, "global_step": 99142, "epoch": 819} {"train_loss": -37.67020797729492, "global_step": 99143, "epoch": 819} {"train_loss": -37.9621696472168, "global_step": 99144, "epoch": 819} {"train_loss": -39.0083122253418, "global_step": 99145, "epoch": 819} {"train_loss": -38.333946228027344, "global_step": 99146, "epoch": 819} {"train_loss": -38.85084915161133, "global_step": 99147, "epoch": 819} {"train_loss": -39.0204963684082, "global_step": 99148, "epoch": 819} {"train_loss": -37.80560302734375, "global_step": 99149, "epoch": 819} {"train_loss": -38.64400863647461, "global_step": 99150, "epoch": 819} {"train_loss": -38.4289436340332, "global_step": 99151, "epoch": 819} {"train_loss": -37.890193939208984, "global_step": 99152, "epoch": 819} {"train_loss": -37.705841064453125, "global_step": 99153, "epoch": 819} {"train_loss": -36.54743576049805, "global_step": 99154, "epoch": 819} {"train_loss": -37.47304916381836, "global_step": 99155, "epoch": 819} {"train_loss": -36.959346771240234, "global_step": 99156, "epoch": 819} {"train_loss": -37.64411163330078, "global_step": 99157, "epoch": 819} {"train_loss": -36.05615234375, "global_step": 99158, "epoch": 819} {"train_loss": -36.794429779052734, "global_step": 99159, "epoch": 819} {"train_loss": -35.44866943359375, "global_step": 99160, "epoch": 819} {"train_loss": -38.03376007080078, "global_step": 99161, "epoch": 819} {"train_loss": -37.7418212890625, "global_step": 99162, "epoch": 819} {"train_loss": -38.4262580871582, "global_step": 99163, "epoch": 819} {"train_loss": -36.50986862182617, "global_step": 99164, "epoch": 819} {"train_loss": -38.611534118652344, "global_step": 99165, "epoch": 819} {"train_loss": -37.98236083984375, "global_step": 99166, "epoch": 819} {"train_loss": -37.88343048095703, "global_step": 99167, "epoch": 819} {"train_loss": -37.66154861450195, "global_step": 99168, "epoch": 819} {"train_loss": -38.34023666381836, "global_step": 99169, "epoch": 819} {"train_loss": -38.542659759521484, "global_step": 99170, "epoch": 819} {"train_loss": -38.218841552734375, "global_step": 99171, "epoch": 819} {"train_loss": -38.407867431640625, "global_step": 99172, "epoch": 819} {"train_loss": -38.206398010253906, "global_step": 99173, "epoch": 819} {"train_loss": -38.60897445678711, "global_step": 99174, "epoch": 819} {"train_loss": -36.17029571533203, "global_step": 99175, "epoch": 819} {"train_loss": -38.548133850097656, "global_step": 99176, "epoch": 819} {"train_loss": -36.17045211791992, "global_step": 99177, "epoch": 819} {"train_loss": -37.80522918701172, "global_step": 99178, "epoch": 819} {"train_loss": -38.33863067626953, "global_step": 99179, "epoch": 819} {"train_loss": -37.5955810546875, "global_step": 99180, "epoch": 819} {"train_loss": -37.456058502197266, "global_step": 99181, "epoch": 819} {"train_loss": -38.096038818359375, "global_step": 99182, "epoch": 819} {"train_loss": -38.99117660522461, "global_step": 99183, "epoch": 819} {"train_loss": -37.589195251464844, "global_step": 99184, "epoch": 819} {"train_loss": -37.47141647338867, "global_step": 99185, "epoch": 819} {"train_loss": -37.2827262878418, "global_step": 99186, "epoch": 819} {"train_loss": -37.664466857910156, "global_step": 99187, "epoch": 819} {"train_loss": -36.75026321411133, "global_step": 99188, "epoch": 819} {"train_loss": -35.78903579711914, "global_step": 99189, "epoch": 819} {"train_loss": -39.07732009887695, "global_step": 99190, "epoch": 819} {"train_loss": -38.28821563720703, "global_step": 99191, "epoch": 819} {"train_loss": -36.564117431640625, "global_step": 99192, "epoch": 819} {"train_loss": -36.93878936767578, "global_step": 99193, "epoch": 819} {"train_loss": -36.61226272583008, "global_step": 99194, "epoch": 819} {"train_loss": -38.21866989135742, "global_step": 99195, "epoch": 819} {"train_loss": -38.431949615478516, "global_step": 99196, "epoch": 819} {"train_loss": -36.626068115234375, "global_step": 99197, "epoch": 819} {"train_loss": -37.69816970825195, "global_step": 99198, "epoch": 819} {"train_loss": -38.0782585144043, "global_step": 99199, "epoch": 819} {"train_loss": -36.10392379760742, "global_step": 99200, "epoch": 819} {"train_loss": -37.11542510986328, "global_step": 99201, "epoch": 819} {"train_loss": -38.29783630371094, "global_step": 99202, "epoch": 819} {"train_loss": -36.8487663269043, "global_step": 99203, "epoch": 819} {"train_loss": -37.128204345703125, "global_step": 99204, "epoch": 819} {"train_loss": -38.336544036865234, "global_step": 99205, "epoch": 819} {"train_loss": -37.75673294067383, "global_step": 99206, "epoch": 819} {"train_loss": -37.262386322021484, "global_step": 99207, "epoch": 819} {"train_loss": -37.78790283203125, "global_step": 99208, "epoch": 819} {"train_loss": -38.162635803222656, "global_step": 99209, "epoch": 819} {"train_loss": -38.25703811645508, "global_step": 99210, "epoch": 819} {"train_loss": -38.55379104614258, "global_step": 99211, "epoch": 819} {"train_loss": -38.927040100097656, "global_step": 99212, "epoch": 819} {"train_loss": -38.18851852416992, "global_step": 99213, "epoch": 819} {"train_loss": -38.85932159423828, "global_step": 99214, "epoch": 819} {"train_loss": -38.54771041870117, "global_step": 99215, "epoch": 819} {"train_loss": -38.66864013671875, "global_step": 99216, "epoch": 819} {"train_loss": -37.14890670776367, "global_step": 99217, "epoch": 819} {"train_loss": -38.57243728637695, "global_step": 99218, "epoch": 819} {"train_loss": -38.10649238145056, "global_step": 99219, "epoch": 819, "val_loss": 2649523.75} {"train_loss": -38.0128059387207, "global_step": 99220, "epoch": 820} {"train_loss": -38.29217529296875, "global_step": 99221, "epoch": 820} {"train_loss": -39.11713790893555, "global_step": 99222, "epoch": 820} {"train_loss": -38.657684326171875, "global_step": 99223, "epoch": 820} {"train_loss": -38.09309768676758, "global_step": 99224, "epoch": 820} {"train_loss": -39.13608169555664, "global_step": 99225, "epoch": 820} {"train_loss": -38.979732513427734, "global_step": 99226, "epoch": 820} {"train_loss": -38.345497131347656, "global_step": 99227, "epoch": 820} {"train_loss": -38.9185791015625, "global_step": 99228, "epoch": 820} {"train_loss": -39.34296798706055, "global_step": 99229, "epoch": 820} {"train_loss": -38.36656951904297, "global_step": 99230, "epoch": 820} {"train_loss": -39.482421875, "global_step": 99231, "epoch": 820} {"train_loss": -39.10659408569336, "global_step": 99232, "epoch": 820} {"train_loss": -38.92574691772461, "global_step": 99233, "epoch": 820} {"train_loss": -39.434017181396484, "global_step": 99234, "epoch": 820} {"train_loss": -38.8071174621582, "global_step": 99235, "epoch": 820} {"train_loss": -39.28600311279297, "global_step": 99236, "epoch": 820} {"train_loss": -39.59833908081055, "global_step": 99237, "epoch": 820} {"train_loss": -38.67060470581055, "global_step": 99238, "epoch": 820} {"train_loss": -39.77628707885742, "global_step": 99239, "epoch": 820} {"train_loss": -38.63251876831055, "global_step": 99240, "epoch": 820} {"train_loss": -38.872291564941406, "global_step": 99241, "epoch": 820} {"train_loss": -38.80250549316406, "global_step": 99242, "epoch": 820} {"train_loss": -39.56818771362305, "global_step": 99243, "epoch": 820} {"train_loss": -39.778526306152344, "global_step": 99244, "epoch": 820} {"train_loss": -38.736427307128906, "global_step": 99245, "epoch": 820} {"train_loss": -38.481075286865234, "global_step": 99246, "epoch": 820} {"train_loss": -38.75382614135742, "global_step": 99247, "epoch": 820} {"train_loss": -38.76264572143555, "global_step": 99248, "epoch": 820} {"train_loss": -39.092506408691406, "global_step": 99249, "epoch": 820} {"train_loss": -38.90037155151367, "global_step": 99250, "epoch": 820} {"train_loss": -39.60195541381836, "global_step": 99251, "epoch": 820} {"train_loss": -37.9928092956543, "global_step": 99252, "epoch": 820} {"train_loss": -36.384765625, "global_step": 99253, "epoch": 820} {"train_loss": -35.746456146240234, "global_step": 99254, "epoch": 820} {"train_loss": -37.69612503051758, "global_step": 99255, "epoch": 820} {"train_loss": -37.52204895019531, "global_step": 99256, "epoch": 820} {"train_loss": -37.26784896850586, "global_step": 99257, "epoch": 820} {"train_loss": -38.18320846557617, "global_step": 99258, "epoch": 820} {"train_loss": -36.19533157348633, "global_step": 99259, "epoch": 820} {"train_loss": -38.93714141845703, "global_step": 99260, "epoch": 820} {"train_loss": -38.365447998046875, "global_step": 99261, "epoch": 820} {"train_loss": -37.07914352416992, "global_step": 99262, "epoch": 820} {"train_loss": -39.181846618652344, "global_step": 99263, "epoch": 820} {"train_loss": -38.38021469116211, "global_step": 99264, "epoch": 820} {"train_loss": -37.98844528198242, "global_step": 99265, "epoch": 820} {"train_loss": -38.6622428894043, "global_step": 99266, "epoch": 820} {"train_loss": -38.445430755615234, "global_step": 99267, "epoch": 820} {"train_loss": -38.71657943725586, "global_step": 99268, "epoch": 820} {"train_loss": -38.81822204589844, "global_step": 99269, "epoch": 820} {"train_loss": -38.28133773803711, "global_step": 99270, "epoch": 820} {"train_loss": -37.003841400146484, "global_step": 99271, "epoch": 820} {"train_loss": -37.47575759887695, "global_step": 99272, "epoch": 820} {"train_loss": -39.24946975708008, "global_step": 99273, "epoch": 820} {"train_loss": -39.31648635864258, "global_step": 99274, "epoch": 820} {"train_loss": -38.55628967285156, "global_step": 99275, "epoch": 820} {"train_loss": -39.09480667114258, "global_step": 99276, "epoch": 820} {"train_loss": -39.29067611694336, "global_step": 99277, "epoch": 820} {"train_loss": -38.45457077026367, "global_step": 99278, "epoch": 820} {"train_loss": -39.320735931396484, "global_step": 99279, "epoch": 820} {"train_loss": -39.074424743652344, "global_step": 99280, "epoch": 820} {"train_loss": -39.4078483581543, "global_step": 99281, "epoch": 820} {"train_loss": -38.080196380615234, "global_step": 99282, "epoch": 820} {"train_loss": -38.95063400268555, "global_step": 99283, "epoch": 820} {"train_loss": -38.922821044921875, "global_step": 99284, "epoch": 820} {"train_loss": -38.4480094909668, "global_step": 99285, "epoch": 820} {"train_loss": -38.40713882446289, "global_step": 99286, "epoch": 820} {"train_loss": -39.657569885253906, "global_step": 99287, "epoch": 820} {"train_loss": -39.385982513427734, "global_step": 99288, "epoch": 820} {"train_loss": -38.8566780090332, "global_step": 99289, "epoch": 820} {"train_loss": -39.809329986572266, "global_step": 99290, "epoch": 820} {"train_loss": -38.566497802734375, "global_step": 99291, "epoch": 820} {"train_loss": -39.11312484741211, "global_step": 99292, "epoch": 820} {"train_loss": -38.71907424926758, "global_step": 99293, "epoch": 820} {"train_loss": -38.690399169921875, "global_step": 99294, "epoch": 820} {"train_loss": -39.5152702331543, "global_step": 99295, "epoch": 820} {"train_loss": -38.106117248535156, "global_step": 99296, "epoch": 820} {"train_loss": -37.4945068359375, "global_step": 99297, "epoch": 820} {"train_loss": -36.733642578125, "global_step": 99298, "epoch": 820} {"train_loss": -39.510414123535156, "global_step": 99299, "epoch": 820} {"train_loss": -37.9254264831543, "global_step": 99300, "epoch": 820} {"train_loss": -38.86455535888672, "global_step": 99301, "epoch": 820} {"train_loss": -38.86519241333008, "global_step": 99302, "epoch": 820} {"train_loss": -40.05085372924805, "global_step": 99303, "epoch": 820} {"train_loss": -39.33999252319336, "global_step": 99304, "epoch": 820} {"train_loss": -38.4586296081543, "global_step": 99305, "epoch": 820} {"train_loss": -37.9731330871582, "global_step": 99306, "epoch": 820} {"train_loss": -39.48099136352539, "global_step": 99307, "epoch": 820} {"train_loss": -39.445125579833984, "global_step": 99308, "epoch": 820} {"train_loss": -38.95210647583008, "global_step": 99309, "epoch": 820} {"train_loss": -39.52812576293945, "global_step": 99310, "epoch": 820} {"train_loss": -38.54301071166992, "global_step": 99311, "epoch": 820} {"train_loss": -38.64822769165039, "global_step": 99312, "epoch": 820} {"train_loss": -38.68939971923828, "global_step": 99313, "epoch": 820} {"train_loss": -37.00798034667969, "global_step": 99314, "epoch": 820} {"train_loss": -33.73726272583008, "global_step": 99315, "epoch": 820} {"train_loss": -34.71291732788086, "global_step": 99316, "epoch": 820} {"train_loss": -33.969390869140625, "global_step": 99317, "epoch": 820} {"train_loss": -33.85209655761719, "global_step": 99318, "epoch": 820} {"train_loss": -33.91318893432617, "global_step": 99319, "epoch": 820} {"train_loss": -21.147321701049805, "global_step": 99320, "epoch": 820} {"train_loss": -35.214698791503906, "global_step": 99321, "epoch": 820} {"train_loss": -20.38532066345215, "global_step": 99322, "epoch": 820} {"train_loss": -18.8633975982666, "global_step": 99323, "epoch": 820} {"train_loss": -30.878253936767578, "global_step": 99324, "epoch": 820} {"train_loss": -36.479679107666016, "global_step": 99325, "epoch": 820} {"train_loss": -32.629600524902344, "global_step": 99326, "epoch": 820} {"train_loss": -32.47621154785156, "global_step": 99327, "epoch": 820} {"train_loss": -29.687734603881836, "global_step": 99328, "epoch": 820} {"train_loss": -37.36909866333008, "global_step": 99329, "epoch": 820} {"train_loss": -33.86511993408203, "global_step": 99330, "epoch": 820} {"train_loss": -37.21902847290039, "global_step": 99331, "epoch": 820} {"train_loss": -37.25551986694336, "global_step": 99332, "epoch": 820} {"train_loss": -35.27558517456055, "global_step": 99333, "epoch": 820} {"train_loss": -36.82609939575195, "global_step": 99334, "epoch": 820} {"train_loss": -33.687801361083984, "global_step": 99335, "epoch": 820} {"train_loss": -36.56779098510742, "global_step": 99336, "epoch": 820} {"train_loss": -37.46358871459961, "global_step": 99337, "epoch": 820} {"train_loss": -36.47835922241211, "global_step": 99338, "epoch": 820} {"train_loss": -37.98708724975586, "global_step": 99339, "epoch": 820} {"train_loss": -37.49385124395702, "global_step": 99340, "epoch": 820, "val_loss": 2630997.75} {"train_loss": -38.012882232666016, "global_step": 99341, "epoch": 821} {"train_loss": -37.802093505859375, "global_step": 99342, "epoch": 821} {"train_loss": -38.562381744384766, "global_step": 99343, "epoch": 821} {"train_loss": -37.75973129272461, "global_step": 99344, "epoch": 821} {"train_loss": -37.842464447021484, "global_step": 99345, "epoch": 821} {"train_loss": -38.47713088989258, "global_step": 99346, "epoch": 821} {"train_loss": -38.351905822753906, "global_step": 99347, "epoch": 821} {"train_loss": -38.60358810424805, "global_step": 99348, "epoch": 821} {"train_loss": -38.69171905517578, "global_step": 99349, "epoch": 821} {"train_loss": -38.8440055847168, "global_step": 99350, "epoch": 821} {"train_loss": -38.975399017333984, "global_step": 99351, "epoch": 821} {"train_loss": -38.66362380981445, "global_step": 99352, "epoch": 821} {"train_loss": -39.08832931518555, "global_step": 99353, "epoch": 821} {"train_loss": -38.65656280517578, "global_step": 99354, "epoch": 821} {"train_loss": -39.122352600097656, "global_step": 99355, "epoch": 821} {"train_loss": -38.914955139160156, "global_step": 99356, "epoch": 821} {"train_loss": -38.842369079589844, "global_step": 99357, "epoch": 821} {"train_loss": -38.75925827026367, "global_step": 99358, "epoch": 821} {"train_loss": -36.53661346435547, "global_step": 99359, "epoch": 821} {"train_loss": -38.6446533203125, "global_step": 99360, "epoch": 821} {"train_loss": -39.03098678588867, "global_step": 99361, "epoch": 821} {"train_loss": -39.129615783691406, "global_step": 99362, "epoch": 821} {"train_loss": -39.06834411621094, "global_step": 99363, "epoch": 821} {"train_loss": -39.53681564331055, "global_step": 99364, "epoch": 821} {"train_loss": -38.989959716796875, "global_step": 99365, "epoch": 821} {"train_loss": -38.25054168701172, "global_step": 99366, "epoch": 821} {"train_loss": -38.130859375, "global_step": 99367, "epoch": 821} {"train_loss": -38.181697845458984, "global_step": 99368, "epoch": 821} {"train_loss": -37.697975158691406, "global_step": 99369, "epoch": 821} {"train_loss": -38.555057525634766, "global_step": 99370, "epoch": 821} {"train_loss": -38.749168395996094, "global_step": 99371, "epoch": 821} {"train_loss": -38.81932830810547, "global_step": 99372, "epoch": 821} {"train_loss": -39.48480224609375, "global_step": 99373, "epoch": 821} {"train_loss": -38.67755889892578, "global_step": 99374, "epoch": 821} {"train_loss": -37.94285202026367, "global_step": 99375, "epoch": 821} {"train_loss": -38.77534484863281, "global_step": 99376, "epoch": 821} {"train_loss": -38.64323043823242, "global_step": 99377, "epoch": 821} {"train_loss": -38.86117935180664, "global_step": 99378, "epoch": 821} {"train_loss": -37.34012222290039, "global_step": 99379, "epoch": 821} {"train_loss": -35.99384307861328, "global_step": 99380, "epoch": 821} {"train_loss": -38.97049331665039, "global_step": 99381, "epoch": 821} {"train_loss": -35.83036422729492, "global_step": 99382, "epoch": 821} {"train_loss": -39.062496185302734, "global_step": 99383, "epoch": 821} {"train_loss": -36.92680740356445, "global_step": 99384, "epoch": 821} {"train_loss": -33.92582321166992, "global_step": 99385, "epoch": 821} {"train_loss": -36.95998001098633, "global_step": 99386, "epoch": 821} {"train_loss": -32.32143783569336, "global_step": 99387, "epoch": 821} {"train_loss": -32.69672393798828, "global_step": 99388, "epoch": 821} {"train_loss": -34.56707763671875, "global_step": 99389, "epoch": 821} {"train_loss": -32.39651107788086, "global_step": 99390, "epoch": 821} {"train_loss": -31.566999435424805, "global_step": 99391, "epoch": 821} {"train_loss": -33.43758773803711, "global_step": 99392, "epoch": 821} {"train_loss": -27.551593780517578, "global_step": 99393, "epoch": 821} {"train_loss": -33.37437057495117, "global_step": 99394, "epoch": 821} {"train_loss": -29.66233253479004, "global_step": 99395, "epoch": 821} {"train_loss": -29.235727310180664, "global_step": 99396, "epoch": 821} {"train_loss": -34.09035873413086, "global_step": 99397, "epoch": 821} {"train_loss": -29.660486221313477, "global_step": 99398, "epoch": 821} {"train_loss": -28.67177391052246, "global_step": 99399, "epoch": 821} {"train_loss": -28.923322677612305, "global_step": 99400, "epoch": 821} {"train_loss": -31.13079833984375, "global_step": 99401, "epoch": 821} {"train_loss": -23.5545597076416, "global_step": 99402, "epoch": 821} {"train_loss": -31.91926383972168, "global_step": 99403, "epoch": 821} {"train_loss": -30.126840591430664, "global_step": 99404, "epoch": 821} {"train_loss": -27.401212692260742, "global_step": 99405, "epoch": 821} {"train_loss": -30.436758041381836, "global_step": 99406, "epoch": 821} {"train_loss": -32.30416488647461, "global_step": 99407, "epoch": 821} {"train_loss": -32.956363677978516, "global_step": 99408, "epoch": 821} {"train_loss": -28.2752628326416, "global_step": 99409, "epoch": 821} {"train_loss": -32.80143356323242, "global_step": 99410, "epoch": 821} {"train_loss": -31.948652267456055, "global_step": 99411, "epoch": 821} {"train_loss": -29.377685546875, "global_step": 99412, "epoch": 821} {"train_loss": -30.768081665039062, "global_step": 99413, "epoch": 821} {"train_loss": -32.931331634521484, "global_step": 99414, "epoch": 821} {"train_loss": -32.3680305480957, "global_step": 99415, "epoch": 821} {"train_loss": -33.6104850769043, "global_step": 99416, "epoch": 821} {"train_loss": -33.95054244995117, "global_step": 99417, "epoch": 821} {"train_loss": -33.51310348510742, "global_step": 99418, "epoch": 821} {"train_loss": -33.25327682495117, "global_step": 99419, "epoch": 821} {"train_loss": -33.46406936645508, "global_step": 99420, "epoch": 821} {"train_loss": -33.756507873535156, "global_step": 99421, "epoch": 821} {"train_loss": -33.55470657348633, "global_step": 99422, "epoch": 821} {"train_loss": -33.93741989135742, "global_step": 99423, "epoch": 821} {"train_loss": -34.45042037963867, "global_step": 99424, "epoch": 821} {"train_loss": -34.22776412963867, "global_step": 99425, "epoch": 821} {"train_loss": -34.556331634521484, "global_step": 99426, "epoch": 821} {"train_loss": -35.098690032958984, "global_step": 99427, "epoch": 821} {"train_loss": -34.434600830078125, "global_step": 99428, "epoch": 821} {"train_loss": -34.400352478027344, "global_step": 99429, "epoch": 821} {"train_loss": -34.75126647949219, "global_step": 99430, "epoch": 821} {"train_loss": -34.4260139465332, "global_step": 99431, "epoch": 821} {"train_loss": -35.006629943847656, "global_step": 99432, "epoch": 821} {"train_loss": -34.60907745361328, "global_step": 99433, "epoch": 821} {"train_loss": -34.4384880065918, "global_step": 99434, "epoch": 821} {"train_loss": -34.864986419677734, "global_step": 99435, "epoch": 821} {"train_loss": -34.98671340942383, "global_step": 99436, "epoch": 821} {"train_loss": -35.659053802490234, "global_step": 99437, "epoch": 821} {"train_loss": -34.0586051940918, "global_step": 99438, "epoch": 821} {"train_loss": -35.37299728393555, "global_step": 99439, "epoch": 821} {"train_loss": -35.750789642333984, "global_step": 99440, "epoch": 821} {"train_loss": -35.15070343017578, "global_step": 99441, "epoch": 821} {"train_loss": -35.806758880615234, "global_step": 99442, "epoch": 821} {"train_loss": -35.89944076538086, "global_step": 99443, "epoch": 821} {"train_loss": -35.37797927856445, "global_step": 99444, "epoch": 821} {"train_loss": -35.876991271972656, "global_step": 99445, "epoch": 821} {"train_loss": -36.43430709838867, "global_step": 99446, "epoch": 821} {"train_loss": -36.04385757446289, "global_step": 99447, "epoch": 821} {"train_loss": -36.31787872314453, "global_step": 99448, "epoch": 821} {"train_loss": -36.281349182128906, "global_step": 99449, "epoch": 821} {"train_loss": -36.14210510253906, "global_step": 99450, "epoch": 821} {"train_loss": -35.50920486450195, "global_step": 99451, "epoch": 821} {"train_loss": -35.87176513671875, "global_step": 99452, "epoch": 821} {"train_loss": -36.31999588012695, "global_step": 99453, "epoch": 821} {"train_loss": -36.56760787963867, "global_step": 99454, "epoch": 821} {"train_loss": -36.272762298583984, "global_step": 99455, "epoch": 821} {"train_loss": -36.55936813354492, "global_step": 99456, "epoch": 821} {"train_loss": -36.40285873413086, "global_step": 99457, "epoch": 821} {"train_loss": -36.39388656616211, "global_step": 99458, "epoch": 821} {"train_loss": -36.29014587402344, "global_step": 99459, "epoch": 821} {"train_loss": -36.84824752807617, "global_step": 99460, "epoch": 821} {"train_loss": -35.34096207106409, "global_step": 99461, "epoch": 821, "val_loss": 2606330.0} {"train_loss": -36.33012008666992, "global_step": 99462, "epoch": 822} {"train_loss": -36.84792709350586, "global_step": 99463, "epoch": 822} {"train_loss": -36.795719146728516, "global_step": 99464, "epoch": 822} {"train_loss": -36.95829391479492, "global_step": 99465, "epoch": 822} {"train_loss": -37.06473159790039, "global_step": 99466, "epoch": 822} {"train_loss": -36.81684875488281, "global_step": 99467, "epoch": 822} {"train_loss": -37.1125602722168, "global_step": 99468, "epoch": 822} {"train_loss": -37.07571029663086, "global_step": 99469, "epoch": 822} {"train_loss": -37.2491569519043, "global_step": 99470, "epoch": 822} {"train_loss": -37.169857025146484, "global_step": 99471, "epoch": 822} {"train_loss": -37.53654861450195, "global_step": 99472, "epoch": 822} {"train_loss": -37.10871505737305, "global_step": 99473, "epoch": 822} {"train_loss": -37.481746673583984, "global_step": 99474, "epoch": 822} {"train_loss": -37.6611328125, "global_step": 99475, "epoch": 822} {"train_loss": -37.47260665893555, "global_step": 99476, "epoch": 822} {"train_loss": -37.16667938232422, "global_step": 99477, "epoch": 822} {"train_loss": -37.555301666259766, "global_step": 99478, "epoch": 822} {"train_loss": -37.67201232910156, "global_step": 99479, "epoch": 822} {"train_loss": -36.97199249267578, "global_step": 99480, "epoch": 822} {"train_loss": -37.4619026184082, "global_step": 99481, "epoch": 822} {"train_loss": -37.918617248535156, "global_step": 99482, "epoch": 822} {"train_loss": -37.636478424072266, "global_step": 99483, "epoch": 822} {"train_loss": -37.59182357788086, "global_step": 99484, "epoch": 822} {"train_loss": -37.668575286865234, "global_step": 99485, "epoch": 822} {"train_loss": -37.58263397216797, "global_step": 99486, "epoch": 822} {"train_loss": -38.04338455200195, "global_step": 99487, "epoch": 822} {"train_loss": -37.85519790649414, "global_step": 99488, "epoch": 822} {"train_loss": -37.970027923583984, "global_step": 99489, "epoch": 822} {"train_loss": -38.26586151123047, "global_step": 99490, "epoch": 822} {"train_loss": -38.09931564331055, "global_step": 99491, "epoch": 822} {"train_loss": -37.9155387878418, "global_step": 99492, "epoch": 822} {"train_loss": -38.22001266479492, "global_step": 99493, "epoch": 822} {"train_loss": -37.909637451171875, "global_step": 99494, "epoch": 822} {"train_loss": -37.70649337768555, "global_step": 99495, "epoch": 822} {"train_loss": -38.15785217285156, "global_step": 99496, "epoch": 822} {"train_loss": -38.15845489501953, "global_step": 99497, "epoch": 822} {"train_loss": -38.10171127319336, "global_step": 99498, "epoch": 822} {"train_loss": -37.31586456298828, "global_step": 99499, "epoch": 822} {"train_loss": -36.189144134521484, "global_step": 99500, "epoch": 822} {"train_loss": -37.009925842285156, "global_step": 99501, "epoch": 822} {"train_loss": -37.653114318847656, "global_step": 99502, "epoch": 822} {"train_loss": -38.57696533203125, "global_step": 99503, "epoch": 822} {"train_loss": -37.78308868408203, "global_step": 99504, "epoch": 822} {"train_loss": -37.361515045166016, "global_step": 99505, "epoch": 822} {"train_loss": -37.342037200927734, "global_step": 99506, "epoch": 822} {"train_loss": -38.51936721801758, "global_step": 99507, "epoch": 822} {"train_loss": -38.44929122924805, "global_step": 99508, "epoch": 822} {"train_loss": -38.15210723876953, "global_step": 99509, "epoch": 822} {"train_loss": -37.898468017578125, "global_step": 99510, "epoch": 822} {"train_loss": -38.67333221435547, "global_step": 99511, "epoch": 822} {"train_loss": -38.521060943603516, "global_step": 99512, "epoch": 822} {"train_loss": -38.43410873413086, "global_step": 99513, "epoch": 822} {"train_loss": -38.977535247802734, "global_step": 99514, "epoch": 822} {"train_loss": -38.74589157104492, "global_step": 99515, "epoch": 822} {"train_loss": -38.143524169921875, "global_step": 99516, "epoch": 822} {"train_loss": -38.34209442138672, "global_step": 99517, "epoch": 822} {"train_loss": -38.541133880615234, "global_step": 99518, "epoch": 822} {"train_loss": -38.629878997802734, "global_step": 99519, "epoch": 822} {"train_loss": -38.534664154052734, "global_step": 99520, "epoch": 822} {"train_loss": -38.52239990234375, "global_step": 99521, "epoch": 822} {"train_loss": -37.26203155517578, "global_step": 99522, "epoch": 822} {"train_loss": -36.1440315246582, "global_step": 99523, "epoch": 822} {"train_loss": -35.80854797363281, "global_step": 99524, "epoch": 822} {"train_loss": -34.1553840637207, "global_step": 99525, "epoch": 822} {"train_loss": -32.085384368896484, "global_step": 99526, "epoch": 822} {"train_loss": -36.81254959106445, "global_step": 99527, "epoch": 822} {"train_loss": -31.423877716064453, "global_step": 99528, "epoch": 822} {"train_loss": -31.521087646484375, "global_step": 99529, "epoch": 822} {"train_loss": -33.264766693115234, "global_step": 99530, "epoch": 822} {"train_loss": -28.0632266998291, "global_step": 99531, "epoch": 822} {"train_loss": -29.814706802368164, "global_step": 99532, "epoch": 822} {"train_loss": -28.093372344970703, "global_step": 99533, "epoch": 822} {"train_loss": -31.42984962463379, "global_step": 99534, "epoch": 822} {"train_loss": -29.025724411010742, "global_step": 99535, "epoch": 822} {"train_loss": -31.606054306030273, "global_step": 99536, "epoch": 822} {"train_loss": -33.16895294189453, "global_step": 99537, "epoch": 822} {"train_loss": -30.909881591796875, "global_step": 99538, "epoch": 822} {"train_loss": -32.018192291259766, "global_step": 99539, "epoch": 822} {"train_loss": -31.608524322509766, "global_step": 99540, "epoch": 822} {"train_loss": -33.73115921020508, "global_step": 99541, "epoch": 822} {"train_loss": -31.913618087768555, "global_step": 99542, "epoch": 822} {"train_loss": -32.83245086669922, "global_step": 99543, "epoch": 822} {"train_loss": -33.30182647705078, "global_step": 99544, "epoch": 822} {"train_loss": -33.630130767822266, "global_step": 99545, "epoch": 822} {"train_loss": -35.652618408203125, "global_step": 99546, "epoch": 822} {"train_loss": -34.9186897277832, "global_step": 99547, "epoch": 822} {"train_loss": -36.4355583190918, "global_step": 99548, "epoch": 822} {"train_loss": -35.55792999267578, "global_step": 99549, "epoch": 822} {"train_loss": -35.03346633911133, "global_step": 99550, "epoch": 822} {"train_loss": -36.64977264404297, "global_step": 99551, "epoch": 822} {"train_loss": -36.534759521484375, "global_step": 99552, "epoch": 822} {"train_loss": -35.771297454833984, "global_step": 99553, "epoch": 822} {"train_loss": -36.46383285522461, "global_step": 99554, "epoch": 822} {"train_loss": -36.37311935424805, "global_step": 99555, "epoch": 822} {"train_loss": -37.573387145996094, "global_step": 99556, "epoch": 822} {"train_loss": -37.23280715942383, "global_step": 99557, "epoch": 822} {"train_loss": -37.11338424682617, "global_step": 99558, "epoch": 822} {"train_loss": -37.67206954956055, "global_step": 99559, "epoch": 822} {"train_loss": -37.8150520324707, "global_step": 99560, "epoch": 822} {"train_loss": -37.423377990722656, "global_step": 99561, "epoch": 822} {"train_loss": -37.78652572631836, "global_step": 99562, "epoch": 822} {"train_loss": -37.303768157958984, "global_step": 99563, "epoch": 822} {"train_loss": -37.21505355834961, "global_step": 99564, "epoch": 822} {"train_loss": -37.94866943359375, "global_step": 99565, "epoch": 822} {"train_loss": -37.915626525878906, "global_step": 99566, "epoch": 822} {"train_loss": -37.44315719604492, "global_step": 99567, "epoch": 822} {"train_loss": -38.02185821533203, "global_step": 99568, "epoch": 822} {"train_loss": -38.43104934692383, "global_step": 99569, "epoch": 822} {"train_loss": -37.91376876831055, "global_step": 99570, "epoch": 822} {"train_loss": -37.82798385620117, "global_step": 99571, "epoch": 822} {"train_loss": -37.783180236816406, "global_step": 99572, "epoch": 822} {"train_loss": -38.08174514770508, "global_step": 99573, "epoch": 822} {"train_loss": -38.33048629760742, "global_step": 99574, "epoch": 822} {"train_loss": -38.091880798339844, "global_step": 99575, "epoch": 822} {"train_loss": -37.30133819580078, "global_step": 99576, "epoch": 822} {"train_loss": -37.406410217285156, "global_step": 99577, "epoch": 822} {"train_loss": -37.753318786621094, "global_step": 99578, "epoch": 822} {"train_loss": -37.82361602783203, "global_step": 99579, "epoch": 822} {"train_loss": -38.07308578491211, "global_step": 99580, "epoch": 822} {"train_loss": -38.37703323364258, "global_step": 99581, "epoch": 822} {"train_loss": -36.55320471771493, "global_step": 99582, "epoch": 822, "val_loss": 2530547.75} {"train_loss": -37.66679763793945, "global_step": 99583, "epoch": 823} {"train_loss": -38.408729553222656, "global_step": 99584, "epoch": 823} {"train_loss": -38.64638900756836, "global_step": 99585, "epoch": 823} {"train_loss": -38.554561614990234, "global_step": 99586, "epoch": 823} {"train_loss": -38.695858001708984, "global_step": 99587, "epoch": 823} {"train_loss": -39.0418815612793, "global_step": 99588, "epoch": 823} {"train_loss": -39.06675338745117, "global_step": 99589, "epoch": 823} {"train_loss": -38.57013702392578, "global_step": 99590, "epoch": 823} {"train_loss": -38.62843704223633, "global_step": 99591, "epoch": 823} {"train_loss": -38.524444580078125, "global_step": 99592, "epoch": 823} {"train_loss": -38.759544372558594, "global_step": 99593, "epoch": 823} {"train_loss": -38.22978591918945, "global_step": 99594, "epoch": 823} {"train_loss": -38.401065826416016, "global_step": 99595, "epoch": 823} {"train_loss": -37.082847595214844, "global_step": 99596, "epoch": 823} {"train_loss": -37.14971923828125, "global_step": 99597, "epoch": 823} {"train_loss": -37.98097229003906, "global_step": 99598, "epoch": 823} {"train_loss": -38.73784255981445, "global_step": 99599, "epoch": 823} {"train_loss": -39.16878128051758, "global_step": 99600, "epoch": 823} {"train_loss": -39.362022399902344, "global_step": 99601, "epoch": 823} {"train_loss": -38.65643310546875, "global_step": 99602, "epoch": 823} {"train_loss": -39.086708068847656, "global_step": 99603, "epoch": 823} {"train_loss": -39.14626693725586, "global_step": 99604, "epoch": 823} {"train_loss": -38.9141731262207, "global_step": 99605, "epoch": 823} {"train_loss": -39.150630950927734, "global_step": 99606, "epoch": 823} {"train_loss": -39.2165412902832, "global_step": 99607, "epoch": 823} {"train_loss": -39.03212356567383, "global_step": 99608, "epoch": 823} {"train_loss": -38.528472900390625, "global_step": 99609, "epoch": 823} {"train_loss": -39.554996490478516, "global_step": 99610, "epoch": 823} {"train_loss": -39.426902770996094, "global_step": 99611, "epoch": 823} {"train_loss": -38.30086135864258, "global_step": 99612, "epoch": 823} {"train_loss": -39.0244255065918, "global_step": 99613, "epoch": 823} {"train_loss": -39.36973190307617, "global_step": 99614, "epoch": 823} {"train_loss": -39.63853073120117, "global_step": 99615, "epoch": 823} {"train_loss": -39.0539665222168, "global_step": 99616, "epoch": 823} {"train_loss": -38.39535140991211, "global_step": 99617, "epoch": 823} {"train_loss": -39.34231185913086, "global_step": 99618, "epoch": 823} {"train_loss": -39.33543014526367, "global_step": 99619, "epoch": 823} {"train_loss": -39.035030364990234, "global_step": 99620, "epoch": 823} {"train_loss": -39.16360092163086, "global_step": 99621, "epoch": 823} {"train_loss": -38.99718475341797, "global_step": 99622, "epoch": 823} {"train_loss": -38.553077697753906, "global_step": 99623, "epoch": 823} {"train_loss": -39.286773681640625, "global_step": 99624, "epoch": 823} {"train_loss": -38.15653610229492, "global_step": 99625, "epoch": 823} {"train_loss": -37.81476593017578, "global_step": 99626, "epoch": 823} {"train_loss": -38.55997848510742, "global_step": 99627, "epoch": 823} {"train_loss": -38.10518264770508, "global_step": 99628, "epoch": 823} {"train_loss": -38.0110969543457, "global_step": 99629, "epoch": 823} {"train_loss": -39.4434814453125, "global_step": 99630, "epoch": 823} {"train_loss": -39.147823333740234, "global_step": 99631, "epoch": 823} {"train_loss": -39.06220626831055, "global_step": 99632, "epoch": 823} {"train_loss": -39.535133361816406, "global_step": 99633, "epoch": 823} {"train_loss": -38.95819091796875, "global_step": 99634, "epoch": 823} {"train_loss": -39.302059173583984, "global_step": 99635, "epoch": 823} {"train_loss": -38.28742218017578, "global_step": 99636, "epoch": 823} {"train_loss": -39.31944274902344, "global_step": 99637, "epoch": 823} {"train_loss": -37.931182861328125, "global_step": 99638, "epoch": 823} {"train_loss": -35.49543762207031, "global_step": 99639, "epoch": 823} {"train_loss": -34.18586730957031, "global_step": 99640, "epoch": 823} {"train_loss": -38.8190803527832, "global_step": 99641, "epoch": 823} {"train_loss": -34.6938362121582, "global_step": 99642, "epoch": 823} {"train_loss": -36.754085540771484, "global_step": 99643, "epoch": 823} {"train_loss": -37.13224411010742, "global_step": 99644, "epoch": 823} {"train_loss": -36.59865188598633, "global_step": 99645, "epoch": 823} {"train_loss": -38.15509033203125, "global_step": 99646, "epoch": 823} {"train_loss": -37.48960494995117, "global_step": 99647, "epoch": 823} {"train_loss": -38.542110443115234, "global_step": 99648, "epoch": 823} {"train_loss": -38.01420974731445, "global_step": 99649, "epoch": 823} {"train_loss": -37.49067306518555, "global_step": 99650, "epoch": 823} {"train_loss": -37.34193801879883, "global_step": 99651, "epoch": 823} {"train_loss": -37.5682258605957, "global_step": 99652, "epoch": 823} {"train_loss": -38.10249710083008, "global_step": 99653, "epoch": 823} {"train_loss": -36.44158935546875, "global_step": 99654, "epoch": 823} {"train_loss": -37.922142028808594, "global_step": 99655, "epoch": 823} {"train_loss": -37.5092887878418, "global_step": 99656, "epoch": 823} {"train_loss": -38.22597885131836, "global_step": 99657, "epoch": 823} {"train_loss": -37.746826171875, "global_step": 99658, "epoch": 823} {"train_loss": -36.84254837036133, "global_step": 99659, "epoch": 823} {"train_loss": -36.58792495727539, "global_step": 99660, "epoch": 823} {"train_loss": -37.89444351196289, "global_step": 99661, "epoch": 823} {"train_loss": -37.341609954833984, "global_step": 99662, "epoch": 823} {"train_loss": -37.04540252685547, "global_step": 99663, "epoch": 823} {"train_loss": -38.212589263916016, "global_step": 99664, "epoch": 823} {"train_loss": -36.6851921081543, "global_step": 99665, "epoch": 823} {"train_loss": -36.38069534301758, "global_step": 99666, "epoch": 823} {"train_loss": -37.76124572753906, "global_step": 99667, "epoch": 823} {"train_loss": -36.84217071533203, "global_step": 99668, "epoch": 823} {"train_loss": -38.023651123046875, "global_step": 99669, "epoch": 823} {"train_loss": -35.46010208129883, "global_step": 99670, "epoch": 823} {"train_loss": -37.20066452026367, "global_step": 99671, "epoch": 823} {"train_loss": -37.056884765625, "global_step": 99672, "epoch": 823} {"train_loss": -37.16570281982422, "global_step": 99673, "epoch": 823} {"train_loss": -36.113006591796875, "global_step": 99674, "epoch": 823} {"train_loss": -38.23778533935547, "global_step": 99675, "epoch": 823} {"train_loss": -36.24508285522461, "global_step": 99676, "epoch": 823} {"train_loss": -38.663818359375, "global_step": 99677, "epoch": 823} {"train_loss": -37.4514274597168, "global_step": 99678, "epoch": 823} {"train_loss": -38.39265823364258, "global_step": 99679, "epoch": 823} {"train_loss": -38.587867736816406, "global_step": 99680, "epoch": 823} {"train_loss": -38.670188903808594, "global_step": 99681, "epoch": 823} {"train_loss": -37.82554244995117, "global_step": 99682, "epoch": 823} {"train_loss": -38.36996078491211, "global_step": 99683, "epoch": 823} {"train_loss": -39.046722412109375, "global_step": 99684, "epoch": 823} {"train_loss": -38.82650375366211, "global_step": 99685, "epoch": 823} {"train_loss": -38.86225891113281, "global_step": 99686, "epoch": 823} {"train_loss": -38.29884719848633, "global_step": 99687, "epoch": 823} {"train_loss": -38.669281005859375, "global_step": 99688, "epoch": 823} {"train_loss": -38.66898727416992, "global_step": 99689, "epoch": 823} {"train_loss": -38.85825729370117, "global_step": 99690, "epoch": 823} {"train_loss": -38.9134407043457, "global_step": 99691, "epoch": 823} {"train_loss": -38.69688034057617, "global_step": 99692, "epoch": 823} {"train_loss": -38.64323043823242, "global_step": 99693, "epoch": 823} {"train_loss": -39.32368087768555, "global_step": 99694, "epoch": 823} {"train_loss": -38.869850158691406, "global_step": 99695, "epoch": 823} {"train_loss": -39.06471633911133, "global_step": 99696, "epoch": 823} {"train_loss": -39.35223388671875, "global_step": 99697, "epoch": 823} {"train_loss": -39.10985565185547, "global_step": 99698, "epoch": 823} {"train_loss": -38.91083908081055, "global_step": 99699, "epoch": 823} {"train_loss": -38.47477340698242, "global_step": 99700, "epoch": 823} {"train_loss": -38.71411895751953, "global_step": 99701, "epoch": 823} {"train_loss": -39.07518005371094, "global_step": 99702, "epoch": 823} {"train_loss": -38.245358396167596, "global_step": 99703, "epoch": 823, "val_loss": 2654996.0} {"train_loss": -39.18893051147461, "global_step": 99704, "epoch": 824} {"train_loss": -38.82218551635742, "global_step": 99705, "epoch": 824} {"train_loss": -38.56000900268555, "global_step": 99706, "epoch": 824} {"train_loss": -37.74541473388672, "global_step": 99707, "epoch": 824} {"train_loss": -38.38022232055664, "global_step": 99708, "epoch": 824} {"train_loss": -39.48443603515625, "global_step": 99709, "epoch": 824} {"train_loss": -39.405006408691406, "global_step": 99710, "epoch": 824} {"train_loss": -39.47842025756836, "global_step": 99711, "epoch": 824} {"train_loss": -39.441585540771484, "global_step": 99712, "epoch": 824} {"train_loss": -39.70397186279297, "global_step": 99713, "epoch": 824} {"train_loss": -39.60493850708008, "global_step": 99714, "epoch": 824} {"train_loss": -39.59379196166992, "global_step": 99715, "epoch": 824} {"train_loss": -38.9604606628418, "global_step": 99716, "epoch": 824} {"train_loss": -39.468902587890625, "global_step": 99717, "epoch": 824} {"train_loss": -39.83106231689453, "global_step": 99718, "epoch": 824} {"train_loss": -39.6044807434082, "global_step": 99719, "epoch": 824} {"train_loss": -38.80512619018555, "global_step": 99720, "epoch": 824} {"train_loss": -39.11198806762695, "global_step": 99721, "epoch": 824} {"train_loss": -38.35854721069336, "global_step": 99722, "epoch": 824} {"train_loss": -38.44453811645508, "global_step": 99723, "epoch": 824} {"train_loss": -39.13074493408203, "global_step": 99724, "epoch": 824} {"train_loss": -39.4622688293457, "global_step": 99725, "epoch": 824} {"train_loss": -38.37601852416992, "global_step": 99726, "epoch": 824} {"train_loss": -38.38904571533203, "global_step": 99727, "epoch": 824} {"train_loss": -38.42621612548828, "global_step": 99728, "epoch": 824} {"train_loss": -39.52983856201172, "global_step": 99729, "epoch": 824} {"train_loss": -39.374481201171875, "global_step": 99730, "epoch": 824} {"train_loss": -38.476314544677734, "global_step": 99731, "epoch": 824} {"train_loss": -37.30961990356445, "global_step": 99732, "epoch": 824} {"train_loss": -39.21343994140625, "global_step": 99733, "epoch": 824} {"train_loss": -39.37974548339844, "global_step": 99734, "epoch": 824} {"train_loss": -38.36165237426758, "global_step": 99735, "epoch": 824} {"train_loss": -38.04949188232422, "global_step": 99736, "epoch": 824} {"train_loss": -38.6402587890625, "global_step": 99737, "epoch": 824} {"train_loss": -39.32270050048828, "global_step": 99738, "epoch": 824} {"train_loss": -39.613563537597656, "global_step": 99739, "epoch": 824} {"train_loss": -38.67253112792969, "global_step": 99740, "epoch": 824} {"train_loss": -39.25874710083008, "global_step": 99741, "epoch": 824} {"train_loss": -39.04997634887695, "global_step": 99742, "epoch": 824} {"train_loss": -39.903953552246094, "global_step": 99743, "epoch": 824} {"train_loss": -39.83024978637695, "global_step": 99744, "epoch": 824} {"train_loss": -39.0778923034668, "global_step": 99745, "epoch": 824} {"train_loss": -36.31700897216797, "global_step": 99746, "epoch": 824} {"train_loss": -37.671138763427734, "global_step": 99747, "epoch": 824} {"train_loss": -39.48824691772461, "global_step": 99748, "epoch": 824} {"train_loss": -39.76007843017578, "global_step": 99749, "epoch": 824} {"train_loss": -38.49956130981445, "global_step": 99750, "epoch": 824} {"train_loss": -34.971893310546875, "global_step": 99751, "epoch": 824} {"train_loss": -37.76449203491211, "global_step": 99752, "epoch": 824} {"train_loss": -39.778587341308594, "global_step": 99753, "epoch": 824} {"train_loss": -39.360042572021484, "global_step": 99754, "epoch": 824} {"train_loss": -38.91556167602539, "global_step": 99755, "epoch": 824} {"train_loss": -37.60893630981445, "global_step": 99756, "epoch": 824} {"train_loss": -39.17530059814453, "global_step": 99757, "epoch": 824} {"train_loss": -38.75539779663086, "global_step": 99758, "epoch": 824} {"train_loss": -37.74848175048828, "global_step": 99759, "epoch": 824} {"train_loss": -37.26421356201172, "global_step": 99760, "epoch": 824} {"train_loss": -38.44375228881836, "global_step": 99761, "epoch": 824} {"train_loss": -38.60325241088867, "global_step": 99762, "epoch": 824} {"train_loss": -37.83222198486328, "global_step": 99763, "epoch": 824} {"train_loss": -38.3393440246582, "global_step": 99764, "epoch": 824} {"train_loss": -35.76359176635742, "global_step": 99765, "epoch": 824} {"train_loss": -38.80685043334961, "global_step": 99766, "epoch": 824} {"train_loss": -38.22329330444336, "global_step": 99767, "epoch": 824} {"train_loss": -35.205848693847656, "global_step": 99768, "epoch": 824} {"train_loss": -39.455238342285156, "global_step": 99769, "epoch": 824} {"train_loss": -36.44935989379883, "global_step": 99770, "epoch": 824} {"train_loss": -36.91548156738281, "global_step": 99771, "epoch": 824} {"train_loss": -39.27557373046875, "global_step": 99772, "epoch": 824} {"train_loss": -36.5114631652832, "global_step": 99773, "epoch": 824} {"train_loss": -39.13285827636719, "global_step": 99774, "epoch": 824} {"train_loss": -37.867523193359375, "global_step": 99775, "epoch": 824} {"train_loss": -37.97177505493164, "global_step": 99776, "epoch": 824} {"train_loss": -37.74915313720703, "global_step": 99777, "epoch": 824} {"train_loss": -38.60762023925781, "global_step": 99778, "epoch": 824} {"train_loss": -37.4146614074707, "global_step": 99779, "epoch": 824} {"train_loss": -38.37058639526367, "global_step": 99780, "epoch": 824} {"train_loss": -38.22801971435547, "global_step": 99781, "epoch": 824} {"train_loss": -37.41126251220703, "global_step": 99782, "epoch": 824} {"train_loss": -38.86842727661133, "global_step": 99783, "epoch": 824} {"train_loss": -38.30080795288086, "global_step": 99784, "epoch": 824} {"train_loss": -37.84175491333008, "global_step": 99785, "epoch": 824} {"train_loss": -38.18046951293945, "global_step": 99786, "epoch": 824} {"train_loss": -38.68107223510742, "global_step": 99787, "epoch": 824} {"train_loss": -38.26937484741211, "global_step": 99788, "epoch": 824} {"train_loss": -38.7956428527832, "global_step": 99789, "epoch": 824} {"train_loss": -38.650672912597656, "global_step": 99790, "epoch": 824} {"train_loss": -38.93561935424805, "global_step": 99791, "epoch": 824} {"train_loss": -39.23720932006836, "global_step": 99792, "epoch": 824} {"train_loss": -38.281986236572266, "global_step": 99793, "epoch": 824} {"train_loss": -38.795955657958984, "global_step": 99794, "epoch": 824} {"train_loss": -38.90436553955078, "global_step": 99795, "epoch": 824} {"train_loss": -37.89874267578125, "global_step": 99796, "epoch": 824} {"train_loss": -38.181697845458984, "global_step": 99797, "epoch": 824} {"train_loss": -36.5625, "global_step": 99798, "epoch": 824} {"train_loss": -38.35014724731445, "global_step": 99799, "epoch": 824} {"train_loss": -38.122127532958984, "global_step": 99800, "epoch": 824} {"train_loss": -37.99970245361328, "global_step": 99801, "epoch": 824} {"train_loss": -37.253387451171875, "global_step": 99802, "epoch": 824} {"train_loss": -38.871864318847656, "global_step": 99803, "epoch": 824} {"train_loss": -36.96452713012695, "global_step": 99804, "epoch": 824} {"train_loss": -37.22897720336914, "global_step": 99805, "epoch": 824} {"train_loss": -36.81266403198242, "global_step": 99806, "epoch": 824} {"train_loss": -37.93442916870117, "global_step": 99807, "epoch": 824} {"train_loss": -37.98445510864258, "global_step": 99808, "epoch": 824} {"train_loss": -37.16619873046875, "global_step": 99809, "epoch": 824} {"train_loss": -38.5844612121582, "global_step": 99810, "epoch": 824} {"train_loss": -38.16627502441406, "global_step": 99811, "epoch": 824} {"train_loss": -37.870880126953125, "global_step": 99812, "epoch": 824} {"train_loss": -37.87223815917969, "global_step": 99813, "epoch": 824} {"train_loss": -37.6900520324707, "global_step": 99814, "epoch": 824} {"train_loss": -37.7000732421875, "global_step": 99815, "epoch": 824} {"train_loss": -37.834327697753906, "global_step": 99816, "epoch": 824} {"train_loss": -38.49794387817383, "global_step": 99817, "epoch": 824} {"train_loss": -38.01455307006836, "global_step": 99818, "epoch": 824} {"train_loss": -37.88683319091797, "global_step": 99819, "epoch": 824} {"train_loss": -38.3857536315918, "global_step": 99820, "epoch": 824} {"train_loss": -38.54426956176758, "global_step": 99821, "epoch": 824} {"train_loss": -37.709381103515625, "global_step": 99822, "epoch": 824} {"train_loss": -38.461273193359375, "global_step": 99823, "epoch": 824} {"train_loss": -38.386682053242836, "global_step": 99824, "epoch": 824, "val_loss": 2584869.25} {"train_loss": -38.920406341552734, "global_step": 99825, "epoch": 825} {"train_loss": -38.34382247924805, "global_step": 99826, "epoch": 825} {"train_loss": -37.97517395019531, "global_step": 99827, "epoch": 825} {"train_loss": -38.91846466064453, "global_step": 99828, "epoch": 825} {"train_loss": -38.99210739135742, "global_step": 99829, "epoch": 825} {"train_loss": -38.220611572265625, "global_step": 99830, "epoch": 825} {"train_loss": -39.32664108276367, "global_step": 99831, "epoch": 825} {"train_loss": -38.110652923583984, "global_step": 99832, "epoch": 825} {"train_loss": -39.36092758178711, "global_step": 99833, "epoch": 825} {"train_loss": -39.12641525268555, "global_step": 99834, "epoch": 825} {"train_loss": -39.38283157348633, "global_step": 99835, "epoch": 825} {"train_loss": -38.30823516845703, "global_step": 99836, "epoch": 825} {"train_loss": -37.97713851928711, "global_step": 99837, "epoch": 825} {"train_loss": -39.05195236206055, "global_step": 99838, "epoch": 825} {"train_loss": -38.86066818237305, "global_step": 99839, "epoch": 825} {"train_loss": -36.997169494628906, "global_step": 99840, "epoch": 825} {"train_loss": -36.230812072753906, "global_step": 99841, "epoch": 825} {"train_loss": -38.67251205444336, "global_step": 99842, "epoch": 825} {"train_loss": -39.22715377807617, "global_step": 99843, "epoch": 825} {"train_loss": -38.210506439208984, "global_step": 99844, "epoch": 825} {"train_loss": -38.092647552490234, "global_step": 99845, "epoch": 825} {"train_loss": -39.21235275268555, "global_step": 99846, "epoch": 825} {"train_loss": -39.35309600830078, "global_step": 99847, "epoch": 825} {"train_loss": -38.523990631103516, "global_step": 99848, "epoch": 825} {"train_loss": -39.15625, "global_step": 99849, "epoch": 825} {"train_loss": -38.75773239135742, "global_step": 99850, "epoch": 825} {"train_loss": -38.04659652709961, "global_step": 99851, "epoch": 825} {"train_loss": -38.153987884521484, "global_step": 99852, "epoch": 825} {"train_loss": -39.421043395996094, "global_step": 99853, "epoch": 825} {"train_loss": -38.80302047729492, "global_step": 99854, "epoch": 825} {"train_loss": -37.85787582397461, "global_step": 99855, "epoch": 825} {"train_loss": -38.46260070800781, "global_step": 99856, "epoch": 825} {"train_loss": -39.41398239135742, "global_step": 99857, "epoch": 825} {"train_loss": -38.46771240234375, "global_step": 99858, "epoch": 825} {"train_loss": -39.7053337097168, "global_step": 99859, "epoch": 825} {"train_loss": -38.95191955566406, "global_step": 99860, "epoch": 825} {"train_loss": -38.40079879760742, "global_step": 99861, "epoch": 825} {"train_loss": -39.331939697265625, "global_step": 99862, "epoch": 825} {"train_loss": -38.913238525390625, "global_step": 99863, "epoch": 825} {"train_loss": -38.667640686035156, "global_step": 99864, "epoch": 825} {"train_loss": -39.5592155456543, "global_step": 99865, "epoch": 825} {"train_loss": -38.6968879699707, "global_step": 99866, "epoch": 825} {"train_loss": -37.120941162109375, "global_step": 99867, "epoch": 825} {"train_loss": -38.73734664916992, "global_step": 99868, "epoch": 825} {"train_loss": -39.102928161621094, "global_step": 99869, "epoch": 825} {"train_loss": -37.271095275878906, "global_step": 99870, "epoch": 825} {"train_loss": -36.81097412109375, "global_step": 99871, "epoch": 825} {"train_loss": -35.533748626708984, "global_step": 99872, "epoch": 825} {"train_loss": -36.09735107421875, "global_step": 99873, "epoch": 825} {"train_loss": -39.512210845947266, "global_step": 99874, "epoch": 825} {"train_loss": -38.20766067504883, "global_step": 99875, "epoch": 825} {"train_loss": -36.78120803833008, "global_step": 99876, "epoch": 825} {"train_loss": -38.082210540771484, "global_step": 99877, "epoch": 825} {"train_loss": -37.96190643310547, "global_step": 99878, "epoch": 825} {"train_loss": -38.27659606933594, "global_step": 99879, "epoch": 825} {"train_loss": -38.427425384521484, "global_step": 99880, "epoch": 825} {"train_loss": -37.87538528442383, "global_step": 99881, "epoch": 825} {"train_loss": -38.945648193359375, "global_step": 99882, "epoch": 825} {"train_loss": -38.850494384765625, "global_step": 99883, "epoch": 825} {"train_loss": -38.76381301879883, "global_step": 99884, "epoch": 825} {"train_loss": -39.26553726196289, "global_step": 99885, "epoch": 825} {"train_loss": -39.22188949584961, "global_step": 99886, "epoch": 825} {"train_loss": -38.27861022949219, "global_step": 99887, "epoch": 825} {"train_loss": -38.582191467285156, "global_step": 99888, "epoch": 825} {"train_loss": -39.31536865234375, "global_step": 99889, "epoch": 825} {"train_loss": -38.91333770751953, "global_step": 99890, "epoch": 825} {"train_loss": -38.29209899902344, "global_step": 99891, "epoch": 825} {"train_loss": -39.36954879760742, "global_step": 99892, "epoch": 825} {"train_loss": -39.159358978271484, "global_step": 99893, "epoch": 825} {"train_loss": -37.669795989990234, "global_step": 99894, "epoch": 825} {"train_loss": -39.29029846191406, "global_step": 99895, "epoch": 825} {"train_loss": -38.24907684326172, "global_step": 99896, "epoch": 825} {"train_loss": -37.368953704833984, "global_step": 99897, "epoch": 825} {"train_loss": -37.498836517333984, "global_step": 99898, "epoch": 825} {"train_loss": -38.98335647583008, "global_step": 99899, "epoch": 825} {"train_loss": -38.23417663574219, "global_step": 99900, "epoch": 825} {"train_loss": -36.56989288330078, "global_step": 99901, "epoch": 825} {"train_loss": -38.4962158203125, "global_step": 99902, "epoch": 825} {"train_loss": -37.81654357910156, "global_step": 99903, "epoch": 825} {"train_loss": -38.18726348876953, "global_step": 99904, "epoch": 825} {"train_loss": -38.217247009277344, "global_step": 99905, "epoch": 825} {"train_loss": -39.064056396484375, "global_step": 99906, "epoch": 825} {"train_loss": -38.20693588256836, "global_step": 99907, "epoch": 825} {"train_loss": -38.94143295288086, "global_step": 99908, "epoch": 825} {"train_loss": -38.539493560791016, "global_step": 99909, "epoch": 825} {"train_loss": -38.38377380371094, "global_step": 99910, "epoch": 825} {"train_loss": -39.01118469238281, "global_step": 99911, "epoch": 825} {"train_loss": -39.039791107177734, "global_step": 99912, "epoch": 825} {"train_loss": -38.54940414428711, "global_step": 99913, "epoch": 825} {"train_loss": -39.131134033203125, "global_step": 99914, "epoch": 825} {"train_loss": -38.94674301147461, "global_step": 99915, "epoch": 825} {"train_loss": -39.1458740234375, "global_step": 99916, "epoch": 825} {"train_loss": -39.066219329833984, "global_step": 99917, "epoch": 825} {"train_loss": -39.44960021972656, "global_step": 99918, "epoch": 825} {"train_loss": -39.83626174926758, "global_step": 99919, "epoch": 825} {"train_loss": -39.75679397583008, "global_step": 99920, "epoch": 825} {"train_loss": -38.646175384521484, "global_step": 99921, "epoch": 825} {"train_loss": -39.38507080078125, "global_step": 99922, "epoch": 825} {"train_loss": -39.605125427246094, "global_step": 99923, "epoch": 825} {"train_loss": -39.206626892089844, "global_step": 99924, "epoch": 825} {"train_loss": -39.63783645629883, "global_step": 99925, "epoch": 825} {"train_loss": -39.242431640625, "global_step": 99926, "epoch": 825} {"train_loss": -39.78605270385742, "global_step": 99927, "epoch": 825} {"train_loss": -39.369598388671875, "global_step": 99928, "epoch": 825} {"train_loss": -39.26970291137695, "global_step": 99929, "epoch": 825} {"train_loss": -39.7129020690918, "global_step": 99930, "epoch": 825} {"train_loss": -39.75901412963867, "global_step": 99931, "epoch": 825} {"train_loss": -38.90690612792969, "global_step": 99932, "epoch": 825} {"train_loss": -38.95832061767578, "global_step": 99933, "epoch": 825} {"train_loss": -38.255775451660156, "global_step": 99934, "epoch": 825} {"train_loss": -39.40143585205078, "global_step": 99935, "epoch": 825} {"train_loss": -39.70559310913086, "global_step": 99936, "epoch": 825} {"train_loss": -39.49976348876953, "global_step": 99937, "epoch": 825} {"train_loss": -39.4854850769043, "global_step": 99938, "epoch": 825} {"train_loss": -39.551353454589844, "global_step": 99939, "epoch": 825} {"train_loss": -38.58729934692383, "global_step": 99940, "epoch": 825} {"train_loss": -38.93595504760742, "global_step": 99941, "epoch": 825} {"train_loss": -39.825416564941406, "global_step": 99942, "epoch": 825} {"train_loss": -38.72001647949219, "global_step": 99943, "epoch": 825} {"train_loss": -38.87370681762695, "global_step": 99944, "epoch": 825} {"train_loss": -38.67660295470687, "global_step": 99945, "epoch": 825, "val_loss": 2624231.25} {"train_loss": -39.34092330932617, "global_step": 99946, "epoch": 826} {"train_loss": -39.5722770690918, "global_step": 99947, "epoch": 826} {"train_loss": -39.417781829833984, "global_step": 99948, "epoch": 826} {"train_loss": -38.92939758300781, "global_step": 99949, "epoch": 826} {"train_loss": -38.65738296508789, "global_step": 99950, "epoch": 826} {"train_loss": -38.93282699584961, "global_step": 99951, "epoch": 826} {"train_loss": -38.7899284362793, "global_step": 99952, "epoch": 826} {"train_loss": -38.25444412231445, "global_step": 99953, "epoch": 826} {"train_loss": -39.24231719970703, "global_step": 99954, "epoch": 826} {"train_loss": -38.966529846191406, "global_step": 99955, "epoch": 826} {"train_loss": -38.985408782958984, "global_step": 99956, "epoch": 826} {"train_loss": -38.70967102050781, "global_step": 99957, "epoch": 826} {"train_loss": -39.04541015625, "global_step": 99958, "epoch": 826} {"train_loss": -39.24560546875, "global_step": 99959, "epoch": 826} {"train_loss": -39.06808090209961, "global_step": 99960, "epoch": 826} {"train_loss": -39.343055725097656, "global_step": 99961, "epoch": 826} {"train_loss": -38.24460983276367, "global_step": 99962, "epoch": 826} {"train_loss": -39.194313049316406, "global_step": 99963, "epoch": 826} {"train_loss": -39.08559036254883, "global_step": 99964, "epoch": 826} {"train_loss": -39.12124252319336, "global_step": 99965, "epoch": 826} {"train_loss": -39.55373001098633, "global_step": 99966, "epoch": 826} {"train_loss": -38.35249328613281, "global_step": 99967, "epoch": 826} {"train_loss": -39.245174407958984, "global_step": 99968, "epoch": 826} {"train_loss": -38.83723831176758, "global_step": 99969, "epoch": 826} {"train_loss": -39.3272705078125, "global_step": 99970, "epoch": 826} {"train_loss": -39.73472213745117, "global_step": 99971, "epoch": 826} {"train_loss": -39.15224075317383, "global_step": 99972, "epoch": 826} {"train_loss": -39.925323486328125, "global_step": 99973, "epoch": 826} {"train_loss": -39.92362594604492, "global_step": 99974, "epoch": 826} {"train_loss": -39.383209228515625, "global_step": 99975, "epoch": 826} {"train_loss": -39.18637466430664, "global_step": 99976, "epoch": 826} {"train_loss": -39.21456527709961, "global_step": 99977, "epoch": 826} {"train_loss": -39.30792999267578, "global_step": 99978, "epoch": 826} {"train_loss": -39.61369705200195, "global_step": 99979, "epoch": 826} {"train_loss": -39.96842575073242, "global_step": 99980, "epoch": 826} {"train_loss": -39.57673263549805, "global_step": 99981, "epoch": 826} {"train_loss": -39.28414535522461, "global_step": 99982, "epoch": 826} {"train_loss": -39.75204849243164, "global_step": 99983, "epoch": 826} {"train_loss": -39.421661376953125, "global_step": 99984, "epoch": 826} {"train_loss": -39.82848358154297, "global_step": 99985, "epoch": 826} {"train_loss": -39.283172607421875, "global_step": 99986, "epoch": 826} {"train_loss": -39.31376266479492, "global_step": 99987, "epoch": 826} {"train_loss": -39.113033294677734, "global_step": 99988, "epoch": 826} {"train_loss": -40.165611267089844, "global_step": 99989, "epoch": 826} {"train_loss": -39.70681381225586, "global_step": 99990, "epoch": 826} {"train_loss": -39.57658767700195, "global_step": 99991, "epoch": 826} {"train_loss": -39.41291427612305, "global_step": 99992, "epoch": 826} {"train_loss": -39.845516204833984, "global_step": 99993, "epoch": 826} {"train_loss": -39.652862548828125, "global_step": 99994, "epoch": 826} {"train_loss": -39.338748931884766, "global_step": 99995, "epoch": 826} {"train_loss": -37.66950988769531, "global_step": 99996, "epoch": 826} {"train_loss": -34.235313415527344, "global_step": 99997, "epoch": 826} {"train_loss": -36.8411979675293, "global_step": 99998, "epoch": 826} {"train_loss": -37.516536712646484, "global_step": 99999, "epoch": 826} {"train_loss": -37.542476654052734, "global_step": 100000, "epoch": 826} {"train_loss": -37.890132904052734, "global_step": 100001, "epoch": 826} {"train_loss": -38.18738555908203, "global_step": 100002, "epoch": 826} {"train_loss": -36.762855529785156, "global_step": 100003, "epoch": 826} {"train_loss": -36.45579528808594, "global_step": 100004, "epoch": 826} {"train_loss": -38.13252639770508, "global_step": 100005, "epoch": 826} {"train_loss": -39.704803466796875, "global_step": 100006, "epoch": 826} {"train_loss": -38.33478927612305, "global_step": 100007, "epoch": 826} {"train_loss": -36.63947677612305, "global_step": 100008, "epoch": 826} {"train_loss": -37.933929443359375, "global_step": 100009, "epoch": 826} {"train_loss": -38.43108367919922, "global_step": 100010, "epoch": 826} {"train_loss": -38.286865234375, "global_step": 100011, "epoch": 826} {"train_loss": -37.480751037597656, "global_step": 100012, "epoch": 826} {"train_loss": -38.4814338684082, "global_step": 100013, "epoch": 826} {"train_loss": -39.14362335205078, "global_step": 100014, "epoch": 826} {"train_loss": -37.97028732299805, "global_step": 100015, "epoch": 826} {"train_loss": -38.590065002441406, "global_step": 100016, "epoch": 826} {"train_loss": -39.01845932006836, "global_step": 100017, "epoch": 826} {"train_loss": -38.85148239135742, "global_step": 100018, "epoch": 826} {"train_loss": -38.99995040893555, "global_step": 100019, "epoch": 826} {"train_loss": -38.78160095214844, "global_step": 100020, "epoch": 826} {"train_loss": -38.88356399536133, "global_step": 100021, "epoch": 826} {"train_loss": -39.48927688598633, "global_step": 100022, "epoch": 826} {"train_loss": -38.625465393066406, "global_step": 100023, "epoch": 826} {"train_loss": -39.12689971923828, "global_step": 100024, "epoch": 826} {"train_loss": -39.816078186035156, "global_step": 100025, "epoch": 826} {"train_loss": -38.075801849365234, "global_step": 100026, "epoch": 826} {"train_loss": -38.27574157714844, "global_step": 100027, "epoch": 826} {"train_loss": -37.516136169433594, "global_step": 100028, "epoch": 826} {"train_loss": -38.13943099975586, "global_step": 100029, "epoch": 826} {"train_loss": -39.556209564208984, "global_step": 100030, "epoch": 826} {"train_loss": -37.66838455200195, "global_step": 100031, "epoch": 826} {"train_loss": -36.70685958862305, "global_step": 100032, "epoch": 826} {"train_loss": -38.21150588989258, "global_step": 100033, "epoch": 826} {"train_loss": -38.66566848754883, "global_step": 100034, "epoch": 826} {"train_loss": -39.128211975097656, "global_step": 100035, "epoch": 826} {"train_loss": -37.2301139831543, "global_step": 100036, "epoch": 826} {"train_loss": -38.142364501953125, "global_step": 100037, "epoch": 826} {"train_loss": -39.319698333740234, "global_step": 100038, "epoch": 826} {"train_loss": -38.6771240234375, "global_step": 100039, "epoch": 826} {"train_loss": -36.58099365234375, "global_step": 100040, "epoch": 826} {"train_loss": -38.54336166381836, "global_step": 100041, "epoch": 826} {"train_loss": -37.19031524658203, "global_step": 100042, "epoch": 826} {"train_loss": -37.924495697021484, "global_step": 100043, "epoch": 826} {"train_loss": -37.72260665893555, "global_step": 100044, "epoch": 826} {"train_loss": -38.86825180053711, "global_step": 100045, "epoch": 826} {"train_loss": -37.26253128051758, "global_step": 100046, "epoch": 826} {"train_loss": -37.204036712646484, "global_step": 100047, "epoch": 826} {"train_loss": -39.1049919128418, "global_step": 100048, "epoch": 826} {"train_loss": -36.51103210449219, "global_step": 100049, "epoch": 826} {"train_loss": -38.0699348449707, "global_step": 100050, "epoch": 826} {"train_loss": -37.6998176574707, "global_step": 100051, "epoch": 826} {"train_loss": -38.20355987548828, "global_step": 100052, "epoch": 826} {"train_loss": -37.63197708129883, "global_step": 100053, "epoch": 826} {"train_loss": -37.89201736450195, "global_step": 100054, "epoch": 826} {"train_loss": -37.53805160522461, "global_step": 100055, "epoch": 826} {"train_loss": -38.48618698120117, "global_step": 100056, "epoch": 826} {"train_loss": -36.148460388183594, "global_step": 100057, "epoch": 826} {"train_loss": -38.70387649536133, "global_step": 100058, "epoch": 826} {"train_loss": -37.33649444580078, "global_step": 100059, "epoch": 826} {"train_loss": -38.5228157043457, "global_step": 100060, "epoch": 826} {"train_loss": -38.157039642333984, "global_step": 100061, "epoch": 826} {"train_loss": -38.570350646972656, "global_step": 100062, "epoch": 826} {"train_loss": -38.840877532958984, "global_step": 100063, "epoch": 826} {"train_loss": -38.45180892944336, "global_step": 100064, "epoch": 826} {"train_loss": -39.12614440917969, "global_step": 100065, "epoch": 826} {"train_loss": -38.581224236606566, "global_step": 100066, "epoch": 826, "val_loss": 2598919.5} {"train_loss": -38.80515670776367, "global_step": 100067, "epoch": 827} {"train_loss": -38.307945251464844, "global_step": 100068, "epoch": 827} {"train_loss": -38.602725982666016, "global_step": 100069, "epoch": 827} {"train_loss": -39.184322357177734, "global_step": 100070, "epoch": 827} {"train_loss": -39.214088439941406, "global_step": 100071, "epoch": 827} {"train_loss": -38.3889045715332, "global_step": 100072, "epoch": 827} {"train_loss": -38.71612548828125, "global_step": 100073, "epoch": 827} {"train_loss": -39.456233978271484, "global_step": 100074, "epoch": 827} {"train_loss": -38.17964172363281, "global_step": 100075, "epoch": 827} {"train_loss": -37.85732650756836, "global_step": 100076, "epoch": 827} {"train_loss": -37.7520751953125, "global_step": 100077, "epoch": 827} {"train_loss": -38.78181076049805, "global_step": 100078, "epoch": 827} {"train_loss": -39.13332748413086, "global_step": 100079, "epoch": 827} {"train_loss": -39.24773406982422, "global_step": 100080, "epoch": 827} {"train_loss": -38.397342681884766, "global_step": 100081, "epoch": 827} {"train_loss": -38.322235107421875, "global_step": 100082, "epoch": 827} {"train_loss": -39.4030647277832, "global_step": 100083, "epoch": 827} {"train_loss": -39.2762336730957, "global_step": 100084, "epoch": 827} {"train_loss": -38.33627700805664, "global_step": 100085, "epoch": 827} {"train_loss": -37.9665412902832, "global_step": 100086, "epoch": 827} {"train_loss": -39.098304748535156, "global_step": 100087, "epoch": 827} {"train_loss": -39.3155632019043, "global_step": 100088, "epoch": 827} {"train_loss": -38.02708053588867, "global_step": 100089, "epoch": 827} {"train_loss": -39.44504928588867, "global_step": 100090, "epoch": 827} {"train_loss": -39.0371208190918, "global_step": 100091, "epoch": 827} {"train_loss": -37.5194091796875, "global_step": 100092, "epoch": 827} {"train_loss": -38.431495666503906, "global_step": 100093, "epoch": 827} {"train_loss": -39.32542037963867, "global_step": 100094, "epoch": 827} {"train_loss": -37.13701248168945, "global_step": 100095, "epoch": 827} {"train_loss": -37.380958557128906, "global_step": 100096, "epoch": 827} {"train_loss": -38.3360710144043, "global_step": 100097, "epoch": 827} {"train_loss": -35.72452926635742, "global_step": 100098, "epoch": 827} {"train_loss": -39.03567123413086, "global_step": 100099, "epoch": 827} {"train_loss": -37.63288497924805, "global_step": 100100, "epoch": 827} {"train_loss": -36.2442626953125, "global_step": 100101, "epoch": 827} {"train_loss": -38.93922805786133, "global_step": 100102, "epoch": 827} {"train_loss": -37.36939239501953, "global_step": 100103, "epoch": 827} {"train_loss": -38.332645416259766, "global_step": 100104, "epoch": 827} {"train_loss": -38.603553771972656, "global_step": 100105, "epoch": 827} {"train_loss": -38.27138900756836, "global_step": 100106, "epoch": 827} {"train_loss": -38.45479965209961, "global_step": 100107, "epoch": 827} {"train_loss": -38.38885498046875, "global_step": 100108, "epoch": 827} {"train_loss": -38.853492736816406, "global_step": 100109, "epoch": 827} {"train_loss": -38.952980041503906, "global_step": 100110, "epoch": 827} {"train_loss": -38.42311477661133, "global_step": 100111, "epoch": 827} {"train_loss": -39.08760452270508, "global_step": 100112, "epoch": 827} {"train_loss": -39.02375411987305, "global_step": 100113, "epoch": 827} {"train_loss": -39.080318450927734, "global_step": 100114, "epoch": 827} {"train_loss": -38.02033615112305, "global_step": 100115, "epoch": 827} {"train_loss": -38.44967269897461, "global_step": 100116, "epoch": 827} {"train_loss": -39.30733871459961, "global_step": 100117, "epoch": 827} {"train_loss": -39.23900604248047, "global_step": 100118, "epoch": 827} {"train_loss": -39.35991668701172, "global_step": 100119, "epoch": 827} {"train_loss": -39.142127990722656, "global_step": 100120, "epoch": 827} {"train_loss": -39.808563232421875, "global_step": 100121, "epoch": 827} {"train_loss": -39.288265228271484, "global_step": 100122, "epoch": 827} {"train_loss": -39.72433090209961, "global_step": 100123, "epoch": 827} {"train_loss": -39.74806594848633, "global_step": 100124, "epoch": 827} {"train_loss": -39.753761291503906, "global_step": 100125, "epoch": 827} {"train_loss": -40.021453857421875, "global_step": 100126, "epoch": 827} {"train_loss": -39.7726936340332, "global_step": 100127, "epoch": 827} {"train_loss": -39.26566696166992, "global_step": 100128, "epoch": 827} {"train_loss": -40.04533004760742, "global_step": 100129, "epoch": 827} {"train_loss": -39.73624801635742, "global_step": 100130, "epoch": 827} {"train_loss": -39.83238220214844, "global_step": 100131, "epoch": 827} {"train_loss": -40.0114860534668, "global_step": 100132, "epoch": 827} {"train_loss": -40.18244552612305, "global_step": 100133, "epoch": 827} {"train_loss": -40.05681228637695, "global_step": 100134, "epoch": 827} {"train_loss": -40.07615280151367, "global_step": 100135, "epoch": 827} {"train_loss": -40.41415023803711, "global_step": 100136, "epoch": 827} {"train_loss": -40.26920700073242, "global_step": 100137, "epoch": 827} {"train_loss": -40.2390022277832, "global_step": 100138, "epoch": 827} {"train_loss": -40.574859619140625, "global_step": 100139, "epoch": 827} {"train_loss": -40.17759704589844, "global_step": 100140, "epoch": 827} {"train_loss": -40.143882751464844, "global_step": 100141, "epoch": 827} {"train_loss": -40.52008819580078, "global_step": 100142, "epoch": 827} {"train_loss": -39.744503021240234, "global_step": 100143, "epoch": 827} {"train_loss": -40.19878005981445, "global_step": 100144, "epoch": 827} {"train_loss": -40.52035140991211, "global_step": 100145, "epoch": 827} {"train_loss": -39.77108383178711, "global_step": 100146, "epoch": 827} {"train_loss": -39.71238327026367, "global_step": 100147, "epoch": 827} {"train_loss": -40.19768142700195, "global_step": 100148, "epoch": 827} {"train_loss": -39.712310791015625, "global_step": 100149, "epoch": 827} {"train_loss": -39.61682891845703, "global_step": 100150, "epoch": 827} {"train_loss": -39.69735336303711, "global_step": 100151, "epoch": 827} {"train_loss": -39.900360107421875, "global_step": 100152, "epoch": 827} {"train_loss": -40.06366729736328, "global_step": 100153, "epoch": 827} {"train_loss": -39.85054397583008, "global_step": 100154, "epoch": 827} {"train_loss": -39.32782745361328, "global_step": 100155, "epoch": 827} {"train_loss": -39.67840576171875, "global_step": 100156, "epoch": 827} {"train_loss": -39.1759147644043, "global_step": 100157, "epoch": 827} {"train_loss": -39.39872360229492, "global_step": 100158, "epoch": 827} {"train_loss": -38.4141960144043, "global_step": 100159, "epoch": 827} {"train_loss": -36.49591064453125, "global_step": 100160, "epoch": 827} {"train_loss": -34.353267669677734, "global_step": 100161, "epoch": 827} {"train_loss": -37.785545349121094, "global_step": 100162, "epoch": 827} {"train_loss": -38.348228454589844, "global_step": 100163, "epoch": 827} {"train_loss": -36.426570892333984, "global_step": 100164, "epoch": 827} {"train_loss": -34.61479949951172, "global_step": 100165, "epoch": 827} {"train_loss": -36.842445373535156, "global_step": 100166, "epoch": 827} {"train_loss": -38.1118278503418, "global_step": 100167, "epoch": 827} {"train_loss": -35.86507797241211, "global_step": 100168, "epoch": 827} {"train_loss": -35.79144287109375, "global_step": 100169, "epoch": 827} {"train_loss": -37.8316764831543, "global_step": 100170, "epoch": 827} {"train_loss": -37.71643829345703, "global_step": 100171, "epoch": 827} {"train_loss": -33.18610763549805, "global_step": 100172, "epoch": 827} {"train_loss": -38.442832946777344, "global_step": 100173, "epoch": 827} {"train_loss": -32.739463806152344, "global_step": 100174, "epoch": 827} {"train_loss": -34.38493728637695, "global_step": 100175, "epoch": 827} {"train_loss": -34.257057189941406, "global_step": 100176, "epoch": 827} {"train_loss": -35.7641716003418, "global_step": 100177, "epoch": 827} {"train_loss": -38.26358413696289, "global_step": 100178, "epoch": 827} {"train_loss": -34.99430847167969, "global_step": 100179, "epoch": 827} {"train_loss": -34.92152404785156, "global_step": 100180, "epoch": 827} {"train_loss": -34.241432189941406, "global_step": 100181, "epoch": 827} {"train_loss": -32.68882751464844, "global_step": 100182, "epoch": 827} {"train_loss": -34.496944427490234, "global_step": 100183, "epoch": 827} {"train_loss": -31.3915958404541, "global_step": 100184, "epoch": 827} {"train_loss": -35.4618034362793, "global_step": 100185, "epoch": 827} {"train_loss": -34.53606414794922, "global_step": 100186, "epoch": 827} {"train_loss": -38.17424063249068, "global_step": 100187, "epoch": 827, "val_loss": 2694836.25} {"train_loss": -32.52928161621094, "global_step": 100188, "epoch": 828} {"train_loss": -32.70095443725586, "global_step": 100189, "epoch": 828} {"train_loss": -32.80908203125, "global_step": 100190, "epoch": 828} {"train_loss": -29.990774154663086, "global_step": 100191, "epoch": 828} {"train_loss": -33.47774124145508, "global_step": 100192, "epoch": 828} {"train_loss": -33.16634750366211, "global_step": 100193, "epoch": 828} {"train_loss": -35.77804946899414, "global_step": 100194, "epoch": 828} {"train_loss": -34.26153564453125, "global_step": 100195, "epoch": 828} {"train_loss": -34.0007209777832, "global_step": 100196, "epoch": 828} {"train_loss": -34.24647903442383, "global_step": 100197, "epoch": 828} {"train_loss": -32.362091064453125, "global_step": 100198, "epoch": 828} {"train_loss": -35.67329788208008, "global_step": 100199, "epoch": 828} {"train_loss": -36.36796188354492, "global_step": 100200, "epoch": 828} {"train_loss": -35.10972213745117, "global_step": 100201, "epoch": 828} {"train_loss": -36.2072639465332, "global_step": 100202, "epoch": 828} {"train_loss": -34.95630645751953, "global_step": 100203, "epoch": 828} {"train_loss": -33.699188232421875, "global_step": 100204, "epoch": 828} {"train_loss": -35.49677276611328, "global_step": 100205, "epoch": 828} {"train_loss": -36.26582336425781, "global_step": 100206, "epoch": 828} {"train_loss": -36.79560470581055, "global_step": 100207, "epoch": 828} {"train_loss": -35.9593620300293, "global_step": 100208, "epoch": 828} {"train_loss": -36.510589599609375, "global_step": 100209, "epoch": 828} {"train_loss": -35.9972038269043, "global_step": 100210, "epoch": 828} {"train_loss": -36.67647933959961, "global_step": 100211, "epoch": 828} {"train_loss": -36.6864128112793, "global_step": 100212, "epoch": 828} {"train_loss": -36.99628829956055, "global_step": 100213, "epoch": 828} {"train_loss": -37.43620681762695, "global_step": 100214, "epoch": 828} {"train_loss": -36.91889190673828, "global_step": 100215, "epoch": 828} {"train_loss": -37.4612922668457, "global_step": 100216, "epoch": 828} {"train_loss": -37.10085678100586, "global_step": 100217, "epoch": 828} {"train_loss": -37.442806243896484, "global_step": 100218, "epoch": 828} {"train_loss": -38.02328109741211, "global_step": 100219, "epoch": 828} {"train_loss": -34.836299896240234, "global_step": 100220, "epoch": 828} {"train_loss": -38.579410552978516, "global_step": 100221, "epoch": 828} {"train_loss": -36.98894119262695, "global_step": 100222, "epoch": 828} {"train_loss": -38.13125228881836, "global_step": 100223, "epoch": 828} {"train_loss": -37.75093078613281, "global_step": 100224, "epoch": 828} {"train_loss": -37.893287658691406, "global_step": 100225, "epoch": 828} {"train_loss": -38.57891082763672, "global_step": 100226, "epoch": 828} {"train_loss": -37.84238815307617, "global_step": 100227, "epoch": 828} {"train_loss": -37.689273834228516, "global_step": 100228, "epoch": 828} {"train_loss": -38.47233581542969, "global_step": 100229, "epoch": 828} {"train_loss": -37.53364944458008, "global_step": 100230, "epoch": 828} {"train_loss": -38.26808547973633, "global_step": 100231, "epoch": 828} {"train_loss": -37.83903121948242, "global_step": 100232, "epoch": 828} {"train_loss": -37.632442474365234, "global_step": 100233, "epoch": 828} {"train_loss": -38.058448791503906, "global_step": 100234, "epoch": 828} {"train_loss": -37.941402435302734, "global_step": 100235, "epoch": 828} {"train_loss": -37.78614807128906, "global_step": 100236, "epoch": 828} {"train_loss": -38.06717300415039, "global_step": 100237, "epoch": 828} {"train_loss": -38.681983947753906, "global_step": 100238, "epoch": 828} {"train_loss": -38.72406005859375, "global_step": 100239, "epoch": 828} {"train_loss": -38.22501754760742, "global_step": 100240, "epoch": 828} {"train_loss": -38.314029693603516, "global_step": 100241, "epoch": 828} {"train_loss": -38.693302154541016, "global_step": 100242, "epoch": 828} {"train_loss": -37.81368637084961, "global_step": 100243, "epoch": 828} {"train_loss": -38.68015670776367, "global_step": 100244, "epoch": 828} {"train_loss": -38.60346221923828, "global_step": 100245, "epoch": 828} {"train_loss": -38.96189498901367, "global_step": 100246, "epoch": 828} {"train_loss": -38.06977462768555, "global_step": 100247, "epoch": 828} {"train_loss": -38.71970748901367, "global_step": 100248, "epoch": 828} {"train_loss": -38.97614288330078, "global_step": 100249, "epoch": 828} {"train_loss": -38.686767578125, "global_step": 100250, "epoch": 828} {"train_loss": -38.38029098510742, "global_step": 100251, "epoch": 828} {"train_loss": -38.61250305175781, "global_step": 100252, "epoch": 828} {"train_loss": -38.56769943237305, "global_step": 100253, "epoch": 828} {"train_loss": -38.948116302490234, "global_step": 100254, "epoch": 828} {"train_loss": -37.61220169067383, "global_step": 100255, "epoch": 828} {"train_loss": -36.58549499511719, "global_step": 100256, "epoch": 828} {"train_loss": -38.3935432434082, "global_step": 100257, "epoch": 828} {"train_loss": -38.76935958862305, "global_step": 100258, "epoch": 828} {"train_loss": -38.86167526245117, "global_step": 100259, "epoch": 828} {"train_loss": -39.169185638427734, "global_step": 100260, "epoch": 828} {"train_loss": -38.9920654296875, "global_step": 100261, "epoch": 828} {"train_loss": -38.659210205078125, "global_step": 100262, "epoch": 828} {"train_loss": -38.937496185302734, "global_step": 100263, "epoch": 828} {"train_loss": -38.332305908203125, "global_step": 100264, "epoch": 828} {"train_loss": -37.656776428222656, "global_step": 100265, "epoch": 828} {"train_loss": -37.863311767578125, "global_step": 100266, "epoch": 828} {"train_loss": -38.4505729675293, "global_step": 100267, "epoch": 828} {"train_loss": -37.99326705932617, "global_step": 100268, "epoch": 828} {"train_loss": -36.33754348754883, "global_step": 100269, "epoch": 828} {"train_loss": -37.57963180541992, "global_step": 100270, "epoch": 828} {"train_loss": -36.95174789428711, "global_step": 100271, "epoch": 828} {"train_loss": -38.174285888671875, "global_step": 100272, "epoch": 828} {"train_loss": -38.283206939697266, "global_step": 100273, "epoch": 828} {"train_loss": -38.702632904052734, "global_step": 100274, "epoch": 828} {"train_loss": -37.45369338989258, "global_step": 100275, "epoch": 828} {"train_loss": -34.91474151611328, "global_step": 100276, "epoch": 828} {"train_loss": -35.816734313964844, "global_step": 100277, "epoch": 828} {"train_loss": -38.688812255859375, "global_step": 100278, "epoch": 828} {"train_loss": -38.9937744140625, "global_step": 100279, "epoch": 828} {"train_loss": -37.91346740722656, "global_step": 100280, "epoch": 828} {"train_loss": -37.9841423034668, "global_step": 100281, "epoch": 828} {"train_loss": -38.34657669067383, "global_step": 100282, "epoch": 828} {"train_loss": -37.48392868041992, "global_step": 100283, "epoch": 828} {"train_loss": -35.34073257446289, "global_step": 100284, "epoch": 828} {"train_loss": -37.07158279418945, "global_step": 100285, "epoch": 828} {"train_loss": -37.399784088134766, "global_step": 100286, "epoch": 828} {"train_loss": -38.72825622558594, "global_step": 100287, "epoch": 828} {"train_loss": -38.73804473876953, "global_step": 100288, "epoch": 828} {"train_loss": -38.2584228515625, "global_step": 100289, "epoch": 828} {"train_loss": -37.344905853271484, "global_step": 100290, "epoch": 828} {"train_loss": -36.119415283203125, "global_step": 100291, "epoch": 828} {"train_loss": -37.614234924316406, "global_step": 100292, "epoch": 828} {"train_loss": -38.42007064819336, "global_step": 100293, "epoch": 828} {"train_loss": -38.134483337402344, "global_step": 100294, "epoch": 828} {"train_loss": -38.185489654541016, "global_step": 100295, "epoch": 828} {"train_loss": -36.58191680908203, "global_step": 100296, "epoch": 828} {"train_loss": -38.500980377197266, "global_step": 100297, "epoch": 828} {"train_loss": -38.74343490600586, "global_step": 100298, "epoch": 828} {"train_loss": -38.67802810668945, "global_step": 100299, "epoch": 828} {"train_loss": -38.090118408203125, "global_step": 100300, "epoch": 828} {"train_loss": -37.6661262512207, "global_step": 100301, "epoch": 828} {"train_loss": -38.733150482177734, "global_step": 100302, "epoch": 828} {"train_loss": -37.02727508544922, "global_step": 100303, "epoch": 828} {"train_loss": -37.07851028442383, "global_step": 100304, "epoch": 828} {"train_loss": -38.88167953491211, "global_step": 100305, "epoch": 828} {"train_loss": -37.8287467956543, "global_step": 100306, "epoch": 828} {"train_loss": -37.56327819824219, "global_step": 100307, "epoch": 828} {"train_loss": -37.2737328868267, "global_step": 100308, "epoch": 828, "val_loss": 2581833.75} {"train_loss": -38.3245735168457, "global_step": 100309, "epoch": 829} {"train_loss": -37.874691009521484, "global_step": 100310, "epoch": 829} {"train_loss": -38.72587203979492, "global_step": 100311, "epoch": 829} {"train_loss": -35.842811584472656, "global_step": 100312, "epoch": 829} {"train_loss": -38.651668548583984, "global_step": 100313, "epoch": 829} {"train_loss": -38.296695709228516, "global_step": 100314, "epoch": 829} {"train_loss": -36.9294548034668, "global_step": 100315, "epoch": 829} {"train_loss": -38.60293197631836, "global_step": 100316, "epoch": 829} {"train_loss": -38.147117614746094, "global_step": 100317, "epoch": 829} {"train_loss": -37.82538986206055, "global_step": 100318, "epoch": 829} {"train_loss": -38.2373046875, "global_step": 100319, "epoch": 829} {"train_loss": -37.70508575439453, "global_step": 100320, "epoch": 829} {"train_loss": -38.704715728759766, "global_step": 100321, "epoch": 829} {"train_loss": -37.59011459350586, "global_step": 100322, "epoch": 829} {"train_loss": -38.31706619262695, "global_step": 100323, "epoch": 829} {"train_loss": -38.01642608642578, "global_step": 100324, "epoch": 829} {"train_loss": -37.45583724975586, "global_step": 100325, "epoch": 829} {"train_loss": -38.54906463623047, "global_step": 100326, "epoch": 829} {"train_loss": -38.83201217651367, "global_step": 100327, "epoch": 829} {"train_loss": -36.80570602416992, "global_step": 100328, "epoch": 829} {"train_loss": -37.60068893432617, "global_step": 100329, "epoch": 829} {"train_loss": -38.976131439208984, "global_step": 100330, "epoch": 829} {"train_loss": -36.86143112182617, "global_step": 100331, "epoch": 829} {"train_loss": -37.91840362548828, "global_step": 100332, "epoch": 829} {"train_loss": -38.36817169189453, "global_step": 100333, "epoch": 829} {"train_loss": -36.39712142944336, "global_step": 100334, "epoch": 829} {"train_loss": -38.04338836669922, "global_step": 100335, "epoch": 829} {"train_loss": -38.308807373046875, "global_step": 100336, "epoch": 829} {"train_loss": -37.49812698364258, "global_step": 100337, "epoch": 829} {"train_loss": -38.30935287475586, "global_step": 100338, "epoch": 829} {"train_loss": -37.355010986328125, "global_step": 100339, "epoch": 829} {"train_loss": -38.42661666870117, "global_step": 100340, "epoch": 829} {"train_loss": -37.450836181640625, "global_step": 100341, "epoch": 829} {"train_loss": -38.674591064453125, "global_step": 100342, "epoch": 829} {"train_loss": -38.11726379394531, "global_step": 100343, "epoch": 829} {"train_loss": -37.78957748413086, "global_step": 100344, "epoch": 829} {"train_loss": -39.00299072265625, "global_step": 100345, "epoch": 829} {"train_loss": -38.8231201171875, "global_step": 100346, "epoch": 829} {"train_loss": -38.801300048828125, "global_step": 100347, "epoch": 829} {"train_loss": -39.02287673950195, "global_step": 100348, "epoch": 829} {"train_loss": -38.55720901489258, "global_step": 100349, "epoch": 829} {"train_loss": -38.41477584838867, "global_step": 100350, "epoch": 829} {"train_loss": -38.91048812866211, "global_step": 100351, "epoch": 829} {"train_loss": -39.38813400268555, "global_step": 100352, "epoch": 829} {"train_loss": -39.38006591796875, "global_step": 100353, "epoch": 829} {"train_loss": -39.58670425415039, "global_step": 100354, "epoch": 829} {"train_loss": -38.724605560302734, "global_step": 100355, "epoch": 829} {"train_loss": -37.74058532714844, "global_step": 100356, "epoch": 829} {"train_loss": -36.152320861816406, "global_step": 100357, "epoch": 829} {"train_loss": -37.81447982788086, "global_step": 100358, "epoch": 829} {"train_loss": -37.43449020385742, "global_step": 100359, "epoch": 829} {"train_loss": -38.052154541015625, "global_step": 100360, "epoch": 829} {"train_loss": -38.5922737121582, "global_step": 100361, "epoch": 829} {"train_loss": -39.131893157958984, "global_step": 100362, "epoch": 829} {"train_loss": -38.68463134765625, "global_step": 100363, "epoch": 829} {"train_loss": -38.907325744628906, "global_step": 100364, "epoch": 829} {"train_loss": -37.973724365234375, "global_step": 100365, "epoch": 829} {"train_loss": -37.86640548706055, "global_step": 100366, "epoch": 829} {"train_loss": -37.28074264526367, "global_step": 100367, "epoch": 829} {"train_loss": -33.7767448425293, "global_step": 100368, "epoch": 829} {"train_loss": -38.870235443115234, "global_step": 100369, "epoch": 829} {"train_loss": -32.89347839355469, "global_step": 100370, "epoch": 829} {"train_loss": -37.99284744262695, "global_step": 100371, "epoch": 829} {"train_loss": -37.9570426940918, "global_step": 100372, "epoch": 829} {"train_loss": -34.3983039855957, "global_step": 100373, "epoch": 829} {"train_loss": -33.4848747253418, "global_step": 100374, "epoch": 829} {"train_loss": -36.618019104003906, "global_step": 100375, "epoch": 829} {"train_loss": -37.35500717163086, "global_step": 100376, "epoch": 829} {"train_loss": -35.67100143432617, "global_step": 100377, "epoch": 829} {"train_loss": -34.129005432128906, "global_step": 100378, "epoch": 829} {"train_loss": -35.98740768432617, "global_step": 100379, "epoch": 829} {"train_loss": -36.46429443359375, "global_step": 100380, "epoch": 829} {"train_loss": -35.1607551574707, "global_step": 100381, "epoch": 829} {"train_loss": -35.96406936645508, "global_step": 100382, "epoch": 829} {"train_loss": -36.94561767578125, "global_step": 100383, "epoch": 829} {"train_loss": -36.56904983520508, "global_step": 100384, "epoch": 829} {"train_loss": -37.30784225463867, "global_step": 100385, "epoch": 829} {"train_loss": -36.820106506347656, "global_step": 100386, "epoch": 829} {"train_loss": -38.22330856323242, "global_step": 100387, "epoch": 829} {"train_loss": -36.765777587890625, "global_step": 100388, "epoch": 829} {"train_loss": -38.351863861083984, "global_step": 100389, "epoch": 829} {"train_loss": -37.688011169433594, "global_step": 100390, "epoch": 829} {"train_loss": -38.28094482421875, "global_step": 100391, "epoch": 829} {"train_loss": -37.99530029296875, "global_step": 100392, "epoch": 829} {"train_loss": -38.75289535522461, "global_step": 100393, "epoch": 829} {"train_loss": -37.885292053222656, "global_step": 100394, "epoch": 829} {"train_loss": -38.77141189575195, "global_step": 100395, "epoch": 829} {"train_loss": -37.69402313232422, "global_step": 100396, "epoch": 829} {"train_loss": -38.689918518066406, "global_step": 100397, "epoch": 829} {"train_loss": -37.89818572998047, "global_step": 100398, "epoch": 829} {"train_loss": -38.560943603515625, "global_step": 100399, "epoch": 829} {"train_loss": -37.81303787231445, "global_step": 100400, "epoch": 829} {"train_loss": -38.94655990600586, "global_step": 100401, "epoch": 829} {"train_loss": -38.6284294128418, "global_step": 100402, "epoch": 829} {"train_loss": -38.57477951049805, "global_step": 100403, "epoch": 829} {"train_loss": -38.665618896484375, "global_step": 100404, "epoch": 829} {"train_loss": -38.49250411987305, "global_step": 100405, "epoch": 829} {"train_loss": -39.013633728027344, "global_step": 100406, "epoch": 829} {"train_loss": -38.41666793823242, "global_step": 100407, "epoch": 829} {"train_loss": -38.627410888671875, "global_step": 100408, "epoch": 829} {"train_loss": -38.96035385131836, "global_step": 100409, "epoch": 829} {"train_loss": -38.81117248535156, "global_step": 100410, "epoch": 829} {"train_loss": -38.96896743774414, "global_step": 100411, "epoch": 829} {"train_loss": -39.14425277709961, "global_step": 100412, "epoch": 829} {"train_loss": -39.229610443115234, "global_step": 100413, "epoch": 829} {"train_loss": -38.8051643371582, "global_step": 100414, "epoch": 829} {"train_loss": -39.1038703918457, "global_step": 100415, "epoch": 829} {"train_loss": -39.19814682006836, "global_step": 100416, "epoch": 829} {"train_loss": -39.180511474609375, "global_step": 100417, "epoch": 829} {"train_loss": -39.046119689941406, "global_step": 100418, "epoch": 829} {"train_loss": -39.182403564453125, "global_step": 100419, "epoch": 829} {"train_loss": -38.89300537109375, "global_step": 100420, "epoch": 829} {"train_loss": -39.059444427490234, "global_step": 100421, "epoch": 829} {"train_loss": -38.80173110961914, "global_step": 100422, "epoch": 829} {"train_loss": -39.47967529296875, "global_step": 100423, "epoch": 829} {"train_loss": -39.124732971191406, "global_step": 100424, "epoch": 829} {"train_loss": -38.54358673095703, "global_step": 100425, "epoch": 829} {"train_loss": -39.53672409057617, "global_step": 100426, "epoch": 829} {"train_loss": -39.0031623840332, "global_step": 100427, "epoch": 829} {"train_loss": -39.55903625488281, "global_step": 100428, "epoch": 829} {"train_loss": -38.001045889105676, "global_step": 100429, "epoch": 829, "val_loss": 2571852.25} {"train_loss": -39.511322021484375, "global_step": 100430, "epoch": 830} {"train_loss": -39.42673873901367, "global_step": 100431, "epoch": 830} {"train_loss": -39.048126220703125, "global_step": 100432, "epoch": 830} {"train_loss": -39.688262939453125, "global_step": 100433, "epoch": 830} {"train_loss": -39.23519515991211, "global_step": 100434, "epoch": 830} {"train_loss": -39.36444854736328, "global_step": 100435, "epoch": 830} {"train_loss": -39.45673370361328, "global_step": 100436, "epoch": 830} {"train_loss": -39.87177276611328, "global_step": 100437, "epoch": 830} {"train_loss": -39.718406677246094, "global_step": 100438, "epoch": 830} {"train_loss": -39.73458480834961, "global_step": 100439, "epoch": 830} {"train_loss": -40.114994049072266, "global_step": 100440, "epoch": 830} {"train_loss": -39.74751663208008, "global_step": 100441, "epoch": 830} {"train_loss": -39.9846305847168, "global_step": 100442, "epoch": 830} {"train_loss": -39.08283233642578, "global_step": 100443, "epoch": 830} {"train_loss": -37.31643295288086, "global_step": 100444, "epoch": 830} {"train_loss": -36.84235382080078, "global_step": 100445, "epoch": 830} {"train_loss": -39.29140090942383, "global_step": 100446, "epoch": 830} {"train_loss": -39.48601150512695, "global_step": 100447, "epoch": 830} {"train_loss": -36.155696868896484, "global_step": 100448, "epoch": 830} {"train_loss": -35.43647384643555, "global_step": 100449, "epoch": 830} {"train_loss": -37.205440521240234, "global_step": 100450, "epoch": 830} {"train_loss": -35.64390182495117, "global_step": 100451, "epoch": 830} {"train_loss": -38.10599899291992, "global_step": 100452, "epoch": 830} {"train_loss": -35.61200714111328, "global_step": 100453, "epoch": 830} {"train_loss": -38.40353012084961, "global_step": 100454, "epoch": 830} {"train_loss": -33.795955657958984, "global_step": 100455, "epoch": 830} {"train_loss": -37.99681091308594, "global_step": 100456, "epoch": 830} {"train_loss": -35.26089096069336, "global_step": 100457, "epoch": 830} {"train_loss": -38.33390426635742, "global_step": 100458, "epoch": 830} {"train_loss": -35.724952697753906, "global_step": 100459, "epoch": 830} {"train_loss": -37.21065902709961, "global_step": 100460, "epoch": 830} {"train_loss": -37.07853317260742, "global_step": 100461, "epoch": 830} {"train_loss": -37.958980560302734, "global_step": 100462, "epoch": 830} {"train_loss": -37.6074333190918, "global_step": 100463, "epoch": 830} {"train_loss": -36.23075485229492, "global_step": 100464, "epoch": 830} {"train_loss": -38.546321868896484, "global_step": 100465, "epoch": 830} {"train_loss": -38.0677375793457, "global_step": 100466, "epoch": 830} {"train_loss": -37.526363372802734, "global_step": 100467, "epoch": 830} {"train_loss": -38.267818450927734, "global_step": 100468, "epoch": 830} {"train_loss": -38.030059814453125, "global_step": 100469, "epoch": 830} {"train_loss": -39.14735794067383, "global_step": 100470, "epoch": 830} {"train_loss": -38.47534942626953, "global_step": 100471, "epoch": 830} {"train_loss": -38.78164291381836, "global_step": 100472, "epoch": 830} {"train_loss": -39.19922637939453, "global_step": 100473, "epoch": 830} {"train_loss": -38.582427978515625, "global_step": 100474, "epoch": 830} {"train_loss": -38.877418518066406, "global_step": 100475, "epoch": 830} {"train_loss": -38.899662017822266, "global_step": 100476, "epoch": 830} {"train_loss": -38.78932571411133, "global_step": 100477, "epoch": 830} {"train_loss": -38.93330001831055, "global_step": 100478, "epoch": 830} {"train_loss": -39.18476486206055, "global_step": 100479, "epoch": 830} {"train_loss": -38.871673583984375, "global_step": 100480, "epoch": 830} {"train_loss": -38.905548095703125, "global_step": 100481, "epoch": 830} {"train_loss": -38.69366455078125, "global_step": 100482, "epoch": 830} {"train_loss": -39.213069915771484, "global_step": 100483, "epoch": 830} {"train_loss": -38.879173278808594, "global_step": 100484, "epoch": 830} {"train_loss": -38.91242599487305, "global_step": 100485, "epoch": 830} {"train_loss": -38.6676025390625, "global_step": 100486, "epoch": 830} {"train_loss": -39.210113525390625, "global_step": 100487, "epoch": 830} {"train_loss": -39.27911376953125, "global_step": 100488, "epoch": 830} {"train_loss": -38.88254928588867, "global_step": 100489, "epoch": 830} {"train_loss": -39.387569427490234, "global_step": 100490, "epoch": 830} {"train_loss": -39.412261962890625, "global_step": 100491, "epoch": 830} {"train_loss": -39.106632232666016, "global_step": 100492, "epoch": 830} {"train_loss": -38.58307647705078, "global_step": 100493, "epoch": 830} {"train_loss": -38.19538116455078, "global_step": 100494, "epoch": 830} {"train_loss": -37.1849479675293, "global_step": 100495, "epoch": 830} {"train_loss": -38.24737548828125, "global_step": 100496, "epoch": 830} {"train_loss": -39.063087463378906, "global_step": 100497, "epoch": 830} {"train_loss": -38.743099212646484, "global_step": 100498, "epoch": 830} {"train_loss": -38.15140151977539, "global_step": 100499, "epoch": 830} {"train_loss": -39.02570343017578, "global_step": 100500, "epoch": 830} {"train_loss": -38.986053466796875, "global_step": 100501, "epoch": 830} {"train_loss": -38.96086883544922, "global_step": 100502, "epoch": 830} {"train_loss": -39.153045654296875, "global_step": 100503, "epoch": 830} {"train_loss": -38.83256149291992, "global_step": 100504, "epoch": 830} {"train_loss": -38.993099212646484, "global_step": 100505, "epoch": 830} {"train_loss": -38.930694580078125, "global_step": 100506, "epoch": 830} {"train_loss": -38.83547592163086, "global_step": 100507, "epoch": 830} {"train_loss": -39.2081184387207, "global_step": 100508, "epoch": 830} {"train_loss": -37.998294830322266, "global_step": 100509, "epoch": 830} {"train_loss": -36.07526779174805, "global_step": 100510, "epoch": 830} {"train_loss": -30.77503776550293, "global_step": 100511, "epoch": 830} {"train_loss": -22.723180770874023, "global_step": 100512, "epoch": 830} {"train_loss": -23.530813217163086, "global_step": 100513, "epoch": 830} {"train_loss": -26.167428970336914, "global_step": 100514, "epoch": 830} {"train_loss": -32.20248031616211, "global_step": 100515, "epoch": 830} {"train_loss": -28.74212646484375, "global_step": 100516, "epoch": 830} {"train_loss": -30.559772491455078, "global_step": 100517, "epoch": 830} {"train_loss": -31.961828231811523, "global_step": 100518, "epoch": 830} {"train_loss": -33.857818603515625, "global_step": 100519, "epoch": 830} {"train_loss": -34.30788803100586, "global_step": 100520, "epoch": 830} {"train_loss": -33.005123138427734, "global_step": 100521, "epoch": 830} {"train_loss": -33.80494689941406, "global_step": 100522, "epoch": 830} {"train_loss": -35.14543914794922, "global_step": 100523, "epoch": 830} {"train_loss": -36.66780471801758, "global_step": 100524, "epoch": 830} {"train_loss": -36.60062789916992, "global_step": 100525, "epoch": 830} {"train_loss": -35.95464324951172, "global_step": 100526, "epoch": 830} {"train_loss": -36.487117767333984, "global_step": 100527, "epoch": 830} {"train_loss": -36.17808151245117, "global_step": 100528, "epoch": 830} {"train_loss": -37.45051956176758, "global_step": 100529, "epoch": 830} {"train_loss": -37.4824104309082, "global_step": 100530, "epoch": 830} {"train_loss": -38.1513557434082, "global_step": 100531, "epoch": 830} {"train_loss": -37.695037841796875, "global_step": 100532, "epoch": 830} {"train_loss": -38.202205657958984, "global_step": 100533, "epoch": 830} {"train_loss": -38.163299560546875, "global_step": 100534, "epoch": 830} {"train_loss": -37.62991714477539, "global_step": 100535, "epoch": 830} {"train_loss": -38.07209396362305, "global_step": 100536, "epoch": 830} {"train_loss": -38.5886344909668, "global_step": 100537, "epoch": 830} {"train_loss": -36.91224670410156, "global_step": 100538, "epoch": 830} {"train_loss": -37.983245849609375, "global_step": 100539, "epoch": 830} {"train_loss": -38.50830841064453, "global_step": 100540, "epoch": 830} {"train_loss": -37.52096176147461, "global_step": 100541, "epoch": 830} {"train_loss": -38.46405792236328, "global_step": 100542, "epoch": 830} {"train_loss": -38.34861373901367, "global_step": 100543, "epoch": 830} {"train_loss": -38.141448974609375, "global_step": 100544, "epoch": 830} {"train_loss": -38.81792449951172, "global_step": 100545, "epoch": 830} {"train_loss": -38.009315490722656, "global_step": 100546, "epoch": 830} {"train_loss": -37.8253173828125, "global_step": 100547, "epoch": 830} {"train_loss": -39.0377197265625, "global_step": 100548, "epoch": 830} {"train_loss": -38.82929229736328, "global_step": 100549, "epoch": 830} {"train_loss": -37.41813803113197, "global_step": 100550, "epoch": 830, "val_loss": 2602752.5} {"train_loss": -39.027400970458984, "global_step": 100551, "epoch": 831} {"train_loss": -39.09674072265625, "global_step": 100552, "epoch": 831} {"train_loss": -38.43585205078125, "global_step": 100553, "epoch": 831} {"train_loss": -39.103515625, "global_step": 100554, "epoch": 831} {"train_loss": -39.36980438232422, "global_step": 100555, "epoch": 831} {"train_loss": -38.932525634765625, "global_step": 100556, "epoch": 831} {"train_loss": -39.03211212158203, "global_step": 100557, "epoch": 831} {"train_loss": -39.66545486450195, "global_step": 100558, "epoch": 831} {"train_loss": -39.20934295654297, "global_step": 100559, "epoch": 831} {"train_loss": -38.97237014770508, "global_step": 100560, "epoch": 831} {"train_loss": -39.337459564208984, "global_step": 100561, "epoch": 831} {"train_loss": -39.585052490234375, "global_step": 100562, "epoch": 831} {"train_loss": -39.01738357543945, "global_step": 100563, "epoch": 831} {"train_loss": -39.38491439819336, "global_step": 100564, "epoch": 831} {"train_loss": -39.47808074951172, "global_step": 100565, "epoch": 831} {"train_loss": -39.37203598022461, "global_step": 100566, "epoch": 831} {"train_loss": -39.24755859375, "global_step": 100567, "epoch": 831} {"train_loss": -39.85820388793945, "global_step": 100568, "epoch": 831} {"train_loss": -39.71120834350586, "global_step": 100569, "epoch": 831} {"train_loss": -39.78010559082031, "global_step": 100570, "epoch": 831} {"train_loss": -38.41957473754883, "global_step": 100571, "epoch": 831} {"train_loss": -38.901981353759766, "global_step": 100572, "epoch": 831} {"train_loss": -38.696800231933594, "global_step": 100573, "epoch": 831} {"train_loss": -39.90475082397461, "global_step": 100574, "epoch": 831} {"train_loss": -39.8067626953125, "global_step": 100575, "epoch": 831} {"train_loss": -39.07659912109375, "global_step": 100576, "epoch": 831} {"train_loss": -37.410457611083984, "global_step": 100577, "epoch": 831} {"train_loss": -35.505767822265625, "global_step": 100578, "epoch": 831} {"train_loss": -37.518165588378906, "global_step": 100579, "epoch": 831} {"train_loss": -39.072357177734375, "global_step": 100580, "epoch": 831} {"train_loss": -39.70162582397461, "global_step": 100581, "epoch": 831} {"train_loss": -37.8414421081543, "global_step": 100582, "epoch": 831} {"train_loss": -36.70288848876953, "global_step": 100583, "epoch": 831} {"train_loss": -38.26405334472656, "global_step": 100584, "epoch": 831} {"train_loss": -38.75303649902344, "global_step": 100585, "epoch": 831} {"train_loss": -38.57278823852539, "global_step": 100586, "epoch": 831} {"train_loss": -38.000545501708984, "global_step": 100587, "epoch": 831} {"train_loss": -37.65003967285156, "global_step": 100588, "epoch": 831} {"train_loss": -39.190399169921875, "global_step": 100589, "epoch": 831} {"train_loss": -38.81344223022461, "global_step": 100590, "epoch": 831} {"train_loss": -38.81439971923828, "global_step": 100591, "epoch": 831} {"train_loss": -39.8289909362793, "global_step": 100592, "epoch": 831} {"train_loss": -39.243507385253906, "global_step": 100593, "epoch": 831} {"train_loss": -38.63920974731445, "global_step": 100594, "epoch": 831} {"train_loss": -38.849327087402344, "global_step": 100595, "epoch": 831} {"train_loss": -38.71693801879883, "global_step": 100596, "epoch": 831} {"train_loss": -37.404232025146484, "global_step": 100597, "epoch": 831} {"train_loss": -38.06130599975586, "global_step": 100598, "epoch": 831} {"train_loss": -38.863162994384766, "global_step": 100599, "epoch": 831} {"train_loss": -37.513465881347656, "global_step": 100600, "epoch": 831} {"train_loss": -35.57427978515625, "global_step": 100601, "epoch": 831} {"train_loss": -35.317901611328125, "global_step": 100602, "epoch": 831} {"train_loss": -37.37041091918945, "global_step": 100603, "epoch": 831} {"train_loss": -35.07158279418945, "global_step": 100604, "epoch": 831} {"train_loss": -36.429969787597656, "global_step": 100605, "epoch": 831} {"train_loss": -36.1441650390625, "global_step": 100606, "epoch": 831} {"train_loss": -37.25556564331055, "global_step": 100607, "epoch": 831} {"train_loss": -36.32346725463867, "global_step": 100608, "epoch": 831} {"train_loss": -37.03711700439453, "global_step": 100609, "epoch": 831} {"train_loss": -36.5363883972168, "global_step": 100610, "epoch": 831} {"train_loss": -36.60123825073242, "global_step": 100611, "epoch": 831} {"train_loss": -37.316558837890625, "global_step": 100612, "epoch": 831} {"train_loss": -35.73195266723633, "global_step": 100613, "epoch": 831} {"train_loss": -37.46590042114258, "global_step": 100614, "epoch": 831} {"train_loss": -36.2331657409668, "global_step": 100615, "epoch": 831} {"train_loss": -36.538360595703125, "global_step": 100616, "epoch": 831} {"train_loss": -36.04921340942383, "global_step": 100617, "epoch": 831} {"train_loss": -38.01220703125, "global_step": 100618, "epoch": 831} {"train_loss": -36.87358093261719, "global_step": 100619, "epoch": 831} {"train_loss": -37.76829147338867, "global_step": 100620, "epoch": 831} {"train_loss": -36.80794143676758, "global_step": 100621, "epoch": 831} {"train_loss": -37.099544525146484, "global_step": 100622, "epoch": 831} {"train_loss": -38.17074203491211, "global_step": 100623, "epoch": 831} {"train_loss": -37.615203857421875, "global_step": 100624, "epoch": 831} {"train_loss": -37.37397003173828, "global_step": 100625, "epoch": 831} {"train_loss": -38.23828887939453, "global_step": 100626, "epoch": 831} {"train_loss": -38.2296142578125, "global_step": 100627, "epoch": 831} {"train_loss": -38.6706428527832, "global_step": 100628, "epoch": 831} {"train_loss": -38.841064453125, "global_step": 100629, "epoch": 831} {"train_loss": -38.40915298461914, "global_step": 100630, "epoch": 831} {"train_loss": -38.86452102661133, "global_step": 100631, "epoch": 831} {"train_loss": -38.50437927246094, "global_step": 100632, "epoch": 831} {"train_loss": -38.513607025146484, "global_step": 100633, "epoch": 831} {"train_loss": -38.499305725097656, "global_step": 100634, "epoch": 831} {"train_loss": -38.81712341308594, "global_step": 100635, "epoch": 831} {"train_loss": -38.833003997802734, "global_step": 100636, "epoch": 831} {"train_loss": -38.821136474609375, "global_step": 100637, "epoch": 831} {"train_loss": -39.05762481689453, "global_step": 100638, "epoch": 831} {"train_loss": -38.60295104980469, "global_step": 100639, "epoch": 831} {"train_loss": -38.744667053222656, "global_step": 100640, "epoch": 831} {"train_loss": -39.09708786010742, "global_step": 100641, "epoch": 831} {"train_loss": -38.79281997680664, "global_step": 100642, "epoch": 831} {"train_loss": -38.72319030761719, "global_step": 100643, "epoch": 831} {"train_loss": -39.081756591796875, "global_step": 100644, "epoch": 831} {"train_loss": -39.46688461303711, "global_step": 100645, "epoch": 831} {"train_loss": -39.712093353271484, "global_step": 100646, "epoch": 831} {"train_loss": -39.0871467590332, "global_step": 100647, "epoch": 831} {"train_loss": -39.481178283691406, "global_step": 100648, "epoch": 831} {"train_loss": -39.62946701049805, "global_step": 100649, "epoch": 831} {"train_loss": -39.52311706542969, "global_step": 100650, "epoch": 831} {"train_loss": -39.2504997253418, "global_step": 100651, "epoch": 831} {"train_loss": -39.4063720703125, "global_step": 100652, "epoch": 831} {"train_loss": -39.53005599975586, "global_step": 100653, "epoch": 831} {"train_loss": -39.1782341003418, "global_step": 100654, "epoch": 831} {"train_loss": -39.631317138671875, "global_step": 100655, "epoch": 831} {"train_loss": -39.85392379760742, "global_step": 100656, "epoch": 831} {"train_loss": -40.11017990112305, "global_step": 100657, "epoch": 831} {"train_loss": -39.91744613647461, "global_step": 100658, "epoch": 831} {"train_loss": -39.711219787597656, "global_step": 100659, "epoch": 831} {"train_loss": -39.759788513183594, "global_step": 100660, "epoch": 831} {"train_loss": -39.92262268066406, "global_step": 100661, "epoch": 831} {"train_loss": -40.14469909667969, "global_step": 100662, "epoch": 831} {"train_loss": -40.26333236694336, "global_step": 100663, "epoch": 831} {"train_loss": -39.873199462890625, "global_step": 100664, "epoch": 831} {"train_loss": -40.00144577026367, "global_step": 100665, "epoch": 831} {"train_loss": -39.9218635559082, "global_step": 100666, "epoch": 831} {"train_loss": -39.91145706176758, "global_step": 100667, "epoch": 831} {"train_loss": -40.137916564941406, "global_step": 100668, "epoch": 831} {"train_loss": -40.008541107177734, "global_step": 100669, "epoch": 831} {"train_loss": -40.0931282043457, "global_step": 100670, "epoch": 831} {"train_loss": -38.5724626336216, "global_step": 100671, "epoch": 831, "val_loss": 2577396.25} {"train_loss": -40.10997009277344, "global_step": 100672, "epoch": 832} {"train_loss": -40.12876510620117, "global_step": 100673, "epoch": 832} {"train_loss": -40.32296371459961, "global_step": 100674, "epoch": 832} {"train_loss": -40.368221282958984, "global_step": 100675, "epoch": 832} {"train_loss": -40.354896545410156, "global_step": 100676, "epoch": 832} {"train_loss": -40.40083694458008, "global_step": 100677, "epoch": 832} {"train_loss": -40.35791778564453, "global_step": 100678, "epoch": 832} {"train_loss": -40.0890998840332, "global_step": 100679, "epoch": 832} {"train_loss": -40.10133361816406, "global_step": 100680, "epoch": 832} {"train_loss": -39.90949630737305, "global_step": 100681, "epoch": 832} {"train_loss": -39.294349670410156, "global_step": 100682, "epoch": 832} {"train_loss": -37.73783874511719, "global_step": 100683, "epoch": 832} {"train_loss": -33.73049545288086, "global_step": 100684, "epoch": 832} {"train_loss": -35.21165084838867, "global_step": 100685, "epoch": 832} {"train_loss": -35.644893646240234, "global_step": 100686, "epoch": 832} {"train_loss": -35.70893478393555, "global_step": 100687, "epoch": 832} {"train_loss": -38.25065231323242, "global_step": 100688, "epoch": 832} {"train_loss": -32.07326889038086, "global_step": 100689, "epoch": 832} {"train_loss": -34.684425354003906, "global_step": 100690, "epoch": 832} {"train_loss": -33.60894012451172, "global_step": 100691, "epoch": 832} {"train_loss": -37.90755081176758, "global_step": 100692, "epoch": 832} {"train_loss": -35.8591423034668, "global_step": 100693, "epoch": 832} {"train_loss": -36.626014709472656, "global_step": 100694, "epoch": 832} {"train_loss": -37.93584442138672, "global_step": 100695, "epoch": 832} {"train_loss": -36.753807067871094, "global_step": 100696, "epoch": 832} {"train_loss": -34.98533248901367, "global_step": 100697, "epoch": 832} {"train_loss": -38.27037811279297, "global_step": 100698, "epoch": 832} {"train_loss": -36.15104293823242, "global_step": 100699, "epoch": 832} {"train_loss": -36.833580017089844, "global_step": 100700, "epoch": 832} {"train_loss": -37.137908935546875, "global_step": 100701, "epoch": 832} {"train_loss": -38.41851806640625, "global_step": 100702, "epoch": 832} {"train_loss": -37.20024108886719, "global_step": 100703, "epoch": 832} {"train_loss": -38.106868743896484, "global_step": 100704, "epoch": 832} {"train_loss": -37.53706741333008, "global_step": 100705, "epoch": 832} {"train_loss": -38.190731048583984, "global_step": 100706, "epoch": 832} {"train_loss": -38.29103088378906, "global_step": 100707, "epoch": 832} {"train_loss": -38.6631965637207, "global_step": 100708, "epoch": 832} {"train_loss": -38.896663665771484, "global_step": 100709, "epoch": 832} {"train_loss": -38.05333709716797, "global_step": 100710, "epoch": 832} {"train_loss": -37.98115158081055, "global_step": 100711, "epoch": 832} {"train_loss": -37.97563552856445, "global_step": 100712, "epoch": 832} {"train_loss": -38.114070892333984, "global_step": 100713, "epoch": 832} {"train_loss": -38.624507904052734, "global_step": 100714, "epoch": 832} {"train_loss": -38.45632553100586, "global_step": 100715, "epoch": 832} {"train_loss": -39.268062591552734, "global_step": 100716, "epoch": 832} {"train_loss": -38.6294059753418, "global_step": 100717, "epoch": 832} {"train_loss": -38.67550277709961, "global_step": 100718, "epoch": 832} {"train_loss": -39.43194580078125, "global_step": 100719, "epoch": 832} {"train_loss": -38.91664123535156, "global_step": 100720, "epoch": 832} {"train_loss": -38.56349182128906, "global_step": 100721, "epoch": 832} {"train_loss": -39.23975372314453, "global_step": 100722, "epoch": 832} {"train_loss": -39.24174118041992, "global_step": 100723, "epoch": 832} {"train_loss": -39.053218841552734, "global_step": 100724, "epoch": 832} {"train_loss": -38.65700912475586, "global_step": 100725, "epoch": 832} {"train_loss": -39.66483688354492, "global_step": 100726, "epoch": 832} {"train_loss": -38.63767623901367, "global_step": 100727, "epoch": 832} {"train_loss": -39.473690032958984, "global_step": 100728, "epoch": 832} {"train_loss": -39.25428009033203, "global_step": 100729, "epoch": 832} {"train_loss": -38.886085510253906, "global_step": 100730, "epoch": 832} {"train_loss": -39.065853118896484, "global_step": 100731, "epoch": 832} {"train_loss": -39.7525520324707, "global_step": 100732, "epoch": 832} {"train_loss": -39.51087951660156, "global_step": 100733, "epoch": 832} {"train_loss": -39.68350601196289, "global_step": 100734, "epoch": 832} {"train_loss": -38.94449996948242, "global_step": 100735, "epoch": 832} {"train_loss": -38.31711196899414, "global_step": 100736, "epoch": 832} {"train_loss": -38.91297912597656, "global_step": 100737, "epoch": 832} {"train_loss": -38.72982406616211, "global_step": 100738, "epoch": 832} {"train_loss": -38.31246566772461, "global_step": 100739, "epoch": 832} {"train_loss": -39.29789733886719, "global_step": 100740, "epoch": 832} {"train_loss": -39.5445671081543, "global_step": 100741, "epoch": 832} {"train_loss": -39.79315948486328, "global_step": 100742, "epoch": 832} {"train_loss": -39.29166793823242, "global_step": 100743, "epoch": 832} {"train_loss": -37.35944747924805, "global_step": 100744, "epoch": 832} {"train_loss": -37.94148254394531, "global_step": 100745, "epoch": 832} {"train_loss": -39.51933670043945, "global_step": 100746, "epoch": 832} {"train_loss": -35.9571418762207, "global_step": 100747, "epoch": 832} {"train_loss": -39.037628173828125, "global_step": 100748, "epoch": 832} {"train_loss": -37.01074981689453, "global_step": 100749, "epoch": 832} {"train_loss": -39.129913330078125, "global_step": 100750, "epoch": 832} {"train_loss": -37.02000045776367, "global_step": 100751, "epoch": 832} {"train_loss": -39.11515426635742, "global_step": 100752, "epoch": 832} {"train_loss": -38.232688903808594, "global_step": 100753, "epoch": 832} {"train_loss": -38.98695373535156, "global_step": 100754, "epoch": 832} {"train_loss": -38.44439697265625, "global_step": 100755, "epoch": 832} {"train_loss": -37.53846740722656, "global_step": 100756, "epoch": 832} {"train_loss": -38.312931060791016, "global_step": 100757, "epoch": 832} {"train_loss": -38.68349075317383, "global_step": 100758, "epoch": 832} {"train_loss": -36.900543212890625, "global_step": 100759, "epoch": 832} {"train_loss": -38.73844528198242, "global_step": 100760, "epoch": 832} {"train_loss": -38.474876403808594, "global_step": 100761, "epoch": 832} {"train_loss": -37.5485954284668, "global_step": 100762, "epoch": 832} {"train_loss": -38.68757247924805, "global_step": 100763, "epoch": 832} {"train_loss": -38.78099822998047, "global_step": 100764, "epoch": 832} {"train_loss": -38.00802230834961, "global_step": 100765, "epoch": 832} {"train_loss": -38.93281173706055, "global_step": 100766, "epoch": 832} {"train_loss": -38.59516525268555, "global_step": 100767, "epoch": 832} {"train_loss": -37.581146240234375, "global_step": 100768, "epoch": 832} {"train_loss": -38.51192092895508, "global_step": 100769, "epoch": 832} {"train_loss": -38.99740219116211, "global_step": 100770, "epoch": 832} {"train_loss": -38.863372802734375, "global_step": 100771, "epoch": 832} {"train_loss": -38.94233322143555, "global_step": 100772, "epoch": 832} {"train_loss": -38.76919174194336, "global_step": 100773, "epoch": 832} {"train_loss": -39.4375, "global_step": 100774, "epoch": 832} {"train_loss": -39.07773971557617, "global_step": 100775, "epoch": 832} {"train_loss": -39.77338790893555, "global_step": 100776, "epoch": 832} {"train_loss": -38.94146728515625, "global_step": 100777, "epoch": 832} {"train_loss": -39.12055969238281, "global_step": 100778, "epoch": 832} {"train_loss": -39.75680923461914, "global_step": 100779, "epoch": 832} {"train_loss": -39.45272445678711, "global_step": 100780, "epoch": 832} {"train_loss": -38.70327377319336, "global_step": 100781, "epoch": 832} {"train_loss": -38.86235809326172, "global_step": 100782, "epoch": 832} {"train_loss": -39.35548400878906, "global_step": 100783, "epoch": 832} {"train_loss": -39.98948287963867, "global_step": 100784, "epoch": 832} {"train_loss": -39.389076232910156, "global_step": 100785, "epoch": 832} {"train_loss": -38.340614318847656, "global_step": 100786, "epoch": 832} {"train_loss": -38.37961959838867, "global_step": 100787, "epoch": 832} {"train_loss": -38.75021743774414, "global_step": 100788, "epoch": 832} {"train_loss": -38.657745361328125, "global_step": 100789, "epoch": 832} {"train_loss": -39.26087188720703, "global_step": 100790, "epoch": 832} {"train_loss": -38.64878463745117, "global_step": 100791, "epoch": 832} {"train_loss": -38.40344805756876, "global_step": 100792, "epoch": 832, "val_loss": 2540332.25} {"train_loss": -37.400634765625, "global_step": 100793, "epoch": 833} {"train_loss": -39.29117965698242, "global_step": 100794, "epoch": 833} {"train_loss": -38.304927825927734, "global_step": 100795, "epoch": 833} {"train_loss": -37.59833908081055, "global_step": 100796, "epoch": 833} {"train_loss": -36.13159942626953, "global_step": 100797, "epoch": 833} {"train_loss": -38.801509857177734, "global_step": 100798, "epoch": 833} {"train_loss": -38.346981048583984, "global_step": 100799, "epoch": 833} {"train_loss": -38.077701568603516, "global_step": 100800, "epoch": 833} {"train_loss": -37.57578659057617, "global_step": 100801, "epoch": 833} {"train_loss": -38.932247161865234, "global_step": 100802, "epoch": 833} {"train_loss": -38.80703353881836, "global_step": 100803, "epoch": 833} {"train_loss": -38.431190490722656, "global_step": 100804, "epoch": 833} {"train_loss": -39.8036003112793, "global_step": 100805, "epoch": 833} {"train_loss": -37.74825668334961, "global_step": 100806, "epoch": 833} {"train_loss": -38.06760787963867, "global_step": 100807, "epoch": 833} {"train_loss": -38.8651237487793, "global_step": 100808, "epoch": 833} {"train_loss": -38.82618713378906, "global_step": 100809, "epoch": 833} {"train_loss": -38.9091796875, "global_step": 100810, "epoch": 833} {"train_loss": -38.552711486816406, "global_step": 100811, "epoch": 833} {"train_loss": -39.411834716796875, "global_step": 100812, "epoch": 833} {"train_loss": -39.207550048828125, "global_step": 100813, "epoch": 833} {"train_loss": -38.70819091796875, "global_step": 100814, "epoch": 833} {"train_loss": -39.2584342956543, "global_step": 100815, "epoch": 833} {"train_loss": -38.255950927734375, "global_step": 100816, "epoch": 833} {"train_loss": -39.06684494018555, "global_step": 100817, "epoch": 833} {"train_loss": -39.09676742553711, "global_step": 100818, "epoch": 833} {"train_loss": -37.16572952270508, "global_step": 100819, "epoch": 833} {"train_loss": -39.295284271240234, "global_step": 100820, "epoch": 833} {"train_loss": -38.95588302612305, "global_step": 100821, "epoch": 833} {"train_loss": -38.679718017578125, "global_step": 100822, "epoch": 833} {"train_loss": -39.54497146606445, "global_step": 100823, "epoch": 833} {"train_loss": -39.55318069458008, "global_step": 100824, "epoch": 833} {"train_loss": -38.501853942871094, "global_step": 100825, "epoch": 833} {"train_loss": -39.505462646484375, "global_step": 100826, "epoch": 833} {"train_loss": -38.34043502807617, "global_step": 100827, "epoch": 833} {"train_loss": -38.2191162109375, "global_step": 100828, "epoch": 833} {"train_loss": -38.922035217285156, "global_step": 100829, "epoch": 833} {"train_loss": -37.6436767578125, "global_step": 100830, "epoch": 833} {"train_loss": -38.28043746948242, "global_step": 100831, "epoch": 833} {"train_loss": -38.418575286865234, "global_step": 100832, "epoch": 833} {"train_loss": -36.9159049987793, "global_step": 100833, "epoch": 833} {"train_loss": -38.64704132080078, "global_step": 100834, "epoch": 833} {"train_loss": -38.72335433959961, "global_step": 100835, "epoch": 833} {"train_loss": -37.519996643066406, "global_step": 100836, "epoch": 833} {"train_loss": -39.00411605834961, "global_step": 100837, "epoch": 833} {"train_loss": -37.61530303955078, "global_step": 100838, "epoch": 833} {"train_loss": -38.62841033935547, "global_step": 100839, "epoch": 833} {"train_loss": -37.85691452026367, "global_step": 100840, "epoch": 833} {"train_loss": -37.65603256225586, "global_step": 100841, "epoch": 833} {"train_loss": -36.726436614990234, "global_step": 100842, "epoch": 833} {"train_loss": -38.157386779785156, "global_step": 100843, "epoch": 833} {"train_loss": -37.748329162597656, "global_step": 100844, "epoch": 833} {"train_loss": -38.89925765991211, "global_step": 100845, "epoch": 833} {"train_loss": -37.2763557434082, "global_step": 100846, "epoch": 833} {"train_loss": -37.577632904052734, "global_step": 100847, "epoch": 833} {"train_loss": -38.7911491394043, "global_step": 100848, "epoch": 833} {"train_loss": -38.363643646240234, "global_step": 100849, "epoch": 833} {"train_loss": -38.8758544921875, "global_step": 100850, "epoch": 833} {"train_loss": -38.17554473876953, "global_step": 100851, "epoch": 833} {"train_loss": -38.272762298583984, "global_step": 100852, "epoch": 833} {"train_loss": -37.64988327026367, "global_step": 100853, "epoch": 833} {"train_loss": -37.14912033081055, "global_step": 100854, "epoch": 833} {"train_loss": -36.61458969116211, "global_step": 100855, "epoch": 833} {"train_loss": -38.57849884033203, "global_step": 100856, "epoch": 833} {"train_loss": -37.69792938232422, "global_step": 100857, "epoch": 833} {"train_loss": -38.08631896972656, "global_step": 100858, "epoch": 833} {"train_loss": -39.232688903808594, "global_step": 100859, "epoch": 833} {"train_loss": -39.08580780029297, "global_step": 100860, "epoch": 833} {"train_loss": -38.0014762878418, "global_step": 100861, "epoch": 833} {"train_loss": -37.95068359375, "global_step": 100862, "epoch": 833} {"train_loss": -38.427101135253906, "global_step": 100863, "epoch": 833} {"train_loss": -38.514373779296875, "global_step": 100864, "epoch": 833} {"train_loss": -38.889930725097656, "global_step": 100865, "epoch": 833} {"train_loss": -38.63685989379883, "global_step": 100866, "epoch": 833} {"train_loss": -39.10344696044922, "global_step": 100867, "epoch": 833} {"train_loss": -39.232364654541016, "global_step": 100868, "epoch": 833} {"train_loss": -38.66123580932617, "global_step": 100869, "epoch": 833} {"train_loss": -38.744625091552734, "global_step": 100870, "epoch": 833} {"train_loss": -39.5955924987793, "global_step": 100871, "epoch": 833} {"train_loss": -39.11469268798828, "global_step": 100872, "epoch": 833} {"train_loss": -38.855831146240234, "global_step": 100873, "epoch": 833} {"train_loss": -38.626686096191406, "global_step": 100874, "epoch": 833} {"train_loss": -39.46722412109375, "global_step": 100875, "epoch": 833} {"train_loss": -39.662540435791016, "global_step": 100876, "epoch": 833} {"train_loss": -39.013675689697266, "global_step": 100877, "epoch": 833} {"train_loss": -38.82197189331055, "global_step": 100878, "epoch": 833} {"train_loss": -39.46234130859375, "global_step": 100879, "epoch": 833} {"train_loss": -39.52813720703125, "global_step": 100880, "epoch": 833} {"train_loss": -39.01420974731445, "global_step": 100881, "epoch": 833} {"train_loss": -38.71263885498047, "global_step": 100882, "epoch": 833} {"train_loss": -39.22799301147461, "global_step": 100883, "epoch": 833} {"train_loss": -39.85689163208008, "global_step": 100884, "epoch": 833} {"train_loss": -39.23641586303711, "global_step": 100885, "epoch": 833} {"train_loss": -39.68032455444336, "global_step": 100886, "epoch": 833} {"train_loss": -39.251522064208984, "global_step": 100887, "epoch": 833} {"train_loss": -39.63436508178711, "global_step": 100888, "epoch": 833} {"train_loss": -39.85738754272461, "global_step": 100889, "epoch": 833} {"train_loss": -39.102848052978516, "global_step": 100890, "epoch": 833} {"train_loss": -38.68679428100586, "global_step": 100891, "epoch": 833} {"train_loss": -38.86800003051758, "global_step": 100892, "epoch": 833} {"train_loss": -38.823978424072266, "global_step": 100893, "epoch": 833} {"train_loss": -38.108482360839844, "global_step": 100894, "epoch": 833} {"train_loss": -39.72978591918945, "global_step": 100895, "epoch": 833} {"train_loss": -38.471614837646484, "global_step": 100896, "epoch": 833} {"train_loss": -39.558326721191406, "global_step": 100897, "epoch": 833} {"train_loss": -38.76563262939453, "global_step": 100898, "epoch": 833} {"train_loss": -39.12990951538086, "global_step": 100899, "epoch": 833} {"train_loss": -37.93407440185547, "global_step": 100900, "epoch": 833} {"train_loss": -38.80970764160156, "global_step": 100901, "epoch": 833} {"train_loss": -39.13218307495117, "global_step": 100902, "epoch": 833} {"train_loss": -39.30817794799805, "global_step": 100903, "epoch": 833} {"train_loss": -39.566253662109375, "global_step": 100904, "epoch": 833} {"train_loss": -38.936580657958984, "global_step": 100905, "epoch": 833} {"train_loss": -39.29279708862305, "global_step": 100906, "epoch": 833} {"train_loss": -39.90105056762695, "global_step": 100907, "epoch": 833} {"train_loss": -38.666542053222656, "global_step": 100908, "epoch": 833} {"train_loss": -39.62595748901367, "global_step": 100909, "epoch": 833} {"train_loss": -38.81648635864258, "global_step": 100910, "epoch": 833} {"train_loss": -39.27979278564453, "global_step": 100911, "epoch": 833} {"train_loss": -40.11576461791992, "global_step": 100912, "epoch": 833} {"train_loss": -38.661797200352694, "global_step": 100913, "epoch": 833, "val_loss": 2623024.25} {"train_loss": -39.63669204711914, "global_step": 100914, "epoch": 834} {"train_loss": -38.81437683105469, "global_step": 100915, "epoch": 834} {"train_loss": -39.59481430053711, "global_step": 100916, "epoch": 834} {"train_loss": -39.989410400390625, "global_step": 100917, "epoch": 834} {"train_loss": -39.66511917114258, "global_step": 100918, "epoch": 834} {"train_loss": -39.389495849609375, "global_step": 100919, "epoch": 834} {"train_loss": -39.791988372802734, "global_step": 100920, "epoch": 834} {"train_loss": -39.33662796020508, "global_step": 100921, "epoch": 834} {"train_loss": -39.698524475097656, "global_step": 100922, "epoch": 834} {"train_loss": -39.530357360839844, "global_step": 100923, "epoch": 834} {"train_loss": -39.66306686401367, "global_step": 100924, "epoch": 834} {"train_loss": -39.78729248046875, "global_step": 100925, "epoch": 834} {"train_loss": -39.87223434448242, "global_step": 100926, "epoch": 834} {"train_loss": -40.15607833862305, "global_step": 100927, "epoch": 834} {"train_loss": -40.09457778930664, "global_step": 100928, "epoch": 834} {"train_loss": -39.7020263671875, "global_step": 100929, "epoch": 834} {"train_loss": -40.067359924316406, "global_step": 100930, "epoch": 834} {"train_loss": -39.49110412597656, "global_step": 100931, "epoch": 834} {"train_loss": -39.822593688964844, "global_step": 100932, "epoch": 834} {"train_loss": -39.46969223022461, "global_step": 100933, "epoch": 834} {"train_loss": -36.32540512084961, "global_step": 100934, "epoch": 834} {"train_loss": -33.1121940612793, "global_step": 100935, "epoch": 834} {"train_loss": -37.1563835144043, "global_step": 100936, "epoch": 834} {"train_loss": -28.614423751831055, "global_step": 100937, "epoch": 834} {"train_loss": -24.84650230407715, "global_step": 100938, "epoch": 834} {"train_loss": -30.328516006469727, "global_step": 100939, "epoch": 834} {"train_loss": -28.298206329345703, "global_step": 100940, "epoch": 834} {"train_loss": -28.315610885620117, "global_step": 100941, "epoch": 834} {"train_loss": -30.5318660736084, "global_step": 100942, "epoch": 834} {"train_loss": -30.461200714111328, "global_step": 100943, "epoch": 834} {"train_loss": -29.310285568237305, "global_step": 100944, "epoch": 834} {"train_loss": -30.781147003173828, "global_step": 100945, "epoch": 834} {"train_loss": -30.619064331054688, "global_step": 100946, "epoch": 834} {"train_loss": -31.053863525390625, "global_step": 100947, "epoch": 834} {"train_loss": -30.2618408203125, "global_step": 100948, "epoch": 834} {"train_loss": -31.821664810180664, "global_step": 100949, "epoch": 834} {"train_loss": -31.91729164123535, "global_step": 100950, "epoch": 834} {"train_loss": -31.404699325561523, "global_step": 100951, "epoch": 834} {"train_loss": -32.666568756103516, "global_step": 100952, "epoch": 834} {"train_loss": -32.26406478881836, "global_step": 100953, "epoch": 834} {"train_loss": -31.88916015625, "global_step": 100954, "epoch": 834} {"train_loss": -32.83696365356445, "global_step": 100955, "epoch": 834} {"train_loss": -31.635828018188477, "global_step": 100956, "epoch": 834} {"train_loss": -31.20438003540039, "global_step": 100957, "epoch": 834} {"train_loss": -32.042633056640625, "global_step": 100958, "epoch": 834} {"train_loss": -31.970844268798828, "global_step": 100959, "epoch": 834} {"train_loss": -32.793922424316406, "global_step": 100960, "epoch": 834} {"train_loss": -32.5788688659668, "global_step": 100961, "epoch": 834} {"train_loss": -33.30768966674805, "global_step": 100962, "epoch": 834} {"train_loss": -33.1713981628418, "global_step": 100963, "epoch": 834} {"train_loss": -32.680545806884766, "global_step": 100964, "epoch": 834} {"train_loss": -32.50016403198242, "global_step": 100965, "epoch": 834} {"train_loss": -28.742170333862305, "global_step": 100966, "epoch": 834} {"train_loss": -32.17196273803711, "global_step": 100967, "epoch": 834} {"train_loss": -32.31254959106445, "global_step": 100968, "epoch": 834} {"train_loss": -32.1352653503418, "global_step": 100969, "epoch": 834} {"train_loss": -32.64780044555664, "global_step": 100970, "epoch": 834} {"train_loss": -33.70841598510742, "global_step": 100971, "epoch": 834} {"train_loss": -32.89376449584961, "global_step": 100972, "epoch": 834} {"train_loss": -34.170284271240234, "global_step": 100973, "epoch": 834} {"train_loss": -33.14988327026367, "global_step": 100974, "epoch": 834} {"train_loss": -34.10287094116211, "global_step": 100975, "epoch": 834} {"train_loss": -34.13689041137695, "global_step": 100976, "epoch": 834} {"train_loss": -33.97936248779297, "global_step": 100977, "epoch": 834} {"train_loss": -33.72034454345703, "global_step": 100978, "epoch": 834} {"train_loss": -33.99966812133789, "global_step": 100979, "epoch": 834} {"train_loss": -32.774261474609375, "global_step": 100980, "epoch": 834} {"train_loss": -32.02487564086914, "global_step": 100981, "epoch": 834} {"train_loss": -34.39784622192383, "global_step": 100982, "epoch": 834} {"train_loss": -34.24158477783203, "global_step": 100983, "epoch": 834} {"train_loss": -33.11418914794922, "global_step": 100984, "epoch": 834} {"train_loss": -35.03805923461914, "global_step": 100985, "epoch": 834} {"train_loss": -33.639251708984375, "global_step": 100986, "epoch": 834} {"train_loss": -35.016902923583984, "global_step": 100987, "epoch": 834} {"train_loss": -34.043975830078125, "global_step": 100988, "epoch": 834} {"train_loss": -35.5861701965332, "global_step": 100989, "epoch": 834} {"train_loss": -34.2696647644043, "global_step": 100990, "epoch": 834} {"train_loss": -35.06869125366211, "global_step": 100991, "epoch": 834} {"train_loss": -34.86203384399414, "global_step": 100992, "epoch": 834} {"train_loss": -35.4686393737793, "global_step": 100993, "epoch": 834} {"train_loss": -35.00580596923828, "global_step": 100994, "epoch": 834} {"train_loss": -34.6119270324707, "global_step": 100995, "epoch": 834} {"train_loss": -35.020084381103516, "global_step": 100996, "epoch": 834} {"train_loss": -33.58732223510742, "global_step": 100997, "epoch": 834} {"train_loss": -32.718772888183594, "global_step": 100998, "epoch": 834} {"train_loss": -35.022979736328125, "global_step": 100999, "epoch": 834} {"train_loss": -33.552764892578125, "global_step": 101000, "epoch": 834} {"train_loss": -35.57427978515625, "global_step": 101001, "epoch": 834} {"train_loss": -34.00236892700195, "global_step": 101002, "epoch": 834} {"train_loss": -31.999181747436523, "global_step": 101003, "epoch": 834} {"train_loss": -35.409912109375, "global_step": 101004, "epoch": 834} {"train_loss": -35.648841857910156, "global_step": 101005, "epoch": 834} {"train_loss": -34.75904083251953, "global_step": 101006, "epoch": 834} {"train_loss": -35.603187561035156, "global_step": 101007, "epoch": 834} {"train_loss": -36.129180908203125, "global_step": 101008, "epoch": 834} {"train_loss": -34.60578155517578, "global_step": 101009, "epoch": 834} {"train_loss": -36.187110900878906, "global_step": 101010, "epoch": 834} {"train_loss": -35.80061340332031, "global_step": 101011, "epoch": 834} {"train_loss": -35.38724899291992, "global_step": 101012, "epoch": 834} {"train_loss": -35.25618362426758, "global_step": 101013, "epoch": 834} {"train_loss": -35.7609748840332, "global_step": 101014, "epoch": 834} {"train_loss": -35.4304084777832, "global_step": 101015, "epoch": 834} {"train_loss": -35.98793411254883, "global_step": 101016, "epoch": 834} {"train_loss": -35.86434555053711, "global_step": 101017, "epoch": 834} {"train_loss": -35.53988265991211, "global_step": 101018, "epoch": 834} {"train_loss": -36.021507263183594, "global_step": 101019, "epoch": 834} {"train_loss": -36.13304901123047, "global_step": 101020, "epoch": 834} {"train_loss": -35.71007537841797, "global_step": 101021, "epoch": 834} {"train_loss": -36.194725036621094, "global_step": 101022, "epoch": 834} {"train_loss": -35.71236801147461, "global_step": 101023, "epoch": 834} {"train_loss": -35.818294525146484, "global_step": 101024, "epoch": 834} {"train_loss": -35.59581756591797, "global_step": 101025, "epoch": 834} {"train_loss": -36.511470794677734, "global_step": 101026, "epoch": 834} {"train_loss": -34.79067611694336, "global_step": 101027, "epoch": 834} {"train_loss": -36.545166015625, "global_step": 101028, "epoch": 834} {"train_loss": -36.004722595214844, "global_step": 101029, "epoch": 834} {"train_loss": -36.01982116699219, "global_step": 101030, "epoch": 834} {"train_loss": -36.42033004760742, "global_step": 101031, "epoch": 834} {"train_loss": -35.2391471862793, "global_step": 101032, "epoch": 834} {"train_loss": -36.72188949584961, "global_step": 101033, "epoch": 834} {"train_loss": -34.656050658423055, "global_step": 101034, "epoch": 834, "val_loss": 2426676.75} {"train_loss": -36.83124923706055, "global_step": 101035, "epoch": 835} {"train_loss": -36.398441314697266, "global_step": 101036, "epoch": 835} {"train_loss": -36.08053207397461, "global_step": 101037, "epoch": 835} {"train_loss": -36.76618194580078, "global_step": 101038, "epoch": 835} {"train_loss": -36.95833969116211, "global_step": 101039, "epoch": 835} {"train_loss": -36.86796951293945, "global_step": 101040, "epoch": 835} {"train_loss": -34.55678939819336, "global_step": 101041, "epoch": 835} {"train_loss": -36.129066467285156, "global_step": 101042, "epoch": 835} {"train_loss": -35.34406661987305, "global_step": 101043, "epoch": 835} {"train_loss": -36.29792022705078, "global_step": 101044, "epoch": 835} {"train_loss": -35.21738815307617, "global_step": 101045, "epoch": 835} {"train_loss": -36.70966339111328, "global_step": 101046, "epoch": 835} {"train_loss": -36.57483673095703, "global_step": 101047, "epoch": 835} {"train_loss": -36.4821662902832, "global_step": 101048, "epoch": 835} {"train_loss": -33.266998291015625, "global_step": 101049, "epoch": 835} {"train_loss": -33.89371871948242, "global_step": 101050, "epoch": 835} {"train_loss": -35.511409759521484, "global_step": 101051, "epoch": 835} {"train_loss": -36.42588806152344, "global_step": 101052, "epoch": 835} {"train_loss": -34.531272888183594, "global_step": 101053, "epoch": 835} {"train_loss": -35.956764221191406, "global_step": 101054, "epoch": 835} {"train_loss": -35.353939056396484, "global_step": 101055, "epoch": 835} {"train_loss": -36.28224182128906, "global_step": 101056, "epoch": 835} {"train_loss": -34.63038635253906, "global_step": 101057, "epoch": 835} {"train_loss": -36.583717346191406, "global_step": 101058, "epoch": 835} {"train_loss": -35.34784698486328, "global_step": 101059, "epoch": 835} {"train_loss": -35.13385009765625, "global_step": 101060, "epoch": 835} {"train_loss": -31.335712432861328, "global_step": 101061, "epoch": 835} {"train_loss": -29.77979850769043, "global_step": 101062, "epoch": 835} {"train_loss": -33.22422409057617, "global_step": 101063, "epoch": 835} {"train_loss": -33.50507736206055, "global_step": 101064, "epoch": 835} {"train_loss": -33.618465423583984, "global_step": 101065, "epoch": 835} {"train_loss": -36.202606201171875, "global_step": 101066, "epoch": 835} {"train_loss": -34.56575393676758, "global_step": 101067, "epoch": 835} {"train_loss": -35.62130355834961, "global_step": 101068, "epoch": 835} {"train_loss": -33.45745849609375, "global_step": 101069, "epoch": 835} {"train_loss": -35.38970947265625, "global_step": 101070, "epoch": 835} {"train_loss": -35.77981185913086, "global_step": 101071, "epoch": 835} {"train_loss": -34.3714714050293, "global_step": 101072, "epoch": 835} {"train_loss": -36.081634521484375, "global_step": 101073, "epoch": 835} {"train_loss": -35.32756423950195, "global_step": 101074, "epoch": 835} {"train_loss": -34.68085479736328, "global_step": 101075, "epoch": 835} {"train_loss": -35.7048454284668, "global_step": 101076, "epoch": 835} {"train_loss": -36.13245391845703, "global_step": 101077, "epoch": 835} {"train_loss": -36.3540153503418, "global_step": 101078, "epoch": 835} {"train_loss": -35.115230560302734, "global_step": 101079, "epoch": 835} {"train_loss": -35.84614944458008, "global_step": 101080, "epoch": 835} {"train_loss": -35.25959396362305, "global_step": 101081, "epoch": 835} {"train_loss": -34.130126953125, "global_step": 101082, "epoch": 835} {"train_loss": -36.262542724609375, "global_step": 101083, "epoch": 835} {"train_loss": -36.071041107177734, "global_step": 101084, "epoch": 835} {"train_loss": -36.304443359375, "global_step": 101085, "epoch": 835} {"train_loss": -35.674781799316406, "global_step": 101086, "epoch": 835} {"train_loss": -37.022090911865234, "global_step": 101087, "epoch": 835} {"train_loss": -36.53800964355469, "global_step": 101088, "epoch": 835} {"train_loss": -36.893585205078125, "global_step": 101089, "epoch": 835} {"train_loss": -36.450592041015625, "global_step": 101090, "epoch": 835} {"train_loss": -36.1828727722168, "global_step": 101091, "epoch": 835} {"train_loss": -36.760528564453125, "global_step": 101092, "epoch": 835} {"train_loss": -36.172576904296875, "global_step": 101093, "epoch": 835} {"train_loss": -36.71672058105469, "global_step": 101094, "epoch": 835} {"train_loss": -37.50898361206055, "global_step": 101095, "epoch": 835} {"train_loss": -36.850738525390625, "global_step": 101096, "epoch": 835} {"train_loss": -36.841976165771484, "global_step": 101097, "epoch": 835} {"train_loss": -37.17836380004883, "global_step": 101098, "epoch": 835} {"train_loss": -37.1616325378418, "global_step": 101099, "epoch": 835} {"train_loss": -36.557491302490234, "global_step": 101100, "epoch": 835} {"train_loss": -36.6014289855957, "global_step": 101101, "epoch": 835} {"train_loss": -36.83351516723633, "global_step": 101102, "epoch": 835} {"train_loss": -35.92202377319336, "global_step": 101103, "epoch": 835} {"train_loss": -37.53621292114258, "global_step": 101104, "epoch": 835} {"train_loss": -37.201271057128906, "global_step": 101105, "epoch": 835} {"train_loss": -37.636775970458984, "global_step": 101106, "epoch": 835} {"train_loss": -37.03867721557617, "global_step": 101107, "epoch": 835} {"train_loss": -37.61695861816406, "global_step": 101108, "epoch": 835} {"train_loss": -37.139686584472656, "global_step": 101109, "epoch": 835} {"train_loss": -36.60019302368164, "global_step": 101110, "epoch": 835} {"train_loss": -37.009647369384766, "global_step": 101111, "epoch": 835} {"train_loss": -35.863861083984375, "global_step": 101112, "epoch": 835} {"train_loss": -35.69454574584961, "global_step": 101113, "epoch": 835} {"train_loss": -37.05215072631836, "global_step": 101114, "epoch": 835} {"train_loss": -36.534889221191406, "global_step": 101115, "epoch": 835} {"train_loss": -37.660560607910156, "global_step": 101116, "epoch": 835} {"train_loss": -36.76589584350586, "global_step": 101117, "epoch": 835} {"train_loss": -37.25716781616211, "global_step": 101118, "epoch": 835} {"train_loss": -36.89318084716797, "global_step": 101119, "epoch": 835} {"train_loss": -34.211158752441406, "global_step": 101120, "epoch": 835} {"train_loss": -34.934085845947266, "global_step": 101121, "epoch": 835} {"train_loss": -32.71387481689453, "global_step": 101122, "epoch": 835} {"train_loss": -24.895906448364258, "global_step": 101123, "epoch": 835} {"train_loss": -9.607260704040527, "global_step": 101124, "epoch": 835} {"train_loss": -31.637609481811523, "global_step": 101125, "epoch": 835} {"train_loss": -29.855932235717773, "global_step": 101126, "epoch": 835} {"train_loss": -31.93341636657715, "global_step": 101127, "epoch": 835} {"train_loss": -25.95448112487793, "global_step": 101128, "epoch": 835} {"train_loss": -32.689449310302734, "global_step": 101129, "epoch": 835} {"train_loss": -31.541397094726562, "global_step": 101130, "epoch": 835} {"train_loss": -33.05165481567383, "global_step": 101131, "epoch": 835} {"train_loss": -31.820663452148438, "global_step": 101132, "epoch": 835} {"train_loss": -31.48855972290039, "global_step": 101133, "epoch": 835} {"train_loss": -33.71736526489258, "global_step": 101134, "epoch": 835} {"train_loss": -32.889808654785156, "global_step": 101135, "epoch": 835} {"train_loss": -30.98066520690918, "global_step": 101136, "epoch": 835} {"train_loss": -31.276838302612305, "global_step": 101137, "epoch": 835} {"train_loss": -31.34857177734375, "global_step": 101138, "epoch": 835} {"train_loss": -33.09577178955078, "global_step": 101139, "epoch": 835} {"train_loss": -34.45247268676758, "global_step": 101140, "epoch": 835} {"train_loss": -33.704647064208984, "global_step": 101141, "epoch": 835} {"train_loss": -32.53815460205078, "global_step": 101142, "epoch": 835} {"train_loss": -33.72444534301758, "global_step": 101143, "epoch": 835} {"train_loss": -34.792152404785156, "global_step": 101144, "epoch": 835} {"train_loss": -32.52470016479492, "global_step": 101145, "epoch": 835} {"train_loss": -33.84257125854492, "global_step": 101146, "epoch": 835} {"train_loss": -31.497770309448242, "global_step": 101147, "epoch": 835} {"train_loss": -34.74821090698242, "global_step": 101148, "epoch": 835} {"train_loss": -33.94682693481445, "global_step": 101149, "epoch": 835} {"train_loss": -34.58575439453125, "global_step": 101150, "epoch": 835} {"train_loss": -34.5281982421875, "global_step": 101151, "epoch": 835} {"train_loss": -34.232784271240234, "global_step": 101152, "epoch": 835} {"train_loss": -34.95547866821289, "global_step": 101153, "epoch": 835} {"train_loss": -35.07778549194336, "global_step": 101154, "epoch": 835} {"train_loss": -34.753430461095384, "global_step": 101155, "epoch": 835, "val_loss": 3098967.75} {"train_loss": -35.76659393310547, "global_step": 101156, "epoch": 836} {"train_loss": -34.8719367980957, "global_step": 101157, "epoch": 836} {"train_loss": -35.14067459106445, "global_step": 101158, "epoch": 836} {"train_loss": -35.626190185546875, "global_step": 101159, "epoch": 836} {"train_loss": -33.51338577270508, "global_step": 101160, "epoch": 836} {"train_loss": -34.07123565673828, "global_step": 101161, "epoch": 836} {"train_loss": -35.817054748535156, "global_step": 101162, "epoch": 836} {"train_loss": -35.21110916137695, "global_step": 101163, "epoch": 836} {"train_loss": -35.56077194213867, "global_step": 101164, "epoch": 836} {"train_loss": -35.12633514404297, "global_step": 101165, "epoch": 836} {"train_loss": -36.05419921875, "global_step": 101166, "epoch": 836} {"train_loss": -35.692745208740234, "global_step": 101167, "epoch": 836} {"train_loss": -35.60294723510742, "global_step": 101168, "epoch": 836} {"train_loss": -35.75654220581055, "global_step": 101169, "epoch": 836} {"train_loss": -35.97603225708008, "global_step": 101170, "epoch": 836} {"train_loss": -35.801334381103516, "global_step": 101171, "epoch": 836} {"train_loss": -35.737892150878906, "global_step": 101172, "epoch": 836} {"train_loss": -35.87521743774414, "global_step": 101173, "epoch": 836} {"train_loss": -36.39858627319336, "global_step": 101174, "epoch": 836} {"train_loss": -35.991790771484375, "global_step": 101175, "epoch": 836} {"train_loss": -36.009029388427734, "global_step": 101176, "epoch": 836} {"train_loss": -36.14686965942383, "global_step": 101177, "epoch": 836} {"train_loss": -35.72428894042969, "global_step": 101178, "epoch": 836} {"train_loss": -35.99201583862305, "global_step": 101179, "epoch": 836} {"train_loss": -36.2065544128418, "global_step": 101180, "epoch": 836} {"train_loss": -36.43375778198242, "global_step": 101181, "epoch": 836} {"train_loss": -36.869441986083984, "global_step": 101182, "epoch": 836} {"train_loss": -36.887672424316406, "global_step": 101183, "epoch": 836} {"train_loss": -36.15327835083008, "global_step": 101184, "epoch": 836} {"train_loss": -36.449337005615234, "global_step": 101185, "epoch": 836} {"train_loss": -35.95445251464844, "global_step": 101186, "epoch": 836} {"train_loss": -36.04441452026367, "global_step": 101187, "epoch": 836} {"train_loss": -36.495140075683594, "global_step": 101188, "epoch": 836} {"train_loss": -36.96246337890625, "global_step": 101189, "epoch": 836} {"train_loss": -37.140655517578125, "global_step": 101190, "epoch": 836} {"train_loss": -36.831993103027344, "global_step": 101191, "epoch": 836} {"train_loss": -36.33384704589844, "global_step": 101192, "epoch": 836} {"train_loss": -36.85477828979492, "global_step": 101193, "epoch": 836} {"train_loss": -36.617706298828125, "global_step": 101194, "epoch": 836} {"train_loss": -36.312583923339844, "global_step": 101195, "epoch": 836} {"train_loss": -36.44029998779297, "global_step": 101196, "epoch": 836} {"train_loss": -35.20571517944336, "global_step": 101197, "epoch": 836} {"train_loss": -35.14973831176758, "global_step": 101198, "epoch": 836} {"train_loss": -36.31795120239258, "global_step": 101199, "epoch": 836} {"train_loss": -37.64997863769531, "global_step": 101200, "epoch": 836} {"train_loss": -35.81371307373047, "global_step": 101201, "epoch": 836} {"train_loss": -35.31219482421875, "global_step": 101202, "epoch": 836} {"train_loss": -37.10519790649414, "global_step": 101203, "epoch": 836} {"train_loss": -37.51250076293945, "global_step": 101204, "epoch": 836} {"train_loss": -36.87241744995117, "global_step": 101205, "epoch": 836} {"train_loss": -37.780025482177734, "global_step": 101206, "epoch": 836} {"train_loss": -37.55146408081055, "global_step": 101207, "epoch": 836} {"train_loss": -36.98130416870117, "global_step": 101208, "epoch": 836} {"train_loss": -37.43413543701172, "global_step": 101209, "epoch": 836} {"train_loss": -37.250308990478516, "global_step": 101210, "epoch": 836} {"train_loss": -37.541934967041016, "global_step": 101211, "epoch": 836} {"train_loss": -37.18231964111328, "global_step": 101212, "epoch": 836} {"train_loss": -37.81016159057617, "global_step": 101213, "epoch": 836} {"train_loss": -37.35160446166992, "global_step": 101214, "epoch": 836} {"train_loss": -37.5383415222168, "global_step": 101215, "epoch": 836} {"train_loss": -37.75685119628906, "global_step": 101216, "epoch": 836} {"train_loss": -37.714698791503906, "global_step": 101217, "epoch": 836} {"train_loss": -37.850311279296875, "global_step": 101218, "epoch": 836} {"train_loss": -37.46056365966797, "global_step": 101219, "epoch": 836} {"train_loss": -38.088687896728516, "global_step": 101220, "epoch": 836} {"train_loss": -37.489410400390625, "global_step": 101221, "epoch": 836} {"train_loss": -37.865814208984375, "global_step": 101222, "epoch": 836} {"train_loss": -38.587486267089844, "global_step": 101223, "epoch": 836} {"train_loss": -38.09847640991211, "global_step": 101224, "epoch": 836} {"train_loss": -38.71953582763672, "global_step": 101225, "epoch": 836} {"train_loss": -38.090511322021484, "global_step": 101226, "epoch": 836} {"train_loss": -37.861968994140625, "global_step": 101227, "epoch": 836} {"train_loss": -38.39641189575195, "global_step": 101228, "epoch": 836} {"train_loss": -37.98710250854492, "global_step": 101229, "epoch": 836} {"train_loss": -37.4099235534668, "global_step": 101230, "epoch": 836} {"train_loss": -38.08012008666992, "global_step": 101231, "epoch": 836} {"train_loss": -37.83427047729492, "global_step": 101232, "epoch": 836} {"train_loss": -37.65855026245117, "global_step": 101233, "epoch": 836} {"train_loss": -36.78541564941406, "global_step": 101234, "epoch": 836} {"train_loss": -35.57423400878906, "global_step": 101235, "epoch": 836} {"train_loss": -29.63593864440918, "global_step": 101236, "epoch": 836} {"train_loss": -18.229808807373047, "global_step": 101237, "epoch": 836} {"train_loss": -30.79607582092285, "global_step": 101238, "epoch": 836} {"train_loss": -32.36244583129883, "global_step": 101239, "epoch": 836} {"train_loss": -31.934473037719727, "global_step": 101240, "epoch": 836} {"train_loss": -31.953943252563477, "global_step": 101241, "epoch": 836} {"train_loss": -32.6489143371582, "global_step": 101242, "epoch": 836} {"train_loss": -33.084571838378906, "global_step": 101243, "epoch": 836} {"train_loss": -36.50242233276367, "global_step": 101244, "epoch": 836} {"train_loss": -33.00980758666992, "global_step": 101245, "epoch": 836} {"train_loss": -33.739288330078125, "global_step": 101246, "epoch": 836} {"train_loss": -36.101112365722656, "global_step": 101247, "epoch": 836} {"train_loss": -31.559843063354492, "global_step": 101248, "epoch": 836} {"train_loss": -36.480743408203125, "global_step": 101249, "epoch": 836} {"train_loss": -33.7133674621582, "global_step": 101250, "epoch": 836} {"train_loss": -34.54908752441406, "global_step": 101251, "epoch": 836} {"train_loss": -32.21151351928711, "global_step": 101252, "epoch": 836} {"train_loss": -32.65827560424805, "global_step": 101253, "epoch": 836} {"train_loss": -33.009525299072266, "global_step": 101254, "epoch": 836} {"train_loss": -32.081825256347656, "global_step": 101255, "epoch": 836} {"train_loss": -35.8835563659668, "global_step": 101256, "epoch": 836} {"train_loss": -32.242916107177734, "global_step": 101257, "epoch": 836} {"train_loss": -35.87754440307617, "global_step": 101258, "epoch": 836} {"train_loss": -35.54345703125, "global_step": 101259, "epoch": 836} {"train_loss": -34.2889289855957, "global_step": 101260, "epoch": 836} {"train_loss": -36.11884307861328, "global_step": 101261, "epoch": 836} {"train_loss": -36.26153564453125, "global_step": 101262, "epoch": 836} {"train_loss": -36.16093826293945, "global_step": 101263, "epoch": 836} {"train_loss": -36.27261734008789, "global_step": 101264, "epoch": 836} {"train_loss": -35.83054733276367, "global_step": 101265, "epoch": 836} {"train_loss": -36.80143356323242, "global_step": 101266, "epoch": 836} {"train_loss": -36.43902587890625, "global_step": 101267, "epoch": 836} {"train_loss": -36.07029342651367, "global_step": 101268, "epoch": 836} {"train_loss": -37.11593246459961, "global_step": 101269, "epoch": 836} {"train_loss": -36.158607482910156, "global_step": 101270, "epoch": 836} {"train_loss": -36.27878952026367, "global_step": 101271, "epoch": 836} {"train_loss": -36.424720764160156, "global_step": 101272, "epoch": 836} {"train_loss": -36.083412170410156, "global_step": 101273, "epoch": 836} {"train_loss": -36.74427032470703, "global_step": 101274, "epoch": 836} {"train_loss": -37.1450080871582, "global_step": 101275, "epoch": 836} {"train_loss": -35.81804995891476, "global_step": 101276, "epoch": 836, "val_loss": 2597939.75} {"train_loss": -37.4481315612793, "global_step": 101277, "epoch": 837} {"train_loss": -37.31081008911133, "global_step": 101278, "epoch": 837} {"train_loss": -37.13361740112305, "global_step": 101279, "epoch": 837} {"train_loss": -37.1921501159668, "global_step": 101280, "epoch": 837} {"train_loss": -37.19950485229492, "global_step": 101281, "epoch": 837} {"train_loss": -37.448516845703125, "global_step": 101282, "epoch": 837} {"train_loss": -37.17025375366211, "global_step": 101283, "epoch": 837} {"train_loss": -37.019046783447266, "global_step": 101284, "epoch": 837} {"train_loss": -37.88447189331055, "global_step": 101285, "epoch": 837} {"train_loss": -37.527767181396484, "global_step": 101286, "epoch": 837} {"train_loss": -37.5353889465332, "global_step": 101287, "epoch": 837} {"train_loss": -36.921295166015625, "global_step": 101288, "epoch": 837} {"train_loss": -37.53980255126953, "global_step": 101289, "epoch": 837} {"train_loss": -37.730770111083984, "global_step": 101290, "epoch": 837} {"train_loss": -37.2922477722168, "global_step": 101291, "epoch": 837} {"train_loss": -37.413455963134766, "global_step": 101292, "epoch": 837} {"train_loss": -37.48145294189453, "global_step": 101293, "epoch": 837} {"train_loss": -37.32912063598633, "global_step": 101294, "epoch": 837} {"train_loss": -37.16463851928711, "global_step": 101295, "epoch": 837} {"train_loss": -35.063777923583984, "global_step": 101296, "epoch": 837} {"train_loss": -26.894071578979492, "global_step": 101297, "epoch": 837} {"train_loss": -1.1375690698623657, "global_step": 101298, "epoch": 837} {"train_loss": -4.2241692543029785, "global_step": 101299, "epoch": 837} {"train_loss": -37.800201416015625, "global_step": 101300, "epoch": 837} {"train_loss": -15.498947143554688, "global_step": 101301, "epoch": 837} {"train_loss": -36.73305892944336, "global_step": 101302, "epoch": 837} {"train_loss": -22.959991455078125, "global_step": 101303, "epoch": 837} {"train_loss": -36.08064651489258, "global_step": 101304, "epoch": 837} {"train_loss": -30.997907638549805, "global_step": 101305, "epoch": 837} {"train_loss": -31.3348331451416, "global_step": 101306, "epoch": 837} {"train_loss": -36.752342224121094, "global_step": 101307, "epoch": 837} {"train_loss": -32.678131103515625, "global_step": 101308, "epoch": 837} {"train_loss": -32.90965270996094, "global_step": 101309, "epoch": 837} {"train_loss": -35.81804656982422, "global_step": 101310, "epoch": 837} {"train_loss": -35.03816223144531, "global_step": 101311, "epoch": 837} {"train_loss": -33.66579818725586, "global_step": 101312, "epoch": 837} {"train_loss": -36.156612396240234, "global_step": 101313, "epoch": 837} {"train_loss": -36.2079963684082, "global_step": 101314, "epoch": 837} {"train_loss": -35.007869720458984, "global_step": 101315, "epoch": 837} {"train_loss": -33.90192794799805, "global_step": 101316, "epoch": 837} {"train_loss": -36.59818649291992, "global_step": 101317, "epoch": 837} {"train_loss": -36.931060791015625, "global_step": 101318, "epoch": 837} {"train_loss": -35.7097053527832, "global_step": 101319, "epoch": 837} {"train_loss": -35.67732620239258, "global_step": 101320, "epoch": 837} {"train_loss": -36.844417572021484, "global_step": 101321, "epoch": 837} {"train_loss": -37.313697814941406, "global_step": 101322, "epoch": 837} {"train_loss": -36.484619140625, "global_step": 101323, "epoch": 837} {"train_loss": -36.337947845458984, "global_step": 101324, "epoch": 837} {"train_loss": -36.53117752075195, "global_step": 101325, "epoch": 837} {"train_loss": -36.79627990722656, "global_step": 101326, "epoch": 837} {"train_loss": -37.1441764831543, "global_step": 101327, "epoch": 837} {"train_loss": -36.841304779052734, "global_step": 101328, "epoch": 837} {"train_loss": -36.695045471191406, "global_step": 101329, "epoch": 837} {"train_loss": -37.354591369628906, "global_step": 101330, "epoch": 837} {"train_loss": -37.43052291870117, "global_step": 101331, "epoch": 837} {"train_loss": -37.35712814331055, "global_step": 101332, "epoch": 837} {"train_loss": -37.651248931884766, "global_step": 101333, "epoch": 837} {"train_loss": -37.342140197753906, "global_step": 101334, "epoch": 837} {"train_loss": -37.692630767822266, "global_step": 101335, "epoch": 837} {"train_loss": -37.828731536865234, "global_step": 101336, "epoch": 837} {"train_loss": -37.459983825683594, "global_step": 101337, "epoch": 837} {"train_loss": -37.4431266784668, "global_step": 101338, "epoch": 837} {"train_loss": -37.75901412963867, "global_step": 101339, "epoch": 837} {"train_loss": -37.015724182128906, "global_step": 101340, "epoch": 837} {"train_loss": -37.61935043334961, "global_step": 101341, "epoch": 837} {"train_loss": -37.4795036315918, "global_step": 101342, "epoch": 837} {"train_loss": -38.01884078979492, "global_step": 101343, "epoch": 837} {"train_loss": -37.477264404296875, "global_step": 101344, "epoch": 837} {"train_loss": -38.12693405151367, "global_step": 101345, "epoch": 837} {"train_loss": -38.18328857421875, "global_step": 101346, "epoch": 837} {"train_loss": -37.764739990234375, "global_step": 101347, "epoch": 837} {"train_loss": -38.107784271240234, "global_step": 101348, "epoch": 837} {"train_loss": -38.133052825927734, "global_step": 101349, "epoch": 837} {"train_loss": -37.8728141784668, "global_step": 101350, "epoch": 837} {"train_loss": -37.2364501953125, "global_step": 101351, "epoch": 837} {"train_loss": -37.72410583496094, "global_step": 101352, "epoch": 837} {"train_loss": -37.694515228271484, "global_step": 101353, "epoch": 837} {"train_loss": -38.29502487182617, "global_step": 101354, "epoch": 837} {"train_loss": -37.25140380859375, "global_step": 101355, "epoch": 837} {"train_loss": -36.762115478515625, "global_step": 101356, "epoch": 837} {"train_loss": -37.39973831176758, "global_step": 101357, "epoch": 837} {"train_loss": -38.323890686035156, "global_step": 101358, "epoch": 837} {"train_loss": -36.5614128112793, "global_step": 101359, "epoch": 837} {"train_loss": -36.92790985107422, "global_step": 101360, "epoch": 837} {"train_loss": -36.501373291015625, "global_step": 101361, "epoch": 837} {"train_loss": -37.15436935424805, "global_step": 101362, "epoch": 837} {"train_loss": -34.997230529785156, "global_step": 101363, "epoch": 837} {"train_loss": -30.38409996032715, "global_step": 101364, "epoch": 837} {"train_loss": -21.916776657104492, "global_step": 101365, "epoch": 837} {"train_loss": -24.964475631713867, "global_step": 101366, "epoch": 837} {"train_loss": -32.689186096191406, "global_step": 101367, "epoch": 837} {"train_loss": -19.95787811279297, "global_step": 101368, "epoch": 837} {"train_loss": -28.1672420501709, "global_step": 101369, "epoch": 837} {"train_loss": -26.99884033203125, "global_step": 101370, "epoch": 837} {"train_loss": -30.170185089111328, "global_step": 101371, "epoch": 837} {"train_loss": -32.61001205444336, "global_step": 101372, "epoch": 837} {"train_loss": -34.08049392700195, "global_step": 101373, "epoch": 837} {"train_loss": -32.51169967651367, "global_step": 101374, "epoch": 837} {"train_loss": -33.8714714050293, "global_step": 101375, "epoch": 837} {"train_loss": -34.879608154296875, "global_step": 101376, "epoch": 837} {"train_loss": -35.03436279296875, "global_step": 101377, "epoch": 837} {"train_loss": -34.34835433959961, "global_step": 101378, "epoch": 837} {"train_loss": -34.71017074584961, "global_step": 101379, "epoch": 837} {"train_loss": -34.704402923583984, "global_step": 101380, "epoch": 837} {"train_loss": -35.14760208129883, "global_step": 101381, "epoch": 837} {"train_loss": -35.087013244628906, "global_step": 101382, "epoch": 837} {"train_loss": -35.377235412597656, "global_step": 101383, "epoch": 837} {"train_loss": -35.76142501831055, "global_step": 101384, "epoch": 837} {"train_loss": -34.57927322387695, "global_step": 101385, "epoch": 837} {"train_loss": -34.036224365234375, "global_step": 101386, "epoch": 837} {"train_loss": -35.23639678955078, "global_step": 101387, "epoch": 837} {"train_loss": -35.01771926879883, "global_step": 101388, "epoch": 837} {"train_loss": -36.441158294677734, "global_step": 101389, "epoch": 837} {"train_loss": -35.86550521850586, "global_step": 101390, "epoch": 837} {"train_loss": -35.87769317626953, "global_step": 101391, "epoch": 837} {"train_loss": -35.39535140991211, "global_step": 101392, "epoch": 837} {"train_loss": -35.9174919128418, "global_step": 101393, "epoch": 837} {"train_loss": -36.15427780151367, "global_step": 101394, "epoch": 837} {"train_loss": -36.35759353637695, "global_step": 101395, "epoch": 837} {"train_loss": -35.91660690307617, "global_step": 101396, "epoch": 837} {"train_loss": -34.81638506522849, "global_step": 101397, "epoch": 837, "val_loss": 2593323.25} {"train_loss": -36.550819396972656, "global_step": 101398, "epoch": 838} {"train_loss": -36.3447265625, "global_step": 101399, "epoch": 838} {"train_loss": -36.250755310058594, "global_step": 101400, "epoch": 838} {"train_loss": -36.4581413269043, "global_step": 101401, "epoch": 838} {"train_loss": -36.55280685424805, "global_step": 101402, "epoch": 838} {"train_loss": -36.388301849365234, "global_step": 101403, "epoch": 838} {"train_loss": -36.48431396484375, "global_step": 101404, "epoch": 838} {"train_loss": -36.43715286254883, "global_step": 101405, "epoch": 838} {"train_loss": -36.7191276550293, "global_step": 101406, "epoch": 838} {"train_loss": -36.626522064208984, "global_step": 101407, "epoch": 838} {"train_loss": -36.932857513427734, "global_step": 101408, "epoch": 838} {"train_loss": -37.22255325317383, "global_step": 101409, "epoch": 838} {"train_loss": -36.97201156616211, "global_step": 101410, "epoch": 838} {"train_loss": -36.96613693237305, "global_step": 101411, "epoch": 838} {"train_loss": -37.13545608520508, "global_step": 101412, "epoch": 838} {"train_loss": -37.18162155151367, "global_step": 101413, "epoch": 838} {"train_loss": -37.01048278808594, "global_step": 101414, "epoch": 838} {"train_loss": -37.332767486572266, "global_step": 101415, "epoch": 838} {"train_loss": -37.03710174560547, "global_step": 101416, "epoch": 838} {"train_loss": -37.006141662597656, "global_step": 101417, "epoch": 838} {"train_loss": -36.960201263427734, "global_step": 101418, "epoch": 838} {"train_loss": -37.191932678222656, "global_step": 101419, "epoch": 838} {"train_loss": -37.29575729370117, "global_step": 101420, "epoch": 838} {"train_loss": -37.53617477416992, "global_step": 101421, "epoch": 838} {"train_loss": -37.79520797729492, "global_step": 101422, "epoch": 838} {"train_loss": -35.59245300292969, "global_step": 101423, "epoch": 838} {"train_loss": -37.722713470458984, "global_step": 101424, "epoch": 838} {"train_loss": -37.31345748901367, "global_step": 101425, "epoch": 838} {"train_loss": -37.14784622192383, "global_step": 101426, "epoch": 838} {"train_loss": -37.04852294921875, "global_step": 101427, "epoch": 838} {"train_loss": -37.37696075439453, "global_step": 101428, "epoch": 838} {"train_loss": -37.555904388427734, "global_step": 101429, "epoch": 838} {"train_loss": -37.754974365234375, "global_step": 101430, "epoch": 838} {"train_loss": -37.082984924316406, "global_step": 101431, "epoch": 838} {"train_loss": -37.88203430175781, "global_step": 101432, "epoch": 838} {"train_loss": -37.36874771118164, "global_step": 101433, "epoch": 838} {"train_loss": -37.74671173095703, "global_step": 101434, "epoch": 838} {"train_loss": -37.241676330566406, "global_step": 101435, "epoch": 838} {"train_loss": -37.76654815673828, "global_step": 101436, "epoch": 838} {"train_loss": -37.90530014038086, "global_step": 101437, "epoch": 838} {"train_loss": -37.666378021240234, "global_step": 101438, "epoch": 838} {"train_loss": -37.148475646972656, "global_step": 101439, "epoch": 838} {"train_loss": -37.61233901977539, "global_step": 101440, "epoch": 838} {"train_loss": -37.677120208740234, "global_step": 101441, "epoch": 838} {"train_loss": -37.477169036865234, "global_step": 101442, "epoch": 838} {"train_loss": -37.887367248535156, "global_step": 101443, "epoch": 838} {"train_loss": -38.062095642089844, "global_step": 101444, "epoch": 838} {"train_loss": -37.97536849975586, "global_step": 101445, "epoch": 838} {"train_loss": -37.782371520996094, "global_step": 101446, "epoch": 838} {"train_loss": -38.56110382080078, "global_step": 101447, "epoch": 838} {"train_loss": -38.04645919799805, "global_step": 101448, "epoch": 838} {"train_loss": -37.66814041137695, "global_step": 101449, "epoch": 838} {"train_loss": -36.0428466796875, "global_step": 101450, "epoch": 838} {"train_loss": -32.921905517578125, "global_step": 101451, "epoch": 838} {"train_loss": -25.53452491760254, "global_step": 101452, "epoch": 838} {"train_loss": -30.84228515625, "global_step": 101453, "epoch": 838} {"train_loss": -35.75779342651367, "global_step": 101454, "epoch": 838} {"train_loss": -26.6221866607666, "global_step": 101455, "epoch": 838} {"train_loss": -35.50736618041992, "global_step": 101456, "epoch": 838} {"train_loss": -32.30982208251953, "global_step": 101457, "epoch": 838} {"train_loss": -34.961673736572266, "global_step": 101458, "epoch": 838} {"train_loss": -34.087215423583984, "global_step": 101459, "epoch": 838} {"train_loss": -35.26545333862305, "global_step": 101460, "epoch": 838} {"train_loss": -34.407249450683594, "global_step": 101461, "epoch": 838} {"train_loss": -35.15375900268555, "global_step": 101462, "epoch": 838} {"train_loss": -34.723575592041016, "global_step": 101463, "epoch": 838} {"train_loss": -36.2707633972168, "global_step": 101464, "epoch": 838} {"train_loss": -35.29342269897461, "global_step": 101465, "epoch": 838} {"train_loss": -35.53657913208008, "global_step": 101466, "epoch": 838} {"train_loss": -35.697879791259766, "global_step": 101467, "epoch": 838} {"train_loss": -32.97136306762695, "global_step": 101468, "epoch": 838} {"train_loss": -36.3479118347168, "global_step": 101469, "epoch": 838} {"train_loss": -34.85162353515625, "global_step": 101470, "epoch": 838} {"train_loss": -35.29692459106445, "global_step": 101471, "epoch": 838} {"train_loss": -35.65334701538086, "global_step": 101472, "epoch": 838} {"train_loss": -35.39772415161133, "global_step": 101473, "epoch": 838} {"train_loss": -35.6541862487793, "global_step": 101474, "epoch": 838} {"train_loss": -36.4588623046875, "global_step": 101475, "epoch": 838} {"train_loss": -36.348079681396484, "global_step": 101476, "epoch": 838} {"train_loss": -36.479469299316406, "global_step": 101477, "epoch": 838} {"train_loss": -36.73637390136719, "global_step": 101478, "epoch": 838} {"train_loss": -36.920310974121094, "global_step": 101479, "epoch": 838} {"train_loss": -36.782257080078125, "global_step": 101480, "epoch": 838} {"train_loss": -37.39130783081055, "global_step": 101481, "epoch": 838} {"train_loss": -36.73320388793945, "global_step": 101482, "epoch": 838} {"train_loss": -36.99824523925781, "global_step": 101483, "epoch": 838} {"train_loss": -37.1871452331543, "global_step": 101484, "epoch": 838} {"train_loss": -37.481292724609375, "global_step": 101485, "epoch": 838} {"train_loss": -37.38125228881836, "global_step": 101486, "epoch": 838} {"train_loss": -37.91133499145508, "global_step": 101487, "epoch": 838} {"train_loss": -37.94504928588867, "global_step": 101488, "epoch": 838} {"train_loss": -37.327880859375, "global_step": 101489, "epoch": 838} {"train_loss": -37.63623809814453, "global_step": 101490, "epoch": 838} {"train_loss": -37.2185173034668, "global_step": 101491, "epoch": 838} {"train_loss": -37.40964889526367, "global_step": 101492, "epoch": 838} {"train_loss": -37.30546569824219, "global_step": 101493, "epoch": 838} {"train_loss": -37.55542755126953, "global_step": 101494, "epoch": 838} {"train_loss": -38.28462600708008, "global_step": 101495, "epoch": 838} {"train_loss": -37.082149505615234, "global_step": 101496, "epoch": 838} {"train_loss": -37.78890609741211, "global_step": 101497, "epoch": 838} {"train_loss": -37.99577713012695, "global_step": 101498, "epoch": 838} {"train_loss": -37.86200714111328, "global_step": 101499, "epoch": 838} {"train_loss": -38.06673812866211, "global_step": 101500, "epoch": 838} {"train_loss": -37.83671188354492, "global_step": 101501, "epoch": 838} {"train_loss": -37.84444046020508, "global_step": 101502, "epoch": 838} {"train_loss": -38.184051513671875, "global_step": 101503, "epoch": 838} {"train_loss": -37.71710205078125, "global_step": 101504, "epoch": 838} {"train_loss": -37.77954864501953, "global_step": 101505, "epoch": 838} {"train_loss": -38.020606994628906, "global_step": 101506, "epoch": 838} {"train_loss": -37.99605178833008, "global_step": 101507, "epoch": 838} {"train_loss": -38.17765426635742, "global_step": 101508, "epoch": 838} {"train_loss": -38.012699127197266, "global_step": 101509, "epoch": 838} {"train_loss": -37.95188522338867, "global_step": 101510, "epoch": 838} {"train_loss": -37.84603500366211, "global_step": 101511, "epoch": 838} {"train_loss": -38.393131256103516, "global_step": 101512, "epoch": 838} {"train_loss": -38.42473602294922, "global_step": 101513, "epoch": 838} {"train_loss": -38.15546798706055, "global_step": 101514, "epoch": 838} {"train_loss": -38.72569274902344, "global_step": 101515, "epoch": 838} {"train_loss": -38.6368293762207, "global_step": 101516, "epoch": 838} {"train_loss": -38.27376174926758, "global_step": 101517, "epoch": 838} {"train_loss": -36.74619882757013, "global_step": 101518, "epoch": 838, "val_loss": 2645092.0} {"train_loss": -38.654293060302734, "global_step": 101519, "epoch": 839} {"train_loss": -38.41750717163086, "global_step": 101520, "epoch": 839} {"train_loss": -38.418975830078125, "global_step": 101521, "epoch": 839} {"train_loss": -38.564605712890625, "global_step": 101522, "epoch": 839} {"train_loss": -38.543678283691406, "global_step": 101523, "epoch": 839} {"train_loss": -38.4066276550293, "global_step": 101524, "epoch": 839} {"train_loss": -38.33781051635742, "global_step": 101525, "epoch": 839} {"train_loss": -38.63664245605469, "global_step": 101526, "epoch": 839} {"train_loss": -38.73916244506836, "global_step": 101527, "epoch": 839} {"train_loss": -38.39083480834961, "global_step": 101528, "epoch": 839} {"train_loss": -38.38008499145508, "global_step": 101529, "epoch": 839} {"train_loss": -38.8573112487793, "global_step": 101530, "epoch": 839} {"train_loss": -38.65262985229492, "global_step": 101531, "epoch": 839} {"train_loss": -38.79136276245117, "global_step": 101532, "epoch": 839} {"train_loss": -39.03591537475586, "global_step": 101533, "epoch": 839} {"train_loss": -38.914119720458984, "global_step": 101534, "epoch": 839} {"train_loss": -38.26042938232422, "global_step": 101535, "epoch": 839} {"train_loss": -38.06365203857422, "global_step": 101536, "epoch": 839} {"train_loss": -38.0074348449707, "global_step": 101537, "epoch": 839} {"train_loss": -38.22802734375, "global_step": 101538, "epoch": 839} {"train_loss": -38.37283706665039, "global_step": 101539, "epoch": 839} {"train_loss": -38.18636703491211, "global_step": 101540, "epoch": 839} {"train_loss": -38.362525939941406, "global_step": 101541, "epoch": 839} {"train_loss": -38.347713470458984, "global_step": 101542, "epoch": 839} {"train_loss": -37.69269561767578, "global_step": 101543, "epoch": 839} {"train_loss": -37.56289291381836, "global_step": 101544, "epoch": 839} {"train_loss": -38.661739349365234, "global_step": 101545, "epoch": 839} {"train_loss": -37.338829040527344, "global_step": 101546, "epoch": 839} {"train_loss": -37.1428337097168, "global_step": 101547, "epoch": 839} {"train_loss": -37.59521484375, "global_step": 101548, "epoch": 839} {"train_loss": -38.530208587646484, "global_step": 101549, "epoch": 839} {"train_loss": -38.49491500854492, "global_step": 101550, "epoch": 839} {"train_loss": -37.947044372558594, "global_step": 101551, "epoch": 839} {"train_loss": -38.53779602050781, "global_step": 101552, "epoch": 839} {"train_loss": -38.27408981323242, "global_step": 101553, "epoch": 839} {"train_loss": -37.78852081298828, "global_step": 101554, "epoch": 839} {"train_loss": -38.23250961303711, "global_step": 101555, "epoch": 839} {"train_loss": -36.016578674316406, "global_step": 101556, "epoch": 839} {"train_loss": -33.12302780151367, "global_step": 101557, "epoch": 839} {"train_loss": -32.891021728515625, "global_step": 101558, "epoch": 839} {"train_loss": -32.380409240722656, "global_step": 101559, "epoch": 839} {"train_loss": -35.22141647338867, "global_step": 101560, "epoch": 839} {"train_loss": -37.980403900146484, "global_step": 101561, "epoch": 839} {"train_loss": -33.8615837097168, "global_step": 101562, "epoch": 839} {"train_loss": -31.662988662719727, "global_step": 101563, "epoch": 839} {"train_loss": -34.860015869140625, "global_step": 101564, "epoch": 839} {"train_loss": -37.84501266479492, "global_step": 101565, "epoch": 839} {"train_loss": -35.615604400634766, "global_step": 101566, "epoch": 839} {"train_loss": -36.99288558959961, "global_step": 101567, "epoch": 839} {"train_loss": -37.02335739135742, "global_step": 101568, "epoch": 839} {"train_loss": -37.05241012573242, "global_step": 101569, "epoch": 839} {"train_loss": -36.77524948120117, "global_step": 101570, "epoch": 839} {"train_loss": -36.828060150146484, "global_step": 101571, "epoch": 839} {"train_loss": -36.14455032348633, "global_step": 101572, "epoch": 839} {"train_loss": -35.93703842163086, "global_step": 101573, "epoch": 839} {"train_loss": -37.06166458129883, "global_step": 101574, "epoch": 839} {"train_loss": -37.831886291503906, "global_step": 101575, "epoch": 839} {"train_loss": -36.885009765625, "global_step": 101576, "epoch": 839} {"train_loss": -36.77954864501953, "global_step": 101577, "epoch": 839} {"train_loss": -37.650238037109375, "global_step": 101578, "epoch": 839} {"train_loss": -37.683990478515625, "global_step": 101579, "epoch": 839} {"train_loss": -36.55269241333008, "global_step": 101580, "epoch": 839} {"train_loss": -37.11991500854492, "global_step": 101581, "epoch": 839} {"train_loss": -37.13778305053711, "global_step": 101582, "epoch": 839} {"train_loss": -37.61887741088867, "global_step": 101583, "epoch": 839} {"train_loss": -38.226863861083984, "global_step": 101584, "epoch": 839} {"train_loss": -38.02671432495117, "global_step": 101585, "epoch": 839} {"train_loss": -37.428802490234375, "global_step": 101586, "epoch": 839} {"train_loss": -37.740840911865234, "global_step": 101587, "epoch": 839} {"train_loss": -37.317745208740234, "global_step": 101588, "epoch": 839} {"train_loss": -37.51743698120117, "global_step": 101589, "epoch": 839} {"train_loss": -37.404884338378906, "global_step": 101590, "epoch": 839} {"train_loss": -37.90638732910156, "global_step": 101591, "epoch": 839} {"train_loss": -37.58213806152344, "global_step": 101592, "epoch": 839} {"train_loss": -36.88924789428711, "global_step": 101593, "epoch": 839} {"train_loss": -37.230873107910156, "global_step": 101594, "epoch": 839} {"train_loss": -38.09403610229492, "global_step": 101595, "epoch": 839} {"train_loss": -36.386451721191406, "global_step": 101596, "epoch": 839} {"train_loss": -37.1242561340332, "global_step": 101597, "epoch": 839} {"train_loss": -37.06838607788086, "global_step": 101598, "epoch": 839} {"train_loss": -37.510711669921875, "global_step": 101599, "epoch": 839} {"train_loss": -36.96128463745117, "global_step": 101600, "epoch": 839} {"train_loss": -35.90396499633789, "global_step": 101601, "epoch": 839} {"train_loss": -37.25465774536133, "global_step": 101602, "epoch": 839} {"train_loss": -36.152462005615234, "global_step": 101603, "epoch": 839} {"train_loss": -37.21285629272461, "global_step": 101604, "epoch": 839} {"train_loss": -35.45966720581055, "global_step": 101605, "epoch": 839} {"train_loss": -36.72602081298828, "global_step": 101606, "epoch": 839} {"train_loss": -37.916900634765625, "global_step": 101607, "epoch": 839} {"train_loss": -37.90106201171875, "global_step": 101608, "epoch": 839} {"train_loss": -36.91072082519531, "global_step": 101609, "epoch": 839} {"train_loss": -36.72915267944336, "global_step": 101610, "epoch": 839} {"train_loss": -36.76661682128906, "global_step": 101611, "epoch": 839} {"train_loss": -35.28465270996094, "global_step": 101612, "epoch": 839} {"train_loss": -37.700931549072266, "global_step": 101613, "epoch": 839} {"train_loss": -37.39461898803711, "global_step": 101614, "epoch": 839} {"train_loss": -37.450111389160156, "global_step": 101615, "epoch": 839} {"train_loss": -35.82320022583008, "global_step": 101616, "epoch": 839} {"train_loss": -37.20589828491211, "global_step": 101617, "epoch": 839} {"train_loss": -36.93471145629883, "global_step": 101618, "epoch": 839} {"train_loss": -34.80064010620117, "global_step": 101619, "epoch": 839} {"train_loss": -37.290199279785156, "global_step": 101620, "epoch": 839} {"train_loss": -35.75916290283203, "global_step": 101621, "epoch": 839} {"train_loss": -37.350746154785156, "global_step": 101622, "epoch": 839} {"train_loss": -37.74723434448242, "global_step": 101623, "epoch": 839} {"train_loss": -36.60988235473633, "global_step": 101624, "epoch": 839} {"train_loss": -37.35856246948242, "global_step": 101625, "epoch": 839} {"train_loss": -36.53180694580078, "global_step": 101626, "epoch": 839} {"train_loss": -36.899715423583984, "global_step": 101627, "epoch": 839} {"train_loss": -37.2219352722168, "global_step": 101628, "epoch": 839} {"train_loss": -37.4453125, "global_step": 101629, "epoch": 839} {"train_loss": -37.7969970703125, "global_step": 101630, "epoch": 839} {"train_loss": -36.7248420715332, "global_step": 101631, "epoch": 839} {"train_loss": -35.72553634643555, "global_step": 101632, "epoch": 839} {"train_loss": -37.344730377197266, "global_step": 101633, "epoch": 839} {"train_loss": -36.78937911987305, "global_step": 101634, "epoch": 839} {"train_loss": -36.818538665771484, "global_step": 101635, "epoch": 839} {"train_loss": -37.03839111328125, "global_step": 101636, "epoch": 839} {"train_loss": -37.2564811706543, "global_step": 101637, "epoch": 839} {"train_loss": -36.69390106201172, "global_step": 101638, "epoch": 839} {"train_loss": -37.20103361586894, "global_step": 101639, "epoch": 839, "val_loss": 2635296.75} {"train_loss": -37.77804183959961, "global_step": 101640, "epoch": 840} {"train_loss": -37.89479064941406, "global_step": 101641, "epoch": 840} {"train_loss": -37.51839065551758, "global_step": 101642, "epoch": 840} {"train_loss": -36.94965362548828, "global_step": 101643, "epoch": 840} {"train_loss": -36.944801330566406, "global_step": 101644, "epoch": 840} {"train_loss": -37.9107551574707, "global_step": 101645, "epoch": 840} {"train_loss": -37.25044631958008, "global_step": 101646, "epoch": 840} {"train_loss": -37.11073684692383, "global_step": 101647, "epoch": 840} {"train_loss": -37.247100830078125, "global_step": 101648, "epoch": 840} {"train_loss": -37.42713165283203, "global_step": 101649, "epoch": 840} {"train_loss": -36.83796310424805, "global_step": 101650, "epoch": 840} {"train_loss": -35.38928985595703, "global_step": 101651, "epoch": 840} {"train_loss": -32.41878890991211, "global_step": 101652, "epoch": 840} {"train_loss": -37.13092041015625, "global_step": 101653, "epoch": 840} {"train_loss": -37.09197998046875, "global_step": 101654, "epoch": 840} {"train_loss": -36.23293685913086, "global_step": 101655, "epoch": 840} {"train_loss": -37.272666931152344, "global_step": 101656, "epoch": 840} {"train_loss": -36.72835922241211, "global_step": 101657, "epoch": 840} {"train_loss": -36.91685104370117, "global_step": 101658, "epoch": 840} {"train_loss": -37.041748046875, "global_step": 101659, "epoch": 840} {"train_loss": -36.328739166259766, "global_step": 101660, "epoch": 840} {"train_loss": -36.356597900390625, "global_step": 101661, "epoch": 840} {"train_loss": -36.71589279174805, "global_step": 101662, "epoch": 840} {"train_loss": -36.40032958984375, "global_step": 101663, "epoch": 840} {"train_loss": -37.75612258911133, "global_step": 101664, "epoch": 840} {"train_loss": -37.49656677246094, "global_step": 101665, "epoch": 840} {"train_loss": -37.4411735534668, "global_step": 101666, "epoch": 840} {"train_loss": -37.558013916015625, "global_step": 101667, "epoch": 840} {"train_loss": -38.16957473754883, "global_step": 101668, "epoch": 840} {"train_loss": -36.5587043762207, "global_step": 101669, "epoch": 840} {"train_loss": -36.733360290527344, "global_step": 101670, "epoch": 840} {"train_loss": -38.23383712768555, "global_step": 101671, "epoch": 840} {"train_loss": -38.01070022583008, "global_step": 101672, "epoch": 840} {"train_loss": -36.524024963378906, "global_step": 101673, "epoch": 840} {"train_loss": -37.36538314819336, "global_step": 101674, "epoch": 840} {"train_loss": -37.51708984375, "global_step": 101675, "epoch": 840} {"train_loss": -37.001220703125, "global_step": 101676, "epoch": 840} {"train_loss": -37.667015075683594, "global_step": 101677, "epoch": 840} {"train_loss": -36.61351013183594, "global_step": 101678, "epoch": 840} {"train_loss": -37.88417434692383, "global_step": 101679, "epoch": 840} {"train_loss": -37.307701110839844, "global_step": 101680, "epoch": 840} {"train_loss": -37.184322357177734, "global_step": 101681, "epoch": 840} {"train_loss": -36.11466979980469, "global_step": 101682, "epoch": 840} {"train_loss": -37.28116226196289, "global_step": 101683, "epoch": 840} {"train_loss": -36.967811584472656, "global_step": 101684, "epoch": 840} {"train_loss": -36.47217559814453, "global_step": 101685, "epoch": 840} {"train_loss": -36.99326705932617, "global_step": 101686, "epoch": 840} {"train_loss": -37.24184036254883, "global_step": 101687, "epoch": 840} {"train_loss": -36.01927947998047, "global_step": 101688, "epoch": 840} {"train_loss": -36.82032012939453, "global_step": 101689, "epoch": 840} {"train_loss": -37.67521286010742, "global_step": 101690, "epoch": 840} {"train_loss": -36.985599517822266, "global_step": 101691, "epoch": 840} {"train_loss": -36.54591751098633, "global_step": 101692, "epoch": 840} {"train_loss": -36.00634765625, "global_step": 101693, "epoch": 840} {"train_loss": -36.511146545410156, "global_step": 101694, "epoch": 840} {"train_loss": -33.44184112548828, "global_step": 101695, "epoch": 840} {"train_loss": -36.3308219909668, "global_step": 101696, "epoch": 840} {"train_loss": -35.79974365234375, "global_step": 101697, "epoch": 840} {"train_loss": -37.68118667602539, "global_step": 101698, "epoch": 840} {"train_loss": -37.17896270751953, "global_step": 101699, "epoch": 840} {"train_loss": -36.48338317871094, "global_step": 101700, "epoch": 840} {"train_loss": -37.58927536010742, "global_step": 101701, "epoch": 840} {"train_loss": -37.81474685668945, "global_step": 101702, "epoch": 840} {"train_loss": -37.22275924682617, "global_step": 101703, "epoch": 840} {"train_loss": -37.53106689453125, "global_step": 101704, "epoch": 840} {"train_loss": -37.50682067871094, "global_step": 101705, "epoch": 840} {"train_loss": -35.925559997558594, "global_step": 101706, "epoch": 840} {"train_loss": -37.23026657104492, "global_step": 101707, "epoch": 840} {"train_loss": -36.80205535888672, "global_step": 101708, "epoch": 840} {"train_loss": -30.18218994140625, "global_step": 101709, "epoch": 840} {"train_loss": -36.99094009399414, "global_step": 101710, "epoch": 840} {"train_loss": -37.548274993896484, "global_step": 101711, "epoch": 840} {"train_loss": -36.677040100097656, "global_step": 101712, "epoch": 840} {"train_loss": -37.29033279418945, "global_step": 101713, "epoch": 840} {"train_loss": -37.57890701293945, "global_step": 101714, "epoch": 840} {"train_loss": -35.69327926635742, "global_step": 101715, "epoch": 840} {"train_loss": -37.6624755859375, "global_step": 101716, "epoch": 840} {"train_loss": -37.550540924072266, "global_step": 101717, "epoch": 840} {"train_loss": -37.5437126159668, "global_step": 101718, "epoch": 840} {"train_loss": -37.46173095703125, "global_step": 101719, "epoch": 840} {"train_loss": -36.51457595825195, "global_step": 101720, "epoch": 840} {"train_loss": -34.47773361206055, "global_step": 101721, "epoch": 840} {"train_loss": -34.70976638793945, "global_step": 101722, "epoch": 840} {"train_loss": -37.745277404785156, "global_step": 101723, "epoch": 840} {"train_loss": -36.110652923583984, "global_step": 101724, "epoch": 840} {"train_loss": -37.057159423828125, "global_step": 101725, "epoch": 840} {"train_loss": -36.369384765625, "global_step": 101726, "epoch": 840} {"train_loss": -37.51646041870117, "global_step": 101727, "epoch": 840} {"train_loss": -37.74154281616211, "global_step": 101728, "epoch": 840} {"train_loss": -28.948698043823242, "global_step": 101729, "epoch": 840} {"train_loss": -36.60263442993164, "global_step": 101730, "epoch": 840} {"train_loss": -37.48138427734375, "global_step": 101731, "epoch": 840} {"train_loss": -38.174373626708984, "global_step": 101732, "epoch": 840} {"train_loss": -35.88186264038086, "global_step": 101733, "epoch": 840} {"train_loss": -36.74312973022461, "global_step": 101734, "epoch": 840} {"train_loss": -32.41871643066406, "global_step": 101735, "epoch": 840} {"train_loss": -34.629207611083984, "global_step": 101736, "epoch": 840} {"train_loss": -36.516822814941406, "global_step": 101737, "epoch": 840} {"train_loss": -36.332359313964844, "global_step": 101738, "epoch": 840} {"train_loss": -36.634883880615234, "global_step": 101739, "epoch": 840} {"train_loss": -34.7945442199707, "global_step": 101740, "epoch": 840} {"train_loss": -36.75941848754883, "global_step": 101741, "epoch": 840} {"train_loss": -33.86417007446289, "global_step": 101742, "epoch": 840} {"train_loss": -33.346248626708984, "global_step": 101743, "epoch": 840} {"train_loss": -36.004920959472656, "global_step": 101744, "epoch": 840} {"train_loss": -36.38136291503906, "global_step": 101745, "epoch": 840} {"train_loss": -35.89656448364258, "global_step": 101746, "epoch": 840} {"train_loss": -36.70834732055664, "global_step": 101747, "epoch": 840} {"train_loss": -33.471588134765625, "global_step": 101748, "epoch": 840} {"train_loss": -36.2573127746582, "global_step": 101749, "epoch": 840} {"train_loss": -36.70592498779297, "global_step": 101750, "epoch": 840} {"train_loss": -37.233036041259766, "global_step": 101751, "epoch": 840} {"train_loss": -37.3879280090332, "global_step": 101752, "epoch": 840} {"train_loss": -37.00661087036133, "global_step": 101753, "epoch": 840} {"train_loss": -36.8504753112793, "global_step": 101754, "epoch": 840} {"train_loss": -36.75395202636719, "global_step": 101755, "epoch": 840} {"train_loss": -35.603878021240234, "global_step": 101756, "epoch": 840} {"train_loss": -36.80902099609375, "global_step": 101757, "epoch": 840} {"train_loss": -36.326473236083984, "global_step": 101758, "epoch": 840} {"train_loss": -36.905399322509766, "global_step": 101759, "epoch": 840} {"train_loss": -36.58269401424187, "global_step": 101760, "epoch": 840, "val_loss": 2685216.75} {"train_loss": -37.39431381225586, "global_step": 101761, "epoch": 841} {"train_loss": -37.1208381652832, "global_step": 101762, "epoch": 841} {"train_loss": -37.36481857299805, "global_step": 101763, "epoch": 841} {"train_loss": -36.81533432006836, "global_step": 101764, "epoch": 841} {"train_loss": -37.7861213684082, "global_step": 101765, "epoch": 841} {"train_loss": -36.17805099487305, "global_step": 101766, "epoch": 841} {"train_loss": -37.8859977722168, "global_step": 101767, "epoch": 841} {"train_loss": -37.53841018676758, "global_step": 101768, "epoch": 841} {"train_loss": -37.220069885253906, "global_step": 101769, "epoch": 841} {"train_loss": -37.64320755004883, "global_step": 101770, "epoch": 841} {"train_loss": -36.93674850463867, "global_step": 101771, "epoch": 841} {"train_loss": -36.92890167236328, "global_step": 101772, "epoch": 841} {"train_loss": -37.664039611816406, "global_step": 101773, "epoch": 841} {"train_loss": -37.85515594482422, "global_step": 101774, "epoch": 841} {"train_loss": -36.867061614990234, "global_step": 101775, "epoch": 841} {"train_loss": -36.32056427001953, "global_step": 101776, "epoch": 841} {"train_loss": -37.6256103515625, "global_step": 101777, "epoch": 841} {"train_loss": -37.15761184692383, "global_step": 101778, "epoch": 841} {"train_loss": -37.81100845336914, "global_step": 101779, "epoch": 841} {"train_loss": -37.32539749145508, "global_step": 101780, "epoch": 841} {"train_loss": -37.78988265991211, "global_step": 101781, "epoch": 841} {"train_loss": -37.57524490356445, "global_step": 101782, "epoch": 841} {"train_loss": -38.059627532958984, "global_step": 101783, "epoch": 841} {"train_loss": -37.36945343017578, "global_step": 101784, "epoch": 841} {"train_loss": -37.18406677246094, "global_step": 101785, "epoch": 841} {"train_loss": -37.991329193115234, "global_step": 101786, "epoch": 841} {"train_loss": -37.34908676147461, "global_step": 101787, "epoch": 841} {"train_loss": -37.89024353027344, "global_step": 101788, "epoch": 841} {"train_loss": -38.055946350097656, "global_step": 101789, "epoch": 841} {"train_loss": -38.153778076171875, "global_step": 101790, "epoch": 841} {"train_loss": -38.42391586303711, "global_step": 101791, "epoch": 841} {"train_loss": -38.25580978393555, "global_step": 101792, "epoch": 841} {"train_loss": -38.12929153442383, "global_step": 101793, "epoch": 841} {"train_loss": -37.330989837646484, "global_step": 101794, "epoch": 841} {"train_loss": -38.30622100830078, "global_step": 101795, "epoch": 841} {"train_loss": -38.13262939453125, "global_step": 101796, "epoch": 841} {"train_loss": -37.56752395629883, "global_step": 101797, "epoch": 841} {"train_loss": -37.74787521362305, "global_step": 101798, "epoch": 841} {"train_loss": -38.10449981689453, "global_step": 101799, "epoch": 841} {"train_loss": -38.43806838989258, "global_step": 101800, "epoch": 841} {"train_loss": -38.25404739379883, "global_step": 101801, "epoch": 841} {"train_loss": -38.46181869506836, "global_step": 101802, "epoch": 841} {"train_loss": -38.113311767578125, "global_step": 101803, "epoch": 841} {"train_loss": -36.26113510131836, "global_step": 101804, "epoch": 841} {"train_loss": -34.29137420654297, "global_step": 101805, "epoch": 841} {"train_loss": -32.57426834106445, "global_step": 101806, "epoch": 841} {"train_loss": -33.99445343017578, "global_step": 101807, "epoch": 841} {"train_loss": -37.15754318237305, "global_step": 101808, "epoch": 841} {"train_loss": -37.1728630065918, "global_step": 101809, "epoch": 841} {"train_loss": -32.371150970458984, "global_step": 101810, "epoch": 841} {"train_loss": -36.6417236328125, "global_step": 101811, "epoch": 841} {"train_loss": -37.85372543334961, "global_step": 101812, "epoch": 841} {"train_loss": -33.330116271972656, "global_step": 101813, "epoch": 841} {"train_loss": -37.85150146484375, "global_step": 101814, "epoch": 841} {"train_loss": -36.37398147583008, "global_step": 101815, "epoch": 841} {"train_loss": -36.145809173583984, "global_step": 101816, "epoch": 841} {"train_loss": -37.31543731689453, "global_step": 101817, "epoch": 841} {"train_loss": -35.9821662902832, "global_step": 101818, "epoch": 841} {"train_loss": -37.53644561767578, "global_step": 101819, "epoch": 841} {"train_loss": -36.396888732910156, "global_step": 101820, "epoch": 841} {"train_loss": -36.55350875854492, "global_step": 101821, "epoch": 841} {"train_loss": -37.16667175292969, "global_step": 101822, "epoch": 841} {"train_loss": -37.002140045166016, "global_step": 101823, "epoch": 841} {"train_loss": -38.07494354248047, "global_step": 101824, "epoch": 841} {"train_loss": -37.36063766479492, "global_step": 101825, "epoch": 841} {"train_loss": -37.381256103515625, "global_step": 101826, "epoch": 841} {"train_loss": -37.00974655151367, "global_step": 101827, "epoch": 841} {"train_loss": -37.17802810668945, "global_step": 101828, "epoch": 841} {"train_loss": -37.01322555541992, "global_step": 101829, "epoch": 841} {"train_loss": -36.69964599609375, "global_step": 101830, "epoch": 841} {"train_loss": -37.074092864990234, "global_step": 101831, "epoch": 841} {"train_loss": -35.1568717956543, "global_step": 101832, "epoch": 841} {"train_loss": -36.41997146606445, "global_step": 101833, "epoch": 841} {"train_loss": -33.4202995300293, "global_step": 101834, "epoch": 841} {"train_loss": -35.42264938354492, "global_step": 101835, "epoch": 841} {"train_loss": -35.537322998046875, "global_step": 101836, "epoch": 841} {"train_loss": -37.3221549987793, "global_step": 101837, "epoch": 841} {"train_loss": -34.16897964477539, "global_step": 101838, "epoch": 841} {"train_loss": -38.18295669555664, "global_step": 101839, "epoch": 841} {"train_loss": -35.060970306396484, "global_step": 101840, "epoch": 841} {"train_loss": -38.297019958496094, "global_step": 101841, "epoch": 841} {"train_loss": -36.518375396728516, "global_step": 101842, "epoch": 841} {"train_loss": -37.712520599365234, "global_step": 101843, "epoch": 841} {"train_loss": -37.68514633178711, "global_step": 101844, "epoch": 841} {"train_loss": -37.62140655517578, "global_step": 101845, "epoch": 841} {"train_loss": -38.047340393066406, "global_step": 101846, "epoch": 841} {"train_loss": -37.351478576660156, "global_step": 101847, "epoch": 841} {"train_loss": -38.293758392333984, "global_step": 101848, "epoch": 841} {"train_loss": -38.216346740722656, "global_step": 101849, "epoch": 841} {"train_loss": -37.8513069152832, "global_step": 101850, "epoch": 841} {"train_loss": -37.337608337402344, "global_step": 101851, "epoch": 841} {"train_loss": -38.40123748779297, "global_step": 101852, "epoch": 841} {"train_loss": -38.636268615722656, "global_step": 101853, "epoch": 841} {"train_loss": -38.06130599975586, "global_step": 101854, "epoch": 841} {"train_loss": -38.3049201965332, "global_step": 101855, "epoch": 841} {"train_loss": -38.142616271972656, "global_step": 101856, "epoch": 841} {"train_loss": -37.82091522216797, "global_step": 101857, "epoch": 841} {"train_loss": -38.51137161254883, "global_step": 101858, "epoch": 841} {"train_loss": -38.79281234741211, "global_step": 101859, "epoch": 841} {"train_loss": -37.88286590576172, "global_step": 101860, "epoch": 841} {"train_loss": -38.37409591674805, "global_step": 101861, "epoch": 841} {"train_loss": -37.91318893432617, "global_step": 101862, "epoch": 841} {"train_loss": -38.1681022644043, "global_step": 101863, "epoch": 841} {"train_loss": -37.965999603271484, "global_step": 101864, "epoch": 841} {"train_loss": -38.27394485473633, "global_step": 101865, "epoch": 841} {"train_loss": -37.519615173339844, "global_step": 101866, "epoch": 841} {"train_loss": -38.75971603393555, "global_step": 101867, "epoch": 841} {"train_loss": -37.82528305053711, "global_step": 101868, "epoch": 841} {"train_loss": -38.251495361328125, "global_step": 101869, "epoch": 841} {"train_loss": -38.800994873046875, "global_step": 101870, "epoch": 841} {"train_loss": -37.94794845581055, "global_step": 101871, "epoch": 841} {"train_loss": -36.72035598754883, "global_step": 101872, "epoch": 841} {"train_loss": -35.91242599487305, "global_step": 101873, "epoch": 841} {"train_loss": -36.820980072021484, "global_step": 101874, "epoch": 841} {"train_loss": -37.219093322753906, "global_step": 101875, "epoch": 841} {"train_loss": -38.47703552246094, "global_step": 101876, "epoch": 841} {"train_loss": -38.39472579956055, "global_step": 101877, "epoch": 841} {"train_loss": -37.1364860534668, "global_step": 101878, "epoch": 841} {"train_loss": -37.848297119140625, "global_step": 101879, "epoch": 841} {"train_loss": -38.851707458496094, "global_step": 101880, "epoch": 841} {"train_loss": -37.28685700597842, "global_step": 101881, "epoch": 841, "val_loss": 2664470.25} {"train_loss": -37.7453498840332, "global_step": 101882, "epoch": 842} {"train_loss": -35.504573822021484, "global_step": 101883, "epoch": 842} {"train_loss": -36.3580322265625, "global_step": 101884, "epoch": 842} {"train_loss": -38.37333297729492, "global_step": 101885, "epoch": 842} {"train_loss": -37.687255859375, "global_step": 101886, "epoch": 842} {"train_loss": -35.073055267333984, "global_step": 101887, "epoch": 842} {"train_loss": -37.2026481628418, "global_step": 101888, "epoch": 842} {"train_loss": -38.045406341552734, "global_step": 101889, "epoch": 842} {"train_loss": -37.17403793334961, "global_step": 101890, "epoch": 842} {"train_loss": -37.821109771728516, "global_step": 101891, "epoch": 842} {"train_loss": -38.040260314941406, "global_step": 101892, "epoch": 842} {"train_loss": -34.49407958984375, "global_step": 101893, "epoch": 842} {"train_loss": -37.84397506713867, "global_step": 101894, "epoch": 842} {"train_loss": -38.34029006958008, "global_step": 101895, "epoch": 842} {"train_loss": -38.56507110595703, "global_step": 101896, "epoch": 842} {"train_loss": -37.12104034423828, "global_step": 101897, "epoch": 842} {"train_loss": -34.9671630859375, "global_step": 101898, "epoch": 842} {"train_loss": -36.725067138671875, "global_step": 101899, "epoch": 842} {"train_loss": -37.62010192871094, "global_step": 101900, "epoch": 842} {"train_loss": -37.4974250793457, "global_step": 101901, "epoch": 842} {"train_loss": -35.923763275146484, "global_step": 101902, "epoch": 842} {"train_loss": -35.73406219482422, "global_step": 101903, "epoch": 842} {"train_loss": -33.50275802612305, "global_step": 101904, "epoch": 842} {"train_loss": -36.96296310424805, "global_step": 101905, "epoch": 842} {"train_loss": -37.330841064453125, "global_step": 101906, "epoch": 842} {"train_loss": -34.17765426635742, "global_step": 101907, "epoch": 842} {"train_loss": -35.40212631225586, "global_step": 101908, "epoch": 842} {"train_loss": -33.10463333129883, "global_step": 101909, "epoch": 842} {"train_loss": -30.599945068359375, "global_step": 101910, "epoch": 842} {"train_loss": -34.663265228271484, "global_step": 101911, "epoch": 842} {"train_loss": -32.37823486328125, "global_step": 101912, "epoch": 842} {"train_loss": -32.61454391479492, "global_step": 101913, "epoch": 842} {"train_loss": -34.170108795166016, "global_step": 101914, "epoch": 842} {"train_loss": -31.724945068359375, "global_step": 101915, "epoch": 842} {"train_loss": -26.275781631469727, "global_step": 101916, "epoch": 842} {"train_loss": -32.4942626953125, "global_step": 101917, "epoch": 842} {"train_loss": -30.26222038269043, "global_step": 101918, "epoch": 842} {"train_loss": -35.33515548706055, "global_step": 101919, "epoch": 842} {"train_loss": -34.086952209472656, "global_step": 101920, "epoch": 842} {"train_loss": -31.188812255859375, "global_step": 101921, "epoch": 842} {"train_loss": -33.37947082519531, "global_step": 101922, "epoch": 842} {"train_loss": -29.637805938720703, "global_step": 101923, "epoch": 842} {"train_loss": -34.78974151611328, "global_step": 101924, "epoch": 842} {"train_loss": -32.81206130981445, "global_step": 101925, "epoch": 842} {"train_loss": -30.721357345581055, "global_step": 101926, "epoch": 842} {"train_loss": -34.873836517333984, "global_step": 101927, "epoch": 842} {"train_loss": -33.347564697265625, "global_step": 101928, "epoch": 842} {"train_loss": -34.20771408081055, "global_step": 101929, "epoch": 842} {"train_loss": -34.86771774291992, "global_step": 101930, "epoch": 842} {"train_loss": -35.43540573120117, "global_step": 101931, "epoch": 842} {"train_loss": -34.677642822265625, "global_step": 101932, "epoch": 842} {"train_loss": -35.17268753051758, "global_step": 101933, "epoch": 842} {"train_loss": -33.7209587097168, "global_step": 101934, "epoch": 842} {"train_loss": -34.39397430419922, "global_step": 101935, "epoch": 842} {"train_loss": -35.4190788269043, "global_step": 101936, "epoch": 842} {"train_loss": -34.59543991088867, "global_step": 101937, "epoch": 842} {"train_loss": -35.43862533569336, "global_step": 101938, "epoch": 842} {"train_loss": -35.459877014160156, "global_step": 101939, "epoch": 842} {"train_loss": -34.918800354003906, "global_step": 101940, "epoch": 842} {"train_loss": -35.46389389038086, "global_step": 101941, "epoch": 842} {"train_loss": -35.354644775390625, "global_step": 101942, "epoch": 842} {"train_loss": -35.560428619384766, "global_step": 101943, "epoch": 842} {"train_loss": -36.020137786865234, "global_step": 101944, "epoch": 842} {"train_loss": -35.43857955932617, "global_step": 101945, "epoch": 842} {"train_loss": -36.3720588684082, "global_step": 101946, "epoch": 842} {"train_loss": -36.184234619140625, "global_step": 101947, "epoch": 842} {"train_loss": -35.62166976928711, "global_step": 101948, "epoch": 842} {"train_loss": -35.565582275390625, "global_step": 101949, "epoch": 842} {"train_loss": -35.576480865478516, "global_step": 101950, "epoch": 842} {"train_loss": -36.736328125, "global_step": 101951, "epoch": 842} {"train_loss": -35.52118682861328, "global_step": 101952, "epoch": 842} {"train_loss": -36.22038650512695, "global_step": 101953, "epoch": 842} {"train_loss": -35.88624954223633, "global_step": 101954, "epoch": 842} {"train_loss": -36.21233367919922, "global_step": 101955, "epoch": 842} {"train_loss": -35.98377990722656, "global_step": 101956, "epoch": 842} {"train_loss": -36.676666259765625, "global_step": 101957, "epoch": 842} {"train_loss": -36.17626190185547, "global_step": 101958, "epoch": 842} {"train_loss": -36.83014678955078, "global_step": 101959, "epoch": 842} {"train_loss": -36.58250427246094, "global_step": 101960, "epoch": 842} {"train_loss": -36.73836135864258, "global_step": 101961, "epoch": 842} {"train_loss": -36.681304931640625, "global_step": 101962, "epoch": 842} {"train_loss": -36.63381576538086, "global_step": 101963, "epoch": 842} {"train_loss": -36.986717224121094, "global_step": 101964, "epoch": 842} {"train_loss": -36.68036651611328, "global_step": 101965, "epoch": 842} {"train_loss": -37.312530517578125, "global_step": 101966, "epoch": 842} {"train_loss": -36.83391189575195, "global_step": 101967, "epoch": 842} {"train_loss": -37.21514892578125, "global_step": 101968, "epoch": 842} {"train_loss": -36.39713668823242, "global_step": 101969, "epoch": 842} {"train_loss": -37.16665267944336, "global_step": 101970, "epoch": 842} {"train_loss": -37.15670394897461, "global_step": 101971, "epoch": 842} {"train_loss": -37.37032699584961, "global_step": 101972, "epoch": 842} {"train_loss": -37.20217514038086, "global_step": 101973, "epoch": 842} {"train_loss": -37.05952835083008, "global_step": 101974, "epoch": 842} {"train_loss": -37.6079216003418, "global_step": 101975, "epoch": 842} {"train_loss": -37.49451446533203, "global_step": 101976, "epoch": 842} {"train_loss": -37.21614456176758, "global_step": 101977, "epoch": 842} {"train_loss": -37.70478057861328, "global_step": 101978, "epoch": 842} {"train_loss": -38.01649856567383, "global_step": 101979, "epoch": 842} {"train_loss": -37.38412857055664, "global_step": 101980, "epoch": 842} {"train_loss": -37.71805953979492, "global_step": 101981, "epoch": 842} {"train_loss": -37.526893615722656, "global_step": 101982, "epoch": 842} {"train_loss": -37.282142639160156, "global_step": 101983, "epoch": 842} {"train_loss": -37.4236946105957, "global_step": 101984, "epoch": 842} {"train_loss": -37.34971237182617, "global_step": 101985, "epoch": 842} {"train_loss": -37.74757385253906, "global_step": 101986, "epoch": 842} {"train_loss": -38.09983444213867, "global_step": 101987, "epoch": 842} {"train_loss": -37.65768051147461, "global_step": 101988, "epoch": 842} {"train_loss": -37.15449905395508, "global_step": 101989, "epoch": 842} {"train_loss": -37.383480072021484, "global_step": 101990, "epoch": 842} {"train_loss": -37.4388427734375, "global_step": 101991, "epoch": 842} {"train_loss": -37.480037689208984, "global_step": 101992, "epoch": 842} {"train_loss": -37.65839767456055, "global_step": 101993, "epoch": 842} {"train_loss": -38.647239685058594, "global_step": 101994, "epoch": 842} {"train_loss": -37.84330368041992, "global_step": 101995, "epoch": 842} {"train_loss": -37.70549774169922, "global_step": 101996, "epoch": 842} {"train_loss": -37.85750961303711, "global_step": 101997, "epoch": 842} {"train_loss": -38.033966064453125, "global_step": 101998, "epoch": 842} {"train_loss": -38.03567123413086, "global_step": 101999, "epoch": 842} {"train_loss": -37.83535385131836, "global_step": 102000, "epoch": 842} {"train_loss": -38.05411911010742, "global_step": 102001, "epoch": 842} {"train_loss": -35.94805096397715, "global_step": 102002, "epoch": 842, "val_loss": 2589279.25} {"train_loss": -38.032711029052734, "global_step": 102003, "epoch": 843} {"train_loss": -37.83045196533203, "global_step": 102004, "epoch": 843} {"train_loss": -36.64350509643555, "global_step": 102005, "epoch": 843} {"train_loss": -35.18281555175781, "global_step": 102006, "epoch": 843} {"train_loss": -35.80729293823242, "global_step": 102007, "epoch": 843} {"train_loss": -37.469451904296875, "global_step": 102008, "epoch": 843} {"train_loss": -38.278587341308594, "global_step": 102009, "epoch": 843} {"train_loss": -37.88134765625, "global_step": 102010, "epoch": 843} {"train_loss": -37.809295654296875, "global_step": 102011, "epoch": 843} {"train_loss": -36.04885482788086, "global_step": 102012, "epoch": 843} {"train_loss": -35.81209945678711, "global_step": 102013, "epoch": 843} {"train_loss": -36.67560577392578, "global_step": 102014, "epoch": 843} {"train_loss": -37.68709945678711, "global_step": 102015, "epoch": 843} {"train_loss": -37.99924087524414, "global_step": 102016, "epoch": 843} {"train_loss": -37.55685043334961, "global_step": 102017, "epoch": 843} {"train_loss": -38.14530563354492, "global_step": 102018, "epoch": 843} {"train_loss": -38.295738220214844, "global_step": 102019, "epoch": 843} {"train_loss": -38.50007247924805, "global_step": 102020, "epoch": 843} {"train_loss": -38.366939544677734, "global_step": 102021, "epoch": 843} {"train_loss": -38.181705474853516, "global_step": 102022, "epoch": 843} {"train_loss": -37.92069625854492, "global_step": 102023, "epoch": 843} {"train_loss": -37.31538009643555, "global_step": 102024, "epoch": 843} {"train_loss": -37.68244552612305, "global_step": 102025, "epoch": 843} {"train_loss": -37.53144073486328, "global_step": 102026, "epoch": 843} {"train_loss": -37.53652572631836, "global_step": 102027, "epoch": 843} {"train_loss": -36.59812545776367, "global_step": 102028, "epoch": 843} {"train_loss": -35.41405487060547, "global_step": 102029, "epoch": 843} {"train_loss": -36.19761276245117, "global_step": 102030, "epoch": 843} {"train_loss": -35.581214904785156, "global_step": 102031, "epoch": 843} {"train_loss": -37.18684005737305, "global_step": 102032, "epoch": 843} {"train_loss": -38.485450744628906, "global_step": 102033, "epoch": 843} {"train_loss": -38.38008117675781, "global_step": 102034, "epoch": 843} {"train_loss": -37.52278518676758, "global_step": 102035, "epoch": 843} {"train_loss": -38.658355712890625, "global_step": 102036, "epoch": 843} {"train_loss": -38.40861129760742, "global_step": 102037, "epoch": 843} {"train_loss": -38.029396057128906, "global_step": 102038, "epoch": 843} {"train_loss": -38.79702377319336, "global_step": 102039, "epoch": 843} {"train_loss": -38.110347747802734, "global_step": 102040, "epoch": 843} {"train_loss": -38.176490783691406, "global_step": 102041, "epoch": 843} {"train_loss": -38.39447784423828, "global_step": 102042, "epoch": 843} {"train_loss": -36.99819564819336, "global_step": 102043, "epoch": 843} {"train_loss": -36.37495422363281, "global_step": 102044, "epoch": 843} {"train_loss": -37.055938720703125, "global_step": 102045, "epoch": 843} {"train_loss": -35.922054290771484, "global_step": 102046, "epoch": 843} {"train_loss": -36.772396087646484, "global_step": 102047, "epoch": 843} {"train_loss": -38.59760284423828, "global_step": 102048, "epoch": 843} {"train_loss": -37.48338317871094, "global_step": 102049, "epoch": 843} {"train_loss": -34.75949478149414, "global_step": 102050, "epoch": 843} {"train_loss": -32.25457763671875, "global_step": 102051, "epoch": 843} {"train_loss": -32.09476089477539, "global_step": 102052, "epoch": 843} {"train_loss": -35.069091796875, "global_step": 102053, "epoch": 843} {"train_loss": -36.55884552001953, "global_step": 102054, "epoch": 843} {"train_loss": -35.795230865478516, "global_step": 102055, "epoch": 843} {"train_loss": -35.35490036010742, "global_step": 102056, "epoch": 843} {"train_loss": -33.79780960083008, "global_step": 102057, "epoch": 843} {"train_loss": -34.874420166015625, "global_step": 102058, "epoch": 843} {"train_loss": -35.242977142333984, "global_step": 102059, "epoch": 843} {"train_loss": -36.66426086425781, "global_step": 102060, "epoch": 843} {"train_loss": -35.70008087158203, "global_step": 102061, "epoch": 843} {"train_loss": -36.17439651489258, "global_step": 102062, "epoch": 843} {"train_loss": -37.04387283325195, "global_step": 102063, "epoch": 843} {"train_loss": -38.086761474609375, "global_step": 102064, "epoch": 843} {"train_loss": -37.57004928588867, "global_step": 102065, "epoch": 843} {"train_loss": -38.359615325927734, "global_step": 102066, "epoch": 843} {"train_loss": -37.57321548461914, "global_step": 102067, "epoch": 843} {"train_loss": -37.086769104003906, "global_step": 102068, "epoch": 843} {"train_loss": -37.877174377441406, "global_step": 102069, "epoch": 843} {"train_loss": -38.382755279541016, "global_step": 102070, "epoch": 843} {"train_loss": -37.435848236083984, "global_step": 102071, "epoch": 843} {"train_loss": -38.418800354003906, "global_step": 102072, "epoch": 843} {"train_loss": -37.9809455871582, "global_step": 102073, "epoch": 843} {"train_loss": -38.732181549072266, "global_step": 102074, "epoch": 843} {"train_loss": -38.19377517700195, "global_step": 102075, "epoch": 843} {"train_loss": -37.262638092041016, "global_step": 102076, "epoch": 843} {"train_loss": -38.397274017333984, "global_step": 102077, "epoch": 843} {"train_loss": -38.47690963745117, "global_step": 102078, "epoch": 843} {"train_loss": -38.90181350708008, "global_step": 102079, "epoch": 843} {"train_loss": -39.05735397338867, "global_step": 102080, "epoch": 843} {"train_loss": -38.42606735229492, "global_step": 102081, "epoch": 843} {"train_loss": -38.68600845336914, "global_step": 102082, "epoch": 843} {"train_loss": -38.65283203125, "global_step": 102083, "epoch": 843} {"train_loss": -38.55093002319336, "global_step": 102084, "epoch": 843} {"train_loss": -38.34187316894531, "global_step": 102085, "epoch": 843} {"train_loss": -38.90891647338867, "global_step": 102086, "epoch": 843} {"train_loss": -38.65909957885742, "global_step": 102087, "epoch": 843} {"train_loss": -38.41920852661133, "global_step": 102088, "epoch": 843} {"train_loss": -38.90644454956055, "global_step": 102089, "epoch": 843} {"train_loss": -38.13241195678711, "global_step": 102090, "epoch": 843} {"train_loss": -39.1611442565918, "global_step": 102091, "epoch": 843} {"train_loss": -38.9349479675293, "global_step": 102092, "epoch": 843} {"train_loss": -39.04542922973633, "global_step": 102093, "epoch": 843} {"train_loss": -38.5102653503418, "global_step": 102094, "epoch": 843} {"train_loss": -38.900211334228516, "global_step": 102095, "epoch": 843} {"train_loss": -39.014888763427734, "global_step": 102096, "epoch": 843} {"train_loss": -39.238704681396484, "global_step": 102097, "epoch": 843} {"train_loss": -38.95075607299805, "global_step": 102098, "epoch": 843} {"train_loss": -39.21092224121094, "global_step": 102099, "epoch": 843} {"train_loss": -38.696998596191406, "global_step": 102100, "epoch": 843} {"train_loss": -38.681243896484375, "global_step": 102101, "epoch": 843} {"train_loss": -38.37736892700195, "global_step": 102102, "epoch": 843} {"train_loss": -38.97685241699219, "global_step": 102103, "epoch": 843} {"train_loss": -39.309749603271484, "global_step": 102104, "epoch": 843} {"train_loss": -38.61769485473633, "global_step": 102105, "epoch": 843} {"train_loss": -38.61641311645508, "global_step": 102106, "epoch": 843} {"train_loss": -39.30837631225586, "global_step": 102107, "epoch": 843} {"train_loss": -38.98604965209961, "global_step": 102108, "epoch": 843} {"train_loss": -38.83207321166992, "global_step": 102109, "epoch": 843} {"train_loss": -38.740203857421875, "global_step": 102110, "epoch": 843} {"train_loss": -38.446346282958984, "global_step": 102111, "epoch": 843} {"train_loss": -39.091583251953125, "global_step": 102112, "epoch": 843} {"train_loss": -38.77124786376953, "global_step": 102113, "epoch": 843} {"train_loss": -38.7135124206543, "global_step": 102114, "epoch": 843} {"train_loss": -39.16199493408203, "global_step": 102115, "epoch": 843} {"train_loss": -38.564029693603516, "global_step": 102116, "epoch": 843} {"train_loss": -37.48383331298828, "global_step": 102117, "epoch": 843} {"train_loss": -37.61848068237305, "global_step": 102118, "epoch": 843} {"train_loss": -38.96035385131836, "global_step": 102119, "epoch": 843} {"train_loss": -38.76737976074219, "global_step": 102120, "epoch": 843} {"train_loss": -37.35931396484375, "global_step": 102121, "epoch": 843} {"train_loss": -38.104976654052734, "global_step": 102122, "epoch": 843} {"train_loss": -37.71069619675313, "global_step": 102123, "epoch": 843, "val_loss": 2642341.75} {"train_loss": -38.598873138427734, "global_step": 102124, "epoch": 844} {"train_loss": -37.983497619628906, "global_step": 102125, "epoch": 844} {"train_loss": -38.742801666259766, "global_step": 102126, "epoch": 844} {"train_loss": -38.88261795043945, "global_step": 102127, "epoch": 844} {"train_loss": -38.4534912109375, "global_step": 102128, "epoch": 844} {"train_loss": -38.309261322021484, "global_step": 102129, "epoch": 844} {"train_loss": -39.26008605957031, "global_step": 102130, "epoch": 844} {"train_loss": -38.49351119995117, "global_step": 102131, "epoch": 844} {"train_loss": -37.51263427734375, "global_step": 102132, "epoch": 844} {"train_loss": -35.652278900146484, "global_step": 102133, "epoch": 844} {"train_loss": -31.506444931030273, "global_step": 102134, "epoch": 844} {"train_loss": -25.252094268798828, "global_step": 102135, "epoch": 844} {"train_loss": -30.061874389648438, "global_step": 102136, "epoch": 844} {"train_loss": -35.7278938293457, "global_step": 102137, "epoch": 844} {"train_loss": -31.418912887573242, "global_step": 102138, "epoch": 844} {"train_loss": -29.573007583618164, "global_step": 102139, "epoch": 844} {"train_loss": -35.68679428100586, "global_step": 102140, "epoch": 844} {"train_loss": -33.271541595458984, "global_step": 102141, "epoch": 844} {"train_loss": -37.08120346069336, "global_step": 102142, "epoch": 844} {"train_loss": -34.064735412597656, "global_step": 102143, "epoch": 844} {"train_loss": -36.90924072265625, "global_step": 102144, "epoch": 844} {"train_loss": -33.490570068359375, "global_step": 102145, "epoch": 844} {"train_loss": -37.329219818115234, "global_step": 102146, "epoch": 844} {"train_loss": -35.498802185058594, "global_step": 102147, "epoch": 844} {"train_loss": -37.158424377441406, "global_step": 102148, "epoch": 844} {"train_loss": -36.03939437866211, "global_step": 102149, "epoch": 844} {"train_loss": -37.129241943359375, "global_step": 102150, "epoch": 844} {"train_loss": -36.06290817260742, "global_step": 102151, "epoch": 844} {"train_loss": -37.356746673583984, "global_step": 102152, "epoch": 844} {"train_loss": -36.000946044921875, "global_step": 102153, "epoch": 844} {"train_loss": -36.40035629272461, "global_step": 102154, "epoch": 844} {"train_loss": -37.39338302612305, "global_step": 102155, "epoch": 844} {"train_loss": -37.03522872924805, "global_step": 102156, "epoch": 844} {"train_loss": -37.888668060302734, "global_step": 102157, "epoch": 844} {"train_loss": -37.876373291015625, "global_step": 102158, "epoch": 844} {"train_loss": -37.470726013183594, "global_step": 102159, "epoch": 844} {"train_loss": -38.05256652832031, "global_step": 102160, "epoch": 844} {"train_loss": -38.16215133666992, "global_step": 102161, "epoch": 844} {"train_loss": -37.923458099365234, "global_step": 102162, "epoch": 844} {"train_loss": -37.78229522705078, "global_step": 102163, "epoch": 844} {"train_loss": -37.447723388671875, "global_step": 102164, "epoch": 844} {"train_loss": -38.26047897338867, "global_step": 102165, "epoch": 844} {"train_loss": -37.88212203979492, "global_step": 102166, "epoch": 844} {"train_loss": -35.096858978271484, "global_step": 102167, "epoch": 844} {"train_loss": -38.20180892944336, "global_step": 102168, "epoch": 844} {"train_loss": -37.59019088745117, "global_step": 102169, "epoch": 844} {"train_loss": -37.733924865722656, "global_step": 102170, "epoch": 844} {"train_loss": -37.8466911315918, "global_step": 102171, "epoch": 844} {"train_loss": -37.83976364135742, "global_step": 102172, "epoch": 844} {"train_loss": -38.43153762817383, "global_step": 102173, "epoch": 844} {"train_loss": -37.9775390625, "global_step": 102174, "epoch": 844} {"train_loss": -38.135372161865234, "global_step": 102175, "epoch": 844} {"train_loss": -38.15906524658203, "global_step": 102176, "epoch": 844} {"train_loss": -38.10807418823242, "global_step": 102177, "epoch": 844} {"train_loss": -37.43130111694336, "global_step": 102178, "epoch": 844} {"train_loss": -38.45685958862305, "global_step": 102179, "epoch": 844} {"train_loss": -37.57973861694336, "global_step": 102180, "epoch": 844} {"train_loss": -37.71669387817383, "global_step": 102181, "epoch": 844} {"train_loss": -38.65354537963867, "global_step": 102182, "epoch": 844} {"train_loss": -38.028472900390625, "global_step": 102183, "epoch": 844} {"train_loss": -38.2080192565918, "global_step": 102184, "epoch": 844} {"train_loss": -37.424156188964844, "global_step": 102185, "epoch": 844} {"train_loss": -38.689456939697266, "global_step": 102186, "epoch": 844} {"train_loss": -37.792747497558594, "global_step": 102187, "epoch": 844} {"train_loss": -38.81809616088867, "global_step": 102188, "epoch": 844} {"train_loss": -38.667205810546875, "global_step": 102189, "epoch": 844} {"train_loss": -38.261695861816406, "global_step": 102190, "epoch": 844} {"train_loss": -37.753746032714844, "global_step": 102191, "epoch": 844} {"train_loss": -38.946014404296875, "global_step": 102192, "epoch": 844} {"train_loss": -38.3057975769043, "global_step": 102193, "epoch": 844} {"train_loss": -39.02568435668945, "global_step": 102194, "epoch": 844} {"train_loss": -38.22306442260742, "global_step": 102195, "epoch": 844} {"train_loss": -38.6939697265625, "global_step": 102196, "epoch": 844} {"train_loss": -38.424949645996094, "global_step": 102197, "epoch": 844} {"train_loss": -37.399696350097656, "global_step": 102198, "epoch": 844} {"train_loss": -38.00552749633789, "global_step": 102199, "epoch": 844} {"train_loss": -39.152870178222656, "global_step": 102200, "epoch": 844} {"train_loss": -38.759864807128906, "global_step": 102201, "epoch": 844} {"train_loss": -38.48264694213867, "global_step": 102202, "epoch": 844} {"train_loss": -38.767974853515625, "global_step": 102203, "epoch": 844} {"train_loss": -38.909175872802734, "global_step": 102204, "epoch": 844} {"train_loss": -38.38031005859375, "global_step": 102205, "epoch": 844} {"train_loss": -37.127288818359375, "global_step": 102206, "epoch": 844} {"train_loss": -36.29067611694336, "global_step": 102207, "epoch": 844} {"train_loss": -33.2557487487793, "global_step": 102208, "epoch": 844} {"train_loss": -33.4873046875, "global_step": 102209, "epoch": 844} {"train_loss": -32.14971923828125, "global_step": 102210, "epoch": 844} {"train_loss": -35.13846969604492, "global_step": 102211, "epoch": 844} {"train_loss": -34.904449462890625, "global_step": 102212, "epoch": 844} {"train_loss": -38.263179779052734, "global_step": 102213, "epoch": 844} {"train_loss": -36.4046745300293, "global_step": 102214, "epoch": 844} {"train_loss": -36.5008430480957, "global_step": 102215, "epoch": 844} {"train_loss": -36.94942092895508, "global_step": 102216, "epoch": 844} {"train_loss": -37.83234786987305, "global_step": 102217, "epoch": 844} {"train_loss": -37.76308059692383, "global_step": 102218, "epoch": 844} {"train_loss": -37.56875991821289, "global_step": 102219, "epoch": 844} {"train_loss": -34.879241943359375, "global_step": 102220, "epoch": 844} {"train_loss": -22.817657470703125, "global_step": 102221, "epoch": 844} {"train_loss": -36.627296447753906, "global_step": 102222, "epoch": 844} {"train_loss": -34.27253341674805, "global_step": 102223, "epoch": 844} {"train_loss": -32.276222229003906, "global_step": 102224, "epoch": 844} {"train_loss": -31.20137596130371, "global_step": 102225, "epoch": 844} {"train_loss": -30.69235610961914, "global_step": 102226, "epoch": 844} {"train_loss": -35.664119720458984, "global_step": 102227, "epoch": 844} {"train_loss": -34.22870635986328, "global_step": 102228, "epoch": 844} {"train_loss": -30.328327178955078, "global_step": 102229, "epoch": 844} {"train_loss": -21.412933349609375, "global_step": 102230, "epoch": 844} {"train_loss": -29.20509147644043, "global_step": 102231, "epoch": 844} {"train_loss": -30.52900505065918, "global_step": 102232, "epoch": 844} {"train_loss": -31.35529899597168, "global_step": 102233, "epoch": 844} {"train_loss": -33.93439865112305, "global_step": 102234, "epoch": 844} {"train_loss": -30.562910079956055, "global_step": 102235, "epoch": 844} {"train_loss": -33.21551513671875, "global_step": 102236, "epoch": 844} {"train_loss": -34.6998291015625, "global_step": 102237, "epoch": 844} {"train_loss": -33.39094161987305, "global_step": 102238, "epoch": 844} {"train_loss": -33.79235076904297, "global_step": 102239, "epoch": 844} {"train_loss": -31.21137809753418, "global_step": 102240, "epoch": 844} {"train_loss": -33.5556526184082, "global_step": 102241, "epoch": 844} {"train_loss": -34.944454193115234, "global_step": 102242, "epoch": 844} {"train_loss": -31.3338565826416, "global_step": 102243, "epoch": 844} {"train_loss": -35.92423282970082, "global_step": 102244, "epoch": 844, "val_loss": 3008861.25} {"train_loss": -33.73421096801758, "global_step": 102245, "epoch": 845} {"train_loss": -35.40937423706055, "global_step": 102246, "epoch": 845} {"train_loss": -33.01789093017578, "global_step": 102247, "epoch": 845} {"train_loss": -34.30841064453125, "global_step": 102248, "epoch": 845} {"train_loss": -34.72456359863281, "global_step": 102249, "epoch": 845} {"train_loss": -34.87241744995117, "global_step": 102250, "epoch": 845} {"train_loss": -34.36532211303711, "global_step": 102251, "epoch": 845} {"train_loss": -34.48666000366211, "global_step": 102252, "epoch": 845} {"train_loss": -35.46827697753906, "global_step": 102253, "epoch": 845} {"train_loss": -35.37102127075195, "global_step": 102254, "epoch": 845} {"train_loss": -35.835811614990234, "global_step": 102255, "epoch": 845} {"train_loss": -35.24916458129883, "global_step": 102256, "epoch": 845} {"train_loss": -33.81769561767578, "global_step": 102257, "epoch": 845} {"train_loss": -35.4213981628418, "global_step": 102258, "epoch": 845} {"train_loss": -35.985374450683594, "global_step": 102259, "epoch": 845} {"train_loss": -35.1489372253418, "global_step": 102260, "epoch": 845} {"train_loss": -36.046268463134766, "global_step": 102261, "epoch": 845} {"train_loss": -35.88444519042969, "global_step": 102262, "epoch": 845} {"train_loss": -35.84333038330078, "global_step": 102263, "epoch": 845} {"train_loss": -35.59415817260742, "global_step": 102264, "epoch": 845} {"train_loss": -35.75758743286133, "global_step": 102265, "epoch": 845} {"train_loss": -36.371395111083984, "global_step": 102266, "epoch": 845} {"train_loss": -36.4603385925293, "global_step": 102267, "epoch": 845} {"train_loss": -36.404396057128906, "global_step": 102268, "epoch": 845} {"train_loss": -36.172645568847656, "global_step": 102269, "epoch": 845} {"train_loss": -36.7462043762207, "global_step": 102270, "epoch": 845} {"train_loss": -36.51008224487305, "global_step": 102271, "epoch": 845} {"train_loss": -36.64853286743164, "global_step": 102272, "epoch": 845} {"train_loss": -36.69585418701172, "global_step": 102273, "epoch": 845} {"train_loss": -36.24142074584961, "global_step": 102274, "epoch": 845} {"train_loss": -36.07505416870117, "global_step": 102275, "epoch": 845} {"train_loss": -36.383392333984375, "global_step": 102276, "epoch": 845} {"train_loss": -37.41597366333008, "global_step": 102277, "epoch": 845} {"train_loss": -36.24520492553711, "global_step": 102278, "epoch": 845} {"train_loss": -36.95778274536133, "global_step": 102279, "epoch": 845} {"train_loss": -36.7034797668457, "global_step": 102280, "epoch": 845} {"train_loss": -36.912635803222656, "global_step": 102281, "epoch": 845} {"train_loss": -37.353858947753906, "global_step": 102282, "epoch": 845} {"train_loss": -36.73571014404297, "global_step": 102283, "epoch": 845} {"train_loss": -37.16590118408203, "global_step": 102284, "epoch": 845} {"train_loss": -37.14265060424805, "global_step": 102285, "epoch": 845} {"train_loss": -37.425533294677734, "global_step": 102286, "epoch": 845} {"train_loss": -37.14348220825195, "global_step": 102287, "epoch": 845} {"train_loss": -37.18135452270508, "global_step": 102288, "epoch": 845} {"train_loss": -37.118629455566406, "global_step": 102289, "epoch": 845} {"train_loss": -37.785888671875, "global_step": 102290, "epoch": 845} {"train_loss": -37.090118408203125, "global_step": 102291, "epoch": 845} {"train_loss": -37.420745849609375, "global_step": 102292, "epoch": 845} {"train_loss": -37.74880599975586, "global_step": 102293, "epoch": 845} {"train_loss": -37.36659240722656, "global_step": 102294, "epoch": 845} {"train_loss": -37.427154541015625, "global_step": 102295, "epoch": 845} {"train_loss": -37.53345489501953, "global_step": 102296, "epoch": 845} {"train_loss": -37.98169708251953, "global_step": 102297, "epoch": 845} {"train_loss": -37.23063278198242, "global_step": 102298, "epoch": 845} {"train_loss": -37.46989059448242, "global_step": 102299, "epoch": 845} {"train_loss": -38.145503997802734, "global_step": 102300, "epoch": 845} {"train_loss": -37.452491760253906, "global_step": 102301, "epoch": 845} {"train_loss": -37.36750030517578, "global_step": 102302, "epoch": 845} {"train_loss": -37.85579299926758, "global_step": 102303, "epoch": 845} {"train_loss": -37.671142578125, "global_step": 102304, "epoch": 845} {"train_loss": -37.73164749145508, "global_step": 102305, "epoch": 845} {"train_loss": -38.28296661376953, "global_step": 102306, "epoch": 845} {"train_loss": -38.50526809692383, "global_step": 102307, "epoch": 845} {"train_loss": -37.772361755371094, "global_step": 102308, "epoch": 845} {"train_loss": -38.127166748046875, "global_step": 102309, "epoch": 845} {"train_loss": -38.07710266113281, "global_step": 102310, "epoch": 845} {"train_loss": -38.40056228637695, "global_step": 102311, "epoch": 845} {"train_loss": -38.47710037231445, "global_step": 102312, "epoch": 845} {"train_loss": -38.592864990234375, "global_step": 102313, "epoch": 845} {"train_loss": -38.07234191894531, "global_step": 102314, "epoch": 845} {"train_loss": -37.57074737548828, "global_step": 102315, "epoch": 845} {"train_loss": -38.41465377807617, "global_step": 102316, "epoch": 845} {"train_loss": -38.103736877441406, "global_step": 102317, "epoch": 845} {"train_loss": -38.52186965942383, "global_step": 102318, "epoch": 845} {"train_loss": -38.24513626098633, "global_step": 102319, "epoch": 845} {"train_loss": -38.30955123901367, "global_step": 102320, "epoch": 845} {"train_loss": -37.96688461303711, "global_step": 102321, "epoch": 845} {"train_loss": -37.33466339111328, "global_step": 102322, "epoch": 845} {"train_loss": -36.80027389526367, "global_step": 102323, "epoch": 845} {"train_loss": -34.4217414855957, "global_step": 102324, "epoch": 845} {"train_loss": -35.23747634887695, "global_step": 102325, "epoch": 845} {"train_loss": -36.86138916015625, "global_step": 102326, "epoch": 845} {"train_loss": -36.53940963745117, "global_step": 102327, "epoch": 845} {"train_loss": -33.54011917114258, "global_step": 102328, "epoch": 845} {"train_loss": -30.6207275390625, "global_step": 102329, "epoch": 845} {"train_loss": -22.71714210510254, "global_step": 102330, "epoch": 845} {"train_loss": -18.576345443725586, "global_step": 102331, "epoch": 845} {"train_loss": -28.8421688079834, "global_step": 102332, "epoch": 845} {"train_loss": -36.74789047241211, "global_step": 102333, "epoch": 845} {"train_loss": -21.00661277770996, "global_step": 102334, "epoch": 845} {"train_loss": -19.66339111328125, "global_step": 102335, "epoch": 845} {"train_loss": -28.930505752563477, "global_step": 102336, "epoch": 845} {"train_loss": -19.447967529296875, "global_step": 102337, "epoch": 845} {"train_loss": -31.418371200561523, "global_step": 102338, "epoch": 845} {"train_loss": -27.395572662353516, "global_step": 102339, "epoch": 845} {"train_loss": -28.081159591674805, "global_step": 102340, "epoch": 845} {"train_loss": -35.13405990600586, "global_step": 102341, "epoch": 845} {"train_loss": -27.169631958007812, "global_step": 102342, "epoch": 845} {"train_loss": -33.63942337036133, "global_step": 102343, "epoch": 845} {"train_loss": -34.73832321166992, "global_step": 102344, "epoch": 845} {"train_loss": -30.631620407104492, "global_step": 102345, "epoch": 845} {"train_loss": -34.53611373901367, "global_step": 102346, "epoch": 845} {"train_loss": -36.36745834350586, "global_step": 102347, "epoch": 845} {"train_loss": -34.07172775268555, "global_step": 102348, "epoch": 845} {"train_loss": -34.53765106201172, "global_step": 102349, "epoch": 845} {"train_loss": -36.309818267822266, "global_step": 102350, "epoch": 845} {"train_loss": -36.039337158203125, "global_step": 102351, "epoch": 845} {"train_loss": -35.08191680908203, "global_step": 102352, "epoch": 845} {"train_loss": -35.02857208251953, "global_step": 102353, "epoch": 845} {"train_loss": -36.08050537109375, "global_step": 102354, "epoch": 845} {"train_loss": -36.95249557495117, "global_step": 102355, "epoch": 845} {"train_loss": -35.846107482910156, "global_step": 102356, "epoch": 845} {"train_loss": -36.388973236083984, "global_step": 102357, "epoch": 845} {"train_loss": -36.10042953491211, "global_step": 102358, "epoch": 845} {"train_loss": -36.567352294921875, "global_step": 102359, "epoch": 845} {"train_loss": -36.58979415893555, "global_step": 102360, "epoch": 845} {"train_loss": -36.44635009765625, "global_step": 102361, "epoch": 845} {"train_loss": -36.182891845703125, "global_step": 102362, "epoch": 845} {"train_loss": -37.07748031616211, "global_step": 102363, "epoch": 845} {"train_loss": -37.1965217590332, "global_step": 102364, "epoch": 845} {"train_loss": -35.34819922959509, "global_step": 102365, "epoch": 845, "val_loss": 2607941.25} {"train_loss": -36.9219970703125, "global_step": 102366, "epoch": 846} {"train_loss": -36.9454345703125, "global_step": 102367, "epoch": 846} {"train_loss": -36.91297912597656, "global_step": 102368, "epoch": 846} {"train_loss": -37.73863220214844, "global_step": 102369, "epoch": 846} {"train_loss": -36.926143646240234, "global_step": 102370, "epoch": 846} {"train_loss": -37.53110885620117, "global_step": 102371, "epoch": 846} {"train_loss": -37.312965393066406, "global_step": 102372, "epoch": 846} {"train_loss": -37.39030075073242, "global_step": 102373, "epoch": 846} {"train_loss": -37.63077163696289, "global_step": 102374, "epoch": 846} {"train_loss": -37.093318939208984, "global_step": 102375, "epoch": 846} {"train_loss": -37.34616470336914, "global_step": 102376, "epoch": 846} {"train_loss": -37.844356536865234, "global_step": 102377, "epoch": 846} {"train_loss": -37.56451416015625, "global_step": 102378, "epoch": 846} {"train_loss": -38.06047439575195, "global_step": 102379, "epoch": 846} {"train_loss": -37.9246826171875, "global_step": 102380, "epoch": 846} {"train_loss": -37.631309509277344, "global_step": 102381, "epoch": 846} {"train_loss": -37.796783447265625, "global_step": 102382, "epoch": 846} {"train_loss": -38.087646484375, "global_step": 102383, "epoch": 846} {"train_loss": -38.3383674621582, "global_step": 102384, "epoch": 846} {"train_loss": -38.122581481933594, "global_step": 102385, "epoch": 846} {"train_loss": -37.96360397338867, "global_step": 102386, "epoch": 846} {"train_loss": -38.150115966796875, "global_step": 102387, "epoch": 846} {"train_loss": -38.721641540527344, "global_step": 102388, "epoch": 846} {"train_loss": -38.42775344848633, "global_step": 102389, "epoch": 846} {"train_loss": -38.29429626464844, "global_step": 102390, "epoch": 846} {"train_loss": -38.15715408325195, "global_step": 102391, "epoch": 846} {"train_loss": -38.05808639526367, "global_step": 102392, "epoch": 846} {"train_loss": -38.2609977722168, "global_step": 102393, "epoch": 846} {"train_loss": -38.52106475830078, "global_step": 102394, "epoch": 846} {"train_loss": -38.243988037109375, "global_step": 102395, "epoch": 846} {"train_loss": -38.2045783996582, "global_step": 102396, "epoch": 846} {"train_loss": -38.663787841796875, "global_step": 102397, "epoch": 846} {"train_loss": -38.5229377746582, "global_step": 102398, "epoch": 846} {"train_loss": -38.76909255981445, "global_step": 102399, "epoch": 846} {"train_loss": -38.796287536621094, "global_step": 102400, "epoch": 846} {"train_loss": -38.6948356628418, "global_step": 102401, "epoch": 846} {"train_loss": -38.58601760864258, "global_step": 102402, "epoch": 846} {"train_loss": -38.63557052612305, "global_step": 102403, "epoch": 846} {"train_loss": -38.702392578125, "global_step": 102404, "epoch": 846} {"train_loss": -38.957969665527344, "global_step": 102405, "epoch": 846} {"train_loss": -38.6827507019043, "global_step": 102406, "epoch": 846} {"train_loss": -38.872230529785156, "global_step": 102407, "epoch": 846} {"train_loss": -39.01980972290039, "global_step": 102408, "epoch": 846} {"train_loss": -38.90082931518555, "global_step": 102409, "epoch": 846} {"train_loss": -38.57242202758789, "global_step": 102410, "epoch": 846} {"train_loss": -39.09876251220703, "global_step": 102411, "epoch": 846} {"train_loss": -39.15742874145508, "global_step": 102412, "epoch": 846} {"train_loss": -39.00048828125, "global_step": 102413, "epoch": 846} {"train_loss": -39.146514892578125, "global_step": 102414, "epoch": 846} {"train_loss": -38.655094146728516, "global_step": 102415, "epoch": 846} {"train_loss": -39.092533111572266, "global_step": 102416, "epoch": 846} {"train_loss": -38.99467086791992, "global_step": 102417, "epoch": 846} {"train_loss": -39.045166015625, "global_step": 102418, "epoch": 846} {"train_loss": -38.750911712646484, "global_step": 102419, "epoch": 846} {"train_loss": -39.092987060546875, "global_step": 102420, "epoch": 846} {"train_loss": -38.83222579956055, "global_step": 102421, "epoch": 846} {"train_loss": -38.785919189453125, "global_step": 102422, "epoch": 846} {"train_loss": -39.30366134643555, "global_step": 102423, "epoch": 846} {"train_loss": -38.8022346496582, "global_step": 102424, "epoch": 846} {"train_loss": -39.1165771484375, "global_step": 102425, "epoch": 846} {"train_loss": -38.74290084838867, "global_step": 102426, "epoch": 846} {"train_loss": -39.12892532348633, "global_step": 102427, "epoch": 846} {"train_loss": -38.43391799926758, "global_step": 102428, "epoch": 846} {"train_loss": -39.3420524597168, "global_step": 102429, "epoch": 846} {"train_loss": -39.3214111328125, "global_step": 102430, "epoch": 846} {"train_loss": -38.87968826293945, "global_step": 102431, "epoch": 846} {"train_loss": -37.831478118896484, "global_step": 102432, "epoch": 846} {"train_loss": -38.834449768066406, "global_step": 102433, "epoch": 846} {"train_loss": -38.65441131591797, "global_step": 102434, "epoch": 846} {"train_loss": -37.716060638427734, "global_step": 102435, "epoch": 846} {"train_loss": -35.62883377075195, "global_step": 102436, "epoch": 846} {"train_loss": -32.99222946166992, "global_step": 102437, "epoch": 846} {"train_loss": -23.973041534423828, "global_step": 102438, "epoch": 846} {"train_loss": -7.931848049163818, "global_step": 102439, "epoch": 846} {"train_loss": -8.198882102966309, "global_step": 102440, "epoch": 846} {"train_loss": -32.88105773925781, "global_step": 102441, "epoch": 846} {"train_loss": -25.248926162719727, "global_step": 102442, "epoch": 846} {"train_loss": -23.504318237304688, "global_step": 102443, "epoch": 846} {"train_loss": -31.382034301757812, "global_step": 102444, "epoch": 846} {"train_loss": -25.20850944519043, "global_step": 102445, "epoch": 846} {"train_loss": -32.4736442565918, "global_step": 102446, "epoch": 846} {"train_loss": -27.231128692626953, "global_step": 102447, "epoch": 846} {"train_loss": -34.1847038269043, "global_step": 102448, "epoch": 846} {"train_loss": -30.983495712280273, "global_step": 102449, "epoch": 846} {"train_loss": -34.17694854736328, "global_step": 102450, "epoch": 846} {"train_loss": -34.233333587646484, "global_step": 102451, "epoch": 846} {"train_loss": -32.329830169677734, "global_step": 102452, "epoch": 846} {"train_loss": -36.452632904052734, "global_step": 102453, "epoch": 846} {"train_loss": -34.233253479003906, "global_step": 102454, "epoch": 846} {"train_loss": -34.05949783325195, "global_step": 102455, "epoch": 846} {"train_loss": -36.00764083862305, "global_step": 102456, "epoch": 846} {"train_loss": -35.63496017456055, "global_step": 102457, "epoch": 846} {"train_loss": -35.94671630859375, "global_step": 102458, "epoch": 846} {"train_loss": -35.73196792602539, "global_step": 102459, "epoch": 846} {"train_loss": -34.884613037109375, "global_step": 102460, "epoch": 846} {"train_loss": -36.6146240234375, "global_step": 102461, "epoch": 846} {"train_loss": -36.14241409301758, "global_step": 102462, "epoch": 846} {"train_loss": -36.56606674194336, "global_step": 102463, "epoch": 846} {"train_loss": -36.656280517578125, "global_step": 102464, "epoch": 846} {"train_loss": -36.6143798828125, "global_step": 102465, "epoch": 846} {"train_loss": -36.06437301635742, "global_step": 102466, "epoch": 846} {"train_loss": -36.31073760986328, "global_step": 102467, "epoch": 846} {"train_loss": -36.8045654296875, "global_step": 102468, "epoch": 846} {"train_loss": -36.54648971557617, "global_step": 102469, "epoch": 846} {"train_loss": -36.9144401550293, "global_step": 102470, "epoch": 846} {"train_loss": -36.68488311767578, "global_step": 102471, "epoch": 846} {"train_loss": -35.9079704284668, "global_step": 102472, "epoch": 846} {"train_loss": -36.786476135253906, "global_step": 102473, "epoch": 846} {"train_loss": -36.9109001159668, "global_step": 102474, "epoch": 846} {"train_loss": -35.800048828125, "global_step": 102475, "epoch": 846} {"train_loss": -36.93235397338867, "global_step": 102476, "epoch": 846} {"train_loss": -37.04835510253906, "global_step": 102477, "epoch": 846} {"train_loss": -36.810585021972656, "global_step": 102478, "epoch": 846} {"train_loss": -37.125362396240234, "global_step": 102479, "epoch": 846} {"train_loss": -37.66132736206055, "global_step": 102480, "epoch": 846} {"train_loss": -37.1151008605957, "global_step": 102481, "epoch": 846} {"train_loss": -37.31220626831055, "global_step": 102482, "epoch": 846} {"train_loss": -37.34457015991211, "global_step": 102483, "epoch": 846} {"train_loss": -37.73969650268555, "global_step": 102484, "epoch": 846} {"train_loss": -37.87000274658203, "global_step": 102485, "epoch": 846} {"train_loss": -36.35862172733653, "global_step": 102486, "epoch": 846, "val_loss": 2652898.75} {"train_loss": -37.5525016784668, "global_step": 102487, "epoch": 847} {"train_loss": -37.62321090698242, "global_step": 102488, "epoch": 847} {"train_loss": -37.29851150512695, "global_step": 102489, "epoch": 847} {"train_loss": -37.372535705566406, "global_step": 102490, "epoch": 847} {"train_loss": -38.073341369628906, "global_step": 102491, "epoch": 847} {"train_loss": -38.01667404174805, "global_step": 102492, "epoch": 847} {"train_loss": -37.82490158081055, "global_step": 102493, "epoch": 847} {"train_loss": -38.05077362060547, "global_step": 102494, "epoch": 847} {"train_loss": -37.3922004699707, "global_step": 102495, "epoch": 847} {"train_loss": -38.0414924621582, "global_step": 102496, "epoch": 847} {"train_loss": -37.77706527709961, "global_step": 102497, "epoch": 847} {"train_loss": -37.556495666503906, "global_step": 102498, "epoch": 847} {"train_loss": -37.62103271484375, "global_step": 102499, "epoch": 847} {"train_loss": -38.20517349243164, "global_step": 102500, "epoch": 847} {"train_loss": -38.266639709472656, "global_step": 102501, "epoch": 847} {"train_loss": -38.3909797668457, "global_step": 102502, "epoch": 847} {"train_loss": -37.413307189941406, "global_step": 102503, "epoch": 847} {"train_loss": -37.994384765625, "global_step": 102504, "epoch": 847} {"train_loss": -38.21205520629883, "global_step": 102505, "epoch": 847} {"train_loss": -38.19477081298828, "global_step": 102506, "epoch": 847} {"train_loss": -38.423194885253906, "global_step": 102507, "epoch": 847} {"train_loss": -37.86619186401367, "global_step": 102508, "epoch": 847} {"train_loss": -37.24026107788086, "global_step": 102509, "epoch": 847} {"train_loss": -38.15763473510742, "global_step": 102510, "epoch": 847} {"train_loss": -38.229366302490234, "global_step": 102511, "epoch": 847} {"train_loss": -37.58049392700195, "global_step": 102512, "epoch": 847} {"train_loss": -38.52033615112305, "global_step": 102513, "epoch": 847} {"train_loss": -38.89023971557617, "global_step": 102514, "epoch": 847} {"train_loss": -38.237545013427734, "global_step": 102515, "epoch": 847} {"train_loss": -38.21516418457031, "global_step": 102516, "epoch": 847} {"train_loss": -38.46758270263672, "global_step": 102517, "epoch": 847} {"train_loss": -34.66638946533203, "global_step": 102518, "epoch": 847} {"train_loss": -38.06553649902344, "global_step": 102519, "epoch": 847} {"train_loss": -35.135353088378906, "global_step": 102520, "epoch": 847} {"train_loss": -36.70586013793945, "global_step": 102521, "epoch": 847} {"train_loss": -37.51896286010742, "global_step": 102522, "epoch": 847} {"train_loss": -37.8779296875, "global_step": 102523, "epoch": 847} {"train_loss": -37.11582565307617, "global_step": 102524, "epoch": 847} {"train_loss": -34.58773422241211, "global_step": 102525, "epoch": 847} {"train_loss": -37.10384750366211, "global_step": 102526, "epoch": 847} {"train_loss": -36.38546371459961, "global_step": 102527, "epoch": 847} {"train_loss": -37.207332611083984, "global_step": 102528, "epoch": 847} {"train_loss": -30.104177474975586, "global_step": 102529, "epoch": 847} {"train_loss": -36.32748031616211, "global_step": 102530, "epoch": 847} {"train_loss": -36.9406852722168, "global_step": 102531, "epoch": 847} {"train_loss": -35.05714797973633, "global_step": 102532, "epoch": 847} {"train_loss": -36.26139450073242, "global_step": 102533, "epoch": 847} {"train_loss": -35.441932678222656, "global_step": 102534, "epoch": 847} {"train_loss": -37.60493850708008, "global_step": 102535, "epoch": 847} {"train_loss": -36.86257553100586, "global_step": 102536, "epoch": 847} {"train_loss": -36.66768264770508, "global_step": 102537, "epoch": 847} {"train_loss": -35.42584228515625, "global_step": 102538, "epoch": 847} {"train_loss": -34.049922943115234, "global_step": 102539, "epoch": 847} {"train_loss": -34.153621673583984, "global_step": 102540, "epoch": 847} {"train_loss": -34.46400833129883, "global_step": 102541, "epoch": 847} {"train_loss": -37.38827896118164, "global_step": 102542, "epoch": 847} {"train_loss": -35.229610443115234, "global_step": 102543, "epoch": 847} {"train_loss": -33.6040153503418, "global_step": 102544, "epoch": 847} {"train_loss": -36.03940963745117, "global_step": 102545, "epoch": 847} {"train_loss": -35.786869049072266, "global_step": 102546, "epoch": 847} {"train_loss": -31.439075469970703, "global_step": 102547, "epoch": 847} {"train_loss": -35.31817626953125, "global_step": 102548, "epoch": 847} {"train_loss": -27.752609252929688, "global_step": 102549, "epoch": 847} {"train_loss": -35.31013107299805, "global_step": 102550, "epoch": 847} {"train_loss": -35.7253303527832, "global_step": 102551, "epoch": 847} {"train_loss": -34.7502326965332, "global_step": 102552, "epoch": 847} {"train_loss": -34.68263626098633, "global_step": 102553, "epoch": 847} {"train_loss": -32.556678771972656, "global_step": 102554, "epoch": 847} {"train_loss": -36.061187744140625, "global_step": 102555, "epoch": 847} {"train_loss": -35.86674499511719, "global_step": 102556, "epoch": 847} {"train_loss": -33.79712677001953, "global_step": 102557, "epoch": 847} {"train_loss": -35.5069694519043, "global_step": 102558, "epoch": 847} {"train_loss": -35.62423324584961, "global_step": 102559, "epoch": 847} {"train_loss": -36.56381607055664, "global_step": 102560, "epoch": 847} {"train_loss": -36.48478317260742, "global_step": 102561, "epoch": 847} {"train_loss": -34.884037017822266, "global_step": 102562, "epoch": 847} {"train_loss": -36.07439041137695, "global_step": 102563, "epoch": 847} {"train_loss": -33.3665771484375, "global_step": 102564, "epoch": 847} {"train_loss": -36.56519317626953, "global_step": 102565, "epoch": 847} {"train_loss": -35.570003509521484, "global_step": 102566, "epoch": 847} {"train_loss": -36.34537887573242, "global_step": 102567, "epoch": 847} {"train_loss": -36.616554260253906, "global_step": 102568, "epoch": 847} {"train_loss": -36.61393356323242, "global_step": 102569, "epoch": 847} {"train_loss": -36.155426025390625, "global_step": 102570, "epoch": 847} {"train_loss": -36.15985870361328, "global_step": 102571, "epoch": 847} {"train_loss": -36.03462219238281, "global_step": 102572, "epoch": 847} {"train_loss": -35.90180587768555, "global_step": 102573, "epoch": 847} {"train_loss": -36.495609283447266, "global_step": 102574, "epoch": 847} {"train_loss": -35.52261734008789, "global_step": 102575, "epoch": 847} {"train_loss": -37.05076217651367, "global_step": 102576, "epoch": 847} {"train_loss": -35.9047966003418, "global_step": 102577, "epoch": 847} {"train_loss": -36.38767623901367, "global_step": 102578, "epoch": 847} {"train_loss": -37.01351547241211, "global_step": 102579, "epoch": 847} {"train_loss": -36.56460189819336, "global_step": 102580, "epoch": 847} {"train_loss": -36.755958557128906, "global_step": 102581, "epoch": 847} {"train_loss": -36.86934280395508, "global_step": 102582, "epoch": 847} {"train_loss": -36.64813232421875, "global_step": 102583, "epoch": 847} {"train_loss": -37.15047836303711, "global_step": 102584, "epoch": 847} {"train_loss": -36.557106018066406, "global_step": 102585, "epoch": 847} {"train_loss": -37.36220169067383, "global_step": 102586, "epoch": 847} {"train_loss": -36.993324279785156, "global_step": 102587, "epoch": 847} {"train_loss": -37.004852294921875, "global_step": 102588, "epoch": 847} {"train_loss": -37.76359176635742, "global_step": 102589, "epoch": 847} {"train_loss": -37.04084014892578, "global_step": 102590, "epoch": 847} {"train_loss": -36.74024200439453, "global_step": 102591, "epoch": 847} {"train_loss": -37.454769134521484, "global_step": 102592, "epoch": 847} {"train_loss": -37.386348724365234, "global_step": 102593, "epoch": 847} {"train_loss": -37.41811752319336, "global_step": 102594, "epoch": 847} {"train_loss": -36.72408676147461, "global_step": 102595, "epoch": 847} {"train_loss": -37.60658645629883, "global_step": 102596, "epoch": 847} {"train_loss": -37.397979736328125, "global_step": 102597, "epoch": 847} {"train_loss": -37.3897705078125, "global_step": 102598, "epoch": 847} {"train_loss": -37.62396240234375, "global_step": 102599, "epoch": 847} {"train_loss": -37.52406311035156, "global_step": 102600, "epoch": 847} {"train_loss": -38.03689193725586, "global_step": 102601, "epoch": 847} {"train_loss": -37.969547271728516, "global_step": 102602, "epoch": 847} {"train_loss": -37.87496566772461, "global_step": 102603, "epoch": 847} {"train_loss": -38.3284797668457, "global_step": 102604, "epoch": 847} {"train_loss": -37.20711898803711, "global_step": 102605, "epoch": 847} {"train_loss": -37.78677749633789, "global_step": 102606, "epoch": 847} {"train_loss": -36.589420555051696, "global_step": 102607, "epoch": 847, "val_loss": 2657673.75} {"train_loss": -38.202728271484375, "global_step": 102608, "epoch": 848} {"train_loss": -37.935298919677734, "global_step": 102609, "epoch": 848} {"train_loss": -37.85590362548828, "global_step": 102610, "epoch": 848} {"train_loss": -37.82054138183594, "global_step": 102611, "epoch": 848} {"train_loss": -37.606563568115234, "global_step": 102612, "epoch": 848} {"train_loss": -38.248046875, "global_step": 102613, "epoch": 848} {"train_loss": -37.7239990234375, "global_step": 102614, "epoch": 848} {"train_loss": -37.94581985473633, "global_step": 102615, "epoch": 848} {"train_loss": -37.69649124145508, "global_step": 102616, "epoch": 848} {"train_loss": -37.869808197021484, "global_step": 102617, "epoch": 848} {"train_loss": -38.19013214111328, "global_step": 102618, "epoch": 848} {"train_loss": -38.26577377319336, "global_step": 102619, "epoch": 848} {"train_loss": -38.0662841796875, "global_step": 102620, "epoch": 848} {"train_loss": -37.661312103271484, "global_step": 102621, "epoch": 848} {"train_loss": -38.25737380981445, "global_step": 102622, "epoch": 848} {"train_loss": -38.11430740356445, "global_step": 102623, "epoch": 848} {"train_loss": -38.225276947021484, "global_step": 102624, "epoch": 848} {"train_loss": -37.11440658569336, "global_step": 102625, "epoch": 848} {"train_loss": -38.43496322631836, "global_step": 102626, "epoch": 848} {"train_loss": -36.749080657958984, "global_step": 102627, "epoch": 848} {"train_loss": -37.91343307495117, "global_step": 102628, "epoch": 848} {"train_loss": -37.12361145019531, "global_step": 102629, "epoch": 848} {"train_loss": -36.70267868041992, "global_step": 102630, "epoch": 848} {"train_loss": -38.23347854614258, "global_step": 102631, "epoch": 848} {"train_loss": -37.48554611206055, "global_step": 102632, "epoch": 848} {"train_loss": -38.10995101928711, "global_step": 102633, "epoch": 848} {"train_loss": -37.8083610534668, "global_step": 102634, "epoch": 848} {"train_loss": -37.723480224609375, "global_step": 102635, "epoch": 848} {"train_loss": -37.747947692871094, "global_step": 102636, "epoch": 848} {"train_loss": -38.226070404052734, "global_step": 102637, "epoch": 848} {"train_loss": -36.411041259765625, "global_step": 102638, "epoch": 848} {"train_loss": -35.17023849487305, "global_step": 102639, "epoch": 848} {"train_loss": -36.458255767822266, "global_step": 102640, "epoch": 848} {"train_loss": -38.0037956237793, "global_step": 102641, "epoch": 848} {"train_loss": -36.91230392456055, "global_step": 102642, "epoch": 848} {"train_loss": -36.646785736083984, "global_step": 102643, "epoch": 848} {"train_loss": -37.70095443725586, "global_step": 102644, "epoch": 848} {"train_loss": -37.31419372558594, "global_step": 102645, "epoch": 848} {"train_loss": -38.72392654418945, "global_step": 102646, "epoch": 848} {"train_loss": -37.28440475463867, "global_step": 102647, "epoch": 848} {"train_loss": -38.41636276245117, "global_step": 102648, "epoch": 848} {"train_loss": -38.39300537109375, "global_step": 102649, "epoch": 848} {"train_loss": -38.38131332397461, "global_step": 102650, "epoch": 848} {"train_loss": -38.2865104675293, "global_step": 102651, "epoch": 848} {"train_loss": -38.6602897644043, "global_step": 102652, "epoch": 848} {"train_loss": -38.26458740234375, "global_step": 102653, "epoch": 848} {"train_loss": -38.58657455444336, "global_step": 102654, "epoch": 848} {"train_loss": -38.28466796875, "global_step": 102655, "epoch": 848} {"train_loss": -38.28620147705078, "global_step": 102656, "epoch": 848} {"train_loss": -38.518306732177734, "global_step": 102657, "epoch": 848} {"train_loss": -38.796627044677734, "global_step": 102658, "epoch": 848} {"train_loss": -38.66605758666992, "global_step": 102659, "epoch": 848} {"train_loss": -38.75559616088867, "global_step": 102660, "epoch": 848} {"train_loss": -38.92793273925781, "global_step": 102661, "epoch": 848} {"train_loss": -39.03202438354492, "global_step": 102662, "epoch": 848} {"train_loss": -38.56578063964844, "global_step": 102663, "epoch": 848} {"train_loss": -38.78868865966797, "global_step": 102664, "epoch": 848} {"train_loss": -38.63080596923828, "global_step": 102665, "epoch": 848} {"train_loss": -38.44970703125, "global_step": 102666, "epoch": 848} {"train_loss": -38.9916877746582, "global_step": 102667, "epoch": 848} {"train_loss": -38.309139251708984, "global_step": 102668, "epoch": 848} {"train_loss": -38.962860107421875, "global_step": 102669, "epoch": 848} {"train_loss": -38.99971008300781, "global_step": 102670, "epoch": 848} {"train_loss": -39.23273849487305, "global_step": 102671, "epoch": 848} {"train_loss": -38.32880783081055, "global_step": 102672, "epoch": 848} {"train_loss": -39.36665344238281, "global_step": 102673, "epoch": 848} {"train_loss": -38.62067413330078, "global_step": 102674, "epoch": 848} {"train_loss": -38.70838165283203, "global_step": 102675, "epoch": 848} {"train_loss": -38.80129623413086, "global_step": 102676, "epoch": 848} {"train_loss": -38.493473052978516, "global_step": 102677, "epoch": 848} {"train_loss": -38.84807205200195, "global_step": 102678, "epoch": 848} {"train_loss": -39.22756576538086, "global_step": 102679, "epoch": 848} {"train_loss": -39.04926681518555, "global_step": 102680, "epoch": 848} {"train_loss": -38.93478012084961, "global_step": 102681, "epoch": 848} {"train_loss": -38.488250732421875, "global_step": 102682, "epoch": 848} {"train_loss": -38.92672348022461, "global_step": 102683, "epoch": 848} {"train_loss": -39.13029098510742, "global_step": 102684, "epoch": 848} {"train_loss": -38.44014358520508, "global_step": 102685, "epoch": 848} {"train_loss": -38.25666427612305, "global_step": 102686, "epoch": 848} {"train_loss": -38.719512939453125, "global_step": 102687, "epoch": 848} {"train_loss": -39.21419143676758, "global_step": 102688, "epoch": 848} {"train_loss": -38.56989669799805, "global_step": 102689, "epoch": 848} {"train_loss": -39.4228401184082, "global_step": 102690, "epoch": 848} {"train_loss": -38.78351593017578, "global_step": 102691, "epoch": 848} {"train_loss": -39.247623443603516, "global_step": 102692, "epoch": 848} {"train_loss": -39.114017486572266, "global_step": 102693, "epoch": 848} {"train_loss": -38.521728515625, "global_step": 102694, "epoch": 848} {"train_loss": -36.77898025512695, "global_step": 102695, "epoch": 848} {"train_loss": -34.857269287109375, "global_step": 102696, "epoch": 848} {"train_loss": -36.307613372802734, "global_step": 102697, "epoch": 848} {"train_loss": -35.6617546081543, "global_step": 102698, "epoch": 848} {"train_loss": -38.442970275878906, "global_step": 102699, "epoch": 848} {"train_loss": -37.408416748046875, "global_step": 102700, "epoch": 848} {"train_loss": -38.15706253051758, "global_step": 102701, "epoch": 848} {"train_loss": -37.71937561035156, "global_step": 102702, "epoch": 848} {"train_loss": -36.855831146240234, "global_step": 102703, "epoch": 848} {"train_loss": -36.07310104370117, "global_step": 102704, "epoch": 848} {"train_loss": -36.564369201660156, "global_step": 102705, "epoch": 848} {"train_loss": -36.8645133972168, "global_step": 102706, "epoch": 848} {"train_loss": -38.47972106933594, "global_step": 102707, "epoch": 848} {"train_loss": -37.4870719909668, "global_step": 102708, "epoch": 848} {"train_loss": -36.383155822753906, "global_step": 102709, "epoch": 848} {"train_loss": -38.31032180786133, "global_step": 102710, "epoch": 848} {"train_loss": -38.29936218261719, "global_step": 102711, "epoch": 848} {"train_loss": -37.01995849609375, "global_step": 102712, "epoch": 848} {"train_loss": -38.157100677490234, "global_step": 102713, "epoch": 848} {"train_loss": -37.365333557128906, "global_step": 102714, "epoch": 848} {"train_loss": -36.98135757446289, "global_step": 102715, "epoch": 848} {"train_loss": -37.212738037109375, "global_step": 102716, "epoch": 848} {"train_loss": -37.18105697631836, "global_step": 102717, "epoch": 848} {"train_loss": -37.451576232910156, "global_step": 102718, "epoch": 848} {"train_loss": -36.83590316772461, "global_step": 102719, "epoch": 848} {"train_loss": -38.05388259887695, "global_step": 102720, "epoch": 848} {"train_loss": -37.60386276245117, "global_step": 102721, "epoch": 848} {"train_loss": -37.215911865234375, "global_step": 102722, "epoch": 848} {"train_loss": -36.90761947631836, "global_step": 102723, "epoch": 848} {"train_loss": -36.81512451171875, "global_step": 102724, "epoch": 848} {"train_loss": -36.29496383666992, "global_step": 102725, "epoch": 848} {"train_loss": -38.51824951171875, "global_step": 102726, "epoch": 848} {"train_loss": -36.7032356262207, "global_step": 102727, "epoch": 848} {"train_loss": -37.91452515026754, "global_step": 102728, "epoch": 848, "val_loss": 2678686.0} {"train_loss": -37.522743225097656, "global_step": 102729, "epoch": 849} {"train_loss": -38.17395782470703, "global_step": 102730, "epoch": 849} {"train_loss": -36.76972579956055, "global_step": 102731, "epoch": 849} {"train_loss": -37.77299880981445, "global_step": 102732, "epoch": 849} {"train_loss": -37.85390853881836, "global_step": 102733, "epoch": 849} {"train_loss": -37.53849411010742, "global_step": 102734, "epoch": 849} {"train_loss": -38.11076736450195, "global_step": 102735, "epoch": 849} {"train_loss": -38.55938720703125, "global_step": 102736, "epoch": 849} {"train_loss": -38.155731201171875, "global_step": 102737, "epoch": 849} {"train_loss": -38.79757308959961, "global_step": 102738, "epoch": 849} {"train_loss": -38.305946350097656, "global_step": 102739, "epoch": 849} {"train_loss": -36.709476470947266, "global_step": 102740, "epoch": 849} {"train_loss": -38.10956954956055, "global_step": 102741, "epoch": 849} {"train_loss": -38.164669036865234, "global_step": 102742, "epoch": 849} {"train_loss": -38.97962188720703, "global_step": 102743, "epoch": 849} {"train_loss": -38.637168884277344, "global_step": 102744, "epoch": 849} {"train_loss": -38.02288818359375, "global_step": 102745, "epoch": 849} {"train_loss": -38.138545989990234, "global_step": 102746, "epoch": 849} {"train_loss": -38.89995193481445, "global_step": 102747, "epoch": 849} {"train_loss": -38.5790901184082, "global_step": 102748, "epoch": 849} {"train_loss": -38.50942611694336, "global_step": 102749, "epoch": 849} {"train_loss": -38.81421661376953, "global_step": 102750, "epoch": 849} {"train_loss": -37.90757751464844, "global_step": 102751, "epoch": 849} {"train_loss": -38.7786979675293, "global_step": 102752, "epoch": 849} {"train_loss": -38.263641357421875, "global_step": 102753, "epoch": 849} {"train_loss": -38.77767562866211, "global_step": 102754, "epoch": 849} {"train_loss": -38.4517707824707, "global_step": 102755, "epoch": 849} {"train_loss": -38.993316650390625, "global_step": 102756, "epoch": 849} {"train_loss": -38.06242752075195, "global_step": 102757, "epoch": 849} {"train_loss": -38.909969329833984, "global_step": 102758, "epoch": 849} {"train_loss": -38.94913864135742, "global_step": 102759, "epoch": 849} {"train_loss": -38.78266525268555, "global_step": 102760, "epoch": 849} {"train_loss": -39.09890365600586, "global_step": 102761, "epoch": 849} {"train_loss": -38.76992416381836, "global_step": 102762, "epoch": 849} {"train_loss": -39.089820861816406, "global_step": 102763, "epoch": 849} {"train_loss": -38.91288375854492, "global_step": 102764, "epoch": 849} {"train_loss": -38.053009033203125, "global_step": 102765, "epoch": 849} {"train_loss": -38.26428985595703, "global_step": 102766, "epoch": 849} {"train_loss": -38.9271354675293, "global_step": 102767, "epoch": 849} {"train_loss": -39.007564544677734, "global_step": 102768, "epoch": 849} {"train_loss": -38.95357894897461, "global_step": 102769, "epoch": 849} {"train_loss": -38.52058029174805, "global_step": 102770, "epoch": 849} {"train_loss": -38.56734848022461, "global_step": 102771, "epoch": 849} {"train_loss": -38.89554977416992, "global_step": 102772, "epoch": 849} {"train_loss": -39.45943832397461, "global_step": 102773, "epoch": 849} {"train_loss": -38.80286407470703, "global_step": 102774, "epoch": 849} {"train_loss": -38.625362396240234, "global_step": 102775, "epoch": 849} {"train_loss": -38.640480041503906, "global_step": 102776, "epoch": 849} {"train_loss": -38.710357666015625, "global_step": 102777, "epoch": 849} {"train_loss": -38.35982894897461, "global_step": 102778, "epoch": 849} {"train_loss": -38.13648986816406, "global_step": 102779, "epoch": 849} {"train_loss": -38.277679443359375, "global_step": 102780, "epoch": 849} {"train_loss": -39.28571319580078, "global_step": 102781, "epoch": 849} {"train_loss": -39.411231994628906, "global_step": 102782, "epoch": 849} {"train_loss": -39.24113082885742, "global_step": 102783, "epoch": 849} {"train_loss": -38.231300354003906, "global_step": 102784, "epoch": 849} {"train_loss": -38.57633590698242, "global_step": 102785, "epoch": 849} {"train_loss": -38.627689361572266, "global_step": 102786, "epoch": 849} {"train_loss": -38.362815856933594, "global_step": 102787, "epoch": 849} {"train_loss": -38.357208251953125, "global_step": 102788, "epoch": 849} {"train_loss": -39.01331329345703, "global_step": 102789, "epoch": 849} {"train_loss": -37.76871109008789, "global_step": 102790, "epoch": 849} {"train_loss": -38.12160873413086, "global_step": 102791, "epoch": 849} {"train_loss": -38.42539596557617, "global_step": 102792, "epoch": 849} {"train_loss": -37.86587905883789, "global_step": 102793, "epoch": 849} {"train_loss": -38.55403518676758, "global_step": 102794, "epoch": 849} {"train_loss": -38.59010696411133, "global_step": 102795, "epoch": 849} {"train_loss": -38.759159088134766, "global_step": 102796, "epoch": 849} {"train_loss": -38.53963088989258, "global_step": 102797, "epoch": 849} {"train_loss": -37.24113082885742, "global_step": 102798, "epoch": 849} {"train_loss": -37.133148193359375, "global_step": 102799, "epoch": 849} {"train_loss": -38.936519622802734, "global_step": 102800, "epoch": 849} {"train_loss": -37.491939544677734, "global_step": 102801, "epoch": 849} {"train_loss": -35.36842727661133, "global_step": 102802, "epoch": 849} {"train_loss": -34.92527389526367, "global_step": 102803, "epoch": 849} {"train_loss": -35.83506393432617, "global_step": 102804, "epoch": 849} {"train_loss": -36.99683380126953, "global_step": 102805, "epoch": 849} {"train_loss": -35.51601791381836, "global_step": 102806, "epoch": 849} {"train_loss": -36.17299270629883, "global_step": 102807, "epoch": 849} {"train_loss": -36.86824035644531, "global_step": 102808, "epoch": 849} {"train_loss": -34.28828048706055, "global_step": 102809, "epoch": 849} {"train_loss": -37.6011848449707, "global_step": 102810, "epoch": 849} {"train_loss": -36.61365509033203, "global_step": 102811, "epoch": 849} {"train_loss": -36.62423324584961, "global_step": 102812, "epoch": 849} {"train_loss": -36.18528747558594, "global_step": 102813, "epoch": 849} {"train_loss": -35.98695755004883, "global_step": 102814, "epoch": 849} {"train_loss": -36.32001495361328, "global_step": 102815, "epoch": 849} {"train_loss": -33.582374572753906, "global_step": 102816, "epoch": 849} {"train_loss": -37.54425048828125, "global_step": 102817, "epoch": 849} {"train_loss": -35.95893478393555, "global_step": 102818, "epoch": 849} {"train_loss": -32.854408264160156, "global_step": 102819, "epoch": 849} {"train_loss": -34.08156204223633, "global_step": 102820, "epoch": 849} {"train_loss": -35.26002502441406, "global_step": 102821, "epoch": 849} {"train_loss": -35.115962982177734, "global_step": 102822, "epoch": 849} {"train_loss": -36.1651725769043, "global_step": 102823, "epoch": 849} {"train_loss": -36.70405960083008, "global_step": 102824, "epoch": 849} {"train_loss": -34.8142204284668, "global_step": 102825, "epoch": 849} {"train_loss": -35.913978576660156, "global_step": 102826, "epoch": 849} {"train_loss": -36.099205017089844, "global_step": 102827, "epoch": 849} {"train_loss": -35.33087921142578, "global_step": 102828, "epoch": 849} {"train_loss": -32.166175842285156, "global_step": 102829, "epoch": 849} {"train_loss": -32.202823638916016, "global_step": 102830, "epoch": 849} {"train_loss": -36.905250549316406, "global_step": 102831, "epoch": 849} {"train_loss": -35.174930572509766, "global_step": 102832, "epoch": 849} {"train_loss": -35.77299118041992, "global_step": 102833, "epoch": 849} {"train_loss": -36.097145080566406, "global_step": 102834, "epoch": 849} {"train_loss": -35.54865264892578, "global_step": 102835, "epoch": 849} {"train_loss": -34.802650451660156, "global_step": 102836, "epoch": 849} {"train_loss": -36.309959411621094, "global_step": 102837, "epoch": 849} {"train_loss": -36.346710205078125, "global_step": 102838, "epoch": 849} {"train_loss": -35.56468200683594, "global_step": 102839, "epoch": 849} {"train_loss": -36.392303466796875, "global_step": 102840, "epoch": 849} {"train_loss": -36.289588928222656, "global_step": 102841, "epoch": 849} {"train_loss": -36.12921905517578, "global_step": 102842, "epoch": 849} {"train_loss": -37.16755294799805, "global_step": 102843, "epoch": 849} {"train_loss": -37.26762008666992, "global_step": 102844, "epoch": 849} {"train_loss": -36.01068115234375, "global_step": 102845, "epoch": 849} {"train_loss": -36.8780517578125, "global_step": 102846, "epoch": 849} {"train_loss": -37.078521728515625, "global_step": 102847, "epoch": 849} {"train_loss": -36.6550178527832, "global_step": 102848, "epoch": 849} {"train_loss": -37.3857105034442, "global_step": 102849, "epoch": 849, "val_loss": 2675135.0} {"train_loss": -36.961158752441406, "global_step": 102850, "epoch": 850} {"train_loss": -37.18389892578125, "global_step": 102851, "epoch": 850} {"train_loss": -37.33018493652344, "global_step": 102852, "epoch": 850} {"train_loss": -37.61322021484375, "global_step": 102853, "epoch": 850} {"train_loss": -37.03373336791992, "global_step": 102854, "epoch": 850} {"train_loss": -37.319969177246094, "global_step": 102855, "epoch": 850} {"train_loss": -37.390655517578125, "global_step": 102856, "epoch": 850} {"train_loss": -37.56953048706055, "global_step": 102857, "epoch": 850} {"train_loss": -37.613739013671875, "global_step": 102858, "epoch": 850} {"train_loss": -36.90304183959961, "global_step": 102859, "epoch": 850} {"train_loss": -37.72739791870117, "global_step": 102860, "epoch": 850} {"train_loss": -36.63579177856445, "global_step": 102861, "epoch": 850} {"train_loss": -37.540061950683594, "global_step": 102862, "epoch": 850} {"train_loss": -37.493629455566406, "global_step": 102863, "epoch": 850} {"train_loss": -37.33197021484375, "global_step": 102864, "epoch": 850} {"train_loss": -37.14344024658203, "global_step": 102865, "epoch": 850} {"train_loss": -37.558895111083984, "global_step": 102866, "epoch": 850} {"train_loss": -37.70524978637695, "global_step": 102867, "epoch": 850} {"train_loss": -38.10065460205078, "global_step": 102868, "epoch": 850} {"train_loss": -37.833717346191406, "global_step": 102869, "epoch": 850} {"train_loss": -38.1529655456543, "global_step": 102870, "epoch": 850} {"train_loss": -38.09275436401367, "global_step": 102871, "epoch": 850} {"train_loss": -37.976043701171875, "global_step": 102872, "epoch": 850} {"train_loss": -38.12183380126953, "global_step": 102873, "epoch": 850} {"train_loss": -37.89836883544922, "global_step": 102874, "epoch": 850} {"train_loss": -38.10786056518555, "global_step": 102875, "epoch": 850} {"train_loss": -38.220760345458984, "global_step": 102876, "epoch": 850} {"train_loss": -38.54896545410156, "global_step": 102877, "epoch": 850} {"train_loss": -37.793312072753906, "global_step": 102878, "epoch": 850} {"train_loss": -38.001224517822266, "global_step": 102879, "epoch": 850} {"train_loss": -38.5379753112793, "global_step": 102880, "epoch": 850} {"train_loss": -38.60444259643555, "global_step": 102881, "epoch": 850} {"train_loss": -38.91060256958008, "global_step": 102882, "epoch": 850} {"train_loss": -38.199920654296875, "global_step": 102883, "epoch": 850} {"train_loss": -38.66818618774414, "global_step": 102884, "epoch": 850} {"train_loss": -38.30303192138672, "global_step": 102885, "epoch": 850} {"train_loss": -37.77492904663086, "global_step": 102886, "epoch": 850} {"train_loss": -38.49549865722656, "global_step": 102887, "epoch": 850} {"train_loss": -38.71669387817383, "global_step": 102888, "epoch": 850} {"train_loss": -39.06834411621094, "global_step": 102889, "epoch": 850} {"train_loss": -38.520172119140625, "global_step": 102890, "epoch": 850} {"train_loss": -38.85600280761719, "global_step": 102891, "epoch": 850} {"train_loss": -38.727699279785156, "global_step": 102892, "epoch": 850} {"train_loss": -38.881378173828125, "global_step": 102893, "epoch": 850} {"train_loss": -38.61982345581055, "global_step": 102894, "epoch": 850} {"train_loss": -38.252193450927734, "global_step": 102895, "epoch": 850} {"train_loss": -38.028541564941406, "global_step": 102896, "epoch": 850} {"train_loss": -37.7822380065918, "global_step": 102897, "epoch": 850} {"train_loss": -37.93164825439453, "global_step": 102898, "epoch": 850} {"train_loss": -38.143306732177734, "global_step": 102899, "epoch": 850} {"train_loss": -38.38913345336914, "global_step": 102900, "epoch": 850} {"train_loss": -38.426239013671875, "global_step": 102901, "epoch": 850} {"train_loss": -38.8117561340332, "global_step": 102902, "epoch": 850} {"train_loss": -38.76186752319336, "global_step": 102903, "epoch": 850} {"train_loss": -38.595184326171875, "global_step": 102904, "epoch": 850} {"train_loss": -38.431976318359375, "global_step": 102905, "epoch": 850} {"train_loss": -37.26095199584961, "global_step": 102906, "epoch": 850} {"train_loss": -37.30585861206055, "global_step": 102907, "epoch": 850} {"train_loss": -37.09553909301758, "global_step": 102908, "epoch": 850} {"train_loss": -35.88288497924805, "global_step": 102909, "epoch": 850} {"train_loss": -33.920989990234375, "global_step": 102910, "epoch": 850} {"train_loss": -33.53262710571289, "global_step": 102911, "epoch": 850} {"train_loss": -34.054744720458984, "global_step": 102912, "epoch": 850} {"train_loss": -37.03923416137695, "global_step": 102913, "epoch": 850} {"train_loss": -37.600502014160156, "global_step": 102914, "epoch": 850} {"train_loss": -37.572696685791016, "global_step": 102915, "epoch": 850} {"train_loss": -38.39496612548828, "global_step": 102916, "epoch": 850} {"train_loss": -38.585731506347656, "global_step": 102917, "epoch": 850} {"train_loss": -37.28560256958008, "global_step": 102918, "epoch": 850} {"train_loss": -36.57318115234375, "global_step": 102919, "epoch": 850} {"train_loss": -34.63480758666992, "global_step": 102920, "epoch": 850} {"train_loss": -30.182235717773438, "global_step": 102921, "epoch": 850} {"train_loss": -34.03472137451172, "global_step": 102922, "epoch": 850} {"train_loss": -38.30826950073242, "global_step": 102923, "epoch": 850} {"train_loss": -30.9372501373291, "global_step": 102924, "epoch": 850} {"train_loss": -31.70991325378418, "global_step": 102925, "epoch": 850} {"train_loss": -33.02255630493164, "global_step": 102926, "epoch": 850} {"train_loss": -29.512699127197266, "global_step": 102927, "epoch": 850} {"train_loss": -33.68380355834961, "global_step": 102928, "epoch": 850} {"train_loss": -34.570072174072266, "global_step": 102929, "epoch": 850} {"train_loss": -29.233551025390625, "global_step": 102930, "epoch": 850} {"train_loss": -33.089874267578125, "global_step": 102931, "epoch": 850} {"train_loss": -27.658048629760742, "global_step": 102932, "epoch": 850} {"train_loss": -29.25007438659668, "global_step": 102933, "epoch": 850} {"train_loss": -36.33987045288086, "global_step": 102934, "epoch": 850} {"train_loss": -34.635101318359375, "global_step": 102935, "epoch": 850} {"train_loss": -33.227874755859375, "global_step": 102936, "epoch": 850} {"train_loss": -34.1621208190918, "global_step": 102937, "epoch": 850} {"train_loss": -36.083251953125, "global_step": 102938, "epoch": 850} {"train_loss": -35.470455169677734, "global_step": 102939, "epoch": 850} {"train_loss": -34.99876403808594, "global_step": 102940, "epoch": 850} {"train_loss": -35.16451644897461, "global_step": 102941, "epoch": 850} {"train_loss": -35.61245346069336, "global_step": 102942, "epoch": 850} {"train_loss": -35.91530227661133, "global_step": 102943, "epoch": 850} {"train_loss": -29.31304359436035, "global_step": 102944, "epoch": 850} {"train_loss": -36.4024543762207, "global_step": 102945, "epoch": 850} {"train_loss": -36.801361083984375, "global_step": 102946, "epoch": 850} {"train_loss": -32.8680305480957, "global_step": 102947, "epoch": 850} {"train_loss": -35.40614700317383, "global_step": 102948, "epoch": 850} {"train_loss": -35.00642013549805, "global_step": 102949, "epoch": 850} {"train_loss": -30.693023681640625, "global_step": 102950, "epoch": 850} {"train_loss": -34.64216995239258, "global_step": 102951, "epoch": 850} {"train_loss": -35.27462387084961, "global_step": 102952, "epoch": 850} {"train_loss": -34.62403869628906, "global_step": 102953, "epoch": 850} {"train_loss": -35.54484176635742, "global_step": 102954, "epoch": 850} {"train_loss": -35.681365966796875, "global_step": 102955, "epoch": 850} {"train_loss": -35.574214935302734, "global_step": 102956, "epoch": 850} {"train_loss": -36.80503845214844, "global_step": 102957, "epoch": 850} {"train_loss": -35.98257064819336, "global_step": 102958, "epoch": 850} {"train_loss": -33.1065673828125, "global_step": 102959, "epoch": 850} {"train_loss": -35.4336051940918, "global_step": 102960, "epoch": 850} {"train_loss": -33.3636589050293, "global_step": 102961, "epoch": 850} {"train_loss": -33.015953063964844, "global_step": 102962, "epoch": 850} {"train_loss": -34.928932189941406, "global_step": 102963, "epoch": 850} {"train_loss": -36.08341979980469, "global_step": 102964, "epoch": 850} {"train_loss": -36.3691520690918, "global_step": 102965, "epoch": 850} {"train_loss": -35.66780471801758, "global_step": 102966, "epoch": 850} {"train_loss": -36.46913528442383, "global_step": 102967, "epoch": 850} {"train_loss": -36.36332321166992, "global_step": 102968, "epoch": 850} {"train_loss": -34.309871673583984, "global_step": 102969, "epoch": 850} {"train_loss": -36.242328628035615, "global_step": 102970, "epoch": 850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2614537.25} {"train_loss": -37.15625762939453, "global_step": 102971, "epoch": 851} {"train_loss": -33.54356384277344, "global_step": 102972, "epoch": 851} {"train_loss": -36.085906982421875, "global_step": 102973, "epoch": 851} {"train_loss": -36.00585174560547, "global_step": 102974, "epoch": 851} {"train_loss": -36.65073776245117, "global_step": 102975, "epoch": 851} {"train_loss": -37.02102279663086, "global_step": 102976, "epoch": 851} {"train_loss": -36.76983642578125, "global_step": 102977, "epoch": 851} {"train_loss": -36.87738800048828, "global_step": 102978, "epoch": 851} {"train_loss": -36.343135833740234, "global_step": 102979, "epoch": 851} {"train_loss": -36.701080322265625, "global_step": 102980, "epoch": 851} {"train_loss": -36.72184371948242, "global_step": 102981, "epoch": 851} {"train_loss": -36.56421661376953, "global_step": 102982, "epoch": 851} {"train_loss": -37.04801940917969, "global_step": 102983, "epoch": 851} {"train_loss": -36.91512680053711, "global_step": 102984, "epoch": 851} {"train_loss": -37.14258575439453, "global_step": 102985, "epoch": 851} {"train_loss": -37.276771545410156, "global_step": 102986, "epoch": 851} {"train_loss": -36.91776657104492, "global_step": 102987, "epoch": 851} {"train_loss": -37.71284866333008, "global_step": 102988, "epoch": 851} {"train_loss": -37.38645553588867, "global_step": 102989, "epoch": 851} {"train_loss": -37.00678253173828, "global_step": 102990, "epoch": 851} {"train_loss": -37.593223571777344, "global_step": 102991, "epoch": 851} {"train_loss": -37.805973052978516, "global_step": 102992, "epoch": 851} {"train_loss": -37.71895980834961, "global_step": 102993, "epoch": 851} {"train_loss": -37.651397705078125, "global_step": 102994, "epoch": 851} {"train_loss": -37.348968505859375, "global_step": 102995, "epoch": 851} {"train_loss": -37.5403938293457, "global_step": 102996, "epoch": 851} {"train_loss": -37.59334182739258, "global_step": 102997, "epoch": 851} {"train_loss": -38.08241271972656, "global_step": 102998, "epoch": 851} {"train_loss": -37.901737213134766, "global_step": 102999, "epoch": 851} {"train_loss": -37.908111572265625, "global_step": 103000, "epoch": 851} {"train_loss": -38.18983840942383, "global_step": 103001, "epoch": 851} {"train_loss": -38.21445846557617, "global_step": 103002, "epoch": 851} {"train_loss": -38.279293060302734, "global_step": 103003, "epoch": 851} {"train_loss": -38.36372756958008, "global_step": 103004, "epoch": 851} {"train_loss": -36.7989501953125, "global_step": 103005, "epoch": 851} {"train_loss": -37.50865173339844, "global_step": 103006, "epoch": 851} {"train_loss": -36.293025970458984, "global_step": 103007, "epoch": 851} {"train_loss": -38.30086898803711, "global_step": 103008, "epoch": 851} {"train_loss": -38.41779708862305, "global_step": 103009, "epoch": 851} {"train_loss": -38.14542770385742, "global_step": 103010, "epoch": 851} {"train_loss": -38.523963928222656, "global_step": 103011, "epoch": 851} {"train_loss": -38.247161865234375, "global_step": 103012, "epoch": 851} {"train_loss": -38.31232833862305, "global_step": 103013, "epoch": 851} {"train_loss": -37.983943939208984, "global_step": 103014, "epoch": 851} {"train_loss": -38.525394439697266, "global_step": 103015, "epoch": 851} {"train_loss": -38.3990364074707, "global_step": 103016, "epoch": 851} {"train_loss": -38.76154327392578, "global_step": 103017, "epoch": 851} {"train_loss": -38.78154373168945, "global_step": 103018, "epoch": 851} {"train_loss": -38.2183837890625, "global_step": 103019, "epoch": 851} {"train_loss": -38.18489074707031, "global_step": 103020, "epoch": 851} {"train_loss": -38.53889846801758, "global_step": 103021, "epoch": 851} {"train_loss": -38.99443435668945, "global_step": 103022, "epoch": 851} {"train_loss": -38.453792572021484, "global_step": 103023, "epoch": 851} {"train_loss": -37.96600341796875, "global_step": 103024, "epoch": 851} {"train_loss": -38.934505462646484, "global_step": 103025, "epoch": 851} {"train_loss": -38.2003059387207, "global_step": 103026, "epoch": 851} {"train_loss": -38.67397689819336, "global_step": 103027, "epoch": 851} {"train_loss": -38.21331787109375, "global_step": 103028, "epoch": 851} {"train_loss": -38.75014877319336, "global_step": 103029, "epoch": 851} {"train_loss": -39.11799240112305, "global_step": 103030, "epoch": 851} {"train_loss": -38.94697189331055, "global_step": 103031, "epoch": 851} {"train_loss": -38.64179229736328, "global_step": 103032, "epoch": 851} {"train_loss": -39.13108825683594, "global_step": 103033, "epoch": 851} {"train_loss": -39.03324508666992, "global_step": 103034, "epoch": 851} {"train_loss": -38.77631759643555, "global_step": 103035, "epoch": 851} {"train_loss": -38.79011917114258, "global_step": 103036, "epoch": 851} {"train_loss": -38.42527389526367, "global_step": 103037, "epoch": 851} {"train_loss": -39.10878372192383, "global_step": 103038, "epoch": 851} {"train_loss": -38.81074142456055, "global_step": 103039, "epoch": 851} {"train_loss": -38.268001556396484, "global_step": 103040, "epoch": 851} {"train_loss": -38.72329330444336, "global_step": 103041, "epoch": 851} {"train_loss": -38.649635314941406, "global_step": 103042, "epoch": 851} {"train_loss": -38.71039962768555, "global_step": 103043, "epoch": 851} {"train_loss": -38.53957748413086, "global_step": 103044, "epoch": 851} {"train_loss": -39.07803726196289, "global_step": 103045, "epoch": 851} {"train_loss": -38.49625778198242, "global_step": 103046, "epoch": 851} {"train_loss": -39.017574310302734, "global_step": 103047, "epoch": 851} {"train_loss": -38.77180480957031, "global_step": 103048, "epoch": 851} {"train_loss": -38.860816955566406, "global_step": 103049, "epoch": 851} {"train_loss": -38.42548370361328, "global_step": 103050, "epoch": 851} {"train_loss": -38.86745071411133, "global_step": 103051, "epoch": 851} {"train_loss": -38.73933029174805, "global_step": 103052, "epoch": 851} {"train_loss": -39.15900802612305, "global_step": 103053, "epoch": 851} {"train_loss": -39.303688049316406, "global_step": 103054, "epoch": 851} {"train_loss": -39.179927825927734, "global_step": 103055, "epoch": 851} {"train_loss": -39.15064239501953, "global_step": 103056, "epoch": 851} {"train_loss": -39.31447219848633, "global_step": 103057, "epoch": 851} {"train_loss": -39.03736114501953, "global_step": 103058, "epoch": 851} {"train_loss": -39.01742935180664, "global_step": 103059, "epoch": 851} {"train_loss": -37.960243225097656, "global_step": 103060, "epoch": 851} {"train_loss": -39.0971794128418, "global_step": 103061, "epoch": 851} {"train_loss": -37.850440979003906, "global_step": 103062, "epoch": 851} {"train_loss": -38.56069564819336, "global_step": 103063, "epoch": 851} {"train_loss": -37.883724212646484, "global_step": 103064, "epoch": 851} {"train_loss": -38.86824417114258, "global_step": 103065, "epoch": 851} {"train_loss": -38.8581657409668, "global_step": 103066, "epoch": 851} {"train_loss": -38.857521057128906, "global_step": 103067, "epoch": 851} {"train_loss": -38.16119384765625, "global_step": 103068, "epoch": 851} {"train_loss": -37.62687683105469, "global_step": 103069, "epoch": 851} {"train_loss": -38.5770149230957, "global_step": 103070, "epoch": 851} {"train_loss": -37.57931900024414, "global_step": 103071, "epoch": 851} {"train_loss": -34.43439865112305, "global_step": 103072, "epoch": 851} {"train_loss": -30.97212028503418, "global_step": 103073, "epoch": 851} {"train_loss": -30.844436645507812, "global_step": 103074, "epoch": 851} {"train_loss": -36.17176055908203, "global_step": 103075, "epoch": 851} {"train_loss": -31.0606689453125, "global_step": 103076, "epoch": 851} {"train_loss": -31.49149513244629, "global_step": 103077, "epoch": 851} {"train_loss": -33.88100814819336, "global_step": 103078, "epoch": 851} {"train_loss": -36.25022506713867, "global_step": 103079, "epoch": 851} {"train_loss": -36.293067932128906, "global_step": 103080, "epoch": 851} {"train_loss": -33.89262008666992, "global_step": 103081, "epoch": 851} {"train_loss": -36.67619323730469, "global_step": 103082, "epoch": 851} {"train_loss": -35.392112731933594, "global_step": 103083, "epoch": 851} {"train_loss": -35.25790023803711, "global_step": 103084, "epoch": 851} {"train_loss": -36.394012451171875, "global_step": 103085, "epoch": 851} {"train_loss": -35.66259765625, "global_step": 103086, "epoch": 851} {"train_loss": -36.180789947509766, "global_step": 103087, "epoch": 851} {"train_loss": -36.93975830078125, "global_step": 103088, "epoch": 851} {"train_loss": -36.81415939331055, "global_step": 103089, "epoch": 851} {"train_loss": -36.3246955871582, "global_step": 103090, "epoch": 851} {"train_loss": -37.556790060248254, "global_step": 103091, "epoch": 851, "val_loss": 2593226.5} {"train_loss": -36.038936614990234, "global_step": 103092, "epoch": 852} {"train_loss": -35.6521110534668, "global_step": 103093, "epoch": 852} {"train_loss": -36.67182159423828, "global_step": 103094, "epoch": 852} {"train_loss": -37.217159271240234, "global_step": 103095, "epoch": 852} {"train_loss": -37.30491256713867, "global_step": 103096, "epoch": 852} {"train_loss": -36.798744201660156, "global_step": 103097, "epoch": 852} {"train_loss": -37.386627197265625, "global_step": 103098, "epoch": 852} {"train_loss": -37.18986129760742, "global_step": 103099, "epoch": 852} {"train_loss": -37.363975524902344, "global_step": 103100, "epoch": 852} {"train_loss": -37.90170669555664, "global_step": 103101, "epoch": 852} {"train_loss": -37.26935958862305, "global_step": 103102, "epoch": 852} {"train_loss": -37.404808044433594, "global_step": 103103, "epoch": 852} {"train_loss": -37.45939254760742, "global_step": 103104, "epoch": 852} {"train_loss": -37.232452392578125, "global_step": 103105, "epoch": 852} {"train_loss": -37.36683654785156, "global_step": 103106, "epoch": 852} {"train_loss": -37.769615173339844, "global_step": 103107, "epoch": 852} {"train_loss": -36.768333435058594, "global_step": 103108, "epoch": 852} {"train_loss": -37.84361267089844, "global_step": 103109, "epoch": 852} {"train_loss": -37.96992111206055, "global_step": 103110, "epoch": 852} {"train_loss": -36.80574417114258, "global_step": 103111, "epoch": 852} {"train_loss": -38.607765197753906, "global_step": 103112, "epoch": 852} {"train_loss": -37.43171310424805, "global_step": 103113, "epoch": 852} {"train_loss": -38.571937561035156, "global_step": 103114, "epoch": 852} {"train_loss": -37.89791488647461, "global_step": 103115, "epoch": 852} {"train_loss": -38.35464096069336, "global_step": 103116, "epoch": 852} {"train_loss": -38.2303581237793, "global_step": 103117, "epoch": 852} {"train_loss": -38.9318962097168, "global_step": 103118, "epoch": 852} {"train_loss": -38.400054931640625, "global_step": 103119, "epoch": 852} {"train_loss": -38.192623138427734, "global_step": 103120, "epoch": 852} {"train_loss": -38.38145065307617, "global_step": 103121, "epoch": 852} {"train_loss": -39.200069427490234, "global_step": 103122, "epoch": 852} {"train_loss": -38.937843322753906, "global_step": 103123, "epoch": 852} {"train_loss": -38.489200592041016, "global_step": 103124, "epoch": 852} {"train_loss": -38.38139724731445, "global_step": 103125, "epoch": 852} {"train_loss": -38.61065673828125, "global_step": 103126, "epoch": 852} {"train_loss": -38.16671371459961, "global_step": 103127, "epoch": 852} {"train_loss": -39.2186393737793, "global_step": 103128, "epoch": 852} {"train_loss": -38.62807846069336, "global_step": 103129, "epoch": 852} {"train_loss": -38.68281936645508, "global_step": 103130, "epoch": 852} {"train_loss": -38.73973846435547, "global_step": 103131, "epoch": 852} {"train_loss": -38.9455680847168, "global_step": 103132, "epoch": 852} {"train_loss": -38.54098129272461, "global_step": 103133, "epoch": 852} {"train_loss": -38.807613372802734, "global_step": 103134, "epoch": 852} {"train_loss": -38.93606185913086, "global_step": 103135, "epoch": 852} {"train_loss": -38.831172943115234, "global_step": 103136, "epoch": 852} {"train_loss": -38.74653625488281, "global_step": 103137, "epoch": 852} {"train_loss": -38.99724197387695, "global_step": 103138, "epoch": 852} {"train_loss": -38.759307861328125, "global_step": 103139, "epoch": 852} {"train_loss": -39.21159362792969, "global_step": 103140, "epoch": 852} {"train_loss": -39.292396545410156, "global_step": 103141, "epoch": 852} {"train_loss": -38.774173736572266, "global_step": 103142, "epoch": 852} {"train_loss": -39.11440658569336, "global_step": 103143, "epoch": 852} {"train_loss": -39.00819778442383, "global_step": 103144, "epoch": 852} {"train_loss": -39.191043853759766, "global_step": 103145, "epoch": 852} {"train_loss": -39.38320541381836, "global_step": 103146, "epoch": 852} {"train_loss": -38.77418899536133, "global_step": 103147, "epoch": 852} {"train_loss": -39.24898147583008, "global_step": 103148, "epoch": 852} {"train_loss": -39.248008728027344, "global_step": 103149, "epoch": 852} {"train_loss": -39.369537353515625, "global_step": 103150, "epoch": 852} {"train_loss": -39.27812576293945, "global_step": 103151, "epoch": 852} {"train_loss": -39.46971893310547, "global_step": 103152, "epoch": 852} {"train_loss": -39.31393051147461, "global_step": 103153, "epoch": 852} {"train_loss": -38.891902923583984, "global_step": 103154, "epoch": 852} {"train_loss": -39.55681228637695, "global_step": 103155, "epoch": 852} {"train_loss": -38.578243255615234, "global_step": 103156, "epoch": 852} {"train_loss": -38.38077926635742, "global_step": 103157, "epoch": 852} {"train_loss": -39.15300369262695, "global_step": 103158, "epoch": 852} {"train_loss": -39.10405349731445, "global_step": 103159, "epoch": 852} {"train_loss": -38.70985412597656, "global_step": 103160, "epoch": 852} {"train_loss": -38.53329849243164, "global_step": 103161, "epoch": 852} {"train_loss": -38.838905334472656, "global_step": 103162, "epoch": 852} {"train_loss": -39.21173095703125, "global_step": 103163, "epoch": 852} {"train_loss": -39.16034698486328, "global_step": 103164, "epoch": 852} {"train_loss": -39.02602767944336, "global_step": 103165, "epoch": 852} {"train_loss": -38.18037796020508, "global_step": 103166, "epoch": 852} {"train_loss": -38.29144287109375, "global_step": 103167, "epoch": 852} {"train_loss": -38.6379280090332, "global_step": 103168, "epoch": 852} {"train_loss": -39.42085266113281, "global_step": 103169, "epoch": 852} {"train_loss": -39.212379455566406, "global_step": 103170, "epoch": 852} {"train_loss": -39.354393005371094, "global_step": 103171, "epoch": 852} {"train_loss": -39.62531661987305, "global_step": 103172, "epoch": 852} {"train_loss": -39.387447357177734, "global_step": 103173, "epoch": 852} {"train_loss": -38.177886962890625, "global_step": 103174, "epoch": 852} {"train_loss": -38.63393783569336, "global_step": 103175, "epoch": 852} {"train_loss": -39.49626541137695, "global_step": 103176, "epoch": 852} {"train_loss": -38.874847412109375, "global_step": 103177, "epoch": 852} {"train_loss": -37.970008850097656, "global_step": 103178, "epoch": 852} {"train_loss": -38.214698791503906, "global_step": 103179, "epoch": 852} {"train_loss": -37.8590202331543, "global_step": 103180, "epoch": 852} {"train_loss": -38.94271469116211, "global_step": 103181, "epoch": 852} {"train_loss": -37.91038131713867, "global_step": 103182, "epoch": 852} {"train_loss": -38.450111389160156, "global_step": 103183, "epoch": 852} {"train_loss": -39.75212478637695, "global_step": 103184, "epoch": 852} {"train_loss": -38.88689041137695, "global_step": 103185, "epoch": 852} {"train_loss": -37.962623596191406, "global_step": 103186, "epoch": 852} {"train_loss": -38.56119918823242, "global_step": 103187, "epoch": 852} {"train_loss": -38.45331954956055, "global_step": 103188, "epoch": 852} {"train_loss": -39.38405227661133, "global_step": 103189, "epoch": 852} {"train_loss": -39.56322479248047, "global_step": 103190, "epoch": 852} {"train_loss": -39.2347526550293, "global_step": 103191, "epoch": 852} {"train_loss": -38.520076751708984, "global_step": 103192, "epoch": 852} {"train_loss": -38.805152893066406, "global_step": 103193, "epoch": 852} {"train_loss": -38.36811065673828, "global_step": 103194, "epoch": 852} {"train_loss": -39.16116714477539, "global_step": 103195, "epoch": 852} {"train_loss": -37.8590202331543, "global_step": 103196, "epoch": 852} {"train_loss": -37.950096130371094, "global_step": 103197, "epoch": 852} {"train_loss": -37.66321563720703, "global_step": 103198, "epoch": 852} {"train_loss": -37.04109573364258, "global_step": 103199, "epoch": 852} {"train_loss": -39.17667770385742, "global_step": 103200, "epoch": 852} {"train_loss": -36.16022872924805, "global_step": 103201, "epoch": 852} {"train_loss": -31.58108901977539, "global_step": 103202, "epoch": 852} {"train_loss": -30.509540557861328, "global_step": 103203, "epoch": 852} {"train_loss": -28.535486221313477, "global_step": 103204, "epoch": 852} {"train_loss": -34.714290618896484, "global_step": 103205, "epoch": 852} {"train_loss": -37.5733642578125, "global_step": 103206, "epoch": 852} {"train_loss": -37.6313591003418, "global_step": 103207, "epoch": 852} {"train_loss": -38.648887634277344, "global_step": 103208, "epoch": 852} {"train_loss": -36.90410614013672, "global_step": 103209, "epoch": 852} {"train_loss": -38.01393127441406, "global_step": 103210, "epoch": 852} {"train_loss": -38.12348556518555, "global_step": 103211, "epoch": 852} {"train_loss": -38.175830163246346, "global_step": 103212, "epoch": 852, "val_loss": 2616224.75} {"train_loss": -38.8701286315918, "global_step": 103213, "epoch": 853} {"train_loss": -38.315059661865234, "global_step": 103214, "epoch": 853} {"train_loss": -38.366756439208984, "global_step": 103215, "epoch": 853} {"train_loss": -37.41801071166992, "global_step": 103216, "epoch": 853} {"train_loss": -38.37567901611328, "global_step": 103217, "epoch": 853} {"train_loss": -38.3387336730957, "global_step": 103218, "epoch": 853} {"train_loss": -38.772560119628906, "global_step": 103219, "epoch": 853} {"train_loss": -38.63569259643555, "global_step": 103220, "epoch": 853} {"train_loss": -38.828765869140625, "global_step": 103221, "epoch": 853} {"train_loss": -37.388946533203125, "global_step": 103222, "epoch": 853} {"train_loss": -38.453399658203125, "global_step": 103223, "epoch": 853} {"train_loss": -38.40350341796875, "global_step": 103224, "epoch": 853} {"train_loss": -36.26569747924805, "global_step": 103225, "epoch": 853} {"train_loss": -37.921592712402344, "global_step": 103226, "epoch": 853} {"train_loss": -38.46812057495117, "global_step": 103227, "epoch": 853} {"train_loss": -38.163360595703125, "global_step": 103228, "epoch": 853} {"train_loss": -38.76701354980469, "global_step": 103229, "epoch": 853} {"train_loss": -38.866943359375, "global_step": 103230, "epoch": 853} {"train_loss": -38.433650970458984, "global_step": 103231, "epoch": 853} {"train_loss": -38.149436950683594, "global_step": 103232, "epoch": 853} {"train_loss": -38.70736312866211, "global_step": 103233, "epoch": 853} {"train_loss": -38.687191009521484, "global_step": 103234, "epoch": 853} {"train_loss": -38.3966064453125, "global_step": 103235, "epoch": 853} {"train_loss": -37.718353271484375, "global_step": 103236, "epoch": 853} {"train_loss": -38.61935806274414, "global_step": 103237, "epoch": 853} {"train_loss": -38.73069381713867, "global_step": 103238, "epoch": 853} {"train_loss": -39.06105422973633, "global_step": 103239, "epoch": 853} {"train_loss": -37.64009094238281, "global_step": 103240, "epoch": 853} {"train_loss": -38.155521392822266, "global_step": 103241, "epoch": 853} {"train_loss": -37.964691162109375, "global_step": 103242, "epoch": 853} {"train_loss": -38.56435012817383, "global_step": 103243, "epoch": 853} {"train_loss": -38.079200744628906, "global_step": 103244, "epoch": 853} {"train_loss": -38.72453308105469, "global_step": 103245, "epoch": 853} {"train_loss": -38.266387939453125, "global_step": 103246, "epoch": 853} {"train_loss": -38.82947540283203, "global_step": 103247, "epoch": 853} {"train_loss": -38.340145111083984, "global_step": 103248, "epoch": 853} {"train_loss": -37.95998001098633, "global_step": 103249, "epoch": 853} {"train_loss": -37.873939514160156, "global_step": 103250, "epoch": 853} {"train_loss": -38.65160369873047, "global_step": 103251, "epoch": 853} {"train_loss": -38.54826736450195, "global_step": 103252, "epoch": 853} {"train_loss": -36.93391036987305, "global_step": 103253, "epoch": 853} {"train_loss": -38.42374801635742, "global_step": 103254, "epoch": 853} {"train_loss": -39.154605865478516, "global_step": 103255, "epoch": 853} {"train_loss": -38.08662796020508, "global_step": 103256, "epoch": 853} {"train_loss": -38.34381866455078, "global_step": 103257, "epoch": 853} {"train_loss": -38.10298538208008, "global_step": 103258, "epoch": 853} {"train_loss": -38.31140899658203, "global_step": 103259, "epoch": 853} {"train_loss": -39.05498123168945, "global_step": 103260, "epoch": 853} {"train_loss": -37.11091995239258, "global_step": 103261, "epoch": 853} {"train_loss": -38.655296325683594, "global_step": 103262, "epoch": 853} {"train_loss": -38.989654541015625, "global_step": 103263, "epoch": 853} {"train_loss": -39.00109100341797, "global_step": 103264, "epoch": 853} {"train_loss": -37.44941711425781, "global_step": 103265, "epoch": 853} {"train_loss": -35.15202713012695, "global_step": 103266, "epoch": 853} {"train_loss": -38.313968658447266, "global_step": 103267, "epoch": 853} {"train_loss": -38.71799850463867, "global_step": 103268, "epoch": 853} {"train_loss": -31.153074264526367, "global_step": 103269, "epoch": 853} {"train_loss": -37.24457931518555, "global_step": 103270, "epoch": 853} {"train_loss": -35.97840118408203, "global_step": 103271, "epoch": 853} {"train_loss": -23.487789154052734, "global_step": 103272, "epoch": 853} {"train_loss": -35.833126068115234, "global_step": 103273, "epoch": 853} {"train_loss": -32.230751037597656, "global_step": 103274, "epoch": 853} {"train_loss": -16.727157592773438, "global_step": 103275, "epoch": 853} {"train_loss": -27.540082931518555, "global_step": 103276, "epoch": 853} {"train_loss": -16.079864501953125, "global_step": 103277, "epoch": 853} {"train_loss": -31.364500045776367, "global_step": 103278, "epoch": 853} {"train_loss": -24.379104614257812, "global_step": 103279, "epoch": 853} {"train_loss": -12.501861572265625, "global_step": 103280, "epoch": 853} {"train_loss": -17.582094192504883, "global_step": 103281, "epoch": 853} {"train_loss": -26.111780166625977, "global_step": 103282, "epoch": 853} {"train_loss": -29.651611328125, "global_step": 103283, "epoch": 853} {"train_loss": -28.55311393737793, "global_step": 103284, "epoch": 853} {"train_loss": -30.3850154876709, "global_step": 103285, "epoch": 853} {"train_loss": -29.441207885742188, "global_step": 103286, "epoch": 853} {"train_loss": -30.25948143005371, "global_step": 103287, "epoch": 853} {"train_loss": -27.570785522460938, "global_step": 103288, "epoch": 853} {"train_loss": -26.3376407623291, "global_step": 103289, "epoch": 853} {"train_loss": -27.62896728515625, "global_step": 103290, "epoch": 853} {"train_loss": -26.43861198425293, "global_step": 103291, "epoch": 853} {"train_loss": -30.2542724609375, "global_step": 103292, "epoch": 853} {"train_loss": -30.587310791015625, "global_step": 103293, "epoch": 853} {"train_loss": -31.99163246154785, "global_step": 103294, "epoch": 853} {"train_loss": -33.41268539428711, "global_step": 103295, "epoch": 853} {"train_loss": -32.3959846496582, "global_step": 103296, "epoch": 853} {"train_loss": -33.34178161621094, "global_step": 103297, "epoch": 853} {"train_loss": -32.28656005859375, "global_step": 103298, "epoch": 853} {"train_loss": -33.1090202331543, "global_step": 103299, "epoch": 853} {"train_loss": -32.026981353759766, "global_step": 103300, "epoch": 853} {"train_loss": -33.18570327758789, "global_step": 103301, "epoch": 853} {"train_loss": -32.70831298828125, "global_step": 103302, "epoch": 853} {"train_loss": -32.224464416503906, "global_step": 103303, "epoch": 853} {"train_loss": -33.05305099487305, "global_step": 103304, "epoch": 853} {"train_loss": -33.03904342651367, "global_step": 103305, "epoch": 853} {"train_loss": -33.28997039794922, "global_step": 103306, "epoch": 853} {"train_loss": -33.70033264160156, "global_step": 103307, "epoch": 853} {"train_loss": -33.11328887939453, "global_step": 103308, "epoch": 853} {"train_loss": -33.571563720703125, "global_step": 103309, "epoch": 853} {"train_loss": -33.880043029785156, "global_step": 103310, "epoch": 853} {"train_loss": -33.6680908203125, "global_step": 103311, "epoch": 853} {"train_loss": -33.479827880859375, "global_step": 103312, "epoch": 853} {"train_loss": -33.02152633666992, "global_step": 103313, "epoch": 853} {"train_loss": -34.0281867980957, "global_step": 103314, "epoch": 853} {"train_loss": -34.03976058959961, "global_step": 103315, "epoch": 853} {"train_loss": -34.142887115478516, "global_step": 103316, "epoch": 853} {"train_loss": -33.09312057495117, "global_step": 103317, "epoch": 853} {"train_loss": -34.15566635131836, "global_step": 103318, "epoch": 853} {"train_loss": -34.40743637084961, "global_step": 103319, "epoch": 853} {"train_loss": -34.09908676147461, "global_step": 103320, "epoch": 853} {"train_loss": -34.59596633911133, "global_step": 103321, "epoch": 853} {"train_loss": -34.85993576049805, "global_step": 103322, "epoch": 853} {"train_loss": -34.9533805847168, "global_step": 103323, "epoch": 853} {"train_loss": -34.52967071533203, "global_step": 103324, "epoch": 853} {"train_loss": -34.9571647644043, "global_step": 103325, "epoch": 853} {"train_loss": -33.88740921020508, "global_step": 103326, "epoch": 853} {"train_loss": -34.773597717285156, "global_step": 103327, "epoch": 853} {"train_loss": -34.5296745300293, "global_step": 103328, "epoch": 853} {"train_loss": -34.71419906616211, "global_step": 103329, "epoch": 853} {"train_loss": -34.9000244140625, "global_step": 103330, "epoch": 853} {"train_loss": -34.67680740356445, "global_step": 103331, "epoch": 853} {"train_loss": -34.9222412109375, "global_step": 103332, "epoch": 853} {"train_loss": -34.52642691430967, "global_step": 103333, "epoch": 853, "val_loss": 2708366.0} {"train_loss": -36.1684684753418, "global_step": 103334, "epoch": 854} {"train_loss": -35.312496185302734, "global_step": 103335, "epoch": 854} {"train_loss": -35.98785400390625, "global_step": 103336, "epoch": 854} {"train_loss": -35.74689483642578, "global_step": 103337, "epoch": 854} {"train_loss": -35.83531188964844, "global_step": 103338, "epoch": 854} {"train_loss": -35.38327407836914, "global_step": 103339, "epoch": 854} {"train_loss": -36.321990966796875, "global_step": 103340, "epoch": 854} {"train_loss": -34.89348220825195, "global_step": 103341, "epoch": 854} {"train_loss": -35.92768478393555, "global_step": 103342, "epoch": 854} {"train_loss": -35.03273391723633, "global_step": 103343, "epoch": 854} {"train_loss": -35.881752014160156, "global_step": 103344, "epoch": 854} {"train_loss": -35.74756622314453, "global_step": 103345, "epoch": 854} {"train_loss": -36.00312423706055, "global_step": 103346, "epoch": 854} {"train_loss": -35.612056732177734, "global_step": 103347, "epoch": 854} {"train_loss": -35.92055892944336, "global_step": 103348, "epoch": 854} {"train_loss": -35.58548355102539, "global_step": 103349, "epoch": 854} {"train_loss": -36.2996940612793, "global_step": 103350, "epoch": 854} {"train_loss": -36.77568054199219, "global_step": 103351, "epoch": 854} {"train_loss": -35.9444465637207, "global_step": 103352, "epoch": 854} {"train_loss": -36.479183197021484, "global_step": 103353, "epoch": 854} {"train_loss": -36.563411712646484, "global_step": 103354, "epoch": 854} {"train_loss": -35.76214599609375, "global_step": 103355, "epoch": 854} {"train_loss": -37.13700485229492, "global_step": 103356, "epoch": 854} {"train_loss": -36.184730529785156, "global_step": 103357, "epoch": 854} {"train_loss": -37.05669021606445, "global_step": 103358, "epoch": 854} {"train_loss": -37.48561477661133, "global_step": 103359, "epoch": 854} {"train_loss": -36.61275100708008, "global_step": 103360, "epoch": 854} {"train_loss": -36.80499267578125, "global_step": 103361, "epoch": 854} {"train_loss": -35.9232063293457, "global_step": 103362, "epoch": 854} {"train_loss": -36.63241195678711, "global_step": 103363, "epoch": 854} {"train_loss": -36.86301803588867, "global_step": 103364, "epoch": 854} {"train_loss": -37.334815979003906, "global_step": 103365, "epoch": 854} {"train_loss": -37.46266555786133, "global_step": 103366, "epoch": 854} {"train_loss": -37.21378707885742, "global_step": 103367, "epoch": 854} {"train_loss": -36.78424835205078, "global_step": 103368, "epoch": 854} {"train_loss": -36.888668060302734, "global_step": 103369, "epoch": 854} {"train_loss": -36.62446212768555, "global_step": 103370, "epoch": 854} {"train_loss": -37.320369720458984, "global_step": 103371, "epoch": 854} {"train_loss": -36.91887664794922, "global_step": 103372, "epoch": 854} {"train_loss": -37.06159591674805, "global_step": 103373, "epoch": 854} {"train_loss": -36.82528305053711, "global_step": 103374, "epoch": 854} {"train_loss": -36.125038146972656, "global_step": 103375, "epoch": 854} {"train_loss": -37.1175422668457, "global_step": 103376, "epoch": 854} {"train_loss": -37.07215881347656, "global_step": 103377, "epoch": 854} {"train_loss": -37.53011703491211, "global_step": 103378, "epoch": 854} {"train_loss": -37.47249984741211, "global_step": 103379, "epoch": 854} {"train_loss": -37.358924865722656, "global_step": 103380, "epoch": 854} {"train_loss": -37.97086715698242, "global_step": 103381, "epoch": 854} {"train_loss": -37.646236419677734, "global_step": 103382, "epoch": 854} {"train_loss": -37.238155364990234, "global_step": 103383, "epoch": 854} {"train_loss": -37.032310485839844, "global_step": 103384, "epoch": 854} {"train_loss": -37.68952560424805, "global_step": 103385, "epoch": 854} {"train_loss": -38.49294662475586, "global_step": 103386, "epoch": 854} {"train_loss": -37.54197311401367, "global_step": 103387, "epoch": 854} {"train_loss": -36.738399505615234, "global_step": 103388, "epoch": 854} {"train_loss": -37.474281311035156, "global_step": 103389, "epoch": 854} {"train_loss": -37.8104133605957, "global_step": 103390, "epoch": 854} {"train_loss": -37.313018798828125, "global_step": 103391, "epoch": 854} {"train_loss": -37.16416931152344, "global_step": 103392, "epoch": 854} {"train_loss": -37.4986686706543, "global_step": 103393, "epoch": 854} {"train_loss": -37.43903732299805, "global_step": 103394, "epoch": 854} {"train_loss": -37.085872650146484, "global_step": 103395, "epoch": 854} {"train_loss": -37.147254943847656, "global_step": 103396, "epoch": 854} {"train_loss": -37.725624084472656, "global_step": 103397, "epoch": 854} {"train_loss": -37.64406204223633, "global_step": 103398, "epoch": 854} {"train_loss": -37.9726676940918, "global_step": 103399, "epoch": 854} {"train_loss": -37.679840087890625, "global_step": 103400, "epoch": 854} {"train_loss": -36.40034103393555, "global_step": 103401, "epoch": 854} {"train_loss": -37.12595748901367, "global_step": 103402, "epoch": 854} {"train_loss": -36.838565826416016, "global_step": 103403, "epoch": 854} {"train_loss": -37.58199691772461, "global_step": 103404, "epoch": 854} {"train_loss": -36.68947982788086, "global_step": 103405, "epoch": 854} {"train_loss": -37.57184600830078, "global_step": 103406, "epoch": 854} {"train_loss": -37.64013671875, "global_step": 103407, "epoch": 854} {"train_loss": -36.85373306274414, "global_step": 103408, "epoch": 854} {"train_loss": -38.36882400512695, "global_step": 103409, "epoch": 854} {"train_loss": -36.84941482543945, "global_step": 103410, "epoch": 854} {"train_loss": -37.17167282104492, "global_step": 103411, "epoch": 854} {"train_loss": -35.4142951965332, "global_step": 103412, "epoch": 854} {"train_loss": -37.69704818725586, "global_step": 103413, "epoch": 854} {"train_loss": -35.55799102783203, "global_step": 103414, "epoch": 854} {"train_loss": -33.972442626953125, "global_step": 103415, "epoch": 854} {"train_loss": -35.342281341552734, "global_step": 103416, "epoch": 854} {"train_loss": -36.4011344909668, "global_step": 103417, "epoch": 854} {"train_loss": -36.47874069213867, "global_step": 103418, "epoch": 854} {"train_loss": -36.3972282409668, "global_step": 103419, "epoch": 854} {"train_loss": -36.64226531982422, "global_step": 103420, "epoch": 854} {"train_loss": -36.499637603759766, "global_step": 103421, "epoch": 854} {"train_loss": -37.4421272277832, "global_step": 103422, "epoch": 854} {"train_loss": -36.36906814575195, "global_step": 103423, "epoch": 854} {"train_loss": -37.25602340698242, "global_step": 103424, "epoch": 854} {"train_loss": -37.85381317138672, "global_step": 103425, "epoch": 854} {"train_loss": -37.122589111328125, "global_step": 103426, "epoch": 854} {"train_loss": -37.23517608642578, "global_step": 103427, "epoch": 854} {"train_loss": -37.3621711730957, "global_step": 103428, "epoch": 854} {"train_loss": -37.53329086303711, "global_step": 103429, "epoch": 854} {"train_loss": -37.7844352722168, "global_step": 103430, "epoch": 854} {"train_loss": -36.3514404296875, "global_step": 103431, "epoch": 854} {"train_loss": -38.00291061401367, "global_step": 103432, "epoch": 854} {"train_loss": -37.056121826171875, "global_step": 103433, "epoch": 854} {"train_loss": -38.03242111206055, "global_step": 103434, "epoch": 854} {"train_loss": -35.83842086791992, "global_step": 103435, "epoch": 854} {"train_loss": -37.680908203125, "global_step": 103436, "epoch": 854} {"train_loss": -36.57012176513672, "global_step": 103437, "epoch": 854} {"train_loss": -37.19147491455078, "global_step": 103438, "epoch": 854} {"train_loss": -37.253318786621094, "global_step": 103439, "epoch": 854} {"train_loss": -36.979183197021484, "global_step": 103440, "epoch": 854} {"train_loss": -37.231258392333984, "global_step": 103441, "epoch": 854} {"train_loss": -36.981319427490234, "global_step": 103442, "epoch": 854} {"train_loss": -37.73360824584961, "global_step": 103443, "epoch": 854} {"train_loss": -36.977386474609375, "global_step": 103444, "epoch": 854} {"train_loss": -37.64242172241211, "global_step": 103445, "epoch": 854} {"train_loss": -37.6341667175293, "global_step": 103446, "epoch": 854} {"train_loss": -38.32374954223633, "global_step": 103447, "epoch": 854} {"train_loss": -37.80282974243164, "global_step": 103448, "epoch": 854} {"train_loss": -37.9051513671875, "global_step": 103449, "epoch": 854} {"train_loss": -37.79494857788086, "global_step": 103450, "epoch": 854} {"train_loss": -37.935829162597656, "global_step": 103451, "epoch": 854} {"train_loss": -37.12040328979492, "global_step": 103452, "epoch": 854} {"train_loss": -38.15110778808594, "global_step": 103453, "epoch": 854} {"train_loss": -36.909509737629534, "global_step": 103454, "epoch": 854, "val_loss": 2675542.0} {"train_loss": -36.13063049316406, "global_step": 103455, "epoch": 855} {"train_loss": -37.117977142333984, "global_step": 103456, "epoch": 855} {"train_loss": -37.786956787109375, "global_step": 103457, "epoch": 855} {"train_loss": -38.47808837890625, "global_step": 103458, "epoch": 855} {"train_loss": -37.585506439208984, "global_step": 103459, "epoch": 855} {"train_loss": -37.04282760620117, "global_step": 103460, "epoch": 855} {"train_loss": -35.5218505859375, "global_step": 103461, "epoch": 855} {"train_loss": -35.01154327392578, "global_step": 103462, "epoch": 855} {"train_loss": -37.708290100097656, "global_step": 103463, "epoch": 855} {"train_loss": -37.838104248046875, "global_step": 103464, "epoch": 855} {"train_loss": -35.44643020629883, "global_step": 103465, "epoch": 855} {"train_loss": -34.17840576171875, "global_step": 103466, "epoch": 855} {"train_loss": -36.89887619018555, "global_step": 103467, "epoch": 855} {"train_loss": -34.98904800415039, "global_step": 103468, "epoch": 855} {"train_loss": -30.922332763671875, "global_step": 103469, "epoch": 855} {"train_loss": -35.85087966918945, "global_step": 103470, "epoch": 855} {"train_loss": -36.8465690612793, "global_step": 103471, "epoch": 855} {"train_loss": -35.52100372314453, "global_step": 103472, "epoch": 855} {"train_loss": -36.0703010559082, "global_step": 103473, "epoch": 855} {"train_loss": -37.49945831298828, "global_step": 103474, "epoch": 855} {"train_loss": -37.614444732666016, "global_step": 103475, "epoch": 855} {"train_loss": -36.99427032470703, "global_step": 103476, "epoch": 855} {"train_loss": -37.211585998535156, "global_step": 103477, "epoch": 855} {"train_loss": -37.352516174316406, "global_step": 103478, "epoch": 855} {"train_loss": -37.03412628173828, "global_step": 103479, "epoch": 855} {"train_loss": -36.70612335205078, "global_step": 103480, "epoch": 855} {"train_loss": -37.516258239746094, "global_step": 103481, "epoch": 855} {"train_loss": -35.667789459228516, "global_step": 103482, "epoch": 855} {"train_loss": -37.50046920776367, "global_step": 103483, "epoch": 855} {"train_loss": -37.88644027709961, "global_step": 103484, "epoch": 855} {"train_loss": -38.092681884765625, "global_step": 103485, "epoch": 855} {"train_loss": -37.04864501953125, "global_step": 103486, "epoch": 855} {"train_loss": -37.289894104003906, "global_step": 103487, "epoch": 855} {"train_loss": -37.57383346557617, "global_step": 103488, "epoch": 855} {"train_loss": -37.14809036254883, "global_step": 103489, "epoch": 855} {"train_loss": -36.54597091674805, "global_step": 103490, "epoch": 855} {"train_loss": -37.59843063354492, "global_step": 103491, "epoch": 855} {"train_loss": -37.81036376953125, "global_step": 103492, "epoch": 855} {"train_loss": -36.962608337402344, "global_step": 103493, "epoch": 855} {"train_loss": -37.50651931762695, "global_step": 103494, "epoch": 855} {"train_loss": -35.26693344116211, "global_step": 103495, "epoch": 855} {"train_loss": -36.84442901611328, "global_step": 103496, "epoch": 855} {"train_loss": -34.96855926513672, "global_step": 103497, "epoch": 855} {"train_loss": -29.5888614654541, "global_step": 103498, "epoch": 855} {"train_loss": -25.450902938842773, "global_step": 103499, "epoch": 855} {"train_loss": -33.97958755493164, "global_step": 103500, "epoch": 855} {"train_loss": -35.2093505859375, "global_step": 103501, "epoch": 855} {"train_loss": -33.26179122924805, "global_step": 103502, "epoch": 855} {"train_loss": -34.13620376586914, "global_step": 103503, "epoch": 855} {"train_loss": -33.84299850463867, "global_step": 103504, "epoch": 855} {"train_loss": -33.02788162231445, "global_step": 103505, "epoch": 855} {"train_loss": -36.75607681274414, "global_step": 103506, "epoch": 855} {"train_loss": -36.569759368896484, "global_step": 103507, "epoch": 855} {"train_loss": -36.46637725830078, "global_step": 103508, "epoch": 855} {"train_loss": -34.6472282409668, "global_step": 103509, "epoch": 855} {"train_loss": -33.63286590576172, "global_step": 103510, "epoch": 855} {"train_loss": -36.06006622314453, "global_step": 103511, "epoch": 855} {"train_loss": -35.735713958740234, "global_step": 103512, "epoch": 855} {"train_loss": -35.52538299560547, "global_step": 103513, "epoch": 855} {"train_loss": -36.259830474853516, "global_step": 103514, "epoch": 855} {"train_loss": -30.929685592651367, "global_step": 103515, "epoch": 855} {"train_loss": -37.18427276611328, "global_step": 103516, "epoch": 855} {"train_loss": -36.31573486328125, "global_step": 103517, "epoch": 855} {"train_loss": -36.74677276611328, "global_step": 103518, "epoch": 855} {"train_loss": -32.7357292175293, "global_step": 103519, "epoch": 855} {"train_loss": -35.906951904296875, "global_step": 103520, "epoch": 855} {"train_loss": -35.6970100402832, "global_step": 103521, "epoch": 855} {"train_loss": -35.43525314331055, "global_step": 103522, "epoch": 855} {"train_loss": -36.97147750854492, "global_step": 103523, "epoch": 855} {"train_loss": -36.39255142211914, "global_step": 103524, "epoch": 855} {"train_loss": -37.7598762512207, "global_step": 103525, "epoch": 855} {"train_loss": -36.58243179321289, "global_step": 103526, "epoch": 855} {"train_loss": -36.9410400390625, "global_step": 103527, "epoch": 855} {"train_loss": -36.2259635925293, "global_step": 103528, "epoch": 855} {"train_loss": -36.97036361694336, "global_step": 103529, "epoch": 855} {"train_loss": -37.59723663330078, "global_step": 103530, "epoch": 855} {"train_loss": -37.10248947143555, "global_step": 103531, "epoch": 855} {"train_loss": -37.332515716552734, "global_step": 103532, "epoch": 855} {"train_loss": -37.2623291015625, "global_step": 103533, "epoch": 855} {"train_loss": -37.26142120361328, "global_step": 103534, "epoch": 855} {"train_loss": -37.365882873535156, "global_step": 103535, "epoch": 855} {"train_loss": -37.58625030517578, "global_step": 103536, "epoch": 855} {"train_loss": -37.760555267333984, "global_step": 103537, "epoch": 855} {"train_loss": -37.3299560546875, "global_step": 103538, "epoch": 855} {"train_loss": -37.19911575317383, "global_step": 103539, "epoch": 855} {"train_loss": -37.174434661865234, "global_step": 103540, "epoch": 855} {"train_loss": -36.55621337890625, "global_step": 103541, "epoch": 855} {"train_loss": -35.98738479614258, "global_step": 103542, "epoch": 855} {"train_loss": -37.976436614990234, "global_step": 103543, "epoch": 855} {"train_loss": -37.76066207885742, "global_step": 103544, "epoch": 855} {"train_loss": -35.55428695678711, "global_step": 103545, "epoch": 855} {"train_loss": -36.849525451660156, "global_step": 103546, "epoch": 855} {"train_loss": -37.15606689453125, "global_step": 103547, "epoch": 855} {"train_loss": -37.52611541748047, "global_step": 103548, "epoch": 855} {"train_loss": -37.729061126708984, "global_step": 103549, "epoch": 855} {"train_loss": -37.975189208984375, "global_step": 103550, "epoch": 855} {"train_loss": -35.36189651489258, "global_step": 103551, "epoch": 855} {"train_loss": -37.12757873535156, "global_step": 103552, "epoch": 855} {"train_loss": -37.0466423034668, "global_step": 103553, "epoch": 855} {"train_loss": -36.42367935180664, "global_step": 103554, "epoch": 855} {"train_loss": -37.84873962402344, "global_step": 103555, "epoch": 855} {"train_loss": -37.627166748046875, "global_step": 103556, "epoch": 855} {"train_loss": -37.59029769897461, "global_step": 103557, "epoch": 855} {"train_loss": -37.79720687866211, "global_step": 103558, "epoch": 855} {"train_loss": -37.83042526245117, "global_step": 103559, "epoch": 855} {"train_loss": -36.62055206298828, "global_step": 103560, "epoch": 855} {"train_loss": -37.60634231567383, "global_step": 103561, "epoch": 855} {"train_loss": -37.27365493774414, "global_step": 103562, "epoch": 855} {"train_loss": -38.23196029663086, "global_step": 103563, "epoch": 855} {"train_loss": -38.15424728393555, "global_step": 103564, "epoch": 855} {"train_loss": -37.28537368774414, "global_step": 103565, "epoch": 855} {"train_loss": -36.141475677490234, "global_step": 103566, "epoch": 855} {"train_loss": -37.61262893676758, "global_step": 103567, "epoch": 855} {"train_loss": -38.05327224731445, "global_step": 103568, "epoch": 855} {"train_loss": -37.59419250488281, "global_step": 103569, "epoch": 855} {"train_loss": -37.52949905395508, "global_step": 103570, "epoch": 855} {"train_loss": -38.16244125366211, "global_step": 103571, "epoch": 855} {"train_loss": -37.795501708984375, "global_step": 103572, "epoch": 855} {"train_loss": -38.389984130859375, "global_step": 103573, "epoch": 855} {"train_loss": -37.621734619140625, "global_step": 103574, "epoch": 855} {"train_loss": -36.481668535342884, "global_step": 103575, "epoch": 855, "val_loss": 2797756.75} {"train_loss": -37.980220794677734, "global_step": 103576, "epoch": 856} {"train_loss": -36.40213394165039, "global_step": 103577, "epoch": 856} {"train_loss": -37.62556838989258, "global_step": 103578, "epoch": 856} {"train_loss": -34.70734786987305, "global_step": 103579, "epoch": 856} {"train_loss": -36.24041748046875, "global_step": 103580, "epoch": 856} {"train_loss": -37.84758377075195, "global_step": 103581, "epoch": 856} {"train_loss": -36.961212158203125, "global_step": 103582, "epoch": 856} {"train_loss": -38.45880126953125, "global_step": 103583, "epoch": 856} {"train_loss": -37.67621994018555, "global_step": 103584, "epoch": 856} {"train_loss": -38.160396575927734, "global_step": 103585, "epoch": 856} {"train_loss": -38.263580322265625, "global_step": 103586, "epoch": 856} {"train_loss": -37.75296401977539, "global_step": 103587, "epoch": 856} {"train_loss": -38.001155853271484, "global_step": 103588, "epoch": 856} {"train_loss": -37.80183792114258, "global_step": 103589, "epoch": 856} {"train_loss": -36.760414123535156, "global_step": 103590, "epoch": 856} {"train_loss": -37.480979919433594, "global_step": 103591, "epoch": 856} {"train_loss": -38.980316162109375, "global_step": 103592, "epoch": 856} {"train_loss": -38.32630920410156, "global_step": 103593, "epoch": 856} {"train_loss": -36.86454772949219, "global_step": 103594, "epoch": 856} {"train_loss": -35.761985778808594, "global_step": 103595, "epoch": 856} {"train_loss": -37.12257766723633, "global_step": 103596, "epoch": 856} {"train_loss": -34.06831741333008, "global_step": 103597, "epoch": 856} {"train_loss": -33.9044075012207, "global_step": 103598, "epoch": 856} {"train_loss": -33.55567169189453, "global_step": 103599, "epoch": 856} {"train_loss": -36.03916549682617, "global_step": 103600, "epoch": 856} {"train_loss": -38.089988708496094, "global_step": 103601, "epoch": 856} {"train_loss": -37.658687591552734, "global_step": 103602, "epoch": 856} {"train_loss": -36.84510803222656, "global_step": 103603, "epoch": 856} {"train_loss": -37.809730529785156, "global_step": 103604, "epoch": 856} {"train_loss": -32.16105270385742, "global_step": 103605, "epoch": 856} {"train_loss": -37.46993637084961, "global_step": 103606, "epoch": 856} {"train_loss": -36.73454666137695, "global_step": 103607, "epoch": 856} {"train_loss": -36.586830139160156, "global_step": 103608, "epoch": 856} {"train_loss": -37.69723129272461, "global_step": 103609, "epoch": 856} {"train_loss": -37.55989456176758, "global_step": 103610, "epoch": 856} {"train_loss": -36.362449645996094, "global_step": 103611, "epoch": 856} {"train_loss": -36.638450622558594, "global_step": 103612, "epoch": 856} {"train_loss": -37.33365249633789, "global_step": 103613, "epoch": 856} {"train_loss": -35.76185989379883, "global_step": 103614, "epoch": 856} {"train_loss": -35.97377014160156, "global_step": 103615, "epoch": 856} {"train_loss": -37.02116775512695, "global_step": 103616, "epoch": 856} {"train_loss": -34.54563522338867, "global_step": 103617, "epoch": 856} {"train_loss": -35.33906173706055, "global_step": 103618, "epoch": 856} {"train_loss": -36.838497161865234, "global_step": 103619, "epoch": 856} {"train_loss": -33.73643112182617, "global_step": 103620, "epoch": 856} {"train_loss": -35.93868637084961, "global_step": 103621, "epoch": 856} {"train_loss": -37.41392517089844, "global_step": 103622, "epoch": 856} {"train_loss": -35.52509689331055, "global_step": 103623, "epoch": 856} {"train_loss": -37.214561462402344, "global_step": 103624, "epoch": 856} {"train_loss": -35.9704704284668, "global_step": 103625, "epoch": 856} {"train_loss": -37.54693603515625, "global_step": 103626, "epoch": 856} {"train_loss": -36.55766677856445, "global_step": 103627, "epoch": 856} {"train_loss": -37.06621551513672, "global_step": 103628, "epoch": 856} {"train_loss": -37.769447326660156, "global_step": 103629, "epoch": 856} {"train_loss": -35.945125579833984, "global_step": 103630, "epoch": 856} {"train_loss": -38.25899887084961, "global_step": 103631, "epoch": 856} {"train_loss": -37.59870147705078, "global_step": 103632, "epoch": 856} {"train_loss": -37.05086898803711, "global_step": 103633, "epoch": 856} {"train_loss": -37.50972366333008, "global_step": 103634, "epoch": 856} {"train_loss": -37.12240219116211, "global_step": 103635, "epoch": 856} {"train_loss": -38.27138137817383, "global_step": 103636, "epoch": 856} {"train_loss": -37.00560760498047, "global_step": 103637, "epoch": 856} {"train_loss": -37.63912582397461, "global_step": 103638, "epoch": 856} {"train_loss": -37.17151641845703, "global_step": 103639, "epoch": 856} {"train_loss": -37.92815399169922, "global_step": 103640, "epoch": 856} {"train_loss": -36.961299896240234, "global_step": 103641, "epoch": 856} {"train_loss": -38.49379348754883, "global_step": 103642, "epoch": 856} {"train_loss": -38.04118347167969, "global_step": 103643, "epoch": 856} {"train_loss": -37.56596755981445, "global_step": 103644, "epoch": 856} {"train_loss": -38.00785446166992, "global_step": 103645, "epoch": 856} {"train_loss": -37.37836837768555, "global_step": 103646, "epoch": 856} {"train_loss": -38.67982864379883, "global_step": 103647, "epoch": 856} {"train_loss": -38.227970123291016, "global_step": 103648, "epoch": 856} {"train_loss": -35.86015701293945, "global_step": 103649, "epoch": 856} {"train_loss": -37.970191955566406, "global_step": 103650, "epoch": 856} {"train_loss": -37.78682327270508, "global_step": 103651, "epoch": 856} {"train_loss": -38.55450439453125, "global_step": 103652, "epoch": 856} {"train_loss": -37.93639373779297, "global_step": 103653, "epoch": 856} {"train_loss": -38.71916580200195, "global_step": 103654, "epoch": 856} {"train_loss": -35.078704833984375, "global_step": 103655, "epoch": 856} {"train_loss": -38.70662307739258, "global_step": 103656, "epoch": 856} {"train_loss": -37.886878967285156, "global_step": 103657, "epoch": 856} {"train_loss": -38.47224044799805, "global_step": 103658, "epoch": 856} {"train_loss": -38.16695785522461, "global_step": 103659, "epoch": 856} {"train_loss": -38.39253616333008, "global_step": 103660, "epoch": 856} {"train_loss": -37.953643798828125, "global_step": 103661, "epoch": 856} {"train_loss": -37.38570785522461, "global_step": 103662, "epoch": 856} {"train_loss": -38.14377975463867, "global_step": 103663, "epoch": 856} {"train_loss": -38.92348861694336, "global_step": 103664, "epoch": 856} {"train_loss": -38.17720031738281, "global_step": 103665, "epoch": 856} {"train_loss": -37.8619270324707, "global_step": 103666, "epoch": 856} {"train_loss": -37.07265853881836, "global_step": 103667, "epoch": 856} {"train_loss": -37.57390213012695, "global_step": 103668, "epoch": 856} {"train_loss": -35.896095275878906, "global_step": 103669, "epoch": 856} {"train_loss": -37.81928634643555, "global_step": 103670, "epoch": 856} {"train_loss": -37.655372619628906, "global_step": 103671, "epoch": 856} {"train_loss": -37.73686981201172, "global_step": 103672, "epoch": 856} {"train_loss": -37.6829948425293, "global_step": 103673, "epoch": 856} {"train_loss": -36.87525939941406, "global_step": 103674, "epoch": 856} {"train_loss": -35.57121658325195, "global_step": 103675, "epoch": 856} {"train_loss": -33.026092529296875, "global_step": 103676, "epoch": 856} {"train_loss": -35.229976654052734, "global_step": 103677, "epoch": 856} {"train_loss": -36.653045654296875, "global_step": 103678, "epoch": 856} {"train_loss": -37.16436767578125, "global_step": 103679, "epoch": 856} {"train_loss": -37.86444091796875, "global_step": 103680, "epoch": 856} {"train_loss": -36.37578201293945, "global_step": 103681, "epoch": 856} {"train_loss": -36.989044189453125, "global_step": 103682, "epoch": 856} {"train_loss": -37.80800247192383, "global_step": 103683, "epoch": 856} {"train_loss": -36.90365219116211, "global_step": 103684, "epoch": 856} {"train_loss": -37.61174774169922, "global_step": 103685, "epoch": 856} {"train_loss": -35.876766204833984, "global_step": 103686, "epoch": 856} {"train_loss": -37.22195816040039, "global_step": 103687, "epoch": 856} {"train_loss": -38.481597900390625, "global_step": 103688, "epoch": 856} {"train_loss": -38.39805603027344, "global_step": 103689, "epoch": 856} {"train_loss": -36.9728889465332, "global_step": 103690, "epoch": 856} {"train_loss": -37.76688766479492, "global_step": 103691, "epoch": 856} {"train_loss": -37.84579086303711, "global_step": 103692, "epoch": 856} {"train_loss": -35.8281364440918, "global_step": 103693, "epoch": 856} {"train_loss": -38.14237594604492, "global_step": 103694, "epoch": 856} {"train_loss": -35.90018844604492, "global_step": 103695, "epoch": 856} {"train_loss": -37.090865521391564, "global_step": 103696, "epoch": 856, "val_loss": 2838348.0} {"train_loss": -37.622894287109375, "global_step": 103697, "epoch": 857} {"train_loss": -37.112361907958984, "global_step": 103698, "epoch": 857} {"train_loss": -36.7811164855957, "global_step": 103699, "epoch": 857} {"train_loss": -38.37119674682617, "global_step": 103700, "epoch": 857} {"train_loss": -38.10185241699219, "global_step": 103701, "epoch": 857} {"train_loss": -37.96736145019531, "global_step": 103702, "epoch": 857} {"train_loss": -38.01957321166992, "global_step": 103703, "epoch": 857} {"train_loss": -38.36606979370117, "global_step": 103704, "epoch": 857} {"train_loss": -35.02592849731445, "global_step": 103705, "epoch": 857} {"train_loss": -37.61330795288086, "global_step": 103706, "epoch": 857} {"train_loss": -38.23550033569336, "global_step": 103707, "epoch": 857} {"train_loss": -37.331356048583984, "global_step": 103708, "epoch": 857} {"train_loss": -38.021297454833984, "global_step": 103709, "epoch": 857} {"train_loss": -36.64036178588867, "global_step": 103710, "epoch": 857} {"train_loss": -36.52376174926758, "global_step": 103711, "epoch": 857} {"train_loss": -37.32573699951172, "global_step": 103712, "epoch": 857} {"train_loss": -37.2773323059082, "global_step": 103713, "epoch": 857} {"train_loss": -37.487770080566406, "global_step": 103714, "epoch": 857} {"train_loss": -37.71892166137695, "global_step": 103715, "epoch": 857} {"train_loss": -37.95158767700195, "global_step": 103716, "epoch": 857} {"train_loss": -36.83949661254883, "global_step": 103717, "epoch": 857} {"train_loss": -37.66133499145508, "global_step": 103718, "epoch": 857} {"train_loss": -38.71518325805664, "global_step": 103719, "epoch": 857} {"train_loss": -38.43878936767578, "global_step": 103720, "epoch": 857} {"train_loss": -38.55472946166992, "global_step": 103721, "epoch": 857} {"train_loss": -36.51995849609375, "global_step": 103722, "epoch": 857} {"train_loss": -36.67905807495117, "global_step": 103723, "epoch": 857} {"train_loss": -37.81889343261719, "global_step": 103724, "epoch": 857} {"train_loss": -38.4874267578125, "global_step": 103725, "epoch": 857} {"train_loss": -38.56638717651367, "global_step": 103726, "epoch": 857} {"train_loss": -38.508018493652344, "global_step": 103727, "epoch": 857} {"train_loss": -37.867401123046875, "global_step": 103728, "epoch": 857} {"train_loss": -38.046566009521484, "global_step": 103729, "epoch": 857} {"train_loss": -37.5687370300293, "global_step": 103730, "epoch": 857} {"train_loss": -37.23952865600586, "global_step": 103731, "epoch": 857} {"train_loss": -35.343135833740234, "global_step": 103732, "epoch": 857} {"train_loss": -37.50303268432617, "global_step": 103733, "epoch": 857} {"train_loss": -38.324886322021484, "global_step": 103734, "epoch": 857} {"train_loss": -34.70345687866211, "global_step": 103735, "epoch": 857} {"train_loss": -32.82017135620117, "global_step": 103736, "epoch": 857} {"train_loss": -33.817176818847656, "global_step": 103737, "epoch": 857} {"train_loss": -38.13698959350586, "global_step": 103738, "epoch": 857} {"train_loss": -34.76384353637695, "global_step": 103739, "epoch": 857} {"train_loss": -33.8663215637207, "global_step": 103740, "epoch": 857} {"train_loss": -36.43124008178711, "global_step": 103741, "epoch": 857} {"train_loss": -37.61997604370117, "global_step": 103742, "epoch": 857} {"train_loss": -35.903926849365234, "global_step": 103743, "epoch": 857} {"train_loss": -37.75580596923828, "global_step": 103744, "epoch": 857} {"train_loss": -36.78020095825195, "global_step": 103745, "epoch": 857} {"train_loss": -37.25712203979492, "global_step": 103746, "epoch": 857} {"train_loss": -37.86501693725586, "global_step": 103747, "epoch": 857} {"train_loss": -35.91156005859375, "global_step": 103748, "epoch": 857} {"train_loss": -38.4890251159668, "global_step": 103749, "epoch": 857} {"train_loss": -37.729278564453125, "global_step": 103750, "epoch": 857} {"train_loss": -38.510372161865234, "global_step": 103751, "epoch": 857} {"train_loss": -37.12677764892578, "global_step": 103752, "epoch": 857} {"train_loss": -38.00616455078125, "global_step": 103753, "epoch": 857} {"train_loss": -38.03495788574219, "global_step": 103754, "epoch": 857} {"train_loss": -37.9957389831543, "global_step": 103755, "epoch": 857} {"train_loss": -38.089813232421875, "global_step": 103756, "epoch": 857} {"train_loss": -37.76882553100586, "global_step": 103757, "epoch": 857} {"train_loss": -38.3115234375, "global_step": 103758, "epoch": 857} {"train_loss": -38.232845306396484, "global_step": 103759, "epoch": 857} {"train_loss": -39.125667572021484, "global_step": 103760, "epoch": 857} {"train_loss": -38.1210823059082, "global_step": 103761, "epoch": 857} {"train_loss": -38.097511291503906, "global_step": 103762, "epoch": 857} {"train_loss": -38.562198638916016, "global_step": 103763, "epoch": 857} {"train_loss": -37.7033576965332, "global_step": 103764, "epoch": 857} {"train_loss": -38.87764358520508, "global_step": 103765, "epoch": 857} {"train_loss": -38.545372009277344, "global_step": 103766, "epoch": 857} {"train_loss": -37.342185974121094, "global_step": 103767, "epoch": 857} {"train_loss": -38.99137496948242, "global_step": 103768, "epoch": 857} {"train_loss": -38.293724060058594, "global_step": 103769, "epoch": 857} {"train_loss": -38.695980072021484, "global_step": 103770, "epoch": 857} {"train_loss": -39.06361389160156, "global_step": 103771, "epoch": 857} {"train_loss": -38.727108001708984, "global_step": 103772, "epoch": 857} {"train_loss": -38.7517204284668, "global_step": 103773, "epoch": 857} {"train_loss": -36.634605407714844, "global_step": 103774, "epoch": 857} {"train_loss": -38.793209075927734, "global_step": 103775, "epoch": 857} {"train_loss": -38.563594818115234, "global_step": 103776, "epoch": 857} {"train_loss": -38.84591293334961, "global_step": 103777, "epoch": 857} {"train_loss": -36.55367660522461, "global_step": 103778, "epoch": 857} {"train_loss": -38.4734001159668, "global_step": 103779, "epoch": 857} {"train_loss": -38.84122848510742, "global_step": 103780, "epoch": 857} {"train_loss": -38.45730209350586, "global_step": 103781, "epoch": 857} {"train_loss": -38.07866287231445, "global_step": 103782, "epoch": 857} {"train_loss": -39.25461959838867, "global_step": 103783, "epoch": 857} {"train_loss": -38.33430099487305, "global_step": 103784, "epoch": 857} {"train_loss": -38.419429779052734, "global_step": 103785, "epoch": 857} {"train_loss": -38.03682327270508, "global_step": 103786, "epoch": 857} {"train_loss": -37.68572235107422, "global_step": 103787, "epoch": 857} {"train_loss": -38.12748336791992, "global_step": 103788, "epoch": 857} {"train_loss": -37.1236572265625, "global_step": 103789, "epoch": 857} {"train_loss": -36.226844787597656, "global_step": 103790, "epoch": 857} {"train_loss": -36.322689056396484, "global_step": 103791, "epoch": 857} {"train_loss": -37.03797912597656, "global_step": 103792, "epoch": 857} {"train_loss": -37.730220794677734, "global_step": 103793, "epoch": 857} {"train_loss": -39.00043487548828, "global_step": 103794, "epoch": 857} {"train_loss": -37.40473175048828, "global_step": 103795, "epoch": 857} {"train_loss": -34.547367095947266, "global_step": 103796, "epoch": 857} {"train_loss": -36.47469711303711, "global_step": 103797, "epoch": 857} {"train_loss": -38.99159622192383, "global_step": 103798, "epoch": 857} {"train_loss": -37.171810150146484, "global_step": 103799, "epoch": 857} {"train_loss": -36.88715744018555, "global_step": 103800, "epoch": 857} {"train_loss": -39.01225662231445, "global_step": 103801, "epoch": 857} {"train_loss": -37.35681915283203, "global_step": 103802, "epoch": 857} {"train_loss": -37.48960494995117, "global_step": 103803, "epoch": 857} {"train_loss": -38.61787033081055, "global_step": 103804, "epoch": 857} {"train_loss": -37.05259704589844, "global_step": 103805, "epoch": 857} {"train_loss": -38.88607406616211, "global_step": 103806, "epoch": 857} {"train_loss": -37.8439826965332, "global_step": 103807, "epoch": 857} {"train_loss": -38.4473762512207, "global_step": 103808, "epoch": 857} {"train_loss": -38.21574020385742, "global_step": 103809, "epoch": 857} {"train_loss": -38.4146614074707, "global_step": 103810, "epoch": 857} {"train_loss": -38.95986557006836, "global_step": 103811, "epoch": 857} {"train_loss": -38.5933952331543, "global_step": 103812, "epoch": 857} {"train_loss": -38.21329879760742, "global_step": 103813, "epoch": 857} {"train_loss": -39.341060638427734, "global_step": 103814, "epoch": 857} {"train_loss": -38.760929107666016, "global_step": 103815, "epoch": 857} {"train_loss": -38.866329193115234, "global_step": 103816, "epoch": 857} {"train_loss": -37.686789552042306, "global_step": 103817, "epoch": 857, "val_loss": 2781701.25} {"train_loss": -39.11690902709961, "global_step": 103818, "epoch": 858} {"train_loss": -38.63776779174805, "global_step": 103819, "epoch": 858} {"train_loss": -38.9176025390625, "global_step": 103820, "epoch": 858} {"train_loss": -38.54087448120117, "global_step": 103821, "epoch": 858} {"train_loss": -36.60282516479492, "global_step": 103822, "epoch": 858} {"train_loss": -37.57023239135742, "global_step": 103823, "epoch": 858} {"train_loss": -38.54413986206055, "global_step": 103824, "epoch": 858} {"train_loss": -39.02395248413086, "global_step": 103825, "epoch": 858} {"train_loss": -38.445716857910156, "global_step": 103826, "epoch": 858} {"train_loss": -37.9942741394043, "global_step": 103827, "epoch": 858} {"train_loss": -37.93603515625, "global_step": 103828, "epoch": 858} {"train_loss": -38.87293243408203, "global_step": 103829, "epoch": 858} {"train_loss": -38.861026763916016, "global_step": 103830, "epoch": 858} {"train_loss": -38.630226135253906, "global_step": 103831, "epoch": 858} {"train_loss": -39.19289779663086, "global_step": 103832, "epoch": 858} {"train_loss": -38.25577926635742, "global_step": 103833, "epoch": 858} {"train_loss": -38.56156539916992, "global_step": 103834, "epoch": 858} {"train_loss": -38.49155807495117, "global_step": 103835, "epoch": 858} {"train_loss": -37.228668212890625, "global_step": 103836, "epoch": 858} {"train_loss": -36.964263916015625, "global_step": 103837, "epoch": 858} {"train_loss": -36.14493179321289, "global_step": 103838, "epoch": 858} {"train_loss": -38.579566955566406, "global_step": 103839, "epoch": 858} {"train_loss": -38.148258209228516, "global_step": 103840, "epoch": 858} {"train_loss": -37.2659912109375, "global_step": 103841, "epoch": 858} {"train_loss": -37.684906005859375, "global_step": 103842, "epoch": 858} {"train_loss": -37.809993743896484, "global_step": 103843, "epoch": 858} {"train_loss": -36.618038177490234, "global_step": 103844, "epoch": 858} {"train_loss": -37.53706359863281, "global_step": 103845, "epoch": 858} {"train_loss": -36.43265914916992, "global_step": 103846, "epoch": 858} {"train_loss": -36.55790710449219, "global_step": 103847, "epoch": 858} {"train_loss": -37.55361557006836, "global_step": 103848, "epoch": 858} {"train_loss": -36.830970764160156, "global_step": 103849, "epoch": 858} {"train_loss": -38.035945892333984, "global_step": 103850, "epoch": 858} {"train_loss": -37.31439971923828, "global_step": 103851, "epoch": 858} {"train_loss": -38.711761474609375, "global_step": 103852, "epoch": 858} {"train_loss": -38.73871612548828, "global_step": 103853, "epoch": 858} {"train_loss": -38.815494537353516, "global_step": 103854, "epoch": 858} {"train_loss": -37.970863342285156, "global_step": 103855, "epoch": 858} {"train_loss": -36.76816940307617, "global_step": 103856, "epoch": 858} {"train_loss": -38.85999298095703, "global_step": 103857, "epoch": 858} {"train_loss": -37.5704345703125, "global_step": 103858, "epoch": 858} {"train_loss": -38.86188507080078, "global_step": 103859, "epoch": 858} {"train_loss": -37.83851623535156, "global_step": 103860, "epoch": 858} {"train_loss": -38.190547943115234, "global_step": 103861, "epoch": 858} {"train_loss": -37.45624923706055, "global_step": 103862, "epoch": 858} {"train_loss": -38.231014251708984, "global_step": 103863, "epoch": 858} {"train_loss": -38.027130126953125, "global_step": 103864, "epoch": 858} {"train_loss": -38.82277297973633, "global_step": 103865, "epoch": 858} {"train_loss": -38.34394454956055, "global_step": 103866, "epoch": 858} {"train_loss": -38.6422004699707, "global_step": 103867, "epoch": 858} {"train_loss": -38.914695739746094, "global_step": 103868, "epoch": 858} {"train_loss": -38.5346565246582, "global_step": 103869, "epoch": 858} {"train_loss": -38.80939865112305, "global_step": 103870, "epoch": 858} {"train_loss": -38.04921340942383, "global_step": 103871, "epoch": 858} {"train_loss": -38.84195327758789, "global_step": 103872, "epoch": 858} {"train_loss": -38.66813659667969, "global_step": 103873, "epoch": 858} {"train_loss": -38.70261764526367, "global_step": 103874, "epoch": 858} {"train_loss": -38.95066452026367, "global_step": 103875, "epoch": 858} {"train_loss": -37.914634704589844, "global_step": 103876, "epoch": 858} {"train_loss": -32.640350341796875, "global_step": 103877, "epoch": 858} {"train_loss": -37.69921875, "global_step": 103878, "epoch": 858} {"train_loss": -38.961307525634766, "global_step": 103879, "epoch": 858} {"train_loss": -38.491966247558594, "global_step": 103880, "epoch": 858} {"train_loss": -37.99036407470703, "global_step": 103881, "epoch": 858} {"train_loss": -38.955596923828125, "global_step": 103882, "epoch": 858} {"train_loss": -38.822509765625, "global_step": 103883, "epoch": 858} {"train_loss": -38.807350158691406, "global_step": 103884, "epoch": 858} {"train_loss": -37.675350189208984, "global_step": 103885, "epoch": 858} {"train_loss": -38.85132598876953, "global_step": 103886, "epoch": 858} {"train_loss": -39.34434127807617, "global_step": 103887, "epoch": 858} {"train_loss": -36.143585205078125, "global_step": 103888, "epoch": 858} {"train_loss": -37.732112884521484, "global_step": 103889, "epoch": 858} {"train_loss": -38.33179473876953, "global_step": 103890, "epoch": 858} {"train_loss": -38.868202209472656, "global_step": 103891, "epoch": 858} {"train_loss": -36.1966667175293, "global_step": 103892, "epoch": 858} {"train_loss": -37.01961898803711, "global_step": 103893, "epoch": 858} {"train_loss": -37.333248138427734, "global_step": 103894, "epoch": 858} {"train_loss": -37.414852142333984, "global_step": 103895, "epoch": 858} {"train_loss": -37.41696548461914, "global_step": 103896, "epoch": 858} {"train_loss": -37.98892593383789, "global_step": 103897, "epoch": 858} {"train_loss": -38.84812927246094, "global_step": 103898, "epoch": 858} {"train_loss": -37.14336395263672, "global_step": 103899, "epoch": 858} {"train_loss": -34.713321685791016, "global_step": 103900, "epoch": 858} {"train_loss": -35.68070983886719, "global_step": 103901, "epoch": 858} {"train_loss": -37.64537048339844, "global_step": 103902, "epoch": 858} {"train_loss": -38.291717529296875, "global_step": 103903, "epoch": 858} {"train_loss": -34.184452056884766, "global_step": 103904, "epoch": 858} {"train_loss": -36.68741226196289, "global_step": 103905, "epoch": 858} {"train_loss": -35.1330451965332, "global_step": 103906, "epoch": 858} {"train_loss": -33.918670654296875, "global_step": 103907, "epoch": 858} {"train_loss": -34.89992904663086, "global_step": 103908, "epoch": 858} {"train_loss": -36.004119873046875, "global_step": 103909, "epoch": 858} {"train_loss": -35.745365142822266, "global_step": 103910, "epoch": 858} {"train_loss": -35.101375579833984, "global_step": 103911, "epoch": 858} {"train_loss": -34.12604522705078, "global_step": 103912, "epoch": 858} {"train_loss": -33.59910583496094, "global_step": 103913, "epoch": 858} {"train_loss": -38.27809524536133, "global_step": 103914, "epoch": 858} {"train_loss": -36.3676643371582, "global_step": 103915, "epoch": 858} {"train_loss": -36.9515495300293, "global_step": 103916, "epoch": 858} {"train_loss": -37.31332015991211, "global_step": 103917, "epoch": 858} {"train_loss": -36.658958435058594, "global_step": 103918, "epoch": 858} {"train_loss": -37.20376968383789, "global_step": 103919, "epoch": 858} {"train_loss": -33.99257278442383, "global_step": 103920, "epoch": 858} {"train_loss": -35.80337142944336, "global_step": 103921, "epoch": 858} {"train_loss": -36.77213668823242, "global_step": 103922, "epoch": 858} {"train_loss": -36.409847259521484, "global_step": 103923, "epoch": 858} {"train_loss": -37.23005294799805, "global_step": 103924, "epoch": 858} {"train_loss": -36.76735305786133, "global_step": 103925, "epoch": 858} {"train_loss": -34.51108169555664, "global_step": 103926, "epoch": 858} {"train_loss": -37.1273078918457, "global_step": 103927, "epoch": 858} {"train_loss": -36.835872650146484, "global_step": 103928, "epoch": 858} {"train_loss": -37.38869094848633, "global_step": 103929, "epoch": 858} {"train_loss": -37.55074691772461, "global_step": 103930, "epoch": 858} {"train_loss": -33.89287185668945, "global_step": 103931, "epoch": 858} {"train_loss": -37.15554428100586, "global_step": 103932, "epoch": 858} {"train_loss": -35.322628021240234, "global_step": 103933, "epoch": 858} {"train_loss": -36.650447845458984, "global_step": 103934, "epoch": 858} {"train_loss": -37.06028366088867, "global_step": 103935, "epoch": 858} {"train_loss": -37.36387252807617, "global_step": 103936, "epoch": 858} {"train_loss": -37.30215072631836, "global_step": 103937, "epoch": 858} {"train_loss": -37.41884729684877, "global_step": 103938, "epoch": 858, "val_loss": 2793635.75} {"train_loss": -37.44761657714844, "global_step": 103939, "epoch": 859} {"train_loss": -36.43608474731445, "global_step": 103940, "epoch": 859} {"train_loss": -37.373146057128906, "global_step": 103941, "epoch": 859} {"train_loss": -36.41501998901367, "global_step": 103942, "epoch": 859} {"train_loss": -37.264129638671875, "global_step": 103943, "epoch": 859} {"train_loss": -37.123653411865234, "global_step": 103944, "epoch": 859} {"train_loss": -36.40171813964844, "global_step": 103945, "epoch": 859} {"train_loss": -37.6202507019043, "global_step": 103946, "epoch": 859} {"train_loss": -37.34541320800781, "global_step": 103947, "epoch": 859} {"train_loss": -37.435787200927734, "global_step": 103948, "epoch": 859} {"train_loss": -37.80562973022461, "global_step": 103949, "epoch": 859} {"train_loss": -36.91753005981445, "global_step": 103950, "epoch": 859} {"train_loss": -37.50715637207031, "global_step": 103951, "epoch": 859} {"train_loss": -37.38385772705078, "global_step": 103952, "epoch": 859} {"train_loss": -37.09234619140625, "global_step": 103953, "epoch": 859} {"train_loss": -37.53986740112305, "global_step": 103954, "epoch": 859} {"train_loss": -37.779296875, "global_step": 103955, "epoch": 859} {"train_loss": -37.42704391479492, "global_step": 103956, "epoch": 859} {"train_loss": -37.50312042236328, "global_step": 103957, "epoch": 859} {"train_loss": -37.958702087402344, "global_step": 103958, "epoch": 859} {"train_loss": -36.63063430786133, "global_step": 103959, "epoch": 859} {"train_loss": -36.361331939697266, "global_step": 103960, "epoch": 859} {"train_loss": -37.15374755859375, "global_step": 103961, "epoch": 859} {"train_loss": -36.718318939208984, "global_step": 103962, "epoch": 859} {"train_loss": -36.31252670288086, "global_step": 103963, "epoch": 859} {"train_loss": -36.27360534667969, "global_step": 103964, "epoch": 859} {"train_loss": -38.33710861206055, "global_step": 103965, "epoch": 859} {"train_loss": -36.084041595458984, "global_step": 103966, "epoch": 859} {"train_loss": -35.60466766357422, "global_step": 103967, "epoch": 859} {"train_loss": -36.06303024291992, "global_step": 103968, "epoch": 859} {"train_loss": -37.7274055480957, "global_step": 103969, "epoch": 859} {"train_loss": -37.729549407958984, "global_step": 103970, "epoch": 859} {"train_loss": -37.789154052734375, "global_step": 103971, "epoch": 859} {"train_loss": -38.11362838745117, "global_step": 103972, "epoch": 859} {"train_loss": -37.163631439208984, "global_step": 103973, "epoch": 859} {"train_loss": -37.05317306518555, "global_step": 103974, "epoch": 859} {"train_loss": -38.180084228515625, "global_step": 103975, "epoch": 859} {"train_loss": -37.57599639892578, "global_step": 103976, "epoch": 859} {"train_loss": -36.95574951171875, "global_step": 103977, "epoch": 859} {"train_loss": -37.79764938354492, "global_step": 103978, "epoch": 859} {"train_loss": -37.99969482421875, "global_step": 103979, "epoch": 859} {"train_loss": -38.263397216796875, "global_step": 103980, "epoch": 859} {"train_loss": -38.474578857421875, "global_step": 103981, "epoch": 859} {"train_loss": -38.414485931396484, "global_step": 103982, "epoch": 859} {"train_loss": -38.31682205200195, "global_step": 103983, "epoch": 859} {"train_loss": -38.205379486083984, "global_step": 103984, "epoch": 859} {"train_loss": -38.3377685546875, "global_step": 103985, "epoch": 859} {"train_loss": -38.36126708984375, "global_step": 103986, "epoch": 859} {"train_loss": -38.53646469116211, "global_step": 103987, "epoch": 859} {"train_loss": -38.37007522583008, "global_step": 103988, "epoch": 859} {"train_loss": -38.87793731689453, "global_step": 103989, "epoch": 859} {"train_loss": -38.79520797729492, "global_step": 103990, "epoch": 859} {"train_loss": -38.38131332397461, "global_step": 103991, "epoch": 859} {"train_loss": -38.55963897705078, "global_step": 103992, "epoch": 859} {"train_loss": -38.65656661987305, "global_step": 103993, "epoch": 859} {"train_loss": -38.54287338256836, "global_step": 103994, "epoch": 859} {"train_loss": -38.215476989746094, "global_step": 103995, "epoch": 859} {"train_loss": -38.7503547668457, "global_step": 103996, "epoch": 859} {"train_loss": -38.9454460144043, "global_step": 103997, "epoch": 859} {"train_loss": -38.39704513549805, "global_step": 103998, "epoch": 859} {"train_loss": -38.90447235107422, "global_step": 103999, "epoch": 859} {"train_loss": -38.42356491088867, "global_step": 104000, "epoch": 859} {"train_loss": -38.023677825927734, "global_step": 104001, "epoch": 859} {"train_loss": -38.99656295776367, "global_step": 104002, "epoch": 859} {"train_loss": -38.8928108215332, "global_step": 104003, "epoch": 859} {"train_loss": -39.232730865478516, "global_step": 104004, "epoch": 859} {"train_loss": -38.536502838134766, "global_step": 104005, "epoch": 859} {"train_loss": -37.77157974243164, "global_step": 104006, "epoch": 859} {"train_loss": -37.0266227722168, "global_step": 104007, "epoch": 859} {"train_loss": -35.13916015625, "global_step": 104008, "epoch": 859} {"train_loss": -31.110992431640625, "global_step": 104009, "epoch": 859} {"train_loss": -23.2296142578125, "global_step": 104010, "epoch": 859} {"train_loss": -22.074216842651367, "global_step": 104011, "epoch": 859} {"train_loss": -32.78690719604492, "global_step": 104012, "epoch": 859} {"train_loss": -32.58876419067383, "global_step": 104013, "epoch": 859} {"train_loss": -25.954559326171875, "global_step": 104014, "epoch": 859} {"train_loss": -34.67597579956055, "global_step": 104015, "epoch": 859} {"train_loss": -31.865808486938477, "global_step": 104016, "epoch": 859} {"train_loss": -34.910736083984375, "global_step": 104017, "epoch": 859} {"train_loss": -30.890750885009766, "global_step": 104018, "epoch": 859} {"train_loss": -35.816871643066406, "global_step": 104019, "epoch": 859} {"train_loss": -34.85622787475586, "global_step": 104020, "epoch": 859} {"train_loss": -34.881385803222656, "global_step": 104021, "epoch": 859} {"train_loss": -33.5346794128418, "global_step": 104022, "epoch": 859} {"train_loss": -35.172969818115234, "global_step": 104023, "epoch": 859} {"train_loss": -35.72573471069336, "global_step": 104024, "epoch": 859} {"train_loss": -35.21623992919922, "global_step": 104025, "epoch": 859} {"train_loss": -36.83572006225586, "global_step": 104026, "epoch": 859} {"train_loss": -35.35274124145508, "global_step": 104027, "epoch": 859} {"train_loss": -37.31759262084961, "global_step": 104028, "epoch": 859} {"train_loss": -36.394100189208984, "global_step": 104029, "epoch": 859} {"train_loss": -36.903018951416016, "global_step": 104030, "epoch": 859} {"train_loss": -36.94277572631836, "global_step": 104031, "epoch": 859} {"train_loss": -36.87298583984375, "global_step": 104032, "epoch": 859} {"train_loss": -36.907020568847656, "global_step": 104033, "epoch": 859} {"train_loss": -37.20437240600586, "global_step": 104034, "epoch": 859} {"train_loss": -37.38823699951172, "global_step": 104035, "epoch": 859} {"train_loss": -37.10626983642578, "global_step": 104036, "epoch": 859} {"train_loss": -36.81173324584961, "global_step": 104037, "epoch": 859} {"train_loss": -37.437835693359375, "global_step": 104038, "epoch": 859} {"train_loss": -37.245704650878906, "global_step": 104039, "epoch": 859} {"train_loss": -37.84821701049805, "global_step": 104040, "epoch": 859} {"train_loss": -37.84640121459961, "global_step": 104041, "epoch": 859} {"train_loss": -37.873104095458984, "global_step": 104042, "epoch": 859} {"train_loss": -37.512020111083984, "global_step": 104043, "epoch": 859} {"train_loss": -38.03753662109375, "global_step": 104044, "epoch": 859} {"train_loss": -38.3153190612793, "global_step": 104045, "epoch": 859} {"train_loss": -38.058563232421875, "global_step": 104046, "epoch": 859} {"train_loss": -38.102596282958984, "global_step": 104047, "epoch": 859} {"train_loss": -38.43887710571289, "global_step": 104048, "epoch": 859} {"train_loss": -38.72793197631836, "global_step": 104049, "epoch": 859} {"train_loss": -38.23175811767578, "global_step": 104050, "epoch": 859} {"train_loss": -38.543212890625, "global_step": 104051, "epoch": 859} {"train_loss": -38.69990921020508, "global_step": 104052, "epoch": 859} {"train_loss": -38.726558685302734, "global_step": 104053, "epoch": 859} {"train_loss": -38.87262725830078, "global_step": 104054, "epoch": 859} {"train_loss": -38.62568283081055, "global_step": 104055, "epoch": 859} {"train_loss": -38.31499099731445, "global_step": 104056, "epoch": 859} {"train_loss": -36.945064544677734, "global_step": 104057, "epoch": 859} {"train_loss": -38.87442398071289, "global_step": 104058, "epoch": 859} {"train_loss": -36.89842479485126, "global_step": 104059, "epoch": 859, "val_loss": 2794608.25} {"train_loss": -38.707435607910156, "global_step": 104060, "epoch": 860} {"train_loss": -38.77583694458008, "global_step": 104061, "epoch": 860} {"train_loss": -38.69036865234375, "global_step": 104062, "epoch": 860} {"train_loss": -39.11733627319336, "global_step": 104063, "epoch": 860} {"train_loss": -38.11197280883789, "global_step": 104064, "epoch": 860} {"train_loss": -39.02949142456055, "global_step": 104065, "epoch": 860} {"train_loss": -38.5247917175293, "global_step": 104066, "epoch": 860} {"train_loss": -39.093421936035156, "global_step": 104067, "epoch": 860} {"train_loss": -38.4512825012207, "global_step": 104068, "epoch": 860} {"train_loss": -38.996498107910156, "global_step": 104069, "epoch": 860} {"train_loss": -38.97182846069336, "global_step": 104070, "epoch": 860} {"train_loss": -39.159400939941406, "global_step": 104071, "epoch": 860} {"train_loss": -38.763423919677734, "global_step": 104072, "epoch": 860} {"train_loss": -38.2248649597168, "global_step": 104073, "epoch": 860} {"train_loss": -38.44112777709961, "global_step": 104074, "epoch": 860} {"train_loss": -38.947357177734375, "global_step": 104075, "epoch": 860} {"train_loss": -38.89884567260742, "global_step": 104076, "epoch": 860} {"train_loss": -37.63676452636719, "global_step": 104077, "epoch": 860} {"train_loss": -39.18115997314453, "global_step": 104078, "epoch": 860} {"train_loss": -39.32363510131836, "global_step": 104079, "epoch": 860} {"train_loss": -39.153499603271484, "global_step": 104080, "epoch": 860} {"train_loss": -39.462554931640625, "global_step": 104081, "epoch": 860} {"train_loss": -38.63768005371094, "global_step": 104082, "epoch": 860} {"train_loss": -36.79986572265625, "global_step": 104083, "epoch": 860} {"train_loss": -39.269893646240234, "global_step": 104084, "epoch": 860} {"train_loss": -39.49409103393555, "global_step": 104085, "epoch": 860} {"train_loss": -38.80052947998047, "global_step": 104086, "epoch": 860} {"train_loss": -38.585304260253906, "global_step": 104087, "epoch": 860} {"train_loss": -38.683990478515625, "global_step": 104088, "epoch": 860} {"train_loss": -38.102752685546875, "global_step": 104089, "epoch": 860} {"train_loss": -38.19192123413086, "global_step": 104090, "epoch": 860} {"train_loss": -39.15425491333008, "global_step": 104091, "epoch": 860} {"train_loss": -38.84232711791992, "global_step": 104092, "epoch": 860} {"train_loss": -38.701324462890625, "global_step": 104093, "epoch": 860} {"train_loss": -38.34884262084961, "global_step": 104094, "epoch": 860} {"train_loss": -39.084075927734375, "global_step": 104095, "epoch": 860} {"train_loss": -38.75582504272461, "global_step": 104096, "epoch": 860} {"train_loss": -38.2084846496582, "global_step": 104097, "epoch": 860} {"train_loss": -38.78527069091797, "global_step": 104098, "epoch": 860} {"train_loss": -38.29990768432617, "global_step": 104099, "epoch": 860} {"train_loss": -39.133968353271484, "global_step": 104100, "epoch": 860} {"train_loss": -37.993778228759766, "global_step": 104101, "epoch": 860} {"train_loss": -38.27539825439453, "global_step": 104102, "epoch": 860} {"train_loss": -38.070526123046875, "global_step": 104103, "epoch": 860} {"train_loss": -36.5619010925293, "global_step": 104104, "epoch": 860} {"train_loss": -35.194969177246094, "global_step": 104105, "epoch": 860} {"train_loss": -26.955780029296875, "global_step": 104106, "epoch": 860} {"train_loss": -12.274104118347168, "global_step": 104107, "epoch": 860} {"train_loss": -14.804361343383789, "global_step": 104108, "epoch": 860} {"train_loss": -36.497161865234375, "global_step": 104109, "epoch": 860} {"train_loss": -29.484130859375, "global_step": 104110, "epoch": 860} {"train_loss": -31.604877471923828, "global_step": 104111, "epoch": 860} {"train_loss": -37.53272247314453, "global_step": 104112, "epoch": 860} {"train_loss": -31.22504234313965, "global_step": 104113, "epoch": 860} {"train_loss": -37.725318908691406, "global_step": 104114, "epoch": 860} {"train_loss": -32.01247787475586, "global_step": 104115, "epoch": 860} {"train_loss": -37.68077087402344, "global_step": 104116, "epoch": 860} {"train_loss": -35.43610382080078, "global_step": 104117, "epoch": 860} {"train_loss": -37.134368896484375, "global_step": 104118, "epoch": 860} {"train_loss": -37.40652084350586, "global_step": 104119, "epoch": 860} {"train_loss": -35.11430740356445, "global_step": 104120, "epoch": 860} {"train_loss": -37.557899475097656, "global_step": 104121, "epoch": 860} {"train_loss": -36.703121185302734, "global_step": 104122, "epoch": 860} {"train_loss": -36.238338470458984, "global_step": 104123, "epoch": 860} {"train_loss": -37.33889389038086, "global_step": 104124, "epoch": 860} {"train_loss": -37.08254623413086, "global_step": 104125, "epoch": 860} {"train_loss": -36.935333251953125, "global_step": 104126, "epoch": 860} {"train_loss": -37.7552490234375, "global_step": 104127, "epoch": 860} {"train_loss": -37.28154373168945, "global_step": 104128, "epoch": 860} {"train_loss": -37.285003662109375, "global_step": 104129, "epoch": 860} {"train_loss": -38.50228500366211, "global_step": 104130, "epoch": 860} {"train_loss": -38.09115219116211, "global_step": 104131, "epoch": 860} {"train_loss": -37.93603515625, "global_step": 104132, "epoch": 860} {"train_loss": -38.21272659301758, "global_step": 104133, "epoch": 860} {"train_loss": -38.25284957885742, "global_step": 104134, "epoch": 860} {"train_loss": -38.17172622680664, "global_step": 104135, "epoch": 860} {"train_loss": -37.84383773803711, "global_step": 104136, "epoch": 860} {"train_loss": -38.33278274536133, "global_step": 104137, "epoch": 860} {"train_loss": -37.416709899902344, "global_step": 104138, "epoch": 860} {"train_loss": -37.984405517578125, "global_step": 104139, "epoch": 860} {"train_loss": -38.02362823486328, "global_step": 104140, "epoch": 860} {"train_loss": -37.816070556640625, "global_step": 104141, "epoch": 860} {"train_loss": -38.08501052856445, "global_step": 104142, "epoch": 860} {"train_loss": -38.08649444580078, "global_step": 104143, "epoch": 860} {"train_loss": -38.18891143798828, "global_step": 104144, "epoch": 860} {"train_loss": -38.58975601196289, "global_step": 104145, "epoch": 860} {"train_loss": -38.25185012817383, "global_step": 104146, "epoch": 860} {"train_loss": -38.58579635620117, "global_step": 104147, "epoch": 860} {"train_loss": -38.750640869140625, "global_step": 104148, "epoch": 860} {"train_loss": -38.559539794921875, "global_step": 104149, "epoch": 860} {"train_loss": -38.31471633911133, "global_step": 104150, "epoch": 860} {"train_loss": -38.634700775146484, "global_step": 104151, "epoch": 860} {"train_loss": -37.970088958740234, "global_step": 104152, "epoch": 860} {"train_loss": -38.43754196166992, "global_step": 104153, "epoch": 860} {"train_loss": -38.578819274902344, "global_step": 104154, "epoch": 860} {"train_loss": -39.220237731933594, "global_step": 104155, "epoch": 860} {"train_loss": -38.991146087646484, "global_step": 104156, "epoch": 860} {"train_loss": -39.113197326660156, "global_step": 104157, "epoch": 860} {"train_loss": -38.2689323425293, "global_step": 104158, "epoch": 860} {"train_loss": -38.74588394165039, "global_step": 104159, "epoch": 860} {"train_loss": -38.960689544677734, "global_step": 104160, "epoch": 860} {"train_loss": -38.74155044555664, "global_step": 104161, "epoch": 860} {"train_loss": -38.73969650268555, "global_step": 104162, "epoch": 860} {"train_loss": -38.9874267578125, "global_step": 104163, "epoch": 860} {"train_loss": -38.94692611694336, "global_step": 104164, "epoch": 860} {"train_loss": -39.06162643432617, "global_step": 104165, "epoch": 860} {"train_loss": -39.067195892333984, "global_step": 104166, "epoch": 860} {"train_loss": -38.75828170776367, "global_step": 104167, "epoch": 860} {"train_loss": -39.061580657958984, "global_step": 104168, "epoch": 860} {"train_loss": -39.32265090942383, "global_step": 104169, "epoch": 860} {"train_loss": -39.30303955078125, "global_step": 104170, "epoch": 860} {"train_loss": -38.40657424926758, "global_step": 104171, "epoch": 860} {"train_loss": -39.15697479248047, "global_step": 104172, "epoch": 860} {"train_loss": -38.86320877075195, "global_step": 104173, "epoch": 860} {"train_loss": -38.97770309448242, "global_step": 104174, "epoch": 860} {"train_loss": -38.85874938964844, "global_step": 104175, "epoch": 860} {"train_loss": -39.04519271850586, "global_step": 104176, "epoch": 860} {"train_loss": -38.656959533691406, "global_step": 104177, "epoch": 860} {"train_loss": -39.02724838256836, "global_step": 104178, "epoch": 860} {"train_loss": -38.707054138183594, "global_step": 104179, "epoch": 860} {"train_loss": -37.58533782801352, "global_step": 104180, "epoch": 860, "val_loss": 2742937.75} {"train_loss": -38.993408203125, "global_step": 104181, "epoch": 861} {"train_loss": -38.98406219482422, "global_step": 104182, "epoch": 861} {"train_loss": -38.64321517944336, "global_step": 104183, "epoch": 861} {"train_loss": -38.61918258666992, "global_step": 104184, "epoch": 861} {"train_loss": -38.744468688964844, "global_step": 104185, "epoch": 861} {"train_loss": -37.366756439208984, "global_step": 104186, "epoch": 861} {"train_loss": -33.24274444580078, "global_step": 104187, "epoch": 861} {"train_loss": -28.8257999420166, "global_step": 104188, "epoch": 861} {"train_loss": -21.98685646057129, "global_step": 104189, "epoch": 861} {"train_loss": -18.076841354370117, "global_step": 104190, "epoch": 861} {"train_loss": -29.612457275390625, "global_step": 104191, "epoch": 861} {"train_loss": -36.449214935302734, "global_step": 104192, "epoch": 861} {"train_loss": -30.68494987487793, "global_step": 104193, "epoch": 861} {"train_loss": -36.54890060424805, "global_step": 104194, "epoch": 861} {"train_loss": -31.766693115234375, "global_step": 104195, "epoch": 861} {"train_loss": -35.48463439941406, "global_step": 104196, "epoch": 861} {"train_loss": -35.498512268066406, "global_step": 104197, "epoch": 861} {"train_loss": -34.946929931640625, "global_step": 104198, "epoch": 861} {"train_loss": -35.50496292114258, "global_step": 104199, "epoch": 861} {"train_loss": -33.945404052734375, "global_step": 104200, "epoch": 861} {"train_loss": -36.20505905151367, "global_step": 104201, "epoch": 861} {"train_loss": -36.05601119995117, "global_step": 104202, "epoch": 861} {"train_loss": -36.17756271362305, "global_step": 104203, "epoch": 861} {"train_loss": -36.82125473022461, "global_step": 104204, "epoch": 861} {"train_loss": -36.385353088378906, "global_step": 104205, "epoch": 861} {"train_loss": -36.669044494628906, "global_step": 104206, "epoch": 861} {"train_loss": -33.771358489990234, "global_step": 104207, "epoch": 861} {"train_loss": -36.98378372192383, "global_step": 104208, "epoch": 861} {"train_loss": -37.43864059448242, "global_step": 104209, "epoch": 861} {"train_loss": -37.15958786010742, "global_step": 104210, "epoch": 861} {"train_loss": -37.65504837036133, "global_step": 104211, "epoch": 861} {"train_loss": -37.31085205078125, "global_step": 104212, "epoch": 861} {"train_loss": -37.6407356262207, "global_step": 104213, "epoch": 861} {"train_loss": -37.689666748046875, "global_step": 104214, "epoch": 861} {"train_loss": -37.79949951171875, "global_step": 104215, "epoch": 861} {"train_loss": -37.66347122192383, "global_step": 104216, "epoch": 861} {"train_loss": -37.787872314453125, "global_step": 104217, "epoch": 861} {"train_loss": -37.72504806518555, "global_step": 104218, "epoch": 861} {"train_loss": -38.34102249145508, "global_step": 104219, "epoch": 861} {"train_loss": -37.517574310302734, "global_step": 104220, "epoch": 861} {"train_loss": -38.20899200439453, "global_step": 104221, "epoch": 861} {"train_loss": -37.66658020019531, "global_step": 104222, "epoch": 861} {"train_loss": -38.07748031616211, "global_step": 104223, "epoch": 861} {"train_loss": -37.9746208190918, "global_step": 104224, "epoch": 861} {"train_loss": -38.18568801879883, "global_step": 104225, "epoch": 861} {"train_loss": -38.255435943603516, "global_step": 104226, "epoch": 861} {"train_loss": -37.96814727783203, "global_step": 104227, "epoch": 861} {"train_loss": -38.07537078857422, "global_step": 104228, "epoch": 861} {"train_loss": -38.03437423706055, "global_step": 104229, "epoch": 861} {"train_loss": -38.423091888427734, "global_step": 104230, "epoch": 861} {"train_loss": -38.055572509765625, "global_step": 104231, "epoch": 861} {"train_loss": -38.332149505615234, "global_step": 104232, "epoch": 861} {"train_loss": -38.262149810791016, "global_step": 104233, "epoch": 861} {"train_loss": -38.52952194213867, "global_step": 104234, "epoch": 861} {"train_loss": -38.3753776550293, "global_step": 104235, "epoch": 861} {"train_loss": -38.15716552734375, "global_step": 104236, "epoch": 861} {"train_loss": -38.52656555175781, "global_step": 104237, "epoch": 861} {"train_loss": -38.300228118896484, "global_step": 104238, "epoch": 861} {"train_loss": -38.60558319091797, "global_step": 104239, "epoch": 861} {"train_loss": -38.99031066894531, "global_step": 104240, "epoch": 861} {"train_loss": -38.40021896362305, "global_step": 104241, "epoch": 861} {"train_loss": -38.84263229370117, "global_step": 104242, "epoch": 861} {"train_loss": -38.87884521484375, "global_step": 104243, "epoch": 861} {"train_loss": -38.70661163330078, "global_step": 104244, "epoch": 861} {"train_loss": -38.715232849121094, "global_step": 104245, "epoch": 861} {"train_loss": -38.21453857421875, "global_step": 104246, "epoch": 861} {"train_loss": -37.231101989746094, "global_step": 104247, "epoch": 861} {"train_loss": -38.828834533691406, "global_step": 104248, "epoch": 861} {"train_loss": -38.89739990234375, "global_step": 104249, "epoch": 861} {"train_loss": -39.198486328125, "global_step": 104250, "epoch": 861} {"train_loss": -38.547664642333984, "global_step": 104251, "epoch": 861} {"train_loss": -38.83321762084961, "global_step": 104252, "epoch": 861} {"train_loss": -38.9174919128418, "global_step": 104253, "epoch": 861} {"train_loss": -39.015228271484375, "global_step": 104254, "epoch": 861} {"train_loss": -39.31258010864258, "global_step": 104255, "epoch": 861} {"train_loss": -38.476837158203125, "global_step": 104256, "epoch": 861} {"train_loss": -38.558570861816406, "global_step": 104257, "epoch": 861} {"train_loss": -39.096492767333984, "global_step": 104258, "epoch": 861} {"train_loss": -38.66653060913086, "global_step": 104259, "epoch": 861} {"train_loss": -39.335174560546875, "global_step": 104260, "epoch": 861} {"train_loss": -39.18198013305664, "global_step": 104261, "epoch": 861} {"train_loss": -38.801963806152344, "global_step": 104262, "epoch": 861} {"train_loss": -39.36433029174805, "global_step": 104263, "epoch": 861} {"train_loss": -38.6626091003418, "global_step": 104264, "epoch": 861} {"train_loss": -39.46369552612305, "global_step": 104265, "epoch": 861} {"train_loss": -39.00815200805664, "global_step": 104266, "epoch": 861} {"train_loss": -39.00761413574219, "global_step": 104267, "epoch": 861} {"train_loss": -39.4063606262207, "global_step": 104268, "epoch": 861} {"train_loss": -39.483802795410156, "global_step": 104269, "epoch": 861} {"train_loss": -39.45583724975586, "global_step": 104270, "epoch": 861} {"train_loss": -39.558197021484375, "global_step": 104271, "epoch": 861} {"train_loss": -39.663944244384766, "global_step": 104272, "epoch": 861} {"train_loss": -39.49818801879883, "global_step": 104273, "epoch": 861} {"train_loss": -39.5839729309082, "global_step": 104274, "epoch": 861} {"train_loss": -39.279541015625, "global_step": 104275, "epoch": 861} {"train_loss": -39.583740234375, "global_step": 104276, "epoch": 861} {"train_loss": -38.75982666015625, "global_step": 104277, "epoch": 861} {"train_loss": -38.6552734375, "global_step": 104278, "epoch": 861} {"train_loss": -39.47392654418945, "global_step": 104279, "epoch": 861} {"train_loss": -39.30398178100586, "global_step": 104280, "epoch": 861} {"train_loss": -39.396629333496094, "global_step": 104281, "epoch": 861} {"train_loss": -39.52610778808594, "global_step": 104282, "epoch": 861} {"train_loss": -38.446834564208984, "global_step": 104283, "epoch": 861} {"train_loss": -37.558650970458984, "global_step": 104284, "epoch": 861} {"train_loss": -38.00653839111328, "global_step": 104285, "epoch": 861} {"train_loss": -35.7525634765625, "global_step": 104286, "epoch": 861} {"train_loss": -33.792415618896484, "global_step": 104287, "epoch": 861} {"train_loss": -37.70794677734375, "global_step": 104288, "epoch": 861} {"train_loss": -38.00239944458008, "global_step": 104289, "epoch": 861} {"train_loss": -35.98650360107422, "global_step": 104290, "epoch": 861} {"train_loss": -34.4692497253418, "global_step": 104291, "epoch": 861} {"train_loss": -36.7146110534668, "global_step": 104292, "epoch": 861} {"train_loss": -37.49809646606445, "global_step": 104293, "epoch": 861} {"train_loss": -37.965084075927734, "global_step": 104294, "epoch": 861} {"train_loss": -35.71590042114258, "global_step": 104295, "epoch": 861} {"train_loss": -38.264163970947266, "global_step": 104296, "epoch": 861} {"train_loss": -38.32200241088867, "global_step": 104297, "epoch": 861} {"train_loss": -37.95721435546875, "global_step": 104298, "epoch": 861} {"train_loss": -37.712459564208984, "global_step": 104299, "epoch": 861} {"train_loss": -37.08066177368164, "global_step": 104300, "epoch": 861} {"train_loss": -37.38587727822548, "global_step": 104301, "epoch": 861, "val_loss": 2733451.0} {"train_loss": -38.83350372314453, "global_step": 104302, "epoch": 862} {"train_loss": -38.526824951171875, "global_step": 104303, "epoch": 862} {"train_loss": -38.52810287475586, "global_step": 104304, "epoch": 862} {"train_loss": -38.496341705322266, "global_step": 104305, "epoch": 862} {"train_loss": -35.69327926635742, "global_step": 104306, "epoch": 862} {"train_loss": -38.72119903564453, "global_step": 104307, "epoch": 862} {"train_loss": -36.80475997924805, "global_step": 104308, "epoch": 862} {"train_loss": -36.7190055847168, "global_step": 104309, "epoch": 862} {"train_loss": -37.31834030151367, "global_step": 104310, "epoch": 862} {"train_loss": -38.01250457763672, "global_step": 104311, "epoch": 862} {"train_loss": -37.552425384521484, "global_step": 104312, "epoch": 862} {"train_loss": -36.30874252319336, "global_step": 104313, "epoch": 862} {"train_loss": -38.01469421386719, "global_step": 104314, "epoch": 862} {"train_loss": -35.16725158691406, "global_step": 104315, "epoch": 862} {"train_loss": -38.49991989135742, "global_step": 104316, "epoch": 862} {"train_loss": -36.44873046875, "global_step": 104317, "epoch": 862} {"train_loss": -38.36539077758789, "global_step": 104318, "epoch": 862} {"train_loss": -34.001522064208984, "global_step": 104319, "epoch": 862} {"train_loss": -35.79010009765625, "global_step": 104320, "epoch": 862} {"train_loss": -37.634368896484375, "global_step": 104321, "epoch": 862} {"train_loss": -36.40331268310547, "global_step": 104322, "epoch": 862} {"train_loss": -37.55537796020508, "global_step": 104323, "epoch": 862} {"train_loss": -35.987850189208984, "global_step": 104324, "epoch": 862} {"train_loss": -36.115394592285156, "global_step": 104325, "epoch": 862} {"train_loss": -34.820831298828125, "global_step": 104326, "epoch": 862} {"train_loss": -35.573944091796875, "global_step": 104327, "epoch": 862} {"train_loss": -35.3555908203125, "global_step": 104328, "epoch": 862} {"train_loss": -36.33664321899414, "global_step": 104329, "epoch": 862} {"train_loss": -31.1160888671875, "global_step": 104330, "epoch": 862} {"train_loss": -34.626792907714844, "global_step": 104331, "epoch": 862} {"train_loss": -32.138668060302734, "global_step": 104332, "epoch": 862} {"train_loss": -35.96466827392578, "global_step": 104333, "epoch": 862} {"train_loss": -34.70927810668945, "global_step": 104334, "epoch": 862} {"train_loss": -35.92133712768555, "global_step": 104335, "epoch": 862} {"train_loss": -34.54800033569336, "global_step": 104336, "epoch": 862} {"train_loss": -36.398433685302734, "global_step": 104337, "epoch": 862} {"train_loss": -35.637962341308594, "global_step": 104338, "epoch": 862} {"train_loss": -36.99862289428711, "global_step": 104339, "epoch": 862} {"train_loss": -36.705604553222656, "global_step": 104340, "epoch": 862} {"train_loss": -36.41748046875, "global_step": 104341, "epoch": 862} {"train_loss": -36.10407638549805, "global_step": 104342, "epoch": 862} {"train_loss": -36.05101776123047, "global_step": 104343, "epoch": 862} {"train_loss": -36.911346435546875, "global_step": 104344, "epoch": 862} {"train_loss": -35.12797164916992, "global_step": 104345, "epoch": 862} {"train_loss": -34.346412658691406, "global_step": 104346, "epoch": 862} {"train_loss": -33.6779670715332, "global_step": 104347, "epoch": 862} {"train_loss": -35.888946533203125, "global_step": 104348, "epoch": 862} {"train_loss": -36.79152297973633, "global_step": 104349, "epoch": 862} {"train_loss": -36.20438003540039, "global_step": 104350, "epoch": 862} {"train_loss": -36.86370849609375, "global_step": 104351, "epoch": 862} {"train_loss": -36.178836822509766, "global_step": 104352, "epoch": 862} {"train_loss": -36.87557601928711, "global_step": 104353, "epoch": 862} {"train_loss": -37.02916717529297, "global_step": 104354, "epoch": 862} {"train_loss": -37.34897994995117, "global_step": 104355, "epoch": 862} {"train_loss": -37.432167053222656, "global_step": 104356, "epoch": 862} {"train_loss": -37.2524528503418, "global_step": 104357, "epoch": 862} {"train_loss": -37.20957946777344, "global_step": 104358, "epoch": 862} {"train_loss": -37.52921676635742, "global_step": 104359, "epoch": 862} {"train_loss": -36.33219909667969, "global_step": 104360, "epoch": 862} {"train_loss": -37.39990997314453, "global_step": 104361, "epoch": 862} {"train_loss": -37.19443893432617, "global_step": 104362, "epoch": 862} {"train_loss": -37.42251205444336, "global_step": 104363, "epoch": 862} {"train_loss": -37.56126022338867, "global_step": 104364, "epoch": 862} {"train_loss": -37.86777877807617, "global_step": 104365, "epoch": 862} {"train_loss": -38.00997543334961, "global_step": 104366, "epoch": 862} {"train_loss": -36.99100875854492, "global_step": 104367, "epoch": 862} {"train_loss": -37.55015563964844, "global_step": 104368, "epoch": 862} {"train_loss": -37.66707992553711, "global_step": 104369, "epoch": 862} {"train_loss": -37.971282958984375, "global_step": 104370, "epoch": 862} {"train_loss": -38.10285568237305, "global_step": 104371, "epoch": 862} {"train_loss": -37.1483039855957, "global_step": 104372, "epoch": 862} {"train_loss": -38.264305114746094, "global_step": 104373, "epoch": 862} {"train_loss": -38.08300018310547, "global_step": 104374, "epoch": 862} {"train_loss": -38.241329193115234, "global_step": 104375, "epoch": 862} {"train_loss": -37.81731414794922, "global_step": 104376, "epoch": 862} {"train_loss": -38.195648193359375, "global_step": 104377, "epoch": 862} {"train_loss": -38.05085754394531, "global_step": 104378, "epoch": 862} {"train_loss": -38.35635757446289, "global_step": 104379, "epoch": 862} {"train_loss": -38.23777389526367, "global_step": 104380, "epoch": 862} {"train_loss": -38.61741256713867, "global_step": 104381, "epoch": 862} {"train_loss": -38.22099685668945, "global_step": 104382, "epoch": 862} {"train_loss": -38.92036056518555, "global_step": 104383, "epoch": 862} {"train_loss": -38.3968505859375, "global_step": 104384, "epoch": 862} {"train_loss": -38.52614974975586, "global_step": 104385, "epoch": 862} {"train_loss": -38.28504180908203, "global_step": 104386, "epoch": 862} {"train_loss": -38.58210754394531, "global_step": 104387, "epoch": 862} {"train_loss": -38.74107360839844, "global_step": 104388, "epoch": 862} {"train_loss": -38.395687103271484, "global_step": 104389, "epoch": 862} {"train_loss": -38.8184928894043, "global_step": 104390, "epoch": 862} {"train_loss": -38.650638580322266, "global_step": 104391, "epoch": 862} {"train_loss": -39.03048324584961, "global_step": 104392, "epoch": 862} {"train_loss": -38.70071792602539, "global_step": 104393, "epoch": 862} {"train_loss": -38.691097259521484, "global_step": 104394, "epoch": 862} {"train_loss": -37.23838806152344, "global_step": 104395, "epoch": 862} {"train_loss": -39.07079315185547, "global_step": 104396, "epoch": 862} {"train_loss": -38.543949127197266, "global_step": 104397, "epoch": 862} {"train_loss": -38.947078704833984, "global_step": 104398, "epoch": 862} {"train_loss": -38.96963119506836, "global_step": 104399, "epoch": 862} {"train_loss": -38.615901947021484, "global_step": 104400, "epoch": 862} {"train_loss": -38.75033950805664, "global_step": 104401, "epoch": 862} {"train_loss": -38.946685791015625, "global_step": 104402, "epoch": 862} {"train_loss": -38.64193344116211, "global_step": 104403, "epoch": 862} {"train_loss": -38.66554641723633, "global_step": 104404, "epoch": 862} {"train_loss": -38.35105514526367, "global_step": 104405, "epoch": 862} {"train_loss": -39.12604522705078, "global_step": 104406, "epoch": 862} {"train_loss": -38.84577560424805, "global_step": 104407, "epoch": 862} {"train_loss": -38.6033935546875, "global_step": 104408, "epoch": 862} {"train_loss": -39.43629455566406, "global_step": 104409, "epoch": 862} {"train_loss": -38.670658111572266, "global_step": 104410, "epoch": 862} {"train_loss": -38.7380256652832, "global_step": 104411, "epoch": 862} {"train_loss": -38.67829895019531, "global_step": 104412, "epoch": 862} {"train_loss": -38.726070404052734, "global_step": 104413, "epoch": 862} {"train_loss": -38.568695068359375, "global_step": 104414, "epoch": 862} {"train_loss": -35.43552780151367, "global_step": 104415, "epoch": 862} {"train_loss": -38.752044677734375, "global_step": 104416, "epoch": 862} {"train_loss": -37.22542953491211, "global_step": 104417, "epoch": 862} {"train_loss": -38.23464584350586, "global_step": 104418, "epoch": 862} {"train_loss": -39.044036865234375, "global_step": 104419, "epoch": 862} {"train_loss": -39.110836029052734, "global_step": 104420, "epoch": 862} {"train_loss": -38.112728118896484, "global_step": 104421, "epoch": 862} {"train_loss": -37.359586069406554, "global_step": 104422, "epoch": 862, "val_loss": 2765407.75} {"train_loss": -36.69179916381836, "global_step": 104423, "epoch": 863} {"train_loss": -34.396095275878906, "global_step": 104424, "epoch": 863} {"train_loss": -37.02632522583008, "global_step": 104425, "epoch": 863} {"train_loss": -36.644920349121094, "global_step": 104426, "epoch": 863} {"train_loss": -36.906612396240234, "global_step": 104427, "epoch": 863} {"train_loss": -34.653465270996094, "global_step": 104428, "epoch": 863} {"train_loss": -38.00909423828125, "global_step": 104429, "epoch": 863} {"train_loss": -38.2938346862793, "global_step": 104430, "epoch": 863} {"train_loss": -35.98676300048828, "global_step": 104431, "epoch": 863} {"train_loss": -35.870460510253906, "global_step": 104432, "epoch": 863} {"train_loss": -36.21516036987305, "global_step": 104433, "epoch": 863} {"train_loss": -38.40240478515625, "global_step": 104434, "epoch": 863} {"train_loss": -36.04500198364258, "global_step": 104435, "epoch": 863} {"train_loss": -34.65913009643555, "global_step": 104436, "epoch": 863} {"train_loss": -34.44149398803711, "global_step": 104437, "epoch": 863} {"train_loss": -35.227203369140625, "global_step": 104438, "epoch": 863} {"train_loss": -37.386783599853516, "global_step": 104439, "epoch": 863} {"train_loss": -37.39259338378906, "global_step": 104440, "epoch": 863} {"train_loss": -37.828163146972656, "global_step": 104441, "epoch": 863} {"train_loss": -35.337581634521484, "global_step": 104442, "epoch": 863} {"train_loss": -38.38397979736328, "global_step": 104443, "epoch": 863} {"train_loss": -36.306884765625, "global_step": 104444, "epoch": 863} {"train_loss": -36.116939544677734, "global_step": 104445, "epoch": 863} {"train_loss": -36.7279167175293, "global_step": 104446, "epoch": 863} {"train_loss": -32.46953582763672, "global_step": 104447, "epoch": 863} {"train_loss": -37.06265640258789, "global_step": 104448, "epoch": 863} {"train_loss": -34.433265686035156, "global_step": 104449, "epoch": 863} {"train_loss": -35.11432647705078, "global_step": 104450, "epoch": 863} {"train_loss": -38.034423828125, "global_step": 104451, "epoch": 863} {"train_loss": -36.8690071105957, "global_step": 104452, "epoch": 863} {"train_loss": -36.7398681640625, "global_step": 104453, "epoch": 863} {"train_loss": -37.40667724609375, "global_step": 104454, "epoch": 863} {"train_loss": -37.759212493896484, "global_step": 104455, "epoch": 863} {"train_loss": -36.90019607543945, "global_step": 104456, "epoch": 863} {"train_loss": -37.00987243652344, "global_step": 104457, "epoch": 863} {"train_loss": -36.4929084777832, "global_step": 104458, "epoch": 863} {"train_loss": -37.583553314208984, "global_step": 104459, "epoch": 863} {"train_loss": -34.50986862182617, "global_step": 104460, "epoch": 863} {"train_loss": -35.81554412841797, "global_step": 104461, "epoch": 863} {"train_loss": -37.49836349487305, "global_step": 104462, "epoch": 863} {"train_loss": -37.84834289550781, "global_step": 104463, "epoch": 863} {"train_loss": -35.63159942626953, "global_step": 104464, "epoch": 863} {"train_loss": -35.184791564941406, "global_step": 104465, "epoch": 863} {"train_loss": -37.51569747924805, "global_step": 104466, "epoch": 863} {"train_loss": -37.3886833190918, "global_step": 104467, "epoch": 863} {"train_loss": -36.353023529052734, "global_step": 104468, "epoch": 863} {"train_loss": -32.80116271972656, "global_step": 104469, "epoch": 863} {"train_loss": -37.602901458740234, "global_step": 104470, "epoch": 863} {"train_loss": -36.52556228637695, "global_step": 104471, "epoch": 863} {"train_loss": -37.631065368652344, "global_step": 104472, "epoch": 863} {"train_loss": -36.82583236694336, "global_step": 104473, "epoch": 863} {"train_loss": -37.905799865722656, "global_step": 104474, "epoch": 863} {"train_loss": -37.26630783081055, "global_step": 104475, "epoch": 863} {"train_loss": -37.53506088256836, "global_step": 104476, "epoch": 863} {"train_loss": -36.73835372924805, "global_step": 104477, "epoch": 863} {"train_loss": -37.377140045166016, "global_step": 104478, "epoch": 863} {"train_loss": -37.15224838256836, "global_step": 104479, "epoch": 863} {"train_loss": -38.21029281616211, "global_step": 104480, "epoch": 863} {"train_loss": -38.03766632080078, "global_step": 104481, "epoch": 863} {"train_loss": -37.174896240234375, "global_step": 104482, "epoch": 863} {"train_loss": -36.923126220703125, "global_step": 104483, "epoch": 863} {"train_loss": -37.916236877441406, "global_step": 104484, "epoch": 863} {"train_loss": -37.93294143676758, "global_step": 104485, "epoch": 863} {"train_loss": -37.38142776489258, "global_step": 104486, "epoch": 863} {"train_loss": -37.8429069519043, "global_step": 104487, "epoch": 863} {"train_loss": -36.57369613647461, "global_step": 104488, "epoch": 863} {"train_loss": -37.2473030090332, "global_step": 104489, "epoch": 863} {"train_loss": -38.091670989990234, "global_step": 104490, "epoch": 863} {"train_loss": -37.03468704223633, "global_step": 104491, "epoch": 863} {"train_loss": -36.748592376708984, "global_step": 104492, "epoch": 863} {"train_loss": -37.482460021972656, "global_step": 104493, "epoch": 863} {"train_loss": -38.05511474609375, "global_step": 104494, "epoch": 863} {"train_loss": -36.87295150756836, "global_step": 104495, "epoch": 863} {"train_loss": -37.52032470703125, "global_step": 104496, "epoch": 863} {"train_loss": -37.644081115722656, "global_step": 104497, "epoch": 863} {"train_loss": -37.30619430541992, "global_step": 104498, "epoch": 863} {"train_loss": -37.51380157470703, "global_step": 104499, "epoch": 863} {"train_loss": -38.357521057128906, "global_step": 104500, "epoch": 863} {"train_loss": -38.234432220458984, "global_step": 104501, "epoch": 863} {"train_loss": -37.182613372802734, "global_step": 104502, "epoch": 863} {"train_loss": -38.69565963745117, "global_step": 104503, "epoch": 863} {"train_loss": -37.19890213012695, "global_step": 104504, "epoch": 863} {"train_loss": -38.59099197387695, "global_step": 104505, "epoch": 863} {"train_loss": -37.13665008544922, "global_step": 104506, "epoch": 863} {"train_loss": -38.13804244995117, "global_step": 104507, "epoch": 863} {"train_loss": -38.58869171142578, "global_step": 104508, "epoch": 863} {"train_loss": -38.67678451538086, "global_step": 104509, "epoch": 863} {"train_loss": -37.621212005615234, "global_step": 104510, "epoch": 863} {"train_loss": -38.221004486083984, "global_step": 104511, "epoch": 863} {"train_loss": -37.3584098815918, "global_step": 104512, "epoch": 863} {"train_loss": -38.24116134643555, "global_step": 104513, "epoch": 863} {"train_loss": -38.38911819458008, "global_step": 104514, "epoch": 863} {"train_loss": -37.86206817626953, "global_step": 104515, "epoch": 863} {"train_loss": -38.16707229614258, "global_step": 104516, "epoch": 863} {"train_loss": -38.23787307739258, "global_step": 104517, "epoch": 863} {"train_loss": -38.2789421081543, "global_step": 104518, "epoch": 863} {"train_loss": -38.85490798950195, "global_step": 104519, "epoch": 863} {"train_loss": -37.910972595214844, "global_step": 104520, "epoch": 863} {"train_loss": -37.40321731567383, "global_step": 104521, "epoch": 863} {"train_loss": -38.7907829284668, "global_step": 104522, "epoch": 863} {"train_loss": -38.00259780883789, "global_step": 104523, "epoch": 863} {"train_loss": -38.77600860595703, "global_step": 104524, "epoch": 863} {"train_loss": -37.6005973815918, "global_step": 104525, "epoch": 863} {"train_loss": -38.685115814208984, "global_step": 104526, "epoch": 863} {"train_loss": -38.4696159362793, "global_step": 104527, "epoch": 863} {"train_loss": -38.50666046142578, "global_step": 104528, "epoch": 863} {"train_loss": -38.57748031616211, "global_step": 104529, "epoch": 863} {"train_loss": -38.86394119262695, "global_step": 104530, "epoch": 863} {"train_loss": -38.417720794677734, "global_step": 104531, "epoch": 863} {"train_loss": -39.00715255737305, "global_step": 104532, "epoch": 863} {"train_loss": -38.7041130065918, "global_step": 104533, "epoch": 863} {"train_loss": -39.135833740234375, "global_step": 104534, "epoch": 863} {"train_loss": -38.8271598815918, "global_step": 104535, "epoch": 863} {"train_loss": -38.06809997558594, "global_step": 104536, "epoch": 863} {"train_loss": -38.232460021972656, "global_step": 104537, "epoch": 863} {"train_loss": -39.16105270385742, "global_step": 104538, "epoch": 863} {"train_loss": -37.34214782714844, "global_step": 104539, "epoch": 863} {"train_loss": -35.53007888793945, "global_step": 104540, "epoch": 863} {"train_loss": -31.59307861328125, "global_step": 104541, "epoch": 863} {"train_loss": -27.235172271728516, "global_step": 104542, "epoch": 863} {"train_loss": -37.09142702276056, "global_step": 104543, "epoch": 863, "val_loss": 2652966.0} {"train_loss": -36.53519821166992, "global_step": 104544, "epoch": 864} {"train_loss": -38.8516845703125, "global_step": 104545, "epoch": 864} {"train_loss": -36.1794548034668, "global_step": 104546, "epoch": 864} {"train_loss": -37.5181999206543, "global_step": 104547, "epoch": 864} {"train_loss": -37.98977279663086, "global_step": 104548, "epoch": 864} {"train_loss": -34.01557540893555, "global_step": 104549, "epoch": 864} {"train_loss": -36.72784423828125, "global_step": 104550, "epoch": 864} {"train_loss": -37.936580657958984, "global_step": 104551, "epoch": 864} {"train_loss": -36.16486740112305, "global_step": 104552, "epoch": 864} {"train_loss": -38.34172439575195, "global_step": 104553, "epoch": 864} {"train_loss": -35.79559326171875, "global_step": 104554, "epoch": 864} {"train_loss": -38.38509750366211, "global_step": 104555, "epoch": 864} {"train_loss": -37.230926513671875, "global_step": 104556, "epoch": 864} {"train_loss": -36.42525863647461, "global_step": 104557, "epoch": 864} {"train_loss": -39.01790237426758, "global_step": 104558, "epoch": 864} {"train_loss": -37.11830520629883, "global_step": 104559, "epoch": 864} {"train_loss": -38.825923919677734, "global_step": 104560, "epoch": 864} {"train_loss": -37.54685592651367, "global_step": 104561, "epoch": 864} {"train_loss": -39.55024719238281, "global_step": 104562, "epoch": 864} {"train_loss": -38.08794021606445, "global_step": 104563, "epoch": 864} {"train_loss": -39.00263595581055, "global_step": 104564, "epoch": 864} {"train_loss": -37.84679412841797, "global_step": 104565, "epoch": 864} {"train_loss": -38.41865158081055, "global_step": 104566, "epoch": 864} {"train_loss": -37.695068359375, "global_step": 104567, "epoch": 864} {"train_loss": -39.031341552734375, "global_step": 104568, "epoch": 864} {"train_loss": -38.092464447021484, "global_step": 104569, "epoch": 864} {"train_loss": -38.8486442565918, "global_step": 104570, "epoch": 864} {"train_loss": -38.33893966674805, "global_step": 104571, "epoch": 864} {"train_loss": -38.79462814331055, "global_step": 104572, "epoch": 864} {"train_loss": -38.575862884521484, "global_step": 104573, "epoch": 864} {"train_loss": -39.16939163208008, "global_step": 104574, "epoch": 864} {"train_loss": -38.63798141479492, "global_step": 104575, "epoch": 864} {"train_loss": -39.162841796875, "global_step": 104576, "epoch": 864} {"train_loss": -38.82855987548828, "global_step": 104577, "epoch": 864} {"train_loss": -38.5140266418457, "global_step": 104578, "epoch": 864} {"train_loss": -39.19883346557617, "global_step": 104579, "epoch": 864} {"train_loss": -38.920005798339844, "global_step": 104580, "epoch": 864} {"train_loss": -39.15970993041992, "global_step": 104581, "epoch": 864} {"train_loss": -38.91836166381836, "global_step": 104582, "epoch": 864} {"train_loss": -39.12910842895508, "global_step": 104583, "epoch": 864} {"train_loss": -39.390804290771484, "global_step": 104584, "epoch": 864} {"train_loss": -38.88166809082031, "global_step": 104585, "epoch": 864} {"train_loss": -39.29209518432617, "global_step": 104586, "epoch": 864} {"train_loss": -38.834747314453125, "global_step": 104587, "epoch": 864} {"train_loss": -38.82362747192383, "global_step": 104588, "epoch": 864} {"train_loss": -38.89501190185547, "global_step": 104589, "epoch": 864} {"train_loss": -39.069976806640625, "global_step": 104590, "epoch": 864} {"train_loss": -39.77838134765625, "global_step": 104591, "epoch": 864} {"train_loss": -39.26081466674805, "global_step": 104592, "epoch": 864} {"train_loss": -38.53074264526367, "global_step": 104593, "epoch": 864} {"train_loss": -38.50153732299805, "global_step": 104594, "epoch": 864} {"train_loss": -38.1403923034668, "global_step": 104595, "epoch": 864} {"train_loss": -39.03896713256836, "global_step": 104596, "epoch": 864} {"train_loss": -38.50315475463867, "global_step": 104597, "epoch": 864} {"train_loss": -39.37267303466797, "global_step": 104598, "epoch": 864} {"train_loss": -38.371070861816406, "global_step": 104599, "epoch": 864} {"train_loss": -38.77234649658203, "global_step": 104600, "epoch": 864} {"train_loss": -38.46879577636719, "global_step": 104601, "epoch": 864} {"train_loss": -37.57095718383789, "global_step": 104602, "epoch": 864} {"train_loss": -38.16184616088867, "global_step": 104603, "epoch": 864} {"train_loss": -38.13370132446289, "global_step": 104604, "epoch": 864} {"train_loss": -38.193763732910156, "global_step": 104605, "epoch": 864} {"train_loss": -39.02750778198242, "global_step": 104606, "epoch": 864} {"train_loss": -37.585365295410156, "global_step": 104607, "epoch": 864} {"train_loss": -37.335205078125, "global_step": 104608, "epoch": 864} {"train_loss": -34.70155715942383, "global_step": 104609, "epoch": 864} {"train_loss": -32.731964111328125, "global_step": 104610, "epoch": 864} {"train_loss": -28.964109420776367, "global_step": 104611, "epoch": 864} {"train_loss": -23.630041122436523, "global_step": 104612, "epoch": 864} {"train_loss": -35.87480545043945, "global_step": 104613, "epoch": 864} {"train_loss": -37.81120681762695, "global_step": 104614, "epoch": 864} {"train_loss": -32.645381927490234, "global_step": 104615, "epoch": 864} {"train_loss": -37.934505462646484, "global_step": 104616, "epoch": 864} {"train_loss": -35.04084777832031, "global_step": 104617, "epoch": 864} {"train_loss": -34.52058029174805, "global_step": 104618, "epoch": 864} {"train_loss": -38.3995361328125, "global_step": 104619, "epoch": 864} {"train_loss": -35.02466583251953, "global_step": 104620, "epoch": 864} {"train_loss": -37.28116226196289, "global_step": 104621, "epoch": 864} {"train_loss": -36.56446075439453, "global_step": 104622, "epoch": 864} {"train_loss": -36.71066665649414, "global_step": 104623, "epoch": 864} {"train_loss": -36.987674713134766, "global_step": 104624, "epoch": 864} {"train_loss": -38.00724411010742, "global_step": 104625, "epoch": 864} {"train_loss": -38.22724533081055, "global_step": 104626, "epoch": 864} {"train_loss": -37.82823944091797, "global_step": 104627, "epoch": 864} {"train_loss": -38.38015365600586, "global_step": 104628, "epoch": 864} {"train_loss": -37.533233642578125, "global_step": 104629, "epoch": 864} {"train_loss": -38.20001983642578, "global_step": 104630, "epoch": 864} {"train_loss": -38.25395965576172, "global_step": 104631, "epoch": 864} {"train_loss": -37.3921012878418, "global_step": 104632, "epoch": 864} {"train_loss": -38.02838897705078, "global_step": 104633, "epoch": 864} {"train_loss": -38.554988861083984, "global_step": 104634, "epoch": 864} {"train_loss": -38.31605911254883, "global_step": 104635, "epoch": 864} {"train_loss": -37.8783073425293, "global_step": 104636, "epoch": 864} {"train_loss": -38.10493850708008, "global_step": 104637, "epoch": 864} {"train_loss": -39.1033935546875, "global_step": 104638, "epoch": 864} {"train_loss": -38.20029830932617, "global_step": 104639, "epoch": 864} {"train_loss": -38.585208892822266, "global_step": 104640, "epoch": 864} {"train_loss": -38.9494514465332, "global_step": 104641, "epoch": 864} {"train_loss": -38.02204895019531, "global_step": 104642, "epoch": 864} {"train_loss": -38.650333404541016, "global_step": 104643, "epoch": 864} {"train_loss": -38.85942077636719, "global_step": 104644, "epoch": 864} {"train_loss": -38.95290756225586, "global_step": 104645, "epoch": 864} {"train_loss": -38.79500198364258, "global_step": 104646, "epoch": 864} {"train_loss": -39.44760513305664, "global_step": 104647, "epoch": 864} {"train_loss": -39.15560531616211, "global_step": 104648, "epoch": 864} {"train_loss": -39.4082145690918, "global_step": 104649, "epoch": 864} {"train_loss": -39.12333297729492, "global_step": 104650, "epoch": 864} {"train_loss": -38.450416564941406, "global_step": 104651, "epoch": 864} {"train_loss": -38.91871643066406, "global_step": 104652, "epoch": 864} {"train_loss": -39.384925842285156, "global_step": 104653, "epoch": 864} {"train_loss": -39.122920989990234, "global_step": 104654, "epoch": 864} {"train_loss": -38.77272415161133, "global_step": 104655, "epoch": 864} {"train_loss": -39.27686309814453, "global_step": 104656, "epoch": 864} {"train_loss": -39.683868408203125, "global_step": 104657, "epoch": 864} {"train_loss": -39.08604049682617, "global_step": 104658, "epoch": 864} {"train_loss": -38.94711685180664, "global_step": 104659, "epoch": 864} {"train_loss": -39.284175872802734, "global_step": 104660, "epoch": 864} {"train_loss": -39.558441162109375, "global_step": 104661, "epoch": 864} {"train_loss": -39.12102508544922, "global_step": 104662, "epoch": 864} {"train_loss": -39.277992248535156, "global_step": 104663, "epoch": 864} {"train_loss": -37.94301381387001, "global_step": 104664, "epoch": 864, "val_loss": 2642394.75} {"train_loss": -39.54155349731445, "global_step": 104665, "epoch": 865} {"train_loss": -39.3267936706543, "global_step": 104666, "epoch": 865} {"train_loss": -39.34160232543945, "global_step": 104667, "epoch": 865} {"train_loss": -39.6357421875, "global_step": 104668, "epoch": 865} {"train_loss": -39.44832229614258, "global_step": 104669, "epoch": 865} {"train_loss": -39.32001876831055, "global_step": 104670, "epoch": 865} {"train_loss": -39.536861419677734, "global_step": 104671, "epoch": 865} {"train_loss": -39.63226318359375, "global_step": 104672, "epoch": 865} {"train_loss": -39.72954177856445, "global_step": 104673, "epoch": 865} {"train_loss": -39.6740837097168, "global_step": 104674, "epoch": 865} {"train_loss": -39.38129806518555, "global_step": 104675, "epoch": 865} {"train_loss": -40.22263717651367, "global_step": 104676, "epoch": 865} {"train_loss": -39.08386993408203, "global_step": 104677, "epoch": 865} {"train_loss": -39.57192611694336, "global_step": 104678, "epoch": 865} {"train_loss": -39.2911262512207, "global_step": 104679, "epoch": 865} {"train_loss": -39.401180267333984, "global_step": 104680, "epoch": 865} {"train_loss": -38.64887619018555, "global_step": 104681, "epoch": 865} {"train_loss": -39.18896484375, "global_step": 104682, "epoch": 865} {"train_loss": -39.066593170166016, "global_step": 104683, "epoch": 865} {"train_loss": -38.9901237487793, "global_step": 104684, "epoch": 865} {"train_loss": -39.29917526245117, "global_step": 104685, "epoch": 865} {"train_loss": -39.55333709716797, "global_step": 104686, "epoch": 865} {"train_loss": -39.499359130859375, "global_step": 104687, "epoch": 865} {"train_loss": -38.793212890625, "global_step": 104688, "epoch": 865} {"train_loss": -37.990779876708984, "global_step": 104689, "epoch": 865} {"train_loss": -37.156803131103516, "global_step": 104690, "epoch": 865} {"train_loss": -34.7122802734375, "global_step": 104691, "epoch": 865} {"train_loss": -33.96324157714844, "global_step": 104692, "epoch": 865} {"train_loss": -38.63985824584961, "global_step": 104693, "epoch": 865} {"train_loss": -38.3564567565918, "global_step": 104694, "epoch": 865} {"train_loss": -36.47544479370117, "global_step": 104695, "epoch": 865} {"train_loss": -39.23702621459961, "global_step": 104696, "epoch": 865} {"train_loss": -37.6698112487793, "global_step": 104697, "epoch": 865} {"train_loss": -36.52121353149414, "global_step": 104698, "epoch": 865} {"train_loss": -38.48310852050781, "global_step": 104699, "epoch": 865} {"train_loss": -37.0973014831543, "global_step": 104700, "epoch": 865} {"train_loss": -36.353275299072266, "global_step": 104701, "epoch": 865} {"train_loss": -37.682525634765625, "global_step": 104702, "epoch": 865} {"train_loss": -38.34308624267578, "global_step": 104703, "epoch": 865} {"train_loss": -39.19416046142578, "global_step": 104704, "epoch": 865} {"train_loss": -37.855262756347656, "global_step": 104705, "epoch": 865} {"train_loss": -38.1029167175293, "global_step": 104706, "epoch": 865} {"train_loss": -38.29871368408203, "global_step": 104707, "epoch": 865} {"train_loss": -39.00629806518555, "global_step": 104708, "epoch": 865} {"train_loss": -38.88429641723633, "global_step": 104709, "epoch": 865} {"train_loss": -39.13234329223633, "global_step": 104710, "epoch": 865} {"train_loss": -39.1505126953125, "global_step": 104711, "epoch": 865} {"train_loss": -39.231224060058594, "global_step": 104712, "epoch": 865} {"train_loss": -38.81025695800781, "global_step": 104713, "epoch": 865} {"train_loss": -38.87314987182617, "global_step": 104714, "epoch": 865} {"train_loss": -37.53891372680664, "global_step": 104715, "epoch": 865} {"train_loss": -38.45945358276367, "global_step": 104716, "epoch": 865} {"train_loss": -38.7667236328125, "global_step": 104717, "epoch": 865} {"train_loss": -39.151832580566406, "global_step": 104718, "epoch": 865} {"train_loss": -38.38977813720703, "global_step": 104719, "epoch": 865} {"train_loss": -38.2511100769043, "global_step": 104720, "epoch": 865} {"train_loss": -38.45957565307617, "global_step": 104721, "epoch": 865} {"train_loss": -38.551414489746094, "global_step": 104722, "epoch": 865} {"train_loss": -37.14716720581055, "global_step": 104723, "epoch": 865} {"train_loss": -39.08631896972656, "global_step": 104724, "epoch": 865} {"train_loss": -38.397857666015625, "global_step": 104725, "epoch": 865} {"train_loss": -38.48516845703125, "global_step": 104726, "epoch": 865} {"train_loss": -37.657711029052734, "global_step": 104727, "epoch": 865} {"train_loss": -37.103458404541016, "global_step": 104728, "epoch": 865} {"train_loss": -39.48041915893555, "global_step": 104729, "epoch": 865} {"train_loss": -37.498008728027344, "global_step": 104730, "epoch": 865} {"train_loss": -37.88433837890625, "global_step": 104731, "epoch": 865} {"train_loss": -37.960140228271484, "global_step": 104732, "epoch": 865} {"train_loss": -37.69295883178711, "global_step": 104733, "epoch": 865} {"train_loss": -37.95093536376953, "global_step": 104734, "epoch": 865} {"train_loss": -36.75820541381836, "global_step": 104735, "epoch": 865} {"train_loss": -38.47705841064453, "global_step": 104736, "epoch": 865} {"train_loss": -36.473567962646484, "global_step": 104737, "epoch": 865} {"train_loss": -38.07292556762695, "global_step": 104738, "epoch": 865} {"train_loss": -36.87077713012695, "global_step": 104739, "epoch": 865} {"train_loss": -37.62751388549805, "global_step": 104740, "epoch": 865} {"train_loss": -37.61097717285156, "global_step": 104741, "epoch": 865} {"train_loss": -36.52020263671875, "global_step": 104742, "epoch": 865} {"train_loss": -37.817962646484375, "global_step": 104743, "epoch": 865} {"train_loss": -36.33185577392578, "global_step": 104744, "epoch": 865} {"train_loss": -36.55680465698242, "global_step": 104745, "epoch": 865} {"train_loss": -37.259212493896484, "global_step": 104746, "epoch": 865} {"train_loss": -37.394134521484375, "global_step": 104747, "epoch": 865} {"train_loss": -36.11568069458008, "global_step": 104748, "epoch": 865} {"train_loss": -38.52600860595703, "global_step": 104749, "epoch": 865} {"train_loss": -35.451263427734375, "global_step": 104750, "epoch": 865} {"train_loss": -37.444801330566406, "global_step": 104751, "epoch": 865} {"train_loss": -37.10676193237305, "global_step": 104752, "epoch": 865} {"train_loss": -35.96533203125, "global_step": 104753, "epoch": 865} {"train_loss": -37.642852783203125, "global_step": 104754, "epoch": 865} {"train_loss": -36.7566032409668, "global_step": 104755, "epoch": 865} {"train_loss": -35.72956466674805, "global_step": 104756, "epoch": 865} {"train_loss": -37.0179443359375, "global_step": 104757, "epoch": 865} {"train_loss": -36.649715423583984, "global_step": 104758, "epoch": 865} {"train_loss": -37.870086669921875, "global_step": 104759, "epoch": 865} {"train_loss": -37.76078414916992, "global_step": 104760, "epoch": 865} {"train_loss": -38.676239013671875, "global_step": 104761, "epoch": 865} {"train_loss": -38.118186950683594, "global_step": 104762, "epoch": 865} {"train_loss": -38.18218994140625, "global_step": 104763, "epoch": 865} {"train_loss": -38.62795639038086, "global_step": 104764, "epoch": 865} {"train_loss": -36.6031379699707, "global_step": 104765, "epoch": 865} {"train_loss": -35.15181350708008, "global_step": 104766, "epoch": 865} {"train_loss": -35.638118743896484, "global_step": 104767, "epoch": 865} {"train_loss": -38.598079681396484, "global_step": 104768, "epoch": 865} {"train_loss": -37.53471755981445, "global_step": 104769, "epoch": 865} {"train_loss": -36.73696517944336, "global_step": 104770, "epoch": 865} {"train_loss": -34.432342529296875, "global_step": 104771, "epoch": 865} {"train_loss": -36.75511169433594, "global_step": 104772, "epoch": 865} {"train_loss": -38.19477462768555, "global_step": 104773, "epoch": 865} {"train_loss": -36.123756408691406, "global_step": 104774, "epoch": 865} {"train_loss": -37.545284271240234, "global_step": 104775, "epoch": 865} {"train_loss": -38.287689208984375, "global_step": 104776, "epoch": 865} {"train_loss": -36.47636795043945, "global_step": 104777, "epoch": 865} {"train_loss": -35.7275505065918, "global_step": 104778, "epoch": 865} {"train_loss": -37.29366683959961, "global_step": 104779, "epoch": 865} {"train_loss": -34.61831283569336, "global_step": 104780, "epoch": 865} {"train_loss": -36.21294403076172, "global_step": 104781, "epoch": 865} {"train_loss": -37.0892448425293, "global_step": 104782, "epoch": 865} {"train_loss": -38.331268310546875, "global_step": 104783, "epoch": 865} {"train_loss": -37.89272689819336, "global_step": 104784, "epoch": 865} {"train_loss": -37.892683265622985, "global_step": 104785, "epoch": 865, "val_loss": 2760147.75} {"train_loss": -36.998565673828125, "global_step": 104786, "epoch": 866} {"train_loss": -36.98954391479492, "global_step": 104787, "epoch": 866} {"train_loss": -36.84980392456055, "global_step": 104788, "epoch": 866} {"train_loss": -38.4464225769043, "global_step": 104789, "epoch": 866} {"train_loss": -37.62752914428711, "global_step": 104790, "epoch": 866} {"train_loss": -38.03452682495117, "global_step": 104791, "epoch": 866} {"train_loss": -37.749549865722656, "global_step": 104792, "epoch": 866} {"train_loss": -37.41242599487305, "global_step": 104793, "epoch": 866} {"train_loss": -36.80750274658203, "global_step": 104794, "epoch": 866} {"train_loss": -38.32866287231445, "global_step": 104795, "epoch": 866} {"train_loss": -38.012107849121094, "global_step": 104796, "epoch": 866} {"train_loss": -37.85686111450195, "global_step": 104797, "epoch": 866} {"train_loss": -38.12736129760742, "global_step": 104798, "epoch": 866} {"train_loss": -37.94366455078125, "global_step": 104799, "epoch": 866} {"train_loss": -36.3182258605957, "global_step": 104800, "epoch": 866} {"train_loss": -38.65015411376953, "global_step": 104801, "epoch": 866} {"train_loss": -38.49273681640625, "global_step": 104802, "epoch": 866} {"train_loss": -36.78622817993164, "global_step": 104803, "epoch": 866} {"train_loss": -36.88529586791992, "global_step": 104804, "epoch": 866} {"train_loss": -36.356468200683594, "global_step": 104805, "epoch": 866} {"train_loss": -36.45203399658203, "global_step": 104806, "epoch": 866} {"train_loss": -36.994625091552734, "global_step": 104807, "epoch": 866} {"train_loss": -37.97443389892578, "global_step": 104808, "epoch": 866} {"train_loss": -37.19536209106445, "global_step": 104809, "epoch": 866} {"train_loss": -37.881282806396484, "global_step": 104810, "epoch": 866} {"train_loss": -34.7416877746582, "global_step": 104811, "epoch": 866} {"train_loss": -37.1241455078125, "global_step": 104812, "epoch": 866} {"train_loss": -37.65438461303711, "global_step": 104813, "epoch": 866} {"train_loss": -38.14512252807617, "global_step": 104814, "epoch": 866} {"train_loss": -37.33180618286133, "global_step": 104815, "epoch": 866} {"train_loss": -36.66189193725586, "global_step": 104816, "epoch": 866} {"train_loss": -37.193763732910156, "global_step": 104817, "epoch": 866} {"train_loss": -37.725215911865234, "global_step": 104818, "epoch": 866} {"train_loss": -38.71169662475586, "global_step": 104819, "epoch": 866} {"train_loss": -37.75077438354492, "global_step": 104820, "epoch": 866} {"train_loss": -37.05778121948242, "global_step": 104821, "epoch": 866} {"train_loss": -37.837039947509766, "global_step": 104822, "epoch": 866} {"train_loss": -37.89865493774414, "global_step": 104823, "epoch": 866} {"train_loss": -36.446964263916016, "global_step": 104824, "epoch": 866} {"train_loss": -37.95991897583008, "global_step": 104825, "epoch": 866} {"train_loss": -37.88727569580078, "global_step": 104826, "epoch": 866} {"train_loss": -35.99729537963867, "global_step": 104827, "epoch": 866} {"train_loss": -37.268096923828125, "global_step": 104828, "epoch": 866} {"train_loss": -37.42605209350586, "global_step": 104829, "epoch": 866} {"train_loss": -38.27717208862305, "global_step": 104830, "epoch": 866} {"train_loss": -38.100196838378906, "global_step": 104831, "epoch": 866} {"train_loss": -37.20909881591797, "global_step": 104832, "epoch": 866} {"train_loss": -38.25074005126953, "global_step": 104833, "epoch": 866} {"train_loss": -38.562835693359375, "global_step": 104834, "epoch": 866} {"train_loss": -37.530460357666016, "global_step": 104835, "epoch": 866} {"train_loss": -37.21367263793945, "global_step": 104836, "epoch": 866} {"train_loss": -35.57738494873047, "global_step": 104837, "epoch": 866} {"train_loss": -37.59675216674805, "global_step": 104838, "epoch": 866} {"train_loss": -38.490821838378906, "global_step": 104839, "epoch": 866} {"train_loss": -37.9770622253418, "global_step": 104840, "epoch": 866} {"train_loss": -36.97743606567383, "global_step": 104841, "epoch": 866} {"train_loss": -36.710609436035156, "global_step": 104842, "epoch": 866} {"train_loss": -37.614013671875, "global_step": 104843, "epoch": 866} {"train_loss": -38.198246002197266, "global_step": 104844, "epoch": 866} {"train_loss": -38.54146194458008, "global_step": 104845, "epoch": 866} {"train_loss": -38.692848205566406, "global_step": 104846, "epoch": 866} {"train_loss": -37.53990936279297, "global_step": 104847, "epoch": 866} {"train_loss": -38.068172454833984, "global_step": 104848, "epoch": 866} {"train_loss": -39.127967834472656, "global_step": 104849, "epoch": 866} {"train_loss": -38.812435150146484, "global_step": 104850, "epoch": 866} {"train_loss": -38.16291427612305, "global_step": 104851, "epoch": 866} {"train_loss": -38.624000549316406, "global_step": 104852, "epoch": 866} {"train_loss": -38.2520637512207, "global_step": 104853, "epoch": 866} {"train_loss": -38.91819381713867, "global_step": 104854, "epoch": 866} {"train_loss": -38.958290100097656, "global_step": 104855, "epoch": 866} {"train_loss": -38.44381332397461, "global_step": 104856, "epoch": 866} {"train_loss": -38.09006881713867, "global_step": 104857, "epoch": 866} {"train_loss": -38.85423278808594, "global_step": 104858, "epoch": 866} {"train_loss": -38.75166320800781, "global_step": 104859, "epoch": 866} {"train_loss": -39.04018783569336, "global_step": 104860, "epoch": 866} {"train_loss": -39.0531120300293, "global_step": 104861, "epoch": 866} {"train_loss": -38.564674377441406, "global_step": 104862, "epoch": 866} {"train_loss": -37.443111419677734, "global_step": 104863, "epoch": 866} {"train_loss": -36.763404846191406, "global_step": 104864, "epoch": 866} {"train_loss": -37.57937240600586, "global_step": 104865, "epoch": 866} {"train_loss": -38.34867477416992, "global_step": 104866, "epoch": 866} {"train_loss": -39.183658599853516, "global_step": 104867, "epoch": 866} {"train_loss": -38.177310943603516, "global_step": 104868, "epoch": 866} {"train_loss": -37.824886322021484, "global_step": 104869, "epoch": 866} {"train_loss": -37.90873336791992, "global_step": 104870, "epoch": 866} {"train_loss": -38.27798843383789, "global_step": 104871, "epoch": 866} {"train_loss": -38.992218017578125, "global_step": 104872, "epoch": 866} {"train_loss": -37.96907043457031, "global_step": 104873, "epoch": 866} {"train_loss": -37.66530990600586, "global_step": 104874, "epoch": 866} {"train_loss": -35.42654037475586, "global_step": 104875, "epoch": 866} {"train_loss": -37.88529586791992, "global_step": 104876, "epoch": 866} {"train_loss": -39.18083572387695, "global_step": 104877, "epoch": 866} {"train_loss": -38.34309005737305, "global_step": 104878, "epoch": 866} {"train_loss": -38.1597900390625, "global_step": 104879, "epoch": 866} {"train_loss": -39.06396484375, "global_step": 104880, "epoch": 866} {"train_loss": -38.66911697387695, "global_step": 104881, "epoch": 866} {"train_loss": -38.997215270996094, "global_step": 104882, "epoch": 866} {"train_loss": -39.19082260131836, "global_step": 104883, "epoch": 866} {"train_loss": -38.6132698059082, "global_step": 104884, "epoch": 866} {"train_loss": -38.42598342895508, "global_step": 104885, "epoch": 866} {"train_loss": -39.026912689208984, "global_step": 104886, "epoch": 866} {"train_loss": -38.93819808959961, "global_step": 104887, "epoch": 866} {"train_loss": -38.554134368896484, "global_step": 104888, "epoch": 866} {"train_loss": -39.63357925415039, "global_step": 104889, "epoch": 866} {"train_loss": -38.294803619384766, "global_step": 104890, "epoch": 866} {"train_loss": -38.7426872253418, "global_step": 104891, "epoch": 866} {"train_loss": -38.717281341552734, "global_step": 104892, "epoch": 866} {"train_loss": -39.269100189208984, "global_step": 104893, "epoch": 866} {"train_loss": -38.488765716552734, "global_step": 104894, "epoch": 866} {"train_loss": -36.899539947509766, "global_step": 104895, "epoch": 866} {"train_loss": -32.45398712158203, "global_step": 104896, "epoch": 866} {"train_loss": -28.118749618530273, "global_step": 104897, "epoch": 866} {"train_loss": -30.771854400634766, "global_step": 104898, "epoch": 866} {"train_loss": -37.569149017333984, "global_step": 104899, "epoch": 866} {"train_loss": -36.47373580932617, "global_step": 104900, "epoch": 866} {"train_loss": -34.196861267089844, "global_step": 104901, "epoch": 866} {"train_loss": -36.931758880615234, "global_step": 104902, "epoch": 866} {"train_loss": -35.383670806884766, "global_step": 104903, "epoch": 866} {"train_loss": -36.86970138549805, "global_step": 104904, "epoch": 866} {"train_loss": -37.375404357910156, "global_step": 104905, "epoch": 866} {"train_loss": -37.61793856975461, "global_step": 104906, "epoch": 866, "val_loss": 2696759.25} {"train_loss": -37.13961410522461, "global_step": 104907, "epoch": 867} {"train_loss": -37.33183288574219, "global_step": 104908, "epoch": 867} {"train_loss": -37.54521179199219, "global_step": 104909, "epoch": 867} {"train_loss": -37.7873649597168, "global_step": 104910, "epoch": 867} {"train_loss": -37.87578201293945, "global_step": 104911, "epoch": 867} {"train_loss": -37.503395080566406, "global_step": 104912, "epoch": 867} {"train_loss": -38.00981521606445, "global_step": 104913, "epoch": 867} {"train_loss": -38.2752799987793, "global_step": 104914, "epoch": 867} {"train_loss": -37.78772735595703, "global_step": 104915, "epoch": 867} {"train_loss": -38.9139518737793, "global_step": 104916, "epoch": 867} {"train_loss": -37.97445297241211, "global_step": 104917, "epoch": 867} {"train_loss": -38.42746353149414, "global_step": 104918, "epoch": 867} {"train_loss": -38.171348571777344, "global_step": 104919, "epoch": 867} {"train_loss": -38.96873092651367, "global_step": 104920, "epoch": 867} {"train_loss": -38.57160568237305, "global_step": 104921, "epoch": 867} {"train_loss": -38.16440963745117, "global_step": 104922, "epoch": 867} {"train_loss": -38.570899963378906, "global_step": 104923, "epoch": 867} {"train_loss": -38.73317337036133, "global_step": 104924, "epoch": 867} {"train_loss": -38.34283447265625, "global_step": 104925, "epoch": 867} {"train_loss": -38.72358703613281, "global_step": 104926, "epoch": 867} {"train_loss": -38.721900939941406, "global_step": 104927, "epoch": 867} {"train_loss": -36.639923095703125, "global_step": 104928, "epoch": 867} {"train_loss": -37.679012298583984, "global_step": 104929, "epoch": 867} {"train_loss": -38.955928802490234, "global_step": 104930, "epoch": 867} {"train_loss": -38.23588943481445, "global_step": 104931, "epoch": 867} {"train_loss": -38.99675369262695, "global_step": 104932, "epoch": 867} {"train_loss": -37.577049255371094, "global_step": 104933, "epoch": 867} {"train_loss": -39.23012924194336, "global_step": 104934, "epoch": 867} {"train_loss": -38.3511962890625, "global_step": 104935, "epoch": 867} {"train_loss": -39.053768157958984, "global_step": 104936, "epoch": 867} {"train_loss": -39.02032470703125, "global_step": 104937, "epoch": 867} {"train_loss": -38.85009002685547, "global_step": 104938, "epoch": 867} {"train_loss": -39.253822326660156, "global_step": 104939, "epoch": 867} {"train_loss": -39.419349670410156, "global_step": 104940, "epoch": 867} {"train_loss": -38.07904052734375, "global_step": 104941, "epoch": 867} {"train_loss": -38.315406799316406, "global_step": 104942, "epoch": 867} {"train_loss": -39.446083068847656, "global_step": 104943, "epoch": 867} {"train_loss": -38.22865295410156, "global_step": 104944, "epoch": 867} {"train_loss": -39.15821838378906, "global_step": 104945, "epoch": 867} {"train_loss": -39.144866943359375, "global_step": 104946, "epoch": 867} {"train_loss": -38.46445846557617, "global_step": 104947, "epoch": 867} {"train_loss": -38.58378601074219, "global_step": 104948, "epoch": 867} {"train_loss": -39.02187728881836, "global_step": 104949, "epoch": 867} {"train_loss": -39.34687042236328, "global_step": 104950, "epoch": 867} {"train_loss": -38.99911117553711, "global_step": 104951, "epoch": 867} {"train_loss": -39.065521240234375, "global_step": 104952, "epoch": 867} {"train_loss": -39.160518646240234, "global_step": 104953, "epoch": 867} {"train_loss": -39.47634506225586, "global_step": 104954, "epoch": 867} {"train_loss": -39.07326889038086, "global_step": 104955, "epoch": 867} {"train_loss": -38.71078109741211, "global_step": 104956, "epoch": 867} {"train_loss": -38.89008331298828, "global_step": 104957, "epoch": 867} {"train_loss": -38.49214553833008, "global_step": 104958, "epoch": 867} {"train_loss": -38.430458068847656, "global_step": 104959, "epoch": 867} {"train_loss": -39.3797492980957, "global_step": 104960, "epoch": 867} {"train_loss": -39.195068359375, "global_step": 104961, "epoch": 867} {"train_loss": -38.7311897277832, "global_step": 104962, "epoch": 867} {"train_loss": -38.596771240234375, "global_step": 104963, "epoch": 867} {"train_loss": -38.713069915771484, "global_step": 104964, "epoch": 867} {"train_loss": -39.52529525756836, "global_step": 104965, "epoch": 867} {"train_loss": -38.986846923828125, "global_step": 104966, "epoch": 867} {"train_loss": -38.85968780517578, "global_step": 104967, "epoch": 867} {"train_loss": -39.005558013916016, "global_step": 104968, "epoch": 867} {"train_loss": -39.026153564453125, "global_step": 104969, "epoch": 867} {"train_loss": -37.66582489013672, "global_step": 104970, "epoch": 867} {"train_loss": -39.017799377441406, "global_step": 104971, "epoch": 867} {"train_loss": -39.18841552734375, "global_step": 104972, "epoch": 867} {"train_loss": -37.803646087646484, "global_step": 104973, "epoch": 867} {"train_loss": -38.0072135925293, "global_step": 104974, "epoch": 867} {"train_loss": -39.56657791137695, "global_step": 104975, "epoch": 867} {"train_loss": -37.8504524230957, "global_step": 104976, "epoch": 867} {"train_loss": -38.058876037597656, "global_step": 104977, "epoch": 867} {"train_loss": -39.1355094909668, "global_step": 104978, "epoch": 867} {"train_loss": -37.74765396118164, "global_step": 104979, "epoch": 867} {"train_loss": -38.58848190307617, "global_step": 104980, "epoch": 867} {"train_loss": -36.98261642456055, "global_step": 104981, "epoch": 867} {"train_loss": -36.79317855834961, "global_step": 104982, "epoch": 867} {"train_loss": -37.97224426269531, "global_step": 104983, "epoch": 867} {"train_loss": -37.59016418457031, "global_step": 104984, "epoch": 867} {"train_loss": -36.39567184448242, "global_step": 104985, "epoch": 867} {"train_loss": -38.555965423583984, "global_step": 104986, "epoch": 867} {"train_loss": -38.05972671508789, "global_step": 104987, "epoch": 867} {"train_loss": -38.10789108276367, "global_step": 104988, "epoch": 867} {"train_loss": -37.61731719970703, "global_step": 104989, "epoch": 867} {"train_loss": -35.41716384887695, "global_step": 104990, "epoch": 867} {"train_loss": -37.84272003173828, "global_step": 104991, "epoch": 867} {"train_loss": -38.647682189941406, "global_step": 104992, "epoch": 867} {"train_loss": -38.095314025878906, "global_step": 104993, "epoch": 867} {"train_loss": -39.11600875854492, "global_step": 104994, "epoch": 867} {"train_loss": -38.70098876953125, "global_step": 104995, "epoch": 867} {"train_loss": -36.327850341796875, "global_step": 104996, "epoch": 867} {"train_loss": -37.85172653198242, "global_step": 104997, "epoch": 867} {"train_loss": -33.84077072143555, "global_step": 104998, "epoch": 867} {"train_loss": -38.179256439208984, "global_step": 104999, "epoch": 867} {"train_loss": -37.08171463012695, "global_step": 105000, "epoch": 867} {"train_loss": -37.235382080078125, "global_step": 105001, "epoch": 867} {"train_loss": -38.72694778442383, "global_step": 105002, "epoch": 867} {"train_loss": -37.48356246948242, "global_step": 105003, "epoch": 867} {"train_loss": -38.113807678222656, "global_step": 105004, "epoch": 867} {"train_loss": -38.09432601928711, "global_step": 105005, "epoch": 867} {"train_loss": -38.26112747192383, "global_step": 105006, "epoch": 867} {"train_loss": -38.86735916137695, "global_step": 105007, "epoch": 867} {"train_loss": -37.989601135253906, "global_step": 105008, "epoch": 867} {"train_loss": -38.865501403808594, "global_step": 105009, "epoch": 867} {"train_loss": -37.35044860839844, "global_step": 105010, "epoch": 867} {"train_loss": -36.80282211303711, "global_step": 105011, "epoch": 867} {"train_loss": -38.294708251953125, "global_step": 105012, "epoch": 867} {"train_loss": -36.484981536865234, "global_step": 105013, "epoch": 867} {"train_loss": -37.059749603271484, "global_step": 105014, "epoch": 867} {"train_loss": -36.1199951171875, "global_step": 105015, "epoch": 867} {"train_loss": -37.175628662109375, "global_step": 105016, "epoch": 867} {"train_loss": -37.11605453491211, "global_step": 105017, "epoch": 867} {"train_loss": -36.8822135925293, "global_step": 105018, "epoch": 867} {"train_loss": -33.297664642333984, "global_step": 105019, "epoch": 867} {"train_loss": -33.99982833862305, "global_step": 105020, "epoch": 867} {"train_loss": -37.558773040771484, "global_step": 105021, "epoch": 867} {"train_loss": -37.29085159301758, "global_step": 105022, "epoch": 867} {"train_loss": -34.80422592163086, "global_step": 105023, "epoch": 867} {"train_loss": -34.13676452636719, "global_step": 105024, "epoch": 867} {"train_loss": -37.87168502807617, "global_step": 105025, "epoch": 867} {"train_loss": -36.733516693115234, "global_step": 105026, "epoch": 867} {"train_loss": -38.01534781968298, "global_step": 105027, "epoch": 867, "val_loss": 2660339.5} {"train_loss": -33.31315231323242, "global_step": 105028, "epoch": 868} {"train_loss": -35.18917465209961, "global_step": 105029, "epoch": 868} {"train_loss": -31.067411422729492, "global_step": 105030, "epoch": 868} {"train_loss": -36.33018112182617, "global_step": 105031, "epoch": 868} {"train_loss": -33.91209030151367, "global_step": 105032, "epoch": 868} {"train_loss": -27.097402572631836, "global_step": 105033, "epoch": 868} {"train_loss": -36.69282150268555, "global_step": 105034, "epoch": 868} {"train_loss": -36.18162155151367, "global_step": 105035, "epoch": 868} {"train_loss": -34.59719467163086, "global_step": 105036, "epoch": 868} {"train_loss": -35.191463470458984, "global_step": 105037, "epoch": 868} {"train_loss": -37.089996337890625, "global_step": 105038, "epoch": 868} {"train_loss": -36.77341842651367, "global_step": 105039, "epoch": 868} {"train_loss": -35.95523452758789, "global_step": 105040, "epoch": 868} {"train_loss": -36.2932243347168, "global_step": 105041, "epoch": 868} {"train_loss": -35.70463180541992, "global_step": 105042, "epoch": 868} {"train_loss": -36.169132232666016, "global_step": 105043, "epoch": 868} {"train_loss": -34.55253219604492, "global_step": 105044, "epoch": 868} {"train_loss": -37.61592483520508, "global_step": 105045, "epoch": 868} {"train_loss": -37.62351989746094, "global_step": 105046, "epoch": 868} {"train_loss": -37.01694869995117, "global_step": 105047, "epoch": 868} {"train_loss": -37.27954864501953, "global_step": 105048, "epoch": 868} {"train_loss": -36.59804153442383, "global_step": 105049, "epoch": 868} {"train_loss": -37.0095329284668, "global_step": 105050, "epoch": 868} {"train_loss": -36.73661422729492, "global_step": 105051, "epoch": 868} {"train_loss": -37.8278923034668, "global_step": 105052, "epoch": 868} {"train_loss": -36.74514389038086, "global_step": 105053, "epoch": 868} {"train_loss": -35.90571212768555, "global_step": 105054, "epoch": 868} {"train_loss": -37.00970458984375, "global_step": 105055, "epoch": 868} {"train_loss": -37.48961639404297, "global_step": 105056, "epoch": 868} {"train_loss": -37.33683776855469, "global_step": 105057, "epoch": 868} {"train_loss": -36.31666946411133, "global_step": 105058, "epoch": 868} {"train_loss": -36.96085739135742, "global_step": 105059, "epoch": 868} {"train_loss": -37.799102783203125, "global_step": 105060, "epoch": 868} {"train_loss": -36.45057678222656, "global_step": 105061, "epoch": 868} {"train_loss": -38.37982940673828, "global_step": 105062, "epoch": 868} {"train_loss": -36.91775131225586, "global_step": 105063, "epoch": 868} {"train_loss": -37.713008880615234, "global_step": 105064, "epoch": 868} {"train_loss": -37.44491195678711, "global_step": 105065, "epoch": 868} {"train_loss": -37.59530258178711, "global_step": 105066, "epoch": 868} {"train_loss": -38.11287307739258, "global_step": 105067, "epoch": 868} {"train_loss": -37.9277229309082, "global_step": 105068, "epoch": 868} {"train_loss": -37.54932403564453, "global_step": 105069, "epoch": 868} {"train_loss": -38.16400909423828, "global_step": 105070, "epoch": 868} {"train_loss": -37.83604049682617, "global_step": 105071, "epoch": 868} {"train_loss": -38.24807357788086, "global_step": 105072, "epoch": 868} {"train_loss": -37.38838577270508, "global_step": 105073, "epoch": 868} {"train_loss": -38.24079132080078, "global_step": 105074, "epoch": 868} {"train_loss": -38.1730842590332, "global_step": 105075, "epoch": 868} {"train_loss": -38.04832077026367, "global_step": 105076, "epoch": 868} {"train_loss": -38.2645378112793, "global_step": 105077, "epoch": 868} {"train_loss": -38.335323333740234, "global_step": 105078, "epoch": 868} {"train_loss": -38.57454299926758, "global_step": 105079, "epoch": 868} {"train_loss": -38.86604690551758, "global_step": 105080, "epoch": 868} {"train_loss": -38.150508880615234, "global_step": 105081, "epoch": 868} {"train_loss": -38.422264099121094, "global_step": 105082, "epoch": 868} {"train_loss": -38.73001480102539, "global_step": 105083, "epoch": 868} {"train_loss": -39.02815628051758, "global_step": 105084, "epoch": 868} {"train_loss": -38.5633659362793, "global_step": 105085, "epoch": 868} {"train_loss": -38.83244705200195, "global_step": 105086, "epoch": 868} {"train_loss": -39.2318115234375, "global_step": 105087, "epoch": 868} {"train_loss": -38.78333282470703, "global_step": 105088, "epoch": 868} {"train_loss": -39.30863571166992, "global_step": 105089, "epoch": 868} {"train_loss": -39.32918167114258, "global_step": 105090, "epoch": 868} {"train_loss": -39.570133209228516, "global_step": 105091, "epoch": 868} {"train_loss": -39.341304779052734, "global_step": 105092, "epoch": 868} {"train_loss": -39.045387268066406, "global_step": 105093, "epoch": 868} {"train_loss": -39.593814849853516, "global_step": 105094, "epoch": 868} {"train_loss": -39.193756103515625, "global_step": 105095, "epoch": 868} {"train_loss": -39.31794357299805, "global_step": 105096, "epoch": 868} {"train_loss": -38.36587142944336, "global_step": 105097, "epoch": 868} {"train_loss": -38.78342819213867, "global_step": 105098, "epoch": 868} {"train_loss": -39.3002815246582, "global_step": 105099, "epoch": 868} {"train_loss": -38.46975326538086, "global_step": 105100, "epoch": 868} {"train_loss": -38.16379928588867, "global_step": 105101, "epoch": 868} {"train_loss": -39.0961799621582, "global_step": 105102, "epoch": 868} {"train_loss": -38.64976119995117, "global_step": 105103, "epoch": 868} {"train_loss": -39.578468322753906, "global_step": 105104, "epoch": 868} {"train_loss": -38.552345275878906, "global_step": 105105, "epoch": 868} {"train_loss": -38.777748107910156, "global_step": 105106, "epoch": 868} {"train_loss": -39.22138214111328, "global_step": 105107, "epoch": 868} {"train_loss": -38.25444412231445, "global_step": 105108, "epoch": 868} {"train_loss": -38.972381591796875, "global_step": 105109, "epoch": 868} {"train_loss": -39.21271896362305, "global_step": 105110, "epoch": 868} {"train_loss": -39.302337646484375, "global_step": 105111, "epoch": 868} {"train_loss": -39.00665283203125, "global_step": 105112, "epoch": 868} {"train_loss": -39.066463470458984, "global_step": 105113, "epoch": 868} {"train_loss": -39.05647659301758, "global_step": 105114, "epoch": 868} {"train_loss": -39.432926177978516, "global_step": 105115, "epoch": 868} {"train_loss": -39.12188720703125, "global_step": 105116, "epoch": 868} {"train_loss": -39.884761810302734, "global_step": 105117, "epoch": 868} {"train_loss": -39.156585693359375, "global_step": 105118, "epoch": 868} {"train_loss": -38.84469223022461, "global_step": 105119, "epoch": 868} {"train_loss": -39.06599044799805, "global_step": 105120, "epoch": 868} {"train_loss": -36.9769172668457, "global_step": 105121, "epoch": 868} {"train_loss": -38.655921936035156, "global_step": 105122, "epoch": 868} {"train_loss": -37.84693145751953, "global_step": 105123, "epoch": 868} {"train_loss": -38.422367095947266, "global_step": 105124, "epoch": 868} {"train_loss": -37.39094924926758, "global_step": 105125, "epoch": 868} {"train_loss": -35.322898864746094, "global_step": 105126, "epoch": 868} {"train_loss": -30.398527145385742, "global_step": 105127, "epoch": 868} {"train_loss": -25.28211784362793, "global_step": 105128, "epoch": 868} {"train_loss": -25.680042266845703, "global_step": 105129, "epoch": 868} {"train_loss": -33.202266693115234, "global_step": 105130, "epoch": 868} {"train_loss": -36.152584075927734, "global_step": 105131, "epoch": 868} {"train_loss": -35.00288009643555, "global_step": 105132, "epoch": 868} {"train_loss": -36.869441986083984, "global_step": 105133, "epoch": 868} {"train_loss": -34.511260986328125, "global_step": 105134, "epoch": 868} {"train_loss": -35.34888458251953, "global_step": 105135, "epoch": 868} {"train_loss": -36.89836120605469, "global_step": 105136, "epoch": 868} {"train_loss": -36.862701416015625, "global_step": 105137, "epoch": 868} {"train_loss": -37.659523010253906, "global_step": 105138, "epoch": 868} {"train_loss": -38.3699951171875, "global_step": 105139, "epoch": 868} {"train_loss": -37.71080780029297, "global_step": 105140, "epoch": 868} {"train_loss": -37.80652618408203, "global_step": 105141, "epoch": 868} {"train_loss": -38.2926139831543, "global_step": 105142, "epoch": 868} {"train_loss": -37.69687271118164, "global_step": 105143, "epoch": 868} {"train_loss": -38.85013961791992, "global_step": 105144, "epoch": 868} {"train_loss": -37.999019622802734, "global_step": 105145, "epoch": 868} {"train_loss": -39.12534713745117, "global_step": 105146, "epoch": 868} {"train_loss": -38.32589340209961, "global_step": 105147, "epoch": 868} {"train_loss": -37.316013998236535, "global_step": 105148, "epoch": 868, "val_loss": 2553931.5} {"train_loss": -38.69350814819336, "global_step": 105149, "epoch": 869} {"train_loss": -39.141510009765625, "global_step": 105150, "epoch": 869} {"train_loss": -38.54450225830078, "global_step": 105151, "epoch": 869} {"train_loss": -39.36692428588867, "global_step": 105152, "epoch": 869} {"train_loss": -38.788848876953125, "global_step": 105153, "epoch": 869} {"train_loss": -39.37370681762695, "global_step": 105154, "epoch": 869} {"train_loss": -39.337886810302734, "global_step": 105155, "epoch": 869} {"train_loss": -39.12370681762695, "global_step": 105156, "epoch": 869} {"train_loss": -39.19390106201172, "global_step": 105157, "epoch": 869} {"train_loss": -39.37335205078125, "global_step": 105158, "epoch": 869} {"train_loss": -38.937313079833984, "global_step": 105159, "epoch": 869} {"train_loss": -39.11187744140625, "global_step": 105160, "epoch": 869} {"train_loss": -39.33425521850586, "global_step": 105161, "epoch": 869} {"train_loss": -39.264068603515625, "global_step": 105162, "epoch": 869} {"train_loss": -39.454097747802734, "global_step": 105163, "epoch": 869} {"train_loss": -38.85931396484375, "global_step": 105164, "epoch": 869} {"train_loss": -39.81158447265625, "global_step": 105165, "epoch": 869} {"train_loss": -38.6771354675293, "global_step": 105166, "epoch": 869} {"train_loss": -39.54651641845703, "global_step": 105167, "epoch": 869} {"train_loss": -38.58240509033203, "global_step": 105168, "epoch": 869} {"train_loss": -39.09566879272461, "global_step": 105169, "epoch": 869} {"train_loss": -39.2196159362793, "global_step": 105170, "epoch": 869} {"train_loss": -39.62272644042969, "global_step": 105171, "epoch": 869} {"train_loss": -39.79780197143555, "global_step": 105172, "epoch": 869} {"train_loss": -38.68574142456055, "global_step": 105173, "epoch": 869} {"train_loss": -39.30435562133789, "global_step": 105174, "epoch": 869} {"train_loss": -39.160091400146484, "global_step": 105175, "epoch": 869} {"train_loss": -38.5737419128418, "global_step": 105176, "epoch": 869} {"train_loss": -39.25971603393555, "global_step": 105177, "epoch": 869} {"train_loss": -38.85866165161133, "global_step": 105178, "epoch": 869} {"train_loss": -38.16497802734375, "global_step": 105179, "epoch": 869} {"train_loss": -39.089691162109375, "global_step": 105180, "epoch": 869} {"train_loss": -38.888038635253906, "global_step": 105181, "epoch": 869} {"train_loss": -39.574005126953125, "global_step": 105182, "epoch": 869} {"train_loss": -39.448089599609375, "global_step": 105183, "epoch": 869} {"train_loss": -39.388671875, "global_step": 105184, "epoch": 869} {"train_loss": -38.87614822387695, "global_step": 105185, "epoch": 869} {"train_loss": -38.91587448120117, "global_step": 105186, "epoch": 869} {"train_loss": -38.930355072021484, "global_step": 105187, "epoch": 869} {"train_loss": -38.95248031616211, "global_step": 105188, "epoch": 869} {"train_loss": -39.2008056640625, "global_step": 105189, "epoch": 869} {"train_loss": -38.3535270690918, "global_step": 105190, "epoch": 869} {"train_loss": -37.56692123413086, "global_step": 105191, "epoch": 869} {"train_loss": -38.911651611328125, "global_step": 105192, "epoch": 869} {"train_loss": -38.938514709472656, "global_step": 105193, "epoch": 869} {"train_loss": -37.52690124511719, "global_step": 105194, "epoch": 869} {"train_loss": -36.22697067260742, "global_step": 105195, "epoch": 869} {"train_loss": -35.37596893310547, "global_step": 105196, "epoch": 869} {"train_loss": -36.03803634643555, "global_step": 105197, "epoch": 869} {"train_loss": -34.65265655517578, "global_step": 105198, "epoch": 869} {"train_loss": -35.296173095703125, "global_step": 105199, "epoch": 869} {"train_loss": -34.82860565185547, "global_step": 105200, "epoch": 869} {"train_loss": -37.61054611206055, "global_step": 105201, "epoch": 869} {"train_loss": -39.45547103881836, "global_step": 105202, "epoch": 869} {"train_loss": -38.39912033081055, "global_step": 105203, "epoch": 869} {"train_loss": -36.783470153808594, "global_step": 105204, "epoch": 869} {"train_loss": -38.11423110961914, "global_step": 105205, "epoch": 869} {"train_loss": -37.99921798706055, "global_step": 105206, "epoch": 869} {"train_loss": -38.753501892089844, "global_step": 105207, "epoch": 869} {"train_loss": -36.86223220825195, "global_step": 105208, "epoch": 869} {"train_loss": -37.38275909423828, "global_step": 105209, "epoch": 869} {"train_loss": -38.83301544189453, "global_step": 105210, "epoch": 869} {"train_loss": -36.6678581237793, "global_step": 105211, "epoch": 869} {"train_loss": -37.55709457397461, "global_step": 105212, "epoch": 869} {"train_loss": -38.513450622558594, "global_step": 105213, "epoch": 869} {"train_loss": -37.96598434448242, "global_step": 105214, "epoch": 869} {"train_loss": -38.400962829589844, "global_step": 105215, "epoch": 869} {"train_loss": -36.80951690673828, "global_step": 105216, "epoch": 869} {"train_loss": -38.7007942199707, "global_step": 105217, "epoch": 869} {"train_loss": -37.48421859741211, "global_step": 105218, "epoch": 869} {"train_loss": -39.226863861083984, "global_step": 105219, "epoch": 869} {"train_loss": -37.544925689697266, "global_step": 105220, "epoch": 869} {"train_loss": -38.8690299987793, "global_step": 105221, "epoch": 869} {"train_loss": -38.0327033996582, "global_step": 105222, "epoch": 869} {"train_loss": -38.38428497314453, "global_step": 105223, "epoch": 869} {"train_loss": -38.58772659301758, "global_step": 105224, "epoch": 869} {"train_loss": -38.74085235595703, "global_step": 105225, "epoch": 869} {"train_loss": -38.66181564331055, "global_step": 105226, "epoch": 869} {"train_loss": -38.98499298095703, "global_step": 105227, "epoch": 869} {"train_loss": -38.67766189575195, "global_step": 105228, "epoch": 869} {"train_loss": -38.909358978271484, "global_step": 105229, "epoch": 869} {"train_loss": -38.48896408081055, "global_step": 105230, "epoch": 869} {"train_loss": -38.355037689208984, "global_step": 105231, "epoch": 869} {"train_loss": -38.42531204223633, "global_step": 105232, "epoch": 869} {"train_loss": -39.011322021484375, "global_step": 105233, "epoch": 869} {"train_loss": -39.103084564208984, "global_step": 105234, "epoch": 869} {"train_loss": -38.48419189453125, "global_step": 105235, "epoch": 869} {"train_loss": -39.22437286376953, "global_step": 105236, "epoch": 869} {"train_loss": -38.98024368286133, "global_step": 105237, "epoch": 869} {"train_loss": -38.539634704589844, "global_step": 105238, "epoch": 869} {"train_loss": -39.0013542175293, "global_step": 105239, "epoch": 869} {"train_loss": -38.79578399658203, "global_step": 105240, "epoch": 869} {"train_loss": -38.99519729614258, "global_step": 105241, "epoch": 869} {"train_loss": -38.62200164794922, "global_step": 105242, "epoch": 869} {"train_loss": -38.628448486328125, "global_step": 105243, "epoch": 869} {"train_loss": -38.6292610168457, "global_step": 105244, "epoch": 869} {"train_loss": -37.2103157043457, "global_step": 105245, "epoch": 869} {"train_loss": -37.50638961791992, "global_step": 105246, "epoch": 869} {"train_loss": -37.72166061401367, "global_step": 105247, "epoch": 869} {"train_loss": -39.12763214111328, "global_step": 105248, "epoch": 869} {"train_loss": -36.3418083190918, "global_step": 105249, "epoch": 869} {"train_loss": -35.774776458740234, "global_step": 105250, "epoch": 869} {"train_loss": -38.222679138183594, "global_step": 105251, "epoch": 869} {"train_loss": -34.034141540527344, "global_step": 105252, "epoch": 869} {"train_loss": -31.318449020385742, "global_step": 105253, "epoch": 869} {"train_loss": -38.314064025878906, "global_step": 105254, "epoch": 869} {"train_loss": -33.95916748046875, "global_step": 105255, "epoch": 869} {"train_loss": -37.21441650390625, "global_step": 105256, "epoch": 869} {"train_loss": -37.304813385009766, "global_step": 105257, "epoch": 869} {"train_loss": -35.82950210571289, "global_step": 105258, "epoch": 869} {"train_loss": -38.24513626098633, "global_step": 105259, "epoch": 869} {"train_loss": -36.0609130859375, "global_step": 105260, "epoch": 869} {"train_loss": -36.78947067260742, "global_step": 105261, "epoch": 869} {"train_loss": -37.04789352416992, "global_step": 105262, "epoch": 869} {"train_loss": -38.028011322021484, "global_step": 105263, "epoch": 869} {"train_loss": -36.8397331237793, "global_step": 105264, "epoch": 869} {"train_loss": -38.44514083862305, "global_step": 105265, "epoch": 869} {"train_loss": -37.45293045043945, "global_step": 105266, "epoch": 869} {"train_loss": -38.91775894165039, "global_step": 105267, "epoch": 869} {"train_loss": -38.210121154785156, "global_step": 105268, "epoch": 869} {"train_loss": -38.185509342792606, "global_step": 105269, "epoch": 869, "val_loss": 2659637.75} {"train_loss": -38.34723663330078, "global_step": 105270, "epoch": 870} {"train_loss": -38.220916748046875, "global_step": 105271, "epoch": 870} {"train_loss": -38.246944427490234, "global_step": 105272, "epoch": 870} {"train_loss": -38.477027893066406, "global_step": 105273, "epoch": 870} {"train_loss": -38.65205001831055, "global_step": 105274, "epoch": 870} {"train_loss": -38.96522903442383, "global_step": 105275, "epoch": 870} {"train_loss": -39.10372543334961, "global_step": 105276, "epoch": 870} {"train_loss": -39.13624954223633, "global_step": 105277, "epoch": 870} {"train_loss": -38.87095260620117, "global_step": 105278, "epoch": 870} {"train_loss": -38.85755157470703, "global_step": 105279, "epoch": 870} {"train_loss": -38.86007308959961, "global_step": 105280, "epoch": 870} {"train_loss": -39.23889923095703, "global_step": 105281, "epoch": 870} {"train_loss": -39.141456604003906, "global_step": 105282, "epoch": 870} {"train_loss": -38.768062591552734, "global_step": 105283, "epoch": 870} {"train_loss": -39.29810333251953, "global_step": 105284, "epoch": 870} {"train_loss": -39.243526458740234, "global_step": 105285, "epoch": 870} {"train_loss": -38.542518615722656, "global_step": 105286, "epoch": 870} {"train_loss": -39.398128509521484, "global_step": 105287, "epoch": 870} {"train_loss": -39.16361999511719, "global_step": 105288, "epoch": 870} {"train_loss": -39.0892448425293, "global_step": 105289, "epoch": 870} {"train_loss": -38.63648986816406, "global_step": 105290, "epoch": 870} {"train_loss": -39.43160629272461, "global_step": 105291, "epoch": 870} {"train_loss": -38.983917236328125, "global_step": 105292, "epoch": 870} {"train_loss": -39.70014953613281, "global_step": 105293, "epoch": 870} {"train_loss": -39.79567337036133, "global_step": 105294, "epoch": 870} {"train_loss": -39.22028732299805, "global_step": 105295, "epoch": 870} {"train_loss": -39.45467758178711, "global_step": 105296, "epoch": 870} {"train_loss": -38.683135986328125, "global_step": 105297, "epoch": 870} {"train_loss": -39.06747817993164, "global_step": 105298, "epoch": 870} {"train_loss": -40.0871696472168, "global_step": 105299, "epoch": 870} {"train_loss": -39.07601547241211, "global_step": 105300, "epoch": 870} {"train_loss": -38.459495544433594, "global_step": 105301, "epoch": 870} {"train_loss": -38.245460510253906, "global_step": 105302, "epoch": 870} {"train_loss": -38.7747688293457, "global_step": 105303, "epoch": 870} {"train_loss": -39.6526985168457, "global_step": 105304, "epoch": 870} {"train_loss": -39.65497970581055, "global_step": 105305, "epoch": 870} {"train_loss": -38.457523345947266, "global_step": 105306, "epoch": 870} {"train_loss": -38.81519317626953, "global_step": 105307, "epoch": 870} {"train_loss": -38.90086364746094, "global_step": 105308, "epoch": 870} {"train_loss": -39.13785934448242, "global_step": 105309, "epoch": 870} {"train_loss": -37.214942932128906, "global_step": 105310, "epoch": 870} {"train_loss": -38.72454833984375, "global_step": 105311, "epoch": 870} {"train_loss": -39.820716857910156, "global_step": 105312, "epoch": 870} {"train_loss": -39.808902740478516, "global_step": 105313, "epoch": 870} {"train_loss": -39.10392379760742, "global_step": 105314, "epoch": 870} {"train_loss": -39.421913146972656, "global_step": 105315, "epoch": 870} {"train_loss": -38.82805633544922, "global_step": 105316, "epoch": 870} {"train_loss": -39.73997497558594, "global_step": 105317, "epoch": 870} {"train_loss": -39.97433090209961, "global_step": 105318, "epoch": 870} {"train_loss": -39.49595260620117, "global_step": 105319, "epoch": 870} {"train_loss": -39.65864181518555, "global_step": 105320, "epoch": 870} {"train_loss": -39.76152801513672, "global_step": 105321, "epoch": 870} {"train_loss": -39.450836181640625, "global_step": 105322, "epoch": 870} {"train_loss": -38.637229919433594, "global_step": 105323, "epoch": 870} {"train_loss": -37.05815887451172, "global_step": 105324, "epoch": 870} {"train_loss": -36.47795486450195, "global_step": 105325, "epoch": 870} {"train_loss": -34.157737731933594, "global_step": 105326, "epoch": 870} {"train_loss": -38.338504791259766, "global_step": 105327, "epoch": 870} {"train_loss": -34.864845275878906, "global_step": 105328, "epoch": 870} {"train_loss": -34.934234619140625, "global_step": 105329, "epoch": 870} {"train_loss": -37.84186553955078, "global_step": 105330, "epoch": 870} {"train_loss": -35.79384994506836, "global_step": 105331, "epoch": 870} {"train_loss": -38.06817626953125, "global_step": 105332, "epoch": 870} {"train_loss": -37.15189743041992, "global_step": 105333, "epoch": 870} {"train_loss": -38.20601272583008, "global_step": 105334, "epoch": 870} {"train_loss": -37.54119873046875, "global_step": 105335, "epoch": 870} {"train_loss": -36.89790725708008, "global_step": 105336, "epoch": 870} {"train_loss": -38.35567855834961, "global_step": 105337, "epoch": 870} {"train_loss": -38.374755859375, "global_step": 105338, "epoch": 870} {"train_loss": -37.12733840942383, "global_step": 105339, "epoch": 870} {"train_loss": -37.4736442565918, "global_step": 105340, "epoch": 870} {"train_loss": -38.490821838378906, "global_step": 105341, "epoch": 870} {"train_loss": -38.06574630737305, "global_step": 105342, "epoch": 870} {"train_loss": -37.59479904174805, "global_step": 105343, "epoch": 870} {"train_loss": -38.25589370727539, "global_step": 105344, "epoch": 870} {"train_loss": -36.8388671875, "global_step": 105345, "epoch": 870} {"train_loss": -38.62287902832031, "global_step": 105346, "epoch": 870} {"train_loss": -38.5595817565918, "global_step": 105347, "epoch": 870} {"train_loss": -38.6954231262207, "global_step": 105348, "epoch": 870} {"train_loss": -39.22937774658203, "global_step": 105349, "epoch": 870} {"train_loss": -39.30092239379883, "global_step": 105350, "epoch": 870} {"train_loss": -38.85956573486328, "global_step": 105351, "epoch": 870} {"train_loss": -39.382259368896484, "global_step": 105352, "epoch": 870} {"train_loss": -39.435882568359375, "global_step": 105353, "epoch": 870} {"train_loss": -39.42782211303711, "global_step": 105354, "epoch": 870} {"train_loss": -39.52534866333008, "global_step": 105355, "epoch": 870} {"train_loss": -39.42993927001953, "global_step": 105356, "epoch": 870} {"train_loss": -39.40517807006836, "global_step": 105357, "epoch": 870} {"train_loss": -39.58663558959961, "global_step": 105358, "epoch": 870} {"train_loss": -39.64982223510742, "global_step": 105359, "epoch": 870} {"train_loss": -39.56855392456055, "global_step": 105360, "epoch": 870} {"train_loss": -39.47447967529297, "global_step": 105361, "epoch": 870} {"train_loss": -39.289817810058594, "global_step": 105362, "epoch": 870} {"train_loss": -39.958106994628906, "global_step": 105363, "epoch": 870} {"train_loss": -39.81927490234375, "global_step": 105364, "epoch": 870} {"train_loss": -39.62351989746094, "global_step": 105365, "epoch": 870} {"train_loss": -40.08619689941406, "global_step": 105366, "epoch": 870} {"train_loss": -39.844356536865234, "global_step": 105367, "epoch": 870} {"train_loss": -39.95695877075195, "global_step": 105368, "epoch": 870} {"train_loss": -39.95068359375, "global_step": 105369, "epoch": 870} {"train_loss": -39.519290924072266, "global_step": 105370, "epoch": 870} {"train_loss": -38.864173889160156, "global_step": 105371, "epoch": 870} {"train_loss": -38.99633026123047, "global_step": 105372, "epoch": 870} {"train_loss": -39.1317024230957, "global_step": 105373, "epoch": 870} {"train_loss": -37.551265716552734, "global_step": 105374, "epoch": 870} {"train_loss": -33.5811882019043, "global_step": 105375, "epoch": 870} {"train_loss": -26.088895797729492, "global_step": 105376, "epoch": 870} {"train_loss": -25.233688354492188, "global_step": 105377, "epoch": 870} {"train_loss": -34.35504150390625, "global_step": 105378, "epoch": 870} {"train_loss": -38.86043930053711, "global_step": 105379, "epoch": 870} {"train_loss": -35.840049743652344, "global_step": 105380, "epoch": 870} {"train_loss": -36.041107177734375, "global_step": 105381, "epoch": 870} {"train_loss": -38.38759994506836, "global_step": 105382, "epoch": 870} {"train_loss": -37.355995178222656, "global_step": 105383, "epoch": 870} {"train_loss": -36.998409271240234, "global_step": 105384, "epoch": 870} {"train_loss": -38.309715270996094, "global_step": 105385, "epoch": 870} {"train_loss": -38.159706115722656, "global_step": 105386, "epoch": 870} {"train_loss": -37.99280548095703, "global_step": 105387, "epoch": 870} {"train_loss": -38.323516845703125, "global_step": 105388, "epoch": 870} {"train_loss": -38.18030548095703, "global_step": 105389, "epoch": 870} {"train_loss": -38.35284188956268, "global_step": 105390, "epoch": 870, "val_loss": 2607683.75} {"train_loss": -38.879974365234375, "global_step": 105391, "epoch": 871} {"train_loss": -38.714107513427734, "global_step": 105392, "epoch": 871} {"train_loss": -39.04966354370117, "global_step": 105393, "epoch": 871} {"train_loss": -38.916587829589844, "global_step": 105394, "epoch": 871} {"train_loss": -38.849422454833984, "global_step": 105395, "epoch": 871} {"train_loss": -38.72978591918945, "global_step": 105396, "epoch": 871} {"train_loss": -39.092647552490234, "global_step": 105397, "epoch": 871} {"train_loss": -39.2225341796875, "global_step": 105398, "epoch": 871} {"train_loss": -39.188270568847656, "global_step": 105399, "epoch": 871} {"train_loss": -39.28316879272461, "global_step": 105400, "epoch": 871} {"train_loss": -39.39272689819336, "global_step": 105401, "epoch": 871} {"train_loss": -39.65302276611328, "global_step": 105402, "epoch": 871} {"train_loss": -39.65833282470703, "global_step": 105403, "epoch": 871} {"train_loss": -39.33138656616211, "global_step": 105404, "epoch": 871} {"train_loss": -38.95294189453125, "global_step": 105405, "epoch": 871} {"train_loss": -39.70530700683594, "global_step": 105406, "epoch": 871} {"train_loss": -39.32003402709961, "global_step": 105407, "epoch": 871} {"train_loss": -39.4354133605957, "global_step": 105408, "epoch": 871} {"train_loss": -39.72408676147461, "global_step": 105409, "epoch": 871} {"train_loss": -39.68703079223633, "global_step": 105410, "epoch": 871} {"train_loss": -39.38127517700195, "global_step": 105411, "epoch": 871} {"train_loss": -39.85854721069336, "global_step": 105412, "epoch": 871} {"train_loss": -38.8021354675293, "global_step": 105413, "epoch": 871} {"train_loss": -39.053794860839844, "global_step": 105414, "epoch": 871} {"train_loss": -39.5612678527832, "global_step": 105415, "epoch": 871} {"train_loss": -39.4405632019043, "global_step": 105416, "epoch": 871} {"train_loss": -39.44034957885742, "global_step": 105417, "epoch": 871} {"train_loss": -39.3539924621582, "global_step": 105418, "epoch": 871} {"train_loss": -39.837459564208984, "global_step": 105419, "epoch": 871} {"train_loss": -39.2884635925293, "global_step": 105420, "epoch": 871} {"train_loss": -38.64324951171875, "global_step": 105421, "epoch": 871} {"train_loss": -38.062950134277344, "global_step": 105422, "epoch": 871} {"train_loss": -38.848995208740234, "global_step": 105423, "epoch": 871} {"train_loss": -39.763362884521484, "global_step": 105424, "epoch": 871} {"train_loss": -39.443599700927734, "global_step": 105425, "epoch": 871} {"train_loss": -39.52499008178711, "global_step": 105426, "epoch": 871} {"train_loss": -39.07454299926758, "global_step": 105427, "epoch": 871} {"train_loss": -39.1709098815918, "global_step": 105428, "epoch": 871} {"train_loss": -40.02490997314453, "global_step": 105429, "epoch": 871} {"train_loss": -39.88920974731445, "global_step": 105430, "epoch": 871} {"train_loss": -39.35383224487305, "global_step": 105431, "epoch": 871} {"train_loss": -39.5074348449707, "global_step": 105432, "epoch": 871} {"train_loss": -38.96360397338867, "global_step": 105433, "epoch": 871} {"train_loss": -38.22828674316406, "global_step": 105434, "epoch": 871} {"train_loss": -37.67080307006836, "global_step": 105435, "epoch": 871} {"train_loss": -38.67151641845703, "global_step": 105436, "epoch": 871} {"train_loss": -39.3362922668457, "global_step": 105437, "epoch": 871} {"train_loss": -39.532012939453125, "global_step": 105438, "epoch": 871} {"train_loss": -37.789161682128906, "global_step": 105439, "epoch": 871} {"train_loss": -29.099496841430664, "global_step": 105440, "epoch": 871} {"train_loss": -20.46900749206543, "global_step": 105441, "epoch": 871} {"train_loss": -29.2420654296875, "global_step": 105442, "epoch": 871} {"train_loss": -36.1337776184082, "global_step": 105443, "epoch": 871} {"train_loss": -34.151424407958984, "global_step": 105444, "epoch": 871} {"train_loss": -34.3532829284668, "global_step": 105445, "epoch": 871} {"train_loss": -36.30157470703125, "global_step": 105446, "epoch": 871} {"train_loss": -34.81241989135742, "global_step": 105447, "epoch": 871} {"train_loss": -35.095455169677734, "global_step": 105448, "epoch": 871} {"train_loss": -37.46168518066406, "global_step": 105449, "epoch": 871} {"train_loss": -34.83191680908203, "global_step": 105450, "epoch": 871} {"train_loss": -36.83823776245117, "global_step": 105451, "epoch": 871} {"train_loss": -34.98751449584961, "global_step": 105452, "epoch": 871} {"train_loss": -37.66471862792969, "global_step": 105453, "epoch": 871} {"train_loss": -36.13849639892578, "global_step": 105454, "epoch": 871} {"train_loss": -37.08358383178711, "global_step": 105455, "epoch": 871} {"train_loss": -37.1640510559082, "global_step": 105456, "epoch": 871} {"train_loss": -36.92412567138672, "global_step": 105457, "epoch": 871} {"train_loss": -37.84736633300781, "global_step": 105458, "epoch": 871} {"train_loss": -37.56842803955078, "global_step": 105459, "epoch": 871} {"train_loss": -38.32947540283203, "global_step": 105460, "epoch": 871} {"train_loss": -36.97906494140625, "global_step": 105461, "epoch": 871} {"train_loss": -37.99868392944336, "global_step": 105462, "epoch": 871} {"train_loss": -38.30173110961914, "global_step": 105463, "epoch": 871} {"train_loss": -37.810848236083984, "global_step": 105464, "epoch": 871} {"train_loss": -38.60749816894531, "global_step": 105465, "epoch": 871} {"train_loss": -38.262054443359375, "global_step": 105466, "epoch": 871} {"train_loss": -38.651180267333984, "global_step": 105467, "epoch": 871} {"train_loss": -38.830501556396484, "global_step": 105468, "epoch": 871} {"train_loss": -38.42578125, "global_step": 105469, "epoch": 871} {"train_loss": -38.401084899902344, "global_step": 105470, "epoch": 871} {"train_loss": -37.73617172241211, "global_step": 105471, "epoch": 871} {"train_loss": -39.0562744140625, "global_step": 105472, "epoch": 871} {"train_loss": -38.9879035949707, "global_step": 105473, "epoch": 871} {"train_loss": -38.631187438964844, "global_step": 105474, "epoch": 871} {"train_loss": -38.84392166137695, "global_step": 105475, "epoch": 871} {"train_loss": -38.09461212158203, "global_step": 105476, "epoch": 871} {"train_loss": -38.754676818847656, "global_step": 105477, "epoch": 871} {"train_loss": -39.23865509033203, "global_step": 105478, "epoch": 871} {"train_loss": -38.87916946411133, "global_step": 105479, "epoch": 871} {"train_loss": -39.130863189697266, "global_step": 105480, "epoch": 871} {"train_loss": -38.30038070678711, "global_step": 105481, "epoch": 871} {"train_loss": -38.958980560302734, "global_step": 105482, "epoch": 871} {"train_loss": -38.7115478515625, "global_step": 105483, "epoch": 871} {"train_loss": -38.9940071105957, "global_step": 105484, "epoch": 871} {"train_loss": -38.4554557800293, "global_step": 105485, "epoch": 871} {"train_loss": -39.159820556640625, "global_step": 105486, "epoch": 871} {"train_loss": -38.728328704833984, "global_step": 105487, "epoch": 871} {"train_loss": -37.21692657470703, "global_step": 105488, "epoch": 871} {"train_loss": -34.15473556518555, "global_step": 105489, "epoch": 871} {"train_loss": -33.51050567626953, "global_step": 105490, "epoch": 871} {"train_loss": -36.32075119018555, "global_step": 105491, "epoch": 871} {"train_loss": -39.52128982543945, "global_step": 105492, "epoch": 871} {"train_loss": -35.41864776611328, "global_step": 105493, "epoch": 871} {"train_loss": -32.98710250854492, "global_step": 105494, "epoch": 871} {"train_loss": -37.67237854003906, "global_step": 105495, "epoch": 871} {"train_loss": -37.944496154785156, "global_step": 105496, "epoch": 871} {"train_loss": -37.41811752319336, "global_step": 105497, "epoch": 871} {"train_loss": -38.845741271972656, "global_step": 105498, "epoch": 871} {"train_loss": -36.262481689453125, "global_step": 105499, "epoch": 871} {"train_loss": -38.15930938720703, "global_step": 105500, "epoch": 871} {"train_loss": -37.97479248046875, "global_step": 105501, "epoch": 871} {"train_loss": -37.73856735229492, "global_step": 105502, "epoch": 871} {"train_loss": -38.14780807495117, "global_step": 105503, "epoch": 871} {"train_loss": -38.10517120361328, "global_step": 105504, "epoch": 871} {"train_loss": -38.2668342590332, "global_step": 105505, "epoch": 871} {"train_loss": -38.58671188354492, "global_step": 105506, "epoch": 871} {"train_loss": -38.956722259521484, "global_step": 105507, "epoch": 871} {"train_loss": -38.127838134765625, "global_step": 105508, "epoch": 871} {"train_loss": -39.468135833740234, "global_step": 105509, "epoch": 871} {"train_loss": -38.7122688293457, "global_step": 105510, "epoch": 871} {"train_loss": -37.95204843568408, "global_step": 105511, "epoch": 871, "val_loss": 2676683.75} {"train_loss": -39.194068908691406, "global_step": 105512, "epoch": 872} {"train_loss": -38.993717193603516, "global_step": 105513, "epoch": 872} {"train_loss": -39.4222297668457, "global_step": 105514, "epoch": 872} {"train_loss": -39.17947769165039, "global_step": 105515, "epoch": 872} {"train_loss": -39.0238037109375, "global_step": 105516, "epoch": 872} {"train_loss": -39.164424896240234, "global_step": 105517, "epoch": 872} {"train_loss": -39.46607208251953, "global_step": 105518, "epoch": 872} {"train_loss": -39.278194427490234, "global_step": 105519, "epoch": 872} {"train_loss": -39.198631286621094, "global_step": 105520, "epoch": 872} {"train_loss": -39.24595642089844, "global_step": 105521, "epoch": 872} {"train_loss": -38.924049377441406, "global_step": 105522, "epoch": 872} {"train_loss": -39.51446533203125, "global_step": 105523, "epoch": 872} {"train_loss": -39.69074630737305, "global_step": 105524, "epoch": 872} {"train_loss": -39.65222930908203, "global_step": 105525, "epoch": 872} {"train_loss": -39.63309860229492, "global_step": 105526, "epoch": 872} {"train_loss": -39.439002990722656, "global_step": 105527, "epoch": 872} {"train_loss": -39.64312744140625, "global_step": 105528, "epoch": 872} {"train_loss": -39.49192810058594, "global_step": 105529, "epoch": 872} {"train_loss": -39.59035110473633, "global_step": 105530, "epoch": 872} {"train_loss": -39.96444320678711, "global_step": 105531, "epoch": 872} {"train_loss": -39.9803466796875, "global_step": 105532, "epoch": 872} {"train_loss": -39.38917541503906, "global_step": 105533, "epoch": 872} {"train_loss": -39.825401306152344, "global_step": 105534, "epoch": 872} {"train_loss": -39.66892623901367, "global_step": 105535, "epoch": 872} {"train_loss": -40.12259292602539, "global_step": 105536, "epoch": 872} {"train_loss": -40.0279541015625, "global_step": 105537, "epoch": 872} {"train_loss": -39.91921615600586, "global_step": 105538, "epoch": 872} {"train_loss": -40.20231246948242, "global_step": 105539, "epoch": 872} {"train_loss": -39.32316207885742, "global_step": 105540, "epoch": 872} {"train_loss": -39.9016227722168, "global_step": 105541, "epoch": 872} {"train_loss": -39.783233642578125, "global_step": 105542, "epoch": 872} {"train_loss": -39.49154281616211, "global_step": 105543, "epoch": 872} {"train_loss": -39.67087173461914, "global_step": 105544, "epoch": 872} {"train_loss": -39.11533737182617, "global_step": 105545, "epoch": 872} {"train_loss": -37.84288024902344, "global_step": 105546, "epoch": 872} {"train_loss": -36.74063491821289, "global_step": 105547, "epoch": 872} {"train_loss": -39.40568161010742, "global_step": 105548, "epoch": 872} {"train_loss": -38.69332504272461, "global_step": 105549, "epoch": 872} {"train_loss": -38.213783264160156, "global_step": 105550, "epoch": 872} {"train_loss": -39.35272979736328, "global_step": 105551, "epoch": 872} {"train_loss": -38.86725997924805, "global_step": 105552, "epoch": 872} {"train_loss": -39.25021743774414, "global_step": 105553, "epoch": 872} {"train_loss": -38.45058059692383, "global_step": 105554, "epoch": 872} {"train_loss": -39.41361618041992, "global_step": 105555, "epoch": 872} {"train_loss": -39.53721618652344, "global_step": 105556, "epoch": 872} {"train_loss": -39.164161682128906, "global_step": 105557, "epoch": 872} {"train_loss": -39.35224914550781, "global_step": 105558, "epoch": 872} {"train_loss": -39.53752517700195, "global_step": 105559, "epoch": 872} {"train_loss": -39.025299072265625, "global_step": 105560, "epoch": 872} {"train_loss": -38.80385208129883, "global_step": 105561, "epoch": 872} {"train_loss": -39.00849533081055, "global_step": 105562, "epoch": 872} {"train_loss": -39.3632926940918, "global_step": 105563, "epoch": 872} {"train_loss": -39.58881759643555, "global_step": 105564, "epoch": 872} {"train_loss": -38.62091064453125, "global_step": 105565, "epoch": 872} {"train_loss": -37.92690658569336, "global_step": 105566, "epoch": 872} {"train_loss": -39.10917282104492, "global_step": 105567, "epoch": 872} {"train_loss": -38.274810791015625, "global_step": 105568, "epoch": 872} {"train_loss": -36.945350646972656, "global_step": 105569, "epoch": 872} {"train_loss": -36.6362190246582, "global_step": 105570, "epoch": 872} {"train_loss": -36.09597396850586, "global_step": 105571, "epoch": 872} {"train_loss": -38.58445358276367, "global_step": 105572, "epoch": 872} {"train_loss": -38.86075973510742, "global_step": 105573, "epoch": 872} {"train_loss": -39.239864349365234, "global_step": 105574, "epoch": 872} {"train_loss": -35.790016174316406, "global_step": 105575, "epoch": 872} {"train_loss": -39.23768997192383, "global_step": 105576, "epoch": 872} {"train_loss": -38.38899612426758, "global_step": 105577, "epoch": 872} {"train_loss": -38.24626541137695, "global_step": 105578, "epoch": 872} {"train_loss": -38.3988151550293, "global_step": 105579, "epoch": 872} {"train_loss": -38.79279327392578, "global_step": 105580, "epoch": 872} {"train_loss": -39.26984786987305, "global_step": 105581, "epoch": 872} {"train_loss": -38.87002944946289, "global_step": 105582, "epoch": 872} {"train_loss": -38.351383209228516, "global_step": 105583, "epoch": 872} {"train_loss": -37.202972412109375, "global_step": 105584, "epoch": 872} {"train_loss": -38.66090774536133, "global_step": 105585, "epoch": 872} {"train_loss": -38.25504684448242, "global_step": 105586, "epoch": 872} {"train_loss": -36.795562744140625, "global_step": 105587, "epoch": 872} {"train_loss": -37.1093864440918, "global_step": 105588, "epoch": 872} {"train_loss": -38.39984893798828, "global_step": 105589, "epoch": 872} {"train_loss": -35.13558578491211, "global_step": 105590, "epoch": 872} {"train_loss": -31.212604522705078, "global_step": 105591, "epoch": 872} {"train_loss": -35.019344329833984, "global_step": 105592, "epoch": 872} {"train_loss": -34.247032165527344, "global_step": 105593, "epoch": 872} {"train_loss": -37.275211334228516, "global_step": 105594, "epoch": 872} {"train_loss": -36.967891693115234, "global_step": 105595, "epoch": 872} {"train_loss": -33.765541076660156, "global_step": 105596, "epoch": 872} {"train_loss": -31.5611572265625, "global_step": 105597, "epoch": 872} {"train_loss": -32.12858200073242, "global_step": 105598, "epoch": 872} {"train_loss": -37.81270980834961, "global_step": 105599, "epoch": 872} {"train_loss": -35.94678497314453, "global_step": 105600, "epoch": 872} {"train_loss": -37.13460159301758, "global_step": 105601, "epoch": 872} {"train_loss": -36.67813491821289, "global_step": 105602, "epoch": 872} {"train_loss": -36.29926300048828, "global_step": 105603, "epoch": 872} {"train_loss": -37.76874923706055, "global_step": 105604, "epoch": 872} {"train_loss": -35.33070755004883, "global_step": 105605, "epoch": 872} {"train_loss": -34.756385803222656, "global_step": 105606, "epoch": 872} {"train_loss": -36.15354537963867, "global_step": 105607, "epoch": 872} {"train_loss": -34.725887298583984, "global_step": 105608, "epoch": 872} {"train_loss": -37.18988037109375, "global_step": 105609, "epoch": 872} {"train_loss": -35.83980178833008, "global_step": 105610, "epoch": 872} {"train_loss": -32.731712341308594, "global_step": 105611, "epoch": 872} {"train_loss": -36.635250091552734, "global_step": 105612, "epoch": 872} {"train_loss": -36.07758331298828, "global_step": 105613, "epoch": 872} {"train_loss": -36.96407699584961, "global_step": 105614, "epoch": 872} {"train_loss": -36.00967025756836, "global_step": 105615, "epoch": 872} {"train_loss": -37.35515594482422, "global_step": 105616, "epoch": 872} {"train_loss": -37.3442497253418, "global_step": 105617, "epoch": 872} {"train_loss": -36.473995208740234, "global_step": 105618, "epoch": 872} {"train_loss": -37.019447326660156, "global_step": 105619, "epoch": 872} {"train_loss": -36.91407775878906, "global_step": 105620, "epoch": 872} {"train_loss": -36.44168472290039, "global_step": 105621, "epoch": 872} {"train_loss": -36.67474365234375, "global_step": 105622, "epoch": 872} {"train_loss": -37.69727325439453, "global_step": 105623, "epoch": 872} {"train_loss": -37.951133728027344, "global_step": 105624, "epoch": 872} {"train_loss": -37.86552810668945, "global_step": 105625, "epoch": 872} {"train_loss": -36.055809020996094, "global_step": 105626, "epoch": 872} {"train_loss": -38.12283706665039, "global_step": 105627, "epoch": 872} {"train_loss": -38.0638542175293, "global_step": 105628, "epoch": 872} {"train_loss": -37.8695182800293, "global_step": 105629, "epoch": 872} {"train_loss": -38.84929275512695, "global_step": 105630, "epoch": 872} {"train_loss": -37.76974105834961, "global_step": 105631, "epoch": 872} {"train_loss": -37.961713838183194, "global_step": 105632, "epoch": 872, "val_loss": 2622900.0} {"train_loss": -38.29875946044922, "global_step": 105633, "epoch": 873} {"train_loss": -38.09371566772461, "global_step": 105634, "epoch": 873} {"train_loss": -38.253849029541016, "global_step": 105635, "epoch": 873} {"train_loss": -38.35972213745117, "global_step": 105636, "epoch": 873} {"train_loss": -38.3634147644043, "global_step": 105637, "epoch": 873} {"train_loss": -38.45062255859375, "global_step": 105638, "epoch": 873} {"train_loss": -38.43250274658203, "global_step": 105639, "epoch": 873} {"train_loss": -37.906105041503906, "global_step": 105640, "epoch": 873} {"train_loss": -38.371700286865234, "global_step": 105641, "epoch": 873} {"train_loss": -37.03306198120117, "global_step": 105642, "epoch": 873} {"train_loss": -38.957122802734375, "global_step": 105643, "epoch": 873} {"train_loss": -36.79653549194336, "global_step": 105644, "epoch": 873} {"train_loss": -38.67570114135742, "global_step": 105645, "epoch": 873} {"train_loss": -38.75788497924805, "global_step": 105646, "epoch": 873} {"train_loss": -39.07607650756836, "global_step": 105647, "epoch": 873} {"train_loss": -38.6014518737793, "global_step": 105648, "epoch": 873} {"train_loss": -38.803096771240234, "global_step": 105649, "epoch": 873} {"train_loss": -38.671852111816406, "global_step": 105650, "epoch": 873} {"train_loss": -38.78845977783203, "global_step": 105651, "epoch": 873} {"train_loss": -37.897972106933594, "global_step": 105652, "epoch": 873} {"train_loss": -38.75405502319336, "global_step": 105653, "epoch": 873} {"train_loss": -38.73873519897461, "global_step": 105654, "epoch": 873} {"train_loss": -38.59040069580078, "global_step": 105655, "epoch": 873} {"train_loss": -39.0914306640625, "global_step": 105656, "epoch": 873} {"train_loss": -39.15203857421875, "global_step": 105657, "epoch": 873} {"train_loss": -39.196739196777344, "global_step": 105658, "epoch": 873} {"train_loss": -38.43703842163086, "global_step": 105659, "epoch": 873} {"train_loss": -38.76839828491211, "global_step": 105660, "epoch": 873} {"train_loss": -38.95935821533203, "global_step": 105661, "epoch": 873} {"train_loss": -39.34611511230469, "global_step": 105662, "epoch": 873} {"train_loss": -39.35023880004883, "global_step": 105663, "epoch": 873} {"train_loss": -39.01436996459961, "global_step": 105664, "epoch": 873} {"train_loss": -39.10491180419922, "global_step": 105665, "epoch": 873} {"train_loss": -39.33330154418945, "global_step": 105666, "epoch": 873} {"train_loss": -38.91660690307617, "global_step": 105667, "epoch": 873} {"train_loss": -38.89039611816406, "global_step": 105668, "epoch": 873} {"train_loss": -38.61770248413086, "global_step": 105669, "epoch": 873} {"train_loss": -38.51630401611328, "global_step": 105670, "epoch": 873} {"train_loss": -39.11627960205078, "global_step": 105671, "epoch": 873} {"train_loss": -39.03164291381836, "global_step": 105672, "epoch": 873} {"train_loss": -39.4057502746582, "global_step": 105673, "epoch": 873} {"train_loss": -39.342098236083984, "global_step": 105674, "epoch": 873} {"train_loss": -39.59701156616211, "global_step": 105675, "epoch": 873} {"train_loss": -39.21024703979492, "global_step": 105676, "epoch": 873} {"train_loss": -39.48196029663086, "global_step": 105677, "epoch": 873} {"train_loss": -39.51220703125, "global_step": 105678, "epoch": 873} {"train_loss": -39.43787384033203, "global_step": 105679, "epoch": 873} {"train_loss": -39.65806198120117, "global_step": 105680, "epoch": 873} {"train_loss": -39.689613342285156, "global_step": 105681, "epoch": 873} {"train_loss": -38.7526741027832, "global_step": 105682, "epoch": 873} {"train_loss": -39.53704071044922, "global_step": 105683, "epoch": 873} {"train_loss": -39.602134704589844, "global_step": 105684, "epoch": 873} {"train_loss": -39.40354537963867, "global_step": 105685, "epoch": 873} {"train_loss": -39.355892181396484, "global_step": 105686, "epoch": 873} {"train_loss": -39.07709503173828, "global_step": 105687, "epoch": 873} {"train_loss": -38.925506591796875, "global_step": 105688, "epoch": 873} {"train_loss": -38.55499267578125, "global_step": 105689, "epoch": 873} {"train_loss": -39.162559509277344, "global_step": 105690, "epoch": 873} {"train_loss": -39.56543731689453, "global_step": 105691, "epoch": 873} {"train_loss": -34.52690505981445, "global_step": 105692, "epoch": 873} {"train_loss": -39.28540802001953, "global_step": 105693, "epoch": 873} {"train_loss": -39.6684684753418, "global_step": 105694, "epoch": 873} {"train_loss": -39.14784622192383, "global_step": 105695, "epoch": 873} {"train_loss": -39.24208450317383, "global_step": 105696, "epoch": 873} {"train_loss": -39.31529235839844, "global_step": 105697, "epoch": 873} {"train_loss": -38.80341720581055, "global_step": 105698, "epoch": 873} {"train_loss": -37.263221740722656, "global_step": 105699, "epoch": 873} {"train_loss": -35.52133560180664, "global_step": 105700, "epoch": 873} {"train_loss": -35.149566650390625, "global_step": 105701, "epoch": 873} {"train_loss": -34.4305419921875, "global_step": 105702, "epoch": 873} {"train_loss": -31.675434112548828, "global_step": 105703, "epoch": 873} {"train_loss": -33.73809814453125, "global_step": 105704, "epoch": 873} {"train_loss": -36.66889572143555, "global_step": 105705, "epoch": 873} {"train_loss": -37.47798538208008, "global_step": 105706, "epoch": 873} {"train_loss": -37.73871994018555, "global_step": 105707, "epoch": 873} {"train_loss": -37.78741455078125, "global_step": 105708, "epoch": 873} {"train_loss": -37.62519073486328, "global_step": 105709, "epoch": 873} {"train_loss": -33.4156494140625, "global_step": 105710, "epoch": 873} {"train_loss": -38.48149490356445, "global_step": 105711, "epoch": 873} {"train_loss": -36.72127914428711, "global_step": 105712, "epoch": 873} {"train_loss": -38.239501953125, "global_step": 105713, "epoch": 873} {"train_loss": -37.89002227783203, "global_step": 105714, "epoch": 873} {"train_loss": -38.167816162109375, "global_step": 105715, "epoch": 873} {"train_loss": -38.01166534423828, "global_step": 105716, "epoch": 873} {"train_loss": -38.190670013427734, "global_step": 105717, "epoch": 873} {"train_loss": -36.49514389038086, "global_step": 105718, "epoch": 873} {"train_loss": -39.00400924682617, "global_step": 105719, "epoch": 873} {"train_loss": -37.966339111328125, "global_step": 105720, "epoch": 873} {"train_loss": -35.99349594116211, "global_step": 105721, "epoch": 873} {"train_loss": -37.7619743347168, "global_step": 105722, "epoch": 873} {"train_loss": -39.05474090576172, "global_step": 105723, "epoch": 873} {"train_loss": -38.836036682128906, "global_step": 105724, "epoch": 873} {"train_loss": -38.087623596191406, "global_step": 105725, "epoch": 873} {"train_loss": -37.55045700073242, "global_step": 105726, "epoch": 873} {"train_loss": -38.65345001220703, "global_step": 105727, "epoch": 873} {"train_loss": -38.55305480957031, "global_step": 105728, "epoch": 873} {"train_loss": -37.63520812988281, "global_step": 105729, "epoch": 873} {"train_loss": -38.617958068847656, "global_step": 105730, "epoch": 873} {"train_loss": -38.70905685424805, "global_step": 105731, "epoch": 873} {"train_loss": -38.85084915161133, "global_step": 105732, "epoch": 873} {"train_loss": -39.446632385253906, "global_step": 105733, "epoch": 873} {"train_loss": -38.84696578979492, "global_step": 105734, "epoch": 873} {"train_loss": -37.441078186035156, "global_step": 105735, "epoch": 873} {"train_loss": -36.48973846435547, "global_step": 105736, "epoch": 873} {"train_loss": -38.3474235534668, "global_step": 105737, "epoch": 873} {"train_loss": -36.349822998046875, "global_step": 105738, "epoch": 873} {"train_loss": -37.12813949584961, "global_step": 105739, "epoch": 873} {"train_loss": -36.81304931640625, "global_step": 105740, "epoch": 873} {"train_loss": -36.33392333984375, "global_step": 105741, "epoch": 873} {"train_loss": -30.266138076782227, "global_step": 105742, "epoch": 873} {"train_loss": -38.17474365234375, "global_step": 105743, "epoch": 873} {"train_loss": -37.3438606262207, "global_step": 105744, "epoch": 873} {"train_loss": -37.12590026855469, "global_step": 105745, "epoch": 873} {"train_loss": -37.852447509765625, "global_step": 105746, "epoch": 873} {"train_loss": -33.9218864440918, "global_step": 105747, "epoch": 873} {"train_loss": -36.14376449584961, "global_step": 105748, "epoch": 873} {"train_loss": -35.71113204956055, "global_step": 105749, "epoch": 873} {"train_loss": -35.5389518737793, "global_step": 105750, "epoch": 873} {"train_loss": -35.448673248291016, "global_step": 105751, "epoch": 873} {"train_loss": -36.17318344116211, "global_step": 105752, "epoch": 873} {"train_loss": -37.981242455726814, "global_step": 105753, "epoch": 873, "val_loss": 2547300.0} {"train_loss": -35.46633529663086, "global_step": 105754, "epoch": 874} {"train_loss": -37.68386459350586, "global_step": 105755, "epoch": 874} {"train_loss": -35.804073333740234, "global_step": 105756, "epoch": 874} {"train_loss": -35.5272216796875, "global_step": 105757, "epoch": 874} {"train_loss": -28.015607833862305, "global_step": 105758, "epoch": 874} {"train_loss": -36.98628234863281, "global_step": 105759, "epoch": 874} {"train_loss": -35.5109977722168, "global_step": 105760, "epoch": 874} {"train_loss": -35.88671875, "global_step": 105761, "epoch": 874} {"train_loss": -35.59235382080078, "global_step": 105762, "epoch": 874} {"train_loss": -37.24538803100586, "global_step": 105763, "epoch": 874} {"train_loss": -36.04454040527344, "global_step": 105764, "epoch": 874} {"train_loss": -35.79537582397461, "global_step": 105765, "epoch": 874} {"train_loss": -36.37259292602539, "global_step": 105766, "epoch": 874} {"train_loss": -35.998390197753906, "global_step": 105767, "epoch": 874} {"train_loss": -34.810848236083984, "global_step": 105768, "epoch": 874} {"train_loss": -36.18537139892578, "global_step": 105769, "epoch": 874} {"train_loss": -37.51826477050781, "global_step": 105770, "epoch": 874} {"train_loss": -33.58262252807617, "global_step": 105771, "epoch": 874} {"train_loss": -37.992984771728516, "global_step": 105772, "epoch": 874} {"train_loss": -37.522796630859375, "global_step": 105773, "epoch": 874} {"train_loss": -36.863319396972656, "global_step": 105774, "epoch": 874} {"train_loss": -37.244598388671875, "global_step": 105775, "epoch": 874} {"train_loss": -37.45466232299805, "global_step": 105776, "epoch": 874} {"train_loss": -36.275733947753906, "global_step": 105777, "epoch": 874} {"train_loss": -37.51078414916992, "global_step": 105778, "epoch": 874} {"train_loss": -37.817684173583984, "global_step": 105779, "epoch": 874} {"train_loss": -36.964046478271484, "global_step": 105780, "epoch": 874} {"train_loss": -37.859840393066406, "global_step": 105781, "epoch": 874} {"train_loss": -37.95140838623047, "global_step": 105782, "epoch": 874} {"train_loss": -37.22002029418945, "global_step": 105783, "epoch": 874} {"train_loss": -37.615333557128906, "global_step": 105784, "epoch": 874} {"train_loss": -38.39750289916992, "global_step": 105785, "epoch": 874} {"train_loss": -38.033302307128906, "global_step": 105786, "epoch": 874} {"train_loss": -37.90171432495117, "global_step": 105787, "epoch": 874} {"train_loss": -37.0543212890625, "global_step": 105788, "epoch": 874} {"train_loss": -37.57658767700195, "global_step": 105789, "epoch": 874} {"train_loss": -37.26015853881836, "global_step": 105790, "epoch": 874} {"train_loss": -38.21151351928711, "global_step": 105791, "epoch": 874} {"train_loss": -37.49855041503906, "global_step": 105792, "epoch": 874} {"train_loss": -38.45235824584961, "global_step": 105793, "epoch": 874} {"train_loss": -38.1386833190918, "global_step": 105794, "epoch": 874} {"train_loss": -37.05477523803711, "global_step": 105795, "epoch": 874} {"train_loss": -38.47001266479492, "global_step": 105796, "epoch": 874} {"train_loss": -37.365753173828125, "global_step": 105797, "epoch": 874} {"train_loss": -38.48041915893555, "global_step": 105798, "epoch": 874} {"train_loss": -37.987403869628906, "global_step": 105799, "epoch": 874} {"train_loss": -38.48462677001953, "global_step": 105800, "epoch": 874} {"train_loss": -38.536861419677734, "global_step": 105801, "epoch": 874} {"train_loss": -38.83461380004883, "global_step": 105802, "epoch": 874} {"train_loss": -38.7132453918457, "global_step": 105803, "epoch": 874} {"train_loss": -38.99494552612305, "global_step": 105804, "epoch": 874} {"train_loss": -39.17158126831055, "global_step": 105805, "epoch": 874} {"train_loss": -38.66677474975586, "global_step": 105806, "epoch": 874} {"train_loss": -38.95400619506836, "global_step": 105807, "epoch": 874} {"train_loss": -38.72486114501953, "global_step": 105808, "epoch": 874} {"train_loss": -37.083438873291016, "global_step": 105809, "epoch": 874} {"train_loss": -39.2114372253418, "global_step": 105810, "epoch": 874} {"train_loss": -39.078704833984375, "global_step": 105811, "epoch": 874} {"train_loss": -38.884281158447266, "global_step": 105812, "epoch": 874} {"train_loss": -38.98438262939453, "global_step": 105813, "epoch": 874} {"train_loss": -38.553157806396484, "global_step": 105814, "epoch": 874} {"train_loss": -39.4256477355957, "global_step": 105815, "epoch": 874} {"train_loss": -39.2085075378418, "global_step": 105816, "epoch": 874} {"train_loss": -38.718597412109375, "global_step": 105817, "epoch": 874} {"train_loss": -39.170650482177734, "global_step": 105818, "epoch": 874} {"train_loss": -39.28792190551758, "global_step": 105819, "epoch": 874} {"train_loss": -39.0966682434082, "global_step": 105820, "epoch": 874} {"train_loss": -38.7655029296875, "global_step": 105821, "epoch": 874} {"train_loss": -38.56816482543945, "global_step": 105822, "epoch": 874} {"train_loss": -38.61098098754883, "global_step": 105823, "epoch": 874} {"train_loss": -39.18827438354492, "global_step": 105824, "epoch": 874} {"train_loss": -38.722137451171875, "global_step": 105825, "epoch": 874} {"train_loss": -38.95402908325195, "global_step": 105826, "epoch": 874} {"train_loss": -39.36857223510742, "global_step": 105827, "epoch": 874} {"train_loss": -38.94825744628906, "global_step": 105828, "epoch": 874} {"train_loss": -39.145721435546875, "global_step": 105829, "epoch": 874} {"train_loss": -38.291786193847656, "global_step": 105830, "epoch": 874} {"train_loss": -39.407222747802734, "global_step": 105831, "epoch": 874} {"train_loss": -39.14774703979492, "global_step": 105832, "epoch": 874} {"train_loss": -39.37502670288086, "global_step": 105833, "epoch": 874} {"train_loss": -38.89834213256836, "global_step": 105834, "epoch": 874} {"train_loss": -38.49473190307617, "global_step": 105835, "epoch": 874} {"train_loss": -37.44668197631836, "global_step": 105836, "epoch": 874} {"train_loss": -37.06303024291992, "global_step": 105837, "epoch": 874} {"train_loss": -38.29573440551758, "global_step": 105838, "epoch": 874} {"train_loss": -37.40742111206055, "global_step": 105839, "epoch": 874} {"train_loss": -37.48548889160156, "global_step": 105840, "epoch": 874} {"train_loss": -39.372127532958984, "global_step": 105841, "epoch": 874} {"train_loss": -38.50790023803711, "global_step": 105842, "epoch": 874} {"train_loss": -36.458160400390625, "global_step": 105843, "epoch": 874} {"train_loss": -35.01533889770508, "global_step": 105844, "epoch": 874} {"train_loss": -38.017459869384766, "global_step": 105845, "epoch": 874} {"train_loss": -38.59260177612305, "global_step": 105846, "epoch": 874} {"train_loss": -37.2011833190918, "global_step": 105847, "epoch": 874} {"train_loss": -36.991493225097656, "global_step": 105848, "epoch": 874} {"train_loss": -38.66999435424805, "global_step": 105849, "epoch": 874} {"train_loss": -37.156005859375, "global_step": 105850, "epoch": 874} {"train_loss": -33.777828216552734, "global_step": 105851, "epoch": 874} {"train_loss": -35.064666748046875, "global_step": 105852, "epoch": 874} {"train_loss": -37.9744987487793, "global_step": 105853, "epoch": 874} {"train_loss": -35.02328109741211, "global_step": 105854, "epoch": 874} {"train_loss": -33.94222640991211, "global_step": 105855, "epoch": 874} {"train_loss": -37.921165466308594, "global_step": 105856, "epoch": 874} {"train_loss": -34.55280303955078, "global_step": 105857, "epoch": 874} {"train_loss": -33.17658996582031, "global_step": 105858, "epoch": 874} {"train_loss": -37.94904708862305, "global_step": 105859, "epoch": 874} {"train_loss": -33.38788986206055, "global_step": 105860, "epoch": 874} {"train_loss": -37.830379486083984, "global_step": 105861, "epoch": 874} {"train_loss": -36.722808837890625, "global_step": 105862, "epoch": 874} {"train_loss": -37.244056701660156, "global_step": 105863, "epoch": 874} {"train_loss": -37.63423156738281, "global_step": 105864, "epoch": 874} {"train_loss": -36.3674430847168, "global_step": 105865, "epoch": 874} {"train_loss": -38.525306701660156, "global_step": 105866, "epoch": 874} {"train_loss": -36.341583251953125, "global_step": 105867, "epoch": 874} {"train_loss": -37.8084831237793, "global_step": 105868, "epoch": 874} {"train_loss": -35.99616241455078, "global_step": 105869, "epoch": 874} {"train_loss": -36.378334045410156, "global_step": 105870, "epoch": 874} {"train_loss": -37.09189224243164, "global_step": 105871, "epoch": 874} {"train_loss": -38.32149887084961, "global_step": 105872, "epoch": 874} {"train_loss": -35.35396957397461, "global_step": 105873, "epoch": 874} {"train_loss": -37.43063977139055, "global_step": 105874, "epoch": 874, "val_loss": 2591071.75} {"train_loss": -38.01207733154297, "global_step": 105875, "epoch": 875} {"train_loss": -37.60911178588867, "global_step": 105876, "epoch": 875} {"train_loss": -37.67283630371094, "global_step": 105877, "epoch": 875} {"train_loss": -37.273414611816406, "global_step": 105878, "epoch": 875} {"train_loss": -37.8205680847168, "global_step": 105879, "epoch": 875} {"train_loss": -37.51909255981445, "global_step": 105880, "epoch": 875} {"train_loss": -37.88840866088867, "global_step": 105881, "epoch": 875} {"train_loss": -36.61195373535156, "global_step": 105882, "epoch": 875} {"train_loss": -33.954803466796875, "global_step": 105883, "epoch": 875} {"train_loss": -35.98501205444336, "global_step": 105884, "epoch": 875} {"train_loss": -38.123497009277344, "global_step": 105885, "epoch": 875} {"train_loss": -36.46993637084961, "global_step": 105886, "epoch": 875} {"train_loss": -28.59368896484375, "global_step": 105887, "epoch": 875} {"train_loss": -36.07944869995117, "global_step": 105888, "epoch": 875} {"train_loss": -29.181005477905273, "global_step": 105889, "epoch": 875} {"train_loss": -33.9842529296875, "global_step": 105890, "epoch": 875} {"train_loss": -35.45254135131836, "global_step": 105891, "epoch": 875} {"train_loss": -34.54840850830078, "global_step": 105892, "epoch": 875} {"train_loss": -33.23423385620117, "global_step": 105893, "epoch": 875} {"train_loss": -33.129451751708984, "global_step": 105894, "epoch": 875} {"train_loss": -36.080448150634766, "global_step": 105895, "epoch": 875} {"train_loss": -34.29594802856445, "global_step": 105896, "epoch": 875} {"train_loss": -34.265419006347656, "global_step": 105897, "epoch": 875} {"train_loss": -33.14707565307617, "global_step": 105898, "epoch": 875} {"train_loss": -30.718957901000977, "global_step": 105899, "epoch": 875} {"train_loss": -35.06837844848633, "global_step": 105900, "epoch": 875} {"train_loss": -32.080101013183594, "global_step": 105901, "epoch": 875} {"train_loss": -35.76838302612305, "global_step": 105902, "epoch": 875} {"train_loss": -34.951507568359375, "global_step": 105903, "epoch": 875} {"train_loss": -34.371578216552734, "global_step": 105904, "epoch": 875} {"train_loss": -36.252220153808594, "global_step": 105905, "epoch": 875} {"train_loss": -35.230648040771484, "global_step": 105906, "epoch": 875} {"train_loss": -33.03126907348633, "global_step": 105907, "epoch": 875} {"train_loss": -36.262351989746094, "global_step": 105908, "epoch": 875} {"train_loss": -34.673831939697266, "global_step": 105909, "epoch": 875} {"train_loss": -36.788021087646484, "global_step": 105910, "epoch": 875} {"train_loss": -36.581390380859375, "global_step": 105911, "epoch": 875} {"train_loss": -36.89812088012695, "global_step": 105912, "epoch": 875} {"train_loss": -34.59833908081055, "global_step": 105913, "epoch": 875} {"train_loss": -37.06293487548828, "global_step": 105914, "epoch": 875} {"train_loss": -36.66653823852539, "global_step": 105915, "epoch": 875} {"train_loss": -35.67407989501953, "global_step": 105916, "epoch": 875} {"train_loss": -36.60171127319336, "global_step": 105917, "epoch": 875} {"train_loss": -36.84706115722656, "global_step": 105918, "epoch": 875} {"train_loss": -36.95732498168945, "global_step": 105919, "epoch": 875} {"train_loss": -36.67842483520508, "global_step": 105920, "epoch": 875} {"train_loss": -36.535396575927734, "global_step": 105921, "epoch": 875} {"train_loss": -37.07988739013672, "global_step": 105922, "epoch": 875} {"train_loss": -37.36027908325195, "global_step": 105923, "epoch": 875} {"train_loss": -36.59205627441406, "global_step": 105924, "epoch": 875} {"train_loss": -35.3249397277832, "global_step": 105925, "epoch": 875} {"train_loss": -36.44831466674805, "global_step": 105926, "epoch": 875} {"train_loss": -36.93964767456055, "global_step": 105927, "epoch": 875} {"train_loss": -37.50012969970703, "global_step": 105928, "epoch": 875} {"train_loss": -37.15549850463867, "global_step": 105929, "epoch": 875} {"train_loss": -37.322174072265625, "global_step": 105930, "epoch": 875} {"train_loss": -37.465492248535156, "global_step": 105931, "epoch": 875} {"train_loss": -37.08660888671875, "global_step": 105932, "epoch": 875} {"train_loss": -37.466461181640625, "global_step": 105933, "epoch": 875} {"train_loss": -37.59169387817383, "global_step": 105934, "epoch": 875} {"train_loss": -37.28634262084961, "global_step": 105935, "epoch": 875} {"train_loss": -37.91323471069336, "global_step": 105936, "epoch": 875} {"train_loss": -38.093990325927734, "global_step": 105937, "epoch": 875} {"train_loss": -37.598121643066406, "global_step": 105938, "epoch": 875} {"train_loss": -37.932369232177734, "global_step": 105939, "epoch": 875} {"train_loss": -38.45769500732422, "global_step": 105940, "epoch": 875} {"train_loss": -37.938106536865234, "global_step": 105941, "epoch": 875} {"train_loss": -38.152565002441406, "global_step": 105942, "epoch": 875} {"train_loss": -37.896446228027344, "global_step": 105943, "epoch": 875} {"train_loss": -38.144073486328125, "global_step": 105944, "epoch": 875} {"train_loss": -38.11272430419922, "global_step": 105945, "epoch": 875} {"train_loss": -38.45212936401367, "global_step": 105946, "epoch": 875} {"train_loss": -38.04901885986328, "global_step": 105947, "epoch": 875} {"train_loss": -38.307777404785156, "global_step": 105948, "epoch": 875} {"train_loss": -37.98741912841797, "global_step": 105949, "epoch": 875} {"train_loss": -38.1591911315918, "global_step": 105950, "epoch": 875} {"train_loss": -38.391029357910156, "global_step": 105951, "epoch": 875} {"train_loss": -38.216712951660156, "global_step": 105952, "epoch": 875} {"train_loss": -38.57204818725586, "global_step": 105953, "epoch": 875} {"train_loss": -38.56394577026367, "global_step": 105954, "epoch": 875} {"train_loss": -38.358882904052734, "global_step": 105955, "epoch": 875} {"train_loss": -38.2565803527832, "global_step": 105956, "epoch": 875} {"train_loss": -38.444740295410156, "global_step": 105957, "epoch": 875} {"train_loss": -38.22871017456055, "global_step": 105958, "epoch": 875} {"train_loss": -38.4465446472168, "global_step": 105959, "epoch": 875} {"train_loss": -38.87417984008789, "global_step": 105960, "epoch": 875} {"train_loss": -38.71364974975586, "global_step": 105961, "epoch": 875} {"train_loss": -38.99049758911133, "global_step": 105962, "epoch": 875} {"train_loss": -38.851043701171875, "global_step": 105963, "epoch": 875} {"train_loss": -38.43827438354492, "global_step": 105964, "epoch": 875} {"train_loss": -38.927242279052734, "global_step": 105965, "epoch": 875} {"train_loss": -39.09038162231445, "global_step": 105966, "epoch": 875} {"train_loss": -38.46315383911133, "global_step": 105967, "epoch": 875} {"train_loss": -38.46085739135742, "global_step": 105968, "epoch": 875} {"train_loss": -38.56976318359375, "global_step": 105969, "epoch": 875} {"train_loss": -38.83950424194336, "global_step": 105970, "epoch": 875} {"train_loss": -38.864803314208984, "global_step": 105971, "epoch": 875} {"train_loss": -38.54817581176758, "global_step": 105972, "epoch": 875} {"train_loss": -38.2186164855957, "global_step": 105973, "epoch": 875} {"train_loss": -36.93157958984375, "global_step": 105974, "epoch": 875} {"train_loss": -36.10342025756836, "global_step": 105975, "epoch": 875} {"train_loss": -35.89655685424805, "global_step": 105976, "epoch": 875} {"train_loss": -38.28937530517578, "global_step": 105977, "epoch": 875} {"train_loss": -38.396461486816406, "global_step": 105978, "epoch": 875} {"train_loss": -37.35926055908203, "global_step": 105979, "epoch": 875} {"train_loss": -38.9774169921875, "global_step": 105980, "epoch": 875} {"train_loss": -38.948055267333984, "global_step": 105981, "epoch": 875} {"train_loss": -37.921539306640625, "global_step": 105982, "epoch": 875} {"train_loss": -38.7952995300293, "global_step": 105983, "epoch": 875} {"train_loss": -38.944149017333984, "global_step": 105984, "epoch": 875} {"train_loss": -38.18109893798828, "global_step": 105985, "epoch": 875} {"train_loss": -37.91748046875, "global_step": 105986, "epoch": 875} {"train_loss": -38.99131393432617, "global_step": 105987, "epoch": 875} {"train_loss": -39.12264633178711, "global_step": 105988, "epoch": 875} {"train_loss": -38.40260696411133, "global_step": 105989, "epoch": 875} {"train_loss": -38.629127502441406, "global_step": 105990, "epoch": 875} {"train_loss": -39.47509765625, "global_step": 105991, "epoch": 875} {"train_loss": -38.772178649902344, "global_step": 105992, "epoch": 875} {"train_loss": -38.05771255493164, "global_step": 105993, "epoch": 875} {"train_loss": -38.85302734375, "global_step": 105994, "epoch": 875} {"train_loss": -37.0435198634124, "global_step": 105995, "epoch": 875, "val_loss": 2609616.75} {"train_loss": -39.13472366333008, "global_step": 105996, "epoch": 876} {"train_loss": -39.26088333129883, "global_step": 105997, "epoch": 876} {"train_loss": -38.35105514526367, "global_step": 105998, "epoch": 876} {"train_loss": -39.138206481933594, "global_step": 105999, "epoch": 876} {"train_loss": -38.94399642944336, "global_step": 106000, "epoch": 876} {"train_loss": -39.011104583740234, "global_step": 106001, "epoch": 876} {"train_loss": -39.67737579345703, "global_step": 106002, "epoch": 876} {"train_loss": -38.651817321777344, "global_step": 106003, "epoch": 876} {"train_loss": -39.68632125854492, "global_step": 106004, "epoch": 876} {"train_loss": -39.15707015991211, "global_step": 106005, "epoch": 876} {"train_loss": -39.52021408081055, "global_step": 106006, "epoch": 876} {"train_loss": -39.816162109375, "global_step": 106007, "epoch": 876} {"train_loss": -39.694305419921875, "global_step": 106008, "epoch": 876} {"train_loss": -39.555545806884766, "global_step": 106009, "epoch": 876} {"train_loss": -39.85825729370117, "global_step": 106010, "epoch": 876} {"train_loss": -39.1214714050293, "global_step": 106011, "epoch": 876} {"train_loss": -39.228485107421875, "global_step": 106012, "epoch": 876} {"train_loss": -38.286556243896484, "global_step": 106013, "epoch": 876} {"train_loss": -36.65620040893555, "global_step": 106014, "epoch": 876} {"train_loss": -35.01326370239258, "global_step": 106015, "epoch": 876} {"train_loss": -36.95875930786133, "global_step": 106016, "epoch": 876} {"train_loss": -37.27544021606445, "global_step": 106017, "epoch": 876} {"train_loss": -36.223175048828125, "global_step": 106018, "epoch": 876} {"train_loss": -36.8026123046875, "global_step": 106019, "epoch": 876} {"train_loss": -35.76887130737305, "global_step": 106020, "epoch": 876} {"train_loss": -34.50263595581055, "global_step": 106021, "epoch": 876} {"train_loss": -33.64617919921875, "global_step": 106022, "epoch": 876} {"train_loss": -39.106048583984375, "global_step": 106023, "epoch": 876} {"train_loss": -34.692169189453125, "global_step": 106024, "epoch": 876} {"train_loss": -33.36137008666992, "global_step": 106025, "epoch": 876} {"train_loss": -33.47564697265625, "global_step": 106026, "epoch": 876} {"train_loss": -35.716976165771484, "global_step": 106027, "epoch": 876} {"train_loss": -32.19447708129883, "global_step": 106028, "epoch": 876} {"train_loss": -36.13676071166992, "global_step": 106029, "epoch": 876} {"train_loss": -29.834585189819336, "global_step": 106030, "epoch": 876} {"train_loss": -36.47624206542969, "global_step": 106031, "epoch": 876} {"train_loss": -33.6401252746582, "global_step": 106032, "epoch": 876} {"train_loss": -33.46444320678711, "global_step": 106033, "epoch": 876} {"train_loss": -35.73542404174805, "global_step": 106034, "epoch": 876} {"train_loss": -30.68306541442871, "global_step": 106035, "epoch": 876} {"train_loss": -35.365814208984375, "global_step": 106036, "epoch": 876} {"train_loss": -35.78003692626953, "global_step": 106037, "epoch": 876} {"train_loss": -37.84725570678711, "global_step": 106038, "epoch": 876} {"train_loss": -36.51698303222656, "global_step": 106039, "epoch": 876} {"train_loss": -37.33130645751953, "global_step": 106040, "epoch": 876} {"train_loss": -36.95038986206055, "global_step": 106041, "epoch": 876} {"train_loss": -37.837764739990234, "global_step": 106042, "epoch": 876} {"train_loss": -37.117095947265625, "global_step": 106043, "epoch": 876} {"train_loss": -38.62127685546875, "global_step": 106044, "epoch": 876} {"train_loss": -36.5767936706543, "global_step": 106045, "epoch": 876} {"train_loss": -38.27309036254883, "global_step": 106046, "epoch": 876} {"train_loss": -37.34334945678711, "global_step": 106047, "epoch": 876} {"train_loss": -38.65199661254883, "global_step": 106048, "epoch": 876} {"train_loss": -37.39765548706055, "global_step": 106049, "epoch": 876} {"train_loss": -38.63584518432617, "global_step": 106050, "epoch": 876} {"train_loss": -38.18962478637695, "global_step": 106051, "epoch": 876} {"train_loss": -37.8953742980957, "global_step": 106052, "epoch": 876} {"train_loss": -38.44651794433594, "global_step": 106053, "epoch": 876} {"train_loss": -38.20293045043945, "global_step": 106054, "epoch": 876} {"train_loss": -38.981536865234375, "global_step": 106055, "epoch": 876} {"train_loss": -38.83333969116211, "global_step": 106056, "epoch": 876} {"train_loss": -38.624603271484375, "global_step": 106057, "epoch": 876} {"train_loss": -38.498870849609375, "global_step": 106058, "epoch": 876} {"train_loss": -38.1475715637207, "global_step": 106059, "epoch": 876} {"train_loss": -38.92123031616211, "global_step": 106060, "epoch": 876} {"train_loss": -38.846492767333984, "global_step": 106061, "epoch": 876} {"train_loss": -38.65910339355469, "global_step": 106062, "epoch": 876} {"train_loss": -38.53438186645508, "global_step": 106063, "epoch": 876} {"train_loss": -39.10719299316406, "global_step": 106064, "epoch": 876} {"train_loss": -39.2497673034668, "global_step": 106065, "epoch": 876} {"train_loss": -39.24486541748047, "global_step": 106066, "epoch": 876} {"train_loss": -38.75621032714844, "global_step": 106067, "epoch": 876} {"train_loss": -39.1012077331543, "global_step": 106068, "epoch": 876} {"train_loss": -39.07861328125, "global_step": 106069, "epoch": 876} {"train_loss": -39.4031982421875, "global_step": 106070, "epoch": 876} {"train_loss": -38.66756820678711, "global_step": 106071, "epoch": 876} {"train_loss": -38.89546203613281, "global_step": 106072, "epoch": 876} {"train_loss": -39.218421936035156, "global_step": 106073, "epoch": 876} {"train_loss": -38.400020599365234, "global_step": 106074, "epoch": 876} {"train_loss": -38.62151336669922, "global_step": 106075, "epoch": 876} {"train_loss": -38.498104095458984, "global_step": 106076, "epoch": 876} {"train_loss": -39.453548431396484, "global_step": 106077, "epoch": 876} {"train_loss": -39.43962478637695, "global_step": 106078, "epoch": 876} {"train_loss": -38.80012130737305, "global_step": 106079, "epoch": 876} {"train_loss": -37.71177291870117, "global_step": 106080, "epoch": 876} {"train_loss": -38.61372756958008, "global_step": 106081, "epoch": 876} {"train_loss": -39.2265739440918, "global_step": 106082, "epoch": 876} {"train_loss": -38.6322135925293, "global_step": 106083, "epoch": 876} {"train_loss": -38.51506423950195, "global_step": 106084, "epoch": 876} {"train_loss": -39.0672607421875, "global_step": 106085, "epoch": 876} {"train_loss": -38.97428512573242, "global_step": 106086, "epoch": 876} {"train_loss": -38.57942581176758, "global_step": 106087, "epoch": 876} {"train_loss": -39.327056884765625, "global_step": 106088, "epoch": 876} {"train_loss": -38.7583122253418, "global_step": 106089, "epoch": 876} {"train_loss": -38.85205841064453, "global_step": 106090, "epoch": 876} {"train_loss": -39.630855560302734, "global_step": 106091, "epoch": 876} {"train_loss": -39.225460052490234, "global_step": 106092, "epoch": 876} {"train_loss": -38.605003356933594, "global_step": 106093, "epoch": 876} {"train_loss": -38.1971549987793, "global_step": 106094, "epoch": 876} {"train_loss": -38.58544921875, "global_step": 106095, "epoch": 876} {"train_loss": -38.7738037109375, "global_step": 106096, "epoch": 876} {"train_loss": -38.052215576171875, "global_step": 106097, "epoch": 876} {"train_loss": -38.8782958984375, "global_step": 106098, "epoch": 876} {"train_loss": -39.518123626708984, "global_step": 106099, "epoch": 876} {"train_loss": -38.291316986083984, "global_step": 106100, "epoch": 876} {"train_loss": -39.13203811645508, "global_step": 106101, "epoch": 876} {"train_loss": -39.271358489990234, "global_step": 106102, "epoch": 876} {"train_loss": -39.30943298339844, "global_step": 106103, "epoch": 876} {"train_loss": -39.8764762878418, "global_step": 106104, "epoch": 876} {"train_loss": -39.03300476074219, "global_step": 106105, "epoch": 876} {"train_loss": -38.25691604614258, "global_step": 106106, "epoch": 876} {"train_loss": -39.38744354248047, "global_step": 106107, "epoch": 876} {"train_loss": -38.88298416137695, "global_step": 106108, "epoch": 876} {"train_loss": -39.74943161010742, "global_step": 106109, "epoch": 876} {"train_loss": -39.45659255981445, "global_step": 106110, "epoch": 876} {"train_loss": -39.21686935424805, "global_step": 106111, "epoch": 876} {"train_loss": -39.43561935424805, "global_step": 106112, "epoch": 876} {"train_loss": -38.925750732421875, "global_step": 106113, "epoch": 876} {"train_loss": -38.82145309448242, "global_step": 106114, "epoch": 876} {"train_loss": -39.22917556762695, "global_step": 106115, "epoch": 876} {"train_loss": -38.01166833924853, "global_step": 106116, "epoch": 876, "val_loss": 2612455.0} {"train_loss": -40.139766693115234, "global_step": 106117, "epoch": 877} {"train_loss": -39.497093200683594, "global_step": 106118, "epoch": 877} {"train_loss": -39.66483688354492, "global_step": 106119, "epoch": 877} {"train_loss": -39.35325241088867, "global_step": 106120, "epoch": 877} {"train_loss": -38.632347106933594, "global_step": 106121, "epoch": 877} {"train_loss": -37.9385986328125, "global_step": 106122, "epoch": 877} {"train_loss": -38.57727813720703, "global_step": 106123, "epoch": 877} {"train_loss": -37.40039825439453, "global_step": 106124, "epoch": 877} {"train_loss": -38.24186325073242, "global_step": 106125, "epoch": 877} {"train_loss": -39.76057434082031, "global_step": 106126, "epoch": 877} {"train_loss": -38.65037155151367, "global_step": 106127, "epoch": 877} {"train_loss": -37.90459442138672, "global_step": 106128, "epoch": 877} {"train_loss": -38.2336540222168, "global_step": 106129, "epoch": 877} {"train_loss": -38.649715423583984, "global_step": 106130, "epoch": 877} {"train_loss": -37.89658737182617, "global_step": 106131, "epoch": 877} {"train_loss": -37.18601608276367, "global_step": 106132, "epoch": 877} {"train_loss": -38.06270217895508, "global_step": 106133, "epoch": 877} {"train_loss": -37.7158088684082, "global_step": 106134, "epoch": 877} {"train_loss": -34.82719802856445, "global_step": 106135, "epoch": 877} {"train_loss": -33.521907806396484, "global_step": 106136, "epoch": 877} {"train_loss": -34.35931396484375, "global_step": 106137, "epoch": 877} {"train_loss": -35.210243225097656, "global_step": 106138, "epoch": 877} {"train_loss": -37.06507110595703, "global_step": 106139, "epoch": 877} {"train_loss": -37.3630485534668, "global_step": 106140, "epoch": 877} {"train_loss": -36.99154281616211, "global_step": 106141, "epoch": 877} {"train_loss": -37.749996185302734, "global_step": 106142, "epoch": 877} {"train_loss": -37.05506134033203, "global_step": 106143, "epoch": 877} {"train_loss": -38.17261505126953, "global_step": 106144, "epoch": 877} {"train_loss": -35.763099670410156, "global_step": 106145, "epoch": 877} {"train_loss": -38.158443450927734, "global_step": 106146, "epoch": 877} {"train_loss": -36.25065231323242, "global_step": 106147, "epoch": 877} {"train_loss": -37.94816207885742, "global_step": 106148, "epoch": 877} {"train_loss": -37.24972915649414, "global_step": 106149, "epoch": 877} {"train_loss": -38.27058029174805, "global_step": 106150, "epoch": 877} {"train_loss": -36.71738815307617, "global_step": 106151, "epoch": 877} {"train_loss": -37.59071731567383, "global_step": 106152, "epoch": 877} {"train_loss": -37.97317123413086, "global_step": 106153, "epoch": 877} {"train_loss": -36.33266067504883, "global_step": 106154, "epoch": 877} {"train_loss": -37.09060287475586, "global_step": 106155, "epoch": 877} {"train_loss": -37.65491485595703, "global_step": 106156, "epoch": 877} {"train_loss": -37.11724090576172, "global_step": 106157, "epoch": 877} {"train_loss": -37.866573333740234, "global_step": 106158, "epoch": 877} {"train_loss": -38.15743637084961, "global_step": 106159, "epoch": 877} {"train_loss": -38.4121208190918, "global_step": 106160, "epoch": 877} {"train_loss": -38.64142608642578, "global_step": 106161, "epoch": 877} {"train_loss": -38.892372131347656, "global_step": 106162, "epoch": 877} {"train_loss": -38.42109680175781, "global_step": 106163, "epoch": 877} {"train_loss": -38.99758529663086, "global_step": 106164, "epoch": 877} {"train_loss": -39.4688835144043, "global_step": 106165, "epoch": 877} {"train_loss": -38.752037048339844, "global_step": 106166, "epoch": 877} {"train_loss": -39.16561508178711, "global_step": 106167, "epoch": 877} {"train_loss": -39.024654388427734, "global_step": 106168, "epoch": 877} {"train_loss": -39.12837219238281, "global_step": 106169, "epoch": 877} {"train_loss": -38.21780014038086, "global_step": 106170, "epoch": 877} {"train_loss": -39.26994705200195, "global_step": 106171, "epoch": 877} {"train_loss": -39.374019622802734, "global_step": 106172, "epoch": 877} {"train_loss": -39.058372497558594, "global_step": 106173, "epoch": 877} {"train_loss": -39.092647552490234, "global_step": 106174, "epoch": 877} {"train_loss": -39.431549072265625, "global_step": 106175, "epoch": 877} {"train_loss": -39.4855842590332, "global_step": 106176, "epoch": 877} {"train_loss": -39.537452697753906, "global_step": 106177, "epoch": 877} {"train_loss": -39.451812744140625, "global_step": 106178, "epoch": 877} {"train_loss": -39.97079086303711, "global_step": 106179, "epoch": 877} {"train_loss": -39.23385238647461, "global_step": 106180, "epoch": 877} {"train_loss": -39.27888107299805, "global_step": 106181, "epoch": 877} {"train_loss": -39.635257720947266, "global_step": 106182, "epoch": 877} {"train_loss": -39.517616271972656, "global_step": 106183, "epoch": 877} {"train_loss": -39.3639030456543, "global_step": 106184, "epoch": 877} {"train_loss": -39.756919860839844, "global_step": 106185, "epoch": 877} {"train_loss": -39.705928802490234, "global_step": 106186, "epoch": 877} {"train_loss": -40.17680358886719, "global_step": 106187, "epoch": 877} {"train_loss": -39.24843978881836, "global_step": 106188, "epoch": 877} {"train_loss": -39.804012298583984, "global_step": 106189, "epoch": 877} {"train_loss": -39.817657470703125, "global_step": 106190, "epoch": 877} {"train_loss": -39.72246170043945, "global_step": 106191, "epoch": 877} {"train_loss": -38.720211029052734, "global_step": 106192, "epoch": 877} {"train_loss": -39.55758285522461, "global_step": 106193, "epoch": 877} {"train_loss": -39.28622817993164, "global_step": 106194, "epoch": 877} {"train_loss": -39.74284744262695, "global_step": 106195, "epoch": 877} {"train_loss": -39.16396713256836, "global_step": 106196, "epoch": 877} {"train_loss": -39.5851936340332, "global_step": 106197, "epoch": 877} {"train_loss": -39.86297607421875, "global_step": 106198, "epoch": 877} {"train_loss": -39.786781311035156, "global_step": 106199, "epoch": 877} {"train_loss": -40.017024993896484, "global_step": 106200, "epoch": 877} {"train_loss": -39.20485305786133, "global_step": 106201, "epoch": 877} {"train_loss": -39.083126068115234, "global_step": 106202, "epoch": 877} {"train_loss": -39.67380142211914, "global_step": 106203, "epoch": 877} {"train_loss": -40.050567626953125, "global_step": 106204, "epoch": 877} {"train_loss": -39.378597259521484, "global_step": 106205, "epoch": 877} {"train_loss": -38.473060607910156, "global_step": 106206, "epoch": 877} {"train_loss": -39.80402374267578, "global_step": 106207, "epoch": 877} {"train_loss": -39.895294189453125, "global_step": 106208, "epoch": 877} {"train_loss": -39.38125228881836, "global_step": 106209, "epoch": 877} {"train_loss": -37.55495834350586, "global_step": 106210, "epoch": 877} {"train_loss": -35.82141876220703, "global_step": 106211, "epoch": 877} {"train_loss": -37.39664077758789, "global_step": 106212, "epoch": 877} {"train_loss": -38.06984329223633, "global_step": 106213, "epoch": 877} {"train_loss": -37.229400634765625, "global_step": 106214, "epoch": 877} {"train_loss": -34.71707534790039, "global_step": 106215, "epoch": 877} {"train_loss": -30.061634063720703, "global_step": 106216, "epoch": 877} {"train_loss": -37.83771514892578, "global_step": 106217, "epoch": 877} {"train_loss": -38.36973571777344, "global_step": 106218, "epoch": 877} {"train_loss": -36.19173049926758, "global_step": 106219, "epoch": 877} {"train_loss": -31.731969833374023, "global_step": 106220, "epoch": 877} {"train_loss": -37.42350769042969, "global_step": 106221, "epoch": 877} {"train_loss": -33.648738861083984, "global_step": 106222, "epoch": 877} {"train_loss": -27.918195724487305, "global_step": 106223, "epoch": 877} {"train_loss": -36.806217193603516, "global_step": 106224, "epoch": 877} {"train_loss": -34.00981521606445, "global_step": 106225, "epoch": 877} {"train_loss": -36.091468811035156, "global_step": 106226, "epoch": 877} {"train_loss": -35.22766876220703, "global_step": 106227, "epoch": 877} {"train_loss": -36.69617462158203, "global_step": 106228, "epoch": 877} {"train_loss": -36.748870849609375, "global_step": 106229, "epoch": 877} {"train_loss": -35.37443161010742, "global_step": 106230, "epoch": 877} {"train_loss": -38.31912612915039, "global_step": 106231, "epoch": 877} {"train_loss": -36.8269157409668, "global_step": 106232, "epoch": 877} {"train_loss": -37.389095306396484, "global_step": 106233, "epoch": 877} {"train_loss": -38.125404357910156, "global_step": 106234, "epoch": 877} {"train_loss": -37.166114807128906, "global_step": 106235, "epoch": 877} {"train_loss": -38.13236999511719, "global_step": 106236, "epoch": 877} {"train_loss": -37.95419279997014, "global_step": 106237, "epoch": 877, "val_loss": 2618513.0} {"train_loss": -38.52587890625, "global_step": 106238, "epoch": 878} {"train_loss": -38.28227233886719, "global_step": 106239, "epoch": 878} {"train_loss": -38.53273391723633, "global_step": 106240, "epoch": 878} {"train_loss": -38.75178146362305, "global_step": 106241, "epoch": 878} {"train_loss": -38.77285385131836, "global_step": 106242, "epoch": 878} {"train_loss": -38.44283676147461, "global_step": 106243, "epoch": 878} {"train_loss": -39.045982360839844, "global_step": 106244, "epoch": 878} {"train_loss": -38.73465347290039, "global_step": 106245, "epoch": 878} {"train_loss": -39.042110443115234, "global_step": 106246, "epoch": 878} {"train_loss": -39.27715301513672, "global_step": 106247, "epoch": 878} {"train_loss": -39.008148193359375, "global_step": 106248, "epoch": 878} {"train_loss": -39.474979400634766, "global_step": 106249, "epoch": 878} {"train_loss": -39.210323333740234, "global_step": 106250, "epoch": 878} {"train_loss": -38.954776763916016, "global_step": 106251, "epoch": 878} {"train_loss": -39.33233642578125, "global_step": 106252, "epoch": 878} {"train_loss": -38.990478515625, "global_step": 106253, "epoch": 878} {"train_loss": -39.53266525268555, "global_step": 106254, "epoch": 878} {"train_loss": -39.53623580932617, "global_step": 106255, "epoch": 878} {"train_loss": -39.16147994995117, "global_step": 106256, "epoch": 878} {"train_loss": -39.382484436035156, "global_step": 106257, "epoch": 878} {"train_loss": -39.53316116333008, "global_step": 106258, "epoch": 878} {"train_loss": -39.61336135864258, "global_step": 106259, "epoch": 878} {"train_loss": -39.48189163208008, "global_step": 106260, "epoch": 878} {"train_loss": -39.80440902709961, "global_step": 106261, "epoch": 878} {"train_loss": -39.8165397644043, "global_step": 106262, "epoch": 878} {"train_loss": -39.514522552490234, "global_step": 106263, "epoch": 878} {"train_loss": -39.50823974609375, "global_step": 106264, "epoch": 878} {"train_loss": -39.4649772644043, "global_step": 106265, "epoch": 878} {"train_loss": -40.009849548339844, "global_step": 106266, "epoch": 878} {"train_loss": -39.68248748779297, "global_step": 106267, "epoch": 878} {"train_loss": -39.99320602416992, "global_step": 106268, "epoch": 878} {"train_loss": -39.64906692504883, "global_step": 106269, "epoch": 878} {"train_loss": -39.69594192504883, "global_step": 106270, "epoch": 878} {"train_loss": -39.55121612548828, "global_step": 106271, "epoch": 878} {"train_loss": -39.4072380065918, "global_step": 106272, "epoch": 878} {"train_loss": -39.753326416015625, "global_step": 106273, "epoch": 878} {"train_loss": -39.16598892211914, "global_step": 106274, "epoch": 878} {"train_loss": -38.452842712402344, "global_step": 106275, "epoch": 878} {"train_loss": -38.45414352416992, "global_step": 106276, "epoch": 878} {"train_loss": -39.193363189697266, "global_step": 106277, "epoch": 878} {"train_loss": -39.5242805480957, "global_step": 106278, "epoch": 878} {"train_loss": -39.72774124145508, "global_step": 106279, "epoch": 878} {"train_loss": -40.0887336730957, "global_step": 106280, "epoch": 878} {"train_loss": -40.23824691772461, "global_step": 106281, "epoch": 878} {"train_loss": -39.958858489990234, "global_step": 106282, "epoch": 878} {"train_loss": -39.569210052490234, "global_step": 106283, "epoch": 878} {"train_loss": -39.772586822509766, "global_step": 106284, "epoch": 878} {"train_loss": -40.18002700805664, "global_step": 106285, "epoch": 878} {"train_loss": -40.04505157470703, "global_step": 106286, "epoch": 878} {"train_loss": -39.75257110595703, "global_step": 106287, "epoch": 878} {"train_loss": -39.94114303588867, "global_step": 106288, "epoch": 878} {"train_loss": -39.75461959838867, "global_step": 106289, "epoch": 878} {"train_loss": -39.85997772216797, "global_step": 106290, "epoch": 878} {"train_loss": -39.61445236206055, "global_step": 106291, "epoch": 878} {"train_loss": -40.13200378417969, "global_step": 106292, "epoch": 878} {"train_loss": -39.962730407714844, "global_step": 106293, "epoch": 878} {"train_loss": -38.98688888549805, "global_step": 106294, "epoch": 878} {"train_loss": -40.252723693847656, "global_step": 106295, "epoch": 878} {"train_loss": -39.95821762084961, "global_step": 106296, "epoch": 878} {"train_loss": -39.6589469909668, "global_step": 106297, "epoch": 878} {"train_loss": -39.9950065612793, "global_step": 106298, "epoch": 878} {"train_loss": -40.01032257080078, "global_step": 106299, "epoch": 878} {"train_loss": -39.694114685058594, "global_step": 106300, "epoch": 878} {"train_loss": -39.44512939453125, "global_step": 106301, "epoch": 878} {"train_loss": -39.43122100830078, "global_step": 106302, "epoch": 878} {"train_loss": -39.82481002807617, "global_step": 106303, "epoch": 878} {"train_loss": -38.92669677734375, "global_step": 106304, "epoch": 878} {"train_loss": -39.471187591552734, "global_step": 106305, "epoch": 878} {"train_loss": -39.05141830444336, "global_step": 106306, "epoch": 878} {"train_loss": -37.54413604736328, "global_step": 106307, "epoch": 878} {"train_loss": -31.3065185546875, "global_step": 106308, "epoch": 878} {"train_loss": -39.47379684448242, "global_step": 106309, "epoch": 878} {"train_loss": -32.24083709716797, "global_step": 106310, "epoch": 878} {"train_loss": -38.252159118652344, "global_step": 106311, "epoch": 878} {"train_loss": -32.45049285888672, "global_step": 106312, "epoch": 878} {"train_loss": -34.5165901184082, "global_step": 106313, "epoch": 878} {"train_loss": -36.61627197265625, "global_step": 106314, "epoch": 878} {"train_loss": -34.868316650390625, "global_step": 106315, "epoch": 878} {"train_loss": -38.646976470947266, "global_step": 106316, "epoch": 878} {"train_loss": -34.43148422241211, "global_step": 106317, "epoch": 878} {"train_loss": -36.93974304199219, "global_step": 106318, "epoch": 878} {"train_loss": -36.13956069946289, "global_step": 106319, "epoch": 878} {"train_loss": -37.49329376220703, "global_step": 106320, "epoch": 878} {"train_loss": -37.26931381225586, "global_step": 106321, "epoch": 878} {"train_loss": -37.99105453491211, "global_step": 106322, "epoch": 878} {"train_loss": -37.744476318359375, "global_step": 106323, "epoch": 878} {"train_loss": -37.81031036376953, "global_step": 106324, "epoch": 878} {"train_loss": -38.006656646728516, "global_step": 106325, "epoch": 878} {"train_loss": -37.430809020996094, "global_step": 106326, "epoch": 878} {"train_loss": -38.375118255615234, "global_step": 106327, "epoch": 878} {"train_loss": -38.171688079833984, "global_step": 106328, "epoch": 878} {"train_loss": -38.65345001220703, "global_step": 106329, "epoch": 878} {"train_loss": -37.37273025512695, "global_step": 106330, "epoch": 878} {"train_loss": -38.92954635620117, "global_step": 106331, "epoch": 878} {"train_loss": -38.02604675292969, "global_step": 106332, "epoch": 878} {"train_loss": -37.9510612487793, "global_step": 106333, "epoch": 878} {"train_loss": -38.744869232177734, "global_step": 106334, "epoch": 878} {"train_loss": -38.17744064331055, "global_step": 106335, "epoch": 878} {"train_loss": -37.162879943847656, "global_step": 106336, "epoch": 878} {"train_loss": -38.452430725097656, "global_step": 106337, "epoch": 878} {"train_loss": -37.17506790161133, "global_step": 106338, "epoch": 878} {"train_loss": -37.7216682434082, "global_step": 106339, "epoch": 878} {"train_loss": -38.28752517700195, "global_step": 106340, "epoch": 878} {"train_loss": -38.18641662597656, "global_step": 106341, "epoch": 878} {"train_loss": -37.7271614074707, "global_step": 106342, "epoch": 878} {"train_loss": -39.11440658569336, "global_step": 106343, "epoch": 878} {"train_loss": -38.569969177246094, "global_step": 106344, "epoch": 878} {"train_loss": -39.06987380981445, "global_step": 106345, "epoch": 878} {"train_loss": -38.04951095581055, "global_step": 106346, "epoch": 878} {"train_loss": -39.109493255615234, "global_step": 106347, "epoch": 878} {"train_loss": -39.34566879272461, "global_step": 106348, "epoch": 878} {"train_loss": -38.7628059387207, "global_step": 106349, "epoch": 878} {"train_loss": -39.005043029785156, "global_step": 106350, "epoch": 878} {"train_loss": -39.676116943359375, "global_step": 106351, "epoch": 878} {"train_loss": -38.61053466796875, "global_step": 106352, "epoch": 878} {"train_loss": -39.208553314208984, "global_step": 106353, "epoch": 878} {"train_loss": -38.421627044677734, "global_step": 106354, "epoch": 878} {"train_loss": -38.2244873046875, "global_step": 106355, "epoch": 878} {"train_loss": -38.55927658081055, "global_step": 106356, "epoch": 878} {"train_loss": -38.9420280456543, "global_step": 106357, "epoch": 878} {"train_loss": -38.674841951732795, "global_step": 106358, "epoch": 878, "val_loss": 2598143.0} {"train_loss": -38.395355224609375, "global_step": 106359, "epoch": 879} {"train_loss": -37.98165512084961, "global_step": 106360, "epoch": 879} {"train_loss": -39.213783264160156, "global_step": 106361, "epoch": 879} {"train_loss": -37.92940902709961, "global_step": 106362, "epoch": 879} {"train_loss": -37.639495849609375, "global_step": 106363, "epoch": 879} {"train_loss": -38.589534759521484, "global_step": 106364, "epoch": 879} {"train_loss": -37.26457214355469, "global_step": 106365, "epoch": 879} {"train_loss": -38.41164016723633, "global_step": 106366, "epoch": 879} {"train_loss": -38.17364501953125, "global_step": 106367, "epoch": 879} {"train_loss": -38.79570770263672, "global_step": 106368, "epoch": 879} {"train_loss": -37.816341400146484, "global_step": 106369, "epoch": 879} {"train_loss": -39.334651947021484, "global_step": 106370, "epoch": 879} {"train_loss": -38.93296432495117, "global_step": 106371, "epoch": 879} {"train_loss": -38.93165969848633, "global_step": 106372, "epoch": 879} {"train_loss": -39.803627014160156, "global_step": 106373, "epoch": 879} {"train_loss": -38.90718460083008, "global_step": 106374, "epoch": 879} {"train_loss": -38.70390701293945, "global_step": 106375, "epoch": 879} {"train_loss": -39.68144607543945, "global_step": 106376, "epoch": 879} {"train_loss": -39.132240295410156, "global_step": 106377, "epoch": 879} {"train_loss": -39.269752502441406, "global_step": 106378, "epoch": 879} {"train_loss": -39.174591064453125, "global_step": 106379, "epoch": 879} {"train_loss": -39.54690170288086, "global_step": 106380, "epoch": 879} {"train_loss": -38.91484451293945, "global_step": 106381, "epoch": 879} {"train_loss": -40.009769439697266, "global_step": 106382, "epoch": 879} {"train_loss": -39.16598129272461, "global_step": 106383, "epoch": 879} {"train_loss": -38.86555862426758, "global_step": 106384, "epoch": 879} {"train_loss": -38.77640151977539, "global_step": 106385, "epoch": 879} {"train_loss": -40.010433197021484, "global_step": 106386, "epoch": 879} {"train_loss": -39.07749938964844, "global_step": 106387, "epoch": 879} {"train_loss": -39.930397033691406, "global_step": 106388, "epoch": 879} {"train_loss": -39.89487838745117, "global_step": 106389, "epoch": 879} {"train_loss": -40.0112419128418, "global_step": 106390, "epoch": 879} {"train_loss": -39.97674560546875, "global_step": 106391, "epoch": 879} {"train_loss": -39.69760513305664, "global_step": 106392, "epoch": 879} {"train_loss": -40.0128173828125, "global_step": 106393, "epoch": 879} {"train_loss": -39.216182708740234, "global_step": 106394, "epoch": 879} {"train_loss": -39.894920349121094, "global_step": 106395, "epoch": 879} {"train_loss": -40.00867462158203, "global_step": 106396, "epoch": 879} {"train_loss": -39.546104431152344, "global_step": 106397, "epoch": 879} {"train_loss": -38.893253326416016, "global_step": 106398, "epoch": 879} {"train_loss": -39.37843704223633, "global_step": 106399, "epoch": 879} {"train_loss": -39.82697296142578, "global_step": 106400, "epoch": 879} {"train_loss": -38.946556091308594, "global_step": 106401, "epoch": 879} {"train_loss": -38.322357177734375, "global_step": 106402, "epoch": 879} {"train_loss": -36.874263763427734, "global_step": 106403, "epoch": 879} {"train_loss": -33.33186340332031, "global_step": 106404, "epoch": 879} {"train_loss": -37.541744232177734, "global_step": 106405, "epoch": 879} {"train_loss": -30.56220054626465, "global_step": 106406, "epoch": 879} {"train_loss": -29.832061767578125, "global_step": 106407, "epoch": 879} {"train_loss": -31.362157821655273, "global_step": 106408, "epoch": 879} {"train_loss": -31.62872886657715, "global_step": 106409, "epoch": 879} {"train_loss": -31.216876983642578, "global_step": 106410, "epoch": 879} {"train_loss": -33.51449203491211, "global_step": 106411, "epoch": 879} {"train_loss": -31.751529693603516, "global_step": 106412, "epoch": 879} {"train_loss": -32.582210540771484, "global_step": 106413, "epoch": 879} {"train_loss": -32.43339920043945, "global_step": 106414, "epoch": 879} {"train_loss": -31.618000030517578, "global_step": 106415, "epoch": 879} {"train_loss": -29.321063995361328, "global_step": 106416, "epoch": 879} {"train_loss": -25.821813583374023, "global_step": 106417, "epoch": 879} {"train_loss": -33.25022506713867, "global_step": 106418, "epoch": 879} {"train_loss": -27.568090438842773, "global_step": 106419, "epoch": 879} {"train_loss": -33.074462890625, "global_step": 106420, "epoch": 879} {"train_loss": -28.897598266601562, "global_step": 106421, "epoch": 879} {"train_loss": -33.53727340698242, "global_step": 106422, "epoch": 879} {"train_loss": -31.129220962524414, "global_step": 106423, "epoch": 879} {"train_loss": -33.6427001953125, "global_step": 106424, "epoch": 879} {"train_loss": -33.47639083862305, "global_step": 106425, "epoch": 879} {"train_loss": -32.185302734375, "global_step": 106426, "epoch": 879} {"train_loss": -33.78173828125, "global_step": 106427, "epoch": 879} {"train_loss": -33.82382583618164, "global_step": 106428, "epoch": 879} {"train_loss": -32.72597885131836, "global_step": 106429, "epoch": 879} {"train_loss": -34.42137908935547, "global_step": 106430, "epoch": 879} {"train_loss": -34.2810173034668, "global_step": 106431, "epoch": 879} {"train_loss": -34.342926025390625, "global_step": 106432, "epoch": 879} {"train_loss": -35.54732894897461, "global_step": 106433, "epoch": 879} {"train_loss": -35.06562042236328, "global_step": 106434, "epoch": 879} {"train_loss": -34.86559295654297, "global_step": 106435, "epoch": 879} {"train_loss": -34.81085205078125, "global_step": 106436, "epoch": 879} {"train_loss": -35.652740478515625, "global_step": 106437, "epoch": 879} {"train_loss": -35.96004867553711, "global_step": 106438, "epoch": 879} {"train_loss": -35.539100646972656, "global_step": 106439, "epoch": 879} {"train_loss": -35.48497009277344, "global_step": 106440, "epoch": 879} {"train_loss": -35.02537155151367, "global_step": 106441, "epoch": 879} {"train_loss": -31.414936065673828, "global_step": 106442, "epoch": 879} {"train_loss": -24.722700119018555, "global_step": 106443, "epoch": 879} {"train_loss": -30.075510025024414, "global_step": 106444, "epoch": 879} {"train_loss": -34.820003509521484, "global_step": 106445, "epoch": 879} {"train_loss": -31.556564331054688, "global_step": 106446, "epoch": 879} {"train_loss": -34.804500579833984, "global_step": 106447, "epoch": 879} {"train_loss": -34.08280563354492, "global_step": 106448, "epoch": 879} {"train_loss": -35.5984992980957, "global_step": 106449, "epoch": 879} {"train_loss": -34.07691955566406, "global_step": 106450, "epoch": 879} {"train_loss": -34.534759521484375, "global_step": 106451, "epoch": 879} {"train_loss": -34.457271575927734, "global_step": 106452, "epoch": 879} {"train_loss": -33.48585891723633, "global_step": 106453, "epoch": 879} {"train_loss": -35.80534744262695, "global_step": 106454, "epoch": 879} {"train_loss": -34.70780563354492, "global_step": 106455, "epoch": 879} {"train_loss": -35.198787689208984, "global_step": 106456, "epoch": 879} {"train_loss": -34.49641799926758, "global_step": 106457, "epoch": 879} {"train_loss": -34.56935119628906, "global_step": 106458, "epoch": 879} {"train_loss": -35.66778564453125, "global_step": 106459, "epoch": 879} {"train_loss": -36.43306350708008, "global_step": 106460, "epoch": 879} {"train_loss": -35.44765090942383, "global_step": 106461, "epoch": 879} {"train_loss": -35.358455657958984, "global_step": 106462, "epoch": 879} {"train_loss": -36.32503128051758, "global_step": 106463, "epoch": 879} {"train_loss": -36.18304443359375, "global_step": 106464, "epoch": 879} {"train_loss": -36.71918869018555, "global_step": 106465, "epoch": 879} {"train_loss": -36.67427444458008, "global_step": 106466, "epoch": 879} {"train_loss": -36.0040397644043, "global_step": 106467, "epoch": 879} {"train_loss": -36.35024642944336, "global_step": 106468, "epoch": 879} {"train_loss": -36.5728645324707, "global_step": 106469, "epoch": 879} {"train_loss": -36.458656311035156, "global_step": 106470, "epoch": 879} {"train_loss": -37.38648223876953, "global_step": 106471, "epoch": 879} {"train_loss": -36.316619873046875, "global_step": 106472, "epoch": 879} {"train_loss": -36.84116744995117, "global_step": 106473, "epoch": 879} {"train_loss": -36.79770278930664, "global_step": 106474, "epoch": 879} {"train_loss": -36.61739730834961, "global_step": 106475, "epoch": 879} {"train_loss": -37.84205627441406, "global_step": 106476, "epoch": 879} {"train_loss": -36.71961975097656, "global_step": 106477, "epoch": 879} {"train_loss": -37.76902389526367, "global_step": 106478, "epoch": 879} {"train_loss": -35.896475705233485, "global_step": 106479, "epoch": 879, "val_loss": 2473878.25} {"train_loss": -37.58302307128906, "global_step": 106480, "epoch": 880} {"train_loss": -36.56255340576172, "global_step": 106481, "epoch": 880} {"train_loss": -36.91680908203125, "global_step": 106482, "epoch": 880} {"train_loss": -37.60376739501953, "global_step": 106483, "epoch": 880} {"train_loss": -36.719642639160156, "global_step": 106484, "epoch": 880} {"train_loss": -37.57644271850586, "global_step": 106485, "epoch": 880} {"train_loss": -37.74135971069336, "global_step": 106486, "epoch": 880} {"train_loss": -37.224857330322266, "global_step": 106487, "epoch": 880} {"train_loss": -37.63488006591797, "global_step": 106488, "epoch": 880} {"train_loss": -37.931884765625, "global_step": 106489, "epoch": 880} {"train_loss": -37.06855392456055, "global_step": 106490, "epoch": 880} {"train_loss": -35.951698303222656, "global_step": 106491, "epoch": 880} {"train_loss": -34.86556625366211, "global_step": 106492, "epoch": 880} {"train_loss": -34.96023178100586, "global_step": 106493, "epoch": 880} {"train_loss": -35.9957160949707, "global_step": 106494, "epoch": 880} {"train_loss": -37.53425979614258, "global_step": 106495, "epoch": 880} {"train_loss": -36.297603607177734, "global_step": 106496, "epoch": 880} {"train_loss": -36.358036041259766, "global_step": 106497, "epoch": 880} {"train_loss": -37.29751205444336, "global_step": 106498, "epoch": 880} {"train_loss": -35.431182861328125, "global_step": 106499, "epoch": 880} {"train_loss": -36.450191497802734, "global_step": 106500, "epoch": 880} {"train_loss": -36.01839065551758, "global_step": 106501, "epoch": 880} {"train_loss": -36.09722900390625, "global_step": 106502, "epoch": 880} {"train_loss": -35.972164154052734, "global_step": 106503, "epoch": 880} {"train_loss": -35.940643310546875, "global_step": 106504, "epoch": 880} {"train_loss": -35.339595794677734, "global_step": 106505, "epoch": 880} {"train_loss": -37.26902389526367, "global_step": 106506, "epoch": 880} {"train_loss": -36.99705123901367, "global_step": 106507, "epoch": 880} {"train_loss": -37.76991653442383, "global_step": 106508, "epoch": 880} {"train_loss": -36.653228759765625, "global_step": 106509, "epoch": 880} {"train_loss": -36.173973083496094, "global_step": 106510, "epoch": 880} {"train_loss": -36.92092514038086, "global_step": 106511, "epoch": 880} {"train_loss": -36.85980987548828, "global_step": 106512, "epoch": 880} {"train_loss": -37.5749626159668, "global_step": 106513, "epoch": 880} {"train_loss": -37.4323844909668, "global_step": 106514, "epoch": 880} {"train_loss": -37.475215911865234, "global_step": 106515, "epoch": 880} {"train_loss": -36.565673828125, "global_step": 106516, "epoch": 880} {"train_loss": -37.00236892700195, "global_step": 106517, "epoch": 880} {"train_loss": -36.054107666015625, "global_step": 106518, "epoch": 880} {"train_loss": -36.14533615112305, "global_step": 106519, "epoch": 880} {"train_loss": -37.348121643066406, "global_step": 106520, "epoch": 880} {"train_loss": -37.01399612426758, "global_step": 106521, "epoch": 880} {"train_loss": -36.22317886352539, "global_step": 106522, "epoch": 880} {"train_loss": -37.138580322265625, "global_step": 106523, "epoch": 880} {"train_loss": -37.78243637084961, "global_step": 106524, "epoch": 880} {"train_loss": -36.25115966796875, "global_step": 106525, "epoch": 880} {"train_loss": -37.645565032958984, "global_step": 106526, "epoch": 880} {"train_loss": -37.72745895385742, "global_step": 106527, "epoch": 880} {"train_loss": -36.9888916015625, "global_step": 106528, "epoch": 880} {"train_loss": -38.276336669921875, "global_step": 106529, "epoch": 880} {"train_loss": -36.87832260131836, "global_step": 106530, "epoch": 880} {"train_loss": -37.81117630004883, "global_step": 106531, "epoch": 880} {"train_loss": -37.360450744628906, "global_step": 106532, "epoch": 880} {"train_loss": -36.53059005737305, "global_step": 106533, "epoch": 880} {"train_loss": -35.76771545410156, "global_step": 106534, "epoch": 880} {"train_loss": -36.15029525756836, "global_step": 106535, "epoch": 880} {"train_loss": -36.97782516479492, "global_step": 106536, "epoch": 880} {"train_loss": -37.354488372802734, "global_step": 106537, "epoch": 880} {"train_loss": -37.543617248535156, "global_step": 106538, "epoch": 880} {"train_loss": -36.56476593017578, "global_step": 106539, "epoch": 880} {"train_loss": -38.24127197265625, "global_step": 106540, "epoch": 880} {"train_loss": -37.70904541015625, "global_step": 106541, "epoch": 880} {"train_loss": -38.1507682800293, "global_step": 106542, "epoch": 880} {"train_loss": -37.47591781616211, "global_step": 106543, "epoch": 880} {"train_loss": -38.34668731689453, "global_step": 106544, "epoch": 880} {"train_loss": -37.8569450378418, "global_step": 106545, "epoch": 880} {"train_loss": -37.8701286315918, "global_step": 106546, "epoch": 880} {"train_loss": -38.560298919677734, "global_step": 106547, "epoch": 880} {"train_loss": -38.113460540771484, "global_step": 106548, "epoch": 880} {"train_loss": -38.193763732910156, "global_step": 106549, "epoch": 880} {"train_loss": -38.2453727722168, "global_step": 106550, "epoch": 880} {"train_loss": -38.4078254699707, "global_step": 106551, "epoch": 880} {"train_loss": -38.654781341552734, "global_step": 106552, "epoch": 880} {"train_loss": -38.51948547363281, "global_step": 106553, "epoch": 880} {"train_loss": -38.25626754760742, "global_step": 106554, "epoch": 880} {"train_loss": -38.85639572143555, "global_step": 106555, "epoch": 880} {"train_loss": -38.881507873535156, "global_step": 106556, "epoch": 880} {"train_loss": -38.395355224609375, "global_step": 106557, "epoch": 880} {"train_loss": -39.09037399291992, "global_step": 106558, "epoch": 880} {"train_loss": -38.67209243774414, "global_step": 106559, "epoch": 880} {"train_loss": -38.80999755859375, "global_step": 106560, "epoch": 880} {"train_loss": -38.64742660522461, "global_step": 106561, "epoch": 880} {"train_loss": -38.47197723388672, "global_step": 106562, "epoch": 880} {"train_loss": -38.549774169921875, "global_step": 106563, "epoch": 880} {"train_loss": -39.16781234741211, "global_step": 106564, "epoch": 880} {"train_loss": -38.69812774658203, "global_step": 106565, "epoch": 880} {"train_loss": -39.19586181640625, "global_step": 106566, "epoch": 880} {"train_loss": -38.76088333129883, "global_step": 106567, "epoch": 880} {"train_loss": -38.758819580078125, "global_step": 106568, "epoch": 880} {"train_loss": -38.55601119995117, "global_step": 106569, "epoch": 880} {"train_loss": -39.228485107421875, "global_step": 106570, "epoch": 880} {"train_loss": -39.59968948364258, "global_step": 106571, "epoch": 880} {"train_loss": -39.05959701538086, "global_step": 106572, "epoch": 880} {"train_loss": -39.26754379272461, "global_step": 106573, "epoch": 880} {"train_loss": -39.10665512084961, "global_step": 106574, "epoch": 880} {"train_loss": -38.62491226196289, "global_step": 106575, "epoch": 880} {"train_loss": -37.0471305847168, "global_step": 106576, "epoch": 880} {"train_loss": -29.397205352783203, "global_step": 106577, "epoch": 880} {"train_loss": -14.518523216247559, "global_step": 106578, "epoch": 880} {"train_loss": -30.872507095336914, "global_step": 106579, "epoch": 880} {"train_loss": -29.4491024017334, "global_step": 106580, "epoch": 880} {"train_loss": -30.101715087890625, "global_step": 106581, "epoch": 880} {"train_loss": -26.48499870300293, "global_step": 106582, "epoch": 880} {"train_loss": -31.535612106323242, "global_step": 106583, "epoch": 880} {"train_loss": -33.43430709838867, "global_step": 106584, "epoch": 880} {"train_loss": -33.43818283081055, "global_step": 106585, "epoch": 880} {"train_loss": -34.657081604003906, "global_step": 106586, "epoch": 880} {"train_loss": -33.09143829345703, "global_step": 106587, "epoch": 880} {"train_loss": -36.17621612548828, "global_step": 106588, "epoch": 880} {"train_loss": -32.08952331542969, "global_step": 106589, "epoch": 880} {"train_loss": -37.39604949951172, "global_step": 106590, "epoch": 880} {"train_loss": -33.65769577026367, "global_step": 106591, "epoch": 880} {"train_loss": -36.3599967956543, "global_step": 106592, "epoch": 880} {"train_loss": -34.52071762084961, "global_step": 106593, "epoch": 880} {"train_loss": -38.39569854736328, "global_step": 106594, "epoch": 880} {"train_loss": -35.31447982788086, "global_step": 106595, "epoch": 880} {"train_loss": -36.08665084838867, "global_step": 106596, "epoch": 880} {"train_loss": -37.22915267944336, "global_step": 106597, "epoch": 880} {"train_loss": -36.16674041748047, "global_step": 106598, "epoch": 880} {"train_loss": -36.237979888916016, "global_step": 106599, "epoch": 880} {"train_loss": -36.59840001350592, "global_step": 106600, "epoch": 880, "val_loss": 2523772.75} {"train_loss": -37.07352828979492, "global_step": 106601, "epoch": 881} {"train_loss": -36.991554260253906, "global_step": 106602, "epoch": 881} {"train_loss": -36.6934928894043, "global_step": 106603, "epoch": 881} {"train_loss": -37.45697784423828, "global_step": 106604, "epoch": 881} {"train_loss": -37.88606262207031, "global_step": 106605, "epoch": 881} {"train_loss": -37.06209945678711, "global_step": 106606, "epoch": 881} {"train_loss": -37.295047760009766, "global_step": 106607, "epoch": 881} {"train_loss": -37.5322151184082, "global_step": 106608, "epoch": 881} {"train_loss": -37.51420974731445, "global_step": 106609, "epoch": 881} {"train_loss": -37.18848419189453, "global_step": 106610, "epoch": 881} {"train_loss": -37.378055572509766, "global_step": 106611, "epoch": 881} {"train_loss": -37.45701217651367, "global_step": 106612, "epoch": 881} {"train_loss": -38.02687072753906, "global_step": 106613, "epoch": 881} {"train_loss": -37.96521759033203, "global_step": 106614, "epoch": 881} {"train_loss": -36.707122802734375, "global_step": 106615, "epoch": 881} {"train_loss": -36.54825973510742, "global_step": 106616, "epoch": 881} {"train_loss": -35.95371627807617, "global_step": 106617, "epoch": 881} {"train_loss": -35.074729919433594, "global_step": 106618, "epoch": 881} {"train_loss": -37.04676055908203, "global_step": 106619, "epoch": 881} {"train_loss": -37.67763900756836, "global_step": 106620, "epoch": 881} {"train_loss": -36.186397552490234, "global_step": 106621, "epoch": 881} {"train_loss": -37.0097770690918, "global_step": 106622, "epoch": 881} {"train_loss": -37.9754753112793, "global_step": 106623, "epoch": 881} {"train_loss": -36.73972702026367, "global_step": 106624, "epoch": 881} {"train_loss": -36.347408294677734, "global_step": 106625, "epoch": 881} {"train_loss": -37.66508102416992, "global_step": 106626, "epoch": 881} {"train_loss": -37.214088439941406, "global_step": 106627, "epoch": 881} {"train_loss": -36.271148681640625, "global_step": 106628, "epoch": 881} {"train_loss": -38.22310256958008, "global_step": 106629, "epoch": 881} {"train_loss": -36.50678253173828, "global_step": 106630, "epoch": 881} {"train_loss": -37.508338928222656, "global_step": 106631, "epoch": 881} {"train_loss": -36.442848205566406, "global_step": 106632, "epoch": 881} {"train_loss": -37.86670684814453, "global_step": 106633, "epoch": 881} {"train_loss": -37.58393096923828, "global_step": 106634, "epoch": 881} {"train_loss": -38.04330062866211, "global_step": 106635, "epoch": 881} {"train_loss": -37.945186614990234, "global_step": 106636, "epoch": 881} {"train_loss": -37.72382354736328, "global_step": 106637, "epoch": 881} {"train_loss": -38.125640869140625, "global_step": 106638, "epoch": 881} {"train_loss": -38.070133209228516, "global_step": 106639, "epoch": 881} {"train_loss": -38.012508392333984, "global_step": 106640, "epoch": 881} {"train_loss": -38.07844161987305, "global_step": 106641, "epoch": 881} {"train_loss": -37.56780242919922, "global_step": 106642, "epoch": 881} {"train_loss": -36.98691940307617, "global_step": 106643, "epoch": 881} {"train_loss": -38.44419479370117, "global_step": 106644, "epoch": 881} {"train_loss": -37.38503646850586, "global_step": 106645, "epoch": 881} {"train_loss": -38.36975860595703, "global_step": 106646, "epoch": 881} {"train_loss": -37.746089935302734, "global_step": 106647, "epoch": 881} {"train_loss": -37.71685791015625, "global_step": 106648, "epoch": 881} {"train_loss": -38.498958587646484, "global_step": 106649, "epoch": 881} {"train_loss": -38.28772735595703, "global_step": 106650, "epoch": 881} {"train_loss": -38.49149703979492, "global_step": 106651, "epoch": 881} {"train_loss": -38.54655456542969, "global_step": 106652, "epoch": 881} {"train_loss": -37.66019821166992, "global_step": 106653, "epoch": 881} {"train_loss": -38.730098724365234, "global_step": 106654, "epoch": 881} {"train_loss": -38.206363677978516, "global_step": 106655, "epoch": 881} {"train_loss": -38.35748291015625, "global_step": 106656, "epoch": 881} {"train_loss": -38.7044677734375, "global_step": 106657, "epoch": 881} {"train_loss": -37.10214614868164, "global_step": 106658, "epoch": 881} {"train_loss": -37.40619659423828, "global_step": 106659, "epoch": 881} {"train_loss": -38.543025970458984, "global_step": 106660, "epoch": 881} {"train_loss": -37.930484771728516, "global_step": 106661, "epoch": 881} {"train_loss": -38.31642532348633, "global_step": 106662, "epoch": 881} {"train_loss": -38.186126708984375, "global_step": 106663, "epoch": 881} {"train_loss": -38.98999786376953, "global_step": 106664, "epoch": 881} {"train_loss": -38.303382873535156, "global_step": 106665, "epoch": 881} {"train_loss": -38.916969299316406, "global_step": 106666, "epoch": 881} {"train_loss": -38.80941390991211, "global_step": 106667, "epoch": 881} {"train_loss": -38.6712760925293, "global_step": 106668, "epoch": 881} {"train_loss": -38.53902816772461, "global_step": 106669, "epoch": 881} {"train_loss": -39.31804656982422, "global_step": 106670, "epoch": 881} {"train_loss": -38.966888427734375, "global_step": 106671, "epoch": 881} {"train_loss": -38.83568572998047, "global_step": 106672, "epoch": 881} {"train_loss": -38.835750579833984, "global_step": 106673, "epoch": 881} {"train_loss": -38.76240921020508, "global_step": 106674, "epoch": 881} {"train_loss": -38.9824104309082, "global_step": 106675, "epoch": 881} {"train_loss": -37.196449279785156, "global_step": 106676, "epoch": 881} {"train_loss": -39.42730712890625, "global_step": 106677, "epoch": 881} {"train_loss": -38.665462493896484, "global_step": 106678, "epoch": 881} {"train_loss": -38.82477569580078, "global_step": 106679, "epoch": 881} {"train_loss": -38.88714599609375, "global_step": 106680, "epoch": 881} {"train_loss": -37.44160842895508, "global_step": 106681, "epoch": 881} {"train_loss": -37.969207763671875, "global_step": 106682, "epoch": 881} {"train_loss": -38.447975158691406, "global_step": 106683, "epoch": 881} {"train_loss": -36.643795013427734, "global_step": 106684, "epoch": 881} {"train_loss": -37.70577621459961, "global_step": 106685, "epoch": 881} {"train_loss": -38.19517517089844, "global_step": 106686, "epoch": 881} {"train_loss": -36.64603805541992, "global_step": 106687, "epoch": 881} {"train_loss": -36.90675735473633, "global_step": 106688, "epoch": 881} {"train_loss": -38.71656036376953, "global_step": 106689, "epoch": 881} {"train_loss": -37.275691986083984, "global_step": 106690, "epoch": 881} {"train_loss": -36.473812103271484, "global_step": 106691, "epoch": 881} {"train_loss": -35.78322219848633, "global_step": 106692, "epoch": 881} {"train_loss": -38.72390365600586, "global_step": 106693, "epoch": 881} {"train_loss": -37.0831184387207, "global_step": 106694, "epoch": 881} {"train_loss": -36.97895050048828, "global_step": 106695, "epoch": 881} {"train_loss": -38.19149398803711, "global_step": 106696, "epoch": 881} {"train_loss": -36.09641647338867, "global_step": 106697, "epoch": 881} {"train_loss": -35.46475601196289, "global_step": 106698, "epoch": 881} {"train_loss": -36.03092575073242, "global_step": 106699, "epoch": 881} {"train_loss": -34.76663589477539, "global_step": 106700, "epoch": 881} {"train_loss": -33.50514221191406, "global_step": 106701, "epoch": 881} {"train_loss": -34.8492546081543, "global_step": 106702, "epoch": 881} {"train_loss": -36.0875244140625, "global_step": 106703, "epoch": 881} {"train_loss": -36.95487594604492, "global_step": 106704, "epoch": 881} {"train_loss": -38.091793060302734, "global_step": 106705, "epoch": 881} {"train_loss": -36.82896041870117, "global_step": 106706, "epoch": 881} {"train_loss": -37.32049560546875, "global_step": 106707, "epoch": 881} {"train_loss": -33.6894416809082, "global_step": 106708, "epoch": 881} {"train_loss": -34.09366989135742, "global_step": 106709, "epoch": 881} {"train_loss": -35.67983627319336, "global_step": 106710, "epoch": 881} {"train_loss": -35.72269821166992, "global_step": 106711, "epoch": 881} {"train_loss": -35.65869903564453, "global_step": 106712, "epoch": 881} {"train_loss": -35.76225662231445, "global_step": 106713, "epoch": 881} {"train_loss": -35.73241424560547, "global_step": 106714, "epoch": 881} {"train_loss": -35.6895637512207, "global_step": 106715, "epoch": 881} {"train_loss": -36.351680755615234, "global_step": 106716, "epoch": 881} {"train_loss": -36.428348541259766, "global_step": 106717, "epoch": 881} {"train_loss": -32.064815521240234, "global_step": 106718, "epoch": 881} {"train_loss": -35.61323928833008, "global_step": 106719, "epoch": 881} {"train_loss": -33.76308059692383, "global_step": 106720, "epoch": 881} {"train_loss": -37.27627002306221, "global_step": 106721, "epoch": 881, "val_loss": 2601060.0} {"train_loss": -34.79176712036133, "global_step": 106722, "epoch": 882} {"train_loss": -34.389183044433594, "global_step": 106723, "epoch": 882} {"train_loss": -36.231483459472656, "global_step": 106724, "epoch": 882} {"train_loss": -37.10936737060547, "global_step": 106725, "epoch": 882} {"train_loss": -36.61837387084961, "global_step": 106726, "epoch": 882} {"train_loss": -36.445037841796875, "global_step": 106727, "epoch": 882} {"train_loss": -36.612388610839844, "global_step": 106728, "epoch": 882} {"train_loss": -36.74680709838867, "global_step": 106729, "epoch": 882} {"train_loss": -36.356689453125, "global_step": 106730, "epoch": 882} {"train_loss": -36.56650924682617, "global_step": 106731, "epoch": 882} {"train_loss": -36.4783935546875, "global_step": 106732, "epoch": 882} {"train_loss": -36.48442077636719, "global_step": 106733, "epoch": 882} {"train_loss": -36.85053634643555, "global_step": 106734, "epoch": 882} {"train_loss": -36.51142501831055, "global_step": 106735, "epoch": 882} {"train_loss": -36.168540954589844, "global_step": 106736, "epoch": 882} {"train_loss": -35.841732025146484, "global_step": 106737, "epoch": 882} {"train_loss": -37.60555648803711, "global_step": 106738, "epoch": 882} {"train_loss": -36.76995849609375, "global_step": 106739, "epoch": 882} {"train_loss": -35.21442794799805, "global_step": 106740, "epoch": 882} {"train_loss": -35.6878662109375, "global_step": 106741, "epoch": 882} {"train_loss": -37.246761322021484, "global_step": 106742, "epoch": 882} {"train_loss": -37.084503173828125, "global_step": 106743, "epoch": 882} {"train_loss": -37.346988677978516, "global_step": 106744, "epoch": 882} {"train_loss": -36.951171875, "global_step": 106745, "epoch": 882} {"train_loss": -37.51643753051758, "global_step": 106746, "epoch": 882} {"train_loss": -36.631492614746094, "global_step": 106747, "epoch": 882} {"train_loss": -36.907875061035156, "global_step": 106748, "epoch": 882} {"train_loss": -37.542640686035156, "global_step": 106749, "epoch": 882} {"train_loss": -37.377437591552734, "global_step": 106750, "epoch": 882} {"train_loss": -37.085845947265625, "global_step": 106751, "epoch": 882} {"train_loss": -35.58552932739258, "global_step": 106752, "epoch": 882} {"train_loss": -36.77756881713867, "global_step": 106753, "epoch": 882} {"train_loss": -37.70112991333008, "global_step": 106754, "epoch": 882} {"train_loss": -37.638694763183594, "global_step": 106755, "epoch": 882} {"train_loss": -36.88214874267578, "global_step": 106756, "epoch": 882} {"train_loss": -37.21664047241211, "global_step": 106757, "epoch": 882} {"train_loss": -36.70388412475586, "global_step": 106758, "epoch": 882} {"train_loss": -37.06549835205078, "global_step": 106759, "epoch": 882} {"train_loss": -35.03242111206055, "global_step": 106760, "epoch": 882} {"train_loss": -36.36101150512695, "global_step": 106761, "epoch": 882} {"train_loss": -34.673587799072266, "global_step": 106762, "epoch": 882} {"train_loss": -30.9759464263916, "global_step": 106763, "epoch": 882} {"train_loss": -37.8651237487793, "global_step": 106764, "epoch": 882} {"train_loss": -36.110958099365234, "global_step": 106765, "epoch": 882} {"train_loss": -31.710996627807617, "global_step": 106766, "epoch": 882} {"train_loss": -38.01404571533203, "global_step": 106767, "epoch": 882} {"train_loss": -36.16617965698242, "global_step": 106768, "epoch": 882} {"train_loss": -34.38182067871094, "global_step": 106769, "epoch": 882} {"train_loss": -37.840126037597656, "global_step": 106770, "epoch": 882} {"train_loss": -36.52848434448242, "global_step": 106771, "epoch": 882} {"train_loss": -34.30582809448242, "global_step": 106772, "epoch": 882} {"train_loss": -37.16440963745117, "global_step": 106773, "epoch": 882} {"train_loss": -34.89080810546875, "global_step": 106774, "epoch": 882} {"train_loss": -35.68572235107422, "global_step": 106775, "epoch": 882} {"train_loss": -36.23230743408203, "global_step": 106776, "epoch": 882} {"train_loss": -35.24916458129883, "global_step": 106777, "epoch": 882} {"train_loss": -36.633949279785156, "global_step": 106778, "epoch": 882} {"train_loss": -36.517093658447266, "global_step": 106779, "epoch": 882} {"train_loss": -36.36799240112305, "global_step": 106780, "epoch": 882} {"train_loss": -36.57787322998047, "global_step": 106781, "epoch": 882} {"train_loss": -35.96156311035156, "global_step": 106782, "epoch": 882} {"train_loss": -35.020050048828125, "global_step": 106783, "epoch": 882} {"train_loss": -36.14793395996094, "global_step": 106784, "epoch": 882} {"train_loss": -36.008628845214844, "global_step": 106785, "epoch": 882} {"train_loss": -36.47111892700195, "global_step": 106786, "epoch": 882} {"train_loss": -36.619075775146484, "global_step": 106787, "epoch": 882} {"train_loss": -37.2575569152832, "global_step": 106788, "epoch": 882} {"train_loss": -37.35402297973633, "global_step": 106789, "epoch": 882} {"train_loss": -36.16143035888672, "global_step": 106790, "epoch": 882} {"train_loss": -37.36652755737305, "global_step": 106791, "epoch": 882} {"train_loss": -37.45516586303711, "global_step": 106792, "epoch": 882} {"train_loss": -36.83543395996094, "global_step": 106793, "epoch": 882} {"train_loss": -37.24599075317383, "global_step": 106794, "epoch": 882} {"train_loss": -36.422672271728516, "global_step": 106795, "epoch": 882} {"train_loss": -37.34273147583008, "global_step": 106796, "epoch": 882} {"train_loss": -37.62002944946289, "global_step": 106797, "epoch": 882} {"train_loss": -36.16367721557617, "global_step": 106798, "epoch": 882} {"train_loss": -37.51262283325195, "global_step": 106799, "epoch": 882} {"train_loss": -37.78173828125, "global_step": 106800, "epoch": 882} {"train_loss": -38.119510650634766, "global_step": 106801, "epoch": 882} {"train_loss": -37.6334342956543, "global_step": 106802, "epoch": 882} {"train_loss": -37.11676025390625, "global_step": 106803, "epoch": 882} {"train_loss": -38.2160530090332, "global_step": 106804, "epoch": 882} {"train_loss": -38.11129379272461, "global_step": 106805, "epoch": 882} {"train_loss": -38.4080696105957, "global_step": 106806, "epoch": 882} {"train_loss": -36.860225677490234, "global_step": 106807, "epoch": 882} {"train_loss": -37.60822677612305, "global_step": 106808, "epoch": 882} {"train_loss": -37.36225509643555, "global_step": 106809, "epoch": 882} {"train_loss": -38.46738815307617, "global_step": 106810, "epoch": 882} {"train_loss": -37.906715393066406, "global_step": 106811, "epoch": 882} {"train_loss": -37.31180953979492, "global_step": 106812, "epoch": 882} {"train_loss": -36.86504364013672, "global_step": 106813, "epoch": 882} {"train_loss": -37.011940002441406, "global_step": 106814, "epoch": 882} {"train_loss": -38.421730041503906, "global_step": 106815, "epoch": 882} {"train_loss": -37.74564743041992, "global_step": 106816, "epoch": 882} {"train_loss": -38.06344223022461, "global_step": 106817, "epoch": 882} {"train_loss": -38.631404876708984, "global_step": 106818, "epoch": 882} {"train_loss": -38.32041549682617, "global_step": 106819, "epoch": 882} {"train_loss": -38.08142852783203, "global_step": 106820, "epoch": 882} {"train_loss": -38.01339340209961, "global_step": 106821, "epoch": 882} {"train_loss": -38.50952911376953, "global_step": 106822, "epoch": 882} {"train_loss": -37.921630859375, "global_step": 106823, "epoch": 882} {"train_loss": -38.94098663330078, "global_step": 106824, "epoch": 882} {"train_loss": -38.716976165771484, "global_step": 106825, "epoch": 882} {"train_loss": -38.65499496459961, "global_step": 106826, "epoch": 882} {"train_loss": -38.14829635620117, "global_step": 106827, "epoch": 882} {"train_loss": -38.51466751098633, "global_step": 106828, "epoch": 882} {"train_loss": -39.09516525268555, "global_step": 106829, "epoch": 882} {"train_loss": -38.519832611083984, "global_step": 106830, "epoch": 882} {"train_loss": -38.788368225097656, "global_step": 106831, "epoch": 882} {"train_loss": -39.11513137817383, "global_step": 106832, "epoch": 882} {"train_loss": -38.8015251159668, "global_step": 106833, "epoch": 882} {"train_loss": -38.70217514038086, "global_step": 106834, "epoch": 882} {"train_loss": -39.125091552734375, "global_step": 106835, "epoch": 882} {"train_loss": -38.32754135131836, "global_step": 106836, "epoch": 882} {"train_loss": -38.69343185424805, "global_step": 106837, "epoch": 882} {"train_loss": -38.93277359008789, "global_step": 106838, "epoch": 882} {"train_loss": -38.80183792114258, "global_step": 106839, "epoch": 882} {"train_loss": -38.18349838256836, "global_step": 106840, "epoch": 882} {"train_loss": -38.41288375854492, "global_step": 106841, "epoch": 882} {"train_loss": -37.05177212549635, "global_step": 106842, "epoch": 882, "val_loss": 2486756.0} {"train_loss": -38.99421310424805, "global_step": 106843, "epoch": 883} {"train_loss": -39.26017379760742, "global_step": 106844, "epoch": 883} {"train_loss": -38.86132049560547, "global_step": 106845, "epoch": 883} {"train_loss": -38.62015914916992, "global_step": 106846, "epoch": 883} {"train_loss": -39.12630081176758, "global_step": 106847, "epoch": 883} {"train_loss": -37.685733795166016, "global_step": 106848, "epoch": 883} {"train_loss": -38.79694747924805, "global_step": 106849, "epoch": 883} {"train_loss": -39.14760208129883, "global_step": 106850, "epoch": 883} {"train_loss": -39.16386032104492, "global_step": 106851, "epoch": 883} {"train_loss": -38.540992736816406, "global_step": 106852, "epoch": 883} {"train_loss": -39.27744674682617, "global_step": 106853, "epoch": 883} {"train_loss": -38.782020568847656, "global_step": 106854, "epoch": 883} {"train_loss": -38.45097732543945, "global_step": 106855, "epoch": 883} {"train_loss": -33.9526252746582, "global_step": 106856, "epoch": 883} {"train_loss": -23.831119537353516, "global_step": 106857, "epoch": 883} {"train_loss": -18.63718605041504, "global_step": 106858, "epoch": 883} {"train_loss": -23.743642807006836, "global_step": 106859, "epoch": 883} {"train_loss": -35.222835540771484, "global_step": 106860, "epoch": 883} {"train_loss": -28.110837936401367, "global_step": 106861, "epoch": 883} {"train_loss": -36.166500091552734, "global_step": 106862, "epoch": 883} {"train_loss": -31.11233901977539, "global_step": 106863, "epoch": 883} {"train_loss": -33.98244094848633, "global_step": 106864, "epoch": 883} {"train_loss": -34.01603317260742, "global_step": 106865, "epoch": 883} {"train_loss": -34.738197326660156, "global_step": 106866, "epoch": 883} {"train_loss": -34.61687469482422, "global_step": 106867, "epoch": 883} {"train_loss": -34.8902473449707, "global_step": 106868, "epoch": 883} {"train_loss": -37.090301513671875, "global_step": 106869, "epoch": 883} {"train_loss": -31.904052734375, "global_step": 106870, "epoch": 883} {"train_loss": -36.22941970825195, "global_step": 106871, "epoch": 883} {"train_loss": -36.11852264404297, "global_step": 106872, "epoch": 883} {"train_loss": -34.82307815551758, "global_step": 106873, "epoch": 883} {"train_loss": -36.880897521972656, "global_step": 106874, "epoch": 883} {"train_loss": -36.466033935546875, "global_step": 106875, "epoch": 883} {"train_loss": -37.08626937866211, "global_step": 106876, "epoch": 883} {"train_loss": -36.36190414428711, "global_step": 106877, "epoch": 883} {"train_loss": -37.0561408996582, "global_step": 106878, "epoch": 883} {"train_loss": -36.702762603759766, "global_step": 106879, "epoch": 883} {"train_loss": -36.99331283569336, "global_step": 106880, "epoch": 883} {"train_loss": -37.12392807006836, "global_step": 106881, "epoch": 883} {"train_loss": -37.36603546142578, "global_step": 106882, "epoch": 883} {"train_loss": -36.8659553527832, "global_step": 106883, "epoch": 883} {"train_loss": -37.56781768798828, "global_step": 106884, "epoch": 883} {"train_loss": -37.73828887939453, "global_step": 106885, "epoch": 883} {"train_loss": -37.2518196105957, "global_step": 106886, "epoch": 883} {"train_loss": -38.1448974609375, "global_step": 106887, "epoch": 883} {"train_loss": -37.7867546081543, "global_step": 106888, "epoch": 883} {"train_loss": -37.71589660644531, "global_step": 106889, "epoch": 883} {"train_loss": -37.714813232421875, "global_step": 106890, "epoch": 883} {"train_loss": -37.992061614990234, "global_step": 106891, "epoch": 883} {"train_loss": -36.83039474487305, "global_step": 106892, "epoch": 883} {"train_loss": -37.46338653564453, "global_step": 106893, "epoch": 883} {"train_loss": -38.4146614074707, "global_step": 106894, "epoch": 883} {"train_loss": -38.00472640991211, "global_step": 106895, "epoch": 883} {"train_loss": -38.31049346923828, "global_step": 106896, "epoch": 883} {"train_loss": -37.418670654296875, "global_step": 106897, "epoch": 883} {"train_loss": -37.68927764892578, "global_step": 106898, "epoch": 883} {"train_loss": -37.621212005615234, "global_step": 106899, "epoch": 883} {"train_loss": -38.36680221557617, "global_step": 106900, "epoch": 883} {"train_loss": -38.22127914428711, "global_step": 106901, "epoch": 883} {"train_loss": -37.65448760986328, "global_step": 106902, "epoch": 883} {"train_loss": -37.788265228271484, "global_step": 106903, "epoch": 883} {"train_loss": -38.56226348876953, "global_step": 106904, "epoch": 883} {"train_loss": -38.542503356933594, "global_step": 106905, "epoch": 883} {"train_loss": -38.131465911865234, "global_step": 106906, "epoch": 883} {"train_loss": -38.36112594604492, "global_step": 106907, "epoch": 883} {"train_loss": -38.7705192565918, "global_step": 106908, "epoch": 883} {"train_loss": -38.392303466796875, "global_step": 106909, "epoch": 883} {"train_loss": -38.56565475463867, "global_step": 106910, "epoch": 883} {"train_loss": -38.790870666503906, "global_step": 106911, "epoch": 883} {"train_loss": -38.330909729003906, "global_step": 106912, "epoch": 883} {"train_loss": -36.6958122253418, "global_step": 106913, "epoch": 883} {"train_loss": -38.52370834350586, "global_step": 106914, "epoch": 883} {"train_loss": -37.5614128112793, "global_step": 106915, "epoch": 883} {"train_loss": -37.4743537902832, "global_step": 106916, "epoch": 883} {"train_loss": -39.17572021484375, "global_step": 106917, "epoch": 883} {"train_loss": -35.95759963989258, "global_step": 106918, "epoch": 883} {"train_loss": -37.80715560913086, "global_step": 106919, "epoch": 883} {"train_loss": -37.71702575683594, "global_step": 106920, "epoch": 883} {"train_loss": -38.290863037109375, "global_step": 106921, "epoch": 883} {"train_loss": -38.39289474487305, "global_step": 106922, "epoch": 883} {"train_loss": -37.17457962036133, "global_step": 106923, "epoch": 883} {"train_loss": -38.46445083618164, "global_step": 106924, "epoch": 883} {"train_loss": -38.38161849975586, "global_step": 106925, "epoch": 883} {"train_loss": -37.61178207397461, "global_step": 106926, "epoch": 883} {"train_loss": -38.43328857421875, "global_step": 106927, "epoch": 883} {"train_loss": -38.44549560546875, "global_step": 106928, "epoch": 883} {"train_loss": -37.70292282104492, "global_step": 106929, "epoch": 883} {"train_loss": -38.635780334472656, "global_step": 106930, "epoch": 883} {"train_loss": -37.099830627441406, "global_step": 106931, "epoch": 883} {"train_loss": -37.27876663208008, "global_step": 106932, "epoch": 883} {"train_loss": -33.463653564453125, "global_step": 106933, "epoch": 883} {"train_loss": -37.38478469848633, "global_step": 106934, "epoch": 883} {"train_loss": -35.93299102783203, "global_step": 106935, "epoch": 883} {"train_loss": -36.695068359375, "global_step": 106936, "epoch": 883} {"train_loss": -36.008888244628906, "global_step": 106937, "epoch": 883} {"train_loss": -37.411678314208984, "global_step": 106938, "epoch": 883} {"train_loss": -37.688018798828125, "global_step": 106939, "epoch": 883} {"train_loss": -34.135921478271484, "global_step": 106940, "epoch": 883} {"train_loss": -33.533782958984375, "global_step": 106941, "epoch": 883} {"train_loss": -31.074552536010742, "global_step": 106942, "epoch": 883} {"train_loss": -29.521503448486328, "global_step": 106943, "epoch": 883} {"train_loss": -37.736000061035156, "global_step": 106944, "epoch": 883} {"train_loss": -35.52039337158203, "global_step": 106945, "epoch": 883} {"train_loss": -33.53170394897461, "global_step": 106946, "epoch": 883} {"train_loss": -35.68843460083008, "global_step": 106947, "epoch": 883} {"train_loss": -34.23818588256836, "global_step": 106948, "epoch": 883} {"train_loss": -36.380550384521484, "global_step": 106949, "epoch": 883} {"train_loss": -35.65201950073242, "global_step": 106950, "epoch": 883} {"train_loss": -35.800594329833984, "global_step": 106951, "epoch": 883} {"train_loss": -35.72046661376953, "global_step": 106952, "epoch": 883} {"train_loss": -35.43746566772461, "global_step": 106953, "epoch": 883} {"train_loss": -35.457759857177734, "global_step": 106954, "epoch": 883} {"train_loss": -34.715087890625, "global_step": 106955, "epoch": 883} {"train_loss": -36.67257308959961, "global_step": 106956, "epoch": 883} {"train_loss": -36.11674118041992, "global_step": 106957, "epoch": 883} {"train_loss": -35.1596565246582, "global_step": 106958, "epoch": 883} {"train_loss": -35.5119743347168, "global_step": 106959, "epoch": 883} {"train_loss": -36.72101593017578, "global_step": 106960, "epoch": 883} {"train_loss": -34.9763069152832, "global_step": 106961, "epoch": 883} {"train_loss": -37.33822250366211, "global_step": 106962, "epoch": 883} {"train_loss": -36.43752181628519, "global_step": 106963, "epoch": 883, "val_loss": 2844791.75} {"train_loss": -35.590782165527344, "global_step": 106964, "epoch": 884} {"train_loss": -36.078304290771484, "global_step": 106965, "epoch": 884} {"train_loss": -37.348243713378906, "global_step": 106966, "epoch": 884} {"train_loss": -35.22993469238281, "global_step": 106967, "epoch": 884} {"train_loss": -37.657997131347656, "global_step": 106968, "epoch": 884} {"train_loss": -37.120643615722656, "global_step": 106969, "epoch": 884} {"train_loss": -36.990081787109375, "global_step": 106970, "epoch": 884} {"train_loss": -35.975067138671875, "global_step": 106971, "epoch": 884} {"train_loss": -35.98570251464844, "global_step": 106972, "epoch": 884} {"train_loss": -37.01227951049805, "global_step": 106973, "epoch": 884} {"train_loss": -36.93172073364258, "global_step": 106974, "epoch": 884} {"train_loss": -36.585243225097656, "global_step": 106975, "epoch": 884} {"train_loss": -35.0765380859375, "global_step": 106976, "epoch": 884} {"train_loss": -37.262664794921875, "global_step": 106977, "epoch": 884} {"train_loss": -35.86351013183594, "global_step": 106978, "epoch": 884} {"train_loss": -34.92197799682617, "global_step": 106979, "epoch": 884} {"train_loss": -37.25810623168945, "global_step": 106980, "epoch": 884} {"train_loss": -36.5516357421875, "global_step": 106981, "epoch": 884} {"train_loss": -35.655086517333984, "global_step": 106982, "epoch": 884} {"train_loss": -36.964378356933594, "global_step": 106983, "epoch": 884} {"train_loss": -36.90353012084961, "global_step": 106984, "epoch": 884} {"train_loss": -36.986114501953125, "global_step": 106985, "epoch": 884} {"train_loss": -37.77018356323242, "global_step": 106986, "epoch": 884} {"train_loss": -37.70960235595703, "global_step": 106987, "epoch": 884} {"train_loss": -37.82196807861328, "global_step": 106988, "epoch": 884} {"train_loss": -36.832969665527344, "global_step": 106989, "epoch": 884} {"train_loss": -37.479915618896484, "global_step": 106990, "epoch": 884} {"train_loss": -37.11155319213867, "global_step": 106991, "epoch": 884} {"train_loss": -36.82322692871094, "global_step": 106992, "epoch": 884} {"train_loss": -37.47502136230469, "global_step": 106993, "epoch": 884} {"train_loss": -37.77415466308594, "global_step": 106994, "epoch": 884} {"train_loss": -37.76129913330078, "global_step": 106995, "epoch": 884} {"train_loss": -37.03935623168945, "global_step": 106996, "epoch": 884} {"train_loss": -36.798152923583984, "global_step": 106997, "epoch": 884} {"train_loss": -36.876827239990234, "global_step": 106998, "epoch": 884} {"train_loss": -38.19208908081055, "global_step": 106999, "epoch": 884} {"train_loss": -37.438507080078125, "global_step": 107000, "epoch": 884} {"train_loss": -37.290706634521484, "global_step": 107001, "epoch": 884} {"train_loss": -38.19618225097656, "global_step": 107002, "epoch": 884} {"train_loss": -37.999366760253906, "global_step": 107003, "epoch": 884} {"train_loss": -38.222957611083984, "global_step": 107004, "epoch": 884} {"train_loss": -38.351417541503906, "global_step": 107005, "epoch": 884} {"train_loss": -38.07135009765625, "global_step": 107006, "epoch": 884} {"train_loss": -38.73761749267578, "global_step": 107007, "epoch": 884} {"train_loss": -38.5858268737793, "global_step": 107008, "epoch": 884} {"train_loss": -38.683956146240234, "global_step": 107009, "epoch": 884} {"train_loss": -38.536067962646484, "global_step": 107010, "epoch": 884} {"train_loss": -38.28773880004883, "global_step": 107011, "epoch": 884} {"train_loss": -38.42010498046875, "global_step": 107012, "epoch": 884} {"train_loss": -38.141357421875, "global_step": 107013, "epoch": 884} {"train_loss": -37.61431884765625, "global_step": 107014, "epoch": 884} {"train_loss": -38.13984298706055, "global_step": 107015, "epoch": 884} {"train_loss": -38.530364990234375, "global_step": 107016, "epoch": 884} {"train_loss": -38.19401168823242, "global_step": 107017, "epoch": 884} {"train_loss": -37.41901779174805, "global_step": 107018, "epoch": 884} {"train_loss": -37.28603744506836, "global_step": 107019, "epoch": 884} {"train_loss": -38.13821029663086, "global_step": 107020, "epoch": 884} {"train_loss": -35.69626998901367, "global_step": 107021, "epoch": 884} {"train_loss": -38.53721618652344, "global_step": 107022, "epoch": 884} {"train_loss": -38.27701950073242, "global_step": 107023, "epoch": 884} {"train_loss": -37.34708786010742, "global_step": 107024, "epoch": 884} {"train_loss": -38.09946823120117, "global_step": 107025, "epoch": 884} {"train_loss": -37.08914566040039, "global_step": 107026, "epoch": 884} {"train_loss": -37.5213737487793, "global_step": 107027, "epoch": 884} {"train_loss": -37.26469802856445, "global_step": 107028, "epoch": 884} {"train_loss": -37.85908126831055, "global_step": 107029, "epoch": 884} {"train_loss": -37.989933013916016, "global_step": 107030, "epoch": 884} {"train_loss": -38.22193908691406, "global_step": 107031, "epoch": 884} {"train_loss": -38.995479583740234, "global_step": 107032, "epoch": 884} {"train_loss": -38.27473068237305, "global_step": 107033, "epoch": 884} {"train_loss": -38.57075119018555, "global_step": 107034, "epoch": 884} {"train_loss": -37.5456657409668, "global_step": 107035, "epoch": 884} {"train_loss": -37.946346282958984, "global_step": 107036, "epoch": 884} {"train_loss": -38.123600006103516, "global_step": 107037, "epoch": 884} {"train_loss": -38.73882293701172, "global_step": 107038, "epoch": 884} {"train_loss": -38.020599365234375, "global_step": 107039, "epoch": 884} {"train_loss": -38.8856201171875, "global_step": 107040, "epoch": 884} {"train_loss": -38.59682083129883, "global_step": 107041, "epoch": 884} {"train_loss": -37.663726806640625, "global_step": 107042, "epoch": 884} {"train_loss": -38.124141693115234, "global_step": 107043, "epoch": 884} {"train_loss": -38.44287109375, "global_step": 107044, "epoch": 884} {"train_loss": -37.17864990234375, "global_step": 107045, "epoch": 884} {"train_loss": -37.48281478881836, "global_step": 107046, "epoch": 884} {"train_loss": -37.74184799194336, "global_step": 107047, "epoch": 884} {"train_loss": -38.0540657043457, "global_step": 107048, "epoch": 884} {"train_loss": -37.09608840942383, "global_step": 107049, "epoch": 884} {"train_loss": -36.94987869262695, "global_step": 107050, "epoch": 884} {"train_loss": -38.40379333496094, "global_step": 107051, "epoch": 884} {"train_loss": -35.594791412353516, "global_step": 107052, "epoch": 884} {"train_loss": -35.45231628417969, "global_step": 107053, "epoch": 884} {"train_loss": -34.202735900878906, "global_step": 107054, "epoch": 884} {"train_loss": -28.630956649780273, "global_step": 107055, "epoch": 884} {"train_loss": -28.342145919799805, "global_step": 107056, "epoch": 884} {"train_loss": -35.49556350708008, "global_step": 107057, "epoch": 884} {"train_loss": -37.412384033203125, "global_step": 107058, "epoch": 884} {"train_loss": -36.0802116394043, "global_step": 107059, "epoch": 884} {"train_loss": -38.384273529052734, "global_step": 107060, "epoch": 884} {"train_loss": -37.42070388793945, "global_step": 107061, "epoch": 884} {"train_loss": -37.745235443115234, "global_step": 107062, "epoch": 884} {"train_loss": -37.62070083618164, "global_step": 107063, "epoch": 884} {"train_loss": -37.56521987915039, "global_step": 107064, "epoch": 884} {"train_loss": -38.35000228881836, "global_step": 107065, "epoch": 884} {"train_loss": -37.77050018310547, "global_step": 107066, "epoch": 884} {"train_loss": -37.22956085205078, "global_step": 107067, "epoch": 884} {"train_loss": -38.305992126464844, "global_step": 107068, "epoch": 884} {"train_loss": -37.48069381713867, "global_step": 107069, "epoch": 884} {"train_loss": -38.40957260131836, "global_step": 107070, "epoch": 884} {"train_loss": -38.400115966796875, "global_step": 107071, "epoch": 884} {"train_loss": -38.59564971923828, "global_step": 107072, "epoch": 884} {"train_loss": -37.632904052734375, "global_step": 107073, "epoch": 884} {"train_loss": -38.23422622680664, "global_step": 107074, "epoch": 884} {"train_loss": -36.69492721557617, "global_step": 107075, "epoch": 884} {"train_loss": -38.389427185058594, "global_step": 107076, "epoch": 884} {"train_loss": -37.33475112915039, "global_step": 107077, "epoch": 884} {"train_loss": -38.597511291503906, "global_step": 107078, "epoch": 884} {"train_loss": -38.54649353027344, "global_step": 107079, "epoch": 884} {"train_loss": -38.54597091674805, "global_step": 107080, "epoch": 884} {"train_loss": -37.214141845703125, "global_step": 107081, "epoch": 884} {"train_loss": -37.4351921081543, "global_step": 107082, "epoch": 884} {"train_loss": -39.07219314575195, "global_step": 107083, "epoch": 884} {"train_loss": -37.371526702376435, "global_step": 107084, "epoch": 884, "val_loss": 2471297.25} {"train_loss": -38.20160675048828, "global_step": 107085, "epoch": 885} {"train_loss": -38.9078483581543, "global_step": 107086, "epoch": 885} {"train_loss": -38.56558609008789, "global_step": 107087, "epoch": 885} {"train_loss": -37.063350677490234, "global_step": 107088, "epoch": 885} {"train_loss": -38.6015625, "global_step": 107089, "epoch": 885} {"train_loss": -39.0240592956543, "global_step": 107090, "epoch": 885} {"train_loss": -38.81666564941406, "global_step": 107091, "epoch": 885} {"train_loss": -36.72892379760742, "global_step": 107092, "epoch": 885} {"train_loss": -38.0624885559082, "global_step": 107093, "epoch": 885} {"train_loss": -38.91045379638672, "global_step": 107094, "epoch": 885} {"train_loss": -38.04750442504883, "global_step": 107095, "epoch": 885} {"train_loss": -38.31474685668945, "global_step": 107096, "epoch": 885} {"train_loss": -37.574851989746094, "global_step": 107097, "epoch": 885} {"train_loss": -37.507259368896484, "global_step": 107098, "epoch": 885} {"train_loss": -35.8979377746582, "global_step": 107099, "epoch": 885} {"train_loss": -36.8011360168457, "global_step": 107100, "epoch": 885} {"train_loss": -39.04399108886719, "global_step": 107101, "epoch": 885} {"train_loss": -38.243804931640625, "global_step": 107102, "epoch": 885} {"train_loss": -38.2126579284668, "global_step": 107103, "epoch": 885} {"train_loss": -38.9471321105957, "global_step": 107104, "epoch": 885} {"train_loss": -39.00232696533203, "global_step": 107105, "epoch": 885} {"train_loss": -38.79137420654297, "global_step": 107106, "epoch": 885} {"train_loss": -38.76484298706055, "global_step": 107107, "epoch": 885} {"train_loss": -38.51877975463867, "global_step": 107108, "epoch": 885} {"train_loss": -37.352378845214844, "global_step": 107109, "epoch": 885} {"train_loss": -36.611412048339844, "global_step": 107110, "epoch": 885} {"train_loss": -38.84139633178711, "global_step": 107111, "epoch": 885} {"train_loss": -38.38209533691406, "global_step": 107112, "epoch": 885} {"train_loss": -38.33806228637695, "global_step": 107113, "epoch": 885} {"train_loss": -37.85760498046875, "global_step": 107114, "epoch": 885} {"train_loss": -37.92179870605469, "global_step": 107115, "epoch": 885} {"train_loss": -36.973140716552734, "global_step": 107116, "epoch": 885} {"train_loss": -37.068763732910156, "global_step": 107117, "epoch": 885} {"train_loss": -38.07327651977539, "global_step": 107118, "epoch": 885} {"train_loss": -37.44363021850586, "global_step": 107119, "epoch": 885} {"train_loss": -36.66068649291992, "global_step": 107120, "epoch": 885} {"train_loss": -39.214542388916016, "global_step": 107121, "epoch": 885} {"train_loss": -38.282901763916016, "global_step": 107122, "epoch": 885} {"train_loss": -38.857086181640625, "global_step": 107123, "epoch": 885} {"train_loss": -38.80036544799805, "global_step": 107124, "epoch": 885} {"train_loss": -37.92676544189453, "global_step": 107125, "epoch": 885} {"train_loss": -39.09867858886719, "global_step": 107126, "epoch": 885} {"train_loss": -38.45588302612305, "global_step": 107127, "epoch": 885} {"train_loss": -38.39876937866211, "global_step": 107128, "epoch": 885} {"train_loss": -37.88444900512695, "global_step": 107129, "epoch": 885} {"train_loss": -38.65108108520508, "global_step": 107130, "epoch": 885} {"train_loss": -39.5778694152832, "global_step": 107131, "epoch": 885} {"train_loss": -37.0057487487793, "global_step": 107132, "epoch": 885} {"train_loss": -38.250064849853516, "global_step": 107133, "epoch": 885} {"train_loss": -38.413665771484375, "global_step": 107134, "epoch": 885} {"train_loss": -36.8272819519043, "global_step": 107135, "epoch": 885} {"train_loss": -36.22821807861328, "global_step": 107136, "epoch": 885} {"train_loss": -36.29423522949219, "global_step": 107137, "epoch": 885} {"train_loss": -37.93123245239258, "global_step": 107138, "epoch": 885} {"train_loss": -34.633277893066406, "global_step": 107139, "epoch": 885} {"train_loss": -38.39319610595703, "global_step": 107140, "epoch": 885} {"train_loss": -37.12651062011719, "global_step": 107141, "epoch": 885} {"train_loss": -38.1756591796875, "global_step": 107142, "epoch": 885} {"train_loss": -36.53681564331055, "global_step": 107143, "epoch": 885} {"train_loss": -33.71510314941406, "global_step": 107144, "epoch": 885} {"train_loss": -35.8979606628418, "global_step": 107145, "epoch": 885} {"train_loss": -36.608943939208984, "global_step": 107146, "epoch": 885} {"train_loss": -37.32271957397461, "global_step": 107147, "epoch": 885} {"train_loss": -37.31924057006836, "global_step": 107148, "epoch": 885} {"train_loss": -37.901573181152344, "global_step": 107149, "epoch": 885} {"train_loss": -38.36357498168945, "global_step": 107150, "epoch": 885} {"train_loss": -37.974609375, "global_step": 107151, "epoch": 885} {"train_loss": -37.68239974975586, "global_step": 107152, "epoch": 885} {"train_loss": -35.879364013671875, "global_step": 107153, "epoch": 885} {"train_loss": -37.718990325927734, "global_step": 107154, "epoch": 885} {"train_loss": -38.2783317565918, "global_step": 107155, "epoch": 885} {"train_loss": -36.83932113647461, "global_step": 107156, "epoch": 885} {"train_loss": -38.28390121459961, "global_step": 107157, "epoch": 885} {"train_loss": -37.59381103515625, "global_step": 107158, "epoch": 885} {"train_loss": -38.12956619262695, "global_step": 107159, "epoch": 885} {"train_loss": -37.32269287109375, "global_step": 107160, "epoch": 885} {"train_loss": -38.06459045410156, "global_step": 107161, "epoch": 885} {"train_loss": -38.36624526977539, "global_step": 107162, "epoch": 885} {"train_loss": -38.46406555175781, "global_step": 107163, "epoch": 885} {"train_loss": -38.233062744140625, "global_step": 107164, "epoch": 885} {"train_loss": -38.192806243896484, "global_step": 107165, "epoch": 885} {"train_loss": -38.25663375854492, "global_step": 107166, "epoch": 885} {"train_loss": -38.38906478881836, "global_step": 107167, "epoch": 885} {"train_loss": -38.74774932861328, "global_step": 107168, "epoch": 885} {"train_loss": -36.41851043701172, "global_step": 107169, "epoch": 885} {"train_loss": -38.32518768310547, "global_step": 107170, "epoch": 885} {"train_loss": -38.269405364990234, "global_step": 107171, "epoch": 885} {"train_loss": -36.16341781616211, "global_step": 107172, "epoch": 885} {"train_loss": -31.960378646850586, "global_step": 107173, "epoch": 885} {"train_loss": -37.29263687133789, "global_step": 107174, "epoch": 885} {"train_loss": -35.40211868286133, "global_step": 107175, "epoch": 885} {"train_loss": -37.504295349121094, "global_step": 107176, "epoch": 885} {"train_loss": -35.950130462646484, "global_step": 107177, "epoch": 885} {"train_loss": -36.93489456176758, "global_step": 107178, "epoch": 885} {"train_loss": -36.8618278503418, "global_step": 107179, "epoch": 885} {"train_loss": -23.816940307617188, "global_step": 107180, "epoch": 885} {"train_loss": -37.181427001953125, "global_step": 107181, "epoch": 885} {"train_loss": -34.639095306396484, "global_step": 107182, "epoch": 885} {"train_loss": -25.820423126220703, "global_step": 107183, "epoch": 885} {"train_loss": -35.72563934326172, "global_step": 107184, "epoch": 885} {"train_loss": -33.49776077270508, "global_step": 107185, "epoch": 885} {"train_loss": -34.007259368896484, "global_step": 107186, "epoch": 885} {"train_loss": -35.333133697509766, "global_step": 107187, "epoch": 885} {"train_loss": -35.83726119995117, "global_step": 107188, "epoch": 885} {"train_loss": -29.933393478393555, "global_step": 107189, "epoch": 885} {"train_loss": -33.581905364990234, "global_step": 107190, "epoch": 885} {"train_loss": -34.952877044677734, "global_step": 107191, "epoch": 885} {"train_loss": -36.732818603515625, "global_step": 107192, "epoch": 885} {"train_loss": -31.595422744750977, "global_step": 107193, "epoch": 885} {"train_loss": -33.11194610595703, "global_step": 107194, "epoch": 885} {"train_loss": -36.510189056396484, "global_step": 107195, "epoch": 885} {"train_loss": -35.53019332885742, "global_step": 107196, "epoch": 885} {"train_loss": -35.8620719909668, "global_step": 107197, "epoch": 885} {"train_loss": -36.0693473815918, "global_step": 107198, "epoch": 885} {"train_loss": -36.09212112426758, "global_step": 107199, "epoch": 885} {"train_loss": -36.35532760620117, "global_step": 107200, "epoch": 885} {"train_loss": -35.67572021484375, "global_step": 107201, "epoch": 885} {"train_loss": -35.330074310302734, "global_step": 107202, "epoch": 885} {"train_loss": -35.92399978637695, "global_step": 107203, "epoch": 885} {"train_loss": -35.670875549316406, "global_step": 107204, "epoch": 885} {"train_loss": -36.948225210520846, "global_step": 107205, "epoch": 885, "val_loss": 2471943.0} {"train_loss": -36.73374557495117, "global_step": 107206, "epoch": 886} {"train_loss": -37.526214599609375, "global_step": 107207, "epoch": 886} {"train_loss": -37.19757843017578, "global_step": 107208, "epoch": 886} {"train_loss": -36.82906723022461, "global_step": 107209, "epoch": 886} {"train_loss": -35.52531051635742, "global_step": 107210, "epoch": 886} {"train_loss": -36.93675994873047, "global_step": 107211, "epoch": 886} {"train_loss": -36.013362884521484, "global_step": 107212, "epoch": 886} {"train_loss": -36.171058654785156, "global_step": 107213, "epoch": 886} {"train_loss": -34.89461898803711, "global_step": 107214, "epoch": 886} {"train_loss": -37.19657897949219, "global_step": 107215, "epoch": 886} {"train_loss": -36.83416748046875, "global_step": 107216, "epoch": 886} {"train_loss": -37.08443832397461, "global_step": 107217, "epoch": 886} {"train_loss": -37.594627380371094, "global_step": 107218, "epoch": 886} {"train_loss": -37.070106506347656, "global_step": 107219, "epoch": 886} {"train_loss": -37.26731491088867, "global_step": 107220, "epoch": 886} {"train_loss": -37.243072509765625, "global_step": 107221, "epoch": 886} {"train_loss": -37.75883102416992, "global_step": 107222, "epoch": 886} {"train_loss": -36.896427154541016, "global_step": 107223, "epoch": 886} {"train_loss": -37.75426483154297, "global_step": 107224, "epoch": 886} {"train_loss": -37.1611328125, "global_step": 107225, "epoch": 886} {"train_loss": -37.58542251586914, "global_step": 107226, "epoch": 886} {"train_loss": -36.98283004760742, "global_step": 107227, "epoch": 886} {"train_loss": -37.80592346191406, "global_step": 107228, "epoch": 886} {"train_loss": -37.439205169677734, "global_step": 107229, "epoch": 886} {"train_loss": -37.72365188598633, "global_step": 107230, "epoch": 886} {"train_loss": -37.58342742919922, "global_step": 107231, "epoch": 886} {"train_loss": -37.962223052978516, "global_step": 107232, "epoch": 886} {"train_loss": -37.97151565551758, "global_step": 107233, "epoch": 886} {"train_loss": -38.04945373535156, "global_step": 107234, "epoch": 886} {"train_loss": -37.19562911987305, "global_step": 107235, "epoch": 886} {"train_loss": -38.009315490722656, "global_step": 107236, "epoch": 886} {"train_loss": -37.716529846191406, "global_step": 107237, "epoch": 886} {"train_loss": -38.14603042602539, "global_step": 107238, "epoch": 886} {"train_loss": -38.07616424560547, "global_step": 107239, "epoch": 886} {"train_loss": -38.124053955078125, "global_step": 107240, "epoch": 886} {"train_loss": -37.94093322753906, "global_step": 107241, "epoch": 886} {"train_loss": -38.33384323120117, "global_step": 107242, "epoch": 886} {"train_loss": -38.69797897338867, "global_step": 107243, "epoch": 886} {"train_loss": -38.043128967285156, "global_step": 107244, "epoch": 886} {"train_loss": -38.68492126464844, "global_step": 107245, "epoch": 886} {"train_loss": -38.368507385253906, "global_step": 107246, "epoch": 886} {"train_loss": -38.11349105834961, "global_step": 107247, "epoch": 886} {"train_loss": -38.51076889038086, "global_step": 107248, "epoch": 886} {"train_loss": -38.52350616455078, "global_step": 107249, "epoch": 886} {"train_loss": -37.9687614440918, "global_step": 107250, "epoch": 886} {"train_loss": -37.9113655090332, "global_step": 107251, "epoch": 886} {"train_loss": -37.81654739379883, "global_step": 107252, "epoch": 886} {"train_loss": -38.3328857421875, "global_step": 107253, "epoch": 886} {"train_loss": -38.34831619262695, "global_step": 107254, "epoch": 886} {"train_loss": -38.52643585205078, "global_step": 107255, "epoch": 886} {"train_loss": -38.66842269897461, "global_step": 107256, "epoch": 886} {"train_loss": -38.66337203979492, "global_step": 107257, "epoch": 886} {"train_loss": -38.52726364135742, "global_step": 107258, "epoch": 886} {"train_loss": -38.1657829284668, "global_step": 107259, "epoch": 886} {"train_loss": -38.21416091918945, "global_step": 107260, "epoch": 886} {"train_loss": -38.04145431518555, "global_step": 107261, "epoch": 886} {"train_loss": -36.431026458740234, "global_step": 107262, "epoch": 886} {"train_loss": -28.604721069335938, "global_step": 107263, "epoch": 886} {"train_loss": -1.8643566370010376, "global_step": 107264, "epoch": 886} {"train_loss": 16.779672622680664, "global_step": 107265, "epoch": 886} {"train_loss": -20.991308212280273, "global_step": 107266, "epoch": 886} {"train_loss": -29.167150497436523, "global_step": 107267, "epoch": 886} {"train_loss": -26.799518585205078, "global_step": 107268, "epoch": 886} {"train_loss": -26.535964965820312, "global_step": 107269, "epoch": 886} {"train_loss": -32.73507308959961, "global_step": 107270, "epoch": 886} {"train_loss": -26.84747314453125, "global_step": 107271, "epoch": 886} {"train_loss": -34.5455322265625, "global_step": 107272, "epoch": 886} {"train_loss": -31.8780517578125, "global_step": 107273, "epoch": 886} {"train_loss": -30.066974639892578, "global_step": 107274, "epoch": 886} {"train_loss": -35.677001953125, "global_step": 107275, "epoch": 886} {"train_loss": -34.131893157958984, "global_step": 107276, "epoch": 886} {"train_loss": -31.848718643188477, "global_step": 107277, "epoch": 886} {"train_loss": -35.9878044128418, "global_step": 107278, "epoch": 886} {"train_loss": -36.30733871459961, "global_step": 107279, "epoch": 886} {"train_loss": -35.14435577392578, "global_step": 107280, "epoch": 886} {"train_loss": -34.96577453613281, "global_step": 107281, "epoch": 886} {"train_loss": -35.52143096923828, "global_step": 107282, "epoch": 886} {"train_loss": -36.54728317260742, "global_step": 107283, "epoch": 886} {"train_loss": -36.59629440307617, "global_step": 107284, "epoch": 886} {"train_loss": -35.85256576538086, "global_step": 107285, "epoch": 886} {"train_loss": -36.45856475830078, "global_step": 107286, "epoch": 886} {"train_loss": -37.300148010253906, "global_step": 107287, "epoch": 886} {"train_loss": -37.17000961303711, "global_step": 107288, "epoch": 886} {"train_loss": -37.044410705566406, "global_step": 107289, "epoch": 886} {"train_loss": -36.67312240600586, "global_step": 107290, "epoch": 886} {"train_loss": -36.75027084350586, "global_step": 107291, "epoch": 886} {"train_loss": -37.35475540161133, "global_step": 107292, "epoch": 886} {"train_loss": -37.54465866088867, "global_step": 107293, "epoch": 886} {"train_loss": -37.240089416503906, "global_step": 107294, "epoch": 886} {"train_loss": -37.02741622924805, "global_step": 107295, "epoch": 886} {"train_loss": -37.29480743408203, "global_step": 107296, "epoch": 886} {"train_loss": -37.16619873046875, "global_step": 107297, "epoch": 886} {"train_loss": -37.42200469970703, "global_step": 107298, "epoch": 886} {"train_loss": -37.78826141357422, "global_step": 107299, "epoch": 886} {"train_loss": -37.722496032714844, "global_step": 107300, "epoch": 886} {"train_loss": -37.907615661621094, "global_step": 107301, "epoch": 886} {"train_loss": -37.24172592163086, "global_step": 107302, "epoch": 886} {"train_loss": -37.69807815551758, "global_step": 107303, "epoch": 886} {"train_loss": -37.922794342041016, "global_step": 107304, "epoch": 886} {"train_loss": -37.427852630615234, "global_step": 107305, "epoch": 886} {"train_loss": -38.03913497924805, "global_step": 107306, "epoch": 886} {"train_loss": -38.323158264160156, "global_step": 107307, "epoch": 886} {"train_loss": -37.67133712768555, "global_step": 107308, "epoch": 886} {"train_loss": -37.30363845825195, "global_step": 107309, "epoch": 886} {"train_loss": -38.327571868896484, "global_step": 107310, "epoch": 886} {"train_loss": -37.80115509033203, "global_step": 107311, "epoch": 886} {"train_loss": -37.64681625366211, "global_step": 107312, "epoch": 886} {"train_loss": -38.08953857421875, "global_step": 107313, "epoch": 886} {"train_loss": -37.80753707885742, "global_step": 107314, "epoch": 886} {"train_loss": -38.18754196166992, "global_step": 107315, "epoch": 886} {"train_loss": -38.34778594970703, "global_step": 107316, "epoch": 886} {"train_loss": -37.910552978515625, "global_step": 107317, "epoch": 886} {"train_loss": -38.15298080444336, "global_step": 107318, "epoch": 886} {"train_loss": -38.082763671875, "global_step": 107319, "epoch": 886} {"train_loss": -38.32065963745117, "global_step": 107320, "epoch": 886} {"train_loss": -38.36598205566406, "global_step": 107321, "epoch": 886} {"train_loss": -38.70541000366211, "global_step": 107322, "epoch": 886} {"train_loss": -38.499202728271484, "global_step": 107323, "epoch": 886} {"train_loss": -38.52401351928711, "global_step": 107324, "epoch": 886} {"train_loss": -38.74013900756836, "global_step": 107325, "epoch": 886} {"train_loss": -35.98697192314243, "global_step": 107326, "epoch": 886, "val_loss": 2570603.75} {"train_loss": -38.66241455078125, "global_step": 107327, "epoch": 887} {"train_loss": -39.0478401184082, "global_step": 107328, "epoch": 887} {"train_loss": -38.64481735229492, "global_step": 107329, "epoch": 887} {"train_loss": -38.8427619934082, "global_step": 107330, "epoch": 887} {"train_loss": -38.71553039550781, "global_step": 107331, "epoch": 887} {"train_loss": -38.15609359741211, "global_step": 107332, "epoch": 887} {"train_loss": -38.27338790893555, "global_step": 107333, "epoch": 887} {"train_loss": -38.27016067504883, "global_step": 107334, "epoch": 887} {"train_loss": -38.9189338684082, "global_step": 107335, "epoch": 887} {"train_loss": -39.08728790283203, "global_step": 107336, "epoch": 887} {"train_loss": -38.87440872192383, "global_step": 107337, "epoch": 887} {"train_loss": -39.295143127441406, "global_step": 107338, "epoch": 887} {"train_loss": -39.12443923950195, "global_step": 107339, "epoch": 887} {"train_loss": -39.436031341552734, "global_step": 107340, "epoch": 887} {"train_loss": -39.07008743286133, "global_step": 107341, "epoch": 887} {"train_loss": -39.448116302490234, "global_step": 107342, "epoch": 887} {"train_loss": -39.5315055847168, "global_step": 107343, "epoch": 887} {"train_loss": -39.311710357666016, "global_step": 107344, "epoch": 887} {"train_loss": -39.41148376464844, "global_step": 107345, "epoch": 887} {"train_loss": -38.76713180541992, "global_step": 107346, "epoch": 887} {"train_loss": -37.37824249267578, "global_step": 107347, "epoch": 887} {"train_loss": -35.639976501464844, "global_step": 107348, "epoch": 887} {"train_loss": -30.82407569885254, "global_step": 107349, "epoch": 887} {"train_loss": -24.097705841064453, "global_step": 107350, "epoch": 887} {"train_loss": -26.422937393188477, "global_step": 107351, "epoch": 887} {"train_loss": -38.97224426269531, "global_step": 107352, "epoch": 887} {"train_loss": -31.3868408203125, "global_step": 107353, "epoch": 887} {"train_loss": -33.30644989013672, "global_step": 107354, "epoch": 887} {"train_loss": -37.36992645263672, "global_step": 107355, "epoch": 887} {"train_loss": -33.64158248901367, "global_step": 107356, "epoch": 887} {"train_loss": -36.45180892944336, "global_step": 107357, "epoch": 887} {"train_loss": -34.653621673583984, "global_step": 107358, "epoch": 887} {"train_loss": -35.84736633300781, "global_step": 107359, "epoch": 887} {"train_loss": -35.74110794067383, "global_step": 107360, "epoch": 887} {"train_loss": -36.781166076660156, "global_step": 107361, "epoch": 887} {"train_loss": -36.29054641723633, "global_step": 107362, "epoch": 887} {"train_loss": -36.69498825073242, "global_step": 107363, "epoch": 887} {"train_loss": -37.04970169067383, "global_step": 107364, "epoch": 887} {"train_loss": -36.56571578979492, "global_step": 107365, "epoch": 887} {"train_loss": -37.417354583740234, "global_step": 107366, "epoch": 887} {"train_loss": -36.107818603515625, "global_step": 107367, "epoch": 887} {"train_loss": -36.25910186767578, "global_step": 107368, "epoch": 887} {"train_loss": -37.79024124145508, "global_step": 107369, "epoch": 887} {"train_loss": -34.776668548583984, "global_step": 107370, "epoch": 887} {"train_loss": -38.3197021484375, "global_step": 107371, "epoch": 887} {"train_loss": -35.45464324951172, "global_step": 107372, "epoch": 887} {"train_loss": -37.6594123840332, "global_step": 107373, "epoch": 887} {"train_loss": -36.7701416015625, "global_step": 107374, "epoch": 887} {"train_loss": -38.101173400878906, "global_step": 107375, "epoch": 887} {"train_loss": -37.7069206237793, "global_step": 107376, "epoch": 887} {"train_loss": -37.66056442260742, "global_step": 107377, "epoch": 887} {"train_loss": -37.605133056640625, "global_step": 107378, "epoch": 887} {"train_loss": -37.21890640258789, "global_step": 107379, "epoch": 887} {"train_loss": -38.24161911010742, "global_step": 107380, "epoch": 887} {"train_loss": -37.09941482543945, "global_step": 107381, "epoch": 887} {"train_loss": -37.760379791259766, "global_step": 107382, "epoch": 887} {"train_loss": -37.5872917175293, "global_step": 107383, "epoch": 887} {"train_loss": -37.734893798828125, "global_step": 107384, "epoch": 887} {"train_loss": -38.39179611206055, "global_step": 107385, "epoch": 887} {"train_loss": -37.89032745361328, "global_step": 107386, "epoch": 887} {"train_loss": -37.61396789550781, "global_step": 107387, "epoch": 887} {"train_loss": -38.211814880371094, "global_step": 107388, "epoch": 887} {"train_loss": -38.04325485229492, "global_step": 107389, "epoch": 887} {"train_loss": -37.954368591308594, "global_step": 107390, "epoch": 887} {"train_loss": -38.6021614074707, "global_step": 107391, "epoch": 887} {"train_loss": -37.86350631713867, "global_step": 107392, "epoch": 887} {"train_loss": -38.3508415222168, "global_step": 107393, "epoch": 887} {"train_loss": -38.22013473510742, "global_step": 107394, "epoch": 887} {"train_loss": -38.323116302490234, "global_step": 107395, "epoch": 887} {"train_loss": -38.3304443359375, "global_step": 107396, "epoch": 887} {"train_loss": -38.14339065551758, "global_step": 107397, "epoch": 887} {"train_loss": -37.12929916381836, "global_step": 107398, "epoch": 887} {"train_loss": -37.41384506225586, "global_step": 107399, "epoch": 887} {"train_loss": -38.375057220458984, "global_step": 107400, "epoch": 887} {"train_loss": -37.13371658325195, "global_step": 107401, "epoch": 887} {"train_loss": -38.07236099243164, "global_step": 107402, "epoch": 887} {"train_loss": -37.439476013183594, "global_step": 107403, "epoch": 887} {"train_loss": -37.3888053894043, "global_step": 107404, "epoch": 887} {"train_loss": -36.873836517333984, "global_step": 107405, "epoch": 887} {"train_loss": -37.55402755737305, "global_step": 107406, "epoch": 887} {"train_loss": -37.891265869140625, "global_step": 107407, "epoch": 887} {"train_loss": -38.26136779785156, "global_step": 107408, "epoch": 887} {"train_loss": -37.335689544677734, "global_step": 107409, "epoch": 887} {"train_loss": -36.59960174560547, "global_step": 107410, "epoch": 887} {"train_loss": -37.591365814208984, "global_step": 107411, "epoch": 887} {"train_loss": -36.70915985107422, "global_step": 107412, "epoch": 887} {"train_loss": -37.2013053894043, "global_step": 107413, "epoch": 887} {"train_loss": -37.24840545654297, "global_step": 107414, "epoch": 887} {"train_loss": -37.7919807434082, "global_step": 107415, "epoch": 887} {"train_loss": -37.5667724609375, "global_step": 107416, "epoch": 887} {"train_loss": -37.84969711303711, "global_step": 107417, "epoch": 887} {"train_loss": -38.14799118041992, "global_step": 107418, "epoch": 887} {"train_loss": -36.61140441894531, "global_step": 107419, "epoch": 887} {"train_loss": -38.54472732543945, "global_step": 107420, "epoch": 887} {"train_loss": -36.507911682128906, "global_step": 107421, "epoch": 887} {"train_loss": -38.17176055908203, "global_step": 107422, "epoch": 887} {"train_loss": -37.700626373291016, "global_step": 107423, "epoch": 887} {"train_loss": -38.48245620727539, "global_step": 107424, "epoch": 887} {"train_loss": -37.1230583190918, "global_step": 107425, "epoch": 887} {"train_loss": -37.91268539428711, "global_step": 107426, "epoch": 887} {"train_loss": -37.6953125, "global_step": 107427, "epoch": 887} {"train_loss": -38.60329818725586, "global_step": 107428, "epoch": 887} {"train_loss": -38.63633346557617, "global_step": 107429, "epoch": 887} {"train_loss": -38.12335968017578, "global_step": 107430, "epoch": 887} {"train_loss": -38.29798126220703, "global_step": 107431, "epoch": 887} {"train_loss": -38.94245529174805, "global_step": 107432, "epoch": 887} {"train_loss": -38.40718460083008, "global_step": 107433, "epoch": 887} {"train_loss": -38.2953987121582, "global_step": 107434, "epoch": 887} {"train_loss": -38.308807373046875, "global_step": 107435, "epoch": 887} {"train_loss": -38.94607162475586, "global_step": 107436, "epoch": 887} {"train_loss": -38.35749435424805, "global_step": 107437, "epoch": 887} {"train_loss": -38.7215576171875, "global_step": 107438, "epoch": 887} {"train_loss": -38.75416564941406, "global_step": 107439, "epoch": 887} {"train_loss": -38.68746566772461, "global_step": 107440, "epoch": 887} {"train_loss": -39.32114791870117, "global_step": 107441, "epoch": 887} {"train_loss": -39.22731399536133, "global_step": 107442, "epoch": 887} {"train_loss": -38.41249465942383, "global_step": 107443, "epoch": 887} {"train_loss": -37.967403411865234, "global_step": 107444, "epoch": 887} {"train_loss": -38.35200119018555, "global_step": 107445, "epoch": 887} {"train_loss": -38.58304977416992, "global_step": 107446, "epoch": 887} {"train_loss": -37.47639213120642, "global_step": 107447, "epoch": 887, "val_loss": 2463188.25} {"train_loss": -38.6700553894043, "global_step": 107448, "epoch": 888} {"train_loss": -38.697235107421875, "global_step": 107449, "epoch": 888} {"train_loss": -38.2684326171875, "global_step": 107450, "epoch": 888} {"train_loss": -37.7943000793457, "global_step": 107451, "epoch": 888} {"train_loss": -38.329769134521484, "global_step": 107452, "epoch": 888} {"train_loss": -38.863739013671875, "global_step": 107453, "epoch": 888} {"train_loss": -38.69655227661133, "global_step": 107454, "epoch": 888} {"train_loss": -37.8413200378418, "global_step": 107455, "epoch": 888} {"train_loss": -37.102291107177734, "global_step": 107456, "epoch": 888} {"train_loss": -38.09845733642578, "global_step": 107457, "epoch": 888} {"train_loss": -37.42139434814453, "global_step": 107458, "epoch": 888} {"train_loss": -37.6252555847168, "global_step": 107459, "epoch": 888} {"train_loss": -39.25411605834961, "global_step": 107460, "epoch": 888} {"train_loss": -38.422508239746094, "global_step": 107461, "epoch": 888} {"train_loss": -37.662841796875, "global_step": 107462, "epoch": 888} {"train_loss": -38.762123107910156, "global_step": 107463, "epoch": 888} {"train_loss": -37.6638298034668, "global_step": 107464, "epoch": 888} {"train_loss": -38.364437103271484, "global_step": 107465, "epoch": 888} {"train_loss": -38.40718078613281, "global_step": 107466, "epoch": 888} {"train_loss": -38.04647445678711, "global_step": 107467, "epoch": 888} {"train_loss": -38.57929229736328, "global_step": 107468, "epoch": 888} {"train_loss": -38.678428649902344, "global_step": 107469, "epoch": 888} {"train_loss": -39.2462272644043, "global_step": 107470, "epoch": 888} {"train_loss": -39.15898513793945, "global_step": 107471, "epoch": 888} {"train_loss": -38.788330078125, "global_step": 107472, "epoch": 888} {"train_loss": -38.61624526977539, "global_step": 107473, "epoch": 888} {"train_loss": -38.6331901550293, "global_step": 107474, "epoch": 888} {"train_loss": -38.583961486816406, "global_step": 107475, "epoch": 888} {"train_loss": -39.19818878173828, "global_step": 107476, "epoch": 888} {"train_loss": -38.41217803955078, "global_step": 107477, "epoch": 888} {"train_loss": -38.71737289428711, "global_step": 107478, "epoch": 888} {"train_loss": -38.1714973449707, "global_step": 107479, "epoch": 888} {"train_loss": -38.71729278564453, "global_step": 107480, "epoch": 888} {"train_loss": -37.48427963256836, "global_step": 107481, "epoch": 888} {"train_loss": -36.45310592651367, "global_step": 107482, "epoch": 888} {"train_loss": -35.089290618896484, "global_step": 107483, "epoch": 888} {"train_loss": -32.180702209472656, "global_step": 107484, "epoch": 888} {"train_loss": -31.25343132019043, "global_step": 107485, "epoch": 888} {"train_loss": -29.34797477722168, "global_step": 107486, "epoch": 888} {"train_loss": -37.46946334838867, "global_step": 107487, "epoch": 888} {"train_loss": -36.504638671875, "global_step": 107488, "epoch": 888} {"train_loss": -29.720062255859375, "global_step": 107489, "epoch": 888} {"train_loss": -35.28639602661133, "global_step": 107490, "epoch": 888} {"train_loss": -36.07722473144531, "global_step": 107491, "epoch": 888} {"train_loss": -34.71956253051758, "global_step": 107492, "epoch": 888} {"train_loss": -35.104652404785156, "global_step": 107493, "epoch": 888} {"train_loss": -33.53801727294922, "global_step": 107494, "epoch": 888} {"train_loss": -34.28249740600586, "global_step": 107495, "epoch": 888} {"train_loss": -32.9573974609375, "global_step": 107496, "epoch": 888} {"train_loss": -28.80655860900879, "global_step": 107497, "epoch": 888} {"train_loss": -36.578548431396484, "global_step": 107498, "epoch": 888} {"train_loss": -33.04122543334961, "global_step": 107499, "epoch": 888} {"train_loss": -30.764551162719727, "global_step": 107500, "epoch": 888} {"train_loss": -30.477258682250977, "global_step": 107501, "epoch": 888} {"train_loss": -32.47158432006836, "global_step": 107502, "epoch": 888} {"train_loss": -32.95180130004883, "global_step": 107503, "epoch": 888} {"train_loss": -33.34884262084961, "global_step": 107504, "epoch": 888} {"train_loss": -33.84944534301758, "global_step": 107505, "epoch": 888} {"train_loss": -34.2930908203125, "global_step": 107506, "epoch": 888} {"train_loss": -34.01955795288086, "global_step": 107507, "epoch": 888} {"train_loss": -32.66111755371094, "global_step": 107508, "epoch": 888} {"train_loss": -32.156288146972656, "global_step": 107509, "epoch": 888} {"train_loss": -34.288429260253906, "global_step": 107510, "epoch": 888} {"train_loss": -33.685791015625, "global_step": 107511, "epoch": 888} {"train_loss": -33.1993293762207, "global_step": 107512, "epoch": 888} {"train_loss": -33.386390686035156, "global_step": 107513, "epoch": 888} {"train_loss": -34.117958068847656, "global_step": 107514, "epoch": 888} {"train_loss": -31.210168838500977, "global_step": 107515, "epoch": 888} {"train_loss": -33.70984649658203, "global_step": 107516, "epoch": 888} {"train_loss": -34.55036926269531, "global_step": 107517, "epoch": 888} {"train_loss": -35.35487747192383, "global_step": 107518, "epoch": 888} {"train_loss": -35.299991607666016, "global_step": 107519, "epoch": 888} {"train_loss": -33.28702926635742, "global_step": 107520, "epoch": 888} {"train_loss": -33.87730407714844, "global_step": 107521, "epoch": 888} {"train_loss": -32.63157272338867, "global_step": 107522, "epoch": 888} {"train_loss": -35.353031158447266, "global_step": 107523, "epoch": 888} {"train_loss": -35.81652069091797, "global_step": 107524, "epoch": 888} {"train_loss": -33.36658477783203, "global_step": 107525, "epoch": 888} {"train_loss": -35.125423431396484, "global_step": 107526, "epoch": 888} {"train_loss": -31.17154884338379, "global_step": 107527, "epoch": 888} {"train_loss": -34.08942794799805, "global_step": 107528, "epoch": 888} {"train_loss": -35.03983688354492, "global_step": 107529, "epoch": 888} {"train_loss": -35.82424545288086, "global_step": 107530, "epoch": 888} {"train_loss": -35.735633850097656, "global_step": 107531, "epoch": 888} {"train_loss": -35.72152328491211, "global_step": 107532, "epoch": 888} {"train_loss": -33.84780502319336, "global_step": 107533, "epoch": 888} {"train_loss": -34.3113899230957, "global_step": 107534, "epoch": 888} {"train_loss": -35.80012130737305, "global_step": 107535, "epoch": 888} {"train_loss": -35.54587173461914, "global_step": 107536, "epoch": 888} {"train_loss": -35.797725677490234, "global_step": 107537, "epoch": 888} {"train_loss": -34.966453552246094, "global_step": 107538, "epoch": 888} {"train_loss": -35.70505905151367, "global_step": 107539, "epoch": 888} {"train_loss": -35.32962417602539, "global_step": 107540, "epoch": 888} {"train_loss": -35.61758041381836, "global_step": 107541, "epoch": 888} {"train_loss": -35.84721755981445, "global_step": 107542, "epoch": 888} {"train_loss": -36.0570182800293, "global_step": 107543, "epoch": 888} {"train_loss": -35.6898193359375, "global_step": 107544, "epoch": 888} {"train_loss": -36.3656005859375, "global_step": 107545, "epoch": 888} {"train_loss": -36.13955307006836, "global_step": 107546, "epoch": 888} {"train_loss": -36.7012825012207, "global_step": 107547, "epoch": 888} {"train_loss": -35.88056564331055, "global_step": 107548, "epoch": 888} {"train_loss": -35.90080642700195, "global_step": 107549, "epoch": 888} {"train_loss": -36.3271484375, "global_step": 107550, "epoch": 888} {"train_loss": -35.93305206298828, "global_step": 107551, "epoch": 888} {"train_loss": -36.48435592651367, "global_step": 107552, "epoch": 888} {"train_loss": -36.86695861816406, "global_step": 107553, "epoch": 888} {"train_loss": -36.37441635131836, "global_step": 107554, "epoch": 888} {"train_loss": -36.2590446472168, "global_step": 107555, "epoch": 888} {"train_loss": -36.648284912109375, "global_step": 107556, "epoch": 888} {"train_loss": -36.698768615722656, "global_step": 107557, "epoch": 888} {"train_loss": -36.47822952270508, "global_step": 107558, "epoch": 888} {"train_loss": -36.65249252319336, "global_step": 107559, "epoch": 888} {"train_loss": -36.60987091064453, "global_step": 107560, "epoch": 888} {"train_loss": -36.7745246887207, "global_step": 107561, "epoch": 888} {"train_loss": -36.902503967285156, "global_step": 107562, "epoch": 888} {"train_loss": -37.69845962524414, "global_step": 107563, "epoch": 888} {"train_loss": -37.32497787475586, "global_step": 107564, "epoch": 888} {"train_loss": -36.6563835144043, "global_step": 107565, "epoch": 888} {"train_loss": -37.487449645996094, "global_step": 107566, "epoch": 888} {"train_loss": -38.0693473815918, "global_step": 107567, "epoch": 888} {"train_loss": -35.792513807943045, "global_step": 107568, "epoch": 888, "val_loss": 2500840.25} {"train_loss": -37.18600082397461, "global_step": 107569, "epoch": 889} {"train_loss": -37.267574310302734, "global_step": 107570, "epoch": 889} {"train_loss": -37.55712890625, "global_step": 107571, "epoch": 889} {"train_loss": -37.515594482421875, "global_step": 107572, "epoch": 889} {"train_loss": -37.574764251708984, "global_step": 107573, "epoch": 889} {"train_loss": -37.5474739074707, "global_step": 107574, "epoch": 889} {"train_loss": -37.781349182128906, "global_step": 107575, "epoch": 889} {"train_loss": -38.11225128173828, "global_step": 107576, "epoch": 889} {"train_loss": -37.66746139526367, "global_step": 107577, "epoch": 889} {"train_loss": -37.88850021362305, "global_step": 107578, "epoch": 889} {"train_loss": -37.99579620361328, "global_step": 107579, "epoch": 889} {"train_loss": -38.01791000366211, "global_step": 107580, "epoch": 889} {"train_loss": -37.898468017578125, "global_step": 107581, "epoch": 889} {"train_loss": -38.461177825927734, "global_step": 107582, "epoch": 889} {"train_loss": -37.29114532470703, "global_step": 107583, "epoch": 889} {"train_loss": -37.937591552734375, "global_step": 107584, "epoch": 889} {"train_loss": -38.29629135131836, "global_step": 107585, "epoch": 889} {"train_loss": -38.52500534057617, "global_step": 107586, "epoch": 889} {"train_loss": -38.48427963256836, "global_step": 107587, "epoch": 889} {"train_loss": -38.48785400390625, "global_step": 107588, "epoch": 889} {"train_loss": -38.18783187866211, "global_step": 107589, "epoch": 889} {"train_loss": -38.17300033569336, "global_step": 107590, "epoch": 889} {"train_loss": -37.965938568115234, "global_step": 107591, "epoch": 889} {"train_loss": -38.20554733276367, "global_step": 107592, "epoch": 889} {"train_loss": -38.2655143737793, "global_step": 107593, "epoch": 889} {"train_loss": -37.964935302734375, "global_step": 107594, "epoch": 889} {"train_loss": -38.3128662109375, "global_step": 107595, "epoch": 889} {"train_loss": -37.76583480834961, "global_step": 107596, "epoch": 889} {"train_loss": -38.57661819458008, "global_step": 107597, "epoch": 889} {"train_loss": -38.12548065185547, "global_step": 107598, "epoch": 889} {"train_loss": -38.809112548828125, "global_step": 107599, "epoch": 889} {"train_loss": -38.671504974365234, "global_step": 107600, "epoch": 889} {"train_loss": -38.87531280517578, "global_step": 107601, "epoch": 889} {"train_loss": -38.41757583618164, "global_step": 107602, "epoch": 889} {"train_loss": -38.830684661865234, "global_step": 107603, "epoch": 889} {"train_loss": -38.683467864990234, "global_step": 107604, "epoch": 889} {"train_loss": -38.34288024902344, "global_step": 107605, "epoch": 889} {"train_loss": -39.179256439208984, "global_step": 107606, "epoch": 889} {"train_loss": -38.62582015991211, "global_step": 107607, "epoch": 889} {"train_loss": -39.00020980834961, "global_step": 107608, "epoch": 889} {"train_loss": -38.20194625854492, "global_step": 107609, "epoch": 889} {"train_loss": -38.90850830078125, "global_step": 107610, "epoch": 889} {"train_loss": -38.64961624145508, "global_step": 107611, "epoch": 889} {"train_loss": -38.868099212646484, "global_step": 107612, "epoch": 889} {"train_loss": -39.09600830078125, "global_step": 107613, "epoch": 889} {"train_loss": -38.446533203125, "global_step": 107614, "epoch": 889} {"train_loss": -38.57740020751953, "global_step": 107615, "epoch": 889} {"train_loss": -39.026981353759766, "global_step": 107616, "epoch": 889} {"train_loss": -38.67039489746094, "global_step": 107617, "epoch": 889} {"train_loss": -38.73737716674805, "global_step": 107618, "epoch": 889} {"train_loss": -38.79118347167969, "global_step": 107619, "epoch": 889} {"train_loss": -39.04080581665039, "global_step": 107620, "epoch": 889} {"train_loss": -39.122711181640625, "global_step": 107621, "epoch": 889} {"train_loss": -38.86423873901367, "global_step": 107622, "epoch": 889} {"train_loss": -39.002685546875, "global_step": 107623, "epoch": 889} {"train_loss": -38.61526107788086, "global_step": 107624, "epoch": 889} {"train_loss": -38.15098190307617, "global_step": 107625, "epoch": 889} {"train_loss": -35.00188064575195, "global_step": 107626, "epoch": 889} {"train_loss": -34.64593505859375, "global_step": 107627, "epoch": 889} {"train_loss": -37.33548355102539, "global_step": 107628, "epoch": 889} {"train_loss": -32.95042037963867, "global_step": 107629, "epoch": 889} {"train_loss": -36.214962005615234, "global_step": 107630, "epoch": 889} {"train_loss": -33.660484313964844, "global_step": 107631, "epoch": 889} {"train_loss": -36.73286819458008, "global_step": 107632, "epoch": 889} {"train_loss": -36.91957473754883, "global_step": 107633, "epoch": 889} {"train_loss": -33.15921401977539, "global_step": 107634, "epoch": 889} {"train_loss": -38.30942916870117, "global_step": 107635, "epoch": 889} {"train_loss": -34.9978141784668, "global_step": 107636, "epoch": 889} {"train_loss": -35.8149299621582, "global_step": 107637, "epoch": 889} {"train_loss": -37.01191329956055, "global_step": 107638, "epoch": 889} {"train_loss": -35.88846969604492, "global_step": 107639, "epoch": 889} {"train_loss": -37.893768310546875, "global_step": 107640, "epoch": 889} {"train_loss": -37.462398529052734, "global_step": 107641, "epoch": 889} {"train_loss": -38.12645721435547, "global_step": 107642, "epoch": 889} {"train_loss": -38.584312438964844, "global_step": 107643, "epoch": 889} {"train_loss": -37.66950607299805, "global_step": 107644, "epoch": 889} {"train_loss": -38.042388916015625, "global_step": 107645, "epoch": 889} {"train_loss": -38.17691421508789, "global_step": 107646, "epoch": 889} {"train_loss": -37.51764678955078, "global_step": 107647, "epoch": 889} {"train_loss": -37.92947769165039, "global_step": 107648, "epoch": 889} {"train_loss": -37.48421859741211, "global_step": 107649, "epoch": 889} {"train_loss": -39.013824462890625, "global_step": 107650, "epoch": 889} {"train_loss": -38.75468063354492, "global_step": 107651, "epoch": 889} {"train_loss": -38.3151969909668, "global_step": 107652, "epoch": 889} {"train_loss": -38.626190185546875, "global_step": 107653, "epoch": 889} {"train_loss": -38.59237289428711, "global_step": 107654, "epoch": 889} {"train_loss": -38.40230941772461, "global_step": 107655, "epoch": 889} {"train_loss": -38.37925720214844, "global_step": 107656, "epoch": 889} {"train_loss": -37.76261901855469, "global_step": 107657, "epoch": 889} {"train_loss": -38.10853576660156, "global_step": 107658, "epoch": 889} {"train_loss": -38.73684310913086, "global_step": 107659, "epoch": 889} {"train_loss": -38.954769134521484, "global_step": 107660, "epoch": 889} {"train_loss": -38.7108154296875, "global_step": 107661, "epoch": 889} {"train_loss": -39.24285125732422, "global_step": 107662, "epoch": 889} {"train_loss": -39.00252151489258, "global_step": 107663, "epoch": 889} {"train_loss": -39.30873489379883, "global_step": 107664, "epoch": 889} {"train_loss": -39.135616302490234, "global_step": 107665, "epoch": 889} {"train_loss": -39.12113571166992, "global_step": 107666, "epoch": 889} {"train_loss": -39.3751106262207, "global_step": 107667, "epoch": 889} {"train_loss": -38.47711944580078, "global_step": 107668, "epoch": 889} {"train_loss": -39.11826705932617, "global_step": 107669, "epoch": 889} {"train_loss": -39.3380241394043, "global_step": 107670, "epoch": 889} {"train_loss": -38.408504486083984, "global_step": 107671, "epoch": 889} {"train_loss": -38.412593841552734, "global_step": 107672, "epoch": 889} {"train_loss": -39.372650146484375, "global_step": 107673, "epoch": 889} {"train_loss": -38.4508056640625, "global_step": 107674, "epoch": 889} {"train_loss": -38.97095489501953, "global_step": 107675, "epoch": 889} {"train_loss": -38.86265182495117, "global_step": 107676, "epoch": 889} {"train_loss": -38.59254837036133, "global_step": 107677, "epoch": 889} {"train_loss": -37.420833587646484, "global_step": 107678, "epoch": 889} {"train_loss": -37.02436447143555, "global_step": 107679, "epoch": 889} {"train_loss": -34.46487808227539, "global_step": 107680, "epoch": 889} {"train_loss": -26.497785568237305, "global_step": 107681, "epoch": 889} {"train_loss": -19.5020809173584, "global_step": 107682, "epoch": 889} {"train_loss": -22.32455825805664, "global_step": 107683, "epoch": 889} {"train_loss": -37.298789978027344, "global_step": 107684, "epoch": 889} {"train_loss": -28.890228271484375, "global_step": 107685, "epoch": 889} {"train_loss": -23.865026473999023, "global_step": 107686, "epoch": 889} {"train_loss": -35.33939743041992, "global_step": 107687, "epoch": 889} {"train_loss": -30.317419052124023, "global_step": 107688, "epoch": 889} {"train_loss": -37.31198079132837, "global_step": 107689, "epoch": 889, "val_loss": 2480893.0} {"train_loss": -31.386072158813477, "global_step": 107690, "epoch": 890} {"train_loss": -35.430694580078125, "global_step": 107691, "epoch": 890} {"train_loss": -33.82395935058594, "global_step": 107692, "epoch": 890} {"train_loss": -34.9178466796875, "global_step": 107693, "epoch": 890} {"train_loss": -35.4592170715332, "global_step": 107694, "epoch": 890} {"train_loss": -34.2933464050293, "global_step": 107695, "epoch": 890} {"train_loss": -37.52849197387695, "global_step": 107696, "epoch": 890} {"train_loss": -35.5271110534668, "global_step": 107697, "epoch": 890} {"train_loss": -36.80890655517578, "global_step": 107698, "epoch": 890} {"train_loss": -36.69658279418945, "global_step": 107699, "epoch": 890} {"train_loss": -36.155094146728516, "global_step": 107700, "epoch": 890} {"train_loss": -37.5964469909668, "global_step": 107701, "epoch": 890} {"train_loss": -37.480140686035156, "global_step": 107702, "epoch": 890} {"train_loss": -36.996978759765625, "global_step": 107703, "epoch": 890} {"train_loss": -37.63951873779297, "global_step": 107704, "epoch": 890} {"train_loss": -37.393798828125, "global_step": 107705, "epoch": 890} {"train_loss": -37.29049301147461, "global_step": 107706, "epoch": 890} {"train_loss": -37.695068359375, "global_step": 107707, "epoch": 890} {"train_loss": -37.957271575927734, "global_step": 107708, "epoch": 890} {"train_loss": -37.45784378051758, "global_step": 107709, "epoch": 890} {"train_loss": -37.116424560546875, "global_step": 107710, "epoch": 890} {"train_loss": -38.14065170288086, "global_step": 107711, "epoch": 890} {"train_loss": -38.19794845581055, "global_step": 107712, "epoch": 890} {"train_loss": -37.17076873779297, "global_step": 107713, "epoch": 890} {"train_loss": -37.82999038696289, "global_step": 107714, "epoch": 890} {"train_loss": -38.3623161315918, "global_step": 107715, "epoch": 890} {"train_loss": -37.90867233276367, "global_step": 107716, "epoch": 890} {"train_loss": -38.01911163330078, "global_step": 107717, "epoch": 890} {"train_loss": -38.5111198425293, "global_step": 107718, "epoch": 890} {"train_loss": -38.6672248840332, "global_step": 107719, "epoch": 890} {"train_loss": -38.12516403198242, "global_step": 107720, "epoch": 890} {"train_loss": -38.526039123535156, "global_step": 107721, "epoch": 890} {"train_loss": -38.169769287109375, "global_step": 107722, "epoch": 890} {"train_loss": -38.25197219848633, "global_step": 107723, "epoch": 890} {"train_loss": -38.31572723388672, "global_step": 107724, "epoch": 890} {"train_loss": -38.40864562988281, "global_step": 107725, "epoch": 890} {"train_loss": -37.74142837524414, "global_step": 107726, "epoch": 890} {"train_loss": -38.2110481262207, "global_step": 107727, "epoch": 890} {"train_loss": -38.58771514892578, "global_step": 107728, "epoch": 890} {"train_loss": -38.3964958190918, "global_step": 107729, "epoch": 890} {"train_loss": -38.769744873046875, "global_step": 107730, "epoch": 890} {"train_loss": -39.11031723022461, "global_step": 107731, "epoch": 890} {"train_loss": -38.699432373046875, "global_step": 107732, "epoch": 890} {"train_loss": -39.023826599121094, "global_step": 107733, "epoch": 890} {"train_loss": -38.45304489135742, "global_step": 107734, "epoch": 890} {"train_loss": -38.98151779174805, "global_step": 107735, "epoch": 890} {"train_loss": -38.61445236206055, "global_step": 107736, "epoch": 890} {"train_loss": -39.20546340942383, "global_step": 107737, "epoch": 890} {"train_loss": -38.47751998901367, "global_step": 107738, "epoch": 890} {"train_loss": -39.040279388427734, "global_step": 107739, "epoch": 890} {"train_loss": -38.37308883666992, "global_step": 107740, "epoch": 890} {"train_loss": -38.41404342651367, "global_step": 107741, "epoch": 890} {"train_loss": -38.142974853515625, "global_step": 107742, "epoch": 890} {"train_loss": -38.70804977416992, "global_step": 107743, "epoch": 890} {"train_loss": -38.5384407043457, "global_step": 107744, "epoch": 890} {"train_loss": -38.038143157958984, "global_step": 107745, "epoch": 890} {"train_loss": -38.387367248535156, "global_step": 107746, "epoch": 890} {"train_loss": -38.777687072753906, "global_step": 107747, "epoch": 890} {"train_loss": -38.72121810913086, "global_step": 107748, "epoch": 890} {"train_loss": -37.79262924194336, "global_step": 107749, "epoch": 890} {"train_loss": -38.94944381713867, "global_step": 107750, "epoch": 890} {"train_loss": -39.175148010253906, "global_step": 107751, "epoch": 890} {"train_loss": -39.26966094970703, "global_step": 107752, "epoch": 890} {"train_loss": -39.0566291809082, "global_step": 107753, "epoch": 890} {"train_loss": -39.500160217285156, "global_step": 107754, "epoch": 890} {"train_loss": -38.6249885559082, "global_step": 107755, "epoch": 890} {"train_loss": -39.16897201538086, "global_step": 107756, "epoch": 890} {"train_loss": -39.079994201660156, "global_step": 107757, "epoch": 890} {"train_loss": -39.258880615234375, "global_step": 107758, "epoch": 890} {"train_loss": -39.228824615478516, "global_step": 107759, "epoch": 890} {"train_loss": -39.22077178955078, "global_step": 107760, "epoch": 890} {"train_loss": -38.787227630615234, "global_step": 107761, "epoch": 890} {"train_loss": -39.25704574584961, "global_step": 107762, "epoch": 890} {"train_loss": -38.81841278076172, "global_step": 107763, "epoch": 890} {"train_loss": -39.331172943115234, "global_step": 107764, "epoch": 890} {"train_loss": -39.311500549316406, "global_step": 107765, "epoch": 890} {"train_loss": -39.08488845825195, "global_step": 107766, "epoch": 890} {"train_loss": -38.7726936340332, "global_step": 107767, "epoch": 890} {"train_loss": -38.88505172729492, "global_step": 107768, "epoch": 890} {"train_loss": -38.04801940917969, "global_step": 107769, "epoch": 890} {"train_loss": -38.721160888671875, "global_step": 107770, "epoch": 890} {"train_loss": -38.87648391723633, "global_step": 107771, "epoch": 890} {"train_loss": -38.8464241027832, "global_step": 107772, "epoch": 890} {"train_loss": -38.851009368896484, "global_step": 107773, "epoch": 890} {"train_loss": -39.31964111328125, "global_step": 107774, "epoch": 890} {"train_loss": -38.24432373046875, "global_step": 107775, "epoch": 890} {"train_loss": -38.05803298950195, "global_step": 107776, "epoch": 890} {"train_loss": -39.03247833251953, "global_step": 107777, "epoch": 890} {"train_loss": -39.42267608642578, "global_step": 107778, "epoch": 890} {"train_loss": -39.11274337768555, "global_step": 107779, "epoch": 890} {"train_loss": -38.222591400146484, "global_step": 107780, "epoch": 890} {"train_loss": -37.60563278198242, "global_step": 107781, "epoch": 890} {"train_loss": -37.56591796875, "global_step": 107782, "epoch": 890} {"train_loss": -38.369659423828125, "global_step": 107783, "epoch": 890} {"train_loss": -37.87636184692383, "global_step": 107784, "epoch": 890} {"train_loss": -33.20545196533203, "global_step": 107785, "epoch": 890} {"train_loss": -37.98294448852539, "global_step": 107786, "epoch": 890} {"train_loss": -36.20266342163086, "global_step": 107787, "epoch": 890} {"train_loss": -34.9793586730957, "global_step": 107788, "epoch": 890} {"train_loss": -36.153770446777344, "global_step": 107789, "epoch": 890} {"train_loss": -36.9912109375, "global_step": 107790, "epoch": 890} {"train_loss": -36.883846282958984, "global_step": 107791, "epoch": 890} {"train_loss": -34.9138298034668, "global_step": 107792, "epoch": 890} {"train_loss": -35.948585510253906, "global_step": 107793, "epoch": 890} {"train_loss": -37.6494140625, "global_step": 107794, "epoch": 890} {"train_loss": -38.45109939575195, "global_step": 107795, "epoch": 890} {"train_loss": -34.83401107788086, "global_step": 107796, "epoch": 890} {"train_loss": -36.955440521240234, "global_step": 107797, "epoch": 890} {"train_loss": -36.94820785522461, "global_step": 107798, "epoch": 890} {"train_loss": -34.38894271850586, "global_step": 107799, "epoch": 890} {"train_loss": -36.78121566772461, "global_step": 107800, "epoch": 890} {"train_loss": -36.929039001464844, "global_step": 107801, "epoch": 890} {"train_loss": -36.684078216552734, "global_step": 107802, "epoch": 890} {"train_loss": -38.18182373046875, "global_step": 107803, "epoch": 890} {"train_loss": -36.68626022338867, "global_step": 107804, "epoch": 890} {"train_loss": -35.9766960144043, "global_step": 107805, "epoch": 890} {"train_loss": -38.0352668762207, "global_step": 107806, "epoch": 890} {"train_loss": -35.43148422241211, "global_step": 107807, "epoch": 890} {"train_loss": -37.83295822143555, "global_step": 107808, "epoch": 890} {"train_loss": -37.650936126708984, "global_step": 107809, "epoch": 890} {"train_loss": -37.759539154935474, "global_step": 107810, "epoch": 890, "val_loss": 2565162.75} {"train_loss": -37.05415725708008, "global_step": 107811, "epoch": 891} {"train_loss": -37.787017822265625, "global_step": 107812, "epoch": 891} {"train_loss": -38.212188720703125, "global_step": 107813, "epoch": 891} {"train_loss": -38.176448822021484, "global_step": 107814, "epoch": 891} {"train_loss": -37.83028030395508, "global_step": 107815, "epoch": 891} {"train_loss": -37.993896484375, "global_step": 107816, "epoch": 891} {"train_loss": -37.238948822021484, "global_step": 107817, "epoch": 891} {"train_loss": -36.366214752197266, "global_step": 107818, "epoch": 891} {"train_loss": -37.95086669921875, "global_step": 107819, "epoch": 891} {"train_loss": -37.86565017700195, "global_step": 107820, "epoch": 891} {"train_loss": -38.0456428527832, "global_step": 107821, "epoch": 891} {"train_loss": -37.857398986816406, "global_step": 107822, "epoch": 891} {"train_loss": -36.96152114868164, "global_step": 107823, "epoch": 891} {"train_loss": -37.860984802246094, "global_step": 107824, "epoch": 891} {"train_loss": -38.495628356933594, "global_step": 107825, "epoch": 891} {"train_loss": -38.46174240112305, "global_step": 107826, "epoch": 891} {"train_loss": -38.93757247924805, "global_step": 107827, "epoch": 891} {"train_loss": -38.25944900512695, "global_step": 107828, "epoch": 891} {"train_loss": -37.92295837402344, "global_step": 107829, "epoch": 891} {"train_loss": -38.07312774658203, "global_step": 107830, "epoch": 891} {"train_loss": -38.79329299926758, "global_step": 107831, "epoch": 891} {"train_loss": -38.77083206176758, "global_step": 107832, "epoch": 891} {"train_loss": -38.96879959106445, "global_step": 107833, "epoch": 891} {"train_loss": -38.206512451171875, "global_step": 107834, "epoch": 891} {"train_loss": -38.8187141418457, "global_step": 107835, "epoch": 891} {"train_loss": -38.70989990234375, "global_step": 107836, "epoch": 891} {"train_loss": -38.004554748535156, "global_step": 107837, "epoch": 891} {"train_loss": -38.6982307434082, "global_step": 107838, "epoch": 891} {"train_loss": -39.1646842956543, "global_step": 107839, "epoch": 891} {"train_loss": -38.24775314331055, "global_step": 107840, "epoch": 891} {"train_loss": -37.92924118041992, "global_step": 107841, "epoch": 891} {"train_loss": -38.81868362426758, "global_step": 107842, "epoch": 891} {"train_loss": -39.71919631958008, "global_step": 107843, "epoch": 891} {"train_loss": -38.72547149658203, "global_step": 107844, "epoch": 891} {"train_loss": -39.20821762084961, "global_step": 107845, "epoch": 891} {"train_loss": -38.858062744140625, "global_step": 107846, "epoch": 891} {"train_loss": -38.55229568481445, "global_step": 107847, "epoch": 891} {"train_loss": -37.78985595703125, "global_step": 107848, "epoch": 891} {"train_loss": -38.330169677734375, "global_step": 107849, "epoch": 891} {"train_loss": -38.65850830078125, "global_step": 107850, "epoch": 891} {"train_loss": -38.91294860839844, "global_step": 107851, "epoch": 891} {"train_loss": -39.347984313964844, "global_step": 107852, "epoch": 891} {"train_loss": -39.39580535888672, "global_step": 107853, "epoch": 891} {"train_loss": -38.88697052001953, "global_step": 107854, "epoch": 891} {"train_loss": -39.44409942626953, "global_step": 107855, "epoch": 891} {"train_loss": -39.10126876831055, "global_step": 107856, "epoch": 891} {"train_loss": -39.10773468017578, "global_step": 107857, "epoch": 891} {"train_loss": -38.928916931152344, "global_step": 107858, "epoch": 891} {"train_loss": -39.3552131652832, "global_step": 107859, "epoch": 891} {"train_loss": -39.0714111328125, "global_step": 107860, "epoch": 891} {"train_loss": -39.29010009765625, "global_step": 107861, "epoch": 891} {"train_loss": -39.07455062866211, "global_step": 107862, "epoch": 891} {"train_loss": -39.08846664428711, "global_step": 107863, "epoch": 891} {"train_loss": -39.58662414550781, "global_step": 107864, "epoch": 891} {"train_loss": -39.799072265625, "global_step": 107865, "epoch": 891} {"train_loss": -39.004940032958984, "global_step": 107866, "epoch": 891} {"train_loss": -38.406898498535156, "global_step": 107867, "epoch": 891} {"train_loss": -34.82542037963867, "global_step": 107868, "epoch": 891} {"train_loss": -32.43438720703125, "global_step": 107869, "epoch": 891} {"train_loss": -38.418087005615234, "global_step": 107870, "epoch": 891} {"train_loss": -38.086402893066406, "global_step": 107871, "epoch": 891} {"train_loss": -33.29773712158203, "global_step": 107872, "epoch": 891} {"train_loss": -35.26003646850586, "global_step": 107873, "epoch": 891} {"train_loss": -38.775054931640625, "global_step": 107874, "epoch": 891} {"train_loss": -37.863250732421875, "global_step": 107875, "epoch": 891} {"train_loss": -37.715938568115234, "global_step": 107876, "epoch": 891} {"train_loss": -38.44915008544922, "global_step": 107877, "epoch": 891} {"train_loss": -38.4350700378418, "global_step": 107878, "epoch": 891} {"train_loss": -38.70610046386719, "global_step": 107879, "epoch": 891} {"train_loss": -37.809444427490234, "global_step": 107880, "epoch": 891} {"train_loss": -39.024173736572266, "global_step": 107881, "epoch": 891} {"train_loss": -39.28825759887695, "global_step": 107882, "epoch": 891} {"train_loss": -39.14291000366211, "global_step": 107883, "epoch": 891} {"train_loss": -38.4582633972168, "global_step": 107884, "epoch": 891} {"train_loss": -39.50405502319336, "global_step": 107885, "epoch": 891} {"train_loss": -39.05953598022461, "global_step": 107886, "epoch": 891} {"train_loss": -38.66366195678711, "global_step": 107887, "epoch": 891} {"train_loss": -38.97324752807617, "global_step": 107888, "epoch": 891} {"train_loss": -39.34407424926758, "global_step": 107889, "epoch": 891} {"train_loss": -39.05107498168945, "global_step": 107890, "epoch": 891} {"train_loss": -39.55464553833008, "global_step": 107891, "epoch": 891} {"train_loss": -39.361873626708984, "global_step": 107892, "epoch": 891} {"train_loss": -39.31640625, "global_step": 107893, "epoch": 891} {"train_loss": -39.345096588134766, "global_step": 107894, "epoch": 891} {"train_loss": -39.8765754699707, "global_step": 107895, "epoch": 891} {"train_loss": -39.52463912963867, "global_step": 107896, "epoch": 891} {"train_loss": -39.5169677734375, "global_step": 107897, "epoch": 891} {"train_loss": -38.699012756347656, "global_step": 107898, "epoch": 891} {"train_loss": -39.89385986328125, "global_step": 107899, "epoch": 891} {"train_loss": -39.37675094604492, "global_step": 107900, "epoch": 891} {"train_loss": -38.92007064819336, "global_step": 107901, "epoch": 891} {"train_loss": -38.36768341064453, "global_step": 107902, "epoch": 891} {"train_loss": -39.60116195678711, "global_step": 107903, "epoch": 891} {"train_loss": -39.45594787597656, "global_step": 107904, "epoch": 891} {"train_loss": -38.66755294799805, "global_step": 107905, "epoch": 891} {"train_loss": -39.21084213256836, "global_step": 107906, "epoch": 891} {"train_loss": -39.0007209777832, "global_step": 107907, "epoch": 891} {"train_loss": -37.83026885986328, "global_step": 107908, "epoch": 891} {"train_loss": -39.15872573852539, "global_step": 107909, "epoch": 891} {"train_loss": -39.6230583190918, "global_step": 107910, "epoch": 891} {"train_loss": -39.32147216796875, "global_step": 107911, "epoch": 891} {"train_loss": -38.98876953125, "global_step": 107912, "epoch": 891} {"train_loss": -39.31173324584961, "global_step": 107913, "epoch": 891} {"train_loss": -38.86301803588867, "global_step": 107914, "epoch": 891} {"train_loss": -39.3992805480957, "global_step": 107915, "epoch": 891} {"train_loss": -38.573143005371094, "global_step": 107916, "epoch": 891} {"train_loss": -36.127010345458984, "global_step": 107917, "epoch": 891} {"train_loss": -30.269439697265625, "global_step": 107918, "epoch": 891} {"train_loss": -27.7320556640625, "global_step": 107919, "epoch": 891} {"train_loss": -37.00117111206055, "global_step": 107920, "epoch": 891} {"train_loss": -29.8233699798584, "global_step": 107921, "epoch": 891} {"train_loss": -37.43083572387695, "global_step": 107922, "epoch": 891} {"train_loss": -33.374794006347656, "global_step": 107923, "epoch": 891} {"train_loss": -38.134178161621094, "global_step": 107924, "epoch": 891} {"train_loss": -35.14484405517578, "global_step": 107925, "epoch": 891} {"train_loss": -37.501564025878906, "global_step": 107926, "epoch": 891} {"train_loss": -35.73061752319336, "global_step": 107927, "epoch": 891} {"train_loss": -37.80389404296875, "global_step": 107928, "epoch": 891} {"train_loss": -38.031429290771484, "global_step": 107929, "epoch": 891} {"train_loss": -37.248592376708984, "global_step": 107930, "epoch": 891} {"train_loss": -38.141807792600524, "global_step": 107931, "epoch": 891, "val_loss": 2593151.25} {"train_loss": -38.49155044555664, "global_step": 107932, "epoch": 892} {"train_loss": -37.176822662353516, "global_step": 107933, "epoch": 892} {"train_loss": -39.06850814819336, "global_step": 107934, "epoch": 892} {"train_loss": -38.093994140625, "global_step": 107935, "epoch": 892} {"train_loss": -37.514347076416016, "global_step": 107936, "epoch": 892} {"train_loss": -38.62751007080078, "global_step": 107937, "epoch": 892} {"train_loss": -38.9635009765625, "global_step": 107938, "epoch": 892} {"train_loss": -37.5806770324707, "global_step": 107939, "epoch": 892} {"train_loss": -39.224639892578125, "global_step": 107940, "epoch": 892} {"train_loss": -38.52631378173828, "global_step": 107941, "epoch": 892} {"train_loss": -37.93342590332031, "global_step": 107942, "epoch": 892} {"train_loss": -37.81056213378906, "global_step": 107943, "epoch": 892} {"train_loss": -39.29277038574219, "global_step": 107944, "epoch": 892} {"train_loss": -38.42741012573242, "global_step": 107945, "epoch": 892} {"train_loss": -38.80375289916992, "global_step": 107946, "epoch": 892} {"train_loss": -38.8958740234375, "global_step": 107947, "epoch": 892} {"train_loss": -39.27103805541992, "global_step": 107948, "epoch": 892} {"train_loss": -38.76355743408203, "global_step": 107949, "epoch": 892} {"train_loss": -38.8211784362793, "global_step": 107950, "epoch": 892} {"train_loss": -39.539180755615234, "global_step": 107951, "epoch": 892} {"train_loss": -38.95517349243164, "global_step": 107952, "epoch": 892} {"train_loss": -39.2637825012207, "global_step": 107953, "epoch": 892} {"train_loss": -38.94399642944336, "global_step": 107954, "epoch": 892} {"train_loss": -39.58253860473633, "global_step": 107955, "epoch": 892} {"train_loss": -39.25590515136719, "global_step": 107956, "epoch": 892} {"train_loss": -38.965084075927734, "global_step": 107957, "epoch": 892} {"train_loss": -39.37708282470703, "global_step": 107958, "epoch": 892} {"train_loss": -39.397335052490234, "global_step": 107959, "epoch": 892} {"train_loss": -39.83930969238281, "global_step": 107960, "epoch": 892} {"train_loss": -39.602745056152344, "global_step": 107961, "epoch": 892} {"train_loss": -39.688880920410156, "global_step": 107962, "epoch": 892} {"train_loss": -39.420654296875, "global_step": 107963, "epoch": 892} {"train_loss": -39.73882293701172, "global_step": 107964, "epoch": 892} {"train_loss": -39.863914489746094, "global_step": 107965, "epoch": 892} {"train_loss": -39.61763381958008, "global_step": 107966, "epoch": 892} {"train_loss": -39.71505355834961, "global_step": 107967, "epoch": 892} {"train_loss": -39.73358917236328, "global_step": 107968, "epoch": 892} {"train_loss": -39.96729278564453, "global_step": 107969, "epoch": 892} {"train_loss": -39.48385238647461, "global_step": 107970, "epoch": 892} {"train_loss": -39.21366882324219, "global_step": 107971, "epoch": 892} {"train_loss": -39.0343017578125, "global_step": 107972, "epoch": 892} {"train_loss": -39.11371994018555, "global_step": 107973, "epoch": 892} {"train_loss": -38.50265121459961, "global_step": 107974, "epoch": 892} {"train_loss": -38.970726013183594, "global_step": 107975, "epoch": 892} {"train_loss": -39.963050842285156, "global_step": 107976, "epoch": 892} {"train_loss": -38.95075988769531, "global_step": 107977, "epoch": 892} {"train_loss": -35.85498046875, "global_step": 107978, "epoch": 892} {"train_loss": -36.76458740234375, "global_step": 107979, "epoch": 892} {"train_loss": -37.367923736572266, "global_step": 107980, "epoch": 892} {"train_loss": -37.62815475463867, "global_step": 107981, "epoch": 892} {"train_loss": -39.30921173095703, "global_step": 107982, "epoch": 892} {"train_loss": -38.80784225463867, "global_step": 107983, "epoch": 892} {"train_loss": -38.12911605834961, "global_step": 107984, "epoch": 892} {"train_loss": -37.42340087890625, "global_step": 107985, "epoch": 892} {"train_loss": -38.48101806640625, "global_step": 107986, "epoch": 892} {"train_loss": -39.68157958984375, "global_step": 107987, "epoch": 892} {"train_loss": -38.94586944580078, "global_step": 107988, "epoch": 892} {"train_loss": -39.05846405029297, "global_step": 107989, "epoch": 892} {"train_loss": -39.15712356567383, "global_step": 107990, "epoch": 892} {"train_loss": -39.55598831176758, "global_step": 107991, "epoch": 892} {"train_loss": -39.46790313720703, "global_step": 107992, "epoch": 892} {"train_loss": -39.437252044677734, "global_step": 107993, "epoch": 892} {"train_loss": -39.368160247802734, "global_step": 107994, "epoch": 892} {"train_loss": -39.663387298583984, "global_step": 107995, "epoch": 892} {"train_loss": -39.804073333740234, "global_step": 107996, "epoch": 892} {"train_loss": -39.97340774536133, "global_step": 107997, "epoch": 892} {"train_loss": -39.91949462890625, "global_step": 107998, "epoch": 892} {"train_loss": -39.704864501953125, "global_step": 107999, "epoch": 892} {"train_loss": -39.663612365722656, "global_step": 108000, "epoch": 892} {"train_loss": -39.91911315917969, "global_step": 108001, "epoch": 892} {"train_loss": -39.96144485473633, "global_step": 108002, "epoch": 892} {"train_loss": -39.64506149291992, "global_step": 108003, "epoch": 892} {"train_loss": -39.914608001708984, "global_step": 108004, "epoch": 892} {"train_loss": -39.41284942626953, "global_step": 108005, "epoch": 892} {"train_loss": -38.73368453979492, "global_step": 108006, "epoch": 892} {"train_loss": -39.27145004272461, "global_step": 108007, "epoch": 892} {"train_loss": -39.88386535644531, "global_step": 108008, "epoch": 892} {"train_loss": -39.369564056396484, "global_step": 108009, "epoch": 892} {"train_loss": -39.71737289428711, "global_step": 108010, "epoch": 892} {"train_loss": -40.12080764770508, "global_step": 108011, "epoch": 892} {"train_loss": -39.477413177490234, "global_step": 108012, "epoch": 892} {"train_loss": -38.2929801940918, "global_step": 108013, "epoch": 892} {"train_loss": -34.48877716064453, "global_step": 108014, "epoch": 892} {"train_loss": -35.417869567871094, "global_step": 108015, "epoch": 892} {"train_loss": -37.841094970703125, "global_step": 108016, "epoch": 892} {"train_loss": -38.90115737915039, "global_step": 108017, "epoch": 892} {"train_loss": -36.184932708740234, "global_step": 108018, "epoch": 892} {"train_loss": -35.6281623840332, "global_step": 108019, "epoch": 892} {"train_loss": -37.925228118896484, "global_step": 108020, "epoch": 892} {"train_loss": -36.49991989135742, "global_step": 108021, "epoch": 892} {"train_loss": -37.9801025390625, "global_step": 108022, "epoch": 892} {"train_loss": -37.81891632080078, "global_step": 108023, "epoch": 892} {"train_loss": -35.49557113647461, "global_step": 108024, "epoch": 892} {"train_loss": -38.276580810546875, "global_step": 108025, "epoch": 892} {"train_loss": -37.9108772277832, "global_step": 108026, "epoch": 892} {"train_loss": -37.532711029052734, "global_step": 108027, "epoch": 892} {"train_loss": -37.4275016784668, "global_step": 108028, "epoch": 892} {"train_loss": -38.83784866333008, "global_step": 108029, "epoch": 892} {"train_loss": -37.79337692260742, "global_step": 108030, "epoch": 892} {"train_loss": -37.487586975097656, "global_step": 108031, "epoch": 892} {"train_loss": -38.32878112792969, "global_step": 108032, "epoch": 892} {"train_loss": -37.75199508666992, "global_step": 108033, "epoch": 892} {"train_loss": -37.53474044799805, "global_step": 108034, "epoch": 892} {"train_loss": -39.012630462646484, "global_step": 108035, "epoch": 892} {"train_loss": -37.549903869628906, "global_step": 108036, "epoch": 892} {"train_loss": -35.91811752319336, "global_step": 108037, "epoch": 892} {"train_loss": -38.00997543334961, "global_step": 108038, "epoch": 892} {"train_loss": -31.761322021484375, "global_step": 108039, "epoch": 892} {"train_loss": -36.75851058959961, "global_step": 108040, "epoch": 892} {"train_loss": -35.84231185913086, "global_step": 108041, "epoch": 892} {"train_loss": -36.64330291748047, "global_step": 108042, "epoch": 892} {"train_loss": -37.73836135864258, "global_step": 108043, "epoch": 892} {"train_loss": -37.246883392333984, "global_step": 108044, "epoch": 892} {"train_loss": -38.6679573059082, "global_step": 108045, "epoch": 892} {"train_loss": -37.51568603515625, "global_step": 108046, "epoch": 892} {"train_loss": -37.794212341308594, "global_step": 108047, "epoch": 892} {"train_loss": -37.41796875, "global_step": 108048, "epoch": 892} {"train_loss": -37.1030158996582, "global_step": 108049, "epoch": 892} {"train_loss": -38.59687423706055, "global_step": 108050, "epoch": 892} {"train_loss": -38.109657287597656, "global_step": 108051, "epoch": 892} {"train_loss": -38.46435203236982, "global_step": 108052, "epoch": 892, "val_loss": 2626079.0} {"train_loss": -35.93026351928711, "global_step": 108053, "epoch": 893} {"train_loss": -37.55254364013672, "global_step": 108054, "epoch": 893} {"train_loss": -39.17167282104492, "global_step": 108055, "epoch": 893} {"train_loss": -36.135581970214844, "global_step": 108056, "epoch": 893} {"train_loss": -38.029476165771484, "global_step": 108057, "epoch": 893} {"train_loss": -38.850223541259766, "global_step": 108058, "epoch": 893} {"train_loss": -38.374237060546875, "global_step": 108059, "epoch": 893} {"train_loss": -38.518714904785156, "global_step": 108060, "epoch": 893} {"train_loss": -38.31820297241211, "global_step": 108061, "epoch": 893} {"train_loss": -38.12230682373047, "global_step": 108062, "epoch": 893} {"train_loss": -38.81759262084961, "global_step": 108063, "epoch": 893} {"train_loss": -38.3193359375, "global_step": 108064, "epoch": 893} {"train_loss": -37.37196731567383, "global_step": 108065, "epoch": 893} {"train_loss": -38.92338562011719, "global_step": 108066, "epoch": 893} {"train_loss": -36.51728057861328, "global_step": 108067, "epoch": 893} {"train_loss": -39.63275146484375, "global_step": 108068, "epoch": 893} {"train_loss": -38.695125579833984, "global_step": 108069, "epoch": 893} {"train_loss": -39.04591751098633, "global_step": 108070, "epoch": 893} {"train_loss": -38.57358932495117, "global_step": 108071, "epoch": 893} {"train_loss": -39.14414596557617, "global_step": 108072, "epoch": 893} {"train_loss": -37.979095458984375, "global_step": 108073, "epoch": 893} {"train_loss": -38.85561752319336, "global_step": 108074, "epoch": 893} {"train_loss": -38.32304000854492, "global_step": 108075, "epoch": 893} {"train_loss": -39.36835479736328, "global_step": 108076, "epoch": 893} {"train_loss": -38.9956169128418, "global_step": 108077, "epoch": 893} {"train_loss": -39.12335205078125, "global_step": 108078, "epoch": 893} {"train_loss": -39.46395492553711, "global_step": 108079, "epoch": 893} {"train_loss": -39.06358337402344, "global_step": 108080, "epoch": 893} {"train_loss": -39.58698272705078, "global_step": 108081, "epoch": 893} {"train_loss": -38.6328125, "global_step": 108082, "epoch": 893} {"train_loss": -39.189964294433594, "global_step": 108083, "epoch": 893} {"train_loss": -39.17057418823242, "global_step": 108084, "epoch": 893} {"train_loss": -39.361751556396484, "global_step": 108085, "epoch": 893} {"train_loss": -39.436676025390625, "global_step": 108086, "epoch": 893} {"train_loss": -38.81550598144531, "global_step": 108087, "epoch": 893} {"train_loss": -39.63840866088867, "global_step": 108088, "epoch": 893} {"train_loss": -39.191192626953125, "global_step": 108089, "epoch": 893} {"train_loss": -39.51484680175781, "global_step": 108090, "epoch": 893} {"train_loss": -38.79218292236328, "global_step": 108091, "epoch": 893} {"train_loss": -39.85371780395508, "global_step": 108092, "epoch": 893} {"train_loss": -39.62331771850586, "global_step": 108093, "epoch": 893} {"train_loss": -39.49259567260742, "global_step": 108094, "epoch": 893} {"train_loss": -39.776123046875, "global_step": 108095, "epoch": 893} {"train_loss": -40.06411361694336, "global_step": 108096, "epoch": 893} {"train_loss": -39.5864372253418, "global_step": 108097, "epoch": 893} {"train_loss": -39.63235855102539, "global_step": 108098, "epoch": 893} {"train_loss": -39.850624084472656, "global_step": 108099, "epoch": 893} {"train_loss": -39.6677131652832, "global_step": 108100, "epoch": 893} {"train_loss": -39.674278259277344, "global_step": 108101, "epoch": 893} {"train_loss": -39.99201583862305, "global_step": 108102, "epoch": 893} {"train_loss": -39.87567901611328, "global_step": 108103, "epoch": 893} {"train_loss": -39.75074768066406, "global_step": 108104, "epoch": 893} {"train_loss": -40.36668014526367, "global_step": 108105, "epoch": 893} {"train_loss": -39.983638763427734, "global_step": 108106, "epoch": 893} {"train_loss": -39.8235969543457, "global_step": 108107, "epoch": 893} {"train_loss": -39.63202667236328, "global_step": 108108, "epoch": 893} {"train_loss": -39.57905960083008, "global_step": 108109, "epoch": 893} {"train_loss": -40.20991897583008, "global_step": 108110, "epoch": 893} {"train_loss": -40.349849700927734, "global_step": 108111, "epoch": 893} {"train_loss": -39.475059509277344, "global_step": 108112, "epoch": 893} {"train_loss": -38.76982498168945, "global_step": 108113, "epoch": 893} {"train_loss": -38.64933395385742, "global_step": 108114, "epoch": 893} {"train_loss": -38.407325744628906, "global_step": 108115, "epoch": 893} {"train_loss": -36.746559143066406, "global_step": 108116, "epoch": 893} {"train_loss": -31.690519332885742, "global_step": 108117, "epoch": 893} {"train_loss": -38.940223693847656, "global_step": 108118, "epoch": 893} {"train_loss": -32.9372673034668, "global_step": 108119, "epoch": 893} {"train_loss": -34.711402893066406, "global_step": 108120, "epoch": 893} {"train_loss": -35.49161911010742, "global_step": 108121, "epoch": 893} {"train_loss": -35.471675872802734, "global_step": 108122, "epoch": 893} {"train_loss": -35.90754318237305, "global_step": 108123, "epoch": 893} {"train_loss": -35.37748336791992, "global_step": 108124, "epoch": 893} {"train_loss": -32.687538146972656, "global_step": 108125, "epoch": 893} {"train_loss": -36.247642517089844, "global_step": 108126, "epoch": 893} {"train_loss": -35.85730743408203, "global_step": 108127, "epoch": 893} {"train_loss": -36.462562561035156, "global_step": 108128, "epoch": 893} {"train_loss": -34.161415100097656, "global_step": 108129, "epoch": 893} {"train_loss": -37.64875411987305, "global_step": 108130, "epoch": 893} {"train_loss": -36.499046325683594, "global_step": 108131, "epoch": 893} {"train_loss": -38.32740020751953, "global_step": 108132, "epoch": 893} {"train_loss": -36.25161361694336, "global_step": 108133, "epoch": 893} {"train_loss": -38.37795639038086, "global_step": 108134, "epoch": 893} {"train_loss": -37.23771286010742, "global_step": 108135, "epoch": 893} {"train_loss": -38.4455680847168, "global_step": 108136, "epoch": 893} {"train_loss": -37.56379318237305, "global_step": 108137, "epoch": 893} {"train_loss": -38.205501556396484, "global_step": 108138, "epoch": 893} {"train_loss": -38.560211181640625, "global_step": 108139, "epoch": 893} {"train_loss": -37.99184036254883, "global_step": 108140, "epoch": 893} {"train_loss": -38.49190902709961, "global_step": 108141, "epoch": 893} {"train_loss": -38.4891471862793, "global_step": 108142, "epoch": 893} {"train_loss": -38.69380569458008, "global_step": 108143, "epoch": 893} {"train_loss": -39.21810531616211, "global_step": 108144, "epoch": 893} {"train_loss": -38.51237106323242, "global_step": 108145, "epoch": 893} {"train_loss": -38.88782501220703, "global_step": 108146, "epoch": 893} {"train_loss": -38.59878158569336, "global_step": 108147, "epoch": 893} {"train_loss": -37.6277961730957, "global_step": 108148, "epoch": 893} {"train_loss": -37.546932220458984, "global_step": 108149, "epoch": 893} {"train_loss": -38.87941360473633, "global_step": 108150, "epoch": 893} {"train_loss": -38.2645263671875, "global_step": 108151, "epoch": 893} {"train_loss": -37.98175811767578, "global_step": 108152, "epoch": 893} {"train_loss": -38.6689567565918, "global_step": 108153, "epoch": 893} {"train_loss": -39.1497688293457, "global_step": 108154, "epoch": 893} {"train_loss": -38.167598724365234, "global_step": 108155, "epoch": 893} {"train_loss": -38.87092208862305, "global_step": 108156, "epoch": 893} {"train_loss": -39.319602966308594, "global_step": 108157, "epoch": 893} {"train_loss": -38.336875915527344, "global_step": 108158, "epoch": 893} {"train_loss": -39.491676330566406, "global_step": 108159, "epoch": 893} {"train_loss": -39.019813537597656, "global_step": 108160, "epoch": 893} {"train_loss": -38.931575775146484, "global_step": 108161, "epoch": 893} {"train_loss": -38.61896896362305, "global_step": 108162, "epoch": 893} {"train_loss": -38.11534118652344, "global_step": 108163, "epoch": 893} {"train_loss": -39.20133590698242, "global_step": 108164, "epoch": 893} {"train_loss": -38.61490249633789, "global_step": 108165, "epoch": 893} {"train_loss": -38.4975700378418, "global_step": 108166, "epoch": 893} {"train_loss": -38.922882080078125, "global_step": 108167, "epoch": 893} {"train_loss": -39.050384521484375, "global_step": 108168, "epoch": 893} {"train_loss": -39.15691375732422, "global_step": 108169, "epoch": 893} {"train_loss": -39.4764289855957, "global_step": 108170, "epoch": 893} {"train_loss": -39.59271240234375, "global_step": 108171, "epoch": 893} {"train_loss": -39.163856506347656, "global_step": 108172, "epoch": 893} {"train_loss": -38.382146173272254, "global_step": 108173, "epoch": 893, "val_loss": 2658799.25} {"train_loss": -39.75403594970703, "global_step": 108174, "epoch": 894} {"train_loss": -39.30644607543945, "global_step": 108175, "epoch": 894} {"train_loss": -39.207096099853516, "global_step": 108176, "epoch": 894} {"train_loss": -39.226802825927734, "global_step": 108177, "epoch": 894} {"train_loss": -39.49452590942383, "global_step": 108178, "epoch": 894} {"train_loss": -39.78890609741211, "global_step": 108179, "epoch": 894} {"train_loss": -40.078670501708984, "global_step": 108180, "epoch": 894} {"train_loss": -39.41579818725586, "global_step": 108181, "epoch": 894} {"train_loss": -39.66740417480469, "global_step": 108182, "epoch": 894} {"train_loss": -40.024085998535156, "global_step": 108183, "epoch": 894} {"train_loss": -39.800167083740234, "global_step": 108184, "epoch": 894} {"train_loss": -39.15617370605469, "global_step": 108185, "epoch": 894} {"train_loss": -38.829349517822266, "global_step": 108186, "epoch": 894} {"train_loss": -39.971534729003906, "global_step": 108187, "epoch": 894} {"train_loss": -40.169593811035156, "global_step": 108188, "epoch": 894} {"train_loss": -39.87252426147461, "global_step": 108189, "epoch": 894} {"train_loss": -39.867713928222656, "global_step": 108190, "epoch": 894} {"train_loss": -39.311092376708984, "global_step": 108191, "epoch": 894} {"train_loss": -40.00741195678711, "global_step": 108192, "epoch": 894} {"train_loss": -39.79730987548828, "global_step": 108193, "epoch": 894} {"train_loss": -39.10210418701172, "global_step": 108194, "epoch": 894} {"train_loss": -38.57467269897461, "global_step": 108195, "epoch": 894} {"train_loss": -38.656185150146484, "global_step": 108196, "epoch": 894} {"train_loss": -37.09780502319336, "global_step": 108197, "epoch": 894} {"train_loss": -35.838680267333984, "global_step": 108198, "epoch": 894} {"train_loss": -35.20905685424805, "global_step": 108199, "epoch": 894} {"train_loss": -33.492958068847656, "global_step": 108200, "epoch": 894} {"train_loss": -34.13175582885742, "global_step": 108201, "epoch": 894} {"train_loss": -38.85323715209961, "global_step": 108202, "epoch": 894} {"train_loss": -38.32979965209961, "global_step": 108203, "epoch": 894} {"train_loss": -35.90534210205078, "global_step": 108204, "epoch": 894} {"train_loss": -39.237972259521484, "global_step": 108205, "epoch": 894} {"train_loss": -39.45179748535156, "global_step": 108206, "epoch": 894} {"train_loss": -37.65675735473633, "global_step": 108207, "epoch": 894} {"train_loss": -39.2305908203125, "global_step": 108208, "epoch": 894} {"train_loss": -37.18282699584961, "global_step": 108209, "epoch": 894} {"train_loss": -38.156314849853516, "global_step": 108210, "epoch": 894} {"train_loss": -39.523250579833984, "global_step": 108211, "epoch": 894} {"train_loss": -37.60128402709961, "global_step": 108212, "epoch": 894} {"train_loss": -38.0023307800293, "global_step": 108213, "epoch": 894} {"train_loss": -39.3658561706543, "global_step": 108214, "epoch": 894} {"train_loss": -37.387451171875, "global_step": 108215, "epoch": 894} {"train_loss": -39.409847259521484, "global_step": 108216, "epoch": 894} {"train_loss": -38.26831817626953, "global_step": 108217, "epoch": 894} {"train_loss": -38.35856246948242, "global_step": 108218, "epoch": 894} {"train_loss": -38.18696212768555, "global_step": 108219, "epoch": 894} {"train_loss": -38.651763916015625, "global_step": 108220, "epoch": 894} {"train_loss": -38.76284408569336, "global_step": 108221, "epoch": 894} {"train_loss": -37.56721878051758, "global_step": 108222, "epoch": 894} {"train_loss": -38.178260803222656, "global_step": 108223, "epoch": 894} {"train_loss": -38.51339340209961, "global_step": 108224, "epoch": 894} {"train_loss": -38.20166778564453, "global_step": 108225, "epoch": 894} {"train_loss": -39.07915115356445, "global_step": 108226, "epoch": 894} {"train_loss": -38.05537796020508, "global_step": 108227, "epoch": 894} {"train_loss": -39.07265090942383, "global_step": 108228, "epoch": 894} {"train_loss": -38.34737777709961, "global_step": 108229, "epoch": 894} {"train_loss": -39.389644622802734, "global_step": 108230, "epoch": 894} {"train_loss": -39.422176361083984, "global_step": 108231, "epoch": 894} {"train_loss": -39.11871337890625, "global_step": 108232, "epoch": 894} {"train_loss": -39.320308685302734, "global_step": 108233, "epoch": 894} {"train_loss": -39.1492805480957, "global_step": 108234, "epoch": 894} {"train_loss": -38.665462493896484, "global_step": 108235, "epoch": 894} {"train_loss": -37.89410400390625, "global_step": 108236, "epoch": 894} {"train_loss": -38.95383834838867, "global_step": 108237, "epoch": 894} {"train_loss": -38.586395263671875, "global_step": 108238, "epoch": 894} {"train_loss": -39.58632278442383, "global_step": 108239, "epoch": 894} {"train_loss": -38.694068908691406, "global_step": 108240, "epoch": 894} {"train_loss": -39.09502029418945, "global_step": 108241, "epoch": 894} {"train_loss": -39.53688430786133, "global_step": 108242, "epoch": 894} {"train_loss": -37.6627311706543, "global_step": 108243, "epoch": 894} {"train_loss": -38.300445556640625, "global_step": 108244, "epoch": 894} {"train_loss": -39.482120513916016, "global_step": 108245, "epoch": 894} {"train_loss": -39.47628402709961, "global_step": 108246, "epoch": 894} {"train_loss": -37.14144515991211, "global_step": 108247, "epoch": 894} {"train_loss": -38.43867111206055, "global_step": 108248, "epoch": 894} {"train_loss": -39.221710205078125, "global_step": 108249, "epoch": 894} {"train_loss": -39.020606994628906, "global_step": 108250, "epoch": 894} {"train_loss": -39.6209716796875, "global_step": 108251, "epoch": 894} {"train_loss": -39.35099411010742, "global_step": 108252, "epoch": 894} {"train_loss": -37.82565689086914, "global_step": 108253, "epoch": 894} {"train_loss": -38.932071685791016, "global_step": 108254, "epoch": 894} {"train_loss": -38.7254638671875, "global_step": 108255, "epoch": 894} {"train_loss": -39.29575729370117, "global_step": 108256, "epoch": 894} {"train_loss": -39.23469924926758, "global_step": 108257, "epoch": 894} {"train_loss": -37.63114547729492, "global_step": 108258, "epoch": 894} {"train_loss": -38.288490295410156, "global_step": 108259, "epoch": 894} {"train_loss": -39.23311233520508, "global_step": 108260, "epoch": 894} {"train_loss": -37.28586196899414, "global_step": 108261, "epoch": 894} {"train_loss": -37.9194450378418, "global_step": 108262, "epoch": 894} {"train_loss": -37.881263732910156, "global_step": 108263, "epoch": 894} {"train_loss": -38.490631103515625, "global_step": 108264, "epoch": 894} {"train_loss": -35.84637451171875, "global_step": 108265, "epoch": 894} {"train_loss": -38.77325439453125, "global_step": 108266, "epoch": 894} {"train_loss": -38.20737075805664, "global_step": 108267, "epoch": 894} {"train_loss": -37.90174102783203, "global_step": 108268, "epoch": 894} {"train_loss": -38.842872619628906, "global_step": 108269, "epoch": 894} {"train_loss": -37.69669723510742, "global_step": 108270, "epoch": 894} {"train_loss": -38.23806381225586, "global_step": 108271, "epoch": 894} {"train_loss": -37.71045684814453, "global_step": 108272, "epoch": 894} {"train_loss": -38.780006408691406, "global_step": 108273, "epoch": 894} {"train_loss": -37.77256393432617, "global_step": 108274, "epoch": 894} {"train_loss": -37.71921920776367, "global_step": 108275, "epoch": 894} {"train_loss": -36.99911880493164, "global_step": 108276, "epoch": 894} {"train_loss": -36.23881912231445, "global_step": 108277, "epoch": 894} {"train_loss": -33.5803337097168, "global_step": 108278, "epoch": 894} {"train_loss": -33.92567825317383, "global_step": 108279, "epoch": 894} {"train_loss": -36.531646728515625, "global_step": 108280, "epoch": 894} {"train_loss": -37.577606201171875, "global_step": 108281, "epoch": 894} {"train_loss": -35.52288818359375, "global_step": 108282, "epoch": 894} {"train_loss": -35.835609436035156, "global_step": 108283, "epoch": 894} {"train_loss": -37.37456130981445, "global_step": 108284, "epoch": 894} {"train_loss": -36.542903900146484, "global_step": 108285, "epoch": 894} {"train_loss": -36.3713493347168, "global_step": 108286, "epoch": 894} {"train_loss": -38.11317825317383, "global_step": 108287, "epoch": 894} {"train_loss": -37.351722717285156, "global_step": 108288, "epoch": 894} {"train_loss": -37.35576248168945, "global_step": 108289, "epoch": 894} {"train_loss": -36.26287078857422, "global_step": 108290, "epoch": 894} {"train_loss": -36.98200225830078, "global_step": 108291, "epoch": 894} {"train_loss": -37.53746032714844, "global_step": 108292, "epoch": 894} {"train_loss": -36.09728240966797, "global_step": 108293, "epoch": 894} {"train_loss": -38.2397136215336, "global_step": 108294, "epoch": 894, "val_loss": 2652832.75} {"train_loss": -36.84077072143555, "global_step": 108295, "epoch": 895} {"train_loss": -37.95602035522461, "global_step": 108296, "epoch": 895} {"train_loss": -37.36468505859375, "global_step": 108297, "epoch": 895} {"train_loss": -36.72504806518555, "global_step": 108298, "epoch": 895} {"train_loss": -37.674007415771484, "global_step": 108299, "epoch": 895} {"train_loss": -38.02815628051758, "global_step": 108300, "epoch": 895} {"train_loss": -36.42817687988281, "global_step": 108301, "epoch": 895} {"train_loss": -36.93170928955078, "global_step": 108302, "epoch": 895} {"train_loss": -35.763160705566406, "global_step": 108303, "epoch": 895} {"train_loss": -34.137786865234375, "global_step": 108304, "epoch": 895} {"train_loss": -34.175872802734375, "global_step": 108305, "epoch": 895} {"train_loss": -36.319786071777344, "global_step": 108306, "epoch": 895} {"train_loss": -33.04331588745117, "global_step": 108307, "epoch": 895} {"train_loss": -36.9685173034668, "global_step": 108308, "epoch": 895} {"train_loss": -32.7963752746582, "global_step": 108309, "epoch": 895} {"train_loss": -37.39772415161133, "global_step": 108310, "epoch": 895} {"train_loss": -36.333961486816406, "global_step": 108311, "epoch": 895} {"train_loss": -35.99715042114258, "global_step": 108312, "epoch": 895} {"train_loss": -38.082942962646484, "global_step": 108313, "epoch": 895} {"train_loss": -37.044288635253906, "global_step": 108314, "epoch": 895} {"train_loss": -36.99274826049805, "global_step": 108315, "epoch": 895} {"train_loss": -37.737342834472656, "global_step": 108316, "epoch": 895} {"train_loss": -38.72932052612305, "global_step": 108317, "epoch": 895} {"train_loss": -37.70888137817383, "global_step": 108318, "epoch": 895} {"train_loss": -38.01967239379883, "global_step": 108319, "epoch": 895} {"train_loss": -38.056522369384766, "global_step": 108320, "epoch": 895} {"train_loss": -38.72469711303711, "global_step": 108321, "epoch": 895} {"train_loss": -38.58961868286133, "global_step": 108322, "epoch": 895} {"train_loss": -38.04548263549805, "global_step": 108323, "epoch": 895} {"train_loss": -39.19594955444336, "global_step": 108324, "epoch": 895} {"train_loss": -38.96551513671875, "global_step": 108325, "epoch": 895} {"train_loss": -39.45560836791992, "global_step": 108326, "epoch": 895} {"train_loss": -38.86156463623047, "global_step": 108327, "epoch": 895} {"train_loss": -38.82282638549805, "global_step": 108328, "epoch": 895} {"train_loss": -38.89876937866211, "global_step": 108329, "epoch": 895} {"train_loss": -38.71982192993164, "global_step": 108330, "epoch": 895} {"train_loss": -39.2114372253418, "global_step": 108331, "epoch": 895} {"train_loss": -39.1046142578125, "global_step": 108332, "epoch": 895} {"train_loss": -39.20621871948242, "global_step": 108333, "epoch": 895} {"train_loss": -39.45699691772461, "global_step": 108334, "epoch": 895} {"train_loss": -39.589935302734375, "global_step": 108335, "epoch": 895} {"train_loss": -39.03364944458008, "global_step": 108336, "epoch": 895} {"train_loss": -39.164894104003906, "global_step": 108337, "epoch": 895} {"train_loss": -39.80301284790039, "global_step": 108338, "epoch": 895} {"train_loss": -39.520389556884766, "global_step": 108339, "epoch": 895} {"train_loss": -39.78840255737305, "global_step": 108340, "epoch": 895} {"train_loss": -39.76171875, "global_step": 108341, "epoch": 895} {"train_loss": -39.7711296081543, "global_step": 108342, "epoch": 895} {"train_loss": -39.962554931640625, "global_step": 108343, "epoch": 895} {"train_loss": -39.67724609375, "global_step": 108344, "epoch": 895} {"train_loss": -39.75969314575195, "global_step": 108345, "epoch": 895} {"train_loss": -39.67538070678711, "global_step": 108346, "epoch": 895} {"train_loss": -39.545406341552734, "global_step": 108347, "epoch": 895} {"train_loss": -39.291133880615234, "global_step": 108348, "epoch": 895} {"train_loss": -38.93528366088867, "global_step": 108349, "epoch": 895} {"train_loss": -38.984500885009766, "global_step": 108350, "epoch": 895} {"train_loss": -39.31958770751953, "global_step": 108351, "epoch": 895} {"train_loss": -39.22080612182617, "global_step": 108352, "epoch": 895} {"train_loss": -39.546234130859375, "global_step": 108353, "epoch": 895} {"train_loss": -38.77323532104492, "global_step": 108354, "epoch": 895} {"train_loss": -39.0973014831543, "global_step": 108355, "epoch": 895} {"train_loss": -39.80650329589844, "global_step": 108356, "epoch": 895} {"train_loss": -39.792327880859375, "global_step": 108357, "epoch": 895} {"train_loss": -39.57789993286133, "global_step": 108358, "epoch": 895} {"train_loss": -39.925025939941406, "global_step": 108359, "epoch": 895} {"train_loss": -39.38289260864258, "global_step": 108360, "epoch": 895} {"train_loss": -39.72603225708008, "global_step": 108361, "epoch": 895} {"train_loss": -39.278053283691406, "global_step": 108362, "epoch": 895} {"train_loss": -38.47133255004883, "global_step": 108363, "epoch": 895} {"train_loss": -37.110107421875, "global_step": 108364, "epoch": 895} {"train_loss": -38.944618225097656, "global_step": 108365, "epoch": 895} {"train_loss": -39.38570022583008, "global_step": 108366, "epoch": 895} {"train_loss": -39.31317901611328, "global_step": 108367, "epoch": 895} {"train_loss": -39.04816818237305, "global_step": 108368, "epoch": 895} {"train_loss": -38.16279983520508, "global_step": 108369, "epoch": 895} {"train_loss": -38.37673568725586, "global_step": 108370, "epoch": 895} {"train_loss": -38.904273986816406, "global_step": 108371, "epoch": 895} {"train_loss": -39.05247116088867, "global_step": 108372, "epoch": 895} {"train_loss": -39.200958251953125, "global_step": 108373, "epoch": 895} {"train_loss": -39.7273063659668, "global_step": 108374, "epoch": 895} {"train_loss": -39.87939453125, "global_step": 108375, "epoch": 895} {"train_loss": -39.26694869995117, "global_step": 108376, "epoch": 895} {"train_loss": -38.53818893432617, "global_step": 108377, "epoch": 895} {"train_loss": -38.189300537109375, "global_step": 108378, "epoch": 895} {"train_loss": -39.760616302490234, "global_step": 108379, "epoch": 895} {"train_loss": -39.74723434448242, "global_step": 108380, "epoch": 895} {"train_loss": -38.84680938720703, "global_step": 108381, "epoch": 895} {"train_loss": -39.07770919799805, "global_step": 108382, "epoch": 895} {"train_loss": -39.55295944213867, "global_step": 108383, "epoch": 895} {"train_loss": -40.010860443115234, "global_step": 108384, "epoch": 895} {"train_loss": -38.8493766784668, "global_step": 108385, "epoch": 895} {"train_loss": -38.481136322021484, "global_step": 108386, "epoch": 895} {"train_loss": -39.98446273803711, "global_step": 108387, "epoch": 895} {"train_loss": -39.0510139465332, "global_step": 108388, "epoch": 895} {"train_loss": -38.67112350463867, "global_step": 108389, "epoch": 895} {"train_loss": -38.845272064208984, "global_step": 108390, "epoch": 895} {"train_loss": -39.11053466796875, "global_step": 108391, "epoch": 895} {"train_loss": -38.962158203125, "global_step": 108392, "epoch": 895} {"train_loss": -38.41892623901367, "global_step": 108393, "epoch": 895} {"train_loss": -38.519954681396484, "global_step": 108394, "epoch": 895} {"train_loss": -39.95039749145508, "global_step": 108395, "epoch": 895} {"train_loss": -38.96027374267578, "global_step": 108396, "epoch": 895} {"train_loss": -38.77962875366211, "global_step": 108397, "epoch": 895} {"train_loss": -39.652854919433594, "global_step": 108398, "epoch": 895} {"train_loss": -38.87369918823242, "global_step": 108399, "epoch": 895} {"train_loss": -37.11086654663086, "global_step": 108400, "epoch": 895} {"train_loss": -39.474700927734375, "global_step": 108401, "epoch": 895} {"train_loss": -36.29996871948242, "global_step": 108402, "epoch": 895} {"train_loss": -39.29716110229492, "global_step": 108403, "epoch": 895} {"train_loss": -36.35307312011719, "global_step": 108404, "epoch": 895} {"train_loss": -39.526546478271484, "global_step": 108405, "epoch": 895} {"train_loss": -36.27443313598633, "global_step": 108406, "epoch": 895} {"train_loss": -38.129295349121094, "global_step": 108407, "epoch": 895} {"train_loss": -37.42848587036133, "global_step": 108408, "epoch": 895} {"train_loss": -38.39775466918945, "global_step": 108409, "epoch": 895} {"train_loss": -37.063804626464844, "global_step": 108410, "epoch": 895} {"train_loss": -37.882720947265625, "global_step": 108411, "epoch": 895} {"train_loss": -37.8297119140625, "global_step": 108412, "epoch": 895} {"train_loss": -38.39099884033203, "global_step": 108413, "epoch": 895} {"train_loss": -38.890846252441406, "global_step": 108414, "epoch": 895} {"train_loss": -38.461647443534915, "global_step": 108415, "epoch": 895, "val_loss": 2703748.25} {"train_loss": -38.50676345825195, "global_step": 108416, "epoch": 896} {"train_loss": -36.9737548828125, "global_step": 108417, "epoch": 896} {"train_loss": -39.44789123535156, "global_step": 108418, "epoch": 896} {"train_loss": -37.92934799194336, "global_step": 108419, "epoch": 896} {"train_loss": -39.43539047241211, "global_step": 108420, "epoch": 896} {"train_loss": -38.627376556396484, "global_step": 108421, "epoch": 896} {"train_loss": -39.789798736572266, "global_step": 108422, "epoch": 896} {"train_loss": -39.2152214050293, "global_step": 108423, "epoch": 896} {"train_loss": -39.4787712097168, "global_step": 108424, "epoch": 896} {"train_loss": -39.194000244140625, "global_step": 108425, "epoch": 896} {"train_loss": -39.057735443115234, "global_step": 108426, "epoch": 896} {"train_loss": -38.59495544433594, "global_step": 108427, "epoch": 896} {"train_loss": -38.189849853515625, "global_step": 108428, "epoch": 896} {"train_loss": -39.015350341796875, "global_step": 108429, "epoch": 896} {"train_loss": -38.30281448364258, "global_step": 108430, "epoch": 896} {"train_loss": -39.22822570800781, "global_step": 108431, "epoch": 896} {"train_loss": -38.44649124145508, "global_step": 108432, "epoch": 896} {"train_loss": -37.91078567504883, "global_step": 108433, "epoch": 896} {"train_loss": -38.1922607421875, "global_step": 108434, "epoch": 896} {"train_loss": -38.472530364990234, "global_step": 108435, "epoch": 896} {"train_loss": -37.96559524536133, "global_step": 108436, "epoch": 896} {"train_loss": -39.046504974365234, "global_step": 108437, "epoch": 896} {"train_loss": -39.31982421875, "global_step": 108438, "epoch": 896} {"train_loss": -38.579071044921875, "global_step": 108439, "epoch": 896} {"train_loss": -39.12995529174805, "global_step": 108440, "epoch": 896} {"train_loss": -39.59653854370117, "global_step": 108441, "epoch": 896} {"train_loss": -39.33110046386719, "global_step": 108442, "epoch": 896} {"train_loss": -39.90656661987305, "global_step": 108443, "epoch": 896} {"train_loss": -39.9073371887207, "global_step": 108444, "epoch": 896} {"train_loss": -40.153533935546875, "global_step": 108445, "epoch": 896} {"train_loss": -40.07426071166992, "global_step": 108446, "epoch": 896} {"train_loss": -38.82459259033203, "global_step": 108447, "epoch": 896} {"train_loss": -39.273521423339844, "global_step": 108448, "epoch": 896} {"train_loss": -39.4896240234375, "global_step": 108449, "epoch": 896} {"train_loss": -39.85044479370117, "global_step": 108450, "epoch": 896} {"train_loss": -39.720420837402344, "global_step": 108451, "epoch": 896} {"train_loss": -39.75997543334961, "global_step": 108452, "epoch": 896} {"train_loss": -38.84455490112305, "global_step": 108453, "epoch": 896} {"train_loss": -39.012508392333984, "global_step": 108454, "epoch": 896} {"train_loss": -37.909847259521484, "global_step": 108455, "epoch": 896} {"train_loss": -38.90399169921875, "global_step": 108456, "epoch": 896} {"train_loss": -38.631832122802734, "global_step": 108457, "epoch": 896} {"train_loss": -39.72645950317383, "global_step": 108458, "epoch": 896} {"train_loss": -39.13209915161133, "global_step": 108459, "epoch": 896} {"train_loss": -39.2139892578125, "global_step": 108460, "epoch": 896} {"train_loss": -37.85894775390625, "global_step": 108461, "epoch": 896} {"train_loss": -38.016693115234375, "global_step": 108462, "epoch": 896} {"train_loss": -39.22730255126953, "global_step": 108463, "epoch": 896} {"train_loss": -38.923336029052734, "global_step": 108464, "epoch": 896} {"train_loss": -37.51256561279297, "global_step": 108465, "epoch": 896} {"train_loss": -38.257110595703125, "global_step": 108466, "epoch": 896} {"train_loss": -35.826202392578125, "global_step": 108467, "epoch": 896} {"train_loss": -38.97994613647461, "global_step": 108468, "epoch": 896} {"train_loss": -34.275787353515625, "global_step": 108469, "epoch": 896} {"train_loss": -35.79939651489258, "global_step": 108470, "epoch": 896} {"train_loss": -29.843835830688477, "global_step": 108471, "epoch": 896} {"train_loss": -31.33851432800293, "global_step": 108472, "epoch": 896} {"train_loss": -35.53232955932617, "global_step": 108473, "epoch": 896} {"train_loss": -31.696731567382812, "global_step": 108474, "epoch": 896} {"train_loss": -33.683929443359375, "global_step": 108475, "epoch": 896} {"train_loss": -33.75946044921875, "global_step": 108476, "epoch": 896} {"train_loss": -32.645050048828125, "global_step": 108477, "epoch": 896} {"train_loss": -36.54815673828125, "global_step": 108478, "epoch": 896} {"train_loss": -34.60115432739258, "global_step": 108479, "epoch": 896} {"train_loss": -30.743127822875977, "global_step": 108480, "epoch": 896} {"train_loss": -37.89703369140625, "global_step": 108481, "epoch": 896} {"train_loss": -33.870540618896484, "global_step": 108482, "epoch": 896} {"train_loss": -34.78392028808594, "global_step": 108483, "epoch": 896} {"train_loss": -37.48247146606445, "global_step": 108484, "epoch": 896} {"train_loss": -34.5506477355957, "global_step": 108485, "epoch": 896} {"train_loss": -35.66487503051758, "global_step": 108486, "epoch": 896} {"train_loss": -37.513973236083984, "global_step": 108487, "epoch": 896} {"train_loss": -35.689666748046875, "global_step": 108488, "epoch": 896} {"train_loss": -35.797096252441406, "global_step": 108489, "epoch": 896} {"train_loss": -36.88714599609375, "global_step": 108490, "epoch": 896} {"train_loss": -37.708839416503906, "global_step": 108491, "epoch": 896} {"train_loss": -36.80330276489258, "global_step": 108492, "epoch": 896} {"train_loss": -37.5711669921875, "global_step": 108493, "epoch": 896} {"train_loss": -36.80768966674805, "global_step": 108494, "epoch": 896} {"train_loss": -37.25712203979492, "global_step": 108495, "epoch": 896} {"train_loss": -37.48600387573242, "global_step": 108496, "epoch": 896} {"train_loss": -37.67982864379883, "global_step": 108497, "epoch": 896} {"train_loss": -38.17530059814453, "global_step": 108498, "epoch": 896} {"train_loss": -37.69995880126953, "global_step": 108499, "epoch": 896} {"train_loss": -38.009254455566406, "global_step": 108500, "epoch": 896} {"train_loss": -37.24980545043945, "global_step": 108501, "epoch": 896} {"train_loss": -36.57155990600586, "global_step": 108502, "epoch": 896} {"train_loss": -38.048824310302734, "global_step": 108503, "epoch": 896} {"train_loss": -37.09846878051758, "global_step": 108504, "epoch": 896} {"train_loss": -38.16950225830078, "global_step": 108505, "epoch": 896} {"train_loss": -37.47306442260742, "global_step": 108506, "epoch": 896} {"train_loss": -38.3931999206543, "global_step": 108507, "epoch": 896} {"train_loss": -37.93276596069336, "global_step": 108508, "epoch": 896} {"train_loss": -38.09525680541992, "global_step": 108509, "epoch": 896} {"train_loss": -37.97014236450195, "global_step": 108510, "epoch": 896} {"train_loss": -38.62949752807617, "global_step": 108511, "epoch": 896} {"train_loss": -38.39028549194336, "global_step": 108512, "epoch": 896} {"train_loss": -37.079891204833984, "global_step": 108513, "epoch": 896} {"train_loss": -38.86295700073242, "global_step": 108514, "epoch": 896} {"train_loss": -38.03049850463867, "global_step": 108515, "epoch": 896} {"train_loss": -39.13294219970703, "global_step": 108516, "epoch": 896} {"train_loss": -38.574859619140625, "global_step": 108517, "epoch": 896} {"train_loss": -38.65892028808594, "global_step": 108518, "epoch": 896} {"train_loss": -38.5696907043457, "global_step": 108519, "epoch": 896} {"train_loss": -39.31108474731445, "global_step": 108520, "epoch": 896} {"train_loss": -38.8229866027832, "global_step": 108521, "epoch": 896} {"train_loss": -39.07304000854492, "global_step": 108522, "epoch": 896} {"train_loss": -39.23588562011719, "global_step": 108523, "epoch": 896} {"train_loss": -38.99041748046875, "global_step": 108524, "epoch": 896} {"train_loss": -39.316463470458984, "global_step": 108525, "epoch": 896} {"train_loss": -38.94674301147461, "global_step": 108526, "epoch": 896} {"train_loss": -39.313961029052734, "global_step": 108527, "epoch": 896} {"train_loss": -39.45827865600586, "global_step": 108528, "epoch": 896} {"train_loss": -39.21474075317383, "global_step": 108529, "epoch": 896} {"train_loss": -39.54543685913086, "global_step": 108530, "epoch": 896} {"train_loss": -39.320281982421875, "global_step": 108531, "epoch": 896} {"train_loss": -39.5536003112793, "global_step": 108532, "epoch": 896} {"train_loss": -39.3985710144043, "global_step": 108533, "epoch": 896} {"train_loss": -38.59660720825195, "global_step": 108534, "epoch": 896} {"train_loss": -39.52959060668945, "global_step": 108535, "epoch": 896} {"train_loss": -37.89789954886949, "global_step": 108536, "epoch": 896, "val_loss": 2686699.0} {"train_loss": -39.65156936645508, "global_step": 108537, "epoch": 897} {"train_loss": -39.4354248046875, "global_step": 108538, "epoch": 897} {"train_loss": -39.34747314453125, "global_step": 108539, "epoch": 897} {"train_loss": -38.4444580078125, "global_step": 108540, "epoch": 897} {"train_loss": -38.802364349365234, "global_step": 108541, "epoch": 897} {"train_loss": -39.125465393066406, "global_step": 108542, "epoch": 897} {"train_loss": -39.72886657714844, "global_step": 108543, "epoch": 897} {"train_loss": -39.982505798339844, "global_step": 108544, "epoch": 897} {"train_loss": -39.73682403564453, "global_step": 108545, "epoch": 897} {"train_loss": -39.77186965942383, "global_step": 108546, "epoch": 897} {"train_loss": -39.654293060302734, "global_step": 108547, "epoch": 897} {"train_loss": -39.82208251953125, "global_step": 108548, "epoch": 897} {"train_loss": -39.95232009887695, "global_step": 108549, "epoch": 897} {"train_loss": -40.00209426879883, "global_step": 108550, "epoch": 897} {"train_loss": -39.808589935302734, "global_step": 108551, "epoch": 897} {"train_loss": -39.508235931396484, "global_step": 108552, "epoch": 897} {"train_loss": -38.7245979309082, "global_step": 108553, "epoch": 897} {"train_loss": -38.71278381347656, "global_step": 108554, "epoch": 897} {"train_loss": -39.82341384887695, "global_step": 108555, "epoch": 897} {"train_loss": -40.124820709228516, "global_step": 108556, "epoch": 897} {"train_loss": -38.594810485839844, "global_step": 108557, "epoch": 897} {"train_loss": -33.58984375, "global_step": 108558, "epoch": 897} {"train_loss": -27.738611221313477, "global_step": 108559, "epoch": 897} {"train_loss": -33.740447998046875, "global_step": 108560, "epoch": 897} {"train_loss": -39.95566177368164, "global_step": 108561, "epoch": 897} {"train_loss": -34.832855224609375, "global_step": 108562, "epoch": 897} {"train_loss": -35.697689056396484, "global_step": 108563, "epoch": 897} {"train_loss": -39.820281982421875, "global_step": 108564, "epoch": 897} {"train_loss": -36.873592376708984, "global_step": 108565, "epoch": 897} {"train_loss": -38.84126663208008, "global_step": 108566, "epoch": 897} {"train_loss": -37.55987548828125, "global_step": 108567, "epoch": 897} {"train_loss": -36.92850875854492, "global_step": 108568, "epoch": 897} {"train_loss": -39.247188568115234, "global_step": 108569, "epoch": 897} {"train_loss": -36.626529693603516, "global_step": 108570, "epoch": 897} {"train_loss": -39.073081970214844, "global_step": 108571, "epoch": 897} {"train_loss": -36.90386962890625, "global_step": 108572, "epoch": 897} {"train_loss": -38.38694381713867, "global_step": 108573, "epoch": 897} {"train_loss": -37.612003326416016, "global_step": 108574, "epoch": 897} {"train_loss": -38.35334777832031, "global_step": 108575, "epoch": 897} {"train_loss": -37.9382438659668, "global_step": 108576, "epoch": 897} {"train_loss": -38.277156829833984, "global_step": 108577, "epoch": 897} {"train_loss": -38.06325912475586, "global_step": 108578, "epoch": 897} {"train_loss": -39.18691635131836, "global_step": 108579, "epoch": 897} {"train_loss": -33.301639556884766, "global_step": 108580, "epoch": 897} {"train_loss": -39.12870407104492, "global_step": 108581, "epoch": 897} {"train_loss": -37.93939971923828, "global_step": 108582, "epoch": 897} {"train_loss": -38.98408889770508, "global_step": 108583, "epoch": 897} {"train_loss": -36.22287368774414, "global_step": 108584, "epoch": 897} {"train_loss": -36.802242279052734, "global_step": 108585, "epoch": 897} {"train_loss": -37.823699951171875, "global_step": 108586, "epoch": 897} {"train_loss": -37.49848175048828, "global_step": 108587, "epoch": 897} {"train_loss": -39.059600830078125, "global_step": 108588, "epoch": 897} {"train_loss": -33.58343505859375, "global_step": 108589, "epoch": 897} {"train_loss": -34.648983001708984, "global_step": 108590, "epoch": 897} {"train_loss": -36.29795837402344, "global_step": 108591, "epoch": 897} {"train_loss": -30.96282958984375, "global_step": 108592, "epoch": 897} {"train_loss": -33.181060791015625, "global_step": 108593, "epoch": 897} {"train_loss": -35.37504196166992, "global_step": 108594, "epoch": 897} {"train_loss": -30.674041748046875, "global_step": 108595, "epoch": 897} {"train_loss": -33.459102630615234, "global_step": 108596, "epoch": 897} {"train_loss": -28.33546257019043, "global_step": 108597, "epoch": 897} {"train_loss": -32.54264450073242, "global_step": 108598, "epoch": 897} {"train_loss": -26.877408981323242, "global_step": 108599, "epoch": 897} {"train_loss": -27.216711044311523, "global_step": 108600, "epoch": 897} {"train_loss": -30.695165634155273, "global_step": 108601, "epoch": 897} {"train_loss": -29.71530532836914, "global_step": 108602, "epoch": 897} {"train_loss": -28.370336532592773, "global_step": 108603, "epoch": 897} {"train_loss": -32.962249755859375, "global_step": 108604, "epoch": 897} {"train_loss": -29.634613037109375, "global_step": 108605, "epoch": 897} {"train_loss": -32.45998001098633, "global_step": 108606, "epoch": 897} {"train_loss": -33.10541915893555, "global_step": 108607, "epoch": 897} {"train_loss": -34.05144119262695, "global_step": 108608, "epoch": 897} {"train_loss": -31.577726364135742, "global_step": 108609, "epoch": 897} {"train_loss": -31.066883087158203, "global_step": 108610, "epoch": 897} {"train_loss": -32.47636032104492, "global_step": 108611, "epoch": 897} {"train_loss": -32.4222297668457, "global_step": 108612, "epoch": 897} {"train_loss": -33.12053298950195, "global_step": 108613, "epoch": 897} {"train_loss": -34.64762878417969, "global_step": 108614, "epoch": 897} {"train_loss": -33.409507751464844, "global_step": 108615, "epoch": 897} {"train_loss": -34.59812545776367, "global_step": 108616, "epoch": 897} {"train_loss": -33.7667350769043, "global_step": 108617, "epoch": 897} {"train_loss": -34.00539016723633, "global_step": 108618, "epoch": 897} {"train_loss": -31.493818283081055, "global_step": 108619, "epoch": 897} {"train_loss": -34.24656295776367, "global_step": 108620, "epoch": 897} {"train_loss": -35.19609451293945, "global_step": 108621, "epoch": 897} {"train_loss": -34.47919464111328, "global_step": 108622, "epoch": 897} {"train_loss": -34.965118408203125, "global_step": 108623, "epoch": 897} {"train_loss": -35.5083122253418, "global_step": 108624, "epoch": 897} {"train_loss": -34.75202560424805, "global_step": 108625, "epoch": 897} {"train_loss": -35.82041549682617, "global_step": 108626, "epoch": 897} {"train_loss": -35.49673080444336, "global_step": 108627, "epoch": 897} {"train_loss": -35.542842864990234, "global_step": 108628, "epoch": 897} {"train_loss": -35.74110794067383, "global_step": 108629, "epoch": 897} {"train_loss": -34.01397705078125, "global_step": 108630, "epoch": 897} {"train_loss": -35.91714096069336, "global_step": 108631, "epoch": 897} {"train_loss": -35.661556243896484, "global_step": 108632, "epoch": 897} {"train_loss": -35.699378967285156, "global_step": 108633, "epoch": 897} {"train_loss": -36.07206344604492, "global_step": 108634, "epoch": 897} {"train_loss": -35.85676193237305, "global_step": 108635, "epoch": 897} {"train_loss": -36.28931427001953, "global_step": 108636, "epoch": 897} {"train_loss": -36.26119613647461, "global_step": 108637, "epoch": 897} {"train_loss": -36.93218994140625, "global_step": 108638, "epoch": 897} {"train_loss": -36.3785514831543, "global_step": 108639, "epoch": 897} {"train_loss": -36.776268005371094, "global_step": 108640, "epoch": 897} {"train_loss": -36.467403411865234, "global_step": 108641, "epoch": 897} {"train_loss": -36.7125358581543, "global_step": 108642, "epoch": 897} {"train_loss": -36.673927307128906, "global_step": 108643, "epoch": 897} {"train_loss": -36.616111755371094, "global_step": 108644, "epoch": 897} {"train_loss": -36.914424896240234, "global_step": 108645, "epoch": 897} {"train_loss": -37.281246185302734, "global_step": 108646, "epoch": 897} {"train_loss": -36.94698715209961, "global_step": 108647, "epoch": 897} {"train_loss": -37.06643295288086, "global_step": 108648, "epoch": 897} {"train_loss": -37.15869140625, "global_step": 108649, "epoch": 897} {"train_loss": -37.17890548706055, "global_step": 108650, "epoch": 897} {"train_loss": -36.73861312866211, "global_step": 108651, "epoch": 897} {"train_loss": -37.2854118347168, "global_step": 108652, "epoch": 897} {"train_loss": -36.85245895385742, "global_step": 108653, "epoch": 897} {"train_loss": -37.46332931518555, "global_step": 108654, "epoch": 897} {"train_loss": -37.14146423339844, "global_step": 108655, "epoch": 897} {"train_loss": -37.24074935913086, "global_step": 108656, "epoch": 897} {"train_loss": -35.98431986028498, "global_step": 108657, "epoch": 897, "val_loss": 2488522.25} {"train_loss": -37.4310417175293, "global_step": 108658, "epoch": 898} {"train_loss": -37.55558395385742, "global_step": 108659, "epoch": 898} {"train_loss": -37.709739685058594, "global_step": 108660, "epoch": 898} {"train_loss": -37.91665267944336, "global_step": 108661, "epoch": 898} {"train_loss": -37.5252685546875, "global_step": 108662, "epoch": 898} {"train_loss": -38.04787063598633, "global_step": 108663, "epoch": 898} {"train_loss": -38.174591064453125, "global_step": 108664, "epoch": 898} {"train_loss": -38.13335418701172, "global_step": 108665, "epoch": 898} {"train_loss": -37.935665130615234, "global_step": 108666, "epoch": 898} {"train_loss": -37.8499870300293, "global_step": 108667, "epoch": 898} {"train_loss": -38.30084228515625, "global_step": 108668, "epoch": 898} {"train_loss": -38.087642669677734, "global_step": 108669, "epoch": 898} {"train_loss": -37.60444259643555, "global_step": 108670, "epoch": 898} {"train_loss": -38.3867301940918, "global_step": 108671, "epoch": 898} {"train_loss": -37.94712829589844, "global_step": 108672, "epoch": 898} {"train_loss": -38.489131927490234, "global_step": 108673, "epoch": 898} {"train_loss": -37.865020751953125, "global_step": 108674, "epoch": 898} {"train_loss": -38.48354721069336, "global_step": 108675, "epoch": 898} {"train_loss": -38.46120834350586, "global_step": 108676, "epoch": 898} {"train_loss": -38.58451461791992, "global_step": 108677, "epoch": 898} {"train_loss": -38.69841384887695, "global_step": 108678, "epoch": 898} {"train_loss": -38.476619720458984, "global_step": 108679, "epoch": 898} {"train_loss": -38.765872955322266, "global_step": 108680, "epoch": 898} {"train_loss": -38.11568069458008, "global_step": 108681, "epoch": 898} {"train_loss": -38.328975677490234, "global_step": 108682, "epoch": 898} {"train_loss": -38.46382522583008, "global_step": 108683, "epoch": 898} {"train_loss": -38.9740104675293, "global_step": 108684, "epoch": 898} {"train_loss": -38.56343460083008, "global_step": 108685, "epoch": 898} {"train_loss": -38.98225784301758, "global_step": 108686, "epoch": 898} {"train_loss": -38.6160774230957, "global_step": 108687, "epoch": 898} {"train_loss": -38.750247955322266, "global_step": 108688, "epoch": 898} {"train_loss": -38.434261322021484, "global_step": 108689, "epoch": 898} {"train_loss": -38.6369514465332, "global_step": 108690, "epoch": 898} {"train_loss": -38.81135177612305, "global_step": 108691, "epoch": 898} {"train_loss": -38.78843307495117, "global_step": 108692, "epoch": 898} {"train_loss": -38.796302795410156, "global_step": 108693, "epoch": 898} {"train_loss": -39.137508392333984, "global_step": 108694, "epoch": 898} {"train_loss": -38.90245056152344, "global_step": 108695, "epoch": 898} {"train_loss": -38.694923400878906, "global_step": 108696, "epoch": 898} {"train_loss": -38.92121124267578, "global_step": 108697, "epoch": 898} {"train_loss": -39.06438064575195, "global_step": 108698, "epoch": 898} {"train_loss": -39.00315475463867, "global_step": 108699, "epoch": 898} {"train_loss": -39.082698822021484, "global_step": 108700, "epoch": 898} {"train_loss": -38.58419418334961, "global_step": 108701, "epoch": 898} {"train_loss": -38.006858825683594, "global_step": 108702, "epoch": 898} {"train_loss": -38.12678527832031, "global_step": 108703, "epoch": 898} {"train_loss": -38.3609504699707, "global_step": 108704, "epoch": 898} {"train_loss": -39.32310485839844, "global_step": 108705, "epoch": 898} {"train_loss": -38.90388488769531, "global_step": 108706, "epoch": 898} {"train_loss": -38.39459228515625, "global_step": 108707, "epoch": 898} {"train_loss": -37.81538391113281, "global_step": 108708, "epoch": 898} {"train_loss": -38.71993637084961, "global_step": 108709, "epoch": 898} {"train_loss": -38.8930778503418, "global_step": 108710, "epoch": 898} {"train_loss": -38.533809661865234, "global_step": 108711, "epoch": 898} {"train_loss": -37.3689079284668, "global_step": 108712, "epoch": 898} {"train_loss": -36.67116165161133, "global_step": 108713, "epoch": 898} {"train_loss": -38.594085693359375, "global_step": 108714, "epoch": 898} {"train_loss": -38.506404876708984, "global_step": 108715, "epoch": 898} {"train_loss": -38.17361068725586, "global_step": 108716, "epoch": 898} {"train_loss": -38.31279373168945, "global_step": 108717, "epoch": 898} {"train_loss": -38.4328498840332, "global_step": 108718, "epoch": 898} {"train_loss": -38.008056640625, "global_step": 108719, "epoch": 898} {"train_loss": -38.87031173706055, "global_step": 108720, "epoch": 898} {"train_loss": -38.91225051879883, "global_step": 108721, "epoch": 898} {"train_loss": -39.40164566040039, "global_step": 108722, "epoch": 898} {"train_loss": -39.02535629272461, "global_step": 108723, "epoch": 898} {"train_loss": -39.25827407836914, "global_step": 108724, "epoch": 898} {"train_loss": -38.887901306152344, "global_step": 108725, "epoch": 898} {"train_loss": -38.85358428955078, "global_step": 108726, "epoch": 898} {"train_loss": -38.89797592163086, "global_step": 108727, "epoch": 898} {"train_loss": -39.11333084106445, "global_step": 108728, "epoch": 898} {"train_loss": -39.08256912231445, "global_step": 108729, "epoch": 898} {"train_loss": -38.06996536254883, "global_step": 108730, "epoch": 898} {"train_loss": -38.907840728759766, "global_step": 108731, "epoch": 898} {"train_loss": -39.212928771972656, "global_step": 108732, "epoch": 898} {"train_loss": -39.039241790771484, "global_step": 108733, "epoch": 898} {"train_loss": -39.053619384765625, "global_step": 108734, "epoch": 898} {"train_loss": -37.85874557495117, "global_step": 108735, "epoch": 898} {"train_loss": -37.51736831665039, "global_step": 108736, "epoch": 898} {"train_loss": -37.341949462890625, "global_step": 108737, "epoch": 898} {"train_loss": -35.681846618652344, "global_step": 108738, "epoch": 898} {"train_loss": -34.739315032958984, "global_step": 108739, "epoch": 898} {"train_loss": -38.562129974365234, "global_step": 108740, "epoch": 898} {"train_loss": -33.135440826416016, "global_step": 108741, "epoch": 898} {"train_loss": -33.01984786987305, "global_step": 108742, "epoch": 898} {"train_loss": -32.93262481689453, "global_step": 108743, "epoch": 898} {"train_loss": -32.79782485961914, "global_step": 108744, "epoch": 898} {"train_loss": -33.01958084106445, "global_step": 108745, "epoch": 898} {"train_loss": -33.911231994628906, "global_step": 108746, "epoch": 898} {"train_loss": -32.959747314453125, "global_step": 108747, "epoch": 898} {"train_loss": -33.76267623901367, "global_step": 108748, "epoch": 898} {"train_loss": -33.88157272338867, "global_step": 108749, "epoch": 898} {"train_loss": -33.954254150390625, "global_step": 108750, "epoch": 898} {"train_loss": -33.27861022949219, "global_step": 108751, "epoch": 898} {"train_loss": -34.49879837036133, "global_step": 108752, "epoch": 898} {"train_loss": -33.50005340576172, "global_step": 108753, "epoch": 898} {"train_loss": -34.643157958984375, "global_step": 108754, "epoch": 898} {"train_loss": -34.05604934692383, "global_step": 108755, "epoch": 898} {"train_loss": -34.59527587890625, "global_step": 108756, "epoch": 898} {"train_loss": -34.79052734375, "global_step": 108757, "epoch": 898} {"train_loss": -34.98698043823242, "global_step": 108758, "epoch": 898} {"train_loss": -34.484893798828125, "global_step": 108759, "epoch": 898} {"train_loss": -35.0571174621582, "global_step": 108760, "epoch": 898} {"train_loss": -34.4964714050293, "global_step": 108761, "epoch": 898} {"train_loss": -35.12663650512695, "global_step": 108762, "epoch": 898} {"train_loss": -34.74742126464844, "global_step": 108763, "epoch": 898} {"train_loss": -35.40554428100586, "global_step": 108764, "epoch": 898} {"train_loss": -34.620418548583984, "global_step": 108765, "epoch": 898} {"train_loss": -35.79207229614258, "global_step": 108766, "epoch": 898} {"train_loss": -35.241058349609375, "global_step": 108767, "epoch": 898} {"train_loss": -35.8094596862793, "global_step": 108768, "epoch": 898} {"train_loss": -35.33433151245117, "global_step": 108769, "epoch": 898} {"train_loss": -34.60135269165039, "global_step": 108770, "epoch": 898} {"train_loss": -34.00979232788086, "global_step": 108771, "epoch": 898} {"train_loss": -32.272804260253906, "global_step": 108772, "epoch": 898} {"train_loss": -29.6364688873291, "global_step": 108773, "epoch": 898} {"train_loss": -30.19474220275879, "global_step": 108774, "epoch": 898} {"train_loss": -34.70437240600586, "global_step": 108775, "epoch": 898} {"train_loss": -35.49519729614258, "global_step": 108776, "epoch": 898} {"train_loss": -34.27315139770508, "global_step": 108777, "epoch": 898} {"train_loss": -37.02515931562944, "global_step": 108778, "epoch": 898, "val_loss": 2519178.0} {"train_loss": -35.365997314453125, "global_step": 108779, "epoch": 899} {"train_loss": -36.097511291503906, "global_step": 108780, "epoch": 899} {"train_loss": -36.96989059448242, "global_step": 108781, "epoch": 899} {"train_loss": -36.597572326660156, "global_step": 108782, "epoch": 899} {"train_loss": -36.6324577331543, "global_step": 108783, "epoch": 899} {"train_loss": -35.62971878051758, "global_step": 108784, "epoch": 899} {"train_loss": -30.413532257080078, "global_step": 108785, "epoch": 899} {"train_loss": -14.190652847290039, "global_step": 108786, "epoch": 899} {"train_loss": -13.170477867126465, "global_step": 108787, "epoch": 899} {"train_loss": -37.08474349975586, "global_step": 108788, "epoch": 899} {"train_loss": -21.854965209960938, "global_step": 108789, "epoch": 899} {"train_loss": -34.20618438720703, "global_step": 108790, "epoch": 899} {"train_loss": -24.29515266418457, "global_step": 108791, "epoch": 899} {"train_loss": -34.491424560546875, "global_step": 108792, "epoch": 899} {"train_loss": -25.76173210144043, "global_step": 108793, "epoch": 899} {"train_loss": -35.07284164428711, "global_step": 108794, "epoch": 899} {"train_loss": -31.165679931640625, "global_step": 108795, "epoch": 899} {"train_loss": -32.2005500793457, "global_step": 108796, "epoch": 899} {"train_loss": -35.61472702026367, "global_step": 108797, "epoch": 899} {"train_loss": -33.42562484741211, "global_step": 108798, "epoch": 899} {"train_loss": -33.55524826049805, "global_step": 108799, "epoch": 899} {"train_loss": -36.7541389465332, "global_step": 108800, "epoch": 899} {"train_loss": -34.760135650634766, "global_step": 108801, "epoch": 899} {"train_loss": -34.425289154052734, "global_step": 108802, "epoch": 899} {"train_loss": -36.74710464477539, "global_step": 108803, "epoch": 899} {"train_loss": -35.9613151550293, "global_step": 108804, "epoch": 899} {"train_loss": -35.247093200683594, "global_step": 108805, "epoch": 899} {"train_loss": -36.48404312133789, "global_step": 108806, "epoch": 899} {"train_loss": -36.41070556640625, "global_step": 108807, "epoch": 899} {"train_loss": -36.28158187866211, "global_step": 108808, "epoch": 899} {"train_loss": -36.53279495239258, "global_step": 108809, "epoch": 899} {"train_loss": -36.106807708740234, "global_step": 108810, "epoch": 899} {"train_loss": -37.09009552001953, "global_step": 108811, "epoch": 899} {"train_loss": -37.07612991333008, "global_step": 108812, "epoch": 899} {"train_loss": -36.254703521728516, "global_step": 108813, "epoch": 899} {"train_loss": -36.312904357910156, "global_step": 108814, "epoch": 899} {"train_loss": -36.0277214050293, "global_step": 108815, "epoch": 899} {"train_loss": -37.00751495361328, "global_step": 108816, "epoch": 899} {"train_loss": -37.04177474975586, "global_step": 108817, "epoch": 899} {"train_loss": -36.62116622924805, "global_step": 108818, "epoch": 899} {"train_loss": -37.15557861328125, "global_step": 108819, "epoch": 899} {"train_loss": -37.336910247802734, "global_step": 108820, "epoch": 899} {"train_loss": -37.08967971801758, "global_step": 108821, "epoch": 899} {"train_loss": -37.01215362548828, "global_step": 108822, "epoch": 899} {"train_loss": -37.7677001953125, "global_step": 108823, "epoch": 899} {"train_loss": -37.03800582885742, "global_step": 108824, "epoch": 899} {"train_loss": -37.3826789855957, "global_step": 108825, "epoch": 899} {"train_loss": -37.57632827758789, "global_step": 108826, "epoch": 899} {"train_loss": -37.797054290771484, "global_step": 108827, "epoch": 899} {"train_loss": -37.90991973876953, "global_step": 108828, "epoch": 899} {"train_loss": -38.159095764160156, "global_step": 108829, "epoch": 899} {"train_loss": -37.94694900512695, "global_step": 108830, "epoch": 899} {"train_loss": -38.0149040222168, "global_step": 108831, "epoch": 899} {"train_loss": -36.993019104003906, "global_step": 108832, "epoch": 899} {"train_loss": -37.66071319580078, "global_step": 108833, "epoch": 899} {"train_loss": -37.51326370239258, "global_step": 108834, "epoch": 899} {"train_loss": -38.15557861328125, "global_step": 108835, "epoch": 899} {"train_loss": -38.147762298583984, "global_step": 108836, "epoch": 899} {"train_loss": -37.444976806640625, "global_step": 108837, "epoch": 899} {"train_loss": -38.5074348449707, "global_step": 108838, "epoch": 899} {"train_loss": -37.927364349365234, "global_step": 108839, "epoch": 899} {"train_loss": -37.9918327331543, "global_step": 108840, "epoch": 899} {"train_loss": -38.21537399291992, "global_step": 108841, "epoch": 899} {"train_loss": -38.35260772705078, "global_step": 108842, "epoch": 899} {"train_loss": -38.69585037231445, "global_step": 108843, "epoch": 899} {"train_loss": -38.52605056762695, "global_step": 108844, "epoch": 899} {"train_loss": -38.535552978515625, "global_step": 108845, "epoch": 899} {"train_loss": -37.59206771850586, "global_step": 108846, "epoch": 899} {"train_loss": -37.860355377197266, "global_step": 108847, "epoch": 899} {"train_loss": -37.29341506958008, "global_step": 108848, "epoch": 899} {"train_loss": -38.52970504760742, "global_step": 108849, "epoch": 899} {"train_loss": -38.51923370361328, "global_step": 108850, "epoch": 899} {"train_loss": -37.2984504699707, "global_step": 108851, "epoch": 899} {"train_loss": -38.49169158935547, "global_step": 108852, "epoch": 899} {"train_loss": -38.489959716796875, "global_step": 108853, "epoch": 899} {"train_loss": -38.52263641357422, "global_step": 108854, "epoch": 899} {"train_loss": -38.40494155883789, "global_step": 108855, "epoch": 899} {"train_loss": -38.712158203125, "global_step": 108856, "epoch": 899} {"train_loss": -36.705692291259766, "global_step": 108857, "epoch": 899} {"train_loss": -36.74569320678711, "global_step": 108858, "epoch": 899} {"train_loss": -33.57592010498047, "global_step": 108859, "epoch": 899} {"train_loss": -26.284687042236328, "global_step": 108860, "epoch": 899} {"train_loss": -22.93242835998535, "global_step": 108861, "epoch": 899} {"train_loss": -34.490631103515625, "global_step": 108862, "epoch": 899} {"train_loss": -36.151206970214844, "global_step": 108863, "epoch": 899} {"train_loss": -30.493268966674805, "global_step": 108864, "epoch": 899} {"train_loss": -37.45244216918945, "global_step": 108865, "epoch": 899} {"train_loss": -34.308982849121094, "global_step": 108866, "epoch": 899} {"train_loss": -35.947357177734375, "global_step": 108867, "epoch": 899} {"train_loss": -36.35622787475586, "global_step": 108868, "epoch": 899} {"train_loss": -36.674774169921875, "global_step": 108869, "epoch": 899} {"train_loss": -36.39988327026367, "global_step": 108870, "epoch": 899} {"train_loss": -37.249141693115234, "global_step": 108871, "epoch": 899} {"train_loss": -35.800994873046875, "global_step": 108872, "epoch": 899} {"train_loss": -37.57483673095703, "global_step": 108873, "epoch": 899} {"train_loss": -37.100460052490234, "global_step": 108874, "epoch": 899} {"train_loss": -37.43776321411133, "global_step": 108875, "epoch": 899} {"train_loss": -37.69639205932617, "global_step": 108876, "epoch": 899} {"train_loss": -37.17620849609375, "global_step": 108877, "epoch": 899} {"train_loss": -37.8801155090332, "global_step": 108878, "epoch": 899} {"train_loss": -37.4986572265625, "global_step": 108879, "epoch": 899} {"train_loss": -37.94704818725586, "global_step": 108880, "epoch": 899} {"train_loss": -36.803646087646484, "global_step": 108881, "epoch": 899} {"train_loss": -37.7982063293457, "global_step": 108882, "epoch": 899} {"train_loss": -37.884063720703125, "global_step": 108883, "epoch": 899} {"train_loss": -36.68435287475586, "global_step": 108884, "epoch": 899} {"train_loss": -37.62272262573242, "global_step": 108885, "epoch": 899} {"train_loss": -37.02790451049805, "global_step": 108886, "epoch": 899} {"train_loss": -37.510345458984375, "global_step": 108887, "epoch": 899} {"train_loss": -38.1465950012207, "global_step": 108888, "epoch": 899} {"train_loss": -38.202205657958984, "global_step": 108889, "epoch": 899} {"train_loss": -38.29036331176758, "global_step": 108890, "epoch": 899} {"train_loss": -38.163368225097656, "global_step": 108891, "epoch": 899} {"train_loss": -38.05738830566406, "global_step": 108892, "epoch": 899} {"train_loss": -38.26781463623047, "global_step": 108893, "epoch": 899} {"train_loss": -38.0904426574707, "global_step": 108894, "epoch": 899} {"train_loss": -36.71364974975586, "global_step": 108895, "epoch": 899} {"train_loss": -37.566585540771484, "global_step": 108896, "epoch": 899} {"train_loss": -37.41466522216797, "global_step": 108897, "epoch": 899} {"train_loss": -38.29702377319336, "global_step": 108898, "epoch": 899} {"train_loss": -35.93219713731246, "global_step": 108899, "epoch": 899, "val_loss": 2656074.0} {"train_loss": -37.77849197387695, "global_step": 108900, "epoch": 900} {"train_loss": -37.7757568359375, "global_step": 108901, "epoch": 900} {"train_loss": -37.759368896484375, "global_step": 108902, "epoch": 900} {"train_loss": -35.2819709777832, "global_step": 108903, "epoch": 900} {"train_loss": -36.511634826660156, "global_step": 108904, "epoch": 900} {"train_loss": -36.679344177246094, "global_step": 108905, "epoch": 900} {"train_loss": -37.95978927612305, "global_step": 108906, "epoch": 900} {"train_loss": -34.28828811645508, "global_step": 108907, "epoch": 900} {"train_loss": -37.449005126953125, "global_step": 108908, "epoch": 900} {"train_loss": -35.6249885559082, "global_step": 108909, "epoch": 900} {"train_loss": -30.699323654174805, "global_step": 108910, "epoch": 900} {"train_loss": -30.391199111938477, "global_step": 108911, "epoch": 900} {"train_loss": -35.41726303100586, "global_step": 108912, "epoch": 900} {"train_loss": -33.60081100463867, "global_step": 108913, "epoch": 900} {"train_loss": -28.922962188720703, "global_step": 108914, "epoch": 900} {"train_loss": -35.392669677734375, "global_step": 108915, "epoch": 900} {"train_loss": -34.389137268066406, "global_step": 108916, "epoch": 900} {"train_loss": -34.37948226928711, "global_step": 108917, "epoch": 900} {"train_loss": -32.875450134277344, "global_step": 108918, "epoch": 900} {"train_loss": -32.566158294677734, "global_step": 108919, "epoch": 900} {"train_loss": -35.13148880004883, "global_step": 108920, "epoch": 900} {"train_loss": -33.869354248046875, "global_step": 108921, "epoch": 900} {"train_loss": -34.29024887084961, "global_step": 108922, "epoch": 900} {"train_loss": -35.754493713378906, "global_step": 108923, "epoch": 900} {"train_loss": -33.768104553222656, "global_step": 108924, "epoch": 900} {"train_loss": -37.4390869140625, "global_step": 108925, "epoch": 900} {"train_loss": -34.21941375732422, "global_step": 108926, "epoch": 900} {"train_loss": -35.865631103515625, "global_step": 108927, "epoch": 900} {"train_loss": -37.2855110168457, "global_step": 108928, "epoch": 900} {"train_loss": -34.71156692504883, "global_step": 108929, "epoch": 900} {"train_loss": -35.768951416015625, "global_step": 108930, "epoch": 900} {"train_loss": -36.85865020751953, "global_step": 108931, "epoch": 900} {"train_loss": -35.524757385253906, "global_step": 108932, "epoch": 900} {"train_loss": -36.34979248046875, "global_step": 108933, "epoch": 900} {"train_loss": -37.54262924194336, "global_step": 108934, "epoch": 900} {"train_loss": -36.14052963256836, "global_step": 108935, "epoch": 900} {"train_loss": -37.11638641357422, "global_step": 108936, "epoch": 900} {"train_loss": -37.361419677734375, "global_step": 108937, "epoch": 900} {"train_loss": -36.9984245300293, "global_step": 108938, "epoch": 900} {"train_loss": -36.33799743652344, "global_step": 108939, "epoch": 900} {"train_loss": -36.76229476928711, "global_step": 108940, "epoch": 900} {"train_loss": -37.49702072143555, "global_step": 108941, "epoch": 900} {"train_loss": -37.01311111450195, "global_step": 108942, "epoch": 900} {"train_loss": -37.362464904785156, "global_step": 108943, "epoch": 900} {"train_loss": -36.98192596435547, "global_step": 108944, "epoch": 900} {"train_loss": -37.659358978271484, "global_step": 108945, "epoch": 900} {"train_loss": -37.67060089111328, "global_step": 108946, "epoch": 900} {"train_loss": -37.31986618041992, "global_step": 108947, "epoch": 900} {"train_loss": -37.493446350097656, "global_step": 108948, "epoch": 900} {"train_loss": -37.41877746582031, "global_step": 108949, "epoch": 900} {"train_loss": -37.34308624267578, "global_step": 108950, "epoch": 900} {"train_loss": -37.86198425292969, "global_step": 108951, "epoch": 900} {"train_loss": -37.33041000366211, "global_step": 108952, "epoch": 900} {"train_loss": -38.028175354003906, "global_step": 108953, "epoch": 900} {"train_loss": -38.048133850097656, "global_step": 108954, "epoch": 900} {"train_loss": -37.861263275146484, "global_step": 108955, "epoch": 900} {"train_loss": -37.04816818237305, "global_step": 108956, "epoch": 900} {"train_loss": -36.42353439331055, "global_step": 108957, "epoch": 900} {"train_loss": -37.885009765625, "global_step": 108958, "epoch": 900} {"train_loss": -37.78144073486328, "global_step": 108959, "epoch": 900} {"train_loss": -38.34552764892578, "global_step": 108960, "epoch": 900} {"train_loss": -37.91997146606445, "global_step": 108961, "epoch": 900} {"train_loss": -37.761714935302734, "global_step": 108962, "epoch": 900} {"train_loss": -38.38762283325195, "global_step": 108963, "epoch": 900} {"train_loss": -37.213626861572266, "global_step": 108964, "epoch": 900} {"train_loss": -37.94004821777344, "global_step": 108965, "epoch": 900} {"train_loss": -37.929954528808594, "global_step": 108966, "epoch": 900} {"train_loss": -38.59941864013672, "global_step": 108967, "epoch": 900} {"train_loss": -38.08674240112305, "global_step": 108968, "epoch": 900} {"train_loss": -38.40451431274414, "global_step": 108969, "epoch": 900} {"train_loss": -37.661399841308594, "global_step": 108970, "epoch": 900} {"train_loss": -37.580604553222656, "global_step": 108971, "epoch": 900} {"train_loss": -38.42216110229492, "global_step": 108972, "epoch": 900} {"train_loss": -38.588134765625, "global_step": 108973, "epoch": 900} {"train_loss": -38.14509201049805, "global_step": 108974, "epoch": 900} {"train_loss": -38.714599609375, "global_step": 108975, "epoch": 900} {"train_loss": -38.723716735839844, "global_step": 108976, "epoch": 900} {"train_loss": -38.546417236328125, "global_step": 108977, "epoch": 900} {"train_loss": -38.630348205566406, "global_step": 108978, "epoch": 900} {"train_loss": -38.85913848876953, "global_step": 108979, "epoch": 900} {"train_loss": -38.708465576171875, "global_step": 108980, "epoch": 900} {"train_loss": -38.65281295776367, "global_step": 108981, "epoch": 900} {"train_loss": -38.5396842956543, "global_step": 108982, "epoch": 900} {"train_loss": -38.7213020324707, "global_step": 108983, "epoch": 900} {"train_loss": -38.28208541870117, "global_step": 108984, "epoch": 900} {"train_loss": -38.18578338623047, "global_step": 108985, "epoch": 900} {"train_loss": -37.03213119506836, "global_step": 108986, "epoch": 900} {"train_loss": -38.76876449584961, "global_step": 108987, "epoch": 900} {"train_loss": -36.95323181152344, "global_step": 108988, "epoch": 900} {"train_loss": -36.416412353515625, "global_step": 108989, "epoch": 900} {"train_loss": -38.21079635620117, "global_step": 108990, "epoch": 900} {"train_loss": -38.64118576049805, "global_step": 108991, "epoch": 900} {"train_loss": -37.51564025878906, "global_step": 108992, "epoch": 900} {"train_loss": -37.3900032043457, "global_step": 108993, "epoch": 900} {"train_loss": -38.72443389892578, "global_step": 108994, "epoch": 900} {"train_loss": -38.15717697143555, "global_step": 108995, "epoch": 900} {"train_loss": -35.503379821777344, "global_step": 108996, "epoch": 900} {"train_loss": -37.06354522705078, "global_step": 108997, "epoch": 900} {"train_loss": -36.61945724487305, "global_step": 108998, "epoch": 900} {"train_loss": -35.94521713256836, "global_step": 108999, "epoch": 900} {"train_loss": -37.36014175415039, "global_step": 109000, "epoch": 900} {"train_loss": -37.503116607666016, "global_step": 109001, "epoch": 900} {"train_loss": -37.44850540161133, "global_step": 109002, "epoch": 900} {"train_loss": -37.88071060180664, "global_step": 109003, "epoch": 900} {"train_loss": -37.83113479614258, "global_step": 109004, "epoch": 900} {"train_loss": -36.44230270385742, "global_step": 109005, "epoch": 900} {"train_loss": -37.162269592285156, "global_step": 109006, "epoch": 900} {"train_loss": -36.591487884521484, "global_step": 109007, "epoch": 900} {"train_loss": -37.46231460571289, "global_step": 109008, "epoch": 900} {"train_loss": -37.5770149230957, "global_step": 109009, "epoch": 900} {"train_loss": -37.38131332397461, "global_step": 109010, "epoch": 900} {"train_loss": -36.76484298706055, "global_step": 109011, "epoch": 900} {"train_loss": -37.78836441040039, "global_step": 109012, "epoch": 900} {"train_loss": -35.95148849487305, "global_step": 109013, "epoch": 900} {"train_loss": -37.1313362121582, "global_step": 109014, "epoch": 900} {"train_loss": -37.37376022338867, "global_step": 109015, "epoch": 900} {"train_loss": -37.01009750366211, "global_step": 109016, "epoch": 900} {"train_loss": -36.69893264770508, "global_step": 109017, "epoch": 900} {"train_loss": -37.11537551879883, "global_step": 109018, "epoch": 900} {"train_loss": -37.08514404296875, "global_step": 109019, "epoch": 900} {"train_loss": -36.86827065333847, "global_step": 109020, "epoch": 900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2516838.75} {"train_loss": -37.42905807495117, "global_step": 109021, "epoch": 901} {"train_loss": -37.138668060302734, "global_step": 109022, "epoch": 901} {"train_loss": -37.55543899536133, "global_step": 109023, "epoch": 901} {"train_loss": -36.9211311340332, "global_step": 109024, "epoch": 901} {"train_loss": -37.00410079956055, "global_step": 109025, "epoch": 901} {"train_loss": -38.208656311035156, "global_step": 109026, "epoch": 901} {"train_loss": -38.11033630371094, "global_step": 109027, "epoch": 901} {"train_loss": -37.884735107421875, "global_step": 109028, "epoch": 901} {"train_loss": -38.108463287353516, "global_step": 109029, "epoch": 901} {"train_loss": -38.40399169921875, "global_step": 109030, "epoch": 901} {"train_loss": -37.467041015625, "global_step": 109031, "epoch": 901} {"train_loss": -38.10892105102539, "global_step": 109032, "epoch": 901} {"train_loss": -37.9471549987793, "global_step": 109033, "epoch": 901} {"train_loss": -38.695682525634766, "global_step": 109034, "epoch": 901} {"train_loss": -36.9971809387207, "global_step": 109035, "epoch": 901} {"train_loss": -38.17870330810547, "global_step": 109036, "epoch": 901} {"train_loss": -37.97610092163086, "global_step": 109037, "epoch": 901} {"train_loss": -37.557823181152344, "global_step": 109038, "epoch": 901} {"train_loss": -38.183712005615234, "global_step": 109039, "epoch": 901} {"train_loss": -38.709957122802734, "global_step": 109040, "epoch": 901} {"train_loss": -38.17938995361328, "global_step": 109041, "epoch": 901} {"train_loss": -38.35636520385742, "global_step": 109042, "epoch": 901} {"train_loss": -37.787353515625, "global_step": 109043, "epoch": 901} {"train_loss": -37.70142364501953, "global_step": 109044, "epoch": 901} {"train_loss": -37.706703186035156, "global_step": 109045, "epoch": 901} {"train_loss": -37.86598587036133, "global_step": 109046, "epoch": 901} {"train_loss": -38.594642639160156, "global_step": 109047, "epoch": 901} {"train_loss": -37.301021575927734, "global_step": 109048, "epoch": 901} {"train_loss": -37.710758209228516, "global_step": 109049, "epoch": 901} {"train_loss": -38.19724655151367, "global_step": 109050, "epoch": 901} {"train_loss": -39.01089096069336, "global_step": 109051, "epoch": 901} {"train_loss": -33.38602828979492, "global_step": 109052, "epoch": 901} {"train_loss": -37.7131462097168, "global_step": 109053, "epoch": 901} {"train_loss": -39.10633087158203, "global_step": 109054, "epoch": 901} {"train_loss": -38.6651725769043, "global_step": 109055, "epoch": 901} {"train_loss": -38.22780227661133, "global_step": 109056, "epoch": 901} {"train_loss": -38.90144348144531, "global_step": 109057, "epoch": 901} {"train_loss": -37.45608139038086, "global_step": 109058, "epoch": 901} {"train_loss": -38.895965576171875, "global_step": 109059, "epoch": 901} {"train_loss": -38.623199462890625, "global_step": 109060, "epoch": 901} {"train_loss": -38.25166320800781, "global_step": 109061, "epoch": 901} {"train_loss": -38.294647216796875, "global_step": 109062, "epoch": 901} {"train_loss": -38.93501663208008, "global_step": 109063, "epoch": 901} {"train_loss": -37.85749816894531, "global_step": 109064, "epoch": 901} {"train_loss": -37.880126953125, "global_step": 109065, "epoch": 901} {"train_loss": -38.006107330322266, "global_step": 109066, "epoch": 901} {"train_loss": -35.759559631347656, "global_step": 109067, "epoch": 901} {"train_loss": -36.26835250854492, "global_step": 109068, "epoch": 901} {"train_loss": -37.619110107421875, "global_step": 109069, "epoch": 901} {"train_loss": -37.59299850463867, "global_step": 109070, "epoch": 901} {"train_loss": -37.756996154785156, "global_step": 109071, "epoch": 901} {"train_loss": -36.39844512939453, "global_step": 109072, "epoch": 901} {"train_loss": -34.9194221496582, "global_step": 109073, "epoch": 901} {"train_loss": -35.880859375, "global_step": 109074, "epoch": 901} {"train_loss": -36.79429244995117, "global_step": 109075, "epoch": 901} {"train_loss": -36.5124397277832, "global_step": 109076, "epoch": 901} {"train_loss": -32.19215774536133, "global_step": 109077, "epoch": 901} {"train_loss": -32.64777755737305, "global_step": 109078, "epoch": 901} {"train_loss": -37.72771072387695, "global_step": 109079, "epoch": 901} {"train_loss": -35.22913360595703, "global_step": 109080, "epoch": 901} {"train_loss": -34.14381408691406, "global_step": 109081, "epoch": 901} {"train_loss": -38.2254638671875, "global_step": 109082, "epoch": 901} {"train_loss": -35.56941604614258, "global_step": 109083, "epoch": 901} {"train_loss": -37.9619026184082, "global_step": 109084, "epoch": 901} {"train_loss": -32.83378219604492, "global_step": 109085, "epoch": 901} {"train_loss": -37.27602767944336, "global_step": 109086, "epoch": 901} {"train_loss": -36.224090576171875, "global_step": 109087, "epoch": 901} {"train_loss": -37.89919662475586, "global_step": 109088, "epoch": 901} {"train_loss": -36.76158905029297, "global_step": 109089, "epoch": 901} {"train_loss": -38.163082122802734, "global_step": 109090, "epoch": 901} {"train_loss": -37.63783264160156, "global_step": 109091, "epoch": 901} {"train_loss": -35.89620590209961, "global_step": 109092, "epoch": 901} {"train_loss": -37.27616500854492, "global_step": 109093, "epoch": 901} {"train_loss": -36.801544189453125, "global_step": 109094, "epoch": 901} {"train_loss": -33.71918487548828, "global_step": 109095, "epoch": 901} {"train_loss": -37.75283432006836, "global_step": 109096, "epoch": 901} {"train_loss": -37.2080192565918, "global_step": 109097, "epoch": 901} {"train_loss": -37.15441131591797, "global_step": 109098, "epoch": 901} {"train_loss": -36.501216888427734, "global_step": 109099, "epoch": 901} {"train_loss": -35.737796783447266, "global_step": 109100, "epoch": 901} {"train_loss": -37.1702880859375, "global_step": 109101, "epoch": 901} {"train_loss": -36.04071044921875, "global_step": 109102, "epoch": 901} {"train_loss": -36.898590087890625, "global_step": 109103, "epoch": 901} {"train_loss": -34.8026237487793, "global_step": 109104, "epoch": 901} {"train_loss": -36.456024169921875, "global_step": 109105, "epoch": 901} {"train_loss": -37.32978820800781, "global_step": 109106, "epoch": 901} {"train_loss": -35.749732971191406, "global_step": 109107, "epoch": 901} {"train_loss": -35.641090393066406, "global_step": 109108, "epoch": 901} {"train_loss": -36.791114807128906, "global_step": 109109, "epoch": 901} {"train_loss": -37.4005126953125, "global_step": 109110, "epoch": 901} {"train_loss": -35.72826385498047, "global_step": 109111, "epoch": 901} {"train_loss": -37.32624435424805, "global_step": 109112, "epoch": 901} {"train_loss": -37.73960494995117, "global_step": 109113, "epoch": 901} {"train_loss": -36.73016357421875, "global_step": 109114, "epoch": 901} {"train_loss": -36.89323806762695, "global_step": 109115, "epoch": 901} {"train_loss": -36.2236328125, "global_step": 109116, "epoch": 901} {"train_loss": -36.659423828125, "global_step": 109117, "epoch": 901} {"train_loss": -37.16634750366211, "global_step": 109118, "epoch": 901} {"train_loss": -36.99824905395508, "global_step": 109119, "epoch": 901} {"train_loss": -36.3243293762207, "global_step": 109120, "epoch": 901} {"train_loss": -38.02524948120117, "global_step": 109121, "epoch": 901} {"train_loss": -37.72784423828125, "global_step": 109122, "epoch": 901} {"train_loss": -37.3709831237793, "global_step": 109123, "epoch": 901} {"train_loss": -37.94343566894531, "global_step": 109124, "epoch": 901} {"train_loss": -38.329627990722656, "global_step": 109125, "epoch": 901} {"train_loss": -37.55130386352539, "global_step": 109126, "epoch": 901} {"train_loss": -37.99203109741211, "global_step": 109127, "epoch": 901} {"train_loss": -37.7216796875, "global_step": 109128, "epoch": 901} {"train_loss": -38.247894287109375, "global_step": 109129, "epoch": 901} {"train_loss": -37.80219268798828, "global_step": 109130, "epoch": 901} {"train_loss": -37.05733871459961, "global_step": 109131, "epoch": 901} {"train_loss": -38.452232360839844, "global_step": 109132, "epoch": 901} {"train_loss": -37.885093688964844, "global_step": 109133, "epoch": 901} {"train_loss": -37.70663070678711, "global_step": 109134, "epoch": 901} {"train_loss": -38.49604415893555, "global_step": 109135, "epoch": 901} {"train_loss": -37.74066162109375, "global_step": 109136, "epoch": 901} {"train_loss": -37.85588073730469, "global_step": 109137, "epoch": 901} {"train_loss": -37.95107650756836, "global_step": 109138, "epoch": 901} {"train_loss": -38.111000061035156, "global_step": 109139, "epoch": 901} {"train_loss": -38.64227294921875, "global_step": 109140, "epoch": 901} {"train_loss": -37.2581338488366, "global_step": 109141, "epoch": 901, "val_loss": 2571591.25} {"train_loss": -37.6651496887207, "global_step": 109142, "epoch": 902} {"train_loss": -38.797264099121094, "global_step": 109143, "epoch": 902} {"train_loss": -38.17323684692383, "global_step": 109144, "epoch": 902} {"train_loss": -38.55466842651367, "global_step": 109145, "epoch": 902} {"train_loss": -37.851497650146484, "global_step": 109146, "epoch": 902} {"train_loss": -38.2875862121582, "global_step": 109147, "epoch": 902} {"train_loss": -38.592872619628906, "global_step": 109148, "epoch": 902} {"train_loss": -38.51272201538086, "global_step": 109149, "epoch": 902} {"train_loss": -37.96160125732422, "global_step": 109150, "epoch": 902} {"train_loss": -38.231380462646484, "global_step": 109151, "epoch": 902} {"train_loss": -38.61745071411133, "global_step": 109152, "epoch": 902} {"train_loss": -38.3399658203125, "global_step": 109153, "epoch": 902} {"train_loss": -38.17195510864258, "global_step": 109154, "epoch": 902} {"train_loss": -38.44816207885742, "global_step": 109155, "epoch": 902} {"train_loss": -38.65802764892578, "global_step": 109156, "epoch": 902} {"train_loss": -37.43088912963867, "global_step": 109157, "epoch": 902} {"train_loss": -38.675384521484375, "global_step": 109158, "epoch": 902} {"train_loss": -38.69172668457031, "global_step": 109159, "epoch": 902} {"train_loss": -38.606788635253906, "global_step": 109160, "epoch": 902} {"train_loss": -38.728214263916016, "global_step": 109161, "epoch": 902} {"train_loss": -38.48124313354492, "global_step": 109162, "epoch": 902} {"train_loss": -39.20347595214844, "global_step": 109163, "epoch": 902} {"train_loss": -38.355377197265625, "global_step": 109164, "epoch": 902} {"train_loss": -37.495399475097656, "global_step": 109165, "epoch": 902} {"train_loss": -33.69072341918945, "global_step": 109166, "epoch": 902} {"train_loss": -30.2719669342041, "global_step": 109167, "epoch": 902} {"train_loss": -26.788806915283203, "global_step": 109168, "epoch": 902} {"train_loss": -34.46883010864258, "global_step": 109169, "epoch": 902} {"train_loss": -37.1502799987793, "global_step": 109170, "epoch": 902} {"train_loss": -29.975204467773438, "global_step": 109171, "epoch": 902} {"train_loss": -37.23285675048828, "global_step": 109172, "epoch": 902} {"train_loss": -35.40058898925781, "global_step": 109173, "epoch": 902} {"train_loss": -35.724605560302734, "global_step": 109174, "epoch": 902} {"train_loss": -36.89094924926758, "global_step": 109175, "epoch": 902} {"train_loss": -34.7626838684082, "global_step": 109176, "epoch": 902} {"train_loss": -37.940765380859375, "global_step": 109177, "epoch": 902} {"train_loss": -36.736846923828125, "global_step": 109178, "epoch": 902} {"train_loss": -38.571380615234375, "global_step": 109179, "epoch": 902} {"train_loss": -36.780391693115234, "global_step": 109180, "epoch": 902} {"train_loss": -36.04085159301758, "global_step": 109181, "epoch": 902} {"train_loss": -36.91022872924805, "global_step": 109182, "epoch": 902} {"train_loss": -36.9010124206543, "global_step": 109183, "epoch": 902} {"train_loss": -37.82302474975586, "global_step": 109184, "epoch": 902} {"train_loss": -36.742862701416016, "global_step": 109185, "epoch": 902} {"train_loss": -37.816131591796875, "global_step": 109186, "epoch": 902} {"train_loss": -37.24311828613281, "global_step": 109187, "epoch": 902} {"train_loss": -37.039695739746094, "global_step": 109188, "epoch": 902} {"train_loss": -37.40194320678711, "global_step": 109189, "epoch": 902} {"train_loss": -37.801849365234375, "global_step": 109190, "epoch": 902} {"train_loss": -37.7209587097168, "global_step": 109191, "epoch": 902} {"train_loss": -37.46839141845703, "global_step": 109192, "epoch": 902} {"train_loss": -37.8674430847168, "global_step": 109193, "epoch": 902} {"train_loss": -37.182613372802734, "global_step": 109194, "epoch": 902} {"train_loss": -37.4581413269043, "global_step": 109195, "epoch": 902} {"train_loss": -36.77457046508789, "global_step": 109196, "epoch": 902} {"train_loss": -38.30339813232422, "global_step": 109197, "epoch": 902} {"train_loss": -37.21174240112305, "global_step": 109198, "epoch": 902} {"train_loss": -37.73125076293945, "global_step": 109199, "epoch": 902} {"train_loss": -36.983070373535156, "global_step": 109200, "epoch": 902} {"train_loss": -37.15449142456055, "global_step": 109201, "epoch": 902} {"train_loss": -38.080360412597656, "global_step": 109202, "epoch": 902} {"train_loss": -38.519317626953125, "global_step": 109203, "epoch": 902} {"train_loss": -37.446861267089844, "global_step": 109204, "epoch": 902} {"train_loss": -37.71590805053711, "global_step": 109205, "epoch": 902} {"train_loss": -38.54872512817383, "global_step": 109206, "epoch": 902} {"train_loss": -38.5267448425293, "global_step": 109207, "epoch": 902} {"train_loss": -38.204139709472656, "global_step": 109208, "epoch": 902} {"train_loss": -37.17951583862305, "global_step": 109209, "epoch": 902} {"train_loss": -38.12885665893555, "global_step": 109210, "epoch": 902} {"train_loss": -38.51189041137695, "global_step": 109211, "epoch": 902} {"train_loss": -35.72510528564453, "global_step": 109212, "epoch": 902} {"train_loss": -37.72132110595703, "global_step": 109213, "epoch": 902} {"train_loss": -37.362098693847656, "global_step": 109214, "epoch": 902} {"train_loss": -37.842308044433594, "global_step": 109215, "epoch": 902} {"train_loss": -37.392799377441406, "global_step": 109216, "epoch": 902} {"train_loss": -38.02252960205078, "global_step": 109217, "epoch": 902} {"train_loss": -38.09894943237305, "global_step": 109218, "epoch": 902} {"train_loss": -37.29641342163086, "global_step": 109219, "epoch": 902} {"train_loss": -34.43622970581055, "global_step": 109220, "epoch": 902} {"train_loss": -34.091861724853516, "global_step": 109221, "epoch": 902} {"train_loss": -38.14338302612305, "global_step": 109222, "epoch": 902} {"train_loss": -37.35805130004883, "global_step": 109223, "epoch": 902} {"train_loss": -38.2881965637207, "global_step": 109224, "epoch": 902} {"train_loss": -37.44944763183594, "global_step": 109225, "epoch": 902} {"train_loss": -35.95645523071289, "global_step": 109226, "epoch": 902} {"train_loss": -33.573455810546875, "global_step": 109227, "epoch": 902} {"train_loss": -36.51394271850586, "global_step": 109228, "epoch": 902} {"train_loss": -36.30534362792969, "global_step": 109229, "epoch": 902} {"train_loss": -36.50873947143555, "global_step": 109230, "epoch": 902} {"train_loss": -35.881935119628906, "global_step": 109231, "epoch": 902} {"train_loss": -35.55207443237305, "global_step": 109232, "epoch": 902} {"train_loss": -36.6596794128418, "global_step": 109233, "epoch": 902} {"train_loss": -36.5869255065918, "global_step": 109234, "epoch": 902} {"train_loss": -36.36336135864258, "global_step": 109235, "epoch": 902} {"train_loss": -34.280155181884766, "global_step": 109236, "epoch": 902} {"train_loss": -35.44466781616211, "global_step": 109237, "epoch": 902} {"train_loss": -36.58009719848633, "global_step": 109238, "epoch": 902} {"train_loss": -37.61692428588867, "global_step": 109239, "epoch": 902} {"train_loss": -37.842559814453125, "global_step": 109240, "epoch": 902} {"train_loss": -36.63450241088867, "global_step": 109241, "epoch": 902} {"train_loss": -35.72587203979492, "global_step": 109242, "epoch": 902} {"train_loss": -37.42196273803711, "global_step": 109243, "epoch": 902} {"train_loss": -38.00761795043945, "global_step": 109244, "epoch": 902} {"train_loss": -38.21087646484375, "global_step": 109245, "epoch": 902} {"train_loss": -37.93021774291992, "global_step": 109246, "epoch": 902} {"train_loss": -37.08477783203125, "global_step": 109247, "epoch": 902} {"train_loss": -37.97175979614258, "global_step": 109248, "epoch": 902} {"train_loss": -37.488521575927734, "global_step": 109249, "epoch": 902} {"train_loss": -37.18690872192383, "global_step": 109250, "epoch": 902} {"train_loss": -37.60371398925781, "global_step": 109251, "epoch": 902} {"train_loss": -38.194358825683594, "global_step": 109252, "epoch": 902} {"train_loss": -38.28522491455078, "global_step": 109253, "epoch": 902} {"train_loss": -38.249488830566406, "global_step": 109254, "epoch": 902} {"train_loss": -37.6832275390625, "global_step": 109255, "epoch": 902} {"train_loss": -38.491451263427734, "global_step": 109256, "epoch": 902} {"train_loss": -38.35456466674805, "global_step": 109257, "epoch": 902} {"train_loss": -37.68579864501953, "global_step": 109258, "epoch": 902} {"train_loss": -38.084774017333984, "global_step": 109259, "epoch": 902} {"train_loss": -37.40351486206055, "global_step": 109260, "epoch": 902} {"train_loss": -38.67255783081055, "global_step": 109261, "epoch": 902} {"train_loss": -37.176660348561185, "global_step": 109262, "epoch": 902, "val_loss": 2530327.75} {"train_loss": -37.39525604248047, "global_step": 109263, "epoch": 903} {"train_loss": -38.09830093383789, "global_step": 109264, "epoch": 903} {"train_loss": -38.38990020751953, "global_step": 109265, "epoch": 903} {"train_loss": -38.19756317138672, "global_step": 109266, "epoch": 903} {"train_loss": -37.21494674682617, "global_step": 109267, "epoch": 903} {"train_loss": -37.03862762451172, "global_step": 109268, "epoch": 903} {"train_loss": -37.799381256103516, "global_step": 109269, "epoch": 903} {"train_loss": -39.05493927001953, "global_step": 109270, "epoch": 903} {"train_loss": -36.97884750366211, "global_step": 109271, "epoch": 903} {"train_loss": -35.22931671142578, "global_step": 109272, "epoch": 903} {"train_loss": -37.082374572753906, "global_step": 109273, "epoch": 903} {"train_loss": -38.146297454833984, "global_step": 109274, "epoch": 903} {"train_loss": -36.907711029052734, "global_step": 109275, "epoch": 903} {"train_loss": -37.2071647644043, "global_step": 109276, "epoch": 903} {"train_loss": -38.966678619384766, "global_step": 109277, "epoch": 903} {"train_loss": -37.32039260864258, "global_step": 109278, "epoch": 903} {"train_loss": -37.76609420776367, "global_step": 109279, "epoch": 903} {"train_loss": -38.719173431396484, "global_step": 109280, "epoch": 903} {"train_loss": -38.26783752441406, "global_step": 109281, "epoch": 903} {"train_loss": -37.4902229309082, "global_step": 109282, "epoch": 903} {"train_loss": -36.53879928588867, "global_step": 109283, "epoch": 903} {"train_loss": -38.288082122802734, "global_step": 109284, "epoch": 903} {"train_loss": -36.695831298828125, "global_step": 109285, "epoch": 903} {"train_loss": -38.50284957885742, "global_step": 109286, "epoch": 903} {"train_loss": -36.18571472167969, "global_step": 109287, "epoch": 903} {"train_loss": -37.04922103881836, "global_step": 109288, "epoch": 903} {"train_loss": -38.780155181884766, "global_step": 109289, "epoch": 903} {"train_loss": -38.33940887451172, "global_step": 109290, "epoch": 903} {"train_loss": -38.491065979003906, "global_step": 109291, "epoch": 903} {"train_loss": -38.055721282958984, "global_step": 109292, "epoch": 903} {"train_loss": -38.13954544067383, "global_step": 109293, "epoch": 903} {"train_loss": -37.96269607543945, "global_step": 109294, "epoch": 903} {"train_loss": -37.88747787475586, "global_step": 109295, "epoch": 903} {"train_loss": -37.643611907958984, "global_step": 109296, "epoch": 903} {"train_loss": -37.46548080444336, "global_step": 109297, "epoch": 903} {"train_loss": -38.429359436035156, "global_step": 109298, "epoch": 903} {"train_loss": -38.75773239135742, "global_step": 109299, "epoch": 903} {"train_loss": -38.64738082885742, "global_step": 109300, "epoch": 903} {"train_loss": -39.015052795410156, "global_step": 109301, "epoch": 903} {"train_loss": -37.8912467956543, "global_step": 109302, "epoch": 903} {"train_loss": -37.14908981323242, "global_step": 109303, "epoch": 903} {"train_loss": -38.56638717651367, "global_step": 109304, "epoch": 903} {"train_loss": -37.74580001831055, "global_step": 109305, "epoch": 903} {"train_loss": -37.9495849609375, "global_step": 109306, "epoch": 903} {"train_loss": -38.27407455444336, "global_step": 109307, "epoch": 903} {"train_loss": -37.636741638183594, "global_step": 109308, "epoch": 903} {"train_loss": -38.7397575378418, "global_step": 109309, "epoch": 903} {"train_loss": -38.43647384643555, "global_step": 109310, "epoch": 903} {"train_loss": -37.452239990234375, "global_step": 109311, "epoch": 903} {"train_loss": -38.58647537231445, "global_step": 109312, "epoch": 903} {"train_loss": -37.77980041503906, "global_step": 109313, "epoch": 903} {"train_loss": -38.09616470336914, "global_step": 109314, "epoch": 903} {"train_loss": -38.12921905517578, "global_step": 109315, "epoch": 903} {"train_loss": -37.561981201171875, "global_step": 109316, "epoch": 903} {"train_loss": -37.980690002441406, "global_step": 109317, "epoch": 903} {"train_loss": -38.66117477416992, "global_step": 109318, "epoch": 903} {"train_loss": -38.94252395629883, "global_step": 109319, "epoch": 903} {"train_loss": -38.028621673583984, "global_step": 109320, "epoch": 903} {"train_loss": -37.935760498046875, "global_step": 109321, "epoch": 903} {"train_loss": -39.220333099365234, "global_step": 109322, "epoch": 903} {"train_loss": -38.04167556762695, "global_step": 109323, "epoch": 903} {"train_loss": -37.73137283325195, "global_step": 109324, "epoch": 903} {"train_loss": -38.855751037597656, "global_step": 109325, "epoch": 903} {"train_loss": -37.49873352050781, "global_step": 109326, "epoch": 903} {"train_loss": -37.120418548583984, "global_step": 109327, "epoch": 903} {"train_loss": -37.70695114135742, "global_step": 109328, "epoch": 903} {"train_loss": -37.396480560302734, "global_step": 109329, "epoch": 903} {"train_loss": -38.6179084777832, "global_step": 109330, "epoch": 903} {"train_loss": -38.28045654296875, "global_step": 109331, "epoch": 903} {"train_loss": -37.88104248046875, "global_step": 109332, "epoch": 903} {"train_loss": -38.141231536865234, "global_step": 109333, "epoch": 903} {"train_loss": -38.674068450927734, "global_step": 109334, "epoch": 903} {"train_loss": -38.828548431396484, "global_step": 109335, "epoch": 903} {"train_loss": -36.58295440673828, "global_step": 109336, "epoch": 903} {"train_loss": -37.248146057128906, "global_step": 109337, "epoch": 903} {"train_loss": -39.46138381958008, "global_step": 109338, "epoch": 903} {"train_loss": -38.92069625854492, "global_step": 109339, "epoch": 903} {"train_loss": -37.51836013793945, "global_step": 109340, "epoch": 903} {"train_loss": -39.29513168334961, "global_step": 109341, "epoch": 903} {"train_loss": -38.82451248168945, "global_step": 109342, "epoch": 903} {"train_loss": -38.969425201416016, "global_step": 109343, "epoch": 903} {"train_loss": -39.196346282958984, "global_step": 109344, "epoch": 903} {"train_loss": -37.221744537353516, "global_step": 109345, "epoch": 903} {"train_loss": -38.95452880859375, "global_step": 109346, "epoch": 903} {"train_loss": -39.5040283203125, "global_step": 109347, "epoch": 903} {"train_loss": -38.62765121459961, "global_step": 109348, "epoch": 903} {"train_loss": -38.1309928894043, "global_step": 109349, "epoch": 903} {"train_loss": -38.63484573364258, "global_step": 109350, "epoch": 903} {"train_loss": -37.50291061401367, "global_step": 109351, "epoch": 903} {"train_loss": -38.71798324584961, "global_step": 109352, "epoch": 903} {"train_loss": -37.05605697631836, "global_step": 109353, "epoch": 903} {"train_loss": -37.20038986206055, "global_step": 109354, "epoch": 903} {"train_loss": -37.791656494140625, "global_step": 109355, "epoch": 903} {"train_loss": -37.535560607910156, "global_step": 109356, "epoch": 903} {"train_loss": -37.612064361572266, "global_step": 109357, "epoch": 903} {"train_loss": -37.33879852294922, "global_step": 109358, "epoch": 903} {"train_loss": -38.62773132324219, "global_step": 109359, "epoch": 903} {"train_loss": -38.451839447021484, "global_step": 109360, "epoch": 903} {"train_loss": -36.7193603515625, "global_step": 109361, "epoch": 903} {"train_loss": -38.24606704711914, "global_step": 109362, "epoch": 903} {"train_loss": -37.80635452270508, "global_step": 109363, "epoch": 903} {"train_loss": -37.119876861572266, "global_step": 109364, "epoch": 903} {"train_loss": -38.95045852661133, "global_step": 109365, "epoch": 903} {"train_loss": -38.741119384765625, "global_step": 109366, "epoch": 903} {"train_loss": -38.3924560546875, "global_step": 109367, "epoch": 903} {"train_loss": -38.180233001708984, "global_step": 109368, "epoch": 903} {"train_loss": -38.9245719909668, "global_step": 109369, "epoch": 903} {"train_loss": -38.1224250793457, "global_step": 109370, "epoch": 903} {"train_loss": -37.6817626953125, "global_step": 109371, "epoch": 903} {"train_loss": -37.94509506225586, "global_step": 109372, "epoch": 903} {"train_loss": -38.310157775878906, "global_step": 109373, "epoch": 903} {"train_loss": -39.146297454833984, "global_step": 109374, "epoch": 903} {"train_loss": -39.25904083251953, "global_step": 109375, "epoch": 903} {"train_loss": -38.392677307128906, "global_step": 109376, "epoch": 903} {"train_loss": -36.74089431762695, "global_step": 109377, "epoch": 903} {"train_loss": -37.13477325439453, "global_step": 109378, "epoch": 903} {"train_loss": -38.455787658691406, "global_step": 109379, "epoch": 903} {"train_loss": -38.2460823059082, "global_step": 109380, "epoch": 903} {"train_loss": -37.68399429321289, "global_step": 109381, "epoch": 903} {"train_loss": -37.172401428222656, "global_step": 109382, "epoch": 903} {"train_loss": -38.01202660552726, "global_step": 109383, "epoch": 903, "val_loss": 2625466.5} {"train_loss": -38.74393844604492, "global_step": 109384, "epoch": 904} {"train_loss": -38.71192932128906, "global_step": 109385, "epoch": 904} {"train_loss": -34.54084014892578, "global_step": 109386, "epoch": 904} {"train_loss": -35.00679016113281, "global_step": 109387, "epoch": 904} {"train_loss": -37.2651481628418, "global_step": 109388, "epoch": 904} {"train_loss": -38.19165802001953, "global_step": 109389, "epoch": 904} {"train_loss": -36.15603256225586, "global_step": 109390, "epoch": 904} {"train_loss": -36.869178771972656, "global_step": 109391, "epoch": 904} {"train_loss": -37.225704193115234, "global_step": 109392, "epoch": 904} {"train_loss": -35.76752853393555, "global_step": 109393, "epoch": 904} {"train_loss": -37.13398742675781, "global_step": 109394, "epoch": 904} {"train_loss": -36.85017776489258, "global_step": 109395, "epoch": 904} {"train_loss": -38.63158416748047, "global_step": 109396, "epoch": 904} {"train_loss": -37.02878952026367, "global_step": 109397, "epoch": 904} {"train_loss": -38.07371139526367, "global_step": 109398, "epoch": 904} {"train_loss": -36.1666259765625, "global_step": 109399, "epoch": 904} {"train_loss": -37.8446159362793, "global_step": 109400, "epoch": 904} {"train_loss": -36.90355682373047, "global_step": 109401, "epoch": 904} {"train_loss": -37.55929183959961, "global_step": 109402, "epoch": 904} {"train_loss": -37.24225616455078, "global_step": 109403, "epoch": 904} {"train_loss": -35.81389617919922, "global_step": 109404, "epoch": 904} {"train_loss": -34.56678009033203, "global_step": 109405, "epoch": 904} {"train_loss": -37.65078353881836, "global_step": 109406, "epoch": 904} {"train_loss": -37.96059799194336, "global_step": 109407, "epoch": 904} {"train_loss": -38.32229995727539, "global_step": 109408, "epoch": 904} {"train_loss": -37.47091293334961, "global_step": 109409, "epoch": 904} {"train_loss": -38.667537689208984, "global_step": 109410, "epoch": 904} {"train_loss": -37.990421295166016, "global_step": 109411, "epoch": 904} {"train_loss": -38.926025390625, "global_step": 109412, "epoch": 904} {"train_loss": -38.791282653808594, "global_step": 109413, "epoch": 904} {"train_loss": -38.21674346923828, "global_step": 109414, "epoch": 904} {"train_loss": -37.19365310668945, "global_step": 109415, "epoch": 904} {"train_loss": -37.65682601928711, "global_step": 109416, "epoch": 904} {"train_loss": -37.47349166870117, "global_step": 109417, "epoch": 904} {"train_loss": -38.4521369934082, "global_step": 109418, "epoch": 904} {"train_loss": -37.6371955871582, "global_step": 109419, "epoch": 904} {"train_loss": -38.54389953613281, "global_step": 109420, "epoch": 904} {"train_loss": -39.28666687011719, "global_step": 109421, "epoch": 904} {"train_loss": -38.32465744018555, "global_step": 109422, "epoch": 904} {"train_loss": -37.95974349975586, "global_step": 109423, "epoch": 904} {"train_loss": -38.38399887084961, "global_step": 109424, "epoch": 904} {"train_loss": -38.36269760131836, "global_step": 109425, "epoch": 904} {"train_loss": -38.231868743896484, "global_step": 109426, "epoch": 904} {"train_loss": -38.534912109375, "global_step": 109427, "epoch": 904} {"train_loss": -39.428585052490234, "global_step": 109428, "epoch": 904} {"train_loss": -38.78327560424805, "global_step": 109429, "epoch": 904} {"train_loss": -38.52716064453125, "global_step": 109430, "epoch": 904} {"train_loss": -38.677467346191406, "global_step": 109431, "epoch": 904} {"train_loss": -39.23694610595703, "global_step": 109432, "epoch": 904} {"train_loss": -38.70981216430664, "global_step": 109433, "epoch": 904} {"train_loss": -37.39240646362305, "global_step": 109434, "epoch": 904} {"train_loss": -38.343868255615234, "global_step": 109435, "epoch": 904} {"train_loss": -38.00197982788086, "global_step": 109436, "epoch": 904} {"train_loss": -38.66584014892578, "global_step": 109437, "epoch": 904} {"train_loss": -38.23696517944336, "global_step": 109438, "epoch": 904} {"train_loss": -39.09298324584961, "global_step": 109439, "epoch": 904} {"train_loss": -38.72154235839844, "global_step": 109440, "epoch": 904} {"train_loss": -38.61027908325195, "global_step": 109441, "epoch": 904} {"train_loss": -37.54071807861328, "global_step": 109442, "epoch": 904} {"train_loss": -39.13261032104492, "global_step": 109443, "epoch": 904} {"train_loss": -37.7258186340332, "global_step": 109444, "epoch": 904} {"train_loss": -38.36692428588867, "global_step": 109445, "epoch": 904} {"train_loss": -38.617916107177734, "global_step": 109446, "epoch": 904} {"train_loss": -38.56777572631836, "global_step": 109447, "epoch": 904} {"train_loss": -37.851131439208984, "global_step": 109448, "epoch": 904} {"train_loss": -36.897640228271484, "global_step": 109449, "epoch": 904} {"train_loss": -37.891422271728516, "global_step": 109450, "epoch": 904} {"train_loss": -36.521114349365234, "global_step": 109451, "epoch": 904} {"train_loss": -33.18221664428711, "global_step": 109452, "epoch": 904} {"train_loss": -26.30494499206543, "global_step": 109453, "epoch": 904} {"train_loss": -20.5658016204834, "global_step": 109454, "epoch": 904} {"train_loss": -23.25487518310547, "global_step": 109455, "epoch": 904} {"train_loss": -35.83393096923828, "global_step": 109456, "epoch": 904} {"train_loss": -36.00084686279297, "global_step": 109457, "epoch": 904} {"train_loss": -34.83826446533203, "global_step": 109458, "epoch": 904} {"train_loss": -34.87937545776367, "global_step": 109459, "epoch": 904} {"train_loss": -35.954463958740234, "global_step": 109460, "epoch": 904} {"train_loss": -35.90142822265625, "global_step": 109461, "epoch": 904} {"train_loss": -36.965423583984375, "global_step": 109462, "epoch": 904} {"train_loss": -35.69826889038086, "global_step": 109463, "epoch": 904} {"train_loss": -37.61528396606445, "global_step": 109464, "epoch": 904} {"train_loss": -36.022850036621094, "global_step": 109465, "epoch": 904} {"train_loss": -36.66778564453125, "global_step": 109466, "epoch": 904} {"train_loss": -36.9788818359375, "global_step": 109467, "epoch": 904} {"train_loss": -37.54707717895508, "global_step": 109468, "epoch": 904} {"train_loss": -37.379188537597656, "global_step": 109469, "epoch": 904} {"train_loss": -36.948707580566406, "global_step": 109470, "epoch": 904} {"train_loss": -37.54286575317383, "global_step": 109471, "epoch": 904} {"train_loss": -37.610389709472656, "global_step": 109472, "epoch": 904} {"train_loss": -37.32255172729492, "global_step": 109473, "epoch": 904} {"train_loss": -36.9525146484375, "global_step": 109474, "epoch": 904} {"train_loss": -37.88566207885742, "global_step": 109475, "epoch": 904} {"train_loss": -36.75943374633789, "global_step": 109476, "epoch": 904} {"train_loss": -36.65161895751953, "global_step": 109477, "epoch": 904} {"train_loss": -36.86945724487305, "global_step": 109478, "epoch": 904} {"train_loss": -36.40977478027344, "global_step": 109479, "epoch": 904} {"train_loss": -38.09595489501953, "global_step": 109480, "epoch": 904} {"train_loss": -36.70522689819336, "global_step": 109481, "epoch": 904} {"train_loss": -35.14962387084961, "global_step": 109482, "epoch": 904} {"train_loss": -37.83580017089844, "global_step": 109483, "epoch": 904} {"train_loss": -37.42906951904297, "global_step": 109484, "epoch": 904} {"train_loss": -37.810428619384766, "global_step": 109485, "epoch": 904} {"train_loss": -35.14065170288086, "global_step": 109486, "epoch": 904} {"train_loss": -34.557857513427734, "global_step": 109487, "epoch": 904} {"train_loss": -38.171142578125, "global_step": 109488, "epoch": 904} {"train_loss": -37.99628829956055, "global_step": 109489, "epoch": 904} {"train_loss": -38.176055908203125, "global_step": 109490, "epoch": 904} {"train_loss": -36.40169906616211, "global_step": 109491, "epoch": 904} {"train_loss": -37.7913818359375, "global_step": 109492, "epoch": 904} {"train_loss": -37.47473907470703, "global_step": 109493, "epoch": 904} {"train_loss": -38.09098434448242, "global_step": 109494, "epoch": 904} {"train_loss": -36.80659484863281, "global_step": 109495, "epoch": 904} {"train_loss": -37.82600021362305, "global_step": 109496, "epoch": 904} {"train_loss": -38.008480072021484, "global_step": 109497, "epoch": 904} {"train_loss": -37.0275993347168, "global_step": 109498, "epoch": 904} {"train_loss": -36.4148063659668, "global_step": 109499, "epoch": 904} {"train_loss": -37.779815673828125, "global_step": 109500, "epoch": 904} {"train_loss": -37.906776428222656, "global_step": 109501, "epoch": 904} {"train_loss": -37.7136344909668, "global_step": 109502, "epoch": 904} {"train_loss": -38.57713317871094, "global_step": 109503, "epoch": 904} {"train_loss": -37.08427873721793, "global_step": 109504, "epoch": 904, "val_loss": 2594188.75} {"train_loss": -37.983001708984375, "global_step": 109505, "epoch": 905} {"train_loss": -37.01557540893555, "global_step": 109506, "epoch": 905} {"train_loss": -38.65495681762695, "global_step": 109507, "epoch": 905} {"train_loss": -38.14411163330078, "global_step": 109508, "epoch": 905} {"train_loss": -37.95176315307617, "global_step": 109509, "epoch": 905} {"train_loss": -38.765541076660156, "global_step": 109510, "epoch": 905} {"train_loss": -38.256813049316406, "global_step": 109511, "epoch": 905} {"train_loss": -38.79347229003906, "global_step": 109512, "epoch": 905} {"train_loss": -38.77802276611328, "global_step": 109513, "epoch": 905} {"train_loss": -38.01317596435547, "global_step": 109514, "epoch": 905} {"train_loss": -37.635826110839844, "global_step": 109515, "epoch": 905} {"train_loss": -38.772464752197266, "global_step": 109516, "epoch": 905} {"train_loss": -36.86166000366211, "global_step": 109517, "epoch": 905} {"train_loss": -38.15692901611328, "global_step": 109518, "epoch": 905} {"train_loss": -38.723915100097656, "global_step": 109519, "epoch": 905} {"train_loss": -39.05867385864258, "global_step": 109520, "epoch": 905} {"train_loss": -37.33920669555664, "global_step": 109521, "epoch": 905} {"train_loss": -38.38459014892578, "global_step": 109522, "epoch": 905} {"train_loss": -38.50167465209961, "global_step": 109523, "epoch": 905} {"train_loss": -38.944759368896484, "global_step": 109524, "epoch": 905} {"train_loss": -38.39003372192383, "global_step": 109525, "epoch": 905} {"train_loss": -37.81108856201172, "global_step": 109526, "epoch": 905} {"train_loss": -38.13776397705078, "global_step": 109527, "epoch": 905} {"train_loss": -39.009498596191406, "global_step": 109528, "epoch": 905} {"train_loss": -38.87395095825195, "global_step": 109529, "epoch": 905} {"train_loss": -38.5807991027832, "global_step": 109530, "epoch": 905} {"train_loss": -37.90645980834961, "global_step": 109531, "epoch": 905} {"train_loss": -36.80263137817383, "global_step": 109532, "epoch": 905} {"train_loss": -35.598876953125, "global_step": 109533, "epoch": 905} {"train_loss": -37.96904373168945, "global_step": 109534, "epoch": 905} {"train_loss": -37.874717712402344, "global_step": 109535, "epoch": 905} {"train_loss": -36.58109664916992, "global_step": 109536, "epoch": 905} {"train_loss": -37.38705062866211, "global_step": 109537, "epoch": 905} {"train_loss": -37.80721664428711, "global_step": 109538, "epoch": 905} {"train_loss": -38.96733474731445, "global_step": 109539, "epoch": 905} {"train_loss": -38.25262451171875, "global_step": 109540, "epoch": 905} {"train_loss": -37.83382797241211, "global_step": 109541, "epoch": 905} {"train_loss": -38.06577682495117, "global_step": 109542, "epoch": 905} {"train_loss": -38.68571472167969, "global_step": 109543, "epoch": 905} {"train_loss": -38.78257369995117, "global_step": 109544, "epoch": 905} {"train_loss": -37.61109161376953, "global_step": 109545, "epoch": 905} {"train_loss": -38.1799430847168, "global_step": 109546, "epoch": 905} {"train_loss": -37.75613784790039, "global_step": 109547, "epoch": 905} {"train_loss": -37.99269104003906, "global_step": 109548, "epoch": 905} {"train_loss": -38.52953338623047, "global_step": 109549, "epoch": 905} {"train_loss": -38.18180847167969, "global_step": 109550, "epoch": 905} {"train_loss": -38.332359313964844, "global_step": 109551, "epoch": 905} {"train_loss": -37.76374435424805, "global_step": 109552, "epoch": 905} {"train_loss": -38.86587142944336, "global_step": 109553, "epoch": 905} {"train_loss": -38.73616409301758, "global_step": 109554, "epoch": 905} {"train_loss": -38.81339645385742, "global_step": 109555, "epoch": 905} {"train_loss": -37.26164245605469, "global_step": 109556, "epoch": 905} {"train_loss": -37.9862174987793, "global_step": 109557, "epoch": 905} {"train_loss": -38.649879455566406, "global_step": 109558, "epoch": 905} {"train_loss": -38.50806427001953, "global_step": 109559, "epoch": 905} {"train_loss": -39.136680603027344, "global_step": 109560, "epoch": 905} {"train_loss": -38.842811584472656, "global_step": 109561, "epoch": 905} {"train_loss": -39.02896499633789, "global_step": 109562, "epoch": 905} {"train_loss": -38.74776840209961, "global_step": 109563, "epoch": 905} {"train_loss": -37.5841178894043, "global_step": 109564, "epoch": 905} {"train_loss": -39.24285888671875, "global_step": 109565, "epoch": 905} {"train_loss": -39.19668960571289, "global_step": 109566, "epoch": 905} {"train_loss": -38.457313537597656, "global_step": 109567, "epoch": 905} {"train_loss": -37.43083572387695, "global_step": 109568, "epoch": 905} {"train_loss": -37.71535873413086, "global_step": 109569, "epoch": 905} {"train_loss": -37.354793548583984, "global_step": 109570, "epoch": 905} {"train_loss": -38.5015754699707, "global_step": 109571, "epoch": 905} {"train_loss": -38.68672561645508, "global_step": 109572, "epoch": 905} {"train_loss": -38.11894607543945, "global_step": 109573, "epoch": 905} {"train_loss": -38.65183639526367, "global_step": 109574, "epoch": 905} {"train_loss": -37.81699752807617, "global_step": 109575, "epoch": 905} {"train_loss": -38.23917770385742, "global_step": 109576, "epoch": 905} {"train_loss": -32.37699508666992, "global_step": 109577, "epoch": 905} {"train_loss": -35.6547966003418, "global_step": 109578, "epoch": 905} {"train_loss": -37.22248077392578, "global_step": 109579, "epoch": 905} {"train_loss": -37.29492950439453, "global_step": 109580, "epoch": 905} {"train_loss": -36.53419876098633, "global_step": 109581, "epoch": 905} {"train_loss": -36.79945755004883, "global_step": 109582, "epoch": 905} {"train_loss": -38.45937728881836, "global_step": 109583, "epoch": 905} {"train_loss": -37.51884078979492, "global_step": 109584, "epoch": 905} {"train_loss": -35.04088592529297, "global_step": 109585, "epoch": 905} {"train_loss": -37.681758880615234, "global_step": 109586, "epoch": 905} {"train_loss": -38.2341423034668, "global_step": 109587, "epoch": 905} {"train_loss": -38.291744232177734, "global_step": 109588, "epoch": 905} {"train_loss": -36.96803665161133, "global_step": 109589, "epoch": 905} {"train_loss": -37.13668441772461, "global_step": 109590, "epoch": 905} {"train_loss": -37.85768127441406, "global_step": 109591, "epoch": 905} {"train_loss": -38.39223098754883, "global_step": 109592, "epoch": 905} {"train_loss": -36.1218376159668, "global_step": 109593, "epoch": 905} {"train_loss": -38.25613021850586, "global_step": 109594, "epoch": 905} {"train_loss": -36.817317962646484, "global_step": 109595, "epoch": 905} {"train_loss": -38.3029670715332, "global_step": 109596, "epoch": 905} {"train_loss": -37.77559280395508, "global_step": 109597, "epoch": 905} {"train_loss": -37.358497619628906, "global_step": 109598, "epoch": 905} {"train_loss": -37.48130416870117, "global_step": 109599, "epoch": 905} {"train_loss": -35.70171356201172, "global_step": 109600, "epoch": 905} {"train_loss": -37.90236282348633, "global_step": 109601, "epoch": 905} {"train_loss": -37.41031265258789, "global_step": 109602, "epoch": 905} {"train_loss": -37.80333709716797, "global_step": 109603, "epoch": 905} {"train_loss": -37.24435043334961, "global_step": 109604, "epoch": 905} {"train_loss": -36.61682891845703, "global_step": 109605, "epoch": 905} {"train_loss": -36.08376693725586, "global_step": 109606, "epoch": 905} {"train_loss": -38.39457702636719, "global_step": 109607, "epoch": 905} {"train_loss": -37.578182220458984, "global_step": 109608, "epoch": 905} {"train_loss": -38.656219482421875, "global_step": 109609, "epoch": 905} {"train_loss": -37.74240493774414, "global_step": 109610, "epoch": 905} {"train_loss": -38.373104095458984, "global_step": 109611, "epoch": 905} {"train_loss": -38.1401481628418, "global_step": 109612, "epoch": 905} {"train_loss": -37.57880401611328, "global_step": 109613, "epoch": 905} {"train_loss": -38.0461311340332, "global_step": 109614, "epoch": 905} {"train_loss": -38.35065841674805, "global_step": 109615, "epoch": 905} {"train_loss": -38.02095031738281, "global_step": 109616, "epoch": 905} {"train_loss": -37.72178649902344, "global_step": 109617, "epoch": 905} {"train_loss": -37.326908111572266, "global_step": 109618, "epoch": 905} {"train_loss": -38.25028991699219, "global_step": 109619, "epoch": 905} {"train_loss": -38.21335220336914, "global_step": 109620, "epoch": 905} {"train_loss": -38.925209045410156, "global_step": 109621, "epoch": 905} {"train_loss": -38.105892181396484, "global_step": 109622, "epoch": 905} {"train_loss": -37.76192855834961, "global_step": 109623, "epoch": 905} {"train_loss": -38.362613677978516, "global_step": 109624, "epoch": 905} {"train_loss": -37.90000042245408, "global_step": 109625, "epoch": 905, "val_loss": 2715552.25} {"train_loss": -38.39553451538086, "global_step": 109626, "epoch": 906} {"train_loss": -38.947933197021484, "global_step": 109627, "epoch": 906} {"train_loss": -38.82818603515625, "global_step": 109628, "epoch": 906} {"train_loss": -38.58278274536133, "global_step": 109629, "epoch": 906} {"train_loss": -36.53205108642578, "global_step": 109630, "epoch": 906} {"train_loss": -38.695655822753906, "global_step": 109631, "epoch": 906} {"train_loss": -38.85565948486328, "global_step": 109632, "epoch": 906} {"train_loss": -38.7937126159668, "global_step": 109633, "epoch": 906} {"train_loss": -36.708740234375, "global_step": 109634, "epoch": 906} {"train_loss": -37.79434585571289, "global_step": 109635, "epoch": 906} {"train_loss": -38.4817008972168, "global_step": 109636, "epoch": 906} {"train_loss": -37.033023834228516, "global_step": 109637, "epoch": 906} {"train_loss": -36.23748016357422, "global_step": 109638, "epoch": 906} {"train_loss": -37.1379280090332, "global_step": 109639, "epoch": 906} {"train_loss": -37.332000732421875, "global_step": 109640, "epoch": 906} {"train_loss": -36.36933898925781, "global_step": 109641, "epoch": 906} {"train_loss": -38.395015716552734, "global_step": 109642, "epoch": 906} {"train_loss": -33.553096771240234, "global_step": 109643, "epoch": 906} {"train_loss": -38.38582992553711, "global_step": 109644, "epoch": 906} {"train_loss": -37.886749267578125, "global_step": 109645, "epoch": 906} {"train_loss": -37.67205047607422, "global_step": 109646, "epoch": 906} {"train_loss": -36.679115295410156, "global_step": 109647, "epoch": 906} {"train_loss": -38.212432861328125, "global_step": 109648, "epoch": 906} {"train_loss": -38.45930099487305, "global_step": 109649, "epoch": 906} {"train_loss": -36.96884536743164, "global_step": 109650, "epoch": 906} {"train_loss": -36.94282150268555, "global_step": 109651, "epoch": 906} {"train_loss": -37.579254150390625, "global_step": 109652, "epoch": 906} {"train_loss": -36.074073791503906, "global_step": 109653, "epoch": 906} {"train_loss": -38.0538330078125, "global_step": 109654, "epoch": 906} {"train_loss": -33.4433479309082, "global_step": 109655, "epoch": 906} {"train_loss": -35.50460433959961, "global_step": 109656, "epoch": 906} {"train_loss": -37.51505661010742, "global_step": 109657, "epoch": 906} {"train_loss": -34.443973541259766, "global_step": 109658, "epoch": 906} {"train_loss": -33.11102294921875, "global_step": 109659, "epoch": 906} {"train_loss": -35.876522064208984, "global_step": 109660, "epoch": 906} {"train_loss": -29.812030792236328, "global_step": 109661, "epoch": 906} {"train_loss": -29.220853805541992, "global_step": 109662, "epoch": 906} {"train_loss": -34.26422882080078, "global_step": 109663, "epoch": 906} {"train_loss": -31.366989135742188, "global_step": 109664, "epoch": 906} {"train_loss": -33.1108512878418, "global_step": 109665, "epoch": 906} {"train_loss": -32.46510696411133, "global_step": 109666, "epoch": 906} {"train_loss": -34.220516204833984, "global_step": 109667, "epoch": 906} {"train_loss": -30.21388816833496, "global_step": 109668, "epoch": 906} {"train_loss": -32.49330139160156, "global_step": 109669, "epoch": 906} {"train_loss": -31.176855087280273, "global_step": 109670, "epoch": 906} {"train_loss": -30.951343536376953, "global_step": 109671, "epoch": 906} {"train_loss": -33.56690216064453, "global_step": 109672, "epoch": 906} {"train_loss": -32.93845748901367, "global_step": 109673, "epoch": 906} {"train_loss": -34.65176773071289, "global_step": 109674, "epoch": 906} {"train_loss": -35.24294662475586, "global_step": 109675, "epoch": 906} {"train_loss": -33.68967056274414, "global_step": 109676, "epoch": 906} {"train_loss": -34.729774475097656, "global_step": 109677, "epoch": 906} {"train_loss": -34.218074798583984, "global_step": 109678, "epoch": 906} {"train_loss": -35.089229583740234, "global_step": 109679, "epoch": 906} {"train_loss": -33.25243377685547, "global_step": 109680, "epoch": 906} {"train_loss": -33.2009162902832, "global_step": 109681, "epoch": 906} {"train_loss": -33.92591094970703, "global_step": 109682, "epoch": 906} {"train_loss": -32.987266540527344, "global_step": 109683, "epoch": 906} {"train_loss": -32.578060150146484, "global_step": 109684, "epoch": 906} {"train_loss": -34.545467376708984, "global_step": 109685, "epoch": 906} {"train_loss": -34.030426025390625, "global_step": 109686, "epoch": 906} {"train_loss": -34.83651351928711, "global_step": 109687, "epoch": 906} {"train_loss": -35.43294906616211, "global_step": 109688, "epoch": 906} {"train_loss": -35.90339279174805, "global_step": 109689, "epoch": 906} {"train_loss": -35.51546096801758, "global_step": 109690, "epoch": 906} {"train_loss": -34.57836151123047, "global_step": 109691, "epoch": 906} {"train_loss": -34.67112350463867, "global_step": 109692, "epoch": 906} {"train_loss": -36.09902572631836, "global_step": 109693, "epoch": 906} {"train_loss": -35.061492919921875, "global_step": 109694, "epoch": 906} {"train_loss": -35.87104034423828, "global_step": 109695, "epoch": 906} {"train_loss": -36.24221420288086, "global_step": 109696, "epoch": 906} {"train_loss": -36.229061126708984, "global_step": 109697, "epoch": 906} {"train_loss": -36.169551849365234, "global_step": 109698, "epoch": 906} {"train_loss": -36.38363265991211, "global_step": 109699, "epoch": 906} {"train_loss": -35.862606048583984, "global_step": 109700, "epoch": 906} {"train_loss": -36.765350341796875, "global_step": 109701, "epoch": 906} {"train_loss": -36.42559814453125, "global_step": 109702, "epoch": 906} {"train_loss": -36.21969223022461, "global_step": 109703, "epoch": 906} {"train_loss": -36.0091552734375, "global_step": 109704, "epoch": 906} {"train_loss": -37.08757400512695, "global_step": 109705, "epoch": 906} {"train_loss": -36.27166748046875, "global_step": 109706, "epoch": 906} {"train_loss": -36.598609924316406, "global_step": 109707, "epoch": 906} {"train_loss": -36.52498245239258, "global_step": 109708, "epoch": 906} {"train_loss": -37.091644287109375, "global_step": 109709, "epoch": 906} {"train_loss": -37.22765350341797, "global_step": 109710, "epoch": 906} {"train_loss": -36.97772979736328, "global_step": 109711, "epoch": 906} {"train_loss": -36.76566696166992, "global_step": 109712, "epoch": 906} {"train_loss": -37.24197006225586, "global_step": 109713, "epoch": 906} {"train_loss": -37.32343673706055, "global_step": 109714, "epoch": 906} {"train_loss": -37.40452194213867, "global_step": 109715, "epoch": 906} {"train_loss": -37.26932907104492, "global_step": 109716, "epoch": 906} {"train_loss": -37.28689193725586, "global_step": 109717, "epoch": 906} {"train_loss": -37.40195846557617, "global_step": 109718, "epoch": 906} {"train_loss": -37.16135787963867, "global_step": 109719, "epoch": 906} {"train_loss": -37.8855094909668, "global_step": 109720, "epoch": 906} {"train_loss": -37.47206115722656, "global_step": 109721, "epoch": 906} {"train_loss": -37.569252014160156, "global_step": 109722, "epoch": 906} {"train_loss": -37.61177062988281, "global_step": 109723, "epoch": 906} {"train_loss": -37.73676681518555, "global_step": 109724, "epoch": 906} {"train_loss": -37.612144470214844, "global_step": 109725, "epoch": 906} {"train_loss": -37.70489501953125, "global_step": 109726, "epoch": 906} {"train_loss": -37.63388442993164, "global_step": 109727, "epoch": 906} {"train_loss": -37.71858215332031, "global_step": 109728, "epoch": 906} {"train_loss": -38.2169189453125, "global_step": 109729, "epoch": 906} {"train_loss": -37.50051498413086, "global_step": 109730, "epoch": 906} {"train_loss": -38.15108108520508, "global_step": 109731, "epoch": 906} {"train_loss": -37.806087493896484, "global_step": 109732, "epoch": 906} {"train_loss": -38.02836227416992, "global_step": 109733, "epoch": 906} {"train_loss": -37.86616134643555, "global_step": 109734, "epoch": 906} {"train_loss": -38.177005767822266, "global_step": 109735, "epoch": 906} {"train_loss": -37.49135971069336, "global_step": 109736, "epoch": 906} {"train_loss": -37.8753547668457, "global_step": 109737, "epoch": 906} {"train_loss": -37.64533996582031, "global_step": 109738, "epoch": 906} {"train_loss": -38.09814453125, "global_step": 109739, "epoch": 906} {"train_loss": -38.23407745361328, "global_step": 109740, "epoch": 906} {"train_loss": -38.46981430053711, "global_step": 109741, "epoch": 906} {"train_loss": -37.34010696411133, "global_step": 109742, "epoch": 906} {"train_loss": -37.65938949584961, "global_step": 109743, "epoch": 906} {"train_loss": -37.31466293334961, "global_step": 109744, "epoch": 906} {"train_loss": -38.06650924682617, "global_step": 109745, "epoch": 906} {"train_loss": -36.18499978120662, "global_step": 109746, "epoch": 906, "val_loss": 2515493.0} {"train_loss": -38.07863235473633, "global_step": 109747, "epoch": 907} {"train_loss": -38.71825408935547, "global_step": 109748, "epoch": 907} {"train_loss": -38.59720993041992, "global_step": 109749, "epoch": 907} {"train_loss": -37.80369186401367, "global_step": 109750, "epoch": 907} {"train_loss": -37.9351921081543, "global_step": 109751, "epoch": 907} {"train_loss": -38.01044845581055, "global_step": 109752, "epoch": 907} {"train_loss": -38.32435989379883, "global_step": 109753, "epoch": 907} {"train_loss": -38.5168571472168, "global_step": 109754, "epoch": 907} {"train_loss": -38.880367279052734, "global_step": 109755, "epoch": 907} {"train_loss": -38.77616500854492, "global_step": 109756, "epoch": 907} {"train_loss": -38.61075973510742, "global_step": 109757, "epoch": 907} {"train_loss": -38.57918930053711, "global_step": 109758, "epoch": 907} {"train_loss": -38.87445831298828, "global_step": 109759, "epoch": 907} {"train_loss": -39.13004684448242, "global_step": 109760, "epoch": 907} {"train_loss": -38.77374267578125, "global_step": 109761, "epoch": 907} {"train_loss": -39.153541564941406, "global_step": 109762, "epoch": 907} {"train_loss": -39.280582427978516, "global_step": 109763, "epoch": 907} {"train_loss": -38.8623046875, "global_step": 109764, "epoch": 907} {"train_loss": -38.868309020996094, "global_step": 109765, "epoch": 907} {"train_loss": -38.802154541015625, "global_step": 109766, "epoch": 907} {"train_loss": -39.16605758666992, "global_step": 109767, "epoch": 907} {"train_loss": -39.24212646484375, "global_step": 109768, "epoch": 907} {"train_loss": -39.53718948364258, "global_step": 109769, "epoch": 907} {"train_loss": -38.613643646240234, "global_step": 109770, "epoch": 907} {"train_loss": -39.31007766723633, "global_step": 109771, "epoch": 907} {"train_loss": -38.971473693847656, "global_step": 109772, "epoch": 907} {"train_loss": -39.23004150390625, "global_step": 109773, "epoch": 907} {"train_loss": -38.852569580078125, "global_step": 109774, "epoch": 907} {"train_loss": -38.46058654785156, "global_step": 109775, "epoch": 907} {"train_loss": -38.657135009765625, "global_step": 109776, "epoch": 907} {"train_loss": -39.61328125, "global_step": 109777, "epoch": 907} {"train_loss": -38.6929817199707, "global_step": 109778, "epoch": 907} {"train_loss": -37.56565856933594, "global_step": 109779, "epoch": 907} {"train_loss": -33.93020248413086, "global_step": 109780, "epoch": 907} {"train_loss": -28.601892471313477, "global_step": 109781, "epoch": 907} {"train_loss": -29.699161529541016, "global_step": 109782, "epoch": 907} {"train_loss": -37.244991302490234, "global_step": 109783, "epoch": 907} {"train_loss": -37.7656364440918, "global_step": 109784, "epoch": 907} {"train_loss": -34.356014251708984, "global_step": 109785, "epoch": 907} {"train_loss": -37.362117767333984, "global_step": 109786, "epoch": 907} {"train_loss": -37.384857177734375, "global_step": 109787, "epoch": 907} {"train_loss": -35.67753601074219, "global_step": 109788, "epoch": 907} {"train_loss": -38.405208587646484, "global_step": 109789, "epoch": 907} {"train_loss": -35.43699264526367, "global_step": 109790, "epoch": 907} {"train_loss": -36.8584098815918, "global_step": 109791, "epoch": 907} {"train_loss": -37.459136962890625, "global_step": 109792, "epoch": 907} {"train_loss": -37.91612243652344, "global_step": 109793, "epoch": 907} {"train_loss": -37.325984954833984, "global_step": 109794, "epoch": 907} {"train_loss": -37.59904098510742, "global_step": 109795, "epoch": 907} {"train_loss": -38.135528564453125, "global_step": 109796, "epoch": 907} {"train_loss": -36.58668899536133, "global_step": 109797, "epoch": 907} {"train_loss": -38.318115234375, "global_step": 109798, "epoch": 907} {"train_loss": -37.27267074584961, "global_step": 109799, "epoch": 907} {"train_loss": -37.411338806152344, "global_step": 109800, "epoch": 907} {"train_loss": -37.658111572265625, "global_step": 109801, "epoch": 907} {"train_loss": -38.18925476074219, "global_step": 109802, "epoch": 907} {"train_loss": -37.56670379638672, "global_step": 109803, "epoch": 907} {"train_loss": -38.25102996826172, "global_step": 109804, "epoch": 907} {"train_loss": -38.407264709472656, "global_step": 109805, "epoch": 907} {"train_loss": -37.57395553588867, "global_step": 109806, "epoch": 907} {"train_loss": -37.03054428100586, "global_step": 109807, "epoch": 907} {"train_loss": -35.98200225830078, "global_step": 109808, "epoch": 907} {"train_loss": -37.26252365112305, "global_step": 109809, "epoch": 907} {"train_loss": -37.44658279418945, "global_step": 109810, "epoch": 907} {"train_loss": -36.2369384765625, "global_step": 109811, "epoch": 907} {"train_loss": -36.937095642089844, "global_step": 109812, "epoch": 907} {"train_loss": -38.340145111083984, "global_step": 109813, "epoch": 907} {"train_loss": -37.19414138793945, "global_step": 109814, "epoch": 907} {"train_loss": -38.026763916015625, "global_step": 109815, "epoch": 907} {"train_loss": -38.5721321105957, "global_step": 109816, "epoch": 907} {"train_loss": -38.28335189819336, "global_step": 109817, "epoch": 907} {"train_loss": -38.76355743408203, "global_step": 109818, "epoch": 907} {"train_loss": -38.21578598022461, "global_step": 109819, "epoch": 907} {"train_loss": -37.56350326538086, "global_step": 109820, "epoch": 907} {"train_loss": -38.027809143066406, "global_step": 109821, "epoch": 907} {"train_loss": -37.99052810668945, "global_step": 109822, "epoch": 907} {"train_loss": -37.998165130615234, "global_step": 109823, "epoch": 907} {"train_loss": -38.68109130859375, "global_step": 109824, "epoch": 907} {"train_loss": -36.7697868347168, "global_step": 109825, "epoch": 907} {"train_loss": -37.61773681640625, "global_step": 109826, "epoch": 907} {"train_loss": -38.22705078125, "global_step": 109827, "epoch": 907} {"train_loss": -38.36927032470703, "global_step": 109828, "epoch": 907} {"train_loss": -38.106231689453125, "global_step": 109829, "epoch": 907} {"train_loss": -37.7355842590332, "global_step": 109830, "epoch": 907} {"train_loss": -36.634803771972656, "global_step": 109831, "epoch": 907} {"train_loss": -38.55256652832031, "global_step": 109832, "epoch": 907} {"train_loss": -38.16817855834961, "global_step": 109833, "epoch": 907} {"train_loss": -38.05318832397461, "global_step": 109834, "epoch": 907} {"train_loss": -37.637142181396484, "global_step": 109835, "epoch": 907} {"train_loss": -38.281707763671875, "global_step": 109836, "epoch": 907} {"train_loss": -38.62033462524414, "global_step": 109837, "epoch": 907} {"train_loss": -38.793121337890625, "global_step": 109838, "epoch": 907} {"train_loss": -37.01984405517578, "global_step": 109839, "epoch": 907} {"train_loss": -38.957637786865234, "global_step": 109840, "epoch": 907} {"train_loss": -38.42646026611328, "global_step": 109841, "epoch": 907} {"train_loss": -38.47770690917969, "global_step": 109842, "epoch": 907} {"train_loss": -38.85841369628906, "global_step": 109843, "epoch": 907} {"train_loss": -37.61510467529297, "global_step": 109844, "epoch": 907} {"train_loss": -37.37345504760742, "global_step": 109845, "epoch": 907} {"train_loss": -38.91908264160156, "global_step": 109846, "epoch": 907} {"train_loss": -37.48503494262695, "global_step": 109847, "epoch": 907} {"train_loss": -35.81337356567383, "global_step": 109848, "epoch": 907} {"train_loss": -38.650390625, "global_step": 109849, "epoch": 907} {"train_loss": -37.560482025146484, "global_step": 109850, "epoch": 907} {"train_loss": -36.22152328491211, "global_step": 109851, "epoch": 907} {"train_loss": -37.09950256347656, "global_step": 109852, "epoch": 907} {"train_loss": -38.14348220825195, "global_step": 109853, "epoch": 907} {"train_loss": -37.523712158203125, "global_step": 109854, "epoch": 907} {"train_loss": -36.558692932128906, "global_step": 109855, "epoch": 907} {"train_loss": -37.3451042175293, "global_step": 109856, "epoch": 907} {"train_loss": -37.44710922241211, "global_step": 109857, "epoch": 907} {"train_loss": -36.57067108154297, "global_step": 109858, "epoch": 907} {"train_loss": -36.55531692504883, "global_step": 109859, "epoch": 907} {"train_loss": -36.28508758544922, "global_step": 109860, "epoch": 907} {"train_loss": -38.51942825317383, "global_step": 109861, "epoch": 907} {"train_loss": -38.0300407409668, "global_step": 109862, "epoch": 907} {"train_loss": -38.00392532348633, "global_step": 109863, "epoch": 907} {"train_loss": -38.39425277709961, "global_step": 109864, "epoch": 907} {"train_loss": -13.101452827453613, "global_step": 109865, "epoch": 907} {"train_loss": -34.4660758972168, "global_step": 109866, "epoch": 907} {"train_loss": -37.483183986884505, "global_step": 109867, "epoch": 907, "val_loss": 2578602.75} {"train_loss": -32.285221099853516, "global_step": 109868, "epoch": 908} {"train_loss": -23.63797378540039, "global_step": 109869, "epoch": 908} {"train_loss": -33.87911605834961, "global_step": 109870, "epoch": 908} {"train_loss": -35.364288330078125, "global_step": 109871, "epoch": 908} {"train_loss": -30.769697189331055, "global_step": 109872, "epoch": 908} {"train_loss": -34.37763595581055, "global_step": 109873, "epoch": 908} {"train_loss": -31.315174102783203, "global_step": 109874, "epoch": 908} {"train_loss": -34.63108444213867, "global_step": 109875, "epoch": 908} {"train_loss": -33.559783935546875, "global_step": 109876, "epoch": 908} {"train_loss": -34.52064514160156, "global_step": 109877, "epoch": 908} {"train_loss": -35.362831115722656, "global_step": 109878, "epoch": 908} {"train_loss": -34.49677658081055, "global_step": 109879, "epoch": 908} {"train_loss": -35.697654724121094, "global_step": 109880, "epoch": 908} {"train_loss": -33.1265754699707, "global_step": 109881, "epoch": 908} {"train_loss": -34.03472900390625, "global_step": 109882, "epoch": 908} {"train_loss": -27.794824600219727, "global_step": 109883, "epoch": 908} {"train_loss": -34.53556823730469, "global_step": 109884, "epoch": 908} {"train_loss": -35.29545211791992, "global_step": 109885, "epoch": 908} {"train_loss": -36.15815353393555, "global_step": 109886, "epoch": 908} {"train_loss": -35.581153869628906, "global_step": 109887, "epoch": 908} {"train_loss": -35.545982360839844, "global_step": 109888, "epoch": 908} {"train_loss": -35.2451057434082, "global_step": 109889, "epoch": 908} {"train_loss": -35.1265869140625, "global_step": 109890, "epoch": 908} {"train_loss": -35.65781021118164, "global_step": 109891, "epoch": 908} {"train_loss": -35.75202941894531, "global_step": 109892, "epoch": 908} {"train_loss": -35.3162727355957, "global_step": 109893, "epoch": 908} {"train_loss": -35.505855560302734, "global_step": 109894, "epoch": 908} {"train_loss": -35.68730926513672, "global_step": 109895, "epoch": 908} {"train_loss": -36.16457748413086, "global_step": 109896, "epoch": 908} {"train_loss": -36.14192581176758, "global_step": 109897, "epoch": 908} {"train_loss": -35.399715423583984, "global_step": 109898, "epoch": 908} {"train_loss": -36.12438201904297, "global_step": 109899, "epoch": 908} {"train_loss": -36.38785934448242, "global_step": 109900, "epoch": 908} {"train_loss": -36.93756103515625, "global_step": 109901, "epoch": 908} {"train_loss": -34.20766067504883, "global_step": 109902, "epoch": 908} {"train_loss": -36.355464935302734, "global_step": 109903, "epoch": 908} {"train_loss": -36.43214797973633, "global_step": 109904, "epoch": 908} {"train_loss": -36.44568634033203, "global_step": 109905, "epoch": 908} {"train_loss": -37.21210861206055, "global_step": 109906, "epoch": 908} {"train_loss": -37.173702239990234, "global_step": 109907, "epoch": 908} {"train_loss": -36.3678092956543, "global_step": 109908, "epoch": 908} {"train_loss": -37.01591110229492, "global_step": 109909, "epoch": 908} {"train_loss": -36.141231536865234, "global_step": 109910, "epoch": 908} {"train_loss": -36.62018585205078, "global_step": 109911, "epoch": 908} {"train_loss": -37.50042724609375, "global_step": 109912, "epoch": 908} {"train_loss": -36.754268646240234, "global_step": 109913, "epoch": 908} {"train_loss": -37.042274475097656, "global_step": 109914, "epoch": 908} {"train_loss": -37.097591400146484, "global_step": 109915, "epoch": 908} {"train_loss": -36.85129928588867, "global_step": 109916, "epoch": 908} {"train_loss": -37.2147102355957, "global_step": 109917, "epoch": 908} {"train_loss": -37.389095306396484, "global_step": 109918, "epoch": 908} {"train_loss": -37.233543395996094, "global_step": 109919, "epoch": 908} {"train_loss": -37.08348083496094, "global_step": 109920, "epoch": 908} {"train_loss": -37.76144027709961, "global_step": 109921, "epoch": 908} {"train_loss": -36.796932220458984, "global_step": 109922, "epoch": 908} {"train_loss": -36.87207794189453, "global_step": 109923, "epoch": 908} {"train_loss": -37.63859176635742, "global_step": 109924, "epoch": 908} {"train_loss": -37.695640563964844, "global_step": 109925, "epoch": 908} {"train_loss": -37.57844543457031, "global_step": 109926, "epoch": 908} {"train_loss": -37.79275131225586, "global_step": 109927, "epoch": 908} {"train_loss": -37.56342697143555, "global_step": 109928, "epoch": 908} {"train_loss": -37.75379180908203, "global_step": 109929, "epoch": 908} {"train_loss": -37.684139251708984, "global_step": 109930, "epoch": 908} {"train_loss": -37.29362869262695, "global_step": 109931, "epoch": 908} {"train_loss": -37.61931228637695, "global_step": 109932, "epoch": 908} {"train_loss": -37.59902572631836, "global_step": 109933, "epoch": 908} {"train_loss": -37.6727180480957, "global_step": 109934, "epoch": 908} {"train_loss": -37.85807418823242, "global_step": 109935, "epoch": 908} {"train_loss": -37.812217712402344, "global_step": 109936, "epoch": 908} {"train_loss": -37.49348068237305, "global_step": 109937, "epoch": 908} {"train_loss": -38.05241012573242, "global_step": 109938, "epoch": 908} {"train_loss": -37.17235565185547, "global_step": 109939, "epoch": 908} {"train_loss": -38.06126022338867, "global_step": 109940, "epoch": 908} {"train_loss": -37.88508224487305, "global_step": 109941, "epoch": 908} {"train_loss": -38.09476089477539, "global_step": 109942, "epoch": 908} {"train_loss": -37.53843307495117, "global_step": 109943, "epoch": 908} {"train_loss": -37.428688049316406, "global_step": 109944, "epoch": 908} {"train_loss": -38.1666374206543, "global_step": 109945, "epoch": 908} {"train_loss": -37.95380783081055, "global_step": 109946, "epoch": 908} {"train_loss": -38.53803253173828, "global_step": 109947, "epoch": 908} {"train_loss": -37.94932174682617, "global_step": 109948, "epoch": 908} {"train_loss": -38.44321823120117, "global_step": 109949, "epoch": 908} {"train_loss": -38.436344146728516, "global_step": 109950, "epoch": 908} {"train_loss": -37.611080169677734, "global_step": 109951, "epoch": 908} {"train_loss": -38.765316009521484, "global_step": 109952, "epoch": 908} {"train_loss": -38.31911087036133, "global_step": 109953, "epoch": 908} {"train_loss": -38.334285736083984, "global_step": 109954, "epoch": 908} {"train_loss": -38.71247100830078, "global_step": 109955, "epoch": 908} {"train_loss": -38.4095573425293, "global_step": 109956, "epoch": 908} {"train_loss": -38.6954460144043, "global_step": 109957, "epoch": 908} {"train_loss": -38.60748291015625, "global_step": 109958, "epoch": 908} {"train_loss": -38.37627029418945, "global_step": 109959, "epoch": 908} {"train_loss": -39.02417755126953, "global_step": 109960, "epoch": 908} {"train_loss": -38.32167434692383, "global_step": 109961, "epoch": 908} {"train_loss": -38.33481979370117, "global_step": 109962, "epoch": 908} {"train_loss": -38.953529357910156, "global_step": 109963, "epoch": 908} {"train_loss": -38.021339416503906, "global_step": 109964, "epoch": 908} {"train_loss": -38.484230041503906, "global_step": 109965, "epoch": 908} {"train_loss": -38.451839447021484, "global_step": 109966, "epoch": 908} {"train_loss": -38.850555419921875, "global_step": 109967, "epoch": 908} {"train_loss": -37.995479583740234, "global_step": 109968, "epoch": 908} {"train_loss": -38.14973831176758, "global_step": 109969, "epoch": 908} {"train_loss": -37.21963119506836, "global_step": 109970, "epoch": 908} {"train_loss": -36.0120735168457, "global_step": 109971, "epoch": 908} {"train_loss": -35.7292594909668, "global_step": 109972, "epoch": 908} {"train_loss": -34.046539306640625, "global_step": 109973, "epoch": 908} {"train_loss": -34.20646286010742, "global_step": 109974, "epoch": 908} {"train_loss": -34.2926139831543, "global_step": 109975, "epoch": 908} {"train_loss": -34.85994338989258, "global_step": 109976, "epoch": 908} {"train_loss": -36.63258361816406, "global_step": 109977, "epoch": 908} {"train_loss": -38.32155227661133, "global_step": 109978, "epoch": 908} {"train_loss": -37.792579650878906, "global_step": 109979, "epoch": 908} {"train_loss": -36.55827331542969, "global_step": 109980, "epoch": 908} {"train_loss": -37.787776947021484, "global_step": 109981, "epoch": 908} {"train_loss": -38.960079193115234, "global_step": 109982, "epoch": 908} {"train_loss": -37.714107513427734, "global_step": 109983, "epoch": 908} {"train_loss": -37.2507438659668, "global_step": 109984, "epoch": 908} {"train_loss": -38.05990219116211, "global_step": 109985, "epoch": 908} {"train_loss": -38.50286865234375, "global_step": 109986, "epoch": 908} {"train_loss": -37.78068923950195, "global_step": 109987, "epoch": 908} {"train_loss": -36.60059703480113, "global_step": 109988, "epoch": 908, "val_loss": 2560725.25} {"train_loss": -37.5550651550293, "global_step": 109989, "epoch": 909} {"train_loss": -37.2499885559082, "global_step": 109990, "epoch": 909} {"train_loss": -38.60172653198242, "global_step": 109991, "epoch": 909} {"train_loss": -38.56181716918945, "global_step": 109992, "epoch": 909} {"train_loss": -37.36787414550781, "global_step": 109993, "epoch": 909} {"train_loss": -37.25938034057617, "global_step": 109994, "epoch": 909} {"train_loss": -38.0809211730957, "global_step": 109995, "epoch": 909} {"train_loss": -39.11448287963867, "global_step": 109996, "epoch": 909} {"train_loss": -38.162872314453125, "global_step": 109997, "epoch": 909} {"train_loss": -38.12273025512695, "global_step": 109998, "epoch": 909} {"train_loss": -38.06136703491211, "global_step": 109999, "epoch": 909} {"train_loss": -38.95158004760742, "global_step": 110000, "epoch": 909} {"train_loss": -38.20691680908203, "global_step": 110001, "epoch": 909} {"train_loss": -37.867488861083984, "global_step": 110002, "epoch": 909} {"train_loss": -37.130672454833984, "global_step": 110003, "epoch": 909} {"train_loss": -38.911834716796875, "global_step": 110004, "epoch": 909} {"train_loss": -38.54948043823242, "global_step": 110005, "epoch": 909} {"train_loss": -37.661834716796875, "global_step": 110006, "epoch": 909} {"train_loss": -37.44704055786133, "global_step": 110007, "epoch": 909} {"train_loss": -39.08477783203125, "global_step": 110008, "epoch": 909} {"train_loss": -38.233802795410156, "global_step": 110009, "epoch": 909} {"train_loss": -37.020633697509766, "global_step": 110010, "epoch": 909} {"train_loss": -38.214569091796875, "global_step": 110011, "epoch": 909} {"train_loss": -38.81739044189453, "global_step": 110012, "epoch": 909} {"train_loss": -37.78175735473633, "global_step": 110013, "epoch": 909} {"train_loss": -39.0047721862793, "global_step": 110014, "epoch": 909} {"train_loss": -39.03968048095703, "global_step": 110015, "epoch": 909} {"train_loss": -38.526546478271484, "global_step": 110016, "epoch": 909} {"train_loss": -38.28626251220703, "global_step": 110017, "epoch": 909} {"train_loss": -38.569637298583984, "global_step": 110018, "epoch": 909} {"train_loss": -38.337154388427734, "global_step": 110019, "epoch": 909} {"train_loss": -38.82536697387695, "global_step": 110020, "epoch": 909} {"train_loss": -38.22132110595703, "global_step": 110021, "epoch": 909} {"train_loss": -38.1490592956543, "global_step": 110022, "epoch": 909} {"train_loss": -38.25197219848633, "global_step": 110023, "epoch": 909} {"train_loss": -38.39274215698242, "global_step": 110024, "epoch": 909} {"train_loss": -38.97052764892578, "global_step": 110025, "epoch": 909} {"train_loss": -38.0408821105957, "global_step": 110026, "epoch": 909} {"train_loss": -39.05399703979492, "global_step": 110027, "epoch": 909} {"train_loss": -38.9378547668457, "global_step": 110028, "epoch": 909} {"train_loss": -38.329566955566406, "global_step": 110029, "epoch": 909} {"train_loss": -39.147613525390625, "global_step": 110030, "epoch": 909} {"train_loss": -38.22304153442383, "global_step": 110031, "epoch": 909} {"train_loss": -39.663002014160156, "global_step": 110032, "epoch": 909} {"train_loss": -38.301353454589844, "global_step": 110033, "epoch": 909} {"train_loss": -39.371707916259766, "global_step": 110034, "epoch": 909} {"train_loss": -38.81582260131836, "global_step": 110035, "epoch": 909} {"train_loss": -38.96955108642578, "global_step": 110036, "epoch": 909} {"train_loss": -39.2154655456543, "global_step": 110037, "epoch": 909} {"train_loss": -38.24222946166992, "global_step": 110038, "epoch": 909} {"train_loss": -39.06643295288086, "global_step": 110039, "epoch": 909} {"train_loss": -38.920379638671875, "global_step": 110040, "epoch": 909} {"train_loss": -38.9748649597168, "global_step": 110041, "epoch": 909} {"train_loss": -38.1555290222168, "global_step": 110042, "epoch": 909} {"train_loss": -39.25442123413086, "global_step": 110043, "epoch": 909} {"train_loss": -37.68896484375, "global_step": 110044, "epoch": 909} {"train_loss": -38.737091064453125, "global_step": 110045, "epoch": 909} {"train_loss": -36.966163635253906, "global_step": 110046, "epoch": 909} {"train_loss": -38.0948600769043, "global_step": 110047, "epoch": 909} {"train_loss": -37.99852752685547, "global_step": 110048, "epoch": 909} {"train_loss": -38.34949493408203, "global_step": 110049, "epoch": 909} {"train_loss": -37.083126068115234, "global_step": 110050, "epoch": 909} {"train_loss": -36.82963943481445, "global_step": 110051, "epoch": 909} {"train_loss": -36.41108703613281, "global_step": 110052, "epoch": 909} {"train_loss": -37.55064010620117, "global_step": 110053, "epoch": 909} {"train_loss": -38.79225158691406, "global_step": 110054, "epoch": 909} {"train_loss": -38.4211311340332, "global_step": 110055, "epoch": 909} {"train_loss": -37.389068603515625, "global_step": 110056, "epoch": 909} {"train_loss": -36.109947204589844, "global_step": 110057, "epoch": 909} {"train_loss": -35.197296142578125, "global_step": 110058, "epoch": 909} {"train_loss": -36.13559341430664, "global_step": 110059, "epoch": 909} {"train_loss": -35.97706985473633, "global_step": 110060, "epoch": 909} {"train_loss": -37.898136138916016, "global_step": 110061, "epoch": 909} {"train_loss": -36.65492630004883, "global_step": 110062, "epoch": 909} {"train_loss": -37.485633850097656, "global_step": 110063, "epoch": 909} {"train_loss": -37.207664489746094, "global_step": 110064, "epoch": 909} {"train_loss": -36.97039031982422, "global_step": 110065, "epoch": 909} {"train_loss": -38.282135009765625, "global_step": 110066, "epoch": 909} {"train_loss": -38.15901565551758, "global_step": 110067, "epoch": 909} {"train_loss": -37.80714797973633, "global_step": 110068, "epoch": 909} {"train_loss": -38.1370735168457, "global_step": 110069, "epoch": 909} {"train_loss": -38.381866455078125, "global_step": 110070, "epoch": 909} {"train_loss": -37.99995803833008, "global_step": 110071, "epoch": 909} {"train_loss": -38.209327697753906, "global_step": 110072, "epoch": 909} {"train_loss": -38.551082611083984, "global_step": 110073, "epoch": 909} {"train_loss": -38.232398986816406, "global_step": 110074, "epoch": 909} {"train_loss": -36.6043815612793, "global_step": 110075, "epoch": 909} {"train_loss": -38.0863037109375, "global_step": 110076, "epoch": 909} {"train_loss": -37.6527099609375, "global_step": 110077, "epoch": 909} {"train_loss": -36.49359130859375, "global_step": 110078, "epoch": 909} {"train_loss": -37.835548400878906, "global_step": 110079, "epoch": 909} {"train_loss": -36.777496337890625, "global_step": 110080, "epoch": 909} {"train_loss": -36.141441345214844, "global_step": 110081, "epoch": 909} {"train_loss": -37.79886245727539, "global_step": 110082, "epoch": 909} {"train_loss": -37.026405334472656, "global_step": 110083, "epoch": 909} {"train_loss": -37.427581787109375, "global_step": 110084, "epoch": 909} {"train_loss": -37.823299407958984, "global_step": 110085, "epoch": 909} {"train_loss": -37.41333770751953, "global_step": 110086, "epoch": 909} {"train_loss": -38.1153564453125, "global_step": 110087, "epoch": 909} {"train_loss": -36.76340103149414, "global_step": 110088, "epoch": 909} {"train_loss": -39.04868698120117, "global_step": 110089, "epoch": 909} {"train_loss": -36.570228576660156, "global_step": 110090, "epoch": 909} {"train_loss": -37.73081588745117, "global_step": 110091, "epoch": 909} {"train_loss": -38.3187141418457, "global_step": 110092, "epoch": 909} {"train_loss": -38.26473617553711, "global_step": 110093, "epoch": 909} {"train_loss": -38.403255462646484, "global_step": 110094, "epoch": 909} {"train_loss": -37.855445861816406, "global_step": 110095, "epoch": 909} {"train_loss": -38.294677734375, "global_step": 110096, "epoch": 909} {"train_loss": -38.47399139404297, "global_step": 110097, "epoch": 909} {"train_loss": -38.12629318237305, "global_step": 110098, "epoch": 909} {"train_loss": -38.47400665283203, "global_step": 110099, "epoch": 909} {"train_loss": -37.990753173828125, "global_step": 110100, "epoch": 909} {"train_loss": -38.77030563354492, "global_step": 110101, "epoch": 909} {"train_loss": -38.03103256225586, "global_step": 110102, "epoch": 909} {"train_loss": -38.648738861083984, "global_step": 110103, "epoch": 909} {"train_loss": -37.686336517333984, "global_step": 110104, "epoch": 909} {"train_loss": -38.756019592285156, "global_step": 110105, "epoch": 909} {"train_loss": -37.73466110229492, "global_step": 110106, "epoch": 909} {"train_loss": -38.6263427734375, "global_step": 110107, "epoch": 909} {"train_loss": -38.789302825927734, "global_step": 110108, "epoch": 909} {"train_loss": -38.022256457115994, "global_step": 110109, "epoch": 909, "val_loss": 2552854.25} {"train_loss": -38.34446334838867, "global_step": 110110, "epoch": 910} {"train_loss": -38.7005615234375, "global_step": 110111, "epoch": 910} {"train_loss": -38.69159698486328, "global_step": 110112, "epoch": 910} {"train_loss": -39.1313591003418, "global_step": 110113, "epoch": 910} {"train_loss": -38.96340560913086, "global_step": 110114, "epoch": 910} {"train_loss": -38.98255157470703, "global_step": 110115, "epoch": 910} {"train_loss": -38.75472640991211, "global_step": 110116, "epoch": 910} {"train_loss": -39.28614044189453, "global_step": 110117, "epoch": 910} {"train_loss": -39.0008659362793, "global_step": 110118, "epoch": 910} {"train_loss": -38.689422607421875, "global_step": 110119, "epoch": 910} {"train_loss": -38.689849853515625, "global_step": 110120, "epoch": 910} {"train_loss": -38.963157653808594, "global_step": 110121, "epoch": 910} {"train_loss": -38.89377975463867, "global_step": 110122, "epoch": 910} {"train_loss": -39.607330322265625, "global_step": 110123, "epoch": 910} {"train_loss": -39.44879150390625, "global_step": 110124, "epoch": 910} {"train_loss": -39.48834228515625, "global_step": 110125, "epoch": 910} {"train_loss": -39.64728927612305, "global_step": 110126, "epoch": 910} {"train_loss": -39.441932678222656, "global_step": 110127, "epoch": 910} {"train_loss": -39.874488830566406, "global_step": 110128, "epoch": 910} {"train_loss": -39.71963119506836, "global_step": 110129, "epoch": 910} {"train_loss": -39.44253158569336, "global_step": 110130, "epoch": 910} {"train_loss": -39.33329391479492, "global_step": 110131, "epoch": 910} {"train_loss": -39.30197525024414, "global_step": 110132, "epoch": 910} {"train_loss": -39.49623489379883, "global_step": 110133, "epoch": 910} {"train_loss": -39.66770553588867, "global_step": 110134, "epoch": 910} {"train_loss": -39.841583251953125, "global_step": 110135, "epoch": 910} {"train_loss": -39.78751754760742, "global_step": 110136, "epoch": 910} {"train_loss": -39.47111511230469, "global_step": 110137, "epoch": 910} {"train_loss": -39.47764205932617, "global_step": 110138, "epoch": 910} {"train_loss": -38.630611419677734, "global_step": 110139, "epoch": 910} {"train_loss": -37.4130973815918, "global_step": 110140, "epoch": 910} {"train_loss": -38.96479034423828, "global_step": 110141, "epoch": 910} {"train_loss": -38.78977584838867, "global_step": 110142, "epoch": 910} {"train_loss": -39.4859733581543, "global_step": 110143, "epoch": 910} {"train_loss": -38.999610900878906, "global_step": 110144, "epoch": 910} {"train_loss": -38.82370376586914, "global_step": 110145, "epoch": 910} {"train_loss": -39.08852005004883, "global_step": 110146, "epoch": 910} {"train_loss": -37.67427444458008, "global_step": 110147, "epoch": 910} {"train_loss": -36.64537048339844, "global_step": 110148, "epoch": 910} {"train_loss": -36.38246154785156, "global_step": 110149, "epoch": 910} {"train_loss": -35.8963508605957, "global_step": 110150, "epoch": 910} {"train_loss": -35.474666595458984, "global_step": 110151, "epoch": 910} {"train_loss": -36.58674240112305, "global_step": 110152, "epoch": 910} {"train_loss": -37.89243698120117, "global_step": 110153, "epoch": 910} {"train_loss": -38.615543365478516, "global_step": 110154, "epoch": 910} {"train_loss": -38.01704788208008, "global_step": 110155, "epoch": 910} {"train_loss": -33.09965896606445, "global_step": 110156, "epoch": 910} {"train_loss": -37.24750900268555, "global_step": 110157, "epoch": 910} {"train_loss": -36.90285873413086, "global_step": 110158, "epoch": 910} {"train_loss": -38.015846252441406, "global_step": 110159, "epoch": 910} {"train_loss": -39.14863204956055, "global_step": 110160, "epoch": 910} {"train_loss": -38.11207962036133, "global_step": 110161, "epoch": 910} {"train_loss": -38.351287841796875, "global_step": 110162, "epoch": 910} {"train_loss": -37.66624069213867, "global_step": 110163, "epoch": 910} {"train_loss": -37.399906158447266, "global_step": 110164, "epoch": 910} {"train_loss": -36.94869613647461, "global_step": 110165, "epoch": 910} {"train_loss": -37.4406623840332, "global_step": 110166, "epoch": 910} {"train_loss": -38.37897491455078, "global_step": 110167, "epoch": 910} {"train_loss": -37.9691276550293, "global_step": 110168, "epoch": 910} {"train_loss": -38.71795654296875, "global_step": 110169, "epoch": 910} {"train_loss": -37.363895416259766, "global_step": 110170, "epoch": 910} {"train_loss": -37.256038665771484, "global_step": 110171, "epoch": 910} {"train_loss": -39.03363037109375, "global_step": 110172, "epoch": 910} {"train_loss": -38.161415100097656, "global_step": 110173, "epoch": 910} {"train_loss": -37.865997314453125, "global_step": 110174, "epoch": 910} {"train_loss": -38.896156311035156, "global_step": 110175, "epoch": 910} {"train_loss": -38.61975860595703, "global_step": 110176, "epoch": 910} {"train_loss": -37.948055267333984, "global_step": 110177, "epoch": 910} {"train_loss": -38.52241897583008, "global_step": 110178, "epoch": 910} {"train_loss": -37.7672119140625, "global_step": 110179, "epoch": 910} {"train_loss": -39.05567169189453, "global_step": 110180, "epoch": 910} {"train_loss": -36.905494689941406, "global_step": 110181, "epoch": 910} {"train_loss": -37.2088623046875, "global_step": 110182, "epoch": 910} {"train_loss": -38.958221435546875, "global_step": 110183, "epoch": 910} {"train_loss": -38.26334762573242, "global_step": 110184, "epoch": 910} {"train_loss": -38.5526008605957, "global_step": 110185, "epoch": 910} {"train_loss": -38.31391525268555, "global_step": 110186, "epoch": 910} {"train_loss": -36.834877014160156, "global_step": 110187, "epoch": 910} {"train_loss": -37.68372344970703, "global_step": 110188, "epoch": 910} {"train_loss": -39.128047943115234, "global_step": 110189, "epoch": 910} {"train_loss": -38.320533752441406, "global_step": 110190, "epoch": 910} {"train_loss": -39.081512451171875, "global_step": 110191, "epoch": 910} {"train_loss": -38.73420333862305, "global_step": 110192, "epoch": 910} {"train_loss": -37.9801025390625, "global_step": 110193, "epoch": 910} {"train_loss": -38.52193832397461, "global_step": 110194, "epoch": 910} {"train_loss": -38.71529769897461, "global_step": 110195, "epoch": 910} {"train_loss": -39.12299728393555, "global_step": 110196, "epoch": 910} {"train_loss": -38.13632583618164, "global_step": 110197, "epoch": 910} {"train_loss": -38.39924621582031, "global_step": 110198, "epoch": 910} {"train_loss": -38.5139274597168, "global_step": 110199, "epoch": 910} {"train_loss": -37.92826461791992, "global_step": 110200, "epoch": 910} {"train_loss": -38.32237243652344, "global_step": 110201, "epoch": 910} {"train_loss": -37.76543045043945, "global_step": 110202, "epoch": 910} {"train_loss": -38.468101501464844, "global_step": 110203, "epoch": 910} {"train_loss": -39.10493087768555, "global_step": 110204, "epoch": 910} {"train_loss": -38.54582595825195, "global_step": 110205, "epoch": 910} {"train_loss": -38.42995834350586, "global_step": 110206, "epoch": 910} {"train_loss": -37.49412155151367, "global_step": 110207, "epoch": 910} {"train_loss": -38.09856033325195, "global_step": 110208, "epoch": 910} {"train_loss": -38.42897415161133, "global_step": 110209, "epoch": 910} {"train_loss": -36.729801177978516, "global_step": 110210, "epoch": 910} {"train_loss": -35.054264068603516, "global_step": 110211, "epoch": 910} {"train_loss": -35.45283889770508, "global_step": 110212, "epoch": 910} {"train_loss": -37.046138763427734, "global_step": 110213, "epoch": 910} {"train_loss": -34.47103500366211, "global_step": 110214, "epoch": 910} {"train_loss": -38.092037200927734, "global_step": 110215, "epoch": 910} {"train_loss": -36.042110443115234, "global_step": 110216, "epoch": 910} {"train_loss": -37.45661163330078, "global_step": 110217, "epoch": 910} {"train_loss": -36.92043685913086, "global_step": 110218, "epoch": 910} {"train_loss": -37.6309928894043, "global_step": 110219, "epoch": 910} {"train_loss": -35.669471740722656, "global_step": 110220, "epoch": 910} {"train_loss": -37.4211311340332, "global_step": 110221, "epoch": 910} {"train_loss": -38.35227966308594, "global_step": 110222, "epoch": 910} {"train_loss": -36.05302047729492, "global_step": 110223, "epoch": 910} {"train_loss": -38.325828552246094, "global_step": 110224, "epoch": 910} {"train_loss": -38.07255935668945, "global_step": 110225, "epoch": 910} {"train_loss": -38.30278396606445, "global_step": 110226, "epoch": 910} {"train_loss": -38.55941390991211, "global_step": 110227, "epoch": 910} {"train_loss": -38.91345977783203, "global_step": 110228, "epoch": 910} {"train_loss": -37.56285095214844, "global_step": 110229, "epoch": 910} {"train_loss": -38.15900402226724, "global_step": 110230, "epoch": 910, "val_loss": 2674826.25} {"train_loss": -37.29834747314453, "global_step": 110231, "epoch": 911} {"train_loss": -38.74946212768555, "global_step": 110232, "epoch": 911} {"train_loss": -33.60943603515625, "global_step": 110233, "epoch": 911} {"train_loss": -38.81406021118164, "global_step": 110234, "epoch": 911} {"train_loss": -35.11674499511719, "global_step": 110235, "epoch": 911} {"train_loss": -37.553077697753906, "global_step": 110236, "epoch": 911} {"train_loss": -35.980403900146484, "global_step": 110237, "epoch": 911} {"train_loss": -37.82634353637695, "global_step": 110238, "epoch": 911} {"train_loss": -38.60832595825195, "global_step": 110239, "epoch": 911} {"train_loss": -36.281761169433594, "global_step": 110240, "epoch": 911} {"train_loss": -39.09446334838867, "global_step": 110241, "epoch": 911} {"train_loss": -37.235660552978516, "global_step": 110242, "epoch": 911} {"train_loss": -37.67819595336914, "global_step": 110243, "epoch": 911} {"train_loss": -37.310909271240234, "global_step": 110244, "epoch": 911} {"train_loss": -37.50847244262695, "global_step": 110245, "epoch": 911} {"train_loss": -36.18748474121094, "global_step": 110246, "epoch": 911} {"train_loss": -38.37008285522461, "global_step": 110247, "epoch": 911} {"train_loss": -37.56649398803711, "global_step": 110248, "epoch": 911} {"train_loss": -38.68612289428711, "global_step": 110249, "epoch": 911} {"train_loss": -38.78832244873047, "global_step": 110250, "epoch": 911} {"train_loss": -37.762569427490234, "global_step": 110251, "epoch": 911} {"train_loss": -37.95562744140625, "global_step": 110252, "epoch": 911} {"train_loss": -38.6372184753418, "global_step": 110253, "epoch": 911} {"train_loss": -38.07696533203125, "global_step": 110254, "epoch": 911} {"train_loss": -38.01939010620117, "global_step": 110255, "epoch": 911} {"train_loss": -38.4785270690918, "global_step": 110256, "epoch": 911} {"train_loss": -38.054683685302734, "global_step": 110257, "epoch": 911} {"train_loss": -38.2928466796875, "global_step": 110258, "epoch": 911} {"train_loss": -38.48500061035156, "global_step": 110259, "epoch": 911} {"train_loss": -38.557193756103516, "global_step": 110260, "epoch": 911} {"train_loss": -38.564300537109375, "global_step": 110261, "epoch": 911} {"train_loss": -39.22886276245117, "global_step": 110262, "epoch": 911} {"train_loss": -38.47236251831055, "global_step": 110263, "epoch": 911} {"train_loss": -39.001773834228516, "global_step": 110264, "epoch": 911} {"train_loss": -38.18042755126953, "global_step": 110265, "epoch": 911} {"train_loss": -39.292083740234375, "global_step": 110266, "epoch": 911} {"train_loss": -38.396541595458984, "global_step": 110267, "epoch": 911} {"train_loss": -38.054866790771484, "global_step": 110268, "epoch": 911} {"train_loss": -38.914485931396484, "global_step": 110269, "epoch": 911} {"train_loss": -39.00651931762695, "global_step": 110270, "epoch": 911} {"train_loss": -38.9321403503418, "global_step": 110271, "epoch": 911} {"train_loss": -37.609588623046875, "global_step": 110272, "epoch": 911} {"train_loss": -38.387142181396484, "global_step": 110273, "epoch": 911} {"train_loss": -39.2753791809082, "global_step": 110274, "epoch": 911} {"train_loss": -39.40542221069336, "global_step": 110275, "epoch": 911} {"train_loss": -38.1934814453125, "global_step": 110276, "epoch": 911} {"train_loss": -39.084407806396484, "global_step": 110277, "epoch": 911} {"train_loss": -38.13157272338867, "global_step": 110278, "epoch": 911} {"train_loss": -38.90938186645508, "global_step": 110279, "epoch": 911} {"train_loss": -38.46195602416992, "global_step": 110280, "epoch": 911} {"train_loss": -37.582576751708984, "global_step": 110281, "epoch": 911} {"train_loss": -38.974552154541016, "global_step": 110282, "epoch": 911} {"train_loss": -38.777706146240234, "global_step": 110283, "epoch": 911} {"train_loss": -36.93841552734375, "global_step": 110284, "epoch": 911} {"train_loss": -39.18042755126953, "global_step": 110285, "epoch": 911} {"train_loss": -38.70159149169922, "global_step": 110286, "epoch": 911} {"train_loss": -38.454681396484375, "global_step": 110287, "epoch": 911} {"train_loss": -39.14579391479492, "global_step": 110288, "epoch": 911} {"train_loss": -36.34568405151367, "global_step": 110289, "epoch": 911} {"train_loss": -37.61370086669922, "global_step": 110290, "epoch": 911} {"train_loss": -38.55381393432617, "global_step": 110291, "epoch": 911} {"train_loss": -38.20866775512695, "global_step": 110292, "epoch": 911} {"train_loss": -37.899112701416016, "global_step": 110293, "epoch": 911} {"train_loss": -37.70856857299805, "global_step": 110294, "epoch": 911} {"train_loss": -38.459285736083984, "global_step": 110295, "epoch": 911} {"train_loss": -37.921512603759766, "global_step": 110296, "epoch": 911} {"train_loss": -36.7205810546875, "global_step": 110297, "epoch": 911} {"train_loss": -36.581390380859375, "global_step": 110298, "epoch": 911} {"train_loss": -38.12053298950195, "global_step": 110299, "epoch": 911} {"train_loss": -38.3747444152832, "global_step": 110300, "epoch": 911} {"train_loss": -37.16004180908203, "global_step": 110301, "epoch": 911} {"train_loss": -37.74500274658203, "global_step": 110302, "epoch": 911} {"train_loss": -37.83259201049805, "global_step": 110303, "epoch": 911} {"train_loss": -38.495906829833984, "global_step": 110304, "epoch": 911} {"train_loss": -38.96375274658203, "global_step": 110305, "epoch": 911} {"train_loss": -36.321022033691406, "global_step": 110306, "epoch": 911} {"train_loss": -36.8282585144043, "global_step": 110307, "epoch": 911} {"train_loss": -37.55803298950195, "global_step": 110308, "epoch": 911} {"train_loss": -38.2337532043457, "global_step": 110309, "epoch": 911} {"train_loss": -38.5809211730957, "global_step": 110310, "epoch": 911} {"train_loss": -38.32672882080078, "global_step": 110311, "epoch": 911} {"train_loss": -38.649959564208984, "global_step": 110312, "epoch": 911} {"train_loss": -37.681087493896484, "global_step": 110313, "epoch": 911} {"train_loss": -37.37818145751953, "global_step": 110314, "epoch": 911} {"train_loss": -37.147743225097656, "global_step": 110315, "epoch": 911} {"train_loss": -38.013526916503906, "global_step": 110316, "epoch": 911} {"train_loss": -38.3469123840332, "global_step": 110317, "epoch": 911} {"train_loss": -38.78924560546875, "global_step": 110318, "epoch": 911} {"train_loss": -38.88465881347656, "global_step": 110319, "epoch": 911} {"train_loss": -37.22236251831055, "global_step": 110320, "epoch": 911} {"train_loss": -38.30134201049805, "global_step": 110321, "epoch": 911} {"train_loss": -37.68180465698242, "global_step": 110322, "epoch": 911} {"train_loss": -38.61399459838867, "global_step": 110323, "epoch": 911} {"train_loss": -37.913726806640625, "global_step": 110324, "epoch": 911} {"train_loss": -38.48832321166992, "global_step": 110325, "epoch": 911} {"train_loss": -38.70624923706055, "global_step": 110326, "epoch": 911} {"train_loss": -38.70940017700195, "global_step": 110327, "epoch": 911} {"train_loss": -38.64994430541992, "global_step": 110328, "epoch": 911} {"train_loss": -38.757503509521484, "global_step": 110329, "epoch": 911} {"train_loss": -38.463253021240234, "global_step": 110330, "epoch": 911} {"train_loss": -37.464027404785156, "global_step": 110331, "epoch": 911} {"train_loss": -38.695655822753906, "global_step": 110332, "epoch": 911} {"train_loss": -39.006019592285156, "global_step": 110333, "epoch": 911} {"train_loss": -37.5356559753418, "global_step": 110334, "epoch": 911} {"train_loss": -38.90792465209961, "global_step": 110335, "epoch": 911} {"train_loss": -38.720394134521484, "global_step": 110336, "epoch": 911} {"train_loss": -36.425045013427734, "global_step": 110337, "epoch": 911} {"train_loss": -38.88862991333008, "global_step": 110338, "epoch": 911} {"train_loss": -37.974853515625, "global_step": 110339, "epoch": 911} {"train_loss": -38.813636779785156, "global_step": 110340, "epoch": 911} {"train_loss": -39.18519973754883, "global_step": 110341, "epoch": 911} {"train_loss": -38.65602493286133, "global_step": 110342, "epoch": 911} {"train_loss": -38.352294921875, "global_step": 110343, "epoch": 911} {"train_loss": -38.67938995361328, "global_step": 110344, "epoch": 911} {"train_loss": -38.541866302490234, "global_step": 110345, "epoch": 911} {"train_loss": -38.20024108886719, "global_step": 110346, "epoch": 911} {"train_loss": -37.68598175048828, "global_step": 110347, "epoch": 911} {"train_loss": -37.38500213623047, "global_step": 110348, "epoch": 911} {"train_loss": -38.73020935058594, "global_step": 110349, "epoch": 911} {"train_loss": -38.7974853515625, "global_step": 110350, "epoch": 911} {"train_loss": -38.11938016276714, "global_step": 110351, "epoch": 911, "val_loss": 2676921.5} {"train_loss": -38.86593246459961, "global_step": 110352, "epoch": 912} {"train_loss": -39.062503814697266, "global_step": 110353, "epoch": 912} {"train_loss": -39.32273483276367, "global_step": 110354, "epoch": 912} {"train_loss": -39.312232971191406, "global_step": 110355, "epoch": 912} {"train_loss": -38.853675842285156, "global_step": 110356, "epoch": 912} {"train_loss": -38.06539535522461, "global_step": 110357, "epoch": 912} {"train_loss": -38.656517028808594, "global_step": 110358, "epoch": 912} {"train_loss": -39.11676025390625, "global_step": 110359, "epoch": 912} {"train_loss": -38.219783782958984, "global_step": 110360, "epoch": 912} {"train_loss": -37.7345085144043, "global_step": 110361, "epoch": 912} {"train_loss": -38.23957443237305, "global_step": 110362, "epoch": 912} {"train_loss": -36.474700927734375, "global_step": 110363, "epoch": 912} {"train_loss": -36.7798957824707, "global_step": 110364, "epoch": 912} {"train_loss": -38.367279052734375, "global_step": 110365, "epoch": 912} {"train_loss": -38.384151458740234, "global_step": 110366, "epoch": 912} {"train_loss": -38.755924224853516, "global_step": 110367, "epoch": 912} {"train_loss": -38.59803009033203, "global_step": 110368, "epoch": 912} {"train_loss": -37.83347702026367, "global_step": 110369, "epoch": 912} {"train_loss": -37.34363555908203, "global_step": 110370, "epoch": 912} {"train_loss": -38.096435546875, "global_step": 110371, "epoch": 912} {"train_loss": -37.375911712646484, "global_step": 110372, "epoch": 912} {"train_loss": -38.728614807128906, "global_step": 110373, "epoch": 912} {"train_loss": -38.72935104370117, "global_step": 110374, "epoch": 912} {"train_loss": -35.56724548339844, "global_step": 110375, "epoch": 912} {"train_loss": -34.36600875854492, "global_step": 110376, "epoch": 912} {"train_loss": -35.73160171508789, "global_step": 110377, "epoch": 912} {"train_loss": -38.008602142333984, "global_step": 110378, "epoch": 912} {"train_loss": -38.994930267333984, "global_step": 110379, "epoch": 912} {"train_loss": -35.7725944519043, "global_step": 110380, "epoch": 912} {"train_loss": -37.83707046508789, "global_step": 110381, "epoch": 912} {"train_loss": -38.771270751953125, "global_step": 110382, "epoch": 912} {"train_loss": -38.167877197265625, "global_step": 110383, "epoch": 912} {"train_loss": -37.7574577331543, "global_step": 110384, "epoch": 912} {"train_loss": -37.66737365722656, "global_step": 110385, "epoch": 912} {"train_loss": -39.2483024597168, "global_step": 110386, "epoch": 912} {"train_loss": -36.890377044677734, "global_step": 110387, "epoch": 912} {"train_loss": -38.32947540283203, "global_step": 110388, "epoch": 912} {"train_loss": -38.14870834350586, "global_step": 110389, "epoch": 912} {"train_loss": -37.973785400390625, "global_step": 110390, "epoch": 912} {"train_loss": -38.927764892578125, "global_step": 110391, "epoch": 912} {"train_loss": -37.583072662353516, "global_step": 110392, "epoch": 912} {"train_loss": -38.783260345458984, "global_step": 110393, "epoch": 912} {"train_loss": -37.6160774230957, "global_step": 110394, "epoch": 912} {"train_loss": -38.919151306152344, "global_step": 110395, "epoch": 912} {"train_loss": -38.387123107910156, "global_step": 110396, "epoch": 912} {"train_loss": -38.6112174987793, "global_step": 110397, "epoch": 912} {"train_loss": -39.45606231689453, "global_step": 110398, "epoch": 912} {"train_loss": -38.86993408203125, "global_step": 110399, "epoch": 912} {"train_loss": -39.130855560302734, "global_step": 110400, "epoch": 912} {"train_loss": -38.40232467651367, "global_step": 110401, "epoch": 912} {"train_loss": -38.336673736572266, "global_step": 110402, "epoch": 912} {"train_loss": -39.08357238769531, "global_step": 110403, "epoch": 912} {"train_loss": -39.34013366699219, "global_step": 110404, "epoch": 912} {"train_loss": -38.55985641479492, "global_step": 110405, "epoch": 912} {"train_loss": -39.57501983642578, "global_step": 110406, "epoch": 912} {"train_loss": -38.80769348144531, "global_step": 110407, "epoch": 912} {"train_loss": -38.75666427612305, "global_step": 110408, "epoch": 912} {"train_loss": -39.34591293334961, "global_step": 110409, "epoch": 912} {"train_loss": -39.192806243896484, "global_step": 110410, "epoch": 912} {"train_loss": -39.41297149658203, "global_step": 110411, "epoch": 912} {"train_loss": -39.60773849487305, "global_step": 110412, "epoch": 912} {"train_loss": -39.01865768432617, "global_step": 110413, "epoch": 912} {"train_loss": -39.07987594604492, "global_step": 110414, "epoch": 912} {"train_loss": -38.96783447265625, "global_step": 110415, "epoch": 912} {"train_loss": -39.37563705444336, "global_step": 110416, "epoch": 912} {"train_loss": -39.410030364990234, "global_step": 110417, "epoch": 912} {"train_loss": -39.26762771606445, "global_step": 110418, "epoch": 912} {"train_loss": -38.334285736083984, "global_step": 110419, "epoch": 912} {"train_loss": -39.180702209472656, "global_step": 110420, "epoch": 912} {"train_loss": -38.77781295776367, "global_step": 110421, "epoch": 912} {"train_loss": -38.52602005004883, "global_step": 110422, "epoch": 912} {"train_loss": -38.54375076293945, "global_step": 110423, "epoch": 912} {"train_loss": -39.22639846801758, "global_step": 110424, "epoch": 912} {"train_loss": -38.34463119506836, "global_step": 110425, "epoch": 912} {"train_loss": -38.19926834106445, "global_step": 110426, "epoch": 912} {"train_loss": -38.21910095214844, "global_step": 110427, "epoch": 912} {"train_loss": -37.773860931396484, "global_step": 110428, "epoch": 912} {"train_loss": -37.66897201538086, "global_step": 110429, "epoch": 912} {"train_loss": -35.43299102783203, "global_step": 110430, "epoch": 912} {"train_loss": -35.93205642700195, "global_step": 110431, "epoch": 912} {"train_loss": -36.341880798339844, "global_step": 110432, "epoch": 912} {"train_loss": -37.66469955444336, "global_step": 110433, "epoch": 912} {"train_loss": -36.2197380065918, "global_step": 110434, "epoch": 912} {"train_loss": -34.59864044189453, "global_step": 110435, "epoch": 912} {"train_loss": -35.5399055480957, "global_step": 110436, "epoch": 912} {"train_loss": -37.16218566894531, "global_step": 110437, "epoch": 912} {"train_loss": -36.94636154174805, "global_step": 110438, "epoch": 912} {"train_loss": -35.64179229736328, "global_step": 110439, "epoch": 912} {"train_loss": -35.72043228149414, "global_step": 110440, "epoch": 912} {"train_loss": -37.32279586791992, "global_step": 110441, "epoch": 912} {"train_loss": -36.06377410888672, "global_step": 110442, "epoch": 912} {"train_loss": -36.67995071411133, "global_step": 110443, "epoch": 912} {"train_loss": -38.1374626159668, "global_step": 110444, "epoch": 912} {"train_loss": -37.605125427246094, "global_step": 110445, "epoch": 912} {"train_loss": -37.8892936706543, "global_step": 110446, "epoch": 912} {"train_loss": -36.06754684448242, "global_step": 110447, "epoch": 912} {"train_loss": -37.66596221923828, "global_step": 110448, "epoch": 912} {"train_loss": -37.39127731323242, "global_step": 110449, "epoch": 912} {"train_loss": -36.00454330444336, "global_step": 110450, "epoch": 912} {"train_loss": -38.171566009521484, "global_step": 110451, "epoch": 912} {"train_loss": -38.362918853759766, "global_step": 110452, "epoch": 912} {"train_loss": -38.18223190307617, "global_step": 110453, "epoch": 912} {"train_loss": -36.882991790771484, "global_step": 110454, "epoch": 912} {"train_loss": -38.29624938964844, "global_step": 110455, "epoch": 912} {"train_loss": -35.62716293334961, "global_step": 110456, "epoch": 912} {"train_loss": -37.90140914916992, "global_step": 110457, "epoch": 912} {"train_loss": -38.033138275146484, "global_step": 110458, "epoch": 912} {"train_loss": -38.402313232421875, "global_step": 110459, "epoch": 912} {"train_loss": -38.18391418457031, "global_step": 110460, "epoch": 912} {"train_loss": -38.17495346069336, "global_step": 110461, "epoch": 912} {"train_loss": -37.466552734375, "global_step": 110462, "epoch": 912} {"train_loss": -38.34579086303711, "global_step": 110463, "epoch": 912} {"train_loss": -37.53147506713867, "global_step": 110464, "epoch": 912} {"train_loss": -37.02860641479492, "global_step": 110465, "epoch": 912} {"train_loss": -37.69944763183594, "global_step": 110466, "epoch": 912} {"train_loss": -38.06562423706055, "global_step": 110467, "epoch": 912} {"train_loss": -37.18315505981445, "global_step": 110468, "epoch": 912} {"train_loss": -38.3285026550293, "global_step": 110469, "epoch": 912} {"train_loss": -38.305076599121094, "global_step": 110470, "epoch": 912} {"train_loss": -37.63352966308594, "global_step": 110471, "epoch": 912} {"train_loss": -37.961503020988026, "global_step": 110472, "epoch": 912, "val_loss": 2989011.25} {"train_loss": -38.416481018066406, "global_step": 110473, "epoch": 913} {"train_loss": -38.609676361083984, "global_step": 110474, "epoch": 913} {"train_loss": -37.15119552612305, "global_step": 110475, "epoch": 913} {"train_loss": -38.704368591308594, "global_step": 110476, "epoch": 913} {"train_loss": -37.998321533203125, "global_step": 110477, "epoch": 913} {"train_loss": -37.937042236328125, "global_step": 110478, "epoch": 913} {"train_loss": -36.65603256225586, "global_step": 110479, "epoch": 913} {"train_loss": -38.0613899230957, "global_step": 110480, "epoch": 913} {"train_loss": -38.2254524230957, "global_step": 110481, "epoch": 913} {"train_loss": -38.66028594970703, "global_step": 110482, "epoch": 913} {"train_loss": -36.615718841552734, "global_step": 110483, "epoch": 913} {"train_loss": -37.92717742919922, "global_step": 110484, "epoch": 913} {"train_loss": -38.42705154418945, "global_step": 110485, "epoch": 913} {"train_loss": -37.77569580078125, "global_step": 110486, "epoch": 913} {"train_loss": -38.52964401245117, "global_step": 110487, "epoch": 913} {"train_loss": -38.050331115722656, "global_step": 110488, "epoch": 913} {"train_loss": -38.868465423583984, "global_step": 110489, "epoch": 913} {"train_loss": -36.05387496948242, "global_step": 110490, "epoch": 913} {"train_loss": -38.51026153564453, "global_step": 110491, "epoch": 913} {"train_loss": -37.49723434448242, "global_step": 110492, "epoch": 913} {"train_loss": -37.87849044799805, "global_step": 110493, "epoch": 913} {"train_loss": -39.55659103393555, "global_step": 110494, "epoch": 913} {"train_loss": -38.1237678527832, "global_step": 110495, "epoch": 913} {"train_loss": -37.550174713134766, "global_step": 110496, "epoch": 913} {"train_loss": -38.88279342651367, "global_step": 110497, "epoch": 913} {"train_loss": -38.69905471801758, "global_step": 110498, "epoch": 913} {"train_loss": -37.44761276245117, "global_step": 110499, "epoch": 913} {"train_loss": -35.82851791381836, "global_step": 110500, "epoch": 913} {"train_loss": -38.408477783203125, "global_step": 110501, "epoch": 913} {"train_loss": -38.293922424316406, "global_step": 110502, "epoch": 913} {"train_loss": -38.38669204711914, "global_step": 110503, "epoch": 913} {"train_loss": -38.30910110473633, "global_step": 110504, "epoch": 913} {"train_loss": -37.86397171020508, "global_step": 110505, "epoch": 913} {"train_loss": -39.330875396728516, "global_step": 110506, "epoch": 913} {"train_loss": -38.79949951171875, "global_step": 110507, "epoch": 913} {"train_loss": -38.46625900268555, "global_step": 110508, "epoch": 913} {"train_loss": -38.37205505371094, "global_step": 110509, "epoch": 913} {"train_loss": -37.605892181396484, "global_step": 110510, "epoch": 913} {"train_loss": -37.643348693847656, "global_step": 110511, "epoch": 913} {"train_loss": -38.703243255615234, "global_step": 110512, "epoch": 913} {"train_loss": -37.815067291259766, "global_step": 110513, "epoch": 913} {"train_loss": -38.3282585144043, "global_step": 110514, "epoch": 913} {"train_loss": -36.963993072509766, "global_step": 110515, "epoch": 913} {"train_loss": -37.23992919921875, "global_step": 110516, "epoch": 913} {"train_loss": -38.26496124267578, "global_step": 110517, "epoch": 913} {"train_loss": -36.0080680847168, "global_step": 110518, "epoch": 913} {"train_loss": -34.41531753540039, "global_step": 110519, "epoch": 913} {"train_loss": -37.56447219848633, "global_step": 110520, "epoch": 913} {"train_loss": -36.401275634765625, "global_step": 110521, "epoch": 913} {"train_loss": -38.43765640258789, "global_step": 110522, "epoch": 913} {"train_loss": -38.139137268066406, "global_step": 110523, "epoch": 913} {"train_loss": -38.76007843017578, "global_step": 110524, "epoch": 913} {"train_loss": -38.1231803894043, "global_step": 110525, "epoch": 913} {"train_loss": -37.83356857299805, "global_step": 110526, "epoch": 913} {"train_loss": -38.35171127319336, "global_step": 110527, "epoch": 913} {"train_loss": -37.0625114440918, "global_step": 110528, "epoch": 913} {"train_loss": -37.97775650024414, "global_step": 110529, "epoch": 913} {"train_loss": -37.58109664916992, "global_step": 110530, "epoch": 913} {"train_loss": -38.424686431884766, "global_step": 110531, "epoch": 913} {"train_loss": -38.078060150146484, "global_step": 110532, "epoch": 913} {"train_loss": -38.74183654785156, "global_step": 110533, "epoch": 913} {"train_loss": -38.18978500366211, "global_step": 110534, "epoch": 913} {"train_loss": -36.192996978759766, "global_step": 110535, "epoch": 913} {"train_loss": -38.480098724365234, "global_step": 110536, "epoch": 913} {"train_loss": -37.19252395629883, "global_step": 110537, "epoch": 913} {"train_loss": -38.06510543823242, "global_step": 110538, "epoch": 913} {"train_loss": -38.280704498291016, "global_step": 110539, "epoch": 913} {"train_loss": -37.5004997253418, "global_step": 110540, "epoch": 913} {"train_loss": -38.05463790893555, "global_step": 110541, "epoch": 913} {"train_loss": -38.28782653808594, "global_step": 110542, "epoch": 913} {"train_loss": -38.24513244628906, "global_step": 110543, "epoch": 913} {"train_loss": -38.233612060546875, "global_step": 110544, "epoch": 913} {"train_loss": -38.28389358520508, "global_step": 110545, "epoch": 913} {"train_loss": -38.56442642211914, "global_step": 110546, "epoch": 913} {"train_loss": -38.83615493774414, "global_step": 110547, "epoch": 913} {"train_loss": -38.91586685180664, "global_step": 110548, "epoch": 913} {"train_loss": -38.4594841003418, "global_step": 110549, "epoch": 913} {"train_loss": -38.75247573852539, "global_step": 110550, "epoch": 913} {"train_loss": -38.69228744506836, "global_step": 110551, "epoch": 913} {"train_loss": -39.314674377441406, "global_step": 110552, "epoch": 913} {"train_loss": -38.275142669677734, "global_step": 110553, "epoch": 913} {"train_loss": -38.40509796142578, "global_step": 110554, "epoch": 913} {"train_loss": -38.276302337646484, "global_step": 110555, "epoch": 913} {"train_loss": -37.41999435424805, "global_step": 110556, "epoch": 913} {"train_loss": -38.71883773803711, "global_step": 110557, "epoch": 913} {"train_loss": -38.722286224365234, "global_step": 110558, "epoch": 913} {"train_loss": -38.63422393798828, "global_step": 110559, "epoch": 913} {"train_loss": -38.48765182495117, "global_step": 110560, "epoch": 913} {"train_loss": -38.2388801574707, "global_step": 110561, "epoch": 913} {"train_loss": -38.936458587646484, "global_step": 110562, "epoch": 913} {"train_loss": -38.802734375, "global_step": 110563, "epoch": 913} {"train_loss": -38.65394973754883, "global_step": 110564, "epoch": 913} {"train_loss": -38.30682373046875, "global_step": 110565, "epoch": 913} {"train_loss": -39.22329330444336, "global_step": 110566, "epoch": 913} {"train_loss": -39.67192077636719, "global_step": 110567, "epoch": 913} {"train_loss": -39.036720275878906, "global_step": 110568, "epoch": 913} {"train_loss": -38.45989227294922, "global_step": 110569, "epoch": 913} {"train_loss": -38.06096267700195, "global_step": 110570, "epoch": 913} {"train_loss": -39.17023849487305, "global_step": 110571, "epoch": 913} {"train_loss": -38.2299919128418, "global_step": 110572, "epoch": 913} {"train_loss": -37.46821594238281, "global_step": 110573, "epoch": 913} {"train_loss": -37.26395034790039, "global_step": 110574, "epoch": 913} {"train_loss": -36.5921630859375, "global_step": 110575, "epoch": 913} {"train_loss": -34.9827995300293, "global_step": 110576, "epoch": 913} {"train_loss": -32.26841354370117, "global_step": 110577, "epoch": 913} {"train_loss": -32.416133880615234, "global_step": 110578, "epoch": 913} {"train_loss": -35.090423583984375, "global_step": 110579, "epoch": 913} {"train_loss": -37.83563232421875, "global_step": 110580, "epoch": 913} {"train_loss": -36.36280059814453, "global_step": 110581, "epoch": 913} {"train_loss": -30.21565055847168, "global_step": 110582, "epoch": 913} {"train_loss": -36.03602981567383, "global_step": 110583, "epoch": 913} {"train_loss": -37.16363525390625, "global_step": 110584, "epoch": 913} {"train_loss": -31.0368595123291, "global_step": 110585, "epoch": 913} {"train_loss": -37.709651947021484, "global_step": 110586, "epoch": 913} {"train_loss": -32.68207550048828, "global_step": 110587, "epoch": 913} {"train_loss": -36.461063385009766, "global_step": 110588, "epoch": 913} {"train_loss": -34.393550872802734, "global_step": 110589, "epoch": 913} {"train_loss": -35.16538619995117, "global_step": 110590, "epoch": 913} {"train_loss": -36.020179748535156, "global_step": 110591, "epoch": 913} {"train_loss": -35.96156692504883, "global_step": 110592, "epoch": 913} {"train_loss": -37.602289215592315, "global_step": 110593, "epoch": 913, "val_loss": 2652869.25} {"train_loss": -38.46302795410156, "global_step": 110594, "epoch": 914} {"train_loss": -36.584556579589844, "global_step": 110595, "epoch": 914} {"train_loss": -37.14593505859375, "global_step": 110596, "epoch": 914} {"train_loss": -37.101837158203125, "global_step": 110597, "epoch": 914} {"train_loss": -36.58211898803711, "global_step": 110598, "epoch": 914} {"train_loss": -36.89716339111328, "global_step": 110599, "epoch": 914} {"train_loss": -37.7862548828125, "global_step": 110600, "epoch": 914} {"train_loss": -37.25204086303711, "global_step": 110601, "epoch": 914} {"train_loss": -37.60126876831055, "global_step": 110602, "epoch": 914} {"train_loss": -38.42145538330078, "global_step": 110603, "epoch": 914} {"train_loss": -37.808815002441406, "global_step": 110604, "epoch": 914} {"train_loss": -38.18691635131836, "global_step": 110605, "epoch": 914} {"train_loss": -38.16594314575195, "global_step": 110606, "epoch": 914} {"train_loss": -38.18946075439453, "global_step": 110607, "epoch": 914} {"train_loss": -38.31181716918945, "global_step": 110608, "epoch": 914} {"train_loss": -38.193504333496094, "global_step": 110609, "epoch": 914} {"train_loss": -38.35559844970703, "global_step": 110610, "epoch": 914} {"train_loss": -38.32291793823242, "global_step": 110611, "epoch": 914} {"train_loss": -37.93838119506836, "global_step": 110612, "epoch": 914} {"train_loss": -38.632354736328125, "global_step": 110613, "epoch": 914} {"train_loss": -37.775970458984375, "global_step": 110614, "epoch": 914} {"train_loss": -37.821773529052734, "global_step": 110615, "epoch": 914} {"train_loss": -38.36290740966797, "global_step": 110616, "epoch": 914} {"train_loss": -38.266517639160156, "global_step": 110617, "epoch": 914} {"train_loss": -38.831111907958984, "global_step": 110618, "epoch": 914} {"train_loss": -38.63651657104492, "global_step": 110619, "epoch": 914} {"train_loss": -38.060401916503906, "global_step": 110620, "epoch": 914} {"train_loss": -37.35981369018555, "global_step": 110621, "epoch": 914} {"train_loss": -38.97072982788086, "global_step": 110622, "epoch": 914} {"train_loss": -38.37794876098633, "global_step": 110623, "epoch": 914} {"train_loss": -38.232208251953125, "global_step": 110624, "epoch": 914} {"train_loss": -37.87648010253906, "global_step": 110625, "epoch": 914} {"train_loss": -38.6766357421875, "global_step": 110626, "epoch": 914} {"train_loss": -38.812721252441406, "global_step": 110627, "epoch": 914} {"train_loss": -38.86114501953125, "global_step": 110628, "epoch": 914} {"train_loss": -38.93914794921875, "global_step": 110629, "epoch": 914} {"train_loss": -38.567596435546875, "global_step": 110630, "epoch": 914} {"train_loss": -38.8375129699707, "global_step": 110631, "epoch": 914} {"train_loss": -38.832420349121094, "global_step": 110632, "epoch": 914} {"train_loss": -38.27358627319336, "global_step": 110633, "epoch": 914} {"train_loss": -39.08540725708008, "global_step": 110634, "epoch": 914} {"train_loss": -38.32234191894531, "global_step": 110635, "epoch": 914} {"train_loss": -38.01240158081055, "global_step": 110636, "epoch": 914} {"train_loss": -38.96186065673828, "global_step": 110637, "epoch": 914} {"train_loss": -38.71074676513672, "global_step": 110638, "epoch": 914} {"train_loss": -38.060508728027344, "global_step": 110639, "epoch": 914} {"train_loss": -37.932926177978516, "global_step": 110640, "epoch": 914} {"train_loss": -38.876068115234375, "global_step": 110641, "epoch": 914} {"train_loss": -38.94403839111328, "global_step": 110642, "epoch": 914} {"train_loss": -37.57255935668945, "global_step": 110643, "epoch": 914} {"train_loss": -36.329864501953125, "global_step": 110644, "epoch": 914} {"train_loss": -38.01544952392578, "global_step": 110645, "epoch": 914} {"train_loss": -38.76469039916992, "global_step": 110646, "epoch": 914} {"train_loss": -38.7885856628418, "global_step": 110647, "epoch": 914} {"train_loss": -38.71016311645508, "global_step": 110648, "epoch": 914} {"train_loss": -38.734039306640625, "global_step": 110649, "epoch": 914} {"train_loss": -38.3162956237793, "global_step": 110650, "epoch": 914} {"train_loss": -38.051483154296875, "global_step": 110651, "epoch": 914} {"train_loss": -38.483245849609375, "global_step": 110652, "epoch": 914} {"train_loss": -37.47347640991211, "global_step": 110653, "epoch": 914} {"train_loss": -38.69069290161133, "global_step": 110654, "epoch": 914} {"train_loss": -39.04140853881836, "global_step": 110655, "epoch": 914} {"train_loss": -39.225337982177734, "global_step": 110656, "epoch": 914} {"train_loss": -38.88226318359375, "global_step": 110657, "epoch": 914} {"train_loss": -37.99557876586914, "global_step": 110658, "epoch": 914} {"train_loss": -38.16505813598633, "global_step": 110659, "epoch": 914} {"train_loss": -38.3699951171875, "global_step": 110660, "epoch": 914} {"train_loss": -38.53582763671875, "global_step": 110661, "epoch": 914} {"train_loss": -38.12968063354492, "global_step": 110662, "epoch": 914} {"train_loss": -37.06550979614258, "global_step": 110663, "epoch": 914} {"train_loss": -38.43849563598633, "global_step": 110664, "epoch": 914} {"train_loss": -38.64945602416992, "global_step": 110665, "epoch": 914} {"train_loss": -39.29568099975586, "global_step": 110666, "epoch": 914} {"train_loss": -37.33079147338867, "global_step": 110667, "epoch": 914} {"train_loss": -37.53032684326172, "global_step": 110668, "epoch": 914} {"train_loss": -35.138648986816406, "global_step": 110669, "epoch": 914} {"train_loss": -38.00666046142578, "global_step": 110670, "epoch": 914} {"train_loss": -37.130401611328125, "global_step": 110671, "epoch": 914} {"train_loss": -37.16665267944336, "global_step": 110672, "epoch": 914} {"train_loss": -35.98027038574219, "global_step": 110673, "epoch": 914} {"train_loss": -38.25029754638672, "global_step": 110674, "epoch": 914} {"train_loss": -35.85862731933594, "global_step": 110675, "epoch": 914} {"train_loss": -37.98537826538086, "global_step": 110676, "epoch": 914} {"train_loss": -37.349517822265625, "global_step": 110677, "epoch": 914} {"train_loss": -38.35624313354492, "global_step": 110678, "epoch": 914} {"train_loss": -36.27267837524414, "global_step": 110679, "epoch": 914} {"train_loss": -38.52134704589844, "global_step": 110680, "epoch": 914} {"train_loss": -37.86503219604492, "global_step": 110681, "epoch": 914} {"train_loss": -37.329097747802734, "global_step": 110682, "epoch": 914} {"train_loss": -34.83806610107422, "global_step": 110683, "epoch": 914} {"train_loss": -34.296810150146484, "global_step": 110684, "epoch": 914} {"train_loss": -37.781288146972656, "global_step": 110685, "epoch": 914} {"train_loss": -37.37261199951172, "global_step": 110686, "epoch": 914} {"train_loss": -37.102447509765625, "global_step": 110687, "epoch": 914} {"train_loss": -36.99074172973633, "global_step": 110688, "epoch": 914} {"train_loss": -36.79682540893555, "global_step": 110689, "epoch": 914} {"train_loss": -37.5502815246582, "global_step": 110690, "epoch": 914} {"train_loss": -36.4373893737793, "global_step": 110691, "epoch": 914} {"train_loss": -36.3303337097168, "global_step": 110692, "epoch": 914} {"train_loss": -36.54579544067383, "global_step": 110693, "epoch": 914} {"train_loss": -37.01764678955078, "global_step": 110694, "epoch": 914} {"train_loss": -35.38411331176758, "global_step": 110695, "epoch": 914} {"train_loss": -37.30356216430664, "global_step": 110696, "epoch": 914} {"train_loss": -35.89492416381836, "global_step": 110697, "epoch": 914} {"train_loss": -36.57664108276367, "global_step": 110698, "epoch": 914} {"train_loss": -36.667476654052734, "global_step": 110699, "epoch": 914} {"train_loss": -34.833126068115234, "global_step": 110700, "epoch": 914} {"train_loss": -36.63467025756836, "global_step": 110701, "epoch": 914} {"train_loss": -34.564971923828125, "global_step": 110702, "epoch": 914} {"train_loss": -27.939960479736328, "global_step": 110703, "epoch": 914} {"train_loss": -35.83164596557617, "global_step": 110704, "epoch": 914} {"train_loss": -30.831241607666016, "global_step": 110705, "epoch": 914} {"train_loss": -36.26556396484375, "global_step": 110706, "epoch": 914} {"train_loss": -36.73163986206055, "global_step": 110707, "epoch": 914} {"train_loss": -31.997146606445312, "global_step": 110708, "epoch": 914} {"train_loss": -34.57408142089844, "global_step": 110709, "epoch": 914} {"train_loss": -35.976226806640625, "global_step": 110710, "epoch": 914} {"train_loss": -36.10187530517578, "global_step": 110711, "epoch": 914} {"train_loss": -35.1100959777832, "global_step": 110712, "epoch": 914} {"train_loss": -32.24977493286133, "global_step": 110713, "epoch": 914} {"train_loss": -37.37507582104896, "global_step": 110714, "epoch": 914, "val_loss": 2893443.25} {"train_loss": -34.28473663330078, "global_step": 110715, "epoch": 915} {"train_loss": -35.927467346191406, "global_step": 110716, "epoch": 915} {"train_loss": -34.301883697509766, "global_step": 110717, "epoch": 915} {"train_loss": -35.15297317504883, "global_step": 110718, "epoch": 915} {"train_loss": -35.43068313598633, "global_step": 110719, "epoch": 915} {"train_loss": -35.31925964355469, "global_step": 110720, "epoch": 915} {"train_loss": -35.66093063354492, "global_step": 110721, "epoch": 915} {"train_loss": -34.02590560913086, "global_step": 110722, "epoch": 915} {"train_loss": -36.57027053833008, "global_step": 110723, "epoch": 915} {"train_loss": -35.907318115234375, "global_step": 110724, "epoch": 915} {"train_loss": -37.036476135253906, "global_step": 110725, "epoch": 915} {"train_loss": -36.547218322753906, "global_step": 110726, "epoch": 915} {"train_loss": -36.0079231262207, "global_step": 110727, "epoch": 915} {"train_loss": -36.038307189941406, "global_step": 110728, "epoch": 915} {"train_loss": -36.920082092285156, "global_step": 110729, "epoch": 915} {"train_loss": -35.98564529418945, "global_step": 110730, "epoch": 915} {"train_loss": -37.08314514160156, "global_step": 110731, "epoch": 915} {"train_loss": -34.36532211303711, "global_step": 110732, "epoch": 915} {"train_loss": -35.55796432495117, "global_step": 110733, "epoch": 915} {"train_loss": -35.57880783081055, "global_step": 110734, "epoch": 915} {"train_loss": -37.182533264160156, "global_step": 110735, "epoch": 915} {"train_loss": -37.058040618896484, "global_step": 110736, "epoch": 915} {"train_loss": -36.768821716308594, "global_step": 110737, "epoch": 915} {"train_loss": -37.08372497558594, "global_step": 110738, "epoch": 915} {"train_loss": -37.35858154296875, "global_step": 110739, "epoch": 915} {"train_loss": -37.3563232421875, "global_step": 110740, "epoch": 915} {"train_loss": -36.97096633911133, "global_step": 110741, "epoch": 915} {"train_loss": -36.83919906616211, "global_step": 110742, "epoch": 915} {"train_loss": -37.570621490478516, "global_step": 110743, "epoch": 915} {"train_loss": -36.7381477355957, "global_step": 110744, "epoch": 915} {"train_loss": -37.145668029785156, "global_step": 110745, "epoch": 915} {"train_loss": -37.5383186340332, "global_step": 110746, "epoch": 915} {"train_loss": -37.3892822265625, "global_step": 110747, "epoch": 915} {"train_loss": -37.607967376708984, "global_step": 110748, "epoch": 915} {"train_loss": -37.380699157714844, "global_step": 110749, "epoch": 915} {"train_loss": -37.202903747558594, "global_step": 110750, "epoch": 915} {"train_loss": -37.52961349487305, "global_step": 110751, "epoch": 915} {"train_loss": -37.69641876220703, "global_step": 110752, "epoch": 915} {"train_loss": -37.66038131713867, "global_step": 110753, "epoch": 915} {"train_loss": -36.920875549316406, "global_step": 110754, "epoch": 915} {"train_loss": -38.045204162597656, "global_step": 110755, "epoch": 915} {"train_loss": -37.902584075927734, "global_step": 110756, "epoch": 915} {"train_loss": -38.165374755859375, "global_step": 110757, "epoch": 915} {"train_loss": -37.8843994140625, "global_step": 110758, "epoch": 915} {"train_loss": -37.95831298828125, "global_step": 110759, "epoch": 915} {"train_loss": -38.17304611206055, "global_step": 110760, "epoch": 915} {"train_loss": -38.2225456237793, "global_step": 110761, "epoch": 915} {"train_loss": -38.31001663208008, "global_step": 110762, "epoch": 915} {"train_loss": -37.93476486206055, "global_step": 110763, "epoch": 915} {"train_loss": -38.07036209106445, "global_step": 110764, "epoch": 915} {"train_loss": -38.25796127319336, "global_step": 110765, "epoch": 915} {"train_loss": -38.408485412597656, "global_step": 110766, "epoch": 915} {"train_loss": -37.90974426269531, "global_step": 110767, "epoch": 915} {"train_loss": -38.52350997924805, "global_step": 110768, "epoch": 915} {"train_loss": -38.82871627807617, "global_step": 110769, "epoch": 915} {"train_loss": -38.77216339111328, "global_step": 110770, "epoch": 915} {"train_loss": -38.58109664916992, "global_step": 110771, "epoch": 915} {"train_loss": -38.741310119628906, "global_step": 110772, "epoch": 915} {"train_loss": -38.018157958984375, "global_step": 110773, "epoch": 915} {"train_loss": -37.1035270690918, "global_step": 110774, "epoch": 915} {"train_loss": -36.867340087890625, "global_step": 110775, "epoch": 915} {"train_loss": -35.51924514770508, "global_step": 110776, "epoch": 915} {"train_loss": -32.6246337890625, "global_step": 110777, "epoch": 915} {"train_loss": -31.14874839782715, "global_step": 110778, "epoch": 915} {"train_loss": -31.554309844970703, "global_step": 110779, "epoch": 915} {"train_loss": -36.308109283447266, "global_step": 110780, "epoch": 915} {"train_loss": -39.06029510498047, "global_step": 110781, "epoch": 915} {"train_loss": -36.94582748413086, "global_step": 110782, "epoch": 915} {"train_loss": -36.63130187988281, "global_step": 110783, "epoch": 915} {"train_loss": -38.38773727416992, "global_step": 110784, "epoch": 915} {"train_loss": -37.040462493896484, "global_step": 110785, "epoch": 915} {"train_loss": -37.83015060424805, "global_step": 110786, "epoch": 915} {"train_loss": -38.93131637573242, "global_step": 110787, "epoch": 915} {"train_loss": -38.05122756958008, "global_step": 110788, "epoch": 915} {"train_loss": -38.83370590209961, "global_step": 110789, "epoch": 915} {"train_loss": -37.807918548583984, "global_step": 110790, "epoch": 915} {"train_loss": -38.510597229003906, "global_step": 110791, "epoch": 915} {"train_loss": -38.76936340332031, "global_step": 110792, "epoch": 915} {"train_loss": -38.505592346191406, "global_step": 110793, "epoch": 915} {"train_loss": -38.800933837890625, "global_step": 110794, "epoch": 915} {"train_loss": -38.47307205200195, "global_step": 110795, "epoch": 915} {"train_loss": -38.4222526550293, "global_step": 110796, "epoch": 915} {"train_loss": -38.58760452270508, "global_step": 110797, "epoch": 915} {"train_loss": -39.06024169921875, "global_step": 110798, "epoch": 915} {"train_loss": -38.742767333984375, "global_step": 110799, "epoch": 915} {"train_loss": -38.969356536865234, "global_step": 110800, "epoch": 915} {"train_loss": -39.002506256103516, "global_step": 110801, "epoch": 915} {"train_loss": -38.88944625854492, "global_step": 110802, "epoch": 915} {"train_loss": -39.076820373535156, "global_step": 110803, "epoch": 915} {"train_loss": -39.09878921508789, "global_step": 110804, "epoch": 915} {"train_loss": -38.64298629760742, "global_step": 110805, "epoch": 915} {"train_loss": -38.99781799316406, "global_step": 110806, "epoch": 915} {"train_loss": -37.6394157409668, "global_step": 110807, "epoch": 915} {"train_loss": -39.00489044189453, "global_step": 110808, "epoch": 915} {"train_loss": -38.22489929199219, "global_step": 110809, "epoch": 915} {"train_loss": -38.441280364990234, "global_step": 110810, "epoch": 915} {"train_loss": -38.487403869628906, "global_step": 110811, "epoch": 915} {"train_loss": -38.71937942504883, "global_step": 110812, "epoch": 915} {"train_loss": -38.652278900146484, "global_step": 110813, "epoch": 915} {"train_loss": -38.78376388549805, "global_step": 110814, "epoch": 915} {"train_loss": -39.48378372192383, "global_step": 110815, "epoch": 915} {"train_loss": -38.54732894897461, "global_step": 110816, "epoch": 915} {"train_loss": -37.534271240234375, "global_step": 110817, "epoch": 915} {"train_loss": -39.00368118286133, "global_step": 110818, "epoch": 915} {"train_loss": -38.10573959350586, "global_step": 110819, "epoch": 915} {"train_loss": -37.276222229003906, "global_step": 110820, "epoch": 915} {"train_loss": -39.112648010253906, "global_step": 110821, "epoch": 915} {"train_loss": -37.502750396728516, "global_step": 110822, "epoch": 915} {"train_loss": -38.940765380859375, "global_step": 110823, "epoch": 915} {"train_loss": -36.04673385620117, "global_step": 110824, "epoch": 915} {"train_loss": -38.41769027709961, "global_step": 110825, "epoch": 915} {"train_loss": -38.8287353515625, "global_step": 110826, "epoch": 915} {"train_loss": -39.189186096191406, "global_step": 110827, "epoch": 915} {"train_loss": -39.47297668457031, "global_step": 110828, "epoch": 915} {"train_loss": -38.226959228515625, "global_step": 110829, "epoch": 915} {"train_loss": -37.29066848754883, "global_step": 110830, "epoch": 915} {"train_loss": -35.03961944580078, "global_step": 110831, "epoch": 915} {"train_loss": -30.67267417907715, "global_step": 110832, "epoch": 915} {"train_loss": -32.12019729614258, "global_step": 110833, "epoch": 915} {"train_loss": -35.95266342163086, "global_step": 110834, "epoch": 915} {"train_loss": -37.353634668775825, "global_step": 110835, "epoch": 915, "val_loss": 2602231.75} {"train_loss": -35.44169998168945, "global_step": 110836, "epoch": 916} {"train_loss": -36.13398361206055, "global_step": 110837, "epoch": 916} {"train_loss": -37.50320053100586, "global_step": 110838, "epoch": 916} {"train_loss": -38.65138626098633, "global_step": 110839, "epoch": 916} {"train_loss": -38.180171966552734, "global_step": 110840, "epoch": 916} {"train_loss": -38.35502624511719, "global_step": 110841, "epoch": 916} {"train_loss": -38.13009262084961, "global_step": 110842, "epoch": 916} {"train_loss": -38.570457458496094, "global_step": 110843, "epoch": 916} {"train_loss": -38.31690216064453, "global_step": 110844, "epoch": 916} {"train_loss": -39.1881103515625, "global_step": 110845, "epoch": 916} {"train_loss": -37.741615295410156, "global_step": 110846, "epoch": 916} {"train_loss": -38.78806686401367, "global_step": 110847, "epoch": 916} {"train_loss": -38.17360305786133, "global_step": 110848, "epoch": 916} {"train_loss": -39.04937744140625, "global_step": 110849, "epoch": 916} {"train_loss": -38.61044692993164, "global_step": 110850, "epoch": 916} {"train_loss": -39.370540618896484, "global_step": 110851, "epoch": 916} {"train_loss": -38.89604568481445, "global_step": 110852, "epoch": 916} {"train_loss": -38.57900619506836, "global_step": 110853, "epoch": 916} {"train_loss": -39.17325973510742, "global_step": 110854, "epoch": 916} {"train_loss": -38.38261795043945, "global_step": 110855, "epoch": 916} {"train_loss": -39.14711380004883, "global_step": 110856, "epoch": 916} {"train_loss": -38.22616195678711, "global_step": 110857, "epoch": 916} {"train_loss": -37.78274154663086, "global_step": 110858, "epoch": 916} {"train_loss": -39.03165817260742, "global_step": 110859, "epoch": 916} {"train_loss": -37.650238037109375, "global_step": 110860, "epoch": 916} {"train_loss": -34.80683517456055, "global_step": 110861, "epoch": 916} {"train_loss": -37.74680709838867, "global_step": 110862, "epoch": 916} {"train_loss": -36.25141525268555, "global_step": 110863, "epoch": 916} {"train_loss": -38.71935272216797, "global_step": 110864, "epoch": 916} {"train_loss": -37.151485443115234, "global_step": 110865, "epoch": 916} {"train_loss": -38.78973388671875, "global_step": 110866, "epoch": 916} {"train_loss": -38.713043212890625, "global_step": 110867, "epoch": 916} {"train_loss": -38.422279357910156, "global_step": 110868, "epoch": 916} {"train_loss": -38.4197998046875, "global_step": 110869, "epoch": 916} {"train_loss": -38.191993713378906, "global_step": 110870, "epoch": 916} {"train_loss": -38.65436935424805, "global_step": 110871, "epoch": 916} {"train_loss": -38.6998405456543, "global_step": 110872, "epoch": 916} {"train_loss": -38.44541549682617, "global_step": 110873, "epoch": 916} {"train_loss": -38.99866485595703, "global_step": 110874, "epoch": 916} {"train_loss": -38.28181076049805, "global_step": 110875, "epoch": 916} {"train_loss": -38.38582992553711, "global_step": 110876, "epoch": 916} {"train_loss": -39.02946090698242, "global_step": 110877, "epoch": 916} {"train_loss": -33.00869369506836, "global_step": 110878, "epoch": 916} {"train_loss": -39.034542083740234, "global_step": 110879, "epoch": 916} {"train_loss": -38.95652770996094, "global_step": 110880, "epoch": 916} {"train_loss": -38.27005386352539, "global_step": 110881, "epoch": 916} {"train_loss": -38.09852981567383, "global_step": 110882, "epoch": 916} {"train_loss": -35.830013275146484, "global_step": 110883, "epoch": 916} {"train_loss": -18.37259292602539, "global_step": 110884, "epoch": 916} {"train_loss": -35.56950759887695, "global_step": 110885, "epoch": 916} {"train_loss": -33.671939849853516, "global_step": 110886, "epoch": 916} {"train_loss": -34.34921646118164, "global_step": 110887, "epoch": 916} {"train_loss": -20.323076248168945, "global_step": 110888, "epoch": 916} {"train_loss": -34.15299606323242, "global_step": 110889, "epoch": 916} {"train_loss": -34.44837951660156, "global_step": 110890, "epoch": 916} {"train_loss": -29.782825469970703, "global_step": 110891, "epoch": 916} {"train_loss": -30.812902450561523, "global_step": 110892, "epoch": 916} {"train_loss": -32.73611068725586, "global_step": 110893, "epoch": 916} {"train_loss": -35.16011047363281, "global_step": 110894, "epoch": 916} {"train_loss": -31.61785888671875, "global_step": 110895, "epoch": 916} {"train_loss": -30.750568389892578, "global_step": 110896, "epoch": 916} {"train_loss": -31.785507202148438, "global_step": 110897, "epoch": 916} {"train_loss": -33.631160736083984, "global_step": 110898, "epoch": 916} {"train_loss": -33.72111129760742, "global_step": 110899, "epoch": 916} {"train_loss": -33.843441009521484, "global_step": 110900, "epoch": 916} {"train_loss": -33.1795654296875, "global_step": 110901, "epoch": 916} {"train_loss": -35.2672004699707, "global_step": 110902, "epoch": 916} {"train_loss": -35.79188919067383, "global_step": 110903, "epoch": 916} {"train_loss": -36.52962875366211, "global_step": 110904, "epoch": 916} {"train_loss": -35.88124465942383, "global_step": 110905, "epoch": 916} {"train_loss": -35.60236358642578, "global_step": 110906, "epoch": 916} {"train_loss": -32.56368637084961, "global_step": 110907, "epoch": 916} {"train_loss": -35.24613571166992, "global_step": 110908, "epoch": 916} {"train_loss": -35.678955078125, "global_step": 110909, "epoch": 916} {"train_loss": -36.103797912597656, "global_step": 110910, "epoch": 916} {"train_loss": -36.796566009521484, "global_step": 110911, "epoch": 916} {"train_loss": -36.215328216552734, "global_step": 110912, "epoch": 916} {"train_loss": -35.97329330444336, "global_step": 110913, "epoch": 916} {"train_loss": -36.59041213989258, "global_step": 110914, "epoch": 916} {"train_loss": -35.71238327026367, "global_step": 110915, "epoch": 916} {"train_loss": -35.59235763549805, "global_step": 110916, "epoch": 916} {"train_loss": -36.045654296875, "global_step": 110917, "epoch": 916} {"train_loss": -36.02901077270508, "global_step": 110918, "epoch": 916} {"train_loss": -35.79645538330078, "global_step": 110919, "epoch": 916} {"train_loss": -36.18794631958008, "global_step": 110920, "epoch": 916} {"train_loss": -37.24409103393555, "global_step": 110921, "epoch": 916} {"train_loss": -36.19509506225586, "global_step": 110922, "epoch": 916} {"train_loss": -36.80106735229492, "global_step": 110923, "epoch": 916} {"train_loss": -36.74738311767578, "global_step": 110924, "epoch": 916} {"train_loss": -36.882930755615234, "global_step": 110925, "epoch": 916} {"train_loss": -36.99357223510742, "global_step": 110926, "epoch": 916} {"train_loss": -37.392513275146484, "global_step": 110927, "epoch": 916} {"train_loss": -36.93289566040039, "global_step": 110928, "epoch": 916} {"train_loss": -36.723426818847656, "global_step": 110929, "epoch": 916} {"train_loss": -37.28438949584961, "global_step": 110930, "epoch": 916} {"train_loss": -37.19260787963867, "global_step": 110931, "epoch": 916} {"train_loss": -34.992794036865234, "global_step": 110932, "epoch": 916} {"train_loss": -37.029327392578125, "global_step": 110933, "epoch": 916} {"train_loss": -37.65681838989258, "global_step": 110934, "epoch": 916} {"train_loss": -37.289344787597656, "global_step": 110935, "epoch": 916} {"train_loss": -37.71395492553711, "global_step": 110936, "epoch": 916} {"train_loss": -37.41468048095703, "global_step": 110937, "epoch": 916} {"train_loss": -37.0493278503418, "global_step": 110938, "epoch": 916} {"train_loss": -37.525146484375, "global_step": 110939, "epoch": 916} {"train_loss": -37.85712814331055, "global_step": 110940, "epoch": 916} {"train_loss": -37.818275451660156, "global_step": 110941, "epoch": 916} {"train_loss": -38.07522964477539, "global_step": 110942, "epoch": 916} {"train_loss": -37.165443420410156, "global_step": 110943, "epoch": 916} {"train_loss": -37.5467414855957, "global_step": 110944, "epoch": 916} {"train_loss": -38.075069427490234, "global_step": 110945, "epoch": 916} {"train_loss": -38.02775955200195, "global_step": 110946, "epoch": 916} {"train_loss": -38.025306701660156, "global_step": 110947, "epoch": 916} {"train_loss": -38.077392578125, "global_step": 110948, "epoch": 916} {"train_loss": -38.142208099365234, "global_step": 110949, "epoch": 916} {"train_loss": -37.97007751464844, "global_step": 110950, "epoch": 916} {"train_loss": -38.05184555053711, "global_step": 110951, "epoch": 916} {"train_loss": -38.1278076171875, "global_step": 110952, "epoch": 916} {"train_loss": -38.137454986572266, "global_step": 110953, "epoch": 916} {"train_loss": -38.341426849365234, "global_step": 110954, "epoch": 916} {"train_loss": -38.19028091430664, "global_step": 110955, "epoch": 916} {"train_loss": -36.56557764100634, "global_step": 110956, "epoch": 916, "val_loss": 2596097.75} {"train_loss": -38.25053787231445, "global_step": 110957, "epoch": 917} {"train_loss": -38.46781921386719, "global_step": 110958, "epoch": 917} {"train_loss": -38.69318771362305, "global_step": 110959, "epoch": 917} {"train_loss": -38.92572784423828, "global_step": 110960, "epoch": 917} {"train_loss": -38.89931106567383, "global_step": 110961, "epoch": 917} {"train_loss": -38.39119338989258, "global_step": 110962, "epoch": 917} {"train_loss": -38.773250579833984, "global_step": 110963, "epoch": 917} {"train_loss": -38.80867385864258, "global_step": 110964, "epoch": 917} {"train_loss": -39.15805435180664, "global_step": 110965, "epoch": 917} {"train_loss": -38.952396392822266, "global_step": 110966, "epoch": 917} {"train_loss": -38.74618148803711, "global_step": 110967, "epoch": 917} {"train_loss": -38.90421676635742, "global_step": 110968, "epoch": 917} {"train_loss": -38.774383544921875, "global_step": 110969, "epoch": 917} {"train_loss": -39.08300018310547, "global_step": 110970, "epoch": 917} {"train_loss": -38.95458984375, "global_step": 110971, "epoch": 917} {"train_loss": -39.0689697265625, "global_step": 110972, "epoch": 917} {"train_loss": -39.134212493896484, "global_step": 110973, "epoch": 917} {"train_loss": -39.27434158325195, "global_step": 110974, "epoch": 917} {"train_loss": -39.27000045776367, "global_step": 110975, "epoch": 917} {"train_loss": -39.350250244140625, "global_step": 110976, "epoch": 917} {"train_loss": -38.99479675292969, "global_step": 110977, "epoch": 917} {"train_loss": -39.47463607788086, "global_step": 110978, "epoch": 917} {"train_loss": -38.101112365722656, "global_step": 110979, "epoch": 917} {"train_loss": -39.19382858276367, "global_step": 110980, "epoch": 917} {"train_loss": -39.329010009765625, "global_step": 110981, "epoch": 917} {"train_loss": -39.32904815673828, "global_step": 110982, "epoch": 917} {"train_loss": -38.8045539855957, "global_step": 110983, "epoch": 917} {"train_loss": -38.87870407104492, "global_step": 110984, "epoch": 917} {"train_loss": -37.716548919677734, "global_step": 110985, "epoch": 917} {"train_loss": -37.9242057800293, "global_step": 110986, "epoch": 917} {"train_loss": -35.28752136230469, "global_step": 110987, "epoch": 917} {"train_loss": -31.9615535736084, "global_step": 110988, "epoch": 917} {"train_loss": -38.104286193847656, "global_step": 110989, "epoch": 917} {"train_loss": -35.36607360839844, "global_step": 110990, "epoch": 917} {"train_loss": -36.62827682495117, "global_step": 110991, "epoch": 917} {"train_loss": -37.27388381958008, "global_step": 110992, "epoch": 917} {"train_loss": -34.9472770690918, "global_step": 110993, "epoch": 917} {"train_loss": -34.58705520629883, "global_step": 110994, "epoch": 917} {"train_loss": -32.26870346069336, "global_step": 110995, "epoch": 917} {"train_loss": -37.313026428222656, "global_step": 110996, "epoch": 917} {"train_loss": -36.8241081237793, "global_step": 110997, "epoch": 917} {"train_loss": -35.57081985473633, "global_step": 110998, "epoch": 917} {"train_loss": -38.196327209472656, "global_step": 110999, "epoch": 917} {"train_loss": -36.16810607910156, "global_step": 111000, "epoch": 917} {"train_loss": -35.70433807373047, "global_step": 111001, "epoch": 917} {"train_loss": -37.742000579833984, "global_step": 111002, "epoch": 917} {"train_loss": -36.501686096191406, "global_step": 111003, "epoch": 917} {"train_loss": -37.27851486206055, "global_step": 111004, "epoch": 917} {"train_loss": -38.096397399902344, "global_step": 111005, "epoch": 917} {"train_loss": -38.61969757080078, "global_step": 111006, "epoch": 917} {"train_loss": -37.01082229614258, "global_step": 111007, "epoch": 917} {"train_loss": -38.589027404785156, "global_step": 111008, "epoch": 917} {"train_loss": -38.48686599731445, "global_step": 111009, "epoch": 917} {"train_loss": -38.3106575012207, "global_step": 111010, "epoch": 917} {"train_loss": -38.19073486328125, "global_step": 111011, "epoch": 917} {"train_loss": -38.630611419677734, "global_step": 111012, "epoch": 917} {"train_loss": -38.81574630737305, "global_step": 111013, "epoch": 917} {"train_loss": -38.38629913330078, "global_step": 111014, "epoch": 917} {"train_loss": -38.49501037597656, "global_step": 111015, "epoch": 917} {"train_loss": -39.12281036376953, "global_step": 111016, "epoch": 917} {"train_loss": -38.99151611328125, "global_step": 111017, "epoch": 917} {"train_loss": -38.81614303588867, "global_step": 111018, "epoch": 917} {"train_loss": -39.02079391479492, "global_step": 111019, "epoch": 917} {"train_loss": -38.96234893798828, "global_step": 111020, "epoch": 917} {"train_loss": -38.96635055541992, "global_step": 111021, "epoch": 917} {"train_loss": -39.01811599731445, "global_step": 111022, "epoch": 917} {"train_loss": -38.831233978271484, "global_step": 111023, "epoch": 917} {"train_loss": -39.20680618286133, "global_step": 111024, "epoch": 917} {"train_loss": -39.080352783203125, "global_step": 111025, "epoch": 917} {"train_loss": -38.97339630126953, "global_step": 111026, "epoch": 917} {"train_loss": -38.86488723754883, "global_step": 111027, "epoch": 917} {"train_loss": -38.85153579711914, "global_step": 111028, "epoch": 917} {"train_loss": -38.91323471069336, "global_step": 111029, "epoch": 917} {"train_loss": -39.63957214355469, "global_step": 111030, "epoch": 917} {"train_loss": -39.455833435058594, "global_step": 111031, "epoch": 917} {"train_loss": -39.65156173706055, "global_step": 111032, "epoch": 917} {"train_loss": -39.1463508605957, "global_step": 111033, "epoch": 917} {"train_loss": -39.50852584838867, "global_step": 111034, "epoch": 917} {"train_loss": -39.360347747802734, "global_step": 111035, "epoch": 917} {"train_loss": -39.50249099731445, "global_step": 111036, "epoch": 917} {"train_loss": -39.80438995361328, "global_step": 111037, "epoch": 917} {"train_loss": -39.04517364501953, "global_step": 111038, "epoch": 917} {"train_loss": -39.60283279418945, "global_step": 111039, "epoch": 917} {"train_loss": -38.69975662231445, "global_step": 111040, "epoch": 917} {"train_loss": -40.01578140258789, "global_step": 111041, "epoch": 917} {"train_loss": -39.82600021362305, "global_step": 111042, "epoch": 917} {"train_loss": -39.38427734375, "global_step": 111043, "epoch": 917} {"train_loss": -38.72361373901367, "global_step": 111044, "epoch": 917} {"train_loss": -39.39176940917969, "global_step": 111045, "epoch": 917} {"train_loss": -39.15148162841797, "global_step": 111046, "epoch": 917} {"train_loss": -39.34128952026367, "global_step": 111047, "epoch": 917} {"train_loss": -39.01100540161133, "global_step": 111048, "epoch": 917} {"train_loss": -39.18328857421875, "global_step": 111049, "epoch": 917} {"train_loss": -38.8537712097168, "global_step": 111050, "epoch": 917} {"train_loss": -36.84345245361328, "global_step": 111051, "epoch": 917} {"train_loss": -34.054569244384766, "global_step": 111052, "epoch": 917} {"train_loss": -25.283206939697266, "global_step": 111053, "epoch": 917} {"train_loss": -13.304908752441406, "global_step": 111054, "epoch": 917} {"train_loss": -27.350208282470703, "global_step": 111055, "epoch": 917} {"train_loss": -38.9505729675293, "global_step": 111056, "epoch": 917} {"train_loss": -30.975894927978516, "global_step": 111057, "epoch": 917} {"train_loss": -37.29290771484375, "global_step": 111058, "epoch": 917} {"train_loss": -37.071929931640625, "global_step": 111059, "epoch": 917} {"train_loss": -37.55375289916992, "global_step": 111060, "epoch": 917} {"train_loss": -36.872154235839844, "global_step": 111061, "epoch": 917} {"train_loss": -36.76839065551758, "global_step": 111062, "epoch": 917} {"train_loss": -36.29957962036133, "global_step": 111063, "epoch": 917} {"train_loss": -35.72018814086914, "global_step": 111064, "epoch": 917} {"train_loss": -36.89282989501953, "global_step": 111065, "epoch": 917} {"train_loss": -36.379817962646484, "global_step": 111066, "epoch": 917} {"train_loss": -37.8702507019043, "global_step": 111067, "epoch": 917} {"train_loss": -37.47523880004883, "global_step": 111068, "epoch": 917} {"train_loss": -38.11219787597656, "global_step": 111069, "epoch": 917} {"train_loss": -37.15998458862305, "global_step": 111070, "epoch": 917} {"train_loss": -38.28109359741211, "global_step": 111071, "epoch": 917} {"train_loss": -37.96051788330078, "global_step": 111072, "epoch": 917} {"train_loss": -38.897735595703125, "global_step": 111073, "epoch": 917} {"train_loss": -38.40966796875, "global_step": 111074, "epoch": 917} {"train_loss": -39.10097885131836, "global_step": 111075, "epoch": 917} {"train_loss": -38.81010055541992, "global_step": 111076, "epoch": 917} {"train_loss": -37.73154312322948, "global_step": 111077, "epoch": 917, "val_loss": 2607854.0} {"train_loss": -38.433841705322266, "global_step": 111078, "epoch": 918} {"train_loss": -39.07253646850586, "global_step": 111079, "epoch": 918} {"train_loss": -39.0007209777832, "global_step": 111080, "epoch": 918} {"train_loss": -38.58669662475586, "global_step": 111081, "epoch": 918} {"train_loss": -39.60532760620117, "global_step": 111082, "epoch": 918} {"train_loss": -39.392608642578125, "global_step": 111083, "epoch": 918} {"train_loss": -38.97832489013672, "global_step": 111084, "epoch": 918} {"train_loss": -39.264034271240234, "global_step": 111085, "epoch": 918} {"train_loss": -39.017486572265625, "global_step": 111086, "epoch": 918} {"train_loss": -39.396759033203125, "global_step": 111087, "epoch": 918} {"train_loss": -39.2093391418457, "global_step": 111088, "epoch": 918} {"train_loss": -39.137447357177734, "global_step": 111089, "epoch": 918} {"train_loss": -39.29377365112305, "global_step": 111090, "epoch": 918} {"train_loss": -39.30447006225586, "global_step": 111091, "epoch": 918} {"train_loss": -39.15717315673828, "global_step": 111092, "epoch": 918} {"train_loss": -39.496612548828125, "global_step": 111093, "epoch": 918} {"train_loss": -39.69107437133789, "global_step": 111094, "epoch": 918} {"train_loss": -39.825294494628906, "global_step": 111095, "epoch": 918} {"train_loss": -39.59507369995117, "global_step": 111096, "epoch": 918} {"train_loss": -39.44493865966797, "global_step": 111097, "epoch": 918} {"train_loss": -39.847267150878906, "global_step": 111098, "epoch": 918} {"train_loss": -40.00564193725586, "global_step": 111099, "epoch": 918} {"train_loss": -39.795284271240234, "global_step": 111100, "epoch": 918} {"train_loss": -39.49079132080078, "global_step": 111101, "epoch": 918} {"train_loss": -40.25543975830078, "global_step": 111102, "epoch": 918} {"train_loss": -39.60329818725586, "global_step": 111103, "epoch": 918} {"train_loss": -39.79570388793945, "global_step": 111104, "epoch": 918} {"train_loss": -39.91514587402344, "global_step": 111105, "epoch": 918} {"train_loss": -39.91332244873047, "global_step": 111106, "epoch": 918} {"train_loss": -40.10769271850586, "global_step": 111107, "epoch": 918} {"train_loss": -39.421180725097656, "global_step": 111108, "epoch": 918} {"train_loss": -39.58154296875, "global_step": 111109, "epoch": 918} {"train_loss": -38.43353271484375, "global_step": 111110, "epoch": 918} {"train_loss": -33.361881256103516, "global_step": 111111, "epoch": 918} {"train_loss": -19.974699020385742, "global_step": 111112, "epoch": 918} {"train_loss": -1.4404668807983398, "global_step": 111113, "epoch": 918} {"train_loss": -1.373559832572937, "global_step": 111114, "epoch": 918} {"train_loss": -26.376800537109375, "global_step": 111115, "epoch": 918} {"train_loss": -32.55259323120117, "global_step": 111116, "epoch": 918} {"train_loss": -23.783567428588867, "global_step": 111117, "epoch": 918} {"train_loss": -31.83503532409668, "global_step": 111118, "epoch": 918} {"train_loss": -31.294775009155273, "global_step": 111119, "epoch": 918} {"train_loss": -32.70900344848633, "global_step": 111120, "epoch": 918} {"train_loss": -30.157806396484375, "global_step": 111121, "epoch": 918} {"train_loss": -34.262386322021484, "global_step": 111122, "epoch": 918} {"train_loss": -30.514789581298828, "global_step": 111123, "epoch": 918} {"train_loss": -35.97534942626953, "global_step": 111124, "epoch": 918} {"train_loss": -33.25242233276367, "global_step": 111125, "epoch": 918} {"train_loss": -35.05851364135742, "global_step": 111126, "epoch": 918} {"train_loss": -35.62055587768555, "global_step": 111127, "epoch": 918} {"train_loss": -34.49553298950195, "global_step": 111128, "epoch": 918} {"train_loss": -35.1024055480957, "global_step": 111129, "epoch": 918} {"train_loss": -35.86880111694336, "global_step": 111130, "epoch": 918} {"train_loss": -36.08554458618164, "global_step": 111131, "epoch": 918} {"train_loss": -36.403804779052734, "global_step": 111132, "epoch": 918} {"train_loss": -35.87333297729492, "global_step": 111133, "epoch": 918} {"train_loss": -36.662166595458984, "global_step": 111134, "epoch": 918} {"train_loss": -36.66606903076172, "global_step": 111135, "epoch": 918} {"train_loss": -36.73307418823242, "global_step": 111136, "epoch": 918} {"train_loss": -37.10166549682617, "global_step": 111137, "epoch": 918} {"train_loss": -36.98505401611328, "global_step": 111138, "epoch": 918} {"train_loss": -36.686431884765625, "global_step": 111139, "epoch": 918} {"train_loss": -37.258087158203125, "global_step": 111140, "epoch": 918} {"train_loss": -37.1912727355957, "global_step": 111141, "epoch": 918} {"train_loss": -36.85271072387695, "global_step": 111142, "epoch": 918} {"train_loss": -37.362220764160156, "global_step": 111143, "epoch": 918} {"train_loss": -37.71499252319336, "global_step": 111144, "epoch": 918} {"train_loss": -37.134586334228516, "global_step": 111145, "epoch": 918} {"train_loss": -37.24964141845703, "global_step": 111146, "epoch": 918} {"train_loss": -37.874691009521484, "global_step": 111147, "epoch": 918} {"train_loss": -37.646728515625, "global_step": 111148, "epoch": 918} {"train_loss": -37.64784622192383, "global_step": 111149, "epoch": 918} {"train_loss": -37.493587493896484, "global_step": 111150, "epoch": 918} {"train_loss": -37.678524017333984, "global_step": 111151, "epoch": 918} {"train_loss": -37.987579345703125, "global_step": 111152, "epoch": 918} {"train_loss": -38.0472297668457, "global_step": 111153, "epoch": 918} {"train_loss": -37.78663635253906, "global_step": 111154, "epoch": 918} {"train_loss": -38.13180923461914, "global_step": 111155, "epoch": 918} {"train_loss": -38.03953552246094, "global_step": 111156, "epoch": 918} {"train_loss": -38.117584228515625, "global_step": 111157, "epoch": 918} {"train_loss": -38.16837692260742, "global_step": 111158, "epoch": 918} {"train_loss": -38.01849365234375, "global_step": 111159, "epoch": 918} {"train_loss": -37.9317741394043, "global_step": 111160, "epoch": 918} {"train_loss": -38.04377365112305, "global_step": 111161, "epoch": 918} {"train_loss": -38.031349182128906, "global_step": 111162, "epoch": 918} {"train_loss": -38.17668914794922, "global_step": 111163, "epoch": 918} {"train_loss": -38.04154968261719, "global_step": 111164, "epoch": 918} {"train_loss": -38.276363372802734, "global_step": 111165, "epoch": 918} {"train_loss": -38.225685119628906, "global_step": 111166, "epoch": 918} {"train_loss": -38.56146240234375, "global_step": 111167, "epoch": 918} {"train_loss": -38.38218688964844, "global_step": 111168, "epoch": 918} {"train_loss": -38.7527961730957, "global_step": 111169, "epoch": 918} {"train_loss": -38.54841613769531, "global_step": 111170, "epoch": 918} {"train_loss": -38.313411712646484, "global_step": 111171, "epoch": 918} {"train_loss": -38.670223236083984, "global_step": 111172, "epoch": 918} {"train_loss": -38.73271179199219, "global_step": 111173, "epoch": 918} {"train_loss": -38.52772903442383, "global_step": 111174, "epoch": 918} {"train_loss": -38.700801849365234, "global_step": 111175, "epoch": 918} {"train_loss": -38.9560661315918, "global_step": 111176, "epoch": 918} {"train_loss": -38.66093826293945, "global_step": 111177, "epoch": 918} {"train_loss": -39.05100631713867, "global_step": 111178, "epoch": 918} {"train_loss": -38.7952995300293, "global_step": 111179, "epoch": 918} {"train_loss": -39.032752990722656, "global_step": 111180, "epoch": 918} {"train_loss": -38.91545486450195, "global_step": 111181, "epoch": 918} {"train_loss": -38.953067779541016, "global_step": 111182, "epoch": 918} {"train_loss": -39.069332122802734, "global_step": 111183, "epoch": 918} {"train_loss": -39.312843322753906, "global_step": 111184, "epoch": 918} {"train_loss": -39.10208511352539, "global_step": 111185, "epoch": 918} {"train_loss": -39.08528518676758, "global_step": 111186, "epoch": 918} {"train_loss": -39.13759994506836, "global_step": 111187, "epoch": 918} {"train_loss": -39.416236877441406, "global_step": 111188, "epoch": 918} {"train_loss": -39.29205322265625, "global_step": 111189, "epoch": 918} {"train_loss": -38.739295959472656, "global_step": 111190, "epoch": 918} {"train_loss": -39.14980697631836, "global_step": 111191, "epoch": 918} {"train_loss": -39.36434555053711, "global_step": 111192, "epoch": 918} {"train_loss": -39.29777908325195, "global_step": 111193, "epoch": 918} {"train_loss": -39.2373161315918, "global_step": 111194, "epoch": 918} {"train_loss": -39.526885986328125, "global_step": 111195, "epoch": 918} {"train_loss": -39.28238296508789, "global_step": 111196, "epoch": 918} {"train_loss": -39.32619857788086, "global_step": 111197, "epoch": 918} {"train_loss": -36.96561568138028, "global_step": 111198, "epoch": 918, "val_loss": 2592368.0} {"train_loss": -39.43363571166992, "global_step": 111199, "epoch": 919} {"train_loss": -39.619529724121094, "global_step": 111200, "epoch": 919} {"train_loss": -39.715553283691406, "global_step": 111201, "epoch": 919} {"train_loss": -39.7791862487793, "global_step": 111202, "epoch": 919} {"train_loss": -39.72462844848633, "global_step": 111203, "epoch": 919} {"train_loss": -40.01206588745117, "global_step": 111204, "epoch": 919} {"train_loss": -39.68751907348633, "global_step": 111205, "epoch": 919} {"train_loss": -39.314239501953125, "global_step": 111206, "epoch": 919} {"train_loss": -38.14677429199219, "global_step": 111207, "epoch": 919} {"train_loss": -36.36961364746094, "global_step": 111208, "epoch": 919} {"train_loss": -29.15717887878418, "global_step": 111209, "epoch": 919} {"train_loss": -24.554676055908203, "global_step": 111210, "epoch": 919} {"train_loss": -21.680219650268555, "global_step": 111211, "epoch": 919} {"train_loss": -25.719318389892578, "global_step": 111212, "epoch": 919} {"train_loss": -36.83415603637695, "global_step": 111213, "epoch": 919} {"train_loss": -31.765100479125977, "global_step": 111214, "epoch": 919} {"train_loss": -32.925167083740234, "global_step": 111215, "epoch": 919} {"train_loss": -36.78882598876953, "global_step": 111216, "epoch": 919} {"train_loss": -32.98334884643555, "global_step": 111217, "epoch": 919} {"train_loss": -37.04180145263672, "global_step": 111218, "epoch": 919} {"train_loss": -34.1710205078125, "global_step": 111219, "epoch": 919} {"train_loss": -37.83991241455078, "global_step": 111220, "epoch": 919} {"train_loss": -37.149837493896484, "global_step": 111221, "epoch": 919} {"train_loss": -37.072261810302734, "global_step": 111222, "epoch": 919} {"train_loss": -38.08181381225586, "global_step": 111223, "epoch": 919} {"train_loss": -36.10586166381836, "global_step": 111224, "epoch": 919} {"train_loss": -37.44921875, "global_step": 111225, "epoch": 919} {"train_loss": -37.77993392944336, "global_step": 111226, "epoch": 919} {"train_loss": -37.679405212402344, "global_step": 111227, "epoch": 919} {"train_loss": -38.58268356323242, "global_step": 111228, "epoch": 919} {"train_loss": -37.939414978027344, "global_step": 111229, "epoch": 919} {"train_loss": -38.029624938964844, "global_step": 111230, "epoch": 919} {"train_loss": -38.4449577331543, "global_step": 111231, "epoch": 919} {"train_loss": -38.13715362548828, "global_step": 111232, "epoch": 919} {"train_loss": -38.210357666015625, "global_step": 111233, "epoch": 919} {"train_loss": -38.47235870361328, "global_step": 111234, "epoch": 919} {"train_loss": -38.655330657958984, "global_step": 111235, "epoch": 919} {"train_loss": -38.44846725463867, "global_step": 111236, "epoch": 919} {"train_loss": -39.13665771484375, "global_step": 111237, "epoch": 919} {"train_loss": -37.7292366027832, "global_step": 111238, "epoch": 919} {"train_loss": -38.67854309082031, "global_step": 111239, "epoch": 919} {"train_loss": -38.26031494140625, "global_step": 111240, "epoch": 919} {"train_loss": -38.21260452270508, "global_step": 111241, "epoch": 919} {"train_loss": -38.73037338256836, "global_step": 111242, "epoch": 919} {"train_loss": -38.4764518737793, "global_step": 111243, "epoch": 919} {"train_loss": -38.910091400146484, "global_step": 111244, "epoch": 919} {"train_loss": -38.850643157958984, "global_step": 111245, "epoch": 919} {"train_loss": -39.00720977783203, "global_step": 111246, "epoch": 919} {"train_loss": -38.133644104003906, "global_step": 111247, "epoch": 919} {"train_loss": -38.89389419555664, "global_step": 111248, "epoch": 919} {"train_loss": -38.512939453125, "global_step": 111249, "epoch": 919} {"train_loss": -39.08842849731445, "global_step": 111250, "epoch": 919} {"train_loss": -38.60406494140625, "global_step": 111251, "epoch": 919} {"train_loss": -38.39512252807617, "global_step": 111252, "epoch": 919} {"train_loss": -38.633270263671875, "global_step": 111253, "epoch": 919} {"train_loss": -38.87761306762695, "global_step": 111254, "epoch": 919} {"train_loss": -38.39313888549805, "global_step": 111255, "epoch": 919} {"train_loss": -39.387813568115234, "global_step": 111256, "epoch": 919} {"train_loss": -39.198524475097656, "global_step": 111257, "epoch": 919} {"train_loss": -38.55184555053711, "global_step": 111258, "epoch": 919} {"train_loss": -38.885372161865234, "global_step": 111259, "epoch": 919} {"train_loss": -39.24072265625, "global_step": 111260, "epoch": 919} {"train_loss": -39.244197845458984, "global_step": 111261, "epoch": 919} {"train_loss": -39.089881896972656, "global_step": 111262, "epoch": 919} {"train_loss": -39.26078414916992, "global_step": 111263, "epoch": 919} {"train_loss": -38.9187126159668, "global_step": 111264, "epoch": 919} {"train_loss": -39.30882263183594, "global_step": 111265, "epoch": 919} {"train_loss": -38.844486236572266, "global_step": 111266, "epoch": 919} {"train_loss": -39.17499542236328, "global_step": 111267, "epoch": 919} {"train_loss": -38.572998046875, "global_step": 111268, "epoch": 919} {"train_loss": -39.48384094238281, "global_step": 111269, "epoch": 919} {"train_loss": -38.737850189208984, "global_step": 111270, "epoch": 919} {"train_loss": -39.2072639465332, "global_step": 111271, "epoch": 919} {"train_loss": -38.79875946044922, "global_step": 111272, "epoch": 919} {"train_loss": -38.9069709777832, "global_step": 111273, "epoch": 919} {"train_loss": -39.140174865722656, "global_step": 111274, "epoch": 919} {"train_loss": -39.167903900146484, "global_step": 111275, "epoch": 919} {"train_loss": -39.31032180786133, "global_step": 111276, "epoch": 919} {"train_loss": -38.98965072631836, "global_step": 111277, "epoch": 919} {"train_loss": -38.992977142333984, "global_step": 111278, "epoch": 919} {"train_loss": -39.06241989135742, "global_step": 111279, "epoch": 919} {"train_loss": -39.572418212890625, "global_step": 111280, "epoch": 919} {"train_loss": -39.6416015625, "global_step": 111281, "epoch": 919} {"train_loss": -39.02054977416992, "global_step": 111282, "epoch": 919} {"train_loss": -38.05485153198242, "global_step": 111283, "epoch": 919} {"train_loss": -39.14302444458008, "global_step": 111284, "epoch": 919} {"train_loss": -39.45235824584961, "global_step": 111285, "epoch": 919} {"train_loss": -39.84084701538086, "global_step": 111286, "epoch": 919} {"train_loss": -39.1751823425293, "global_step": 111287, "epoch": 919} {"train_loss": -39.096649169921875, "global_step": 111288, "epoch": 919} {"train_loss": -39.33988571166992, "global_step": 111289, "epoch": 919} {"train_loss": -39.01462936401367, "global_step": 111290, "epoch": 919} {"train_loss": -38.40456008911133, "global_step": 111291, "epoch": 919} {"train_loss": -38.88130569458008, "global_step": 111292, "epoch": 919} {"train_loss": -38.91716003417969, "global_step": 111293, "epoch": 919} {"train_loss": -39.29934310913086, "global_step": 111294, "epoch": 919} {"train_loss": -38.78474426269531, "global_step": 111295, "epoch": 919} {"train_loss": -39.24814987182617, "global_step": 111296, "epoch": 919} {"train_loss": -39.3713493347168, "global_step": 111297, "epoch": 919} {"train_loss": -39.1319580078125, "global_step": 111298, "epoch": 919} {"train_loss": -39.3200569152832, "global_step": 111299, "epoch": 919} {"train_loss": -38.299720764160156, "global_step": 111300, "epoch": 919} {"train_loss": -39.18782424926758, "global_step": 111301, "epoch": 919} {"train_loss": -39.62464904785156, "global_step": 111302, "epoch": 919} {"train_loss": -39.0808219909668, "global_step": 111303, "epoch": 919} {"train_loss": -39.93513870239258, "global_step": 111304, "epoch": 919} {"train_loss": -39.3513069152832, "global_step": 111305, "epoch": 919} {"train_loss": -39.331111907958984, "global_step": 111306, "epoch": 919} {"train_loss": -38.71544647216797, "global_step": 111307, "epoch": 919} {"train_loss": -39.0131721496582, "global_step": 111308, "epoch": 919} {"train_loss": -38.87207794189453, "global_step": 111309, "epoch": 919} {"train_loss": -38.53173828125, "global_step": 111310, "epoch": 919} {"train_loss": -39.083152770996094, "global_step": 111311, "epoch": 919} {"train_loss": -38.4267578125, "global_step": 111312, "epoch": 919} {"train_loss": -38.39341354370117, "global_step": 111313, "epoch": 919} {"train_loss": -35.316097259521484, "global_step": 111314, "epoch": 919} {"train_loss": -37.20580291748047, "global_step": 111315, "epoch": 919} {"train_loss": -37.382965087890625, "global_step": 111316, "epoch": 919} {"train_loss": -38.45859909057617, "global_step": 111317, "epoch": 919} {"train_loss": -38.412288665771484, "global_step": 111318, "epoch": 919} {"train_loss": -38.05198639483491, "global_step": 111319, "epoch": 919, "val_loss": 2719640.25} {"train_loss": -37.86012268066406, "global_step": 111320, "epoch": 920} {"train_loss": -38.28528594970703, "global_step": 111321, "epoch": 920} {"train_loss": -37.333797454833984, "global_step": 111322, "epoch": 920} {"train_loss": -36.93181228637695, "global_step": 111323, "epoch": 920} {"train_loss": -37.13714599609375, "global_step": 111324, "epoch": 920} {"train_loss": -37.536014556884766, "global_step": 111325, "epoch": 920} {"train_loss": -36.1274528503418, "global_step": 111326, "epoch": 920} {"train_loss": -35.9467887878418, "global_step": 111327, "epoch": 920} {"train_loss": -39.03300857543945, "global_step": 111328, "epoch": 920} {"train_loss": -36.1390266418457, "global_step": 111329, "epoch": 920} {"train_loss": -36.1791877746582, "global_step": 111330, "epoch": 920} {"train_loss": -36.810630798339844, "global_step": 111331, "epoch": 920} {"train_loss": -36.40256881713867, "global_step": 111332, "epoch": 920} {"train_loss": -38.118804931640625, "global_step": 111333, "epoch": 920} {"train_loss": -34.06716537475586, "global_step": 111334, "epoch": 920} {"train_loss": -37.23921203613281, "global_step": 111335, "epoch": 920} {"train_loss": -36.604652404785156, "global_step": 111336, "epoch": 920} {"train_loss": -37.42658233642578, "global_step": 111337, "epoch": 920} {"train_loss": -37.04835510253906, "global_step": 111338, "epoch": 920} {"train_loss": -38.54142379760742, "global_step": 111339, "epoch": 920} {"train_loss": -37.66618728637695, "global_step": 111340, "epoch": 920} {"train_loss": -38.08005905151367, "global_step": 111341, "epoch": 920} {"train_loss": -37.78208541870117, "global_step": 111342, "epoch": 920} {"train_loss": -36.45534896850586, "global_step": 111343, "epoch": 920} {"train_loss": -39.351417541503906, "global_step": 111344, "epoch": 920} {"train_loss": -35.03517532348633, "global_step": 111345, "epoch": 920} {"train_loss": -38.05794143676758, "global_step": 111346, "epoch": 920} {"train_loss": -37.9459342956543, "global_step": 111347, "epoch": 920} {"train_loss": -39.09578323364258, "global_step": 111348, "epoch": 920} {"train_loss": -36.86240768432617, "global_step": 111349, "epoch": 920} {"train_loss": -37.70657730102539, "global_step": 111350, "epoch": 920} {"train_loss": -37.44394302368164, "global_step": 111351, "epoch": 920} {"train_loss": -36.508323669433594, "global_step": 111352, "epoch": 920} {"train_loss": -38.4333381652832, "global_step": 111353, "epoch": 920} {"train_loss": -37.46388626098633, "global_step": 111354, "epoch": 920} {"train_loss": -38.77518844604492, "global_step": 111355, "epoch": 920} {"train_loss": -38.78489685058594, "global_step": 111356, "epoch": 920} {"train_loss": -38.7363166809082, "global_step": 111357, "epoch": 920} {"train_loss": -38.81608200073242, "global_step": 111358, "epoch": 920} {"train_loss": -38.83760070800781, "global_step": 111359, "epoch": 920} {"train_loss": -38.81650161743164, "global_step": 111360, "epoch": 920} {"train_loss": -39.03818893432617, "global_step": 111361, "epoch": 920} {"train_loss": -38.346797943115234, "global_step": 111362, "epoch": 920} {"train_loss": -39.1375846862793, "global_step": 111363, "epoch": 920} {"train_loss": -39.426673889160156, "global_step": 111364, "epoch": 920} {"train_loss": -38.952877044677734, "global_step": 111365, "epoch": 920} {"train_loss": -39.45293045043945, "global_step": 111366, "epoch": 920} {"train_loss": -38.77769088745117, "global_step": 111367, "epoch": 920} {"train_loss": -39.24959945678711, "global_step": 111368, "epoch": 920} {"train_loss": -39.4971809387207, "global_step": 111369, "epoch": 920} {"train_loss": -39.00773239135742, "global_step": 111370, "epoch": 920} {"train_loss": -38.65404510498047, "global_step": 111371, "epoch": 920} {"train_loss": -39.34634017944336, "global_step": 111372, "epoch": 920} {"train_loss": -39.3696174621582, "global_step": 111373, "epoch": 920} {"train_loss": -39.84446334838867, "global_step": 111374, "epoch": 920} {"train_loss": -39.848907470703125, "global_step": 111375, "epoch": 920} {"train_loss": -39.70473098754883, "global_step": 111376, "epoch": 920} {"train_loss": -39.83048629760742, "global_step": 111377, "epoch": 920} {"train_loss": -39.416053771972656, "global_step": 111378, "epoch": 920} {"train_loss": -39.822425842285156, "global_step": 111379, "epoch": 920} {"train_loss": -39.59389877319336, "global_step": 111380, "epoch": 920} {"train_loss": -40.07362747192383, "global_step": 111381, "epoch": 920} {"train_loss": -39.54798126220703, "global_step": 111382, "epoch": 920} {"train_loss": -39.95274353027344, "global_step": 111383, "epoch": 920} {"train_loss": -39.743526458740234, "global_step": 111384, "epoch": 920} {"train_loss": -39.85816192626953, "global_step": 111385, "epoch": 920} {"train_loss": -39.331825256347656, "global_step": 111386, "epoch": 920} {"train_loss": -39.009151458740234, "global_step": 111387, "epoch": 920} {"train_loss": -39.53336715698242, "global_step": 111388, "epoch": 920} {"train_loss": -39.97048568725586, "global_step": 111389, "epoch": 920} {"train_loss": -39.47734832763672, "global_step": 111390, "epoch": 920} {"train_loss": -40.27053451538086, "global_step": 111391, "epoch": 920} {"train_loss": -39.994384765625, "global_step": 111392, "epoch": 920} {"train_loss": -40.058082580566406, "global_step": 111393, "epoch": 920} {"train_loss": -40.13856506347656, "global_step": 111394, "epoch": 920} {"train_loss": -40.394386291503906, "global_step": 111395, "epoch": 920} {"train_loss": -40.266361236572266, "global_step": 111396, "epoch": 920} {"train_loss": -40.12644577026367, "global_step": 111397, "epoch": 920} {"train_loss": -40.01434326171875, "global_step": 111398, "epoch": 920} {"train_loss": -40.08417510986328, "global_step": 111399, "epoch": 920} {"train_loss": -40.02724075317383, "global_step": 111400, "epoch": 920} {"train_loss": -40.20490646362305, "global_step": 111401, "epoch": 920} {"train_loss": -40.53644943237305, "global_step": 111402, "epoch": 920} {"train_loss": -40.06697082519531, "global_step": 111403, "epoch": 920} {"train_loss": -40.40116500854492, "global_step": 111404, "epoch": 920} {"train_loss": -40.32978439331055, "global_step": 111405, "epoch": 920} {"train_loss": -40.320465087890625, "global_step": 111406, "epoch": 920} {"train_loss": -40.441036224365234, "global_step": 111407, "epoch": 920} {"train_loss": -40.211795806884766, "global_step": 111408, "epoch": 920} {"train_loss": -40.27909469604492, "global_step": 111409, "epoch": 920} {"train_loss": -40.59565734863281, "global_step": 111410, "epoch": 920} {"train_loss": -40.73444747924805, "global_step": 111411, "epoch": 920} {"train_loss": -40.37006378173828, "global_step": 111412, "epoch": 920} {"train_loss": -40.46531295776367, "global_step": 111413, "epoch": 920} {"train_loss": -39.70754623413086, "global_step": 111414, "epoch": 920} {"train_loss": -39.45509719848633, "global_step": 111415, "epoch": 920} {"train_loss": -39.72757339477539, "global_step": 111416, "epoch": 920} {"train_loss": -40.02927780151367, "global_step": 111417, "epoch": 920} {"train_loss": -40.4791259765625, "global_step": 111418, "epoch": 920} {"train_loss": -40.342830657958984, "global_step": 111419, "epoch": 920} {"train_loss": -38.8139533996582, "global_step": 111420, "epoch": 920} {"train_loss": -37.22074508666992, "global_step": 111421, "epoch": 920} {"train_loss": -38.602317810058594, "global_step": 111422, "epoch": 920} {"train_loss": -36.074337005615234, "global_step": 111423, "epoch": 920} {"train_loss": -32.38569641113281, "global_step": 111424, "epoch": 920} {"train_loss": -38.71509552001953, "global_step": 111425, "epoch": 920} {"train_loss": -25.929767608642578, "global_step": 111426, "epoch": 920} {"train_loss": -35.83565139770508, "global_step": 111427, "epoch": 920} {"train_loss": -34.14979553222656, "global_step": 111428, "epoch": 920} {"train_loss": -15.153360366821289, "global_step": 111429, "epoch": 920} {"train_loss": -25.60898208618164, "global_step": 111430, "epoch": 920} {"train_loss": -33.46884536743164, "global_step": 111431, "epoch": 920} {"train_loss": -32.61417770385742, "global_step": 111432, "epoch": 920} {"train_loss": -33.53032302856445, "global_step": 111433, "epoch": 920} {"train_loss": -33.569026947021484, "global_step": 111434, "epoch": 920} {"train_loss": -33.81742858886719, "global_step": 111435, "epoch": 920} {"train_loss": -35.13589096069336, "global_step": 111436, "epoch": 920} {"train_loss": -32.99306869506836, "global_step": 111437, "epoch": 920} {"train_loss": -36.491451263427734, "global_step": 111438, "epoch": 920} {"train_loss": -34.956974029541016, "global_step": 111439, "epoch": 920} {"train_loss": -37.91265936922436, "global_step": 111440, "epoch": 920, "val_loss": 2570130.25} {"train_loss": -36.7935905456543, "global_step": 111441, "epoch": 921} {"train_loss": -35.65217208862305, "global_step": 111442, "epoch": 921} {"train_loss": -37.40117263793945, "global_step": 111443, "epoch": 921} {"train_loss": -36.13650131225586, "global_step": 111444, "epoch": 921} {"train_loss": -37.61546325683594, "global_step": 111445, "epoch": 921} {"train_loss": -36.88642120361328, "global_step": 111446, "epoch": 921} {"train_loss": -36.84406661987305, "global_step": 111447, "epoch": 921} {"train_loss": -37.93578338623047, "global_step": 111448, "epoch": 921} {"train_loss": -37.10129928588867, "global_step": 111449, "epoch": 921} {"train_loss": -36.97268295288086, "global_step": 111450, "epoch": 921} {"train_loss": -38.10833740234375, "global_step": 111451, "epoch": 921} {"train_loss": -36.95594787597656, "global_step": 111452, "epoch": 921} {"train_loss": -38.19685363769531, "global_step": 111453, "epoch": 921} {"train_loss": -37.68659591674805, "global_step": 111454, "epoch": 921} {"train_loss": -37.91923141479492, "global_step": 111455, "epoch": 921} {"train_loss": -38.41857147216797, "global_step": 111456, "epoch": 921} {"train_loss": -37.8564338684082, "global_step": 111457, "epoch": 921} {"train_loss": -38.17049026489258, "global_step": 111458, "epoch": 921} {"train_loss": -38.43742752075195, "global_step": 111459, "epoch": 921} {"train_loss": -38.354034423828125, "global_step": 111460, "epoch": 921} {"train_loss": -38.67654037475586, "global_step": 111461, "epoch": 921} {"train_loss": -38.84888458251953, "global_step": 111462, "epoch": 921} {"train_loss": -37.882511138916016, "global_step": 111463, "epoch": 921} {"train_loss": -38.6123161315918, "global_step": 111464, "epoch": 921} {"train_loss": -38.7962760925293, "global_step": 111465, "epoch": 921} {"train_loss": -38.63889694213867, "global_step": 111466, "epoch": 921} {"train_loss": -38.87394332885742, "global_step": 111467, "epoch": 921} {"train_loss": -38.923030853271484, "global_step": 111468, "epoch": 921} {"train_loss": -38.801918029785156, "global_step": 111469, "epoch": 921} {"train_loss": -38.8883056640625, "global_step": 111470, "epoch": 921} {"train_loss": -38.981689453125, "global_step": 111471, "epoch": 921} {"train_loss": -38.89836120605469, "global_step": 111472, "epoch": 921} {"train_loss": -38.83944320678711, "global_step": 111473, "epoch": 921} {"train_loss": -38.99953079223633, "global_step": 111474, "epoch": 921} {"train_loss": -39.0863037109375, "global_step": 111475, "epoch": 921} {"train_loss": -39.06893539428711, "global_step": 111476, "epoch": 921} {"train_loss": -39.257591247558594, "global_step": 111477, "epoch": 921} {"train_loss": -39.0789794921875, "global_step": 111478, "epoch": 921} {"train_loss": -39.08112716674805, "global_step": 111479, "epoch": 921} {"train_loss": -39.31411361694336, "global_step": 111480, "epoch": 921} {"train_loss": -39.845130920410156, "global_step": 111481, "epoch": 921} {"train_loss": -39.48044967651367, "global_step": 111482, "epoch": 921} {"train_loss": -39.48292922973633, "global_step": 111483, "epoch": 921} {"train_loss": -39.436737060546875, "global_step": 111484, "epoch": 921} {"train_loss": -39.62543869018555, "global_step": 111485, "epoch": 921} {"train_loss": -39.3690299987793, "global_step": 111486, "epoch": 921} {"train_loss": -39.55599594116211, "global_step": 111487, "epoch": 921} {"train_loss": -39.53938293457031, "global_step": 111488, "epoch": 921} {"train_loss": -39.59502410888672, "global_step": 111489, "epoch": 921} {"train_loss": -39.55628967285156, "global_step": 111490, "epoch": 921} {"train_loss": -39.9090690612793, "global_step": 111491, "epoch": 921} {"train_loss": -39.822078704833984, "global_step": 111492, "epoch": 921} {"train_loss": -39.70314025878906, "global_step": 111493, "epoch": 921} {"train_loss": -40.111202239990234, "global_step": 111494, "epoch": 921} {"train_loss": -39.89627456665039, "global_step": 111495, "epoch": 921} {"train_loss": -39.469058990478516, "global_step": 111496, "epoch": 921} {"train_loss": -39.07072067260742, "global_step": 111497, "epoch": 921} {"train_loss": -39.47481918334961, "global_step": 111498, "epoch": 921} {"train_loss": -39.81277084350586, "global_step": 111499, "epoch": 921} {"train_loss": -40.14836120605469, "global_step": 111500, "epoch": 921} {"train_loss": -39.727352142333984, "global_step": 111501, "epoch": 921} {"train_loss": -39.384429931640625, "global_step": 111502, "epoch": 921} {"train_loss": -39.1911735534668, "global_step": 111503, "epoch": 921} {"train_loss": -38.9609489440918, "global_step": 111504, "epoch": 921} {"train_loss": -40.03375244140625, "global_step": 111505, "epoch": 921} {"train_loss": -39.841941833496094, "global_step": 111506, "epoch": 921} {"train_loss": -40.1273193359375, "global_step": 111507, "epoch": 921} {"train_loss": -39.1978645324707, "global_step": 111508, "epoch": 921} {"train_loss": -38.295928955078125, "global_step": 111509, "epoch": 921} {"train_loss": -38.28032684326172, "global_step": 111510, "epoch": 921} {"train_loss": -39.905094146728516, "global_step": 111511, "epoch": 921} {"train_loss": -40.15938186645508, "global_step": 111512, "epoch": 921} {"train_loss": -39.18819046020508, "global_step": 111513, "epoch": 921} {"train_loss": -38.04923629760742, "global_step": 111514, "epoch": 921} {"train_loss": -38.678897857666016, "global_step": 111515, "epoch": 921} {"train_loss": -40.2042236328125, "global_step": 111516, "epoch": 921} {"train_loss": -38.978668212890625, "global_step": 111517, "epoch": 921} {"train_loss": -39.213417053222656, "global_step": 111518, "epoch": 921} {"train_loss": -39.156227111816406, "global_step": 111519, "epoch": 921} {"train_loss": -39.95941925048828, "global_step": 111520, "epoch": 921} {"train_loss": -39.76093673706055, "global_step": 111521, "epoch": 921} {"train_loss": -38.50654220581055, "global_step": 111522, "epoch": 921} {"train_loss": -39.931793212890625, "global_step": 111523, "epoch": 921} {"train_loss": -40.439327239990234, "global_step": 111524, "epoch": 921} {"train_loss": -39.46904373168945, "global_step": 111525, "epoch": 921} {"train_loss": -40.15522003173828, "global_step": 111526, "epoch": 921} {"train_loss": -39.78683853149414, "global_step": 111527, "epoch": 921} {"train_loss": -39.08955001831055, "global_step": 111528, "epoch": 921} {"train_loss": -37.8453483581543, "global_step": 111529, "epoch": 921} {"train_loss": -38.33946990966797, "global_step": 111530, "epoch": 921} {"train_loss": -39.189430236816406, "global_step": 111531, "epoch": 921} {"train_loss": -40.06931686401367, "global_step": 111532, "epoch": 921} {"train_loss": -39.80685043334961, "global_step": 111533, "epoch": 921} {"train_loss": -39.972713470458984, "global_step": 111534, "epoch": 921} {"train_loss": -40.159690856933594, "global_step": 111535, "epoch": 921} {"train_loss": -39.94469451904297, "global_step": 111536, "epoch": 921} {"train_loss": -39.85200119018555, "global_step": 111537, "epoch": 921} {"train_loss": -40.27342224121094, "global_step": 111538, "epoch": 921} {"train_loss": -40.09261703491211, "global_step": 111539, "epoch": 921} {"train_loss": -39.98747634887695, "global_step": 111540, "epoch": 921} {"train_loss": -40.21567916870117, "global_step": 111541, "epoch": 921} {"train_loss": -40.17401123046875, "global_step": 111542, "epoch": 921} {"train_loss": -40.20953369140625, "global_step": 111543, "epoch": 921} {"train_loss": -40.34402084350586, "global_step": 111544, "epoch": 921} {"train_loss": -40.184993743896484, "global_step": 111545, "epoch": 921} {"train_loss": -39.266937255859375, "global_step": 111546, "epoch": 921} {"train_loss": -39.10822296142578, "global_step": 111547, "epoch": 921} {"train_loss": -39.660362243652344, "global_step": 111548, "epoch": 921} {"train_loss": -39.61177444458008, "global_step": 111549, "epoch": 921} {"train_loss": -39.92196273803711, "global_step": 111550, "epoch": 921} {"train_loss": -40.31427764892578, "global_step": 111551, "epoch": 921} {"train_loss": -39.94951248168945, "global_step": 111552, "epoch": 921} {"train_loss": -39.968013763427734, "global_step": 111553, "epoch": 921} {"train_loss": -40.522682189941406, "global_step": 111554, "epoch": 921} {"train_loss": -40.47093200683594, "global_step": 111555, "epoch": 921} {"train_loss": -40.316341400146484, "global_step": 111556, "epoch": 921} {"train_loss": -40.18425369262695, "global_step": 111557, "epoch": 921} {"train_loss": -39.40935134887695, "global_step": 111558, "epoch": 921} {"train_loss": -39.38717269897461, "global_step": 111559, "epoch": 921} {"train_loss": -39.764156341552734, "global_step": 111560, "epoch": 921} {"train_loss": -39.156563971653455, "global_step": 111561, "epoch": 921, "val_loss": 2524701.25} {"train_loss": -40.684906005859375, "global_step": 111562, "epoch": 922} {"train_loss": -39.9769401550293, "global_step": 111563, "epoch": 922} {"train_loss": -39.94337844848633, "global_step": 111564, "epoch": 922} {"train_loss": -40.1322021484375, "global_step": 111565, "epoch": 922} {"train_loss": -39.672821044921875, "global_step": 111566, "epoch": 922} {"train_loss": -39.301265716552734, "global_step": 111567, "epoch": 922} {"train_loss": -38.97954177856445, "global_step": 111568, "epoch": 922} {"train_loss": -36.2980842590332, "global_step": 111569, "epoch": 922} {"train_loss": -33.39381790161133, "global_step": 111570, "epoch": 922} {"train_loss": -36.77754592895508, "global_step": 111571, "epoch": 922} {"train_loss": -39.69813919067383, "global_step": 111572, "epoch": 922} {"train_loss": -37.93208694458008, "global_step": 111573, "epoch": 922} {"train_loss": -38.12197494506836, "global_step": 111574, "epoch": 922} {"train_loss": -39.21371078491211, "global_step": 111575, "epoch": 922} {"train_loss": -38.3160285949707, "global_step": 111576, "epoch": 922} {"train_loss": -37.01860427856445, "global_step": 111577, "epoch": 922} {"train_loss": -37.20469284057617, "global_step": 111578, "epoch": 922} {"train_loss": -39.36478042602539, "global_step": 111579, "epoch": 922} {"train_loss": -36.753597259521484, "global_step": 111580, "epoch": 922} {"train_loss": -34.93655014038086, "global_step": 111581, "epoch": 922} {"train_loss": -37.703033447265625, "global_step": 111582, "epoch": 922} {"train_loss": -37.24040603637695, "global_step": 111583, "epoch": 922} {"train_loss": -37.94819259643555, "global_step": 111584, "epoch": 922} {"train_loss": -35.18171310424805, "global_step": 111585, "epoch": 922} {"train_loss": -34.69253158569336, "global_step": 111586, "epoch": 922} {"train_loss": -35.7840576171875, "global_step": 111587, "epoch": 922} {"train_loss": -35.04707336425781, "global_step": 111588, "epoch": 922} {"train_loss": -38.4775505065918, "global_step": 111589, "epoch": 922} {"train_loss": -36.369293212890625, "global_step": 111590, "epoch": 922} {"train_loss": -34.00456619262695, "global_step": 111591, "epoch": 922} {"train_loss": -36.79031753540039, "global_step": 111592, "epoch": 922} {"train_loss": -35.98530197143555, "global_step": 111593, "epoch": 922} {"train_loss": -36.89689254760742, "global_step": 111594, "epoch": 922} {"train_loss": -36.65330123901367, "global_step": 111595, "epoch": 922} {"train_loss": -37.396575927734375, "global_step": 111596, "epoch": 922} {"train_loss": -37.74420166015625, "global_step": 111597, "epoch": 922} {"train_loss": -37.607643127441406, "global_step": 111598, "epoch": 922} {"train_loss": -38.54035568237305, "global_step": 111599, "epoch": 922} {"train_loss": -37.40450668334961, "global_step": 111600, "epoch": 922} {"train_loss": -37.43098068237305, "global_step": 111601, "epoch": 922} {"train_loss": -38.39139938354492, "global_step": 111602, "epoch": 922} {"train_loss": -37.389949798583984, "global_step": 111603, "epoch": 922} {"train_loss": -38.7337760925293, "global_step": 111604, "epoch": 922} {"train_loss": -38.57688522338867, "global_step": 111605, "epoch": 922} {"train_loss": -37.07403564453125, "global_step": 111606, "epoch": 922} {"train_loss": -38.74294662475586, "global_step": 111607, "epoch": 922} {"train_loss": -38.38937759399414, "global_step": 111608, "epoch": 922} {"train_loss": -39.33657455444336, "global_step": 111609, "epoch": 922} {"train_loss": -38.165653228759766, "global_step": 111610, "epoch": 922} {"train_loss": -39.29671859741211, "global_step": 111611, "epoch": 922} {"train_loss": -39.36220932006836, "global_step": 111612, "epoch": 922} {"train_loss": -39.26053237915039, "global_step": 111613, "epoch": 922} {"train_loss": -38.911224365234375, "global_step": 111614, "epoch": 922} {"train_loss": -39.22218704223633, "global_step": 111615, "epoch": 922} {"train_loss": -39.44498825073242, "global_step": 111616, "epoch": 922} {"train_loss": -39.02328109741211, "global_step": 111617, "epoch": 922} {"train_loss": -39.214988708496094, "global_step": 111618, "epoch": 922} {"train_loss": -39.0123291015625, "global_step": 111619, "epoch": 922} {"train_loss": -39.44867706298828, "global_step": 111620, "epoch": 922} {"train_loss": -39.45783233642578, "global_step": 111621, "epoch": 922} {"train_loss": -39.22636032104492, "global_step": 111622, "epoch": 922} {"train_loss": -39.07258224487305, "global_step": 111623, "epoch": 922} {"train_loss": -39.982269287109375, "global_step": 111624, "epoch": 922} {"train_loss": -39.85307693481445, "global_step": 111625, "epoch": 922} {"train_loss": -39.8310432434082, "global_step": 111626, "epoch": 922} {"train_loss": -39.67902755737305, "global_step": 111627, "epoch": 922} {"train_loss": -40.193721771240234, "global_step": 111628, "epoch": 922} {"train_loss": -40.05867385864258, "global_step": 111629, "epoch": 922} {"train_loss": -40.382564544677734, "global_step": 111630, "epoch": 922} {"train_loss": -39.78692626953125, "global_step": 111631, "epoch": 922} {"train_loss": -40.198543548583984, "global_step": 111632, "epoch": 922} {"train_loss": -40.21406173706055, "global_step": 111633, "epoch": 922} {"train_loss": -40.15635299682617, "global_step": 111634, "epoch": 922} {"train_loss": -39.88912582397461, "global_step": 111635, "epoch": 922} {"train_loss": -40.30080795288086, "global_step": 111636, "epoch": 922} {"train_loss": -40.26522445678711, "global_step": 111637, "epoch": 922} {"train_loss": -40.2215461730957, "global_step": 111638, "epoch": 922} {"train_loss": -40.152496337890625, "global_step": 111639, "epoch": 922} {"train_loss": -40.31917190551758, "global_step": 111640, "epoch": 922} {"train_loss": -40.05412673950195, "global_step": 111641, "epoch": 922} {"train_loss": -40.04513168334961, "global_step": 111642, "epoch": 922} {"train_loss": -39.77779006958008, "global_step": 111643, "epoch": 922} {"train_loss": -40.299434661865234, "global_step": 111644, "epoch": 922} {"train_loss": -39.816009521484375, "global_step": 111645, "epoch": 922} {"train_loss": -39.14573287963867, "global_step": 111646, "epoch": 922} {"train_loss": -39.50813293457031, "global_step": 111647, "epoch": 922} {"train_loss": -40.34357833862305, "global_step": 111648, "epoch": 922} {"train_loss": -40.085838317871094, "global_step": 111649, "epoch": 922} {"train_loss": -38.34843063354492, "global_step": 111650, "epoch": 922} {"train_loss": -38.67181396484375, "global_step": 111651, "epoch": 922} {"train_loss": -39.63222885131836, "global_step": 111652, "epoch": 922} {"train_loss": -39.745357513427734, "global_step": 111653, "epoch": 922} {"train_loss": -39.38941192626953, "global_step": 111654, "epoch": 922} {"train_loss": -38.72708511352539, "global_step": 111655, "epoch": 922} {"train_loss": -40.1315803527832, "global_step": 111656, "epoch": 922} {"train_loss": -40.1694221496582, "global_step": 111657, "epoch": 922} {"train_loss": -39.69968795776367, "global_step": 111658, "epoch": 922} {"train_loss": -39.79697799682617, "global_step": 111659, "epoch": 922} {"train_loss": -39.7704963684082, "global_step": 111660, "epoch": 922} {"train_loss": -39.87056350708008, "global_step": 111661, "epoch": 922} {"train_loss": -40.01646041870117, "global_step": 111662, "epoch": 922} {"train_loss": -39.672462463378906, "global_step": 111663, "epoch": 922} {"train_loss": -40.258949279785156, "global_step": 111664, "epoch": 922} {"train_loss": -40.235469818115234, "global_step": 111665, "epoch": 922} {"train_loss": -40.09851837158203, "global_step": 111666, "epoch": 922} {"train_loss": -39.6545524597168, "global_step": 111667, "epoch": 922} {"train_loss": -39.941280364990234, "global_step": 111668, "epoch": 922} {"train_loss": -40.077449798583984, "global_step": 111669, "epoch": 922} {"train_loss": -39.54635238647461, "global_step": 111670, "epoch": 922} {"train_loss": -40.03955841064453, "global_step": 111671, "epoch": 922} {"train_loss": -39.614898681640625, "global_step": 111672, "epoch": 922} {"train_loss": -37.33735275268555, "global_step": 111673, "epoch": 922} {"train_loss": -37.10895538330078, "global_step": 111674, "epoch": 922} {"train_loss": -38.57088088989258, "global_step": 111675, "epoch": 922} {"train_loss": -39.759578704833984, "global_step": 111676, "epoch": 922} {"train_loss": -38.87752151489258, "global_step": 111677, "epoch": 922} {"train_loss": -35.55670928955078, "global_step": 111678, "epoch": 922} {"train_loss": -38.0037841796875, "global_step": 111679, "epoch": 922} {"train_loss": -31.986387252807617, "global_step": 111680, "epoch": 922} {"train_loss": -32.35055160522461, "global_step": 111681, "epoch": 922} {"train_loss": -38.57184250886775, "global_step": 111682, "epoch": 922, "val_loss": 2587328.25} {"train_loss": -11.623023986816406, "global_step": 111683, "epoch": 923} {"train_loss": 40.386268615722656, "global_step": 111684, "epoch": 923} {"train_loss": -20.359888076782227, "global_step": 111685, "epoch": 923} {"train_loss": 22.90555191040039, "global_step": 111686, "epoch": 923} {"train_loss": -20.486656188964844, "global_step": 111687, "epoch": 923} {"train_loss": 21.523818969726562, "global_step": 111688, "epoch": 923} {"train_loss": -27.6165828704834, "global_step": 111689, "epoch": 923} {"train_loss": -8.728372573852539, "global_step": 111690, "epoch": 923} {"train_loss": -6.759789943695068, "global_step": 111691, "epoch": 923} {"train_loss": -25.340518951416016, "global_step": 111692, "epoch": 923} {"train_loss": -28.497833251953125, "global_step": 111693, "epoch": 923} {"train_loss": -18.788785934448242, "global_step": 111694, "epoch": 923} {"train_loss": -16.840299606323242, "global_step": 111695, "epoch": 923} {"train_loss": -26.871423721313477, "global_step": 111696, "epoch": 923} {"train_loss": -31.330778121948242, "global_step": 111697, "epoch": 923} {"train_loss": -28.915287017822266, "global_step": 111698, "epoch": 923} {"train_loss": -28.347000122070312, "global_step": 111699, "epoch": 923} {"train_loss": -26.659366607666016, "global_step": 111700, "epoch": 923} {"train_loss": -26.46559715270996, "global_step": 111701, "epoch": 923} {"train_loss": -29.40740966796875, "global_step": 111702, "epoch": 923} {"train_loss": -31.49122428894043, "global_step": 111703, "epoch": 923} {"train_loss": -32.600852966308594, "global_step": 111704, "epoch": 923} {"train_loss": -31.887714385986328, "global_step": 111705, "epoch": 923} {"train_loss": -31.40234375, "global_step": 111706, "epoch": 923} {"train_loss": -31.277429580688477, "global_step": 111707, "epoch": 923} {"train_loss": -32.122589111328125, "global_step": 111708, "epoch": 923} {"train_loss": -32.94779586791992, "global_step": 111709, "epoch": 923} {"train_loss": -32.164756774902344, "global_step": 111710, "epoch": 923} {"train_loss": -32.747886657714844, "global_step": 111711, "epoch": 923} {"train_loss": -33.23188018798828, "global_step": 111712, "epoch": 923} {"train_loss": -33.187110900878906, "global_step": 111713, "epoch": 923} {"train_loss": -33.03498458862305, "global_step": 111714, "epoch": 923} {"train_loss": -33.33909225463867, "global_step": 111715, "epoch": 923} {"train_loss": -34.44129180908203, "global_step": 111716, "epoch": 923} {"train_loss": -34.269527435302734, "global_step": 111717, "epoch": 923} {"train_loss": -33.590484619140625, "global_step": 111718, "epoch": 923} {"train_loss": -34.4246711730957, "global_step": 111719, "epoch": 923} {"train_loss": -34.355499267578125, "global_step": 111720, "epoch": 923} {"train_loss": -34.4705924987793, "global_step": 111721, "epoch": 923} {"train_loss": -34.17219543457031, "global_step": 111722, "epoch": 923} {"train_loss": -34.7191047668457, "global_step": 111723, "epoch": 923} {"train_loss": -35.17783737182617, "global_step": 111724, "epoch": 923} {"train_loss": -35.189273834228516, "global_step": 111725, "epoch": 923} {"train_loss": -35.05323028564453, "global_step": 111726, "epoch": 923} {"train_loss": -35.2288932800293, "global_step": 111727, "epoch": 923} {"train_loss": -35.233680725097656, "global_step": 111728, "epoch": 923} {"train_loss": -35.70570373535156, "global_step": 111729, "epoch": 923} {"train_loss": -35.65007400512695, "global_step": 111730, "epoch": 923} {"train_loss": -35.38750457763672, "global_step": 111731, "epoch": 923} {"train_loss": -35.53347396850586, "global_step": 111732, "epoch": 923} {"train_loss": -35.48408126831055, "global_step": 111733, "epoch": 923} {"train_loss": -35.88869857788086, "global_step": 111734, "epoch": 923} {"train_loss": -35.978843688964844, "global_step": 111735, "epoch": 923} {"train_loss": -36.00685501098633, "global_step": 111736, "epoch": 923} {"train_loss": -35.868324279785156, "global_step": 111737, "epoch": 923} {"train_loss": -36.22383117675781, "global_step": 111738, "epoch": 923} {"train_loss": -36.536216735839844, "global_step": 111739, "epoch": 923} {"train_loss": -36.255157470703125, "global_step": 111740, "epoch": 923} {"train_loss": -36.649986267089844, "global_step": 111741, "epoch": 923} {"train_loss": -36.52177810668945, "global_step": 111742, "epoch": 923} {"train_loss": -36.55910873413086, "global_step": 111743, "epoch": 923} {"train_loss": -36.5478401184082, "global_step": 111744, "epoch": 923} {"train_loss": -36.932342529296875, "global_step": 111745, "epoch": 923} {"train_loss": -36.65789794921875, "global_step": 111746, "epoch": 923} {"train_loss": -36.89602279663086, "global_step": 111747, "epoch": 923} {"train_loss": -37.0606689453125, "global_step": 111748, "epoch": 923} {"train_loss": -37.139312744140625, "global_step": 111749, "epoch": 923} {"train_loss": -37.44529342651367, "global_step": 111750, "epoch": 923} {"train_loss": -37.39360427856445, "global_step": 111751, "epoch": 923} {"train_loss": -37.45576095581055, "global_step": 111752, "epoch": 923} {"train_loss": -37.71660232543945, "global_step": 111753, "epoch": 923} {"train_loss": -37.173858642578125, "global_step": 111754, "epoch": 923} {"train_loss": -37.8239860534668, "global_step": 111755, "epoch": 923} {"train_loss": -37.92521667480469, "global_step": 111756, "epoch": 923} {"train_loss": -37.82294845581055, "global_step": 111757, "epoch": 923} {"train_loss": -38.0860481262207, "global_step": 111758, "epoch": 923} {"train_loss": -37.60034942626953, "global_step": 111759, "epoch": 923} {"train_loss": -38.10907745361328, "global_step": 111760, "epoch": 923} {"train_loss": -38.203857421875, "global_step": 111761, "epoch": 923} {"train_loss": -37.752071380615234, "global_step": 111762, "epoch": 923} {"train_loss": -38.16556167602539, "global_step": 111763, "epoch": 923} {"train_loss": -37.99513626098633, "global_step": 111764, "epoch": 923} {"train_loss": -38.1280517578125, "global_step": 111765, "epoch": 923} {"train_loss": -38.16788864135742, "global_step": 111766, "epoch": 923} {"train_loss": -37.995704650878906, "global_step": 111767, "epoch": 923} {"train_loss": -37.96957778930664, "global_step": 111768, "epoch": 923} {"train_loss": -38.534420013427734, "global_step": 111769, "epoch": 923} {"train_loss": -38.393592834472656, "global_step": 111770, "epoch": 923} {"train_loss": -38.278133392333984, "global_step": 111771, "epoch": 923} {"train_loss": -38.156028747558594, "global_step": 111772, "epoch": 923} {"train_loss": -38.70649337768555, "global_step": 111773, "epoch": 923} {"train_loss": -38.86564254760742, "global_step": 111774, "epoch": 923} {"train_loss": -38.1638069152832, "global_step": 111775, "epoch": 923} {"train_loss": -39.0037841796875, "global_step": 111776, "epoch": 923} {"train_loss": -38.266639709472656, "global_step": 111777, "epoch": 923} {"train_loss": -38.46767807006836, "global_step": 111778, "epoch": 923} {"train_loss": -38.904048919677734, "global_step": 111779, "epoch": 923} {"train_loss": -38.89655303955078, "global_step": 111780, "epoch": 923} {"train_loss": -39.010799407958984, "global_step": 111781, "epoch": 923} {"train_loss": -38.59791564941406, "global_step": 111782, "epoch": 923} {"train_loss": -38.946807861328125, "global_step": 111783, "epoch": 923} {"train_loss": -39.12275314331055, "global_step": 111784, "epoch": 923} {"train_loss": -39.095191955566406, "global_step": 111785, "epoch": 923} {"train_loss": -38.8222770690918, "global_step": 111786, "epoch": 923} {"train_loss": -38.99422836303711, "global_step": 111787, "epoch": 923} {"train_loss": -39.04716491699219, "global_step": 111788, "epoch": 923} {"train_loss": -39.176509857177734, "global_step": 111789, "epoch": 923} {"train_loss": -38.8283576965332, "global_step": 111790, "epoch": 923} {"train_loss": -39.08403015136719, "global_step": 111791, "epoch": 923} {"train_loss": -39.48444747924805, "global_step": 111792, "epoch": 923} {"train_loss": -39.182247161865234, "global_step": 111793, "epoch": 923} {"train_loss": -39.55172348022461, "global_step": 111794, "epoch": 923} {"train_loss": -39.3383674621582, "global_step": 111795, "epoch": 923} {"train_loss": -39.301387786865234, "global_step": 111796, "epoch": 923} {"train_loss": -39.71684646606445, "global_step": 111797, "epoch": 923} {"train_loss": -40.029300689697266, "global_step": 111798, "epoch": 923} {"train_loss": -39.614681243896484, "global_step": 111799, "epoch": 923} {"train_loss": -39.228633880615234, "global_step": 111800, "epoch": 923} {"train_loss": -39.645652770996094, "global_step": 111801, "epoch": 923} {"train_loss": -39.673038482666016, "global_step": 111802, "epoch": 923} {"train_loss": -33.190184581378276, "global_step": 111803, "epoch": 923, "val_loss": 2624461.25} {"train_loss": -39.94173812866211, "global_step": 111804, "epoch": 924} {"train_loss": -39.68932342529297, "global_step": 111805, "epoch": 924} {"train_loss": -39.83845138549805, "global_step": 111806, "epoch": 924} {"train_loss": -39.821136474609375, "global_step": 111807, "epoch": 924} {"train_loss": -39.62435531616211, "global_step": 111808, "epoch": 924} {"train_loss": -39.72927474975586, "global_step": 111809, "epoch": 924} {"train_loss": -39.82476806640625, "global_step": 111810, "epoch": 924} {"train_loss": -39.40347671508789, "global_step": 111811, "epoch": 924} {"train_loss": -39.730281829833984, "global_step": 111812, "epoch": 924} {"train_loss": -40.01279830932617, "global_step": 111813, "epoch": 924} {"train_loss": -39.591651916503906, "global_step": 111814, "epoch": 924} {"train_loss": -39.854183197021484, "global_step": 111815, "epoch": 924} {"train_loss": -40.07884979248047, "global_step": 111816, "epoch": 924} {"train_loss": -39.48695755004883, "global_step": 111817, "epoch": 924} {"train_loss": -40.1813850402832, "global_step": 111818, "epoch": 924} {"train_loss": -39.97220993041992, "global_step": 111819, "epoch": 924} {"train_loss": -40.057044982910156, "global_step": 111820, "epoch": 924} {"train_loss": -40.282196044921875, "global_step": 111821, "epoch": 924} {"train_loss": -39.616943359375, "global_step": 111822, "epoch": 924} {"train_loss": -39.8761100769043, "global_step": 111823, "epoch": 924} {"train_loss": -40.410552978515625, "global_step": 111824, "epoch": 924} {"train_loss": -39.80836868286133, "global_step": 111825, "epoch": 924} {"train_loss": -40.195404052734375, "global_step": 111826, "epoch": 924} {"train_loss": -39.8067512512207, "global_step": 111827, "epoch": 924} {"train_loss": -40.44364929199219, "global_step": 111828, "epoch": 924} {"train_loss": -39.987728118896484, "global_step": 111829, "epoch": 924} {"train_loss": -40.08199691772461, "global_step": 111830, "epoch": 924} {"train_loss": -40.04018020629883, "global_step": 111831, "epoch": 924} {"train_loss": -40.33015823364258, "global_step": 111832, "epoch": 924} {"train_loss": -40.604103088378906, "global_step": 111833, "epoch": 924} {"train_loss": -40.485801696777344, "global_step": 111834, "epoch": 924} {"train_loss": -39.52321243286133, "global_step": 111835, "epoch": 924} {"train_loss": -40.34777069091797, "global_step": 111836, "epoch": 924} {"train_loss": -39.75703811645508, "global_step": 111837, "epoch": 924} {"train_loss": -39.69380187988281, "global_step": 111838, "epoch": 924} {"train_loss": -38.44891357421875, "global_step": 111839, "epoch": 924} {"train_loss": -36.58386993408203, "global_step": 111840, "epoch": 924} {"train_loss": -39.21293258666992, "global_step": 111841, "epoch": 924} {"train_loss": -36.448238372802734, "global_step": 111842, "epoch": 924} {"train_loss": -25.194976806640625, "global_step": 111843, "epoch": 924} {"train_loss": -0.31149616837501526, "global_step": 111844, "epoch": 924} {"train_loss": -3.4168503284454346, "global_step": 111845, "epoch": 924} {"train_loss": -21.58223533630371, "global_step": 111846, "epoch": 924} {"train_loss": -18.114303588867188, "global_step": 111847, "epoch": 924} {"train_loss": -29.130945205688477, "global_step": 111848, "epoch": 924} {"train_loss": -18.91691017150879, "global_step": 111849, "epoch": 924} {"train_loss": -33.091556549072266, "global_step": 111850, "epoch": 924} {"train_loss": -21.38876724243164, "global_step": 111851, "epoch": 924} {"train_loss": -31.162031173706055, "global_step": 111852, "epoch": 924} {"train_loss": -33.128395080566406, "global_step": 111853, "epoch": 924} {"train_loss": -31.56288719177246, "global_step": 111854, "epoch": 924} {"train_loss": -33.60161590576172, "global_step": 111855, "epoch": 924} {"train_loss": -33.61623001098633, "global_step": 111856, "epoch": 924} {"train_loss": -33.652374267578125, "global_step": 111857, "epoch": 924} {"train_loss": -32.619441986083984, "global_step": 111858, "epoch": 924} {"train_loss": -34.31770324707031, "global_step": 111859, "epoch": 924} {"train_loss": -35.76055908203125, "global_step": 111860, "epoch": 924} {"train_loss": -35.018245697021484, "global_step": 111861, "epoch": 924} {"train_loss": -34.3602409362793, "global_step": 111862, "epoch": 924} {"train_loss": -36.51869583129883, "global_step": 111863, "epoch": 924} {"train_loss": -36.754249572753906, "global_step": 111864, "epoch": 924} {"train_loss": -36.198848724365234, "global_step": 111865, "epoch": 924} {"train_loss": -35.79391098022461, "global_step": 111866, "epoch": 924} {"train_loss": -37.166259765625, "global_step": 111867, "epoch": 924} {"train_loss": -36.904510498046875, "global_step": 111868, "epoch": 924} {"train_loss": -36.510738372802734, "global_step": 111869, "epoch": 924} {"train_loss": -36.71012496948242, "global_step": 111870, "epoch": 924} {"train_loss": -36.90447998046875, "global_step": 111871, "epoch": 924} {"train_loss": -37.328609466552734, "global_step": 111872, "epoch": 924} {"train_loss": -37.20723342895508, "global_step": 111873, "epoch": 924} {"train_loss": -37.01888656616211, "global_step": 111874, "epoch": 924} {"train_loss": -37.5250358581543, "global_step": 111875, "epoch": 924} {"train_loss": -37.203670501708984, "global_step": 111876, "epoch": 924} {"train_loss": -36.93842315673828, "global_step": 111877, "epoch": 924} {"train_loss": -37.1285400390625, "global_step": 111878, "epoch": 924} {"train_loss": -37.591773986816406, "global_step": 111879, "epoch": 924} {"train_loss": -37.5660514831543, "global_step": 111880, "epoch": 924} {"train_loss": -37.78028869628906, "global_step": 111881, "epoch": 924} {"train_loss": -37.4434928894043, "global_step": 111882, "epoch": 924} {"train_loss": -37.95068359375, "global_step": 111883, "epoch": 924} {"train_loss": -37.974212646484375, "global_step": 111884, "epoch": 924} {"train_loss": -37.8983039855957, "global_step": 111885, "epoch": 924} {"train_loss": -37.892024993896484, "global_step": 111886, "epoch": 924} {"train_loss": -38.0153923034668, "global_step": 111887, "epoch": 924} {"train_loss": -37.91965866088867, "global_step": 111888, "epoch": 924} {"train_loss": -38.2005615234375, "global_step": 111889, "epoch": 924} {"train_loss": -38.29545211791992, "global_step": 111890, "epoch": 924} {"train_loss": -38.28696823120117, "global_step": 111891, "epoch": 924} {"train_loss": -38.093807220458984, "global_step": 111892, "epoch": 924} {"train_loss": -38.056026458740234, "global_step": 111893, "epoch": 924} {"train_loss": -37.81847381591797, "global_step": 111894, "epoch": 924} {"train_loss": -38.466182708740234, "global_step": 111895, "epoch": 924} {"train_loss": -38.18207931518555, "global_step": 111896, "epoch": 924} {"train_loss": -38.51560592651367, "global_step": 111897, "epoch": 924} {"train_loss": -38.64076232910156, "global_step": 111898, "epoch": 924} {"train_loss": -38.69251251220703, "global_step": 111899, "epoch": 924} {"train_loss": -38.700096130371094, "global_step": 111900, "epoch": 924} {"train_loss": -38.471649169921875, "global_step": 111901, "epoch": 924} {"train_loss": -38.57524108886719, "global_step": 111902, "epoch": 924} {"train_loss": -38.634796142578125, "global_step": 111903, "epoch": 924} {"train_loss": -38.753204345703125, "global_step": 111904, "epoch": 924} {"train_loss": -38.88165283203125, "global_step": 111905, "epoch": 924} {"train_loss": -38.689308166503906, "global_step": 111906, "epoch": 924} {"train_loss": -38.75288009643555, "global_step": 111907, "epoch": 924} {"train_loss": -38.87017822265625, "global_step": 111908, "epoch": 924} {"train_loss": -38.84504318237305, "global_step": 111909, "epoch": 924} {"train_loss": -39.0179557800293, "global_step": 111910, "epoch": 924} {"train_loss": -39.02614212036133, "global_step": 111911, "epoch": 924} {"train_loss": -38.93248748779297, "global_step": 111912, "epoch": 924} {"train_loss": -39.30170822143555, "global_step": 111913, "epoch": 924} {"train_loss": -38.74753189086914, "global_step": 111914, "epoch": 924} {"train_loss": -39.36558532714844, "global_step": 111915, "epoch": 924} {"train_loss": -39.23849105834961, "global_step": 111916, "epoch": 924} {"train_loss": -39.17327880859375, "global_step": 111917, "epoch": 924} {"train_loss": -39.347320556640625, "global_step": 111918, "epoch": 924} {"train_loss": -39.2194709777832, "global_step": 111919, "epoch": 924} {"train_loss": -39.27490234375, "global_step": 111920, "epoch": 924} {"train_loss": -39.32785415649414, "global_step": 111921, "epoch": 924} {"train_loss": -39.360286712646484, "global_step": 111922, "epoch": 924} {"train_loss": -39.65753173828125, "global_step": 111923, "epoch": 924} {"train_loss": -36.805909595459944, "global_step": 111924, "epoch": 924, "val_loss": 2563434.25} {"train_loss": -39.42261505126953, "global_step": 111925, "epoch": 925} {"train_loss": -39.698707580566406, "global_step": 111926, "epoch": 925} {"train_loss": -39.741451263427734, "global_step": 111927, "epoch": 925} {"train_loss": -39.5914421081543, "global_step": 111928, "epoch": 925} {"train_loss": -39.88387680053711, "global_step": 111929, "epoch": 925} {"train_loss": -39.90023422241211, "global_step": 111930, "epoch": 925} {"train_loss": -39.960052490234375, "global_step": 111931, "epoch": 925} {"train_loss": -39.83584976196289, "global_step": 111932, "epoch": 925} {"train_loss": -39.849151611328125, "global_step": 111933, "epoch": 925} {"train_loss": -39.957035064697266, "global_step": 111934, "epoch": 925} {"train_loss": -39.70256805419922, "global_step": 111935, "epoch": 925} {"train_loss": -39.80002975463867, "global_step": 111936, "epoch": 925} {"train_loss": -39.6307487487793, "global_step": 111937, "epoch": 925} {"train_loss": -39.8260612487793, "global_step": 111938, "epoch": 925} {"train_loss": -40.05804443359375, "global_step": 111939, "epoch": 925} {"train_loss": -39.663482666015625, "global_step": 111940, "epoch": 925} {"train_loss": -39.8864860534668, "global_step": 111941, "epoch": 925} {"train_loss": -39.83795928955078, "global_step": 111942, "epoch": 925} {"train_loss": -39.961753845214844, "global_step": 111943, "epoch": 925} {"train_loss": -40.04058074951172, "global_step": 111944, "epoch": 925} {"train_loss": -39.70109558105469, "global_step": 111945, "epoch": 925} {"train_loss": -38.73200225830078, "global_step": 111946, "epoch": 925} {"train_loss": -38.18557357788086, "global_step": 111947, "epoch": 925} {"train_loss": -39.71250534057617, "global_step": 111948, "epoch": 925} {"train_loss": -39.420658111572266, "global_step": 111949, "epoch": 925} {"train_loss": -37.585365295410156, "global_step": 111950, "epoch": 925} {"train_loss": -38.539337158203125, "global_step": 111951, "epoch": 925} {"train_loss": -39.0057487487793, "global_step": 111952, "epoch": 925} {"train_loss": -38.896602630615234, "global_step": 111953, "epoch": 925} {"train_loss": -38.824188232421875, "global_step": 111954, "epoch": 925} {"train_loss": -38.75825881958008, "global_step": 111955, "epoch": 925} {"train_loss": -38.89955520629883, "global_step": 111956, "epoch": 925} {"train_loss": -37.265193939208984, "global_step": 111957, "epoch": 925} {"train_loss": -36.78803634643555, "global_step": 111958, "epoch": 925} {"train_loss": -37.398658752441406, "global_step": 111959, "epoch": 925} {"train_loss": -38.66651153564453, "global_step": 111960, "epoch": 925} {"train_loss": -38.768165588378906, "global_step": 111961, "epoch": 925} {"train_loss": -39.45345687866211, "global_step": 111962, "epoch": 925} {"train_loss": -39.31165313720703, "global_step": 111963, "epoch": 925} {"train_loss": -38.622589111328125, "global_step": 111964, "epoch": 925} {"train_loss": -37.34897994995117, "global_step": 111965, "epoch": 925} {"train_loss": -35.84253692626953, "global_step": 111966, "epoch": 925} {"train_loss": -35.40827178955078, "global_step": 111967, "epoch": 925} {"train_loss": -35.722320556640625, "global_step": 111968, "epoch": 925} {"train_loss": -38.19928741455078, "global_step": 111969, "epoch": 925} {"train_loss": -39.673946380615234, "global_step": 111970, "epoch": 925} {"train_loss": -38.017738342285156, "global_step": 111971, "epoch": 925} {"train_loss": -37.118343353271484, "global_step": 111972, "epoch": 925} {"train_loss": -38.4034309387207, "global_step": 111973, "epoch": 925} {"train_loss": -39.196102142333984, "global_step": 111974, "epoch": 925} {"train_loss": -39.21411895751953, "global_step": 111975, "epoch": 925} {"train_loss": -38.23826599121094, "global_step": 111976, "epoch": 925} {"train_loss": -39.18522262573242, "global_step": 111977, "epoch": 925} {"train_loss": -38.819091796875, "global_step": 111978, "epoch": 925} {"train_loss": -38.963253021240234, "global_step": 111979, "epoch": 925} {"train_loss": -39.360107421875, "global_step": 111980, "epoch": 925} {"train_loss": -38.40904998779297, "global_step": 111981, "epoch": 925} {"train_loss": -38.3358268737793, "global_step": 111982, "epoch": 925} {"train_loss": -39.0267333984375, "global_step": 111983, "epoch": 925} {"train_loss": -39.51304244995117, "global_step": 111984, "epoch": 925} {"train_loss": -38.65061569213867, "global_step": 111985, "epoch": 925} {"train_loss": -38.953853607177734, "global_step": 111986, "epoch": 925} {"train_loss": -39.57394027709961, "global_step": 111987, "epoch": 925} {"train_loss": -38.13552474975586, "global_step": 111988, "epoch": 925} {"train_loss": -38.10896682739258, "global_step": 111989, "epoch": 925} {"train_loss": -39.76337814331055, "global_step": 111990, "epoch": 925} {"train_loss": -37.403900146484375, "global_step": 111991, "epoch": 925} {"train_loss": -36.39376449584961, "global_step": 111992, "epoch": 925} {"train_loss": -39.35280227661133, "global_step": 111993, "epoch": 925} {"train_loss": -38.790618896484375, "global_step": 111994, "epoch": 925} {"train_loss": -38.709468841552734, "global_step": 111995, "epoch": 925} {"train_loss": -39.342037200927734, "global_step": 111996, "epoch": 925} {"train_loss": -37.6959114074707, "global_step": 111997, "epoch": 925} {"train_loss": -39.50175094604492, "global_step": 111998, "epoch": 925} {"train_loss": -38.637420654296875, "global_step": 111999, "epoch": 925} {"train_loss": -38.213417053222656, "global_step": 112000, "epoch": 925} {"train_loss": -39.94077682495117, "global_step": 112001, "epoch": 925} {"train_loss": -37.77459716796875, "global_step": 112002, "epoch": 925} {"train_loss": -39.01934814453125, "global_step": 112003, "epoch": 925} {"train_loss": -38.42223358154297, "global_step": 112004, "epoch": 925} {"train_loss": -39.12235641479492, "global_step": 112005, "epoch": 925} {"train_loss": -38.57639694213867, "global_step": 112006, "epoch": 925} {"train_loss": -39.3385009765625, "global_step": 112007, "epoch": 925} {"train_loss": -39.87343978881836, "global_step": 112008, "epoch": 925} {"train_loss": -38.45096969604492, "global_step": 112009, "epoch": 925} {"train_loss": -39.672420501708984, "global_step": 112010, "epoch": 925} {"train_loss": -39.30801010131836, "global_step": 112011, "epoch": 925} {"train_loss": -39.55610275268555, "global_step": 112012, "epoch": 925} {"train_loss": -39.40826416015625, "global_step": 112013, "epoch": 925} {"train_loss": -39.61982345581055, "global_step": 112014, "epoch": 925} {"train_loss": -38.5670051574707, "global_step": 112015, "epoch": 925} {"train_loss": -39.491756439208984, "global_step": 112016, "epoch": 925} {"train_loss": -39.32307052612305, "global_step": 112017, "epoch": 925} {"train_loss": -38.355812072753906, "global_step": 112018, "epoch": 925} {"train_loss": -38.77181625366211, "global_step": 112019, "epoch": 925} {"train_loss": -39.36384201049805, "global_step": 112020, "epoch": 925} {"train_loss": -39.4069938659668, "global_step": 112021, "epoch": 925} {"train_loss": -38.13789749145508, "global_step": 112022, "epoch": 925} {"train_loss": -39.05588912963867, "global_step": 112023, "epoch": 925} {"train_loss": -38.898162841796875, "global_step": 112024, "epoch": 925} {"train_loss": -38.02692794799805, "global_step": 112025, "epoch": 925} {"train_loss": -37.750526428222656, "global_step": 112026, "epoch": 925} {"train_loss": -38.372161865234375, "global_step": 112027, "epoch": 925} {"train_loss": -38.22809982299805, "global_step": 112028, "epoch": 925} {"train_loss": -39.0450553894043, "global_step": 112029, "epoch": 925} {"train_loss": -38.60091018676758, "global_step": 112030, "epoch": 925} {"train_loss": -38.65829849243164, "global_step": 112031, "epoch": 925} {"train_loss": -38.4317512512207, "global_step": 112032, "epoch": 925} {"train_loss": -38.6325798034668, "global_step": 112033, "epoch": 925} {"train_loss": -38.507911682128906, "global_step": 112034, "epoch": 925} {"train_loss": -37.65859603881836, "global_step": 112035, "epoch": 925} {"train_loss": -37.04903793334961, "global_step": 112036, "epoch": 925} {"train_loss": -38.22239303588867, "global_step": 112037, "epoch": 925} {"train_loss": -39.33277130126953, "global_step": 112038, "epoch": 925} {"train_loss": -38.79735565185547, "global_step": 112039, "epoch": 925} {"train_loss": -38.46810531616211, "global_step": 112040, "epoch": 925} {"train_loss": -38.103736877441406, "global_step": 112041, "epoch": 925} {"train_loss": -38.843143463134766, "global_step": 112042, "epoch": 925} {"train_loss": -39.194332122802734, "global_step": 112043, "epoch": 925} {"train_loss": -38.259864807128906, "global_step": 112044, "epoch": 925} {"train_loss": -38.80570592959065, "global_step": 112045, "epoch": 925, "val_loss": 2557246.0} {"train_loss": -38.65330123901367, "global_step": 112046, "epoch": 926} {"train_loss": -39.4142951965332, "global_step": 112047, "epoch": 926} {"train_loss": -38.99397659301758, "global_step": 112048, "epoch": 926} {"train_loss": -39.661949157714844, "global_step": 112049, "epoch": 926} {"train_loss": -39.508358001708984, "global_step": 112050, "epoch": 926} {"train_loss": -39.06519317626953, "global_step": 112051, "epoch": 926} {"train_loss": -39.18812942504883, "global_step": 112052, "epoch": 926} {"train_loss": -39.6926383972168, "global_step": 112053, "epoch": 926} {"train_loss": -39.997249603271484, "global_step": 112054, "epoch": 926} {"train_loss": -39.53811264038086, "global_step": 112055, "epoch": 926} {"train_loss": -37.19681930541992, "global_step": 112056, "epoch": 926} {"train_loss": -39.971778869628906, "global_step": 112057, "epoch": 926} {"train_loss": -39.991600036621094, "global_step": 112058, "epoch": 926} {"train_loss": -39.559513092041016, "global_step": 112059, "epoch": 926} {"train_loss": -38.509727478027344, "global_step": 112060, "epoch": 926} {"train_loss": -34.71333694458008, "global_step": 112061, "epoch": 926} {"train_loss": -33.79607391357422, "global_step": 112062, "epoch": 926} {"train_loss": -38.83957290649414, "global_step": 112063, "epoch": 926} {"train_loss": -36.6135368347168, "global_step": 112064, "epoch": 926} {"train_loss": -32.35045623779297, "global_step": 112065, "epoch": 926} {"train_loss": -9.925989151000977, "global_step": 112066, "epoch": 926} {"train_loss": -30.6024112701416, "global_step": 112067, "epoch": 926} {"train_loss": -25.867944717407227, "global_step": 112068, "epoch": 926} {"train_loss": -26.795063018798828, "global_step": 112069, "epoch": 926} {"train_loss": -22.46881103515625, "global_step": 112070, "epoch": 926} {"train_loss": -14.850157737731934, "global_step": 112071, "epoch": 926} {"train_loss": -13.569238662719727, "global_step": 112072, "epoch": 926} {"train_loss": -25.666288375854492, "global_step": 112073, "epoch": 926} {"train_loss": -13.508135795593262, "global_step": 112074, "epoch": 926} {"train_loss": -8.338069915771484, "global_step": 112075, "epoch": 926} {"train_loss": -21.813650131225586, "global_step": 112076, "epoch": 926} {"train_loss": -10.333383560180664, "global_step": 112077, "epoch": 926} {"train_loss": -23.623825073242188, "global_step": 112078, "epoch": 926} {"train_loss": -27.88511085510254, "global_step": 112079, "epoch": 926} {"train_loss": -23.872167587280273, "global_step": 112080, "epoch": 926} {"train_loss": -20.052249908447266, "global_step": 112081, "epoch": 926} {"train_loss": -18.116060256958008, "global_step": 112082, "epoch": 926} {"train_loss": -18.9912109375, "global_step": 112083, "epoch": 926} {"train_loss": -24.136934280395508, "global_step": 112084, "epoch": 926} {"train_loss": -27.793859481811523, "global_step": 112085, "epoch": 926} {"train_loss": -26.494245529174805, "global_step": 112086, "epoch": 926} {"train_loss": -28.451339721679688, "global_step": 112087, "epoch": 926} {"train_loss": -29.737470626831055, "global_step": 112088, "epoch": 926} {"train_loss": -29.146717071533203, "global_step": 112089, "epoch": 926} {"train_loss": -28.17754554748535, "global_step": 112090, "epoch": 926} {"train_loss": -28.56220817565918, "global_step": 112091, "epoch": 926} {"train_loss": -30.629291534423828, "global_step": 112092, "epoch": 926} {"train_loss": -29.963397979736328, "global_step": 112093, "epoch": 926} {"train_loss": -30.24466896057129, "global_step": 112094, "epoch": 926} {"train_loss": -31.906005859375, "global_step": 112095, "epoch": 926} {"train_loss": -31.87775993347168, "global_step": 112096, "epoch": 926} {"train_loss": -31.075952529907227, "global_step": 112097, "epoch": 926} {"train_loss": -31.44829750061035, "global_step": 112098, "epoch": 926} {"train_loss": -32.06962585449219, "global_step": 112099, "epoch": 926} {"train_loss": -31.6862735748291, "global_step": 112100, "epoch": 926} {"train_loss": -32.452213287353516, "global_step": 112101, "epoch": 926} {"train_loss": -32.7142333984375, "global_step": 112102, "epoch": 926} {"train_loss": -31.817855834960938, "global_step": 112103, "epoch": 926} {"train_loss": -33.06436538696289, "global_step": 112104, "epoch": 926} {"train_loss": -33.4271240234375, "global_step": 112105, "epoch": 926} {"train_loss": -31.7044620513916, "global_step": 112106, "epoch": 926} {"train_loss": -33.05759048461914, "global_step": 112107, "epoch": 926} {"train_loss": -32.89321517944336, "global_step": 112108, "epoch": 926} {"train_loss": -33.452613830566406, "global_step": 112109, "epoch": 926} {"train_loss": -33.23952102661133, "global_step": 112110, "epoch": 926} {"train_loss": -34.15322494506836, "global_step": 112111, "epoch": 926} {"train_loss": -33.53740310668945, "global_step": 112112, "epoch": 926} {"train_loss": -33.634525299072266, "global_step": 112113, "epoch": 926} {"train_loss": -33.20491027832031, "global_step": 112114, "epoch": 926} {"train_loss": -33.56865310668945, "global_step": 112115, "epoch": 926} {"train_loss": -33.21821212768555, "global_step": 112116, "epoch": 926} {"train_loss": -33.331886291503906, "global_step": 112117, "epoch": 926} {"train_loss": -33.67384338378906, "global_step": 112118, "epoch": 926} {"train_loss": -34.008724212646484, "global_step": 112119, "epoch": 926} {"train_loss": -33.80388259887695, "global_step": 112120, "epoch": 926} {"train_loss": -33.807708740234375, "global_step": 112121, "epoch": 926} {"train_loss": -33.997833251953125, "global_step": 112122, "epoch": 926} {"train_loss": -33.88705062866211, "global_step": 112123, "epoch": 926} {"train_loss": -34.175270080566406, "global_step": 112124, "epoch": 926} {"train_loss": -34.03583908081055, "global_step": 112125, "epoch": 926} {"train_loss": -34.282066345214844, "global_step": 112126, "epoch": 926} {"train_loss": -34.33818435668945, "global_step": 112127, "epoch": 926} {"train_loss": -34.39805603027344, "global_step": 112128, "epoch": 926} {"train_loss": -34.679317474365234, "global_step": 112129, "epoch": 926} {"train_loss": -35.01725387573242, "global_step": 112130, "epoch": 926} {"train_loss": -34.62956237792969, "global_step": 112131, "epoch": 926} {"train_loss": -34.4036865234375, "global_step": 112132, "epoch": 926} {"train_loss": -34.355342864990234, "global_step": 112133, "epoch": 926} {"train_loss": -34.97523880004883, "global_step": 112134, "epoch": 926} {"train_loss": -34.54461669921875, "global_step": 112135, "epoch": 926} {"train_loss": -34.191776275634766, "global_step": 112136, "epoch": 926} {"train_loss": -34.72005844116211, "global_step": 112137, "epoch": 926} {"train_loss": -34.92977523803711, "global_step": 112138, "epoch": 926} {"train_loss": -35.21294021606445, "global_step": 112139, "epoch": 926} {"train_loss": -34.761104583740234, "global_step": 112140, "epoch": 926} {"train_loss": -35.05733108520508, "global_step": 112141, "epoch": 926} {"train_loss": -35.3785514831543, "global_step": 112142, "epoch": 926} {"train_loss": -35.2122802734375, "global_step": 112143, "epoch": 926} {"train_loss": -35.775447845458984, "global_step": 112144, "epoch": 926} {"train_loss": -34.94887161254883, "global_step": 112145, "epoch": 926} {"train_loss": -35.58456039428711, "global_step": 112146, "epoch": 926} {"train_loss": -35.185909271240234, "global_step": 112147, "epoch": 926} {"train_loss": -35.1259880065918, "global_step": 112148, "epoch": 926} {"train_loss": -35.687355041503906, "global_step": 112149, "epoch": 926} {"train_loss": -35.3107795715332, "global_step": 112150, "epoch": 926} {"train_loss": -35.371578216552734, "global_step": 112151, "epoch": 926} {"train_loss": -35.665016174316406, "global_step": 112152, "epoch": 926} {"train_loss": -35.48256301879883, "global_step": 112153, "epoch": 926} {"train_loss": -35.61873245239258, "global_step": 112154, "epoch": 926} {"train_loss": -35.439762115478516, "global_step": 112155, "epoch": 926} {"train_loss": -36.0626335144043, "global_step": 112156, "epoch": 926} {"train_loss": -35.904449462890625, "global_step": 112157, "epoch": 926} {"train_loss": -35.69967269897461, "global_step": 112158, "epoch": 926} {"train_loss": -35.905433654785156, "global_step": 112159, "epoch": 926} {"train_loss": -36.082061767578125, "global_step": 112160, "epoch": 926} {"train_loss": -35.920623779296875, "global_step": 112161, "epoch": 926} {"train_loss": -35.78512191772461, "global_step": 112162, "epoch": 926} {"train_loss": -36.12288284301758, "global_step": 112163, "epoch": 926} {"train_loss": -36.34748458862305, "global_step": 112164, "epoch": 926} {"train_loss": -36.36896896362305, "global_step": 112165, "epoch": 926} {"train_loss": -32.27554805219666, "global_step": 112166, "epoch": 926, "val_loss": 2561958.0} {"train_loss": -36.202449798583984, "global_step": 112167, "epoch": 927} {"train_loss": -36.44721221923828, "global_step": 112168, "epoch": 927} {"train_loss": -35.7938117980957, "global_step": 112169, "epoch": 927} {"train_loss": -36.716041564941406, "global_step": 112170, "epoch": 927} {"train_loss": -36.59992218017578, "global_step": 112171, "epoch": 927} {"train_loss": -36.59359359741211, "global_step": 112172, "epoch": 927} {"train_loss": -36.389705657958984, "global_step": 112173, "epoch": 927} {"train_loss": -36.28700637817383, "global_step": 112174, "epoch": 927} {"train_loss": -36.82213592529297, "global_step": 112175, "epoch": 927} {"train_loss": -36.507991790771484, "global_step": 112176, "epoch": 927} {"train_loss": -36.68740463256836, "global_step": 112177, "epoch": 927} {"train_loss": -36.58636474609375, "global_step": 112178, "epoch": 927} {"train_loss": -37.27268600463867, "global_step": 112179, "epoch": 927} {"train_loss": -37.04114532470703, "global_step": 112180, "epoch": 927} {"train_loss": -37.149452209472656, "global_step": 112181, "epoch": 927} {"train_loss": -36.891510009765625, "global_step": 112182, "epoch": 927} {"train_loss": -36.83705520629883, "global_step": 112183, "epoch": 927} {"train_loss": -36.76911544799805, "global_step": 112184, "epoch": 927} {"train_loss": -36.74726486206055, "global_step": 112185, "epoch": 927} {"train_loss": -36.88798904418945, "global_step": 112186, "epoch": 927} {"train_loss": -36.769779205322266, "global_step": 112187, "epoch": 927} {"train_loss": -37.0329475402832, "global_step": 112188, "epoch": 927} {"train_loss": -36.96076583862305, "global_step": 112189, "epoch": 927} {"train_loss": -37.15555191040039, "global_step": 112190, "epoch": 927} {"train_loss": -37.68624496459961, "global_step": 112191, "epoch": 927} {"train_loss": -37.07183837890625, "global_step": 112192, "epoch": 927} {"train_loss": -36.97597122192383, "global_step": 112193, "epoch": 927} {"train_loss": -37.16389083862305, "global_step": 112194, "epoch": 927} {"train_loss": -37.36147689819336, "global_step": 112195, "epoch": 927} {"train_loss": -37.25001907348633, "global_step": 112196, "epoch": 927} {"train_loss": -37.56718826293945, "global_step": 112197, "epoch": 927} {"train_loss": -37.30976867675781, "global_step": 112198, "epoch": 927} {"train_loss": -37.60310745239258, "global_step": 112199, "epoch": 927} {"train_loss": -37.58839416503906, "global_step": 112200, "epoch": 927} {"train_loss": -38.05247116088867, "global_step": 112201, "epoch": 927} {"train_loss": -37.38959884643555, "global_step": 112202, "epoch": 927} {"train_loss": -37.634483337402344, "global_step": 112203, "epoch": 927} {"train_loss": -37.510250091552734, "global_step": 112204, "epoch": 927} {"train_loss": -37.506385803222656, "global_step": 112205, "epoch": 927} {"train_loss": -37.48393249511719, "global_step": 112206, "epoch": 927} {"train_loss": -37.372005462646484, "global_step": 112207, "epoch": 927} {"train_loss": -37.696136474609375, "global_step": 112208, "epoch": 927} {"train_loss": -37.86262130737305, "global_step": 112209, "epoch": 927} {"train_loss": -38.39848709106445, "global_step": 112210, "epoch": 927} {"train_loss": -37.594234466552734, "global_step": 112211, "epoch": 927} {"train_loss": -37.692535400390625, "global_step": 112212, "epoch": 927} {"train_loss": -37.428802490234375, "global_step": 112213, "epoch": 927} {"train_loss": -37.54022216796875, "global_step": 112214, "epoch": 927} {"train_loss": -37.736602783203125, "global_step": 112215, "epoch": 927} {"train_loss": -36.85732650756836, "global_step": 112216, "epoch": 927} {"train_loss": -38.11659622192383, "global_step": 112217, "epoch": 927} {"train_loss": -38.014434814453125, "global_step": 112218, "epoch": 927} {"train_loss": -37.78342819213867, "global_step": 112219, "epoch": 927} {"train_loss": -37.8085823059082, "global_step": 112220, "epoch": 927} {"train_loss": -37.83846664428711, "global_step": 112221, "epoch": 927} {"train_loss": -37.97396469116211, "global_step": 112222, "epoch": 927} {"train_loss": -37.968563079833984, "global_step": 112223, "epoch": 927} {"train_loss": -37.79262924194336, "global_step": 112224, "epoch": 927} {"train_loss": -37.799495697021484, "global_step": 112225, "epoch": 927} {"train_loss": -38.41170883178711, "global_step": 112226, "epoch": 927} {"train_loss": -38.512813568115234, "global_step": 112227, "epoch": 927} {"train_loss": -37.94593048095703, "global_step": 112228, "epoch": 927} {"train_loss": -37.8758430480957, "global_step": 112229, "epoch": 927} {"train_loss": -37.83840560913086, "global_step": 112230, "epoch": 927} {"train_loss": -38.39242172241211, "global_step": 112231, "epoch": 927} {"train_loss": -38.36727523803711, "global_step": 112232, "epoch": 927} {"train_loss": -38.13998794555664, "global_step": 112233, "epoch": 927} {"train_loss": -38.16863250732422, "global_step": 112234, "epoch": 927} {"train_loss": -38.573463439941406, "global_step": 112235, "epoch": 927} {"train_loss": -38.42545700073242, "global_step": 112236, "epoch": 927} {"train_loss": -38.18982696533203, "global_step": 112237, "epoch": 927} {"train_loss": -38.52027130126953, "global_step": 112238, "epoch": 927} {"train_loss": -37.858795166015625, "global_step": 112239, "epoch": 927} {"train_loss": -38.47751998901367, "global_step": 112240, "epoch": 927} {"train_loss": -38.583168029785156, "global_step": 112241, "epoch": 927} {"train_loss": -38.57670211791992, "global_step": 112242, "epoch": 927} {"train_loss": -38.30841064453125, "global_step": 112243, "epoch": 927} {"train_loss": -38.87091064453125, "global_step": 112244, "epoch": 927} {"train_loss": -38.60517120361328, "global_step": 112245, "epoch": 927} {"train_loss": -38.73007583618164, "global_step": 112246, "epoch": 927} {"train_loss": -38.54240036010742, "global_step": 112247, "epoch": 927} {"train_loss": -38.19254684448242, "global_step": 112248, "epoch": 927} {"train_loss": -38.627410888671875, "global_step": 112249, "epoch": 927} {"train_loss": -38.9922981262207, "global_step": 112250, "epoch": 927} {"train_loss": -37.97907638549805, "global_step": 112251, "epoch": 927} {"train_loss": -38.69808578491211, "global_step": 112252, "epoch": 927} {"train_loss": -38.431705474853516, "global_step": 112253, "epoch": 927} {"train_loss": -38.58966064453125, "global_step": 112254, "epoch": 927} {"train_loss": -38.411163330078125, "global_step": 112255, "epoch": 927} {"train_loss": -37.911712646484375, "global_step": 112256, "epoch": 927} {"train_loss": -38.24464416503906, "global_step": 112257, "epoch": 927} {"train_loss": -38.47849655151367, "global_step": 112258, "epoch": 927} {"train_loss": -37.979408264160156, "global_step": 112259, "epoch": 927} {"train_loss": -38.48562240600586, "global_step": 112260, "epoch": 927} {"train_loss": -38.776424407958984, "global_step": 112261, "epoch": 927} {"train_loss": -38.45825958251953, "global_step": 112262, "epoch": 927} {"train_loss": -38.578453063964844, "global_step": 112263, "epoch": 927} {"train_loss": -38.1712760925293, "global_step": 112264, "epoch": 927} {"train_loss": -36.48702621459961, "global_step": 112265, "epoch": 927} {"train_loss": -32.629032135009766, "global_step": 112266, "epoch": 927} {"train_loss": -23.6574764251709, "global_step": 112267, "epoch": 927} {"train_loss": -26.818191528320312, "global_step": 112268, "epoch": 927} {"train_loss": -31.491809844970703, "global_step": 112269, "epoch": 927} {"train_loss": -29.70318031311035, "global_step": 112270, "epoch": 927} {"train_loss": -28.723896026611328, "global_step": 112271, "epoch": 927} {"train_loss": -28.263904571533203, "global_step": 112272, "epoch": 927} {"train_loss": -29.479248046875, "global_step": 112273, "epoch": 927} {"train_loss": -28.855615615844727, "global_step": 112274, "epoch": 927} {"train_loss": -28.712976455688477, "global_step": 112275, "epoch": 927} {"train_loss": -30.707006454467773, "global_step": 112276, "epoch": 927} {"train_loss": -31.56756019592285, "global_step": 112277, "epoch": 927} {"train_loss": -31.443695068359375, "global_step": 112278, "epoch": 927} {"train_loss": -30.392547607421875, "global_step": 112279, "epoch": 927} {"train_loss": -31.510366439819336, "global_step": 112280, "epoch": 927} {"train_loss": -31.401426315307617, "global_step": 112281, "epoch": 927} {"train_loss": -32.070011138916016, "global_step": 112282, "epoch": 927} {"train_loss": -32.588844299316406, "global_step": 112283, "epoch": 927} {"train_loss": -32.5526123046875, "global_step": 112284, "epoch": 927} {"train_loss": -32.84406280517578, "global_step": 112285, "epoch": 927} {"train_loss": -32.736141204833984, "global_step": 112286, "epoch": 927} {"train_loss": -36.37587722273898, "global_step": 112287, "epoch": 927, "val_loss": 2650565.75} {"train_loss": -32.692928314208984, "global_step": 112288, "epoch": 928} {"train_loss": -33.248924255371094, "global_step": 112289, "epoch": 928} {"train_loss": -33.85920333862305, "global_step": 112290, "epoch": 928} {"train_loss": -33.64451217651367, "global_step": 112291, "epoch": 928} {"train_loss": -32.83720779418945, "global_step": 112292, "epoch": 928} {"train_loss": -33.07904815673828, "global_step": 112293, "epoch": 928} {"train_loss": -33.299434661865234, "global_step": 112294, "epoch": 928} {"train_loss": -33.20985794067383, "global_step": 112295, "epoch": 928} {"train_loss": -33.81161117553711, "global_step": 112296, "epoch": 928} {"train_loss": -34.45582962036133, "global_step": 112297, "epoch": 928} {"train_loss": -33.84799575805664, "global_step": 112298, "epoch": 928} {"train_loss": -34.04349899291992, "global_step": 112299, "epoch": 928} {"train_loss": -34.0216178894043, "global_step": 112300, "epoch": 928} {"train_loss": -34.99907684326172, "global_step": 112301, "epoch": 928} {"train_loss": -33.9918098449707, "global_step": 112302, "epoch": 928} {"train_loss": -34.512020111083984, "global_step": 112303, "epoch": 928} {"train_loss": -34.449092864990234, "global_step": 112304, "epoch": 928} {"train_loss": -34.63051986694336, "global_step": 112305, "epoch": 928} {"train_loss": -34.770259857177734, "global_step": 112306, "epoch": 928} {"train_loss": -34.8579216003418, "global_step": 112307, "epoch": 928} {"train_loss": -34.73027420043945, "global_step": 112308, "epoch": 928} {"train_loss": -35.33192825317383, "global_step": 112309, "epoch": 928} {"train_loss": -34.6523323059082, "global_step": 112310, "epoch": 928} {"train_loss": -34.559871673583984, "global_step": 112311, "epoch": 928} {"train_loss": -34.697242736816406, "global_step": 112312, "epoch": 928} {"train_loss": -34.80644607543945, "global_step": 112313, "epoch": 928} {"train_loss": -35.60065841674805, "global_step": 112314, "epoch": 928} {"train_loss": -34.95044708251953, "global_step": 112315, "epoch": 928} {"train_loss": -35.53028106689453, "global_step": 112316, "epoch": 928} {"train_loss": -35.23928451538086, "global_step": 112317, "epoch": 928} {"train_loss": -35.34892654418945, "global_step": 112318, "epoch": 928} {"train_loss": -35.995052337646484, "global_step": 112319, "epoch": 928} {"train_loss": -35.33029556274414, "global_step": 112320, "epoch": 928} {"train_loss": -35.06284713745117, "global_step": 112321, "epoch": 928} {"train_loss": -35.169647216796875, "global_step": 112322, "epoch": 928} {"train_loss": -34.027313232421875, "global_step": 112323, "epoch": 928} {"train_loss": -33.76726150512695, "global_step": 112324, "epoch": 928} {"train_loss": -35.26221466064453, "global_step": 112325, "epoch": 928} {"train_loss": -35.64563751220703, "global_step": 112326, "epoch": 928} {"train_loss": -32.46151351928711, "global_step": 112327, "epoch": 928} {"train_loss": -30.078771591186523, "global_step": 112328, "epoch": 928} {"train_loss": -34.4078254699707, "global_step": 112329, "epoch": 928} {"train_loss": -35.236846923828125, "global_step": 112330, "epoch": 928} {"train_loss": -33.28264617919922, "global_step": 112331, "epoch": 928} {"train_loss": -35.79307174682617, "global_step": 112332, "epoch": 928} {"train_loss": -34.36383819580078, "global_step": 112333, "epoch": 928} {"train_loss": -35.500885009765625, "global_step": 112334, "epoch": 928} {"train_loss": -35.626338958740234, "global_step": 112335, "epoch": 928} {"train_loss": -36.209205627441406, "global_step": 112336, "epoch": 928} {"train_loss": -35.785343170166016, "global_step": 112337, "epoch": 928} {"train_loss": -36.49534225463867, "global_step": 112338, "epoch": 928} {"train_loss": -36.08006286621094, "global_step": 112339, "epoch": 928} {"train_loss": -36.09355926513672, "global_step": 112340, "epoch": 928} {"train_loss": -36.160823822021484, "global_step": 112341, "epoch": 928} {"train_loss": -36.48274612426758, "global_step": 112342, "epoch": 928} {"train_loss": -36.77521896362305, "global_step": 112343, "epoch": 928} {"train_loss": -36.24833297729492, "global_step": 112344, "epoch": 928} {"train_loss": -37.113826751708984, "global_step": 112345, "epoch": 928} {"train_loss": -36.250362396240234, "global_step": 112346, "epoch": 928} {"train_loss": -36.64431381225586, "global_step": 112347, "epoch": 928} {"train_loss": -35.82271957397461, "global_step": 112348, "epoch": 928} {"train_loss": -36.6308479309082, "global_step": 112349, "epoch": 928} {"train_loss": -36.46306228637695, "global_step": 112350, "epoch": 928} {"train_loss": -37.05864334106445, "global_step": 112351, "epoch": 928} {"train_loss": -37.0350341796875, "global_step": 112352, "epoch": 928} {"train_loss": -36.711830139160156, "global_step": 112353, "epoch": 928} {"train_loss": -36.189701080322266, "global_step": 112354, "epoch": 928} {"train_loss": -36.402381896972656, "global_step": 112355, "epoch": 928} {"train_loss": -37.25075912475586, "global_step": 112356, "epoch": 928} {"train_loss": -36.72172164916992, "global_step": 112357, "epoch": 928} {"train_loss": -37.07893753051758, "global_step": 112358, "epoch": 928} {"train_loss": -36.95302200317383, "global_step": 112359, "epoch": 928} {"train_loss": -36.91936111450195, "global_step": 112360, "epoch": 928} {"train_loss": -36.94137191772461, "global_step": 112361, "epoch": 928} {"train_loss": -36.832672119140625, "global_step": 112362, "epoch": 928} {"train_loss": -37.329410552978516, "global_step": 112363, "epoch": 928} {"train_loss": -37.11273956298828, "global_step": 112364, "epoch": 928} {"train_loss": -37.13163375854492, "global_step": 112365, "epoch": 928} {"train_loss": -36.84663009643555, "global_step": 112366, "epoch": 928} {"train_loss": -36.819766998291016, "global_step": 112367, "epoch": 928} {"train_loss": -37.40408706665039, "global_step": 112368, "epoch": 928} {"train_loss": -36.791439056396484, "global_step": 112369, "epoch": 928} {"train_loss": -37.7808723449707, "global_step": 112370, "epoch": 928} {"train_loss": -37.12295150756836, "global_step": 112371, "epoch": 928} {"train_loss": -37.335723876953125, "global_step": 112372, "epoch": 928} {"train_loss": -36.91820526123047, "global_step": 112373, "epoch": 928} {"train_loss": -36.652992248535156, "global_step": 112374, "epoch": 928} {"train_loss": -37.30018615722656, "global_step": 112375, "epoch": 928} {"train_loss": -36.52849197387695, "global_step": 112376, "epoch": 928} {"train_loss": -37.201873779296875, "global_step": 112377, "epoch": 928} {"train_loss": -38.07576370239258, "global_step": 112378, "epoch": 928} {"train_loss": -37.13682174682617, "global_step": 112379, "epoch": 928} {"train_loss": -37.91189193725586, "global_step": 112380, "epoch": 928} {"train_loss": -37.60578155517578, "global_step": 112381, "epoch": 928} {"train_loss": -36.83498764038086, "global_step": 112382, "epoch": 928} {"train_loss": -37.452850341796875, "global_step": 112383, "epoch": 928} {"train_loss": -36.99433517456055, "global_step": 112384, "epoch": 928} {"train_loss": -37.125362396240234, "global_step": 112385, "epoch": 928} {"train_loss": -37.02057647705078, "global_step": 112386, "epoch": 928} {"train_loss": -37.20876693725586, "global_step": 112387, "epoch": 928} {"train_loss": -37.4445915222168, "global_step": 112388, "epoch": 928} {"train_loss": -37.541236877441406, "global_step": 112389, "epoch": 928} {"train_loss": -37.715431213378906, "global_step": 112390, "epoch": 928} {"train_loss": -37.476806640625, "global_step": 112391, "epoch": 928} {"train_loss": -37.978946685791016, "global_step": 112392, "epoch": 928} {"train_loss": -37.265830993652344, "global_step": 112393, "epoch": 928} {"train_loss": -37.56111526489258, "global_step": 112394, "epoch": 928} {"train_loss": -37.086578369140625, "global_step": 112395, "epoch": 928} {"train_loss": -37.13151931762695, "global_step": 112396, "epoch": 928} {"train_loss": -37.6589469909668, "global_step": 112397, "epoch": 928} {"train_loss": -37.33380889892578, "global_step": 112398, "epoch": 928} {"train_loss": -37.241844177246094, "global_step": 112399, "epoch": 928} {"train_loss": -36.62438201904297, "global_step": 112400, "epoch": 928} {"train_loss": -36.921051025390625, "global_step": 112401, "epoch": 928} {"train_loss": -37.59878158569336, "global_step": 112402, "epoch": 928} {"train_loss": -36.26896667480469, "global_step": 112403, "epoch": 928} {"train_loss": -37.107418060302734, "global_step": 112404, "epoch": 928} {"train_loss": -37.055458068847656, "global_step": 112405, "epoch": 928} {"train_loss": -36.96273422241211, "global_step": 112406, "epoch": 928} {"train_loss": -37.9577522277832, "global_step": 112407, "epoch": 928} {"train_loss": -35.95173574085078, "global_step": 112408, "epoch": 928, "val_loss": 2594604.75} {"train_loss": -37.34682083129883, "global_step": 112409, "epoch": 929} {"train_loss": -35.15535354614258, "global_step": 112410, "epoch": 929} {"train_loss": -33.556785583496094, "global_step": 112411, "epoch": 929} {"train_loss": -35.960147857666016, "global_step": 112412, "epoch": 929} {"train_loss": -36.31401443481445, "global_step": 112413, "epoch": 929} {"train_loss": -30.625995635986328, "global_step": 112414, "epoch": 929} {"train_loss": -35.57217788696289, "global_step": 112415, "epoch": 929} {"train_loss": -34.366024017333984, "global_step": 112416, "epoch": 929} {"train_loss": -30.539325714111328, "global_step": 112417, "epoch": 929} {"train_loss": -36.8855094909668, "global_step": 112418, "epoch": 929} {"train_loss": -33.95294952392578, "global_step": 112419, "epoch": 929} {"train_loss": -35.22646713256836, "global_step": 112420, "epoch": 929} {"train_loss": -35.77822494506836, "global_step": 112421, "epoch": 929} {"train_loss": -34.085872650146484, "global_step": 112422, "epoch": 929} {"train_loss": -36.72358322143555, "global_step": 112423, "epoch": 929} {"train_loss": -34.07474136352539, "global_step": 112424, "epoch": 929} {"train_loss": -33.60715103149414, "global_step": 112425, "epoch": 929} {"train_loss": -34.91484451293945, "global_step": 112426, "epoch": 929} {"train_loss": -34.29894256591797, "global_step": 112427, "epoch": 929} {"train_loss": -36.47211837768555, "global_step": 112428, "epoch": 929} {"train_loss": -35.651790618896484, "global_step": 112429, "epoch": 929} {"train_loss": -34.84931564331055, "global_step": 112430, "epoch": 929} {"train_loss": -36.83064270019531, "global_step": 112431, "epoch": 929} {"train_loss": -35.59196090698242, "global_step": 112432, "epoch": 929} {"train_loss": -36.88409423828125, "global_step": 112433, "epoch": 929} {"train_loss": -36.801387786865234, "global_step": 112434, "epoch": 929} {"train_loss": -36.56232833862305, "global_step": 112435, "epoch": 929} {"train_loss": -37.19758224487305, "global_step": 112436, "epoch": 929} {"train_loss": -35.90993881225586, "global_step": 112437, "epoch": 929} {"train_loss": -36.63709259033203, "global_step": 112438, "epoch": 929} {"train_loss": -37.04233932495117, "global_step": 112439, "epoch": 929} {"train_loss": -36.444252014160156, "global_step": 112440, "epoch": 929} {"train_loss": -37.67381286621094, "global_step": 112441, "epoch": 929} {"train_loss": -35.99109649658203, "global_step": 112442, "epoch": 929} {"train_loss": -36.55573654174805, "global_step": 112443, "epoch": 929} {"train_loss": -36.580482482910156, "global_step": 112444, "epoch": 929} {"train_loss": -37.108402252197266, "global_step": 112445, "epoch": 929} {"train_loss": -36.30839920043945, "global_step": 112446, "epoch": 929} {"train_loss": -37.7845573425293, "global_step": 112447, "epoch": 929} {"train_loss": -37.626251220703125, "global_step": 112448, "epoch": 929} {"train_loss": -37.272586822509766, "global_step": 112449, "epoch": 929} {"train_loss": -37.53913116455078, "global_step": 112450, "epoch": 929} {"train_loss": -36.693912506103516, "global_step": 112451, "epoch": 929} {"train_loss": -37.93864059448242, "global_step": 112452, "epoch": 929} {"train_loss": -37.267486572265625, "global_step": 112453, "epoch": 929} {"train_loss": -37.43709945678711, "global_step": 112454, "epoch": 929} {"train_loss": -37.43034362792969, "global_step": 112455, "epoch": 929} {"train_loss": -36.63013458251953, "global_step": 112456, "epoch": 929} {"train_loss": -37.85213088989258, "global_step": 112457, "epoch": 929} {"train_loss": -37.46040725708008, "global_step": 112458, "epoch": 929} {"train_loss": -37.436187744140625, "global_step": 112459, "epoch": 929} {"train_loss": -36.5123291015625, "global_step": 112460, "epoch": 929} {"train_loss": -37.753692626953125, "global_step": 112461, "epoch": 929} {"train_loss": -37.12549591064453, "global_step": 112462, "epoch": 929} {"train_loss": -36.81203842163086, "global_step": 112463, "epoch": 929} {"train_loss": -37.0275764465332, "global_step": 112464, "epoch": 929} {"train_loss": -36.24899673461914, "global_step": 112465, "epoch": 929} {"train_loss": -38.26804733276367, "global_step": 112466, "epoch": 929} {"train_loss": -37.634613037109375, "global_step": 112467, "epoch": 929} {"train_loss": -34.9072151184082, "global_step": 112468, "epoch": 929} {"train_loss": -38.12378692626953, "global_step": 112469, "epoch": 929} {"train_loss": -37.48851776123047, "global_step": 112470, "epoch": 929} {"train_loss": -37.953060150146484, "global_step": 112471, "epoch": 929} {"train_loss": -37.944000244140625, "global_step": 112472, "epoch": 929} {"train_loss": -35.48960494995117, "global_step": 112473, "epoch": 929} {"train_loss": -38.088623046875, "global_step": 112474, "epoch": 929} {"train_loss": -36.6693229675293, "global_step": 112475, "epoch": 929} {"train_loss": -37.963802337646484, "global_step": 112476, "epoch": 929} {"train_loss": -37.96160888671875, "global_step": 112477, "epoch": 929} {"train_loss": -38.0716438293457, "global_step": 112478, "epoch": 929} {"train_loss": -37.72334289550781, "global_step": 112479, "epoch": 929} {"train_loss": -37.213111877441406, "global_step": 112480, "epoch": 929} {"train_loss": -37.67261505126953, "global_step": 112481, "epoch": 929} {"train_loss": -35.26560592651367, "global_step": 112482, "epoch": 929} {"train_loss": -37.93136215209961, "global_step": 112483, "epoch": 929} {"train_loss": -38.34452438354492, "global_step": 112484, "epoch": 929} {"train_loss": -38.08899688720703, "global_step": 112485, "epoch": 929} {"train_loss": -37.780845642089844, "global_step": 112486, "epoch": 929} {"train_loss": -36.90717697143555, "global_step": 112487, "epoch": 929} {"train_loss": -38.34364700317383, "global_step": 112488, "epoch": 929} {"train_loss": -37.995361328125, "global_step": 112489, "epoch": 929} {"train_loss": -35.96470642089844, "global_step": 112490, "epoch": 929} {"train_loss": -36.78978729248047, "global_step": 112491, "epoch": 929} {"train_loss": -37.784751892089844, "global_step": 112492, "epoch": 929} {"train_loss": -37.710079193115234, "global_step": 112493, "epoch": 929} {"train_loss": -36.33186721801758, "global_step": 112494, "epoch": 929} {"train_loss": -37.2606315612793, "global_step": 112495, "epoch": 929} {"train_loss": -36.63294219970703, "global_step": 112496, "epoch": 929} {"train_loss": -37.94517135620117, "global_step": 112497, "epoch": 929} {"train_loss": -37.23702621459961, "global_step": 112498, "epoch": 929} {"train_loss": -37.51198959350586, "global_step": 112499, "epoch": 929} {"train_loss": -37.6604118347168, "global_step": 112500, "epoch": 929} {"train_loss": -38.322509765625, "global_step": 112501, "epoch": 929} {"train_loss": -38.10083770751953, "global_step": 112502, "epoch": 929} {"train_loss": -38.12672805786133, "global_step": 112503, "epoch": 929} {"train_loss": -38.66244888305664, "global_step": 112504, "epoch": 929} {"train_loss": -37.088035583496094, "global_step": 112505, "epoch": 929} {"train_loss": -38.2784309387207, "global_step": 112506, "epoch": 929} {"train_loss": -37.875404357910156, "global_step": 112507, "epoch": 929} {"train_loss": -38.28578567504883, "global_step": 112508, "epoch": 929} {"train_loss": -37.9870491027832, "global_step": 112509, "epoch": 929} {"train_loss": -38.2130126953125, "global_step": 112510, "epoch": 929} {"train_loss": -36.11054611206055, "global_step": 112511, "epoch": 929} {"train_loss": -33.24807357788086, "global_step": 112512, "epoch": 929} {"train_loss": -15.06145191192627, "global_step": 112513, "epoch": 929} {"train_loss": -5.284186840057373, "global_step": 112514, "epoch": 929} {"train_loss": -33.09747314453125, "global_step": 112515, "epoch": 929} {"train_loss": -28.412982940673828, "global_step": 112516, "epoch": 929} {"train_loss": -31.43605613708496, "global_step": 112517, "epoch": 929} {"train_loss": -34.51436996459961, "global_step": 112518, "epoch": 929} {"train_loss": -34.49369812011719, "global_step": 112519, "epoch": 929} {"train_loss": -34.01499557495117, "global_step": 112520, "epoch": 929} {"train_loss": -36.09774398803711, "global_step": 112521, "epoch": 929} {"train_loss": -33.694007873535156, "global_step": 112522, "epoch": 929} {"train_loss": -36.94939041137695, "global_step": 112523, "epoch": 929} {"train_loss": -34.272857666015625, "global_step": 112524, "epoch": 929} {"train_loss": -32.707115173339844, "global_step": 112525, "epoch": 929} {"train_loss": -36.66055679321289, "global_step": 112526, "epoch": 929} {"train_loss": -36.199676513671875, "global_step": 112527, "epoch": 929} {"train_loss": -36.82133483886719, "global_step": 112528, "epoch": 929} {"train_loss": -35.99491483909039, "global_step": 112529, "epoch": 929, "val_loss": 2638916.0} {"train_loss": -36.078399658203125, "global_step": 112530, "epoch": 930} {"train_loss": -36.57474899291992, "global_step": 112531, "epoch": 930} {"train_loss": -36.57134246826172, "global_step": 112532, "epoch": 930} {"train_loss": -35.4763069152832, "global_step": 112533, "epoch": 930} {"train_loss": -36.84476852416992, "global_step": 112534, "epoch": 930} {"train_loss": -36.625701904296875, "global_step": 112535, "epoch": 930} {"train_loss": -36.98947525024414, "global_step": 112536, "epoch": 930} {"train_loss": -37.18740463256836, "global_step": 112537, "epoch": 930} {"train_loss": -36.030696868896484, "global_step": 112538, "epoch": 930} {"train_loss": -37.59761428833008, "global_step": 112539, "epoch": 930} {"train_loss": -37.49796676635742, "global_step": 112540, "epoch": 930} {"train_loss": -37.11809158325195, "global_step": 112541, "epoch": 930} {"train_loss": -37.1926383972168, "global_step": 112542, "epoch": 930} {"train_loss": -37.64181137084961, "global_step": 112543, "epoch": 930} {"train_loss": -37.802490234375, "global_step": 112544, "epoch": 930} {"train_loss": -37.740516662597656, "global_step": 112545, "epoch": 930} {"train_loss": -37.5301628112793, "global_step": 112546, "epoch": 930} {"train_loss": -37.79883575439453, "global_step": 112547, "epoch": 930} {"train_loss": -37.645416259765625, "global_step": 112548, "epoch": 930} {"train_loss": -37.67164993286133, "global_step": 112549, "epoch": 930} {"train_loss": -37.79387283325195, "global_step": 112550, "epoch": 930} {"train_loss": -37.14278030395508, "global_step": 112551, "epoch": 930} {"train_loss": -37.53750991821289, "global_step": 112552, "epoch": 930} {"train_loss": -37.6218376159668, "global_step": 112553, "epoch": 930} {"train_loss": -37.33850860595703, "global_step": 112554, "epoch": 930} {"train_loss": -38.09747314453125, "global_step": 112555, "epoch": 930} {"train_loss": -36.61170196533203, "global_step": 112556, "epoch": 930} {"train_loss": -37.52587890625, "global_step": 112557, "epoch": 930} {"train_loss": -37.25294876098633, "global_step": 112558, "epoch": 930} {"train_loss": -37.72079849243164, "global_step": 112559, "epoch": 930} {"train_loss": -33.25442123413086, "global_step": 112560, "epoch": 930} {"train_loss": -38.21897888183594, "global_step": 112561, "epoch": 930} {"train_loss": -37.99465560913086, "global_step": 112562, "epoch": 930} {"train_loss": -37.45599365234375, "global_step": 112563, "epoch": 930} {"train_loss": -38.33710861206055, "global_step": 112564, "epoch": 930} {"train_loss": -37.186702728271484, "global_step": 112565, "epoch": 930} {"train_loss": -37.35273742675781, "global_step": 112566, "epoch": 930} {"train_loss": -35.769142150878906, "global_step": 112567, "epoch": 930} {"train_loss": -37.520137786865234, "global_step": 112568, "epoch": 930} {"train_loss": -37.530799865722656, "global_step": 112569, "epoch": 930} {"train_loss": -36.828277587890625, "global_step": 112570, "epoch": 930} {"train_loss": -37.68434524536133, "global_step": 112571, "epoch": 930} {"train_loss": -36.91121292114258, "global_step": 112572, "epoch": 930} {"train_loss": -37.604591369628906, "global_step": 112573, "epoch": 930} {"train_loss": -37.45571517944336, "global_step": 112574, "epoch": 930} {"train_loss": -37.521018981933594, "global_step": 112575, "epoch": 930} {"train_loss": -35.76617431640625, "global_step": 112576, "epoch": 930} {"train_loss": -37.386531829833984, "global_step": 112577, "epoch": 930} {"train_loss": -37.49778366088867, "global_step": 112578, "epoch": 930} {"train_loss": -38.19501876831055, "global_step": 112579, "epoch": 930} {"train_loss": -37.104461669921875, "global_step": 112580, "epoch": 930} {"train_loss": -37.70591735839844, "global_step": 112581, "epoch": 930} {"train_loss": -38.001888275146484, "global_step": 112582, "epoch": 930} {"train_loss": -38.58393478393555, "global_step": 112583, "epoch": 930} {"train_loss": -37.29941177368164, "global_step": 112584, "epoch": 930} {"train_loss": -36.717735290527344, "global_step": 112585, "epoch": 930} {"train_loss": -37.79647445678711, "global_step": 112586, "epoch": 930} {"train_loss": -37.37137985229492, "global_step": 112587, "epoch": 930} {"train_loss": -37.886016845703125, "global_step": 112588, "epoch": 930} {"train_loss": -38.32766342163086, "global_step": 112589, "epoch": 930} {"train_loss": -34.64408493041992, "global_step": 112590, "epoch": 930} {"train_loss": -37.84542465209961, "global_step": 112591, "epoch": 930} {"train_loss": -35.49697494506836, "global_step": 112592, "epoch": 930} {"train_loss": -37.163265228271484, "global_step": 112593, "epoch": 930} {"train_loss": -35.08344268798828, "global_step": 112594, "epoch": 930} {"train_loss": -37.60012435913086, "global_step": 112595, "epoch": 930} {"train_loss": -36.54541015625, "global_step": 112596, "epoch": 930} {"train_loss": -37.97800064086914, "global_step": 112597, "epoch": 930} {"train_loss": -37.47092056274414, "global_step": 112598, "epoch": 930} {"train_loss": -37.56513595581055, "global_step": 112599, "epoch": 930} {"train_loss": -37.690677642822266, "global_step": 112600, "epoch": 930} {"train_loss": -37.873046875, "global_step": 112601, "epoch": 930} {"train_loss": -36.96583557128906, "global_step": 112602, "epoch": 930} {"train_loss": -37.90766143798828, "global_step": 112603, "epoch": 930} {"train_loss": -37.14748764038086, "global_step": 112604, "epoch": 930} {"train_loss": -37.4879035949707, "global_step": 112605, "epoch": 930} {"train_loss": -37.08400344848633, "global_step": 112606, "epoch": 930} {"train_loss": -38.284339904785156, "global_step": 112607, "epoch": 930} {"train_loss": -37.647525787353516, "global_step": 112608, "epoch": 930} {"train_loss": -38.11288070678711, "global_step": 112609, "epoch": 930} {"train_loss": -38.0573844909668, "global_step": 112610, "epoch": 930} {"train_loss": -37.248538970947266, "global_step": 112611, "epoch": 930} {"train_loss": -37.35988998413086, "global_step": 112612, "epoch": 930} {"train_loss": -37.101749420166016, "global_step": 112613, "epoch": 930} {"train_loss": -35.923370361328125, "global_step": 112614, "epoch": 930} {"train_loss": -37.8570442199707, "global_step": 112615, "epoch": 930} {"train_loss": -36.33442687988281, "global_step": 112616, "epoch": 930} {"train_loss": -37.750362396240234, "global_step": 112617, "epoch": 930} {"train_loss": -38.02962112426758, "global_step": 112618, "epoch": 930} {"train_loss": -37.13039779663086, "global_step": 112619, "epoch": 930} {"train_loss": -38.17491149902344, "global_step": 112620, "epoch": 930} {"train_loss": -38.320560455322266, "global_step": 112621, "epoch": 930} {"train_loss": -38.336212158203125, "global_step": 112622, "epoch": 930} {"train_loss": -37.824378967285156, "global_step": 112623, "epoch": 930} {"train_loss": -37.70289993286133, "global_step": 112624, "epoch": 930} {"train_loss": -38.573509216308594, "global_step": 112625, "epoch": 930} {"train_loss": -38.148475646972656, "global_step": 112626, "epoch": 930} {"train_loss": -37.94768142700195, "global_step": 112627, "epoch": 930} {"train_loss": -38.532310485839844, "global_step": 112628, "epoch": 930} {"train_loss": -38.459712982177734, "global_step": 112629, "epoch": 930} {"train_loss": -38.389442443847656, "global_step": 112630, "epoch": 930} {"train_loss": -38.275001525878906, "global_step": 112631, "epoch": 930} {"train_loss": -38.70875549316406, "global_step": 112632, "epoch": 930} {"train_loss": -37.99055480957031, "global_step": 112633, "epoch": 930} {"train_loss": -36.960262298583984, "global_step": 112634, "epoch": 930} {"train_loss": -38.4082145690918, "global_step": 112635, "epoch": 930} {"train_loss": -38.68386459350586, "global_step": 112636, "epoch": 930} {"train_loss": -37.33997344970703, "global_step": 112637, "epoch": 930} {"train_loss": -36.29948425292969, "global_step": 112638, "epoch": 930} {"train_loss": -37.34733200073242, "global_step": 112639, "epoch": 930} {"train_loss": -38.64375686645508, "global_step": 112640, "epoch": 930} {"train_loss": -37.42625045776367, "global_step": 112641, "epoch": 930} {"train_loss": -35.845558166503906, "global_step": 112642, "epoch": 930} {"train_loss": -38.58927536010742, "global_step": 112643, "epoch": 930} {"train_loss": -36.558448791503906, "global_step": 112644, "epoch": 930} {"train_loss": -38.216854095458984, "global_step": 112645, "epoch": 930} {"train_loss": -38.043609619140625, "global_step": 112646, "epoch": 930} {"train_loss": -36.935550689697266, "global_step": 112647, "epoch": 930} {"train_loss": -38.11487579345703, "global_step": 112648, "epoch": 930} {"train_loss": -36.470211029052734, "global_step": 112649, "epoch": 930} {"train_loss": -37.40961724273429, "global_step": 112650, "epoch": 930, "val_loss": 2662086.5} {"train_loss": -37.16321563720703, "global_step": 112651, "epoch": 931} {"train_loss": -39.057044982910156, "global_step": 112652, "epoch": 931} {"train_loss": -37.57963943481445, "global_step": 112653, "epoch": 931} {"train_loss": -38.5450325012207, "global_step": 112654, "epoch": 931} {"train_loss": -37.34001922607422, "global_step": 112655, "epoch": 931} {"train_loss": -37.91543197631836, "global_step": 112656, "epoch": 931} {"train_loss": -36.6529426574707, "global_step": 112657, "epoch": 931} {"train_loss": -38.61895751953125, "global_step": 112658, "epoch": 931} {"train_loss": -37.35494613647461, "global_step": 112659, "epoch": 931} {"train_loss": -38.6201171875, "global_step": 112660, "epoch": 931} {"train_loss": -37.95267868041992, "global_step": 112661, "epoch": 931} {"train_loss": -38.57950973510742, "global_step": 112662, "epoch": 931} {"train_loss": -38.36360549926758, "global_step": 112663, "epoch": 931} {"train_loss": -37.077880859375, "global_step": 112664, "epoch": 931} {"train_loss": -38.64148712158203, "global_step": 112665, "epoch": 931} {"train_loss": -37.744503021240234, "global_step": 112666, "epoch": 931} {"train_loss": -38.54339599609375, "global_step": 112667, "epoch": 931} {"train_loss": -38.3833122253418, "global_step": 112668, "epoch": 931} {"train_loss": -38.9398078918457, "global_step": 112669, "epoch": 931} {"train_loss": -38.9972038269043, "global_step": 112670, "epoch": 931} {"train_loss": -38.15720748901367, "global_step": 112671, "epoch": 931} {"train_loss": -38.60159683227539, "global_step": 112672, "epoch": 931} {"train_loss": -36.36088180541992, "global_step": 112673, "epoch": 931} {"train_loss": -38.84328842163086, "global_step": 112674, "epoch": 931} {"train_loss": -37.87388229370117, "global_step": 112675, "epoch": 931} {"train_loss": -38.822998046875, "global_step": 112676, "epoch": 931} {"train_loss": -38.75152587890625, "global_step": 112677, "epoch": 931} {"train_loss": -38.393798828125, "global_step": 112678, "epoch": 931} {"train_loss": -37.75919723510742, "global_step": 112679, "epoch": 931} {"train_loss": -37.70193862915039, "global_step": 112680, "epoch": 931} {"train_loss": -37.66839599609375, "global_step": 112681, "epoch": 931} {"train_loss": -38.98128890991211, "global_step": 112682, "epoch": 931} {"train_loss": -38.886322021484375, "global_step": 112683, "epoch": 931} {"train_loss": -38.00425338745117, "global_step": 112684, "epoch": 931} {"train_loss": -37.51188278198242, "global_step": 112685, "epoch": 931} {"train_loss": -38.729408264160156, "global_step": 112686, "epoch": 931} {"train_loss": -38.64522933959961, "global_step": 112687, "epoch": 931} {"train_loss": -38.01258087158203, "global_step": 112688, "epoch": 931} {"train_loss": -36.83795928955078, "global_step": 112689, "epoch": 931} {"train_loss": -36.51570129394531, "global_step": 112690, "epoch": 931} {"train_loss": -37.326629638671875, "global_step": 112691, "epoch": 931} {"train_loss": -36.924781799316406, "global_step": 112692, "epoch": 931} {"train_loss": -38.32017517089844, "global_step": 112693, "epoch": 931} {"train_loss": -37.14348602294922, "global_step": 112694, "epoch": 931} {"train_loss": -36.58413314819336, "global_step": 112695, "epoch": 931} {"train_loss": -38.43545913696289, "global_step": 112696, "epoch": 931} {"train_loss": -37.39530944824219, "global_step": 112697, "epoch": 931} {"train_loss": -37.589134216308594, "global_step": 112698, "epoch": 931} {"train_loss": -37.91990280151367, "global_step": 112699, "epoch": 931} {"train_loss": -37.880226135253906, "global_step": 112700, "epoch": 931} {"train_loss": -37.75178909301758, "global_step": 112701, "epoch": 931} {"train_loss": -38.68365478515625, "global_step": 112702, "epoch": 931} {"train_loss": -37.78089141845703, "global_step": 112703, "epoch": 931} {"train_loss": -38.744319915771484, "global_step": 112704, "epoch": 931} {"train_loss": -38.627777099609375, "global_step": 112705, "epoch": 931} {"train_loss": -38.15888214111328, "global_step": 112706, "epoch": 931} {"train_loss": -38.33002853393555, "global_step": 112707, "epoch": 931} {"train_loss": -38.121437072753906, "global_step": 112708, "epoch": 931} {"train_loss": -38.47739791870117, "global_step": 112709, "epoch": 931} {"train_loss": -36.037017822265625, "global_step": 112710, "epoch": 931} {"train_loss": -38.4204216003418, "global_step": 112711, "epoch": 931} {"train_loss": -38.750179290771484, "global_step": 112712, "epoch": 931} {"train_loss": -37.635807037353516, "global_step": 112713, "epoch": 931} {"train_loss": -38.92363739013672, "global_step": 112714, "epoch": 931} {"train_loss": -38.24406051635742, "global_step": 112715, "epoch": 931} {"train_loss": -39.120479583740234, "global_step": 112716, "epoch": 931} {"train_loss": -38.89052200317383, "global_step": 112717, "epoch": 931} {"train_loss": -38.73902130126953, "global_step": 112718, "epoch": 931} {"train_loss": -38.50885009765625, "global_step": 112719, "epoch": 931} {"train_loss": -38.32459259033203, "global_step": 112720, "epoch": 931} {"train_loss": -37.059322357177734, "global_step": 112721, "epoch": 931} {"train_loss": -37.802669525146484, "global_step": 112722, "epoch": 931} {"train_loss": -38.36131286621094, "global_step": 112723, "epoch": 931} {"train_loss": -38.64265823364258, "global_step": 112724, "epoch": 931} {"train_loss": -38.964656829833984, "global_step": 112725, "epoch": 931} {"train_loss": -39.02975082397461, "global_step": 112726, "epoch": 931} {"train_loss": -37.70591354370117, "global_step": 112727, "epoch": 931} {"train_loss": -37.721866607666016, "global_step": 112728, "epoch": 931} {"train_loss": -38.09095001220703, "global_step": 112729, "epoch": 931} {"train_loss": -38.78291702270508, "global_step": 112730, "epoch": 931} {"train_loss": -35.95418930053711, "global_step": 112731, "epoch": 931} {"train_loss": -38.63706588745117, "global_step": 112732, "epoch": 931} {"train_loss": -38.22624969482422, "global_step": 112733, "epoch": 931} {"train_loss": -38.83830642700195, "global_step": 112734, "epoch": 931} {"train_loss": -37.179664611816406, "global_step": 112735, "epoch": 931} {"train_loss": -37.98983383178711, "global_step": 112736, "epoch": 931} {"train_loss": -37.58042907714844, "global_step": 112737, "epoch": 931} {"train_loss": -37.22707748413086, "global_step": 112738, "epoch": 931} {"train_loss": -38.124446868896484, "global_step": 112739, "epoch": 931} {"train_loss": -38.735870361328125, "global_step": 112740, "epoch": 931} {"train_loss": -37.82223129272461, "global_step": 112741, "epoch": 931} {"train_loss": -38.40084457397461, "global_step": 112742, "epoch": 931} {"train_loss": -37.76615905761719, "global_step": 112743, "epoch": 931} {"train_loss": -38.6274528503418, "global_step": 112744, "epoch": 931} {"train_loss": -38.69269943237305, "global_step": 112745, "epoch": 931} {"train_loss": -37.82084274291992, "global_step": 112746, "epoch": 931} {"train_loss": -38.48830032348633, "global_step": 112747, "epoch": 931} {"train_loss": -38.02524948120117, "global_step": 112748, "epoch": 931} {"train_loss": -37.46089172363281, "global_step": 112749, "epoch": 931} {"train_loss": -37.06521224975586, "global_step": 112750, "epoch": 931} {"train_loss": -36.96503448486328, "global_step": 112751, "epoch": 931} {"train_loss": -37.618446350097656, "global_step": 112752, "epoch": 931} {"train_loss": -36.04368209838867, "global_step": 112753, "epoch": 931} {"train_loss": -37.50598907470703, "global_step": 112754, "epoch": 931} {"train_loss": -37.28603744506836, "global_step": 112755, "epoch": 931} {"train_loss": -38.06364822387695, "global_step": 112756, "epoch": 931} {"train_loss": -37.74068832397461, "global_step": 112757, "epoch": 931} {"train_loss": -35.64990234375, "global_step": 112758, "epoch": 931} {"train_loss": -37.87897872924805, "global_step": 112759, "epoch": 931} {"train_loss": -35.93618392944336, "global_step": 112760, "epoch": 931} {"train_loss": -37.08611297607422, "global_step": 112761, "epoch": 931} {"train_loss": -38.144046783447266, "global_step": 112762, "epoch": 931} {"train_loss": -37.10251998901367, "global_step": 112763, "epoch": 931} {"train_loss": -38.33256912231445, "global_step": 112764, "epoch": 931} {"train_loss": -38.11851119995117, "global_step": 112765, "epoch": 931} {"train_loss": -38.40330123901367, "global_step": 112766, "epoch": 931} {"train_loss": -37.739681243896484, "global_step": 112767, "epoch": 931} {"train_loss": -38.20863342285156, "global_step": 112768, "epoch": 931} {"train_loss": -38.031227111816406, "global_step": 112769, "epoch": 931} {"train_loss": -38.564178466796875, "global_step": 112770, "epoch": 931} {"train_loss": -37.972314913410784, "global_step": 112771, "epoch": 931, "val_loss": 2640703.75} {"train_loss": -37.163883209228516, "global_step": 112772, "epoch": 932} {"train_loss": -38.575618743896484, "global_step": 112773, "epoch": 932} {"train_loss": -37.793636322021484, "global_step": 112774, "epoch": 932} {"train_loss": -38.49643325805664, "global_step": 112775, "epoch": 932} {"train_loss": -38.630619049072266, "global_step": 112776, "epoch": 932} {"train_loss": -38.49031066894531, "global_step": 112777, "epoch": 932} {"train_loss": -39.15452194213867, "global_step": 112778, "epoch": 932} {"train_loss": -38.110145568847656, "global_step": 112779, "epoch": 932} {"train_loss": -38.58005905151367, "global_step": 112780, "epoch": 932} {"train_loss": -38.89760971069336, "global_step": 112781, "epoch": 932} {"train_loss": -38.70429992675781, "global_step": 112782, "epoch": 932} {"train_loss": -38.90253829956055, "global_step": 112783, "epoch": 932} {"train_loss": -38.89387130737305, "global_step": 112784, "epoch": 932} {"train_loss": -38.99199295043945, "global_step": 112785, "epoch": 932} {"train_loss": -38.97549057006836, "global_step": 112786, "epoch": 932} {"train_loss": -38.9080924987793, "global_step": 112787, "epoch": 932} {"train_loss": -39.02097702026367, "global_step": 112788, "epoch": 932} {"train_loss": -36.3733024597168, "global_step": 112789, "epoch": 932} {"train_loss": -36.35487747192383, "global_step": 112790, "epoch": 932} {"train_loss": -38.373531341552734, "global_step": 112791, "epoch": 932} {"train_loss": -39.37624740600586, "global_step": 112792, "epoch": 932} {"train_loss": -39.161766052246094, "global_step": 112793, "epoch": 932} {"train_loss": -38.767906188964844, "global_step": 112794, "epoch": 932} {"train_loss": -38.076568603515625, "global_step": 112795, "epoch": 932} {"train_loss": -38.68782043457031, "global_step": 112796, "epoch": 932} {"train_loss": -39.29606246948242, "global_step": 112797, "epoch": 932} {"train_loss": -38.474727630615234, "global_step": 112798, "epoch": 932} {"train_loss": -38.332820892333984, "global_step": 112799, "epoch": 932} {"train_loss": -38.76150131225586, "global_step": 112800, "epoch": 932} {"train_loss": -37.52492904663086, "global_step": 112801, "epoch": 932} {"train_loss": -39.0169563293457, "global_step": 112802, "epoch": 932} {"train_loss": -38.90552520751953, "global_step": 112803, "epoch": 932} {"train_loss": -38.72127151489258, "global_step": 112804, "epoch": 932} {"train_loss": -38.6341552734375, "global_step": 112805, "epoch": 932} {"train_loss": -39.39771270751953, "global_step": 112806, "epoch": 932} {"train_loss": -38.67053985595703, "global_step": 112807, "epoch": 932} {"train_loss": -39.05069351196289, "global_step": 112808, "epoch": 932} {"train_loss": -39.38584899902344, "global_step": 112809, "epoch": 932} {"train_loss": -38.95943832397461, "global_step": 112810, "epoch": 932} {"train_loss": -38.97065353393555, "global_step": 112811, "epoch": 932} {"train_loss": -38.815521240234375, "global_step": 112812, "epoch": 932} {"train_loss": -38.93620681762695, "global_step": 112813, "epoch": 932} {"train_loss": -39.390377044677734, "global_step": 112814, "epoch": 932} {"train_loss": -39.48466873168945, "global_step": 112815, "epoch": 932} {"train_loss": -38.982051849365234, "global_step": 112816, "epoch": 932} {"train_loss": -39.08290481567383, "global_step": 112817, "epoch": 932} {"train_loss": -39.669837951660156, "global_step": 112818, "epoch": 932} {"train_loss": -38.922576904296875, "global_step": 112819, "epoch": 932} {"train_loss": -39.83551025390625, "global_step": 112820, "epoch": 932} {"train_loss": -38.88288497924805, "global_step": 112821, "epoch": 932} {"train_loss": -39.331905364990234, "global_step": 112822, "epoch": 932} {"train_loss": -40.02865219116211, "global_step": 112823, "epoch": 932} {"train_loss": -39.42118453979492, "global_step": 112824, "epoch": 932} {"train_loss": -39.54915237426758, "global_step": 112825, "epoch": 932} {"train_loss": -38.87693405151367, "global_step": 112826, "epoch": 932} {"train_loss": -39.76465606689453, "global_step": 112827, "epoch": 932} {"train_loss": -39.95547103881836, "global_step": 112828, "epoch": 932} {"train_loss": -38.400962829589844, "global_step": 112829, "epoch": 932} {"train_loss": -39.86726379394531, "global_step": 112830, "epoch": 932} {"train_loss": -39.613677978515625, "global_step": 112831, "epoch": 932} {"train_loss": -39.85308074951172, "global_step": 112832, "epoch": 932} {"train_loss": -38.522335052490234, "global_step": 112833, "epoch": 932} {"train_loss": -39.454383850097656, "global_step": 112834, "epoch": 932} {"train_loss": -39.16135787963867, "global_step": 112835, "epoch": 932} {"train_loss": -38.95740509033203, "global_step": 112836, "epoch": 932} {"train_loss": -38.61754608154297, "global_step": 112837, "epoch": 932} {"train_loss": -37.9589729309082, "global_step": 112838, "epoch": 932} {"train_loss": -35.92481994628906, "global_step": 112839, "epoch": 932} {"train_loss": -33.48030471801758, "global_step": 112840, "epoch": 932} {"train_loss": -34.40116882324219, "global_step": 112841, "epoch": 932} {"train_loss": -37.86754608154297, "global_step": 112842, "epoch": 932} {"train_loss": -38.3731575012207, "global_step": 112843, "epoch": 932} {"train_loss": -37.658050537109375, "global_step": 112844, "epoch": 932} {"train_loss": -36.91209030151367, "global_step": 112845, "epoch": 932} {"train_loss": -36.082550048828125, "global_step": 112846, "epoch": 932} {"train_loss": -37.08651351928711, "global_step": 112847, "epoch": 932} {"train_loss": -37.57158279418945, "global_step": 112848, "epoch": 932} {"train_loss": -37.78282165527344, "global_step": 112849, "epoch": 932} {"train_loss": -35.07063293457031, "global_step": 112850, "epoch": 932} {"train_loss": -37.161983489990234, "global_step": 112851, "epoch": 932} {"train_loss": -38.95998001098633, "global_step": 112852, "epoch": 932} {"train_loss": -36.45240020751953, "global_step": 112853, "epoch": 932} {"train_loss": -38.22468948364258, "global_step": 112854, "epoch": 932} {"train_loss": -37.74011993408203, "global_step": 112855, "epoch": 932} {"train_loss": -36.33543014526367, "global_step": 112856, "epoch": 932} {"train_loss": -38.083797454833984, "global_step": 112857, "epoch": 932} {"train_loss": -36.68156051635742, "global_step": 112858, "epoch": 932} {"train_loss": -37.291908264160156, "global_step": 112859, "epoch": 932} {"train_loss": -37.14380645751953, "global_step": 112860, "epoch": 932} {"train_loss": -38.028961181640625, "global_step": 112861, "epoch": 932} {"train_loss": -38.36613082885742, "global_step": 112862, "epoch": 932} {"train_loss": -37.99006271362305, "global_step": 112863, "epoch": 932} {"train_loss": -37.333595275878906, "global_step": 112864, "epoch": 932} {"train_loss": -38.750770568847656, "global_step": 112865, "epoch": 932} {"train_loss": -37.6461296081543, "global_step": 112866, "epoch": 932} {"train_loss": -38.08449172973633, "global_step": 112867, "epoch": 932} {"train_loss": -37.721893310546875, "global_step": 112868, "epoch": 932} {"train_loss": -38.95630645751953, "global_step": 112869, "epoch": 932} {"train_loss": -37.9304313659668, "global_step": 112870, "epoch": 932} {"train_loss": -39.26359176635742, "global_step": 112871, "epoch": 932} {"train_loss": -38.5793571472168, "global_step": 112872, "epoch": 932} {"train_loss": -39.111751556396484, "global_step": 112873, "epoch": 932} {"train_loss": -38.892147064208984, "global_step": 112874, "epoch": 932} {"train_loss": -38.64150619506836, "global_step": 112875, "epoch": 932} {"train_loss": -39.23693084716797, "global_step": 112876, "epoch": 932} {"train_loss": -38.747432708740234, "global_step": 112877, "epoch": 932} {"train_loss": -39.12070846557617, "global_step": 112878, "epoch": 932} {"train_loss": -38.890926361083984, "global_step": 112879, "epoch": 932} {"train_loss": -39.20454406738281, "global_step": 112880, "epoch": 932} {"train_loss": -39.08319091796875, "global_step": 112881, "epoch": 932} {"train_loss": -38.70332717895508, "global_step": 112882, "epoch": 932} {"train_loss": -38.952392578125, "global_step": 112883, "epoch": 932} {"train_loss": -38.63640213012695, "global_step": 112884, "epoch": 932} {"train_loss": -38.90887451171875, "global_step": 112885, "epoch": 932} {"train_loss": -38.38727569580078, "global_step": 112886, "epoch": 932} {"train_loss": -39.37566375732422, "global_step": 112887, "epoch": 932} {"train_loss": -38.25142288208008, "global_step": 112888, "epoch": 932} {"train_loss": -37.402122497558594, "global_step": 112889, "epoch": 932} {"train_loss": -38.712947845458984, "global_step": 112890, "epoch": 932} {"train_loss": -36.26446533203125, "global_step": 112891, "epoch": 932} {"train_loss": -38.40569838216482, "global_step": 112892, "epoch": 932, "val_loss": 2600663.0} {"train_loss": -38.22469711303711, "global_step": 112893, "epoch": 933} {"train_loss": -38.82052230834961, "global_step": 112894, "epoch": 933} {"train_loss": -38.43850326538086, "global_step": 112895, "epoch": 933} {"train_loss": -38.81171798706055, "global_step": 112896, "epoch": 933} {"train_loss": -38.78972244262695, "global_step": 112897, "epoch": 933} {"train_loss": -39.0867805480957, "global_step": 112898, "epoch": 933} {"train_loss": -38.268123626708984, "global_step": 112899, "epoch": 933} {"train_loss": -38.96415328979492, "global_step": 112900, "epoch": 933} {"train_loss": -39.029052734375, "global_step": 112901, "epoch": 933} {"train_loss": -39.38078689575195, "global_step": 112902, "epoch": 933} {"train_loss": -38.18140411376953, "global_step": 112903, "epoch": 933} {"train_loss": -38.54421615600586, "global_step": 112904, "epoch": 933} {"train_loss": -38.71588897705078, "global_step": 112905, "epoch": 933} {"train_loss": -38.5831413269043, "global_step": 112906, "epoch": 933} {"train_loss": -39.25974655151367, "global_step": 112907, "epoch": 933} {"train_loss": -39.29309844970703, "global_step": 112908, "epoch": 933} {"train_loss": -39.23189926147461, "global_step": 112909, "epoch": 933} {"train_loss": -38.56377029418945, "global_step": 112910, "epoch": 933} {"train_loss": -39.36351013183594, "global_step": 112911, "epoch": 933} {"train_loss": -39.30016326904297, "global_step": 112912, "epoch": 933} {"train_loss": -39.35603713989258, "global_step": 112913, "epoch": 933} {"train_loss": -38.86568832397461, "global_step": 112914, "epoch": 933} {"train_loss": -38.45325469970703, "global_step": 112915, "epoch": 933} {"train_loss": -38.67448806762695, "global_step": 112916, "epoch": 933} {"train_loss": -37.872283935546875, "global_step": 112917, "epoch": 933} {"train_loss": -39.22694778442383, "global_step": 112918, "epoch": 933} {"train_loss": -38.838584899902344, "global_step": 112919, "epoch": 933} {"train_loss": -38.382232666015625, "global_step": 112920, "epoch": 933} {"train_loss": -38.601837158203125, "global_step": 112921, "epoch": 933} {"train_loss": -38.33049774169922, "global_step": 112922, "epoch": 933} {"train_loss": -39.12131881713867, "global_step": 112923, "epoch": 933} {"train_loss": -39.42169189453125, "global_step": 112924, "epoch": 933} {"train_loss": -37.7809944152832, "global_step": 112925, "epoch": 933} {"train_loss": -37.06673049926758, "global_step": 112926, "epoch": 933} {"train_loss": -37.821937561035156, "global_step": 112927, "epoch": 933} {"train_loss": -38.774749755859375, "global_step": 112928, "epoch": 933} {"train_loss": -38.977325439453125, "global_step": 112929, "epoch": 933} {"train_loss": -34.320472717285156, "global_step": 112930, "epoch": 933} {"train_loss": -38.76250457763672, "global_step": 112931, "epoch": 933} {"train_loss": -37.286651611328125, "global_step": 112932, "epoch": 933} {"train_loss": -38.6015625, "global_step": 112933, "epoch": 933} {"train_loss": -37.39375686645508, "global_step": 112934, "epoch": 933} {"train_loss": -38.131587982177734, "global_step": 112935, "epoch": 933} {"train_loss": -37.51293182373047, "global_step": 112936, "epoch": 933} {"train_loss": -39.24763870239258, "global_step": 112937, "epoch": 933} {"train_loss": -38.28571701049805, "global_step": 112938, "epoch": 933} {"train_loss": -37.964263916015625, "global_step": 112939, "epoch": 933} {"train_loss": -38.057701110839844, "global_step": 112940, "epoch": 933} {"train_loss": -39.032318115234375, "global_step": 112941, "epoch": 933} {"train_loss": -35.59646224975586, "global_step": 112942, "epoch": 933} {"train_loss": -38.18003463745117, "global_step": 112943, "epoch": 933} {"train_loss": -38.08985137939453, "global_step": 112944, "epoch": 933} {"train_loss": -37.91398239135742, "global_step": 112945, "epoch": 933} {"train_loss": -37.53623580932617, "global_step": 112946, "epoch": 933} {"train_loss": -33.23533630371094, "global_step": 112947, "epoch": 933} {"train_loss": -37.545406341552734, "global_step": 112948, "epoch": 933} {"train_loss": -36.75391387939453, "global_step": 112949, "epoch": 933} {"train_loss": -37.80570602416992, "global_step": 112950, "epoch": 933} {"train_loss": -37.90179443359375, "global_step": 112951, "epoch": 933} {"train_loss": -37.69588851928711, "global_step": 112952, "epoch": 933} {"train_loss": -37.23537826538086, "global_step": 112953, "epoch": 933} {"train_loss": -36.392364501953125, "global_step": 112954, "epoch": 933} {"train_loss": -37.7558479309082, "global_step": 112955, "epoch": 933} {"train_loss": -36.49592971801758, "global_step": 112956, "epoch": 933} {"train_loss": -32.890010833740234, "global_step": 112957, "epoch": 933} {"train_loss": -38.03707504272461, "global_step": 112958, "epoch": 933} {"train_loss": -37.53073501586914, "global_step": 112959, "epoch": 933} {"train_loss": -37.42073440551758, "global_step": 112960, "epoch": 933} {"train_loss": -38.02942657470703, "global_step": 112961, "epoch": 933} {"train_loss": -36.97334671020508, "global_step": 112962, "epoch": 933} {"train_loss": -37.222286224365234, "global_step": 112963, "epoch": 933} {"train_loss": -37.374935150146484, "global_step": 112964, "epoch": 933} {"train_loss": -37.75830841064453, "global_step": 112965, "epoch": 933} {"train_loss": -29.739675521850586, "global_step": 112966, "epoch": 933} {"train_loss": -37.42376708984375, "global_step": 112967, "epoch": 933} {"train_loss": -37.95326232910156, "global_step": 112968, "epoch": 933} {"train_loss": -36.823333740234375, "global_step": 112969, "epoch": 933} {"train_loss": -38.4991340637207, "global_step": 112970, "epoch": 933} {"train_loss": -37.434837341308594, "global_step": 112971, "epoch": 933} {"train_loss": -35.72711181640625, "global_step": 112972, "epoch": 933} {"train_loss": -34.58517074584961, "global_step": 112973, "epoch": 933} {"train_loss": -2.5394341945648193, "global_step": 112974, "epoch": 933} {"train_loss": -31.038450241088867, "global_step": 112975, "epoch": 933} {"train_loss": -35.316158294677734, "global_step": 112976, "epoch": 933} {"train_loss": -13.10948657989502, "global_step": 112977, "epoch": 933} {"train_loss": -19.18710708618164, "global_step": 112978, "epoch": 933} {"train_loss": -28.493228912353516, "global_step": 112979, "epoch": 933} {"train_loss": -22.87921714782715, "global_step": 112980, "epoch": 933} {"train_loss": -27.653076171875, "global_step": 112981, "epoch": 933} {"train_loss": -20.418283462524414, "global_step": 112982, "epoch": 933} {"train_loss": -24.282703399658203, "global_step": 112983, "epoch": 933} {"train_loss": -27.58026695251465, "global_step": 112984, "epoch": 933} {"train_loss": -29.966938018798828, "global_step": 112985, "epoch": 933} {"train_loss": -31.42323112487793, "global_step": 112986, "epoch": 933} {"train_loss": -34.089805603027344, "global_step": 112987, "epoch": 933} {"train_loss": -29.06182289123535, "global_step": 112988, "epoch": 933} {"train_loss": -28.604248046875, "global_step": 112989, "epoch": 933} {"train_loss": -27.500431060791016, "global_step": 112990, "epoch": 933} {"train_loss": -31.031354904174805, "global_step": 112991, "epoch": 933} {"train_loss": -31.459095001220703, "global_step": 112992, "epoch": 933} {"train_loss": -32.564613342285156, "global_step": 112993, "epoch": 933} {"train_loss": -32.25905227661133, "global_step": 112994, "epoch": 933} {"train_loss": -32.01508331298828, "global_step": 112995, "epoch": 933} {"train_loss": -32.382991790771484, "global_step": 112996, "epoch": 933} {"train_loss": -33.57170867919922, "global_step": 112997, "epoch": 933} {"train_loss": -33.9350471496582, "global_step": 112998, "epoch": 933} {"train_loss": -34.150909423828125, "global_step": 112999, "epoch": 933} {"train_loss": -33.43750762939453, "global_step": 113000, "epoch": 933} {"train_loss": -33.45452880859375, "global_step": 113001, "epoch": 933} {"train_loss": -34.709529876708984, "global_step": 113002, "epoch": 933} {"train_loss": -33.94257354736328, "global_step": 113003, "epoch": 933} {"train_loss": -34.07337951660156, "global_step": 113004, "epoch": 933} {"train_loss": -35.136390686035156, "global_step": 113005, "epoch": 933} {"train_loss": -34.52836990356445, "global_step": 113006, "epoch": 933} {"train_loss": -34.23384094238281, "global_step": 113007, "epoch": 933} {"train_loss": -34.2635612487793, "global_step": 113008, "epoch": 933} {"train_loss": -34.255287170410156, "global_step": 113009, "epoch": 933} {"train_loss": -33.672767639160156, "global_step": 113010, "epoch": 933} {"train_loss": -33.87606430053711, "global_step": 113011, "epoch": 933} {"train_loss": -34.617919921875, "global_step": 113012, "epoch": 933} {"train_loss": -35.288922701985385, "global_step": 113013, "epoch": 933, "val_loss": 2732645.25} {"train_loss": -35.36376953125, "global_step": 113014, "epoch": 934} {"train_loss": -35.106319427490234, "global_step": 113015, "epoch": 934} {"train_loss": -35.338130950927734, "global_step": 113016, "epoch": 934} {"train_loss": -34.13199996948242, "global_step": 113017, "epoch": 934} {"train_loss": -34.91691970825195, "global_step": 113018, "epoch": 934} {"train_loss": -34.806129455566406, "global_step": 113019, "epoch": 934} {"train_loss": -34.8767204284668, "global_step": 113020, "epoch": 934} {"train_loss": -35.36558532714844, "global_step": 113021, "epoch": 934} {"train_loss": -34.80144119262695, "global_step": 113022, "epoch": 934} {"train_loss": -35.56781768798828, "global_step": 113023, "epoch": 934} {"train_loss": -34.7718620300293, "global_step": 113024, "epoch": 934} {"train_loss": -35.251121520996094, "global_step": 113025, "epoch": 934} {"train_loss": -35.67502975463867, "global_step": 113026, "epoch": 934} {"train_loss": -34.4717903137207, "global_step": 113027, "epoch": 934} {"train_loss": -35.79030990600586, "global_step": 113028, "epoch": 934} {"train_loss": -35.48165512084961, "global_step": 113029, "epoch": 934} {"train_loss": -35.872215270996094, "global_step": 113030, "epoch": 934} {"train_loss": -35.5467414855957, "global_step": 113031, "epoch": 934} {"train_loss": -35.48639678955078, "global_step": 113032, "epoch": 934} {"train_loss": -35.634857177734375, "global_step": 113033, "epoch": 934} {"train_loss": -35.69355010986328, "global_step": 113034, "epoch": 934} {"train_loss": -35.40702438354492, "global_step": 113035, "epoch": 934} {"train_loss": -36.016944885253906, "global_step": 113036, "epoch": 934} {"train_loss": -35.461029052734375, "global_step": 113037, "epoch": 934} {"train_loss": -36.02777099609375, "global_step": 113038, "epoch": 934} {"train_loss": -35.7978630065918, "global_step": 113039, "epoch": 934} {"train_loss": -35.84804153442383, "global_step": 113040, "epoch": 934} {"train_loss": -36.58229064941406, "global_step": 113041, "epoch": 934} {"train_loss": -36.108028411865234, "global_step": 113042, "epoch": 934} {"train_loss": -35.33545684814453, "global_step": 113043, "epoch": 934} {"train_loss": -36.33620071411133, "global_step": 113044, "epoch": 934} {"train_loss": -36.289791107177734, "global_step": 113045, "epoch": 934} {"train_loss": -36.93227005004883, "global_step": 113046, "epoch": 934} {"train_loss": -37.02985382080078, "global_step": 113047, "epoch": 934} {"train_loss": -36.88065719604492, "global_step": 113048, "epoch": 934} {"train_loss": -35.92486572265625, "global_step": 113049, "epoch": 934} {"train_loss": -35.77570724487305, "global_step": 113050, "epoch": 934} {"train_loss": -36.37323760986328, "global_step": 113051, "epoch": 934} {"train_loss": -36.499629974365234, "global_step": 113052, "epoch": 934} {"train_loss": -36.97199630737305, "global_step": 113053, "epoch": 934} {"train_loss": -36.441383361816406, "global_step": 113054, "epoch": 934} {"train_loss": -36.80965805053711, "global_step": 113055, "epoch": 934} {"train_loss": -36.910789489746094, "global_step": 113056, "epoch": 934} {"train_loss": -35.93467330932617, "global_step": 113057, "epoch": 934} {"train_loss": -36.578330993652344, "global_step": 113058, "epoch": 934} {"train_loss": -36.95550537109375, "global_step": 113059, "epoch": 934} {"train_loss": -37.13850021362305, "global_step": 113060, "epoch": 934} {"train_loss": -37.115638732910156, "global_step": 113061, "epoch": 934} {"train_loss": -36.70321273803711, "global_step": 113062, "epoch": 934} {"train_loss": -37.289276123046875, "global_step": 113063, "epoch": 934} {"train_loss": -37.262420654296875, "global_step": 113064, "epoch": 934} {"train_loss": -37.078609466552734, "global_step": 113065, "epoch": 934} {"train_loss": -37.80678939819336, "global_step": 113066, "epoch": 934} {"train_loss": -36.98442459106445, "global_step": 113067, "epoch": 934} {"train_loss": -36.071746826171875, "global_step": 113068, "epoch": 934} {"train_loss": -38.064964294433594, "global_step": 113069, "epoch": 934} {"train_loss": -38.10615921020508, "global_step": 113070, "epoch": 934} {"train_loss": -37.613460540771484, "global_step": 113071, "epoch": 934} {"train_loss": -37.67673110961914, "global_step": 113072, "epoch": 934} {"train_loss": -37.291786193847656, "global_step": 113073, "epoch": 934} {"train_loss": -37.13193130493164, "global_step": 113074, "epoch": 934} {"train_loss": -36.77311325073242, "global_step": 113075, "epoch": 934} {"train_loss": -37.683006286621094, "global_step": 113076, "epoch": 934} {"train_loss": -37.8640022277832, "global_step": 113077, "epoch": 934} {"train_loss": -37.77733612060547, "global_step": 113078, "epoch": 934} {"train_loss": -38.172035217285156, "global_step": 113079, "epoch": 934} {"train_loss": -37.1210823059082, "global_step": 113080, "epoch": 934} {"train_loss": -37.19017028808594, "global_step": 113081, "epoch": 934} {"train_loss": -38.26911544799805, "global_step": 113082, "epoch": 934} {"train_loss": -37.085575103759766, "global_step": 113083, "epoch": 934} {"train_loss": -37.09406661987305, "global_step": 113084, "epoch": 934} {"train_loss": -37.444156646728516, "global_step": 113085, "epoch": 934} {"train_loss": -37.81647872924805, "global_step": 113086, "epoch": 934} {"train_loss": -37.32395553588867, "global_step": 113087, "epoch": 934} {"train_loss": -37.37855911254883, "global_step": 113088, "epoch": 934} {"train_loss": -38.172935485839844, "global_step": 113089, "epoch": 934} {"train_loss": -37.42565155029297, "global_step": 113090, "epoch": 934} {"train_loss": -37.38710403442383, "global_step": 113091, "epoch": 934} {"train_loss": -38.17688751220703, "global_step": 113092, "epoch": 934} {"train_loss": -37.729042053222656, "global_step": 113093, "epoch": 934} {"train_loss": -37.71083450317383, "global_step": 113094, "epoch": 934} {"train_loss": -38.264652252197266, "global_step": 113095, "epoch": 934} {"train_loss": -38.3001823425293, "global_step": 113096, "epoch": 934} {"train_loss": -38.4318733215332, "global_step": 113097, "epoch": 934} {"train_loss": -38.00291442871094, "global_step": 113098, "epoch": 934} {"train_loss": -38.27322769165039, "global_step": 113099, "epoch": 934} {"train_loss": -38.49631881713867, "global_step": 113100, "epoch": 934} {"train_loss": -38.38397216796875, "global_step": 113101, "epoch": 934} {"train_loss": -38.37007141113281, "global_step": 113102, "epoch": 934} {"train_loss": -38.55973815917969, "global_step": 113103, "epoch": 934} {"train_loss": -38.17763137817383, "global_step": 113104, "epoch": 934} {"train_loss": -38.130611419677734, "global_step": 113105, "epoch": 934} {"train_loss": -37.87433624267578, "global_step": 113106, "epoch": 934} {"train_loss": -37.97047805786133, "global_step": 113107, "epoch": 934} {"train_loss": -37.46894454956055, "global_step": 113108, "epoch": 934} {"train_loss": -38.29853439331055, "global_step": 113109, "epoch": 934} {"train_loss": -38.024635314941406, "global_step": 113110, "epoch": 934} {"train_loss": -37.9241943359375, "global_step": 113111, "epoch": 934} {"train_loss": -38.160316467285156, "global_step": 113112, "epoch": 934} {"train_loss": -37.421573638916016, "global_step": 113113, "epoch": 934} {"train_loss": -38.902313232421875, "global_step": 113114, "epoch": 934} {"train_loss": -39.08678436279297, "global_step": 113115, "epoch": 934} {"train_loss": -38.0197639465332, "global_step": 113116, "epoch": 934} {"train_loss": -35.8535041809082, "global_step": 113117, "epoch": 934} {"train_loss": -35.04730987548828, "global_step": 113118, "epoch": 934} {"train_loss": -34.03384017944336, "global_step": 113119, "epoch": 934} {"train_loss": -34.48944854736328, "global_step": 113120, "epoch": 934} {"train_loss": -37.53762435913086, "global_step": 113121, "epoch": 934} {"train_loss": -35.237342834472656, "global_step": 113122, "epoch": 934} {"train_loss": -37.15787887573242, "global_step": 113123, "epoch": 934} {"train_loss": -36.724830627441406, "global_step": 113124, "epoch": 934} {"train_loss": -37.28554916381836, "global_step": 113125, "epoch": 934} {"train_loss": -37.7994270324707, "global_step": 113126, "epoch": 934} {"train_loss": -36.18289566040039, "global_step": 113127, "epoch": 934} {"train_loss": -38.68852233886719, "global_step": 113128, "epoch": 934} {"train_loss": -36.80192184448242, "global_step": 113129, "epoch": 934} {"train_loss": -37.65409469604492, "global_step": 113130, "epoch": 934} {"train_loss": -36.748939514160156, "global_step": 113131, "epoch": 934} {"train_loss": -38.138710021972656, "global_step": 113132, "epoch": 934} {"train_loss": -36.959999084472656, "global_step": 113133, "epoch": 934} {"train_loss": -36.85126378713561, "global_step": 113134, "epoch": 934, "val_loss": 2674378.25} {"train_loss": -37.46903610229492, "global_step": 113135, "epoch": 935} {"train_loss": -37.796749114990234, "global_step": 113136, "epoch": 935} {"train_loss": -38.6384162902832, "global_step": 113137, "epoch": 935} {"train_loss": -38.76306915283203, "global_step": 113138, "epoch": 935} {"train_loss": -37.77223205566406, "global_step": 113139, "epoch": 935} {"train_loss": -37.16525650024414, "global_step": 113140, "epoch": 935} {"train_loss": -38.24930953979492, "global_step": 113141, "epoch": 935} {"train_loss": -38.15401840209961, "global_step": 113142, "epoch": 935} {"train_loss": -38.31582260131836, "global_step": 113143, "epoch": 935} {"train_loss": -38.35163497924805, "global_step": 113144, "epoch": 935} {"train_loss": -37.943824768066406, "global_step": 113145, "epoch": 935} {"train_loss": -37.40190124511719, "global_step": 113146, "epoch": 935} {"train_loss": -36.32258224487305, "global_step": 113147, "epoch": 935} {"train_loss": -37.92877960205078, "global_step": 113148, "epoch": 935} {"train_loss": -38.70633316040039, "global_step": 113149, "epoch": 935} {"train_loss": -38.33198547363281, "global_step": 113150, "epoch": 935} {"train_loss": -39.12226486206055, "global_step": 113151, "epoch": 935} {"train_loss": -38.40079879760742, "global_step": 113152, "epoch": 935} {"train_loss": -39.050472259521484, "global_step": 113153, "epoch": 935} {"train_loss": -38.485652923583984, "global_step": 113154, "epoch": 935} {"train_loss": -38.932621002197266, "global_step": 113155, "epoch": 935} {"train_loss": -38.71235275268555, "global_step": 113156, "epoch": 935} {"train_loss": -38.69556427001953, "global_step": 113157, "epoch": 935} {"train_loss": -39.259517669677734, "global_step": 113158, "epoch": 935} {"train_loss": -38.86920166015625, "global_step": 113159, "epoch": 935} {"train_loss": -38.94132614135742, "global_step": 113160, "epoch": 935} {"train_loss": -38.48821258544922, "global_step": 113161, "epoch": 935} {"train_loss": -38.43978500366211, "global_step": 113162, "epoch": 935} {"train_loss": -37.876888275146484, "global_step": 113163, "epoch": 935} {"train_loss": -39.02960968017578, "global_step": 113164, "epoch": 935} {"train_loss": -39.00629425048828, "global_step": 113165, "epoch": 935} {"train_loss": -38.92402648925781, "global_step": 113166, "epoch": 935} {"train_loss": -38.95663070678711, "global_step": 113167, "epoch": 935} {"train_loss": -38.32108688354492, "global_step": 113168, "epoch": 935} {"train_loss": -39.58225631713867, "global_step": 113169, "epoch": 935} {"train_loss": -38.086421966552734, "global_step": 113170, "epoch": 935} {"train_loss": -37.28109359741211, "global_step": 113171, "epoch": 935} {"train_loss": -36.14569854736328, "global_step": 113172, "epoch": 935} {"train_loss": -36.654354095458984, "global_step": 113173, "epoch": 935} {"train_loss": -38.88897705078125, "global_step": 113174, "epoch": 935} {"train_loss": -38.73574447631836, "global_step": 113175, "epoch": 935} {"train_loss": -36.882171630859375, "global_step": 113176, "epoch": 935} {"train_loss": -38.19698715209961, "global_step": 113177, "epoch": 935} {"train_loss": -38.77367401123047, "global_step": 113178, "epoch": 935} {"train_loss": -38.13414001464844, "global_step": 113179, "epoch": 935} {"train_loss": -37.64776611328125, "global_step": 113180, "epoch": 935} {"train_loss": -38.04679489135742, "global_step": 113181, "epoch": 935} {"train_loss": -37.916900634765625, "global_step": 113182, "epoch": 935} {"train_loss": -38.025390625, "global_step": 113183, "epoch": 935} {"train_loss": -37.04624938964844, "global_step": 113184, "epoch": 935} {"train_loss": -36.8074951171875, "global_step": 113185, "epoch": 935} {"train_loss": -38.77704620361328, "global_step": 113186, "epoch": 935} {"train_loss": -36.864097595214844, "global_step": 113187, "epoch": 935} {"train_loss": -37.42654037475586, "global_step": 113188, "epoch": 935} {"train_loss": -38.12275314331055, "global_step": 113189, "epoch": 935} {"train_loss": -37.031951904296875, "global_step": 113190, "epoch": 935} {"train_loss": -38.15925216674805, "global_step": 113191, "epoch": 935} {"train_loss": -37.19091033935547, "global_step": 113192, "epoch": 935} {"train_loss": -36.67751693725586, "global_step": 113193, "epoch": 935} {"train_loss": -37.20595169067383, "global_step": 113194, "epoch": 935} {"train_loss": -36.4442253112793, "global_step": 113195, "epoch": 935} {"train_loss": -37.5129280090332, "global_step": 113196, "epoch": 935} {"train_loss": -36.2353630065918, "global_step": 113197, "epoch": 935} {"train_loss": -37.61149215698242, "global_step": 113198, "epoch": 935} {"train_loss": -37.612667083740234, "global_step": 113199, "epoch": 935} {"train_loss": -38.678138732910156, "global_step": 113200, "epoch": 935} {"train_loss": -36.93272018432617, "global_step": 113201, "epoch": 935} {"train_loss": -38.10110855102539, "global_step": 113202, "epoch": 935} {"train_loss": -37.853816986083984, "global_step": 113203, "epoch": 935} {"train_loss": -37.201778411865234, "global_step": 113204, "epoch": 935} {"train_loss": -36.640838623046875, "global_step": 113205, "epoch": 935} {"train_loss": -36.731502532958984, "global_step": 113206, "epoch": 935} {"train_loss": -37.36497497558594, "global_step": 113207, "epoch": 935} {"train_loss": -37.11708450317383, "global_step": 113208, "epoch": 935} {"train_loss": -37.81966018676758, "global_step": 113209, "epoch": 935} {"train_loss": -38.08865737915039, "global_step": 113210, "epoch": 935} {"train_loss": -37.039520263671875, "global_step": 113211, "epoch": 935} {"train_loss": -37.421600341796875, "global_step": 113212, "epoch": 935} {"train_loss": -36.42138671875, "global_step": 113213, "epoch": 935} {"train_loss": -37.724822998046875, "global_step": 113214, "epoch": 935} {"train_loss": -36.8337287902832, "global_step": 113215, "epoch": 935} {"train_loss": -37.17022705078125, "global_step": 113216, "epoch": 935} {"train_loss": -37.98711013793945, "global_step": 113217, "epoch": 935} {"train_loss": -37.941566467285156, "global_step": 113218, "epoch": 935} {"train_loss": -36.78506851196289, "global_step": 113219, "epoch": 935} {"train_loss": -37.6001091003418, "global_step": 113220, "epoch": 935} {"train_loss": -37.84978485107422, "global_step": 113221, "epoch": 935} {"train_loss": -36.37949752807617, "global_step": 113222, "epoch": 935} {"train_loss": -37.898799896240234, "global_step": 113223, "epoch": 935} {"train_loss": -38.1331901550293, "global_step": 113224, "epoch": 935} {"train_loss": -37.680660247802734, "global_step": 113225, "epoch": 935} {"train_loss": -37.70325469970703, "global_step": 113226, "epoch": 935} {"train_loss": -38.36118698120117, "global_step": 113227, "epoch": 935} {"train_loss": -38.175655364990234, "global_step": 113228, "epoch": 935} {"train_loss": -38.37478256225586, "global_step": 113229, "epoch": 935} {"train_loss": -37.805850982666016, "global_step": 113230, "epoch": 935} {"train_loss": -38.68928146362305, "global_step": 113231, "epoch": 935} {"train_loss": -38.75104904174805, "global_step": 113232, "epoch": 935} {"train_loss": -37.9693717956543, "global_step": 113233, "epoch": 935} {"train_loss": -38.933162689208984, "global_step": 113234, "epoch": 935} {"train_loss": -39.1660041809082, "global_step": 113235, "epoch": 935} {"train_loss": -38.58875274658203, "global_step": 113236, "epoch": 935} {"train_loss": -39.23789978027344, "global_step": 113237, "epoch": 935} {"train_loss": -38.63063430786133, "global_step": 113238, "epoch": 935} {"train_loss": -39.517887115478516, "global_step": 113239, "epoch": 935} {"train_loss": -38.5994758605957, "global_step": 113240, "epoch": 935} {"train_loss": -39.0832633972168, "global_step": 113241, "epoch": 935} {"train_loss": -38.848876953125, "global_step": 113242, "epoch": 935} {"train_loss": -39.41563034057617, "global_step": 113243, "epoch": 935} {"train_loss": -38.746002197265625, "global_step": 113244, "epoch": 935} {"train_loss": -38.772743225097656, "global_step": 113245, "epoch": 935} {"train_loss": -38.4726448059082, "global_step": 113246, "epoch": 935} {"train_loss": -38.56907272338867, "global_step": 113247, "epoch": 935} {"train_loss": -38.11664581298828, "global_step": 113248, "epoch": 935} {"train_loss": -38.30349349975586, "global_step": 113249, "epoch": 935} {"train_loss": -38.32743453979492, "global_step": 113250, "epoch": 935} {"train_loss": -38.51606369018555, "global_step": 113251, "epoch": 935} {"train_loss": -37.82926559448242, "global_step": 113252, "epoch": 935} {"train_loss": -35.790748596191406, "global_step": 113253, "epoch": 935} {"train_loss": -35.704341888427734, "global_step": 113254, "epoch": 935} {"train_loss": -37.96175286789571, "global_step": 113255, "epoch": 935, "val_loss": 2620825.25} {"train_loss": -38.00778579711914, "global_step": 113256, "epoch": 936} {"train_loss": -39.0305061340332, "global_step": 113257, "epoch": 936} {"train_loss": -37.515838623046875, "global_step": 113258, "epoch": 936} {"train_loss": -36.21104431152344, "global_step": 113259, "epoch": 936} {"train_loss": -39.07002639770508, "global_step": 113260, "epoch": 936} {"train_loss": -38.01005935668945, "global_step": 113261, "epoch": 936} {"train_loss": -37.487709045410156, "global_step": 113262, "epoch": 936} {"train_loss": -38.06313705444336, "global_step": 113263, "epoch": 936} {"train_loss": -38.609371185302734, "global_step": 113264, "epoch": 936} {"train_loss": -36.1366081237793, "global_step": 113265, "epoch": 936} {"train_loss": -37.62122344970703, "global_step": 113266, "epoch": 936} {"train_loss": -36.33237075805664, "global_step": 113267, "epoch": 936} {"train_loss": -34.41633224487305, "global_step": 113268, "epoch": 936} {"train_loss": -35.76261520385742, "global_step": 113269, "epoch": 936} {"train_loss": -38.14686965942383, "global_step": 113270, "epoch": 936} {"train_loss": -36.418495178222656, "global_step": 113271, "epoch": 936} {"train_loss": -35.626930236816406, "global_step": 113272, "epoch": 936} {"train_loss": -36.97671127319336, "global_step": 113273, "epoch": 936} {"train_loss": -33.15741729736328, "global_step": 113274, "epoch": 936} {"train_loss": -29.75917625427246, "global_step": 113275, "epoch": 936} {"train_loss": -31.408355712890625, "global_step": 113276, "epoch": 936} {"train_loss": -35.479248046875, "global_step": 113277, "epoch": 936} {"train_loss": -28.941165924072266, "global_step": 113278, "epoch": 936} {"train_loss": -23.66262435913086, "global_step": 113279, "epoch": 936} {"train_loss": -27.81007194519043, "global_step": 113280, "epoch": 936} {"train_loss": -35.69797897338867, "global_step": 113281, "epoch": 936} {"train_loss": -33.91131591796875, "global_step": 113282, "epoch": 936} {"train_loss": -30.64337730407715, "global_step": 113283, "epoch": 936} {"train_loss": -33.704437255859375, "global_step": 113284, "epoch": 936} {"train_loss": -28.051101684570312, "global_step": 113285, "epoch": 936} {"train_loss": -34.357357025146484, "global_step": 113286, "epoch": 936} {"train_loss": -32.859703063964844, "global_step": 113287, "epoch": 936} {"train_loss": -30.23406982421875, "global_step": 113288, "epoch": 936} {"train_loss": -30.852025985717773, "global_step": 113289, "epoch": 936} {"train_loss": -32.87705612182617, "global_step": 113290, "epoch": 936} {"train_loss": -29.15559196472168, "global_step": 113291, "epoch": 936} {"train_loss": -33.92930221557617, "global_step": 113292, "epoch": 936} {"train_loss": -31.376144409179688, "global_step": 113293, "epoch": 936} {"train_loss": -34.426753997802734, "global_step": 113294, "epoch": 936} {"train_loss": -30.301422119140625, "global_step": 113295, "epoch": 936} {"train_loss": -33.62293243408203, "global_step": 113296, "epoch": 936} {"train_loss": -33.59322738647461, "global_step": 113297, "epoch": 936} {"train_loss": -34.16243362426758, "global_step": 113298, "epoch": 936} {"train_loss": -33.6817626953125, "global_step": 113299, "epoch": 936} {"train_loss": -35.44165802001953, "global_step": 113300, "epoch": 936} {"train_loss": -34.346004486083984, "global_step": 113301, "epoch": 936} {"train_loss": -35.27080154418945, "global_step": 113302, "epoch": 936} {"train_loss": -34.51103591918945, "global_step": 113303, "epoch": 936} {"train_loss": -34.230167388916016, "global_step": 113304, "epoch": 936} {"train_loss": -34.607845306396484, "global_step": 113305, "epoch": 936} {"train_loss": -35.300506591796875, "global_step": 113306, "epoch": 936} {"train_loss": -35.6284294128418, "global_step": 113307, "epoch": 936} {"train_loss": -34.348304748535156, "global_step": 113308, "epoch": 936} {"train_loss": -36.07521438598633, "global_step": 113309, "epoch": 936} {"train_loss": -35.51652145385742, "global_step": 113310, "epoch": 936} {"train_loss": -35.28266143798828, "global_step": 113311, "epoch": 936} {"train_loss": -35.15232849121094, "global_step": 113312, "epoch": 936} {"train_loss": -35.55827713012695, "global_step": 113313, "epoch": 936} {"train_loss": -35.659358978271484, "global_step": 113314, "epoch": 936} {"train_loss": -36.29501724243164, "global_step": 113315, "epoch": 936} {"train_loss": -34.93897247314453, "global_step": 113316, "epoch": 936} {"train_loss": -35.93313980102539, "global_step": 113317, "epoch": 936} {"train_loss": -35.91046142578125, "global_step": 113318, "epoch": 936} {"train_loss": -36.5827522277832, "global_step": 113319, "epoch": 936} {"train_loss": -36.01567459106445, "global_step": 113320, "epoch": 936} {"train_loss": -36.649593353271484, "global_step": 113321, "epoch": 936} {"train_loss": -36.3491325378418, "global_step": 113322, "epoch": 936} {"train_loss": -36.533451080322266, "global_step": 113323, "epoch": 936} {"train_loss": -36.154640197753906, "global_step": 113324, "epoch": 936} {"train_loss": -35.94099044799805, "global_step": 113325, "epoch": 936} {"train_loss": -36.33913040161133, "global_step": 113326, "epoch": 936} {"train_loss": -36.0607795715332, "global_step": 113327, "epoch": 936} {"train_loss": -36.066131591796875, "global_step": 113328, "epoch": 936} {"train_loss": -36.74420166015625, "global_step": 113329, "epoch": 936} {"train_loss": -36.714805603027344, "global_step": 113330, "epoch": 936} {"train_loss": -36.72672653198242, "global_step": 113331, "epoch": 936} {"train_loss": -37.500732421875, "global_step": 113332, "epoch": 936} {"train_loss": -36.520545959472656, "global_step": 113333, "epoch": 936} {"train_loss": -36.938636779785156, "global_step": 113334, "epoch": 936} {"train_loss": -36.78693389892578, "global_step": 113335, "epoch": 936} {"train_loss": -36.7705192565918, "global_step": 113336, "epoch": 936} {"train_loss": -36.778045654296875, "global_step": 113337, "epoch": 936} {"train_loss": -37.11442184448242, "global_step": 113338, "epoch": 936} {"train_loss": -37.48952865600586, "global_step": 113339, "epoch": 936} {"train_loss": -37.2536735534668, "global_step": 113340, "epoch": 936} {"train_loss": -37.29118728637695, "global_step": 113341, "epoch": 936} {"train_loss": -36.46723556518555, "global_step": 113342, "epoch": 936} {"train_loss": -37.51893997192383, "global_step": 113343, "epoch": 936} {"train_loss": -37.43278121948242, "global_step": 113344, "epoch": 936} {"train_loss": -37.2365837097168, "global_step": 113345, "epoch": 936} {"train_loss": -36.93159866333008, "global_step": 113346, "epoch": 936} {"train_loss": -37.10650634765625, "global_step": 113347, "epoch": 936} {"train_loss": -37.586181640625, "global_step": 113348, "epoch": 936} {"train_loss": -37.70819854736328, "global_step": 113349, "epoch": 936} {"train_loss": -37.364906311035156, "global_step": 113350, "epoch": 936} {"train_loss": -37.938167572021484, "global_step": 113351, "epoch": 936} {"train_loss": -38.263431549072266, "global_step": 113352, "epoch": 936} {"train_loss": -37.63077163696289, "global_step": 113353, "epoch": 936} {"train_loss": -37.66352081298828, "global_step": 113354, "epoch": 936} {"train_loss": -37.81739044189453, "global_step": 113355, "epoch": 936} {"train_loss": -38.00390625, "global_step": 113356, "epoch": 936} {"train_loss": -37.847747802734375, "global_step": 113357, "epoch": 936} {"train_loss": -37.899017333984375, "global_step": 113358, "epoch": 936} {"train_loss": -37.649837493896484, "global_step": 113359, "epoch": 936} {"train_loss": -38.196800231933594, "global_step": 113360, "epoch": 936} {"train_loss": -37.85033416748047, "global_step": 113361, "epoch": 936} {"train_loss": -37.94514846801758, "global_step": 113362, "epoch": 936} {"train_loss": -37.627288818359375, "global_step": 113363, "epoch": 936} {"train_loss": -38.09130859375, "global_step": 113364, "epoch": 936} {"train_loss": -38.192237854003906, "global_step": 113365, "epoch": 936} {"train_loss": -38.0816650390625, "global_step": 113366, "epoch": 936} {"train_loss": -38.062259674072266, "global_step": 113367, "epoch": 936} {"train_loss": -37.76615524291992, "global_step": 113368, "epoch": 936} {"train_loss": -38.16408920288086, "global_step": 113369, "epoch": 936} {"train_loss": -38.433349609375, "global_step": 113370, "epoch": 936} {"train_loss": -38.223690032958984, "global_step": 113371, "epoch": 936} {"train_loss": -37.97802734375, "global_step": 113372, "epoch": 936} {"train_loss": -38.66822814941406, "global_step": 113373, "epoch": 936} {"train_loss": -38.34587860107422, "global_step": 113374, "epoch": 936} {"train_loss": -38.0484619140625, "global_step": 113375, "epoch": 936} {"train_loss": -35.81573787405471, "global_step": 113376, "epoch": 936, "val_loss": 2773360.75} {"train_loss": -38.21559524536133, "global_step": 113377, "epoch": 937} {"train_loss": -38.68832015991211, "global_step": 113378, "epoch": 937} {"train_loss": -38.518646240234375, "global_step": 113379, "epoch": 937} {"train_loss": -38.667598724365234, "global_step": 113380, "epoch": 937} {"train_loss": -38.61076736450195, "global_step": 113381, "epoch": 937} {"train_loss": -38.12874221801758, "global_step": 113382, "epoch": 937} {"train_loss": -38.336544036865234, "global_step": 113383, "epoch": 937} {"train_loss": -38.6351432800293, "global_step": 113384, "epoch": 937} {"train_loss": -38.704227447509766, "global_step": 113385, "epoch": 937} {"train_loss": -38.8333625793457, "global_step": 113386, "epoch": 937} {"train_loss": -37.34119415283203, "global_step": 113387, "epoch": 937} {"train_loss": -38.86756896972656, "global_step": 113388, "epoch": 937} {"train_loss": -39.02523422241211, "global_step": 113389, "epoch": 937} {"train_loss": -39.031822204589844, "global_step": 113390, "epoch": 937} {"train_loss": -38.4968376159668, "global_step": 113391, "epoch": 937} {"train_loss": -39.15287399291992, "global_step": 113392, "epoch": 937} {"train_loss": -38.8316764831543, "global_step": 113393, "epoch": 937} {"train_loss": -38.80141830444336, "global_step": 113394, "epoch": 937} {"train_loss": -38.885982513427734, "global_step": 113395, "epoch": 937} {"train_loss": -39.27281188964844, "global_step": 113396, "epoch": 937} {"train_loss": -39.012813568115234, "global_step": 113397, "epoch": 937} {"train_loss": -38.748783111572266, "global_step": 113398, "epoch": 937} {"train_loss": -38.7578010559082, "global_step": 113399, "epoch": 937} {"train_loss": -38.05146789550781, "global_step": 113400, "epoch": 937} {"train_loss": -38.87809371948242, "global_step": 113401, "epoch": 937} {"train_loss": -39.098670959472656, "global_step": 113402, "epoch": 937} {"train_loss": -38.6837272644043, "global_step": 113403, "epoch": 937} {"train_loss": -39.35188674926758, "global_step": 113404, "epoch": 937} {"train_loss": -39.05268478393555, "global_step": 113405, "epoch": 937} {"train_loss": -38.70026779174805, "global_step": 113406, "epoch": 937} {"train_loss": -38.649410247802734, "global_step": 113407, "epoch": 937} {"train_loss": -39.39424514770508, "global_step": 113408, "epoch": 937} {"train_loss": -39.515804290771484, "global_step": 113409, "epoch": 937} {"train_loss": -39.20846939086914, "global_step": 113410, "epoch": 937} {"train_loss": -39.01460647583008, "global_step": 113411, "epoch": 937} {"train_loss": -38.975128173828125, "global_step": 113412, "epoch": 937} {"train_loss": -38.918434143066406, "global_step": 113413, "epoch": 937} {"train_loss": -38.38713455200195, "global_step": 113414, "epoch": 937} {"train_loss": -39.5124626159668, "global_step": 113415, "epoch": 937} {"train_loss": -38.633785247802734, "global_step": 113416, "epoch": 937} {"train_loss": -38.48670196533203, "global_step": 113417, "epoch": 937} {"train_loss": -39.23629379272461, "global_step": 113418, "epoch": 937} {"train_loss": -38.202239990234375, "global_step": 113419, "epoch": 937} {"train_loss": -38.87640380859375, "global_step": 113420, "epoch": 937} {"train_loss": -38.33778762817383, "global_step": 113421, "epoch": 937} {"train_loss": -39.49148178100586, "global_step": 113422, "epoch": 937} {"train_loss": -39.135414123535156, "global_step": 113423, "epoch": 937} {"train_loss": -38.406494140625, "global_step": 113424, "epoch": 937} {"train_loss": -38.455257415771484, "global_step": 113425, "epoch": 937} {"train_loss": -39.234764099121094, "global_step": 113426, "epoch": 937} {"train_loss": -39.21235275268555, "global_step": 113427, "epoch": 937} {"train_loss": -39.442073822021484, "global_step": 113428, "epoch": 937} {"train_loss": -39.50679397583008, "global_step": 113429, "epoch": 937} {"train_loss": -38.03123092651367, "global_step": 113430, "epoch": 937} {"train_loss": -38.456783294677734, "global_step": 113431, "epoch": 937} {"train_loss": -38.25827407836914, "global_step": 113432, "epoch": 937} {"train_loss": -39.348114013671875, "global_step": 113433, "epoch": 937} {"train_loss": -36.144447326660156, "global_step": 113434, "epoch": 937} {"train_loss": -34.22440719604492, "global_step": 113435, "epoch": 937} {"train_loss": -33.807308197021484, "global_step": 113436, "epoch": 937} {"train_loss": -36.27933883666992, "global_step": 113437, "epoch": 937} {"train_loss": -32.09634780883789, "global_step": 113438, "epoch": 937} {"train_loss": -38.1606330871582, "global_step": 113439, "epoch": 937} {"train_loss": -28.569578170776367, "global_step": 113440, "epoch": 937} {"train_loss": -31.5741024017334, "global_step": 113441, "epoch": 937} {"train_loss": -34.538936614990234, "global_step": 113442, "epoch": 937} {"train_loss": -34.62086868286133, "global_step": 113443, "epoch": 937} {"train_loss": -36.31195068359375, "global_step": 113444, "epoch": 937} {"train_loss": -33.099708557128906, "global_step": 113445, "epoch": 937} {"train_loss": -34.61393356323242, "global_step": 113446, "epoch": 937} {"train_loss": -32.87186050415039, "global_step": 113447, "epoch": 937} {"train_loss": -33.60056686401367, "global_step": 113448, "epoch": 937} {"train_loss": -32.447086334228516, "global_step": 113449, "epoch": 937} {"train_loss": -35.20037841796875, "global_step": 113450, "epoch": 937} {"train_loss": -34.994171142578125, "global_step": 113451, "epoch": 937} {"train_loss": -35.27413558959961, "global_step": 113452, "epoch": 937} {"train_loss": -36.86407470703125, "global_step": 113453, "epoch": 937} {"train_loss": -35.75439453125, "global_step": 113454, "epoch": 937} {"train_loss": -35.782493591308594, "global_step": 113455, "epoch": 937} {"train_loss": -36.23339080810547, "global_step": 113456, "epoch": 937} {"train_loss": -36.8908805847168, "global_step": 113457, "epoch": 937} {"train_loss": -36.6552619934082, "global_step": 113458, "epoch": 937} {"train_loss": -35.684608459472656, "global_step": 113459, "epoch": 937} {"train_loss": -37.49011993408203, "global_step": 113460, "epoch": 937} {"train_loss": -36.81574630737305, "global_step": 113461, "epoch": 937} {"train_loss": -36.490413665771484, "global_step": 113462, "epoch": 937} {"train_loss": -37.575782775878906, "global_step": 113463, "epoch": 937} {"train_loss": -36.97962188720703, "global_step": 113464, "epoch": 937} {"train_loss": -37.13447189331055, "global_step": 113465, "epoch": 937} {"train_loss": -37.001705169677734, "global_step": 113466, "epoch": 937} {"train_loss": -36.5133171081543, "global_step": 113467, "epoch": 937} {"train_loss": -37.57276916503906, "global_step": 113468, "epoch": 937} {"train_loss": -36.795841217041016, "global_step": 113469, "epoch": 937} {"train_loss": -38.05225372314453, "global_step": 113470, "epoch": 937} {"train_loss": -36.71937561035156, "global_step": 113471, "epoch": 937} {"train_loss": -37.74489974975586, "global_step": 113472, "epoch": 937} {"train_loss": -35.29285430908203, "global_step": 113473, "epoch": 937} {"train_loss": -37.83040237426758, "global_step": 113474, "epoch": 937} {"train_loss": -37.79212951660156, "global_step": 113475, "epoch": 937} {"train_loss": -37.94063186645508, "global_step": 113476, "epoch": 937} {"train_loss": -38.055416107177734, "global_step": 113477, "epoch": 937} {"train_loss": -37.93134307861328, "global_step": 113478, "epoch": 937} {"train_loss": -38.09629821777344, "global_step": 113479, "epoch": 937} {"train_loss": -37.85041427612305, "global_step": 113480, "epoch": 937} {"train_loss": -37.95307540893555, "global_step": 113481, "epoch": 937} {"train_loss": -38.01306915283203, "global_step": 113482, "epoch": 937} {"train_loss": -38.50240707397461, "global_step": 113483, "epoch": 937} {"train_loss": -38.16576385498047, "global_step": 113484, "epoch": 937} {"train_loss": -38.10993194580078, "global_step": 113485, "epoch": 937} {"train_loss": -38.89504623413086, "global_step": 113486, "epoch": 937} {"train_loss": -38.77366256713867, "global_step": 113487, "epoch": 937} {"train_loss": -38.117431640625, "global_step": 113488, "epoch": 937} {"train_loss": -38.434814453125, "global_step": 113489, "epoch": 937} {"train_loss": -38.59387969970703, "global_step": 113490, "epoch": 937} {"train_loss": -38.69807052612305, "global_step": 113491, "epoch": 937} {"train_loss": -38.5713005065918, "global_step": 113492, "epoch": 937} {"train_loss": -38.34922790527344, "global_step": 113493, "epoch": 937} {"train_loss": -39.00291061401367, "global_step": 113494, "epoch": 937} {"train_loss": -38.19607162475586, "global_step": 113495, "epoch": 937} {"train_loss": -38.720455169677734, "global_step": 113496, "epoch": 937} {"train_loss": -37.615285447806365, "global_step": 113497, "epoch": 937, "val_loss": 2685041.0} {"train_loss": -38.71199417114258, "global_step": 113498, "epoch": 938} {"train_loss": -38.496910095214844, "global_step": 113499, "epoch": 938} {"train_loss": -38.05567169189453, "global_step": 113500, "epoch": 938} {"train_loss": -38.539615631103516, "global_step": 113501, "epoch": 938} {"train_loss": -38.36933517456055, "global_step": 113502, "epoch": 938} {"train_loss": -39.18503189086914, "global_step": 113503, "epoch": 938} {"train_loss": -38.70228576660156, "global_step": 113504, "epoch": 938} {"train_loss": -38.37233352661133, "global_step": 113505, "epoch": 938} {"train_loss": -37.908992767333984, "global_step": 113506, "epoch": 938} {"train_loss": -38.35500717163086, "global_step": 113507, "epoch": 938} {"train_loss": -38.10057067871094, "global_step": 113508, "epoch": 938} {"train_loss": -38.39813232421875, "global_step": 113509, "epoch": 938} {"train_loss": -38.82048416137695, "global_step": 113510, "epoch": 938} {"train_loss": -39.0200080871582, "global_step": 113511, "epoch": 938} {"train_loss": -39.257057189941406, "global_step": 113512, "epoch": 938} {"train_loss": -38.72404098510742, "global_step": 113513, "epoch": 938} {"train_loss": -38.86381530761719, "global_step": 113514, "epoch": 938} {"train_loss": -38.16728591918945, "global_step": 113515, "epoch": 938} {"train_loss": -38.451961517333984, "global_step": 113516, "epoch": 938} {"train_loss": -38.9096565246582, "global_step": 113517, "epoch": 938} {"train_loss": -39.371463775634766, "global_step": 113518, "epoch": 938} {"train_loss": -38.77581787109375, "global_step": 113519, "epoch": 938} {"train_loss": -38.88523864746094, "global_step": 113520, "epoch": 938} {"train_loss": -39.30216598510742, "global_step": 113521, "epoch": 938} {"train_loss": -38.41947555541992, "global_step": 113522, "epoch": 938} {"train_loss": -38.036834716796875, "global_step": 113523, "epoch": 938} {"train_loss": -37.98933792114258, "global_step": 113524, "epoch": 938} {"train_loss": -37.1755485534668, "global_step": 113525, "epoch": 938} {"train_loss": -38.49897384643555, "global_step": 113526, "epoch": 938} {"train_loss": -39.08181381225586, "global_step": 113527, "epoch": 938} {"train_loss": -37.03935623168945, "global_step": 113528, "epoch": 938} {"train_loss": -38.495826721191406, "global_step": 113529, "epoch": 938} {"train_loss": -37.77114486694336, "global_step": 113530, "epoch": 938} {"train_loss": -38.64437484741211, "global_step": 113531, "epoch": 938} {"train_loss": -38.21132278442383, "global_step": 113532, "epoch": 938} {"train_loss": -35.63606262207031, "global_step": 113533, "epoch": 938} {"train_loss": -37.29571533203125, "global_step": 113534, "epoch": 938} {"train_loss": -37.516788482666016, "global_step": 113535, "epoch": 938} {"train_loss": -37.685646057128906, "global_step": 113536, "epoch": 938} {"train_loss": -38.77717208862305, "global_step": 113537, "epoch": 938} {"train_loss": -38.376708984375, "global_step": 113538, "epoch": 938} {"train_loss": -38.4455680847168, "global_step": 113539, "epoch": 938} {"train_loss": -38.06758499145508, "global_step": 113540, "epoch": 938} {"train_loss": -38.27471160888672, "global_step": 113541, "epoch": 938} {"train_loss": -37.687110900878906, "global_step": 113542, "epoch": 938} {"train_loss": -36.7431526184082, "global_step": 113543, "epoch": 938} {"train_loss": -38.156829833984375, "global_step": 113544, "epoch": 938} {"train_loss": -37.143585205078125, "global_step": 113545, "epoch": 938} {"train_loss": -36.0733642578125, "global_step": 113546, "epoch": 938} {"train_loss": -32.0357666015625, "global_step": 113547, "epoch": 938} {"train_loss": -37.203277587890625, "global_step": 113548, "epoch": 938} {"train_loss": -36.90420913696289, "global_step": 113549, "epoch": 938} {"train_loss": -36.811256408691406, "global_step": 113550, "epoch": 938} {"train_loss": -35.336788177490234, "global_step": 113551, "epoch": 938} {"train_loss": -33.348236083984375, "global_step": 113552, "epoch": 938} {"train_loss": -36.26401901245117, "global_step": 113553, "epoch": 938} {"train_loss": -36.948394775390625, "global_step": 113554, "epoch": 938} {"train_loss": -34.2535514831543, "global_step": 113555, "epoch": 938} {"train_loss": -33.11915588378906, "global_step": 113556, "epoch": 938} {"train_loss": -33.79460144042969, "global_step": 113557, "epoch": 938} {"train_loss": -35.52106475830078, "global_step": 113558, "epoch": 938} {"train_loss": -36.12434005737305, "global_step": 113559, "epoch": 938} {"train_loss": -35.160884857177734, "global_step": 113560, "epoch": 938} {"train_loss": -35.451416015625, "global_step": 113561, "epoch": 938} {"train_loss": -36.256465911865234, "global_step": 113562, "epoch": 938} {"train_loss": -36.998390197753906, "global_step": 113563, "epoch": 938} {"train_loss": -36.56321334838867, "global_step": 113564, "epoch": 938} {"train_loss": -35.88264846801758, "global_step": 113565, "epoch": 938} {"train_loss": -35.98899459838867, "global_step": 113566, "epoch": 938} {"train_loss": -35.59937286376953, "global_step": 113567, "epoch": 938} {"train_loss": -33.29990768432617, "global_step": 113568, "epoch": 938} {"train_loss": -35.04555130004883, "global_step": 113569, "epoch": 938} {"train_loss": -34.66598892211914, "global_step": 113570, "epoch": 938} {"train_loss": -36.726722717285156, "global_step": 113571, "epoch": 938} {"train_loss": -34.58892822265625, "global_step": 113572, "epoch": 938} {"train_loss": -36.120155334472656, "global_step": 113573, "epoch": 938} {"train_loss": -33.869625091552734, "global_step": 113574, "epoch": 938} {"train_loss": -37.26604080200195, "global_step": 113575, "epoch": 938} {"train_loss": -37.37482452392578, "global_step": 113576, "epoch": 938} {"train_loss": -35.164146423339844, "global_step": 113577, "epoch": 938} {"train_loss": -36.774532318115234, "global_step": 113578, "epoch": 938} {"train_loss": -35.274959564208984, "global_step": 113579, "epoch": 938} {"train_loss": -36.72992706298828, "global_step": 113580, "epoch": 938} {"train_loss": -36.5373420715332, "global_step": 113581, "epoch": 938} {"train_loss": -36.34882736206055, "global_step": 113582, "epoch": 938} {"train_loss": -36.51572799682617, "global_step": 113583, "epoch": 938} {"train_loss": -36.9443244934082, "global_step": 113584, "epoch": 938} {"train_loss": -37.49978256225586, "global_step": 113585, "epoch": 938} {"train_loss": -35.887115478515625, "global_step": 113586, "epoch": 938} {"train_loss": -36.531280517578125, "global_step": 113587, "epoch": 938} {"train_loss": -36.51991653442383, "global_step": 113588, "epoch": 938} {"train_loss": -37.45564651489258, "global_step": 113589, "epoch": 938} {"train_loss": -37.006160736083984, "global_step": 113590, "epoch": 938} {"train_loss": -37.407508850097656, "global_step": 113591, "epoch": 938} {"train_loss": -36.911197662353516, "global_step": 113592, "epoch": 938} {"train_loss": -37.69395065307617, "global_step": 113593, "epoch": 938} {"train_loss": -37.945518493652344, "global_step": 113594, "epoch": 938} {"train_loss": -37.150062561035156, "global_step": 113595, "epoch": 938} {"train_loss": -36.329002380371094, "global_step": 113596, "epoch": 938} {"train_loss": -38.22481155395508, "global_step": 113597, "epoch": 938} {"train_loss": -37.912322998046875, "global_step": 113598, "epoch": 938} {"train_loss": -38.008121490478516, "global_step": 113599, "epoch": 938} {"train_loss": -37.893428802490234, "global_step": 113600, "epoch": 938} {"train_loss": -37.43089294433594, "global_step": 113601, "epoch": 938} {"train_loss": -37.96184158325195, "global_step": 113602, "epoch": 938} {"train_loss": -38.27290344238281, "global_step": 113603, "epoch": 938} {"train_loss": -37.81069564819336, "global_step": 113604, "epoch": 938} {"train_loss": -37.95612716674805, "global_step": 113605, "epoch": 938} {"train_loss": -38.40543746948242, "global_step": 113606, "epoch": 938} {"train_loss": -38.53568649291992, "global_step": 113607, "epoch": 938} {"train_loss": -38.08799362182617, "global_step": 113608, "epoch": 938} {"train_loss": -38.48455047607422, "global_step": 113609, "epoch": 938} {"train_loss": -38.62094497680664, "global_step": 113610, "epoch": 938} {"train_loss": -38.741539001464844, "global_step": 113611, "epoch": 938} {"train_loss": -38.345985412597656, "global_step": 113612, "epoch": 938} {"train_loss": -38.74800491333008, "global_step": 113613, "epoch": 938} {"train_loss": -38.42413330078125, "global_step": 113614, "epoch": 938} {"train_loss": -38.13249969482422, "global_step": 113615, "epoch": 938} {"train_loss": -38.265419006347656, "global_step": 113616, "epoch": 938} {"train_loss": -38.42105484008789, "global_step": 113617, "epoch": 938} {"train_loss": -37.300964607680136, "global_step": 113618, "epoch": 938, "val_loss": 2686474.25} {"train_loss": -38.65081787109375, "global_step": 113619, "epoch": 939} {"train_loss": -38.79084014892578, "global_step": 113620, "epoch": 939} {"train_loss": -38.22721862792969, "global_step": 113621, "epoch": 939} {"train_loss": -38.4928092956543, "global_step": 113622, "epoch": 939} {"train_loss": -38.717018127441406, "global_step": 113623, "epoch": 939} {"train_loss": -38.672119140625, "global_step": 113624, "epoch": 939} {"train_loss": -39.04508590698242, "global_step": 113625, "epoch": 939} {"train_loss": -38.962799072265625, "global_step": 113626, "epoch": 939} {"train_loss": -38.845306396484375, "global_step": 113627, "epoch": 939} {"train_loss": -39.05982208251953, "global_step": 113628, "epoch": 939} {"train_loss": -39.342525482177734, "global_step": 113629, "epoch": 939} {"train_loss": -39.085670471191406, "global_step": 113630, "epoch": 939} {"train_loss": -38.786956787109375, "global_step": 113631, "epoch": 939} {"train_loss": -38.3400764465332, "global_step": 113632, "epoch": 939} {"train_loss": -35.79171371459961, "global_step": 113633, "epoch": 939} {"train_loss": -33.33274841308594, "global_step": 113634, "epoch": 939} {"train_loss": -29.848474502563477, "global_step": 113635, "epoch": 939} {"train_loss": -28.1588191986084, "global_step": 113636, "epoch": 939} {"train_loss": -33.39598846435547, "global_step": 113637, "epoch": 939} {"train_loss": -37.442588806152344, "global_step": 113638, "epoch": 939} {"train_loss": -36.8558235168457, "global_step": 113639, "epoch": 939} {"train_loss": -37.347816467285156, "global_step": 113640, "epoch": 939} {"train_loss": -38.03853225708008, "global_step": 113641, "epoch": 939} {"train_loss": -35.61836242675781, "global_step": 113642, "epoch": 939} {"train_loss": -35.73711013793945, "global_step": 113643, "epoch": 939} {"train_loss": -38.31705856323242, "global_step": 113644, "epoch": 939} {"train_loss": -36.812076568603516, "global_step": 113645, "epoch": 939} {"train_loss": -38.38755416870117, "global_step": 113646, "epoch": 939} {"train_loss": -36.92510986328125, "global_step": 113647, "epoch": 939} {"train_loss": -36.785926818847656, "global_step": 113648, "epoch": 939} {"train_loss": -38.83855056762695, "global_step": 113649, "epoch": 939} {"train_loss": -36.0784797668457, "global_step": 113650, "epoch": 939} {"train_loss": -38.486324310302734, "global_step": 113651, "epoch": 939} {"train_loss": -36.62095260620117, "global_step": 113652, "epoch": 939} {"train_loss": -37.833106994628906, "global_step": 113653, "epoch": 939} {"train_loss": -38.21638488769531, "global_step": 113654, "epoch": 939} {"train_loss": -37.97834396362305, "global_step": 113655, "epoch": 939} {"train_loss": -37.74928665161133, "global_step": 113656, "epoch": 939} {"train_loss": -37.62225341796875, "global_step": 113657, "epoch": 939} {"train_loss": -37.94390869140625, "global_step": 113658, "epoch": 939} {"train_loss": -38.322872161865234, "global_step": 113659, "epoch": 939} {"train_loss": -37.33635330200195, "global_step": 113660, "epoch": 939} {"train_loss": -38.329673767089844, "global_step": 113661, "epoch": 939} {"train_loss": -37.75255584716797, "global_step": 113662, "epoch": 939} {"train_loss": -38.44430160522461, "global_step": 113663, "epoch": 939} {"train_loss": -37.73870086669922, "global_step": 113664, "epoch": 939} {"train_loss": -38.55660629272461, "global_step": 113665, "epoch": 939} {"train_loss": -37.403934478759766, "global_step": 113666, "epoch": 939} {"train_loss": -37.74634552001953, "global_step": 113667, "epoch": 939} {"train_loss": -38.173709869384766, "global_step": 113668, "epoch": 939} {"train_loss": -38.03666687011719, "global_step": 113669, "epoch": 939} {"train_loss": -37.915470123291016, "global_step": 113670, "epoch": 939} {"train_loss": -37.656490325927734, "global_step": 113671, "epoch": 939} {"train_loss": -38.90386199951172, "global_step": 113672, "epoch": 939} {"train_loss": -38.216583251953125, "global_step": 113673, "epoch": 939} {"train_loss": -38.746315002441406, "global_step": 113674, "epoch": 939} {"train_loss": -38.96555709838867, "global_step": 113675, "epoch": 939} {"train_loss": -38.6754150390625, "global_step": 113676, "epoch": 939} {"train_loss": -38.51998519897461, "global_step": 113677, "epoch": 939} {"train_loss": -39.201786041259766, "global_step": 113678, "epoch": 939} {"train_loss": -38.911842346191406, "global_step": 113679, "epoch": 939} {"train_loss": -38.24036407470703, "global_step": 113680, "epoch": 939} {"train_loss": -38.06858825683594, "global_step": 113681, "epoch": 939} {"train_loss": -38.326351165771484, "global_step": 113682, "epoch": 939} {"train_loss": -38.81359100341797, "global_step": 113683, "epoch": 939} {"train_loss": -37.56431579589844, "global_step": 113684, "epoch": 939} {"train_loss": -35.93057632446289, "global_step": 113685, "epoch": 939} {"train_loss": -36.74359130859375, "global_step": 113686, "epoch": 939} {"train_loss": -38.18337631225586, "global_step": 113687, "epoch": 939} {"train_loss": -36.993621826171875, "global_step": 113688, "epoch": 939} {"train_loss": -38.42890548706055, "global_step": 113689, "epoch": 939} {"train_loss": -39.615421295166016, "global_step": 113690, "epoch": 939} {"train_loss": -38.443382263183594, "global_step": 113691, "epoch": 939} {"train_loss": -37.63905334472656, "global_step": 113692, "epoch": 939} {"train_loss": -38.195499420166016, "global_step": 113693, "epoch": 939} {"train_loss": -39.39466857910156, "global_step": 113694, "epoch": 939} {"train_loss": -38.614540100097656, "global_step": 113695, "epoch": 939} {"train_loss": -37.346065521240234, "global_step": 113696, "epoch": 939} {"train_loss": -38.00226974487305, "global_step": 113697, "epoch": 939} {"train_loss": -39.105499267578125, "global_step": 113698, "epoch": 939} {"train_loss": -38.99232864379883, "global_step": 113699, "epoch": 939} {"train_loss": -38.094112396240234, "global_step": 113700, "epoch": 939} {"train_loss": -38.84695053100586, "global_step": 113701, "epoch": 939} {"train_loss": -38.96989059448242, "global_step": 113702, "epoch": 939} {"train_loss": -38.65140914916992, "global_step": 113703, "epoch": 939} {"train_loss": -39.21552276611328, "global_step": 113704, "epoch": 939} {"train_loss": -38.662723541259766, "global_step": 113705, "epoch": 939} {"train_loss": -38.559993743896484, "global_step": 113706, "epoch": 939} {"train_loss": -38.874183654785156, "global_step": 113707, "epoch": 939} {"train_loss": -38.11494064331055, "global_step": 113708, "epoch": 939} {"train_loss": -38.49679183959961, "global_step": 113709, "epoch": 939} {"train_loss": -38.8947868347168, "global_step": 113710, "epoch": 939} {"train_loss": -38.11506652832031, "global_step": 113711, "epoch": 939} {"train_loss": -39.151329040527344, "global_step": 113712, "epoch": 939} {"train_loss": -38.27132797241211, "global_step": 113713, "epoch": 939} {"train_loss": -38.38977813720703, "global_step": 113714, "epoch": 939} {"train_loss": -38.56144332885742, "global_step": 113715, "epoch": 939} {"train_loss": -38.78559494018555, "global_step": 113716, "epoch": 939} {"train_loss": -39.354854583740234, "global_step": 113717, "epoch": 939} {"train_loss": -38.032264709472656, "global_step": 113718, "epoch": 939} {"train_loss": -36.47394561767578, "global_step": 113719, "epoch": 939} {"train_loss": -38.55409622192383, "global_step": 113720, "epoch": 939} {"train_loss": -39.613101959228516, "global_step": 113721, "epoch": 939} {"train_loss": -39.221038818359375, "global_step": 113722, "epoch": 939} {"train_loss": -37.72892761230469, "global_step": 113723, "epoch": 939} {"train_loss": -37.52992248535156, "global_step": 113724, "epoch": 939} {"train_loss": -38.67744064331055, "global_step": 113725, "epoch": 939} {"train_loss": -38.958736419677734, "global_step": 113726, "epoch": 939} {"train_loss": -37.60661697387695, "global_step": 113727, "epoch": 939} {"train_loss": -38.814571380615234, "global_step": 113728, "epoch": 939} {"train_loss": -39.067440032958984, "global_step": 113729, "epoch": 939} {"train_loss": -38.28425216674805, "global_step": 113730, "epoch": 939} {"train_loss": -38.3125114440918, "global_step": 113731, "epoch": 939} {"train_loss": -38.88396072387695, "global_step": 113732, "epoch": 939} {"train_loss": -39.175472259521484, "global_step": 113733, "epoch": 939} {"train_loss": -38.41286849975586, "global_step": 113734, "epoch": 939} {"train_loss": -39.520259857177734, "global_step": 113735, "epoch": 939} {"train_loss": -38.61846923828125, "global_step": 113736, "epoch": 939} {"train_loss": -38.3260383605957, "global_step": 113737, "epoch": 939} {"train_loss": -38.91590118408203, "global_step": 113738, "epoch": 939} {"train_loss": -38.00009202563073, "global_step": 113739, "epoch": 939, "val_loss": 2699916.75} {"train_loss": -39.877742767333984, "global_step": 113740, "epoch": 940} {"train_loss": -39.15264892578125, "global_step": 113741, "epoch": 940} {"train_loss": -37.596435546875, "global_step": 113742, "epoch": 940} {"train_loss": -38.762306213378906, "global_step": 113743, "epoch": 940} {"train_loss": -38.51417922973633, "global_step": 113744, "epoch": 940} {"train_loss": -38.17317581176758, "global_step": 113745, "epoch": 940} {"train_loss": -38.29713821411133, "global_step": 113746, "epoch": 940} {"train_loss": -39.042999267578125, "global_step": 113747, "epoch": 940} {"train_loss": -37.12333297729492, "global_step": 113748, "epoch": 940} {"train_loss": -36.589134216308594, "global_step": 113749, "epoch": 940} {"train_loss": -37.61345291137695, "global_step": 113750, "epoch": 940} {"train_loss": -38.17563247680664, "global_step": 113751, "epoch": 940} {"train_loss": -38.815467834472656, "global_step": 113752, "epoch": 940} {"train_loss": -36.96934127807617, "global_step": 113753, "epoch": 940} {"train_loss": -37.74232864379883, "global_step": 113754, "epoch": 940} {"train_loss": -38.036495208740234, "global_step": 113755, "epoch": 940} {"train_loss": -36.74892044067383, "global_step": 113756, "epoch": 940} {"train_loss": -37.479095458984375, "global_step": 113757, "epoch": 940} {"train_loss": -38.277462005615234, "global_step": 113758, "epoch": 940} {"train_loss": -37.27150344848633, "global_step": 113759, "epoch": 940} {"train_loss": -30.424697875976562, "global_step": 113760, "epoch": 940} {"train_loss": -32.47677230834961, "global_step": 113761, "epoch": 940} {"train_loss": -36.887332916259766, "global_step": 113762, "epoch": 940} {"train_loss": -28.3541316986084, "global_step": 113763, "epoch": 940} {"train_loss": -35.78413391113281, "global_step": 113764, "epoch": 940} {"train_loss": -34.84906768798828, "global_step": 113765, "epoch": 940} {"train_loss": -31.73054313659668, "global_step": 113766, "epoch": 940} {"train_loss": -32.15131759643555, "global_step": 113767, "epoch": 940} {"train_loss": -35.471900939941406, "global_step": 113768, "epoch": 940} {"train_loss": -35.462501525878906, "global_step": 113769, "epoch": 940} {"train_loss": -36.76758575439453, "global_step": 113770, "epoch": 940} {"train_loss": -36.860042572021484, "global_step": 113771, "epoch": 940} {"train_loss": -17.795713424682617, "global_step": 113772, "epoch": 940} {"train_loss": -35.474857330322266, "global_step": 113773, "epoch": 940} {"train_loss": -35.93904495239258, "global_step": 113774, "epoch": 940} {"train_loss": -33.17095947265625, "global_step": 113775, "epoch": 940} {"train_loss": -33.226707458496094, "global_step": 113776, "epoch": 940} {"train_loss": -32.56062698364258, "global_step": 113777, "epoch": 940} {"train_loss": -35.74387741088867, "global_step": 113778, "epoch": 940} {"train_loss": -36.43375778198242, "global_step": 113779, "epoch": 940} {"train_loss": -33.99993896484375, "global_step": 113780, "epoch": 940} {"train_loss": -32.019466400146484, "global_step": 113781, "epoch": 940} {"train_loss": -36.061767578125, "global_step": 113782, "epoch": 940} {"train_loss": -35.396087646484375, "global_step": 113783, "epoch": 940} {"train_loss": -35.21113967895508, "global_step": 113784, "epoch": 940} {"train_loss": -36.790870666503906, "global_step": 113785, "epoch": 940} {"train_loss": -35.944820404052734, "global_step": 113786, "epoch": 940} {"train_loss": -36.90956497192383, "global_step": 113787, "epoch": 940} {"train_loss": -35.67855453491211, "global_step": 113788, "epoch": 940} {"train_loss": -37.0017204284668, "global_step": 113789, "epoch": 940} {"train_loss": -35.494686126708984, "global_step": 113790, "epoch": 940} {"train_loss": -36.35663986206055, "global_step": 113791, "epoch": 940} {"train_loss": -36.722328186035156, "global_step": 113792, "epoch": 940} {"train_loss": -37.40916061401367, "global_step": 113793, "epoch": 940} {"train_loss": -36.359619140625, "global_step": 113794, "epoch": 940} {"train_loss": -36.3004264831543, "global_step": 113795, "epoch": 940} {"train_loss": -36.036128997802734, "global_step": 113796, "epoch": 940} {"train_loss": -36.4991455078125, "global_step": 113797, "epoch": 940} {"train_loss": -37.18638610839844, "global_step": 113798, "epoch": 940} {"train_loss": -34.196693420410156, "global_step": 113799, "epoch": 940} {"train_loss": -36.47452926635742, "global_step": 113800, "epoch": 940} {"train_loss": -36.75899887084961, "global_step": 113801, "epoch": 940} {"train_loss": -36.86611557006836, "global_step": 113802, "epoch": 940} {"train_loss": -37.39484786987305, "global_step": 113803, "epoch": 940} {"train_loss": -37.23409652709961, "global_step": 113804, "epoch": 940} {"train_loss": -37.40366744995117, "global_step": 113805, "epoch": 940} {"train_loss": -37.591800689697266, "global_step": 113806, "epoch": 940} {"train_loss": -37.85883331298828, "global_step": 113807, "epoch": 940} {"train_loss": -37.65846633911133, "global_step": 113808, "epoch": 940} {"train_loss": -37.58494186401367, "global_step": 113809, "epoch": 940} {"train_loss": -37.42763900756836, "global_step": 113810, "epoch": 940} {"train_loss": -37.82784652709961, "global_step": 113811, "epoch": 940} {"train_loss": -38.00688934326172, "global_step": 113812, "epoch": 940} {"train_loss": -37.39873504638672, "global_step": 113813, "epoch": 940} {"train_loss": -37.93368148803711, "global_step": 113814, "epoch": 940} {"train_loss": -37.19525146484375, "global_step": 113815, "epoch": 940} {"train_loss": -37.69099044799805, "global_step": 113816, "epoch": 940} {"train_loss": -37.32437515258789, "global_step": 113817, "epoch": 940} {"train_loss": -38.37257766723633, "global_step": 113818, "epoch": 940} {"train_loss": -37.14550018310547, "global_step": 113819, "epoch": 940} {"train_loss": -38.31891632080078, "global_step": 113820, "epoch": 940} {"train_loss": -37.85663986206055, "global_step": 113821, "epoch": 940} {"train_loss": -38.267677307128906, "global_step": 113822, "epoch": 940} {"train_loss": -38.10268783569336, "global_step": 113823, "epoch": 940} {"train_loss": -37.714752197265625, "global_step": 113824, "epoch": 940} {"train_loss": -38.62101745605469, "global_step": 113825, "epoch": 940} {"train_loss": -38.48274612426758, "global_step": 113826, "epoch": 940} {"train_loss": -38.20835494995117, "global_step": 113827, "epoch": 940} {"train_loss": -38.367454528808594, "global_step": 113828, "epoch": 940} {"train_loss": -38.12761688232422, "global_step": 113829, "epoch": 940} {"train_loss": -38.62793731689453, "global_step": 113830, "epoch": 940} {"train_loss": -38.85490036010742, "global_step": 113831, "epoch": 940} {"train_loss": -38.1424674987793, "global_step": 113832, "epoch": 940} {"train_loss": -38.79499053955078, "global_step": 113833, "epoch": 940} {"train_loss": -38.663875579833984, "global_step": 113834, "epoch": 940} {"train_loss": -37.89875793457031, "global_step": 113835, "epoch": 940} {"train_loss": -38.35357666015625, "global_step": 113836, "epoch": 940} {"train_loss": -38.77827835083008, "global_step": 113837, "epoch": 940} {"train_loss": -38.69347381591797, "global_step": 113838, "epoch": 940} {"train_loss": -38.773895263671875, "global_step": 113839, "epoch": 940} {"train_loss": -38.73448944091797, "global_step": 113840, "epoch": 940} {"train_loss": -39.07296371459961, "global_step": 113841, "epoch": 940} {"train_loss": -38.605201721191406, "global_step": 113842, "epoch": 940} {"train_loss": -38.64765930175781, "global_step": 113843, "epoch": 940} {"train_loss": -38.4506950378418, "global_step": 113844, "epoch": 940} {"train_loss": -38.852561950683594, "global_step": 113845, "epoch": 940} {"train_loss": -39.18606185913086, "global_step": 113846, "epoch": 940} {"train_loss": -39.12364959716797, "global_step": 113847, "epoch": 940} {"train_loss": -39.483001708984375, "global_step": 113848, "epoch": 940} {"train_loss": -38.75846481323242, "global_step": 113849, "epoch": 940} {"train_loss": -38.06365966796875, "global_step": 113850, "epoch": 940} {"train_loss": -39.25681686401367, "global_step": 113851, "epoch": 940} {"train_loss": -39.24764633178711, "global_step": 113852, "epoch": 940} {"train_loss": -39.73329544067383, "global_step": 113853, "epoch": 940} {"train_loss": -39.10676956176758, "global_step": 113854, "epoch": 940} {"train_loss": -39.04899215698242, "global_step": 113855, "epoch": 940} {"train_loss": -39.1553955078125, "global_step": 113856, "epoch": 940} {"train_loss": -39.03306198120117, "global_step": 113857, "epoch": 940} {"train_loss": -39.30965042114258, "global_step": 113858, "epoch": 940} {"train_loss": -39.07533645629883, "global_step": 113859, "epoch": 940} {"train_loss": -37.038585836237125, "global_step": 113860, "epoch": 940, "val_loss": 2841963.0} {"train_loss": -39.196651458740234, "global_step": 113861, "epoch": 941} {"train_loss": -39.37310791015625, "global_step": 113862, "epoch": 941} {"train_loss": -39.71147155761719, "global_step": 113863, "epoch": 941} {"train_loss": -39.439632415771484, "global_step": 113864, "epoch": 941} {"train_loss": -39.65137481689453, "global_step": 113865, "epoch": 941} {"train_loss": -39.57978439331055, "global_step": 113866, "epoch": 941} {"train_loss": -39.75988006591797, "global_step": 113867, "epoch": 941} {"train_loss": -39.15625762939453, "global_step": 113868, "epoch": 941} {"train_loss": -38.60968780517578, "global_step": 113869, "epoch": 941} {"train_loss": -38.35704040527344, "global_step": 113870, "epoch": 941} {"train_loss": -37.91453170776367, "global_step": 113871, "epoch": 941} {"train_loss": -39.05646896362305, "global_step": 113872, "epoch": 941} {"train_loss": -38.309600830078125, "global_step": 113873, "epoch": 941} {"train_loss": -38.47440719604492, "global_step": 113874, "epoch": 941} {"train_loss": -36.00447082519531, "global_step": 113875, "epoch": 941} {"train_loss": -33.0264892578125, "global_step": 113876, "epoch": 941} {"train_loss": -34.906307220458984, "global_step": 113877, "epoch": 941} {"train_loss": -38.235694885253906, "global_step": 113878, "epoch": 941} {"train_loss": -38.89797592163086, "global_step": 113879, "epoch": 941} {"train_loss": -36.77157974243164, "global_step": 113880, "epoch": 941} {"train_loss": -34.63888931274414, "global_step": 113881, "epoch": 941} {"train_loss": -38.9086799621582, "global_step": 113882, "epoch": 941} {"train_loss": -35.46738052368164, "global_step": 113883, "epoch": 941} {"train_loss": -35.74613571166992, "global_step": 113884, "epoch": 941} {"train_loss": -38.70115280151367, "global_step": 113885, "epoch": 941} {"train_loss": -37.139034271240234, "global_step": 113886, "epoch": 941} {"train_loss": -38.610015869140625, "global_step": 113887, "epoch": 941} {"train_loss": -37.03500747680664, "global_step": 113888, "epoch": 941} {"train_loss": -37.519832611083984, "global_step": 113889, "epoch": 941} {"train_loss": -37.89289093017578, "global_step": 113890, "epoch": 941} {"train_loss": -38.17695236206055, "global_step": 113891, "epoch": 941} {"train_loss": -37.3017578125, "global_step": 113892, "epoch": 941} {"train_loss": -37.335670471191406, "global_step": 113893, "epoch": 941} {"train_loss": -38.74153137207031, "global_step": 113894, "epoch": 941} {"train_loss": -38.12211990356445, "global_step": 113895, "epoch": 941} {"train_loss": -37.9830436706543, "global_step": 113896, "epoch": 941} {"train_loss": -37.66752243041992, "global_step": 113897, "epoch": 941} {"train_loss": -38.33665084838867, "global_step": 113898, "epoch": 941} {"train_loss": -38.3323860168457, "global_step": 113899, "epoch": 941} {"train_loss": -38.562232971191406, "global_step": 113900, "epoch": 941} {"train_loss": -38.24935531616211, "global_step": 113901, "epoch": 941} {"train_loss": -38.563514709472656, "global_step": 113902, "epoch": 941} {"train_loss": -38.614315032958984, "global_step": 113903, "epoch": 941} {"train_loss": -38.669654846191406, "global_step": 113904, "epoch": 941} {"train_loss": -38.18855285644531, "global_step": 113905, "epoch": 941} {"train_loss": -37.63191604614258, "global_step": 113906, "epoch": 941} {"train_loss": -37.85608673095703, "global_step": 113907, "epoch": 941} {"train_loss": -38.897396087646484, "global_step": 113908, "epoch": 941} {"train_loss": -38.5867805480957, "global_step": 113909, "epoch": 941} {"train_loss": -37.2210578918457, "global_step": 113910, "epoch": 941} {"train_loss": -37.69232177734375, "global_step": 113911, "epoch": 941} {"train_loss": -38.822906494140625, "global_step": 113912, "epoch": 941} {"train_loss": -38.321651458740234, "global_step": 113913, "epoch": 941} {"train_loss": -38.3671875, "global_step": 113914, "epoch": 941} {"train_loss": -39.11090850830078, "global_step": 113915, "epoch": 941} {"train_loss": -38.662349700927734, "global_step": 113916, "epoch": 941} {"train_loss": -38.037105560302734, "global_step": 113917, "epoch": 941} {"train_loss": -38.72319412231445, "global_step": 113918, "epoch": 941} {"train_loss": -37.475006103515625, "global_step": 113919, "epoch": 941} {"train_loss": -37.072444915771484, "global_step": 113920, "epoch": 941} {"train_loss": -38.55424118041992, "global_step": 113921, "epoch": 941} {"train_loss": -38.1390380859375, "global_step": 113922, "epoch": 941} {"train_loss": -37.07908630371094, "global_step": 113923, "epoch": 941} {"train_loss": -38.45173263549805, "global_step": 113924, "epoch": 941} {"train_loss": -38.49549102783203, "global_step": 113925, "epoch": 941} {"train_loss": -38.27743148803711, "global_step": 113926, "epoch": 941} {"train_loss": -38.59904861450195, "global_step": 113927, "epoch": 941} {"train_loss": -38.79429244995117, "global_step": 113928, "epoch": 941} {"train_loss": -38.332889556884766, "global_step": 113929, "epoch": 941} {"train_loss": -38.43645095825195, "global_step": 113930, "epoch": 941} {"train_loss": -38.119815826416016, "global_step": 113931, "epoch": 941} {"train_loss": -37.408233642578125, "global_step": 113932, "epoch": 941} {"train_loss": -37.409481048583984, "global_step": 113933, "epoch": 941} {"train_loss": -38.25956344604492, "global_step": 113934, "epoch": 941} {"train_loss": -38.498470306396484, "global_step": 113935, "epoch": 941} {"train_loss": -37.389766693115234, "global_step": 113936, "epoch": 941} {"train_loss": -38.738037109375, "global_step": 113937, "epoch": 941} {"train_loss": -38.01570129394531, "global_step": 113938, "epoch": 941} {"train_loss": -38.14262008666992, "global_step": 113939, "epoch": 941} {"train_loss": -38.872615814208984, "global_step": 113940, "epoch": 941} {"train_loss": -38.38337707519531, "global_step": 113941, "epoch": 941} {"train_loss": -38.16218948364258, "global_step": 113942, "epoch": 941} {"train_loss": -37.66804885864258, "global_step": 113943, "epoch": 941} {"train_loss": -39.22251510620117, "global_step": 113944, "epoch": 941} {"train_loss": -38.89020919799805, "global_step": 113945, "epoch": 941} {"train_loss": -39.4837646484375, "global_step": 113946, "epoch": 941} {"train_loss": -38.86769485473633, "global_step": 113947, "epoch": 941} {"train_loss": -37.95338439941406, "global_step": 113948, "epoch": 941} {"train_loss": -39.50128936767578, "global_step": 113949, "epoch": 941} {"train_loss": -38.28596115112305, "global_step": 113950, "epoch": 941} {"train_loss": -38.89179229736328, "global_step": 113951, "epoch": 941} {"train_loss": -38.78554916381836, "global_step": 113952, "epoch": 941} {"train_loss": -37.83564376831055, "global_step": 113953, "epoch": 941} {"train_loss": -37.596435546875, "global_step": 113954, "epoch": 941} {"train_loss": -39.29111862182617, "global_step": 113955, "epoch": 941} {"train_loss": -39.330833435058594, "global_step": 113956, "epoch": 941} {"train_loss": -38.31629943847656, "global_step": 113957, "epoch": 941} {"train_loss": -38.22408676147461, "global_step": 113958, "epoch": 941} {"train_loss": -39.0554313659668, "global_step": 113959, "epoch": 941} {"train_loss": -38.33298873901367, "global_step": 113960, "epoch": 941} {"train_loss": -38.64567184448242, "global_step": 113961, "epoch": 941} {"train_loss": -38.53285598754883, "global_step": 113962, "epoch": 941} {"train_loss": -38.596824645996094, "global_step": 113963, "epoch": 941} {"train_loss": -38.14094924926758, "global_step": 113964, "epoch": 941} {"train_loss": -37.21657943725586, "global_step": 113965, "epoch": 941} {"train_loss": -39.268917083740234, "global_step": 113966, "epoch": 941} {"train_loss": -38.2104606628418, "global_step": 113967, "epoch": 941} {"train_loss": -38.810638427734375, "global_step": 113968, "epoch": 941} {"train_loss": -37.94524383544922, "global_step": 113969, "epoch": 941} {"train_loss": -38.855079650878906, "global_step": 113970, "epoch": 941} {"train_loss": -38.46148681640625, "global_step": 113971, "epoch": 941} {"train_loss": -39.18991470336914, "global_step": 113972, "epoch": 941} {"train_loss": -38.87812423706055, "global_step": 113973, "epoch": 941} {"train_loss": -39.154457092285156, "global_step": 113974, "epoch": 941} {"train_loss": -38.899566650390625, "global_step": 113975, "epoch": 941} {"train_loss": -39.267822265625, "global_step": 113976, "epoch": 941} {"train_loss": -38.893341064453125, "global_step": 113977, "epoch": 941} {"train_loss": -38.58906936645508, "global_step": 113978, "epoch": 941} {"train_loss": -38.4464111328125, "global_step": 113979, "epoch": 941} {"train_loss": -36.9788818359375, "global_step": 113980, "epoch": 941} {"train_loss": -38.2335049337592, "global_step": 113981, "epoch": 941, "val_loss": 2751971.75} {"train_loss": -35.24628829956055, "global_step": 113982, "epoch": 942} {"train_loss": -35.06175994873047, "global_step": 113983, "epoch": 942} {"train_loss": -34.15824508666992, "global_step": 113984, "epoch": 942} {"train_loss": -36.548255920410156, "global_step": 113985, "epoch": 942} {"train_loss": -39.56956481933594, "global_step": 113986, "epoch": 942} {"train_loss": -36.47782897949219, "global_step": 113987, "epoch": 942} {"train_loss": -38.082763671875, "global_step": 113988, "epoch": 942} {"train_loss": -38.45542526245117, "global_step": 113989, "epoch": 942} {"train_loss": -38.700958251953125, "global_step": 113990, "epoch": 942} {"train_loss": -38.03019332885742, "global_step": 113991, "epoch": 942} {"train_loss": -38.72237777709961, "global_step": 113992, "epoch": 942} {"train_loss": -39.052284240722656, "global_step": 113993, "epoch": 942} {"train_loss": -38.9508171081543, "global_step": 113994, "epoch": 942} {"train_loss": -39.351234436035156, "global_step": 113995, "epoch": 942} {"train_loss": -38.8498649597168, "global_step": 113996, "epoch": 942} {"train_loss": -39.35490036010742, "global_step": 113997, "epoch": 942} {"train_loss": -39.5946159362793, "global_step": 113998, "epoch": 942} {"train_loss": -39.58732223510742, "global_step": 113999, "epoch": 942} {"train_loss": -38.4980583190918, "global_step": 114000, "epoch": 942} {"train_loss": -39.397193908691406, "global_step": 114001, "epoch": 942} {"train_loss": -38.587703704833984, "global_step": 114002, "epoch": 942} {"train_loss": -38.947731018066406, "global_step": 114003, "epoch": 942} {"train_loss": -38.93107223510742, "global_step": 114004, "epoch": 942} {"train_loss": -37.5625, "global_step": 114005, "epoch": 942} {"train_loss": -38.81159591674805, "global_step": 114006, "epoch": 942} {"train_loss": -39.064186096191406, "global_step": 114007, "epoch": 942} {"train_loss": -38.94207763671875, "global_step": 114008, "epoch": 942} {"train_loss": -39.246150970458984, "global_step": 114009, "epoch": 942} {"train_loss": -38.617950439453125, "global_step": 114010, "epoch": 942} {"train_loss": -38.96037292480469, "global_step": 114011, "epoch": 942} {"train_loss": -39.420528411865234, "global_step": 114012, "epoch": 942} {"train_loss": -39.46358108520508, "global_step": 114013, "epoch": 942} {"train_loss": -39.029598236083984, "global_step": 114014, "epoch": 942} {"train_loss": -39.59237289428711, "global_step": 114015, "epoch": 942} {"train_loss": -38.942745208740234, "global_step": 114016, "epoch": 942} {"train_loss": -39.31232452392578, "global_step": 114017, "epoch": 942} {"train_loss": -39.650047302246094, "global_step": 114018, "epoch": 942} {"train_loss": -39.65400314331055, "global_step": 114019, "epoch": 942} {"train_loss": -38.94993209838867, "global_step": 114020, "epoch": 942} {"train_loss": -39.369564056396484, "global_step": 114021, "epoch": 942} {"train_loss": -39.52933883666992, "global_step": 114022, "epoch": 942} {"train_loss": -39.91610336303711, "global_step": 114023, "epoch": 942} {"train_loss": -39.58785629272461, "global_step": 114024, "epoch": 942} {"train_loss": -39.60647201538086, "global_step": 114025, "epoch": 942} {"train_loss": -40.0275993347168, "global_step": 114026, "epoch": 942} {"train_loss": -39.60786056518555, "global_step": 114027, "epoch": 942} {"train_loss": -39.81126022338867, "global_step": 114028, "epoch": 942} {"train_loss": -38.538509368896484, "global_step": 114029, "epoch": 942} {"train_loss": -39.9730339050293, "global_step": 114030, "epoch": 942} {"train_loss": -37.83160400390625, "global_step": 114031, "epoch": 942} {"train_loss": -38.900028228759766, "global_step": 114032, "epoch": 942} {"train_loss": -39.51870346069336, "global_step": 114033, "epoch": 942} {"train_loss": -37.86167526245117, "global_step": 114034, "epoch": 942} {"train_loss": -39.44529342651367, "global_step": 114035, "epoch": 942} {"train_loss": -38.045162200927734, "global_step": 114036, "epoch": 942} {"train_loss": -39.41008377075195, "global_step": 114037, "epoch": 942} {"train_loss": -39.19826126098633, "global_step": 114038, "epoch": 942} {"train_loss": -37.97489547729492, "global_step": 114039, "epoch": 942} {"train_loss": -39.234310150146484, "global_step": 114040, "epoch": 942} {"train_loss": -38.65743637084961, "global_step": 114041, "epoch": 942} {"train_loss": -39.10050582885742, "global_step": 114042, "epoch": 942} {"train_loss": -38.744720458984375, "global_step": 114043, "epoch": 942} {"train_loss": -38.848182678222656, "global_step": 114044, "epoch": 942} {"train_loss": -37.43593215942383, "global_step": 114045, "epoch": 942} {"train_loss": -36.36322021484375, "global_step": 114046, "epoch": 942} {"train_loss": -35.73777389526367, "global_step": 114047, "epoch": 942} {"train_loss": -37.70777893066406, "global_step": 114048, "epoch": 942} {"train_loss": -33.206356048583984, "global_step": 114049, "epoch": 942} {"train_loss": -30.34739112854004, "global_step": 114050, "epoch": 942} {"train_loss": -24.664825439453125, "global_step": 114051, "epoch": 942} {"train_loss": -22.457258224487305, "global_step": 114052, "epoch": 942} {"train_loss": -32.566829681396484, "global_step": 114053, "epoch": 942} {"train_loss": -34.834739685058594, "global_step": 114054, "epoch": 942} {"train_loss": -21.635101318359375, "global_step": 114055, "epoch": 942} {"train_loss": -33.5418586730957, "global_step": 114056, "epoch": 942} {"train_loss": -31.37135124206543, "global_step": 114057, "epoch": 942} {"train_loss": -32.24446487426758, "global_step": 114058, "epoch": 942} {"train_loss": -34.19792556762695, "global_step": 114059, "epoch": 942} {"train_loss": -34.97336959838867, "global_step": 114060, "epoch": 942} {"train_loss": -33.86603546142578, "global_step": 114061, "epoch": 942} {"train_loss": -37.01081466674805, "global_step": 114062, "epoch": 942} {"train_loss": -33.49508285522461, "global_step": 114063, "epoch": 942} {"train_loss": -37.52106475830078, "global_step": 114064, "epoch": 942} {"train_loss": -35.49436569213867, "global_step": 114065, "epoch": 942} {"train_loss": -36.379085540771484, "global_step": 114066, "epoch": 942} {"train_loss": -38.0007438659668, "global_step": 114067, "epoch": 942} {"train_loss": -36.4626350402832, "global_step": 114068, "epoch": 942} {"train_loss": -37.386295318603516, "global_step": 114069, "epoch": 942} {"train_loss": -37.87480926513672, "global_step": 114070, "epoch": 942} {"train_loss": -37.26079559326172, "global_step": 114071, "epoch": 942} {"train_loss": -37.65819549560547, "global_step": 114072, "epoch": 942} {"train_loss": -38.0250358581543, "global_step": 114073, "epoch": 942} {"train_loss": -37.825927734375, "global_step": 114074, "epoch": 942} {"train_loss": -38.22747802734375, "global_step": 114075, "epoch": 942} {"train_loss": -38.18276596069336, "global_step": 114076, "epoch": 942} {"train_loss": -37.7828369140625, "global_step": 114077, "epoch": 942} {"train_loss": -38.024505615234375, "global_step": 114078, "epoch": 942} {"train_loss": -38.22944259643555, "global_step": 114079, "epoch": 942} {"train_loss": -37.85910415649414, "global_step": 114080, "epoch": 942} {"train_loss": -38.66164779663086, "global_step": 114081, "epoch": 942} {"train_loss": -38.6380500793457, "global_step": 114082, "epoch": 942} {"train_loss": -38.22156524658203, "global_step": 114083, "epoch": 942} {"train_loss": -39.12554931640625, "global_step": 114084, "epoch": 942} {"train_loss": -38.233253479003906, "global_step": 114085, "epoch": 942} {"train_loss": -38.31937026977539, "global_step": 114086, "epoch": 942} {"train_loss": -38.8223762512207, "global_step": 114087, "epoch": 942} {"train_loss": -38.93905258178711, "global_step": 114088, "epoch": 942} {"train_loss": -37.98160934448242, "global_step": 114089, "epoch": 942} {"train_loss": -38.66144943237305, "global_step": 114090, "epoch": 942} {"train_loss": -38.889896392822266, "global_step": 114091, "epoch": 942} {"train_loss": -38.906036376953125, "global_step": 114092, "epoch": 942} {"train_loss": -39.4199104309082, "global_step": 114093, "epoch": 942} {"train_loss": -38.54315185546875, "global_step": 114094, "epoch": 942} {"train_loss": -39.391334533691406, "global_step": 114095, "epoch": 942} {"train_loss": -39.480010986328125, "global_step": 114096, "epoch": 942} {"train_loss": -39.24790954589844, "global_step": 114097, "epoch": 942} {"train_loss": -39.06733322143555, "global_step": 114098, "epoch": 942} {"train_loss": -39.03668212890625, "global_step": 114099, "epoch": 942} {"train_loss": -37.649288177490234, "global_step": 114100, "epoch": 942} {"train_loss": -39.25326156616211, "global_step": 114101, "epoch": 942} {"train_loss": -37.61862114835377, "global_step": 114102, "epoch": 942, "val_loss": 2738568.0} {"train_loss": -39.46073532104492, "global_step": 114103, "epoch": 943} {"train_loss": -39.25782012939453, "global_step": 114104, "epoch": 943} {"train_loss": -39.521297454833984, "global_step": 114105, "epoch": 943} {"train_loss": -39.2178955078125, "global_step": 114106, "epoch": 943} {"train_loss": -39.49065399169922, "global_step": 114107, "epoch": 943} {"train_loss": -39.48335647583008, "global_step": 114108, "epoch": 943} {"train_loss": -39.31893539428711, "global_step": 114109, "epoch": 943} {"train_loss": -39.54796600341797, "global_step": 114110, "epoch": 943} {"train_loss": -39.525142669677734, "global_step": 114111, "epoch": 943} {"train_loss": -39.6936149597168, "global_step": 114112, "epoch": 943} {"train_loss": -39.77414321899414, "global_step": 114113, "epoch": 943} {"train_loss": -39.740020751953125, "global_step": 114114, "epoch": 943} {"train_loss": -39.5388298034668, "global_step": 114115, "epoch": 943} {"train_loss": -39.7092170715332, "global_step": 114116, "epoch": 943} {"train_loss": -39.67168426513672, "global_step": 114117, "epoch": 943} {"train_loss": -39.47522735595703, "global_step": 114118, "epoch": 943} {"train_loss": -39.44068145751953, "global_step": 114119, "epoch": 943} {"train_loss": -39.26007843017578, "global_step": 114120, "epoch": 943} {"train_loss": -39.651039123535156, "global_step": 114121, "epoch": 943} {"train_loss": -39.39129638671875, "global_step": 114122, "epoch": 943} {"train_loss": -39.639991760253906, "global_step": 114123, "epoch": 943} {"train_loss": -40.24081039428711, "global_step": 114124, "epoch": 943} {"train_loss": -39.9227294921875, "global_step": 114125, "epoch": 943} {"train_loss": -40.12148666381836, "global_step": 114126, "epoch": 943} {"train_loss": -40.25213623046875, "global_step": 114127, "epoch": 943} {"train_loss": -40.22614288330078, "global_step": 114128, "epoch": 943} {"train_loss": -39.59033203125, "global_step": 114129, "epoch": 943} {"train_loss": -40.16880416870117, "global_step": 114130, "epoch": 943} {"train_loss": -40.14146041870117, "global_step": 114131, "epoch": 943} {"train_loss": -40.087501525878906, "global_step": 114132, "epoch": 943} {"train_loss": -40.3435173034668, "global_step": 114133, "epoch": 943} {"train_loss": -40.247127532958984, "global_step": 114134, "epoch": 943} {"train_loss": -39.9698600769043, "global_step": 114135, "epoch": 943} {"train_loss": -39.48783493041992, "global_step": 114136, "epoch": 943} {"train_loss": -36.87543869018555, "global_step": 114137, "epoch": 943} {"train_loss": -34.90555953979492, "global_step": 114138, "epoch": 943} {"train_loss": -35.970916748046875, "global_step": 114139, "epoch": 943} {"train_loss": -35.82197952270508, "global_step": 114140, "epoch": 943} {"train_loss": -34.12769317626953, "global_step": 114141, "epoch": 943} {"train_loss": -35.63068771362305, "global_step": 114142, "epoch": 943} {"train_loss": -33.78829574584961, "global_step": 114143, "epoch": 943} {"train_loss": -34.073143005371094, "global_step": 114144, "epoch": 943} {"train_loss": -35.96266555786133, "global_step": 114145, "epoch": 943} {"train_loss": -35.42128372192383, "global_step": 114146, "epoch": 943} {"train_loss": -37.292274475097656, "global_step": 114147, "epoch": 943} {"train_loss": -39.13411331176758, "global_step": 114148, "epoch": 943} {"train_loss": -37.80192947387695, "global_step": 114149, "epoch": 943} {"train_loss": -37.591766357421875, "global_step": 114150, "epoch": 943} {"train_loss": -37.97758483886719, "global_step": 114151, "epoch": 943} {"train_loss": -38.66868209838867, "global_step": 114152, "epoch": 943} {"train_loss": -38.21102523803711, "global_step": 114153, "epoch": 943} {"train_loss": -38.130821228027344, "global_step": 114154, "epoch": 943} {"train_loss": -39.155067443847656, "global_step": 114155, "epoch": 943} {"train_loss": -38.48887252807617, "global_step": 114156, "epoch": 943} {"train_loss": -39.14850616455078, "global_step": 114157, "epoch": 943} {"train_loss": -38.578250885009766, "global_step": 114158, "epoch": 943} {"train_loss": -38.98525619506836, "global_step": 114159, "epoch": 943} {"train_loss": -38.92414093017578, "global_step": 114160, "epoch": 943} {"train_loss": -38.99101257324219, "global_step": 114161, "epoch": 943} {"train_loss": -39.44002151489258, "global_step": 114162, "epoch": 943} {"train_loss": -39.1278076171875, "global_step": 114163, "epoch": 943} {"train_loss": -39.39667510986328, "global_step": 114164, "epoch": 943} {"train_loss": -39.11882781982422, "global_step": 114165, "epoch": 943} {"train_loss": -39.280555725097656, "global_step": 114166, "epoch": 943} {"train_loss": -38.912940979003906, "global_step": 114167, "epoch": 943} {"train_loss": -38.94455337524414, "global_step": 114168, "epoch": 943} {"train_loss": -39.42911911010742, "global_step": 114169, "epoch": 943} {"train_loss": -39.35957717895508, "global_step": 114170, "epoch": 943} {"train_loss": -39.396034240722656, "global_step": 114171, "epoch": 943} {"train_loss": -38.96540451049805, "global_step": 114172, "epoch": 943} {"train_loss": -38.39473342895508, "global_step": 114173, "epoch": 943} {"train_loss": -39.33674240112305, "global_step": 114174, "epoch": 943} {"train_loss": -39.187496185302734, "global_step": 114175, "epoch": 943} {"train_loss": -38.31219482421875, "global_step": 114176, "epoch": 943} {"train_loss": -39.563018798828125, "global_step": 114177, "epoch": 943} {"train_loss": -38.907230377197266, "global_step": 114178, "epoch": 943} {"train_loss": -39.224002838134766, "global_step": 114179, "epoch": 943} {"train_loss": -40.00959014892578, "global_step": 114180, "epoch": 943} {"train_loss": -39.25688171386719, "global_step": 114181, "epoch": 943} {"train_loss": -37.73350143432617, "global_step": 114182, "epoch": 943} {"train_loss": -37.79446029663086, "global_step": 114183, "epoch": 943} {"train_loss": -38.379302978515625, "global_step": 114184, "epoch": 943} {"train_loss": -39.10651779174805, "global_step": 114185, "epoch": 943} {"train_loss": -37.53556442260742, "global_step": 114186, "epoch": 943} {"train_loss": -37.80475616455078, "global_step": 114187, "epoch": 943} {"train_loss": -39.07255935668945, "global_step": 114188, "epoch": 943} {"train_loss": -37.958770751953125, "global_step": 114189, "epoch": 943} {"train_loss": -35.44813919067383, "global_step": 114190, "epoch": 943} {"train_loss": -38.61409378051758, "global_step": 114191, "epoch": 943} {"train_loss": -38.0854377746582, "global_step": 114192, "epoch": 943} {"train_loss": -37.55031967163086, "global_step": 114193, "epoch": 943} {"train_loss": -38.8520393371582, "global_step": 114194, "epoch": 943} {"train_loss": -37.49921798706055, "global_step": 114195, "epoch": 943} {"train_loss": -38.04623031616211, "global_step": 114196, "epoch": 943} {"train_loss": -38.5539436340332, "global_step": 114197, "epoch": 943} {"train_loss": -38.11434555053711, "global_step": 114198, "epoch": 943} {"train_loss": -39.12778854370117, "global_step": 114199, "epoch": 943} {"train_loss": -38.012813568115234, "global_step": 114200, "epoch": 943} {"train_loss": -39.54566955566406, "global_step": 114201, "epoch": 943} {"train_loss": -37.805179595947266, "global_step": 114202, "epoch": 943} {"train_loss": -39.34560775756836, "global_step": 114203, "epoch": 943} {"train_loss": -38.08012771606445, "global_step": 114204, "epoch": 943} {"train_loss": -39.15140914916992, "global_step": 114205, "epoch": 943} {"train_loss": -38.74163818359375, "global_step": 114206, "epoch": 943} {"train_loss": -38.38229751586914, "global_step": 114207, "epoch": 943} {"train_loss": -39.05922317504883, "global_step": 114208, "epoch": 943} {"train_loss": -38.78923034667969, "global_step": 114209, "epoch": 943} {"train_loss": -39.153045654296875, "global_step": 114210, "epoch": 943} {"train_loss": -39.34559631347656, "global_step": 114211, "epoch": 943} {"train_loss": -38.86851501464844, "global_step": 114212, "epoch": 943} {"train_loss": -39.20849609375, "global_step": 114213, "epoch": 943} {"train_loss": -39.54110336303711, "global_step": 114214, "epoch": 943} {"train_loss": -38.24049758911133, "global_step": 114215, "epoch": 943} {"train_loss": -39.010005950927734, "global_step": 114216, "epoch": 943} {"train_loss": -39.38862228393555, "global_step": 114217, "epoch": 943} {"train_loss": -39.55772018432617, "global_step": 114218, "epoch": 943} {"train_loss": -39.328975677490234, "global_step": 114219, "epoch": 943} {"train_loss": -39.15383529663086, "global_step": 114220, "epoch": 943} {"train_loss": -39.38065719604492, "global_step": 114221, "epoch": 943} {"train_loss": -38.861900329589844, "global_step": 114222, "epoch": 943} {"train_loss": -38.71088046869956, "global_step": 114223, "epoch": 943, "val_loss": 2753370.75} {"train_loss": -39.36199951171875, "global_step": 114224, "epoch": 944} {"train_loss": -40.2969970703125, "global_step": 114225, "epoch": 944} {"train_loss": -39.61790084838867, "global_step": 114226, "epoch": 944} {"train_loss": -39.535457611083984, "global_step": 114227, "epoch": 944} {"train_loss": -39.05731964111328, "global_step": 114228, "epoch": 944} {"train_loss": -39.38932418823242, "global_step": 114229, "epoch": 944} {"train_loss": -39.52077102661133, "global_step": 114230, "epoch": 944} {"train_loss": -39.48215866088867, "global_step": 114231, "epoch": 944} {"train_loss": -39.64193344116211, "global_step": 114232, "epoch": 944} {"train_loss": -39.4649658203125, "global_step": 114233, "epoch": 944} {"train_loss": -39.650665283203125, "global_step": 114234, "epoch": 944} {"train_loss": -39.26424026489258, "global_step": 114235, "epoch": 944} {"train_loss": -39.171356201171875, "global_step": 114236, "epoch": 944} {"train_loss": -39.900081634521484, "global_step": 114237, "epoch": 944} {"train_loss": -38.5485954284668, "global_step": 114238, "epoch": 944} {"train_loss": -38.773406982421875, "global_step": 114239, "epoch": 944} {"train_loss": -39.021183013916016, "global_step": 114240, "epoch": 944} {"train_loss": -38.36534118652344, "global_step": 114241, "epoch": 944} {"train_loss": -38.2063102722168, "global_step": 114242, "epoch": 944} {"train_loss": -37.91941452026367, "global_step": 114243, "epoch": 944} {"train_loss": -39.3905029296875, "global_step": 114244, "epoch": 944} {"train_loss": -39.114654541015625, "global_step": 114245, "epoch": 944} {"train_loss": -38.60463333129883, "global_step": 114246, "epoch": 944} {"train_loss": -34.694244384765625, "global_step": 114247, "epoch": 944} {"train_loss": -32.041015625, "global_step": 114248, "epoch": 944} {"train_loss": -32.30967330932617, "global_step": 114249, "epoch": 944} {"train_loss": -37.71620178222656, "global_step": 114250, "epoch": 944} {"train_loss": -38.6702880859375, "global_step": 114251, "epoch": 944} {"train_loss": -37.65686798095703, "global_step": 114252, "epoch": 944} {"train_loss": -38.57041549682617, "global_step": 114253, "epoch": 944} {"train_loss": -38.37137222290039, "global_step": 114254, "epoch": 944} {"train_loss": -38.3452033996582, "global_step": 114255, "epoch": 944} {"train_loss": -37.994693756103516, "global_step": 114256, "epoch": 944} {"train_loss": -37.84385681152344, "global_step": 114257, "epoch": 944} {"train_loss": -37.40032196044922, "global_step": 114258, "epoch": 944} {"train_loss": -38.07780075073242, "global_step": 114259, "epoch": 944} {"train_loss": -37.89083480834961, "global_step": 114260, "epoch": 944} {"train_loss": -38.64257049560547, "global_step": 114261, "epoch": 944} {"train_loss": -39.38956832885742, "global_step": 114262, "epoch": 944} {"train_loss": -39.124027252197266, "global_step": 114263, "epoch": 944} {"train_loss": -39.33837127685547, "global_step": 114264, "epoch": 944} {"train_loss": -39.31153106689453, "global_step": 114265, "epoch": 944} {"train_loss": -39.066261291503906, "global_step": 114266, "epoch": 944} {"train_loss": -39.51264190673828, "global_step": 114267, "epoch": 944} {"train_loss": -38.96550369262695, "global_step": 114268, "epoch": 944} {"train_loss": -39.42558288574219, "global_step": 114269, "epoch": 944} {"train_loss": -39.25654983520508, "global_step": 114270, "epoch": 944} {"train_loss": -37.62033462524414, "global_step": 114271, "epoch": 944} {"train_loss": -39.22240447998047, "global_step": 114272, "epoch": 944} {"train_loss": -38.35488510131836, "global_step": 114273, "epoch": 944} {"train_loss": -38.80768966674805, "global_step": 114274, "epoch": 944} {"train_loss": -38.25893783569336, "global_step": 114275, "epoch": 944} {"train_loss": -37.41276931762695, "global_step": 114276, "epoch": 944} {"train_loss": -35.762306213378906, "global_step": 114277, "epoch": 944} {"train_loss": -39.26829147338867, "global_step": 114278, "epoch": 944} {"train_loss": -39.794158935546875, "global_step": 114279, "epoch": 944} {"train_loss": -38.74827194213867, "global_step": 114280, "epoch": 944} {"train_loss": -38.66858673095703, "global_step": 114281, "epoch": 944} {"train_loss": -39.52294921875, "global_step": 114282, "epoch": 944} {"train_loss": -38.478729248046875, "global_step": 114283, "epoch": 944} {"train_loss": -39.96648406982422, "global_step": 114284, "epoch": 944} {"train_loss": -39.77263259887695, "global_step": 114285, "epoch": 944} {"train_loss": -38.18056106567383, "global_step": 114286, "epoch": 944} {"train_loss": -39.32537078857422, "global_step": 114287, "epoch": 944} {"train_loss": -39.11919021606445, "global_step": 114288, "epoch": 944} {"train_loss": -39.5846061706543, "global_step": 114289, "epoch": 944} {"train_loss": -39.842960357666016, "global_step": 114290, "epoch": 944} {"train_loss": -39.78679275512695, "global_step": 114291, "epoch": 944} {"train_loss": -39.90818786621094, "global_step": 114292, "epoch": 944} {"train_loss": -38.535892486572266, "global_step": 114293, "epoch": 944} {"train_loss": -39.923709869384766, "global_step": 114294, "epoch": 944} {"train_loss": -40.04741668701172, "global_step": 114295, "epoch": 944} {"train_loss": -39.884517669677734, "global_step": 114296, "epoch": 944} {"train_loss": -39.8137321472168, "global_step": 114297, "epoch": 944} {"train_loss": -39.23897933959961, "global_step": 114298, "epoch": 944} {"train_loss": -39.217716217041016, "global_step": 114299, "epoch": 944} {"train_loss": -40.08429718017578, "global_step": 114300, "epoch": 944} {"train_loss": -39.25531005859375, "global_step": 114301, "epoch": 944} {"train_loss": -38.53371047973633, "global_step": 114302, "epoch": 944} {"train_loss": -38.557350158691406, "global_step": 114303, "epoch": 944} {"train_loss": -37.4608039855957, "global_step": 114304, "epoch": 944} {"train_loss": -35.609954833984375, "global_step": 114305, "epoch": 944} {"train_loss": -39.729942321777344, "global_step": 114306, "epoch": 944} {"train_loss": -39.2310791015625, "global_step": 114307, "epoch": 944} {"train_loss": -34.65214157104492, "global_step": 114308, "epoch": 944} {"train_loss": -37.440120697021484, "global_step": 114309, "epoch": 944} {"train_loss": -39.242881774902344, "global_step": 114310, "epoch": 944} {"train_loss": -37.159786224365234, "global_step": 114311, "epoch": 944} {"train_loss": -37.737770080566406, "global_step": 114312, "epoch": 944} {"train_loss": -38.587371826171875, "global_step": 114313, "epoch": 944} {"train_loss": -37.260986328125, "global_step": 114314, "epoch": 944} {"train_loss": -37.386959075927734, "global_step": 114315, "epoch": 944} {"train_loss": -37.207740783691406, "global_step": 114316, "epoch": 944} {"train_loss": -37.635894775390625, "global_step": 114317, "epoch": 944} {"train_loss": -36.306053161621094, "global_step": 114318, "epoch": 944} {"train_loss": -37.07688903808594, "global_step": 114319, "epoch": 944} {"train_loss": -37.69313049316406, "global_step": 114320, "epoch": 944} {"train_loss": -36.57607650756836, "global_step": 114321, "epoch": 944} {"train_loss": -37.191158294677734, "global_step": 114322, "epoch": 944} {"train_loss": -34.03388977050781, "global_step": 114323, "epoch": 944} {"train_loss": -37.23809814453125, "global_step": 114324, "epoch": 944} {"train_loss": -35.11750411987305, "global_step": 114325, "epoch": 944} {"train_loss": -37.8181266784668, "global_step": 114326, "epoch": 944} {"train_loss": -36.44065475463867, "global_step": 114327, "epoch": 944} {"train_loss": -30.102319717407227, "global_step": 114328, "epoch": 944} {"train_loss": -34.088985443115234, "global_step": 114329, "epoch": 944} {"train_loss": -31.088001251220703, "global_step": 114330, "epoch": 944} {"train_loss": -34.78885269165039, "global_step": 114331, "epoch": 944} {"train_loss": -33.71788024902344, "global_step": 114332, "epoch": 944} {"train_loss": -33.068668365478516, "global_step": 114333, "epoch": 944} {"train_loss": -33.37693405151367, "global_step": 114334, "epoch": 944} {"train_loss": -34.424774169921875, "global_step": 114335, "epoch": 944} {"train_loss": -32.29224395751953, "global_step": 114336, "epoch": 944} {"train_loss": -33.95207595825195, "global_step": 114337, "epoch": 944} {"train_loss": -32.45272445678711, "global_step": 114338, "epoch": 944} {"train_loss": -33.29812240600586, "global_step": 114339, "epoch": 944} {"train_loss": -34.94427490234375, "global_step": 114340, "epoch": 944} {"train_loss": -34.73138427734375, "global_step": 114341, "epoch": 944} {"train_loss": -34.8661994934082, "global_step": 114342, "epoch": 944} {"train_loss": -34.98707962036133, "global_step": 114343, "epoch": 944} {"train_loss": -37.71283502815184, "global_step": 114344, "epoch": 944, "val_loss": 2827734.0} {"train_loss": -35.75356674194336, "global_step": 114345, "epoch": 945} {"train_loss": -34.15426254272461, "global_step": 114346, "epoch": 945} {"train_loss": -33.767879486083984, "global_step": 114347, "epoch": 945} {"train_loss": -35.8012809753418, "global_step": 114348, "epoch": 945} {"train_loss": -36.31477355957031, "global_step": 114349, "epoch": 945} {"train_loss": -36.02389907836914, "global_step": 114350, "epoch": 945} {"train_loss": -36.47917938232422, "global_step": 114351, "epoch": 945} {"train_loss": -36.11302185058594, "global_step": 114352, "epoch": 945} {"train_loss": -36.34852981567383, "global_step": 114353, "epoch": 945} {"train_loss": -36.45050048828125, "global_step": 114354, "epoch": 945} {"train_loss": -36.659725189208984, "global_step": 114355, "epoch": 945} {"train_loss": -35.30990219116211, "global_step": 114356, "epoch": 945} {"train_loss": -36.85749053955078, "global_step": 114357, "epoch": 945} {"train_loss": -36.929466247558594, "global_step": 114358, "epoch": 945} {"train_loss": -35.93398666381836, "global_step": 114359, "epoch": 945} {"train_loss": -36.5956916809082, "global_step": 114360, "epoch": 945} {"train_loss": -36.84697723388672, "global_step": 114361, "epoch": 945} {"train_loss": -37.02511215209961, "global_step": 114362, "epoch": 945} {"train_loss": -37.63986587524414, "global_step": 114363, "epoch": 945} {"train_loss": -36.96671676635742, "global_step": 114364, "epoch": 945} {"train_loss": -36.991371154785156, "global_step": 114365, "epoch": 945} {"train_loss": -35.855918884277344, "global_step": 114366, "epoch": 945} {"train_loss": -37.60250473022461, "global_step": 114367, "epoch": 945} {"train_loss": -37.16135025024414, "global_step": 114368, "epoch": 945} {"train_loss": -37.3183708190918, "global_step": 114369, "epoch": 945} {"train_loss": -37.37932586669922, "global_step": 114370, "epoch": 945} {"train_loss": -37.71975326538086, "global_step": 114371, "epoch": 945} {"train_loss": -37.59428024291992, "global_step": 114372, "epoch": 945} {"train_loss": -38.26996612548828, "global_step": 114373, "epoch": 945} {"train_loss": -37.5544319152832, "global_step": 114374, "epoch": 945} {"train_loss": -38.0034294128418, "global_step": 114375, "epoch": 945} {"train_loss": -37.40232467651367, "global_step": 114376, "epoch": 945} {"train_loss": -37.87895584106445, "global_step": 114377, "epoch": 945} {"train_loss": -36.950050354003906, "global_step": 114378, "epoch": 945} {"train_loss": -37.92998123168945, "global_step": 114379, "epoch": 945} {"train_loss": -37.95322799682617, "global_step": 114380, "epoch": 945} {"train_loss": -37.417335510253906, "global_step": 114381, "epoch": 945} {"train_loss": -38.08210372924805, "global_step": 114382, "epoch": 945} {"train_loss": -37.721370697021484, "global_step": 114383, "epoch": 945} {"train_loss": -37.82426071166992, "global_step": 114384, "epoch": 945} {"train_loss": -37.430259704589844, "global_step": 114385, "epoch": 945} {"train_loss": -37.81758499145508, "global_step": 114386, "epoch": 945} {"train_loss": -38.0349006652832, "global_step": 114387, "epoch": 945} {"train_loss": -38.36502456665039, "global_step": 114388, "epoch": 945} {"train_loss": -38.80930709838867, "global_step": 114389, "epoch": 945} {"train_loss": -38.187644958496094, "global_step": 114390, "epoch": 945} {"train_loss": -38.43429183959961, "global_step": 114391, "epoch": 945} {"train_loss": -39.03399658203125, "global_step": 114392, "epoch": 945} {"train_loss": -38.46688461303711, "global_step": 114393, "epoch": 945} {"train_loss": -38.25613021850586, "global_step": 114394, "epoch": 945} {"train_loss": -37.916717529296875, "global_step": 114395, "epoch": 945} {"train_loss": -38.25725173950195, "global_step": 114396, "epoch": 945} {"train_loss": -37.922157287597656, "global_step": 114397, "epoch": 945} {"train_loss": -38.654293060302734, "global_step": 114398, "epoch": 945} {"train_loss": -38.859153747558594, "global_step": 114399, "epoch": 945} {"train_loss": -38.23921585083008, "global_step": 114400, "epoch": 945} {"train_loss": -38.03701400756836, "global_step": 114401, "epoch": 945} {"train_loss": -39.012813568115234, "global_step": 114402, "epoch": 945} {"train_loss": -39.03173828125, "global_step": 114403, "epoch": 945} {"train_loss": -38.05002975463867, "global_step": 114404, "epoch": 945} {"train_loss": -38.67426300048828, "global_step": 114405, "epoch": 945} {"train_loss": -38.287776947021484, "global_step": 114406, "epoch": 945} {"train_loss": -38.63916015625, "global_step": 114407, "epoch": 945} {"train_loss": -38.56084060668945, "global_step": 114408, "epoch": 945} {"train_loss": -38.87345504760742, "global_step": 114409, "epoch": 945} {"train_loss": -39.4114875793457, "global_step": 114410, "epoch": 945} {"train_loss": -39.34695053100586, "global_step": 114411, "epoch": 945} {"train_loss": -39.16720199584961, "global_step": 114412, "epoch": 945} {"train_loss": -39.022003173828125, "global_step": 114413, "epoch": 945} {"train_loss": -39.386287689208984, "global_step": 114414, "epoch": 945} {"train_loss": -38.977622985839844, "global_step": 114415, "epoch": 945} {"train_loss": -38.31725311279297, "global_step": 114416, "epoch": 945} {"train_loss": -39.731502532958984, "global_step": 114417, "epoch": 945} {"train_loss": -39.600563049316406, "global_step": 114418, "epoch": 945} {"train_loss": -39.68669509887695, "global_step": 114419, "epoch": 945} {"train_loss": -39.51856231689453, "global_step": 114420, "epoch": 945} {"train_loss": -39.93339157104492, "global_step": 114421, "epoch": 945} {"train_loss": -39.889503479003906, "global_step": 114422, "epoch": 945} {"train_loss": -38.9182243347168, "global_step": 114423, "epoch": 945} {"train_loss": -38.8173828125, "global_step": 114424, "epoch": 945} {"train_loss": -39.42408752441406, "global_step": 114425, "epoch": 945} {"train_loss": -38.04035568237305, "global_step": 114426, "epoch": 945} {"train_loss": -38.99005889892578, "global_step": 114427, "epoch": 945} {"train_loss": -37.727989196777344, "global_step": 114428, "epoch": 945} {"train_loss": -38.59645462036133, "global_step": 114429, "epoch": 945} {"train_loss": -37.771480560302734, "global_step": 114430, "epoch": 945} {"train_loss": -36.84940719604492, "global_step": 114431, "epoch": 945} {"train_loss": -34.45193099975586, "global_step": 114432, "epoch": 945} {"train_loss": -31.4235782623291, "global_step": 114433, "epoch": 945} {"train_loss": -34.61549377441406, "global_step": 114434, "epoch": 945} {"train_loss": -37.172359466552734, "global_step": 114435, "epoch": 945} {"train_loss": -35.65205764770508, "global_step": 114436, "epoch": 945} {"train_loss": -36.672725677490234, "global_step": 114437, "epoch": 945} {"train_loss": -38.70355224609375, "global_step": 114438, "epoch": 945} {"train_loss": -39.16851043701172, "global_step": 114439, "epoch": 945} {"train_loss": -36.89241409301758, "global_step": 114440, "epoch": 945} {"train_loss": -36.14434814453125, "global_step": 114441, "epoch": 945} {"train_loss": -32.7179069519043, "global_step": 114442, "epoch": 945} {"train_loss": -33.19367218017578, "global_step": 114443, "epoch": 945} {"train_loss": -34.57378005981445, "global_step": 114444, "epoch": 945} {"train_loss": -37.96026611328125, "global_step": 114445, "epoch": 945} {"train_loss": -39.1627311706543, "global_step": 114446, "epoch": 945} {"train_loss": -36.02961349487305, "global_step": 114447, "epoch": 945} {"train_loss": -37.99409866333008, "global_step": 114448, "epoch": 945} {"train_loss": -37.68314743041992, "global_step": 114449, "epoch": 945} {"train_loss": -37.14175033569336, "global_step": 114450, "epoch": 945} {"train_loss": -36.060272216796875, "global_step": 114451, "epoch": 945} {"train_loss": -38.73856735229492, "global_step": 114452, "epoch": 945} {"train_loss": -36.74814224243164, "global_step": 114453, "epoch": 945} {"train_loss": -37.88818359375, "global_step": 114454, "epoch": 945} {"train_loss": -38.2437744140625, "global_step": 114455, "epoch": 945} {"train_loss": -37.85871124267578, "global_step": 114456, "epoch": 945} {"train_loss": -37.44630813598633, "global_step": 114457, "epoch": 945} {"train_loss": -38.659332275390625, "global_step": 114458, "epoch": 945} {"train_loss": -38.55690383911133, "global_step": 114459, "epoch": 945} {"train_loss": -39.04905319213867, "global_step": 114460, "epoch": 945} {"train_loss": -38.5827751159668, "global_step": 114461, "epoch": 945} {"train_loss": -38.323001861572266, "global_step": 114462, "epoch": 945} {"train_loss": -38.901283264160156, "global_step": 114463, "epoch": 945} {"train_loss": -39.172386169433594, "global_step": 114464, "epoch": 945} {"train_loss": -37.61585593420612, "global_step": 114465, "epoch": 945, "val_loss": 2750759.25} {"train_loss": -38.9757080078125, "global_step": 114466, "epoch": 946} {"train_loss": -38.67169952392578, "global_step": 114467, "epoch": 946} {"train_loss": -38.84463882446289, "global_step": 114468, "epoch": 946} {"train_loss": -39.6195068359375, "global_step": 114469, "epoch": 946} {"train_loss": -39.52872085571289, "global_step": 114470, "epoch": 946} {"train_loss": -38.78013229370117, "global_step": 114471, "epoch": 946} {"train_loss": -38.00202178955078, "global_step": 114472, "epoch": 946} {"train_loss": -38.77313232421875, "global_step": 114473, "epoch": 946} {"train_loss": -39.30583572387695, "global_step": 114474, "epoch": 946} {"train_loss": -36.8368034362793, "global_step": 114475, "epoch": 946} {"train_loss": -38.68775939941406, "global_step": 114476, "epoch": 946} {"train_loss": -39.26027297973633, "global_step": 114477, "epoch": 946} {"train_loss": -39.1485710144043, "global_step": 114478, "epoch": 946} {"train_loss": -39.00999069213867, "global_step": 114479, "epoch": 946} {"train_loss": -39.4081916809082, "global_step": 114480, "epoch": 946} {"train_loss": -38.81729507446289, "global_step": 114481, "epoch": 946} {"train_loss": -39.51119613647461, "global_step": 114482, "epoch": 946} {"train_loss": -39.1732292175293, "global_step": 114483, "epoch": 946} {"train_loss": -39.20981979370117, "global_step": 114484, "epoch": 946} {"train_loss": -39.114593505859375, "global_step": 114485, "epoch": 946} {"train_loss": -38.57501983642578, "global_step": 114486, "epoch": 946} {"train_loss": -39.03367233276367, "global_step": 114487, "epoch": 946} {"train_loss": -39.9980354309082, "global_step": 114488, "epoch": 946} {"train_loss": -39.79928207397461, "global_step": 114489, "epoch": 946} {"train_loss": -39.94330978393555, "global_step": 114490, "epoch": 946} {"train_loss": -39.16284942626953, "global_step": 114491, "epoch": 946} {"train_loss": -39.09566879272461, "global_step": 114492, "epoch": 946} {"train_loss": -39.688209533691406, "global_step": 114493, "epoch": 946} {"train_loss": -37.96734619140625, "global_step": 114494, "epoch": 946} {"train_loss": -38.35548782348633, "global_step": 114495, "epoch": 946} {"train_loss": -39.315879821777344, "global_step": 114496, "epoch": 946} {"train_loss": -37.766475677490234, "global_step": 114497, "epoch": 946} {"train_loss": -38.4438591003418, "global_step": 114498, "epoch": 946} {"train_loss": -37.21079635620117, "global_step": 114499, "epoch": 946} {"train_loss": -39.1524543762207, "global_step": 114500, "epoch": 946} {"train_loss": -38.60256576538086, "global_step": 114501, "epoch": 946} {"train_loss": -37.61489486694336, "global_step": 114502, "epoch": 946} {"train_loss": -37.74411392211914, "global_step": 114503, "epoch": 946} {"train_loss": -38.396053314208984, "global_step": 114504, "epoch": 946} {"train_loss": -38.34013748168945, "global_step": 114505, "epoch": 946} {"train_loss": -37.896297454833984, "global_step": 114506, "epoch": 946} {"train_loss": -38.959739685058594, "global_step": 114507, "epoch": 946} {"train_loss": -37.62837600708008, "global_step": 114508, "epoch": 946} {"train_loss": -36.87094497680664, "global_step": 114509, "epoch": 946} {"train_loss": -37.73739242553711, "global_step": 114510, "epoch": 946} {"train_loss": -36.596920013427734, "global_step": 114511, "epoch": 946} {"train_loss": -38.409549713134766, "global_step": 114512, "epoch": 946} {"train_loss": -38.18068313598633, "global_step": 114513, "epoch": 946} {"train_loss": -38.25656509399414, "global_step": 114514, "epoch": 946} {"train_loss": -38.922786712646484, "global_step": 114515, "epoch": 946} {"train_loss": -37.063392639160156, "global_step": 114516, "epoch": 946} {"train_loss": -35.08041000366211, "global_step": 114517, "epoch": 946} {"train_loss": -38.520992279052734, "global_step": 114518, "epoch": 946} {"train_loss": -34.85315704345703, "global_step": 114519, "epoch": 946} {"train_loss": -39.063987731933594, "global_step": 114520, "epoch": 946} {"train_loss": -35.164180755615234, "global_step": 114521, "epoch": 946} {"train_loss": -33.92422103881836, "global_step": 114522, "epoch": 946} {"train_loss": -37.38772964477539, "global_step": 114523, "epoch": 946} {"train_loss": -38.543121337890625, "global_step": 114524, "epoch": 946} {"train_loss": -34.56791305541992, "global_step": 114525, "epoch": 946} {"train_loss": -38.143035888671875, "global_step": 114526, "epoch": 946} {"train_loss": -33.522884368896484, "global_step": 114527, "epoch": 946} {"train_loss": -38.17153549194336, "global_step": 114528, "epoch": 946} {"train_loss": -37.72954559326172, "global_step": 114529, "epoch": 946} {"train_loss": -35.612525939941406, "global_step": 114530, "epoch": 946} {"train_loss": -38.74159622192383, "global_step": 114531, "epoch": 946} {"train_loss": -37.77096176147461, "global_step": 114532, "epoch": 946} {"train_loss": -36.53772735595703, "global_step": 114533, "epoch": 946} {"train_loss": -37.983856201171875, "global_step": 114534, "epoch": 946} {"train_loss": -37.72481918334961, "global_step": 114535, "epoch": 946} {"train_loss": -38.41323471069336, "global_step": 114536, "epoch": 946} {"train_loss": -37.972755432128906, "global_step": 114537, "epoch": 946} {"train_loss": -36.86207962036133, "global_step": 114538, "epoch": 946} {"train_loss": -37.755428314208984, "global_step": 114539, "epoch": 946} {"train_loss": -37.19365310668945, "global_step": 114540, "epoch": 946} {"train_loss": -36.28011703491211, "global_step": 114541, "epoch": 946} {"train_loss": -35.77035140991211, "global_step": 114542, "epoch": 946} {"train_loss": -36.87105941772461, "global_step": 114543, "epoch": 946} {"train_loss": -38.11650466918945, "global_step": 114544, "epoch": 946} {"train_loss": -35.69525909423828, "global_step": 114545, "epoch": 946} {"train_loss": -37.970428466796875, "global_step": 114546, "epoch": 946} {"train_loss": -38.05337142944336, "global_step": 114547, "epoch": 946} {"train_loss": -35.66668701171875, "global_step": 114548, "epoch": 946} {"train_loss": -38.08506393432617, "global_step": 114549, "epoch": 946} {"train_loss": -38.798397064208984, "global_step": 114550, "epoch": 946} {"train_loss": -37.589107513427734, "global_step": 114551, "epoch": 946} {"train_loss": -37.78443145751953, "global_step": 114552, "epoch": 946} {"train_loss": -37.564422607421875, "global_step": 114553, "epoch": 946} {"train_loss": -37.5327033996582, "global_step": 114554, "epoch": 946} {"train_loss": -37.92483139038086, "global_step": 114555, "epoch": 946} {"train_loss": -38.534671783447266, "global_step": 114556, "epoch": 946} {"train_loss": -38.17374801635742, "global_step": 114557, "epoch": 946} {"train_loss": -37.64352798461914, "global_step": 114558, "epoch": 946} {"train_loss": -38.96535873413086, "global_step": 114559, "epoch": 946} {"train_loss": -37.64821243286133, "global_step": 114560, "epoch": 946} {"train_loss": -37.85695266723633, "global_step": 114561, "epoch": 946} {"train_loss": -38.809059143066406, "global_step": 114562, "epoch": 946} {"train_loss": -38.0289192199707, "global_step": 114563, "epoch": 946} {"train_loss": -38.91819763183594, "global_step": 114564, "epoch": 946} {"train_loss": -38.45792007446289, "global_step": 114565, "epoch": 946} {"train_loss": -38.51365280151367, "global_step": 114566, "epoch": 946} {"train_loss": -38.11677169799805, "global_step": 114567, "epoch": 946} {"train_loss": -39.19824981689453, "global_step": 114568, "epoch": 946} {"train_loss": -39.07520294189453, "global_step": 114569, "epoch": 946} {"train_loss": -38.288612365722656, "global_step": 114570, "epoch": 946} {"train_loss": -39.535499572753906, "global_step": 114571, "epoch": 946} {"train_loss": -38.66463851928711, "global_step": 114572, "epoch": 946} {"train_loss": -39.07737350463867, "global_step": 114573, "epoch": 946} {"train_loss": -38.593353271484375, "global_step": 114574, "epoch": 946} {"train_loss": -38.82477569580078, "global_step": 114575, "epoch": 946} {"train_loss": -38.88039779663086, "global_step": 114576, "epoch": 946} {"train_loss": -39.217552185058594, "global_step": 114577, "epoch": 946} {"train_loss": -38.999183654785156, "global_step": 114578, "epoch": 946} {"train_loss": -39.376441955566406, "global_step": 114579, "epoch": 946} {"train_loss": -39.070308685302734, "global_step": 114580, "epoch": 946} {"train_loss": -39.72854232788086, "global_step": 114581, "epoch": 946} {"train_loss": -39.54331588745117, "global_step": 114582, "epoch": 946} {"train_loss": -38.687286376953125, "global_step": 114583, "epoch": 946} {"train_loss": -39.15005111694336, "global_step": 114584, "epoch": 946} {"train_loss": -38.99247360229492, "global_step": 114585, "epoch": 946} {"train_loss": -38.16771836714311, "global_step": 114586, "epoch": 946, "val_loss": 2696085.0} {"train_loss": -38.63459396362305, "global_step": 114587, "epoch": 947} {"train_loss": -40.016502380371094, "global_step": 114588, "epoch": 947} {"train_loss": -39.400657653808594, "global_step": 114589, "epoch": 947} {"train_loss": -39.94205093383789, "global_step": 114590, "epoch": 947} {"train_loss": -39.16900634765625, "global_step": 114591, "epoch": 947} {"train_loss": -39.54523849487305, "global_step": 114592, "epoch": 947} {"train_loss": -39.69306564331055, "global_step": 114593, "epoch": 947} {"train_loss": -39.64631271362305, "global_step": 114594, "epoch": 947} {"train_loss": -39.95333480834961, "global_step": 114595, "epoch": 947} {"train_loss": -39.19821548461914, "global_step": 114596, "epoch": 947} {"train_loss": -39.44812774658203, "global_step": 114597, "epoch": 947} {"train_loss": -39.884212493896484, "global_step": 114598, "epoch": 947} {"train_loss": -39.326210021972656, "global_step": 114599, "epoch": 947} {"train_loss": -39.84367752075195, "global_step": 114600, "epoch": 947} {"train_loss": -38.63460922241211, "global_step": 114601, "epoch": 947} {"train_loss": -39.54869079589844, "global_step": 114602, "epoch": 947} {"train_loss": -39.61726379394531, "global_step": 114603, "epoch": 947} {"train_loss": -39.568355560302734, "global_step": 114604, "epoch": 947} {"train_loss": -39.65079879760742, "global_step": 114605, "epoch": 947} {"train_loss": -39.72954559326172, "global_step": 114606, "epoch": 947} {"train_loss": -39.56528854370117, "global_step": 114607, "epoch": 947} {"train_loss": -39.580928802490234, "global_step": 114608, "epoch": 947} {"train_loss": -39.38740539550781, "global_step": 114609, "epoch": 947} {"train_loss": -38.20866012573242, "global_step": 114610, "epoch": 947} {"train_loss": -35.031837463378906, "global_step": 114611, "epoch": 947} {"train_loss": -33.36362075805664, "global_step": 114612, "epoch": 947} {"train_loss": -33.5954475402832, "global_step": 114613, "epoch": 947} {"train_loss": -34.33059310913086, "global_step": 114614, "epoch": 947} {"train_loss": -35.66804122924805, "global_step": 114615, "epoch": 947} {"train_loss": -37.2795524597168, "global_step": 114616, "epoch": 947} {"train_loss": -38.862239837646484, "global_step": 114617, "epoch": 947} {"train_loss": -37.30708312988281, "global_step": 114618, "epoch": 947} {"train_loss": -35.36443328857422, "global_step": 114619, "epoch": 947} {"train_loss": -36.68891525268555, "global_step": 114620, "epoch": 947} {"train_loss": -26.287321090698242, "global_step": 114621, "epoch": 947} {"train_loss": -17.45273780822754, "global_step": 114622, "epoch": 947} {"train_loss": -8.0538969039917, "global_step": 114623, "epoch": 947} {"train_loss": -14.100181579589844, "global_step": 114624, "epoch": 947} {"train_loss": -34.21923828125, "global_step": 114625, "epoch": 947} {"train_loss": -16.154165267944336, "global_step": 114626, "epoch": 947} {"train_loss": -18.453716278076172, "global_step": 114627, "epoch": 947} {"train_loss": -26.4722900390625, "global_step": 114628, "epoch": 947} {"train_loss": -33.94086456298828, "global_step": 114629, "epoch": 947} {"train_loss": -27.99542808532715, "global_step": 114630, "epoch": 947} {"train_loss": -35.84077072143555, "global_step": 114631, "epoch": 947} {"train_loss": -32.53718948364258, "global_step": 114632, "epoch": 947} {"train_loss": -31.780811309814453, "global_step": 114633, "epoch": 947} {"train_loss": -36.748382568359375, "global_step": 114634, "epoch": 947} {"train_loss": -32.979209899902344, "global_step": 114635, "epoch": 947} {"train_loss": -33.170291900634766, "global_step": 114636, "epoch": 947} {"train_loss": -36.324432373046875, "global_step": 114637, "epoch": 947} {"train_loss": -35.84701156616211, "global_step": 114638, "epoch": 947} {"train_loss": -34.35797119140625, "global_step": 114639, "epoch": 947} {"train_loss": -35.021888732910156, "global_step": 114640, "epoch": 947} {"train_loss": -33.896175384521484, "global_step": 114641, "epoch": 947} {"train_loss": -35.8084831237793, "global_step": 114642, "epoch": 947} {"train_loss": -34.8750114440918, "global_step": 114643, "epoch": 947} {"train_loss": -36.86660385131836, "global_step": 114644, "epoch": 947} {"train_loss": -37.25429916381836, "global_step": 114645, "epoch": 947} {"train_loss": -37.10276412963867, "global_step": 114646, "epoch": 947} {"train_loss": -35.85627746582031, "global_step": 114647, "epoch": 947} {"train_loss": -37.055023193359375, "global_step": 114648, "epoch": 947} {"train_loss": -37.33504867553711, "global_step": 114649, "epoch": 947} {"train_loss": -36.790382385253906, "global_step": 114650, "epoch": 947} {"train_loss": -36.87373733520508, "global_step": 114651, "epoch": 947} {"train_loss": -36.933929443359375, "global_step": 114652, "epoch": 947} {"train_loss": -36.83381271362305, "global_step": 114653, "epoch": 947} {"train_loss": -37.412166595458984, "global_step": 114654, "epoch": 947} {"train_loss": -37.404781341552734, "global_step": 114655, "epoch": 947} {"train_loss": -37.06439971923828, "global_step": 114656, "epoch": 947} {"train_loss": -36.125362396240234, "global_step": 114657, "epoch": 947} {"train_loss": -37.11521530151367, "global_step": 114658, "epoch": 947} {"train_loss": -37.707637786865234, "global_step": 114659, "epoch": 947} {"train_loss": -37.44742965698242, "global_step": 114660, "epoch": 947} {"train_loss": -37.95307159423828, "global_step": 114661, "epoch": 947} {"train_loss": -37.2236213684082, "global_step": 114662, "epoch": 947} {"train_loss": -37.77347946166992, "global_step": 114663, "epoch": 947} {"train_loss": -37.92817687988281, "global_step": 114664, "epoch": 947} {"train_loss": -37.8198127746582, "global_step": 114665, "epoch": 947} {"train_loss": -37.743587493896484, "global_step": 114666, "epoch": 947} {"train_loss": -37.51935958862305, "global_step": 114667, "epoch": 947} {"train_loss": -37.433135986328125, "global_step": 114668, "epoch": 947} {"train_loss": -38.11042022705078, "global_step": 114669, "epoch": 947} {"train_loss": -38.44315719604492, "global_step": 114670, "epoch": 947} {"train_loss": -37.763641357421875, "global_step": 114671, "epoch": 947} {"train_loss": -37.9974479675293, "global_step": 114672, "epoch": 947} {"train_loss": -38.40920639038086, "global_step": 114673, "epoch": 947} {"train_loss": -38.18714141845703, "global_step": 114674, "epoch": 947} {"train_loss": -38.34701156616211, "global_step": 114675, "epoch": 947} {"train_loss": -38.352020263671875, "global_step": 114676, "epoch": 947} {"train_loss": -38.63938903808594, "global_step": 114677, "epoch": 947} {"train_loss": -38.56648635864258, "global_step": 114678, "epoch": 947} {"train_loss": -38.756649017333984, "global_step": 114679, "epoch": 947} {"train_loss": -38.37199020385742, "global_step": 114680, "epoch": 947} {"train_loss": -38.088523864746094, "global_step": 114681, "epoch": 947} {"train_loss": -38.477420806884766, "global_step": 114682, "epoch": 947} {"train_loss": -38.44088363647461, "global_step": 114683, "epoch": 947} {"train_loss": -38.93690872192383, "global_step": 114684, "epoch": 947} {"train_loss": -38.50437545776367, "global_step": 114685, "epoch": 947} {"train_loss": -38.733863830566406, "global_step": 114686, "epoch": 947} {"train_loss": -38.84011459350586, "global_step": 114687, "epoch": 947} {"train_loss": -38.862972259521484, "global_step": 114688, "epoch": 947} {"train_loss": -39.039161682128906, "global_step": 114689, "epoch": 947} {"train_loss": -39.28174591064453, "global_step": 114690, "epoch": 947} {"train_loss": -38.718990325927734, "global_step": 114691, "epoch": 947} {"train_loss": -38.56892776489258, "global_step": 114692, "epoch": 947} {"train_loss": -37.85371017456055, "global_step": 114693, "epoch": 947} {"train_loss": -39.238014221191406, "global_step": 114694, "epoch": 947} {"train_loss": -39.36130905151367, "global_step": 114695, "epoch": 947} {"train_loss": -39.12565231323242, "global_step": 114696, "epoch": 947} {"train_loss": -39.6410026550293, "global_step": 114697, "epoch": 947} {"train_loss": -39.275482177734375, "global_step": 114698, "epoch": 947} {"train_loss": -38.717620849609375, "global_step": 114699, "epoch": 947} {"train_loss": -38.59284591674805, "global_step": 114700, "epoch": 947} {"train_loss": -38.6253776550293, "global_step": 114701, "epoch": 947} {"train_loss": -38.61233139038086, "global_step": 114702, "epoch": 947} {"train_loss": -39.01285934448242, "global_step": 114703, "epoch": 947} {"train_loss": -38.2700309753418, "global_step": 114704, "epoch": 947} {"train_loss": -39.036277770996094, "global_step": 114705, "epoch": 947} {"train_loss": -38.187286376953125, "global_step": 114706, "epoch": 947} {"train_loss": -36.48570692046615, "global_step": 114707, "epoch": 947, "val_loss": 2594879.75} {"train_loss": -39.48991394042969, "global_step": 114708, "epoch": 948} {"train_loss": -38.90714645385742, "global_step": 114709, "epoch": 948} {"train_loss": -38.620784759521484, "global_step": 114710, "epoch": 948} {"train_loss": -38.88996124267578, "global_step": 114711, "epoch": 948} {"train_loss": -38.78322219848633, "global_step": 114712, "epoch": 948} {"train_loss": -38.87986755371094, "global_step": 114713, "epoch": 948} {"train_loss": -39.306495666503906, "global_step": 114714, "epoch": 948} {"train_loss": -38.53662109375, "global_step": 114715, "epoch": 948} {"train_loss": -38.82871627807617, "global_step": 114716, "epoch": 948} {"train_loss": -38.57307815551758, "global_step": 114717, "epoch": 948} {"train_loss": -38.78752517700195, "global_step": 114718, "epoch": 948} {"train_loss": -39.40873336791992, "global_step": 114719, "epoch": 948} {"train_loss": -38.27423858642578, "global_step": 114720, "epoch": 948} {"train_loss": -37.954925537109375, "global_step": 114721, "epoch": 948} {"train_loss": -39.07242202758789, "global_step": 114722, "epoch": 948} {"train_loss": -38.8933219909668, "global_step": 114723, "epoch": 948} {"train_loss": -39.64491271972656, "global_step": 114724, "epoch": 948} {"train_loss": -39.038124084472656, "global_step": 114725, "epoch": 948} {"train_loss": -38.18277359008789, "global_step": 114726, "epoch": 948} {"train_loss": -39.505001068115234, "global_step": 114727, "epoch": 948} {"train_loss": -38.610198974609375, "global_step": 114728, "epoch": 948} {"train_loss": -37.885372161865234, "global_step": 114729, "epoch": 948} {"train_loss": -39.351009368896484, "global_step": 114730, "epoch": 948} {"train_loss": -39.13087844848633, "global_step": 114731, "epoch": 948} {"train_loss": -39.5140380859375, "global_step": 114732, "epoch": 948} {"train_loss": -39.30868911743164, "global_step": 114733, "epoch": 948} {"train_loss": -38.29124069213867, "global_step": 114734, "epoch": 948} {"train_loss": -39.11540603637695, "global_step": 114735, "epoch": 948} {"train_loss": -39.57892990112305, "global_step": 114736, "epoch": 948} {"train_loss": -39.46157455444336, "global_step": 114737, "epoch": 948} {"train_loss": -39.177032470703125, "global_step": 114738, "epoch": 948} {"train_loss": -38.52543640136719, "global_step": 114739, "epoch": 948} {"train_loss": -39.64046859741211, "global_step": 114740, "epoch": 948} {"train_loss": -38.53364181518555, "global_step": 114741, "epoch": 948} {"train_loss": -38.96210479736328, "global_step": 114742, "epoch": 948} {"train_loss": -39.17084503173828, "global_step": 114743, "epoch": 948} {"train_loss": -38.7869758605957, "global_step": 114744, "epoch": 948} {"train_loss": -39.06303787231445, "global_step": 114745, "epoch": 948} {"train_loss": -38.787200927734375, "global_step": 114746, "epoch": 948} {"train_loss": -38.406219482421875, "global_step": 114747, "epoch": 948} {"train_loss": -36.28817367553711, "global_step": 114748, "epoch": 948} {"train_loss": -32.37699508666992, "global_step": 114749, "epoch": 948} {"train_loss": -27.9222354888916, "global_step": 114750, "epoch": 948} {"train_loss": -28.29443359375, "global_step": 114751, "epoch": 948} {"train_loss": -32.1236572265625, "global_step": 114752, "epoch": 948} {"train_loss": -37.80772018432617, "global_step": 114753, "epoch": 948} {"train_loss": -36.95319366455078, "global_step": 114754, "epoch": 948} {"train_loss": -34.63922882080078, "global_step": 114755, "epoch": 948} {"train_loss": -38.489192962646484, "global_step": 114756, "epoch": 948} {"train_loss": -36.761863708496094, "global_step": 114757, "epoch": 948} {"train_loss": -36.791847229003906, "global_step": 114758, "epoch": 948} {"train_loss": -37.93682861328125, "global_step": 114759, "epoch": 948} {"train_loss": -36.720882415771484, "global_step": 114760, "epoch": 948} {"train_loss": -37.487709045410156, "global_step": 114761, "epoch": 948} {"train_loss": -36.79209899902344, "global_step": 114762, "epoch": 948} {"train_loss": -38.63645553588867, "global_step": 114763, "epoch": 948} {"train_loss": -37.796592712402344, "global_step": 114764, "epoch": 948} {"train_loss": -38.56071090698242, "global_step": 114765, "epoch": 948} {"train_loss": -38.055816650390625, "global_step": 114766, "epoch": 948} {"train_loss": -37.84828567504883, "global_step": 114767, "epoch": 948} {"train_loss": -38.68236541748047, "global_step": 114768, "epoch": 948} {"train_loss": -38.050559997558594, "global_step": 114769, "epoch": 948} {"train_loss": -38.34351348876953, "global_step": 114770, "epoch": 948} {"train_loss": -38.04612731933594, "global_step": 114771, "epoch": 948} {"train_loss": -37.06235885620117, "global_step": 114772, "epoch": 948} {"train_loss": -39.0295524597168, "global_step": 114773, "epoch": 948} {"train_loss": -37.938167572021484, "global_step": 114774, "epoch": 948} {"train_loss": -37.96181869506836, "global_step": 114775, "epoch": 948} {"train_loss": -37.87760543823242, "global_step": 114776, "epoch": 948} {"train_loss": -38.06228256225586, "global_step": 114777, "epoch": 948} {"train_loss": -38.450557708740234, "global_step": 114778, "epoch": 948} {"train_loss": -38.48588180541992, "global_step": 114779, "epoch": 948} {"train_loss": -38.473506927490234, "global_step": 114780, "epoch": 948} {"train_loss": -38.22876739501953, "global_step": 114781, "epoch": 948} {"train_loss": -38.7869873046875, "global_step": 114782, "epoch": 948} {"train_loss": -38.6403694152832, "global_step": 114783, "epoch": 948} {"train_loss": -38.274471282958984, "global_step": 114784, "epoch": 948} {"train_loss": -38.32119369506836, "global_step": 114785, "epoch": 948} {"train_loss": -38.276405334472656, "global_step": 114786, "epoch": 948} {"train_loss": -38.43477249145508, "global_step": 114787, "epoch": 948} {"train_loss": -38.90006637573242, "global_step": 114788, "epoch": 948} {"train_loss": -38.2020149230957, "global_step": 114789, "epoch": 948} {"train_loss": -39.166717529296875, "global_step": 114790, "epoch": 948} {"train_loss": -38.65523910522461, "global_step": 114791, "epoch": 948} {"train_loss": -39.076087951660156, "global_step": 114792, "epoch": 948} {"train_loss": -38.99506378173828, "global_step": 114793, "epoch": 948} {"train_loss": -38.80412673950195, "global_step": 114794, "epoch": 948} {"train_loss": -39.27986526489258, "global_step": 114795, "epoch": 948} {"train_loss": -39.06752395629883, "global_step": 114796, "epoch": 948} {"train_loss": -39.01906967163086, "global_step": 114797, "epoch": 948} {"train_loss": -39.15656661987305, "global_step": 114798, "epoch": 948} {"train_loss": -39.202022552490234, "global_step": 114799, "epoch": 948} {"train_loss": -39.52939987182617, "global_step": 114800, "epoch": 948} {"train_loss": -39.6386604309082, "global_step": 114801, "epoch": 948} {"train_loss": -39.78487777709961, "global_step": 114802, "epoch": 948} {"train_loss": -37.97113800048828, "global_step": 114803, "epoch": 948} {"train_loss": -38.93097686767578, "global_step": 114804, "epoch": 948} {"train_loss": -39.365718841552734, "global_step": 114805, "epoch": 948} {"train_loss": -38.781776428222656, "global_step": 114806, "epoch": 948} {"train_loss": -37.97280502319336, "global_step": 114807, "epoch": 948} {"train_loss": -38.991065979003906, "global_step": 114808, "epoch": 948} {"train_loss": -39.12015914916992, "global_step": 114809, "epoch": 948} {"train_loss": -38.42948532104492, "global_step": 114810, "epoch": 948} {"train_loss": -39.605438232421875, "global_step": 114811, "epoch": 948} {"train_loss": -38.92829513549805, "global_step": 114812, "epoch": 948} {"train_loss": -39.203487396240234, "global_step": 114813, "epoch": 948} {"train_loss": -38.39658737182617, "global_step": 114814, "epoch": 948} {"train_loss": -38.30723190307617, "global_step": 114815, "epoch": 948} {"train_loss": -39.675575256347656, "global_step": 114816, "epoch": 948} {"train_loss": -38.78702163696289, "global_step": 114817, "epoch": 948} {"train_loss": -38.988868713378906, "global_step": 114818, "epoch": 948} {"train_loss": -36.95452117919922, "global_step": 114819, "epoch": 948} {"train_loss": -39.591094970703125, "global_step": 114820, "epoch": 948} {"train_loss": -39.86067581176758, "global_step": 114821, "epoch": 948} {"train_loss": -39.7910270690918, "global_step": 114822, "epoch": 948} {"train_loss": -39.4705810546875, "global_step": 114823, "epoch": 948} {"train_loss": -39.848121643066406, "global_step": 114824, "epoch": 948} {"train_loss": -38.944549560546875, "global_step": 114825, "epoch": 948} {"train_loss": -39.2178840637207, "global_step": 114826, "epoch": 948} {"train_loss": -39.88700485229492, "global_step": 114827, "epoch": 948} {"train_loss": -38.35730123913978, "global_step": 114828, "epoch": 948, "val_loss": 2578516.0} {"train_loss": -39.572731018066406, "global_step": 114829, "epoch": 949} {"train_loss": -40.075443267822266, "global_step": 114830, "epoch": 949} {"train_loss": -39.708187103271484, "global_step": 114831, "epoch": 949} {"train_loss": -37.911563873291016, "global_step": 114832, "epoch": 949} {"train_loss": -36.75135803222656, "global_step": 114833, "epoch": 949} {"train_loss": -37.333770751953125, "global_step": 114834, "epoch": 949} {"train_loss": -38.85795974731445, "global_step": 114835, "epoch": 949} {"train_loss": -39.15785598754883, "global_step": 114836, "epoch": 949} {"train_loss": -39.217220306396484, "global_step": 114837, "epoch": 949} {"train_loss": -37.55503463745117, "global_step": 114838, "epoch": 949} {"train_loss": -39.38162612915039, "global_step": 114839, "epoch": 949} {"train_loss": -38.635860443115234, "global_step": 114840, "epoch": 949} {"train_loss": -39.11834716796875, "global_step": 114841, "epoch": 949} {"train_loss": -39.175079345703125, "global_step": 114842, "epoch": 949} {"train_loss": -37.780635833740234, "global_step": 114843, "epoch": 949} {"train_loss": -37.36918258666992, "global_step": 114844, "epoch": 949} {"train_loss": -38.23779296875, "global_step": 114845, "epoch": 949} {"train_loss": -37.207515716552734, "global_step": 114846, "epoch": 949} {"train_loss": -38.48711013793945, "global_step": 114847, "epoch": 949} {"train_loss": -36.99338912963867, "global_step": 114848, "epoch": 949} {"train_loss": -38.41202926635742, "global_step": 114849, "epoch": 949} {"train_loss": -38.451324462890625, "global_step": 114850, "epoch": 949} {"train_loss": -37.790828704833984, "global_step": 114851, "epoch": 949} {"train_loss": -37.372283935546875, "global_step": 114852, "epoch": 949} {"train_loss": -37.95327377319336, "global_step": 114853, "epoch": 949} {"train_loss": -35.078346252441406, "global_step": 114854, "epoch": 949} {"train_loss": -38.2919807434082, "global_step": 114855, "epoch": 949} {"train_loss": -37.71596145629883, "global_step": 114856, "epoch": 949} {"train_loss": -37.049800872802734, "global_step": 114857, "epoch": 949} {"train_loss": -37.8292121887207, "global_step": 114858, "epoch": 949} {"train_loss": -37.3023567199707, "global_step": 114859, "epoch": 949} {"train_loss": -37.145896911621094, "global_step": 114860, "epoch": 949} {"train_loss": -38.373939514160156, "global_step": 114861, "epoch": 949} {"train_loss": -36.5861930847168, "global_step": 114862, "epoch": 949} {"train_loss": -39.0954704284668, "global_step": 114863, "epoch": 949} {"train_loss": -38.49798583984375, "global_step": 114864, "epoch": 949} {"train_loss": -37.13593292236328, "global_step": 114865, "epoch": 949} {"train_loss": -38.568458557128906, "global_step": 114866, "epoch": 949} {"train_loss": -36.692909240722656, "global_step": 114867, "epoch": 949} {"train_loss": -34.140846252441406, "global_step": 114868, "epoch": 949} {"train_loss": -32.723384857177734, "global_step": 114869, "epoch": 949} {"train_loss": -32.57960510253906, "global_step": 114870, "epoch": 949} {"train_loss": -34.94532775878906, "global_step": 114871, "epoch": 949} {"train_loss": -37.01139831542969, "global_step": 114872, "epoch": 949} {"train_loss": -36.49038314819336, "global_step": 114873, "epoch": 949} {"train_loss": -36.44102096557617, "global_step": 114874, "epoch": 949} {"train_loss": -34.1313362121582, "global_step": 114875, "epoch": 949} {"train_loss": -38.13833236694336, "global_step": 114876, "epoch": 949} {"train_loss": -37.33619689941406, "global_step": 114877, "epoch": 949} {"train_loss": -34.85131072998047, "global_step": 114878, "epoch": 949} {"train_loss": -35.956787109375, "global_step": 114879, "epoch": 949} {"train_loss": -35.85453796386719, "global_step": 114880, "epoch": 949} {"train_loss": -36.488983154296875, "global_step": 114881, "epoch": 949} {"train_loss": -36.104736328125, "global_step": 114882, "epoch": 949} {"train_loss": -35.89119338989258, "global_step": 114883, "epoch": 949} {"train_loss": -36.37051773071289, "global_step": 114884, "epoch": 949} {"train_loss": -36.56330871582031, "global_step": 114885, "epoch": 949} {"train_loss": -37.50355911254883, "global_step": 114886, "epoch": 949} {"train_loss": -37.26167678833008, "global_step": 114887, "epoch": 949} {"train_loss": -37.08408737182617, "global_step": 114888, "epoch": 949} {"train_loss": -37.68339538574219, "global_step": 114889, "epoch": 949} {"train_loss": -36.856204986572266, "global_step": 114890, "epoch": 949} {"train_loss": -28.8676700592041, "global_step": 114891, "epoch": 949} {"train_loss": -36.70607376098633, "global_step": 114892, "epoch": 949} {"train_loss": -37.135833740234375, "global_step": 114893, "epoch": 949} {"train_loss": -36.03255844116211, "global_step": 114894, "epoch": 949} {"train_loss": -35.9660758972168, "global_step": 114895, "epoch": 949} {"train_loss": -37.852691650390625, "global_step": 114896, "epoch": 949} {"train_loss": -37.63577651977539, "global_step": 114897, "epoch": 949} {"train_loss": -36.38954544067383, "global_step": 114898, "epoch": 949} {"train_loss": -33.4529914855957, "global_step": 114899, "epoch": 949} {"train_loss": -35.6569938659668, "global_step": 114900, "epoch": 949} {"train_loss": -37.612483978271484, "global_step": 114901, "epoch": 949} {"train_loss": -37.06281661987305, "global_step": 114902, "epoch": 949} {"train_loss": -36.732025146484375, "global_step": 114903, "epoch": 949} {"train_loss": -37.31901168823242, "global_step": 114904, "epoch": 949} {"train_loss": -36.275421142578125, "global_step": 114905, "epoch": 949} {"train_loss": -37.98063278198242, "global_step": 114906, "epoch": 949} {"train_loss": -36.83897018432617, "global_step": 114907, "epoch": 949} {"train_loss": -36.45858383178711, "global_step": 114908, "epoch": 949} {"train_loss": -37.0483512878418, "global_step": 114909, "epoch": 949} {"train_loss": -36.97372055053711, "global_step": 114910, "epoch": 949} {"train_loss": -35.863800048828125, "global_step": 114911, "epoch": 949} {"train_loss": -35.36994552612305, "global_step": 114912, "epoch": 949} {"train_loss": -36.00741958618164, "global_step": 114913, "epoch": 949} {"train_loss": -38.13327407836914, "global_step": 114914, "epoch": 949} {"train_loss": -37.969051361083984, "global_step": 114915, "epoch": 949} {"train_loss": -37.362674713134766, "global_step": 114916, "epoch": 949} {"train_loss": -38.3983268737793, "global_step": 114917, "epoch": 949} {"train_loss": -38.25251388549805, "global_step": 114918, "epoch": 949} {"train_loss": -37.91199493408203, "global_step": 114919, "epoch": 949} {"train_loss": -37.10388946533203, "global_step": 114920, "epoch": 949} {"train_loss": -38.62762451171875, "global_step": 114921, "epoch": 949} {"train_loss": -38.2026252746582, "global_step": 114922, "epoch": 949} {"train_loss": -38.118263244628906, "global_step": 114923, "epoch": 949} {"train_loss": -37.385223388671875, "global_step": 114924, "epoch": 949} {"train_loss": -38.503082275390625, "global_step": 114925, "epoch": 949} {"train_loss": -38.2592887878418, "global_step": 114926, "epoch": 949} {"train_loss": -38.12068557739258, "global_step": 114927, "epoch": 949} {"train_loss": -37.94364547729492, "global_step": 114928, "epoch": 949} {"train_loss": -38.290340423583984, "global_step": 114929, "epoch": 949} {"train_loss": -37.18008804321289, "global_step": 114930, "epoch": 949} {"train_loss": -37.36079788208008, "global_step": 114931, "epoch": 949} {"train_loss": -39.058650970458984, "global_step": 114932, "epoch": 949} {"train_loss": -38.39423370361328, "global_step": 114933, "epoch": 949} {"train_loss": -38.470062255859375, "global_step": 114934, "epoch": 949} {"train_loss": -38.97665023803711, "global_step": 114935, "epoch": 949} {"train_loss": -37.00358963012695, "global_step": 114936, "epoch": 949} {"train_loss": -37.721439361572266, "global_step": 114937, "epoch": 949} {"train_loss": -38.87771987915039, "global_step": 114938, "epoch": 949} {"train_loss": -37.02705001831055, "global_step": 114939, "epoch": 949} {"train_loss": -39.03768539428711, "global_step": 114940, "epoch": 949} {"train_loss": -38.707637786865234, "global_step": 114941, "epoch": 949} {"train_loss": -38.700904846191406, "global_step": 114942, "epoch": 949} {"train_loss": -38.23496627807617, "global_step": 114943, "epoch": 949} {"train_loss": -39.0660400390625, "global_step": 114944, "epoch": 949} {"train_loss": -39.432125091552734, "global_step": 114945, "epoch": 949} {"train_loss": -38.75124740600586, "global_step": 114946, "epoch": 949} {"train_loss": -38.82181930541992, "global_step": 114947, "epoch": 949} {"train_loss": -38.90078353881836, "global_step": 114948, "epoch": 949} {"train_loss": -37.379726394148896, "global_step": 114949, "epoch": 949, "val_loss": 2616584.25} {"train_loss": -38.44060516357422, "global_step": 114950, "epoch": 950} {"train_loss": -39.447731018066406, "global_step": 114951, "epoch": 950} {"train_loss": -39.19041061401367, "global_step": 114952, "epoch": 950} {"train_loss": -37.858848571777344, "global_step": 114953, "epoch": 950} {"train_loss": -38.949466705322266, "global_step": 114954, "epoch": 950} {"train_loss": -38.821285247802734, "global_step": 114955, "epoch": 950} {"train_loss": -39.26337432861328, "global_step": 114956, "epoch": 950} {"train_loss": -39.443843841552734, "global_step": 114957, "epoch": 950} {"train_loss": -38.545631408691406, "global_step": 114958, "epoch": 950} {"train_loss": -39.16188430786133, "global_step": 114959, "epoch": 950} {"train_loss": -39.646331787109375, "global_step": 114960, "epoch": 950} {"train_loss": -38.99739074707031, "global_step": 114961, "epoch": 950} {"train_loss": -39.185909271240234, "global_step": 114962, "epoch": 950} {"train_loss": -39.12595748901367, "global_step": 114963, "epoch": 950} {"train_loss": -39.62851333618164, "global_step": 114964, "epoch": 950} {"train_loss": -39.37808609008789, "global_step": 114965, "epoch": 950} {"train_loss": -39.142574310302734, "global_step": 114966, "epoch": 950} {"train_loss": -39.30107116699219, "global_step": 114967, "epoch": 950} {"train_loss": -39.575347900390625, "global_step": 114968, "epoch": 950} {"train_loss": -39.635066986083984, "global_step": 114969, "epoch": 950} {"train_loss": -39.81986999511719, "global_step": 114970, "epoch": 950} {"train_loss": -39.24143981933594, "global_step": 114971, "epoch": 950} {"train_loss": -39.625244140625, "global_step": 114972, "epoch": 950} {"train_loss": -39.188385009765625, "global_step": 114973, "epoch": 950} {"train_loss": -38.77602767944336, "global_step": 114974, "epoch": 950} {"train_loss": -39.2819938659668, "global_step": 114975, "epoch": 950} {"train_loss": -39.6591911315918, "global_step": 114976, "epoch": 950} {"train_loss": -39.694278717041016, "global_step": 114977, "epoch": 950} {"train_loss": -38.81492614746094, "global_step": 114978, "epoch": 950} {"train_loss": -39.181556701660156, "global_step": 114979, "epoch": 950} {"train_loss": -39.352169036865234, "global_step": 114980, "epoch": 950} {"train_loss": -39.7584342956543, "global_step": 114981, "epoch": 950} {"train_loss": -38.1917839050293, "global_step": 114982, "epoch": 950} {"train_loss": -37.31260681152344, "global_step": 114983, "epoch": 950} {"train_loss": -37.35494613647461, "global_step": 114984, "epoch": 950} {"train_loss": -39.51305389404297, "global_step": 114985, "epoch": 950} {"train_loss": -39.333377838134766, "global_step": 114986, "epoch": 950} {"train_loss": -38.751678466796875, "global_step": 114987, "epoch": 950} {"train_loss": -39.418495178222656, "global_step": 114988, "epoch": 950} {"train_loss": -39.211219787597656, "global_step": 114989, "epoch": 950} {"train_loss": -39.2487907409668, "global_step": 114990, "epoch": 950} {"train_loss": -39.210693359375, "global_step": 114991, "epoch": 950} {"train_loss": -36.81666946411133, "global_step": 114992, "epoch": 950} {"train_loss": -36.5539436340332, "global_step": 114993, "epoch": 950} {"train_loss": -37.49396896362305, "global_step": 114994, "epoch": 950} {"train_loss": -37.04380416870117, "global_step": 114995, "epoch": 950} {"train_loss": -38.877685546875, "global_step": 114996, "epoch": 950} {"train_loss": -38.650367736816406, "global_step": 114997, "epoch": 950} {"train_loss": -39.00645065307617, "global_step": 114998, "epoch": 950} {"train_loss": -37.70105743408203, "global_step": 114999, "epoch": 950} {"train_loss": -36.49635696411133, "global_step": 115000, "epoch": 950} {"train_loss": -35.25855255126953, "global_step": 115001, "epoch": 950} {"train_loss": -33.43292236328125, "global_step": 115002, "epoch": 950} {"train_loss": -28.367145538330078, "global_step": 115003, "epoch": 950} {"train_loss": -31.40699577331543, "global_step": 115004, "epoch": 950} {"train_loss": -37.38784408569336, "global_step": 115005, "epoch": 950} {"train_loss": -38.521095275878906, "global_step": 115006, "epoch": 950} {"train_loss": -36.433135986328125, "global_step": 115007, "epoch": 950} {"train_loss": -38.592994689941406, "global_step": 115008, "epoch": 950} {"train_loss": -36.31779098510742, "global_step": 115009, "epoch": 950} {"train_loss": -34.76691818237305, "global_step": 115010, "epoch": 950} {"train_loss": -38.558921813964844, "global_step": 115011, "epoch": 950} {"train_loss": -34.54311752319336, "global_step": 115012, "epoch": 950} {"train_loss": -37.15849685668945, "global_step": 115013, "epoch": 950} {"train_loss": -37.35036087036133, "global_step": 115014, "epoch": 950} {"train_loss": -36.38004684448242, "global_step": 115015, "epoch": 950} {"train_loss": -37.46861267089844, "global_step": 115016, "epoch": 950} {"train_loss": -37.184852600097656, "global_step": 115017, "epoch": 950} {"train_loss": -38.54004669189453, "global_step": 115018, "epoch": 950} {"train_loss": -37.973533630371094, "global_step": 115019, "epoch": 950} {"train_loss": -37.84699630737305, "global_step": 115020, "epoch": 950} {"train_loss": -37.66355514526367, "global_step": 115021, "epoch": 950} {"train_loss": -36.194576263427734, "global_step": 115022, "epoch": 950} {"train_loss": -37.303932189941406, "global_step": 115023, "epoch": 950} {"train_loss": -36.634857177734375, "global_step": 115024, "epoch": 950} {"train_loss": -37.2820930480957, "global_step": 115025, "epoch": 950} {"train_loss": -37.85721969604492, "global_step": 115026, "epoch": 950} {"train_loss": -35.207496643066406, "global_step": 115027, "epoch": 950} {"train_loss": -35.545528411865234, "global_step": 115028, "epoch": 950} {"train_loss": -37.7252311706543, "global_step": 115029, "epoch": 950} {"train_loss": -37.43872833251953, "global_step": 115030, "epoch": 950} {"train_loss": -38.147491455078125, "global_step": 115031, "epoch": 950} {"train_loss": -37.272274017333984, "global_step": 115032, "epoch": 950} {"train_loss": -37.553749084472656, "global_step": 115033, "epoch": 950} {"train_loss": -37.01841735839844, "global_step": 115034, "epoch": 950} {"train_loss": -38.06623458862305, "global_step": 115035, "epoch": 950} {"train_loss": -37.79875946044922, "global_step": 115036, "epoch": 950} {"train_loss": -37.67409133911133, "global_step": 115037, "epoch": 950} {"train_loss": -37.5109977722168, "global_step": 115038, "epoch": 950} {"train_loss": -37.732330322265625, "global_step": 115039, "epoch": 950} {"train_loss": -37.00046920776367, "global_step": 115040, "epoch": 950} {"train_loss": -37.858673095703125, "global_step": 115041, "epoch": 950} {"train_loss": -38.32424545288086, "global_step": 115042, "epoch": 950} {"train_loss": -38.1546630859375, "global_step": 115043, "epoch": 950} {"train_loss": -38.57753372192383, "global_step": 115044, "epoch": 950} {"train_loss": -37.60842514038086, "global_step": 115045, "epoch": 950} {"train_loss": -37.580657958984375, "global_step": 115046, "epoch": 950} {"train_loss": -38.67290115356445, "global_step": 115047, "epoch": 950} {"train_loss": -38.35041427612305, "global_step": 115048, "epoch": 950} {"train_loss": -37.55629348754883, "global_step": 115049, "epoch": 950} {"train_loss": -38.110877990722656, "global_step": 115050, "epoch": 950} {"train_loss": -38.64509963989258, "global_step": 115051, "epoch": 950} {"train_loss": -37.73640060424805, "global_step": 115052, "epoch": 950} {"train_loss": -38.75468063354492, "global_step": 115053, "epoch": 950} {"train_loss": -38.697166442871094, "global_step": 115054, "epoch": 950} {"train_loss": -38.96125030517578, "global_step": 115055, "epoch": 950} {"train_loss": -37.09827423095703, "global_step": 115056, "epoch": 950} {"train_loss": -38.4609260559082, "global_step": 115057, "epoch": 950} {"train_loss": -38.200958251953125, "global_step": 115058, "epoch": 950} {"train_loss": -37.46402359008789, "global_step": 115059, "epoch": 950} {"train_loss": -38.731224060058594, "global_step": 115060, "epoch": 950} {"train_loss": -37.759071350097656, "global_step": 115061, "epoch": 950} {"train_loss": -38.728240966796875, "global_step": 115062, "epoch": 950} {"train_loss": -38.28059005737305, "global_step": 115063, "epoch": 950} {"train_loss": -38.5008659362793, "global_step": 115064, "epoch": 950} {"train_loss": -39.05953598022461, "global_step": 115065, "epoch": 950} {"train_loss": -38.17694854736328, "global_step": 115066, "epoch": 950} {"train_loss": -37.89472579956055, "global_step": 115067, "epoch": 950} {"train_loss": -37.28606033325195, "global_step": 115068, "epoch": 950} {"train_loss": -38.66920852661133, "global_step": 115069, "epoch": 950} {"train_loss": -37.98299693273119, "global_step": 115070, "epoch": 950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2711621.25} {"train_loss": -38.14246368408203, "global_step": 115071, "epoch": 951} {"train_loss": -38.70003890991211, "global_step": 115072, "epoch": 951} {"train_loss": -38.98059844970703, "global_step": 115073, "epoch": 951} {"train_loss": -37.85508346557617, "global_step": 115074, "epoch": 951} {"train_loss": -38.88082504272461, "global_step": 115075, "epoch": 951} {"train_loss": -38.13230514526367, "global_step": 115076, "epoch": 951} {"train_loss": -38.54559326171875, "global_step": 115077, "epoch": 951} {"train_loss": -38.823001861572266, "global_step": 115078, "epoch": 951} {"train_loss": -38.11314010620117, "global_step": 115079, "epoch": 951} {"train_loss": -38.73664093017578, "global_step": 115080, "epoch": 951} {"train_loss": -38.94173049926758, "global_step": 115081, "epoch": 951} {"train_loss": -38.814361572265625, "global_step": 115082, "epoch": 951} {"train_loss": -39.66416549682617, "global_step": 115083, "epoch": 951} {"train_loss": -39.10110092163086, "global_step": 115084, "epoch": 951} {"train_loss": -38.6398811340332, "global_step": 115085, "epoch": 951} {"train_loss": -39.53007507324219, "global_step": 115086, "epoch": 951} {"train_loss": -39.08523178100586, "global_step": 115087, "epoch": 951} {"train_loss": -38.863033294677734, "global_step": 115088, "epoch": 951} {"train_loss": -39.09859848022461, "global_step": 115089, "epoch": 951} {"train_loss": -38.00426483154297, "global_step": 115090, "epoch": 951} {"train_loss": -39.167545318603516, "global_step": 115091, "epoch": 951} {"train_loss": -37.356651306152344, "global_step": 115092, "epoch": 951} {"train_loss": -39.06709289550781, "global_step": 115093, "epoch": 951} {"train_loss": -38.79254913330078, "global_step": 115094, "epoch": 951} {"train_loss": -39.26964569091797, "global_step": 115095, "epoch": 951} {"train_loss": -39.494808197021484, "global_step": 115096, "epoch": 951} {"train_loss": -39.54631805419922, "global_step": 115097, "epoch": 951} {"train_loss": -39.150634765625, "global_step": 115098, "epoch": 951} {"train_loss": -39.30902099609375, "global_step": 115099, "epoch": 951} {"train_loss": -39.67707443237305, "global_step": 115100, "epoch": 951} {"train_loss": -38.797767639160156, "global_step": 115101, "epoch": 951} {"train_loss": -38.86543655395508, "global_step": 115102, "epoch": 951} {"train_loss": -39.80630111694336, "global_step": 115103, "epoch": 951} {"train_loss": -39.2332763671875, "global_step": 115104, "epoch": 951} {"train_loss": -38.80884552001953, "global_step": 115105, "epoch": 951} {"train_loss": -39.57320785522461, "global_step": 115106, "epoch": 951} {"train_loss": -39.102970123291016, "global_step": 115107, "epoch": 951} {"train_loss": -38.1117057800293, "global_step": 115108, "epoch": 951} {"train_loss": -39.72174835205078, "global_step": 115109, "epoch": 951} {"train_loss": -39.080841064453125, "global_step": 115110, "epoch": 951} {"train_loss": -39.026512145996094, "global_step": 115111, "epoch": 951} {"train_loss": -38.700191497802734, "global_step": 115112, "epoch": 951} {"train_loss": -39.042999267578125, "global_step": 115113, "epoch": 951} {"train_loss": -38.75603485107422, "global_step": 115114, "epoch": 951} {"train_loss": -39.58170700073242, "global_step": 115115, "epoch": 951} {"train_loss": -39.65462112426758, "global_step": 115116, "epoch": 951} {"train_loss": -39.10396194458008, "global_step": 115117, "epoch": 951} {"train_loss": -34.72041702270508, "global_step": 115118, "epoch": 951} {"train_loss": -38.89741134643555, "global_step": 115119, "epoch": 951} {"train_loss": -39.5405387878418, "global_step": 115120, "epoch": 951} {"train_loss": -38.952293395996094, "global_step": 115121, "epoch": 951} {"train_loss": -36.20316696166992, "global_step": 115122, "epoch": 951} {"train_loss": -32.73408126831055, "global_step": 115123, "epoch": 951} {"train_loss": -37.40108871459961, "global_step": 115124, "epoch": 951} {"train_loss": -38.312740325927734, "global_step": 115125, "epoch": 951} {"train_loss": -10.40787124633789, "global_step": 115126, "epoch": 951} {"train_loss": -34.17426300048828, "global_step": 115127, "epoch": 951} {"train_loss": -33.17529296875, "global_step": 115128, "epoch": 951} {"train_loss": -35.52248001098633, "global_step": 115129, "epoch": 951} {"train_loss": -33.26652145385742, "global_step": 115130, "epoch": 951} {"train_loss": -33.0538444519043, "global_step": 115131, "epoch": 951} {"train_loss": -34.87336349487305, "global_step": 115132, "epoch": 951} {"train_loss": -30.31206703186035, "global_step": 115133, "epoch": 951} {"train_loss": -31.306781768798828, "global_step": 115134, "epoch": 951} {"train_loss": -32.33250045776367, "global_step": 115135, "epoch": 951} {"train_loss": -22.10055923461914, "global_step": 115136, "epoch": 951} {"train_loss": -35.78081130981445, "global_step": 115137, "epoch": 951} {"train_loss": -31.216760635375977, "global_step": 115138, "epoch": 951} {"train_loss": -27.202199935913086, "global_step": 115139, "epoch": 951} {"train_loss": -32.73503494262695, "global_step": 115140, "epoch": 951} {"train_loss": -31.901844024658203, "global_step": 115141, "epoch": 951} {"train_loss": -31.827367782592773, "global_step": 115142, "epoch": 951} {"train_loss": -34.267791748046875, "global_step": 115143, "epoch": 951} {"train_loss": -32.323673248291016, "global_step": 115144, "epoch": 951} {"train_loss": -33.74164962768555, "global_step": 115145, "epoch": 951} {"train_loss": -34.17295455932617, "global_step": 115146, "epoch": 951} {"train_loss": -34.9415168762207, "global_step": 115147, "epoch": 951} {"train_loss": -34.77744674682617, "global_step": 115148, "epoch": 951} {"train_loss": -31.082181930541992, "global_step": 115149, "epoch": 951} {"train_loss": -35.490867614746094, "global_step": 115150, "epoch": 951} {"train_loss": -34.43333053588867, "global_step": 115151, "epoch": 951} {"train_loss": -35.65790557861328, "global_step": 115152, "epoch": 951} {"train_loss": -33.22092819213867, "global_step": 115153, "epoch": 951} {"train_loss": -35.123374938964844, "global_step": 115154, "epoch": 951} {"train_loss": -36.173606872558594, "global_step": 115155, "epoch": 951} {"train_loss": -36.71156692504883, "global_step": 115156, "epoch": 951} {"train_loss": -37.15130615234375, "global_step": 115157, "epoch": 951} {"train_loss": -36.488067626953125, "global_step": 115158, "epoch": 951} {"train_loss": -34.95441818237305, "global_step": 115159, "epoch": 951} {"train_loss": -35.681880950927734, "global_step": 115160, "epoch": 951} {"train_loss": -35.60776901245117, "global_step": 115161, "epoch": 951} {"train_loss": -35.64229965209961, "global_step": 115162, "epoch": 951} {"train_loss": -36.477901458740234, "global_step": 115163, "epoch": 951} {"train_loss": -35.22413635253906, "global_step": 115164, "epoch": 951} {"train_loss": -36.288246154785156, "global_step": 115165, "epoch": 951} {"train_loss": -37.03953552246094, "global_step": 115166, "epoch": 951} {"train_loss": -36.91355514526367, "global_step": 115167, "epoch": 951} {"train_loss": -36.79598617553711, "global_step": 115168, "epoch": 951} {"train_loss": -37.164119720458984, "global_step": 115169, "epoch": 951} {"train_loss": -36.720306396484375, "global_step": 115170, "epoch": 951} {"train_loss": -36.26426315307617, "global_step": 115171, "epoch": 951} {"train_loss": -36.16750717163086, "global_step": 115172, "epoch": 951} {"train_loss": -37.4599723815918, "global_step": 115173, "epoch": 951} {"train_loss": -36.60622024536133, "global_step": 115174, "epoch": 951} {"train_loss": -37.04856491088867, "global_step": 115175, "epoch": 951} {"train_loss": -37.577880859375, "global_step": 115176, "epoch": 951} {"train_loss": -37.69999313354492, "global_step": 115177, "epoch": 951} {"train_loss": -37.30846405029297, "global_step": 115178, "epoch": 951} {"train_loss": -37.14881896972656, "global_step": 115179, "epoch": 951} {"train_loss": -37.46635055541992, "global_step": 115180, "epoch": 951} {"train_loss": -37.888912200927734, "global_step": 115181, "epoch": 951} {"train_loss": -37.71052169799805, "global_step": 115182, "epoch": 951} {"train_loss": -37.848175048828125, "global_step": 115183, "epoch": 951} {"train_loss": -36.91411209106445, "global_step": 115184, "epoch": 951} {"train_loss": -37.627708435058594, "global_step": 115185, "epoch": 951} {"train_loss": -38.26028823852539, "global_step": 115186, "epoch": 951} {"train_loss": -37.79396438598633, "global_step": 115187, "epoch": 951} {"train_loss": -37.808597564697266, "global_step": 115188, "epoch": 951} {"train_loss": -37.92566680908203, "global_step": 115189, "epoch": 951} {"train_loss": -38.095245361328125, "global_step": 115190, "epoch": 951} {"train_loss": -36.567703199780674, "global_step": 115191, "epoch": 951, "val_loss": 2613959.0} {"train_loss": -37.86208724975586, "global_step": 115192, "epoch": 952} {"train_loss": -38.29030227661133, "global_step": 115193, "epoch": 952} {"train_loss": -38.02120590209961, "global_step": 115194, "epoch": 952} {"train_loss": -37.66752243041992, "global_step": 115195, "epoch": 952} {"train_loss": -37.787654876708984, "global_step": 115196, "epoch": 952} {"train_loss": -38.21825408935547, "global_step": 115197, "epoch": 952} {"train_loss": -37.9445915222168, "global_step": 115198, "epoch": 952} {"train_loss": -37.3065071105957, "global_step": 115199, "epoch": 952} {"train_loss": -38.70168685913086, "global_step": 115200, "epoch": 952} {"train_loss": -37.795066833496094, "global_step": 115201, "epoch": 952} {"train_loss": -38.47198486328125, "global_step": 115202, "epoch": 952} {"train_loss": -37.81925582885742, "global_step": 115203, "epoch": 952} {"train_loss": -38.318702697753906, "global_step": 115204, "epoch": 952} {"train_loss": -38.07586669921875, "global_step": 115205, "epoch": 952} {"train_loss": -38.36815643310547, "global_step": 115206, "epoch": 952} {"train_loss": -38.505191802978516, "global_step": 115207, "epoch": 952} {"train_loss": -38.55149459838867, "global_step": 115208, "epoch": 952} {"train_loss": -38.79475021362305, "global_step": 115209, "epoch": 952} {"train_loss": -38.996822357177734, "global_step": 115210, "epoch": 952} {"train_loss": -38.51948928833008, "global_step": 115211, "epoch": 952} {"train_loss": -38.53519821166992, "global_step": 115212, "epoch": 952} {"train_loss": -38.609127044677734, "global_step": 115213, "epoch": 952} {"train_loss": -38.771724700927734, "global_step": 115214, "epoch": 952} {"train_loss": -38.81504440307617, "global_step": 115215, "epoch": 952} {"train_loss": -38.90711212158203, "global_step": 115216, "epoch": 952} {"train_loss": -38.62691116333008, "global_step": 115217, "epoch": 952} {"train_loss": -38.742733001708984, "global_step": 115218, "epoch": 952} {"train_loss": -38.805206298828125, "global_step": 115219, "epoch": 952} {"train_loss": -37.2146110534668, "global_step": 115220, "epoch": 952} {"train_loss": -38.20319747924805, "global_step": 115221, "epoch": 952} {"train_loss": -38.060821533203125, "global_step": 115222, "epoch": 952} {"train_loss": -37.59340286254883, "global_step": 115223, "epoch": 952} {"train_loss": -38.97806930541992, "global_step": 115224, "epoch": 952} {"train_loss": -38.6198616027832, "global_step": 115225, "epoch": 952} {"train_loss": -38.51508712768555, "global_step": 115226, "epoch": 952} {"train_loss": -38.34674072265625, "global_step": 115227, "epoch": 952} {"train_loss": -38.75856018066406, "global_step": 115228, "epoch": 952} {"train_loss": -39.008052825927734, "global_step": 115229, "epoch": 952} {"train_loss": -38.598140716552734, "global_step": 115230, "epoch": 952} {"train_loss": -38.43623352050781, "global_step": 115231, "epoch": 952} {"train_loss": -38.77492904663086, "global_step": 115232, "epoch": 952} {"train_loss": -37.76328659057617, "global_step": 115233, "epoch": 952} {"train_loss": -38.19970703125, "global_step": 115234, "epoch": 952} {"train_loss": -39.66213607788086, "global_step": 115235, "epoch": 952} {"train_loss": -37.0510139465332, "global_step": 115236, "epoch": 952} {"train_loss": -35.61209487915039, "global_step": 115237, "epoch": 952} {"train_loss": -37.41244888305664, "global_step": 115238, "epoch": 952} {"train_loss": -39.21955490112305, "global_step": 115239, "epoch": 952} {"train_loss": -36.93916702270508, "global_step": 115240, "epoch": 952} {"train_loss": -35.40795135498047, "global_step": 115241, "epoch": 952} {"train_loss": -38.05131912231445, "global_step": 115242, "epoch": 952} {"train_loss": -38.13492965698242, "global_step": 115243, "epoch": 952} {"train_loss": -34.85685348510742, "global_step": 115244, "epoch": 952} {"train_loss": -38.734100341796875, "global_step": 115245, "epoch": 952} {"train_loss": -37.641597747802734, "global_step": 115246, "epoch": 952} {"train_loss": -38.36719512939453, "global_step": 115247, "epoch": 952} {"train_loss": -37.30546951293945, "global_step": 115248, "epoch": 952} {"train_loss": -36.79838180541992, "global_step": 115249, "epoch": 952} {"train_loss": -39.07652282714844, "global_step": 115250, "epoch": 952} {"train_loss": -36.771240234375, "global_step": 115251, "epoch": 952} {"train_loss": -37.0148811340332, "global_step": 115252, "epoch": 952} {"train_loss": -36.458065032958984, "global_step": 115253, "epoch": 952} {"train_loss": -37.09182357788086, "global_step": 115254, "epoch": 952} {"train_loss": -37.731075286865234, "global_step": 115255, "epoch": 952} {"train_loss": -37.90913009643555, "global_step": 115256, "epoch": 952} {"train_loss": -37.16501998901367, "global_step": 115257, "epoch": 952} {"train_loss": -38.44883346557617, "global_step": 115258, "epoch": 952} {"train_loss": -36.955692291259766, "global_step": 115259, "epoch": 952} {"train_loss": -38.0880241394043, "global_step": 115260, "epoch": 952} {"train_loss": -37.37202835083008, "global_step": 115261, "epoch": 952} {"train_loss": -38.000244140625, "global_step": 115262, "epoch": 952} {"train_loss": -37.11151123046875, "global_step": 115263, "epoch": 952} {"train_loss": -37.2378044128418, "global_step": 115264, "epoch": 952} {"train_loss": -37.67197799682617, "global_step": 115265, "epoch": 952} {"train_loss": -37.24259948730469, "global_step": 115266, "epoch": 952} {"train_loss": -38.06690216064453, "global_step": 115267, "epoch": 952} {"train_loss": -37.481807708740234, "global_step": 115268, "epoch": 952} {"train_loss": -38.30173873901367, "global_step": 115269, "epoch": 952} {"train_loss": -37.97821807861328, "global_step": 115270, "epoch": 952} {"train_loss": -38.20692825317383, "global_step": 115271, "epoch": 952} {"train_loss": -38.54010772705078, "global_step": 115272, "epoch": 952} {"train_loss": -38.78666305541992, "global_step": 115273, "epoch": 952} {"train_loss": -37.82106399536133, "global_step": 115274, "epoch": 952} {"train_loss": -37.516841888427734, "global_step": 115275, "epoch": 952} {"train_loss": -38.359317779541016, "global_step": 115276, "epoch": 952} {"train_loss": -37.601661682128906, "global_step": 115277, "epoch": 952} {"train_loss": -38.73688888549805, "global_step": 115278, "epoch": 952} {"train_loss": -38.54660415649414, "global_step": 115279, "epoch": 952} {"train_loss": -39.40187454223633, "global_step": 115280, "epoch": 952} {"train_loss": -38.70427322387695, "global_step": 115281, "epoch": 952} {"train_loss": -38.36751174926758, "global_step": 115282, "epoch": 952} {"train_loss": -39.29351806640625, "global_step": 115283, "epoch": 952} {"train_loss": -38.25751876831055, "global_step": 115284, "epoch": 952} {"train_loss": -38.86686325073242, "global_step": 115285, "epoch": 952} {"train_loss": -39.184051513671875, "global_step": 115286, "epoch": 952} {"train_loss": -38.7443962097168, "global_step": 115287, "epoch": 952} {"train_loss": -39.363800048828125, "global_step": 115288, "epoch": 952} {"train_loss": -39.154293060302734, "global_step": 115289, "epoch": 952} {"train_loss": -39.07608413696289, "global_step": 115290, "epoch": 952} {"train_loss": -38.69828414916992, "global_step": 115291, "epoch": 952} {"train_loss": -38.72408676147461, "global_step": 115292, "epoch": 952} {"train_loss": -38.6817512512207, "global_step": 115293, "epoch": 952} {"train_loss": -38.91144561767578, "global_step": 115294, "epoch": 952} {"train_loss": -38.85809326171875, "global_step": 115295, "epoch": 952} {"train_loss": -39.0069694519043, "global_step": 115296, "epoch": 952} {"train_loss": -39.40031051635742, "global_step": 115297, "epoch": 952} {"train_loss": -38.88386917114258, "global_step": 115298, "epoch": 952} {"train_loss": -38.813533782958984, "global_step": 115299, "epoch": 952} {"train_loss": -39.17014694213867, "global_step": 115300, "epoch": 952} {"train_loss": -39.425392150878906, "global_step": 115301, "epoch": 952} {"train_loss": -38.86363220214844, "global_step": 115302, "epoch": 952} {"train_loss": -39.45993423461914, "global_step": 115303, "epoch": 952} {"train_loss": -39.28103256225586, "global_step": 115304, "epoch": 952} {"train_loss": -39.065704345703125, "global_step": 115305, "epoch": 952} {"train_loss": -38.7200927734375, "global_step": 115306, "epoch": 952} {"train_loss": -39.67795944213867, "global_step": 115307, "epoch": 952} {"train_loss": -39.04159164428711, "global_step": 115308, "epoch": 952} {"train_loss": -39.689125061035156, "global_step": 115309, "epoch": 952} {"train_loss": -39.097713470458984, "global_step": 115310, "epoch": 952} {"train_loss": -39.50495147705078, "global_step": 115311, "epoch": 952} {"train_loss": -38.2839067947766, "global_step": 115312, "epoch": 952, "val_loss": 2543601.25} {"train_loss": -38.870323181152344, "global_step": 115313, "epoch": 953} {"train_loss": -38.65079879760742, "global_step": 115314, "epoch": 953} {"train_loss": -39.6497917175293, "global_step": 115315, "epoch": 953} {"train_loss": -39.70305252075195, "global_step": 115316, "epoch": 953} {"train_loss": -38.48287582397461, "global_step": 115317, "epoch": 953} {"train_loss": -38.98503112792969, "global_step": 115318, "epoch": 953} {"train_loss": -38.715858459472656, "global_step": 115319, "epoch": 953} {"train_loss": -38.3315315246582, "global_step": 115320, "epoch": 953} {"train_loss": -38.20566940307617, "global_step": 115321, "epoch": 953} {"train_loss": -38.62964630126953, "global_step": 115322, "epoch": 953} {"train_loss": -38.50020217895508, "global_step": 115323, "epoch": 953} {"train_loss": -38.38387680053711, "global_step": 115324, "epoch": 953} {"train_loss": -37.40235137939453, "global_step": 115325, "epoch": 953} {"train_loss": -36.75141525268555, "global_step": 115326, "epoch": 953} {"train_loss": -37.733882904052734, "global_step": 115327, "epoch": 953} {"train_loss": -36.47286605834961, "global_step": 115328, "epoch": 953} {"train_loss": -35.329891204833984, "global_step": 115329, "epoch": 953} {"train_loss": -38.431297302246094, "global_step": 115330, "epoch": 953} {"train_loss": -39.67110824584961, "global_step": 115331, "epoch": 953} {"train_loss": -37.303245544433594, "global_step": 115332, "epoch": 953} {"train_loss": -36.40717315673828, "global_step": 115333, "epoch": 953} {"train_loss": -38.4361686706543, "global_step": 115334, "epoch": 953} {"train_loss": -39.187408447265625, "global_step": 115335, "epoch": 953} {"train_loss": -39.39111328125, "global_step": 115336, "epoch": 953} {"train_loss": -38.99634552001953, "global_step": 115337, "epoch": 953} {"train_loss": -39.16987228393555, "global_step": 115338, "epoch": 953} {"train_loss": -38.53697204589844, "global_step": 115339, "epoch": 953} {"train_loss": -39.032466888427734, "global_step": 115340, "epoch": 953} {"train_loss": -37.32046127319336, "global_step": 115341, "epoch": 953} {"train_loss": -38.93892288208008, "global_step": 115342, "epoch": 953} {"train_loss": -37.53557205200195, "global_step": 115343, "epoch": 953} {"train_loss": -36.24087142944336, "global_step": 115344, "epoch": 953} {"train_loss": -39.59601593017578, "global_step": 115345, "epoch": 953} {"train_loss": -37.975711822509766, "global_step": 115346, "epoch": 953} {"train_loss": -39.063777923583984, "global_step": 115347, "epoch": 953} {"train_loss": -38.610206604003906, "global_step": 115348, "epoch": 953} {"train_loss": -38.50741195678711, "global_step": 115349, "epoch": 953} {"train_loss": -38.70174789428711, "global_step": 115350, "epoch": 953} {"train_loss": -38.22101593017578, "global_step": 115351, "epoch": 953} {"train_loss": -38.88235092163086, "global_step": 115352, "epoch": 953} {"train_loss": -39.5589714050293, "global_step": 115353, "epoch": 953} {"train_loss": -37.93342971801758, "global_step": 115354, "epoch": 953} {"train_loss": -39.0048942565918, "global_step": 115355, "epoch": 953} {"train_loss": -37.93963623046875, "global_step": 115356, "epoch": 953} {"train_loss": -38.748077392578125, "global_step": 115357, "epoch": 953} {"train_loss": -36.96161651611328, "global_step": 115358, "epoch": 953} {"train_loss": -38.62983703613281, "global_step": 115359, "epoch": 953} {"train_loss": -38.64296340942383, "global_step": 115360, "epoch": 953} {"train_loss": -37.77625274658203, "global_step": 115361, "epoch": 953} {"train_loss": -37.68670654296875, "global_step": 115362, "epoch": 953} {"train_loss": -38.17237091064453, "global_step": 115363, "epoch": 953} {"train_loss": -38.88583755493164, "global_step": 115364, "epoch": 953} {"train_loss": -38.74722671508789, "global_step": 115365, "epoch": 953} {"train_loss": -38.45534133911133, "global_step": 115366, "epoch": 953} {"train_loss": -38.4100456237793, "global_step": 115367, "epoch": 953} {"train_loss": -39.40616989135742, "global_step": 115368, "epoch": 953} {"train_loss": -39.605899810791016, "global_step": 115369, "epoch": 953} {"train_loss": -39.651641845703125, "global_step": 115370, "epoch": 953} {"train_loss": -39.00167465209961, "global_step": 115371, "epoch": 953} {"train_loss": -39.14482879638672, "global_step": 115372, "epoch": 953} {"train_loss": -39.07529830932617, "global_step": 115373, "epoch": 953} {"train_loss": -39.4666748046875, "global_step": 115374, "epoch": 953} {"train_loss": -38.6924934387207, "global_step": 115375, "epoch": 953} {"train_loss": -38.57879638671875, "global_step": 115376, "epoch": 953} {"train_loss": -38.970367431640625, "global_step": 115377, "epoch": 953} {"train_loss": -39.5687141418457, "global_step": 115378, "epoch": 953} {"train_loss": -38.979957580566406, "global_step": 115379, "epoch": 953} {"train_loss": -38.490211486816406, "global_step": 115380, "epoch": 953} {"train_loss": -39.73641586303711, "global_step": 115381, "epoch": 953} {"train_loss": -38.99135971069336, "global_step": 115382, "epoch": 953} {"train_loss": -37.667781829833984, "global_step": 115383, "epoch": 953} {"train_loss": -39.00875473022461, "global_step": 115384, "epoch": 953} {"train_loss": -39.80179977416992, "global_step": 115385, "epoch": 953} {"train_loss": -39.2884635925293, "global_step": 115386, "epoch": 953} {"train_loss": -38.93711471557617, "global_step": 115387, "epoch": 953} {"train_loss": -39.10226821899414, "global_step": 115388, "epoch": 953} {"train_loss": -38.39943313598633, "global_step": 115389, "epoch": 953} {"train_loss": -38.13691329956055, "global_step": 115390, "epoch": 953} {"train_loss": -37.880859375, "global_step": 115391, "epoch": 953} {"train_loss": -38.9183349609375, "global_step": 115392, "epoch": 953} {"train_loss": -39.205230712890625, "global_step": 115393, "epoch": 953} {"train_loss": -38.779327392578125, "global_step": 115394, "epoch": 953} {"train_loss": -36.53953170776367, "global_step": 115395, "epoch": 953} {"train_loss": -37.621395111083984, "global_step": 115396, "epoch": 953} {"train_loss": -38.2271614074707, "global_step": 115397, "epoch": 953} {"train_loss": -38.65977096557617, "global_step": 115398, "epoch": 953} {"train_loss": -39.04256820678711, "global_step": 115399, "epoch": 953} {"train_loss": -38.82111358642578, "global_step": 115400, "epoch": 953} {"train_loss": -38.531978607177734, "global_step": 115401, "epoch": 953} {"train_loss": -38.343238830566406, "global_step": 115402, "epoch": 953} {"train_loss": -36.04136276245117, "global_step": 115403, "epoch": 953} {"train_loss": -37.634971618652344, "global_step": 115404, "epoch": 953} {"train_loss": -37.690101623535156, "global_step": 115405, "epoch": 953} {"train_loss": -39.01856231689453, "global_step": 115406, "epoch": 953} {"train_loss": -38.840003967285156, "global_step": 115407, "epoch": 953} {"train_loss": -36.61751937866211, "global_step": 115408, "epoch": 953} {"train_loss": -37.397621154785156, "global_step": 115409, "epoch": 953} {"train_loss": -38.6796989440918, "global_step": 115410, "epoch": 953} {"train_loss": -37.615535736083984, "global_step": 115411, "epoch": 953} {"train_loss": -38.838462829589844, "global_step": 115412, "epoch": 953} {"train_loss": -38.498775482177734, "global_step": 115413, "epoch": 953} {"train_loss": -38.351409912109375, "global_step": 115414, "epoch": 953} {"train_loss": -37.57581329345703, "global_step": 115415, "epoch": 953} {"train_loss": -37.34934616088867, "global_step": 115416, "epoch": 953} {"train_loss": -38.828914642333984, "global_step": 115417, "epoch": 953} {"train_loss": -37.882301330566406, "global_step": 115418, "epoch": 953} {"train_loss": -38.66922378540039, "global_step": 115419, "epoch": 953} {"train_loss": -35.46553421020508, "global_step": 115420, "epoch": 953} {"train_loss": -39.28196334838867, "global_step": 115421, "epoch": 953} {"train_loss": -37.67444610595703, "global_step": 115422, "epoch": 953} {"train_loss": -39.249786376953125, "global_step": 115423, "epoch": 953} {"train_loss": -38.279354095458984, "global_step": 115424, "epoch": 953} {"train_loss": -39.17405319213867, "global_step": 115425, "epoch": 953} {"train_loss": -38.86664962768555, "global_step": 115426, "epoch": 953} {"train_loss": -39.07680130004883, "global_step": 115427, "epoch": 953} {"train_loss": -38.87428665161133, "global_step": 115428, "epoch": 953} {"train_loss": -38.8128662109375, "global_step": 115429, "epoch": 953} {"train_loss": -39.29270935058594, "global_step": 115430, "epoch": 953} {"train_loss": -38.55912399291992, "global_step": 115431, "epoch": 953} {"train_loss": -39.78947067260742, "global_step": 115432, "epoch": 953} {"train_loss": -38.46021072135484, "global_step": 115433, "epoch": 953, "val_loss": 2588407.5} {"train_loss": -38.81007766723633, "global_step": 115434, "epoch": 954} {"train_loss": -38.90995407104492, "global_step": 115435, "epoch": 954} {"train_loss": -39.020263671875, "global_step": 115436, "epoch": 954} {"train_loss": -39.44901657104492, "global_step": 115437, "epoch": 954} {"train_loss": -38.9373893737793, "global_step": 115438, "epoch": 954} {"train_loss": -39.217708587646484, "global_step": 115439, "epoch": 954} {"train_loss": -38.823238372802734, "global_step": 115440, "epoch": 954} {"train_loss": -39.29041290283203, "global_step": 115441, "epoch": 954} {"train_loss": -39.597938537597656, "global_step": 115442, "epoch": 954} {"train_loss": -38.70588684082031, "global_step": 115443, "epoch": 954} {"train_loss": -39.165809631347656, "global_step": 115444, "epoch": 954} {"train_loss": -37.64684295654297, "global_step": 115445, "epoch": 954} {"train_loss": -39.030025482177734, "global_step": 115446, "epoch": 954} {"train_loss": -38.44683837890625, "global_step": 115447, "epoch": 954} {"train_loss": -39.281524658203125, "global_step": 115448, "epoch": 954} {"train_loss": -39.142181396484375, "global_step": 115449, "epoch": 954} {"train_loss": -39.550697326660156, "global_step": 115450, "epoch": 954} {"train_loss": -39.872745513916016, "global_step": 115451, "epoch": 954} {"train_loss": -38.2584114074707, "global_step": 115452, "epoch": 954} {"train_loss": -39.5805778503418, "global_step": 115453, "epoch": 954} {"train_loss": -39.52130126953125, "global_step": 115454, "epoch": 954} {"train_loss": -40.35709762573242, "global_step": 115455, "epoch": 954} {"train_loss": -39.82936477661133, "global_step": 115456, "epoch": 954} {"train_loss": -39.0709114074707, "global_step": 115457, "epoch": 954} {"train_loss": -39.472923278808594, "global_step": 115458, "epoch": 954} {"train_loss": -39.059898376464844, "global_step": 115459, "epoch": 954} {"train_loss": -39.46110916137695, "global_step": 115460, "epoch": 954} {"train_loss": -39.287025451660156, "global_step": 115461, "epoch": 954} {"train_loss": -39.99061965942383, "global_step": 115462, "epoch": 954} {"train_loss": -39.342926025390625, "global_step": 115463, "epoch": 954} {"train_loss": -39.133453369140625, "global_step": 115464, "epoch": 954} {"train_loss": -38.635189056396484, "global_step": 115465, "epoch": 954} {"train_loss": -38.24620056152344, "global_step": 115466, "epoch": 954} {"train_loss": -37.8134880065918, "global_step": 115467, "epoch": 954} {"train_loss": -37.334415435791016, "global_step": 115468, "epoch": 954} {"train_loss": -37.06516647338867, "global_step": 115469, "epoch": 954} {"train_loss": -37.312591552734375, "global_step": 115470, "epoch": 954} {"train_loss": -35.95048522949219, "global_step": 115471, "epoch": 954} {"train_loss": -39.11656951904297, "global_step": 115472, "epoch": 954} {"train_loss": -38.888431549072266, "global_step": 115473, "epoch": 954} {"train_loss": -39.50410079956055, "global_step": 115474, "epoch": 954} {"train_loss": -39.29624557495117, "global_step": 115475, "epoch": 954} {"train_loss": -39.283721923828125, "global_step": 115476, "epoch": 954} {"train_loss": -38.48896026611328, "global_step": 115477, "epoch": 954} {"train_loss": -39.38656234741211, "global_step": 115478, "epoch": 954} {"train_loss": -37.42768478393555, "global_step": 115479, "epoch": 954} {"train_loss": -39.51874923706055, "global_step": 115480, "epoch": 954} {"train_loss": -39.036956787109375, "global_step": 115481, "epoch": 954} {"train_loss": -36.711158752441406, "global_step": 115482, "epoch": 954} {"train_loss": -37.681312561035156, "global_step": 115483, "epoch": 954} {"train_loss": -39.04848861694336, "global_step": 115484, "epoch": 954} {"train_loss": -37.202415466308594, "global_step": 115485, "epoch": 954} {"train_loss": -37.3564338684082, "global_step": 115486, "epoch": 954} {"train_loss": -38.273956298828125, "global_step": 115487, "epoch": 954} {"train_loss": -39.21112823486328, "global_step": 115488, "epoch": 954} {"train_loss": -39.2763786315918, "global_step": 115489, "epoch": 954} {"train_loss": -38.68751907348633, "global_step": 115490, "epoch": 954} {"train_loss": -39.553504943847656, "global_step": 115491, "epoch": 954} {"train_loss": -38.997615814208984, "global_step": 115492, "epoch": 954} {"train_loss": -38.152278900146484, "global_step": 115493, "epoch": 954} {"train_loss": -38.1019287109375, "global_step": 115494, "epoch": 954} {"train_loss": -38.08696746826172, "global_step": 115495, "epoch": 954} {"train_loss": -37.23938751220703, "global_step": 115496, "epoch": 954} {"train_loss": -38.94532012939453, "global_step": 115497, "epoch": 954} {"train_loss": -39.06855773925781, "global_step": 115498, "epoch": 954} {"train_loss": -35.42659378051758, "global_step": 115499, "epoch": 954} {"train_loss": -38.699859619140625, "global_step": 115500, "epoch": 954} {"train_loss": -36.45415115356445, "global_step": 115501, "epoch": 954} {"train_loss": -37.700477600097656, "global_step": 115502, "epoch": 954} {"train_loss": -37.6191520690918, "global_step": 115503, "epoch": 954} {"train_loss": -38.018592834472656, "global_step": 115504, "epoch": 954} {"train_loss": -38.96274185180664, "global_step": 115505, "epoch": 954} {"train_loss": -37.73666763305664, "global_step": 115506, "epoch": 954} {"train_loss": -38.22528839111328, "global_step": 115507, "epoch": 954} {"train_loss": -38.3272819519043, "global_step": 115508, "epoch": 954} {"train_loss": -38.52156448364258, "global_step": 115509, "epoch": 954} {"train_loss": -38.525848388671875, "global_step": 115510, "epoch": 954} {"train_loss": -38.74317169189453, "global_step": 115511, "epoch": 954} {"train_loss": -38.473140716552734, "global_step": 115512, "epoch": 954} {"train_loss": -39.69175338745117, "global_step": 115513, "epoch": 954} {"train_loss": -38.79463577270508, "global_step": 115514, "epoch": 954} {"train_loss": -39.06705856323242, "global_step": 115515, "epoch": 954} {"train_loss": -39.312835693359375, "global_step": 115516, "epoch": 954} {"train_loss": -37.80316162109375, "global_step": 115517, "epoch": 954} {"train_loss": -39.55094909667969, "global_step": 115518, "epoch": 954} {"train_loss": -38.949676513671875, "global_step": 115519, "epoch": 954} {"train_loss": -39.2050666809082, "global_step": 115520, "epoch": 954} {"train_loss": -39.9661979675293, "global_step": 115521, "epoch": 954} {"train_loss": -38.81298828125, "global_step": 115522, "epoch": 954} {"train_loss": -39.50014877319336, "global_step": 115523, "epoch": 954} {"train_loss": -38.2428092956543, "global_step": 115524, "epoch": 954} {"train_loss": -39.35634231567383, "global_step": 115525, "epoch": 954} {"train_loss": -39.41552734375, "global_step": 115526, "epoch": 954} {"train_loss": -39.039588928222656, "global_step": 115527, "epoch": 954} {"train_loss": -39.89142608642578, "global_step": 115528, "epoch": 954} {"train_loss": -39.089481353759766, "global_step": 115529, "epoch": 954} {"train_loss": -40.01055908203125, "global_step": 115530, "epoch": 954} {"train_loss": -39.50416946411133, "global_step": 115531, "epoch": 954} {"train_loss": -38.93788528442383, "global_step": 115532, "epoch": 954} {"train_loss": -39.936126708984375, "global_step": 115533, "epoch": 954} {"train_loss": -39.61587905883789, "global_step": 115534, "epoch": 954} {"train_loss": -39.869110107421875, "global_step": 115535, "epoch": 954} {"train_loss": -39.0747184753418, "global_step": 115536, "epoch": 954} {"train_loss": -38.37661361694336, "global_step": 115537, "epoch": 954} {"train_loss": -39.474525451660156, "global_step": 115538, "epoch": 954} {"train_loss": -40.09720993041992, "global_step": 115539, "epoch": 954} {"train_loss": -39.17047119140625, "global_step": 115540, "epoch": 954} {"train_loss": -39.44758224487305, "global_step": 115541, "epoch": 954} {"train_loss": -39.302608489990234, "global_step": 115542, "epoch": 954} {"train_loss": -39.15253448486328, "global_step": 115543, "epoch": 954} {"train_loss": -38.14585494995117, "global_step": 115544, "epoch": 954} {"train_loss": -38.46726989746094, "global_step": 115545, "epoch": 954} {"train_loss": -37.22355270385742, "global_step": 115546, "epoch": 954} {"train_loss": -38.521087646484375, "global_step": 115547, "epoch": 954} {"train_loss": -38.39253234863281, "global_step": 115548, "epoch": 954} {"train_loss": -38.04653549194336, "global_step": 115549, "epoch": 954} {"train_loss": -36.11686325073242, "global_step": 115550, "epoch": 954} {"train_loss": -37.98080062866211, "global_step": 115551, "epoch": 954} {"train_loss": -39.071861267089844, "global_step": 115552, "epoch": 954} {"train_loss": -39.198524475097656, "global_step": 115553, "epoch": 954} {"train_loss": -38.73690045569554, "global_step": 115554, "epoch": 954, "val_loss": 2680837.75} {"train_loss": -38.46577835083008, "global_step": 115555, "epoch": 955} {"train_loss": -38.433021545410156, "global_step": 115556, "epoch": 955} {"train_loss": -38.31867218017578, "global_step": 115557, "epoch": 955} {"train_loss": -39.23802947998047, "global_step": 115558, "epoch": 955} {"train_loss": -39.97391891479492, "global_step": 115559, "epoch": 955} {"train_loss": -38.78597640991211, "global_step": 115560, "epoch": 955} {"train_loss": -38.68927001953125, "global_step": 115561, "epoch": 955} {"train_loss": -38.54697799682617, "global_step": 115562, "epoch": 955} {"train_loss": -36.988441467285156, "global_step": 115563, "epoch": 955} {"train_loss": -37.14204788208008, "global_step": 115564, "epoch": 955} {"train_loss": -38.314151763916016, "global_step": 115565, "epoch": 955} {"train_loss": -39.26533889770508, "global_step": 115566, "epoch": 955} {"train_loss": -39.09711456298828, "global_step": 115567, "epoch": 955} {"train_loss": -39.17719268798828, "global_step": 115568, "epoch": 955} {"train_loss": -38.690311431884766, "global_step": 115569, "epoch": 955} {"train_loss": -39.44810104370117, "global_step": 115570, "epoch": 955} {"train_loss": -38.97604751586914, "global_step": 115571, "epoch": 955} {"train_loss": -39.866878509521484, "global_step": 115572, "epoch": 955} {"train_loss": -39.1448974609375, "global_step": 115573, "epoch": 955} {"train_loss": -39.62333297729492, "global_step": 115574, "epoch": 955} {"train_loss": -39.294639587402344, "global_step": 115575, "epoch": 955} {"train_loss": -39.76908493041992, "global_step": 115576, "epoch": 955} {"train_loss": -40.11298751831055, "global_step": 115577, "epoch": 955} {"train_loss": -39.47490310668945, "global_step": 115578, "epoch": 955} {"train_loss": -39.85956954956055, "global_step": 115579, "epoch": 955} {"train_loss": -39.60044479370117, "global_step": 115580, "epoch": 955} {"train_loss": -39.63706588745117, "global_step": 115581, "epoch": 955} {"train_loss": -39.1213493347168, "global_step": 115582, "epoch": 955} {"train_loss": -37.73696517944336, "global_step": 115583, "epoch": 955} {"train_loss": -37.257789611816406, "global_step": 115584, "epoch": 955} {"train_loss": -35.27923583984375, "global_step": 115585, "epoch": 955} {"train_loss": -34.838741302490234, "global_step": 115586, "epoch": 955} {"train_loss": -39.79095458984375, "global_step": 115587, "epoch": 955} {"train_loss": -37.242591857910156, "global_step": 115588, "epoch": 955} {"train_loss": -37.353450775146484, "global_step": 115589, "epoch": 955} {"train_loss": -39.16831588745117, "global_step": 115590, "epoch": 955} {"train_loss": -38.245235443115234, "global_step": 115591, "epoch": 955} {"train_loss": -37.88798904418945, "global_step": 115592, "epoch": 955} {"train_loss": -38.88778305053711, "global_step": 115593, "epoch": 955} {"train_loss": -38.88302230834961, "global_step": 115594, "epoch": 955} {"train_loss": -39.16184997558594, "global_step": 115595, "epoch": 955} {"train_loss": -39.248165130615234, "global_step": 115596, "epoch": 955} {"train_loss": -39.629695892333984, "global_step": 115597, "epoch": 955} {"train_loss": -39.15073776245117, "global_step": 115598, "epoch": 955} {"train_loss": -39.578609466552734, "global_step": 115599, "epoch": 955} {"train_loss": -39.09089279174805, "global_step": 115600, "epoch": 955} {"train_loss": -39.112178802490234, "global_step": 115601, "epoch": 955} {"train_loss": -39.746334075927734, "global_step": 115602, "epoch": 955} {"train_loss": -38.89852523803711, "global_step": 115603, "epoch": 955} {"train_loss": -40.41155242919922, "global_step": 115604, "epoch": 955} {"train_loss": -39.44596481323242, "global_step": 115605, "epoch": 955} {"train_loss": -40.0977668762207, "global_step": 115606, "epoch": 955} {"train_loss": -39.3614387512207, "global_step": 115607, "epoch": 955} {"train_loss": -39.37978744506836, "global_step": 115608, "epoch": 955} {"train_loss": -39.94699478149414, "global_step": 115609, "epoch": 955} {"train_loss": -39.22423553466797, "global_step": 115610, "epoch": 955} {"train_loss": -40.186344146728516, "global_step": 115611, "epoch": 955} {"train_loss": -39.5933952331543, "global_step": 115612, "epoch": 955} {"train_loss": -40.19620132446289, "global_step": 115613, "epoch": 955} {"train_loss": -39.874359130859375, "global_step": 115614, "epoch": 955} {"train_loss": -39.31383514404297, "global_step": 115615, "epoch": 955} {"train_loss": -39.87374496459961, "global_step": 115616, "epoch": 955} {"train_loss": -39.00948715209961, "global_step": 115617, "epoch": 955} {"train_loss": -38.38762283325195, "global_step": 115618, "epoch": 955} {"train_loss": -36.235260009765625, "global_step": 115619, "epoch": 955} {"train_loss": -34.97630310058594, "global_step": 115620, "epoch": 955} {"train_loss": -34.6856575012207, "global_step": 115621, "epoch": 955} {"train_loss": -35.84597396850586, "global_step": 115622, "epoch": 955} {"train_loss": -38.37748336791992, "global_step": 115623, "epoch": 955} {"train_loss": -38.69975662231445, "global_step": 115624, "epoch": 955} {"train_loss": -36.30829620361328, "global_step": 115625, "epoch": 955} {"train_loss": -32.990814208984375, "global_step": 115626, "epoch": 955} {"train_loss": -35.26555633544922, "global_step": 115627, "epoch": 955} {"train_loss": -37.643638610839844, "global_step": 115628, "epoch": 955} {"train_loss": -35.5126953125, "global_step": 115629, "epoch": 955} {"train_loss": -35.82712936401367, "global_step": 115630, "epoch": 955} {"train_loss": -36.7523078918457, "global_step": 115631, "epoch": 955} {"train_loss": -36.9571418762207, "global_step": 115632, "epoch": 955} {"train_loss": -38.121089935302734, "global_step": 115633, "epoch": 955} {"train_loss": -30.4553279876709, "global_step": 115634, "epoch": 955} {"train_loss": -36.28242111206055, "global_step": 115635, "epoch": 955} {"train_loss": -37.71803665161133, "global_step": 115636, "epoch": 955} {"train_loss": -36.140533447265625, "global_step": 115637, "epoch": 955} {"train_loss": -36.85129928588867, "global_step": 115638, "epoch": 955} {"train_loss": -37.8936767578125, "global_step": 115639, "epoch": 955} {"train_loss": -37.0464973449707, "global_step": 115640, "epoch": 955} {"train_loss": -37.00269317626953, "global_step": 115641, "epoch": 955} {"train_loss": -37.92600631713867, "global_step": 115642, "epoch": 955} {"train_loss": -34.702186584472656, "global_step": 115643, "epoch": 955} {"train_loss": -37.03670883178711, "global_step": 115644, "epoch": 955} {"train_loss": -36.65022659301758, "global_step": 115645, "epoch": 955} {"train_loss": -38.05447769165039, "global_step": 115646, "epoch": 955} {"train_loss": -34.47564697265625, "global_step": 115647, "epoch": 955} {"train_loss": -37.26639938354492, "global_step": 115648, "epoch": 955} {"train_loss": -36.666927337646484, "global_step": 115649, "epoch": 955} {"train_loss": -37.23795700073242, "global_step": 115650, "epoch": 955} {"train_loss": -37.5721435546875, "global_step": 115651, "epoch": 955} {"train_loss": -37.67694854736328, "global_step": 115652, "epoch": 955} {"train_loss": -38.099491119384766, "global_step": 115653, "epoch": 955} {"train_loss": -36.946861267089844, "global_step": 115654, "epoch": 955} {"train_loss": -37.994380950927734, "global_step": 115655, "epoch": 955} {"train_loss": -37.92746353149414, "global_step": 115656, "epoch": 955} {"train_loss": -37.100425720214844, "global_step": 115657, "epoch": 955} {"train_loss": -38.01382064819336, "global_step": 115658, "epoch": 955} {"train_loss": -38.125240325927734, "global_step": 115659, "epoch": 955} {"train_loss": -38.324867248535156, "global_step": 115660, "epoch": 955} {"train_loss": -38.720516204833984, "global_step": 115661, "epoch": 955} {"train_loss": -37.76953125, "global_step": 115662, "epoch": 955} {"train_loss": -38.01604461669922, "global_step": 115663, "epoch": 955} {"train_loss": -39.10195541381836, "global_step": 115664, "epoch": 955} {"train_loss": -38.471492767333984, "global_step": 115665, "epoch": 955} {"train_loss": -38.42374801635742, "global_step": 115666, "epoch": 955} {"train_loss": -39.23529815673828, "global_step": 115667, "epoch": 955} {"train_loss": -38.43793869018555, "global_step": 115668, "epoch": 955} {"train_loss": -39.30836868286133, "global_step": 115669, "epoch": 955} {"train_loss": -38.47489547729492, "global_step": 115670, "epoch": 955} {"train_loss": -38.934513092041016, "global_step": 115671, "epoch": 955} {"train_loss": -38.85118865966797, "global_step": 115672, "epoch": 955} {"train_loss": -38.84174728393555, "global_step": 115673, "epoch": 955} {"train_loss": -38.86854553222656, "global_step": 115674, "epoch": 955} {"train_loss": -38.141435623168945, "global_step": 115675, "epoch": 955, "val_loss": 2607963.75} {"train_loss": -38.46963882446289, "global_step": 115676, "epoch": 956} {"train_loss": -39.58457565307617, "global_step": 115677, "epoch": 956} {"train_loss": -38.97766876220703, "global_step": 115678, "epoch": 956} {"train_loss": -39.15260696411133, "global_step": 115679, "epoch": 956} {"train_loss": -38.935115814208984, "global_step": 115680, "epoch": 956} {"train_loss": -39.35585403442383, "global_step": 115681, "epoch": 956} {"train_loss": -39.092140197753906, "global_step": 115682, "epoch": 956} {"train_loss": -39.425655364990234, "global_step": 115683, "epoch": 956} {"train_loss": -39.75365447998047, "global_step": 115684, "epoch": 956} {"train_loss": -38.924110412597656, "global_step": 115685, "epoch": 956} {"train_loss": -39.27760696411133, "global_step": 115686, "epoch": 956} {"train_loss": -38.494049072265625, "global_step": 115687, "epoch": 956} {"train_loss": -38.91008758544922, "global_step": 115688, "epoch": 956} {"train_loss": -39.3016242980957, "global_step": 115689, "epoch": 956} {"train_loss": -39.16184616088867, "global_step": 115690, "epoch": 956} {"train_loss": -38.58193588256836, "global_step": 115691, "epoch": 956} {"train_loss": -38.8316650390625, "global_step": 115692, "epoch": 956} {"train_loss": -39.75568771362305, "global_step": 115693, "epoch": 956} {"train_loss": -39.43099594116211, "global_step": 115694, "epoch": 956} {"train_loss": -38.552364349365234, "global_step": 115695, "epoch": 956} {"train_loss": -38.34048843383789, "global_step": 115696, "epoch": 956} {"train_loss": -39.24248123168945, "global_step": 115697, "epoch": 956} {"train_loss": -39.33037185668945, "global_step": 115698, "epoch": 956} {"train_loss": -38.21366500854492, "global_step": 115699, "epoch": 956} {"train_loss": -36.2764778137207, "global_step": 115700, "epoch": 956} {"train_loss": -37.71925735473633, "global_step": 115701, "epoch": 956} {"train_loss": -39.93274688720703, "global_step": 115702, "epoch": 956} {"train_loss": -38.39033126831055, "global_step": 115703, "epoch": 956} {"train_loss": -38.87851333618164, "global_step": 115704, "epoch": 956} {"train_loss": -39.33037185668945, "global_step": 115705, "epoch": 956} {"train_loss": -38.9754638671875, "global_step": 115706, "epoch": 956} {"train_loss": -38.246334075927734, "global_step": 115707, "epoch": 956} {"train_loss": -39.864013671875, "global_step": 115708, "epoch": 956} {"train_loss": -39.440887451171875, "global_step": 115709, "epoch": 956} {"train_loss": -39.60055160522461, "global_step": 115710, "epoch": 956} {"train_loss": -39.74034881591797, "global_step": 115711, "epoch": 956} {"train_loss": -40.034751892089844, "global_step": 115712, "epoch": 956} {"train_loss": -39.46132278442383, "global_step": 115713, "epoch": 956} {"train_loss": -39.68778610229492, "global_step": 115714, "epoch": 956} {"train_loss": -40.14247512817383, "global_step": 115715, "epoch": 956} {"train_loss": -39.478851318359375, "global_step": 115716, "epoch": 956} {"train_loss": -39.70827865600586, "global_step": 115717, "epoch": 956} {"train_loss": -40.18701171875, "global_step": 115718, "epoch": 956} {"train_loss": -39.899871826171875, "global_step": 115719, "epoch": 956} {"train_loss": -39.61698913574219, "global_step": 115720, "epoch": 956} {"train_loss": -40.00146484375, "global_step": 115721, "epoch": 956} {"train_loss": -39.66809844970703, "global_step": 115722, "epoch": 956} {"train_loss": -39.68292236328125, "global_step": 115723, "epoch": 956} {"train_loss": -39.964752197265625, "global_step": 115724, "epoch": 956} {"train_loss": -40.692543029785156, "global_step": 115725, "epoch": 956} {"train_loss": -39.86786651611328, "global_step": 115726, "epoch": 956} {"train_loss": -39.73336410522461, "global_step": 115727, "epoch": 956} {"train_loss": -39.65366744995117, "global_step": 115728, "epoch": 956} {"train_loss": -38.58085632324219, "global_step": 115729, "epoch": 956} {"train_loss": -37.53155517578125, "global_step": 115730, "epoch": 956} {"train_loss": -34.869842529296875, "global_step": 115731, "epoch": 956} {"train_loss": -39.45172119140625, "global_step": 115732, "epoch": 956} {"train_loss": -32.389381408691406, "global_step": 115733, "epoch": 956} {"train_loss": -38.70661544799805, "global_step": 115734, "epoch": 956} {"train_loss": -31.0451717376709, "global_step": 115735, "epoch": 956} {"train_loss": -30.669992446899414, "global_step": 115736, "epoch": 956} {"train_loss": -36.938053131103516, "global_step": 115737, "epoch": 956} {"train_loss": -31.72193717956543, "global_step": 115738, "epoch": 956} {"train_loss": -35.34428024291992, "global_step": 115739, "epoch": 956} {"train_loss": -35.12101364135742, "global_step": 115740, "epoch": 956} {"train_loss": -32.64519500732422, "global_step": 115741, "epoch": 956} {"train_loss": -37.611610412597656, "global_step": 115742, "epoch": 956} {"train_loss": -36.56454086303711, "global_step": 115743, "epoch": 956} {"train_loss": -36.34503173828125, "global_step": 115744, "epoch": 956} {"train_loss": -36.243194580078125, "global_step": 115745, "epoch": 956} {"train_loss": -37.45221710205078, "global_step": 115746, "epoch": 956} {"train_loss": -36.509132385253906, "global_step": 115747, "epoch": 956} {"train_loss": -35.92012023925781, "global_step": 115748, "epoch": 956} {"train_loss": -36.80957794189453, "global_step": 115749, "epoch": 956} {"train_loss": -38.0955810546875, "global_step": 115750, "epoch": 956} {"train_loss": -35.8813362121582, "global_step": 115751, "epoch": 956} {"train_loss": -37.99578857421875, "global_step": 115752, "epoch": 956} {"train_loss": -36.507564544677734, "global_step": 115753, "epoch": 956} {"train_loss": -38.299312591552734, "global_step": 115754, "epoch": 956} {"train_loss": -37.18274688720703, "global_step": 115755, "epoch": 956} {"train_loss": -37.40969467163086, "global_step": 115756, "epoch": 956} {"train_loss": -37.924808502197266, "global_step": 115757, "epoch": 956} {"train_loss": -38.32011032104492, "global_step": 115758, "epoch": 956} {"train_loss": -37.32179641723633, "global_step": 115759, "epoch": 956} {"train_loss": -37.46663284301758, "global_step": 115760, "epoch": 956} {"train_loss": -38.65393829345703, "global_step": 115761, "epoch": 956} {"train_loss": -38.40377426147461, "global_step": 115762, "epoch": 956} {"train_loss": -38.56930923461914, "global_step": 115763, "epoch": 956} {"train_loss": -37.84914779663086, "global_step": 115764, "epoch": 956} {"train_loss": -38.51432418823242, "global_step": 115765, "epoch": 956} {"train_loss": -38.42509078979492, "global_step": 115766, "epoch": 956} {"train_loss": -37.78364944458008, "global_step": 115767, "epoch": 956} {"train_loss": -37.53382110595703, "global_step": 115768, "epoch": 956} {"train_loss": -38.874359130859375, "global_step": 115769, "epoch": 956} {"train_loss": -38.00490951538086, "global_step": 115770, "epoch": 956} {"train_loss": -38.91593933105469, "global_step": 115771, "epoch": 956} {"train_loss": -38.751708984375, "global_step": 115772, "epoch": 956} {"train_loss": -38.67881393432617, "global_step": 115773, "epoch": 956} {"train_loss": -38.76892852783203, "global_step": 115774, "epoch": 956} {"train_loss": -39.247962951660156, "global_step": 115775, "epoch": 956} {"train_loss": -39.2309684753418, "global_step": 115776, "epoch": 956} {"train_loss": -39.00811004638672, "global_step": 115777, "epoch": 956} {"train_loss": -39.18227767944336, "global_step": 115778, "epoch": 956} {"train_loss": -39.32229232788086, "global_step": 115779, "epoch": 956} {"train_loss": -39.20737838745117, "global_step": 115780, "epoch": 956} {"train_loss": -39.216278076171875, "global_step": 115781, "epoch": 956} {"train_loss": -39.42708969116211, "global_step": 115782, "epoch": 956} {"train_loss": -39.2431640625, "global_step": 115783, "epoch": 956} {"train_loss": -39.94400405883789, "global_step": 115784, "epoch": 956} {"train_loss": -39.327327728271484, "global_step": 115785, "epoch": 956} {"train_loss": -39.22657775878906, "global_step": 115786, "epoch": 956} {"train_loss": -38.63943099975586, "global_step": 115787, "epoch": 956} {"train_loss": -39.59255599975586, "global_step": 115788, "epoch": 956} {"train_loss": -39.79182052612305, "global_step": 115789, "epoch": 956} {"train_loss": -39.48625946044922, "global_step": 115790, "epoch": 956} {"train_loss": -39.48740768432617, "global_step": 115791, "epoch": 956} {"train_loss": -39.69843292236328, "global_step": 115792, "epoch": 956} {"train_loss": -38.814491271972656, "global_step": 115793, "epoch": 956} {"train_loss": -39.781856536865234, "global_step": 115794, "epoch": 956} {"train_loss": -39.681854248046875, "global_step": 115795, "epoch": 956} {"train_loss": -38.393999194310716, "global_step": 115796, "epoch": 956, "val_loss": 2671904.75} {"train_loss": -39.531463623046875, "global_step": 115797, "epoch": 957} {"train_loss": -39.65208053588867, "global_step": 115798, "epoch": 957} {"train_loss": -39.80228805541992, "global_step": 115799, "epoch": 957} {"train_loss": -39.92734909057617, "global_step": 115800, "epoch": 957} {"train_loss": -39.46541976928711, "global_step": 115801, "epoch": 957} {"train_loss": -39.606910705566406, "global_step": 115802, "epoch": 957} {"train_loss": -40.1331901550293, "global_step": 115803, "epoch": 957} {"train_loss": -39.98861312866211, "global_step": 115804, "epoch": 957} {"train_loss": -39.195831298828125, "global_step": 115805, "epoch": 957} {"train_loss": -40.0953254699707, "global_step": 115806, "epoch": 957} {"train_loss": -40.16263961791992, "global_step": 115807, "epoch": 957} {"train_loss": -39.94523620605469, "global_step": 115808, "epoch": 957} {"train_loss": -39.97513198852539, "global_step": 115809, "epoch": 957} {"train_loss": -40.316192626953125, "global_step": 115810, "epoch": 957} {"train_loss": -39.638458251953125, "global_step": 115811, "epoch": 957} {"train_loss": -39.61745071411133, "global_step": 115812, "epoch": 957} {"train_loss": -39.804931640625, "global_step": 115813, "epoch": 957} {"train_loss": -39.278472900390625, "global_step": 115814, "epoch": 957} {"train_loss": -39.01816177368164, "global_step": 115815, "epoch": 957} {"train_loss": -39.29976272583008, "global_step": 115816, "epoch": 957} {"train_loss": -39.686092376708984, "global_step": 115817, "epoch": 957} {"train_loss": -37.15054702758789, "global_step": 115818, "epoch": 957} {"train_loss": -36.41948318481445, "global_step": 115819, "epoch": 957} {"train_loss": -38.48686981201172, "global_step": 115820, "epoch": 957} {"train_loss": -39.63788986206055, "global_step": 115821, "epoch": 957} {"train_loss": -38.00600814819336, "global_step": 115822, "epoch": 957} {"train_loss": -35.31689453125, "global_step": 115823, "epoch": 957} {"train_loss": -34.19961166381836, "global_step": 115824, "epoch": 957} {"train_loss": -33.612548828125, "global_step": 115825, "epoch": 957} {"train_loss": -35.319000244140625, "global_step": 115826, "epoch": 957} {"train_loss": -36.2271842956543, "global_step": 115827, "epoch": 957} {"train_loss": -36.01914596557617, "global_step": 115828, "epoch": 957} {"train_loss": -36.22721481323242, "global_step": 115829, "epoch": 957} {"train_loss": -38.02090835571289, "global_step": 115830, "epoch": 957} {"train_loss": -38.338130950927734, "global_step": 115831, "epoch": 957} {"train_loss": -37.65584945678711, "global_step": 115832, "epoch": 957} {"train_loss": -37.855384826660156, "global_step": 115833, "epoch": 957} {"train_loss": -39.02220153808594, "global_step": 115834, "epoch": 957} {"train_loss": -38.996543884277344, "global_step": 115835, "epoch": 957} {"train_loss": -38.843597412109375, "global_step": 115836, "epoch": 957} {"train_loss": -38.545806884765625, "global_step": 115837, "epoch": 957} {"train_loss": -39.31595993041992, "global_step": 115838, "epoch": 957} {"train_loss": -38.55074691772461, "global_step": 115839, "epoch": 957} {"train_loss": -38.67919158935547, "global_step": 115840, "epoch": 957} {"train_loss": -39.191524505615234, "global_step": 115841, "epoch": 957} {"train_loss": -39.44526290893555, "global_step": 115842, "epoch": 957} {"train_loss": -39.089229583740234, "global_step": 115843, "epoch": 957} {"train_loss": -39.62208557128906, "global_step": 115844, "epoch": 957} {"train_loss": -39.284297943115234, "global_step": 115845, "epoch": 957} {"train_loss": -39.2066535949707, "global_step": 115846, "epoch": 957} {"train_loss": -39.75962448120117, "global_step": 115847, "epoch": 957} {"train_loss": -38.972984313964844, "global_step": 115848, "epoch": 957} {"train_loss": -39.9123649597168, "global_step": 115849, "epoch": 957} {"train_loss": -39.67040252685547, "global_step": 115850, "epoch": 957} {"train_loss": -39.01511764526367, "global_step": 115851, "epoch": 957} {"train_loss": -39.77729415893555, "global_step": 115852, "epoch": 957} {"train_loss": -39.350135803222656, "global_step": 115853, "epoch": 957} {"train_loss": -40.00017166137695, "global_step": 115854, "epoch": 957} {"train_loss": -38.73151779174805, "global_step": 115855, "epoch": 957} {"train_loss": -38.689369201660156, "global_step": 115856, "epoch": 957} {"train_loss": -39.24030685424805, "global_step": 115857, "epoch": 957} {"train_loss": -39.1716423034668, "global_step": 115858, "epoch": 957} {"train_loss": -39.673274993896484, "global_step": 115859, "epoch": 957} {"train_loss": -39.107276916503906, "global_step": 115860, "epoch": 957} {"train_loss": -40.1220817565918, "global_step": 115861, "epoch": 957} {"train_loss": -38.96577072143555, "global_step": 115862, "epoch": 957} {"train_loss": -39.97380065917969, "global_step": 115863, "epoch": 957} {"train_loss": -39.265113830566406, "global_step": 115864, "epoch": 957} {"train_loss": -38.8117561340332, "global_step": 115865, "epoch": 957} {"train_loss": -39.398902893066406, "global_step": 115866, "epoch": 957} {"train_loss": -39.814571380615234, "global_step": 115867, "epoch": 957} {"train_loss": -38.803627014160156, "global_step": 115868, "epoch": 957} {"train_loss": -39.40872573852539, "global_step": 115869, "epoch": 957} {"train_loss": -39.06074523925781, "global_step": 115870, "epoch": 957} {"train_loss": -39.03721237182617, "global_step": 115871, "epoch": 957} {"train_loss": -39.2024040222168, "global_step": 115872, "epoch": 957} {"train_loss": -39.476585388183594, "global_step": 115873, "epoch": 957} {"train_loss": -39.477745056152344, "global_step": 115874, "epoch": 957} {"train_loss": -40.085723876953125, "global_step": 115875, "epoch": 957} {"train_loss": -40.01538848876953, "global_step": 115876, "epoch": 957} {"train_loss": -39.66340637207031, "global_step": 115877, "epoch": 957} {"train_loss": -39.6542854309082, "global_step": 115878, "epoch": 957} {"train_loss": -39.71037673950195, "global_step": 115879, "epoch": 957} {"train_loss": -39.58951950073242, "global_step": 115880, "epoch": 957} {"train_loss": -38.75503158569336, "global_step": 115881, "epoch": 957} {"train_loss": -39.48268127441406, "global_step": 115882, "epoch": 957} {"train_loss": -39.396453857421875, "global_step": 115883, "epoch": 957} {"train_loss": -39.17695236206055, "global_step": 115884, "epoch": 957} {"train_loss": -39.17950439453125, "global_step": 115885, "epoch": 957} {"train_loss": -39.19291305541992, "global_step": 115886, "epoch": 957} {"train_loss": -40.56013870239258, "global_step": 115887, "epoch": 957} {"train_loss": -39.065704345703125, "global_step": 115888, "epoch": 957} {"train_loss": -39.08755874633789, "global_step": 115889, "epoch": 957} {"train_loss": -40.11814880371094, "global_step": 115890, "epoch": 957} {"train_loss": -37.17033004760742, "global_step": 115891, "epoch": 957} {"train_loss": -40.0390625, "global_step": 115892, "epoch": 957} {"train_loss": -40.14088821411133, "global_step": 115893, "epoch": 957} {"train_loss": -39.55305099487305, "global_step": 115894, "epoch": 957} {"train_loss": -39.053924560546875, "global_step": 115895, "epoch": 957} {"train_loss": -39.831398010253906, "global_step": 115896, "epoch": 957} {"train_loss": -39.72332000732422, "global_step": 115897, "epoch": 957} {"train_loss": -38.69470977783203, "global_step": 115898, "epoch": 957} {"train_loss": -38.936885833740234, "global_step": 115899, "epoch": 957} {"train_loss": -36.853153228759766, "global_step": 115900, "epoch": 957} {"train_loss": -38.38161849975586, "global_step": 115901, "epoch": 957} {"train_loss": -38.87702941894531, "global_step": 115902, "epoch": 957} {"train_loss": -38.790042877197266, "global_step": 115903, "epoch": 957} {"train_loss": -37.96697998046875, "global_step": 115904, "epoch": 957} {"train_loss": -38.72210693359375, "global_step": 115905, "epoch": 957} {"train_loss": -39.36005783081055, "global_step": 115906, "epoch": 957} {"train_loss": -37.828765869140625, "global_step": 115907, "epoch": 957} {"train_loss": -38.82466506958008, "global_step": 115908, "epoch": 957} {"train_loss": -39.059730529785156, "global_step": 115909, "epoch": 957} {"train_loss": -39.60470199584961, "global_step": 115910, "epoch": 957} {"train_loss": -38.53217697143555, "global_step": 115911, "epoch": 957} {"train_loss": -39.07302474975586, "global_step": 115912, "epoch": 957} {"train_loss": -39.23639678955078, "global_step": 115913, "epoch": 957} {"train_loss": -38.59725570678711, "global_step": 115914, "epoch": 957} {"train_loss": -39.05299377441406, "global_step": 115915, "epoch": 957} {"train_loss": -39.59548568725586, "global_step": 115916, "epoch": 957} {"train_loss": -38.96065347844904, "global_step": 115917, "epoch": 957, "val_loss": 2692780.75} {"train_loss": -37.99971008300781, "global_step": 115918, "epoch": 958} {"train_loss": -39.70289611816406, "global_step": 115919, "epoch": 958} {"train_loss": -37.07768630981445, "global_step": 115920, "epoch": 958} {"train_loss": -38.75259017944336, "global_step": 115921, "epoch": 958} {"train_loss": -38.40855026245117, "global_step": 115922, "epoch": 958} {"train_loss": -37.91774368286133, "global_step": 115923, "epoch": 958} {"train_loss": -39.27170944213867, "global_step": 115924, "epoch": 958} {"train_loss": -37.37449645996094, "global_step": 115925, "epoch": 958} {"train_loss": -38.6981086730957, "global_step": 115926, "epoch": 958} {"train_loss": -37.81867599487305, "global_step": 115927, "epoch": 958} {"train_loss": -39.231285095214844, "global_step": 115928, "epoch": 958} {"train_loss": -37.77363204956055, "global_step": 115929, "epoch": 958} {"train_loss": -39.23936080932617, "global_step": 115930, "epoch": 958} {"train_loss": -39.38593673706055, "global_step": 115931, "epoch": 958} {"train_loss": -38.23405075073242, "global_step": 115932, "epoch": 958} {"train_loss": -39.0152702331543, "global_step": 115933, "epoch": 958} {"train_loss": -39.558570861816406, "global_step": 115934, "epoch": 958} {"train_loss": -38.684532165527344, "global_step": 115935, "epoch": 958} {"train_loss": -39.03278350830078, "global_step": 115936, "epoch": 958} {"train_loss": -39.146663665771484, "global_step": 115937, "epoch": 958} {"train_loss": -39.56761169433594, "global_step": 115938, "epoch": 958} {"train_loss": -39.449432373046875, "global_step": 115939, "epoch": 958} {"train_loss": -39.056427001953125, "global_step": 115940, "epoch": 958} {"train_loss": -39.82223129272461, "global_step": 115941, "epoch": 958} {"train_loss": -38.5765495300293, "global_step": 115942, "epoch": 958} {"train_loss": -39.335304260253906, "global_step": 115943, "epoch": 958} {"train_loss": -39.01090621948242, "global_step": 115944, "epoch": 958} {"train_loss": -38.96114730834961, "global_step": 115945, "epoch": 958} {"train_loss": -39.88639450073242, "global_step": 115946, "epoch": 958} {"train_loss": -39.23455047607422, "global_step": 115947, "epoch": 958} {"train_loss": -39.456451416015625, "global_step": 115948, "epoch": 958} {"train_loss": -39.762413024902344, "global_step": 115949, "epoch": 958} {"train_loss": -39.288204193115234, "global_step": 115950, "epoch": 958} {"train_loss": -39.27544021606445, "global_step": 115951, "epoch": 958} {"train_loss": -39.69553756713867, "global_step": 115952, "epoch": 958} {"train_loss": -39.27067947387695, "global_step": 115953, "epoch": 958} {"train_loss": -39.21809768676758, "global_step": 115954, "epoch": 958} {"train_loss": -39.60136032104492, "global_step": 115955, "epoch": 958} {"train_loss": -39.083309173583984, "global_step": 115956, "epoch": 958} {"train_loss": -39.86589431762695, "global_step": 115957, "epoch": 958} {"train_loss": -40.03376007080078, "global_step": 115958, "epoch": 958} {"train_loss": -39.47249221801758, "global_step": 115959, "epoch": 958} {"train_loss": -39.839481353759766, "global_step": 115960, "epoch": 958} {"train_loss": -40.24306106567383, "global_step": 115961, "epoch": 958} {"train_loss": -38.72174072265625, "global_step": 115962, "epoch": 958} {"train_loss": -39.51746368408203, "global_step": 115963, "epoch": 958} {"train_loss": -39.972965240478516, "global_step": 115964, "epoch": 958} {"train_loss": -40.425453186035156, "global_step": 115965, "epoch": 958} {"train_loss": -39.369441986083984, "global_step": 115966, "epoch": 958} {"train_loss": -39.175682067871094, "global_step": 115967, "epoch": 958} {"train_loss": -39.294952392578125, "global_step": 115968, "epoch": 958} {"train_loss": -38.83571243286133, "global_step": 115969, "epoch": 958} {"train_loss": -39.65780258178711, "global_step": 115970, "epoch": 958} {"train_loss": -39.79615020751953, "global_step": 115971, "epoch": 958} {"train_loss": -39.89382553100586, "global_step": 115972, "epoch": 958} {"train_loss": -39.16368103027344, "global_step": 115973, "epoch": 958} {"train_loss": -39.00773620605469, "global_step": 115974, "epoch": 958} {"train_loss": -39.127132415771484, "global_step": 115975, "epoch": 958} {"train_loss": -37.03188705444336, "global_step": 115976, "epoch": 958} {"train_loss": -34.16249465942383, "global_step": 115977, "epoch": 958} {"train_loss": -29.34661293029785, "global_step": 115978, "epoch": 958} {"train_loss": -27.451589584350586, "global_step": 115979, "epoch": 958} {"train_loss": -30.736886978149414, "global_step": 115980, "epoch": 958} {"train_loss": -38.528411865234375, "global_step": 115981, "epoch": 958} {"train_loss": -37.87318801879883, "global_step": 115982, "epoch": 958} {"train_loss": -35.78158187866211, "global_step": 115983, "epoch": 958} {"train_loss": -38.99306869506836, "global_step": 115984, "epoch": 958} {"train_loss": -37.2928581237793, "global_step": 115985, "epoch": 958} {"train_loss": -38.922279357910156, "global_step": 115986, "epoch": 958} {"train_loss": -37.97617721557617, "global_step": 115987, "epoch": 958} {"train_loss": -36.62360763549805, "global_step": 115988, "epoch": 958} {"train_loss": -37.99312973022461, "global_step": 115989, "epoch": 958} {"train_loss": -38.52230453491211, "global_step": 115990, "epoch": 958} {"train_loss": -38.32490921020508, "global_step": 115991, "epoch": 958} {"train_loss": -39.39213562011719, "global_step": 115992, "epoch": 958} {"train_loss": -38.58946228027344, "global_step": 115993, "epoch": 958} {"train_loss": -39.32582092285156, "global_step": 115994, "epoch": 958} {"train_loss": -38.6148681640625, "global_step": 115995, "epoch": 958} {"train_loss": -39.43524169921875, "global_step": 115996, "epoch": 958} {"train_loss": -38.4208869934082, "global_step": 115997, "epoch": 958} {"train_loss": -39.6315803527832, "global_step": 115998, "epoch": 958} {"train_loss": -39.02747344970703, "global_step": 115999, "epoch": 958} {"train_loss": -39.235694885253906, "global_step": 116000, "epoch": 958} {"train_loss": -39.06795883178711, "global_step": 116001, "epoch": 958} {"train_loss": -39.43520736694336, "global_step": 116002, "epoch": 958} {"train_loss": -39.097007751464844, "global_step": 116003, "epoch": 958} {"train_loss": -39.24833679199219, "global_step": 116004, "epoch": 958} {"train_loss": -39.855594635009766, "global_step": 116005, "epoch": 958} {"train_loss": -39.292415618896484, "global_step": 116006, "epoch": 958} {"train_loss": -39.33586502075195, "global_step": 116007, "epoch": 958} {"train_loss": -39.582969665527344, "global_step": 116008, "epoch": 958} {"train_loss": -38.93819046020508, "global_step": 116009, "epoch": 958} {"train_loss": -39.786163330078125, "global_step": 116010, "epoch": 958} {"train_loss": -38.94935989379883, "global_step": 116011, "epoch": 958} {"train_loss": -39.45072937011719, "global_step": 116012, "epoch": 958} {"train_loss": -39.303401947021484, "global_step": 116013, "epoch": 958} {"train_loss": -39.37357711791992, "global_step": 116014, "epoch": 958} {"train_loss": -39.160804748535156, "global_step": 116015, "epoch": 958} {"train_loss": -38.699981689453125, "global_step": 116016, "epoch": 958} {"train_loss": -39.08868408203125, "global_step": 116017, "epoch": 958} {"train_loss": -39.61619186401367, "global_step": 116018, "epoch": 958} {"train_loss": -38.96015930175781, "global_step": 116019, "epoch": 958} {"train_loss": -37.62285232543945, "global_step": 116020, "epoch": 958} {"train_loss": -38.95149612426758, "global_step": 116021, "epoch": 958} {"train_loss": -39.697017669677734, "global_step": 116022, "epoch": 958} {"train_loss": -38.23490905761719, "global_step": 116023, "epoch": 958} {"train_loss": -38.52429962158203, "global_step": 116024, "epoch": 958} {"train_loss": -38.787147521972656, "global_step": 116025, "epoch": 958} {"train_loss": -39.20746612548828, "global_step": 116026, "epoch": 958} {"train_loss": -39.657344818115234, "global_step": 116027, "epoch": 958} {"train_loss": -39.602046966552734, "global_step": 116028, "epoch": 958} {"train_loss": -39.54664993286133, "global_step": 116029, "epoch": 958} {"train_loss": -39.46818923950195, "global_step": 116030, "epoch": 958} {"train_loss": -40.22965621948242, "global_step": 116031, "epoch": 958} {"train_loss": -39.22773361206055, "global_step": 116032, "epoch": 958} {"train_loss": -38.72941207885742, "global_step": 116033, "epoch": 958} {"train_loss": -40.50196075439453, "global_step": 116034, "epoch": 958} {"train_loss": -39.29548645019531, "global_step": 116035, "epoch": 958} {"train_loss": -38.58355712890625, "global_step": 116036, "epoch": 958} {"train_loss": -38.354164123535156, "global_step": 116037, "epoch": 958} {"train_loss": -38.74480906399813, "global_step": 116038, "epoch": 958, "val_loss": 2686808.25} {"train_loss": -40.17623519897461, "global_step": 116039, "epoch": 959} {"train_loss": -39.90403366088867, "global_step": 116040, "epoch": 959} {"train_loss": -39.680667877197266, "global_step": 116041, "epoch": 959} {"train_loss": -39.99815368652344, "global_step": 116042, "epoch": 959} {"train_loss": -39.904396057128906, "global_step": 116043, "epoch": 959} {"train_loss": -39.934654235839844, "global_step": 116044, "epoch": 959} {"train_loss": -39.96035385131836, "global_step": 116045, "epoch": 959} {"train_loss": -38.56222152709961, "global_step": 116046, "epoch": 959} {"train_loss": -38.643798828125, "global_step": 116047, "epoch": 959} {"train_loss": -39.69124984741211, "global_step": 116048, "epoch": 959} {"train_loss": -39.80727767944336, "global_step": 116049, "epoch": 959} {"train_loss": -39.150142669677734, "global_step": 116050, "epoch": 959} {"train_loss": -39.39358901977539, "global_step": 116051, "epoch": 959} {"train_loss": -39.85775375366211, "global_step": 116052, "epoch": 959} {"train_loss": -39.61682891845703, "global_step": 116053, "epoch": 959} {"train_loss": -33.52483367919922, "global_step": 116054, "epoch": 959} {"train_loss": -39.11787033081055, "global_step": 116055, "epoch": 959} {"train_loss": -38.141021728515625, "global_step": 116056, "epoch": 959} {"train_loss": -38.64508056640625, "global_step": 116057, "epoch": 959} {"train_loss": -36.58903884887695, "global_step": 116058, "epoch": 959} {"train_loss": -35.651466369628906, "global_step": 116059, "epoch": 959} {"train_loss": -32.7799186706543, "global_step": 116060, "epoch": 959} {"train_loss": -38.14516830444336, "global_step": 116061, "epoch": 959} {"train_loss": -36.8580207824707, "global_step": 116062, "epoch": 959} {"train_loss": -38.542293548583984, "global_step": 116063, "epoch": 959} {"train_loss": -33.01802062988281, "global_step": 116064, "epoch": 959} {"train_loss": -33.45489501953125, "global_step": 116065, "epoch": 959} {"train_loss": -35.01229476928711, "global_step": 116066, "epoch": 959} {"train_loss": -32.802974700927734, "global_step": 116067, "epoch": 959} {"train_loss": -36.98558044433594, "global_step": 116068, "epoch": 959} {"train_loss": -35.79924392700195, "global_step": 116069, "epoch": 959} {"train_loss": -37.45850372314453, "global_step": 116070, "epoch": 959} {"train_loss": -36.83604049682617, "global_step": 116071, "epoch": 959} {"train_loss": -36.90481948852539, "global_step": 116072, "epoch": 959} {"train_loss": -34.612220764160156, "global_step": 116073, "epoch": 959} {"train_loss": -35.134315490722656, "global_step": 116074, "epoch": 959} {"train_loss": -30.15818214416504, "global_step": 116075, "epoch": 959} {"train_loss": -35.04389572143555, "global_step": 116076, "epoch": 959} {"train_loss": -36.211490631103516, "global_step": 116077, "epoch": 959} {"train_loss": -37.9238166809082, "global_step": 116078, "epoch": 959} {"train_loss": -35.70074462890625, "global_step": 116079, "epoch": 959} {"train_loss": -33.984127044677734, "global_step": 116080, "epoch": 959} {"train_loss": -35.63356018066406, "global_step": 116081, "epoch": 959} {"train_loss": -36.8892822265625, "global_step": 116082, "epoch": 959} {"train_loss": -36.87740707397461, "global_step": 116083, "epoch": 959} {"train_loss": -36.78068923950195, "global_step": 116084, "epoch": 959} {"train_loss": -35.99800491333008, "global_step": 116085, "epoch": 959} {"train_loss": -36.26131820678711, "global_step": 116086, "epoch": 959} {"train_loss": -36.035003662109375, "global_step": 116087, "epoch": 959} {"train_loss": -37.17432403564453, "global_step": 116088, "epoch": 959} {"train_loss": -36.34381103515625, "global_step": 116089, "epoch": 959} {"train_loss": -37.1590461730957, "global_step": 116090, "epoch": 959} {"train_loss": -37.37025451660156, "global_step": 116091, "epoch": 959} {"train_loss": -37.46746826171875, "global_step": 116092, "epoch": 959} {"train_loss": -37.2228889465332, "global_step": 116093, "epoch": 959} {"train_loss": -36.36787033081055, "global_step": 116094, "epoch": 959} {"train_loss": -37.2712287902832, "global_step": 116095, "epoch": 959} {"train_loss": -38.64710235595703, "global_step": 116096, "epoch": 959} {"train_loss": -36.908660888671875, "global_step": 116097, "epoch": 959} {"train_loss": -37.72373580932617, "global_step": 116098, "epoch": 959} {"train_loss": -37.00840377807617, "global_step": 116099, "epoch": 959} {"train_loss": -38.42878341674805, "global_step": 116100, "epoch": 959} {"train_loss": -38.4715690612793, "global_step": 116101, "epoch": 959} {"train_loss": -38.540443420410156, "global_step": 116102, "epoch": 959} {"train_loss": -38.12499237060547, "global_step": 116103, "epoch": 959} {"train_loss": -37.80036163330078, "global_step": 116104, "epoch": 959} {"train_loss": -37.840450286865234, "global_step": 116105, "epoch": 959} {"train_loss": -37.917320251464844, "global_step": 116106, "epoch": 959} {"train_loss": -38.09139633178711, "global_step": 116107, "epoch": 959} {"train_loss": -37.33797073364258, "global_step": 116108, "epoch": 959} {"train_loss": -37.6972541809082, "global_step": 116109, "epoch": 959} {"train_loss": -38.321353912353516, "global_step": 116110, "epoch": 959} {"train_loss": -39.024932861328125, "global_step": 116111, "epoch": 959} {"train_loss": -38.77472686767578, "global_step": 116112, "epoch": 959} {"train_loss": -38.44669723510742, "global_step": 116113, "epoch": 959} {"train_loss": -39.19877624511719, "global_step": 116114, "epoch": 959} {"train_loss": -38.704524993896484, "global_step": 116115, "epoch": 959} {"train_loss": -39.20857620239258, "global_step": 116116, "epoch": 959} {"train_loss": -39.18882369995117, "global_step": 116117, "epoch": 959} {"train_loss": -38.61709976196289, "global_step": 116118, "epoch": 959} {"train_loss": -39.73763656616211, "global_step": 116119, "epoch": 959} {"train_loss": -39.65456008911133, "global_step": 116120, "epoch": 959} {"train_loss": -38.83112335205078, "global_step": 116121, "epoch": 959} {"train_loss": -38.88328170776367, "global_step": 116122, "epoch": 959} {"train_loss": -39.133460998535156, "global_step": 116123, "epoch": 959} {"train_loss": -38.99498748779297, "global_step": 116124, "epoch": 959} {"train_loss": -39.277442932128906, "global_step": 116125, "epoch": 959} {"train_loss": -39.47874069213867, "global_step": 116126, "epoch": 959} {"train_loss": -39.36684799194336, "global_step": 116127, "epoch": 959} {"train_loss": -38.912349700927734, "global_step": 116128, "epoch": 959} {"train_loss": -39.525508880615234, "global_step": 116129, "epoch": 959} {"train_loss": -39.31671142578125, "global_step": 116130, "epoch": 959} {"train_loss": -39.45854568481445, "global_step": 116131, "epoch": 959} {"train_loss": -39.95271682739258, "global_step": 116132, "epoch": 959} {"train_loss": -39.7580680847168, "global_step": 116133, "epoch": 959} {"train_loss": -40.044891357421875, "global_step": 116134, "epoch": 959} {"train_loss": -39.305355072021484, "global_step": 116135, "epoch": 959} {"train_loss": -39.64973068237305, "global_step": 116136, "epoch": 959} {"train_loss": -39.129417419433594, "global_step": 116137, "epoch": 959} {"train_loss": -40.23488998413086, "global_step": 116138, "epoch": 959} {"train_loss": -39.09882736206055, "global_step": 116139, "epoch": 959} {"train_loss": -39.3765869140625, "global_step": 116140, "epoch": 959} {"train_loss": -39.840248107910156, "global_step": 116141, "epoch": 959} {"train_loss": -39.97841262817383, "global_step": 116142, "epoch": 959} {"train_loss": -40.16413879394531, "global_step": 116143, "epoch": 959} {"train_loss": -40.315589904785156, "global_step": 116144, "epoch": 959} {"train_loss": -40.014251708984375, "global_step": 116145, "epoch": 959} {"train_loss": -40.04214096069336, "global_step": 116146, "epoch": 959} {"train_loss": -39.62363815307617, "global_step": 116147, "epoch": 959} {"train_loss": -39.776611328125, "global_step": 116148, "epoch": 959} {"train_loss": -39.87718200683594, "global_step": 116149, "epoch": 959} {"train_loss": -39.61457824707031, "global_step": 116150, "epoch": 959} {"train_loss": -40.3304557800293, "global_step": 116151, "epoch": 959} {"train_loss": -38.83099365234375, "global_step": 116152, "epoch": 959} {"train_loss": -37.35127258300781, "global_step": 116153, "epoch": 959} {"train_loss": -35.92216873168945, "global_step": 116154, "epoch": 959} {"train_loss": -37.87179946899414, "global_step": 116155, "epoch": 959} {"train_loss": -38.68207931518555, "global_step": 116156, "epoch": 959} {"train_loss": -39.86122512817383, "global_step": 116157, "epoch": 959} {"train_loss": -38.63053894042969, "global_step": 116158, "epoch": 959} {"train_loss": -38.041206281047224, "global_step": 116159, "epoch": 959, "val_loss": 2637747.0} {"train_loss": -39.85654830932617, "global_step": 116160, "epoch": 960} {"train_loss": -39.65286636352539, "global_step": 116161, "epoch": 960} {"train_loss": -39.25849914550781, "global_step": 116162, "epoch": 960} {"train_loss": -38.430389404296875, "global_step": 116163, "epoch": 960} {"train_loss": -37.71398162841797, "global_step": 116164, "epoch": 960} {"train_loss": -39.03791427612305, "global_step": 116165, "epoch": 960} {"train_loss": -39.31977462768555, "global_step": 116166, "epoch": 960} {"train_loss": -39.14337921142578, "global_step": 116167, "epoch": 960} {"train_loss": -38.2315673828125, "global_step": 116168, "epoch": 960} {"train_loss": -37.996089935302734, "global_step": 116169, "epoch": 960} {"train_loss": -38.36748123168945, "global_step": 116170, "epoch": 960} {"train_loss": -39.65241241455078, "global_step": 116171, "epoch": 960} {"train_loss": -39.61973190307617, "global_step": 116172, "epoch": 960} {"train_loss": -38.37114334106445, "global_step": 116173, "epoch": 960} {"train_loss": -38.846710205078125, "global_step": 116174, "epoch": 960} {"train_loss": -40.02737045288086, "global_step": 116175, "epoch": 960} {"train_loss": -39.64677047729492, "global_step": 116176, "epoch": 960} {"train_loss": -39.5704460144043, "global_step": 116177, "epoch": 960} {"train_loss": -39.701271057128906, "global_step": 116178, "epoch": 960} {"train_loss": -40.069644927978516, "global_step": 116179, "epoch": 960} {"train_loss": -39.394996643066406, "global_step": 116180, "epoch": 960} {"train_loss": -40.23453903198242, "global_step": 116181, "epoch": 960} {"train_loss": -40.18349075317383, "global_step": 116182, "epoch": 960} {"train_loss": -38.35978698730469, "global_step": 116183, "epoch": 960} {"train_loss": -39.85443115234375, "global_step": 116184, "epoch": 960} {"train_loss": -39.904048919677734, "global_step": 116185, "epoch": 960} {"train_loss": -39.79738998413086, "global_step": 116186, "epoch": 960} {"train_loss": -39.88819122314453, "global_step": 116187, "epoch": 960} {"train_loss": -40.59369659423828, "global_step": 116188, "epoch": 960} {"train_loss": -39.3025016784668, "global_step": 116189, "epoch": 960} {"train_loss": -39.7264404296875, "global_step": 116190, "epoch": 960} {"train_loss": -38.975852966308594, "global_step": 116191, "epoch": 960} {"train_loss": -39.72815704345703, "global_step": 116192, "epoch": 960} {"train_loss": -39.3488655090332, "global_step": 116193, "epoch": 960} {"train_loss": -39.24351119995117, "global_step": 116194, "epoch": 960} {"train_loss": -39.58549118041992, "global_step": 116195, "epoch": 960} {"train_loss": -39.98153305053711, "global_step": 116196, "epoch": 960} {"train_loss": -39.20842361450195, "global_step": 116197, "epoch": 960} {"train_loss": -40.056976318359375, "global_step": 116198, "epoch": 960} {"train_loss": -39.765167236328125, "global_step": 116199, "epoch": 960} {"train_loss": -39.92971420288086, "global_step": 116200, "epoch": 960} {"train_loss": -39.91304397583008, "global_step": 116201, "epoch": 960} {"train_loss": -39.40234375, "global_step": 116202, "epoch": 960} {"train_loss": -39.8173942565918, "global_step": 116203, "epoch": 960} {"train_loss": -38.68571090698242, "global_step": 116204, "epoch": 960} {"train_loss": -39.113887786865234, "global_step": 116205, "epoch": 960} {"train_loss": -40.047115325927734, "global_step": 116206, "epoch": 960} {"train_loss": -38.8760986328125, "global_step": 116207, "epoch": 960} {"train_loss": -39.5086555480957, "global_step": 116208, "epoch": 960} {"train_loss": -39.405311584472656, "global_step": 116209, "epoch": 960} {"train_loss": -38.14071273803711, "global_step": 116210, "epoch": 960} {"train_loss": -38.27069091796875, "global_step": 116211, "epoch": 960} {"train_loss": -35.785606384277344, "global_step": 116212, "epoch": 960} {"train_loss": -34.40565490722656, "global_step": 116213, "epoch": 960} {"train_loss": -39.01682662963867, "global_step": 116214, "epoch": 960} {"train_loss": -37.81806182861328, "global_step": 116215, "epoch": 960} {"train_loss": -35.93752670288086, "global_step": 116216, "epoch": 960} {"train_loss": -32.86232376098633, "global_step": 116217, "epoch": 960} {"train_loss": -33.0930290222168, "global_step": 116218, "epoch": 960} {"train_loss": -34.08820724487305, "global_step": 116219, "epoch": 960} {"train_loss": -34.78010177612305, "global_step": 116220, "epoch": 960} {"train_loss": -34.46442794799805, "global_step": 116221, "epoch": 960} {"train_loss": -34.215423583984375, "global_step": 116222, "epoch": 960} {"train_loss": -37.08750534057617, "global_step": 116223, "epoch": 960} {"train_loss": -36.144962310791016, "global_step": 116224, "epoch": 960} {"train_loss": -35.24979019165039, "global_step": 116225, "epoch": 960} {"train_loss": -38.28076934814453, "global_step": 116226, "epoch": 960} {"train_loss": -36.93696975708008, "global_step": 116227, "epoch": 960} {"train_loss": -34.62887191772461, "global_step": 116228, "epoch": 960} {"train_loss": -36.917572021484375, "global_step": 116229, "epoch": 960} {"train_loss": -38.17735290527344, "global_step": 116230, "epoch": 960} {"train_loss": -33.7285270690918, "global_step": 116231, "epoch": 960} {"train_loss": -37.75777816772461, "global_step": 116232, "epoch": 960} {"train_loss": -36.660797119140625, "global_step": 116233, "epoch": 960} {"train_loss": -37.46891403198242, "global_step": 116234, "epoch": 960} {"train_loss": -36.95673370361328, "global_step": 116235, "epoch": 960} {"train_loss": -37.34233474731445, "global_step": 116236, "epoch": 960} {"train_loss": -38.04310989379883, "global_step": 116237, "epoch": 960} {"train_loss": -37.49227523803711, "global_step": 116238, "epoch": 960} {"train_loss": -37.51472091674805, "global_step": 116239, "epoch": 960} {"train_loss": -38.64308547973633, "global_step": 116240, "epoch": 960} {"train_loss": -37.31081771850586, "global_step": 116241, "epoch": 960} {"train_loss": -39.211456298828125, "global_step": 116242, "epoch": 960} {"train_loss": -37.69539260864258, "global_step": 116243, "epoch": 960} {"train_loss": -38.76969528198242, "global_step": 116244, "epoch": 960} {"train_loss": -38.452247619628906, "global_step": 116245, "epoch": 960} {"train_loss": -38.87488555908203, "global_step": 116246, "epoch": 960} {"train_loss": -38.78572463989258, "global_step": 116247, "epoch": 960} {"train_loss": -38.92545700073242, "global_step": 116248, "epoch": 960} {"train_loss": -38.83851623535156, "global_step": 116249, "epoch": 960} {"train_loss": -38.701961517333984, "global_step": 116250, "epoch": 960} {"train_loss": -38.72173309326172, "global_step": 116251, "epoch": 960} {"train_loss": -38.802188873291016, "global_step": 116252, "epoch": 960} {"train_loss": -39.38877487182617, "global_step": 116253, "epoch": 960} {"train_loss": -38.99030303955078, "global_step": 116254, "epoch": 960} {"train_loss": -39.5872917175293, "global_step": 116255, "epoch": 960} {"train_loss": -39.14655303955078, "global_step": 116256, "epoch": 960} {"train_loss": -39.46934127807617, "global_step": 116257, "epoch": 960} {"train_loss": -39.5059928894043, "global_step": 116258, "epoch": 960} {"train_loss": -39.800045013427734, "global_step": 116259, "epoch": 960} {"train_loss": -39.926109313964844, "global_step": 116260, "epoch": 960} {"train_loss": -39.618011474609375, "global_step": 116261, "epoch": 960} {"train_loss": -39.866546630859375, "global_step": 116262, "epoch": 960} {"train_loss": -39.75239181518555, "global_step": 116263, "epoch": 960} {"train_loss": -39.20718002319336, "global_step": 116264, "epoch": 960} {"train_loss": -40.185543060302734, "global_step": 116265, "epoch": 960} {"train_loss": -39.58258819580078, "global_step": 116266, "epoch": 960} {"train_loss": -40.08059310913086, "global_step": 116267, "epoch": 960} {"train_loss": -39.45805740356445, "global_step": 116268, "epoch": 960} {"train_loss": -39.53972625732422, "global_step": 116269, "epoch": 960} {"train_loss": -40.224884033203125, "global_step": 116270, "epoch": 960} {"train_loss": -39.083431243896484, "global_step": 116271, "epoch": 960} {"train_loss": -38.8823127746582, "global_step": 116272, "epoch": 960} {"train_loss": -39.9058723449707, "global_step": 116273, "epoch": 960} {"train_loss": -39.981300354003906, "global_step": 116274, "epoch": 960} {"train_loss": -39.315555572509766, "global_step": 116275, "epoch": 960} {"train_loss": -40.204952239990234, "global_step": 116276, "epoch": 960} {"train_loss": -40.368133544921875, "global_step": 116277, "epoch": 960} {"train_loss": -39.08993148803711, "global_step": 116278, "epoch": 960} {"train_loss": -39.85006332397461, "global_step": 116279, "epoch": 960} {"train_loss": -38.60626873300095, "global_step": 116280, "epoch": 960, "val_loss": 2699542.25} {"train_loss": -39.74059295654297, "global_step": 116281, "epoch": 961} {"train_loss": -39.3929328918457, "global_step": 116282, "epoch": 961} {"train_loss": -39.63262939453125, "global_step": 116283, "epoch": 961} {"train_loss": -39.41538619995117, "global_step": 116284, "epoch": 961} {"train_loss": -40.01667404174805, "global_step": 116285, "epoch": 961} {"train_loss": -39.66241455078125, "global_step": 116286, "epoch": 961} {"train_loss": -39.299373626708984, "global_step": 116287, "epoch": 961} {"train_loss": -39.79505157470703, "global_step": 116288, "epoch": 961} {"train_loss": -40.3514289855957, "global_step": 116289, "epoch": 961} {"train_loss": -40.2555046081543, "global_step": 116290, "epoch": 961} {"train_loss": -40.523128509521484, "global_step": 116291, "epoch": 961} {"train_loss": -40.18971633911133, "global_step": 116292, "epoch": 961} {"train_loss": -40.145870208740234, "global_step": 116293, "epoch": 961} {"train_loss": -39.83967208862305, "global_step": 116294, "epoch": 961} {"train_loss": -40.428836822509766, "global_step": 116295, "epoch": 961} {"train_loss": -40.455806732177734, "global_step": 116296, "epoch": 961} {"train_loss": -40.30808639526367, "global_step": 116297, "epoch": 961} {"train_loss": -40.14917755126953, "global_step": 116298, "epoch": 961} {"train_loss": -40.27804183959961, "global_step": 116299, "epoch": 961} {"train_loss": -40.51513671875, "global_step": 116300, "epoch": 961} {"train_loss": -39.50414276123047, "global_step": 116301, "epoch": 961} {"train_loss": -39.9226188659668, "global_step": 116302, "epoch": 961} {"train_loss": -39.33127212524414, "global_step": 116303, "epoch": 961} {"train_loss": -38.31874465942383, "global_step": 116304, "epoch": 961} {"train_loss": -37.02352523803711, "global_step": 116305, "epoch": 961} {"train_loss": -39.58317184448242, "global_step": 116306, "epoch": 961} {"train_loss": -39.94495391845703, "global_step": 116307, "epoch": 961} {"train_loss": -39.743072509765625, "global_step": 116308, "epoch": 961} {"train_loss": -38.78120040893555, "global_step": 116309, "epoch": 961} {"train_loss": -38.63093948364258, "global_step": 116310, "epoch": 961} {"train_loss": -38.430267333984375, "global_step": 116311, "epoch": 961} {"train_loss": -36.62154006958008, "global_step": 116312, "epoch": 961} {"train_loss": -36.93552780151367, "global_step": 116313, "epoch": 961} {"train_loss": -38.24406051635742, "global_step": 116314, "epoch": 961} {"train_loss": -39.97280502319336, "global_step": 116315, "epoch": 961} {"train_loss": -40.15806198120117, "global_step": 116316, "epoch": 961} {"train_loss": -38.77010726928711, "global_step": 116317, "epoch": 961} {"train_loss": -38.728187561035156, "global_step": 116318, "epoch": 961} {"train_loss": -38.952362060546875, "global_step": 116319, "epoch": 961} {"train_loss": -34.456417083740234, "global_step": 116320, "epoch": 961} {"train_loss": -38.425655364990234, "global_step": 116321, "epoch": 961} {"train_loss": -36.79447555541992, "global_step": 116322, "epoch": 961} {"train_loss": -36.438804626464844, "global_step": 116323, "epoch": 961} {"train_loss": -38.91432571411133, "global_step": 116324, "epoch": 961} {"train_loss": -37.826839447021484, "global_step": 116325, "epoch": 961} {"train_loss": -34.836952209472656, "global_step": 116326, "epoch": 961} {"train_loss": -39.75261306762695, "global_step": 116327, "epoch": 961} {"train_loss": -36.16184997558594, "global_step": 116328, "epoch": 961} {"train_loss": -34.621826171875, "global_step": 116329, "epoch": 961} {"train_loss": -34.905426025390625, "global_step": 116330, "epoch": 961} {"train_loss": -36.385963439941406, "global_step": 116331, "epoch": 961} {"train_loss": -36.40147399902344, "global_step": 116332, "epoch": 961} {"train_loss": -36.77555465698242, "global_step": 116333, "epoch": 961} {"train_loss": -35.90476989746094, "global_step": 116334, "epoch": 961} {"train_loss": -38.053321838378906, "global_step": 116335, "epoch": 961} {"train_loss": -37.918212890625, "global_step": 116336, "epoch": 961} {"train_loss": -36.27143859863281, "global_step": 116337, "epoch": 961} {"train_loss": -37.06502914428711, "global_step": 116338, "epoch": 961} {"train_loss": -36.09901809692383, "global_step": 116339, "epoch": 961} {"train_loss": -38.32546615600586, "global_step": 116340, "epoch": 961} {"train_loss": -35.79877853393555, "global_step": 116341, "epoch": 961} {"train_loss": -36.09309768676758, "global_step": 116342, "epoch": 961} {"train_loss": -37.24209213256836, "global_step": 116343, "epoch": 961} {"train_loss": -37.90960693359375, "global_step": 116344, "epoch": 961} {"train_loss": -38.26819610595703, "global_step": 116345, "epoch": 961} {"train_loss": -37.8300666809082, "global_step": 116346, "epoch": 961} {"train_loss": -38.620662689208984, "global_step": 116347, "epoch": 961} {"train_loss": -38.09172821044922, "global_step": 116348, "epoch": 961} {"train_loss": -38.8125114440918, "global_step": 116349, "epoch": 961} {"train_loss": -38.90388870239258, "global_step": 116350, "epoch": 961} {"train_loss": -38.812965393066406, "global_step": 116351, "epoch": 961} {"train_loss": -39.04403305053711, "global_step": 116352, "epoch": 961} {"train_loss": -39.34833908081055, "global_step": 116353, "epoch": 961} {"train_loss": -39.40843963623047, "global_step": 116354, "epoch": 961} {"train_loss": -38.34159469604492, "global_step": 116355, "epoch": 961} {"train_loss": -39.11350631713867, "global_step": 116356, "epoch": 961} {"train_loss": -39.081520080566406, "global_step": 116357, "epoch": 961} {"train_loss": -38.77875518798828, "global_step": 116358, "epoch": 961} {"train_loss": -39.2211799621582, "global_step": 116359, "epoch": 961} {"train_loss": -39.673919677734375, "global_step": 116360, "epoch": 961} {"train_loss": -39.4178466796875, "global_step": 116361, "epoch": 961} {"train_loss": -39.240081787109375, "global_step": 116362, "epoch": 961} {"train_loss": -39.00448989868164, "global_step": 116363, "epoch": 961} {"train_loss": -39.689300537109375, "global_step": 116364, "epoch": 961} {"train_loss": -39.23895263671875, "global_step": 116365, "epoch": 961} {"train_loss": -39.48519515991211, "global_step": 116366, "epoch": 961} {"train_loss": -40.395931243896484, "global_step": 116367, "epoch": 961} {"train_loss": -39.857234954833984, "global_step": 116368, "epoch": 961} {"train_loss": -39.85205841064453, "global_step": 116369, "epoch": 961} {"train_loss": -39.9394416809082, "global_step": 116370, "epoch": 961} {"train_loss": -39.6660270690918, "global_step": 116371, "epoch": 961} {"train_loss": -39.69569778442383, "global_step": 116372, "epoch": 961} {"train_loss": -39.811458587646484, "global_step": 116373, "epoch": 961} {"train_loss": -40.11402893066406, "global_step": 116374, "epoch": 961} {"train_loss": -39.684810638427734, "global_step": 116375, "epoch": 961} {"train_loss": -40.233150482177734, "global_step": 116376, "epoch": 961} {"train_loss": -40.04172897338867, "global_step": 116377, "epoch": 961} {"train_loss": -39.570343017578125, "global_step": 116378, "epoch": 961} {"train_loss": -40.30108642578125, "global_step": 116379, "epoch": 961} {"train_loss": -39.855770111083984, "global_step": 116380, "epoch": 961} {"train_loss": -39.92082214355469, "global_step": 116381, "epoch": 961} {"train_loss": -40.40890121459961, "global_step": 116382, "epoch": 961} {"train_loss": -40.24169158935547, "global_step": 116383, "epoch": 961} {"train_loss": -40.10712814331055, "global_step": 116384, "epoch": 961} {"train_loss": -40.6598014831543, "global_step": 116385, "epoch": 961} {"train_loss": -39.43709182739258, "global_step": 116386, "epoch": 961} {"train_loss": -40.08650207519531, "global_step": 116387, "epoch": 961} {"train_loss": -40.10884475708008, "global_step": 116388, "epoch": 961} {"train_loss": -40.28357696533203, "global_step": 116389, "epoch": 961} {"train_loss": -40.42414093017578, "global_step": 116390, "epoch": 961} {"train_loss": -40.6154670715332, "global_step": 116391, "epoch": 961} {"train_loss": -40.130767822265625, "global_step": 116392, "epoch": 961} {"train_loss": -39.23458480834961, "global_step": 116393, "epoch": 961} {"train_loss": -40.5770263671875, "global_step": 116394, "epoch": 961} {"train_loss": -40.611427307128906, "global_step": 116395, "epoch": 961} {"train_loss": -40.500572204589844, "global_step": 116396, "epoch": 961} {"train_loss": -40.25437545776367, "global_step": 116397, "epoch": 961} {"train_loss": -40.73159408569336, "global_step": 116398, "epoch": 961} {"train_loss": -39.754634857177734, "global_step": 116399, "epoch": 961} {"train_loss": -39.67595291137695, "global_step": 116400, "epoch": 961} {"train_loss": -38.987305034290664, "global_step": 116401, "epoch": 961, "val_loss": 2704511.75} {"train_loss": -38.913108825683594, "global_step": 116402, "epoch": 962} {"train_loss": -39.65130615234375, "global_step": 116403, "epoch": 962} {"train_loss": -39.0568962097168, "global_step": 116404, "epoch": 962} {"train_loss": -39.007755279541016, "global_step": 116405, "epoch": 962} {"train_loss": -38.35736083984375, "global_step": 116406, "epoch": 962} {"train_loss": -38.659889221191406, "global_step": 116407, "epoch": 962} {"train_loss": -39.736061096191406, "global_step": 116408, "epoch": 962} {"train_loss": -38.662757873535156, "global_step": 116409, "epoch": 962} {"train_loss": -34.46390151977539, "global_step": 116410, "epoch": 962} {"train_loss": -35.871089935302734, "global_step": 116411, "epoch": 962} {"train_loss": -36.884883880615234, "global_step": 116412, "epoch": 962} {"train_loss": -36.001338958740234, "global_step": 116413, "epoch": 962} {"train_loss": -35.52633285522461, "global_step": 116414, "epoch": 962} {"train_loss": -37.4787712097168, "global_step": 116415, "epoch": 962} {"train_loss": -37.383785247802734, "global_step": 116416, "epoch": 962} {"train_loss": -34.96778869628906, "global_step": 116417, "epoch": 962} {"train_loss": -38.11848068237305, "global_step": 116418, "epoch": 962} {"train_loss": -33.98491668701172, "global_step": 116419, "epoch": 962} {"train_loss": -39.071083068847656, "global_step": 116420, "epoch": 962} {"train_loss": -35.19794464111328, "global_step": 116421, "epoch": 962} {"train_loss": -36.610633850097656, "global_step": 116422, "epoch": 962} {"train_loss": -37.082759857177734, "global_step": 116423, "epoch": 962} {"train_loss": -35.08552932739258, "global_step": 116424, "epoch": 962} {"train_loss": -34.006771087646484, "global_step": 116425, "epoch": 962} {"train_loss": -37.392303466796875, "global_step": 116426, "epoch": 962} {"train_loss": -36.5400505065918, "global_step": 116427, "epoch": 962} {"train_loss": -37.02241897583008, "global_step": 116428, "epoch": 962} {"train_loss": -38.5360221862793, "global_step": 116429, "epoch": 962} {"train_loss": -35.93795394897461, "global_step": 116430, "epoch": 962} {"train_loss": -36.77325439453125, "global_step": 116431, "epoch": 962} {"train_loss": -37.921302795410156, "global_step": 116432, "epoch": 962} {"train_loss": -38.02608871459961, "global_step": 116433, "epoch": 962} {"train_loss": -37.8966178894043, "global_step": 116434, "epoch": 962} {"train_loss": -37.562313079833984, "global_step": 116435, "epoch": 962} {"train_loss": -38.522850036621094, "global_step": 116436, "epoch": 962} {"train_loss": -38.16319274902344, "global_step": 116437, "epoch": 962} {"train_loss": -36.42533493041992, "global_step": 116438, "epoch": 962} {"train_loss": -36.91607666015625, "global_step": 116439, "epoch": 962} {"train_loss": -38.505470275878906, "global_step": 116440, "epoch": 962} {"train_loss": -38.57121276855469, "global_step": 116441, "epoch": 962} {"train_loss": -38.661407470703125, "global_step": 116442, "epoch": 962} {"train_loss": -38.24025344848633, "global_step": 116443, "epoch": 962} {"train_loss": -38.40867233276367, "global_step": 116444, "epoch": 962} {"train_loss": -39.51715850830078, "global_step": 116445, "epoch": 962} {"train_loss": -38.38112258911133, "global_step": 116446, "epoch": 962} {"train_loss": -38.78242874145508, "global_step": 116447, "epoch": 962} {"train_loss": -39.28681564331055, "global_step": 116448, "epoch": 962} {"train_loss": -39.06416702270508, "global_step": 116449, "epoch": 962} {"train_loss": -39.0040283203125, "global_step": 116450, "epoch": 962} {"train_loss": -39.9061279296875, "global_step": 116451, "epoch": 962} {"train_loss": -39.17149353027344, "global_step": 116452, "epoch": 962} {"train_loss": -39.52645492553711, "global_step": 116453, "epoch": 962} {"train_loss": -39.5201301574707, "global_step": 116454, "epoch": 962} {"train_loss": -39.73076248168945, "global_step": 116455, "epoch": 962} {"train_loss": -39.6942138671875, "global_step": 116456, "epoch": 962} {"train_loss": -39.42290496826172, "global_step": 116457, "epoch": 962} {"train_loss": -39.65143585205078, "global_step": 116458, "epoch": 962} {"train_loss": -39.79302215576172, "global_step": 116459, "epoch": 962} {"train_loss": -39.648860931396484, "global_step": 116460, "epoch": 962} {"train_loss": -39.545753479003906, "global_step": 116461, "epoch": 962} {"train_loss": -39.20633316040039, "global_step": 116462, "epoch": 962} {"train_loss": -39.67557907104492, "global_step": 116463, "epoch": 962} {"train_loss": -39.8172721862793, "global_step": 116464, "epoch": 962} {"train_loss": -39.485877990722656, "global_step": 116465, "epoch": 962} {"train_loss": -39.90846633911133, "global_step": 116466, "epoch": 962} {"train_loss": -39.403724670410156, "global_step": 116467, "epoch": 962} {"train_loss": -39.67854309082031, "global_step": 116468, "epoch": 962} {"train_loss": -39.86542510986328, "global_step": 116469, "epoch": 962} {"train_loss": -39.899532318115234, "global_step": 116470, "epoch": 962} {"train_loss": -39.45002365112305, "global_step": 116471, "epoch": 962} {"train_loss": -38.92597198486328, "global_step": 116472, "epoch": 962} {"train_loss": -40.00440216064453, "global_step": 116473, "epoch": 962} {"train_loss": -39.23219680786133, "global_step": 116474, "epoch": 962} {"train_loss": -39.493064880371094, "global_step": 116475, "epoch": 962} {"train_loss": -39.462554931640625, "global_step": 116476, "epoch": 962} {"train_loss": -40.119056701660156, "global_step": 116477, "epoch": 962} {"train_loss": -39.94375991821289, "global_step": 116478, "epoch": 962} {"train_loss": -39.597412109375, "global_step": 116479, "epoch": 962} {"train_loss": -40.1021614074707, "global_step": 116480, "epoch": 962} {"train_loss": -40.00444412231445, "global_step": 116481, "epoch": 962} {"train_loss": -38.71969223022461, "global_step": 116482, "epoch": 962} {"train_loss": -39.58107376098633, "global_step": 116483, "epoch": 962} {"train_loss": -39.36241912841797, "global_step": 116484, "epoch": 962} {"train_loss": -39.61478805541992, "global_step": 116485, "epoch": 962} {"train_loss": -40.06889724731445, "global_step": 116486, "epoch": 962} {"train_loss": -39.54107666015625, "global_step": 116487, "epoch": 962} {"train_loss": -38.86859130859375, "global_step": 116488, "epoch": 962} {"train_loss": -39.05891799926758, "global_step": 116489, "epoch": 962} {"train_loss": -40.29176330566406, "global_step": 116490, "epoch": 962} {"train_loss": -39.304481506347656, "global_step": 116491, "epoch": 962} {"train_loss": -39.768959045410156, "global_step": 116492, "epoch": 962} {"train_loss": -39.522544860839844, "global_step": 116493, "epoch": 962} {"train_loss": -39.799293518066406, "global_step": 116494, "epoch": 962} {"train_loss": -38.646827697753906, "global_step": 116495, "epoch": 962} {"train_loss": -37.86030960083008, "global_step": 116496, "epoch": 962} {"train_loss": -38.93282699584961, "global_step": 116497, "epoch": 962} {"train_loss": -39.639198303222656, "global_step": 116498, "epoch": 962} {"train_loss": -40.1030158996582, "global_step": 116499, "epoch": 962} {"train_loss": -39.954017639160156, "global_step": 116500, "epoch": 962} {"train_loss": -39.43412399291992, "global_step": 116501, "epoch": 962} {"train_loss": -39.6603889465332, "global_step": 116502, "epoch": 962} {"train_loss": -39.79841995239258, "global_step": 116503, "epoch": 962} {"train_loss": -39.8405647277832, "global_step": 116504, "epoch": 962} {"train_loss": -37.462337493896484, "global_step": 116505, "epoch": 962} {"train_loss": -37.913734436035156, "global_step": 116506, "epoch": 962} {"train_loss": -38.63885498046875, "global_step": 116507, "epoch": 962} {"train_loss": -38.911224365234375, "global_step": 116508, "epoch": 962} {"train_loss": -38.40653610229492, "global_step": 116509, "epoch": 962} {"train_loss": -38.794349670410156, "global_step": 116510, "epoch": 962} {"train_loss": -37.452972412109375, "global_step": 116511, "epoch": 962} {"train_loss": -37.729183197021484, "global_step": 116512, "epoch": 962} {"train_loss": -38.45083236694336, "global_step": 116513, "epoch": 962} {"train_loss": -38.00742721557617, "global_step": 116514, "epoch": 962} {"train_loss": -36.86886215209961, "global_step": 116515, "epoch": 962} {"train_loss": -37.473419189453125, "global_step": 116516, "epoch": 962} {"train_loss": -38.95151138305664, "global_step": 116517, "epoch": 962} {"train_loss": -39.26962661743164, "global_step": 116518, "epoch": 962} {"train_loss": -38.074867248535156, "global_step": 116519, "epoch": 962} {"train_loss": -39.20952224731445, "global_step": 116520, "epoch": 962} {"train_loss": -38.76941680908203, "global_step": 116521, "epoch": 962} {"train_loss": -38.56130243726998, "global_step": 116522, "epoch": 962, "val_loss": 2783883.5} {"train_loss": -39.040401458740234, "global_step": 116523, "epoch": 963} {"train_loss": -37.41449737548828, "global_step": 116524, "epoch": 963} {"train_loss": -38.346435546875, "global_step": 116525, "epoch": 963} {"train_loss": -39.709598541259766, "global_step": 116526, "epoch": 963} {"train_loss": -38.37757110595703, "global_step": 116527, "epoch": 963} {"train_loss": -39.44740676879883, "global_step": 116528, "epoch": 963} {"train_loss": -39.439571380615234, "global_step": 116529, "epoch": 963} {"train_loss": -38.68771743774414, "global_step": 116530, "epoch": 963} {"train_loss": -38.77037048339844, "global_step": 116531, "epoch": 963} {"train_loss": -40.15240478515625, "global_step": 116532, "epoch": 963} {"train_loss": -39.105712890625, "global_step": 116533, "epoch": 963} {"train_loss": -38.98042678833008, "global_step": 116534, "epoch": 963} {"train_loss": -39.2011604309082, "global_step": 116535, "epoch": 963} {"train_loss": -39.252193450927734, "global_step": 116536, "epoch": 963} {"train_loss": -38.34149169921875, "global_step": 116537, "epoch": 963} {"train_loss": -40.12751770019531, "global_step": 116538, "epoch": 963} {"train_loss": -40.13682174682617, "global_step": 116539, "epoch": 963} {"train_loss": -40.155391693115234, "global_step": 116540, "epoch": 963} {"train_loss": -39.730594635009766, "global_step": 116541, "epoch": 963} {"train_loss": -40.2767219543457, "global_step": 116542, "epoch": 963} {"train_loss": -39.565181732177734, "global_step": 116543, "epoch": 963} {"train_loss": -39.789878845214844, "global_step": 116544, "epoch": 963} {"train_loss": -39.58071517944336, "global_step": 116545, "epoch": 963} {"train_loss": -40.46683883666992, "global_step": 116546, "epoch": 963} {"train_loss": -38.96389389038086, "global_step": 116547, "epoch": 963} {"train_loss": -39.77456283569336, "global_step": 116548, "epoch": 963} {"train_loss": -39.448394775390625, "global_step": 116549, "epoch": 963} {"train_loss": -39.30873107910156, "global_step": 116550, "epoch": 963} {"train_loss": -38.71772003173828, "global_step": 116551, "epoch": 963} {"train_loss": -39.80149459838867, "global_step": 116552, "epoch": 963} {"train_loss": -40.376808166503906, "global_step": 116553, "epoch": 963} {"train_loss": -38.93210220336914, "global_step": 116554, "epoch": 963} {"train_loss": -38.3294563293457, "global_step": 116555, "epoch": 963} {"train_loss": -39.62807083129883, "global_step": 116556, "epoch": 963} {"train_loss": -39.976436614990234, "global_step": 116557, "epoch": 963} {"train_loss": -38.88655471801758, "global_step": 116558, "epoch": 963} {"train_loss": -39.14469528198242, "global_step": 116559, "epoch": 963} {"train_loss": -39.5045166015625, "global_step": 116560, "epoch": 963} {"train_loss": -39.36738204956055, "global_step": 116561, "epoch": 963} {"train_loss": -39.13462448120117, "global_step": 116562, "epoch": 963} {"train_loss": -38.97016525268555, "global_step": 116563, "epoch": 963} {"train_loss": -37.41300582885742, "global_step": 116564, "epoch": 963} {"train_loss": -35.42963409423828, "global_step": 116565, "epoch": 963} {"train_loss": -39.95374298095703, "global_step": 116566, "epoch": 963} {"train_loss": -35.98775863647461, "global_step": 116567, "epoch": 963} {"train_loss": -37.95258712768555, "global_step": 116568, "epoch": 963} {"train_loss": -36.17360305786133, "global_step": 116569, "epoch": 963} {"train_loss": -36.18027877807617, "global_step": 116570, "epoch": 963} {"train_loss": -38.26430892944336, "global_step": 116571, "epoch": 963} {"train_loss": -35.62846374511719, "global_step": 116572, "epoch": 963} {"train_loss": -39.766082763671875, "global_step": 116573, "epoch": 963} {"train_loss": -36.0916862487793, "global_step": 116574, "epoch": 963} {"train_loss": -38.5207633972168, "global_step": 116575, "epoch": 963} {"train_loss": -38.12034225463867, "global_step": 116576, "epoch": 963} {"train_loss": -36.3203010559082, "global_step": 116577, "epoch": 963} {"train_loss": -39.20064926147461, "global_step": 116578, "epoch": 963} {"train_loss": -37.81269454956055, "global_step": 116579, "epoch": 963} {"train_loss": -38.97108840942383, "global_step": 116580, "epoch": 963} {"train_loss": -39.03371810913086, "global_step": 116581, "epoch": 963} {"train_loss": -38.131439208984375, "global_step": 116582, "epoch": 963} {"train_loss": -39.604671478271484, "global_step": 116583, "epoch": 963} {"train_loss": -38.87374496459961, "global_step": 116584, "epoch": 963} {"train_loss": -39.208534240722656, "global_step": 116585, "epoch": 963} {"train_loss": -39.11487579345703, "global_step": 116586, "epoch": 963} {"train_loss": -38.68783187866211, "global_step": 116587, "epoch": 963} {"train_loss": -38.99619674682617, "global_step": 116588, "epoch": 963} {"train_loss": -38.80781936645508, "global_step": 116589, "epoch": 963} {"train_loss": -39.29026412963867, "global_step": 116590, "epoch": 963} {"train_loss": -37.91807174682617, "global_step": 116591, "epoch": 963} {"train_loss": -39.39105224609375, "global_step": 116592, "epoch": 963} {"train_loss": -38.25664138793945, "global_step": 116593, "epoch": 963} {"train_loss": -39.70595932006836, "global_step": 116594, "epoch": 963} {"train_loss": -39.05428695678711, "global_step": 116595, "epoch": 963} {"train_loss": -39.90584182739258, "global_step": 116596, "epoch": 963} {"train_loss": -39.19357681274414, "global_step": 116597, "epoch": 963} {"train_loss": -39.74353790283203, "global_step": 116598, "epoch": 963} {"train_loss": -38.6524658203125, "global_step": 116599, "epoch": 963} {"train_loss": -40.01186752319336, "global_step": 116600, "epoch": 963} {"train_loss": -39.29850769042969, "global_step": 116601, "epoch": 963} {"train_loss": -39.49686813354492, "global_step": 116602, "epoch": 963} {"train_loss": -39.88554382324219, "global_step": 116603, "epoch": 963} {"train_loss": -39.458797454833984, "global_step": 116604, "epoch": 963} {"train_loss": -39.621578216552734, "global_step": 116605, "epoch": 963} {"train_loss": -40.19489288330078, "global_step": 116606, "epoch": 963} {"train_loss": -39.83285140991211, "global_step": 116607, "epoch": 963} {"train_loss": -39.7541618347168, "global_step": 116608, "epoch": 963} {"train_loss": -39.379188537597656, "global_step": 116609, "epoch": 963} {"train_loss": -39.01359176635742, "global_step": 116610, "epoch": 963} {"train_loss": -40.115509033203125, "global_step": 116611, "epoch": 963} {"train_loss": -39.35166549682617, "global_step": 116612, "epoch": 963} {"train_loss": -39.01380157470703, "global_step": 116613, "epoch": 963} {"train_loss": -39.728492736816406, "global_step": 116614, "epoch": 963} {"train_loss": -40.09714889526367, "global_step": 116615, "epoch": 963} {"train_loss": -39.50360107421875, "global_step": 116616, "epoch": 963} {"train_loss": -39.74125671386719, "global_step": 116617, "epoch": 963} {"train_loss": -40.1513671875, "global_step": 116618, "epoch": 963} {"train_loss": -39.33967208862305, "global_step": 116619, "epoch": 963} {"train_loss": -40.26227569580078, "global_step": 116620, "epoch": 963} {"train_loss": -40.33019256591797, "global_step": 116621, "epoch": 963} {"train_loss": -39.97211837768555, "global_step": 116622, "epoch": 963} {"train_loss": -40.187538146972656, "global_step": 116623, "epoch": 963} {"train_loss": -40.28896713256836, "global_step": 116624, "epoch": 963} {"train_loss": -39.65790557861328, "global_step": 116625, "epoch": 963} {"train_loss": -39.98114776611328, "global_step": 116626, "epoch": 963} {"train_loss": -39.73897933959961, "global_step": 116627, "epoch": 963} {"train_loss": -40.27214431762695, "global_step": 116628, "epoch": 963} {"train_loss": -39.99879455566406, "global_step": 116629, "epoch": 963} {"train_loss": -39.926326751708984, "global_step": 116630, "epoch": 963} {"train_loss": -40.21556091308594, "global_step": 116631, "epoch": 963} {"train_loss": -40.64006042480469, "global_step": 116632, "epoch": 963} {"train_loss": -40.47451400756836, "global_step": 116633, "epoch": 963} {"train_loss": -40.714271545410156, "global_step": 116634, "epoch": 963} {"train_loss": -40.252986907958984, "global_step": 116635, "epoch": 963} {"train_loss": -39.680519104003906, "global_step": 116636, "epoch": 963} {"train_loss": -39.56171798706055, "global_step": 116637, "epoch": 963} {"train_loss": -39.42814254760742, "global_step": 116638, "epoch": 963} {"train_loss": -38.82246780395508, "global_step": 116639, "epoch": 963} {"train_loss": -38.9071044921875, "global_step": 116640, "epoch": 963} {"train_loss": -40.6318359375, "global_step": 116641, "epoch": 963} {"train_loss": -40.44435501098633, "global_step": 116642, "epoch": 963} {"train_loss": -39.216042163943456, "global_step": 116643, "epoch": 963, "val_loss": 2694437.25} {"train_loss": -39.6797981262207, "global_step": 116644, "epoch": 964} {"train_loss": -38.14802169799805, "global_step": 116645, "epoch": 964} {"train_loss": -37.76316452026367, "global_step": 116646, "epoch": 964} {"train_loss": -38.56283187866211, "global_step": 116647, "epoch": 964} {"train_loss": -40.3040771484375, "global_step": 116648, "epoch": 964} {"train_loss": -40.26093673706055, "global_step": 116649, "epoch": 964} {"train_loss": -39.681758880615234, "global_step": 116650, "epoch": 964} {"train_loss": -38.69197082519531, "global_step": 116651, "epoch": 964} {"train_loss": -35.387962341308594, "global_step": 116652, "epoch": 964} {"train_loss": -35.9595947265625, "global_step": 116653, "epoch": 964} {"train_loss": -34.66951370239258, "global_step": 116654, "epoch": 964} {"train_loss": -32.29505157470703, "global_step": 116655, "epoch": 964} {"train_loss": -36.81635665893555, "global_step": 116656, "epoch": 964} {"train_loss": -36.975528717041016, "global_step": 116657, "epoch": 964} {"train_loss": -35.4542236328125, "global_step": 116658, "epoch": 964} {"train_loss": -35.17623519897461, "global_step": 116659, "epoch": 964} {"train_loss": -35.833099365234375, "global_step": 116660, "epoch": 964} {"train_loss": -34.76581954956055, "global_step": 116661, "epoch": 964} {"train_loss": -33.68624496459961, "global_step": 116662, "epoch": 964} {"train_loss": -34.592403411865234, "global_step": 116663, "epoch": 964} {"train_loss": -36.87027359008789, "global_step": 116664, "epoch": 964} {"train_loss": -35.62012481689453, "global_step": 116665, "epoch": 964} {"train_loss": -36.55623245239258, "global_step": 116666, "epoch": 964} {"train_loss": -35.82699966430664, "global_step": 116667, "epoch": 964} {"train_loss": -36.79000473022461, "global_step": 116668, "epoch": 964} {"train_loss": -36.79830551147461, "global_step": 116669, "epoch": 964} {"train_loss": -37.703651428222656, "global_step": 116670, "epoch": 964} {"train_loss": -37.33670425415039, "global_step": 116671, "epoch": 964} {"train_loss": -37.22370529174805, "global_step": 116672, "epoch": 964} {"train_loss": -37.575313568115234, "global_step": 116673, "epoch": 964} {"train_loss": -38.29307174682617, "global_step": 116674, "epoch": 964} {"train_loss": -38.39608383178711, "global_step": 116675, "epoch": 964} {"train_loss": -38.644222259521484, "global_step": 116676, "epoch": 964} {"train_loss": -38.97895431518555, "global_step": 116677, "epoch": 964} {"train_loss": -39.27633285522461, "global_step": 116678, "epoch": 964} {"train_loss": -39.17142105102539, "global_step": 116679, "epoch": 964} {"train_loss": -39.64060974121094, "global_step": 116680, "epoch": 964} {"train_loss": -39.74605178833008, "global_step": 116681, "epoch": 964} {"train_loss": -39.37606430053711, "global_step": 116682, "epoch": 964} {"train_loss": -39.17588424682617, "global_step": 116683, "epoch": 964} {"train_loss": -38.9676399230957, "global_step": 116684, "epoch": 964} {"train_loss": -39.258216857910156, "global_step": 116685, "epoch": 964} {"train_loss": -39.488037109375, "global_step": 116686, "epoch": 964} {"train_loss": -39.28068161010742, "global_step": 116687, "epoch": 964} {"train_loss": -39.38919448852539, "global_step": 116688, "epoch": 964} {"train_loss": -39.08570098876953, "global_step": 116689, "epoch": 964} {"train_loss": -38.922706604003906, "global_step": 116690, "epoch": 964} {"train_loss": -39.45536422729492, "global_step": 116691, "epoch": 964} {"train_loss": -39.25149154663086, "global_step": 116692, "epoch": 964} {"train_loss": -39.939449310302734, "global_step": 116693, "epoch": 964} {"train_loss": -40.25624084472656, "global_step": 116694, "epoch": 964} {"train_loss": -39.82294845581055, "global_step": 116695, "epoch": 964} {"train_loss": -38.88904571533203, "global_step": 116696, "epoch": 964} {"train_loss": -37.21574401855469, "global_step": 116697, "epoch": 964} {"train_loss": -37.5985107421875, "global_step": 116698, "epoch": 964} {"train_loss": -39.87119674682617, "global_step": 116699, "epoch": 964} {"train_loss": -38.90707778930664, "global_step": 116700, "epoch": 964} {"train_loss": -37.295108795166016, "global_step": 116701, "epoch": 964} {"train_loss": -38.383663177490234, "global_step": 116702, "epoch": 964} {"train_loss": -34.88116455078125, "global_step": 116703, "epoch": 964} {"train_loss": -35.3497428894043, "global_step": 116704, "epoch": 964} {"train_loss": -22.97330665588379, "global_step": 116705, "epoch": 964} {"train_loss": 6.634677410125732, "global_step": 116706, "epoch": 964} {"train_loss": -25.59090232849121, "global_step": 116707, "epoch": 964} {"train_loss": -17.427318572998047, "global_step": 116708, "epoch": 964} {"train_loss": -30.393896102905273, "global_step": 116709, "epoch": 964} {"train_loss": -16.996030807495117, "global_step": 116710, "epoch": 964} {"train_loss": -35.1546516418457, "global_step": 116711, "epoch": 964} {"train_loss": -21.170454025268555, "global_step": 116712, "epoch": 964} {"train_loss": -30.762805938720703, "global_step": 116713, "epoch": 964} {"train_loss": -34.19820022583008, "global_step": 116714, "epoch": 964} {"train_loss": -28.081968307495117, "global_step": 116715, "epoch": 964} {"train_loss": -30.916046142578125, "global_step": 116716, "epoch": 964} {"train_loss": -35.51375198364258, "global_step": 116717, "epoch": 964} {"train_loss": -33.0529670715332, "global_step": 116718, "epoch": 964} {"train_loss": -29.9534969329834, "global_step": 116719, "epoch": 964} {"train_loss": -34.02993392944336, "global_step": 116720, "epoch": 964} {"train_loss": -35.93599319458008, "global_step": 116721, "epoch": 964} {"train_loss": -34.3315544128418, "global_step": 116722, "epoch": 964} {"train_loss": -33.4693489074707, "global_step": 116723, "epoch": 964} {"train_loss": -34.20782470703125, "global_step": 116724, "epoch": 964} {"train_loss": -36.06612777709961, "global_step": 116725, "epoch": 964} {"train_loss": -36.27522659301758, "global_step": 116726, "epoch": 964} {"train_loss": -34.77573776245117, "global_step": 116727, "epoch": 964} {"train_loss": -34.837860107421875, "global_step": 116728, "epoch": 964} {"train_loss": -36.13437271118164, "global_step": 116729, "epoch": 964} {"train_loss": -36.44247055053711, "global_step": 116730, "epoch": 964} {"train_loss": -36.334537506103516, "global_step": 116731, "epoch": 964} {"train_loss": -36.21982955932617, "global_step": 116732, "epoch": 964} {"train_loss": -36.499263763427734, "global_step": 116733, "epoch": 964} {"train_loss": -36.554012298583984, "global_step": 116734, "epoch": 964} {"train_loss": -37.27430725097656, "global_step": 116735, "epoch": 964} {"train_loss": -37.130027770996094, "global_step": 116736, "epoch": 964} {"train_loss": -36.54793930053711, "global_step": 116737, "epoch": 964} {"train_loss": -36.63383102416992, "global_step": 116738, "epoch": 964} {"train_loss": -36.341453552246094, "global_step": 116739, "epoch": 964} {"train_loss": -37.4505615234375, "global_step": 116740, "epoch": 964} {"train_loss": -37.27368927001953, "global_step": 116741, "epoch": 964} {"train_loss": -37.09858322143555, "global_step": 116742, "epoch": 964} {"train_loss": -37.04877853393555, "global_step": 116743, "epoch": 964} {"train_loss": -37.216339111328125, "global_step": 116744, "epoch": 964} {"train_loss": -35.73868942260742, "global_step": 116745, "epoch": 964} {"train_loss": -36.549190521240234, "global_step": 116746, "epoch": 964} {"train_loss": -36.39817810058594, "global_step": 116747, "epoch": 964} {"train_loss": -33.80179977416992, "global_step": 116748, "epoch": 964} {"train_loss": -32.599891662597656, "global_step": 116749, "epoch": 964} {"train_loss": -36.2597770690918, "global_step": 116750, "epoch": 964} {"train_loss": -37.13310623168945, "global_step": 116751, "epoch": 964} {"train_loss": -34.122310638427734, "global_step": 116752, "epoch": 964} {"train_loss": -35.40055465698242, "global_step": 116753, "epoch": 964} {"train_loss": -36.50753402709961, "global_step": 116754, "epoch": 964} {"train_loss": -33.89395523071289, "global_step": 116755, "epoch": 964} {"train_loss": -34.31769943237305, "global_step": 116756, "epoch": 964} {"train_loss": -34.02849197387695, "global_step": 116757, "epoch": 964} {"train_loss": -37.3715934753418, "global_step": 116758, "epoch": 964} {"train_loss": -36.1639289855957, "global_step": 116759, "epoch": 964} {"train_loss": -36.71421432495117, "global_step": 116760, "epoch": 964} {"train_loss": -37.13715744018555, "global_step": 116761, "epoch": 964} {"train_loss": -35.6214714050293, "global_step": 116762, "epoch": 964} {"train_loss": -36.938167572021484, "global_step": 116763, "epoch": 964} {"train_loss": -35.5895736513059, "global_step": 116764, "epoch": 964, "val_loss": 2647904.75} {"train_loss": -37.16819381713867, "global_step": 116765, "epoch": 965} {"train_loss": -37.98843002319336, "global_step": 116766, "epoch": 965} {"train_loss": -36.77134323120117, "global_step": 116767, "epoch": 965} {"train_loss": -37.90386962890625, "global_step": 116768, "epoch": 965} {"train_loss": -34.195247650146484, "global_step": 116769, "epoch": 965} {"train_loss": -37.43960189819336, "global_step": 116770, "epoch": 965} {"train_loss": -37.47021484375, "global_step": 116771, "epoch": 965} {"train_loss": -37.729793548583984, "global_step": 116772, "epoch": 965} {"train_loss": -37.2036247253418, "global_step": 116773, "epoch": 965} {"train_loss": -36.94259262084961, "global_step": 116774, "epoch": 965} {"train_loss": -37.393592834472656, "global_step": 116775, "epoch": 965} {"train_loss": -36.913002014160156, "global_step": 116776, "epoch": 965} {"train_loss": -37.39976119995117, "global_step": 116777, "epoch": 965} {"train_loss": -38.2656135559082, "global_step": 116778, "epoch": 965} {"train_loss": -37.431304931640625, "global_step": 116779, "epoch": 965} {"train_loss": -38.0243034362793, "global_step": 116780, "epoch": 965} {"train_loss": -37.76374816894531, "global_step": 116781, "epoch": 965} {"train_loss": -38.08205795288086, "global_step": 116782, "epoch": 965} {"train_loss": -37.83768844604492, "global_step": 116783, "epoch": 965} {"train_loss": -37.201576232910156, "global_step": 116784, "epoch": 965} {"train_loss": -36.746253967285156, "global_step": 116785, "epoch": 965} {"train_loss": -35.9355354309082, "global_step": 116786, "epoch": 965} {"train_loss": -36.68560791015625, "global_step": 116787, "epoch": 965} {"train_loss": -38.692291259765625, "global_step": 116788, "epoch": 965} {"train_loss": -36.082740783691406, "global_step": 116789, "epoch": 965} {"train_loss": -36.69630813598633, "global_step": 116790, "epoch": 965} {"train_loss": -38.370826721191406, "global_step": 116791, "epoch": 965} {"train_loss": -36.38689041137695, "global_step": 116792, "epoch": 965} {"train_loss": -37.47434616088867, "global_step": 116793, "epoch": 965} {"train_loss": -37.63401412963867, "global_step": 116794, "epoch": 965} {"train_loss": -36.90724563598633, "global_step": 116795, "epoch": 965} {"train_loss": -38.0792121887207, "global_step": 116796, "epoch": 965} {"train_loss": -38.0257682800293, "global_step": 116797, "epoch": 965} {"train_loss": -37.991432189941406, "global_step": 116798, "epoch": 965} {"train_loss": -36.72121810913086, "global_step": 116799, "epoch": 965} {"train_loss": -37.5697135925293, "global_step": 116800, "epoch": 965} {"train_loss": -37.8625373840332, "global_step": 116801, "epoch": 965} {"train_loss": -37.927486419677734, "global_step": 116802, "epoch": 965} {"train_loss": -37.26865768432617, "global_step": 116803, "epoch": 965} {"train_loss": -37.59833908081055, "global_step": 116804, "epoch": 965} {"train_loss": -37.25806427001953, "global_step": 116805, "epoch": 965} {"train_loss": -38.09699249267578, "global_step": 116806, "epoch": 965} {"train_loss": -38.089576721191406, "global_step": 116807, "epoch": 965} {"train_loss": -37.53041458129883, "global_step": 116808, "epoch": 965} {"train_loss": -35.62470245361328, "global_step": 116809, "epoch": 965} {"train_loss": -36.952430725097656, "global_step": 116810, "epoch": 965} {"train_loss": -37.40813064575195, "global_step": 116811, "epoch": 965} {"train_loss": -37.54133224487305, "global_step": 116812, "epoch": 965} {"train_loss": -37.18000411987305, "global_step": 116813, "epoch": 965} {"train_loss": -37.60802459716797, "global_step": 116814, "epoch": 965} {"train_loss": -37.68394088745117, "global_step": 116815, "epoch": 965} {"train_loss": -38.272064208984375, "global_step": 116816, "epoch": 965} {"train_loss": -38.55851364135742, "global_step": 116817, "epoch": 965} {"train_loss": -37.11017990112305, "global_step": 116818, "epoch": 965} {"train_loss": -36.814422607421875, "global_step": 116819, "epoch": 965} {"train_loss": -37.99190902709961, "global_step": 116820, "epoch": 965} {"train_loss": -38.03273391723633, "global_step": 116821, "epoch": 965} {"train_loss": -37.830501556396484, "global_step": 116822, "epoch": 965} {"train_loss": -38.290645599365234, "global_step": 116823, "epoch": 965} {"train_loss": -37.36644744873047, "global_step": 116824, "epoch": 965} {"train_loss": -37.617130279541016, "global_step": 116825, "epoch": 965} {"train_loss": -38.537662506103516, "global_step": 116826, "epoch": 965} {"train_loss": -38.09377670288086, "global_step": 116827, "epoch": 965} {"train_loss": -38.97317886352539, "global_step": 116828, "epoch": 965} {"train_loss": -39.09054183959961, "global_step": 116829, "epoch": 965} {"train_loss": -37.488468170166016, "global_step": 116830, "epoch": 965} {"train_loss": -37.93855667114258, "global_step": 116831, "epoch": 965} {"train_loss": -37.20564651489258, "global_step": 116832, "epoch": 965} {"train_loss": -35.99122619628906, "global_step": 116833, "epoch": 965} {"train_loss": -39.08457946777344, "global_step": 116834, "epoch": 965} {"train_loss": -37.928592681884766, "global_step": 116835, "epoch": 965} {"train_loss": -36.6087532043457, "global_step": 116836, "epoch": 965} {"train_loss": -38.156436920166016, "global_step": 116837, "epoch": 965} {"train_loss": -36.7550163269043, "global_step": 116838, "epoch": 965} {"train_loss": -37.9495849609375, "global_step": 116839, "epoch": 965} {"train_loss": -38.5325813293457, "global_step": 116840, "epoch": 965} {"train_loss": -36.699649810791016, "global_step": 116841, "epoch": 965} {"train_loss": -37.668338775634766, "global_step": 116842, "epoch": 965} {"train_loss": -37.26748275756836, "global_step": 116843, "epoch": 965} {"train_loss": -37.449378967285156, "global_step": 116844, "epoch": 965} {"train_loss": -36.854095458984375, "global_step": 116845, "epoch": 965} {"train_loss": -35.44828414916992, "global_step": 116846, "epoch": 965} {"train_loss": -36.576263427734375, "global_step": 116847, "epoch": 965} {"train_loss": -36.82158279418945, "global_step": 116848, "epoch": 965} {"train_loss": -36.446327209472656, "global_step": 116849, "epoch": 965} {"train_loss": -36.60301971435547, "global_step": 116850, "epoch": 965} {"train_loss": -37.10671615600586, "global_step": 116851, "epoch": 965} {"train_loss": -38.07594299316406, "global_step": 116852, "epoch": 965} {"train_loss": -37.30062484741211, "global_step": 116853, "epoch": 965} {"train_loss": -37.125083923339844, "global_step": 116854, "epoch": 965} {"train_loss": -38.0884895324707, "global_step": 116855, "epoch": 965} {"train_loss": -38.037261962890625, "global_step": 116856, "epoch": 965} {"train_loss": -37.742671966552734, "global_step": 116857, "epoch": 965} {"train_loss": -38.693580627441406, "global_step": 116858, "epoch": 965} {"train_loss": -37.62964630126953, "global_step": 116859, "epoch": 965} {"train_loss": -38.1065673828125, "global_step": 116860, "epoch": 965} {"train_loss": -38.24260330200195, "global_step": 116861, "epoch": 965} {"train_loss": -38.02202606201172, "global_step": 116862, "epoch": 965} {"train_loss": -38.304481506347656, "global_step": 116863, "epoch": 965} {"train_loss": -38.107261657714844, "global_step": 116864, "epoch": 965} {"train_loss": -37.72134780883789, "global_step": 116865, "epoch": 965} {"train_loss": -38.00452423095703, "global_step": 116866, "epoch": 965} {"train_loss": -38.53506851196289, "global_step": 116867, "epoch": 965} {"train_loss": -37.89950180053711, "global_step": 116868, "epoch": 965} {"train_loss": -37.09084701538086, "global_step": 116869, "epoch": 965} {"train_loss": -37.81563186645508, "global_step": 116870, "epoch": 965} {"train_loss": -38.07263946533203, "global_step": 116871, "epoch": 965} {"train_loss": -38.06865692138672, "global_step": 116872, "epoch": 965} {"train_loss": -38.237361907958984, "global_step": 116873, "epoch": 965} {"train_loss": -37.50278854370117, "global_step": 116874, "epoch": 965} {"train_loss": -38.275638580322266, "global_step": 116875, "epoch": 965} {"train_loss": -36.33582305908203, "global_step": 116876, "epoch": 965} {"train_loss": -38.21145248413086, "global_step": 116877, "epoch": 965} {"train_loss": -36.845680236816406, "global_step": 116878, "epoch": 965} {"train_loss": -36.05953598022461, "global_step": 116879, "epoch": 965} {"train_loss": -34.6496696472168, "global_step": 116880, "epoch": 965} {"train_loss": -25.103511810302734, "global_step": 116881, "epoch": 965} {"train_loss": -22.048526763916016, "global_step": 116882, "epoch": 965} {"train_loss": -34.0555534362793, "global_step": 116883, "epoch": 965} {"train_loss": -34.18404769897461, "global_step": 116884, "epoch": 965} {"train_loss": -37.159276095303625, "global_step": 116885, "epoch": 965, "val_loss": 2835605.25} {"train_loss": -34.725502014160156, "global_step": 116886, "epoch": 966} {"train_loss": -34.51055145263672, "global_step": 116887, "epoch": 966} {"train_loss": -37.65044021606445, "global_step": 116888, "epoch": 966} {"train_loss": -35.86119842529297, "global_step": 116889, "epoch": 966} {"train_loss": -37.2174186706543, "global_step": 116890, "epoch": 966} {"train_loss": -36.977516174316406, "global_step": 116891, "epoch": 966} {"train_loss": -36.77596664428711, "global_step": 116892, "epoch": 966} {"train_loss": -37.42811965942383, "global_step": 116893, "epoch": 966} {"train_loss": -36.359432220458984, "global_step": 116894, "epoch": 966} {"train_loss": -37.27511215209961, "global_step": 116895, "epoch": 966} {"train_loss": -37.07987594604492, "global_step": 116896, "epoch": 966} {"train_loss": -37.732887268066406, "global_step": 116897, "epoch": 966} {"train_loss": -36.94932174682617, "global_step": 116898, "epoch": 966} {"train_loss": -37.28756332397461, "global_step": 116899, "epoch": 966} {"train_loss": -37.201698303222656, "global_step": 116900, "epoch": 966} {"train_loss": -36.89223861694336, "global_step": 116901, "epoch": 966} {"train_loss": -37.27690505981445, "global_step": 116902, "epoch": 966} {"train_loss": -37.71928787231445, "global_step": 116903, "epoch": 966} {"train_loss": -38.00753402709961, "global_step": 116904, "epoch": 966} {"train_loss": -36.73451614379883, "global_step": 116905, "epoch": 966} {"train_loss": -37.571529388427734, "global_step": 116906, "epoch": 966} {"train_loss": -37.98004913330078, "global_step": 116907, "epoch": 966} {"train_loss": -38.30296325683594, "global_step": 116908, "epoch": 966} {"train_loss": -38.583045959472656, "global_step": 116909, "epoch": 966} {"train_loss": -37.055904388427734, "global_step": 116910, "epoch": 966} {"train_loss": -37.84200668334961, "global_step": 116911, "epoch": 966} {"train_loss": -38.11750411987305, "global_step": 116912, "epoch": 966} {"train_loss": -37.73575973510742, "global_step": 116913, "epoch": 966} {"train_loss": -37.09383773803711, "global_step": 116914, "epoch": 966} {"train_loss": -38.4746208190918, "global_step": 116915, "epoch": 966} {"train_loss": -36.655696868896484, "global_step": 116916, "epoch": 966} {"train_loss": -38.72323226928711, "global_step": 116917, "epoch": 966} {"train_loss": -38.26408004760742, "global_step": 116918, "epoch": 966} {"train_loss": -37.47420883178711, "global_step": 116919, "epoch": 966} {"train_loss": -38.28855514526367, "global_step": 116920, "epoch": 966} {"train_loss": -37.9293098449707, "global_step": 116921, "epoch": 966} {"train_loss": -37.4404182434082, "global_step": 116922, "epoch": 966} {"train_loss": -36.37395095825195, "global_step": 116923, "epoch": 966} {"train_loss": -37.328025817871094, "global_step": 116924, "epoch": 966} {"train_loss": -35.288429260253906, "global_step": 116925, "epoch": 966} {"train_loss": -28.12308692932129, "global_step": 116926, "epoch": 966} {"train_loss": -8.261192321777344, "global_step": 116927, "epoch": 966} {"train_loss": -15.735417366027832, "global_step": 116928, "epoch": 966} {"train_loss": -35.42359924316406, "global_step": 116929, "epoch": 966} {"train_loss": -19.163183212280273, "global_step": 116930, "epoch": 966} {"train_loss": -36.80105209350586, "global_step": 116931, "epoch": 966} {"train_loss": -27.473297119140625, "global_step": 116932, "epoch": 966} {"train_loss": -34.720298767089844, "global_step": 116933, "epoch": 966} {"train_loss": -31.13740348815918, "global_step": 116934, "epoch": 966} {"train_loss": -32.52134323120117, "global_step": 116935, "epoch": 966} {"train_loss": -35.5031623840332, "global_step": 116936, "epoch": 966} {"train_loss": -33.155677795410156, "global_step": 116937, "epoch": 966} {"train_loss": -34.45357894897461, "global_step": 116938, "epoch": 966} {"train_loss": -36.2020263671875, "global_step": 116939, "epoch": 966} {"train_loss": -34.770843505859375, "global_step": 116940, "epoch": 966} {"train_loss": -35.01405334472656, "global_step": 116941, "epoch": 966} {"train_loss": -36.29698944091797, "global_step": 116942, "epoch": 966} {"train_loss": -34.19903564453125, "global_step": 116943, "epoch": 966} {"train_loss": -35.39561080932617, "global_step": 116944, "epoch": 966} {"train_loss": -35.60738754272461, "global_step": 116945, "epoch": 966} {"train_loss": -36.383785247802734, "global_step": 116946, "epoch": 966} {"train_loss": -35.31719970703125, "global_step": 116947, "epoch": 966} {"train_loss": -36.27480697631836, "global_step": 116948, "epoch": 966} {"train_loss": -35.72501754760742, "global_step": 116949, "epoch": 966} {"train_loss": -35.21268844604492, "global_step": 116950, "epoch": 966} {"train_loss": -36.55897521972656, "global_step": 116951, "epoch": 966} {"train_loss": -34.84496307373047, "global_step": 116952, "epoch": 966} {"train_loss": -36.3018684387207, "global_step": 116953, "epoch": 966} {"train_loss": -36.62611770629883, "global_step": 116954, "epoch": 966} {"train_loss": -36.50905227661133, "global_step": 116955, "epoch": 966} {"train_loss": -36.022056579589844, "global_step": 116956, "epoch": 966} {"train_loss": -36.45647048950195, "global_step": 116957, "epoch": 966} {"train_loss": -36.4871940612793, "global_step": 116958, "epoch": 966} {"train_loss": -37.3941764831543, "global_step": 116959, "epoch": 966} {"train_loss": -36.55947494506836, "global_step": 116960, "epoch": 966} {"train_loss": -37.502227783203125, "global_step": 116961, "epoch": 966} {"train_loss": -37.5911865234375, "global_step": 116962, "epoch": 966} {"train_loss": -37.165714263916016, "global_step": 116963, "epoch": 966} {"train_loss": -37.37055587768555, "global_step": 116964, "epoch": 966} {"train_loss": -37.49959182739258, "global_step": 116965, "epoch": 966} {"train_loss": -37.2065544128418, "global_step": 116966, "epoch": 966} {"train_loss": -37.36505889892578, "global_step": 116967, "epoch": 966} {"train_loss": -37.68899154663086, "global_step": 116968, "epoch": 966} {"train_loss": -37.00815963745117, "global_step": 116969, "epoch": 966} {"train_loss": -37.480003356933594, "global_step": 116970, "epoch": 966} {"train_loss": -37.3898811340332, "global_step": 116971, "epoch": 966} {"train_loss": -37.6928825378418, "global_step": 116972, "epoch": 966} {"train_loss": -37.58866882324219, "global_step": 116973, "epoch": 966} {"train_loss": -37.995052337646484, "global_step": 116974, "epoch": 966} {"train_loss": -37.40949630737305, "global_step": 116975, "epoch": 966} {"train_loss": -36.92691421508789, "global_step": 116976, "epoch": 966} {"train_loss": -38.08772277832031, "global_step": 116977, "epoch": 966} {"train_loss": -37.61393356323242, "global_step": 116978, "epoch": 966} {"train_loss": -37.84720993041992, "global_step": 116979, "epoch": 966} {"train_loss": -37.55880355834961, "global_step": 116980, "epoch": 966} {"train_loss": -38.12556076049805, "global_step": 116981, "epoch": 966} {"train_loss": -37.99247360229492, "global_step": 116982, "epoch": 966} {"train_loss": -37.664405822753906, "global_step": 116983, "epoch": 966} {"train_loss": -38.517303466796875, "global_step": 116984, "epoch": 966} {"train_loss": -38.096221923828125, "global_step": 116985, "epoch": 966} {"train_loss": -36.51921463012695, "global_step": 116986, "epoch": 966} {"train_loss": -37.30388259887695, "global_step": 116987, "epoch": 966} {"train_loss": -37.74738311767578, "global_step": 116988, "epoch": 966} {"train_loss": -38.193214416503906, "global_step": 116989, "epoch": 966} {"train_loss": -38.65323257446289, "global_step": 116990, "epoch": 966} {"train_loss": -38.221675872802734, "global_step": 116991, "epoch": 966} {"train_loss": -37.91650390625, "global_step": 116992, "epoch": 966} {"train_loss": -35.493446350097656, "global_step": 116993, "epoch": 966} {"train_loss": -32.76583480834961, "global_step": 116994, "epoch": 966} {"train_loss": -38.211116790771484, "global_step": 116995, "epoch": 966} {"train_loss": -37.986854553222656, "global_step": 116996, "epoch": 966} {"train_loss": -38.28950119018555, "global_step": 116997, "epoch": 966} {"train_loss": -37.77393341064453, "global_step": 116998, "epoch": 966} {"train_loss": -37.502685546875, "global_step": 116999, "epoch": 966} {"train_loss": -36.97279739379883, "global_step": 117000, "epoch": 966} {"train_loss": -34.90685272216797, "global_step": 117001, "epoch": 966} {"train_loss": -38.59540939331055, "global_step": 117002, "epoch": 966} {"train_loss": -37.40699768066406, "global_step": 117003, "epoch": 966} {"train_loss": -34.77478790283203, "global_step": 117004, "epoch": 966} {"train_loss": -33.7604866027832, "global_step": 117005, "epoch": 966} {"train_loss": -36.09767134327534, "global_step": 117006, "epoch": 966, "val_loss": 2940693.25} {"train_loss": -37.48917770385742, "global_step": 117007, "epoch": 967} {"train_loss": -36.63936233520508, "global_step": 117008, "epoch": 967} {"train_loss": -37.12507629394531, "global_step": 117009, "epoch": 967} {"train_loss": -35.9326286315918, "global_step": 117010, "epoch": 967} {"train_loss": -37.506507873535156, "global_step": 117011, "epoch": 967} {"train_loss": -35.317054748535156, "global_step": 117012, "epoch": 967} {"train_loss": -33.37558364868164, "global_step": 117013, "epoch": 967} {"train_loss": -37.048282623291016, "global_step": 117014, "epoch": 967} {"train_loss": -35.521629333496094, "global_step": 117015, "epoch": 967} {"train_loss": -36.842594146728516, "global_step": 117016, "epoch": 967} {"train_loss": -36.84901809692383, "global_step": 117017, "epoch": 967} {"train_loss": -37.538604736328125, "global_step": 117018, "epoch": 967} {"train_loss": -37.0908088684082, "global_step": 117019, "epoch": 967} {"train_loss": -32.88380813598633, "global_step": 117020, "epoch": 967} {"train_loss": -36.297786712646484, "global_step": 117021, "epoch": 967} {"train_loss": -36.02281188964844, "global_step": 117022, "epoch": 967} {"train_loss": -36.416481018066406, "global_step": 117023, "epoch": 967} {"train_loss": -36.693790435791016, "global_step": 117024, "epoch": 967} {"train_loss": -32.160308837890625, "global_step": 117025, "epoch": 967} {"train_loss": -34.0756721496582, "global_step": 117026, "epoch": 967} {"train_loss": -36.7694206237793, "global_step": 117027, "epoch": 967} {"train_loss": -36.273170471191406, "global_step": 117028, "epoch": 967} {"train_loss": -35.75202941894531, "global_step": 117029, "epoch": 967} {"train_loss": -34.93798065185547, "global_step": 117030, "epoch": 967} {"train_loss": -36.567466735839844, "global_step": 117031, "epoch": 967} {"train_loss": -36.46946334838867, "global_step": 117032, "epoch": 967} {"train_loss": -36.301631927490234, "global_step": 117033, "epoch": 967} {"train_loss": -36.57724380493164, "global_step": 117034, "epoch": 967} {"train_loss": -35.06446075439453, "global_step": 117035, "epoch": 967} {"train_loss": -36.13198471069336, "global_step": 117036, "epoch": 967} {"train_loss": -36.35240936279297, "global_step": 117037, "epoch": 967} {"train_loss": -36.94624710083008, "global_step": 117038, "epoch": 967} {"train_loss": -37.49546432495117, "global_step": 117039, "epoch": 967} {"train_loss": -36.50472640991211, "global_step": 117040, "epoch": 967} {"train_loss": -36.88850021362305, "global_step": 117041, "epoch": 967} {"train_loss": -35.55183029174805, "global_step": 117042, "epoch": 967} {"train_loss": -37.4725341796875, "global_step": 117043, "epoch": 967} {"train_loss": -36.27644729614258, "global_step": 117044, "epoch": 967} {"train_loss": -36.80263900756836, "global_step": 117045, "epoch": 967} {"train_loss": -37.238563537597656, "global_step": 117046, "epoch": 967} {"train_loss": -36.77613067626953, "global_step": 117047, "epoch": 967} {"train_loss": -36.8082389831543, "global_step": 117048, "epoch": 967} {"train_loss": -37.60797119140625, "global_step": 117049, "epoch": 967} {"train_loss": -37.7088508605957, "global_step": 117050, "epoch": 967} {"train_loss": -37.62028884887695, "global_step": 117051, "epoch": 967} {"train_loss": -37.76714324951172, "global_step": 117052, "epoch": 967} {"train_loss": -37.583831787109375, "global_step": 117053, "epoch": 967} {"train_loss": -37.00129318237305, "global_step": 117054, "epoch": 967} {"train_loss": -36.79970169067383, "global_step": 117055, "epoch": 967} {"train_loss": -37.8274040222168, "global_step": 117056, "epoch": 967} {"train_loss": -37.6452522277832, "global_step": 117057, "epoch": 967} {"train_loss": -38.1530876159668, "global_step": 117058, "epoch": 967} {"train_loss": -35.89680099487305, "global_step": 117059, "epoch": 967} {"train_loss": -37.8551025390625, "global_step": 117060, "epoch": 967} {"train_loss": -37.506935119628906, "global_step": 117061, "epoch": 967} {"train_loss": -37.79446792602539, "global_step": 117062, "epoch": 967} {"train_loss": -37.95908737182617, "global_step": 117063, "epoch": 967} {"train_loss": -36.431331634521484, "global_step": 117064, "epoch": 967} {"train_loss": -34.72230529785156, "global_step": 117065, "epoch": 967} {"train_loss": -37.580787658691406, "global_step": 117066, "epoch": 967} {"train_loss": -37.716529846191406, "global_step": 117067, "epoch": 967} {"train_loss": -37.79165267944336, "global_step": 117068, "epoch": 967} {"train_loss": -36.969757080078125, "global_step": 117069, "epoch": 967} {"train_loss": -37.784420013427734, "global_step": 117070, "epoch": 967} {"train_loss": -38.01241683959961, "global_step": 117071, "epoch": 967} {"train_loss": -36.988304138183594, "global_step": 117072, "epoch": 967} {"train_loss": -37.58339309692383, "global_step": 117073, "epoch": 967} {"train_loss": -37.3797492980957, "global_step": 117074, "epoch": 967} {"train_loss": -38.068267822265625, "global_step": 117075, "epoch": 967} {"train_loss": -37.85620880126953, "global_step": 117076, "epoch": 967} {"train_loss": -38.25684356689453, "global_step": 117077, "epoch": 967} {"train_loss": -37.62162399291992, "global_step": 117078, "epoch": 967} {"train_loss": -37.74503707885742, "global_step": 117079, "epoch": 967} {"train_loss": -37.620086669921875, "global_step": 117080, "epoch": 967} {"train_loss": -37.939239501953125, "global_step": 117081, "epoch": 967} {"train_loss": -36.518611907958984, "global_step": 117082, "epoch": 967} {"train_loss": -37.06990432739258, "global_step": 117083, "epoch": 967} {"train_loss": -37.48923873901367, "global_step": 117084, "epoch": 967} {"train_loss": -37.83012771606445, "global_step": 117085, "epoch": 967} {"train_loss": -37.888893127441406, "global_step": 117086, "epoch": 967} {"train_loss": -38.37787628173828, "global_step": 117087, "epoch": 967} {"train_loss": -37.9225959777832, "global_step": 117088, "epoch": 967} {"train_loss": -38.099239349365234, "global_step": 117089, "epoch": 967} {"train_loss": -38.08577346801758, "global_step": 117090, "epoch": 967} {"train_loss": -37.765342712402344, "global_step": 117091, "epoch": 967} {"train_loss": -38.207191467285156, "global_step": 117092, "epoch": 967} {"train_loss": -37.307228088378906, "global_step": 117093, "epoch": 967} {"train_loss": -37.657623291015625, "global_step": 117094, "epoch": 967} {"train_loss": -38.14707565307617, "global_step": 117095, "epoch": 967} {"train_loss": -38.09672164916992, "global_step": 117096, "epoch": 967} {"train_loss": -38.49901580810547, "global_step": 117097, "epoch": 967} {"train_loss": -38.25856399536133, "global_step": 117098, "epoch": 967} {"train_loss": -38.66120529174805, "global_step": 117099, "epoch": 967} {"train_loss": -38.63850402832031, "global_step": 117100, "epoch": 967} {"train_loss": -38.39439010620117, "global_step": 117101, "epoch": 967} {"train_loss": -38.742671966552734, "global_step": 117102, "epoch": 967} {"train_loss": -39.0098991394043, "global_step": 117103, "epoch": 967} {"train_loss": -34.96570587158203, "global_step": 117104, "epoch": 967} {"train_loss": -38.57268142700195, "global_step": 117105, "epoch": 967} {"train_loss": -38.4908447265625, "global_step": 117106, "epoch": 967} {"train_loss": -38.66810989379883, "global_step": 117107, "epoch": 967} {"train_loss": -38.01096725463867, "global_step": 117108, "epoch": 967} {"train_loss": -33.839576721191406, "global_step": 117109, "epoch": 967} {"train_loss": -38.45002365112305, "global_step": 117110, "epoch": 967} {"train_loss": -37.793514251708984, "global_step": 117111, "epoch": 967} {"train_loss": -37.52186965942383, "global_step": 117112, "epoch": 967} {"train_loss": -38.88686752319336, "global_step": 117113, "epoch": 967} {"train_loss": -33.30904006958008, "global_step": 117114, "epoch": 967} {"train_loss": -36.83028793334961, "global_step": 117115, "epoch": 967} {"train_loss": -38.3863639831543, "global_step": 117116, "epoch": 967} {"train_loss": -36.7928352355957, "global_step": 117117, "epoch": 967} {"train_loss": -35.74193572998047, "global_step": 117118, "epoch": 967} {"train_loss": -34.9034423828125, "global_step": 117119, "epoch": 967} {"train_loss": -37.61402130126953, "global_step": 117120, "epoch": 967} {"train_loss": -37.86086654663086, "global_step": 117121, "epoch": 967} {"train_loss": -37.577850341796875, "global_step": 117122, "epoch": 967} {"train_loss": -35.604305267333984, "global_step": 117123, "epoch": 967} {"train_loss": -38.291954040527344, "global_step": 117124, "epoch": 967} {"train_loss": -38.004817962646484, "global_step": 117125, "epoch": 967} {"train_loss": -38.66947555541992, "global_step": 117126, "epoch": 967} {"train_loss": -37.076615357201945, "global_step": 117127, "epoch": 967, "val_loss": 2963238.75} {"train_loss": -36.530914306640625, "global_step": 117128, "epoch": 968} {"train_loss": -37.897560119628906, "global_step": 117129, "epoch": 968} {"train_loss": -36.55083465576172, "global_step": 117130, "epoch": 968} {"train_loss": -37.18354797363281, "global_step": 117131, "epoch": 968} {"train_loss": -37.64768600463867, "global_step": 117132, "epoch": 968} {"train_loss": -38.23495101928711, "global_step": 117133, "epoch": 968} {"train_loss": -36.89460372924805, "global_step": 117134, "epoch": 968} {"train_loss": -38.5847282409668, "global_step": 117135, "epoch": 968} {"train_loss": -37.852317810058594, "global_step": 117136, "epoch": 968} {"train_loss": -38.50999069213867, "global_step": 117137, "epoch": 968} {"train_loss": -38.58331298828125, "global_step": 117138, "epoch": 968} {"train_loss": -38.6439094543457, "global_step": 117139, "epoch": 968} {"train_loss": -38.350189208984375, "global_step": 117140, "epoch": 968} {"train_loss": -38.62717819213867, "global_step": 117141, "epoch": 968} {"train_loss": -38.95060348510742, "global_step": 117142, "epoch": 968} {"train_loss": -38.765106201171875, "global_step": 117143, "epoch": 968} {"train_loss": -38.66970443725586, "global_step": 117144, "epoch": 968} {"train_loss": -39.04653549194336, "global_step": 117145, "epoch": 968} {"train_loss": -38.04749298095703, "global_step": 117146, "epoch": 968} {"train_loss": -38.38151550292969, "global_step": 117147, "epoch": 968} {"train_loss": -38.17361068725586, "global_step": 117148, "epoch": 968} {"train_loss": -37.691444396972656, "global_step": 117149, "epoch": 968} {"train_loss": -39.097328186035156, "global_step": 117150, "epoch": 968} {"train_loss": -38.15803527832031, "global_step": 117151, "epoch": 968} {"train_loss": -39.007301330566406, "global_step": 117152, "epoch": 968} {"train_loss": -38.543190002441406, "global_step": 117153, "epoch": 968} {"train_loss": -38.36261749267578, "global_step": 117154, "epoch": 968} {"train_loss": -39.105064392089844, "global_step": 117155, "epoch": 968} {"train_loss": -38.57049560546875, "global_step": 117156, "epoch": 968} {"train_loss": -38.59318923950195, "global_step": 117157, "epoch": 968} {"train_loss": -39.1246337890625, "global_step": 117158, "epoch": 968} {"train_loss": -37.99129867553711, "global_step": 117159, "epoch": 968} {"train_loss": -38.80760192871094, "global_step": 117160, "epoch": 968} {"train_loss": -39.10892868041992, "global_step": 117161, "epoch": 968} {"train_loss": -38.67915725708008, "global_step": 117162, "epoch": 968} {"train_loss": -39.30044174194336, "global_step": 117163, "epoch": 968} {"train_loss": -38.46572494506836, "global_step": 117164, "epoch": 968} {"train_loss": -38.852535247802734, "global_step": 117165, "epoch": 968} {"train_loss": -39.16859817504883, "global_step": 117166, "epoch": 968} {"train_loss": -38.75718307495117, "global_step": 117167, "epoch": 968} {"train_loss": -38.73197555541992, "global_step": 117168, "epoch": 968} {"train_loss": -38.06882095336914, "global_step": 117169, "epoch": 968} {"train_loss": -38.24355697631836, "global_step": 117170, "epoch": 968} {"train_loss": -36.751827239990234, "global_step": 117171, "epoch": 968} {"train_loss": -37.70162582397461, "global_step": 117172, "epoch": 968} {"train_loss": -38.99807357788086, "global_step": 117173, "epoch": 968} {"train_loss": -39.09493637084961, "global_step": 117174, "epoch": 968} {"train_loss": -38.855194091796875, "global_step": 117175, "epoch": 968} {"train_loss": -38.80189895629883, "global_step": 117176, "epoch": 968} {"train_loss": -38.809120178222656, "global_step": 117177, "epoch": 968} {"train_loss": -39.12934494018555, "global_step": 117178, "epoch": 968} {"train_loss": -39.05721664428711, "global_step": 117179, "epoch": 968} {"train_loss": -39.10921096801758, "global_step": 117180, "epoch": 968} {"train_loss": -37.31732177734375, "global_step": 117181, "epoch": 968} {"train_loss": -39.32748794555664, "global_step": 117182, "epoch": 968} {"train_loss": -38.68416213989258, "global_step": 117183, "epoch": 968} {"train_loss": -36.22945022583008, "global_step": 117184, "epoch": 968} {"train_loss": -38.839481353759766, "global_step": 117185, "epoch": 968} {"train_loss": -38.46326446533203, "global_step": 117186, "epoch": 968} {"train_loss": -38.84335708618164, "global_step": 117187, "epoch": 968} {"train_loss": -37.79963684082031, "global_step": 117188, "epoch": 968} {"train_loss": -37.7705078125, "global_step": 117189, "epoch": 968} {"train_loss": -39.022640228271484, "global_step": 117190, "epoch": 968} {"train_loss": -38.87481689453125, "global_step": 117191, "epoch": 968} {"train_loss": -38.482696533203125, "global_step": 117192, "epoch": 968} {"train_loss": -37.94206619262695, "global_step": 117193, "epoch": 968} {"train_loss": -37.41737365722656, "global_step": 117194, "epoch": 968} {"train_loss": -36.78984832763672, "global_step": 117195, "epoch": 968} {"train_loss": -38.727352142333984, "global_step": 117196, "epoch": 968} {"train_loss": -38.14118576049805, "global_step": 117197, "epoch": 968} {"train_loss": -35.30415725708008, "global_step": 117198, "epoch": 968} {"train_loss": -39.25448226928711, "global_step": 117199, "epoch": 968} {"train_loss": -38.98041915893555, "global_step": 117200, "epoch": 968} {"train_loss": -38.00211715698242, "global_step": 117201, "epoch": 968} {"train_loss": -38.39358139038086, "global_step": 117202, "epoch": 968} {"train_loss": -38.591529846191406, "global_step": 117203, "epoch": 968} {"train_loss": -38.48630905151367, "global_step": 117204, "epoch": 968} {"train_loss": -38.64282989501953, "global_step": 117205, "epoch": 968} {"train_loss": -38.50126266479492, "global_step": 117206, "epoch": 968} {"train_loss": -39.02588653564453, "global_step": 117207, "epoch": 968} {"train_loss": -37.42940902709961, "global_step": 117208, "epoch": 968} {"train_loss": -37.98173141479492, "global_step": 117209, "epoch": 968} {"train_loss": -38.18655776977539, "global_step": 117210, "epoch": 968} {"train_loss": -39.08553695678711, "global_step": 117211, "epoch": 968} {"train_loss": -39.38820266723633, "global_step": 117212, "epoch": 968} {"train_loss": -39.537052154541016, "global_step": 117213, "epoch": 968} {"train_loss": -39.02353286743164, "global_step": 117214, "epoch": 968} {"train_loss": -38.79511642456055, "global_step": 117215, "epoch": 968} {"train_loss": -39.14974594116211, "global_step": 117216, "epoch": 968} {"train_loss": -38.561256408691406, "global_step": 117217, "epoch": 968} {"train_loss": -39.13709259033203, "global_step": 117218, "epoch": 968} {"train_loss": -38.85944747924805, "global_step": 117219, "epoch": 968} {"train_loss": -39.6740837097168, "global_step": 117220, "epoch": 968} {"train_loss": -38.944183349609375, "global_step": 117221, "epoch": 968} {"train_loss": -39.43964385986328, "global_step": 117222, "epoch": 968} {"train_loss": -36.22214889526367, "global_step": 117223, "epoch": 968} {"train_loss": -38.81079864501953, "global_step": 117224, "epoch": 968} {"train_loss": -39.14578628540039, "global_step": 117225, "epoch": 968} {"train_loss": -38.87061309814453, "global_step": 117226, "epoch": 968} {"train_loss": -39.445980072021484, "global_step": 117227, "epoch": 968} {"train_loss": -39.31891632080078, "global_step": 117228, "epoch": 968} {"train_loss": -39.12665557861328, "global_step": 117229, "epoch": 968} {"train_loss": -38.12372970581055, "global_step": 117230, "epoch": 968} {"train_loss": -39.586666107177734, "global_step": 117231, "epoch": 968} {"train_loss": -39.30291748046875, "global_step": 117232, "epoch": 968} {"train_loss": -37.887733459472656, "global_step": 117233, "epoch": 968} {"train_loss": -38.61811447143555, "global_step": 117234, "epoch": 968} {"train_loss": -39.089111328125, "global_step": 117235, "epoch": 968} {"train_loss": -38.903236389160156, "global_step": 117236, "epoch": 968} {"train_loss": -38.9220085144043, "global_step": 117237, "epoch": 968} {"train_loss": -39.00217819213867, "global_step": 117238, "epoch": 968} {"train_loss": -38.658504486083984, "global_step": 117239, "epoch": 968} {"train_loss": -36.700523376464844, "global_step": 117240, "epoch": 968} {"train_loss": -38.7239990234375, "global_step": 117241, "epoch": 968} {"train_loss": -38.55592727661133, "global_step": 117242, "epoch": 968} {"train_loss": -36.56278991699219, "global_step": 117243, "epoch": 968} {"train_loss": -27.76656150817871, "global_step": 117244, "epoch": 968} {"train_loss": -36.6436882019043, "global_step": 117245, "epoch": 968} {"train_loss": -36.381500244140625, "global_step": 117246, "epoch": 968} {"train_loss": -30.769128799438477, "global_step": 117247, "epoch": 968} {"train_loss": -38.21767201699501, "global_step": 117248, "epoch": 968, "val_loss": 2746735.0} {"train_loss": -34.770347595214844, "global_step": 117249, "epoch": 969} {"train_loss": -25.397537231445312, "global_step": 117250, "epoch": 969} {"train_loss": -29.238605499267578, "global_step": 117251, "epoch": 969} {"train_loss": -33.076045989990234, "global_step": 117252, "epoch": 969} {"train_loss": -31.27943992614746, "global_step": 117253, "epoch": 969} {"train_loss": -30.645917892456055, "global_step": 117254, "epoch": 969} {"train_loss": -15.550219535827637, "global_step": 117255, "epoch": 969} {"train_loss": -29.385786056518555, "global_step": 117256, "epoch": 969} {"train_loss": -28.935230255126953, "global_step": 117257, "epoch": 969} {"train_loss": -30.182958602905273, "global_step": 117258, "epoch": 969} {"train_loss": -30.957035064697266, "global_step": 117259, "epoch": 969} {"train_loss": -31.628992080688477, "global_step": 117260, "epoch": 969} {"train_loss": -30.610437393188477, "global_step": 117261, "epoch": 969} {"train_loss": -31.366607666015625, "global_step": 117262, "epoch": 969} {"train_loss": -33.23028564453125, "global_step": 117263, "epoch": 969} {"train_loss": -34.1231803894043, "global_step": 117264, "epoch": 969} {"train_loss": -30.702335357666016, "global_step": 117265, "epoch": 969} {"train_loss": -33.24067306518555, "global_step": 117266, "epoch": 969} {"train_loss": -33.29875183105469, "global_step": 117267, "epoch": 969} {"train_loss": -34.353065490722656, "global_step": 117268, "epoch": 969} {"train_loss": -33.544708251953125, "global_step": 117269, "epoch": 969} {"train_loss": -34.549922943115234, "global_step": 117270, "epoch": 969} {"train_loss": -34.057289123535156, "global_step": 117271, "epoch": 969} {"train_loss": -33.2308349609375, "global_step": 117272, "epoch": 969} {"train_loss": -34.511016845703125, "global_step": 117273, "epoch": 969} {"train_loss": -32.9992561340332, "global_step": 117274, "epoch": 969} {"train_loss": -34.9005241394043, "global_step": 117275, "epoch": 969} {"train_loss": -34.8741340637207, "global_step": 117276, "epoch": 969} {"train_loss": -33.160301208496094, "global_step": 117277, "epoch": 969} {"train_loss": -34.245628356933594, "global_step": 117278, "epoch": 969} {"train_loss": -35.252071380615234, "global_step": 117279, "epoch": 969} {"train_loss": -35.87801742553711, "global_step": 117280, "epoch": 969} {"train_loss": -35.704952239990234, "global_step": 117281, "epoch": 969} {"train_loss": -36.1080436706543, "global_step": 117282, "epoch": 969} {"train_loss": -35.468807220458984, "global_step": 117283, "epoch": 969} {"train_loss": -35.36161422729492, "global_step": 117284, "epoch": 969} {"train_loss": -35.77569580078125, "global_step": 117285, "epoch": 969} {"train_loss": -35.052364349365234, "global_step": 117286, "epoch": 969} {"train_loss": -35.95720291137695, "global_step": 117287, "epoch": 969} {"train_loss": -35.78242111206055, "global_step": 117288, "epoch": 969} {"train_loss": -35.808509826660156, "global_step": 117289, "epoch": 969} {"train_loss": -36.053462982177734, "global_step": 117290, "epoch": 969} {"train_loss": -36.238243103027344, "global_step": 117291, "epoch": 969} {"train_loss": -35.645538330078125, "global_step": 117292, "epoch": 969} {"train_loss": -35.079769134521484, "global_step": 117293, "epoch": 969} {"train_loss": -36.152923583984375, "global_step": 117294, "epoch": 969} {"train_loss": -36.70965576171875, "global_step": 117295, "epoch": 969} {"train_loss": -36.084938049316406, "global_step": 117296, "epoch": 969} {"train_loss": -36.44777297973633, "global_step": 117297, "epoch": 969} {"train_loss": -36.71320724487305, "global_step": 117298, "epoch": 969} {"train_loss": -36.954158782958984, "global_step": 117299, "epoch": 969} {"train_loss": -36.889766693115234, "global_step": 117300, "epoch": 969} {"train_loss": -35.8408317565918, "global_step": 117301, "epoch": 969} {"train_loss": -36.84166717529297, "global_step": 117302, "epoch": 969} {"train_loss": -36.49797439575195, "global_step": 117303, "epoch": 969} {"train_loss": -36.69282531738281, "global_step": 117304, "epoch": 969} {"train_loss": -37.014381408691406, "global_step": 117305, "epoch": 969} {"train_loss": -37.10003662109375, "global_step": 117306, "epoch": 969} {"train_loss": -36.78970718383789, "global_step": 117307, "epoch": 969} {"train_loss": -36.93589782714844, "global_step": 117308, "epoch": 969} {"train_loss": -36.6939697265625, "global_step": 117309, "epoch": 969} {"train_loss": -37.32115936279297, "global_step": 117310, "epoch": 969} {"train_loss": -36.98027420043945, "global_step": 117311, "epoch": 969} {"train_loss": -37.29128646850586, "global_step": 117312, "epoch": 969} {"train_loss": -37.18646240234375, "global_step": 117313, "epoch": 969} {"train_loss": -37.655174255371094, "global_step": 117314, "epoch": 969} {"train_loss": -37.310359954833984, "global_step": 117315, "epoch": 969} {"train_loss": -37.51567459106445, "global_step": 117316, "epoch": 969} {"train_loss": -37.539485931396484, "global_step": 117317, "epoch": 969} {"train_loss": -37.69033432006836, "global_step": 117318, "epoch": 969} {"train_loss": -37.97370529174805, "global_step": 117319, "epoch": 969} {"train_loss": -37.73284912109375, "global_step": 117320, "epoch": 969} {"train_loss": -37.39176559448242, "global_step": 117321, "epoch": 969} {"train_loss": -37.34127426147461, "global_step": 117322, "epoch": 969} {"train_loss": -37.955928802490234, "global_step": 117323, "epoch": 969} {"train_loss": -37.93103790283203, "global_step": 117324, "epoch": 969} {"train_loss": -38.084102630615234, "global_step": 117325, "epoch": 969} {"train_loss": -37.701683044433594, "global_step": 117326, "epoch": 969} {"train_loss": -37.796363830566406, "global_step": 117327, "epoch": 969} {"train_loss": -37.787418365478516, "global_step": 117328, "epoch": 969} {"train_loss": -37.6396484375, "global_step": 117329, "epoch": 969} {"train_loss": -37.83887481689453, "global_step": 117330, "epoch": 969} {"train_loss": -38.23344802856445, "global_step": 117331, "epoch": 969} {"train_loss": -38.15015411376953, "global_step": 117332, "epoch": 969} {"train_loss": -38.365047454833984, "global_step": 117333, "epoch": 969} {"train_loss": -38.17750549316406, "global_step": 117334, "epoch": 969} {"train_loss": -37.84002685546875, "global_step": 117335, "epoch": 969} {"train_loss": -38.06684875488281, "global_step": 117336, "epoch": 969} {"train_loss": -38.300392150878906, "global_step": 117337, "epoch": 969} {"train_loss": -38.229801177978516, "global_step": 117338, "epoch": 969} {"train_loss": -38.48592758178711, "global_step": 117339, "epoch": 969} {"train_loss": -38.488887786865234, "global_step": 117340, "epoch": 969} {"train_loss": -38.71390914916992, "global_step": 117341, "epoch": 969} {"train_loss": -38.57149124145508, "global_step": 117342, "epoch": 969} {"train_loss": -38.24876022338867, "global_step": 117343, "epoch": 969} {"train_loss": -38.34366989135742, "global_step": 117344, "epoch": 969} {"train_loss": -37.89591598510742, "global_step": 117345, "epoch": 969} {"train_loss": -38.765037536621094, "global_step": 117346, "epoch": 969} {"train_loss": -38.646793365478516, "global_step": 117347, "epoch": 969} {"train_loss": -38.65122604370117, "global_step": 117348, "epoch": 969} {"train_loss": -38.800697326660156, "global_step": 117349, "epoch": 969} {"train_loss": -38.71299362182617, "global_step": 117350, "epoch": 969} {"train_loss": -38.723297119140625, "global_step": 117351, "epoch": 969} {"train_loss": -38.753299713134766, "global_step": 117352, "epoch": 969} {"train_loss": -38.8328742980957, "global_step": 117353, "epoch": 969} {"train_loss": -39.277618408203125, "global_step": 117354, "epoch": 969} {"train_loss": -38.62287521362305, "global_step": 117355, "epoch": 969} {"train_loss": -38.62775802612305, "global_step": 117356, "epoch": 969} {"train_loss": -38.66626739501953, "global_step": 117357, "epoch": 969} {"train_loss": -39.12179946899414, "global_step": 117358, "epoch": 969} {"train_loss": -39.11763381958008, "global_step": 117359, "epoch": 969} {"train_loss": -38.89284896850586, "global_step": 117360, "epoch": 969} {"train_loss": -39.1119384765625, "global_step": 117361, "epoch": 969} {"train_loss": -38.6589241027832, "global_step": 117362, "epoch": 969} {"train_loss": -39.2464599609375, "global_step": 117363, "epoch": 969} {"train_loss": -39.023616790771484, "global_step": 117364, "epoch": 969} {"train_loss": -39.228607177734375, "global_step": 117365, "epoch": 969} {"train_loss": -39.185523986816406, "global_step": 117366, "epoch": 969} {"train_loss": -39.37279510498047, "global_step": 117367, "epoch": 969} {"train_loss": -38.88199234008789, "global_step": 117368, "epoch": 969} {"train_loss": -36.12593317425941, "global_step": 117369, "epoch": 969, "val_loss": 2731096.75} {"train_loss": -38.79860305786133, "global_step": 117370, "epoch": 970} {"train_loss": -38.92486572265625, "global_step": 117371, "epoch": 970} {"train_loss": -38.373268127441406, "global_step": 117372, "epoch": 970} {"train_loss": -38.2454719543457, "global_step": 117373, "epoch": 970} {"train_loss": -39.173805236816406, "global_step": 117374, "epoch": 970} {"train_loss": -39.07179641723633, "global_step": 117375, "epoch": 970} {"train_loss": -38.72195053100586, "global_step": 117376, "epoch": 970} {"train_loss": -37.17539596557617, "global_step": 117377, "epoch": 970} {"train_loss": -36.8560676574707, "global_step": 117378, "epoch": 970} {"train_loss": -35.79719161987305, "global_step": 117379, "epoch": 970} {"train_loss": -35.84321975708008, "global_step": 117380, "epoch": 970} {"train_loss": -38.639461517333984, "global_step": 117381, "epoch": 970} {"train_loss": -37.430694580078125, "global_step": 117382, "epoch": 970} {"train_loss": -36.20807647705078, "global_step": 117383, "epoch": 970} {"train_loss": -36.794097900390625, "global_step": 117384, "epoch": 970} {"train_loss": -37.763057708740234, "global_step": 117385, "epoch": 970} {"train_loss": -38.74932861328125, "global_step": 117386, "epoch": 970} {"train_loss": -38.24494171142578, "global_step": 117387, "epoch": 970} {"train_loss": -37.95161056518555, "global_step": 117388, "epoch": 970} {"train_loss": -38.87824630737305, "global_step": 117389, "epoch": 970} {"train_loss": -37.87705612182617, "global_step": 117390, "epoch": 970} {"train_loss": -38.03290939331055, "global_step": 117391, "epoch": 970} {"train_loss": -38.92716598510742, "global_step": 117392, "epoch": 970} {"train_loss": -38.14234161376953, "global_step": 117393, "epoch": 970} {"train_loss": -37.794857025146484, "global_step": 117394, "epoch": 970} {"train_loss": -38.820716857910156, "global_step": 117395, "epoch": 970} {"train_loss": -37.83430480957031, "global_step": 117396, "epoch": 970} {"train_loss": -36.886566162109375, "global_step": 117397, "epoch": 970} {"train_loss": -37.9980583190918, "global_step": 117398, "epoch": 970} {"train_loss": -38.35344696044922, "global_step": 117399, "epoch": 970} {"train_loss": -38.86911392211914, "global_step": 117400, "epoch": 970} {"train_loss": -39.0, "global_step": 117401, "epoch": 970} {"train_loss": -38.61659622192383, "global_step": 117402, "epoch": 970} {"train_loss": -38.797462463378906, "global_step": 117403, "epoch": 970} {"train_loss": -38.37273025512695, "global_step": 117404, "epoch": 970} {"train_loss": -38.649497985839844, "global_step": 117405, "epoch": 970} {"train_loss": -37.78204345703125, "global_step": 117406, "epoch": 970} {"train_loss": -38.71009063720703, "global_step": 117407, "epoch": 970} {"train_loss": -39.6361198425293, "global_step": 117408, "epoch": 970} {"train_loss": -39.172462463378906, "global_step": 117409, "epoch": 970} {"train_loss": -38.35136413574219, "global_step": 117410, "epoch": 970} {"train_loss": -38.60335159301758, "global_step": 117411, "epoch": 970} {"train_loss": -39.260501861572266, "global_step": 117412, "epoch": 970} {"train_loss": -39.277191162109375, "global_step": 117413, "epoch": 970} {"train_loss": -38.73472595214844, "global_step": 117414, "epoch": 970} {"train_loss": -38.73838424682617, "global_step": 117415, "epoch": 970} {"train_loss": -38.66572189331055, "global_step": 117416, "epoch": 970} {"train_loss": -38.2055778503418, "global_step": 117417, "epoch": 970} {"train_loss": -38.161006927490234, "global_step": 117418, "epoch": 970} {"train_loss": -37.774330139160156, "global_step": 117419, "epoch": 970} {"train_loss": -38.818416595458984, "global_step": 117420, "epoch": 970} {"train_loss": -38.55123519897461, "global_step": 117421, "epoch": 970} {"train_loss": -36.99055099487305, "global_step": 117422, "epoch": 970} {"train_loss": -35.07778549194336, "global_step": 117423, "epoch": 970} {"train_loss": -35.871700286865234, "global_step": 117424, "epoch": 970} {"train_loss": -38.42214584350586, "global_step": 117425, "epoch": 970} {"train_loss": -39.26053237915039, "global_step": 117426, "epoch": 970} {"train_loss": -37.307594299316406, "global_step": 117427, "epoch": 970} {"train_loss": -35.876625061035156, "global_step": 117428, "epoch": 970} {"train_loss": -38.49384689331055, "global_step": 117429, "epoch": 970} {"train_loss": -37.52898025512695, "global_step": 117430, "epoch": 970} {"train_loss": -35.85163116455078, "global_step": 117431, "epoch": 970} {"train_loss": -38.74799728393555, "global_step": 117432, "epoch": 970} {"train_loss": -38.15925979614258, "global_step": 117433, "epoch": 970} {"train_loss": -36.9835090637207, "global_step": 117434, "epoch": 970} {"train_loss": -38.63739776611328, "global_step": 117435, "epoch": 970} {"train_loss": -37.1221923828125, "global_step": 117436, "epoch": 970} {"train_loss": -36.057952880859375, "global_step": 117437, "epoch": 970} {"train_loss": -38.0764274597168, "global_step": 117438, "epoch": 970} {"train_loss": -38.453826904296875, "global_step": 117439, "epoch": 970} {"train_loss": -37.45273208618164, "global_step": 117440, "epoch": 970} {"train_loss": -38.011024475097656, "global_step": 117441, "epoch": 970} {"train_loss": -38.760311126708984, "global_step": 117442, "epoch": 970} {"train_loss": -37.062042236328125, "global_step": 117443, "epoch": 970} {"train_loss": -38.470733642578125, "global_step": 117444, "epoch": 970} {"train_loss": -38.392574310302734, "global_step": 117445, "epoch": 970} {"train_loss": -37.82277297973633, "global_step": 117446, "epoch": 970} {"train_loss": -38.89105224609375, "global_step": 117447, "epoch": 970} {"train_loss": -37.79734420776367, "global_step": 117448, "epoch": 970} {"train_loss": -38.27317428588867, "global_step": 117449, "epoch": 970} {"train_loss": -37.03214645385742, "global_step": 117450, "epoch": 970} {"train_loss": -38.79398727416992, "global_step": 117451, "epoch": 970} {"train_loss": -38.12441635131836, "global_step": 117452, "epoch": 970} {"train_loss": -37.597694396972656, "global_step": 117453, "epoch": 970} {"train_loss": -38.46662521362305, "global_step": 117454, "epoch": 970} {"train_loss": -38.9276123046875, "global_step": 117455, "epoch": 970} {"train_loss": -38.288299560546875, "global_step": 117456, "epoch": 970} {"train_loss": -37.26168441772461, "global_step": 117457, "epoch": 970} {"train_loss": -37.653900146484375, "global_step": 117458, "epoch": 970} {"train_loss": -38.1865119934082, "global_step": 117459, "epoch": 970} {"train_loss": -38.759033203125, "global_step": 117460, "epoch": 970} {"train_loss": -37.99068832397461, "global_step": 117461, "epoch": 970} {"train_loss": -38.17897415161133, "global_step": 117462, "epoch": 970} {"train_loss": -38.507545471191406, "global_step": 117463, "epoch": 970} {"train_loss": -37.96036911010742, "global_step": 117464, "epoch": 970} {"train_loss": -38.98963165283203, "global_step": 117465, "epoch": 970} {"train_loss": -38.78414535522461, "global_step": 117466, "epoch": 970} {"train_loss": -38.79328155517578, "global_step": 117467, "epoch": 970} {"train_loss": -38.72511672973633, "global_step": 117468, "epoch": 970} {"train_loss": -38.602264404296875, "global_step": 117469, "epoch": 970} {"train_loss": -38.632606506347656, "global_step": 117470, "epoch": 970} {"train_loss": -37.151771545410156, "global_step": 117471, "epoch": 970} {"train_loss": -37.56294250488281, "global_step": 117472, "epoch": 970} {"train_loss": -37.90383529663086, "global_step": 117473, "epoch": 970} {"train_loss": -36.988460540771484, "global_step": 117474, "epoch": 970} {"train_loss": -36.5981330871582, "global_step": 117475, "epoch": 970} {"train_loss": -37.981876373291016, "global_step": 117476, "epoch": 970} {"train_loss": -37.70886993408203, "global_step": 117477, "epoch": 970} {"train_loss": -37.87813186645508, "global_step": 117478, "epoch": 970} {"train_loss": -38.28773880004883, "global_step": 117479, "epoch": 970} {"train_loss": -38.2868766784668, "global_step": 117480, "epoch": 970} {"train_loss": -38.2790641784668, "global_step": 117481, "epoch": 970} {"train_loss": -38.4750862121582, "global_step": 117482, "epoch": 970} {"train_loss": -38.098243713378906, "global_step": 117483, "epoch": 970} {"train_loss": -39.11268615722656, "global_step": 117484, "epoch": 970} {"train_loss": -37.46186828613281, "global_step": 117485, "epoch": 970} {"train_loss": -39.50361633300781, "global_step": 117486, "epoch": 970} {"train_loss": -39.50038528442383, "global_step": 117487, "epoch": 970} {"train_loss": -38.54879379272461, "global_step": 117488, "epoch": 970} {"train_loss": -37.4951171875, "global_step": 117489, "epoch": 970} {"train_loss": -38.0877238186923, "global_step": 117490, "epoch": 970, "val_loss": 2673807.75} {"train_loss": -38.69580078125, "global_step": 117491, "epoch": 971} {"train_loss": -39.43729782104492, "global_step": 117492, "epoch": 971} {"train_loss": -38.164207458496094, "global_step": 117493, "epoch": 971} {"train_loss": -37.06333541870117, "global_step": 117494, "epoch": 971} {"train_loss": -39.05658721923828, "global_step": 117495, "epoch": 971} {"train_loss": -38.16389083862305, "global_step": 117496, "epoch": 971} {"train_loss": -36.63485336303711, "global_step": 117497, "epoch": 971} {"train_loss": -35.00674057006836, "global_step": 117498, "epoch": 971} {"train_loss": -38.6496696472168, "global_step": 117499, "epoch": 971} {"train_loss": -37.1156120300293, "global_step": 117500, "epoch": 971} {"train_loss": -37.34385681152344, "global_step": 117501, "epoch": 971} {"train_loss": -34.753231048583984, "global_step": 117502, "epoch": 971} {"train_loss": -38.23624038696289, "global_step": 117503, "epoch": 971} {"train_loss": -38.10132598876953, "global_step": 117504, "epoch": 971} {"train_loss": -37.52595138549805, "global_step": 117505, "epoch": 971} {"train_loss": -37.04840087890625, "global_step": 117506, "epoch": 971} {"train_loss": -36.417293548583984, "global_step": 117507, "epoch": 971} {"train_loss": -38.12196731567383, "global_step": 117508, "epoch": 971} {"train_loss": -37.22945785522461, "global_step": 117509, "epoch": 971} {"train_loss": -35.44221115112305, "global_step": 117510, "epoch": 971} {"train_loss": -31.800207138061523, "global_step": 117511, "epoch": 971} {"train_loss": -36.64254379272461, "global_step": 117512, "epoch": 971} {"train_loss": -37.40922164916992, "global_step": 117513, "epoch": 971} {"train_loss": -37.5173225402832, "global_step": 117514, "epoch": 971} {"train_loss": -32.136940002441406, "global_step": 117515, "epoch": 971} {"train_loss": -37.76884841918945, "global_step": 117516, "epoch": 971} {"train_loss": -36.44425582885742, "global_step": 117517, "epoch": 971} {"train_loss": -32.80834197998047, "global_step": 117518, "epoch": 971} {"train_loss": -37.11183547973633, "global_step": 117519, "epoch": 971} {"train_loss": -36.72377395629883, "global_step": 117520, "epoch": 971} {"train_loss": -33.75746536254883, "global_step": 117521, "epoch": 971} {"train_loss": -35.27368927001953, "global_step": 117522, "epoch": 971} {"train_loss": -37.103755950927734, "global_step": 117523, "epoch": 971} {"train_loss": -31.609760284423828, "global_step": 117524, "epoch": 971} {"train_loss": -32.75020980834961, "global_step": 117525, "epoch": 971} {"train_loss": -35.541805267333984, "global_step": 117526, "epoch": 971} {"train_loss": -36.791595458984375, "global_step": 117527, "epoch": 971} {"train_loss": -36.86614990234375, "global_step": 117528, "epoch": 971} {"train_loss": -36.37799835205078, "global_step": 117529, "epoch": 971} {"train_loss": -33.92548370361328, "global_step": 117530, "epoch": 971} {"train_loss": -37.781280517578125, "global_step": 117531, "epoch": 971} {"train_loss": -36.254295349121094, "global_step": 117532, "epoch": 971} {"train_loss": -35.816341400146484, "global_step": 117533, "epoch": 971} {"train_loss": -35.37520217895508, "global_step": 117534, "epoch": 971} {"train_loss": -35.21468734741211, "global_step": 117535, "epoch": 971} {"train_loss": -36.7253532409668, "global_step": 117536, "epoch": 971} {"train_loss": -37.118736267089844, "global_step": 117537, "epoch": 971} {"train_loss": -35.5494270324707, "global_step": 117538, "epoch": 971} {"train_loss": -38.03361892700195, "global_step": 117539, "epoch": 971} {"train_loss": -37.1573600769043, "global_step": 117540, "epoch": 971} {"train_loss": -37.43406295776367, "global_step": 117541, "epoch": 971} {"train_loss": -37.05097579956055, "global_step": 117542, "epoch": 971} {"train_loss": -37.257503509521484, "global_step": 117543, "epoch": 971} {"train_loss": -37.965492248535156, "global_step": 117544, "epoch": 971} {"train_loss": -38.205013275146484, "global_step": 117545, "epoch": 971} {"train_loss": -36.817779541015625, "global_step": 117546, "epoch": 971} {"train_loss": -37.91463088989258, "global_step": 117547, "epoch": 971} {"train_loss": -37.87839889526367, "global_step": 117548, "epoch": 971} {"train_loss": -38.04909133911133, "global_step": 117549, "epoch": 971} {"train_loss": -37.582515716552734, "global_step": 117550, "epoch": 971} {"train_loss": -38.22096633911133, "global_step": 117551, "epoch": 971} {"train_loss": -38.111454010009766, "global_step": 117552, "epoch": 971} {"train_loss": -37.07036590576172, "global_step": 117553, "epoch": 971} {"train_loss": -38.07673263549805, "global_step": 117554, "epoch": 971} {"train_loss": -38.0044059753418, "global_step": 117555, "epoch": 971} {"train_loss": -38.137569427490234, "global_step": 117556, "epoch": 971} {"train_loss": -37.71993637084961, "global_step": 117557, "epoch": 971} {"train_loss": -38.56828689575195, "global_step": 117558, "epoch": 971} {"train_loss": -38.122352600097656, "global_step": 117559, "epoch": 971} {"train_loss": -38.40492630004883, "global_step": 117560, "epoch": 971} {"train_loss": -37.95941162109375, "global_step": 117561, "epoch": 971} {"train_loss": -38.290260314941406, "global_step": 117562, "epoch": 971} {"train_loss": -37.875064849853516, "global_step": 117563, "epoch": 971} {"train_loss": -38.17181396484375, "global_step": 117564, "epoch": 971} {"train_loss": -38.65204620361328, "global_step": 117565, "epoch": 971} {"train_loss": -38.27204895019531, "global_step": 117566, "epoch": 971} {"train_loss": -38.394752502441406, "global_step": 117567, "epoch": 971} {"train_loss": -38.60696029663086, "global_step": 117568, "epoch": 971} {"train_loss": -38.650787353515625, "global_step": 117569, "epoch": 971} {"train_loss": -38.5709114074707, "global_step": 117570, "epoch": 971} {"train_loss": -38.529541015625, "global_step": 117571, "epoch": 971} {"train_loss": -38.47200393676758, "global_step": 117572, "epoch": 971} {"train_loss": -38.83578109741211, "global_step": 117573, "epoch": 971} {"train_loss": -38.71848678588867, "global_step": 117574, "epoch": 971} {"train_loss": -38.7939567565918, "global_step": 117575, "epoch": 971} {"train_loss": -38.54209518432617, "global_step": 117576, "epoch": 971} {"train_loss": -39.019874572753906, "global_step": 117577, "epoch": 971} {"train_loss": -38.7280387878418, "global_step": 117578, "epoch": 971} {"train_loss": -38.87274932861328, "global_step": 117579, "epoch": 971} {"train_loss": -38.99785232543945, "global_step": 117580, "epoch": 971} {"train_loss": -37.93842697143555, "global_step": 117581, "epoch": 971} {"train_loss": -38.65192794799805, "global_step": 117582, "epoch": 971} {"train_loss": -38.92747116088867, "global_step": 117583, "epoch": 971} {"train_loss": -38.66850662231445, "global_step": 117584, "epoch": 971} {"train_loss": -38.53816604614258, "global_step": 117585, "epoch": 971} {"train_loss": -38.32872009277344, "global_step": 117586, "epoch": 971} {"train_loss": -37.88157272338867, "global_step": 117587, "epoch": 971} {"train_loss": -38.1050910949707, "global_step": 117588, "epoch": 971} {"train_loss": -37.222930908203125, "global_step": 117589, "epoch": 971} {"train_loss": -37.668670654296875, "global_step": 117590, "epoch": 971} {"train_loss": -38.80277633666992, "global_step": 117591, "epoch": 971} {"train_loss": -38.59867477416992, "global_step": 117592, "epoch": 971} {"train_loss": -38.243804931640625, "global_step": 117593, "epoch": 971} {"train_loss": -36.46351623535156, "global_step": 117594, "epoch": 971} {"train_loss": -35.13017272949219, "global_step": 117595, "epoch": 971} {"train_loss": -36.923702239990234, "global_step": 117596, "epoch": 971} {"train_loss": -38.69212341308594, "global_step": 117597, "epoch": 971} {"train_loss": -36.19357681274414, "global_step": 117598, "epoch": 971} {"train_loss": -33.04342269897461, "global_step": 117599, "epoch": 971} {"train_loss": -37.833465576171875, "global_step": 117600, "epoch": 971} {"train_loss": -39.159950256347656, "global_step": 117601, "epoch": 971} {"train_loss": -36.17153549194336, "global_step": 117602, "epoch": 971} {"train_loss": -37.502655029296875, "global_step": 117603, "epoch": 971} {"train_loss": -38.36886978149414, "global_step": 117604, "epoch": 971} {"train_loss": -37.73079299926758, "global_step": 117605, "epoch": 971} {"train_loss": -37.27460861206055, "global_step": 117606, "epoch": 971} {"train_loss": -37.200557708740234, "global_step": 117607, "epoch": 971} {"train_loss": -38.33457565307617, "global_step": 117608, "epoch": 971} {"train_loss": -37.320777893066406, "global_step": 117609, "epoch": 971} {"train_loss": -38.05805206298828, "global_step": 117610, "epoch": 971} {"train_loss": -37.29039371900322, "global_step": 117611, "epoch": 971, "val_loss": 2693444.75} {"train_loss": -35.30611801147461, "global_step": 117612, "epoch": 972} {"train_loss": -37.37977600097656, "global_step": 117613, "epoch": 972} {"train_loss": -35.383705139160156, "global_step": 117614, "epoch": 972} {"train_loss": -31.797760009765625, "global_step": 117615, "epoch": 972} {"train_loss": -32.89971923828125, "global_step": 117616, "epoch": 972} {"train_loss": -37.501625061035156, "global_step": 117617, "epoch": 972} {"train_loss": -37.068519592285156, "global_step": 117618, "epoch": 972} {"train_loss": -36.5606689453125, "global_step": 117619, "epoch": 972} {"train_loss": -35.606624603271484, "global_step": 117620, "epoch": 972} {"train_loss": -37.525569915771484, "global_step": 117621, "epoch": 972} {"train_loss": -37.58478927612305, "global_step": 117622, "epoch": 972} {"train_loss": -36.971412658691406, "global_step": 117623, "epoch": 972} {"train_loss": -36.979156494140625, "global_step": 117624, "epoch": 972} {"train_loss": -37.58222579956055, "global_step": 117625, "epoch": 972} {"train_loss": -37.52083969116211, "global_step": 117626, "epoch": 972} {"train_loss": -38.03984069824219, "global_step": 117627, "epoch": 972} {"train_loss": -36.92317581176758, "global_step": 117628, "epoch": 972} {"train_loss": -38.50869369506836, "global_step": 117629, "epoch": 972} {"train_loss": -38.40562057495117, "global_step": 117630, "epoch": 972} {"train_loss": -38.368072509765625, "global_step": 117631, "epoch": 972} {"train_loss": -38.894588470458984, "global_step": 117632, "epoch": 972} {"train_loss": -38.31324005126953, "global_step": 117633, "epoch": 972} {"train_loss": -38.433956146240234, "global_step": 117634, "epoch": 972} {"train_loss": -38.24976348876953, "global_step": 117635, "epoch": 972} {"train_loss": -38.17176818847656, "global_step": 117636, "epoch": 972} {"train_loss": -38.2747802734375, "global_step": 117637, "epoch": 972} {"train_loss": -38.686065673828125, "global_step": 117638, "epoch": 972} {"train_loss": -38.5184440612793, "global_step": 117639, "epoch": 972} {"train_loss": -38.365665435791016, "global_step": 117640, "epoch": 972} {"train_loss": -39.324562072753906, "global_step": 117641, "epoch": 972} {"train_loss": -38.681026458740234, "global_step": 117642, "epoch": 972} {"train_loss": -38.84614181518555, "global_step": 117643, "epoch": 972} {"train_loss": -39.12595748901367, "global_step": 117644, "epoch": 972} {"train_loss": -38.9898681640625, "global_step": 117645, "epoch": 972} {"train_loss": -39.39735794067383, "global_step": 117646, "epoch": 972} {"train_loss": -39.05952072143555, "global_step": 117647, "epoch": 972} {"train_loss": -39.168941497802734, "global_step": 117648, "epoch": 972} {"train_loss": -39.22201156616211, "global_step": 117649, "epoch": 972} {"train_loss": -39.494972229003906, "global_step": 117650, "epoch": 972} {"train_loss": -39.16437911987305, "global_step": 117651, "epoch": 972} {"train_loss": -39.53914260864258, "global_step": 117652, "epoch": 972} {"train_loss": -39.181575775146484, "global_step": 117653, "epoch": 972} {"train_loss": -38.94178009033203, "global_step": 117654, "epoch": 972} {"train_loss": -39.232975006103516, "global_step": 117655, "epoch": 972} {"train_loss": -39.38174819946289, "global_step": 117656, "epoch": 972} {"train_loss": -39.5768928527832, "global_step": 117657, "epoch": 972} {"train_loss": -39.81355667114258, "global_step": 117658, "epoch": 972} {"train_loss": -39.055580139160156, "global_step": 117659, "epoch": 972} {"train_loss": -39.6059684753418, "global_step": 117660, "epoch": 972} {"train_loss": -39.511348724365234, "global_step": 117661, "epoch": 972} {"train_loss": -38.86311721801758, "global_step": 117662, "epoch": 972} {"train_loss": -39.28035354614258, "global_step": 117663, "epoch": 972} {"train_loss": -39.48594284057617, "global_step": 117664, "epoch": 972} {"train_loss": -39.10610580444336, "global_step": 117665, "epoch": 972} {"train_loss": -39.68738555908203, "global_step": 117666, "epoch": 972} {"train_loss": -39.51473617553711, "global_step": 117667, "epoch": 972} {"train_loss": -40.13790512084961, "global_step": 117668, "epoch": 972} {"train_loss": -39.5749397277832, "global_step": 117669, "epoch": 972} {"train_loss": -35.93397521972656, "global_step": 117670, "epoch": 972} {"train_loss": -37.618927001953125, "global_step": 117671, "epoch": 972} {"train_loss": -36.12577438354492, "global_step": 117672, "epoch": 972} {"train_loss": -34.77483367919922, "global_step": 117673, "epoch": 972} {"train_loss": -38.56144332885742, "global_step": 117674, "epoch": 972} {"train_loss": -36.89751052856445, "global_step": 117675, "epoch": 972} {"train_loss": -35.0040397644043, "global_step": 117676, "epoch": 972} {"train_loss": -39.05910110473633, "global_step": 117677, "epoch": 972} {"train_loss": -37.326393127441406, "global_step": 117678, "epoch": 972} {"train_loss": -37.7243537902832, "global_step": 117679, "epoch": 972} {"train_loss": -38.34344482421875, "global_step": 117680, "epoch": 972} {"train_loss": -38.779937744140625, "global_step": 117681, "epoch": 972} {"train_loss": -39.06600570678711, "global_step": 117682, "epoch": 972} {"train_loss": -38.1196403503418, "global_step": 117683, "epoch": 972} {"train_loss": -38.35948181152344, "global_step": 117684, "epoch": 972} {"train_loss": -37.28340148925781, "global_step": 117685, "epoch": 972} {"train_loss": -36.36159133911133, "global_step": 117686, "epoch": 972} {"train_loss": -34.74723434448242, "global_step": 117687, "epoch": 972} {"train_loss": -35.057987213134766, "global_step": 117688, "epoch": 972} {"train_loss": -37.534523010253906, "global_step": 117689, "epoch": 972} {"train_loss": -33.56215286254883, "global_step": 117690, "epoch": 972} {"train_loss": -32.912349700927734, "global_step": 117691, "epoch": 972} {"train_loss": -38.0372200012207, "global_step": 117692, "epoch": 972} {"train_loss": -37.268001556396484, "global_step": 117693, "epoch": 972} {"train_loss": -36.61200714111328, "global_step": 117694, "epoch": 972} {"train_loss": -35.73969268798828, "global_step": 117695, "epoch": 972} {"train_loss": -37.042633056640625, "global_step": 117696, "epoch": 972} {"train_loss": -38.3979606628418, "global_step": 117697, "epoch": 972} {"train_loss": -38.55257797241211, "global_step": 117698, "epoch": 972} {"train_loss": -38.61513900756836, "global_step": 117699, "epoch": 972} {"train_loss": -39.14038848876953, "global_step": 117700, "epoch": 972} {"train_loss": -38.35578536987305, "global_step": 117701, "epoch": 972} {"train_loss": -38.88642501831055, "global_step": 117702, "epoch": 972} {"train_loss": -39.328826904296875, "global_step": 117703, "epoch": 972} {"train_loss": -38.719032287597656, "global_step": 117704, "epoch": 972} {"train_loss": -39.22166061401367, "global_step": 117705, "epoch": 972} {"train_loss": -37.943519592285156, "global_step": 117706, "epoch": 972} {"train_loss": -39.20094299316406, "global_step": 117707, "epoch": 972} {"train_loss": -38.82526779174805, "global_step": 117708, "epoch": 972} {"train_loss": -35.31061553955078, "global_step": 117709, "epoch": 972} {"train_loss": -39.076534271240234, "global_step": 117710, "epoch": 972} {"train_loss": -39.23286819458008, "global_step": 117711, "epoch": 972} {"train_loss": -39.37983322143555, "global_step": 117712, "epoch": 972} {"train_loss": -39.3253288269043, "global_step": 117713, "epoch": 972} {"train_loss": -39.15614318847656, "global_step": 117714, "epoch": 972} {"train_loss": -38.032569885253906, "global_step": 117715, "epoch": 972} {"train_loss": -39.32070541381836, "global_step": 117716, "epoch": 972} {"train_loss": -39.20530319213867, "global_step": 117717, "epoch": 972} {"train_loss": -37.8405876159668, "global_step": 117718, "epoch": 972} {"train_loss": -38.78985595703125, "global_step": 117719, "epoch": 972} {"train_loss": -38.68964767456055, "global_step": 117720, "epoch": 972} {"train_loss": -39.1682014465332, "global_step": 117721, "epoch": 972} {"train_loss": -38.7058219909668, "global_step": 117722, "epoch": 972} {"train_loss": -39.39749526977539, "global_step": 117723, "epoch": 972} {"train_loss": -39.11659240722656, "global_step": 117724, "epoch": 972} {"train_loss": -38.94468307495117, "global_step": 117725, "epoch": 972} {"train_loss": -38.64191818237305, "global_step": 117726, "epoch": 972} {"train_loss": -38.11709213256836, "global_step": 117727, "epoch": 972} {"train_loss": -39.08806610107422, "global_step": 117728, "epoch": 972} {"train_loss": -38.11714553833008, "global_step": 117729, "epoch": 972} {"train_loss": -38.04164505004883, "global_step": 117730, "epoch": 972} {"train_loss": -39.48752975463867, "global_step": 117731, "epoch": 972} {"train_loss": -38.08877617071483, "global_step": 117732, "epoch": 972, "val_loss": 2930490.75} {"train_loss": -39.64048385620117, "global_step": 117733, "epoch": 973} {"train_loss": -39.588016510009766, "global_step": 117734, "epoch": 973} {"train_loss": -39.8094596862793, "global_step": 117735, "epoch": 973} {"train_loss": -39.22429275512695, "global_step": 117736, "epoch": 973} {"train_loss": -39.713348388671875, "global_step": 117737, "epoch": 973} {"train_loss": -39.71514892578125, "global_step": 117738, "epoch": 973} {"train_loss": -39.662864685058594, "global_step": 117739, "epoch": 973} {"train_loss": -40.00188064575195, "global_step": 117740, "epoch": 973} {"train_loss": -39.24403762817383, "global_step": 117741, "epoch": 973} {"train_loss": -38.50623321533203, "global_step": 117742, "epoch": 973} {"train_loss": -40.22035217285156, "global_step": 117743, "epoch": 973} {"train_loss": -39.63349151611328, "global_step": 117744, "epoch": 973} {"train_loss": -39.67354965209961, "global_step": 117745, "epoch": 973} {"train_loss": -40.04097366333008, "global_step": 117746, "epoch": 973} {"train_loss": -39.24199295043945, "global_step": 117747, "epoch": 973} {"train_loss": -39.654170989990234, "global_step": 117748, "epoch": 973} {"train_loss": -39.49265670776367, "global_step": 117749, "epoch": 973} {"train_loss": -38.488582611083984, "global_step": 117750, "epoch": 973} {"train_loss": -37.655860900878906, "global_step": 117751, "epoch": 973} {"train_loss": -31.410261154174805, "global_step": 117752, "epoch": 973} {"train_loss": -18.465518951416016, "global_step": 117753, "epoch": 973} {"train_loss": -4.122186183929443, "global_step": 117754, "epoch": 973} {"train_loss": -27.233261108398438, "global_step": 117755, "epoch": 973} {"train_loss": -34.43336486816406, "global_step": 117756, "epoch": 973} {"train_loss": -22.678590774536133, "global_step": 117757, "epoch": 973} {"train_loss": -36.121280670166016, "global_step": 117758, "epoch": 973} {"train_loss": -24.0202693939209, "global_step": 117759, "epoch": 973} {"train_loss": -37.88386154174805, "global_step": 117760, "epoch": 973} {"train_loss": -29.686338424682617, "global_step": 117761, "epoch": 973} {"train_loss": -36.93657302856445, "global_step": 117762, "epoch": 973} {"train_loss": -34.46848678588867, "global_step": 117763, "epoch": 973} {"train_loss": -32.534339904785156, "global_step": 117764, "epoch": 973} {"train_loss": -37.179256439208984, "global_step": 117765, "epoch": 973} {"train_loss": -34.85155487060547, "global_step": 117766, "epoch": 973} {"train_loss": -36.17843246459961, "global_step": 117767, "epoch": 973} {"train_loss": -37.51230239868164, "global_step": 117768, "epoch": 973} {"train_loss": -36.59485626220703, "global_step": 117769, "epoch": 973} {"train_loss": -36.2381477355957, "global_step": 117770, "epoch": 973} {"train_loss": -38.53683090209961, "global_step": 117771, "epoch": 973} {"train_loss": -35.916255950927734, "global_step": 117772, "epoch": 973} {"train_loss": -37.15841293334961, "global_step": 117773, "epoch": 973} {"train_loss": -37.86662673950195, "global_step": 117774, "epoch": 973} {"train_loss": -37.94972610473633, "global_step": 117775, "epoch": 973} {"train_loss": -37.31949996948242, "global_step": 117776, "epoch": 973} {"train_loss": -38.36088943481445, "global_step": 117777, "epoch": 973} {"train_loss": -38.4911994934082, "global_step": 117778, "epoch": 973} {"train_loss": -37.88664627075195, "global_step": 117779, "epoch": 973} {"train_loss": -38.23169708251953, "global_step": 117780, "epoch": 973} {"train_loss": -38.71480941772461, "global_step": 117781, "epoch": 973} {"train_loss": -38.9019660949707, "global_step": 117782, "epoch": 973} {"train_loss": -38.53430938720703, "global_step": 117783, "epoch": 973} {"train_loss": -38.068115234375, "global_step": 117784, "epoch": 973} {"train_loss": -39.1461067199707, "global_step": 117785, "epoch": 973} {"train_loss": -38.83203125, "global_step": 117786, "epoch": 973} {"train_loss": -38.71824645996094, "global_step": 117787, "epoch": 973} {"train_loss": -38.996856689453125, "global_step": 117788, "epoch": 973} {"train_loss": -39.0128288269043, "global_step": 117789, "epoch": 973} {"train_loss": -38.85305404663086, "global_step": 117790, "epoch": 973} {"train_loss": -38.38282012939453, "global_step": 117791, "epoch": 973} {"train_loss": -38.37543869018555, "global_step": 117792, "epoch": 973} {"train_loss": -38.87353515625, "global_step": 117793, "epoch": 973} {"train_loss": -37.9320182800293, "global_step": 117794, "epoch": 973} {"train_loss": -39.1248779296875, "global_step": 117795, "epoch": 973} {"train_loss": -39.01443099975586, "global_step": 117796, "epoch": 973} {"train_loss": -38.92134475708008, "global_step": 117797, "epoch": 973} {"train_loss": -39.175777435302734, "global_step": 117798, "epoch": 973} {"train_loss": -39.16401290893555, "global_step": 117799, "epoch": 973} {"train_loss": -38.99410629272461, "global_step": 117800, "epoch": 973} {"train_loss": -38.7519645690918, "global_step": 117801, "epoch": 973} {"train_loss": -39.56989669799805, "global_step": 117802, "epoch": 973} {"train_loss": -38.580543518066406, "global_step": 117803, "epoch": 973} {"train_loss": -39.368865966796875, "global_step": 117804, "epoch": 973} {"train_loss": -39.39535140991211, "global_step": 117805, "epoch": 973} {"train_loss": -39.414852142333984, "global_step": 117806, "epoch": 973} {"train_loss": -38.90714645385742, "global_step": 117807, "epoch": 973} {"train_loss": -39.06144332885742, "global_step": 117808, "epoch": 973} {"train_loss": -39.48134994506836, "global_step": 117809, "epoch": 973} {"train_loss": -39.23409652709961, "global_step": 117810, "epoch": 973} {"train_loss": -39.54698944091797, "global_step": 117811, "epoch": 973} {"train_loss": -39.21009063720703, "global_step": 117812, "epoch": 973} {"train_loss": -39.38108825683594, "global_step": 117813, "epoch": 973} {"train_loss": -39.46688461303711, "global_step": 117814, "epoch": 973} {"train_loss": -39.933528900146484, "global_step": 117815, "epoch": 973} {"train_loss": -39.79743576049805, "global_step": 117816, "epoch": 973} {"train_loss": -39.61204147338867, "global_step": 117817, "epoch": 973} {"train_loss": -39.14002227783203, "global_step": 117818, "epoch": 973} {"train_loss": -39.15134811401367, "global_step": 117819, "epoch": 973} {"train_loss": -39.71348190307617, "global_step": 117820, "epoch": 973} {"train_loss": -37.38483810424805, "global_step": 117821, "epoch": 973} {"train_loss": -39.4463996887207, "global_step": 117822, "epoch": 973} {"train_loss": -39.32584762573242, "global_step": 117823, "epoch": 973} {"train_loss": -39.960079193115234, "global_step": 117824, "epoch": 973} {"train_loss": -39.692718505859375, "global_step": 117825, "epoch": 973} {"train_loss": -37.237518310546875, "global_step": 117826, "epoch": 973} {"train_loss": -39.29342269897461, "global_step": 117827, "epoch": 973} {"train_loss": -39.26975631713867, "global_step": 117828, "epoch": 973} {"train_loss": -39.21599197387695, "global_step": 117829, "epoch": 973} {"train_loss": -38.14005661010742, "global_step": 117830, "epoch": 973} {"train_loss": -36.67886734008789, "global_step": 117831, "epoch": 973} {"train_loss": -30.553852081298828, "global_step": 117832, "epoch": 973} {"train_loss": -29.559858322143555, "global_step": 117833, "epoch": 973} {"train_loss": -32.11420440673828, "global_step": 117834, "epoch": 973} {"train_loss": -37.77975082397461, "global_step": 117835, "epoch": 973} {"train_loss": -34.78520584106445, "global_step": 117836, "epoch": 973} {"train_loss": -27.439985275268555, "global_step": 117837, "epoch": 973} {"train_loss": -33.64154815673828, "global_step": 117838, "epoch": 973} {"train_loss": -38.39960861206055, "global_step": 117839, "epoch": 973} {"train_loss": -32.55221176147461, "global_step": 117840, "epoch": 973} {"train_loss": -38.49176025390625, "global_step": 117841, "epoch": 973} {"train_loss": -32.53995132446289, "global_step": 117842, "epoch": 973} {"train_loss": -34.583560943603516, "global_step": 117843, "epoch": 973} {"train_loss": -34.3282585144043, "global_step": 117844, "epoch": 973} {"train_loss": -26.34136962890625, "global_step": 117845, "epoch": 973} {"train_loss": -36.31145095825195, "global_step": 117846, "epoch": 973} {"train_loss": -34.520931243896484, "global_step": 117847, "epoch": 973} {"train_loss": -34.20038986206055, "global_step": 117848, "epoch": 973} {"train_loss": -30.711462020874023, "global_step": 117849, "epoch": 973} {"train_loss": -32.9130973815918, "global_step": 117850, "epoch": 973} {"train_loss": -32.91419219970703, "global_step": 117851, "epoch": 973} {"train_loss": -35.15538024902344, "global_step": 117852, "epoch": 973} {"train_loss": -36.65382388012468, "global_step": 117853, "epoch": 973, "val_loss": 4222491.5} {"train_loss": -31.326339721679688, "global_step": 117854, "epoch": 974} {"train_loss": -30.773141860961914, "global_step": 117855, "epoch": 974} {"train_loss": -34.845237731933594, "global_step": 117856, "epoch": 974} {"train_loss": -34.295074462890625, "global_step": 117857, "epoch": 974} {"train_loss": -34.67275619506836, "global_step": 117858, "epoch": 974} {"train_loss": -32.53981018066406, "global_step": 117859, "epoch": 974} {"train_loss": -30.673192977905273, "global_step": 117860, "epoch": 974} {"train_loss": -35.38013458251953, "global_step": 117861, "epoch": 974} {"train_loss": -34.45920181274414, "global_step": 117862, "epoch": 974} {"train_loss": -34.503658294677734, "global_step": 117863, "epoch": 974} {"train_loss": -32.406158447265625, "global_step": 117864, "epoch": 974} {"train_loss": -33.94047164916992, "global_step": 117865, "epoch": 974} {"train_loss": -34.378334045410156, "global_step": 117866, "epoch": 974} {"train_loss": -35.62726593017578, "global_step": 117867, "epoch": 974} {"train_loss": -35.752647399902344, "global_step": 117868, "epoch": 974} {"train_loss": -34.562591552734375, "global_step": 117869, "epoch": 974} {"train_loss": -33.614288330078125, "global_step": 117870, "epoch": 974} {"train_loss": -31.19272804260254, "global_step": 117871, "epoch": 974} {"train_loss": -35.73387145996094, "global_step": 117872, "epoch": 974} {"train_loss": -35.05436325073242, "global_step": 117873, "epoch": 974} {"train_loss": -31.696561813354492, "global_step": 117874, "epoch": 974} {"train_loss": -35.995914459228516, "global_step": 117875, "epoch": 974} {"train_loss": -34.553871154785156, "global_step": 117876, "epoch": 974} {"train_loss": -35.9235954284668, "global_step": 117877, "epoch": 974} {"train_loss": -35.46784591674805, "global_step": 117878, "epoch": 974} {"train_loss": -35.59652328491211, "global_step": 117879, "epoch": 974} {"train_loss": -35.859710693359375, "global_step": 117880, "epoch": 974} {"train_loss": -34.18739700317383, "global_step": 117881, "epoch": 974} {"train_loss": -35.9013786315918, "global_step": 117882, "epoch": 974} {"train_loss": -35.59891891479492, "global_step": 117883, "epoch": 974} {"train_loss": -35.85592269897461, "global_step": 117884, "epoch": 974} {"train_loss": -35.874595642089844, "global_step": 117885, "epoch": 974} {"train_loss": -35.49858474731445, "global_step": 117886, "epoch": 974} {"train_loss": -36.312591552734375, "global_step": 117887, "epoch": 974} {"train_loss": -35.168731689453125, "global_step": 117888, "epoch": 974} {"train_loss": -35.4487190246582, "global_step": 117889, "epoch": 974} {"train_loss": -36.2252197265625, "global_step": 117890, "epoch": 974} {"train_loss": -36.909271240234375, "global_step": 117891, "epoch": 974} {"train_loss": -36.9886360168457, "global_step": 117892, "epoch": 974} {"train_loss": -36.78623580932617, "global_step": 117893, "epoch": 974} {"train_loss": -36.78304672241211, "global_step": 117894, "epoch": 974} {"train_loss": -37.00440216064453, "global_step": 117895, "epoch": 974} {"train_loss": -36.9819450378418, "global_step": 117896, "epoch": 974} {"train_loss": -37.11884689331055, "global_step": 117897, "epoch": 974} {"train_loss": -35.489192962646484, "global_step": 117898, "epoch": 974} {"train_loss": -36.022457122802734, "global_step": 117899, "epoch": 974} {"train_loss": -36.20748519897461, "global_step": 117900, "epoch": 974} {"train_loss": -36.7698860168457, "global_step": 117901, "epoch": 974} {"train_loss": -37.14381790161133, "global_step": 117902, "epoch": 974} {"train_loss": -37.039886474609375, "global_step": 117903, "epoch": 974} {"train_loss": -35.83175277709961, "global_step": 117904, "epoch": 974} {"train_loss": -37.3111457824707, "global_step": 117905, "epoch": 974} {"train_loss": -35.82719039916992, "global_step": 117906, "epoch": 974} {"train_loss": -37.034236907958984, "global_step": 117907, "epoch": 974} {"train_loss": -37.365692138671875, "global_step": 117908, "epoch": 974} {"train_loss": -37.197235107421875, "global_step": 117909, "epoch": 974} {"train_loss": -36.89199447631836, "global_step": 117910, "epoch": 974} {"train_loss": -37.1069221496582, "global_step": 117911, "epoch": 974} {"train_loss": -37.31840515136719, "global_step": 117912, "epoch": 974} {"train_loss": -37.489192962646484, "global_step": 117913, "epoch": 974} {"train_loss": -37.81687545776367, "global_step": 117914, "epoch": 974} {"train_loss": -36.72153091430664, "global_step": 117915, "epoch": 974} {"train_loss": -37.66249465942383, "global_step": 117916, "epoch": 974} {"train_loss": -37.195377349853516, "global_step": 117917, "epoch": 974} {"train_loss": -37.3614501953125, "global_step": 117918, "epoch": 974} {"train_loss": -37.16102981567383, "global_step": 117919, "epoch": 974} {"train_loss": -37.50287628173828, "global_step": 117920, "epoch": 974} {"train_loss": -37.40131378173828, "global_step": 117921, "epoch": 974} {"train_loss": -37.570343017578125, "global_step": 117922, "epoch": 974} {"train_loss": -36.69709396362305, "global_step": 117923, "epoch": 974} {"train_loss": -37.68441390991211, "global_step": 117924, "epoch": 974} {"train_loss": -37.48373031616211, "global_step": 117925, "epoch": 974} {"train_loss": -37.26570129394531, "global_step": 117926, "epoch": 974} {"train_loss": -37.891414642333984, "global_step": 117927, "epoch": 974} {"train_loss": -37.982757568359375, "global_step": 117928, "epoch": 974} {"train_loss": -37.903377532958984, "global_step": 117929, "epoch": 974} {"train_loss": -37.56956100463867, "global_step": 117930, "epoch": 974} {"train_loss": -37.940608978271484, "global_step": 117931, "epoch": 974} {"train_loss": -37.6864013671875, "global_step": 117932, "epoch": 974} {"train_loss": -38.197845458984375, "global_step": 117933, "epoch": 974} {"train_loss": -37.811649322509766, "global_step": 117934, "epoch": 974} {"train_loss": -37.90361404418945, "global_step": 117935, "epoch": 974} {"train_loss": -37.8328971862793, "global_step": 117936, "epoch": 974} {"train_loss": -37.864620208740234, "global_step": 117937, "epoch": 974} {"train_loss": -37.9907112121582, "global_step": 117938, "epoch": 974} {"train_loss": -38.118682861328125, "global_step": 117939, "epoch": 974} {"train_loss": -38.05207443237305, "global_step": 117940, "epoch": 974} {"train_loss": -38.641963958740234, "global_step": 117941, "epoch": 974} {"train_loss": -38.170738220214844, "global_step": 117942, "epoch": 974} {"train_loss": -38.27018356323242, "global_step": 117943, "epoch": 974} {"train_loss": -36.794830322265625, "global_step": 117944, "epoch": 974} {"train_loss": -37.97829818725586, "global_step": 117945, "epoch": 974} {"train_loss": -38.560726165771484, "global_step": 117946, "epoch": 974} {"train_loss": -38.2614631652832, "global_step": 117947, "epoch": 974} {"train_loss": -38.4731330871582, "global_step": 117948, "epoch": 974} {"train_loss": -38.22803497314453, "global_step": 117949, "epoch": 974} {"train_loss": -38.66661834716797, "global_step": 117950, "epoch": 974} {"train_loss": -38.2752685546875, "global_step": 117951, "epoch": 974} {"train_loss": -37.91718673706055, "global_step": 117952, "epoch": 974} {"train_loss": -38.38068771362305, "global_step": 117953, "epoch": 974} {"train_loss": -38.723506927490234, "global_step": 117954, "epoch": 974} {"train_loss": -37.31277084350586, "global_step": 117955, "epoch": 974} {"train_loss": -38.4002799987793, "global_step": 117956, "epoch": 974} {"train_loss": -38.520626068115234, "global_step": 117957, "epoch": 974} {"train_loss": -38.75216293334961, "global_step": 117958, "epoch": 974} {"train_loss": -38.645965576171875, "global_step": 117959, "epoch": 974} {"train_loss": -37.687129974365234, "global_step": 117960, "epoch": 974} {"train_loss": -38.3236083984375, "global_step": 117961, "epoch": 974} {"train_loss": -38.26176071166992, "global_step": 117962, "epoch": 974} {"train_loss": -38.76902389526367, "global_step": 117963, "epoch": 974} {"train_loss": -39.14306640625, "global_step": 117964, "epoch": 974} {"train_loss": -37.69538116455078, "global_step": 117965, "epoch": 974} {"train_loss": -38.45469284057617, "global_step": 117966, "epoch": 974} {"train_loss": -38.58802032470703, "global_step": 117967, "epoch": 974} {"train_loss": -38.2244758605957, "global_step": 117968, "epoch": 974} {"train_loss": -38.64424133300781, "global_step": 117969, "epoch": 974} {"train_loss": -38.45541763305664, "global_step": 117970, "epoch": 974} {"train_loss": -38.045204162597656, "global_step": 117971, "epoch": 974} {"train_loss": -36.5665397644043, "global_step": 117972, "epoch": 974} {"train_loss": -34.93754577636719, "global_step": 117973, "epoch": 974} {"train_loss": -36.66018843847858, "global_step": 117974, "epoch": 974, "val_loss": 2746476.75} {"train_loss": -34.67041778564453, "global_step": 117975, "epoch": 975} {"train_loss": -36.135215759277344, "global_step": 117976, "epoch": 975} {"train_loss": -37.83197784423828, "global_step": 117977, "epoch": 975} {"train_loss": -36.17023468017578, "global_step": 117978, "epoch": 975} {"train_loss": -36.70259475708008, "global_step": 117979, "epoch": 975} {"train_loss": -33.623382568359375, "global_step": 117980, "epoch": 975} {"train_loss": -35.658443450927734, "global_step": 117981, "epoch": 975} {"train_loss": -37.134971618652344, "global_step": 117982, "epoch": 975} {"train_loss": -38.26884078979492, "global_step": 117983, "epoch": 975} {"train_loss": -35.33136749267578, "global_step": 117984, "epoch": 975} {"train_loss": -38.126380920410156, "global_step": 117985, "epoch": 975} {"train_loss": -38.004478454589844, "global_step": 117986, "epoch": 975} {"train_loss": -37.81073760986328, "global_step": 117987, "epoch": 975} {"train_loss": -38.482051849365234, "global_step": 117988, "epoch": 975} {"train_loss": -37.62632369995117, "global_step": 117989, "epoch": 975} {"train_loss": -37.70610809326172, "global_step": 117990, "epoch": 975} {"train_loss": -37.8460693359375, "global_step": 117991, "epoch": 975} {"train_loss": -37.20014572143555, "global_step": 117992, "epoch": 975} {"train_loss": -37.71946334838867, "global_step": 117993, "epoch": 975} {"train_loss": -38.297447204589844, "global_step": 117994, "epoch": 975} {"train_loss": -38.1363410949707, "global_step": 117995, "epoch": 975} {"train_loss": -38.116634368896484, "global_step": 117996, "epoch": 975} {"train_loss": -38.04409408569336, "global_step": 117997, "epoch": 975} {"train_loss": -37.9893684387207, "global_step": 117998, "epoch": 975} {"train_loss": -37.6483154296875, "global_step": 117999, "epoch": 975} {"train_loss": -38.48450469970703, "global_step": 118000, "epoch": 975} {"train_loss": -37.92478942871094, "global_step": 118001, "epoch": 975} {"train_loss": -37.63869094848633, "global_step": 118002, "epoch": 975} {"train_loss": -38.03126525878906, "global_step": 118003, "epoch": 975} {"train_loss": -37.725948333740234, "global_step": 118004, "epoch": 975} {"train_loss": -37.49637985229492, "global_step": 118005, "epoch": 975} {"train_loss": -37.23795700073242, "global_step": 118006, "epoch": 975} {"train_loss": -37.77906799316406, "global_step": 118007, "epoch": 975} {"train_loss": -38.357242584228516, "global_step": 118008, "epoch": 975} {"train_loss": -36.38513946533203, "global_step": 118009, "epoch": 975} {"train_loss": -38.060787200927734, "global_step": 118010, "epoch": 975} {"train_loss": -38.52116775512695, "global_step": 118011, "epoch": 975} {"train_loss": -38.048152923583984, "global_step": 118012, "epoch": 975} {"train_loss": -37.5972785949707, "global_step": 118013, "epoch": 975} {"train_loss": -38.408058166503906, "global_step": 118014, "epoch": 975} {"train_loss": -38.10603713989258, "global_step": 118015, "epoch": 975} {"train_loss": -39.067386627197266, "global_step": 118016, "epoch": 975} {"train_loss": -38.42142105102539, "global_step": 118017, "epoch": 975} {"train_loss": -38.814781188964844, "global_step": 118018, "epoch": 975} {"train_loss": -38.15662384033203, "global_step": 118019, "epoch": 975} {"train_loss": -39.42325973510742, "global_step": 118020, "epoch": 975} {"train_loss": -38.6168327331543, "global_step": 118021, "epoch": 975} {"train_loss": -38.460731506347656, "global_step": 118022, "epoch": 975} {"train_loss": -37.696044921875, "global_step": 118023, "epoch": 975} {"train_loss": -39.341678619384766, "global_step": 118024, "epoch": 975} {"train_loss": -39.02802276611328, "global_step": 118025, "epoch": 975} {"train_loss": -38.848854064941406, "global_step": 118026, "epoch": 975} {"train_loss": -38.89058303833008, "global_step": 118027, "epoch": 975} {"train_loss": -38.75242233276367, "global_step": 118028, "epoch": 975} {"train_loss": -38.81496810913086, "global_step": 118029, "epoch": 975} {"train_loss": -39.18891525268555, "global_step": 118030, "epoch": 975} {"train_loss": -39.43937301635742, "global_step": 118031, "epoch": 975} {"train_loss": -38.47622299194336, "global_step": 118032, "epoch": 975} {"train_loss": -39.13750457763672, "global_step": 118033, "epoch": 975} {"train_loss": -38.93292999267578, "global_step": 118034, "epoch": 975} {"train_loss": -38.795833587646484, "global_step": 118035, "epoch": 975} {"train_loss": -39.21135330200195, "global_step": 118036, "epoch": 975} {"train_loss": -39.40373611450195, "global_step": 118037, "epoch": 975} {"train_loss": -39.33026123046875, "global_step": 118038, "epoch": 975} {"train_loss": -39.35954284667969, "global_step": 118039, "epoch": 975} {"train_loss": -39.61680221557617, "global_step": 118040, "epoch": 975} {"train_loss": -39.3455810546875, "global_step": 118041, "epoch": 975} {"train_loss": -39.0677490234375, "global_step": 118042, "epoch": 975} {"train_loss": -38.9803352355957, "global_step": 118043, "epoch": 975} {"train_loss": -38.90327072143555, "global_step": 118044, "epoch": 975} {"train_loss": -39.348907470703125, "global_step": 118045, "epoch": 975} {"train_loss": -39.34952926635742, "global_step": 118046, "epoch": 975} {"train_loss": -39.018714904785156, "global_step": 118047, "epoch": 975} {"train_loss": -39.34275436401367, "global_step": 118048, "epoch": 975} {"train_loss": -39.255001068115234, "global_step": 118049, "epoch": 975} {"train_loss": -38.92323303222656, "global_step": 118050, "epoch": 975} {"train_loss": -39.14809799194336, "global_step": 118051, "epoch": 975} {"train_loss": -37.78022384643555, "global_step": 118052, "epoch": 975} {"train_loss": -39.05195617675781, "global_step": 118053, "epoch": 975} {"train_loss": -39.2707633972168, "global_step": 118054, "epoch": 975} {"train_loss": -39.33858108520508, "global_step": 118055, "epoch": 975} {"train_loss": -38.10648727416992, "global_step": 118056, "epoch": 975} {"train_loss": -38.65088653564453, "global_step": 118057, "epoch": 975} {"train_loss": -36.277584075927734, "global_step": 118058, "epoch": 975} {"train_loss": -36.642879486083984, "global_step": 118059, "epoch": 975} {"train_loss": -38.16884231567383, "global_step": 118060, "epoch": 975} {"train_loss": -37.76223373413086, "global_step": 118061, "epoch": 975} {"train_loss": -39.03139114379883, "global_step": 118062, "epoch": 975} {"train_loss": -37.868316650390625, "global_step": 118063, "epoch": 975} {"train_loss": -38.18783187866211, "global_step": 118064, "epoch": 975} {"train_loss": -38.79460525512695, "global_step": 118065, "epoch": 975} {"train_loss": -38.007450103759766, "global_step": 118066, "epoch": 975} {"train_loss": -38.847023010253906, "global_step": 118067, "epoch": 975} {"train_loss": -38.03711700439453, "global_step": 118068, "epoch": 975} {"train_loss": -39.2110710144043, "global_step": 118069, "epoch": 975} {"train_loss": -38.8629150390625, "global_step": 118070, "epoch": 975} {"train_loss": -38.271480560302734, "global_step": 118071, "epoch": 975} {"train_loss": -38.1727409362793, "global_step": 118072, "epoch": 975} {"train_loss": -39.18952178955078, "global_step": 118073, "epoch": 975} {"train_loss": -39.297576904296875, "global_step": 118074, "epoch": 975} {"train_loss": -38.498714447021484, "global_step": 118075, "epoch": 975} {"train_loss": -38.066925048828125, "global_step": 118076, "epoch": 975} {"train_loss": -38.37832260131836, "global_step": 118077, "epoch": 975} {"train_loss": -37.026973724365234, "global_step": 118078, "epoch": 975} {"train_loss": -39.17036819458008, "global_step": 118079, "epoch": 975} {"train_loss": -38.225826263427734, "global_step": 118080, "epoch": 975} {"train_loss": -38.35126876831055, "global_step": 118081, "epoch": 975} {"train_loss": -37.248321533203125, "global_step": 118082, "epoch": 975} {"train_loss": -38.52323532104492, "global_step": 118083, "epoch": 975} {"train_loss": -34.655609130859375, "global_step": 118084, "epoch": 975} {"train_loss": -37.593910217285156, "global_step": 118085, "epoch": 975} {"train_loss": -38.56623077392578, "global_step": 118086, "epoch": 975} {"train_loss": -34.49856948852539, "global_step": 118087, "epoch": 975} {"train_loss": -34.444915771484375, "global_step": 118088, "epoch": 975} {"train_loss": -35.1765251159668, "global_step": 118089, "epoch": 975} {"train_loss": -36.19990158081055, "global_step": 118090, "epoch": 975} {"train_loss": -33.87941360473633, "global_step": 118091, "epoch": 975} {"train_loss": -32.893524169921875, "global_step": 118092, "epoch": 975} {"train_loss": -28.37135887145996, "global_step": 118093, "epoch": 975} {"train_loss": -36.461769104003906, "global_step": 118094, "epoch": 975} {"train_loss": -37.84937016826031, "global_step": 118095, "epoch": 975, "val_loss": 2796862.0} {"train_loss": -30.954015731811523, "global_step": 118096, "epoch": 976} {"train_loss": -35.30012130737305, "global_step": 118097, "epoch": 976} {"train_loss": -32.064842224121094, "global_step": 118098, "epoch": 976} {"train_loss": -20.54437828063965, "global_step": 118099, "epoch": 976} {"train_loss": -33.15186309814453, "global_step": 118100, "epoch": 976} {"train_loss": -25.888208389282227, "global_step": 118101, "epoch": 976} {"train_loss": -21.132373809814453, "global_step": 118102, "epoch": 976} {"train_loss": -29.9785213470459, "global_step": 118103, "epoch": 976} {"train_loss": -30.850910186767578, "global_step": 118104, "epoch": 976} {"train_loss": -35.65908432006836, "global_step": 118105, "epoch": 976} {"train_loss": -29.423566818237305, "global_step": 118106, "epoch": 976} {"train_loss": -29.378864288330078, "global_step": 118107, "epoch": 976} {"train_loss": -32.68177032470703, "global_step": 118108, "epoch": 976} {"train_loss": -29.255573272705078, "global_step": 118109, "epoch": 976} {"train_loss": -34.455318450927734, "global_step": 118110, "epoch": 976} {"train_loss": -33.1916618347168, "global_step": 118111, "epoch": 976} {"train_loss": -31.757200241088867, "global_step": 118112, "epoch": 976} {"train_loss": -32.921146392822266, "global_step": 118113, "epoch": 976} {"train_loss": -34.4902458190918, "global_step": 118114, "epoch": 976} {"train_loss": -34.69184112548828, "global_step": 118115, "epoch": 976} {"train_loss": -35.44154739379883, "global_step": 118116, "epoch": 976} {"train_loss": -34.26945877075195, "global_step": 118117, "epoch": 976} {"train_loss": -34.808895111083984, "global_step": 118118, "epoch": 976} {"train_loss": -33.29471969604492, "global_step": 118119, "epoch": 976} {"train_loss": -35.87295150756836, "global_step": 118120, "epoch": 976} {"train_loss": -35.237857818603516, "global_step": 118121, "epoch": 976} {"train_loss": -34.72505569458008, "global_step": 118122, "epoch": 976} {"train_loss": -34.989044189453125, "global_step": 118123, "epoch": 976} {"train_loss": -35.22461700439453, "global_step": 118124, "epoch": 976} {"train_loss": -34.59051513671875, "global_step": 118125, "epoch": 976} {"train_loss": -35.50790023803711, "global_step": 118126, "epoch": 976} {"train_loss": -35.07865524291992, "global_step": 118127, "epoch": 976} {"train_loss": -35.970314025878906, "global_step": 118128, "epoch": 976} {"train_loss": -35.79935836791992, "global_step": 118129, "epoch": 976} {"train_loss": -36.132720947265625, "global_step": 118130, "epoch": 976} {"train_loss": -35.44356918334961, "global_step": 118131, "epoch": 976} {"train_loss": -35.92975616455078, "global_step": 118132, "epoch": 976} {"train_loss": -36.558082580566406, "global_step": 118133, "epoch": 976} {"train_loss": -35.54328536987305, "global_step": 118134, "epoch": 976} {"train_loss": -36.30076217651367, "global_step": 118135, "epoch": 976} {"train_loss": -36.32424545288086, "global_step": 118136, "epoch": 976} {"train_loss": -36.31136703491211, "global_step": 118137, "epoch": 976} {"train_loss": -35.950950622558594, "global_step": 118138, "epoch": 976} {"train_loss": -36.73969650268555, "global_step": 118139, "epoch": 976} {"train_loss": -36.037994384765625, "global_step": 118140, "epoch": 976} {"train_loss": -36.90462875366211, "global_step": 118141, "epoch": 976} {"train_loss": -36.136268615722656, "global_step": 118142, "epoch": 976} {"train_loss": -35.915809631347656, "global_step": 118143, "epoch": 976} {"train_loss": -36.68781280517578, "global_step": 118144, "epoch": 976} {"train_loss": -36.56305694580078, "global_step": 118145, "epoch": 976} {"train_loss": -36.19910430908203, "global_step": 118146, "epoch": 976} {"train_loss": -36.81156539916992, "global_step": 118147, "epoch": 976} {"train_loss": -37.056434631347656, "global_step": 118148, "epoch": 976} {"train_loss": -36.6388053894043, "global_step": 118149, "epoch": 976} {"train_loss": -36.9439697265625, "global_step": 118150, "epoch": 976} {"train_loss": -36.74360275268555, "global_step": 118151, "epoch": 976} {"train_loss": -36.650691986083984, "global_step": 118152, "epoch": 976} {"train_loss": -37.113399505615234, "global_step": 118153, "epoch": 976} {"train_loss": -36.745094299316406, "global_step": 118154, "epoch": 976} {"train_loss": -37.310237884521484, "global_step": 118155, "epoch": 976} {"train_loss": -36.6779899597168, "global_step": 118156, "epoch": 976} {"train_loss": -37.89339065551758, "global_step": 118157, "epoch": 976} {"train_loss": -37.63370895385742, "global_step": 118158, "epoch": 976} {"train_loss": -36.90555953979492, "global_step": 118159, "epoch": 976} {"train_loss": -37.44793701171875, "global_step": 118160, "epoch": 976} {"train_loss": -37.15018081665039, "global_step": 118161, "epoch": 976} {"train_loss": -38.1826286315918, "global_step": 118162, "epoch": 976} {"train_loss": -36.73894119262695, "global_step": 118163, "epoch": 976} {"train_loss": -36.86638641357422, "global_step": 118164, "epoch": 976} {"train_loss": -37.67915344238281, "global_step": 118165, "epoch": 976} {"train_loss": -37.392513275146484, "global_step": 118166, "epoch": 976} {"train_loss": -37.690101623535156, "global_step": 118167, "epoch": 976} {"train_loss": -37.948421478271484, "global_step": 118168, "epoch": 976} {"train_loss": -37.44840621948242, "global_step": 118169, "epoch": 976} {"train_loss": -37.591514587402344, "global_step": 118170, "epoch": 976} {"train_loss": -38.078765869140625, "global_step": 118171, "epoch": 976} {"train_loss": -37.59847640991211, "global_step": 118172, "epoch": 976} {"train_loss": -37.57196807861328, "global_step": 118173, "epoch": 976} {"train_loss": -37.2889404296875, "global_step": 118174, "epoch": 976} {"train_loss": -38.170875549316406, "global_step": 118175, "epoch": 976} {"train_loss": -37.86930465698242, "global_step": 118176, "epoch": 976} {"train_loss": -37.8106803894043, "global_step": 118177, "epoch": 976} {"train_loss": -37.58476257324219, "global_step": 118178, "epoch": 976} {"train_loss": -38.14431381225586, "global_step": 118179, "epoch": 976} {"train_loss": -38.103092193603516, "global_step": 118180, "epoch": 976} {"train_loss": -37.7169189453125, "global_step": 118181, "epoch": 976} {"train_loss": -38.13985061645508, "global_step": 118182, "epoch": 976} {"train_loss": -38.6966667175293, "global_step": 118183, "epoch": 976} {"train_loss": -38.165077209472656, "global_step": 118184, "epoch": 976} {"train_loss": -38.73827362060547, "global_step": 118185, "epoch": 976} {"train_loss": -38.4162483215332, "global_step": 118186, "epoch": 976} {"train_loss": -38.60548782348633, "global_step": 118187, "epoch": 976} {"train_loss": -38.67676544189453, "global_step": 118188, "epoch": 976} {"train_loss": -38.322872161865234, "global_step": 118189, "epoch": 976} {"train_loss": -38.17917251586914, "global_step": 118190, "epoch": 976} {"train_loss": -38.5186653137207, "global_step": 118191, "epoch": 976} {"train_loss": -38.208518981933594, "global_step": 118192, "epoch": 976} {"train_loss": -38.685516357421875, "global_step": 118193, "epoch": 976} {"train_loss": -38.11249542236328, "global_step": 118194, "epoch": 976} {"train_loss": -37.932491302490234, "global_step": 118195, "epoch": 976} {"train_loss": -39.219459533691406, "global_step": 118196, "epoch": 976} {"train_loss": -38.4403190612793, "global_step": 118197, "epoch": 976} {"train_loss": -37.415687561035156, "global_step": 118198, "epoch": 976} {"train_loss": -37.92445755004883, "global_step": 118199, "epoch": 976} {"train_loss": -38.10131072998047, "global_step": 118200, "epoch": 976} {"train_loss": -37.36100387573242, "global_step": 118201, "epoch": 976} {"train_loss": -37.78268051147461, "global_step": 118202, "epoch": 976} {"train_loss": -38.57206344604492, "global_step": 118203, "epoch": 976} {"train_loss": -37.53139877319336, "global_step": 118204, "epoch": 976} {"train_loss": -38.21675491333008, "global_step": 118205, "epoch": 976} {"train_loss": -38.185142517089844, "global_step": 118206, "epoch": 976} {"train_loss": -37.74363327026367, "global_step": 118207, "epoch": 976} {"train_loss": -38.510223388671875, "global_step": 118208, "epoch": 976} {"train_loss": -37.7650146484375, "global_step": 118209, "epoch": 976} {"train_loss": -38.51348876953125, "global_step": 118210, "epoch": 976} {"train_loss": -38.84682083129883, "global_step": 118211, "epoch": 976} {"train_loss": -38.454566955566406, "global_step": 118212, "epoch": 976} {"train_loss": -39.06443405151367, "global_step": 118213, "epoch": 976} {"train_loss": -38.40502166748047, "global_step": 118214, "epoch": 976} {"train_loss": -38.700557708740234, "global_step": 118215, "epoch": 976} {"train_loss": -36.15128701580458, "global_step": 118216, "epoch": 976, "val_loss": 2756779.25} {"train_loss": -38.38680648803711, "global_step": 118217, "epoch": 977} {"train_loss": -38.84096145629883, "global_step": 118218, "epoch": 977} {"train_loss": -38.72225570678711, "global_step": 118219, "epoch": 977} {"train_loss": -38.278717041015625, "global_step": 118220, "epoch": 977} {"train_loss": -38.551448822021484, "global_step": 118221, "epoch": 977} {"train_loss": -37.97986602783203, "global_step": 118222, "epoch": 977} {"train_loss": -38.92274856567383, "global_step": 118223, "epoch": 977} {"train_loss": -38.62431335449219, "global_step": 118224, "epoch": 977} {"train_loss": -37.46562194824219, "global_step": 118225, "epoch": 977} {"train_loss": -38.366004943847656, "global_step": 118226, "epoch": 977} {"train_loss": -38.27407455444336, "global_step": 118227, "epoch": 977} {"train_loss": -38.918087005615234, "global_step": 118228, "epoch": 977} {"train_loss": -38.34609603881836, "global_step": 118229, "epoch": 977} {"train_loss": -37.17976379394531, "global_step": 118230, "epoch": 977} {"train_loss": -36.233917236328125, "global_step": 118231, "epoch": 977} {"train_loss": -31.013208389282227, "global_step": 118232, "epoch": 977} {"train_loss": -23.9638671875, "global_step": 118233, "epoch": 977} {"train_loss": -24.318992614746094, "global_step": 118234, "epoch": 977} {"train_loss": -32.490291595458984, "global_step": 118235, "epoch": 977} {"train_loss": -35.90668869018555, "global_step": 118236, "epoch": 977} {"train_loss": -29.233545303344727, "global_step": 118237, "epoch": 977} {"train_loss": -36.76215744018555, "global_step": 118238, "epoch": 977} {"train_loss": -31.561548233032227, "global_step": 118239, "epoch": 977} {"train_loss": -36.842708587646484, "global_step": 118240, "epoch": 977} {"train_loss": -33.68471908569336, "global_step": 118241, "epoch": 977} {"train_loss": -36.38859939575195, "global_step": 118242, "epoch": 977} {"train_loss": -34.843997955322266, "global_step": 118243, "epoch": 977} {"train_loss": -36.38423538208008, "global_step": 118244, "epoch": 977} {"train_loss": -35.8021240234375, "global_step": 118245, "epoch": 977} {"train_loss": -37.29119110107422, "global_step": 118246, "epoch": 977} {"train_loss": -33.9552001953125, "global_step": 118247, "epoch": 977} {"train_loss": -36.463294982910156, "global_step": 118248, "epoch": 977} {"train_loss": -34.93365478515625, "global_step": 118249, "epoch": 977} {"train_loss": -35.695804595947266, "global_step": 118250, "epoch": 977} {"train_loss": -36.421844482421875, "global_step": 118251, "epoch": 977} {"train_loss": -36.218257904052734, "global_step": 118252, "epoch": 977} {"train_loss": -36.67847442626953, "global_step": 118253, "epoch": 977} {"train_loss": -36.646236419677734, "global_step": 118254, "epoch": 977} {"train_loss": -37.832275390625, "global_step": 118255, "epoch": 977} {"train_loss": -37.01837158203125, "global_step": 118256, "epoch": 977} {"train_loss": -37.22598648071289, "global_step": 118257, "epoch": 977} {"train_loss": -37.659786224365234, "global_step": 118258, "epoch": 977} {"train_loss": -38.174564361572266, "global_step": 118259, "epoch": 977} {"train_loss": -37.42047119140625, "global_step": 118260, "epoch": 977} {"train_loss": -37.8833122253418, "global_step": 118261, "epoch": 977} {"train_loss": -37.916831970214844, "global_step": 118262, "epoch": 977} {"train_loss": -38.08559036254883, "global_step": 118263, "epoch": 977} {"train_loss": -37.892364501953125, "global_step": 118264, "epoch": 977} {"train_loss": -38.16901779174805, "global_step": 118265, "epoch": 977} {"train_loss": -38.44437789916992, "global_step": 118266, "epoch": 977} {"train_loss": -38.16388702392578, "global_step": 118267, "epoch": 977} {"train_loss": -38.23845291137695, "global_step": 118268, "epoch": 977} {"train_loss": -38.69481658935547, "global_step": 118269, "epoch": 977} {"train_loss": -37.043460845947266, "global_step": 118270, "epoch": 977} {"train_loss": -38.11420822143555, "global_step": 118271, "epoch": 977} {"train_loss": -38.014400482177734, "global_step": 118272, "epoch": 977} {"train_loss": -38.04700469970703, "global_step": 118273, "epoch": 977} {"train_loss": -38.785491943359375, "global_step": 118274, "epoch": 977} {"train_loss": -38.1462287902832, "global_step": 118275, "epoch": 977} {"train_loss": -38.52151107788086, "global_step": 118276, "epoch": 977} {"train_loss": -37.50983810424805, "global_step": 118277, "epoch": 977} {"train_loss": -38.497802734375, "global_step": 118278, "epoch": 977} {"train_loss": -38.626129150390625, "global_step": 118279, "epoch": 977} {"train_loss": -38.86304473876953, "global_step": 118280, "epoch": 977} {"train_loss": -38.66482162475586, "global_step": 118281, "epoch": 977} {"train_loss": -38.98128890991211, "global_step": 118282, "epoch": 977} {"train_loss": -38.612361907958984, "global_step": 118283, "epoch": 977} {"train_loss": -38.409385681152344, "global_step": 118284, "epoch": 977} {"train_loss": -38.78390121459961, "global_step": 118285, "epoch": 977} {"train_loss": -38.72783660888672, "global_step": 118286, "epoch": 977} {"train_loss": -39.05215072631836, "global_step": 118287, "epoch": 977} {"train_loss": -39.00164794921875, "global_step": 118288, "epoch": 977} {"train_loss": -38.400184631347656, "global_step": 118289, "epoch": 977} {"train_loss": -38.73420333862305, "global_step": 118290, "epoch": 977} {"train_loss": -38.73795700073242, "global_step": 118291, "epoch": 977} {"train_loss": -38.76588439941406, "global_step": 118292, "epoch": 977} {"train_loss": -38.791107177734375, "global_step": 118293, "epoch": 977} {"train_loss": -38.95083236694336, "global_step": 118294, "epoch": 977} {"train_loss": -38.69301986694336, "global_step": 118295, "epoch": 977} {"train_loss": -38.99730682373047, "global_step": 118296, "epoch": 977} {"train_loss": -39.24013900756836, "global_step": 118297, "epoch": 977} {"train_loss": -38.70551681518555, "global_step": 118298, "epoch": 977} {"train_loss": -38.53219223022461, "global_step": 118299, "epoch": 977} {"train_loss": -38.879520416259766, "global_step": 118300, "epoch": 977} {"train_loss": -39.09798812866211, "global_step": 118301, "epoch": 977} {"train_loss": -39.171504974365234, "global_step": 118302, "epoch": 977} {"train_loss": -38.533260345458984, "global_step": 118303, "epoch": 977} {"train_loss": -39.651512145996094, "global_step": 118304, "epoch": 977} {"train_loss": -39.08466720581055, "global_step": 118305, "epoch": 977} {"train_loss": -39.39153289794922, "global_step": 118306, "epoch": 977} {"train_loss": -38.904048919677734, "global_step": 118307, "epoch": 977} {"train_loss": -38.52810287475586, "global_step": 118308, "epoch": 977} {"train_loss": -38.7547721862793, "global_step": 118309, "epoch": 977} {"train_loss": -38.713966369628906, "global_step": 118310, "epoch": 977} {"train_loss": -38.602020263671875, "global_step": 118311, "epoch": 977} {"train_loss": -38.3547477722168, "global_step": 118312, "epoch": 977} {"train_loss": -37.61733627319336, "global_step": 118313, "epoch": 977} {"train_loss": -36.66009521484375, "global_step": 118314, "epoch": 977} {"train_loss": -37.24308776855469, "global_step": 118315, "epoch": 977} {"train_loss": -38.622554779052734, "global_step": 118316, "epoch": 977} {"train_loss": -37.62635040283203, "global_step": 118317, "epoch": 977} {"train_loss": -37.00840377807617, "global_step": 118318, "epoch": 977} {"train_loss": -37.66933822631836, "global_step": 118319, "epoch": 977} {"train_loss": -35.97809982299805, "global_step": 118320, "epoch": 977} {"train_loss": -37.96897506713867, "global_step": 118321, "epoch": 977} {"train_loss": -36.96487045288086, "global_step": 118322, "epoch": 977} {"train_loss": -36.58396530151367, "global_step": 118323, "epoch": 977} {"train_loss": -38.57279586791992, "global_step": 118324, "epoch": 977} {"train_loss": -37.65812301635742, "global_step": 118325, "epoch": 977} {"train_loss": -35.92656326293945, "global_step": 118326, "epoch": 977} {"train_loss": -35.828060150146484, "global_step": 118327, "epoch": 977} {"train_loss": -37.971595764160156, "global_step": 118328, "epoch": 977} {"train_loss": -37.97345733642578, "global_step": 118329, "epoch": 977} {"train_loss": -35.5613899230957, "global_step": 118330, "epoch": 977} {"train_loss": -38.369808197021484, "global_step": 118331, "epoch": 977} {"train_loss": -37.35720443725586, "global_step": 118332, "epoch": 977} {"train_loss": -36.43497848510742, "global_step": 118333, "epoch": 977} {"train_loss": -37.66565704345703, "global_step": 118334, "epoch": 977} {"train_loss": -37.37919998168945, "global_step": 118335, "epoch": 977} {"train_loss": -36.55418395996094, "global_step": 118336, "epoch": 977} {"train_loss": -37.35289510616586, "global_step": 118337, "epoch": 977, "val_loss": 2716558.25} {"train_loss": -38.320247650146484, "global_step": 118338, "epoch": 978} {"train_loss": -37.568519592285156, "global_step": 118339, "epoch": 978} {"train_loss": -39.01002883911133, "global_step": 118340, "epoch": 978} {"train_loss": -38.31605529785156, "global_step": 118341, "epoch": 978} {"train_loss": -38.582820892333984, "global_step": 118342, "epoch": 978} {"train_loss": -38.716487884521484, "global_step": 118343, "epoch": 978} {"train_loss": -38.833465576171875, "global_step": 118344, "epoch": 978} {"train_loss": -38.30350875854492, "global_step": 118345, "epoch": 978} {"train_loss": -38.16950607299805, "global_step": 118346, "epoch": 978} {"train_loss": -38.61055374145508, "global_step": 118347, "epoch": 978} {"train_loss": -39.15815734863281, "global_step": 118348, "epoch": 978} {"train_loss": -38.544158935546875, "global_step": 118349, "epoch": 978} {"train_loss": -39.063045501708984, "global_step": 118350, "epoch": 978} {"train_loss": -38.04270553588867, "global_step": 118351, "epoch": 978} {"train_loss": -38.992347717285156, "global_step": 118352, "epoch": 978} {"train_loss": -38.967010498046875, "global_step": 118353, "epoch": 978} {"train_loss": -38.409095764160156, "global_step": 118354, "epoch": 978} {"train_loss": -38.73615646362305, "global_step": 118355, "epoch": 978} {"train_loss": -38.62925338745117, "global_step": 118356, "epoch": 978} {"train_loss": -39.42544174194336, "global_step": 118357, "epoch": 978} {"train_loss": -38.806453704833984, "global_step": 118358, "epoch": 978} {"train_loss": -39.378448486328125, "global_step": 118359, "epoch": 978} {"train_loss": -39.16952896118164, "global_step": 118360, "epoch": 978} {"train_loss": -39.06190490722656, "global_step": 118361, "epoch": 978} {"train_loss": -39.59153366088867, "global_step": 118362, "epoch": 978} {"train_loss": -39.19014358520508, "global_step": 118363, "epoch": 978} {"train_loss": -39.43288040161133, "global_step": 118364, "epoch": 978} {"train_loss": -39.55247116088867, "global_step": 118365, "epoch": 978} {"train_loss": -39.00699234008789, "global_step": 118366, "epoch": 978} {"train_loss": -39.72432327270508, "global_step": 118367, "epoch": 978} {"train_loss": -39.45659255981445, "global_step": 118368, "epoch": 978} {"train_loss": -39.47495651245117, "global_step": 118369, "epoch": 978} {"train_loss": -39.665584564208984, "global_step": 118370, "epoch": 978} {"train_loss": -39.0269889831543, "global_step": 118371, "epoch": 978} {"train_loss": -39.604732513427734, "global_step": 118372, "epoch": 978} {"train_loss": -39.682228088378906, "global_step": 118373, "epoch": 978} {"train_loss": -39.87092971801758, "global_step": 118374, "epoch": 978} {"train_loss": -39.6135368347168, "global_step": 118375, "epoch": 978} {"train_loss": -39.2440185546875, "global_step": 118376, "epoch": 978} {"train_loss": -38.92206573486328, "global_step": 118377, "epoch": 978} {"train_loss": -39.312557220458984, "global_step": 118378, "epoch": 978} {"train_loss": -39.973609924316406, "global_step": 118379, "epoch": 978} {"train_loss": -39.60165023803711, "global_step": 118380, "epoch": 978} {"train_loss": -39.703128814697266, "global_step": 118381, "epoch": 978} {"train_loss": -39.34174728393555, "global_step": 118382, "epoch": 978} {"train_loss": -38.94452667236328, "global_step": 118383, "epoch": 978} {"train_loss": -39.9649772644043, "global_step": 118384, "epoch": 978} {"train_loss": -39.5857048034668, "global_step": 118385, "epoch": 978} {"train_loss": -39.3592414855957, "global_step": 118386, "epoch": 978} {"train_loss": -39.53453826904297, "global_step": 118387, "epoch": 978} {"train_loss": -39.049407958984375, "global_step": 118388, "epoch": 978} {"train_loss": -36.802391052246094, "global_step": 118389, "epoch": 978} {"train_loss": -35.43244552612305, "global_step": 118390, "epoch": 978} {"train_loss": -37.60646438598633, "global_step": 118391, "epoch": 978} {"train_loss": -38.44043731689453, "global_step": 118392, "epoch": 978} {"train_loss": -37.786376953125, "global_step": 118393, "epoch": 978} {"train_loss": -37.171810150146484, "global_step": 118394, "epoch": 978} {"train_loss": -39.221893310546875, "global_step": 118395, "epoch": 978} {"train_loss": -36.43354415893555, "global_step": 118396, "epoch": 978} {"train_loss": -38.17409133911133, "global_step": 118397, "epoch": 978} {"train_loss": -38.40572738647461, "global_step": 118398, "epoch": 978} {"train_loss": -37.85329055786133, "global_step": 118399, "epoch": 978} {"train_loss": -37.69691848754883, "global_step": 118400, "epoch": 978} {"train_loss": -38.89093017578125, "global_step": 118401, "epoch": 978} {"train_loss": -37.8983039855957, "global_step": 118402, "epoch": 978} {"train_loss": -37.774810791015625, "global_step": 118403, "epoch": 978} {"train_loss": -38.124366760253906, "global_step": 118404, "epoch": 978} {"train_loss": -36.808956146240234, "global_step": 118405, "epoch": 978} {"train_loss": -37.6572265625, "global_step": 118406, "epoch": 978} {"train_loss": -38.83369064331055, "global_step": 118407, "epoch": 978} {"train_loss": -38.036766052246094, "global_step": 118408, "epoch": 978} {"train_loss": -35.00245666503906, "global_step": 118409, "epoch": 978} {"train_loss": -35.62925338745117, "global_step": 118410, "epoch": 978} {"train_loss": -37.23236083984375, "global_step": 118411, "epoch": 978} {"train_loss": -38.06944274902344, "global_step": 118412, "epoch": 978} {"train_loss": -37.44338607788086, "global_step": 118413, "epoch": 978} {"train_loss": -38.360816955566406, "global_step": 118414, "epoch": 978} {"train_loss": -36.52858352661133, "global_step": 118415, "epoch": 978} {"train_loss": -36.638336181640625, "global_step": 118416, "epoch": 978} {"train_loss": -37.352577209472656, "global_step": 118417, "epoch": 978} {"train_loss": -36.01389694213867, "global_step": 118418, "epoch": 978} {"train_loss": -37.07955551147461, "global_step": 118419, "epoch": 978} {"train_loss": -33.37160873413086, "global_step": 118420, "epoch": 978} {"train_loss": -36.62838363647461, "global_step": 118421, "epoch": 978} {"train_loss": -37.350990295410156, "global_step": 118422, "epoch": 978} {"train_loss": -36.93645095825195, "global_step": 118423, "epoch": 978} {"train_loss": -36.851051330566406, "global_step": 118424, "epoch": 978} {"train_loss": -37.041744232177734, "global_step": 118425, "epoch": 978} {"train_loss": -37.718441009521484, "global_step": 118426, "epoch": 978} {"train_loss": -37.77153396606445, "global_step": 118427, "epoch": 978} {"train_loss": -34.84403610229492, "global_step": 118428, "epoch": 978} {"train_loss": -38.36492156982422, "global_step": 118429, "epoch": 978} {"train_loss": -38.13589096069336, "global_step": 118430, "epoch": 978} {"train_loss": -36.190120697021484, "global_step": 118431, "epoch": 978} {"train_loss": -36.91521072387695, "global_step": 118432, "epoch": 978} {"train_loss": -38.93180465698242, "global_step": 118433, "epoch": 978} {"train_loss": -37.8730583190918, "global_step": 118434, "epoch": 978} {"train_loss": -38.47930908203125, "global_step": 118435, "epoch": 978} {"train_loss": -38.221458435058594, "global_step": 118436, "epoch": 978} {"train_loss": -38.05326461791992, "global_step": 118437, "epoch": 978} {"train_loss": -37.173580169677734, "global_step": 118438, "epoch": 978} {"train_loss": -37.96367645263672, "global_step": 118439, "epoch": 978} {"train_loss": -39.260475158691406, "global_step": 118440, "epoch": 978} {"train_loss": -39.05019760131836, "global_step": 118441, "epoch": 978} {"train_loss": -38.5155029296875, "global_step": 118442, "epoch": 978} {"train_loss": -38.28555679321289, "global_step": 118443, "epoch": 978} {"train_loss": -38.7216911315918, "global_step": 118444, "epoch": 978} {"train_loss": -38.46038818359375, "global_step": 118445, "epoch": 978} {"train_loss": -38.9259147644043, "global_step": 118446, "epoch": 978} {"train_loss": -39.03252410888672, "global_step": 118447, "epoch": 978} {"train_loss": -37.682281494140625, "global_step": 118448, "epoch": 978} {"train_loss": -38.52065658569336, "global_step": 118449, "epoch": 978} {"train_loss": -39.0541877746582, "global_step": 118450, "epoch": 978} {"train_loss": -38.9119873046875, "global_step": 118451, "epoch": 978} {"train_loss": -39.276397705078125, "global_step": 118452, "epoch": 978} {"train_loss": -38.42734909057617, "global_step": 118453, "epoch": 978} {"train_loss": -38.677520751953125, "global_step": 118454, "epoch": 978} {"train_loss": -39.1512565612793, "global_step": 118455, "epoch": 978} {"train_loss": -38.702632904052734, "global_step": 118456, "epoch": 978} {"train_loss": -38.78855514526367, "global_step": 118457, "epoch": 978} {"train_loss": -38.315697504469185, "global_step": 118458, "epoch": 978, "val_loss": 2713456.25} {"train_loss": -38.10634231567383, "global_step": 118459, "epoch": 979} {"train_loss": -39.15787124633789, "global_step": 118460, "epoch": 979} {"train_loss": -39.265357971191406, "global_step": 118461, "epoch": 979} {"train_loss": -39.15351486206055, "global_step": 118462, "epoch": 979} {"train_loss": -38.15003204345703, "global_step": 118463, "epoch": 979} {"train_loss": -39.678619384765625, "global_step": 118464, "epoch": 979} {"train_loss": -39.1574821472168, "global_step": 118465, "epoch": 979} {"train_loss": -38.47724533081055, "global_step": 118466, "epoch": 979} {"train_loss": -38.860877990722656, "global_step": 118467, "epoch": 979} {"train_loss": -39.0498046875, "global_step": 118468, "epoch": 979} {"train_loss": -39.7008056640625, "global_step": 118469, "epoch": 979} {"train_loss": -39.42041015625, "global_step": 118470, "epoch": 979} {"train_loss": -37.37189865112305, "global_step": 118471, "epoch": 979} {"train_loss": -38.63092041015625, "global_step": 118472, "epoch": 979} {"train_loss": -38.85358428955078, "global_step": 118473, "epoch": 979} {"train_loss": -38.9782829284668, "global_step": 118474, "epoch": 979} {"train_loss": -39.93327713012695, "global_step": 118475, "epoch": 979} {"train_loss": -39.272823333740234, "global_step": 118476, "epoch": 979} {"train_loss": -38.96965408325195, "global_step": 118477, "epoch": 979} {"train_loss": -39.30820083618164, "global_step": 118478, "epoch": 979} {"train_loss": -38.925968170166016, "global_step": 118479, "epoch": 979} {"train_loss": -39.61894989013672, "global_step": 118480, "epoch": 979} {"train_loss": -39.809234619140625, "global_step": 118481, "epoch": 979} {"train_loss": -39.58603286743164, "global_step": 118482, "epoch": 979} {"train_loss": -39.952884674072266, "global_step": 118483, "epoch": 979} {"train_loss": -39.73472213745117, "global_step": 118484, "epoch": 979} {"train_loss": -38.4806022644043, "global_step": 118485, "epoch": 979} {"train_loss": -39.47585678100586, "global_step": 118486, "epoch": 979} {"train_loss": -38.39707565307617, "global_step": 118487, "epoch": 979} {"train_loss": -37.1778678894043, "global_step": 118488, "epoch": 979} {"train_loss": -33.61499786376953, "global_step": 118489, "epoch": 979} {"train_loss": -29.265731811523438, "global_step": 118490, "epoch": 979} {"train_loss": -24.142765045166016, "global_step": 118491, "epoch": 979} {"train_loss": -30.553632736206055, "global_step": 118492, "epoch": 979} {"train_loss": -38.96775817871094, "global_step": 118493, "epoch": 979} {"train_loss": -33.35007858276367, "global_step": 118494, "epoch": 979} {"train_loss": -31.171987533569336, "global_step": 118495, "epoch": 979} {"train_loss": -37.89943313598633, "global_step": 118496, "epoch": 979} {"train_loss": -33.22846603393555, "global_step": 118497, "epoch": 979} {"train_loss": -38.13273239135742, "global_step": 118498, "epoch": 979} {"train_loss": -33.1338005065918, "global_step": 118499, "epoch": 979} {"train_loss": -33.848941802978516, "global_step": 118500, "epoch": 979} {"train_loss": -36.60626983642578, "global_step": 118501, "epoch": 979} {"train_loss": -37.60173416137695, "global_step": 118502, "epoch": 979} {"train_loss": -36.97927474975586, "global_step": 118503, "epoch": 979} {"train_loss": -36.5565299987793, "global_step": 118504, "epoch": 979} {"train_loss": -36.53765869140625, "global_step": 118505, "epoch": 979} {"train_loss": -36.536922454833984, "global_step": 118506, "epoch": 979} {"train_loss": -37.08684158325195, "global_step": 118507, "epoch": 979} {"train_loss": -37.5296745300293, "global_step": 118508, "epoch": 979} {"train_loss": -37.45105743408203, "global_step": 118509, "epoch": 979} {"train_loss": -37.499568939208984, "global_step": 118510, "epoch": 979} {"train_loss": -38.55177688598633, "global_step": 118511, "epoch": 979} {"train_loss": -37.877071380615234, "global_step": 118512, "epoch": 979} {"train_loss": -37.915016174316406, "global_step": 118513, "epoch": 979} {"train_loss": -38.119136810302734, "global_step": 118514, "epoch": 979} {"train_loss": -37.723304748535156, "global_step": 118515, "epoch": 979} {"train_loss": -38.932010650634766, "global_step": 118516, "epoch": 979} {"train_loss": -38.55970764160156, "global_step": 118517, "epoch": 979} {"train_loss": -38.67549133300781, "global_step": 118518, "epoch": 979} {"train_loss": -37.904151916503906, "global_step": 118519, "epoch": 979} {"train_loss": -39.05446243286133, "global_step": 118520, "epoch": 979} {"train_loss": -38.4785270690918, "global_step": 118521, "epoch": 979} {"train_loss": -38.77418899536133, "global_step": 118522, "epoch": 979} {"train_loss": -38.92892074584961, "global_step": 118523, "epoch": 979} {"train_loss": -38.409767150878906, "global_step": 118524, "epoch": 979} {"train_loss": -39.06556701660156, "global_step": 118525, "epoch": 979} {"train_loss": -38.676265716552734, "global_step": 118526, "epoch": 979} {"train_loss": -38.908363342285156, "global_step": 118527, "epoch": 979} {"train_loss": -38.5220832824707, "global_step": 118528, "epoch": 979} {"train_loss": -38.785621643066406, "global_step": 118529, "epoch": 979} {"train_loss": -39.54136276245117, "global_step": 118530, "epoch": 979} {"train_loss": -39.3406982421875, "global_step": 118531, "epoch": 979} {"train_loss": -39.36336135864258, "global_step": 118532, "epoch": 979} {"train_loss": -39.190704345703125, "global_step": 118533, "epoch": 979} {"train_loss": -39.08066177368164, "global_step": 118534, "epoch": 979} {"train_loss": -39.21244430541992, "global_step": 118535, "epoch": 979} {"train_loss": -39.212459564208984, "global_step": 118536, "epoch": 979} {"train_loss": -38.794376373291016, "global_step": 118537, "epoch": 979} {"train_loss": -37.40552520751953, "global_step": 118538, "epoch": 979} {"train_loss": -39.02106475830078, "global_step": 118539, "epoch": 979} {"train_loss": -38.004390716552734, "global_step": 118540, "epoch": 979} {"train_loss": -39.691673278808594, "global_step": 118541, "epoch": 979} {"train_loss": -39.510494232177734, "global_step": 118542, "epoch": 979} {"train_loss": -39.609886169433594, "global_step": 118543, "epoch": 979} {"train_loss": -39.38587188720703, "global_step": 118544, "epoch": 979} {"train_loss": -39.70650100708008, "global_step": 118545, "epoch": 979} {"train_loss": -39.3380126953125, "global_step": 118546, "epoch": 979} {"train_loss": -38.690467834472656, "global_step": 118547, "epoch": 979} {"train_loss": -38.01702880859375, "global_step": 118548, "epoch": 979} {"train_loss": -39.26668930053711, "global_step": 118549, "epoch": 979} {"train_loss": -38.77933120727539, "global_step": 118550, "epoch": 979} {"train_loss": -38.99658966064453, "global_step": 118551, "epoch": 979} {"train_loss": -39.73441696166992, "global_step": 118552, "epoch": 979} {"train_loss": -38.123443603515625, "global_step": 118553, "epoch": 979} {"train_loss": -38.64304733276367, "global_step": 118554, "epoch": 979} {"train_loss": -39.915618896484375, "global_step": 118555, "epoch": 979} {"train_loss": -38.41211700439453, "global_step": 118556, "epoch": 979} {"train_loss": -39.23457717895508, "global_step": 118557, "epoch": 979} {"train_loss": -38.68377685546875, "global_step": 118558, "epoch": 979} {"train_loss": -38.380584716796875, "global_step": 118559, "epoch": 979} {"train_loss": -38.75952911376953, "global_step": 118560, "epoch": 979} {"train_loss": -39.39756393432617, "global_step": 118561, "epoch": 979} {"train_loss": -39.274654388427734, "global_step": 118562, "epoch": 979} {"train_loss": -39.42234420776367, "global_step": 118563, "epoch": 979} {"train_loss": -39.83157730102539, "global_step": 118564, "epoch": 979} {"train_loss": -37.501712799072266, "global_step": 118565, "epoch": 979} {"train_loss": -39.45664596557617, "global_step": 118566, "epoch": 979} {"train_loss": -38.12766647338867, "global_step": 118567, "epoch": 979} {"train_loss": -37.6472282409668, "global_step": 118568, "epoch": 979} {"train_loss": -39.61500930786133, "global_step": 118569, "epoch": 979} {"train_loss": -39.38347244262695, "global_step": 118570, "epoch": 979} {"train_loss": -39.2349739074707, "global_step": 118571, "epoch": 979} {"train_loss": -38.03925704956055, "global_step": 118572, "epoch": 979} {"train_loss": -38.19036102294922, "global_step": 118573, "epoch": 979} {"train_loss": -38.75544357299805, "global_step": 118574, "epoch": 979} {"train_loss": -36.83665466308594, "global_step": 118575, "epoch": 979} {"train_loss": -35.951416015625, "global_step": 118576, "epoch": 979} {"train_loss": -32.06410598754883, "global_step": 118577, "epoch": 979} {"train_loss": -28.73860740661621, "global_step": 118578, "epoch": 979} {"train_loss": -37.93116859562141, "global_step": 118579, "epoch": 979, "val_loss": 2648823.25} {"train_loss": -36.0868034362793, "global_step": 118580, "epoch": 980} {"train_loss": -37.6873779296875, "global_step": 118581, "epoch": 980} {"train_loss": -36.795867919921875, "global_step": 118582, "epoch": 980} {"train_loss": -36.044677734375, "global_step": 118583, "epoch": 980} {"train_loss": -36.648250579833984, "global_step": 118584, "epoch": 980} {"train_loss": -37.422306060791016, "global_step": 118585, "epoch": 980} {"train_loss": -37.65354919433594, "global_step": 118586, "epoch": 980} {"train_loss": -37.80664825439453, "global_step": 118587, "epoch": 980} {"train_loss": -37.85524368286133, "global_step": 118588, "epoch": 980} {"train_loss": -37.99290466308594, "global_step": 118589, "epoch": 980} {"train_loss": -37.16068649291992, "global_step": 118590, "epoch": 980} {"train_loss": -37.883541107177734, "global_step": 118591, "epoch": 980} {"train_loss": -37.10740280151367, "global_step": 118592, "epoch": 980} {"train_loss": -37.88295364379883, "global_step": 118593, "epoch": 980} {"train_loss": -36.298439025878906, "global_step": 118594, "epoch": 980} {"train_loss": -37.747291564941406, "global_step": 118595, "epoch": 980} {"train_loss": -38.98780059814453, "global_step": 118596, "epoch": 980} {"train_loss": -38.39118194580078, "global_step": 118597, "epoch": 980} {"train_loss": -38.10111618041992, "global_step": 118598, "epoch": 980} {"train_loss": -37.47929382324219, "global_step": 118599, "epoch": 980} {"train_loss": -38.63370895385742, "global_step": 118600, "epoch": 980} {"train_loss": -38.3988151550293, "global_step": 118601, "epoch": 980} {"train_loss": -38.41775894165039, "global_step": 118602, "epoch": 980} {"train_loss": -38.935115814208984, "global_step": 118603, "epoch": 980} {"train_loss": -37.10642623901367, "global_step": 118604, "epoch": 980} {"train_loss": -37.7381706237793, "global_step": 118605, "epoch": 980} {"train_loss": -38.8983268737793, "global_step": 118606, "epoch": 980} {"train_loss": -39.12943649291992, "global_step": 118607, "epoch": 980} {"train_loss": -38.54304122924805, "global_step": 118608, "epoch": 980} {"train_loss": -37.50631332397461, "global_step": 118609, "epoch": 980} {"train_loss": -39.16426467895508, "global_step": 118610, "epoch": 980} {"train_loss": -38.3065071105957, "global_step": 118611, "epoch": 980} {"train_loss": -35.991546630859375, "global_step": 118612, "epoch": 980} {"train_loss": -38.643245697021484, "global_step": 118613, "epoch": 980} {"train_loss": -38.13496780395508, "global_step": 118614, "epoch": 980} {"train_loss": -38.56066131591797, "global_step": 118615, "epoch": 980} {"train_loss": -38.88688278198242, "global_step": 118616, "epoch": 980} {"train_loss": -37.637447357177734, "global_step": 118617, "epoch": 980} {"train_loss": -38.93614196777344, "global_step": 118618, "epoch": 980} {"train_loss": -38.857696533203125, "global_step": 118619, "epoch": 980} {"train_loss": -38.38155746459961, "global_step": 118620, "epoch": 980} {"train_loss": -38.55793380737305, "global_step": 118621, "epoch": 980} {"train_loss": -37.02195358276367, "global_step": 118622, "epoch": 980} {"train_loss": -37.61720275878906, "global_step": 118623, "epoch": 980} {"train_loss": -38.012752532958984, "global_step": 118624, "epoch": 980} {"train_loss": -39.30106735229492, "global_step": 118625, "epoch": 980} {"train_loss": -39.32024002075195, "global_step": 118626, "epoch": 980} {"train_loss": -38.720157623291016, "global_step": 118627, "epoch": 980} {"train_loss": -31.987516403198242, "global_step": 118628, "epoch": 980} {"train_loss": -37.35848617553711, "global_step": 118629, "epoch": 980} {"train_loss": -38.7977294921875, "global_step": 118630, "epoch": 980} {"train_loss": -39.16970443725586, "global_step": 118631, "epoch": 980} {"train_loss": -38.5198860168457, "global_step": 118632, "epoch": 980} {"train_loss": -37.453853607177734, "global_step": 118633, "epoch": 980} {"train_loss": -38.981475830078125, "global_step": 118634, "epoch": 980} {"train_loss": -37.399986267089844, "global_step": 118635, "epoch": 980} {"train_loss": -38.64835739135742, "global_step": 118636, "epoch": 980} {"train_loss": -38.96063995361328, "global_step": 118637, "epoch": 980} {"train_loss": -38.18983459472656, "global_step": 118638, "epoch": 980} {"train_loss": -37.67307662963867, "global_step": 118639, "epoch": 980} {"train_loss": -38.95779037475586, "global_step": 118640, "epoch": 980} {"train_loss": -39.12736892700195, "global_step": 118641, "epoch": 980} {"train_loss": -37.95992660522461, "global_step": 118642, "epoch": 980} {"train_loss": -38.24918746948242, "global_step": 118643, "epoch": 980} {"train_loss": -36.63604736328125, "global_step": 118644, "epoch": 980} {"train_loss": -36.90835189819336, "global_step": 118645, "epoch": 980} {"train_loss": -37.470333099365234, "global_step": 118646, "epoch": 980} {"train_loss": -38.21254348754883, "global_step": 118647, "epoch": 980} {"train_loss": -37.351806640625, "global_step": 118648, "epoch": 980} {"train_loss": -37.18919372558594, "global_step": 118649, "epoch": 980} {"train_loss": -38.09038162231445, "global_step": 118650, "epoch": 980} {"train_loss": -37.33510971069336, "global_step": 118651, "epoch": 980} {"train_loss": -37.944149017333984, "global_step": 118652, "epoch": 980} {"train_loss": -37.839595794677734, "global_step": 118653, "epoch": 980} {"train_loss": -36.445472717285156, "global_step": 118654, "epoch": 980} {"train_loss": -38.1110954284668, "global_step": 118655, "epoch": 980} {"train_loss": -36.4407958984375, "global_step": 118656, "epoch": 980} {"train_loss": -38.13178253173828, "global_step": 118657, "epoch": 980} {"train_loss": -35.39107131958008, "global_step": 118658, "epoch": 980} {"train_loss": -33.627662658691406, "global_step": 118659, "epoch": 980} {"train_loss": -37.78416061401367, "global_step": 118660, "epoch": 980} {"train_loss": -35.18523025512695, "global_step": 118661, "epoch": 980} {"train_loss": -36.72773361206055, "global_step": 118662, "epoch": 980} {"train_loss": -37.4703369140625, "global_step": 118663, "epoch": 980} {"train_loss": -38.56507873535156, "global_step": 118664, "epoch": 980} {"train_loss": -36.45436096191406, "global_step": 118665, "epoch": 980} {"train_loss": -37.43595886230469, "global_step": 118666, "epoch": 980} {"train_loss": -38.331451416015625, "global_step": 118667, "epoch": 980} {"train_loss": -38.35850143432617, "global_step": 118668, "epoch": 980} {"train_loss": -38.309539794921875, "global_step": 118669, "epoch": 980} {"train_loss": -37.48013687133789, "global_step": 118670, "epoch": 980} {"train_loss": -37.81268310546875, "global_step": 118671, "epoch": 980} {"train_loss": -35.227779388427734, "global_step": 118672, "epoch": 980} {"train_loss": -37.471927642822266, "global_step": 118673, "epoch": 980} {"train_loss": -38.70638656616211, "global_step": 118674, "epoch": 980} {"train_loss": -36.2288703918457, "global_step": 118675, "epoch": 980} {"train_loss": -38.69315719604492, "global_step": 118676, "epoch": 980} {"train_loss": -37.74508285522461, "global_step": 118677, "epoch": 980} {"train_loss": -36.130062103271484, "global_step": 118678, "epoch": 980} {"train_loss": -38.360137939453125, "global_step": 118679, "epoch": 980} {"train_loss": -38.69968795776367, "global_step": 118680, "epoch": 980} {"train_loss": -38.2795524597168, "global_step": 118681, "epoch": 980} {"train_loss": -36.567081451416016, "global_step": 118682, "epoch": 980} {"train_loss": -38.9770622253418, "global_step": 118683, "epoch": 980} {"train_loss": -38.31068801879883, "global_step": 118684, "epoch": 980} {"train_loss": -38.967098236083984, "global_step": 118685, "epoch": 980} {"train_loss": -39.2542724609375, "global_step": 118686, "epoch": 980} {"train_loss": -37.54630661010742, "global_step": 118687, "epoch": 980} {"train_loss": -38.88979721069336, "global_step": 118688, "epoch": 980} {"train_loss": -39.06926727294922, "global_step": 118689, "epoch": 980} {"train_loss": -39.03139114379883, "global_step": 118690, "epoch": 980} {"train_loss": -38.961727142333984, "global_step": 118691, "epoch": 980} {"train_loss": -36.46356964111328, "global_step": 118692, "epoch": 980} {"train_loss": -38.13351058959961, "global_step": 118693, "epoch": 980} {"train_loss": -38.440635681152344, "global_step": 118694, "epoch": 980} {"train_loss": -38.42264938354492, "global_step": 118695, "epoch": 980} {"train_loss": -38.6300048828125, "global_step": 118696, "epoch": 980} {"train_loss": -38.4356803894043, "global_step": 118697, "epoch": 980} {"train_loss": -37.26888656616211, "global_step": 118698, "epoch": 980} {"train_loss": -38.269569396972656, "global_step": 118699, "epoch": 980} {"train_loss": -37.82714678236275, "global_step": 118700, "epoch": 980, "val_loss": 2671706.75} {"train_loss": -38.423458099365234, "global_step": 118701, "epoch": 981} {"train_loss": -37.969093322753906, "global_step": 118702, "epoch": 981} {"train_loss": -38.680267333984375, "global_step": 118703, "epoch": 981} {"train_loss": -39.226497650146484, "global_step": 118704, "epoch": 981} {"train_loss": -38.834232330322266, "global_step": 118705, "epoch": 981} {"train_loss": -38.86818313598633, "global_step": 118706, "epoch": 981} {"train_loss": -36.80186462402344, "global_step": 118707, "epoch": 981} {"train_loss": -38.498165130615234, "global_step": 118708, "epoch": 981} {"train_loss": -38.85130310058594, "global_step": 118709, "epoch": 981} {"train_loss": -38.7930908203125, "global_step": 118710, "epoch": 981} {"train_loss": -37.84149932861328, "global_step": 118711, "epoch": 981} {"train_loss": -39.541595458984375, "global_step": 118712, "epoch": 981} {"train_loss": -37.97229766845703, "global_step": 118713, "epoch": 981} {"train_loss": -38.884979248046875, "global_step": 118714, "epoch": 981} {"train_loss": -39.49732971191406, "global_step": 118715, "epoch": 981} {"train_loss": -38.63991928100586, "global_step": 118716, "epoch": 981} {"train_loss": -39.26963424682617, "global_step": 118717, "epoch": 981} {"train_loss": -38.8846321105957, "global_step": 118718, "epoch": 981} {"train_loss": -39.076881408691406, "global_step": 118719, "epoch": 981} {"train_loss": -38.89341354370117, "global_step": 118720, "epoch": 981} {"train_loss": -38.63768005371094, "global_step": 118721, "epoch": 981} {"train_loss": -39.1213493347168, "global_step": 118722, "epoch": 981} {"train_loss": -39.1551628112793, "global_step": 118723, "epoch": 981} {"train_loss": -39.9318962097168, "global_step": 118724, "epoch": 981} {"train_loss": -39.07604217529297, "global_step": 118725, "epoch": 981} {"train_loss": -39.314998626708984, "global_step": 118726, "epoch": 981} {"train_loss": -39.34010314941406, "global_step": 118727, "epoch": 981} {"train_loss": -39.181007385253906, "global_step": 118728, "epoch": 981} {"train_loss": -39.174922943115234, "global_step": 118729, "epoch": 981} {"train_loss": -39.07163619995117, "global_step": 118730, "epoch": 981} {"train_loss": -39.87361145019531, "global_step": 118731, "epoch": 981} {"train_loss": -38.69655990600586, "global_step": 118732, "epoch": 981} {"train_loss": -39.2190055847168, "global_step": 118733, "epoch": 981} {"train_loss": -39.403846740722656, "global_step": 118734, "epoch": 981} {"train_loss": -39.74978256225586, "global_step": 118735, "epoch": 981} {"train_loss": -39.6679801940918, "global_step": 118736, "epoch": 981} {"train_loss": -39.29264450073242, "global_step": 118737, "epoch": 981} {"train_loss": -39.27092742919922, "global_step": 118738, "epoch": 981} {"train_loss": -39.43473815917969, "global_step": 118739, "epoch": 981} {"train_loss": -38.6739501953125, "global_step": 118740, "epoch": 981} {"train_loss": -39.09858322143555, "global_step": 118741, "epoch": 981} {"train_loss": -39.87493896484375, "global_step": 118742, "epoch": 981} {"train_loss": -39.54072952270508, "global_step": 118743, "epoch": 981} {"train_loss": -39.867916107177734, "global_step": 118744, "epoch": 981} {"train_loss": -39.37583541870117, "global_step": 118745, "epoch": 981} {"train_loss": -36.8741340637207, "global_step": 118746, "epoch": 981} {"train_loss": -39.18009567260742, "global_step": 118747, "epoch": 981} {"train_loss": -36.90871047973633, "global_step": 118748, "epoch": 981} {"train_loss": -39.939327239990234, "global_step": 118749, "epoch": 981} {"train_loss": -39.76065444946289, "global_step": 118750, "epoch": 981} {"train_loss": -39.283966064453125, "global_step": 118751, "epoch": 981} {"train_loss": -38.85002899169922, "global_step": 118752, "epoch": 981} {"train_loss": -38.504478454589844, "global_step": 118753, "epoch": 981} {"train_loss": -38.05349349975586, "global_step": 118754, "epoch": 981} {"train_loss": -38.48881149291992, "global_step": 118755, "epoch": 981} {"train_loss": -39.7802734375, "global_step": 118756, "epoch": 981} {"train_loss": -39.45777893066406, "global_step": 118757, "epoch": 981} {"train_loss": -38.951663970947266, "global_step": 118758, "epoch": 981} {"train_loss": -39.205055236816406, "global_step": 118759, "epoch": 981} {"train_loss": -37.97986602783203, "global_step": 118760, "epoch": 981} {"train_loss": -35.76176071166992, "global_step": 118761, "epoch": 981} {"train_loss": -38.23311233520508, "global_step": 118762, "epoch": 981} {"train_loss": -38.55280685424805, "global_step": 118763, "epoch": 981} {"train_loss": -38.450225830078125, "global_step": 118764, "epoch": 981} {"train_loss": -38.369571685791016, "global_step": 118765, "epoch": 981} {"train_loss": -37.780555725097656, "global_step": 118766, "epoch": 981} {"train_loss": -38.4605712890625, "global_step": 118767, "epoch": 981} {"train_loss": -38.623374938964844, "global_step": 118768, "epoch": 981} {"train_loss": -37.89351272583008, "global_step": 118769, "epoch": 981} {"train_loss": -36.59233093261719, "global_step": 118770, "epoch": 981} {"train_loss": -37.385475158691406, "global_step": 118771, "epoch": 981} {"train_loss": -34.565147399902344, "global_step": 118772, "epoch": 981} {"train_loss": -35.7380485534668, "global_step": 118773, "epoch": 981} {"train_loss": -33.97420883178711, "global_step": 118774, "epoch": 981} {"train_loss": -34.82218551635742, "global_step": 118775, "epoch": 981} {"train_loss": -35.86127471923828, "global_step": 118776, "epoch": 981} {"train_loss": -36.83369064331055, "global_step": 118777, "epoch": 981} {"train_loss": -38.98006820678711, "global_step": 118778, "epoch": 981} {"train_loss": -36.34721755981445, "global_step": 118779, "epoch": 981} {"train_loss": -38.33675765991211, "global_step": 118780, "epoch": 981} {"train_loss": -38.13306427001953, "global_step": 118781, "epoch": 981} {"train_loss": -37.68589401245117, "global_step": 118782, "epoch": 981} {"train_loss": -36.966182708740234, "global_step": 118783, "epoch": 981} {"train_loss": -38.473182678222656, "global_step": 118784, "epoch": 981} {"train_loss": -36.772315979003906, "global_step": 118785, "epoch": 981} {"train_loss": -36.24116897583008, "global_step": 118786, "epoch": 981} {"train_loss": -38.06511306762695, "global_step": 118787, "epoch": 981} {"train_loss": -39.30973434448242, "global_step": 118788, "epoch": 981} {"train_loss": -38.54026412963867, "global_step": 118789, "epoch": 981} {"train_loss": -38.260738372802734, "global_step": 118790, "epoch": 981} {"train_loss": -39.23472595214844, "global_step": 118791, "epoch": 981} {"train_loss": -37.9098014831543, "global_step": 118792, "epoch": 981} {"train_loss": -38.54996109008789, "global_step": 118793, "epoch": 981} {"train_loss": -38.5863037109375, "global_step": 118794, "epoch": 981} {"train_loss": -38.9334602355957, "global_step": 118795, "epoch": 981} {"train_loss": -39.4431266784668, "global_step": 118796, "epoch": 981} {"train_loss": -39.10660934448242, "global_step": 118797, "epoch": 981} {"train_loss": -38.8719596862793, "global_step": 118798, "epoch": 981} {"train_loss": -39.28945541381836, "global_step": 118799, "epoch": 981} {"train_loss": -38.8548698425293, "global_step": 118800, "epoch": 981} {"train_loss": -39.04446029663086, "global_step": 118801, "epoch": 981} {"train_loss": -39.211334228515625, "global_step": 118802, "epoch": 981} {"train_loss": -39.376399993896484, "global_step": 118803, "epoch": 981} {"train_loss": -39.547607421875, "global_step": 118804, "epoch": 981} {"train_loss": -39.04386901855469, "global_step": 118805, "epoch": 981} {"train_loss": -37.890480041503906, "global_step": 118806, "epoch": 981} {"train_loss": -39.36974334716797, "global_step": 118807, "epoch": 981} {"train_loss": -39.427120208740234, "global_step": 118808, "epoch": 981} {"train_loss": -39.80074691772461, "global_step": 118809, "epoch": 981} {"train_loss": -38.63668441772461, "global_step": 118810, "epoch": 981} {"train_loss": -37.216087341308594, "global_step": 118811, "epoch": 981} {"train_loss": -38.79190444946289, "global_step": 118812, "epoch": 981} {"train_loss": -38.08621597290039, "global_step": 118813, "epoch": 981} {"train_loss": -39.70737838745117, "global_step": 118814, "epoch": 981} {"train_loss": -38.97773361206055, "global_step": 118815, "epoch": 981} {"train_loss": -39.09096908569336, "global_step": 118816, "epoch": 981} {"train_loss": -38.94289779663086, "global_step": 118817, "epoch": 981} {"train_loss": -39.429195404052734, "global_step": 118818, "epoch": 981} {"train_loss": -38.89208221435547, "global_step": 118819, "epoch": 981} {"train_loss": -39.44207763671875, "global_step": 118820, "epoch": 981} {"train_loss": -38.55751772163328, "global_step": 118821, "epoch": 981, "val_loss": 2774282.75} {"train_loss": -38.65522384643555, "global_step": 118822, "epoch": 982} {"train_loss": -39.85521697998047, "global_step": 118823, "epoch": 982} {"train_loss": -38.304847717285156, "global_step": 118824, "epoch": 982} {"train_loss": -38.77199935913086, "global_step": 118825, "epoch": 982} {"train_loss": -39.17676544189453, "global_step": 118826, "epoch": 982} {"train_loss": -39.59279251098633, "global_step": 118827, "epoch": 982} {"train_loss": -39.566986083984375, "global_step": 118828, "epoch": 982} {"train_loss": -39.745643615722656, "global_step": 118829, "epoch": 982} {"train_loss": -38.956268310546875, "global_step": 118830, "epoch": 982} {"train_loss": -40.01018142700195, "global_step": 118831, "epoch": 982} {"train_loss": -39.995601654052734, "global_step": 118832, "epoch": 982} {"train_loss": -39.51598358154297, "global_step": 118833, "epoch": 982} {"train_loss": -38.294830322265625, "global_step": 118834, "epoch": 982} {"train_loss": -39.86518478393555, "global_step": 118835, "epoch": 982} {"train_loss": -39.12464141845703, "global_step": 118836, "epoch": 982} {"train_loss": -39.066402435302734, "global_step": 118837, "epoch": 982} {"train_loss": -40.11246109008789, "global_step": 118838, "epoch": 982} {"train_loss": -39.23151397705078, "global_step": 118839, "epoch": 982} {"train_loss": -38.82046127319336, "global_step": 118840, "epoch": 982} {"train_loss": -38.740379333496094, "global_step": 118841, "epoch": 982} {"train_loss": -38.5500602722168, "global_step": 118842, "epoch": 982} {"train_loss": -37.68288803100586, "global_step": 118843, "epoch": 982} {"train_loss": -39.30215835571289, "global_step": 118844, "epoch": 982} {"train_loss": -39.2568244934082, "global_step": 118845, "epoch": 982} {"train_loss": -38.54923629760742, "global_step": 118846, "epoch": 982} {"train_loss": -38.425933837890625, "global_step": 118847, "epoch": 982} {"train_loss": -38.99821853637695, "global_step": 118848, "epoch": 982} {"train_loss": -39.368194580078125, "global_step": 118849, "epoch": 982} {"train_loss": -39.47380447387695, "global_step": 118850, "epoch": 982} {"train_loss": -37.83423614501953, "global_step": 118851, "epoch": 982} {"train_loss": -36.411128997802734, "global_step": 118852, "epoch": 982} {"train_loss": -37.95857238769531, "global_step": 118853, "epoch": 982} {"train_loss": -38.90245056152344, "global_step": 118854, "epoch": 982} {"train_loss": -39.893985748291016, "global_step": 118855, "epoch": 982} {"train_loss": -38.70725631713867, "global_step": 118856, "epoch": 982} {"train_loss": -38.0244026184082, "global_step": 118857, "epoch": 982} {"train_loss": -38.313201904296875, "global_step": 118858, "epoch": 982} {"train_loss": -38.6099739074707, "global_step": 118859, "epoch": 982} {"train_loss": -35.95555114746094, "global_step": 118860, "epoch": 982} {"train_loss": -37.60511016845703, "global_step": 118861, "epoch": 982} {"train_loss": -35.522151947021484, "global_step": 118862, "epoch": 982} {"train_loss": -39.14555740356445, "global_step": 118863, "epoch": 982} {"train_loss": -37.81532669067383, "global_step": 118864, "epoch": 982} {"train_loss": -35.731353759765625, "global_step": 118865, "epoch": 982} {"train_loss": -34.53942108154297, "global_step": 118866, "epoch": 982} {"train_loss": -38.21491241455078, "global_step": 118867, "epoch": 982} {"train_loss": -39.30807876586914, "global_step": 118868, "epoch": 982} {"train_loss": -37.39539337158203, "global_step": 118869, "epoch": 982} {"train_loss": -37.19149398803711, "global_step": 118870, "epoch": 982} {"train_loss": -38.020957946777344, "global_step": 118871, "epoch": 982} {"train_loss": -39.032257080078125, "global_step": 118872, "epoch": 982} {"train_loss": -37.98060989379883, "global_step": 118873, "epoch": 982} {"train_loss": -34.515926361083984, "global_step": 118874, "epoch": 982} {"train_loss": -36.94755172729492, "global_step": 118875, "epoch": 982} {"train_loss": -37.230159759521484, "global_step": 118876, "epoch": 982} {"train_loss": -36.519866943359375, "global_step": 118877, "epoch": 982} {"train_loss": -36.004493713378906, "global_step": 118878, "epoch": 982} {"train_loss": -38.58095932006836, "global_step": 118879, "epoch": 982} {"train_loss": -36.93653869628906, "global_step": 118880, "epoch": 982} {"train_loss": -36.477291107177734, "global_step": 118881, "epoch": 982} {"train_loss": -37.3056755065918, "global_step": 118882, "epoch": 982} {"train_loss": -38.5198974609375, "global_step": 118883, "epoch": 982} {"train_loss": -36.106624603271484, "global_step": 118884, "epoch": 982} {"train_loss": -38.51484298706055, "global_step": 118885, "epoch": 982} {"train_loss": -38.9136848449707, "global_step": 118886, "epoch": 982} {"train_loss": -39.22275924682617, "global_step": 118887, "epoch": 982} {"train_loss": -37.28593063354492, "global_step": 118888, "epoch": 982} {"train_loss": -37.65383529663086, "global_step": 118889, "epoch": 982} {"train_loss": -39.02851104736328, "global_step": 118890, "epoch": 982} {"train_loss": -37.77204132080078, "global_step": 118891, "epoch": 982} {"train_loss": -37.11045455932617, "global_step": 118892, "epoch": 982} {"train_loss": -37.58605194091797, "global_step": 118893, "epoch": 982} {"train_loss": -39.41130447387695, "global_step": 118894, "epoch": 982} {"train_loss": -36.922340393066406, "global_step": 118895, "epoch": 982} {"train_loss": -39.252227783203125, "global_step": 118896, "epoch": 982} {"train_loss": -38.443939208984375, "global_step": 118897, "epoch": 982} {"train_loss": -38.1308708190918, "global_step": 118898, "epoch": 982} {"train_loss": -38.212501525878906, "global_step": 118899, "epoch": 982} {"train_loss": -38.428714752197266, "global_step": 118900, "epoch": 982} {"train_loss": -38.98191452026367, "global_step": 118901, "epoch": 982} {"train_loss": -38.7791748046875, "global_step": 118902, "epoch": 982} {"train_loss": -38.11335372924805, "global_step": 118903, "epoch": 982} {"train_loss": -38.63162612915039, "global_step": 118904, "epoch": 982} {"train_loss": -37.133907318115234, "global_step": 118905, "epoch": 982} {"train_loss": -39.47016525268555, "global_step": 118906, "epoch": 982} {"train_loss": -38.46053695678711, "global_step": 118907, "epoch": 982} {"train_loss": -39.30388259887695, "global_step": 118908, "epoch": 982} {"train_loss": -38.84889221191406, "global_step": 118909, "epoch": 982} {"train_loss": -38.854087829589844, "global_step": 118910, "epoch": 982} {"train_loss": -39.0986328125, "global_step": 118911, "epoch": 982} {"train_loss": -38.34708786010742, "global_step": 118912, "epoch": 982} {"train_loss": -39.38290023803711, "global_step": 118913, "epoch": 982} {"train_loss": -39.09821701049805, "global_step": 118914, "epoch": 982} {"train_loss": -39.029598236083984, "global_step": 118915, "epoch": 982} {"train_loss": -38.987300872802734, "global_step": 118916, "epoch": 982} {"train_loss": -39.04345703125, "global_step": 118917, "epoch": 982} {"train_loss": -39.43687057495117, "global_step": 118918, "epoch": 982} {"train_loss": -39.268917083740234, "global_step": 118919, "epoch": 982} {"train_loss": -38.74467849731445, "global_step": 118920, "epoch": 982} {"train_loss": -38.86649703979492, "global_step": 118921, "epoch": 982} {"train_loss": -39.00846862792969, "global_step": 118922, "epoch": 982} {"train_loss": -38.052886962890625, "global_step": 118923, "epoch": 982} {"train_loss": -40.09068298339844, "global_step": 118924, "epoch": 982} {"train_loss": -39.565914154052734, "global_step": 118925, "epoch": 982} {"train_loss": -39.63372039794922, "global_step": 118926, "epoch": 982} {"train_loss": -38.92115020751953, "global_step": 118927, "epoch": 982} {"train_loss": -38.927120208740234, "global_step": 118928, "epoch": 982} {"train_loss": -40.148284912109375, "global_step": 118929, "epoch": 982} {"train_loss": -39.842586517333984, "global_step": 118930, "epoch": 982} {"train_loss": -39.61859130859375, "global_step": 118931, "epoch": 982} {"train_loss": -38.088436126708984, "global_step": 118932, "epoch": 982} {"train_loss": -39.794830322265625, "global_step": 118933, "epoch": 982} {"train_loss": -39.955848693847656, "global_step": 118934, "epoch": 982} {"train_loss": -39.32564163208008, "global_step": 118935, "epoch": 982} {"train_loss": -39.83144760131836, "global_step": 118936, "epoch": 982} {"train_loss": -39.77635955810547, "global_step": 118937, "epoch": 982} {"train_loss": -39.79105758666992, "global_step": 118938, "epoch": 982} {"train_loss": -39.033870697021484, "global_step": 118939, "epoch": 982} {"train_loss": -39.80175018310547, "global_step": 118940, "epoch": 982} {"train_loss": -38.918399810791016, "global_step": 118941, "epoch": 982} {"train_loss": -38.52979369991082, "global_step": 118942, "epoch": 982, "val_loss": 2780890.25} {"train_loss": -38.60805892944336, "global_step": 118943, "epoch": 983} {"train_loss": -39.096099853515625, "global_step": 118944, "epoch": 983} {"train_loss": -38.84132766723633, "global_step": 118945, "epoch": 983} {"train_loss": -38.05714416503906, "global_step": 118946, "epoch": 983} {"train_loss": -38.0052375793457, "global_step": 118947, "epoch": 983} {"train_loss": -39.40958786010742, "global_step": 118948, "epoch": 983} {"train_loss": -39.42582321166992, "global_step": 118949, "epoch": 983} {"train_loss": -37.155738830566406, "global_step": 118950, "epoch": 983} {"train_loss": -38.16936111450195, "global_step": 118951, "epoch": 983} {"train_loss": -39.41053009033203, "global_step": 118952, "epoch": 983} {"train_loss": -37.3470573425293, "global_step": 118953, "epoch": 983} {"train_loss": -34.62309646606445, "global_step": 118954, "epoch": 983} {"train_loss": -37.926387786865234, "global_step": 118955, "epoch": 983} {"train_loss": -39.54365158081055, "global_step": 118956, "epoch": 983} {"train_loss": -38.50323486328125, "global_step": 118957, "epoch": 983} {"train_loss": -38.4269905090332, "global_step": 118958, "epoch": 983} {"train_loss": -38.570430755615234, "global_step": 118959, "epoch": 983} {"train_loss": -38.19315719604492, "global_step": 118960, "epoch": 983} {"train_loss": -38.04645919799805, "global_step": 118961, "epoch": 983} {"train_loss": -39.04985809326172, "global_step": 118962, "epoch": 983} {"train_loss": -39.18170928955078, "global_step": 118963, "epoch": 983} {"train_loss": -38.90573501586914, "global_step": 118964, "epoch": 983} {"train_loss": -37.21426010131836, "global_step": 118965, "epoch": 983} {"train_loss": -38.323299407958984, "global_step": 118966, "epoch": 983} {"train_loss": -38.42996597290039, "global_step": 118967, "epoch": 983} {"train_loss": -38.85738754272461, "global_step": 118968, "epoch": 983} {"train_loss": -38.4926872253418, "global_step": 118969, "epoch": 983} {"train_loss": -38.52315139770508, "global_step": 118970, "epoch": 983} {"train_loss": -38.293739318847656, "global_step": 118971, "epoch": 983} {"train_loss": -38.551368713378906, "global_step": 118972, "epoch": 983} {"train_loss": -39.2985954284668, "global_step": 118973, "epoch": 983} {"train_loss": -39.06861114501953, "global_step": 118974, "epoch": 983} {"train_loss": -38.605281829833984, "global_step": 118975, "epoch": 983} {"train_loss": -37.35215377807617, "global_step": 118976, "epoch": 983} {"train_loss": -38.742977142333984, "global_step": 118977, "epoch": 983} {"train_loss": -38.99494552612305, "global_step": 118978, "epoch": 983} {"train_loss": -38.80767059326172, "global_step": 118979, "epoch": 983} {"train_loss": -39.610591888427734, "global_step": 118980, "epoch": 983} {"train_loss": -39.13862228393555, "global_step": 118981, "epoch": 983} {"train_loss": -39.65810775756836, "global_step": 118982, "epoch": 983} {"train_loss": -39.88694763183594, "global_step": 118983, "epoch": 983} {"train_loss": -34.04360580444336, "global_step": 118984, "epoch": 983} {"train_loss": -39.14059066772461, "global_step": 118985, "epoch": 983} {"train_loss": -38.991634368896484, "global_step": 118986, "epoch": 983} {"train_loss": -39.84641647338867, "global_step": 118987, "epoch": 983} {"train_loss": -39.48991394042969, "global_step": 118988, "epoch": 983} {"train_loss": -38.44095993041992, "global_step": 118989, "epoch": 983} {"train_loss": -37.44742965698242, "global_step": 118990, "epoch": 983} {"train_loss": -38.753902435302734, "global_step": 118991, "epoch": 983} {"train_loss": -39.248870849609375, "global_step": 118992, "epoch": 983} {"train_loss": -38.760250091552734, "global_step": 118993, "epoch": 983} {"train_loss": -39.06039047241211, "global_step": 118994, "epoch": 983} {"train_loss": -39.64024353027344, "global_step": 118995, "epoch": 983} {"train_loss": -38.74750518798828, "global_step": 118996, "epoch": 983} {"train_loss": -40.0058479309082, "global_step": 118997, "epoch": 983} {"train_loss": -38.17375564575195, "global_step": 118998, "epoch": 983} {"train_loss": -39.477901458740234, "global_step": 118999, "epoch": 983} {"train_loss": -39.14631271362305, "global_step": 119000, "epoch": 983} {"train_loss": -38.7845458984375, "global_step": 119001, "epoch": 983} {"train_loss": -38.79519271850586, "global_step": 119002, "epoch": 983} {"train_loss": -39.50068283081055, "global_step": 119003, "epoch": 983} {"train_loss": -36.82200241088867, "global_step": 119004, "epoch": 983} {"train_loss": -39.1470832824707, "global_step": 119005, "epoch": 983} {"train_loss": -38.79885482788086, "global_step": 119006, "epoch": 983} {"train_loss": -39.37144470214844, "global_step": 119007, "epoch": 983} {"train_loss": -37.30810546875, "global_step": 119008, "epoch": 983} {"train_loss": -39.55494689941406, "global_step": 119009, "epoch": 983} {"train_loss": -39.6367301940918, "global_step": 119010, "epoch": 983} {"train_loss": -39.03935623168945, "global_step": 119011, "epoch": 983} {"train_loss": -39.13563919067383, "global_step": 119012, "epoch": 983} {"train_loss": -39.16567611694336, "global_step": 119013, "epoch": 983} {"train_loss": -38.913719177246094, "global_step": 119014, "epoch": 983} {"train_loss": -36.05257797241211, "global_step": 119015, "epoch": 983} {"train_loss": -38.10765838623047, "global_step": 119016, "epoch": 983} {"train_loss": -38.03542709350586, "global_step": 119017, "epoch": 983} {"train_loss": -39.35006332397461, "global_step": 119018, "epoch": 983} {"train_loss": -33.978240966796875, "global_step": 119019, "epoch": 983} {"train_loss": -37.97512435913086, "global_step": 119020, "epoch": 983} {"train_loss": -39.02494430541992, "global_step": 119021, "epoch": 983} {"train_loss": -37.688968658447266, "global_step": 119022, "epoch": 983} {"train_loss": -35.13149642944336, "global_step": 119023, "epoch": 983} {"train_loss": -39.2775764465332, "global_step": 119024, "epoch": 983} {"train_loss": -39.44782638549805, "global_step": 119025, "epoch": 983} {"train_loss": -37.702674865722656, "global_step": 119026, "epoch": 983} {"train_loss": -37.03837203979492, "global_step": 119027, "epoch": 983} {"train_loss": -37.3480339050293, "global_step": 119028, "epoch": 983} {"train_loss": -37.47932052612305, "global_step": 119029, "epoch": 983} {"train_loss": -38.368831634521484, "global_step": 119030, "epoch": 983} {"train_loss": -37.102596282958984, "global_step": 119031, "epoch": 983} {"train_loss": -37.30308151245117, "global_step": 119032, "epoch": 983} {"train_loss": -37.63249588012695, "global_step": 119033, "epoch": 983} {"train_loss": -36.1207160949707, "global_step": 119034, "epoch": 983} {"train_loss": -34.67742156982422, "global_step": 119035, "epoch": 983} {"train_loss": -38.141326904296875, "global_step": 119036, "epoch": 983} {"train_loss": -37.44802474975586, "global_step": 119037, "epoch": 983} {"train_loss": -36.598018646240234, "global_step": 119038, "epoch": 983} {"train_loss": -35.982051849365234, "global_step": 119039, "epoch": 983} {"train_loss": -35.97035598754883, "global_step": 119040, "epoch": 983} {"train_loss": -38.4520263671875, "global_step": 119041, "epoch": 983} {"train_loss": -34.84890365600586, "global_step": 119042, "epoch": 983} {"train_loss": -34.76668167114258, "global_step": 119043, "epoch": 983} {"train_loss": -37.85066223144531, "global_step": 119044, "epoch": 983} {"train_loss": -37.23869323730469, "global_step": 119045, "epoch": 983} {"train_loss": -36.851051330566406, "global_step": 119046, "epoch": 983} {"train_loss": -38.169395446777344, "global_step": 119047, "epoch": 983} {"train_loss": -38.05947494506836, "global_step": 119048, "epoch": 983} {"train_loss": -38.27146530151367, "global_step": 119049, "epoch": 983} {"train_loss": -36.20223617553711, "global_step": 119050, "epoch": 983} {"train_loss": -38.65443801879883, "global_step": 119051, "epoch": 983} {"train_loss": -37.22645950317383, "global_step": 119052, "epoch": 983} {"train_loss": -37.84877395629883, "global_step": 119053, "epoch": 983} {"train_loss": -37.90211868286133, "global_step": 119054, "epoch": 983} {"train_loss": -38.09444808959961, "global_step": 119055, "epoch": 983} {"train_loss": -38.44538497924805, "global_step": 119056, "epoch": 983} {"train_loss": -38.28052520751953, "global_step": 119057, "epoch": 983} {"train_loss": -38.120758056640625, "global_step": 119058, "epoch": 983} {"train_loss": -37.86843490600586, "global_step": 119059, "epoch": 983} {"train_loss": -37.60763168334961, "global_step": 119060, "epoch": 983} {"train_loss": -38.232505798339844, "global_step": 119061, "epoch": 983} {"train_loss": -38.21247482299805, "global_step": 119062, "epoch": 983} {"train_loss": -38.157101371071555, "global_step": 119063, "epoch": 983, "val_loss": 2706486.0} {"train_loss": -38.20731735229492, "global_step": 119064, "epoch": 984} {"train_loss": -38.30988693237305, "global_step": 119065, "epoch": 984} {"train_loss": -38.87248611450195, "global_step": 119066, "epoch": 984} {"train_loss": -38.32021713256836, "global_step": 119067, "epoch": 984} {"train_loss": -39.295711517333984, "global_step": 119068, "epoch": 984} {"train_loss": -38.957401275634766, "global_step": 119069, "epoch": 984} {"train_loss": -39.00877380371094, "global_step": 119070, "epoch": 984} {"train_loss": -38.71210479736328, "global_step": 119071, "epoch": 984} {"train_loss": -38.97426223754883, "global_step": 119072, "epoch": 984} {"train_loss": -38.80927658081055, "global_step": 119073, "epoch": 984} {"train_loss": -39.1871337890625, "global_step": 119074, "epoch": 984} {"train_loss": -38.52980041503906, "global_step": 119075, "epoch": 984} {"train_loss": -38.18899917602539, "global_step": 119076, "epoch": 984} {"train_loss": -38.71523666381836, "global_step": 119077, "epoch": 984} {"train_loss": -39.04173278808594, "global_step": 119078, "epoch": 984} {"train_loss": -38.576171875, "global_step": 119079, "epoch": 984} {"train_loss": -39.03815460205078, "global_step": 119080, "epoch": 984} {"train_loss": -38.92738342285156, "global_step": 119081, "epoch": 984} {"train_loss": -38.7913818359375, "global_step": 119082, "epoch": 984} {"train_loss": -38.728599548339844, "global_step": 119083, "epoch": 984} {"train_loss": -36.552894592285156, "global_step": 119084, "epoch": 984} {"train_loss": -36.54969024658203, "global_step": 119085, "epoch": 984} {"train_loss": -34.57062911987305, "global_step": 119086, "epoch": 984} {"train_loss": -34.32685852050781, "global_step": 119087, "epoch": 984} {"train_loss": -35.43995666503906, "global_step": 119088, "epoch": 984} {"train_loss": -37.38225555419922, "global_step": 119089, "epoch": 984} {"train_loss": -38.45269775390625, "global_step": 119090, "epoch": 984} {"train_loss": -34.869293212890625, "global_step": 119091, "epoch": 984} {"train_loss": -37.025611877441406, "global_step": 119092, "epoch": 984} {"train_loss": -38.77075958251953, "global_step": 119093, "epoch": 984} {"train_loss": -38.44443893432617, "global_step": 119094, "epoch": 984} {"train_loss": -37.517669677734375, "global_step": 119095, "epoch": 984} {"train_loss": -37.75469207763672, "global_step": 119096, "epoch": 984} {"train_loss": -38.889217376708984, "global_step": 119097, "epoch": 984} {"train_loss": -34.4366569519043, "global_step": 119098, "epoch": 984} {"train_loss": -37.27302932739258, "global_step": 119099, "epoch": 984} {"train_loss": -38.75828552246094, "global_step": 119100, "epoch": 984} {"train_loss": -35.48154067993164, "global_step": 119101, "epoch": 984} {"train_loss": -37.72040939331055, "global_step": 119102, "epoch": 984} {"train_loss": -38.12049102783203, "global_step": 119103, "epoch": 984} {"train_loss": -35.09931564331055, "global_step": 119104, "epoch": 984} {"train_loss": -38.369483947753906, "global_step": 119105, "epoch": 984} {"train_loss": -36.68067932128906, "global_step": 119106, "epoch": 984} {"train_loss": -37.89349365234375, "global_step": 119107, "epoch": 984} {"train_loss": -37.63481140136719, "global_step": 119108, "epoch": 984} {"train_loss": -38.40227508544922, "global_step": 119109, "epoch": 984} {"train_loss": -37.77130126953125, "global_step": 119110, "epoch": 984} {"train_loss": -38.026573181152344, "global_step": 119111, "epoch": 984} {"train_loss": -38.84892654418945, "global_step": 119112, "epoch": 984} {"train_loss": -38.13959884643555, "global_step": 119113, "epoch": 984} {"train_loss": -39.23212814331055, "global_step": 119114, "epoch": 984} {"train_loss": -38.210792541503906, "global_step": 119115, "epoch": 984} {"train_loss": -39.29311752319336, "global_step": 119116, "epoch": 984} {"train_loss": -38.8045768737793, "global_step": 119117, "epoch": 984} {"train_loss": -39.25305938720703, "global_step": 119118, "epoch": 984} {"train_loss": -38.62924575805664, "global_step": 119119, "epoch": 984} {"train_loss": -38.48649215698242, "global_step": 119120, "epoch": 984} {"train_loss": -38.836158752441406, "global_step": 119121, "epoch": 984} {"train_loss": -39.13956832885742, "global_step": 119122, "epoch": 984} {"train_loss": -38.35311508178711, "global_step": 119123, "epoch": 984} {"train_loss": -39.39160919189453, "global_step": 119124, "epoch": 984} {"train_loss": -38.77388381958008, "global_step": 119125, "epoch": 984} {"train_loss": -39.038082122802734, "global_step": 119126, "epoch": 984} {"train_loss": -39.03590393066406, "global_step": 119127, "epoch": 984} {"train_loss": -38.74544143676758, "global_step": 119128, "epoch": 984} {"train_loss": -38.88765335083008, "global_step": 119129, "epoch": 984} {"train_loss": -38.75947189331055, "global_step": 119130, "epoch": 984} {"train_loss": -39.009395599365234, "global_step": 119131, "epoch": 984} {"train_loss": -39.50603103637695, "global_step": 119132, "epoch": 984} {"train_loss": -39.2575798034668, "global_step": 119133, "epoch": 984} {"train_loss": -39.024410247802734, "global_step": 119134, "epoch": 984} {"train_loss": -39.535091400146484, "global_step": 119135, "epoch": 984} {"train_loss": -38.77973556518555, "global_step": 119136, "epoch": 984} {"train_loss": -39.54936599731445, "global_step": 119137, "epoch": 984} {"train_loss": -39.65585708618164, "global_step": 119138, "epoch": 984} {"train_loss": -39.400814056396484, "global_step": 119139, "epoch": 984} {"train_loss": -38.47894287109375, "global_step": 119140, "epoch": 984} {"train_loss": -38.30019760131836, "global_step": 119141, "epoch": 984} {"train_loss": -38.514583587646484, "global_step": 119142, "epoch": 984} {"train_loss": -39.01557159423828, "global_step": 119143, "epoch": 984} {"train_loss": -39.75914764404297, "global_step": 119144, "epoch": 984} {"train_loss": -38.829193115234375, "global_step": 119145, "epoch": 984} {"train_loss": -39.58277893066406, "global_step": 119146, "epoch": 984} {"train_loss": -37.3455924987793, "global_step": 119147, "epoch": 984} {"train_loss": -38.488346099853516, "global_step": 119148, "epoch": 984} {"train_loss": -38.64794921875, "global_step": 119149, "epoch": 984} {"train_loss": -39.384979248046875, "global_step": 119150, "epoch": 984} {"train_loss": -39.51992416381836, "global_step": 119151, "epoch": 984} {"train_loss": -37.0496711730957, "global_step": 119152, "epoch": 984} {"train_loss": -37.18843460083008, "global_step": 119153, "epoch": 984} {"train_loss": -37.99491500854492, "global_step": 119154, "epoch": 984} {"train_loss": -37.71851348876953, "global_step": 119155, "epoch": 984} {"train_loss": -39.32729721069336, "global_step": 119156, "epoch": 984} {"train_loss": -39.21612548828125, "global_step": 119157, "epoch": 984} {"train_loss": -38.9322395324707, "global_step": 119158, "epoch": 984} {"train_loss": -39.067527770996094, "global_step": 119159, "epoch": 984} {"train_loss": -38.75689697265625, "global_step": 119160, "epoch": 984} {"train_loss": -39.29136276245117, "global_step": 119161, "epoch": 984} {"train_loss": -39.714515686035156, "global_step": 119162, "epoch": 984} {"train_loss": -39.52225875854492, "global_step": 119163, "epoch": 984} {"train_loss": -38.75689697265625, "global_step": 119164, "epoch": 984} {"train_loss": -39.63936996459961, "global_step": 119165, "epoch": 984} {"train_loss": -39.130638122558594, "global_step": 119166, "epoch": 984} {"train_loss": -39.28548812866211, "global_step": 119167, "epoch": 984} {"train_loss": -39.32181930541992, "global_step": 119168, "epoch": 984} {"train_loss": -39.7320556640625, "global_step": 119169, "epoch": 984} {"train_loss": -39.532867431640625, "global_step": 119170, "epoch": 984} {"train_loss": -39.7829475402832, "global_step": 119171, "epoch": 984} {"train_loss": -39.675132751464844, "global_step": 119172, "epoch": 984} {"train_loss": -39.595760345458984, "global_step": 119173, "epoch": 984} {"train_loss": -38.88336181640625, "global_step": 119174, "epoch": 984} {"train_loss": -39.919429779052734, "global_step": 119175, "epoch": 984} {"train_loss": -39.763309478759766, "global_step": 119176, "epoch": 984} {"train_loss": -40.197914123535156, "global_step": 119177, "epoch": 984} {"train_loss": -38.862876892089844, "global_step": 119178, "epoch": 984} {"train_loss": -39.53007125854492, "global_step": 119179, "epoch": 984} {"train_loss": -38.9740104675293, "global_step": 119180, "epoch": 984} {"train_loss": -38.81635665893555, "global_step": 119181, "epoch": 984} {"train_loss": -38.63506317138672, "global_step": 119182, "epoch": 984} {"train_loss": -38.61015701293945, "global_step": 119183, "epoch": 984} {"train_loss": -38.5145118650326, "global_step": 119184, "epoch": 984, "val_loss": 2748185.75} {"train_loss": -39.69011306762695, "global_step": 119185, "epoch": 985} {"train_loss": -40.303871154785156, "global_step": 119186, "epoch": 985} {"train_loss": -39.84011459350586, "global_step": 119187, "epoch": 985} {"train_loss": -38.8189582824707, "global_step": 119188, "epoch": 985} {"train_loss": -35.66596221923828, "global_step": 119189, "epoch": 985} {"train_loss": -35.05718231201172, "global_step": 119190, "epoch": 985} {"train_loss": -31.8133544921875, "global_step": 119191, "epoch": 985} {"train_loss": -34.68975830078125, "global_step": 119192, "epoch": 985} {"train_loss": -36.97164535522461, "global_step": 119193, "epoch": 985} {"train_loss": -35.91969299316406, "global_step": 119194, "epoch": 985} {"train_loss": -32.75986862182617, "global_step": 119195, "epoch": 985} {"train_loss": -28.499374389648438, "global_step": 119196, "epoch": 985} {"train_loss": -35.647823333740234, "global_step": 119197, "epoch": 985} {"train_loss": -34.11307907104492, "global_step": 119198, "epoch": 985} {"train_loss": -36.56380844116211, "global_step": 119199, "epoch": 985} {"train_loss": -36.37923049926758, "global_step": 119200, "epoch": 985} {"train_loss": -34.64971160888672, "global_step": 119201, "epoch": 985} {"train_loss": -37.212215423583984, "global_step": 119202, "epoch": 985} {"train_loss": -37.158084869384766, "global_step": 119203, "epoch": 985} {"train_loss": -29.586362838745117, "global_step": 119204, "epoch": 985} {"train_loss": -36.45901107788086, "global_step": 119205, "epoch": 985} {"train_loss": -36.54925537109375, "global_step": 119206, "epoch": 985} {"train_loss": -36.32955551147461, "global_step": 119207, "epoch": 985} {"train_loss": -36.76575469970703, "global_step": 119208, "epoch": 985} {"train_loss": -37.255714416503906, "global_step": 119209, "epoch": 985} {"train_loss": -37.807125091552734, "global_step": 119210, "epoch": 985} {"train_loss": -37.57753372192383, "global_step": 119211, "epoch": 985} {"train_loss": -36.86408615112305, "global_step": 119212, "epoch": 985} {"train_loss": -38.54445266723633, "global_step": 119213, "epoch": 985} {"train_loss": -38.522491455078125, "global_step": 119214, "epoch": 985} {"train_loss": -38.842437744140625, "global_step": 119215, "epoch": 985} {"train_loss": -37.14301681518555, "global_step": 119216, "epoch": 985} {"train_loss": -37.09108352661133, "global_step": 119217, "epoch": 985} {"train_loss": -38.4284782409668, "global_step": 119218, "epoch": 985} {"train_loss": -38.395416259765625, "global_step": 119219, "epoch": 985} {"train_loss": -39.19085693359375, "global_step": 119220, "epoch": 985} {"train_loss": -37.97145080566406, "global_step": 119221, "epoch": 985} {"train_loss": -38.49363327026367, "global_step": 119222, "epoch": 985} {"train_loss": -38.4932975769043, "global_step": 119223, "epoch": 985} {"train_loss": -38.679405212402344, "global_step": 119224, "epoch": 985} {"train_loss": -37.56321334838867, "global_step": 119225, "epoch": 985} {"train_loss": -38.08079147338867, "global_step": 119226, "epoch": 985} {"train_loss": -39.04599380493164, "global_step": 119227, "epoch": 985} {"train_loss": -38.233089447021484, "global_step": 119228, "epoch": 985} {"train_loss": -38.459075927734375, "global_step": 119229, "epoch": 985} {"train_loss": -39.267547607421875, "global_step": 119230, "epoch": 985} {"train_loss": -38.496368408203125, "global_step": 119231, "epoch": 985} {"train_loss": -38.63981246948242, "global_step": 119232, "epoch": 985} {"train_loss": -34.10384750366211, "global_step": 119233, "epoch": 985} {"train_loss": -39.121253967285156, "global_step": 119234, "epoch": 985} {"train_loss": -38.2774658203125, "global_step": 119235, "epoch": 985} {"train_loss": -38.04753875732422, "global_step": 119236, "epoch": 985} {"train_loss": -38.311973571777344, "global_step": 119237, "epoch": 985} {"train_loss": -38.2312126159668, "global_step": 119238, "epoch": 985} {"train_loss": -38.81172561645508, "global_step": 119239, "epoch": 985} {"train_loss": -37.76313400268555, "global_step": 119240, "epoch": 985} {"train_loss": -38.14594650268555, "global_step": 119241, "epoch": 985} {"train_loss": -38.2266731262207, "global_step": 119242, "epoch": 985} {"train_loss": -38.096126556396484, "global_step": 119243, "epoch": 985} {"train_loss": -37.62982940673828, "global_step": 119244, "epoch": 985} {"train_loss": -37.99092483520508, "global_step": 119245, "epoch": 985} {"train_loss": -38.30757522583008, "global_step": 119246, "epoch": 985} {"train_loss": -36.09196090698242, "global_step": 119247, "epoch": 985} {"train_loss": -38.83315658569336, "global_step": 119248, "epoch": 985} {"train_loss": -38.41512680053711, "global_step": 119249, "epoch": 985} {"train_loss": -38.761451721191406, "global_step": 119250, "epoch": 985} {"train_loss": -37.64997482299805, "global_step": 119251, "epoch": 985} {"train_loss": -37.45667266845703, "global_step": 119252, "epoch": 985} {"train_loss": -38.851593017578125, "global_step": 119253, "epoch": 985} {"train_loss": -38.99211502075195, "global_step": 119254, "epoch": 985} {"train_loss": -38.87502670288086, "global_step": 119255, "epoch": 985} {"train_loss": -39.12090301513672, "global_step": 119256, "epoch": 985} {"train_loss": -39.325462341308594, "global_step": 119257, "epoch": 985} {"train_loss": -38.5377082824707, "global_step": 119258, "epoch": 985} {"train_loss": -38.771766662597656, "global_step": 119259, "epoch": 985} {"train_loss": -38.516845703125, "global_step": 119260, "epoch": 985} {"train_loss": -38.37567138671875, "global_step": 119261, "epoch": 985} {"train_loss": -39.35936737060547, "global_step": 119262, "epoch": 985} {"train_loss": -38.062294006347656, "global_step": 119263, "epoch": 985} {"train_loss": -38.612667083740234, "global_step": 119264, "epoch": 985} {"train_loss": -39.08701705932617, "global_step": 119265, "epoch": 985} {"train_loss": -38.34121322631836, "global_step": 119266, "epoch": 985} {"train_loss": -38.80430221557617, "global_step": 119267, "epoch": 985} {"train_loss": -38.88001251220703, "global_step": 119268, "epoch": 985} {"train_loss": -39.14064407348633, "global_step": 119269, "epoch": 985} {"train_loss": -38.93886184692383, "global_step": 119270, "epoch": 985} {"train_loss": -39.60683059692383, "global_step": 119271, "epoch": 985} {"train_loss": -39.14982986450195, "global_step": 119272, "epoch": 985} {"train_loss": -39.65791320800781, "global_step": 119273, "epoch": 985} {"train_loss": -39.24256134033203, "global_step": 119274, "epoch": 985} {"train_loss": -39.134368896484375, "global_step": 119275, "epoch": 985} {"train_loss": -38.547054290771484, "global_step": 119276, "epoch": 985} {"train_loss": -38.243377685546875, "global_step": 119277, "epoch": 985} {"train_loss": -39.723419189453125, "global_step": 119278, "epoch": 985} {"train_loss": -39.37373352050781, "global_step": 119279, "epoch": 985} {"train_loss": -39.7479133605957, "global_step": 119280, "epoch": 985} {"train_loss": -38.57331466674805, "global_step": 119281, "epoch": 985} {"train_loss": -39.09937286376953, "global_step": 119282, "epoch": 985} {"train_loss": -39.832374572753906, "global_step": 119283, "epoch": 985} {"train_loss": -38.94625473022461, "global_step": 119284, "epoch": 985} {"train_loss": -39.174217224121094, "global_step": 119285, "epoch": 985} {"train_loss": -38.02193832397461, "global_step": 119286, "epoch": 985} {"train_loss": -38.859554290771484, "global_step": 119287, "epoch": 985} {"train_loss": -38.37664031982422, "global_step": 119288, "epoch": 985} {"train_loss": -39.115570068359375, "global_step": 119289, "epoch": 985} {"train_loss": -38.41947555541992, "global_step": 119290, "epoch": 985} {"train_loss": -39.0195426940918, "global_step": 119291, "epoch": 985} {"train_loss": -39.219295501708984, "global_step": 119292, "epoch": 985} {"train_loss": -39.49968338012695, "global_step": 119293, "epoch": 985} {"train_loss": -38.469444274902344, "global_step": 119294, "epoch": 985} {"train_loss": -38.50936508178711, "global_step": 119295, "epoch": 985} {"train_loss": -38.92941665649414, "global_step": 119296, "epoch": 985} {"train_loss": -39.29303741455078, "global_step": 119297, "epoch": 985} {"train_loss": -39.083065032958984, "global_step": 119298, "epoch": 985} {"train_loss": -39.606441497802734, "global_step": 119299, "epoch": 985} {"train_loss": -38.36357498168945, "global_step": 119300, "epoch": 985} {"train_loss": -38.859771728515625, "global_step": 119301, "epoch": 985} {"train_loss": -39.39296340942383, "global_step": 119302, "epoch": 985} {"train_loss": -39.48077392578125, "global_step": 119303, "epoch": 985} {"train_loss": -40.00196075439453, "global_step": 119304, "epoch": 985} {"train_loss": -38.011505174242764, "global_step": 119305, "epoch": 985, "val_loss": 2925080.75} {"train_loss": -39.71635055541992, "global_step": 119306, "epoch": 986} {"train_loss": -39.77357864379883, "global_step": 119307, "epoch": 986} {"train_loss": -39.94175338745117, "global_step": 119308, "epoch": 986} {"train_loss": -39.277069091796875, "global_step": 119309, "epoch": 986} {"train_loss": -39.61725616455078, "global_step": 119310, "epoch": 986} {"train_loss": -38.16831588745117, "global_step": 119311, "epoch": 986} {"train_loss": -40.047645568847656, "global_step": 119312, "epoch": 986} {"train_loss": -39.99346923828125, "global_step": 119313, "epoch": 986} {"train_loss": -39.45207977294922, "global_step": 119314, "epoch": 986} {"train_loss": -39.72451400756836, "global_step": 119315, "epoch": 986} {"train_loss": -39.92816162109375, "global_step": 119316, "epoch": 986} {"train_loss": -39.162628173828125, "global_step": 119317, "epoch": 986} {"train_loss": -39.54094314575195, "global_step": 119318, "epoch": 986} {"train_loss": -40.22058868408203, "global_step": 119319, "epoch": 986} {"train_loss": -39.65398025512695, "global_step": 119320, "epoch": 986} {"train_loss": -39.94570541381836, "global_step": 119321, "epoch": 986} {"train_loss": -39.81242752075195, "global_step": 119322, "epoch": 986} {"train_loss": -39.67293167114258, "global_step": 119323, "epoch": 986} {"train_loss": -39.64618682861328, "global_step": 119324, "epoch": 986} {"train_loss": -38.340843200683594, "global_step": 119325, "epoch": 986} {"train_loss": -39.30766677856445, "global_step": 119326, "epoch": 986} {"train_loss": -39.02836990356445, "global_step": 119327, "epoch": 986} {"train_loss": -38.212982177734375, "global_step": 119328, "epoch": 986} {"train_loss": -38.76191329956055, "global_step": 119329, "epoch": 986} {"train_loss": -38.302608489990234, "global_step": 119330, "epoch": 986} {"train_loss": -37.45542526245117, "global_step": 119331, "epoch": 986} {"train_loss": -38.51807403564453, "global_step": 119332, "epoch": 986} {"train_loss": -40.286319732666016, "global_step": 119333, "epoch": 986} {"train_loss": -39.20747756958008, "global_step": 119334, "epoch": 986} {"train_loss": -38.034828186035156, "global_step": 119335, "epoch": 986} {"train_loss": -36.72553634643555, "global_step": 119336, "epoch": 986} {"train_loss": -29.89226722717285, "global_step": 119337, "epoch": 986} {"train_loss": -33.593170166015625, "global_step": 119338, "epoch": 986} {"train_loss": -37.336639404296875, "global_step": 119339, "epoch": 986} {"train_loss": -34.71638107299805, "global_step": 119340, "epoch": 986} {"train_loss": -35.35779571533203, "global_step": 119341, "epoch": 986} {"train_loss": -37.780025482177734, "global_step": 119342, "epoch": 986} {"train_loss": -36.67460250854492, "global_step": 119343, "epoch": 986} {"train_loss": -36.49846649169922, "global_step": 119344, "epoch": 986} {"train_loss": -36.2631721496582, "global_step": 119345, "epoch": 986} {"train_loss": -37.962772369384766, "global_step": 119346, "epoch": 986} {"train_loss": -37.127655029296875, "global_step": 119347, "epoch": 986} {"train_loss": -37.22673797607422, "global_step": 119348, "epoch": 986} {"train_loss": -37.214698791503906, "global_step": 119349, "epoch": 986} {"train_loss": -38.67034149169922, "global_step": 119350, "epoch": 986} {"train_loss": -35.96275329589844, "global_step": 119351, "epoch": 986} {"train_loss": -39.21588897705078, "global_step": 119352, "epoch": 986} {"train_loss": -35.43607711791992, "global_step": 119353, "epoch": 986} {"train_loss": -38.578712463378906, "global_step": 119354, "epoch": 986} {"train_loss": -37.74421310424805, "global_step": 119355, "epoch": 986} {"train_loss": -36.816749572753906, "global_step": 119356, "epoch": 986} {"train_loss": -38.929420471191406, "global_step": 119357, "epoch": 986} {"train_loss": -38.107173919677734, "global_step": 119358, "epoch": 986} {"train_loss": -38.00120544433594, "global_step": 119359, "epoch": 986} {"train_loss": -38.788204193115234, "global_step": 119360, "epoch": 986} {"train_loss": -37.655914306640625, "global_step": 119361, "epoch": 986} {"train_loss": -38.06370162963867, "global_step": 119362, "epoch": 986} {"train_loss": -39.1748046875, "global_step": 119363, "epoch": 986} {"train_loss": -38.16070556640625, "global_step": 119364, "epoch": 986} {"train_loss": -38.442100524902344, "global_step": 119365, "epoch": 986} {"train_loss": -38.9149284362793, "global_step": 119366, "epoch": 986} {"train_loss": -37.85049057006836, "global_step": 119367, "epoch": 986} {"train_loss": -38.790199279785156, "global_step": 119368, "epoch": 986} {"train_loss": -38.05990219116211, "global_step": 119369, "epoch": 986} {"train_loss": -39.47703170776367, "global_step": 119370, "epoch": 986} {"train_loss": -38.6979866027832, "global_step": 119371, "epoch": 986} {"train_loss": -38.6583366394043, "global_step": 119372, "epoch": 986} {"train_loss": -38.59968566894531, "global_step": 119373, "epoch": 986} {"train_loss": -39.03395462036133, "global_step": 119374, "epoch": 986} {"train_loss": -36.90439224243164, "global_step": 119375, "epoch": 986} {"train_loss": -38.43834686279297, "global_step": 119376, "epoch": 986} {"train_loss": -38.62038803100586, "global_step": 119377, "epoch": 986} {"train_loss": -38.9835205078125, "global_step": 119378, "epoch": 986} {"train_loss": -38.5236930847168, "global_step": 119379, "epoch": 986} {"train_loss": -39.27260971069336, "global_step": 119380, "epoch": 986} {"train_loss": -38.91228103637695, "global_step": 119381, "epoch": 986} {"train_loss": -39.50898361206055, "global_step": 119382, "epoch": 986} {"train_loss": -40.0927734375, "global_step": 119383, "epoch": 986} {"train_loss": -38.990028381347656, "global_step": 119384, "epoch": 986} {"train_loss": -39.15407180786133, "global_step": 119385, "epoch": 986} {"train_loss": -39.59919357299805, "global_step": 119386, "epoch": 986} {"train_loss": -39.31443405151367, "global_step": 119387, "epoch": 986} {"train_loss": -39.5118293762207, "global_step": 119388, "epoch": 986} {"train_loss": -39.39433288574219, "global_step": 119389, "epoch": 986} {"train_loss": -38.64280319213867, "global_step": 119390, "epoch": 986} {"train_loss": -40.005977630615234, "global_step": 119391, "epoch": 986} {"train_loss": -39.04104232788086, "global_step": 119392, "epoch": 986} {"train_loss": -38.87820053100586, "global_step": 119393, "epoch": 986} {"train_loss": -39.994441986083984, "global_step": 119394, "epoch": 986} {"train_loss": -39.361785888671875, "global_step": 119395, "epoch": 986} {"train_loss": -38.712677001953125, "global_step": 119396, "epoch": 986} {"train_loss": -39.388916015625, "global_step": 119397, "epoch": 986} {"train_loss": -38.6518440246582, "global_step": 119398, "epoch": 986} {"train_loss": -39.655513763427734, "global_step": 119399, "epoch": 986} {"train_loss": -38.9453239440918, "global_step": 119400, "epoch": 986} {"train_loss": -39.46329116821289, "global_step": 119401, "epoch": 986} {"train_loss": -38.981624603271484, "global_step": 119402, "epoch": 986} {"train_loss": -39.038936614990234, "global_step": 119403, "epoch": 986} {"train_loss": -39.6098518371582, "global_step": 119404, "epoch": 986} {"train_loss": -39.349857330322266, "global_step": 119405, "epoch": 986} {"train_loss": -39.084693908691406, "global_step": 119406, "epoch": 986} {"train_loss": -38.286983489990234, "global_step": 119407, "epoch": 986} {"train_loss": -38.55710220336914, "global_step": 119408, "epoch": 986} {"train_loss": -38.88359451293945, "global_step": 119409, "epoch": 986} {"train_loss": -40.005008697509766, "global_step": 119410, "epoch": 986} {"train_loss": -39.266639709472656, "global_step": 119411, "epoch": 986} {"train_loss": -38.0091667175293, "global_step": 119412, "epoch": 986} {"train_loss": -38.9644775390625, "global_step": 119413, "epoch": 986} {"train_loss": -39.7520751953125, "global_step": 119414, "epoch": 986} {"train_loss": -38.95659637451172, "global_step": 119415, "epoch": 986} {"train_loss": -38.920738220214844, "global_step": 119416, "epoch": 986} {"train_loss": -40.17084884643555, "global_step": 119417, "epoch": 986} {"train_loss": -39.743709564208984, "global_step": 119418, "epoch": 986} {"train_loss": -39.10081100463867, "global_step": 119419, "epoch": 986} {"train_loss": -38.69265365600586, "global_step": 119420, "epoch": 986} {"train_loss": -38.75208282470703, "global_step": 119421, "epoch": 986} {"train_loss": -39.95386505126953, "global_step": 119422, "epoch": 986} {"train_loss": -39.10590744018555, "global_step": 119423, "epoch": 986} {"train_loss": -39.38469696044922, "global_step": 119424, "epoch": 986} {"train_loss": -39.065147399902344, "global_step": 119425, "epoch": 986} {"train_loss": -38.615601988863354, "global_step": 119426, "epoch": 986, "val_loss": 2680340.0} {"train_loss": -39.31036376953125, "global_step": 119427, "epoch": 987} {"train_loss": -37.78322982788086, "global_step": 119428, "epoch": 987} {"train_loss": -36.851585388183594, "global_step": 119429, "epoch": 987} {"train_loss": -36.92177963256836, "global_step": 119430, "epoch": 987} {"train_loss": -38.18449783325195, "global_step": 119431, "epoch": 987} {"train_loss": -38.855384826660156, "global_step": 119432, "epoch": 987} {"train_loss": -38.93510818481445, "global_step": 119433, "epoch": 987} {"train_loss": -39.21230697631836, "global_step": 119434, "epoch": 987} {"train_loss": -37.887001037597656, "global_step": 119435, "epoch": 987} {"train_loss": -36.351261138916016, "global_step": 119436, "epoch": 987} {"train_loss": -36.802181243896484, "global_step": 119437, "epoch": 987} {"train_loss": -38.87451934814453, "global_step": 119438, "epoch": 987} {"train_loss": -38.54584503173828, "global_step": 119439, "epoch": 987} {"train_loss": -38.50753402709961, "global_step": 119440, "epoch": 987} {"train_loss": -36.57893371582031, "global_step": 119441, "epoch": 987} {"train_loss": -36.4143180847168, "global_step": 119442, "epoch": 987} {"train_loss": -39.46100616455078, "global_step": 119443, "epoch": 987} {"train_loss": -37.74156188964844, "global_step": 119444, "epoch": 987} {"train_loss": -37.63904571533203, "global_step": 119445, "epoch": 987} {"train_loss": -36.56226348876953, "global_step": 119446, "epoch": 987} {"train_loss": -37.61920166015625, "global_step": 119447, "epoch": 987} {"train_loss": -38.631507873535156, "global_step": 119448, "epoch": 987} {"train_loss": -38.566043853759766, "global_step": 119449, "epoch": 987} {"train_loss": -38.847774505615234, "global_step": 119450, "epoch": 987} {"train_loss": -37.87833786010742, "global_step": 119451, "epoch": 987} {"train_loss": -39.83098220825195, "global_step": 119452, "epoch": 987} {"train_loss": -37.7718620300293, "global_step": 119453, "epoch": 987} {"train_loss": -37.270484924316406, "global_step": 119454, "epoch": 987} {"train_loss": -39.3050422668457, "global_step": 119455, "epoch": 987} {"train_loss": -39.34498977661133, "global_step": 119456, "epoch": 987} {"train_loss": -39.152442932128906, "global_step": 119457, "epoch": 987} {"train_loss": -39.001258850097656, "global_step": 119458, "epoch": 987} {"train_loss": -39.061153411865234, "global_step": 119459, "epoch": 987} {"train_loss": -39.332603454589844, "global_step": 119460, "epoch": 987} {"train_loss": -38.55678939819336, "global_step": 119461, "epoch": 987} {"train_loss": -38.416160583496094, "global_step": 119462, "epoch": 987} {"train_loss": -39.4398078918457, "global_step": 119463, "epoch": 987} {"train_loss": -38.887542724609375, "global_step": 119464, "epoch": 987} {"train_loss": -39.51721954345703, "global_step": 119465, "epoch": 987} {"train_loss": -39.289764404296875, "global_step": 119466, "epoch": 987} {"train_loss": -39.52021408081055, "global_step": 119467, "epoch": 987} {"train_loss": -37.75234603881836, "global_step": 119468, "epoch": 987} {"train_loss": -39.13657760620117, "global_step": 119469, "epoch": 987} {"train_loss": -36.85334396362305, "global_step": 119470, "epoch": 987} {"train_loss": -38.35260772705078, "global_step": 119471, "epoch": 987} {"train_loss": -38.48942565917969, "global_step": 119472, "epoch": 987} {"train_loss": -38.06599044799805, "global_step": 119473, "epoch": 987} {"train_loss": -38.3936767578125, "global_step": 119474, "epoch": 987} {"train_loss": -38.464454650878906, "global_step": 119475, "epoch": 987} {"train_loss": -39.22031784057617, "global_step": 119476, "epoch": 987} {"train_loss": -38.437782287597656, "global_step": 119477, "epoch": 987} {"train_loss": -39.151607513427734, "global_step": 119478, "epoch": 987} {"train_loss": -37.3818473815918, "global_step": 119479, "epoch": 987} {"train_loss": -38.27238845825195, "global_step": 119480, "epoch": 987} {"train_loss": -39.01093673706055, "global_step": 119481, "epoch": 987} {"train_loss": -39.20579147338867, "global_step": 119482, "epoch": 987} {"train_loss": -38.81002426147461, "global_step": 119483, "epoch": 987} {"train_loss": -39.413246154785156, "global_step": 119484, "epoch": 987} {"train_loss": -38.34425735473633, "global_step": 119485, "epoch": 987} {"train_loss": -40.1453742980957, "global_step": 119486, "epoch": 987} {"train_loss": -38.278900146484375, "global_step": 119487, "epoch": 987} {"train_loss": -39.11528396606445, "global_step": 119488, "epoch": 987} {"train_loss": -38.33894729614258, "global_step": 119489, "epoch": 987} {"train_loss": -39.24357986450195, "global_step": 119490, "epoch": 987} {"train_loss": -39.29494857788086, "global_step": 119491, "epoch": 987} {"train_loss": -39.51580047607422, "global_step": 119492, "epoch": 987} {"train_loss": -39.5467414855957, "global_step": 119493, "epoch": 987} {"train_loss": -39.57184982299805, "global_step": 119494, "epoch": 987} {"train_loss": -39.16115188598633, "global_step": 119495, "epoch": 987} {"train_loss": -39.228755950927734, "global_step": 119496, "epoch": 987} {"train_loss": -39.642635345458984, "global_step": 119497, "epoch": 987} {"train_loss": -39.77101516723633, "global_step": 119498, "epoch": 987} {"train_loss": -39.588985443115234, "global_step": 119499, "epoch": 987} {"train_loss": -39.15900802612305, "global_step": 119500, "epoch": 987} {"train_loss": -38.46617889404297, "global_step": 119501, "epoch": 987} {"train_loss": -39.8121337890625, "global_step": 119502, "epoch": 987} {"train_loss": -38.790096282958984, "global_step": 119503, "epoch": 987} {"train_loss": -39.81393051147461, "global_step": 119504, "epoch": 987} {"train_loss": -39.85307693481445, "global_step": 119505, "epoch": 987} {"train_loss": -39.87101364135742, "global_step": 119506, "epoch": 987} {"train_loss": -39.787513732910156, "global_step": 119507, "epoch": 987} {"train_loss": -40.10383605957031, "global_step": 119508, "epoch": 987} {"train_loss": -39.51646423339844, "global_step": 119509, "epoch": 987} {"train_loss": -39.6445426940918, "global_step": 119510, "epoch": 987} {"train_loss": -39.39506149291992, "global_step": 119511, "epoch": 987} {"train_loss": -40.215057373046875, "global_step": 119512, "epoch": 987} {"train_loss": -40.006309509277344, "global_step": 119513, "epoch": 987} {"train_loss": -39.862667083740234, "global_step": 119514, "epoch": 987} {"train_loss": -39.265037536621094, "global_step": 119515, "epoch": 987} {"train_loss": -39.35593795776367, "global_step": 119516, "epoch": 987} {"train_loss": -39.36095428466797, "global_step": 119517, "epoch": 987} {"train_loss": -39.511756896972656, "global_step": 119518, "epoch": 987} {"train_loss": -38.12884521484375, "global_step": 119519, "epoch": 987} {"train_loss": -35.47248077392578, "global_step": 119520, "epoch": 987} {"train_loss": -22.981088638305664, "global_step": 119521, "epoch": 987} {"train_loss": 2.493593692779541, "global_step": 119522, "epoch": 987} {"train_loss": 3.01664662361145, "global_step": 119523, "epoch": 987} {"train_loss": -38.21126174926758, "global_step": 119524, "epoch": 987} {"train_loss": -11.131308555603027, "global_step": 119525, "epoch": 987} {"train_loss": -37.236358642578125, "global_step": 119526, "epoch": 987} {"train_loss": -19.29740333557129, "global_step": 119527, "epoch": 987} {"train_loss": -37.98392105102539, "global_step": 119528, "epoch": 987} {"train_loss": -19.852872848510742, "global_step": 119529, "epoch": 987} {"train_loss": -37.85982131958008, "global_step": 119530, "epoch": 987} {"train_loss": -25.874435424804688, "global_step": 119531, "epoch": 987} {"train_loss": -36.62190246582031, "global_step": 119532, "epoch": 987} {"train_loss": -35.83930587768555, "global_step": 119533, "epoch": 987} {"train_loss": -28.779356002807617, "global_step": 119534, "epoch": 987} {"train_loss": -37.514583587646484, "global_step": 119535, "epoch": 987} {"train_loss": -35.9951171875, "global_step": 119536, "epoch": 987} {"train_loss": -34.16785430908203, "global_step": 119537, "epoch": 987} {"train_loss": -37.069618225097656, "global_step": 119538, "epoch": 987} {"train_loss": -37.37491989135742, "global_step": 119539, "epoch": 987} {"train_loss": -36.078922271728516, "global_step": 119540, "epoch": 987} {"train_loss": -36.67610549926758, "global_step": 119541, "epoch": 987} {"train_loss": -37.89722442626953, "global_step": 119542, "epoch": 987} {"train_loss": -37.63326644897461, "global_step": 119543, "epoch": 987} {"train_loss": -37.2408332824707, "global_step": 119544, "epoch": 987} {"train_loss": -36.8385009765625, "global_step": 119545, "epoch": 987} {"train_loss": -38.15890884399414, "global_step": 119546, "epoch": 987} {"train_loss": -36.92178478122743, "global_step": 119547, "epoch": 987, "val_loss": 2636216.75} {"train_loss": -38.1066780090332, "global_step": 119548, "epoch": 988} {"train_loss": -36.68195343017578, "global_step": 119549, "epoch": 988} {"train_loss": -37.99574661254883, "global_step": 119550, "epoch": 988} {"train_loss": -38.15030288696289, "global_step": 119551, "epoch": 988} {"train_loss": -38.11542510986328, "global_step": 119552, "epoch": 988} {"train_loss": -37.72157669067383, "global_step": 119553, "epoch": 988} {"train_loss": -38.04384994506836, "global_step": 119554, "epoch": 988} {"train_loss": -38.298316955566406, "global_step": 119555, "epoch": 988} {"train_loss": -38.55116653442383, "global_step": 119556, "epoch": 988} {"train_loss": -38.07159423828125, "global_step": 119557, "epoch": 988} {"train_loss": -38.12604904174805, "global_step": 119558, "epoch": 988} {"train_loss": -38.60347366333008, "global_step": 119559, "epoch": 988} {"train_loss": -38.91264724731445, "global_step": 119560, "epoch": 988} {"train_loss": -39.15803146362305, "global_step": 119561, "epoch": 988} {"train_loss": -38.656517028808594, "global_step": 119562, "epoch": 988} {"train_loss": -39.253150939941406, "global_step": 119563, "epoch": 988} {"train_loss": -38.8636474609375, "global_step": 119564, "epoch": 988} {"train_loss": -39.38595962524414, "global_step": 119565, "epoch": 988} {"train_loss": -39.035125732421875, "global_step": 119566, "epoch": 988} {"train_loss": -38.907711029052734, "global_step": 119567, "epoch": 988} {"train_loss": -39.1591682434082, "global_step": 119568, "epoch": 988} {"train_loss": -39.268043518066406, "global_step": 119569, "epoch": 988} {"train_loss": -39.06826400756836, "global_step": 119570, "epoch": 988} {"train_loss": -39.22565460205078, "global_step": 119571, "epoch": 988} {"train_loss": -39.29012680053711, "global_step": 119572, "epoch": 988} {"train_loss": -38.72331619262695, "global_step": 119573, "epoch": 988} {"train_loss": -39.32479476928711, "global_step": 119574, "epoch": 988} {"train_loss": -39.050567626953125, "global_step": 119575, "epoch": 988} {"train_loss": -39.384765625, "global_step": 119576, "epoch": 988} {"train_loss": -38.94138717651367, "global_step": 119577, "epoch": 988} {"train_loss": -39.74677276611328, "global_step": 119578, "epoch": 988} {"train_loss": -39.7048225402832, "global_step": 119579, "epoch": 988} {"train_loss": -39.937435150146484, "global_step": 119580, "epoch": 988} {"train_loss": -39.591064453125, "global_step": 119581, "epoch": 988} {"train_loss": -39.81974411010742, "global_step": 119582, "epoch": 988} {"train_loss": -39.72234344482422, "global_step": 119583, "epoch": 988} {"train_loss": -39.3166389465332, "global_step": 119584, "epoch": 988} {"train_loss": -39.65558624267578, "global_step": 119585, "epoch": 988} {"train_loss": -39.871742248535156, "global_step": 119586, "epoch": 988} {"train_loss": -39.685829162597656, "global_step": 119587, "epoch": 988} {"train_loss": -39.8859748840332, "global_step": 119588, "epoch": 988} {"train_loss": -39.96923065185547, "global_step": 119589, "epoch": 988} {"train_loss": -40.149879455566406, "global_step": 119590, "epoch": 988} {"train_loss": -39.64300537109375, "global_step": 119591, "epoch": 988} {"train_loss": -39.99274826049805, "global_step": 119592, "epoch": 988} {"train_loss": -39.69295883178711, "global_step": 119593, "epoch": 988} {"train_loss": -40.08175277709961, "global_step": 119594, "epoch": 988} {"train_loss": -39.759090423583984, "global_step": 119595, "epoch": 988} {"train_loss": -39.945472717285156, "global_step": 119596, "epoch": 988} {"train_loss": -40.2276611328125, "global_step": 119597, "epoch": 988} {"train_loss": -40.24343490600586, "global_step": 119598, "epoch": 988} {"train_loss": -40.169036865234375, "global_step": 119599, "epoch": 988} {"train_loss": -40.295806884765625, "global_step": 119600, "epoch": 988} {"train_loss": -40.53782272338867, "global_step": 119601, "epoch": 988} {"train_loss": -39.947322845458984, "global_step": 119602, "epoch": 988} {"train_loss": -40.298179626464844, "global_step": 119603, "epoch": 988} {"train_loss": -40.13602828979492, "global_step": 119604, "epoch": 988} {"train_loss": -40.18513870239258, "global_step": 119605, "epoch": 988} {"train_loss": -39.933956146240234, "global_step": 119606, "epoch": 988} {"train_loss": -40.626155853271484, "global_step": 119607, "epoch": 988} {"train_loss": -39.5445671081543, "global_step": 119608, "epoch": 988} {"train_loss": -39.82297897338867, "global_step": 119609, "epoch": 988} {"train_loss": -37.6848030090332, "global_step": 119610, "epoch": 988} {"train_loss": -38.6755256652832, "global_step": 119611, "epoch": 988} {"train_loss": -39.70841598510742, "global_step": 119612, "epoch": 988} {"train_loss": -39.88279342651367, "global_step": 119613, "epoch": 988} {"train_loss": -40.043678283691406, "global_step": 119614, "epoch": 988} {"train_loss": -38.353057861328125, "global_step": 119615, "epoch": 988} {"train_loss": -36.288360595703125, "global_step": 119616, "epoch": 988} {"train_loss": -35.68044662475586, "global_step": 119617, "epoch": 988} {"train_loss": -35.903358459472656, "global_step": 119618, "epoch": 988} {"train_loss": -38.227691650390625, "global_step": 119619, "epoch": 988} {"train_loss": -36.4704704284668, "global_step": 119620, "epoch": 988} {"train_loss": -33.246681213378906, "global_step": 119621, "epoch": 988} {"train_loss": -33.68783950805664, "global_step": 119622, "epoch": 988} {"train_loss": -38.68052673339844, "global_step": 119623, "epoch": 988} {"train_loss": -38.066131591796875, "global_step": 119624, "epoch": 988} {"train_loss": -36.42707443237305, "global_step": 119625, "epoch": 988} {"train_loss": -37.9178466796875, "global_step": 119626, "epoch": 988} {"train_loss": -38.13751220703125, "global_step": 119627, "epoch": 988} {"train_loss": -37.99394607543945, "global_step": 119628, "epoch": 988} {"train_loss": -38.30585861206055, "global_step": 119629, "epoch": 988} {"train_loss": -37.73317337036133, "global_step": 119630, "epoch": 988} {"train_loss": -37.61206817626953, "global_step": 119631, "epoch": 988} {"train_loss": -37.84928894042969, "global_step": 119632, "epoch": 988} {"train_loss": -38.25319290161133, "global_step": 119633, "epoch": 988} {"train_loss": -36.858150482177734, "global_step": 119634, "epoch": 988} {"train_loss": -37.611080169677734, "global_step": 119635, "epoch": 988} {"train_loss": -37.74962615966797, "global_step": 119636, "epoch": 988} {"train_loss": -38.415077209472656, "global_step": 119637, "epoch": 988} {"train_loss": -39.05908966064453, "global_step": 119638, "epoch": 988} {"train_loss": -38.92123031616211, "global_step": 119639, "epoch": 988} {"train_loss": -39.24241256713867, "global_step": 119640, "epoch": 988} {"train_loss": -38.958885192871094, "global_step": 119641, "epoch": 988} {"train_loss": -38.203826904296875, "global_step": 119642, "epoch": 988} {"train_loss": -39.040985107421875, "global_step": 119643, "epoch": 988} {"train_loss": -39.08692169189453, "global_step": 119644, "epoch": 988} {"train_loss": -38.288726806640625, "global_step": 119645, "epoch": 988} {"train_loss": -38.74538040161133, "global_step": 119646, "epoch": 988} {"train_loss": -38.50511169433594, "global_step": 119647, "epoch": 988} {"train_loss": -38.218196868896484, "global_step": 119648, "epoch": 988} {"train_loss": -38.99166488647461, "global_step": 119649, "epoch": 988} {"train_loss": -38.24396896362305, "global_step": 119650, "epoch": 988} {"train_loss": -37.0755500793457, "global_step": 119651, "epoch": 988} {"train_loss": -39.00746536254883, "global_step": 119652, "epoch": 988} {"train_loss": -38.70949172973633, "global_step": 119653, "epoch": 988} {"train_loss": -38.53987121582031, "global_step": 119654, "epoch": 988} {"train_loss": -38.904541015625, "global_step": 119655, "epoch": 988} {"train_loss": -39.09685134887695, "global_step": 119656, "epoch": 988} {"train_loss": -39.03016662597656, "global_step": 119657, "epoch": 988} {"train_loss": -38.726806640625, "global_step": 119658, "epoch": 988} {"train_loss": -38.804561614990234, "global_step": 119659, "epoch": 988} {"train_loss": -39.25492477416992, "global_step": 119660, "epoch": 988} {"train_loss": -38.771026611328125, "global_step": 119661, "epoch": 988} {"train_loss": -38.7705192565918, "global_step": 119662, "epoch": 988} {"train_loss": -39.17279815673828, "global_step": 119663, "epoch": 988} {"train_loss": -38.57978439331055, "global_step": 119664, "epoch": 988} {"train_loss": -38.785457611083984, "global_step": 119665, "epoch": 988} {"train_loss": -38.93803024291992, "global_step": 119666, "epoch": 988} {"train_loss": -39.48476028442383, "global_step": 119667, "epoch": 988} {"train_loss": -38.77418874314994, "global_step": 119668, "epoch": 988, "val_loss": 2720230.0} {"train_loss": -39.107173919677734, "global_step": 119669, "epoch": 989} {"train_loss": -39.22365951538086, "global_step": 119670, "epoch": 989} {"train_loss": -39.42780685424805, "global_step": 119671, "epoch": 989} {"train_loss": -39.67822265625, "global_step": 119672, "epoch": 989} {"train_loss": -39.275428771972656, "global_step": 119673, "epoch": 989} {"train_loss": -39.19977951049805, "global_step": 119674, "epoch": 989} {"train_loss": -39.32038879394531, "global_step": 119675, "epoch": 989} {"train_loss": -38.994197845458984, "global_step": 119676, "epoch": 989} {"train_loss": -39.352325439453125, "global_step": 119677, "epoch": 989} {"train_loss": -39.67255401611328, "global_step": 119678, "epoch": 989} {"train_loss": -38.64488983154297, "global_step": 119679, "epoch": 989} {"train_loss": -39.58039474487305, "global_step": 119680, "epoch": 989} {"train_loss": -39.43134689331055, "global_step": 119681, "epoch": 989} {"train_loss": -39.512943267822266, "global_step": 119682, "epoch": 989} {"train_loss": -39.2111701965332, "global_step": 119683, "epoch": 989} {"train_loss": -39.39632797241211, "global_step": 119684, "epoch": 989} {"train_loss": -39.40510559082031, "global_step": 119685, "epoch": 989} {"train_loss": -38.441410064697266, "global_step": 119686, "epoch": 989} {"train_loss": -39.051971435546875, "global_step": 119687, "epoch": 989} {"train_loss": -39.377838134765625, "global_step": 119688, "epoch": 989} {"train_loss": -38.844154357910156, "global_step": 119689, "epoch": 989} {"train_loss": -38.3006706237793, "global_step": 119690, "epoch": 989} {"train_loss": -39.59842300415039, "global_step": 119691, "epoch": 989} {"train_loss": -38.56850051879883, "global_step": 119692, "epoch": 989} {"train_loss": -37.55131912231445, "global_step": 119693, "epoch": 989} {"train_loss": -39.16021728515625, "global_step": 119694, "epoch": 989} {"train_loss": -38.960662841796875, "global_step": 119695, "epoch": 989} {"train_loss": -39.1596565246582, "global_step": 119696, "epoch": 989} {"train_loss": -39.332759857177734, "global_step": 119697, "epoch": 989} {"train_loss": -39.39391326904297, "global_step": 119698, "epoch": 989} {"train_loss": -39.728416442871094, "global_step": 119699, "epoch": 989} {"train_loss": -39.19819259643555, "global_step": 119700, "epoch": 989} {"train_loss": -39.63297653198242, "global_step": 119701, "epoch": 989} {"train_loss": -39.60165786743164, "global_step": 119702, "epoch": 989} {"train_loss": -38.862098693847656, "global_step": 119703, "epoch": 989} {"train_loss": -38.53699493408203, "global_step": 119704, "epoch": 989} {"train_loss": -38.575477600097656, "global_step": 119705, "epoch": 989} {"train_loss": -39.62778091430664, "global_step": 119706, "epoch": 989} {"train_loss": -39.85221481323242, "global_step": 119707, "epoch": 989} {"train_loss": -39.668785095214844, "global_step": 119708, "epoch": 989} {"train_loss": -39.75010299682617, "global_step": 119709, "epoch": 989} {"train_loss": -39.63091278076172, "global_step": 119710, "epoch": 989} {"train_loss": -38.23875045776367, "global_step": 119711, "epoch": 989} {"train_loss": -36.64227294921875, "global_step": 119712, "epoch": 989} {"train_loss": -38.00490188598633, "global_step": 119713, "epoch": 989} {"train_loss": -38.01335525512695, "global_step": 119714, "epoch": 989} {"train_loss": -37.87802505493164, "global_step": 119715, "epoch": 989} {"train_loss": -38.82322311401367, "global_step": 119716, "epoch": 989} {"train_loss": -39.28261947631836, "global_step": 119717, "epoch": 989} {"train_loss": -38.817970275878906, "global_step": 119718, "epoch": 989} {"train_loss": -38.18011474609375, "global_step": 119719, "epoch": 989} {"train_loss": -39.52991485595703, "global_step": 119720, "epoch": 989} {"train_loss": -39.02870559692383, "global_step": 119721, "epoch": 989} {"train_loss": -38.19203567504883, "global_step": 119722, "epoch": 989} {"train_loss": -37.99668502807617, "global_step": 119723, "epoch": 989} {"train_loss": -39.342018127441406, "global_step": 119724, "epoch": 989} {"train_loss": -39.29548263549805, "global_step": 119725, "epoch": 989} {"train_loss": -38.97298049926758, "global_step": 119726, "epoch": 989} {"train_loss": -39.40359115600586, "global_step": 119727, "epoch": 989} {"train_loss": -37.26455307006836, "global_step": 119728, "epoch": 989} {"train_loss": -39.3609733581543, "global_step": 119729, "epoch": 989} {"train_loss": -40.111759185791016, "global_step": 119730, "epoch": 989} {"train_loss": -38.1604118347168, "global_step": 119731, "epoch": 989} {"train_loss": -39.087646484375, "global_step": 119732, "epoch": 989} {"train_loss": -38.59716796875, "global_step": 119733, "epoch": 989} {"train_loss": -40.17734909057617, "global_step": 119734, "epoch": 989} {"train_loss": -38.97901153564453, "global_step": 119735, "epoch": 989} {"train_loss": -40.14768981933594, "global_step": 119736, "epoch": 989} {"train_loss": -38.87687301635742, "global_step": 119737, "epoch": 989} {"train_loss": -38.488826751708984, "global_step": 119738, "epoch": 989} {"train_loss": -39.124183654785156, "global_step": 119739, "epoch": 989} {"train_loss": -39.07822799682617, "global_step": 119740, "epoch": 989} {"train_loss": -40.31034469604492, "global_step": 119741, "epoch": 989} {"train_loss": -38.943294525146484, "global_step": 119742, "epoch": 989} {"train_loss": -39.40932846069336, "global_step": 119743, "epoch": 989} {"train_loss": -39.123252868652344, "global_step": 119744, "epoch": 989} {"train_loss": -40.094661712646484, "global_step": 119745, "epoch": 989} {"train_loss": -39.36359405517578, "global_step": 119746, "epoch": 989} {"train_loss": -38.83976364135742, "global_step": 119747, "epoch": 989} {"train_loss": -39.62234115600586, "global_step": 119748, "epoch": 989} {"train_loss": -39.003841400146484, "global_step": 119749, "epoch": 989} {"train_loss": -39.981693267822266, "global_step": 119750, "epoch": 989} {"train_loss": -39.44529724121094, "global_step": 119751, "epoch": 989} {"train_loss": -39.41056442260742, "global_step": 119752, "epoch": 989} {"train_loss": -39.391353607177734, "global_step": 119753, "epoch": 989} {"train_loss": -39.20067596435547, "global_step": 119754, "epoch": 989} {"train_loss": -39.81369400024414, "global_step": 119755, "epoch": 989} {"train_loss": -39.0820426940918, "global_step": 119756, "epoch": 989} {"train_loss": -38.0670166015625, "global_step": 119757, "epoch": 989} {"train_loss": -38.99883270263672, "global_step": 119758, "epoch": 989} {"train_loss": -39.42607498168945, "global_step": 119759, "epoch": 989} {"train_loss": -38.33858871459961, "global_step": 119760, "epoch": 989} {"train_loss": -38.074012756347656, "global_step": 119761, "epoch": 989} {"train_loss": -38.4309196472168, "global_step": 119762, "epoch": 989} {"train_loss": -34.77419662475586, "global_step": 119763, "epoch": 989} {"train_loss": -35.21923828125, "global_step": 119764, "epoch": 989} {"train_loss": -39.085060119628906, "global_step": 119765, "epoch": 989} {"train_loss": -39.180633544921875, "global_step": 119766, "epoch": 989} {"train_loss": -36.14495849609375, "global_step": 119767, "epoch": 989} {"train_loss": -36.611690521240234, "global_step": 119768, "epoch": 989} {"train_loss": -37.563072204589844, "global_step": 119769, "epoch": 989} {"train_loss": -39.529605865478516, "global_step": 119770, "epoch": 989} {"train_loss": -38.30649948120117, "global_step": 119771, "epoch": 989} {"train_loss": -37.25770950317383, "global_step": 119772, "epoch": 989} {"train_loss": -38.23203659057617, "global_step": 119773, "epoch": 989} {"train_loss": -39.018123626708984, "global_step": 119774, "epoch": 989} {"train_loss": -38.63294982910156, "global_step": 119775, "epoch": 989} {"train_loss": -37.505741119384766, "global_step": 119776, "epoch": 989} {"train_loss": -39.207881927490234, "global_step": 119777, "epoch": 989} {"train_loss": -39.62647247314453, "global_step": 119778, "epoch": 989} {"train_loss": -39.51618576049805, "global_step": 119779, "epoch": 989} {"train_loss": -39.94768142700195, "global_step": 119780, "epoch": 989} {"train_loss": -39.56344223022461, "global_step": 119781, "epoch": 989} {"train_loss": -39.77214431762695, "global_step": 119782, "epoch": 989} {"train_loss": -39.561614990234375, "global_step": 119783, "epoch": 989} {"train_loss": -39.53903579711914, "global_step": 119784, "epoch": 989} {"train_loss": -39.24501419067383, "global_step": 119785, "epoch": 989} {"train_loss": -39.932186126708984, "global_step": 119786, "epoch": 989} {"train_loss": -39.62824630737305, "global_step": 119787, "epoch": 989} {"train_loss": -39.29458999633789, "global_step": 119788, "epoch": 989} {"train_loss": -38.952724488313535, "global_step": 119789, "epoch": 989, "val_loss": 2642896.75} {"train_loss": -40.074127197265625, "global_step": 119790, "epoch": 990} {"train_loss": -40.00053024291992, "global_step": 119791, "epoch": 990} {"train_loss": -39.19068908691406, "global_step": 119792, "epoch": 990} {"train_loss": -38.09766387939453, "global_step": 119793, "epoch": 990} {"train_loss": -37.459022521972656, "global_step": 119794, "epoch": 990} {"train_loss": -39.65812301635742, "global_step": 119795, "epoch": 990} {"train_loss": -39.29810333251953, "global_step": 119796, "epoch": 990} {"train_loss": -36.573219299316406, "global_step": 119797, "epoch": 990} {"train_loss": -36.476104736328125, "global_step": 119798, "epoch": 990} {"train_loss": -40.03453826904297, "global_step": 119799, "epoch": 990} {"train_loss": -38.80471420288086, "global_step": 119800, "epoch": 990} {"train_loss": -39.33217239379883, "global_step": 119801, "epoch": 990} {"train_loss": -39.893733978271484, "global_step": 119802, "epoch": 990} {"train_loss": -37.76697540283203, "global_step": 119803, "epoch": 990} {"train_loss": -39.20029830932617, "global_step": 119804, "epoch": 990} {"train_loss": -39.60017776489258, "global_step": 119805, "epoch": 990} {"train_loss": -39.07733917236328, "global_step": 119806, "epoch": 990} {"train_loss": -39.69354248046875, "global_step": 119807, "epoch": 990} {"train_loss": -39.066162109375, "global_step": 119808, "epoch": 990} {"train_loss": -38.85309600830078, "global_step": 119809, "epoch": 990} {"train_loss": -39.83584213256836, "global_step": 119810, "epoch": 990} {"train_loss": -39.5234489440918, "global_step": 119811, "epoch": 990} {"train_loss": -39.86642074584961, "global_step": 119812, "epoch": 990} {"train_loss": -40.102081298828125, "global_step": 119813, "epoch": 990} {"train_loss": -40.07411193847656, "global_step": 119814, "epoch": 990} {"train_loss": -40.01576614379883, "global_step": 119815, "epoch": 990} {"train_loss": -40.05385208129883, "global_step": 119816, "epoch": 990} {"train_loss": -40.27916717529297, "global_step": 119817, "epoch": 990} {"train_loss": -40.05172348022461, "global_step": 119818, "epoch": 990} {"train_loss": -40.2115592956543, "global_step": 119819, "epoch": 990} {"train_loss": -40.2282600402832, "global_step": 119820, "epoch": 990} {"train_loss": -39.7496452331543, "global_step": 119821, "epoch": 990} {"train_loss": -40.407264709472656, "global_step": 119822, "epoch": 990} {"train_loss": -39.92716598510742, "global_step": 119823, "epoch": 990} {"train_loss": -40.12575149536133, "global_step": 119824, "epoch": 990} {"train_loss": -39.69841766357422, "global_step": 119825, "epoch": 990} {"train_loss": -40.36670684814453, "global_step": 119826, "epoch": 990} {"train_loss": -40.03456497192383, "global_step": 119827, "epoch": 990} {"train_loss": -40.44865036010742, "global_step": 119828, "epoch": 990} {"train_loss": -40.389381408691406, "global_step": 119829, "epoch": 990} {"train_loss": -40.0576057434082, "global_step": 119830, "epoch": 990} {"train_loss": -40.54724884033203, "global_step": 119831, "epoch": 990} {"train_loss": -39.928565979003906, "global_step": 119832, "epoch": 990} {"train_loss": -38.60487747192383, "global_step": 119833, "epoch": 990} {"train_loss": -35.95783615112305, "global_step": 119834, "epoch": 990} {"train_loss": -37.20881652832031, "global_step": 119835, "epoch": 990} {"train_loss": -38.73139572143555, "global_step": 119836, "epoch": 990} {"train_loss": -38.883968353271484, "global_step": 119837, "epoch": 990} {"train_loss": -39.2881965637207, "global_step": 119838, "epoch": 990} {"train_loss": -37.801204681396484, "global_step": 119839, "epoch": 990} {"train_loss": -38.75238800048828, "global_step": 119840, "epoch": 990} {"train_loss": -39.35841369628906, "global_step": 119841, "epoch": 990} {"train_loss": -38.306396484375, "global_step": 119842, "epoch": 990} {"train_loss": -37.7651481628418, "global_step": 119843, "epoch": 990} {"train_loss": -38.19635772705078, "global_step": 119844, "epoch": 990} {"train_loss": -39.525936126708984, "global_step": 119845, "epoch": 990} {"train_loss": -37.657649993896484, "global_step": 119846, "epoch": 990} {"train_loss": -36.20541000366211, "global_step": 119847, "epoch": 990} {"train_loss": -38.58586120605469, "global_step": 119848, "epoch": 990} {"train_loss": -38.89022445678711, "global_step": 119849, "epoch": 990} {"train_loss": -37.194454193115234, "global_step": 119850, "epoch": 990} {"train_loss": -38.194129943847656, "global_step": 119851, "epoch": 990} {"train_loss": -37.851009368896484, "global_step": 119852, "epoch": 990} {"train_loss": -37.70272445678711, "global_step": 119853, "epoch": 990} {"train_loss": -38.68671798706055, "global_step": 119854, "epoch": 990} {"train_loss": -37.35209274291992, "global_step": 119855, "epoch": 990} {"train_loss": -38.54964828491211, "global_step": 119856, "epoch": 990} {"train_loss": -38.242740631103516, "global_step": 119857, "epoch": 990} {"train_loss": -38.35763931274414, "global_step": 119858, "epoch": 990} {"train_loss": -36.818748474121094, "global_step": 119859, "epoch": 990} {"train_loss": -39.193328857421875, "global_step": 119860, "epoch": 990} {"train_loss": -37.714141845703125, "global_step": 119861, "epoch": 990} {"train_loss": -38.43976974487305, "global_step": 119862, "epoch": 990} {"train_loss": -38.893402099609375, "global_step": 119863, "epoch": 990} {"train_loss": -37.94014358520508, "global_step": 119864, "epoch": 990} {"train_loss": -38.826351165771484, "global_step": 119865, "epoch": 990} {"train_loss": -38.20867919921875, "global_step": 119866, "epoch": 990} {"train_loss": -39.15877151489258, "global_step": 119867, "epoch": 990} {"train_loss": -39.33224105834961, "global_step": 119868, "epoch": 990} {"train_loss": -38.90886306762695, "global_step": 119869, "epoch": 990} {"train_loss": -38.67295455932617, "global_step": 119870, "epoch": 990} {"train_loss": -38.29641342163086, "global_step": 119871, "epoch": 990} {"train_loss": -38.120243072509766, "global_step": 119872, "epoch": 990} {"train_loss": -39.1444091796875, "global_step": 119873, "epoch": 990} {"train_loss": -37.23285675048828, "global_step": 119874, "epoch": 990} {"train_loss": -39.17350387573242, "global_step": 119875, "epoch": 990} {"train_loss": -37.804683685302734, "global_step": 119876, "epoch": 990} {"train_loss": -38.9617919921875, "global_step": 119877, "epoch": 990} {"train_loss": -39.6142692565918, "global_step": 119878, "epoch": 990} {"train_loss": -38.963722229003906, "global_step": 119879, "epoch": 990} {"train_loss": -39.272247314453125, "global_step": 119880, "epoch": 990} {"train_loss": -38.88861846923828, "global_step": 119881, "epoch": 990} {"train_loss": -39.3754768371582, "global_step": 119882, "epoch": 990} {"train_loss": -38.94997787475586, "global_step": 119883, "epoch": 990} {"train_loss": -39.32416534423828, "global_step": 119884, "epoch": 990} {"train_loss": -38.86304473876953, "global_step": 119885, "epoch": 990} {"train_loss": -37.39325714111328, "global_step": 119886, "epoch": 990} {"train_loss": -38.562313079833984, "global_step": 119887, "epoch": 990} {"train_loss": -39.55364990234375, "global_step": 119888, "epoch": 990} {"train_loss": -38.59708786010742, "global_step": 119889, "epoch": 990} {"train_loss": -39.97373962402344, "global_step": 119890, "epoch": 990} {"train_loss": -38.28061294555664, "global_step": 119891, "epoch": 990} {"train_loss": -38.9956169128418, "global_step": 119892, "epoch": 990} {"train_loss": -38.59511947631836, "global_step": 119893, "epoch": 990} {"train_loss": -37.16461181640625, "global_step": 119894, "epoch": 990} {"train_loss": -38.69906997680664, "global_step": 119895, "epoch": 990} {"train_loss": -39.567203521728516, "global_step": 119896, "epoch": 990} {"train_loss": -39.126258850097656, "global_step": 119897, "epoch": 990} {"train_loss": -38.930946350097656, "global_step": 119898, "epoch": 990} {"train_loss": -39.44793701171875, "global_step": 119899, "epoch": 990} {"train_loss": -39.46100997924805, "global_step": 119900, "epoch": 990} {"train_loss": -39.51723098754883, "global_step": 119901, "epoch": 990} {"train_loss": -39.35837936401367, "global_step": 119902, "epoch": 990} {"train_loss": -39.270931243896484, "global_step": 119903, "epoch": 990} {"train_loss": -39.37672424316406, "global_step": 119904, "epoch": 990} {"train_loss": -40.25917434692383, "global_step": 119905, "epoch": 990} {"train_loss": -33.69181823730469, "global_step": 119906, "epoch": 990} {"train_loss": -39.19934844970703, "global_step": 119907, "epoch": 990} {"train_loss": -38.51087951660156, "global_step": 119908, "epoch": 990} {"train_loss": -37.00954818725586, "global_step": 119909, "epoch": 990} {"train_loss": -38.821177458960165, "global_step": 119910, "epoch": 990, "val_loss": 2656920.0} {"train_loss": -38.130130767822266, "global_step": 119911, "epoch": 991} {"train_loss": -29.027311325073242, "global_step": 119912, "epoch": 991} {"train_loss": -31.239944458007812, "global_step": 119913, "epoch": 991} {"train_loss": -25.1344051361084, "global_step": 119914, "epoch": 991} {"train_loss": -32.72936248779297, "global_step": 119915, "epoch": 991} {"train_loss": -27.472076416015625, "global_step": 119916, "epoch": 991} {"train_loss": -29.65054702758789, "global_step": 119917, "epoch": 991} {"train_loss": -31.316211700439453, "global_step": 119918, "epoch": 991} {"train_loss": -28.09004783630371, "global_step": 119919, "epoch": 991} {"train_loss": -32.4122428894043, "global_step": 119920, "epoch": 991} {"train_loss": -32.657100677490234, "global_step": 119921, "epoch": 991} {"train_loss": -28.550878524780273, "global_step": 119922, "epoch": 991} {"train_loss": -30.855321884155273, "global_step": 119923, "epoch": 991} {"train_loss": -25.57071304321289, "global_step": 119924, "epoch": 991} {"train_loss": -22.120901107788086, "global_step": 119925, "epoch": 991} {"train_loss": -31.478063583374023, "global_step": 119926, "epoch": 991} {"train_loss": -30.994842529296875, "global_step": 119927, "epoch": 991} {"train_loss": -35.431488037109375, "global_step": 119928, "epoch": 991} {"train_loss": -35.3247184753418, "global_step": 119929, "epoch": 991} {"train_loss": -33.37351608276367, "global_step": 119930, "epoch": 991} {"train_loss": -35.47713851928711, "global_step": 119931, "epoch": 991} {"train_loss": -32.9393310546875, "global_step": 119932, "epoch": 991} {"train_loss": -34.31024932861328, "global_step": 119933, "epoch": 991} {"train_loss": -33.80559158325195, "global_step": 119934, "epoch": 991} {"train_loss": -33.8144645690918, "global_step": 119935, "epoch": 991} {"train_loss": -34.99292755126953, "global_step": 119936, "epoch": 991} {"train_loss": -34.472023010253906, "global_step": 119937, "epoch": 991} {"train_loss": -32.82198715209961, "global_step": 119938, "epoch": 991} {"train_loss": -34.71240997314453, "global_step": 119939, "epoch": 991} {"train_loss": -35.41624069213867, "global_step": 119940, "epoch": 991} {"train_loss": -35.916236877441406, "global_step": 119941, "epoch": 991} {"train_loss": -33.51887130737305, "global_step": 119942, "epoch": 991} {"train_loss": -36.076210021972656, "global_step": 119943, "epoch": 991} {"train_loss": -34.632930755615234, "global_step": 119944, "epoch": 991} {"train_loss": -34.82890701293945, "global_step": 119945, "epoch": 991} {"train_loss": -35.5517692565918, "global_step": 119946, "epoch": 991} {"train_loss": -35.84040069580078, "global_step": 119947, "epoch": 991} {"train_loss": -35.336673736572266, "global_step": 119948, "epoch": 991} {"train_loss": -36.546878814697266, "global_step": 119949, "epoch": 991} {"train_loss": -35.55435562133789, "global_step": 119950, "epoch": 991} {"train_loss": -35.838714599609375, "global_step": 119951, "epoch": 991} {"train_loss": -35.41828155517578, "global_step": 119952, "epoch": 991} {"train_loss": -35.54704666137695, "global_step": 119953, "epoch": 991} {"train_loss": -36.53623580932617, "global_step": 119954, "epoch": 991} {"train_loss": -36.64859390258789, "global_step": 119955, "epoch": 991} {"train_loss": -36.7637939453125, "global_step": 119956, "epoch": 991} {"train_loss": -36.52463912963867, "global_step": 119957, "epoch": 991} {"train_loss": -36.6551628112793, "global_step": 119958, "epoch": 991} {"train_loss": -36.194454193115234, "global_step": 119959, "epoch": 991} {"train_loss": -36.14408874511719, "global_step": 119960, "epoch": 991} {"train_loss": -36.73276901245117, "global_step": 119961, "epoch": 991} {"train_loss": -35.30617904663086, "global_step": 119962, "epoch": 991} {"train_loss": -36.358333587646484, "global_step": 119963, "epoch": 991} {"train_loss": -37.28348922729492, "global_step": 119964, "epoch": 991} {"train_loss": -36.592952728271484, "global_step": 119965, "epoch": 991} {"train_loss": -36.68468475341797, "global_step": 119966, "epoch": 991} {"train_loss": -37.20447540283203, "global_step": 119967, "epoch": 991} {"train_loss": -36.99957275390625, "global_step": 119968, "epoch": 991} {"train_loss": -35.90366744995117, "global_step": 119969, "epoch": 991} {"train_loss": -36.72792434692383, "global_step": 119970, "epoch": 991} {"train_loss": -37.16725158691406, "global_step": 119971, "epoch": 991} {"train_loss": -36.42420196533203, "global_step": 119972, "epoch": 991} {"train_loss": -37.83652877807617, "global_step": 119973, "epoch": 991} {"train_loss": -36.92422103881836, "global_step": 119974, "epoch": 991} {"train_loss": -37.57526779174805, "global_step": 119975, "epoch": 991} {"train_loss": -36.98603820800781, "global_step": 119976, "epoch": 991} {"train_loss": -37.10433578491211, "global_step": 119977, "epoch": 991} {"train_loss": -37.35010528564453, "global_step": 119978, "epoch": 991} {"train_loss": -37.014339447021484, "global_step": 119979, "epoch": 991} {"train_loss": -38.38240432739258, "global_step": 119980, "epoch": 991} {"train_loss": -37.480499267578125, "global_step": 119981, "epoch": 991} {"train_loss": -37.97742462158203, "global_step": 119982, "epoch": 991} {"train_loss": -37.35559844970703, "global_step": 119983, "epoch": 991} {"train_loss": -37.90781784057617, "global_step": 119984, "epoch": 991} {"train_loss": -37.49077224731445, "global_step": 119985, "epoch": 991} {"train_loss": -37.592803955078125, "global_step": 119986, "epoch": 991} {"train_loss": -37.76639938354492, "global_step": 119987, "epoch": 991} {"train_loss": -37.574012756347656, "global_step": 119988, "epoch": 991} {"train_loss": -38.042335510253906, "global_step": 119989, "epoch": 991} {"train_loss": -38.435054779052734, "global_step": 119990, "epoch": 991} {"train_loss": -38.63753890991211, "global_step": 119991, "epoch": 991} {"train_loss": -38.37839126586914, "global_step": 119992, "epoch": 991} {"train_loss": -37.68882369995117, "global_step": 119993, "epoch": 991} {"train_loss": -38.0287971496582, "global_step": 119994, "epoch": 991} {"train_loss": -37.95359420776367, "global_step": 119995, "epoch": 991} {"train_loss": -38.1776237487793, "global_step": 119996, "epoch": 991} {"train_loss": -38.112239837646484, "global_step": 119997, "epoch": 991} {"train_loss": -38.135955810546875, "global_step": 119998, "epoch": 991} {"train_loss": -38.45965576171875, "global_step": 119999, "epoch": 991} {"train_loss": -38.50227355957031, "global_step": 120000, "epoch": 991} {"train_loss": -39.155006408691406, "global_step": 120001, "epoch": 991} {"train_loss": -38.5984992980957, "global_step": 120002, "epoch": 991} {"train_loss": -38.41459274291992, "global_step": 120003, "epoch": 991} {"train_loss": -37.60762023925781, "global_step": 120004, "epoch": 991} {"train_loss": -39.08759689331055, "global_step": 120005, "epoch": 991} {"train_loss": -38.680973052978516, "global_step": 120006, "epoch": 991} {"train_loss": -38.13201904296875, "global_step": 120007, "epoch": 991} {"train_loss": -38.54933547973633, "global_step": 120008, "epoch": 991} {"train_loss": -39.001338958740234, "global_step": 120009, "epoch": 991} {"train_loss": -38.04597854614258, "global_step": 120010, "epoch": 991} {"train_loss": -38.99635696411133, "global_step": 120011, "epoch": 991} {"train_loss": -39.003929138183594, "global_step": 120012, "epoch": 991} {"train_loss": -37.0269775390625, "global_step": 120013, "epoch": 991} {"train_loss": -38.40433883666992, "global_step": 120014, "epoch": 991} {"train_loss": -38.20537185668945, "global_step": 120015, "epoch": 991} {"train_loss": -38.841651916503906, "global_step": 120016, "epoch": 991} {"train_loss": -38.822261810302734, "global_step": 120017, "epoch": 991} {"train_loss": -39.11314010620117, "global_step": 120018, "epoch": 991} {"train_loss": -39.32609176635742, "global_step": 120019, "epoch": 991} {"train_loss": -38.86550521850586, "global_step": 120020, "epoch": 991} {"train_loss": -39.18621826171875, "global_step": 120021, "epoch": 991} {"train_loss": -39.548919677734375, "global_step": 120022, "epoch": 991} {"train_loss": -39.1264533996582, "global_step": 120023, "epoch": 991} {"train_loss": -39.462677001953125, "global_step": 120024, "epoch": 991} {"train_loss": -39.45543670654297, "global_step": 120025, "epoch": 991} {"train_loss": -38.816986083984375, "global_step": 120026, "epoch": 991} {"train_loss": -38.996726989746094, "global_step": 120027, "epoch": 991} {"train_loss": -39.43672561645508, "global_step": 120028, "epoch": 991} {"train_loss": -39.13680648803711, "global_step": 120029, "epoch": 991} {"train_loss": -39.3004150390625, "global_step": 120030, "epoch": 991} {"train_loss": -36.12962686522933, "global_step": 120031, "epoch": 991, "val_loss": 2687332.0} {"train_loss": -39.20327377319336, "global_step": 120032, "epoch": 992} {"train_loss": -38.778560638427734, "global_step": 120033, "epoch": 992} {"train_loss": -39.094512939453125, "global_step": 120034, "epoch": 992} {"train_loss": -39.03685760498047, "global_step": 120035, "epoch": 992} {"train_loss": -39.302425384521484, "global_step": 120036, "epoch": 992} {"train_loss": -39.429771423339844, "global_step": 120037, "epoch": 992} {"train_loss": -39.99293899536133, "global_step": 120038, "epoch": 992} {"train_loss": -39.03661346435547, "global_step": 120039, "epoch": 992} {"train_loss": -39.275997161865234, "global_step": 120040, "epoch": 992} {"train_loss": -39.154781341552734, "global_step": 120041, "epoch": 992} {"train_loss": -37.86698532104492, "global_step": 120042, "epoch": 992} {"train_loss": -37.8817024230957, "global_step": 120043, "epoch": 992} {"train_loss": -39.154109954833984, "global_step": 120044, "epoch": 992} {"train_loss": -37.86359405517578, "global_step": 120045, "epoch": 992} {"train_loss": -38.31278610229492, "global_step": 120046, "epoch": 992} {"train_loss": -36.112300872802734, "global_step": 120047, "epoch": 992} {"train_loss": -32.18939971923828, "global_step": 120048, "epoch": 992} {"train_loss": -31.004825592041016, "global_step": 120049, "epoch": 992} {"train_loss": -30.95354652404785, "global_step": 120050, "epoch": 992} {"train_loss": -29.311328887939453, "global_step": 120051, "epoch": 992} {"train_loss": -34.99277114868164, "global_step": 120052, "epoch": 992} {"train_loss": -37.20541000366211, "global_step": 120053, "epoch": 992} {"train_loss": -32.06659698486328, "global_step": 120054, "epoch": 992} {"train_loss": -36.79595947265625, "global_step": 120055, "epoch": 992} {"train_loss": -36.53315353393555, "global_step": 120056, "epoch": 992} {"train_loss": -37.948116302490234, "global_step": 120057, "epoch": 992} {"train_loss": -37.389827728271484, "global_step": 120058, "epoch": 992} {"train_loss": -37.801979064941406, "global_step": 120059, "epoch": 992} {"train_loss": -38.35323715209961, "global_step": 120060, "epoch": 992} {"train_loss": -37.9848518371582, "global_step": 120061, "epoch": 992} {"train_loss": -37.994789123535156, "global_step": 120062, "epoch": 992} {"train_loss": -37.7330436706543, "global_step": 120063, "epoch": 992} {"train_loss": -38.02046585083008, "global_step": 120064, "epoch": 992} {"train_loss": -37.93362808227539, "global_step": 120065, "epoch": 992} {"train_loss": -37.9395866394043, "global_step": 120066, "epoch": 992} {"train_loss": -38.947723388671875, "global_step": 120067, "epoch": 992} {"train_loss": -37.75452423095703, "global_step": 120068, "epoch": 992} {"train_loss": -37.89805221557617, "global_step": 120069, "epoch": 992} {"train_loss": -37.930355072021484, "global_step": 120070, "epoch": 992} {"train_loss": -38.68866729736328, "global_step": 120071, "epoch": 992} {"train_loss": -38.48149490356445, "global_step": 120072, "epoch": 992} {"train_loss": -39.16609573364258, "global_step": 120073, "epoch": 992} {"train_loss": -38.959999084472656, "global_step": 120074, "epoch": 992} {"train_loss": -38.939796447753906, "global_step": 120075, "epoch": 992} {"train_loss": -38.95827102661133, "global_step": 120076, "epoch": 992} {"train_loss": -39.53116989135742, "global_step": 120077, "epoch": 992} {"train_loss": -39.16422653198242, "global_step": 120078, "epoch": 992} {"train_loss": -39.575904846191406, "global_step": 120079, "epoch": 992} {"train_loss": -39.49545669555664, "global_step": 120080, "epoch": 992} {"train_loss": -39.64130783081055, "global_step": 120081, "epoch": 992} {"train_loss": -39.18439865112305, "global_step": 120082, "epoch": 992} {"train_loss": -39.5983772277832, "global_step": 120083, "epoch": 992} {"train_loss": -39.48354721069336, "global_step": 120084, "epoch": 992} {"train_loss": -39.690608978271484, "global_step": 120085, "epoch": 992} {"train_loss": -39.90055465698242, "global_step": 120086, "epoch": 992} {"train_loss": -39.33571243286133, "global_step": 120087, "epoch": 992} {"train_loss": -39.18842697143555, "global_step": 120088, "epoch": 992} {"train_loss": -39.41994857788086, "global_step": 120089, "epoch": 992} {"train_loss": -39.96894073486328, "global_step": 120090, "epoch": 992} {"train_loss": -38.9611930847168, "global_step": 120091, "epoch": 992} {"train_loss": -39.9261360168457, "global_step": 120092, "epoch": 992} {"train_loss": -39.4211311340332, "global_step": 120093, "epoch": 992} {"train_loss": -39.82284164428711, "global_step": 120094, "epoch": 992} {"train_loss": -39.43709945678711, "global_step": 120095, "epoch": 992} {"train_loss": -40.11233139038086, "global_step": 120096, "epoch": 992} {"train_loss": -39.61167907714844, "global_step": 120097, "epoch": 992} {"train_loss": -39.87269973754883, "global_step": 120098, "epoch": 992} {"train_loss": -39.62284469604492, "global_step": 120099, "epoch": 992} {"train_loss": -39.43818283081055, "global_step": 120100, "epoch": 992} {"train_loss": -39.952850341796875, "global_step": 120101, "epoch": 992} {"train_loss": -39.042179107666016, "global_step": 120102, "epoch": 992} {"train_loss": -39.22185516357422, "global_step": 120103, "epoch": 992} {"train_loss": -40.411556243896484, "global_step": 120104, "epoch": 992} {"train_loss": -39.512325286865234, "global_step": 120105, "epoch": 992} {"train_loss": -40.12850570678711, "global_step": 120106, "epoch": 992} {"train_loss": -39.76807403564453, "global_step": 120107, "epoch": 992} {"train_loss": -39.70634841918945, "global_step": 120108, "epoch": 992} {"train_loss": -39.8029899597168, "global_step": 120109, "epoch": 992} {"train_loss": -39.75872039794922, "global_step": 120110, "epoch": 992} {"train_loss": -36.12712860107422, "global_step": 120111, "epoch": 992} {"train_loss": -38.8990592956543, "global_step": 120112, "epoch": 992} {"train_loss": -39.60476303100586, "global_step": 120113, "epoch": 992} {"train_loss": -39.44907760620117, "global_step": 120114, "epoch": 992} {"train_loss": -39.74359893798828, "global_step": 120115, "epoch": 992} {"train_loss": -37.849876403808594, "global_step": 120116, "epoch": 992} {"train_loss": -39.7669677734375, "global_step": 120117, "epoch": 992} {"train_loss": -37.7326774597168, "global_step": 120118, "epoch": 992} {"train_loss": -39.30140686035156, "global_step": 120119, "epoch": 992} {"train_loss": -37.72701644897461, "global_step": 120120, "epoch": 992} {"train_loss": -39.75069046020508, "global_step": 120121, "epoch": 992} {"train_loss": -39.59885025024414, "global_step": 120122, "epoch": 992} {"train_loss": -36.86072540283203, "global_step": 120123, "epoch": 992} {"train_loss": -39.02217483520508, "global_step": 120124, "epoch": 992} {"train_loss": -39.326778411865234, "global_step": 120125, "epoch": 992} {"train_loss": -38.820411682128906, "global_step": 120126, "epoch": 992} {"train_loss": -38.85748291015625, "global_step": 120127, "epoch": 992} {"train_loss": -37.94672393798828, "global_step": 120128, "epoch": 992} {"train_loss": -38.63015365600586, "global_step": 120129, "epoch": 992} {"train_loss": -38.877925872802734, "global_step": 120130, "epoch": 992} {"train_loss": -37.59534454345703, "global_step": 120131, "epoch": 992} {"train_loss": -37.53739547729492, "global_step": 120132, "epoch": 992} {"train_loss": -39.383888244628906, "global_step": 120133, "epoch": 992} {"train_loss": -38.27105712890625, "global_step": 120134, "epoch": 992} {"train_loss": -37.147953033447266, "global_step": 120135, "epoch": 992} {"train_loss": -35.270992279052734, "global_step": 120136, "epoch": 992} {"train_loss": -39.35573196411133, "global_step": 120137, "epoch": 992} {"train_loss": -37.51806640625, "global_step": 120138, "epoch": 992} {"train_loss": -38.183284759521484, "global_step": 120139, "epoch": 992} {"train_loss": -35.246646881103516, "global_step": 120140, "epoch": 992} {"train_loss": -36.5191764831543, "global_step": 120141, "epoch": 992} {"train_loss": -36.370361328125, "global_step": 120142, "epoch": 992} {"train_loss": -35.46609878540039, "global_step": 120143, "epoch": 992} {"train_loss": -35.85248565673828, "global_step": 120144, "epoch": 992} {"train_loss": -37.448787689208984, "global_step": 120145, "epoch": 992} {"train_loss": -36.04092025756836, "global_step": 120146, "epoch": 992} {"train_loss": -33.97819137573242, "global_step": 120147, "epoch": 992} {"train_loss": -31.015304565429688, "global_step": 120148, "epoch": 992} {"train_loss": -33.39876937866211, "global_step": 120149, "epoch": 992} {"train_loss": -35.634063720703125, "global_step": 120150, "epoch": 992} {"train_loss": -32.54286193847656, "global_step": 120151, "epoch": 992} {"train_loss": -38.035162287310136, "global_step": 120152, "epoch": 992, "val_loss": 2773446.75} {"train_loss": -36.92877960205078, "global_step": 120153, "epoch": 993} {"train_loss": -36.0410041809082, "global_step": 120154, "epoch": 993} {"train_loss": -34.934600830078125, "global_step": 120155, "epoch": 993} {"train_loss": -34.8531379699707, "global_step": 120156, "epoch": 993} {"train_loss": -36.9781379699707, "global_step": 120157, "epoch": 993} {"train_loss": -37.32591247558594, "global_step": 120158, "epoch": 993} {"train_loss": -36.480224609375, "global_step": 120159, "epoch": 993} {"train_loss": -37.04574966430664, "global_step": 120160, "epoch": 993} {"train_loss": -36.70916748046875, "global_step": 120161, "epoch": 993} {"train_loss": -34.95211410522461, "global_step": 120162, "epoch": 993} {"train_loss": -36.1860237121582, "global_step": 120163, "epoch": 993} {"train_loss": -37.072052001953125, "global_step": 120164, "epoch": 993} {"train_loss": -35.36704635620117, "global_step": 120165, "epoch": 993} {"train_loss": -36.61246871948242, "global_step": 120166, "epoch": 993} {"train_loss": -34.78619384765625, "global_step": 120167, "epoch": 993} {"train_loss": -35.547203063964844, "global_step": 120168, "epoch": 993} {"train_loss": -36.645626068115234, "global_step": 120169, "epoch": 993} {"train_loss": -37.06510543823242, "global_step": 120170, "epoch": 993} {"train_loss": -36.83089828491211, "global_step": 120171, "epoch": 993} {"train_loss": -35.63198471069336, "global_step": 120172, "epoch": 993} {"train_loss": -36.551536560058594, "global_step": 120173, "epoch": 993} {"train_loss": -37.62279510498047, "global_step": 120174, "epoch": 993} {"train_loss": -37.364864349365234, "global_step": 120175, "epoch": 993} {"train_loss": -37.68971633911133, "global_step": 120176, "epoch": 993} {"train_loss": -36.89996337890625, "global_step": 120177, "epoch": 993} {"train_loss": -37.31351852416992, "global_step": 120178, "epoch": 993} {"train_loss": -37.16914749145508, "global_step": 120179, "epoch": 993} {"train_loss": -36.44148254394531, "global_step": 120180, "epoch": 993} {"train_loss": -36.75675582885742, "global_step": 120181, "epoch": 993} {"train_loss": -36.94584655761719, "global_step": 120182, "epoch": 993} {"train_loss": -37.736412048339844, "global_step": 120183, "epoch": 993} {"train_loss": -38.52415084838867, "global_step": 120184, "epoch": 993} {"train_loss": -38.09698486328125, "global_step": 120185, "epoch": 993} {"train_loss": -37.90876388549805, "global_step": 120186, "epoch": 993} {"train_loss": -37.44266128540039, "global_step": 120187, "epoch": 993} {"train_loss": -37.208248138427734, "global_step": 120188, "epoch": 993} {"train_loss": -38.24507522583008, "global_step": 120189, "epoch": 993} {"train_loss": -38.017696380615234, "global_step": 120190, "epoch": 993} {"train_loss": -38.19940185546875, "global_step": 120191, "epoch": 993} {"train_loss": -38.397037506103516, "global_step": 120192, "epoch": 993} {"train_loss": -37.91705322265625, "global_step": 120193, "epoch": 993} {"train_loss": -38.192012786865234, "global_step": 120194, "epoch": 993} {"train_loss": -38.868160247802734, "global_step": 120195, "epoch": 993} {"train_loss": -38.29921340942383, "global_step": 120196, "epoch": 993} {"train_loss": -37.102718353271484, "global_step": 120197, "epoch": 993} {"train_loss": -37.932308197021484, "global_step": 120198, "epoch": 993} {"train_loss": -38.565982818603516, "global_step": 120199, "epoch": 993} {"train_loss": -38.557044982910156, "global_step": 120200, "epoch": 993} {"train_loss": -38.24468231201172, "global_step": 120201, "epoch": 993} {"train_loss": -38.53178787231445, "global_step": 120202, "epoch": 993} {"train_loss": -38.90635299682617, "global_step": 120203, "epoch": 993} {"train_loss": -38.64228439331055, "global_step": 120204, "epoch": 993} {"train_loss": -38.376583099365234, "global_step": 120205, "epoch": 993} {"train_loss": -38.706512451171875, "global_step": 120206, "epoch": 993} {"train_loss": -38.63751983642578, "global_step": 120207, "epoch": 993} {"train_loss": -39.006710052490234, "global_step": 120208, "epoch": 993} {"train_loss": -38.983516693115234, "global_step": 120209, "epoch": 993} {"train_loss": -39.23991775512695, "global_step": 120210, "epoch": 993} {"train_loss": -39.3729133605957, "global_step": 120211, "epoch": 993} {"train_loss": -39.12697982788086, "global_step": 120212, "epoch": 993} {"train_loss": -39.19625473022461, "global_step": 120213, "epoch": 993} {"train_loss": -39.245513916015625, "global_step": 120214, "epoch": 993} {"train_loss": -38.897674560546875, "global_step": 120215, "epoch": 993} {"train_loss": -39.398441314697266, "global_step": 120216, "epoch": 993} {"train_loss": -39.3300666809082, "global_step": 120217, "epoch": 993} {"train_loss": -39.067378997802734, "global_step": 120218, "epoch": 993} {"train_loss": -39.293819427490234, "global_step": 120219, "epoch": 993} {"train_loss": -39.508811950683594, "global_step": 120220, "epoch": 993} {"train_loss": -39.34688949584961, "global_step": 120221, "epoch": 993} {"train_loss": -39.432533264160156, "global_step": 120222, "epoch": 993} {"train_loss": -39.31108856201172, "global_step": 120223, "epoch": 993} {"train_loss": -39.444637298583984, "global_step": 120224, "epoch": 993} {"train_loss": -39.39577865600586, "global_step": 120225, "epoch": 993} {"train_loss": -39.52846908569336, "global_step": 120226, "epoch": 993} {"train_loss": -39.51216125488281, "global_step": 120227, "epoch": 993} {"train_loss": -38.90712356567383, "global_step": 120228, "epoch": 993} {"train_loss": -39.22286605834961, "global_step": 120229, "epoch": 993} {"train_loss": -39.38127517700195, "global_step": 120230, "epoch": 993} {"train_loss": -39.82590103149414, "global_step": 120231, "epoch": 993} {"train_loss": -39.49089050292969, "global_step": 120232, "epoch": 993} {"train_loss": -38.3072624206543, "global_step": 120233, "epoch": 993} {"train_loss": -38.944732666015625, "global_step": 120234, "epoch": 993} {"train_loss": -38.92009353637695, "global_step": 120235, "epoch": 993} {"train_loss": -39.026458740234375, "global_step": 120236, "epoch": 993} {"train_loss": -39.75642776489258, "global_step": 120237, "epoch": 993} {"train_loss": -39.895809173583984, "global_step": 120238, "epoch": 993} {"train_loss": -39.5764045715332, "global_step": 120239, "epoch": 993} {"train_loss": -39.3779411315918, "global_step": 120240, "epoch": 993} {"train_loss": -39.22280502319336, "global_step": 120241, "epoch": 993} {"train_loss": -39.93102264404297, "global_step": 120242, "epoch": 993} {"train_loss": -39.44226837158203, "global_step": 120243, "epoch": 993} {"train_loss": -40.037628173828125, "global_step": 120244, "epoch": 993} {"train_loss": -39.74677276611328, "global_step": 120245, "epoch": 993} {"train_loss": -39.896915435791016, "global_step": 120246, "epoch": 993} {"train_loss": -39.409847259521484, "global_step": 120247, "epoch": 993} {"train_loss": -40.08366394042969, "global_step": 120248, "epoch": 993} {"train_loss": -40.16191864013672, "global_step": 120249, "epoch": 993} {"train_loss": -39.97610092163086, "global_step": 120250, "epoch": 993} {"train_loss": -40.013885498046875, "global_step": 120251, "epoch": 993} {"train_loss": -39.74360275268555, "global_step": 120252, "epoch": 993} {"train_loss": -39.71367263793945, "global_step": 120253, "epoch": 993} {"train_loss": -40.12321090698242, "global_step": 120254, "epoch": 993} {"train_loss": -39.18790817260742, "global_step": 120255, "epoch": 993} {"train_loss": -38.91741943359375, "global_step": 120256, "epoch": 993} {"train_loss": -40.3062629699707, "global_step": 120257, "epoch": 993} {"train_loss": -39.23798370361328, "global_step": 120258, "epoch": 993} {"train_loss": -40.032806396484375, "global_step": 120259, "epoch": 993} {"train_loss": -39.899593353271484, "global_step": 120260, "epoch": 993} {"train_loss": -39.43006134033203, "global_step": 120261, "epoch": 993} {"train_loss": -39.588802337646484, "global_step": 120262, "epoch": 993} {"train_loss": -39.64537811279297, "global_step": 120263, "epoch": 993} {"train_loss": -40.15837478637695, "global_step": 120264, "epoch": 993} {"train_loss": -39.87889099121094, "global_step": 120265, "epoch": 993} {"train_loss": -40.10285568237305, "global_step": 120266, "epoch": 993} {"train_loss": -40.355445861816406, "global_step": 120267, "epoch": 993} {"train_loss": -40.62992477416992, "global_step": 120268, "epoch": 993} {"train_loss": -40.48297882080078, "global_step": 120269, "epoch": 993} {"train_loss": -40.02692794799805, "global_step": 120270, "epoch": 993} {"train_loss": -40.181907653808594, "global_step": 120271, "epoch": 993} {"train_loss": -39.41289138793945, "global_step": 120272, "epoch": 993} {"train_loss": -38.50734575129738, "global_step": 120273, "epoch": 993, "val_loss": 2725360.5} {"train_loss": -34.74650192260742, "global_step": 120274, "epoch": 994} {"train_loss": -34.65228271484375, "global_step": 120275, "epoch": 994} {"train_loss": -34.89729309082031, "global_step": 120276, "epoch": 994} {"train_loss": -35.03300857543945, "global_step": 120277, "epoch": 994} {"train_loss": -37.05134201049805, "global_step": 120278, "epoch": 994} {"train_loss": -38.704498291015625, "global_step": 120279, "epoch": 994} {"train_loss": -36.68076705932617, "global_step": 120280, "epoch": 994} {"train_loss": -36.16898727416992, "global_step": 120281, "epoch": 994} {"train_loss": -37.7150764465332, "global_step": 120282, "epoch": 994} {"train_loss": -39.49020004272461, "global_step": 120283, "epoch": 994} {"train_loss": -37.101051330566406, "global_step": 120284, "epoch": 994} {"train_loss": -37.093936920166016, "global_step": 120285, "epoch": 994} {"train_loss": -37.7534294128418, "global_step": 120286, "epoch": 994} {"train_loss": -39.00785446166992, "global_step": 120287, "epoch": 994} {"train_loss": -38.81145095825195, "global_step": 120288, "epoch": 994} {"train_loss": -38.386566162109375, "global_step": 120289, "epoch": 994} {"train_loss": -38.43404769897461, "global_step": 120290, "epoch": 994} {"train_loss": -39.24227523803711, "global_step": 120291, "epoch": 994} {"train_loss": -38.02478790283203, "global_step": 120292, "epoch": 994} {"train_loss": -39.5136604309082, "global_step": 120293, "epoch": 994} {"train_loss": -38.24673080444336, "global_step": 120294, "epoch": 994} {"train_loss": -38.75751495361328, "global_step": 120295, "epoch": 994} {"train_loss": -36.88644027709961, "global_step": 120296, "epoch": 994} {"train_loss": -38.556236267089844, "global_step": 120297, "epoch": 994} {"train_loss": -36.91373062133789, "global_step": 120298, "epoch": 994} {"train_loss": -38.94004440307617, "global_step": 120299, "epoch": 994} {"train_loss": -38.13946533203125, "global_step": 120300, "epoch": 994} {"train_loss": -38.3874626159668, "global_step": 120301, "epoch": 994} {"train_loss": -39.19768142700195, "global_step": 120302, "epoch": 994} {"train_loss": -38.427974700927734, "global_step": 120303, "epoch": 994} {"train_loss": -37.78895950317383, "global_step": 120304, "epoch": 994} {"train_loss": -38.57363510131836, "global_step": 120305, "epoch": 994} {"train_loss": -39.449188232421875, "global_step": 120306, "epoch": 994} {"train_loss": -38.82001876831055, "global_step": 120307, "epoch": 994} {"train_loss": -39.3726921081543, "global_step": 120308, "epoch": 994} {"train_loss": -39.07111740112305, "global_step": 120309, "epoch": 994} {"train_loss": -39.063934326171875, "global_step": 120310, "epoch": 994} {"train_loss": -38.86149978637695, "global_step": 120311, "epoch": 994} {"train_loss": -39.09824752807617, "global_step": 120312, "epoch": 994} {"train_loss": -38.86811447143555, "global_step": 120313, "epoch": 994} {"train_loss": -37.810691833496094, "global_step": 120314, "epoch": 994} {"train_loss": -38.8223991394043, "global_step": 120315, "epoch": 994} {"train_loss": -39.13456726074219, "global_step": 120316, "epoch": 994} {"train_loss": -38.45359802246094, "global_step": 120317, "epoch": 994} {"train_loss": -39.7666015625, "global_step": 120318, "epoch": 994} {"train_loss": -39.58442306518555, "global_step": 120319, "epoch": 994} {"train_loss": -39.75774002075195, "global_step": 120320, "epoch": 994} {"train_loss": -38.77124786376953, "global_step": 120321, "epoch": 994} {"train_loss": -39.45469665527344, "global_step": 120322, "epoch": 994} {"train_loss": -35.84294891357422, "global_step": 120323, "epoch": 994} {"train_loss": -40.01128005981445, "global_step": 120324, "epoch": 994} {"train_loss": -39.18058395385742, "global_step": 120325, "epoch": 994} {"train_loss": -37.95071029663086, "global_step": 120326, "epoch": 994} {"train_loss": -39.04890060424805, "global_step": 120327, "epoch": 994} {"train_loss": -37.35895538330078, "global_step": 120328, "epoch": 994} {"train_loss": -38.67466354370117, "global_step": 120329, "epoch": 994} {"train_loss": -39.738128662109375, "global_step": 120330, "epoch": 994} {"train_loss": -39.66731643676758, "global_step": 120331, "epoch": 994} {"train_loss": -38.16831588745117, "global_step": 120332, "epoch": 994} {"train_loss": -39.71021270751953, "global_step": 120333, "epoch": 994} {"train_loss": -39.27197265625, "global_step": 120334, "epoch": 994} {"train_loss": -39.01194763183594, "global_step": 120335, "epoch": 994} {"train_loss": -39.49691390991211, "global_step": 120336, "epoch": 994} {"train_loss": -39.42428970336914, "global_step": 120337, "epoch": 994} {"train_loss": -39.28281784057617, "global_step": 120338, "epoch": 994} {"train_loss": -38.883052825927734, "global_step": 120339, "epoch": 994} {"train_loss": -39.75458526611328, "global_step": 120340, "epoch": 994} {"train_loss": -38.231422424316406, "global_step": 120341, "epoch": 994} {"train_loss": -38.494747161865234, "global_step": 120342, "epoch": 994} {"train_loss": -39.227867126464844, "global_step": 120343, "epoch": 994} {"train_loss": -39.757476806640625, "global_step": 120344, "epoch": 994} {"train_loss": -39.62590408325195, "global_step": 120345, "epoch": 994} {"train_loss": -39.85224533081055, "global_step": 120346, "epoch": 994} {"train_loss": -39.21348190307617, "global_step": 120347, "epoch": 994} {"train_loss": -39.704097747802734, "global_step": 120348, "epoch": 994} {"train_loss": -40.186012268066406, "global_step": 120349, "epoch": 994} {"train_loss": -39.826866149902344, "global_step": 120350, "epoch": 994} {"train_loss": -39.61581039428711, "global_step": 120351, "epoch": 994} {"train_loss": -39.463233947753906, "global_step": 120352, "epoch": 994} {"train_loss": -40.063934326171875, "global_step": 120353, "epoch": 994} {"train_loss": -39.417903900146484, "global_step": 120354, "epoch": 994} {"train_loss": -38.509254455566406, "global_step": 120355, "epoch": 994} {"train_loss": -37.58784866333008, "global_step": 120356, "epoch": 994} {"train_loss": -38.745567321777344, "global_step": 120357, "epoch": 994} {"train_loss": -37.18225860595703, "global_step": 120358, "epoch": 994} {"train_loss": -36.34455490112305, "global_step": 120359, "epoch": 994} {"train_loss": -37.309200286865234, "global_step": 120360, "epoch": 994} {"train_loss": -38.791786193847656, "global_step": 120361, "epoch": 994} {"train_loss": -39.34609603881836, "global_step": 120362, "epoch": 994} {"train_loss": -39.31181716918945, "global_step": 120363, "epoch": 994} {"train_loss": -37.89199447631836, "global_step": 120364, "epoch": 994} {"train_loss": -39.011959075927734, "global_step": 120365, "epoch": 994} {"train_loss": -39.23063278198242, "global_step": 120366, "epoch": 994} {"train_loss": -39.5316276550293, "global_step": 120367, "epoch": 994} {"train_loss": -39.696895599365234, "global_step": 120368, "epoch": 994} {"train_loss": -39.35760498046875, "global_step": 120369, "epoch": 994} {"train_loss": -39.86915969848633, "global_step": 120370, "epoch": 994} {"train_loss": -39.7315788269043, "global_step": 120371, "epoch": 994} {"train_loss": -39.26600646972656, "global_step": 120372, "epoch": 994} {"train_loss": -38.49933624267578, "global_step": 120373, "epoch": 994} {"train_loss": -39.75664138793945, "global_step": 120374, "epoch": 994} {"train_loss": -39.62335205078125, "global_step": 120375, "epoch": 994} {"train_loss": -39.68060302734375, "global_step": 120376, "epoch": 994} {"train_loss": -38.3829345703125, "global_step": 120377, "epoch": 994} {"train_loss": -39.44491195678711, "global_step": 120378, "epoch": 994} {"train_loss": -37.66469955444336, "global_step": 120379, "epoch": 994} {"train_loss": -36.927528381347656, "global_step": 120380, "epoch": 994} {"train_loss": -38.980587005615234, "global_step": 120381, "epoch": 994} {"train_loss": -38.843345642089844, "global_step": 120382, "epoch": 994} {"train_loss": -38.70956039428711, "global_step": 120383, "epoch": 994} {"train_loss": -38.97544479370117, "global_step": 120384, "epoch": 994} {"train_loss": -38.68243408203125, "global_step": 120385, "epoch": 994} {"train_loss": -38.524017333984375, "global_step": 120386, "epoch": 994} {"train_loss": -39.177337646484375, "global_step": 120387, "epoch": 994} {"train_loss": -38.74148178100586, "global_step": 120388, "epoch": 994} {"train_loss": -37.80799102783203, "global_step": 120389, "epoch": 994} {"train_loss": -38.619808197021484, "global_step": 120390, "epoch": 994} {"train_loss": -39.114662170410156, "global_step": 120391, "epoch": 994} {"train_loss": -37.665035247802734, "global_step": 120392, "epoch": 994} {"train_loss": -37.802215576171875, "global_step": 120393, "epoch": 994} {"train_loss": -38.60609637804268, "global_step": 120394, "epoch": 994, "val_loss": 2710475.25} {"train_loss": -39.18169021606445, "global_step": 120395, "epoch": 995} {"train_loss": -38.643951416015625, "global_step": 120396, "epoch": 995} {"train_loss": -37.994850158691406, "global_step": 120397, "epoch": 995} {"train_loss": -39.42799377441406, "global_step": 120398, "epoch": 995} {"train_loss": -37.91046905517578, "global_step": 120399, "epoch": 995} {"train_loss": -37.54738998413086, "global_step": 120400, "epoch": 995} {"train_loss": -37.702003479003906, "global_step": 120401, "epoch": 995} {"train_loss": -39.60593032836914, "global_step": 120402, "epoch": 995} {"train_loss": -38.44730758666992, "global_step": 120403, "epoch": 995} {"train_loss": -38.41073989868164, "global_step": 120404, "epoch": 995} {"train_loss": -39.32236862182617, "global_step": 120405, "epoch": 995} {"train_loss": -37.402374267578125, "global_step": 120406, "epoch": 995} {"train_loss": -39.470794677734375, "global_step": 120407, "epoch": 995} {"train_loss": -39.16842269897461, "global_step": 120408, "epoch": 995} {"train_loss": -37.842689514160156, "global_step": 120409, "epoch": 995} {"train_loss": -37.71009826660156, "global_step": 120410, "epoch": 995} {"train_loss": -38.382972717285156, "global_step": 120411, "epoch": 995} {"train_loss": -39.09199142456055, "global_step": 120412, "epoch": 995} {"train_loss": -38.42129135131836, "global_step": 120413, "epoch": 995} {"train_loss": -38.10661697387695, "global_step": 120414, "epoch": 995} {"train_loss": -39.44050979614258, "global_step": 120415, "epoch": 995} {"train_loss": -39.2474479675293, "global_step": 120416, "epoch": 995} {"train_loss": -38.6309814453125, "global_step": 120417, "epoch": 995} {"train_loss": -37.33700180053711, "global_step": 120418, "epoch": 995} {"train_loss": -38.295623779296875, "global_step": 120419, "epoch": 995} {"train_loss": -38.691043853759766, "global_step": 120420, "epoch": 995} {"train_loss": -39.73535919189453, "global_step": 120421, "epoch": 995} {"train_loss": -39.10888671875, "global_step": 120422, "epoch": 995} {"train_loss": -38.788734436035156, "global_step": 120423, "epoch": 995} {"train_loss": -39.676483154296875, "global_step": 120424, "epoch": 995} {"train_loss": -38.723731994628906, "global_step": 120425, "epoch": 995} {"train_loss": -39.4138298034668, "global_step": 120426, "epoch": 995} {"train_loss": -38.59403610229492, "global_step": 120427, "epoch": 995} {"train_loss": -38.13760757446289, "global_step": 120428, "epoch": 995} {"train_loss": -38.97589874267578, "global_step": 120429, "epoch": 995} {"train_loss": -38.90108871459961, "global_step": 120430, "epoch": 995} {"train_loss": -39.70703125, "global_step": 120431, "epoch": 995} {"train_loss": -38.8448600769043, "global_step": 120432, "epoch": 995} {"train_loss": -38.50930404663086, "global_step": 120433, "epoch": 995} {"train_loss": -39.27061462402344, "global_step": 120434, "epoch": 995} {"train_loss": -39.14698028564453, "global_step": 120435, "epoch": 995} {"train_loss": -38.45925521850586, "global_step": 120436, "epoch": 995} {"train_loss": -38.975257873535156, "global_step": 120437, "epoch": 995} {"train_loss": -38.511600494384766, "global_step": 120438, "epoch": 995} {"train_loss": -39.20966720581055, "global_step": 120439, "epoch": 995} {"train_loss": -39.07747268676758, "global_step": 120440, "epoch": 995} {"train_loss": -38.14425277709961, "global_step": 120441, "epoch": 995} {"train_loss": -37.74312210083008, "global_step": 120442, "epoch": 995} {"train_loss": -39.5240592956543, "global_step": 120443, "epoch": 995} {"train_loss": -37.01822280883789, "global_step": 120444, "epoch": 995} {"train_loss": -39.3708610534668, "global_step": 120445, "epoch": 995} {"train_loss": -37.45563888549805, "global_step": 120446, "epoch": 995} {"train_loss": -37.883785247802734, "global_step": 120447, "epoch": 995} {"train_loss": -35.90190505981445, "global_step": 120448, "epoch": 995} {"train_loss": -36.910804748535156, "global_step": 120449, "epoch": 995} {"train_loss": -35.90126419067383, "global_step": 120450, "epoch": 995} {"train_loss": -37.63202667236328, "global_step": 120451, "epoch": 995} {"train_loss": -38.706146240234375, "global_step": 120452, "epoch": 995} {"train_loss": -36.568355560302734, "global_step": 120453, "epoch": 995} {"train_loss": -37.68548583984375, "global_step": 120454, "epoch": 995} {"train_loss": -36.453487396240234, "global_step": 120455, "epoch": 995} {"train_loss": -35.386775970458984, "global_step": 120456, "epoch": 995} {"train_loss": -38.208282470703125, "global_step": 120457, "epoch": 995} {"train_loss": -37.30958557128906, "global_step": 120458, "epoch": 995} {"train_loss": -38.33063888549805, "global_step": 120459, "epoch": 995} {"train_loss": -37.7145881652832, "global_step": 120460, "epoch": 995} {"train_loss": -34.514183044433594, "global_step": 120461, "epoch": 995} {"train_loss": -36.43440628051758, "global_step": 120462, "epoch": 995} {"train_loss": -37.57494354248047, "global_step": 120463, "epoch": 995} {"train_loss": -37.78157424926758, "global_step": 120464, "epoch": 995} {"train_loss": -37.319679260253906, "global_step": 120465, "epoch": 995} {"train_loss": -38.574920654296875, "global_step": 120466, "epoch": 995} {"train_loss": -37.57550048828125, "global_step": 120467, "epoch": 995} {"train_loss": -36.95797348022461, "global_step": 120468, "epoch": 995} {"train_loss": -38.338478088378906, "global_step": 120469, "epoch": 995} {"train_loss": -32.08099365234375, "global_step": 120470, "epoch": 995} {"train_loss": -37.217872619628906, "global_step": 120471, "epoch": 995} {"train_loss": -37.79822540283203, "global_step": 120472, "epoch": 995} {"train_loss": -37.03017807006836, "global_step": 120473, "epoch": 995} {"train_loss": -37.60698318481445, "global_step": 120474, "epoch": 995} {"train_loss": -38.30949783325195, "global_step": 120475, "epoch": 995} {"train_loss": -38.424232482910156, "global_step": 120476, "epoch": 995} {"train_loss": -38.26567840576172, "global_step": 120477, "epoch": 995} {"train_loss": -36.16585159301758, "global_step": 120478, "epoch": 995} {"train_loss": -38.36263656616211, "global_step": 120479, "epoch": 995} {"train_loss": -38.508033752441406, "global_step": 120480, "epoch": 995} {"train_loss": -38.78459548950195, "global_step": 120481, "epoch": 995} {"train_loss": -37.4092903137207, "global_step": 120482, "epoch": 995} {"train_loss": -38.72394943237305, "global_step": 120483, "epoch": 995} {"train_loss": -38.01508331298828, "global_step": 120484, "epoch": 995} {"train_loss": -36.971553802490234, "global_step": 120485, "epoch": 995} {"train_loss": -38.20339584350586, "global_step": 120486, "epoch": 995} {"train_loss": -36.79124450683594, "global_step": 120487, "epoch": 995} {"train_loss": -37.596710205078125, "global_step": 120488, "epoch": 995} {"train_loss": -38.4931755065918, "global_step": 120489, "epoch": 995} {"train_loss": -37.375244140625, "global_step": 120490, "epoch": 995} {"train_loss": -38.402313232421875, "global_step": 120491, "epoch": 995} {"train_loss": -38.625946044921875, "global_step": 120492, "epoch": 995} {"train_loss": -38.43128204345703, "global_step": 120493, "epoch": 995} {"train_loss": -36.459896087646484, "global_step": 120494, "epoch": 995} {"train_loss": -37.003211975097656, "global_step": 120495, "epoch": 995} {"train_loss": -37.91102981567383, "global_step": 120496, "epoch": 995} {"train_loss": -37.36045455932617, "global_step": 120497, "epoch": 995} {"train_loss": -37.706268310546875, "global_step": 120498, "epoch": 995} {"train_loss": -36.40639114379883, "global_step": 120499, "epoch": 995} {"train_loss": -37.3311882019043, "global_step": 120500, "epoch": 995} {"train_loss": -36.36962890625, "global_step": 120501, "epoch": 995} {"train_loss": -36.02479934692383, "global_step": 120502, "epoch": 995} {"train_loss": -36.09473419189453, "global_step": 120503, "epoch": 995} {"train_loss": -37.667686462402344, "global_step": 120504, "epoch": 995} {"train_loss": -36.023311614990234, "global_step": 120505, "epoch": 995} {"train_loss": -36.48296356201172, "global_step": 120506, "epoch": 995} {"train_loss": -37.093788146972656, "global_step": 120507, "epoch": 995} {"train_loss": -37.69242858886719, "global_step": 120508, "epoch": 995} {"train_loss": -37.14699172973633, "global_step": 120509, "epoch": 995} {"train_loss": -38.14276123046875, "global_step": 120510, "epoch": 995} {"train_loss": -36.54982376098633, "global_step": 120511, "epoch": 995} {"train_loss": -35.59454345703125, "global_step": 120512, "epoch": 995} {"train_loss": -38.44430160522461, "global_step": 120513, "epoch": 995} {"train_loss": -34.41105651855469, "global_step": 120514, "epoch": 995} {"train_loss": -37.87084875816156, "global_step": 120515, "epoch": 995, "val_loss": 2695448.25} {"train_loss": -37.12630844116211, "global_step": 120516, "epoch": 996} {"train_loss": -37.721614837646484, "global_step": 120517, "epoch": 996} {"train_loss": -37.76127624511719, "global_step": 120518, "epoch": 996} {"train_loss": -37.728206634521484, "global_step": 120519, "epoch": 996} {"train_loss": -38.44588088989258, "global_step": 120520, "epoch": 996} {"train_loss": -38.33993148803711, "global_step": 120521, "epoch": 996} {"train_loss": -36.29221725463867, "global_step": 120522, "epoch": 996} {"train_loss": -37.89439010620117, "global_step": 120523, "epoch": 996} {"train_loss": -38.516021728515625, "global_step": 120524, "epoch": 996} {"train_loss": -38.503353118896484, "global_step": 120525, "epoch": 996} {"train_loss": -36.7346076965332, "global_step": 120526, "epoch": 996} {"train_loss": -38.67490005493164, "global_step": 120527, "epoch": 996} {"train_loss": -38.606876373291016, "global_step": 120528, "epoch": 996} {"train_loss": -38.17902755737305, "global_step": 120529, "epoch": 996} {"train_loss": -38.564205169677734, "global_step": 120530, "epoch": 996} {"train_loss": -38.09325408935547, "global_step": 120531, "epoch": 996} {"train_loss": -36.42684555053711, "global_step": 120532, "epoch": 996} {"train_loss": -38.37847900390625, "global_step": 120533, "epoch": 996} {"train_loss": -38.52888107299805, "global_step": 120534, "epoch": 996} {"train_loss": -38.598026275634766, "global_step": 120535, "epoch": 996} {"train_loss": -38.815101623535156, "global_step": 120536, "epoch": 996} {"train_loss": -38.6805419921875, "global_step": 120537, "epoch": 996} {"train_loss": -38.499637603759766, "global_step": 120538, "epoch": 996} {"train_loss": -38.620887756347656, "global_step": 120539, "epoch": 996} {"train_loss": -39.23824691772461, "global_step": 120540, "epoch": 996} {"train_loss": -39.613075256347656, "global_step": 120541, "epoch": 996} {"train_loss": -37.91311264038086, "global_step": 120542, "epoch": 996} {"train_loss": -39.062740325927734, "global_step": 120543, "epoch": 996} {"train_loss": -39.41098403930664, "global_step": 120544, "epoch": 996} {"train_loss": -37.80886459350586, "global_step": 120545, "epoch": 996} {"train_loss": -38.6555290222168, "global_step": 120546, "epoch": 996} {"train_loss": -38.9992561340332, "global_step": 120547, "epoch": 996} {"train_loss": -39.14866256713867, "global_step": 120548, "epoch": 996} {"train_loss": -39.31753158569336, "global_step": 120549, "epoch": 996} {"train_loss": -39.38649368286133, "global_step": 120550, "epoch": 996} {"train_loss": -39.38930892944336, "global_step": 120551, "epoch": 996} {"train_loss": -39.5544548034668, "global_step": 120552, "epoch": 996} {"train_loss": -39.887184143066406, "global_step": 120553, "epoch": 996} {"train_loss": -39.3358154296875, "global_step": 120554, "epoch": 996} {"train_loss": -38.5180778503418, "global_step": 120555, "epoch": 996} {"train_loss": -39.72921371459961, "global_step": 120556, "epoch": 996} {"train_loss": -39.30719757080078, "global_step": 120557, "epoch": 996} {"train_loss": -39.549129486083984, "global_step": 120558, "epoch": 996} {"train_loss": -39.86531448364258, "global_step": 120559, "epoch": 996} {"train_loss": -40.16535949707031, "global_step": 120560, "epoch": 996} {"train_loss": -39.94344711303711, "global_step": 120561, "epoch": 996} {"train_loss": -39.26012420654297, "global_step": 120562, "epoch": 996} {"train_loss": -39.92966842651367, "global_step": 120563, "epoch": 996} {"train_loss": -39.37615966796875, "global_step": 120564, "epoch": 996} {"train_loss": -39.807918548583984, "global_step": 120565, "epoch": 996} {"train_loss": -39.388160705566406, "global_step": 120566, "epoch": 996} {"train_loss": -39.85549545288086, "global_step": 120567, "epoch": 996} {"train_loss": -40.159297943115234, "global_step": 120568, "epoch": 996} {"train_loss": -39.667816162109375, "global_step": 120569, "epoch": 996} {"train_loss": -38.57505798339844, "global_step": 120570, "epoch": 996} {"train_loss": -39.86710739135742, "global_step": 120571, "epoch": 996} {"train_loss": -40.03919219970703, "global_step": 120572, "epoch": 996} {"train_loss": -39.976070404052734, "global_step": 120573, "epoch": 996} {"train_loss": -39.766357421875, "global_step": 120574, "epoch": 996} {"train_loss": -40.034481048583984, "global_step": 120575, "epoch": 996} {"train_loss": -40.42519760131836, "global_step": 120576, "epoch": 996} {"train_loss": -40.08271408081055, "global_step": 120577, "epoch": 996} {"train_loss": -40.27970886230469, "global_step": 120578, "epoch": 996} {"train_loss": -39.812294006347656, "global_step": 120579, "epoch": 996} {"train_loss": -40.03656768798828, "global_step": 120580, "epoch": 996} {"train_loss": -40.51510238647461, "global_step": 120581, "epoch": 996} {"train_loss": -39.82630157470703, "global_step": 120582, "epoch": 996} {"train_loss": -39.80508041381836, "global_step": 120583, "epoch": 996} {"train_loss": -39.89087677001953, "global_step": 120584, "epoch": 996} {"train_loss": -40.06819534301758, "global_step": 120585, "epoch": 996} {"train_loss": -40.20078659057617, "global_step": 120586, "epoch": 996} {"train_loss": -40.55253219604492, "global_step": 120587, "epoch": 996} {"train_loss": -39.953765869140625, "global_step": 120588, "epoch": 996} {"train_loss": -39.90402603149414, "global_step": 120589, "epoch": 996} {"train_loss": -40.285552978515625, "global_step": 120590, "epoch": 996} {"train_loss": -39.78593444824219, "global_step": 120591, "epoch": 996} {"train_loss": -40.3731803894043, "global_step": 120592, "epoch": 996} {"train_loss": -39.327056884765625, "global_step": 120593, "epoch": 996} {"train_loss": -35.1043815612793, "global_step": 120594, "epoch": 996} {"train_loss": -29.99879264831543, "global_step": 120595, "epoch": 996} {"train_loss": -21.760183334350586, "global_step": 120596, "epoch": 996} {"train_loss": -1.4434922933578491, "global_step": 120597, "epoch": 996} {"train_loss": -27.476184844970703, "global_step": 120598, "epoch": 996} {"train_loss": -36.45046615600586, "global_step": 120599, "epoch": 996} {"train_loss": -27.392873764038086, "global_step": 120600, "epoch": 996} {"train_loss": -38.363468170166016, "global_step": 120601, "epoch": 996} {"train_loss": -32.09584426879883, "global_step": 120602, "epoch": 996} {"train_loss": -37.861759185791016, "global_step": 120603, "epoch": 996} {"train_loss": -33.18399429321289, "global_step": 120604, "epoch": 996} {"train_loss": -38.74858474731445, "global_step": 120605, "epoch": 996} {"train_loss": -36.40485763549805, "global_step": 120606, "epoch": 996} {"train_loss": -37.805965423583984, "global_step": 120607, "epoch": 996} {"train_loss": -38.36934280395508, "global_step": 120608, "epoch": 996} {"train_loss": -38.02307891845703, "global_step": 120609, "epoch": 996} {"train_loss": -36.92995834350586, "global_step": 120610, "epoch": 996} {"train_loss": -37.852569580078125, "global_step": 120611, "epoch": 996} {"train_loss": -38.17068099975586, "global_step": 120612, "epoch": 996} {"train_loss": -38.39339828491211, "global_step": 120613, "epoch": 996} {"train_loss": -38.4262580871582, "global_step": 120614, "epoch": 996} {"train_loss": -38.46430587768555, "global_step": 120615, "epoch": 996} {"train_loss": -38.17875289916992, "global_step": 120616, "epoch": 996} {"train_loss": -38.22990036010742, "global_step": 120617, "epoch": 996} {"train_loss": -39.05537033081055, "global_step": 120618, "epoch": 996} {"train_loss": -38.69110870361328, "global_step": 120619, "epoch": 996} {"train_loss": -39.281463623046875, "global_step": 120620, "epoch": 996} {"train_loss": -38.62223434448242, "global_step": 120621, "epoch": 996} {"train_loss": -37.771484375, "global_step": 120622, "epoch": 996} {"train_loss": -39.11499786376953, "global_step": 120623, "epoch": 996} {"train_loss": -38.89030075073242, "global_step": 120624, "epoch": 996} {"train_loss": -38.596961975097656, "global_step": 120625, "epoch": 996} {"train_loss": -39.49573516845703, "global_step": 120626, "epoch": 996} {"train_loss": -39.06949996948242, "global_step": 120627, "epoch": 996} {"train_loss": -38.445125579833984, "global_step": 120628, "epoch": 996} {"train_loss": -38.94481658935547, "global_step": 120629, "epoch": 996} {"train_loss": -39.046016693115234, "global_step": 120630, "epoch": 996} {"train_loss": -38.95119857788086, "global_step": 120631, "epoch": 996} {"train_loss": -39.32197952270508, "global_step": 120632, "epoch": 996} {"train_loss": -39.913753509521484, "global_step": 120633, "epoch": 996} {"train_loss": -38.95023727416992, "global_step": 120634, "epoch": 996} {"train_loss": -39.63975143432617, "global_step": 120635, "epoch": 996} {"train_loss": -38.102159242984676, "global_step": 120636, "epoch": 996, "val_loss": 2781085.75} {"train_loss": -39.745643615722656, "global_step": 120637, "epoch": 997} {"train_loss": -39.389183044433594, "global_step": 120638, "epoch": 997} {"train_loss": -39.784461975097656, "global_step": 120639, "epoch": 997} {"train_loss": -39.34627914428711, "global_step": 120640, "epoch": 997} {"train_loss": -39.861000061035156, "global_step": 120641, "epoch": 997} {"train_loss": -39.9734992980957, "global_step": 120642, "epoch": 997} {"train_loss": -39.540992736816406, "global_step": 120643, "epoch": 997} {"train_loss": -39.80436325073242, "global_step": 120644, "epoch": 997} {"train_loss": -40.257755279541016, "global_step": 120645, "epoch": 997} {"train_loss": -40.03945541381836, "global_step": 120646, "epoch": 997} {"train_loss": -39.95090866088867, "global_step": 120647, "epoch": 997} {"train_loss": -40.28963088989258, "global_step": 120648, "epoch": 997} {"train_loss": -40.31572341918945, "global_step": 120649, "epoch": 997} {"train_loss": -40.386470794677734, "global_step": 120650, "epoch": 997} {"train_loss": -40.194366455078125, "global_step": 120651, "epoch": 997} {"train_loss": -40.091121673583984, "global_step": 120652, "epoch": 997} {"train_loss": -38.935150146484375, "global_step": 120653, "epoch": 997} {"train_loss": -40.2655143737793, "global_step": 120654, "epoch": 997} {"train_loss": -40.04035186767578, "global_step": 120655, "epoch": 997} {"train_loss": -40.58198928833008, "global_step": 120656, "epoch": 997} {"train_loss": -39.95359802246094, "global_step": 120657, "epoch": 997} {"train_loss": -40.190834045410156, "global_step": 120658, "epoch": 997} {"train_loss": -40.05634307861328, "global_step": 120659, "epoch": 997} {"train_loss": -39.6412467956543, "global_step": 120660, "epoch": 997} {"train_loss": -40.26665115356445, "global_step": 120661, "epoch": 997} {"train_loss": -37.6993293762207, "global_step": 120662, "epoch": 997} {"train_loss": -38.804534912109375, "global_step": 120663, "epoch": 997} {"train_loss": -36.692039489746094, "global_step": 120664, "epoch": 997} {"train_loss": -39.04656982421875, "global_step": 120665, "epoch": 997} {"train_loss": -37.86775588989258, "global_step": 120666, "epoch": 997} {"train_loss": -37.95869064331055, "global_step": 120667, "epoch": 997} {"train_loss": -37.02229690551758, "global_step": 120668, "epoch": 997} {"train_loss": -33.12350082397461, "global_step": 120669, "epoch": 997} {"train_loss": -19.336824417114258, "global_step": 120670, "epoch": 997} {"train_loss": -1.876551866531372, "global_step": 120671, "epoch": 997} {"train_loss": -29.111581802368164, "global_step": 120672, "epoch": 997} {"train_loss": -31.577716827392578, "global_step": 120673, "epoch": 997} {"train_loss": -21.568828582763672, "global_step": 120674, "epoch": 997} {"train_loss": -34.511287689208984, "global_step": 120675, "epoch": 997} {"train_loss": -27.78278160095215, "global_step": 120676, "epoch": 997} {"train_loss": -32.376956939697266, "global_step": 120677, "epoch": 997} {"train_loss": -31.377002716064453, "global_step": 120678, "epoch": 997} {"train_loss": -34.51791763305664, "global_step": 120679, "epoch": 997} {"train_loss": -29.64609718322754, "global_step": 120680, "epoch": 997} {"train_loss": -34.782657623291016, "global_step": 120681, "epoch": 997} {"train_loss": -37.07558822631836, "global_step": 120682, "epoch": 997} {"train_loss": -32.771175384521484, "global_step": 120683, "epoch": 997} {"train_loss": -37.35530471801758, "global_step": 120684, "epoch": 997} {"train_loss": -35.57651901245117, "global_step": 120685, "epoch": 997} {"train_loss": -31.5933837890625, "global_step": 120686, "epoch": 997} {"train_loss": -36.987369537353516, "global_step": 120687, "epoch": 997} {"train_loss": -36.46314239501953, "global_step": 120688, "epoch": 997} {"train_loss": -36.05830764770508, "global_step": 120689, "epoch": 997} {"train_loss": -37.54862976074219, "global_step": 120690, "epoch": 997} {"train_loss": -36.215576171875, "global_step": 120691, "epoch": 997} {"train_loss": -37.0458869934082, "global_step": 120692, "epoch": 997} {"train_loss": -36.5415153503418, "global_step": 120693, "epoch": 997} {"train_loss": -37.30755615234375, "global_step": 120694, "epoch": 997} {"train_loss": -37.534420013427734, "global_step": 120695, "epoch": 997} {"train_loss": -37.103363037109375, "global_step": 120696, "epoch": 997} {"train_loss": -37.883113861083984, "global_step": 120697, "epoch": 997} {"train_loss": -38.318809509277344, "global_step": 120698, "epoch": 997} {"train_loss": -37.69133377075195, "global_step": 120699, "epoch": 997} {"train_loss": -37.84162139892578, "global_step": 120700, "epoch": 997} {"train_loss": -37.924407958984375, "global_step": 120701, "epoch": 997} {"train_loss": -37.97990036010742, "global_step": 120702, "epoch": 997} {"train_loss": -38.09674835205078, "global_step": 120703, "epoch": 997} {"train_loss": -38.3190803527832, "global_step": 120704, "epoch": 997} {"train_loss": -38.6351203918457, "global_step": 120705, "epoch": 997} {"train_loss": -36.9206657409668, "global_step": 120706, "epoch": 997} {"train_loss": -38.084075927734375, "global_step": 120707, "epoch": 997} {"train_loss": -38.020626068115234, "global_step": 120708, "epoch": 997} {"train_loss": -38.639686584472656, "global_step": 120709, "epoch": 997} {"train_loss": -38.30100631713867, "global_step": 120710, "epoch": 997} {"train_loss": -38.760276794433594, "global_step": 120711, "epoch": 997} {"train_loss": -38.8291130065918, "global_step": 120712, "epoch": 997} {"train_loss": -38.819095611572266, "global_step": 120713, "epoch": 997} {"train_loss": -38.805381774902344, "global_step": 120714, "epoch": 997} {"train_loss": -38.87047576904297, "global_step": 120715, "epoch": 997} {"train_loss": -38.585018157958984, "global_step": 120716, "epoch": 997} {"train_loss": -39.24113845825195, "global_step": 120717, "epoch": 997} {"train_loss": -38.9107780456543, "global_step": 120718, "epoch": 997} {"train_loss": -38.82133102416992, "global_step": 120719, "epoch": 997} {"train_loss": -39.13484573364258, "global_step": 120720, "epoch": 997} {"train_loss": -38.9510612487793, "global_step": 120721, "epoch": 997} {"train_loss": -39.141292572021484, "global_step": 120722, "epoch": 997} {"train_loss": -38.73505783081055, "global_step": 120723, "epoch": 997} {"train_loss": -39.307430267333984, "global_step": 120724, "epoch": 997} {"train_loss": -39.21775436401367, "global_step": 120725, "epoch": 997} {"train_loss": -39.45321273803711, "global_step": 120726, "epoch": 997} {"train_loss": -39.471435546875, "global_step": 120727, "epoch": 997} {"train_loss": -39.31714630126953, "global_step": 120728, "epoch": 997} {"train_loss": -39.19834518432617, "global_step": 120729, "epoch": 997} {"train_loss": -39.24140548706055, "global_step": 120730, "epoch": 997} {"train_loss": -39.46192169189453, "global_step": 120731, "epoch": 997} {"train_loss": -39.34521484375, "global_step": 120732, "epoch": 997} {"train_loss": -39.08195114135742, "global_step": 120733, "epoch": 997} {"train_loss": -39.623836517333984, "global_step": 120734, "epoch": 997} {"train_loss": -39.56657791137695, "global_step": 120735, "epoch": 997} {"train_loss": -39.69132614135742, "global_step": 120736, "epoch": 997} {"train_loss": -39.05367660522461, "global_step": 120737, "epoch": 997} {"train_loss": -39.22487258911133, "global_step": 120738, "epoch": 997} {"train_loss": -39.19865036010742, "global_step": 120739, "epoch": 997} {"train_loss": -39.35829544067383, "global_step": 120740, "epoch": 997} {"train_loss": -39.155975341796875, "global_step": 120741, "epoch": 997} {"train_loss": -39.36897659301758, "global_step": 120742, "epoch": 997} {"train_loss": -39.56925582885742, "global_step": 120743, "epoch": 997} {"train_loss": -39.527626037597656, "global_step": 120744, "epoch": 997} {"train_loss": -39.91847610473633, "global_step": 120745, "epoch": 997} {"train_loss": -38.27119827270508, "global_step": 120746, "epoch": 997} {"train_loss": -38.96668243408203, "global_step": 120747, "epoch": 997} {"train_loss": -39.75834274291992, "global_step": 120748, "epoch": 997} {"train_loss": -39.6106071472168, "global_step": 120749, "epoch": 997} {"train_loss": -39.485347747802734, "global_step": 120750, "epoch": 997} {"train_loss": -39.964229583740234, "global_step": 120751, "epoch": 997} {"train_loss": -39.9704704284668, "global_step": 120752, "epoch": 997} {"train_loss": -39.757049560546875, "global_step": 120753, "epoch": 997} {"train_loss": -39.97915267944336, "global_step": 120754, "epoch": 997} {"train_loss": -39.55659103393555, "global_step": 120755, "epoch": 997} {"train_loss": -38.88359069824219, "global_step": 120756, "epoch": 997} {"train_loss": -37.56686167480532, "global_step": 120757, "epoch": 997, "val_loss": 2708524.75} {"train_loss": -39.21613693237305, "global_step": 120758, "epoch": 998} {"train_loss": -40.02996826171875, "global_step": 120759, "epoch": 998} {"train_loss": -39.786537170410156, "global_step": 120760, "epoch": 998} {"train_loss": -38.42823028564453, "global_step": 120761, "epoch": 998} {"train_loss": -37.83681869506836, "global_step": 120762, "epoch": 998} {"train_loss": -37.23432922363281, "global_step": 120763, "epoch": 998} {"train_loss": -38.675689697265625, "global_step": 120764, "epoch": 998} {"train_loss": -39.250728607177734, "global_step": 120765, "epoch": 998} {"train_loss": -39.20018768310547, "global_step": 120766, "epoch": 998} {"train_loss": -38.45549392700195, "global_step": 120767, "epoch": 998} {"train_loss": -38.3015251159668, "global_step": 120768, "epoch": 998} {"train_loss": -38.48768997192383, "global_step": 120769, "epoch": 998} {"train_loss": -39.003143310546875, "global_step": 120770, "epoch": 998} {"train_loss": -37.79366683959961, "global_step": 120771, "epoch": 998} {"train_loss": -39.59682846069336, "global_step": 120772, "epoch": 998} {"train_loss": -38.536739349365234, "global_step": 120773, "epoch": 998} {"train_loss": -38.46249008178711, "global_step": 120774, "epoch": 998} {"train_loss": -39.48737716674805, "global_step": 120775, "epoch": 998} {"train_loss": -39.106109619140625, "global_step": 120776, "epoch": 998} {"train_loss": -39.120582580566406, "global_step": 120777, "epoch": 998} {"train_loss": -38.44470977783203, "global_step": 120778, "epoch": 998} {"train_loss": -39.91636276245117, "global_step": 120779, "epoch": 998} {"train_loss": -39.01416778564453, "global_step": 120780, "epoch": 998} {"train_loss": -38.67142868041992, "global_step": 120781, "epoch": 998} {"train_loss": -39.529781341552734, "global_step": 120782, "epoch": 998} {"train_loss": -38.69287872314453, "global_step": 120783, "epoch": 998} {"train_loss": -38.903263092041016, "global_step": 120784, "epoch": 998} {"train_loss": -39.3781852722168, "global_step": 120785, "epoch": 998} {"train_loss": -39.257484436035156, "global_step": 120786, "epoch": 998} {"train_loss": -38.26975631713867, "global_step": 120787, "epoch": 998} {"train_loss": -39.18045425415039, "global_step": 120788, "epoch": 998} {"train_loss": -39.30731964111328, "global_step": 120789, "epoch": 998} {"train_loss": -38.26015853881836, "global_step": 120790, "epoch": 998} {"train_loss": -38.75078582763672, "global_step": 120791, "epoch": 998} {"train_loss": -39.48086166381836, "global_step": 120792, "epoch": 998} {"train_loss": -39.350067138671875, "global_step": 120793, "epoch": 998} {"train_loss": -39.33332443237305, "global_step": 120794, "epoch": 998} {"train_loss": -38.73541259765625, "global_step": 120795, "epoch": 998} {"train_loss": -38.831939697265625, "global_step": 120796, "epoch": 998} {"train_loss": -39.434749603271484, "global_step": 120797, "epoch": 998} {"train_loss": -38.932464599609375, "global_step": 120798, "epoch": 998} {"train_loss": -39.74638748168945, "global_step": 120799, "epoch": 998} {"train_loss": -39.3983268737793, "global_step": 120800, "epoch": 998} {"train_loss": -39.49516296386719, "global_step": 120801, "epoch": 998} {"train_loss": -39.386383056640625, "global_step": 120802, "epoch": 998} {"train_loss": -39.121524810791016, "global_step": 120803, "epoch": 998} {"train_loss": -39.81230926513672, "global_step": 120804, "epoch": 998} {"train_loss": -38.134803771972656, "global_step": 120805, "epoch": 998} {"train_loss": -38.945796966552734, "global_step": 120806, "epoch": 998} {"train_loss": -39.81406021118164, "global_step": 120807, "epoch": 998} {"train_loss": -38.74038314819336, "global_step": 120808, "epoch": 998} {"train_loss": -39.90613555908203, "global_step": 120809, "epoch": 998} {"train_loss": -39.479103088378906, "global_step": 120810, "epoch": 998} {"train_loss": -38.49949264526367, "global_step": 120811, "epoch": 998} {"train_loss": -39.4867057800293, "global_step": 120812, "epoch": 998} {"train_loss": -38.6478157043457, "global_step": 120813, "epoch": 998} {"train_loss": -37.93308639526367, "global_step": 120814, "epoch": 998} {"train_loss": -33.97296142578125, "global_step": 120815, "epoch": 998} {"train_loss": -34.263458251953125, "global_step": 120816, "epoch": 998} {"train_loss": -37.02370071411133, "global_step": 120817, "epoch": 998} {"train_loss": -38.72825241088867, "global_step": 120818, "epoch": 998} {"train_loss": -39.550453186035156, "global_step": 120819, "epoch": 998} {"train_loss": -38.962852478027344, "global_step": 120820, "epoch": 998} {"train_loss": -36.99372863769531, "global_step": 120821, "epoch": 998} {"train_loss": -35.58368682861328, "global_step": 120822, "epoch": 998} {"train_loss": -37.33937072753906, "global_step": 120823, "epoch": 998} {"train_loss": -37.6156120300293, "global_step": 120824, "epoch": 998} {"train_loss": -39.68752670288086, "global_step": 120825, "epoch": 998} {"train_loss": -37.50225830078125, "global_step": 120826, "epoch": 998} {"train_loss": -37.205474853515625, "global_step": 120827, "epoch": 998} {"train_loss": -38.162696838378906, "global_step": 120828, "epoch": 998} {"train_loss": -39.619930267333984, "global_step": 120829, "epoch": 998} {"train_loss": -39.32808303833008, "global_step": 120830, "epoch": 998} {"train_loss": -39.1214714050293, "global_step": 120831, "epoch": 998} {"train_loss": -39.60942840576172, "global_step": 120832, "epoch": 998} {"train_loss": -39.63593292236328, "global_step": 120833, "epoch": 998} {"train_loss": -39.29358673095703, "global_step": 120834, "epoch": 998} {"train_loss": -38.40752029418945, "global_step": 120835, "epoch": 998} {"train_loss": -39.24505615234375, "global_step": 120836, "epoch": 998} {"train_loss": -39.5406608581543, "global_step": 120837, "epoch": 998} {"train_loss": -38.5914192199707, "global_step": 120838, "epoch": 998} {"train_loss": -39.470314025878906, "global_step": 120839, "epoch": 998} {"train_loss": -39.871707916259766, "global_step": 120840, "epoch": 998} {"train_loss": -39.24025344848633, "global_step": 120841, "epoch": 998} {"train_loss": -39.61281204223633, "global_step": 120842, "epoch": 998} {"train_loss": -39.62369918823242, "global_step": 120843, "epoch": 998} {"train_loss": -39.09063720703125, "global_step": 120844, "epoch": 998} {"train_loss": -40.11080551147461, "global_step": 120845, "epoch": 998} {"train_loss": -39.4484977722168, "global_step": 120846, "epoch": 998} {"train_loss": -38.84173583984375, "global_step": 120847, "epoch": 998} {"train_loss": -38.97658920288086, "global_step": 120848, "epoch": 998} {"train_loss": -39.61765670776367, "global_step": 120849, "epoch": 998} {"train_loss": -39.384979248046875, "global_step": 120850, "epoch": 998} {"train_loss": -39.00800704956055, "global_step": 120851, "epoch": 998} {"train_loss": -39.64337158203125, "global_step": 120852, "epoch": 998} {"train_loss": -37.462528228759766, "global_step": 120853, "epoch": 998} {"train_loss": -38.623809814453125, "global_step": 120854, "epoch": 998} {"train_loss": -37.640052795410156, "global_step": 120855, "epoch": 998} {"train_loss": -39.586212158203125, "global_step": 120856, "epoch": 998} {"train_loss": -39.52294921875, "global_step": 120857, "epoch": 998} {"train_loss": -37.697967529296875, "global_step": 120858, "epoch": 998} {"train_loss": -39.37075424194336, "global_step": 120859, "epoch": 998} {"train_loss": -39.49787139892578, "global_step": 120860, "epoch": 998} {"train_loss": -37.29114532470703, "global_step": 120861, "epoch": 998} {"train_loss": -38.379676818847656, "global_step": 120862, "epoch": 998} {"train_loss": -36.88267135620117, "global_step": 120863, "epoch": 998} {"train_loss": -37.87137985229492, "global_step": 120864, "epoch": 998} {"train_loss": -39.19139862060547, "global_step": 120865, "epoch": 998} {"train_loss": -37.59709548950195, "global_step": 120866, "epoch": 998} {"train_loss": -37.36217498779297, "global_step": 120867, "epoch": 998} {"train_loss": -35.87107849121094, "global_step": 120868, "epoch": 998} {"train_loss": -35.25397491455078, "global_step": 120869, "epoch": 998} {"train_loss": -38.40896224975586, "global_step": 120870, "epoch": 998} {"train_loss": -37.467079162597656, "global_step": 120871, "epoch": 998} {"train_loss": -37.42964172363281, "global_step": 120872, "epoch": 998} {"train_loss": -38.50513458251953, "global_step": 120873, "epoch": 998} {"train_loss": -34.949134826660156, "global_step": 120874, "epoch": 998} {"train_loss": -36.863895416259766, "global_step": 120875, "epoch": 998} {"train_loss": -38.18992233276367, "global_step": 120876, "epoch": 998} {"train_loss": -30.379257202148438, "global_step": 120877, "epoch": 998} {"train_loss": -38.53659707061515, "global_step": 120878, "epoch": 998, "val_loss": 2720470.75} {"train_loss": -35.48317337036133, "global_step": 120879, "epoch": 999} {"train_loss": -34.657257080078125, "global_step": 120880, "epoch": 999} {"train_loss": -34.09407424926758, "global_step": 120881, "epoch": 999} {"train_loss": -37.87861251831055, "global_step": 120882, "epoch": 999} {"train_loss": -36.21712112426758, "global_step": 120883, "epoch": 999} {"train_loss": -35.81815719604492, "global_step": 120884, "epoch": 999} {"train_loss": -34.547882080078125, "global_step": 120885, "epoch": 999} {"train_loss": -35.819488525390625, "global_step": 120886, "epoch": 999} {"train_loss": -36.78865432739258, "global_step": 120887, "epoch": 999} {"train_loss": -37.38743591308594, "global_step": 120888, "epoch": 999} {"train_loss": -36.94921112060547, "global_step": 120889, "epoch": 999} {"train_loss": -36.91840744018555, "global_step": 120890, "epoch": 999} {"train_loss": -36.14701461791992, "global_step": 120891, "epoch": 999} {"train_loss": -38.83308792114258, "global_step": 120892, "epoch": 999} {"train_loss": -38.56443405151367, "global_step": 120893, "epoch": 999} {"train_loss": -37.26290512084961, "global_step": 120894, "epoch": 999} {"train_loss": -37.22265625, "global_step": 120895, "epoch": 999} {"train_loss": -38.76123046875, "global_step": 120896, "epoch": 999} {"train_loss": -37.50263595581055, "global_step": 120897, "epoch": 999} {"train_loss": -38.74394226074219, "global_step": 120898, "epoch": 999} {"train_loss": -38.29133224487305, "global_step": 120899, "epoch": 999} {"train_loss": -38.42107391357422, "global_step": 120900, "epoch": 999} {"train_loss": -38.479408264160156, "global_step": 120901, "epoch": 999} {"train_loss": -37.94168472290039, "global_step": 120902, "epoch": 999} {"train_loss": -38.452239990234375, "global_step": 120903, "epoch": 999} {"train_loss": -38.305870056152344, "global_step": 120904, "epoch": 999} {"train_loss": -38.63261032104492, "global_step": 120905, "epoch": 999} {"train_loss": -38.658470153808594, "global_step": 120906, "epoch": 999} {"train_loss": -38.583984375, "global_step": 120907, "epoch": 999} {"train_loss": -38.57752990722656, "global_step": 120908, "epoch": 999} {"train_loss": -39.07373046875, "global_step": 120909, "epoch": 999} {"train_loss": -38.3499755859375, "global_step": 120910, "epoch": 999} {"train_loss": -38.87439727783203, "global_step": 120911, "epoch": 999} {"train_loss": -39.30375289916992, "global_step": 120912, "epoch": 999} {"train_loss": -39.111934661865234, "global_step": 120913, "epoch": 999} {"train_loss": -39.11118698120117, "global_step": 120914, "epoch": 999} {"train_loss": -39.07302474975586, "global_step": 120915, "epoch": 999} {"train_loss": -39.58697509765625, "global_step": 120916, "epoch": 999} {"train_loss": -39.77052688598633, "global_step": 120917, "epoch": 999} {"train_loss": -39.301448822021484, "global_step": 120918, "epoch": 999} {"train_loss": -39.7142448425293, "global_step": 120919, "epoch": 999} {"train_loss": -39.496009826660156, "global_step": 120920, "epoch": 999} {"train_loss": -39.70225143432617, "global_step": 120921, "epoch": 999} {"train_loss": -39.56561279296875, "global_step": 120922, "epoch": 999} {"train_loss": -38.89496612548828, "global_step": 120923, "epoch": 999} {"train_loss": -39.08271408081055, "global_step": 120924, "epoch": 999} {"train_loss": -39.765419006347656, "global_step": 120925, "epoch": 999} {"train_loss": -39.58408737182617, "global_step": 120926, "epoch": 999} {"train_loss": -39.36879348754883, "global_step": 120927, "epoch": 999} {"train_loss": -39.848384857177734, "global_step": 120928, "epoch": 999} {"train_loss": -39.29584503173828, "global_step": 120929, "epoch": 999} {"train_loss": -40.017181396484375, "global_step": 120930, "epoch": 999} {"train_loss": -39.16897201538086, "global_step": 120931, "epoch": 999} {"train_loss": -40.07743453979492, "global_step": 120932, "epoch": 999} {"train_loss": -39.819122314453125, "global_step": 120933, "epoch": 999} {"train_loss": -39.78257369995117, "global_step": 120934, "epoch": 999} {"train_loss": -40.06187057495117, "global_step": 120935, "epoch": 999} {"train_loss": -39.74102783203125, "global_step": 120936, "epoch": 999} {"train_loss": -40.38021469116211, "global_step": 120937, "epoch": 999} {"train_loss": -39.978118896484375, "global_step": 120938, "epoch": 999} {"train_loss": -39.74506759643555, "global_step": 120939, "epoch": 999} {"train_loss": -40.384559631347656, "global_step": 120940, "epoch": 999} {"train_loss": -39.966552734375, "global_step": 120941, "epoch": 999} {"train_loss": -40.22646713256836, "global_step": 120942, "epoch": 999} {"train_loss": -39.239112854003906, "global_step": 120943, "epoch": 999} {"train_loss": -38.27009201049805, "global_step": 120944, "epoch": 999} {"train_loss": -38.87623596191406, "global_step": 120945, "epoch": 999} {"train_loss": -37.61356735229492, "global_step": 120946, "epoch": 999} {"train_loss": -37.394378662109375, "global_step": 120947, "epoch": 999} {"train_loss": -38.48971176147461, "global_step": 120948, "epoch": 999} {"train_loss": -39.799007415771484, "global_step": 120949, "epoch": 999} {"train_loss": -38.14799880981445, "global_step": 120950, "epoch": 999} {"train_loss": -37.39703369140625, "global_step": 120951, "epoch": 999} {"train_loss": -40.219974517822266, "global_step": 120952, "epoch": 999} {"train_loss": -37.59072494506836, "global_step": 120953, "epoch": 999} {"train_loss": -37.43556213378906, "global_step": 120954, "epoch": 999} {"train_loss": -39.36869812011719, "global_step": 120955, "epoch": 999} {"train_loss": -37.20230484008789, "global_step": 120956, "epoch": 999} {"train_loss": -39.978675842285156, "global_step": 120957, "epoch": 999} {"train_loss": -37.08930587768555, "global_step": 120958, "epoch": 999} {"train_loss": -39.208980560302734, "global_step": 120959, "epoch": 999} {"train_loss": -37.62998580932617, "global_step": 120960, "epoch": 999} {"train_loss": -39.07149124145508, "global_step": 120961, "epoch": 999} {"train_loss": -38.131649017333984, "global_step": 120962, "epoch": 999} {"train_loss": -38.929683685302734, "global_step": 120963, "epoch": 999} {"train_loss": -39.32070541381836, "global_step": 120964, "epoch": 999} {"train_loss": -38.31063461303711, "global_step": 120965, "epoch": 999} {"train_loss": -39.393531799316406, "global_step": 120966, "epoch": 999} {"train_loss": -38.16744613647461, "global_step": 120967, "epoch": 999} {"train_loss": -39.785369873046875, "global_step": 120968, "epoch": 999} {"train_loss": -38.8001708984375, "global_step": 120969, "epoch": 999} {"train_loss": -39.36812973022461, "global_step": 120970, "epoch": 999} {"train_loss": -38.535823822021484, "global_step": 120971, "epoch": 999} {"train_loss": -38.55119705200195, "global_step": 120972, "epoch": 999} {"train_loss": -39.85847091674805, "global_step": 120973, "epoch": 999} {"train_loss": -38.36280822753906, "global_step": 120974, "epoch": 999} {"train_loss": -37.5304069519043, "global_step": 120975, "epoch": 999} {"train_loss": -37.91974639892578, "global_step": 120976, "epoch": 999} {"train_loss": -35.597267150878906, "global_step": 120977, "epoch": 999} {"train_loss": -39.07365036010742, "global_step": 120978, "epoch": 999} {"train_loss": -35.415775299072266, "global_step": 120979, "epoch": 999} {"train_loss": -34.807525634765625, "global_step": 120980, "epoch": 999} {"train_loss": -36.58534622192383, "global_step": 120981, "epoch": 999} {"train_loss": -35.24071502685547, "global_step": 120982, "epoch": 999} {"train_loss": -35.43959045410156, "global_step": 120983, "epoch": 999} {"train_loss": -36.07215881347656, "global_step": 120984, "epoch": 999} {"train_loss": -36.4248046875, "global_step": 120985, "epoch": 999} {"train_loss": -36.00089645385742, "global_step": 120986, "epoch": 999} {"train_loss": -36.224403381347656, "global_step": 120987, "epoch": 999} {"train_loss": -37.034759521484375, "global_step": 120988, "epoch": 999} {"train_loss": -35.349849700927734, "global_step": 120989, "epoch": 999} {"train_loss": -37.398677825927734, "global_step": 120990, "epoch": 999} {"train_loss": -37.40011215209961, "global_step": 120991, "epoch": 999} {"train_loss": -36.08180236816406, "global_step": 120992, "epoch": 999} {"train_loss": -37.89970016479492, "global_step": 120993, "epoch": 999} {"train_loss": -36.10268783569336, "global_step": 120994, "epoch": 999} {"train_loss": -37.38913345336914, "global_step": 120995, "epoch": 999} {"train_loss": -37.55210494995117, "global_step": 120996, "epoch": 999} {"train_loss": -37.32040023803711, "global_step": 120997, "epoch": 999} {"train_loss": -38.072017669677734, "global_step": 120998, "epoch": 999} {"train_loss": -38.14314143913837, "global_step": 120999, "epoch": 999, "val_loss": 2695149.0} {"train_loss": -38.34872817993164, "global_step": 121000, "epoch": 1000} {"train_loss": -36.93043899536133, "global_step": 121001, "epoch": 1000} {"train_loss": -37.48238754272461, "global_step": 121002, "epoch": 1000} {"train_loss": -39.25351333618164, "global_step": 121003, "epoch": 1000} {"train_loss": -38.054691314697266, "global_step": 121004, "epoch": 1000} {"train_loss": -38.2693977355957, "global_step": 121005, "epoch": 1000} {"train_loss": -38.93124771118164, "global_step": 121006, "epoch": 1000} {"train_loss": -38.60174560546875, "global_step": 121007, "epoch": 1000} {"train_loss": -38.92240905761719, "global_step": 121008, "epoch": 1000} {"train_loss": -39.073463439941406, "global_step": 121009, "epoch": 1000} {"train_loss": -39.33414077758789, "global_step": 121010, "epoch": 1000} {"train_loss": -39.46401596069336, "global_step": 121011, "epoch": 1000} {"train_loss": -39.63749313354492, "global_step": 121012, "epoch": 1000} {"train_loss": -39.578125, "global_step": 121013, "epoch": 1000} {"train_loss": -40.03175735473633, "global_step": 121014, "epoch": 1000} {"train_loss": -39.57775115966797, "global_step": 121015, "epoch": 1000} {"train_loss": -39.8033447265625, "global_step": 121016, "epoch": 1000} {"train_loss": -39.623146057128906, "global_step": 121017, "epoch": 1000} {"train_loss": -39.34420394897461, "global_step": 121018, "epoch": 1000} {"train_loss": -39.571990966796875, "global_step": 121019, "epoch": 1000} {"train_loss": -39.98310089111328, "global_step": 121020, "epoch": 1000} {"train_loss": -39.6684455871582, "global_step": 121021, "epoch": 1000} {"train_loss": -39.553802490234375, "global_step": 121022, "epoch": 1000} {"train_loss": -39.6902961730957, "global_step": 121023, "epoch": 1000} {"train_loss": -39.8526496887207, "global_step": 121024, "epoch": 1000} {"train_loss": -39.916587829589844, "global_step": 121025, "epoch": 1000} {"train_loss": -39.79201126098633, "global_step": 121026, "epoch": 1000} {"train_loss": -39.92263412475586, "global_step": 121027, "epoch": 1000} {"train_loss": -39.862457275390625, "global_step": 121028, "epoch": 1000} {"train_loss": -39.53974914550781, "global_step": 121029, "epoch": 1000} {"train_loss": -39.45380783081055, "global_step": 121030, "epoch": 1000} {"train_loss": -39.6296272277832, "global_step": 121031, "epoch": 1000} {"train_loss": -40.328983306884766, "global_step": 121032, "epoch": 1000} {"train_loss": -39.2592658996582, "global_step": 121033, "epoch": 1000} {"train_loss": -40.25675582885742, "global_step": 121034, "epoch": 1000} {"train_loss": -40.64265441894531, "global_step": 121035, "epoch": 1000} {"train_loss": -40.00490951538086, "global_step": 121036, "epoch": 1000} {"train_loss": -38.02485275268555, "global_step": 121037, "epoch": 1000} {"train_loss": -40.00746536254883, "global_step": 121038, "epoch": 1000} {"train_loss": -40.148067474365234, "global_step": 121039, "epoch": 1000} {"train_loss": -38.62480545043945, "global_step": 121040, "epoch": 1000} {"train_loss": -39.31317901611328, "global_step": 121041, "epoch": 1000} {"train_loss": -40.3619384765625, "global_step": 121042, "epoch": 1000} {"train_loss": -40.34281921386719, "global_step": 121043, "epoch": 1000} {"train_loss": -39.63886642456055, "global_step": 121044, "epoch": 1000} {"train_loss": -40.60966491699219, "global_step": 121045, "epoch": 1000} {"train_loss": -40.17431640625, "global_step": 121046, "epoch": 1000} {"train_loss": -39.693359375, "global_step": 121047, "epoch": 1000} {"train_loss": -40.4625129699707, "global_step": 121048, "epoch": 1000} {"train_loss": -40.331966400146484, "global_step": 121049, "epoch": 1000} {"train_loss": -39.83641052246094, "global_step": 121050, "epoch": 1000} {"train_loss": -40.377010345458984, "global_step": 121051, "epoch": 1000} {"train_loss": -39.91084671020508, "global_step": 121052, "epoch": 1000} {"train_loss": -40.54036331176758, "global_step": 121053, "epoch": 1000} {"train_loss": -40.53067398071289, "global_step": 121054, "epoch": 1000} {"train_loss": -40.434444427490234, "global_step": 121055, "epoch": 1000} {"train_loss": -40.838314056396484, "global_step": 121056, "epoch": 1000} {"train_loss": -40.59358596801758, "global_step": 121057, "epoch": 1000} {"train_loss": -39.98542022705078, "global_step": 121058, "epoch": 1000} {"train_loss": -39.669734954833984, "global_step": 121059, "epoch": 1000} {"train_loss": -39.102928161621094, "global_step": 121060, "epoch": 1000} {"train_loss": -39.0509033203125, "global_step": 121061, "epoch": 1000} {"train_loss": -39.90128707885742, "global_step": 121062, "epoch": 1000} {"train_loss": -40.61511993408203, "global_step": 121063, "epoch": 1000} {"train_loss": -40.892452239990234, "global_step": 121064, "epoch": 1000} {"train_loss": -40.66598129272461, "global_step": 121065, "epoch": 1000} {"train_loss": -39.79594802856445, "global_step": 121066, "epoch": 1000} {"train_loss": -39.96841049194336, "global_step": 121067, "epoch": 1000} {"train_loss": -40.748958587646484, "global_step": 121068, "epoch": 1000} {"train_loss": -40.40753173828125, "global_step": 121069, "epoch": 1000} {"train_loss": -39.898677825927734, "global_step": 121070, "epoch": 1000} {"train_loss": -40.52404022216797, "global_step": 121071, "epoch": 1000} {"train_loss": -40.4870491027832, "global_step": 121072, "epoch": 1000} {"train_loss": -40.638919830322266, "global_step": 121073, "epoch": 1000} {"train_loss": -40.64434814453125, "global_step": 121074, "epoch": 1000} {"train_loss": -40.23556137084961, "global_step": 121075, "epoch": 1000} {"train_loss": -40.819000244140625, "global_step": 121076, "epoch": 1000} {"train_loss": -40.31333541870117, "global_step": 121077, "epoch": 1000} {"train_loss": -39.576377868652344, "global_step": 121078, "epoch": 1000} {"train_loss": -39.91877365112305, "global_step": 121079, "epoch": 1000} {"train_loss": -38.82807540893555, "global_step": 121080, "epoch": 1000} {"train_loss": -39.835750579833984, "global_step": 121081, "epoch": 1000} {"train_loss": -40.27326583862305, "global_step": 121082, "epoch": 1000} {"train_loss": -40.17729568481445, "global_step": 121083, "epoch": 1000} {"train_loss": -39.05758285522461, "global_step": 121084, "epoch": 1000} {"train_loss": -37.803462982177734, "global_step": 121085, "epoch": 1000} {"train_loss": -39.97681427001953, "global_step": 121086, "epoch": 1000} {"train_loss": -39.53718948364258, "global_step": 121087, "epoch": 1000} {"train_loss": -38.55964279174805, "global_step": 121088, "epoch": 1000} {"train_loss": -39.302703857421875, "global_step": 121089, "epoch": 1000} {"train_loss": -38.296165466308594, "global_step": 121090, "epoch": 1000} {"train_loss": -38.54671859741211, "global_step": 121091, "epoch": 1000} {"train_loss": -39.90521240234375, "global_step": 121092, "epoch": 1000} {"train_loss": -37.9716682434082, "global_step": 121093, "epoch": 1000} {"train_loss": -37.57271957397461, "global_step": 121094, "epoch": 1000} {"train_loss": -39.04500198364258, "global_step": 121095, "epoch": 1000} {"train_loss": -38.234920501708984, "global_step": 121096, "epoch": 1000} {"train_loss": -40.45075988769531, "global_step": 121097, "epoch": 1000} {"train_loss": -38.59648132324219, "global_step": 121098, "epoch": 1000} {"train_loss": -38.871864318847656, "global_step": 121099, "epoch": 1000} {"train_loss": -40.69295883178711, "global_step": 121100, "epoch": 1000} {"train_loss": -38.57697296142578, "global_step": 121101, "epoch": 1000} {"train_loss": -39.116573333740234, "global_step": 121102, "epoch": 1000} {"train_loss": -38.76399230957031, "global_step": 121103, "epoch": 1000} {"train_loss": -38.10465621948242, "global_step": 121104, "epoch": 1000} {"train_loss": -38.157073974609375, "global_step": 121105, "epoch": 1000} {"train_loss": -37.416595458984375, "global_step": 121106, "epoch": 1000} {"train_loss": -38.5765495300293, "global_step": 121107, "epoch": 1000} {"train_loss": -38.066261291503906, "global_step": 121108, "epoch": 1000} {"train_loss": -39.60691452026367, "global_step": 121109, "epoch": 1000} {"train_loss": -36.71171188354492, "global_step": 121110, "epoch": 1000} {"train_loss": -39.122650146484375, "global_step": 121111, "epoch": 1000} {"train_loss": -37.84916687011719, "global_step": 121112, "epoch": 1000} {"train_loss": -36.41964340209961, "global_step": 121113, "epoch": 1000} {"train_loss": -37.56447982788086, "global_step": 121114, "epoch": 1000} {"train_loss": -39.55955123901367, "global_step": 121115, "epoch": 1000} {"train_loss": -35.77961730957031, "global_step": 121116, "epoch": 1000} {"train_loss": -38.27346420288086, "global_step": 121117, "epoch": 1000} {"train_loss": -35.93551254272461, "global_step": 121118, "epoch": 1000} {"train_loss": -36.586544036865234, "global_step": 121119, "epoch": 1000} {"train_loss": -39.34837221508184, "global_step": 121120, "epoch": 1000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2703848.25} {"train_loss": -37.39634704589844, "global_step": 121121, "epoch": 1001} {"train_loss": -36.50765609741211, "global_step": 121122, "epoch": 1001} {"train_loss": -37.33956527709961, "global_step": 121123, "epoch": 1001} {"train_loss": -38.4078254699707, "global_step": 121124, "epoch": 1001} {"train_loss": -37.18556213378906, "global_step": 121125, "epoch": 1001} {"train_loss": -37.95072555541992, "global_step": 121126, "epoch": 1001} {"train_loss": -39.39574432373047, "global_step": 121127, "epoch": 1001} {"train_loss": -38.56875228881836, "global_step": 121128, "epoch": 1001} {"train_loss": -36.9456901550293, "global_step": 121129, "epoch": 1001} {"train_loss": -38.117889404296875, "global_step": 121130, "epoch": 1001} {"train_loss": -38.19788360595703, "global_step": 121131, "epoch": 1001} {"train_loss": -37.079647064208984, "global_step": 121132, "epoch": 1001} {"train_loss": -39.503658294677734, "global_step": 121133, "epoch": 1001} {"train_loss": -38.40639877319336, "global_step": 121134, "epoch": 1001} {"train_loss": -39.468589782714844, "global_step": 121135, "epoch": 1001} {"train_loss": -38.74076461791992, "global_step": 121136, "epoch": 1001} {"train_loss": -38.7971076965332, "global_step": 121137, "epoch": 1001} {"train_loss": -38.4286003112793, "global_step": 121138, "epoch": 1001} {"train_loss": -39.58787155151367, "global_step": 121139, "epoch": 1001} {"train_loss": -38.81203079223633, "global_step": 121140, "epoch": 1001} {"train_loss": -39.26768112182617, "global_step": 121141, "epoch": 1001} {"train_loss": -39.563846588134766, "global_step": 121142, "epoch": 1001} {"train_loss": -38.71709060668945, "global_step": 121143, "epoch": 1001} {"train_loss": -39.1220588684082, "global_step": 121144, "epoch": 1001} {"train_loss": -39.46809387207031, "global_step": 121145, "epoch": 1001} {"train_loss": -37.5924186706543, "global_step": 121146, "epoch": 1001} {"train_loss": -39.7604866027832, "global_step": 121147, "epoch": 1001} {"train_loss": -38.4594841003418, "global_step": 121148, "epoch": 1001} {"train_loss": -39.26910400390625, "global_step": 121149, "epoch": 1001} {"train_loss": -40.344844818115234, "global_step": 121150, "epoch": 1001} {"train_loss": -39.44083023071289, "global_step": 121151, "epoch": 1001} {"train_loss": -38.941532135009766, "global_step": 121152, "epoch": 1001} {"train_loss": -38.801761627197266, "global_step": 121153, "epoch": 1001} {"train_loss": -39.75905227661133, "global_step": 121154, "epoch": 1001} {"train_loss": -40.104183197021484, "global_step": 121155, "epoch": 1001} {"train_loss": -40.149444580078125, "global_step": 121156, "epoch": 1001} {"train_loss": -39.80457305908203, "global_step": 121157, "epoch": 1001} {"train_loss": -40.503692626953125, "global_step": 121158, "epoch": 1001} {"train_loss": -39.82442092895508, "global_step": 121159, "epoch": 1001} {"train_loss": -40.02081298828125, "global_step": 121160, "epoch": 1001} {"train_loss": -40.019168853759766, "global_step": 121161, "epoch": 1001} {"train_loss": -40.06523513793945, "global_step": 121162, "epoch": 1001} {"train_loss": -39.8233757019043, "global_step": 121163, "epoch": 1001} {"train_loss": -40.0932731628418, "global_step": 121164, "epoch": 1001} {"train_loss": -40.01646041870117, "global_step": 121165, "epoch": 1001} {"train_loss": -40.049129486083984, "global_step": 121166, "epoch": 1001} {"train_loss": -40.45406723022461, "global_step": 121167, "epoch": 1001} {"train_loss": -40.189300537109375, "global_step": 121168, "epoch": 1001} {"train_loss": -40.337032318115234, "global_step": 121169, "epoch": 1001} {"train_loss": -40.4557991027832, "global_step": 121170, "epoch": 1001} {"train_loss": -40.319610595703125, "global_step": 121171, "epoch": 1001} {"train_loss": -40.5255126953125, "global_step": 121172, "epoch": 1001} {"train_loss": -40.654212951660156, "global_step": 121173, "epoch": 1001} {"train_loss": -40.421966552734375, "global_step": 121174, "epoch": 1001} {"train_loss": -40.70563507080078, "global_step": 121175, "epoch": 1001} {"train_loss": -40.45136642456055, "global_step": 121176, "epoch": 1001} {"train_loss": -40.380367279052734, "global_step": 121177, "epoch": 1001} {"train_loss": -40.23271942138672, "global_step": 121178, "epoch": 1001} {"train_loss": -40.73954391479492, "global_step": 121179, "epoch": 1001} {"train_loss": -40.65610122680664, "global_step": 121180, "epoch": 1001} {"train_loss": -40.42063522338867, "global_step": 121181, "epoch": 1001} {"train_loss": -40.60700225830078, "global_step": 121182, "epoch": 1001} {"train_loss": -40.34969711303711, "global_step": 121183, "epoch": 1001} {"train_loss": -39.66184616088867, "global_step": 121184, "epoch": 1001} {"train_loss": -37.92987060546875, "global_step": 121185, "epoch": 1001} {"train_loss": -39.359962463378906, "global_step": 121186, "epoch": 1001} {"train_loss": -40.41771697998047, "global_step": 121187, "epoch": 1001} {"train_loss": -39.685062408447266, "global_step": 121188, "epoch": 1001} {"train_loss": -38.69511795043945, "global_step": 121189, "epoch": 1001} {"train_loss": -37.974178314208984, "global_step": 121190, "epoch": 1001} {"train_loss": -39.164947509765625, "global_step": 121191, "epoch": 1001} {"train_loss": -39.62203598022461, "global_step": 121192, "epoch": 1001} {"train_loss": -38.96682357788086, "global_step": 121193, "epoch": 1001} {"train_loss": -39.051448822021484, "global_step": 121194, "epoch": 1001} {"train_loss": -38.804805755615234, "global_step": 121195, "epoch": 1001} {"train_loss": -39.164833068847656, "global_step": 121196, "epoch": 1001} {"train_loss": -39.3756217956543, "global_step": 121197, "epoch": 1001} {"train_loss": -39.79934310913086, "global_step": 121198, "epoch": 1001} {"train_loss": -39.00940704345703, "global_step": 121199, "epoch": 1001} {"train_loss": -39.41294479370117, "global_step": 121200, "epoch": 1001} {"train_loss": -39.31915283203125, "global_step": 121201, "epoch": 1001} {"train_loss": -37.71051788330078, "global_step": 121202, "epoch": 1001} {"train_loss": -38.09809875488281, "global_step": 121203, "epoch": 1001} {"train_loss": -38.1273078918457, "global_step": 121204, "epoch": 1001} {"train_loss": -39.398643493652344, "global_step": 121205, "epoch": 1001} {"train_loss": -38.12557601928711, "global_step": 121206, "epoch": 1001} {"train_loss": -38.48963165283203, "global_step": 121207, "epoch": 1001} {"train_loss": -40.03471374511719, "global_step": 121208, "epoch": 1001} {"train_loss": -39.0853157043457, "global_step": 121209, "epoch": 1001} {"train_loss": -39.083534240722656, "global_step": 121210, "epoch": 1001} {"train_loss": -39.20960235595703, "global_step": 121211, "epoch": 1001} {"train_loss": -40.245628356933594, "global_step": 121212, "epoch": 1001} {"train_loss": -40.335609436035156, "global_step": 121213, "epoch": 1001} {"train_loss": -40.31393051147461, "global_step": 121214, "epoch": 1001} {"train_loss": -40.55717086791992, "global_step": 121215, "epoch": 1001} {"train_loss": -40.2883415222168, "global_step": 121216, "epoch": 1001} {"train_loss": -39.54292678833008, "global_step": 121217, "epoch": 1001} {"train_loss": -38.45908737182617, "global_step": 121218, "epoch": 1001} {"train_loss": -39.5235595703125, "global_step": 121219, "epoch": 1001} {"train_loss": -39.795562744140625, "global_step": 121220, "epoch": 1001} {"train_loss": -38.93794631958008, "global_step": 121221, "epoch": 1001} {"train_loss": -39.86637496948242, "global_step": 121222, "epoch": 1001} {"train_loss": -40.16889572143555, "global_step": 121223, "epoch": 1001} {"train_loss": -39.07958984375, "global_step": 121224, "epoch": 1001} {"train_loss": -39.815162658691406, "global_step": 121225, "epoch": 1001} {"train_loss": -40.29645538330078, "global_step": 121226, "epoch": 1001} {"train_loss": -39.142181396484375, "global_step": 121227, "epoch": 1001} {"train_loss": -38.694854736328125, "global_step": 121228, "epoch": 1001} {"train_loss": -39.74155044555664, "global_step": 121229, "epoch": 1001} {"train_loss": -39.30097579956055, "global_step": 121230, "epoch": 1001} {"train_loss": -39.077545166015625, "global_step": 121231, "epoch": 1001} {"train_loss": -39.83108139038086, "global_step": 121232, "epoch": 1001} {"train_loss": -38.835693359375, "global_step": 121233, "epoch": 1001} {"train_loss": -39.977291107177734, "global_step": 121234, "epoch": 1001} {"train_loss": -38.18442916870117, "global_step": 121235, "epoch": 1001} {"train_loss": -39.0483512878418, "global_step": 121236, "epoch": 1001} {"train_loss": -40.02264404296875, "global_step": 121237, "epoch": 1001} {"train_loss": -39.14516067504883, "global_step": 121238, "epoch": 1001} {"train_loss": -39.87274932861328, "global_step": 121239, "epoch": 1001} {"train_loss": -39.929954528808594, "global_step": 121240, "epoch": 1001} {"train_loss": -39.35451409836446, "global_step": 121241, "epoch": 1001, "val_loss": 2711098.25} {"train_loss": -40.487545013427734, "global_step": 121242, "epoch": 1002} {"train_loss": -39.98309326171875, "global_step": 121243, "epoch": 1002} {"train_loss": -39.77809143066406, "global_step": 121244, "epoch": 1002} {"train_loss": -39.992733001708984, "global_step": 121245, "epoch": 1002} {"train_loss": -38.85763931274414, "global_step": 121246, "epoch": 1002} {"train_loss": -38.0640869140625, "global_step": 121247, "epoch": 1002} {"train_loss": -39.87757873535156, "global_step": 121248, "epoch": 1002} {"train_loss": -39.274051666259766, "global_step": 121249, "epoch": 1002} {"train_loss": -39.76129150390625, "global_step": 121250, "epoch": 1002} {"train_loss": -38.41851043701172, "global_step": 121251, "epoch": 1002} {"train_loss": -39.20567321777344, "global_step": 121252, "epoch": 1002} {"train_loss": -40.8562126159668, "global_step": 121253, "epoch": 1002} {"train_loss": -40.20026397705078, "global_step": 121254, "epoch": 1002} {"train_loss": -40.454872131347656, "global_step": 121255, "epoch": 1002} {"train_loss": -39.484840393066406, "global_step": 121256, "epoch": 1002} {"train_loss": -39.31873321533203, "global_step": 121257, "epoch": 1002} {"train_loss": -40.6256103515625, "global_step": 121258, "epoch": 1002} {"train_loss": -38.78437423706055, "global_step": 121259, "epoch": 1002} {"train_loss": -39.27653121948242, "global_step": 121260, "epoch": 1002} {"train_loss": -39.31984329223633, "global_step": 121261, "epoch": 1002} {"train_loss": -40.26974105834961, "global_step": 121262, "epoch": 1002} {"train_loss": -40.26505661010742, "global_step": 121263, "epoch": 1002} {"train_loss": -39.3538703918457, "global_step": 121264, "epoch": 1002} {"train_loss": -39.94795608520508, "global_step": 121265, "epoch": 1002} {"train_loss": -40.0313720703125, "global_step": 121266, "epoch": 1002} {"train_loss": -39.9135856628418, "global_step": 121267, "epoch": 1002} {"train_loss": -40.7244987487793, "global_step": 121268, "epoch": 1002} {"train_loss": -39.851131439208984, "global_step": 121269, "epoch": 1002} {"train_loss": -40.277828216552734, "global_step": 121270, "epoch": 1002} {"train_loss": -40.02669143676758, "global_step": 121271, "epoch": 1002} {"train_loss": -40.41236877441406, "global_step": 121272, "epoch": 1002} {"train_loss": -40.43156051635742, "global_step": 121273, "epoch": 1002} {"train_loss": -40.2478141784668, "global_step": 121274, "epoch": 1002} {"train_loss": -40.846923828125, "global_step": 121275, "epoch": 1002} {"train_loss": -40.383724212646484, "global_step": 121276, "epoch": 1002} {"train_loss": -40.2684440612793, "global_step": 121277, "epoch": 1002} {"train_loss": -40.98344802856445, "global_step": 121278, "epoch": 1002} {"train_loss": -40.88861083984375, "global_step": 121279, "epoch": 1002} {"train_loss": -40.61220932006836, "global_step": 121280, "epoch": 1002} {"train_loss": -40.55259323120117, "global_step": 121281, "epoch": 1002} {"train_loss": -40.16599655151367, "global_step": 121282, "epoch": 1002} {"train_loss": -39.61626052856445, "global_step": 121283, "epoch": 1002} {"train_loss": -40.90085983276367, "global_step": 121284, "epoch": 1002} {"train_loss": -39.24506378173828, "global_step": 121285, "epoch": 1002} {"train_loss": -38.033939361572266, "global_step": 121286, "epoch": 1002} {"train_loss": -39.60322189331055, "global_step": 121287, "epoch": 1002} {"train_loss": -40.04924774169922, "global_step": 121288, "epoch": 1002} {"train_loss": -40.37712860107422, "global_step": 121289, "epoch": 1002} {"train_loss": -39.236019134521484, "global_step": 121290, "epoch": 1002} {"train_loss": -38.80738830566406, "global_step": 121291, "epoch": 1002} {"train_loss": -40.37199020385742, "global_step": 121292, "epoch": 1002} {"train_loss": -40.1959228515625, "global_step": 121293, "epoch": 1002} {"train_loss": -39.125518798828125, "global_step": 121294, "epoch": 1002} {"train_loss": -37.766902923583984, "global_step": 121295, "epoch": 1002} {"train_loss": -38.87290573120117, "global_step": 121296, "epoch": 1002} {"train_loss": -39.10024642944336, "global_step": 121297, "epoch": 1002} {"train_loss": -38.135597229003906, "global_step": 121298, "epoch": 1002} {"train_loss": -36.79004669189453, "global_step": 121299, "epoch": 1002} {"train_loss": -39.515869140625, "global_step": 121300, "epoch": 1002} {"train_loss": -39.9878044128418, "global_step": 121301, "epoch": 1002} {"train_loss": -38.53314971923828, "global_step": 121302, "epoch": 1002} {"train_loss": -38.59822463989258, "global_step": 121303, "epoch": 1002} {"train_loss": -38.92118453979492, "global_step": 121304, "epoch": 1002} {"train_loss": -37.83089828491211, "global_step": 121305, "epoch": 1002} {"train_loss": -39.23745346069336, "global_step": 121306, "epoch": 1002} {"train_loss": -40.38426208496094, "global_step": 121307, "epoch": 1002} {"train_loss": -40.357154846191406, "global_step": 121308, "epoch": 1002} {"train_loss": -39.52118682861328, "global_step": 121309, "epoch": 1002} {"train_loss": -39.5389404296875, "global_step": 121310, "epoch": 1002} {"train_loss": -40.338966369628906, "global_step": 121311, "epoch": 1002} {"train_loss": -39.65092468261719, "global_step": 121312, "epoch": 1002} {"train_loss": -38.38370895385742, "global_step": 121313, "epoch": 1002} {"train_loss": -40.199867248535156, "global_step": 121314, "epoch": 1002} {"train_loss": -39.3608283996582, "global_step": 121315, "epoch": 1002} {"train_loss": -38.758270263671875, "global_step": 121316, "epoch": 1002} {"train_loss": -37.857666015625, "global_step": 121317, "epoch": 1002} {"train_loss": -39.47309875488281, "global_step": 121318, "epoch": 1002} {"train_loss": -39.472930908203125, "global_step": 121319, "epoch": 1002} {"train_loss": -38.99778366088867, "global_step": 121320, "epoch": 1002} {"train_loss": -39.759117126464844, "global_step": 121321, "epoch": 1002} {"train_loss": -39.57475280761719, "global_step": 121322, "epoch": 1002} {"train_loss": -39.62221145629883, "global_step": 121323, "epoch": 1002} {"train_loss": -39.53694152832031, "global_step": 121324, "epoch": 1002} {"train_loss": -38.62910461425781, "global_step": 121325, "epoch": 1002} {"train_loss": -37.33883285522461, "global_step": 121326, "epoch": 1002} {"train_loss": -39.28298568725586, "global_step": 121327, "epoch": 1002} {"train_loss": -39.62636184692383, "global_step": 121328, "epoch": 1002} {"train_loss": -39.11879348754883, "global_step": 121329, "epoch": 1002} {"train_loss": -39.20643997192383, "global_step": 121330, "epoch": 1002} {"train_loss": -38.87653732299805, "global_step": 121331, "epoch": 1002} {"train_loss": -39.6146354675293, "global_step": 121332, "epoch": 1002} {"train_loss": -40.08613586425781, "global_step": 121333, "epoch": 1002} {"train_loss": -38.842647552490234, "global_step": 121334, "epoch": 1002} {"train_loss": -38.34558868408203, "global_step": 121335, "epoch": 1002} {"train_loss": -39.198272705078125, "global_step": 121336, "epoch": 1002} {"train_loss": -37.91139221191406, "global_step": 121337, "epoch": 1002} {"train_loss": -38.33913040161133, "global_step": 121338, "epoch": 1002} {"train_loss": -38.13605499267578, "global_step": 121339, "epoch": 1002} {"train_loss": -38.38511276245117, "global_step": 121340, "epoch": 1002} {"train_loss": -38.7225456237793, "global_step": 121341, "epoch": 1002} {"train_loss": -38.29095458984375, "global_step": 121342, "epoch": 1002} {"train_loss": -38.56258773803711, "global_step": 121343, "epoch": 1002} {"train_loss": -38.2913932800293, "global_step": 121344, "epoch": 1002} {"train_loss": -37.67637634277344, "global_step": 121345, "epoch": 1002} {"train_loss": -39.68410873413086, "global_step": 121346, "epoch": 1002} {"train_loss": -38.64066696166992, "global_step": 121347, "epoch": 1002} {"train_loss": -39.55710220336914, "global_step": 121348, "epoch": 1002} {"train_loss": -38.748130798339844, "global_step": 121349, "epoch": 1002} {"train_loss": -39.47592544555664, "global_step": 121350, "epoch": 1002} {"train_loss": -38.95340347290039, "global_step": 121351, "epoch": 1002} {"train_loss": -39.86430358886719, "global_step": 121352, "epoch": 1002} {"train_loss": -39.92593002319336, "global_step": 121353, "epoch": 1002} {"train_loss": -39.304893493652344, "global_step": 121354, "epoch": 1002} {"train_loss": -40.38396072387695, "global_step": 121355, "epoch": 1002} {"train_loss": -40.13442611694336, "global_step": 121356, "epoch": 1002} {"train_loss": -38.58134841918945, "global_step": 121357, "epoch": 1002} {"train_loss": -39.983272552490234, "global_step": 121358, "epoch": 1002} {"train_loss": -39.90401840209961, "global_step": 121359, "epoch": 1002} {"train_loss": -39.78995895385742, "global_step": 121360, "epoch": 1002} {"train_loss": -40.199947357177734, "global_step": 121361, "epoch": 1002} {"train_loss": -39.45530208871384, "global_step": 121362, "epoch": 1002, "val_loss": 2735390.0} {"train_loss": -40.583927154541016, "global_step": 121363, "epoch": 1003} {"train_loss": -40.31915283203125, "global_step": 121364, "epoch": 1003} {"train_loss": -39.9633903503418, "global_step": 121365, "epoch": 1003} {"train_loss": -40.00343704223633, "global_step": 121366, "epoch": 1003} {"train_loss": -40.425472259521484, "global_step": 121367, "epoch": 1003} {"train_loss": -40.710018157958984, "global_step": 121368, "epoch": 1003} {"train_loss": -40.227447509765625, "global_step": 121369, "epoch": 1003} {"train_loss": -40.403987884521484, "global_step": 121370, "epoch": 1003} {"train_loss": -40.6152229309082, "global_step": 121371, "epoch": 1003} {"train_loss": -40.20797348022461, "global_step": 121372, "epoch": 1003} {"train_loss": -39.881446838378906, "global_step": 121373, "epoch": 1003} {"train_loss": -40.01023483276367, "global_step": 121374, "epoch": 1003} {"train_loss": -40.76901626586914, "global_step": 121375, "epoch": 1003} {"train_loss": -39.64803695678711, "global_step": 121376, "epoch": 1003} {"train_loss": -38.84539794921875, "global_step": 121377, "epoch": 1003} {"train_loss": -39.41143035888672, "global_step": 121378, "epoch": 1003} {"train_loss": -40.6368408203125, "global_step": 121379, "epoch": 1003} {"train_loss": -40.67147445678711, "global_step": 121380, "epoch": 1003} {"train_loss": -40.44758224487305, "global_step": 121381, "epoch": 1003} {"train_loss": -40.38154602050781, "global_step": 121382, "epoch": 1003} {"train_loss": -40.93788146972656, "global_step": 121383, "epoch": 1003} {"train_loss": -40.55084991455078, "global_step": 121384, "epoch": 1003} {"train_loss": -39.71596145629883, "global_step": 121385, "epoch": 1003} {"train_loss": -40.19174575805664, "global_step": 121386, "epoch": 1003} {"train_loss": -40.563209533691406, "global_step": 121387, "epoch": 1003} {"train_loss": -38.908729553222656, "global_step": 121388, "epoch": 1003} {"train_loss": -40.77730941772461, "global_step": 121389, "epoch": 1003} {"train_loss": -39.97153091430664, "global_step": 121390, "epoch": 1003} {"train_loss": -37.94475173950195, "global_step": 121391, "epoch": 1003} {"train_loss": -39.974361419677734, "global_step": 121392, "epoch": 1003} {"train_loss": -35.96305465698242, "global_step": 121393, "epoch": 1003} {"train_loss": -36.54914474487305, "global_step": 121394, "epoch": 1003} {"train_loss": -33.1605339050293, "global_step": 121395, "epoch": 1003} {"train_loss": -37.77961349487305, "global_step": 121396, "epoch": 1003} {"train_loss": -38.27744674682617, "global_step": 121397, "epoch": 1003} {"train_loss": -37.50234603881836, "global_step": 121398, "epoch": 1003} {"train_loss": -39.32782745361328, "global_step": 121399, "epoch": 1003} {"train_loss": -37.68809127807617, "global_step": 121400, "epoch": 1003} {"train_loss": -37.201271057128906, "global_step": 121401, "epoch": 1003} {"train_loss": -38.340309143066406, "global_step": 121402, "epoch": 1003} {"train_loss": -38.6951789855957, "global_step": 121403, "epoch": 1003} {"train_loss": -40.16421127319336, "global_step": 121404, "epoch": 1003} {"train_loss": -38.30489730834961, "global_step": 121405, "epoch": 1003} {"train_loss": -37.30978775024414, "global_step": 121406, "epoch": 1003} {"train_loss": -37.76226043701172, "global_step": 121407, "epoch": 1003} {"train_loss": -39.5511474609375, "global_step": 121408, "epoch": 1003} {"train_loss": -40.16492462158203, "global_step": 121409, "epoch": 1003} {"train_loss": -39.790313720703125, "global_step": 121410, "epoch": 1003} {"train_loss": -40.20947265625, "global_step": 121411, "epoch": 1003} {"train_loss": -40.39059829711914, "global_step": 121412, "epoch": 1003} {"train_loss": -39.61652755737305, "global_step": 121413, "epoch": 1003} {"train_loss": -39.76338577270508, "global_step": 121414, "epoch": 1003} {"train_loss": -40.198509216308594, "global_step": 121415, "epoch": 1003} {"train_loss": -39.99141311645508, "global_step": 121416, "epoch": 1003} {"train_loss": -39.08759689331055, "global_step": 121417, "epoch": 1003} {"train_loss": -39.59464645385742, "global_step": 121418, "epoch": 1003} {"train_loss": -39.1572380065918, "global_step": 121419, "epoch": 1003} {"train_loss": -40.01982498168945, "global_step": 121420, "epoch": 1003} {"train_loss": -39.18489074707031, "global_step": 121421, "epoch": 1003} {"train_loss": -38.368141174316406, "global_step": 121422, "epoch": 1003} {"train_loss": -39.83545684814453, "global_step": 121423, "epoch": 1003} {"train_loss": -39.79740524291992, "global_step": 121424, "epoch": 1003} {"train_loss": -39.933589935302734, "global_step": 121425, "epoch": 1003} {"train_loss": -39.92476272583008, "global_step": 121426, "epoch": 1003} {"train_loss": -39.98772048950195, "global_step": 121427, "epoch": 1003} {"train_loss": -39.84298324584961, "global_step": 121428, "epoch": 1003} {"train_loss": -39.18553161621094, "global_step": 121429, "epoch": 1003} {"train_loss": -39.54240798950195, "global_step": 121430, "epoch": 1003} {"train_loss": -40.5227165222168, "global_step": 121431, "epoch": 1003} {"train_loss": -40.131141662597656, "global_step": 121432, "epoch": 1003} {"train_loss": -39.60905075073242, "global_step": 121433, "epoch": 1003} {"train_loss": -40.13616180419922, "global_step": 121434, "epoch": 1003} {"train_loss": -40.02403259277344, "global_step": 121435, "epoch": 1003} {"train_loss": -39.56291580200195, "global_step": 121436, "epoch": 1003} {"train_loss": -39.544044494628906, "global_step": 121437, "epoch": 1003} {"train_loss": -39.9525260925293, "global_step": 121438, "epoch": 1003} {"train_loss": -40.39089584350586, "global_step": 121439, "epoch": 1003} {"train_loss": -39.80465316772461, "global_step": 121440, "epoch": 1003} {"train_loss": -39.36516571044922, "global_step": 121441, "epoch": 1003} {"train_loss": -40.42368698120117, "global_step": 121442, "epoch": 1003} {"train_loss": -40.45912551879883, "global_step": 121443, "epoch": 1003} {"train_loss": -39.290008544921875, "global_step": 121444, "epoch": 1003} {"train_loss": -40.51906967163086, "global_step": 121445, "epoch": 1003} {"train_loss": -39.70718002319336, "global_step": 121446, "epoch": 1003} {"train_loss": -39.0491828918457, "global_step": 121447, "epoch": 1003} {"train_loss": -40.0321159362793, "global_step": 121448, "epoch": 1003} {"train_loss": -38.44552230834961, "global_step": 121449, "epoch": 1003} {"train_loss": -37.5702018737793, "global_step": 121450, "epoch": 1003} {"train_loss": -37.684898376464844, "global_step": 121451, "epoch": 1003} {"train_loss": -39.11846160888672, "global_step": 121452, "epoch": 1003} {"train_loss": -39.242244720458984, "global_step": 121453, "epoch": 1003} {"train_loss": -39.86790084838867, "global_step": 121454, "epoch": 1003} {"train_loss": -38.59147644042969, "global_step": 121455, "epoch": 1003} {"train_loss": -38.104854583740234, "global_step": 121456, "epoch": 1003} {"train_loss": -38.72385025024414, "global_step": 121457, "epoch": 1003} {"train_loss": -39.61152267456055, "global_step": 121458, "epoch": 1003} {"train_loss": -40.42325973510742, "global_step": 121459, "epoch": 1003} {"train_loss": -39.7501335144043, "global_step": 121460, "epoch": 1003} {"train_loss": -38.675533294677734, "global_step": 121461, "epoch": 1003} {"train_loss": -37.293487548828125, "global_step": 121462, "epoch": 1003} {"train_loss": -38.36075973510742, "global_step": 121463, "epoch": 1003} {"train_loss": -40.0586051940918, "global_step": 121464, "epoch": 1003} {"train_loss": -39.52409744262695, "global_step": 121465, "epoch": 1003} {"train_loss": -37.52824020385742, "global_step": 121466, "epoch": 1003} {"train_loss": -39.06313705444336, "global_step": 121467, "epoch": 1003} {"train_loss": -39.568782806396484, "global_step": 121468, "epoch": 1003} {"train_loss": -37.598384857177734, "global_step": 121469, "epoch": 1003} {"train_loss": -39.85377883911133, "global_step": 121470, "epoch": 1003} {"train_loss": -38.940673828125, "global_step": 121471, "epoch": 1003} {"train_loss": -39.04239273071289, "global_step": 121472, "epoch": 1003} {"train_loss": -40.04257583618164, "global_step": 121473, "epoch": 1003} {"train_loss": -38.61804962158203, "global_step": 121474, "epoch": 1003} {"train_loss": -38.909332275390625, "global_step": 121475, "epoch": 1003} {"train_loss": -40.079833984375, "global_step": 121476, "epoch": 1003} {"train_loss": -38.527889251708984, "global_step": 121477, "epoch": 1003} {"train_loss": -39.62885665893555, "global_step": 121478, "epoch": 1003} {"train_loss": -39.36952590942383, "global_step": 121479, "epoch": 1003} {"train_loss": -38.486942291259766, "global_step": 121480, "epoch": 1003} {"train_loss": -40.3718376159668, "global_step": 121481, "epoch": 1003} {"train_loss": -39.16990661621094, "global_step": 121482, "epoch": 1003} {"train_loss": -39.379165933151874, "global_step": 121483, "epoch": 1003, "val_loss": 2759854.75} {"train_loss": -38.6055793762207, "global_step": 121484, "epoch": 1004} {"train_loss": -39.17578125, "global_step": 121485, "epoch": 1004} {"train_loss": -40.510833740234375, "global_step": 121486, "epoch": 1004} {"train_loss": -39.62773513793945, "global_step": 121487, "epoch": 1004} {"train_loss": -39.664852142333984, "global_step": 121488, "epoch": 1004} {"train_loss": -39.6242790222168, "global_step": 121489, "epoch": 1004} {"train_loss": -39.87825012207031, "global_step": 121490, "epoch": 1004} {"train_loss": -39.83842086791992, "global_step": 121491, "epoch": 1004} {"train_loss": -40.37483596801758, "global_step": 121492, "epoch": 1004} {"train_loss": -40.11623001098633, "global_step": 121493, "epoch": 1004} {"train_loss": -40.322486877441406, "global_step": 121494, "epoch": 1004} {"train_loss": -40.34524154663086, "global_step": 121495, "epoch": 1004} {"train_loss": -39.972408294677734, "global_step": 121496, "epoch": 1004} {"train_loss": -40.23250198364258, "global_step": 121497, "epoch": 1004} {"train_loss": -40.39156723022461, "global_step": 121498, "epoch": 1004} {"train_loss": -40.82715606689453, "global_step": 121499, "epoch": 1004} {"train_loss": -40.54140090942383, "global_step": 121500, "epoch": 1004} {"train_loss": -40.5096549987793, "global_step": 121501, "epoch": 1004} {"train_loss": -40.85683822631836, "global_step": 121502, "epoch": 1004} {"train_loss": -40.670040130615234, "global_step": 121503, "epoch": 1004} {"train_loss": -40.41254425048828, "global_step": 121504, "epoch": 1004} {"train_loss": -40.94453430175781, "global_step": 121505, "epoch": 1004} {"train_loss": -40.820064544677734, "global_step": 121506, "epoch": 1004} {"train_loss": -40.6936149597168, "global_step": 121507, "epoch": 1004} {"train_loss": -41.022945404052734, "global_step": 121508, "epoch": 1004} {"train_loss": -40.802345275878906, "global_step": 121509, "epoch": 1004} {"train_loss": -40.875526428222656, "global_step": 121510, "epoch": 1004} {"train_loss": -40.5281867980957, "global_step": 121511, "epoch": 1004} {"train_loss": -40.80832290649414, "global_step": 121512, "epoch": 1004} {"train_loss": -40.66744613647461, "global_step": 121513, "epoch": 1004} {"train_loss": -41.007015228271484, "global_step": 121514, "epoch": 1004} {"train_loss": -40.13667678833008, "global_step": 121515, "epoch": 1004} {"train_loss": -39.741939544677734, "global_step": 121516, "epoch": 1004} {"train_loss": -39.39414978027344, "global_step": 121517, "epoch": 1004} {"train_loss": -39.148677825927734, "global_step": 121518, "epoch": 1004} {"train_loss": -40.31766891479492, "global_step": 121519, "epoch": 1004} {"train_loss": -39.65477752685547, "global_step": 121520, "epoch": 1004} {"train_loss": -40.18941879272461, "global_step": 121521, "epoch": 1004} {"train_loss": -39.57796859741211, "global_step": 121522, "epoch": 1004} {"train_loss": -38.42329788208008, "global_step": 121523, "epoch": 1004} {"train_loss": -38.47603988647461, "global_step": 121524, "epoch": 1004} {"train_loss": -36.99482345581055, "global_step": 121525, "epoch": 1004} {"train_loss": -40.18851852416992, "global_step": 121526, "epoch": 1004} {"train_loss": -38.67299270629883, "global_step": 121527, "epoch": 1004} {"train_loss": -37.81096267700195, "global_step": 121528, "epoch": 1004} {"train_loss": -40.14400100708008, "global_step": 121529, "epoch": 1004} {"train_loss": -37.336795806884766, "global_step": 121530, "epoch": 1004} {"train_loss": -36.47930145263672, "global_step": 121531, "epoch": 1004} {"train_loss": -40.22166061401367, "global_step": 121532, "epoch": 1004} {"train_loss": -39.16599655151367, "global_step": 121533, "epoch": 1004} {"train_loss": -37.31955337524414, "global_step": 121534, "epoch": 1004} {"train_loss": -40.14545822143555, "global_step": 121535, "epoch": 1004} {"train_loss": -39.24177169799805, "global_step": 121536, "epoch": 1004} {"train_loss": -39.736663818359375, "global_step": 121537, "epoch": 1004} {"train_loss": -39.21454620361328, "global_step": 121538, "epoch": 1004} {"train_loss": -40.1429328918457, "global_step": 121539, "epoch": 1004} {"train_loss": -39.04737091064453, "global_step": 121540, "epoch": 1004} {"train_loss": -40.16040802001953, "global_step": 121541, "epoch": 1004} {"train_loss": -39.34197998046875, "global_step": 121542, "epoch": 1004} {"train_loss": -38.68247985839844, "global_step": 121543, "epoch": 1004} {"train_loss": -38.80743408203125, "global_step": 121544, "epoch": 1004} {"train_loss": -40.08078384399414, "global_step": 121545, "epoch": 1004} {"train_loss": -39.172218322753906, "global_step": 121546, "epoch": 1004} {"train_loss": -39.602596282958984, "global_step": 121547, "epoch": 1004} {"train_loss": -39.368961334228516, "global_step": 121548, "epoch": 1004} {"train_loss": -38.48053741455078, "global_step": 121549, "epoch": 1004} {"train_loss": -38.91676712036133, "global_step": 121550, "epoch": 1004} {"train_loss": -40.49637985229492, "global_step": 121551, "epoch": 1004} {"train_loss": -38.69496536254883, "global_step": 121552, "epoch": 1004} {"train_loss": -38.75699996948242, "global_step": 121553, "epoch": 1004} {"train_loss": -40.083587646484375, "global_step": 121554, "epoch": 1004} {"train_loss": -39.82402420043945, "global_step": 121555, "epoch": 1004} {"train_loss": -39.82223129272461, "global_step": 121556, "epoch": 1004} {"train_loss": -38.60928726196289, "global_step": 121557, "epoch": 1004} {"train_loss": -40.127655029296875, "global_step": 121558, "epoch": 1004} {"train_loss": -40.24232482910156, "global_step": 121559, "epoch": 1004} {"train_loss": -39.18394088745117, "global_step": 121560, "epoch": 1004} {"train_loss": -39.86684036254883, "global_step": 121561, "epoch": 1004} {"train_loss": -39.592472076416016, "global_step": 121562, "epoch": 1004} {"train_loss": -38.30978012084961, "global_step": 121563, "epoch": 1004} {"train_loss": -38.29237747192383, "global_step": 121564, "epoch": 1004} {"train_loss": -38.396705627441406, "global_step": 121565, "epoch": 1004} {"train_loss": -38.95707321166992, "global_step": 121566, "epoch": 1004} {"train_loss": -38.3223762512207, "global_step": 121567, "epoch": 1004} {"train_loss": -35.23865509033203, "global_step": 121568, "epoch": 1004} {"train_loss": -38.625762939453125, "global_step": 121569, "epoch": 1004} {"train_loss": -36.09062576293945, "global_step": 121570, "epoch": 1004} {"train_loss": -38.271888732910156, "global_step": 121571, "epoch": 1004} {"train_loss": -33.890377044677734, "global_step": 121572, "epoch": 1004} {"train_loss": -38.80046463012695, "global_step": 121573, "epoch": 1004} {"train_loss": -38.9161262512207, "global_step": 121574, "epoch": 1004} {"train_loss": -35.62913131713867, "global_step": 121575, "epoch": 1004} {"train_loss": -38.982051849365234, "global_step": 121576, "epoch": 1004} {"train_loss": -37.95762252807617, "global_step": 121577, "epoch": 1004} {"train_loss": -38.2856559753418, "global_step": 121578, "epoch": 1004} {"train_loss": -38.422401428222656, "global_step": 121579, "epoch": 1004} {"train_loss": -37.10947036743164, "global_step": 121580, "epoch": 1004} {"train_loss": -39.168453216552734, "global_step": 121581, "epoch": 1004} {"train_loss": -37.000999450683594, "global_step": 121582, "epoch": 1004} {"train_loss": -38.866371154785156, "global_step": 121583, "epoch": 1004} {"train_loss": -37.467254638671875, "global_step": 121584, "epoch": 1004} {"train_loss": -37.59450149536133, "global_step": 121585, "epoch": 1004} {"train_loss": -37.1739501953125, "global_step": 121586, "epoch": 1004} {"train_loss": -35.03736877441406, "global_step": 121587, "epoch": 1004} {"train_loss": -37.017520904541016, "global_step": 121588, "epoch": 1004} {"train_loss": -37.24833297729492, "global_step": 121589, "epoch": 1004} {"train_loss": -36.6762809753418, "global_step": 121590, "epoch": 1004} {"train_loss": -37.11762237548828, "global_step": 121591, "epoch": 1004} {"train_loss": -38.46049118041992, "global_step": 121592, "epoch": 1004} {"train_loss": -38.064109802246094, "global_step": 121593, "epoch": 1004} {"train_loss": -39.20548629760742, "global_step": 121594, "epoch": 1004} {"train_loss": -36.66032791137695, "global_step": 121595, "epoch": 1004} {"train_loss": -37.70656204223633, "global_step": 121596, "epoch": 1004} {"train_loss": -36.92281723022461, "global_step": 121597, "epoch": 1004} {"train_loss": -39.264503479003906, "global_step": 121598, "epoch": 1004} {"train_loss": -37.650177001953125, "global_step": 121599, "epoch": 1004} {"train_loss": -39.52618408203125, "global_step": 121600, "epoch": 1004} {"train_loss": -38.62006378173828, "global_step": 121601, "epoch": 1004} {"train_loss": -37.9940299987793, "global_step": 121602, "epoch": 1004} {"train_loss": -37.609928131103516, "global_step": 121603, "epoch": 1004} {"train_loss": -39.01739955933626, "global_step": 121604, "epoch": 1004, "val_loss": 2789885.0} {"train_loss": -38.3192024230957, "global_step": 121605, "epoch": 1005} {"train_loss": -38.4254035949707, "global_step": 121606, "epoch": 1005} {"train_loss": -38.60928726196289, "global_step": 121607, "epoch": 1005} {"train_loss": -38.84705352783203, "global_step": 121608, "epoch": 1005} {"train_loss": -38.76597213745117, "global_step": 121609, "epoch": 1005} {"train_loss": -37.41634750366211, "global_step": 121610, "epoch": 1005} {"train_loss": -37.724308013916016, "global_step": 121611, "epoch": 1005} {"train_loss": -39.017601013183594, "global_step": 121612, "epoch": 1005} {"train_loss": -38.90237045288086, "global_step": 121613, "epoch": 1005} {"train_loss": -39.352294921875, "global_step": 121614, "epoch": 1005} {"train_loss": -37.805633544921875, "global_step": 121615, "epoch": 1005} {"train_loss": -39.65919876098633, "global_step": 121616, "epoch": 1005} {"train_loss": -39.163970947265625, "global_step": 121617, "epoch": 1005} {"train_loss": -39.535675048828125, "global_step": 121618, "epoch": 1005} {"train_loss": -39.92991256713867, "global_step": 121619, "epoch": 1005} {"train_loss": -39.3873176574707, "global_step": 121620, "epoch": 1005} {"train_loss": -39.77931213378906, "global_step": 121621, "epoch": 1005} {"train_loss": -39.38975143432617, "global_step": 121622, "epoch": 1005} {"train_loss": -38.890865325927734, "global_step": 121623, "epoch": 1005} {"train_loss": -39.48615646362305, "global_step": 121624, "epoch": 1005} {"train_loss": -36.95759963989258, "global_step": 121625, "epoch": 1005} {"train_loss": -39.63093948364258, "global_step": 121626, "epoch": 1005} {"train_loss": -39.53644943237305, "global_step": 121627, "epoch": 1005} {"train_loss": -38.91035079956055, "global_step": 121628, "epoch": 1005} {"train_loss": -39.65058898925781, "global_step": 121629, "epoch": 1005} {"train_loss": -38.80598831176758, "global_step": 121630, "epoch": 1005} {"train_loss": -38.17734909057617, "global_step": 121631, "epoch": 1005} {"train_loss": -39.624691009521484, "global_step": 121632, "epoch": 1005} {"train_loss": -39.67867660522461, "global_step": 121633, "epoch": 1005} {"train_loss": -39.82925033569336, "global_step": 121634, "epoch": 1005} {"train_loss": -39.09970474243164, "global_step": 121635, "epoch": 1005} {"train_loss": -39.312705993652344, "global_step": 121636, "epoch": 1005} {"train_loss": -38.99151611328125, "global_step": 121637, "epoch": 1005} {"train_loss": -39.53313064575195, "global_step": 121638, "epoch": 1005} {"train_loss": -39.516357421875, "global_step": 121639, "epoch": 1005} {"train_loss": -39.46065139770508, "global_step": 121640, "epoch": 1005} {"train_loss": -40.445465087890625, "global_step": 121641, "epoch": 1005} {"train_loss": -38.29595947265625, "global_step": 121642, "epoch": 1005} {"train_loss": -39.78806686401367, "global_step": 121643, "epoch": 1005} {"train_loss": -39.423126220703125, "global_step": 121644, "epoch": 1005} {"train_loss": -39.14301300048828, "global_step": 121645, "epoch": 1005} {"train_loss": -39.37005615234375, "global_step": 121646, "epoch": 1005} {"train_loss": -39.92244338989258, "global_step": 121647, "epoch": 1005} {"train_loss": -40.3360710144043, "global_step": 121648, "epoch": 1005} {"train_loss": -40.227874755859375, "global_step": 121649, "epoch": 1005} {"train_loss": -39.831668853759766, "global_step": 121650, "epoch": 1005} {"train_loss": -40.455047607421875, "global_step": 121651, "epoch": 1005} {"train_loss": -39.9964599609375, "global_step": 121652, "epoch": 1005} {"train_loss": -40.23904037475586, "global_step": 121653, "epoch": 1005} {"train_loss": -40.22089385986328, "global_step": 121654, "epoch": 1005} {"train_loss": -39.45630645751953, "global_step": 121655, "epoch": 1005} {"train_loss": -39.441497802734375, "global_step": 121656, "epoch": 1005} {"train_loss": -40.22877502441406, "global_step": 121657, "epoch": 1005} {"train_loss": -40.19936752319336, "global_step": 121658, "epoch": 1005} {"train_loss": -39.82869338989258, "global_step": 121659, "epoch": 1005} {"train_loss": -39.768638610839844, "global_step": 121660, "epoch": 1005} {"train_loss": -39.732425689697266, "global_step": 121661, "epoch": 1005} {"train_loss": -40.087703704833984, "global_step": 121662, "epoch": 1005} {"train_loss": -39.10047149658203, "global_step": 121663, "epoch": 1005} {"train_loss": -40.04684066772461, "global_step": 121664, "epoch": 1005} {"train_loss": -40.48310089111328, "global_step": 121665, "epoch": 1005} {"train_loss": -38.731353759765625, "global_step": 121666, "epoch": 1005} {"train_loss": -38.62099838256836, "global_step": 121667, "epoch": 1005} {"train_loss": -40.21919631958008, "global_step": 121668, "epoch": 1005} {"train_loss": -39.735511779785156, "global_step": 121669, "epoch": 1005} {"train_loss": -39.99435043334961, "global_step": 121670, "epoch": 1005} {"train_loss": -37.02435302734375, "global_step": 121671, "epoch": 1005} {"train_loss": -35.54264450073242, "global_step": 121672, "epoch": 1005} {"train_loss": -39.385128021240234, "global_step": 121673, "epoch": 1005} {"train_loss": -31.698637008666992, "global_step": 121674, "epoch": 1005} {"train_loss": -2.038378953933716, "global_step": 121675, "epoch": 1005} {"train_loss": 19.295413970947266, "global_step": 121676, "epoch": 1005} {"train_loss": -28.045578002929688, "global_step": 121677, "epoch": 1005} {"train_loss": -4.745699882507324, "global_step": 121678, "epoch": 1005} {"train_loss": -27.13197898864746, "global_step": 121679, "epoch": 1005} {"train_loss": -21.774709701538086, "global_step": 121680, "epoch": 1005} {"train_loss": -19.262191772460938, "global_step": 121681, "epoch": 1005} {"train_loss": -30.786359786987305, "global_step": 121682, "epoch": 1005} {"train_loss": -25.303518295288086, "global_step": 121683, "epoch": 1005} {"train_loss": -24.81282615661621, "global_step": 121684, "epoch": 1005} {"train_loss": -32.45479965209961, "global_step": 121685, "epoch": 1005} {"train_loss": -30.373764038085938, "global_step": 121686, "epoch": 1005} {"train_loss": -28.528711318969727, "global_step": 121687, "epoch": 1005} {"train_loss": -31.674850463867188, "global_step": 121688, "epoch": 1005} {"train_loss": -32.694175720214844, "global_step": 121689, "epoch": 1005} {"train_loss": -32.559322357177734, "global_step": 121690, "epoch": 1005} {"train_loss": -32.24648666381836, "global_step": 121691, "epoch": 1005} {"train_loss": -32.918968200683594, "global_step": 121692, "epoch": 1005} {"train_loss": -33.6882209777832, "global_step": 121693, "epoch": 1005} {"train_loss": -33.65681076049805, "global_step": 121694, "epoch": 1005} {"train_loss": -33.52920150756836, "global_step": 121695, "epoch": 1005} {"train_loss": -34.27363204956055, "global_step": 121696, "epoch": 1005} {"train_loss": -33.88734817504883, "global_step": 121697, "epoch": 1005} {"train_loss": -34.62640380859375, "global_step": 121698, "epoch": 1005} {"train_loss": -35.059967041015625, "global_step": 121699, "epoch": 1005} {"train_loss": -34.76804733276367, "global_step": 121700, "epoch": 1005} {"train_loss": -35.0739860534668, "global_step": 121701, "epoch": 1005} {"train_loss": -35.62263870239258, "global_step": 121702, "epoch": 1005} {"train_loss": -35.271575927734375, "global_step": 121703, "epoch": 1005} {"train_loss": -35.214630126953125, "global_step": 121704, "epoch": 1005} {"train_loss": -34.74116516113281, "global_step": 121705, "epoch": 1005} {"train_loss": -34.459712982177734, "global_step": 121706, "epoch": 1005} {"train_loss": -35.20430374145508, "global_step": 121707, "epoch": 1005} {"train_loss": -36.08091354370117, "global_step": 121708, "epoch": 1005} {"train_loss": -35.60244369506836, "global_step": 121709, "epoch": 1005} {"train_loss": -35.3740119934082, "global_step": 121710, "epoch": 1005} {"train_loss": -36.13194274902344, "global_step": 121711, "epoch": 1005} {"train_loss": -36.2563591003418, "global_step": 121712, "epoch": 1005} {"train_loss": -36.03684616088867, "global_step": 121713, "epoch": 1005} {"train_loss": -36.35680389404297, "global_step": 121714, "epoch": 1005} {"train_loss": -36.546783447265625, "global_step": 121715, "epoch": 1005} {"train_loss": -36.27632522583008, "global_step": 121716, "epoch": 1005} {"train_loss": -33.94484329223633, "global_step": 121717, "epoch": 1005} {"train_loss": -33.282020568847656, "global_step": 121718, "epoch": 1005} {"train_loss": -35.00955581665039, "global_step": 121719, "epoch": 1005} {"train_loss": -34.129425048828125, "global_step": 121720, "epoch": 1005} {"train_loss": -36.938350677490234, "global_step": 121721, "epoch": 1005} {"train_loss": -34.76969528198242, "global_step": 121722, "epoch": 1005} {"train_loss": -36.6397819519043, "global_step": 121723, "epoch": 1005} {"train_loss": -32.615631103515625, "global_step": 121724, "epoch": 1005} {"train_loss": -35.61483616671286, "global_step": 121725, "epoch": 1005, "val_loss": 2710369.75} {"train_loss": -26.799787521362305, "global_step": 121726, "epoch": 1006} {"train_loss": -37.29597473144531, "global_step": 121727, "epoch": 1006} {"train_loss": -31.20115089416504, "global_step": 121728, "epoch": 1006} {"train_loss": -35.940425872802734, "global_step": 121729, "epoch": 1006} {"train_loss": -32.50054168701172, "global_step": 121730, "epoch": 1006} {"train_loss": -36.008453369140625, "global_step": 121731, "epoch": 1006} {"train_loss": -35.80878829956055, "global_step": 121732, "epoch": 1006} {"train_loss": -35.25405502319336, "global_step": 121733, "epoch": 1006} {"train_loss": -36.49253463745117, "global_step": 121734, "epoch": 1006} {"train_loss": -35.28501892089844, "global_step": 121735, "epoch": 1006} {"train_loss": -36.645320892333984, "global_step": 121736, "epoch": 1006} {"train_loss": -36.414180755615234, "global_step": 121737, "epoch": 1006} {"train_loss": -35.9821662902832, "global_step": 121738, "epoch": 1006} {"train_loss": -36.5967903137207, "global_step": 121739, "epoch": 1006} {"train_loss": -36.36244583129883, "global_step": 121740, "epoch": 1006} {"train_loss": -36.27104568481445, "global_step": 121741, "epoch": 1006} {"train_loss": -36.40476608276367, "global_step": 121742, "epoch": 1006} {"train_loss": -36.95748519897461, "global_step": 121743, "epoch": 1006} {"train_loss": -36.77097702026367, "global_step": 121744, "epoch": 1006} {"train_loss": -36.53245162963867, "global_step": 121745, "epoch": 1006} {"train_loss": -36.98796844482422, "global_step": 121746, "epoch": 1006} {"train_loss": -37.20262145996094, "global_step": 121747, "epoch": 1006} {"train_loss": -37.21909713745117, "global_step": 121748, "epoch": 1006} {"train_loss": -37.53152084350586, "global_step": 121749, "epoch": 1006} {"train_loss": -36.35700607299805, "global_step": 121750, "epoch": 1006} {"train_loss": -35.24702835083008, "global_step": 121751, "epoch": 1006} {"train_loss": -34.54244613647461, "global_step": 121752, "epoch": 1006} {"train_loss": -36.16895294189453, "global_step": 121753, "epoch": 1006} {"train_loss": -37.466590881347656, "global_step": 121754, "epoch": 1006} {"train_loss": -35.672115325927734, "global_step": 121755, "epoch": 1006} {"train_loss": -36.92929458618164, "global_step": 121756, "epoch": 1006} {"train_loss": -36.9337043762207, "global_step": 121757, "epoch": 1006} {"train_loss": -36.72528076171875, "global_step": 121758, "epoch": 1006} {"train_loss": -37.30405807495117, "global_step": 121759, "epoch": 1006} {"train_loss": -36.348453521728516, "global_step": 121760, "epoch": 1006} {"train_loss": -37.300392150878906, "global_step": 121761, "epoch": 1006} {"train_loss": -36.689205169677734, "global_step": 121762, "epoch": 1006} {"train_loss": -37.28829574584961, "global_step": 121763, "epoch": 1006} {"train_loss": -37.17412567138672, "global_step": 121764, "epoch": 1006} {"train_loss": -36.856807708740234, "global_step": 121765, "epoch": 1006} {"train_loss": -37.80704879760742, "global_step": 121766, "epoch": 1006} {"train_loss": -37.3310432434082, "global_step": 121767, "epoch": 1006} {"train_loss": -37.531551361083984, "global_step": 121768, "epoch": 1006} {"train_loss": -37.45138931274414, "global_step": 121769, "epoch": 1006} {"train_loss": -37.93540573120117, "global_step": 121770, "epoch": 1006} {"train_loss": -37.58195114135742, "global_step": 121771, "epoch": 1006} {"train_loss": -37.25790023803711, "global_step": 121772, "epoch": 1006} {"train_loss": -37.50699996948242, "global_step": 121773, "epoch": 1006} {"train_loss": -37.813167572021484, "global_step": 121774, "epoch": 1006} {"train_loss": -38.030242919921875, "global_step": 121775, "epoch": 1006} {"train_loss": -38.2379264831543, "global_step": 121776, "epoch": 1006} {"train_loss": -37.8424186706543, "global_step": 121777, "epoch": 1006} {"train_loss": -38.36652374267578, "global_step": 121778, "epoch": 1006} {"train_loss": -38.229652404785156, "global_step": 121779, "epoch": 1006} {"train_loss": -38.252464294433594, "global_step": 121780, "epoch": 1006} {"train_loss": -37.75420379638672, "global_step": 121781, "epoch": 1006} {"train_loss": -36.680572509765625, "global_step": 121782, "epoch": 1006} {"train_loss": -36.15354537963867, "global_step": 121783, "epoch": 1006} {"train_loss": -37.36237716674805, "global_step": 121784, "epoch": 1006} {"train_loss": -38.02642059326172, "global_step": 121785, "epoch": 1006} {"train_loss": -37.85620880126953, "global_step": 121786, "epoch": 1006} {"train_loss": -37.944801330566406, "global_step": 121787, "epoch": 1006} {"train_loss": -38.332550048828125, "global_step": 121788, "epoch": 1006} {"train_loss": -37.73922348022461, "global_step": 121789, "epoch": 1006} {"train_loss": -38.44702911376953, "global_step": 121790, "epoch": 1006} {"train_loss": -37.6698112487793, "global_step": 121791, "epoch": 1006} {"train_loss": -37.96947479248047, "global_step": 121792, "epoch": 1006} {"train_loss": -38.35335159301758, "global_step": 121793, "epoch": 1006} {"train_loss": -38.556617736816406, "global_step": 121794, "epoch": 1006} {"train_loss": -39.15728759765625, "global_step": 121795, "epoch": 1006} {"train_loss": -38.11112976074219, "global_step": 121796, "epoch": 1006} {"train_loss": -38.1552734375, "global_step": 121797, "epoch": 1006} {"train_loss": -38.06539535522461, "global_step": 121798, "epoch": 1006} {"train_loss": -38.57551574707031, "global_step": 121799, "epoch": 1006} {"train_loss": -38.83933639526367, "global_step": 121800, "epoch": 1006} {"train_loss": -38.29935836791992, "global_step": 121801, "epoch": 1006} {"train_loss": -38.362327575683594, "global_step": 121802, "epoch": 1006} {"train_loss": -38.43442916870117, "global_step": 121803, "epoch": 1006} {"train_loss": -38.2656135559082, "global_step": 121804, "epoch": 1006} {"train_loss": -37.81703567504883, "global_step": 121805, "epoch": 1006} {"train_loss": -36.712642669677734, "global_step": 121806, "epoch": 1006} {"train_loss": -36.509517669677734, "global_step": 121807, "epoch": 1006} {"train_loss": -38.04007339477539, "global_step": 121808, "epoch": 1006} {"train_loss": -38.748146057128906, "global_step": 121809, "epoch": 1006} {"train_loss": -38.165157318115234, "global_step": 121810, "epoch": 1006} {"train_loss": -38.362823486328125, "global_step": 121811, "epoch": 1006} {"train_loss": -38.891807556152344, "global_step": 121812, "epoch": 1006} {"train_loss": -38.55852508544922, "global_step": 121813, "epoch": 1006} {"train_loss": -38.03894805908203, "global_step": 121814, "epoch": 1006} {"train_loss": -38.71586990356445, "global_step": 121815, "epoch": 1006} {"train_loss": -38.646846771240234, "global_step": 121816, "epoch": 1006} {"train_loss": -38.02363967895508, "global_step": 121817, "epoch": 1006} {"train_loss": -38.67313766479492, "global_step": 121818, "epoch": 1006} {"train_loss": -38.37553787231445, "global_step": 121819, "epoch": 1006} {"train_loss": -38.72663879394531, "global_step": 121820, "epoch": 1006} {"train_loss": -39.10352325439453, "global_step": 121821, "epoch": 1006} {"train_loss": -38.8516960144043, "global_step": 121822, "epoch": 1006} {"train_loss": -39.1677360534668, "global_step": 121823, "epoch": 1006} {"train_loss": -38.42715072631836, "global_step": 121824, "epoch": 1006} {"train_loss": -38.805206298828125, "global_step": 121825, "epoch": 1006} {"train_loss": -37.634883880615234, "global_step": 121826, "epoch": 1006} {"train_loss": -39.148250579833984, "global_step": 121827, "epoch": 1006} {"train_loss": -38.631954193115234, "global_step": 121828, "epoch": 1006} {"train_loss": -38.689998626708984, "global_step": 121829, "epoch": 1006} {"train_loss": -39.226722717285156, "global_step": 121830, "epoch": 1006} {"train_loss": -38.4338493347168, "global_step": 121831, "epoch": 1006} {"train_loss": -39.06852340698242, "global_step": 121832, "epoch": 1006} {"train_loss": -38.4072380065918, "global_step": 121833, "epoch": 1006} {"train_loss": -38.319400787353516, "global_step": 121834, "epoch": 1006} {"train_loss": -38.88228988647461, "global_step": 121835, "epoch": 1006} {"train_loss": -37.06768035888672, "global_step": 121836, "epoch": 1006} {"train_loss": -38.44851303100586, "global_step": 121837, "epoch": 1006} {"train_loss": -37.7841682434082, "global_step": 121838, "epoch": 1006} {"train_loss": -37.7765007019043, "global_step": 121839, "epoch": 1006} {"train_loss": -38.45209503173828, "global_step": 121840, "epoch": 1006} {"train_loss": -38.2321662902832, "global_step": 121841, "epoch": 1006} {"train_loss": -37.129539489746094, "global_step": 121842, "epoch": 1006} {"train_loss": -35.83177947998047, "global_step": 121843, "epoch": 1006} {"train_loss": -37.7000617980957, "global_step": 121844, "epoch": 1006} {"train_loss": -36.189659118652344, "global_step": 121845, "epoch": 1006} {"train_loss": -37.38813189041516, "global_step": 121846, "epoch": 1006, "val_loss": 2734550.75} {"train_loss": -34.519649505615234, "global_step": 121847, "epoch": 1007} {"train_loss": -33.56977081298828, "global_step": 121848, "epoch": 1007} {"train_loss": -30.5919246673584, "global_step": 121849, "epoch": 1007} {"train_loss": -33.14894104003906, "global_step": 121850, "epoch": 1007} {"train_loss": -34.498565673828125, "global_step": 121851, "epoch": 1007} {"train_loss": -31.35791015625, "global_step": 121852, "epoch": 1007} {"train_loss": -37.478248596191406, "global_step": 121853, "epoch": 1007} {"train_loss": -32.43564987182617, "global_step": 121854, "epoch": 1007} {"train_loss": -33.42509078979492, "global_step": 121855, "epoch": 1007} {"train_loss": -34.976375579833984, "global_step": 121856, "epoch": 1007} {"train_loss": -34.68661117553711, "global_step": 121857, "epoch": 1007} {"train_loss": -36.97930908203125, "global_step": 121858, "epoch": 1007} {"train_loss": -34.28865432739258, "global_step": 121859, "epoch": 1007} {"train_loss": -35.406620025634766, "global_step": 121860, "epoch": 1007} {"train_loss": -36.5076789855957, "global_step": 121861, "epoch": 1007} {"train_loss": -36.278316497802734, "global_step": 121862, "epoch": 1007} {"train_loss": -37.84035110473633, "global_step": 121863, "epoch": 1007} {"train_loss": -35.60670471191406, "global_step": 121864, "epoch": 1007} {"train_loss": -37.19039535522461, "global_step": 121865, "epoch": 1007} {"train_loss": -37.03660583496094, "global_step": 121866, "epoch": 1007} {"train_loss": -36.88276672363281, "global_step": 121867, "epoch": 1007} {"train_loss": -37.452056884765625, "global_step": 121868, "epoch": 1007} {"train_loss": -37.178462982177734, "global_step": 121869, "epoch": 1007} {"train_loss": -36.749629974365234, "global_step": 121870, "epoch": 1007} {"train_loss": -37.59119415283203, "global_step": 121871, "epoch": 1007} {"train_loss": -37.804805755615234, "global_step": 121872, "epoch": 1007} {"train_loss": -37.11072540283203, "global_step": 121873, "epoch": 1007} {"train_loss": -36.901981353759766, "global_step": 121874, "epoch": 1007} {"train_loss": -37.76749801635742, "global_step": 121875, "epoch": 1007} {"train_loss": -37.61528015136719, "global_step": 121876, "epoch": 1007} {"train_loss": -36.934226989746094, "global_step": 121877, "epoch": 1007} {"train_loss": -37.319210052490234, "global_step": 121878, "epoch": 1007} {"train_loss": -36.510284423828125, "global_step": 121879, "epoch": 1007} {"train_loss": -37.34053039550781, "global_step": 121880, "epoch": 1007} {"train_loss": -38.10375213623047, "global_step": 121881, "epoch": 1007} {"train_loss": -37.73099136352539, "global_step": 121882, "epoch": 1007} {"train_loss": -37.817317962646484, "global_step": 121883, "epoch": 1007} {"train_loss": -37.28224182128906, "global_step": 121884, "epoch": 1007} {"train_loss": -37.640106201171875, "global_step": 121885, "epoch": 1007} {"train_loss": -37.89921569824219, "global_step": 121886, "epoch": 1007} {"train_loss": -37.567626953125, "global_step": 121887, "epoch": 1007} {"train_loss": -36.591468811035156, "global_step": 121888, "epoch": 1007} {"train_loss": -37.44562911987305, "global_step": 121889, "epoch": 1007} {"train_loss": -37.83463668823242, "global_step": 121890, "epoch": 1007} {"train_loss": -37.655975341796875, "global_step": 121891, "epoch": 1007} {"train_loss": -37.81892013549805, "global_step": 121892, "epoch": 1007} {"train_loss": -37.94219970703125, "global_step": 121893, "epoch": 1007} {"train_loss": -37.949337005615234, "global_step": 121894, "epoch": 1007} {"train_loss": -36.9635124206543, "global_step": 121895, "epoch": 1007} {"train_loss": -38.0479850769043, "global_step": 121896, "epoch": 1007} {"train_loss": -37.13396072387695, "global_step": 121897, "epoch": 1007} {"train_loss": -37.68381881713867, "global_step": 121898, "epoch": 1007} {"train_loss": -37.203487396240234, "global_step": 121899, "epoch": 1007} {"train_loss": -37.39361572265625, "global_step": 121900, "epoch": 1007} {"train_loss": -37.044803619384766, "global_step": 121901, "epoch": 1007} {"train_loss": -37.80327224731445, "global_step": 121902, "epoch": 1007} {"train_loss": -38.43913650512695, "global_step": 121903, "epoch": 1007} {"train_loss": -37.82413864135742, "global_step": 121904, "epoch": 1007} {"train_loss": -37.36812973022461, "global_step": 121905, "epoch": 1007} {"train_loss": -38.45008087158203, "global_step": 121906, "epoch": 1007} {"train_loss": -37.602291107177734, "global_step": 121907, "epoch": 1007} {"train_loss": -38.134334564208984, "global_step": 121908, "epoch": 1007} {"train_loss": -38.77950668334961, "global_step": 121909, "epoch": 1007} {"train_loss": -38.91237258911133, "global_step": 121910, "epoch": 1007} {"train_loss": -38.0717658996582, "global_step": 121911, "epoch": 1007} {"train_loss": -38.72840118408203, "global_step": 121912, "epoch": 1007} {"train_loss": -38.74750518798828, "global_step": 121913, "epoch": 1007} {"train_loss": -38.5800666809082, "global_step": 121914, "epoch": 1007} {"train_loss": -38.68520736694336, "global_step": 121915, "epoch": 1007} {"train_loss": -38.584163665771484, "global_step": 121916, "epoch": 1007} {"train_loss": -38.024208068847656, "global_step": 121917, "epoch": 1007} {"train_loss": -36.14024353027344, "global_step": 121918, "epoch": 1007} {"train_loss": -35.48419952392578, "global_step": 121919, "epoch": 1007} {"train_loss": -38.187416076660156, "global_step": 121920, "epoch": 1007} {"train_loss": -38.44806671142578, "global_step": 121921, "epoch": 1007} {"train_loss": -38.679378509521484, "global_step": 121922, "epoch": 1007} {"train_loss": -37.992774963378906, "global_step": 121923, "epoch": 1007} {"train_loss": -38.49211120605469, "global_step": 121924, "epoch": 1007} {"train_loss": -38.64039993286133, "global_step": 121925, "epoch": 1007} {"train_loss": -38.35614776611328, "global_step": 121926, "epoch": 1007} {"train_loss": -39.167823791503906, "global_step": 121927, "epoch": 1007} {"train_loss": -37.65678787231445, "global_step": 121928, "epoch": 1007} {"train_loss": -37.747806549072266, "global_step": 121929, "epoch": 1007} {"train_loss": -38.689239501953125, "global_step": 121930, "epoch": 1007} {"train_loss": -38.82155227661133, "global_step": 121931, "epoch": 1007} {"train_loss": -38.06938552856445, "global_step": 121932, "epoch": 1007} {"train_loss": -38.07640075683594, "global_step": 121933, "epoch": 1007} {"train_loss": -37.65267562866211, "global_step": 121934, "epoch": 1007} {"train_loss": -39.29954147338867, "global_step": 121935, "epoch": 1007} {"train_loss": -38.90055847167969, "global_step": 121936, "epoch": 1007} {"train_loss": -35.664363861083984, "global_step": 121937, "epoch": 1007} {"train_loss": -39.03420639038086, "global_step": 121938, "epoch": 1007} {"train_loss": -37.98894500732422, "global_step": 121939, "epoch": 1007} {"train_loss": -39.144771575927734, "global_step": 121940, "epoch": 1007} {"train_loss": -38.74140167236328, "global_step": 121941, "epoch": 1007} {"train_loss": -39.170204162597656, "global_step": 121942, "epoch": 1007} {"train_loss": -39.033935546875, "global_step": 121943, "epoch": 1007} {"train_loss": -38.251617431640625, "global_step": 121944, "epoch": 1007} {"train_loss": -37.95265579223633, "global_step": 121945, "epoch": 1007} {"train_loss": -36.79086685180664, "global_step": 121946, "epoch": 1007} {"train_loss": -38.69200897216797, "global_step": 121947, "epoch": 1007} {"train_loss": -37.342796325683594, "global_step": 121948, "epoch": 1007} {"train_loss": -38.49477767944336, "global_step": 121949, "epoch": 1007} {"train_loss": -37.51839065551758, "global_step": 121950, "epoch": 1007} {"train_loss": -38.02787399291992, "global_step": 121951, "epoch": 1007} {"train_loss": -38.79082107543945, "global_step": 121952, "epoch": 1007} {"train_loss": -37.80889892578125, "global_step": 121953, "epoch": 1007} {"train_loss": -34.41371536254883, "global_step": 121954, "epoch": 1007} {"train_loss": -37.23904037475586, "global_step": 121955, "epoch": 1007} {"train_loss": -38.35920715332031, "global_step": 121956, "epoch": 1007} {"train_loss": -38.832393646240234, "global_step": 121957, "epoch": 1007} {"train_loss": -39.07553482055664, "global_step": 121958, "epoch": 1007} {"train_loss": -38.72712326049805, "global_step": 121959, "epoch": 1007} {"train_loss": -38.45685958862305, "global_step": 121960, "epoch": 1007} {"train_loss": -34.89051055908203, "global_step": 121961, "epoch": 1007} {"train_loss": -37.322418212890625, "global_step": 121962, "epoch": 1007} {"train_loss": -36.02286911010742, "global_step": 121963, "epoch": 1007} {"train_loss": -38.213470458984375, "global_step": 121964, "epoch": 1007} {"train_loss": -37.029598236083984, "global_step": 121965, "epoch": 1007} {"train_loss": -30.179981231689453, "global_step": 121966, "epoch": 1007} {"train_loss": -37.1880322133214, "global_step": 121967, "epoch": 1007, "val_loss": 2921755.75} {"train_loss": -36.4423942565918, "global_step": 121968, "epoch": 1008} {"train_loss": -17.80093765258789, "global_step": 121969, "epoch": 1008} {"train_loss": -34.4306526184082, "global_step": 121970, "epoch": 1008} {"train_loss": -30.6092472076416, "global_step": 121971, "epoch": 1008} {"train_loss": -29.422393798828125, "global_step": 121972, "epoch": 1008} {"train_loss": -32.43802261352539, "global_step": 121973, "epoch": 1008} {"train_loss": -32.93169403076172, "global_step": 121974, "epoch": 1008} {"train_loss": -33.783870697021484, "global_step": 121975, "epoch": 1008} {"train_loss": -23.473703384399414, "global_step": 121976, "epoch": 1008} {"train_loss": -34.5064582824707, "global_step": 121977, "epoch": 1008} {"train_loss": -36.70478439331055, "global_step": 121978, "epoch": 1008} {"train_loss": -30.72779655456543, "global_step": 121979, "epoch": 1008} {"train_loss": -31.167236328125, "global_step": 121980, "epoch": 1008} {"train_loss": -35.648048400878906, "global_step": 121981, "epoch": 1008} {"train_loss": -34.101070404052734, "global_step": 121982, "epoch": 1008} {"train_loss": -33.60123825073242, "global_step": 121983, "epoch": 1008} {"train_loss": -33.1788444519043, "global_step": 121984, "epoch": 1008} {"train_loss": -35.39093780517578, "global_step": 121985, "epoch": 1008} {"train_loss": -33.34416580200195, "global_step": 121986, "epoch": 1008} {"train_loss": -33.96018600463867, "global_step": 121987, "epoch": 1008} {"train_loss": -35.92592239379883, "global_step": 121988, "epoch": 1008} {"train_loss": -35.82876205444336, "global_step": 121989, "epoch": 1008} {"train_loss": -35.28409957885742, "global_step": 121990, "epoch": 1008} {"train_loss": -34.87273025512695, "global_step": 121991, "epoch": 1008} {"train_loss": -34.13047790527344, "global_step": 121992, "epoch": 1008} {"train_loss": -33.90935134887695, "global_step": 121993, "epoch": 1008} {"train_loss": -35.43191146850586, "global_step": 121994, "epoch": 1008} {"train_loss": -35.59120559692383, "global_step": 121995, "epoch": 1008} {"train_loss": -34.911964416503906, "global_step": 121996, "epoch": 1008} {"train_loss": -34.73038101196289, "global_step": 121997, "epoch": 1008} {"train_loss": -35.62876892089844, "global_step": 121998, "epoch": 1008} {"train_loss": -36.01616287231445, "global_step": 121999, "epoch": 1008} {"train_loss": -36.3659553527832, "global_step": 122000, "epoch": 1008} {"train_loss": -35.55983352661133, "global_step": 122001, "epoch": 1008} {"train_loss": -35.58477783203125, "global_step": 122002, "epoch": 1008} {"train_loss": -35.707298278808594, "global_step": 122003, "epoch": 1008} {"train_loss": -35.8338508605957, "global_step": 122004, "epoch": 1008} {"train_loss": -35.68821716308594, "global_step": 122005, "epoch": 1008} {"train_loss": -36.23603057861328, "global_step": 122006, "epoch": 1008} {"train_loss": -36.93087387084961, "global_step": 122007, "epoch": 1008} {"train_loss": -36.581878662109375, "global_step": 122008, "epoch": 1008} {"train_loss": -36.646541595458984, "global_step": 122009, "epoch": 1008} {"train_loss": -37.05658721923828, "global_step": 122010, "epoch": 1008} {"train_loss": -36.5477409362793, "global_step": 122011, "epoch": 1008} {"train_loss": -36.20512008666992, "global_step": 122012, "epoch": 1008} {"train_loss": -36.40243148803711, "global_step": 122013, "epoch": 1008} {"train_loss": -36.848876953125, "global_step": 122014, "epoch": 1008} {"train_loss": -36.30924987792969, "global_step": 122015, "epoch": 1008} {"train_loss": -36.80455780029297, "global_step": 122016, "epoch": 1008} {"train_loss": -36.756568908691406, "global_step": 122017, "epoch": 1008} {"train_loss": -35.64304733276367, "global_step": 122018, "epoch": 1008} {"train_loss": -36.87678146362305, "global_step": 122019, "epoch": 1008} {"train_loss": -36.173736572265625, "global_step": 122020, "epoch": 1008} {"train_loss": -36.587032318115234, "global_step": 122021, "epoch": 1008} {"train_loss": -36.61452865600586, "global_step": 122022, "epoch": 1008} {"train_loss": -37.5329475402832, "global_step": 122023, "epoch": 1008} {"train_loss": -37.185035705566406, "global_step": 122024, "epoch": 1008} {"train_loss": -36.5088996887207, "global_step": 122025, "epoch": 1008} {"train_loss": -37.30230712890625, "global_step": 122026, "epoch": 1008} {"train_loss": -36.188087463378906, "global_step": 122027, "epoch": 1008} {"train_loss": -37.4708366394043, "global_step": 122028, "epoch": 1008} {"train_loss": -36.237579345703125, "global_step": 122029, "epoch": 1008} {"train_loss": -37.90255355834961, "global_step": 122030, "epoch": 1008} {"train_loss": -37.024227142333984, "global_step": 122031, "epoch": 1008} {"train_loss": -37.33567428588867, "global_step": 122032, "epoch": 1008} {"train_loss": -36.46472930908203, "global_step": 122033, "epoch": 1008} {"train_loss": -38.088497161865234, "global_step": 122034, "epoch": 1008} {"train_loss": -37.3044548034668, "global_step": 122035, "epoch": 1008} {"train_loss": -37.326351165771484, "global_step": 122036, "epoch": 1008} {"train_loss": -36.50397491455078, "global_step": 122037, "epoch": 1008} {"train_loss": -37.50612258911133, "global_step": 122038, "epoch": 1008} {"train_loss": -37.492252349853516, "global_step": 122039, "epoch": 1008} {"train_loss": -38.351356506347656, "global_step": 122040, "epoch": 1008} {"train_loss": -37.89192581176758, "global_step": 122041, "epoch": 1008} {"train_loss": -38.13090133666992, "global_step": 122042, "epoch": 1008} {"train_loss": -37.74530792236328, "global_step": 122043, "epoch": 1008} {"train_loss": -38.184417724609375, "global_step": 122044, "epoch": 1008} {"train_loss": -38.06111526489258, "global_step": 122045, "epoch": 1008} {"train_loss": -38.113399505615234, "global_step": 122046, "epoch": 1008} {"train_loss": -37.96688461303711, "global_step": 122047, "epoch": 1008} {"train_loss": -37.566497802734375, "global_step": 122048, "epoch": 1008} {"train_loss": -38.14280319213867, "global_step": 122049, "epoch": 1008} {"train_loss": -38.43716049194336, "global_step": 122050, "epoch": 1008} {"train_loss": -37.71551513671875, "global_step": 122051, "epoch": 1008} {"train_loss": -38.081443786621094, "global_step": 122052, "epoch": 1008} {"train_loss": -37.725341796875, "global_step": 122053, "epoch": 1008} {"train_loss": -38.5966796875, "global_step": 122054, "epoch": 1008} {"train_loss": -38.33098602294922, "global_step": 122055, "epoch": 1008} {"train_loss": -38.159698486328125, "global_step": 122056, "epoch": 1008} {"train_loss": -38.45212173461914, "global_step": 122057, "epoch": 1008} {"train_loss": -38.29092788696289, "global_step": 122058, "epoch": 1008} {"train_loss": -38.689388275146484, "global_step": 122059, "epoch": 1008} {"train_loss": -38.241519927978516, "global_step": 122060, "epoch": 1008} {"train_loss": -38.37514877319336, "global_step": 122061, "epoch": 1008} {"train_loss": -38.00580596923828, "global_step": 122062, "epoch": 1008} {"train_loss": -38.0173454284668, "global_step": 122063, "epoch": 1008} {"train_loss": -38.53168869018555, "global_step": 122064, "epoch": 1008} {"train_loss": -39.01580047607422, "global_step": 122065, "epoch": 1008} {"train_loss": -38.51632308959961, "global_step": 122066, "epoch": 1008} {"train_loss": -38.37806701660156, "global_step": 122067, "epoch": 1008} {"train_loss": -38.813377380371094, "global_step": 122068, "epoch": 1008} {"train_loss": -38.75543975830078, "global_step": 122069, "epoch": 1008} {"train_loss": -38.529266357421875, "global_step": 122070, "epoch": 1008} {"train_loss": -38.35552978515625, "global_step": 122071, "epoch": 1008} {"train_loss": -37.30552673339844, "global_step": 122072, "epoch": 1008} {"train_loss": -37.56941223144531, "global_step": 122073, "epoch": 1008} {"train_loss": -37.51980209350586, "global_step": 122074, "epoch": 1008} {"train_loss": -38.150909423828125, "global_step": 122075, "epoch": 1008} {"train_loss": -38.78341293334961, "global_step": 122076, "epoch": 1008} {"train_loss": -38.82058334350586, "global_step": 122077, "epoch": 1008} {"train_loss": -38.70112991333008, "global_step": 122078, "epoch": 1008} {"train_loss": -38.878929138183594, "global_step": 122079, "epoch": 1008} {"train_loss": -38.943538665771484, "global_step": 122080, "epoch": 1008} {"train_loss": -38.6647834777832, "global_step": 122081, "epoch": 1008} {"train_loss": -38.87448501586914, "global_step": 122082, "epoch": 1008} {"train_loss": -37.756141662597656, "global_step": 122083, "epoch": 1008} {"train_loss": -38.0823860168457, "global_step": 122084, "epoch": 1008} {"train_loss": -37.69403839111328, "global_step": 122085, "epoch": 1008} {"train_loss": -37.28251266479492, "global_step": 122086, "epoch": 1008} {"train_loss": -37.096832275390625, "global_step": 122087, "epoch": 1008} {"train_loss": -36.41124632338847, "global_step": 122088, "epoch": 1008, "val_loss": 2615566.75} {"train_loss": -38.570167541503906, "global_step": 122089, "epoch": 1009} {"train_loss": -38.4281120300293, "global_step": 122090, "epoch": 1009} {"train_loss": -37.39469909667969, "global_step": 122091, "epoch": 1009} {"train_loss": -36.48533248901367, "global_step": 122092, "epoch": 1009} {"train_loss": -37.655147552490234, "global_step": 122093, "epoch": 1009} {"train_loss": -36.49845504760742, "global_step": 122094, "epoch": 1009} {"train_loss": -37.89111328125, "global_step": 122095, "epoch": 1009} {"train_loss": -37.19587707519531, "global_step": 122096, "epoch": 1009} {"train_loss": -38.172542572021484, "global_step": 122097, "epoch": 1009} {"train_loss": -38.4593620300293, "global_step": 122098, "epoch": 1009} {"train_loss": -38.13178634643555, "global_step": 122099, "epoch": 1009} {"train_loss": -38.41099166870117, "global_step": 122100, "epoch": 1009} {"train_loss": -39.16792297363281, "global_step": 122101, "epoch": 1009} {"train_loss": -38.62563705444336, "global_step": 122102, "epoch": 1009} {"train_loss": -38.76011276245117, "global_step": 122103, "epoch": 1009} {"train_loss": -38.399810791015625, "global_step": 122104, "epoch": 1009} {"train_loss": -38.98938751220703, "global_step": 122105, "epoch": 1009} {"train_loss": -38.355655670166016, "global_step": 122106, "epoch": 1009} {"train_loss": -38.99800491333008, "global_step": 122107, "epoch": 1009} {"train_loss": -38.49932098388672, "global_step": 122108, "epoch": 1009} {"train_loss": -37.42402267456055, "global_step": 122109, "epoch": 1009} {"train_loss": -39.09769821166992, "global_step": 122110, "epoch": 1009} {"train_loss": -37.972023010253906, "global_step": 122111, "epoch": 1009} {"train_loss": -38.94757080078125, "global_step": 122112, "epoch": 1009} {"train_loss": -39.24575424194336, "global_step": 122113, "epoch": 1009} {"train_loss": -37.578895568847656, "global_step": 122114, "epoch": 1009} {"train_loss": -38.631290435791016, "global_step": 122115, "epoch": 1009} {"train_loss": -38.587154388427734, "global_step": 122116, "epoch": 1009} {"train_loss": -39.12538528442383, "global_step": 122117, "epoch": 1009} {"train_loss": -39.34257125854492, "global_step": 122118, "epoch": 1009} {"train_loss": -38.576053619384766, "global_step": 122119, "epoch": 1009} {"train_loss": -32.03276443481445, "global_step": 122120, "epoch": 1009} {"train_loss": -37.76827621459961, "global_step": 122121, "epoch": 1009} {"train_loss": -38.40437698364258, "global_step": 122122, "epoch": 1009} {"train_loss": -32.6731071472168, "global_step": 122123, "epoch": 1009} {"train_loss": -35.12666702270508, "global_step": 122124, "epoch": 1009} {"train_loss": -37.42586898803711, "global_step": 122125, "epoch": 1009} {"train_loss": -31.197179794311523, "global_step": 122126, "epoch": 1009} {"train_loss": -30.34030532836914, "global_step": 122127, "epoch": 1009} {"train_loss": -37.68626022338867, "global_step": 122128, "epoch": 1009} {"train_loss": -35.00827407836914, "global_step": 122129, "epoch": 1009} {"train_loss": -36.74004364013672, "global_step": 122130, "epoch": 1009} {"train_loss": -37.481624603271484, "global_step": 122131, "epoch": 1009} {"train_loss": -36.234554290771484, "global_step": 122132, "epoch": 1009} {"train_loss": -36.72233963012695, "global_step": 122133, "epoch": 1009} {"train_loss": -33.05830001831055, "global_step": 122134, "epoch": 1009} {"train_loss": -26.82962989807129, "global_step": 122135, "epoch": 1009} {"train_loss": -33.630775451660156, "global_step": 122136, "epoch": 1009} {"train_loss": -26.588621139526367, "global_step": 122137, "epoch": 1009} {"train_loss": -34.65724563598633, "global_step": 122138, "epoch": 1009} {"train_loss": -35.358367919921875, "global_step": 122139, "epoch": 1009} {"train_loss": -35.38223648071289, "global_step": 122140, "epoch": 1009} {"train_loss": -34.818965911865234, "global_step": 122141, "epoch": 1009} {"train_loss": -35.40532684326172, "global_step": 122142, "epoch": 1009} {"train_loss": -36.18101119995117, "global_step": 122143, "epoch": 1009} {"train_loss": -32.30465316772461, "global_step": 122144, "epoch": 1009} {"train_loss": -36.886940002441406, "global_step": 122145, "epoch": 1009} {"train_loss": -32.139862060546875, "global_step": 122146, "epoch": 1009} {"train_loss": -36.864501953125, "global_step": 122147, "epoch": 1009} {"train_loss": -34.49702835083008, "global_step": 122148, "epoch": 1009} {"train_loss": -34.60951614379883, "global_step": 122149, "epoch": 1009} {"train_loss": -36.25205993652344, "global_step": 122150, "epoch": 1009} {"train_loss": 0.9662414789199829, "global_step": 122151, "epoch": 1009} {"train_loss": -22.58071517944336, "global_step": 122152, "epoch": 1009} {"train_loss": -34.65347671508789, "global_step": 122153, "epoch": 1009} {"train_loss": -33.20320510864258, "global_step": 122154, "epoch": 1009} {"train_loss": -30.780508041381836, "global_step": 122155, "epoch": 1009} {"train_loss": -33.02854537963867, "global_step": 122156, "epoch": 1009} {"train_loss": -31.609411239624023, "global_step": 122157, "epoch": 1009} {"train_loss": -32.09222412109375, "global_step": 122158, "epoch": 1009} {"train_loss": -29.103376388549805, "global_step": 122159, "epoch": 1009} {"train_loss": -32.10081481933594, "global_step": 122160, "epoch": 1009} {"train_loss": -32.65154266357422, "global_step": 122161, "epoch": 1009} {"train_loss": -33.97981262207031, "global_step": 122162, "epoch": 1009} {"train_loss": -32.25556182861328, "global_step": 122163, "epoch": 1009} {"train_loss": -35.177391052246094, "global_step": 122164, "epoch": 1009} {"train_loss": -34.41781234741211, "global_step": 122165, "epoch": 1009} {"train_loss": -28.718902587890625, "global_step": 122166, "epoch": 1009} {"train_loss": -27.09796714782715, "global_step": 122167, "epoch": 1009} {"train_loss": -33.759552001953125, "global_step": 122168, "epoch": 1009} {"train_loss": -34.48590087890625, "global_step": 122169, "epoch": 1009} {"train_loss": -33.94333267211914, "global_step": 122170, "epoch": 1009} {"train_loss": -34.129478454589844, "global_step": 122171, "epoch": 1009} {"train_loss": -35.652130126953125, "global_step": 122172, "epoch": 1009} {"train_loss": -33.45796585083008, "global_step": 122173, "epoch": 1009} {"train_loss": -35.06354522705078, "global_step": 122174, "epoch": 1009} {"train_loss": -35.52572250366211, "global_step": 122175, "epoch": 1009} {"train_loss": -35.8358039855957, "global_step": 122176, "epoch": 1009} {"train_loss": -35.94155502319336, "global_step": 122177, "epoch": 1009} {"train_loss": -35.55109786987305, "global_step": 122178, "epoch": 1009} {"train_loss": -36.075679779052734, "global_step": 122179, "epoch": 1009} {"train_loss": -35.57596206665039, "global_step": 122180, "epoch": 1009} {"train_loss": -35.198116302490234, "global_step": 122181, "epoch": 1009} {"train_loss": -35.48128890991211, "global_step": 122182, "epoch": 1009} {"train_loss": -35.87076187133789, "global_step": 122183, "epoch": 1009} {"train_loss": -36.25577926635742, "global_step": 122184, "epoch": 1009} {"train_loss": -35.6210823059082, "global_step": 122185, "epoch": 1009} {"train_loss": -35.725730895996094, "global_step": 122186, "epoch": 1009} {"train_loss": -36.19704055786133, "global_step": 122187, "epoch": 1009} {"train_loss": -36.09049606323242, "global_step": 122188, "epoch": 1009} {"train_loss": -35.255210876464844, "global_step": 122189, "epoch": 1009} {"train_loss": -35.66757583618164, "global_step": 122190, "epoch": 1009} {"train_loss": -36.249000549316406, "global_step": 122191, "epoch": 1009} {"train_loss": -36.42641830444336, "global_step": 122192, "epoch": 1009} {"train_loss": -36.429500579833984, "global_step": 122193, "epoch": 1009} {"train_loss": -35.17036437988281, "global_step": 122194, "epoch": 1009} {"train_loss": -36.46834945678711, "global_step": 122195, "epoch": 1009} {"train_loss": -36.85541915893555, "global_step": 122196, "epoch": 1009} {"train_loss": -36.76276779174805, "global_step": 122197, "epoch": 1009} {"train_loss": -35.837890625, "global_step": 122198, "epoch": 1009} {"train_loss": -36.50983810424805, "global_step": 122199, "epoch": 1009} {"train_loss": -35.740291595458984, "global_step": 122200, "epoch": 1009} {"train_loss": -36.43464279174805, "global_step": 122201, "epoch": 1009} {"train_loss": -36.42060089111328, "global_step": 122202, "epoch": 1009} {"train_loss": -36.58974075317383, "global_step": 122203, "epoch": 1009} {"train_loss": -36.582820892333984, "global_step": 122204, "epoch": 1009} {"train_loss": -36.91118240356445, "global_step": 122205, "epoch": 1009} {"train_loss": -36.856658935546875, "global_step": 122206, "epoch": 1009} {"train_loss": -37.083656311035156, "global_step": 122207, "epoch": 1009} {"train_loss": -36.652191162109375, "global_step": 122208, "epoch": 1009} {"train_loss": -35.25147143572815, "global_step": 122209, "epoch": 1009, "val_loss": 2572782.75} {"train_loss": -37.1661491394043, "global_step": 122210, "epoch": 1010} {"train_loss": -36.643856048583984, "global_step": 122211, "epoch": 1010} {"train_loss": -36.36711502075195, "global_step": 122212, "epoch": 1010} {"train_loss": -37.2313346862793, "global_step": 122213, "epoch": 1010} {"train_loss": -37.55290985107422, "global_step": 122214, "epoch": 1010} {"train_loss": -37.52708053588867, "global_step": 122215, "epoch": 1010} {"train_loss": -37.17722702026367, "global_step": 122216, "epoch": 1010} {"train_loss": -37.060359954833984, "global_step": 122217, "epoch": 1010} {"train_loss": -37.133113861083984, "global_step": 122218, "epoch": 1010} {"train_loss": -37.781097412109375, "global_step": 122219, "epoch": 1010} {"train_loss": -37.32942199707031, "global_step": 122220, "epoch": 1010} {"train_loss": -37.57728958129883, "global_step": 122221, "epoch": 1010} {"train_loss": -36.937042236328125, "global_step": 122222, "epoch": 1010} {"train_loss": -37.60140609741211, "global_step": 122223, "epoch": 1010} {"train_loss": -37.77323532104492, "global_step": 122224, "epoch": 1010} {"train_loss": -37.39559555053711, "global_step": 122225, "epoch": 1010} {"train_loss": -37.686004638671875, "global_step": 122226, "epoch": 1010} {"train_loss": -37.91209030151367, "global_step": 122227, "epoch": 1010} {"train_loss": -37.83109664916992, "global_step": 122228, "epoch": 1010} {"train_loss": -37.2336311340332, "global_step": 122229, "epoch": 1010} {"train_loss": -37.85848617553711, "global_step": 122230, "epoch": 1010} {"train_loss": -37.28156280517578, "global_step": 122231, "epoch": 1010} {"train_loss": -37.82648468017578, "global_step": 122232, "epoch": 1010} {"train_loss": -38.269798278808594, "global_step": 122233, "epoch": 1010} {"train_loss": -38.074031829833984, "global_step": 122234, "epoch": 1010} {"train_loss": -37.39448547363281, "global_step": 122235, "epoch": 1010} {"train_loss": -38.0974235534668, "global_step": 122236, "epoch": 1010} {"train_loss": -37.864315032958984, "global_step": 122237, "epoch": 1010} {"train_loss": -37.8208122253418, "global_step": 122238, "epoch": 1010} {"train_loss": -38.348907470703125, "global_step": 122239, "epoch": 1010} {"train_loss": -38.067256927490234, "global_step": 122240, "epoch": 1010} {"train_loss": -37.99019241333008, "global_step": 122241, "epoch": 1010} {"train_loss": -37.38032150268555, "global_step": 122242, "epoch": 1010} {"train_loss": -37.37885665893555, "global_step": 122243, "epoch": 1010} {"train_loss": -37.04865646362305, "global_step": 122244, "epoch": 1010} {"train_loss": -36.71826934814453, "global_step": 122245, "epoch": 1010} {"train_loss": -37.03129959106445, "global_step": 122246, "epoch": 1010} {"train_loss": -38.16805648803711, "global_step": 122247, "epoch": 1010} {"train_loss": -37.48038864135742, "global_step": 122248, "epoch": 1010} {"train_loss": -37.116573333740234, "global_step": 122249, "epoch": 1010} {"train_loss": -37.471309661865234, "global_step": 122250, "epoch": 1010} {"train_loss": -36.91301345825195, "global_step": 122251, "epoch": 1010} {"train_loss": -36.7607536315918, "global_step": 122252, "epoch": 1010} {"train_loss": -36.10730743408203, "global_step": 122253, "epoch": 1010} {"train_loss": -37.44808578491211, "global_step": 122254, "epoch": 1010} {"train_loss": -37.9144172668457, "global_step": 122255, "epoch": 1010} {"train_loss": -37.24067306518555, "global_step": 122256, "epoch": 1010} {"train_loss": -38.074649810791016, "global_step": 122257, "epoch": 1010} {"train_loss": -38.44904708862305, "global_step": 122258, "epoch": 1010} {"train_loss": -37.49723434448242, "global_step": 122259, "epoch": 1010} {"train_loss": -38.578861236572266, "global_step": 122260, "epoch": 1010} {"train_loss": -38.58521270751953, "global_step": 122261, "epoch": 1010} {"train_loss": -38.269527435302734, "global_step": 122262, "epoch": 1010} {"train_loss": -37.8199348449707, "global_step": 122263, "epoch": 1010} {"train_loss": -37.88985061645508, "global_step": 122264, "epoch": 1010} {"train_loss": -37.98776626586914, "global_step": 122265, "epoch": 1010} {"train_loss": -38.390689849853516, "global_step": 122266, "epoch": 1010} {"train_loss": -38.62478256225586, "global_step": 122267, "epoch": 1010} {"train_loss": -38.283016204833984, "global_step": 122268, "epoch": 1010} {"train_loss": -37.8318977355957, "global_step": 122269, "epoch": 1010} {"train_loss": -38.89876937866211, "global_step": 122270, "epoch": 1010} {"train_loss": -38.073394775390625, "global_step": 122271, "epoch": 1010} {"train_loss": -38.4897346496582, "global_step": 122272, "epoch": 1010} {"train_loss": -37.845027923583984, "global_step": 122273, "epoch": 1010} {"train_loss": -38.468536376953125, "global_step": 122274, "epoch": 1010} {"train_loss": -39.006961822509766, "global_step": 122275, "epoch": 1010} {"train_loss": -38.769771575927734, "global_step": 122276, "epoch": 1010} {"train_loss": -38.60563278198242, "global_step": 122277, "epoch": 1010} {"train_loss": -38.51343536376953, "global_step": 122278, "epoch": 1010} {"train_loss": -38.829689025878906, "global_step": 122279, "epoch": 1010} {"train_loss": -38.491729736328125, "global_step": 122280, "epoch": 1010} {"train_loss": -38.28994369506836, "global_step": 122281, "epoch": 1010} {"train_loss": -36.43500518798828, "global_step": 122282, "epoch": 1010} {"train_loss": -37.16367721557617, "global_step": 122283, "epoch": 1010} {"train_loss": -38.348655700683594, "global_step": 122284, "epoch": 1010} {"train_loss": -38.21012496948242, "global_step": 122285, "epoch": 1010} {"train_loss": -37.16132736206055, "global_step": 122286, "epoch": 1010} {"train_loss": -35.69899368286133, "global_step": 122287, "epoch": 1010} {"train_loss": -36.304222106933594, "global_step": 122288, "epoch": 1010} {"train_loss": -38.017982482910156, "global_step": 122289, "epoch": 1010} {"train_loss": -38.728450775146484, "global_step": 122290, "epoch": 1010} {"train_loss": -37.835411071777344, "global_step": 122291, "epoch": 1010} {"train_loss": -37.226478576660156, "global_step": 122292, "epoch": 1010} {"train_loss": -38.8175163269043, "global_step": 122293, "epoch": 1010} {"train_loss": -38.25839614868164, "global_step": 122294, "epoch": 1010} {"train_loss": -38.30421829223633, "global_step": 122295, "epoch": 1010} {"train_loss": -38.785762786865234, "global_step": 122296, "epoch": 1010} {"train_loss": -38.9067497253418, "global_step": 122297, "epoch": 1010} {"train_loss": -38.7288818359375, "global_step": 122298, "epoch": 1010} {"train_loss": -38.29423141479492, "global_step": 122299, "epoch": 1010} {"train_loss": -38.975276947021484, "global_step": 122300, "epoch": 1010} {"train_loss": -38.64022445678711, "global_step": 122301, "epoch": 1010} {"train_loss": -38.43495559692383, "global_step": 122302, "epoch": 1010} {"train_loss": -38.693641662597656, "global_step": 122303, "epoch": 1010} {"train_loss": -38.898765563964844, "global_step": 122304, "epoch": 1010} {"train_loss": -39.16205596923828, "global_step": 122305, "epoch": 1010} {"train_loss": -38.68796157836914, "global_step": 122306, "epoch": 1010} {"train_loss": -39.0982666015625, "global_step": 122307, "epoch": 1010} {"train_loss": -38.269439697265625, "global_step": 122308, "epoch": 1010} {"train_loss": -39.37932205200195, "global_step": 122309, "epoch": 1010} {"train_loss": -39.20894241333008, "global_step": 122310, "epoch": 1010} {"train_loss": -39.58228302001953, "global_step": 122311, "epoch": 1010} {"train_loss": -39.2641487121582, "global_step": 122312, "epoch": 1010} {"train_loss": -39.2275505065918, "global_step": 122313, "epoch": 1010} {"train_loss": -38.771270751953125, "global_step": 122314, "epoch": 1010} {"train_loss": -38.26707077026367, "global_step": 122315, "epoch": 1010} {"train_loss": -37.3581657409668, "global_step": 122316, "epoch": 1010} {"train_loss": -38.75323486328125, "global_step": 122317, "epoch": 1010} {"train_loss": -39.13796615600586, "global_step": 122318, "epoch": 1010} {"train_loss": -39.532562255859375, "global_step": 122319, "epoch": 1010} {"train_loss": -38.77003860473633, "global_step": 122320, "epoch": 1010} {"train_loss": -38.8254508972168, "global_step": 122321, "epoch": 1010} {"train_loss": -37.547523498535156, "global_step": 122322, "epoch": 1010} {"train_loss": -38.876766204833984, "global_step": 122323, "epoch": 1010} {"train_loss": -39.2943229675293, "global_step": 122324, "epoch": 1010} {"train_loss": -38.66615676879883, "global_step": 122325, "epoch": 1010} {"train_loss": -39.085323333740234, "global_step": 122326, "epoch": 1010} {"train_loss": -39.12907409667969, "global_step": 122327, "epoch": 1010} {"train_loss": -39.19955062866211, "global_step": 122328, "epoch": 1010} {"train_loss": -37.529415130615234, "global_step": 122329, "epoch": 1010} {"train_loss": -38.037585707735424, "global_step": 122330, "epoch": 1010, "val_loss": 2616799.75} {"train_loss": -38.599578857421875, "global_step": 122331, "epoch": 1011} {"train_loss": -37.45882797241211, "global_step": 122332, "epoch": 1011} {"train_loss": -37.53327178955078, "global_step": 122333, "epoch": 1011} {"train_loss": -38.319862365722656, "global_step": 122334, "epoch": 1011} {"train_loss": -39.7202262878418, "global_step": 122335, "epoch": 1011} {"train_loss": -36.35190963745117, "global_step": 122336, "epoch": 1011} {"train_loss": -35.77168655395508, "global_step": 122337, "epoch": 1011} {"train_loss": -34.60177230834961, "global_step": 122338, "epoch": 1011} {"train_loss": -35.779239654541016, "global_step": 122339, "epoch": 1011} {"train_loss": -37.18136978149414, "global_step": 122340, "epoch": 1011} {"train_loss": -36.38898468017578, "global_step": 122341, "epoch": 1011} {"train_loss": -37.62803649902344, "global_step": 122342, "epoch": 1011} {"train_loss": -38.423343658447266, "global_step": 122343, "epoch": 1011} {"train_loss": -36.07869338989258, "global_step": 122344, "epoch": 1011} {"train_loss": -37.486785888671875, "global_step": 122345, "epoch": 1011} {"train_loss": -38.367950439453125, "global_step": 122346, "epoch": 1011} {"train_loss": -37.744667053222656, "global_step": 122347, "epoch": 1011} {"train_loss": -38.325923919677734, "global_step": 122348, "epoch": 1011} {"train_loss": -37.701904296875, "global_step": 122349, "epoch": 1011} {"train_loss": -37.87278747558594, "global_step": 122350, "epoch": 1011} {"train_loss": -38.54174041748047, "global_step": 122351, "epoch": 1011} {"train_loss": -38.51554489135742, "global_step": 122352, "epoch": 1011} {"train_loss": -38.24266052246094, "global_step": 122353, "epoch": 1011} {"train_loss": -39.004615783691406, "global_step": 122354, "epoch": 1011} {"train_loss": -38.029151916503906, "global_step": 122355, "epoch": 1011} {"train_loss": -35.16608428955078, "global_step": 122356, "epoch": 1011} {"train_loss": -38.290184020996094, "global_step": 122357, "epoch": 1011} {"train_loss": -37.91324234008789, "global_step": 122358, "epoch": 1011} {"train_loss": -37.980621337890625, "global_step": 122359, "epoch": 1011} {"train_loss": -36.8870849609375, "global_step": 122360, "epoch": 1011} {"train_loss": -37.74969482421875, "global_step": 122361, "epoch": 1011} {"train_loss": -38.247291564941406, "global_step": 122362, "epoch": 1011} {"train_loss": -38.385257720947266, "global_step": 122363, "epoch": 1011} {"train_loss": -37.832157135009766, "global_step": 122364, "epoch": 1011} {"train_loss": -37.69916534423828, "global_step": 122365, "epoch": 1011} {"train_loss": -38.80097198486328, "global_step": 122366, "epoch": 1011} {"train_loss": -37.74851608276367, "global_step": 122367, "epoch": 1011} {"train_loss": -38.12803268432617, "global_step": 122368, "epoch": 1011} {"train_loss": -38.36348342895508, "global_step": 122369, "epoch": 1011} {"train_loss": -36.835994720458984, "global_step": 122370, "epoch": 1011} {"train_loss": -37.76697540283203, "global_step": 122371, "epoch": 1011} {"train_loss": -38.069332122802734, "global_step": 122372, "epoch": 1011} {"train_loss": -38.087825775146484, "global_step": 122373, "epoch": 1011} {"train_loss": -36.192874908447266, "global_step": 122374, "epoch": 1011} {"train_loss": -38.104759216308594, "global_step": 122375, "epoch": 1011} {"train_loss": -37.971275329589844, "global_step": 122376, "epoch": 1011} {"train_loss": -37.87746047973633, "global_step": 122377, "epoch": 1011} {"train_loss": -37.440574645996094, "global_step": 122378, "epoch": 1011} {"train_loss": -38.163490295410156, "global_step": 122379, "epoch": 1011} {"train_loss": -38.53924560546875, "global_step": 122380, "epoch": 1011} {"train_loss": -38.575408935546875, "global_step": 122381, "epoch": 1011} {"train_loss": -38.42436981201172, "global_step": 122382, "epoch": 1011} {"train_loss": -38.4432487487793, "global_step": 122383, "epoch": 1011} {"train_loss": -38.49860763549805, "global_step": 122384, "epoch": 1011} {"train_loss": -38.259830474853516, "global_step": 122385, "epoch": 1011} {"train_loss": -37.89559555053711, "global_step": 122386, "epoch": 1011} {"train_loss": -38.59833526611328, "global_step": 122387, "epoch": 1011} {"train_loss": -37.36379623413086, "global_step": 122388, "epoch": 1011} {"train_loss": -38.20878982543945, "global_step": 122389, "epoch": 1011} {"train_loss": -38.78340530395508, "global_step": 122390, "epoch": 1011} {"train_loss": -38.83713912963867, "global_step": 122391, "epoch": 1011} {"train_loss": -38.156028747558594, "global_step": 122392, "epoch": 1011} {"train_loss": -38.5624885559082, "global_step": 122393, "epoch": 1011} {"train_loss": -38.86684799194336, "global_step": 122394, "epoch": 1011} {"train_loss": -39.1130256652832, "global_step": 122395, "epoch": 1011} {"train_loss": -37.96639633178711, "global_step": 122396, "epoch": 1011} {"train_loss": -38.472084045410156, "global_step": 122397, "epoch": 1011} {"train_loss": -37.118038177490234, "global_step": 122398, "epoch": 1011} {"train_loss": -37.34332275390625, "global_step": 122399, "epoch": 1011} {"train_loss": -38.12570571899414, "global_step": 122400, "epoch": 1011} {"train_loss": -37.67397689819336, "global_step": 122401, "epoch": 1011} {"train_loss": -38.4336051940918, "global_step": 122402, "epoch": 1011} {"train_loss": -37.9453125, "global_step": 122403, "epoch": 1011} {"train_loss": -37.263946533203125, "global_step": 122404, "epoch": 1011} {"train_loss": -38.849090576171875, "global_step": 122405, "epoch": 1011} {"train_loss": -32.965797424316406, "global_step": 122406, "epoch": 1011} {"train_loss": -38.45852279663086, "global_step": 122407, "epoch": 1011} {"train_loss": -37.73421096801758, "global_step": 122408, "epoch": 1011} {"train_loss": -38.73651123046875, "global_step": 122409, "epoch": 1011} {"train_loss": -39.047725677490234, "global_step": 122410, "epoch": 1011} {"train_loss": -34.84992599487305, "global_step": 122411, "epoch": 1011} {"train_loss": -37.60681915283203, "global_step": 122412, "epoch": 1011} {"train_loss": -35.28834533691406, "global_step": 122413, "epoch": 1011} {"train_loss": -31.71979331970215, "global_step": 122414, "epoch": 1011} {"train_loss": -38.50849533081055, "global_step": 122415, "epoch": 1011} {"train_loss": -37.8421745300293, "global_step": 122416, "epoch": 1011} {"train_loss": -38.17841339111328, "global_step": 122417, "epoch": 1011} {"train_loss": -37.46849822998047, "global_step": 122418, "epoch": 1011} {"train_loss": -37.220252990722656, "global_step": 122419, "epoch": 1011} {"train_loss": -36.19838333129883, "global_step": 122420, "epoch": 1011} {"train_loss": -37.81480026245117, "global_step": 122421, "epoch": 1011} {"train_loss": -35.29730224609375, "global_step": 122422, "epoch": 1011} {"train_loss": -35.841548919677734, "global_step": 122423, "epoch": 1011} {"train_loss": -37.562957763671875, "global_step": 122424, "epoch": 1011} {"train_loss": -36.2401237487793, "global_step": 122425, "epoch": 1011} {"train_loss": -33.91230010986328, "global_step": 122426, "epoch": 1011} {"train_loss": -37.37870407104492, "global_step": 122427, "epoch": 1011} {"train_loss": -35.819637298583984, "global_step": 122428, "epoch": 1011} {"train_loss": -34.38692855834961, "global_step": 122429, "epoch": 1011} {"train_loss": -37.30915069580078, "global_step": 122430, "epoch": 1011} {"train_loss": -37.44139099121094, "global_step": 122431, "epoch": 1011} {"train_loss": -37.481346130371094, "global_step": 122432, "epoch": 1011} {"train_loss": -36.30683135986328, "global_step": 122433, "epoch": 1011} {"train_loss": -35.99003601074219, "global_step": 122434, "epoch": 1011} {"train_loss": -37.29916000366211, "global_step": 122435, "epoch": 1011} {"train_loss": -37.278961181640625, "global_step": 122436, "epoch": 1011} {"train_loss": -38.21547317504883, "global_step": 122437, "epoch": 1011} {"train_loss": -37.7852897644043, "global_step": 122438, "epoch": 1011} {"train_loss": -38.306617736816406, "global_step": 122439, "epoch": 1011} {"train_loss": -38.22776412963867, "global_step": 122440, "epoch": 1011} {"train_loss": -38.090980529785156, "global_step": 122441, "epoch": 1011} {"train_loss": -38.08589553833008, "global_step": 122442, "epoch": 1011} {"train_loss": -38.54317855834961, "global_step": 122443, "epoch": 1011} {"train_loss": -38.17988967895508, "global_step": 122444, "epoch": 1011} {"train_loss": -37.83152389526367, "global_step": 122445, "epoch": 1011} {"train_loss": -37.28802490234375, "global_step": 122446, "epoch": 1011} {"train_loss": -38.67927169799805, "global_step": 122447, "epoch": 1011} {"train_loss": -38.052852630615234, "global_step": 122448, "epoch": 1011} {"train_loss": -38.3787956237793, "global_step": 122449, "epoch": 1011} {"train_loss": -38.55498123168945, "global_step": 122450, "epoch": 1011} {"train_loss": -37.58381947604093, "global_step": 122451, "epoch": 1011, "val_loss": 2656067.0} {"train_loss": -38.179481506347656, "global_step": 122452, "epoch": 1012} {"train_loss": -37.06279373168945, "global_step": 122453, "epoch": 1012} {"train_loss": -38.649658203125, "global_step": 122454, "epoch": 1012} {"train_loss": -38.60639572143555, "global_step": 122455, "epoch": 1012} {"train_loss": -38.419673919677734, "global_step": 122456, "epoch": 1012} {"train_loss": -37.499507904052734, "global_step": 122457, "epoch": 1012} {"train_loss": -38.463497161865234, "global_step": 122458, "epoch": 1012} {"train_loss": -38.213924407958984, "global_step": 122459, "epoch": 1012} {"train_loss": -36.991546630859375, "global_step": 122460, "epoch": 1012} {"train_loss": -37.669578552246094, "global_step": 122461, "epoch": 1012} {"train_loss": -37.482967376708984, "global_step": 122462, "epoch": 1012} {"train_loss": -38.379844665527344, "global_step": 122463, "epoch": 1012} {"train_loss": -38.76845932006836, "global_step": 122464, "epoch": 1012} {"train_loss": -38.09017562866211, "global_step": 122465, "epoch": 1012} {"train_loss": -38.807579040527344, "global_step": 122466, "epoch": 1012} {"train_loss": -38.72004318237305, "global_step": 122467, "epoch": 1012} {"train_loss": -38.88274002075195, "global_step": 122468, "epoch": 1012} {"train_loss": -38.287628173828125, "global_step": 122469, "epoch": 1012} {"train_loss": -39.13474655151367, "global_step": 122470, "epoch": 1012} {"train_loss": -39.487701416015625, "global_step": 122471, "epoch": 1012} {"train_loss": -38.82586669921875, "global_step": 122472, "epoch": 1012} {"train_loss": -38.361167907714844, "global_step": 122473, "epoch": 1012} {"train_loss": -38.642822265625, "global_step": 122474, "epoch": 1012} {"train_loss": -38.114990234375, "global_step": 122475, "epoch": 1012} {"train_loss": -37.808284759521484, "global_step": 122476, "epoch": 1012} {"train_loss": -38.27582931518555, "global_step": 122477, "epoch": 1012} {"train_loss": -38.454933166503906, "global_step": 122478, "epoch": 1012} {"train_loss": -39.30526351928711, "global_step": 122479, "epoch": 1012} {"train_loss": -38.49867248535156, "global_step": 122480, "epoch": 1012} {"train_loss": -38.746578216552734, "global_step": 122481, "epoch": 1012} {"train_loss": -38.963741302490234, "global_step": 122482, "epoch": 1012} {"train_loss": -38.4473991394043, "global_step": 122483, "epoch": 1012} {"train_loss": -37.00428009033203, "global_step": 122484, "epoch": 1012} {"train_loss": -38.47015380859375, "global_step": 122485, "epoch": 1012} {"train_loss": -37.38552474975586, "global_step": 122486, "epoch": 1012} {"train_loss": -36.369529724121094, "global_step": 122487, "epoch": 1012} {"train_loss": -32.978973388671875, "global_step": 122488, "epoch": 1012} {"train_loss": -38.587867736816406, "global_step": 122489, "epoch": 1012} {"train_loss": -38.47686767578125, "global_step": 122490, "epoch": 1012} {"train_loss": -37.476280212402344, "global_step": 122491, "epoch": 1012} {"train_loss": -37.052337646484375, "global_step": 122492, "epoch": 1012} {"train_loss": -36.336181640625, "global_step": 122493, "epoch": 1012} {"train_loss": -34.94746017456055, "global_step": 122494, "epoch": 1012} {"train_loss": -34.220184326171875, "global_step": 122495, "epoch": 1012} {"train_loss": -35.9160041809082, "global_step": 122496, "epoch": 1012} {"train_loss": -38.23617172241211, "global_step": 122497, "epoch": 1012} {"train_loss": -34.01890563964844, "global_step": 122498, "epoch": 1012} {"train_loss": -32.303863525390625, "global_step": 122499, "epoch": 1012} {"train_loss": -34.57145309448242, "global_step": 122500, "epoch": 1012} {"train_loss": -35.8792610168457, "global_step": 122501, "epoch": 1012} {"train_loss": -35.80454635620117, "global_step": 122502, "epoch": 1012} {"train_loss": -33.35712814331055, "global_step": 122503, "epoch": 1012} {"train_loss": -34.09304428100586, "global_step": 122504, "epoch": 1012} {"train_loss": -37.820438385009766, "global_step": 122505, "epoch": 1012} {"train_loss": -35.080013275146484, "global_step": 122506, "epoch": 1012} {"train_loss": -36.397621154785156, "global_step": 122507, "epoch": 1012} {"train_loss": -36.58317184448242, "global_step": 122508, "epoch": 1012} {"train_loss": -36.54914474487305, "global_step": 122509, "epoch": 1012} {"train_loss": -34.92493438720703, "global_step": 122510, "epoch": 1012} {"train_loss": -36.87717819213867, "global_step": 122511, "epoch": 1012} {"train_loss": -35.53699493408203, "global_step": 122512, "epoch": 1012} {"train_loss": -36.388038635253906, "global_step": 122513, "epoch": 1012} {"train_loss": -36.373409271240234, "global_step": 122514, "epoch": 1012} {"train_loss": -38.1541862487793, "global_step": 122515, "epoch": 1012} {"train_loss": -35.000362396240234, "global_step": 122516, "epoch": 1012} {"train_loss": -35.562801361083984, "global_step": 122517, "epoch": 1012} {"train_loss": -37.769474029541016, "global_step": 122518, "epoch": 1012} {"train_loss": -37.289398193359375, "global_step": 122519, "epoch": 1012} {"train_loss": -36.79560089111328, "global_step": 122520, "epoch": 1012} {"train_loss": -37.144893646240234, "global_step": 122521, "epoch": 1012} {"train_loss": -34.43236541748047, "global_step": 122522, "epoch": 1012} {"train_loss": -36.57575225830078, "global_step": 122523, "epoch": 1012} {"train_loss": -35.55805206298828, "global_step": 122524, "epoch": 1012} {"train_loss": -34.89268112182617, "global_step": 122525, "epoch": 1012} {"train_loss": -37.084991455078125, "global_step": 122526, "epoch": 1012} {"train_loss": -37.12713623046875, "global_step": 122527, "epoch": 1012} {"train_loss": -36.80318832397461, "global_step": 122528, "epoch": 1012} {"train_loss": -37.00580978393555, "global_step": 122529, "epoch": 1012} {"train_loss": -36.28641128540039, "global_step": 122530, "epoch": 1012} {"train_loss": -37.02342224121094, "global_step": 122531, "epoch": 1012} {"train_loss": -36.23850631713867, "global_step": 122532, "epoch": 1012} {"train_loss": -37.18156814575195, "global_step": 122533, "epoch": 1012} {"train_loss": -37.81516647338867, "global_step": 122534, "epoch": 1012} {"train_loss": -37.01021957397461, "global_step": 122535, "epoch": 1012} {"train_loss": -37.02078628540039, "global_step": 122536, "epoch": 1012} {"train_loss": -37.66500473022461, "global_step": 122537, "epoch": 1012} {"train_loss": -36.829097747802734, "global_step": 122538, "epoch": 1012} {"train_loss": -38.026607513427734, "global_step": 122539, "epoch": 1012} {"train_loss": -37.485286712646484, "global_step": 122540, "epoch": 1012} {"train_loss": -38.251529693603516, "global_step": 122541, "epoch": 1012} {"train_loss": -37.63511276245117, "global_step": 122542, "epoch": 1012} {"train_loss": -36.74470138549805, "global_step": 122543, "epoch": 1012} {"train_loss": -37.468048095703125, "global_step": 122544, "epoch": 1012} {"train_loss": -37.67449951171875, "global_step": 122545, "epoch": 1012} {"train_loss": -38.26219177246094, "global_step": 122546, "epoch": 1012} {"train_loss": -37.180049896240234, "global_step": 122547, "epoch": 1012} {"train_loss": -37.415706634521484, "global_step": 122548, "epoch": 1012} {"train_loss": -38.07408142089844, "global_step": 122549, "epoch": 1012} {"train_loss": -37.23677062988281, "global_step": 122550, "epoch": 1012} {"train_loss": -37.97651290893555, "global_step": 122551, "epoch": 1012} {"train_loss": -37.42946243286133, "global_step": 122552, "epoch": 1012} {"train_loss": -37.631134033203125, "global_step": 122553, "epoch": 1012} {"train_loss": -38.09957504272461, "global_step": 122554, "epoch": 1012} {"train_loss": -37.5750617980957, "global_step": 122555, "epoch": 1012} {"train_loss": -38.23390197753906, "global_step": 122556, "epoch": 1012} {"train_loss": -38.516963958740234, "global_step": 122557, "epoch": 1012} {"train_loss": -38.311126708984375, "global_step": 122558, "epoch": 1012} {"train_loss": -37.90693283081055, "global_step": 122559, "epoch": 1012} {"train_loss": -37.9578742980957, "global_step": 122560, "epoch": 1012} {"train_loss": -37.98477554321289, "global_step": 122561, "epoch": 1012} {"train_loss": -38.40023422241211, "global_step": 122562, "epoch": 1012} {"train_loss": -37.816078186035156, "global_step": 122563, "epoch": 1012} {"train_loss": -38.92228317260742, "global_step": 122564, "epoch": 1012} {"train_loss": -38.13594436645508, "global_step": 122565, "epoch": 1012} {"train_loss": -38.797393798828125, "global_step": 122566, "epoch": 1012} {"train_loss": -38.859317779541016, "global_step": 122567, "epoch": 1012} {"train_loss": -38.414127349853516, "global_step": 122568, "epoch": 1012} {"train_loss": -38.840118408203125, "global_step": 122569, "epoch": 1012} {"train_loss": -38.153995513916016, "global_step": 122570, "epoch": 1012} {"train_loss": -38.387325286865234, "global_step": 122571, "epoch": 1012} {"train_loss": -37.33754537913425, "global_step": 122572, "epoch": 1012, "val_loss": 2663247.25} {"train_loss": -38.76698684692383, "global_step": 122573, "epoch": 1013} {"train_loss": -38.85430908203125, "global_step": 122574, "epoch": 1013} {"train_loss": -38.58315658569336, "global_step": 122575, "epoch": 1013} {"train_loss": -38.0141487121582, "global_step": 122576, "epoch": 1013} {"train_loss": -38.87968826293945, "global_step": 122577, "epoch": 1013} {"train_loss": -38.04462432861328, "global_step": 122578, "epoch": 1013} {"train_loss": -38.737342834472656, "global_step": 122579, "epoch": 1013} {"train_loss": -38.1522102355957, "global_step": 122580, "epoch": 1013} {"train_loss": -38.85968780517578, "global_step": 122581, "epoch": 1013} {"train_loss": -38.32847213745117, "global_step": 122582, "epoch": 1013} {"train_loss": -38.13347244262695, "global_step": 122583, "epoch": 1013} {"train_loss": -38.3414306640625, "global_step": 122584, "epoch": 1013} {"train_loss": -38.54293441772461, "global_step": 122585, "epoch": 1013} {"train_loss": -39.28782272338867, "global_step": 122586, "epoch": 1013} {"train_loss": -38.65886306762695, "global_step": 122587, "epoch": 1013} {"train_loss": -39.4206657409668, "global_step": 122588, "epoch": 1013} {"train_loss": -38.50771713256836, "global_step": 122589, "epoch": 1013} {"train_loss": -39.65787887573242, "global_step": 122590, "epoch": 1013} {"train_loss": -38.96977233886719, "global_step": 122591, "epoch": 1013} {"train_loss": -38.152679443359375, "global_step": 122592, "epoch": 1013} {"train_loss": -37.9221076965332, "global_step": 122593, "epoch": 1013} {"train_loss": -39.2960205078125, "global_step": 122594, "epoch": 1013} {"train_loss": -39.28523635864258, "global_step": 122595, "epoch": 1013} {"train_loss": -39.32638168334961, "global_step": 122596, "epoch": 1013} {"train_loss": -39.44255447387695, "global_step": 122597, "epoch": 1013} {"train_loss": -39.3580436706543, "global_step": 122598, "epoch": 1013} {"train_loss": -39.48527145385742, "global_step": 122599, "epoch": 1013} {"train_loss": -39.48857498168945, "global_step": 122600, "epoch": 1013} {"train_loss": -39.90394973754883, "global_step": 122601, "epoch": 1013} {"train_loss": -39.39131164550781, "global_step": 122602, "epoch": 1013} {"train_loss": -39.64014434814453, "global_step": 122603, "epoch": 1013} {"train_loss": -38.68593978881836, "global_step": 122604, "epoch": 1013} {"train_loss": -38.565887451171875, "global_step": 122605, "epoch": 1013} {"train_loss": -38.456748962402344, "global_step": 122606, "epoch": 1013} {"train_loss": -39.26198959350586, "global_step": 122607, "epoch": 1013} {"train_loss": -39.74544906616211, "global_step": 122608, "epoch": 1013} {"train_loss": -38.6351432800293, "global_step": 122609, "epoch": 1013} {"train_loss": -38.888336181640625, "global_step": 122610, "epoch": 1013} {"train_loss": -39.0387077331543, "global_step": 122611, "epoch": 1013} {"train_loss": -36.11334991455078, "global_step": 122612, "epoch": 1013} {"train_loss": -33.521156311035156, "global_step": 122613, "epoch": 1013} {"train_loss": -36.26431655883789, "global_step": 122614, "epoch": 1013} {"train_loss": -34.88422775268555, "global_step": 122615, "epoch": 1013} {"train_loss": -35.86729049682617, "global_step": 122616, "epoch": 1013} {"train_loss": -28.598407745361328, "global_step": 122617, "epoch": 1013} {"train_loss": -27.635913848876953, "global_step": 122618, "epoch": 1013} {"train_loss": -34.38220977783203, "global_step": 122619, "epoch": 1013} {"train_loss": -29.307178497314453, "global_step": 122620, "epoch": 1013} {"train_loss": -31.379852294921875, "global_step": 122621, "epoch": 1013} {"train_loss": -34.685298919677734, "global_step": 122622, "epoch": 1013} {"train_loss": -34.1397590637207, "global_step": 122623, "epoch": 1013} {"train_loss": -29.773035049438477, "global_step": 122624, "epoch": 1013} {"train_loss": -37.78939437866211, "global_step": 122625, "epoch": 1013} {"train_loss": -33.66535186767578, "global_step": 122626, "epoch": 1013} {"train_loss": -34.29594802856445, "global_step": 122627, "epoch": 1013} {"train_loss": -36.87032699584961, "global_step": 122628, "epoch": 1013} {"train_loss": -35.90790939331055, "global_step": 122629, "epoch": 1013} {"train_loss": -34.10624313354492, "global_step": 122630, "epoch": 1013} {"train_loss": -36.86292266845703, "global_step": 122631, "epoch": 1013} {"train_loss": -37.07967758178711, "global_step": 122632, "epoch": 1013} {"train_loss": -34.14394760131836, "global_step": 122633, "epoch": 1013} {"train_loss": -37.54777526855469, "global_step": 122634, "epoch": 1013} {"train_loss": -36.461116790771484, "global_step": 122635, "epoch": 1013} {"train_loss": -36.85598373413086, "global_step": 122636, "epoch": 1013} {"train_loss": -36.674713134765625, "global_step": 122637, "epoch": 1013} {"train_loss": -37.33025360107422, "global_step": 122638, "epoch": 1013} {"train_loss": -38.091552734375, "global_step": 122639, "epoch": 1013} {"train_loss": -35.999507904052734, "global_step": 122640, "epoch": 1013} {"train_loss": -37.968143463134766, "global_step": 122641, "epoch": 1013} {"train_loss": -37.36682891845703, "global_step": 122642, "epoch": 1013} {"train_loss": -38.05223846435547, "global_step": 122643, "epoch": 1013} {"train_loss": -38.19083023071289, "global_step": 122644, "epoch": 1013} {"train_loss": -38.05506896972656, "global_step": 122645, "epoch": 1013} {"train_loss": -38.27579879760742, "global_step": 122646, "epoch": 1013} {"train_loss": -38.383968353271484, "global_step": 122647, "epoch": 1013} {"train_loss": -38.712493896484375, "global_step": 122648, "epoch": 1013} {"train_loss": -37.866600036621094, "global_step": 122649, "epoch": 1013} {"train_loss": -37.71052169799805, "global_step": 122650, "epoch": 1013} {"train_loss": -37.189727783203125, "global_step": 122651, "epoch": 1013} {"train_loss": -38.2231559753418, "global_step": 122652, "epoch": 1013} {"train_loss": -38.444244384765625, "global_step": 122653, "epoch": 1013} {"train_loss": -38.35873031616211, "global_step": 122654, "epoch": 1013} {"train_loss": -38.88570785522461, "global_step": 122655, "epoch": 1013} {"train_loss": -38.79853057861328, "global_step": 122656, "epoch": 1013} {"train_loss": -38.72494125366211, "global_step": 122657, "epoch": 1013} {"train_loss": -38.69426345825195, "global_step": 122658, "epoch": 1013} {"train_loss": -38.578678131103516, "global_step": 122659, "epoch": 1013} {"train_loss": -38.67802429199219, "global_step": 122660, "epoch": 1013} {"train_loss": -38.86440658569336, "global_step": 122661, "epoch": 1013} {"train_loss": -38.22602462768555, "global_step": 122662, "epoch": 1013} {"train_loss": -38.53919219970703, "global_step": 122663, "epoch": 1013} {"train_loss": -39.1251106262207, "global_step": 122664, "epoch": 1013} {"train_loss": -38.4709358215332, "global_step": 122665, "epoch": 1013} {"train_loss": -39.08015441894531, "global_step": 122666, "epoch": 1013} {"train_loss": -39.12677764892578, "global_step": 122667, "epoch": 1013} {"train_loss": -39.20258712768555, "global_step": 122668, "epoch": 1013} {"train_loss": -39.70771408081055, "global_step": 122669, "epoch": 1013} {"train_loss": -39.14992141723633, "global_step": 122670, "epoch": 1013} {"train_loss": -39.23141098022461, "global_step": 122671, "epoch": 1013} {"train_loss": -38.95182418823242, "global_step": 122672, "epoch": 1013} {"train_loss": -39.43099594116211, "global_step": 122673, "epoch": 1013} {"train_loss": -39.47514724731445, "global_step": 122674, "epoch": 1013} {"train_loss": -38.80125045776367, "global_step": 122675, "epoch": 1013} {"train_loss": -39.77775192260742, "global_step": 122676, "epoch": 1013} {"train_loss": -39.206298828125, "global_step": 122677, "epoch": 1013} {"train_loss": -39.22007369995117, "global_step": 122678, "epoch": 1013} {"train_loss": -39.4727897644043, "global_step": 122679, "epoch": 1013} {"train_loss": -39.5527458190918, "global_step": 122680, "epoch": 1013} {"train_loss": -39.747920989990234, "global_step": 122681, "epoch": 1013} {"train_loss": -39.27395248413086, "global_step": 122682, "epoch": 1013} {"train_loss": -39.77301025390625, "global_step": 122683, "epoch": 1013} {"train_loss": -39.254493713378906, "global_step": 122684, "epoch": 1013} {"train_loss": -39.71151351928711, "global_step": 122685, "epoch": 1013} {"train_loss": -39.56388473510742, "global_step": 122686, "epoch": 1013} {"train_loss": -40.121891021728516, "global_step": 122687, "epoch": 1013} {"train_loss": -39.539756774902344, "global_step": 122688, "epoch": 1013} {"train_loss": -39.20817947387695, "global_step": 122689, "epoch": 1013} {"train_loss": -39.669349670410156, "global_step": 122690, "epoch": 1013} {"train_loss": -39.78828811645508, "global_step": 122691, "epoch": 1013} {"train_loss": -40.111019134521484, "global_step": 122692, "epoch": 1013} {"train_loss": -37.90149409711854, "global_step": 122693, "epoch": 1013, "val_loss": 2540925.75} {"train_loss": -38.90089797973633, "global_step": 122694, "epoch": 1014} {"train_loss": -38.974609375, "global_step": 122695, "epoch": 1014} {"train_loss": -38.71670150756836, "global_step": 122696, "epoch": 1014} {"train_loss": -38.889610290527344, "global_step": 122697, "epoch": 1014} {"train_loss": -39.991912841796875, "global_step": 122698, "epoch": 1014} {"train_loss": -40.18075942993164, "global_step": 122699, "epoch": 1014} {"train_loss": -39.53300094604492, "global_step": 122700, "epoch": 1014} {"train_loss": -39.06439208984375, "global_step": 122701, "epoch": 1014} {"train_loss": -38.61777877807617, "global_step": 122702, "epoch": 1014} {"train_loss": -39.28983688354492, "global_step": 122703, "epoch": 1014} {"train_loss": -39.3712158203125, "global_step": 122704, "epoch": 1014} {"train_loss": -37.173553466796875, "global_step": 122705, "epoch": 1014} {"train_loss": -37.36583709716797, "global_step": 122706, "epoch": 1014} {"train_loss": -38.48698806762695, "global_step": 122707, "epoch": 1014} {"train_loss": -37.3785514831543, "global_step": 122708, "epoch": 1014} {"train_loss": -36.960689544677734, "global_step": 122709, "epoch": 1014} {"train_loss": -36.01475143432617, "global_step": 122710, "epoch": 1014} {"train_loss": -37.575042724609375, "global_step": 122711, "epoch": 1014} {"train_loss": -37.74114227294922, "global_step": 122712, "epoch": 1014} {"train_loss": -37.64084243774414, "global_step": 122713, "epoch": 1014} {"train_loss": -38.1605339050293, "global_step": 122714, "epoch": 1014} {"train_loss": -39.165748596191406, "global_step": 122715, "epoch": 1014} {"train_loss": -39.18136215209961, "global_step": 122716, "epoch": 1014} {"train_loss": -39.11782455444336, "global_step": 122717, "epoch": 1014} {"train_loss": -38.284759521484375, "global_step": 122718, "epoch": 1014} {"train_loss": -38.35193634033203, "global_step": 122719, "epoch": 1014} {"train_loss": -38.551395416259766, "global_step": 122720, "epoch": 1014} {"train_loss": -37.81013870239258, "global_step": 122721, "epoch": 1014} {"train_loss": -38.80454635620117, "global_step": 122722, "epoch": 1014} {"train_loss": -39.07221603393555, "global_step": 122723, "epoch": 1014} {"train_loss": -39.15000534057617, "global_step": 122724, "epoch": 1014} {"train_loss": -39.170684814453125, "global_step": 122725, "epoch": 1014} {"train_loss": -38.82304763793945, "global_step": 122726, "epoch": 1014} {"train_loss": -38.661720275878906, "global_step": 122727, "epoch": 1014} {"train_loss": -38.75619888305664, "global_step": 122728, "epoch": 1014} {"train_loss": -38.81667709350586, "global_step": 122729, "epoch": 1014} {"train_loss": -39.0727653503418, "global_step": 122730, "epoch": 1014} {"train_loss": -38.47364044189453, "global_step": 122731, "epoch": 1014} {"train_loss": -38.20258331298828, "global_step": 122732, "epoch": 1014} {"train_loss": -38.5306396484375, "global_step": 122733, "epoch": 1014} {"train_loss": -38.872779846191406, "global_step": 122734, "epoch": 1014} {"train_loss": -39.2778434753418, "global_step": 122735, "epoch": 1014} {"train_loss": -38.5918083190918, "global_step": 122736, "epoch": 1014} {"train_loss": -38.32167434692383, "global_step": 122737, "epoch": 1014} {"train_loss": -39.18752670288086, "global_step": 122738, "epoch": 1014} {"train_loss": -39.35663604736328, "global_step": 122739, "epoch": 1014} {"train_loss": -38.44355010986328, "global_step": 122740, "epoch": 1014} {"train_loss": -38.61052322387695, "global_step": 122741, "epoch": 1014} {"train_loss": -39.27313232421875, "global_step": 122742, "epoch": 1014} {"train_loss": -39.25851058959961, "global_step": 122743, "epoch": 1014} {"train_loss": -38.33247375488281, "global_step": 122744, "epoch": 1014} {"train_loss": -38.33683395385742, "global_step": 122745, "epoch": 1014} {"train_loss": -38.710426330566406, "global_step": 122746, "epoch": 1014} {"train_loss": -39.4024658203125, "global_step": 122747, "epoch": 1014} {"train_loss": -38.97222900390625, "global_step": 122748, "epoch": 1014} {"train_loss": -38.829402923583984, "global_step": 122749, "epoch": 1014} {"train_loss": -39.83829879760742, "global_step": 122750, "epoch": 1014} {"train_loss": -39.03172302246094, "global_step": 122751, "epoch": 1014} {"train_loss": -39.50499725341797, "global_step": 122752, "epoch": 1014} {"train_loss": -39.7717170715332, "global_step": 122753, "epoch": 1014} {"train_loss": -39.498661041259766, "global_step": 122754, "epoch": 1014} {"train_loss": -38.28363800048828, "global_step": 122755, "epoch": 1014} {"train_loss": -39.05458450317383, "global_step": 122756, "epoch": 1014} {"train_loss": -39.76825714111328, "global_step": 122757, "epoch": 1014} {"train_loss": -39.293575286865234, "global_step": 122758, "epoch": 1014} {"train_loss": -39.38307571411133, "global_step": 122759, "epoch": 1014} {"train_loss": -39.270320892333984, "global_step": 122760, "epoch": 1014} {"train_loss": -39.36771774291992, "global_step": 122761, "epoch": 1014} {"train_loss": -39.73731231689453, "global_step": 122762, "epoch": 1014} {"train_loss": -39.34690475463867, "global_step": 122763, "epoch": 1014} {"train_loss": -39.52204895019531, "global_step": 122764, "epoch": 1014} {"train_loss": -39.614280700683594, "global_step": 122765, "epoch": 1014} {"train_loss": -38.820289611816406, "global_step": 122766, "epoch": 1014} {"train_loss": -39.737056732177734, "global_step": 122767, "epoch": 1014} {"train_loss": -39.29878616333008, "global_step": 122768, "epoch": 1014} {"train_loss": -37.601985931396484, "global_step": 122769, "epoch": 1014} {"train_loss": -38.8584098815918, "global_step": 122770, "epoch": 1014} {"train_loss": -25.880064010620117, "global_step": 122771, "epoch": 1014} {"train_loss": -38.7758674621582, "global_step": 122772, "epoch": 1014} {"train_loss": -29.32401466369629, "global_step": 122773, "epoch": 1014} {"train_loss": -22.115598678588867, "global_step": 122774, "epoch": 1014} {"train_loss": -6.9226250648498535, "global_step": 122775, "epoch": 1014} {"train_loss": -31.113555908203125, "global_step": 122776, "epoch": 1014} {"train_loss": -32.94221115112305, "global_step": 122777, "epoch": 1014} {"train_loss": -35.569366455078125, "global_step": 122778, "epoch": 1014} {"train_loss": -19.12957191467285, "global_step": 122779, "epoch": 1014} {"train_loss": -10.910715103149414, "global_step": 122780, "epoch": 1014} {"train_loss": -28.774295806884766, "global_step": 122781, "epoch": 1014} {"train_loss": -31.733173370361328, "global_step": 122782, "epoch": 1014} {"train_loss": -29.127094268798828, "global_step": 122783, "epoch": 1014} {"train_loss": -18.09866714477539, "global_step": 122784, "epoch": 1014} {"train_loss": -18.26692771911621, "global_step": 122785, "epoch": 1014} {"train_loss": -24.686410903930664, "global_step": 122786, "epoch": 1014} {"train_loss": -31.877058029174805, "global_step": 122787, "epoch": 1014} {"train_loss": -28.079511642456055, "global_step": 122788, "epoch": 1014} {"train_loss": -31.713489532470703, "global_step": 122789, "epoch": 1014} {"train_loss": -32.2614631652832, "global_step": 122790, "epoch": 1014} {"train_loss": -33.657222747802734, "global_step": 122791, "epoch": 1014} {"train_loss": -32.924861907958984, "global_step": 122792, "epoch": 1014} {"train_loss": -33.30094528198242, "global_step": 122793, "epoch": 1014} {"train_loss": -32.165863037109375, "global_step": 122794, "epoch": 1014} {"train_loss": -31.72006607055664, "global_step": 122795, "epoch": 1014} {"train_loss": -31.1378173828125, "global_step": 122796, "epoch": 1014} {"train_loss": -31.08197593688965, "global_step": 122797, "epoch": 1014} {"train_loss": -33.1114616394043, "global_step": 122798, "epoch": 1014} {"train_loss": -33.62751007080078, "global_step": 122799, "epoch": 1014} {"train_loss": -32.00628662109375, "global_step": 122800, "epoch": 1014} {"train_loss": -33.7830810546875, "global_step": 122801, "epoch": 1014} {"train_loss": -32.0604362487793, "global_step": 122802, "epoch": 1014} {"train_loss": -34.20414352416992, "global_step": 122803, "epoch": 1014} {"train_loss": -34.35593795776367, "global_step": 122804, "epoch": 1014} {"train_loss": -33.97418975830078, "global_step": 122805, "epoch": 1014} {"train_loss": -34.01571273803711, "global_step": 122806, "epoch": 1014} {"train_loss": -33.55080795288086, "global_step": 122807, "epoch": 1014} {"train_loss": -34.86175537109375, "global_step": 122808, "epoch": 1014} {"train_loss": -34.205997467041016, "global_step": 122809, "epoch": 1014} {"train_loss": -34.40699005126953, "global_step": 122810, "epoch": 1014} {"train_loss": -33.37600326538086, "global_step": 122811, "epoch": 1014} {"train_loss": -34.18083953857422, "global_step": 122812, "epoch": 1014} {"train_loss": -34.45719528198242, "global_step": 122813, "epoch": 1014} {"train_loss": -35.67327577023467, "global_step": 122814, "epoch": 1014, "val_loss": 2816210.75} {"train_loss": -35.68732452392578, "global_step": 122815, "epoch": 1015} {"train_loss": -35.11970138549805, "global_step": 122816, "epoch": 1015} {"train_loss": -35.02910232543945, "global_step": 122817, "epoch": 1015} {"train_loss": -34.15306854248047, "global_step": 122818, "epoch": 1015} {"train_loss": -34.319801330566406, "global_step": 122819, "epoch": 1015} {"train_loss": -35.46293258666992, "global_step": 122820, "epoch": 1015} {"train_loss": -35.39627456665039, "global_step": 122821, "epoch": 1015} {"train_loss": -35.0306396484375, "global_step": 122822, "epoch": 1015} {"train_loss": -35.66898727416992, "global_step": 122823, "epoch": 1015} {"train_loss": -35.36726760864258, "global_step": 122824, "epoch": 1015} {"train_loss": -35.782222747802734, "global_step": 122825, "epoch": 1015} {"train_loss": -36.1762809753418, "global_step": 122826, "epoch": 1015} {"train_loss": -36.19426345825195, "global_step": 122827, "epoch": 1015} {"train_loss": -35.65073776245117, "global_step": 122828, "epoch": 1015} {"train_loss": -35.982975006103516, "global_step": 122829, "epoch": 1015} {"train_loss": -36.057857513427734, "global_step": 122830, "epoch": 1015} {"train_loss": -35.9886474609375, "global_step": 122831, "epoch": 1015} {"train_loss": -36.40094757080078, "global_step": 122832, "epoch": 1015} {"train_loss": -35.83876037597656, "global_step": 122833, "epoch": 1015} {"train_loss": -35.11307907104492, "global_step": 122834, "epoch": 1015} {"train_loss": -36.14456558227539, "global_step": 122835, "epoch": 1015} {"train_loss": -35.74222946166992, "global_step": 122836, "epoch": 1015} {"train_loss": -35.32986831665039, "global_step": 122837, "epoch": 1015} {"train_loss": -36.51618576049805, "global_step": 122838, "epoch": 1015} {"train_loss": -35.773475646972656, "global_step": 122839, "epoch": 1015} {"train_loss": -36.81391906738281, "global_step": 122840, "epoch": 1015} {"train_loss": -35.56191635131836, "global_step": 122841, "epoch": 1015} {"train_loss": -36.67253112792969, "global_step": 122842, "epoch": 1015} {"train_loss": -35.5069580078125, "global_step": 122843, "epoch": 1015} {"train_loss": -36.412715911865234, "global_step": 122844, "epoch": 1015} {"train_loss": -36.53927993774414, "global_step": 122845, "epoch": 1015} {"train_loss": -36.856773376464844, "global_step": 122846, "epoch": 1015} {"train_loss": -35.19935989379883, "global_step": 122847, "epoch": 1015} {"train_loss": -36.56796646118164, "global_step": 122848, "epoch": 1015} {"train_loss": -36.4034423828125, "global_step": 122849, "epoch": 1015} {"train_loss": -36.77949142456055, "global_step": 122850, "epoch": 1015} {"train_loss": -36.90782165527344, "global_step": 122851, "epoch": 1015} {"train_loss": -37.629638671875, "global_step": 122852, "epoch": 1015} {"train_loss": -35.53498458862305, "global_step": 122853, "epoch": 1015} {"train_loss": -36.12705993652344, "global_step": 122854, "epoch": 1015} {"train_loss": -36.91562271118164, "global_step": 122855, "epoch": 1015} {"train_loss": -36.66789627075195, "global_step": 122856, "epoch": 1015} {"train_loss": -36.459442138671875, "global_step": 122857, "epoch": 1015} {"train_loss": -37.69382858276367, "global_step": 122858, "epoch": 1015} {"train_loss": -37.19870376586914, "global_step": 122859, "epoch": 1015} {"train_loss": -36.42957305908203, "global_step": 122860, "epoch": 1015} {"train_loss": -36.36759567260742, "global_step": 122861, "epoch": 1015} {"train_loss": -36.67412185668945, "global_step": 122862, "epoch": 1015} {"train_loss": -37.83369064331055, "global_step": 122863, "epoch": 1015} {"train_loss": -37.228702545166016, "global_step": 122864, "epoch": 1015} {"train_loss": -37.30437088012695, "global_step": 122865, "epoch": 1015} {"train_loss": -37.5628547668457, "global_step": 122866, "epoch": 1015} {"train_loss": -38.1762580871582, "global_step": 122867, "epoch": 1015} {"train_loss": -37.93546676635742, "global_step": 122868, "epoch": 1015} {"train_loss": -37.683837890625, "global_step": 122869, "epoch": 1015} {"train_loss": -37.97455978393555, "global_step": 122870, "epoch": 1015} {"train_loss": -37.14995574951172, "global_step": 122871, "epoch": 1015} {"train_loss": -36.56985092163086, "global_step": 122872, "epoch": 1015} {"train_loss": -37.236328125, "global_step": 122873, "epoch": 1015} {"train_loss": -36.776607513427734, "global_step": 122874, "epoch": 1015} {"train_loss": -37.58143615722656, "global_step": 122875, "epoch": 1015} {"train_loss": -38.29386520385742, "global_step": 122876, "epoch": 1015} {"train_loss": -37.556671142578125, "global_step": 122877, "epoch": 1015} {"train_loss": -37.93301010131836, "global_step": 122878, "epoch": 1015} {"train_loss": -38.49134826660156, "global_step": 122879, "epoch": 1015} {"train_loss": -37.903968811035156, "global_step": 122880, "epoch": 1015} {"train_loss": -37.95317459106445, "global_step": 122881, "epoch": 1015} {"train_loss": -36.83723068237305, "global_step": 122882, "epoch": 1015} {"train_loss": -37.50714874267578, "global_step": 122883, "epoch": 1015} {"train_loss": -38.19105911254883, "global_step": 122884, "epoch": 1015} {"train_loss": -38.20189666748047, "global_step": 122885, "epoch": 1015} {"train_loss": -38.18024826049805, "global_step": 122886, "epoch": 1015} {"train_loss": -38.398353576660156, "global_step": 122887, "epoch": 1015} {"train_loss": -39.10417556762695, "global_step": 122888, "epoch": 1015} {"train_loss": -37.87541580200195, "global_step": 122889, "epoch": 1015} {"train_loss": -38.919795989990234, "global_step": 122890, "epoch": 1015} {"train_loss": -38.429298400878906, "global_step": 122891, "epoch": 1015} {"train_loss": -37.862491607666016, "global_step": 122892, "epoch": 1015} {"train_loss": -38.829280853271484, "global_step": 122893, "epoch": 1015} {"train_loss": -38.432437896728516, "global_step": 122894, "epoch": 1015} {"train_loss": -38.50893783569336, "global_step": 122895, "epoch": 1015} {"train_loss": -38.37714767456055, "global_step": 122896, "epoch": 1015} {"train_loss": -37.38758850097656, "global_step": 122897, "epoch": 1015} {"train_loss": -37.88066482543945, "global_step": 122898, "epoch": 1015} {"train_loss": -38.37238693237305, "global_step": 122899, "epoch": 1015} {"train_loss": -37.93656921386719, "global_step": 122900, "epoch": 1015} {"train_loss": -37.35338592529297, "global_step": 122901, "epoch": 1015} {"train_loss": -37.57117462158203, "global_step": 122902, "epoch": 1015} {"train_loss": -37.759681701660156, "global_step": 122903, "epoch": 1015} {"train_loss": -38.25288009643555, "global_step": 122904, "epoch": 1015} {"train_loss": -37.90045928955078, "global_step": 122905, "epoch": 1015} {"train_loss": -37.06753158569336, "global_step": 122906, "epoch": 1015} {"train_loss": -38.00699996948242, "global_step": 122907, "epoch": 1015} {"train_loss": -38.351558685302734, "global_step": 122908, "epoch": 1015} {"train_loss": -38.0739631652832, "global_step": 122909, "epoch": 1015} {"train_loss": -35.52204132080078, "global_step": 122910, "epoch": 1015} {"train_loss": -37.617244720458984, "global_step": 122911, "epoch": 1015} {"train_loss": -38.0267448425293, "global_step": 122912, "epoch": 1015} {"train_loss": -37.34404754638672, "global_step": 122913, "epoch": 1015} {"train_loss": -38.183937072753906, "global_step": 122914, "epoch": 1015} {"train_loss": -38.34009552001953, "global_step": 122915, "epoch": 1015} {"train_loss": -38.40262985229492, "global_step": 122916, "epoch": 1015} {"train_loss": -38.66178512573242, "global_step": 122917, "epoch": 1015} {"train_loss": -38.3564338684082, "global_step": 122918, "epoch": 1015} {"train_loss": -37.90877914428711, "global_step": 122919, "epoch": 1015} {"train_loss": -37.5504150390625, "global_step": 122920, "epoch": 1015} {"train_loss": -37.93253707885742, "global_step": 122921, "epoch": 1015} {"train_loss": -38.31006622314453, "global_step": 122922, "epoch": 1015} {"train_loss": -38.453590393066406, "global_step": 122923, "epoch": 1015} {"train_loss": -37.63525390625, "global_step": 122924, "epoch": 1015} {"train_loss": -36.007354736328125, "global_step": 122925, "epoch": 1015} {"train_loss": -36.55108642578125, "global_step": 122926, "epoch": 1015} {"train_loss": -37.98569869995117, "global_step": 122927, "epoch": 1015} {"train_loss": -37.90932846069336, "global_step": 122928, "epoch": 1015} {"train_loss": -38.105445861816406, "global_step": 122929, "epoch": 1015} {"train_loss": -38.8446159362793, "global_step": 122930, "epoch": 1015} {"train_loss": -39.08189392089844, "global_step": 122931, "epoch": 1015} {"train_loss": -38.0103874206543, "global_step": 122932, "epoch": 1015} {"train_loss": -38.25019454956055, "global_step": 122933, "epoch": 1015} {"train_loss": -38.90454864501953, "global_step": 122934, "epoch": 1015} {"train_loss": -37.15105974181625, "global_step": 122935, "epoch": 1015, "val_loss": 2679594.0} {"train_loss": -33.94422912597656, "global_step": 122936, "epoch": 1016} {"train_loss": -34.64236068725586, "global_step": 122937, "epoch": 1016} {"train_loss": -38.516815185546875, "global_step": 122938, "epoch": 1016} {"train_loss": -34.44918441772461, "global_step": 122939, "epoch": 1016} {"train_loss": -34.69564437866211, "global_step": 122940, "epoch": 1016} {"train_loss": -38.76144027709961, "global_step": 122941, "epoch": 1016} {"train_loss": -37.502506256103516, "global_step": 122942, "epoch": 1016} {"train_loss": -37.63869857788086, "global_step": 122943, "epoch": 1016} {"train_loss": -35.97105407714844, "global_step": 122944, "epoch": 1016} {"train_loss": -36.71514892578125, "global_step": 122945, "epoch": 1016} {"train_loss": -38.203765869140625, "global_step": 122946, "epoch": 1016} {"train_loss": -38.679386138916016, "global_step": 122947, "epoch": 1016} {"train_loss": -36.61811828613281, "global_step": 122948, "epoch": 1016} {"train_loss": -37.5925178527832, "global_step": 122949, "epoch": 1016} {"train_loss": -35.89024353027344, "global_step": 122950, "epoch": 1016} {"train_loss": -38.05813217163086, "global_step": 122951, "epoch": 1016} {"train_loss": -38.19126510620117, "global_step": 122952, "epoch": 1016} {"train_loss": -38.04568862915039, "global_step": 122953, "epoch": 1016} {"train_loss": -38.77388381958008, "global_step": 122954, "epoch": 1016} {"train_loss": -38.89589309692383, "global_step": 122955, "epoch": 1016} {"train_loss": -38.26182174682617, "global_step": 122956, "epoch": 1016} {"train_loss": -37.40983963012695, "global_step": 122957, "epoch": 1016} {"train_loss": -38.63729476928711, "global_step": 122958, "epoch": 1016} {"train_loss": -37.761810302734375, "global_step": 122959, "epoch": 1016} {"train_loss": -38.504913330078125, "global_step": 122960, "epoch": 1016} {"train_loss": -38.33960723876953, "global_step": 122961, "epoch": 1016} {"train_loss": -37.09792709350586, "global_step": 122962, "epoch": 1016} {"train_loss": -38.10689163208008, "global_step": 122963, "epoch": 1016} {"train_loss": -36.366798400878906, "global_step": 122964, "epoch": 1016} {"train_loss": -37.93068313598633, "global_step": 122965, "epoch": 1016} {"train_loss": -36.39990234375, "global_step": 122966, "epoch": 1016} {"train_loss": -37.07497024536133, "global_step": 122967, "epoch": 1016} {"train_loss": -38.188838958740234, "global_step": 122968, "epoch": 1016} {"train_loss": -35.87211990356445, "global_step": 122969, "epoch": 1016} {"train_loss": -38.97738265991211, "global_step": 122970, "epoch": 1016} {"train_loss": -36.96917724609375, "global_step": 122971, "epoch": 1016} {"train_loss": -37.698097229003906, "global_step": 122972, "epoch": 1016} {"train_loss": -36.47471237182617, "global_step": 122973, "epoch": 1016} {"train_loss": -36.619667053222656, "global_step": 122974, "epoch": 1016} {"train_loss": -37.693233489990234, "global_step": 122975, "epoch": 1016} {"train_loss": -38.2635383605957, "global_step": 122976, "epoch": 1016} {"train_loss": -38.12621307373047, "global_step": 122977, "epoch": 1016} {"train_loss": -38.66059875488281, "global_step": 122978, "epoch": 1016} {"train_loss": -38.21900177001953, "global_step": 122979, "epoch": 1016} {"train_loss": -38.170467376708984, "global_step": 122980, "epoch": 1016} {"train_loss": -37.829978942871094, "global_step": 122981, "epoch": 1016} {"train_loss": -38.00954055786133, "global_step": 122982, "epoch": 1016} {"train_loss": -37.97806930541992, "global_step": 122983, "epoch": 1016} {"train_loss": -38.277374267578125, "global_step": 122984, "epoch": 1016} {"train_loss": -37.71269607543945, "global_step": 122985, "epoch": 1016} {"train_loss": -38.120174407958984, "global_step": 122986, "epoch": 1016} {"train_loss": -37.33091354370117, "global_step": 122987, "epoch": 1016} {"train_loss": -37.433162689208984, "global_step": 122988, "epoch": 1016} {"train_loss": -38.02204132080078, "global_step": 122989, "epoch": 1016} {"train_loss": -37.919734954833984, "global_step": 122990, "epoch": 1016} {"train_loss": -38.28304672241211, "global_step": 122991, "epoch": 1016} {"train_loss": -38.358917236328125, "global_step": 122992, "epoch": 1016} {"train_loss": -38.334259033203125, "global_step": 122993, "epoch": 1016} {"train_loss": -37.57244873046875, "global_step": 122994, "epoch": 1016} {"train_loss": -38.65414047241211, "global_step": 122995, "epoch": 1016} {"train_loss": -38.67454528808594, "global_step": 122996, "epoch": 1016} {"train_loss": -38.33673095703125, "global_step": 122997, "epoch": 1016} {"train_loss": -38.322811126708984, "global_step": 122998, "epoch": 1016} {"train_loss": -37.9772834777832, "global_step": 122999, "epoch": 1016} {"train_loss": -38.22861862182617, "global_step": 123000, "epoch": 1016} {"train_loss": -38.805416107177734, "global_step": 123001, "epoch": 1016} {"train_loss": -38.163307189941406, "global_step": 123002, "epoch": 1016} {"train_loss": -38.10740280151367, "global_step": 123003, "epoch": 1016} {"train_loss": -37.30808639526367, "global_step": 123004, "epoch": 1016} {"train_loss": -38.14474105834961, "global_step": 123005, "epoch": 1016} {"train_loss": -36.95258712768555, "global_step": 123006, "epoch": 1016} {"train_loss": -38.361412048339844, "global_step": 123007, "epoch": 1016} {"train_loss": -38.489315032958984, "global_step": 123008, "epoch": 1016} {"train_loss": -31.080657958984375, "global_step": 123009, "epoch": 1016} {"train_loss": -37.543697357177734, "global_step": 123010, "epoch": 1016} {"train_loss": -38.419185638427734, "global_step": 123011, "epoch": 1016} {"train_loss": -35.414833068847656, "global_step": 123012, "epoch": 1016} {"train_loss": -37.49225997924805, "global_step": 123013, "epoch": 1016} {"train_loss": -37.44752883911133, "global_step": 123014, "epoch": 1016} {"train_loss": -37.92882537841797, "global_step": 123015, "epoch": 1016} {"train_loss": -36.670833587646484, "global_step": 123016, "epoch": 1016} {"train_loss": -36.95901107788086, "global_step": 123017, "epoch": 1016} {"train_loss": -37.13545227050781, "global_step": 123018, "epoch": 1016} {"train_loss": -37.6505241394043, "global_step": 123019, "epoch": 1016} {"train_loss": -37.805694580078125, "global_step": 123020, "epoch": 1016} {"train_loss": -36.13603591918945, "global_step": 123021, "epoch": 1016} {"train_loss": -37.5880241394043, "global_step": 123022, "epoch": 1016} {"train_loss": -38.225955963134766, "global_step": 123023, "epoch": 1016} {"train_loss": -38.03627395629883, "global_step": 123024, "epoch": 1016} {"train_loss": -37.85974884033203, "global_step": 123025, "epoch": 1016} {"train_loss": -37.8385124206543, "global_step": 123026, "epoch": 1016} {"train_loss": -36.51849365234375, "global_step": 123027, "epoch": 1016} {"train_loss": -37.25738525390625, "global_step": 123028, "epoch": 1016} {"train_loss": -36.875831604003906, "global_step": 123029, "epoch": 1016} {"train_loss": -37.22487258911133, "global_step": 123030, "epoch": 1016} {"train_loss": -36.7130012512207, "global_step": 123031, "epoch": 1016} {"train_loss": -35.09113693237305, "global_step": 123032, "epoch": 1016} {"train_loss": -36.33259201049805, "global_step": 123033, "epoch": 1016} {"train_loss": -36.77082443237305, "global_step": 123034, "epoch": 1016} {"train_loss": -36.62079620361328, "global_step": 123035, "epoch": 1016} {"train_loss": -35.138893127441406, "global_step": 123036, "epoch": 1016} {"train_loss": -36.100826263427734, "global_step": 123037, "epoch": 1016} {"train_loss": -35.051429748535156, "global_step": 123038, "epoch": 1016} {"train_loss": -37.455806732177734, "global_step": 123039, "epoch": 1016} {"train_loss": -36.6116943359375, "global_step": 123040, "epoch": 1016} {"train_loss": -36.23908233642578, "global_step": 123041, "epoch": 1016} {"train_loss": -37.38462448120117, "global_step": 123042, "epoch": 1016} {"train_loss": -35.18520736694336, "global_step": 123043, "epoch": 1016} {"train_loss": -36.81031036376953, "global_step": 123044, "epoch": 1016} {"train_loss": -36.896419525146484, "global_step": 123045, "epoch": 1016} {"train_loss": -37.349361419677734, "global_step": 123046, "epoch": 1016} {"train_loss": -37.128475189208984, "global_step": 123047, "epoch": 1016} {"train_loss": -36.46848678588867, "global_step": 123048, "epoch": 1016} {"train_loss": -37.42033004760742, "global_step": 123049, "epoch": 1016} {"train_loss": -35.8902702331543, "global_step": 123050, "epoch": 1016} {"train_loss": -38.36418533325195, "global_step": 123051, "epoch": 1016} {"train_loss": -37.1926155090332, "global_step": 123052, "epoch": 1016} {"train_loss": -36.401336669921875, "global_step": 123053, "epoch": 1016} {"train_loss": -37.338104248046875, "global_step": 123054, "epoch": 1016} {"train_loss": -36.508270263671875, "global_step": 123055, "epoch": 1016} {"train_loss": -37.321002613414414, "global_step": 123056, "epoch": 1016, "val_loss": 2654241.75} {"train_loss": -37.17402267456055, "global_step": 123057, "epoch": 1017} {"train_loss": -35.85798263549805, "global_step": 123058, "epoch": 1017} {"train_loss": -37.40568161010742, "global_step": 123059, "epoch": 1017} {"train_loss": -37.34722900390625, "global_step": 123060, "epoch": 1017} {"train_loss": -35.58899688720703, "global_step": 123061, "epoch": 1017} {"train_loss": -35.99591064453125, "global_step": 123062, "epoch": 1017} {"train_loss": -36.18367385864258, "global_step": 123063, "epoch": 1017} {"train_loss": -37.90039825439453, "global_step": 123064, "epoch": 1017} {"train_loss": -36.706729888916016, "global_step": 123065, "epoch": 1017} {"train_loss": -35.7666130065918, "global_step": 123066, "epoch": 1017} {"train_loss": -35.384151458740234, "global_step": 123067, "epoch": 1017} {"train_loss": -37.75382614135742, "global_step": 123068, "epoch": 1017} {"train_loss": -37.43157958984375, "global_step": 123069, "epoch": 1017} {"train_loss": -37.007568359375, "global_step": 123070, "epoch": 1017} {"train_loss": -36.368934631347656, "global_step": 123071, "epoch": 1017} {"train_loss": -37.33135223388672, "global_step": 123072, "epoch": 1017} {"train_loss": -37.424739837646484, "global_step": 123073, "epoch": 1017} {"train_loss": -36.35946273803711, "global_step": 123074, "epoch": 1017} {"train_loss": -37.67951583862305, "global_step": 123075, "epoch": 1017} {"train_loss": -37.11456298828125, "global_step": 123076, "epoch": 1017} {"train_loss": -37.889892578125, "global_step": 123077, "epoch": 1017} {"train_loss": -35.93830490112305, "global_step": 123078, "epoch": 1017} {"train_loss": -38.30501937866211, "global_step": 123079, "epoch": 1017} {"train_loss": -37.57996368408203, "global_step": 123080, "epoch": 1017} {"train_loss": -37.541351318359375, "global_step": 123081, "epoch": 1017} {"train_loss": -37.72325134277344, "global_step": 123082, "epoch": 1017} {"train_loss": -37.01367950439453, "global_step": 123083, "epoch": 1017} {"train_loss": -38.1002311706543, "global_step": 123084, "epoch": 1017} {"train_loss": -37.343814849853516, "global_step": 123085, "epoch": 1017} {"train_loss": -37.8491096496582, "global_step": 123086, "epoch": 1017} {"train_loss": -36.86050033569336, "global_step": 123087, "epoch": 1017} {"train_loss": -38.44709014892578, "global_step": 123088, "epoch": 1017} {"train_loss": -37.5953369140625, "global_step": 123089, "epoch": 1017} {"train_loss": -38.32413864135742, "global_step": 123090, "epoch": 1017} {"train_loss": -37.956050872802734, "global_step": 123091, "epoch": 1017} {"train_loss": -38.41773986816406, "global_step": 123092, "epoch": 1017} {"train_loss": -37.68413162231445, "global_step": 123093, "epoch": 1017} {"train_loss": -37.39161682128906, "global_step": 123094, "epoch": 1017} {"train_loss": -37.962860107421875, "global_step": 123095, "epoch": 1017} {"train_loss": -38.03829574584961, "global_step": 123096, "epoch": 1017} {"train_loss": -37.759639739990234, "global_step": 123097, "epoch": 1017} {"train_loss": -37.19807815551758, "global_step": 123098, "epoch": 1017} {"train_loss": -38.141727447509766, "global_step": 123099, "epoch": 1017} {"train_loss": -37.96730422973633, "global_step": 123100, "epoch": 1017} {"train_loss": -36.99631881713867, "global_step": 123101, "epoch": 1017} {"train_loss": -36.79616165161133, "global_step": 123102, "epoch": 1017} {"train_loss": -36.046077728271484, "global_step": 123103, "epoch": 1017} {"train_loss": -36.07368087768555, "global_step": 123104, "epoch": 1017} {"train_loss": -38.2398796081543, "global_step": 123105, "epoch": 1017} {"train_loss": -37.13045883178711, "global_step": 123106, "epoch": 1017} {"train_loss": -36.0512809753418, "global_step": 123107, "epoch": 1017} {"train_loss": -35.17831039428711, "global_step": 123108, "epoch": 1017} {"train_loss": -37.460243225097656, "global_step": 123109, "epoch": 1017} {"train_loss": -38.260860443115234, "global_step": 123110, "epoch": 1017} {"train_loss": -36.04775619506836, "global_step": 123111, "epoch": 1017} {"train_loss": -34.28858184814453, "global_step": 123112, "epoch": 1017} {"train_loss": -39.12250518798828, "global_step": 123113, "epoch": 1017} {"train_loss": -37.07338333129883, "global_step": 123114, "epoch": 1017} {"train_loss": -37.38927459716797, "global_step": 123115, "epoch": 1017} {"train_loss": -37.84090805053711, "global_step": 123116, "epoch": 1017} {"train_loss": -36.03853988647461, "global_step": 123117, "epoch": 1017} {"train_loss": -38.19649887084961, "global_step": 123118, "epoch": 1017} {"train_loss": -37.948944091796875, "global_step": 123119, "epoch": 1017} {"train_loss": -37.769283294677734, "global_step": 123120, "epoch": 1017} {"train_loss": -37.800941467285156, "global_step": 123121, "epoch": 1017} {"train_loss": -38.029476165771484, "global_step": 123122, "epoch": 1017} {"train_loss": -37.71856689453125, "global_step": 123123, "epoch": 1017} {"train_loss": -37.52649688720703, "global_step": 123124, "epoch": 1017} {"train_loss": -38.10924530029297, "global_step": 123125, "epoch": 1017} {"train_loss": -37.06183624267578, "global_step": 123126, "epoch": 1017} {"train_loss": -38.96245193481445, "global_step": 123127, "epoch": 1017} {"train_loss": -36.69342041015625, "global_step": 123128, "epoch": 1017} {"train_loss": -38.50358200073242, "global_step": 123129, "epoch": 1017} {"train_loss": -38.758785247802734, "global_step": 123130, "epoch": 1017} {"train_loss": -38.214744567871094, "global_step": 123131, "epoch": 1017} {"train_loss": -38.073543548583984, "global_step": 123132, "epoch": 1017} {"train_loss": -38.318885803222656, "global_step": 123133, "epoch": 1017} {"train_loss": -38.018733978271484, "global_step": 123134, "epoch": 1017} {"train_loss": -38.42604446411133, "global_step": 123135, "epoch": 1017} {"train_loss": -38.642032623291016, "global_step": 123136, "epoch": 1017} {"train_loss": -37.94256591796875, "global_step": 123137, "epoch": 1017} {"train_loss": -38.039642333984375, "global_step": 123138, "epoch": 1017} {"train_loss": -38.29761505126953, "global_step": 123139, "epoch": 1017} {"train_loss": -38.80253982543945, "global_step": 123140, "epoch": 1017} {"train_loss": -38.71170425415039, "global_step": 123141, "epoch": 1017} {"train_loss": -38.57155227661133, "global_step": 123142, "epoch": 1017} {"train_loss": -37.98740768432617, "global_step": 123143, "epoch": 1017} {"train_loss": -38.642452239990234, "global_step": 123144, "epoch": 1017} {"train_loss": -38.76294708251953, "global_step": 123145, "epoch": 1017} {"train_loss": -38.608795166015625, "global_step": 123146, "epoch": 1017} {"train_loss": -38.7535514831543, "global_step": 123147, "epoch": 1017} {"train_loss": -39.76152420043945, "global_step": 123148, "epoch": 1017} {"train_loss": -38.81596374511719, "global_step": 123149, "epoch": 1017} {"train_loss": -39.41212463378906, "global_step": 123150, "epoch": 1017} {"train_loss": -39.045082092285156, "global_step": 123151, "epoch": 1017} {"train_loss": -39.117897033691406, "global_step": 123152, "epoch": 1017} {"train_loss": -39.176753997802734, "global_step": 123153, "epoch": 1017} {"train_loss": -38.72943115234375, "global_step": 123154, "epoch": 1017} {"train_loss": -39.18349075317383, "global_step": 123155, "epoch": 1017} {"train_loss": -39.5764274597168, "global_step": 123156, "epoch": 1017} {"train_loss": -38.693050384521484, "global_step": 123157, "epoch": 1017} {"train_loss": -39.00486373901367, "global_step": 123158, "epoch": 1017} {"train_loss": -39.19129943847656, "global_step": 123159, "epoch": 1017} {"train_loss": -39.24982833862305, "global_step": 123160, "epoch": 1017} {"train_loss": -39.824153900146484, "global_step": 123161, "epoch": 1017} {"train_loss": -39.20029830932617, "global_step": 123162, "epoch": 1017} {"train_loss": -39.71208190917969, "global_step": 123163, "epoch": 1017} {"train_loss": -39.813045501708984, "global_step": 123164, "epoch": 1017} {"train_loss": -39.25606155395508, "global_step": 123165, "epoch": 1017} {"train_loss": -39.64571762084961, "global_step": 123166, "epoch": 1017} {"train_loss": -39.3159294128418, "global_step": 123167, "epoch": 1017} {"train_loss": -39.995391845703125, "global_step": 123168, "epoch": 1017} {"train_loss": -39.547096252441406, "global_step": 123169, "epoch": 1017} {"train_loss": -39.445098876953125, "global_step": 123170, "epoch": 1017} {"train_loss": -39.42196273803711, "global_step": 123171, "epoch": 1017} {"train_loss": -39.3121337890625, "global_step": 123172, "epoch": 1017} {"train_loss": -38.887081146240234, "global_step": 123173, "epoch": 1017} {"train_loss": -39.82194900512695, "global_step": 123174, "epoch": 1017} {"train_loss": -39.420753479003906, "global_step": 123175, "epoch": 1017} {"train_loss": -39.562110900878906, "global_step": 123176, "epoch": 1017} {"train_loss": -37.95911114274963, "global_step": 123177, "epoch": 1017, "val_loss": 2641053.75} {"train_loss": -39.296504974365234, "global_step": 123178, "epoch": 1018} {"train_loss": -39.42783737182617, "global_step": 123179, "epoch": 1018} {"train_loss": -38.29069137573242, "global_step": 123180, "epoch": 1018} {"train_loss": -39.16267776489258, "global_step": 123181, "epoch": 1018} {"train_loss": -39.77262878417969, "global_step": 123182, "epoch": 1018} {"train_loss": -39.86647415161133, "global_step": 123183, "epoch": 1018} {"train_loss": -39.75485610961914, "global_step": 123184, "epoch": 1018} {"train_loss": -39.217952728271484, "global_step": 123185, "epoch": 1018} {"train_loss": -34.154563903808594, "global_step": 123186, "epoch": 1018} {"train_loss": -27.91522789001465, "global_step": 123187, "epoch": 1018} {"train_loss": -13.092005729675293, "global_step": 123188, "epoch": 1018} {"train_loss": -4.803733825683594, "global_step": 123189, "epoch": 1018} {"train_loss": -25.911840438842773, "global_step": 123190, "epoch": 1018} {"train_loss": -30.54355239868164, "global_step": 123191, "epoch": 1018} {"train_loss": -24.964405059814453, "global_step": 123192, "epoch": 1018} {"train_loss": -32.85663986206055, "global_step": 123193, "epoch": 1018} {"train_loss": -32.72806930541992, "global_step": 123194, "epoch": 1018} {"train_loss": -33.22027587890625, "global_step": 123195, "epoch": 1018} {"train_loss": -35.136226654052734, "global_step": 123196, "epoch": 1018} {"train_loss": -33.41286087036133, "global_step": 123197, "epoch": 1018} {"train_loss": -35.84711456298828, "global_step": 123198, "epoch": 1018} {"train_loss": -33.349117279052734, "global_step": 123199, "epoch": 1018} {"train_loss": -36.055843353271484, "global_step": 123200, "epoch": 1018} {"train_loss": -35.040775299072266, "global_step": 123201, "epoch": 1018} {"train_loss": -33.15516662597656, "global_step": 123202, "epoch": 1018} {"train_loss": -37.03855895996094, "global_step": 123203, "epoch": 1018} {"train_loss": -32.30643081665039, "global_step": 123204, "epoch": 1018} {"train_loss": -36.52449035644531, "global_step": 123205, "epoch": 1018} {"train_loss": -36.473602294921875, "global_step": 123206, "epoch": 1018} {"train_loss": -36.71263122558594, "global_step": 123207, "epoch": 1018} {"train_loss": -36.36787033081055, "global_step": 123208, "epoch": 1018} {"train_loss": -36.802486419677734, "global_step": 123209, "epoch": 1018} {"train_loss": -36.95893859863281, "global_step": 123210, "epoch": 1018} {"train_loss": -36.63261032104492, "global_step": 123211, "epoch": 1018} {"train_loss": -37.09696578979492, "global_step": 123212, "epoch": 1018} {"train_loss": -37.883052825927734, "global_step": 123213, "epoch": 1018} {"train_loss": -37.282196044921875, "global_step": 123214, "epoch": 1018} {"train_loss": -37.28341293334961, "global_step": 123215, "epoch": 1018} {"train_loss": -38.003028869628906, "global_step": 123216, "epoch": 1018} {"train_loss": -38.054840087890625, "global_step": 123217, "epoch": 1018} {"train_loss": -38.10601806640625, "global_step": 123218, "epoch": 1018} {"train_loss": -37.86699295043945, "global_step": 123219, "epoch": 1018} {"train_loss": -37.85697555541992, "global_step": 123220, "epoch": 1018} {"train_loss": -38.316551208496094, "global_step": 123221, "epoch": 1018} {"train_loss": -38.386600494384766, "global_step": 123222, "epoch": 1018} {"train_loss": -38.023433685302734, "global_step": 123223, "epoch": 1018} {"train_loss": -38.372249603271484, "global_step": 123224, "epoch": 1018} {"train_loss": -37.955230712890625, "global_step": 123225, "epoch": 1018} {"train_loss": -38.29725646972656, "global_step": 123226, "epoch": 1018} {"train_loss": -38.843807220458984, "global_step": 123227, "epoch": 1018} {"train_loss": -39.1441650390625, "global_step": 123228, "epoch": 1018} {"train_loss": -38.220577239990234, "global_step": 123229, "epoch": 1018} {"train_loss": -38.332916259765625, "global_step": 123230, "epoch": 1018} {"train_loss": -38.571632385253906, "global_step": 123231, "epoch": 1018} {"train_loss": -37.997554779052734, "global_step": 123232, "epoch": 1018} {"train_loss": -38.98566436767578, "global_step": 123233, "epoch": 1018} {"train_loss": -38.52765655517578, "global_step": 123234, "epoch": 1018} {"train_loss": -38.259700775146484, "global_step": 123235, "epoch": 1018} {"train_loss": -38.85489273071289, "global_step": 123236, "epoch": 1018} {"train_loss": -38.94989776611328, "global_step": 123237, "epoch": 1018} {"train_loss": -39.46416091918945, "global_step": 123238, "epoch": 1018} {"train_loss": -39.091949462890625, "global_step": 123239, "epoch": 1018} {"train_loss": -38.789527893066406, "global_step": 123240, "epoch": 1018} {"train_loss": -38.75746536254883, "global_step": 123241, "epoch": 1018} {"train_loss": -39.349666595458984, "global_step": 123242, "epoch": 1018} {"train_loss": -38.87632369995117, "global_step": 123243, "epoch": 1018} {"train_loss": -38.99817657470703, "global_step": 123244, "epoch": 1018} {"train_loss": -38.96992111206055, "global_step": 123245, "epoch": 1018} {"train_loss": -38.81914138793945, "global_step": 123246, "epoch": 1018} {"train_loss": -39.26892852783203, "global_step": 123247, "epoch": 1018} {"train_loss": -39.205299377441406, "global_step": 123248, "epoch": 1018} {"train_loss": -39.17782211303711, "global_step": 123249, "epoch": 1018} {"train_loss": -39.11725997924805, "global_step": 123250, "epoch": 1018} {"train_loss": -39.190040588378906, "global_step": 123251, "epoch": 1018} {"train_loss": -39.14039993286133, "global_step": 123252, "epoch": 1018} {"train_loss": -39.75642013549805, "global_step": 123253, "epoch": 1018} {"train_loss": -38.9579963684082, "global_step": 123254, "epoch": 1018} {"train_loss": -39.47734451293945, "global_step": 123255, "epoch": 1018} {"train_loss": -38.98714065551758, "global_step": 123256, "epoch": 1018} {"train_loss": -39.48816680908203, "global_step": 123257, "epoch": 1018} {"train_loss": -39.022579193115234, "global_step": 123258, "epoch": 1018} {"train_loss": -39.54058837890625, "global_step": 123259, "epoch": 1018} {"train_loss": -39.59012985229492, "global_step": 123260, "epoch": 1018} {"train_loss": -37.78059005737305, "global_step": 123261, "epoch": 1018} {"train_loss": -38.24882125854492, "global_step": 123262, "epoch": 1018} {"train_loss": -39.43635940551758, "global_step": 123263, "epoch": 1018} {"train_loss": -38.62035369873047, "global_step": 123264, "epoch": 1018} {"train_loss": -38.82257843017578, "global_step": 123265, "epoch": 1018} {"train_loss": -39.64622116088867, "global_step": 123266, "epoch": 1018} {"train_loss": -39.574440002441406, "global_step": 123267, "epoch": 1018} {"train_loss": -39.7103271484375, "global_step": 123268, "epoch": 1018} {"train_loss": -38.9034309387207, "global_step": 123269, "epoch": 1018} {"train_loss": -38.88692855834961, "global_step": 123270, "epoch": 1018} {"train_loss": -39.97932815551758, "global_step": 123271, "epoch": 1018} {"train_loss": -40.041011810302734, "global_step": 123272, "epoch": 1018} {"train_loss": -39.003028869628906, "global_step": 123273, "epoch": 1018} {"train_loss": -39.64667892456055, "global_step": 123274, "epoch": 1018} {"train_loss": -39.68309020996094, "global_step": 123275, "epoch": 1018} {"train_loss": -40.063045501708984, "global_step": 123276, "epoch": 1018} {"train_loss": -40.05762481689453, "global_step": 123277, "epoch": 1018} {"train_loss": -38.83120346069336, "global_step": 123278, "epoch": 1018} {"train_loss": -38.89335250854492, "global_step": 123279, "epoch": 1018} {"train_loss": -39.44807815551758, "global_step": 123280, "epoch": 1018} {"train_loss": -38.877079010009766, "global_step": 123281, "epoch": 1018} {"train_loss": -37.49544906616211, "global_step": 123282, "epoch": 1018} {"train_loss": -39.20640182495117, "global_step": 123283, "epoch": 1018} {"train_loss": -39.46184158325195, "global_step": 123284, "epoch": 1018} {"train_loss": -38.37485885620117, "global_step": 123285, "epoch": 1018} {"train_loss": -38.997840881347656, "global_step": 123286, "epoch": 1018} {"train_loss": -35.9745979309082, "global_step": 123287, "epoch": 1018} {"train_loss": -32.076961517333984, "global_step": 123288, "epoch": 1018} {"train_loss": -30.20342445373535, "global_step": 123289, "epoch": 1018} {"train_loss": -37.318363189697266, "global_step": 123290, "epoch": 1018} {"train_loss": -37.486671447753906, "global_step": 123291, "epoch": 1018} {"train_loss": -31.856351852416992, "global_step": 123292, "epoch": 1018} {"train_loss": -36.928836822509766, "global_step": 123293, "epoch": 1018} {"train_loss": -37.09183120727539, "global_step": 123294, "epoch": 1018} {"train_loss": -33.72978973388672, "global_step": 123295, "epoch": 1018} {"train_loss": -38.13298034667969, "global_step": 123296, "epoch": 1018} {"train_loss": -34.8151741027832, "global_step": 123297, "epoch": 1018} {"train_loss": -37.00394908652818, "global_step": 123298, "epoch": 1018, "val_loss": 2644825.25} {"train_loss": -36.037662506103516, "global_step": 123299, "epoch": 1019} {"train_loss": -35.84590148925781, "global_step": 123300, "epoch": 1019} {"train_loss": -35.990238189697266, "global_step": 123301, "epoch": 1019} {"train_loss": -37.71994400024414, "global_step": 123302, "epoch": 1019} {"train_loss": -36.65923309326172, "global_step": 123303, "epoch": 1019} {"train_loss": -37.38870620727539, "global_step": 123304, "epoch": 1019} {"train_loss": -37.84885787963867, "global_step": 123305, "epoch": 1019} {"train_loss": -35.11356735229492, "global_step": 123306, "epoch": 1019} {"train_loss": -37.919769287109375, "global_step": 123307, "epoch": 1019} {"train_loss": -37.72590255737305, "global_step": 123308, "epoch": 1019} {"train_loss": -37.405372619628906, "global_step": 123309, "epoch": 1019} {"train_loss": -37.86640548706055, "global_step": 123310, "epoch": 1019} {"train_loss": -37.64670181274414, "global_step": 123311, "epoch": 1019} {"train_loss": -38.326969146728516, "global_step": 123312, "epoch": 1019} {"train_loss": -37.7052116394043, "global_step": 123313, "epoch": 1019} {"train_loss": -38.22637939453125, "global_step": 123314, "epoch": 1019} {"train_loss": -37.757171630859375, "global_step": 123315, "epoch": 1019} {"train_loss": -37.907196044921875, "global_step": 123316, "epoch": 1019} {"train_loss": -38.711158752441406, "global_step": 123317, "epoch": 1019} {"train_loss": -38.82538986206055, "global_step": 123318, "epoch": 1019} {"train_loss": -38.33634567260742, "global_step": 123319, "epoch": 1019} {"train_loss": -37.711578369140625, "global_step": 123320, "epoch": 1019} {"train_loss": -37.88496780395508, "global_step": 123321, "epoch": 1019} {"train_loss": -37.6865348815918, "global_step": 123322, "epoch": 1019} {"train_loss": -36.57729721069336, "global_step": 123323, "epoch": 1019} {"train_loss": -33.73910140991211, "global_step": 123324, "epoch": 1019} {"train_loss": -34.30572509765625, "global_step": 123325, "epoch": 1019} {"train_loss": -38.445796966552734, "global_step": 123326, "epoch": 1019} {"train_loss": -38.81622314453125, "global_step": 123327, "epoch": 1019} {"train_loss": -35.14509201049805, "global_step": 123328, "epoch": 1019} {"train_loss": -36.711875915527344, "global_step": 123329, "epoch": 1019} {"train_loss": -37.18952560424805, "global_step": 123330, "epoch": 1019} {"train_loss": -36.87470626831055, "global_step": 123331, "epoch": 1019} {"train_loss": -37.22700119018555, "global_step": 123332, "epoch": 1019} {"train_loss": -34.085472106933594, "global_step": 123333, "epoch": 1019} {"train_loss": -36.60825729370117, "global_step": 123334, "epoch": 1019} {"train_loss": -39.00701141357422, "global_step": 123335, "epoch": 1019} {"train_loss": -37.27056121826172, "global_step": 123336, "epoch": 1019} {"train_loss": -37.907135009765625, "global_step": 123337, "epoch": 1019} {"train_loss": -33.92512893676758, "global_step": 123338, "epoch": 1019} {"train_loss": -36.59514617919922, "global_step": 123339, "epoch": 1019} {"train_loss": -35.3174934387207, "global_step": 123340, "epoch": 1019} {"train_loss": -37.130462646484375, "global_step": 123341, "epoch": 1019} {"train_loss": -37.98335266113281, "global_step": 123342, "epoch": 1019} {"train_loss": -38.12047576904297, "global_step": 123343, "epoch": 1019} {"train_loss": -37.1754264831543, "global_step": 123344, "epoch": 1019} {"train_loss": -32.98970413208008, "global_step": 123345, "epoch": 1019} {"train_loss": -37.05137634277344, "global_step": 123346, "epoch": 1019} {"train_loss": -37.019954681396484, "global_step": 123347, "epoch": 1019} {"train_loss": -36.54150390625, "global_step": 123348, "epoch": 1019} {"train_loss": -36.2790641784668, "global_step": 123349, "epoch": 1019} {"train_loss": -35.20074462890625, "global_step": 123350, "epoch": 1019} {"train_loss": -37.61228561401367, "global_step": 123351, "epoch": 1019} {"train_loss": -37.71827697753906, "global_step": 123352, "epoch": 1019} {"train_loss": -36.3338508605957, "global_step": 123353, "epoch": 1019} {"train_loss": -36.3518180847168, "global_step": 123354, "epoch": 1019} {"train_loss": -37.2563591003418, "global_step": 123355, "epoch": 1019} {"train_loss": -38.11178970336914, "global_step": 123356, "epoch": 1019} {"train_loss": -36.90058135986328, "global_step": 123357, "epoch": 1019} {"train_loss": -37.12934112548828, "global_step": 123358, "epoch": 1019} {"train_loss": -37.93303298950195, "global_step": 123359, "epoch": 1019} {"train_loss": -37.51993179321289, "global_step": 123360, "epoch": 1019} {"train_loss": -37.549354553222656, "global_step": 123361, "epoch": 1019} {"train_loss": -38.704158782958984, "global_step": 123362, "epoch": 1019} {"train_loss": -38.40435028076172, "global_step": 123363, "epoch": 1019} {"train_loss": -38.42983627319336, "global_step": 123364, "epoch": 1019} {"train_loss": -38.1096076965332, "global_step": 123365, "epoch": 1019} {"train_loss": -38.24495315551758, "global_step": 123366, "epoch": 1019} {"train_loss": -37.56806182861328, "global_step": 123367, "epoch": 1019} {"train_loss": -38.19453811645508, "global_step": 123368, "epoch": 1019} {"train_loss": -38.144771575927734, "global_step": 123369, "epoch": 1019} {"train_loss": -38.00343704223633, "global_step": 123370, "epoch": 1019} {"train_loss": -38.06464385986328, "global_step": 123371, "epoch": 1019} {"train_loss": -38.520294189453125, "global_step": 123372, "epoch": 1019} {"train_loss": -37.990657806396484, "global_step": 123373, "epoch": 1019} {"train_loss": -38.06004333496094, "global_step": 123374, "epoch": 1019} {"train_loss": -37.73078918457031, "global_step": 123375, "epoch": 1019} {"train_loss": -38.206844329833984, "global_step": 123376, "epoch": 1019} {"train_loss": -38.181129455566406, "global_step": 123377, "epoch": 1019} {"train_loss": -37.13836669921875, "global_step": 123378, "epoch": 1019} {"train_loss": -36.712806701660156, "global_step": 123379, "epoch": 1019} {"train_loss": -36.79252243041992, "global_step": 123380, "epoch": 1019} {"train_loss": -37.785133361816406, "global_step": 123381, "epoch": 1019} {"train_loss": -37.26566696166992, "global_step": 123382, "epoch": 1019} {"train_loss": -37.61965560913086, "global_step": 123383, "epoch": 1019} {"train_loss": -38.621742248535156, "global_step": 123384, "epoch": 1019} {"train_loss": -38.386505126953125, "global_step": 123385, "epoch": 1019} {"train_loss": -38.55375289916992, "global_step": 123386, "epoch": 1019} {"train_loss": -38.887184143066406, "global_step": 123387, "epoch": 1019} {"train_loss": -38.612037658691406, "global_step": 123388, "epoch": 1019} {"train_loss": -38.80820083618164, "global_step": 123389, "epoch": 1019} {"train_loss": -38.334346771240234, "global_step": 123390, "epoch": 1019} {"train_loss": -38.5385627746582, "global_step": 123391, "epoch": 1019} {"train_loss": -39.00977325439453, "global_step": 123392, "epoch": 1019} {"train_loss": -35.95228958129883, "global_step": 123393, "epoch": 1019} {"train_loss": -37.84634017944336, "global_step": 123394, "epoch": 1019} {"train_loss": -37.926963806152344, "global_step": 123395, "epoch": 1019} {"train_loss": -39.038246154785156, "global_step": 123396, "epoch": 1019} {"train_loss": -39.05251693725586, "global_step": 123397, "epoch": 1019} {"train_loss": -38.63642501831055, "global_step": 123398, "epoch": 1019} {"train_loss": -38.682044982910156, "global_step": 123399, "epoch": 1019} {"train_loss": -38.882686614990234, "global_step": 123400, "epoch": 1019} {"train_loss": -37.57255172729492, "global_step": 123401, "epoch": 1019} {"train_loss": -38.021034240722656, "global_step": 123402, "epoch": 1019} {"train_loss": -38.81231689453125, "global_step": 123403, "epoch": 1019} {"train_loss": -39.280269622802734, "global_step": 123404, "epoch": 1019} {"train_loss": -38.136505126953125, "global_step": 123405, "epoch": 1019} {"train_loss": -38.81745529174805, "global_step": 123406, "epoch": 1019} {"train_loss": -38.27385711669922, "global_step": 123407, "epoch": 1019} {"train_loss": -39.0030517578125, "global_step": 123408, "epoch": 1019} {"train_loss": -38.39612579345703, "global_step": 123409, "epoch": 1019} {"train_loss": -39.25782012939453, "global_step": 123410, "epoch": 1019} {"train_loss": -39.10902786254883, "global_step": 123411, "epoch": 1019} {"train_loss": -38.522804260253906, "global_step": 123412, "epoch": 1019} {"train_loss": -38.622249603271484, "global_step": 123413, "epoch": 1019} {"train_loss": -39.245243072509766, "global_step": 123414, "epoch": 1019} {"train_loss": -39.330448150634766, "global_step": 123415, "epoch": 1019} {"train_loss": -38.91355514526367, "global_step": 123416, "epoch": 1019} {"train_loss": -39.00571823120117, "global_step": 123417, "epoch": 1019} {"train_loss": -38.794857025146484, "global_step": 123418, "epoch": 1019} {"train_loss": -37.650830828453884, "global_step": 123419, "epoch": 1019, "val_loss": 2650098.0} {"train_loss": -39.50551986694336, "global_step": 123420, "epoch": 1020} {"train_loss": -37.83625411987305, "global_step": 123421, "epoch": 1020} {"train_loss": -38.72584915161133, "global_step": 123422, "epoch": 1020} {"train_loss": -39.49333953857422, "global_step": 123423, "epoch": 1020} {"train_loss": -39.83901596069336, "global_step": 123424, "epoch": 1020} {"train_loss": -39.560420989990234, "global_step": 123425, "epoch": 1020} {"train_loss": -38.639892578125, "global_step": 123426, "epoch": 1020} {"train_loss": -39.22871017456055, "global_step": 123427, "epoch": 1020} {"train_loss": -39.704193115234375, "global_step": 123428, "epoch": 1020} {"train_loss": -39.627986907958984, "global_step": 123429, "epoch": 1020} {"train_loss": -36.66230392456055, "global_step": 123430, "epoch": 1020} {"train_loss": -39.26466369628906, "global_step": 123431, "epoch": 1020} {"train_loss": -38.47652816772461, "global_step": 123432, "epoch": 1020} {"train_loss": -39.04196548461914, "global_step": 123433, "epoch": 1020} {"train_loss": -38.03293991088867, "global_step": 123434, "epoch": 1020} {"train_loss": -39.07304000854492, "global_step": 123435, "epoch": 1020} {"train_loss": -38.46492385864258, "global_step": 123436, "epoch": 1020} {"train_loss": -39.460819244384766, "global_step": 123437, "epoch": 1020} {"train_loss": -39.3551025390625, "global_step": 123438, "epoch": 1020} {"train_loss": -39.6738166809082, "global_step": 123439, "epoch": 1020} {"train_loss": -39.36002731323242, "global_step": 123440, "epoch": 1020} {"train_loss": -39.27458572387695, "global_step": 123441, "epoch": 1020} {"train_loss": -39.408504486083984, "global_step": 123442, "epoch": 1020} {"train_loss": -38.891109466552734, "global_step": 123443, "epoch": 1020} {"train_loss": -37.59507369995117, "global_step": 123444, "epoch": 1020} {"train_loss": -38.408912658691406, "global_step": 123445, "epoch": 1020} {"train_loss": -37.435577392578125, "global_step": 123446, "epoch": 1020} {"train_loss": -37.76041793823242, "global_step": 123447, "epoch": 1020} {"train_loss": -36.841739654541016, "global_step": 123448, "epoch": 1020} {"train_loss": -36.01084899902344, "global_step": 123449, "epoch": 1020} {"train_loss": -37.623382568359375, "global_step": 123450, "epoch": 1020} {"train_loss": -38.18384552001953, "global_step": 123451, "epoch": 1020} {"train_loss": -39.00454330444336, "global_step": 123452, "epoch": 1020} {"train_loss": -38.99046325683594, "global_step": 123453, "epoch": 1020} {"train_loss": -38.47224807739258, "global_step": 123454, "epoch": 1020} {"train_loss": -38.66311264038086, "global_step": 123455, "epoch": 1020} {"train_loss": -38.90127182006836, "global_step": 123456, "epoch": 1020} {"train_loss": -37.86012649536133, "global_step": 123457, "epoch": 1020} {"train_loss": -37.281982421875, "global_step": 123458, "epoch": 1020} {"train_loss": -36.9422721862793, "global_step": 123459, "epoch": 1020} {"train_loss": -39.55741500854492, "global_step": 123460, "epoch": 1020} {"train_loss": -38.212242126464844, "global_step": 123461, "epoch": 1020} {"train_loss": -37.34328842163086, "global_step": 123462, "epoch": 1020} {"train_loss": -38.06802749633789, "global_step": 123463, "epoch": 1020} {"train_loss": -37.7632942199707, "global_step": 123464, "epoch": 1020} {"train_loss": -38.22648239135742, "global_step": 123465, "epoch": 1020} {"train_loss": -37.53670883178711, "global_step": 123466, "epoch": 1020} {"train_loss": -38.51953887939453, "global_step": 123467, "epoch": 1020} {"train_loss": -38.61558151245117, "global_step": 123468, "epoch": 1020} {"train_loss": -37.63250732421875, "global_step": 123469, "epoch": 1020} {"train_loss": -38.28971481323242, "global_step": 123470, "epoch": 1020} {"train_loss": -37.55936813354492, "global_step": 123471, "epoch": 1020} {"train_loss": -37.643775939941406, "global_step": 123472, "epoch": 1020} {"train_loss": -38.970245361328125, "global_step": 123473, "epoch": 1020} {"train_loss": -37.0635986328125, "global_step": 123474, "epoch": 1020} {"train_loss": -36.55159378051758, "global_step": 123475, "epoch": 1020} {"train_loss": -39.503841400146484, "global_step": 123476, "epoch": 1020} {"train_loss": -37.408504486083984, "global_step": 123477, "epoch": 1020} {"train_loss": -37.02616500854492, "global_step": 123478, "epoch": 1020} {"train_loss": -38.88851547241211, "global_step": 123479, "epoch": 1020} {"train_loss": -36.88173294067383, "global_step": 123480, "epoch": 1020} {"train_loss": -38.92913818359375, "global_step": 123481, "epoch": 1020} {"train_loss": -38.09306335449219, "global_step": 123482, "epoch": 1020} {"train_loss": -37.787803649902344, "global_step": 123483, "epoch": 1020} {"train_loss": -38.91457748413086, "global_step": 123484, "epoch": 1020} {"train_loss": -38.32583236694336, "global_step": 123485, "epoch": 1020} {"train_loss": -39.28432846069336, "global_step": 123486, "epoch": 1020} {"train_loss": -38.41773223876953, "global_step": 123487, "epoch": 1020} {"train_loss": -39.029151916503906, "global_step": 123488, "epoch": 1020} {"train_loss": -38.9075813293457, "global_step": 123489, "epoch": 1020} {"train_loss": -39.03343200683594, "global_step": 123490, "epoch": 1020} {"train_loss": -39.09678268432617, "global_step": 123491, "epoch": 1020} {"train_loss": -39.130096435546875, "global_step": 123492, "epoch": 1020} {"train_loss": -37.76930618286133, "global_step": 123493, "epoch": 1020} {"train_loss": -38.62590408325195, "global_step": 123494, "epoch": 1020} {"train_loss": -39.46297073364258, "global_step": 123495, "epoch": 1020} {"train_loss": -39.26702880859375, "global_step": 123496, "epoch": 1020} {"train_loss": -39.333805084228516, "global_step": 123497, "epoch": 1020} {"train_loss": -39.256927490234375, "global_step": 123498, "epoch": 1020} {"train_loss": -39.60044479370117, "global_step": 123499, "epoch": 1020} {"train_loss": -38.90610885620117, "global_step": 123500, "epoch": 1020} {"train_loss": -38.6565055847168, "global_step": 123501, "epoch": 1020} {"train_loss": -38.82007598876953, "global_step": 123502, "epoch": 1020} {"train_loss": -39.5357551574707, "global_step": 123503, "epoch": 1020} {"train_loss": -39.44610595703125, "global_step": 123504, "epoch": 1020} {"train_loss": -39.35297393798828, "global_step": 123505, "epoch": 1020} {"train_loss": -39.23882293701172, "global_step": 123506, "epoch": 1020} {"train_loss": -38.83942413330078, "global_step": 123507, "epoch": 1020} {"train_loss": -39.51702880859375, "global_step": 123508, "epoch": 1020} {"train_loss": -39.67745590209961, "global_step": 123509, "epoch": 1020} {"train_loss": -39.95732116699219, "global_step": 123510, "epoch": 1020} {"train_loss": -38.74338912963867, "global_step": 123511, "epoch": 1020} {"train_loss": -39.26930236816406, "global_step": 123512, "epoch": 1020} {"train_loss": -39.458251953125, "global_step": 123513, "epoch": 1020} {"train_loss": -39.327919006347656, "global_step": 123514, "epoch": 1020} {"train_loss": -38.97584915161133, "global_step": 123515, "epoch": 1020} {"train_loss": -38.77164840698242, "global_step": 123516, "epoch": 1020} {"train_loss": -39.40740966796875, "global_step": 123517, "epoch": 1020} {"train_loss": -39.53672790527344, "global_step": 123518, "epoch": 1020} {"train_loss": -39.155147552490234, "global_step": 123519, "epoch": 1020} {"train_loss": -39.36082077026367, "global_step": 123520, "epoch": 1020} {"train_loss": -39.85480880737305, "global_step": 123521, "epoch": 1020} {"train_loss": -39.423648834228516, "global_step": 123522, "epoch": 1020} {"train_loss": -39.315425872802734, "global_step": 123523, "epoch": 1020} {"train_loss": -39.72665023803711, "global_step": 123524, "epoch": 1020} {"train_loss": -39.93202590942383, "global_step": 123525, "epoch": 1020} {"train_loss": -39.85390090942383, "global_step": 123526, "epoch": 1020} {"train_loss": -39.431358337402344, "global_step": 123527, "epoch": 1020} {"train_loss": -39.41505813598633, "global_step": 123528, "epoch": 1020} {"train_loss": -38.34644317626953, "global_step": 123529, "epoch": 1020} {"train_loss": -39.749542236328125, "global_step": 123530, "epoch": 1020} {"train_loss": -39.262550354003906, "global_step": 123531, "epoch": 1020} {"train_loss": -39.033348083496094, "global_step": 123532, "epoch": 1020} {"train_loss": -38.53713607788086, "global_step": 123533, "epoch": 1020} {"train_loss": -37.99384307861328, "global_step": 123534, "epoch": 1020} {"train_loss": -39.850746154785156, "global_step": 123535, "epoch": 1020} {"train_loss": -38.26824188232422, "global_step": 123536, "epoch": 1020} {"train_loss": -38.34304428100586, "global_step": 123537, "epoch": 1020} {"train_loss": -37.566646575927734, "global_step": 123538, "epoch": 1020} {"train_loss": -38.56399917602539, "global_step": 123539, "epoch": 1020} {"train_loss": -38.711676637003244, "global_step": 123540, "epoch": 1020, "val_loss": 2689631.75} {"train_loss": -38.734195709228516, "global_step": 123541, "epoch": 1021} {"train_loss": -39.04063415527344, "global_step": 123542, "epoch": 1021} {"train_loss": -39.06193923950195, "global_step": 123543, "epoch": 1021} {"train_loss": -37.92908477783203, "global_step": 123544, "epoch": 1021} {"train_loss": -39.116493225097656, "global_step": 123545, "epoch": 1021} {"train_loss": -39.327083587646484, "global_step": 123546, "epoch": 1021} {"train_loss": -38.720855712890625, "global_step": 123547, "epoch": 1021} {"train_loss": -38.6731071472168, "global_step": 123548, "epoch": 1021} {"train_loss": -37.91062545776367, "global_step": 123549, "epoch": 1021} {"train_loss": -37.305728912353516, "global_step": 123550, "epoch": 1021} {"train_loss": -39.36463928222656, "global_step": 123551, "epoch": 1021} {"train_loss": -38.44758224487305, "global_step": 123552, "epoch": 1021} {"train_loss": -39.043617248535156, "global_step": 123553, "epoch": 1021} {"train_loss": -38.66633987426758, "global_step": 123554, "epoch": 1021} {"train_loss": -38.92112731933594, "global_step": 123555, "epoch": 1021} {"train_loss": -38.169471740722656, "global_step": 123556, "epoch": 1021} {"train_loss": -38.50714111328125, "global_step": 123557, "epoch": 1021} {"train_loss": -39.0421028137207, "global_step": 123558, "epoch": 1021} {"train_loss": -36.66256332397461, "global_step": 123559, "epoch": 1021} {"train_loss": -39.34623336791992, "global_step": 123560, "epoch": 1021} {"train_loss": -38.88504409790039, "global_step": 123561, "epoch": 1021} {"train_loss": -37.353759765625, "global_step": 123562, "epoch": 1021} {"train_loss": -39.33579635620117, "global_step": 123563, "epoch": 1021} {"train_loss": -38.86330795288086, "global_step": 123564, "epoch": 1021} {"train_loss": -39.45237350463867, "global_step": 123565, "epoch": 1021} {"train_loss": -39.03587341308594, "global_step": 123566, "epoch": 1021} {"train_loss": -38.93903732299805, "global_step": 123567, "epoch": 1021} {"train_loss": -38.93827438354492, "global_step": 123568, "epoch": 1021} {"train_loss": -39.572669982910156, "global_step": 123569, "epoch": 1021} {"train_loss": -39.430660247802734, "global_step": 123570, "epoch": 1021} {"train_loss": -39.3804931640625, "global_step": 123571, "epoch": 1021} {"train_loss": -39.641475677490234, "global_step": 123572, "epoch": 1021} {"train_loss": -39.795860290527344, "global_step": 123573, "epoch": 1021} {"train_loss": -39.00992965698242, "global_step": 123574, "epoch": 1021} {"train_loss": -38.674312591552734, "global_step": 123575, "epoch": 1021} {"train_loss": -38.95781707763672, "global_step": 123576, "epoch": 1021} {"train_loss": -39.5923957824707, "global_step": 123577, "epoch": 1021} {"train_loss": -39.09731674194336, "global_step": 123578, "epoch": 1021} {"train_loss": -38.3057746887207, "global_step": 123579, "epoch": 1021} {"train_loss": -37.99727249145508, "global_step": 123580, "epoch": 1021} {"train_loss": -39.604610443115234, "global_step": 123581, "epoch": 1021} {"train_loss": -38.69582748413086, "global_step": 123582, "epoch": 1021} {"train_loss": -38.85677719116211, "global_step": 123583, "epoch": 1021} {"train_loss": -39.006649017333984, "global_step": 123584, "epoch": 1021} {"train_loss": -38.122859954833984, "global_step": 123585, "epoch": 1021} {"train_loss": -37.16389083862305, "global_step": 123586, "epoch": 1021} {"train_loss": -39.93461227416992, "global_step": 123587, "epoch": 1021} {"train_loss": -36.55894088745117, "global_step": 123588, "epoch": 1021} {"train_loss": -39.11884689331055, "global_step": 123589, "epoch": 1021} {"train_loss": -38.304317474365234, "global_step": 123590, "epoch": 1021} {"train_loss": -38.284420013427734, "global_step": 123591, "epoch": 1021} {"train_loss": -37.42008590698242, "global_step": 123592, "epoch": 1021} {"train_loss": -38.24992752075195, "global_step": 123593, "epoch": 1021} {"train_loss": -39.048030853271484, "global_step": 123594, "epoch": 1021} {"train_loss": -38.76168441772461, "global_step": 123595, "epoch": 1021} {"train_loss": -38.351966857910156, "global_step": 123596, "epoch": 1021} {"train_loss": -39.70501708984375, "global_step": 123597, "epoch": 1021} {"train_loss": -39.40178680419922, "global_step": 123598, "epoch": 1021} {"train_loss": -38.54184341430664, "global_step": 123599, "epoch": 1021} {"train_loss": -38.381629943847656, "global_step": 123600, "epoch": 1021} {"train_loss": -39.65620803833008, "global_step": 123601, "epoch": 1021} {"train_loss": -39.79893112182617, "global_step": 123602, "epoch": 1021} {"train_loss": -38.93640899658203, "global_step": 123603, "epoch": 1021} {"train_loss": -39.40114212036133, "global_step": 123604, "epoch": 1021} {"train_loss": -39.14946365356445, "global_step": 123605, "epoch": 1021} {"train_loss": -39.3050422668457, "global_step": 123606, "epoch": 1021} {"train_loss": -38.781898498535156, "global_step": 123607, "epoch": 1021} {"train_loss": -39.38666915893555, "global_step": 123608, "epoch": 1021} {"train_loss": -39.21684265136719, "global_step": 123609, "epoch": 1021} {"train_loss": -38.55466079711914, "global_step": 123610, "epoch": 1021} {"train_loss": -39.646331787109375, "global_step": 123611, "epoch": 1021} {"train_loss": -39.85221481323242, "global_step": 123612, "epoch": 1021} {"train_loss": -38.57835388183594, "global_step": 123613, "epoch": 1021} {"train_loss": -39.3150634765625, "global_step": 123614, "epoch": 1021} {"train_loss": -37.724239349365234, "global_step": 123615, "epoch": 1021} {"train_loss": -39.63057327270508, "global_step": 123616, "epoch": 1021} {"train_loss": -38.84750747680664, "global_step": 123617, "epoch": 1021} {"train_loss": -39.989139556884766, "global_step": 123618, "epoch": 1021} {"train_loss": -39.80941390991211, "global_step": 123619, "epoch": 1021} {"train_loss": -39.28445053100586, "global_step": 123620, "epoch": 1021} {"train_loss": -39.88131332397461, "global_step": 123621, "epoch": 1021} {"train_loss": -39.885074615478516, "global_step": 123622, "epoch": 1021} {"train_loss": -37.89411926269531, "global_step": 123623, "epoch": 1021} {"train_loss": -39.23517608642578, "global_step": 123624, "epoch": 1021} {"train_loss": -39.3946533203125, "global_step": 123625, "epoch": 1021} {"train_loss": -38.01456832885742, "global_step": 123626, "epoch": 1021} {"train_loss": -39.40214920043945, "global_step": 123627, "epoch": 1021} {"train_loss": -38.4632568359375, "global_step": 123628, "epoch": 1021} {"train_loss": -39.986785888671875, "global_step": 123629, "epoch": 1021} {"train_loss": -39.70501708984375, "global_step": 123630, "epoch": 1021} {"train_loss": -39.50728988647461, "global_step": 123631, "epoch": 1021} {"train_loss": -38.75216293334961, "global_step": 123632, "epoch": 1021} {"train_loss": -40.0063362121582, "global_step": 123633, "epoch": 1021} {"train_loss": -39.30744934082031, "global_step": 123634, "epoch": 1021} {"train_loss": -39.987205505371094, "global_step": 123635, "epoch": 1021} {"train_loss": -39.522911071777344, "global_step": 123636, "epoch": 1021} {"train_loss": -38.540443420410156, "global_step": 123637, "epoch": 1021} {"train_loss": -40.383663177490234, "global_step": 123638, "epoch": 1021} {"train_loss": -39.390052795410156, "global_step": 123639, "epoch": 1021} {"train_loss": -38.77357864379883, "global_step": 123640, "epoch": 1021} {"train_loss": -38.2879638671875, "global_step": 123641, "epoch": 1021} {"train_loss": -38.511878967285156, "global_step": 123642, "epoch": 1021} {"train_loss": -39.71745300292969, "global_step": 123643, "epoch": 1021} {"train_loss": -39.68915939331055, "global_step": 123644, "epoch": 1021} {"train_loss": -40.089813232421875, "global_step": 123645, "epoch": 1021} {"train_loss": -38.838924407958984, "global_step": 123646, "epoch": 1021} {"train_loss": -39.11567306518555, "global_step": 123647, "epoch": 1021} {"train_loss": -39.369075775146484, "global_step": 123648, "epoch": 1021} {"train_loss": -40.372520446777344, "global_step": 123649, "epoch": 1021} {"train_loss": -40.358760833740234, "global_step": 123650, "epoch": 1021} {"train_loss": -40.28412628173828, "global_step": 123651, "epoch": 1021} {"train_loss": -39.730037689208984, "global_step": 123652, "epoch": 1021} {"train_loss": -40.24936294555664, "global_step": 123653, "epoch": 1021} {"train_loss": -39.87308883666992, "global_step": 123654, "epoch": 1021} {"train_loss": -40.016780853271484, "global_step": 123655, "epoch": 1021} {"train_loss": -40.20377731323242, "global_step": 123656, "epoch": 1021} {"train_loss": -40.122833251953125, "global_step": 123657, "epoch": 1021} {"train_loss": -38.36763381958008, "global_step": 123658, "epoch": 1021} {"train_loss": -32.385955810546875, "global_step": 123659, "epoch": 1021} {"train_loss": -18.179611206054688, "global_step": 123660, "epoch": 1021} {"train_loss": -38.55593438976067, "global_step": 123661, "epoch": 1021, "val_loss": 2680514.25} {"train_loss": -2.635631799697876, "global_step": 123662, "epoch": 1022} {"train_loss": -30.797321319580078, "global_step": 123663, "epoch": 1022} {"train_loss": -25.861801147460938, "global_step": 123664, "epoch": 1022} {"train_loss": -29.1922664642334, "global_step": 123665, "epoch": 1022} {"train_loss": -30.800445556640625, "global_step": 123666, "epoch": 1022} {"train_loss": -34.69730758666992, "global_step": 123667, "epoch": 1022} {"train_loss": -30.36578369140625, "global_step": 123668, "epoch": 1022} {"train_loss": -37.0423698425293, "global_step": 123669, "epoch": 1022} {"train_loss": -33.271907806396484, "global_step": 123670, "epoch": 1022} {"train_loss": -36.53167724609375, "global_step": 123671, "epoch": 1022} {"train_loss": -36.927101135253906, "global_step": 123672, "epoch": 1022} {"train_loss": -35.209503173828125, "global_step": 123673, "epoch": 1022} {"train_loss": -36.450439453125, "global_step": 123674, "epoch": 1022} {"train_loss": -37.85060501098633, "global_step": 123675, "epoch": 1022} {"train_loss": -34.7176628112793, "global_step": 123676, "epoch": 1022} {"train_loss": -37.38706588745117, "global_step": 123677, "epoch": 1022} {"train_loss": -37.796573638916016, "global_step": 123678, "epoch": 1022} {"train_loss": -35.872432708740234, "global_step": 123679, "epoch": 1022} {"train_loss": -36.13277053833008, "global_step": 123680, "epoch": 1022} {"train_loss": -38.10020065307617, "global_step": 123681, "epoch": 1022} {"train_loss": -37.46232223510742, "global_step": 123682, "epoch": 1022} {"train_loss": -36.58647918701172, "global_step": 123683, "epoch": 1022} {"train_loss": -37.57841873168945, "global_step": 123684, "epoch": 1022} {"train_loss": -37.69964599609375, "global_step": 123685, "epoch": 1022} {"train_loss": -37.667335510253906, "global_step": 123686, "epoch": 1022} {"train_loss": -37.163421630859375, "global_step": 123687, "epoch": 1022} {"train_loss": -38.207054138183594, "global_step": 123688, "epoch": 1022} {"train_loss": -38.57676696777344, "global_step": 123689, "epoch": 1022} {"train_loss": -38.45289993286133, "global_step": 123690, "epoch": 1022} {"train_loss": -37.73931884765625, "global_step": 123691, "epoch": 1022} {"train_loss": -38.479896545410156, "global_step": 123692, "epoch": 1022} {"train_loss": -38.5042610168457, "global_step": 123693, "epoch": 1022} {"train_loss": -38.74427032470703, "global_step": 123694, "epoch": 1022} {"train_loss": -38.50398635864258, "global_step": 123695, "epoch": 1022} {"train_loss": -38.63743209838867, "global_step": 123696, "epoch": 1022} {"train_loss": -38.31403350830078, "global_step": 123697, "epoch": 1022} {"train_loss": -39.0078125, "global_step": 123698, "epoch": 1022} {"train_loss": -38.5721549987793, "global_step": 123699, "epoch": 1022} {"train_loss": -38.99141311645508, "global_step": 123700, "epoch": 1022} {"train_loss": -38.918731689453125, "global_step": 123701, "epoch": 1022} {"train_loss": -39.23697280883789, "global_step": 123702, "epoch": 1022} {"train_loss": -39.01320266723633, "global_step": 123703, "epoch": 1022} {"train_loss": -39.40732192993164, "global_step": 123704, "epoch": 1022} {"train_loss": -38.926326751708984, "global_step": 123705, "epoch": 1022} {"train_loss": -39.29037094116211, "global_step": 123706, "epoch": 1022} {"train_loss": -38.87101364135742, "global_step": 123707, "epoch": 1022} {"train_loss": -39.15949630737305, "global_step": 123708, "epoch": 1022} {"train_loss": -39.41740036010742, "global_step": 123709, "epoch": 1022} {"train_loss": -39.247314453125, "global_step": 123710, "epoch": 1022} {"train_loss": -39.4348030090332, "global_step": 123711, "epoch": 1022} {"train_loss": -39.552242279052734, "global_step": 123712, "epoch": 1022} {"train_loss": -39.81304931640625, "global_step": 123713, "epoch": 1022} {"train_loss": -39.27359390258789, "global_step": 123714, "epoch": 1022} {"train_loss": -39.60470962524414, "global_step": 123715, "epoch": 1022} {"train_loss": -39.236663818359375, "global_step": 123716, "epoch": 1022} {"train_loss": -39.77695846557617, "global_step": 123717, "epoch": 1022} {"train_loss": -39.65015411376953, "global_step": 123718, "epoch": 1022} {"train_loss": -39.30973434448242, "global_step": 123719, "epoch": 1022} {"train_loss": -39.402488708496094, "global_step": 123720, "epoch": 1022} {"train_loss": -39.5881462097168, "global_step": 123721, "epoch": 1022} {"train_loss": -39.6802978515625, "global_step": 123722, "epoch": 1022} {"train_loss": -39.70848083496094, "global_step": 123723, "epoch": 1022} {"train_loss": -39.932960510253906, "global_step": 123724, "epoch": 1022} {"train_loss": -39.58211898803711, "global_step": 123725, "epoch": 1022} {"train_loss": -39.57882308959961, "global_step": 123726, "epoch": 1022} {"train_loss": -39.76902389526367, "global_step": 123727, "epoch": 1022} {"train_loss": -39.411956787109375, "global_step": 123728, "epoch": 1022} {"train_loss": -39.60317611694336, "global_step": 123729, "epoch": 1022} {"train_loss": -39.893218994140625, "global_step": 123730, "epoch": 1022} {"train_loss": -40.07011032104492, "global_step": 123731, "epoch": 1022} {"train_loss": -39.86481857299805, "global_step": 123732, "epoch": 1022} {"train_loss": -39.70579147338867, "global_step": 123733, "epoch": 1022} {"train_loss": -40.26959228515625, "global_step": 123734, "epoch": 1022} {"train_loss": -39.6902961730957, "global_step": 123735, "epoch": 1022} {"train_loss": -39.937530517578125, "global_step": 123736, "epoch": 1022} {"train_loss": -40.005889892578125, "global_step": 123737, "epoch": 1022} {"train_loss": -40.17266845703125, "global_step": 123738, "epoch": 1022} {"train_loss": -40.0734977722168, "global_step": 123739, "epoch": 1022} {"train_loss": -40.11818313598633, "global_step": 123740, "epoch": 1022} {"train_loss": -40.21082305908203, "global_step": 123741, "epoch": 1022} {"train_loss": -40.05784225463867, "global_step": 123742, "epoch": 1022} {"train_loss": -40.51243209838867, "global_step": 123743, "epoch": 1022} {"train_loss": -40.06304168701172, "global_step": 123744, "epoch": 1022} {"train_loss": -40.4871940612793, "global_step": 123745, "epoch": 1022} {"train_loss": -39.687007904052734, "global_step": 123746, "epoch": 1022} {"train_loss": -39.92177963256836, "global_step": 123747, "epoch": 1022} {"train_loss": -40.0455436706543, "global_step": 123748, "epoch": 1022} {"train_loss": -39.01619338989258, "global_step": 123749, "epoch": 1022} {"train_loss": -39.132102966308594, "global_step": 123750, "epoch": 1022} {"train_loss": -38.972267150878906, "global_step": 123751, "epoch": 1022} {"train_loss": -36.87343215942383, "global_step": 123752, "epoch": 1022} {"train_loss": -35.882171630859375, "global_step": 123753, "epoch": 1022} {"train_loss": -35.63325119018555, "global_step": 123754, "epoch": 1022} {"train_loss": -36.86531448364258, "global_step": 123755, "epoch": 1022} {"train_loss": -39.73884963989258, "global_step": 123756, "epoch": 1022} {"train_loss": -36.35573196411133, "global_step": 123757, "epoch": 1022} {"train_loss": -32.62644577026367, "global_step": 123758, "epoch": 1022} {"train_loss": -32.97372055053711, "global_step": 123759, "epoch": 1022} {"train_loss": -37.78413009643555, "global_step": 123760, "epoch": 1022} {"train_loss": -36.43207931518555, "global_step": 123761, "epoch": 1022} {"train_loss": -30.29154396057129, "global_step": 123762, "epoch": 1022} {"train_loss": -29.683807373046875, "global_step": 123763, "epoch": 1022} {"train_loss": -37.55181884765625, "global_step": 123764, "epoch": 1022} {"train_loss": -34.7736930847168, "global_step": 123765, "epoch": 1022} {"train_loss": -33.95390319824219, "global_step": 123766, "epoch": 1022} {"train_loss": -37.265438079833984, "global_step": 123767, "epoch": 1022} {"train_loss": -37.91466522216797, "global_step": 123768, "epoch": 1022} {"train_loss": -36.91017150878906, "global_step": 123769, "epoch": 1022} {"train_loss": -36.757877349853516, "global_step": 123770, "epoch": 1022} {"train_loss": -37.67338180541992, "global_step": 123771, "epoch": 1022} {"train_loss": -36.17757034301758, "global_step": 123772, "epoch": 1022} {"train_loss": -37.80641174316406, "global_step": 123773, "epoch": 1022} {"train_loss": -37.49557876586914, "global_step": 123774, "epoch": 1022} {"train_loss": -37.795867919921875, "global_step": 123775, "epoch": 1022} {"train_loss": -37.11090850830078, "global_step": 123776, "epoch": 1022} {"train_loss": -36.85955810546875, "global_step": 123777, "epoch": 1022} {"train_loss": -38.20648956298828, "global_step": 123778, "epoch": 1022} {"train_loss": -37.65922927856445, "global_step": 123779, "epoch": 1022} {"train_loss": -38.11688232421875, "global_step": 123780, "epoch": 1022} {"train_loss": -37.83455276489258, "global_step": 123781, "epoch": 1022} {"train_loss": -37.44638591364396, "global_step": 123782, "epoch": 1022, "val_loss": 2676474.75} {"train_loss": -38.17090606689453, "global_step": 123783, "epoch": 1023} {"train_loss": -38.25605773925781, "global_step": 123784, "epoch": 1023} {"train_loss": -37.861358642578125, "global_step": 123785, "epoch": 1023} {"train_loss": -38.766048431396484, "global_step": 123786, "epoch": 1023} {"train_loss": -38.56166458129883, "global_step": 123787, "epoch": 1023} {"train_loss": -38.48820114135742, "global_step": 123788, "epoch": 1023} {"train_loss": -38.47780990600586, "global_step": 123789, "epoch": 1023} {"train_loss": -38.75089645385742, "global_step": 123790, "epoch": 1023} {"train_loss": -37.920745849609375, "global_step": 123791, "epoch": 1023} {"train_loss": -38.82957458496094, "global_step": 123792, "epoch": 1023} {"train_loss": -38.70983123779297, "global_step": 123793, "epoch": 1023} {"train_loss": -38.74971389770508, "global_step": 123794, "epoch": 1023} {"train_loss": -38.43368911743164, "global_step": 123795, "epoch": 1023} {"train_loss": -38.66162872314453, "global_step": 123796, "epoch": 1023} {"train_loss": -38.355098724365234, "global_step": 123797, "epoch": 1023} {"train_loss": -39.143009185791016, "global_step": 123798, "epoch": 1023} {"train_loss": -38.9119987487793, "global_step": 123799, "epoch": 1023} {"train_loss": -39.49431228637695, "global_step": 123800, "epoch": 1023} {"train_loss": -38.779541015625, "global_step": 123801, "epoch": 1023} {"train_loss": -39.08415603637695, "global_step": 123802, "epoch": 1023} {"train_loss": -39.4056510925293, "global_step": 123803, "epoch": 1023} {"train_loss": -39.22748947143555, "global_step": 123804, "epoch": 1023} {"train_loss": -39.342655181884766, "global_step": 123805, "epoch": 1023} {"train_loss": -39.6044921875, "global_step": 123806, "epoch": 1023} {"train_loss": -38.78286361694336, "global_step": 123807, "epoch": 1023} {"train_loss": -39.49628448486328, "global_step": 123808, "epoch": 1023} {"train_loss": -39.57135772705078, "global_step": 123809, "epoch": 1023} {"train_loss": -39.33604049682617, "global_step": 123810, "epoch": 1023} {"train_loss": -39.31301498413086, "global_step": 123811, "epoch": 1023} {"train_loss": -38.99420928955078, "global_step": 123812, "epoch": 1023} {"train_loss": -39.560447692871094, "global_step": 123813, "epoch": 1023} {"train_loss": -39.93370056152344, "global_step": 123814, "epoch": 1023} {"train_loss": -39.66669845581055, "global_step": 123815, "epoch": 1023} {"train_loss": -39.8620491027832, "global_step": 123816, "epoch": 1023} {"train_loss": -39.69240951538086, "global_step": 123817, "epoch": 1023} {"train_loss": -39.809532165527344, "global_step": 123818, "epoch": 1023} {"train_loss": -39.634029388427734, "global_step": 123819, "epoch": 1023} {"train_loss": -40.037532806396484, "global_step": 123820, "epoch": 1023} {"train_loss": -39.93784713745117, "global_step": 123821, "epoch": 1023} {"train_loss": -40.28096389770508, "global_step": 123822, "epoch": 1023} {"train_loss": -39.902400970458984, "global_step": 123823, "epoch": 1023} {"train_loss": -40.01243209838867, "global_step": 123824, "epoch": 1023} {"train_loss": -40.12137222290039, "global_step": 123825, "epoch": 1023} {"train_loss": -39.72913360595703, "global_step": 123826, "epoch": 1023} {"train_loss": -40.004207611083984, "global_step": 123827, "epoch": 1023} {"train_loss": -40.1565055847168, "global_step": 123828, "epoch": 1023} {"train_loss": -40.0248908996582, "global_step": 123829, "epoch": 1023} {"train_loss": -38.976905822753906, "global_step": 123830, "epoch": 1023} {"train_loss": -39.62876510620117, "global_step": 123831, "epoch": 1023} {"train_loss": -40.18402099609375, "global_step": 123832, "epoch": 1023} {"train_loss": -39.946258544921875, "global_step": 123833, "epoch": 1023} {"train_loss": -39.829002380371094, "global_step": 123834, "epoch": 1023} {"train_loss": -39.879791259765625, "global_step": 123835, "epoch": 1023} {"train_loss": -39.91324996948242, "global_step": 123836, "epoch": 1023} {"train_loss": -39.73176193237305, "global_step": 123837, "epoch": 1023} {"train_loss": -39.94236755371094, "global_step": 123838, "epoch": 1023} {"train_loss": -39.88689422607422, "global_step": 123839, "epoch": 1023} {"train_loss": -39.03251266479492, "global_step": 123840, "epoch": 1023} {"train_loss": -39.60781478881836, "global_step": 123841, "epoch": 1023} {"train_loss": -40.312957763671875, "global_step": 123842, "epoch": 1023} {"train_loss": -40.129608154296875, "global_step": 123843, "epoch": 1023} {"train_loss": -39.18831253051758, "global_step": 123844, "epoch": 1023} {"train_loss": -39.827266693115234, "global_step": 123845, "epoch": 1023} {"train_loss": -39.38882064819336, "global_step": 123846, "epoch": 1023} {"train_loss": -38.9273796081543, "global_step": 123847, "epoch": 1023} {"train_loss": -38.700233459472656, "global_step": 123848, "epoch": 1023} {"train_loss": -39.721397399902344, "global_step": 123849, "epoch": 1023} {"train_loss": -38.894290924072266, "global_step": 123850, "epoch": 1023} {"train_loss": -37.4506950378418, "global_step": 123851, "epoch": 1023} {"train_loss": -39.31148910522461, "global_step": 123852, "epoch": 1023} {"train_loss": -39.53007125854492, "global_step": 123853, "epoch": 1023} {"train_loss": -36.420440673828125, "global_step": 123854, "epoch": 1023} {"train_loss": -37.98176956176758, "global_step": 123855, "epoch": 1023} {"train_loss": -38.75304412841797, "global_step": 123856, "epoch": 1023} {"train_loss": -36.1881103515625, "global_step": 123857, "epoch": 1023} {"train_loss": -38.14636993408203, "global_step": 123858, "epoch": 1023} {"train_loss": -38.89156723022461, "global_step": 123859, "epoch": 1023} {"train_loss": -38.750484466552734, "global_step": 123860, "epoch": 1023} {"train_loss": -39.600189208984375, "global_step": 123861, "epoch": 1023} {"train_loss": -38.42915344238281, "global_step": 123862, "epoch": 1023} {"train_loss": -36.88539505004883, "global_step": 123863, "epoch": 1023} {"train_loss": -37.46697998046875, "global_step": 123864, "epoch": 1023} {"train_loss": -36.76995849609375, "global_step": 123865, "epoch": 1023} {"train_loss": -38.3585205078125, "global_step": 123866, "epoch": 1023} {"train_loss": -39.24188232421875, "global_step": 123867, "epoch": 1023} {"train_loss": -38.35664749145508, "global_step": 123868, "epoch": 1023} {"train_loss": -37.611305236816406, "global_step": 123869, "epoch": 1023} {"train_loss": -38.3197135925293, "global_step": 123870, "epoch": 1023} {"train_loss": -38.25693893432617, "global_step": 123871, "epoch": 1023} {"train_loss": -36.98381805419922, "global_step": 123872, "epoch": 1023} {"train_loss": -37.9484977722168, "global_step": 123873, "epoch": 1023} {"train_loss": -38.104434967041016, "global_step": 123874, "epoch": 1023} {"train_loss": -37.6725959777832, "global_step": 123875, "epoch": 1023} {"train_loss": -36.34745788574219, "global_step": 123876, "epoch": 1023} {"train_loss": -38.69775390625, "global_step": 123877, "epoch": 1023} {"train_loss": -38.22216796875, "global_step": 123878, "epoch": 1023} {"train_loss": -36.683380126953125, "global_step": 123879, "epoch": 1023} {"train_loss": -38.13447952270508, "global_step": 123880, "epoch": 1023} {"train_loss": -37.99266815185547, "global_step": 123881, "epoch": 1023} {"train_loss": -36.74946975708008, "global_step": 123882, "epoch": 1023} {"train_loss": -37.982574462890625, "global_step": 123883, "epoch": 1023} {"train_loss": -38.27158737182617, "global_step": 123884, "epoch": 1023} {"train_loss": -38.89563751220703, "global_step": 123885, "epoch": 1023} {"train_loss": -38.12702941894531, "global_step": 123886, "epoch": 1023} {"train_loss": -38.92887878417969, "global_step": 123887, "epoch": 1023} {"train_loss": -39.2991828918457, "global_step": 123888, "epoch": 1023} {"train_loss": -38.12846755981445, "global_step": 123889, "epoch": 1023} {"train_loss": -37.90849685668945, "global_step": 123890, "epoch": 1023} {"train_loss": -38.68032455444336, "global_step": 123891, "epoch": 1023} {"train_loss": -38.55970764160156, "global_step": 123892, "epoch": 1023} {"train_loss": -39.19096755981445, "global_step": 123893, "epoch": 1023} {"train_loss": -39.14335632324219, "global_step": 123894, "epoch": 1023} {"train_loss": -37.71709060668945, "global_step": 123895, "epoch": 1023} {"train_loss": -38.58562088012695, "global_step": 123896, "epoch": 1023} {"train_loss": -38.55348587036133, "global_step": 123897, "epoch": 1023} {"train_loss": -38.895999908447266, "global_step": 123898, "epoch": 1023} {"train_loss": -39.195465087890625, "global_step": 123899, "epoch": 1023} {"train_loss": -38.991512298583984, "global_step": 123900, "epoch": 1023} {"train_loss": -39.73884963989258, "global_step": 123901, "epoch": 1023} {"train_loss": -37.653316497802734, "global_step": 123902, "epoch": 1023} {"train_loss": -38.837756007170874, "global_step": 123903, "epoch": 1023, "val_loss": 2634835.75} {"train_loss": -38.15358352661133, "global_step": 123904, "epoch": 1024} {"train_loss": -38.075828552246094, "global_step": 123905, "epoch": 1024} {"train_loss": -36.61829376220703, "global_step": 123906, "epoch": 1024} {"train_loss": -38.243682861328125, "global_step": 123907, "epoch": 1024} {"train_loss": -38.50323486328125, "global_step": 123908, "epoch": 1024} {"train_loss": -37.82896041870117, "global_step": 123909, "epoch": 1024} {"train_loss": -37.522430419921875, "global_step": 123910, "epoch": 1024} {"train_loss": -37.43471908569336, "global_step": 123911, "epoch": 1024} {"train_loss": -36.941741943359375, "global_step": 123912, "epoch": 1024} {"train_loss": -36.791996002197266, "global_step": 123913, "epoch": 1024} {"train_loss": -38.920204162597656, "global_step": 123914, "epoch": 1024} {"train_loss": -37.33944320678711, "global_step": 123915, "epoch": 1024} {"train_loss": -39.14899826049805, "global_step": 123916, "epoch": 1024} {"train_loss": -37.938961029052734, "global_step": 123917, "epoch": 1024} {"train_loss": -38.88920974731445, "global_step": 123918, "epoch": 1024} {"train_loss": -38.39079666137695, "global_step": 123919, "epoch": 1024} {"train_loss": -38.773284912109375, "global_step": 123920, "epoch": 1024} {"train_loss": -38.633663177490234, "global_step": 123921, "epoch": 1024} {"train_loss": -38.80712127685547, "global_step": 123922, "epoch": 1024} {"train_loss": -38.87534713745117, "global_step": 123923, "epoch": 1024} {"train_loss": -39.59300231933594, "global_step": 123924, "epoch": 1024} {"train_loss": -38.66526412963867, "global_step": 123925, "epoch": 1024} {"train_loss": -39.679500579833984, "global_step": 123926, "epoch": 1024} {"train_loss": -39.04176330566406, "global_step": 123927, "epoch": 1024} {"train_loss": -39.36405563354492, "global_step": 123928, "epoch": 1024} {"train_loss": -38.728572845458984, "global_step": 123929, "epoch": 1024} {"train_loss": -39.005863189697266, "global_step": 123930, "epoch": 1024} {"train_loss": -38.423004150390625, "global_step": 123931, "epoch": 1024} {"train_loss": -38.9266357421875, "global_step": 123932, "epoch": 1024} {"train_loss": -39.61799240112305, "global_step": 123933, "epoch": 1024} {"train_loss": -38.24373245239258, "global_step": 123934, "epoch": 1024} {"train_loss": -39.922760009765625, "global_step": 123935, "epoch": 1024} {"train_loss": -39.08408737182617, "global_step": 123936, "epoch": 1024} {"train_loss": -39.92042922973633, "global_step": 123937, "epoch": 1024} {"train_loss": -39.61576461791992, "global_step": 123938, "epoch": 1024} {"train_loss": -39.904476165771484, "global_step": 123939, "epoch": 1024} {"train_loss": -39.25245666503906, "global_step": 123940, "epoch": 1024} {"train_loss": -39.99817657470703, "global_step": 123941, "epoch": 1024} {"train_loss": -39.18525695800781, "global_step": 123942, "epoch": 1024} {"train_loss": -39.65913009643555, "global_step": 123943, "epoch": 1024} {"train_loss": -39.028133392333984, "global_step": 123944, "epoch": 1024} {"train_loss": -39.34484100341797, "global_step": 123945, "epoch": 1024} {"train_loss": -39.20343017578125, "global_step": 123946, "epoch": 1024} {"train_loss": -39.725032806396484, "global_step": 123947, "epoch": 1024} {"train_loss": -39.06982421875, "global_step": 123948, "epoch": 1024} {"train_loss": -39.42661666870117, "global_step": 123949, "epoch": 1024} {"train_loss": -39.71314239501953, "global_step": 123950, "epoch": 1024} {"train_loss": -39.78840255737305, "global_step": 123951, "epoch": 1024} {"train_loss": -39.518367767333984, "global_step": 123952, "epoch": 1024} {"train_loss": -39.702083587646484, "global_step": 123953, "epoch": 1024} {"train_loss": -39.71053695678711, "global_step": 123954, "epoch": 1024} {"train_loss": -40.66164779663086, "global_step": 123955, "epoch": 1024} {"train_loss": -39.57341003417969, "global_step": 123956, "epoch": 1024} {"train_loss": -39.75712585449219, "global_step": 123957, "epoch": 1024} {"train_loss": -38.54496383666992, "global_step": 123958, "epoch": 1024} {"train_loss": -40.19404220581055, "global_step": 123959, "epoch": 1024} {"train_loss": -40.07282638549805, "global_step": 123960, "epoch": 1024} {"train_loss": -39.30915069580078, "global_step": 123961, "epoch": 1024} {"train_loss": -38.185420989990234, "global_step": 123962, "epoch": 1024} {"train_loss": -38.937618255615234, "global_step": 123963, "epoch": 1024} {"train_loss": -39.39716720581055, "global_step": 123964, "epoch": 1024} {"train_loss": -40.64052200317383, "global_step": 123965, "epoch": 1024} {"train_loss": -40.341854095458984, "global_step": 123966, "epoch": 1024} {"train_loss": -39.931453704833984, "global_step": 123967, "epoch": 1024} {"train_loss": -40.0020751953125, "global_step": 123968, "epoch": 1024} {"train_loss": -39.9887809753418, "global_step": 123969, "epoch": 1024} {"train_loss": -39.940650939941406, "global_step": 123970, "epoch": 1024} {"train_loss": -39.20124435424805, "global_step": 123971, "epoch": 1024} {"train_loss": -39.64613723754883, "global_step": 123972, "epoch": 1024} {"train_loss": -39.91482162475586, "global_step": 123973, "epoch": 1024} {"train_loss": -40.3784065246582, "global_step": 123974, "epoch": 1024} {"train_loss": -39.57277297973633, "global_step": 123975, "epoch": 1024} {"train_loss": -38.720542907714844, "global_step": 123976, "epoch": 1024} {"train_loss": -39.286006927490234, "global_step": 123977, "epoch": 1024} {"train_loss": -39.9151496887207, "global_step": 123978, "epoch": 1024} {"train_loss": -38.871910095214844, "global_step": 123979, "epoch": 1024} {"train_loss": -38.55751419067383, "global_step": 123980, "epoch": 1024} {"train_loss": -36.94900131225586, "global_step": 123981, "epoch": 1024} {"train_loss": -36.95299530029297, "global_step": 123982, "epoch": 1024} {"train_loss": -36.93195724487305, "global_step": 123983, "epoch": 1024} {"train_loss": -37.8369255065918, "global_step": 123984, "epoch": 1024} {"train_loss": -39.71006393432617, "global_step": 123985, "epoch": 1024} {"train_loss": -38.8253288269043, "global_step": 123986, "epoch": 1024} {"train_loss": -36.1480598449707, "global_step": 123987, "epoch": 1024} {"train_loss": -34.9781379699707, "global_step": 123988, "epoch": 1024} {"train_loss": -36.00117492675781, "global_step": 123989, "epoch": 1024} {"train_loss": -38.13875961303711, "global_step": 123990, "epoch": 1024} {"train_loss": -35.41591262817383, "global_step": 123991, "epoch": 1024} {"train_loss": -34.98563766479492, "global_step": 123992, "epoch": 1024} {"train_loss": -36.77381134033203, "global_step": 123993, "epoch": 1024} {"train_loss": -36.1396484375, "global_step": 123994, "epoch": 1024} {"train_loss": -35.38016891479492, "global_step": 123995, "epoch": 1024} {"train_loss": -38.55084991455078, "global_step": 123996, "epoch": 1024} {"train_loss": -37.652164459228516, "global_step": 123997, "epoch": 1024} {"train_loss": -37.206581115722656, "global_step": 123998, "epoch": 1024} {"train_loss": -36.55177688598633, "global_step": 123999, "epoch": 1024} {"train_loss": -37.61692428588867, "global_step": 124000, "epoch": 1024} {"train_loss": -36.87233352661133, "global_step": 124001, "epoch": 1024} {"train_loss": -38.755550384521484, "global_step": 124002, "epoch": 1024} {"train_loss": -35.8891716003418, "global_step": 124003, "epoch": 1024} {"train_loss": -37.49060821533203, "global_step": 124004, "epoch": 1024} {"train_loss": -38.7509880065918, "global_step": 124005, "epoch": 1024} {"train_loss": -37.58156967163086, "global_step": 124006, "epoch": 1024} {"train_loss": -38.23957824707031, "global_step": 124007, "epoch": 1024} {"train_loss": -38.31816482543945, "global_step": 124008, "epoch": 1024} {"train_loss": -38.34698486328125, "global_step": 124009, "epoch": 1024} {"train_loss": -38.335811614990234, "global_step": 124010, "epoch": 1024} {"train_loss": -38.9203987121582, "global_step": 124011, "epoch": 1024} {"train_loss": -38.85286331176758, "global_step": 124012, "epoch": 1024} {"train_loss": -38.56081771850586, "global_step": 124013, "epoch": 1024} {"train_loss": -38.655799865722656, "global_step": 124014, "epoch": 1024} {"train_loss": -38.24199295043945, "global_step": 124015, "epoch": 1024} {"train_loss": -39.13896179199219, "global_step": 124016, "epoch": 1024} {"train_loss": -37.889644622802734, "global_step": 124017, "epoch": 1024} {"train_loss": -39.5235595703125, "global_step": 124018, "epoch": 1024} {"train_loss": -38.95009994506836, "global_step": 124019, "epoch": 1024} {"train_loss": -39.43569564819336, "global_step": 124020, "epoch": 1024} {"train_loss": -39.188411712646484, "global_step": 124021, "epoch": 1024} {"train_loss": -39.684200286865234, "global_step": 124022, "epoch": 1024} {"train_loss": -38.78544998168945, "global_step": 124023, "epoch": 1024} {"train_loss": -38.628628439154504, "global_step": 124024, "epoch": 1024, "val_loss": 2806124.0} {"train_loss": -38.24645233154297, "global_step": 124025, "epoch": 1025} {"train_loss": -39.41889953613281, "global_step": 124026, "epoch": 1025} {"train_loss": -39.59330368041992, "global_step": 124027, "epoch": 1025} {"train_loss": -37.84678268432617, "global_step": 124028, "epoch": 1025} {"train_loss": -39.41451644897461, "global_step": 124029, "epoch": 1025} {"train_loss": -39.20486068725586, "global_step": 124030, "epoch": 1025} {"train_loss": -39.49570846557617, "global_step": 124031, "epoch": 1025} {"train_loss": -39.136932373046875, "global_step": 124032, "epoch": 1025} {"train_loss": -39.660491943359375, "global_step": 124033, "epoch": 1025} {"train_loss": -40.19187545776367, "global_step": 124034, "epoch": 1025} {"train_loss": -37.9742431640625, "global_step": 124035, "epoch": 1025} {"train_loss": -39.89148712158203, "global_step": 124036, "epoch": 1025} {"train_loss": -33.51121139526367, "global_step": 124037, "epoch": 1025} {"train_loss": -39.33681106567383, "global_step": 124038, "epoch": 1025} {"train_loss": -37.72711944580078, "global_step": 124039, "epoch": 1025} {"train_loss": -37.3090705871582, "global_step": 124040, "epoch": 1025} {"train_loss": -35.29295349121094, "global_step": 124041, "epoch": 1025} {"train_loss": -20.429994583129883, "global_step": 124042, "epoch": 1025} {"train_loss": -36.86420440673828, "global_step": 124043, "epoch": 1025} {"train_loss": -30.009143829345703, "global_step": 124044, "epoch": 1025} {"train_loss": -16.54823875427246, "global_step": 124045, "epoch": 1025} {"train_loss": -33.87911605834961, "global_step": 124046, "epoch": 1025} {"train_loss": -29.425207138061523, "global_step": 124047, "epoch": 1025} {"train_loss": -31.832128524780273, "global_step": 124048, "epoch": 1025} {"train_loss": -24.772830963134766, "global_step": 124049, "epoch": 1025} {"train_loss": -32.199073791503906, "global_step": 124050, "epoch": 1025} {"train_loss": -35.14980697631836, "global_step": 124051, "epoch": 1025} {"train_loss": -32.89097213745117, "global_step": 124052, "epoch": 1025} {"train_loss": -34.07598114013672, "global_step": 124053, "epoch": 1025} {"train_loss": -26.23377799987793, "global_step": 124054, "epoch": 1025} {"train_loss": -30.823352813720703, "global_step": 124055, "epoch": 1025} {"train_loss": -30.403949737548828, "global_step": 124056, "epoch": 1025} {"train_loss": -34.065608978271484, "global_step": 124057, "epoch": 1025} {"train_loss": -33.166786193847656, "global_step": 124058, "epoch": 1025} {"train_loss": -28.449689865112305, "global_step": 124059, "epoch": 1025} {"train_loss": -33.2652473449707, "global_step": 124060, "epoch": 1025} {"train_loss": -34.485389709472656, "global_step": 124061, "epoch": 1025} {"train_loss": -33.68050765991211, "global_step": 124062, "epoch": 1025} {"train_loss": -34.24057388305664, "global_step": 124063, "epoch": 1025} {"train_loss": -32.95267105102539, "global_step": 124064, "epoch": 1025} {"train_loss": -35.337772369384766, "global_step": 124065, "epoch": 1025} {"train_loss": -35.22085189819336, "global_step": 124066, "epoch": 1025} {"train_loss": -35.45386505126953, "global_step": 124067, "epoch": 1025} {"train_loss": -35.715309143066406, "global_step": 124068, "epoch": 1025} {"train_loss": -36.268917083740234, "global_step": 124069, "epoch": 1025} {"train_loss": -36.487220764160156, "global_step": 124070, "epoch": 1025} {"train_loss": -35.84478759765625, "global_step": 124071, "epoch": 1025} {"train_loss": -35.916866302490234, "global_step": 124072, "epoch": 1025} {"train_loss": -34.971038818359375, "global_step": 124073, "epoch": 1025} {"train_loss": -36.23533248901367, "global_step": 124074, "epoch": 1025} {"train_loss": -36.35212326049805, "global_step": 124075, "epoch": 1025} {"train_loss": -36.27880859375, "global_step": 124076, "epoch": 1025} {"train_loss": -35.579402923583984, "global_step": 124077, "epoch": 1025} {"train_loss": -36.00666427612305, "global_step": 124078, "epoch": 1025} {"train_loss": -36.576473236083984, "global_step": 124079, "epoch": 1025} {"train_loss": -36.29833984375, "global_step": 124080, "epoch": 1025} {"train_loss": -36.53766632080078, "global_step": 124081, "epoch": 1025} {"train_loss": -36.68764114379883, "global_step": 124082, "epoch": 1025} {"train_loss": -36.82681655883789, "global_step": 124083, "epoch": 1025} {"train_loss": -36.839813232421875, "global_step": 124084, "epoch": 1025} {"train_loss": -36.30277633666992, "global_step": 124085, "epoch": 1025} {"train_loss": -36.839229583740234, "global_step": 124086, "epoch": 1025} {"train_loss": -37.006893157958984, "global_step": 124087, "epoch": 1025} {"train_loss": -37.10369873046875, "global_step": 124088, "epoch": 1025} {"train_loss": -37.08025360107422, "global_step": 124089, "epoch": 1025} {"train_loss": -36.45729064941406, "global_step": 124090, "epoch": 1025} {"train_loss": -37.52224349975586, "global_step": 124091, "epoch": 1025} {"train_loss": -36.82904815673828, "global_step": 124092, "epoch": 1025} {"train_loss": -37.26155471801758, "global_step": 124093, "epoch": 1025} {"train_loss": -37.043663024902344, "global_step": 124094, "epoch": 1025} {"train_loss": -37.5692138671875, "global_step": 124095, "epoch": 1025} {"train_loss": -37.23995590209961, "global_step": 124096, "epoch": 1025} {"train_loss": -37.46255111694336, "global_step": 124097, "epoch": 1025} {"train_loss": -37.45318603515625, "global_step": 124098, "epoch": 1025} {"train_loss": -37.52272033691406, "global_step": 124099, "epoch": 1025} {"train_loss": -37.544471740722656, "global_step": 124100, "epoch": 1025} {"train_loss": -37.75746154785156, "global_step": 124101, "epoch": 1025} {"train_loss": -37.559722900390625, "global_step": 124102, "epoch": 1025} {"train_loss": -36.78860092163086, "global_step": 124103, "epoch": 1025} {"train_loss": -37.30522537231445, "global_step": 124104, "epoch": 1025} {"train_loss": -37.65029525756836, "global_step": 124105, "epoch": 1025} {"train_loss": -36.77195358276367, "global_step": 124106, "epoch": 1025} {"train_loss": -37.80398941040039, "global_step": 124107, "epoch": 1025} {"train_loss": -37.69417953491211, "global_step": 124108, "epoch": 1025} {"train_loss": -38.12269973754883, "global_step": 124109, "epoch": 1025} {"train_loss": -37.91348648071289, "global_step": 124110, "epoch": 1025} {"train_loss": -38.336814880371094, "global_step": 124111, "epoch": 1025} {"train_loss": -37.55337142944336, "global_step": 124112, "epoch": 1025} {"train_loss": -37.48889923095703, "global_step": 124113, "epoch": 1025} {"train_loss": -38.18333435058594, "global_step": 124114, "epoch": 1025} {"train_loss": -38.347713470458984, "global_step": 124115, "epoch": 1025} {"train_loss": -37.783203125, "global_step": 124116, "epoch": 1025} {"train_loss": -38.00688552856445, "global_step": 124117, "epoch": 1025} {"train_loss": -38.82497787475586, "global_step": 124118, "epoch": 1025} {"train_loss": -37.61326217651367, "global_step": 124119, "epoch": 1025} {"train_loss": -37.755611419677734, "global_step": 124120, "epoch": 1025} {"train_loss": -37.51409912109375, "global_step": 124121, "epoch": 1025} {"train_loss": -38.363033294677734, "global_step": 124122, "epoch": 1025} {"train_loss": -38.2854118347168, "global_step": 124123, "epoch": 1025} {"train_loss": -38.0987434387207, "global_step": 124124, "epoch": 1025} {"train_loss": -37.99544906616211, "global_step": 124125, "epoch": 1025} {"train_loss": -37.64768981933594, "global_step": 124126, "epoch": 1025} {"train_loss": -38.29135513305664, "global_step": 124127, "epoch": 1025} {"train_loss": -38.198028564453125, "global_step": 124128, "epoch": 1025} {"train_loss": -38.473873138427734, "global_step": 124129, "epoch": 1025} {"train_loss": -38.365333557128906, "global_step": 124130, "epoch": 1025} {"train_loss": -38.382137298583984, "global_step": 124131, "epoch": 1025} {"train_loss": -38.39164352416992, "global_step": 124132, "epoch": 1025} {"train_loss": -38.50551986694336, "global_step": 124133, "epoch": 1025} {"train_loss": -38.785892486572266, "global_step": 124134, "epoch": 1025} {"train_loss": -38.77766418457031, "global_step": 124135, "epoch": 1025} {"train_loss": -38.563873291015625, "global_step": 124136, "epoch": 1025} {"train_loss": -38.52011489868164, "global_step": 124137, "epoch": 1025} {"train_loss": -37.9001579284668, "global_step": 124138, "epoch": 1025} {"train_loss": -38.526214599609375, "global_step": 124139, "epoch": 1025} {"train_loss": -38.47428512573242, "global_step": 124140, "epoch": 1025} {"train_loss": -38.679969787597656, "global_step": 124141, "epoch": 1025} {"train_loss": -38.72587203979492, "global_step": 124142, "epoch": 1025} {"train_loss": -38.832672119140625, "global_step": 124143, "epoch": 1025} {"train_loss": -38.7304801940918, "global_step": 124144, "epoch": 1025} {"train_loss": -36.31319143752421, "global_step": 124145, "epoch": 1025, "val_loss": 2540737.5} {"train_loss": -39.18084716796875, "global_step": 124146, "epoch": 1026} {"train_loss": -39.3743896484375, "global_step": 124147, "epoch": 1026} {"train_loss": -38.7140998840332, "global_step": 124148, "epoch": 1026} {"train_loss": -38.46501541137695, "global_step": 124149, "epoch": 1026} {"train_loss": -39.58315658569336, "global_step": 124150, "epoch": 1026} {"train_loss": -38.48653793334961, "global_step": 124151, "epoch": 1026} {"train_loss": -38.57822036743164, "global_step": 124152, "epoch": 1026} {"train_loss": -38.83757781982422, "global_step": 124153, "epoch": 1026} {"train_loss": -39.11859893798828, "global_step": 124154, "epoch": 1026} {"train_loss": -38.74845504760742, "global_step": 124155, "epoch": 1026} {"train_loss": -39.3597526550293, "global_step": 124156, "epoch": 1026} {"train_loss": -38.942481994628906, "global_step": 124157, "epoch": 1026} {"train_loss": -39.2330436706543, "global_step": 124158, "epoch": 1026} {"train_loss": -38.986507415771484, "global_step": 124159, "epoch": 1026} {"train_loss": -39.08930587768555, "global_step": 124160, "epoch": 1026} {"train_loss": -39.194122314453125, "global_step": 124161, "epoch": 1026} {"train_loss": -39.42003631591797, "global_step": 124162, "epoch": 1026} {"train_loss": -39.541011810302734, "global_step": 124163, "epoch": 1026} {"train_loss": -39.348628997802734, "global_step": 124164, "epoch": 1026} {"train_loss": -39.34550476074219, "global_step": 124165, "epoch": 1026} {"train_loss": -39.55598449707031, "global_step": 124166, "epoch": 1026} {"train_loss": -39.18131637573242, "global_step": 124167, "epoch": 1026} {"train_loss": -39.50979232788086, "global_step": 124168, "epoch": 1026} {"train_loss": -39.68685531616211, "global_step": 124169, "epoch": 1026} {"train_loss": -39.1267204284668, "global_step": 124170, "epoch": 1026} {"train_loss": -39.194881439208984, "global_step": 124171, "epoch": 1026} {"train_loss": -39.892303466796875, "global_step": 124172, "epoch": 1026} {"train_loss": -39.486690521240234, "global_step": 124173, "epoch": 1026} {"train_loss": -39.86415481567383, "global_step": 124174, "epoch": 1026} {"train_loss": -39.166866302490234, "global_step": 124175, "epoch": 1026} {"train_loss": -39.68320846557617, "global_step": 124176, "epoch": 1026} {"train_loss": -39.72982406616211, "global_step": 124177, "epoch": 1026} {"train_loss": -39.40601348876953, "global_step": 124178, "epoch": 1026} {"train_loss": -39.3737907409668, "global_step": 124179, "epoch": 1026} {"train_loss": -39.042869567871094, "global_step": 124180, "epoch": 1026} {"train_loss": -38.51361083984375, "global_step": 124181, "epoch": 1026} {"train_loss": -38.65799331665039, "global_step": 124182, "epoch": 1026} {"train_loss": -39.25020217895508, "global_step": 124183, "epoch": 1026} {"train_loss": -38.47296905517578, "global_step": 124184, "epoch": 1026} {"train_loss": -38.38320541381836, "global_step": 124185, "epoch": 1026} {"train_loss": -38.21526336669922, "global_step": 124186, "epoch": 1026} {"train_loss": -38.30813217163086, "global_step": 124187, "epoch": 1026} {"train_loss": -39.2674446105957, "global_step": 124188, "epoch": 1026} {"train_loss": -37.855384826660156, "global_step": 124189, "epoch": 1026} {"train_loss": -36.222145080566406, "global_step": 124190, "epoch": 1026} {"train_loss": -37.46863555908203, "global_step": 124191, "epoch": 1026} {"train_loss": -37.0565071105957, "global_step": 124192, "epoch": 1026} {"train_loss": -35.121795654296875, "global_step": 124193, "epoch": 1026} {"train_loss": -35.80900192260742, "global_step": 124194, "epoch": 1026} {"train_loss": -35.372711181640625, "global_step": 124195, "epoch": 1026} {"train_loss": -39.17191696166992, "global_step": 124196, "epoch": 1026} {"train_loss": -37.7982292175293, "global_step": 124197, "epoch": 1026} {"train_loss": -36.671844482421875, "global_step": 124198, "epoch": 1026} {"train_loss": -36.00332260131836, "global_step": 124199, "epoch": 1026} {"train_loss": -37.234703063964844, "global_step": 124200, "epoch": 1026} {"train_loss": -36.71918869018555, "global_step": 124201, "epoch": 1026} {"train_loss": -33.67256546020508, "global_step": 124202, "epoch": 1026} {"train_loss": -37.84574508666992, "global_step": 124203, "epoch": 1026} {"train_loss": -34.78312301635742, "global_step": 124204, "epoch": 1026} {"train_loss": -38.85799026489258, "global_step": 124205, "epoch": 1026} {"train_loss": -35.44614791870117, "global_step": 124206, "epoch": 1026} {"train_loss": -37.8487434387207, "global_step": 124207, "epoch": 1026} {"train_loss": -37.47478103637695, "global_step": 124208, "epoch": 1026} {"train_loss": -37.872291564941406, "global_step": 124209, "epoch": 1026} {"train_loss": -37.42301559448242, "global_step": 124210, "epoch": 1026} {"train_loss": -37.910396575927734, "global_step": 124211, "epoch": 1026} {"train_loss": -38.2314338684082, "global_step": 124212, "epoch": 1026} {"train_loss": -38.36005783081055, "global_step": 124213, "epoch": 1026} {"train_loss": -38.804710388183594, "global_step": 124214, "epoch": 1026} {"train_loss": -38.02959060668945, "global_step": 124215, "epoch": 1026} {"train_loss": -38.757633209228516, "global_step": 124216, "epoch": 1026} {"train_loss": -38.20245361328125, "global_step": 124217, "epoch": 1026} {"train_loss": -39.25201416015625, "global_step": 124218, "epoch": 1026} {"train_loss": -37.85145950317383, "global_step": 124219, "epoch": 1026} {"train_loss": -39.221004486083984, "global_step": 124220, "epoch": 1026} {"train_loss": -37.85422897338867, "global_step": 124221, "epoch": 1026} {"train_loss": -38.36348342895508, "global_step": 124222, "epoch": 1026} {"train_loss": -39.06272506713867, "global_step": 124223, "epoch": 1026} {"train_loss": -39.30635452270508, "global_step": 124224, "epoch": 1026} {"train_loss": -39.37457275390625, "global_step": 124225, "epoch": 1026} {"train_loss": -39.16225814819336, "global_step": 124226, "epoch": 1026} {"train_loss": -38.56585693359375, "global_step": 124227, "epoch": 1026} {"train_loss": -38.62589645385742, "global_step": 124228, "epoch": 1026} {"train_loss": -39.257080078125, "global_step": 124229, "epoch": 1026} {"train_loss": -38.84975814819336, "global_step": 124230, "epoch": 1026} {"train_loss": -39.11904525756836, "global_step": 124231, "epoch": 1026} {"train_loss": -39.45283889770508, "global_step": 124232, "epoch": 1026} {"train_loss": -39.4552116394043, "global_step": 124233, "epoch": 1026} {"train_loss": -39.604732513427734, "global_step": 124234, "epoch": 1026} {"train_loss": -39.3607177734375, "global_step": 124235, "epoch": 1026} {"train_loss": -39.1872444152832, "global_step": 124236, "epoch": 1026} {"train_loss": -38.736663818359375, "global_step": 124237, "epoch": 1026} {"train_loss": -39.5526008605957, "global_step": 124238, "epoch": 1026} {"train_loss": -39.78117752075195, "global_step": 124239, "epoch": 1026} {"train_loss": -39.584957122802734, "global_step": 124240, "epoch": 1026} {"train_loss": -39.569610595703125, "global_step": 124241, "epoch": 1026} {"train_loss": -39.75700759887695, "global_step": 124242, "epoch": 1026} {"train_loss": -39.036495208740234, "global_step": 124243, "epoch": 1026} {"train_loss": -39.35588455200195, "global_step": 124244, "epoch": 1026} {"train_loss": -39.73496627807617, "global_step": 124245, "epoch": 1026} {"train_loss": -39.244728088378906, "global_step": 124246, "epoch": 1026} {"train_loss": -39.53847122192383, "global_step": 124247, "epoch": 1026} {"train_loss": -39.5437126159668, "global_step": 124248, "epoch": 1026} {"train_loss": -39.85517120361328, "global_step": 124249, "epoch": 1026} {"train_loss": -39.31789016723633, "global_step": 124250, "epoch": 1026} {"train_loss": -39.78900146484375, "global_step": 124251, "epoch": 1026} {"train_loss": -39.94914627075195, "global_step": 124252, "epoch": 1026} {"train_loss": -39.13204574584961, "global_step": 124253, "epoch": 1026} {"train_loss": -38.40626907348633, "global_step": 124254, "epoch": 1026} {"train_loss": -38.51731491088867, "global_step": 124255, "epoch": 1026} {"train_loss": -33.66805648803711, "global_step": 124256, "epoch": 1026} {"train_loss": -19.53152847290039, "global_step": 124257, "epoch": 1026} {"train_loss": 6.881782054901123, "global_step": 124258, "epoch": 1026} {"train_loss": 13.755789756774902, "global_step": 124259, "epoch": 1026} {"train_loss": -36.533138275146484, "global_step": 124260, "epoch": 1026} {"train_loss": -11.834389686584473, "global_step": 124261, "epoch": 1026} {"train_loss": -28.150390625, "global_step": 124262, "epoch": 1026} {"train_loss": -20.66358757019043, "global_step": 124263, "epoch": 1026} {"train_loss": -36.0365104675293, "global_step": 124264, "epoch": 1026} {"train_loss": -21.720279693603516, "global_step": 124265, "epoch": 1026} {"train_loss": -36.973195072047965, "global_step": 124266, "epoch": 1026, "val_loss": 2719933.0} {"train_loss": -29.130191802978516, "global_step": 124267, "epoch": 1027} {"train_loss": -29.1479549407959, "global_step": 124268, "epoch": 1027} {"train_loss": -36.93743896484375, "global_step": 124269, "epoch": 1027} {"train_loss": -34.137718200683594, "global_step": 124270, "epoch": 1027} {"train_loss": -32.28760528564453, "global_step": 124271, "epoch": 1027} {"train_loss": -36.44060134887695, "global_step": 124272, "epoch": 1027} {"train_loss": -37.07831573486328, "global_step": 124273, "epoch": 1027} {"train_loss": -34.410709381103516, "global_step": 124274, "epoch": 1027} {"train_loss": -35.49262619018555, "global_step": 124275, "epoch": 1027} {"train_loss": -37.05634307861328, "global_step": 124276, "epoch": 1027} {"train_loss": -36.28487777709961, "global_step": 124277, "epoch": 1027} {"train_loss": -35.544254302978516, "global_step": 124278, "epoch": 1027} {"train_loss": -35.853248596191406, "global_step": 124279, "epoch": 1027} {"train_loss": -37.152244567871094, "global_step": 124280, "epoch": 1027} {"train_loss": -37.6285514831543, "global_step": 124281, "epoch": 1027} {"train_loss": -37.32273483276367, "global_step": 124282, "epoch": 1027} {"train_loss": -36.32961654663086, "global_step": 124283, "epoch": 1027} {"train_loss": -36.84015655517578, "global_step": 124284, "epoch": 1027} {"train_loss": -37.90513229370117, "global_step": 124285, "epoch": 1027} {"train_loss": -36.000885009765625, "global_step": 124286, "epoch": 1027} {"train_loss": -37.580955505371094, "global_step": 124287, "epoch": 1027} {"train_loss": -37.396541595458984, "global_step": 124288, "epoch": 1027} {"train_loss": -37.716163635253906, "global_step": 124289, "epoch": 1027} {"train_loss": -37.59797286987305, "global_step": 124290, "epoch": 1027} {"train_loss": -37.74470138549805, "global_step": 124291, "epoch": 1027} {"train_loss": -38.165340423583984, "global_step": 124292, "epoch": 1027} {"train_loss": -37.739501953125, "global_step": 124293, "epoch": 1027} {"train_loss": -38.1271858215332, "global_step": 124294, "epoch": 1027} {"train_loss": -38.156280517578125, "global_step": 124295, "epoch": 1027} {"train_loss": -38.358612060546875, "global_step": 124296, "epoch": 1027} {"train_loss": -37.92942810058594, "global_step": 124297, "epoch": 1027} {"train_loss": -38.01636505126953, "global_step": 124298, "epoch": 1027} {"train_loss": -37.823760986328125, "global_step": 124299, "epoch": 1027} {"train_loss": -37.85689926147461, "global_step": 124300, "epoch": 1027} {"train_loss": -38.0362548828125, "global_step": 124301, "epoch": 1027} {"train_loss": -38.78757858276367, "global_step": 124302, "epoch": 1027} {"train_loss": -38.660518646240234, "global_step": 124303, "epoch": 1027} {"train_loss": -38.4970588684082, "global_step": 124304, "epoch": 1027} {"train_loss": -38.46764373779297, "global_step": 124305, "epoch": 1027} {"train_loss": -38.34530258178711, "global_step": 124306, "epoch": 1027} {"train_loss": -38.33723831176758, "global_step": 124307, "epoch": 1027} {"train_loss": -37.409339904785156, "global_step": 124308, "epoch": 1027} {"train_loss": -38.30311965942383, "global_step": 124309, "epoch": 1027} {"train_loss": -38.45506286621094, "global_step": 124310, "epoch": 1027} {"train_loss": -38.70737838745117, "global_step": 124311, "epoch": 1027} {"train_loss": -38.554359436035156, "global_step": 124312, "epoch": 1027} {"train_loss": -39.080604553222656, "global_step": 124313, "epoch": 1027} {"train_loss": -37.721866607666016, "global_step": 124314, "epoch": 1027} {"train_loss": -38.75752639770508, "global_step": 124315, "epoch": 1027} {"train_loss": -38.84602737426758, "global_step": 124316, "epoch": 1027} {"train_loss": -37.34767532348633, "global_step": 124317, "epoch": 1027} {"train_loss": -38.65171432495117, "global_step": 124318, "epoch": 1027} {"train_loss": -39.1693229675293, "global_step": 124319, "epoch": 1027} {"train_loss": -39.066829681396484, "global_step": 124320, "epoch": 1027} {"train_loss": -38.78828811645508, "global_step": 124321, "epoch": 1027} {"train_loss": -39.29212188720703, "global_step": 124322, "epoch": 1027} {"train_loss": -39.187591552734375, "global_step": 124323, "epoch": 1027} {"train_loss": -39.387184143066406, "global_step": 124324, "epoch": 1027} {"train_loss": -38.94224166870117, "global_step": 124325, "epoch": 1027} {"train_loss": -38.94426727294922, "global_step": 124326, "epoch": 1027} {"train_loss": -39.12800598144531, "global_step": 124327, "epoch": 1027} {"train_loss": -39.596797943115234, "global_step": 124328, "epoch": 1027} {"train_loss": -39.39105987548828, "global_step": 124329, "epoch": 1027} {"train_loss": -39.348243713378906, "global_step": 124330, "epoch": 1027} {"train_loss": -39.658687591552734, "global_step": 124331, "epoch": 1027} {"train_loss": -39.451637268066406, "global_step": 124332, "epoch": 1027} {"train_loss": -38.956825256347656, "global_step": 124333, "epoch": 1027} {"train_loss": -38.74532699584961, "global_step": 124334, "epoch": 1027} {"train_loss": -39.22858810424805, "global_step": 124335, "epoch": 1027} {"train_loss": -39.41135025024414, "global_step": 124336, "epoch": 1027} {"train_loss": -38.52947998046875, "global_step": 124337, "epoch": 1027} {"train_loss": -38.89020919799805, "global_step": 124338, "epoch": 1027} {"train_loss": -38.99753952026367, "global_step": 124339, "epoch": 1027} {"train_loss": -39.198673248291016, "global_step": 124340, "epoch": 1027} {"train_loss": -39.71556854248047, "global_step": 124341, "epoch": 1027} {"train_loss": -39.07355499267578, "global_step": 124342, "epoch": 1027} {"train_loss": -39.39508056640625, "global_step": 124343, "epoch": 1027} {"train_loss": -39.41506576538086, "global_step": 124344, "epoch": 1027} {"train_loss": -39.80192184448242, "global_step": 124345, "epoch": 1027} {"train_loss": -39.45521926879883, "global_step": 124346, "epoch": 1027} {"train_loss": -39.72351837158203, "global_step": 124347, "epoch": 1027} {"train_loss": -39.672523498535156, "global_step": 124348, "epoch": 1027} {"train_loss": -39.81574630737305, "global_step": 124349, "epoch": 1027} {"train_loss": -39.838191986083984, "global_step": 124350, "epoch": 1027} {"train_loss": -39.85334396362305, "global_step": 124351, "epoch": 1027} {"train_loss": -39.61572265625, "global_step": 124352, "epoch": 1027} {"train_loss": -39.60565948486328, "global_step": 124353, "epoch": 1027} {"train_loss": -39.54813766479492, "global_step": 124354, "epoch": 1027} {"train_loss": -38.516456604003906, "global_step": 124355, "epoch": 1027} {"train_loss": -39.916744232177734, "global_step": 124356, "epoch": 1027} {"train_loss": -39.560054779052734, "global_step": 124357, "epoch": 1027} {"train_loss": -40.014190673828125, "global_step": 124358, "epoch": 1027} {"train_loss": -39.24882125854492, "global_step": 124359, "epoch": 1027} {"train_loss": -39.91337966918945, "global_step": 124360, "epoch": 1027} {"train_loss": -39.45261001586914, "global_step": 124361, "epoch": 1027} {"train_loss": -39.556793212890625, "global_step": 124362, "epoch": 1027} {"train_loss": -39.3712158203125, "global_step": 124363, "epoch": 1027} {"train_loss": -38.555721282958984, "global_step": 124364, "epoch": 1027} {"train_loss": -39.61122131347656, "global_step": 124365, "epoch": 1027} {"train_loss": -40.32008743286133, "global_step": 124366, "epoch": 1027} {"train_loss": -39.7335090637207, "global_step": 124367, "epoch": 1027} {"train_loss": -40.18032455444336, "global_step": 124368, "epoch": 1027} {"train_loss": -39.83345031738281, "global_step": 124369, "epoch": 1027} {"train_loss": -38.91718673706055, "global_step": 124370, "epoch": 1027} {"train_loss": -38.53729248046875, "global_step": 124371, "epoch": 1027} {"train_loss": -38.7398796081543, "global_step": 124372, "epoch": 1027} {"train_loss": -39.27749252319336, "global_step": 124373, "epoch": 1027} {"train_loss": -39.5322380065918, "global_step": 124374, "epoch": 1027} {"train_loss": -39.59187316894531, "global_step": 124375, "epoch": 1027} {"train_loss": -38.38117599487305, "global_step": 124376, "epoch": 1027} {"train_loss": -38.41651916503906, "global_step": 124377, "epoch": 1027} {"train_loss": -39.31026840209961, "global_step": 124378, "epoch": 1027} {"train_loss": -39.306514739990234, "global_step": 124379, "epoch": 1027} {"train_loss": -36.253395080566406, "global_step": 124380, "epoch": 1027} {"train_loss": -35.737422943115234, "global_step": 124381, "epoch": 1027} {"train_loss": -37.845001220703125, "global_step": 124382, "epoch": 1027} {"train_loss": -38.44357681274414, "global_step": 124383, "epoch": 1027} {"train_loss": -38.41286087036133, "global_step": 124384, "epoch": 1027} {"train_loss": -38.463375091552734, "global_step": 124385, "epoch": 1027} {"train_loss": -38.563011169433594, "global_step": 124386, "epoch": 1027} {"train_loss": -38.28532313512377, "global_step": 124387, "epoch": 1027, "val_loss": 2613228.25} {"train_loss": -38.79303741455078, "global_step": 124388, "epoch": 1028} {"train_loss": -39.049251556396484, "global_step": 124389, "epoch": 1028} {"train_loss": -38.55767822265625, "global_step": 124390, "epoch": 1028} {"train_loss": -38.956214904785156, "global_step": 124391, "epoch": 1028} {"train_loss": -38.93281173706055, "global_step": 124392, "epoch": 1028} {"train_loss": -38.18586349487305, "global_step": 124393, "epoch": 1028} {"train_loss": -39.31929397583008, "global_step": 124394, "epoch": 1028} {"train_loss": -38.57510757446289, "global_step": 124395, "epoch": 1028} {"train_loss": -39.414974212646484, "global_step": 124396, "epoch": 1028} {"train_loss": -39.1453857421875, "global_step": 124397, "epoch": 1028} {"train_loss": -39.332576751708984, "global_step": 124398, "epoch": 1028} {"train_loss": -39.7417106628418, "global_step": 124399, "epoch": 1028} {"train_loss": -39.375457763671875, "global_step": 124400, "epoch": 1028} {"train_loss": -39.69793701171875, "global_step": 124401, "epoch": 1028} {"train_loss": -39.770015716552734, "global_step": 124402, "epoch": 1028} {"train_loss": -38.9294319152832, "global_step": 124403, "epoch": 1028} {"train_loss": -38.98648452758789, "global_step": 124404, "epoch": 1028} {"train_loss": -39.652801513671875, "global_step": 124405, "epoch": 1028} {"train_loss": -39.9980354309082, "global_step": 124406, "epoch": 1028} {"train_loss": -39.515071868896484, "global_step": 124407, "epoch": 1028} {"train_loss": -39.8634147644043, "global_step": 124408, "epoch": 1028} {"train_loss": -40.077354431152344, "global_step": 124409, "epoch": 1028} {"train_loss": -39.916561126708984, "global_step": 124410, "epoch": 1028} {"train_loss": -39.709720611572266, "global_step": 124411, "epoch": 1028} {"train_loss": -39.28482437133789, "global_step": 124412, "epoch": 1028} {"train_loss": -39.79368209838867, "global_step": 124413, "epoch": 1028} {"train_loss": -39.39332962036133, "global_step": 124414, "epoch": 1028} {"train_loss": -39.539703369140625, "global_step": 124415, "epoch": 1028} {"train_loss": -39.80746078491211, "global_step": 124416, "epoch": 1028} {"train_loss": -39.24326705932617, "global_step": 124417, "epoch": 1028} {"train_loss": -37.143795013427734, "global_step": 124418, "epoch": 1028} {"train_loss": -38.92555618286133, "global_step": 124419, "epoch": 1028} {"train_loss": -39.54625701904297, "global_step": 124420, "epoch": 1028} {"train_loss": -38.658599853515625, "global_step": 124421, "epoch": 1028} {"train_loss": -37.55354690551758, "global_step": 124422, "epoch": 1028} {"train_loss": -37.00150680541992, "global_step": 124423, "epoch": 1028} {"train_loss": -38.872623443603516, "global_step": 124424, "epoch": 1028} {"train_loss": -38.94529342651367, "global_step": 124425, "epoch": 1028} {"train_loss": -37.25471115112305, "global_step": 124426, "epoch": 1028} {"train_loss": -38.21699523925781, "global_step": 124427, "epoch": 1028} {"train_loss": -38.63552474975586, "global_step": 124428, "epoch": 1028} {"train_loss": -37.79417037963867, "global_step": 124429, "epoch": 1028} {"train_loss": -38.29848098754883, "global_step": 124430, "epoch": 1028} {"train_loss": -38.583290100097656, "global_step": 124431, "epoch": 1028} {"train_loss": -38.54227828979492, "global_step": 124432, "epoch": 1028} {"train_loss": -37.80672836303711, "global_step": 124433, "epoch": 1028} {"train_loss": -37.50452423095703, "global_step": 124434, "epoch": 1028} {"train_loss": -39.65092086791992, "global_step": 124435, "epoch": 1028} {"train_loss": -38.29143142700195, "global_step": 124436, "epoch": 1028} {"train_loss": -39.2169303894043, "global_step": 124437, "epoch": 1028} {"train_loss": -38.47356033325195, "global_step": 124438, "epoch": 1028} {"train_loss": -36.12086868286133, "global_step": 124439, "epoch": 1028} {"train_loss": -38.66269302368164, "global_step": 124440, "epoch": 1028} {"train_loss": -38.44645309448242, "global_step": 124441, "epoch": 1028} {"train_loss": -38.748695373535156, "global_step": 124442, "epoch": 1028} {"train_loss": -39.130428314208984, "global_step": 124443, "epoch": 1028} {"train_loss": -37.41707229614258, "global_step": 124444, "epoch": 1028} {"train_loss": -38.14663314819336, "global_step": 124445, "epoch": 1028} {"train_loss": -38.54295349121094, "global_step": 124446, "epoch": 1028} {"train_loss": -34.84877395629883, "global_step": 124447, "epoch": 1028} {"train_loss": -37.34003829956055, "global_step": 124448, "epoch": 1028} {"train_loss": -38.1174430847168, "global_step": 124449, "epoch": 1028} {"train_loss": -37.40787887573242, "global_step": 124450, "epoch": 1028} {"train_loss": -38.18156814575195, "global_step": 124451, "epoch": 1028} {"train_loss": -36.754268646240234, "global_step": 124452, "epoch": 1028} {"train_loss": -36.77102279663086, "global_step": 124453, "epoch": 1028} {"train_loss": -37.449527740478516, "global_step": 124454, "epoch": 1028} {"train_loss": -37.83346939086914, "global_step": 124455, "epoch": 1028} {"train_loss": -31.38982582092285, "global_step": 124456, "epoch": 1028} {"train_loss": -37.474769592285156, "global_step": 124457, "epoch": 1028} {"train_loss": -32.597015380859375, "global_step": 124458, "epoch": 1028} {"train_loss": -34.50949478149414, "global_step": 124459, "epoch": 1028} {"train_loss": -36.29204177856445, "global_step": 124460, "epoch": 1028} {"train_loss": -36.792537689208984, "global_step": 124461, "epoch": 1028} {"train_loss": -33.507110595703125, "global_step": 124462, "epoch": 1028} {"train_loss": -26.421268463134766, "global_step": 124463, "epoch": 1028} {"train_loss": -36.634578704833984, "global_step": 124464, "epoch": 1028} {"train_loss": -36.11287307739258, "global_step": 124465, "epoch": 1028} {"train_loss": -32.528995513916016, "global_step": 124466, "epoch": 1028} {"train_loss": -34.55851364135742, "global_step": 124467, "epoch": 1028} {"train_loss": -31.312545776367188, "global_step": 124468, "epoch": 1028} {"train_loss": -35.3564338684082, "global_step": 124469, "epoch": 1028} {"train_loss": -35.001739501953125, "global_step": 124470, "epoch": 1028} {"train_loss": -35.137611389160156, "global_step": 124471, "epoch": 1028} {"train_loss": -33.90281295776367, "global_step": 124472, "epoch": 1028} {"train_loss": -28.276418685913086, "global_step": 124473, "epoch": 1028} {"train_loss": -35.4161491394043, "global_step": 124474, "epoch": 1028} {"train_loss": -29.63056755065918, "global_step": 124475, "epoch": 1028} {"train_loss": -31.91363525390625, "global_step": 124476, "epoch": 1028} {"train_loss": -36.81393814086914, "global_step": 124477, "epoch": 1028} {"train_loss": -35.374481201171875, "global_step": 124478, "epoch": 1028} {"train_loss": -34.53422546386719, "global_step": 124479, "epoch": 1028} {"train_loss": -35.66916275024414, "global_step": 124480, "epoch": 1028} {"train_loss": -36.177791595458984, "global_step": 124481, "epoch": 1028} {"train_loss": -34.29671096801758, "global_step": 124482, "epoch": 1028} {"train_loss": -33.56494903564453, "global_step": 124483, "epoch": 1028} {"train_loss": -35.63672637939453, "global_step": 124484, "epoch": 1028} {"train_loss": -33.718711853027344, "global_step": 124485, "epoch": 1028} {"train_loss": -34.921939849853516, "global_step": 124486, "epoch": 1028} {"train_loss": -33.330970764160156, "global_step": 124487, "epoch": 1028} {"train_loss": -34.040348052978516, "global_step": 124488, "epoch": 1028} {"train_loss": -35.79935836791992, "global_step": 124489, "epoch": 1028} {"train_loss": -30.9643497467041, "global_step": 124490, "epoch": 1028} {"train_loss": -35.41305160522461, "global_step": 124491, "epoch": 1028} {"train_loss": -34.42262649536133, "global_step": 124492, "epoch": 1028} {"train_loss": -36.078758239746094, "global_step": 124493, "epoch": 1028} {"train_loss": -35.81486892700195, "global_step": 124494, "epoch": 1028} {"train_loss": -36.342308044433594, "global_step": 124495, "epoch": 1028} {"train_loss": -35.6414794921875, "global_step": 124496, "epoch": 1028} {"train_loss": -35.43377685546875, "global_step": 124497, "epoch": 1028} {"train_loss": -36.009490966796875, "global_step": 124498, "epoch": 1028} {"train_loss": -36.68445587158203, "global_step": 124499, "epoch": 1028} {"train_loss": -37.023799896240234, "global_step": 124500, "epoch": 1028} {"train_loss": -36.316078186035156, "global_step": 124501, "epoch": 1028} {"train_loss": -34.83203125, "global_step": 124502, "epoch": 1028} {"train_loss": -35.008209228515625, "global_step": 124503, "epoch": 1028} {"train_loss": -33.92904281616211, "global_step": 124504, "epoch": 1028} {"train_loss": -37.29419708251953, "global_step": 124505, "epoch": 1028} {"train_loss": -34.566123962402344, "global_step": 124506, "epoch": 1028} {"train_loss": -35.5029411315918, "global_step": 124507, "epoch": 1028} {"train_loss": -36.828387835794246, "global_step": 124508, "epoch": 1028, "val_loss": 2705199.25} {"train_loss": -37.05025100708008, "global_step": 124509, "epoch": 1029} {"train_loss": -35.94270706176758, "global_step": 124510, "epoch": 1029} {"train_loss": -36.174400329589844, "global_step": 124511, "epoch": 1029} {"train_loss": -36.674503326416016, "global_step": 124512, "epoch": 1029} {"train_loss": -35.9359245300293, "global_step": 124513, "epoch": 1029} {"train_loss": -37.4774169921875, "global_step": 124514, "epoch": 1029} {"train_loss": -36.50924301147461, "global_step": 124515, "epoch": 1029} {"train_loss": -35.45100402832031, "global_step": 124516, "epoch": 1029} {"train_loss": -36.63350296020508, "global_step": 124517, "epoch": 1029} {"train_loss": -37.173030853271484, "global_step": 124518, "epoch": 1029} {"train_loss": -36.2340202331543, "global_step": 124519, "epoch": 1029} {"train_loss": -35.57380676269531, "global_step": 124520, "epoch": 1029} {"train_loss": -36.05111312866211, "global_step": 124521, "epoch": 1029} {"train_loss": -36.93313980102539, "global_step": 124522, "epoch": 1029} {"train_loss": -37.527950286865234, "global_step": 124523, "epoch": 1029} {"train_loss": -36.6709098815918, "global_step": 124524, "epoch": 1029} {"train_loss": -36.5239372253418, "global_step": 124525, "epoch": 1029} {"train_loss": -36.7160758972168, "global_step": 124526, "epoch": 1029} {"train_loss": -37.79754638671875, "global_step": 124527, "epoch": 1029} {"train_loss": -37.10745620727539, "global_step": 124528, "epoch": 1029} {"train_loss": -37.29763412475586, "global_step": 124529, "epoch": 1029} {"train_loss": -36.936248779296875, "global_step": 124530, "epoch": 1029} {"train_loss": -36.868900299072266, "global_step": 124531, "epoch": 1029} {"train_loss": -37.32859420776367, "global_step": 124532, "epoch": 1029} {"train_loss": -37.50327682495117, "global_step": 124533, "epoch": 1029} {"train_loss": -37.30205154418945, "global_step": 124534, "epoch": 1029} {"train_loss": -37.49168014526367, "global_step": 124535, "epoch": 1029} {"train_loss": -37.0900993347168, "global_step": 124536, "epoch": 1029} {"train_loss": -36.978981018066406, "global_step": 124537, "epoch": 1029} {"train_loss": -37.373836517333984, "global_step": 124538, "epoch": 1029} {"train_loss": -37.243255615234375, "global_step": 124539, "epoch": 1029} {"train_loss": -37.89616012573242, "global_step": 124540, "epoch": 1029} {"train_loss": -37.64777374267578, "global_step": 124541, "epoch": 1029} {"train_loss": -38.11670684814453, "global_step": 124542, "epoch": 1029} {"train_loss": -37.739166259765625, "global_step": 124543, "epoch": 1029} {"train_loss": -38.237152099609375, "global_step": 124544, "epoch": 1029} {"train_loss": -37.21857452392578, "global_step": 124545, "epoch": 1029} {"train_loss": -38.02997970581055, "global_step": 124546, "epoch": 1029} {"train_loss": -38.250770568847656, "global_step": 124547, "epoch": 1029} {"train_loss": -37.57300567626953, "global_step": 124548, "epoch": 1029} {"train_loss": -37.805660247802734, "global_step": 124549, "epoch": 1029} {"train_loss": -37.41183090209961, "global_step": 124550, "epoch": 1029} {"train_loss": -38.425201416015625, "global_step": 124551, "epoch": 1029} {"train_loss": -37.5588264465332, "global_step": 124552, "epoch": 1029} {"train_loss": -37.81154251098633, "global_step": 124553, "epoch": 1029} {"train_loss": -37.897010803222656, "global_step": 124554, "epoch": 1029} {"train_loss": -38.02571487426758, "global_step": 124555, "epoch": 1029} {"train_loss": -38.208404541015625, "global_step": 124556, "epoch": 1029} {"train_loss": -38.187049865722656, "global_step": 124557, "epoch": 1029} {"train_loss": -37.741058349609375, "global_step": 124558, "epoch": 1029} {"train_loss": -37.743289947509766, "global_step": 124559, "epoch": 1029} {"train_loss": -38.38877868652344, "global_step": 124560, "epoch": 1029} {"train_loss": -38.12693405151367, "global_step": 124561, "epoch": 1029} {"train_loss": -38.54331588745117, "global_step": 124562, "epoch": 1029} {"train_loss": -37.95577621459961, "global_step": 124563, "epoch": 1029} {"train_loss": -38.52825164794922, "global_step": 124564, "epoch": 1029} {"train_loss": -38.26483917236328, "global_step": 124565, "epoch": 1029} {"train_loss": -38.46255111694336, "global_step": 124566, "epoch": 1029} {"train_loss": -38.41998291015625, "global_step": 124567, "epoch": 1029} {"train_loss": -38.72891616821289, "global_step": 124568, "epoch": 1029} {"train_loss": -38.721431732177734, "global_step": 124569, "epoch": 1029} {"train_loss": -38.05475616455078, "global_step": 124570, "epoch": 1029} {"train_loss": -38.444480895996094, "global_step": 124571, "epoch": 1029} {"train_loss": -38.73109817504883, "global_step": 124572, "epoch": 1029} {"train_loss": -38.94926834106445, "global_step": 124573, "epoch": 1029} {"train_loss": -38.37390899658203, "global_step": 124574, "epoch": 1029} {"train_loss": -39.118656158447266, "global_step": 124575, "epoch": 1029} {"train_loss": -39.0137939453125, "global_step": 124576, "epoch": 1029} {"train_loss": -38.82292938232422, "global_step": 124577, "epoch": 1029} {"train_loss": -38.4560661315918, "global_step": 124578, "epoch": 1029} {"train_loss": -39.17845153808594, "global_step": 124579, "epoch": 1029} {"train_loss": -39.03942108154297, "global_step": 124580, "epoch": 1029} {"train_loss": -38.40255355834961, "global_step": 124581, "epoch": 1029} {"train_loss": -38.79173278808594, "global_step": 124582, "epoch": 1029} {"train_loss": -39.00255584716797, "global_step": 124583, "epoch": 1029} {"train_loss": -38.9383430480957, "global_step": 124584, "epoch": 1029} {"train_loss": -38.860084533691406, "global_step": 124585, "epoch": 1029} {"train_loss": -38.801605224609375, "global_step": 124586, "epoch": 1029} {"train_loss": -38.961517333984375, "global_step": 124587, "epoch": 1029} {"train_loss": -39.019657135009766, "global_step": 124588, "epoch": 1029} {"train_loss": -39.29269027709961, "global_step": 124589, "epoch": 1029} {"train_loss": -38.661529541015625, "global_step": 124590, "epoch": 1029} {"train_loss": -38.42708969116211, "global_step": 124591, "epoch": 1029} {"train_loss": -39.264564514160156, "global_step": 124592, "epoch": 1029} {"train_loss": -38.959861755371094, "global_step": 124593, "epoch": 1029} {"train_loss": -39.06116485595703, "global_step": 124594, "epoch": 1029} {"train_loss": -38.83443069458008, "global_step": 124595, "epoch": 1029} {"train_loss": -39.437835693359375, "global_step": 124596, "epoch": 1029} {"train_loss": -38.5319709777832, "global_step": 124597, "epoch": 1029} {"train_loss": -39.158843994140625, "global_step": 124598, "epoch": 1029} {"train_loss": -38.620330810546875, "global_step": 124599, "epoch": 1029} {"train_loss": -38.919342041015625, "global_step": 124600, "epoch": 1029} {"train_loss": -38.287384033203125, "global_step": 124601, "epoch": 1029} {"train_loss": -39.245059967041016, "global_step": 124602, "epoch": 1029} {"train_loss": -38.59490966796875, "global_step": 124603, "epoch": 1029} {"train_loss": -39.4713134765625, "global_step": 124604, "epoch": 1029} {"train_loss": -39.3242301940918, "global_step": 124605, "epoch": 1029} {"train_loss": -39.678340911865234, "global_step": 124606, "epoch": 1029} {"train_loss": -39.30200958251953, "global_step": 124607, "epoch": 1029} {"train_loss": -39.33402633666992, "global_step": 124608, "epoch": 1029} {"train_loss": -39.733150482177734, "global_step": 124609, "epoch": 1029} {"train_loss": -39.81560134887695, "global_step": 124610, "epoch": 1029} {"train_loss": -39.28316879272461, "global_step": 124611, "epoch": 1029} {"train_loss": -39.3576545715332, "global_step": 124612, "epoch": 1029} {"train_loss": -39.282684326171875, "global_step": 124613, "epoch": 1029} {"train_loss": -39.405792236328125, "global_step": 124614, "epoch": 1029} {"train_loss": -39.331764221191406, "global_step": 124615, "epoch": 1029} {"train_loss": -39.02470016479492, "global_step": 124616, "epoch": 1029} {"train_loss": -39.7208366394043, "global_step": 124617, "epoch": 1029} {"train_loss": -39.81928253173828, "global_step": 124618, "epoch": 1029} {"train_loss": -39.49939727783203, "global_step": 124619, "epoch": 1029} {"train_loss": -39.473079681396484, "global_step": 124620, "epoch": 1029} {"train_loss": -38.091243743896484, "global_step": 124621, "epoch": 1029} {"train_loss": -38.27593994140625, "global_step": 124622, "epoch": 1029} {"train_loss": -37.62641906738281, "global_step": 124623, "epoch": 1029} {"train_loss": -35.31779861450195, "global_step": 124624, "epoch": 1029} {"train_loss": -26.530426025390625, "global_step": 124625, "epoch": 1029} {"train_loss": -8.103792190551758, "global_step": 124626, "epoch": 1029} {"train_loss": 4.952916622161865, "global_step": 124627, "epoch": 1029} {"train_loss": -12.696098327636719, "global_step": 124628, "epoch": 1029} {"train_loss": -37.181919101841196, "global_step": 124629, "epoch": 1029, "val_loss": 2696259.75} {"train_loss": -14.89246654510498, "global_step": 124630, "epoch": 1030} {"train_loss": -33.8543586730957, "global_step": 124631, "epoch": 1030} {"train_loss": -20.70014190673828, "global_step": 124632, "epoch": 1030} {"train_loss": -34.77497863769531, "global_step": 124633, "epoch": 1030} {"train_loss": -27.651199340820312, "global_step": 124634, "epoch": 1030} {"train_loss": -35.32875442504883, "global_step": 124635, "epoch": 1030} {"train_loss": -30.806365966796875, "global_step": 124636, "epoch": 1030} {"train_loss": -31.059574127197266, "global_step": 124637, "epoch": 1030} {"train_loss": -34.75704574584961, "global_step": 124638, "epoch": 1030} {"train_loss": -33.89887237548828, "global_step": 124639, "epoch": 1030} {"train_loss": -32.682857513427734, "global_step": 124640, "epoch": 1030} {"train_loss": -32.75393295288086, "global_step": 124641, "epoch": 1030} {"train_loss": -34.64796447753906, "global_step": 124642, "epoch": 1030} {"train_loss": -33.59584426879883, "global_step": 124643, "epoch": 1030} {"train_loss": -35.15182113647461, "global_step": 124644, "epoch": 1030} {"train_loss": -35.1429557800293, "global_step": 124645, "epoch": 1030} {"train_loss": -35.88045120239258, "global_step": 124646, "epoch": 1030} {"train_loss": -35.163455963134766, "global_step": 124647, "epoch": 1030} {"train_loss": -34.81497573852539, "global_step": 124648, "epoch": 1030} {"train_loss": -36.00554656982422, "global_step": 124649, "epoch": 1030} {"train_loss": -36.82746124267578, "global_step": 124650, "epoch": 1030} {"train_loss": -36.13450241088867, "global_step": 124651, "epoch": 1030} {"train_loss": -36.000545501708984, "global_step": 124652, "epoch": 1030} {"train_loss": -36.02463912963867, "global_step": 124653, "epoch": 1030} {"train_loss": -36.516414642333984, "global_step": 124654, "epoch": 1030} {"train_loss": -37.279273986816406, "global_step": 124655, "epoch": 1030} {"train_loss": -36.959228515625, "global_step": 124656, "epoch": 1030} {"train_loss": -36.930274963378906, "global_step": 124657, "epoch": 1030} {"train_loss": -36.65536117553711, "global_step": 124658, "epoch": 1030} {"train_loss": -37.22068405151367, "global_step": 124659, "epoch": 1030} {"train_loss": -37.39421081542969, "global_step": 124660, "epoch": 1030} {"train_loss": -37.37668991088867, "global_step": 124661, "epoch": 1030} {"train_loss": -37.45554733276367, "global_step": 124662, "epoch": 1030} {"train_loss": -37.40517807006836, "global_step": 124663, "epoch": 1030} {"train_loss": -37.53561019897461, "global_step": 124664, "epoch": 1030} {"train_loss": -38.024349212646484, "global_step": 124665, "epoch": 1030} {"train_loss": -37.5654182434082, "global_step": 124666, "epoch": 1030} {"train_loss": -37.74717712402344, "global_step": 124667, "epoch": 1030} {"train_loss": -37.6960563659668, "global_step": 124668, "epoch": 1030} {"train_loss": -37.87299728393555, "global_step": 124669, "epoch": 1030} {"train_loss": -37.592124938964844, "global_step": 124670, "epoch": 1030} {"train_loss": -37.58815002441406, "global_step": 124671, "epoch": 1030} {"train_loss": -37.94587707519531, "global_step": 124672, "epoch": 1030} {"train_loss": -38.16117477416992, "global_step": 124673, "epoch": 1030} {"train_loss": -37.861053466796875, "global_step": 124674, "epoch": 1030} {"train_loss": -38.158870697021484, "global_step": 124675, "epoch": 1030} {"train_loss": -38.225643157958984, "global_step": 124676, "epoch": 1030} {"train_loss": -38.504791259765625, "global_step": 124677, "epoch": 1030} {"train_loss": -38.28214645385742, "global_step": 124678, "epoch": 1030} {"train_loss": -38.3340950012207, "global_step": 124679, "epoch": 1030} {"train_loss": -38.32954788208008, "global_step": 124680, "epoch": 1030} {"train_loss": -38.46438217163086, "global_step": 124681, "epoch": 1030} {"train_loss": -38.181114196777344, "global_step": 124682, "epoch": 1030} {"train_loss": -38.50715255737305, "global_step": 124683, "epoch": 1030} {"train_loss": -38.436641693115234, "global_step": 124684, "epoch": 1030} {"train_loss": -38.52570724487305, "global_step": 124685, "epoch": 1030} {"train_loss": -38.394386291503906, "global_step": 124686, "epoch": 1030} {"train_loss": -37.844322204589844, "global_step": 124687, "epoch": 1030} {"train_loss": -38.26957321166992, "global_step": 124688, "epoch": 1030} {"train_loss": -38.65658187866211, "global_step": 124689, "epoch": 1030} {"train_loss": -39.197750091552734, "global_step": 124690, "epoch": 1030} {"train_loss": -38.597938537597656, "global_step": 124691, "epoch": 1030} {"train_loss": -38.83749008178711, "global_step": 124692, "epoch": 1030} {"train_loss": -38.9952507019043, "global_step": 124693, "epoch": 1030} {"train_loss": -39.0534782409668, "global_step": 124694, "epoch": 1030} {"train_loss": -38.365108489990234, "global_step": 124695, "epoch": 1030} {"train_loss": -39.03861618041992, "global_step": 124696, "epoch": 1030} {"train_loss": -39.31999588012695, "global_step": 124697, "epoch": 1030} {"train_loss": -38.89064025878906, "global_step": 124698, "epoch": 1030} {"train_loss": -38.957801818847656, "global_step": 124699, "epoch": 1030} {"train_loss": -38.8702507019043, "global_step": 124700, "epoch": 1030} {"train_loss": -39.14936447143555, "global_step": 124701, "epoch": 1030} {"train_loss": -39.06455612182617, "global_step": 124702, "epoch": 1030} {"train_loss": -39.254207611083984, "global_step": 124703, "epoch": 1030} {"train_loss": -39.25240707397461, "global_step": 124704, "epoch": 1030} {"train_loss": -39.07670974731445, "global_step": 124705, "epoch": 1030} {"train_loss": -39.63627243041992, "global_step": 124706, "epoch": 1030} {"train_loss": -39.37321472167969, "global_step": 124707, "epoch": 1030} {"train_loss": -39.38447189331055, "global_step": 124708, "epoch": 1030} {"train_loss": -39.21950912475586, "global_step": 124709, "epoch": 1030} {"train_loss": -39.47419357299805, "global_step": 124710, "epoch": 1030} {"train_loss": -39.37640380859375, "global_step": 124711, "epoch": 1030} {"train_loss": -39.39888000488281, "global_step": 124712, "epoch": 1030} {"train_loss": -39.65988540649414, "global_step": 124713, "epoch": 1030} {"train_loss": -39.50010299682617, "global_step": 124714, "epoch": 1030} {"train_loss": -39.47798156738281, "global_step": 124715, "epoch": 1030} {"train_loss": -39.758140563964844, "global_step": 124716, "epoch": 1030} {"train_loss": -39.024993896484375, "global_step": 124717, "epoch": 1030} {"train_loss": -39.823299407958984, "global_step": 124718, "epoch": 1030} {"train_loss": -39.28923416137695, "global_step": 124719, "epoch": 1030} {"train_loss": -39.658931732177734, "global_step": 124720, "epoch": 1030} {"train_loss": -39.47833251953125, "global_step": 124721, "epoch": 1030} {"train_loss": -39.35051345825195, "global_step": 124722, "epoch": 1030} {"train_loss": -39.80949783325195, "global_step": 124723, "epoch": 1030} {"train_loss": -40.098876953125, "global_step": 124724, "epoch": 1030} {"train_loss": -39.78939437866211, "global_step": 124725, "epoch": 1030} {"train_loss": -39.727333068847656, "global_step": 124726, "epoch": 1030} {"train_loss": -39.97825241088867, "global_step": 124727, "epoch": 1030} {"train_loss": -39.90510940551758, "global_step": 124728, "epoch": 1030} {"train_loss": -39.51853561401367, "global_step": 124729, "epoch": 1030} {"train_loss": -39.1695442199707, "global_step": 124730, "epoch": 1030} {"train_loss": -39.28682327270508, "global_step": 124731, "epoch": 1030} {"train_loss": -38.87498474121094, "global_step": 124732, "epoch": 1030} {"train_loss": -39.8409423828125, "global_step": 124733, "epoch": 1030} {"train_loss": -39.76848220825195, "global_step": 124734, "epoch": 1030} {"train_loss": -39.45540237426758, "global_step": 124735, "epoch": 1030} {"train_loss": -38.282527923583984, "global_step": 124736, "epoch": 1030} {"train_loss": -38.39192581176758, "global_step": 124737, "epoch": 1030} {"train_loss": -37.966094970703125, "global_step": 124738, "epoch": 1030} {"train_loss": -38.83626174926758, "global_step": 124739, "epoch": 1030} {"train_loss": -39.595985412597656, "global_step": 124740, "epoch": 1030} {"train_loss": -39.278289794921875, "global_step": 124741, "epoch": 1030} {"train_loss": -39.24264144897461, "global_step": 124742, "epoch": 1030} {"train_loss": -37.11570358276367, "global_step": 124743, "epoch": 1030} {"train_loss": -31.797910690307617, "global_step": 124744, "epoch": 1030} {"train_loss": -31.94452476501465, "global_step": 124745, "epoch": 1030} {"train_loss": -35.51520538330078, "global_step": 124746, "epoch": 1030} {"train_loss": -39.04445266723633, "global_step": 124747, "epoch": 1030} {"train_loss": -35.9951286315918, "global_step": 124748, "epoch": 1030} {"train_loss": -36.202491760253906, "global_step": 124749, "epoch": 1030} {"train_loss": -37.33766785140865, "global_step": 124750, "epoch": 1030, "val_loss": 2660289.75} {"train_loss": -38.03985595703125, "global_step": 124751, "epoch": 1031} {"train_loss": -37.10984420776367, "global_step": 124752, "epoch": 1031} {"train_loss": -39.478878021240234, "global_step": 124753, "epoch": 1031} {"train_loss": -37.04325866699219, "global_step": 124754, "epoch": 1031} {"train_loss": -38.487060546875, "global_step": 124755, "epoch": 1031} {"train_loss": -38.404632568359375, "global_step": 124756, "epoch": 1031} {"train_loss": -38.135555267333984, "global_step": 124757, "epoch": 1031} {"train_loss": -38.92951202392578, "global_step": 124758, "epoch": 1031} {"train_loss": -37.45204162597656, "global_step": 124759, "epoch": 1031} {"train_loss": -38.79560470581055, "global_step": 124760, "epoch": 1031} {"train_loss": -38.484683990478516, "global_step": 124761, "epoch": 1031} {"train_loss": -39.16853713989258, "global_step": 124762, "epoch": 1031} {"train_loss": -38.0827522277832, "global_step": 124763, "epoch": 1031} {"train_loss": -37.53622055053711, "global_step": 124764, "epoch": 1031} {"train_loss": -38.14900207519531, "global_step": 124765, "epoch": 1031} {"train_loss": -39.44404983520508, "global_step": 124766, "epoch": 1031} {"train_loss": -39.10418701171875, "global_step": 124767, "epoch": 1031} {"train_loss": -37.93624496459961, "global_step": 124768, "epoch": 1031} {"train_loss": -38.531795501708984, "global_step": 124769, "epoch": 1031} {"train_loss": -38.8134765625, "global_step": 124770, "epoch": 1031} {"train_loss": -38.94922637939453, "global_step": 124771, "epoch": 1031} {"train_loss": -39.04121780395508, "global_step": 124772, "epoch": 1031} {"train_loss": -38.46638107299805, "global_step": 124773, "epoch": 1031} {"train_loss": -39.23907470703125, "global_step": 124774, "epoch": 1031} {"train_loss": -38.20203399658203, "global_step": 124775, "epoch": 1031} {"train_loss": -38.08028793334961, "global_step": 124776, "epoch": 1031} {"train_loss": -38.380516052246094, "global_step": 124777, "epoch": 1031} {"train_loss": -37.96100997924805, "global_step": 124778, "epoch": 1031} {"train_loss": -38.89837646484375, "global_step": 124779, "epoch": 1031} {"train_loss": -39.500892639160156, "global_step": 124780, "epoch": 1031} {"train_loss": -38.842376708984375, "global_step": 124781, "epoch": 1031} {"train_loss": -39.18711471557617, "global_step": 124782, "epoch": 1031} {"train_loss": -39.53852462768555, "global_step": 124783, "epoch": 1031} {"train_loss": -38.0157585144043, "global_step": 124784, "epoch": 1031} {"train_loss": -38.698211669921875, "global_step": 124785, "epoch": 1031} {"train_loss": -39.22736358642578, "global_step": 124786, "epoch": 1031} {"train_loss": -39.16273880004883, "global_step": 124787, "epoch": 1031} {"train_loss": -39.5457878112793, "global_step": 124788, "epoch": 1031} {"train_loss": -39.051727294921875, "global_step": 124789, "epoch": 1031} {"train_loss": -39.16107940673828, "global_step": 124790, "epoch": 1031} {"train_loss": -39.165283203125, "global_step": 124791, "epoch": 1031} {"train_loss": -39.16400909423828, "global_step": 124792, "epoch": 1031} {"train_loss": -39.672393798828125, "global_step": 124793, "epoch": 1031} {"train_loss": -39.500789642333984, "global_step": 124794, "epoch": 1031} {"train_loss": -38.94914627075195, "global_step": 124795, "epoch": 1031} {"train_loss": -39.555702209472656, "global_step": 124796, "epoch": 1031} {"train_loss": -39.52120590209961, "global_step": 124797, "epoch": 1031} {"train_loss": -38.25041580200195, "global_step": 124798, "epoch": 1031} {"train_loss": -39.446563720703125, "global_step": 124799, "epoch": 1031} {"train_loss": -39.6470832824707, "global_step": 124800, "epoch": 1031} {"train_loss": -39.3381233215332, "global_step": 124801, "epoch": 1031} {"train_loss": -39.28894805908203, "global_step": 124802, "epoch": 1031} {"train_loss": -39.45156478881836, "global_step": 124803, "epoch": 1031} {"train_loss": -39.27239990234375, "global_step": 124804, "epoch": 1031} {"train_loss": -39.1107292175293, "global_step": 124805, "epoch": 1031} {"train_loss": -37.79415512084961, "global_step": 124806, "epoch": 1031} {"train_loss": -39.10322952270508, "global_step": 124807, "epoch": 1031} {"train_loss": -38.400665283203125, "global_step": 124808, "epoch": 1031} {"train_loss": -39.602203369140625, "global_step": 124809, "epoch": 1031} {"train_loss": -38.96095275878906, "global_step": 124810, "epoch": 1031} {"train_loss": -38.370384216308594, "global_step": 124811, "epoch": 1031} {"train_loss": -39.451385498046875, "global_step": 124812, "epoch": 1031} {"train_loss": -36.73427200317383, "global_step": 124813, "epoch": 1031} {"train_loss": -38.1705436706543, "global_step": 124814, "epoch": 1031} {"train_loss": -38.32961654663086, "global_step": 124815, "epoch": 1031} {"train_loss": -38.431514739990234, "global_step": 124816, "epoch": 1031} {"train_loss": -38.9259147644043, "global_step": 124817, "epoch": 1031} {"train_loss": -37.187801361083984, "global_step": 124818, "epoch": 1031} {"train_loss": -38.31655502319336, "global_step": 124819, "epoch": 1031} {"train_loss": -38.0297966003418, "global_step": 124820, "epoch": 1031} {"train_loss": -38.26408386230469, "global_step": 124821, "epoch": 1031} {"train_loss": -38.85624694824219, "global_step": 124822, "epoch": 1031} {"train_loss": -37.9219970703125, "global_step": 124823, "epoch": 1031} {"train_loss": -38.4123420715332, "global_step": 124824, "epoch": 1031} {"train_loss": -38.80754470825195, "global_step": 124825, "epoch": 1031} {"train_loss": -37.684783935546875, "global_step": 124826, "epoch": 1031} {"train_loss": -38.08264923095703, "global_step": 124827, "epoch": 1031} {"train_loss": -36.99055099487305, "global_step": 124828, "epoch": 1031} {"train_loss": -38.433197021484375, "global_step": 124829, "epoch": 1031} {"train_loss": -38.144161224365234, "global_step": 124830, "epoch": 1031} {"train_loss": -38.62747573852539, "global_step": 124831, "epoch": 1031} {"train_loss": -38.438716888427734, "global_step": 124832, "epoch": 1031} {"train_loss": -37.85419845581055, "global_step": 124833, "epoch": 1031} {"train_loss": -37.8513298034668, "global_step": 124834, "epoch": 1031} {"train_loss": -38.74202346801758, "global_step": 124835, "epoch": 1031} {"train_loss": -37.68271255493164, "global_step": 124836, "epoch": 1031} {"train_loss": -38.506202697753906, "global_step": 124837, "epoch": 1031} {"train_loss": -38.52265167236328, "global_step": 124838, "epoch": 1031} {"train_loss": -37.958274841308594, "global_step": 124839, "epoch": 1031} {"train_loss": -39.21376419067383, "global_step": 124840, "epoch": 1031} {"train_loss": -36.860450744628906, "global_step": 124841, "epoch": 1031} {"train_loss": -37.65843200683594, "global_step": 124842, "epoch": 1031} {"train_loss": -39.06243133544922, "global_step": 124843, "epoch": 1031} {"train_loss": -38.22600173950195, "global_step": 124844, "epoch": 1031} {"train_loss": -38.073326110839844, "global_step": 124845, "epoch": 1031} {"train_loss": -38.94707107543945, "global_step": 124846, "epoch": 1031} {"train_loss": -37.836971282958984, "global_step": 124847, "epoch": 1031} {"train_loss": -38.18818664550781, "global_step": 124848, "epoch": 1031} {"train_loss": -37.88981246948242, "global_step": 124849, "epoch": 1031} {"train_loss": -37.74261474609375, "global_step": 124850, "epoch": 1031} {"train_loss": -38.296844482421875, "global_step": 124851, "epoch": 1031} {"train_loss": -38.55178451538086, "global_step": 124852, "epoch": 1031} {"train_loss": -37.638160705566406, "global_step": 124853, "epoch": 1031} {"train_loss": -38.43576431274414, "global_step": 124854, "epoch": 1031} {"train_loss": -38.28817367553711, "global_step": 124855, "epoch": 1031} {"train_loss": -38.86886215209961, "global_step": 124856, "epoch": 1031} {"train_loss": -38.6610221862793, "global_step": 124857, "epoch": 1031} {"train_loss": -39.0903434753418, "global_step": 124858, "epoch": 1031} {"train_loss": -38.86550521850586, "global_step": 124859, "epoch": 1031} {"train_loss": -38.76552963256836, "global_step": 124860, "epoch": 1031} {"train_loss": -38.657318115234375, "global_step": 124861, "epoch": 1031} {"train_loss": -38.91535186767578, "global_step": 124862, "epoch": 1031} {"train_loss": -39.15293502807617, "global_step": 124863, "epoch": 1031} {"train_loss": -39.6171760559082, "global_step": 124864, "epoch": 1031} {"train_loss": -39.25912094116211, "global_step": 124865, "epoch": 1031} {"train_loss": -38.96151351928711, "global_step": 124866, "epoch": 1031} {"train_loss": -38.9647331237793, "global_step": 124867, "epoch": 1031} {"train_loss": -39.293487548828125, "global_step": 124868, "epoch": 1031} {"train_loss": -38.9320068359375, "global_step": 124869, "epoch": 1031} {"train_loss": -38.80990219116211, "global_step": 124870, "epoch": 1031} {"train_loss": -38.58998814102047, "global_step": 124871, "epoch": 1031, "val_loss": 2659359.75} {"train_loss": -39.28052520751953, "global_step": 124872, "epoch": 1032} {"train_loss": -39.706119537353516, "global_step": 124873, "epoch": 1032} {"train_loss": -38.85392761230469, "global_step": 124874, "epoch": 1032} {"train_loss": -39.09755325317383, "global_step": 124875, "epoch": 1032} {"train_loss": -39.48200607299805, "global_step": 124876, "epoch": 1032} {"train_loss": -39.97613525390625, "global_step": 124877, "epoch": 1032} {"train_loss": -39.742488861083984, "global_step": 124878, "epoch": 1032} {"train_loss": -39.29569625854492, "global_step": 124879, "epoch": 1032} {"train_loss": -39.15797805786133, "global_step": 124880, "epoch": 1032} {"train_loss": -39.190460205078125, "global_step": 124881, "epoch": 1032} {"train_loss": -38.805843353271484, "global_step": 124882, "epoch": 1032} {"train_loss": -39.538936614990234, "global_step": 124883, "epoch": 1032} {"train_loss": -39.5754280090332, "global_step": 124884, "epoch": 1032} {"train_loss": -39.638648986816406, "global_step": 124885, "epoch": 1032} {"train_loss": -39.681243896484375, "global_step": 124886, "epoch": 1032} {"train_loss": -39.296756744384766, "global_step": 124887, "epoch": 1032} {"train_loss": -38.46096420288086, "global_step": 124888, "epoch": 1032} {"train_loss": -39.478023529052734, "global_step": 124889, "epoch": 1032} {"train_loss": -39.9909782409668, "global_step": 124890, "epoch": 1032} {"train_loss": -39.72523880004883, "global_step": 124891, "epoch": 1032} {"train_loss": -39.16804885864258, "global_step": 124892, "epoch": 1032} {"train_loss": -39.82959747314453, "global_step": 124893, "epoch": 1032} {"train_loss": -39.37910842895508, "global_step": 124894, "epoch": 1032} {"train_loss": -39.256649017333984, "global_step": 124895, "epoch": 1032} {"train_loss": -40.099822998046875, "global_step": 124896, "epoch": 1032} {"train_loss": -40.078285217285156, "global_step": 124897, "epoch": 1032} {"train_loss": -40.034427642822266, "global_step": 124898, "epoch": 1032} {"train_loss": -40.20798110961914, "global_step": 124899, "epoch": 1032} {"train_loss": -40.181636810302734, "global_step": 124900, "epoch": 1032} {"train_loss": -39.82474899291992, "global_step": 124901, "epoch": 1032} {"train_loss": -39.707740783691406, "global_step": 124902, "epoch": 1032} {"train_loss": -40.16444396972656, "global_step": 124903, "epoch": 1032} {"train_loss": -38.66691207885742, "global_step": 124904, "epoch": 1032} {"train_loss": -39.531890869140625, "global_step": 124905, "epoch": 1032} {"train_loss": -40.251312255859375, "global_step": 124906, "epoch": 1032} {"train_loss": -40.555938720703125, "global_step": 124907, "epoch": 1032} {"train_loss": -39.67136764526367, "global_step": 124908, "epoch": 1032} {"train_loss": -39.4220085144043, "global_step": 124909, "epoch": 1032} {"train_loss": -40.43168258666992, "global_step": 124910, "epoch": 1032} {"train_loss": -39.7642707824707, "global_step": 124911, "epoch": 1032} {"train_loss": -39.355411529541016, "global_step": 124912, "epoch": 1032} {"train_loss": -38.528568267822266, "global_step": 124913, "epoch": 1032} {"train_loss": -39.9650993347168, "global_step": 124914, "epoch": 1032} {"train_loss": -40.02427291870117, "global_step": 124915, "epoch": 1032} {"train_loss": -39.328609466552734, "global_step": 124916, "epoch": 1032} {"train_loss": -39.79816436767578, "global_step": 124917, "epoch": 1032} {"train_loss": -39.5842170715332, "global_step": 124918, "epoch": 1032} {"train_loss": -39.40119171142578, "global_step": 124919, "epoch": 1032} {"train_loss": -38.55921173095703, "global_step": 124920, "epoch": 1032} {"train_loss": -39.45270538330078, "global_step": 124921, "epoch": 1032} {"train_loss": -39.836219787597656, "global_step": 124922, "epoch": 1032} {"train_loss": -38.99507522583008, "global_step": 124923, "epoch": 1032} {"train_loss": -39.092689514160156, "global_step": 124924, "epoch": 1032} {"train_loss": -40.45561218261719, "global_step": 124925, "epoch": 1032} {"train_loss": -39.41107940673828, "global_step": 124926, "epoch": 1032} {"train_loss": -36.874298095703125, "global_step": 124927, "epoch": 1032} {"train_loss": -39.009178161621094, "global_step": 124928, "epoch": 1032} {"train_loss": -39.74063491821289, "global_step": 124929, "epoch": 1032} {"train_loss": -38.6325798034668, "global_step": 124930, "epoch": 1032} {"train_loss": -39.069156646728516, "global_step": 124931, "epoch": 1032} {"train_loss": -40.4200325012207, "global_step": 124932, "epoch": 1032} {"train_loss": -38.31059646606445, "global_step": 124933, "epoch": 1032} {"train_loss": -38.301025390625, "global_step": 124934, "epoch": 1032} {"train_loss": -38.492916107177734, "global_step": 124935, "epoch": 1032} {"train_loss": -39.141273498535156, "global_step": 124936, "epoch": 1032} {"train_loss": -39.08020782470703, "global_step": 124937, "epoch": 1032} {"train_loss": -37.89922332763672, "global_step": 124938, "epoch": 1032} {"train_loss": -39.61177444458008, "global_step": 124939, "epoch": 1032} {"train_loss": -39.33643341064453, "global_step": 124940, "epoch": 1032} {"train_loss": -39.516334533691406, "global_step": 124941, "epoch": 1032} {"train_loss": -39.1178092956543, "global_step": 124942, "epoch": 1032} {"train_loss": -39.25359344482422, "global_step": 124943, "epoch": 1032} {"train_loss": -38.2367057800293, "global_step": 124944, "epoch": 1032} {"train_loss": -39.927772521972656, "global_step": 124945, "epoch": 1032} {"train_loss": -38.583553314208984, "global_step": 124946, "epoch": 1032} {"train_loss": -39.59603500366211, "global_step": 124947, "epoch": 1032} {"train_loss": -39.51837921142578, "global_step": 124948, "epoch": 1032} {"train_loss": -39.46673583984375, "global_step": 124949, "epoch": 1032} {"train_loss": -40.11202621459961, "global_step": 124950, "epoch": 1032} {"train_loss": -39.81843185424805, "global_step": 124951, "epoch": 1032} {"train_loss": -39.49635696411133, "global_step": 124952, "epoch": 1032} {"train_loss": -40.22236633300781, "global_step": 124953, "epoch": 1032} {"train_loss": -39.8479118347168, "global_step": 124954, "epoch": 1032} {"train_loss": -39.49253463745117, "global_step": 124955, "epoch": 1032} {"train_loss": -39.408447265625, "global_step": 124956, "epoch": 1032} {"train_loss": -40.17041778564453, "global_step": 124957, "epoch": 1032} {"train_loss": -39.51278305053711, "global_step": 124958, "epoch": 1032} {"train_loss": -40.062957763671875, "global_step": 124959, "epoch": 1032} {"train_loss": -38.42742919921875, "global_step": 124960, "epoch": 1032} {"train_loss": -38.10404586791992, "global_step": 124961, "epoch": 1032} {"train_loss": -39.77363204956055, "global_step": 124962, "epoch": 1032} {"train_loss": -40.04861068725586, "global_step": 124963, "epoch": 1032} {"train_loss": -39.9567756652832, "global_step": 124964, "epoch": 1032} {"train_loss": -39.93778610229492, "global_step": 124965, "epoch": 1032} {"train_loss": -38.34383773803711, "global_step": 124966, "epoch": 1032} {"train_loss": -39.5285530090332, "global_step": 124967, "epoch": 1032} {"train_loss": -39.36490249633789, "global_step": 124968, "epoch": 1032} {"train_loss": -39.59104537963867, "global_step": 124969, "epoch": 1032} {"train_loss": -39.58778762817383, "global_step": 124970, "epoch": 1032} {"train_loss": -39.3153190612793, "global_step": 124971, "epoch": 1032} {"train_loss": -35.480804443359375, "global_step": 124972, "epoch": 1032} {"train_loss": -39.22138214111328, "global_step": 124973, "epoch": 1032} {"train_loss": -36.782814025878906, "global_step": 124974, "epoch": 1032} {"train_loss": -37.30587387084961, "global_step": 124975, "epoch": 1032} {"train_loss": -39.68839645385742, "global_step": 124976, "epoch": 1032} {"train_loss": -38.78867721557617, "global_step": 124977, "epoch": 1032} {"train_loss": -38.76756286621094, "global_step": 124978, "epoch": 1032} {"train_loss": -38.443634033203125, "global_step": 124979, "epoch": 1032} {"train_loss": -37.65863800048828, "global_step": 124980, "epoch": 1032} {"train_loss": -38.442344665527344, "global_step": 124981, "epoch": 1032} {"train_loss": -38.53858947753906, "global_step": 124982, "epoch": 1032} {"train_loss": -38.96743392944336, "global_step": 124983, "epoch": 1032} {"train_loss": -36.62410354614258, "global_step": 124984, "epoch": 1032} {"train_loss": -39.05817794799805, "global_step": 124985, "epoch": 1032} {"train_loss": -35.692806243896484, "global_step": 124986, "epoch": 1032} {"train_loss": -36.15624237060547, "global_step": 124987, "epoch": 1032} {"train_loss": -37.271583557128906, "global_step": 124988, "epoch": 1032} {"train_loss": -38.98804473876953, "global_step": 124989, "epoch": 1032} {"train_loss": -37.64432907104492, "global_step": 124990, "epoch": 1032} {"train_loss": -38.012359619140625, "global_step": 124991, "epoch": 1032} {"train_loss": -39.14202950217507, "global_step": 124992, "epoch": 1032, "val_loss": 2825289.0} {"train_loss": -37.415130615234375, "global_step": 124993, "epoch": 1033} {"train_loss": -34.79949188232422, "global_step": 124994, "epoch": 1033} {"train_loss": -36.71840286254883, "global_step": 124995, "epoch": 1033} {"train_loss": -37.4122200012207, "global_step": 124996, "epoch": 1033} {"train_loss": -36.77256393432617, "global_step": 124997, "epoch": 1033} {"train_loss": -36.30670928955078, "global_step": 124998, "epoch": 1033} {"train_loss": -34.86262893676758, "global_step": 124999, "epoch": 1033} {"train_loss": -36.094966888427734, "global_step": 125000, "epoch": 1033} {"train_loss": -32.804561614990234, "global_step": 125001, "epoch": 1033} {"train_loss": -33.870269775390625, "global_step": 125002, "epoch": 1033} {"train_loss": -35.90139389038086, "global_step": 125003, "epoch": 1033} {"train_loss": -35.623260498046875, "global_step": 125004, "epoch": 1033} {"train_loss": -33.986297607421875, "global_step": 125005, "epoch": 1033} {"train_loss": -35.3854866027832, "global_step": 125006, "epoch": 1033} {"train_loss": -35.329193115234375, "global_step": 125007, "epoch": 1033} {"train_loss": -30.78791618347168, "global_step": 125008, "epoch": 1033} {"train_loss": -35.076271057128906, "global_step": 125009, "epoch": 1033} {"train_loss": -33.889984130859375, "global_step": 125010, "epoch": 1033} {"train_loss": -34.26721954345703, "global_step": 125011, "epoch": 1033} {"train_loss": -33.871334075927734, "global_step": 125012, "epoch": 1033} {"train_loss": -34.192012786865234, "global_step": 125013, "epoch": 1033} {"train_loss": -35.995540618896484, "global_step": 125014, "epoch": 1033} {"train_loss": -34.121856689453125, "global_step": 125015, "epoch": 1033} {"train_loss": -36.21560287475586, "global_step": 125016, "epoch": 1033} {"train_loss": -33.05817794799805, "global_step": 125017, "epoch": 1033} {"train_loss": -37.39777755737305, "global_step": 125018, "epoch": 1033} {"train_loss": -37.2532844543457, "global_step": 125019, "epoch": 1033} {"train_loss": -35.15568923950195, "global_step": 125020, "epoch": 1033} {"train_loss": -35.86457061767578, "global_step": 125021, "epoch": 1033} {"train_loss": -35.423095703125, "global_step": 125022, "epoch": 1033} {"train_loss": -36.107582092285156, "global_step": 125023, "epoch": 1033} {"train_loss": -36.43151092529297, "global_step": 125024, "epoch": 1033} {"train_loss": -37.1850471496582, "global_step": 125025, "epoch": 1033} {"train_loss": -36.46902084350586, "global_step": 125026, "epoch": 1033} {"train_loss": -37.395442962646484, "global_step": 125027, "epoch": 1033} {"train_loss": -36.353736877441406, "global_step": 125028, "epoch": 1033} {"train_loss": -37.19062805175781, "global_step": 125029, "epoch": 1033} {"train_loss": -37.29104232788086, "global_step": 125030, "epoch": 1033} {"train_loss": -35.8645133972168, "global_step": 125031, "epoch": 1033} {"train_loss": -37.933876037597656, "global_step": 125032, "epoch": 1033} {"train_loss": -37.582489013671875, "global_step": 125033, "epoch": 1033} {"train_loss": -35.65877914428711, "global_step": 125034, "epoch": 1033} {"train_loss": -37.7520751953125, "global_step": 125035, "epoch": 1033} {"train_loss": -36.5260124206543, "global_step": 125036, "epoch": 1033} {"train_loss": -37.03951644897461, "global_step": 125037, "epoch": 1033} {"train_loss": -38.007652282714844, "global_step": 125038, "epoch": 1033} {"train_loss": -38.058380126953125, "global_step": 125039, "epoch": 1033} {"train_loss": -37.452392578125, "global_step": 125040, "epoch": 1033} {"train_loss": -37.6051025390625, "global_step": 125041, "epoch": 1033} {"train_loss": -36.82172393798828, "global_step": 125042, "epoch": 1033} {"train_loss": -36.09661102294922, "global_step": 125043, "epoch": 1033} {"train_loss": -38.33955001831055, "global_step": 125044, "epoch": 1033} {"train_loss": -37.62268829345703, "global_step": 125045, "epoch": 1033} {"train_loss": -37.419124603271484, "global_step": 125046, "epoch": 1033} {"train_loss": -37.64760971069336, "global_step": 125047, "epoch": 1033} {"train_loss": -37.78060531616211, "global_step": 125048, "epoch": 1033} {"train_loss": -38.43247604370117, "global_step": 125049, "epoch": 1033} {"train_loss": -38.27410125732422, "global_step": 125050, "epoch": 1033} {"train_loss": -38.19562911987305, "global_step": 125051, "epoch": 1033} {"train_loss": -38.540283203125, "global_step": 125052, "epoch": 1033} {"train_loss": -38.469879150390625, "global_step": 125053, "epoch": 1033} {"train_loss": -38.36825180053711, "global_step": 125054, "epoch": 1033} {"train_loss": -38.48023223876953, "global_step": 125055, "epoch": 1033} {"train_loss": -37.81110382080078, "global_step": 125056, "epoch": 1033} {"train_loss": -38.66579055786133, "global_step": 125057, "epoch": 1033} {"train_loss": -38.76987838745117, "global_step": 125058, "epoch": 1033} {"train_loss": -37.11931228637695, "global_step": 125059, "epoch": 1033} {"train_loss": -38.371639251708984, "global_step": 125060, "epoch": 1033} {"train_loss": -38.543514251708984, "global_step": 125061, "epoch": 1033} {"train_loss": -38.52081298828125, "global_step": 125062, "epoch": 1033} {"train_loss": -38.64364242553711, "global_step": 125063, "epoch": 1033} {"train_loss": -38.79252243041992, "global_step": 125064, "epoch": 1033} {"train_loss": -38.815914154052734, "global_step": 125065, "epoch": 1033} {"train_loss": -38.4820556640625, "global_step": 125066, "epoch": 1033} {"train_loss": -38.8172607421875, "global_step": 125067, "epoch": 1033} {"train_loss": -38.99742126464844, "global_step": 125068, "epoch": 1033} {"train_loss": -37.991554260253906, "global_step": 125069, "epoch": 1033} {"train_loss": -39.13064193725586, "global_step": 125070, "epoch": 1033} {"train_loss": -38.358917236328125, "global_step": 125071, "epoch": 1033} {"train_loss": -39.05964660644531, "global_step": 125072, "epoch": 1033} {"train_loss": -37.06205368041992, "global_step": 125073, "epoch": 1033} {"train_loss": -39.3292236328125, "global_step": 125074, "epoch": 1033} {"train_loss": -38.952999114990234, "global_step": 125075, "epoch": 1033} {"train_loss": -38.93549728393555, "global_step": 125076, "epoch": 1033} {"train_loss": -38.94140625, "global_step": 125077, "epoch": 1033} {"train_loss": -39.08209991455078, "global_step": 125078, "epoch": 1033} {"train_loss": -38.79767608642578, "global_step": 125079, "epoch": 1033} {"train_loss": -38.936397552490234, "global_step": 125080, "epoch": 1033} {"train_loss": -38.60783767700195, "global_step": 125081, "epoch": 1033} {"train_loss": -37.90085983276367, "global_step": 125082, "epoch": 1033} {"train_loss": -39.36857223510742, "global_step": 125083, "epoch": 1033} {"train_loss": -39.406768798828125, "global_step": 125084, "epoch": 1033} {"train_loss": -39.119625091552734, "global_step": 125085, "epoch": 1033} {"train_loss": -38.5500373840332, "global_step": 125086, "epoch": 1033} {"train_loss": -39.0512580871582, "global_step": 125087, "epoch": 1033} {"train_loss": -39.209049224853516, "global_step": 125088, "epoch": 1033} {"train_loss": -39.736412048339844, "global_step": 125089, "epoch": 1033} {"train_loss": -38.8119010925293, "global_step": 125090, "epoch": 1033} {"train_loss": -39.3891716003418, "global_step": 125091, "epoch": 1033} {"train_loss": -38.879127502441406, "global_step": 125092, "epoch": 1033} {"train_loss": -39.2878303527832, "global_step": 125093, "epoch": 1033} {"train_loss": -38.59834671020508, "global_step": 125094, "epoch": 1033} {"train_loss": -38.916683197021484, "global_step": 125095, "epoch": 1033} {"train_loss": -39.414520263671875, "global_step": 125096, "epoch": 1033} {"train_loss": -39.0029411315918, "global_step": 125097, "epoch": 1033} {"train_loss": -39.23176956176758, "global_step": 125098, "epoch": 1033} {"train_loss": -39.62449264526367, "global_step": 125099, "epoch": 1033} {"train_loss": -38.850704193115234, "global_step": 125100, "epoch": 1033} {"train_loss": -39.323848724365234, "global_step": 125101, "epoch": 1033} {"train_loss": -38.17466354370117, "global_step": 125102, "epoch": 1033} {"train_loss": -39.3677978515625, "global_step": 125103, "epoch": 1033} {"train_loss": -38.75415802001953, "global_step": 125104, "epoch": 1033} {"train_loss": -39.393150329589844, "global_step": 125105, "epoch": 1033} {"train_loss": -38.925025939941406, "global_step": 125106, "epoch": 1033} {"train_loss": -39.57167434692383, "global_step": 125107, "epoch": 1033} {"train_loss": -39.8131217956543, "global_step": 125108, "epoch": 1033} {"train_loss": -39.718135833740234, "global_step": 125109, "epoch": 1033} {"train_loss": -39.556766510009766, "global_step": 125110, "epoch": 1033} {"train_loss": -38.67595291137695, "global_step": 125111, "epoch": 1033} {"train_loss": -39.14836120605469, "global_step": 125112, "epoch": 1033} {"train_loss": -37.57312978003636, "global_step": 125113, "epoch": 1033, "val_loss": 2679687.25} {"train_loss": -39.75019454956055, "global_step": 125114, "epoch": 1034} {"train_loss": -39.447357177734375, "global_step": 125115, "epoch": 1034} {"train_loss": -39.897212982177734, "global_step": 125116, "epoch": 1034} {"train_loss": -37.94365310668945, "global_step": 125117, "epoch": 1034} {"train_loss": -38.24458694458008, "global_step": 125118, "epoch": 1034} {"train_loss": -39.13508224487305, "global_step": 125119, "epoch": 1034} {"train_loss": -38.56635665893555, "global_step": 125120, "epoch": 1034} {"train_loss": -38.10200881958008, "global_step": 125121, "epoch": 1034} {"train_loss": -38.84902572631836, "global_step": 125122, "epoch": 1034} {"train_loss": -36.42679214477539, "global_step": 125123, "epoch": 1034} {"train_loss": -31.734655380249023, "global_step": 125124, "epoch": 1034} {"train_loss": -24.13614273071289, "global_step": 125125, "epoch": 1034} {"train_loss": 2.24419903755188, "global_step": 125126, "epoch": 1034} {"train_loss": 26.382970809936523, "global_step": 125127, "epoch": 1034} {"train_loss": -19.545183181762695, "global_step": 125128, "epoch": 1034} {"train_loss": -20.285184860229492, "global_step": 125129, "epoch": 1034} {"train_loss": -18.216684341430664, "global_step": 125130, "epoch": 1034} {"train_loss": -24.050928115844727, "global_step": 125131, "epoch": 1034} {"train_loss": -28.688308715820312, "global_step": 125132, "epoch": 1034} {"train_loss": -22.45647621154785, "global_step": 125133, "epoch": 1034} {"train_loss": -35.9617805480957, "global_step": 125134, "epoch": 1034} {"train_loss": -28.845788955688477, "global_step": 125135, "epoch": 1034} {"train_loss": -28.13821792602539, "global_step": 125136, "epoch": 1034} {"train_loss": -36.015071868896484, "global_step": 125137, "epoch": 1034} {"train_loss": -33.04475402832031, "global_step": 125138, "epoch": 1034} {"train_loss": -31.48719596862793, "global_step": 125139, "epoch": 1034} {"train_loss": -34.35679244995117, "global_step": 125140, "epoch": 1034} {"train_loss": -36.9341926574707, "global_step": 125141, "epoch": 1034} {"train_loss": -35.01828384399414, "global_step": 125142, "epoch": 1034} {"train_loss": -33.88751220703125, "global_step": 125143, "epoch": 1034} {"train_loss": -35.6200065612793, "global_step": 125144, "epoch": 1034} {"train_loss": -36.064090728759766, "global_step": 125145, "epoch": 1034} {"train_loss": -35.921051025390625, "global_step": 125146, "epoch": 1034} {"train_loss": -35.63774490356445, "global_step": 125147, "epoch": 1034} {"train_loss": -36.009803771972656, "global_step": 125148, "epoch": 1034} {"train_loss": -35.897682189941406, "global_step": 125149, "epoch": 1034} {"train_loss": -37.02390670776367, "global_step": 125150, "epoch": 1034} {"train_loss": -36.504859924316406, "global_step": 125151, "epoch": 1034} {"train_loss": -36.94517135620117, "global_step": 125152, "epoch": 1034} {"train_loss": -36.61979293823242, "global_step": 125153, "epoch": 1034} {"train_loss": -36.83180618286133, "global_step": 125154, "epoch": 1034} {"train_loss": -37.520240783691406, "global_step": 125155, "epoch": 1034} {"train_loss": -37.49085235595703, "global_step": 125156, "epoch": 1034} {"train_loss": -37.0098876953125, "global_step": 125157, "epoch": 1034} {"train_loss": -37.60633087158203, "global_step": 125158, "epoch": 1034} {"train_loss": -37.34515380859375, "global_step": 125159, "epoch": 1034} {"train_loss": -37.43464279174805, "global_step": 125160, "epoch": 1034} {"train_loss": -37.579803466796875, "global_step": 125161, "epoch": 1034} {"train_loss": -37.75931167602539, "global_step": 125162, "epoch": 1034} {"train_loss": -37.4721794128418, "global_step": 125163, "epoch": 1034} {"train_loss": -37.911930084228516, "global_step": 125164, "epoch": 1034} {"train_loss": -37.73382568359375, "global_step": 125165, "epoch": 1034} {"train_loss": -37.91783905029297, "global_step": 125166, "epoch": 1034} {"train_loss": -38.10654830932617, "global_step": 125167, "epoch": 1034} {"train_loss": -37.538021087646484, "global_step": 125168, "epoch": 1034} {"train_loss": -38.00649642944336, "global_step": 125169, "epoch": 1034} {"train_loss": -37.8917236328125, "global_step": 125170, "epoch": 1034} {"train_loss": -37.74421310424805, "global_step": 125171, "epoch": 1034} {"train_loss": -37.80707931518555, "global_step": 125172, "epoch": 1034} {"train_loss": -38.08697509765625, "global_step": 125173, "epoch": 1034} {"train_loss": -38.29341125488281, "global_step": 125174, "epoch": 1034} {"train_loss": -38.0627326965332, "global_step": 125175, "epoch": 1034} {"train_loss": -38.471981048583984, "global_step": 125176, "epoch": 1034} {"train_loss": -38.05035400390625, "global_step": 125177, "epoch": 1034} {"train_loss": -38.39837646484375, "global_step": 125178, "epoch": 1034} {"train_loss": -37.916194915771484, "global_step": 125179, "epoch": 1034} {"train_loss": -38.60304260253906, "global_step": 125180, "epoch": 1034} {"train_loss": -38.596412658691406, "global_step": 125181, "epoch": 1034} {"train_loss": -38.735233306884766, "global_step": 125182, "epoch": 1034} {"train_loss": -38.44330596923828, "global_step": 125183, "epoch": 1034} {"train_loss": -38.3061408996582, "global_step": 125184, "epoch": 1034} {"train_loss": -38.46479034423828, "global_step": 125185, "epoch": 1034} {"train_loss": -38.69650650024414, "global_step": 125186, "epoch": 1034} {"train_loss": -38.481807708740234, "global_step": 125187, "epoch": 1034} {"train_loss": -38.70829391479492, "global_step": 125188, "epoch": 1034} {"train_loss": -38.908451080322266, "global_step": 125189, "epoch": 1034} {"train_loss": -38.624969482421875, "global_step": 125190, "epoch": 1034} {"train_loss": -38.18758010864258, "global_step": 125191, "epoch": 1034} {"train_loss": -39.044639587402344, "global_step": 125192, "epoch": 1034} {"train_loss": -38.508697509765625, "global_step": 125193, "epoch": 1034} {"train_loss": -39.23313522338867, "global_step": 125194, "epoch": 1034} {"train_loss": -39.09218215942383, "global_step": 125195, "epoch": 1034} {"train_loss": -38.8684196472168, "global_step": 125196, "epoch": 1034} {"train_loss": -38.89279556274414, "global_step": 125197, "epoch": 1034} {"train_loss": -39.28718948364258, "global_step": 125198, "epoch": 1034} {"train_loss": -38.94296646118164, "global_step": 125199, "epoch": 1034} {"train_loss": -39.2828483581543, "global_step": 125200, "epoch": 1034} {"train_loss": -39.365047454833984, "global_step": 125201, "epoch": 1034} {"train_loss": -39.43007278442383, "global_step": 125202, "epoch": 1034} {"train_loss": -38.756160736083984, "global_step": 125203, "epoch": 1034} {"train_loss": -39.266334533691406, "global_step": 125204, "epoch": 1034} {"train_loss": -39.341697692871094, "global_step": 125205, "epoch": 1034} {"train_loss": -39.22874450683594, "global_step": 125206, "epoch": 1034} {"train_loss": -39.34613037109375, "global_step": 125207, "epoch": 1034} {"train_loss": -38.339595794677734, "global_step": 125208, "epoch": 1034} {"train_loss": -39.102943420410156, "global_step": 125209, "epoch": 1034} {"train_loss": -39.6103515625, "global_step": 125210, "epoch": 1034} {"train_loss": -39.65306854248047, "global_step": 125211, "epoch": 1034} {"train_loss": -39.303951263427734, "global_step": 125212, "epoch": 1034} {"train_loss": -39.4664192199707, "global_step": 125213, "epoch": 1034} {"train_loss": -39.105682373046875, "global_step": 125214, "epoch": 1034} {"train_loss": -39.668067932128906, "global_step": 125215, "epoch": 1034} {"train_loss": -38.80854415893555, "global_step": 125216, "epoch": 1034} {"train_loss": -38.87928771972656, "global_step": 125217, "epoch": 1034} {"train_loss": -39.61444854736328, "global_step": 125218, "epoch": 1034} {"train_loss": -39.19386672973633, "global_step": 125219, "epoch": 1034} {"train_loss": -39.40937423706055, "global_step": 125220, "epoch": 1034} {"train_loss": -39.389320373535156, "global_step": 125221, "epoch": 1034} {"train_loss": -39.576210021972656, "global_step": 125222, "epoch": 1034} {"train_loss": -39.75104904174805, "global_step": 125223, "epoch": 1034} {"train_loss": -39.514366149902344, "global_step": 125224, "epoch": 1034} {"train_loss": -39.766075134277344, "global_step": 125225, "epoch": 1034} {"train_loss": -39.87092971801758, "global_step": 125226, "epoch": 1034} {"train_loss": -39.488929748535156, "global_step": 125227, "epoch": 1034} {"train_loss": -39.70711135864258, "global_step": 125228, "epoch": 1034} {"train_loss": -39.8306770324707, "global_step": 125229, "epoch": 1034} {"train_loss": -39.38992691040039, "global_step": 125230, "epoch": 1034} {"train_loss": -39.884979248046875, "global_step": 125231, "epoch": 1034} {"train_loss": -39.969627380371094, "global_step": 125232, "epoch": 1034} {"train_loss": -40.009437561035156, "global_step": 125233, "epoch": 1034} {"train_loss": -36.195635147331174, "global_step": 125234, "epoch": 1034, "val_loss": 2691850.75} {"train_loss": -40.0053596496582, "global_step": 125235, "epoch": 1035} {"train_loss": -39.646934509277344, "global_step": 125236, "epoch": 1035} {"train_loss": -40.179298400878906, "global_step": 125237, "epoch": 1035} {"train_loss": -39.81661605834961, "global_step": 125238, "epoch": 1035} {"train_loss": -39.773582458496094, "global_step": 125239, "epoch": 1035} {"train_loss": -39.85893249511719, "global_step": 125240, "epoch": 1035} {"train_loss": -39.891510009765625, "global_step": 125241, "epoch": 1035} {"train_loss": -40.21302032470703, "global_step": 125242, "epoch": 1035} {"train_loss": -39.903987884521484, "global_step": 125243, "epoch": 1035} {"train_loss": -39.94389724731445, "global_step": 125244, "epoch": 1035} {"train_loss": -40.19499588012695, "global_step": 125245, "epoch": 1035} {"train_loss": -40.07642364501953, "global_step": 125246, "epoch": 1035} {"train_loss": -40.15913391113281, "global_step": 125247, "epoch": 1035} {"train_loss": -40.21328353881836, "global_step": 125248, "epoch": 1035} {"train_loss": -40.1001091003418, "global_step": 125249, "epoch": 1035} {"train_loss": -40.08380889892578, "global_step": 125250, "epoch": 1035} {"train_loss": -39.9691162109375, "global_step": 125251, "epoch": 1035} {"train_loss": -39.829708099365234, "global_step": 125252, "epoch": 1035} {"train_loss": -40.349334716796875, "global_step": 125253, "epoch": 1035} {"train_loss": -40.0207633972168, "global_step": 125254, "epoch": 1035} {"train_loss": -39.09644317626953, "global_step": 125255, "epoch": 1035} {"train_loss": -40.25237274169922, "global_step": 125256, "epoch": 1035} {"train_loss": -40.334083557128906, "global_step": 125257, "epoch": 1035} {"train_loss": -39.914215087890625, "global_step": 125258, "epoch": 1035} {"train_loss": -39.32828903198242, "global_step": 125259, "epoch": 1035} {"train_loss": -39.6746940612793, "global_step": 125260, "epoch": 1035} {"train_loss": -40.108619689941406, "global_step": 125261, "epoch": 1035} {"train_loss": -39.96065139770508, "global_step": 125262, "epoch": 1035} {"train_loss": -39.774925231933594, "global_step": 125263, "epoch": 1035} {"train_loss": -39.80843734741211, "global_step": 125264, "epoch": 1035} {"train_loss": -37.45347213745117, "global_step": 125265, "epoch": 1035} {"train_loss": -38.69306182861328, "global_step": 125266, "epoch": 1035} {"train_loss": -37.55942916870117, "global_step": 125267, "epoch": 1035} {"train_loss": -37.15483093261719, "global_step": 125268, "epoch": 1035} {"train_loss": -36.74562454223633, "global_step": 125269, "epoch": 1035} {"train_loss": -38.57294464111328, "global_step": 125270, "epoch": 1035} {"train_loss": -39.50838088989258, "global_step": 125271, "epoch": 1035} {"train_loss": -37.67329788208008, "global_step": 125272, "epoch": 1035} {"train_loss": -36.150634765625, "global_step": 125273, "epoch": 1035} {"train_loss": -38.652774810791016, "global_step": 125274, "epoch": 1035} {"train_loss": -39.26142501831055, "global_step": 125275, "epoch": 1035} {"train_loss": -38.493194580078125, "global_step": 125276, "epoch": 1035} {"train_loss": -38.24445724487305, "global_step": 125277, "epoch": 1035} {"train_loss": -38.6319694519043, "global_step": 125278, "epoch": 1035} {"train_loss": -38.998741149902344, "global_step": 125279, "epoch": 1035} {"train_loss": -33.608272552490234, "global_step": 125280, "epoch": 1035} {"train_loss": -38.09589767456055, "global_step": 125281, "epoch": 1035} {"train_loss": -38.70271301269531, "global_step": 125282, "epoch": 1035} {"train_loss": -38.810604095458984, "global_step": 125283, "epoch": 1035} {"train_loss": -37.250728607177734, "global_step": 125284, "epoch": 1035} {"train_loss": -39.041072845458984, "global_step": 125285, "epoch": 1035} {"train_loss": -38.279109954833984, "global_step": 125286, "epoch": 1035} {"train_loss": -38.29055404663086, "global_step": 125287, "epoch": 1035} {"train_loss": -39.069210052490234, "global_step": 125288, "epoch": 1035} {"train_loss": -38.80819320678711, "global_step": 125289, "epoch": 1035} {"train_loss": -38.320682525634766, "global_step": 125290, "epoch": 1035} {"train_loss": -38.51178741455078, "global_step": 125291, "epoch": 1035} {"train_loss": -38.112388610839844, "global_step": 125292, "epoch": 1035} {"train_loss": -38.80778121948242, "global_step": 125293, "epoch": 1035} {"train_loss": -37.522254943847656, "global_step": 125294, "epoch": 1035} {"train_loss": -37.853973388671875, "global_step": 125295, "epoch": 1035} {"train_loss": -38.60368728637695, "global_step": 125296, "epoch": 1035} {"train_loss": -38.903743743896484, "global_step": 125297, "epoch": 1035} {"train_loss": -38.09792709350586, "global_step": 125298, "epoch": 1035} {"train_loss": -31.36817741394043, "global_step": 125299, "epoch": 1035} {"train_loss": -38.735164642333984, "global_step": 125300, "epoch": 1035} {"train_loss": -35.920257568359375, "global_step": 125301, "epoch": 1035} {"train_loss": -37.82282257080078, "global_step": 125302, "epoch": 1035} {"train_loss": -38.424049377441406, "global_step": 125303, "epoch": 1035} {"train_loss": -38.022361755371094, "global_step": 125304, "epoch": 1035} {"train_loss": -38.15494918823242, "global_step": 125305, "epoch": 1035} {"train_loss": -36.018733978271484, "global_step": 125306, "epoch": 1035} {"train_loss": -38.39076614379883, "global_step": 125307, "epoch": 1035} {"train_loss": -36.149627685546875, "global_step": 125308, "epoch": 1035} {"train_loss": -37.233943939208984, "global_step": 125309, "epoch": 1035} {"train_loss": -20.428009033203125, "global_step": 125310, "epoch": 1035} {"train_loss": -36.980079650878906, "global_step": 125311, "epoch": 1035} {"train_loss": -36.976890563964844, "global_step": 125312, "epoch": 1035} {"train_loss": -35.99371337890625, "global_step": 125313, "epoch": 1035} {"train_loss": -38.26051330566406, "global_step": 125314, "epoch": 1035} {"train_loss": -37.05622482299805, "global_step": 125315, "epoch": 1035} {"train_loss": -34.52128982543945, "global_step": 125316, "epoch": 1035} {"train_loss": -35.31083297729492, "global_step": 125317, "epoch": 1035} {"train_loss": -37.242244720458984, "global_step": 125318, "epoch": 1035} {"train_loss": -34.455989837646484, "global_step": 125319, "epoch": 1035} {"train_loss": -37.91575241088867, "global_step": 125320, "epoch": 1035} {"train_loss": -32.70731735229492, "global_step": 125321, "epoch": 1035} {"train_loss": -38.028717041015625, "global_step": 125322, "epoch": 1035} {"train_loss": -35.79508972167969, "global_step": 125323, "epoch": 1035} {"train_loss": -36.33449935913086, "global_step": 125324, "epoch": 1035} {"train_loss": -36.95827102661133, "global_step": 125325, "epoch": 1035} {"train_loss": -35.9011344909668, "global_step": 125326, "epoch": 1035} {"train_loss": -37.28800582885742, "global_step": 125327, "epoch": 1035} {"train_loss": -38.14794921875, "global_step": 125328, "epoch": 1035} {"train_loss": -36.02376937866211, "global_step": 125329, "epoch": 1035} {"train_loss": -37.50899887084961, "global_step": 125330, "epoch": 1035} {"train_loss": -37.4801025390625, "global_step": 125331, "epoch": 1035} {"train_loss": -36.95028305053711, "global_step": 125332, "epoch": 1035} {"train_loss": -37.347930908203125, "global_step": 125333, "epoch": 1035} {"train_loss": -37.93147277832031, "global_step": 125334, "epoch": 1035} {"train_loss": -38.57490158081055, "global_step": 125335, "epoch": 1035} {"train_loss": -38.42816162109375, "global_step": 125336, "epoch": 1035} {"train_loss": -35.26314926147461, "global_step": 125337, "epoch": 1035} {"train_loss": -37.044673919677734, "global_step": 125338, "epoch": 1035} {"train_loss": -37.677913665771484, "global_step": 125339, "epoch": 1035} {"train_loss": -38.67273712158203, "global_step": 125340, "epoch": 1035} {"train_loss": -38.878662109375, "global_step": 125341, "epoch": 1035} {"train_loss": -37.6697883605957, "global_step": 125342, "epoch": 1035} {"train_loss": -37.658939361572266, "global_step": 125343, "epoch": 1035} {"train_loss": -38.4149284362793, "global_step": 125344, "epoch": 1035} {"train_loss": -38.94434356689453, "global_step": 125345, "epoch": 1035} {"train_loss": -37.340511322021484, "global_step": 125346, "epoch": 1035} {"train_loss": -37.69741439819336, "global_step": 125347, "epoch": 1035} {"train_loss": -36.9243049621582, "global_step": 125348, "epoch": 1035} {"train_loss": -37.67470932006836, "global_step": 125349, "epoch": 1035} {"train_loss": -35.36166000366211, "global_step": 125350, "epoch": 1035} {"train_loss": -38.634368896484375, "global_step": 125351, "epoch": 1035} {"train_loss": -38.366031646728516, "global_step": 125352, "epoch": 1035} {"train_loss": -38.53388214111328, "global_step": 125353, "epoch": 1035} {"train_loss": -38.513851165771484, "global_step": 125354, "epoch": 1035} {"train_loss": -37.97693559946107, "global_step": 125355, "epoch": 1035, "val_loss": 2681725.0} {"train_loss": -38.10285568237305, "global_step": 125356, "epoch": 1036} {"train_loss": -38.800140380859375, "global_step": 125357, "epoch": 1036} {"train_loss": -38.93187713623047, "global_step": 125358, "epoch": 1036} {"train_loss": -38.67425537109375, "global_step": 125359, "epoch": 1036} {"train_loss": -37.42814254760742, "global_step": 125360, "epoch": 1036} {"train_loss": -38.94364929199219, "global_step": 125361, "epoch": 1036} {"train_loss": -39.13636779785156, "global_step": 125362, "epoch": 1036} {"train_loss": -38.5830192565918, "global_step": 125363, "epoch": 1036} {"train_loss": -38.724239349365234, "global_step": 125364, "epoch": 1036} {"train_loss": -38.89365768432617, "global_step": 125365, "epoch": 1036} {"train_loss": -38.885684967041016, "global_step": 125366, "epoch": 1036} {"train_loss": -39.106651306152344, "global_step": 125367, "epoch": 1036} {"train_loss": -38.779781341552734, "global_step": 125368, "epoch": 1036} {"train_loss": -38.46875, "global_step": 125369, "epoch": 1036} {"train_loss": -38.7849235534668, "global_step": 125370, "epoch": 1036} {"train_loss": -39.170841217041016, "global_step": 125371, "epoch": 1036} {"train_loss": -38.72274398803711, "global_step": 125372, "epoch": 1036} {"train_loss": -39.19036865234375, "global_step": 125373, "epoch": 1036} {"train_loss": -38.8901481628418, "global_step": 125374, "epoch": 1036} {"train_loss": -38.318763732910156, "global_step": 125375, "epoch": 1036} {"train_loss": -39.371131896972656, "global_step": 125376, "epoch": 1036} {"train_loss": -38.69452667236328, "global_step": 125377, "epoch": 1036} {"train_loss": -39.39752960205078, "global_step": 125378, "epoch": 1036} {"train_loss": -39.20724868774414, "global_step": 125379, "epoch": 1036} {"train_loss": -39.116336822509766, "global_step": 125380, "epoch": 1036} {"train_loss": -37.262733459472656, "global_step": 125381, "epoch": 1036} {"train_loss": -38.107940673828125, "global_step": 125382, "epoch": 1036} {"train_loss": -37.789974212646484, "global_step": 125383, "epoch": 1036} {"train_loss": -38.440101623535156, "global_step": 125384, "epoch": 1036} {"train_loss": -38.2655143737793, "global_step": 125385, "epoch": 1036} {"train_loss": -38.2774658203125, "global_step": 125386, "epoch": 1036} {"train_loss": -38.99102783203125, "global_step": 125387, "epoch": 1036} {"train_loss": -38.686790466308594, "global_step": 125388, "epoch": 1036} {"train_loss": -38.4680290222168, "global_step": 125389, "epoch": 1036} {"train_loss": -27.82492446899414, "global_step": 125390, "epoch": 1036} {"train_loss": -37.70037841796875, "global_step": 125391, "epoch": 1036} {"train_loss": -36.30632019042969, "global_step": 125392, "epoch": 1036} {"train_loss": -28.90479850769043, "global_step": 125393, "epoch": 1036} {"train_loss": -35.78246307373047, "global_step": 125394, "epoch": 1036} {"train_loss": -36.289161682128906, "global_step": 125395, "epoch": 1036} {"train_loss": -37.79861068725586, "global_step": 125396, "epoch": 1036} {"train_loss": -35.495845794677734, "global_step": 125397, "epoch": 1036} {"train_loss": -37.315277099609375, "global_step": 125398, "epoch": 1036} {"train_loss": -38.15298080444336, "global_step": 125399, "epoch": 1036} {"train_loss": -31.080902099609375, "global_step": 125400, "epoch": 1036} {"train_loss": -36.790950775146484, "global_step": 125401, "epoch": 1036} {"train_loss": -36.35859298706055, "global_step": 125402, "epoch": 1036} {"train_loss": -35.564552307128906, "global_step": 125403, "epoch": 1036} {"train_loss": -37.92707443237305, "global_step": 125404, "epoch": 1036} {"train_loss": -38.626644134521484, "global_step": 125405, "epoch": 1036} {"train_loss": -37.85506820678711, "global_step": 125406, "epoch": 1036} {"train_loss": -37.51319122314453, "global_step": 125407, "epoch": 1036} {"train_loss": -37.738525390625, "global_step": 125408, "epoch": 1036} {"train_loss": -37.95688247680664, "global_step": 125409, "epoch": 1036} {"train_loss": -38.0110969543457, "global_step": 125410, "epoch": 1036} {"train_loss": -37.730892181396484, "global_step": 125411, "epoch": 1036} {"train_loss": -36.91450500488281, "global_step": 125412, "epoch": 1036} {"train_loss": -37.67127227783203, "global_step": 125413, "epoch": 1036} {"train_loss": -38.03833770751953, "global_step": 125414, "epoch": 1036} {"train_loss": -37.478572845458984, "global_step": 125415, "epoch": 1036} {"train_loss": -38.74932861328125, "global_step": 125416, "epoch": 1036} {"train_loss": -38.286678314208984, "global_step": 125417, "epoch": 1036} {"train_loss": -38.54983139038086, "global_step": 125418, "epoch": 1036} {"train_loss": -38.468170166015625, "global_step": 125419, "epoch": 1036} {"train_loss": -38.9083366394043, "global_step": 125420, "epoch": 1036} {"train_loss": -38.61420822143555, "global_step": 125421, "epoch": 1036} {"train_loss": -37.583839416503906, "global_step": 125422, "epoch": 1036} {"train_loss": -38.800838470458984, "global_step": 125423, "epoch": 1036} {"train_loss": -37.912353515625, "global_step": 125424, "epoch": 1036} {"train_loss": -37.43675231933594, "global_step": 125425, "epoch": 1036} {"train_loss": -34.06880569458008, "global_step": 125426, "epoch": 1036} {"train_loss": -37.79787063598633, "global_step": 125427, "epoch": 1036} {"train_loss": -38.367488861083984, "global_step": 125428, "epoch": 1036} {"train_loss": -38.282527923583984, "global_step": 125429, "epoch": 1036} {"train_loss": -37.70730209350586, "global_step": 125430, "epoch": 1036} {"train_loss": -37.27155685424805, "global_step": 125431, "epoch": 1036} {"train_loss": -36.41327667236328, "global_step": 125432, "epoch": 1036} {"train_loss": -37.93037033081055, "global_step": 125433, "epoch": 1036} {"train_loss": -37.69636535644531, "global_step": 125434, "epoch": 1036} {"train_loss": -38.26066207885742, "global_step": 125435, "epoch": 1036} {"train_loss": -38.383052825927734, "global_step": 125436, "epoch": 1036} {"train_loss": -38.147361755371094, "global_step": 125437, "epoch": 1036} {"train_loss": -38.12668991088867, "global_step": 125438, "epoch": 1036} {"train_loss": -39.095855712890625, "global_step": 125439, "epoch": 1036} {"train_loss": -37.592952728271484, "global_step": 125440, "epoch": 1036} {"train_loss": -36.79408264160156, "global_step": 125441, "epoch": 1036} {"train_loss": -39.303409576416016, "global_step": 125442, "epoch": 1036} {"train_loss": -38.196929931640625, "global_step": 125443, "epoch": 1036} {"train_loss": -38.359169006347656, "global_step": 125444, "epoch": 1036} {"train_loss": -37.57503890991211, "global_step": 125445, "epoch": 1036} {"train_loss": -38.35209274291992, "global_step": 125446, "epoch": 1036} {"train_loss": -39.16843032836914, "global_step": 125447, "epoch": 1036} {"train_loss": -38.36113739013672, "global_step": 125448, "epoch": 1036} {"train_loss": -38.90386962890625, "global_step": 125449, "epoch": 1036} {"train_loss": -38.62691116333008, "global_step": 125450, "epoch": 1036} {"train_loss": -39.1982307434082, "global_step": 125451, "epoch": 1036} {"train_loss": -37.835853576660156, "global_step": 125452, "epoch": 1036} {"train_loss": -39.47133255004883, "global_step": 125453, "epoch": 1036} {"train_loss": -39.40254211425781, "global_step": 125454, "epoch": 1036} {"train_loss": -38.637882232666016, "global_step": 125455, "epoch": 1036} {"train_loss": -39.02082061767578, "global_step": 125456, "epoch": 1036} {"train_loss": -39.44809341430664, "global_step": 125457, "epoch": 1036} {"train_loss": -39.3641242980957, "global_step": 125458, "epoch": 1036} {"train_loss": -39.10433578491211, "global_step": 125459, "epoch": 1036} {"train_loss": -39.097007751464844, "global_step": 125460, "epoch": 1036} {"train_loss": -38.855064392089844, "global_step": 125461, "epoch": 1036} {"train_loss": -39.26021957397461, "global_step": 125462, "epoch": 1036} {"train_loss": -39.363800048828125, "global_step": 125463, "epoch": 1036} {"train_loss": -39.0497932434082, "global_step": 125464, "epoch": 1036} {"train_loss": -39.73820114135742, "global_step": 125465, "epoch": 1036} {"train_loss": -38.952964782714844, "global_step": 125466, "epoch": 1036} {"train_loss": -39.36415481567383, "global_step": 125467, "epoch": 1036} {"train_loss": -38.86295700073242, "global_step": 125468, "epoch": 1036} {"train_loss": -38.898834228515625, "global_step": 125469, "epoch": 1036} {"train_loss": -39.107757568359375, "global_step": 125470, "epoch": 1036} {"train_loss": -39.381507873535156, "global_step": 125471, "epoch": 1036} {"train_loss": -38.84688186645508, "global_step": 125472, "epoch": 1036} {"train_loss": -39.41517639160156, "global_step": 125473, "epoch": 1036} {"train_loss": -39.1578254699707, "global_step": 125474, "epoch": 1036} {"train_loss": -39.539772033691406, "global_step": 125475, "epoch": 1036} {"train_loss": -38.095201050939636, "global_step": 125476, "epoch": 1036, "val_loss": 2715783.25} {"train_loss": -39.12641525268555, "global_step": 125477, "epoch": 1037} {"train_loss": -38.98167037963867, "global_step": 125478, "epoch": 1037} {"train_loss": -39.286163330078125, "global_step": 125479, "epoch": 1037} {"train_loss": -38.80842971801758, "global_step": 125480, "epoch": 1037} {"train_loss": -39.647857666015625, "global_step": 125481, "epoch": 1037} {"train_loss": -39.512298583984375, "global_step": 125482, "epoch": 1037} {"train_loss": -38.57131576538086, "global_step": 125483, "epoch": 1037} {"train_loss": -39.50185775756836, "global_step": 125484, "epoch": 1037} {"train_loss": -39.19875717163086, "global_step": 125485, "epoch": 1037} {"train_loss": -39.87639617919922, "global_step": 125486, "epoch": 1037} {"train_loss": -39.51277160644531, "global_step": 125487, "epoch": 1037} {"train_loss": -38.817386627197266, "global_step": 125488, "epoch": 1037} {"train_loss": -39.25590896606445, "global_step": 125489, "epoch": 1037} {"train_loss": -38.71224594116211, "global_step": 125490, "epoch": 1037} {"train_loss": -39.63880920410156, "global_step": 125491, "epoch": 1037} {"train_loss": -39.11101150512695, "global_step": 125492, "epoch": 1037} {"train_loss": -36.74325180053711, "global_step": 125493, "epoch": 1037} {"train_loss": -39.59115982055664, "global_step": 125494, "epoch": 1037} {"train_loss": -38.63764190673828, "global_step": 125495, "epoch": 1037} {"train_loss": -37.94527053833008, "global_step": 125496, "epoch": 1037} {"train_loss": -36.15842056274414, "global_step": 125497, "epoch": 1037} {"train_loss": -35.62897491455078, "global_step": 125498, "epoch": 1037} {"train_loss": -36.835060119628906, "global_step": 125499, "epoch": 1037} {"train_loss": -38.31631088256836, "global_step": 125500, "epoch": 1037} {"train_loss": -39.553138732910156, "global_step": 125501, "epoch": 1037} {"train_loss": -37.58319854736328, "global_step": 125502, "epoch": 1037} {"train_loss": -38.768890380859375, "global_step": 125503, "epoch": 1037} {"train_loss": -38.780879974365234, "global_step": 125504, "epoch": 1037} {"train_loss": -38.679893493652344, "global_step": 125505, "epoch": 1037} {"train_loss": -37.937068939208984, "global_step": 125506, "epoch": 1037} {"train_loss": -39.44541549682617, "global_step": 125507, "epoch": 1037} {"train_loss": -38.12525177001953, "global_step": 125508, "epoch": 1037} {"train_loss": -37.432594299316406, "global_step": 125509, "epoch": 1037} {"train_loss": -38.09077072143555, "global_step": 125510, "epoch": 1037} {"train_loss": -39.336238861083984, "global_step": 125511, "epoch": 1037} {"train_loss": -38.63054275512695, "global_step": 125512, "epoch": 1037} {"train_loss": -38.48377227783203, "global_step": 125513, "epoch": 1037} {"train_loss": -39.20395278930664, "global_step": 125514, "epoch": 1037} {"train_loss": -39.364593505859375, "global_step": 125515, "epoch": 1037} {"train_loss": -39.64140701293945, "global_step": 125516, "epoch": 1037} {"train_loss": -38.83349609375, "global_step": 125517, "epoch": 1037} {"train_loss": -38.95425796508789, "global_step": 125518, "epoch": 1037} {"train_loss": -38.98057556152344, "global_step": 125519, "epoch": 1037} {"train_loss": -39.11769485473633, "global_step": 125520, "epoch": 1037} {"train_loss": -39.51442337036133, "global_step": 125521, "epoch": 1037} {"train_loss": -39.14665985107422, "global_step": 125522, "epoch": 1037} {"train_loss": -39.52132034301758, "global_step": 125523, "epoch": 1037} {"train_loss": -39.011409759521484, "global_step": 125524, "epoch": 1037} {"train_loss": -39.330360412597656, "global_step": 125525, "epoch": 1037} {"train_loss": -39.53137969970703, "global_step": 125526, "epoch": 1037} {"train_loss": -39.28578567504883, "global_step": 125527, "epoch": 1037} {"train_loss": -39.95426559448242, "global_step": 125528, "epoch": 1037} {"train_loss": -39.4959602355957, "global_step": 125529, "epoch": 1037} {"train_loss": -39.77299118041992, "global_step": 125530, "epoch": 1037} {"train_loss": -39.78278350830078, "global_step": 125531, "epoch": 1037} {"train_loss": -39.91080093383789, "global_step": 125532, "epoch": 1037} {"train_loss": -38.67824935913086, "global_step": 125533, "epoch": 1037} {"train_loss": -38.3632926940918, "global_step": 125534, "epoch": 1037} {"train_loss": -39.2746696472168, "global_step": 125535, "epoch": 1037} {"train_loss": -39.83626937866211, "global_step": 125536, "epoch": 1037} {"train_loss": -39.87751007080078, "global_step": 125537, "epoch": 1037} {"train_loss": -39.9788932800293, "global_step": 125538, "epoch": 1037} {"train_loss": -39.20824432373047, "global_step": 125539, "epoch": 1037} {"train_loss": -39.23319625854492, "global_step": 125540, "epoch": 1037} {"train_loss": -39.785701751708984, "global_step": 125541, "epoch": 1037} {"train_loss": -40.30050277709961, "global_step": 125542, "epoch": 1037} {"train_loss": -40.00838088989258, "global_step": 125543, "epoch": 1037} {"train_loss": -39.77946853637695, "global_step": 125544, "epoch": 1037} {"train_loss": -40.35663986206055, "global_step": 125545, "epoch": 1037} {"train_loss": -40.05196762084961, "global_step": 125546, "epoch": 1037} {"train_loss": -39.500396728515625, "global_step": 125547, "epoch": 1037} {"train_loss": -39.87798309326172, "global_step": 125548, "epoch": 1037} {"train_loss": -38.119354248046875, "global_step": 125549, "epoch": 1037} {"train_loss": -36.88713455200195, "global_step": 125550, "epoch": 1037} {"train_loss": -37.517086029052734, "global_step": 125551, "epoch": 1037} {"train_loss": -37.69131088256836, "global_step": 125552, "epoch": 1037} {"train_loss": -38.963645935058594, "global_step": 125553, "epoch": 1037} {"train_loss": -39.69723129272461, "global_step": 125554, "epoch": 1037} {"train_loss": -39.648292541503906, "global_step": 125555, "epoch": 1037} {"train_loss": -39.74878692626953, "global_step": 125556, "epoch": 1037} {"train_loss": -38.63716506958008, "global_step": 125557, "epoch": 1037} {"train_loss": -39.69621658325195, "global_step": 125558, "epoch": 1037} {"train_loss": -39.863216400146484, "global_step": 125559, "epoch": 1037} {"train_loss": -39.01150131225586, "global_step": 125560, "epoch": 1037} {"train_loss": -39.24570846557617, "global_step": 125561, "epoch": 1037} {"train_loss": -38.181026458740234, "global_step": 125562, "epoch": 1037} {"train_loss": -38.95062255859375, "global_step": 125563, "epoch": 1037} {"train_loss": -39.516387939453125, "global_step": 125564, "epoch": 1037} {"train_loss": -38.8653678894043, "global_step": 125565, "epoch": 1037} {"train_loss": -38.644691467285156, "global_step": 125566, "epoch": 1037} {"train_loss": -39.15169906616211, "global_step": 125567, "epoch": 1037} {"train_loss": -38.82749557495117, "global_step": 125568, "epoch": 1037} {"train_loss": -39.19159698486328, "global_step": 125569, "epoch": 1037} {"train_loss": -39.66599655151367, "global_step": 125570, "epoch": 1037} {"train_loss": -38.9670295715332, "global_step": 125571, "epoch": 1037} {"train_loss": -39.7420654296875, "global_step": 125572, "epoch": 1037} {"train_loss": -39.466766357421875, "global_step": 125573, "epoch": 1037} {"train_loss": -39.138668060302734, "global_step": 125574, "epoch": 1037} {"train_loss": -39.86979293823242, "global_step": 125575, "epoch": 1037} {"train_loss": -39.74089813232422, "global_step": 125576, "epoch": 1037} {"train_loss": -39.132293701171875, "global_step": 125577, "epoch": 1037} {"train_loss": -39.747215270996094, "global_step": 125578, "epoch": 1037} {"train_loss": -39.77760696411133, "global_step": 125579, "epoch": 1037} {"train_loss": -39.29096221923828, "global_step": 125580, "epoch": 1037} {"train_loss": -38.784881591796875, "global_step": 125581, "epoch": 1037} {"train_loss": -38.75354766845703, "global_step": 125582, "epoch": 1037} {"train_loss": -38.481895446777344, "global_step": 125583, "epoch": 1037} {"train_loss": -39.18349075317383, "global_step": 125584, "epoch": 1037} {"train_loss": -38.42610549926758, "global_step": 125585, "epoch": 1037} {"train_loss": -39.28505325317383, "global_step": 125586, "epoch": 1037} {"train_loss": -38.7991943359375, "global_step": 125587, "epoch": 1037} {"train_loss": -39.34637451171875, "global_step": 125588, "epoch": 1037} {"train_loss": -38.16695785522461, "global_step": 125589, "epoch": 1037} {"train_loss": -38.8380012512207, "global_step": 125590, "epoch": 1037} {"train_loss": -39.16969680786133, "global_step": 125591, "epoch": 1037} {"train_loss": -39.128623962402344, "global_step": 125592, "epoch": 1037} {"train_loss": -38.88911056518555, "global_step": 125593, "epoch": 1037} {"train_loss": -38.83573532104492, "global_step": 125594, "epoch": 1037} {"train_loss": -39.44849395751953, "global_step": 125595, "epoch": 1037} {"train_loss": -39.02289962768555, "global_step": 125596, "epoch": 1037} {"train_loss": -39.02547508428905, "global_step": 125597, "epoch": 1037, "val_loss": 2728554.75} {"train_loss": -38.60629653930664, "global_step": 125598, "epoch": 1038} {"train_loss": -40.2040901184082, "global_step": 125599, "epoch": 1038} {"train_loss": -39.20991134643555, "global_step": 125600, "epoch": 1038} {"train_loss": -38.776790618896484, "global_step": 125601, "epoch": 1038} {"train_loss": -39.23565673828125, "global_step": 125602, "epoch": 1038} {"train_loss": -39.769161224365234, "global_step": 125603, "epoch": 1038} {"train_loss": -38.99209213256836, "global_step": 125604, "epoch": 1038} {"train_loss": -39.617374420166016, "global_step": 125605, "epoch": 1038} {"train_loss": -39.58606719970703, "global_step": 125606, "epoch": 1038} {"train_loss": -39.41065216064453, "global_step": 125607, "epoch": 1038} {"train_loss": -38.716835021972656, "global_step": 125608, "epoch": 1038} {"train_loss": -38.77505111694336, "global_step": 125609, "epoch": 1038} {"train_loss": -39.83474349975586, "global_step": 125610, "epoch": 1038} {"train_loss": -40.045677185058594, "global_step": 125611, "epoch": 1038} {"train_loss": -39.496456146240234, "global_step": 125612, "epoch": 1038} {"train_loss": -39.292781829833984, "global_step": 125613, "epoch": 1038} {"train_loss": -38.3632926940918, "global_step": 125614, "epoch": 1038} {"train_loss": -36.23989486694336, "global_step": 125615, "epoch": 1038} {"train_loss": -34.616676330566406, "global_step": 125616, "epoch": 1038} {"train_loss": -33.93101501464844, "global_step": 125617, "epoch": 1038} {"train_loss": -37.2202262878418, "global_step": 125618, "epoch": 1038} {"train_loss": -38.814796447753906, "global_step": 125619, "epoch": 1038} {"train_loss": -38.713783264160156, "global_step": 125620, "epoch": 1038} {"train_loss": -38.66463851928711, "global_step": 125621, "epoch": 1038} {"train_loss": -37.92375183105469, "global_step": 125622, "epoch": 1038} {"train_loss": -38.37413787841797, "global_step": 125623, "epoch": 1038} {"train_loss": -39.3345947265625, "global_step": 125624, "epoch": 1038} {"train_loss": -38.71992111206055, "global_step": 125625, "epoch": 1038} {"train_loss": -38.43524932861328, "global_step": 125626, "epoch": 1038} {"train_loss": -39.43397521972656, "global_step": 125627, "epoch": 1038} {"train_loss": -39.64530563354492, "global_step": 125628, "epoch": 1038} {"train_loss": -39.313629150390625, "global_step": 125629, "epoch": 1038} {"train_loss": -40.0418586730957, "global_step": 125630, "epoch": 1038} {"train_loss": -39.80348587036133, "global_step": 125631, "epoch": 1038} {"train_loss": -39.7275390625, "global_step": 125632, "epoch": 1038} {"train_loss": -39.51970291137695, "global_step": 125633, "epoch": 1038} {"train_loss": -39.99116134643555, "global_step": 125634, "epoch": 1038} {"train_loss": -39.37871170043945, "global_step": 125635, "epoch": 1038} {"train_loss": -39.77820587158203, "global_step": 125636, "epoch": 1038} {"train_loss": -40.12954330444336, "global_step": 125637, "epoch": 1038} {"train_loss": -39.6082763671875, "global_step": 125638, "epoch": 1038} {"train_loss": -39.95970916748047, "global_step": 125639, "epoch": 1038} {"train_loss": -39.22451400756836, "global_step": 125640, "epoch": 1038} {"train_loss": -40.106910705566406, "global_step": 125641, "epoch": 1038} {"train_loss": -39.52594757080078, "global_step": 125642, "epoch": 1038} {"train_loss": -39.503143310546875, "global_step": 125643, "epoch": 1038} {"train_loss": -39.52724075317383, "global_step": 125644, "epoch": 1038} {"train_loss": -39.89503479003906, "global_step": 125645, "epoch": 1038} {"train_loss": -39.430301666259766, "global_step": 125646, "epoch": 1038} {"train_loss": -39.53276443481445, "global_step": 125647, "epoch": 1038} {"train_loss": -39.9901237487793, "global_step": 125648, "epoch": 1038} {"train_loss": -40.02248764038086, "global_step": 125649, "epoch": 1038} {"train_loss": -39.48413848876953, "global_step": 125650, "epoch": 1038} {"train_loss": -39.2200927734375, "global_step": 125651, "epoch": 1038} {"train_loss": -39.89106369018555, "global_step": 125652, "epoch": 1038} {"train_loss": -38.61204147338867, "global_step": 125653, "epoch": 1038} {"train_loss": -38.1936149597168, "global_step": 125654, "epoch": 1038} {"train_loss": -39.79204559326172, "global_step": 125655, "epoch": 1038} {"train_loss": -39.71363067626953, "global_step": 125656, "epoch": 1038} {"train_loss": -38.45793151855469, "global_step": 125657, "epoch": 1038} {"train_loss": -39.90938949584961, "global_step": 125658, "epoch": 1038} {"train_loss": -39.91097640991211, "global_step": 125659, "epoch": 1038} {"train_loss": -38.7738151550293, "global_step": 125660, "epoch": 1038} {"train_loss": -39.339080810546875, "global_step": 125661, "epoch": 1038} {"train_loss": -39.72865676879883, "global_step": 125662, "epoch": 1038} {"train_loss": -39.074337005615234, "global_step": 125663, "epoch": 1038} {"train_loss": -39.32880401611328, "global_step": 125664, "epoch": 1038} {"train_loss": -39.89724349975586, "global_step": 125665, "epoch": 1038} {"train_loss": -39.6368293762207, "global_step": 125666, "epoch": 1038} {"train_loss": -39.9924430847168, "global_step": 125667, "epoch": 1038} {"train_loss": -40.31087875366211, "global_step": 125668, "epoch": 1038} {"train_loss": -40.110530853271484, "global_step": 125669, "epoch": 1038} {"train_loss": -39.962398529052734, "global_step": 125670, "epoch": 1038} {"train_loss": -40.220558166503906, "global_step": 125671, "epoch": 1038} {"train_loss": -40.35225296020508, "global_step": 125672, "epoch": 1038} {"train_loss": -39.74040603637695, "global_step": 125673, "epoch": 1038} {"train_loss": -39.47565841674805, "global_step": 125674, "epoch": 1038} {"train_loss": -39.70962142944336, "global_step": 125675, "epoch": 1038} {"train_loss": -40.21236801147461, "global_step": 125676, "epoch": 1038} {"train_loss": -40.29714584350586, "global_step": 125677, "epoch": 1038} {"train_loss": -40.06997299194336, "global_step": 125678, "epoch": 1038} {"train_loss": -40.174739837646484, "global_step": 125679, "epoch": 1038} {"train_loss": -40.12907028198242, "global_step": 125680, "epoch": 1038} {"train_loss": -40.141151428222656, "global_step": 125681, "epoch": 1038} {"train_loss": -40.00436019897461, "global_step": 125682, "epoch": 1038} {"train_loss": -40.26319122314453, "global_step": 125683, "epoch": 1038} {"train_loss": -40.6267204284668, "global_step": 125684, "epoch": 1038} {"train_loss": -40.595821380615234, "global_step": 125685, "epoch": 1038} {"train_loss": -40.45516586303711, "global_step": 125686, "epoch": 1038} {"train_loss": -40.65834045410156, "global_step": 125687, "epoch": 1038} {"train_loss": -40.25266647338867, "global_step": 125688, "epoch": 1038} {"train_loss": -40.763301849365234, "global_step": 125689, "epoch": 1038} {"train_loss": -41.109981536865234, "global_step": 125690, "epoch": 1038} {"train_loss": -40.62934112548828, "global_step": 125691, "epoch": 1038} {"train_loss": -40.02036666870117, "global_step": 125692, "epoch": 1038} {"train_loss": -40.8803825378418, "global_step": 125693, "epoch": 1038} {"train_loss": -40.56657028198242, "global_step": 125694, "epoch": 1038} {"train_loss": -40.55742645263672, "global_step": 125695, "epoch": 1038} {"train_loss": -40.63180160522461, "global_step": 125696, "epoch": 1038} {"train_loss": -40.235145568847656, "global_step": 125697, "epoch": 1038} {"train_loss": -40.418434143066406, "global_step": 125698, "epoch": 1038} {"train_loss": -39.52685546875, "global_step": 125699, "epoch": 1038} {"train_loss": -39.966732025146484, "global_step": 125700, "epoch": 1038} {"train_loss": -38.85447311401367, "global_step": 125701, "epoch": 1038} {"train_loss": -38.3091926574707, "global_step": 125702, "epoch": 1038} {"train_loss": -36.5694465637207, "global_step": 125703, "epoch": 1038} {"train_loss": -31.99017333984375, "global_step": 125704, "epoch": 1038} {"train_loss": -31.566816329956055, "global_step": 125705, "epoch": 1038} {"train_loss": -36.2548828125, "global_step": 125706, "epoch": 1038} {"train_loss": -37.37253189086914, "global_step": 125707, "epoch": 1038} {"train_loss": -34.4516716003418, "global_step": 125708, "epoch": 1038} {"train_loss": -32.42510986328125, "global_step": 125709, "epoch": 1038} {"train_loss": -34.7779426574707, "global_step": 125710, "epoch": 1038} {"train_loss": -31.533536911010742, "global_step": 125711, "epoch": 1038} {"train_loss": -38.53916549682617, "global_step": 125712, "epoch": 1038} {"train_loss": -34.430076599121094, "global_step": 125713, "epoch": 1038} {"train_loss": -35.51030349731445, "global_step": 125714, "epoch": 1038} {"train_loss": -36.16646957397461, "global_step": 125715, "epoch": 1038} {"train_loss": -37.51428985595703, "global_step": 125716, "epoch": 1038} {"train_loss": -36.64192581176758, "global_step": 125717, "epoch": 1038} {"train_loss": -38.93467810134257, "global_step": 125718, "epoch": 1038, "val_loss": 2666075.25} {"train_loss": -36.93278503417969, "global_step": 125719, "epoch": 1039} {"train_loss": -38.84652328491211, "global_step": 125720, "epoch": 1039} {"train_loss": -35.72620391845703, "global_step": 125721, "epoch": 1039} {"train_loss": -38.84028244018555, "global_step": 125722, "epoch": 1039} {"train_loss": -37.3511962890625, "global_step": 125723, "epoch": 1039} {"train_loss": -37.98972702026367, "global_step": 125724, "epoch": 1039} {"train_loss": -37.94552993774414, "global_step": 125725, "epoch": 1039} {"train_loss": -36.70435333251953, "global_step": 125726, "epoch": 1039} {"train_loss": -38.977779388427734, "global_step": 125727, "epoch": 1039} {"train_loss": -36.124755859375, "global_step": 125728, "epoch": 1039} {"train_loss": -38.99658966064453, "global_step": 125729, "epoch": 1039} {"train_loss": -37.057884216308594, "global_step": 125730, "epoch": 1039} {"train_loss": -38.61857986450195, "global_step": 125731, "epoch": 1039} {"train_loss": -38.3213996887207, "global_step": 125732, "epoch": 1039} {"train_loss": -38.56600570678711, "global_step": 125733, "epoch": 1039} {"train_loss": -37.928497314453125, "global_step": 125734, "epoch": 1039} {"train_loss": -39.02415084838867, "global_step": 125735, "epoch": 1039} {"train_loss": -39.03812789916992, "global_step": 125736, "epoch": 1039} {"train_loss": -37.80463790893555, "global_step": 125737, "epoch": 1039} {"train_loss": -38.58812713623047, "global_step": 125738, "epoch": 1039} {"train_loss": -38.51151657104492, "global_step": 125739, "epoch": 1039} {"train_loss": -38.281558990478516, "global_step": 125740, "epoch": 1039} {"train_loss": -39.025230407714844, "global_step": 125741, "epoch": 1039} {"train_loss": -39.34196090698242, "global_step": 125742, "epoch": 1039} {"train_loss": -38.65008544921875, "global_step": 125743, "epoch": 1039} {"train_loss": -39.365814208984375, "global_step": 125744, "epoch": 1039} {"train_loss": -39.0671272277832, "global_step": 125745, "epoch": 1039} {"train_loss": -38.80652618408203, "global_step": 125746, "epoch": 1039} {"train_loss": -39.084747314453125, "global_step": 125747, "epoch": 1039} {"train_loss": -39.385189056396484, "global_step": 125748, "epoch": 1039} {"train_loss": -39.72286605834961, "global_step": 125749, "epoch": 1039} {"train_loss": -39.06472396850586, "global_step": 125750, "epoch": 1039} {"train_loss": -39.39105224609375, "global_step": 125751, "epoch": 1039} {"train_loss": -39.418426513671875, "global_step": 125752, "epoch": 1039} {"train_loss": -39.25114822387695, "global_step": 125753, "epoch": 1039} {"train_loss": -39.44953536987305, "global_step": 125754, "epoch": 1039} {"train_loss": -40.01046371459961, "global_step": 125755, "epoch": 1039} {"train_loss": -39.49223709106445, "global_step": 125756, "epoch": 1039} {"train_loss": -39.7495231628418, "global_step": 125757, "epoch": 1039} {"train_loss": -39.459625244140625, "global_step": 125758, "epoch": 1039} {"train_loss": -39.40715789794922, "global_step": 125759, "epoch": 1039} {"train_loss": -40.19443893432617, "global_step": 125760, "epoch": 1039} {"train_loss": -39.383583068847656, "global_step": 125761, "epoch": 1039} {"train_loss": -39.62158966064453, "global_step": 125762, "epoch": 1039} {"train_loss": -40.17690658569336, "global_step": 125763, "epoch": 1039} {"train_loss": -40.19255447387695, "global_step": 125764, "epoch": 1039} {"train_loss": -40.17787551879883, "global_step": 125765, "epoch": 1039} {"train_loss": -40.288021087646484, "global_step": 125766, "epoch": 1039} {"train_loss": -39.7755012512207, "global_step": 125767, "epoch": 1039} {"train_loss": -40.1885986328125, "global_step": 125768, "epoch": 1039} {"train_loss": -40.18120193481445, "global_step": 125769, "epoch": 1039} {"train_loss": -40.31197738647461, "global_step": 125770, "epoch": 1039} {"train_loss": -39.89748764038086, "global_step": 125771, "epoch": 1039} {"train_loss": -40.64997482299805, "global_step": 125772, "epoch": 1039} {"train_loss": -40.18621826171875, "global_step": 125773, "epoch": 1039} {"train_loss": -40.028106689453125, "global_step": 125774, "epoch": 1039} {"train_loss": -40.163753509521484, "global_step": 125775, "epoch": 1039} {"train_loss": -40.32554626464844, "global_step": 125776, "epoch": 1039} {"train_loss": -40.23716354370117, "global_step": 125777, "epoch": 1039} {"train_loss": -40.37479782104492, "global_step": 125778, "epoch": 1039} {"train_loss": -40.19382858276367, "global_step": 125779, "epoch": 1039} {"train_loss": -40.418331146240234, "global_step": 125780, "epoch": 1039} {"train_loss": -40.55036163330078, "global_step": 125781, "epoch": 1039} {"train_loss": -40.719078063964844, "global_step": 125782, "epoch": 1039} {"train_loss": -40.208045959472656, "global_step": 125783, "epoch": 1039} {"train_loss": -40.78181076049805, "global_step": 125784, "epoch": 1039} {"train_loss": -40.10819625854492, "global_step": 125785, "epoch": 1039} {"train_loss": -40.02922821044922, "global_step": 125786, "epoch": 1039} {"train_loss": -40.48832321166992, "global_step": 125787, "epoch": 1039} {"train_loss": -40.2678337097168, "global_step": 125788, "epoch": 1039} {"train_loss": -40.44777297973633, "global_step": 125789, "epoch": 1039} {"train_loss": -40.18624496459961, "global_step": 125790, "epoch": 1039} {"train_loss": -40.12468338012695, "global_step": 125791, "epoch": 1039} {"train_loss": -40.062782287597656, "global_step": 125792, "epoch": 1039} {"train_loss": -40.08022689819336, "global_step": 125793, "epoch": 1039} {"train_loss": -39.73947525024414, "global_step": 125794, "epoch": 1039} {"train_loss": -39.2799186706543, "global_step": 125795, "epoch": 1039} {"train_loss": -40.608734130859375, "global_step": 125796, "epoch": 1039} {"train_loss": -39.98594284057617, "global_step": 125797, "epoch": 1039} {"train_loss": -39.06794357299805, "global_step": 125798, "epoch": 1039} {"train_loss": -40.17631530761719, "global_step": 125799, "epoch": 1039} {"train_loss": -39.273372650146484, "global_step": 125800, "epoch": 1039} {"train_loss": -37.87109375, "global_step": 125801, "epoch": 1039} {"train_loss": -40.50328063964844, "global_step": 125802, "epoch": 1039} {"train_loss": -39.08769607543945, "global_step": 125803, "epoch": 1039} {"train_loss": -40.25351333618164, "global_step": 125804, "epoch": 1039} {"train_loss": -39.68781280517578, "global_step": 125805, "epoch": 1039} {"train_loss": -40.04352951049805, "global_step": 125806, "epoch": 1039} {"train_loss": -39.62936019897461, "global_step": 125807, "epoch": 1039} {"train_loss": -39.8753776550293, "global_step": 125808, "epoch": 1039} {"train_loss": -37.98891830444336, "global_step": 125809, "epoch": 1039} {"train_loss": -37.00300979614258, "global_step": 125810, "epoch": 1039} {"train_loss": -32.551971435546875, "global_step": 125811, "epoch": 1039} {"train_loss": -28.577747344970703, "global_step": 125812, "epoch": 1039} {"train_loss": -29.072006225585938, "global_step": 125813, "epoch": 1039} {"train_loss": -35.798221588134766, "global_step": 125814, "epoch": 1039} {"train_loss": -37.3956413269043, "global_step": 125815, "epoch": 1039} {"train_loss": -25.97616958618164, "global_step": 125816, "epoch": 1039} {"train_loss": -32.155738830566406, "global_step": 125817, "epoch": 1039} {"train_loss": -38.5981330871582, "global_step": 125818, "epoch": 1039} {"train_loss": -30.551069259643555, "global_step": 125819, "epoch": 1039} {"train_loss": -37.9213981628418, "global_step": 125820, "epoch": 1039} {"train_loss": -36.69061279296875, "global_step": 125821, "epoch": 1039} {"train_loss": -37.357112884521484, "global_step": 125822, "epoch": 1039} {"train_loss": -37.21706771850586, "global_step": 125823, "epoch": 1039} {"train_loss": -38.26654052734375, "global_step": 125824, "epoch": 1039} {"train_loss": -38.93144607543945, "global_step": 125825, "epoch": 1039} {"train_loss": -38.7642707824707, "global_step": 125826, "epoch": 1039} {"train_loss": -39.012718200683594, "global_step": 125827, "epoch": 1039} {"train_loss": -38.46024703979492, "global_step": 125828, "epoch": 1039} {"train_loss": -38.62471389770508, "global_step": 125829, "epoch": 1039} {"train_loss": -39.21828842163086, "global_step": 125830, "epoch": 1039} {"train_loss": -37.55439376831055, "global_step": 125831, "epoch": 1039} {"train_loss": -38.87084197998047, "global_step": 125832, "epoch": 1039} {"train_loss": -38.276153564453125, "global_step": 125833, "epoch": 1039} {"train_loss": -39.19205856323242, "global_step": 125834, "epoch": 1039} {"train_loss": -39.139686584472656, "global_step": 125835, "epoch": 1039} {"train_loss": -39.5130729675293, "global_step": 125836, "epoch": 1039} {"train_loss": -38.99467849731445, "global_step": 125837, "epoch": 1039} {"train_loss": -40.14986038208008, "global_step": 125838, "epoch": 1039} {"train_loss": -38.697139188277816, "global_step": 125839, "epoch": 1039, "val_loss": 2714338.75} {"train_loss": -39.780677795410156, "global_step": 125840, "epoch": 1040} {"train_loss": -39.71580123901367, "global_step": 125841, "epoch": 1040} {"train_loss": -39.80076217651367, "global_step": 125842, "epoch": 1040} {"train_loss": -40.19824981689453, "global_step": 125843, "epoch": 1040} {"train_loss": -39.77714920043945, "global_step": 125844, "epoch": 1040} {"train_loss": -39.76332473754883, "global_step": 125845, "epoch": 1040} {"train_loss": -40.28721618652344, "global_step": 125846, "epoch": 1040} {"train_loss": -39.659996032714844, "global_step": 125847, "epoch": 1040} {"train_loss": -39.901451110839844, "global_step": 125848, "epoch": 1040} {"train_loss": -40.21602249145508, "global_step": 125849, "epoch": 1040} {"train_loss": -39.84637451171875, "global_step": 125850, "epoch": 1040} {"train_loss": -40.12438201904297, "global_step": 125851, "epoch": 1040} {"train_loss": -39.881160736083984, "global_step": 125852, "epoch": 1040} {"train_loss": -40.37943649291992, "global_step": 125853, "epoch": 1040} {"train_loss": -39.683204650878906, "global_step": 125854, "epoch": 1040} {"train_loss": -39.98299789428711, "global_step": 125855, "epoch": 1040} {"train_loss": -39.36159133911133, "global_step": 125856, "epoch": 1040} {"train_loss": -40.38326644897461, "global_step": 125857, "epoch": 1040} {"train_loss": -40.200775146484375, "global_step": 125858, "epoch": 1040} {"train_loss": -40.0962028503418, "global_step": 125859, "epoch": 1040} {"train_loss": -39.87491989135742, "global_step": 125860, "epoch": 1040} {"train_loss": -40.05039978027344, "global_step": 125861, "epoch": 1040} {"train_loss": -40.79850387573242, "global_step": 125862, "epoch": 1040} {"train_loss": -40.5439453125, "global_step": 125863, "epoch": 1040} {"train_loss": -40.07334518432617, "global_step": 125864, "epoch": 1040} {"train_loss": -40.086585998535156, "global_step": 125865, "epoch": 1040} {"train_loss": -39.96588897705078, "global_step": 125866, "epoch": 1040} {"train_loss": -40.23690414428711, "global_step": 125867, "epoch": 1040} {"train_loss": -40.33835983276367, "global_step": 125868, "epoch": 1040} {"train_loss": -40.38629150390625, "global_step": 125869, "epoch": 1040} {"train_loss": -40.873382568359375, "global_step": 125870, "epoch": 1040} {"train_loss": -40.291744232177734, "global_step": 125871, "epoch": 1040} {"train_loss": -39.748207092285156, "global_step": 125872, "epoch": 1040} {"train_loss": -39.529884338378906, "global_step": 125873, "epoch": 1040} {"train_loss": -39.70233154296875, "global_step": 125874, "epoch": 1040} {"train_loss": -39.68770217895508, "global_step": 125875, "epoch": 1040} {"train_loss": -40.22688293457031, "global_step": 125876, "epoch": 1040} {"train_loss": -40.21266555786133, "global_step": 125877, "epoch": 1040} {"train_loss": -39.975006103515625, "global_step": 125878, "epoch": 1040} {"train_loss": -40.092079162597656, "global_step": 125879, "epoch": 1040} {"train_loss": -40.09502029418945, "global_step": 125880, "epoch": 1040} {"train_loss": -40.994789123535156, "global_step": 125881, "epoch": 1040} {"train_loss": -40.54240036010742, "global_step": 125882, "epoch": 1040} {"train_loss": -40.1778678894043, "global_step": 125883, "epoch": 1040} {"train_loss": -39.879302978515625, "global_step": 125884, "epoch": 1040} {"train_loss": -40.21845245361328, "global_step": 125885, "epoch": 1040} {"train_loss": -39.95384979248047, "global_step": 125886, "epoch": 1040} {"train_loss": -39.571937561035156, "global_step": 125887, "epoch": 1040} {"train_loss": -39.104759216308594, "global_step": 125888, "epoch": 1040} {"train_loss": -39.60725784301758, "global_step": 125889, "epoch": 1040} {"train_loss": -40.36007308959961, "global_step": 125890, "epoch": 1040} {"train_loss": -39.2445068359375, "global_step": 125891, "epoch": 1040} {"train_loss": -39.817745208740234, "global_step": 125892, "epoch": 1040} {"train_loss": -39.268856048583984, "global_step": 125893, "epoch": 1040} {"train_loss": -39.738372802734375, "global_step": 125894, "epoch": 1040} {"train_loss": -39.568965911865234, "global_step": 125895, "epoch": 1040} {"train_loss": -38.867618560791016, "global_step": 125896, "epoch": 1040} {"train_loss": -39.07283401489258, "global_step": 125897, "epoch": 1040} {"train_loss": -39.108802795410156, "global_step": 125898, "epoch": 1040} {"train_loss": -40.30288314819336, "global_step": 125899, "epoch": 1040} {"train_loss": -38.332061767578125, "global_step": 125900, "epoch": 1040} {"train_loss": -39.36181640625, "global_step": 125901, "epoch": 1040} {"train_loss": -38.666011810302734, "global_step": 125902, "epoch": 1040} {"train_loss": -37.737422943115234, "global_step": 125903, "epoch": 1040} {"train_loss": -38.9052848815918, "global_step": 125904, "epoch": 1040} {"train_loss": -40.257686614990234, "global_step": 125905, "epoch": 1040} {"train_loss": -38.63312530517578, "global_step": 125906, "epoch": 1040} {"train_loss": -39.95058822631836, "global_step": 125907, "epoch": 1040} {"train_loss": -40.30946731567383, "global_step": 125908, "epoch": 1040} {"train_loss": -40.371368408203125, "global_step": 125909, "epoch": 1040} {"train_loss": -40.3860969543457, "global_step": 125910, "epoch": 1040} {"train_loss": -39.68302536010742, "global_step": 125911, "epoch": 1040} {"train_loss": -39.672691345214844, "global_step": 125912, "epoch": 1040} {"train_loss": -40.82230758666992, "global_step": 125913, "epoch": 1040} {"train_loss": -39.57737350463867, "global_step": 125914, "epoch": 1040} {"train_loss": -39.76393127441406, "global_step": 125915, "epoch": 1040} {"train_loss": -40.286746978759766, "global_step": 125916, "epoch": 1040} {"train_loss": -40.050174713134766, "global_step": 125917, "epoch": 1040} {"train_loss": -40.502410888671875, "global_step": 125918, "epoch": 1040} {"train_loss": -39.76634979248047, "global_step": 125919, "epoch": 1040} {"train_loss": -39.856475830078125, "global_step": 125920, "epoch": 1040} {"train_loss": -40.79264450073242, "global_step": 125921, "epoch": 1040} {"train_loss": -39.83949661254883, "global_step": 125922, "epoch": 1040} {"train_loss": -39.698524475097656, "global_step": 125923, "epoch": 1040} {"train_loss": -39.740570068359375, "global_step": 125924, "epoch": 1040} {"train_loss": -39.600303649902344, "global_step": 125925, "epoch": 1040} {"train_loss": -40.5869255065918, "global_step": 125926, "epoch": 1040} {"train_loss": -40.46515655517578, "global_step": 125927, "epoch": 1040} {"train_loss": -40.065208435058594, "global_step": 125928, "epoch": 1040} {"train_loss": -40.1836051940918, "global_step": 125929, "epoch": 1040} {"train_loss": -39.924476623535156, "global_step": 125930, "epoch": 1040} {"train_loss": -40.34208679199219, "global_step": 125931, "epoch": 1040} {"train_loss": -40.38352966308594, "global_step": 125932, "epoch": 1040} {"train_loss": -40.09200668334961, "global_step": 125933, "epoch": 1040} {"train_loss": -40.11157989501953, "global_step": 125934, "epoch": 1040} {"train_loss": -38.15869903564453, "global_step": 125935, "epoch": 1040} {"train_loss": -38.917457580566406, "global_step": 125936, "epoch": 1040} {"train_loss": -39.8691291809082, "global_step": 125937, "epoch": 1040} {"train_loss": -39.182735443115234, "global_step": 125938, "epoch": 1040} {"train_loss": -39.69308090209961, "global_step": 125939, "epoch": 1040} {"train_loss": -37.988582611083984, "global_step": 125940, "epoch": 1040} {"train_loss": -40.34821319580078, "global_step": 125941, "epoch": 1040} {"train_loss": -38.63311767578125, "global_step": 125942, "epoch": 1040} {"train_loss": -39.895503997802734, "global_step": 125943, "epoch": 1040} {"train_loss": -40.118099212646484, "global_step": 125944, "epoch": 1040} {"train_loss": -37.90788650512695, "global_step": 125945, "epoch": 1040} {"train_loss": -39.520652770996094, "global_step": 125946, "epoch": 1040} {"train_loss": -37.3988037109375, "global_step": 125947, "epoch": 1040} {"train_loss": -37.643394470214844, "global_step": 125948, "epoch": 1040} {"train_loss": -40.10206985473633, "global_step": 125949, "epoch": 1040} {"train_loss": -37.86900329589844, "global_step": 125950, "epoch": 1040} {"train_loss": -38.896759033203125, "global_step": 125951, "epoch": 1040} {"train_loss": -39.30997848510742, "global_step": 125952, "epoch": 1040} {"train_loss": -37.946136474609375, "global_step": 125953, "epoch": 1040} {"train_loss": -39.56039047241211, "global_step": 125954, "epoch": 1040} {"train_loss": -38.593318939208984, "global_step": 125955, "epoch": 1040} {"train_loss": -39.504432678222656, "global_step": 125956, "epoch": 1040} {"train_loss": -39.36092758178711, "global_step": 125957, "epoch": 1040} {"train_loss": -39.55289840698242, "global_step": 125958, "epoch": 1040} {"train_loss": -38.565093994140625, "global_step": 125959, "epoch": 1040} {"train_loss": -39.72014000002018, "global_step": 125960, "epoch": 1040, "val_loss": 2825121.25} {"train_loss": -39.871734619140625, "global_step": 125961, "epoch": 1041} {"train_loss": -39.52971267700195, "global_step": 125962, "epoch": 1041} {"train_loss": -38.704994201660156, "global_step": 125963, "epoch": 1041} {"train_loss": -40.01923370361328, "global_step": 125964, "epoch": 1041} {"train_loss": -40.06087112426758, "global_step": 125965, "epoch": 1041} {"train_loss": -39.31744384765625, "global_step": 125966, "epoch": 1041} {"train_loss": -39.58710861206055, "global_step": 125967, "epoch": 1041} {"train_loss": -38.84003448486328, "global_step": 125968, "epoch": 1041} {"train_loss": -38.257965087890625, "global_step": 125969, "epoch": 1041} {"train_loss": -38.05976104736328, "global_step": 125970, "epoch": 1041} {"train_loss": -38.99036407470703, "global_step": 125971, "epoch": 1041} {"train_loss": -40.0396842956543, "global_step": 125972, "epoch": 1041} {"train_loss": -39.466346740722656, "global_step": 125973, "epoch": 1041} {"train_loss": -39.05168533325195, "global_step": 125974, "epoch": 1041} {"train_loss": -39.94826889038086, "global_step": 125975, "epoch": 1041} {"train_loss": -39.89895248413086, "global_step": 125976, "epoch": 1041} {"train_loss": -40.09562301635742, "global_step": 125977, "epoch": 1041} {"train_loss": -40.07188415527344, "global_step": 125978, "epoch": 1041} {"train_loss": -40.01311111450195, "global_step": 125979, "epoch": 1041} {"train_loss": -40.59419631958008, "global_step": 125980, "epoch": 1041} {"train_loss": -40.44535446166992, "global_step": 125981, "epoch": 1041} {"train_loss": -40.0703239440918, "global_step": 125982, "epoch": 1041} {"train_loss": -39.450286865234375, "global_step": 125983, "epoch": 1041} {"train_loss": -39.588348388671875, "global_step": 125984, "epoch": 1041} {"train_loss": -39.984718322753906, "global_step": 125985, "epoch": 1041} {"train_loss": -39.50579833984375, "global_step": 125986, "epoch": 1041} {"train_loss": -39.79923629760742, "global_step": 125987, "epoch": 1041} {"train_loss": -40.31940460205078, "global_step": 125988, "epoch": 1041} {"train_loss": -40.04140853881836, "global_step": 125989, "epoch": 1041} {"train_loss": -40.27518081665039, "global_step": 125990, "epoch": 1041} {"train_loss": -40.471771240234375, "global_step": 125991, "epoch": 1041} {"train_loss": -40.73061752319336, "global_step": 125992, "epoch": 1041} {"train_loss": -40.51163864135742, "global_step": 125993, "epoch": 1041} {"train_loss": -39.6594123840332, "global_step": 125994, "epoch": 1041} {"train_loss": -39.65213394165039, "global_step": 125995, "epoch": 1041} {"train_loss": -40.7907600402832, "global_step": 125996, "epoch": 1041} {"train_loss": -40.3484992980957, "global_step": 125997, "epoch": 1041} {"train_loss": -40.377742767333984, "global_step": 125998, "epoch": 1041} {"train_loss": -40.24409103393555, "global_step": 125999, "epoch": 1041} {"train_loss": -40.791927337646484, "global_step": 126000, "epoch": 1041} {"train_loss": -40.642059326171875, "global_step": 126001, "epoch": 1041} {"train_loss": -40.23778533935547, "global_step": 126002, "epoch": 1041} {"train_loss": -40.719879150390625, "global_step": 126003, "epoch": 1041} {"train_loss": -40.682228088378906, "global_step": 126004, "epoch": 1041} {"train_loss": -40.452754974365234, "global_step": 126005, "epoch": 1041} {"train_loss": -40.35984420776367, "global_step": 126006, "epoch": 1041} {"train_loss": -40.336158752441406, "global_step": 126007, "epoch": 1041} {"train_loss": -40.47175979614258, "global_step": 126008, "epoch": 1041} {"train_loss": -40.545467376708984, "global_step": 126009, "epoch": 1041} {"train_loss": -40.1362190246582, "global_step": 126010, "epoch": 1041} {"train_loss": -40.07429504394531, "global_step": 126011, "epoch": 1041} {"train_loss": -40.34430694580078, "global_step": 126012, "epoch": 1041} {"train_loss": -39.8845329284668, "global_step": 126013, "epoch": 1041} {"train_loss": -40.020626068115234, "global_step": 126014, "epoch": 1041} {"train_loss": -39.7540168762207, "global_step": 126015, "epoch": 1041} {"train_loss": -39.949981689453125, "global_step": 126016, "epoch": 1041} {"train_loss": -39.53159713745117, "global_step": 126017, "epoch": 1041} {"train_loss": -40.32973861694336, "global_step": 126018, "epoch": 1041} {"train_loss": -40.416778564453125, "global_step": 126019, "epoch": 1041} {"train_loss": -38.872528076171875, "global_step": 126020, "epoch": 1041} {"train_loss": -39.317359924316406, "global_step": 126021, "epoch": 1041} {"train_loss": -38.56202697753906, "global_step": 126022, "epoch": 1041} {"train_loss": -38.327117919921875, "global_step": 126023, "epoch": 1041} {"train_loss": -40.34214782714844, "global_step": 126024, "epoch": 1041} {"train_loss": -40.0627555847168, "global_step": 126025, "epoch": 1041} {"train_loss": -38.59616470336914, "global_step": 126026, "epoch": 1041} {"train_loss": -38.94099044799805, "global_step": 126027, "epoch": 1041} {"train_loss": -40.52040481567383, "global_step": 126028, "epoch": 1041} {"train_loss": -38.26250457763672, "global_step": 126029, "epoch": 1041} {"train_loss": -39.47541046142578, "global_step": 126030, "epoch": 1041} {"train_loss": -39.3223991394043, "global_step": 126031, "epoch": 1041} {"train_loss": -39.48995590209961, "global_step": 126032, "epoch": 1041} {"train_loss": -40.615779876708984, "global_step": 126033, "epoch": 1041} {"train_loss": -37.54499053955078, "global_step": 126034, "epoch": 1041} {"train_loss": -38.89895248413086, "global_step": 126035, "epoch": 1041} {"train_loss": -38.06136703491211, "global_step": 126036, "epoch": 1041} {"train_loss": -39.79745101928711, "global_step": 126037, "epoch": 1041} {"train_loss": -39.2991943359375, "global_step": 126038, "epoch": 1041} {"train_loss": -37.51163864135742, "global_step": 126039, "epoch": 1041} {"train_loss": -34.90542221069336, "global_step": 126040, "epoch": 1041} {"train_loss": -33.699462890625, "global_step": 126041, "epoch": 1041} {"train_loss": -34.810970306396484, "global_step": 126042, "epoch": 1041} {"train_loss": -36.488643646240234, "global_step": 126043, "epoch": 1041} {"train_loss": -35.4219970703125, "global_step": 126044, "epoch": 1041} {"train_loss": -38.91254806518555, "global_step": 126045, "epoch": 1041} {"train_loss": -38.411102294921875, "global_step": 126046, "epoch": 1041} {"train_loss": -34.25889205932617, "global_step": 126047, "epoch": 1041} {"train_loss": -36.893550872802734, "global_step": 126048, "epoch": 1041} {"train_loss": -36.7650146484375, "global_step": 126049, "epoch": 1041} {"train_loss": -35.048885345458984, "global_step": 126050, "epoch": 1041} {"train_loss": -37.620887756347656, "global_step": 126051, "epoch": 1041} {"train_loss": -36.60597229003906, "global_step": 126052, "epoch": 1041} {"train_loss": -36.82840347290039, "global_step": 126053, "epoch": 1041} {"train_loss": -37.94633102416992, "global_step": 126054, "epoch": 1041} {"train_loss": -37.052555084228516, "global_step": 126055, "epoch": 1041} {"train_loss": -37.6443977355957, "global_step": 126056, "epoch": 1041} {"train_loss": -38.00248336791992, "global_step": 126057, "epoch": 1041} {"train_loss": -36.06460189819336, "global_step": 126058, "epoch": 1041} {"train_loss": -34.51264190673828, "global_step": 126059, "epoch": 1041} {"train_loss": -36.198116302490234, "global_step": 126060, "epoch": 1041} {"train_loss": -35.62739944458008, "global_step": 126061, "epoch": 1041} {"train_loss": -31.719465255737305, "global_step": 126062, "epoch": 1041} {"train_loss": -37.9996337890625, "global_step": 126063, "epoch": 1041} {"train_loss": -36.406192779541016, "global_step": 126064, "epoch": 1041} {"train_loss": -36.576534271240234, "global_step": 126065, "epoch": 1041} {"train_loss": -35.00809860229492, "global_step": 126066, "epoch": 1041} {"train_loss": -37.54746627807617, "global_step": 126067, "epoch": 1041} {"train_loss": -37.56317901611328, "global_step": 126068, "epoch": 1041} {"train_loss": -37.301239013671875, "global_step": 126069, "epoch": 1041} {"train_loss": -38.47365188598633, "global_step": 126070, "epoch": 1041} {"train_loss": -37.85206985473633, "global_step": 126071, "epoch": 1041} {"train_loss": -38.534095764160156, "global_step": 126072, "epoch": 1041} {"train_loss": -37.802337646484375, "global_step": 126073, "epoch": 1041} {"train_loss": -38.81736373901367, "global_step": 126074, "epoch": 1041} {"train_loss": -38.05316925048828, "global_step": 126075, "epoch": 1041} {"train_loss": -38.560482025146484, "global_step": 126076, "epoch": 1041} {"train_loss": -37.52363967895508, "global_step": 126077, "epoch": 1041} {"train_loss": -38.223052978515625, "global_step": 126078, "epoch": 1041} {"train_loss": -39.11692428588867, "global_step": 126079, "epoch": 1041} {"train_loss": -38.39101791381836, "global_step": 126080, "epoch": 1041} {"train_loss": -38.75461094438537, "global_step": 126081, "epoch": 1041, "val_loss": 2877161.0} {"train_loss": -38.857215881347656, "global_step": 126082, "epoch": 1042} {"train_loss": -38.95298767089844, "global_step": 126083, "epoch": 1042} {"train_loss": -39.20881652832031, "global_step": 126084, "epoch": 1042} {"train_loss": -38.29384994506836, "global_step": 126085, "epoch": 1042} {"train_loss": -38.89553451538086, "global_step": 126086, "epoch": 1042} {"train_loss": -36.27717971801758, "global_step": 126087, "epoch": 1042} {"train_loss": -35.41143798828125, "global_step": 126088, "epoch": 1042} {"train_loss": -39.34501266479492, "global_step": 126089, "epoch": 1042} {"train_loss": -39.3242073059082, "global_step": 126090, "epoch": 1042} {"train_loss": -38.907588958740234, "global_step": 126091, "epoch": 1042} {"train_loss": -39.015899658203125, "global_step": 126092, "epoch": 1042} {"train_loss": -39.78013229370117, "global_step": 126093, "epoch": 1042} {"train_loss": -39.22325134277344, "global_step": 126094, "epoch": 1042} {"train_loss": -38.79083251953125, "global_step": 126095, "epoch": 1042} {"train_loss": -39.651084899902344, "global_step": 126096, "epoch": 1042} {"train_loss": -39.07962417602539, "global_step": 126097, "epoch": 1042} {"train_loss": -38.467647552490234, "global_step": 126098, "epoch": 1042} {"train_loss": -39.771175384521484, "global_step": 126099, "epoch": 1042} {"train_loss": -39.38167953491211, "global_step": 126100, "epoch": 1042} {"train_loss": -39.583892822265625, "global_step": 126101, "epoch": 1042} {"train_loss": -39.45545196533203, "global_step": 126102, "epoch": 1042} {"train_loss": -39.52881622314453, "global_step": 126103, "epoch": 1042} {"train_loss": -38.59208297729492, "global_step": 126104, "epoch": 1042} {"train_loss": -40.196468353271484, "global_step": 126105, "epoch": 1042} {"train_loss": -39.27588653564453, "global_step": 126106, "epoch": 1042} {"train_loss": -39.986087799072266, "global_step": 126107, "epoch": 1042} {"train_loss": -40.185707092285156, "global_step": 126108, "epoch": 1042} {"train_loss": -40.0136833190918, "global_step": 126109, "epoch": 1042} {"train_loss": -39.25045394897461, "global_step": 126110, "epoch": 1042} {"train_loss": -39.956787109375, "global_step": 126111, "epoch": 1042} {"train_loss": -39.487770080566406, "global_step": 126112, "epoch": 1042} {"train_loss": -40.2789192199707, "global_step": 126113, "epoch": 1042} {"train_loss": -39.86576461791992, "global_step": 126114, "epoch": 1042} {"train_loss": -39.47722625732422, "global_step": 126115, "epoch": 1042} {"train_loss": -38.35365676879883, "global_step": 126116, "epoch": 1042} {"train_loss": -39.00564193725586, "global_step": 126117, "epoch": 1042} {"train_loss": -39.73953628540039, "global_step": 126118, "epoch": 1042} {"train_loss": -38.67818069458008, "global_step": 126119, "epoch": 1042} {"train_loss": -38.24288558959961, "global_step": 126120, "epoch": 1042} {"train_loss": -39.20563507080078, "global_step": 126121, "epoch": 1042} {"train_loss": -38.865699768066406, "global_step": 126122, "epoch": 1042} {"train_loss": -38.66640853881836, "global_step": 126123, "epoch": 1042} {"train_loss": -39.534515380859375, "global_step": 126124, "epoch": 1042} {"train_loss": -39.7326774597168, "global_step": 126125, "epoch": 1042} {"train_loss": -39.17214584350586, "global_step": 126126, "epoch": 1042} {"train_loss": -39.33137130737305, "global_step": 126127, "epoch": 1042} {"train_loss": -36.46992111206055, "global_step": 126128, "epoch": 1042} {"train_loss": -37.191131591796875, "global_step": 126129, "epoch": 1042} {"train_loss": -38.44962692260742, "global_step": 126130, "epoch": 1042} {"train_loss": -39.808441162109375, "global_step": 126131, "epoch": 1042} {"train_loss": -39.634735107421875, "global_step": 126132, "epoch": 1042} {"train_loss": -39.922664642333984, "global_step": 126133, "epoch": 1042} {"train_loss": -39.31502914428711, "global_step": 126134, "epoch": 1042} {"train_loss": -39.23603439331055, "global_step": 126135, "epoch": 1042} {"train_loss": -39.48539733886719, "global_step": 126136, "epoch": 1042} {"train_loss": -36.85606002807617, "global_step": 126137, "epoch": 1042} {"train_loss": -37.58953094482422, "global_step": 126138, "epoch": 1042} {"train_loss": -39.812774658203125, "global_step": 126139, "epoch": 1042} {"train_loss": -40.030189514160156, "global_step": 126140, "epoch": 1042} {"train_loss": -39.29266357421875, "global_step": 126141, "epoch": 1042} {"train_loss": -38.9442138671875, "global_step": 126142, "epoch": 1042} {"train_loss": -39.80427169799805, "global_step": 126143, "epoch": 1042} {"train_loss": -38.7140998840332, "global_step": 126144, "epoch": 1042} {"train_loss": -39.49845504760742, "global_step": 126145, "epoch": 1042} {"train_loss": -37.40107345581055, "global_step": 126146, "epoch": 1042} {"train_loss": -39.66740036010742, "global_step": 126147, "epoch": 1042} {"train_loss": -39.62859344482422, "global_step": 126148, "epoch": 1042} {"train_loss": -37.232521057128906, "global_step": 126149, "epoch": 1042} {"train_loss": -37.156368255615234, "global_step": 126150, "epoch": 1042} {"train_loss": -40.208900451660156, "global_step": 126151, "epoch": 1042} {"train_loss": -39.91447830200195, "global_step": 126152, "epoch": 1042} {"train_loss": -40.19511032104492, "global_step": 126153, "epoch": 1042} {"train_loss": -39.81177520751953, "global_step": 126154, "epoch": 1042} {"train_loss": -39.829158782958984, "global_step": 126155, "epoch": 1042} {"train_loss": -38.684444427490234, "global_step": 126156, "epoch": 1042} {"train_loss": -39.40422058105469, "global_step": 126157, "epoch": 1042} {"train_loss": -38.87130355834961, "global_step": 126158, "epoch": 1042} {"train_loss": -40.38608169555664, "global_step": 126159, "epoch": 1042} {"train_loss": -39.62006759643555, "global_step": 126160, "epoch": 1042} {"train_loss": -39.576271057128906, "global_step": 126161, "epoch": 1042} {"train_loss": -39.59685516357422, "global_step": 126162, "epoch": 1042} {"train_loss": -37.82118606567383, "global_step": 126163, "epoch": 1042} {"train_loss": -39.262020111083984, "global_step": 126164, "epoch": 1042} {"train_loss": -39.22585678100586, "global_step": 126165, "epoch": 1042} {"train_loss": -39.70771026611328, "global_step": 126166, "epoch": 1042} {"train_loss": -39.0975456237793, "global_step": 126167, "epoch": 1042} {"train_loss": -39.560028076171875, "global_step": 126168, "epoch": 1042} {"train_loss": -39.4337043762207, "global_step": 126169, "epoch": 1042} {"train_loss": -37.999507904052734, "global_step": 126170, "epoch": 1042} {"train_loss": -39.245033264160156, "global_step": 126171, "epoch": 1042} {"train_loss": -38.58638381958008, "global_step": 126172, "epoch": 1042} {"train_loss": -38.97921371459961, "global_step": 126173, "epoch": 1042} {"train_loss": -38.55732345581055, "global_step": 126174, "epoch": 1042} {"train_loss": -37.857757568359375, "global_step": 126175, "epoch": 1042} {"train_loss": -38.36644744873047, "global_step": 126176, "epoch": 1042} {"train_loss": -31.6436767578125, "global_step": 126177, "epoch": 1042} {"train_loss": -37.903255462646484, "global_step": 126178, "epoch": 1042} {"train_loss": -38.21946334838867, "global_step": 126179, "epoch": 1042} {"train_loss": -34.88523483276367, "global_step": 126180, "epoch": 1042} {"train_loss": -31.923511505126953, "global_step": 126181, "epoch": 1042} {"train_loss": -38.0485954284668, "global_step": 126182, "epoch": 1042} {"train_loss": -34.62928009033203, "global_step": 126183, "epoch": 1042} {"train_loss": -35.96553039550781, "global_step": 126184, "epoch": 1042} {"train_loss": -33.226192474365234, "global_step": 126185, "epoch": 1042} {"train_loss": -33.43285369873047, "global_step": 126186, "epoch": 1042} {"train_loss": -36.46737289428711, "global_step": 126187, "epoch": 1042} {"train_loss": -35.537147521972656, "global_step": 126188, "epoch": 1042} {"train_loss": -35.555416107177734, "global_step": 126189, "epoch": 1042} {"train_loss": -35.9881477355957, "global_step": 126190, "epoch": 1042} {"train_loss": -33.402809143066406, "global_step": 126191, "epoch": 1042} {"train_loss": -34.472442626953125, "global_step": 126192, "epoch": 1042} {"train_loss": -35.92920684814453, "global_step": 126193, "epoch": 1042} {"train_loss": -33.6519775390625, "global_step": 126194, "epoch": 1042} {"train_loss": -34.95822525024414, "global_step": 126195, "epoch": 1042} {"train_loss": -28.739309310913086, "global_step": 126196, "epoch": 1042} {"train_loss": -34.850868225097656, "global_step": 126197, "epoch": 1042} {"train_loss": -34.54828643798828, "global_step": 126198, "epoch": 1042} {"train_loss": -33.92513656616211, "global_step": 126199, "epoch": 1042} {"train_loss": -34.65629196166992, "global_step": 126200, "epoch": 1042} {"train_loss": -34.24251937866211, "global_step": 126201, "epoch": 1042} {"train_loss": -38.138282161113644, "global_step": 126202, "epoch": 1042, "val_loss": 4566748.5} {"train_loss": -34.98594665527344, "global_step": 126203, "epoch": 1043} {"train_loss": -34.723350524902344, "global_step": 126204, "epoch": 1043} {"train_loss": -36.341712951660156, "global_step": 126205, "epoch": 1043} {"train_loss": -36.572757720947266, "global_step": 126206, "epoch": 1043} {"train_loss": -36.78554916381836, "global_step": 126207, "epoch": 1043} {"train_loss": -36.98136520385742, "global_step": 126208, "epoch": 1043} {"train_loss": -37.26227569580078, "global_step": 126209, "epoch": 1043} {"train_loss": -38.26435470581055, "global_step": 126210, "epoch": 1043} {"train_loss": -37.5505485534668, "global_step": 126211, "epoch": 1043} {"train_loss": -36.96078109741211, "global_step": 126212, "epoch": 1043} {"train_loss": -36.65181350708008, "global_step": 126213, "epoch": 1043} {"train_loss": -36.230281829833984, "global_step": 126214, "epoch": 1043} {"train_loss": -36.80170822143555, "global_step": 126215, "epoch": 1043} {"train_loss": -37.23745346069336, "global_step": 126216, "epoch": 1043} {"train_loss": -37.56815719604492, "global_step": 126217, "epoch": 1043} {"train_loss": -34.4383430480957, "global_step": 126218, "epoch": 1043} {"train_loss": -37.343257904052734, "global_step": 126219, "epoch": 1043} {"train_loss": -38.11654281616211, "global_step": 126220, "epoch": 1043} {"train_loss": -37.03285598754883, "global_step": 126221, "epoch": 1043} {"train_loss": -36.745330810546875, "global_step": 126222, "epoch": 1043} {"train_loss": -38.70298385620117, "global_step": 126223, "epoch": 1043} {"train_loss": -37.04853439331055, "global_step": 126224, "epoch": 1043} {"train_loss": -38.36798858642578, "global_step": 126225, "epoch": 1043} {"train_loss": -38.34403610229492, "global_step": 126226, "epoch": 1043} {"train_loss": -38.66023635864258, "global_step": 126227, "epoch": 1043} {"train_loss": -38.27150344848633, "global_step": 126228, "epoch": 1043} {"train_loss": -37.97249984741211, "global_step": 126229, "epoch": 1043} {"train_loss": -37.9273796081543, "global_step": 126230, "epoch": 1043} {"train_loss": -38.96863555908203, "global_step": 126231, "epoch": 1043} {"train_loss": -38.13681411743164, "global_step": 126232, "epoch": 1043} {"train_loss": -38.5160026550293, "global_step": 126233, "epoch": 1043} {"train_loss": -38.783748626708984, "global_step": 126234, "epoch": 1043} {"train_loss": -38.74469757080078, "global_step": 126235, "epoch": 1043} {"train_loss": -38.6081657409668, "global_step": 126236, "epoch": 1043} {"train_loss": -37.614479064941406, "global_step": 126237, "epoch": 1043} {"train_loss": -38.89592742919922, "global_step": 126238, "epoch": 1043} {"train_loss": -38.88468551635742, "global_step": 126239, "epoch": 1043} {"train_loss": -38.86161804199219, "global_step": 126240, "epoch": 1043} {"train_loss": -38.92864227294922, "global_step": 126241, "epoch": 1043} {"train_loss": -38.51690673828125, "global_step": 126242, "epoch": 1043} {"train_loss": -39.329185485839844, "global_step": 126243, "epoch": 1043} {"train_loss": -38.57994842529297, "global_step": 126244, "epoch": 1043} {"train_loss": -38.95681381225586, "global_step": 126245, "epoch": 1043} {"train_loss": -39.064239501953125, "global_step": 126246, "epoch": 1043} {"train_loss": -38.91490173339844, "global_step": 126247, "epoch": 1043} {"train_loss": -38.71283721923828, "global_step": 126248, "epoch": 1043} {"train_loss": -39.303829193115234, "global_step": 126249, "epoch": 1043} {"train_loss": -39.083675384521484, "global_step": 126250, "epoch": 1043} {"train_loss": -39.20682907104492, "global_step": 126251, "epoch": 1043} {"train_loss": -39.37605667114258, "global_step": 126252, "epoch": 1043} {"train_loss": -39.442073822021484, "global_step": 126253, "epoch": 1043} {"train_loss": -39.319976806640625, "global_step": 126254, "epoch": 1043} {"train_loss": -39.176612854003906, "global_step": 126255, "epoch": 1043} {"train_loss": -39.52900314331055, "global_step": 126256, "epoch": 1043} {"train_loss": -39.51513671875, "global_step": 126257, "epoch": 1043} {"train_loss": -38.454246520996094, "global_step": 126258, "epoch": 1043} {"train_loss": -39.29301834106445, "global_step": 126259, "epoch": 1043} {"train_loss": -39.31452560424805, "global_step": 126260, "epoch": 1043} {"train_loss": -39.1369743347168, "global_step": 126261, "epoch": 1043} {"train_loss": -39.74324417114258, "global_step": 126262, "epoch": 1043} {"train_loss": -39.35205078125, "global_step": 126263, "epoch": 1043} {"train_loss": -39.671512603759766, "global_step": 126264, "epoch": 1043} {"train_loss": -39.966552734375, "global_step": 126265, "epoch": 1043} {"train_loss": -39.55388641357422, "global_step": 126266, "epoch": 1043} {"train_loss": -39.89636993408203, "global_step": 126267, "epoch": 1043} {"train_loss": -39.182891845703125, "global_step": 126268, "epoch": 1043} {"train_loss": -39.345638275146484, "global_step": 126269, "epoch": 1043} {"train_loss": -39.38924026489258, "global_step": 126270, "epoch": 1043} {"train_loss": -40.28571319580078, "global_step": 126271, "epoch": 1043} {"train_loss": -39.10090255737305, "global_step": 126272, "epoch": 1043} {"train_loss": -39.119441986083984, "global_step": 126273, "epoch": 1043} {"train_loss": -39.477516174316406, "global_step": 126274, "epoch": 1043} {"train_loss": -40.0370979309082, "global_step": 126275, "epoch": 1043} {"train_loss": -39.9368782043457, "global_step": 126276, "epoch": 1043} {"train_loss": -39.25012969970703, "global_step": 126277, "epoch": 1043} {"train_loss": -39.368465423583984, "global_step": 126278, "epoch": 1043} {"train_loss": -39.923458099365234, "global_step": 126279, "epoch": 1043} {"train_loss": -39.820186614990234, "global_step": 126280, "epoch": 1043} {"train_loss": -39.28520584106445, "global_step": 126281, "epoch": 1043} {"train_loss": -39.58451461791992, "global_step": 126282, "epoch": 1043} {"train_loss": -39.77806854248047, "global_step": 126283, "epoch": 1043} {"train_loss": -39.795589447021484, "global_step": 126284, "epoch": 1043} {"train_loss": -38.929847717285156, "global_step": 126285, "epoch": 1043} {"train_loss": -38.680419921875, "global_step": 126286, "epoch": 1043} {"train_loss": -38.644386291503906, "global_step": 126287, "epoch": 1043} {"train_loss": -38.156673431396484, "global_step": 126288, "epoch": 1043} {"train_loss": -35.715755462646484, "global_step": 126289, "epoch": 1043} {"train_loss": -35.2252197265625, "global_step": 126290, "epoch": 1043} {"train_loss": -34.23900604248047, "global_step": 126291, "epoch": 1043} {"train_loss": -34.17963790893555, "global_step": 126292, "epoch": 1043} {"train_loss": -35.45082473754883, "global_step": 126293, "epoch": 1043} {"train_loss": -33.78395462036133, "global_step": 126294, "epoch": 1043} {"train_loss": -33.66573715209961, "global_step": 126295, "epoch": 1043} {"train_loss": -35.788246154785156, "global_step": 126296, "epoch": 1043} {"train_loss": -38.11429214477539, "global_step": 126297, "epoch": 1043} {"train_loss": -36.2566032409668, "global_step": 126298, "epoch": 1043} {"train_loss": -37.9596061706543, "global_step": 126299, "epoch": 1043} {"train_loss": -39.459659576416016, "global_step": 126300, "epoch": 1043} {"train_loss": -35.83697509765625, "global_step": 126301, "epoch": 1043} {"train_loss": -37.34172439575195, "global_step": 126302, "epoch": 1043} {"train_loss": -36.83536911010742, "global_step": 126303, "epoch": 1043} {"train_loss": -33.530677795410156, "global_step": 126304, "epoch": 1043} {"train_loss": -35.546504974365234, "global_step": 126305, "epoch": 1043} {"train_loss": -39.31801986694336, "global_step": 126306, "epoch": 1043} {"train_loss": -36.8298225402832, "global_step": 126307, "epoch": 1043} {"train_loss": -37.00136947631836, "global_step": 126308, "epoch": 1043} {"train_loss": -38.1734733581543, "global_step": 126309, "epoch": 1043} {"train_loss": -37.85378646850586, "global_step": 126310, "epoch": 1043} {"train_loss": -37.908329010009766, "global_step": 126311, "epoch": 1043} {"train_loss": -38.65485763549805, "global_step": 126312, "epoch": 1043} {"train_loss": -38.449462890625, "global_step": 126313, "epoch": 1043} {"train_loss": -38.29530334472656, "global_step": 126314, "epoch": 1043} {"train_loss": -38.2203483581543, "global_step": 126315, "epoch": 1043} {"train_loss": -38.68867111206055, "global_step": 126316, "epoch": 1043} {"train_loss": -38.4791374206543, "global_step": 126317, "epoch": 1043} {"train_loss": -39.11636734008789, "global_step": 126318, "epoch": 1043} {"train_loss": -39.44529724121094, "global_step": 126319, "epoch": 1043} {"train_loss": -39.40459060668945, "global_step": 126320, "epoch": 1043} {"train_loss": -39.775299072265625, "global_step": 126321, "epoch": 1043} {"train_loss": -39.58464431762695, "global_step": 126322, "epoch": 1043} {"train_loss": -38.143232077606456, "global_step": 126323, "epoch": 1043, "val_loss": 2763782.75} {"train_loss": -40.13417434692383, "global_step": 126324, "epoch": 1044} {"train_loss": -39.28694534301758, "global_step": 126325, "epoch": 1044} {"train_loss": -40.02342224121094, "global_step": 126326, "epoch": 1044} {"train_loss": -39.450740814208984, "global_step": 126327, "epoch": 1044} {"train_loss": -39.64961624145508, "global_step": 126328, "epoch": 1044} {"train_loss": -38.96391677856445, "global_step": 126329, "epoch": 1044} {"train_loss": -39.6905517578125, "global_step": 126330, "epoch": 1044} {"train_loss": -39.94911193847656, "global_step": 126331, "epoch": 1044} {"train_loss": -39.69199752807617, "global_step": 126332, "epoch": 1044} {"train_loss": -39.93841552734375, "global_step": 126333, "epoch": 1044} {"train_loss": -39.499549865722656, "global_step": 126334, "epoch": 1044} {"train_loss": -39.62708282470703, "global_step": 126335, "epoch": 1044} {"train_loss": -36.907894134521484, "global_step": 126336, "epoch": 1044} {"train_loss": -40.12917709350586, "global_step": 126337, "epoch": 1044} {"train_loss": -39.09286880493164, "global_step": 126338, "epoch": 1044} {"train_loss": -39.96675491333008, "global_step": 126339, "epoch": 1044} {"train_loss": -39.9238166809082, "global_step": 126340, "epoch": 1044} {"train_loss": -39.919654846191406, "global_step": 126341, "epoch": 1044} {"train_loss": -40.153289794921875, "global_step": 126342, "epoch": 1044} {"train_loss": -39.376258850097656, "global_step": 126343, "epoch": 1044} {"train_loss": -40.3801383972168, "global_step": 126344, "epoch": 1044} {"train_loss": -38.247222900390625, "global_step": 126345, "epoch": 1044} {"train_loss": -40.021942138671875, "global_step": 126346, "epoch": 1044} {"train_loss": -39.58839797973633, "global_step": 126347, "epoch": 1044} {"train_loss": -39.66440963745117, "global_step": 126348, "epoch": 1044} {"train_loss": -29.329309463500977, "global_step": 126349, "epoch": 1044} {"train_loss": -38.836280822753906, "global_step": 126350, "epoch": 1044} {"train_loss": -38.76824951171875, "global_step": 126351, "epoch": 1044} {"train_loss": -36.64694595336914, "global_step": 126352, "epoch": 1044} {"train_loss": -17.17950439453125, "global_step": 126353, "epoch": 1044} {"train_loss": -35.863338470458984, "global_step": 126354, "epoch": 1044} {"train_loss": -32.662147521972656, "global_step": 126355, "epoch": 1044} {"train_loss": -34.19109344482422, "global_step": 126356, "epoch": 1044} {"train_loss": -33.84605026245117, "global_step": 126357, "epoch": 1044} {"train_loss": -35.36003112792969, "global_step": 126358, "epoch": 1044} {"train_loss": -30.641210556030273, "global_step": 126359, "epoch": 1044} {"train_loss": -22.907312393188477, "global_step": 126360, "epoch": 1044} {"train_loss": -31.53315544128418, "global_step": 126361, "epoch": 1044} {"train_loss": -35.0380859375, "global_step": 126362, "epoch": 1044} {"train_loss": -32.294559478759766, "global_step": 126363, "epoch": 1044} {"train_loss": -35.208099365234375, "global_step": 126364, "epoch": 1044} {"train_loss": -29.73613929748535, "global_step": 126365, "epoch": 1044} {"train_loss": -37.06618881225586, "global_step": 126366, "epoch": 1044} {"train_loss": -33.76791000366211, "global_step": 126367, "epoch": 1044} {"train_loss": -35.757484436035156, "global_step": 126368, "epoch": 1044} {"train_loss": -36.08110427856445, "global_step": 126369, "epoch": 1044} {"train_loss": -34.21260452270508, "global_step": 126370, "epoch": 1044} {"train_loss": -36.605167388916016, "global_step": 126371, "epoch": 1044} {"train_loss": -36.21240997314453, "global_step": 126372, "epoch": 1044} {"train_loss": -36.42306137084961, "global_step": 126373, "epoch": 1044} {"train_loss": -35.0340576171875, "global_step": 126374, "epoch": 1044} {"train_loss": -36.681640625, "global_step": 126375, "epoch": 1044} {"train_loss": -35.39439392089844, "global_step": 126376, "epoch": 1044} {"train_loss": -34.74741744995117, "global_step": 126377, "epoch": 1044} {"train_loss": -37.184608459472656, "global_step": 126378, "epoch": 1044} {"train_loss": -35.09174346923828, "global_step": 126379, "epoch": 1044} {"train_loss": -36.60880661010742, "global_step": 126380, "epoch": 1044} {"train_loss": -36.852195739746094, "global_step": 126381, "epoch": 1044} {"train_loss": -37.337215423583984, "global_step": 126382, "epoch": 1044} {"train_loss": -36.342529296875, "global_step": 126383, "epoch": 1044} {"train_loss": -36.663082122802734, "global_step": 126384, "epoch": 1044} {"train_loss": -37.3502082824707, "global_step": 126385, "epoch": 1044} {"train_loss": -37.13375473022461, "global_step": 126386, "epoch": 1044} {"train_loss": -37.29817199707031, "global_step": 126387, "epoch": 1044} {"train_loss": -36.24232482910156, "global_step": 126388, "epoch": 1044} {"train_loss": -37.80591583251953, "global_step": 126389, "epoch": 1044} {"train_loss": -37.53940963745117, "global_step": 126390, "epoch": 1044} {"train_loss": -37.60055160522461, "global_step": 126391, "epoch": 1044} {"train_loss": -37.82664108276367, "global_step": 126392, "epoch": 1044} {"train_loss": -37.86172866821289, "global_step": 126393, "epoch": 1044} {"train_loss": -38.20750045776367, "global_step": 126394, "epoch": 1044} {"train_loss": -36.64020538330078, "global_step": 126395, "epoch": 1044} {"train_loss": -38.43531036376953, "global_step": 126396, "epoch": 1044} {"train_loss": -38.15264892578125, "global_step": 126397, "epoch": 1044} {"train_loss": -38.0053825378418, "global_step": 126398, "epoch": 1044} {"train_loss": -38.02765655517578, "global_step": 126399, "epoch": 1044} {"train_loss": -37.4167366027832, "global_step": 126400, "epoch": 1044} {"train_loss": -38.370418548583984, "global_step": 126401, "epoch": 1044} {"train_loss": -38.18052291870117, "global_step": 126402, "epoch": 1044} {"train_loss": -37.89951705932617, "global_step": 126403, "epoch": 1044} {"train_loss": -38.26247787475586, "global_step": 126404, "epoch": 1044} {"train_loss": -38.46186447143555, "global_step": 126405, "epoch": 1044} {"train_loss": -37.70658874511719, "global_step": 126406, "epoch": 1044} {"train_loss": -38.524635314941406, "global_step": 126407, "epoch": 1044} {"train_loss": -38.90102005004883, "global_step": 126408, "epoch": 1044} {"train_loss": -37.912574768066406, "global_step": 126409, "epoch": 1044} {"train_loss": -38.9076042175293, "global_step": 126410, "epoch": 1044} {"train_loss": -38.616336822509766, "global_step": 126411, "epoch": 1044} {"train_loss": -38.57615280151367, "global_step": 126412, "epoch": 1044} {"train_loss": -39.01188659667969, "global_step": 126413, "epoch": 1044} {"train_loss": -38.60722732543945, "global_step": 126414, "epoch": 1044} {"train_loss": -38.88142395019531, "global_step": 126415, "epoch": 1044} {"train_loss": -38.78508758544922, "global_step": 126416, "epoch": 1044} {"train_loss": -39.112098693847656, "global_step": 126417, "epoch": 1044} {"train_loss": -37.743465423583984, "global_step": 126418, "epoch": 1044} {"train_loss": -38.38143539428711, "global_step": 126419, "epoch": 1044} {"train_loss": -38.752723693847656, "global_step": 126420, "epoch": 1044} {"train_loss": -38.89201736450195, "global_step": 126421, "epoch": 1044} {"train_loss": -38.66669464111328, "global_step": 126422, "epoch": 1044} {"train_loss": -38.21952438354492, "global_step": 126423, "epoch": 1044} {"train_loss": -38.572174072265625, "global_step": 126424, "epoch": 1044} {"train_loss": -37.9497184753418, "global_step": 126425, "epoch": 1044} {"train_loss": -39.606788635253906, "global_step": 126426, "epoch": 1044} {"train_loss": -39.25016784667969, "global_step": 126427, "epoch": 1044} {"train_loss": -39.15824508666992, "global_step": 126428, "epoch": 1044} {"train_loss": -39.218841552734375, "global_step": 126429, "epoch": 1044} {"train_loss": -38.87357711791992, "global_step": 126430, "epoch": 1044} {"train_loss": -38.9650993347168, "global_step": 126431, "epoch": 1044} {"train_loss": -37.914649963378906, "global_step": 126432, "epoch": 1044} {"train_loss": -39.03860092163086, "global_step": 126433, "epoch": 1044} {"train_loss": -39.4935302734375, "global_step": 126434, "epoch": 1044} {"train_loss": -38.56444549560547, "global_step": 126435, "epoch": 1044} {"train_loss": -39.48849105834961, "global_step": 126436, "epoch": 1044} {"train_loss": -39.085166931152344, "global_step": 126437, "epoch": 1044} {"train_loss": -37.2514533996582, "global_step": 126438, "epoch": 1044} {"train_loss": -38.242671966552734, "global_step": 126439, "epoch": 1044} {"train_loss": -39.48777389526367, "global_step": 126440, "epoch": 1044} {"train_loss": -38.94446563720703, "global_step": 126441, "epoch": 1044} {"train_loss": -38.60380935668945, "global_step": 126442, "epoch": 1044} {"train_loss": -39.15035629272461, "global_step": 126443, "epoch": 1044} {"train_loss": -37.40643753493128, "global_step": 126444, "epoch": 1044, "val_loss": 2627341.75} {"train_loss": -39.637840270996094, "global_step": 126445, "epoch": 1045} {"train_loss": -39.841732025146484, "global_step": 126446, "epoch": 1045} {"train_loss": -38.54581069946289, "global_step": 126447, "epoch": 1045} {"train_loss": -39.96741485595703, "global_step": 126448, "epoch": 1045} {"train_loss": -39.73637771606445, "global_step": 126449, "epoch": 1045} {"train_loss": -39.16811752319336, "global_step": 126450, "epoch": 1045} {"train_loss": -40.0561408996582, "global_step": 126451, "epoch": 1045} {"train_loss": -38.11050796508789, "global_step": 126452, "epoch": 1045} {"train_loss": -39.02775955200195, "global_step": 126453, "epoch": 1045} {"train_loss": -40.18019104003906, "global_step": 126454, "epoch": 1045} {"train_loss": -38.80070877075195, "global_step": 126455, "epoch": 1045} {"train_loss": -39.63016891479492, "global_step": 126456, "epoch": 1045} {"train_loss": -39.86837387084961, "global_step": 126457, "epoch": 1045} {"train_loss": -39.6245002746582, "global_step": 126458, "epoch": 1045} {"train_loss": -38.474605560302734, "global_step": 126459, "epoch": 1045} {"train_loss": -39.35994338989258, "global_step": 126460, "epoch": 1045} {"train_loss": -37.295345306396484, "global_step": 126461, "epoch": 1045} {"train_loss": -36.68375778198242, "global_step": 126462, "epoch": 1045} {"train_loss": -36.988441467285156, "global_step": 126463, "epoch": 1045} {"train_loss": -33.782012939453125, "global_step": 126464, "epoch": 1045} {"train_loss": -37.43113327026367, "global_step": 126465, "epoch": 1045} {"train_loss": -36.8912239074707, "global_step": 126466, "epoch": 1045} {"train_loss": -37.966346740722656, "global_step": 126467, "epoch": 1045} {"train_loss": -33.958885192871094, "global_step": 126468, "epoch": 1045} {"train_loss": -26.872623443603516, "global_step": 126469, "epoch": 1045} {"train_loss": -31.879491806030273, "global_step": 126470, "epoch": 1045} {"train_loss": -37.12358093261719, "global_step": 126471, "epoch": 1045} {"train_loss": -33.659454345703125, "global_step": 126472, "epoch": 1045} {"train_loss": -36.278045654296875, "global_step": 126473, "epoch": 1045} {"train_loss": -37.65629196166992, "global_step": 126474, "epoch": 1045} {"train_loss": -32.66169357299805, "global_step": 126475, "epoch": 1045} {"train_loss": -38.235130310058594, "global_step": 126476, "epoch": 1045} {"train_loss": -33.54169845581055, "global_step": 126477, "epoch": 1045} {"train_loss": -37.50788116455078, "global_step": 126478, "epoch": 1045} {"train_loss": -31.870874404907227, "global_step": 126479, "epoch": 1045} {"train_loss": -37.79084396362305, "global_step": 126480, "epoch": 1045} {"train_loss": -33.94999694824219, "global_step": 126481, "epoch": 1045} {"train_loss": -37.88956832885742, "global_step": 126482, "epoch": 1045} {"train_loss": -35.94369125366211, "global_step": 126483, "epoch": 1045} {"train_loss": -37.83734130859375, "global_step": 126484, "epoch": 1045} {"train_loss": -36.09465026855469, "global_step": 126485, "epoch": 1045} {"train_loss": -37.930419921875, "global_step": 126486, "epoch": 1045} {"train_loss": -36.502052307128906, "global_step": 126487, "epoch": 1045} {"train_loss": -38.3718147277832, "global_step": 126488, "epoch": 1045} {"train_loss": -37.25083923339844, "global_step": 126489, "epoch": 1045} {"train_loss": -37.46649169921875, "global_step": 126490, "epoch": 1045} {"train_loss": -38.17354965209961, "global_step": 126491, "epoch": 1045} {"train_loss": -37.80744171142578, "global_step": 126492, "epoch": 1045} {"train_loss": -38.14024353027344, "global_step": 126493, "epoch": 1045} {"train_loss": -37.99524688720703, "global_step": 126494, "epoch": 1045} {"train_loss": -37.87279510498047, "global_step": 126495, "epoch": 1045} {"train_loss": -34.34375, "global_step": 126496, "epoch": 1045} {"train_loss": -38.47365951538086, "global_step": 126497, "epoch": 1045} {"train_loss": -38.63037872314453, "global_step": 126498, "epoch": 1045} {"train_loss": -38.99831771850586, "global_step": 126499, "epoch": 1045} {"train_loss": -38.47324752807617, "global_step": 126500, "epoch": 1045} {"train_loss": -37.67647171020508, "global_step": 126501, "epoch": 1045} {"train_loss": -38.64463424682617, "global_step": 126502, "epoch": 1045} {"train_loss": -38.38654327392578, "global_step": 126503, "epoch": 1045} {"train_loss": -39.055023193359375, "global_step": 126504, "epoch": 1045} {"train_loss": -39.308345794677734, "global_step": 126505, "epoch": 1045} {"train_loss": -38.75520706176758, "global_step": 126506, "epoch": 1045} {"train_loss": -38.83005905151367, "global_step": 126507, "epoch": 1045} {"train_loss": -38.82902526855469, "global_step": 126508, "epoch": 1045} {"train_loss": -38.97589111328125, "global_step": 126509, "epoch": 1045} {"train_loss": -38.67875289916992, "global_step": 126510, "epoch": 1045} {"train_loss": -38.37119674682617, "global_step": 126511, "epoch": 1045} {"train_loss": -39.33060836791992, "global_step": 126512, "epoch": 1045} {"train_loss": -39.10782241821289, "global_step": 126513, "epoch": 1045} {"train_loss": -38.476806640625, "global_step": 126514, "epoch": 1045} {"train_loss": -38.96821212768555, "global_step": 126515, "epoch": 1045} {"train_loss": -38.146610260009766, "global_step": 126516, "epoch": 1045} {"train_loss": -38.86932373046875, "global_step": 126517, "epoch": 1045} {"train_loss": -39.398284912109375, "global_step": 126518, "epoch": 1045} {"train_loss": -38.139034271240234, "global_step": 126519, "epoch": 1045} {"train_loss": -38.83888626098633, "global_step": 126520, "epoch": 1045} {"train_loss": -39.11661911010742, "global_step": 126521, "epoch": 1045} {"train_loss": -39.21875, "global_step": 126522, "epoch": 1045} {"train_loss": -39.65261459350586, "global_step": 126523, "epoch": 1045} {"train_loss": -38.688018798828125, "global_step": 126524, "epoch": 1045} {"train_loss": -39.43089294433594, "global_step": 126525, "epoch": 1045} {"train_loss": -39.355953216552734, "global_step": 126526, "epoch": 1045} {"train_loss": -39.64371871948242, "global_step": 126527, "epoch": 1045} {"train_loss": -39.395511627197266, "global_step": 126528, "epoch": 1045} {"train_loss": -39.024818420410156, "global_step": 126529, "epoch": 1045} {"train_loss": -38.027320861816406, "global_step": 126530, "epoch": 1045} {"train_loss": -39.04018020629883, "global_step": 126531, "epoch": 1045} {"train_loss": -38.954383850097656, "global_step": 126532, "epoch": 1045} {"train_loss": -39.76188278198242, "global_step": 126533, "epoch": 1045} {"train_loss": -40.0456428527832, "global_step": 126534, "epoch": 1045} {"train_loss": -39.8986930847168, "global_step": 126535, "epoch": 1045} {"train_loss": -38.67817687988281, "global_step": 126536, "epoch": 1045} {"train_loss": -39.7781867980957, "global_step": 126537, "epoch": 1045} {"train_loss": -39.27602767944336, "global_step": 126538, "epoch": 1045} {"train_loss": -39.28977584838867, "global_step": 126539, "epoch": 1045} {"train_loss": -39.51515579223633, "global_step": 126540, "epoch": 1045} {"train_loss": -39.684566497802734, "global_step": 126541, "epoch": 1045} {"train_loss": -39.843849182128906, "global_step": 126542, "epoch": 1045} {"train_loss": -39.44831466674805, "global_step": 126543, "epoch": 1045} {"train_loss": -39.8587646484375, "global_step": 126544, "epoch": 1045} {"train_loss": -39.253543853759766, "global_step": 126545, "epoch": 1045} {"train_loss": -39.608577728271484, "global_step": 126546, "epoch": 1045} {"train_loss": -39.58415603637695, "global_step": 126547, "epoch": 1045} {"train_loss": -38.70621109008789, "global_step": 126548, "epoch": 1045} {"train_loss": -40.059566497802734, "global_step": 126549, "epoch": 1045} {"train_loss": -39.71590042114258, "global_step": 126550, "epoch": 1045} {"train_loss": -38.19853591918945, "global_step": 126551, "epoch": 1045} {"train_loss": -38.49123764038086, "global_step": 126552, "epoch": 1045} {"train_loss": -37.239959716796875, "global_step": 126553, "epoch": 1045} {"train_loss": -38.308990478515625, "global_step": 126554, "epoch": 1045} {"train_loss": -39.13578414916992, "global_step": 126555, "epoch": 1045} {"train_loss": -39.51469039916992, "global_step": 126556, "epoch": 1045} {"train_loss": -38.98984146118164, "global_step": 126557, "epoch": 1045} {"train_loss": -39.21413803100586, "global_step": 126558, "epoch": 1045} {"train_loss": -39.547027587890625, "global_step": 126559, "epoch": 1045} {"train_loss": -40.102413177490234, "global_step": 126560, "epoch": 1045} {"train_loss": -39.97870635986328, "global_step": 126561, "epoch": 1045} {"train_loss": -39.22751998901367, "global_step": 126562, "epoch": 1045} {"train_loss": -39.559532165527344, "global_step": 126563, "epoch": 1045} {"train_loss": -39.53947830200195, "global_step": 126564, "epoch": 1045} {"train_loss": -38.245206249646905, "global_step": 126565, "epoch": 1045, "val_loss": 2718005.25} {"train_loss": -40.18120193481445, "global_step": 126566, "epoch": 1046} {"train_loss": -40.460243225097656, "global_step": 126567, "epoch": 1046} {"train_loss": -39.316925048828125, "global_step": 126568, "epoch": 1046} {"train_loss": -38.529701232910156, "global_step": 126569, "epoch": 1046} {"train_loss": -39.3675651550293, "global_step": 126570, "epoch": 1046} {"train_loss": -39.92770004272461, "global_step": 126571, "epoch": 1046} {"train_loss": -39.61766052246094, "global_step": 126572, "epoch": 1046} {"train_loss": -39.72357940673828, "global_step": 126573, "epoch": 1046} {"train_loss": -39.670555114746094, "global_step": 126574, "epoch": 1046} {"train_loss": -38.433815002441406, "global_step": 126575, "epoch": 1046} {"train_loss": -40.17236328125, "global_step": 126576, "epoch": 1046} {"train_loss": -39.65433883666992, "global_step": 126577, "epoch": 1046} {"train_loss": -39.88608932495117, "global_step": 126578, "epoch": 1046} {"train_loss": -39.515167236328125, "global_step": 126579, "epoch": 1046} {"train_loss": -39.83180236816406, "global_step": 126580, "epoch": 1046} {"train_loss": -39.91879653930664, "global_step": 126581, "epoch": 1046} {"train_loss": -40.08637619018555, "global_step": 126582, "epoch": 1046} {"train_loss": -40.15951156616211, "global_step": 126583, "epoch": 1046} {"train_loss": -39.37775421142578, "global_step": 126584, "epoch": 1046} {"train_loss": -39.42836380004883, "global_step": 126585, "epoch": 1046} {"train_loss": -40.19540023803711, "global_step": 126586, "epoch": 1046} {"train_loss": -40.945919036865234, "global_step": 126587, "epoch": 1046} {"train_loss": -39.68574142456055, "global_step": 126588, "epoch": 1046} {"train_loss": -38.129127502441406, "global_step": 126589, "epoch": 1046} {"train_loss": -38.65087890625, "global_step": 126590, "epoch": 1046} {"train_loss": -38.8039665222168, "global_step": 126591, "epoch": 1046} {"train_loss": -39.81595993041992, "global_step": 126592, "epoch": 1046} {"train_loss": -39.30588912963867, "global_step": 126593, "epoch": 1046} {"train_loss": -38.49395751953125, "global_step": 126594, "epoch": 1046} {"train_loss": -40.028953552246094, "global_step": 126595, "epoch": 1046} {"train_loss": -39.386268615722656, "global_step": 126596, "epoch": 1046} {"train_loss": -39.67802047729492, "global_step": 126597, "epoch": 1046} {"train_loss": -40.275291442871094, "global_step": 126598, "epoch": 1046} {"train_loss": -39.690673828125, "global_step": 126599, "epoch": 1046} {"train_loss": -39.73756790161133, "global_step": 126600, "epoch": 1046} {"train_loss": -39.45198440551758, "global_step": 126601, "epoch": 1046} {"train_loss": -39.71686935424805, "global_step": 126602, "epoch": 1046} {"train_loss": -39.62439727783203, "global_step": 126603, "epoch": 1046} {"train_loss": -38.87704849243164, "global_step": 126604, "epoch": 1046} {"train_loss": -39.657440185546875, "global_step": 126605, "epoch": 1046} {"train_loss": -40.46087646484375, "global_step": 126606, "epoch": 1046} {"train_loss": -39.39649200439453, "global_step": 126607, "epoch": 1046} {"train_loss": -39.5824089050293, "global_step": 126608, "epoch": 1046} {"train_loss": -39.16860580444336, "global_step": 126609, "epoch": 1046} {"train_loss": -39.8792839050293, "global_step": 126610, "epoch": 1046} {"train_loss": -39.88719177246094, "global_step": 126611, "epoch": 1046} {"train_loss": -39.3276481628418, "global_step": 126612, "epoch": 1046} {"train_loss": -39.4531364440918, "global_step": 126613, "epoch": 1046} {"train_loss": -39.20476150512695, "global_step": 126614, "epoch": 1046} {"train_loss": -39.32627487182617, "global_step": 126615, "epoch": 1046} {"train_loss": -37.59981155395508, "global_step": 126616, "epoch": 1046} {"train_loss": -40.341590881347656, "global_step": 126617, "epoch": 1046} {"train_loss": -38.81789779663086, "global_step": 126618, "epoch": 1046} {"train_loss": -38.826866149902344, "global_step": 126619, "epoch": 1046} {"train_loss": -38.398677825927734, "global_step": 126620, "epoch": 1046} {"train_loss": -38.99797058105469, "global_step": 126621, "epoch": 1046} {"train_loss": -38.37467575073242, "global_step": 126622, "epoch": 1046} {"train_loss": -39.74335861206055, "global_step": 126623, "epoch": 1046} {"train_loss": -39.40393829345703, "global_step": 126624, "epoch": 1046} {"train_loss": -39.6597785949707, "global_step": 126625, "epoch": 1046} {"train_loss": -37.97154998779297, "global_step": 126626, "epoch": 1046} {"train_loss": -38.15371322631836, "global_step": 126627, "epoch": 1046} {"train_loss": -39.70244598388672, "global_step": 126628, "epoch": 1046} {"train_loss": -37.14957046508789, "global_step": 126629, "epoch": 1046} {"train_loss": -38.160072326660156, "global_step": 126630, "epoch": 1046} {"train_loss": -39.46192169189453, "global_step": 126631, "epoch": 1046} {"train_loss": -39.4339485168457, "global_step": 126632, "epoch": 1046} {"train_loss": -39.0167350769043, "global_step": 126633, "epoch": 1046} {"train_loss": -34.69635009765625, "global_step": 126634, "epoch": 1046} {"train_loss": -37.51514434814453, "global_step": 126635, "epoch": 1046} {"train_loss": -33.42681884765625, "global_step": 126636, "epoch": 1046} {"train_loss": -38.04719161987305, "global_step": 126637, "epoch": 1046} {"train_loss": -37.4576530456543, "global_step": 126638, "epoch": 1046} {"train_loss": -37.361141204833984, "global_step": 126639, "epoch": 1046} {"train_loss": -35.47022247314453, "global_step": 126640, "epoch": 1046} {"train_loss": -31.531768798828125, "global_step": 126641, "epoch": 1046} {"train_loss": -36.377437591552734, "global_step": 126642, "epoch": 1046} {"train_loss": -36.679359436035156, "global_step": 126643, "epoch": 1046} {"train_loss": -38.097145080566406, "global_step": 126644, "epoch": 1046} {"train_loss": -35.72120666503906, "global_step": 126645, "epoch": 1046} {"train_loss": -39.17538833618164, "global_step": 126646, "epoch": 1046} {"train_loss": -36.727840423583984, "global_step": 126647, "epoch": 1046} {"train_loss": -36.68220901489258, "global_step": 126648, "epoch": 1046} {"train_loss": -36.347511291503906, "global_step": 126649, "epoch": 1046} {"train_loss": -38.35868453979492, "global_step": 126650, "epoch": 1046} {"train_loss": -37.35681915283203, "global_step": 126651, "epoch": 1046} {"train_loss": -37.3909797668457, "global_step": 126652, "epoch": 1046} {"train_loss": -37.14844512939453, "global_step": 126653, "epoch": 1046} {"train_loss": -38.068790435791016, "global_step": 126654, "epoch": 1046} {"train_loss": -36.71002197265625, "global_step": 126655, "epoch": 1046} {"train_loss": -38.47107696533203, "global_step": 126656, "epoch": 1046} {"train_loss": -37.596187591552734, "global_step": 126657, "epoch": 1046} {"train_loss": -36.39667510986328, "global_step": 126658, "epoch": 1046} {"train_loss": -36.983482360839844, "global_step": 126659, "epoch": 1046} {"train_loss": -39.12034225463867, "global_step": 126660, "epoch": 1046} {"train_loss": -36.96099853515625, "global_step": 126661, "epoch": 1046} {"train_loss": -37.50767135620117, "global_step": 126662, "epoch": 1046} {"train_loss": -37.936309814453125, "global_step": 126663, "epoch": 1046} {"train_loss": -38.79917526245117, "global_step": 126664, "epoch": 1046} {"train_loss": -38.87355422973633, "global_step": 126665, "epoch": 1046} {"train_loss": -37.273372650146484, "global_step": 126666, "epoch": 1046} {"train_loss": -37.73575210571289, "global_step": 126667, "epoch": 1046} {"train_loss": -38.4217529296875, "global_step": 126668, "epoch": 1046} {"train_loss": -37.73389434814453, "global_step": 126669, "epoch": 1046} {"train_loss": -38.51686096191406, "global_step": 126670, "epoch": 1046} {"train_loss": -38.52582550048828, "global_step": 126671, "epoch": 1046} {"train_loss": -39.028663635253906, "global_step": 126672, "epoch": 1046} {"train_loss": -33.79218673706055, "global_step": 126673, "epoch": 1046} {"train_loss": -39.58220291137695, "global_step": 126674, "epoch": 1046} {"train_loss": -38.924007415771484, "global_step": 126675, "epoch": 1046} {"train_loss": -39.3003044128418, "global_step": 126676, "epoch": 1046} {"train_loss": -39.16670227050781, "global_step": 126677, "epoch": 1046} {"train_loss": -38.883358001708984, "global_step": 126678, "epoch": 1046} {"train_loss": -38.93010330200195, "global_step": 126679, "epoch": 1046} {"train_loss": -38.825801849365234, "global_step": 126680, "epoch": 1046} {"train_loss": -38.87580490112305, "global_step": 126681, "epoch": 1046} {"train_loss": -38.91259765625, "global_step": 126682, "epoch": 1046} {"train_loss": -39.17132568359375, "global_step": 126683, "epoch": 1046} {"train_loss": -39.325401306152344, "global_step": 126684, "epoch": 1046} {"train_loss": -39.10521697998047, "global_step": 126685, "epoch": 1046} {"train_loss": -38.6162499356861, "global_step": 126686, "epoch": 1046, "val_loss": 2731314.75} {"train_loss": -39.09977340698242, "global_step": 126687, "epoch": 1047} {"train_loss": -39.16167068481445, "global_step": 126688, "epoch": 1047} {"train_loss": -38.5834846496582, "global_step": 126689, "epoch": 1047} {"train_loss": -39.242427825927734, "global_step": 126690, "epoch": 1047} {"train_loss": -39.38431930541992, "global_step": 126691, "epoch": 1047} {"train_loss": -39.55925369262695, "global_step": 126692, "epoch": 1047} {"train_loss": -39.64227294921875, "global_step": 126693, "epoch": 1047} {"train_loss": -38.644710540771484, "global_step": 126694, "epoch": 1047} {"train_loss": -39.64751052856445, "global_step": 126695, "epoch": 1047} {"train_loss": -38.7276725769043, "global_step": 126696, "epoch": 1047} {"train_loss": -37.2235107421875, "global_step": 126697, "epoch": 1047} {"train_loss": -39.47677230834961, "global_step": 126698, "epoch": 1047} {"train_loss": -39.665916442871094, "global_step": 126699, "epoch": 1047} {"train_loss": -38.5181999206543, "global_step": 126700, "epoch": 1047} {"train_loss": -38.88008499145508, "global_step": 126701, "epoch": 1047} {"train_loss": -38.54105758666992, "global_step": 126702, "epoch": 1047} {"train_loss": -39.66462326049805, "global_step": 126703, "epoch": 1047} {"train_loss": -39.5914306640625, "global_step": 126704, "epoch": 1047} {"train_loss": -40.0867805480957, "global_step": 126705, "epoch": 1047} {"train_loss": -39.659637451171875, "global_step": 126706, "epoch": 1047} {"train_loss": -39.73164749145508, "global_step": 126707, "epoch": 1047} {"train_loss": -39.378318786621094, "global_step": 126708, "epoch": 1047} {"train_loss": -40.03792953491211, "global_step": 126709, "epoch": 1047} {"train_loss": -37.003910064697266, "global_step": 126710, "epoch": 1047} {"train_loss": -35.21843719482422, "global_step": 126711, "epoch": 1047} {"train_loss": -39.904605865478516, "global_step": 126712, "epoch": 1047} {"train_loss": -39.43558120727539, "global_step": 126713, "epoch": 1047} {"train_loss": -40.142425537109375, "global_step": 126714, "epoch": 1047} {"train_loss": -38.546974182128906, "global_step": 126715, "epoch": 1047} {"train_loss": -39.651546478271484, "global_step": 126716, "epoch": 1047} {"train_loss": -39.71562576293945, "global_step": 126717, "epoch": 1047} {"train_loss": -39.89284133911133, "global_step": 126718, "epoch": 1047} {"train_loss": -40.0769157409668, "global_step": 126719, "epoch": 1047} {"train_loss": -40.08002471923828, "global_step": 126720, "epoch": 1047} {"train_loss": -40.3173828125, "global_step": 126721, "epoch": 1047} {"train_loss": -40.123226165771484, "global_step": 126722, "epoch": 1047} {"train_loss": -38.8390007019043, "global_step": 126723, "epoch": 1047} {"train_loss": -39.40687942504883, "global_step": 126724, "epoch": 1047} {"train_loss": -39.97444152832031, "global_step": 126725, "epoch": 1047} {"train_loss": -39.2226448059082, "global_step": 126726, "epoch": 1047} {"train_loss": -39.176605224609375, "global_step": 126727, "epoch": 1047} {"train_loss": -39.93787384033203, "global_step": 126728, "epoch": 1047} {"train_loss": -40.12512969970703, "global_step": 126729, "epoch": 1047} {"train_loss": -39.9747200012207, "global_step": 126730, "epoch": 1047} {"train_loss": -36.08449935913086, "global_step": 126731, "epoch": 1047} {"train_loss": -39.97866439819336, "global_step": 126732, "epoch": 1047} {"train_loss": -40.01613235473633, "global_step": 126733, "epoch": 1047} {"train_loss": -40.203338623046875, "global_step": 126734, "epoch": 1047} {"train_loss": -39.90617752075195, "global_step": 126735, "epoch": 1047} {"train_loss": -39.890316009521484, "global_step": 126736, "epoch": 1047} {"train_loss": -39.81699752807617, "global_step": 126737, "epoch": 1047} {"train_loss": -37.216224670410156, "global_step": 126738, "epoch": 1047} {"train_loss": -37.519195556640625, "global_step": 126739, "epoch": 1047} {"train_loss": -39.27033615112305, "global_step": 126740, "epoch": 1047} {"train_loss": -39.281124114990234, "global_step": 126741, "epoch": 1047} {"train_loss": -39.90700912475586, "global_step": 126742, "epoch": 1047} {"train_loss": -39.1436882019043, "global_step": 126743, "epoch": 1047} {"train_loss": -39.3616943359375, "global_step": 126744, "epoch": 1047} {"train_loss": -36.88831329345703, "global_step": 126745, "epoch": 1047} {"train_loss": -38.057167053222656, "global_step": 126746, "epoch": 1047} {"train_loss": -37.36481475830078, "global_step": 126747, "epoch": 1047} {"train_loss": -36.080631256103516, "global_step": 126748, "epoch": 1047} {"train_loss": -35.84717559814453, "global_step": 126749, "epoch": 1047} {"train_loss": -37.63441467285156, "global_step": 126750, "epoch": 1047} {"train_loss": -39.46345138549805, "global_step": 126751, "epoch": 1047} {"train_loss": -38.734127044677734, "global_step": 126752, "epoch": 1047} {"train_loss": -37.90132141113281, "global_step": 126753, "epoch": 1047} {"train_loss": -33.47025680541992, "global_step": 126754, "epoch": 1047} {"train_loss": -32.849769592285156, "global_step": 126755, "epoch": 1047} {"train_loss": -37.844173431396484, "global_step": 126756, "epoch": 1047} {"train_loss": -39.229793548583984, "global_step": 126757, "epoch": 1047} {"train_loss": -33.8642692565918, "global_step": 126758, "epoch": 1047} {"train_loss": -37.15390396118164, "global_step": 126759, "epoch": 1047} {"train_loss": -39.52363967895508, "global_step": 126760, "epoch": 1047} {"train_loss": -37.235107421875, "global_step": 126761, "epoch": 1047} {"train_loss": -37.44843292236328, "global_step": 126762, "epoch": 1047} {"train_loss": -39.55660629272461, "global_step": 126763, "epoch": 1047} {"train_loss": -37.77631759643555, "global_step": 126764, "epoch": 1047} {"train_loss": -38.22053146362305, "global_step": 126765, "epoch": 1047} {"train_loss": -38.31425857543945, "global_step": 126766, "epoch": 1047} {"train_loss": -37.847984313964844, "global_step": 126767, "epoch": 1047} {"train_loss": -39.683815002441406, "global_step": 126768, "epoch": 1047} {"train_loss": -38.53028106689453, "global_step": 126769, "epoch": 1047} {"train_loss": -38.97358322143555, "global_step": 126770, "epoch": 1047} {"train_loss": -37.48798370361328, "global_step": 126771, "epoch": 1047} {"train_loss": -39.352088928222656, "global_step": 126772, "epoch": 1047} {"train_loss": -39.05447006225586, "global_step": 126773, "epoch": 1047} {"train_loss": -39.04793930053711, "global_step": 126774, "epoch": 1047} {"train_loss": -37.959835052490234, "global_step": 126775, "epoch": 1047} {"train_loss": -39.15348434448242, "global_step": 126776, "epoch": 1047} {"train_loss": -39.249874114990234, "global_step": 126777, "epoch": 1047} {"train_loss": -39.27450180053711, "global_step": 126778, "epoch": 1047} {"train_loss": -39.13796615600586, "global_step": 126779, "epoch": 1047} {"train_loss": -39.25368881225586, "global_step": 126780, "epoch": 1047} {"train_loss": -39.387081146240234, "global_step": 126781, "epoch": 1047} {"train_loss": -37.4702262878418, "global_step": 126782, "epoch": 1047} {"train_loss": -39.82688522338867, "global_step": 126783, "epoch": 1047} {"train_loss": -39.76051330566406, "global_step": 126784, "epoch": 1047} {"train_loss": -38.522315979003906, "global_step": 126785, "epoch": 1047} {"train_loss": -38.540706634521484, "global_step": 126786, "epoch": 1047} {"train_loss": -38.35398483276367, "global_step": 126787, "epoch": 1047} {"train_loss": -39.52777862548828, "global_step": 126788, "epoch": 1047} {"train_loss": -39.611515045166016, "global_step": 126789, "epoch": 1047} {"train_loss": -38.44558334350586, "global_step": 126790, "epoch": 1047} {"train_loss": -38.13627243041992, "global_step": 126791, "epoch": 1047} {"train_loss": -38.84112548828125, "global_step": 126792, "epoch": 1047} {"train_loss": -37.85858917236328, "global_step": 126793, "epoch": 1047} {"train_loss": -38.871280670166016, "global_step": 126794, "epoch": 1047} {"train_loss": -39.046627044677734, "global_step": 126795, "epoch": 1047} {"train_loss": -35.214141845703125, "global_step": 126796, "epoch": 1047} {"train_loss": -36.750545501708984, "global_step": 126797, "epoch": 1047} {"train_loss": -38.37372970581055, "global_step": 126798, "epoch": 1047} {"train_loss": -38.31838607788086, "global_step": 126799, "epoch": 1047} {"train_loss": -33.99033737182617, "global_step": 126800, "epoch": 1047} {"train_loss": -36.096675872802734, "global_step": 126801, "epoch": 1047} {"train_loss": -38.45013427734375, "global_step": 126802, "epoch": 1047} {"train_loss": -35.269039154052734, "global_step": 126803, "epoch": 1047} {"train_loss": -38.574283599853516, "global_step": 126804, "epoch": 1047} {"train_loss": -37.99673080444336, "global_step": 126805, "epoch": 1047} {"train_loss": -37.791717529296875, "global_step": 126806, "epoch": 1047} {"train_loss": -38.57193734035019, "global_step": 126807, "epoch": 1047, "val_loss": 2971818.25} {"train_loss": -36.42433547973633, "global_step": 126808, "epoch": 1048} {"train_loss": -38.01872634887695, "global_step": 126809, "epoch": 1048} {"train_loss": -37.31697463989258, "global_step": 126810, "epoch": 1048} {"train_loss": -37.78667449951172, "global_step": 126811, "epoch": 1048} {"train_loss": -36.61275100708008, "global_step": 126812, "epoch": 1048} {"train_loss": -37.56645202636719, "global_step": 126813, "epoch": 1048} {"train_loss": -36.98155212402344, "global_step": 126814, "epoch": 1048} {"train_loss": -36.344303131103516, "global_step": 126815, "epoch": 1048} {"train_loss": -37.67178726196289, "global_step": 126816, "epoch": 1048} {"train_loss": -37.65688705444336, "global_step": 126817, "epoch": 1048} {"train_loss": -36.827903747558594, "global_step": 126818, "epoch": 1048} {"train_loss": -37.7608757019043, "global_step": 126819, "epoch": 1048} {"train_loss": -37.38306427001953, "global_step": 126820, "epoch": 1048} {"train_loss": -35.062660217285156, "global_step": 126821, "epoch": 1048} {"train_loss": -35.45282745361328, "global_step": 126822, "epoch": 1048} {"train_loss": -37.1613655090332, "global_step": 126823, "epoch": 1048} {"train_loss": -37.2070198059082, "global_step": 126824, "epoch": 1048} {"train_loss": -38.295345306396484, "global_step": 126825, "epoch": 1048} {"train_loss": -34.26801300048828, "global_step": 126826, "epoch": 1048} {"train_loss": -34.138893127441406, "global_step": 126827, "epoch": 1048} {"train_loss": -36.48356246948242, "global_step": 126828, "epoch": 1048} {"train_loss": -35.78900146484375, "global_step": 126829, "epoch": 1048} {"train_loss": -35.301300048828125, "global_step": 126830, "epoch": 1048} {"train_loss": -36.729888916015625, "global_step": 126831, "epoch": 1048} {"train_loss": -35.928218841552734, "global_step": 126832, "epoch": 1048} {"train_loss": -37.653907775878906, "global_step": 126833, "epoch": 1048} {"train_loss": -36.944053649902344, "global_step": 126834, "epoch": 1048} {"train_loss": -31.024641036987305, "global_step": 126835, "epoch": 1048} {"train_loss": -34.67287063598633, "global_step": 126836, "epoch": 1048} {"train_loss": -37.102577209472656, "global_step": 126837, "epoch": 1048} {"train_loss": -33.66945266723633, "global_step": 126838, "epoch": 1048} {"train_loss": -36.79164505004883, "global_step": 126839, "epoch": 1048} {"train_loss": -36.82391357421875, "global_step": 126840, "epoch": 1048} {"train_loss": -34.98081588745117, "global_step": 126841, "epoch": 1048} {"train_loss": -33.961891174316406, "global_step": 126842, "epoch": 1048} {"train_loss": -35.737876892089844, "global_step": 126843, "epoch": 1048} {"train_loss": -37.0428581237793, "global_step": 126844, "epoch": 1048} {"train_loss": -36.503726959228516, "global_step": 126845, "epoch": 1048} {"train_loss": -36.849815368652344, "global_step": 126846, "epoch": 1048} {"train_loss": -37.21709060668945, "global_step": 126847, "epoch": 1048} {"train_loss": -35.64742660522461, "global_step": 126848, "epoch": 1048} {"train_loss": -35.128902435302734, "global_step": 126849, "epoch": 1048} {"train_loss": -36.54956817626953, "global_step": 126850, "epoch": 1048} {"train_loss": -37.18621063232422, "global_step": 126851, "epoch": 1048} {"train_loss": -37.90102005004883, "global_step": 126852, "epoch": 1048} {"train_loss": -35.36395263671875, "global_step": 126853, "epoch": 1048} {"train_loss": -37.736915588378906, "global_step": 126854, "epoch": 1048} {"train_loss": -37.18426513671875, "global_step": 126855, "epoch": 1048} {"train_loss": -37.24250411987305, "global_step": 126856, "epoch": 1048} {"train_loss": -37.334407806396484, "global_step": 126857, "epoch": 1048} {"train_loss": -38.127254486083984, "global_step": 126858, "epoch": 1048} {"train_loss": -37.27080154418945, "global_step": 126859, "epoch": 1048} {"train_loss": -37.1818962097168, "global_step": 126860, "epoch": 1048} {"train_loss": -37.666866302490234, "global_step": 126861, "epoch": 1048} {"train_loss": -37.425392150878906, "global_step": 126862, "epoch": 1048} {"train_loss": -37.56916809082031, "global_step": 126863, "epoch": 1048} {"train_loss": -37.671607971191406, "global_step": 126864, "epoch": 1048} {"train_loss": -37.902565002441406, "global_step": 126865, "epoch": 1048} {"train_loss": -37.78247833251953, "global_step": 126866, "epoch": 1048} {"train_loss": -38.52436447143555, "global_step": 126867, "epoch": 1048} {"train_loss": -37.420623779296875, "global_step": 126868, "epoch": 1048} {"train_loss": -38.1870002746582, "global_step": 126869, "epoch": 1048} {"train_loss": -38.74970626831055, "global_step": 126870, "epoch": 1048} {"train_loss": -38.43061447143555, "global_step": 126871, "epoch": 1048} {"train_loss": -38.051265716552734, "global_step": 126872, "epoch": 1048} {"train_loss": -38.32461929321289, "global_step": 126873, "epoch": 1048} {"train_loss": -38.871131896972656, "global_step": 126874, "epoch": 1048} {"train_loss": -38.342281341552734, "global_step": 126875, "epoch": 1048} {"train_loss": -38.17921447753906, "global_step": 126876, "epoch": 1048} {"train_loss": -38.88372802734375, "global_step": 126877, "epoch": 1048} {"train_loss": -38.34537887573242, "global_step": 126878, "epoch": 1048} {"train_loss": -38.65745162963867, "global_step": 126879, "epoch": 1048} {"train_loss": -38.83964920043945, "global_step": 126880, "epoch": 1048} {"train_loss": -38.5762939453125, "global_step": 126881, "epoch": 1048} {"train_loss": -38.45156478881836, "global_step": 126882, "epoch": 1048} {"train_loss": -38.96744155883789, "global_step": 126883, "epoch": 1048} {"train_loss": -39.062416076660156, "global_step": 126884, "epoch": 1048} {"train_loss": -38.00602722167969, "global_step": 126885, "epoch": 1048} {"train_loss": -39.06877517700195, "global_step": 126886, "epoch": 1048} {"train_loss": -39.10078048706055, "global_step": 126887, "epoch": 1048} {"train_loss": -38.922481536865234, "global_step": 126888, "epoch": 1048} {"train_loss": -39.28499984741211, "global_step": 126889, "epoch": 1048} {"train_loss": -39.299869537353516, "global_step": 126890, "epoch": 1048} {"train_loss": -38.89756774902344, "global_step": 126891, "epoch": 1048} {"train_loss": -38.809139251708984, "global_step": 126892, "epoch": 1048} {"train_loss": -39.43196487426758, "global_step": 126893, "epoch": 1048} {"train_loss": -39.191734313964844, "global_step": 126894, "epoch": 1048} {"train_loss": -38.56892776489258, "global_step": 126895, "epoch": 1048} {"train_loss": -39.32847213745117, "global_step": 126896, "epoch": 1048} {"train_loss": -39.4311637878418, "global_step": 126897, "epoch": 1048} {"train_loss": -39.491329193115234, "global_step": 126898, "epoch": 1048} {"train_loss": -38.44936752319336, "global_step": 126899, "epoch": 1048} {"train_loss": -38.965309143066406, "global_step": 126900, "epoch": 1048} {"train_loss": -38.714263916015625, "global_step": 126901, "epoch": 1048} {"train_loss": -39.342262268066406, "global_step": 126902, "epoch": 1048} {"train_loss": -39.60536575317383, "global_step": 126903, "epoch": 1048} {"train_loss": -38.72068405151367, "global_step": 126904, "epoch": 1048} {"train_loss": -39.5399284362793, "global_step": 126905, "epoch": 1048} {"train_loss": -39.6456298828125, "global_step": 126906, "epoch": 1048} {"train_loss": -39.624813079833984, "global_step": 126907, "epoch": 1048} {"train_loss": -39.812557220458984, "global_step": 126908, "epoch": 1048} {"train_loss": -39.292701721191406, "global_step": 126909, "epoch": 1048} {"train_loss": -39.48473358154297, "global_step": 126910, "epoch": 1048} {"train_loss": -39.853759765625, "global_step": 126911, "epoch": 1048} {"train_loss": -39.652549743652344, "global_step": 126912, "epoch": 1048} {"train_loss": -40.01545333862305, "global_step": 126913, "epoch": 1048} {"train_loss": -39.6030387878418, "global_step": 126914, "epoch": 1048} {"train_loss": -39.9642219543457, "global_step": 126915, "epoch": 1048} {"train_loss": -39.69730758666992, "global_step": 126916, "epoch": 1048} {"train_loss": -40.2097053527832, "global_step": 126917, "epoch": 1048} {"train_loss": -39.8663444519043, "global_step": 126918, "epoch": 1048} {"train_loss": -39.58882522583008, "global_step": 126919, "epoch": 1048} {"train_loss": -38.84194564819336, "global_step": 126920, "epoch": 1048} {"train_loss": -39.87971496582031, "global_step": 126921, "epoch": 1048} {"train_loss": -39.88570022583008, "global_step": 126922, "epoch": 1048} {"train_loss": -39.98173141479492, "global_step": 126923, "epoch": 1048} {"train_loss": -38.953468322753906, "global_step": 126924, "epoch": 1048} {"train_loss": -39.46284866333008, "global_step": 126925, "epoch": 1048} {"train_loss": -39.656822204589844, "global_step": 126926, "epoch": 1048} {"train_loss": -39.79545974731445, "global_step": 126927, "epoch": 1048} {"train_loss": -37.88262010999947, "global_step": 126928, "epoch": 1048, "val_loss": 2743383.25} {"train_loss": -39.97150421142578, "global_step": 126929, "epoch": 1049} {"train_loss": -38.83368682861328, "global_step": 126930, "epoch": 1049} {"train_loss": -38.80350875854492, "global_step": 126931, "epoch": 1049} {"train_loss": -38.97843551635742, "global_step": 126932, "epoch": 1049} {"train_loss": -40.34214401245117, "global_step": 126933, "epoch": 1049} {"train_loss": -39.26026153564453, "global_step": 126934, "epoch": 1049} {"train_loss": -37.62117385864258, "global_step": 126935, "epoch": 1049} {"train_loss": -38.469051361083984, "global_step": 126936, "epoch": 1049} {"train_loss": -37.936256408691406, "global_step": 126937, "epoch": 1049} {"train_loss": -39.51837921142578, "global_step": 126938, "epoch": 1049} {"train_loss": -39.160640716552734, "global_step": 126939, "epoch": 1049} {"train_loss": -40.13400650024414, "global_step": 126940, "epoch": 1049} {"train_loss": -39.50178527832031, "global_step": 126941, "epoch": 1049} {"train_loss": -37.55256271362305, "global_step": 126942, "epoch": 1049} {"train_loss": -40.09554672241211, "global_step": 126943, "epoch": 1049} {"train_loss": -40.0581169128418, "global_step": 126944, "epoch": 1049} {"train_loss": -39.6872444152832, "global_step": 126945, "epoch": 1049} {"train_loss": -38.567420959472656, "global_step": 126946, "epoch": 1049} {"train_loss": -38.796852111816406, "global_step": 126947, "epoch": 1049} {"train_loss": -39.49969482421875, "global_step": 126948, "epoch": 1049} {"train_loss": -39.743717193603516, "global_step": 126949, "epoch": 1049} {"train_loss": -39.727882385253906, "global_step": 126950, "epoch": 1049} {"train_loss": -39.48044967651367, "global_step": 126951, "epoch": 1049} {"train_loss": -39.89703369140625, "global_step": 126952, "epoch": 1049} {"train_loss": -40.0072021484375, "global_step": 126953, "epoch": 1049} {"train_loss": -39.526092529296875, "global_step": 126954, "epoch": 1049} {"train_loss": -38.85139083862305, "global_step": 126955, "epoch": 1049} {"train_loss": -37.4707145690918, "global_step": 126956, "epoch": 1049} {"train_loss": -36.342369079589844, "global_step": 126957, "epoch": 1049} {"train_loss": -36.09484100341797, "global_step": 126958, "epoch": 1049} {"train_loss": -36.6632080078125, "global_step": 126959, "epoch": 1049} {"train_loss": -35.899009704589844, "global_step": 126960, "epoch": 1049} {"train_loss": -37.91030502319336, "global_step": 126961, "epoch": 1049} {"train_loss": -37.60304641723633, "global_step": 126962, "epoch": 1049} {"train_loss": -39.602813720703125, "global_step": 126963, "epoch": 1049} {"train_loss": -36.9285774230957, "global_step": 126964, "epoch": 1049} {"train_loss": -38.58150863647461, "global_step": 126965, "epoch": 1049} {"train_loss": -39.25962829589844, "global_step": 126966, "epoch": 1049} {"train_loss": -37.54724884033203, "global_step": 126967, "epoch": 1049} {"train_loss": -39.003353118896484, "global_step": 126968, "epoch": 1049} {"train_loss": -38.85708236694336, "global_step": 126969, "epoch": 1049} {"train_loss": -39.83181381225586, "global_step": 126970, "epoch": 1049} {"train_loss": -37.94694900512695, "global_step": 126971, "epoch": 1049} {"train_loss": -39.164031982421875, "global_step": 126972, "epoch": 1049} {"train_loss": -39.657142639160156, "global_step": 126973, "epoch": 1049} {"train_loss": -38.95964431762695, "global_step": 126974, "epoch": 1049} {"train_loss": -37.61066818237305, "global_step": 126975, "epoch": 1049} {"train_loss": -38.126834869384766, "global_step": 126976, "epoch": 1049} {"train_loss": -38.739654541015625, "global_step": 126977, "epoch": 1049} {"train_loss": -38.287845611572266, "global_step": 126978, "epoch": 1049} {"train_loss": -37.15867614746094, "global_step": 126979, "epoch": 1049} {"train_loss": -38.63006591796875, "global_step": 126980, "epoch": 1049} {"train_loss": -38.65281295776367, "global_step": 126981, "epoch": 1049} {"train_loss": -39.2086296081543, "global_step": 126982, "epoch": 1049} {"train_loss": -39.16021728515625, "global_step": 126983, "epoch": 1049} {"train_loss": -38.7645149230957, "global_step": 126984, "epoch": 1049} {"train_loss": -39.01506805419922, "global_step": 126985, "epoch": 1049} {"train_loss": -38.27406692504883, "global_step": 126986, "epoch": 1049} {"train_loss": -38.38271713256836, "global_step": 126987, "epoch": 1049} {"train_loss": -38.492889404296875, "global_step": 126988, "epoch": 1049} {"train_loss": -39.13100051879883, "global_step": 126989, "epoch": 1049} {"train_loss": -39.72013473510742, "global_step": 126990, "epoch": 1049} {"train_loss": -38.356048583984375, "global_step": 126991, "epoch": 1049} {"train_loss": -39.82528305053711, "global_step": 126992, "epoch": 1049} {"train_loss": -39.34006881713867, "global_step": 126993, "epoch": 1049} {"train_loss": -39.31634521484375, "global_step": 126994, "epoch": 1049} {"train_loss": -39.341522216796875, "global_step": 126995, "epoch": 1049} {"train_loss": -38.6493034362793, "global_step": 126996, "epoch": 1049} {"train_loss": -37.117431640625, "global_step": 126997, "epoch": 1049} {"train_loss": -37.25224685668945, "global_step": 126998, "epoch": 1049} {"train_loss": -39.37425231933594, "global_step": 126999, "epoch": 1049} {"train_loss": -39.95967483520508, "global_step": 127000, "epoch": 1049} {"train_loss": -39.29389572143555, "global_step": 127001, "epoch": 1049} {"train_loss": -38.29938888549805, "global_step": 127002, "epoch": 1049} {"train_loss": -39.472747802734375, "global_step": 127003, "epoch": 1049} {"train_loss": -39.39613723754883, "global_step": 127004, "epoch": 1049} {"train_loss": -39.647274017333984, "global_step": 127005, "epoch": 1049} {"train_loss": -38.2539176940918, "global_step": 127006, "epoch": 1049} {"train_loss": -38.40071487426758, "global_step": 127007, "epoch": 1049} {"train_loss": -40.172550201416016, "global_step": 127008, "epoch": 1049} {"train_loss": -39.20479965209961, "global_step": 127009, "epoch": 1049} {"train_loss": -39.02144241333008, "global_step": 127010, "epoch": 1049} {"train_loss": -38.40623092651367, "global_step": 127011, "epoch": 1049} {"train_loss": -40.16948318481445, "global_step": 127012, "epoch": 1049} {"train_loss": -39.68154525756836, "global_step": 127013, "epoch": 1049} {"train_loss": -39.373165130615234, "global_step": 127014, "epoch": 1049} {"train_loss": -39.84135055541992, "global_step": 127015, "epoch": 1049} {"train_loss": -40.19731521606445, "global_step": 127016, "epoch": 1049} {"train_loss": -39.36067581176758, "global_step": 127017, "epoch": 1049} {"train_loss": -39.9509162902832, "global_step": 127018, "epoch": 1049} {"train_loss": -38.63120651245117, "global_step": 127019, "epoch": 1049} {"train_loss": -38.67698287963867, "global_step": 127020, "epoch": 1049} {"train_loss": -40.1612434387207, "global_step": 127021, "epoch": 1049} {"train_loss": -39.721614837646484, "global_step": 127022, "epoch": 1049} {"train_loss": -39.29041290283203, "global_step": 127023, "epoch": 1049} {"train_loss": -40.4215087890625, "global_step": 127024, "epoch": 1049} {"train_loss": -39.29659652709961, "global_step": 127025, "epoch": 1049} {"train_loss": -39.54029846191406, "global_step": 127026, "epoch": 1049} {"train_loss": -39.704437255859375, "global_step": 127027, "epoch": 1049} {"train_loss": -39.60406494140625, "global_step": 127028, "epoch": 1049} {"train_loss": -40.10654067993164, "global_step": 127029, "epoch": 1049} {"train_loss": -38.97943878173828, "global_step": 127030, "epoch": 1049} {"train_loss": -39.73075485229492, "global_step": 127031, "epoch": 1049} {"train_loss": -39.652320861816406, "global_step": 127032, "epoch": 1049} {"train_loss": -40.6719856262207, "global_step": 127033, "epoch": 1049} {"train_loss": -39.53557205200195, "global_step": 127034, "epoch": 1049} {"train_loss": -40.53238296508789, "global_step": 127035, "epoch": 1049} {"train_loss": -40.365718841552734, "global_step": 127036, "epoch": 1049} {"train_loss": -39.86085891723633, "global_step": 127037, "epoch": 1049} {"train_loss": -39.6634635925293, "global_step": 127038, "epoch": 1049} {"train_loss": -39.22419357299805, "global_step": 127039, "epoch": 1049} {"train_loss": -40.161293029785156, "global_step": 127040, "epoch": 1049} {"train_loss": -40.23804473876953, "global_step": 127041, "epoch": 1049} {"train_loss": -39.39310836791992, "global_step": 127042, "epoch": 1049} {"train_loss": -39.58399200439453, "global_step": 127043, "epoch": 1049} {"train_loss": -39.747859954833984, "global_step": 127044, "epoch": 1049} {"train_loss": -38.90624237060547, "global_step": 127045, "epoch": 1049} {"train_loss": -40.27625274658203, "global_step": 127046, "epoch": 1049} {"train_loss": -39.64654541015625, "global_step": 127047, "epoch": 1049} {"train_loss": -39.32102966308594, "global_step": 127048, "epoch": 1049} {"train_loss": -39.07503550505835, "global_step": 127049, "epoch": 1049, "val_loss": 2761383.25} {"train_loss": -38.77297592163086, "global_step": 127050, "epoch": 1050} {"train_loss": -39.033935546875, "global_step": 127051, "epoch": 1050} {"train_loss": -40.27893829345703, "global_step": 127052, "epoch": 1050} {"train_loss": -39.0367546081543, "global_step": 127053, "epoch": 1050} {"train_loss": -38.230552673339844, "global_step": 127054, "epoch": 1050} {"train_loss": -39.53596878051758, "global_step": 127055, "epoch": 1050} {"train_loss": -40.06898880004883, "global_step": 127056, "epoch": 1050} {"train_loss": -38.90277862548828, "global_step": 127057, "epoch": 1050} {"train_loss": -39.6328010559082, "global_step": 127058, "epoch": 1050} {"train_loss": -39.700618743896484, "global_step": 127059, "epoch": 1050} {"train_loss": -39.289154052734375, "global_step": 127060, "epoch": 1050} {"train_loss": -38.74795150756836, "global_step": 127061, "epoch": 1050} {"train_loss": -37.68349838256836, "global_step": 127062, "epoch": 1050} {"train_loss": -38.39984130859375, "global_step": 127063, "epoch": 1050} {"train_loss": -39.0212516784668, "global_step": 127064, "epoch": 1050} {"train_loss": -37.61738204956055, "global_step": 127065, "epoch": 1050} {"train_loss": -37.46047592163086, "global_step": 127066, "epoch": 1050} {"train_loss": -35.77809524536133, "global_step": 127067, "epoch": 1050} {"train_loss": -33.0238037109375, "global_step": 127068, "epoch": 1050} {"train_loss": -28.6445255279541, "global_step": 127069, "epoch": 1050} {"train_loss": -30.657690048217773, "global_step": 127070, "epoch": 1050} {"train_loss": -34.378231048583984, "global_step": 127071, "epoch": 1050} {"train_loss": -38.94318389892578, "global_step": 127072, "epoch": 1050} {"train_loss": -35.002357482910156, "global_step": 127073, "epoch": 1050} {"train_loss": -37.54903793334961, "global_step": 127074, "epoch": 1050} {"train_loss": -36.786949157714844, "global_step": 127075, "epoch": 1050} {"train_loss": -36.79274368286133, "global_step": 127076, "epoch": 1050} {"train_loss": -39.03278732299805, "global_step": 127077, "epoch": 1050} {"train_loss": -38.208717346191406, "global_step": 127078, "epoch": 1050} {"train_loss": -39.40190124511719, "global_step": 127079, "epoch": 1050} {"train_loss": -39.009395599365234, "global_step": 127080, "epoch": 1050} {"train_loss": -37.81826400756836, "global_step": 127081, "epoch": 1050} {"train_loss": -38.03498458862305, "global_step": 127082, "epoch": 1050} {"train_loss": -36.914947509765625, "global_step": 127083, "epoch": 1050} {"train_loss": -38.846004486083984, "global_step": 127084, "epoch": 1050} {"train_loss": -37.7707405090332, "global_step": 127085, "epoch": 1050} {"train_loss": -38.74143600463867, "global_step": 127086, "epoch": 1050} {"train_loss": -38.2880859375, "global_step": 127087, "epoch": 1050} {"train_loss": -39.427860260009766, "global_step": 127088, "epoch": 1050} {"train_loss": -38.6826286315918, "global_step": 127089, "epoch": 1050} {"train_loss": -38.63433074951172, "global_step": 127090, "epoch": 1050} {"train_loss": -38.62345886230469, "global_step": 127091, "epoch": 1050} {"train_loss": -39.58372116088867, "global_step": 127092, "epoch": 1050} {"train_loss": -38.00406265258789, "global_step": 127093, "epoch": 1050} {"train_loss": -38.94611358642578, "global_step": 127094, "epoch": 1050} {"train_loss": -38.60063934326172, "global_step": 127095, "epoch": 1050} {"train_loss": -39.698204040527344, "global_step": 127096, "epoch": 1050} {"train_loss": -39.327735900878906, "global_step": 127097, "epoch": 1050} {"train_loss": -38.731380462646484, "global_step": 127098, "epoch": 1050} {"train_loss": -38.59432601928711, "global_step": 127099, "epoch": 1050} {"train_loss": -39.400569915771484, "global_step": 127100, "epoch": 1050} {"train_loss": -38.82098388671875, "global_step": 127101, "epoch": 1050} {"train_loss": -39.042701721191406, "global_step": 127102, "epoch": 1050} {"train_loss": -37.272735595703125, "global_step": 127103, "epoch": 1050} {"train_loss": -37.49688720703125, "global_step": 127104, "epoch": 1050} {"train_loss": -37.991207122802734, "global_step": 127105, "epoch": 1050} {"train_loss": -39.23714065551758, "global_step": 127106, "epoch": 1050} {"train_loss": -38.336578369140625, "global_step": 127107, "epoch": 1050} {"train_loss": -38.99473190307617, "global_step": 127108, "epoch": 1050} {"train_loss": -38.26284408569336, "global_step": 127109, "epoch": 1050} {"train_loss": -38.1969108581543, "global_step": 127110, "epoch": 1050} {"train_loss": -39.04449462890625, "global_step": 127111, "epoch": 1050} {"train_loss": -39.12458038330078, "global_step": 127112, "epoch": 1050} {"train_loss": -39.361141204833984, "global_step": 127113, "epoch": 1050} {"train_loss": -38.824188232421875, "global_step": 127114, "epoch": 1050} {"train_loss": -38.55965805053711, "global_step": 127115, "epoch": 1050} {"train_loss": -37.29193115234375, "global_step": 127116, "epoch": 1050} {"train_loss": -39.381072998046875, "global_step": 127117, "epoch": 1050} {"train_loss": -38.76469802856445, "global_step": 127118, "epoch": 1050} {"train_loss": -39.28790283203125, "global_step": 127119, "epoch": 1050} {"train_loss": -39.01612854003906, "global_step": 127120, "epoch": 1050} {"train_loss": -38.93788528442383, "global_step": 127121, "epoch": 1050} {"train_loss": -39.77573776245117, "global_step": 127122, "epoch": 1050} {"train_loss": -38.50088119506836, "global_step": 127123, "epoch": 1050} {"train_loss": -39.321502685546875, "global_step": 127124, "epoch": 1050} {"train_loss": -38.7677001953125, "global_step": 127125, "epoch": 1050} {"train_loss": -38.744747161865234, "global_step": 127126, "epoch": 1050} {"train_loss": -39.1418571472168, "global_step": 127127, "epoch": 1050} {"train_loss": -38.634456634521484, "global_step": 127128, "epoch": 1050} {"train_loss": -38.83059310913086, "global_step": 127129, "epoch": 1050} {"train_loss": -38.61808395385742, "global_step": 127130, "epoch": 1050} {"train_loss": -39.331459045410156, "global_step": 127131, "epoch": 1050} {"train_loss": -38.41700744628906, "global_step": 127132, "epoch": 1050} {"train_loss": -38.89677047729492, "global_step": 127133, "epoch": 1050} {"train_loss": -38.54438400268555, "global_step": 127134, "epoch": 1050} {"train_loss": -38.74015426635742, "global_step": 127135, "epoch": 1050} {"train_loss": -39.81700134277344, "global_step": 127136, "epoch": 1050} {"train_loss": -39.577125549316406, "global_step": 127137, "epoch": 1050} {"train_loss": -39.57756805419922, "global_step": 127138, "epoch": 1050} {"train_loss": -38.78867721557617, "global_step": 127139, "epoch": 1050} {"train_loss": -39.98746871948242, "global_step": 127140, "epoch": 1050} {"train_loss": -39.6107177734375, "global_step": 127141, "epoch": 1050} {"train_loss": -39.145294189453125, "global_step": 127142, "epoch": 1050} {"train_loss": -38.588897705078125, "global_step": 127143, "epoch": 1050} {"train_loss": -37.978187561035156, "global_step": 127144, "epoch": 1050} {"train_loss": -38.64078903198242, "global_step": 127145, "epoch": 1050} {"train_loss": -38.862979888916016, "global_step": 127146, "epoch": 1050} {"train_loss": -38.357513427734375, "global_step": 127147, "epoch": 1050} {"train_loss": -36.06672286987305, "global_step": 127148, "epoch": 1050} {"train_loss": -37.096588134765625, "global_step": 127149, "epoch": 1050} {"train_loss": -39.1187629699707, "global_step": 127150, "epoch": 1050} {"train_loss": -36.55979537963867, "global_step": 127151, "epoch": 1050} {"train_loss": -39.118751525878906, "global_step": 127152, "epoch": 1050} {"train_loss": -38.55261993408203, "global_step": 127153, "epoch": 1050} {"train_loss": -36.24062728881836, "global_step": 127154, "epoch": 1050} {"train_loss": -39.12493133544922, "global_step": 127155, "epoch": 1050} {"train_loss": -38.60752487182617, "global_step": 127156, "epoch": 1050} {"train_loss": -33.93522262573242, "global_step": 127157, "epoch": 1050} {"train_loss": -39.09994125366211, "global_step": 127158, "epoch": 1050} {"train_loss": -38.85184860229492, "global_step": 127159, "epoch": 1050} {"train_loss": -39.17440414428711, "global_step": 127160, "epoch": 1050} {"train_loss": -38.84502410888672, "global_step": 127161, "epoch": 1050} {"train_loss": -38.17190170288086, "global_step": 127162, "epoch": 1050} {"train_loss": -37.893489837646484, "global_step": 127163, "epoch": 1050} {"train_loss": -38.186397552490234, "global_step": 127164, "epoch": 1050} {"train_loss": -39.16285705566406, "global_step": 127165, "epoch": 1050} {"train_loss": -39.51789474487305, "global_step": 127166, "epoch": 1050} {"train_loss": -39.40349197387695, "global_step": 127167, "epoch": 1050} {"train_loss": -39.3797721862793, "global_step": 127168, "epoch": 1050} {"train_loss": -37.10186767578125, "global_step": 127169, "epoch": 1050} {"train_loss": -38.347830181279456, "global_step": 127170, "epoch": 1050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2761184.75} {"train_loss": -39.20751953125, "global_step": 127171, "epoch": 1051} {"train_loss": -39.014137268066406, "global_step": 127172, "epoch": 1051} {"train_loss": -39.54513931274414, "global_step": 127173, "epoch": 1051} {"train_loss": -38.94987106323242, "global_step": 127174, "epoch": 1051} {"train_loss": -39.70842361450195, "global_step": 127175, "epoch": 1051} {"train_loss": -39.28824996948242, "global_step": 127176, "epoch": 1051} {"train_loss": -39.44464111328125, "global_step": 127177, "epoch": 1051} {"train_loss": -39.56666946411133, "global_step": 127178, "epoch": 1051} {"train_loss": -39.56549835205078, "global_step": 127179, "epoch": 1051} {"train_loss": -39.66140365600586, "global_step": 127180, "epoch": 1051} {"train_loss": -39.24300765991211, "global_step": 127181, "epoch": 1051} {"train_loss": -39.528839111328125, "global_step": 127182, "epoch": 1051} {"train_loss": -39.96318435668945, "global_step": 127183, "epoch": 1051} {"train_loss": -39.417457580566406, "global_step": 127184, "epoch": 1051} {"train_loss": -38.98454666137695, "global_step": 127185, "epoch": 1051} {"train_loss": -39.75631332397461, "global_step": 127186, "epoch": 1051} {"train_loss": -39.898555755615234, "global_step": 127187, "epoch": 1051} {"train_loss": -40.1646842956543, "global_step": 127188, "epoch": 1051} {"train_loss": -38.81234359741211, "global_step": 127189, "epoch": 1051} {"train_loss": -39.53443908691406, "global_step": 127190, "epoch": 1051} {"train_loss": -39.32277297973633, "global_step": 127191, "epoch": 1051} {"train_loss": -40.27386474609375, "global_step": 127192, "epoch": 1051} {"train_loss": -40.3065299987793, "global_step": 127193, "epoch": 1051} {"train_loss": -39.69478988647461, "global_step": 127194, "epoch": 1051} {"train_loss": -39.87417221069336, "global_step": 127195, "epoch": 1051} {"train_loss": -39.77390670776367, "global_step": 127196, "epoch": 1051} {"train_loss": -39.750038146972656, "global_step": 127197, "epoch": 1051} {"train_loss": -39.924556732177734, "global_step": 127198, "epoch": 1051} {"train_loss": -39.05337905883789, "global_step": 127199, "epoch": 1051} {"train_loss": -39.699310302734375, "global_step": 127200, "epoch": 1051} {"train_loss": -39.100833892822266, "global_step": 127201, "epoch": 1051} {"train_loss": -39.471981048583984, "global_step": 127202, "epoch": 1051} {"train_loss": -38.26266860961914, "global_step": 127203, "epoch": 1051} {"train_loss": -39.955116271972656, "global_step": 127204, "epoch": 1051} {"train_loss": -38.064754486083984, "global_step": 127205, "epoch": 1051} {"train_loss": -34.520835876464844, "global_step": 127206, "epoch": 1051} {"train_loss": -30.065397262573242, "global_step": 127207, "epoch": 1051} {"train_loss": -31.12520408630371, "global_step": 127208, "epoch": 1051} {"train_loss": -28.5749568939209, "global_step": 127209, "epoch": 1051} {"train_loss": -35.76050567626953, "global_step": 127210, "epoch": 1051} {"train_loss": -38.13200759887695, "global_step": 127211, "epoch": 1051} {"train_loss": -37.72763442993164, "global_step": 127212, "epoch": 1051} {"train_loss": -34.98520278930664, "global_step": 127213, "epoch": 1051} {"train_loss": -39.459022521972656, "global_step": 127214, "epoch": 1051} {"train_loss": -37.85303497314453, "global_step": 127215, "epoch": 1051} {"train_loss": -38.12420654296875, "global_step": 127216, "epoch": 1051} {"train_loss": -38.53834915161133, "global_step": 127217, "epoch": 1051} {"train_loss": -38.70701217651367, "global_step": 127218, "epoch": 1051} {"train_loss": -38.68607711791992, "global_step": 127219, "epoch": 1051} {"train_loss": -38.61078643798828, "global_step": 127220, "epoch": 1051} {"train_loss": -38.83441162109375, "global_step": 127221, "epoch": 1051} {"train_loss": -38.42280197143555, "global_step": 127222, "epoch": 1051} {"train_loss": -38.3892822265625, "global_step": 127223, "epoch": 1051} {"train_loss": -38.12644577026367, "global_step": 127224, "epoch": 1051} {"train_loss": -39.411903381347656, "global_step": 127225, "epoch": 1051} {"train_loss": -38.25065231323242, "global_step": 127226, "epoch": 1051} {"train_loss": -39.413211822509766, "global_step": 127227, "epoch": 1051} {"train_loss": -38.998046875, "global_step": 127228, "epoch": 1051} {"train_loss": -39.721527099609375, "global_step": 127229, "epoch": 1051} {"train_loss": -36.98988723754883, "global_step": 127230, "epoch": 1051} {"train_loss": -36.738136291503906, "global_step": 127231, "epoch": 1051} {"train_loss": -39.18207550048828, "global_step": 127232, "epoch": 1051} {"train_loss": -39.5463981628418, "global_step": 127233, "epoch": 1051} {"train_loss": -36.054710388183594, "global_step": 127234, "epoch": 1051} {"train_loss": -39.583839416503906, "global_step": 127235, "epoch": 1051} {"train_loss": -37.8647575378418, "global_step": 127236, "epoch": 1051} {"train_loss": -38.792694091796875, "global_step": 127237, "epoch": 1051} {"train_loss": -38.708919525146484, "global_step": 127238, "epoch": 1051} {"train_loss": -37.319976806640625, "global_step": 127239, "epoch": 1051} {"train_loss": -39.80704116821289, "global_step": 127240, "epoch": 1051} {"train_loss": -39.15242385864258, "global_step": 127241, "epoch": 1051} {"train_loss": -40.14923858642578, "global_step": 127242, "epoch": 1051} {"train_loss": -36.9884147644043, "global_step": 127243, "epoch": 1051} {"train_loss": -38.18186950683594, "global_step": 127244, "epoch": 1051} {"train_loss": -39.34196090698242, "global_step": 127245, "epoch": 1051} {"train_loss": -38.637447357177734, "global_step": 127246, "epoch": 1051} {"train_loss": -39.3792610168457, "global_step": 127247, "epoch": 1051} {"train_loss": -39.52714920043945, "global_step": 127248, "epoch": 1051} {"train_loss": -38.81265640258789, "global_step": 127249, "epoch": 1051} {"train_loss": -38.80600357055664, "global_step": 127250, "epoch": 1051} {"train_loss": -39.25228500366211, "global_step": 127251, "epoch": 1051} {"train_loss": -39.29990768432617, "global_step": 127252, "epoch": 1051} {"train_loss": -39.444557189941406, "global_step": 127253, "epoch": 1051} {"train_loss": -40.0393180847168, "global_step": 127254, "epoch": 1051} {"train_loss": -39.557281494140625, "global_step": 127255, "epoch": 1051} {"train_loss": -37.99846649169922, "global_step": 127256, "epoch": 1051} {"train_loss": -37.989688873291016, "global_step": 127257, "epoch": 1051} {"train_loss": -38.2003288269043, "global_step": 127258, "epoch": 1051} {"train_loss": -39.505653381347656, "global_step": 127259, "epoch": 1051} {"train_loss": -39.939449310302734, "global_step": 127260, "epoch": 1051} {"train_loss": -39.1451416015625, "global_step": 127261, "epoch": 1051} {"train_loss": -39.4295768737793, "global_step": 127262, "epoch": 1051} {"train_loss": -39.74884796142578, "global_step": 127263, "epoch": 1051} {"train_loss": -37.68661117553711, "global_step": 127264, "epoch": 1051} {"train_loss": -39.64997482299805, "global_step": 127265, "epoch": 1051} {"train_loss": -39.80397415161133, "global_step": 127266, "epoch": 1051} {"train_loss": -38.93868637084961, "global_step": 127267, "epoch": 1051} {"train_loss": -39.818660736083984, "global_step": 127268, "epoch": 1051} {"train_loss": -39.550514221191406, "global_step": 127269, "epoch": 1051} {"train_loss": -40.156837463378906, "global_step": 127270, "epoch": 1051} {"train_loss": -39.334571838378906, "global_step": 127271, "epoch": 1051} {"train_loss": -40.078529357910156, "global_step": 127272, "epoch": 1051} {"train_loss": -40.12592697143555, "global_step": 127273, "epoch": 1051} {"train_loss": -39.79905319213867, "global_step": 127274, "epoch": 1051} {"train_loss": -39.8497314453125, "global_step": 127275, "epoch": 1051} {"train_loss": -39.1448974609375, "global_step": 127276, "epoch": 1051} {"train_loss": -39.81039047241211, "global_step": 127277, "epoch": 1051} {"train_loss": -39.892242431640625, "global_step": 127278, "epoch": 1051} {"train_loss": -39.247371673583984, "global_step": 127279, "epoch": 1051} {"train_loss": -39.95720291137695, "global_step": 127280, "epoch": 1051} {"train_loss": -40.054443359375, "global_step": 127281, "epoch": 1051} {"train_loss": -39.6480827331543, "global_step": 127282, "epoch": 1051} {"train_loss": -39.83938217163086, "global_step": 127283, "epoch": 1051} {"train_loss": -39.67424392700195, "global_step": 127284, "epoch": 1051} {"train_loss": -39.795631408691406, "global_step": 127285, "epoch": 1051} {"train_loss": -40.06681442260742, "global_step": 127286, "epoch": 1051} {"train_loss": -39.98764419555664, "global_step": 127287, "epoch": 1051} {"train_loss": -38.973697662353516, "global_step": 127288, "epoch": 1051} {"train_loss": -40.47591018676758, "global_step": 127289, "epoch": 1051} {"train_loss": -40.13206100463867, "global_step": 127290, "epoch": 1051} {"train_loss": -38.8709630256842, "global_step": 127291, "epoch": 1051, "val_loss": 2655226.0} {"train_loss": -39.59302520751953, "global_step": 127292, "epoch": 1052} {"train_loss": -39.82505798339844, "global_step": 127293, "epoch": 1052} {"train_loss": -40.189815521240234, "global_step": 127294, "epoch": 1052} {"train_loss": -40.2665901184082, "global_step": 127295, "epoch": 1052} {"train_loss": -39.19010925292969, "global_step": 127296, "epoch": 1052} {"train_loss": -39.92220687866211, "global_step": 127297, "epoch": 1052} {"train_loss": -39.41019058227539, "global_step": 127298, "epoch": 1052} {"train_loss": -39.96857452392578, "global_step": 127299, "epoch": 1052} {"train_loss": -40.1290397644043, "global_step": 127300, "epoch": 1052} {"train_loss": -38.74925994873047, "global_step": 127301, "epoch": 1052} {"train_loss": -34.80082321166992, "global_step": 127302, "epoch": 1052} {"train_loss": -36.03910446166992, "global_step": 127303, "epoch": 1052} {"train_loss": -38.287288665771484, "global_step": 127304, "epoch": 1052} {"train_loss": -36.803768157958984, "global_step": 127305, "epoch": 1052} {"train_loss": -30.194257736206055, "global_step": 127306, "epoch": 1052} {"train_loss": -37.51844024658203, "global_step": 127307, "epoch": 1052} {"train_loss": -38.48981857299805, "global_step": 127308, "epoch": 1052} {"train_loss": -33.47884750366211, "global_step": 127309, "epoch": 1052} {"train_loss": -36.11311721801758, "global_step": 127310, "epoch": 1052} {"train_loss": -33.70108413696289, "global_step": 127311, "epoch": 1052} {"train_loss": -35.32151794433594, "global_step": 127312, "epoch": 1052} {"train_loss": -31.30133056640625, "global_step": 127313, "epoch": 1052} {"train_loss": -28.888620376586914, "global_step": 127314, "epoch": 1052} {"train_loss": -38.13618087768555, "global_step": 127315, "epoch": 1052} {"train_loss": -35.0557746887207, "global_step": 127316, "epoch": 1052} {"train_loss": -28.415067672729492, "global_step": 127317, "epoch": 1052} {"train_loss": -29.256275177001953, "global_step": 127318, "epoch": 1052} {"train_loss": -27.8814640045166, "global_step": 127319, "epoch": 1052} {"train_loss": -34.6563606262207, "global_step": 127320, "epoch": 1052} {"train_loss": -33.99802017211914, "global_step": 127321, "epoch": 1052} {"train_loss": -36.537696838378906, "global_step": 127322, "epoch": 1052} {"train_loss": -34.179710388183594, "global_step": 127323, "epoch": 1052} {"train_loss": -33.71699142456055, "global_step": 127324, "epoch": 1052} {"train_loss": -32.97109603881836, "global_step": 127325, "epoch": 1052} {"train_loss": -34.307865142822266, "global_step": 127326, "epoch": 1052} {"train_loss": -34.13312911987305, "global_step": 127327, "epoch": 1052} {"train_loss": -36.99306106567383, "global_step": 127328, "epoch": 1052} {"train_loss": -36.62376022338867, "global_step": 127329, "epoch": 1052} {"train_loss": -36.1253547668457, "global_step": 127330, "epoch": 1052} {"train_loss": -35.10344314575195, "global_step": 127331, "epoch": 1052} {"train_loss": -36.463478088378906, "global_step": 127332, "epoch": 1052} {"train_loss": -36.97755813598633, "global_step": 127333, "epoch": 1052} {"train_loss": -35.804500579833984, "global_step": 127334, "epoch": 1052} {"train_loss": -36.90178680419922, "global_step": 127335, "epoch": 1052} {"train_loss": -37.88089370727539, "global_step": 127336, "epoch": 1052} {"train_loss": -37.15572738647461, "global_step": 127337, "epoch": 1052} {"train_loss": -37.87226486206055, "global_step": 127338, "epoch": 1052} {"train_loss": -37.4404296875, "global_step": 127339, "epoch": 1052} {"train_loss": -37.7778434753418, "global_step": 127340, "epoch": 1052} {"train_loss": -37.641273498535156, "global_step": 127341, "epoch": 1052} {"train_loss": -38.21342086791992, "global_step": 127342, "epoch": 1052} {"train_loss": -38.09418869018555, "global_step": 127343, "epoch": 1052} {"train_loss": -37.253292083740234, "global_step": 127344, "epoch": 1052} {"train_loss": -37.85580062866211, "global_step": 127345, "epoch": 1052} {"train_loss": -38.16030502319336, "global_step": 127346, "epoch": 1052} {"train_loss": -37.70423126220703, "global_step": 127347, "epoch": 1052} {"train_loss": -39.05693435668945, "global_step": 127348, "epoch": 1052} {"train_loss": -38.001651763916016, "global_step": 127349, "epoch": 1052} {"train_loss": -38.95918655395508, "global_step": 127350, "epoch": 1052} {"train_loss": -38.6416015625, "global_step": 127351, "epoch": 1052} {"train_loss": -38.071807861328125, "global_step": 127352, "epoch": 1052} {"train_loss": -38.596004486083984, "global_step": 127353, "epoch": 1052} {"train_loss": -38.81924057006836, "global_step": 127354, "epoch": 1052} {"train_loss": -38.977638244628906, "global_step": 127355, "epoch": 1052} {"train_loss": -38.67906951904297, "global_step": 127356, "epoch": 1052} {"train_loss": -38.94233703613281, "global_step": 127357, "epoch": 1052} {"train_loss": -39.069087982177734, "global_step": 127358, "epoch": 1052} {"train_loss": -38.81106185913086, "global_step": 127359, "epoch": 1052} {"train_loss": -39.52152633666992, "global_step": 127360, "epoch": 1052} {"train_loss": -38.91443634033203, "global_step": 127361, "epoch": 1052} {"train_loss": -38.86357879638672, "global_step": 127362, "epoch": 1052} {"train_loss": -38.72153854370117, "global_step": 127363, "epoch": 1052} {"train_loss": -39.460201263427734, "global_step": 127364, "epoch": 1052} {"train_loss": -39.58349609375, "global_step": 127365, "epoch": 1052} {"train_loss": -39.366607666015625, "global_step": 127366, "epoch": 1052} {"train_loss": -39.567466735839844, "global_step": 127367, "epoch": 1052} {"train_loss": -39.2874641418457, "global_step": 127368, "epoch": 1052} {"train_loss": -40.156002044677734, "global_step": 127369, "epoch": 1052} {"train_loss": -39.6884880065918, "global_step": 127370, "epoch": 1052} {"train_loss": -39.62510299682617, "global_step": 127371, "epoch": 1052} {"train_loss": -39.91946029663086, "global_step": 127372, "epoch": 1052} {"train_loss": -39.14267349243164, "global_step": 127373, "epoch": 1052} {"train_loss": -39.45951461791992, "global_step": 127374, "epoch": 1052} {"train_loss": -38.6774787902832, "global_step": 127375, "epoch": 1052} {"train_loss": -39.3335075378418, "global_step": 127376, "epoch": 1052} {"train_loss": -39.7854118347168, "global_step": 127377, "epoch": 1052} {"train_loss": -40.292232513427734, "global_step": 127378, "epoch": 1052} {"train_loss": -39.688079833984375, "global_step": 127379, "epoch": 1052} {"train_loss": -39.914669036865234, "global_step": 127380, "epoch": 1052} {"train_loss": -39.76913070678711, "global_step": 127381, "epoch": 1052} {"train_loss": -39.75319290161133, "global_step": 127382, "epoch": 1052} {"train_loss": -40.11227035522461, "global_step": 127383, "epoch": 1052} {"train_loss": -39.92983627319336, "global_step": 127384, "epoch": 1052} {"train_loss": -39.24766159057617, "global_step": 127385, "epoch": 1052} {"train_loss": -39.4348030090332, "global_step": 127386, "epoch": 1052} {"train_loss": -39.68491744995117, "global_step": 127387, "epoch": 1052} {"train_loss": -40.05747604370117, "global_step": 127388, "epoch": 1052} {"train_loss": -38.98986053466797, "global_step": 127389, "epoch": 1052} {"train_loss": -40.36811447143555, "global_step": 127390, "epoch": 1052} {"train_loss": -39.725040435791016, "global_step": 127391, "epoch": 1052} {"train_loss": -39.910125732421875, "global_step": 127392, "epoch": 1052} {"train_loss": -39.91058349609375, "global_step": 127393, "epoch": 1052} {"train_loss": -39.62034606933594, "global_step": 127394, "epoch": 1052} {"train_loss": -39.881649017333984, "global_step": 127395, "epoch": 1052} {"train_loss": -39.66712188720703, "global_step": 127396, "epoch": 1052} {"train_loss": -39.62062454223633, "global_step": 127397, "epoch": 1052} {"train_loss": -38.131324768066406, "global_step": 127398, "epoch": 1052} {"train_loss": -37.90261459350586, "global_step": 127399, "epoch": 1052} {"train_loss": -37.540287017822266, "global_step": 127400, "epoch": 1052} {"train_loss": -37.43330001831055, "global_step": 127401, "epoch": 1052} {"train_loss": -33.704444885253906, "global_step": 127402, "epoch": 1052} {"train_loss": -40.08639144897461, "global_step": 127403, "epoch": 1052} {"train_loss": -36.253875732421875, "global_step": 127404, "epoch": 1052} {"train_loss": -32.55628967285156, "global_step": 127405, "epoch": 1052} {"train_loss": -39.36464309692383, "global_step": 127406, "epoch": 1052} {"train_loss": -34.14077377319336, "global_step": 127407, "epoch": 1052} {"train_loss": -38.95557403564453, "global_step": 127408, "epoch": 1052} {"train_loss": -31.981897354125977, "global_step": 127409, "epoch": 1052} {"train_loss": -38.119503021240234, "global_step": 127410, "epoch": 1052} {"train_loss": -36.42618942260742, "global_step": 127411, "epoch": 1052} {"train_loss": -37.546563881487884, "global_step": 127412, "epoch": 1052, "val_loss": 2629670.25} {"train_loss": -38.96074295043945, "global_step": 127413, "epoch": 1053} {"train_loss": -36.046409606933594, "global_step": 127414, "epoch": 1053} {"train_loss": -36.20608139038086, "global_step": 127415, "epoch": 1053} {"train_loss": -36.089263916015625, "global_step": 127416, "epoch": 1053} {"train_loss": -35.75027084350586, "global_step": 127417, "epoch": 1053} {"train_loss": -36.92343521118164, "global_step": 127418, "epoch": 1053} {"train_loss": -35.47527313232422, "global_step": 127419, "epoch": 1053} {"train_loss": -36.65739059448242, "global_step": 127420, "epoch": 1053} {"train_loss": -36.82318878173828, "global_step": 127421, "epoch": 1053} {"train_loss": -37.026031494140625, "global_step": 127422, "epoch": 1053} {"train_loss": -35.58773422241211, "global_step": 127423, "epoch": 1053} {"train_loss": -35.45505905151367, "global_step": 127424, "epoch": 1053} {"train_loss": -37.911865234375, "global_step": 127425, "epoch": 1053} {"train_loss": -36.62920379638672, "global_step": 127426, "epoch": 1053} {"train_loss": -34.56246566772461, "global_step": 127427, "epoch": 1053} {"train_loss": -36.8201904296875, "global_step": 127428, "epoch": 1053} {"train_loss": -37.18986129760742, "global_step": 127429, "epoch": 1053} {"train_loss": -37.82528305053711, "global_step": 127430, "epoch": 1053} {"train_loss": -37.68455123901367, "global_step": 127431, "epoch": 1053} {"train_loss": -37.65223693847656, "global_step": 127432, "epoch": 1053} {"train_loss": -38.73530197143555, "global_step": 127433, "epoch": 1053} {"train_loss": -38.38452911376953, "global_step": 127434, "epoch": 1053} {"train_loss": -38.89563751220703, "global_step": 127435, "epoch": 1053} {"train_loss": -38.127471923828125, "global_step": 127436, "epoch": 1053} {"train_loss": -37.88837814331055, "global_step": 127437, "epoch": 1053} {"train_loss": -39.19535446166992, "global_step": 127438, "epoch": 1053} {"train_loss": -38.28410720825195, "global_step": 127439, "epoch": 1053} {"train_loss": -38.96747970581055, "global_step": 127440, "epoch": 1053} {"train_loss": -38.51601791381836, "global_step": 127441, "epoch": 1053} {"train_loss": -39.0131721496582, "global_step": 127442, "epoch": 1053} {"train_loss": -39.15839767456055, "global_step": 127443, "epoch": 1053} {"train_loss": -39.28912353515625, "global_step": 127444, "epoch": 1053} {"train_loss": -39.06381607055664, "global_step": 127445, "epoch": 1053} {"train_loss": -39.25602340698242, "global_step": 127446, "epoch": 1053} {"train_loss": -39.36035919189453, "global_step": 127447, "epoch": 1053} {"train_loss": -38.905452728271484, "global_step": 127448, "epoch": 1053} {"train_loss": -39.52922821044922, "global_step": 127449, "epoch": 1053} {"train_loss": -39.21490478515625, "global_step": 127450, "epoch": 1053} {"train_loss": -39.03303146362305, "global_step": 127451, "epoch": 1053} {"train_loss": -38.726356506347656, "global_step": 127452, "epoch": 1053} {"train_loss": -39.0531120300293, "global_step": 127453, "epoch": 1053} {"train_loss": -39.5938835144043, "global_step": 127454, "epoch": 1053} {"train_loss": -39.47385787963867, "global_step": 127455, "epoch": 1053} {"train_loss": -39.74055099487305, "global_step": 127456, "epoch": 1053} {"train_loss": -40.043453216552734, "global_step": 127457, "epoch": 1053} {"train_loss": -39.55207443237305, "global_step": 127458, "epoch": 1053} {"train_loss": -39.46820831298828, "global_step": 127459, "epoch": 1053} {"train_loss": -40.07951736450195, "global_step": 127460, "epoch": 1053} {"train_loss": -39.739105224609375, "global_step": 127461, "epoch": 1053} {"train_loss": -39.409603118896484, "global_step": 127462, "epoch": 1053} {"train_loss": -39.93605422973633, "global_step": 127463, "epoch": 1053} {"train_loss": -40.0883903503418, "global_step": 127464, "epoch": 1053} {"train_loss": -39.50356674194336, "global_step": 127465, "epoch": 1053} {"train_loss": -39.932308197021484, "global_step": 127466, "epoch": 1053} {"train_loss": -39.872406005859375, "global_step": 127467, "epoch": 1053} {"train_loss": -39.758296966552734, "global_step": 127468, "epoch": 1053} {"train_loss": -40.26414108276367, "global_step": 127469, "epoch": 1053} {"train_loss": -39.752052307128906, "global_step": 127470, "epoch": 1053} {"train_loss": -39.98368453979492, "global_step": 127471, "epoch": 1053} {"train_loss": -40.325294494628906, "global_step": 127472, "epoch": 1053} {"train_loss": -40.17387008666992, "global_step": 127473, "epoch": 1053} {"train_loss": -40.496665954589844, "global_step": 127474, "epoch": 1053} {"train_loss": -39.983211517333984, "global_step": 127475, "epoch": 1053} {"train_loss": -39.979339599609375, "global_step": 127476, "epoch": 1053} {"train_loss": -40.2488899230957, "global_step": 127477, "epoch": 1053} {"train_loss": -40.57949447631836, "global_step": 127478, "epoch": 1053} {"train_loss": -40.028717041015625, "global_step": 127479, "epoch": 1053} {"train_loss": -40.136966705322266, "global_step": 127480, "epoch": 1053} {"train_loss": -40.50844192504883, "global_step": 127481, "epoch": 1053} {"train_loss": -40.2842903137207, "global_step": 127482, "epoch": 1053} {"train_loss": -40.48506546020508, "global_step": 127483, "epoch": 1053} {"train_loss": -40.08730697631836, "global_step": 127484, "epoch": 1053} {"train_loss": -40.15741729736328, "global_step": 127485, "epoch": 1053} {"train_loss": -39.76707077026367, "global_step": 127486, "epoch": 1053} {"train_loss": -39.621089935302734, "global_step": 127487, "epoch": 1053} {"train_loss": -40.35946273803711, "global_step": 127488, "epoch": 1053} {"train_loss": -39.975440979003906, "global_step": 127489, "epoch": 1053} {"train_loss": -39.69328308105469, "global_step": 127490, "epoch": 1053} {"train_loss": -40.094085693359375, "global_step": 127491, "epoch": 1053} {"train_loss": -40.037837982177734, "global_step": 127492, "epoch": 1053} {"train_loss": -39.295753479003906, "global_step": 127493, "epoch": 1053} {"train_loss": -39.03479766845703, "global_step": 127494, "epoch": 1053} {"train_loss": -39.62837600708008, "global_step": 127495, "epoch": 1053} {"train_loss": -39.54604721069336, "global_step": 127496, "epoch": 1053} {"train_loss": -40.101985931396484, "global_step": 127497, "epoch": 1053} {"train_loss": -39.84629440307617, "global_step": 127498, "epoch": 1053} {"train_loss": -38.52191162109375, "global_step": 127499, "epoch": 1053} {"train_loss": -37.79657745361328, "global_step": 127500, "epoch": 1053} {"train_loss": -37.03565216064453, "global_step": 127501, "epoch": 1053} {"train_loss": -36.05353546142578, "global_step": 127502, "epoch": 1053} {"train_loss": -35.129432678222656, "global_step": 127503, "epoch": 1053} {"train_loss": -38.18136978149414, "global_step": 127504, "epoch": 1053} {"train_loss": -39.73691940307617, "global_step": 127505, "epoch": 1053} {"train_loss": -39.5477294921875, "global_step": 127506, "epoch": 1053} {"train_loss": -36.512847900390625, "global_step": 127507, "epoch": 1053} {"train_loss": -36.246849060058594, "global_step": 127508, "epoch": 1053} {"train_loss": -36.35396194458008, "global_step": 127509, "epoch": 1053} {"train_loss": -37.76874923706055, "global_step": 127510, "epoch": 1053} {"train_loss": -36.78740310668945, "global_step": 127511, "epoch": 1053} {"train_loss": -35.95595932006836, "global_step": 127512, "epoch": 1053} {"train_loss": -37.604923248291016, "global_step": 127513, "epoch": 1053} {"train_loss": -38.94171905517578, "global_step": 127514, "epoch": 1053} {"train_loss": -38.850765228271484, "global_step": 127515, "epoch": 1053} {"train_loss": -38.84001541137695, "global_step": 127516, "epoch": 1053} {"train_loss": -38.9872932434082, "global_step": 127517, "epoch": 1053} {"train_loss": -38.824886322021484, "global_step": 127518, "epoch": 1053} {"train_loss": -39.59861373901367, "global_step": 127519, "epoch": 1053} {"train_loss": -39.118927001953125, "global_step": 127520, "epoch": 1053} {"train_loss": -38.8254280090332, "global_step": 127521, "epoch": 1053} {"train_loss": -39.272945404052734, "global_step": 127522, "epoch": 1053} {"train_loss": -39.46151351928711, "global_step": 127523, "epoch": 1053} {"train_loss": -38.56410598754883, "global_step": 127524, "epoch": 1053} {"train_loss": -37.8477783203125, "global_step": 127525, "epoch": 1053} {"train_loss": -38.37099838256836, "global_step": 127526, "epoch": 1053} {"train_loss": -38.39988327026367, "global_step": 127527, "epoch": 1053} {"train_loss": -39.70984649658203, "global_step": 127528, "epoch": 1053} {"train_loss": -38.673011779785156, "global_step": 127529, "epoch": 1053} {"train_loss": -39.00020980834961, "global_step": 127530, "epoch": 1053} {"train_loss": -39.784603118896484, "global_step": 127531, "epoch": 1053} {"train_loss": -38.38468933105469, "global_step": 127532, "epoch": 1053} {"train_loss": -38.71409669986441, "global_step": 127533, "epoch": 1053, "val_loss": 2704869.0} {"train_loss": -39.10755157470703, "global_step": 127534, "epoch": 1054} {"train_loss": -38.4708366394043, "global_step": 127535, "epoch": 1054} {"train_loss": -39.85613250732422, "global_step": 127536, "epoch": 1054} {"train_loss": -39.234886169433594, "global_step": 127537, "epoch": 1054} {"train_loss": -39.670223236083984, "global_step": 127538, "epoch": 1054} {"train_loss": -39.396785736083984, "global_step": 127539, "epoch": 1054} {"train_loss": -39.4230842590332, "global_step": 127540, "epoch": 1054} {"train_loss": -39.7094841003418, "global_step": 127541, "epoch": 1054} {"train_loss": -39.6401481628418, "global_step": 127542, "epoch": 1054} {"train_loss": -38.41860580444336, "global_step": 127543, "epoch": 1054} {"train_loss": -39.67390060424805, "global_step": 127544, "epoch": 1054} {"train_loss": -38.17086410522461, "global_step": 127545, "epoch": 1054} {"train_loss": -39.19062423706055, "global_step": 127546, "epoch": 1054} {"train_loss": -37.38329315185547, "global_step": 127547, "epoch": 1054} {"train_loss": -37.29359817504883, "global_step": 127548, "epoch": 1054} {"train_loss": -39.24759292602539, "global_step": 127549, "epoch": 1054} {"train_loss": -37.5531005859375, "global_step": 127550, "epoch": 1054} {"train_loss": -38.63837814331055, "global_step": 127551, "epoch": 1054} {"train_loss": -38.202186584472656, "global_step": 127552, "epoch": 1054} {"train_loss": -39.606815338134766, "global_step": 127553, "epoch": 1054} {"train_loss": -39.00384521484375, "global_step": 127554, "epoch": 1054} {"train_loss": -37.18321228027344, "global_step": 127555, "epoch": 1054} {"train_loss": -37.60686111450195, "global_step": 127556, "epoch": 1054} {"train_loss": -38.08991622924805, "global_step": 127557, "epoch": 1054} {"train_loss": -39.571044921875, "global_step": 127558, "epoch": 1054} {"train_loss": -38.227046966552734, "global_step": 127559, "epoch": 1054} {"train_loss": -38.3674201965332, "global_step": 127560, "epoch": 1054} {"train_loss": -39.57746505737305, "global_step": 127561, "epoch": 1054} {"train_loss": -39.33597183227539, "global_step": 127562, "epoch": 1054} {"train_loss": -38.77927780151367, "global_step": 127563, "epoch": 1054} {"train_loss": -39.05259323120117, "global_step": 127564, "epoch": 1054} {"train_loss": -39.788360595703125, "global_step": 127565, "epoch": 1054} {"train_loss": -38.94088363647461, "global_step": 127566, "epoch": 1054} {"train_loss": -40.22097396850586, "global_step": 127567, "epoch": 1054} {"train_loss": -39.62729263305664, "global_step": 127568, "epoch": 1054} {"train_loss": -39.15632629394531, "global_step": 127569, "epoch": 1054} {"train_loss": -40.41172409057617, "global_step": 127570, "epoch": 1054} {"train_loss": -39.65824890136719, "global_step": 127571, "epoch": 1054} {"train_loss": -39.986846923828125, "global_step": 127572, "epoch": 1054} {"train_loss": -39.582725524902344, "global_step": 127573, "epoch": 1054} {"train_loss": -40.21943664550781, "global_step": 127574, "epoch": 1054} {"train_loss": -39.812294006347656, "global_step": 127575, "epoch": 1054} {"train_loss": -40.49030685424805, "global_step": 127576, "epoch": 1054} {"train_loss": -39.79522705078125, "global_step": 127577, "epoch": 1054} {"train_loss": -40.02546310424805, "global_step": 127578, "epoch": 1054} {"train_loss": -39.34889221191406, "global_step": 127579, "epoch": 1054} {"train_loss": -39.746856689453125, "global_step": 127580, "epoch": 1054} {"train_loss": -40.12563705444336, "global_step": 127581, "epoch": 1054} {"train_loss": -40.31846237182617, "global_step": 127582, "epoch": 1054} {"train_loss": -40.12153244018555, "global_step": 127583, "epoch": 1054} {"train_loss": -40.40778732299805, "global_step": 127584, "epoch": 1054} {"train_loss": -39.97849655151367, "global_step": 127585, "epoch": 1054} {"train_loss": -40.301029205322266, "global_step": 127586, "epoch": 1054} {"train_loss": -40.308921813964844, "global_step": 127587, "epoch": 1054} {"train_loss": -40.20456314086914, "global_step": 127588, "epoch": 1054} {"train_loss": -38.683502197265625, "global_step": 127589, "epoch": 1054} {"train_loss": -40.3332633972168, "global_step": 127590, "epoch": 1054} {"train_loss": -40.57442855834961, "global_step": 127591, "epoch": 1054} {"train_loss": -40.13134765625, "global_step": 127592, "epoch": 1054} {"train_loss": -39.557979583740234, "global_step": 127593, "epoch": 1054} {"train_loss": -37.02344512939453, "global_step": 127594, "epoch": 1054} {"train_loss": -39.82001876831055, "global_step": 127595, "epoch": 1054} {"train_loss": -39.162330627441406, "global_step": 127596, "epoch": 1054} {"train_loss": -38.775665283203125, "global_step": 127597, "epoch": 1054} {"train_loss": -39.66132354736328, "global_step": 127598, "epoch": 1054} {"train_loss": -38.22476577758789, "global_step": 127599, "epoch": 1054} {"train_loss": -39.91006851196289, "global_step": 127600, "epoch": 1054} {"train_loss": -40.149906158447266, "global_step": 127601, "epoch": 1054} {"train_loss": -39.281803131103516, "global_step": 127602, "epoch": 1054} {"train_loss": -39.47239303588867, "global_step": 127603, "epoch": 1054} {"train_loss": -40.048118591308594, "global_step": 127604, "epoch": 1054} {"train_loss": -39.484375, "global_step": 127605, "epoch": 1054} {"train_loss": -40.4254264831543, "global_step": 127606, "epoch": 1054} {"train_loss": -40.239295959472656, "global_step": 127607, "epoch": 1054} {"train_loss": -39.46474838256836, "global_step": 127608, "epoch": 1054} {"train_loss": -39.21266555786133, "global_step": 127609, "epoch": 1054} {"train_loss": -38.7304573059082, "global_step": 127610, "epoch": 1054} {"train_loss": -39.333168029785156, "global_step": 127611, "epoch": 1054} {"train_loss": -39.29523468017578, "global_step": 127612, "epoch": 1054} {"train_loss": -38.2694091796875, "global_step": 127613, "epoch": 1054} {"train_loss": -39.0290641784668, "global_step": 127614, "epoch": 1054} {"train_loss": -36.13172149658203, "global_step": 127615, "epoch": 1054} {"train_loss": -38.5395622253418, "global_step": 127616, "epoch": 1054} {"train_loss": -38.19209289550781, "global_step": 127617, "epoch": 1054} {"train_loss": -39.16225051879883, "global_step": 127618, "epoch": 1054} {"train_loss": -39.0374641418457, "global_step": 127619, "epoch": 1054} {"train_loss": -39.121917724609375, "global_step": 127620, "epoch": 1054} {"train_loss": -39.306827545166016, "global_step": 127621, "epoch": 1054} {"train_loss": -39.38642883300781, "global_step": 127622, "epoch": 1054} {"train_loss": -39.21476364135742, "global_step": 127623, "epoch": 1054} {"train_loss": -38.973209381103516, "global_step": 127624, "epoch": 1054} {"train_loss": -39.06494140625, "global_step": 127625, "epoch": 1054} {"train_loss": -38.52021408081055, "global_step": 127626, "epoch": 1054} {"train_loss": -39.392086029052734, "global_step": 127627, "epoch": 1054} {"train_loss": -39.66819381713867, "global_step": 127628, "epoch": 1054} {"train_loss": -39.556365966796875, "global_step": 127629, "epoch": 1054} {"train_loss": -37.424007415771484, "global_step": 127630, "epoch": 1054} {"train_loss": -38.99518966674805, "global_step": 127631, "epoch": 1054} {"train_loss": -39.210845947265625, "global_step": 127632, "epoch": 1054} {"train_loss": -39.75838851928711, "global_step": 127633, "epoch": 1054} {"train_loss": -39.255367279052734, "global_step": 127634, "epoch": 1054} {"train_loss": -39.631561279296875, "global_step": 127635, "epoch": 1054} {"train_loss": -39.27753829956055, "global_step": 127636, "epoch": 1054} {"train_loss": -39.29129409790039, "global_step": 127637, "epoch": 1054} {"train_loss": -40.21669006347656, "global_step": 127638, "epoch": 1054} {"train_loss": -38.14667892456055, "global_step": 127639, "epoch": 1054} {"train_loss": -40.00556945800781, "global_step": 127640, "epoch": 1054} {"train_loss": -39.42394256591797, "global_step": 127641, "epoch": 1054} {"train_loss": -39.4438362121582, "global_step": 127642, "epoch": 1054} {"train_loss": -39.71299362182617, "global_step": 127643, "epoch": 1054} {"train_loss": -39.538673400878906, "global_step": 127644, "epoch": 1054} {"train_loss": -39.293758392333984, "global_step": 127645, "epoch": 1054} {"train_loss": -39.46978759765625, "global_step": 127646, "epoch": 1054} {"train_loss": -39.28383255004883, "global_step": 127647, "epoch": 1054} {"train_loss": -37.78157424926758, "global_step": 127648, "epoch": 1054} {"train_loss": -38.48150634765625, "global_step": 127649, "epoch": 1054} {"train_loss": -40.03750228881836, "global_step": 127650, "epoch": 1054} {"train_loss": -39.230934143066406, "global_step": 127651, "epoch": 1054} {"train_loss": -40.1237678527832, "global_step": 127652, "epoch": 1054} {"train_loss": -39.98516845703125, "global_step": 127653, "epoch": 1054} {"train_loss": -39.266108268548635, "global_step": 127654, "epoch": 1054, "val_loss": 2752298.25} {"train_loss": -39.83930206298828, "global_step": 127655, "epoch": 1055} {"train_loss": -40.13917922973633, "global_step": 127656, "epoch": 1055} {"train_loss": -40.39799499511719, "global_step": 127657, "epoch": 1055} {"train_loss": -39.142757415771484, "global_step": 127658, "epoch": 1055} {"train_loss": -39.69199752807617, "global_step": 127659, "epoch": 1055} {"train_loss": -39.71674346923828, "global_step": 127660, "epoch": 1055} {"train_loss": -40.28156661987305, "global_step": 127661, "epoch": 1055} {"train_loss": -39.759246826171875, "global_step": 127662, "epoch": 1055} {"train_loss": -40.2053108215332, "global_step": 127663, "epoch": 1055} {"train_loss": -40.29671859741211, "global_step": 127664, "epoch": 1055} {"train_loss": -39.715572357177734, "global_step": 127665, "epoch": 1055} {"train_loss": -39.886138916015625, "global_step": 127666, "epoch": 1055} {"train_loss": -40.16514205932617, "global_step": 127667, "epoch": 1055} {"train_loss": -40.63290023803711, "global_step": 127668, "epoch": 1055} {"train_loss": -40.55271530151367, "global_step": 127669, "epoch": 1055} {"train_loss": -39.75114822387695, "global_step": 127670, "epoch": 1055} {"train_loss": -40.62588119506836, "global_step": 127671, "epoch": 1055} {"train_loss": -40.129703521728516, "global_step": 127672, "epoch": 1055} {"train_loss": -39.923553466796875, "global_step": 127673, "epoch": 1055} {"train_loss": -40.463409423828125, "global_step": 127674, "epoch": 1055} {"train_loss": -40.742225646972656, "global_step": 127675, "epoch": 1055} {"train_loss": -41.10068893432617, "global_step": 127676, "epoch": 1055} {"train_loss": -40.356510162353516, "global_step": 127677, "epoch": 1055} {"train_loss": -40.8021240234375, "global_step": 127678, "epoch": 1055} {"train_loss": -41.010677337646484, "global_step": 127679, "epoch": 1055} {"train_loss": -40.6579704284668, "global_step": 127680, "epoch": 1055} {"train_loss": -41.059814453125, "global_step": 127681, "epoch": 1055} {"train_loss": -41.05569076538086, "global_step": 127682, "epoch": 1055} {"train_loss": -40.485774993896484, "global_step": 127683, "epoch": 1055} {"train_loss": -39.832279205322266, "global_step": 127684, "epoch": 1055} {"train_loss": -38.03165054321289, "global_step": 127685, "epoch": 1055} {"train_loss": -37.10425567626953, "global_step": 127686, "epoch": 1055} {"train_loss": -35.89472198486328, "global_step": 127687, "epoch": 1055} {"train_loss": -35.70756149291992, "global_step": 127688, "epoch": 1055} {"train_loss": -35.708072662353516, "global_step": 127689, "epoch": 1055} {"train_loss": -37.912384033203125, "global_step": 127690, "epoch": 1055} {"train_loss": -38.0726432800293, "global_step": 127691, "epoch": 1055} {"train_loss": -36.21430587768555, "global_step": 127692, "epoch": 1055} {"train_loss": -39.3339729309082, "global_step": 127693, "epoch": 1055} {"train_loss": -37.40855407714844, "global_step": 127694, "epoch": 1055} {"train_loss": -35.74973678588867, "global_step": 127695, "epoch": 1055} {"train_loss": -37.1666259765625, "global_step": 127696, "epoch": 1055} {"train_loss": -39.391109466552734, "global_step": 127697, "epoch": 1055} {"train_loss": -37.3961296081543, "global_step": 127698, "epoch": 1055} {"train_loss": -35.63682174682617, "global_step": 127699, "epoch": 1055} {"train_loss": -38.97245407104492, "global_step": 127700, "epoch": 1055} {"train_loss": -36.096065521240234, "global_step": 127701, "epoch": 1055} {"train_loss": -38.48725509643555, "global_step": 127702, "epoch": 1055} {"train_loss": -37.25005340576172, "global_step": 127703, "epoch": 1055} {"train_loss": -38.788421630859375, "global_step": 127704, "epoch": 1055} {"train_loss": -35.760433197021484, "global_step": 127705, "epoch": 1055} {"train_loss": -39.192138671875, "global_step": 127706, "epoch": 1055} {"train_loss": -37.16992950439453, "global_step": 127707, "epoch": 1055} {"train_loss": -37.90007019042969, "global_step": 127708, "epoch": 1055} {"train_loss": -37.40186309814453, "global_step": 127709, "epoch": 1055} {"train_loss": -39.828861236572266, "global_step": 127710, "epoch": 1055} {"train_loss": -37.610538482666016, "global_step": 127711, "epoch": 1055} {"train_loss": -39.051998138427734, "global_step": 127712, "epoch": 1055} {"train_loss": -38.19833755493164, "global_step": 127713, "epoch": 1055} {"train_loss": -40.076332092285156, "global_step": 127714, "epoch": 1055} {"train_loss": -38.92441177368164, "global_step": 127715, "epoch": 1055} {"train_loss": -38.65938949584961, "global_step": 127716, "epoch": 1055} {"train_loss": -39.235084533691406, "global_step": 127717, "epoch": 1055} {"train_loss": -39.93111801147461, "global_step": 127718, "epoch": 1055} {"train_loss": -39.65400314331055, "global_step": 127719, "epoch": 1055} {"train_loss": -39.40566635131836, "global_step": 127720, "epoch": 1055} {"train_loss": -40.153629302978516, "global_step": 127721, "epoch": 1055} {"train_loss": -39.661170959472656, "global_step": 127722, "epoch": 1055} {"train_loss": -39.609371185302734, "global_step": 127723, "epoch": 1055} {"train_loss": -39.6146125793457, "global_step": 127724, "epoch": 1055} {"train_loss": -39.14345932006836, "global_step": 127725, "epoch": 1055} {"train_loss": -39.78022003173828, "global_step": 127726, "epoch": 1055} {"train_loss": -40.0053596496582, "global_step": 127727, "epoch": 1055} {"train_loss": -39.41158676147461, "global_step": 127728, "epoch": 1055} {"train_loss": -39.81739807128906, "global_step": 127729, "epoch": 1055} {"train_loss": -39.217769622802734, "global_step": 127730, "epoch": 1055} {"train_loss": -40.060691833496094, "global_step": 127731, "epoch": 1055} {"train_loss": -39.597572326660156, "global_step": 127732, "epoch": 1055} {"train_loss": -39.45471954345703, "global_step": 127733, "epoch": 1055} {"train_loss": -40.488216400146484, "global_step": 127734, "epoch": 1055} {"train_loss": -39.79697799682617, "global_step": 127735, "epoch": 1055} {"train_loss": -39.015953063964844, "global_step": 127736, "epoch": 1055} {"train_loss": -39.65243148803711, "global_step": 127737, "epoch": 1055} {"train_loss": -39.859886169433594, "global_step": 127738, "epoch": 1055} {"train_loss": -39.64665222167969, "global_step": 127739, "epoch": 1055} {"train_loss": -39.67266082763672, "global_step": 127740, "epoch": 1055} {"train_loss": -39.626731872558594, "global_step": 127741, "epoch": 1055} {"train_loss": -39.79225540161133, "global_step": 127742, "epoch": 1055} {"train_loss": -38.96662521362305, "global_step": 127743, "epoch": 1055} {"train_loss": -39.8465576171875, "global_step": 127744, "epoch": 1055} {"train_loss": -40.00315856933594, "global_step": 127745, "epoch": 1055} {"train_loss": -40.247005462646484, "global_step": 127746, "epoch": 1055} {"train_loss": -40.34625244140625, "global_step": 127747, "epoch": 1055} {"train_loss": -40.31520462036133, "global_step": 127748, "epoch": 1055} {"train_loss": -39.832969665527344, "global_step": 127749, "epoch": 1055} {"train_loss": -40.17410659790039, "global_step": 127750, "epoch": 1055} {"train_loss": -40.50905990600586, "global_step": 127751, "epoch": 1055} {"train_loss": -40.55172348022461, "global_step": 127752, "epoch": 1055} {"train_loss": -39.791099548339844, "global_step": 127753, "epoch": 1055} {"train_loss": -39.90333938598633, "global_step": 127754, "epoch": 1055} {"train_loss": -40.497127532958984, "global_step": 127755, "epoch": 1055} {"train_loss": -40.17542266845703, "global_step": 127756, "epoch": 1055} {"train_loss": -40.0051155090332, "global_step": 127757, "epoch": 1055} {"train_loss": -39.40497589111328, "global_step": 127758, "epoch": 1055} {"train_loss": -36.44768142700195, "global_step": 127759, "epoch": 1055} {"train_loss": -39.86684036254883, "global_step": 127760, "epoch": 1055} {"train_loss": -40.23794174194336, "global_step": 127761, "epoch": 1055} {"train_loss": -38.46159744262695, "global_step": 127762, "epoch": 1055} {"train_loss": -37.03450012207031, "global_step": 127763, "epoch": 1055} {"train_loss": -38.731781005859375, "global_step": 127764, "epoch": 1055} {"train_loss": -40.142581939697266, "global_step": 127765, "epoch": 1055} {"train_loss": -39.58282470703125, "global_step": 127766, "epoch": 1055} {"train_loss": -39.69829559326172, "global_step": 127767, "epoch": 1055} {"train_loss": -40.49934387207031, "global_step": 127768, "epoch": 1055} {"train_loss": -40.323463439941406, "global_step": 127769, "epoch": 1055} {"train_loss": -39.12635040283203, "global_step": 127770, "epoch": 1055} {"train_loss": -39.65859603881836, "global_step": 127771, "epoch": 1055} {"train_loss": -40.732295989990234, "global_step": 127772, "epoch": 1055} {"train_loss": -37.626304626464844, "global_step": 127773, "epoch": 1055} {"train_loss": -38.672088623046875, "global_step": 127774, "epoch": 1055} {"train_loss": -39.28734386853935, "global_step": 127775, "epoch": 1055, "val_loss": 2726187.0} {"train_loss": -36.80297088623047, "global_step": 127776, "epoch": 1056} {"train_loss": -36.57461166381836, "global_step": 127777, "epoch": 1056} {"train_loss": -39.798519134521484, "global_step": 127778, "epoch": 1056} {"train_loss": -37.3261833190918, "global_step": 127779, "epoch": 1056} {"train_loss": -39.03818893432617, "global_step": 127780, "epoch": 1056} {"train_loss": -39.126522064208984, "global_step": 127781, "epoch": 1056} {"train_loss": -37.65531539916992, "global_step": 127782, "epoch": 1056} {"train_loss": -39.9561882019043, "global_step": 127783, "epoch": 1056} {"train_loss": -38.526981353759766, "global_step": 127784, "epoch": 1056} {"train_loss": -39.048763275146484, "global_step": 127785, "epoch": 1056} {"train_loss": -40.55363464355469, "global_step": 127786, "epoch": 1056} {"train_loss": -40.14133071899414, "global_step": 127787, "epoch": 1056} {"train_loss": -39.74087142944336, "global_step": 127788, "epoch": 1056} {"train_loss": -40.34365463256836, "global_step": 127789, "epoch": 1056} {"train_loss": -39.975250244140625, "global_step": 127790, "epoch": 1056} {"train_loss": -40.226409912109375, "global_step": 127791, "epoch": 1056} {"train_loss": -40.248592376708984, "global_step": 127792, "epoch": 1056} {"train_loss": -39.37775421142578, "global_step": 127793, "epoch": 1056} {"train_loss": -40.94013595581055, "global_step": 127794, "epoch": 1056} {"train_loss": -40.04020690917969, "global_step": 127795, "epoch": 1056} {"train_loss": -40.27630615234375, "global_step": 127796, "epoch": 1056} {"train_loss": -40.2772216796875, "global_step": 127797, "epoch": 1056} {"train_loss": -40.16640853881836, "global_step": 127798, "epoch": 1056} {"train_loss": -40.46708297729492, "global_step": 127799, "epoch": 1056} {"train_loss": -40.246028900146484, "global_step": 127800, "epoch": 1056} {"train_loss": -40.502296447753906, "global_step": 127801, "epoch": 1056} {"train_loss": -40.22026824951172, "global_step": 127802, "epoch": 1056} {"train_loss": -40.43019485473633, "global_step": 127803, "epoch": 1056} {"train_loss": -39.666015625, "global_step": 127804, "epoch": 1056} {"train_loss": -39.65082931518555, "global_step": 127805, "epoch": 1056} {"train_loss": -40.16142654418945, "global_step": 127806, "epoch": 1056} {"train_loss": -40.70787811279297, "global_step": 127807, "epoch": 1056} {"train_loss": -40.55873107910156, "global_step": 127808, "epoch": 1056} {"train_loss": -40.329254150390625, "global_step": 127809, "epoch": 1056} {"train_loss": -40.08913803100586, "global_step": 127810, "epoch": 1056} {"train_loss": -39.74803924560547, "global_step": 127811, "epoch": 1056} {"train_loss": -39.834625244140625, "global_step": 127812, "epoch": 1056} {"train_loss": -39.957786560058594, "global_step": 127813, "epoch": 1056} {"train_loss": -41.0673942565918, "global_step": 127814, "epoch": 1056} {"train_loss": -40.149658203125, "global_step": 127815, "epoch": 1056} {"train_loss": -36.1937370300293, "global_step": 127816, "epoch": 1056} {"train_loss": -38.70441436767578, "global_step": 127817, "epoch": 1056} {"train_loss": -33.823551177978516, "global_step": 127818, "epoch": 1056} {"train_loss": -23.115304946899414, "global_step": 127819, "epoch": 1056} {"train_loss": 24.92700958251953, "global_step": 127820, "epoch": 1056} {"train_loss": -20.916284561157227, "global_step": 127821, "epoch": 1056} {"train_loss": 6.705740451812744, "global_step": 127822, "epoch": 1056} {"train_loss": -29.094818115234375, "global_step": 127823, "epoch": 1056} {"train_loss": -10.299954414367676, "global_step": 127824, "epoch": 1056} {"train_loss": -10.714946746826172, "global_step": 127825, "epoch": 1056} {"train_loss": -26.707538604736328, "global_step": 127826, "epoch": 1056} {"train_loss": -15.482121467590332, "global_step": 127827, "epoch": 1056} {"train_loss": -17.049123764038086, "global_step": 127828, "epoch": 1056} {"train_loss": -29.6513729095459, "global_step": 127829, "epoch": 1056} {"train_loss": -28.453550338745117, "global_step": 127830, "epoch": 1056} {"train_loss": -22.258310317993164, "global_step": 127831, "epoch": 1056} {"train_loss": -26.517969131469727, "global_step": 127832, "epoch": 1056} {"train_loss": -31.44025230407715, "global_step": 127833, "epoch": 1056} {"train_loss": -32.289581298828125, "global_step": 127834, "epoch": 1056} {"train_loss": -30.807565689086914, "global_step": 127835, "epoch": 1056} {"train_loss": -29.10694694519043, "global_step": 127836, "epoch": 1056} {"train_loss": -29.258502960205078, "global_step": 127837, "epoch": 1056} {"train_loss": -32.242130279541016, "global_step": 127838, "epoch": 1056} {"train_loss": -32.67928695678711, "global_step": 127839, "epoch": 1056} {"train_loss": -32.716941833496094, "global_step": 127840, "epoch": 1056} {"train_loss": -32.92704391479492, "global_step": 127841, "epoch": 1056} {"train_loss": -31.8067684173584, "global_step": 127842, "epoch": 1056} {"train_loss": -32.5030632019043, "global_step": 127843, "epoch": 1056} {"train_loss": -34.25373840332031, "global_step": 127844, "epoch": 1056} {"train_loss": -33.85640335083008, "global_step": 127845, "epoch": 1056} {"train_loss": -34.300357818603516, "global_step": 127846, "epoch": 1056} {"train_loss": -34.087646484375, "global_step": 127847, "epoch": 1056} {"train_loss": -33.90234375, "global_step": 127848, "epoch": 1056} {"train_loss": -34.11438751220703, "global_step": 127849, "epoch": 1056} {"train_loss": -34.101722717285156, "global_step": 127850, "epoch": 1056} {"train_loss": -34.76240158081055, "global_step": 127851, "epoch": 1056} {"train_loss": -35.25056838989258, "global_step": 127852, "epoch": 1056} {"train_loss": -34.74915313720703, "global_step": 127853, "epoch": 1056} {"train_loss": -33.97029495239258, "global_step": 127854, "epoch": 1056} {"train_loss": -32.95378494262695, "global_step": 127855, "epoch": 1056} {"train_loss": -34.08176803588867, "global_step": 127856, "epoch": 1056} {"train_loss": -31.906768798828125, "global_step": 127857, "epoch": 1056} {"train_loss": -32.40854263305664, "global_step": 127858, "epoch": 1056} {"train_loss": -34.95099639892578, "global_step": 127859, "epoch": 1056} {"train_loss": -32.20272445678711, "global_step": 127860, "epoch": 1056} {"train_loss": -34.45917892456055, "global_step": 127861, "epoch": 1056} {"train_loss": -34.367095947265625, "global_step": 127862, "epoch": 1056} {"train_loss": -34.23348617553711, "global_step": 127863, "epoch": 1056} {"train_loss": -34.62592315673828, "global_step": 127864, "epoch": 1056} {"train_loss": -35.15107345581055, "global_step": 127865, "epoch": 1056} {"train_loss": -34.65327072143555, "global_step": 127866, "epoch": 1056} {"train_loss": -35.435482025146484, "global_step": 127867, "epoch": 1056} {"train_loss": -35.02730941772461, "global_step": 127868, "epoch": 1056} {"train_loss": -36.092525482177734, "global_step": 127869, "epoch": 1056} {"train_loss": -34.981040954589844, "global_step": 127870, "epoch": 1056} {"train_loss": -35.30910873413086, "global_step": 127871, "epoch": 1056} {"train_loss": -36.288978576660156, "global_step": 127872, "epoch": 1056} {"train_loss": -35.90587615966797, "global_step": 127873, "epoch": 1056} {"train_loss": -36.25927734375, "global_step": 127874, "epoch": 1056} {"train_loss": -36.31104278564453, "global_step": 127875, "epoch": 1056} {"train_loss": -35.90658950805664, "global_step": 127876, "epoch": 1056} {"train_loss": -35.97608947753906, "global_step": 127877, "epoch": 1056} {"train_loss": -36.190757751464844, "global_step": 127878, "epoch": 1056} {"train_loss": -36.76791000366211, "global_step": 127879, "epoch": 1056} {"train_loss": -36.926326751708984, "global_step": 127880, "epoch": 1056} {"train_loss": -36.692466735839844, "global_step": 127881, "epoch": 1056} {"train_loss": -36.94259262084961, "global_step": 127882, "epoch": 1056} {"train_loss": -36.97224426269531, "global_step": 127883, "epoch": 1056} {"train_loss": -36.57351303100586, "global_step": 127884, "epoch": 1056} {"train_loss": -36.315032958984375, "global_step": 127885, "epoch": 1056} {"train_loss": -36.16581344604492, "global_step": 127886, "epoch": 1056} {"train_loss": -36.92033767700195, "global_step": 127887, "epoch": 1056} {"train_loss": -36.65214920043945, "global_step": 127888, "epoch": 1056} {"train_loss": -36.649227142333984, "global_step": 127889, "epoch": 1056} {"train_loss": -36.03167724609375, "global_step": 127890, "epoch": 1056} {"train_loss": -30.64133644104004, "global_step": 127891, "epoch": 1056} {"train_loss": -28.351526260375977, "global_step": 127892, "epoch": 1056} {"train_loss": -36.40375900268555, "global_step": 127893, "epoch": 1056} {"train_loss": -31.31477928161621, "global_step": 127894, "epoch": 1056} {"train_loss": -36.829071044921875, "global_step": 127895, "epoch": 1056} {"train_loss": -34.07881637053056, "global_step": 127896, "epoch": 1056, "val_loss": 2631194.0} {"train_loss": -37.38151550292969, "global_step": 127897, "epoch": 1057} {"train_loss": -33.89289474487305, "global_step": 127898, "epoch": 1057} {"train_loss": -36.88465118408203, "global_step": 127899, "epoch": 1057} {"train_loss": -35.99946212768555, "global_step": 127900, "epoch": 1057} {"train_loss": -36.08259201049805, "global_step": 127901, "epoch": 1057} {"train_loss": -36.55716323852539, "global_step": 127902, "epoch": 1057} {"train_loss": -35.75999069213867, "global_step": 127903, "epoch": 1057} {"train_loss": -36.766841888427734, "global_step": 127904, "epoch": 1057} {"train_loss": -36.48785400390625, "global_step": 127905, "epoch": 1057} {"train_loss": -37.27092361450195, "global_step": 127906, "epoch": 1057} {"train_loss": -36.75449752807617, "global_step": 127907, "epoch": 1057} {"train_loss": -36.98381423950195, "global_step": 127908, "epoch": 1057} {"train_loss": -37.039772033691406, "global_step": 127909, "epoch": 1057} {"train_loss": -36.957523345947266, "global_step": 127910, "epoch": 1057} {"train_loss": -37.29096221923828, "global_step": 127911, "epoch": 1057} {"train_loss": -36.74984359741211, "global_step": 127912, "epoch": 1057} {"train_loss": -37.37131881713867, "global_step": 127913, "epoch": 1057} {"train_loss": -37.4682731628418, "global_step": 127914, "epoch": 1057} {"train_loss": -37.2105712890625, "global_step": 127915, "epoch": 1057} {"train_loss": -37.586978912353516, "global_step": 127916, "epoch": 1057} {"train_loss": -37.0023307800293, "global_step": 127917, "epoch": 1057} {"train_loss": -37.977596282958984, "global_step": 127918, "epoch": 1057} {"train_loss": -37.63138961791992, "global_step": 127919, "epoch": 1057} {"train_loss": -37.77420425415039, "global_step": 127920, "epoch": 1057} {"train_loss": -37.57101058959961, "global_step": 127921, "epoch": 1057} {"train_loss": -38.02243423461914, "global_step": 127922, "epoch": 1057} {"train_loss": -38.063411712646484, "global_step": 127923, "epoch": 1057} {"train_loss": -37.98934555053711, "global_step": 127924, "epoch": 1057} {"train_loss": -38.304420471191406, "global_step": 127925, "epoch": 1057} {"train_loss": -37.83275604248047, "global_step": 127926, "epoch": 1057} {"train_loss": -38.15949249267578, "global_step": 127927, "epoch": 1057} {"train_loss": -37.8726806640625, "global_step": 127928, "epoch": 1057} {"train_loss": -37.154232025146484, "global_step": 127929, "epoch": 1057} {"train_loss": -37.242984771728516, "global_step": 127930, "epoch": 1057} {"train_loss": -36.4495849609375, "global_step": 127931, "epoch": 1057} {"train_loss": -36.53675079345703, "global_step": 127932, "epoch": 1057} {"train_loss": -37.28658676147461, "global_step": 127933, "epoch": 1057} {"train_loss": -38.47724151611328, "global_step": 127934, "epoch": 1057} {"train_loss": -37.58392333984375, "global_step": 127935, "epoch": 1057} {"train_loss": -35.98729705810547, "global_step": 127936, "epoch": 1057} {"train_loss": -36.783809661865234, "global_step": 127937, "epoch": 1057} {"train_loss": -37.44752883911133, "global_step": 127938, "epoch": 1057} {"train_loss": -37.216182708740234, "global_step": 127939, "epoch": 1057} {"train_loss": -37.57100296020508, "global_step": 127940, "epoch": 1057} {"train_loss": -37.546607971191406, "global_step": 127941, "epoch": 1057} {"train_loss": -38.062171936035156, "global_step": 127942, "epoch": 1057} {"train_loss": -37.99013137817383, "global_step": 127943, "epoch": 1057} {"train_loss": -38.58172607421875, "global_step": 127944, "epoch": 1057} {"train_loss": -38.088226318359375, "global_step": 127945, "epoch": 1057} {"train_loss": -36.21759033203125, "global_step": 127946, "epoch": 1057} {"train_loss": -37.673492431640625, "global_step": 127947, "epoch": 1057} {"train_loss": -38.386077880859375, "global_step": 127948, "epoch": 1057} {"train_loss": -38.09246826171875, "global_step": 127949, "epoch": 1057} {"train_loss": -37.58205795288086, "global_step": 127950, "epoch": 1057} {"train_loss": -38.550838470458984, "global_step": 127951, "epoch": 1057} {"train_loss": -37.90220642089844, "global_step": 127952, "epoch": 1057} {"train_loss": -37.621150970458984, "global_step": 127953, "epoch": 1057} {"train_loss": -38.481815338134766, "global_step": 127954, "epoch": 1057} {"train_loss": -38.21395492553711, "global_step": 127955, "epoch": 1057} {"train_loss": -37.738643646240234, "global_step": 127956, "epoch": 1057} {"train_loss": -38.026859283447266, "global_step": 127957, "epoch": 1057} {"train_loss": -38.199501037597656, "global_step": 127958, "epoch": 1057} {"train_loss": -37.7029914855957, "global_step": 127959, "epoch": 1057} {"train_loss": -38.253456115722656, "global_step": 127960, "epoch": 1057} {"train_loss": -38.356727600097656, "global_step": 127961, "epoch": 1057} {"train_loss": -37.93318557739258, "global_step": 127962, "epoch": 1057} {"train_loss": -38.32876205444336, "global_step": 127963, "epoch": 1057} {"train_loss": -37.625823974609375, "global_step": 127964, "epoch": 1057} {"train_loss": -37.9876594543457, "global_step": 127965, "epoch": 1057} {"train_loss": -38.16200637817383, "global_step": 127966, "epoch": 1057} {"train_loss": -38.04389190673828, "global_step": 127967, "epoch": 1057} {"train_loss": -37.575660705566406, "global_step": 127968, "epoch": 1057} {"train_loss": -36.536617279052734, "global_step": 127969, "epoch": 1057} {"train_loss": -37.32465362548828, "global_step": 127970, "epoch": 1057} {"train_loss": -37.937232971191406, "global_step": 127971, "epoch": 1057} {"train_loss": -37.517860412597656, "global_step": 127972, "epoch": 1057} {"train_loss": -38.29372787475586, "global_step": 127973, "epoch": 1057} {"train_loss": -37.9445686340332, "global_step": 127974, "epoch": 1057} {"train_loss": -38.273841857910156, "global_step": 127975, "epoch": 1057} {"train_loss": -38.04047393798828, "global_step": 127976, "epoch": 1057} {"train_loss": -38.2342643737793, "global_step": 127977, "epoch": 1057} {"train_loss": -38.408199310302734, "global_step": 127978, "epoch": 1057} {"train_loss": -37.9825325012207, "global_step": 127979, "epoch": 1057} {"train_loss": -38.394752502441406, "global_step": 127980, "epoch": 1057} {"train_loss": -38.7314567565918, "global_step": 127981, "epoch": 1057} {"train_loss": -38.43849563598633, "global_step": 127982, "epoch": 1057} {"train_loss": -38.831233978271484, "global_step": 127983, "epoch": 1057} {"train_loss": -38.56665802001953, "global_step": 127984, "epoch": 1057} {"train_loss": -38.23221969604492, "global_step": 127985, "epoch": 1057} {"train_loss": -38.735015869140625, "global_step": 127986, "epoch": 1057} {"train_loss": -38.8132209777832, "global_step": 127987, "epoch": 1057} {"train_loss": -38.58647537231445, "global_step": 127988, "epoch": 1057} {"train_loss": -38.2840690612793, "global_step": 127989, "epoch": 1057} {"train_loss": -38.88731002807617, "global_step": 127990, "epoch": 1057} {"train_loss": -38.63872146606445, "global_step": 127991, "epoch": 1057} {"train_loss": -38.0782470703125, "global_step": 127992, "epoch": 1057} {"train_loss": -37.82573318481445, "global_step": 127993, "epoch": 1057} {"train_loss": -37.1914176940918, "global_step": 127994, "epoch": 1057} {"train_loss": -38.18260192871094, "global_step": 127995, "epoch": 1057} {"train_loss": -37.91566848754883, "global_step": 127996, "epoch": 1057} {"train_loss": -37.307960510253906, "global_step": 127997, "epoch": 1057} {"train_loss": -36.84256362915039, "global_step": 127998, "epoch": 1057} {"train_loss": -36.114845275878906, "global_step": 127999, "epoch": 1057} {"train_loss": -38.674015045166016, "global_step": 128000, "epoch": 1057} {"train_loss": -36.7097053527832, "global_step": 128001, "epoch": 1057} {"train_loss": -37.56825637817383, "global_step": 128002, "epoch": 1057} {"train_loss": -38.8927116394043, "global_step": 128003, "epoch": 1057} {"train_loss": -37.9215202331543, "global_step": 128004, "epoch": 1057} {"train_loss": -38.387664794921875, "global_step": 128005, "epoch": 1057} {"train_loss": -39.64748764038086, "global_step": 128006, "epoch": 1057} {"train_loss": -38.204402923583984, "global_step": 128007, "epoch": 1057} {"train_loss": -37.045894622802734, "global_step": 128008, "epoch": 1057} {"train_loss": -38.35396194458008, "global_step": 128009, "epoch": 1057} {"train_loss": -38.61678695678711, "global_step": 128010, "epoch": 1057} {"train_loss": -38.21553421020508, "global_step": 128011, "epoch": 1057} {"train_loss": -38.13405227661133, "global_step": 128012, "epoch": 1057} {"train_loss": -38.399898529052734, "global_step": 128013, "epoch": 1057} {"train_loss": -38.75251388549805, "global_step": 128014, "epoch": 1057} {"train_loss": -38.68589401245117, "global_step": 128015, "epoch": 1057} {"train_loss": -38.958984375, "global_step": 128016, "epoch": 1057} {"train_loss": -37.735943691789615, "global_step": 128017, "epoch": 1057, "val_loss": 2603282.25} {"train_loss": -38.74966049194336, "global_step": 128018, "epoch": 1058} {"train_loss": -37.976749420166016, "global_step": 128019, "epoch": 1058} {"train_loss": -38.2356071472168, "global_step": 128020, "epoch": 1058} {"train_loss": -39.1026611328125, "global_step": 128021, "epoch": 1058} {"train_loss": -38.806610107421875, "global_step": 128022, "epoch": 1058} {"train_loss": -38.39790725708008, "global_step": 128023, "epoch": 1058} {"train_loss": -38.00666427612305, "global_step": 128024, "epoch": 1058} {"train_loss": -37.37117385864258, "global_step": 128025, "epoch": 1058} {"train_loss": -37.18083953857422, "global_step": 128026, "epoch": 1058} {"train_loss": -38.215309143066406, "global_step": 128027, "epoch": 1058} {"train_loss": -37.8229866027832, "global_step": 128028, "epoch": 1058} {"train_loss": -37.40800857543945, "global_step": 128029, "epoch": 1058} {"train_loss": -38.35691452026367, "global_step": 128030, "epoch": 1058} {"train_loss": -37.919044494628906, "global_step": 128031, "epoch": 1058} {"train_loss": -37.804954528808594, "global_step": 128032, "epoch": 1058} {"train_loss": -38.020408630371094, "global_step": 128033, "epoch": 1058} {"train_loss": -37.069305419921875, "global_step": 128034, "epoch": 1058} {"train_loss": -37.43315124511719, "global_step": 128035, "epoch": 1058} {"train_loss": -38.03666305541992, "global_step": 128036, "epoch": 1058} {"train_loss": -37.70587158203125, "global_step": 128037, "epoch": 1058} {"train_loss": -38.35828399658203, "global_step": 128038, "epoch": 1058} {"train_loss": -35.574153900146484, "global_step": 128039, "epoch": 1058} {"train_loss": -37.678680419921875, "global_step": 128040, "epoch": 1058} {"train_loss": -37.62408447265625, "global_step": 128041, "epoch": 1058} {"train_loss": -37.678199768066406, "global_step": 128042, "epoch": 1058} {"train_loss": -38.6239128112793, "global_step": 128043, "epoch": 1058} {"train_loss": -38.43135070800781, "global_step": 128044, "epoch": 1058} {"train_loss": -38.49005889892578, "global_step": 128045, "epoch": 1058} {"train_loss": -38.67075729370117, "global_step": 128046, "epoch": 1058} {"train_loss": -38.549560546875, "global_step": 128047, "epoch": 1058} {"train_loss": -38.8853645324707, "global_step": 128048, "epoch": 1058} {"train_loss": -38.60953903198242, "global_step": 128049, "epoch": 1058} {"train_loss": -38.630191802978516, "global_step": 128050, "epoch": 1058} {"train_loss": -37.93552780151367, "global_step": 128051, "epoch": 1058} {"train_loss": -38.21158981323242, "global_step": 128052, "epoch": 1058} {"train_loss": -38.87604522705078, "global_step": 128053, "epoch": 1058} {"train_loss": -38.203094482421875, "global_step": 128054, "epoch": 1058} {"train_loss": -37.54048156738281, "global_step": 128055, "epoch": 1058} {"train_loss": -38.404632568359375, "global_step": 128056, "epoch": 1058} {"train_loss": -39.15143966674805, "global_step": 128057, "epoch": 1058} {"train_loss": -38.69527053833008, "global_step": 128058, "epoch": 1058} {"train_loss": -38.55235290527344, "global_step": 128059, "epoch": 1058} {"train_loss": -38.19497299194336, "global_step": 128060, "epoch": 1058} {"train_loss": -38.45416259765625, "global_step": 128061, "epoch": 1058} {"train_loss": -37.57106399536133, "global_step": 128062, "epoch": 1058} {"train_loss": -38.163490295410156, "global_step": 128063, "epoch": 1058} {"train_loss": -37.054203033447266, "global_step": 128064, "epoch": 1058} {"train_loss": -38.09651565551758, "global_step": 128065, "epoch": 1058} {"train_loss": -38.40615463256836, "global_step": 128066, "epoch": 1058} {"train_loss": -38.58070755004883, "global_step": 128067, "epoch": 1058} {"train_loss": -39.2718620300293, "global_step": 128068, "epoch": 1058} {"train_loss": -39.326576232910156, "global_step": 128069, "epoch": 1058} {"train_loss": -39.278865814208984, "global_step": 128070, "epoch": 1058} {"train_loss": -38.56511306762695, "global_step": 128071, "epoch": 1058} {"train_loss": -38.80464553833008, "global_step": 128072, "epoch": 1058} {"train_loss": -38.99340057373047, "global_step": 128073, "epoch": 1058} {"train_loss": -39.25025177001953, "global_step": 128074, "epoch": 1058} {"train_loss": -39.35820388793945, "global_step": 128075, "epoch": 1058} {"train_loss": -38.145286560058594, "global_step": 128076, "epoch": 1058} {"train_loss": -38.86091613769531, "global_step": 128077, "epoch": 1058} {"train_loss": -38.27837371826172, "global_step": 128078, "epoch": 1058} {"train_loss": -38.94824981689453, "global_step": 128079, "epoch": 1058} {"train_loss": -38.60858154296875, "global_step": 128080, "epoch": 1058} {"train_loss": -38.42589569091797, "global_step": 128081, "epoch": 1058} {"train_loss": -38.63648986816406, "global_step": 128082, "epoch": 1058} {"train_loss": -37.345703125, "global_step": 128083, "epoch": 1058} {"train_loss": -36.76227569580078, "global_step": 128084, "epoch": 1058} {"train_loss": -39.38998031616211, "global_step": 128085, "epoch": 1058} {"train_loss": -37.85305404663086, "global_step": 128086, "epoch": 1058} {"train_loss": -37.41347885131836, "global_step": 128087, "epoch": 1058} {"train_loss": -37.32981491088867, "global_step": 128088, "epoch": 1058} {"train_loss": -38.39601135253906, "global_step": 128089, "epoch": 1058} {"train_loss": -37.819034576416016, "global_step": 128090, "epoch": 1058} {"train_loss": -37.431541442871094, "global_step": 128091, "epoch": 1058} {"train_loss": -37.32023239135742, "global_step": 128092, "epoch": 1058} {"train_loss": -39.01809310913086, "global_step": 128093, "epoch": 1058} {"train_loss": -38.77657699584961, "global_step": 128094, "epoch": 1058} {"train_loss": -37.23858642578125, "global_step": 128095, "epoch": 1058} {"train_loss": -35.93064880371094, "global_step": 128096, "epoch": 1058} {"train_loss": -38.85232162475586, "global_step": 128097, "epoch": 1058} {"train_loss": -37.141841888427734, "global_step": 128098, "epoch": 1058} {"train_loss": -37.46539306640625, "global_step": 128099, "epoch": 1058} {"train_loss": -38.81850814819336, "global_step": 128100, "epoch": 1058} {"train_loss": -38.074371337890625, "global_step": 128101, "epoch": 1058} {"train_loss": -38.09965515136719, "global_step": 128102, "epoch": 1058} {"train_loss": -38.766082763671875, "global_step": 128103, "epoch": 1058} {"train_loss": -37.61525344848633, "global_step": 128104, "epoch": 1058} {"train_loss": -37.96718978881836, "global_step": 128105, "epoch": 1058} {"train_loss": -38.547203063964844, "global_step": 128106, "epoch": 1058} {"train_loss": -36.75312042236328, "global_step": 128107, "epoch": 1058} {"train_loss": -38.60537338256836, "global_step": 128108, "epoch": 1058} {"train_loss": -38.8609733581543, "global_step": 128109, "epoch": 1058} {"train_loss": -38.25069046020508, "global_step": 128110, "epoch": 1058} {"train_loss": -37.68287658691406, "global_step": 128111, "epoch": 1058} {"train_loss": -36.5184211730957, "global_step": 128112, "epoch": 1058} {"train_loss": -35.249366760253906, "global_step": 128113, "epoch": 1058} {"train_loss": -35.988338470458984, "global_step": 128114, "epoch": 1058} {"train_loss": -35.883731842041016, "global_step": 128115, "epoch": 1058} {"train_loss": -37.8437614440918, "global_step": 128116, "epoch": 1058} {"train_loss": -37.406490325927734, "global_step": 128117, "epoch": 1058} {"train_loss": -34.982940673828125, "global_step": 128118, "epoch": 1058} {"train_loss": -35.167701721191406, "global_step": 128119, "epoch": 1058} {"train_loss": -37.389686584472656, "global_step": 128120, "epoch": 1058} {"train_loss": -38.07990264892578, "global_step": 128121, "epoch": 1058} {"train_loss": -36.06696701049805, "global_step": 128122, "epoch": 1058} {"train_loss": -35.26006317138672, "global_step": 128123, "epoch": 1058} {"train_loss": -34.733463287353516, "global_step": 128124, "epoch": 1058} {"train_loss": -36.277191162109375, "global_step": 128125, "epoch": 1058} {"train_loss": -35.979305267333984, "global_step": 128126, "epoch": 1058} {"train_loss": -37.699058532714844, "global_step": 128127, "epoch": 1058} {"train_loss": -33.86452102661133, "global_step": 128128, "epoch": 1058} {"train_loss": -33.666015625, "global_step": 128129, "epoch": 1058} {"train_loss": -37.032020568847656, "global_step": 128130, "epoch": 1058} {"train_loss": -33.366233825683594, "global_step": 128131, "epoch": 1058} {"train_loss": -33.247901916503906, "global_step": 128132, "epoch": 1058} {"train_loss": -36.24349594116211, "global_step": 128133, "epoch": 1058} {"train_loss": -36.436431884765625, "global_step": 128134, "epoch": 1058} {"train_loss": -36.00997543334961, "global_step": 128135, "epoch": 1058} {"train_loss": -36.7429313659668, "global_step": 128136, "epoch": 1058} {"train_loss": -30.560068130493164, "global_step": 128137, "epoch": 1058} {"train_loss": -37.58736487459545, "global_step": 128138, "epoch": 1058, "val_loss": 2833909.0} {"train_loss": -36.60585021972656, "global_step": 128139, "epoch": 1059} {"train_loss": -33.27199172973633, "global_step": 128140, "epoch": 1059} {"train_loss": -34.789588928222656, "global_step": 128141, "epoch": 1059} {"train_loss": -33.893226623535156, "global_step": 128142, "epoch": 1059} {"train_loss": -32.923500061035156, "global_step": 128143, "epoch": 1059} {"train_loss": -35.0525016784668, "global_step": 128144, "epoch": 1059} {"train_loss": -36.445613861083984, "global_step": 128145, "epoch": 1059} {"train_loss": -34.17905807495117, "global_step": 128146, "epoch": 1059} {"train_loss": -35.1320686340332, "global_step": 128147, "epoch": 1059} {"train_loss": -36.17251968383789, "global_step": 128148, "epoch": 1059} {"train_loss": -32.95904541015625, "global_step": 128149, "epoch": 1059} {"train_loss": -35.66640090942383, "global_step": 128150, "epoch": 1059} {"train_loss": -36.67251205444336, "global_step": 128151, "epoch": 1059} {"train_loss": -35.726966857910156, "global_step": 128152, "epoch": 1059} {"train_loss": -36.13798904418945, "global_step": 128153, "epoch": 1059} {"train_loss": -34.1270866394043, "global_step": 128154, "epoch": 1059} {"train_loss": -37.09598922729492, "global_step": 128155, "epoch": 1059} {"train_loss": -35.581748962402344, "global_step": 128156, "epoch": 1059} {"train_loss": -35.266937255859375, "global_step": 128157, "epoch": 1059} {"train_loss": -35.808013916015625, "global_step": 128158, "epoch": 1059} {"train_loss": -36.54984664916992, "global_step": 128159, "epoch": 1059} {"train_loss": -36.49649429321289, "global_step": 128160, "epoch": 1059} {"train_loss": -37.241004943847656, "global_step": 128161, "epoch": 1059} {"train_loss": -36.94239044189453, "global_step": 128162, "epoch": 1059} {"train_loss": -36.37250518798828, "global_step": 128163, "epoch": 1059} {"train_loss": -36.07979965209961, "global_step": 128164, "epoch": 1059} {"train_loss": -37.0606575012207, "global_step": 128165, "epoch": 1059} {"train_loss": -36.6645393371582, "global_step": 128166, "epoch": 1059} {"train_loss": -37.4675407409668, "global_step": 128167, "epoch": 1059} {"train_loss": -37.065425872802734, "global_step": 128168, "epoch": 1059} {"train_loss": -36.99795913696289, "global_step": 128169, "epoch": 1059} {"train_loss": -37.694576263427734, "global_step": 128170, "epoch": 1059} {"train_loss": -37.882259368896484, "global_step": 128171, "epoch": 1059} {"train_loss": -37.2226448059082, "global_step": 128172, "epoch": 1059} {"train_loss": -37.360530853271484, "global_step": 128173, "epoch": 1059} {"train_loss": -37.09064483642578, "global_step": 128174, "epoch": 1059} {"train_loss": -37.51791000366211, "global_step": 128175, "epoch": 1059} {"train_loss": -37.75086212158203, "global_step": 128176, "epoch": 1059} {"train_loss": -37.5742301940918, "global_step": 128177, "epoch": 1059} {"train_loss": -37.14767074584961, "global_step": 128178, "epoch": 1059} {"train_loss": -37.5811882019043, "global_step": 128179, "epoch": 1059} {"train_loss": -37.32624053955078, "global_step": 128180, "epoch": 1059} {"train_loss": -37.489402770996094, "global_step": 128181, "epoch": 1059} {"train_loss": -37.53458786010742, "global_step": 128182, "epoch": 1059} {"train_loss": -37.928375244140625, "global_step": 128183, "epoch": 1059} {"train_loss": -37.95692825317383, "global_step": 128184, "epoch": 1059} {"train_loss": -38.231693267822266, "global_step": 128185, "epoch": 1059} {"train_loss": -38.07826614379883, "global_step": 128186, "epoch": 1059} {"train_loss": -37.893943786621094, "global_step": 128187, "epoch": 1059} {"train_loss": -38.38267135620117, "global_step": 128188, "epoch": 1059} {"train_loss": -38.22951889038086, "global_step": 128189, "epoch": 1059} {"train_loss": -38.14982223510742, "global_step": 128190, "epoch": 1059} {"train_loss": -38.06461715698242, "global_step": 128191, "epoch": 1059} {"train_loss": -37.93475341796875, "global_step": 128192, "epoch": 1059} {"train_loss": -38.079593658447266, "global_step": 128193, "epoch": 1059} {"train_loss": -37.87681198120117, "global_step": 128194, "epoch": 1059} {"train_loss": -38.353572845458984, "global_step": 128195, "epoch": 1059} {"train_loss": -37.23454666137695, "global_step": 128196, "epoch": 1059} {"train_loss": -38.362545013427734, "global_step": 128197, "epoch": 1059} {"train_loss": -38.13552474975586, "global_step": 128198, "epoch": 1059} {"train_loss": -37.964534759521484, "global_step": 128199, "epoch": 1059} {"train_loss": -37.61335372924805, "global_step": 128200, "epoch": 1059} {"train_loss": -38.067012786865234, "global_step": 128201, "epoch": 1059} {"train_loss": -37.79833984375, "global_step": 128202, "epoch": 1059} {"train_loss": -38.514739990234375, "global_step": 128203, "epoch": 1059} {"train_loss": -38.149784088134766, "global_step": 128204, "epoch": 1059} {"train_loss": -37.86190414428711, "global_step": 128205, "epoch": 1059} {"train_loss": -38.239070892333984, "global_step": 128206, "epoch": 1059} {"train_loss": -37.86449432373047, "global_step": 128207, "epoch": 1059} {"train_loss": -37.98378372192383, "global_step": 128208, "epoch": 1059} {"train_loss": -38.173614501953125, "global_step": 128209, "epoch": 1059} {"train_loss": -38.14841079711914, "global_step": 128210, "epoch": 1059} {"train_loss": -38.94165802001953, "global_step": 128211, "epoch": 1059} {"train_loss": -38.583805084228516, "global_step": 128212, "epoch": 1059} {"train_loss": -38.138057708740234, "global_step": 128213, "epoch": 1059} {"train_loss": -38.771846771240234, "global_step": 128214, "epoch": 1059} {"train_loss": -38.86469650268555, "global_step": 128215, "epoch": 1059} {"train_loss": -38.495948791503906, "global_step": 128216, "epoch": 1059} {"train_loss": -38.624298095703125, "global_step": 128217, "epoch": 1059} {"train_loss": -39.12200927734375, "global_step": 128218, "epoch": 1059} {"train_loss": -38.93844223022461, "global_step": 128219, "epoch": 1059} {"train_loss": -38.05025863647461, "global_step": 128220, "epoch": 1059} {"train_loss": -37.09080123901367, "global_step": 128221, "epoch": 1059} {"train_loss": -34.758602142333984, "global_step": 128222, "epoch": 1059} {"train_loss": -35.78098678588867, "global_step": 128223, "epoch": 1059} {"train_loss": -38.2410888671875, "global_step": 128224, "epoch": 1059} {"train_loss": -38.328369140625, "global_step": 128225, "epoch": 1059} {"train_loss": -37.96611022949219, "global_step": 128226, "epoch": 1059} {"train_loss": -37.714595794677734, "global_step": 128227, "epoch": 1059} {"train_loss": -37.516963958740234, "global_step": 128228, "epoch": 1059} {"train_loss": -37.71416091918945, "global_step": 128229, "epoch": 1059} {"train_loss": -39.10543441772461, "global_step": 128230, "epoch": 1059} {"train_loss": -37.893348693847656, "global_step": 128231, "epoch": 1059} {"train_loss": -38.024898529052734, "global_step": 128232, "epoch": 1059} {"train_loss": -38.260738372802734, "global_step": 128233, "epoch": 1059} {"train_loss": -38.59574508666992, "global_step": 128234, "epoch": 1059} {"train_loss": -37.93277359008789, "global_step": 128235, "epoch": 1059} {"train_loss": -38.073482513427734, "global_step": 128236, "epoch": 1059} {"train_loss": -38.270774841308594, "global_step": 128237, "epoch": 1059} {"train_loss": -37.55784225463867, "global_step": 128238, "epoch": 1059} {"train_loss": -38.64070510864258, "global_step": 128239, "epoch": 1059} {"train_loss": -38.780433654785156, "global_step": 128240, "epoch": 1059} {"train_loss": -38.652008056640625, "global_step": 128241, "epoch": 1059} {"train_loss": -38.687984466552734, "global_step": 128242, "epoch": 1059} {"train_loss": -39.032081604003906, "global_step": 128243, "epoch": 1059} {"train_loss": -38.68465805053711, "global_step": 128244, "epoch": 1059} {"train_loss": -38.266395568847656, "global_step": 128245, "epoch": 1059} {"train_loss": -39.208465576171875, "global_step": 128246, "epoch": 1059} {"train_loss": -38.997650146484375, "global_step": 128247, "epoch": 1059} {"train_loss": -38.613162994384766, "global_step": 128248, "epoch": 1059} {"train_loss": -39.276611328125, "global_step": 128249, "epoch": 1059} {"train_loss": -38.0125846862793, "global_step": 128250, "epoch": 1059} {"train_loss": -38.539058685302734, "global_step": 128251, "epoch": 1059} {"train_loss": -38.98002243041992, "global_step": 128252, "epoch": 1059} {"train_loss": -38.91701126098633, "global_step": 128253, "epoch": 1059} {"train_loss": -38.7036247253418, "global_step": 128254, "epoch": 1059} {"train_loss": -38.605377197265625, "global_step": 128255, "epoch": 1059} {"train_loss": -38.88088607788086, "global_step": 128256, "epoch": 1059} {"train_loss": -39.22397994995117, "global_step": 128257, "epoch": 1059} {"train_loss": -38.30788803100586, "global_step": 128258, "epoch": 1059} {"train_loss": -37.52976352912335, "global_step": 128259, "epoch": 1059, "val_loss": 2731588.75} {"train_loss": -38.46793746948242, "global_step": 128260, "epoch": 1060} {"train_loss": -38.75273513793945, "global_step": 128261, "epoch": 1060} {"train_loss": -39.47021484375, "global_step": 128262, "epoch": 1060} {"train_loss": -39.68217849731445, "global_step": 128263, "epoch": 1060} {"train_loss": -40.0824089050293, "global_step": 128264, "epoch": 1060} {"train_loss": -38.58547592163086, "global_step": 128265, "epoch": 1060} {"train_loss": -39.50358963012695, "global_step": 128266, "epoch": 1060} {"train_loss": -38.69679260253906, "global_step": 128267, "epoch": 1060} {"train_loss": -39.30961990356445, "global_step": 128268, "epoch": 1060} {"train_loss": -39.41844940185547, "global_step": 128269, "epoch": 1060} {"train_loss": -39.71303176879883, "global_step": 128270, "epoch": 1060} {"train_loss": -39.89512252807617, "global_step": 128271, "epoch": 1060} {"train_loss": -39.955902099609375, "global_step": 128272, "epoch": 1060} {"train_loss": -39.317134857177734, "global_step": 128273, "epoch": 1060} {"train_loss": -38.81046676635742, "global_step": 128274, "epoch": 1060} {"train_loss": -38.80224609375, "global_step": 128275, "epoch": 1060} {"train_loss": -38.82151412963867, "global_step": 128276, "epoch": 1060} {"train_loss": -38.45399856567383, "global_step": 128277, "epoch": 1060} {"train_loss": -37.38327407836914, "global_step": 128278, "epoch": 1060} {"train_loss": -38.06245040893555, "global_step": 128279, "epoch": 1060} {"train_loss": -39.51906967163086, "global_step": 128280, "epoch": 1060} {"train_loss": -39.722103118896484, "global_step": 128281, "epoch": 1060} {"train_loss": -37.114253997802734, "global_step": 128282, "epoch": 1060} {"train_loss": -33.77932357788086, "global_step": 128283, "epoch": 1060} {"train_loss": -35.92395782470703, "global_step": 128284, "epoch": 1060} {"train_loss": -36.72316360473633, "global_step": 128285, "epoch": 1060} {"train_loss": -38.47967529296875, "global_step": 128286, "epoch": 1060} {"train_loss": -38.88910675048828, "global_step": 128287, "epoch": 1060} {"train_loss": -38.97760009765625, "global_step": 128288, "epoch": 1060} {"train_loss": -37.59657669067383, "global_step": 128289, "epoch": 1060} {"train_loss": -37.40983963012695, "global_step": 128290, "epoch": 1060} {"train_loss": -37.99187088012695, "global_step": 128291, "epoch": 1060} {"train_loss": -37.86377716064453, "global_step": 128292, "epoch": 1060} {"train_loss": -37.43416976928711, "global_step": 128293, "epoch": 1060} {"train_loss": -38.01051330566406, "global_step": 128294, "epoch": 1060} {"train_loss": -37.593021392822266, "global_step": 128295, "epoch": 1060} {"train_loss": -37.74761962890625, "global_step": 128296, "epoch": 1060} {"train_loss": -38.02608871459961, "global_step": 128297, "epoch": 1060} {"train_loss": -38.36629104614258, "global_step": 128298, "epoch": 1060} {"train_loss": -38.96747970581055, "global_step": 128299, "epoch": 1060} {"train_loss": -37.87783432006836, "global_step": 128300, "epoch": 1060} {"train_loss": -38.0279541015625, "global_step": 128301, "epoch": 1060} {"train_loss": -38.818511962890625, "global_step": 128302, "epoch": 1060} {"train_loss": -38.58915328979492, "global_step": 128303, "epoch": 1060} {"train_loss": -38.89336013793945, "global_step": 128304, "epoch": 1060} {"train_loss": -39.172393798828125, "global_step": 128305, "epoch": 1060} {"train_loss": -38.413055419921875, "global_step": 128306, "epoch": 1060} {"train_loss": -37.701385498046875, "global_step": 128307, "epoch": 1060} {"train_loss": -37.994407653808594, "global_step": 128308, "epoch": 1060} {"train_loss": -38.62717819213867, "global_step": 128309, "epoch": 1060} {"train_loss": -38.763031005859375, "global_step": 128310, "epoch": 1060} {"train_loss": -39.645137786865234, "global_step": 128311, "epoch": 1060} {"train_loss": -39.212158203125, "global_step": 128312, "epoch": 1060} {"train_loss": -39.19797897338867, "global_step": 128313, "epoch": 1060} {"train_loss": -39.26146697998047, "global_step": 128314, "epoch": 1060} {"train_loss": -39.35177230834961, "global_step": 128315, "epoch": 1060} {"train_loss": -39.031375885009766, "global_step": 128316, "epoch": 1060} {"train_loss": -38.95847702026367, "global_step": 128317, "epoch": 1060} {"train_loss": -39.49237060546875, "global_step": 128318, "epoch": 1060} {"train_loss": -38.452693939208984, "global_step": 128319, "epoch": 1060} {"train_loss": -39.64509201049805, "global_step": 128320, "epoch": 1060} {"train_loss": -39.10083770751953, "global_step": 128321, "epoch": 1060} {"train_loss": -40.137393951416016, "global_step": 128322, "epoch": 1060} {"train_loss": -39.730770111083984, "global_step": 128323, "epoch": 1060} {"train_loss": -39.36738204956055, "global_step": 128324, "epoch": 1060} {"train_loss": -39.748565673828125, "global_step": 128325, "epoch": 1060} {"train_loss": -39.490631103515625, "global_step": 128326, "epoch": 1060} {"train_loss": -38.62016677856445, "global_step": 128327, "epoch": 1060} {"train_loss": -39.47825241088867, "global_step": 128328, "epoch": 1060} {"train_loss": -39.25051498413086, "global_step": 128329, "epoch": 1060} {"train_loss": -38.69901657104492, "global_step": 128330, "epoch": 1060} {"train_loss": -39.61186599731445, "global_step": 128331, "epoch": 1060} {"train_loss": -39.39976119995117, "global_step": 128332, "epoch": 1060} {"train_loss": -38.986549377441406, "global_step": 128333, "epoch": 1060} {"train_loss": -40.15608596801758, "global_step": 128334, "epoch": 1060} {"train_loss": -39.133575439453125, "global_step": 128335, "epoch": 1060} {"train_loss": -39.12370681762695, "global_step": 128336, "epoch": 1060} {"train_loss": -39.69103240966797, "global_step": 128337, "epoch": 1060} {"train_loss": -39.223487854003906, "global_step": 128338, "epoch": 1060} {"train_loss": -36.9555778503418, "global_step": 128339, "epoch": 1060} {"train_loss": -38.87002182006836, "global_step": 128340, "epoch": 1060} {"train_loss": -38.836788177490234, "global_step": 128341, "epoch": 1060} {"train_loss": -38.17804718017578, "global_step": 128342, "epoch": 1060} {"train_loss": -38.51396560668945, "global_step": 128343, "epoch": 1060} {"train_loss": -38.891639709472656, "global_step": 128344, "epoch": 1060} {"train_loss": -38.06842803955078, "global_step": 128345, "epoch": 1060} {"train_loss": -36.19108200073242, "global_step": 128346, "epoch": 1060} {"train_loss": -37.69378662109375, "global_step": 128347, "epoch": 1060} {"train_loss": -39.069923400878906, "global_step": 128348, "epoch": 1060} {"train_loss": -39.02700424194336, "global_step": 128349, "epoch": 1060} {"train_loss": -38.646385192871094, "global_step": 128350, "epoch": 1060} {"train_loss": -37.3712272644043, "global_step": 128351, "epoch": 1060} {"train_loss": -37.49440383911133, "global_step": 128352, "epoch": 1060} {"train_loss": -37.954471588134766, "global_step": 128353, "epoch": 1060} {"train_loss": -38.60872268676758, "global_step": 128354, "epoch": 1060} {"train_loss": -38.72273635864258, "global_step": 128355, "epoch": 1060} {"train_loss": -35.51168441772461, "global_step": 128356, "epoch": 1060} {"train_loss": -36.92364501953125, "global_step": 128357, "epoch": 1060} {"train_loss": -38.86666488647461, "global_step": 128358, "epoch": 1060} {"train_loss": -38.54039764404297, "global_step": 128359, "epoch": 1060} {"train_loss": -37.35787582397461, "global_step": 128360, "epoch": 1060} {"train_loss": -39.1015739440918, "global_step": 128361, "epoch": 1060} {"train_loss": -39.0908317565918, "global_step": 128362, "epoch": 1060} {"train_loss": -38.80364227294922, "global_step": 128363, "epoch": 1060} {"train_loss": -39.101478576660156, "global_step": 128364, "epoch": 1060} {"train_loss": -37.96632766723633, "global_step": 128365, "epoch": 1060} {"train_loss": -39.05819320678711, "global_step": 128366, "epoch": 1060} {"train_loss": -39.22693634033203, "global_step": 128367, "epoch": 1060} {"train_loss": -39.03670883178711, "global_step": 128368, "epoch": 1060} {"train_loss": -38.39091110229492, "global_step": 128369, "epoch": 1060} {"train_loss": -38.67326736450195, "global_step": 128370, "epoch": 1060} {"train_loss": -39.193016052246094, "global_step": 128371, "epoch": 1060} {"train_loss": -38.379268646240234, "global_step": 128372, "epoch": 1060} {"train_loss": -39.38532638549805, "global_step": 128373, "epoch": 1060} {"train_loss": -39.248291015625, "global_step": 128374, "epoch": 1060} {"train_loss": -37.1143684387207, "global_step": 128375, "epoch": 1060} {"train_loss": -38.52985763549805, "global_step": 128376, "epoch": 1060} {"train_loss": -38.07767868041992, "global_step": 128377, "epoch": 1060} {"train_loss": -38.426021575927734, "global_step": 128378, "epoch": 1060} {"train_loss": -38.68196487426758, "global_step": 128379, "epoch": 1060} {"train_loss": -38.61028081720526, "global_step": 128380, "epoch": 1060, "val_loss": 2571102.75} {"train_loss": -38.63666915893555, "global_step": 128381, "epoch": 1061} {"train_loss": -38.44599533081055, "global_step": 128382, "epoch": 1061} {"train_loss": -38.41357421875, "global_step": 128383, "epoch": 1061} {"train_loss": -37.620025634765625, "global_step": 128384, "epoch": 1061} {"train_loss": -38.77667236328125, "global_step": 128385, "epoch": 1061} {"train_loss": -37.79984664916992, "global_step": 128386, "epoch": 1061} {"train_loss": -38.90947341918945, "global_step": 128387, "epoch": 1061} {"train_loss": -38.353267669677734, "global_step": 128388, "epoch": 1061} {"train_loss": -39.36387252807617, "global_step": 128389, "epoch": 1061} {"train_loss": -39.35109329223633, "global_step": 128390, "epoch": 1061} {"train_loss": -39.13385009765625, "global_step": 128391, "epoch": 1061} {"train_loss": -39.047142028808594, "global_step": 128392, "epoch": 1061} {"train_loss": -39.146461486816406, "global_step": 128393, "epoch": 1061} {"train_loss": -38.80595016479492, "global_step": 128394, "epoch": 1061} {"train_loss": -39.09267044067383, "global_step": 128395, "epoch": 1061} {"train_loss": -39.44218826293945, "global_step": 128396, "epoch": 1061} {"train_loss": -38.545387268066406, "global_step": 128397, "epoch": 1061} {"train_loss": -35.8028678894043, "global_step": 128398, "epoch": 1061} {"train_loss": -38.50580978393555, "global_step": 128399, "epoch": 1061} {"train_loss": -34.87358474731445, "global_step": 128400, "epoch": 1061} {"train_loss": -36.37004470825195, "global_step": 128401, "epoch": 1061} {"train_loss": -37.86458969116211, "global_step": 128402, "epoch": 1061} {"train_loss": -37.203208923339844, "global_step": 128403, "epoch": 1061} {"train_loss": -33.4138069152832, "global_step": 128404, "epoch": 1061} {"train_loss": -36.28837966918945, "global_step": 128405, "epoch": 1061} {"train_loss": -35.52302169799805, "global_step": 128406, "epoch": 1061} {"train_loss": -37.148380279541016, "global_step": 128407, "epoch": 1061} {"train_loss": -33.7458381652832, "global_step": 128408, "epoch": 1061} {"train_loss": -36.844478607177734, "global_step": 128409, "epoch": 1061} {"train_loss": -37.64161682128906, "global_step": 128410, "epoch": 1061} {"train_loss": -36.653072357177734, "global_step": 128411, "epoch": 1061} {"train_loss": -37.52598190307617, "global_step": 128412, "epoch": 1061} {"train_loss": -35.866764068603516, "global_step": 128413, "epoch": 1061} {"train_loss": -37.3453254699707, "global_step": 128414, "epoch": 1061} {"train_loss": -36.10464096069336, "global_step": 128415, "epoch": 1061} {"train_loss": -36.373043060302734, "global_step": 128416, "epoch": 1061} {"train_loss": -33.290245056152344, "global_step": 128417, "epoch": 1061} {"train_loss": -37.63779830932617, "global_step": 128418, "epoch": 1061} {"train_loss": -37.257991790771484, "global_step": 128419, "epoch": 1061} {"train_loss": -35.44023895263672, "global_step": 128420, "epoch": 1061} {"train_loss": -33.39107131958008, "global_step": 128421, "epoch": 1061} {"train_loss": -36.157691955566406, "global_step": 128422, "epoch": 1061} {"train_loss": -37.160579681396484, "global_step": 128423, "epoch": 1061} {"train_loss": -34.80680465698242, "global_step": 128424, "epoch": 1061} {"train_loss": -37.53305435180664, "global_step": 128425, "epoch": 1061} {"train_loss": -36.64189910888672, "global_step": 128426, "epoch": 1061} {"train_loss": -38.17727279663086, "global_step": 128427, "epoch": 1061} {"train_loss": -36.03133773803711, "global_step": 128428, "epoch": 1061} {"train_loss": -35.913734436035156, "global_step": 128429, "epoch": 1061} {"train_loss": -37.046966552734375, "global_step": 128430, "epoch": 1061} {"train_loss": -37.631683349609375, "global_step": 128431, "epoch": 1061} {"train_loss": -35.06718444824219, "global_step": 128432, "epoch": 1061} {"train_loss": -38.09336471557617, "global_step": 128433, "epoch": 1061} {"train_loss": -36.982357025146484, "global_step": 128434, "epoch": 1061} {"train_loss": -38.48808670043945, "global_step": 128435, "epoch": 1061} {"train_loss": -38.426513671875, "global_step": 128436, "epoch": 1061} {"train_loss": -36.12861251831055, "global_step": 128437, "epoch": 1061} {"train_loss": -38.2177734375, "global_step": 128438, "epoch": 1061} {"train_loss": -37.69895935058594, "global_step": 128439, "epoch": 1061} {"train_loss": -36.63468551635742, "global_step": 128440, "epoch": 1061} {"train_loss": -38.70195388793945, "global_step": 128441, "epoch": 1061} {"train_loss": -38.26981735229492, "global_step": 128442, "epoch": 1061} {"train_loss": -37.82871627807617, "global_step": 128443, "epoch": 1061} {"train_loss": -38.64571762084961, "global_step": 128444, "epoch": 1061} {"train_loss": -38.39393997192383, "global_step": 128445, "epoch": 1061} {"train_loss": -38.51815414428711, "global_step": 128446, "epoch": 1061} {"train_loss": -38.65334701538086, "global_step": 128447, "epoch": 1061} {"train_loss": -38.60960388183594, "global_step": 128448, "epoch": 1061} {"train_loss": -37.89703369140625, "global_step": 128449, "epoch": 1061} {"train_loss": -38.81821823120117, "global_step": 128450, "epoch": 1061} {"train_loss": -39.05959701538086, "global_step": 128451, "epoch": 1061} {"train_loss": -38.91408920288086, "global_step": 128452, "epoch": 1061} {"train_loss": -38.44116973876953, "global_step": 128453, "epoch": 1061} {"train_loss": -38.81914138793945, "global_step": 128454, "epoch": 1061} {"train_loss": -38.30925369262695, "global_step": 128455, "epoch": 1061} {"train_loss": -38.72408676147461, "global_step": 128456, "epoch": 1061} {"train_loss": -39.11092758178711, "global_step": 128457, "epoch": 1061} {"train_loss": -38.816097259521484, "global_step": 128458, "epoch": 1061} {"train_loss": -39.05793380737305, "global_step": 128459, "epoch": 1061} {"train_loss": -39.12919235229492, "global_step": 128460, "epoch": 1061} {"train_loss": -37.853981018066406, "global_step": 128461, "epoch": 1061} {"train_loss": -39.2781982421875, "global_step": 128462, "epoch": 1061} {"train_loss": -38.84098815917969, "global_step": 128463, "epoch": 1061} {"train_loss": -39.02126693725586, "global_step": 128464, "epoch": 1061} {"train_loss": -38.54066467285156, "global_step": 128465, "epoch": 1061} {"train_loss": -37.59579086303711, "global_step": 128466, "epoch": 1061} {"train_loss": -37.422359466552734, "global_step": 128467, "epoch": 1061} {"train_loss": -37.73788070678711, "global_step": 128468, "epoch": 1061} {"train_loss": -38.79746627807617, "global_step": 128469, "epoch": 1061} {"train_loss": -39.062557220458984, "global_step": 128470, "epoch": 1061} {"train_loss": -37.67578125, "global_step": 128471, "epoch": 1061} {"train_loss": -37.32624053955078, "global_step": 128472, "epoch": 1061} {"train_loss": -37.09333038330078, "global_step": 128473, "epoch": 1061} {"train_loss": -38.09206008911133, "global_step": 128474, "epoch": 1061} {"train_loss": -36.995723724365234, "global_step": 128475, "epoch": 1061} {"train_loss": -38.27910614013672, "global_step": 128476, "epoch": 1061} {"train_loss": -38.385066986083984, "global_step": 128477, "epoch": 1061} {"train_loss": -37.53934097290039, "global_step": 128478, "epoch": 1061} {"train_loss": -36.45859909057617, "global_step": 128479, "epoch": 1061} {"train_loss": -37.17277145385742, "global_step": 128480, "epoch": 1061} {"train_loss": -39.138240814208984, "global_step": 128481, "epoch": 1061} {"train_loss": -38.651485443115234, "global_step": 128482, "epoch": 1061} {"train_loss": -38.72492980957031, "global_step": 128483, "epoch": 1061} {"train_loss": -39.0415153503418, "global_step": 128484, "epoch": 1061} {"train_loss": -38.518096923828125, "global_step": 128485, "epoch": 1061} {"train_loss": -37.65222930908203, "global_step": 128486, "epoch": 1061} {"train_loss": -39.05912399291992, "global_step": 128487, "epoch": 1061} {"train_loss": -37.61504364013672, "global_step": 128488, "epoch": 1061} {"train_loss": -38.74506759643555, "global_step": 128489, "epoch": 1061} {"train_loss": -39.35505676269531, "global_step": 128490, "epoch": 1061} {"train_loss": -38.986228942871094, "global_step": 128491, "epoch": 1061} {"train_loss": -39.15536117553711, "global_step": 128492, "epoch": 1061} {"train_loss": -39.004947662353516, "global_step": 128493, "epoch": 1061} {"train_loss": -39.45840072631836, "global_step": 128494, "epoch": 1061} {"train_loss": -39.35056686401367, "global_step": 128495, "epoch": 1061} {"train_loss": -38.9921989440918, "global_step": 128496, "epoch": 1061} {"train_loss": -39.478729248046875, "global_step": 128497, "epoch": 1061} {"train_loss": -39.514984130859375, "global_step": 128498, "epoch": 1061} {"train_loss": -39.38969802856445, "global_step": 128499, "epoch": 1061} {"train_loss": -37.038936614990234, "global_step": 128500, "epoch": 1061} {"train_loss": -37.83344426430946, "global_step": 128501, "epoch": 1061, "val_loss": 2699283.25} {"train_loss": -39.22207260131836, "global_step": 128502, "epoch": 1062} {"train_loss": -39.50761032104492, "global_step": 128503, "epoch": 1062} {"train_loss": -39.04714584350586, "global_step": 128504, "epoch": 1062} {"train_loss": -39.2275276184082, "global_step": 128505, "epoch": 1062} {"train_loss": -39.5073356628418, "global_step": 128506, "epoch": 1062} {"train_loss": -39.70722579956055, "global_step": 128507, "epoch": 1062} {"train_loss": -38.99162292480469, "global_step": 128508, "epoch": 1062} {"train_loss": -39.3574333190918, "global_step": 128509, "epoch": 1062} {"train_loss": -38.68950271606445, "global_step": 128510, "epoch": 1062} {"train_loss": -39.110164642333984, "global_step": 128511, "epoch": 1062} {"train_loss": -39.93495559692383, "global_step": 128512, "epoch": 1062} {"train_loss": -39.03656005859375, "global_step": 128513, "epoch": 1062} {"train_loss": -39.48763656616211, "global_step": 128514, "epoch": 1062} {"train_loss": -39.107845306396484, "global_step": 128515, "epoch": 1062} {"train_loss": -39.1910285949707, "global_step": 128516, "epoch": 1062} {"train_loss": -39.89460372924805, "global_step": 128517, "epoch": 1062} {"train_loss": -38.468135833740234, "global_step": 128518, "epoch": 1062} {"train_loss": -39.4779052734375, "global_step": 128519, "epoch": 1062} {"train_loss": -38.90639114379883, "global_step": 128520, "epoch": 1062} {"train_loss": -39.649505615234375, "global_step": 128521, "epoch": 1062} {"train_loss": -39.2076416015625, "global_step": 128522, "epoch": 1062} {"train_loss": -39.7279052734375, "global_step": 128523, "epoch": 1062} {"train_loss": -39.877559661865234, "global_step": 128524, "epoch": 1062} {"train_loss": -39.99283218383789, "global_step": 128525, "epoch": 1062} {"train_loss": -38.570037841796875, "global_step": 128526, "epoch": 1062} {"train_loss": -40.006446838378906, "global_step": 128527, "epoch": 1062} {"train_loss": -39.23749923706055, "global_step": 128528, "epoch": 1062} {"train_loss": -39.05744171142578, "global_step": 128529, "epoch": 1062} {"train_loss": -35.68587112426758, "global_step": 128530, "epoch": 1062} {"train_loss": -38.48932647705078, "global_step": 128531, "epoch": 1062} {"train_loss": -39.40610885620117, "global_step": 128532, "epoch": 1062} {"train_loss": -37.060821533203125, "global_step": 128533, "epoch": 1062} {"train_loss": -39.68850326538086, "global_step": 128534, "epoch": 1062} {"train_loss": -38.53255081176758, "global_step": 128535, "epoch": 1062} {"train_loss": -38.40009307861328, "global_step": 128536, "epoch": 1062} {"train_loss": -38.18760299682617, "global_step": 128537, "epoch": 1062} {"train_loss": -37.67799758911133, "global_step": 128538, "epoch": 1062} {"train_loss": -33.072120666503906, "global_step": 128539, "epoch": 1062} {"train_loss": -25.906051635742188, "global_step": 128540, "epoch": 1062} {"train_loss": -32.1726188659668, "global_step": 128541, "epoch": 1062} {"train_loss": -37.241390228271484, "global_step": 128542, "epoch": 1062} {"train_loss": -35.77997970581055, "global_step": 128543, "epoch": 1062} {"train_loss": -34.38275909423828, "global_step": 128544, "epoch": 1062} {"train_loss": -32.02793502807617, "global_step": 128545, "epoch": 1062} {"train_loss": -35.488956451416016, "global_step": 128546, "epoch": 1062} {"train_loss": -36.868385314941406, "global_step": 128547, "epoch": 1062} {"train_loss": -32.98867416381836, "global_step": 128548, "epoch": 1062} {"train_loss": -35.609004974365234, "global_step": 128549, "epoch": 1062} {"train_loss": -35.77384567260742, "global_step": 128550, "epoch": 1062} {"train_loss": -38.28615188598633, "global_step": 128551, "epoch": 1062} {"train_loss": -36.38267135620117, "global_step": 128552, "epoch": 1062} {"train_loss": -37.535099029541016, "global_step": 128553, "epoch": 1062} {"train_loss": -34.856788635253906, "global_step": 128554, "epoch": 1062} {"train_loss": -35.50311279296875, "global_step": 128555, "epoch": 1062} {"train_loss": -36.69212341308594, "global_step": 128556, "epoch": 1062} {"train_loss": -37.57314682006836, "global_step": 128557, "epoch": 1062} {"train_loss": -36.890193939208984, "global_step": 128558, "epoch": 1062} {"train_loss": -36.476844787597656, "global_step": 128559, "epoch": 1062} {"train_loss": -35.13766098022461, "global_step": 128560, "epoch": 1062} {"train_loss": -34.26738357543945, "global_step": 128561, "epoch": 1062} {"train_loss": -36.363155364990234, "global_step": 128562, "epoch": 1062} {"train_loss": -35.81291961669922, "global_step": 128563, "epoch": 1062} {"train_loss": -33.64832305908203, "global_step": 128564, "epoch": 1062} {"train_loss": -34.69199752807617, "global_step": 128565, "epoch": 1062} {"train_loss": -35.41187286376953, "global_step": 128566, "epoch": 1062} {"train_loss": -36.25179672241211, "global_step": 128567, "epoch": 1062} {"train_loss": -37.488319396972656, "global_step": 128568, "epoch": 1062} {"train_loss": -35.70008850097656, "global_step": 128569, "epoch": 1062} {"train_loss": -34.4736328125, "global_step": 128570, "epoch": 1062} {"train_loss": -36.223655700683594, "global_step": 128571, "epoch": 1062} {"train_loss": -36.653564453125, "global_step": 128572, "epoch": 1062} {"train_loss": -36.48706817626953, "global_step": 128573, "epoch": 1062} {"train_loss": -37.225502014160156, "global_step": 128574, "epoch": 1062} {"train_loss": -37.49089431762695, "global_step": 128575, "epoch": 1062} {"train_loss": -36.01728057861328, "global_step": 128576, "epoch": 1062} {"train_loss": -38.1646728515625, "global_step": 128577, "epoch": 1062} {"train_loss": -38.22402572631836, "global_step": 128578, "epoch": 1062} {"train_loss": -37.16939163208008, "global_step": 128579, "epoch": 1062} {"train_loss": -38.2977409362793, "global_step": 128580, "epoch": 1062} {"train_loss": -37.59345245361328, "global_step": 128581, "epoch": 1062} {"train_loss": -37.56693649291992, "global_step": 128582, "epoch": 1062} {"train_loss": -37.90052032470703, "global_step": 128583, "epoch": 1062} {"train_loss": -37.04985809326172, "global_step": 128584, "epoch": 1062} {"train_loss": -38.222137451171875, "global_step": 128585, "epoch": 1062} {"train_loss": -37.44065475463867, "global_step": 128586, "epoch": 1062} {"train_loss": -36.332027435302734, "global_step": 128587, "epoch": 1062} {"train_loss": -38.21725845336914, "global_step": 128588, "epoch": 1062} {"train_loss": -37.613521575927734, "global_step": 128589, "epoch": 1062} {"train_loss": -37.62282180786133, "global_step": 128590, "epoch": 1062} {"train_loss": -37.1944580078125, "global_step": 128591, "epoch": 1062} {"train_loss": -37.65998458862305, "global_step": 128592, "epoch": 1062} {"train_loss": -37.89983367919922, "global_step": 128593, "epoch": 1062} {"train_loss": -38.34225082397461, "global_step": 128594, "epoch": 1062} {"train_loss": -38.47146224975586, "global_step": 128595, "epoch": 1062} {"train_loss": -37.82203674316406, "global_step": 128596, "epoch": 1062} {"train_loss": -38.34095001220703, "global_step": 128597, "epoch": 1062} {"train_loss": -37.231353759765625, "global_step": 128598, "epoch": 1062} {"train_loss": -38.02190017700195, "global_step": 128599, "epoch": 1062} {"train_loss": -37.74000930786133, "global_step": 128600, "epoch": 1062} {"train_loss": -38.398353576660156, "global_step": 128601, "epoch": 1062} {"train_loss": -38.115516662597656, "global_step": 128602, "epoch": 1062} {"train_loss": -38.285789489746094, "global_step": 128603, "epoch": 1062} {"train_loss": -38.53798294067383, "global_step": 128604, "epoch": 1062} {"train_loss": -34.972808837890625, "global_step": 128605, "epoch": 1062} {"train_loss": -38.289039611816406, "global_step": 128606, "epoch": 1062} {"train_loss": -38.177120208740234, "global_step": 128607, "epoch": 1062} {"train_loss": -37.86721420288086, "global_step": 128608, "epoch": 1062} {"train_loss": -38.277400970458984, "global_step": 128609, "epoch": 1062} {"train_loss": -38.665687561035156, "global_step": 128610, "epoch": 1062} {"train_loss": -38.37455368041992, "global_step": 128611, "epoch": 1062} {"train_loss": -39.01544189453125, "global_step": 128612, "epoch": 1062} {"train_loss": -38.489219665527344, "global_step": 128613, "epoch": 1062} {"train_loss": -35.78487777709961, "global_step": 128614, "epoch": 1062} {"train_loss": -38.37579345703125, "global_step": 128615, "epoch": 1062} {"train_loss": -38.97299575805664, "global_step": 128616, "epoch": 1062} {"train_loss": -38.3709831237793, "global_step": 128617, "epoch": 1062} {"train_loss": -38.412933349609375, "global_step": 128618, "epoch": 1062} {"train_loss": -39.10132598876953, "global_step": 128619, "epoch": 1062} {"train_loss": -39.49169921875, "global_step": 128620, "epoch": 1062} {"train_loss": -38.73587417602539, "global_step": 128621, "epoch": 1062} {"train_loss": -37.5168469011291, "global_step": 128622, "epoch": 1062, "val_loss": 2705659.25} {"train_loss": -39.08330535888672, "global_step": 128623, "epoch": 1063} {"train_loss": -39.13820266723633, "global_step": 128624, "epoch": 1063} {"train_loss": -39.53972244262695, "global_step": 128625, "epoch": 1063} {"train_loss": -39.374202728271484, "global_step": 128626, "epoch": 1063} {"train_loss": -39.070045471191406, "global_step": 128627, "epoch": 1063} {"train_loss": -38.22159957885742, "global_step": 128628, "epoch": 1063} {"train_loss": -39.62272644042969, "global_step": 128629, "epoch": 1063} {"train_loss": -39.01263427734375, "global_step": 128630, "epoch": 1063} {"train_loss": -39.40446090698242, "global_step": 128631, "epoch": 1063} {"train_loss": -39.310359954833984, "global_step": 128632, "epoch": 1063} {"train_loss": -39.09176254272461, "global_step": 128633, "epoch": 1063} {"train_loss": -39.42733383178711, "global_step": 128634, "epoch": 1063} {"train_loss": -37.912261962890625, "global_step": 128635, "epoch": 1063} {"train_loss": -38.81354904174805, "global_step": 128636, "epoch": 1063} {"train_loss": -38.1695556640625, "global_step": 128637, "epoch": 1063} {"train_loss": -38.16179275512695, "global_step": 128638, "epoch": 1063} {"train_loss": -37.17475509643555, "global_step": 128639, "epoch": 1063} {"train_loss": -37.40322494506836, "global_step": 128640, "epoch": 1063} {"train_loss": -37.690547943115234, "global_step": 128641, "epoch": 1063} {"train_loss": -38.59771728515625, "global_step": 128642, "epoch": 1063} {"train_loss": -39.56341552734375, "global_step": 128643, "epoch": 1063} {"train_loss": -38.280372619628906, "global_step": 128644, "epoch": 1063} {"train_loss": -38.115020751953125, "global_step": 128645, "epoch": 1063} {"train_loss": -39.121002197265625, "global_step": 128646, "epoch": 1063} {"train_loss": -39.54611587524414, "global_step": 128647, "epoch": 1063} {"train_loss": -38.646766662597656, "global_step": 128648, "epoch": 1063} {"train_loss": -38.68549728393555, "global_step": 128649, "epoch": 1063} {"train_loss": -38.25428009033203, "global_step": 128650, "epoch": 1063} {"train_loss": -38.98122787475586, "global_step": 128651, "epoch": 1063} {"train_loss": -39.055965423583984, "global_step": 128652, "epoch": 1063} {"train_loss": -38.25014114379883, "global_step": 128653, "epoch": 1063} {"train_loss": -37.68464660644531, "global_step": 128654, "epoch": 1063} {"train_loss": -39.30096435546875, "global_step": 128655, "epoch": 1063} {"train_loss": -40.077484130859375, "global_step": 128656, "epoch": 1063} {"train_loss": -38.973060607910156, "global_step": 128657, "epoch": 1063} {"train_loss": -38.565406799316406, "global_step": 128658, "epoch": 1063} {"train_loss": -39.5435905456543, "global_step": 128659, "epoch": 1063} {"train_loss": -38.18193817138672, "global_step": 128660, "epoch": 1063} {"train_loss": -39.74763870239258, "global_step": 128661, "epoch": 1063} {"train_loss": -39.575469970703125, "global_step": 128662, "epoch": 1063} {"train_loss": -37.26957321166992, "global_step": 128663, "epoch": 1063} {"train_loss": -38.37322998046875, "global_step": 128664, "epoch": 1063} {"train_loss": -39.365840911865234, "global_step": 128665, "epoch": 1063} {"train_loss": -37.01328659057617, "global_step": 128666, "epoch": 1063} {"train_loss": -38.1959228515625, "global_step": 128667, "epoch": 1063} {"train_loss": -38.42118453979492, "global_step": 128668, "epoch": 1063} {"train_loss": -38.232540130615234, "global_step": 128669, "epoch": 1063} {"train_loss": -39.66791915893555, "global_step": 128670, "epoch": 1063} {"train_loss": -39.34518051147461, "global_step": 128671, "epoch": 1063} {"train_loss": -38.51394271850586, "global_step": 128672, "epoch": 1063} {"train_loss": -38.45793533325195, "global_step": 128673, "epoch": 1063} {"train_loss": -35.63946533203125, "global_step": 128674, "epoch": 1063} {"train_loss": -38.56591796875, "global_step": 128675, "epoch": 1063} {"train_loss": -39.046329498291016, "global_step": 128676, "epoch": 1063} {"train_loss": -38.465538024902344, "global_step": 128677, "epoch": 1063} {"train_loss": -36.643001556396484, "global_step": 128678, "epoch": 1063} {"train_loss": -38.34244918823242, "global_step": 128679, "epoch": 1063} {"train_loss": -39.1209716796875, "global_step": 128680, "epoch": 1063} {"train_loss": -36.15123748779297, "global_step": 128681, "epoch": 1063} {"train_loss": -37.680206298828125, "global_step": 128682, "epoch": 1063} {"train_loss": -38.09358596801758, "global_step": 128683, "epoch": 1063} {"train_loss": -38.29985046386719, "global_step": 128684, "epoch": 1063} {"train_loss": -38.914127349853516, "global_step": 128685, "epoch": 1063} {"train_loss": -39.19963455200195, "global_step": 128686, "epoch": 1063} {"train_loss": -38.60647201538086, "global_step": 128687, "epoch": 1063} {"train_loss": -38.50556564331055, "global_step": 128688, "epoch": 1063} {"train_loss": -39.219749450683594, "global_step": 128689, "epoch": 1063} {"train_loss": -38.385986328125, "global_step": 128690, "epoch": 1063} {"train_loss": -38.985904693603516, "global_step": 128691, "epoch": 1063} {"train_loss": -39.3452033996582, "global_step": 128692, "epoch": 1063} {"train_loss": -38.97785568237305, "global_step": 128693, "epoch": 1063} {"train_loss": -39.090354919433594, "global_step": 128694, "epoch": 1063} {"train_loss": -38.91756820678711, "global_step": 128695, "epoch": 1063} {"train_loss": -39.442684173583984, "global_step": 128696, "epoch": 1063} {"train_loss": -39.45391082763672, "global_step": 128697, "epoch": 1063} {"train_loss": -38.52772903442383, "global_step": 128698, "epoch": 1063} {"train_loss": -39.061153411865234, "global_step": 128699, "epoch": 1063} {"train_loss": -37.94411087036133, "global_step": 128700, "epoch": 1063} {"train_loss": -38.96401596069336, "global_step": 128701, "epoch": 1063} {"train_loss": -39.368934631347656, "global_step": 128702, "epoch": 1063} {"train_loss": -39.40643310546875, "global_step": 128703, "epoch": 1063} {"train_loss": -38.5091552734375, "global_step": 128704, "epoch": 1063} {"train_loss": -38.424278259277344, "global_step": 128705, "epoch": 1063} {"train_loss": -39.06266403198242, "global_step": 128706, "epoch": 1063} {"train_loss": -38.4388542175293, "global_step": 128707, "epoch": 1063} {"train_loss": -39.29000473022461, "global_step": 128708, "epoch": 1063} {"train_loss": -38.7917366027832, "global_step": 128709, "epoch": 1063} {"train_loss": -39.30897521972656, "global_step": 128710, "epoch": 1063} {"train_loss": -38.8247184753418, "global_step": 128711, "epoch": 1063} {"train_loss": -37.61469650268555, "global_step": 128712, "epoch": 1063} {"train_loss": -39.71687316894531, "global_step": 128713, "epoch": 1063} {"train_loss": -39.11637496948242, "global_step": 128714, "epoch": 1063} {"train_loss": -39.038516998291016, "global_step": 128715, "epoch": 1063} {"train_loss": -39.830562591552734, "global_step": 128716, "epoch": 1063} {"train_loss": -37.129066467285156, "global_step": 128717, "epoch": 1063} {"train_loss": -38.62467956542969, "global_step": 128718, "epoch": 1063} {"train_loss": -39.35914611816406, "global_step": 128719, "epoch": 1063} {"train_loss": -39.44667053222656, "global_step": 128720, "epoch": 1063} {"train_loss": -38.10226058959961, "global_step": 128721, "epoch": 1063} {"train_loss": -36.678218841552734, "global_step": 128722, "epoch": 1063} {"train_loss": -35.29240036010742, "global_step": 128723, "epoch": 1063} {"train_loss": -31.948638916015625, "global_step": 128724, "epoch": 1063} {"train_loss": -30.311141967773438, "global_step": 128725, "epoch": 1063} {"train_loss": -35.00040817260742, "global_step": 128726, "epoch": 1063} {"train_loss": -37.994380950927734, "global_step": 128727, "epoch": 1063} {"train_loss": -30.55731773376465, "global_step": 128728, "epoch": 1063} {"train_loss": -35.856685638427734, "global_step": 128729, "epoch": 1063} {"train_loss": -37.243324279785156, "global_step": 128730, "epoch": 1063} {"train_loss": -36.065616607666016, "global_step": 128731, "epoch": 1063} {"train_loss": -36.41560745239258, "global_step": 128732, "epoch": 1063} {"train_loss": -36.365962982177734, "global_step": 128733, "epoch": 1063} {"train_loss": -38.47050094604492, "global_step": 128734, "epoch": 1063} {"train_loss": -36.62352752685547, "global_step": 128735, "epoch": 1063} {"train_loss": -38.022430419921875, "global_step": 128736, "epoch": 1063} {"train_loss": -36.812530517578125, "global_step": 128737, "epoch": 1063} {"train_loss": -36.91837692260742, "global_step": 128738, "epoch": 1063} {"train_loss": -36.34619903564453, "global_step": 128739, "epoch": 1063} {"train_loss": -38.18769454956055, "global_step": 128740, "epoch": 1063} {"train_loss": -38.0160026550293, "global_step": 128741, "epoch": 1063} {"train_loss": -38.83557891845703, "global_step": 128742, "epoch": 1063} {"train_loss": -38.23365848320575, "global_step": 128743, "epoch": 1063, "val_loss": 2696268.75} {"train_loss": -38.98185348510742, "global_step": 128744, "epoch": 1064} {"train_loss": -39.10829544067383, "global_step": 128745, "epoch": 1064} {"train_loss": -38.94120407104492, "global_step": 128746, "epoch": 1064} {"train_loss": -38.48474884033203, "global_step": 128747, "epoch": 1064} {"train_loss": -38.012088775634766, "global_step": 128748, "epoch": 1064} {"train_loss": -38.77531433105469, "global_step": 128749, "epoch": 1064} {"train_loss": -38.314659118652344, "global_step": 128750, "epoch": 1064} {"train_loss": -37.80813217163086, "global_step": 128751, "epoch": 1064} {"train_loss": -38.94136047363281, "global_step": 128752, "epoch": 1064} {"train_loss": -39.364559173583984, "global_step": 128753, "epoch": 1064} {"train_loss": -38.572933197021484, "global_step": 128754, "epoch": 1064} {"train_loss": -38.295711517333984, "global_step": 128755, "epoch": 1064} {"train_loss": -36.64842987060547, "global_step": 128756, "epoch": 1064} {"train_loss": -37.88618087768555, "global_step": 128757, "epoch": 1064} {"train_loss": -38.668609619140625, "global_step": 128758, "epoch": 1064} {"train_loss": -39.437442779541016, "global_step": 128759, "epoch": 1064} {"train_loss": -38.801002502441406, "global_step": 128760, "epoch": 1064} {"train_loss": -38.21442794799805, "global_step": 128761, "epoch": 1064} {"train_loss": -39.02840042114258, "global_step": 128762, "epoch": 1064} {"train_loss": -32.737693786621094, "global_step": 128763, "epoch": 1064} {"train_loss": -38.02120590209961, "global_step": 128764, "epoch": 1064} {"train_loss": -36.5402717590332, "global_step": 128765, "epoch": 1064} {"train_loss": -37.597312927246094, "global_step": 128766, "epoch": 1064} {"train_loss": -35.30160140991211, "global_step": 128767, "epoch": 1064} {"train_loss": -37.81646728515625, "global_step": 128768, "epoch": 1064} {"train_loss": -37.5063591003418, "global_step": 128769, "epoch": 1064} {"train_loss": -35.50706100463867, "global_step": 128770, "epoch": 1064} {"train_loss": -37.02631759643555, "global_step": 128771, "epoch": 1064} {"train_loss": -38.021793365478516, "global_step": 128772, "epoch": 1064} {"train_loss": -38.09153366088867, "global_step": 128773, "epoch": 1064} {"train_loss": -38.46686935424805, "global_step": 128774, "epoch": 1064} {"train_loss": -36.588966369628906, "global_step": 128775, "epoch": 1064} {"train_loss": -38.36764144897461, "global_step": 128776, "epoch": 1064} {"train_loss": -38.5697021484375, "global_step": 128777, "epoch": 1064} {"train_loss": -37.36983871459961, "global_step": 128778, "epoch": 1064} {"train_loss": -38.37895584106445, "global_step": 128779, "epoch": 1064} {"train_loss": -38.4990119934082, "global_step": 128780, "epoch": 1064} {"train_loss": -38.775299072265625, "global_step": 128781, "epoch": 1064} {"train_loss": -38.258460998535156, "global_step": 128782, "epoch": 1064} {"train_loss": -36.900062561035156, "global_step": 128783, "epoch": 1064} {"train_loss": -37.34157180786133, "global_step": 128784, "epoch": 1064} {"train_loss": -37.78578567504883, "global_step": 128785, "epoch": 1064} {"train_loss": -39.04714584350586, "global_step": 128786, "epoch": 1064} {"train_loss": -37.5692138671875, "global_step": 128787, "epoch": 1064} {"train_loss": -37.8443717956543, "global_step": 128788, "epoch": 1064} {"train_loss": -38.39143753051758, "global_step": 128789, "epoch": 1064} {"train_loss": -35.138248443603516, "global_step": 128790, "epoch": 1064} {"train_loss": -37.91233825683594, "global_step": 128791, "epoch": 1064} {"train_loss": -38.33598709106445, "global_step": 128792, "epoch": 1064} {"train_loss": -38.41619873046875, "global_step": 128793, "epoch": 1064} {"train_loss": -38.8696403503418, "global_step": 128794, "epoch": 1064} {"train_loss": -36.16470718383789, "global_step": 128795, "epoch": 1064} {"train_loss": -37.12550735473633, "global_step": 128796, "epoch": 1064} {"train_loss": -38.68050003051758, "global_step": 128797, "epoch": 1064} {"train_loss": -38.53028869628906, "global_step": 128798, "epoch": 1064} {"train_loss": -38.152854919433594, "global_step": 128799, "epoch": 1064} {"train_loss": -38.379146575927734, "global_step": 128800, "epoch": 1064} {"train_loss": -38.73181915283203, "global_step": 128801, "epoch": 1064} {"train_loss": -37.761959075927734, "global_step": 128802, "epoch": 1064} {"train_loss": -38.944942474365234, "global_step": 128803, "epoch": 1064} {"train_loss": -38.03805923461914, "global_step": 128804, "epoch": 1064} {"train_loss": -37.91794967651367, "global_step": 128805, "epoch": 1064} {"train_loss": -37.9506721496582, "global_step": 128806, "epoch": 1064} {"train_loss": -38.777679443359375, "global_step": 128807, "epoch": 1064} {"train_loss": -37.177669525146484, "global_step": 128808, "epoch": 1064} {"train_loss": -38.46855545043945, "global_step": 128809, "epoch": 1064} {"train_loss": -38.304656982421875, "global_step": 128810, "epoch": 1064} {"train_loss": -37.544921875, "global_step": 128811, "epoch": 1064} {"train_loss": -38.96797180175781, "global_step": 128812, "epoch": 1064} {"train_loss": -38.951168060302734, "global_step": 128813, "epoch": 1064} {"train_loss": -38.89740753173828, "global_step": 128814, "epoch": 1064} {"train_loss": -38.95553207397461, "global_step": 128815, "epoch": 1064} {"train_loss": -38.71940231323242, "global_step": 128816, "epoch": 1064} {"train_loss": -38.512672424316406, "global_step": 128817, "epoch": 1064} {"train_loss": -38.778316497802734, "global_step": 128818, "epoch": 1064} {"train_loss": -38.34756088256836, "global_step": 128819, "epoch": 1064} {"train_loss": -39.255706787109375, "global_step": 128820, "epoch": 1064} {"train_loss": -38.36591339111328, "global_step": 128821, "epoch": 1064} {"train_loss": -39.00213623046875, "global_step": 128822, "epoch": 1064} {"train_loss": -38.592620849609375, "global_step": 128823, "epoch": 1064} {"train_loss": -39.14780807495117, "global_step": 128824, "epoch": 1064} {"train_loss": -39.22275924682617, "global_step": 128825, "epoch": 1064} {"train_loss": -38.20583724975586, "global_step": 128826, "epoch": 1064} {"train_loss": -39.2506103515625, "global_step": 128827, "epoch": 1064} {"train_loss": -38.214324951171875, "global_step": 128828, "epoch": 1064} {"train_loss": -38.959354400634766, "global_step": 128829, "epoch": 1064} {"train_loss": -39.08357620239258, "global_step": 128830, "epoch": 1064} {"train_loss": -38.74153518676758, "global_step": 128831, "epoch": 1064} {"train_loss": -39.31941223144531, "global_step": 128832, "epoch": 1064} {"train_loss": -38.86017990112305, "global_step": 128833, "epoch": 1064} {"train_loss": -39.23674392700195, "global_step": 128834, "epoch": 1064} {"train_loss": -38.76876449584961, "global_step": 128835, "epoch": 1064} {"train_loss": -38.307395935058594, "global_step": 128836, "epoch": 1064} {"train_loss": -39.25393295288086, "global_step": 128837, "epoch": 1064} {"train_loss": -38.12236785888672, "global_step": 128838, "epoch": 1064} {"train_loss": -39.34498977661133, "global_step": 128839, "epoch": 1064} {"train_loss": -39.3512077331543, "global_step": 128840, "epoch": 1064} {"train_loss": -39.76179885864258, "global_step": 128841, "epoch": 1064} {"train_loss": -39.22080612182617, "global_step": 128842, "epoch": 1064} {"train_loss": -39.97834014892578, "global_step": 128843, "epoch": 1064} {"train_loss": -38.40532684326172, "global_step": 128844, "epoch": 1064} {"train_loss": -39.67300033569336, "global_step": 128845, "epoch": 1064} {"train_loss": -39.83345413208008, "global_step": 128846, "epoch": 1064} {"train_loss": -40.036495208740234, "global_step": 128847, "epoch": 1064} {"train_loss": -39.52074432373047, "global_step": 128848, "epoch": 1064} {"train_loss": -39.44648361206055, "global_step": 128849, "epoch": 1064} {"train_loss": -39.10382080078125, "global_step": 128850, "epoch": 1064} {"train_loss": -39.42319869995117, "global_step": 128851, "epoch": 1064} {"train_loss": -39.97678756713867, "global_step": 128852, "epoch": 1064} {"train_loss": -38.31140899658203, "global_step": 128853, "epoch": 1064} {"train_loss": -38.567256927490234, "global_step": 128854, "epoch": 1064} {"train_loss": -37.6309928894043, "global_step": 128855, "epoch": 1064} {"train_loss": -35.625911712646484, "global_step": 128856, "epoch": 1064} {"train_loss": -34.30988693237305, "global_step": 128857, "epoch": 1064} {"train_loss": -38.085384368896484, "global_step": 128858, "epoch": 1064} {"train_loss": -39.28915786743164, "global_step": 128859, "epoch": 1064} {"train_loss": -37.86456298828125, "global_step": 128860, "epoch": 1064} {"train_loss": -36.855289459228516, "global_step": 128861, "epoch": 1064} {"train_loss": -39.03950119018555, "global_step": 128862, "epoch": 1064} {"train_loss": -38.972633361816406, "global_step": 128863, "epoch": 1064} {"train_loss": -38.298252042660046, "global_step": 128864, "epoch": 1064, "val_loss": 2709987.75} {"train_loss": -39.55537796020508, "global_step": 128865, "epoch": 1065} {"train_loss": -37.226741790771484, "global_step": 128866, "epoch": 1065} {"train_loss": -36.268287658691406, "global_step": 128867, "epoch": 1065} {"train_loss": -36.531105041503906, "global_step": 128868, "epoch": 1065} {"train_loss": -37.38296127319336, "global_step": 128869, "epoch": 1065} {"train_loss": -37.313133239746094, "global_step": 128870, "epoch": 1065} {"train_loss": -36.89320755004883, "global_step": 128871, "epoch": 1065} {"train_loss": -36.37226104736328, "global_step": 128872, "epoch": 1065} {"train_loss": -38.681190490722656, "global_step": 128873, "epoch": 1065} {"train_loss": -38.00595474243164, "global_step": 128874, "epoch": 1065} {"train_loss": -38.5610237121582, "global_step": 128875, "epoch": 1065} {"train_loss": -38.73264694213867, "global_step": 128876, "epoch": 1065} {"train_loss": -37.48482131958008, "global_step": 128877, "epoch": 1065} {"train_loss": -38.629737854003906, "global_step": 128878, "epoch": 1065} {"train_loss": -38.5095329284668, "global_step": 128879, "epoch": 1065} {"train_loss": -39.25990676879883, "global_step": 128880, "epoch": 1065} {"train_loss": -37.7469596862793, "global_step": 128881, "epoch": 1065} {"train_loss": -39.16724395751953, "global_step": 128882, "epoch": 1065} {"train_loss": -38.026153564453125, "global_step": 128883, "epoch": 1065} {"train_loss": -38.87769317626953, "global_step": 128884, "epoch": 1065} {"train_loss": -39.10161209106445, "global_step": 128885, "epoch": 1065} {"train_loss": -39.02393341064453, "global_step": 128886, "epoch": 1065} {"train_loss": -39.076904296875, "global_step": 128887, "epoch": 1065} {"train_loss": -39.650421142578125, "global_step": 128888, "epoch": 1065} {"train_loss": -38.86311340332031, "global_step": 128889, "epoch": 1065} {"train_loss": -39.665279388427734, "global_step": 128890, "epoch": 1065} {"train_loss": -39.21165466308594, "global_step": 128891, "epoch": 1065} {"train_loss": -38.094051361083984, "global_step": 128892, "epoch": 1065} {"train_loss": -39.422508239746094, "global_step": 128893, "epoch": 1065} {"train_loss": -39.157955169677734, "global_step": 128894, "epoch": 1065} {"train_loss": -38.72929763793945, "global_step": 128895, "epoch": 1065} {"train_loss": -39.568843841552734, "global_step": 128896, "epoch": 1065} {"train_loss": -39.6638298034668, "global_step": 128897, "epoch": 1065} {"train_loss": -39.647335052490234, "global_step": 128898, "epoch": 1065} {"train_loss": -39.38064956665039, "global_step": 128899, "epoch": 1065} {"train_loss": -39.71322250366211, "global_step": 128900, "epoch": 1065} {"train_loss": -39.50822067260742, "global_step": 128901, "epoch": 1065} {"train_loss": -39.74726486206055, "global_step": 128902, "epoch": 1065} {"train_loss": -39.70779800415039, "global_step": 128903, "epoch": 1065} {"train_loss": -39.44517517089844, "global_step": 128904, "epoch": 1065} {"train_loss": -39.814971923828125, "global_step": 128905, "epoch": 1065} {"train_loss": -40.068599700927734, "global_step": 128906, "epoch": 1065} {"train_loss": -39.44076156616211, "global_step": 128907, "epoch": 1065} {"train_loss": -40.2174186706543, "global_step": 128908, "epoch": 1065} {"train_loss": -40.121273040771484, "global_step": 128909, "epoch": 1065} {"train_loss": -39.92080307006836, "global_step": 128910, "epoch": 1065} {"train_loss": -38.88890075683594, "global_step": 128911, "epoch": 1065} {"train_loss": -39.8781623840332, "global_step": 128912, "epoch": 1065} {"train_loss": -39.573875427246094, "global_step": 128913, "epoch": 1065} {"train_loss": -40.33736038208008, "global_step": 128914, "epoch": 1065} {"train_loss": -40.75779342651367, "global_step": 128915, "epoch": 1065} {"train_loss": -39.8233528137207, "global_step": 128916, "epoch": 1065} {"train_loss": -39.9470329284668, "global_step": 128917, "epoch": 1065} {"train_loss": -38.984832763671875, "global_step": 128918, "epoch": 1065} {"train_loss": -37.73048400878906, "global_step": 128919, "epoch": 1065} {"train_loss": -36.47159957885742, "global_step": 128920, "epoch": 1065} {"train_loss": -33.80984115600586, "global_step": 128921, "epoch": 1065} {"train_loss": -33.46140670776367, "global_step": 128922, "epoch": 1065} {"train_loss": -25.31166648864746, "global_step": 128923, "epoch": 1065} {"train_loss": -25.446630477905273, "global_step": 128924, "epoch": 1065} {"train_loss": -38.702152252197266, "global_step": 128925, "epoch": 1065} {"train_loss": -33.88274002075195, "global_step": 128926, "epoch": 1065} {"train_loss": -35.421852111816406, "global_step": 128927, "epoch": 1065} {"train_loss": -38.2789192199707, "global_step": 128928, "epoch": 1065} {"train_loss": -33.70550537109375, "global_step": 128929, "epoch": 1065} {"train_loss": -38.1073112487793, "global_step": 128930, "epoch": 1065} {"train_loss": -35.793373107910156, "global_step": 128931, "epoch": 1065} {"train_loss": -36.714141845703125, "global_step": 128932, "epoch": 1065} {"train_loss": -37.218563079833984, "global_step": 128933, "epoch": 1065} {"train_loss": -38.34028244018555, "global_step": 128934, "epoch": 1065} {"train_loss": -37.56886291503906, "global_step": 128935, "epoch": 1065} {"train_loss": -38.54526901245117, "global_step": 128936, "epoch": 1065} {"train_loss": -37.95606231689453, "global_step": 128937, "epoch": 1065} {"train_loss": -39.16686248779297, "global_step": 128938, "epoch": 1065} {"train_loss": -37.85503005981445, "global_step": 128939, "epoch": 1065} {"train_loss": -39.25326156616211, "global_step": 128940, "epoch": 1065} {"train_loss": -37.9284782409668, "global_step": 128941, "epoch": 1065} {"train_loss": -39.6131706237793, "global_step": 128942, "epoch": 1065} {"train_loss": -38.81085968017578, "global_step": 128943, "epoch": 1065} {"train_loss": -38.310245513916016, "global_step": 128944, "epoch": 1065} {"train_loss": -39.481685638427734, "global_step": 128945, "epoch": 1065} {"train_loss": -38.450191497802734, "global_step": 128946, "epoch": 1065} {"train_loss": -37.804176330566406, "global_step": 128947, "epoch": 1065} {"train_loss": -38.71072006225586, "global_step": 128948, "epoch": 1065} {"train_loss": -38.297054290771484, "global_step": 128949, "epoch": 1065} {"train_loss": -38.335968017578125, "global_step": 128950, "epoch": 1065} {"train_loss": -38.52606201171875, "global_step": 128951, "epoch": 1065} {"train_loss": -37.982452392578125, "global_step": 128952, "epoch": 1065} {"train_loss": -39.214691162109375, "global_step": 128953, "epoch": 1065} {"train_loss": -38.220436096191406, "global_step": 128954, "epoch": 1065} {"train_loss": -39.466064453125, "global_step": 128955, "epoch": 1065} {"train_loss": -38.63313674926758, "global_step": 128956, "epoch": 1065} {"train_loss": -38.84543991088867, "global_step": 128957, "epoch": 1065} {"train_loss": -38.93333053588867, "global_step": 128958, "epoch": 1065} {"train_loss": -38.87998580932617, "global_step": 128959, "epoch": 1065} {"train_loss": -35.801151275634766, "global_step": 128960, "epoch": 1065} {"train_loss": -39.238677978515625, "global_step": 128961, "epoch": 1065} {"train_loss": -39.40500259399414, "global_step": 128962, "epoch": 1065} {"train_loss": -39.53132247924805, "global_step": 128963, "epoch": 1065} {"train_loss": -38.767120361328125, "global_step": 128964, "epoch": 1065} {"train_loss": -38.72641372680664, "global_step": 128965, "epoch": 1065} {"train_loss": -38.80416488647461, "global_step": 128966, "epoch": 1065} {"train_loss": -38.17781448364258, "global_step": 128967, "epoch": 1065} {"train_loss": -39.372833251953125, "global_step": 128968, "epoch": 1065} {"train_loss": -39.461212158203125, "global_step": 128969, "epoch": 1065} {"train_loss": -38.456825256347656, "global_step": 128970, "epoch": 1065} {"train_loss": -38.48200988769531, "global_step": 128971, "epoch": 1065} {"train_loss": -39.18974685668945, "global_step": 128972, "epoch": 1065} {"train_loss": -39.239601135253906, "global_step": 128973, "epoch": 1065} {"train_loss": -39.951778411865234, "global_step": 128974, "epoch": 1065} {"train_loss": -39.48579788208008, "global_step": 128975, "epoch": 1065} {"train_loss": -37.85866165161133, "global_step": 128976, "epoch": 1065} {"train_loss": -39.57569122314453, "global_step": 128977, "epoch": 1065} {"train_loss": -39.52167510986328, "global_step": 128978, "epoch": 1065} {"train_loss": -38.59056091308594, "global_step": 128979, "epoch": 1065} {"train_loss": -39.88624954223633, "global_step": 128980, "epoch": 1065} {"train_loss": -38.37355422973633, "global_step": 128981, "epoch": 1065} {"train_loss": -39.97966384887695, "global_step": 128982, "epoch": 1065} {"train_loss": -39.02293014526367, "global_step": 128983, "epoch": 1065} {"train_loss": -39.146095275878906, "global_step": 128984, "epoch": 1065} {"train_loss": -38.33492080436265, "global_step": 128985, "epoch": 1065, "val_loss": 4033721.75} {"train_loss": -38.75963592529297, "global_step": 128986, "epoch": 1066} {"train_loss": -38.46159744262695, "global_step": 128987, "epoch": 1066} {"train_loss": -38.41624069213867, "global_step": 128988, "epoch": 1066} {"train_loss": -38.361053466796875, "global_step": 128989, "epoch": 1066} {"train_loss": -37.405086517333984, "global_step": 128990, "epoch": 1066} {"train_loss": -37.30265426635742, "global_step": 128991, "epoch": 1066} {"train_loss": -37.56991195678711, "global_step": 128992, "epoch": 1066} {"train_loss": -38.617103576660156, "global_step": 128993, "epoch": 1066} {"train_loss": -38.8838996887207, "global_step": 128994, "epoch": 1066} {"train_loss": -37.80623245239258, "global_step": 128995, "epoch": 1066} {"train_loss": -37.40536117553711, "global_step": 128996, "epoch": 1066} {"train_loss": -36.82073211669922, "global_step": 128997, "epoch": 1066} {"train_loss": -39.128536224365234, "global_step": 128998, "epoch": 1066} {"train_loss": -39.262020111083984, "global_step": 128999, "epoch": 1066} {"train_loss": -39.059181213378906, "global_step": 129000, "epoch": 1066} {"train_loss": -38.1232795715332, "global_step": 129001, "epoch": 1066} {"train_loss": -38.86638259887695, "global_step": 129002, "epoch": 1066} {"train_loss": -38.90787887573242, "global_step": 129003, "epoch": 1066} {"train_loss": -38.83312225341797, "global_step": 129004, "epoch": 1066} {"train_loss": -38.879371643066406, "global_step": 129005, "epoch": 1066} {"train_loss": -39.901954650878906, "global_step": 129006, "epoch": 1066} {"train_loss": -39.01226043701172, "global_step": 129007, "epoch": 1066} {"train_loss": -38.0567741394043, "global_step": 129008, "epoch": 1066} {"train_loss": -39.14136505126953, "global_step": 129009, "epoch": 1066} {"train_loss": -38.700416564941406, "global_step": 129010, "epoch": 1066} {"train_loss": -39.307655334472656, "global_step": 129011, "epoch": 1066} {"train_loss": -35.875938415527344, "global_step": 129012, "epoch": 1066} {"train_loss": -38.8143310546875, "global_step": 129013, "epoch": 1066} {"train_loss": -39.90097427368164, "global_step": 129014, "epoch": 1066} {"train_loss": -39.581295013427734, "global_step": 129015, "epoch": 1066} {"train_loss": -39.38585662841797, "global_step": 129016, "epoch": 1066} {"train_loss": -39.29977798461914, "global_step": 129017, "epoch": 1066} {"train_loss": -39.1182975769043, "global_step": 129018, "epoch": 1066} {"train_loss": -39.39580154418945, "global_step": 129019, "epoch": 1066} {"train_loss": -37.364463806152344, "global_step": 129020, "epoch": 1066} {"train_loss": -39.30880355834961, "global_step": 129021, "epoch": 1066} {"train_loss": -39.51123809814453, "global_step": 129022, "epoch": 1066} {"train_loss": -39.2695198059082, "global_step": 129023, "epoch": 1066} {"train_loss": -39.905120849609375, "global_step": 129024, "epoch": 1066} {"train_loss": -40.09457015991211, "global_step": 129025, "epoch": 1066} {"train_loss": -40.039058685302734, "global_step": 129026, "epoch": 1066} {"train_loss": -38.28597640991211, "global_step": 129027, "epoch": 1066} {"train_loss": -40.04747009277344, "global_step": 129028, "epoch": 1066} {"train_loss": -39.8075065612793, "global_step": 129029, "epoch": 1066} {"train_loss": -39.63375473022461, "global_step": 129030, "epoch": 1066} {"train_loss": -40.17739486694336, "global_step": 129031, "epoch": 1066} {"train_loss": -39.111263275146484, "global_step": 129032, "epoch": 1066} {"train_loss": -39.58536911010742, "global_step": 129033, "epoch": 1066} {"train_loss": -38.72439193725586, "global_step": 129034, "epoch": 1066} {"train_loss": -39.67645263671875, "global_step": 129035, "epoch": 1066} {"train_loss": -39.64865493774414, "global_step": 129036, "epoch": 1066} {"train_loss": -38.76469039916992, "global_step": 129037, "epoch": 1066} {"train_loss": -39.64083480834961, "global_step": 129038, "epoch": 1066} {"train_loss": -39.71541213989258, "global_step": 129039, "epoch": 1066} {"train_loss": -40.037269592285156, "global_step": 129040, "epoch": 1066} {"train_loss": -39.673458099365234, "global_step": 129041, "epoch": 1066} {"train_loss": -39.94840621948242, "global_step": 129042, "epoch": 1066} {"train_loss": -40.080162048339844, "global_step": 129043, "epoch": 1066} {"train_loss": -39.86532211303711, "global_step": 129044, "epoch": 1066} {"train_loss": -40.23512649536133, "global_step": 129045, "epoch": 1066} {"train_loss": -39.339290618896484, "global_step": 129046, "epoch": 1066} {"train_loss": -38.09431457519531, "global_step": 129047, "epoch": 1066} {"train_loss": -34.038089752197266, "global_step": 129048, "epoch": 1066} {"train_loss": -26.71990966796875, "global_step": 129049, "epoch": 1066} {"train_loss": -32.6239013671875, "global_step": 129050, "epoch": 1066} {"train_loss": -36.63532638549805, "global_step": 129051, "epoch": 1066} {"train_loss": -37.358455657958984, "global_step": 129052, "epoch": 1066} {"train_loss": -32.439231872558594, "global_step": 129053, "epoch": 1066} {"train_loss": -38.51826477050781, "global_step": 129054, "epoch": 1066} {"train_loss": -35.033180236816406, "global_step": 129055, "epoch": 1066} {"train_loss": -34.629486083984375, "global_step": 129056, "epoch": 1066} {"train_loss": -38.0095329284668, "global_step": 129057, "epoch": 1066} {"train_loss": -34.815765380859375, "global_step": 129058, "epoch": 1066} {"train_loss": -38.16652297973633, "global_step": 129059, "epoch": 1066} {"train_loss": -32.87583923339844, "global_step": 129060, "epoch": 1066} {"train_loss": -38.052467346191406, "global_step": 129061, "epoch": 1066} {"train_loss": -34.119808197021484, "global_step": 129062, "epoch": 1066} {"train_loss": -36.339454650878906, "global_step": 129063, "epoch": 1066} {"train_loss": -37.46707534790039, "global_step": 129064, "epoch": 1066} {"train_loss": -36.96353530883789, "global_step": 129065, "epoch": 1066} {"train_loss": -38.98011779785156, "global_step": 129066, "epoch": 1066} {"train_loss": -36.868324279785156, "global_step": 129067, "epoch": 1066} {"train_loss": -38.213558197021484, "global_step": 129068, "epoch": 1066} {"train_loss": -37.24285888671875, "global_step": 129069, "epoch": 1066} {"train_loss": -36.82973861694336, "global_step": 129070, "epoch": 1066} {"train_loss": -38.20283126831055, "global_step": 129071, "epoch": 1066} {"train_loss": -37.816158294677734, "global_step": 129072, "epoch": 1066} {"train_loss": -37.733619689941406, "global_step": 129073, "epoch": 1066} {"train_loss": -38.148597717285156, "global_step": 129074, "epoch": 1066} {"train_loss": -36.59099197387695, "global_step": 129075, "epoch": 1066} {"train_loss": -38.044185638427734, "global_step": 129076, "epoch": 1066} {"train_loss": -38.40529251098633, "global_step": 129077, "epoch": 1066} {"train_loss": -36.950439453125, "global_step": 129078, "epoch": 1066} {"train_loss": -37.9301872253418, "global_step": 129079, "epoch": 1066} {"train_loss": -38.80349349975586, "global_step": 129080, "epoch": 1066} {"train_loss": -38.73609161376953, "global_step": 129081, "epoch": 1066} {"train_loss": -38.00371551513672, "global_step": 129082, "epoch": 1066} {"train_loss": -38.27256393432617, "global_step": 129083, "epoch": 1066} {"train_loss": -38.927734375, "global_step": 129084, "epoch": 1066} {"train_loss": -38.85892105102539, "global_step": 129085, "epoch": 1066} {"train_loss": -39.2163200378418, "global_step": 129086, "epoch": 1066} {"train_loss": -38.828487396240234, "global_step": 129087, "epoch": 1066} {"train_loss": -37.34803009033203, "global_step": 129088, "epoch": 1066} {"train_loss": -38.77693557739258, "global_step": 129089, "epoch": 1066} {"train_loss": -38.566226959228516, "global_step": 129090, "epoch": 1066} {"train_loss": -38.72188186645508, "global_step": 129091, "epoch": 1066} {"train_loss": -39.26467514038086, "global_step": 129092, "epoch": 1066} {"train_loss": -38.90584945678711, "global_step": 129093, "epoch": 1066} {"train_loss": -39.0811653137207, "global_step": 129094, "epoch": 1066} {"train_loss": -38.7132682800293, "global_step": 129095, "epoch": 1066} {"train_loss": -39.039306640625, "global_step": 129096, "epoch": 1066} {"train_loss": -38.61300277709961, "global_step": 129097, "epoch": 1066} {"train_loss": -38.020103454589844, "global_step": 129098, "epoch": 1066} {"train_loss": -38.047542572021484, "global_step": 129099, "epoch": 1066} {"train_loss": -38.907894134521484, "global_step": 129100, "epoch": 1066} {"train_loss": -38.70094680786133, "global_step": 129101, "epoch": 1066} {"train_loss": -39.50105667114258, "global_step": 129102, "epoch": 1066} {"train_loss": -39.125728607177734, "global_step": 129103, "epoch": 1066} {"train_loss": -39.138553619384766, "global_step": 129104, "epoch": 1066} {"train_loss": -39.099239349365234, "global_step": 129105, "epoch": 1066} {"train_loss": -38.23673226222519, "global_step": 129106, "epoch": 1066, "val_loss": 2618900.0} {"train_loss": -39.68653869628906, "global_step": 129107, "epoch": 1067} {"train_loss": -38.958282470703125, "global_step": 129108, "epoch": 1067} {"train_loss": -38.64164733886719, "global_step": 129109, "epoch": 1067} {"train_loss": -39.8394660949707, "global_step": 129110, "epoch": 1067} {"train_loss": -38.82345199584961, "global_step": 129111, "epoch": 1067} {"train_loss": -39.14759063720703, "global_step": 129112, "epoch": 1067} {"train_loss": -39.56582260131836, "global_step": 129113, "epoch": 1067} {"train_loss": -39.3636360168457, "global_step": 129114, "epoch": 1067} {"train_loss": -39.47621154785156, "global_step": 129115, "epoch": 1067} {"train_loss": -40.088558197021484, "global_step": 129116, "epoch": 1067} {"train_loss": -39.02374267578125, "global_step": 129117, "epoch": 1067} {"train_loss": -38.09734344482422, "global_step": 129118, "epoch": 1067} {"train_loss": -38.627174377441406, "global_step": 129119, "epoch": 1067} {"train_loss": -39.678192138671875, "global_step": 129120, "epoch": 1067} {"train_loss": -40.01154708862305, "global_step": 129121, "epoch": 1067} {"train_loss": -39.659515380859375, "global_step": 129122, "epoch": 1067} {"train_loss": -40.195003509521484, "global_step": 129123, "epoch": 1067} {"train_loss": -38.96247863769531, "global_step": 129124, "epoch": 1067} {"train_loss": -39.47478103637695, "global_step": 129125, "epoch": 1067} {"train_loss": -38.94296646118164, "global_step": 129126, "epoch": 1067} {"train_loss": -39.38916778564453, "global_step": 129127, "epoch": 1067} {"train_loss": -37.50263595581055, "global_step": 129128, "epoch": 1067} {"train_loss": -38.74665832519531, "global_step": 129129, "epoch": 1067} {"train_loss": -40.089603424072266, "global_step": 129130, "epoch": 1067} {"train_loss": -38.43923568725586, "global_step": 129131, "epoch": 1067} {"train_loss": -38.4605827331543, "global_step": 129132, "epoch": 1067} {"train_loss": -38.31949234008789, "global_step": 129133, "epoch": 1067} {"train_loss": -38.287452697753906, "global_step": 129134, "epoch": 1067} {"train_loss": -39.78606033325195, "global_step": 129135, "epoch": 1067} {"train_loss": -38.90458297729492, "global_step": 129136, "epoch": 1067} {"train_loss": -40.2991943359375, "global_step": 129137, "epoch": 1067} {"train_loss": -39.472835540771484, "global_step": 129138, "epoch": 1067} {"train_loss": -35.99026107788086, "global_step": 129139, "epoch": 1067} {"train_loss": -35.368221282958984, "global_step": 129140, "epoch": 1067} {"train_loss": -31.375268936157227, "global_step": 129141, "epoch": 1067} {"train_loss": -34.04029083251953, "global_step": 129142, "epoch": 1067} {"train_loss": -38.10641098022461, "global_step": 129143, "epoch": 1067} {"train_loss": -39.471370697021484, "global_step": 129144, "epoch": 1067} {"train_loss": -34.66933822631836, "global_step": 129145, "epoch": 1067} {"train_loss": -35.70418167114258, "global_step": 129146, "epoch": 1067} {"train_loss": -38.452613830566406, "global_step": 129147, "epoch": 1067} {"train_loss": -37.428192138671875, "global_step": 129148, "epoch": 1067} {"train_loss": -37.47467803955078, "global_step": 129149, "epoch": 1067} {"train_loss": -38.236244201660156, "global_step": 129150, "epoch": 1067} {"train_loss": -37.41025924682617, "global_step": 129151, "epoch": 1067} {"train_loss": -33.93733596801758, "global_step": 129152, "epoch": 1067} {"train_loss": -37.889068603515625, "global_step": 129153, "epoch": 1067} {"train_loss": -35.59302520751953, "global_step": 129154, "epoch": 1067} {"train_loss": -36.70304489135742, "global_step": 129155, "epoch": 1067} {"train_loss": -37.54054641723633, "global_step": 129156, "epoch": 1067} {"train_loss": -38.25518035888672, "global_step": 129157, "epoch": 1067} {"train_loss": -36.450958251953125, "global_step": 129158, "epoch": 1067} {"train_loss": -38.068660736083984, "global_step": 129159, "epoch": 1067} {"train_loss": -36.90604782104492, "global_step": 129160, "epoch": 1067} {"train_loss": -37.51105880737305, "global_step": 129161, "epoch": 1067} {"train_loss": -37.8565559387207, "global_step": 129162, "epoch": 1067} {"train_loss": -33.25433349609375, "global_step": 129163, "epoch": 1067} {"train_loss": -38.058021545410156, "global_step": 129164, "epoch": 1067} {"train_loss": -37.682613372802734, "global_step": 129165, "epoch": 1067} {"train_loss": -37.648189544677734, "global_step": 129166, "epoch": 1067} {"train_loss": -37.29204559326172, "global_step": 129167, "epoch": 1067} {"train_loss": -37.76507568359375, "global_step": 129168, "epoch": 1067} {"train_loss": -37.88786315917969, "global_step": 129169, "epoch": 1067} {"train_loss": -36.278419494628906, "global_step": 129170, "epoch": 1067} {"train_loss": -37.88300704956055, "global_step": 129171, "epoch": 1067} {"train_loss": -38.23279571533203, "global_step": 129172, "epoch": 1067} {"train_loss": -35.580020904541016, "global_step": 129173, "epoch": 1067} {"train_loss": -32.29541015625, "global_step": 129174, "epoch": 1067} {"train_loss": -36.599857330322266, "global_step": 129175, "epoch": 1067} {"train_loss": -38.535518646240234, "global_step": 129176, "epoch": 1067} {"train_loss": -37.09440231323242, "global_step": 129177, "epoch": 1067} {"train_loss": -35.14131164550781, "global_step": 129178, "epoch": 1067} {"train_loss": -33.84171676635742, "global_step": 129179, "epoch": 1067} {"train_loss": -37.984676361083984, "global_step": 129180, "epoch": 1067} {"train_loss": -38.28987503051758, "global_step": 129181, "epoch": 1067} {"train_loss": -36.53983688354492, "global_step": 129182, "epoch": 1067} {"train_loss": -36.607112884521484, "global_step": 129183, "epoch": 1067} {"train_loss": -32.79327392578125, "global_step": 129184, "epoch": 1067} {"train_loss": -37.355342864990234, "global_step": 129185, "epoch": 1067} {"train_loss": -38.2126579284668, "global_step": 129186, "epoch": 1067} {"train_loss": -37.33543395996094, "global_step": 129187, "epoch": 1067} {"train_loss": -36.68650436401367, "global_step": 129188, "epoch": 1067} {"train_loss": -37.23142623901367, "global_step": 129189, "epoch": 1067} {"train_loss": -37.432472229003906, "global_step": 129190, "epoch": 1067} {"train_loss": -36.14502716064453, "global_step": 129191, "epoch": 1067} {"train_loss": -34.890769958496094, "global_step": 129192, "epoch": 1067} {"train_loss": -37.1737174987793, "global_step": 129193, "epoch": 1067} {"train_loss": -38.10276412963867, "global_step": 129194, "epoch": 1067} {"train_loss": -37.32682418823242, "global_step": 129195, "epoch": 1067} {"train_loss": -37.752315521240234, "global_step": 129196, "epoch": 1067} {"train_loss": -37.77712631225586, "global_step": 129197, "epoch": 1067} {"train_loss": -38.182586669921875, "global_step": 129198, "epoch": 1067} {"train_loss": -38.10040283203125, "global_step": 129199, "epoch": 1067} {"train_loss": -38.12586975097656, "global_step": 129200, "epoch": 1067} {"train_loss": -37.916282653808594, "global_step": 129201, "epoch": 1067} {"train_loss": -37.611175537109375, "global_step": 129202, "epoch": 1067} {"train_loss": -37.575531005859375, "global_step": 129203, "epoch": 1067} {"train_loss": -38.17656326293945, "global_step": 129204, "epoch": 1067} {"train_loss": -37.37125778198242, "global_step": 129205, "epoch": 1067} {"train_loss": -38.20815658569336, "global_step": 129206, "epoch": 1067} {"train_loss": -37.714698791503906, "global_step": 129207, "epoch": 1067} {"train_loss": -36.81443405151367, "global_step": 129208, "epoch": 1067} {"train_loss": -38.29680252075195, "global_step": 129209, "epoch": 1067} {"train_loss": -37.96343994140625, "global_step": 129210, "epoch": 1067} {"train_loss": -37.21522903442383, "global_step": 129211, "epoch": 1067} {"train_loss": -37.2472038269043, "global_step": 129212, "epoch": 1067} {"train_loss": -38.37766647338867, "global_step": 129213, "epoch": 1067} {"train_loss": -39.031341552734375, "global_step": 129214, "epoch": 1067} {"train_loss": -38.268558502197266, "global_step": 129215, "epoch": 1067} {"train_loss": -39.2615966796875, "global_step": 129216, "epoch": 1067} {"train_loss": -38.88149642944336, "global_step": 129217, "epoch": 1067} {"train_loss": -38.63615798950195, "global_step": 129218, "epoch": 1067} {"train_loss": -38.93859100341797, "global_step": 129219, "epoch": 1067} {"train_loss": -39.187992095947266, "global_step": 129220, "epoch": 1067} {"train_loss": -38.76043701171875, "global_step": 129221, "epoch": 1067} {"train_loss": -38.71175003051758, "global_step": 129222, "epoch": 1067} {"train_loss": -38.899742126464844, "global_step": 129223, "epoch": 1067} {"train_loss": -39.378395080566406, "global_step": 129224, "epoch": 1067} {"train_loss": -38.741756439208984, "global_step": 129225, "epoch": 1067} {"train_loss": -39.06638717651367, "global_step": 129226, "epoch": 1067} {"train_loss": -37.77523089637441, "global_step": 129227, "epoch": 1067, "val_loss": 2764033.25} {"train_loss": -39.0281982421875, "global_step": 129228, "epoch": 1068} {"train_loss": -38.57750701904297, "global_step": 129229, "epoch": 1068} {"train_loss": -38.870182037353516, "global_step": 129230, "epoch": 1068} {"train_loss": -38.6279296875, "global_step": 129231, "epoch": 1068} {"train_loss": -38.94585037231445, "global_step": 129232, "epoch": 1068} {"train_loss": -38.94416046142578, "global_step": 129233, "epoch": 1068} {"train_loss": -38.78715133666992, "global_step": 129234, "epoch": 1068} {"train_loss": -39.63271713256836, "global_step": 129235, "epoch": 1068} {"train_loss": -38.875099182128906, "global_step": 129236, "epoch": 1068} {"train_loss": -39.08976364135742, "global_step": 129237, "epoch": 1068} {"train_loss": -38.46882629394531, "global_step": 129238, "epoch": 1068} {"train_loss": -39.019752502441406, "global_step": 129239, "epoch": 1068} {"train_loss": -38.60786056518555, "global_step": 129240, "epoch": 1068} {"train_loss": -38.91923141479492, "global_step": 129241, "epoch": 1068} {"train_loss": -38.91056442260742, "global_step": 129242, "epoch": 1068} {"train_loss": -39.7404670715332, "global_step": 129243, "epoch": 1068} {"train_loss": -38.29225158691406, "global_step": 129244, "epoch": 1068} {"train_loss": -38.50849533081055, "global_step": 129245, "epoch": 1068} {"train_loss": -39.354705810546875, "global_step": 129246, "epoch": 1068} {"train_loss": -38.76935577392578, "global_step": 129247, "epoch": 1068} {"train_loss": -39.44175338745117, "global_step": 129248, "epoch": 1068} {"train_loss": -38.983089447021484, "global_step": 129249, "epoch": 1068} {"train_loss": -39.966182708740234, "global_step": 129250, "epoch": 1068} {"train_loss": -39.350650787353516, "global_step": 129251, "epoch": 1068} {"train_loss": -39.825927734375, "global_step": 129252, "epoch": 1068} {"train_loss": -39.40895462036133, "global_step": 129253, "epoch": 1068} {"train_loss": -39.38970947265625, "global_step": 129254, "epoch": 1068} {"train_loss": -39.2507209777832, "global_step": 129255, "epoch": 1068} {"train_loss": -39.97913360595703, "global_step": 129256, "epoch": 1068} {"train_loss": -39.293392181396484, "global_step": 129257, "epoch": 1068} {"train_loss": -38.32943344116211, "global_step": 129258, "epoch": 1068} {"train_loss": -39.84648513793945, "global_step": 129259, "epoch": 1068} {"train_loss": -38.5253791809082, "global_step": 129260, "epoch": 1068} {"train_loss": -39.16691207885742, "global_step": 129261, "epoch": 1068} {"train_loss": -39.420597076416016, "global_step": 129262, "epoch": 1068} {"train_loss": -38.56016540527344, "global_step": 129263, "epoch": 1068} {"train_loss": -38.944488525390625, "global_step": 129264, "epoch": 1068} {"train_loss": -38.900875091552734, "global_step": 129265, "epoch": 1068} {"train_loss": -38.38153076171875, "global_step": 129266, "epoch": 1068} {"train_loss": -38.556758880615234, "global_step": 129267, "epoch": 1068} {"train_loss": -38.32357406616211, "global_step": 129268, "epoch": 1068} {"train_loss": -39.00642776489258, "global_step": 129269, "epoch": 1068} {"train_loss": -39.17920684814453, "global_step": 129270, "epoch": 1068} {"train_loss": -38.6434211730957, "global_step": 129271, "epoch": 1068} {"train_loss": -38.98170852661133, "global_step": 129272, "epoch": 1068} {"train_loss": -38.07117462158203, "global_step": 129273, "epoch": 1068} {"train_loss": -37.8197135925293, "global_step": 129274, "epoch": 1068} {"train_loss": -38.555965423583984, "global_step": 129275, "epoch": 1068} {"train_loss": -39.30317306518555, "global_step": 129276, "epoch": 1068} {"train_loss": -38.981605529785156, "global_step": 129277, "epoch": 1068} {"train_loss": -38.2357292175293, "global_step": 129278, "epoch": 1068} {"train_loss": -37.17985916137695, "global_step": 129279, "epoch": 1068} {"train_loss": -37.622074127197266, "global_step": 129280, "epoch": 1068} {"train_loss": -38.2753791809082, "global_step": 129281, "epoch": 1068} {"train_loss": -37.85102462768555, "global_step": 129282, "epoch": 1068} {"train_loss": -38.06040573120117, "global_step": 129283, "epoch": 1068} {"train_loss": -38.09395980834961, "global_step": 129284, "epoch": 1068} {"train_loss": -38.222042083740234, "global_step": 129285, "epoch": 1068} {"train_loss": -38.01969528198242, "global_step": 129286, "epoch": 1068} {"train_loss": -39.862144470214844, "global_step": 129287, "epoch": 1068} {"train_loss": -38.449790954589844, "global_step": 129288, "epoch": 1068} {"train_loss": -38.19001007080078, "global_step": 129289, "epoch": 1068} {"train_loss": -38.44684600830078, "global_step": 129290, "epoch": 1068} {"train_loss": -39.200496673583984, "global_step": 129291, "epoch": 1068} {"train_loss": -36.78566360473633, "global_step": 129292, "epoch": 1068} {"train_loss": -38.76253128051758, "global_step": 129293, "epoch": 1068} {"train_loss": -39.339256286621094, "global_step": 129294, "epoch": 1068} {"train_loss": -39.408843994140625, "global_step": 129295, "epoch": 1068} {"train_loss": -39.089725494384766, "global_step": 129296, "epoch": 1068} {"train_loss": -36.32266616821289, "global_step": 129297, "epoch": 1068} {"train_loss": -39.9144401550293, "global_step": 129298, "epoch": 1068} {"train_loss": -37.61135482788086, "global_step": 129299, "epoch": 1068} {"train_loss": -39.4886589050293, "global_step": 129300, "epoch": 1068} {"train_loss": -37.90724182128906, "global_step": 129301, "epoch": 1068} {"train_loss": -39.48032760620117, "global_step": 129302, "epoch": 1068} {"train_loss": -38.798248291015625, "global_step": 129303, "epoch": 1068} {"train_loss": -37.58406448364258, "global_step": 129304, "epoch": 1068} {"train_loss": -37.670345306396484, "global_step": 129305, "epoch": 1068} {"train_loss": -38.66789245605469, "global_step": 129306, "epoch": 1068} {"train_loss": -38.15705490112305, "global_step": 129307, "epoch": 1068} {"train_loss": -38.0378532409668, "global_step": 129308, "epoch": 1068} {"train_loss": -39.178035736083984, "global_step": 129309, "epoch": 1068} {"train_loss": -39.737911224365234, "global_step": 129310, "epoch": 1068} {"train_loss": -38.69247055053711, "global_step": 129311, "epoch": 1068} {"train_loss": -39.07073974609375, "global_step": 129312, "epoch": 1068} {"train_loss": -39.21772384643555, "global_step": 129313, "epoch": 1068} {"train_loss": -38.770118713378906, "global_step": 129314, "epoch": 1068} {"train_loss": -38.43449020385742, "global_step": 129315, "epoch": 1068} {"train_loss": -40.00595474243164, "global_step": 129316, "epoch": 1068} {"train_loss": -39.25149154663086, "global_step": 129317, "epoch": 1068} {"train_loss": -39.213043212890625, "global_step": 129318, "epoch": 1068} {"train_loss": -34.36677169799805, "global_step": 129319, "epoch": 1068} {"train_loss": -39.00100326538086, "global_step": 129320, "epoch": 1068} {"train_loss": -39.74891662597656, "global_step": 129321, "epoch": 1068} {"train_loss": -39.190765380859375, "global_step": 129322, "epoch": 1068} {"train_loss": -39.39984130859375, "global_step": 129323, "epoch": 1068} {"train_loss": -39.56504821777344, "global_step": 129324, "epoch": 1068} {"train_loss": -38.96633529663086, "global_step": 129325, "epoch": 1068} {"train_loss": -39.24558639526367, "global_step": 129326, "epoch": 1068} {"train_loss": -38.62750244140625, "global_step": 129327, "epoch": 1068} {"train_loss": -39.395633697509766, "global_step": 129328, "epoch": 1068} {"train_loss": -38.117061614990234, "global_step": 129329, "epoch": 1068} {"train_loss": -39.07085037231445, "global_step": 129330, "epoch": 1068} {"train_loss": -38.91932678222656, "global_step": 129331, "epoch": 1068} {"train_loss": -39.09109878540039, "global_step": 129332, "epoch": 1068} {"train_loss": -37.94845199584961, "global_step": 129333, "epoch": 1068} {"train_loss": -37.38799285888672, "global_step": 129334, "epoch": 1068} {"train_loss": -39.0598030090332, "global_step": 129335, "epoch": 1068} {"train_loss": -38.89823913574219, "global_step": 129336, "epoch": 1068} {"train_loss": -38.32509994506836, "global_step": 129337, "epoch": 1068} {"train_loss": -38.39203643798828, "global_step": 129338, "epoch": 1068} {"train_loss": -39.20492172241211, "global_step": 129339, "epoch": 1068} {"train_loss": -37.766109466552734, "global_step": 129340, "epoch": 1068} {"train_loss": -38.030723571777344, "global_step": 129341, "epoch": 1068} {"train_loss": -39.90509033203125, "global_step": 129342, "epoch": 1068} {"train_loss": -38.72193145751953, "global_step": 129343, "epoch": 1068} {"train_loss": -38.667884826660156, "global_step": 129344, "epoch": 1068} {"train_loss": -40.087223052978516, "global_step": 129345, "epoch": 1068} {"train_loss": -38.91328048706055, "global_step": 129346, "epoch": 1068} {"train_loss": -39.61262893676758, "global_step": 129347, "epoch": 1068} {"train_loss": -38.77805148668526, "global_step": 129348, "epoch": 1068, "val_loss": 2763792.0} {"train_loss": -39.0131950378418, "global_step": 129349, "epoch": 1069} {"train_loss": -39.443267822265625, "global_step": 129350, "epoch": 1069} {"train_loss": -39.53194808959961, "global_step": 129351, "epoch": 1069} {"train_loss": -39.10133743286133, "global_step": 129352, "epoch": 1069} {"train_loss": -39.456180572509766, "global_step": 129353, "epoch": 1069} {"train_loss": -40.391475677490234, "global_step": 129354, "epoch": 1069} {"train_loss": -39.665260314941406, "global_step": 129355, "epoch": 1069} {"train_loss": -39.2514533996582, "global_step": 129356, "epoch": 1069} {"train_loss": -39.490638732910156, "global_step": 129357, "epoch": 1069} {"train_loss": -39.38407897949219, "global_step": 129358, "epoch": 1069} {"train_loss": -39.47605514526367, "global_step": 129359, "epoch": 1069} {"train_loss": -38.37183380126953, "global_step": 129360, "epoch": 1069} {"train_loss": -37.224090576171875, "global_step": 129361, "epoch": 1069} {"train_loss": -37.53219223022461, "global_step": 129362, "epoch": 1069} {"train_loss": -37.08695602416992, "global_step": 129363, "epoch": 1069} {"train_loss": -38.325286865234375, "global_step": 129364, "epoch": 1069} {"train_loss": -36.123592376708984, "global_step": 129365, "epoch": 1069} {"train_loss": -35.34278106689453, "global_step": 129366, "epoch": 1069} {"train_loss": -29.928592681884766, "global_step": 129367, "epoch": 1069} {"train_loss": -22.951404571533203, "global_step": 129368, "epoch": 1069} {"train_loss": -35.06108474731445, "global_step": 129369, "epoch": 1069} {"train_loss": -35.777374267578125, "global_step": 129370, "epoch": 1069} {"train_loss": -27.672260284423828, "global_step": 129371, "epoch": 1069} {"train_loss": -36.64918518066406, "global_step": 129372, "epoch": 1069} {"train_loss": -35.4511604309082, "global_step": 129373, "epoch": 1069} {"train_loss": -33.437374114990234, "global_step": 129374, "epoch": 1069} {"train_loss": -36.56789779663086, "global_step": 129375, "epoch": 1069} {"train_loss": -34.86577606201172, "global_step": 129376, "epoch": 1069} {"train_loss": -35.61959457397461, "global_step": 129377, "epoch": 1069} {"train_loss": -35.56764602661133, "global_step": 129378, "epoch": 1069} {"train_loss": -37.478939056396484, "global_step": 129379, "epoch": 1069} {"train_loss": -35.88645553588867, "global_step": 129380, "epoch": 1069} {"train_loss": -36.12919235229492, "global_step": 129381, "epoch": 1069} {"train_loss": -36.85137176513672, "global_step": 129382, "epoch": 1069} {"train_loss": -38.33058547973633, "global_step": 129383, "epoch": 1069} {"train_loss": -36.752410888671875, "global_step": 129384, "epoch": 1069} {"train_loss": -38.21848678588867, "global_step": 129385, "epoch": 1069} {"train_loss": -36.65789794921875, "global_step": 129386, "epoch": 1069} {"train_loss": -37.59440231323242, "global_step": 129387, "epoch": 1069} {"train_loss": -38.17380905151367, "global_step": 129388, "epoch": 1069} {"train_loss": -36.735816955566406, "global_step": 129389, "epoch": 1069} {"train_loss": -37.568145751953125, "global_step": 129390, "epoch": 1069} {"train_loss": -38.00395584106445, "global_step": 129391, "epoch": 1069} {"train_loss": -37.912776947021484, "global_step": 129392, "epoch": 1069} {"train_loss": -38.123512268066406, "global_step": 129393, "epoch": 1069} {"train_loss": -37.74650955200195, "global_step": 129394, "epoch": 1069} {"train_loss": -37.196285247802734, "global_step": 129395, "epoch": 1069} {"train_loss": -38.43537521362305, "global_step": 129396, "epoch": 1069} {"train_loss": -38.47023391723633, "global_step": 129397, "epoch": 1069} {"train_loss": -38.59645462036133, "global_step": 129398, "epoch": 1069} {"train_loss": -38.253536224365234, "global_step": 129399, "epoch": 1069} {"train_loss": -38.94816970825195, "global_step": 129400, "epoch": 1069} {"train_loss": -35.04952621459961, "global_step": 129401, "epoch": 1069} {"train_loss": -38.8385124206543, "global_step": 129402, "epoch": 1069} {"train_loss": -37.11417770385742, "global_step": 129403, "epoch": 1069} {"train_loss": -38.705074310302734, "global_step": 129404, "epoch": 1069} {"train_loss": -38.635475158691406, "global_step": 129405, "epoch": 1069} {"train_loss": -37.989723205566406, "global_step": 129406, "epoch": 1069} {"train_loss": -39.16709518432617, "global_step": 129407, "epoch": 1069} {"train_loss": -38.71025466918945, "global_step": 129408, "epoch": 1069} {"train_loss": -32.91190719604492, "global_step": 129409, "epoch": 1069} {"train_loss": -39.25435256958008, "global_step": 129410, "epoch": 1069} {"train_loss": -34.40482711791992, "global_step": 129411, "epoch": 1069} {"train_loss": -38.51056671142578, "global_step": 129412, "epoch": 1069} {"train_loss": -38.47573471069336, "global_step": 129413, "epoch": 1069} {"train_loss": -38.46012496948242, "global_step": 129414, "epoch": 1069} {"train_loss": -37.7028694152832, "global_step": 129415, "epoch": 1069} {"train_loss": -38.45240783691406, "global_step": 129416, "epoch": 1069} {"train_loss": -29.1738338470459, "global_step": 129417, "epoch": 1069} {"train_loss": -38.45924758911133, "global_step": 129418, "epoch": 1069} {"train_loss": -38.31623077392578, "global_step": 129419, "epoch": 1069} {"train_loss": -38.19953155517578, "global_step": 129420, "epoch": 1069} {"train_loss": -38.382240295410156, "global_step": 129421, "epoch": 1069} {"train_loss": -38.8675651550293, "global_step": 129422, "epoch": 1069} {"train_loss": -36.515892028808594, "global_step": 129423, "epoch": 1069} {"train_loss": -37.65851974487305, "global_step": 129424, "epoch": 1069} {"train_loss": -38.251014709472656, "global_step": 129425, "epoch": 1069} {"train_loss": -37.32477569580078, "global_step": 129426, "epoch": 1069} {"train_loss": -38.09013748168945, "global_step": 129427, "epoch": 1069} {"train_loss": -37.94085693359375, "global_step": 129428, "epoch": 1069} {"train_loss": -38.2237548828125, "global_step": 129429, "epoch": 1069} {"train_loss": -38.75843048095703, "global_step": 129430, "epoch": 1069} {"train_loss": -38.73365020751953, "global_step": 129431, "epoch": 1069} {"train_loss": -38.428565979003906, "global_step": 129432, "epoch": 1069} {"train_loss": -37.42458724975586, "global_step": 129433, "epoch": 1069} {"train_loss": -38.00992202758789, "global_step": 129434, "epoch": 1069} {"train_loss": -38.02451705932617, "global_step": 129435, "epoch": 1069} {"train_loss": -39.21025466918945, "global_step": 129436, "epoch": 1069} {"train_loss": -39.09749984741211, "global_step": 129437, "epoch": 1069} {"train_loss": -39.221317291259766, "global_step": 129438, "epoch": 1069} {"train_loss": -38.46638107299805, "global_step": 129439, "epoch": 1069} {"train_loss": -37.23228073120117, "global_step": 129440, "epoch": 1069} {"train_loss": -38.24665451049805, "global_step": 129441, "epoch": 1069} {"train_loss": -38.84815216064453, "global_step": 129442, "epoch": 1069} {"train_loss": -39.66028594970703, "global_step": 129443, "epoch": 1069} {"train_loss": -38.89310836791992, "global_step": 129444, "epoch": 1069} {"train_loss": -38.65281295776367, "global_step": 129445, "epoch": 1069} {"train_loss": -38.66267776489258, "global_step": 129446, "epoch": 1069} {"train_loss": -39.497764587402344, "global_step": 129447, "epoch": 1069} {"train_loss": -39.244930267333984, "global_step": 129448, "epoch": 1069} {"train_loss": -39.666648864746094, "global_step": 129449, "epoch": 1069} {"train_loss": -39.30398178100586, "global_step": 129450, "epoch": 1069} {"train_loss": -38.32627487182617, "global_step": 129451, "epoch": 1069} {"train_loss": -38.808265686035156, "global_step": 129452, "epoch": 1069} {"train_loss": -39.11052322387695, "global_step": 129453, "epoch": 1069} {"train_loss": -39.710906982421875, "global_step": 129454, "epoch": 1069} {"train_loss": -39.66817092895508, "global_step": 129455, "epoch": 1069} {"train_loss": -38.85873794555664, "global_step": 129456, "epoch": 1069} {"train_loss": -39.306705474853516, "global_step": 129457, "epoch": 1069} {"train_loss": -39.640869140625, "global_step": 129458, "epoch": 1069} {"train_loss": -39.320709228515625, "global_step": 129459, "epoch": 1069} {"train_loss": -38.87910079956055, "global_step": 129460, "epoch": 1069} {"train_loss": -39.1842041015625, "global_step": 129461, "epoch": 1069} {"train_loss": -39.18830871582031, "global_step": 129462, "epoch": 1069} {"train_loss": -39.374000549316406, "global_step": 129463, "epoch": 1069} {"train_loss": -39.128013610839844, "global_step": 129464, "epoch": 1069} {"train_loss": -31.0181827545166, "global_step": 129465, "epoch": 1069} {"train_loss": -39.8015022277832, "global_step": 129466, "epoch": 1069} {"train_loss": -39.153228759765625, "global_step": 129467, "epoch": 1069} {"train_loss": -37.16054153442383, "global_step": 129468, "epoch": 1069} {"train_loss": -37.66904045924667, "global_step": 129469, "epoch": 1069, "val_loss": 3197517.25} {"train_loss": -37.59324645996094, "global_step": 129470, "epoch": 1070} {"train_loss": -36.466156005859375, "global_step": 129471, "epoch": 1070} {"train_loss": -38.838478088378906, "global_step": 129472, "epoch": 1070} {"train_loss": -38.501216888427734, "global_step": 129473, "epoch": 1070} {"train_loss": -39.28278732299805, "global_step": 129474, "epoch": 1070} {"train_loss": -38.99877166748047, "global_step": 129475, "epoch": 1070} {"train_loss": -37.96666717529297, "global_step": 129476, "epoch": 1070} {"train_loss": -38.48066329956055, "global_step": 129477, "epoch": 1070} {"train_loss": -37.355770111083984, "global_step": 129478, "epoch": 1070} {"train_loss": -36.35321807861328, "global_step": 129479, "epoch": 1070} {"train_loss": -37.766876220703125, "global_step": 129480, "epoch": 1070} {"train_loss": -38.7021598815918, "global_step": 129481, "epoch": 1070} {"train_loss": -39.0086669921875, "global_step": 129482, "epoch": 1070} {"train_loss": -38.57984924316406, "global_step": 129483, "epoch": 1070} {"train_loss": -37.285560607910156, "global_step": 129484, "epoch": 1070} {"train_loss": -38.0124626159668, "global_step": 129485, "epoch": 1070} {"train_loss": -37.4464225769043, "global_step": 129486, "epoch": 1070} {"train_loss": -38.40017318725586, "global_step": 129487, "epoch": 1070} {"train_loss": -37.61146926879883, "global_step": 129488, "epoch": 1070} {"train_loss": -38.41453170776367, "global_step": 129489, "epoch": 1070} {"train_loss": -37.93097686767578, "global_step": 129490, "epoch": 1070} {"train_loss": -37.9304313659668, "global_step": 129491, "epoch": 1070} {"train_loss": -37.3420524597168, "global_step": 129492, "epoch": 1070} {"train_loss": -38.23140335083008, "global_step": 129493, "epoch": 1070} {"train_loss": -37.9354248046875, "global_step": 129494, "epoch": 1070} {"train_loss": -38.75934600830078, "global_step": 129495, "epoch": 1070} {"train_loss": -38.16834259033203, "global_step": 129496, "epoch": 1070} {"train_loss": -36.135963439941406, "global_step": 129497, "epoch": 1070} {"train_loss": -38.37405776977539, "global_step": 129498, "epoch": 1070} {"train_loss": -37.61039352416992, "global_step": 129499, "epoch": 1070} {"train_loss": -37.22498321533203, "global_step": 129500, "epoch": 1070} {"train_loss": -37.2138557434082, "global_step": 129501, "epoch": 1070} {"train_loss": -38.02393341064453, "global_step": 129502, "epoch": 1070} {"train_loss": -37.132503509521484, "global_step": 129503, "epoch": 1070} {"train_loss": -37.945674896240234, "global_step": 129504, "epoch": 1070} {"train_loss": -37.47762680053711, "global_step": 129505, "epoch": 1070} {"train_loss": -38.19657516479492, "global_step": 129506, "epoch": 1070} {"train_loss": -37.12091064453125, "global_step": 129507, "epoch": 1070} {"train_loss": -38.00611114501953, "global_step": 129508, "epoch": 1070} {"train_loss": -36.70957565307617, "global_step": 129509, "epoch": 1070} {"train_loss": -38.631248474121094, "global_step": 129510, "epoch": 1070} {"train_loss": -38.29537582397461, "global_step": 129511, "epoch": 1070} {"train_loss": -38.06776809692383, "global_step": 129512, "epoch": 1070} {"train_loss": -38.16728210449219, "global_step": 129513, "epoch": 1070} {"train_loss": -38.48615264892578, "global_step": 129514, "epoch": 1070} {"train_loss": -38.43135452270508, "global_step": 129515, "epoch": 1070} {"train_loss": -38.46149826049805, "global_step": 129516, "epoch": 1070} {"train_loss": -37.957275390625, "global_step": 129517, "epoch": 1070} {"train_loss": -37.37425994873047, "global_step": 129518, "epoch": 1070} {"train_loss": -37.60576248168945, "global_step": 129519, "epoch": 1070} {"train_loss": -38.58534240722656, "global_step": 129520, "epoch": 1070} {"train_loss": -37.82459259033203, "global_step": 129521, "epoch": 1070} {"train_loss": -37.013797760009766, "global_step": 129522, "epoch": 1070} {"train_loss": -36.21242904663086, "global_step": 129523, "epoch": 1070} {"train_loss": -38.30411911010742, "global_step": 129524, "epoch": 1070} {"train_loss": -36.1695671081543, "global_step": 129525, "epoch": 1070} {"train_loss": -35.500667572021484, "global_step": 129526, "epoch": 1070} {"train_loss": -37.192264556884766, "global_step": 129527, "epoch": 1070} {"train_loss": -38.56190490722656, "global_step": 129528, "epoch": 1070} {"train_loss": -37.505760192871094, "global_step": 129529, "epoch": 1070} {"train_loss": -37.95858383178711, "global_step": 129530, "epoch": 1070} {"train_loss": -38.37688064575195, "global_step": 129531, "epoch": 1070} {"train_loss": -38.52360916137695, "global_step": 129532, "epoch": 1070} {"train_loss": -39.62221908569336, "global_step": 129533, "epoch": 1070} {"train_loss": -38.511104583740234, "global_step": 129534, "epoch": 1070} {"train_loss": -39.02145004272461, "global_step": 129535, "epoch": 1070} {"train_loss": -38.72447967529297, "global_step": 129536, "epoch": 1070} {"train_loss": -38.93394088745117, "global_step": 129537, "epoch": 1070} {"train_loss": -39.24114990234375, "global_step": 129538, "epoch": 1070} {"train_loss": -38.744930267333984, "global_step": 129539, "epoch": 1070} {"train_loss": -39.584102630615234, "global_step": 129540, "epoch": 1070} {"train_loss": -39.41452407836914, "global_step": 129541, "epoch": 1070} {"train_loss": -37.79374313354492, "global_step": 129542, "epoch": 1070} {"train_loss": -38.13639450073242, "global_step": 129543, "epoch": 1070} {"train_loss": -38.4521598815918, "global_step": 129544, "epoch": 1070} {"train_loss": -39.50185775756836, "global_step": 129545, "epoch": 1070} {"train_loss": -39.116302490234375, "global_step": 129546, "epoch": 1070} {"train_loss": -39.58622360229492, "global_step": 129547, "epoch": 1070} {"train_loss": -38.98298645019531, "global_step": 129548, "epoch": 1070} {"train_loss": -39.06195831298828, "global_step": 129549, "epoch": 1070} {"train_loss": -39.04052734375, "global_step": 129550, "epoch": 1070} {"train_loss": -38.85934066772461, "global_step": 129551, "epoch": 1070} {"train_loss": -39.730899810791016, "global_step": 129552, "epoch": 1070} {"train_loss": -39.128177642822266, "global_step": 129553, "epoch": 1070} {"train_loss": -39.55643844604492, "global_step": 129554, "epoch": 1070} {"train_loss": -39.59844970703125, "global_step": 129555, "epoch": 1070} {"train_loss": -39.61505126953125, "global_step": 129556, "epoch": 1070} {"train_loss": -38.88568115234375, "global_step": 129557, "epoch": 1070} {"train_loss": -39.2425537109375, "global_step": 129558, "epoch": 1070} {"train_loss": -39.41877365112305, "global_step": 129559, "epoch": 1070} {"train_loss": -39.54099655151367, "global_step": 129560, "epoch": 1070} {"train_loss": -39.94514465332031, "global_step": 129561, "epoch": 1070} {"train_loss": -39.52141189575195, "global_step": 129562, "epoch": 1070} {"train_loss": -39.81037521362305, "global_step": 129563, "epoch": 1070} {"train_loss": -39.69399642944336, "global_step": 129564, "epoch": 1070} {"train_loss": -39.21337890625, "global_step": 129565, "epoch": 1070} {"train_loss": -39.030330657958984, "global_step": 129566, "epoch": 1070} {"train_loss": -38.99021911621094, "global_step": 129567, "epoch": 1070} {"train_loss": -39.32432174682617, "global_step": 129568, "epoch": 1070} {"train_loss": -39.817474365234375, "global_step": 129569, "epoch": 1070} {"train_loss": -39.862831115722656, "global_step": 129570, "epoch": 1070} {"train_loss": -39.29588317871094, "global_step": 129571, "epoch": 1070} {"train_loss": -39.00899887084961, "global_step": 129572, "epoch": 1070} {"train_loss": -37.94004821777344, "global_step": 129573, "epoch": 1070} {"train_loss": -38.11056137084961, "global_step": 129574, "epoch": 1070} {"train_loss": -40.104766845703125, "global_step": 129575, "epoch": 1070} {"train_loss": -39.167720794677734, "global_step": 129576, "epoch": 1070} {"train_loss": -38.33076095581055, "global_step": 129577, "epoch": 1070} {"train_loss": -39.20785140991211, "global_step": 129578, "epoch": 1070} {"train_loss": -40.06201934814453, "global_step": 129579, "epoch": 1070} {"train_loss": -39.69734573364258, "global_step": 129580, "epoch": 1070} {"train_loss": -39.08620071411133, "global_step": 129581, "epoch": 1070} {"train_loss": -38.85222625732422, "global_step": 129582, "epoch": 1070} {"train_loss": -39.74369812011719, "global_step": 129583, "epoch": 1070} {"train_loss": -40.047401428222656, "global_step": 129584, "epoch": 1070} {"train_loss": -39.43780517578125, "global_step": 129585, "epoch": 1070} {"train_loss": -39.62834548950195, "global_step": 129586, "epoch": 1070} {"train_loss": -39.82613754272461, "global_step": 129587, "epoch": 1070} {"train_loss": -39.7691764831543, "global_step": 129588, "epoch": 1070} {"train_loss": -39.507511138916016, "global_step": 129589, "epoch": 1070} {"train_loss": -38.51074827209977, "global_step": 129590, "epoch": 1070, "val_loss": 2675916.0} {"train_loss": -40.06025314331055, "global_step": 129591, "epoch": 1071} {"train_loss": -40.01848220825195, "global_step": 129592, "epoch": 1071} {"train_loss": -39.99999237060547, "global_step": 129593, "epoch": 1071} {"train_loss": -39.94407272338867, "global_step": 129594, "epoch": 1071} {"train_loss": -40.501678466796875, "global_step": 129595, "epoch": 1071} {"train_loss": -39.89353561401367, "global_step": 129596, "epoch": 1071} {"train_loss": -40.273719787597656, "global_step": 129597, "epoch": 1071} {"train_loss": -39.62091064453125, "global_step": 129598, "epoch": 1071} {"train_loss": -38.065040588378906, "global_step": 129599, "epoch": 1071} {"train_loss": -39.90155029296875, "global_step": 129600, "epoch": 1071} {"train_loss": -39.730926513671875, "global_step": 129601, "epoch": 1071} {"train_loss": -39.976158142089844, "global_step": 129602, "epoch": 1071} {"train_loss": -40.0355224609375, "global_step": 129603, "epoch": 1071} {"train_loss": -39.34446334838867, "global_step": 129604, "epoch": 1071} {"train_loss": -39.90682601928711, "global_step": 129605, "epoch": 1071} {"train_loss": -40.03142166137695, "global_step": 129606, "epoch": 1071} {"train_loss": -40.11715316772461, "global_step": 129607, "epoch": 1071} {"train_loss": -39.20990753173828, "global_step": 129608, "epoch": 1071} {"train_loss": -38.10185623168945, "global_step": 129609, "epoch": 1071} {"train_loss": -36.82554244995117, "global_step": 129610, "epoch": 1071} {"train_loss": -35.05950164794922, "global_step": 129611, "epoch": 1071} {"train_loss": -35.092620849609375, "global_step": 129612, "epoch": 1071} {"train_loss": -38.9074592590332, "global_step": 129613, "epoch": 1071} {"train_loss": -39.063018798828125, "global_step": 129614, "epoch": 1071} {"train_loss": -36.197052001953125, "global_step": 129615, "epoch": 1071} {"train_loss": -35.16321563720703, "global_step": 129616, "epoch": 1071} {"train_loss": -35.37095260620117, "global_step": 129617, "epoch": 1071} {"train_loss": -38.05550765991211, "global_step": 129618, "epoch": 1071} {"train_loss": -36.68227767944336, "global_step": 129619, "epoch": 1071} {"train_loss": -36.412925720214844, "global_step": 129620, "epoch": 1071} {"train_loss": -36.845699310302734, "global_step": 129621, "epoch": 1071} {"train_loss": -36.37556076049805, "global_step": 129622, "epoch": 1071} {"train_loss": -37.84041213989258, "global_step": 129623, "epoch": 1071} {"train_loss": -39.3767204284668, "global_step": 129624, "epoch": 1071} {"train_loss": -37.98426055908203, "global_step": 129625, "epoch": 1071} {"train_loss": -36.844844818115234, "global_step": 129626, "epoch": 1071} {"train_loss": -38.848819732666016, "global_step": 129627, "epoch": 1071} {"train_loss": -38.03388214111328, "global_step": 129628, "epoch": 1071} {"train_loss": -37.87317657470703, "global_step": 129629, "epoch": 1071} {"train_loss": -36.95978546142578, "global_step": 129630, "epoch": 1071} {"train_loss": -38.18309020996094, "global_step": 129631, "epoch": 1071} {"train_loss": -35.152950286865234, "global_step": 129632, "epoch": 1071} {"train_loss": -38.665992736816406, "global_step": 129633, "epoch": 1071} {"train_loss": -37.6639289855957, "global_step": 129634, "epoch": 1071} {"train_loss": -35.303123474121094, "global_step": 129635, "epoch": 1071} {"train_loss": -38.249488830566406, "global_step": 129636, "epoch": 1071} {"train_loss": -37.831668853759766, "global_step": 129637, "epoch": 1071} {"train_loss": -36.19725799560547, "global_step": 129638, "epoch": 1071} {"train_loss": -37.893672943115234, "global_step": 129639, "epoch": 1071} {"train_loss": -36.79534912109375, "global_step": 129640, "epoch": 1071} {"train_loss": -37.74831771850586, "global_step": 129641, "epoch": 1071} {"train_loss": -38.11592483520508, "global_step": 129642, "epoch": 1071} {"train_loss": -38.3455810546875, "global_step": 129643, "epoch": 1071} {"train_loss": -38.98312759399414, "global_step": 129644, "epoch": 1071} {"train_loss": -37.51797103881836, "global_step": 129645, "epoch": 1071} {"train_loss": -36.567474365234375, "global_step": 129646, "epoch": 1071} {"train_loss": -38.125308990478516, "global_step": 129647, "epoch": 1071} {"train_loss": -35.9492073059082, "global_step": 129648, "epoch": 1071} {"train_loss": -37.123104095458984, "global_step": 129649, "epoch": 1071} {"train_loss": -37.87467575073242, "global_step": 129650, "epoch": 1071} {"train_loss": -37.903560638427734, "global_step": 129651, "epoch": 1071} {"train_loss": -37.40060043334961, "global_step": 129652, "epoch": 1071} {"train_loss": -39.448020935058594, "global_step": 129653, "epoch": 1071} {"train_loss": -36.97756576538086, "global_step": 129654, "epoch": 1071} {"train_loss": -38.49040222167969, "global_step": 129655, "epoch": 1071} {"train_loss": -38.932647705078125, "global_step": 129656, "epoch": 1071} {"train_loss": -38.04707717895508, "global_step": 129657, "epoch": 1071} {"train_loss": -38.74440002441406, "global_step": 129658, "epoch": 1071} {"train_loss": -36.844120025634766, "global_step": 129659, "epoch": 1071} {"train_loss": -39.10506057739258, "global_step": 129660, "epoch": 1071} {"train_loss": -37.10859298706055, "global_step": 129661, "epoch": 1071} {"train_loss": -38.50962829589844, "global_step": 129662, "epoch": 1071} {"train_loss": -37.67426681518555, "global_step": 129663, "epoch": 1071} {"train_loss": -38.19588851928711, "global_step": 129664, "epoch": 1071} {"train_loss": -37.4483642578125, "global_step": 129665, "epoch": 1071} {"train_loss": -37.881629943847656, "global_step": 129666, "epoch": 1071} {"train_loss": -37.3752555847168, "global_step": 129667, "epoch": 1071} {"train_loss": -38.4835319519043, "global_step": 129668, "epoch": 1071} {"train_loss": -38.92902374267578, "global_step": 129669, "epoch": 1071} {"train_loss": -38.8062629699707, "global_step": 129670, "epoch": 1071} {"train_loss": -38.73726272583008, "global_step": 129671, "epoch": 1071} {"train_loss": -39.33262634277344, "global_step": 129672, "epoch": 1071} {"train_loss": -37.91701889038086, "global_step": 129673, "epoch": 1071} {"train_loss": -36.81013870239258, "global_step": 129674, "epoch": 1071} {"train_loss": -39.07267379760742, "global_step": 129675, "epoch": 1071} {"train_loss": -39.40607452392578, "global_step": 129676, "epoch": 1071} {"train_loss": -38.89603805541992, "global_step": 129677, "epoch": 1071} {"train_loss": -38.06708908081055, "global_step": 129678, "epoch": 1071} {"train_loss": -39.54960250854492, "global_step": 129679, "epoch": 1071} {"train_loss": -39.20430374145508, "global_step": 129680, "epoch": 1071} {"train_loss": -38.44760513305664, "global_step": 129681, "epoch": 1071} {"train_loss": -39.703224182128906, "global_step": 129682, "epoch": 1071} {"train_loss": -38.19479751586914, "global_step": 129683, "epoch": 1071} {"train_loss": -39.971168518066406, "global_step": 129684, "epoch": 1071} {"train_loss": -39.38465118408203, "global_step": 129685, "epoch": 1071} {"train_loss": -39.666961669921875, "global_step": 129686, "epoch": 1071} {"train_loss": -37.95336151123047, "global_step": 129687, "epoch": 1071} {"train_loss": -38.466732025146484, "global_step": 129688, "epoch": 1071} {"train_loss": -38.53813552856445, "global_step": 129689, "epoch": 1071} {"train_loss": -39.84938049316406, "global_step": 129690, "epoch": 1071} {"train_loss": -38.66936111450195, "global_step": 129691, "epoch": 1071} {"train_loss": -39.60630416870117, "global_step": 129692, "epoch": 1071} {"train_loss": -40.07185745239258, "global_step": 129693, "epoch": 1071} {"train_loss": -38.017276763916016, "global_step": 129694, "epoch": 1071} {"train_loss": -39.173194885253906, "global_step": 129695, "epoch": 1071} {"train_loss": -39.85752487182617, "global_step": 129696, "epoch": 1071} {"train_loss": -39.27608871459961, "global_step": 129697, "epoch": 1071} {"train_loss": -39.78102493286133, "global_step": 129698, "epoch": 1071} {"train_loss": -40.02116012573242, "global_step": 129699, "epoch": 1071} {"train_loss": -39.68331527709961, "global_step": 129700, "epoch": 1071} {"train_loss": -39.54545211791992, "global_step": 129701, "epoch": 1071} {"train_loss": -39.72356033325195, "global_step": 129702, "epoch": 1071} {"train_loss": -39.59481430053711, "global_step": 129703, "epoch": 1071} {"train_loss": -38.8446044921875, "global_step": 129704, "epoch": 1071} {"train_loss": -39.69731140136719, "global_step": 129705, "epoch": 1071} {"train_loss": -39.35230255126953, "global_step": 129706, "epoch": 1071} {"train_loss": -39.97588348388672, "global_step": 129707, "epoch": 1071} {"train_loss": -39.674373626708984, "global_step": 129708, "epoch": 1071} {"train_loss": -39.33423614501953, "global_step": 129709, "epoch": 1071} {"train_loss": -40.27787399291992, "global_step": 129710, "epoch": 1071} {"train_loss": -38.4498637175757, "global_step": 129711, "epoch": 1071, "val_loss": 2623631.5} {"train_loss": -39.334014892578125, "global_step": 129712, "epoch": 1072} {"train_loss": -40.0140495300293, "global_step": 129713, "epoch": 1072} {"train_loss": -39.96324157714844, "global_step": 129714, "epoch": 1072} {"train_loss": -40.037452697753906, "global_step": 129715, "epoch": 1072} {"train_loss": -40.12530517578125, "global_step": 129716, "epoch": 1072} {"train_loss": -40.15718460083008, "global_step": 129717, "epoch": 1072} {"train_loss": -38.66294479370117, "global_step": 129718, "epoch": 1072} {"train_loss": -38.455989837646484, "global_step": 129719, "epoch": 1072} {"train_loss": -39.36012649536133, "global_step": 129720, "epoch": 1072} {"train_loss": -39.287925720214844, "global_step": 129721, "epoch": 1072} {"train_loss": -37.3517951965332, "global_step": 129722, "epoch": 1072} {"train_loss": -38.845619201660156, "global_step": 129723, "epoch": 1072} {"train_loss": -38.457801818847656, "global_step": 129724, "epoch": 1072} {"train_loss": -38.48500442504883, "global_step": 129725, "epoch": 1072} {"train_loss": -38.85212326049805, "global_step": 129726, "epoch": 1072} {"train_loss": -38.968685150146484, "global_step": 129727, "epoch": 1072} {"train_loss": -39.64197540283203, "global_step": 129728, "epoch": 1072} {"train_loss": -39.88051223754883, "global_step": 129729, "epoch": 1072} {"train_loss": -39.43403244018555, "global_step": 129730, "epoch": 1072} {"train_loss": -38.64240264892578, "global_step": 129731, "epoch": 1072} {"train_loss": -39.81718063354492, "global_step": 129732, "epoch": 1072} {"train_loss": -38.998451232910156, "global_step": 129733, "epoch": 1072} {"train_loss": -38.3202018737793, "global_step": 129734, "epoch": 1072} {"train_loss": -38.797874450683594, "global_step": 129735, "epoch": 1072} {"train_loss": -39.659461975097656, "global_step": 129736, "epoch": 1072} {"train_loss": -39.126007080078125, "global_step": 129737, "epoch": 1072} {"train_loss": -39.47722244262695, "global_step": 129738, "epoch": 1072} {"train_loss": -39.26806640625, "global_step": 129739, "epoch": 1072} {"train_loss": -39.933876037597656, "global_step": 129740, "epoch": 1072} {"train_loss": -38.77185821533203, "global_step": 129741, "epoch": 1072} {"train_loss": -39.3461799621582, "global_step": 129742, "epoch": 1072} {"train_loss": -39.681678771972656, "global_step": 129743, "epoch": 1072} {"train_loss": -38.16800308227539, "global_step": 129744, "epoch": 1072} {"train_loss": -39.654388427734375, "global_step": 129745, "epoch": 1072} {"train_loss": -37.65126419067383, "global_step": 129746, "epoch": 1072} {"train_loss": -38.18635940551758, "global_step": 129747, "epoch": 1072} {"train_loss": -39.794471740722656, "global_step": 129748, "epoch": 1072} {"train_loss": -40.15189743041992, "global_step": 129749, "epoch": 1072} {"train_loss": -39.533790588378906, "global_step": 129750, "epoch": 1072} {"train_loss": -39.77854537963867, "global_step": 129751, "epoch": 1072} {"train_loss": -39.49018478393555, "global_step": 129752, "epoch": 1072} {"train_loss": -39.7958984375, "global_step": 129753, "epoch": 1072} {"train_loss": -38.58732986450195, "global_step": 129754, "epoch": 1072} {"train_loss": -40.30608367919922, "global_step": 129755, "epoch": 1072} {"train_loss": -40.03390121459961, "global_step": 129756, "epoch": 1072} {"train_loss": -39.9399299621582, "global_step": 129757, "epoch": 1072} {"train_loss": -39.253177642822266, "global_step": 129758, "epoch": 1072} {"train_loss": -40.288818359375, "global_step": 129759, "epoch": 1072} {"train_loss": -39.594608306884766, "global_step": 129760, "epoch": 1072} {"train_loss": -39.127349853515625, "global_step": 129761, "epoch": 1072} {"train_loss": -40.06386184692383, "global_step": 129762, "epoch": 1072} {"train_loss": -39.8192253112793, "global_step": 129763, "epoch": 1072} {"train_loss": -39.58457946777344, "global_step": 129764, "epoch": 1072} {"train_loss": -39.8898811340332, "global_step": 129765, "epoch": 1072} {"train_loss": -39.48395919799805, "global_step": 129766, "epoch": 1072} {"train_loss": -38.80519104003906, "global_step": 129767, "epoch": 1072} {"train_loss": -37.95319366455078, "global_step": 129768, "epoch": 1072} {"train_loss": -38.27748489379883, "global_step": 129769, "epoch": 1072} {"train_loss": -38.197967529296875, "global_step": 129770, "epoch": 1072} {"train_loss": -38.036415100097656, "global_step": 129771, "epoch": 1072} {"train_loss": -39.416175842285156, "global_step": 129772, "epoch": 1072} {"train_loss": -39.357086181640625, "global_step": 129773, "epoch": 1072} {"train_loss": -39.21382522583008, "global_step": 129774, "epoch": 1072} {"train_loss": -39.7752799987793, "global_step": 129775, "epoch": 1072} {"train_loss": -39.56422805786133, "global_step": 129776, "epoch": 1072} {"train_loss": -40.14761734008789, "global_step": 129777, "epoch": 1072} {"train_loss": -38.922401428222656, "global_step": 129778, "epoch": 1072} {"train_loss": -39.73780059814453, "global_step": 129779, "epoch": 1072} {"train_loss": -39.26823043823242, "global_step": 129780, "epoch": 1072} {"train_loss": -39.387874603271484, "global_step": 129781, "epoch": 1072} {"train_loss": -38.277259826660156, "global_step": 129782, "epoch": 1072} {"train_loss": -38.15869140625, "global_step": 129783, "epoch": 1072} {"train_loss": -39.252479553222656, "global_step": 129784, "epoch": 1072} {"train_loss": -38.6989860534668, "global_step": 129785, "epoch": 1072} {"train_loss": -38.68377685546875, "global_step": 129786, "epoch": 1072} {"train_loss": -38.131927490234375, "global_step": 129787, "epoch": 1072} {"train_loss": -38.795135498046875, "global_step": 129788, "epoch": 1072} {"train_loss": -39.182472229003906, "global_step": 129789, "epoch": 1072} {"train_loss": -40.35268783569336, "global_step": 129790, "epoch": 1072} {"train_loss": -39.327247619628906, "global_step": 129791, "epoch": 1072} {"train_loss": -39.20516586303711, "global_step": 129792, "epoch": 1072} {"train_loss": -38.75234603881836, "global_step": 129793, "epoch": 1072} {"train_loss": -39.355499267578125, "global_step": 129794, "epoch": 1072} {"train_loss": -39.75571823120117, "global_step": 129795, "epoch": 1072} {"train_loss": -39.22992706298828, "global_step": 129796, "epoch": 1072} {"train_loss": -39.594886779785156, "global_step": 129797, "epoch": 1072} {"train_loss": -39.35618209838867, "global_step": 129798, "epoch": 1072} {"train_loss": -39.09738540649414, "global_step": 129799, "epoch": 1072} {"train_loss": -39.54751205444336, "global_step": 129800, "epoch": 1072} {"train_loss": -39.319087982177734, "global_step": 129801, "epoch": 1072} {"train_loss": -39.729393005371094, "global_step": 129802, "epoch": 1072} {"train_loss": -39.584720611572266, "global_step": 129803, "epoch": 1072} {"train_loss": -39.339691162109375, "global_step": 129804, "epoch": 1072} {"train_loss": -39.771942138671875, "global_step": 129805, "epoch": 1072} {"train_loss": -39.03530502319336, "global_step": 129806, "epoch": 1072} {"train_loss": -39.8484001159668, "global_step": 129807, "epoch": 1072} {"train_loss": -39.9591064453125, "global_step": 129808, "epoch": 1072} {"train_loss": -39.6546516418457, "global_step": 129809, "epoch": 1072} {"train_loss": -40.24353790283203, "global_step": 129810, "epoch": 1072} {"train_loss": -39.331764221191406, "global_step": 129811, "epoch": 1072} {"train_loss": -40.0240478515625, "global_step": 129812, "epoch": 1072} {"train_loss": -39.42277145385742, "global_step": 129813, "epoch": 1072} {"train_loss": -39.849327087402344, "global_step": 129814, "epoch": 1072} {"train_loss": -36.8060302734375, "global_step": 129815, "epoch": 1072} {"train_loss": -38.00504684448242, "global_step": 129816, "epoch": 1072} {"train_loss": -38.61231231689453, "global_step": 129817, "epoch": 1072} {"train_loss": -37.097145080566406, "global_step": 129818, "epoch": 1072} {"train_loss": -38.13862991333008, "global_step": 129819, "epoch": 1072} {"train_loss": -36.37629318237305, "global_step": 129820, "epoch": 1072} {"train_loss": -35.83553695678711, "global_step": 129821, "epoch": 1072} {"train_loss": -38.59159469604492, "global_step": 129822, "epoch": 1072} {"train_loss": -36.946414947509766, "global_step": 129823, "epoch": 1072} {"train_loss": -38.2103271484375, "global_step": 129824, "epoch": 1072} {"train_loss": -35.96098327636719, "global_step": 129825, "epoch": 1072} {"train_loss": -36.279388427734375, "global_step": 129826, "epoch": 1072} {"train_loss": -36.20252227783203, "global_step": 129827, "epoch": 1072} {"train_loss": -36.72447967529297, "global_step": 129828, "epoch": 1072} {"train_loss": -38.46824264526367, "global_step": 129829, "epoch": 1072} {"train_loss": -37.84558868408203, "global_step": 129830, "epoch": 1072} {"train_loss": -35.910030364990234, "global_step": 129831, "epoch": 1072} {"train_loss": -38.98235992557746, "global_step": 129832, "epoch": 1072, "val_loss": 2683076.25} {"train_loss": -38.98301315307617, "global_step": 129833, "epoch": 1073} {"train_loss": -36.76486587524414, "global_step": 129834, "epoch": 1073} {"train_loss": -38.11947250366211, "global_step": 129835, "epoch": 1073} {"train_loss": -38.760009765625, "global_step": 129836, "epoch": 1073} {"train_loss": -39.1981201171875, "global_step": 129837, "epoch": 1073} {"train_loss": -39.33793258666992, "global_step": 129838, "epoch": 1073} {"train_loss": -38.61925506591797, "global_step": 129839, "epoch": 1073} {"train_loss": -39.518978118896484, "global_step": 129840, "epoch": 1073} {"train_loss": -39.436126708984375, "global_step": 129841, "epoch": 1073} {"train_loss": -38.04536819458008, "global_step": 129842, "epoch": 1073} {"train_loss": -39.379371643066406, "global_step": 129843, "epoch": 1073} {"train_loss": -39.242095947265625, "global_step": 129844, "epoch": 1073} {"train_loss": -39.37553787231445, "global_step": 129845, "epoch": 1073} {"train_loss": -38.85152816772461, "global_step": 129846, "epoch": 1073} {"train_loss": -39.22845458984375, "global_step": 129847, "epoch": 1073} {"train_loss": -38.98023223876953, "global_step": 129848, "epoch": 1073} {"train_loss": -39.1236457824707, "global_step": 129849, "epoch": 1073} {"train_loss": -39.17765426635742, "global_step": 129850, "epoch": 1073} {"train_loss": -40.03005599975586, "global_step": 129851, "epoch": 1073} {"train_loss": -39.5562858581543, "global_step": 129852, "epoch": 1073} {"train_loss": -39.96175003051758, "global_step": 129853, "epoch": 1073} {"train_loss": -39.365272521972656, "global_step": 129854, "epoch": 1073} {"train_loss": -39.75360107421875, "global_step": 129855, "epoch": 1073} {"train_loss": -39.46196365356445, "global_step": 129856, "epoch": 1073} {"train_loss": -39.844173431396484, "global_step": 129857, "epoch": 1073} {"train_loss": -39.650577545166016, "global_step": 129858, "epoch": 1073} {"train_loss": -39.96432876586914, "global_step": 129859, "epoch": 1073} {"train_loss": -39.63056182861328, "global_step": 129860, "epoch": 1073} {"train_loss": -39.920654296875, "global_step": 129861, "epoch": 1073} {"train_loss": -39.94858932495117, "global_step": 129862, "epoch": 1073} {"train_loss": -39.735260009765625, "global_step": 129863, "epoch": 1073} {"train_loss": -39.55744171142578, "global_step": 129864, "epoch": 1073} {"train_loss": -38.88914108276367, "global_step": 129865, "epoch": 1073} {"train_loss": -40.574806213378906, "global_step": 129866, "epoch": 1073} {"train_loss": -40.27827835083008, "global_step": 129867, "epoch": 1073} {"train_loss": -40.1601448059082, "global_step": 129868, "epoch": 1073} {"train_loss": -39.75208282470703, "global_step": 129869, "epoch": 1073} {"train_loss": -40.039058685302734, "global_step": 129870, "epoch": 1073} {"train_loss": -40.41219711303711, "global_step": 129871, "epoch": 1073} {"train_loss": -39.79409408569336, "global_step": 129872, "epoch": 1073} {"train_loss": -39.79631042480469, "global_step": 129873, "epoch": 1073} {"train_loss": -40.350685119628906, "global_step": 129874, "epoch": 1073} {"train_loss": -40.401649475097656, "global_step": 129875, "epoch": 1073} {"train_loss": -40.24516296386719, "global_step": 129876, "epoch": 1073} {"train_loss": -40.09648513793945, "global_step": 129877, "epoch": 1073} {"train_loss": -38.933990478515625, "global_step": 129878, "epoch": 1073} {"train_loss": -39.344329833984375, "global_step": 129879, "epoch": 1073} {"train_loss": -39.25822830200195, "global_step": 129880, "epoch": 1073} {"train_loss": -39.98979949951172, "global_step": 129881, "epoch": 1073} {"train_loss": -39.91753005981445, "global_step": 129882, "epoch": 1073} {"train_loss": -39.404296875, "global_step": 129883, "epoch": 1073} {"train_loss": -35.83254623413086, "global_step": 129884, "epoch": 1073} {"train_loss": -33.37031173706055, "global_step": 129885, "epoch": 1073} {"train_loss": -34.054168701171875, "global_step": 129886, "epoch": 1073} {"train_loss": -35.07014083862305, "global_step": 129887, "epoch": 1073} {"train_loss": -36.7698860168457, "global_step": 129888, "epoch": 1073} {"train_loss": -37.01096725463867, "global_step": 129889, "epoch": 1073} {"train_loss": -38.77610397338867, "global_step": 129890, "epoch": 1073} {"train_loss": -39.03642654418945, "global_step": 129891, "epoch": 1073} {"train_loss": -36.76290512084961, "global_step": 129892, "epoch": 1073} {"train_loss": -39.10834503173828, "global_step": 129893, "epoch": 1073} {"train_loss": -38.28468322753906, "global_step": 129894, "epoch": 1073} {"train_loss": -36.62850570678711, "global_step": 129895, "epoch": 1073} {"train_loss": -39.0432243347168, "global_step": 129896, "epoch": 1073} {"train_loss": -38.802162170410156, "global_step": 129897, "epoch": 1073} {"train_loss": -37.04618835449219, "global_step": 129898, "epoch": 1073} {"train_loss": -39.222564697265625, "global_step": 129899, "epoch": 1073} {"train_loss": -38.99747848510742, "global_step": 129900, "epoch": 1073} {"train_loss": -38.365699768066406, "global_step": 129901, "epoch": 1073} {"train_loss": -39.07933807373047, "global_step": 129902, "epoch": 1073} {"train_loss": -38.47823715209961, "global_step": 129903, "epoch": 1073} {"train_loss": -39.23823928833008, "global_step": 129904, "epoch": 1073} {"train_loss": -39.233551025390625, "global_step": 129905, "epoch": 1073} {"train_loss": -38.81222152709961, "global_step": 129906, "epoch": 1073} {"train_loss": -39.91408157348633, "global_step": 129907, "epoch": 1073} {"train_loss": -39.3596305847168, "global_step": 129908, "epoch": 1073} {"train_loss": -38.26227569580078, "global_step": 129909, "epoch": 1073} {"train_loss": -39.355892181396484, "global_step": 129910, "epoch": 1073} {"train_loss": -39.07197189331055, "global_step": 129911, "epoch": 1073} {"train_loss": -39.32750701904297, "global_step": 129912, "epoch": 1073} {"train_loss": -38.924041748046875, "global_step": 129913, "epoch": 1073} {"train_loss": -39.697872161865234, "global_step": 129914, "epoch": 1073} {"train_loss": -39.227535247802734, "global_step": 129915, "epoch": 1073} {"train_loss": -39.178260803222656, "global_step": 129916, "epoch": 1073} {"train_loss": -37.752906799316406, "global_step": 129917, "epoch": 1073} {"train_loss": -39.014225006103516, "global_step": 129918, "epoch": 1073} {"train_loss": -39.558040618896484, "global_step": 129919, "epoch": 1073} {"train_loss": -37.7438850402832, "global_step": 129920, "epoch": 1073} {"train_loss": -38.591007232666016, "global_step": 129921, "epoch": 1073} {"train_loss": -39.23991775512695, "global_step": 129922, "epoch": 1073} {"train_loss": -39.19277572631836, "global_step": 129923, "epoch": 1073} {"train_loss": -39.041038513183594, "global_step": 129924, "epoch": 1073} {"train_loss": -39.35928726196289, "global_step": 129925, "epoch": 1073} {"train_loss": -38.2128791809082, "global_step": 129926, "epoch": 1073} {"train_loss": -39.00199508666992, "global_step": 129927, "epoch": 1073} {"train_loss": -39.08738327026367, "global_step": 129928, "epoch": 1073} {"train_loss": -39.3382453918457, "global_step": 129929, "epoch": 1073} {"train_loss": -39.11563491821289, "global_step": 129930, "epoch": 1073} {"train_loss": -39.11550521850586, "global_step": 129931, "epoch": 1073} {"train_loss": -39.58636474609375, "global_step": 129932, "epoch": 1073} {"train_loss": -40.11176681518555, "global_step": 129933, "epoch": 1073} {"train_loss": -39.54499435424805, "global_step": 129934, "epoch": 1073} {"train_loss": -39.54965591430664, "global_step": 129935, "epoch": 1073} {"train_loss": -40.13980484008789, "global_step": 129936, "epoch": 1073} {"train_loss": -40.01728820800781, "global_step": 129937, "epoch": 1073} {"train_loss": -39.80454635620117, "global_step": 129938, "epoch": 1073} {"train_loss": -40.01926040649414, "global_step": 129939, "epoch": 1073} {"train_loss": -39.63546371459961, "global_step": 129940, "epoch": 1073} {"train_loss": -40.596004486083984, "global_step": 129941, "epoch": 1073} {"train_loss": -40.48638153076172, "global_step": 129942, "epoch": 1073} {"train_loss": -39.7991943359375, "global_step": 129943, "epoch": 1073} {"train_loss": -39.71933364868164, "global_step": 129944, "epoch": 1073} {"train_loss": -40.1442756652832, "global_step": 129945, "epoch": 1073} {"train_loss": -40.05228042602539, "global_step": 129946, "epoch": 1073} {"train_loss": -39.36850357055664, "global_step": 129947, "epoch": 1073} {"train_loss": -39.10022735595703, "global_step": 129948, "epoch": 1073} {"train_loss": -38.84490203857422, "global_step": 129949, "epoch": 1073} {"train_loss": -40.10085678100586, "global_step": 129950, "epoch": 1073} {"train_loss": -38.095985412597656, "global_step": 129951, "epoch": 1073} {"train_loss": -38.064308166503906, "global_step": 129952, "epoch": 1073} {"train_loss": -39.07624870489452, "global_step": 129953, "epoch": 1073, "val_loss": 2625756.75} {"train_loss": -39.2609748840332, "global_step": 129954, "epoch": 1074} {"train_loss": -39.58305740356445, "global_step": 129955, "epoch": 1074} {"train_loss": -40.26713180541992, "global_step": 129956, "epoch": 1074} {"train_loss": -38.884639739990234, "global_step": 129957, "epoch": 1074} {"train_loss": -37.60477828979492, "global_step": 129958, "epoch": 1074} {"train_loss": -38.81232833862305, "global_step": 129959, "epoch": 1074} {"train_loss": -40.55706787109375, "global_step": 129960, "epoch": 1074} {"train_loss": -38.57403564453125, "global_step": 129961, "epoch": 1074} {"train_loss": -35.50519943237305, "global_step": 129962, "epoch": 1074} {"train_loss": -35.19464111328125, "global_step": 129963, "epoch": 1074} {"train_loss": -38.39442825317383, "global_step": 129964, "epoch": 1074} {"train_loss": -39.502071380615234, "global_step": 129965, "epoch": 1074} {"train_loss": -36.85348129272461, "global_step": 129966, "epoch": 1074} {"train_loss": -34.2412223815918, "global_step": 129967, "epoch": 1074} {"train_loss": -36.043148040771484, "global_step": 129968, "epoch": 1074} {"train_loss": -38.51707077026367, "global_step": 129969, "epoch": 1074} {"train_loss": -38.8145637512207, "global_step": 129970, "epoch": 1074} {"train_loss": -38.646461486816406, "global_step": 129971, "epoch": 1074} {"train_loss": -37.483642578125, "global_step": 129972, "epoch": 1074} {"train_loss": -38.804298400878906, "global_step": 129973, "epoch": 1074} {"train_loss": -38.71550369262695, "global_step": 129974, "epoch": 1074} {"train_loss": -38.64723205566406, "global_step": 129975, "epoch": 1074} {"train_loss": -39.244441986083984, "global_step": 129976, "epoch": 1074} {"train_loss": -39.18886947631836, "global_step": 129977, "epoch": 1074} {"train_loss": -38.722286224365234, "global_step": 129978, "epoch": 1074} {"train_loss": -39.7996711730957, "global_step": 129979, "epoch": 1074} {"train_loss": -39.8430290222168, "global_step": 129980, "epoch": 1074} {"train_loss": -39.1075439453125, "global_step": 129981, "epoch": 1074} {"train_loss": -40.33321762084961, "global_step": 129982, "epoch": 1074} {"train_loss": -39.43630599975586, "global_step": 129983, "epoch": 1074} {"train_loss": -39.12131118774414, "global_step": 129984, "epoch": 1074} {"train_loss": -39.78618240356445, "global_step": 129985, "epoch": 1074} {"train_loss": -39.55015182495117, "global_step": 129986, "epoch": 1074} {"train_loss": -40.20008850097656, "global_step": 129987, "epoch": 1074} {"train_loss": -39.904518127441406, "global_step": 129988, "epoch": 1074} {"train_loss": -40.274898529052734, "global_step": 129989, "epoch": 1074} {"train_loss": -39.90740203857422, "global_step": 129990, "epoch": 1074} {"train_loss": -39.93572998046875, "global_step": 129991, "epoch": 1074} {"train_loss": -39.92818832397461, "global_step": 129992, "epoch": 1074} {"train_loss": -39.85227584838867, "global_step": 129993, "epoch": 1074} {"train_loss": -40.308387756347656, "global_step": 129994, "epoch": 1074} {"train_loss": -40.295352935791016, "global_step": 129995, "epoch": 1074} {"train_loss": -39.69232177734375, "global_step": 129996, "epoch": 1074} {"train_loss": -40.15943145751953, "global_step": 129997, "epoch": 1074} {"train_loss": -37.729915618896484, "global_step": 129998, "epoch": 1074} {"train_loss": -39.70549774169922, "global_step": 129999, "epoch": 1074} {"train_loss": -38.613197326660156, "global_step": 130000, "epoch": 1074} {"train_loss": -40.051265716552734, "global_step": 130001, "epoch": 1074} {"train_loss": -39.43681335449219, "global_step": 130002, "epoch": 1074} {"train_loss": -40.30928421020508, "global_step": 130003, "epoch": 1074} {"train_loss": -38.56673049926758, "global_step": 130004, "epoch": 1074} {"train_loss": -40.6627082824707, "global_step": 130005, "epoch": 1074} {"train_loss": -40.130577087402344, "global_step": 130006, "epoch": 1074} {"train_loss": -39.65098190307617, "global_step": 130007, "epoch": 1074} {"train_loss": -40.17075729370117, "global_step": 130008, "epoch": 1074} {"train_loss": -40.00019454956055, "global_step": 130009, "epoch": 1074} {"train_loss": -39.16207504272461, "global_step": 130010, "epoch": 1074} {"train_loss": -40.028900146484375, "global_step": 130011, "epoch": 1074} {"train_loss": -39.1783447265625, "global_step": 130012, "epoch": 1074} {"train_loss": -40.24013900756836, "global_step": 130013, "epoch": 1074} {"train_loss": -39.90574264526367, "global_step": 130014, "epoch": 1074} {"train_loss": -38.96363067626953, "global_step": 130015, "epoch": 1074} {"train_loss": -39.89533615112305, "global_step": 130016, "epoch": 1074} {"train_loss": -38.54625701904297, "global_step": 130017, "epoch": 1074} {"train_loss": -36.9732666015625, "global_step": 130018, "epoch": 1074} {"train_loss": -36.68262481689453, "global_step": 130019, "epoch": 1074} {"train_loss": -35.4824333190918, "global_step": 130020, "epoch": 1074} {"train_loss": -39.670318603515625, "global_step": 130021, "epoch": 1074} {"train_loss": -38.375633239746094, "global_step": 130022, "epoch": 1074} {"train_loss": -38.547340393066406, "global_step": 130023, "epoch": 1074} {"train_loss": -37.012298583984375, "global_step": 130024, "epoch": 1074} {"train_loss": -35.556087493896484, "global_step": 130025, "epoch": 1074} {"train_loss": -33.12306213378906, "global_step": 130026, "epoch": 1074} {"train_loss": -35.731746673583984, "global_step": 130027, "epoch": 1074} {"train_loss": -33.49730682373047, "global_step": 130028, "epoch": 1074} {"train_loss": -37.516090393066406, "global_step": 130029, "epoch": 1074} {"train_loss": -33.023921966552734, "global_step": 130030, "epoch": 1074} {"train_loss": -39.12575149536133, "global_step": 130031, "epoch": 1074} {"train_loss": -35.29035186767578, "global_step": 130032, "epoch": 1074} {"train_loss": -34.752410888671875, "global_step": 130033, "epoch": 1074} {"train_loss": -37.652828216552734, "global_step": 130034, "epoch": 1074} {"train_loss": -35.0677490234375, "global_step": 130035, "epoch": 1074} {"train_loss": -37.18898391723633, "global_step": 130036, "epoch": 1074} {"train_loss": -37.30192184448242, "global_step": 130037, "epoch": 1074} {"train_loss": -37.42476272583008, "global_step": 130038, "epoch": 1074} {"train_loss": -37.447811126708984, "global_step": 130039, "epoch": 1074} {"train_loss": -36.948974609375, "global_step": 130040, "epoch": 1074} {"train_loss": -38.21181869506836, "global_step": 130041, "epoch": 1074} {"train_loss": -36.91010665893555, "global_step": 130042, "epoch": 1074} {"train_loss": -38.34496307373047, "global_step": 130043, "epoch": 1074} {"train_loss": -37.489681243896484, "global_step": 130044, "epoch": 1074} {"train_loss": -35.86476516723633, "global_step": 130045, "epoch": 1074} {"train_loss": -38.449275970458984, "global_step": 130046, "epoch": 1074} {"train_loss": -38.58264923095703, "global_step": 130047, "epoch": 1074} {"train_loss": -38.343719482421875, "global_step": 130048, "epoch": 1074} {"train_loss": -37.3585319519043, "global_step": 130049, "epoch": 1074} {"train_loss": -37.51736831665039, "global_step": 130050, "epoch": 1074} {"train_loss": -38.79586410522461, "global_step": 130051, "epoch": 1074} {"train_loss": -38.47294235229492, "global_step": 130052, "epoch": 1074} {"train_loss": -38.525814056396484, "global_step": 130053, "epoch": 1074} {"train_loss": -39.29924392700195, "global_step": 130054, "epoch": 1074} {"train_loss": -38.59820556640625, "global_step": 130055, "epoch": 1074} {"train_loss": -39.04697799682617, "global_step": 130056, "epoch": 1074} {"train_loss": -39.357887268066406, "global_step": 130057, "epoch": 1074} {"train_loss": -39.007686614990234, "global_step": 130058, "epoch": 1074} {"train_loss": -36.882869720458984, "global_step": 130059, "epoch": 1074} {"train_loss": -38.432037353515625, "global_step": 130060, "epoch": 1074} {"train_loss": -39.233009338378906, "global_step": 130061, "epoch": 1074} {"train_loss": -39.1356315612793, "global_step": 130062, "epoch": 1074} {"train_loss": -39.378475189208984, "global_step": 130063, "epoch": 1074} {"train_loss": -39.16212844848633, "global_step": 130064, "epoch": 1074} {"train_loss": -38.86538314819336, "global_step": 130065, "epoch": 1074} {"train_loss": -39.28895950317383, "global_step": 130066, "epoch": 1074} {"train_loss": -36.46686935424805, "global_step": 130067, "epoch": 1074} {"train_loss": -38.853702545166016, "global_step": 130068, "epoch": 1074} {"train_loss": -39.3654899597168, "global_step": 130069, "epoch": 1074} {"train_loss": -39.54792022705078, "global_step": 130070, "epoch": 1074} {"train_loss": -39.078834533691406, "global_step": 130071, "epoch": 1074} {"train_loss": -38.84514617919922, "global_step": 130072, "epoch": 1074} {"train_loss": -38.5377082824707, "global_step": 130073, "epoch": 1074} {"train_loss": -38.44364932351861, "global_step": 130074, "epoch": 1074, "val_loss": 2755680.25} {"train_loss": -38.725704193115234, "global_step": 130075, "epoch": 1075} {"train_loss": -39.170047760009766, "global_step": 130076, "epoch": 1075} {"train_loss": -39.36184310913086, "global_step": 130077, "epoch": 1075} {"train_loss": -39.79555130004883, "global_step": 130078, "epoch": 1075} {"train_loss": -39.27766799926758, "global_step": 130079, "epoch": 1075} {"train_loss": -39.71096420288086, "global_step": 130080, "epoch": 1075} {"train_loss": -39.81649398803711, "global_step": 130081, "epoch": 1075} {"train_loss": -40.014923095703125, "global_step": 130082, "epoch": 1075} {"train_loss": -40.10103225708008, "global_step": 130083, "epoch": 1075} {"train_loss": -39.46684646606445, "global_step": 130084, "epoch": 1075} {"train_loss": -39.626216888427734, "global_step": 130085, "epoch": 1075} {"train_loss": -39.67186737060547, "global_step": 130086, "epoch": 1075} {"train_loss": -39.89443588256836, "global_step": 130087, "epoch": 1075} {"train_loss": -39.66240310668945, "global_step": 130088, "epoch": 1075} {"train_loss": -36.45438766479492, "global_step": 130089, "epoch": 1075} {"train_loss": -37.803253173828125, "global_step": 130090, "epoch": 1075} {"train_loss": -39.0366325378418, "global_step": 130091, "epoch": 1075} {"train_loss": -39.297523498535156, "global_step": 130092, "epoch": 1075} {"train_loss": -39.96987533569336, "global_step": 130093, "epoch": 1075} {"train_loss": -39.79376220703125, "global_step": 130094, "epoch": 1075} {"train_loss": -37.86029815673828, "global_step": 130095, "epoch": 1075} {"train_loss": -39.609283447265625, "global_step": 130096, "epoch": 1075} {"train_loss": -39.24101638793945, "global_step": 130097, "epoch": 1075} {"train_loss": -39.451377868652344, "global_step": 130098, "epoch": 1075} {"train_loss": -39.42129135131836, "global_step": 130099, "epoch": 1075} {"train_loss": -38.81461715698242, "global_step": 130100, "epoch": 1075} {"train_loss": -37.199951171875, "global_step": 130101, "epoch": 1075} {"train_loss": -39.245277404785156, "global_step": 130102, "epoch": 1075} {"train_loss": -37.92838668823242, "global_step": 130103, "epoch": 1075} {"train_loss": -38.32011795043945, "global_step": 130104, "epoch": 1075} {"train_loss": -39.66321563720703, "global_step": 130105, "epoch": 1075} {"train_loss": -37.846656799316406, "global_step": 130106, "epoch": 1075} {"train_loss": -38.57699966430664, "global_step": 130107, "epoch": 1075} {"train_loss": -36.2701416015625, "global_step": 130108, "epoch": 1075} {"train_loss": -39.151344299316406, "global_step": 130109, "epoch": 1075} {"train_loss": -37.607723236083984, "global_step": 130110, "epoch": 1075} {"train_loss": -38.67875671386719, "global_step": 130111, "epoch": 1075} {"train_loss": -39.01112365722656, "global_step": 130112, "epoch": 1075} {"train_loss": -39.388206481933594, "global_step": 130113, "epoch": 1075} {"train_loss": -37.093299865722656, "global_step": 130114, "epoch": 1075} {"train_loss": -36.36503219604492, "global_step": 130115, "epoch": 1075} {"train_loss": -38.64251708984375, "global_step": 130116, "epoch": 1075} {"train_loss": -39.139503479003906, "global_step": 130117, "epoch": 1075} {"train_loss": -38.54624557495117, "global_step": 130118, "epoch": 1075} {"train_loss": -38.575130462646484, "global_step": 130119, "epoch": 1075} {"train_loss": -36.130245208740234, "global_step": 130120, "epoch": 1075} {"train_loss": -38.5716552734375, "global_step": 130121, "epoch": 1075} {"train_loss": -35.226322174072266, "global_step": 130122, "epoch": 1075} {"train_loss": -38.58304977416992, "global_step": 130123, "epoch": 1075} {"train_loss": -38.91851806640625, "global_step": 130124, "epoch": 1075} {"train_loss": -39.35010528564453, "global_step": 130125, "epoch": 1075} {"train_loss": -36.53095245361328, "global_step": 130126, "epoch": 1075} {"train_loss": -38.53376388549805, "global_step": 130127, "epoch": 1075} {"train_loss": -36.130184173583984, "global_step": 130128, "epoch": 1075} {"train_loss": -34.84058380126953, "global_step": 130129, "epoch": 1075} {"train_loss": -38.5764045715332, "global_step": 130130, "epoch": 1075} {"train_loss": -37.526275634765625, "global_step": 130131, "epoch": 1075} {"train_loss": -39.0245475769043, "global_step": 130132, "epoch": 1075} {"train_loss": -38.02769088745117, "global_step": 130133, "epoch": 1075} {"train_loss": -37.5767822265625, "global_step": 130134, "epoch": 1075} {"train_loss": -38.18212890625, "global_step": 130135, "epoch": 1075} {"train_loss": -36.59177780151367, "global_step": 130136, "epoch": 1075} {"train_loss": -38.292755126953125, "global_step": 130137, "epoch": 1075} {"train_loss": -38.77116012573242, "global_step": 130138, "epoch": 1075} {"train_loss": -38.027706146240234, "global_step": 130139, "epoch": 1075} {"train_loss": -37.379310607910156, "global_step": 130140, "epoch": 1075} {"train_loss": -38.07538604736328, "global_step": 130141, "epoch": 1075} {"train_loss": -38.320770263671875, "global_step": 130142, "epoch": 1075} {"train_loss": -38.841880798339844, "global_step": 130143, "epoch": 1075} {"train_loss": -37.10390853881836, "global_step": 130144, "epoch": 1075} {"train_loss": -37.23508834838867, "global_step": 130145, "epoch": 1075} {"train_loss": -38.61090087890625, "global_step": 130146, "epoch": 1075} {"train_loss": -37.97251510620117, "global_step": 130147, "epoch": 1075} {"train_loss": -37.71303176879883, "global_step": 130148, "epoch": 1075} {"train_loss": -39.37248611450195, "global_step": 130149, "epoch": 1075} {"train_loss": -39.01951599121094, "global_step": 130150, "epoch": 1075} {"train_loss": -38.16632080078125, "global_step": 130151, "epoch": 1075} {"train_loss": -38.59461212158203, "global_step": 130152, "epoch": 1075} {"train_loss": -39.368587493896484, "global_step": 130153, "epoch": 1075} {"train_loss": -38.58728790283203, "global_step": 130154, "epoch": 1075} {"train_loss": -38.10158920288086, "global_step": 130155, "epoch": 1075} {"train_loss": -39.30681228637695, "global_step": 130156, "epoch": 1075} {"train_loss": -38.754756927490234, "global_step": 130157, "epoch": 1075} {"train_loss": -38.04727554321289, "global_step": 130158, "epoch": 1075} {"train_loss": -39.37763595581055, "global_step": 130159, "epoch": 1075} {"train_loss": -38.61453628540039, "global_step": 130160, "epoch": 1075} {"train_loss": -39.7252082824707, "global_step": 130161, "epoch": 1075} {"train_loss": -38.89812469482422, "global_step": 130162, "epoch": 1075} {"train_loss": -36.9826774597168, "global_step": 130163, "epoch": 1075} {"train_loss": -39.16201400756836, "global_step": 130164, "epoch": 1075} {"train_loss": -39.5737419128418, "global_step": 130165, "epoch": 1075} {"train_loss": -39.4132194519043, "global_step": 130166, "epoch": 1075} {"train_loss": -37.96065902709961, "global_step": 130167, "epoch": 1075} {"train_loss": -39.94847869873047, "global_step": 130168, "epoch": 1075} {"train_loss": -38.50693893432617, "global_step": 130169, "epoch": 1075} {"train_loss": -38.67269515991211, "global_step": 130170, "epoch": 1075} {"train_loss": -39.52152633666992, "global_step": 130171, "epoch": 1075} {"train_loss": -38.62474060058594, "global_step": 130172, "epoch": 1075} {"train_loss": -38.96514892578125, "global_step": 130173, "epoch": 1075} {"train_loss": -39.925201416015625, "global_step": 130174, "epoch": 1075} {"train_loss": -39.88142776489258, "global_step": 130175, "epoch": 1075} {"train_loss": -39.410457611083984, "global_step": 130176, "epoch": 1075} {"train_loss": -39.776607513427734, "global_step": 130177, "epoch": 1075} {"train_loss": -39.14403533935547, "global_step": 130178, "epoch": 1075} {"train_loss": -32.73484420776367, "global_step": 130179, "epoch": 1075} {"train_loss": -39.54487991333008, "global_step": 130180, "epoch": 1075} {"train_loss": -37.2828369140625, "global_step": 130181, "epoch": 1075} {"train_loss": -39.20122146606445, "global_step": 130182, "epoch": 1075} {"train_loss": -37.51795196533203, "global_step": 130183, "epoch": 1075} {"train_loss": -35.894771575927734, "global_step": 130184, "epoch": 1075} {"train_loss": -37.03629684448242, "global_step": 130185, "epoch": 1075} {"train_loss": -39.263240814208984, "global_step": 130186, "epoch": 1075} {"train_loss": -38.71839904785156, "global_step": 130187, "epoch": 1075} {"train_loss": -35.032020568847656, "global_step": 130188, "epoch": 1075} {"train_loss": -35.277122497558594, "global_step": 130189, "epoch": 1075} {"train_loss": -39.00503921508789, "global_step": 130190, "epoch": 1075} {"train_loss": -37.618377685546875, "global_step": 130191, "epoch": 1075} {"train_loss": -36.64106369018555, "global_step": 130192, "epoch": 1075} {"train_loss": -38.21411895751953, "global_step": 130193, "epoch": 1075} {"train_loss": -38.2209358215332, "global_step": 130194, "epoch": 1075} {"train_loss": -38.41268561497208, "global_step": 130195, "epoch": 1075, "val_loss": 2729861.0} {"train_loss": -38.01721954345703, "global_step": 130196, "epoch": 1076} {"train_loss": -39.07753372192383, "global_step": 130197, "epoch": 1076} {"train_loss": -37.102508544921875, "global_step": 130198, "epoch": 1076} {"train_loss": -37.143699645996094, "global_step": 130199, "epoch": 1076} {"train_loss": -37.53887939453125, "global_step": 130200, "epoch": 1076} {"train_loss": -38.88264083862305, "global_step": 130201, "epoch": 1076} {"train_loss": -36.694522857666016, "global_step": 130202, "epoch": 1076} {"train_loss": -38.50701904296875, "global_step": 130203, "epoch": 1076} {"train_loss": -35.03243637084961, "global_step": 130204, "epoch": 1076} {"train_loss": -36.72883987426758, "global_step": 130205, "epoch": 1076} {"train_loss": -38.12975311279297, "global_step": 130206, "epoch": 1076} {"train_loss": -37.54901885986328, "global_step": 130207, "epoch": 1076} {"train_loss": -37.95228958129883, "global_step": 130208, "epoch": 1076} {"train_loss": -38.86582946777344, "global_step": 130209, "epoch": 1076} {"train_loss": -36.43982696533203, "global_step": 130210, "epoch": 1076} {"train_loss": -36.72140884399414, "global_step": 130211, "epoch": 1076} {"train_loss": -37.77048873901367, "global_step": 130212, "epoch": 1076} {"train_loss": -37.21828079223633, "global_step": 130213, "epoch": 1076} {"train_loss": -37.6092529296875, "global_step": 130214, "epoch": 1076} {"train_loss": -35.70418930053711, "global_step": 130215, "epoch": 1076} {"train_loss": -36.82883834838867, "global_step": 130216, "epoch": 1076} {"train_loss": -37.66445541381836, "global_step": 130217, "epoch": 1076} {"train_loss": -38.51127243041992, "global_step": 130218, "epoch": 1076} {"train_loss": -38.3229866027832, "global_step": 130219, "epoch": 1076} {"train_loss": -37.34284210205078, "global_step": 130220, "epoch": 1076} {"train_loss": -38.41401290893555, "global_step": 130221, "epoch": 1076} {"train_loss": -37.441829681396484, "global_step": 130222, "epoch": 1076} {"train_loss": -34.3840217590332, "global_step": 130223, "epoch": 1076} {"train_loss": -37.14390182495117, "global_step": 130224, "epoch": 1076} {"train_loss": -37.9177360534668, "global_step": 130225, "epoch": 1076} {"train_loss": -38.5002326965332, "global_step": 130226, "epoch": 1076} {"train_loss": -37.32198715209961, "global_step": 130227, "epoch": 1076} {"train_loss": -36.18778991699219, "global_step": 130228, "epoch": 1076} {"train_loss": -38.02802276611328, "global_step": 130229, "epoch": 1076} {"train_loss": -37.235755920410156, "global_step": 130230, "epoch": 1076} {"train_loss": -36.70718765258789, "global_step": 130231, "epoch": 1076} {"train_loss": -37.806827545166016, "global_step": 130232, "epoch": 1076} {"train_loss": -38.8631591796875, "global_step": 130233, "epoch": 1076} {"train_loss": -37.4084587097168, "global_step": 130234, "epoch": 1076} {"train_loss": -37.6522216796875, "global_step": 130235, "epoch": 1076} {"train_loss": -38.57746505737305, "global_step": 130236, "epoch": 1076} {"train_loss": -37.975006103515625, "global_step": 130237, "epoch": 1076} {"train_loss": -38.33945083618164, "global_step": 130238, "epoch": 1076} {"train_loss": -37.95766830444336, "global_step": 130239, "epoch": 1076} {"train_loss": -37.17464828491211, "global_step": 130240, "epoch": 1076} {"train_loss": -38.225406646728516, "global_step": 130241, "epoch": 1076} {"train_loss": -36.61246109008789, "global_step": 130242, "epoch": 1076} {"train_loss": -37.8033447265625, "global_step": 130243, "epoch": 1076} {"train_loss": -37.56288528442383, "global_step": 130244, "epoch": 1076} {"train_loss": -36.764339447021484, "global_step": 130245, "epoch": 1076} {"train_loss": -37.68024826049805, "global_step": 130246, "epoch": 1076} {"train_loss": -37.56757354736328, "global_step": 130247, "epoch": 1076} {"train_loss": -38.113494873046875, "global_step": 130248, "epoch": 1076} {"train_loss": -37.31757736206055, "global_step": 130249, "epoch": 1076} {"train_loss": -38.19111251831055, "global_step": 130250, "epoch": 1076} {"train_loss": -37.714599609375, "global_step": 130251, "epoch": 1076} {"train_loss": -37.68507766723633, "global_step": 130252, "epoch": 1076} {"train_loss": -38.225826263427734, "global_step": 130253, "epoch": 1076} {"train_loss": -36.780555725097656, "global_step": 130254, "epoch": 1076} {"train_loss": -38.64404296875, "global_step": 130255, "epoch": 1076} {"train_loss": -38.40532302856445, "global_step": 130256, "epoch": 1076} {"train_loss": -38.470943450927734, "global_step": 130257, "epoch": 1076} {"train_loss": -38.1113166809082, "global_step": 130258, "epoch": 1076} {"train_loss": -38.09324264526367, "global_step": 130259, "epoch": 1076} {"train_loss": -38.24723815917969, "global_step": 130260, "epoch": 1076} {"train_loss": -38.552547454833984, "global_step": 130261, "epoch": 1076} {"train_loss": -37.58366012573242, "global_step": 130262, "epoch": 1076} {"train_loss": -38.3814811706543, "global_step": 130263, "epoch": 1076} {"train_loss": -38.25531005859375, "global_step": 130264, "epoch": 1076} {"train_loss": -38.776302337646484, "global_step": 130265, "epoch": 1076} {"train_loss": -38.38140106201172, "global_step": 130266, "epoch": 1076} {"train_loss": -38.86432647705078, "global_step": 130267, "epoch": 1076} {"train_loss": -39.0461311340332, "global_step": 130268, "epoch": 1076} {"train_loss": -38.27729797363281, "global_step": 130269, "epoch": 1076} {"train_loss": -37.28940200805664, "global_step": 130270, "epoch": 1076} {"train_loss": -38.58039474487305, "global_step": 130271, "epoch": 1076} {"train_loss": -36.38795471191406, "global_step": 130272, "epoch": 1076} {"train_loss": -37.421791076660156, "global_step": 130273, "epoch": 1076} {"train_loss": -38.215797424316406, "global_step": 130274, "epoch": 1076} {"train_loss": -38.672332763671875, "global_step": 130275, "epoch": 1076} {"train_loss": -39.3737907409668, "global_step": 130276, "epoch": 1076} {"train_loss": -37.928253173828125, "global_step": 130277, "epoch": 1076} {"train_loss": -38.853736877441406, "global_step": 130278, "epoch": 1076} {"train_loss": -38.446693420410156, "global_step": 130279, "epoch": 1076} {"train_loss": -38.92246627807617, "global_step": 130280, "epoch": 1076} {"train_loss": -38.85726547241211, "global_step": 130281, "epoch": 1076} {"train_loss": -39.64723587036133, "global_step": 130282, "epoch": 1076} {"train_loss": -38.59567642211914, "global_step": 130283, "epoch": 1076} {"train_loss": -38.8810920715332, "global_step": 130284, "epoch": 1076} {"train_loss": -38.88576889038086, "global_step": 130285, "epoch": 1076} {"train_loss": -38.67414093017578, "global_step": 130286, "epoch": 1076} {"train_loss": -38.39536666870117, "global_step": 130287, "epoch": 1076} {"train_loss": -38.72657775878906, "global_step": 130288, "epoch": 1076} {"train_loss": -39.26516342163086, "global_step": 130289, "epoch": 1076} {"train_loss": -39.078948974609375, "global_step": 130290, "epoch": 1076} {"train_loss": -38.06016540527344, "global_step": 130291, "epoch": 1076} {"train_loss": -36.705013275146484, "global_step": 130292, "epoch": 1076} {"train_loss": -38.48191452026367, "global_step": 130293, "epoch": 1076} {"train_loss": -39.19184494018555, "global_step": 130294, "epoch": 1076} {"train_loss": -38.020111083984375, "global_step": 130295, "epoch": 1076} {"train_loss": -36.998165130615234, "global_step": 130296, "epoch": 1076} {"train_loss": -38.41877746582031, "global_step": 130297, "epoch": 1076} {"train_loss": -38.50883102416992, "global_step": 130298, "epoch": 1076} {"train_loss": -37.3390007019043, "global_step": 130299, "epoch": 1076} {"train_loss": -38.405635833740234, "global_step": 130300, "epoch": 1076} {"train_loss": -38.34886169433594, "global_step": 130301, "epoch": 1076} {"train_loss": -38.3328971862793, "global_step": 130302, "epoch": 1076} {"train_loss": -35.740089416503906, "global_step": 130303, "epoch": 1076} {"train_loss": -36.65302658081055, "global_step": 130304, "epoch": 1076} {"train_loss": -38.58315658569336, "global_step": 130305, "epoch": 1076} {"train_loss": -36.12742233276367, "global_step": 130306, "epoch": 1076} {"train_loss": -37.317832946777344, "global_step": 130307, "epoch": 1076} {"train_loss": -37.8275146484375, "global_step": 130308, "epoch": 1076} {"train_loss": -37.333961486816406, "global_step": 130309, "epoch": 1076} {"train_loss": -37.1667366027832, "global_step": 130310, "epoch": 1076} {"train_loss": -36.672706604003906, "global_step": 130311, "epoch": 1076} {"train_loss": -38.578495025634766, "global_step": 130312, "epoch": 1076} {"train_loss": -37.66252517700195, "global_step": 130313, "epoch": 1076} {"train_loss": -38.151241302490234, "global_step": 130314, "epoch": 1076} {"train_loss": -37.031715393066406, "global_step": 130315, "epoch": 1076} {"train_loss": -37.84938777576793, "global_step": 130316, "epoch": 1076, "val_loss": 2658111.25} {"train_loss": -38.135894775390625, "global_step": 130317, "epoch": 1077} {"train_loss": -38.680213928222656, "global_step": 130318, "epoch": 1077} {"train_loss": -37.473201751708984, "global_step": 130319, "epoch": 1077} {"train_loss": -38.93490219116211, "global_step": 130320, "epoch": 1077} {"train_loss": -38.67443084716797, "global_step": 130321, "epoch": 1077} {"train_loss": -38.74453353881836, "global_step": 130322, "epoch": 1077} {"train_loss": -38.96195602416992, "global_step": 130323, "epoch": 1077} {"train_loss": -38.86184310913086, "global_step": 130324, "epoch": 1077} {"train_loss": -39.037872314453125, "global_step": 130325, "epoch": 1077} {"train_loss": -38.51591110229492, "global_step": 130326, "epoch": 1077} {"train_loss": -38.98112106323242, "global_step": 130327, "epoch": 1077} {"train_loss": -39.08449172973633, "global_step": 130328, "epoch": 1077} {"train_loss": -39.2679443359375, "global_step": 130329, "epoch": 1077} {"train_loss": -38.39643096923828, "global_step": 130330, "epoch": 1077} {"train_loss": -39.41108322143555, "global_step": 130331, "epoch": 1077} {"train_loss": -39.39495849609375, "global_step": 130332, "epoch": 1077} {"train_loss": -39.42965316772461, "global_step": 130333, "epoch": 1077} {"train_loss": -38.97692108154297, "global_step": 130334, "epoch": 1077} {"train_loss": -39.31818771362305, "global_step": 130335, "epoch": 1077} {"train_loss": -38.79631042480469, "global_step": 130336, "epoch": 1077} {"train_loss": -39.34060287475586, "global_step": 130337, "epoch": 1077} {"train_loss": -38.974884033203125, "global_step": 130338, "epoch": 1077} {"train_loss": -39.009395599365234, "global_step": 130339, "epoch": 1077} {"train_loss": -38.89302444458008, "global_step": 130340, "epoch": 1077} {"train_loss": -38.46564483642578, "global_step": 130341, "epoch": 1077} {"train_loss": -39.4140739440918, "global_step": 130342, "epoch": 1077} {"train_loss": -37.714866638183594, "global_step": 130343, "epoch": 1077} {"train_loss": -38.11119079589844, "global_step": 130344, "epoch": 1077} {"train_loss": -38.529544830322266, "global_step": 130345, "epoch": 1077} {"train_loss": -39.855438232421875, "global_step": 130346, "epoch": 1077} {"train_loss": -39.15138626098633, "global_step": 130347, "epoch": 1077} {"train_loss": -39.38993453979492, "global_step": 130348, "epoch": 1077} {"train_loss": -39.35508346557617, "global_step": 130349, "epoch": 1077} {"train_loss": -40.08510971069336, "global_step": 130350, "epoch": 1077} {"train_loss": -39.169349670410156, "global_step": 130351, "epoch": 1077} {"train_loss": -38.38092041015625, "global_step": 130352, "epoch": 1077} {"train_loss": -39.15472412109375, "global_step": 130353, "epoch": 1077} {"train_loss": -39.94571304321289, "global_step": 130354, "epoch": 1077} {"train_loss": -39.21900177001953, "global_step": 130355, "epoch": 1077} {"train_loss": -38.287940979003906, "global_step": 130356, "epoch": 1077} {"train_loss": -37.847023010253906, "global_step": 130357, "epoch": 1077} {"train_loss": -38.81647872924805, "global_step": 130358, "epoch": 1077} {"train_loss": -38.765079498291016, "global_step": 130359, "epoch": 1077} {"train_loss": -38.45033645629883, "global_step": 130360, "epoch": 1077} {"train_loss": -37.605323791503906, "global_step": 130361, "epoch": 1077} {"train_loss": -38.423057556152344, "global_step": 130362, "epoch": 1077} {"train_loss": -38.26038360595703, "global_step": 130363, "epoch": 1077} {"train_loss": -35.25448226928711, "global_step": 130364, "epoch": 1077} {"train_loss": -33.388423919677734, "global_step": 130365, "epoch": 1077} {"train_loss": -27.6884765625, "global_step": 130366, "epoch": 1077} {"train_loss": -32.499237060546875, "global_step": 130367, "epoch": 1077} {"train_loss": -38.14896774291992, "global_step": 130368, "epoch": 1077} {"train_loss": -37.5372200012207, "global_step": 130369, "epoch": 1077} {"train_loss": -35.8060417175293, "global_step": 130370, "epoch": 1077} {"train_loss": -37.61788558959961, "global_step": 130371, "epoch": 1077} {"train_loss": -38.39362716674805, "global_step": 130372, "epoch": 1077} {"train_loss": -38.51051712036133, "global_step": 130373, "epoch": 1077} {"train_loss": -36.80607986450195, "global_step": 130374, "epoch": 1077} {"train_loss": -38.20774841308594, "global_step": 130375, "epoch": 1077} {"train_loss": -37.86716842651367, "global_step": 130376, "epoch": 1077} {"train_loss": -36.666053771972656, "global_step": 130377, "epoch": 1077} {"train_loss": -38.8526611328125, "global_step": 130378, "epoch": 1077} {"train_loss": -37.52702713012695, "global_step": 130379, "epoch": 1077} {"train_loss": -38.95147705078125, "global_step": 130380, "epoch": 1077} {"train_loss": -38.09511184692383, "global_step": 130381, "epoch": 1077} {"train_loss": -38.830055236816406, "global_step": 130382, "epoch": 1077} {"train_loss": -37.39301681518555, "global_step": 130383, "epoch": 1077} {"train_loss": -38.97218322753906, "global_step": 130384, "epoch": 1077} {"train_loss": -39.1228141784668, "global_step": 130385, "epoch": 1077} {"train_loss": -39.340850830078125, "global_step": 130386, "epoch": 1077} {"train_loss": -39.828948974609375, "global_step": 130387, "epoch": 1077} {"train_loss": -39.421390533447266, "global_step": 130388, "epoch": 1077} {"train_loss": -39.528018951416016, "global_step": 130389, "epoch": 1077} {"train_loss": -39.40167999267578, "global_step": 130390, "epoch": 1077} {"train_loss": -39.36634826660156, "global_step": 130391, "epoch": 1077} {"train_loss": -39.76400375366211, "global_step": 130392, "epoch": 1077} {"train_loss": -39.59908676147461, "global_step": 130393, "epoch": 1077} {"train_loss": -39.3641471862793, "global_step": 130394, "epoch": 1077} {"train_loss": -38.02932357788086, "global_step": 130395, "epoch": 1077} {"train_loss": -39.64069747924805, "global_step": 130396, "epoch": 1077} {"train_loss": -39.4722785949707, "global_step": 130397, "epoch": 1077} {"train_loss": -39.83552932739258, "global_step": 130398, "epoch": 1077} {"train_loss": -39.88375473022461, "global_step": 130399, "epoch": 1077} {"train_loss": -39.75515365600586, "global_step": 130400, "epoch": 1077} {"train_loss": -39.13389205932617, "global_step": 130401, "epoch": 1077} {"train_loss": -39.739776611328125, "global_step": 130402, "epoch": 1077} {"train_loss": -39.849159240722656, "global_step": 130403, "epoch": 1077} {"train_loss": -39.44990921020508, "global_step": 130404, "epoch": 1077} {"train_loss": -40.354923248291016, "global_step": 130405, "epoch": 1077} {"train_loss": -39.984352111816406, "global_step": 130406, "epoch": 1077} {"train_loss": -39.7010383605957, "global_step": 130407, "epoch": 1077} {"train_loss": -39.95037078857422, "global_step": 130408, "epoch": 1077} {"train_loss": -40.34904098510742, "global_step": 130409, "epoch": 1077} {"train_loss": -39.6993293762207, "global_step": 130410, "epoch": 1077} {"train_loss": -40.366973876953125, "global_step": 130411, "epoch": 1077} {"train_loss": -40.37691116333008, "global_step": 130412, "epoch": 1077} {"train_loss": -40.3205451965332, "global_step": 130413, "epoch": 1077} {"train_loss": -39.98316192626953, "global_step": 130414, "epoch": 1077} {"train_loss": -39.33759689331055, "global_step": 130415, "epoch": 1077} {"train_loss": -39.964656829833984, "global_step": 130416, "epoch": 1077} {"train_loss": -39.85139465332031, "global_step": 130417, "epoch": 1077} {"train_loss": -40.19082260131836, "global_step": 130418, "epoch": 1077} {"train_loss": -39.7351188659668, "global_step": 130419, "epoch": 1077} {"train_loss": -38.24988555908203, "global_step": 130420, "epoch": 1077} {"train_loss": -39.00529098510742, "global_step": 130421, "epoch": 1077} {"train_loss": -40.234718322753906, "global_step": 130422, "epoch": 1077} {"train_loss": -39.80836486816406, "global_step": 130423, "epoch": 1077} {"train_loss": -39.414146423339844, "global_step": 130424, "epoch": 1077} {"train_loss": -38.26961898803711, "global_step": 130425, "epoch": 1077} {"train_loss": -39.963417053222656, "global_step": 130426, "epoch": 1077} {"train_loss": -37.68696975708008, "global_step": 130427, "epoch": 1077} {"train_loss": -39.88608932495117, "global_step": 130428, "epoch": 1077} {"train_loss": -39.019954681396484, "global_step": 130429, "epoch": 1077} {"train_loss": -35.60365295410156, "global_step": 130430, "epoch": 1077} {"train_loss": -39.742713928222656, "global_step": 130431, "epoch": 1077} {"train_loss": -36.19528579711914, "global_step": 130432, "epoch": 1077} {"train_loss": -34.498329162597656, "global_step": 130433, "epoch": 1077} {"train_loss": -38.23126983642578, "global_step": 130434, "epoch": 1077} {"train_loss": -37.98342514038086, "global_step": 130435, "epoch": 1077} {"train_loss": -36.82585144042969, "global_step": 130436, "epoch": 1077} {"train_loss": -38.65893759609254, "global_step": 130437, "epoch": 1077, "val_loss": 2724609.0} {"train_loss": -38.31356430053711, "global_step": 130438, "epoch": 1078} {"train_loss": -37.629310607910156, "global_step": 130439, "epoch": 1078} {"train_loss": -37.82744216918945, "global_step": 130440, "epoch": 1078} {"train_loss": -33.23617935180664, "global_step": 130441, "epoch": 1078} {"train_loss": -37.038997650146484, "global_step": 130442, "epoch": 1078} {"train_loss": -37.78620147705078, "global_step": 130443, "epoch": 1078} {"train_loss": -35.965755462646484, "global_step": 130444, "epoch": 1078} {"train_loss": -31.132705688476562, "global_step": 130445, "epoch": 1078} {"train_loss": -38.04977035522461, "global_step": 130446, "epoch": 1078} {"train_loss": -31.9793701171875, "global_step": 130447, "epoch": 1078} {"train_loss": -34.73386764526367, "global_step": 130448, "epoch": 1078} {"train_loss": -33.386558532714844, "global_step": 130449, "epoch": 1078} {"train_loss": -33.881256103515625, "global_step": 130450, "epoch": 1078} {"train_loss": -36.82883834838867, "global_step": 130451, "epoch": 1078} {"train_loss": -37.83326721191406, "global_step": 130452, "epoch": 1078} {"train_loss": -35.97272491455078, "global_step": 130453, "epoch": 1078} {"train_loss": -37.5568962097168, "global_step": 130454, "epoch": 1078} {"train_loss": -36.81218719482422, "global_step": 130455, "epoch": 1078} {"train_loss": -35.474971771240234, "global_step": 130456, "epoch": 1078} {"train_loss": -36.2474479675293, "global_step": 130457, "epoch": 1078} {"train_loss": -37.22616195678711, "global_step": 130458, "epoch": 1078} {"train_loss": -37.358367919921875, "global_step": 130459, "epoch": 1078} {"train_loss": -35.86988067626953, "global_step": 130460, "epoch": 1078} {"train_loss": -35.83607864379883, "global_step": 130461, "epoch": 1078} {"train_loss": -35.899715423583984, "global_step": 130462, "epoch": 1078} {"train_loss": -37.30418014526367, "global_step": 130463, "epoch": 1078} {"train_loss": -36.919532775878906, "global_step": 130464, "epoch": 1078} {"train_loss": -36.7033805847168, "global_step": 130465, "epoch": 1078} {"train_loss": -36.963069915771484, "global_step": 130466, "epoch": 1078} {"train_loss": -37.03438949584961, "global_step": 130467, "epoch": 1078} {"train_loss": -37.23313522338867, "global_step": 130468, "epoch": 1078} {"train_loss": -37.52862548828125, "global_step": 130469, "epoch": 1078} {"train_loss": -36.47368621826172, "global_step": 130470, "epoch": 1078} {"train_loss": -37.38448715209961, "global_step": 130471, "epoch": 1078} {"train_loss": -37.83831787109375, "global_step": 130472, "epoch": 1078} {"train_loss": -37.89399719238281, "global_step": 130473, "epoch": 1078} {"train_loss": -37.62165832519531, "global_step": 130474, "epoch": 1078} {"train_loss": -37.15406036376953, "global_step": 130475, "epoch": 1078} {"train_loss": -37.474708557128906, "global_step": 130476, "epoch": 1078} {"train_loss": -38.01570510864258, "global_step": 130477, "epoch": 1078} {"train_loss": -38.01328659057617, "global_step": 130478, "epoch": 1078} {"train_loss": -37.118804931640625, "global_step": 130479, "epoch": 1078} {"train_loss": -38.26508712768555, "global_step": 130480, "epoch": 1078} {"train_loss": -38.12554931640625, "global_step": 130481, "epoch": 1078} {"train_loss": -38.56110382080078, "global_step": 130482, "epoch": 1078} {"train_loss": -38.582855224609375, "global_step": 130483, "epoch": 1078} {"train_loss": -36.99055862426758, "global_step": 130484, "epoch": 1078} {"train_loss": -38.6317138671875, "global_step": 130485, "epoch": 1078} {"train_loss": -38.2579460144043, "global_step": 130486, "epoch": 1078} {"train_loss": -38.19588851928711, "global_step": 130487, "epoch": 1078} {"train_loss": -38.81258773803711, "global_step": 130488, "epoch": 1078} {"train_loss": -38.92818069458008, "global_step": 130489, "epoch": 1078} {"train_loss": -37.955928802490234, "global_step": 130490, "epoch": 1078} {"train_loss": -38.683509826660156, "global_step": 130491, "epoch": 1078} {"train_loss": -38.78664779663086, "global_step": 130492, "epoch": 1078} {"train_loss": -38.58051681518555, "global_step": 130493, "epoch": 1078} {"train_loss": -38.502498626708984, "global_step": 130494, "epoch": 1078} {"train_loss": -38.54352951049805, "global_step": 130495, "epoch": 1078} {"train_loss": -39.03561019897461, "global_step": 130496, "epoch": 1078} {"train_loss": -39.132598876953125, "global_step": 130497, "epoch": 1078} {"train_loss": -38.65562057495117, "global_step": 130498, "epoch": 1078} {"train_loss": -38.84214401245117, "global_step": 130499, "epoch": 1078} {"train_loss": -38.775550842285156, "global_step": 130500, "epoch": 1078} {"train_loss": -39.48558807373047, "global_step": 130501, "epoch": 1078} {"train_loss": -39.11948776245117, "global_step": 130502, "epoch": 1078} {"train_loss": -38.66053771972656, "global_step": 130503, "epoch": 1078} {"train_loss": -39.663570404052734, "global_step": 130504, "epoch": 1078} {"train_loss": -39.04783630371094, "global_step": 130505, "epoch": 1078} {"train_loss": -39.03300476074219, "global_step": 130506, "epoch": 1078} {"train_loss": -39.30259704589844, "global_step": 130507, "epoch": 1078} {"train_loss": -39.5201301574707, "global_step": 130508, "epoch": 1078} {"train_loss": -39.43525314331055, "global_step": 130509, "epoch": 1078} {"train_loss": -39.67694854736328, "global_step": 130510, "epoch": 1078} {"train_loss": -39.0914306640625, "global_step": 130511, "epoch": 1078} {"train_loss": -39.6069221496582, "global_step": 130512, "epoch": 1078} {"train_loss": -39.13274383544922, "global_step": 130513, "epoch": 1078} {"train_loss": -39.734214782714844, "global_step": 130514, "epoch": 1078} {"train_loss": -39.57655715942383, "global_step": 130515, "epoch": 1078} {"train_loss": -39.34395217895508, "global_step": 130516, "epoch": 1078} {"train_loss": -39.861061096191406, "global_step": 130517, "epoch": 1078} {"train_loss": -40.04887008666992, "global_step": 130518, "epoch": 1078} {"train_loss": -39.76691818237305, "global_step": 130519, "epoch": 1078} {"train_loss": -39.69813919067383, "global_step": 130520, "epoch": 1078} {"train_loss": -39.75324249267578, "global_step": 130521, "epoch": 1078} {"train_loss": -39.66144561767578, "global_step": 130522, "epoch": 1078} {"train_loss": -39.827171325683594, "global_step": 130523, "epoch": 1078} {"train_loss": -39.06928634643555, "global_step": 130524, "epoch": 1078} {"train_loss": -39.438140869140625, "global_step": 130525, "epoch": 1078} {"train_loss": -40.06639862060547, "global_step": 130526, "epoch": 1078} {"train_loss": -39.67197036743164, "global_step": 130527, "epoch": 1078} {"train_loss": -38.78805160522461, "global_step": 130528, "epoch": 1078} {"train_loss": -39.1842155456543, "global_step": 130529, "epoch": 1078} {"train_loss": -37.791595458984375, "global_step": 130530, "epoch": 1078} {"train_loss": -39.184329986572266, "global_step": 130531, "epoch": 1078} {"train_loss": -38.7030143737793, "global_step": 130532, "epoch": 1078} {"train_loss": -39.428524017333984, "global_step": 130533, "epoch": 1078} {"train_loss": -39.107112884521484, "global_step": 130534, "epoch": 1078} {"train_loss": -37.4150505065918, "global_step": 130535, "epoch": 1078} {"train_loss": -36.324981689453125, "global_step": 130536, "epoch": 1078} {"train_loss": -33.92123794555664, "global_step": 130537, "epoch": 1078} {"train_loss": -33.74510192871094, "global_step": 130538, "epoch": 1078} {"train_loss": -34.176422119140625, "global_step": 130539, "epoch": 1078} {"train_loss": -38.05693435668945, "global_step": 130540, "epoch": 1078} {"train_loss": -38.5316276550293, "global_step": 130541, "epoch": 1078} {"train_loss": -38.238399505615234, "global_step": 130542, "epoch": 1078} {"train_loss": -37.65238571166992, "global_step": 130543, "epoch": 1078} {"train_loss": -38.098358154296875, "global_step": 130544, "epoch": 1078} {"train_loss": -38.10299301147461, "global_step": 130545, "epoch": 1078} {"train_loss": -39.94451904296875, "global_step": 130546, "epoch": 1078} {"train_loss": -37.461856842041016, "global_step": 130547, "epoch": 1078} {"train_loss": -39.189117431640625, "global_step": 130548, "epoch": 1078} {"train_loss": -38.01871871948242, "global_step": 130549, "epoch": 1078} {"train_loss": -38.699432373046875, "global_step": 130550, "epoch": 1078} {"train_loss": -38.11480712890625, "global_step": 130551, "epoch": 1078} {"train_loss": -38.875572204589844, "global_step": 130552, "epoch": 1078} {"train_loss": -39.15134048461914, "global_step": 130553, "epoch": 1078} {"train_loss": -39.48891067504883, "global_step": 130554, "epoch": 1078} {"train_loss": -39.16243362426758, "global_step": 130555, "epoch": 1078} {"train_loss": -39.41386032104492, "global_step": 130556, "epoch": 1078} {"train_loss": -39.31246566772461, "global_step": 130557, "epoch": 1078} {"train_loss": -37.949822008117174, "global_step": 130558, "epoch": 1078, "val_loss": 2638517.0} {"train_loss": -39.26996994018555, "global_step": 130559, "epoch": 1079} {"train_loss": -39.60494613647461, "global_step": 130560, "epoch": 1079} {"train_loss": -39.41660690307617, "global_step": 130561, "epoch": 1079} {"train_loss": -39.98418426513672, "global_step": 130562, "epoch": 1079} {"train_loss": -38.64035415649414, "global_step": 130563, "epoch": 1079} {"train_loss": -39.20746994018555, "global_step": 130564, "epoch": 1079} {"train_loss": -38.45289993286133, "global_step": 130565, "epoch": 1079} {"train_loss": -39.690399169921875, "global_step": 130566, "epoch": 1079} {"train_loss": -39.7421760559082, "global_step": 130567, "epoch": 1079} {"train_loss": -38.41434860229492, "global_step": 130568, "epoch": 1079} {"train_loss": -38.599571228027344, "global_step": 130569, "epoch": 1079} {"train_loss": -39.03716278076172, "global_step": 130570, "epoch": 1079} {"train_loss": -38.94696044921875, "global_step": 130571, "epoch": 1079} {"train_loss": -39.06895065307617, "global_step": 130572, "epoch": 1079} {"train_loss": -37.732666015625, "global_step": 130573, "epoch": 1079} {"train_loss": -39.048316955566406, "global_step": 130574, "epoch": 1079} {"train_loss": -38.460514068603516, "global_step": 130575, "epoch": 1079} {"train_loss": -37.88734817504883, "global_step": 130576, "epoch": 1079} {"train_loss": -38.43108367919922, "global_step": 130577, "epoch": 1079} {"train_loss": -39.14254379272461, "global_step": 130578, "epoch": 1079} {"train_loss": -38.815818786621094, "global_step": 130579, "epoch": 1079} {"train_loss": -39.118682861328125, "global_step": 130580, "epoch": 1079} {"train_loss": -38.890380859375, "global_step": 130581, "epoch": 1079} {"train_loss": -38.79328536987305, "global_step": 130582, "epoch": 1079} {"train_loss": -39.453392028808594, "global_step": 130583, "epoch": 1079} {"train_loss": -38.02217483520508, "global_step": 130584, "epoch": 1079} {"train_loss": -38.64575958251953, "global_step": 130585, "epoch": 1079} {"train_loss": -38.99289321899414, "global_step": 130586, "epoch": 1079} {"train_loss": -38.960723876953125, "global_step": 130587, "epoch": 1079} {"train_loss": -38.784122467041016, "global_step": 130588, "epoch": 1079} {"train_loss": -37.708282470703125, "global_step": 130589, "epoch": 1079} {"train_loss": -38.425655364990234, "global_step": 130590, "epoch": 1079} {"train_loss": -37.49701690673828, "global_step": 130591, "epoch": 1079} {"train_loss": -38.600032806396484, "global_step": 130592, "epoch": 1079} {"train_loss": -38.94734573364258, "global_step": 130593, "epoch": 1079} {"train_loss": -37.9019889831543, "global_step": 130594, "epoch": 1079} {"train_loss": -38.525550842285156, "global_step": 130595, "epoch": 1079} {"train_loss": -38.2513313293457, "global_step": 130596, "epoch": 1079} {"train_loss": -38.99717712402344, "global_step": 130597, "epoch": 1079} {"train_loss": -37.891963958740234, "global_step": 130598, "epoch": 1079} {"train_loss": -38.360755920410156, "global_step": 130599, "epoch": 1079} {"train_loss": -37.3486442565918, "global_step": 130600, "epoch": 1079} {"train_loss": -37.28329086303711, "global_step": 130601, "epoch": 1079} {"train_loss": -38.27368927001953, "global_step": 130602, "epoch": 1079} {"train_loss": -38.107696533203125, "global_step": 130603, "epoch": 1079} {"train_loss": -38.21512222290039, "global_step": 130604, "epoch": 1079} {"train_loss": -37.71247482299805, "global_step": 130605, "epoch": 1079} {"train_loss": -39.018218994140625, "global_step": 130606, "epoch": 1079} {"train_loss": -37.1645622253418, "global_step": 130607, "epoch": 1079} {"train_loss": -38.98228073120117, "global_step": 130608, "epoch": 1079} {"train_loss": -38.96322250366211, "global_step": 130609, "epoch": 1079} {"train_loss": -38.801029205322266, "global_step": 130610, "epoch": 1079} {"train_loss": -38.46047592163086, "global_step": 130611, "epoch": 1079} {"train_loss": -39.76179504394531, "global_step": 130612, "epoch": 1079} {"train_loss": -38.93404769897461, "global_step": 130613, "epoch": 1079} {"train_loss": -39.463226318359375, "global_step": 130614, "epoch": 1079} {"train_loss": -39.37068176269531, "global_step": 130615, "epoch": 1079} {"train_loss": -39.41514205932617, "global_step": 130616, "epoch": 1079} {"train_loss": -39.3793830871582, "global_step": 130617, "epoch": 1079} {"train_loss": -39.5257682800293, "global_step": 130618, "epoch": 1079} {"train_loss": -39.15631866455078, "global_step": 130619, "epoch": 1079} {"train_loss": -38.35158920288086, "global_step": 130620, "epoch": 1079} {"train_loss": -38.33980941772461, "global_step": 130621, "epoch": 1079} {"train_loss": -39.488643646240234, "global_step": 130622, "epoch": 1079} {"train_loss": -38.90308380126953, "global_step": 130623, "epoch": 1079} {"train_loss": -37.75128936767578, "global_step": 130624, "epoch": 1079} {"train_loss": -38.349979400634766, "global_step": 130625, "epoch": 1079} {"train_loss": -39.495391845703125, "global_step": 130626, "epoch": 1079} {"train_loss": -38.6477165222168, "global_step": 130627, "epoch": 1079} {"train_loss": -38.534263610839844, "global_step": 130628, "epoch": 1079} {"train_loss": -38.4615364074707, "global_step": 130629, "epoch": 1079} {"train_loss": -39.35908508300781, "global_step": 130630, "epoch": 1079} {"train_loss": -39.75473403930664, "global_step": 130631, "epoch": 1079} {"train_loss": -39.19953155517578, "global_step": 130632, "epoch": 1079} {"train_loss": -39.583717346191406, "global_step": 130633, "epoch": 1079} {"train_loss": -39.11985397338867, "global_step": 130634, "epoch": 1079} {"train_loss": -39.01389694213867, "global_step": 130635, "epoch": 1079} {"train_loss": -38.59231185913086, "global_step": 130636, "epoch": 1079} {"train_loss": -39.796390533447266, "global_step": 130637, "epoch": 1079} {"train_loss": -39.574790954589844, "global_step": 130638, "epoch": 1079} {"train_loss": -38.69832992553711, "global_step": 130639, "epoch": 1079} {"train_loss": -39.32481002807617, "global_step": 130640, "epoch": 1079} {"train_loss": -40.366085052490234, "global_step": 130641, "epoch": 1079} {"train_loss": -38.564369201660156, "global_step": 130642, "epoch": 1079} {"train_loss": -39.12568283081055, "global_step": 130643, "epoch": 1079} {"train_loss": -39.806053161621094, "global_step": 130644, "epoch": 1079} {"train_loss": -38.97241973876953, "global_step": 130645, "epoch": 1079} {"train_loss": -38.50452423095703, "global_step": 130646, "epoch": 1079} {"train_loss": -39.63119125366211, "global_step": 130647, "epoch": 1079} {"train_loss": -40.06087875366211, "global_step": 130648, "epoch": 1079} {"train_loss": -38.09733963012695, "global_step": 130649, "epoch": 1079} {"train_loss": -39.16848373413086, "global_step": 130650, "epoch": 1079} {"train_loss": -39.0384407043457, "global_step": 130651, "epoch": 1079} {"train_loss": -39.17496871948242, "global_step": 130652, "epoch": 1079} {"train_loss": -38.54765701293945, "global_step": 130653, "epoch": 1079} {"train_loss": -39.53229522705078, "global_step": 130654, "epoch": 1079} {"train_loss": -38.21940612792969, "global_step": 130655, "epoch": 1079} {"train_loss": -38.503597259521484, "global_step": 130656, "epoch": 1079} {"train_loss": -39.1229248046875, "global_step": 130657, "epoch": 1079} {"train_loss": -38.99876022338867, "global_step": 130658, "epoch": 1079} {"train_loss": -37.56246566772461, "global_step": 130659, "epoch": 1079} {"train_loss": -38.294219970703125, "global_step": 130660, "epoch": 1079} {"train_loss": -38.52180099487305, "global_step": 130661, "epoch": 1079} {"train_loss": -37.72495651245117, "global_step": 130662, "epoch": 1079} {"train_loss": -37.92313766479492, "global_step": 130663, "epoch": 1079} {"train_loss": -39.312294006347656, "global_step": 130664, "epoch": 1079} {"train_loss": -38.635986328125, "global_step": 130665, "epoch": 1079} {"train_loss": -36.655635833740234, "global_step": 130666, "epoch": 1079} {"train_loss": -39.06269454956055, "global_step": 130667, "epoch": 1079} {"train_loss": -36.84147262573242, "global_step": 130668, "epoch": 1079} {"train_loss": -38.26374053955078, "global_step": 130669, "epoch": 1079} {"train_loss": -39.49177551269531, "global_step": 130670, "epoch": 1079} {"train_loss": -38.8654899597168, "global_step": 130671, "epoch": 1079} {"train_loss": -39.36394119262695, "global_step": 130672, "epoch": 1079} {"train_loss": -38.959754943847656, "global_step": 130673, "epoch": 1079} {"train_loss": -38.7755126953125, "global_step": 130674, "epoch": 1079} {"train_loss": -39.37205123901367, "global_step": 130675, "epoch": 1079} {"train_loss": -39.222957611083984, "global_step": 130676, "epoch": 1079} {"train_loss": -39.431556701660156, "global_step": 130677, "epoch": 1079} {"train_loss": -38.77498245239258, "global_step": 130678, "epoch": 1079} {"train_loss": -38.79917469497555, "global_step": 130679, "epoch": 1079, "val_loss": 2618896.75} {"train_loss": -38.376976013183594, "global_step": 130680, "epoch": 1080} {"train_loss": -40.06340408325195, "global_step": 130681, "epoch": 1080} {"train_loss": -38.33583068847656, "global_step": 130682, "epoch": 1080} {"train_loss": -39.617733001708984, "global_step": 130683, "epoch": 1080} {"train_loss": -38.651424407958984, "global_step": 130684, "epoch": 1080} {"train_loss": -39.680320739746094, "global_step": 130685, "epoch": 1080} {"train_loss": -39.0601692199707, "global_step": 130686, "epoch": 1080} {"train_loss": -40.07344436645508, "global_step": 130687, "epoch": 1080} {"train_loss": -37.66130065917969, "global_step": 130688, "epoch": 1080} {"train_loss": -39.110111236572266, "global_step": 130689, "epoch": 1080} {"train_loss": -37.78769302368164, "global_step": 130690, "epoch": 1080} {"train_loss": -39.0055046081543, "global_step": 130691, "epoch": 1080} {"train_loss": -37.95858383178711, "global_step": 130692, "epoch": 1080} {"train_loss": -37.388309478759766, "global_step": 130693, "epoch": 1080} {"train_loss": -34.669185638427734, "global_step": 130694, "epoch": 1080} {"train_loss": -35.16898727416992, "global_step": 130695, "epoch": 1080} {"train_loss": -35.69989776611328, "global_step": 130696, "epoch": 1080} {"train_loss": -38.012786865234375, "global_step": 130697, "epoch": 1080} {"train_loss": -39.40631866455078, "global_step": 130698, "epoch": 1080} {"train_loss": -37.92378616333008, "global_step": 130699, "epoch": 1080} {"train_loss": -35.9312858581543, "global_step": 130700, "epoch": 1080} {"train_loss": -33.76250457763672, "global_step": 130701, "epoch": 1080} {"train_loss": -38.955963134765625, "global_step": 130702, "epoch": 1080} {"train_loss": -35.9456672668457, "global_step": 130703, "epoch": 1080} {"train_loss": -34.58621597290039, "global_step": 130704, "epoch": 1080} {"train_loss": -37.05704879760742, "global_step": 130705, "epoch": 1080} {"train_loss": -35.06760787963867, "global_step": 130706, "epoch": 1080} {"train_loss": -37.8455924987793, "global_step": 130707, "epoch": 1080} {"train_loss": -36.436336517333984, "global_step": 130708, "epoch": 1080} {"train_loss": -36.894447326660156, "global_step": 130709, "epoch": 1080} {"train_loss": -37.76681900024414, "global_step": 130710, "epoch": 1080} {"train_loss": -36.3998908996582, "global_step": 130711, "epoch": 1080} {"train_loss": -38.90928268432617, "global_step": 130712, "epoch": 1080} {"train_loss": -38.375762939453125, "global_step": 130713, "epoch": 1080} {"train_loss": -36.788997650146484, "global_step": 130714, "epoch": 1080} {"train_loss": -37.115943908691406, "global_step": 130715, "epoch": 1080} {"train_loss": -37.761932373046875, "global_step": 130716, "epoch": 1080} {"train_loss": -35.89508819580078, "global_step": 130717, "epoch": 1080} {"train_loss": -37.81482696533203, "global_step": 130718, "epoch": 1080} {"train_loss": -38.08883285522461, "global_step": 130719, "epoch": 1080} {"train_loss": -37.60687255859375, "global_step": 130720, "epoch": 1080} {"train_loss": -33.93144607543945, "global_step": 130721, "epoch": 1080} {"train_loss": -36.44765853881836, "global_step": 130722, "epoch": 1080} {"train_loss": -37.30318832397461, "global_step": 130723, "epoch": 1080} {"train_loss": -36.75880813598633, "global_step": 130724, "epoch": 1080} {"train_loss": -38.43134689331055, "global_step": 130725, "epoch": 1080} {"train_loss": -35.57642364501953, "global_step": 130726, "epoch": 1080} {"train_loss": -35.42931365966797, "global_step": 130727, "epoch": 1080} {"train_loss": -36.79145812988281, "global_step": 130728, "epoch": 1080} {"train_loss": -36.51838302612305, "global_step": 130729, "epoch": 1080} {"train_loss": -37.44742965698242, "global_step": 130730, "epoch": 1080} {"train_loss": -37.57064437866211, "global_step": 130731, "epoch": 1080} {"train_loss": -36.086761474609375, "global_step": 130732, "epoch": 1080} {"train_loss": -36.65916061401367, "global_step": 130733, "epoch": 1080} {"train_loss": -34.93314743041992, "global_step": 130734, "epoch": 1080} {"train_loss": -37.55055236816406, "global_step": 130735, "epoch": 1080} {"train_loss": -37.759796142578125, "global_step": 130736, "epoch": 1080} {"train_loss": -37.81403732299805, "global_step": 130737, "epoch": 1080} {"train_loss": -36.85097122192383, "global_step": 130738, "epoch": 1080} {"train_loss": -35.82638168334961, "global_step": 130739, "epoch": 1080} {"train_loss": -37.98177719116211, "global_step": 130740, "epoch": 1080} {"train_loss": -37.07821273803711, "global_step": 130741, "epoch": 1080} {"train_loss": -37.43242263793945, "global_step": 130742, "epoch": 1080} {"train_loss": -37.3902587890625, "global_step": 130743, "epoch": 1080} {"train_loss": -37.56023025512695, "global_step": 130744, "epoch": 1080} {"train_loss": -38.018550872802734, "global_step": 130745, "epoch": 1080} {"train_loss": -37.92905807495117, "global_step": 130746, "epoch": 1080} {"train_loss": -37.03144836425781, "global_step": 130747, "epoch": 1080} {"train_loss": -38.52631759643555, "global_step": 130748, "epoch": 1080} {"train_loss": -38.634273529052734, "global_step": 130749, "epoch": 1080} {"train_loss": -36.67195510864258, "global_step": 130750, "epoch": 1080} {"train_loss": -38.504722595214844, "global_step": 130751, "epoch": 1080} {"train_loss": -37.92717742919922, "global_step": 130752, "epoch": 1080} {"train_loss": -38.1980094909668, "global_step": 130753, "epoch": 1080} {"train_loss": -38.64311599731445, "global_step": 130754, "epoch": 1080} {"train_loss": -38.40133285522461, "global_step": 130755, "epoch": 1080} {"train_loss": -38.91294479370117, "global_step": 130756, "epoch": 1080} {"train_loss": -39.08147048950195, "global_step": 130757, "epoch": 1080} {"train_loss": -38.85641860961914, "global_step": 130758, "epoch": 1080} {"train_loss": -38.941490173339844, "global_step": 130759, "epoch": 1080} {"train_loss": -38.7254753112793, "global_step": 130760, "epoch": 1080} {"train_loss": -39.48213577270508, "global_step": 130761, "epoch": 1080} {"train_loss": -39.11363220214844, "global_step": 130762, "epoch": 1080} {"train_loss": -38.89274215698242, "global_step": 130763, "epoch": 1080} {"train_loss": -38.87535858154297, "global_step": 130764, "epoch": 1080} {"train_loss": -39.20681381225586, "global_step": 130765, "epoch": 1080} {"train_loss": -38.93205642700195, "global_step": 130766, "epoch": 1080} {"train_loss": -38.680145263671875, "global_step": 130767, "epoch": 1080} {"train_loss": -39.10683822631836, "global_step": 130768, "epoch": 1080} {"train_loss": -39.45062255859375, "global_step": 130769, "epoch": 1080} {"train_loss": -38.63542556762695, "global_step": 130770, "epoch": 1080} {"train_loss": -38.980712890625, "global_step": 130771, "epoch": 1080} {"train_loss": -39.16823959350586, "global_step": 130772, "epoch": 1080} {"train_loss": -38.47621154785156, "global_step": 130773, "epoch": 1080} {"train_loss": -38.48897933959961, "global_step": 130774, "epoch": 1080} {"train_loss": -39.294979095458984, "global_step": 130775, "epoch": 1080} {"train_loss": -38.63094711303711, "global_step": 130776, "epoch": 1080} {"train_loss": -39.2276496887207, "global_step": 130777, "epoch": 1080} {"train_loss": -39.56782150268555, "global_step": 130778, "epoch": 1080} {"train_loss": -39.2921028137207, "global_step": 130779, "epoch": 1080} {"train_loss": -39.44490432739258, "global_step": 130780, "epoch": 1080} {"train_loss": -38.98965072631836, "global_step": 130781, "epoch": 1080} {"train_loss": -39.87543869018555, "global_step": 130782, "epoch": 1080} {"train_loss": -38.86542892456055, "global_step": 130783, "epoch": 1080} {"train_loss": -38.83742904663086, "global_step": 130784, "epoch": 1080} {"train_loss": -37.894378662109375, "global_step": 130785, "epoch": 1080} {"train_loss": -37.5009880065918, "global_step": 130786, "epoch": 1080} {"train_loss": -35.079280853271484, "global_step": 130787, "epoch": 1080} {"train_loss": -33.92416000366211, "global_step": 130788, "epoch": 1080} {"train_loss": -37.105255126953125, "global_step": 130789, "epoch": 1080} {"train_loss": -39.86985778808594, "global_step": 130790, "epoch": 1080} {"train_loss": -37.86103057861328, "global_step": 130791, "epoch": 1080} {"train_loss": -36.76154708862305, "global_step": 130792, "epoch": 1080} {"train_loss": -38.332862854003906, "global_step": 130793, "epoch": 1080} {"train_loss": -38.92348098754883, "global_step": 130794, "epoch": 1080} {"train_loss": -38.25787353515625, "global_step": 130795, "epoch": 1080} {"train_loss": -38.218326568603516, "global_step": 130796, "epoch": 1080} {"train_loss": -39.99033737182617, "global_step": 130797, "epoch": 1080} {"train_loss": -39.178104400634766, "global_step": 130798, "epoch": 1080} {"train_loss": -39.072113037109375, "global_step": 130799, "epoch": 1080} {"train_loss": -37.849448653292065, "global_step": 130800, "epoch": 1080, "val_loss": 2629581.25} {"train_loss": -38.140010833740234, "global_step": 130801, "epoch": 1081} {"train_loss": -39.464569091796875, "global_step": 130802, "epoch": 1081} {"train_loss": -38.87187576293945, "global_step": 130803, "epoch": 1081} {"train_loss": -39.4730339050293, "global_step": 130804, "epoch": 1081} {"train_loss": -39.19276428222656, "global_step": 130805, "epoch": 1081} {"train_loss": -39.007503509521484, "global_step": 130806, "epoch": 1081} {"train_loss": -39.85584259033203, "global_step": 130807, "epoch": 1081} {"train_loss": -38.863563537597656, "global_step": 130808, "epoch": 1081} {"train_loss": -39.50209045410156, "global_step": 130809, "epoch": 1081} {"train_loss": -39.079803466796875, "global_step": 130810, "epoch": 1081} {"train_loss": -39.649967193603516, "global_step": 130811, "epoch": 1081} {"train_loss": -38.511497497558594, "global_step": 130812, "epoch": 1081} {"train_loss": -39.39908981323242, "global_step": 130813, "epoch": 1081} {"train_loss": -39.55135726928711, "global_step": 130814, "epoch": 1081} {"train_loss": -40.3015022277832, "global_step": 130815, "epoch": 1081} {"train_loss": -39.617828369140625, "global_step": 130816, "epoch": 1081} {"train_loss": -38.91599655151367, "global_step": 130817, "epoch": 1081} {"train_loss": -36.41167449951172, "global_step": 130818, "epoch": 1081} {"train_loss": -33.738582611083984, "global_step": 130819, "epoch": 1081} {"train_loss": -28.87467384338379, "global_step": 130820, "epoch": 1081} {"train_loss": -25.86834716796875, "global_step": 130821, "epoch": 1081} {"train_loss": -29.481489181518555, "global_step": 130822, "epoch": 1081} {"train_loss": -37.493896484375, "global_step": 130823, "epoch": 1081} {"train_loss": -38.788570404052734, "global_step": 130824, "epoch": 1081} {"train_loss": -37.750144958496094, "global_step": 130825, "epoch": 1081} {"train_loss": -39.05188751220703, "global_step": 130826, "epoch": 1081} {"train_loss": -38.72772979736328, "global_step": 130827, "epoch": 1081} {"train_loss": -38.01125717163086, "global_step": 130828, "epoch": 1081} {"train_loss": -38.27610778808594, "global_step": 130829, "epoch": 1081} {"train_loss": -38.341121673583984, "global_step": 130830, "epoch": 1081} {"train_loss": -39.057132720947266, "global_step": 130831, "epoch": 1081} {"train_loss": -39.15190505981445, "global_step": 130832, "epoch": 1081} {"train_loss": -38.81283187866211, "global_step": 130833, "epoch": 1081} {"train_loss": -39.19482421875, "global_step": 130834, "epoch": 1081} {"train_loss": -39.07686996459961, "global_step": 130835, "epoch": 1081} {"train_loss": -38.99040985107422, "global_step": 130836, "epoch": 1081} {"train_loss": -39.76264572143555, "global_step": 130837, "epoch": 1081} {"train_loss": -38.82879638671875, "global_step": 130838, "epoch": 1081} {"train_loss": -39.8038444519043, "global_step": 130839, "epoch": 1081} {"train_loss": -39.37984085083008, "global_step": 130840, "epoch": 1081} {"train_loss": -39.45402526855469, "global_step": 130841, "epoch": 1081} {"train_loss": -39.89364242553711, "global_step": 130842, "epoch": 1081} {"train_loss": -39.43669509887695, "global_step": 130843, "epoch": 1081} {"train_loss": -39.99142074584961, "global_step": 130844, "epoch": 1081} {"train_loss": -39.40943145751953, "global_step": 130845, "epoch": 1081} {"train_loss": -39.93373107910156, "global_step": 130846, "epoch": 1081} {"train_loss": -39.75455093383789, "global_step": 130847, "epoch": 1081} {"train_loss": -39.57822799682617, "global_step": 130848, "epoch": 1081} {"train_loss": -40.4116325378418, "global_step": 130849, "epoch": 1081} {"train_loss": -39.43225860595703, "global_step": 130850, "epoch": 1081} {"train_loss": -40.18642044067383, "global_step": 130851, "epoch": 1081} {"train_loss": -40.09674072265625, "global_step": 130852, "epoch": 1081} {"train_loss": -39.68075180053711, "global_step": 130853, "epoch": 1081} {"train_loss": -39.913818359375, "global_step": 130854, "epoch": 1081} {"train_loss": -39.7131233215332, "global_step": 130855, "epoch": 1081} {"train_loss": -39.25861740112305, "global_step": 130856, "epoch": 1081} {"train_loss": -38.9363899230957, "global_step": 130857, "epoch": 1081} {"train_loss": -40.06020736694336, "global_step": 130858, "epoch": 1081} {"train_loss": -40.20530700683594, "global_step": 130859, "epoch": 1081} {"train_loss": -40.32020950317383, "global_step": 130860, "epoch": 1081} {"train_loss": -40.186439514160156, "global_step": 130861, "epoch": 1081} {"train_loss": -39.42035675048828, "global_step": 130862, "epoch": 1081} {"train_loss": -38.3754997253418, "global_step": 130863, "epoch": 1081} {"train_loss": -39.159576416015625, "global_step": 130864, "epoch": 1081} {"train_loss": -34.40095138549805, "global_step": 130865, "epoch": 1081} {"train_loss": -39.271175384521484, "global_step": 130866, "epoch": 1081} {"train_loss": -40.09541702270508, "global_step": 130867, "epoch": 1081} {"train_loss": -39.722145080566406, "global_step": 130868, "epoch": 1081} {"train_loss": -37.34855651855469, "global_step": 130869, "epoch": 1081} {"train_loss": -38.62540817260742, "global_step": 130870, "epoch": 1081} {"train_loss": -34.98672103881836, "global_step": 130871, "epoch": 1081} {"train_loss": -37.785377502441406, "global_step": 130872, "epoch": 1081} {"train_loss": -39.817413330078125, "global_step": 130873, "epoch": 1081} {"train_loss": -38.11906051635742, "global_step": 130874, "epoch": 1081} {"train_loss": -38.54730987548828, "global_step": 130875, "epoch": 1081} {"train_loss": -39.0899543762207, "global_step": 130876, "epoch": 1081} {"train_loss": -34.60202407836914, "global_step": 130877, "epoch": 1081} {"train_loss": -38.75820541381836, "global_step": 130878, "epoch": 1081} {"train_loss": -39.43586730957031, "global_step": 130879, "epoch": 1081} {"train_loss": -37.11568832397461, "global_step": 130880, "epoch": 1081} {"train_loss": -38.591590881347656, "global_step": 130881, "epoch": 1081} {"train_loss": -39.159461975097656, "global_step": 130882, "epoch": 1081} {"train_loss": -37.751068115234375, "global_step": 130883, "epoch": 1081} {"train_loss": -38.5262565612793, "global_step": 130884, "epoch": 1081} {"train_loss": -38.227806091308594, "global_step": 130885, "epoch": 1081} {"train_loss": -37.549739837646484, "global_step": 130886, "epoch": 1081} {"train_loss": -38.23926544189453, "global_step": 130887, "epoch": 1081} {"train_loss": -35.663970947265625, "global_step": 130888, "epoch": 1081} {"train_loss": -36.10049057006836, "global_step": 130889, "epoch": 1081} {"train_loss": -36.4907341003418, "global_step": 130890, "epoch": 1081} {"train_loss": -37.032203674316406, "global_step": 130891, "epoch": 1081} {"train_loss": -34.90380859375, "global_step": 130892, "epoch": 1081} {"train_loss": -36.566009521484375, "global_step": 130893, "epoch": 1081} {"train_loss": -35.634395599365234, "global_step": 130894, "epoch": 1081} {"train_loss": -37.73988723754883, "global_step": 130895, "epoch": 1081} {"train_loss": -38.750038146972656, "global_step": 130896, "epoch": 1081} {"train_loss": -35.96072006225586, "global_step": 130897, "epoch": 1081} {"train_loss": -36.15157699584961, "global_step": 130898, "epoch": 1081} {"train_loss": -36.9968147277832, "global_step": 130899, "epoch": 1081} {"train_loss": -36.5307731628418, "global_step": 130900, "epoch": 1081} {"train_loss": -36.8819465637207, "global_step": 130901, "epoch": 1081} {"train_loss": -38.9792366027832, "global_step": 130902, "epoch": 1081} {"train_loss": -38.395259857177734, "global_step": 130903, "epoch": 1081} {"train_loss": -37.38295364379883, "global_step": 130904, "epoch": 1081} {"train_loss": -38.6163444519043, "global_step": 130905, "epoch": 1081} {"train_loss": -38.15190505981445, "global_step": 130906, "epoch": 1081} {"train_loss": -38.918758392333984, "global_step": 130907, "epoch": 1081} {"train_loss": -39.01335525512695, "global_step": 130908, "epoch": 1081} {"train_loss": -37.85262680053711, "global_step": 130909, "epoch": 1081} {"train_loss": -36.55290603637695, "global_step": 130910, "epoch": 1081} {"train_loss": -37.11517333984375, "global_step": 130911, "epoch": 1081} {"train_loss": -37.868324279785156, "global_step": 130912, "epoch": 1081} {"train_loss": -38.75422286987305, "global_step": 130913, "epoch": 1081} {"train_loss": -38.17258834838867, "global_step": 130914, "epoch": 1081} {"train_loss": -39.29133224487305, "global_step": 130915, "epoch": 1081} {"train_loss": -38.30112838745117, "global_step": 130916, "epoch": 1081} {"train_loss": -38.10742950439453, "global_step": 130917, "epoch": 1081} {"train_loss": -38.243812561035156, "global_step": 130918, "epoch": 1081} {"train_loss": -39.065731048583984, "global_step": 130919, "epoch": 1081} {"train_loss": -38.735591888427734, "global_step": 130920, "epoch": 1081} {"train_loss": -38.23863910643522, "global_step": 130921, "epoch": 1081, "val_loss": 2681525.75} {"train_loss": -38.82796859741211, "global_step": 130922, "epoch": 1082} {"train_loss": -38.74372863769531, "global_step": 130923, "epoch": 1082} {"train_loss": -39.263519287109375, "global_step": 130924, "epoch": 1082} {"train_loss": -38.99831771850586, "global_step": 130925, "epoch": 1082} {"train_loss": -39.1662712097168, "global_step": 130926, "epoch": 1082} {"train_loss": -39.42102813720703, "global_step": 130927, "epoch": 1082} {"train_loss": -39.246315002441406, "global_step": 130928, "epoch": 1082} {"train_loss": -38.748008728027344, "global_step": 130929, "epoch": 1082} {"train_loss": -39.14695358276367, "global_step": 130930, "epoch": 1082} {"train_loss": -38.910762786865234, "global_step": 130931, "epoch": 1082} {"train_loss": -39.54767990112305, "global_step": 130932, "epoch": 1082} {"train_loss": -38.869564056396484, "global_step": 130933, "epoch": 1082} {"train_loss": -39.39287567138672, "global_step": 130934, "epoch": 1082} {"train_loss": -39.36664581298828, "global_step": 130935, "epoch": 1082} {"train_loss": -39.674583435058594, "global_step": 130936, "epoch": 1082} {"train_loss": -39.305450439453125, "global_step": 130937, "epoch": 1082} {"train_loss": -39.344242095947266, "global_step": 130938, "epoch": 1082} {"train_loss": -39.784183502197266, "global_step": 130939, "epoch": 1082} {"train_loss": -39.53933334350586, "global_step": 130940, "epoch": 1082} {"train_loss": -39.261226654052734, "global_step": 130941, "epoch": 1082} {"train_loss": -39.933815002441406, "global_step": 130942, "epoch": 1082} {"train_loss": -39.53436279296875, "global_step": 130943, "epoch": 1082} {"train_loss": -39.729671478271484, "global_step": 130944, "epoch": 1082} {"train_loss": -39.38449478149414, "global_step": 130945, "epoch": 1082} {"train_loss": -39.84748077392578, "global_step": 130946, "epoch": 1082} {"train_loss": -39.80252456665039, "global_step": 130947, "epoch": 1082} {"train_loss": -40.14857864379883, "global_step": 130948, "epoch": 1082} {"train_loss": -39.63523483276367, "global_step": 130949, "epoch": 1082} {"train_loss": -39.68302536010742, "global_step": 130950, "epoch": 1082} {"train_loss": -39.90977478027344, "global_step": 130951, "epoch": 1082} {"train_loss": -40.25224304199219, "global_step": 130952, "epoch": 1082} {"train_loss": -40.488704681396484, "global_step": 130953, "epoch": 1082} {"train_loss": -40.26588821411133, "global_step": 130954, "epoch": 1082} {"train_loss": -40.18596267700195, "global_step": 130955, "epoch": 1082} {"train_loss": -40.06964874267578, "global_step": 130956, "epoch": 1082} {"train_loss": -40.057167053222656, "global_step": 130957, "epoch": 1082} {"train_loss": -39.74959945678711, "global_step": 130958, "epoch": 1082} {"train_loss": -40.237972259521484, "global_step": 130959, "epoch": 1082} {"train_loss": -40.401611328125, "global_step": 130960, "epoch": 1082} {"train_loss": -40.247108459472656, "global_step": 130961, "epoch": 1082} {"train_loss": -39.87689208984375, "global_step": 130962, "epoch": 1082} {"train_loss": -40.0466194152832, "global_step": 130963, "epoch": 1082} {"train_loss": -39.868526458740234, "global_step": 130964, "epoch": 1082} {"train_loss": -40.648956298828125, "global_step": 130965, "epoch": 1082} {"train_loss": -40.603675842285156, "global_step": 130966, "epoch": 1082} {"train_loss": -40.40731430053711, "global_step": 130967, "epoch": 1082} {"train_loss": -40.18958282470703, "global_step": 130968, "epoch": 1082} {"train_loss": -40.186363220214844, "global_step": 130969, "epoch": 1082} {"train_loss": -39.00709915161133, "global_step": 130970, "epoch": 1082} {"train_loss": -39.65181350708008, "global_step": 130971, "epoch": 1082} {"train_loss": -40.65192794799805, "global_step": 130972, "epoch": 1082} {"train_loss": -39.91093063354492, "global_step": 130973, "epoch": 1082} {"train_loss": -40.040382385253906, "global_step": 130974, "epoch": 1082} {"train_loss": -39.47800827026367, "global_step": 130975, "epoch": 1082} {"train_loss": -39.46574401855469, "global_step": 130976, "epoch": 1082} {"train_loss": -39.82114791870117, "global_step": 130977, "epoch": 1082} {"train_loss": -38.42258834838867, "global_step": 130978, "epoch": 1082} {"train_loss": -35.7598876953125, "global_step": 130979, "epoch": 1082} {"train_loss": -32.356868743896484, "global_step": 130980, "epoch": 1082} {"train_loss": -29.78070640563965, "global_step": 130981, "epoch": 1082} {"train_loss": -27.864587783813477, "global_step": 130982, "epoch": 1082} {"train_loss": -32.95730209350586, "global_step": 130983, "epoch": 1082} {"train_loss": -34.8896369934082, "global_step": 130984, "epoch": 1082} {"train_loss": -35.62892532348633, "global_step": 130985, "epoch": 1082} {"train_loss": -33.63652420043945, "global_step": 130986, "epoch": 1082} {"train_loss": -38.028358459472656, "global_step": 130987, "epoch": 1082} {"train_loss": -34.529563903808594, "global_step": 130988, "epoch": 1082} {"train_loss": -37.24617385864258, "global_step": 130989, "epoch": 1082} {"train_loss": -34.104454040527344, "global_step": 130990, "epoch": 1082} {"train_loss": -33.888607025146484, "global_step": 130991, "epoch": 1082} {"train_loss": -37.196739196777344, "global_step": 130992, "epoch": 1082} {"train_loss": -35.4723014831543, "global_step": 130993, "epoch": 1082} {"train_loss": -35.0667839050293, "global_step": 130994, "epoch": 1082} {"train_loss": -38.3258056640625, "global_step": 130995, "epoch": 1082} {"train_loss": -35.159889221191406, "global_step": 130996, "epoch": 1082} {"train_loss": -35.45310592651367, "global_step": 130997, "epoch": 1082} {"train_loss": -38.584556579589844, "global_step": 130998, "epoch": 1082} {"train_loss": -38.290828704833984, "global_step": 130999, "epoch": 1082} {"train_loss": -37.033199310302734, "global_step": 131000, "epoch": 1082} {"train_loss": -36.76259994506836, "global_step": 131001, "epoch": 1082} {"train_loss": -39.33778762817383, "global_step": 131002, "epoch": 1082} {"train_loss": -38.97419357299805, "global_step": 131003, "epoch": 1082} {"train_loss": -37.66327667236328, "global_step": 131004, "epoch": 1082} {"train_loss": -37.93589401245117, "global_step": 131005, "epoch": 1082} {"train_loss": -38.60128402709961, "global_step": 131006, "epoch": 1082} {"train_loss": -38.767372131347656, "global_step": 131007, "epoch": 1082} {"train_loss": -38.402095794677734, "global_step": 131008, "epoch": 1082} {"train_loss": -37.31954574584961, "global_step": 131009, "epoch": 1082} {"train_loss": -38.73891830444336, "global_step": 131010, "epoch": 1082} {"train_loss": -38.48013687133789, "global_step": 131011, "epoch": 1082} {"train_loss": -38.942386627197266, "global_step": 131012, "epoch": 1082} {"train_loss": -39.38821029663086, "global_step": 131013, "epoch": 1082} {"train_loss": -38.494136810302734, "global_step": 131014, "epoch": 1082} {"train_loss": -38.73284149169922, "global_step": 131015, "epoch": 1082} {"train_loss": -38.37059783935547, "global_step": 131016, "epoch": 1082} {"train_loss": -39.38981246948242, "global_step": 131017, "epoch": 1082} {"train_loss": -39.3475341796875, "global_step": 131018, "epoch": 1082} {"train_loss": -39.92058181762695, "global_step": 131019, "epoch": 1082} {"train_loss": -38.545562744140625, "global_step": 131020, "epoch": 1082} {"train_loss": -39.53413009643555, "global_step": 131021, "epoch": 1082} {"train_loss": -39.02626419067383, "global_step": 131022, "epoch": 1082} {"train_loss": -39.63851547241211, "global_step": 131023, "epoch": 1082} {"train_loss": -39.84211349487305, "global_step": 131024, "epoch": 1082} {"train_loss": -39.33176803588867, "global_step": 131025, "epoch": 1082} {"train_loss": -39.34770584106445, "global_step": 131026, "epoch": 1082} {"train_loss": -39.67195129394531, "global_step": 131027, "epoch": 1082} {"train_loss": -40.26172637939453, "global_step": 131028, "epoch": 1082} {"train_loss": -39.51591110229492, "global_step": 131029, "epoch": 1082} {"train_loss": -40.23645782470703, "global_step": 131030, "epoch": 1082} {"train_loss": -40.197418212890625, "global_step": 131031, "epoch": 1082} {"train_loss": -40.10353469848633, "global_step": 131032, "epoch": 1082} {"train_loss": -39.6106071472168, "global_step": 131033, "epoch": 1082} {"train_loss": -40.33486557006836, "global_step": 131034, "epoch": 1082} {"train_loss": -39.93659210205078, "global_step": 131035, "epoch": 1082} {"train_loss": -39.86574172973633, "global_step": 131036, "epoch": 1082} {"train_loss": -40.14109420776367, "global_step": 131037, "epoch": 1082} {"train_loss": -40.42707061767578, "global_step": 131038, "epoch": 1082} {"train_loss": -40.032169342041016, "global_step": 131039, "epoch": 1082} {"train_loss": -40.43085479736328, "global_step": 131040, "epoch": 1082} {"train_loss": -39.8763427734375, "global_step": 131041, "epoch": 1082} {"train_loss": -38.70737674807714, "global_step": 131042, "epoch": 1082, "val_loss": 2610482.75} {"train_loss": -40.498634338378906, "global_step": 131043, "epoch": 1083} {"train_loss": -40.90899658203125, "global_step": 131044, "epoch": 1083} {"train_loss": -41.02122497558594, "global_step": 131045, "epoch": 1083} {"train_loss": -40.68842697143555, "global_step": 131046, "epoch": 1083} {"train_loss": -40.43459701538086, "global_step": 131047, "epoch": 1083} {"train_loss": -40.80782699584961, "global_step": 131048, "epoch": 1083} {"train_loss": -40.61630630493164, "global_step": 131049, "epoch": 1083} {"train_loss": -40.28425216674805, "global_step": 131050, "epoch": 1083} {"train_loss": -40.34432601928711, "global_step": 131051, "epoch": 1083} {"train_loss": -40.47877502441406, "global_step": 131052, "epoch": 1083} {"train_loss": -40.54912185668945, "global_step": 131053, "epoch": 1083} {"train_loss": -40.64301300048828, "global_step": 131054, "epoch": 1083} {"train_loss": -40.90558624267578, "global_step": 131055, "epoch": 1083} {"train_loss": -40.306697845458984, "global_step": 131056, "epoch": 1083} {"train_loss": -40.29096603393555, "global_step": 131057, "epoch": 1083} {"train_loss": -39.384666442871094, "global_step": 131058, "epoch": 1083} {"train_loss": -36.708045959472656, "global_step": 131059, "epoch": 1083} {"train_loss": -28.949487686157227, "global_step": 131060, "epoch": 1083} {"train_loss": -18.834016799926758, "global_step": 131061, "epoch": 1083} {"train_loss": -25.25433921813965, "global_step": 131062, "epoch": 1083} {"train_loss": -38.95167541503906, "global_step": 131063, "epoch": 1083} {"train_loss": -29.514318466186523, "global_step": 131064, "epoch": 1083} {"train_loss": -32.8824577331543, "global_step": 131065, "epoch": 1083} {"train_loss": -38.276180267333984, "global_step": 131066, "epoch": 1083} {"train_loss": -33.415016174316406, "global_step": 131067, "epoch": 1083} {"train_loss": -37.44014358520508, "global_step": 131068, "epoch": 1083} {"train_loss": -36.969444274902344, "global_step": 131069, "epoch": 1083} {"train_loss": -37.96826934814453, "global_step": 131070, "epoch": 1083} {"train_loss": -35.514400482177734, "global_step": 131071, "epoch": 1083} {"train_loss": -38.50920486450195, "global_step": 131072, "epoch": 1083} {"train_loss": -37.793331146240234, "global_step": 131073, "epoch": 1083} {"train_loss": -36.20162582397461, "global_step": 131074, "epoch": 1083} {"train_loss": -38.64319610595703, "global_step": 131075, "epoch": 1083} {"train_loss": -37.27576446533203, "global_step": 131076, "epoch": 1083} {"train_loss": -37.79288101196289, "global_step": 131077, "epoch": 1083} {"train_loss": -38.29928970336914, "global_step": 131078, "epoch": 1083} {"train_loss": -37.9210319519043, "global_step": 131079, "epoch": 1083} {"train_loss": -39.02693557739258, "global_step": 131080, "epoch": 1083} {"train_loss": -37.72758865356445, "global_step": 131081, "epoch": 1083} {"train_loss": -38.20835876464844, "global_step": 131082, "epoch": 1083} {"train_loss": -38.54120635986328, "global_step": 131083, "epoch": 1083} {"train_loss": -38.56713104248047, "global_step": 131084, "epoch": 1083} {"train_loss": -39.36909484863281, "global_step": 131085, "epoch": 1083} {"train_loss": -39.18342208862305, "global_step": 131086, "epoch": 1083} {"train_loss": -39.12101745605469, "global_step": 131087, "epoch": 1083} {"train_loss": -39.546974182128906, "global_step": 131088, "epoch": 1083} {"train_loss": -39.09928512573242, "global_step": 131089, "epoch": 1083} {"train_loss": -39.07571029663086, "global_step": 131090, "epoch": 1083} {"train_loss": -38.434608459472656, "global_step": 131091, "epoch": 1083} {"train_loss": -39.73727798461914, "global_step": 131092, "epoch": 1083} {"train_loss": -39.194026947021484, "global_step": 131093, "epoch": 1083} {"train_loss": -38.681640625, "global_step": 131094, "epoch": 1083} {"train_loss": -39.46736526489258, "global_step": 131095, "epoch": 1083} {"train_loss": -39.56003952026367, "global_step": 131096, "epoch": 1083} {"train_loss": -39.4001579284668, "global_step": 131097, "epoch": 1083} {"train_loss": -39.64447784423828, "global_step": 131098, "epoch": 1083} {"train_loss": -39.96247482299805, "global_step": 131099, "epoch": 1083} {"train_loss": -39.78624725341797, "global_step": 131100, "epoch": 1083} {"train_loss": -39.77883529663086, "global_step": 131101, "epoch": 1083} {"train_loss": -39.9952392578125, "global_step": 131102, "epoch": 1083} {"train_loss": -39.719356536865234, "global_step": 131103, "epoch": 1083} {"train_loss": -38.96356201171875, "global_step": 131104, "epoch": 1083} {"train_loss": -39.3468017578125, "global_step": 131105, "epoch": 1083} {"train_loss": -39.8123893737793, "global_step": 131106, "epoch": 1083} {"train_loss": -39.62454605102539, "global_step": 131107, "epoch": 1083} {"train_loss": -39.51105880737305, "global_step": 131108, "epoch": 1083} {"train_loss": -40.08333969116211, "global_step": 131109, "epoch": 1083} {"train_loss": -39.52919387817383, "global_step": 131110, "epoch": 1083} {"train_loss": -39.85274887084961, "global_step": 131111, "epoch": 1083} {"train_loss": -40.4411735534668, "global_step": 131112, "epoch": 1083} {"train_loss": -39.44960403442383, "global_step": 131113, "epoch": 1083} {"train_loss": -39.24946975708008, "global_step": 131114, "epoch": 1083} {"train_loss": -40.084049224853516, "global_step": 131115, "epoch": 1083} {"train_loss": -39.66374588012695, "global_step": 131116, "epoch": 1083} {"train_loss": -39.99235153198242, "global_step": 131117, "epoch": 1083} {"train_loss": -40.098480224609375, "global_step": 131118, "epoch": 1083} {"train_loss": -40.08557891845703, "global_step": 131119, "epoch": 1083} {"train_loss": -40.23215866088867, "global_step": 131120, "epoch": 1083} {"train_loss": -40.45576095581055, "global_step": 131121, "epoch": 1083} {"train_loss": -40.13784408569336, "global_step": 131122, "epoch": 1083} {"train_loss": -40.213993072509766, "global_step": 131123, "epoch": 1083} {"train_loss": -40.813358306884766, "global_step": 131124, "epoch": 1083} {"train_loss": -40.16482925415039, "global_step": 131125, "epoch": 1083} {"train_loss": -40.01154327392578, "global_step": 131126, "epoch": 1083} {"train_loss": -40.64292526245117, "global_step": 131127, "epoch": 1083} {"train_loss": -40.27217483520508, "global_step": 131128, "epoch": 1083} {"train_loss": -40.47641372680664, "global_step": 131129, "epoch": 1083} {"train_loss": -40.548789978027344, "global_step": 131130, "epoch": 1083} {"train_loss": -40.19927978515625, "global_step": 131131, "epoch": 1083} {"train_loss": -40.64667892456055, "global_step": 131132, "epoch": 1083} {"train_loss": -40.608646392822266, "global_step": 131133, "epoch": 1083} {"train_loss": -40.21537780761719, "global_step": 131134, "epoch": 1083} {"train_loss": -39.6568489074707, "global_step": 131135, "epoch": 1083} {"train_loss": -37.3841438293457, "global_step": 131136, "epoch": 1083} {"train_loss": -33.6045036315918, "global_step": 131137, "epoch": 1083} {"train_loss": -26.426773071289062, "global_step": 131138, "epoch": 1083} {"train_loss": -14.764620780944824, "global_step": 131139, "epoch": 1083} {"train_loss": -8.524139404296875, "global_step": 131140, "epoch": 1083} {"train_loss": -36.40890121459961, "global_step": 131141, "epoch": 1083} {"train_loss": -25.330825805664062, "global_step": 131142, "epoch": 1083} {"train_loss": -24.751386642456055, "global_step": 131143, "epoch": 1083} {"train_loss": -31.453510284423828, "global_step": 131144, "epoch": 1083} {"train_loss": -25.433500289916992, "global_step": 131145, "epoch": 1083} {"train_loss": -30.827392578125, "global_step": 131146, "epoch": 1083} {"train_loss": -32.35401153564453, "global_step": 131147, "epoch": 1083} {"train_loss": -26.0590877532959, "global_step": 131148, "epoch": 1083} {"train_loss": -35.61519241333008, "global_step": 131149, "epoch": 1083} {"train_loss": -30.01862144470215, "global_step": 131150, "epoch": 1083} {"train_loss": -33.90556335449219, "global_step": 131151, "epoch": 1083} {"train_loss": -37.58964157104492, "global_step": 131152, "epoch": 1083} {"train_loss": -33.73214340209961, "global_step": 131153, "epoch": 1083} {"train_loss": -35.05507278442383, "global_step": 131154, "epoch": 1083} {"train_loss": -37.87024688720703, "global_step": 131155, "epoch": 1083} {"train_loss": -36.8792724609375, "global_step": 131156, "epoch": 1083} {"train_loss": -35.979156494140625, "global_step": 131157, "epoch": 1083} {"train_loss": -37.77130889892578, "global_step": 131158, "epoch": 1083} {"train_loss": -37.9024543762207, "global_step": 131159, "epoch": 1083} {"train_loss": -37.824947357177734, "global_step": 131160, "epoch": 1083} {"train_loss": -37.388092041015625, "global_step": 131161, "epoch": 1083} {"train_loss": -38.371883392333984, "global_step": 131162, "epoch": 1083} {"train_loss": -37.19685394507794, "global_step": 131163, "epoch": 1083, "val_loss": 2619721.25} {"train_loss": -38.025394439697266, "global_step": 131164, "epoch": 1084} {"train_loss": -38.019222259521484, "global_step": 131165, "epoch": 1084} {"train_loss": -38.19851303100586, "global_step": 131166, "epoch": 1084} {"train_loss": -38.87419509887695, "global_step": 131167, "epoch": 1084} {"train_loss": -38.70906448364258, "global_step": 131168, "epoch": 1084} {"train_loss": -38.24310302734375, "global_step": 131169, "epoch": 1084} {"train_loss": -38.927913665771484, "global_step": 131170, "epoch": 1084} {"train_loss": -38.897212982177734, "global_step": 131171, "epoch": 1084} {"train_loss": -38.58132553100586, "global_step": 131172, "epoch": 1084} {"train_loss": -39.33028793334961, "global_step": 131173, "epoch": 1084} {"train_loss": -38.471187591552734, "global_step": 131174, "epoch": 1084} {"train_loss": -38.564674377441406, "global_step": 131175, "epoch": 1084} {"train_loss": -38.90382385253906, "global_step": 131176, "epoch": 1084} {"train_loss": -39.00933837890625, "global_step": 131177, "epoch": 1084} {"train_loss": -38.81814193725586, "global_step": 131178, "epoch": 1084} {"train_loss": -38.84664535522461, "global_step": 131179, "epoch": 1084} {"train_loss": -38.981082916259766, "global_step": 131180, "epoch": 1084} {"train_loss": -39.418365478515625, "global_step": 131181, "epoch": 1084} {"train_loss": -39.55805206298828, "global_step": 131182, "epoch": 1084} {"train_loss": -38.92940902709961, "global_step": 131183, "epoch": 1084} {"train_loss": -39.07184982299805, "global_step": 131184, "epoch": 1084} {"train_loss": -39.44989013671875, "global_step": 131185, "epoch": 1084} {"train_loss": -39.56517791748047, "global_step": 131186, "epoch": 1084} {"train_loss": -39.25249099731445, "global_step": 131187, "epoch": 1084} {"train_loss": -39.34364700317383, "global_step": 131188, "epoch": 1084} {"train_loss": -39.31034469604492, "global_step": 131189, "epoch": 1084} {"train_loss": -39.518104553222656, "global_step": 131190, "epoch": 1084} {"train_loss": -39.41478729248047, "global_step": 131191, "epoch": 1084} {"train_loss": -39.5123405456543, "global_step": 131192, "epoch": 1084} {"train_loss": -39.618839263916016, "global_step": 131193, "epoch": 1084} {"train_loss": -39.48582077026367, "global_step": 131194, "epoch": 1084} {"train_loss": -39.68966293334961, "global_step": 131195, "epoch": 1084} {"train_loss": -39.59790802001953, "global_step": 131196, "epoch": 1084} {"train_loss": -39.63386917114258, "global_step": 131197, "epoch": 1084} {"train_loss": -39.461143493652344, "global_step": 131198, "epoch": 1084} {"train_loss": -39.73762130737305, "global_step": 131199, "epoch": 1084} {"train_loss": -39.44009780883789, "global_step": 131200, "epoch": 1084} {"train_loss": -39.445491790771484, "global_step": 131201, "epoch": 1084} {"train_loss": -39.80644226074219, "global_step": 131202, "epoch": 1084} {"train_loss": -39.44148635864258, "global_step": 131203, "epoch": 1084} {"train_loss": -39.94313430786133, "global_step": 131204, "epoch": 1084} {"train_loss": -40.204750061035156, "global_step": 131205, "epoch": 1084} {"train_loss": -39.98678207397461, "global_step": 131206, "epoch": 1084} {"train_loss": -40.06924057006836, "global_step": 131207, "epoch": 1084} {"train_loss": -39.769317626953125, "global_step": 131208, "epoch": 1084} {"train_loss": -39.814979553222656, "global_step": 131209, "epoch": 1084} {"train_loss": -39.914554595947266, "global_step": 131210, "epoch": 1084} {"train_loss": -39.71877670288086, "global_step": 131211, "epoch": 1084} {"train_loss": -38.077266693115234, "global_step": 131212, "epoch": 1084} {"train_loss": -39.24496841430664, "global_step": 131213, "epoch": 1084} {"train_loss": -39.71827697753906, "global_step": 131214, "epoch": 1084} {"train_loss": -39.377471923828125, "global_step": 131215, "epoch": 1084} {"train_loss": -39.08753204345703, "global_step": 131216, "epoch": 1084} {"train_loss": -38.88469314575195, "global_step": 131217, "epoch": 1084} {"train_loss": -38.91428756713867, "global_step": 131218, "epoch": 1084} {"train_loss": -39.0468864440918, "global_step": 131219, "epoch": 1084} {"train_loss": -39.38608932495117, "global_step": 131220, "epoch": 1084} {"train_loss": -39.6447868347168, "global_step": 131221, "epoch": 1084} {"train_loss": -39.79376220703125, "global_step": 131222, "epoch": 1084} {"train_loss": -40.24156188964844, "global_step": 131223, "epoch": 1084} {"train_loss": -39.63642120361328, "global_step": 131224, "epoch": 1084} {"train_loss": -39.762691497802734, "global_step": 131225, "epoch": 1084} {"train_loss": -38.955257415771484, "global_step": 131226, "epoch": 1084} {"train_loss": -38.36076354980469, "global_step": 131227, "epoch": 1084} {"train_loss": -36.77219772338867, "global_step": 131228, "epoch": 1084} {"train_loss": -33.43380355834961, "global_step": 131229, "epoch": 1084} {"train_loss": -34.196678161621094, "global_step": 131230, "epoch": 1084} {"train_loss": -37.432064056396484, "global_step": 131231, "epoch": 1084} {"train_loss": -38.69450378417969, "global_step": 131232, "epoch": 1084} {"train_loss": -37.07783889770508, "global_step": 131233, "epoch": 1084} {"train_loss": -34.9347038269043, "global_step": 131234, "epoch": 1084} {"train_loss": -37.33675003051758, "global_step": 131235, "epoch": 1084} {"train_loss": -37.76494216918945, "global_step": 131236, "epoch": 1084} {"train_loss": -38.342254638671875, "global_step": 131237, "epoch": 1084} {"train_loss": -37.19622802734375, "global_step": 131238, "epoch": 1084} {"train_loss": -38.56612777709961, "global_step": 131239, "epoch": 1084} {"train_loss": -38.230525970458984, "global_step": 131240, "epoch": 1084} {"train_loss": -37.86647033691406, "global_step": 131241, "epoch": 1084} {"train_loss": -38.4961051940918, "global_step": 131242, "epoch": 1084} {"train_loss": -37.0308723449707, "global_step": 131243, "epoch": 1084} {"train_loss": -37.0568962097168, "global_step": 131244, "epoch": 1084} {"train_loss": -35.519344329833984, "global_step": 131245, "epoch": 1084} {"train_loss": -37.9157600402832, "global_step": 131246, "epoch": 1084} {"train_loss": -36.9358024597168, "global_step": 131247, "epoch": 1084} {"train_loss": -37.60566329956055, "global_step": 131248, "epoch": 1084} {"train_loss": -37.143089294433594, "global_step": 131249, "epoch": 1084} {"train_loss": -38.18608474731445, "global_step": 131250, "epoch": 1084} {"train_loss": -37.67024230957031, "global_step": 131251, "epoch": 1084} {"train_loss": -37.318485260009766, "global_step": 131252, "epoch": 1084} {"train_loss": -38.789833068847656, "global_step": 131253, "epoch": 1084} {"train_loss": -37.57503890991211, "global_step": 131254, "epoch": 1084} {"train_loss": -39.069313049316406, "global_step": 131255, "epoch": 1084} {"train_loss": -38.948970794677734, "global_step": 131256, "epoch": 1084} {"train_loss": -38.888912200927734, "global_step": 131257, "epoch": 1084} {"train_loss": -39.55161666870117, "global_step": 131258, "epoch": 1084} {"train_loss": -38.73859786987305, "global_step": 131259, "epoch": 1084} {"train_loss": -39.545692443847656, "global_step": 131260, "epoch": 1084} {"train_loss": -38.890140533447266, "global_step": 131261, "epoch": 1084} {"train_loss": -38.76216506958008, "global_step": 131262, "epoch": 1084} {"train_loss": -38.975582122802734, "global_step": 131263, "epoch": 1084} {"train_loss": -38.668678283691406, "global_step": 131264, "epoch": 1084} {"train_loss": -39.15310287475586, "global_step": 131265, "epoch": 1084} {"train_loss": -38.96931838989258, "global_step": 131266, "epoch": 1084} {"train_loss": -39.50109100341797, "global_step": 131267, "epoch": 1084} {"train_loss": -39.25783920288086, "global_step": 131268, "epoch": 1084} {"train_loss": -39.31754684448242, "global_step": 131269, "epoch": 1084} {"train_loss": -38.9190788269043, "global_step": 131270, "epoch": 1084} {"train_loss": -39.410125732421875, "global_step": 131271, "epoch": 1084} {"train_loss": -39.5702018737793, "global_step": 131272, "epoch": 1084} {"train_loss": -39.215003967285156, "global_step": 131273, "epoch": 1084} {"train_loss": -39.68845748901367, "global_step": 131274, "epoch": 1084} {"train_loss": -39.496639251708984, "global_step": 131275, "epoch": 1084} {"train_loss": -39.80839538574219, "global_step": 131276, "epoch": 1084} {"train_loss": -39.452003479003906, "global_step": 131277, "epoch": 1084} {"train_loss": -39.425289154052734, "global_step": 131278, "epoch": 1084} {"train_loss": -39.35309982299805, "global_step": 131279, "epoch": 1084} {"train_loss": -39.58222579956055, "global_step": 131280, "epoch": 1084} {"train_loss": -40.0001335144043, "global_step": 131281, "epoch": 1084} {"train_loss": -38.87868881225586, "global_step": 131282, "epoch": 1084} {"train_loss": -40.04330825805664, "global_step": 131283, "epoch": 1084} {"train_loss": -38.813051176465244, "global_step": 131284, "epoch": 1084, "val_loss": 2549157.0} {"train_loss": -40.090755462646484, "global_step": 131285, "epoch": 1085} {"train_loss": -39.65922164916992, "global_step": 131286, "epoch": 1085} {"train_loss": -40.13020324707031, "global_step": 131287, "epoch": 1085} {"train_loss": -40.44091796875, "global_step": 131288, "epoch": 1085} {"train_loss": -39.8327522277832, "global_step": 131289, "epoch": 1085} {"train_loss": -39.51764678955078, "global_step": 131290, "epoch": 1085} {"train_loss": -38.95703125, "global_step": 131291, "epoch": 1085} {"train_loss": -40.248863220214844, "global_step": 131292, "epoch": 1085} {"train_loss": -40.10691452026367, "global_step": 131293, "epoch": 1085} {"train_loss": -39.57595443725586, "global_step": 131294, "epoch": 1085} {"train_loss": -40.02913284301758, "global_step": 131295, "epoch": 1085} {"train_loss": -40.37411117553711, "global_step": 131296, "epoch": 1085} {"train_loss": -40.33097457885742, "global_step": 131297, "epoch": 1085} {"train_loss": -39.708587646484375, "global_step": 131298, "epoch": 1085} {"train_loss": -39.387481689453125, "global_step": 131299, "epoch": 1085} {"train_loss": -39.142616271972656, "global_step": 131300, "epoch": 1085} {"train_loss": -40.00202560424805, "global_step": 131301, "epoch": 1085} {"train_loss": -40.225040435791016, "global_step": 131302, "epoch": 1085} {"train_loss": -40.45987319946289, "global_step": 131303, "epoch": 1085} {"train_loss": -40.50294876098633, "global_step": 131304, "epoch": 1085} {"train_loss": -40.3315544128418, "global_step": 131305, "epoch": 1085} {"train_loss": -40.30156326293945, "global_step": 131306, "epoch": 1085} {"train_loss": -39.65192794799805, "global_step": 131307, "epoch": 1085} {"train_loss": -40.164581298828125, "global_step": 131308, "epoch": 1085} {"train_loss": -40.44696044921875, "global_step": 131309, "epoch": 1085} {"train_loss": -40.548397064208984, "global_step": 131310, "epoch": 1085} {"train_loss": -40.01573944091797, "global_step": 131311, "epoch": 1085} {"train_loss": -39.9246711730957, "global_step": 131312, "epoch": 1085} {"train_loss": -39.931724548339844, "global_step": 131313, "epoch": 1085} {"train_loss": -39.770206451416016, "global_step": 131314, "epoch": 1085} {"train_loss": -40.60685348510742, "global_step": 131315, "epoch": 1085} {"train_loss": -40.190975189208984, "global_step": 131316, "epoch": 1085} {"train_loss": -40.0037956237793, "global_step": 131317, "epoch": 1085} {"train_loss": -38.24542236328125, "global_step": 131318, "epoch": 1085} {"train_loss": -38.04764938354492, "global_step": 131319, "epoch": 1085} {"train_loss": -39.71824264526367, "global_step": 131320, "epoch": 1085} {"train_loss": -38.722591400146484, "global_step": 131321, "epoch": 1085} {"train_loss": -38.692745208740234, "global_step": 131322, "epoch": 1085} {"train_loss": -37.36800765991211, "global_step": 131323, "epoch": 1085} {"train_loss": -35.78715896606445, "global_step": 131324, "epoch": 1085} {"train_loss": -35.7581901550293, "global_step": 131325, "epoch": 1085} {"train_loss": -35.76227569580078, "global_step": 131326, "epoch": 1085} {"train_loss": -36.54700469970703, "global_step": 131327, "epoch": 1085} {"train_loss": -36.4521369934082, "global_step": 131328, "epoch": 1085} {"train_loss": -37.98820877075195, "global_step": 131329, "epoch": 1085} {"train_loss": -38.6917610168457, "global_step": 131330, "epoch": 1085} {"train_loss": -37.80329513549805, "global_step": 131331, "epoch": 1085} {"train_loss": -35.69227600097656, "global_step": 131332, "epoch": 1085} {"train_loss": -36.33858871459961, "global_step": 131333, "epoch": 1085} {"train_loss": -38.09983444213867, "global_step": 131334, "epoch": 1085} {"train_loss": -39.47103500366211, "global_step": 131335, "epoch": 1085} {"train_loss": -38.13554763793945, "global_step": 131336, "epoch": 1085} {"train_loss": -38.36296463012695, "global_step": 131337, "epoch": 1085} {"train_loss": -39.394309997558594, "global_step": 131338, "epoch": 1085} {"train_loss": -38.8753662109375, "global_step": 131339, "epoch": 1085} {"train_loss": -37.92393493652344, "global_step": 131340, "epoch": 1085} {"train_loss": -38.726253509521484, "global_step": 131341, "epoch": 1085} {"train_loss": -38.49280548095703, "global_step": 131342, "epoch": 1085} {"train_loss": -39.60219192504883, "global_step": 131343, "epoch": 1085} {"train_loss": -38.6227912902832, "global_step": 131344, "epoch": 1085} {"train_loss": -39.53010559082031, "global_step": 131345, "epoch": 1085} {"train_loss": -39.668067932128906, "global_step": 131346, "epoch": 1085} {"train_loss": -39.13225173950195, "global_step": 131347, "epoch": 1085} {"train_loss": -39.233795166015625, "global_step": 131348, "epoch": 1085} {"train_loss": -39.9465446472168, "global_step": 131349, "epoch": 1085} {"train_loss": -39.338809967041016, "global_step": 131350, "epoch": 1085} {"train_loss": -39.90322494506836, "global_step": 131351, "epoch": 1085} {"train_loss": -40.1562614440918, "global_step": 131352, "epoch": 1085} {"train_loss": -39.95829391479492, "global_step": 131353, "epoch": 1085} {"train_loss": -40.08613967895508, "global_step": 131354, "epoch": 1085} {"train_loss": -40.1337890625, "global_step": 131355, "epoch": 1085} {"train_loss": -40.23042678833008, "global_step": 131356, "epoch": 1085} {"train_loss": -39.896766662597656, "global_step": 131357, "epoch": 1085} {"train_loss": -40.2373161315918, "global_step": 131358, "epoch": 1085} {"train_loss": -40.468780517578125, "global_step": 131359, "epoch": 1085} {"train_loss": -40.2839241027832, "global_step": 131360, "epoch": 1085} {"train_loss": -40.072723388671875, "global_step": 131361, "epoch": 1085} {"train_loss": -40.49607467651367, "global_step": 131362, "epoch": 1085} {"train_loss": -40.54026412963867, "global_step": 131363, "epoch": 1085} {"train_loss": -40.406227111816406, "global_step": 131364, "epoch": 1085} {"train_loss": -40.477657318115234, "global_step": 131365, "epoch": 1085} {"train_loss": -40.78153991699219, "global_step": 131366, "epoch": 1085} {"train_loss": -40.47564697265625, "global_step": 131367, "epoch": 1085} {"train_loss": -40.69112777709961, "global_step": 131368, "epoch": 1085} {"train_loss": -40.64691925048828, "global_step": 131369, "epoch": 1085} {"train_loss": -40.711612701416016, "global_step": 131370, "epoch": 1085} {"train_loss": -40.22233963012695, "global_step": 131371, "epoch": 1085} {"train_loss": -40.7102165222168, "global_step": 131372, "epoch": 1085} {"train_loss": -40.70009994506836, "global_step": 131373, "epoch": 1085} {"train_loss": -40.27152633666992, "global_step": 131374, "epoch": 1085} {"train_loss": -40.22260284423828, "global_step": 131375, "epoch": 1085} {"train_loss": -40.98322677612305, "global_step": 131376, "epoch": 1085} {"train_loss": -40.54370880126953, "global_step": 131377, "epoch": 1085} {"train_loss": -39.79575729370117, "global_step": 131378, "epoch": 1085} {"train_loss": -39.4871940612793, "global_step": 131379, "epoch": 1085} {"train_loss": -40.59395217895508, "global_step": 131380, "epoch": 1085} {"train_loss": -40.2956657409668, "global_step": 131381, "epoch": 1085} {"train_loss": -40.355560302734375, "global_step": 131382, "epoch": 1085} {"train_loss": -40.46459197998047, "global_step": 131383, "epoch": 1085} {"train_loss": -40.14091110229492, "global_step": 131384, "epoch": 1085} {"train_loss": -39.99909210205078, "global_step": 131385, "epoch": 1085} {"train_loss": -40.51055908203125, "global_step": 131386, "epoch": 1085} {"train_loss": -40.55994415283203, "global_step": 131387, "epoch": 1085} {"train_loss": -40.53853988647461, "global_step": 131388, "epoch": 1085} {"train_loss": -40.01930618286133, "global_step": 131389, "epoch": 1085} {"train_loss": -40.42920684814453, "global_step": 131390, "epoch": 1085} {"train_loss": -40.79852294921875, "global_step": 131391, "epoch": 1085} {"train_loss": -40.64319610595703, "global_step": 131392, "epoch": 1085} {"train_loss": -39.96340560913086, "global_step": 131393, "epoch": 1085} {"train_loss": -38.40134811401367, "global_step": 131394, "epoch": 1085} {"train_loss": -39.46305465698242, "global_step": 131395, "epoch": 1085} {"train_loss": -38.51526641845703, "global_step": 131396, "epoch": 1085} {"train_loss": -37.501163482666016, "global_step": 131397, "epoch": 1085} {"train_loss": -37.05992889404297, "global_step": 131398, "epoch": 1085} {"train_loss": -38.67264175415039, "global_step": 131399, "epoch": 1085} {"train_loss": -39.7161979675293, "global_step": 131400, "epoch": 1085} {"train_loss": -36.88336944580078, "global_step": 131401, "epoch": 1085} {"train_loss": -34.850555419921875, "global_step": 131402, "epoch": 1085} {"train_loss": -31.980030059814453, "global_step": 131403, "epoch": 1085} {"train_loss": -28.45928955078125, "global_step": 131404, "epoch": 1085} {"train_loss": -39.24637413024902, "global_step": 131405, "epoch": 1085, "val_loss": 2578869.25} {"train_loss": -37.631465911865234, "global_step": 131406, "epoch": 1086} {"train_loss": -31.8265380859375, "global_step": 131407, "epoch": 1086} {"train_loss": -37.85343551635742, "global_step": 131408, "epoch": 1086} {"train_loss": -35.67911911010742, "global_step": 131409, "epoch": 1086} {"train_loss": -35.5324821472168, "global_step": 131410, "epoch": 1086} {"train_loss": -37.8515739440918, "global_step": 131411, "epoch": 1086} {"train_loss": -37.39486312866211, "global_step": 131412, "epoch": 1086} {"train_loss": -36.609580993652344, "global_step": 131413, "epoch": 1086} {"train_loss": -38.224090576171875, "global_step": 131414, "epoch": 1086} {"train_loss": -37.72993850708008, "global_step": 131415, "epoch": 1086} {"train_loss": -35.962059020996094, "global_step": 131416, "epoch": 1086} {"train_loss": -38.69480514526367, "global_step": 131417, "epoch": 1086} {"train_loss": -37.14771270751953, "global_step": 131418, "epoch": 1086} {"train_loss": -37.540931701660156, "global_step": 131419, "epoch": 1086} {"train_loss": -39.10223388671875, "global_step": 131420, "epoch": 1086} {"train_loss": -38.54940414428711, "global_step": 131421, "epoch": 1086} {"train_loss": -37.77561569213867, "global_step": 131422, "epoch": 1086} {"train_loss": -38.86774826049805, "global_step": 131423, "epoch": 1086} {"train_loss": -38.464786529541016, "global_step": 131424, "epoch": 1086} {"train_loss": -38.89198684692383, "global_step": 131425, "epoch": 1086} {"train_loss": -39.13378143310547, "global_step": 131426, "epoch": 1086} {"train_loss": -38.664852142333984, "global_step": 131427, "epoch": 1086} {"train_loss": -39.72671890258789, "global_step": 131428, "epoch": 1086} {"train_loss": -38.805423736572266, "global_step": 131429, "epoch": 1086} {"train_loss": -39.68844223022461, "global_step": 131430, "epoch": 1086} {"train_loss": -39.50642776489258, "global_step": 131431, "epoch": 1086} {"train_loss": -39.3646354675293, "global_step": 131432, "epoch": 1086} {"train_loss": -39.79800796508789, "global_step": 131433, "epoch": 1086} {"train_loss": -39.915828704833984, "global_step": 131434, "epoch": 1086} {"train_loss": -40.18719482421875, "global_step": 131435, "epoch": 1086} {"train_loss": -39.861915588378906, "global_step": 131436, "epoch": 1086} {"train_loss": -39.84150314331055, "global_step": 131437, "epoch": 1086} {"train_loss": -39.7766227722168, "global_step": 131438, "epoch": 1086} {"train_loss": -39.84615707397461, "global_step": 131439, "epoch": 1086} {"train_loss": -40.29034423828125, "global_step": 131440, "epoch": 1086} {"train_loss": -39.41146469116211, "global_step": 131441, "epoch": 1086} {"train_loss": -39.0854377746582, "global_step": 131442, "epoch": 1086} {"train_loss": -40.203636169433594, "global_step": 131443, "epoch": 1086} {"train_loss": -39.38765335083008, "global_step": 131444, "epoch": 1086} {"train_loss": -39.7398681640625, "global_step": 131445, "epoch": 1086} {"train_loss": -40.40550231933594, "global_step": 131446, "epoch": 1086} {"train_loss": -39.779945373535156, "global_step": 131447, "epoch": 1086} {"train_loss": -40.28504180908203, "global_step": 131448, "epoch": 1086} {"train_loss": -40.018218994140625, "global_step": 131449, "epoch": 1086} {"train_loss": -40.29224395751953, "global_step": 131450, "epoch": 1086} {"train_loss": -40.05463790893555, "global_step": 131451, "epoch": 1086} {"train_loss": -40.59572982788086, "global_step": 131452, "epoch": 1086} {"train_loss": -40.37850570678711, "global_step": 131453, "epoch": 1086} {"train_loss": -40.327999114990234, "global_step": 131454, "epoch": 1086} {"train_loss": -40.36860275268555, "global_step": 131455, "epoch": 1086} {"train_loss": -40.15944290161133, "global_step": 131456, "epoch": 1086} {"train_loss": -40.033931732177734, "global_step": 131457, "epoch": 1086} {"train_loss": -40.537200927734375, "global_step": 131458, "epoch": 1086} {"train_loss": -40.55647277832031, "global_step": 131459, "epoch": 1086} {"train_loss": -40.46381759643555, "global_step": 131460, "epoch": 1086} {"train_loss": -40.60686111450195, "global_step": 131461, "epoch": 1086} {"train_loss": -40.06825256347656, "global_step": 131462, "epoch": 1086} {"train_loss": -40.48841094970703, "global_step": 131463, "epoch": 1086} {"train_loss": -40.71688461303711, "global_step": 131464, "epoch": 1086} {"train_loss": -40.156288146972656, "global_step": 131465, "epoch": 1086} {"train_loss": -40.06612777709961, "global_step": 131466, "epoch": 1086} {"train_loss": -40.272926330566406, "global_step": 131467, "epoch": 1086} {"train_loss": -40.952999114990234, "global_step": 131468, "epoch": 1086} {"train_loss": -40.31863021850586, "global_step": 131469, "epoch": 1086} {"train_loss": -40.43442916870117, "global_step": 131470, "epoch": 1086} {"train_loss": -40.8077507019043, "global_step": 131471, "epoch": 1086} {"train_loss": -41.018672943115234, "global_step": 131472, "epoch": 1086} {"train_loss": -40.994720458984375, "global_step": 131473, "epoch": 1086} {"train_loss": -40.830501556396484, "global_step": 131474, "epoch": 1086} {"train_loss": -40.846336364746094, "global_step": 131475, "epoch": 1086} {"train_loss": -40.47114181518555, "global_step": 131476, "epoch": 1086} {"train_loss": -40.635372161865234, "global_step": 131477, "epoch": 1086} {"train_loss": -40.38019561767578, "global_step": 131478, "epoch": 1086} {"train_loss": -40.80424118041992, "global_step": 131479, "epoch": 1086} {"train_loss": -41.21381759643555, "global_step": 131480, "epoch": 1086} {"train_loss": -41.107032775878906, "global_step": 131481, "epoch": 1086} {"train_loss": -40.69569778442383, "global_step": 131482, "epoch": 1086} {"train_loss": -40.47462844848633, "global_step": 131483, "epoch": 1086} {"train_loss": -40.74834060668945, "global_step": 131484, "epoch": 1086} {"train_loss": -41.031288146972656, "global_step": 131485, "epoch": 1086} {"train_loss": -40.277809143066406, "global_step": 131486, "epoch": 1086} {"train_loss": -40.78156661987305, "global_step": 131487, "epoch": 1086} {"train_loss": -40.88304138183594, "global_step": 131488, "epoch": 1086} {"train_loss": -41.00000762939453, "global_step": 131489, "epoch": 1086} {"train_loss": -41.0134391784668, "global_step": 131490, "epoch": 1086} {"train_loss": -40.312904357910156, "global_step": 131491, "epoch": 1086} {"train_loss": -40.73592758178711, "global_step": 131492, "epoch": 1086} {"train_loss": -41.073421478271484, "global_step": 131493, "epoch": 1086} {"train_loss": -40.479610443115234, "global_step": 131494, "epoch": 1086} {"train_loss": -39.639583587646484, "global_step": 131495, "epoch": 1086} {"train_loss": -39.229061126708984, "global_step": 131496, "epoch": 1086} {"train_loss": -38.12641906738281, "global_step": 131497, "epoch": 1086} {"train_loss": -37.495052337646484, "global_step": 131498, "epoch": 1086} {"train_loss": -36.22761154174805, "global_step": 131499, "epoch": 1086} {"train_loss": -37.2749137878418, "global_step": 131500, "epoch": 1086} {"train_loss": -37.85569381713867, "global_step": 131501, "epoch": 1086} {"train_loss": -38.44340896606445, "global_step": 131502, "epoch": 1086} {"train_loss": -40.55657958984375, "global_step": 131503, "epoch": 1086} {"train_loss": -39.22879409790039, "global_step": 131504, "epoch": 1086} {"train_loss": -38.52680587768555, "global_step": 131505, "epoch": 1086} {"train_loss": -39.351558685302734, "global_step": 131506, "epoch": 1086} {"train_loss": -39.64265823364258, "global_step": 131507, "epoch": 1086} {"train_loss": -37.455257415771484, "global_step": 131508, "epoch": 1086} {"train_loss": -37.94179153442383, "global_step": 131509, "epoch": 1086} {"train_loss": -38.83583450317383, "global_step": 131510, "epoch": 1086} {"train_loss": -36.34536361694336, "global_step": 131511, "epoch": 1086} {"train_loss": -37.63542175292969, "global_step": 131512, "epoch": 1086} {"train_loss": -37.87956237792969, "global_step": 131513, "epoch": 1086} {"train_loss": -35.662837982177734, "global_step": 131514, "epoch": 1086} {"train_loss": -38.9673957824707, "global_step": 131515, "epoch": 1086} {"train_loss": -38.708892822265625, "global_step": 131516, "epoch": 1086} {"train_loss": -37.98344421386719, "global_step": 131517, "epoch": 1086} {"train_loss": -39.85498809814453, "global_step": 131518, "epoch": 1086} {"train_loss": -39.73798370361328, "global_step": 131519, "epoch": 1086} {"train_loss": -38.104488372802734, "global_step": 131520, "epoch": 1086} {"train_loss": -37.78909683227539, "global_step": 131521, "epoch": 1086} {"train_loss": -40.21832275390625, "global_step": 131522, "epoch": 1086} {"train_loss": -38.32667541503906, "global_step": 131523, "epoch": 1086} {"train_loss": -38.16388702392578, "global_step": 131524, "epoch": 1086} {"train_loss": -39.247528076171875, "global_step": 131525, "epoch": 1086} {"train_loss": -39.299817235016626, "global_step": 131526, "epoch": 1086, "val_loss": 2622004.75} {"train_loss": -38.16849899291992, "global_step": 131527, "epoch": 1087} {"train_loss": -39.051692962646484, "global_step": 131528, "epoch": 1087} {"train_loss": -39.53986740112305, "global_step": 131529, "epoch": 1087} {"train_loss": -39.73347854614258, "global_step": 131530, "epoch": 1087} {"train_loss": -39.04494094848633, "global_step": 131531, "epoch": 1087} {"train_loss": -39.03565216064453, "global_step": 131532, "epoch": 1087} {"train_loss": -39.81312942504883, "global_step": 131533, "epoch": 1087} {"train_loss": -37.23889923095703, "global_step": 131534, "epoch": 1087} {"train_loss": -38.433589935302734, "global_step": 131535, "epoch": 1087} {"train_loss": -39.857269287109375, "global_step": 131536, "epoch": 1087} {"train_loss": -38.304779052734375, "global_step": 131537, "epoch": 1087} {"train_loss": -39.145233154296875, "global_step": 131538, "epoch": 1087} {"train_loss": -38.89590072631836, "global_step": 131539, "epoch": 1087} {"train_loss": -39.7378044128418, "global_step": 131540, "epoch": 1087} {"train_loss": -39.4480094909668, "global_step": 131541, "epoch": 1087} {"train_loss": -38.857666015625, "global_step": 131542, "epoch": 1087} {"train_loss": -39.57430648803711, "global_step": 131543, "epoch": 1087} {"train_loss": -39.05215072631836, "global_step": 131544, "epoch": 1087} {"train_loss": -38.378875732421875, "global_step": 131545, "epoch": 1087} {"train_loss": -39.09613037109375, "global_step": 131546, "epoch": 1087} {"train_loss": -38.904502868652344, "global_step": 131547, "epoch": 1087} {"train_loss": -37.380828857421875, "global_step": 131548, "epoch": 1087} {"train_loss": -37.53417205810547, "global_step": 131549, "epoch": 1087} {"train_loss": -38.3296012878418, "global_step": 131550, "epoch": 1087} {"train_loss": -38.641441345214844, "global_step": 131551, "epoch": 1087} {"train_loss": -39.45874786376953, "global_step": 131552, "epoch": 1087} {"train_loss": -39.6748046875, "global_step": 131553, "epoch": 1087} {"train_loss": -39.47929382324219, "global_step": 131554, "epoch": 1087} {"train_loss": -39.270965576171875, "global_step": 131555, "epoch": 1087} {"train_loss": -39.02134704589844, "global_step": 131556, "epoch": 1087} {"train_loss": -39.27235794067383, "global_step": 131557, "epoch": 1087} {"train_loss": -36.90007781982422, "global_step": 131558, "epoch": 1087} {"train_loss": -39.743751525878906, "global_step": 131559, "epoch": 1087} {"train_loss": -39.612579345703125, "global_step": 131560, "epoch": 1087} {"train_loss": -38.563995361328125, "global_step": 131561, "epoch": 1087} {"train_loss": -39.51627731323242, "global_step": 131562, "epoch": 1087} {"train_loss": -39.8226432800293, "global_step": 131563, "epoch": 1087} {"train_loss": -37.89230728149414, "global_step": 131564, "epoch": 1087} {"train_loss": -39.576412200927734, "global_step": 131565, "epoch": 1087} {"train_loss": -39.31436538696289, "global_step": 131566, "epoch": 1087} {"train_loss": -39.1796875, "global_step": 131567, "epoch": 1087} {"train_loss": -39.912872314453125, "global_step": 131568, "epoch": 1087} {"train_loss": -39.84294128417969, "global_step": 131569, "epoch": 1087} {"train_loss": -39.57155990600586, "global_step": 131570, "epoch": 1087} {"train_loss": -40.04979705810547, "global_step": 131571, "epoch": 1087} {"train_loss": -39.513587951660156, "global_step": 131572, "epoch": 1087} {"train_loss": -40.110103607177734, "global_step": 131573, "epoch": 1087} {"train_loss": -39.80438995361328, "global_step": 131574, "epoch": 1087} {"train_loss": -40.31325149536133, "global_step": 131575, "epoch": 1087} {"train_loss": -40.3246955871582, "global_step": 131576, "epoch": 1087} {"train_loss": -40.41061019897461, "global_step": 131577, "epoch": 1087} {"train_loss": -39.9893798828125, "global_step": 131578, "epoch": 1087} {"train_loss": -40.30669021606445, "global_step": 131579, "epoch": 1087} {"train_loss": -38.92298126220703, "global_step": 131580, "epoch": 1087} {"train_loss": -39.72260284423828, "global_step": 131581, "epoch": 1087} {"train_loss": -40.35880661010742, "global_step": 131582, "epoch": 1087} {"train_loss": -40.11029052734375, "global_step": 131583, "epoch": 1087} {"train_loss": -40.74620056152344, "global_step": 131584, "epoch": 1087} {"train_loss": -39.9712028503418, "global_step": 131585, "epoch": 1087} {"train_loss": -40.29811477661133, "global_step": 131586, "epoch": 1087} {"train_loss": -40.118812561035156, "global_step": 131587, "epoch": 1087} {"train_loss": -40.46137619018555, "global_step": 131588, "epoch": 1087} {"train_loss": -40.60016632080078, "global_step": 131589, "epoch": 1087} {"train_loss": -40.3589973449707, "global_step": 131590, "epoch": 1087} {"train_loss": -40.28542709350586, "global_step": 131591, "epoch": 1087} {"train_loss": -40.295406341552734, "global_step": 131592, "epoch": 1087} {"train_loss": -40.70726776123047, "global_step": 131593, "epoch": 1087} {"train_loss": -40.43231964111328, "global_step": 131594, "epoch": 1087} {"train_loss": -38.18184280395508, "global_step": 131595, "epoch": 1087} {"train_loss": -40.37105178833008, "global_step": 131596, "epoch": 1087} {"train_loss": -40.3658561706543, "global_step": 131597, "epoch": 1087} {"train_loss": -40.9410400390625, "global_step": 131598, "epoch": 1087} {"train_loss": -38.029972076416016, "global_step": 131599, "epoch": 1087} {"train_loss": -40.6370849609375, "global_step": 131600, "epoch": 1087} {"train_loss": -40.4485969543457, "global_step": 131601, "epoch": 1087} {"train_loss": -40.36273956298828, "global_step": 131602, "epoch": 1087} {"train_loss": -36.211299896240234, "global_step": 131603, "epoch": 1087} {"train_loss": -38.99419021606445, "global_step": 131604, "epoch": 1087} {"train_loss": -40.08651351928711, "global_step": 131605, "epoch": 1087} {"train_loss": -40.76959228515625, "global_step": 131606, "epoch": 1087} {"train_loss": -39.515602111816406, "global_step": 131607, "epoch": 1087} {"train_loss": -40.45653533935547, "global_step": 131608, "epoch": 1087} {"train_loss": -40.631256103515625, "global_step": 131609, "epoch": 1087} {"train_loss": -40.41965866088867, "global_step": 131610, "epoch": 1087} {"train_loss": -40.335323333740234, "global_step": 131611, "epoch": 1087} {"train_loss": -40.46027374267578, "global_step": 131612, "epoch": 1087} {"train_loss": -41.018653869628906, "global_step": 131613, "epoch": 1087} {"train_loss": -40.537506103515625, "global_step": 131614, "epoch": 1087} {"train_loss": -41.11574935913086, "global_step": 131615, "epoch": 1087} {"train_loss": -40.5691032409668, "global_step": 131616, "epoch": 1087} {"train_loss": -40.38509750366211, "global_step": 131617, "epoch": 1087} {"train_loss": -40.708091735839844, "global_step": 131618, "epoch": 1087} {"train_loss": -40.52724075317383, "global_step": 131619, "epoch": 1087} {"train_loss": -39.4765510559082, "global_step": 131620, "epoch": 1087} {"train_loss": -40.572566986083984, "global_step": 131621, "epoch": 1087} {"train_loss": -40.8424186706543, "global_step": 131622, "epoch": 1087} {"train_loss": -40.65940475463867, "global_step": 131623, "epoch": 1087} {"train_loss": -41.03371047973633, "global_step": 131624, "epoch": 1087} {"train_loss": -40.8128662109375, "global_step": 131625, "epoch": 1087} {"train_loss": -39.80080795288086, "global_step": 131626, "epoch": 1087} {"train_loss": -40.67754364013672, "global_step": 131627, "epoch": 1087} {"train_loss": -41.03776168823242, "global_step": 131628, "epoch": 1087} {"train_loss": -39.94842529296875, "global_step": 131629, "epoch": 1087} {"train_loss": -40.826072692871094, "global_step": 131630, "epoch": 1087} {"train_loss": -40.82380676269531, "global_step": 131631, "epoch": 1087} {"train_loss": -40.60432052612305, "global_step": 131632, "epoch": 1087} {"train_loss": -36.301170349121094, "global_step": 131633, "epoch": 1087} {"train_loss": -40.841548919677734, "global_step": 131634, "epoch": 1087} {"train_loss": -40.050575256347656, "global_step": 131635, "epoch": 1087} {"train_loss": -39.65894317626953, "global_step": 131636, "epoch": 1087} {"train_loss": -36.654598236083984, "global_step": 131637, "epoch": 1087} {"train_loss": -34.45731735229492, "global_step": 131638, "epoch": 1087} {"train_loss": -37.429134368896484, "global_step": 131639, "epoch": 1087} {"train_loss": -39.858421325683594, "global_step": 131640, "epoch": 1087} {"train_loss": -39.913516998291016, "global_step": 131641, "epoch": 1087} {"train_loss": -39.61335372924805, "global_step": 131642, "epoch": 1087} {"train_loss": -37.659603118896484, "global_step": 131643, "epoch": 1087} {"train_loss": -39.36967849731445, "global_step": 131644, "epoch": 1087} {"train_loss": -39.896385192871094, "global_step": 131645, "epoch": 1087} {"train_loss": -40.041900634765625, "global_step": 131646, "epoch": 1087} {"train_loss": -39.59606444934183, "global_step": 131647, "epoch": 1087, "val_loss": 2603690.75} {"train_loss": -39.63132858276367, "global_step": 131648, "epoch": 1088} {"train_loss": -40.5504035949707, "global_step": 131649, "epoch": 1088} {"train_loss": -39.89680099487305, "global_step": 131650, "epoch": 1088} {"train_loss": -39.24685287475586, "global_step": 131651, "epoch": 1088} {"train_loss": -40.579124450683594, "global_step": 131652, "epoch": 1088} {"train_loss": -39.56380844116211, "global_step": 131653, "epoch": 1088} {"train_loss": -40.62367630004883, "global_step": 131654, "epoch": 1088} {"train_loss": -39.32157516479492, "global_step": 131655, "epoch": 1088} {"train_loss": -39.835174560546875, "global_step": 131656, "epoch": 1088} {"train_loss": -39.879573822021484, "global_step": 131657, "epoch": 1088} {"train_loss": -39.643394470214844, "global_step": 131658, "epoch": 1088} {"train_loss": -40.15595626831055, "global_step": 131659, "epoch": 1088} {"train_loss": -40.21787643432617, "global_step": 131660, "epoch": 1088} {"train_loss": -40.0748291015625, "global_step": 131661, "epoch": 1088} {"train_loss": -38.37928771972656, "global_step": 131662, "epoch": 1088} {"train_loss": -40.123409271240234, "global_step": 131663, "epoch": 1088} {"train_loss": -40.127349853515625, "global_step": 131664, "epoch": 1088} {"train_loss": -39.31729507446289, "global_step": 131665, "epoch": 1088} {"train_loss": -40.763893127441406, "global_step": 131666, "epoch": 1088} {"train_loss": -40.32590103149414, "global_step": 131667, "epoch": 1088} {"train_loss": -39.68906784057617, "global_step": 131668, "epoch": 1088} {"train_loss": -40.77020263671875, "global_step": 131669, "epoch": 1088} {"train_loss": -40.42722702026367, "global_step": 131670, "epoch": 1088} {"train_loss": -39.32130813598633, "global_step": 131671, "epoch": 1088} {"train_loss": -39.97310256958008, "global_step": 131672, "epoch": 1088} {"train_loss": -40.39912033081055, "global_step": 131673, "epoch": 1088} {"train_loss": -40.07948303222656, "global_step": 131674, "epoch": 1088} {"train_loss": -40.29433059692383, "global_step": 131675, "epoch": 1088} {"train_loss": -35.605648040771484, "global_step": 131676, "epoch": 1088} {"train_loss": -38.808048248291016, "global_step": 131677, "epoch": 1088} {"train_loss": -38.507598876953125, "global_step": 131678, "epoch": 1088} {"train_loss": -37.33866500854492, "global_step": 131679, "epoch": 1088} {"train_loss": -37.3011589050293, "global_step": 131680, "epoch": 1088} {"train_loss": -35.12252426147461, "global_step": 131681, "epoch": 1088} {"train_loss": -39.46816635131836, "global_step": 131682, "epoch": 1088} {"train_loss": -36.2468376159668, "global_step": 131683, "epoch": 1088} {"train_loss": -35.71809768676758, "global_step": 131684, "epoch": 1088} {"train_loss": -37.549442291259766, "global_step": 131685, "epoch": 1088} {"train_loss": -38.269161224365234, "global_step": 131686, "epoch": 1088} {"train_loss": -37.5605583190918, "global_step": 131687, "epoch": 1088} {"train_loss": -38.17195129394531, "global_step": 131688, "epoch": 1088} {"train_loss": -34.806190490722656, "global_step": 131689, "epoch": 1088} {"train_loss": -36.75374221801758, "global_step": 131690, "epoch": 1088} {"train_loss": -37.85053253173828, "global_step": 131691, "epoch": 1088} {"train_loss": -34.728572845458984, "global_step": 131692, "epoch": 1088} {"train_loss": -37.82465744018555, "global_step": 131693, "epoch": 1088} {"train_loss": -34.65877914428711, "global_step": 131694, "epoch": 1088} {"train_loss": -38.44655227661133, "global_step": 131695, "epoch": 1088} {"train_loss": -37.402408599853516, "global_step": 131696, "epoch": 1088} {"train_loss": -36.65754699707031, "global_step": 131697, "epoch": 1088} {"train_loss": -37.11764144897461, "global_step": 131698, "epoch": 1088} {"train_loss": -37.647029876708984, "global_step": 131699, "epoch": 1088} {"train_loss": -35.04903030395508, "global_step": 131700, "epoch": 1088} {"train_loss": -37.45283126831055, "global_step": 131701, "epoch": 1088} {"train_loss": -37.013057708740234, "global_step": 131702, "epoch": 1088} {"train_loss": -38.499229431152344, "global_step": 131703, "epoch": 1088} {"train_loss": -38.09387969970703, "global_step": 131704, "epoch": 1088} {"train_loss": -37.926326751708984, "global_step": 131705, "epoch": 1088} {"train_loss": -36.390464782714844, "global_step": 131706, "epoch": 1088} {"train_loss": -36.785850524902344, "global_step": 131707, "epoch": 1088} {"train_loss": -38.81355667114258, "global_step": 131708, "epoch": 1088} {"train_loss": -37.18093490600586, "global_step": 131709, "epoch": 1088} {"train_loss": -37.553672790527344, "global_step": 131710, "epoch": 1088} {"train_loss": -36.64654541015625, "global_step": 131711, "epoch": 1088} {"train_loss": -39.028621673583984, "global_step": 131712, "epoch": 1088} {"train_loss": -39.25544357299805, "global_step": 131713, "epoch": 1088} {"train_loss": -37.639984130859375, "global_step": 131714, "epoch": 1088} {"train_loss": -38.393463134765625, "global_step": 131715, "epoch": 1088} {"train_loss": -37.88701248168945, "global_step": 131716, "epoch": 1088} {"train_loss": -39.51995849609375, "global_step": 131717, "epoch": 1088} {"train_loss": -38.728572845458984, "global_step": 131718, "epoch": 1088} {"train_loss": -38.94610595703125, "global_step": 131719, "epoch": 1088} {"train_loss": -37.51457214355469, "global_step": 131720, "epoch": 1088} {"train_loss": -37.0450439453125, "global_step": 131721, "epoch": 1088} {"train_loss": -38.99092483520508, "global_step": 131722, "epoch": 1088} {"train_loss": -38.69062042236328, "global_step": 131723, "epoch": 1088} {"train_loss": -39.33614730834961, "global_step": 131724, "epoch": 1088} {"train_loss": -39.80205154418945, "global_step": 131725, "epoch": 1088} {"train_loss": -39.304073333740234, "global_step": 131726, "epoch": 1088} {"train_loss": -39.50703048706055, "global_step": 131727, "epoch": 1088} {"train_loss": -39.57840347290039, "global_step": 131728, "epoch": 1088} {"train_loss": -39.3281135559082, "global_step": 131729, "epoch": 1088} {"train_loss": -39.35819625854492, "global_step": 131730, "epoch": 1088} {"train_loss": -39.31744384765625, "global_step": 131731, "epoch": 1088} {"train_loss": -38.91892623901367, "global_step": 131732, "epoch": 1088} {"train_loss": -40.01951217651367, "global_step": 131733, "epoch": 1088} {"train_loss": -38.90716552734375, "global_step": 131734, "epoch": 1088} {"train_loss": -39.663997650146484, "global_step": 131735, "epoch": 1088} {"train_loss": -38.85969924926758, "global_step": 131736, "epoch": 1088} {"train_loss": -39.236053466796875, "global_step": 131737, "epoch": 1088} {"train_loss": -39.83576965332031, "global_step": 131738, "epoch": 1088} {"train_loss": -39.179534912109375, "global_step": 131739, "epoch": 1088} {"train_loss": -39.752925872802734, "global_step": 131740, "epoch": 1088} {"train_loss": -39.11319351196289, "global_step": 131741, "epoch": 1088} {"train_loss": -39.46453857421875, "global_step": 131742, "epoch": 1088} {"train_loss": -40.016578674316406, "global_step": 131743, "epoch": 1088} {"train_loss": -39.21195602416992, "global_step": 131744, "epoch": 1088} {"train_loss": -39.98029708862305, "global_step": 131745, "epoch": 1088} {"train_loss": -39.22504425048828, "global_step": 131746, "epoch": 1088} {"train_loss": -39.04469299316406, "global_step": 131747, "epoch": 1088} {"train_loss": -39.0643310546875, "global_step": 131748, "epoch": 1088} {"train_loss": -39.59257888793945, "global_step": 131749, "epoch": 1088} {"train_loss": -39.94779968261719, "global_step": 131750, "epoch": 1088} {"train_loss": -39.68062973022461, "global_step": 131751, "epoch": 1088} {"train_loss": -40.29322814941406, "global_step": 131752, "epoch": 1088} {"train_loss": -39.09880447387695, "global_step": 131753, "epoch": 1088} {"train_loss": -39.900978088378906, "global_step": 131754, "epoch": 1088} {"train_loss": -40.04819869995117, "global_step": 131755, "epoch": 1088} {"train_loss": -39.82210922241211, "global_step": 131756, "epoch": 1088} {"train_loss": -40.1964111328125, "global_step": 131757, "epoch": 1088} {"train_loss": -40.130165100097656, "global_step": 131758, "epoch": 1088} {"train_loss": -39.91394805908203, "global_step": 131759, "epoch": 1088} {"train_loss": -40.276649475097656, "global_step": 131760, "epoch": 1088} {"train_loss": -40.64463806152344, "global_step": 131761, "epoch": 1088} {"train_loss": -40.083980560302734, "global_step": 131762, "epoch": 1088} {"train_loss": -39.66279220581055, "global_step": 131763, "epoch": 1088} {"train_loss": -39.80427932739258, "global_step": 131764, "epoch": 1088} {"train_loss": -40.40220260620117, "global_step": 131765, "epoch": 1088} {"train_loss": -40.38497543334961, "global_step": 131766, "epoch": 1088} {"train_loss": -40.489009857177734, "global_step": 131767, "epoch": 1088} {"train_loss": -38.87389982239274, "global_step": 131768, "epoch": 1088, "val_loss": 2586342.0} {"train_loss": -40.4613151550293, "global_step": 131769, "epoch": 1089} {"train_loss": -40.15790557861328, "global_step": 131770, "epoch": 1089} {"train_loss": -40.46802520751953, "global_step": 131771, "epoch": 1089} {"train_loss": -40.704933166503906, "global_step": 131772, "epoch": 1089} {"train_loss": -40.59851837158203, "global_step": 131773, "epoch": 1089} {"train_loss": -40.382293701171875, "global_step": 131774, "epoch": 1089} {"train_loss": -40.83552169799805, "global_step": 131775, "epoch": 1089} {"train_loss": -40.0406379699707, "global_step": 131776, "epoch": 1089} {"train_loss": -40.42694091796875, "global_step": 131777, "epoch": 1089} {"train_loss": -40.869300842285156, "global_step": 131778, "epoch": 1089} {"train_loss": -40.460811614990234, "global_step": 131779, "epoch": 1089} {"train_loss": -39.066017150878906, "global_step": 131780, "epoch": 1089} {"train_loss": -40.419429779052734, "global_step": 131781, "epoch": 1089} {"train_loss": -40.64107894897461, "global_step": 131782, "epoch": 1089} {"train_loss": -40.77178192138672, "global_step": 131783, "epoch": 1089} {"train_loss": -40.68149948120117, "global_step": 131784, "epoch": 1089} {"train_loss": -41.07419967651367, "global_step": 131785, "epoch": 1089} {"train_loss": -41.22148132324219, "global_step": 131786, "epoch": 1089} {"train_loss": -40.77456283569336, "global_step": 131787, "epoch": 1089} {"train_loss": -40.702999114990234, "global_step": 131788, "epoch": 1089} {"train_loss": -40.53767013549805, "global_step": 131789, "epoch": 1089} {"train_loss": -40.680999755859375, "global_step": 131790, "epoch": 1089} {"train_loss": -40.926910400390625, "global_step": 131791, "epoch": 1089} {"train_loss": -40.55364990234375, "global_step": 131792, "epoch": 1089} {"train_loss": -40.7005729675293, "global_step": 131793, "epoch": 1089} {"train_loss": -40.42972946166992, "global_step": 131794, "epoch": 1089} {"train_loss": -39.6324462890625, "global_step": 131795, "epoch": 1089} {"train_loss": -38.76224136352539, "global_step": 131796, "epoch": 1089} {"train_loss": -39.4554557800293, "global_step": 131797, "epoch": 1089} {"train_loss": -40.1524772644043, "global_step": 131798, "epoch": 1089} {"train_loss": -40.66541290283203, "global_step": 131799, "epoch": 1089} {"train_loss": -39.72203063964844, "global_step": 131800, "epoch": 1089} {"train_loss": -39.25310134887695, "global_step": 131801, "epoch": 1089} {"train_loss": -38.884212493896484, "global_step": 131802, "epoch": 1089} {"train_loss": -39.31986618041992, "global_step": 131803, "epoch": 1089} {"train_loss": -39.64143753051758, "global_step": 131804, "epoch": 1089} {"train_loss": -40.593814849853516, "global_step": 131805, "epoch": 1089} {"train_loss": -40.233192443847656, "global_step": 131806, "epoch": 1089} {"train_loss": -39.38418197631836, "global_step": 131807, "epoch": 1089} {"train_loss": -39.70746612548828, "global_step": 131808, "epoch": 1089} {"train_loss": -39.861419677734375, "global_step": 131809, "epoch": 1089} {"train_loss": -40.20345687866211, "global_step": 131810, "epoch": 1089} {"train_loss": -37.9411506652832, "global_step": 131811, "epoch": 1089} {"train_loss": -36.92751693725586, "global_step": 131812, "epoch": 1089} {"train_loss": -36.39426803588867, "global_step": 131813, "epoch": 1089} {"train_loss": -37.03118133544922, "global_step": 131814, "epoch": 1089} {"train_loss": -36.99997329711914, "global_step": 131815, "epoch": 1089} {"train_loss": -36.639617919921875, "global_step": 131816, "epoch": 1089} {"train_loss": -37.55891036987305, "global_step": 131817, "epoch": 1089} {"train_loss": -38.688446044921875, "global_step": 131818, "epoch": 1089} {"train_loss": -37.519588470458984, "global_step": 131819, "epoch": 1089} {"train_loss": -39.840755462646484, "global_step": 131820, "epoch": 1089} {"train_loss": -38.76789474487305, "global_step": 131821, "epoch": 1089} {"train_loss": -36.95654296875, "global_step": 131822, "epoch": 1089} {"train_loss": -36.881587982177734, "global_step": 131823, "epoch": 1089} {"train_loss": -40.4364013671875, "global_step": 131824, "epoch": 1089} {"train_loss": -38.936370849609375, "global_step": 131825, "epoch": 1089} {"train_loss": -37.00797653198242, "global_step": 131826, "epoch": 1089} {"train_loss": -39.11692428588867, "global_step": 131827, "epoch": 1089} {"train_loss": -39.7768440246582, "global_step": 131828, "epoch": 1089} {"train_loss": -39.4127082824707, "global_step": 131829, "epoch": 1089} {"train_loss": -40.341644287109375, "global_step": 131830, "epoch": 1089} {"train_loss": -39.88667297363281, "global_step": 131831, "epoch": 1089} {"train_loss": -40.12868881225586, "global_step": 131832, "epoch": 1089} {"train_loss": -39.64271926879883, "global_step": 131833, "epoch": 1089} {"train_loss": -39.595855712890625, "global_step": 131834, "epoch": 1089} {"train_loss": -37.452880859375, "global_step": 131835, "epoch": 1089} {"train_loss": -39.9714469909668, "global_step": 131836, "epoch": 1089} {"train_loss": -38.791194915771484, "global_step": 131837, "epoch": 1089} {"train_loss": -39.08088302612305, "global_step": 131838, "epoch": 1089} {"train_loss": -39.75608825683594, "global_step": 131839, "epoch": 1089} {"train_loss": -38.82686233520508, "global_step": 131840, "epoch": 1089} {"train_loss": -39.24711990356445, "global_step": 131841, "epoch": 1089} {"train_loss": -39.90271759033203, "global_step": 131842, "epoch": 1089} {"train_loss": -34.9354133605957, "global_step": 131843, "epoch": 1089} {"train_loss": -39.93507766723633, "global_step": 131844, "epoch": 1089} {"train_loss": -39.27693557739258, "global_step": 131845, "epoch": 1089} {"train_loss": -40.2487907409668, "global_step": 131846, "epoch": 1089} {"train_loss": -39.820533752441406, "global_step": 131847, "epoch": 1089} {"train_loss": -39.907806396484375, "global_step": 131848, "epoch": 1089} {"train_loss": -39.8477783203125, "global_step": 131849, "epoch": 1089} {"train_loss": -39.916194915771484, "global_step": 131850, "epoch": 1089} {"train_loss": -39.0364990234375, "global_step": 131851, "epoch": 1089} {"train_loss": -39.65591812133789, "global_step": 131852, "epoch": 1089} {"train_loss": -39.994667053222656, "global_step": 131853, "epoch": 1089} {"train_loss": -39.07758331298828, "global_step": 131854, "epoch": 1089} {"train_loss": -40.445674896240234, "global_step": 131855, "epoch": 1089} {"train_loss": -40.31924057006836, "global_step": 131856, "epoch": 1089} {"train_loss": -38.31435775756836, "global_step": 131857, "epoch": 1089} {"train_loss": -39.967735290527344, "global_step": 131858, "epoch": 1089} {"train_loss": -40.00447463989258, "global_step": 131859, "epoch": 1089} {"train_loss": -40.12952423095703, "global_step": 131860, "epoch": 1089} {"train_loss": -39.49089431762695, "global_step": 131861, "epoch": 1089} {"train_loss": -40.395450592041016, "global_step": 131862, "epoch": 1089} {"train_loss": -39.559085845947266, "global_step": 131863, "epoch": 1089} {"train_loss": -38.967952728271484, "global_step": 131864, "epoch": 1089} {"train_loss": -35.9906005859375, "global_step": 131865, "epoch": 1089} {"train_loss": -39.52764892578125, "global_step": 131866, "epoch": 1089} {"train_loss": -39.53102493286133, "global_step": 131867, "epoch": 1089} {"train_loss": -40.343746185302734, "global_step": 131868, "epoch": 1089} {"train_loss": -40.17224884033203, "global_step": 131869, "epoch": 1089} {"train_loss": -40.32925033569336, "global_step": 131870, "epoch": 1089} {"train_loss": -40.34706497192383, "global_step": 131871, "epoch": 1089} {"train_loss": -40.05545425415039, "global_step": 131872, "epoch": 1089} {"train_loss": -39.71711349487305, "global_step": 131873, "epoch": 1089} {"train_loss": -39.801246643066406, "global_step": 131874, "epoch": 1089} {"train_loss": -39.697608947753906, "global_step": 131875, "epoch": 1089} {"train_loss": -39.67672348022461, "global_step": 131876, "epoch": 1089} {"train_loss": -39.2579345703125, "global_step": 131877, "epoch": 1089} {"train_loss": -38.928585052490234, "global_step": 131878, "epoch": 1089} {"train_loss": -40.25828552246094, "global_step": 131879, "epoch": 1089} {"train_loss": -39.95264434814453, "global_step": 131880, "epoch": 1089} {"train_loss": -38.59136962890625, "global_step": 131881, "epoch": 1089} {"train_loss": -39.76483917236328, "global_step": 131882, "epoch": 1089} {"train_loss": -39.38633346557617, "global_step": 131883, "epoch": 1089} {"train_loss": -40.240848541259766, "global_step": 131884, "epoch": 1089} {"train_loss": -36.77791213989258, "global_step": 131885, "epoch": 1089} {"train_loss": -39.7869987487793, "global_step": 131886, "epoch": 1089} {"train_loss": -39.221473693847656, "global_step": 131887, "epoch": 1089} {"train_loss": -35.749427795410156, "global_step": 131888, "epoch": 1089} {"train_loss": -39.41480794228798, "global_step": 131889, "epoch": 1089, "val_loss": 2617761.0} {"train_loss": -32.4752197265625, "global_step": 131890, "epoch": 1090} {"train_loss": -13.404231071472168, "global_step": 131891, "epoch": 1090} {"train_loss": -37.99311065673828, "global_step": 131892, "epoch": 1090} {"train_loss": -26.014856338500977, "global_step": 131893, "epoch": 1090} {"train_loss": -32.44731521606445, "global_step": 131894, "epoch": 1090} {"train_loss": -16.29495620727539, "global_step": 131895, "epoch": 1090} {"train_loss": -33.43754959106445, "global_step": 131896, "epoch": 1090} {"train_loss": -32.225921630859375, "global_step": 131897, "epoch": 1090} {"train_loss": -35.41046905517578, "global_step": 131898, "epoch": 1090} {"train_loss": -31.256826400756836, "global_step": 131899, "epoch": 1090} {"train_loss": -24.761962890625, "global_step": 131900, "epoch": 1090} {"train_loss": -31.799604415893555, "global_step": 131901, "epoch": 1090} {"train_loss": -34.647735595703125, "global_step": 131902, "epoch": 1090} {"train_loss": -31.75339698791504, "global_step": 131903, "epoch": 1090} {"train_loss": -30.913137435913086, "global_step": 131904, "epoch": 1090} {"train_loss": -30.780054092407227, "global_step": 131905, "epoch": 1090} {"train_loss": -32.53727340698242, "global_step": 131906, "epoch": 1090} {"train_loss": -30.039514541625977, "global_step": 131907, "epoch": 1090} {"train_loss": -31.650970458984375, "global_step": 131908, "epoch": 1090} {"train_loss": -32.7300910949707, "global_step": 131909, "epoch": 1090} {"train_loss": -34.645721435546875, "global_step": 131910, "epoch": 1090} {"train_loss": -34.0355339050293, "global_step": 131911, "epoch": 1090} {"train_loss": -35.31647872924805, "global_step": 131912, "epoch": 1090} {"train_loss": -34.899166107177734, "global_step": 131913, "epoch": 1090} {"train_loss": -35.725154876708984, "global_step": 131914, "epoch": 1090} {"train_loss": -34.5545539855957, "global_step": 131915, "epoch": 1090} {"train_loss": -35.80176544189453, "global_step": 131916, "epoch": 1090} {"train_loss": -34.88914108276367, "global_step": 131917, "epoch": 1090} {"train_loss": -32.8748893737793, "global_step": 131918, "epoch": 1090} {"train_loss": -35.457359313964844, "global_step": 131919, "epoch": 1090} {"train_loss": -35.68365478515625, "global_step": 131920, "epoch": 1090} {"train_loss": -35.063385009765625, "global_step": 131921, "epoch": 1090} {"train_loss": -33.9758186340332, "global_step": 131922, "epoch": 1090} {"train_loss": -35.801719665527344, "global_step": 131923, "epoch": 1090} {"train_loss": -35.91526412963867, "global_step": 131924, "epoch": 1090} {"train_loss": -36.882137298583984, "global_step": 131925, "epoch": 1090} {"train_loss": -35.53559494018555, "global_step": 131926, "epoch": 1090} {"train_loss": -35.311214447021484, "global_step": 131927, "epoch": 1090} {"train_loss": -35.69440841674805, "global_step": 131928, "epoch": 1090} {"train_loss": -36.506874084472656, "global_step": 131929, "epoch": 1090} {"train_loss": -36.43507766723633, "global_step": 131930, "epoch": 1090} {"train_loss": -35.72683334350586, "global_step": 131931, "epoch": 1090} {"train_loss": -36.63739776611328, "global_step": 131932, "epoch": 1090} {"train_loss": -35.40252685546875, "global_step": 131933, "epoch": 1090} {"train_loss": -35.803157806396484, "global_step": 131934, "epoch": 1090} {"train_loss": -34.83378219604492, "global_step": 131935, "epoch": 1090} {"train_loss": -37.9506721496582, "global_step": 131936, "epoch": 1090} {"train_loss": -36.3507080078125, "global_step": 131937, "epoch": 1090} {"train_loss": -36.45803451538086, "global_step": 131938, "epoch": 1090} {"train_loss": -36.163551330566406, "global_step": 131939, "epoch": 1090} {"train_loss": -36.46596908569336, "global_step": 131940, "epoch": 1090} {"train_loss": -36.7358283996582, "global_step": 131941, "epoch": 1090} {"train_loss": -36.46114730834961, "global_step": 131942, "epoch": 1090} {"train_loss": -35.97964859008789, "global_step": 131943, "epoch": 1090} {"train_loss": -37.38690948486328, "global_step": 131944, "epoch": 1090} {"train_loss": -37.13884353637695, "global_step": 131945, "epoch": 1090} {"train_loss": -37.03972244262695, "global_step": 131946, "epoch": 1090} {"train_loss": -37.213130950927734, "global_step": 131947, "epoch": 1090} {"train_loss": -37.11442184448242, "global_step": 131948, "epoch": 1090} {"train_loss": -36.70370101928711, "global_step": 131949, "epoch": 1090} {"train_loss": -37.91669845581055, "global_step": 131950, "epoch": 1090} {"train_loss": -36.85352325439453, "global_step": 131951, "epoch": 1090} {"train_loss": -37.564002990722656, "global_step": 131952, "epoch": 1090} {"train_loss": -37.459835052490234, "global_step": 131953, "epoch": 1090} {"train_loss": -38.4715690612793, "global_step": 131954, "epoch": 1090} {"train_loss": -38.23775100708008, "global_step": 131955, "epoch": 1090} {"train_loss": -37.966426849365234, "global_step": 131956, "epoch": 1090} {"train_loss": -37.66299057006836, "global_step": 131957, "epoch": 1090} {"train_loss": -36.92428207397461, "global_step": 131958, "epoch": 1090} {"train_loss": -37.15009307861328, "global_step": 131959, "epoch": 1090} {"train_loss": -37.952388763427734, "global_step": 131960, "epoch": 1090} {"train_loss": -37.915672302246094, "global_step": 131961, "epoch": 1090} {"train_loss": -37.56855773925781, "global_step": 131962, "epoch": 1090} {"train_loss": -36.74688720703125, "global_step": 131963, "epoch": 1090} {"train_loss": -37.897769927978516, "global_step": 131964, "epoch": 1090} {"train_loss": -38.071075439453125, "global_step": 131965, "epoch": 1090} {"train_loss": -37.907081604003906, "global_step": 131966, "epoch": 1090} {"train_loss": -37.692047119140625, "global_step": 131967, "epoch": 1090} {"train_loss": -37.5296630859375, "global_step": 131968, "epoch": 1090} {"train_loss": -37.52286911010742, "global_step": 131969, "epoch": 1090} {"train_loss": -38.839595794677734, "global_step": 131970, "epoch": 1090} {"train_loss": -38.279300689697266, "global_step": 131971, "epoch": 1090} {"train_loss": -38.38723373413086, "global_step": 131972, "epoch": 1090} {"train_loss": -38.9637451171875, "global_step": 131973, "epoch": 1090} {"train_loss": -38.8476676940918, "global_step": 131974, "epoch": 1090} {"train_loss": -37.81126022338867, "global_step": 131975, "epoch": 1090} {"train_loss": -37.373538970947266, "global_step": 131976, "epoch": 1090} {"train_loss": -37.8682861328125, "global_step": 131977, "epoch": 1090} {"train_loss": -38.65089797973633, "global_step": 131978, "epoch": 1090} {"train_loss": -38.02853012084961, "global_step": 131979, "epoch": 1090} {"train_loss": -37.30295944213867, "global_step": 131980, "epoch": 1090} {"train_loss": -38.412322998046875, "global_step": 131981, "epoch": 1090} {"train_loss": -37.80790328979492, "global_step": 131982, "epoch": 1090} {"train_loss": -39.62001419067383, "global_step": 131983, "epoch": 1090} {"train_loss": -38.5358772277832, "global_step": 131984, "epoch": 1090} {"train_loss": -38.0725212097168, "global_step": 131985, "epoch": 1090} {"train_loss": -38.52777099609375, "global_step": 131986, "epoch": 1090} {"train_loss": -37.81325149536133, "global_step": 131987, "epoch": 1090} {"train_loss": -39.10606002807617, "global_step": 131988, "epoch": 1090} {"train_loss": -38.908180236816406, "global_step": 131989, "epoch": 1090} {"train_loss": -37.22185134887695, "global_step": 131990, "epoch": 1090} {"train_loss": -39.84132385253906, "global_step": 131991, "epoch": 1090} {"train_loss": -38.53555679321289, "global_step": 131992, "epoch": 1090} {"train_loss": -38.57551193237305, "global_step": 131993, "epoch": 1090} {"train_loss": -37.964683532714844, "global_step": 131994, "epoch": 1090} {"train_loss": -39.60476303100586, "global_step": 131995, "epoch": 1090} {"train_loss": -39.1812858581543, "global_step": 131996, "epoch": 1090} {"train_loss": -38.98082733154297, "global_step": 131997, "epoch": 1090} {"train_loss": -39.12801742553711, "global_step": 131998, "epoch": 1090} {"train_loss": -37.821876525878906, "global_step": 131999, "epoch": 1090} {"train_loss": -38.350521087646484, "global_step": 132000, "epoch": 1090} {"train_loss": -39.43501663208008, "global_step": 132001, "epoch": 1090} {"train_loss": -39.13359451293945, "global_step": 132002, "epoch": 1090} {"train_loss": -37.44774627685547, "global_step": 132003, "epoch": 1090} {"train_loss": -37.94400405883789, "global_step": 132004, "epoch": 1090} {"train_loss": -38.413387298583984, "global_step": 132005, "epoch": 1090} {"train_loss": -38.11849594116211, "global_step": 132006, "epoch": 1090} {"train_loss": -38.41944122314453, "global_step": 132007, "epoch": 1090} {"train_loss": -39.993961334228516, "global_step": 132008, "epoch": 1090} {"train_loss": -38.073360443115234, "global_step": 132009, "epoch": 1090} {"train_loss": -36.09570666384106, "global_step": 132010, "epoch": 1090, "val_loss": 2599206.25} {"train_loss": -38.440250396728516, "global_step": 132011, "epoch": 1091} {"train_loss": -39.44430160522461, "global_step": 132012, "epoch": 1091} {"train_loss": -38.6832389831543, "global_step": 132013, "epoch": 1091} {"train_loss": -39.07829666137695, "global_step": 132014, "epoch": 1091} {"train_loss": -39.02726364135742, "global_step": 132015, "epoch": 1091} {"train_loss": -39.3687858581543, "global_step": 132016, "epoch": 1091} {"train_loss": -38.55481719970703, "global_step": 132017, "epoch": 1091} {"train_loss": -39.8671989440918, "global_step": 132018, "epoch": 1091} {"train_loss": -38.29267120361328, "global_step": 132019, "epoch": 1091} {"train_loss": -39.57403564453125, "global_step": 132020, "epoch": 1091} {"train_loss": -39.54965591430664, "global_step": 132021, "epoch": 1091} {"train_loss": -39.00332260131836, "global_step": 132022, "epoch": 1091} {"train_loss": -39.6480827331543, "global_step": 132023, "epoch": 1091} {"train_loss": -39.33525848388672, "global_step": 132024, "epoch": 1091} {"train_loss": -38.883087158203125, "global_step": 132025, "epoch": 1091} {"train_loss": -39.094871520996094, "global_step": 132026, "epoch": 1091} {"train_loss": -39.80835723876953, "global_step": 132027, "epoch": 1091} {"train_loss": -38.893463134765625, "global_step": 132028, "epoch": 1091} {"train_loss": -39.69561767578125, "global_step": 132029, "epoch": 1091} {"train_loss": -39.264251708984375, "global_step": 132030, "epoch": 1091} {"train_loss": -38.93647384643555, "global_step": 132031, "epoch": 1091} {"train_loss": -38.49650573730469, "global_step": 132032, "epoch": 1091} {"train_loss": -39.57041549682617, "global_step": 132033, "epoch": 1091} {"train_loss": -38.1367301940918, "global_step": 132034, "epoch": 1091} {"train_loss": -38.79813766479492, "global_step": 132035, "epoch": 1091} {"train_loss": -39.633445739746094, "global_step": 132036, "epoch": 1091} {"train_loss": -38.6798210144043, "global_step": 132037, "epoch": 1091} {"train_loss": -38.54570770263672, "global_step": 132038, "epoch": 1091} {"train_loss": -37.57318115234375, "global_step": 132039, "epoch": 1091} {"train_loss": -38.983821868896484, "global_step": 132040, "epoch": 1091} {"train_loss": -37.03043746948242, "global_step": 132041, "epoch": 1091} {"train_loss": -39.061370849609375, "global_step": 132042, "epoch": 1091} {"train_loss": -37.81498336791992, "global_step": 132043, "epoch": 1091} {"train_loss": -38.1719970703125, "global_step": 132044, "epoch": 1091} {"train_loss": -39.423797607421875, "global_step": 132045, "epoch": 1091} {"train_loss": -39.22976303100586, "global_step": 132046, "epoch": 1091} {"train_loss": -38.57835006713867, "global_step": 132047, "epoch": 1091} {"train_loss": -39.24813461303711, "global_step": 132048, "epoch": 1091} {"train_loss": -38.763221740722656, "global_step": 132049, "epoch": 1091} {"train_loss": -39.323760986328125, "global_step": 132050, "epoch": 1091} {"train_loss": -39.645442962646484, "global_step": 132051, "epoch": 1091} {"train_loss": -38.72883605957031, "global_step": 132052, "epoch": 1091} {"train_loss": -39.22136306762695, "global_step": 132053, "epoch": 1091} {"train_loss": -39.684383392333984, "global_step": 132054, "epoch": 1091} {"train_loss": -39.4636116027832, "global_step": 132055, "epoch": 1091} {"train_loss": -38.62043380737305, "global_step": 132056, "epoch": 1091} {"train_loss": -38.72318649291992, "global_step": 132057, "epoch": 1091} {"train_loss": -39.020503997802734, "global_step": 132058, "epoch": 1091} {"train_loss": -38.56565475463867, "global_step": 132059, "epoch": 1091} {"train_loss": -37.97146987915039, "global_step": 132060, "epoch": 1091} {"train_loss": -37.480628967285156, "global_step": 132061, "epoch": 1091} {"train_loss": -30.659561157226562, "global_step": 132062, "epoch": 1091} {"train_loss": -19.15877342224121, "global_step": 132063, "epoch": 1091} {"train_loss": -16.934843063354492, "global_step": 132064, "epoch": 1091} {"train_loss": -36.612545013427734, "global_step": 132065, "epoch": 1091} {"train_loss": -29.941085815429688, "global_step": 132066, "epoch": 1091} {"train_loss": -17.763887405395508, "global_step": 132067, "epoch": 1091} {"train_loss": -37.48200607299805, "global_step": 132068, "epoch": 1091} {"train_loss": -29.733251571655273, "global_step": 132069, "epoch": 1091} {"train_loss": -36.81599044799805, "global_step": 132070, "epoch": 1091} {"train_loss": -33.07876968383789, "global_step": 132071, "epoch": 1091} {"train_loss": -37.487972259521484, "global_step": 132072, "epoch": 1091} {"train_loss": -32.84194564819336, "global_step": 132073, "epoch": 1091} {"train_loss": -37.951419830322266, "global_step": 132074, "epoch": 1091} {"train_loss": -35.20059585571289, "global_step": 132075, "epoch": 1091} {"train_loss": -37.5748405456543, "global_step": 132076, "epoch": 1091} {"train_loss": -36.319034576416016, "global_step": 132077, "epoch": 1091} {"train_loss": -37.776611328125, "global_step": 132078, "epoch": 1091} {"train_loss": -38.69930648803711, "global_step": 132079, "epoch": 1091} {"train_loss": -36.73545455932617, "global_step": 132080, "epoch": 1091} {"train_loss": -37.17618942260742, "global_step": 132081, "epoch": 1091} {"train_loss": -38.4896354675293, "global_step": 132082, "epoch": 1091} {"train_loss": -37.48617172241211, "global_step": 132083, "epoch": 1091} {"train_loss": -38.60957717895508, "global_step": 132084, "epoch": 1091} {"train_loss": -36.810062408447266, "global_step": 132085, "epoch": 1091} {"train_loss": -37.544376373291016, "global_step": 132086, "epoch": 1091} {"train_loss": -39.0416374206543, "global_step": 132087, "epoch": 1091} {"train_loss": -37.04475784301758, "global_step": 132088, "epoch": 1091} {"train_loss": -37.50442123413086, "global_step": 132089, "epoch": 1091} {"train_loss": -38.5916862487793, "global_step": 132090, "epoch": 1091} {"train_loss": -38.1691780090332, "global_step": 132091, "epoch": 1091} {"train_loss": -38.748043060302734, "global_step": 132092, "epoch": 1091} {"train_loss": -39.19130325317383, "global_step": 132093, "epoch": 1091} {"train_loss": -38.74357986450195, "global_step": 132094, "epoch": 1091} {"train_loss": -38.50348663330078, "global_step": 132095, "epoch": 1091} {"train_loss": -38.177955627441406, "global_step": 132096, "epoch": 1091} {"train_loss": -38.5012092590332, "global_step": 132097, "epoch": 1091} {"train_loss": -38.61219024658203, "global_step": 132098, "epoch": 1091} {"train_loss": -38.48618698120117, "global_step": 132099, "epoch": 1091} {"train_loss": -39.5252571105957, "global_step": 132100, "epoch": 1091} {"train_loss": -38.543331146240234, "global_step": 132101, "epoch": 1091} {"train_loss": -38.08905792236328, "global_step": 132102, "epoch": 1091} {"train_loss": -39.68500900268555, "global_step": 132103, "epoch": 1091} {"train_loss": -38.764278411865234, "global_step": 132104, "epoch": 1091} {"train_loss": -39.03529739379883, "global_step": 132105, "epoch": 1091} {"train_loss": -38.529354095458984, "global_step": 132106, "epoch": 1091} {"train_loss": -38.27421188354492, "global_step": 132107, "epoch": 1091} {"train_loss": -38.53319549560547, "global_step": 132108, "epoch": 1091} {"train_loss": -38.80784225463867, "global_step": 132109, "epoch": 1091} {"train_loss": -39.111854553222656, "global_step": 132110, "epoch": 1091} {"train_loss": -39.17837142944336, "global_step": 132111, "epoch": 1091} {"train_loss": -38.98366165161133, "global_step": 132112, "epoch": 1091} {"train_loss": -39.250885009765625, "global_step": 132113, "epoch": 1091} {"train_loss": -39.304927825927734, "global_step": 132114, "epoch": 1091} {"train_loss": -39.980995178222656, "global_step": 132115, "epoch": 1091} {"train_loss": -39.07094955444336, "global_step": 132116, "epoch": 1091} {"train_loss": -39.540557861328125, "global_step": 132117, "epoch": 1091} {"train_loss": -38.99249267578125, "global_step": 132118, "epoch": 1091} {"train_loss": -39.96843338012695, "global_step": 132119, "epoch": 1091} {"train_loss": -39.1757926940918, "global_step": 132120, "epoch": 1091} {"train_loss": -39.34029006958008, "global_step": 132121, "epoch": 1091} {"train_loss": -39.90623092651367, "global_step": 132122, "epoch": 1091} {"train_loss": -39.80498123168945, "global_step": 132123, "epoch": 1091} {"train_loss": -39.93006134033203, "global_step": 132124, "epoch": 1091} {"train_loss": -38.93678283691406, "global_step": 132125, "epoch": 1091} {"train_loss": -40.505836486816406, "global_step": 132126, "epoch": 1091} {"train_loss": -40.63550567626953, "global_step": 132127, "epoch": 1091} {"train_loss": -40.23402404785156, "global_step": 132128, "epoch": 1091} {"train_loss": -40.412445068359375, "global_step": 132129, "epoch": 1091} {"train_loss": -40.17025375366211, "global_step": 132130, "epoch": 1091} {"train_loss": -37.9310032552924, "global_step": 132131, "epoch": 1091, "val_loss": 2600738.25} {"train_loss": -39.79230499267578, "global_step": 132132, "epoch": 1092} {"train_loss": -39.60335922241211, "global_step": 132133, "epoch": 1092} {"train_loss": -40.362606048583984, "global_step": 132134, "epoch": 1092} {"train_loss": -39.81720733642578, "global_step": 132135, "epoch": 1092} {"train_loss": -40.62312698364258, "global_step": 132136, "epoch": 1092} {"train_loss": -38.725826263427734, "global_step": 132137, "epoch": 1092} {"train_loss": -39.87075424194336, "global_step": 132138, "epoch": 1092} {"train_loss": -39.24256896972656, "global_step": 132139, "epoch": 1092} {"train_loss": -39.55772018432617, "global_step": 132140, "epoch": 1092} {"train_loss": -40.41482162475586, "global_step": 132141, "epoch": 1092} {"train_loss": -40.4022102355957, "global_step": 132142, "epoch": 1092} {"train_loss": -39.508827209472656, "global_step": 132143, "epoch": 1092} {"train_loss": -38.39162826538086, "global_step": 132144, "epoch": 1092} {"train_loss": -39.38082504272461, "global_step": 132145, "epoch": 1092} {"train_loss": -39.43403244018555, "global_step": 132146, "epoch": 1092} {"train_loss": -39.965606689453125, "global_step": 132147, "epoch": 1092} {"train_loss": -39.97488784790039, "global_step": 132148, "epoch": 1092} {"train_loss": -35.58742904663086, "global_step": 132149, "epoch": 1092} {"train_loss": -39.181434631347656, "global_step": 132150, "epoch": 1092} {"train_loss": -38.0749397277832, "global_step": 132151, "epoch": 1092} {"train_loss": -38.6693229675293, "global_step": 132152, "epoch": 1092} {"train_loss": -33.19068908691406, "global_step": 132153, "epoch": 1092} {"train_loss": -32.73774337768555, "global_step": 132154, "epoch": 1092} {"train_loss": -36.35354995727539, "global_step": 132155, "epoch": 1092} {"train_loss": -37.47015380859375, "global_step": 132156, "epoch": 1092} {"train_loss": -35.9266242980957, "global_step": 132157, "epoch": 1092} {"train_loss": -29.760528564453125, "global_step": 132158, "epoch": 1092} {"train_loss": -31.282812118530273, "global_step": 132159, "epoch": 1092} {"train_loss": -32.1098518371582, "global_step": 132160, "epoch": 1092} {"train_loss": -34.43408203125, "global_step": 132161, "epoch": 1092} {"train_loss": -35.541748046875, "global_step": 132162, "epoch": 1092} {"train_loss": -32.0698356628418, "global_step": 132163, "epoch": 1092} {"train_loss": -33.06360626220703, "global_step": 132164, "epoch": 1092} {"train_loss": -36.13314437866211, "global_step": 132165, "epoch": 1092} {"train_loss": -35.427242279052734, "global_step": 132166, "epoch": 1092} {"train_loss": -35.36680221557617, "global_step": 132167, "epoch": 1092} {"train_loss": -36.219173431396484, "global_step": 132168, "epoch": 1092} {"train_loss": -36.24158477783203, "global_step": 132169, "epoch": 1092} {"train_loss": -36.02832794189453, "global_step": 132170, "epoch": 1092} {"train_loss": -37.327789306640625, "global_step": 132171, "epoch": 1092} {"train_loss": -36.199466705322266, "global_step": 132172, "epoch": 1092} {"train_loss": -31.183948516845703, "global_step": 132173, "epoch": 1092} {"train_loss": -36.05735397338867, "global_step": 132174, "epoch": 1092} {"train_loss": -36.239051818847656, "global_step": 132175, "epoch": 1092} {"train_loss": -34.04999542236328, "global_step": 132176, "epoch": 1092} {"train_loss": -36.18183135986328, "global_step": 132177, "epoch": 1092} {"train_loss": -37.60950469970703, "global_step": 132178, "epoch": 1092} {"train_loss": -35.19551467895508, "global_step": 132179, "epoch": 1092} {"train_loss": -37.417930603027344, "global_step": 132180, "epoch": 1092} {"train_loss": -38.62127685546875, "global_step": 132181, "epoch": 1092} {"train_loss": -37.0344352722168, "global_step": 132182, "epoch": 1092} {"train_loss": -35.34479522705078, "global_step": 132183, "epoch": 1092} {"train_loss": -37.89813232421875, "global_step": 132184, "epoch": 1092} {"train_loss": -37.90873336791992, "global_step": 132185, "epoch": 1092} {"train_loss": -37.75785446166992, "global_step": 132186, "epoch": 1092} {"train_loss": -38.45725631713867, "global_step": 132187, "epoch": 1092} {"train_loss": -38.157257080078125, "global_step": 132188, "epoch": 1092} {"train_loss": -38.483219146728516, "global_step": 132189, "epoch": 1092} {"train_loss": -37.70724105834961, "global_step": 132190, "epoch": 1092} {"train_loss": -34.43610763549805, "global_step": 132191, "epoch": 1092} {"train_loss": -37.46185302734375, "global_step": 132192, "epoch": 1092} {"train_loss": -35.871402740478516, "global_step": 132193, "epoch": 1092} {"train_loss": -38.43003463745117, "global_step": 132194, "epoch": 1092} {"train_loss": -36.8592529296875, "global_step": 132195, "epoch": 1092} {"train_loss": -36.56869125366211, "global_step": 132196, "epoch": 1092} {"train_loss": -38.24857711791992, "global_step": 132197, "epoch": 1092} {"train_loss": -38.627357482910156, "global_step": 132198, "epoch": 1092} {"train_loss": -37.819515228271484, "global_step": 132199, "epoch": 1092} {"train_loss": -36.6427116394043, "global_step": 132200, "epoch": 1092} {"train_loss": -38.412757873535156, "global_step": 132201, "epoch": 1092} {"train_loss": -38.505367279052734, "global_step": 132202, "epoch": 1092} {"train_loss": -38.32783889770508, "global_step": 132203, "epoch": 1092} {"train_loss": -37.41188049316406, "global_step": 132204, "epoch": 1092} {"train_loss": -38.90787124633789, "global_step": 132205, "epoch": 1092} {"train_loss": -37.2744140625, "global_step": 132206, "epoch": 1092} {"train_loss": -37.02395248413086, "global_step": 132207, "epoch": 1092} {"train_loss": -38.173824310302734, "global_step": 132208, "epoch": 1092} {"train_loss": -39.0395393371582, "global_step": 132209, "epoch": 1092} {"train_loss": -38.753517150878906, "global_step": 132210, "epoch": 1092} {"train_loss": -39.462623596191406, "global_step": 132211, "epoch": 1092} {"train_loss": -38.58591842651367, "global_step": 132212, "epoch": 1092} {"train_loss": -39.28976058959961, "global_step": 132213, "epoch": 1092} {"train_loss": -37.64985275268555, "global_step": 132214, "epoch": 1092} {"train_loss": -39.775238037109375, "global_step": 132215, "epoch": 1092} {"train_loss": -39.101436614990234, "global_step": 132216, "epoch": 1092} {"train_loss": -39.57477569580078, "global_step": 132217, "epoch": 1092} {"train_loss": -38.73369598388672, "global_step": 132218, "epoch": 1092} {"train_loss": -38.54228591918945, "global_step": 132219, "epoch": 1092} {"train_loss": -39.15609359741211, "global_step": 132220, "epoch": 1092} {"train_loss": -39.980743408203125, "global_step": 132221, "epoch": 1092} {"train_loss": -39.712806701660156, "global_step": 132222, "epoch": 1092} {"train_loss": -39.52347183227539, "global_step": 132223, "epoch": 1092} {"train_loss": -39.40153121948242, "global_step": 132224, "epoch": 1092} {"train_loss": -38.71599578857422, "global_step": 132225, "epoch": 1092} {"train_loss": -38.88551712036133, "global_step": 132226, "epoch": 1092} {"train_loss": -39.2147216796875, "global_step": 132227, "epoch": 1092} {"train_loss": -39.64411163330078, "global_step": 132228, "epoch": 1092} {"train_loss": -39.14225387573242, "global_step": 132229, "epoch": 1092} {"train_loss": -39.524566650390625, "global_step": 132230, "epoch": 1092} {"train_loss": -39.054622650146484, "global_step": 132231, "epoch": 1092} {"train_loss": -39.47686004638672, "global_step": 132232, "epoch": 1092} {"train_loss": -38.871639251708984, "global_step": 132233, "epoch": 1092} {"train_loss": -39.69547653198242, "global_step": 132234, "epoch": 1092} {"train_loss": -38.93534469604492, "global_step": 132235, "epoch": 1092} {"train_loss": -39.96036148071289, "global_step": 132236, "epoch": 1092} {"train_loss": -40.03548049926758, "global_step": 132237, "epoch": 1092} {"train_loss": -39.54175567626953, "global_step": 132238, "epoch": 1092} {"train_loss": -39.49176788330078, "global_step": 132239, "epoch": 1092} {"train_loss": -39.680965423583984, "global_step": 132240, "epoch": 1092} {"train_loss": -40.04804611206055, "global_step": 132241, "epoch": 1092} {"train_loss": -40.20893096923828, "global_step": 132242, "epoch": 1092} {"train_loss": -40.135337829589844, "global_step": 132243, "epoch": 1092} {"train_loss": -39.75682830810547, "global_step": 132244, "epoch": 1092} {"train_loss": -40.3052978515625, "global_step": 132245, "epoch": 1092} {"train_loss": -39.68535232543945, "global_step": 132246, "epoch": 1092} {"train_loss": -40.24292755126953, "global_step": 132247, "epoch": 1092} {"train_loss": -39.85799789428711, "global_step": 132248, "epoch": 1092} {"train_loss": -39.49351119995117, "global_step": 132249, "epoch": 1092} {"train_loss": -39.94576644897461, "global_step": 132250, "epoch": 1092} {"train_loss": -40.22008514404297, "global_step": 132251, "epoch": 1092} {"train_loss": -37.94896422141839, "global_step": 132252, "epoch": 1092, "val_loss": 2612677.0} {"train_loss": -39.85596466064453, "global_step": 132253, "epoch": 1093} {"train_loss": -40.28084182739258, "global_step": 132254, "epoch": 1093} {"train_loss": -40.64413070678711, "global_step": 132255, "epoch": 1093} {"train_loss": -40.280826568603516, "global_step": 132256, "epoch": 1093} {"train_loss": -40.09957504272461, "global_step": 132257, "epoch": 1093} {"train_loss": -40.18104934692383, "global_step": 132258, "epoch": 1093} {"train_loss": -40.63010787963867, "global_step": 132259, "epoch": 1093} {"train_loss": -40.94511795043945, "global_step": 132260, "epoch": 1093} {"train_loss": -40.57686996459961, "global_step": 132261, "epoch": 1093} {"train_loss": -40.62127685546875, "global_step": 132262, "epoch": 1093} {"train_loss": -39.793174743652344, "global_step": 132263, "epoch": 1093} {"train_loss": -39.795867919921875, "global_step": 132264, "epoch": 1093} {"train_loss": -40.65058135986328, "global_step": 132265, "epoch": 1093} {"train_loss": -40.69027328491211, "global_step": 132266, "epoch": 1093} {"train_loss": -40.995765686035156, "global_step": 132267, "epoch": 1093} {"train_loss": -40.33073043823242, "global_step": 132268, "epoch": 1093} {"train_loss": -39.934814453125, "global_step": 132269, "epoch": 1093} {"train_loss": -40.020660400390625, "global_step": 132270, "epoch": 1093} {"train_loss": -39.350624084472656, "global_step": 132271, "epoch": 1093} {"train_loss": -39.578548431396484, "global_step": 132272, "epoch": 1093} {"train_loss": -40.43937301635742, "global_step": 132273, "epoch": 1093} {"train_loss": -39.896087646484375, "global_step": 132274, "epoch": 1093} {"train_loss": -40.39887619018555, "global_step": 132275, "epoch": 1093} {"train_loss": -40.81956100463867, "global_step": 132276, "epoch": 1093} {"train_loss": -40.80172348022461, "global_step": 132277, "epoch": 1093} {"train_loss": -40.42380142211914, "global_step": 132278, "epoch": 1093} {"train_loss": -40.038177490234375, "global_step": 132279, "epoch": 1093} {"train_loss": -39.84212875366211, "global_step": 132280, "epoch": 1093} {"train_loss": -39.174373626708984, "global_step": 132281, "epoch": 1093} {"train_loss": -39.425933837890625, "global_step": 132282, "epoch": 1093} {"train_loss": -40.6041145324707, "global_step": 132283, "epoch": 1093} {"train_loss": -40.65485763549805, "global_step": 132284, "epoch": 1093} {"train_loss": -40.25928497314453, "global_step": 132285, "epoch": 1093} {"train_loss": -39.91473388671875, "global_step": 132286, "epoch": 1093} {"train_loss": -38.27639389038086, "global_step": 132287, "epoch": 1093} {"train_loss": -37.3034782409668, "global_step": 132288, "epoch": 1093} {"train_loss": -38.94205856323242, "global_step": 132289, "epoch": 1093} {"train_loss": -39.17289352416992, "global_step": 132290, "epoch": 1093} {"train_loss": -37.984554290771484, "global_step": 132291, "epoch": 1093} {"train_loss": -39.193077087402344, "global_step": 132292, "epoch": 1093} {"train_loss": -39.583866119384766, "global_step": 132293, "epoch": 1093} {"train_loss": -39.15663528442383, "global_step": 132294, "epoch": 1093} {"train_loss": -35.96124267578125, "global_step": 132295, "epoch": 1093} {"train_loss": -37.08758544921875, "global_step": 132296, "epoch": 1093} {"train_loss": -39.372005462646484, "global_step": 132297, "epoch": 1093} {"train_loss": -35.085079193115234, "global_step": 132298, "epoch": 1093} {"train_loss": -39.78070068359375, "global_step": 132299, "epoch": 1093} {"train_loss": -33.013126373291016, "global_step": 132300, "epoch": 1093} {"train_loss": -36.904048919677734, "global_step": 132301, "epoch": 1093} {"train_loss": -38.99846649169922, "global_step": 132302, "epoch": 1093} {"train_loss": -37.07634353637695, "global_step": 132303, "epoch": 1093} {"train_loss": -36.7752685546875, "global_step": 132304, "epoch": 1093} {"train_loss": -37.69916915893555, "global_step": 132305, "epoch": 1093} {"train_loss": -32.57149124145508, "global_step": 132306, "epoch": 1093} {"train_loss": -36.34980392456055, "global_step": 132307, "epoch": 1093} {"train_loss": -37.34392547607422, "global_step": 132308, "epoch": 1093} {"train_loss": -34.084312438964844, "global_step": 132309, "epoch": 1093} {"train_loss": -36.03669357299805, "global_step": 132310, "epoch": 1093} {"train_loss": -34.323543548583984, "global_step": 132311, "epoch": 1093} {"train_loss": -37.91738510131836, "global_step": 132312, "epoch": 1093} {"train_loss": -35.25515365600586, "global_step": 132313, "epoch": 1093} {"train_loss": -33.87423324584961, "global_step": 132314, "epoch": 1093} {"train_loss": -37.36391067504883, "global_step": 132315, "epoch": 1093} {"train_loss": -37.9686279296875, "global_step": 132316, "epoch": 1093} {"train_loss": -36.889163970947266, "global_step": 132317, "epoch": 1093} {"train_loss": -37.517635345458984, "global_step": 132318, "epoch": 1093} {"train_loss": -37.96376419067383, "global_step": 132319, "epoch": 1093} {"train_loss": -37.76791763305664, "global_step": 132320, "epoch": 1093} {"train_loss": -38.44966506958008, "global_step": 132321, "epoch": 1093} {"train_loss": -37.98130416870117, "global_step": 132322, "epoch": 1093} {"train_loss": -38.24459457397461, "global_step": 132323, "epoch": 1093} {"train_loss": -37.20589828491211, "global_step": 132324, "epoch": 1093} {"train_loss": -37.75423049926758, "global_step": 132325, "epoch": 1093} {"train_loss": -37.60274887084961, "global_step": 132326, "epoch": 1093} {"train_loss": -38.580684661865234, "global_step": 132327, "epoch": 1093} {"train_loss": -37.38593292236328, "global_step": 132328, "epoch": 1093} {"train_loss": -38.18796157836914, "global_step": 132329, "epoch": 1093} {"train_loss": -37.92450714111328, "global_step": 132330, "epoch": 1093} {"train_loss": -39.30438995361328, "global_step": 132331, "epoch": 1093} {"train_loss": -37.50816345214844, "global_step": 132332, "epoch": 1093} {"train_loss": -38.52429962158203, "global_step": 132333, "epoch": 1093} {"train_loss": -38.86454391479492, "global_step": 132334, "epoch": 1093} {"train_loss": -38.23781967163086, "global_step": 132335, "epoch": 1093} {"train_loss": -38.3038444519043, "global_step": 132336, "epoch": 1093} {"train_loss": -38.998374938964844, "global_step": 132337, "epoch": 1093} {"train_loss": -39.01566696166992, "global_step": 132338, "epoch": 1093} {"train_loss": -39.32449722290039, "global_step": 132339, "epoch": 1093} {"train_loss": -38.25712966918945, "global_step": 132340, "epoch": 1093} {"train_loss": -38.94813919067383, "global_step": 132341, "epoch": 1093} {"train_loss": -39.24903869628906, "global_step": 132342, "epoch": 1093} {"train_loss": -39.2622184753418, "global_step": 132343, "epoch": 1093} {"train_loss": -38.606422424316406, "global_step": 132344, "epoch": 1093} {"train_loss": -39.09621810913086, "global_step": 132345, "epoch": 1093} {"train_loss": -39.230712890625, "global_step": 132346, "epoch": 1093} {"train_loss": -39.43366241455078, "global_step": 132347, "epoch": 1093} {"train_loss": -39.3245849609375, "global_step": 132348, "epoch": 1093} {"train_loss": -39.58955001831055, "global_step": 132349, "epoch": 1093} {"train_loss": -39.6340446472168, "global_step": 132350, "epoch": 1093} {"train_loss": -39.47159957885742, "global_step": 132351, "epoch": 1093} {"train_loss": -39.96543502807617, "global_step": 132352, "epoch": 1093} {"train_loss": -39.04215621948242, "global_step": 132353, "epoch": 1093} {"train_loss": -39.46622848510742, "global_step": 132354, "epoch": 1093} {"train_loss": -39.889461517333984, "global_step": 132355, "epoch": 1093} {"train_loss": -40.076515197753906, "global_step": 132356, "epoch": 1093} {"train_loss": -39.50343322753906, "global_step": 132357, "epoch": 1093} {"train_loss": -39.87644577026367, "global_step": 132358, "epoch": 1093} {"train_loss": -39.749263763427734, "global_step": 132359, "epoch": 1093} {"train_loss": -39.52827453613281, "global_step": 132360, "epoch": 1093} {"train_loss": -39.24603271484375, "global_step": 132361, "epoch": 1093} {"train_loss": -39.43185043334961, "global_step": 132362, "epoch": 1093} {"train_loss": -40.23957824707031, "global_step": 132363, "epoch": 1093} {"train_loss": -40.07598114013672, "global_step": 132364, "epoch": 1093} {"train_loss": -38.98576354980469, "global_step": 132365, "epoch": 1093} {"train_loss": -39.25436019897461, "global_step": 132366, "epoch": 1093} {"train_loss": -39.605403900146484, "global_step": 132367, "epoch": 1093} {"train_loss": -40.344966888427734, "global_step": 132368, "epoch": 1093} {"train_loss": -40.280731201171875, "global_step": 132369, "epoch": 1093} {"train_loss": -39.093441009521484, "global_step": 132370, "epoch": 1093} {"train_loss": -40.447635650634766, "global_step": 132371, "epoch": 1093} {"train_loss": -39.697052001953125, "global_step": 132372, "epoch": 1093} {"train_loss": -38.828951370617574, "global_step": 132373, "epoch": 1093, "val_loss": 2632614.0} {"train_loss": -40.173221588134766, "global_step": 132374, "epoch": 1094} {"train_loss": -40.470848083496094, "global_step": 132375, "epoch": 1094} {"train_loss": -39.71862030029297, "global_step": 132376, "epoch": 1094} {"train_loss": -40.18555450439453, "global_step": 132377, "epoch": 1094} {"train_loss": -40.48057174682617, "global_step": 132378, "epoch": 1094} {"train_loss": -40.204158782958984, "global_step": 132379, "epoch": 1094} {"train_loss": -38.89884567260742, "global_step": 132380, "epoch": 1094} {"train_loss": -40.32261657714844, "global_step": 132381, "epoch": 1094} {"train_loss": -40.23082733154297, "global_step": 132382, "epoch": 1094} {"train_loss": -39.154510498046875, "global_step": 132383, "epoch": 1094} {"train_loss": -39.62795639038086, "global_step": 132384, "epoch": 1094} {"train_loss": -40.76064682006836, "global_step": 132385, "epoch": 1094} {"train_loss": -40.28931427001953, "global_step": 132386, "epoch": 1094} {"train_loss": -39.536468505859375, "global_step": 132387, "epoch": 1094} {"train_loss": -40.070213317871094, "global_step": 132388, "epoch": 1094} {"train_loss": -40.00861358642578, "global_step": 132389, "epoch": 1094} {"train_loss": -40.05315017700195, "global_step": 132390, "epoch": 1094} {"train_loss": -40.04753112792969, "global_step": 132391, "epoch": 1094} {"train_loss": -40.057491302490234, "global_step": 132392, "epoch": 1094} {"train_loss": -39.94879150390625, "global_step": 132393, "epoch": 1094} {"train_loss": -40.42646408081055, "global_step": 132394, "epoch": 1094} {"train_loss": -39.79220199584961, "global_step": 132395, "epoch": 1094} {"train_loss": -40.05995559692383, "global_step": 132396, "epoch": 1094} {"train_loss": -40.51760482788086, "global_step": 132397, "epoch": 1094} {"train_loss": -40.03709030151367, "global_step": 132398, "epoch": 1094} {"train_loss": -40.61094284057617, "global_step": 132399, "epoch": 1094} {"train_loss": -40.61709213256836, "global_step": 132400, "epoch": 1094} {"train_loss": -40.37921142578125, "global_step": 132401, "epoch": 1094} {"train_loss": -40.070003509521484, "global_step": 132402, "epoch": 1094} {"train_loss": -40.2425651550293, "global_step": 132403, "epoch": 1094} {"train_loss": -40.64009475708008, "global_step": 132404, "epoch": 1094} {"train_loss": -39.81101608276367, "global_step": 132405, "epoch": 1094} {"train_loss": -40.7303352355957, "global_step": 132406, "epoch": 1094} {"train_loss": -40.61543273925781, "global_step": 132407, "epoch": 1094} {"train_loss": -40.708900451660156, "global_step": 132408, "epoch": 1094} {"train_loss": -41.020870208740234, "global_step": 132409, "epoch": 1094} {"train_loss": -41.08225631713867, "global_step": 132410, "epoch": 1094} {"train_loss": -40.96855926513672, "global_step": 132411, "epoch": 1094} {"train_loss": -40.27871322631836, "global_step": 132412, "epoch": 1094} {"train_loss": -41.20272445678711, "global_step": 132413, "epoch": 1094} {"train_loss": -40.80479431152344, "global_step": 132414, "epoch": 1094} {"train_loss": -40.49099349975586, "global_step": 132415, "epoch": 1094} {"train_loss": -41.0964469909668, "global_step": 132416, "epoch": 1094} {"train_loss": -40.80958938598633, "global_step": 132417, "epoch": 1094} {"train_loss": -40.16474533081055, "global_step": 132418, "epoch": 1094} {"train_loss": -40.10868453979492, "global_step": 132419, "epoch": 1094} {"train_loss": -40.83064270019531, "global_step": 132420, "epoch": 1094} {"train_loss": -40.57051086425781, "global_step": 132421, "epoch": 1094} {"train_loss": -39.80645751953125, "global_step": 132422, "epoch": 1094} {"train_loss": -39.881256103515625, "global_step": 132423, "epoch": 1094} {"train_loss": -40.0426025390625, "global_step": 132424, "epoch": 1094} {"train_loss": -40.831424713134766, "global_step": 132425, "epoch": 1094} {"train_loss": -39.70957565307617, "global_step": 132426, "epoch": 1094} {"train_loss": -39.527320861816406, "global_step": 132427, "epoch": 1094} {"train_loss": -40.328857421875, "global_step": 132428, "epoch": 1094} {"train_loss": -37.19658660888672, "global_step": 132429, "epoch": 1094} {"train_loss": -36.29179000854492, "global_step": 132430, "epoch": 1094} {"train_loss": -36.51484680175781, "global_step": 132431, "epoch": 1094} {"train_loss": -38.89417266845703, "global_step": 132432, "epoch": 1094} {"train_loss": -32.12649154663086, "global_step": 132433, "epoch": 1094} {"train_loss": -22.584354400634766, "global_step": 132434, "epoch": 1094} {"train_loss": 14.856122016906738, "global_step": 132435, "epoch": 1094} {"train_loss": 70.41227722167969, "global_step": 132436, "epoch": 1094} {"train_loss": -19.3167781829834, "global_step": 132437, "epoch": 1094} {"train_loss": 8.704001426696777, "global_step": 132438, "epoch": 1094} {"train_loss": -25.332366943359375, "global_step": 132439, "epoch": 1094} {"train_loss": -0.8443830609321594, "global_step": 132440, "epoch": 1094} {"train_loss": -27.866138458251953, "global_step": 132441, "epoch": 1094} {"train_loss": -15.209006309509277, "global_step": 132442, "epoch": 1094} {"train_loss": -25.4541015625, "global_step": 132443, "epoch": 1094} {"train_loss": -27.979736328125, "global_step": 132444, "epoch": 1094} {"train_loss": -25.81707191467285, "global_step": 132445, "epoch": 1094} {"train_loss": -29.03143882751465, "global_step": 132446, "epoch": 1094} {"train_loss": -32.39899444580078, "global_step": 132447, "epoch": 1094} {"train_loss": -32.15840530395508, "global_step": 132448, "epoch": 1094} {"train_loss": -31.238895416259766, "global_step": 132449, "epoch": 1094} {"train_loss": -30.461984634399414, "global_step": 132450, "epoch": 1094} {"train_loss": -33.406646728515625, "global_step": 132451, "epoch": 1094} {"train_loss": -33.21735763549805, "global_step": 132452, "epoch": 1094} {"train_loss": -33.83191680908203, "global_step": 132453, "epoch": 1094} {"train_loss": -33.01667785644531, "global_step": 132454, "epoch": 1094} {"train_loss": -33.73336410522461, "global_step": 132455, "epoch": 1094} {"train_loss": -35.451637268066406, "global_step": 132456, "epoch": 1094} {"train_loss": -35.85432815551758, "global_step": 132457, "epoch": 1094} {"train_loss": -34.48724365234375, "global_step": 132458, "epoch": 1094} {"train_loss": -34.59203338623047, "global_step": 132459, "epoch": 1094} {"train_loss": -35.42250442504883, "global_step": 132460, "epoch": 1094} {"train_loss": -36.35185623168945, "global_step": 132461, "epoch": 1094} {"train_loss": -36.02839660644531, "global_step": 132462, "epoch": 1094} {"train_loss": -34.929622650146484, "global_step": 132463, "epoch": 1094} {"train_loss": -33.980045318603516, "global_step": 132464, "epoch": 1094} {"train_loss": -35.89835739135742, "global_step": 132465, "epoch": 1094} {"train_loss": -35.46844482421875, "global_step": 132466, "epoch": 1094} {"train_loss": -36.130401611328125, "global_step": 132467, "epoch": 1094} {"train_loss": -36.07148361206055, "global_step": 132468, "epoch": 1094} {"train_loss": -36.405609130859375, "global_step": 132469, "epoch": 1094} {"train_loss": -36.43178176879883, "global_step": 132470, "epoch": 1094} {"train_loss": -36.56293869018555, "global_step": 132471, "epoch": 1094} {"train_loss": -36.30648422241211, "global_step": 132472, "epoch": 1094} {"train_loss": -36.858299255371094, "global_step": 132473, "epoch": 1094} {"train_loss": -35.87917709350586, "global_step": 132474, "epoch": 1094} {"train_loss": -36.95025634765625, "global_step": 132475, "epoch": 1094} {"train_loss": -36.48922348022461, "global_step": 132476, "epoch": 1094} {"train_loss": -36.60063171386719, "global_step": 132477, "epoch": 1094} {"train_loss": -37.01505661010742, "global_step": 132478, "epoch": 1094} {"train_loss": -37.279598236083984, "global_step": 132479, "epoch": 1094} {"train_loss": -37.154197692871094, "global_step": 132480, "epoch": 1094} {"train_loss": -36.56305694580078, "global_step": 132481, "epoch": 1094} {"train_loss": -36.37327194213867, "global_step": 132482, "epoch": 1094} {"train_loss": -36.86392593383789, "global_step": 132483, "epoch": 1094} {"train_loss": -37.253814697265625, "global_step": 132484, "epoch": 1094} {"train_loss": -37.05403518676758, "global_step": 132485, "epoch": 1094} {"train_loss": -37.36079406738281, "global_step": 132486, "epoch": 1094} {"train_loss": -37.04502487182617, "global_step": 132487, "epoch": 1094} {"train_loss": -37.18265914916992, "global_step": 132488, "epoch": 1094} {"train_loss": -37.493221282958984, "global_step": 132489, "epoch": 1094} {"train_loss": -37.3072395324707, "global_step": 132490, "epoch": 1094} {"train_loss": -37.64738082885742, "global_step": 132491, "epoch": 1094} {"train_loss": -37.739723205566406, "global_step": 132492, "epoch": 1094} {"train_loss": -37.3572998046875, "global_step": 132493, "epoch": 1094} {"train_loss": -35.01449123739211, "global_step": 132494, "epoch": 1094, "val_loss": 2647772.25} {"train_loss": -37.87253952026367, "global_step": 132495, "epoch": 1095} {"train_loss": -38.01100540161133, "global_step": 132496, "epoch": 1095} {"train_loss": -38.00899887084961, "global_step": 132497, "epoch": 1095} {"train_loss": -37.78078842163086, "global_step": 132498, "epoch": 1095} {"train_loss": -37.57790756225586, "global_step": 132499, "epoch": 1095} {"train_loss": -38.145721435546875, "global_step": 132500, "epoch": 1095} {"train_loss": -38.30845260620117, "global_step": 132501, "epoch": 1095} {"train_loss": -38.08799362182617, "global_step": 132502, "epoch": 1095} {"train_loss": -38.25922393798828, "global_step": 132503, "epoch": 1095} {"train_loss": -38.12514877319336, "global_step": 132504, "epoch": 1095} {"train_loss": -38.084716796875, "global_step": 132505, "epoch": 1095} {"train_loss": -37.73869323730469, "global_step": 132506, "epoch": 1095} {"train_loss": -38.533565521240234, "global_step": 132507, "epoch": 1095} {"train_loss": -38.2522087097168, "global_step": 132508, "epoch": 1095} {"train_loss": -38.52754592895508, "global_step": 132509, "epoch": 1095} {"train_loss": -38.36616897583008, "global_step": 132510, "epoch": 1095} {"train_loss": -38.388118743896484, "global_step": 132511, "epoch": 1095} {"train_loss": -38.314308166503906, "global_step": 132512, "epoch": 1095} {"train_loss": -38.1712532043457, "global_step": 132513, "epoch": 1095} {"train_loss": -38.22272872924805, "global_step": 132514, "epoch": 1095} {"train_loss": -39.009159088134766, "global_step": 132515, "epoch": 1095} {"train_loss": -38.33991622924805, "global_step": 132516, "epoch": 1095} {"train_loss": -38.712730407714844, "global_step": 132517, "epoch": 1095} {"train_loss": -38.7703857421875, "global_step": 132518, "epoch": 1095} {"train_loss": -38.762451171875, "global_step": 132519, "epoch": 1095} {"train_loss": -38.6456413269043, "global_step": 132520, "epoch": 1095} {"train_loss": -38.432613372802734, "global_step": 132521, "epoch": 1095} {"train_loss": -38.73184585571289, "global_step": 132522, "epoch": 1095} {"train_loss": -38.645843505859375, "global_step": 132523, "epoch": 1095} {"train_loss": -38.974403381347656, "global_step": 132524, "epoch": 1095} {"train_loss": -38.65686798095703, "global_step": 132525, "epoch": 1095} {"train_loss": -38.935150146484375, "global_step": 132526, "epoch": 1095} {"train_loss": -39.056575775146484, "global_step": 132527, "epoch": 1095} {"train_loss": -38.7685432434082, "global_step": 132528, "epoch": 1095} {"train_loss": -38.95488739013672, "global_step": 132529, "epoch": 1095} {"train_loss": -39.01464080810547, "global_step": 132530, "epoch": 1095} {"train_loss": -39.04248809814453, "global_step": 132531, "epoch": 1095} {"train_loss": -39.19402313232422, "global_step": 132532, "epoch": 1095} {"train_loss": -39.58221435546875, "global_step": 132533, "epoch": 1095} {"train_loss": -39.022377014160156, "global_step": 132534, "epoch": 1095} {"train_loss": -39.12350845336914, "global_step": 132535, "epoch": 1095} {"train_loss": -38.74081039428711, "global_step": 132536, "epoch": 1095} {"train_loss": -39.48679733276367, "global_step": 132537, "epoch": 1095} {"train_loss": -39.66645431518555, "global_step": 132538, "epoch": 1095} {"train_loss": -38.73201370239258, "global_step": 132539, "epoch": 1095} {"train_loss": -39.160152435302734, "global_step": 132540, "epoch": 1095} {"train_loss": -39.60190963745117, "global_step": 132541, "epoch": 1095} {"train_loss": -38.858985900878906, "global_step": 132542, "epoch": 1095} {"train_loss": -39.58314514160156, "global_step": 132543, "epoch": 1095} {"train_loss": -39.617210388183594, "global_step": 132544, "epoch": 1095} {"train_loss": -39.742271423339844, "global_step": 132545, "epoch": 1095} {"train_loss": -39.71879959106445, "global_step": 132546, "epoch": 1095} {"train_loss": -39.70643997192383, "global_step": 132547, "epoch": 1095} {"train_loss": -39.463348388671875, "global_step": 132548, "epoch": 1095} {"train_loss": -39.5267448425293, "global_step": 132549, "epoch": 1095} {"train_loss": -39.97491455078125, "global_step": 132550, "epoch": 1095} {"train_loss": -39.84394454956055, "global_step": 132551, "epoch": 1095} {"train_loss": -39.75712966918945, "global_step": 132552, "epoch": 1095} {"train_loss": -39.7401237487793, "global_step": 132553, "epoch": 1095} {"train_loss": -40.18498229980469, "global_step": 132554, "epoch": 1095} {"train_loss": -39.3906364440918, "global_step": 132555, "epoch": 1095} {"train_loss": -39.673553466796875, "global_step": 132556, "epoch": 1095} {"train_loss": -39.3974723815918, "global_step": 132557, "epoch": 1095} {"train_loss": -39.74728012084961, "global_step": 132558, "epoch": 1095} {"train_loss": -39.96139144897461, "global_step": 132559, "epoch": 1095} {"train_loss": -39.51578903198242, "global_step": 132560, "epoch": 1095} {"train_loss": -39.79558181762695, "global_step": 132561, "epoch": 1095} {"train_loss": -39.32014846801758, "global_step": 132562, "epoch": 1095} {"train_loss": -40.023834228515625, "global_step": 132563, "epoch": 1095} {"train_loss": -39.859397888183594, "global_step": 132564, "epoch": 1095} {"train_loss": -40.20906448364258, "global_step": 132565, "epoch": 1095} {"train_loss": -39.739131927490234, "global_step": 132566, "epoch": 1095} {"train_loss": -39.6753044128418, "global_step": 132567, "epoch": 1095} {"train_loss": -39.43541717529297, "global_step": 132568, "epoch": 1095} {"train_loss": -39.564239501953125, "global_step": 132569, "epoch": 1095} {"train_loss": -39.0476188659668, "global_step": 132570, "epoch": 1095} {"train_loss": -39.758018493652344, "global_step": 132571, "epoch": 1095} {"train_loss": -38.787322998046875, "global_step": 132572, "epoch": 1095} {"train_loss": -39.943904876708984, "global_step": 132573, "epoch": 1095} {"train_loss": -40.02397155761719, "global_step": 132574, "epoch": 1095} {"train_loss": -40.301979064941406, "global_step": 132575, "epoch": 1095} {"train_loss": -39.992244720458984, "global_step": 132576, "epoch": 1095} {"train_loss": -39.896697998046875, "global_step": 132577, "epoch": 1095} {"train_loss": -39.63689422607422, "global_step": 132578, "epoch": 1095} {"train_loss": -39.67584991455078, "global_step": 132579, "epoch": 1095} {"train_loss": -38.999237060546875, "global_step": 132580, "epoch": 1095} {"train_loss": -38.06014633178711, "global_step": 132581, "epoch": 1095} {"train_loss": -38.61787414550781, "global_step": 132582, "epoch": 1095} {"train_loss": -40.27387619018555, "global_step": 132583, "epoch": 1095} {"train_loss": -39.44830322265625, "global_step": 132584, "epoch": 1095} {"train_loss": -38.66943359375, "global_step": 132585, "epoch": 1095} {"train_loss": -38.30625915527344, "global_step": 132586, "epoch": 1095} {"train_loss": -38.72520065307617, "global_step": 132587, "epoch": 1095} {"train_loss": -39.4572868347168, "global_step": 132588, "epoch": 1095} {"train_loss": -39.208003997802734, "global_step": 132589, "epoch": 1095} {"train_loss": -39.58560562133789, "global_step": 132590, "epoch": 1095} {"train_loss": -39.89609909057617, "global_step": 132591, "epoch": 1095} {"train_loss": -37.13766098022461, "global_step": 132592, "epoch": 1095} {"train_loss": -36.94229507446289, "global_step": 132593, "epoch": 1095} {"train_loss": -39.38174819946289, "global_step": 132594, "epoch": 1095} {"train_loss": -39.99102783203125, "global_step": 132595, "epoch": 1095} {"train_loss": -40.52899932861328, "global_step": 132596, "epoch": 1095} {"train_loss": -39.357757568359375, "global_step": 132597, "epoch": 1095} {"train_loss": -38.182098388671875, "global_step": 132598, "epoch": 1095} {"train_loss": -37.69326400756836, "global_step": 132599, "epoch": 1095} {"train_loss": -38.559078216552734, "global_step": 132600, "epoch": 1095} {"train_loss": -37.28519821166992, "global_step": 132601, "epoch": 1095} {"train_loss": -39.90303421020508, "global_step": 132602, "epoch": 1095} {"train_loss": -38.211421966552734, "global_step": 132603, "epoch": 1095} {"train_loss": -38.12641525268555, "global_step": 132604, "epoch": 1095} {"train_loss": -38.795631408691406, "global_step": 132605, "epoch": 1095} {"train_loss": -36.923439025878906, "global_step": 132606, "epoch": 1095} {"train_loss": -38.45931625366211, "global_step": 132607, "epoch": 1095} {"train_loss": -38.976707458496094, "global_step": 132608, "epoch": 1095} {"train_loss": -37.424102783203125, "global_step": 132609, "epoch": 1095} {"train_loss": -38.66484451293945, "global_step": 132610, "epoch": 1095} {"train_loss": -37.8770866394043, "global_step": 132611, "epoch": 1095} {"train_loss": -11.946024894714355, "global_step": 132612, "epoch": 1095} {"train_loss": -35.35798263549805, "global_step": 132613, "epoch": 1095} {"train_loss": -36.23682403564453, "global_step": 132614, "epoch": 1095} {"train_loss": -38.69314063679088, "global_step": 132615, "epoch": 1095, "val_loss": 2644358.25} {"train_loss": -32.79569625854492, "global_step": 132616, "epoch": 1096} {"train_loss": -35.22417068481445, "global_step": 132617, "epoch": 1096} {"train_loss": -36.96308517456055, "global_step": 132618, "epoch": 1096} {"train_loss": -35.2890739440918, "global_step": 132619, "epoch": 1096} {"train_loss": -34.10038375854492, "global_step": 132620, "epoch": 1096} {"train_loss": -34.23474884033203, "global_step": 132621, "epoch": 1096} {"train_loss": -35.95376205444336, "global_step": 132622, "epoch": 1096} {"train_loss": -36.8890266418457, "global_step": 132623, "epoch": 1096} {"train_loss": -36.96322250366211, "global_step": 132624, "epoch": 1096} {"train_loss": -33.70774459838867, "global_step": 132625, "epoch": 1096} {"train_loss": -33.97269821166992, "global_step": 132626, "epoch": 1096} {"train_loss": -34.2555046081543, "global_step": 132627, "epoch": 1096} {"train_loss": -32.70942306518555, "global_step": 132628, "epoch": 1096} {"train_loss": -33.11667251586914, "global_step": 132629, "epoch": 1096} {"train_loss": -36.007198333740234, "global_step": 132630, "epoch": 1096} {"train_loss": -34.2765998840332, "global_step": 132631, "epoch": 1096} {"train_loss": -35.457759857177734, "global_step": 132632, "epoch": 1096} {"train_loss": -35.02664566040039, "global_step": 132633, "epoch": 1096} {"train_loss": -34.211883544921875, "global_step": 132634, "epoch": 1096} {"train_loss": -34.79153060913086, "global_step": 132635, "epoch": 1096} {"train_loss": -36.27743911743164, "global_step": 132636, "epoch": 1096} {"train_loss": -34.40993118286133, "global_step": 132637, "epoch": 1096} {"train_loss": -35.87396240234375, "global_step": 132638, "epoch": 1096} {"train_loss": -33.19558334350586, "global_step": 132639, "epoch": 1096} {"train_loss": -34.91993713378906, "global_step": 132640, "epoch": 1096} {"train_loss": -34.65937805175781, "global_step": 132641, "epoch": 1096} {"train_loss": -37.237464904785156, "global_step": 132642, "epoch": 1096} {"train_loss": -36.88457489013672, "global_step": 132643, "epoch": 1096} {"train_loss": -37.29171371459961, "global_step": 132644, "epoch": 1096} {"train_loss": -37.01190185546875, "global_step": 132645, "epoch": 1096} {"train_loss": -36.38717269897461, "global_step": 132646, "epoch": 1096} {"train_loss": -36.364356994628906, "global_step": 132647, "epoch": 1096} {"train_loss": -36.85833740234375, "global_step": 132648, "epoch": 1096} {"train_loss": -38.07045364379883, "global_step": 132649, "epoch": 1096} {"train_loss": -37.4476203918457, "global_step": 132650, "epoch": 1096} {"train_loss": -37.11747741699219, "global_step": 132651, "epoch": 1096} {"train_loss": -37.84987258911133, "global_step": 132652, "epoch": 1096} {"train_loss": -37.64858627319336, "global_step": 132653, "epoch": 1096} {"train_loss": -36.621768951416016, "global_step": 132654, "epoch": 1096} {"train_loss": -38.174034118652344, "global_step": 132655, "epoch": 1096} {"train_loss": -36.731014251708984, "global_step": 132656, "epoch": 1096} {"train_loss": -37.999755859375, "global_step": 132657, "epoch": 1096} {"train_loss": -38.495758056640625, "global_step": 132658, "epoch": 1096} {"train_loss": -37.76259994506836, "global_step": 132659, "epoch": 1096} {"train_loss": -37.72498321533203, "global_step": 132660, "epoch": 1096} {"train_loss": -38.5736198425293, "global_step": 132661, "epoch": 1096} {"train_loss": -37.79634475708008, "global_step": 132662, "epoch": 1096} {"train_loss": -38.55678176879883, "global_step": 132663, "epoch": 1096} {"train_loss": -38.54230499267578, "global_step": 132664, "epoch": 1096} {"train_loss": -38.859405517578125, "global_step": 132665, "epoch": 1096} {"train_loss": -38.632728576660156, "global_step": 132666, "epoch": 1096} {"train_loss": -38.537166595458984, "global_step": 132667, "epoch": 1096} {"train_loss": -38.68872833251953, "global_step": 132668, "epoch": 1096} {"train_loss": -38.710994720458984, "global_step": 132669, "epoch": 1096} {"train_loss": -37.786258697509766, "global_step": 132670, "epoch": 1096} {"train_loss": -38.97644805908203, "global_step": 132671, "epoch": 1096} {"train_loss": -39.29389953613281, "global_step": 132672, "epoch": 1096} {"train_loss": -38.81687545776367, "global_step": 132673, "epoch": 1096} {"train_loss": -38.70068359375, "global_step": 132674, "epoch": 1096} {"train_loss": -38.98798370361328, "global_step": 132675, "epoch": 1096} {"train_loss": -38.81397247314453, "global_step": 132676, "epoch": 1096} {"train_loss": -39.579811096191406, "global_step": 132677, "epoch": 1096} {"train_loss": -39.29511260986328, "global_step": 132678, "epoch": 1096} {"train_loss": -38.71950149536133, "global_step": 132679, "epoch": 1096} {"train_loss": -39.41579818725586, "global_step": 132680, "epoch": 1096} {"train_loss": -39.19225311279297, "global_step": 132681, "epoch": 1096} {"train_loss": -39.270503997802734, "global_step": 132682, "epoch": 1096} {"train_loss": -39.585384368896484, "global_step": 132683, "epoch": 1096} {"train_loss": -39.04168701171875, "global_step": 132684, "epoch": 1096} {"train_loss": -39.38570785522461, "global_step": 132685, "epoch": 1096} {"train_loss": -39.101158142089844, "global_step": 132686, "epoch": 1096} {"train_loss": -39.26890182495117, "global_step": 132687, "epoch": 1096} {"train_loss": -38.63999557495117, "global_step": 132688, "epoch": 1096} {"train_loss": -39.16204071044922, "global_step": 132689, "epoch": 1096} {"train_loss": -39.373085021972656, "global_step": 132690, "epoch": 1096} {"train_loss": -39.72705078125, "global_step": 132691, "epoch": 1096} {"train_loss": -38.90351486206055, "global_step": 132692, "epoch": 1096} {"train_loss": -39.86091613769531, "global_step": 132693, "epoch": 1096} {"train_loss": -39.74679183959961, "global_step": 132694, "epoch": 1096} {"train_loss": -39.7258415222168, "global_step": 132695, "epoch": 1096} {"train_loss": -39.41206359863281, "global_step": 132696, "epoch": 1096} {"train_loss": -39.4235954284668, "global_step": 132697, "epoch": 1096} {"train_loss": -39.91347885131836, "global_step": 132698, "epoch": 1096} {"train_loss": -39.76646041870117, "global_step": 132699, "epoch": 1096} {"train_loss": -39.97246170043945, "global_step": 132700, "epoch": 1096} {"train_loss": -39.73234939575195, "global_step": 132701, "epoch": 1096} {"train_loss": -40.1067008972168, "global_step": 132702, "epoch": 1096} {"train_loss": -39.68723678588867, "global_step": 132703, "epoch": 1096} {"train_loss": -39.48258590698242, "global_step": 132704, "epoch": 1096} {"train_loss": -39.42002868652344, "global_step": 132705, "epoch": 1096} {"train_loss": -38.771297454833984, "global_step": 132706, "epoch": 1096} {"train_loss": -37.50478744506836, "global_step": 132707, "epoch": 1096} {"train_loss": -35.28852462768555, "global_step": 132708, "epoch": 1096} {"train_loss": -32.525936126708984, "global_step": 132709, "epoch": 1096} {"train_loss": -39.09310531616211, "global_step": 132710, "epoch": 1096} {"train_loss": -30.40018081665039, "global_step": 132711, "epoch": 1096} {"train_loss": -29.57623863220215, "global_step": 132712, "epoch": 1096} {"train_loss": -31.898548126220703, "global_step": 132713, "epoch": 1096} {"train_loss": -30.718412399291992, "global_step": 132714, "epoch": 1096} {"train_loss": -31.000364303588867, "global_step": 132715, "epoch": 1096} {"train_loss": -31.400175094604492, "global_step": 132716, "epoch": 1096} {"train_loss": -31.875751495361328, "global_step": 132717, "epoch": 1096} {"train_loss": -31.337568283081055, "global_step": 132718, "epoch": 1096} {"train_loss": -33.258480072021484, "global_step": 132719, "epoch": 1096} {"train_loss": -31.751571655273438, "global_step": 132720, "epoch": 1096} {"train_loss": -32.67729187011719, "global_step": 132721, "epoch": 1096} {"train_loss": -33.41503143310547, "global_step": 132722, "epoch": 1096} {"train_loss": -33.642024993896484, "global_step": 132723, "epoch": 1096} {"train_loss": -32.42509078979492, "global_step": 132724, "epoch": 1096} {"train_loss": -33.4022331237793, "global_step": 132725, "epoch": 1096} {"train_loss": -34.877830505371094, "global_step": 132726, "epoch": 1096} {"train_loss": -33.471702575683594, "global_step": 132727, "epoch": 1096} {"train_loss": -34.03481674194336, "global_step": 132728, "epoch": 1096} {"train_loss": -34.37183380126953, "global_step": 132729, "epoch": 1096} {"train_loss": -33.73159408569336, "global_step": 132730, "epoch": 1096} {"train_loss": -34.35150146484375, "global_step": 132731, "epoch": 1096} {"train_loss": -35.129825592041016, "global_step": 132732, "epoch": 1096} {"train_loss": -34.841651916503906, "global_step": 132733, "epoch": 1096} {"train_loss": -34.8637580871582, "global_step": 132734, "epoch": 1096} {"train_loss": -35.93954086303711, "global_step": 132735, "epoch": 1096} {"train_loss": -36.527452531924915, "global_step": 132736, "epoch": 1096, "val_loss": 2665806.75} {"train_loss": -35.22455978393555, "global_step": 132737, "epoch": 1097} {"train_loss": -35.676902770996094, "global_step": 132738, "epoch": 1097} {"train_loss": -35.85006332397461, "global_step": 132739, "epoch": 1097} {"train_loss": -35.67582321166992, "global_step": 132740, "epoch": 1097} {"train_loss": -36.09702682495117, "global_step": 132741, "epoch": 1097} {"train_loss": -35.372493743896484, "global_step": 132742, "epoch": 1097} {"train_loss": -36.241119384765625, "global_step": 132743, "epoch": 1097} {"train_loss": -36.885433197021484, "global_step": 132744, "epoch": 1097} {"train_loss": -36.52370834350586, "global_step": 132745, "epoch": 1097} {"train_loss": -36.31545639038086, "global_step": 132746, "epoch": 1097} {"train_loss": -35.95252227783203, "global_step": 132747, "epoch": 1097} {"train_loss": -36.51190185546875, "global_step": 132748, "epoch": 1097} {"train_loss": -37.063453674316406, "global_step": 132749, "epoch": 1097} {"train_loss": -36.767818450927734, "global_step": 132750, "epoch": 1097} {"train_loss": -36.901527404785156, "global_step": 132751, "epoch": 1097} {"train_loss": -36.88062286376953, "global_step": 132752, "epoch": 1097} {"train_loss": -36.996150970458984, "global_step": 132753, "epoch": 1097} {"train_loss": -37.60994338989258, "global_step": 132754, "epoch": 1097} {"train_loss": -37.78704833984375, "global_step": 132755, "epoch": 1097} {"train_loss": -37.07845687866211, "global_step": 132756, "epoch": 1097} {"train_loss": -36.54840087890625, "global_step": 132757, "epoch": 1097} {"train_loss": -35.0584831237793, "global_step": 132758, "epoch": 1097} {"train_loss": -37.07712936401367, "global_step": 132759, "epoch": 1097} {"train_loss": -36.66065979003906, "global_step": 132760, "epoch": 1097} {"train_loss": -35.5980339050293, "global_step": 132761, "epoch": 1097} {"train_loss": -36.12030792236328, "global_step": 132762, "epoch": 1097} {"train_loss": -35.777095794677734, "global_step": 132763, "epoch": 1097} {"train_loss": -37.43756866455078, "global_step": 132764, "epoch": 1097} {"train_loss": -36.309017181396484, "global_step": 132765, "epoch": 1097} {"train_loss": -35.31436538696289, "global_step": 132766, "epoch": 1097} {"train_loss": -35.88225555419922, "global_step": 132767, "epoch": 1097} {"train_loss": -35.60625076293945, "global_step": 132768, "epoch": 1097} {"train_loss": -31.628808975219727, "global_step": 132769, "epoch": 1097} {"train_loss": -36.28535842895508, "global_step": 132770, "epoch": 1097} {"train_loss": -35.58177185058594, "global_step": 132771, "epoch": 1097} {"train_loss": -36.3531379699707, "global_step": 132772, "epoch": 1097} {"train_loss": -36.60901641845703, "global_step": 132773, "epoch": 1097} {"train_loss": -34.527381896972656, "global_step": 132774, "epoch": 1097} {"train_loss": -36.04727554321289, "global_step": 132775, "epoch": 1097} {"train_loss": -35.75004577636719, "global_step": 132776, "epoch": 1097} {"train_loss": -37.10146713256836, "global_step": 132777, "epoch": 1097} {"train_loss": -36.28499221801758, "global_step": 132778, "epoch": 1097} {"train_loss": -36.641754150390625, "global_step": 132779, "epoch": 1097} {"train_loss": -36.09564971923828, "global_step": 132780, "epoch": 1097} {"train_loss": -37.248741149902344, "global_step": 132781, "epoch": 1097} {"train_loss": -37.118648529052734, "global_step": 132782, "epoch": 1097} {"train_loss": -37.75654602050781, "global_step": 132783, "epoch": 1097} {"train_loss": -37.98164749145508, "global_step": 132784, "epoch": 1097} {"train_loss": -37.388824462890625, "global_step": 132785, "epoch": 1097} {"train_loss": -37.85653305053711, "global_step": 132786, "epoch": 1097} {"train_loss": -38.32143020629883, "global_step": 132787, "epoch": 1097} {"train_loss": -38.05836868286133, "global_step": 132788, "epoch": 1097} {"train_loss": -38.15260696411133, "global_step": 132789, "epoch": 1097} {"train_loss": -37.62482452392578, "global_step": 132790, "epoch": 1097} {"train_loss": -37.56621170043945, "global_step": 132791, "epoch": 1097} {"train_loss": -38.55330276489258, "global_step": 132792, "epoch": 1097} {"train_loss": -38.46891403198242, "global_step": 132793, "epoch": 1097} {"train_loss": -38.39898681640625, "global_step": 132794, "epoch": 1097} {"train_loss": -38.08237838745117, "global_step": 132795, "epoch": 1097} {"train_loss": -38.298763275146484, "global_step": 132796, "epoch": 1097} {"train_loss": -38.21169662475586, "global_step": 132797, "epoch": 1097} {"train_loss": -38.20341110229492, "global_step": 132798, "epoch": 1097} {"train_loss": -38.72731018066406, "global_step": 132799, "epoch": 1097} {"train_loss": -38.158504486083984, "global_step": 132800, "epoch": 1097} {"train_loss": -37.92391586303711, "global_step": 132801, "epoch": 1097} {"train_loss": -38.752723693847656, "global_step": 132802, "epoch": 1097} {"train_loss": -38.67649459838867, "global_step": 132803, "epoch": 1097} {"train_loss": -38.99745559692383, "global_step": 132804, "epoch": 1097} {"train_loss": -38.241764068603516, "global_step": 132805, "epoch": 1097} {"train_loss": -37.7369270324707, "global_step": 132806, "epoch": 1097} {"train_loss": -36.60224151611328, "global_step": 132807, "epoch": 1097} {"train_loss": -37.002376556396484, "global_step": 132808, "epoch": 1097} {"train_loss": -38.69843673706055, "global_step": 132809, "epoch": 1097} {"train_loss": -38.63481521606445, "global_step": 132810, "epoch": 1097} {"train_loss": -38.154945373535156, "global_step": 132811, "epoch": 1097} {"train_loss": -38.54368209838867, "global_step": 132812, "epoch": 1097} {"train_loss": -37.44929504394531, "global_step": 132813, "epoch": 1097} {"train_loss": -38.9840087890625, "global_step": 132814, "epoch": 1097} {"train_loss": -38.17380142211914, "global_step": 132815, "epoch": 1097} {"train_loss": -38.195655822753906, "global_step": 132816, "epoch": 1097} {"train_loss": -38.75675582885742, "global_step": 132817, "epoch": 1097} {"train_loss": -39.039302825927734, "global_step": 132818, "epoch": 1097} {"train_loss": -38.34312057495117, "global_step": 132819, "epoch": 1097} {"train_loss": -38.43985366821289, "global_step": 132820, "epoch": 1097} {"train_loss": -39.01082992553711, "global_step": 132821, "epoch": 1097} {"train_loss": -37.839054107666016, "global_step": 132822, "epoch": 1097} {"train_loss": -39.48170852661133, "global_step": 132823, "epoch": 1097} {"train_loss": -38.50565719604492, "global_step": 132824, "epoch": 1097} {"train_loss": -39.21684646606445, "global_step": 132825, "epoch": 1097} {"train_loss": -38.65778350830078, "global_step": 132826, "epoch": 1097} {"train_loss": -38.818416595458984, "global_step": 132827, "epoch": 1097} {"train_loss": -39.18609619140625, "global_step": 132828, "epoch": 1097} {"train_loss": -39.457393646240234, "global_step": 132829, "epoch": 1097} {"train_loss": -39.08007049560547, "global_step": 132830, "epoch": 1097} {"train_loss": -39.60979461669922, "global_step": 132831, "epoch": 1097} {"train_loss": -38.87422561645508, "global_step": 132832, "epoch": 1097} {"train_loss": -38.80720138549805, "global_step": 132833, "epoch": 1097} {"train_loss": -39.7120361328125, "global_step": 132834, "epoch": 1097} {"train_loss": -38.952415466308594, "global_step": 132835, "epoch": 1097} {"train_loss": -37.649314880371094, "global_step": 132836, "epoch": 1097} {"train_loss": -39.017826080322266, "global_step": 132837, "epoch": 1097} {"train_loss": -38.322914123535156, "global_step": 132838, "epoch": 1097} {"train_loss": -37.2829475402832, "global_step": 132839, "epoch": 1097} {"train_loss": -36.53994369506836, "global_step": 132840, "epoch": 1097} {"train_loss": -35.001670837402344, "global_step": 132841, "epoch": 1097} {"train_loss": -36.72652816772461, "global_step": 132842, "epoch": 1097} {"train_loss": -36.86423873901367, "global_step": 132843, "epoch": 1097} {"train_loss": -34.35586929321289, "global_step": 132844, "epoch": 1097} {"train_loss": -36.26713180541992, "global_step": 132845, "epoch": 1097} {"train_loss": -36.56583786010742, "global_step": 132846, "epoch": 1097} {"train_loss": -36.8695182800293, "global_step": 132847, "epoch": 1097} {"train_loss": -38.568077087402344, "global_step": 132848, "epoch": 1097} {"train_loss": -35.27981185913086, "global_step": 132849, "epoch": 1097} {"train_loss": -36.79901885986328, "global_step": 132850, "epoch": 1097} {"train_loss": -37.54132080078125, "global_step": 132851, "epoch": 1097} {"train_loss": -37.31425094604492, "global_step": 132852, "epoch": 1097} {"train_loss": -38.025596618652344, "global_step": 132853, "epoch": 1097} {"train_loss": -37.45769119262695, "global_step": 132854, "epoch": 1097} {"train_loss": -37.19715118408203, "global_step": 132855, "epoch": 1097} {"train_loss": -37.53493881225586, "global_step": 132856, "epoch": 1097} {"train_loss": -37.331516975213674, "global_step": 132857, "epoch": 1097, "val_loss": 2668771.75} {"train_loss": -37.99098205566406, "global_step": 132858, "epoch": 1098} {"train_loss": -37.86920928955078, "global_step": 132859, "epoch": 1098} {"train_loss": -38.84487533569336, "global_step": 132860, "epoch": 1098} {"train_loss": -37.46240234375, "global_step": 132861, "epoch": 1098} {"train_loss": -38.25066375732422, "global_step": 132862, "epoch": 1098} {"train_loss": -37.922996520996094, "global_step": 132863, "epoch": 1098} {"train_loss": -37.716312408447266, "global_step": 132864, "epoch": 1098} {"train_loss": -38.516944885253906, "global_step": 132865, "epoch": 1098} {"train_loss": -38.03723907470703, "global_step": 132866, "epoch": 1098} {"train_loss": -38.8704948425293, "global_step": 132867, "epoch": 1098} {"train_loss": -38.60092544555664, "global_step": 132868, "epoch": 1098} {"train_loss": -38.700233459472656, "global_step": 132869, "epoch": 1098} {"train_loss": -38.504634857177734, "global_step": 132870, "epoch": 1098} {"train_loss": -38.17991256713867, "global_step": 132871, "epoch": 1098} {"train_loss": -38.375667572021484, "global_step": 132872, "epoch": 1098} {"train_loss": -37.7926025390625, "global_step": 132873, "epoch": 1098} {"train_loss": -38.51708984375, "global_step": 132874, "epoch": 1098} {"train_loss": -38.50305938720703, "global_step": 132875, "epoch": 1098} {"train_loss": -38.2212028503418, "global_step": 132876, "epoch": 1098} {"train_loss": -38.23469161987305, "global_step": 132877, "epoch": 1098} {"train_loss": -36.9246940612793, "global_step": 132878, "epoch": 1098} {"train_loss": -38.546573638916016, "global_step": 132879, "epoch": 1098} {"train_loss": -37.37239456176758, "global_step": 132880, "epoch": 1098} {"train_loss": -36.22941970825195, "global_step": 132881, "epoch": 1098} {"train_loss": -38.293121337890625, "global_step": 132882, "epoch": 1098} {"train_loss": -38.27839279174805, "global_step": 132883, "epoch": 1098} {"train_loss": -37.82162094116211, "global_step": 132884, "epoch": 1098} {"train_loss": -33.6351318359375, "global_step": 132885, "epoch": 1098} {"train_loss": -33.245452880859375, "global_step": 132886, "epoch": 1098} {"train_loss": -37.090599060058594, "global_step": 132887, "epoch": 1098} {"train_loss": -38.4539794921875, "global_step": 132888, "epoch": 1098} {"train_loss": -36.45930862426758, "global_step": 132889, "epoch": 1098} {"train_loss": -38.45989990234375, "global_step": 132890, "epoch": 1098} {"train_loss": -38.7335090637207, "global_step": 132891, "epoch": 1098} {"train_loss": -38.386837005615234, "global_step": 132892, "epoch": 1098} {"train_loss": -38.45355224609375, "global_step": 132893, "epoch": 1098} {"train_loss": -38.714107513427734, "global_step": 132894, "epoch": 1098} {"train_loss": -38.92081832885742, "global_step": 132895, "epoch": 1098} {"train_loss": -39.2862434387207, "global_step": 132896, "epoch": 1098} {"train_loss": -38.62102127075195, "global_step": 132897, "epoch": 1098} {"train_loss": -39.29231643676758, "global_step": 132898, "epoch": 1098} {"train_loss": -39.12474060058594, "global_step": 132899, "epoch": 1098} {"train_loss": -39.2181510925293, "global_step": 132900, "epoch": 1098} {"train_loss": -40.06404495239258, "global_step": 132901, "epoch": 1098} {"train_loss": -38.993778228759766, "global_step": 132902, "epoch": 1098} {"train_loss": -39.58564758300781, "global_step": 132903, "epoch": 1098} {"train_loss": -40.107688903808594, "global_step": 132904, "epoch": 1098} {"train_loss": -39.491432189941406, "global_step": 132905, "epoch": 1098} {"train_loss": -39.27988815307617, "global_step": 132906, "epoch": 1098} {"train_loss": -39.243804931640625, "global_step": 132907, "epoch": 1098} {"train_loss": -39.643672943115234, "global_step": 132908, "epoch": 1098} {"train_loss": -39.31525421142578, "global_step": 132909, "epoch": 1098} {"train_loss": -39.26225662231445, "global_step": 132910, "epoch": 1098} {"train_loss": -39.74589920043945, "global_step": 132911, "epoch": 1098} {"train_loss": -39.32620620727539, "global_step": 132912, "epoch": 1098} {"train_loss": -39.124305725097656, "global_step": 132913, "epoch": 1098} {"train_loss": -39.63861083984375, "global_step": 132914, "epoch": 1098} {"train_loss": -39.51128005981445, "global_step": 132915, "epoch": 1098} {"train_loss": -39.913509368896484, "global_step": 132916, "epoch": 1098} {"train_loss": -39.46910858154297, "global_step": 132917, "epoch": 1098} {"train_loss": -39.381675720214844, "global_step": 132918, "epoch": 1098} {"train_loss": -39.31891632080078, "global_step": 132919, "epoch": 1098} {"train_loss": -39.791805267333984, "global_step": 132920, "epoch": 1098} {"train_loss": -39.8743896484375, "global_step": 132921, "epoch": 1098} {"train_loss": -38.805145263671875, "global_step": 132922, "epoch": 1098} {"train_loss": -36.984493255615234, "global_step": 132923, "epoch": 1098} {"train_loss": -34.68017578125, "global_step": 132924, "epoch": 1098} {"train_loss": -32.159637451171875, "global_step": 132925, "epoch": 1098} {"train_loss": -32.57609939575195, "global_step": 132926, "epoch": 1098} {"train_loss": -34.9509391784668, "global_step": 132927, "epoch": 1098} {"train_loss": -35.67060089111328, "global_step": 132928, "epoch": 1098} {"train_loss": -36.05305480957031, "global_step": 132929, "epoch": 1098} {"train_loss": -39.14040756225586, "global_step": 132930, "epoch": 1098} {"train_loss": -36.45216751098633, "global_step": 132931, "epoch": 1098} {"train_loss": -39.08210372924805, "global_step": 132932, "epoch": 1098} {"train_loss": -38.25437545776367, "global_step": 132933, "epoch": 1098} {"train_loss": -38.62385559082031, "global_step": 132934, "epoch": 1098} {"train_loss": -39.4160041809082, "global_step": 132935, "epoch": 1098} {"train_loss": -38.41809844970703, "global_step": 132936, "epoch": 1098} {"train_loss": -37.92284393310547, "global_step": 132937, "epoch": 1098} {"train_loss": -39.6807746887207, "global_step": 132938, "epoch": 1098} {"train_loss": -38.71339797973633, "global_step": 132939, "epoch": 1098} {"train_loss": -38.8485221862793, "global_step": 132940, "epoch": 1098} {"train_loss": -38.767330169677734, "global_step": 132941, "epoch": 1098} {"train_loss": -38.966461181640625, "global_step": 132942, "epoch": 1098} {"train_loss": -38.0928955078125, "global_step": 132943, "epoch": 1098} {"train_loss": -39.433712005615234, "global_step": 132944, "epoch": 1098} {"train_loss": -38.592071533203125, "global_step": 132945, "epoch": 1098} {"train_loss": -38.94849395751953, "global_step": 132946, "epoch": 1098} {"train_loss": -38.92550277709961, "global_step": 132947, "epoch": 1098} {"train_loss": -39.46847152709961, "global_step": 132948, "epoch": 1098} {"train_loss": -38.55439758300781, "global_step": 132949, "epoch": 1098} {"train_loss": -38.97504806518555, "global_step": 132950, "epoch": 1098} {"train_loss": -39.751434326171875, "global_step": 132951, "epoch": 1098} {"train_loss": -38.829891204833984, "global_step": 132952, "epoch": 1098} {"train_loss": -39.69546127319336, "global_step": 132953, "epoch": 1098} {"train_loss": -38.85884094238281, "global_step": 132954, "epoch": 1098} {"train_loss": -39.76399612426758, "global_step": 132955, "epoch": 1098} {"train_loss": -39.494544982910156, "global_step": 132956, "epoch": 1098} {"train_loss": -39.11762237548828, "global_step": 132957, "epoch": 1098} {"train_loss": -39.15676498413086, "global_step": 132958, "epoch": 1098} {"train_loss": -39.347381591796875, "global_step": 132959, "epoch": 1098} {"train_loss": -39.8279914855957, "global_step": 132960, "epoch": 1098} {"train_loss": -39.658599853515625, "global_step": 132961, "epoch": 1098} {"train_loss": -39.505462646484375, "global_step": 132962, "epoch": 1098} {"train_loss": -38.92095184326172, "global_step": 132963, "epoch": 1098} {"train_loss": -39.374210357666016, "global_step": 132964, "epoch": 1098} {"train_loss": -39.57282257080078, "global_step": 132965, "epoch": 1098} {"train_loss": -38.8619499206543, "global_step": 132966, "epoch": 1098} {"train_loss": -37.68446731567383, "global_step": 132967, "epoch": 1098} {"train_loss": -34.54861068725586, "global_step": 132968, "epoch": 1098} {"train_loss": -35.68904495239258, "global_step": 132969, "epoch": 1098} {"train_loss": -37.31913375854492, "global_step": 132970, "epoch": 1098} {"train_loss": -36.16378402709961, "global_step": 132971, "epoch": 1098} {"train_loss": -36.05044174194336, "global_step": 132972, "epoch": 1098} {"train_loss": -39.53567123413086, "global_step": 132973, "epoch": 1098} {"train_loss": -38.58320999145508, "global_step": 132974, "epoch": 1098} {"train_loss": -39.17280197143555, "global_step": 132975, "epoch": 1098} {"train_loss": -38.57462692260742, "global_step": 132976, "epoch": 1098} {"train_loss": -39.05001449584961, "global_step": 132977, "epoch": 1098} {"train_loss": -38.34997772973431, "global_step": 132978, "epoch": 1098, "val_loss": 2632685.25} {"train_loss": -39.38140869140625, "global_step": 132979, "epoch": 1099} {"train_loss": -38.633182525634766, "global_step": 132980, "epoch": 1099} {"train_loss": -39.07792282104492, "global_step": 132981, "epoch": 1099} {"train_loss": -39.06734085083008, "global_step": 132982, "epoch": 1099} {"train_loss": -39.078365325927734, "global_step": 132983, "epoch": 1099} {"train_loss": -38.87163162231445, "global_step": 132984, "epoch": 1099} {"train_loss": -38.69655990600586, "global_step": 132985, "epoch": 1099} {"train_loss": -39.50153732299805, "global_step": 132986, "epoch": 1099} {"train_loss": -39.18928909301758, "global_step": 132987, "epoch": 1099} {"train_loss": -39.33698272705078, "global_step": 132988, "epoch": 1099} {"train_loss": -39.44808578491211, "global_step": 132989, "epoch": 1099} {"train_loss": -39.51105880737305, "global_step": 132990, "epoch": 1099} {"train_loss": -39.658447265625, "global_step": 132991, "epoch": 1099} {"train_loss": -40.14449691772461, "global_step": 132992, "epoch": 1099} {"train_loss": -38.71021270751953, "global_step": 132993, "epoch": 1099} {"train_loss": -39.79415512084961, "global_step": 132994, "epoch": 1099} {"train_loss": -40.4449348449707, "global_step": 132995, "epoch": 1099} {"train_loss": -39.89796447753906, "global_step": 132996, "epoch": 1099} {"train_loss": -39.80437088012695, "global_step": 132997, "epoch": 1099} {"train_loss": -40.11320877075195, "global_step": 132998, "epoch": 1099} {"train_loss": -39.18035125732422, "global_step": 132999, "epoch": 1099} {"train_loss": -39.005943298339844, "global_step": 133000, "epoch": 1099} {"train_loss": -38.66440963745117, "global_step": 133001, "epoch": 1099} {"train_loss": -39.829715728759766, "global_step": 133002, "epoch": 1099} {"train_loss": -40.203887939453125, "global_step": 133003, "epoch": 1099} {"train_loss": -40.05508804321289, "global_step": 133004, "epoch": 1099} {"train_loss": -39.74668502807617, "global_step": 133005, "epoch": 1099} {"train_loss": -40.23733139038086, "global_step": 133006, "epoch": 1099} {"train_loss": -39.70630645751953, "global_step": 133007, "epoch": 1099} {"train_loss": -39.335201263427734, "global_step": 133008, "epoch": 1099} {"train_loss": -37.1083869934082, "global_step": 133009, "epoch": 1099} {"train_loss": -36.14443588256836, "global_step": 133010, "epoch": 1099} {"train_loss": -35.146610260009766, "global_step": 133011, "epoch": 1099} {"train_loss": -37.56629180908203, "global_step": 133012, "epoch": 1099} {"train_loss": -39.79670333862305, "global_step": 133013, "epoch": 1099} {"train_loss": -39.534420013427734, "global_step": 133014, "epoch": 1099} {"train_loss": -38.33974838256836, "global_step": 133015, "epoch": 1099} {"train_loss": -38.278961181640625, "global_step": 133016, "epoch": 1099} {"train_loss": -38.83699417114258, "global_step": 133017, "epoch": 1099} {"train_loss": -38.47783279418945, "global_step": 133018, "epoch": 1099} {"train_loss": -39.58422088623047, "global_step": 133019, "epoch": 1099} {"train_loss": -38.372230529785156, "global_step": 133020, "epoch": 1099} {"train_loss": -39.24229431152344, "global_step": 133021, "epoch": 1099} {"train_loss": -39.289466857910156, "global_step": 133022, "epoch": 1099} {"train_loss": -39.14027786254883, "global_step": 133023, "epoch": 1099} {"train_loss": -39.4507942199707, "global_step": 133024, "epoch": 1099} {"train_loss": -39.7709846496582, "global_step": 133025, "epoch": 1099} {"train_loss": -39.81682586669922, "global_step": 133026, "epoch": 1099} {"train_loss": -40.259925842285156, "global_step": 133027, "epoch": 1099} {"train_loss": -39.9263801574707, "global_step": 133028, "epoch": 1099} {"train_loss": -39.20499801635742, "global_step": 133029, "epoch": 1099} {"train_loss": -39.76386260986328, "global_step": 133030, "epoch": 1099} {"train_loss": -39.49982833862305, "global_step": 133031, "epoch": 1099} {"train_loss": -39.79281234741211, "global_step": 133032, "epoch": 1099} {"train_loss": -40.1396484375, "global_step": 133033, "epoch": 1099} {"train_loss": -39.65385055541992, "global_step": 133034, "epoch": 1099} {"train_loss": -40.46928787231445, "global_step": 133035, "epoch": 1099} {"train_loss": -39.37631607055664, "global_step": 133036, "epoch": 1099} {"train_loss": -39.7024040222168, "global_step": 133037, "epoch": 1099} {"train_loss": -40.01041793823242, "global_step": 133038, "epoch": 1099} {"train_loss": -39.91980743408203, "global_step": 133039, "epoch": 1099} {"train_loss": -38.70074462890625, "global_step": 133040, "epoch": 1099} {"train_loss": -39.21284103393555, "global_step": 133041, "epoch": 1099} {"train_loss": -40.313236236572266, "global_step": 133042, "epoch": 1099} {"train_loss": -38.56881332397461, "global_step": 133043, "epoch": 1099} {"train_loss": -40.212860107421875, "global_step": 133044, "epoch": 1099} {"train_loss": -39.55158615112305, "global_step": 133045, "epoch": 1099} {"train_loss": -39.451637268066406, "global_step": 133046, "epoch": 1099} {"train_loss": -39.447147369384766, "global_step": 133047, "epoch": 1099} {"train_loss": -39.49635696411133, "global_step": 133048, "epoch": 1099} {"train_loss": -38.19419479370117, "global_step": 133049, "epoch": 1099} {"train_loss": -38.718048095703125, "global_step": 133050, "epoch": 1099} {"train_loss": -39.293087005615234, "global_step": 133051, "epoch": 1099} {"train_loss": -39.03775405883789, "global_step": 133052, "epoch": 1099} {"train_loss": -39.21311569213867, "global_step": 133053, "epoch": 1099} {"train_loss": -35.37324142456055, "global_step": 133054, "epoch": 1099} {"train_loss": -38.847389221191406, "global_step": 133055, "epoch": 1099} {"train_loss": -39.75954055786133, "global_step": 133056, "epoch": 1099} {"train_loss": -36.88960647583008, "global_step": 133057, "epoch": 1099} {"train_loss": -38.29814147949219, "global_step": 133058, "epoch": 1099} {"train_loss": -35.4384880065918, "global_step": 133059, "epoch": 1099} {"train_loss": -37.97687530517578, "global_step": 133060, "epoch": 1099} {"train_loss": -32.62467956542969, "global_step": 133061, "epoch": 1099} {"train_loss": -38.55794143676758, "global_step": 133062, "epoch": 1099} {"train_loss": -35.11466598510742, "global_step": 133063, "epoch": 1099} {"train_loss": -36.906150817871094, "global_step": 133064, "epoch": 1099} {"train_loss": -36.408164978027344, "global_step": 133065, "epoch": 1099} {"train_loss": -34.744258880615234, "global_step": 133066, "epoch": 1099} {"train_loss": -36.05244827270508, "global_step": 133067, "epoch": 1099} {"train_loss": -36.09552764892578, "global_step": 133068, "epoch": 1099} {"train_loss": -35.41132354736328, "global_step": 133069, "epoch": 1099} {"train_loss": -37.35608673095703, "global_step": 133070, "epoch": 1099} {"train_loss": -35.5811767578125, "global_step": 133071, "epoch": 1099} {"train_loss": -35.97328567504883, "global_step": 133072, "epoch": 1099} {"train_loss": -38.095375061035156, "global_step": 133073, "epoch": 1099} {"train_loss": -35.15128707885742, "global_step": 133074, "epoch": 1099} {"train_loss": -35.892127990722656, "global_step": 133075, "epoch": 1099} {"train_loss": -34.61439514160156, "global_step": 133076, "epoch": 1099} {"train_loss": -35.4276123046875, "global_step": 133077, "epoch": 1099} {"train_loss": -31.562427520751953, "global_step": 133078, "epoch": 1099} {"train_loss": -35.532447814941406, "global_step": 133079, "epoch": 1099} {"train_loss": -34.86764907836914, "global_step": 133080, "epoch": 1099} {"train_loss": -37.99421691894531, "global_step": 133081, "epoch": 1099} {"train_loss": -34.2724723815918, "global_step": 133082, "epoch": 1099} {"train_loss": -36.65284729003906, "global_step": 133083, "epoch": 1099} {"train_loss": -36.43902587890625, "global_step": 133084, "epoch": 1099} {"train_loss": -33.57493591308594, "global_step": 133085, "epoch": 1099} {"train_loss": -37.85437774658203, "global_step": 133086, "epoch": 1099} {"train_loss": -37.320648193359375, "global_step": 133087, "epoch": 1099} {"train_loss": -37.124183654785156, "global_step": 133088, "epoch": 1099} {"train_loss": -36.215965270996094, "global_step": 133089, "epoch": 1099} {"train_loss": -37.67318344116211, "global_step": 133090, "epoch": 1099} {"train_loss": -37.158382415771484, "global_step": 133091, "epoch": 1099} {"train_loss": -37.8950309753418, "global_step": 133092, "epoch": 1099} {"train_loss": -36.90100860595703, "global_step": 133093, "epoch": 1099} {"train_loss": -37.49688720703125, "global_step": 133094, "epoch": 1099} {"train_loss": -37.89681625366211, "global_step": 133095, "epoch": 1099} {"train_loss": -37.86050796508789, "global_step": 133096, "epoch": 1099} {"train_loss": -37.404850006103516, "global_step": 133097, "epoch": 1099} {"train_loss": -37.98072052001953, "global_step": 133098, "epoch": 1099} {"train_loss": -38.19730752361708, "global_step": 133099, "epoch": 1099, "val_loss": 2564115.25} {"train_loss": -37.48032760620117, "global_step": 133100, "epoch": 1100} {"train_loss": -37.97278594970703, "global_step": 133101, "epoch": 1100} {"train_loss": -38.74689483642578, "global_step": 133102, "epoch": 1100} {"train_loss": -36.32766342163086, "global_step": 133103, "epoch": 1100} {"train_loss": -38.176570892333984, "global_step": 133104, "epoch": 1100} {"train_loss": -37.941741943359375, "global_step": 133105, "epoch": 1100} {"train_loss": -37.83838653564453, "global_step": 133106, "epoch": 1100} {"train_loss": -37.067745208740234, "global_step": 133107, "epoch": 1100} {"train_loss": -38.612274169921875, "global_step": 133108, "epoch": 1100} {"train_loss": -37.132991790771484, "global_step": 133109, "epoch": 1100} {"train_loss": -38.6640510559082, "global_step": 133110, "epoch": 1100} {"train_loss": -37.99047088623047, "global_step": 133111, "epoch": 1100} {"train_loss": -38.193359375, "global_step": 133112, "epoch": 1100} {"train_loss": -38.95878219604492, "global_step": 133113, "epoch": 1100} {"train_loss": -38.23868942260742, "global_step": 133114, "epoch": 1100} {"train_loss": -38.94834518432617, "global_step": 133115, "epoch": 1100} {"train_loss": -38.806236267089844, "global_step": 133116, "epoch": 1100} {"train_loss": -38.04506301879883, "global_step": 133117, "epoch": 1100} {"train_loss": -38.994380950927734, "global_step": 133118, "epoch": 1100} {"train_loss": -38.513099670410156, "global_step": 133119, "epoch": 1100} {"train_loss": -38.959083557128906, "global_step": 133120, "epoch": 1100} {"train_loss": -38.62284851074219, "global_step": 133121, "epoch": 1100} {"train_loss": -38.48134994506836, "global_step": 133122, "epoch": 1100} {"train_loss": -39.334041595458984, "global_step": 133123, "epoch": 1100} {"train_loss": -38.481971740722656, "global_step": 133124, "epoch": 1100} {"train_loss": -38.19506072998047, "global_step": 133125, "epoch": 1100} {"train_loss": -38.73270797729492, "global_step": 133126, "epoch": 1100} {"train_loss": -37.92052459716797, "global_step": 133127, "epoch": 1100} {"train_loss": -38.49076461791992, "global_step": 133128, "epoch": 1100} {"train_loss": -38.811302185058594, "global_step": 133129, "epoch": 1100} {"train_loss": -38.953453063964844, "global_step": 133130, "epoch": 1100} {"train_loss": -38.00859451293945, "global_step": 133131, "epoch": 1100} {"train_loss": -38.94196701049805, "global_step": 133132, "epoch": 1100} {"train_loss": -37.55669021606445, "global_step": 133133, "epoch": 1100} {"train_loss": -38.62578201293945, "global_step": 133134, "epoch": 1100} {"train_loss": -38.48892593383789, "global_step": 133135, "epoch": 1100} {"train_loss": -37.60451126098633, "global_step": 133136, "epoch": 1100} {"train_loss": -38.47861099243164, "global_step": 133137, "epoch": 1100} {"train_loss": -38.79458236694336, "global_step": 133138, "epoch": 1100} {"train_loss": -38.19940948486328, "global_step": 133139, "epoch": 1100} {"train_loss": -38.449764251708984, "global_step": 133140, "epoch": 1100} {"train_loss": -38.304866790771484, "global_step": 133141, "epoch": 1100} {"train_loss": -38.76603317260742, "global_step": 133142, "epoch": 1100} {"train_loss": -37.784664154052734, "global_step": 133143, "epoch": 1100} {"train_loss": -38.21000289916992, "global_step": 133144, "epoch": 1100} {"train_loss": -38.3696403503418, "global_step": 133145, "epoch": 1100} {"train_loss": -37.61496353149414, "global_step": 133146, "epoch": 1100} {"train_loss": -38.99056625366211, "global_step": 133147, "epoch": 1100} {"train_loss": -37.97639465332031, "global_step": 133148, "epoch": 1100} {"train_loss": -38.94393539428711, "global_step": 133149, "epoch": 1100} {"train_loss": -37.3674201965332, "global_step": 133150, "epoch": 1100} {"train_loss": -36.814292907714844, "global_step": 133151, "epoch": 1100} {"train_loss": -37.975624084472656, "global_step": 133152, "epoch": 1100} {"train_loss": -38.58418655395508, "global_step": 133153, "epoch": 1100} {"train_loss": -39.14910888671875, "global_step": 133154, "epoch": 1100} {"train_loss": -38.65796661376953, "global_step": 133155, "epoch": 1100} {"train_loss": -36.88165283203125, "global_step": 133156, "epoch": 1100} {"train_loss": -38.13602828979492, "global_step": 133157, "epoch": 1100} {"train_loss": -38.9859619140625, "global_step": 133158, "epoch": 1100} {"train_loss": -36.89152145385742, "global_step": 133159, "epoch": 1100} {"train_loss": -37.998252868652344, "global_step": 133160, "epoch": 1100} {"train_loss": -38.35321807861328, "global_step": 133161, "epoch": 1100} {"train_loss": -37.48200607299805, "global_step": 133162, "epoch": 1100} {"train_loss": -37.88227844238281, "global_step": 133163, "epoch": 1100} {"train_loss": -37.53722381591797, "global_step": 133164, "epoch": 1100} {"train_loss": -37.163551330566406, "global_step": 133165, "epoch": 1100} {"train_loss": -36.21709442138672, "global_step": 133166, "epoch": 1100} {"train_loss": -38.49951171875, "global_step": 133167, "epoch": 1100} {"train_loss": -37.87093734741211, "global_step": 133168, "epoch": 1100} {"train_loss": -37.73046875, "global_step": 133169, "epoch": 1100} {"train_loss": -38.57181930541992, "global_step": 133170, "epoch": 1100} {"train_loss": -36.819305419921875, "global_step": 133171, "epoch": 1100} {"train_loss": -37.468990325927734, "global_step": 133172, "epoch": 1100} {"train_loss": -37.63462448120117, "global_step": 133173, "epoch": 1100} {"train_loss": -37.07060623168945, "global_step": 133174, "epoch": 1100} {"train_loss": -37.26913070678711, "global_step": 133175, "epoch": 1100} {"train_loss": -38.583351135253906, "global_step": 133176, "epoch": 1100} {"train_loss": -37.531272888183594, "global_step": 133177, "epoch": 1100} {"train_loss": -36.26937484741211, "global_step": 133178, "epoch": 1100} {"train_loss": -37.89614486694336, "global_step": 133179, "epoch": 1100} {"train_loss": -37.48276901245117, "global_step": 133180, "epoch": 1100} {"train_loss": -37.86512756347656, "global_step": 133181, "epoch": 1100} {"train_loss": -38.3377799987793, "global_step": 133182, "epoch": 1100} {"train_loss": -38.153114318847656, "global_step": 133183, "epoch": 1100} {"train_loss": -36.39905548095703, "global_step": 133184, "epoch": 1100} {"train_loss": -36.70343780517578, "global_step": 133185, "epoch": 1100} {"train_loss": -36.26190948486328, "global_step": 133186, "epoch": 1100} {"train_loss": -38.1937255859375, "global_step": 133187, "epoch": 1100} {"train_loss": -38.727352142333984, "global_step": 133188, "epoch": 1100} {"train_loss": -36.75468826293945, "global_step": 133189, "epoch": 1100} {"train_loss": -37.3432731628418, "global_step": 133190, "epoch": 1100} {"train_loss": -38.61753463745117, "global_step": 133191, "epoch": 1100} {"train_loss": -37.23857116699219, "global_step": 133192, "epoch": 1100} {"train_loss": -38.41960906982422, "global_step": 133193, "epoch": 1100} {"train_loss": -38.3179817199707, "global_step": 133194, "epoch": 1100} {"train_loss": -37.250221252441406, "global_step": 133195, "epoch": 1100} {"train_loss": -39.061038970947266, "global_step": 133196, "epoch": 1100} {"train_loss": -38.08672332763672, "global_step": 133197, "epoch": 1100} {"train_loss": -38.69799041748047, "global_step": 133198, "epoch": 1100} {"train_loss": -39.013580322265625, "global_step": 133199, "epoch": 1100} {"train_loss": -39.04615020751953, "global_step": 133200, "epoch": 1100} {"train_loss": -39.65549850463867, "global_step": 133201, "epoch": 1100} {"train_loss": -39.4506950378418, "global_step": 133202, "epoch": 1100} {"train_loss": -39.77473068237305, "global_step": 133203, "epoch": 1100} {"train_loss": -38.80319595336914, "global_step": 133204, "epoch": 1100} {"train_loss": -39.51737594604492, "global_step": 133205, "epoch": 1100} {"train_loss": -39.342769622802734, "global_step": 133206, "epoch": 1100} {"train_loss": -39.80939865112305, "global_step": 133207, "epoch": 1100} {"train_loss": -39.75067138671875, "global_step": 133208, "epoch": 1100} {"train_loss": -39.67548751831055, "global_step": 133209, "epoch": 1100} {"train_loss": -39.71012496948242, "global_step": 133210, "epoch": 1100} {"train_loss": -38.90080642700195, "global_step": 133211, "epoch": 1100} {"train_loss": -40.14824676513672, "global_step": 133212, "epoch": 1100} {"train_loss": -39.59373092651367, "global_step": 133213, "epoch": 1100} {"train_loss": -40.09421920776367, "global_step": 133214, "epoch": 1100} {"train_loss": -39.92437744140625, "global_step": 133215, "epoch": 1100} {"train_loss": -39.479591369628906, "global_step": 133216, "epoch": 1100} {"train_loss": -39.82808303833008, "global_step": 133217, "epoch": 1100} {"train_loss": -40.02006912231445, "global_step": 133218, "epoch": 1100} {"train_loss": -40.076751708984375, "global_step": 133219, "epoch": 1100} {"train_loss": -38.31570557523365, "global_step": 133220, "epoch": 1100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2581636.0} {"train_loss": -39.9354362487793, "global_step": 133221, "epoch": 1101} {"train_loss": -40.009464263916016, "global_step": 133222, "epoch": 1101} {"train_loss": -40.3422966003418, "global_step": 133223, "epoch": 1101} {"train_loss": -40.16297149658203, "global_step": 133224, "epoch": 1101} {"train_loss": -40.44462203979492, "global_step": 133225, "epoch": 1101} {"train_loss": -40.46185302734375, "global_step": 133226, "epoch": 1101} {"train_loss": -40.35221481323242, "global_step": 133227, "epoch": 1101} {"train_loss": -40.476226806640625, "global_step": 133228, "epoch": 1101} {"train_loss": -39.49216842651367, "global_step": 133229, "epoch": 1101} {"train_loss": -39.342220306396484, "global_step": 133230, "epoch": 1101} {"train_loss": -40.2382926940918, "global_step": 133231, "epoch": 1101} {"train_loss": -40.61372756958008, "global_step": 133232, "epoch": 1101} {"train_loss": -39.98579788208008, "global_step": 133233, "epoch": 1101} {"train_loss": -39.95377731323242, "global_step": 133234, "epoch": 1101} {"train_loss": -40.37794876098633, "global_step": 133235, "epoch": 1101} {"train_loss": -40.54143142700195, "global_step": 133236, "epoch": 1101} {"train_loss": -40.415401458740234, "global_step": 133237, "epoch": 1101} {"train_loss": -40.655029296875, "global_step": 133238, "epoch": 1101} {"train_loss": -40.11794662475586, "global_step": 133239, "epoch": 1101} {"train_loss": -38.876609802246094, "global_step": 133240, "epoch": 1101} {"train_loss": -39.83735275268555, "global_step": 133241, "epoch": 1101} {"train_loss": -39.584442138671875, "global_step": 133242, "epoch": 1101} {"train_loss": -40.01726150512695, "global_step": 133243, "epoch": 1101} {"train_loss": -39.69717025756836, "global_step": 133244, "epoch": 1101} {"train_loss": -38.866485595703125, "global_step": 133245, "epoch": 1101} {"train_loss": -37.035011291503906, "global_step": 133246, "epoch": 1101} {"train_loss": -35.89961624145508, "global_step": 133247, "epoch": 1101} {"train_loss": -34.52775192260742, "global_step": 133248, "epoch": 1101} {"train_loss": -36.836544036865234, "global_step": 133249, "epoch": 1101} {"train_loss": -39.04404067993164, "global_step": 133250, "epoch": 1101} {"train_loss": -38.6689338684082, "global_step": 133251, "epoch": 1101} {"train_loss": -37.73830795288086, "global_step": 133252, "epoch": 1101} {"train_loss": -39.35114288330078, "global_step": 133253, "epoch": 1101} {"train_loss": -39.924556732177734, "global_step": 133254, "epoch": 1101} {"train_loss": -38.95797348022461, "global_step": 133255, "epoch": 1101} {"train_loss": -39.22127914428711, "global_step": 133256, "epoch": 1101} {"train_loss": -39.161376953125, "global_step": 133257, "epoch": 1101} {"train_loss": -40.02946090698242, "global_step": 133258, "epoch": 1101} {"train_loss": -39.09174346923828, "global_step": 133259, "epoch": 1101} {"train_loss": -39.44588851928711, "global_step": 133260, "epoch": 1101} {"train_loss": -39.33315658569336, "global_step": 133261, "epoch": 1101} {"train_loss": -39.5018310546875, "global_step": 133262, "epoch": 1101} {"train_loss": -37.673606872558594, "global_step": 133263, "epoch": 1101} {"train_loss": -39.47922897338867, "global_step": 133264, "epoch": 1101} {"train_loss": -38.48107147216797, "global_step": 133265, "epoch": 1101} {"train_loss": -39.318153381347656, "global_step": 133266, "epoch": 1101} {"train_loss": -38.238162994384766, "global_step": 133267, "epoch": 1101} {"train_loss": -37.602455139160156, "global_step": 133268, "epoch": 1101} {"train_loss": -38.874568939208984, "global_step": 133269, "epoch": 1101} {"train_loss": -39.615474700927734, "global_step": 133270, "epoch": 1101} {"train_loss": -38.0413703918457, "global_step": 133271, "epoch": 1101} {"train_loss": -33.84914016723633, "global_step": 133272, "epoch": 1101} {"train_loss": -37.209877014160156, "global_step": 133273, "epoch": 1101} {"train_loss": -26.982702255249023, "global_step": 133274, "epoch": 1101} {"train_loss": -33.34590530395508, "global_step": 133275, "epoch": 1101} {"train_loss": -36.246986389160156, "global_step": 133276, "epoch": 1101} {"train_loss": -32.31110763549805, "global_step": 133277, "epoch": 1101} {"train_loss": -32.5474853515625, "global_step": 133278, "epoch": 1101} {"train_loss": -30.420499801635742, "global_step": 133279, "epoch": 1101} {"train_loss": -31.743061065673828, "global_step": 133280, "epoch": 1101} {"train_loss": -31.233142852783203, "global_step": 133281, "epoch": 1101} {"train_loss": -34.777503967285156, "global_step": 133282, "epoch": 1101} {"train_loss": -36.13603591918945, "global_step": 133283, "epoch": 1101} {"train_loss": -35.6594352722168, "global_step": 133284, "epoch": 1101} {"train_loss": -31.25324058532715, "global_step": 133285, "epoch": 1101} {"train_loss": -35.237159729003906, "global_step": 133286, "epoch": 1101} {"train_loss": -29.802518844604492, "global_step": 133287, "epoch": 1101} {"train_loss": -35.428070068359375, "global_step": 133288, "epoch": 1101} {"train_loss": -33.93984603881836, "global_step": 133289, "epoch": 1101} {"train_loss": -33.69654083251953, "global_step": 133290, "epoch": 1101} {"train_loss": -34.71879196166992, "global_step": 133291, "epoch": 1101} {"train_loss": -35.568172454833984, "global_step": 133292, "epoch": 1101} {"train_loss": -36.85599899291992, "global_step": 133293, "epoch": 1101} {"train_loss": -34.26485824584961, "global_step": 133294, "epoch": 1101} {"train_loss": -35.73934555053711, "global_step": 133295, "epoch": 1101} {"train_loss": -35.68767547607422, "global_step": 133296, "epoch": 1101} {"train_loss": -36.14970397949219, "global_step": 133297, "epoch": 1101} {"train_loss": -36.9904899597168, "global_step": 133298, "epoch": 1101} {"train_loss": -35.41299057006836, "global_step": 133299, "epoch": 1101} {"train_loss": -37.35246658325195, "global_step": 133300, "epoch": 1101} {"train_loss": -35.316986083984375, "global_step": 133301, "epoch": 1101} {"train_loss": -37.30691909790039, "global_step": 133302, "epoch": 1101} {"train_loss": -36.655609130859375, "global_step": 133303, "epoch": 1101} {"train_loss": -37.2598762512207, "global_step": 133304, "epoch": 1101} {"train_loss": -36.56036376953125, "global_step": 133305, "epoch": 1101} {"train_loss": -36.91162872314453, "global_step": 133306, "epoch": 1101} {"train_loss": -37.34567642211914, "global_step": 133307, "epoch": 1101} {"train_loss": -37.6871223449707, "global_step": 133308, "epoch": 1101} {"train_loss": -38.038997650146484, "global_step": 133309, "epoch": 1101} {"train_loss": -36.8724250793457, "global_step": 133310, "epoch": 1101} {"train_loss": -37.915584564208984, "global_step": 133311, "epoch": 1101} {"train_loss": -36.630348205566406, "global_step": 133312, "epoch": 1101} {"train_loss": -37.78629684448242, "global_step": 133313, "epoch": 1101} {"train_loss": -37.013511657714844, "global_step": 133314, "epoch": 1101} {"train_loss": -38.62559127807617, "global_step": 133315, "epoch": 1101} {"train_loss": -38.43596267700195, "global_step": 133316, "epoch": 1101} {"train_loss": -38.381553649902344, "global_step": 133317, "epoch": 1101} {"train_loss": -37.25148391723633, "global_step": 133318, "epoch": 1101} {"train_loss": -37.976009368896484, "global_step": 133319, "epoch": 1101} {"train_loss": -37.80161666870117, "global_step": 133320, "epoch": 1101} {"train_loss": -37.28712844848633, "global_step": 133321, "epoch": 1101} {"train_loss": -37.82314682006836, "global_step": 133322, "epoch": 1101} {"train_loss": -38.31742858886719, "global_step": 133323, "epoch": 1101} {"train_loss": -38.11920166015625, "global_step": 133324, "epoch": 1101} {"train_loss": -38.63505935668945, "global_step": 133325, "epoch": 1101} {"train_loss": -38.750389099121094, "global_step": 133326, "epoch": 1101} {"train_loss": -38.562042236328125, "global_step": 133327, "epoch": 1101} {"train_loss": -37.636756896972656, "global_step": 133328, "epoch": 1101} {"train_loss": -38.546897888183594, "global_step": 133329, "epoch": 1101} {"train_loss": -39.149349212646484, "global_step": 133330, "epoch": 1101} {"train_loss": -37.6430778503418, "global_step": 133331, "epoch": 1101} {"train_loss": -38.8545036315918, "global_step": 133332, "epoch": 1101} {"train_loss": -37.675331115722656, "global_step": 133333, "epoch": 1101} {"train_loss": -38.6734733581543, "global_step": 133334, "epoch": 1101} {"train_loss": -38.84418487548828, "global_step": 133335, "epoch": 1101} {"train_loss": -38.79726791381836, "global_step": 133336, "epoch": 1101} {"train_loss": -38.38072967529297, "global_step": 133337, "epoch": 1101} {"train_loss": -38.46335220336914, "global_step": 133338, "epoch": 1101} {"train_loss": -38.610755920410156, "global_step": 133339, "epoch": 1101} {"train_loss": -38.694671630859375, "global_step": 133340, "epoch": 1101} {"train_loss": -37.56663131713867, "global_step": 133341, "epoch": 1101, "val_loss": 2612353.75} {"train_loss": -39.12376403808594, "global_step": 133342, "epoch": 1102} {"train_loss": -38.91044235229492, "global_step": 133343, "epoch": 1102} {"train_loss": -39.18624496459961, "global_step": 133344, "epoch": 1102} {"train_loss": -38.965003967285156, "global_step": 133345, "epoch": 1102} {"train_loss": -39.225067138671875, "global_step": 133346, "epoch": 1102} {"train_loss": -38.514888763427734, "global_step": 133347, "epoch": 1102} {"train_loss": -39.26486587524414, "global_step": 133348, "epoch": 1102} {"train_loss": -38.58144760131836, "global_step": 133349, "epoch": 1102} {"train_loss": -38.99432373046875, "global_step": 133350, "epoch": 1102} {"train_loss": -38.39968490600586, "global_step": 133351, "epoch": 1102} {"train_loss": -38.79307174682617, "global_step": 133352, "epoch": 1102} {"train_loss": -38.865047454833984, "global_step": 133353, "epoch": 1102} {"train_loss": -39.448184967041016, "global_step": 133354, "epoch": 1102} {"train_loss": -38.730953216552734, "global_step": 133355, "epoch": 1102} {"train_loss": -38.61655807495117, "global_step": 133356, "epoch": 1102} {"train_loss": -38.35230255126953, "global_step": 133357, "epoch": 1102} {"train_loss": -37.416297912597656, "global_step": 133358, "epoch": 1102} {"train_loss": -39.00175094604492, "global_step": 133359, "epoch": 1102} {"train_loss": -38.96317672729492, "global_step": 133360, "epoch": 1102} {"train_loss": -39.175941467285156, "global_step": 133361, "epoch": 1102} {"train_loss": -38.3111686706543, "global_step": 133362, "epoch": 1102} {"train_loss": -38.6519775390625, "global_step": 133363, "epoch": 1102} {"train_loss": -34.17807388305664, "global_step": 133364, "epoch": 1102} {"train_loss": -37.45382308959961, "global_step": 133365, "epoch": 1102} {"train_loss": -37.23670196533203, "global_step": 133366, "epoch": 1102} {"train_loss": -37.65920639038086, "global_step": 133367, "epoch": 1102} {"train_loss": -38.55461502075195, "global_step": 133368, "epoch": 1102} {"train_loss": -39.2696533203125, "global_step": 133369, "epoch": 1102} {"train_loss": -38.21067428588867, "global_step": 133370, "epoch": 1102} {"train_loss": -39.11968994140625, "global_step": 133371, "epoch": 1102} {"train_loss": -38.229225158691406, "global_step": 133372, "epoch": 1102} {"train_loss": -39.71562576293945, "global_step": 133373, "epoch": 1102} {"train_loss": -38.24340057373047, "global_step": 133374, "epoch": 1102} {"train_loss": -39.18544006347656, "global_step": 133375, "epoch": 1102} {"train_loss": -38.500511169433594, "global_step": 133376, "epoch": 1102} {"train_loss": -39.49671173095703, "global_step": 133377, "epoch": 1102} {"train_loss": -38.80641174316406, "global_step": 133378, "epoch": 1102} {"train_loss": -39.19843673706055, "global_step": 133379, "epoch": 1102} {"train_loss": -38.922332763671875, "global_step": 133380, "epoch": 1102} {"train_loss": -38.86637496948242, "global_step": 133381, "epoch": 1102} {"train_loss": -39.61677169799805, "global_step": 133382, "epoch": 1102} {"train_loss": -39.40815353393555, "global_step": 133383, "epoch": 1102} {"train_loss": -39.02849197387695, "global_step": 133384, "epoch": 1102} {"train_loss": -39.743343353271484, "global_step": 133385, "epoch": 1102} {"train_loss": -39.24534225463867, "global_step": 133386, "epoch": 1102} {"train_loss": -40.03974533081055, "global_step": 133387, "epoch": 1102} {"train_loss": -39.30847930908203, "global_step": 133388, "epoch": 1102} {"train_loss": -39.1286735534668, "global_step": 133389, "epoch": 1102} {"train_loss": -39.56296920776367, "global_step": 133390, "epoch": 1102} {"train_loss": -39.77971649169922, "global_step": 133391, "epoch": 1102} {"train_loss": -39.87109375, "global_step": 133392, "epoch": 1102} {"train_loss": -39.97058868408203, "global_step": 133393, "epoch": 1102} {"train_loss": -39.629249572753906, "global_step": 133394, "epoch": 1102} {"train_loss": -39.54392623901367, "global_step": 133395, "epoch": 1102} {"train_loss": -39.34516143798828, "global_step": 133396, "epoch": 1102} {"train_loss": -38.61189651489258, "global_step": 133397, "epoch": 1102} {"train_loss": -38.23356246948242, "global_step": 133398, "epoch": 1102} {"train_loss": -38.88396072387695, "global_step": 133399, "epoch": 1102} {"train_loss": -39.93465805053711, "global_step": 133400, "epoch": 1102} {"train_loss": -39.93932342529297, "global_step": 133401, "epoch": 1102} {"train_loss": -38.847164154052734, "global_step": 133402, "epoch": 1102} {"train_loss": -38.588653564453125, "global_step": 133403, "epoch": 1102} {"train_loss": -38.72330856323242, "global_step": 133404, "epoch": 1102} {"train_loss": -38.81381607055664, "global_step": 133405, "epoch": 1102} {"train_loss": -39.4469108581543, "global_step": 133406, "epoch": 1102} {"train_loss": -38.56992721557617, "global_step": 133407, "epoch": 1102} {"train_loss": -38.44112014770508, "global_step": 133408, "epoch": 1102} {"train_loss": -38.28659439086914, "global_step": 133409, "epoch": 1102} {"train_loss": -39.88691329956055, "global_step": 133410, "epoch": 1102} {"train_loss": -39.990169525146484, "global_step": 133411, "epoch": 1102} {"train_loss": -38.29499435424805, "global_step": 133412, "epoch": 1102} {"train_loss": -37.76838302612305, "global_step": 133413, "epoch": 1102} {"train_loss": -39.58474349975586, "global_step": 133414, "epoch": 1102} {"train_loss": -38.03672409057617, "global_step": 133415, "epoch": 1102} {"train_loss": -37.923397064208984, "global_step": 133416, "epoch": 1102} {"train_loss": -39.56605911254883, "global_step": 133417, "epoch": 1102} {"train_loss": -37.54780197143555, "global_step": 133418, "epoch": 1102} {"train_loss": -38.7203483581543, "global_step": 133419, "epoch": 1102} {"train_loss": -40.40855407714844, "global_step": 133420, "epoch": 1102} {"train_loss": -38.53044509887695, "global_step": 133421, "epoch": 1102} {"train_loss": -38.80419158935547, "global_step": 133422, "epoch": 1102} {"train_loss": -37.8470458984375, "global_step": 133423, "epoch": 1102} {"train_loss": -37.2115592956543, "global_step": 133424, "epoch": 1102} {"train_loss": -37.37375259399414, "global_step": 133425, "epoch": 1102} {"train_loss": -38.81941223144531, "global_step": 133426, "epoch": 1102} {"train_loss": -39.70848083496094, "global_step": 133427, "epoch": 1102} {"train_loss": -40.31809616088867, "global_step": 133428, "epoch": 1102} {"train_loss": -38.92527389526367, "global_step": 133429, "epoch": 1102} {"train_loss": -38.261104583740234, "global_step": 133430, "epoch": 1102} {"train_loss": -40.71699905395508, "global_step": 133431, "epoch": 1102} {"train_loss": -39.66633224487305, "global_step": 133432, "epoch": 1102} {"train_loss": -38.98733139038086, "global_step": 133433, "epoch": 1102} {"train_loss": -39.81878662109375, "global_step": 133434, "epoch": 1102} {"train_loss": -39.50893783569336, "global_step": 133435, "epoch": 1102} {"train_loss": -39.69308090209961, "global_step": 133436, "epoch": 1102} {"train_loss": -39.587764739990234, "global_step": 133437, "epoch": 1102} {"train_loss": -40.40835189819336, "global_step": 133438, "epoch": 1102} {"train_loss": -39.448116302490234, "global_step": 133439, "epoch": 1102} {"train_loss": -39.68727493286133, "global_step": 133440, "epoch": 1102} {"train_loss": -39.104331970214844, "global_step": 133441, "epoch": 1102} {"train_loss": -40.27103805541992, "global_step": 133442, "epoch": 1102} {"train_loss": -37.61774444580078, "global_step": 133443, "epoch": 1102} {"train_loss": -39.56464385986328, "global_step": 133444, "epoch": 1102} {"train_loss": -38.97542953491211, "global_step": 133445, "epoch": 1102} {"train_loss": -39.54261016845703, "global_step": 133446, "epoch": 1102} {"train_loss": -39.16415023803711, "global_step": 133447, "epoch": 1102} {"train_loss": -38.79133224487305, "global_step": 133448, "epoch": 1102} {"train_loss": -39.663700103759766, "global_step": 133449, "epoch": 1102} {"train_loss": -39.20838928222656, "global_step": 133450, "epoch": 1102} {"train_loss": -38.87471389770508, "global_step": 133451, "epoch": 1102} {"train_loss": -38.88759994506836, "global_step": 133452, "epoch": 1102} {"train_loss": -39.65687942504883, "global_step": 133453, "epoch": 1102} {"train_loss": -38.794593811035156, "global_step": 133454, "epoch": 1102} {"train_loss": -39.22806930541992, "global_step": 133455, "epoch": 1102} {"train_loss": -39.4054069519043, "global_step": 133456, "epoch": 1102} {"train_loss": -40.127689361572266, "global_step": 133457, "epoch": 1102} {"train_loss": -39.48603820800781, "global_step": 133458, "epoch": 1102} {"train_loss": -38.967323303222656, "global_step": 133459, "epoch": 1102} {"train_loss": -37.15699005126953, "global_step": 133460, "epoch": 1102} {"train_loss": -39.892452239990234, "global_step": 133461, "epoch": 1102} {"train_loss": -38.96843208754358, "global_step": 133462, "epoch": 1102, "val_loss": 2658017.0} {"train_loss": -35.2420768737793, "global_step": 133463, "epoch": 1103} {"train_loss": -36.93906784057617, "global_step": 133464, "epoch": 1103} {"train_loss": -39.141998291015625, "global_step": 133465, "epoch": 1103} {"train_loss": -38.919795989990234, "global_step": 133466, "epoch": 1103} {"train_loss": -38.337337493896484, "global_step": 133467, "epoch": 1103} {"train_loss": -39.446022033691406, "global_step": 133468, "epoch": 1103} {"train_loss": -38.81167221069336, "global_step": 133469, "epoch": 1103} {"train_loss": -37.65122604370117, "global_step": 133470, "epoch": 1103} {"train_loss": -38.93638229370117, "global_step": 133471, "epoch": 1103} {"train_loss": -38.912025451660156, "global_step": 133472, "epoch": 1103} {"train_loss": -37.7888069152832, "global_step": 133473, "epoch": 1103} {"train_loss": -38.212249755859375, "global_step": 133474, "epoch": 1103} {"train_loss": -39.02473831176758, "global_step": 133475, "epoch": 1103} {"train_loss": -39.408447265625, "global_step": 133476, "epoch": 1103} {"train_loss": -37.954811096191406, "global_step": 133477, "epoch": 1103} {"train_loss": -38.28751754760742, "global_step": 133478, "epoch": 1103} {"train_loss": -39.22038650512695, "global_step": 133479, "epoch": 1103} {"train_loss": -38.64649200439453, "global_step": 133480, "epoch": 1103} {"train_loss": -38.864349365234375, "global_step": 133481, "epoch": 1103} {"train_loss": -39.688446044921875, "global_step": 133482, "epoch": 1103} {"train_loss": -38.79166793823242, "global_step": 133483, "epoch": 1103} {"train_loss": -39.90208053588867, "global_step": 133484, "epoch": 1103} {"train_loss": -39.731292724609375, "global_step": 133485, "epoch": 1103} {"train_loss": -36.88898849487305, "global_step": 133486, "epoch": 1103} {"train_loss": -40.058658599853516, "global_step": 133487, "epoch": 1103} {"train_loss": -39.18620681762695, "global_step": 133488, "epoch": 1103} {"train_loss": -39.4117431640625, "global_step": 133489, "epoch": 1103} {"train_loss": -38.699440002441406, "global_step": 133490, "epoch": 1103} {"train_loss": -39.395057678222656, "global_step": 133491, "epoch": 1103} {"train_loss": -39.166744232177734, "global_step": 133492, "epoch": 1103} {"train_loss": -40.16792678833008, "global_step": 133493, "epoch": 1103} {"train_loss": -39.253841400146484, "global_step": 133494, "epoch": 1103} {"train_loss": -39.61832046508789, "global_step": 133495, "epoch": 1103} {"train_loss": -38.23246765136719, "global_step": 133496, "epoch": 1103} {"train_loss": -38.794795989990234, "global_step": 133497, "epoch": 1103} {"train_loss": -39.832244873046875, "global_step": 133498, "epoch": 1103} {"train_loss": -39.282371520996094, "global_step": 133499, "epoch": 1103} {"train_loss": -39.03757095336914, "global_step": 133500, "epoch": 1103} {"train_loss": -39.38880920410156, "global_step": 133501, "epoch": 1103} {"train_loss": -39.208274841308594, "global_step": 133502, "epoch": 1103} {"train_loss": -39.798824310302734, "global_step": 133503, "epoch": 1103} {"train_loss": -40.42871856689453, "global_step": 133504, "epoch": 1103} {"train_loss": -40.32770919799805, "global_step": 133505, "epoch": 1103} {"train_loss": -39.814048767089844, "global_step": 133506, "epoch": 1103} {"train_loss": -39.85064697265625, "global_step": 133507, "epoch": 1103} {"train_loss": -39.97758102416992, "global_step": 133508, "epoch": 1103} {"train_loss": -39.16384506225586, "global_step": 133509, "epoch": 1103} {"train_loss": -38.18552780151367, "global_step": 133510, "epoch": 1103} {"train_loss": -39.60380935668945, "global_step": 133511, "epoch": 1103} {"train_loss": -39.95725631713867, "global_step": 133512, "epoch": 1103} {"train_loss": -40.38656997680664, "global_step": 133513, "epoch": 1103} {"train_loss": -36.92557907104492, "global_step": 133514, "epoch": 1103} {"train_loss": -39.82468795776367, "global_step": 133515, "epoch": 1103} {"train_loss": -39.64109420776367, "global_step": 133516, "epoch": 1103} {"train_loss": -39.29093933105469, "global_step": 133517, "epoch": 1103} {"train_loss": -39.583160400390625, "global_step": 133518, "epoch": 1103} {"train_loss": -39.75994110107422, "global_step": 133519, "epoch": 1103} {"train_loss": -39.15957260131836, "global_step": 133520, "epoch": 1103} {"train_loss": -39.78485107421875, "global_step": 133521, "epoch": 1103} {"train_loss": -38.928035736083984, "global_step": 133522, "epoch": 1103} {"train_loss": -40.04209518432617, "global_step": 133523, "epoch": 1103} {"train_loss": -36.46921920776367, "global_step": 133524, "epoch": 1103} {"train_loss": -38.421077728271484, "global_step": 133525, "epoch": 1103} {"train_loss": -38.66746139526367, "global_step": 133526, "epoch": 1103} {"train_loss": -36.23114776611328, "global_step": 133527, "epoch": 1103} {"train_loss": -38.1002311706543, "global_step": 133528, "epoch": 1103} {"train_loss": -38.1714973449707, "global_step": 133529, "epoch": 1103} {"train_loss": -37.12559127807617, "global_step": 133530, "epoch": 1103} {"train_loss": -39.2502326965332, "global_step": 133531, "epoch": 1103} {"train_loss": -37.74336624145508, "global_step": 133532, "epoch": 1103} {"train_loss": -39.40140914916992, "global_step": 133533, "epoch": 1103} {"train_loss": -37.6705436706543, "global_step": 133534, "epoch": 1103} {"train_loss": -36.14231872558594, "global_step": 133535, "epoch": 1103} {"train_loss": -37.95197677612305, "global_step": 133536, "epoch": 1103} {"train_loss": -39.62525939941406, "global_step": 133537, "epoch": 1103} {"train_loss": -38.20559310913086, "global_step": 133538, "epoch": 1103} {"train_loss": -39.02598190307617, "global_step": 133539, "epoch": 1103} {"train_loss": -37.898658752441406, "global_step": 133540, "epoch": 1103} {"train_loss": -38.22301483154297, "global_step": 133541, "epoch": 1103} {"train_loss": -38.43239212036133, "global_step": 133542, "epoch": 1103} {"train_loss": -38.09474563598633, "global_step": 133543, "epoch": 1103} {"train_loss": -35.34213638305664, "global_step": 133544, "epoch": 1103} {"train_loss": -38.83631134033203, "global_step": 133545, "epoch": 1103} {"train_loss": -38.07514572143555, "global_step": 133546, "epoch": 1103} {"train_loss": -38.05828857421875, "global_step": 133547, "epoch": 1103} {"train_loss": -39.57929229736328, "global_step": 133548, "epoch": 1103} {"train_loss": -38.2003173828125, "global_step": 133549, "epoch": 1103} {"train_loss": -38.8044548034668, "global_step": 133550, "epoch": 1103} {"train_loss": -39.359588623046875, "global_step": 133551, "epoch": 1103} {"train_loss": -39.010704040527344, "global_step": 133552, "epoch": 1103} {"train_loss": -39.48882293701172, "global_step": 133553, "epoch": 1103} {"train_loss": -38.22183609008789, "global_step": 133554, "epoch": 1103} {"train_loss": -38.7248420715332, "global_step": 133555, "epoch": 1103} {"train_loss": -39.24490737915039, "global_step": 133556, "epoch": 1103} {"train_loss": -39.19779586791992, "global_step": 133557, "epoch": 1103} {"train_loss": -38.68351364135742, "global_step": 133558, "epoch": 1103} {"train_loss": -40.26748275756836, "global_step": 133559, "epoch": 1103} {"train_loss": -38.97224044799805, "global_step": 133560, "epoch": 1103} {"train_loss": -39.34552001953125, "global_step": 133561, "epoch": 1103} {"train_loss": -39.54937744140625, "global_step": 133562, "epoch": 1103} {"train_loss": -39.37046432495117, "global_step": 133563, "epoch": 1103} {"train_loss": -39.5068244934082, "global_step": 133564, "epoch": 1103} {"train_loss": -39.79996871948242, "global_step": 133565, "epoch": 1103} {"train_loss": -39.706233978271484, "global_step": 133566, "epoch": 1103} {"train_loss": -39.189762115478516, "global_step": 133567, "epoch": 1103} {"train_loss": -38.12660598754883, "global_step": 133568, "epoch": 1103} {"train_loss": -40.26433181762695, "global_step": 133569, "epoch": 1103} {"train_loss": -39.67898178100586, "global_step": 133570, "epoch": 1103} {"train_loss": -38.72144317626953, "global_step": 133571, "epoch": 1103} {"train_loss": -40.20748519897461, "global_step": 133572, "epoch": 1103} {"train_loss": -39.04681396484375, "global_step": 133573, "epoch": 1103} {"train_loss": -38.8802604675293, "global_step": 133574, "epoch": 1103} {"train_loss": -39.79671859741211, "global_step": 133575, "epoch": 1103} {"train_loss": -39.52918243408203, "global_step": 133576, "epoch": 1103} {"train_loss": -39.75522232055664, "global_step": 133577, "epoch": 1103} {"train_loss": -40.39541244506836, "global_step": 133578, "epoch": 1103} {"train_loss": -40.21757125854492, "global_step": 133579, "epoch": 1103} {"train_loss": -39.54246139526367, "global_step": 133580, "epoch": 1103} {"train_loss": -39.90446090698242, "global_step": 133581, "epoch": 1103} {"train_loss": -40.35309982299805, "global_step": 133582, "epoch": 1103} {"train_loss": -38.94885304348528, "global_step": 133583, "epoch": 1103, "val_loss": 2689656.75} {"train_loss": -40.09111022949219, "global_step": 133584, "epoch": 1104} {"train_loss": -39.369075775146484, "global_step": 133585, "epoch": 1104} {"train_loss": -40.33305740356445, "global_step": 133586, "epoch": 1104} {"train_loss": -39.989627838134766, "global_step": 133587, "epoch": 1104} {"train_loss": -39.80885314941406, "global_step": 133588, "epoch": 1104} {"train_loss": -39.679622650146484, "global_step": 133589, "epoch": 1104} {"train_loss": -39.54549789428711, "global_step": 133590, "epoch": 1104} {"train_loss": -38.63225173950195, "global_step": 133591, "epoch": 1104} {"train_loss": -39.451839447021484, "global_step": 133592, "epoch": 1104} {"train_loss": -39.27094650268555, "global_step": 133593, "epoch": 1104} {"train_loss": -38.773597717285156, "global_step": 133594, "epoch": 1104} {"train_loss": -40.04965591430664, "global_step": 133595, "epoch": 1104} {"train_loss": -40.47230911254883, "global_step": 133596, "epoch": 1104} {"train_loss": -39.322792053222656, "global_step": 133597, "epoch": 1104} {"train_loss": -39.096900939941406, "global_step": 133598, "epoch": 1104} {"train_loss": -38.15625, "global_step": 133599, "epoch": 1104} {"train_loss": -35.94363021850586, "global_step": 133600, "epoch": 1104} {"train_loss": -37.28556442260742, "global_step": 133601, "epoch": 1104} {"train_loss": -38.943756103515625, "global_step": 133602, "epoch": 1104} {"train_loss": -39.11198043823242, "global_step": 133603, "epoch": 1104} {"train_loss": -39.86000061035156, "global_step": 133604, "epoch": 1104} {"train_loss": -38.175926208496094, "global_step": 133605, "epoch": 1104} {"train_loss": -38.89875411987305, "global_step": 133606, "epoch": 1104} {"train_loss": -38.86985397338867, "global_step": 133607, "epoch": 1104} {"train_loss": -39.773189544677734, "global_step": 133608, "epoch": 1104} {"train_loss": -39.15812301635742, "global_step": 133609, "epoch": 1104} {"train_loss": -38.67228698730469, "global_step": 133610, "epoch": 1104} {"train_loss": -39.55072021484375, "global_step": 133611, "epoch": 1104} {"train_loss": -39.39251708984375, "global_step": 133612, "epoch": 1104} {"train_loss": -39.259063720703125, "global_step": 133613, "epoch": 1104} {"train_loss": -39.830013275146484, "global_step": 133614, "epoch": 1104} {"train_loss": -38.72245407104492, "global_step": 133615, "epoch": 1104} {"train_loss": -39.3674430847168, "global_step": 133616, "epoch": 1104} {"train_loss": -39.051937103271484, "global_step": 133617, "epoch": 1104} {"train_loss": -39.01578903198242, "global_step": 133618, "epoch": 1104} {"train_loss": -38.62251281738281, "global_step": 133619, "epoch": 1104} {"train_loss": -37.677215576171875, "global_step": 133620, "epoch": 1104} {"train_loss": -39.17621612548828, "global_step": 133621, "epoch": 1104} {"train_loss": -39.67799377441406, "global_step": 133622, "epoch": 1104} {"train_loss": -38.27051544189453, "global_step": 133623, "epoch": 1104} {"train_loss": -38.95332717895508, "global_step": 133624, "epoch": 1104} {"train_loss": -39.5341796875, "global_step": 133625, "epoch": 1104} {"train_loss": -38.80141830444336, "global_step": 133626, "epoch": 1104} {"train_loss": -39.20357894897461, "global_step": 133627, "epoch": 1104} {"train_loss": -39.99137878417969, "global_step": 133628, "epoch": 1104} {"train_loss": -40.02978515625, "global_step": 133629, "epoch": 1104} {"train_loss": -39.47694778442383, "global_step": 133630, "epoch": 1104} {"train_loss": -39.75153732299805, "global_step": 133631, "epoch": 1104} {"train_loss": -38.19279861450195, "global_step": 133632, "epoch": 1104} {"train_loss": -39.725067138671875, "global_step": 133633, "epoch": 1104} {"train_loss": -39.46200180053711, "global_step": 133634, "epoch": 1104} {"train_loss": -38.78395462036133, "global_step": 133635, "epoch": 1104} {"train_loss": -39.106361389160156, "global_step": 133636, "epoch": 1104} {"train_loss": -38.573421478271484, "global_step": 133637, "epoch": 1104} {"train_loss": -38.26137924194336, "global_step": 133638, "epoch": 1104} {"train_loss": -37.446475982666016, "global_step": 133639, "epoch": 1104} {"train_loss": -37.487361907958984, "global_step": 133640, "epoch": 1104} {"train_loss": -38.615882873535156, "global_step": 133641, "epoch": 1104} {"train_loss": -39.5839958190918, "global_step": 133642, "epoch": 1104} {"train_loss": -38.87033462524414, "global_step": 133643, "epoch": 1104} {"train_loss": -38.20664978027344, "global_step": 133644, "epoch": 1104} {"train_loss": -37.724605560302734, "global_step": 133645, "epoch": 1104} {"train_loss": -38.31031036376953, "global_step": 133646, "epoch": 1104} {"train_loss": -39.128822326660156, "global_step": 133647, "epoch": 1104} {"train_loss": -35.73308181762695, "global_step": 133648, "epoch": 1104} {"train_loss": -35.7555046081543, "global_step": 133649, "epoch": 1104} {"train_loss": -39.40134811401367, "global_step": 133650, "epoch": 1104} {"train_loss": -38.01218795776367, "global_step": 133651, "epoch": 1104} {"train_loss": -37.541690826416016, "global_step": 133652, "epoch": 1104} {"train_loss": -39.8045654296875, "global_step": 133653, "epoch": 1104} {"train_loss": -38.339698791503906, "global_step": 133654, "epoch": 1104} {"train_loss": -38.95100784301758, "global_step": 133655, "epoch": 1104} {"train_loss": -37.566043853759766, "global_step": 133656, "epoch": 1104} {"train_loss": -38.0186767578125, "global_step": 133657, "epoch": 1104} {"train_loss": -37.203792572021484, "global_step": 133658, "epoch": 1104} {"train_loss": -38.25764083862305, "global_step": 133659, "epoch": 1104} {"train_loss": -38.56245040893555, "global_step": 133660, "epoch": 1104} {"train_loss": -38.778663635253906, "global_step": 133661, "epoch": 1104} {"train_loss": -39.153778076171875, "global_step": 133662, "epoch": 1104} {"train_loss": -38.673065185546875, "global_step": 133663, "epoch": 1104} {"train_loss": -39.81608963012695, "global_step": 133664, "epoch": 1104} {"train_loss": -39.28944778442383, "global_step": 133665, "epoch": 1104} {"train_loss": -39.247188568115234, "global_step": 133666, "epoch": 1104} {"train_loss": -39.67302703857422, "global_step": 133667, "epoch": 1104} {"train_loss": -39.284820556640625, "global_step": 133668, "epoch": 1104} {"train_loss": -39.769866943359375, "global_step": 133669, "epoch": 1104} {"train_loss": -39.73530960083008, "global_step": 133670, "epoch": 1104} {"train_loss": -39.54041290283203, "global_step": 133671, "epoch": 1104} {"train_loss": -39.28950119018555, "global_step": 133672, "epoch": 1104} {"train_loss": -39.76021194458008, "global_step": 133673, "epoch": 1104} {"train_loss": -39.858070373535156, "global_step": 133674, "epoch": 1104} {"train_loss": -39.686256408691406, "global_step": 133675, "epoch": 1104} {"train_loss": -39.33864974975586, "global_step": 133676, "epoch": 1104} {"train_loss": -39.761512756347656, "global_step": 133677, "epoch": 1104} {"train_loss": -39.47811508178711, "global_step": 133678, "epoch": 1104} {"train_loss": -40.33457565307617, "global_step": 133679, "epoch": 1104} {"train_loss": -39.5919075012207, "global_step": 133680, "epoch": 1104} {"train_loss": -40.32600784301758, "global_step": 133681, "epoch": 1104} {"train_loss": -39.764190673828125, "global_step": 133682, "epoch": 1104} {"train_loss": -39.727230072021484, "global_step": 133683, "epoch": 1104} {"train_loss": -40.2611198425293, "global_step": 133684, "epoch": 1104} {"train_loss": -40.2860107421875, "global_step": 133685, "epoch": 1104} {"train_loss": -38.7172966003418, "global_step": 133686, "epoch": 1104} {"train_loss": -39.55437469482422, "global_step": 133687, "epoch": 1104} {"train_loss": -39.675960540771484, "global_step": 133688, "epoch": 1104} {"train_loss": -40.43471145629883, "global_step": 133689, "epoch": 1104} {"train_loss": -39.96677780151367, "global_step": 133690, "epoch": 1104} {"train_loss": -40.24679183959961, "global_step": 133691, "epoch": 1104} {"train_loss": -40.40192794799805, "global_step": 133692, "epoch": 1104} {"train_loss": -40.634647369384766, "global_step": 133693, "epoch": 1104} {"train_loss": -40.443668365478516, "global_step": 133694, "epoch": 1104} {"train_loss": -39.84740447998047, "global_step": 133695, "epoch": 1104} {"train_loss": -40.465484619140625, "global_step": 133696, "epoch": 1104} {"train_loss": -40.230953216552734, "global_step": 133697, "epoch": 1104} {"train_loss": -40.390987396240234, "global_step": 133698, "epoch": 1104} {"train_loss": -40.02903366088867, "global_step": 133699, "epoch": 1104} {"train_loss": -40.2061882019043, "global_step": 133700, "epoch": 1104} {"train_loss": -39.37315368652344, "global_step": 133701, "epoch": 1104} {"train_loss": -40.419960021972656, "global_step": 133702, "epoch": 1104} {"train_loss": -40.019935607910156, "global_step": 133703, "epoch": 1104} {"train_loss": -39.19651138683981, "global_step": 133704, "epoch": 1104, "val_loss": 2602544.25} {"train_loss": -40.49990463256836, "global_step": 133705, "epoch": 1105} {"train_loss": -40.532325744628906, "global_step": 133706, "epoch": 1105} {"train_loss": -40.85310745239258, "global_step": 133707, "epoch": 1105} {"train_loss": -40.090572357177734, "global_step": 133708, "epoch": 1105} {"train_loss": -40.2735595703125, "global_step": 133709, "epoch": 1105} {"train_loss": -39.030311584472656, "global_step": 133710, "epoch": 1105} {"train_loss": -39.04526901245117, "global_step": 133711, "epoch": 1105} {"train_loss": -39.294471740722656, "global_step": 133712, "epoch": 1105} {"train_loss": -40.132110595703125, "global_step": 133713, "epoch": 1105} {"train_loss": -40.75933074951172, "global_step": 133714, "epoch": 1105} {"train_loss": -39.592262268066406, "global_step": 133715, "epoch": 1105} {"train_loss": -39.31142044067383, "global_step": 133716, "epoch": 1105} {"train_loss": -39.506771087646484, "global_step": 133717, "epoch": 1105} {"train_loss": -37.56397247314453, "global_step": 133718, "epoch": 1105} {"train_loss": -38.79511260986328, "global_step": 133719, "epoch": 1105} {"train_loss": -38.18086624145508, "global_step": 133720, "epoch": 1105} {"train_loss": -38.84845733642578, "global_step": 133721, "epoch": 1105} {"train_loss": -38.11128616333008, "global_step": 133722, "epoch": 1105} {"train_loss": -37.799198150634766, "global_step": 133723, "epoch": 1105} {"train_loss": -40.64603805541992, "global_step": 133724, "epoch": 1105} {"train_loss": -38.697139739990234, "global_step": 133725, "epoch": 1105} {"train_loss": -33.32158660888672, "global_step": 133726, "epoch": 1105} {"train_loss": -32.5389289855957, "global_step": 133727, "epoch": 1105} {"train_loss": -36.803043365478516, "global_step": 133728, "epoch": 1105} {"train_loss": -39.226356506347656, "global_step": 133729, "epoch": 1105} {"train_loss": -37.280941009521484, "global_step": 133730, "epoch": 1105} {"train_loss": -35.78841018676758, "global_step": 133731, "epoch": 1105} {"train_loss": -37.28113555908203, "global_step": 133732, "epoch": 1105} {"train_loss": -33.71272659301758, "global_step": 133733, "epoch": 1105} {"train_loss": -36.345027923583984, "global_step": 133734, "epoch": 1105} {"train_loss": -35.967166900634766, "global_step": 133735, "epoch": 1105} {"train_loss": -34.739540100097656, "global_step": 133736, "epoch": 1105} {"train_loss": -36.66571044921875, "global_step": 133737, "epoch": 1105} {"train_loss": -36.5731315612793, "global_step": 133738, "epoch": 1105} {"train_loss": -36.04833984375, "global_step": 133739, "epoch": 1105} {"train_loss": -30.495925903320312, "global_step": 133740, "epoch": 1105} {"train_loss": -35.66105270385742, "global_step": 133741, "epoch": 1105} {"train_loss": -35.712074279785156, "global_step": 133742, "epoch": 1105} {"train_loss": -35.5634651184082, "global_step": 133743, "epoch": 1105} {"train_loss": -32.953678131103516, "global_step": 133744, "epoch": 1105} {"train_loss": -35.542388916015625, "global_step": 133745, "epoch": 1105} {"train_loss": -35.542022705078125, "global_step": 133746, "epoch": 1105} {"train_loss": -33.8393440246582, "global_step": 133747, "epoch": 1105} {"train_loss": -35.47830581665039, "global_step": 133748, "epoch": 1105} {"train_loss": -34.68913650512695, "global_step": 133749, "epoch": 1105} {"train_loss": -33.93941879272461, "global_step": 133750, "epoch": 1105} {"train_loss": -35.93396759033203, "global_step": 133751, "epoch": 1105} {"train_loss": -36.38029861450195, "global_step": 133752, "epoch": 1105} {"train_loss": -35.20829391479492, "global_step": 133753, "epoch": 1105} {"train_loss": -36.91210174560547, "global_step": 133754, "epoch": 1105} {"train_loss": -36.729705810546875, "global_step": 133755, "epoch": 1105} {"train_loss": -36.92959976196289, "global_step": 133756, "epoch": 1105} {"train_loss": -36.341217041015625, "global_step": 133757, "epoch": 1105} {"train_loss": -37.2823600769043, "global_step": 133758, "epoch": 1105} {"train_loss": -36.816986083984375, "global_step": 133759, "epoch": 1105} {"train_loss": -37.494136810302734, "global_step": 133760, "epoch": 1105} {"train_loss": -36.42106246948242, "global_step": 133761, "epoch": 1105} {"train_loss": -37.04146957397461, "global_step": 133762, "epoch": 1105} {"train_loss": -37.29941940307617, "global_step": 133763, "epoch": 1105} {"train_loss": -35.83333969116211, "global_step": 133764, "epoch": 1105} {"train_loss": -36.610748291015625, "global_step": 133765, "epoch": 1105} {"train_loss": -37.29741287231445, "global_step": 133766, "epoch": 1105} {"train_loss": -37.963436126708984, "global_step": 133767, "epoch": 1105} {"train_loss": -37.65180587768555, "global_step": 133768, "epoch": 1105} {"train_loss": -38.5276985168457, "global_step": 133769, "epoch": 1105} {"train_loss": -37.419288635253906, "global_step": 133770, "epoch": 1105} {"train_loss": -38.16250228881836, "global_step": 133771, "epoch": 1105} {"train_loss": -36.64598083496094, "global_step": 133772, "epoch": 1105} {"train_loss": -37.73999786376953, "global_step": 133773, "epoch": 1105} {"train_loss": -38.04524612426758, "global_step": 133774, "epoch": 1105} {"train_loss": -37.51960372924805, "global_step": 133775, "epoch": 1105} {"train_loss": -37.940731048583984, "global_step": 133776, "epoch": 1105} {"train_loss": -38.31352996826172, "global_step": 133777, "epoch": 1105} {"train_loss": -38.4647331237793, "global_step": 133778, "epoch": 1105} {"train_loss": -38.083526611328125, "global_step": 133779, "epoch": 1105} {"train_loss": -38.54130935668945, "global_step": 133780, "epoch": 1105} {"train_loss": -38.015071868896484, "global_step": 133781, "epoch": 1105} {"train_loss": -38.185428619384766, "global_step": 133782, "epoch": 1105} {"train_loss": -39.21989822387695, "global_step": 133783, "epoch": 1105} {"train_loss": -38.45212936401367, "global_step": 133784, "epoch": 1105} {"train_loss": -39.051918029785156, "global_step": 133785, "epoch": 1105} {"train_loss": -38.73760223388672, "global_step": 133786, "epoch": 1105} {"train_loss": -38.86129379272461, "global_step": 133787, "epoch": 1105} {"train_loss": -38.834102630615234, "global_step": 133788, "epoch": 1105} {"train_loss": -38.89034652709961, "global_step": 133789, "epoch": 1105} {"train_loss": -38.85064697265625, "global_step": 133790, "epoch": 1105} {"train_loss": -37.617950439453125, "global_step": 133791, "epoch": 1105} {"train_loss": -39.20388412475586, "global_step": 133792, "epoch": 1105} {"train_loss": -38.815940856933594, "global_step": 133793, "epoch": 1105} {"train_loss": -38.8315544128418, "global_step": 133794, "epoch": 1105} {"train_loss": -38.96809005737305, "global_step": 133795, "epoch": 1105} {"train_loss": -38.942752838134766, "global_step": 133796, "epoch": 1105} {"train_loss": -39.03413009643555, "global_step": 133797, "epoch": 1105} {"train_loss": -38.75226593017578, "global_step": 133798, "epoch": 1105} {"train_loss": -39.2889404296875, "global_step": 133799, "epoch": 1105} {"train_loss": -39.10390090942383, "global_step": 133800, "epoch": 1105} {"train_loss": -39.6942024230957, "global_step": 133801, "epoch": 1105} {"train_loss": -38.96906280517578, "global_step": 133802, "epoch": 1105} {"train_loss": -38.92936325073242, "global_step": 133803, "epoch": 1105} {"train_loss": -38.81517028808594, "global_step": 133804, "epoch": 1105} {"train_loss": -39.691650390625, "global_step": 133805, "epoch": 1105} {"train_loss": -39.177833557128906, "global_step": 133806, "epoch": 1105} {"train_loss": -38.679744720458984, "global_step": 133807, "epoch": 1105} {"train_loss": -40.02383041381836, "global_step": 133808, "epoch": 1105} {"train_loss": -38.23051834106445, "global_step": 133809, "epoch": 1105} {"train_loss": -39.70745849609375, "global_step": 133810, "epoch": 1105} {"train_loss": -38.31892395019531, "global_step": 133811, "epoch": 1105} {"train_loss": -39.20430374145508, "global_step": 133812, "epoch": 1105} {"train_loss": -39.17759323120117, "global_step": 133813, "epoch": 1105} {"train_loss": -39.40258026123047, "global_step": 133814, "epoch": 1105} {"train_loss": -39.84025192260742, "global_step": 133815, "epoch": 1105} {"train_loss": -39.93785095214844, "global_step": 133816, "epoch": 1105} {"train_loss": -40.33217239379883, "global_step": 133817, "epoch": 1105} {"train_loss": -39.33967208862305, "global_step": 133818, "epoch": 1105} {"train_loss": -39.77908706665039, "global_step": 133819, "epoch": 1105} {"train_loss": -39.68275833129883, "global_step": 133820, "epoch": 1105} {"train_loss": -39.101318359375, "global_step": 133821, "epoch": 1105} {"train_loss": -40.37961196899414, "global_step": 133822, "epoch": 1105} {"train_loss": -40.21635055541992, "global_step": 133823, "epoch": 1105} {"train_loss": -39.74055862426758, "global_step": 133824, "epoch": 1105} {"train_loss": -37.92671257208202, "global_step": 133825, "epoch": 1105, "val_loss": 2660584.75} {"train_loss": -39.92875289916992, "global_step": 133826, "epoch": 1106} {"train_loss": -39.897884368896484, "global_step": 133827, "epoch": 1106} {"train_loss": -39.53837585449219, "global_step": 133828, "epoch": 1106} {"train_loss": -39.75239181518555, "global_step": 133829, "epoch": 1106} {"train_loss": -40.344078063964844, "global_step": 133830, "epoch": 1106} {"train_loss": -39.667537689208984, "global_step": 133831, "epoch": 1106} {"train_loss": -39.1574592590332, "global_step": 133832, "epoch": 1106} {"train_loss": -38.761104583740234, "global_step": 133833, "epoch": 1106} {"train_loss": -38.91999053955078, "global_step": 133834, "epoch": 1106} {"train_loss": -39.43665313720703, "global_step": 133835, "epoch": 1106} {"train_loss": -40.41744613647461, "global_step": 133836, "epoch": 1106} {"train_loss": -40.559303283691406, "global_step": 133837, "epoch": 1106} {"train_loss": -40.06522750854492, "global_step": 133838, "epoch": 1106} {"train_loss": -40.22294998168945, "global_step": 133839, "epoch": 1106} {"train_loss": -39.37004470825195, "global_step": 133840, "epoch": 1106} {"train_loss": -39.34768295288086, "global_step": 133841, "epoch": 1106} {"train_loss": -39.57244873046875, "global_step": 133842, "epoch": 1106} {"train_loss": -39.008846282958984, "global_step": 133843, "epoch": 1106} {"train_loss": -38.76748275756836, "global_step": 133844, "epoch": 1106} {"train_loss": -37.02985382080078, "global_step": 133845, "epoch": 1106} {"train_loss": -35.59779357910156, "global_step": 133846, "epoch": 1106} {"train_loss": -38.7593879699707, "global_step": 133847, "epoch": 1106} {"train_loss": -39.414878845214844, "global_step": 133848, "epoch": 1106} {"train_loss": -37.302494049072266, "global_step": 133849, "epoch": 1106} {"train_loss": -38.682247161865234, "global_step": 133850, "epoch": 1106} {"train_loss": -39.30526351928711, "global_step": 133851, "epoch": 1106} {"train_loss": -38.30167770385742, "global_step": 133852, "epoch": 1106} {"train_loss": -39.233001708984375, "global_step": 133853, "epoch": 1106} {"train_loss": -39.70913314819336, "global_step": 133854, "epoch": 1106} {"train_loss": -38.868675231933594, "global_step": 133855, "epoch": 1106} {"train_loss": -39.37709045410156, "global_step": 133856, "epoch": 1106} {"train_loss": -39.628746032714844, "global_step": 133857, "epoch": 1106} {"train_loss": -38.68608856201172, "global_step": 133858, "epoch": 1106} {"train_loss": -39.13976287841797, "global_step": 133859, "epoch": 1106} {"train_loss": -39.2946891784668, "global_step": 133860, "epoch": 1106} {"train_loss": -40.10853576660156, "global_step": 133861, "epoch": 1106} {"train_loss": -40.27437210083008, "global_step": 133862, "epoch": 1106} {"train_loss": -39.39115524291992, "global_step": 133863, "epoch": 1106} {"train_loss": -39.218753814697266, "global_step": 133864, "epoch": 1106} {"train_loss": -38.800621032714844, "global_step": 133865, "epoch": 1106} {"train_loss": -39.01374816894531, "global_step": 133866, "epoch": 1106} {"train_loss": -39.092220306396484, "global_step": 133867, "epoch": 1106} {"train_loss": -39.285945892333984, "global_step": 133868, "epoch": 1106} {"train_loss": -40.15989303588867, "global_step": 133869, "epoch": 1106} {"train_loss": -39.64691162109375, "global_step": 133870, "epoch": 1106} {"train_loss": -38.4633903503418, "global_step": 133871, "epoch": 1106} {"train_loss": -38.92287063598633, "global_step": 133872, "epoch": 1106} {"train_loss": -38.26226806640625, "global_step": 133873, "epoch": 1106} {"train_loss": -38.15697479248047, "global_step": 133874, "epoch": 1106} {"train_loss": -38.85182571411133, "global_step": 133875, "epoch": 1106} {"train_loss": -38.70266342163086, "global_step": 133876, "epoch": 1106} {"train_loss": -35.61765670776367, "global_step": 133877, "epoch": 1106} {"train_loss": -38.17584991455078, "global_step": 133878, "epoch": 1106} {"train_loss": -34.67644500732422, "global_step": 133879, "epoch": 1106} {"train_loss": -34.474029541015625, "global_step": 133880, "epoch": 1106} {"train_loss": -34.51987838745117, "global_step": 133881, "epoch": 1106} {"train_loss": -38.96076583862305, "global_step": 133882, "epoch": 1106} {"train_loss": -34.227291107177734, "global_step": 133883, "epoch": 1106} {"train_loss": -35.20686721801758, "global_step": 133884, "epoch": 1106} {"train_loss": -36.63357925415039, "global_step": 133885, "epoch": 1106} {"train_loss": -37.911354064941406, "global_step": 133886, "epoch": 1106} {"train_loss": -37.9068717956543, "global_step": 133887, "epoch": 1106} {"train_loss": -38.15964889526367, "global_step": 133888, "epoch": 1106} {"train_loss": -38.688838958740234, "global_step": 133889, "epoch": 1106} {"train_loss": -37.92333984375, "global_step": 133890, "epoch": 1106} {"train_loss": -38.29013442993164, "global_step": 133891, "epoch": 1106} {"train_loss": -37.112762451171875, "global_step": 133892, "epoch": 1106} {"train_loss": -37.483577728271484, "global_step": 133893, "epoch": 1106} {"train_loss": -38.131591796875, "global_step": 133894, "epoch": 1106} {"train_loss": -37.331642150878906, "global_step": 133895, "epoch": 1106} {"train_loss": -38.29049301147461, "global_step": 133896, "epoch": 1106} {"train_loss": -38.644351959228516, "global_step": 133897, "epoch": 1106} {"train_loss": -38.46649932861328, "global_step": 133898, "epoch": 1106} {"train_loss": -38.38193893432617, "global_step": 133899, "epoch": 1106} {"train_loss": -38.761749267578125, "global_step": 133900, "epoch": 1106} {"train_loss": -39.723472595214844, "global_step": 133901, "epoch": 1106} {"train_loss": -38.27171325683594, "global_step": 133902, "epoch": 1106} {"train_loss": -39.52668380737305, "global_step": 133903, "epoch": 1106} {"train_loss": -39.224361419677734, "global_step": 133904, "epoch": 1106} {"train_loss": -38.751251220703125, "global_step": 133905, "epoch": 1106} {"train_loss": -38.65501022338867, "global_step": 133906, "epoch": 1106} {"train_loss": -39.79817581176758, "global_step": 133907, "epoch": 1106} {"train_loss": -39.354068756103516, "global_step": 133908, "epoch": 1106} {"train_loss": -39.07064437866211, "global_step": 133909, "epoch": 1106} {"train_loss": -39.244571685791016, "global_step": 133910, "epoch": 1106} {"train_loss": -39.52424240112305, "global_step": 133911, "epoch": 1106} {"train_loss": -39.410438537597656, "global_step": 133912, "epoch": 1106} {"train_loss": -38.78630828857422, "global_step": 133913, "epoch": 1106} {"train_loss": -39.31972885131836, "global_step": 133914, "epoch": 1106} {"train_loss": -39.74005889892578, "global_step": 133915, "epoch": 1106} {"train_loss": -39.798946380615234, "global_step": 133916, "epoch": 1106} {"train_loss": -38.69157028198242, "global_step": 133917, "epoch": 1106} {"train_loss": -39.87359619140625, "global_step": 133918, "epoch": 1106} {"train_loss": -39.676856994628906, "global_step": 133919, "epoch": 1106} {"train_loss": -39.23895263671875, "global_step": 133920, "epoch": 1106} {"train_loss": -39.707855224609375, "global_step": 133921, "epoch": 1106} {"train_loss": -39.091163635253906, "global_step": 133922, "epoch": 1106} {"train_loss": -40.396942138671875, "global_step": 133923, "epoch": 1106} {"train_loss": -39.88041687011719, "global_step": 133924, "epoch": 1106} {"train_loss": -40.054805755615234, "global_step": 133925, "epoch": 1106} {"train_loss": -39.8786506652832, "global_step": 133926, "epoch": 1106} {"train_loss": -37.90824508666992, "global_step": 133927, "epoch": 1106} {"train_loss": -38.587135314941406, "global_step": 133928, "epoch": 1106} {"train_loss": -39.57009506225586, "global_step": 133929, "epoch": 1106} {"train_loss": -39.777217864990234, "global_step": 133930, "epoch": 1106} {"train_loss": -39.90468215942383, "global_step": 133931, "epoch": 1106} {"train_loss": -39.222171783447266, "global_step": 133932, "epoch": 1106} {"train_loss": -39.82432174682617, "global_step": 133933, "epoch": 1106} {"train_loss": -40.35247802734375, "global_step": 133934, "epoch": 1106} {"train_loss": -39.5802116394043, "global_step": 133935, "epoch": 1106} {"train_loss": -40.29623031616211, "global_step": 133936, "epoch": 1106} {"train_loss": -40.241329193115234, "global_step": 133937, "epoch": 1106} {"train_loss": -38.45191192626953, "global_step": 133938, "epoch": 1106} {"train_loss": -39.699832916259766, "global_step": 133939, "epoch": 1106} {"train_loss": -40.20026779174805, "global_step": 133940, "epoch": 1106} {"train_loss": -40.27385330200195, "global_step": 133941, "epoch": 1106} {"train_loss": -40.080074310302734, "global_step": 133942, "epoch": 1106} {"train_loss": -39.47563934326172, "global_step": 133943, "epoch": 1106} {"train_loss": -40.3851318359375, "global_step": 133944, "epoch": 1106} {"train_loss": -40.04444122314453, "global_step": 133945, "epoch": 1106} {"train_loss": -38.93150793028272, "global_step": 133946, "epoch": 1106, "val_loss": 2608266.75} {"train_loss": -40.21440505981445, "global_step": 133947, "epoch": 1107} {"train_loss": -40.16270065307617, "global_step": 133948, "epoch": 1107} {"train_loss": -36.74382400512695, "global_step": 133949, "epoch": 1107} {"train_loss": -40.07463455200195, "global_step": 133950, "epoch": 1107} {"train_loss": -40.31059646606445, "global_step": 133951, "epoch": 1107} {"train_loss": -39.37131881713867, "global_step": 133952, "epoch": 1107} {"train_loss": -39.205413818359375, "global_step": 133953, "epoch": 1107} {"train_loss": -38.484718322753906, "global_step": 133954, "epoch": 1107} {"train_loss": -39.6596794128418, "global_step": 133955, "epoch": 1107} {"train_loss": -37.67292022705078, "global_step": 133956, "epoch": 1107} {"train_loss": -38.83144760131836, "global_step": 133957, "epoch": 1107} {"train_loss": -39.388423919677734, "global_step": 133958, "epoch": 1107} {"train_loss": -39.80459213256836, "global_step": 133959, "epoch": 1107} {"train_loss": -39.069828033447266, "global_step": 133960, "epoch": 1107} {"train_loss": -39.79273223876953, "global_step": 133961, "epoch": 1107} {"train_loss": -38.097503662109375, "global_step": 133962, "epoch": 1107} {"train_loss": -36.5157356262207, "global_step": 133963, "epoch": 1107} {"train_loss": -36.85273361206055, "global_step": 133964, "epoch": 1107} {"train_loss": -38.27112579345703, "global_step": 133965, "epoch": 1107} {"train_loss": -38.70038604736328, "global_step": 133966, "epoch": 1107} {"train_loss": -39.20146942138672, "global_step": 133967, "epoch": 1107} {"train_loss": -38.07932662963867, "global_step": 133968, "epoch": 1107} {"train_loss": -38.159175872802734, "global_step": 133969, "epoch": 1107} {"train_loss": -38.5462760925293, "global_step": 133970, "epoch": 1107} {"train_loss": -25.045368194580078, "global_step": 133971, "epoch": 1107} {"train_loss": -38.71238708496094, "global_step": 133972, "epoch": 1107} {"train_loss": -37.74996566772461, "global_step": 133973, "epoch": 1107} {"train_loss": -34.79707336425781, "global_step": 133974, "epoch": 1107} {"train_loss": -38.045127868652344, "global_step": 133975, "epoch": 1107} {"train_loss": -37.6302375793457, "global_step": 133976, "epoch": 1107} {"train_loss": -35.71169662475586, "global_step": 133977, "epoch": 1107} {"train_loss": -37.01628494262695, "global_step": 133978, "epoch": 1107} {"train_loss": -37.264949798583984, "global_step": 133979, "epoch": 1107} {"train_loss": -36.7292594909668, "global_step": 133980, "epoch": 1107} {"train_loss": -38.52193832397461, "global_step": 133981, "epoch": 1107} {"train_loss": -36.035919189453125, "global_step": 133982, "epoch": 1107} {"train_loss": -33.72859191894531, "global_step": 133983, "epoch": 1107} {"train_loss": -37.66301727294922, "global_step": 133984, "epoch": 1107} {"train_loss": -35.44730758666992, "global_step": 133985, "epoch": 1107} {"train_loss": -33.23305130004883, "global_step": 133986, "epoch": 1107} {"train_loss": -35.131072998046875, "global_step": 133987, "epoch": 1107} {"train_loss": -37.50333786010742, "global_step": 133988, "epoch": 1107} {"train_loss": -35.70772171020508, "global_step": 133989, "epoch": 1107} {"train_loss": -38.01820755004883, "global_step": 133990, "epoch": 1107} {"train_loss": -35.36697006225586, "global_step": 133991, "epoch": 1107} {"train_loss": -37.1947135925293, "global_step": 133992, "epoch": 1107} {"train_loss": -36.294376373291016, "global_step": 133993, "epoch": 1107} {"train_loss": -36.56446075439453, "global_step": 133994, "epoch": 1107} {"train_loss": -33.87541580200195, "global_step": 133995, "epoch": 1107} {"train_loss": -36.54070281982422, "global_step": 133996, "epoch": 1107} {"train_loss": -37.97685241699219, "global_step": 133997, "epoch": 1107} {"train_loss": -37.2959098815918, "global_step": 133998, "epoch": 1107} {"train_loss": -38.01346969604492, "global_step": 133999, "epoch": 1107} {"train_loss": -38.095882415771484, "global_step": 134000, "epoch": 1107} {"train_loss": -37.317752838134766, "global_step": 134001, "epoch": 1107} {"train_loss": -37.92707061767578, "global_step": 134002, "epoch": 1107} {"train_loss": -37.958213806152344, "global_step": 134003, "epoch": 1107} {"train_loss": -37.684120178222656, "global_step": 134004, "epoch": 1107} {"train_loss": -38.2108268737793, "global_step": 134005, "epoch": 1107} {"train_loss": -38.05030822753906, "global_step": 134006, "epoch": 1107} {"train_loss": -37.41284942626953, "global_step": 134007, "epoch": 1107} {"train_loss": -39.048675537109375, "global_step": 134008, "epoch": 1107} {"train_loss": -37.00553894042969, "global_step": 134009, "epoch": 1107} {"train_loss": -38.476234436035156, "global_step": 134010, "epoch": 1107} {"train_loss": -38.370758056640625, "global_step": 134011, "epoch": 1107} {"train_loss": -38.199615478515625, "global_step": 134012, "epoch": 1107} {"train_loss": -38.25230026245117, "global_step": 134013, "epoch": 1107} {"train_loss": -37.33325958251953, "global_step": 134014, "epoch": 1107} {"train_loss": -37.62428665161133, "global_step": 134015, "epoch": 1107} {"train_loss": -37.8205451965332, "global_step": 134016, "epoch": 1107} {"train_loss": -37.59623336791992, "global_step": 134017, "epoch": 1107} {"train_loss": -38.71303176879883, "global_step": 134018, "epoch": 1107} {"train_loss": -37.02556228637695, "global_step": 134019, "epoch": 1107} {"train_loss": -39.2032585144043, "global_step": 134020, "epoch": 1107} {"train_loss": -37.998077392578125, "global_step": 134021, "epoch": 1107} {"train_loss": -37.99897384643555, "global_step": 134022, "epoch": 1107} {"train_loss": -37.74211502075195, "global_step": 134023, "epoch": 1107} {"train_loss": -38.93031692504883, "global_step": 134024, "epoch": 1107} {"train_loss": -38.656166076660156, "global_step": 134025, "epoch": 1107} {"train_loss": -38.725284576416016, "global_step": 134026, "epoch": 1107} {"train_loss": -38.51785659790039, "global_step": 134027, "epoch": 1107} {"train_loss": -38.7091064453125, "global_step": 134028, "epoch": 1107} {"train_loss": -39.02984619140625, "global_step": 134029, "epoch": 1107} {"train_loss": -37.91154098510742, "global_step": 134030, "epoch": 1107} {"train_loss": -39.073673248291016, "global_step": 134031, "epoch": 1107} {"train_loss": -38.15932846069336, "global_step": 134032, "epoch": 1107} {"train_loss": -39.412322998046875, "global_step": 134033, "epoch": 1107} {"train_loss": -36.55375671386719, "global_step": 134034, "epoch": 1107} {"train_loss": -39.076045989990234, "global_step": 134035, "epoch": 1107} {"train_loss": -38.696266174316406, "global_step": 134036, "epoch": 1107} {"train_loss": -38.21560287475586, "global_step": 134037, "epoch": 1107} {"train_loss": -39.18334197998047, "global_step": 134038, "epoch": 1107} {"train_loss": -39.331783294677734, "global_step": 134039, "epoch": 1107} {"train_loss": -39.29124069213867, "global_step": 134040, "epoch": 1107} {"train_loss": -39.24210739135742, "global_step": 134041, "epoch": 1107} {"train_loss": -39.0408821105957, "global_step": 134042, "epoch": 1107} {"train_loss": -39.451087951660156, "global_step": 134043, "epoch": 1107} {"train_loss": -36.73081588745117, "global_step": 134044, "epoch": 1107} {"train_loss": -39.481300354003906, "global_step": 134045, "epoch": 1107} {"train_loss": -39.213130950927734, "global_step": 134046, "epoch": 1107} {"train_loss": -39.297054290771484, "global_step": 134047, "epoch": 1107} {"train_loss": -39.13329315185547, "global_step": 134048, "epoch": 1107} {"train_loss": -39.77572250366211, "global_step": 134049, "epoch": 1107} {"train_loss": -39.48750686645508, "global_step": 134050, "epoch": 1107} {"train_loss": -38.91653060913086, "global_step": 134051, "epoch": 1107} {"train_loss": -39.72034454345703, "global_step": 134052, "epoch": 1107} {"train_loss": -39.230560302734375, "global_step": 134053, "epoch": 1107} {"train_loss": -39.6673469543457, "global_step": 134054, "epoch": 1107} {"train_loss": -39.3580322265625, "global_step": 134055, "epoch": 1107} {"train_loss": -39.32363510131836, "global_step": 134056, "epoch": 1107} {"train_loss": -39.61334228515625, "global_step": 134057, "epoch": 1107} {"train_loss": -39.512969970703125, "global_step": 134058, "epoch": 1107} {"train_loss": -40.16974639892578, "global_step": 134059, "epoch": 1107} {"train_loss": -39.61508560180664, "global_step": 134060, "epoch": 1107} {"train_loss": -39.47015380859375, "global_step": 134061, "epoch": 1107} {"train_loss": -38.985633850097656, "global_step": 134062, "epoch": 1107} {"train_loss": -39.4428825378418, "global_step": 134063, "epoch": 1107} {"train_loss": -39.741455078125, "global_step": 134064, "epoch": 1107} {"train_loss": -38.38863754272461, "global_step": 134065, "epoch": 1107} {"train_loss": -38.013465881347656, "global_step": 134066, "epoch": 1107} {"train_loss": -38.05171714341345, "global_step": 134067, "epoch": 1107, "val_loss": 2556147.75} {"train_loss": -31.817426681518555, "global_step": 134068, "epoch": 1108} {"train_loss": -30.518293380737305, "global_step": 134069, "epoch": 1108} {"train_loss": -35.7014274597168, "global_step": 134070, "epoch": 1108} {"train_loss": -39.18978500366211, "global_step": 134071, "epoch": 1108} {"train_loss": -38.427486419677734, "global_step": 134072, "epoch": 1108} {"train_loss": -38.671390533447266, "global_step": 134073, "epoch": 1108} {"train_loss": -39.729366302490234, "global_step": 134074, "epoch": 1108} {"train_loss": -38.417781829833984, "global_step": 134075, "epoch": 1108} {"train_loss": -39.20475387573242, "global_step": 134076, "epoch": 1108} {"train_loss": -39.02888107299805, "global_step": 134077, "epoch": 1108} {"train_loss": -39.85034942626953, "global_step": 134078, "epoch": 1108} {"train_loss": -39.55356979370117, "global_step": 134079, "epoch": 1108} {"train_loss": -39.138179779052734, "global_step": 134080, "epoch": 1108} {"train_loss": -39.03322219848633, "global_step": 134081, "epoch": 1108} {"train_loss": -39.03712844848633, "global_step": 134082, "epoch": 1108} {"train_loss": -39.212127685546875, "global_step": 134083, "epoch": 1108} {"train_loss": -39.79347610473633, "global_step": 134084, "epoch": 1108} {"train_loss": -39.48272705078125, "global_step": 134085, "epoch": 1108} {"train_loss": -39.749935150146484, "global_step": 134086, "epoch": 1108} {"train_loss": -39.69306564331055, "global_step": 134087, "epoch": 1108} {"train_loss": -38.76462936401367, "global_step": 134088, "epoch": 1108} {"train_loss": -38.5040397644043, "global_step": 134089, "epoch": 1108} {"train_loss": -40.082271575927734, "global_step": 134090, "epoch": 1108} {"train_loss": -39.48774337768555, "global_step": 134091, "epoch": 1108} {"train_loss": -39.18471908569336, "global_step": 134092, "epoch": 1108} {"train_loss": -38.54841232299805, "global_step": 134093, "epoch": 1108} {"train_loss": -39.72175216674805, "global_step": 134094, "epoch": 1108} {"train_loss": -39.97309494018555, "global_step": 134095, "epoch": 1108} {"train_loss": -37.407386779785156, "global_step": 134096, "epoch": 1108} {"train_loss": -39.35387420654297, "global_step": 134097, "epoch": 1108} {"train_loss": -39.172054290771484, "global_step": 134098, "epoch": 1108} {"train_loss": -39.22465896606445, "global_step": 134099, "epoch": 1108} {"train_loss": -39.51496505737305, "global_step": 134100, "epoch": 1108} {"train_loss": -39.325218200683594, "global_step": 134101, "epoch": 1108} {"train_loss": -39.01655578613281, "global_step": 134102, "epoch": 1108} {"train_loss": -38.21715545654297, "global_step": 134103, "epoch": 1108} {"train_loss": -38.4583854675293, "global_step": 134104, "epoch": 1108} {"train_loss": -39.47631072998047, "global_step": 134105, "epoch": 1108} {"train_loss": -39.59342575073242, "global_step": 134106, "epoch": 1108} {"train_loss": -38.574989318847656, "global_step": 134107, "epoch": 1108} {"train_loss": -35.053863525390625, "global_step": 134108, "epoch": 1108} {"train_loss": -39.31270980834961, "global_step": 134109, "epoch": 1108} {"train_loss": -39.14787673950195, "global_step": 134110, "epoch": 1108} {"train_loss": -38.72864532470703, "global_step": 134111, "epoch": 1108} {"train_loss": -39.0562744140625, "global_step": 134112, "epoch": 1108} {"train_loss": -39.66846466064453, "global_step": 134113, "epoch": 1108} {"train_loss": -40.103511810302734, "global_step": 134114, "epoch": 1108} {"train_loss": -39.230525970458984, "global_step": 134115, "epoch": 1108} {"train_loss": -38.36893844604492, "global_step": 134116, "epoch": 1108} {"train_loss": -39.9091911315918, "global_step": 134117, "epoch": 1108} {"train_loss": -40.06198501586914, "global_step": 134118, "epoch": 1108} {"train_loss": -39.01945114135742, "global_step": 134119, "epoch": 1108} {"train_loss": -39.2045783996582, "global_step": 134120, "epoch": 1108} {"train_loss": -38.078182220458984, "global_step": 134121, "epoch": 1108} {"train_loss": -39.51716232299805, "global_step": 134122, "epoch": 1108} {"train_loss": -37.39570236206055, "global_step": 134123, "epoch": 1108} {"train_loss": -38.926002502441406, "global_step": 134124, "epoch": 1108} {"train_loss": -38.90670394897461, "global_step": 134125, "epoch": 1108} {"train_loss": -39.61808395385742, "global_step": 134126, "epoch": 1108} {"train_loss": -38.989967346191406, "global_step": 134127, "epoch": 1108} {"train_loss": -36.318538665771484, "global_step": 134128, "epoch": 1108} {"train_loss": -39.52245330810547, "global_step": 134129, "epoch": 1108} {"train_loss": -39.31705856323242, "global_step": 134130, "epoch": 1108} {"train_loss": -39.3941650390625, "global_step": 134131, "epoch": 1108} {"train_loss": -39.888458251953125, "global_step": 134132, "epoch": 1108} {"train_loss": -39.06760787963867, "global_step": 134133, "epoch": 1108} {"train_loss": -36.14366149902344, "global_step": 134134, "epoch": 1108} {"train_loss": -39.14557647705078, "global_step": 134135, "epoch": 1108} {"train_loss": -39.73619079589844, "global_step": 134136, "epoch": 1108} {"train_loss": -39.77070236206055, "global_step": 134137, "epoch": 1108} {"train_loss": -39.46595764160156, "global_step": 134138, "epoch": 1108} {"train_loss": -39.394508361816406, "global_step": 134139, "epoch": 1108} {"train_loss": -38.73133087158203, "global_step": 134140, "epoch": 1108} {"train_loss": -39.62543869018555, "global_step": 134141, "epoch": 1108} {"train_loss": -39.488704681396484, "global_step": 134142, "epoch": 1108} {"train_loss": -39.16121292114258, "global_step": 134143, "epoch": 1108} {"train_loss": -37.859291076660156, "global_step": 134144, "epoch": 1108} {"train_loss": -39.74494552612305, "global_step": 134145, "epoch": 1108} {"train_loss": -40.290687561035156, "global_step": 134146, "epoch": 1108} {"train_loss": -39.89069366455078, "global_step": 134147, "epoch": 1108} {"train_loss": -38.61968994140625, "global_step": 134148, "epoch": 1108} {"train_loss": -39.65531539916992, "global_step": 134149, "epoch": 1108} {"train_loss": -35.00869369506836, "global_step": 134150, "epoch": 1108} {"train_loss": -38.89583969116211, "global_step": 134151, "epoch": 1108} {"train_loss": -39.69407272338867, "global_step": 134152, "epoch": 1108} {"train_loss": -37.63826370239258, "global_step": 134153, "epoch": 1108} {"train_loss": -39.07212448120117, "global_step": 134154, "epoch": 1108} {"train_loss": -39.00708770751953, "global_step": 134155, "epoch": 1108} {"train_loss": -39.13874435424805, "global_step": 134156, "epoch": 1108} {"train_loss": -39.64797592163086, "global_step": 134157, "epoch": 1108} {"train_loss": -39.17047882080078, "global_step": 134158, "epoch": 1108} {"train_loss": -39.32659912109375, "global_step": 134159, "epoch": 1108} {"train_loss": -38.53034210205078, "global_step": 134160, "epoch": 1108} {"train_loss": -39.67304229736328, "global_step": 134161, "epoch": 1108} {"train_loss": -39.781551361083984, "global_step": 134162, "epoch": 1108} {"train_loss": -38.519203186035156, "global_step": 134163, "epoch": 1108} {"train_loss": -39.23664474487305, "global_step": 134164, "epoch": 1108} {"train_loss": -39.92948913574219, "global_step": 134165, "epoch": 1108} {"train_loss": -38.67304229736328, "global_step": 134166, "epoch": 1108} {"train_loss": -38.38349914550781, "global_step": 134167, "epoch": 1108} {"train_loss": -39.63832092285156, "global_step": 134168, "epoch": 1108} {"train_loss": -38.728363037109375, "global_step": 134169, "epoch": 1108} {"train_loss": -39.30483627319336, "global_step": 134170, "epoch": 1108} {"train_loss": -39.94662094116211, "global_step": 134171, "epoch": 1108} {"train_loss": -38.06565475463867, "global_step": 134172, "epoch": 1108} {"train_loss": -38.6585693359375, "global_step": 134173, "epoch": 1108} {"train_loss": -39.579017639160156, "global_step": 134174, "epoch": 1108} {"train_loss": -37.96833419799805, "global_step": 134175, "epoch": 1108} {"train_loss": -39.34454345703125, "global_step": 134176, "epoch": 1108} {"train_loss": -39.286746978759766, "global_step": 134177, "epoch": 1108} {"train_loss": -39.832279205322266, "global_step": 134178, "epoch": 1108} {"train_loss": -39.14048767089844, "global_step": 134179, "epoch": 1108} {"train_loss": -40.326045989990234, "global_step": 134180, "epoch": 1108} {"train_loss": -40.13420104980469, "global_step": 134181, "epoch": 1108} {"train_loss": -38.54352951049805, "global_step": 134182, "epoch": 1108} {"train_loss": -39.23293685913086, "global_step": 134183, "epoch": 1108} {"train_loss": -39.38124084472656, "global_step": 134184, "epoch": 1108} {"train_loss": -39.9632682800293, "global_step": 134185, "epoch": 1108} {"train_loss": -38.9699821472168, "global_step": 134186, "epoch": 1108} {"train_loss": -39.83872604370117, "global_step": 134187, "epoch": 1108} {"train_loss": -38.916874341728274, "global_step": 134188, "epoch": 1108, "val_loss": 2712814.75} {"train_loss": -39.54587936401367, "global_step": 134189, "epoch": 1109} {"train_loss": -39.60654067993164, "global_step": 134190, "epoch": 1109} {"train_loss": -40.74892807006836, "global_step": 134191, "epoch": 1109} {"train_loss": -39.88836669921875, "global_step": 134192, "epoch": 1109} {"train_loss": -40.143531799316406, "global_step": 134193, "epoch": 1109} {"train_loss": -40.03696823120117, "global_step": 134194, "epoch": 1109} {"train_loss": -39.9678955078125, "global_step": 134195, "epoch": 1109} {"train_loss": -40.43825149536133, "global_step": 134196, "epoch": 1109} {"train_loss": -39.90656661987305, "global_step": 134197, "epoch": 1109} {"train_loss": -40.27259826660156, "global_step": 134198, "epoch": 1109} {"train_loss": -40.096439361572266, "global_step": 134199, "epoch": 1109} {"train_loss": -39.89976119995117, "global_step": 134200, "epoch": 1109} {"train_loss": -40.350486755371094, "global_step": 134201, "epoch": 1109} {"train_loss": -40.92568588256836, "global_step": 134202, "epoch": 1109} {"train_loss": -40.503807067871094, "global_step": 134203, "epoch": 1109} {"train_loss": -40.74223327636719, "global_step": 134204, "epoch": 1109} {"train_loss": -40.35866928100586, "global_step": 134205, "epoch": 1109} {"train_loss": -39.75508499145508, "global_step": 134206, "epoch": 1109} {"train_loss": -40.12929916381836, "global_step": 134207, "epoch": 1109} {"train_loss": -39.97327423095703, "global_step": 134208, "epoch": 1109} {"train_loss": -39.792720794677734, "global_step": 134209, "epoch": 1109} {"train_loss": -40.31648635864258, "global_step": 134210, "epoch": 1109} {"train_loss": -39.82535171508789, "global_step": 134211, "epoch": 1109} {"train_loss": -40.259033203125, "global_step": 134212, "epoch": 1109} {"train_loss": -40.46403884887695, "global_step": 134213, "epoch": 1109} {"train_loss": -40.95799255371094, "global_step": 134214, "epoch": 1109} {"train_loss": -40.178340911865234, "global_step": 134215, "epoch": 1109} {"train_loss": -40.49287033081055, "global_step": 134216, "epoch": 1109} {"train_loss": -40.242462158203125, "global_step": 134217, "epoch": 1109} {"train_loss": -40.335113525390625, "global_step": 134218, "epoch": 1109} {"train_loss": -40.77309799194336, "global_step": 134219, "epoch": 1109} {"train_loss": -40.14439010620117, "global_step": 134220, "epoch": 1109} {"train_loss": -40.38688278198242, "global_step": 134221, "epoch": 1109} {"train_loss": -40.438777923583984, "global_step": 134222, "epoch": 1109} {"train_loss": -40.830928802490234, "global_step": 134223, "epoch": 1109} {"train_loss": -39.4951057434082, "global_step": 134224, "epoch": 1109} {"train_loss": -39.93729782104492, "global_step": 134225, "epoch": 1109} {"train_loss": -40.46217727661133, "global_step": 134226, "epoch": 1109} {"train_loss": -39.5470085144043, "global_step": 134227, "epoch": 1109} {"train_loss": -39.45437240600586, "global_step": 134228, "epoch": 1109} {"train_loss": -40.1141357421875, "global_step": 134229, "epoch": 1109} {"train_loss": -39.980140686035156, "global_step": 134230, "epoch": 1109} {"train_loss": -38.15668869018555, "global_step": 134231, "epoch": 1109} {"train_loss": -38.567604064941406, "global_step": 134232, "epoch": 1109} {"train_loss": -36.8971061706543, "global_step": 134233, "epoch": 1109} {"train_loss": -35.47384262084961, "global_step": 134234, "epoch": 1109} {"train_loss": -35.072479248046875, "global_step": 134235, "epoch": 1109} {"train_loss": -35.9862174987793, "global_step": 134236, "epoch": 1109} {"train_loss": -38.19802474975586, "global_step": 134237, "epoch": 1109} {"train_loss": -38.84505081176758, "global_step": 134238, "epoch": 1109} {"train_loss": -38.268531799316406, "global_step": 134239, "epoch": 1109} {"train_loss": -38.2220344543457, "global_step": 134240, "epoch": 1109} {"train_loss": -38.8538932800293, "global_step": 134241, "epoch": 1109} {"train_loss": -38.94649124145508, "global_step": 134242, "epoch": 1109} {"train_loss": -37.87251281738281, "global_step": 134243, "epoch": 1109} {"train_loss": -39.521793365478516, "global_step": 134244, "epoch": 1109} {"train_loss": -38.06818771362305, "global_step": 134245, "epoch": 1109} {"train_loss": -37.881866455078125, "global_step": 134246, "epoch": 1109} {"train_loss": -38.956424713134766, "global_step": 134247, "epoch": 1109} {"train_loss": -38.952518463134766, "global_step": 134248, "epoch": 1109} {"train_loss": -38.8928337097168, "global_step": 134249, "epoch": 1109} {"train_loss": -39.84114456176758, "global_step": 134250, "epoch": 1109} {"train_loss": -37.60674285888672, "global_step": 134251, "epoch": 1109} {"train_loss": -37.87648391723633, "global_step": 134252, "epoch": 1109} {"train_loss": -39.14795684814453, "global_step": 134253, "epoch": 1109} {"train_loss": -37.82262420654297, "global_step": 134254, "epoch": 1109} {"train_loss": -37.12725067138672, "global_step": 134255, "epoch": 1109} {"train_loss": -39.36703109741211, "global_step": 134256, "epoch": 1109} {"train_loss": -37.632625579833984, "global_step": 134257, "epoch": 1109} {"train_loss": -38.5118293762207, "global_step": 134258, "epoch": 1109} {"train_loss": -36.805908203125, "global_step": 134259, "epoch": 1109} {"train_loss": -37.83587646484375, "global_step": 134260, "epoch": 1109} {"train_loss": -37.95655059814453, "global_step": 134261, "epoch": 1109} {"train_loss": -38.16933822631836, "global_step": 134262, "epoch": 1109} {"train_loss": -38.731056213378906, "global_step": 134263, "epoch": 1109} {"train_loss": -37.60459518432617, "global_step": 134264, "epoch": 1109} {"train_loss": -37.52091598510742, "global_step": 134265, "epoch": 1109} {"train_loss": -39.328895568847656, "global_step": 134266, "epoch": 1109} {"train_loss": -38.297584533691406, "global_step": 134267, "epoch": 1109} {"train_loss": -39.16389083862305, "global_step": 134268, "epoch": 1109} {"train_loss": -38.12412643432617, "global_step": 134269, "epoch": 1109} {"train_loss": -37.640506744384766, "global_step": 134270, "epoch": 1109} {"train_loss": -38.95759201049805, "global_step": 134271, "epoch": 1109} {"train_loss": -38.81996154785156, "global_step": 134272, "epoch": 1109} {"train_loss": -37.52865219116211, "global_step": 134273, "epoch": 1109} {"train_loss": -39.25761795043945, "global_step": 134274, "epoch": 1109} {"train_loss": -38.88350296020508, "global_step": 134275, "epoch": 1109} {"train_loss": -39.258995056152344, "global_step": 134276, "epoch": 1109} {"train_loss": -39.42402267456055, "global_step": 134277, "epoch": 1109} {"train_loss": -39.772796630859375, "global_step": 134278, "epoch": 1109} {"train_loss": -39.09185791015625, "global_step": 134279, "epoch": 1109} {"train_loss": -38.81247329711914, "global_step": 134280, "epoch": 1109} {"train_loss": -39.84521484375, "global_step": 134281, "epoch": 1109} {"train_loss": -39.81087875366211, "global_step": 134282, "epoch": 1109} {"train_loss": -38.84109878540039, "global_step": 134283, "epoch": 1109} {"train_loss": -39.64492416381836, "global_step": 134284, "epoch": 1109} {"train_loss": -39.933563232421875, "global_step": 134285, "epoch": 1109} {"train_loss": -39.56806564331055, "global_step": 134286, "epoch": 1109} {"train_loss": -39.833984375, "global_step": 134287, "epoch": 1109} {"train_loss": -39.56816482543945, "global_step": 134288, "epoch": 1109} {"train_loss": -36.70096969604492, "global_step": 134289, "epoch": 1109} {"train_loss": -39.45083999633789, "global_step": 134290, "epoch": 1109} {"train_loss": -39.08576583862305, "global_step": 134291, "epoch": 1109} {"train_loss": -39.2738151550293, "global_step": 134292, "epoch": 1109} {"train_loss": -39.36555099487305, "global_step": 134293, "epoch": 1109} {"train_loss": -39.701900482177734, "global_step": 134294, "epoch": 1109} {"train_loss": -40.1258544921875, "global_step": 134295, "epoch": 1109} {"train_loss": -40.01093292236328, "global_step": 134296, "epoch": 1109} {"train_loss": -40.03425216674805, "global_step": 134297, "epoch": 1109} {"train_loss": -39.69656753540039, "global_step": 134298, "epoch": 1109} {"train_loss": -39.40692901611328, "global_step": 134299, "epoch": 1109} {"train_loss": -39.20212936401367, "global_step": 134300, "epoch": 1109} {"train_loss": -36.87954330444336, "global_step": 134301, "epoch": 1109} {"train_loss": -39.62290573120117, "global_step": 134302, "epoch": 1109} {"train_loss": -38.15635299682617, "global_step": 134303, "epoch": 1109} {"train_loss": -38.65034484863281, "global_step": 134304, "epoch": 1109} {"train_loss": -40.33625411987305, "global_step": 134305, "epoch": 1109} {"train_loss": -38.69361877441406, "global_step": 134306, "epoch": 1109} {"train_loss": -39.70408248901367, "global_step": 134307, "epoch": 1109} {"train_loss": -38.73458480834961, "global_step": 134308, "epoch": 1109} {"train_loss": -39.18391361709469, "global_step": 134309, "epoch": 1109, "val_loss": 2510723.5} {"train_loss": -39.46395492553711, "global_step": 134310, "epoch": 1110} {"train_loss": -40.34462356567383, "global_step": 134311, "epoch": 1110} {"train_loss": -39.87916946411133, "global_step": 134312, "epoch": 1110} {"train_loss": -40.059478759765625, "global_step": 134313, "epoch": 1110} {"train_loss": -38.232051849365234, "global_step": 134314, "epoch": 1110} {"train_loss": -39.610992431640625, "global_step": 134315, "epoch": 1110} {"train_loss": -40.14115524291992, "global_step": 134316, "epoch": 1110} {"train_loss": -39.70830154418945, "global_step": 134317, "epoch": 1110} {"train_loss": -40.22575378417969, "global_step": 134318, "epoch": 1110} {"train_loss": -39.83323287963867, "global_step": 134319, "epoch": 1110} {"train_loss": -39.951576232910156, "global_step": 134320, "epoch": 1110} {"train_loss": -39.12810134887695, "global_step": 134321, "epoch": 1110} {"train_loss": -38.83838653564453, "global_step": 134322, "epoch": 1110} {"train_loss": -38.99577713012695, "global_step": 134323, "epoch": 1110} {"train_loss": -39.930458068847656, "global_step": 134324, "epoch": 1110} {"train_loss": -39.281768798828125, "global_step": 134325, "epoch": 1110} {"train_loss": -38.179107666015625, "global_step": 134326, "epoch": 1110} {"train_loss": -39.14310836791992, "global_step": 134327, "epoch": 1110} {"train_loss": -40.11526107788086, "global_step": 134328, "epoch": 1110} {"train_loss": -39.83271026611328, "global_step": 134329, "epoch": 1110} {"train_loss": -39.28643798828125, "global_step": 134330, "epoch": 1110} {"train_loss": -40.166290283203125, "global_step": 134331, "epoch": 1110} {"train_loss": -40.57688522338867, "global_step": 134332, "epoch": 1110} {"train_loss": -40.11740493774414, "global_step": 134333, "epoch": 1110} {"train_loss": -39.913909912109375, "global_step": 134334, "epoch": 1110} {"train_loss": -40.407283782958984, "global_step": 134335, "epoch": 1110} {"train_loss": -39.317787170410156, "global_step": 134336, "epoch": 1110} {"train_loss": -39.75513458251953, "global_step": 134337, "epoch": 1110} {"train_loss": -40.3083610534668, "global_step": 134338, "epoch": 1110} {"train_loss": -39.98799514770508, "global_step": 134339, "epoch": 1110} {"train_loss": -39.24837875366211, "global_step": 134340, "epoch": 1110} {"train_loss": -36.64923858642578, "global_step": 134341, "epoch": 1110} {"train_loss": -35.67988204956055, "global_step": 134342, "epoch": 1110} {"train_loss": -39.20063400268555, "global_step": 134343, "epoch": 1110} {"train_loss": -38.99906539916992, "global_step": 134344, "epoch": 1110} {"train_loss": -37.63124465942383, "global_step": 134345, "epoch": 1110} {"train_loss": -37.70541000366211, "global_step": 134346, "epoch": 1110} {"train_loss": -37.07342529296875, "global_step": 134347, "epoch": 1110} {"train_loss": -40.11792755126953, "global_step": 134348, "epoch": 1110} {"train_loss": -37.72764205932617, "global_step": 134349, "epoch": 1110} {"train_loss": -37.211822509765625, "global_step": 134350, "epoch": 1110} {"train_loss": -37.520511627197266, "global_step": 134351, "epoch": 1110} {"train_loss": -38.59600830078125, "global_step": 134352, "epoch": 1110} {"train_loss": -38.636558532714844, "global_step": 134353, "epoch": 1110} {"train_loss": -37.6343879699707, "global_step": 134354, "epoch": 1110} {"train_loss": -38.128173828125, "global_step": 134355, "epoch": 1110} {"train_loss": -39.91624069213867, "global_step": 134356, "epoch": 1110} {"train_loss": -38.36542510986328, "global_step": 134357, "epoch": 1110} {"train_loss": -39.05927276611328, "global_step": 134358, "epoch": 1110} {"train_loss": -39.33043670654297, "global_step": 134359, "epoch": 1110} {"train_loss": -39.019527435302734, "global_step": 134360, "epoch": 1110} {"train_loss": -39.656620025634766, "global_step": 134361, "epoch": 1110} {"train_loss": -39.126564025878906, "global_step": 134362, "epoch": 1110} {"train_loss": -39.202781677246094, "global_step": 134363, "epoch": 1110} {"train_loss": -38.331783294677734, "global_step": 134364, "epoch": 1110} {"train_loss": -38.58502197265625, "global_step": 134365, "epoch": 1110} {"train_loss": -37.62910079956055, "global_step": 134366, "epoch": 1110} {"train_loss": -40.125545501708984, "global_step": 134367, "epoch": 1110} {"train_loss": -38.450050354003906, "global_step": 134368, "epoch": 1110} {"train_loss": -39.03287887573242, "global_step": 134369, "epoch": 1110} {"train_loss": -39.6660270690918, "global_step": 134370, "epoch": 1110} {"train_loss": -38.8575553894043, "global_step": 134371, "epoch": 1110} {"train_loss": -39.25759506225586, "global_step": 134372, "epoch": 1110} {"train_loss": -39.09133529663086, "global_step": 134373, "epoch": 1110} {"train_loss": -39.45249557495117, "global_step": 134374, "epoch": 1110} {"train_loss": -40.039031982421875, "global_step": 134375, "epoch": 1110} {"train_loss": -40.01296615600586, "global_step": 134376, "epoch": 1110} {"train_loss": -39.946102142333984, "global_step": 134377, "epoch": 1110} {"train_loss": -40.51296615600586, "global_step": 134378, "epoch": 1110} {"train_loss": -39.906463623046875, "global_step": 134379, "epoch": 1110} {"train_loss": -40.22333908081055, "global_step": 134380, "epoch": 1110} {"train_loss": -40.20765686035156, "global_step": 134381, "epoch": 1110} {"train_loss": -40.12070846557617, "global_step": 134382, "epoch": 1110} {"train_loss": -40.06017303466797, "global_step": 134383, "epoch": 1110} {"train_loss": -40.425209045410156, "global_step": 134384, "epoch": 1110} {"train_loss": -40.185791015625, "global_step": 134385, "epoch": 1110} {"train_loss": -40.399166107177734, "global_step": 134386, "epoch": 1110} {"train_loss": -39.80609130859375, "global_step": 134387, "epoch": 1110} {"train_loss": -40.192108154296875, "global_step": 134388, "epoch": 1110} {"train_loss": -39.66457748413086, "global_step": 134389, "epoch": 1110} {"train_loss": -40.81758117675781, "global_step": 134390, "epoch": 1110} {"train_loss": -40.81217956542969, "global_step": 134391, "epoch": 1110} {"train_loss": -40.3458137512207, "global_step": 134392, "epoch": 1110} {"train_loss": -40.49624252319336, "global_step": 134393, "epoch": 1110} {"train_loss": -40.18187713623047, "global_step": 134394, "epoch": 1110} {"train_loss": -37.4079475402832, "global_step": 134395, "epoch": 1110} {"train_loss": -37.4364128112793, "global_step": 134396, "epoch": 1110} {"train_loss": -35.846675872802734, "global_step": 134397, "epoch": 1110} {"train_loss": -31.514968872070312, "global_step": 134398, "epoch": 1110} {"train_loss": -32.9128303527832, "global_step": 134399, "epoch": 1110} {"train_loss": -38.35551071166992, "global_step": 134400, "epoch": 1110} {"train_loss": -39.49058532714844, "global_step": 134401, "epoch": 1110} {"train_loss": -37.711307525634766, "global_step": 134402, "epoch": 1110} {"train_loss": -39.95060729980469, "global_step": 134403, "epoch": 1110} {"train_loss": -39.01968002319336, "global_step": 134404, "epoch": 1110} {"train_loss": -38.95832443237305, "global_step": 134405, "epoch": 1110} {"train_loss": -39.60088348388672, "global_step": 134406, "epoch": 1110} {"train_loss": -38.538055419921875, "global_step": 134407, "epoch": 1110} {"train_loss": -39.969966888427734, "global_step": 134408, "epoch": 1110} {"train_loss": -39.53287887573242, "global_step": 134409, "epoch": 1110} {"train_loss": -40.18741226196289, "global_step": 134410, "epoch": 1110} {"train_loss": -39.58193588256836, "global_step": 134411, "epoch": 1110} {"train_loss": -39.94422149658203, "global_step": 134412, "epoch": 1110} {"train_loss": -39.60736846923828, "global_step": 134413, "epoch": 1110} {"train_loss": -39.740604400634766, "global_step": 134414, "epoch": 1110} {"train_loss": -40.36260986328125, "global_step": 134415, "epoch": 1110} {"train_loss": -40.173439025878906, "global_step": 134416, "epoch": 1110} {"train_loss": -40.28779983520508, "global_step": 134417, "epoch": 1110} {"train_loss": -39.83997344970703, "global_step": 134418, "epoch": 1110} {"train_loss": -39.73850631713867, "global_step": 134419, "epoch": 1110} {"train_loss": -39.25372314453125, "global_step": 134420, "epoch": 1110} {"train_loss": -40.241275787353516, "global_step": 134421, "epoch": 1110} {"train_loss": -40.54197311401367, "global_step": 134422, "epoch": 1110} {"train_loss": -39.00232696533203, "global_step": 134423, "epoch": 1110} {"train_loss": -39.87321090698242, "global_step": 134424, "epoch": 1110} {"train_loss": -38.551597595214844, "global_step": 134425, "epoch": 1110} {"train_loss": -39.66279983520508, "global_step": 134426, "epoch": 1110} {"train_loss": -40.171669006347656, "global_step": 134427, "epoch": 1110} {"train_loss": -39.888309478759766, "global_step": 134428, "epoch": 1110} {"train_loss": -39.711055755615234, "global_step": 134429, "epoch": 1110} {"train_loss": -39.2385738467382, "global_step": 134430, "epoch": 1110, "val_loss": 2668123.0} {"train_loss": -40.20735168457031, "global_step": 134431, "epoch": 1111} {"train_loss": -39.87839889526367, "global_step": 134432, "epoch": 1111} {"train_loss": -39.95487976074219, "global_step": 134433, "epoch": 1111} {"train_loss": -40.247066497802734, "global_step": 134434, "epoch": 1111} {"train_loss": -40.2608642578125, "global_step": 134435, "epoch": 1111} {"train_loss": -40.276973724365234, "global_step": 134436, "epoch": 1111} {"train_loss": -39.57603073120117, "global_step": 134437, "epoch": 1111} {"train_loss": -40.14571762084961, "global_step": 134438, "epoch": 1111} {"train_loss": -40.14148712158203, "global_step": 134439, "epoch": 1111} {"train_loss": -40.05517578125, "global_step": 134440, "epoch": 1111} {"train_loss": -39.807106018066406, "global_step": 134441, "epoch": 1111} {"train_loss": -40.020355224609375, "global_step": 134442, "epoch": 1111} {"train_loss": -40.1549186706543, "global_step": 134443, "epoch": 1111} {"train_loss": -39.65707015991211, "global_step": 134444, "epoch": 1111} {"train_loss": -39.69906997680664, "global_step": 134445, "epoch": 1111} {"train_loss": -39.68889236450195, "global_step": 134446, "epoch": 1111} {"train_loss": -39.77345657348633, "global_step": 134447, "epoch": 1111} {"train_loss": -39.48325729370117, "global_step": 134448, "epoch": 1111} {"train_loss": -39.32183837890625, "global_step": 134449, "epoch": 1111} {"train_loss": -39.759761810302734, "global_step": 134450, "epoch": 1111} {"train_loss": -36.79777908325195, "global_step": 134451, "epoch": 1111} {"train_loss": -36.44023132324219, "global_step": 134452, "epoch": 1111} {"train_loss": -33.55971908569336, "global_step": 134453, "epoch": 1111} {"train_loss": -33.853851318359375, "global_step": 134454, "epoch": 1111} {"train_loss": -35.37135696411133, "global_step": 134455, "epoch": 1111} {"train_loss": -37.66898727416992, "global_step": 134456, "epoch": 1111} {"train_loss": -37.21138381958008, "global_step": 134457, "epoch": 1111} {"train_loss": -38.117733001708984, "global_step": 134458, "epoch": 1111} {"train_loss": -38.29606246948242, "global_step": 134459, "epoch": 1111} {"train_loss": -39.4567756652832, "global_step": 134460, "epoch": 1111} {"train_loss": -37.914588928222656, "global_step": 134461, "epoch": 1111} {"train_loss": -39.55147933959961, "global_step": 134462, "epoch": 1111} {"train_loss": -39.52225875854492, "global_step": 134463, "epoch": 1111} {"train_loss": -39.462013244628906, "global_step": 134464, "epoch": 1111} {"train_loss": -39.50362777709961, "global_step": 134465, "epoch": 1111} {"train_loss": -39.68659973144531, "global_step": 134466, "epoch": 1111} {"train_loss": -39.063289642333984, "global_step": 134467, "epoch": 1111} {"train_loss": -39.370330810546875, "global_step": 134468, "epoch": 1111} {"train_loss": -38.803951263427734, "global_step": 134469, "epoch": 1111} {"train_loss": -39.668888092041016, "global_step": 134470, "epoch": 1111} {"train_loss": -39.62746047973633, "global_step": 134471, "epoch": 1111} {"train_loss": -40.0246696472168, "global_step": 134472, "epoch": 1111} {"train_loss": -39.14533233642578, "global_step": 134473, "epoch": 1111} {"train_loss": -39.53800582885742, "global_step": 134474, "epoch": 1111} {"train_loss": -40.13618850708008, "global_step": 134475, "epoch": 1111} {"train_loss": -40.03852844238281, "global_step": 134476, "epoch": 1111} {"train_loss": -40.6032600402832, "global_step": 134477, "epoch": 1111} {"train_loss": -39.80947494506836, "global_step": 134478, "epoch": 1111} {"train_loss": -39.491065979003906, "global_step": 134479, "epoch": 1111} {"train_loss": -39.467533111572266, "global_step": 134480, "epoch": 1111} {"train_loss": -39.43535232543945, "global_step": 134481, "epoch": 1111} {"train_loss": -39.75859069824219, "global_step": 134482, "epoch": 1111} {"train_loss": -39.636817932128906, "global_step": 134483, "epoch": 1111} {"train_loss": -39.9556884765625, "global_step": 134484, "epoch": 1111} {"train_loss": -39.44021987915039, "global_step": 134485, "epoch": 1111} {"train_loss": -40.07416915893555, "global_step": 134486, "epoch": 1111} {"train_loss": -39.34541702270508, "global_step": 134487, "epoch": 1111} {"train_loss": -39.470458984375, "global_step": 134488, "epoch": 1111} {"train_loss": -40.0584831237793, "global_step": 134489, "epoch": 1111} {"train_loss": -40.0291633605957, "global_step": 134490, "epoch": 1111} {"train_loss": -40.478694915771484, "global_step": 134491, "epoch": 1111} {"train_loss": -39.091609954833984, "global_step": 134492, "epoch": 1111} {"train_loss": -40.38703155517578, "global_step": 134493, "epoch": 1111} {"train_loss": -40.15208053588867, "global_step": 134494, "epoch": 1111} {"train_loss": -40.05660629272461, "global_step": 134495, "epoch": 1111} {"train_loss": -39.592002868652344, "global_step": 134496, "epoch": 1111} {"train_loss": -39.93967819213867, "global_step": 134497, "epoch": 1111} {"train_loss": -39.977840423583984, "global_step": 134498, "epoch": 1111} {"train_loss": -38.33187484741211, "global_step": 134499, "epoch": 1111} {"train_loss": -38.70771408081055, "global_step": 134500, "epoch": 1111} {"train_loss": -39.11295700073242, "global_step": 134501, "epoch": 1111} {"train_loss": -39.165687561035156, "global_step": 134502, "epoch": 1111} {"train_loss": -39.314449310302734, "global_step": 134503, "epoch": 1111} {"train_loss": -40.257503509521484, "global_step": 134504, "epoch": 1111} {"train_loss": -40.39775466918945, "global_step": 134505, "epoch": 1111} {"train_loss": -39.255184173583984, "global_step": 134506, "epoch": 1111} {"train_loss": -40.82601547241211, "global_step": 134507, "epoch": 1111} {"train_loss": -40.622650146484375, "global_step": 134508, "epoch": 1111} {"train_loss": -39.51085662841797, "global_step": 134509, "epoch": 1111} {"train_loss": -39.86617660522461, "global_step": 134510, "epoch": 1111} {"train_loss": -40.32426071166992, "global_step": 134511, "epoch": 1111} {"train_loss": -39.95359420776367, "global_step": 134512, "epoch": 1111} {"train_loss": -36.50515365600586, "global_step": 134513, "epoch": 1111} {"train_loss": -39.703372955322266, "global_step": 134514, "epoch": 1111} {"train_loss": -38.78969955444336, "global_step": 134515, "epoch": 1111} {"train_loss": -39.90141677856445, "global_step": 134516, "epoch": 1111} {"train_loss": -40.06008529663086, "global_step": 134517, "epoch": 1111} {"train_loss": -39.652042388916016, "global_step": 134518, "epoch": 1111} {"train_loss": -39.950050354003906, "global_step": 134519, "epoch": 1111} {"train_loss": -36.91924285888672, "global_step": 134520, "epoch": 1111} {"train_loss": -38.5776481628418, "global_step": 134521, "epoch": 1111} {"train_loss": -39.27415466308594, "global_step": 134522, "epoch": 1111} {"train_loss": -37.7519416809082, "global_step": 134523, "epoch": 1111} {"train_loss": -39.00498580932617, "global_step": 134524, "epoch": 1111} {"train_loss": -38.24151611328125, "global_step": 134525, "epoch": 1111} {"train_loss": -39.09225845336914, "global_step": 134526, "epoch": 1111} {"train_loss": -37.69541931152344, "global_step": 134527, "epoch": 1111} {"train_loss": -39.4033088684082, "global_step": 134528, "epoch": 1111} {"train_loss": -39.65685272216797, "global_step": 134529, "epoch": 1111} {"train_loss": -38.782325744628906, "global_step": 134530, "epoch": 1111} {"train_loss": -38.59711837768555, "global_step": 134531, "epoch": 1111} {"train_loss": -39.34416580200195, "global_step": 134532, "epoch": 1111} {"train_loss": -38.842308044433594, "global_step": 134533, "epoch": 1111} {"train_loss": -38.13833236694336, "global_step": 134534, "epoch": 1111} {"train_loss": -38.848854064941406, "global_step": 134535, "epoch": 1111} {"train_loss": -39.57187271118164, "global_step": 134536, "epoch": 1111} {"train_loss": -38.37073516845703, "global_step": 134537, "epoch": 1111} {"train_loss": -38.751976013183594, "global_step": 134538, "epoch": 1111} {"train_loss": -38.58805847167969, "global_step": 134539, "epoch": 1111} {"train_loss": -39.48452377319336, "global_step": 134540, "epoch": 1111} {"train_loss": -38.33781051635742, "global_step": 134541, "epoch": 1111} {"train_loss": -38.595821380615234, "global_step": 134542, "epoch": 1111} {"train_loss": -39.556854248046875, "global_step": 134543, "epoch": 1111} {"train_loss": -37.51601791381836, "global_step": 134544, "epoch": 1111} {"train_loss": -39.258487701416016, "global_step": 134545, "epoch": 1111} {"train_loss": -39.3752555847168, "global_step": 134546, "epoch": 1111} {"train_loss": -39.17232131958008, "global_step": 134547, "epoch": 1111} {"train_loss": -38.51483917236328, "global_step": 134548, "epoch": 1111} {"train_loss": -39.01338195800781, "global_step": 134549, "epoch": 1111} {"train_loss": -37.16573715209961, "global_step": 134550, "epoch": 1111} {"train_loss": -39.18480102286851, "global_step": 134551, "epoch": 1111, "val_loss": 2572444.75} {"train_loss": -38.098968505859375, "global_step": 134552, "epoch": 1112} {"train_loss": -38.3620491027832, "global_step": 134553, "epoch": 1112} {"train_loss": -37.37076950073242, "global_step": 134554, "epoch": 1112} {"train_loss": -38.30561447143555, "global_step": 134555, "epoch": 1112} {"train_loss": -38.93160629272461, "global_step": 134556, "epoch": 1112} {"train_loss": -38.69380569458008, "global_step": 134557, "epoch": 1112} {"train_loss": -38.85261917114258, "global_step": 134558, "epoch": 1112} {"train_loss": -39.759334564208984, "global_step": 134559, "epoch": 1112} {"train_loss": -39.571468353271484, "global_step": 134560, "epoch": 1112} {"train_loss": -37.022361755371094, "global_step": 134561, "epoch": 1112} {"train_loss": -36.41773223876953, "global_step": 134562, "epoch": 1112} {"train_loss": -37.78203201293945, "global_step": 134563, "epoch": 1112} {"train_loss": -37.915626525878906, "global_step": 134564, "epoch": 1112} {"train_loss": -38.904380798339844, "global_step": 134565, "epoch": 1112} {"train_loss": -38.266143798828125, "global_step": 134566, "epoch": 1112} {"train_loss": -39.045284271240234, "global_step": 134567, "epoch": 1112} {"train_loss": -30.676715850830078, "global_step": 134568, "epoch": 1112} {"train_loss": -38.24272537231445, "global_step": 134569, "epoch": 1112} {"train_loss": -37.455230712890625, "global_step": 134570, "epoch": 1112} {"train_loss": -36.20005416870117, "global_step": 134571, "epoch": 1112} {"train_loss": -36.959468841552734, "global_step": 134572, "epoch": 1112} {"train_loss": -38.89227294921875, "global_step": 134573, "epoch": 1112} {"train_loss": -38.91535568237305, "global_step": 134574, "epoch": 1112} {"train_loss": -36.16015625, "global_step": 134575, "epoch": 1112} {"train_loss": -38.12761688232422, "global_step": 134576, "epoch": 1112} {"train_loss": -38.37255859375, "global_step": 134577, "epoch": 1112} {"train_loss": -38.75596237182617, "global_step": 134578, "epoch": 1112} {"train_loss": -37.790706634521484, "global_step": 134579, "epoch": 1112} {"train_loss": -33.966312408447266, "global_step": 134580, "epoch": 1112} {"train_loss": -39.02525329589844, "global_step": 134581, "epoch": 1112} {"train_loss": -38.79165267944336, "global_step": 134582, "epoch": 1112} {"train_loss": -38.35879135131836, "global_step": 134583, "epoch": 1112} {"train_loss": -39.07950973510742, "global_step": 134584, "epoch": 1112} {"train_loss": -32.84675216674805, "global_step": 134585, "epoch": 1112} {"train_loss": -36.889041900634766, "global_step": 134586, "epoch": 1112} {"train_loss": -34.7767219543457, "global_step": 134587, "epoch": 1112} {"train_loss": -39.602718353271484, "global_step": 134588, "epoch": 1112} {"train_loss": -38.09035873413086, "global_step": 134589, "epoch": 1112} {"train_loss": -39.028377532958984, "global_step": 134590, "epoch": 1112} {"train_loss": -38.88331985473633, "global_step": 134591, "epoch": 1112} {"train_loss": -36.20935821533203, "global_step": 134592, "epoch": 1112} {"train_loss": -37.42839050292969, "global_step": 134593, "epoch": 1112} {"train_loss": -37.92524337768555, "global_step": 134594, "epoch": 1112} {"train_loss": -38.07798385620117, "global_step": 134595, "epoch": 1112} {"train_loss": -36.79681396484375, "global_step": 134596, "epoch": 1112} {"train_loss": -38.76136016845703, "global_step": 134597, "epoch": 1112} {"train_loss": -37.36558151245117, "global_step": 134598, "epoch": 1112} {"train_loss": -36.63916778564453, "global_step": 134599, "epoch": 1112} {"train_loss": -38.1214485168457, "global_step": 134600, "epoch": 1112} {"train_loss": -37.37967300415039, "global_step": 134601, "epoch": 1112} {"train_loss": -37.88314437866211, "global_step": 134602, "epoch": 1112} {"train_loss": -38.7932243347168, "global_step": 134603, "epoch": 1112} {"train_loss": -38.31242752075195, "global_step": 134604, "epoch": 1112} {"train_loss": -38.53499221801758, "global_step": 134605, "epoch": 1112} {"train_loss": -38.580684661865234, "global_step": 134606, "epoch": 1112} {"train_loss": -37.92910385131836, "global_step": 134607, "epoch": 1112} {"train_loss": -38.8507080078125, "global_step": 134608, "epoch": 1112} {"train_loss": -39.5903434753418, "global_step": 134609, "epoch": 1112} {"train_loss": -38.78180694580078, "global_step": 134610, "epoch": 1112} {"train_loss": -38.60995101928711, "global_step": 134611, "epoch": 1112} {"train_loss": -39.13703536987305, "global_step": 134612, "epoch": 1112} {"train_loss": -38.88215637207031, "global_step": 134613, "epoch": 1112} {"train_loss": -39.476444244384766, "global_step": 134614, "epoch": 1112} {"train_loss": -37.882606506347656, "global_step": 134615, "epoch": 1112} {"train_loss": -38.856563568115234, "global_step": 134616, "epoch": 1112} {"train_loss": -39.2877082824707, "global_step": 134617, "epoch": 1112} {"train_loss": -39.64814758300781, "global_step": 134618, "epoch": 1112} {"train_loss": -39.63209915161133, "global_step": 134619, "epoch": 1112} {"train_loss": -39.49615478515625, "global_step": 134620, "epoch": 1112} {"train_loss": -39.8133544921875, "global_step": 134621, "epoch": 1112} {"train_loss": -39.900821685791016, "global_step": 134622, "epoch": 1112} {"train_loss": -39.54890823364258, "global_step": 134623, "epoch": 1112} {"train_loss": -39.92625045776367, "global_step": 134624, "epoch": 1112} {"train_loss": -39.97694396972656, "global_step": 134625, "epoch": 1112} {"train_loss": -39.75968551635742, "global_step": 134626, "epoch": 1112} {"train_loss": -38.783912658691406, "global_step": 134627, "epoch": 1112} {"train_loss": -39.85585403442383, "global_step": 134628, "epoch": 1112} {"train_loss": -39.702430725097656, "global_step": 134629, "epoch": 1112} {"train_loss": -40.27351760864258, "global_step": 134630, "epoch": 1112} {"train_loss": -39.40142822265625, "global_step": 134631, "epoch": 1112} {"train_loss": -39.56526565551758, "global_step": 134632, "epoch": 1112} {"train_loss": -39.61179733276367, "global_step": 134633, "epoch": 1112} {"train_loss": -39.7721061706543, "global_step": 134634, "epoch": 1112} {"train_loss": -39.065181732177734, "global_step": 134635, "epoch": 1112} {"train_loss": -39.835601806640625, "global_step": 134636, "epoch": 1112} {"train_loss": -40.254154205322266, "global_step": 134637, "epoch": 1112} {"train_loss": -40.14216995239258, "global_step": 134638, "epoch": 1112} {"train_loss": -39.5977668762207, "global_step": 134639, "epoch": 1112} {"train_loss": -39.59133529663086, "global_step": 134640, "epoch": 1112} {"train_loss": -40.18976974487305, "global_step": 134641, "epoch": 1112} {"train_loss": -39.9109992980957, "global_step": 134642, "epoch": 1112} {"train_loss": -39.13067626953125, "global_step": 134643, "epoch": 1112} {"train_loss": -39.892364501953125, "global_step": 134644, "epoch": 1112} {"train_loss": -40.1333122253418, "global_step": 134645, "epoch": 1112} {"train_loss": -37.958709716796875, "global_step": 134646, "epoch": 1112} {"train_loss": -40.02747344970703, "global_step": 134647, "epoch": 1112} {"train_loss": -39.300453186035156, "global_step": 134648, "epoch": 1112} {"train_loss": -39.01691436767578, "global_step": 134649, "epoch": 1112} {"train_loss": -39.3167839050293, "global_step": 134650, "epoch": 1112} {"train_loss": -39.05500030517578, "global_step": 134651, "epoch": 1112} {"train_loss": -39.61985397338867, "global_step": 134652, "epoch": 1112} {"train_loss": -40.40130615234375, "global_step": 134653, "epoch": 1112} {"train_loss": -38.1772346496582, "global_step": 134654, "epoch": 1112} {"train_loss": -40.521419525146484, "global_step": 134655, "epoch": 1112} {"train_loss": -38.7678337097168, "global_step": 134656, "epoch": 1112} {"train_loss": -39.34538269042969, "global_step": 134657, "epoch": 1112} {"train_loss": -38.74795913696289, "global_step": 134658, "epoch": 1112} {"train_loss": -38.39617156982422, "global_step": 134659, "epoch": 1112} {"train_loss": -40.16461944580078, "global_step": 134660, "epoch": 1112} {"train_loss": -40.11874771118164, "global_step": 134661, "epoch": 1112} {"train_loss": -38.965721130371094, "global_step": 134662, "epoch": 1112} {"train_loss": -39.373165130615234, "global_step": 134663, "epoch": 1112} {"train_loss": -40.38032150268555, "global_step": 134664, "epoch": 1112} {"train_loss": -39.77537155151367, "global_step": 134665, "epoch": 1112} {"train_loss": -37.35093307495117, "global_step": 134666, "epoch": 1112} {"train_loss": -39.00615692138672, "global_step": 134667, "epoch": 1112} {"train_loss": -39.16660690307617, "global_step": 134668, "epoch": 1112} {"train_loss": -38.462806701660156, "global_step": 134669, "epoch": 1112} {"train_loss": -39.62025451660156, "global_step": 134670, "epoch": 1112} {"train_loss": -38.885833740234375, "global_step": 134671, "epoch": 1112} {"train_loss": -38.63190280504463, "global_step": 134672, "epoch": 1112, "val_loss": 2592932.5} {"train_loss": -38.92780303955078, "global_step": 134673, "epoch": 1113} {"train_loss": -38.93354415893555, "global_step": 134674, "epoch": 1113} {"train_loss": -36.77677917480469, "global_step": 134675, "epoch": 1113} {"train_loss": -38.908729553222656, "global_step": 134676, "epoch": 1113} {"train_loss": -40.16413116455078, "global_step": 134677, "epoch": 1113} {"train_loss": -38.68942642211914, "global_step": 134678, "epoch": 1113} {"train_loss": -38.74230194091797, "global_step": 134679, "epoch": 1113} {"train_loss": -39.4161491394043, "global_step": 134680, "epoch": 1113} {"train_loss": -40.173561096191406, "global_step": 134681, "epoch": 1113} {"train_loss": -39.14384078979492, "global_step": 134682, "epoch": 1113} {"train_loss": -39.6684684753418, "global_step": 134683, "epoch": 1113} {"train_loss": -37.11543655395508, "global_step": 134684, "epoch": 1113} {"train_loss": -37.19791793823242, "global_step": 134685, "epoch": 1113} {"train_loss": -35.119991302490234, "global_step": 134686, "epoch": 1113} {"train_loss": -37.53413009643555, "global_step": 134687, "epoch": 1113} {"train_loss": -36.65117263793945, "global_step": 134688, "epoch": 1113} {"train_loss": -39.71467208862305, "global_step": 134689, "epoch": 1113} {"train_loss": -39.51709747314453, "global_step": 134690, "epoch": 1113} {"train_loss": -38.02425765991211, "global_step": 134691, "epoch": 1113} {"train_loss": -37.59602737426758, "global_step": 134692, "epoch": 1113} {"train_loss": -39.29729461669922, "global_step": 134693, "epoch": 1113} {"train_loss": -38.940940856933594, "global_step": 134694, "epoch": 1113} {"train_loss": -38.376651763916016, "global_step": 134695, "epoch": 1113} {"train_loss": -39.40316390991211, "global_step": 134696, "epoch": 1113} {"train_loss": -39.264705657958984, "global_step": 134697, "epoch": 1113} {"train_loss": -38.34351348876953, "global_step": 134698, "epoch": 1113} {"train_loss": -40.08513641357422, "global_step": 134699, "epoch": 1113} {"train_loss": -39.78718566894531, "global_step": 134700, "epoch": 1113} {"train_loss": -39.908302307128906, "global_step": 134701, "epoch": 1113} {"train_loss": -39.648136138916016, "global_step": 134702, "epoch": 1113} {"train_loss": -37.29069900512695, "global_step": 134703, "epoch": 1113} {"train_loss": -39.5722770690918, "global_step": 134704, "epoch": 1113} {"train_loss": -39.876991271972656, "global_step": 134705, "epoch": 1113} {"train_loss": -39.84351348876953, "global_step": 134706, "epoch": 1113} {"train_loss": -38.81008529663086, "global_step": 134707, "epoch": 1113} {"train_loss": -39.055416107177734, "global_step": 134708, "epoch": 1113} {"train_loss": -39.0507698059082, "global_step": 134709, "epoch": 1113} {"train_loss": -37.87172317504883, "global_step": 134710, "epoch": 1113} {"train_loss": -36.46929931640625, "global_step": 134711, "epoch": 1113} {"train_loss": -38.806121826171875, "global_step": 134712, "epoch": 1113} {"train_loss": -38.27009963989258, "global_step": 134713, "epoch": 1113} {"train_loss": -37.126686096191406, "global_step": 134714, "epoch": 1113} {"train_loss": -32.85637283325195, "global_step": 134715, "epoch": 1113} {"train_loss": -36.74311447143555, "global_step": 134716, "epoch": 1113} {"train_loss": -38.45551681518555, "global_step": 134717, "epoch": 1113} {"train_loss": -36.89557647705078, "global_step": 134718, "epoch": 1113} {"train_loss": -37.56026077270508, "global_step": 134719, "epoch": 1113} {"train_loss": -38.937171936035156, "global_step": 134720, "epoch": 1113} {"train_loss": -36.5518913269043, "global_step": 134721, "epoch": 1113} {"train_loss": -37.42044448852539, "global_step": 134722, "epoch": 1113} {"train_loss": -38.52281188964844, "global_step": 134723, "epoch": 1113} {"train_loss": -38.4004020690918, "global_step": 134724, "epoch": 1113} {"train_loss": -38.93563461303711, "global_step": 134725, "epoch": 1113} {"train_loss": -38.30489730834961, "global_step": 134726, "epoch": 1113} {"train_loss": -38.79836654663086, "global_step": 134727, "epoch": 1113} {"train_loss": -38.90341567993164, "global_step": 134728, "epoch": 1113} {"train_loss": -38.61998748779297, "global_step": 134729, "epoch": 1113} {"train_loss": -39.233524322509766, "global_step": 134730, "epoch": 1113} {"train_loss": -38.88193893432617, "global_step": 134731, "epoch": 1113} {"train_loss": -39.60942459106445, "global_step": 134732, "epoch": 1113} {"train_loss": -39.56629180908203, "global_step": 134733, "epoch": 1113} {"train_loss": -38.76371383666992, "global_step": 134734, "epoch": 1113} {"train_loss": -39.50144577026367, "global_step": 134735, "epoch": 1113} {"train_loss": -38.99101638793945, "global_step": 134736, "epoch": 1113} {"train_loss": -37.76475143432617, "global_step": 134737, "epoch": 1113} {"train_loss": -37.8262939453125, "global_step": 134738, "epoch": 1113} {"train_loss": -39.189453125, "global_step": 134739, "epoch": 1113} {"train_loss": -38.737091064453125, "global_step": 134740, "epoch": 1113} {"train_loss": -39.48594665527344, "global_step": 134741, "epoch": 1113} {"train_loss": -39.20046615600586, "global_step": 134742, "epoch": 1113} {"train_loss": -39.5885124206543, "global_step": 134743, "epoch": 1113} {"train_loss": -38.96875762939453, "global_step": 134744, "epoch": 1113} {"train_loss": -39.89198303222656, "global_step": 134745, "epoch": 1113} {"train_loss": -39.196903228759766, "global_step": 134746, "epoch": 1113} {"train_loss": -39.82239532470703, "global_step": 134747, "epoch": 1113} {"train_loss": -39.0025749206543, "global_step": 134748, "epoch": 1113} {"train_loss": -40.24775314331055, "global_step": 134749, "epoch": 1113} {"train_loss": -38.8537483215332, "global_step": 134750, "epoch": 1113} {"train_loss": -39.513336181640625, "global_step": 134751, "epoch": 1113} {"train_loss": -39.064064025878906, "global_step": 134752, "epoch": 1113} {"train_loss": -39.209835052490234, "global_step": 134753, "epoch": 1113} {"train_loss": -39.43498229980469, "global_step": 134754, "epoch": 1113} {"train_loss": -40.09265899658203, "global_step": 134755, "epoch": 1113} {"train_loss": -39.26760482788086, "global_step": 134756, "epoch": 1113} {"train_loss": -39.51677703857422, "global_step": 134757, "epoch": 1113} {"train_loss": -39.93121337890625, "global_step": 134758, "epoch": 1113} {"train_loss": -40.147743225097656, "global_step": 134759, "epoch": 1113} {"train_loss": -40.08782196044922, "global_step": 134760, "epoch": 1113} {"train_loss": -40.32509231567383, "global_step": 134761, "epoch": 1113} {"train_loss": -39.88792419433594, "global_step": 134762, "epoch": 1113} {"train_loss": -39.943946838378906, "global_step": 134763, "epoch": 1113} {"train_loss": -40.10900115966797, "global_step": 134764, "epoch": 1113} {"train_loss": -39.365211486816406, "global_step": 134765, "epoch": 1113} {"train_loss": -38.649452209472656, "global_step": 134766, "epoch": 1113} {"train_loss": -37.817562103271484, "global_step": 134767, "epoch": 1113} {"train_loss": -38.03871154785156, "global_step": 134768, "epoch": 1113} {"train_loss": -37.1064338684082, "global_step": 134769, "epoch": 1113} {"train_loss": -39.68488693237305, "global_step": 134770, "epoch": 1113} {"train_loss": -39.97291946411133, "global_step": 134771, "epoch": 1113} {"train_loss": -38.57377243041992, "global_step": 134772, "epoch": 1113} {"train_loss": -36.540897369384766, "global_step": 134773, "epoch": 1113} {"train_loss": -38.27458572387695, "global_step": 134774, "epoch": 1113} {"train_loss": -38.88800811767578, "global_step": 134775, "epoch": 1113} {"train_loss": -39.92458724975586, "global_step": 134776, "epoch": 1113} {"train_loss": -40.142513275146484, "global_step": 134777, "epoch": 1113} {"train_loss": -40.5434684753418, "global_step": 134778, "epoch": 1113} {"train_loss": -39.05195236206055, "global_step": 134779, "epoch": 1113} {"train_loss": -39.20587921142578, "global_step": 134780, "epoch": 1113} {"train_loss": -40.09907150268555, "global_step": 134781, "epoch": 1113} {"train_loss": -39.97622299194336, "global_step": 134782, "epoch": 1113} {"train_loss": -40.670345306396484, "global_step": 134783, "epoch": 1113} {"train_loss": -39.82383346557617, "global_step": 134784, "epoch": 1113} {"train_loss": -40.50515365600586, "global_step": 134785, "epoch": 1113} {"train_loss": -33.69072341918945, "global_step": 134786, "epoch": 1113} {"train_loss": -39.21778106689453, "global_step": 134787, "epoch": 1113} {"train_loss": -39.2789306640625, "global_step": 134788, "epoch": 1113} {"train_loss": -39.883052825927734, "global_step": 134789, "epoch": 1113} {"train_loss": -39.0543327331543, "global_step": 134790, "epoch": 1113} {"train_loss": -39.912960052490234, "global_step": 134791, "epoch": 1113} {"train_loss": -39.06716537475586, "global_step": 134792, "epoch": 1113} {"train_loss": -38.845230985278924, "global_step": 134793, "epoch": 1113, "val_loss": 2684988.0} {"train_loss": -39.807533264160156, "global_step": 134794, "epoch": 1114} {"train_loss": -39.90228271484375, "global_step": 134795, "epoch": 1114} {"train_loss": -39.34883499145508, "global_step": 134796, "epoch": 1114} {"train_loss": -39.643062591552734, "global_step": 134797, "epoch": 1114} {"train_loss": -39.57012939453125, "global_step": 134798, "epoch": 1114} {"train_loss": -39.89651107788086, "global_step": 134799, "epoch": 1114} {"train_loss": -38.0953483581543, "global_step": 134800, "epoch": 1114} {"train_loss": -36.916481018066406, "global_step": 134801, "epoch": 1114} {"train_loss": -38.98429870605469, "global_step": 134802, "epoch": 1114} {"train_loss": -39.63201904296875, "global_step": 134803, "epoch": 1114} {"train_loss": -40.19550323486328, "global_step": 134804, "epoch": 1114} {"train_loss": -38.284786224365234, "global_step": 134805, "epoch": 1114} {"train_loss": -39.566768646240234, "global_step": 134806, "epoch": 1114} {"train_loss": -39.47718048095703, "global_step": 134807, "epoch": 1114} {"train_loss": -40.27301788330078, "global_step": 134808, "epoch": 1114} {"train_loss": -40.16459274291992, "global_step": 134809, "epoch": 1114} {"train_loss": -39.2054328918457, "global_step": 134810, "epoch": 1114} {"train_loss": -39.20875930786133, "global_step": 134811, "epoch": 1114} {"train_loss": -36.39912796020508, "global_step": 134812, "epoch": 1114} {"train_loss": -40.16655349731445, "global_step": 134813, "epoch": 1114} {"train_loss": -40.346435546875, "global_step": 134814, "epoch": 1114} {"train_loss": -40.11176300048828, "global_step": 134815, "epoch": 1114} {"train_loss": -40.14944076538086, "global_step": 134816, "epoch": 1114} {"train_loss": -38.44805908203125, "global_step": 134817, "epoch": 1114} {"train_loss": -40.09056091308594, "global_step": 134818, "epoch": 1114} {"train_loss": -40.641517639160156, "global_step": 134819, "epoch": 1114} {"train_loss": -39.64094161987305, "global_step": 134820, "epoch": 1114} {"train_loss": -40.409385681152344, "global_step": 134821, "epoch": 1114} {"train_loss": -39.8584098815918, "global_step": 134822, "epoch": 1114} {"train_loss": -40.21913528442383, "global_step": 134823, "epoch": 1114} {"train_loss": -37.615631103515625, "global_step": 134824, "epoch": 1114} {"train_loss": -39.0648078918457, "global_step": 134825, "epoch": 1114} {"train_loss": -39.78293991088867, "global_step": 134826, "epoch": 1114} {"train_loss": -37.424800872802734, "global_step": 134827, "epoch": 1114} {"train_loss": -40.416748046875, "global_step": 134828, "epoch": 1114} {"train_loss": -40.2485237121582, "global_step": 134829, "epoch": 1114} {"train_loss": -39.72936248779297, "global_step": 134830, "epoch": 1114} {"train_loss": -39.819862365722656, "global_step": 134831, "epoch": 1114} {"train_loss": -39.6761474609375, "global_step": 134832, "epoch": 1114} {"train_loss": -39.98527145385742, "global_step": 134833, "epoch": 1114} {"train_loss": -39.531795501708984, "global_step": 134834, "epoch": 1114} {"train_loss": -40.2015380859375, "global_step": 134835, "epoch": 1114} {"train_loss": -38.62188720703125, "global_step": 134836, "epoch": 1114} {"train_loss": -39.556278228759766, "global_step": 134837, "epoch": 1114} {"train_loss": -38.88325500488281, "global_step": 134838, "epoch": 1114} {"train_loss": -38.39130783081055, "global_step": 134839, "epoch": 1114} {"train_loss": -39.237770080566406, "global_step": 134840, "epoch": 1114} {"train_loss": -39.0329704284668, "global_step": 134841, "epoch": 1114} {"train_loss": -39.33756637573242, "global_step": 134842, "epoch": 1114} {"train_loss": -37.25969314575195, "global_step": 134843, "epoch": 1114} {"train_loss": -39.873260498046875, "global_step": 134844, "epoch": 1114} {"train_loss": -38.77873229980469, "global_step": 134845, "epoch": 1114} {"train_loss": -40.73409652709961, "global_step": 134846, "epoch": 1114} {"train_loss": -40.0676383972168, "global_step": 134847, "epoch": 1114} {"train_loss": -39.93278121948242, "global_step": 134848, "epoch": 1114} {"train_loss": -40.13470458984375, "global_step": 134849, "epoch": 1114} {"train_loss": -40.01310348510742, "global_step": 134850, "epoch": 1114} {"train_loss": -40.903358459472656, "global_step": 134851, "epoch": 1114} {"train_loss": -39.74736404418945, "global_step": 134852, "epoch": 1114} {"train_loss": -39.93703842163086, "global_step": 134853, "epoch": 1114} {"train_loss": -39.4840202331543, "global_step": 134854, "epoch": 1114} {"train_loss": -40.31382369995117, "global_step": 134855, "epoch": 1114} {"train_loss": -39.25960922241211, "global_step": 134856, "epoch": 1114} {"train_loss": -39.335899353027344, "global_step": 134857, "epoch": 1114} {"train_loss": -40.278221130371094, "global_step": 134858, "epoch": 1114} {"train_loss": -39.65971374511719, "global_step": 134859, "epoch": 1114} {"train_loss": -40.44344711303711, "global_step": 134860, "epoch": 1114} {"train_loss": -40.609352111816406, "global_step": 134861, "epoch": 1114} {"train_loss": -40.270545959472656, "global_step": 134862, "epoch": 1114} {"train_loss": -40.18183517456055, "global_step": 134863, "epoch": 1114} {"train_loss": -39.3260383605957, "global_step": 134864, "epoch": 1114} {"train_loss": -39.353214263916016, "global_step": 134865, "epoch": 1114} {"train_loss": -39.77980422973633, "global_step": 134866, "epoch": 1114} {"train_loss": -40.31534957885742, "global_step": 134867, "epoch": 1114} {"train_loss": -40.23566818237305, "global_step": 134868, "epoch": 1114} {"train_loss": -40.010135650634766, "global_step": 134869, "epoch": 1114} {"train_loss": -39.81897735595703, "global_step": 134870, "epoch": 1114} {"train_loss": -39.61013412475586, "global_step": 134871, "epoch": 1114} {"train_loss": -40.48942184448242, "global_step": 134872, "epoch": 1114} {"train_loss": -40.62260055541992, "global_step": 134873, "epoch": 1114} {"train_loss": -39.89296340942383, "global_step": 134874, "epoch": 1114} {"train_loss": -40.35894775390625, "global_step": 134875, "epoch": 1114} {"train_loss": -40.75555419921875, "global_step": 134876, "epoch": 1114} {"train_loss": -40.33232116699219, "global_step": 134877, "epoch": 1114} {"train_loss": -39.9680290222168, "global_step": 134878, "epoch": 1114} {"train_loss": -40.71786880493164, "global_step": 134879, "epoch": 1114} {"train_loss": -40.49958419799805, "global_step": 134880, "epoch": 1114} {"train_loss": -40.131771087646484, "global_step": 134881, "epoch": 1114} {"train_loss": -40.37211990356445, "global_step": 134882, "epoch": 1114} {"train_loss": -39.925018310546875, "global_step": 134883, "epoch": 1114} {"train_loss": -40.20117950439453, "global_step": 134884, "epoch": 1114} {"train_loss": -40.65629196166992, "global_step": 134885, "epoch": 1114} {"train_loss": -40.0750617980957, "global_step": 134886, "epoch": 1114} {"train_loss": -39.89432907104492, "global_step": 134887, "epoch": 1114} {"train_loss": -38.74924850463867, "global_step": 134888, "epoch": 1114} {"train_loss": -39.53194046020508, "global_step": 134889, "epoch": 1114} {"train_loss": -39.10765838623047, "global_step": 134890, "epoch": 1114} {"train_loss": -39.09716796875, "global_step": 134891, "epoch": 1114} {"train_loss": -38.47297286987305, "global_step": 134892, "epoch": 1114} {"train_loss": -35.56367111206055, "global_step": 134893, "epoch": 1114} {"train_loss": -34.11033248901367, "global_step": 134894, "epoch": 1114} {"train_loss": -37.182342529296875, "global_step": 134895, "epoch": 1114} {"train_loss": -37.17621612548828, "global_step": 134896, "epoch": 1114} {"train_loss": -39.04743576049805, "global_step": 134897, "epoch": 1114} {"train_loss": -39.09089279174805, "global_step": 134898, "epoch": 1114} {"train_loss": -39.404964447021484, "global_step": 134899, "epoch": 1114} {"train_loss": -40.53696823120117, "global_step": 134900, "epoch": 1114} {"train_loss": -39.0452995300293, "global_step": 134901, "epoch": 1114} {"train_loss": -38.37009048461914, "global_step": 134902, "epoch": 1114} {"train_loss": -38.65168762207031, "global_step": 134903, "epoch": 1114} {"train_loss": -39.59456253051758, "global_step": 134904, "epoch": 1114} {"train_loss": -39.22903060913086, "global_step": 134905, "epoch": 1114} {"train_loss": -37.7673225402832, "global_step": 134906, "epoch": 1114} {"train_loss": -38.51609420776367, "global_step": 134907, "epoch": 1114} {"train_loss": -38.73688888549805, "global_step": 134908, "epoch": 1114} {"train_loss": -37.658050537109375, "global_step": 134909, "epoch": 1114} {"train_loss": -39.293094635009766, "global_step": 134910, "epoch": 1114} {"train_loss": -39.8258056640625, "global_step": 134911, "epoch": 1114} {"train_loss": -37.9296760559082, "global_step": 134912, "epoch": 1114} {"train_loss": -28.130374908447266, "global_step": 134913, "epoch": 1114} {"train_loss": -39.32458565451882, "global_step": 134914, "epoch": 1114, "val_loss": 2655456.25} {"train_loss": -38.69639205932617, "global_step": 134915, "epoch": 1115} {"train_loss": -39.50020217895508, "global_step": 134916, "epoch": 1115} {"train_loss": -33.4546012878418, "global_step": 134917, "epoch": 1115} {"train_loss": -37.5098991394043, "global_step": 134918, "epoch": 1115} {"train_loss": -37.342872619628906, "global_step": 134919, "epoch": 1115} {"train_loss": -38.329734802246094, "global_step": 134920, "epoch": 1115} {"train_loss": -35.48954772949219, "global_step": 134921, "epoch": 1115} {"train_loss": -38.83173370361328, "global_step": 134922, "epoch": 1115} {"train_loss": -38.81599044799805, "global_step": 134923, "epoch": 1115} {"train_loss": -36.191890716552734, "global_step": 134924, "epoch": 1115} {"train_loss": -37.35847091674805, "global_step": 134925, "epoch": 1115} {"train_loss": -36.5827522277832, "global_step": 134926, "epoch": 1115} {"train_loss": -37.79897689819336, "global_step": 134927, "epoch": 1115} {"train_loss": -36.07902526855469, "global_step": 134928, "epoch": 1115} {"train_loss": -35.615596771240234, "global_step": 134929, "epoch": 1115} {"train_loss": -37.06645965576172, "global_step": 134930, "epoch": 1115} {"train_loss": -38.69112014770508, "global_step": 134931, "epoch": 1115} {"train_loss": -37.27145767211914, "global_step": 134932, "epoch": 1115} {"train_loss": -37.31221389770508, "global_step": 134933, "epoch": 1115} {"train_loss": -33.625816345214844, "global_step": 134934, "epoch": 1115} {"train_loss": -36.1671257019043, "global_step": 134935, "epoch": 1115} {"train_loss": -37.172882080078125, "global_step": 134936, "epoch": 1115} {"train_loss": -38.51997756958008, "global_step": 134937, "epoch": 1115} {"train_loss": -37.9633903503418, "global_step": 134938, "epoch": 1115} {"train_loss": -35.726165771484375, "global_step": 134939, "epoch": 1115} {"train_loss": -36.628570556640625, "global_step": 134940, "epoch": 1115} {"train_loss": -37.83883285522461, "global_step": 134941, "epoch": 1115} {"train_loss": -36.09931945800781, "global_step": 134942, "epoch": 1115} {"train_loss": -33.51723098754883, "global_step": 134943, "epoch": 1115} {"train_loss": -37.83051681518555, "global_step": 134944, "epoch": 1115} {"train_loss": -36.04450607299805, "global_step": 134945, "epoch": 1115} {"train_loss": -37.585060119628906, "global_step": 134946, "epoch": 1115} {"train_loss": -38.98761749267578, "global_step": 134947, "epoch": 1115} {"train_loss": -37.392913818359375, "global_step": 134948, "epoch": 1115} {"train_loss": -38.26633834838867, "global_step": 134949, "epoch": 1115} {"train_loss": -38.454524993896484, "global_step": 134950, "epoch": 1115} {"train_loss": -37.445899963378906, "global_step": 134951, "epoch": 1115} {"train_loss": -36.64360809326172, "global_step": 134952, "epoch": 1115} {"train_loss": -38.3939208984375, "global_step": 134953, "epoch": 1115} {"train_loss": -38.64616012573242, "global_step": 134954, "epoch": 1115} {"train_loss": -38.925048828125, "global_step": 134955, "epoch": 1115} {"train_loss": -39.03085708618164, "global_step": 134956, "epoch": 1115} {"train_loss": -38.931331634521484, "global_step": 134957, "epoch": 1115} {"train_loss": -38.87476348876953, "global_step": 134958, "epoch": 1115} {"train_loss": -38.93256378173828, "global_step": 134959, "epoch": 1115} {"train_loss": -38.88068771362305, "global_step": 134960, "epoch": 1115} {"train_loss": -38.986061096191406, "global_step": 134961, "epoch": 1115} {"train_loss": -38.86843490600586, "global_step": 134962, "epoch": 1115} {"train_loss": -38.9010124206543, "global_step": 134963, "epoch": 1115} {"train_loss": -39.385475158691406, "global_step": 134964, "epoch": 1115} {"train_loss": -39.49872970581055, "global_step": 134965, "epoch": 1115} {"train_loss": -38.93471145629883, "global_step": 134966, "epoch": 1115} {"train_loss": -39.608638763427734, "global_step": 134967, "epoch": 1115} {"train_loss": -39.41179275512695, "global_step": 134968, "epoch": 1115} {"train_loss": -39.73786163330078, "global_step": 134969, "epoch": 1115} {"train_loss": -39.75661849975586, "global_step": 134970, "epoch": 1115} {"train_loss": -39.35490036010742, "global_step": 134971, "epoch": 1115} {"train_loss": -39.377685546875, "global_step": 134972, "epoch": 1115} {"train_loss": -39.28703689575195, "global_step": 134973, "epoch": 1115} {"train_loss": -39.75193405151367, "global_step": 134974, "epoch": 1115} {"train_loss": -40.025550842285156, "global_step": 134975, "epoch": 1115} {"train_loss": -39.625587463378906, "global_step": 134976, "epoch": 1115} {"train_loss": -39.68770217895508, "global_step": 134977, "epoch": 1115} {"train_loss": -39.19193649291992, "global_step": 134978, "epoch": 1115} {"train_loss": -39.44409942626953, "global_step": 134979, "epoch": 1115} {"train_loss": -39.09710693359375, "global_step": 134980, "epoch": 1115} {"train_loss": -39.853275299072266, "global_step": 134981, "epoch": 1115} {"train_loss": -39.07842254638672, "global_step": 134982, "epoch": 1115} {"train_loss": -39.92537307739258, "global_step": 134983, "epoch": 1115} {"train_loss": -39.621734619140625, "global_step": 134984, "epoch": 1115} {"train_loss": -40.383426666259766, "global_step": 134985, "epoch": 1115} {"train_loss": -40.38833236694336, "global_step": 134986, "epoch": 1115} {"train_loss": -40.133522033691406, "global_step": 134987, "epoch": 1115} {"train_loss": -40.21384048461914, "global_step": 134988, "epoch": 1115} {"train_loss": -39.30582809448242, "global_step": 134989, "epoch": 1115} {"train_loss": -39.464576721191406, "global_step": 134990, "epoch": 1115} {"train_loss": -40.41718673706055, "global_step": 134991, "epoch": 1115} {"train_loss": -40.035675048828125, "global_step": 134992, "epoch": 1115} {"train_loss": -40.467010498046875, "global_step": 134993, "epoch": 1115} {"train_loss": -40.3902473449707, "global_step": 134994, "epoch": 1115} {"train_loss": -40.662776947021484, "global_step": 134995, "epoch": 1115} {"train_loss": -40.25779342651367, "global_step": 134996, "epoch": 1115} {"train_loss": -40.42777633666992, "global_step": 134997, "epoch": 1115} {"train_loss": -40.70058059692383, "global_step": 134998, "epoch": 1115} {"train_loss": -40.49153518676758, "global_step": 134999, "epoch": 1115} {"train_loss": -39.710792541503906, "global_step": 135000, "epoch": 1115} {"train_loss": -40.95216369628906, "global_step": 135001, "epoch": 1115} {"train_loss": -40.64945602416992, "global_step": 135002, "epoch": 1115} {"train_loss": -40.630916595458984, "global_step": 135003, "epoch": 1115} {"train_loss": -40.3746452331543, "global_step": 135004, "epoch": 1115} {"train_loss": -40.2173957824707, "global_step": 135005, "epoch": 1115} {"train_loss": -40.48760223388672, "global_step": 135006, "epoch": 1115} {"train_loss": -39.94804000854492, "global_step": 135007, "epoch": 1115} {"train_loss": -39.562015533447266, "global_step": 135008, "epoch": 1115} {"train_loss": -39.91313552856445, "global_step": 135009, "epoch": 1115} {"train_loss": -39.94906234741211, "global_step": 135010, "epoch": 1115} {"train_loss": -39.30324935913086, "global_step": 135011, "epoch": 1115} {"train_loss": -40.25501251220703, "global_step": 135012, "epoch": 1115} {"train_loss": -39.99007034301758, "global_step": 135013, "epoch": 1115} {"train_loss": -40.516117095947266, "global_step": 135014, "epoch": 1115} {"train_loss": -39.151519775390625, "global_step": 135015, "epoch": 1115} {"train_loss": -39.31468963623047, "global_step": 135016, "epoch": 1115} {"train_loss": -37.63072204589844, "global_step": 135017, "epoch": 1115} {"train_loss": -34.842918395996094, "global_step": 135018, "epoch": 1115} {"train_loss": -31.03753089904785, "global_step": 135019, "epoch": 1115} {"train_loss": -34.96320343017578, "global_step": 135020, "epoch": 1115} {"train_loss": -39.355377197265625, "global_step": 135021, "epoch": 1115} {"train_loss": -37.73312759399414, "global_step": 135022, "epoch": 1115} {"train_loss": -37.86738204956055, "global_step": 135023, "epoch": 1115} {"train_loss": -37.533302307128906, "global_step": 135024, "epoch": 1115} {"train_loss": -38.53711700439453, "global_step": 135025, "epoch": 1115} {"train_loss": -38.79415512084961, "global_step": 135026, "epoch": 1115} {"train_loss": -36.60951232910156, "global_step": 135027, "epoch": 1115} {"train_loss": -37.698944091796875, "global_step": 135028, "epoch": 1115} {"train_loss": -39.47819137573242, "global_step": 135029, "epoch": 1115} {"train_loss": -38.98477554321289, "global_step": 135030, "epoch": 1115} {"train_loss": -39.415443420410156, "global_step": 135031, "epoch": 1115} {"train_loss": -39.22587203979492, "global_step": 135032, "epoch": 1115} {"train_loss": -38.78907775878906, "global_step": 135033, "epoch": 1115} {"train_loss": -39.81676483154297, "global_step": 135034, "epoch": 1115} {"train_loss": -38.57715337138531, "global_step": 135035, "epoch": 1115, "val_loss": 2621105.0} {"train_loss": -40.00288009643555, "global_step": 135036, "epoch": 1116} {"train_loss": -40.24558639526367, "global_step": 135037, "epoch": 1116} {"train_loss": -40.112911224365234, "global_step": 135038, "epoch": 1116} {"train_loss": -39.4940299987793, "global_step": 135039, "epoch": 1116} {"train_loss": -40.934993743896484, "global_step": 135040, "epoch": 1116} {"train_loss": -39.842960357666016, "global_step": 135041, "epoch": 1116} {"train_loss": -40.1412353515625, "global_step": 135042, "epoch": 1116} {"train_loss": -40.16358184814453, "global_step": 135043, "epoch": 1116} {"train_loss": -39.182373046875, "global_step": 135044, "epoch": 1116} {"train_loss": -40.07477951049805, "global_step": 135045, "epoch": 1116} {"train_loss": -40.00398635864258, "global_step": 135046, "epoch": 1116} {"train_loss": -40.0396614074707, "global_step": 135047, "epoch": 1116} {"train_loss": -39.45954132080078, "global_step": 135048, "epoch": 1116} {"train_loss": -39.76008224487305, "global_step": 135049, "epoch": 1116} {"train_loss": -39.07271194458008, "global_step": 135050, "epoch": 1116} {"train_loss": -39.5892333984375, "global_step": 135051, "epoch": 1116} {"train_loss": -39.605255126953125, "global_step": 135052, "epoch": 1116} {"train_loss": -39.73763656616211, "global_step": 135053, "epoch": 1116} {"train_loss": -39.38726806640625, "global_step": 135054, "epoch": 1116} {"train_loss": -39.89512634277344, "global_step": 135055, "epoch": 1116} {"train_loss": -39.083160400390625, "global_step": 135056, "epoch": 1116} {"train_loss": -37.96913528442383, "global_step": 135057, "epoch": 1116} {"train_loss": -35.8869514465332, "global_step": 135058, "epoch": 1116} {"train_loss": -36.2519416809082, "global_step": 135059, "epoch": 1116} {"train_loss": -39.425811767578125, "global_step": 135060, "epoch": 1116} {"train_loss": -39.54642868041992, "global_step": 135061, "epoch": 1116} {"train_loss": -39.36847686767578, "global_step": 135062, "epoch": 1116} {"train_loss": -38.99001693725586, "global_step": 135063, "epoch": 1116} {"train_loss": -39.77204513549805, "global_step": 135064, "epoch": 1116} {"train_loss": -39.73637008666992, "global_step": 135065, "epoch": 1116} {"train_loss": -39.95182800292969, "global_step": 135066, "epoch": 1116} {"train_loss": -39.203216552734375, "global_step": 135067, "epoch": 1116} {"train_loss": -40.104103088378906, "global_step": 135068, "epoch": 1116} {"train_loss": -39.28371810913086, "global_step": 135069, "epoch": 1116} {"train_loss": -40.27830123901367, "global_step": 135070, "epoch": 1116} {"train_loss": -39.56989669799805, "global_step": 135071, "epoch": 1116} {"train_loss": -40.3349494934082, "global_step": 135072, "epoch": 1116} {"train_loss": -39.7717170715332, "global_step": 135073, "epoch": 1116} {"train_loss": -38.875308990478516, "global_step": 135074, "epoch": 1116} {"train_loss": -40.41364669799805, "global_step": 135075, "epoch": 1116} {"train_loss": -39.67096710205078, "global_step": 135076, "epoch": 1116} {"train_loss": -39.69086837768555, "global_step": 135077, "epoch": 1116} {"train_loss": -40.0256233215332, "global_step": 135078, "epoch": 1116} {"train_loss": -39.90127182006836, "global_step": 135079, "epoch": 1116} {"train_loss": -40.182342529296875, "global_step": 135080, "epoch": 1116} {"train_loss": -40.3795280456543, "global_step": 135081, "epoch": 1116} {"train_loss": -40.41192626953125, "global_step": 135082, "epoch": 1116} {"train_loss": -40.15983963012695, "global_step": 135083, "epoch": 1116} {"train_loss": -39.101959228515625, "global_step": 135084, "epoch": 1116} {"train_loss": -40.12687683105469, "global_step": 135085, "epoch": 1116} {"train_loss": -39.36775207519531, "global_step": 135086, "epoch": 1116} {"train_loss": -38.992103576660156, "global_step": 135087, "epoch": 1116} {"train_loss": -38.97971725463867, "global_step": 135088, "epoch": 1116} {"train_loss": -37.91762924194336, "global_step": 135089, "epoch": 1116} {"train_loss": -38.31459426879883, "global_step": 135090, "epoch": 1116} {"train_loss": -36.68370819091797, "global_step": 135091, "epoch": 1116} {"train_loss": -38.667171478271484, "global_step": 135092, "epoch": 1116} {"train_loss": -36.452415466308594, "global_step": 135093, "epoch": 1116} {"train_loss": -37.347896575927734, "global_step": 135094, "epoch": 1116} {"train_loss": -36.15570068359375, "global_step": 135095, "epoch": 1116} {"train_loss": -38.8951301574707, "global_step": 135096, "epoch": 1116} {"train_loss": -36.070743560791016, "global_step": 135097, "epoch": 1116} {"train_loss": -38.3448600769043, "global_step": 135098, "epoch": 1116} {"train_loss": -35.64085006713867, "global_step": 135099, "epoch": 1116} {"train_loss": -36.714046478271484, "global_step": 135100, "epoch": 1116} {"train_loss": -35.8951530456543, "global_step": 135101, "epoch": 1116} {"train_loss": -37.67507553100586, "global_step": 135102, "epoch": 1116} {"train_loss": -37.740745544433594, "global_step": 135103, "epoch": 1116} {"train_loss": -39.50167465209961, "global_step": 135104, "epoch": 1116} {"train_loss": -38.42696762084961, "global_step": 135105, "epoch": 1116} {"train_loss": -38.96474838256836, "global_step": 135106, "epoch": 1116} {"train_loss": -39.05964660644531, "global_step": 135107, "epoch": 1116} {"train_loss": -38.45904541015625, "global_step": 135108, "epoch": 1116} {"train_loss": -38.670867919921875, "global_step": 135109, "epoch": 1116} {"train_loss": -39.87259292602539, "global_step": 135110, "epoch": 1116} {"train_loss": -38.341552734375, "global_step": 135111, "epoch": 1116} {"train_loss": -39.32737731933594, "global_step": 135112, "epoch": 1116} {"train_loss": -37.95137023925781, "global_step": 135113, "epoch": 1116} {"train_loss": -39.149410247802734, "global_step": 135114, "epoch": 1116} {"train_loss": -40.1008415222168, "global_step": 135115, "epoch": 1116} {"train_loss": -39.395240783691406, "global_step": 135116, "epoch": 1116} {"train_loss": -38.523189544677734, "global_step": 135117, "epoch": 1116} {"train_loss": -38.871856689453125, "global_step": 135118, "epoch": 1116} {"train_loss": -37.99343490600586, "global_step": 135119, "epoch": 1116} {"train_loss": -39.25678634643555, "global_step": 135120, "epoch": 1116} {"train_loss": -33.07246780395508, "global_step": 135121, "epoch": 1116} {"train_loss": -38.372596740722656, "global_step": 135122, "epoch": 1116} {"train_loss": -34.61122131347656, "global_step": 135123, "epoch": 1116} {"train_loss": -32.931182861328125, "global_step": 135124, "epoch": 1116} {"train_loss": 15.558173179626465, "global_step": 135125, "epoch": 1116} {"train_loss": -31.33005714416504, "global_step": 135126, "epoch": 1116} {"train_loss": -1.6818069219589233, "global_step": 135127, "epoch": 1116} {"train_loss": 11.953424453735352, "global_step": 135128, "epoch": 1116} {"train_loss": -15.891722679138184, "global_step": 135129, "epoch": 1116} {"train_loss": -13.053122520446777, "global_step": 135130, "epoch": 1116} {"train_loss": -19.64468765258789, "global_step": 135131, "epoch": 1116} {"train_loss": -15.944865226745605, "global_step": 135132, "epoch": 1116} {"train_loss": -18.357208251953125, "global_step": 135133, "epoch": 1116} {"train_loss": -18.0308780670166, "global_step": 135134, "epoch": 1116} {"train_loss": -26.84490966796875, "global_step": 135135, "epoch": 1116} {"train_loss": -28.3397274017334, "global_step": 135136, "epoch": 1116} {"train_loss": -26.347997665405273, "global_step": 135137, "epoch": 1116} {"train_loss": -27.22747802734375, "global_step": 135138, "epoch": 1116} {"train_loss": -27.087738037109375, "global_step": 135139, "epoch": 1116} {"train_loss": -29.844831466674805, "global_step": 135140, "epoch": 1116} {"train_loss": -28.733579635620117, "global_step": 135141, "epoch": 1116} {"train_loss": -23.57244300842285, "global_step": 135142, "epoch": 1116} {"train_loss": -28.194995880126953, "global_step": 135143, "epoch": 1116} {"train_loss": -30.836807250976562, "global_step": 135144, "epoch": 1116} {"train_loss": -30.301477432250977, "global_step": 135145, "epoch": 1116} {"train_loss": -31.048614501953125, "global_step": 135146, "epoch": 1116} {"train_loss": -31.80266761779785, "global_step": 135147, "epoch": 1116} {"train_loss": -32.6275520324707, "global_step": 135148, "epoch": 1116} {"train_loss": -30.3123779296875, "global_step": 135149, "epoch": 1116} {"train_loss": -31.23872184753418, "global_step": 135150, "epoch": 1116} {"train_loss": -32.25187301635742, "global_step": 135151, "epoch": 1116} {"train_loss": -32.194862365722656, "global_step": 135152, "epoch": 1116} {"train_loss": -32.659698486328125, "global_step": 135153, "epoch": 1116} {"train_loss": -33.23902130126953, "global_step": 135154, "epoch": 1116} {"train_loss": -33.29359817504883, "global_step": 135155, "epoch": 1116} {"train_loss": -34.91635168386885, "global_step": 135156, "epoch": 1116, "val_loss": 2660797.25} {"train_loss": -32.54395294189453, "global_step": 135157, "epoch": 1117} {"train_loss": -32.49849319458008, "global_step": 135158, "epoch": 1117} {"train_loss": -32.76694869995117, "global_step": 135159, "epoch": 1117} {"train_loss": -32.78377914428711, "global_step": 135160, "epoch": 1117} {"train_loss": -33.55720138549805, "global_step": 135161, "epoch": 1117} {"train_loss": -32.87099838256836, "global_step": 135162, "epoch": 1117} {"train_loss": -33.78386306762695, "global_step": 135163, "epoch": 1117} {"train_loss": -33.281768798828125, "global_step": 135164, "epoch": 1117} {"train_loss": -33.85166931152344, "global_step": 135165, "epoch": 1117} {"train_loss": -32.89934158325195, "global_step": 135166, "epoch": 1117} {"train_loss": -33.17222595214844, "global_step": 135167, "epoch": 1117} {"train_loss": -33.95425033569336, "global_step": 135168, "epoch": 1117} {"train_loss": -32.693695068359375, "global_step": 135169, "epoch": 1117} {"train_loss": -33.70892333984375, "global_step": 135170, "epoch": 1117} {"train_loss": -33.340354919433594, "global_step": 135171, "epoch": 1117} {"train_loss": -33.777809143066406, "global_step": 135172, "epoch": 1117} {"train_loss": -34.44832992553711, "global_step": 135173, "epoch": 1117} {"train_loss": -32.90343475341797, "global_step": 135174, "epoch": 1117} {"train_loss": -34.412574768066406, "global_step": 135175, "epoch": 1117} {"train_loss": -34.5511589050293, "global_step": 135176, "epoch": 1117} {"train_loss": -34.599571228027344, "global_step": 135177, "epoch": 1117} {"train_loss": -34.868221282958984, "global_step": 135178, "epoch": 1117} {"train_loss": -34.404327392578125, "global_step": 135179, "epoch": 1117} {"train_loss": -34.6833610534668, "global_step": 135180, "epoch": 1117} {"train_loss": -34.996883392333984, "global_step": 135181, "epoch": 1117} {"train_loss": -34.97907257080078, "global_step": 135182, "epoch": 1117} {"train_loss": -34.9588737487793, "global_step": 135183, "epoch": 1117} {"train_loss": -34.97550582885742, "global_step": 135184, "epoch": 1117} {"train_loss": -34.78489303588867, "global_step": 135185, "epoch": 1117} {"train_loss": -34.88283157348633, "global_step": 135186, "epoch": 1117} {"train_loss": -34.9423942565918, "global_step": 135187, "epoch": 1117} {"train_loss": -34.33783721923828, "global_step": 135188, "epoch": 1117} {"train_loss": -33.88515090942383, "global_step": 135189, "epoch": 1117} {"train_loss": -34.89927291870117, "global_step": 135190, "epoch": 1117} {"train_loss": -33.58701705932617, "global_step": 135191, "epoch": 1117} {"train_loss": -35.41944122314453, "global_step": 135192, "epoch": 1117} {"train_loss": -35.56925964355469, "global_step": 135193, "epoch": 1117} {"train_loss": -35.47093200683594, "global_step": 135194, "epoch": 1117} {"train_loss": -35.89107131958008, "global_step": 135195, "epoch": 1117} {"train_loss": -34.7723388671875, "global_step": 135196, "epoch": 1117} {"train_loss": -35.974578857421875, "global_step": 135197, "epoch": 1117} {"train_loss": -35.19232940673828, "global_step": 135198, "epoch": 1117} {"train_loss": -34.412654876708984, "global_step": 135199, "epoch": 1117} {"train_loss": -35.338043212890625, "global_step": 135200, "epoch": 1117} {"train_loss": -35.987091064453125, "global_step": 135201, "epoch": 1117} {"train_loss": -35.549354553222656, "global_step": 135202, "epoch": 1117} {"train_loss": -35.52449035644531, "global_step": 135203, "epoch": 1117} {"train_loss": -35.781002044677734, "global_step": 135204, "epoch": 1117} {"train_loss": -35.65800094604492, "global_step": 135205, "epoch": 1117} {"train_loss": -36.076324462890625, "global_step": 135206, "epoch": 1117} {"train_loss": -35.90818405151367, "global_step": 135207, "epoch": 1117} {"train_loss": -36.16340255737305, "global_step": 135208, "epoch": 1117} {"train_loss": -36.32564926147461, "global_step": 135209, "epoch": 1117} {"train_loss": -35.823768615722656, "global_step": 135210, "epoch": 1117} {"train_loss": -36.429420471191406, "global_step": 135211, "epoch": 1117} {"train_loss": -36.54826736450195, "global_step": 135212, "epoch": 1117} {"train_loss": -35.92334747314453, "global_step": 135213, "epoch": 1117} {"train_loss": -36.21516799926758, "global_step": 135214, "epoch": 1117} {"train_loss": -36.355648040771484, "global_step": 135215, "epoch": 1117} {"train_loss": -36.08772659301758, "global_step": 135216, "epoch": 1117} {"train_loss": -35.6911735534668, "global_step": 135217, "epoch": 1117} {"train_loss": -36.553550720214844, "global_step": 135218, "epoch": 1117} {"train_loss": -36.999534606933594, "global_step": 135219, "epoch": 1117} {"train_loss": -36.321598052978516, "global_step": 135220, "epoch": 1117} {"train_loss": -36.498931884765625, "global_step": 135221, "epoch": 1117} {"train_loss": -36.05772018432617, "global_step": 135222, "epoch": 1117} {"train_loss": -36.351234436035156, "global_step": 135223, "epoch": 1117} {"train_loss": -35.710304260253906, "global_step": 135224, "epoch": 1117} {"train_loss": -36.25181579589844, "global_step": 135225, "epoch": 1117} {"train_loss": -36.69158935546875, "global_step": 135226, "epoch": 1117} {"train_loss": -36.81135177612305, "global_step": 135227, "epoch": 1117} {"train_loss": -37.19008255004883, "global_step": 135228, "epoch": 1117} {"train_loss": -36.947383880615234, "global_step": 135229, "epoch": 1117} {"train_loss": -36.82630920410156, "global_step": 135230, "epoch": 1117} {"train_loss": -37.2077522277832, "global_step": 135231, "epoch": 1117} {"train_loss": -36.94917678833008, "global_step": 135232, "epoch": 1117} {"train_loss": -36.893245697021484, "global_step": 135233, "epoch": 1117} {"train_loss": -37.247188568115234, "global_step": 135234, "epoch": 1117} {"train_loss": -36.999446868896484, "global_step": 135235, "epoch": 1117} {"train_loss": -36.96649932861328, "global_step": 135236, "epoch": 1117} {"train_loss": -36.88819122314453, "global_step": 135237, "epoch": 1117} {"train_loss": -36.854408264160156, "global_step": 135238, "epoch": 1117} {"train_loss": -36.98011016845703, "global_step": 135239, "epoch": 1117} {"train_loss": -37.130428314208984, "global_step": 135240, "epoch": 1117} {"train_loss": -37.58607482910156, "global_step": 135241, "epoch": 1117} {"train_loss": -37.67580795288086, "global_step": 135242, "epoch": 1117} {"train_loss": -37.50837326049805, "global_step": 135243, "epoch": 1117} {"train_loss": -37.683937072753906, "global_step": 135244, "epoch": 1117} {"train_loss": -37.2519416809082, "global_step": 135245, "epoch": 1117} {"train_loss": -37.58869552612305, "global_step": 135246, "epoch": 1117} {"train_loss": -36.8310546875, "global_step": 135247, "epoch": 1117} {"train_loss": -37.8387565612793, "global_step": 135248, "epoch": 1117} {"train_loss": -36.9976806640625, "global_step": 135249, "epoch": 1117} {"train_loss": -37.55377197265625, "global_step": 135250, "epoch": 1117} {"train_loss": -37.81959915161133, "global_step": 135251, "epoch": 1117} {"train_loss": -37.56440353393555, "global_step": 135252, "epoch": 1117} {"train_loss": -37.06715393066406, "global_step": 135253, "epoch": 1117} {"train_loss": -37.85342025756836, "global_step": 135254, "epoch": 1117} {"train_loss": -35.972145080566406, "global_step": 135255, "epoch": 1117} {"train_loss": -37.61631774902344, "global_step": 135256, "epoch": 1117} {"train_loss": -37.478187561035156, "global_step": 135257, "epoch": 1117} {"train_loss": -37.74641036987305, "global_step": 135258, "epoch": 1117} {"train_loss": -38.282161712646484, "global_step": 135259, "epoch": 1117} {"train_loss": -37.222450256347656, "global_step": 135260, "epoch": 1117} {"train_loss": -38.247798919677734, "global_step": 135261, "epoch": 1117} {"train_loss": -38.91019821166992, "global_step": 135262, "epoch": 1117} {"train_loss": -38.407596588134766, "global_step": 135263, "epoch": 1117} {"train_loss": -38.3003044128418, "global_step": 135264, "epoch": 1117} {"train_loss": -37.801361083984375, "global_step": 135265, "epoch": 1117} {"train_loss": -38.072120666503906, "global_step": 135266, "epoch": 1117} {"train_loss": -38.18986129760742, "global_step": 135267, "epoch": 1117} {"train_loss": -38.08995056152344, "global_step": 135268, "epoch": 1117} {"train_loss": -37.745174407958984, "global_step": 135269, "epoch": 1117} {"train_loss": -37.94697570800781, "global_step": 135270, "epoch": 1117} {"train_loss": -38.443721771240234, "global_step": 135271, "epoch": 1117} {"train_loss": -37.98177719116211, "global_step": 135272, "epoch": 1117} {"train_loss": -38.246639251708984, "global_step": 135273, "epoch": 1117} {"train_loss": -38.224853515625, "global_step": 135274, "epoch": 1117} {"train_loss": -38.59923553466797, "global_step": 135275, "epoch": 1117} {"train_loss": -38.3249626159668, "global_step": 135276, "epoch": 1117} {"train_loss": -36.04364918480235, "global_step": 135277, "epoch": 1117, "val_loss": 2669279.75} {"train_loss": -38.449729919433594, "global_step": 135278, "epoch": 1118} {"train_loss": -38.210670471191406, "global_step": 135279, "epoch": 1118} {"train_loss": -38.64657974243164, "global_step": 135280, "epoch": 1118} {"train_loss": -38.92607116699219, "global_step": 135281, "epoch": 1118} {"train_loss": -37.96078109741211, "global_step": 135282, "epoch": 1118} {"train_loss": -38.335166931152344, "global_step": 135283, "epoch": 1118} {"train_loss": -38.70344161987305, "global_step": 135284, "epoch": 1118} {"train_loss": -38.00659942626953, "global_step": 135285, "epoch": 1118} {"train_loss": -38.71420669555664, "global_step": 135286, "epoch": 1118} {"train_loss": -39.252830505371094, "global_step": 135287, "epoch": 1118} {"train_loss": -38.61403274536133, "global_step": 135288, "epoch": 1118} {"train_loss": -37.63471984863281, "global_step": 135289, "epoch": 1118} {"train_loss": -38.66970443725586, "global_step": 135290, "epoch": 1118} {"train_loss": -37.82016372680664, "global_step": 135291, "epoch": 1118} {"train_loss": -38.689422607421875, "global_step": 135292, "epoch": 1118} {"train_loss": -38.80795669555664, "global_step": 135293, "epoch": 1118} {"train_loss": -38.208126068115234, "global_step": 135294, "epoch": 1118} {"train_loss": -38.59005355834961, "global_step": 135295, "epoch": 1118} {"train_loss": -39.002784729003906, "global_step": 135296, "epoch": 1118} {"train_loss": -38.748504638671875, "global_step": 135297, "epoch": 1118} {"train_loss": -37.59450912475586, "global_step": 135298, "epoch": 1118} {"train_loss": -36.8029899597168, "global_step": 135299, "epoch": 1118} {"train_loss": -36.965110778808594, "global_step": 135300, "epoch": 1118} {"train_loss": -36.48444747924805, "global_step": 135301, "epoch": 1118} {"train_loss": -35.16372299194336, "global_step": 135302, "epoch": 1118} {"train_loss": -35.27018356323242, "global_step": 135303, "epoch": 1118} {"train_loss": -37.6433219909668, "global_step": 135304, "epoch": 1118} {"train_loss": -38.66645050048828, "global_step": 135305, "epoch": 1118} {"train_loss": -38.33283615112305, "global_step": 135306, "epoch": 1118} {"train_loss": -38.546905517578125, "global_step": 135307, "epoch": 1118} {"train_loss": -39.036502838134766, "global_step": 135308, "epoch": 1118} {"train_loss": -38.578041076660156, "global_step": 135309, "epoch": 1118} {"train_loss": -38.868743896484375, "global_step": 135310, "epoch": 1118} {"train_loss": -38.3178596496582, "global_step": 135311, "epoch": 1118} {"train_loss": -38.4424934387207, "global_step": 135312, "epoch": 1118} {"train_loss": -39.058040618896484, "global_step": 135313, "epoch": 1118} {"train_loss": -38.86872482299805, "global_step": 135314, "epoch": 1118} {"train_loss": -38.61954879760742, "global_step": 135315, "epoch": 1118} {"train_loss": -38.860694885253906, "global_step": 135316, "epoch": 1118} {"train_loss": -39.29877471923828, "global_step": 135317, "epoch": 1118} {"train_loss": -39.008331298828125, "global_step": 135318, "epoch": 1118} {"train_loss": -39.139747619628906, "global_step": 135319, "epoch": 1118} {"train_loss": -39.0679817199707, "global_step": 135320, "epoch": 1118} {"train_loss": -38.477516174316406, "global_step": 135321, "epoch": 1118} {"train_loss": -39.17478561401367, "global_step": 135322, "epoch": 1118} {"train_loss": -39.25859451293945, "global_step": 135323, "epoch": 1118} {"train_loss": -38.94688034057617, "global_step": 135324, "epoch": 1118} {"train_loss": -38.680213928222656, "global_step": 135325, "epoch": 1118} {"train_loss": -39.18305206298828, "global_step": 135326, "epoch": 1118} {"train_loss": -38.72188949584961, "global_step": 135327, "epoch": 1118} {"train_loss": -38.7061882019043, "global_step": 135328, "epoch": 1118} {"train_loss": -39.31917953491211, "global_step": 135329, "epoch": 1118} {"train_loss": -39.13274002075195, "global_step": 135330, "epoch": 1118} {"train_loss": -39.21757125854492, "global_step": 135331, "epoch": 1118} {"train_loss": -39.764766693115234, "global_step": 135332, "epoch": 1118} {"train_loss": -38.648040771484375, "global_step": 135333, "epoch": 1118} {"train_loss": -39.399478912353516, "global_step": 135334, "epoch": 1118} {"train_loss": -39.34560012817383, "global_step": 135335, "epoch": 1118} {"train_loss": -38.15847396850586, "global_step": 135336, "epoch": 1118} {"train_loss": -39.15423583984375, "global_step": 135337, "epoch": 1118} {"train_loss": -38.70085906982422, "global_step": 135338, "epoch": 1118} {"train_loss": -39.886695861816406, "global_step": 135339, "epoch": 1118} {"train_loss": -39.691246032714844, "global_step": 135340, "epoch": 1118} {"train_loss": -39.46552658081055, "global_step": 135341, "epoch": 1118} {"train_loss": -39.59234619140625, "global_step": 135342, "epoch": 1118} {"train_loss": -39.51851272583008, "global_step": 135343, "epoch": 1118} {"train_loss": -39.74949264526367, "global_step": 135344, "epoch": 1118} {"train_loss": -39.175533294677734, "global_step": 135345, "epoch": 1118} {"train_loss": -39.151123046875, "global_step": 135346, "epoch": 1118} {"train_loss": -39.85161590576172, "global_step": 135347, "epoch": 1118} {"train_loss": -39.73426055908203, "global_step": 135348, "epoch": 1118} {"train_loss": -39.906856536865234, "global_step": 135349, "epoch": 1118} {"train_loss": -39.38155746459961, "global_step": 135350, "epoch": 1118} {"train_loss": -38.839935302734375, "global_step": 135351, "epoch": 1118} {"train_loss": -39.7864875793457, "global_step": 135352, "epoch": 1118} {"train_loss": -38.95112228393555, "global_step": 135353, "epoch": 1118} {"train_loss": -39.6694221496582, "global_step": 135354, "epoch": 1118} {"train_loss": -38.85770034790039, "global_step": 135355, "epoch": 1118} {"train_loss": -38.674442291259766, "global_step": 135356, "epoch": 1118} {"train_loss": -38.42494583129883, "global_step": 135357, "epoch": 1118} {"train_loss": -35.50081253051758, "global_step": 135358, "epoch": 1118} {"train_loss": -31.985671997070312, "global_step": 135359, "epoch": 1118} {"train_loss": -29.266469955444336, "global_step": 135360, "epoch": 1118} {"train_loss": -35.28339767456055, "global_step": 135361, "epoch": 1118} {"train_loss": -39.74140167236328, "global_step": 135362, "epoch": 1118} {"train_loss": -33.6965446472168, "global_step": 135363, "epoch": 1118} {"train_loss": -34.98287582397461, "global_step": 135364, "epoch": 1118} {"train_loss": -39.65464401245117, "global_step": 135365, "epoch": 1118} {"train_loss": -34.47732162475586, "global_step": 135366, "epoch": 1118} {"train_loss": -37.33608627319336, "global_step": 135367, "epoch": 1118} {"train_loss": -37.57175827026367, "global_step": 135368, "epoch": 1118} {"train_loss": -36.870765686035156, "global_step": 135369, "epoch": 1118} {"train_loss": -38.35085678100586, "global_step": 135370, "epoch": 1118} {"train_loss": -37.75616455078125, "global_step": 135371, "epoch": 1118} {"train_loss": -38.438228607177734, "global_step": 135372, "epoch": 1118} {"train_loss": -38.034297943115234, "global_step": 135373, "epoch": 1118} {"train_loss": -38.32257843017578, "global_step": 135374, "epoch": 1118} {"train_loss": -37.827484130859375, "global_step": 135375, "epoch": 1118} {"train_loss": -38.98915481567383, "global_step": 135376, "epoch": 1118} {"train_loss": -37.9875373840332, "global_step": 135377, "epoch": 1118} {"train_loss": -39.11174392700195, "global_step": 135378, "epoch": 1118} {"train_loss": -39.21769332885742, "global_step": 135379, "epoch": 1118} {"train_loss": -38.74089050292969, "global_step": 135380, "epoch": 1118} {"train_loss": -38.66971969604492, "global_step": 135381, "epoch": 1118} {"train_loss": -39.0463981628418, "global_step": 135382, "epoch": 1118} {"train_loss": -39.139373779296875, "global_step": 135383, "epoch": 1118} {"train_loss": -39.359859466552734, "global_step": 135384, "epoch": 1118} {"train_loss": -40.01166534423828, "global_step": 135385, "epoch": 1118} {"train_loss": -39.12910079956055, "global_step": 135386, "epoch": 1118} {"train_loss": -39.14481735229492, "global_step": 135387, "epoch": 1118} {"train_loss": -38.89847946166992, "global_step": 135388, "epoch": 1118} {"train_loss": -38.49165725708008, "global_step": 135389, "epoch": 1118} {"train_loss": -38.78733444213867, "global_step": 135390, "epoch": 1118} {"train_loss": -39.468833923339844, "global_step": 135391, "epoch": 1118} {"train_loss": -39.544822692871094, "global_step": 135392, "epoch": 1118} {"train_loss": -39.465118408203125, "global_step": 135393, "epoch": 1118} {"train_loss": -39.03731918334961, "global_step": 135394, "epoch": 1118} {"train_loss": -39.85032272338867, "global_step": 135395, "epoch": 1118} {"train_loss": -39.180355072021484, "global_step": 135396, "epoch": 1118} {"train_loss": -39.67689895629883, "global_step": 135397, "epoch": 1118} {"train_loss": -38.449258362951355, "global_step": 135398, "epoch": 1118, "val_loss": 2636109.75} {"train_loss": -39.3079833984375, "global_step": 135399, "epoch": 1119} {"train_loss": -39.39253616333008, "global_step": 135400, "epoch": 1119} {"train_loss": -39.68955993652344, "global_step": 135401, "epoch": 1119} {"train_loss": -39.800750732421875, "global_step": 135402, "epoch": 1119} {"train_loss": -39.6767578125, "global_step": 135403, "epoch": 1119} {"train_loss": -39.182716369628906, "global_step": 135404, "epoch": 1119} {"train_loss": -39.76350402832031, "global_step": 135405, "epoch": 1119} {"train_loss": -38.49225616455078, "global_step": 135406, "epoch": 1119} {"train_loss": -37.1659049987793, "global_step": 135407, "epoch": 1119} {"train_loss": -34.01179885864258, "global_step": 135408, "epoch": 1119} {"train_loss": -26.600934982299805, "global_step": 135409, "epoch": 1119} {"train_loss": -27.27505874633789, "global_step": 135410, "epoch": 1119} {"train_loss": -37.49547576904297, "global_step": 135411, "epoch": 1119} {"train_loss": -34.27027130126953, "global_step": 135412, "epoch": 1119} {"train_loss": -33.4317512512207, "global_step": 135413, "epoch": 1119} {"train_loss": -38.93617630004883, "global_step": 135414, "epoch": 1119} {"train_loss": -33.8162956237793, "global_step": 135415, "epoch": 1119} {"train_loss": -38.84487533569336, "global_step": 135416, "epoch": 1119} {"train_loss": -36.549922943115234, "global_step": 135417, "epoch": 1119} {"train_loss": -38.0937385559082, "global_step": 135418, "epoch": 1119} {"train_loss": -37.5797004699707, "global_step": 135419, "epoch": 1119} {"train_loss": -37.392250061035156, "global_step": 135420, "epoch": 1119} {"train_loss": -37.6643180847168, "global_step": 135421, "epoch": 1119} {"train_loss": -38.3166618347168, "global_step": 135422, "epoch": 1119} {"train_loss": -37.903968811035156, "global_step": 135423, "epoch": 1119} {"train_loss": -37.970184326171875, "global_step": 135424, "epoch": 1119} {"train_loss": -37.49649429321289, "global_step": 135425, "epoch": 1119} {"train_loss": -38.831146240234375, "global_step": 135426, "epoch": 1119} {"train_loss": -38.381107330322266, "global_step": 135427, "epoch": 1119} {"train_loss": -38.5520133972168, "global_step": 135428, "epoch": 1119} {"train_loss": -38.82633590698242, "global_step": 135429, "epoch": 1119} {"train_loss": -38.98583984375, "global_step": 135430, "epoch": 1119} {"train_loss": -38.88411331176758, "global_step": 135431, "epoch": 1119} {"train_loss": -39.052650451660156, "global_step": 135432, "epoch": 1119} {"train_loss": -39.20475387573242, "global_step": 135433, "epoch": 1119} {"train_loss": -39.77574157714844, "global_step": 135434, "epoch": 1119} {"train_loss": -38.536190032958984, "global_step": 135435, "epoch": 1119} {"train_loss": -38.91463088989258, "global_step": 135436, "epoch": 1119} {"train_loss": -38.7774772644043, "global_step": 135437, "epoch": 1119} {"train_loss": -39.75551223754883, "global_step": 135438, "epoch": 1119} {"train_loss": -38.76030349731445, "global_step": 135439, "epoch": 1119} {"train_loss": -38.66626739501953, "global_step": 135440, "epoch": 1119} {"train_loss": -39.283294677734375, "global_step": 135441, "epoch": 1119} {"train_loss": -39.34135818481445, "global_step": 135442, "epoch": 1119} {"train_loss": -38.95249557495117, "global_step": 135443, "epoch": 1119} {"train_loss": -38.80064010620117, "global_step": 135444, "epoch": 1119} {"train_loss": -38.85620880126953, "global_step": 135445, "epoch": 1119} {"train_loss": -39.47288131713867, "global_step": 135446, "epoch": 1119} {"train_loss": -39.50205612182617, "global_step": 135447, "epoch": 1119} {"train_loss": -38.914119720458984, "global_step": 135448, "epoch": 1119} {"train_loss": -40.03083419799805, "global_step": 135449, "epoch": 1119} {"train_loss": -39.13996124267578, "global_step": 135450, "epoch": 1119} {"train_loss": -39.4810905456543, "global_step": 135451, "epoch": 1119} {"train_loss": -40.04854202270508, "global_step": 135452, "epoch": 1119} {"train_loss": -39.58429718017578, "global_step": 135453, "epoch": 1119} {"train_loss": -39.531394958496094, "global_step": 135454, "epoch": 1119} {"train_loss": -40.1343879699707, "global_step": 135455, "epoch": 1119} {"train_loss": -39.999542236328125, "global_step": 135456, "epoch": 1119} {"train_loss": -39.430110931396484, "global_step": 135457, "epoch": 1119} {"train_loss": -40.03992462158203, "global_step": 135458, "epoch": 1119} {"train_loss": -40.02171325683594, "global_step": 135459, "epoch": 1119} {"train_loss": -39.693092346191406, "global_step": 135460, "epoch": 1119} {"train_loss": -39.53612518310547, "global_step": 135461, "epoch": 1119} {"train_loss": -39.835140228271484, "global_step": 135462, "epoch": 1119} {"train_loss": -39.93354797363281, "global_step": 135463, "epoch": 1119} {"train_loss": -40.00094223022461, "global_step": 135464, "epoch": 1119} {"train_loss": -39.91714096069336, "global_step": 135465, "epoch": 1119} {"train_loss": -38.9908447265625, "global_step": 135466, "epoch": 1119} {"train_loss": -40.289634704589844, "global_step": 135467, "epoch": 1119} {"train_loss": -39.865966796875, "global_step": 135468, "epoch": 1119} {"train_loss": -40.24631881713867, "global_step": 135469, "epoch": 1119} {"train_loss": -39.76653289794922, "global_step": 135470, "epoch": 1119} {"train_loss": -40.57857894897461, "global_step": 135471, "epoch": 1119} {"train_loss": -39.13427734375, "global_step": 135472, "epoch": 1119} {"train_loss": -38.52803039550781, "global_step": 135473, "epoch": 1119} {"train_loss": -39.6381721496582, "global_step": 135474, "epoch": 1119} {"train_loss": -40.07363510131836, "global_step": 135475, "epoch": 1119} {"train_loss": -39.28677749633789, "global_step": 135476, "epoch": 1119} {"train_loss": -39.0821418762207, "global_step": 135477, "epoch": 1119} {"train_loss": -38.721797943115234, "global_step": 135478, "epoch": 1119} {"train_loss": -40.22939682006836, "global_step": 135479, "epoch": 1119} {"train_loss": -39.35588073730469, "global_step": 135480, "epoch": 1119} {"train_loss": -40.15876388549805, "global_step": 135481, "epoch": 1119} {"train_loss": -39.79829025268555, "global_step": 135482, "epoch": 1119} {"train_loss": -40.06296920776367, "global_step": 135483, "epoch": 1119} {"train_loss": -39.76065444946289, "global_step": 135484, "epoch": 1119} {"train_loss": -40.13174819946289, "global_step": 135485, "epoch": 1119} {"train_loss": -40.415924072265625, "global_step": 135486, "epoch": 1119} {"train_loss": -40.39011764526367, "global_step": 135487, "epoch": 1119} {"train_loss": -40.494319915771484, "global_step": 135488, "epoch": 1119} {"train_loss": -40.30167770385742, "global_step": 135489, "epoch": 1119} {"train_loss": -39.92435836791992, "global_step": 135490, "epoch": 1119} {"train_loss": -39.752723693847656, "global_step": 135491, "epoch": 1119} {"train_loss": -40.25850296020508, "global_step": 135492, "epoch": 1119} {"train_loss": -40.230133056640625, "global_step": 135493, "epoch": 1119} {"train_loss": -40.346290588378906, "global_step": 135494, "epoch": 1119} {"train_loss": -40.47749710083008, "global_step": 135495, "epoch": 1119} {"train_loss": -40.084197998046875, "global_step": 135496, "epoch": 1119} {"train_loss": -40.05231475830078, "global_step": 135497, "epoch": 1119} {"train_loss": -39.539180755615234, "global_step": 135498, "epoch": 1119} {"train_loss": -39.85433578491211, "global_step": 135499, "epoch": 1119} {"train_loss": -40.176353454589844, "global_step": 135500, "epoch": 1119} {"train_loss": -40.39802169799805, "global_step": 135501, "epoch": 1119} {"train_loss": -40.30083084106445, "global_step": 135502, "epoch": 1119} {"train_loss": -40.464725494384766, "global_step": 135503, "epoch": 1119} {"train_loss": -40.531917572021484, "global_step": 135504, "epoch": 1119} {"train_loss": -39.926265716552734, "global_step": 135505, "epoch": 1119} {"train_loss": -39.69782257080078, "global_step": 135506, "epoch": 1119} {"train_loss": -39.749977111816406, "global_step": 135507, "epoch": 1119} {"train_loss": -39.953975677490234, "global_step": 135508, "epoch": 1119} {"train_loss": -40.0157585144043, "global_step": 135509, "epoch": 1119} {"train_loss": -39.513710021972656, "global_step": 135510, "epoch": 1119} {"train_loss": -38.6729850769043, "global_step": 135511, "epoch": 1119} {"train_loss": -39.7650146484375, "global_step": 135512, "epoch": 1119} {"train_loss": -39.101051330566406, "global_step": 135513, "epoch": 1119} {"train_loss": -39.364166259765625, "global_step": 135514, "epoch": 1119} {"train_loss": -38.08126449584961, "global_step": 135515, "epoch": 1119} {"train_loss": -38.3590202331543, "global_step": 135516, "epoch": 1119} {"train_loss": -38.95219802856445, "global_step": 135517, "epoch": 1119} {"train_loss": -38.596004486083984, "global_step": 135518, "epoch": 1119} {"train_loss": -38.98566126232305, "global_step": 135519, "epoch": 1119, "val_loss": 2715167.75} {"train_loss": -39.02576446533203, "global_step": 135520, "epoch": 1120} {"train_loss": -38.449398040771484, "global_step": 135521, "epoch": 1120} {"train_loss": -40.49176025390625, "global_step": 135522, "epoch": 1120} {"train_loss": -39.65167999267578, "global_step": 135523, "epoch": 1120} {"train_loss": -38.87763214111328, "global_step": 135524, "epoch": 1120} {"train_loss": -39.995826721191406, "global_step": 135525, "epoch": 1120} {"train_loss": -39.951515197753906, "global_step": 135526, "epoch": 1120} {"train_loss": -39.93518829345703, "global_step": 135527, "epoch": 1120} {"train_loss": -40.14911651611328, "global_step": 135528, "epoch": 1120} {"train_loss": -39.67237091064453, "global_step": 135529, "epoch": 1120} {"train_loss": -39.400421142578125, "global_step": 135530, "epoch": 1120} {"train_loss": -40.35979080200195, "global_step": 135531, "epoch": 1120} {"train_loss": -39.98626708984375, "global_step": 135532, "epoch": 1120} {"train_loss": -40.30415344238281, "global_step": 135533, "epoch": 1120} {"train_loss": -39.97157287597656, "global_step": 135534, "epoch": 1120} {"train_loss": -40.662261962890625, "global_step": 135535, "epoch": 1120} {"train_loss": -40.81059265136719, "global_step": 135536, "epoch": 1120} {"train_loss": -40.59051513671875, "global_step": 135537, "epoch": 1120} {"train_loss": -39.991817474365234, "global_step": 135538, "epoch": 1120} {"train_loss": -40.44541931152344, "global_step": 135539, "epoch": 1120} {"train_loss": -40.00446701049805, "global_step": 135540, "epoch": 1120} {"train_loss": -40.38752365112305, "global_step": 135541, "epoch": 1120} {"train_loss": -40.21340560913086, "global_step": 135542, "epoch": 1120} {"train_loss": -40.44637680053711, "global_step": 135543, "epoch": 1120} {"train_loss": -39.92324447631836, "global_step": 135544, "epoch": 1120} {"train_loss": -39.37893295288086, "global_step": 135545, "epoch": 1120} {"train_loss": -39.52875518798828, "global_step": 135546, "epoch": 1120} {"train_loss": -39.784149169921875, "global_step": 135547, "epoch": 1120} {"train_loss": -40.40125274658203, "global_step": 135548, "epoch": 1120} {"train_loss": -38.832027435302734, "global_step": 135549, "epoch": 1120} {"train_loss": -39.13614273071289, "global_step": 135550, "epoch": 1120} {"train_loss": -38.51099395751953, "global_step": 135551, "epoch": 1120} {"train_loss": -37.71413040161133, "global_step": 135552, "epoch": 1120} {"train_loss": -38.3796501159668, "global_step": 135553, "epoch": 1120} {"train_loss": -39.69332504272461, "global_step": 135554, "epoch": 1120} {"train_loss": -40.31595993041992, "global_step": 135555, "epoch": 1120} {"train_loss": -40.21266555786133, "global_step": 135556, "epoch": 1120} {"train_loss": -40.294795989990234, "global_step": 135557, "epoch": 1120} {"train_loss": -40.16545486450195, "global_step": 135558, "epoch": 1120} {"train_loss": -39.75202560424805, "global_step": 135559, "epoch": 1120} {"train_loss": -40.3752326965332, "global_step": 135560, "epoch": 1120} {"train_loss": -40.19342803955078, "global_step": 135561, "epoch": 1120} {"train_loss": -39.54940414428711, "global_step": 135562, "epoch": 1120} {"train_loss": -40.56934356689453, "global_step": 135563, "epoch": 1120} {"train_loss": -40.21162414550781, "global_step": 135564, "epoch": 1120} {"train_loss": -40.44755172729492, "global_step": 135565, "epoch": 1120} {"train_loss": -39.582977294921875, "global_step": 135566, "epoch": 1120} {"train_loss": -39.341251373291016, "global_step": 135567, "epoch": 1120} {"train_loss": -39.47646713256836, "global_step": 135568, "epoch": 1120} {"train_loss": -40.77248001098633, "global_step": 135569, "epoch": 1120} {"train_loss": -40.250789642333984, "global_step": 135570, "epoch": 1120} {"train_loss": -40.012786865234375, "global_step": 135571, "epoch": 1120} {"train_loss": -40.04179763793945, "global_step": 135572, "epoch": 1120} {"train_loss": -40.569454193115234, "global_step": 135573, "epoch": 1120} {"train_loss": -40.53339767456055, "global_step": 135574, "epoch": 1120} {"train_loss": -40.56398010253906, "global_step": 135575, "epoch": 1120} {"train_loss": -39.869991302490234, "global_step": 135576, "epoch": 1120} {"train_loss": -40.47499465942383, "global_step": 135577, "epoch": 1120} {"train_loss": -40.51997756958008, "global_step": 135578, "epoch": 1120} {"train_loss": -40.16969680786133, "global_step": 135579, "epoch": 1120} {"train_loss": -39.874446868896484, "global_step": 135580, "epoch": 1120} {"train_loss": -40.10140609741211, "global_step": 135581, "epoch": 1120} {"train_loss": -39.4376335144043, "global_step": 135582, "epoch": 1120} {"train_loss": -38.95915985107422, "global_step": 135583, "epoch": 1120} {"train_loss": -38.664485931396484, "global_step": 135584, "epoch": 1120} {"train_loss": -39.30289840698242, "global_step": 135585, "epoch": 1120} {"train_loss": -38.896236419677734, "global_step": 135586, "epoch": 1120} {"train_loss": -40.102088928222656, "global_step": 135587, "epoch": 1120} {"train_loss": -40.13799285888672, "global_step": 135588, "epoch": 1120} {"train_loss": -39.108245849609375, "global_step": 135589, "epoch": 1120} {"train_loss": -39.24824905395508, "global_step": 135590, "epoch": 1120} {"train_loss": -40.04972457885742, "global_step": 135591, "epoch": 1120} {"train_loss": -40.4224739074707, "global_step": 135592, "epoch": 1120} {"train_loss": -38.801605224609375, "global_step": 135593, "epoch": 1120} {"train_loss": -38.074989318847656, "global_step": 135594, "epoch": 1120} {"train_loss": -39.70083236694336, "global_step": 135595, "epoch": 1120} {"train_loss": -39.22290802001953, "global_step": 135596, "epoch": 1120} {"train_loss": -39.00908279418945, "global_step": 135597, "epoch": 1120} {"train_loss": -39.428192138671875, "global_step": 135598, "epoch": 1120} {"train_loss": -39.92353057861328, "global_step": 135599, "epoch": 1120} {"train_loss": -39.413753509521484, "global_step": 135600, "epoch": 1120} {"train_loss": -38.78745651245117, "global_step": 135601, "epoch": 1120} {"train_loss": -38.978050231933594, "global_step": 135602, "epoch": 1120} {"train_loss": -38.80939865112305, "global_step": 135603, "epoch": 1120} {"train_loss": -39.12743377685547, "global_step": 135604, "epoch": 1120} {"train_loss": -39.257205963134766, "global_step": 135605, "epoch": 1120} {"train_loss": -38.527748107910156, "global_step": 135606, "epoch": 1120} {"train_loss": -39.73670196533203, "global_step": 135607, "epoch": 1120} {"train_loss": -39.74917221069336, "global_step": 135608, "epoch": 1120} {"train_loss": -38.200557708740234, "global_step": 135609, "epoch": 1120} {"train_loss": -39.46990966796875, "global_step": 135610, "epoch": 1120} {"train_loss": -39.40394592285156, "global_step": 135611, "epoch": 1120} {"train_loss": -38.90389633178711, "global_step": 135612, "epoch": 1120} {"train_loss": -37.174556732177734, "global_step": 135613, "epoch": 1120} {"train_loss": -39.010318756103516, "global_step": 135614, "epoch": 1120} {"train_loss": -39.29801559448242, "global_step": 135615, "epoch": 1120} {"train_loss": -37.3215217590332, "global_step": 135616, "epoch": 1120} {"train_loss": -39.15781784057617, "global_step": 135617, "epoch": 1120} {"train_loss": -38.53798294067383, "global_step": 135618, "epoch": 1120} {"train_loss": -39.7994384765625, "global_step": 135619, "epoch": 1120} {"train_loss": -38.77665328979492, "global_step": 135620, "epoch": 1120} {"train_loss": -39.242225646972656, "global_step": 135621, "epoch": 1120} {"train_loss": -37.642738342285156, "global_step": 135622, "epoch": 1120} {"train_loss": -38.82986068725586, "global_step": 135623, "epoch": 1120} {"train_loss": -39.40448760986328, "global_step": 135624, "epoch": 1120} {"train_loss": -38.86141586303711, "global_step": 135625, "epoch": 1120} {"train_loss": -40.30219268798828, "global_step": 135626, "epoch": 1120} {"train_loss": -38.47068405151367, "global_step": 135627, "epoch": 1120} {"train_loss": -40.05727767944336, "global_step": 135628, "epoch": 1120} {"train_loss": -39.068580627441406, "global_step": 135629, "epoch": 1120} {"train_loss": -39.632110595703125, "global_step": 135630, "epoch": 1120} {"train_loss": -39.2359619140625, "global_step": 135631, "epoch": 1120} {"train_loss": -39.699623107910156, "global_step": 135632, "epoch": 1120} {"train_loss": -39.99592208862305, "global_step": 135633, "epoch": 1120} {"train_loss": -39.35847091674805, "global_step": 135634, "epoch": 1120} {"train_loss": -39.712921142578125, "global_step": 135635, "epoch": 1120} {"train_loss": -39.887508392333984, "global_step": 135636, "epoch": 1120} {"train_loss": -39.660343170166016, "global_step": 135637, "epoch": 1120} {"train_loss": -39.862239837646484, "global_step": 135638, "epoch": 1120} {"train_loss": -39.83879852294922, "global_step": 135639, "epoch": 1120} {"train_loss": -39.58756230882377, "global_step": 135640, "epoch": 1120, "val_loss": 2672234.75} {"train_loss": -39.7088623046875, "global_step": 135641, "epoch": 1121} {"train_loss": -39.745601654052734, "global_step": 135642, "epoch": 1121} {"train_loss": -40.49882507324219, "global_step": 135643, "epoch": 1121} {"train_loss": -39.24444580078125, "global_step": 135644, "epoch": 1121} {"train_loss": -39.943660736083984, "global_step": 135645, "epoch": 1121} {"train_loss": -40.009273529052734, "global_step": 135646, "epoch": 1121} {"train_loss": -40.27477264404297, "global_step": 135647, "epoch": 1121} {"train_loss": -39.7120246887207, "global_step": 135648, "epoch": 1121} {"train_loss": -40.13291549682617, "global_step": 135649, "epoch": 1121} {"train_loss": -40.183128356933594, "global_step": 135650, "epoch": 1121} {"train_loss": -38.83075714111328, "global_step": 135651, "epoch": 1121} {"train_loss": -39.92466735839844, "global_step": 135652, "epoch": 1121} {"train_loss": -40.71881103515625, "global_step": 135653, "epoch": 1121} {"train_loss": -40.33417892456055, "global_step": 135654, "epoch": 1121} {"train_loss": -39.75374984741211, "global_step": 135655, "epoch": 1121} {"train_loss": -40.0972785949707, "global_step": 135656, "epoch": 1121} {"train_loss": -39.78173065185547, "global_step": 135657, "epoch": 1121} {"train_loss": -39.957828521728516, "global_step": 135658, "epoch": 1121} {"train_loss": -38.78919219970703, "global_step": 135659, "epoch": 1121} {"train_loss": -39.77338790893555, "global_step": 135660, "epoch": 1121} {"train_loss": -39.30428695678711, "global_step": 135661, "epoch": 1121} {"train_loss": -38.1611442565918, "global_step": 135662, "epoch": 1121} {"train_loss": -37.55992889404297, "global_step": 135663, "epoch": 1121} {"train_loss": -26.709211349487305, "global_step": 135664, "epoch": 1121} {"train_loss": -36.2188835144043, "global_step": 135665, "epoch": 1121} {"train_loss": -36.425209045410156, "global_step": 135666, "epoch": 1121} {"train_loss": -34.12070846557617, "global_step": 135667, "epoch": 1121} {"train_loss": -36.02802276611328, "global_step": 135668, "epoch": 1121} {"train_loss": -36.47443771362305, "global_step": 135669, "epoch": 1121} {"train_loss": -38.20487594604492, "global_step": 135670, "epoch": 1121} {"train_loss": -37.40857696533203, "global_step": 135671, "epoch": 1121} {"train_loss": -38.5546989440918, "global_step": 135672, "epoch": 1121} {"train_loss": -38.59296798706055, "global_step": 135673, "epoch": 1121} {"train_loss": -38.1771354675293, "global_step": 135674, "epoch": 1121} {"train_loss": -36.59579849243164, "global_step": 135675, "epoch": 1121} {"train_loss": -30.66366958618164, "global_step": 135676, "epoch": 1121} {"train_loss": -37.85479736328125, "global_step": 135677, "epoch": 1121} {"train_loss": -32.989681243896484, "global_step": 135678, "epoch": 1121} {"train_loss": -35.83730697631836, "global_step": 135679, "epoch": 1121} {"train_loss": -36.807552337646484, "global_step": 135680, "epoch": 1121} {"train_loss": -35.2733039855957, "global_step": 135681, "epoch": 1121} {"train_loss": -20.22243881225586, "global_step": 135682, "epoch": 1121} {"train_loss": -34.41277313232422, "global_step": 135683, "epoch": 1121} {"train_loss": -35.940547943115234, "global_step": 135684, "epoch": 1121} {"train_loss": -19.836811065673828, "global_step": 135685, "epoch": 1121} {"train_loss": -26.864187240600586, "global_step": 135686, "epoch": 1121} {"train_loss": -34.14624786376953, "global_step": 135687, "epoch": 1121} {"train_loss": -28.178668975830078, "global_step": 135688, "epoch": 1121} {"train_loss": -35.055328369140625, "global_step": 135689, "epoch": 1121} {"train_loss": -35.19249725341797, "global_step": 135690, "epoch": 1121} {"train_loss": -29.363794326782227, "global_step": 135691, "epoch": 1121} {"train_loss": -28.883935928344727, "global_step": 135692, "epoch": 1121} {"train_loss": -30.394392013549805, "global_step": 135693, "epoch": 1121} {"train_loss": -32.099063873291016, "global_step": 135694, "epoch": 1121} {"train_loss": -34.81721115112305, "global_step": 135695, "epoch": 1121} {"train_loss": -33.603450775146484, "global_step": 135696, "epoch": 1121} {"train_loss": -32.865535736083984, "global_step": 135697, "epoch": 1121} {"train_loss": -34.64460372924805, "global_step": 135698, "epoch": 1121} {"train_loss": -34.72802734375, "global_step": 135699, "epoch": 1121} {"train_loss": -36.165279388427734, "global_step": 135700, "epoch": 1121} {"train_loss": -31.803674697875977, "global_step": 135701, "epoch": 1121} {"train_loss": -33.27119827270508, "global_step": 135702, "epoch": 1121} {"train_loss": -32.70754623413086, "global_step": 135703, "epoch": 1121} {"train_loss": -36.20962142944336, "global_step": 135704, "epoch": 1121} {"train_loss": -36.5322380065918, "global_step": 135705, "epoch": 1121} {"train_loss": -35.75331497192383, "global_step": 135706, "epoch": 1121} {"train_loss": -36.798885345458984, "global_step": 135707, "epoch": 1121} {"train_loss": -36.316558837890625, "global_step": 135708, "epoch": 1121} {"train_loss": -36.957515716552734, "global_step": 135709, "epoch": 1121} {"train_loss": -34.17803955078125, "global_step": 135710, "epoch": 1121} {"train_loss": -34.697444915771484, "global_step": 135711, "epoch": 1121} {"train_loss": -37.155635833740234, "global_step": 135712, "epoch": 1121} {"train_loss": -36.5891227722168, "global_step": 135713, "epoch": 1121} {"train_loss": -37.2152214050293, "global_step": 135714, "epoch": 1121} {"train_loss": -37.39052963256836, "global_step": 135715, "epoch": 1121} {"train_loss": -35.9150276184082, "global_step": 135716, "epoch": 1121} {"train_loss": -37.465087890625, "global_step": 135717, "epoch": 1121} {"train_loss": -37.18490982055664, "global_step": 135718, "epoch": 1121} {"train_loss": -37.30622100830078, "global_step": 135719, "epoch": 1121} {"train_loss": -37.305110931396484, "global_step": 135720, "epoch": 1121} {"train_loss": -37.95090866088867, "global_step": 135721, "epoch": 1121} {"train_loss": -37.55222702026367, "global_step": 135722, "epoch": 1121} {"train_loss": -37.893619537353516, "global_step": 135723, "epoch": 1121} {"train_loss": -37.38969802856445, "global_step": 135724, "epoch": 1121} {"train_loss": -37.044158935546875, "global_step": 135725, "epoch": 1121} {"train_loss": -37.453643798828125, "global_step": 135726, "epoch": 1121} {"train_loss": -37.6575927734375, "global_step": 135727, "epoch": 1121} {"train_loss": -37.57305908203125, "global_step": 135728, "epoch": 1121} {"train_loss": -38.186946868896484, "global_step": 135729, "epoch": 1121} {"train_loss": -37.464813232421875, "global_step": 135730, "epoch": 1121} {"train_loss": -37.72995376586914, "global_step": 135731, "epoch": 1121} {"train_loss": -37.95357131958008, "global_step": 135732, "epoch": 1121} {"train_loss": -37.1380729675293, "global_step": 135733, "epoch": 1121} {"train_loss": -38.61379623413086, "global_step": 135734, "epoch": 1121} {"train_loss": -37.924198150634766, "global_step": 135735, "epoch": 1121} {"train_loss": -38.14858627319336, "global_step": 135736, "epoch": 1121} {"train_loss": -38.7801628112793, "global_step": 135737, "epoch": 1121} {"train_loss": -37.86627960205078, "global_step": 135738, "epoch": 1121} {"train_loss": -38.573726654052734, "global_step": 135739, "epoch": 1121} {"train_loss": -38.51905059814453, "global_step": 135740, "epoch": 1121} {"train_loss": -37.76125717163086, "global_step": 135741, "epoch": 1121} {"train_loss": -37.07780456542969, "global_step": 135742, "epoch": 1121} {"train_loss": -37.85206985473633, "global_step": 135743, "epoch": 1121} {"train_loss": -38.71314239501953, "global_step": 135744, "epoch": 1121} {"train_loss": -37.99608612060547, "global_step": 135745, "epoch": 1121} {"train_loss": -38.83738708496094, "global_step": 135746, "epoch": 1121} {"train_loss": -38.511024475097656, "global_step": 135747, "epoch": 1121} {"train_loss": -38.73469924926758, "global_step": 135748, "epoch": 1121} {"train_loss": -37.92489242553711, "global_step": 135749, "epoch": 1121} {"train_loss": -37.76616668701172, "global_step": 135750, "epoch": 1121} {"train_loss": -38.42845916748047, "global_step": 135751, "epoch": 1121} {"train_loss": -38.489498138427734, "global_step": 135752, "epoch": 1121} {"train_loss": -38.95096206665039, "global_step": 135753, "epoch": 1121} {"train_loss": -38.38999557495117, "global_step": 135754, "epoch": 1121} {"train_loss": -38.45684814453125, "global_step": 135755, "epoch": 1121} {"train_loss": -38.20881271362305, "global_step": 135756, "epoch": 1121} {"train_loss": -38.739810943603516, "global_step": 135757, "epoch": 1121} {"train_loss": -38.79718017578125, "global_step": 135758, "epoch": 1121} {"train_loss": -38.8413200378418, "global_step": 135759, "epoch": 1121} {"train_loss": -38.582759857177734, "global_step": 135760, "epoch": 1121} {"train_loss": -36.65489171556205, "global_step": 135761, "epoch": 1121, "val_loss": 2642462.25} {"train_loss": -39.56101608276367, "global_step": 135762, "epoch": 1122} {"train_loss": -38.83585739135742, "global_step": 135763, "epoch": 1122} {"train_loss": -39.26314163208008, "global_step": 135764, "epoch": 1122} {"train_loss": -39.11248779296875, "global_step": 135765, "epoch": 1122} {"train_loss": -38.329689025878906, "global_step": 135766, "epoch": 1122} {"train_loss": -39.77333450317383, "global_step": 135767, "epoch": 1122} {"train_loss": -38.1085319519043, "global_step": 135768, "epoch": 1122} {"train_loss": -39.161312103271484, "global_step": 135769, "epoch": 1122} {"train_loss": -39.04537582397461, "global_step": 135770, "epoch": 1122} {"train_loss": -38.85100173950195, "global_step": 135771, "epoch": 1122} {"train_loss": -39.55641555786133, "global_step": 135772, "epoch": 1122} {"train_loss": -39.35882568359375, "global_step": 135773, "epoch": 1122} {"train_loss": -39.424102783203125, "global_step": 135774, "epoch": 1122} {"train_loss": -39.79227828979492, "global_step": 135775, "epoch": 1122} {"train_loss": -39.16811752319336, "global_step": 135776, "epoch": 1122} {"train_loss": -39.38861846923828, "global_step": 135777, "epoch": 1122} {"train_loss": -39.381446838378906, "global_step": 135778, "epoch": 1122} {"train_loss": -39.585479736328125, "global_step": 135779, "epoch": 1122} {"train_loss": -39.44049835205078, "global_step": 135780, "epoch": 1122} {"train_loss": -39.709938049316406, "global_step": 135781, "epoch": 1122} {"train_loss": -39.82892608642578, "global_step": 135782, "epoch": 1122} {"train_loss": -39.597084045410156, "global_step": 135783, "epoch": 1122} {"train_loss": -39.22600173950195, "global_step": 135784, "epoch": 1122} {"train_loss": -39.370845794677734, "global_step": 135785, "epoch": 1122} {"train_loss": -39.88823318481445, "global_step": 135786, "epoch": 1122} {"train_loss": -40.262081146240234, "global_step": 135787, "epoch": 1122} {"train_loss": -39.79506301879883, "global_step": 135788, "epoch": 1122} {"train_loss": -40.02471160888672, "global_step": 135789, "epoch": 1122} {"train_loss": -40.04860305786133, "global_step": 135790, "epoch": 1122} {"train_loss": -40.307525634765625, "global_step": 135791, "epoch": 1122} {"train_loss": -39.77942657470703, "global_step": 135792, "epoch": 1122} {"train_loss": -39.8852424621582, "global_step": 135793, "epoch": 1122} {"train_loss": -39.21964645385742, "global_step": 135794, "epoch": 1122} {"train_loss": -40.165401458740234, "global_step": 135795, "epoch": 1122} {"train_loss": -40.252376556396484, "global_step": 135796, "epoch": 1122} {"train_loss": -39.8375244140625, "global_step": 135797, "epoch": 1122} {"train_loss": -39.971580505371094, "global_step": 135798, "epoch": 1122} {"train_loss": -39.504974365234375, "global_step": 135799, "epoch": 1122} {"train_loss": -39.938079833984375, "global_step": 135800, "epoch": 1122} {"train_loss": -40.2602653503418, "global_step": 135801, "epoch": 1122} {"train_loss": -39.81936264038086, "global_step": 135802, "epoch": 1122} {"train_loss": -39.673583984375, "global_step": 135803, "epoch": 1122} {"train_loss": -39.094486236572266, "global_step": 135804, "epoch": 1122} {"train_loss": -40.000213623046875, "global_step": 135805, "epoch": 1122} {"train_loss": -39.18900680541992, "global_step": 135806, "epoch": 1122} {"train_loss": -38.649105072021484, "global_step": 135807, "epoch": 1122} {"train_loss": -39.23834991455078, "global_step": 135808, "epoch": 1122} {"train_loss": -39.32301712036133, "global_step": 135809, "epoch": 1122} {"train_loss": -39.95301055908203, "global_step": 135810, "epoch": 1122} {"train_loss": -40.22503662109375, "global_step": 135811, "epoch": 1122} {"train_loss": -39.4755973815918, "global_step": 135812, "epoch": 1122} {"train_loss": -39.417415618896484, "global_step": 135813, "epoch": 1122} {"train_loss": -39.11784744262695, "global_step": 135814, "epoch": 1122} {"train_loss": -39.43568420410156, "global_step": 135815, "epoch": 1122} {"train_loss": -36.90609359741211, "global_step": 135816, "epoch": 1122} {"train_loss": -37.128936767578125, "global_step": 135817, "epoch": 1122} {"train_loss": -38.567684173583984, "global_step": 135818, "epoch": 1122} {"train_loss": -38.23788070678711, "global_step": 135819, "epoch": 1122} {"train_loss": -39.209712982177734, "global_step": 135820, "epoch": 1122} {"train_loss": -38.19192123413086, "global_step": 135821, "epoch": 1122} {"train_loss": -39.70484161376953, "global_step": 135822, "epoch": 1122} {"train_loss": -38.29582214355469, "global_step": 135823, "epoch": 1122} {"train_loss": -36.94655990600586, "global_step": 135824, "epoch": 1122} {"train_loss": -39.61243438720703, "global_step": 135825, "epoch": 1122} {"train_loss": -35.966041564941406, "global_step": 135826, "epoch": 1122} {"train_loss": -39.031524658203125, "global_step": 135827, "epoch": 1122} {"train_loss": -38.114837646484375, "global_step": 135828, "epoch": 1122} {"train_loss": -38.887428283691406, "global_step": 135829, "epoch": 1122} {"train_loss": -38.19753646850586, "global_step": 135830, "epoch": 1122} {"train_loss": -38.413291931152344, "global_step": 135831, "epoch": 1122} {"train_loss": -36.33323287963867, "global_step": 135832, "epoch": 1122} {"train_loss": -38.356170654296875, "global_step": 135833, "epoch": 1122} {"train_loss": -37.876895904541016, "global_step": 135834, "epoch": 1122} {"train_loss": -38.13113784790039, "global_step": 135835, "epoch": 1122} {"train_loss": -38.65430450439453, "global_step": 135836, "epoch": 1122} {"train_loss": -37.96733474731445, "global_step": 135837, "epoch": 1122} {"train_loss": -37.54804992675781, "global_step": 135838, "epoch": 1122} {"train_loss": -36.88645553588867, "global_step": 135839, "epoch": 1122} {"train_loss": -38.150177001953125, "global_step": 135840, "epoch": 1122} {"train_loss": -38.3836784362793, "global_step": 135841, "epoch": 1122} {"train_loss": -39.356998443603516, "global_step": 135842, "epoch": 1122} {"train_loss": -39.02399826049805, "global_step": 135843, "epoch": 1122} {"train_loss": -39.62971115112305, "global_step": 135844, "epoch": 1122} {"train_loss": -39.05232620239258, "global_step": 135845, "epoch": 1122} {"train_loss": -39.23262023925781, "global_step": 135846, "epoch": 1122} {"train_loss": -40.2044792175293, "global_step": 135847, "epoch": 1122} {"train_loss": -39.76963424682617, "global_step": 135848, "epoch": 1122} {"train_loss": -39.38004684448242, "global_step": 135849, "epoch": 1122} {"train_loss": -39.7109375, "global_step": 135850, "epoch": 1122} {"train_loss": -39.81298065185547, "global_step": 135851, "epoch": 1122} {"train_loss": -39.383384704589844, "global_step": 135852, "epoch": 1122} {"train_loss": -39.67722702026367, "global_step": 135853, "epoch": 1122} {"train_loss": -39.478485107421875, "global_step": 135854, "epoch": 1122} {"train_loss": -39.726497650146484, "global_step": 135855, "epoch": 1122} {"train_loss": -39.703529357910156, "global_step": 135856, "epoch": 1122} {"train_loss": -39.912715911865234, "global_step": 135857, "epoch": 1122} {"train_loss": -39.0199089050293, "global_step": 135858, "epoch": 1122} {"train_loss": -40.103797912597656, "global_step": 135859, "epoch": 1122} {"train_loss": -40.265682220458984, "global_step": 135860, "epoch": 1122} {"train_loss": -39.88064193725586, "global_step": 135861, "epoch": 1122} {"train_loss": -40.307308197021484, "global_step": 135862, "epoch": 1122} {"train_loss": -39.937843322753906, "global_step": 135863, "epoch": 1122} {"train_loss": -40.04379653930664, "global_step": 135864, "epoch": 1122} {"train_loss": -39.66935348510742, "global_step": 135865, "epoch": 1122} {"train_loss": -39.7659912109375, "global_step": 135866, "epoch": 1122} {"train_loss": -39.15446090698242, "global_step": 135867, "epoch": 1122} {"train_loss": -39.64594268798828, "global_step": 135868, "epoch": 1122} {"train_loss": -38.8309440612793, "global_step": 135869, "epoch": 1122} {"train_loss": -39.68561553955078, "global_step": 135870, "epoch": 1122} {"train_loss": -40.05446243286133, "global_step": 135871, "epoch": 1122} {"train_loss": -39.30802536010742, "global_step": 135872, "epoch": 1122} {"train_loss": -39.744102478027344, "global_step": 135873, "epoch": 1122} {"train_loss": -40.26504135131836, "global_step": 135874, "epoch": 1122} {"train_loss": -39.694271087646484, "global_step": 135875, "epoch": 1122} {"train_loss": -39.49650573730469, "global_step": 135876, "epoch": 1122} {"train_loss": -39.70522689819336, "global_step": 135877, "epoch": 1122} {"train_loss": -40.59489059448242, "global_step": 135878, "epoch": 1122} {"train_loss": -40.11943054199219, "global_step": 135879, "epoch": 1122} {"train_loss": -39.934200286865234, "global_step": 135880, "epoch": 1122} {"train_loss": -40.228111267089844, "global_step": 135881, "epoch": 1122} {"train_loss": -39.28415307919841, "global_step": 135882, "epoch": 1122, "val_loss": 2649900.25} {"train_loss": -40.2939338684082, "global_step": 135883, "epoch": 1123} {"train_loss": -40.06976318359375, "global_step": 135884, "epoch": 1123} {"train_loss": -39.06319046020508, "global_step": 135885, "epoch": 1123} {"train_loss": -38.25176239013672, "global_step": 135886, "epoch": 1123} {"train_loss": -39.65995407104492, "global_step": 135887, "epoch": 1123} {"train_loss": -39.959815979003906, "global_step": 135888, "epoch": 1123} {"train_loss": -39.013282775878906, "global_step": 135889, "epoch": 1123} {"train_loss": -39.118282318115234, "global_step": 135890, "epoch": 1123} {"train_loss": -39.77518844604492, "global_step": 135891, "epoch": 1123} {"train_loss": -38.995849609375, "global_step": 135892, "epoch": 1123} {"train_loss": -35.46955490112305, "global_step": 135893, "epoch": 1123} {"train_loss": -32.7069206237793, "global_step": 135894, "epoch": 1123} {"train_loss": -29.30828857421875, "global_step": 135895, "epoch": 1123} {"train_loss": -33.14094924926758, "global_step": 135896, "epoch": 1123} {"train_loss": -38.34450149536133, "global_step": 135897, "epoch": 1123} {"train_loss": -37.0671501159668, "global_step": 135898, "epoch": 1123} {"train_loss": -34.68946075439453, "global_step": 135899, "epoch": 1123} {"train_loss": -38.58331298828125, "global_step": 135900, "epoch": 1123} {"train_loss": -38.018306732177734, "global_step": 135901, "epoch": 1123} {"train_loss": -35.38324737548828, "global_step": 135902, "epoch": 1123} {"train_loss": -39.01346206665039, "global_step": 135903, "epoch": 1123} {"train_loss": -38.56074905395508, "global_step": 135904, "epoch": 1123} {"train_loss": -38.826683044433594, "global_step": 135905, "epoch": 1123} {"train_loss": -39.03284454345703, "global_step": 135906, "epoch": 1123} {"train_loss": -39.403236389160156, "global_step": 135907, "epoch": 1123} {"train_loss": -39.39970397949219, "global_step": 135908, "epoch": 1123} {"train_loss": -39.775787353515625, "global_step": 135909, "epoch": 1123} {"train_loss": -39.24365234375, "global_step": 135910, "epoch": 1123} {"train_loss": -39.92282485961914, "global_step": 135911, "epoch": 1123} {"train_loss": -39.605098724365234, "global_step": 135912, "epoch": 1123} {"train_loss": -39.42658996582031, "global_step": 135913, "epoch": 1123} {"train_loss": -38.74674606323242, "global_step": 135914, "epoch": 1123} {"train_loss": -39.90397262573242, "global_step": 135915, "epoch": 1123} {"train_loss": -38.89535140991211, "global_step": 135916, "epoch": 1123} {"train_loss": -39.64753341674805, "global_step": 135917, "epoch": 1123} {"train_loss": -39.69191360473633, "global_step": 135918, "epoch": 1123} {"train_loss": -39.747947692871094, "global_step": 135919, "epoch": 1123} {"train_loss": -39.8547477722168, "global_step": 135920, "epoch": 1123} {"train_loss": -39.91240310668945, "global_step": 135921, "epoch": 1123} {"train_loss": -40.31819534301758, "global_step": 135922, "epoch": 1123} {"train_loss": -39.365779876708984, "global_step": 135923, "epoch": 1123} {"train_loss": -39.822940826416016, "global_step": 135924, "epoch": 1123} {"train_loss": -38.148014068603516, "global_step": 135925, "epoch": 1123} {"train_loss": -40.3414192199707, "global_step": 135926, "epoch": 1123} {"train_loss": -39.57969284057617, "global_step": 135927, "epoch": 1123} {"train_loss": -39.914337158203125, "global_step": 135928, "epoch": 1123} {"train_loss": -39.68547821044922, "global_step": 135929, "epoch": 1123} {"train_loss": -39.710994720458984, "global_step": 135930, "epoch": 1123} {"train_loss": -39.56199264526367, "global_step": 135931, "epoch": 1123} {"train_loss": -37.71518325805664, "global_step": 135932, "epoch": 1123} {"train_loss": -38.851165771484375, "global_step": 135933, "epoch": 1123} {"train_loss": -39.567996978759766, "global_step": 135934, "epoch": 1123} {"train_loss": -34.61170196533203, "global_step": 135935, "epoch": 1123} {"train_loss": -39.20310592651367, "global_step": 135936, "epoch": 1123} {"train_loss": -40.10834884643555, "global_step": 135937, "epoch": 1123} {"train_loss": -39.846004486083984, "global_step": 135938, "epoch": 1123} {"train_loss": -38.91222381591797, "global_step": 135939, "epoch": 1123} {"train_loss": -39.5448112487793, "global_step": 135940, "epoch": 1123} {"train_loss": -39.85582733154297, "global_step": 135941, "epoch": 1123} {"train_loss": -38.925899505615234, "global_step": 135942, "epoch": 1123} {"train_loss": -37.12468338012695, "global_step": 135943, "epoch": 1123} {"train_loss": -39.7386589050293, "global_step": 135944, "epoch": 1123} {"train_loss": -39.31118392944336, "global_step": 135945, "epoch": 1123} {"train_loss": -39.59016799926758, "global_step": 135946, "epoch": 1123} {"train_loss": -39.51528549194336, "global_step": 135947, "epoch": 1123} {"train_loss": -39.516605377197266, "global_step": 135948, "epoch": 1123} {"train_loss": -39.771949768066406, "global_step": 135949, "epoch": 1123} {"train_loss": -39.096073150634766, "global_step": 135950, "epoch": 1123} {"train_loss": -40.19072723388672, "global_step": 135951, "epoch": 1123} {"train_loss": -37.76076889038086, "global_step": 135952, "epoch": 1123} {"train_loss": -39.97146987915039, "global_step": 135953, "epoch": 1123} {"train_loss": -39.511070251464844, "global_step": 135954, "epoch": 1123} {"train_loss": -40.42918395996094, "global_step": 135955, "epoch": 1123} {"train_loss": -38.66926193237305, "global_step": 135956, "epoch": 1123} {"train_loss": -35.289920806884766, "global_step": 135957, "epoch": 1123} {"train_loss": -37.7914924621582, "global_step": 135958, "epoch": 1123} {"train_loss": -40.51919174194336, "global_step": 135959, "epoch": 1123} {"train_loss": -39.58256912231445, "global_step": 135960, "epoch": 1123} {"train_loss": -40.11436080932617, "global_step": 135961, "epoch": 1123} {"train_loss": -40.24276351928711, "global_step": 135962, "epoch": 1123} {"train_loss": -38.47645950317383, "global_step": 135963, "epoch": 1123} {"train_loss": -40.085506439208984, "global_step": 135964, "epoch": 1123} {"train_loss": -39.7132568359375, "global_step": 135965, "epoch": 1123} {"train_loss": -39.23066329956055, "global_step": 135966, "epoch": 1123} {"train_loss": -39.76062774658203, "global_step": 135967, "epoch": 1123} {"train_loss": -37.382564544677734, "global_step": 135968, "epoch": 1123} {"train_loss": -39.13692092895508, "global_step": 135969, "epoch": 1123} {"train_loss": -39.806129455566406, "global_step": 135970, "epoch": 1123} {"train_loss": -39.96821594238281, "global_step": 135971, "epoch": 1123} {"train_loss": -39.242549896240234, "global_step": 135972, "epoch": 1123} {"train_loss": -39.785552978515625, "global_step": 135973, "epoch": 1123} {"train_loss": -39.40358352661133, "global_step": 135974, "epoch": 1123} {"train_loss": -36.0882682800293, "global_step": 135975, "epoch": 1123} {"train_loss": -39.89634323120117, "global_step": 135976, "epoch": 1123} {"train_loss": -38.638404846191406, "global_step": 135977, "epoch": 1123} {"train_loss": -39.06870651245117, "global_step": 135978, "epoch": 1123} {"train_loss": -38.395912170410156, "global_step": 135979, "epoch": 1123} {"train_loss": -39.04590606689453, "global_step": 135980, "epoch": 1123} {"train_loss": -37.61389923095703, "global_step": 135981, "epoch": 1123} {"train_loss": -37.98750686645508, "global_step": 135982, "epoch": 1123} {"train_loss": -39.34210968017578, "global_step": 135983, "epoch": 1123} {"train_loss": -39.41686248779297, "global_step": 135984, "epoch": 1123} {"train_loss": -38.51929473876953, "global_step": 135985, "epoch": 1123} {"train_loss": -37.70089340209961, "global_step": 135986, "epoch": 1123} {"train_loss": -37.68007278442383, "global_step": 135987, "epoch": 1123} {"train_loss": -37.06806182861328, "global_step": 135988, "epoch": 1123} {"train_loss": -37.898193359375, "global_step": 135989, "epoch": 1123} {"train_loss": -38.941951751708984, "global_step": 135990, "epoch": 1123} {"train_loss": -27.089506149291992, "global_step": 135991, "epoch": 1123} {"train_loss": -36.86567306518555, "global_step": 135992, "epoch": 1123} {"train_loss": -36.46114730834961, "global_step": 135993, "epoch": 1123} {"train_loss": -39.26374435424805, "global_step": 135994, "epoch": 1123} {"train_loss": -38.47256088256836, "global_step": 135995, "epoch": 1123} {"train_loss": -38.845306396484375, "global_step": 135996, "epoch": 1123} {"train_loss": -38.79966735839844, "global_step": 135997, "epoch": 1123} {"train_loss": -38.43034744262695, "global_step": 135998, "epoch": 1123} {"train_loss": -37.860042572021484, "global_step": 135999, "epoch": 1123} {"train_loss": -36.19795608520508, "global_step": 136000, "epoch": 1123} {"train_loss": -38.95045852661133, "global_step": 136001, "epoch": 1123} {"train_loss": -38.754188537597656, "global_step": 136002, "epoch": 1123} {"train_loss": -38.614811085472425, "global_step": 136003, "epoch": 1123, "val_loss": 2942566.75} {"train_loss": -37.28770065307617, "global_step": 136004, "epoch": 1124} {"train_loss": -38.09564208984375, "global_step": 136005, "epoch": 1124} {"train_loss": -37.664344787597656, "global_step": 136006, "epoch": 1124} {"train_loss": -39.19365310668945, "global_step": 136007, "epoch": 1124} {"train_loss": -38.876976013183594, "global_step": 136008, "epoch": 1124} {"train_loss": -38.72532272338867, "global_step": 136009, "epoch": 1124} {"train_loss": -39.08057403564453, "global_step": 136010, "epoch": 1124} {"train_loss": -38.627105712890625, "global_step": 136011, "epoch": 1124} {"train_loss": -39.62126159667969, "global_step": 136012, "epoch": 1124} {"train_loss": -38.947628021240234, "global_step": 136013, "epoch": 1124} {"train_loss": -39.68000411987305, "global_step": 136014, "epoch": 1124} {"train_loss": -39.04271697998047, "global_step": 136015, "epoch": 1124} {"train_loss": -38.242637634277344, "global_step": 136016, "epoch": 1124} {"train_loss": -38.91964340209961, "global_step": 136017, "epoch": 1124} {"train_loss": -37.28208541870117, "global_step": 136018, "epoch": 1124} {"train_loss": -39.66078567504883, "global_step": 136019, "epoch": 1124} {"train_loss": -38.73114776611328, "global_step": 136020, "epoch": 1124} {"train_loss": -39.25015640258789, "global_step": 136021, "epoch": 1124} {"train_loss": -40.091064453125, "global_step": 136022, "epoch": 1124} {"train_loss": -39.44131088256836, "global_step": 136023, "epoch": 1124} {"train_loss": -39.50994873046875, "global_step": 136024, "epoch": 1124} {"train_loss": -38.73609161376953, "global_step": 136025, "epoch": 1124} {"train_loss": -39.20232009887695, "global_step": 136026, "epoch": 1124} {"train_loss": -39.79243469238281, "global_step": 136027, "epoch": 1124} {"train_loss": -39.549415588378906, "global_step": 136028, "epoch": 1124} {"train_loss": -39.55327224731445, "global_step": 136029, "epoch": 1124} {"train_loss": -39.57082748413086, "global_step": 136030, "epoch": 1124} {"train_loss": -38.326595306396484, "global_step": 136031, "epoch": 1124} {"train_loss": -38.44186019897461, "global_step": 136032, "epoch": 1124} {"train_loss": -39.53015899658203, "global_step": 136033, "epoch": 1124} {"train_loss": -39.79099655151367, "global_step": 136034, "epoch": 1124} {"train_loss": -39.782875061035156, "global_step": 136035, "epoch": 1124} {"train_loss": -39.52541732788086, "global_step": 136036, "epoch": 1124} {"train_loss": -34.471717834472656, "global_step": 136037, "epoch": 1124} {"train_loss": -39.98900604248047, "global_step": 136038, "epoch": 1124} {"train_loss": -39.113521575927734, "global_step": 136039, "epoch": 1124} {"train_loss": -39.19889450073242, "global_step": 136040, "epoch": 1124} {"train_loss": -38.824317932128906, "global_step": 136041, "epoch": 1124} {"train_loss": -38.838043212890625, "global_step": 136042, "epoch": 1124} {"train_loss": -40.081478118896484, "global_step": 136043, "epoch": 1124} {"train_loss": -39.78069305419922, "global_step": 136044, "epoch": 1124} {"train_loss": -40.35231399536133, "global_step": 136045, "epoch": 1124} {"train_loss": -40.056697845458984, "global_step": 136046, "epoch": 1124} {"train_loss": -39.63228988647461, "global_step": 136047, "epoch": 1124} {"train_loss": -40.326263427734375, "global_step": 136048, "epoch": 1124} {"train_loss": -39.60600280761719, "global_step": 136049, "epoch": 1124} {"train_loss": -40.24026870727539, "global_step": 136050, "epoch": 1124} {"train_loss": -39.7823600769043, "global_step": 136051, "epoch": 1124} {"train_loss": -39.37376022338867, "global_step": 136052, "epoch": 1124} {"train_loss": -39.14510726928711, "global_step": 136053, "epoch": 1124} {"train_loss": -38.60906982421875, "global_step": 136054, "epoch": 1124} {"train_loss": -39.662471771240234, "global_step": 136055, "epoch": 1124} {"train_loss": -38.997955322265625, "global_step": 136056, "epoch": 1124} {"train_loss": -37.51406478881836, "global_step": 136057, "epoch": 1124} {"train_loss": -38.623966217041016, "global_step": 136058, "epoch": 1124} {"train_loss": -39.73409652709961, "global_step": 136059, "epoch": 1124} {"train_loss": -39.0636100769043, "global_step": 136060, "epoch": 1124} {"train_loss": -38.9239616394043, "global_step": 136061, "epoch": 1124} {"train_loss": -39.5108642578125, "global_step": 136062, "epoch": 1124} {"train_loss": -39.85408020019531, "global_step": 136063, "epoch": 1124} {"train_loss": -38.951683044433594, "global_step": 136064, "epoch": 1124} {"train_loss": -39.80589294433594, "global_step": 136065, "epoch": 1124} {"train_loss": -39.8271598815918, "global_step": 136066, "epoch": 1124} {"train_loss": -39.8206901550293, "global_step": 136067, "epoch": 1124} {"train_loss": -38.943660736083984, "global_step": 136068, "epoch": 1124} {"train_loss": -39.90808868408203, "global_step": 136069, "epoch": 1124} {"train_loss": -39.873104095458984, "global_step": 136070, "epoch": 1124} {"train_loss": -39.09263229370117, "global_step": 136071, "epoch": 1124} {"train_loss": -38.81239318847656, "global_step": 136072, "epoch": 1124} {"train_loss": -38.808387756347656, "global_step": 136073, "epoch": 1124} {"train_loss": -40.10449981689453, "global_step": 136074, "epoch": 1124} {"train_loss": -38.960060119628906, "global_step": 136075, "epoch": 1124} {"train_loss": -39.34785079956055, "global_step": 136076, "epoch": 1124} {"train_loss": -39.585716247558594, "global_step": 136077, "epoch": 1124} {"train_loss": -39.66805648803711, "global_step": 136078, "epoch": 1124} {"train_loss": -40.15822982788086, "global_step": 136079, "epoch": 1124} {"train_loss": -39.6925163269043, "global_step": 136080, "epoch": 1124} {"train_loss": -39.275123596191406, "global_step": 136081, "epoch": 1124} {"train_loss": -39.81877517700195, "global_step": 136082, "epoch": 1124} {"train_loss": -40.009395599365234, "global_step": 136083, "epoch": 1124} {"train_loss": -38.58041000366211, "global_step": 136084, "epoch": 1124} {"train_loss": -40.36894607543945, "global_step": 136085, "epoch": 1124} {"train_loss": -39.466129302978516, "global_step": 136086, "epoch": 1124} {"train_loss": -39.687198638916016, "global_step": 136087, "epoch": 1124} {"train_loss": -39.464820861816406, "global_step": 136088, "epoch": 1124} {"train_loss": -39.90800857543945, "global_step": 136089, "epoch": 1124} {"train_loss": -39.35420608520508, "global_step": 136090, "epoch": 1124} {"train_loss": -38.062591552734375, "global_step": 136091, "epoch": 1124} {"train_loss": -37.514190673828125, "global_step": 136092, "epoch": 1124} {"train_loss": -38.02224349975586, "global_step": 136093, "epoch": 1124} {"train_loss": -39.38640213012695, "global_step": 136094, "epoch": 1124} {"train_loss": -39.07748031616211, "global_step": 136095, "epoch": 1124} {"train_loss": -39.51521682739258, "global_step": 136096, "epoch": 1124} {"train_loss": -37.95469665527344, "global_step": 136097, "epoch": 1124} {"train_loss": -38.917842864990234, "global_step": 136098, "epoch": 1124} {"train_loss": -39.8798828125, "global_step": 136099, "epoch": 1124} {"train_loss": -39.15426254272461, "global_step": 136100, "epoch": 1124} {"train_loss": -39.838924407958984, "global_step": 136101, "epoch": 1124} {"train_loss": -38.82988357543945, "global_step": 136102, "epoch": 1124} {"train_loss": -39.665565490722656, "global_step": 136103, "epoch": 1124} {"train_loss": -38.165313720703125, "global_step": 136104, "epoch": 1124} {"train_loss": -39.08559036254883, "global_step": 136105, "epoch": 1124} {"train_loss": -39.271942138671875, "global_step": 136106, "epoch": 1124} {"train_loss": -39.16780471801758, "global_step": 136107, "epoch": 1124} {"train_loss": -39.57063674926758, "global_step": 136108, "epoch": 1124} {"train_loss": -39.43110275268555, "global_step": 136109, "epoch": 1124} {"train_loss": -39.80949783325195, "global_step": 136110, "epoch": 1124} {"train_loss": -34.20095443725586, "global_step": 136111, "epoch": 1124} {"train_loss": -38.4732666015625, "global_step": 136112, "epoch": 1124} {"train_loss": -38.45223617553711, "global_step": 136113, "epoch": 1124} {"train_loss": -39.34111404418945, "global_step": 136114, "epoch": 1124} {"train_loss": -36.573116302490234, "global_step": 136115, "epoch": 1124} {"train_loss": -39.39304733276367, "global_step": 136116, "epoch": 1124} {"train_loss": -35.4510498046875, "global_step": 136117, "epoch": 1124} {"train_loss": -38.46879959106445, "global_step": 136118, "epoch": 1124} {"train_loss": -39.04868698120117, "global_step": 136119, "epoch": 1124} {"train_loss": -37.52443313598633, "global_step": 136120, "epoch": 1124} {"train_loss": -38.525516510009766, "global_step": 136121, "epoch": 1124} {"train_loss": -39.44232940673828, "global_step": 136122, "epoch": 1124} {"train_loss": -39.68715286254883, "global_step": 136123, "epoch": 1124} {"train_loss": -39.076167051457176, "global_step": 136124, "epoch": 1124, "val_loss": 2911975.25} {"train_loss": -39.51607131958008, "global_step": 136125, "epoch": 1125} {"train_loss": -36.79037094116211, "global_step": 136126, "epoch": 1125} {"train_loss": -38.95964431762695, "global_step": 136127, "epoch": 1125} {"train_loss": -37.852943420410156, "global_step": 136128, "epoch": 1125} {"train_loss": -38.8878173828125, "global_step": 136129, "epoch": 1125} {"train_loss": -37.542274475097656, "global_step": 136130, "epoch": 1125} {"train_loss": -40.10378646850586, "global_step": 136131, "epoch": 1125} {"train_loss": -39.217647552490234, "global_step": 136132, "epoch": 1125} {"train_loss": -36.712501525878906, "global_step": 136133, "epoch": 1125} {"train_loss": -38.32239532470703, "global_step": 136134, "epoch": 1125} {"train_loss": -39.69175338745117, "global_step": 136135, "epoch": 1125} {"train_loss": -38.652732849121094, "global_step": 136136, "epoch": 1125} {"train_loss": -37.69133377075195, "global_step": 136137, "epoch": 1125} {"train_loss": -38.983619689941406, "global_step": 136138, "epoch": 1125} {"train_loss": -39.48924255371094, "global_step": 136139, "epoch": 1125} {"train_loss": -39.93205642700195, "global_step": 136140, "epoch": 1125} {"train_loss": -39.453643798828125, "global_step": 136141, "epoch": 1125} {"train_loss": -39.2617073059082, "global_step": 136142, "epoch": 1125} {"train_loss": -39.08673095703125, "global_step": 136143, "epoch": 1125} {"train_loss": -38.211578369140625, "global_step": 136144, "epoch": 1125} {"train_loss": -38.65546798706055, "global_step": 136145, "epoch": 1125} {"train_loss": -39.4698600769043, "global_step": 136146, "epoch": 1125} {"train_loss": -38.60595703125, "global_step": 136147, "epoch": 1125} {"train_loss": -38.52578353881836, "global_step": 136148, "epoch": 1125} {"train_loss": -37.36288833618164, "global_step": 136149, "epoch": 1125} {"train_loss": -38.8364143371582, "global_step": 136150, "epoch": 1125} {"train_loss": -35.716243743896484, "global_step": 136151, "epoch": 1125} {"train_loss": -39.1347541809082, "global_step": 136152, "epoch": 1125} {"train_loss": -39.95612335205078, "global_step": 136153, "epoch": 1125} {"train_loss": -37.73210144042969, "global_step": 136154, "epoch": 1125} {"train_loss": -38.53486251831055, "global_step": 136155, "epoch": 1125} {"train_loss": -37.44056701660156, "global_step": 136156, "epoch": 1125} {"train_loss": -38.072288513183594, "global_step": 136157, "epoch": 1125} {"train_loss": -38.6718864440918, "global_step": 136158, "epoch": 1125} {"train_loss": -38.43299102783203, "global_step": 136159, "epoch": 1125} {"train_loss": -39.6044807434082, "global_step": 136160, "epoch": 1125} {"train_loss": -39.129329681396484, "global_step": 136161, "epoch": 1125} {"train_loss": -39.07849884033203, "global_step": 136162, "epoch": 1125} {"train_loss": -39.376407623291016, "global_step": 136163, "epoch": 1125} {"train_loss": -38.58198928833008, "global_step": 136164, "epoch": 1125} {"train_loss": -39.25835037231445, "global_step": 136165, "epoch": 1125} {"train_loss": -39.17254638671875, "global_step": 136166, "epoch": 1125} {"train_loss": -38.81233215332031, "global_step": 136167, "epoch": 1125} {"train_loss": -38.83489990234375, "global_step": 136168, "epoch": 1125} {"train_loss": -38.39998245239258, "global_step": 136169, "epoch": 1125} {"train_loss": -39.566078186035156, "global_step": 136170, "epoch": 1125} {"train_loss": -39.30295944213867, "global_step": 136171, "epoch": 1125} {"train_loss": -39.52616500854492, "global_step": 136172, "epoch": 1125} {"train_loss": -39.56050491333008, "global_step": 136173, "epoch": 1125} {"train_loss": -40.13320541381836, "global_step": 136174, "epoch": 1125} {"train_loss": -39.46282958984375, "global_step": 136175, "epoch": 1125} {"train_loss": -39.704891204833984, "global_step": 136176, "epoch": 1125} {"train_loss": -39.838680267333984, "global_step": 136177, "epoch": 1125} {"train_loss": -39.53945541381836, "global_step": 136178, "epoch": 1125} {"train_loss": -39.217159271240234, "global_step": 136179, "epoch": 1125} {"train_loss": -39.214996337890625, "global_step": 136180, "epoch": 1125} {"train_loss": -35.24531173706055, "global_step": 136181, "epoch": 1125} {"train_loss": -39.5262451171875, "global_step": 136182, "epoch": 1125} {"train_loss": -38.05926513671875, "global_step": 136183, "epoch": 1125} {"train_loss": -38.01333236694336, "global_step": 136184, "epoch": 1125} {"train_loss": -39.92682647705078, "global_step": 136185, "epoch": 1125} {"train_loss": -39.327392578125, "global_step": 136186, "epoch": 1125} {"train_loss": -39.281593322753906, "global_step": 136187, "epoch": 1125} {"train_loss": -38.573448181152344, "global_step": 136188, "epoch": 1125} {"train_loss": -39.005592346191406, "global_step": 136189, "epoch": 1125} {"train_loss": -39.96110916137695, "global_step": 136190, "epoch": 1125} {"train_loss": -39.328773498535156, "global_step": 136191, "epoch": 1125} {"train_loss": -39.47428512573242, "global_step": 136192, "epoch": 1125} {"train_loss": -38.59990310668945, "global_step": 136193, "epoch": 1125} {"train_loss": -40.127052307128906, "global_step": 136194, "epoch": 1125} {"train_loss": -39.59400177001953, "global_step": 136195, "epoch": 1125} {"train_loss": -40.34517288208008, "global_step": 136196, "epoch": 1125} {"train_loss": -40.04850387573242, "global_step": 136197, "epoch": 1125} {"train_loss": -40.18335723876953, "global_step": 136198, "epoch": 1125} {"train_loss": -39.96354293823242, "global_step": 136199, "epoch": 1125} {"train_loss": -40.21052932739258, "global_step": 136200, "epoch": 1125} {"train_loss": -39.850074768066406, "global_step": 136201, "epoch": 1125} {"train_loss": -40.16547775268555, "global_step": 136202, "epoch": 1125} {"train_loss": -40.016639709472656, "global_step": 136203, "epoch": 1125} {"train_loss": -39.685699462890625, "global_step": 136204, "epoch": 1125} {"train_loss": -40.11992263793945, "global_step": 136205, "epoch": 1125} {"train_loss": -39.6965446472168, "global_step": 136206, "epoch": 1125} {"train_loss": -39.780418395996094, "global_step": 136207, "epoch": 1125} {"train_loss": -39.15753936767578, "global_step": 136208, "epoch": 1125} {"train_loss": -38.971839904785156, "global_step": 136209, "epoch": 1125} {"train_loss": -39.63328170776367, "global_step": 136210, "epoch": 1125} {"train_loss": -40.47328567504883, "global_step": 136211, "epoch": 1125} {"train_loss": -39.54747772216797, "global_step": 136212, "epoch": 1125} {"train_loss": -39.30173873901367, "global_step": 136213, "epoch": 1125} {"train_loss": -40.08860397338867, "global_step": 136214, "epoch": 1125} {"train_loss": -39.914100646972656, "global_step": 136215, "epoch": 1125} {"train_loss": -40.32673645019531, "global_step": 136216, "epoch": 1125} {"train_loss": -40.4587516784668, "global_step": 136217, "epoch": 1125} {"train_loss": -39.83486557006836, "global_step": 136218, "epoch": 1125} {"train_loss": -39.98775863647461, "global_step": 136219, "epoch": 1125} {"train_loss": -40.059600830078125, "global_step": 136220, "epoch": 1125} {"train_loss": -40.60415267944336, "global_step": 136221, "epoch": 1125} {"train_loss": -39.626468658447266, "global_step": 136222, "epoch": 1125} {"train_loss": -39.52189254760742, "global_step": 136223, "epoch": 1125} {"train_loss": -39.124664306640625, "global_step": 136224, "epoch": 1125} {"train_loss": -39.840755462646484, "global_step": 136225, "epoch": 1125} {"train_loss": -40.733314514160156, "global_step": 136226, "epoch": 1125} {"train_loss": -40.62823486328125, "global_step": 136227, "epoch": 1125} {"train_loss": -39.514278411865234, "global_step": 136228, "epoch": 1125} {"train_loss": -39.70695877075195, "global_step": 136229, "epoch": 1125} {"train_loss": -39.462459564208984, "global_step": 136230, "epoch": 1125} {"train_loss": -38.95362091064453, "global_step": 136231, "epoch": 1125} {"train_loss": -38.55194091796875, "global_step": 136232, "epoch": 1125} {"train_loss": -39.11894607543945, "global_step": 136233, "epoch": 1125} {"train_loss": -36.93296432495117, "global_step": 136234, "epoch": 1125} {"train_loss": -37.963340759277344, "global_step": 136235, "epoch": 1125} {"train_loss": -38.66554641723633, "global_step": 136236, "epoch": 1125} {"train_loss": -33.790645599365234, "global_step": 136237, "epoch": 1125} {"train_loss": -31.726499557495117, "global_step": 136238, "epoch": 1125} {"train_loss": -36.44221115112305, "global_step": 136239, "epoch": 1125} {"train_loss": -37.75196838378906, "global_step": 136240, "epoch": 1125} {"train_loss": -38.18529510498047, "global_step": 136241, "epoch": 1125} {"train_loss": -37.180233001708984, "global_step": 136242, "epoch": 1125} {"train_loss": -38.1016731262207, "global_step": 136243, "epoch": 1125} {"train_loss": -39.31721115112305, "global_step": 136244, "epoch": 1125} {"train_loss": -38.98151859567185, "global_step": 136245, "epoch": 1125, "val_loss": 2631627.75} {"train_loss": -39.03069305419922, "global_step": 136246, "epoch": 1126} {"train_loss": -38.11292266845703, "global_step": 136247, "epoch": 1126} {"train_loss": -39.169342041015625, "global_step": 136248, "epoch": 1126} {"train_loss": -38.58753204345703, "global_step": 136249, "epoch": 1126} {"train_loss": -37.52104568481445, "global_step": 136250, "epoch": 1126} {"train_loss": -39.16575241088867, "global_step": 136251, "epoch": 1126} {"train_loss": -37.889461517333984, "global_step": 136252, "epoch": 1126} {"train_loss": -38.67546463012695, "global_step": 136253, "epoch": 1126} {"train_loss": -39.22749710083008, "global_step": 136254, "epoch": 1126} {"train_loss": -39.552547454833984, "global_step": 136255, "epoch": 1126} {"train_loss": -38.8645133972168, "global_step": 136256, "epoch": 1126} {"train_loss": -38.340431213378906, "global_step": 136257, "epoch": 1126} {"train_loss": -39.2429313659668, "global_step": 136258, "epoch": 1126} {"train_loss": -37.162574768066406, "global_step": 136259, "epoch": 1126} {"train_loss": -38.912044525146484, "global_step": 136260, "epoch": 1126} {"train_loss": -38.77775192260742, "global_step": 136261, "epoch": 1126} {"train_loss": -39.753536224365234, "global_step": 136262, "epoch": 1126} {"train_loss": -39.25364303588867, "global_step": 136263, "epoch": 1126} {"train_loss": -37.25908279418945, "global_step": 136264, "epoch": 1126} {"train_loss": -39.51288986206055, "global_step": 136265, "epoch": 1126} {"train_loss": -39.398128509521484, "global_step": 136266, "epoch": 1126} {"train_loss": -39.413108825683594, "global_step": 136267, "epoch": 1126} {"train_loss": -39.8514518737793, "global_step": 136268, "epoch": 1126} {"train_loss": -39.84463119506836, "global_step": 136269, "epoch": 1126} {"train_loss": -39.58008575439453, "global_step": 136270, "epoch": 1126} {"train_loss": -40.011810302734375, "global_step": 136271, "epoch": 1126} {"train_loss": -39.623451232910156, "global_step": 136272, "epoch": 1126} {"train_loss": -39.65171432495117, "global_step": 136273, "epoch": 1126} {"train_loss": -39.92197799682617, "global_step": 136274, "epoch": 1126} {"train_loss": -40.07515335083008, "global_step": 136275, "epoch": 1126} {"train_loss": -39.13509750366211, "global_step": 136276, "epoch": 1126} {"train_loss": -40.4106559753418, "global_step": 136277, "epoch": 1126} {"train_loss": -39.50431442260742, "global_step": 136278, "epoch": 1126} {"train_loss": -40.1373405456543, "global_step": 136279, "epoch": 1126} {"train_loss": -40.379737854003906, "global_step": 136280, "epoch": 1126} {"train_loss": -39.848995208740234, "global_step": 136281, "epoch": 1126} {"train_loss": -38.534549713134766, "global_step": 136282, "epoch": 1126} {"train_loss": -40.160945892333984, "global_step": 136283, "epoch": 1126} {"train_loss": -39.89731979370117, "global_step": 136284, "epoch": 1126} {"train_loss": -39.31965637207031, "global_step": 136285, "epoch": 1126} {"train_loss": -40.4715690612793, "global_step": 136286, "epoch": 1126} {"train_loss": -40.36229705810547, "global_step": 136287, "epoch": 1126} {"train_loss": -40.18485641479492, "global_step": 136288, "epoch": 1126} {"train_loss": -40.16303253173828, "global_step": 136289, "epoch": 1126} {"train_loss": -39.801204681396484, "global_step": 136290, "epoch": 1126} {"train_loss": -39.94649887084961, "global_step": 136291, "epoch": 1126} {"train_loss": -40.2903938293457, "global_step": 136292, "epoch": 1126} {"train_loss": -39.877498626708984, "global_step": 136293, "epoch": 1126} {"train_loss": -40.0045166015625, "global_step": 136294, "epoch": 1126} {"train_loss": -40.503238677978516, "global_step": 136295, "epoch": 1126} {"train_loss": -40.73073959350586, "global_step": 136296, "epoch": 1126} {"train_loss": -40.1863899230957, "global_step": 136297, "epoch": 1126} {"train_loss": -40.25713348388672, "global_step": 136298, "epoch": 1126} {"train_loss": -40.351070404052734, "global_step": 136299, "epoch": 1126} {"train_loss": -40.685787200927734, "global_step": 136300, "epoch": 1126} {"train_loss": -40.40779495239258, "global_step": 136301, "epoch": 1126} {"train_loss": -39.92268371582031, "global_step": 136302, "epoch": 1126} {"train_loss": -40.51498031616211, "global_step": 136303, "epoch": 1126} {"train_loss": -40.2989501953125, "global_step": 136304, "epoch": 1126} {"train_loss": -41.110198974609375, "global_step": 136305, "epoch": 1126} {"train_loss": -40.588321685791016, "global_step": 136306, "epoch": 1126} {"train_loss": -40.281890869140625, "global_step": 136307, "epoch": 1126} {"train_loss": -40.60786437988281, "global_step": 136308, "epoch": 1126} {"train_loss": -39.8144645690918, "global_step": 136309, "epoch": 1126} {"train_loss": -39.80843734741211, "global_step": 136310, "epoch": 1126} {"train_loss": -39.929256439208984, "global_step": 136311, "epoch": 1126} {"train_loss": -38.81986618041992, "global_step": 136312, "epoch": 1126} {"train_loss": -39.33414840698242, "global_step": 136313, "epoch": 1126} {"train_loss": -40.452205657958984, "global_step": 136314, "epoch": 1126} {"train_loss": -39.56694793701172, "global_step": 136315, "epoch": 1126} {"train_loss": -39.1572151184082, "global_step": 136316, "epoch": 1126} {"train_loss": -40.02223587036133, "global_step": 136317, "epoch": 1126} {"train_loss": -39.50057601928711, "global_step": 136318, "epoch": 1126} {"train_loss": -40.74640655517578, "global_step": 136319, "epoch": 1126} {"train_loss": -38.44240951538086, "global_step": 136320, "epoch": 1126} {"train_loss": -39.700775146484375, "global_step": 136321, "epoch": 1126} {"train_loss": -39.484588623046875, "global_step": 136322, "epoch": 1126} {"train_loss": -39.414772033691406, "global_step": 136323, "epoch": 1126} {"train_loss": -40.02898025512695, "global_step": 136324, "epoch": 1126} {"train_loss": -40.8062858581543, "global_step": 136325, "epoch": 1126} {"train_loss": -39.69794845581055, "global_step": 136326, "epoch": 1126} {"train_loss": -40.55778503417969, "global_step": 136327, "epoch": 1126} {"train_loss": -40.21870040893555, "global_step": 136328, "epoch": 1126} {"train_loss": -39.830047607421875, "global_step": 136329, "epoch": 1126} {"train_loss": -39.96155548095703, "global_step": 136330, "epoch": 1126} {"train_loss": -39.54856491088867, "global_step": 136331, "epoch": 1126} {"train_loss": -40.57988357543945, "global_step": 136332, "epoch": 1126} {"train_loss": -40.71126937866211, "global_step": 136333, "epoch": 1126} {"train_loss": -39.347957611083984, "global_step": 136334, "epoch": 1126} {"train_loss": -40.76478958129883, "global_step": 136335, "epoch": 1126} {"train_loss": -40.430904388427734, "global_step": 136336, "epoch": 1126} {"train_loss": -39.034698486328125, "global_step": 136337, "epoch": 1126} {"train_loss": -39.501747131347656, "global_step": 136338, "epoch": 1126} {"train_loss": -40.21711730957031, "global_step": 136339, "epoch": 1126} {"train_loss": -39.29706954956055, "global_step": 136340, "epoch": 1126} {"train_loss": -39.981178283691406, "global_step": 136341, "epoch": 1126} {"train_loss": -39.48527908325195, "global_step": 136342, "epoch": 1126} {"train_loss": -39.315467834472656, "global_step": 136343, "epoch": 1126} {"train_loss": -39.40955352783203, "global_step": 136344, "epoch": 1126} {"train_loss": -39.51729965209961, "global_step": 136345, "epoch": 1126} {"train_loss": -39.2870979309082, "global_step": 136346, "epoch": 1126} {"train_loss": -39.54833221435547, "global_step": 136347, "epoch": 1126} {"train_loss": -38.907203674316406, "global_step": 136348, "epoch": 1126} {"train_loss": -38.98232650756836, "global_step": 136349, "epoch": 1126} {"train_loss": -40.227149963378906, "global_step": 136350, "epoch": 1126} {"train_loss": -38.71410369873047, "global_step": 136351, "epoch": 1126} {"train_loss": -39.0418701171875, "global_step": 136352, "epoch": 1126} {"train_loss": -38.02463150024414, "global_step": 136353, "epoch": 1126} {"train_loss": -38.434139251708984, "global_step": 136354, "epoch": 1126} {"train_loss": -38.84828567504883, "global_step": 136355, "epoch": 1126} {"train_loss": -40.01923751831055, "global_step": 136356, "epoch": 1126} {"train_loss": -39.49277877807617, "global_step": 136357, "epoch": 1126} {"train_loss": -40.15052032470703, "global_step": 136358, "epoch": 1126} {"train_loss": -39.78680419921875, "global_step": 136359, "epoch": 1126} {"train_loss": -39.15461730957031, "global_step": 136360, "epoch": 1126} {"train_loss": -39.127891540527344, "global_step": 136361, "epoch": 1126} {"train_loss": -40.629512786865234, "global_step": 136362, "epoch": 1126} {"train_loss": -39.35887908935547, "global_step": 136363, "epoch": 1126} {"train_loss": -39.731990814208984, "global_step": 136364, "epoch": 1126} {"train_loss": -38.74262619018555, "global_step": 136365, "epoch": 1126} {"train_loss": -39.60358845103871, "global_step": 136366, "epoch": 1126, "val_loss": 2588524.0} {"train_loss": -37.92362594604492, "global_step": 136367, "epoch": 1127} {"train_loss": -38.37541198730469, "global_step": 136368, "epoch": 1127} {"train_loss": -38.90660095214844, "global_step": 136369, "epoch": 1127} {"train_loss": -37.970821380615234, "global_step": 136370, "epoch": 1127} {"train_loss": -32.5823860168457, "global_step": 136371, "epoch": 1127} {"train_loss": -37.686737060546875, "global_step": 136372, "epoch": 1127} {"train_loss": -39.20071029663086, "global_step": 136373, "epoch": 1127} {"train_loss": -38.69053649902344, "global_step": 136374, "epoch": 1127} {"train_loss": -38.27859115600586, "global_step": 136375, "epoch": 1127} {"train_loss": -39.29718017578125, "global_step": 136376, "epoch": 1127} {"train_loss": -38.521419525146484, "global_step": 136377, "epoch": 1127} {"train_loss": -39.21064758300781, "global_step": 136378, "epoch": 1127} {"train_loss": -38.57658386230469, "global_step": 136379, "epoch": 1127} {"train_loss": -38.481685638427734, "global_step": 136380, "epoch": 1127} {"train_loss": -39.01643753051758, "global_step": 136381, "epoch": 1127} {"train_loss": -38.341522216796875, "global_step": 136382, "epoch": 1127} {"train_loss": -38.82399368286133, "global_step": 136383, "epoch": 1127} {"train_loss": -38.893272399902344, "global_step": 136384, "epoch": 1127} {"train_loss": -39.19222640991211, "global_step": 136385, "epoch": 1127} {"train_loss": -38.1591796875, "global_step": 136386, "epoch": 1127} {"train_loss": -37.301570892333984, "global_step": 136387, "epoch": 1127} {"train_loss": -36.7730827331543, "global_step": 136388, "epoch": 1127} {"train_loss": -37.13318634033203, "global_step": 136389, "epoch": 1127} {"train_loss": -38.19160079956055, "global_step": 136390, "epoch": 1127} {"train_loss": -37.30703353881836, "global_step": 136391, "epoch": 1127} {"train_loss": -38.579288482666016, "global_step": 136392, "epoch": 1127} {"train_loss": -37.56226348876953, "global_step": 136393, "epoch": 1127} {"train_loss": -39.1719856262207, "global_step": 136394, "epoch": 1127} {"train_loss": -38.115665435791016, "global_step": 136395, "epoch": 1127} {"train_loss": -38.96619415283203, "global_step": 136396, "epoch": 1127} {"train_loss": -34.95566177368164, "global_step": 136397, "epoch": 1127} {"train_loss": -38.83906936645508, "global_step": 136398, "epoch": 1127} {"train_loss": -38.72233963012695, "global_step": 136399, "epoch": 1127} {"train_loss": -37.2421989440918, "global_step": 136400, "epoch": 1127} {"train_loss": -39.40245819091797, "global_step": 136401, "epoch": 1127} {"train_loss": -38.73765182495117, "global_step": 136402, "epoch": 1127} {"train_loss": -39.3392219543457, "global_step": 136403, "epoch": 1127} {"train_loss": -39.43444061279297, "global_step": 136404, "epoch": 1127} {"train_loss": -39.500240325927734, "global_step": 136405, "epoch": 1127} {"train_loss": -39.227352142333984, "global_step": 136406, "epoch": 1127} {"train_loss": -39.937469482421875, "global_step": 136407, "epoch": 1127} {"train_loss": -39.63973617553711, "global_step": 136408, "epoch": 1127} {"train_loss": -40.2519416809082, "global_step": 136409, "epoch": 1127} {"train_loss": -39.62746047973633, "global_step": 136410, "epoch": 1127} {"train_loss": -39.7418098449707, "global_step": 136411, "epoch": 1127} {"train_loss": -38.750972747802734, "global_step": 136412, "epoch": 1127} {"train_loss": -39.56647872924805, "global_step": 136413, "epoch": 1127} {"train_loss": -39.94178009033203, "global_step": 136414, "epoch": 1127} {"train_loss": -39.61867141723633, "global_step": 136415, "epoch": 1127} {"train_loss": -40.1281852722168, "global_step": 136416, "epoch": 1127} {"train_loss": -40.52651596069336, "global_step": 136417, "epoch": 1127} {"train_loss": -39.7475471496582, "global_step": 136418, "epoch": 1127} {"train_loss": -40.002254486083984, "global_step": 136419, "epoch": 1127} {"train_loss": -39.89992141723633, "global_step": 136420, "epoch": 1127} {"train_loss": -40.14483642578125, "global_step": 136421, "epoch": 1127} {"train_loss": -40.290687561035156, "global_step": 136422, "epoch": 1127} {"train_loss": -39.403499603271484, "global_step": 136423, "epoch": 1127} {"train_loss": -39.428924560546875, "global_step": 136424, "epoch": 1127} {"train_loss": -40.594154357910156, "global_step": 136425, "epoch": 1127} {"train_loss": -40.50071334838867, "global_step": 136426, "epoch": 1127} {"train_loss": -40.56818771362305, "global_step": 136427, "epoch": 1127} {"train_loss": -39.843502044677734, "global_step": 136428, "epoch": 1127} {"train_loss": -40.5214958190918, "global_step": 136429, "epoch": 1127} {"train_loss": -40.1899299621582, "global_step": 136430, "epoch": 1127} {"train_loss": -40.565574645996094, "global_step": 136431, "epoch": 1127} {"train_loss": -40.22164535522461, "global_step": 136432, "epoch": 1127} {"train_loss": -39.857078552246094, "global_step": 136433, "epoch": 1127} {"train_loss": -39.35763931274414, "global_step": 136434, "epoch": 1127} {"train_loss": -40.46991729736328, "global_step": 136435, "epoch": 1127} {"train_loss": -40.53800582885742, "global_step": 136436, "epoch": 1127} {"train_loss": -40.49199676513672, "global_step": 136437, "epoch": 1127} {"train_loss": -40.565670013427734, "global_step": 136438, "epoch": 1127} {"train_loss": -39.42423629760742, "global_step": 136439, "epoch": 1127} {"train_loss": -39.70848846435547, "global_step": 136440, "epoch": 1127} {"train_loss": -39.97027587890625, "global_step": 136441, "epoch": 1127} {"train_loss": -40.54189682006836, "global_step": 136442, "epoch": 1127} {"train_loss": -38.834320068359375, "global_step": 136443, "epoch": 1127} {"train_loss": -40.2880973815918, "global_step": 136444, "epoch": 1127} {"train_loss": -40.556396484375, "global_step": 136445, "epoch": 1127} {"train_loss": -39.575286865234375, "global_step": 136446, "epoch": 1127} {"train_loss": -40.52742385864258, "global_step": 136447, "epoch": 1127} {"train_loss": -39.7830696105957, "global_step": 136448, "epoch": 1127} {"train_loss": -40.45595932006836, "global_step": 136449, "epoch": 1127} {"train_loss": -39.88974380493164, "global_step": 136450, "epoch": 1127} {"train_loss": -39.82086944580078, "global_step": 136451, "epoch": 1127} {"train_loss": -39.54729080200195, "global_step": 136452, "epoch": 1127} {"train_loss": -38.819480895996094, "global_step": 136453, "epoch": 1127} {"train_loss": -39.859886169433594, "global_step": 136454, "epoch": 1127} {"train_loss": -39.90644454956055, "global_step": 136455, "epoch": 1127} {"train_loss": -38.295650482177734, "global_step": 136456, "epoch": 1127} {"train_loss": -39.83007049560547, "global_step": 136457, "epoch": 1127} {"train_loss": -38.8148307800293, "global_step": 136458, "epoch": 1127} {"train_loss": -39.057533264160156, "global_step": 136459, "epoch": 1127} {"train_loss": -37.484771728515625, "global_step": 136460, "epoch": 1127} {"train_loss": -36.5303840637207, "global_step": 136461, "epoch": 1127} {"train_loss": -34.537723541259766, "global_step": 136462, "epoch": 1127} {"train_loss": -35.527244567871094, "global_step": 136463, "epoch": 1127} {"train_loss": -37.225563049316406, "global_step": 136464, "epoch": 1127} {"train_loss": -22.64204978942871, "global_step": 136465, "epoch": 1127} {"train_loss": -23.836374282836914, "global_step": 136466, "epoch": 1127} {"train_loss": -34.11537551879883, "global_step": 136467, "epoch": 1127} {"train_loss": -34.429927825927734, "global_step": 136468, "epoch": 1127} {"train_loss": -32.879180908203125, "global_step": 136469, "epoch": 1127} {"train_loss": -36.638755798339844, "global_step": 136470, "epoch": 1127} {"train_loss": -36.091732025146484, "global_step": 136471, "epoch": 1127} {"train_loss": -34.34474182128906, "global_step": 136472, "epoch": 1127} {"train_loss": -37.17107009887695, "global_step": 136473, "epoch": 1127} {"train_loss": -35.68586349487305, "global_step": 136474, "epoch": 1127} {"train_loss": -37.34052658081055, "global_step": 136475, "epoch": 1127} {"train_loss": -37.144901275634766, "global_step": 136476, "epoch": 1127} {"train_loss": -37.770751953125, "global_step": 136477, "epoch": 1127} {"train_loss": -37.75442123413086, "global_step": 136478, "epoch": 1127} {"train_loss": -37.19697189331055, "global_step": 136479, "epoch": 1127} {"train_loss": -38.71873474121094, "global_step": 136480, "epoch": 1127} {"train_loss": -37.8514289855957, "global_step": 136481, "epoch": 1127} {"train_loss": -38.64031219482422, "global_step": 136482, "epoch": 1127} {"train_loss": -38.133846282958984, "global_step": 136483, "epoch": 1127} {"train_loss": -39.164642333984375, "global_step": 136484, "epoch": 1127} {"train_loss": -38.648983001708984, "global_step": 136485, "epoch": 1127} {"train_loss": -38.69731521606445, "global_step": 136486, "epoch": 1127} {"train_loss": -38.42802426046576, "global_step": 136487, "epoch": 1127, "val_loss": 2627352.0} {"train_loss": -38.94721603393555, "global_step": 136488, "epoch": 1128} {"train_loss": -39.38168716430664, "global_step": 136489, "epoch": 1128} {"train_loss": -39.050052642822266, "global_step": 136490, "epoch": 1128} {"train_loss": -39.08494186401367, "global_step": 136491, "epoch": 1128} {"train_loss": -39.371681213378906, "global_step": 136492, "epoch": 1128} {"train_loss": -38.86387252807617, "global_step": 136493, "epoch": 1128} {"train_loss": -39.205787658691406, "global_step": 136494, "epoch": 1128} {"train_loss": -39.42802429199219, "global_step": 136495, "epoch": 1128} {"train_loss": -39.15171813964844, "global_step": 136496, "epoch": 1128} {"train_loss": -38.718536376953125, "global_step": 136497, "epoch": 1128} {"train_loss": -39.165802001953125, "global_step": 136498, "epoch": 1128} {"train_loss": -39.05353927612305, "global_step": 136499, "epoch": 1128} {"train_loss": -39.89007568359375, "global_step": 136500, "epoch": 1128} {"train_loss": -40.140541076660156, "global_step": 136501, "epoch": 1128} {"train_loss": -39.881465911865234, "global_step": 136502, "epoch": 1128} {"train_loss": -39.77641677856445, "global_step": 136503, "epoch": 1128} {"train_loss": -39.75199508666992, "global_step": 136504, "epoch": 1128} {"train_loss": -39.97168731689453, "global_step": 136505, "epoch": 1128} {"train_loss": -39.990028381347656, "global_step": 136506, "epoch": 1128} {"train_loss": -39.77052688598633, "global_step": 136507, "epoch": 1128} {"train_loss": -40.17029571533203, "global_step": 136508, "epoch": 1128} {"train_loss": -39.55253219604492, "global_step": 136509, "epoch": 1128} {"train_loss": -40.14898681640625, "global_step": 136510, "epoch": 1128} {"train_loss": -39.7076530456543, "global_step": 136511, "epoch": 1128} {"train_loss": -39.85854721069336, "global_step": 136512, "epoch": 1128} {"train_loss": -40.095726013183594, "global_step": 136513, "epoch": 1128} {"train_loss": -40.14364242553711, "global_step": 136514, "epoch": 1128} {"train_loss": -40.11161804199219, "global_step": 136515, "epoch": 1128} {"train_loss": -40.342342376708984, "global_step": 136516, "epoch": 1128} {"train_loss": -40.061798095703125, "global_step": 136517, "epoch": 1128} {"train_loss": -40.60041809082031, "global_step": 136518, "epoch": 1128} {"train_loss": -40.23797607421875, "global_step": 136519, "epoch": 1128} {"train_loss": -37.470333099365234, "global_step": 136520, "epoch": 1128} {"train_loss": -40.115333557128906, "global_step": 136521, "epoch": 1128} {"train_loss": -40.02230453491211, "global_step": 136522, "epoch": 1128} {"train_loss": -40.26960372924805, "global_step": 136523, "epoch": 1128} {"train_loss": -40.709800720214844, "global_step": 136524, "epoch": 1128} {"train_loss": -40.03573226928711, "global_step": 136525, "epoch": 1128} {"train_loss": -40.48476028442383, "global_step": 136526, "epoch": 1128} {"train_loss": -39.965667724609375, "global_step": 136527, "epoch": 1128} {"train_loss": -40.0348014831543, "global_step": 136528, "epoch": 1128} {"train_loss": -40.47800827026367, "global_step": 136529, "epoch": 1128} {"train_loss": -39.51833724975586, "global_step": 136530, "epoch": 1128} {"train_loss": -39.689605712890625, "global_step": 136531, "epoch": 1128} {"train_loss": -40.42469787597656, "global_step": 136532, "epoch": 1128} {"train_loss": -37.591880798339844, "global_step": 136533, "epoch": 1128} {"train_loss": -40.19806671142578, "global_step": 136534, "epoch": 1128} {"train_loss": -40.326560974121094, "global_step": 136535, "epoch": 1128} {"train_loss": -40.54793167114258, "global_step": 136536, "epoch": 1128} {"train_loss": -40.254756927490234, "global_step": 136537, "epoch": 1128} {"train_loss": -40.377105712890625, "global_step": 136538, "epoch": 1128} {"train_loss": -40.518836975097656, "global_step": 136539, "epoch": 1128} {"train_loss": -39.977455139160156, "global_step": 136540, "epoch": 1128} {"train_loss": -40.311275482177734, "global_step": 136541, "epoch": 1128} {"train_loss": -40.912384033203125, "global_step": 136542, "epoch": 1128} {"train_loss": -40.14087677001953, "global_step": 136543, "epoch": 1128} {"train_loss": -37.58230972290039, "global_step": 136544, "epoch": 1128} {"train_loss": -40.7409782409668, "global_step": 136545, "epoch": 1128} {"train_loss": -39.55941390991211, "global_step": 136546, "epoch": 1128} {"train_loss": -39.52554702758789, "global_step": 136547, "epoch": 1128} {"train_loss": -40.382015228271484, "global_step": 136548, "epoch": 1128} {"train_loss": -40.21175003051758, "global_step": 136549, "epoch": 1128} {"train_loss": -40.58681869506836, "global_step": 136550, "epoch": 1128} {"train_loss": -40.54903793334961, "global_step": 136551, "epoch": 1128} {"train_loss": -39.8977165222168, "global_step": 136552, "epoch": 1128} {"train_loss": -40.61541748046875, "global_step": 136553, "epoch": 1128} {"train_loss": -39.6716423034668, "global_step": 136554, "epoch": 1128} {"train_loss": -40.07390213012695, "global_step": 136555, "epoch": 1128} {"train_loss": -39.57230758666992, "global_step": 136556, "epoch": 1128} {"train_loss": -40.56637191772461, "global_step": 136557, "epoch": 1128} {"train_loss": -39.7558708190918, "global_step": 136558, "epoch": 1128} {"train_loss": -38.86338424682617, "global_step": 136559, "epoch": 1128} {"train_loss": -39.63481903076172, "global_step": 136560, "epoch": 1128} {"train_loss": -38.87837219238281, "global_step": 136561, "epoch": 1128} {"train_loss": -34.28512191772461, "global_step": 136562, "epoch": 1128} {"train_loss": -32.905757904052734, "global_step": 136563, "epoch": 1128} {"train_loss": -39.097381591796875, "global_step": 136564, "epoch": 1128} {"train_loss": -36.24672317504883, "global_step": 136565, "epoch": 1128} {"train_loss": -37.88288497924805, "global_step": 136566, "epoch": 1128} {"train_loss": -36.11845016479492, "global_step": 136567, "epoch": 1128} {"train_loss": -40.36179733276367, "global_step": 136568, "epoch": 1128} {"train_loss": -34.85093307495117, "global_step": 136569, "epoch": 1128} {"train_loss": -39.43642807006836, "global_step": 136570, "epoch": 1128} {"train_loss": -36.99738693237305, "global_step": 136571, "epoch": 1128} {"train_loss": -37.46653366088867, "global_step": 136572, "epoch": 1128} {"train_loss": -36.842838287353516, "global_step": 136573, "epoch": 1128} {"train_loss": -38.30049133300781, "global_step": 136574, "epoch": 1128} {"train_loss": -39.20824432373047, "global_step": 136575, "epoch": 1128} {"train_loss": -38.176727294921875, "global_step": 136576, "epoch": 1128} {"train_loss": -38.463050842285156, "global_step": 136577, "epoch": 1128} {"train_loss": -39.57454299926758, "global_step": 136578, "epoch": 1128} {"train_loss": -38.34457015991211, "global_step": 136579, "epoch": 1128} {"train_loss": -39.34365463256836, "global_step": 136580, "epoch": 1128} {"train_loss": -39.327850341796875, "global_step": 136581, "epoch": 1128} {"train_loss": -39.30147933959961, "global_step": 136582, "epoch": 1128} {"train_loss": -39.57505416870117, "global_step": 136583, "epoch": 1128} {"train_loss": -38.51971435546875, "global_step": 136584, "epoch": 1128} {"train_loss": -38.70336151123047, "global_step": 136585, "epoch": 1128} {"train_loss": -39.53495788574219, "global_step": 136586, "epoch": 1128} {"train_loss": -39.676979064941406, "global_step": 136587, "epoch": 1128} {"train_loss": -38.40784454345703, "global_step": 136588, "epoch": 1128} {"train_loss": -40.34928512573242, "global_step": 136589, "epoch": 1128} {"train_loss": -39.324031829833984, "global_step": 136590, "epoch": 1128} {"train_loss": -39.92682647705078, "global_step": 136591, "epoch": 1128} {"train_loss": -39.479793548583984, "global_step": 136592, "epoch": 1128} {"train_loss": -39.043731689453125, "global_step": 136593, "epoch": 1128} {"train_loss": -38.407806396484375, "global_step": 136594, "epoch": 1128} {"train_loss": -36.45751190185547, "global_step": 136595, "epoch": 1128} {"train_loss": -37.20977783203125, "global_step": 136596, "epoch": 1128} {"train_loss": -38.81087112426758, "global_step": 136597, "epoch": 1128} {"train_loss": -39.442623138427734, "global_step": 136598, "epoch": 1128} {"train_loss": -39.08323669433594, "global_step": 136599, "epoch": 1128} {"train_loss": -37.96737289428711, "global_step": 136600, "epoch": 1128} {"train_loss": -38.00830078125, "global_step": 136601, "epoch": 1128} {"train_loss": -39.253173828125, "global_step": 136602, "epoch": 1128} {"train_loss": -38.827266693115234, "global_step": 136603, "epoch": 1128} {"train_loss": -38.515602111816406, "global_step": 136604, "epoch": 1128} {"train_loss": -39.49904251098633, "global_step": 136605, "epoch": 1128} {"train_loss": -37.91913986206055, "global_step": 136606, "epoch": 1128} {"train_loss": -39.734432220458984, "global_step": 136607, "epoch": 1128} {"train_loss": -39.257240011672344, "global_step": 136608, "epoch": 1128, "val_loss": 2614308.5} {"train_loss": -39.241241455078125, "global_step": 136609, "epoch": 1129} {"train_loss": -40.086639404296875, "global_step": 136610, "epoch": 1129} {"train_loss": -38.9097900390625, "global_step": 136611, "epoch": 1129} {"train_loss": -39.69778060913086, "global_step": 136612, "epoch": 1129} {"train_loss": -39.17676544189453, "global_step": 136613, "epoch": 1129} {"train_loss": -39.537105560302734, "global_step": 136614, "epoch": 1129} {"train_loss": -39.54874801635742, "global_step": 136615, "epoch": 1129} {"train_loss": -40.181575775146484, "global_step": 136616, "epoch": 1129} {"train_loss": -40.064369201660156, "global_step": 136617, "epoch": 1129} {"train_loss": -39.66279220581055, "global_step": 136618, "epoch": 1129} {"train_loss": -40.03922653198242, "global_step": 136619, "epoch": 1129} {"train_loss": -39.913978576660156, "global_step": 136620, "epoch": 1129} {"train_loss": -40.4165153503418, "global_step": 136621, "epoch": 1129} {"train_loss": -39.91877365112305, "global_step": 136622, "epoch": 1129} {"train_loss": -40.80860900878906, "global_step": 136623, "epoch": 1129} {"train_loss": -39.35065841674805, "global_step": 136624, "epoch": 1129} {"train_loss": -40.681156158447266, "global_step": 136625, "epoch": 1129} {"train_loss": -40.367427825927734, "global_step": 136626, "epoch": 1129} {"train_loss": -39.225799560546875, "global_step": 136627, "epoch": 1129} {"train_loss": -40.47488021850586, "global_step": 136628, "epoch": 1129} {"train_loss": -40.174781799316406, "global_step": 136629, "epoch": 1129} {"train_loss": -40.20273971557617, "global_step": 136630, "epoch": 1129} {"train_loss": -39.735164642333984, "global_step": 136631, "epoch": 1129} {"train_loss": -40.11184310913086, "global_step": 136632, "epoch": 1129} {"train_loss": -39.88887405395508, "global_step": 136633, "epoch": 1129} {"train_loss": -40.303768157958984, "global_step": 136634, "epoch": 1129} {"train_loss": -40.18259811401367, "global_step": 136635, "epoch": 1129} {"train_loss": -38.159576416015625, "global_step": 136636, "epoch": 1129} {"train_loss": -39.726680755615234, "global_step": 136637, "epoch": 1129} {"train_loss": -37.49106216430664, "global_step": 136638, "epoch": 1129} {"train_loss": -38.81235885620117, "global_step": 136639, "epoch": 1129} {"train_loss": -39.058780670166016, "global_step": 136640, "epoch": 1129} {"train_loss": -40.09075164794922, "global_step": 136641, "epoch": 1129} {"train_loss": -40.02854537963867, "global_step": 136642, "epoch": 1129} {"train_loss": -39.481937408447266, "global_step": 136643, "epoch": 1129} {"train_loss": -39.872528076171875, "global_step": 136644, "epoch": 1129} {"train_loss": -39.44643783569336, "global_step": 136645, "epoch": 1129} {"train_loss": -40.413326263427734, "global_step": 136646, "epoch": 1129} {"train_loss": -40.40268325805664, "global_step": 136647, "epoch": 1129} {"train_loss": -40.40636444091797, "global_step": 136648, "epoch": 1129} {"train_loss": -40.17047882080078, "global_step": 136649, "epoch": 1129} {"train_loss": -40.21426773071289, "global_step": 136650, "epoch": 1129} {"train_loss": -40.421424865722656, "global_step": 136651, "epoch": 1129} {"train_loss": -40.94114685058594, "global_step": 136652, "epoch": 1129} {"train_loss": -40.80256271362305, "global_step": 136653, "epoch": 1129} {"train_loss": -40.29385757446289, "global_step": 136654, "epoch": 1129} {"train_loss": -40.82047653198242, "global_step": 136655, "epoch": 1129} {"train_loss": -40.15092086791992, "global_step": 136656, "epoch": 1129} {"train_loss": -39.91632080078125, "global_step": 136657, "epoch": 1129} {"train_loss": -40.398128509521484, "global_step": 136658, "epoch": 1129} {"train_loss": -40.319305419921875, "global_step": 136659, "epoch": 1129} {"train_loss": -41.028133392333984, "global_step": 136660, "epoch": 1129} {"train_loss": -37.282135009765625, "global_step": 136661, "epoch": 1129} {"train_loss": -39.42537307739258, "global_step": 136662, "epoch": 1129} {"train_loss": -40.664093017578125, "global_step": 136663, "epoch": 1129} {"train_loss": -39.768856048583984, "global_step": 136664, "epoch": 1129} {"train_loss": -40.15896987915039, "global_step": 136665, "epoch": 1129} {"train_loss": -39.83461380004883, "global_step": 136666, "epoch": 1129} {"train_loss": -37.06037521362305, "global_step": 136667, "epoch": 1129} {"train_loss": -40.28133773803711, "global_step": 136668, "epoch": 1129} {"train_loss": -39.24911880493164, "global_step": 136669, "epoch": 1129} {"train_loss": -39.02364730834961, "global_step": 136670, "epoch": 1129} {"train_loss": -40.64510726928711, "global_step": 136671, "epoch": 1129} {"train_loss": -39.30715560913086, "global_step": 136672, "epoch": 1129} {"train_loss": -39.49359130859375, "global_step": 136673, "epoch": 1129} {"train_loss": -37.57610321044922, "global_step": 136674, "epoch": 1129} {"train_loss": -38.178401947021484, "global_step": 136675, "epoch": 1129} {"train_loss": -39.05051040649414, "global_step": 136676, "epoch": 1129} {"train_loss": -39.574703216552734, "global_step": 136677, "epoch": 1129} {"train_loss": -38.976200103759766, "global_step": 136678, "epoch": 1129} {"train_loss": -39.38094711303711, "global_step": 136679, "epoch": 1129} {"train_loss": -39.11788558959961, "global_step": 136680, "epoch": 1129} {"train_loss": -40.39016342163086, "global_step": 136681, "epoch": 1129} {"train_loss": -35.38590621948242, "global_step": 136682, "epoch": 1129} {"train_loss": -39.46990966796875, "global_step": 136683, "epoch": 1129} {"train_loss": -38.743709564208984, "global_step": 136684, "epoch": 1129} {"train_loss": -39.746429443359375, "global_step": 136685, "epoch": 1129} {"train_loss": -39.402584075927734, "global_step": 136686, "epoch": 1129} {"train_loss": -39.43549346923828, "global_step": 136687, "epoch": 1129} {"train_loss": -39.52496337890625, "global_step": 136688, "epoch": 1129} {"train_loss": -36.645973205566406, "global_step": 136689, "epoch": 1129} {"train_loss": -39.03330612182617, "global_step": 136690, "epoch": 1129} {"train_loss": -36.26292419433594, "global_step": 136691, "epoch": 1129} {"train_loss": -39.07930374145508, "global_step": 136692, "epoch": 1129} {"train_loss": -38.2743034362793, "global_step": 136693, "epoch": 1129} {"train_loss": -38.686824798583984, "global_step": 136694, "epoch": 1129} {"train_loss": -38.91880416870117, "global_step": 136695, "epoch": 1129} {"train_loss": -39.16541290283203, "global_step": 136696, "epoch": 1129} {"train_loss": -38.46944808959961, "global_step": 136697, "epoch": 1129} {"train_loss": -36.79056930541992, "global_step": 136698, "epoch": 1129} {"train_loss": -39.44623565673828, "global_step": 136699, "epoch": 1129} {"train_loss": -37.20949935913086, "global_step": 136700, "epoch": 1129} {"train_loss": -39.486846923828125, "global_step": 136701, "epoch": 1129} {"train_loss": -39.523231506347656, "global_step": 136702, "epoch": 1129} {"train_loss": -39.499420166015625, "global_step": 136703, "epoch": 1129} {"train_loss": -38.68043518066406, "global_step": 136704, "epoch": 1129} {"train_loss": -38.51791000366211, "global_step": 136705, "epoch": 1129} {"train_loss": -39.1964111328125, "global_step": 136706, "epoch": 1129} {"train_loss": -37.257781982421875, "global_step": 136707, "epoch": 1129} {"train_loss": -39.45381546020508, "global_step": 136708, "epoch": 1129} {"train_loss": -39.105873107910156, "global_step": 136709, "epoch": 1129} {"train_loss": -36.727108001708984, "global_step": 136710, "epoch": 1129} {"train_loss": -39.632171630859375, "global_step": 136711, "epoch": 1129} {"train_loss": -39.923377990722656, "global_step": 136712, "epoch": 1129} {"train_loss": -38.738311767578125, "global_step": 136713, "epoch": 1129} {"train_loss": -37.01784133911133, "global_step": 136714, "epoch": 1129} {"train_loss": -38.1802978515625, "global_step": 136715, "epoch": 1129} {"train_loss": -38.49220275878906, "global_step": 136716, "epoch": 1129} {"train_loss": -39.15839767456055, "global_step": 136717, "epoch": 1129} {"train_loss": -38.493167877197266, "global_step": 136718, "epoch": 1129} {"train_loss": -39.87337875366211, "global_step": 136719, "epoch": 1129} {"train_loss": -38.98245620727539, "global_step": 136720, "epoch": 1129} {"train_loss": -36.493919372558594, "global_step": 136721, "epoch": 1129} {"train_loss": -36.988033294677734, "global_step": 136722, "epoch": 1129} {"train_loss": -36.21166229248047, "global_step": 136723, "epoch": 1129} {"train_loss": -39.52899169921875, "global_step": 136724, "epoch": 1129} {"train_loss": -39.59251022338867, "global_step": 136725, "epoch": 1129} {"train_loss": -36.44732666015625, "global_step": 136726, "epoch": 1129} {"train_loss": -37.92840576171875, "global_step": 136727, "epoch": 1129} {"train_loss": -38.706336975097656, "global_step": 136728, "epoch": 1129} {"train_loss": -39.23293168879738, "global_step": 136729, "epoch": 1129, "val_loss": 2540775.75} {"train_loss": -38.60647964477539, "global_step": 136730, "epoch": 1130} {"train_loss": -38.28428268432617, "global_step": 136731, "epoch": 1130} {"train_loss": -39.29905700683594, "global_step": 136732, "epoch": 1130} {"train_loss": -39.97791290283203, "global_step": 136733, "epoch": 1130} {"train_loss": -38.97591781616211, "global_step": 136734, "epoch": 1130} {"train_loss": -38.40968704223633, "global_step": 136735, "epoch": 1130} {"train_loss": -37.50212478637695, "global_step": 136736, "epoch": 1130} {"train_loss": -39.20014572143555, "global_step": 136737, "epoch": 1130} {"train_loss": -39.34894943237305, "global_step": 136738, "epoch": 1130} {"train_loss": -38.957801818847656, "global_step": 136739, "epoch": 1130} {"train_loss": -37.83303451538086, "global_step": 136740, "epoch": 1130} {"train_loss": -38.60897445678711, "global_step": 136741, "epoch": 1130} {"train_loss": -38.90059280395508, "global_step": 136742, "epoch": 1130} {"train_loss": -37.78954315185547, "global_step": 136743, "epoch": 1130} {"train_loss": -37.92115020751953, "global_step": 136744, "epoch": 1130} {"train_loss": -39.78249740600586, "global_step": 136745, "epoch": 1130} {"train_loss": -38.491756439208984, "global_step": 136746, "epoch": 1130} {"train_loss": -38.63572311401367, "global_step": 136747, "epoch": 1130} {"train_loss": -38.884220123291016, "global_step": 136748, "epoch": 1130} {"train_loss": -39.72255325317383, "global_step": 136749, "epoch": 1130} {"train_loss": -37.97670364379883, "global_step": 136750, "epoch": 1130} {"train_loss": -40.01259994506836, "global_step": 136751, "epoch": 1130} {"train_loss": -39.784324645996094, "global_step": 136752, "epoch": 1130} {"train_loss": -39.5018424987793, "global_step": 136753, "epoch": 1130} {"train_loss": -39.733848571777344, "global_step": 136754, "epoch": 1130} {"train_loss": -40.44919967651367, "global_step": 136755, "epoch": 1130} {"train_loss": -39.67390823364258, "global_step": 136756, "epoch": 1130} {"train_loss": -40.37531280517578, "global_step": 136757, "epoch": 1130} {"train_loss": -40.093143463134766, "global_step": 136758, "epoch": 1130} {"train_loss": -39.88421630859375, "global_step": 136759, "epoch": 1130} {"train_loss": -40.8376579284668, "global_step": 136760, "epoch": 1130} {"train_loss": -39.912200927734375, "global_step": 136761, "epoch": 1130} {"train_loss": -40.35148239135742, "global_step": 136762, "epoch": 1130} {"train_loss": -40.191688537597656, "global_step": 136763, "epoch": 1130} {"train_loss": -40.575008392333984, "global_step": 136764, "epoch": 1130} {"train_loss": -40.69804000854492, "global_step": 136765, "epoch": 1130} {"train_loss": -40.80171585083008, "global_step": 136766, "epoch": 1130} {"train_loss": -40.09182357788086, "global_step": 136767, "epoch": 1130} {"train_loss": -40.1258544921875, "global_step": 136768, "epoch": 1130} {"train_loss": -40.13267135620117, "global_step": 136769, "epoch": 1130} {"train_loss": -40.84732437133789, "global_step": 136770, "epoch": 1130} {"train_loss": -40.49408721923828, "global_step": 136771, "epoch": 1130} {"train_loss": -40.305599212646484, "global_step": 136772, "epoch": 1130} {"train_loss": -41.010616302490234, "global_step": 136773, "epoch": 1130} {"train_loss": -40.458900451660156, "global_step": 136774, "epoch": 1130} {"train_loss": -40.3470573425293, "global_step": 136775, "epoch": 1130} {"train_loss": -40.94135665893555, "global_step": 136776, "epoch": 1130} {"train_loss": -40.49040603637695, "global_step": 136777, "epoch": 1130} {"train_loss": -41.21805953979492, "global_step": 136778, "epoch": 1130} {"train_loss": -41.253074645996094, "global_step": 136779, "epoch": 1130} {"train_loss": -40.57728958129883, "global_step": 136780, "epoch": 1130} {"train_loss": -40.74393844604492, "global_step": 136781, "epoch": 1130} {"train_loss": -40.635284423828125, "global_step": 136782, "epoch": 1130} {"train_loss": -40.77431869506836, "global_step": 136783, "epoch": 1130} {"train_loss": -40.86951446533203, "global_step": 136784, "epoch": 1130} {"train_loss": -40.68254852294922, "global_step": 136785, "epoch": 1130} {"train_loss": -40.76863479614258, "global_step": 136786, "epoch": 1130} {"train_loss": -40.6528434753418, "global_step": 136787, "epoch": 1130} {"train_loss": -40.81907272338867, "global_step": 136788, "epoch": 1130} {"train_loss": -40.617801666259766, "global_step": 136789, "epoch": 1130} {"train_loss": -40.318851470947266, "global_step": 136790, "epoch": 1130} {"train_loss": -40.876827239990234, "global_step": 136791, "epoch": 1130} {"train_loss": -40.87217330932617, "global_step": 136792, "epoch": 1130} {"train_loss": -41.04195785522461, "global_step": 136793, "epoch": 1130} {"train_loss": -40.64057540893555, "global_step": 136794, "epoch": 1130} {"train_loss": -40.223567962646484, "global_step": 136795, "epoch": 1130} {"train_loss": -40.55326843261719, "global_step": 136796, "epoch": 1130} {"train_loss": -39.994407653808594, "global_step": 136797, "epoch": 1130} {"train_loss": -40.09255599975586, "global_step": 136798, "epoch": 1130} {"train_loss": -40.53497314453125, "global_step": 136799, "epoch": 1130} {"train_loss": -39.58799362182617, "global_step": 136800, "epoch": 1130} {"train_loss": -40.31538772583008, "global_step": 136801, "epoch": 1130} {"train_loss": -39.88154220581055, "global_step": 136802, "epoch": 1130} {"train_loss": -40.36664581298828, "global_step": 136803, "epoch": 1130} {"train_loss": -39.47187042236328, "global_step": 136804, "epoch": 1130} {"train_loss": -39.79868698120117, "global_step": 136805, "epoch": 1130} {"train_loss": -40.261234283447266, "global_step": 136806, "epoch": 1130} {"train_loss": -39.422943115234375, "global_step": 136807, "epoch": 1130} {"train_loss": -38.744686126708984, "global_step": 136808, "epoch": 1130} {"train_loss": -39.91518783569336, "global_step": 136809, "epoch": 1130} {"train_loss": -39.30550003051758, "global_step": 136810, "epoch": 1130} {"train_loss": -37.17026901245117, "global_step": 136811, "epoch": 1130} {"train_loss": -39.36911392211914, "global_step": 136812, "epoch": 1130} {"train_loss": -38.734535217285156, "global_step": 136813, "epoch": 1130} {"train_loss": -36.11909866333008, "global_step": 136814, "epoch": 1130} {"train_loss": -37.99028015136719, "global_step": 136815, "epoch": 1130} {"train_loss": -35.730525970458984, "global_step": 136816, "epoch": 1130} {"train_loss": -36.4504508972168, "global_step": 136817, "epoch": 1130} {"train_loss": -39.086891174316406, "global_step": 136818, "epoch": 1130} {"train_loss": -38.17060089111328, "global_step": 136819, "epoch": 1130} {"train_loss": -38.00272750854492, "global_step": 136820, "epoch": 1130} {"train_loss": -37.519935607910156, "global_step": 136821, "epoch": 1130} {"train_loss": -38.28125, "global_step": 136822, "epoch": 1130} {"train_loss": -38.398345947265625, "global_step": 136823, "epoch": 1130} {"train_loss": -38.588226318359375, "global_step": 136824, "epoch": 1130} {"train_loss": -38.15085220336914, "global_step": 136825, "epoch": 1130} {"train_loss": -37.59640121459961, "global_step": 136826, "epoch": 1130} {"train_loss": -38.923458099365234, "global_step": 136827, "epoch": 1130} {"train_loss": -39.469635009765625, "global_step": 136828, "epoch": 1130} {"train_loss": -38.77019119262695, "global_step": 136829, "epoch": 1130} {"train_loss": -38.75777816772461, "global_step": 136830, "epoch": 1130} {"train_loss": -38.83669662475586, "global_step": 136831, "epoch": 1130} {"train_loss": -38.33796310424805, "global_step": 136832, "epoch": 1130} {"train_loss": -39.12997817993164, "global_step": 136833, "epoch": 1130} {"train_loss": -38.55852127075195, "global_step": 136834, "epoch": 1130} {"train_loss": -39.475440979003906, "global_step": 136835, "epoch": 1130} {"train_loss": -39.44174575805664, "global_step": 136836, "epoch": 1130} {"train_loss": -38.910369873046875, "global_step": 136837, "epoch": 1130} {"train_loss": -39.481197357177734, "global_step": 136838, "epoch": 1130} {"train_loss": -38.846900939941406, "global_step": 136839, "epoch": 1130} {"train_loss": -39.94041061401367, "global_step": 136840, "epoch": 1130} {"train_loss": -39.93865966796875, "global_step": 136841, "epoch": 1130} {"train_loss": -39.09308624267578, "global_step": 136842, "epoch": 1130} {"train_loss": -40.26828384399414, "global_step": 136843, "epoch": 1130} {"train_loss": -39.90983200073242, "global_step": 136844, "epoch": 1130} {"train_loss": -39.65377426147461, "global_step": 136845, "epoch": 1130} {"train_loss": -39.43596649169922, "global_step": 136846, "epoch": 1130} {"train_loss": -39.7851676940918, "global_step": 136847, "epoch": 1130} {"train_loss": -40.33057403564453, "global_step": 136848, "epoch": 1130} {"train_loss": -40.076900482177734, "global_step": 136849, "epoch": 1130} {"train_loss": -39.53663430332152, "global_step": 136850, "epoch": 1130, "val_loss": 2599785.5} {"train_loss": -40.5027961730957, "global_step": 136851, "epoch": 1131} {"train_loss": -40.34836959838867, "global_step": 136852, "epoch": 1131} {"train_loss": -40.544578552246094, "global_step": 136853, "epoch": 1131} {"train_loss": -40.28940963745117, "global_step": 136854, "epoch": 1131} {"train_loss": -40.68046188354492, "global_step": 136855, "epoch": 1131} {"train_loss": -40.12164306640625, "global_step": 136856, "epoch": 1131} {"train_loss": -40.998695373535156, "global_step": 136857, "epoch": 1131} {"train_loss": -39.96337127685547, "global_step": 136858, "epoch": 1131} {"train_loss": -40.324256896972656, "global_step": 136859, "epoch": 1131} {"train_loss": -40.69076156616211, "global_step": 136860, "epoch": 1131} {"train_loss": -40.21052932739258, "global_step": 136861, "epoch": 1131} {"train_loss": -40.6360969543457, "global_step": 136862, "epoch": 1131} {"train_loss": -40.57108688354492, "global_step": 136863, "epoch": 1131} {"train_loss": -40.496402740478516, "global_step": 136864, "epoch": 1131} {"train_loss": -40.227046966552734, "global_step": 136865, "epoch": 1131} {"train_loss": -40.4786491394043, "global_step": 136866, "epoch": 1131} {"train_loss": -40.243961334228516, "global_step": 136867, "epoch": 1131} {"train_loss": -40.493629455566406, "global_step": 136868, "epoch": 1131} {"train_loss": -40.793365478515625, "global_step": 136869, "epoch": 1131} {"train_loss": -40.69422149658203, "global_step": 136870, "epoch": 1131} {"train_loss": -40.01493453979492, "global_step": 136871, "epoch": 1131} {"train_loss": -40.956207275390625, "global_step": 136872, "epoch": 1131} {"train_loss": -40.4712028503418, "global_step": 136873, "epoch": 1131} {"train_loss": -40.90370559692383, "global_step": 136874, "epoch": 1131} {"train_loss": -40.4406852722168, "global_step": 136875, "epoch": 1131} {"train_loss": -41.12514877319336, "global_step": 136876, "epoch": 1131} {"train_loss": -41.38557052612305, "global_step": 136877, "epoch": 1131} {"train_loss": -41.310123443603516, "global_step": 136878, "epoch": 1131} {"train_loss": -40.830101013183594, "global_step": 136879, "epoch": 1131} {"train_loss": -40.6813850402832, "global_step": 136880, "epoch": 1131} {"train_loss": -40.45627975463867, "global_step": 136881, "epoch": 1131} {"train_loss": -40.585304260253906, "global_step": 136882, "epoch": 1131} {"train_loss": -39.36656951904297, "global_step": 136883, "epoch": 1131} {"train_loss": -38.16130065917969, "global_step": 136884, "epoch": 1131} {"train_loss": -36.871978759765625, "global_step": 136885, "epoch": 1131} {"train_loss": -35.602882385253906, "global_step": 136886, "epoch": 1131} {"train_loss": -37.27939987182617, "global_step": 136887, "epoch": 1131} {"train_loss": -38.89809036254883, "global_step": 136888, "epoch": 1131} {"train_loss": -31.948272705078125, "global_step": 136889, "epoch": 1131} {"train_loss": -38.072261810302734, "global_step": 136890, "epoch": 1131} {"train_loss": -32.1903190612793, "global_step": 136891, "epoch": 1131} {"train_loss": -27.289447784423828, "global_step": 136892, "epoch": 1131} {"train_loss": -14.717623710632324, "global_step": 136893, "epoch": 1131} {"train_loss": -13.739424705505371, "global_step": 136894, "epoch": 1131} {"train_loss": -16.849275588989258, "global_step": 136895, "epoch": 1131} {"train_loss": -4.915482521057129, "global_step": 136896, "epoch": 1131} {"train_loss": -30.274377822875977, "global_step": 136897, "epoch": 1131} {"train_loss": -18.595767974853516, "global_step": 136898, "epoch": 1131} {"train_loss": -11.543662071228027, "global_step": 136899, "epoch": 1131} {"train_loss": -33.2410774230957, "global_step": 136900, "epoch": 1131} {"train_loss": -22.441232681274414, "global_step": 136901, "epoch": 1131} {"train_loss": -33.1076774597168, "global_step": 136902, "epoch": 1131} {"train_loss": -31.09747314453125, "global_step": 136903, "epoch": 1131} {"train_loss": -29.972639083862305, "global_step": 136904, "epoch": 1131} {"train_loss": -36.124610900878906, "global_step": 136905, "epoch": 1131} {"train_loss": -32.0256462097168, "global_step": 136906, "epoch": 1131} {"train_loss": -35.026283264160156, "global_step": 136907, "epoch": 1131} {"train_loss": -36.723472595214844, "global_step": 136908, "epoch": 1131} {"train_loss": -34.31663513183594, "global_step": 136909, "epoch": 1131} {"train_loss": -34.5833740234375, "global_step": 136910, "epoch": 1131} {"train_loss": -36.68201446533203, "global_step": 136911, "epoch": 1131} {"train_loss": -35.52897262573242, "global_step": 136912, "epoch": 1131} {"train_loss": -35.06504440307617, "global_step": 136913, "epoch": 1131} {"train_loss": -36.39161682128906, "global_step": 136914, "epoch": 1131} {"train_loss": -36.7633171081543, "global_step": 136915, "epoch": 1131} {"train_loss": -36.99058151245117, "global_step": 136916, "epoch": 1131} {"train_loss": -36.03788375854492, "global_step": 136917, "epoch": 1131} {"train_loss": -36.41533660888672, "global_step": 136918, "epoch": 1131} {"train_loss": -37.599388122558594, "global_step": 136919, "epoch": 1131} {"train_loss": -37.647377014160156, "global_step": 136920, "epoch": 1131} {"train_loss": -37.02289962768555, "global_step": 136921, "epoch": 1131} {"train_loss": -37.285579681396484, "global_step": 136922, "epoch": 1131} {"train_loss": -37.85151290893555, "global_step": 136923, "epoch": 1131} {"train_loss": -37.915985107421875, "global_step": 136924, "epoch": 1131} {"train_loss": -37.95367431640625, "global_step": 136925, "epoch": 1131} {"train_loss": -37.2593994140625, "global_step": 136926, "epoch": 1131} {"train_loss": -37.89387893676758, "global_step": 136927, "epoch": 1131} {"train_loss": -38.21235275268555, "global_step": 136928, "epoch": 1131} {"train_loss": -37.78981399536133, "global_step": 136929, "epoch": 1131} {"train_loss": -38.17793273925781, "global_step": 136930, "epoch": 1131} {"train_loss": -38.13983917236328, "global_step": 136931, "epoch": 1131} {"train_loss": -38.3226432800293, "global_step": 136932, "epoch": 1131} {"train_loss": -38.312408447265625, "global_step": 136933, "epoch": 1131} {"train_loss": -38.31698226928711, "global_step": 136934, "epoch": 1131} {"train_loss": -38.501705169677734, "global_step": 136935, "epoch": 1131} {"train_loss": -38.56291580200195, "global_step": 136936, "epoch": 1131} {"train_loss": -38.59661865234375, "global_step": 136937, "epoch": 1131} {"train_loss": -38.54396438598633, "global_step": 136938, "epoch": 1131} {"train_loss": -38.39011001586914, "global_step": 136939, "epoch": 1131} {"train_loss": -38.50654602050781, "global_step": 136940, "epoch": 1131} {"train_loss": -38.72664260864258, "global_step": 136941, "epoch": 1131} {"train_loss": -38.79011917114258, "global_step": 136942, "epoch": 1131} {"train_loss": -38.74184799194336, "global_step": 136943, "epoch": 1131} {"train_loss": -38.5449333190918, "global_step": 136944, "epoch": 1131} {"train_loss": -39.02975845336914, "global_step": 136945, "epoch": 1131} {"train_loss": -38.86350631713867, "global_step": 136946, "epoch": 1131} {"train_loss": -38.80996322631836, "global_step": 136947, "epoch": 1131} {"train_loss": -38.81562805175781, "global_step": 136948, "epoch": 1131} {"train_loss": -39.15524673461914, "global_step": 136949, "epoch": 1131} {"train_loss": -39.30644607543945, "global_step": 136950, "epoch": 1131} {"train_loss": -39.22770309448242, "global_step": 136951, "epoch": 1131} {"train_loss": -38.92728805541992, "global_step": 136952, "epoch": 1131} {"train_loss": -39.19679641723633, "global_step": 136953, "epoch": 1131} {"train_loss": -39.576839447021484, "global_step": 136954, "epoch": 1131} {"train_loss": -39.5591926574707, "global_step": 136955, "epoch": 1131} {"train_loss": -39.36312484741211, "global_step": 136956, "epoch": 1131} {"train_loss": -39.25765609741211, "global_step": 136957, "epoch": 1131} {"train_loss": -39.56494903564453, "global_step": 136958, "epoch": 1131} {"train_loss": -39.66310119628906, "global_step": 136959, "epoch": 1131} {"train_loss": -39.51948547363281, "global_step": 136960, "epoch": 1131} {"train_loss": -39.54978561401367, "global_step": 136961, "epoch": 1131} {"train_loss": -39.538055419921875, "global_step": 136962, "epoch": 1131} {"train_loss": -39.12973403930664, "global_step": 136963, "epoch": 1131} {"train_loss": -39.379638671875, "global_step": 136964, "epoch": 1131} {"train_loss": -39.55842208862305, "global_step": 136965, "epoch": 1131} {"train_loss": -39.99228286743164, "global_step": 136966, "epoch": 1131} {"train_loss": -39.412899017333984, "global_step": 136967, "epoch": 1131} {"train_loss": -40.15521240234375, "global_step": 136968, "epoch": 1131} {"train_loss": -39.90706253051758, "global_step": 136969, "epoch": 1131} {"train_loss": -40.02143478393555, "global_step": 136970, "epoch": 1131} {"train_loss": -36.93211202385012, "global_step": 136971, "epoch": 1131, "val_loss": 2584596.75} {"train_loss": -39.87517547607422, "global_step": 136972, "epoch": 1132} {"train_loss": -40.03152847290039, "global_step": 136973, "epoch": 1132} {"train_loss": -39.95841598510742, "global_step": 136974, "epoch": 1132} {"train_loss": -40.152679443359375, "global_step": 136975, "epoch": 1132} {"train_loss": -40.0102653503418, "global_step": 136976, "epoch": 1132} {"train_loss": -40.171539306640625, "global_step": 136977, "epoch": 1132} {"train_loss": -39.81708908081055, "global_step": 136978, "epoch": 1132} {"train_loss": -40.11555099487305, "global_step": 136979, "epoch": 1132} {"train_loss": -40.16360092163086, "global_step": 136980, "epoch": 1132} {"train_loss": -40.1966552734375, "global_step": 136981, "epoch": 1132} {"train_loss": -40.66547775268555, "global_step": 136982, "epoch": 1132} {"train_loss": -40.24251937866211, "global_step": 136983, "epoch": 1132} {"train_loss": -39.981197357177734, "global_step": 136984, "epoch": 1132} {"train_loss": -40.57878875732422, "global_step": 136985, "epoch": 1132} {"train_loss": -40.0876350402832, "global_step": 136986, "epoch": 1132} {"train_loss": -40.6348991394043, "global_step": 136987, "epoch": 1132} {"train_loss": -40.63196563720703, "global_step": 136988, "epoch": 1132} {"train_loss": -40.54938888549805, "global_step": 136989, "epoch": 1132} {"train_loss": -40.302886962890625, "global_step": 136990, "epoch": 1132} {"train_loss": -40.7907829284668, "global_step": 136991, "epoch": 1132} {"train_loss": -40.1835823059082, "global_step": 136992, "epoch": 1132} {"train_loss": -40.42930603027344, "global_step": 136993, "epoch": 1132} {"train_loss": -40.6810188293457, "global_step": 136994, "epoch": 1132} {"train_loss": -40.366973876953125, "global_step": 136995, "epoch": 1132} {"train_loss": -40.722591400146484, "global_step": 136996, "epoch": 1132} {"train_loss": -40.58396530151367, "global_step": 136997, "epoch": 1132} {"train_loss": -40.47887420654297, "global_step": 136998, "epoch": 1132} {"train_loss": -40.424407958984375, "global_step": 136999, "epoch": 1132} {"train_loss": -39.70438766479492, "global_step": 137000, "epoch": 1132} {"train_loss": -38.832332611083984, "global_step": 137001, "epoch": 1132} {"train_loss": -40.84157943725586, "global_step": 137002, "epoch": 1132} {"train_loss": -40.21541213989258, "global_step": 137003, "epoch": 1132} {"train_loss": -40.241451263427734, "global_step": 137004, "epoch": 1132} {"train_loss": -40.62974166870117, "global_step": 137005, "epoch": 1132} {"train_loss": -40.14971923828125, "global_step": 137006, "epoch": 1132} {"train_loss": -39.54478073120117, "global_step": 137007, "epoch": 1132} {"train_loss": -39.169647216796875, "global_step": 137008, "epoch": 1132} {"train_loss": -39.9566764831543, "global_step": 137009, "epoch": 1132} {"train_loss": -35.54148483276367, "global_step": 137010, "epoch": 1132} {"train_loss": -39.81992721557617, "global_step": 137011, "epoch": 1132} {"train_loss": -38.01039505004883, "global_step": 137012, "epoch": 1132} {"train_loss": -37.248165130615234, "global_step": 137013, "epoch": 1132} {"train_loss": -39.204105377197266, "global_step": 137014, "epoch": 1132} {"train_loss": -38.339412689208984, "global_step": 137015, "epoch": 1132} {"train_loss": -32.287567138671875, "global_step": 137016, "epoch": 1132} {"train_loss": -20.232770919799805, "global_step": 137017, "epoch": 1132} {"train_loss": -19.00878143310547, "global_step": 137018, "epoch": 1132} {"train_loss": -36.779029846191406, "global_step": 137019, "epoch": 1132} {"train_loss": -30.712514877319336, "global_step": 137020, "epoch": 1132} {"train_loss": -34.84271240234375, "global_step": 137021, "epoch": 1132} {"train_loss": -32.79718780517578, "global_step": 137022, "epoch": 1132} {"train_loss": -32.392269134521484, "global_step": 137023, "epoch": 1132} {"train_loss": -37.03782653808594, "global_step": 137024, "epoch": 1132} {"train_loss": -34.67153549194336, "global_step": 137025, "epoch": 1132} {"train_loss": -36.11014175415039, "global_step": 137026, "epoch": 1132} {"train_loss": -35.347084045410156, "global_step": 137027, "epoch": 1132} {"train_loss": -36.6573371887207, "global_step": 137028, "epoch": 1132} {"train_loss": -37.3941764831543, "global_step": 137029, "epoch": 1132} {"train_loss": -37.274105072021484, "global_step": 137030, "epoch": 1132} {"train_loss": -36.11558151245117, "global_step": 137031, "epoch": 1132} {"train_loss": -35.882991790771484, "global_step": 137032, "epoch": 1132} {"train_loss": -35.2318115234375, "global_step": 137033, "epoch": 1132} {"train_loss": -37.411781311035156, "global_step": 137034, "epoch": 1132} {"train_loss": -37.721561431884766, "global_step": 137035, "epoch": 1132} {"train_loss": -37.820072174072266, "global_step": 137036, "epoch": 1132} {"train_loss": -37.97049331665039, "global_step": 137037, "epoch": 1132} {"train_loss": -37.88103103637695, "global_step": 137038, "epoch": 1132} {"train_loss": -38.443721771240234, "global_step": 137039, "epoch": 1132} {"train_loss": -38.37441635131836, "global_step": 137040, "epoch": 1132} {"train_loss": -38.14301300048828, "global_step": 137041, "epoch": 1132} {"train_loss": -34.66286087036133, "global_step": 137042, "epoch": 1132} {"train_loss": -37.90549850463867, "global_step": 137043, "epoch": 1132} {"train_loss": -39.00748825073242, "global_step": 137044, "epoch": 1132} {"train_loss": -38.27124786376953, "global_step": 137045, "epoch": 1132} {"train_loss": -38.87856674194336, "global_step": 137046, "epoch": 1132} {"train_loss": -39.16606521606445, "global_step": 137047, "epoch": 1132} {"train_loss": -37.688507080078125, "global_step": 137048, "epoch": 1132} {"train_loss": -38.1886100769043, "global_step": 137049, "epoch": 1132} {"train_loss": -38.53174591064453, "global_step": 137050, "epoch": 1132} {"train_loss": -32.06511306762695, "global_step": 137051, "epoch": 1132} {"train_loss": -38.412532806396484, "global_step": 137052, "epoch": 1132} {"train_loss": -36.76399612426758, "global_step": 137053, "epoch": 1132} {"train_loss": -38.56557846069336, "global_step": 137054, "epoch": 1132} {"train_loss": -38.92600631713867, "global_step": 137055, "epoch": 1132} {"train_loss": -38.715919494628906, "global_step": 137056, "epoch": 1132} {"train_loss": -26.899017333984375, "global_step": 137057, "epoch": 1132} {"train_loss": -37.960838317871094, "global_step": 137058, "epoch": 1132} {"train_loss": -33.32645797729492, "global_step": 137059, "epoch": 1132} {"train_loss": -32.33695983886719, "global_step": 137060, "epoch": 1132} {"train_loss": -34.57035446166992, "global_step": 137061, "epoch": 1132} {"train_loss": -35.20029830932617, "global_step": 137062, "epoch": 1132} {"train_loss": -35.19155502319336, "global_step": 137063, "epoch": 1132} {"train_loss": -1.5315521955490112, "global_step": 137064, "epoch": 1132} {"train_loss": -34.222808837890625, "global_step": 137065, "epoch": 1132} {"train_loss": -31.868366241455078, "global_step": 137066, "epoch": 1132} {"train_loss": -29.8414249420166, "global_step": 137067, "epoch": 1132} {"train_loss": -33.37146759033203, "global_step": 137068, "epoch": 1132} {"train_loss": -20.946060180664062, "global_step": 137069, "epoch": 1132} {"train_loss": -32.420082092285156, "global_step": 137070, "epoch": 1132} {"train_loss": -33.499515533447266, "global_step": 137071, "epoch": 1132} {"train_loss": -35.381439208984375, "global_step": 137072, "epoch": 1132} {"train_loss": -35.449424743652344, "global_step": 137073, "epoch": 1132} {"train_loss": -35.775543212890625, "global_step": 137074, "epoch": 1132} {"train_loss": -34.18782424926758, "global_step": 137075, "epoch": 1132} {"train_loss": -37.06917190551758, "global_step": 137076, "epoch": 1132} {"train_loss": -35.294376373291016, "global_step": 137077, "epoch": 1132} {"train_loss": -35.90382766723633, "global_step": 137078, "epoch": 1132} {"train_loss": -34.62654495239258, "global_step": 137079, "epoch": 1132} {"train_loss": -35.21273422241211, "global_step": 137080, "epoch": 1132} {"train_loss": -36.089698791503906, "global_step": 137081, "epoch": 1132} {"train_loss": -35.75368881225586, "global_step": 137082, "epoch": 1132} {"train_loss": -34.70884704589844, "global_step": 137083, "epoch": 1132} {"train_loss": -36.62449264526367, "global_step": 137084, "epoch": 1132} {"train_loss": -36.9046516418457, "global_step": 137085, "epoch": 1132} {"train_loss": -33.02860641479492, "global_step": 137086, "epoch": 1132} {"train_loss": -37.08503341674805, "global_step": 137087, "epoch": 1132} {"train_loss": -36.18819808959961, "global_step": 137088, "epoch": 1132} {"train_loss": -36.504310607910156, "global_step": 137089, "epoch": 1132} {"train_loss": -37.26554489135742, "global_step": 137090, "epoch": 1132} {"train_loss": -36.7302131652832, "global_step": 137091, "epoch": 1132} {"train_loss": -36.635642082238, "global_step": 137092, "epoch": 1132, "val_loss": 2700400.5} {"train_loss": -37.79638671875, "global_step": 137093, "epoch": 1133} {"train_loss": -36.3847541809082, "global_step": 137094, "epoch": 1133} {"train_loss": -37.784034729003906, "global_step": 137095, "epoch": 1133} {"train_loss": -37.38460159301758, "global_step": 137096, "epoch": 1133} {"train_loss": -36.994659423828125, "global_step": 137097, "epoch": 1133} {"train_loss": -38.15354537963867, "global_step": 137098, "epoch": 1133} {"train_loss": -37.498382568359375, "global_step": 137099, "epoch": 1133} {"train_loss": -38.226051330566406, "global_step": 137100, "epoch": 1133} {"train_loss": -37.69565963745117, "global_step": 137101, "epoch": 1133} {"train_loss": -37.766536712646484, "global_step": 137102, "epoch": 1133} {"train_loss": -37.81150436401367, "global_step": 137103, "epoch": 1133} {"train_loss": -37.721073150634766, "global_step": 137104, "epoch": 1133} {"train_loss": -37.664588928222656, "global_step": 137105, "epoch": 1133} {"train_loss": -37.90997314453125, "global_step": 137106, "epoch": 1133} {"train_loss": -37.634334564208984, "global_step": 137107, "epoch": 1133} {"train_loss": -37.715911865234375, "global_step": 137108, "epoch": 1133} {"train_loss": -38.23529052734375, "global_step": 137109, "epoch": 1133} {"train_loss": -37.943695068359375, "global_step": 137110, "epoch": 1133} {"train_loss": -38.0087890625, "global_step": 137111, "epoch": 1133} {"train_loss": -38.3913459777832, "global_step": 137112, "epoch": 1133} {"train_loss": -38.193634033203125, "global_step": 137113, "epoch": 1133} {"train_loss": -36.62661361694336, "global_step": 137114, "epoch": 1133} {"train_loss": -38.83543014526367, "global_step": 137115, "epoch": 1133} {"train_loss": -38.350521087646484, "global_step": 137116, "epoch": 1133} {"train_loss": -38.19147872924805, "global_step": 137117, "epoch": 1133} {"train_loss": -38.42091751098633, "global_step": 137118, "epoch": 1133} {"train_loss": -38.7833366394043, "global_step": 137119, "epoch": 1133} {"train_loss": -37.94210433959961, "global_step": 137120, "epoch": 1133} {"train_loss": -38.90190505981445, "global_step": 137121, "epoch": 1133} {"train_loss": -37.96324920654297, "global_step": 137122, "epoch": 1133} {"train_loss": -38.5022087097168, "global_step": 137123, "epoch": 1133} {"train_loss": -39.10311508178711, "global_step": 137124, "epoch": 1133} {"train_loss": -38.8823127746582, "global_step": 137125, "epoch": 1133} {"train_loss": -38.65870666503906, "global_step": 137126, "epoch": 1133} {"train_loss": -38.99799728393555, "global_step": 137127, "epoch": 1133} {"train_loss": -38.876277923583984, "global_step": 137128, "epoch": 1133} {"train_loss": -38.36665344238281, "global_step": 137129, "epoch": 1133} {"train_loss": -38.11617660522461, "global_step": 137130, "epoch": 1133} {"train_loss": -39.08585739135742, "global_step": 137131, "epoch": 1133} {"train_loss": -38.37107467651367, "global_step": 137132, "epoch": 1133} {"train_loss": -38.9692268371582, "global_step": 137133, "epoch": 1133} {"train_loss": -38.677772521972656, "global_step": 137134, "epoch": 1133} {"train_loss": -39.193519592285156, "global_step": 137135, "epoch": 1133} {"train_loss": -39.17229461669922, "global_step": 137136, "epoch": 1133} {"train_loss": -38.95988845825195, "global_step": 137137, "epoch": 1133} {"train_loss": -39.48214340209961, "global_step": 137138, "epoch": 1133} {"train_loss": -39.331520080566406, "global_step": 137139, "epoch": 1133} {"train_loss": -39.347835540771484, "global_step": 137140, "epoch": 1133} {"train_loss": -39.12923049926758, "global_step": 137141, "epoch": 1133} {"train_loss": -38.91704559326172, "global_step": 137142, "epoch": 1133} {"train_loss": -39.27639389038086, "global_step": 137143, "epoch": 1133} {"train_loss": -38.95035934448242, "global_step": 137144, "epoch": 1133} {"train_loss": -39.32874298095703, "global_step": 137145, "epoch": 1133} {"train_loss": -39.34465408325195, "global_step": 137146, "epoch": 1133} {"train_loss": -39.311214447021484, "global_step": 137147, "epoch": 1133} {"train_loss": -39.7094612121582, "global_step": 137148, "epoch": 1133} {"train_loss": -39.62791061401367, "global_step": 137149, "epoch": 1133} {"train_loss": -39.73567581176758, "global_step": 137150, "epoch": 1133} {"train_loss": -38.96626663208008, "global_step": 137151, "epoch": 1133} {"train_loss": -39.8524055480957, "global_step": 137152, "epoch": 1133} {"train_loss": -38.79122543334961, "global_step": 137153, "epoch": 1133} {"train_loss": -38.78034210205078, "global_step": 137154, "epoch": 1133} {"train_loss": -38.92951583862305, "global_step": 137155, "epoch": 1133} {"train_loss": -39.128414154052734, "global_step": 137156, "epoch": 1133} {"train_loss": -37.49365234375, "global_step": 137157, "epoch": 1133} {"train_loss": -36.01768493652344, "global_step": 137158, "epoch": 1133} {"train_loss": -36.53424072265625, "global_step": 137159, "epoch": 1133} {"train_loss": -36.9688606262207, "global_step": 137160, "epoch": 1133} {"train_loss": -35.306968688964844, "global_step": 137161, "epoch": 1133} {"train_loss": -34.529876708984375, "global_step": 137162, "epoch": 1133} {"train_loss": -31.423913955688477, "global_step": 137163, "epoch": 1133} {"train_loss": -30.690414428710938, "global_step": 137164, "epoch": 1133} {"train_loss": -38.79018020629883, "global_step": 137165, "epoch": 1133} {"train_loss": -29.117277145385742, "global_step": 137166, "epoch": 1133} {"train_loss": -32.80470657348633, "global_step": 137167, "epoch": 1133} {"train_loss": -38.346778869628906, "global_step": 137168, "epoch": 1133} {"train_loss": -31.514907836914062, "global_step": 137169, "epoch": 1133} {"train_loss": -37.32444763183594, "global_step": 137170, "epoch": 1133} {"train_loss": -33.77690887451172, "global_step": 137171, "epoch": 1133} {"train_loss": -33.17271041870117, "global_step": 137172, "epoch": 1133} {"train_loss": -35.88372802734375, "global_step": 137173, "epoch": 1133} {"train_loss": -34.77225875854492, "global_step": 137174, "epoch": 1133} {"train_loss": -36.161842346191406, "global_step": 137175, "epoch": 1133} {"train_loss": -37.34453201293945, "global_step": 137176, "epoch": 1133} {"train_loss": -35.765316009521484, "global_step": 137177, "epoch": 1133} {"train_loss": -38.40885543823242, "global_step": 137178, "epoch": 1133} {"train_loss": -36.602535247802734, "global_step": 137179, "epoch": 1133} {"train_loss": -37.874916076660156, "global_step": 137180, "epoch": 1133} {"train_loss": -37.8123893737793, "global_step": 137181, "epoch": 1133} {"train_loss": -37.37887191772461, "global_step": 137182, "epoch": 1133} {"train_loss": -38.62671661376953, "global_step": 137183, "epoch": 1133} {"train_loss": -38.82944107055664, "global_step": 137184, "epoch": 1133} {"train_loss": -37.89729690551758, "global_step": 137185, "epoch": 1133} {"train_loss": -38.245948791503906, "global_step": 137186, "epoch": 1133} {"train_loss": -38.42262268066406, "global_step": 137187, "epoch": 1133} {"train_loss": -38.0908088684082, "global_step": 137188, "epoch": 1133} {"train_loss": -39.3503303527832, "global_step": 137189, "epoch": 1133} {"train_loss": -37.99774932861328, "global_step": 137190, "epoch": 1133} {"train_loss": -38.268959045410156, "global_step": 137191, "epoch": 1133} {"train_loss": -38.41635513305664, "global_step": 137192, "epoch": 1133} {"train_loss": -38.621337890625, "global_step": 137193, "epoch": 1133} {"train_loss": -38.58417510986328, "global_step": 137194, "epoch": 1133} {"train_loss": -39.111732482910156, "global_step": 137195, "epoch": 1133} {"train_loss": -38.44403839111328, "global_step": 137196, "epoch": 1133} {"train_loss": -38.989463806152344, "global_step": 137197, "epoch": 1133} {"train_loss": -39.314666748046875, "global_step": 137198, "epoch": 1133} {"train_loss": -39.104801177978516, "global_step": 137199, "epoch": 1133} {"train_loss": -39.483741760253906, "global_step": 137200, "epoch": 1133} {"train_loss": -39.536651611328125, "global_step": 137201, "epoch": 1133} {"train_loss": -39.2255973815918, "global_step": 137202, "epoch": 1133} {"train_loss": -39.34730911254883, "global_step": 137203, "epoch": 1133} {"train_loss": -39.475067138671875, "global_step": 137204, "epoch": 1133} {"train_loss": -39.135257720947266, "global_step": 137205, "epoch": 1133} {"train_loss": -39.63827133178711, "global_step": 137206, "epoch": 1133} {"train_loss": -39.58051681518555, "global_step": 137207, "epoch": 1133} {"train_loss": -39.40047836303711, "global_step": 137208, "epoch": 1133} {"train_loss": -39.49880599975586, "global_step": 137209, "epoch": 1133} {"train_loss": -39.1326789855957, "global_step": 137210, "epoch": 1133} {"train_loss": -39.32143783569336, "global_step": 137211, "epoch": 1133} {"train_loss": -39.787601470947266, "global_step": 137212, "epoch": 1133} {"train_loss": -37.9659632848314, "global_step": 137213, "epoch": 1133, "val_loss": 2628889.25} {"train_loss": -39.48771286010742, "global_step": 137214, "epoch": 1134} {"train_loss": -39.71553421020508, "global_step": 137215, "epoch": 1134} {"train_loss": -39.517982482910156, "global_step": 137216, "epoch": 1134} {"train_loss": -39.9117546081543, "global_step": 137217, "epoch": 1134} {"train_loss": -38.648712158203125, "global_step": 137218, "epoch": 1134} {"train_loss": -39.21746826171875, "global_step": 137219, "epoch": 1134} {"train_loss": -39.48594284057617, "global_step": 137220, "epoch": 1134} {"train_loss": -39.592506408691406, "global_step": 137221, "epoch": 1134} {"train_loss": -40.16215133666992, "global_step": 137222, "epoch": 1134} {"train_loss": -39.88624572753906, "global_step": 137223, "epoch": 1134} {"train_loss": -40.206661224365234, "global_step": 137224, "epoch": 1134} {"train_loss": -40.35374069213867, "global_step": 137225, "epoch": 1134} {"train_loss": -39.64561080932617, "global_step": 137226, "epoch": 1134} {"train_loss": -39.710418701171875, "global_step": 137227, "epoch": 1134} {"train_loss": -40.267879486083984, "global_step": 137228, "epoch": 1134} {"train_loss": -40.39571762084961, "global_step": 137229, "epoch": 1134} {"train_loss": -39.774871826171875, "global_step": 137230, "epoch": 1134} {"train_loss": -40.397361755371094, "global_step": 137231, "epoch": 1134} {"train_loss": -40.46294021606445, "global_step": 137232, "epoch": 1134} {"train_loss": -39.88209915161133, "global_step": 137233, "epoch": 1134} {"train_loss": -39.82514953613281, "global_step": 137234, "epoch": 1134} {"train_loss": -40.004512786865234, "global_step": 137235, "epoch": 1134} {"train_loss": -40.28724670410156, "global_step": 137236, "epoch": 1134} {"train_loss": -40.1429328918457, "global_step": 137237, "epoch": 1134} {"train_loss": -39.81928253173828, "global_step": 137238, "epoch": 1134} {"train_loss": -40.112361907958984, "global_step": 137239, "epoch": 1134} {"train_loss": -40.35123825073242, "global_step": 137240, "epoch": 1134} {"train_loss": -39.303585052490234, "global_step": 137241, "epoch": 1134} {"train_loss": -39.068878173828125, "global_step": 137242, "epoch": 1134} {"train_loss": -38.96714401245117, "global_step": 137243, "epoch": 1134} {"train_loss": -40.592018127441406, "global_step": 137244, "epoch": 1134} {"train_loss": -40.017059326171875, "global_step": 137245, "epoch": 1134} {"train_loss": -39.560523986816406, "global_step": 137246, "epoch": 1134} {"train_loss": -38.807857513427734, "global_step": 137247, "epoch": 1134} {"train_loss": -40.358131408691406, "global_step": 137248, "epoch": 1134} {"train_loss": -39.60694122314453, "global_step": 137249, "epoch": 1134} {"train_loss": -39.494258880615234, "global_step": 137250, "epoch": 1134} {"train_loss": -38.777442932128906, "global_step": 137251, "epoch": 1134} {"train_loss": -39.097625732421875, "global_step": 137252, "epoch": 1134} {"train_loss": -40.29838943481445, "global_step": 137253, "epoch": 1134} {"train_loss": -39.70896530151367, "global_step": 137254, "epoch": 1134} {"train_loss": -39.89805221557617, "global_step": 137255, "epoch": 1134} {"train_loss": -40.14292526245117, "global_step": 137256, "epoch": 1134} {"train_loss": -40.231807708740234, "global_step": 137257, "epoch": 1134} {"train_loss": -39.94900131225586, "global_step": 137258, "epoch": 1134} {"train_loss": -40.43569564819336, "global_step": 137259, "epoch": 1134} {"train_loss": -40.68577194213867, "global_step": 137260, "epoch": 1134} {"train_loss": -40.269744873046875, "global_step": 137261, "epoch": 1134} {"train_loss": -40.538330078125, "global_step": 137262, "epoch": 1134} {"train_loss": -40.01322555541992, "global_step": 137263, "epoch": 1134} {"train_loss": -40.4208984375, "global_step": 137264, "epoch": 1134} {"train_loss": -40.63212203979492, "global_step": 137265, "epoch": 1134} {"train_loss": -40.62919235229492, "global_step": 137266, "epoch": 1134} {"train_loss": -40.65348815917969, "global_step": 137267, "epoch": 1134} {"train_loss": -40.164886474609375, "global_step": 137268, "epoch": 1134} {"train_loss": -40.715240478515625, "global_step": 137269, "epoch": 1134} {"train_loss": -40.684356689453125, "global_step": 137270, "epoch": 1134} {"train_loss": -39.4689826965332, "global_step": 137271, "epoch": 1134} {"train_loss": -40.66059112548828, "global_step": 137272, "epoch": 1134} {"train_loss": -40.35920333862305, "global_step": 137273, "epoch": 1134} {"train_loss": -40.63856506347656, "global_step": 137274, "epoch": 1134} {"train_loss": -40.7022590637207, "global_step": 137275, "epoch": 1134} {"train_loss": -39.704952239990234, "global_step": 137276, "epoch": 1134} {"train_loss": -40.48939895629883, "global_step": 137277, "epoch": 1134} {"train_loss": -40.9820442199707, "global_step": 137278, "epoch": 1134} {"train_loss": -40.688392639160156, "global_step": 137279, "epoch": 1134} {"train_loss": -40.670372009277344, "global_step": 137280, "epoch": 1134} {"train_loss": -40.42011642456055, "global_step": 137281, "epoch": 1134} {"train_loss": -40.460933685302734, "global_step": 137282, "epoch": 1134} {"train_loss": -40.404232025146484, "global_step": 137283, "epoch": 1134} {"train_loss": -40.8625373840332, "global_step": 137284, "epoch": 1134} {"train_loss": -40.4708366394043, "global_step": 137285, "epoch": 1134} {"train_loss": -40.7305908203125, "global_step": 137286, "epoch": 1134} {"train_loss": -39.957454681396484, "global_step": 137287, "epoch": 1134} {"train_loss": -40.363399505615234, "global_step": 137288, "epoch": 1134} {"train_loss": -40.258033752441406, "global_step": 137289, "epoch": 1134} {"train_loss": -40.34212875366211, "global_step": 137290, "epoch": 1134} {"train_loss": -40.80674362182617, "global_step": 137291, "epoch": 1134} {"train_loss": -40.57318878173828, "global_step": 137292, "epoch": 1134} {"train_loss": -40.24247741699219, "global_step": 137293, "epoch": 1134} {"train_loss": -40.698097229003906, "global_step": 137294, "epoch": 1134} {"train_loss": -40.415042877197266, "global_step": 137295, "epoch": 1134} {"train_loss": -40.51625442504883, "global_step": 137296, "epoch": 1134} {"train_loss": -40.542667388916016, "global_step": 137297, "epoch": 1134} {"train_loss": -39.209407806396484, "global_step": 137298, "epoch": 1134} {"train_loss": -39.71617126464844, "global_step": 137299, "epoch": 1134} {"train_loss": -40.77179718017578, "global_step": 137300, "epoch": 1134} {"train_loss": -39.899044036865234, "global_step": 137301, "epoch": 1134} {"train_loss": -39.476600646972656, "global_step": 137302, "epoch": 1134} {"train_loss": -39.778541564941406, "global_step": 137303, "epoch": 1134} {"train_loss": -39.24524688720703, "global_step": 137304, "epoch": 1134} {"train_loss": -38.837703704833984, "global_step": 137305, "epoch": 1134} {"train_loss": -39.5225830078125, "global_step": 137306, "epoch": 1134} {"train_loss": -39.997989654541016, "global_step": 137307, "epoch": 1134} {"train_loss": -39.73485565185547, "global_step": 137308, "epoch": 1134} {"train_loss": -39.27081298828125, "global_step": 137309, "epoch": 1134} {"train_loss": -38.52571105957031, "global_step": 137310, "epoch": 1134} {"train_loss": -38.34011459350586, "global_step": 137311, "epoch": 1134} {"train_loss": -36.763484954833984, "global_step": 137312, "epoch": 1134} {"train_loss": -34.52850341796875, "global_step": 137313, "epoch": 1134} {"train_loss": -37.87110137939453, "global_step": 137314, "epoch": 1134} {"train_loss": -37.614158630371094, "global_step": 137315, "epoch": 1134} {"train_loss": -33.13649368286133, "global_step": 137316, "epoch": 1134} {"train_loss": -32.8589973449707, "global_step": 137317, "epoch": 1134} {"train_loss": -37.752593994140625, "global_step": 137318, "epoch": 1134} {"train_loss": -28.20942497253418, "global_step": 137319, "epoch": 1134} {"train_loss": -35.1132926940918, "global_step": 137320, "epoch": 1134} {"train_loss": -32.64215850830078, "global_step": 137321, "epoch": 1134} {"train_loss": -35.76139831542969, "global_step": 137322, "epoch": 1134} {"train_loss": -32.48787307739258, "global_step": 137323, "epoch": 1134} {"train_loss": -35.81254959106445, "global_step": 137324, "epoch": 1134} {"train_loss": -30.504343032836914, "global_step": 137325, "epoch": 1134} {"train_loss": -37.670921325683594, "global_step": 137326, "epoch": 1134} {"train_loss": -33.30229949951172, "global_step": 137327, "epoch": 1134} {"train_loss": -35.88050079345703, "global_step": 137328, "epoch": 1134} {"train_loss": -35.6080436706543, "global_step": 137329, "epoch": 1134} {"train_loss": -36.32666778564453, "global_step": 137330, "epoch": 1134} {"train_loss": -35.544029235839844, "global_step": 137331, "epoch": 1134} {"train_loss": -36.80974197387695, "global_step": 137332, "epoch": 1134} {"train_loss": -34.67970657348633, "global_step": 137333, "epoch": 1134} {"train_loss": -39.0601412560329, "global_step": 137334, "epoch": 1134, "val_loss": 2618306.75} {"train_loss": -35.799896240234375, "global_step": 137335, "epoch": 1135} {"train_loss": -38.40989303588867, "global_step": 137336, "epoch": 1135} {"train_loss": -36.560646057128906, "global_step": 137337, "epoch": 1135} {"train_loss": -38.702850341796875, "global_step": 137338, "epoch": 1135} {"train_loss": -36.943946838378906, "global_step": 137339, "epoch": 1135} {"train_loss": -38.23395538330078, "global_step": 137340, "epoch": 1135} {"train_loss": -38.41924285888672, "global_step": 137341, "epoch": 1135} {"train_loss": -38.290504455566406, "global_step": 137342, "epoch": 1135} {"train_loss": -38.937347412109375, "global_step": 137343, "epoch": 1135} {"train_loss": -38.39433288574219, "global_step": 137344, "epoch": 1135} {"train_loss": -38.525238037109375, "global_step": 137345, "epoch": 1135} {"train_loss": -39.14214324951172, "global_step": 137346, "epoch": 1135} {"train_loss": -38.987178802490234, "global_step": 137347, "epoch": 1135} {"train_loss": -38.210933685302734, "global_step": 137348, "epoch": 1135} {"train_loss": -38.92350387573242, "global_step": 137349, "epoch": 1135} {"train_loss": -38.55145263671875, "global_step": 137350, "epoch": 1135} {"train_loss": -39.34437561035156, "global_step": 137351, "epoch": 1135} {"train_loss": -38.867061614990234, "global_step": 137352, "epoch": 1135} {"train_loss": -38.98490524291992, "global_step": 137353, "epoch": 1135} {"train_loss": -39.2345085144043, "global_step": 137354, "epoch": 1135} {"train_loss": -38.60837173461914, "global_step": 137355, "epoch": 1135} {"train_loss": -39.43440628051758, "global_step": 137356, "epoch": 1135} {"train_loss": -38.50710678100586, "global_step": 137357, "epoch": 1135} {"train_loss": -39.80933380126953, "global_step": 137358, "epoch": 1135} {"train_loss": -39.30274200439453, "global_step": 137359, "epoch": 1135} {"train_loss": -39.360877990722656, "global_step": 137360, "epoch": 1135} {"train_loss": -39.214439392089844, "global_step": 137361, "epoch": 1135} {"train_loss": -39.233741760253906, "global_step": 137362, "epoch": 1135} {"train_loss": -38.671138763427734, "global_step": 137363, "epoch": 1135} {"train_loss": -39.84711837768555, "global_step": 137364, "epoch": 1135} {"train_loss": -39.73464584350586, "global_step": 137365, "epoch": 1135} {"train_loss": -39.59577178955078, "global_step": 137366, "epoch": 1135} {"train_loss": -40.03664779663086, "global_step": 137367, "epoch": 1135} {"train_loss": -39.029640197753906, "global_step": 137368, "epoch": 1135} {"train_loss": -39.76630401611328, "global_step": 137369, "epoch": 1135} {"train_loss": -40.31367874145508, "global_step": 137370, "epoch": 1135} {"train_loss": -40.20670700073242, "global_step": 137371, "epoch": 1135} {"train_loss": -39.864933013916016, "global_step": 137372, "epoch": 1135} {"train_loss": -40.00187301635742, "global_step": 137373, "epoch": 1135} {"train_loss": -40.47671127319336, "global_step": 137374, "epoch": 1135} {"train_loss": -40.15084457397461, "global_step": 137375, "epoch": 1135} {"train_loss": -40.03449630737305, "global_step": 137376, "epoch": 1135} {"train_loss": -40.208221435546875, "global_step": 137377, "epoch": 1135} {"train_loss": -40.226444244384766, "global_step": 137378, "epoch": 1135} {"train_loss": -40.285064697265625, "global_step": 137379, "epoch": 1135} {"train_loss": -40.17585372924805, "global_step": 137380, "epoch": 1135} {"train_loss": -40.528106689453125, "global_step": 137381, "epoch": 1135} {"train_loss": -40.276737213134766, "global_step": 137382, "epoch": 1135} {"train_loss": -39.85103225708008, "global_step": 137383, "epoch": 1135} {"train_loss": -40.1373176574707, "global_step": 137384, "epoch": 1135} {"train_loss": -40.382537841796875, "global_step": 137385, "epoch": 1135} {"train_loss": -40.821189880371094, "global_step": 137386, "epoch": 1135} {"train_loss": -40.283470153808594, "global_step": 137387, "epoch": 1135} {"train_loss": -40.41108322143555, "global_step": 137388, "epoch": 1135} {"train_loss": -40.470462799072266, "global_step": 137389, "epoch": 1135} {"train_loss": -40.65570831298828, "global_step": 137390, "epoch": 1135} {"train_loss": -40.4206657409668, "global_step": 137391, "epoch": 1135} {"train_loss": -40.9250373840332, "global_step": 137392, "epoch": 1135} {"train_loss": -40.89431381225586, "global_step": 137393, "epoch": 1135} {"train_loss": -40.564918518066406, "global_step": 137394, "epoch": 1135} {"train_loss": -40.3851318359375, "global_step": 137395, "epoch": 1135} {"train_loss": -40.65949630737305, "global_step": 137396, "epoch": 1135} {"train_loss": -40.62220001220703, "global_step": 137397, "epoch": 1135} {"train_loss": -41.014854431152344, "global_step": 137398, "epoch": 1135} {"train_loss": -40.7723503112793, "global_step": 137399, "epoch": 1135} {"train_loss": -40.80609130859375, "global_step": 137400, "epoch": 1135} {"train_loss": -40.78949737548828, "global_step": 137401, "epoch": 1135} {"train_loss": -40.70431137084961, "global_step": 137402, "epoch": 1135} {"train_loss": -40.82734680175781, "global_step": 137403, "epoch": 1135} {"train_loss": -40.67584228515625, "global_step": 137404, "epoch": 1135} {"train_loss": -40.51206588745117, "global_step": 137405, "epoch": 1135} {"train_loss": -40.30759811401367, "global_step": 137406, "epoch": 1135} {"train_loss": -39.508880615234375, "global_step": 137407, "epoch": 1135} {"train_loss": -36.56061553955078, "global_step": 137408, "epoch": 1135} {"train_loss": -37.941219329833984, "global_step": 137409, "epoch": 1135} {"train_loss": -40.537960052490234, "global_step": 137410, "epoch": 1135} {"train_loss": -39.45113754272461, "global_step": 137411, "epoch": 1135} {"train_loss": -37.93709182739258, "global_step": 137412, "epoch": 1135} {"train_loss": -38.7855110168457, "global_step": 137413, "epoch": 1135} {"train_loss": -40.49060821533203, "global_step": 137414, "epoch": 1135} {"train_loss": -40.38792419433594, "global_step": 137415, "epoch": 1135} {"train_loss": -39.909141540527344, "global_step": 137416, "epoch": 1135} {"train_loss": -40.76782989501953, "global_step": 137417, "epoch": 1135} {"train_loss": -40.31600570678711, "global_step": 137418, "epoch": 1135} {"train_loss": -40.529022216796875, "global_step": 137419, "epoch": 1135} {"train_loss": -40.5040397644043, "global_step": 137420, "epoch": 1135} {"train_loss": -40.24180221557617, "global_step": 137421, "epoch": 1135} {"train_loss": -39.98316192626953, "global_step": 137422, "epoch": 1135} {"train_loss": -40.682891845703125, "global_step": 137423, "epoch": 1135} {"train_loss": -40.4111442565918, "global_step": 137424, "epoch": 1135} {"train_loss": -40.676918029785156, "global_step": 137425, "epoch": 1135} {"train_loss": -40.49782943725586, "global_step": 137426, "epoch": 1135} {"train_loss": -40.605506896972656, "global_step": 137427, "epoch": 1135} {"train_loss": -40.24345016479492, "global_step": 137428, "epoch": 1135} {"train_loss": -40.754695892333984, "global_step": 137429, "epoch": 1135} {"train_loss": -40.43440628051758, "global_step": 137430, "epoch": 1135} {"train_loss": -40.02024459838867, "global_step": 137431, "epoch": 1135} {"train_loss": -40.63249969482422, "global_step": 137432, "epoch": 1135} {"train_loss": -40.1475830078125, "global_step": 137433, "epoch": 1135} {"train_loss": -40.52579879760742, "global_step": 137434, "epoch": 1135} {"train_loss": -40.126380920410156, "global_step": 137435, "epoch": 1135} {"train_loss": -40.29712677001953, "global_step": 137436, "epoch": 1135} {"train_loss": -40.33858871459961, "global_step": 137437, "epoch": 1135} {"train_loss": -40.10102462768555, "global_step": 137438, "epoch": 1135} {"train_loss": -40.82697296142578, "global_step": 137439, "epoch": 1135} {"train_loss": -39.28936004638672, "global_step": 137440, "epoch": 1135} {"train_loss": -39.83776092529297, "global_step": 137441, "epoch": 1135} {"train_loss": -39.12968063354492, "global_step": 137442, "epoch": 1135} {"train_loss": -40.50068283081055, "global_step": 137443, "epoch": 1135} {"train_loss": -40.20429611206055, "global_step": 137444, "epoch": 1135} {"train_loss": -40.90298080444336, "global_step": 137445, "epoch": 1135} {"train_loss": -40.357357025146484, "global_step": 137446, "epoch": 1135} {"train_loss": -40.65253448486328, "global_step": 137447, "epoch": 1135} {"train_loss": -40.67573165893555, "global_step": 137448, "epoch": 1135} {"train_loss": -40.172420501708984, "global_step": 137449, "epoch": 1135} {"train_loss": -39.796875, "global_step": 137450, "epoch": 1135} {"train_loss": -38.85011672973633, "global_step": 137451, "epoch": 1135} {"train_loss": -38.89008331298828, "global_step": 137452, "epoch": 1135} {"train_loss": -38.38273239135742, "global_step": 137453, "epoch": 1135} {"train_loss": -40.476104736328125, "global_step": 137454, "epoch": 1135} {"train_loss": -39.78556978209945, "global_step": 137455, "epoch": 1135, "val_loss": 2718857.25} {"train_loss": -40.22160720825195, "global_step": 137456, "epoch": 1136} {"train_loss": -39.66794204711914, "global_step": 137457, "epoch": 1136} {"train_loss": -40.57515335083008, "global_step": 137458, "epoch": 1136} {"train_loss": -40.5958251953125, "global_step": 137459, "epoch": 1136} {"train_loss": -39.65894317626953, "global_step": 137460, "epoch": 1136} {"train_loss": -38.04274368286133, "global_step": 137461, "epoch": 1136} {"train_loss": -38.79352951049805, "global_step": 137462, "epoch": 1136} {"train_loss": -37.71266555786133, "global_step": 137463, "epoch": 1136} {"train_loss": -34.753692626953125, "global_step": 137464, "epoch": 1136} {"train_loss": -37.68152618408203, "global_step": 137465, "epoch": 1136} {"train_loss": -32.959014892578125, "global_step": 137466, "epoch": 1136} {"train_loss": -28.38275718688965, "global_step": 137467, "epoch": 1136} {"train_loss": -37.560550689697266, "global_step": 137468, "epoch": 1136} {"train_loss": -32.67430114746094, "global_step": 137469, "epoch": 1136} {"train_loss": -35.3785285949707, "global_step": 137470, "epoch": 1136} {"train_loss": -35.35737228393555, "global_step": 137471, "epoch": 1136} {"train_loss": -35.25336837768555, "global_step": 137472, "epoch": 1136} {"train_loss": -36.86869430541992, "global_step": 137473, "epoch": 1136} {"train_loss": -33.754539489746094, "global_step": 137474, "epoch": 1136} {"train_loss": -37.80768966674805, "global_step": 137475, "epoch": 1136} {"train_loss": -35.92222213745117, "global_step": 137476, "epoch": 1136} {"train_loss": -37.70335006713867, "global_step": 137477, "epoch": 1136} {"train_loss": -36.646888732910156, "global_step": 137478, "epoch": 1136} {"train_loss": -38.49142837524414, "global_step": 137479, "epoch": 1136} {"train_loss": -37.901058197021484, "global_step": 137480, "epoch": 1136} {"train_loss": -39.05202102661133, "global_step": 137481, "epoch": 1136} {"train_loss": -38.093196868896484, "global_step": 137482, "epoch": 1136} {"train_loss": -39.202980041503906, "global_step": 137483, "epoch": 1136} {"train_loss": -38.81984329223633, "global_step": 137484, "epoch": 1136} {"train_loss": -38.078338623046875, "global_step": 137485, "epoch": 1136} {"train_loss": -39.00715255737305, "global_step": 137486, "epoch": 1136} {"train_loss": -39.2587776184082, "global_step": 137487, "epoch": 1136} {"train_loss": -39.27528762817383, "global_step": 137488, "epoch": 1136} {"train_loss": -39.4269905090332, "global_step": 137489, "epoch": 1136} {"train_loss": -39.44997024536133, "global_step": 137490, "epoch": 1136} {"train_loss": -39.831241607666016, "global_step": 137491, "epoch": 1136} {"train_loss": -39.980926513671875, "global_step": 137492, "epoch": 1136} {"train_loss": -39.9018669128418, "global_step": 137493, "epoch": 1136} {"train_loss": -39.892147064208984, "global_step": 137494, "epoch": 1136} {"train_loss": -39.72531509399414, "global_step": 137495, "epoch": 1136} {"train_loss": -40.00697708129883, "global_step": 137496, "epoch": 1136} {"train_loss": -39.65406799316406, "global_step": 137497, "epoch": 1136} {"train_loss": -39.8579216003418, "global_step": 137498, "epoch": 1136} {"train_loss": -40.3780517578125, "global_step": 137499, "epoch": 1136} {"train_loss": -40.41694259643555, "global_step": 137500, "epoch": 1136} {"train_loss": -40.16353225708008, "global_step": 137501, "epoch": 1136} {"train_loss": -40.35186767578125, "global_step": 137502, "epoch": 1136} {"train_loss": -40.28596115112305, "global_step": 137503, "epoch": 1136} {"train_loss": -40.16740798950195, "global_step": 137504, "epoch": 1136} {"train_loss": -40.267086029052734, "global_step": 137505, "epoch": 1136} {"train_loss": -40.44600296020508, "global_step": 137506, "epoch": 1136} {"train_loss": -40.191219329833984, "global_step": 137507, "epoch": 1136} {"train_loss": -40.485416412353516, "global_step": 137508, "epoch": 1136} {"train_loss": -40.25156784057617, "global_step": 137509, "epoch": 1136} {"train_loss": -40.35038375854492, "global_step": 137510, "epoch": 1136} {"train_loss": -40.26905059814453, "global_step": 137511, "epoch": 1136} {"train_loss": -40.28934860229492, "global_step": 137512, "epoch": 1136} {"train_loss": -40.796817779541016, "global_step": 137513, "epoch": 1136} {"train_loss": -40.20741271972656, "global_step": 137514, "epoch": 1136} {"train_loss": -40.44710922241211, "global_step": 137515, "epoch": 1136} {"train_loss": -39.97514343261719, "global_step": 137516, "epoch": 1136} {"train_loss": -40.82627487182617, "global_step": 137517, "epoch": 1136} {"train_loss": -40.50045394897461, "global_step": 137518, "epoch": 1136} {"train_loss": -39.16556930541992, "global_step": 137519, "epoch": 1136} {"train_loss": -40.28035354614258, "global_step": 137520, "epoch": 1136} {"train_loss": -40.52436065673828, "global_step": 137521, "epoch": 1136} {"train_loss": -40.63100814819336, "global_step": 137522, "epoch": 1136} {"train_loss": -39.8082389831543, "global_step": 137523, "epoch": 1136} {"train_loss": -39.36933135986328, "global_step": 137524, "epoch": 1136} {"train_loss": -39.253273010253906, "global_step": 137525, "epoch": 1136} {"train_loss": -39.55964660644531, "global_step": 137526, "epoch": 1136} {"train_loss": -40.001190185546875, "global_step": 137527, "epoch": 1136} {"train_loss": -40.75601577758789, "global_step": 137528, "epoch": 1136} {"train_loss": -40.350826263427734, "global_step": 137529, "epoch": 1136} {"train_loss": -39.7452392578125, "global_step": 137530, "epoch": 1136} {"train_loss": -39.338619232177734, "global_step": 137531, "epoch": 1136} {"train_loss": -38.797027587890625, "global_step": 137532, "epoch": 1136} {"train_loss": -39.802345275878906, "global_step": 137533, "epoch": 1136} {"train_loss": -40.82615280151367, "global_step": 137534, "epoch": 1136} {"train_loss": -40.45097732543945, "global_step": 137535, "epoch": 1136} {"train_loss": -40.1031379699707, "global_step": 137536, "epoch": 1136} {"train_loss": -39.713050842285156, "global_step": 137537, "epoch": 1136} {"train_loss": -39.269466400146484, "global_step": 137538, "epoch": 1136} {"train_loss": -39.68964767456055, "global_step": 137539, "epoch": 1136} {"train_loss": -41.083526611328125, "global_step": 137540, "epoch": 1136} {"train_loss": -40.41282272338867, "global_step": 137541, "epoch": 1136} {"train_loss": -40.25809860229492, "global_step": 137542, "epoch": 1136} {"train_loss": -40.44977951049805, "global_step": 137543, "epoch": 1136} {"train_loss": -40.74256896972656, "global_step": 137544, "epoch": 1136} {"train_loss": -40.72455978393555, "global_step": 137545, "epoch": 1136} {"train_loss": -41.16376495361328, "global_step": 137546, "epoch": 1136} {"train_loss": -40.92844772338867, "global_step": 137547, "epoch": 1136} {"train_loss": -40.920509338378906, "global_step": 137548, "epoch": 1136} {"train_loss": -40.98060989379883, "global_step": 137549, "epoch": 1136} {"train_loss": -40.736427307128906, "global_step": 137550, "epoch": 1136} {"train_loss": -39.4044303894043, "global_step": 137551, "epoch": 1136} {"train_loss": -40.1251335144043, "global_step": 137552, "epoch": 1136} {"train_loss": -40.65523910522461, "global_step": 137553, "epoch": 1136} {"train_loss": -40.03595733642578, "global_step": 137554, "epoch": 1136} {"train_loss": -38.95090866088867, "global_step": 137555, "epoch": 1136} {"train_loss": -40.70754623413086, "global_step": 137556, "epoch": 1136} {"train_loss": -40.85692596435547, "global_step": 137557, "epoch": 1136} {"train_loss": -38.22135543823242, "global_step": 137558, "epoch": 1136} {"train_loss": -37.10894775390625, "global_step": 137559, "epoch": 1136} {"train_loss": -38.724098205566406, "global_step": 137560, "epoch": 1136} {"train_loss": -40.416622161865234, "global_step": 137561, "epoch": 1136} {"train_loss": -37.672874450683594, "global_step": 137562, "epoch": 1136} {"train_loss": -37.41022491455078, "global_step": 137563, "epoch": 1136} {"train_loss": -40.59767150878906, "global_step": 137564, "epoch": 1136} {"train_loss": -38.47503662109375, "global_step": 137565, "epoch": 1136} {"train_loss": -40.02968978881836, "global_step": 137566, "epoch": 1136} {"train_loss": -39.97273635864258, "global_step": 137567, "epoch": 1136} {"train_loss": -38.072547912597656, "global_step": 137568, "epoch": 1136} {"train_loss": -40.34271240234375, "global_step": 137569, "epoch": 1136} {"train_loss": -40.00407409667969, "global_step": 137570, "epoch": 1136} {"train_loss": -38.47054672241211, "global_step": 137571, "epoch": 1136} {"train_loss": -40.2707405090332, "global_step": 137572, "epoch": 1136} {"train_loss": -40.116336822509766, "global_step": 137573, "epoch": 1136} {"train_loss": -39.15188980102539, "global_step": 137574, "epoch": 1136} {"train_loss": -40.14472198486328, "global_step": 137575, "epoch": 1136} {"train_loss": -39.241068642986704, "global_step": 137576, "epoch": 1136, "val_loss": 2665647.25} {"train_loss": -37.42494201660156, "global_step": 137577, "epoch": 1137} {"train_loss": -39.11018753051758, "global_step": 137578, "epoch": 1137} {"train_loss": -39.909690856933594, "global_step": 137579, "epoch": 1137} {"train_loss": -38.69562911987305, "global_step": 137580, "epoch": 1137} {"train_loss": -38.995731353759766, "global_step": 137581, "epoch": 1137} {"train_loss": -39.249778747558594, "global_step": 137582, "epoch": 1137} {"train_loss": -37.94356918334961, "global_step": 137583, "epoch": 1137} {"train_loss": -39.5440559387207, "global_step": 137584, "epoch": 1137} {"train_loss": -39.739601135253906, "global_step": 137585, "epoch": 1137} {"train_loss": -38.30213165283203, "global_step": 137586, "epoch": 1137} {"train_loss": -39.51816940307617, "global_step": 137587, "epoch": 1137} {"train_loss": -38.940895080566406, "global_step": 137588, "epoch": 1137} {"train_loss": -39.43285369873047, "global_step": 137589, "epoch": 1137} {"train_loss": -39.76713943481445, "global_step": 137590, "epoch": 1137} {"train_loss": -39.23556137084961, "global_step": 137591, "epoch": 1137} {"train_loss": -40.50550079345703, "global_step": 137592, "epoch": 1137} {"train_loss": -38.50740051269531, "global_step": 137593, "epoch": 1137} {"train_loss": -40.093379974365234, "global_step": 137594, "epoch": 1137} {"train_loss": -38.955623626708984, "global_step": 137595, "epoch": 1137} {"train_loss": -38.833335876464844, "global_step": 137596, "epoch": 1137} {"train_loss": -39.21709060668945, "global_step": 137597, "epoch": 1137} {"train_loss": -38.8466682434082, "global_step": 137598, "epoch": 1137} {"train_loss": -40.25946807861328, "global_step": 137599, "epoch": 1137} {"train_loss": -39.56806564331055, "global_step": 137600, "epoch": 1137} {"train_loss": -39.92875289916992, "global_step": 137601, "epoch": 1137} {"train_loss": -39.230342864990234, "global_step": 137602, "epoch": 1137} {"train_loss": -40.03794479370117, "global_step": 137603, "epoch": 1137} {"train_loss": -39.34318923950195, "global_step": 137604, "epoch": 1137} {"train_loss": -40.4150505065918, "global_step": 137605, "epoch": 1137} {"train_loss": -39.72361373901367, "global_step": 137606, "epoch": 1137} {"train_loss": -39.66082763671875, "global_step": 137607, "epoch": 1137} {"train_loss": -40.05042266845703, "global_step": 137608, "epoch": 1137} {"train_loss": -39.778106689453125, "global_step": 137609, "epoch": 1137} {"train_loss": -40.259307861328125, "global_step": 137610, "epoch": 1137} {"train_loss": -40.39817810058594, "global_step": 137611, "epoch": 1137} {"train_loss": -40.21744918823242, "global_step": 137612, "epoch": 1137} {"train_loss": -40.402217864990234, "global_step": 137613, "epoch": 1137} {"train_loss": -39.50136947631836, "global_step": 137614, "epoch": 1137} {"train_loss": -40.619873046875, "global_step": 137615, "epoch": 1137} {"train_loss": -40.18874740600586, "global_step": 137616, "epoch": 1137} {"train_loss": -40.98720169067383, "global_step": 137617, "epoch": 1137} {"train_loss": -40.6280517578125, "global_step": 137618, "epoch": 1137} {"train_loss": -40.24249267578125, "global_step": 137619, "epoch": 1137} {"train_loss": -40.880924224853516, "global_step": 137620, "epoch": 1137} {"train_loss": -40.73618698120117, "global_step": 137621, "epoch": 1137} {"train_loss": -40.10845947265625, "global_step": 137622, "epoch": 1137} {"train_loss": -40.665496826171875, "global_step": 137623, "epoch": 1137} {"train_loss": -40.38267135620117, "global_step": 137624, "epoch": 1137} {"train_loss": -40.735198974609375, "global_step": 137625, "epoch": 1137} {"train_loss": -41.17129135131836, "global_step": 137626, "epoch": 1137} {"train_loss": -41.16494369506836, "global_step": 137627, "epoch": 1137} {"train_loss": -40.323699951171875, "global_step": 137628, "epoch": 1137} {"train_loss": -40.799957275390625, "global_step": 137629, "epoch": 1137} {"train_loss": -40.58252716064453, "global_step": 137630, "epoch": 1137} {"train_loss": -40.547340393066406, "global_step": 137631, "epoch": 1137} {"train_loss": -40.50004959106445, "global_step": 137632, "epoch": 1137} {"train_loss": -40.456539154052734, "global_step": 137633, "epoch": 1137} {"train_loss": -39.655818939208984, "global_step": 137634, "epoch": 1137} {"train_loss": -39.66301345825195, "global_step": 137635, "epoch": 1137} {"train_loss": -40.05430221557617, "global_step": 137636, "epoch": 1137} {"train_loss": -40.37297058105469, "global_step": 137637, "epoch": 1137} {"train_loss": -39.441341400146484, "global_step": 137638, "epoch": 1137} {"train_loss": -40.38825225830078, "global_step": 137639, "epoch": 1137} {"train_loss": -37.728607177734375, "global_step": 137640, "epoch": 1137} {"train_loss": -40.16292953491211, "global_step": 137641, "epoch": 1137} {"train_loss": -40.49760818481445, "global_step": 137642, "epoch": 1137} {"train_loss": -40.0368537902832, "global_step": 137643, "epoch": 1137} {"train_loss": -40.833927154541016, "global_step": 137644, "epoch": 1137} {"train_loss": -40.5745735168457, "global_step": 137645, "epoch": 1137} {"train_loss": -41.24085235595703, "global_step": 137646, "epoch": 1137} {"train_loss": -40.88271713256836, "global_step": 137647, "epoch": 1137} {"train_loss": -39.89216232299805, "global_step": 137648, "epoch": 1137} {"train_loss": -39.31814193725586, "global_step": 137649, "epoch": 1137} {"train_loss": -40.52411651611328, "global_step": 137650, "epoch": 1137} {"train_loss": -40.69974899291992, "global_step": 137651, "epoch": 1137} {"train_loss": -40.80248260498047, "global_step": 137652, "epoch": 1137} {"train_loss": -41.0239372253418, "global_step": 137653, "epoch": 1137} {"train_loss": -40.46279525756836, "global_step": 137654, "epoch": 1137} {"train_loss": -39.711181640625, "global_step": 137655, "epoch": 1137} {"train_loss": -40.07168197631836, "global_step": 137656, "epoch": 1137} {"train_loss": -38.937801361083984, "global_step": 137657, "epoch": 1137} {"train_loss": -35.90707015991211, "global_step": 137658, "epoch": 1137} {"train_loss": -38.565799713134766, "global_step": 137659, "epoch": 1137} {"train_loss": -39.75458908081055, "global_step": 137660, "epoch": 1137} {"train_loss": -40.90571975708008, "global_step": 137661, "epoch": 1137} {"train_loss": -38.372249603271484, "global_step": 137662, "epoch": 1137} {"train_loss": -39.43730545043945, "global_step": 137663, "epoch": 1137} {"train_loss": -40.10395812988281, "global_step": 137664, "epoch": 1137} {"train_loss": -40.95253372192383, "global_step": 137665, "epoch": 1137} {"train_loss": -41.03738784790039, "global_step": 137666, "epoch": 1137} {"train_loss": -40.86900329589844, "global_step": 137667, "epoch": 1137} {"train_loss": -41.079463958740234, "global_step": 137668, "epoch": 1137} {"train_loss": -41.015228271484375, "global_step": 137669, "epoch": 1137} {"train_loss": -40.749576568603516, "global_step": 137670, "epoch": 1137} {"train_loss": -41.25876998901367, "global_step": 137671, "epoch": 1137} {"train_loss": -41.209869384765625, "global_step": 137672, "epoch": 1137} {"train_loss": -41.35600662231445, "global_step": 137673, "epoch": 1137} {"train_loss": -40.68244552612305, "global_step": 137674, "epoch": 1137} {"train_loss": -40.42868423461914, "global_step": 137675, "epoch": 1137} {"train_loss": -41.19782638549805, "global_step": 137676, "epoch": 1137} {"train_loss": -41.00372314453125, "global_step": 137677, "epoch": 1137} {"train_loss": -39.923492431640625, "global_step": 137678, "epoch": 1137} {"train_loss": -38.575984954833984, "global_step": 137679, "epoch": 1137} {"train_loss": -38.00310516357422, "global_step": 137680, "epoch": 1137} {"train_loss": -36.007137298583984, "global_step": 137681, "epoch": 1137} {"train_loss": -33.738800048828125, "global_step": 137682, "epoch": 1137} {"train_loss": -38.778690338134766, "global_step": 137683, "epoch": 1137} {"train_loss": -38.65937423706055, "global_step": 137684, "epoch": 1137} {"train_loss": -36.61830520629883, "global_step": 137685, "epoch": 1137} {"train_loss": -38.05009078979492, "global_step": 137686, "epoch": 1137} {"train_loss": -39.80757522583008, "global_step": 137687, "epoch": 1137} {"train_loss": -36.07513427734375, "global_step": 137688, "epoch": 1137} {"train_loss": -37.759971618652344, "global_step": 137689, "epoch": 1137} {"train_loss": -39.7142448425293, "global_step": 137690, "epoch": 1137} {"train_loss": -35.479305267333984, "global_step": 137691, "epoch": 1137} {"train_loss": -38.95513153076172, "global_step": 137692, "epoch": 1137} {"train_loss": -33.8670768737793, "global_step": 137693, "epoch": 1137} {"train_loss": -38.266658782958984, "global_step": 137694, "epoch": 1137} {"train_loss": -36.23466873168945, "global_step": 137695, "epoch": 1137} {"train_loss": -37.27540969848633, "global_step": 137696, "epoch": 1137} {"train_loss": -39.56893457460009, "global_step": 137697, "epoch": 1137, "val_loss": 2635279.0} {"train_loss": -37.7381591796875, "global_step": 137698, "epoch": 1138} {"train_loss": -36.776885986328125, "global_step": 137699, "epoch": 1138} {"train_loss": -38.5359001159668, "global_step": 137700, "epoch": 1138} {"train_loss": -39.129886627197266, "global_step": 137701, "epoch": 1138} {"train_loss": -37.47748947143555, "global_step": 137702, "epoch": 1138} {"train_loss": -38.680423736572266, "global_step": 137703, "epoch": 1138} {"train_loss": -39.9071044921875, "global_step": 137704, "epoch": 1138} {"train_loss": -38.27014923095703, "global_step": 137705, "epoch": 1138} {"train_loss": -39.192623138427734, "global_step": 137706, "epoch": 1138} {"train_loss": -39.20140075683594, "global_step": 137707, "epoch": 1138} {"train_loss": -39.51631546020508, "global_step": 137708, "epoch": 1138} {"train_loss": -39.00556564331055, "global_step": 137709, "epoch": 1138} {"train_loss": -40.066986083984375, "global_step": 137710, "epoch": 1138} {"train_loss": -38.595802307128906, "global_step": 137711, "epoch": 1138} {"train_loss": -39.90515899658203, "global_step": 137712, "epoch": 1138} {"train_loss": -39.87394332885742, "global_step": 137713, "epoch": 1138} {"train_loss": -39.84808349609375, "global_step": 137714, "epoch": 1138} {"train_loss": -39.781410217285156, "global_step": 137715, "epoch": 1138} {"train_loss": -40.26951217651367, "global_step": 137716, "epoch": 1138} {"train_loss": -39.79517364501953, "global_step": 137717, "epoch": 1138} {"train_loss": -38.46297073364258, "global_step": 137718, "epoch": 1138} {"train_loss": -39.974853515625, "global_step": 137719, "epoch": 1138} {"train_loss": -40.72726058959961, "global_step": 137720, "epoch": 1138} {"train_loss": -39.40220260620117, "global_step": 137721, "epoch": 1138} {"train_loss": -39.87125015258789, "global_step": 137722, "epoch": 1138} {"train_loss": -40.52116012573242, "global_step": 137723, "epoch": 1138} {"train_loss": -40.88648223876953, "global_step": 137724, "epoch": 1138} {"train_loss": -39.505855560302734, "global_step": 137725, "epoch": 1138} {"train_loss": -39.72732925415039, "global_step": 137726, "epoch": 1138} {"train_loss": -40.37028121948242, "global_step": 137727, "epoch": 1138} {"train_loss": -40.22788619995117, "global_step": 137728, "epoch": 1138} {"train_loss": -40.7180290222168, "global_step": 137729, "epoch": 1138} {"train_loss": -39.68397903442383, "global_step": 137730, "epoch": 1138} {"train_loss": -40.23067855834961, "global_step": 137731, "epoch": 1138} {"train_loss": -40.5168571472168, "global_step": 137732, "epoch": 1138} {"train_loss": -40.808837890625, "global_step": 137733, "epoch": 1138} {"train_loss": -40.52838897705078, "global_step": 137734, "epoch": 1138} {"train_loss": -40.23134994506836, "global_step": 137735, "epoch": 1138} {"train_loss": -40.783287048339844, "global_step": 137736, "epoch": 1138} {"train_loss": -41.0203742980957, "global_step": 137737, "epoch": 1138} {"train_loss": -40.245582580566406, "global_step": 137738, "epoch": 1138} {"train_loss": -40.5853385925293, "global_step": 137739, "epoch": 1138} {"train_loss": -40.03607940673828, "global_step": 137740, "epoch": 1138} {"train_loss": -39.7021369934082, "global_step": 137741, "epoch": 1138} {"train_loss": -39.451866149902344, "global_step": 137742, "epoch": 1138} {"train_loss": -38.88371658325195, "global_step": 137743, "epoch": 1138} {"train_loss": -39.70463943481445, "global_step": 137744, "epoch": 1138} {"train_loss": -40.52640914916992, "global_step": 137745, "epoch": 1138} {"train_loss": -40.14830017089844, "global_step": 137746, "epoch": 1138} {"train_loss": -39.81533432006836, "global_step": 137747, "epoch": 1138} {"train_loss": -39.04799270629883, "global_step": 137748, "epoch": 1138} {"train_loss": -39.24592208862305, "global_step": 137749, "epoch": 1138} {"train_loss": -40.04825973510742, "global_step": 137750, "epoch": 1138} {"train_loss": -39.962337493896484, "global_step": 137751, "epoch": 1138} {"train_loss": -40.23709487915039, "global_step": 137752, "epoch": 1138} {"train_loss": -39.072113037109375, "global_step": 137753, "epoch": 1138} {"train_loss": -38.45198440551758, "global_step": 137754, "epoch": 1138} {"train_loss": -40.10408020019531, "global_step": 137755, "epoch": 1138} {"train_loss": -40.89442825317383, "global_step": 137756, "epoch": 1138} {"train_loss": -40.79689025878906, "global_step": 137757, "epoch": 1138} {"train_loss": -39.626800537109375, "global_step": 137758, "epoch": 1138} {"train_loss": -39.498687744140625, "global_step": 137759, "epoch": 1138} {"train_loss": -40.823890686035156, "global_step": 137760, "epoch": 1138} {"train_loss": -40.93571090698242, "global_step": 137761, "epoch": 1138} {"train_loss": -39.830867767333984, "global_step": 137762, "epoch": 1138} {"train_loss": -38.3345947265625, "global_step": 137763, "epoch": 1138} {"train_loss": -37.590450286865234, "global_step": 137764, "epoch": 1138} {"train_loss": -40.72520065307617, "global_step": 137765, "epoch": 1138} {"train_loss": -38.79526138305664, "global_step": 137766, "epoch": 1138} {"train_loss": -39.47389602661133, "global_step": 137767, "epoch": 1138} {"train_loss": -39.12664794921875, "global_step": 137768, "epoch": 1138} {"train_loss": -38.043697357177734, "global_step": 137769, "epoch": 1138} {"train_loss": -36.60890579223633, "global_step": 137770, "epoch": 1138} {"train_loss": -39.529869079589844, "global_step": 137771, "epoch": 1138} {"train_loss": -39.26969528198242, "global_step": 137772, "epoch": 1138} {"train_loss": -36.157649993896484, "global_step": 137773, "epoch": 1138} {"train_loss": -39.503204345703125, "global_step": 137774, "epoch": 1138} {"train_loss": -39.0702018737793, "global_step": 137775, "epoch": 1138} {"train_loss": -37.216224670410156, "global_step": 137776, "epoch": 1138} {"train_loss": -37.79006576538086, "global_step": 137777, "epoch": 1138} {"train_loss": -37.598846435546875, "global_step": 137778, "epoch": 1138} {"train_loss": -39.449832916259766, "global_step": 137779, "epoch": 1138} {"train_loss": -39.637062072753906, "global_step": 137780, "epoch": 1138} {"train_loss": -38.351417541503906, "global_step": 137781, "epoch": 1138} {"train_loss": -37.883060455322266, "global_step": 137782, "epoch": 1138} {"train_loss": -40.37958526611328, "global_step": 137783, "epoch": 1138} {"train_loss": -39.503360748291016, "global_step": 137784, "epoch": 1138} {"train_loss": -39.97062301635742, "global_step": 137785, "epoch": 1138} {"train_loss": -39.39754104614258, "global_step": 137786, "epoch": 1138} {"train_loss": -40.232852935791016, "global_step": 137787, "epoch": 1138} {"train_loss": -39.75490951538086, "global_step": 137788, "epoch": 1138} {"train_loss": -39.020870208740234, "global_step": 137789, "epoch": 1138} {"train_loss": -39.60588455200195, "global_step": 137790, "epoch": 1138} {"train_loss": -39.66138458251953, "global_step": 137791, "epoch": 1138} {"train_loss": -39.977447509765625, "global_step": 137792, "epoch": 1138} {"train_loss": -39.97020721435547, "global_step": 137793, "epoch": 1138} {"train_loss": -40.00083541870117, "global_step": 137794, "epoch": 1138} {"train_loss": -40.10859298706055, "global_step": 137795, "epoch": 1138} {"train_loss": -39.36445999145508, "global_step": 137796, "epoch": 1138} {"train_loss": -39.95271301269531, "global_step": 137797, "epoch": 1138} {"train_loss": -39.917701721191406, "global_step": 137798, "epoch": 1138} {"train_loss": -39.704742431640625, "global_step": 137799, "epoch": 1138} {"train_loss": -39.70521926879883, "global_step": 137800, "epoch": 1138} {"train_loss": -39.91826629638672, "global_step": 137801, "epoch": 1138} {"train_loss": -40.68107986450195, "global_step": 137802, "epoch": 1138} {"train_loss": -40.369083404541016, "global_step": 137803, "epoch": 1138} {"train_loss": -41.01333236694336, "global_step": 137804, "epoch": 1138} {"train_loss": -40.428977966308594, "global_step": 137805, "epoch": 1138} {"train_loss": -41.05866622924805, "global_step": 137806, "epoch": 1138} {"train_loss": -40.613616943359375, "global_step": 137807, "epoch": 1138} {"train_loss": -41.17085647583008, "global_step": 137808, "epoch": 1138} {"train_loss": -40.76766586303711, "global_step": 137809, "epoch": 1138} {"train_loss": -40.53007507324219, "global_step": 137810, "epoch": 1138} {"train_loss": -41.277523040771484, "global_step": 137811, "epoch": 1138} {"train_loss": -40.80558395385742, "global_step": 137812, "epoch": 1138} {"train_loss": -40.98249435424805, "global_step": 137813, "epoch": 1138} {"train_loss": -40.9911994934082, "global_step": 137814, "epoch": 1138} {"train_loss": -41.33726119995117, "global_step": 137815, "epoch": 1138} {"train_loss": -40.99172592163086, "global_step": 137816, "epoch": 1138} {"train_loss": -40.604820251464844, "global_step": 137817, "epoch": 1138} {"train_loss": -39.70263303015843, "global_step": 137818, "epoch": 1138, "val_loss": 2664150.75} {"train_loss": -41.23923873901367, "global_step": 137819, "epoch": 1139} {"train_loss": -41.51220703125, "global_step": 137820, "epoch": 1139} {"train_loss": -40.89287567138672, "global_step": 137821, "epoch": 1139} {"train_loss": -41.116004943847656, "global_step": 137822, "epoch": 1139} {"train_loss": -41.10771942138672, "global_step": 137823, "epoch": 1139} {"train_loss": -41.38484573364258, "global_step": 137824, "epoch": 1139} {"train_loss": -40.83420181274414, "global_step": 137825, "epoch": 1139} {"train_loss": -40.704830169677734, "global_step": 137826, "epoch": 1139} {"train_loss": -40.7369270324707, "global_step": 137827, "epoch": 1139} {"train_loss": -40.175628662109375, "global_step": 137828, "epoch": 1139} {"train_loss": -40.40253448486328, "global_step": 137829, "epoch": 1139} {"train_loss": -41.13669967651367, "global_step": 137830, "epoch": 1139} {"train_loss": -40.16770553588867, "global_step": 137831, "epoch": 1139} {"train_loss": -40.10487747192383, "global_step": 137832, "epoch": 1139} {"train_loss": -40.93772888183594, "global_step": 137833, "epoch": 1139} {"train_loss": -40.33086395263672, "global_step": 137834, "epoch": 1139} {"train_loss": -40.457984924316406, "global_step": 137835, "epoch": 1139} {"train_loss": -39.81983184814453, "global_step": 137836, "epoch": 1139} {"train_loss": -40.122554779052734, "global_step": 137837, "epoch": 1139} {"train_loss": -40.232147216796875, "global_step": 137838, "epoch": 1139} {"train_loss": -40.646121978759766, "global_step": 137839, "epoch": 1139} {"train_loss": -41.23492431640625, "global_step": 137840, "epoch": 1139} {"train_loss": -40.34343338012695, "global_step": 137841, "epoch": 1139} {"train_loss": -41.00810241699219, "global_step": 137842, "epoch": 1139} {"train_loss": -41.067176818847656, "global_step": 137843, "epoch": 1139} {"train_loss": -40.986995697021484, "global_step": 137844, "epoch": 1139} {"train_loss": -41.219886779785156, "global_step": 137845, "epoch": 1139} {"train_loss": -40.442256927490234, "global_step": 137846, "epoch": 1139} {"train_loss": -39.8286247253418, "global_step": 137847, "epoch": 1139} {"train_loss": -38.58750534057617, "global_step": 137848, "epoch": 1139} {"train_loss": -39.12284469604492, "global_step": 137849, "epoch": 1139} {"train_loss": -39.4596061706543, "global_step": 137850, "epoch": 1139} {"train_loss": -40.2979736328125, "global_step": 137851, "epoch": 1139} {"train_loss": -41.1874885559082, "global_step": 137852, "epoch": 1139} {"train_loss": -40.44488525390625, "global_step": 137853, "epoch": 1139} {"train_loss": -40.41527557373047, "global_step": 137854, "epoch": 1139} {"train_loss": -40.31771469116211, "global_step": 137855, "epoch": 1139} {"train_loss": -40.12970733642578, "global_step": 137856, "epoch": 1139} {"train_loss": -39.84280776977539, "global_step": 137857, "epoch": 1139} {"train_loss": -39.264129638671875, "global_step": 137858, "epoch": 1139} {"train_loss": -39.49581527709961, "global_step": 137859, "epoch": 1139} {"train_loss": -40.12852096557617, "global_step": 137860, "epoch": 1139} {"train_loss": -39.53922653198242, "global_step": 137861, "epoch": 1139} {"train_loss": -40.02387619018555, "global_step": 137862, "epoch": 1139} {"train_loss": -40.778594970703125, "global_step": 137863, "epoch": 1139} {"train_loss": -39.518123626708984, "global_step": 137864, "epoch": 1139} {"train_loss": -37.26310348510742, "global_step": 137865, "epoch": 1139} {"train_loss": -36.757991790771484, "global_step": 137866, "epoch": 1139} {"train_loss": -40.571922302246094, "global_step": 137867, "epoch": 1139} {"train_loss": -37.13761520385742, "global_step": 137868, "epoch": 1139} {"train_loss": -36.692073822021484, "global_step": 137869, "epoch": 1139} {"train_loss": -40.857086181640625, "global_step": 137870, "epoch": 1139} {"train_loss": -36.2937126159668, "global_step": 137871, "epoch": 1139} {"train_loss": -38.438934326171875, "global_step": 137872, "epoch": 1139} {"train_loss": -40.31230545043945, "global_step": 137873, "epoch": 1139} {"train_loss": -38.33707046508789, "global_step": 137874, "epoch": 1139} {"train_loss": -39.456077575683594, "global_step": 137875, "epoch": 1139} {"train_loss": -39.89884567260742, "global_step": 137876, "epoch": 1139} {"train_loss": -38.86865234375, "global_step": 137877, "epoch": 1139} {"train_loss": -40.068904876708984, "global_step": 137878, "epoch": 1139} {"train_loss": -40.25974655151367, "global_step": 137879, "epoch": 1139} {"train_loss": -40.061805725097656, "global_step": 137880, "epoch": 1139} {"train_loss": -40.634090423583984, "global_step": 137881, "epoch": 1139} {"train_loss": -40.62543869018555, "global_step": 137882, "epoch": 1139} {"train_loss": -40.12226486206055, "global_step": 137883, "epoch": 1139} {"train_loss": -40.942718505859375, "global_step": 137884, "epoch": 1139} {"train_loss": -40.102848052978516, "global_step": 137885, "epoch": 1139} {"train_loss": -40.15732955932617, "global_step": 137886, "epoch": 1139} {"train_loss": -40.96635055541992, "global_step": 137887, "epoch": 1139} {"train_loss": -39.888912200927734, "global_step": 137888, "epoch": 1139} {"train_loss": -40.175811767578125, "global_step": 137889, "epoch": 1139} {"train_loss": -39.43265914916992, "global_step": 137890, "epoch": 1139} {"train_loss": -39.33631896972656, "global_step": 137891, "epoch": 1139} {"train_loss": -40.45970916748047, "global_step": 137892, "epoch": 1139} {"train_loss": -40.37839126586914, "global_step": 137893, "epoch": 1139} {"train_loss": -40.001373291015625, "global_step": 137894, "epoch": 1139} {"train_loss": -39.622005462646484, "global_step": 137895, "epoch": 1139} {"train_loss": -39.02058029174805, "global_step": 137896, "epoch": 1139} {"train_loss": -40.18263626098633, "global_step": 137897, "epoch": 1139} {"train_loss": -40.76189422607422, "global_step": 137898, "epoch": 1139} {"train_loss": -40.26078414916992, "global_step": 137899, "epoch": 1139} {"train_loss": -41.04558181762695, "global_step": 137900, "epoch": 1139} {"train_loss": -40.182308197021484, "global_step": 137901, "epoch": 1139} {"train_loss": -40.6735954284668, "global_step": 137902, "epoch": 1139} {"train_loss": -40.439815521240234, "global_step": 137903, "epoch": 1139} {"train_loss": -40.833709716796875, "global_step": 137904, "epoch": 1139} {"train_loss": -40.788185119628906, "global_step": 137905, "epoch": 1139} {"train_loss": -39.12322998046875, "global_step": 137906, "epoch": 1139} {"train_loss": -40.47111129760742, "global_step": 137907, "epoch": 1139} {"train_loss": -40.75017547607422, "global_step": 137908, "epoch": 1139} {"train_loss": -39.50967788696289, "global_step": 137909, "epoch": 1139} {"train_loss": -38.80292892456055, "global_step": 137910, "epoch": 1139} {"train_loss": -39.87993240356445, "global_step": 137911, "epoch": 1139} {"train_loss": -40.79380416870117, "global_step": 137912, "epoch": 1139} {"train_loss": -40.53763961791992, "global_step": 137913, "epoch": 1139} {"train_loss": -40.480255126953125, "global_step": 137914, "epoch": 1139} {"train_loss": -40.2637825012207, "global_step": 137915, "epoch": 1139} {"train_loss": -40.36798858642578, "global_step": 137916, "epoch": 1139} {"train_loss": -40.242889404296875, "global_step": 137917, "epoch": 1139} {"train_loss": -40.21347427368164, "global_step": 137918, "epoch": 1139} {"train_loss": -39.79301071166992, "global_step": 137919, "epoch": 1139} {"train_loss": -40.94318389892578, "global_step": 137920, "epoch": 1139} {"train_loss": -40.286190032958984, "global_step": 137921, "epoch": 1139} {"train_loss": -40.616939544677734, "global_step": 137922, "epoch": 1139} {"train_loss": -40.805606842041016, "global_step": 137923, "epoch": 1139} {"train_loss": -41.15392303466797, "global_step": 137924, "epoch": 1139} {"train_loss": -40.40894317626953, "global_step": 137925, "epoch": 1139} {"train_loss": -40.7031135559082, "global_step": 137926, "epoch": 1139} {"train_loss": -41.31753158569336, "global_step": 137927, "epoch": 1139} {"train_loss": -41.170677185058594, "global_step": 137928, "epoch": 1139} {"train_loss": -41.0727424621582, "global_step": 137929, "epoch": 1139} {"train_loss": -40.58478927612305, "global_step": 137930, "epoch": 1139} {"train_loss": -39.20085525512695, "global_step": 137931, "epoch": 1139} {"train_loss": -39.7852668762207, "global_step": 137932, "epoch": 1139} {"train_loss": -40.81826400756836, "global_step": 137933, "epoch": 1139} {"train_loss": -39.529903411865234, "global_step": 137934, "epoch": 1139} {"train_loss": -36.30366516113281, "global_step": 137935, "epoch": 1139} {"train_loss": -40.16035842895508, "global_step": 137936, "epoch": 1139} {"train_loss": -34.135868072509766, "global_step": 137937, "epoch": 1139} {"train_loss": -38.987247467041016, "global_step": 137938, "epoch": 1139} {"train_loss": -40.02035497239799, "global_step": 137939, "epoch": 1139, "val_loss": 2690405.25} {"train_loss": -39.3475227355957, "global_step": 137940, "epoch": 1140} {"train_loss": -39.592376708984375, "global_step": 137941, "epoch": 1140} {"train_loss": -37.526397705078125, "global_step": 137942, "epoch": 1140} {"train_loss": -38.748695373535156, "global_step": 137943, "epoch": 1140} {"train_loss": -38.20120620727539, "global_step": 137944, "epoch": 1140} {"train_loss": -36.728755950927734, "global_step": 137945, "epoch": 1140} {"train_loss": -39.26201248168945, "global_step": 137946, "epoch": 1140} {"train_loss": -38.8841667175293, "global_step": 137947, "epoch": 1140} {"train_loss": -38.7436637878418, "global_step": 137948, "epoch": 1140} {"train_loss": -39.165340423583984, "global_step": 137949, "epoch": 1140} {"train_loss": -37.93661117553711, "global_step": 137950, "epoch": 1140} {"train_loss": -38.3009033203125, "global_step": 137951, "epoch": 1140} {"train_loss": -39.5085563659668, "global_step": 137952, "epoch": 1140} {"train_loss": -37.474327087402344, "global_step": 137953, "epoch": 1140} {"train_loss": -38.67963409423828, "global_step": 137954, "epoch": 1140} {"train_loss": -38.51259231567383, "global_step": 137955, "epoch": 1140} {"train_loss": -39.49068069458008, "global_step": 137956, "epoch": 1140} {"train_loss": -38.09652328491211, "global_step": 137957, "epoch": 1140} {"train_loss": -39.39583969116211, "global_step": 137958, "epoch": 1140} {"train_loss": -38.52851486206055, "global_step": 137959, "epoch": 1140} {"train_loss": -38.87834548950195, "global_step": 137960, "epoch": 1140} {"train_loss": -37.50596618652344, "global_step": 137961, "epoch": 1140} {"train_loss": -38.7310676574707, "global_step": 137962, "epoch": 1140} {"train_loss": -37.76496505737305, "global_step": 137963, "epoch": 1140} {"train_loss": -40.20454025268555, "global_step": 137964, "epoch": 1140} {"train_loss": -37.151248931884766, "global_step": 137965, "epoch": 1140} {"train_loss": -40.07667922973633, "global_step": 137966, "epoch": 1140} {"train_loss": -37.94655227661133, "global_step": 137967, "epoch": 1140} {"train_loss": -37.939208984375, "global_step": 137968, "epoch": 1140} {"train_loss": -40.00484848022461, "global_step": 137969, "epoch": 1140} {"train_loss": -38.3267707824707, "global_step": 137970, "epoch": 1140} {"train_loss": -39.78212356567383, "global_step": 137971, "epoch": 1140} {"train_loss": -39.23099899291992, "global_step": 137972, "epoch": 1140} {"train_loss": -38.47892379760742, "global_step": 137973, "epoch": 1140} {"train_loss": -40.28020095825195, "global_step": 137974, "epoch": 1140} {"train_loss": -38.629295349121094, "global_step": 137975, "epoch": 1140} {"train_loss": -39.96923828125, "global_step": 137976, "epoch": 1140} {"train_loss": -39.52044677734375, "global_step": 137977, "epoch": 1140} {"train_loss": -39.106849670410156, "global_step": 137978, "epoch": 1140} {"train_loss": -40.25439453125, "global_step": 137979, "epoch": 1140} {"train_loss": -40.17165756225586, "global_step": 137980, "epoch": 1140} {"train_loss": -40.123695373535156, "global_step": 137981, "epoch": 1140} {"train_loss": -39.55205154418945, "global_step": 137982, "epoch": 1140} {"train_loss": -39.664608001708984, "global_step": 137983, "epoch": 1140} {"train_loss": -40.17436218261719, "global_step": 137984, "epoch": 1140} {"train_loss": -39.8296012878418, "global_step": 137985, "epoch": 1140} {"train_loss": -38.41135787963867, "global_step": 137986, "epoch": 1140} {"train_loss": -40.12652587890625, "global_step": 137987, "epoch": 1140} {"train_loss": -39.625511169433594, "global_step": 137988, "epoch": 1140} {"train_loss": -39.455543518066406, "global_step": 137989, "epoch": 1140} {"train_loss": -39.48584747314453, "global_step": 137990, "epoch": 1140} {"train_loss": -39.35774612426758, "global_step": 137991, "epoch": 1140} {"train_loss": -39.97577667236328, "global_step": 137992, "epoch": 1140} {"train_loss": -40.15474319458008, "global_step": 137993, "epoch": 1140} {"train_loss": -38.92509078979492, "global_step": 137994, "epoch": 1140} {"train_loss": -40.505977630615234, "global_step": 137995, "epoch": 1140} {"train_loss": -40.092681884765625, "global_step": 137996, "epoch": 1140} {"train_loss": -40.20562744140625, "global_step": 137997, "epoch": 1140} {"train_loss": -40.06837844848633, "global_step": 137998, "epoch": 1140} {"train_loss": -40.139644622802734, "global_step": 137999, "epoch": 1140} {"train_loss": -39.2830924987793, "global_step": 138000, "epoch": 1140} {"train_loss": -40.471946716308594, "global_step": 138001, "epoch": 1140} {"train_loss": -40.13566207885742, "global_step": 138002, "epoch": 1140} {"train_loss": -40.148094177246094, "global_step": 138003, "epoch": 1140} {"train_loss": -39.91034698486328, "global_step": 138004, "epoch": 1140} {"train_loss": -40.114803314208984, "global_step": 138005, "epoch": 1140} {"train_loss": -40.80127716064453, "global_step": 138006, "epoch": 1140} {"train_loss": -39.87795639038086, "global_step": 138007, "epoch": 1140} {"train_loss": -40.914669036865234, "global_step": 138008, "epoch": 1140} {"train_loss": -40.97181701660156, "global_step": 138009, "epoch": 1140} {"train_loss": -40.900203704833984, "global_step": 138010, "epoch": 1140} {"train_loss": -40.57402420043945, "global_step": 138011, "epoch": 1140} {"train_loss": -40.81201934814453, "global_step": 138012, "epoch": 1140} {"train_loss": -40.834930419921875, "global_step": 138013, "epoch": 1140} {"train_loss": -40.59150695800781, "global_step": 138014, "epoch": 1140} {"train_loss": -40.84716033935547, "global_step": 138015, "epoch": 1140} {"train_loss": -40.911468505859375, "global_step": 138016, "epoch": 1140} {"train_loss": -40.87191390991211, "global_step": 138017, "epoch": 1140} {"train_loss": -41.13263702392578, "global_step": 138018, "epoch": 1140} {"train_loss": -41.166481018066406, "global_step": 138019, "epoch": 1140} {"train_loss": -40.857704162597656, "global_step": 138020, "epoch": 1140} {"train_loss": -40.953365325927734, "global_step": 138021, "epoch": 1140} {"train_loss": -40.847869873046875, "global_step": 138022, "epoch": 1140} {"train_loss": -39.879817962646484, "global_step": 138023, "epoch": 1140} {"train_loss": -40.960968017578125, "global_step": 138024, "epoch": 1140} {"train_loss": -41.237953186035156, "global_step": 138025, "epoch": 1140} {"train_loss": -40.705623626708984, "global_step": 138026, "epoch": 1140} {"train_loss": -38.5651741027832, "global_step": 138027, "epoch": 1140} {"train_loss": -39.574432373046875, "global_step": 138028, "epoch": 1140} {"train_loss": -41.327972412109375, "global_step": 138029, "epoch": 1140} {"train_loss": -40.50202178955078, "global_step": 138030, "epoch": 1140} {"train_loss": -39.8737907409668, "global_step": 138031, "epoch": 1140} {"train_loss": -39.66636276245117, "global_step": 138032, "epoch": 1140} {"train_loss": -41.15589904785156, "global_step": 138033, "epoch": 1140} {"train_loss": -40.69270706176758, "global_step": 138034, "epoch": 1140} {"train_loss": -40.574928283691406, "global_step": 138035, "epoch": 1140} {"train_loss": -40.33839797973633, "global_step": 138036, "epoch": 1140} {"train_loss": -40.15495681762695, "global_step": 138037, "epoch": 1140} {"train_loss": -40.87961959838867, "global_step": 138038, "epoch": 1140} {"train_loss": -40.744842529296875, "global_step": 138039, "epoch": 1140} {"train_loss": -39.97574234008789, "global_step": 138040, "epoch": 1140} {"train_loss": -39.807735443115234, "global_step": 138041, "epoch": 1140} {"train_loss": -40.7094841003418, "global_step": 138042, "epoch": 1140} {"train_loss": -40.727046966552734, "global_step": 138043, "epoch": 1140} {"train_loss": -40.67304992675781, "global_step": 138044, "epoch": 1140} {"train_loss": -39.8017463684082, "global_step": 138045, "epoch": 1140} {"train_loss": -39.653717041015625, "global_step": 138046, "epoch": 1140} {"train_loss": -39.87567138671875, "global_step": 138047, "epoch": 1140} {"train_loss": -40.1837043762207, "global_step": 138048, "epoch": 1140} {"train_loss": -39.64805221557617, "global_step": 138049, "epoch": 1140} {"train_loss": -37.44601058959961, "global_step": 138050, "epoch": 1140} {"train_loss": -38.27150344848633, "global_step": 138051, "epoch": 1140} {"train_loss": -36.91209030151367, "global_step": 138052, "epoch": 1140} {"train_loss": -36.7286262512207, "global_step": 138053, "epoch": 1140} {"train_loss": -40.206024169921875, "global_step": 138054, "epoch": 1140} {"train_loss": -36.907257080078125, "global_step": 138055, "epoch": 1140} {"train_loss": -40.29757308959961, "global_step": 138056, "epoch": 1140} {"train_loss": -37.80252456665039, "global_step": 138057, "epoch": 1140} {"train_loss": -36.570411682128906, "global_step": 138058, "epoch": 1140} {"train_loss": -39.10472106933594, "global_step": 138059, "epoch": 1140} {"train_loss": -39.56916947798295, "global_step": 138060, "epoch": 1140, "val_loss": 2636879.75} {"train_loss": -38.204524993896484, "global_step": 138061, "epoch": 1141} {"train_loss": -37.94416427612305, "global_step": 138062, "epoch": 1141} {"train_loss": -38.76834487915039, "global_step": 138063, "epoch": 1141} {"train_loss": -37.42265319824219, "global_step": 138064, "epoch": 1141} {"train_loss": -39.05168914794922, "global_step": 138065, "epoch": 1141} {"train_loss": -37.85008239746094, "global_step": 138066, "epoch": 1141} {"train_loss": -39.73210906982422, "global_step": 138067, "epoch": 1141} {"train_loss": -38.26093673706055, "global_step": 138068, "epoch": 1141} {"train_loss": -38.30653762817383, "global_step": 138069, "epoch": 1141} {"train_loss": -39.53112030029297, "global_step": 138070, "epoch": 1141} {"train_loss": -37.840206146240234, "global_step": 138071, "epoch": 1141} {"train_loss": -40.30156707763672, "global_step": 138072, "epoch": 1141} {"train_loss": -39.45587158203125, "global_step": 138073, "epoch": 1141} {"train_loss": -38.793701171875, "global_step": 138074, "epoch": 1141} {"train_loss": -40.65739059448242, "global_step": 138075, "epoch": 1141} {"train_loss": -39.10868835449219, "global_step": 138076, "epoch": 1141} {"train_loss": -39.14862823486328, "global_step": 138077, "epoch": 1141} {"train_loss": -39.540340423583984, "global_step": 138078, "epoch": 1141} {"train_loss": -40.20689392089844, "global_step": 138079, "epoch": 1141} {"train_loss": -38.21612548828125, "global_step": 138080, "epoch": 1141} {"train_loss": -40.451900482177734, "global_step": 138081, "epoch": 1141} {"train_loss": -38.78834915161133, "global_step": 138082, "epoch": 1141} {"train_loss": -39.17623519897461, "global_step": 138083, "epoch": 1141} {"train_loss": -39.923667907714844, "global_step": 138084, "epoch": 1141} {"train_loss": -39.869117736816406, "global_step": 138085, "epoch": 1141} {"train_loss": -39.751869201660156, "global_step": 138086, "epoch": 1141} {"train_loss": -38.58256149291992, "global_step": 138087, "epoch": 1141} {"train_loss": -40.005577087402344, "global_step": 138088, "epoch": 1141} {"train_loss": -40.26179504394531, "global_step": 138089, "epoch": 1141} {"train_loss": -38.4600715637207, "global_step": 138090, "epoch": 1141} {"train_loss": -39.90312576293945, "global_step": 138091, "epoch": 1141} {"train_loss": -40.44861602783203, "global_step": 138092, "epoch": 1141} {"train_loss": -40.228797912597656, "global_step": 138093, "epoch": 1141} {"train_loss": -40.08848190307617, "global_step": 138094, "epoch": 1141} {"train_loss": -40.566436767578125, "global_step": 138095, "epoch": 1141} {"train_loss": -40.75596237182617, "global_step": 138096, "epoch": 1141} {"train_loss": -40.73060607910156, "global_step": 138097, "epoch": 1141} {"train_loss": -40.791236877441406, "global_step": 138098, "epoch": 1141} {"train_loss": -41.1861686706543, "global_step": 138099, "epoch": 1141} {"train_loss": -41.11349105834961, "global_step": 138100, "epoch": 1141} {"train_loss": -40.93314743041992, "global_step": 138101, "epoch": 1141} {"train_loss": -41.1345329284668, "global_step": 138102, "epoch": 1141} {"train_loss": -40.80543899536133, "global_step": 138103, "epoch": 1141} {"train_loss": -41.42069625854492, "global_step": 138104, "epoch": 1141} {"train_loss": -40.90777587890625, "global_step": 138105, "epoch": 1141} {"train_loss": -40.318267822265625, "global_step": 138106, "epoch": 1141} {"train_loss": -40.306636810302734, "global_step": 138107, "epoch": 1141} {"train_loss": -40.76141357421875, "global_step": 138108, "epoch": 1141} {"train_loss": -41.05393600463867, "global_step": 138109, "epoch": 1141} {"train_loss": -40.12900161743164, "global_step": 138110, "epoch": 1141} {"train_loss": -39.447139739990234, "global_step": 138111, "epoch": 1141} {"train_loss": -38.05949783325195, "global_step": 138112, "epoch": 1141} {"train_loss": -39.874080657958984, "global_step": 138113, "epoch": 1141} {"train_loss": -40.940738677978516, "global_step": 138114, "epoch": 1141} {"train_loss": -39.38763427734375, "global_step": 138115, "epoch": 1141} {"train_loss": -36.23945999145508, "global_step": 138116, "epoch": 1141} {"train_loss": -40.982879638671875, "global_step": 138117, "epoch": 1141} {"train_loss": -39.39652633666992, "global_step": 138118, "epoch": 1141} {"train_loss": -36.918643951416016, "global_step": 138119, "epoch": 1141} {"train_loss": -40.25482177734375, "global_step": 138120, "epoch": 1141} {"train_loss": -39.240196228027344, "global_step": 138121, "epoch": 1141} {"train_loss": -37.56870651245117, "global_step": 138122, "epoch": 1141} {"train_loss": -40.269344329833984, "global_step": 138123, "epoch": 1141} {"train_loss": -37.59104537963867, "global_step": 138124, "epoch": 1141} {"train_loss": -39.88715362548828, "global_step": 138125, "epoch": 1141} {"train_loss": -35.69017791748047, "global_step": 138126, "epoch": 1141} {"train_loss": -38.06825637817383, "global_step": 138127, "epoch": 1141} {"train_loss": -33.09212875366211, "global_step": 138128, "epoch": 1141} {"train_loss": -40.12385559082031, "global_step": 138129, "epoch": 1141} {"train_loss": -33.22282409667969, "global_step": 138130, "epoch": 1141} {"train_loss": -39.277259826660156, "global_step": 138131, "epoch": 1141} {"train_loss": -36.820491790771484, "global_step": 138132, "epoch": 1141} {"train_loss": -39.318782806396484, "global_step": 138133, "epoch": 1141} {"train_loss": -38.888832092285156, "global_step": 138134, "epoch": 1141} {"train_loss": -39.75861740112305, "global_step": 138135, "epoch": 1141} {"train_loss": -38.93994903564453, "global_step": 138136, "epoch": 1141} {"train_loss": -40.00651931762695, "global_step": 138137, "epoch": 1141} {"train_loss": -39.726661682128906, "global_step": 138138, "epoch": 1141} {"train_loss": -40.48733139038086, "global_step": 138139, "epoch": 1141} {"train_loss": -39.51021957397461, "global_step": 138140, "epoch": 1141} {"train_loss": -40.56769943237305, "global_step": 138141, "epoch": 1141} {"train_loss": -40.05471420288086, "global_step": 138142, "epoch": 1141} {"train_loss": -40.22818374633789, "global_step": 138143, "epoch": 1141} {"train_loss": -40.41218948364258, "global_step": 138144, "epoch": 1141} {"train_loss": -39.704647064208984, "global_step": 138145, "epoch": 1141} {"train_loss": -40.7820930480957, "global_step": 138146, "epoch": 1141} {"train_loss": -40.0330810546875, "global_step": 138147, "epoch": 1141} {"train_loss": -39.963043212890625, "global_step": 138148, "epoch": 1141} {"train_loss": -40.054134368896484, "global_step": 138149, "epoch": 1141} {"train_loss": -40.257259368896484, "global_step": 138150, "epoch": 1141} {"train_loss": -40.5901985168457, "global_step": 138151, "epoch": 1141} {"train_loss": -40.20228958129883, "global_step": 138152, "epoch": 1141} {"train_loss": -40.7081413269043, "global_step": 138153, "epoch": 1141} {"train_loss": -40.36479568481445, "global_step": 138154, "epoch": 1141} {"train_loss": -40.425777435302734, "global_step": 138155, "epoch": 1141} {"train_loss": -40.913848876953125, "global_step": 138156, "epoch": 1141} {"train_loss": -40.31917190551758, "global_step": 138157, "epoch": 1141} {"train_loss": -40.9507942199707, "global_step": 138158, "epoch": 1141} {"train_loss": -40.7885627746582, "global_step": 138159, "epoch": 1141} {"train_loss": -40.72709274291992, "global_step": 138160, "epoch": 1141} {"train_loss": -40.5562858581543, "global_step": 138161, "epoch": 1141} {"train_loss": -40.8621940612793, "global_step": 138162, "epoch": 1141} {"train_loss": -40.66169357299805, "global_step": 138163, "epoch": 1141} {"train_loss": -41.05767822265625, "global_step": 138164, "epoch": 1141} {"train_loss": -40.45869827270508, "global_step": 138165, "epoch": 1141} {"train_loss": -40.3416633605957, "global_step": 138166, "epoch": 1141} {"train_loss": -38.4135627746582, "global_step": 138167, "epoch": 1141} {"train_loss": -33.2949333190918, "global_step": 138168, "epoch": 1141} {"train_loss": -28.563522338867188, "global_step": 138169, "epoch": 1141} {"train_loss": -27.803497314453125, "global_step": 138170, "epoch": 1141} {"train_loss": -37.54495620727539, "global_step": 138171, "epoch": 1141} {"train_loss": -39.295387268066406, "global_step": 138172, "epoch": 1141} {"train_loss": -31.37696647644043, "global_step": 138173, "epoch": 1141} {"train_loss": -39.38871383666992, "global_step": 138174, "epoch": 1141} {"train_loss": -36.36572265625, "global_step": 138175, "epoch": 1141} {"train_loss": -38.051536560058594, "global_step": 138176, "epoch": 1141} {"train_loss": -36.148101806640625, "global_step": 138177, "epoch": 1141} {"train_loss": -39.816497802734375, "global_step": 138178, "epoch": 1141} {"train_loss": -37.169464111328125, "global_step": 138179, "epoch": 1141} {"train_loss": -39.697322845458984, "global_step": 138180, "epoch": 1141} {"train_loss": -39.1537693275893, "global_step": 138181, "epoch": 1141, "val_loss": 2746431.25} {"train_loss": -40.19359588623047, "global_step": 138182, "epoch": 1142} {"train_loss": -37.74165725708008, "global_step": 138183, "epoch": 1142} {"train_loss": -35.27142333984375, "global_step": 138184, "epoch": 1142} {"train_loss": -38.55385971069336, "global_step": 138185, "epoch": 1142} {"train_loss": -40.012306213378906, "global_step": 138186, "epoch": 1142} {"train_loss": -38.980628967285156, "global_step": 138187, "epoch": 1142} {"train_loss": -38.020050048828125, "global_step": 138188, "epoch": 1142} {"train_loss": -39.965450286865234, "global_step": 138189, "epoch": 1142} {"train_loss": -39.35871887207031, "global_step": 138190, "epoch": 1142} {"train_loss": -40.87704086303711, "global_step": 138191, "epoch": 1142} {"train_loss": -39.8678092956543, "global_step": 138192, "epoch": 1142} {"train_loss": -39.98515319824219, "global_step": 138193, "epoch": 1142} {"train_loss": -39.754150390625, "global_step": 138194, "epoch": 1142} {"train_loss": -39.54875183105469, "global_step": 138195, "epoch": 1142} {"train_loss": -40.28092575073242, "global_step": 138196, "epoch": 1142} {"train_loss": -40.64632034301758, "global_step": 138197, "epoch": 1142} {"train_loss": -40.583282470703125, "global_step": 138198, "epoch": 1142} {"train_loss": -40.1936149597168, "global_step": 138199, "epoch": 1142} {"train_loss": -40.53990936279297, "global_step": 138200, "epoch": 1142} {"train_loss": -40.836360931396484, "global_step": 138201, "epoch": 1142} {"train_loss": -40.37794876098633, "global_step": 138202, "epoch": 1142} {"train_loss": -40.427303314208984, "global_step": 138203, "epoch": 1142} {"train_loss": -40.98567581176758, "global_step": 138204, "epoch": 1142} {"train_loss": -40.27771759033203, "global_step": 138205, "epoch": 1142} {"train_loss": -40.813331604003906, "global_step": 138206, "epoch": 1142} {"train_loss": -41.05787658691406, "global_step": 138207, "epoch": 1142} {"train_loss": -40.596343994140625, "global_step": 138208, "epoch": 1142} {"train_loss": -40.906429290771484, "global_step": 138209, "epoch": 1142} {"train_loss": -41.02181625366211, "global_step": 138210, "epoch": 1142} {"train_loss": -40.26057052612305, "global_step": 138211, "epoch": 1142} {"train_loss": -40.9796142578125, "global_step": 138212, "epoch": 1142} {"train_loss": -40.809913635253906, "global_step": 138213, "epoch": 1142} {"train_loss": -40.976810455322266, "global_step": 138214, "epoch": 1142} {"train_loss": -40.528564453125, "global_step": 138215, "epoch": 1142} {"train_loss": -40.72272872924805, "global_step": 138216, "epoch": 1142} {"train_loss": -40.9234733581543, "global_step": 138217, "epoch": 1142} {"train_loss": -41.41810607910156, "global_step": 138218, "epoch": 1142} {"train_loss": -40.570011138916016, "global_step": 138219, "epoch": 1142} {"train_loss": -40.516292572021484, "global_step": 138220, "epoch": 1142} {"train_loss": -41.02372360229492, "global_step": 138221, "epoch": 1142} {"train_loss": -40.9476432800293, "global_step": 138222, "epoch": 1142} {"train_loss": -40.5477294921875, "global_step": 138223, "epoch": 1142} {"train_loss": -40.78766632080078, "global_step": 138224, "epoch": 1142} {"train_loss": -40.38542556762695, "global_step": 138225, "epoch": 1142} {"train_loss": -40.63737106323242, "global_step": 138226, "epoch": 1142} {"train_loss": -40.08989334106445, "global_step": 138227, "epoch": 1142} {"train_loss": -40.56037521362305, "global_step": 138228, "epoch": 1142} {"train_loss": -40.63003921508789, "global_step": 138229, "epoch": 1142} {"train_loss": -40.32163619995117, "global_step": 138230, "epoch": 1142} {"train_loss": -38.82783126831055, "global_step": 138231, "epoch": 1142} {"train_loss": -39.48431396484375, "global_step": 138232, "epoch": 1142} {"train_loss": -40.15865707397461, "global_step": 138233, "epoch": 1142} {"train_loss": -39.808650970458984, "global_step": 138234, "epoch": 1142} {"train_loss": -37.961387634277344, "global_step": 138235, "epoch": 1142} {"train_loss": -37.744319915771484, "global_step": 138236, "epoch": 1142} {"train_loss": -39.983089447021484, "global_step": 138237, "epoch": 1142} {"train_loss": -40.52437973022461, "global_step": 138238, "epoch": 1142} {"train_loss": -38.46299362182617, "global_step": 138239, "epoch": 1142} {"train_loss": -39.0646858215332, "global_step": 138240, "epoch": 1142} {"train_loss": -38.995269775390625, "global_step": 138241, "epoch": 1142} {"train_loss": -37.151512145996094, "global_step": 138242, "epoch": 1142} {"train_loss": -37.00105667114258, "global_step": 138243, "epoch": 1142} {"train_loss": -38.67952346801758, "global_step": 138244, "epoch": 1142} {"train_loss": -40.10414505004883, "global_step": 138245, "epoch": 1142} {"train_loss": -40.87515640258789, "global_step": 138246, "epoch": 1142} {"train_loss": -39.94672393798828, "global_step": 138247, "epoch": 1142} {"train_loss": -38.64908981323242, "global_step": 138248, "epoch": 1142} {"train_loss": -40.421836853027344, "global_step": 138249, "epoch": 1142} {"train_loss": -38.473670959472656, "global_step": 138250, "epoch": 1142} {"train_loss": -39.2458610534668, "global_step": 138251, "epoch": 1142} {"train_loss": -40.05196762084961, "global_step": 138252, "epoch": 1142} {"train_loss": -39.02529525756836, "global_step": 138253, "epoch": 1142} {"train_loss": -38.495574951171875, "global_step": 138254, "epoch": 1142} {"train_loss": -40.00118637084961, "global_step": 138255, "epoch": 1142} {"train_loss": -38.597530364990234, "global_step": 138256, "epoch": 1142} {"train_loss": -39.03104782104492, "global_step": 138257, "epoch": 1142} {"train_loss": -39.00532913208008, "global_step": 138258, "epoch": 1142} {"train_loss": -40.1329231262207, "global_step": 138259, "epoch": 1142} {"train_loss": -39.5890998840332, "global_step": 138260, "epoch": 1142} {"train_loss": -39.28273391723633, "global_step": 138261, "epoch": 1142} {"train_loss": -38.599952697753906, "global_step": 138262, "epoch": 1142} {"train_loss": -39.10081100463867, "global_step": 138263, "epoch": 1142} {"train_loss": -36.595977783203125, "global_step": 138264, "epoch": 1142} {"train_loss": -38.1546516418457, "global_step": 138265, "epoch": 1142} {"train_loss": -39.005550384521484, "global_step": 138266, "epoch": 1142} {"train_loss": -38.88145065307617, "global_step": 138267, "epoch": 1142} {"train_loss": -37.991973876953125, "global_step": 138268, "epoch": 1142} {"train_loss": -38.708656311035156, "global_step": 138269, "epoch": 1142} {"train_loss": -37.409149169921875, "global_step": 138270, "epoch": 1142} {"train_loss": -40.4968376159668, "global_step": 138271, "epoch": 1142} {"train_loss": -38.56451416015625, "global_step": 138272, "epoch": 1142} {"train_loss": -38.8410530090332, "global_step": 138273, "epoch": 1142} {"train_loss": -39.933624267578125, "global_step": 138274, "epoch": 1142} {"train_loss": -39.79029846191406, "global_step": 138275, "epoch": 1142} {"train_loss": -39.830238342285156, "global_step": 138276, "epoch": 1142} {"train_loss": -40.31932067871094, "global_step": 138277, "epoch": 1142} {"train_loss": -39.66367721557617, "global_step": 138278, "epoch": 1142} {"train_loss": -40.23997116088867, "global_step": 138279, "epoch": 1142} {"train_loss": -40.5599365234375, "global_step": 138280, "epoch": 1142} {"train_loss": -40.84638214111328, "global_step": 138281, "epoch": 1142} {"train_loss": -39.90265655517578, "global_step": 138282, "epoch": 1142} {"train_loss": -40.10313034057617, "global_step": 138283, "epoch": 1142} {"train_loss": -41.12696075439453, "global_step": 138284, "epoch": 1142} {"train_loss": -40.26325225830078, "global_step": 138285, "epoch": 1142} {"train_loss": -40.89681625366211, "global_step": 138286, "epoch": 1142} {"train_loss": -40.901947021484375, "global_step": 138287, "epoch": 1142} {"train_loss": -41.076210021972656, "global_step": 138288, "epoch": 1142} {"train_loss": -41.021846771240234, "global_step": 138289, "epoch": 1142} {"train_loss": -41.056060791015625, "global_step": 138290, "epoch": 1142} {"train_loss": -40.65203857421875, "global_step": 138291, "epoch": 1142} {"train_loss": -40.98784637451172, "global_step": 138292, "epoch": 1142} {"train_loss": -41.179405212402344, "global_step": 138293, "epoch": 1142} {"train_loss": -40.87696075439453, "global_step": 138294, "epoch": 1142} {"train_loss": -41.1900634765625, "global_step": 138295, "epoch": 1142} {"train_loss": -41.39253234863281, "global_step": 138296, "epoch": 1142} {"train_loss": -41.326446533203125, "global_step": 138297, "epoch": 1142} {"train_loss": -41.34907150268555, "global_step": 138298, "epoch": 1142} {"train_loss": -41.39288330078125, "global_step": 138299, "epoch": 1142} {"train_loss": -40.880104064941406, "global_step": 138300, "epoch": 1142} {"train_loss": -41.4384880065918, "global_step": 138301, "epoch": 1142} {"train_loss": -39.911932984659494, "global_step": 138302, "epoch": 1142, "val_loss": 2708687.75} {"train_loss": -39.46778106689453, "global_step": 138303, "epoch": 1143} {"train_loss": -39.90203857421875, "global_step": 138304, "epoch": 1143} {"train_loss": -37.540462493896484, "global_step": 138305, "epoch": 1143} {"train_loss": -38.9970588684082, "global_step": 138306, "epoch": 1143} {"train_loss": -40.31150436401367, "global_step": 138307, "epoch": 1143} {"train_loss": -40.20881652832031, "global_step": 138308, "epoch": 1143} {"train_loss": -39.66425704956055, "global_step": 138309, "epoch": 1143} {"train_loss": -40.570526123046875, "global_step": 138310, "epoch": 1143} {"train_loss": -40.53230285644531, "global_step": 138311, "epoch": 1143} {"train_loss": -39.21148681640625, "global_step": 138312, "epoch": 1143} {"train_loss": -40.517818450927734, "global_step": 138313, "epoch": 1143} {"train_loss": -38.557308197021484, "global_step": 138314, "epoch": 1143} {"train_loss": -39.60268783569336, "global_step": 138315, "epoch": 1143} {"train_loss": -41.164241790771484, "global_step": 138316, "epoch": 1143} {"train_loss": -39.74921417236328, "global_step": 138317, "epoch": 1143} {"train_loss": -39.4295654296875, "global_step": 138318, "epoch": 1143} {"train_loss": -39.66056442260742, "global_step": 138319, "epoch": 1143} {"train_loss": -40.44361114501953, "global_step": 138320, "epoch": 1143} {"train_loss": -40.38160705566406, "global_step": 138321, "epoch": 1143} {"train_loss": -40.29389190673828, "global_step": 138322, "epoch": 1143} {"train_loss": -40.33231735229492, "global_step": 138323, "epoch": 1143} {"train_loss": -38.380706787109375, "global_step": 138324, "epoch": 1143} {"train_loss": -40.503883361816406, "global_step": 138325, "epoch": 1143} {"train_loss": -40.44572830200195, "global_step": 138326, "epoch": 1143} {"train_loss": -39.1235466003418, "global_step": 138327, "epoch": 1143} {"train_loss": -39.55009078979492, "global_step": 138328, "epoch": 1143} {"train_loss": -40.106021881103516, "global_step": 138329, "epoch": 1143} {"train_loss": -38.07064437866211, "global_step": 138330, "epoch": 1143} {"train_loss": -39.23012161254883, "global_step": 138331, "epoch": 1143} {"train_loss": -39.67128372192383, "global_step": 138332, "epoch": 1143} {"train_loss": -36.74892044067383, "global_step": 138333, "epoch": 1143} {"train_loss": -39.86054611206055, "global_step": 138334, "epoch": 1143} {"train_loss": -40.31509017944336, "global_step": 138335, "epoch": 1143} {"train_loss": -40.11723709106445, "global_step": 138336, "epoch": 1143} {"train_loss": -38.8606071472168, "global_step": 138337, "epoch": 1143} {"train_loss": -39.38430404663086, "global_step": 138338, "epoch": 1143} {"train_loss": -40.420284271240234, "global_step": 138339, "epoch": 1143} {"train_loss": -38.473114013671875, "global_step": 138340, "epoch": 1143} {"train_loss": -39.57810592651367, "global_step": 138341, "epoch": 1143} {"train_loss": -39.369972229003906, "global_step": 138342, "epoch": 1143} {"train_loss": -40.35771560668945, "global_step": 138343, "epoch": 1143} {"train_loss": -38.88486862182617, "global_step": 138344, "epoch": 1143} {"train_loss": -38.05418014526367, "global_step": 138345, "epoch": 1143} {"train_loss": -40.21973419189453, "global_step": 138346, "epoch": 1143} {"train_loss": -39.630489349365234, "global_step": 138347, "epoch": 1143} {"train_loss": -39.71958541870117, "global_step": 138348, "epoch": 1143} {"train_loss": -40.16804122924805, "global_step": 138349, "epoch": 1143} {"train_loss": -39.671058654785156, "global_step": 138350, "epoch": 1143} {"train_loss": -40.604915618896484, "global_step": 138351, "epoch": 1143} {"train_loss": -39.783172607421875, "global_step": 138352, "epoch": 1143} {"train_loss": -36.80167770385742, "global_step": 138353, "epoch": 1143} {"train_loss": -39.01774978637695, "global_step": 138354, "epoch": 1143} {"train_loss": -39.579654693603516, "global_step": 138355, "epoch": 1143} {"train_loss": -37.32558059692383, "global_step": 138356, "epoch": 1143} {"train_loss": -39.35059356689453, "global_step": 138357, "epoch": 1143} {"train_loss": -39.92599105834961, "global_step": 138358, "epoch": 1143} {"train_loss": -38.522621154785156, "global_step": 138359, "epoch": 1143} {"train_loss": -37.988555908203125, "global_step": 138360, "epoch": 1143} {"train_loss": -40.441871643066406, "global_step": 138361, "epoch": 1143} {"train_loss": -39.1623420715332, "global_step": 138362, "epoch": 1143} {"train_loss": -39.90578079223633, "global_step": 138363, "epoch": 1143} {"train_loss": -39.37425994873047, "global_step": 138364, "epoch": 1143} {"train_loss": -39.97118377685547, "global_step": 138365, "epoch": 1143} {"train_loss": -40.326290130615234, "global_step": 138366, "epoch": 1143} {"train_loss": -40.432125091552734, "global_step": 138367, "epoch": 1143} {"train_loss": -38.67891311645508, "global_step": 138368, "epoch": 1143} {"train_loss": -39.982704162597656, "global_step": 138369, "epoch": 1143} {"train_loss": -40.34379959106445, "global_step": 138370, "epoch": 1143} {"train_loss": -38.030860900878906, "global_step": 138371, "epoch": 1143} {"train_loss": -38.535377502441406, "global_step": 138372, "epoch": 1143} {"train_loss": -39.795101165771484, "global_step": 138373, "epoch": 1143} {"train_loss": -38.870704650878906, "global_step": 138374, "epoch": 1143} {"train_loss": -40.100345611572266, "global_step": 138375, "epoch": 1143} {"train_loss": -36.70172119140625, "global_step": 138376, "epoch": 1143} {"train_loss": -38.792091369628906, "global_step": 138377, "epoch": 1143} {"train_loss": -34.37074661254883, "global_step": 138378, "epoch": 1143} {"train_loss": -38.551063537597656, "global_step": 138379, "epoch": 1143} {"train_loss": -37.200435638427734, "global_step": 138380, "epoch": 1143} {"train_loss": -37.03154373168945, "global_step": 138381, "epoch": 1143} {"train_loss": -38.42219924926758, "global_step": 138382, "epoch": 1143} {"train_loss": -38.12900924682617, "global_step": 138383, "epoch": 1143} {"train_loss": -23.34822654724121, "global_step": 138384, "epoch": 1143} {"train_loss": -38.32036209106445, "global_step": 138385, "epoch": 1143} {"train_loss": -37.84458541870117, "global_step": 138386, "epoch": 1143} {"train_loss": -32.567726135253906, "global_step": 138387, "epoch": 1143} {"train_loss": -37.95648193359375, "global_step": 138388, "epoch": 1143} {"train_loss": -27.10430335998535, "global_step": 138389, "epoch": 1143} {"train_loss": -36.067195892333984, "global_step": 138390, "epoch": 1143} {"train_loss": -34.685462951660156, "global_step": 138391, "epoch": 1143} {"train_loss": -34.92600631713867, "global_step": 138392, "epoch": 1143} {"train_loss": -35.85232162475586, "global_step": 138393, "epoch": 1143} {"train_loss": -36.5234260559082, "global_step": 138394, "epoch": 1143} {"train_loss": -26.074234008789062, "global_step": 138395, "epoch": 1143} {"train_loss": -36.09284973144531, "global_step": 138396, "epoch": 1143} {"train_loss": -35.3265495300293, "global_step": 138397, "epoch": 1143} {"train_loss": -36.16255569458008, "global_step": 138398, "epoch": 1143} {"train_loss": -37.20697784423828, "global_step": 138399, "epoch": 1143} {"train_loss": -37.11249923706055, "global_step": 138400, "epoch": 1143} {"train_loss": -37.65230178833008, "global_step": 138401, "epoch": 1143} {"train_loss": -36.18875503540039, "global_step": 138402, "epoch": 1143} {"train_loss": -35.5587158203125, "global_step": 138403, "epoch": 1143} {"train_loss": -38.338016510009766, "global_step": 138404, "epoch": 1143} {"train_loss": -37.97648239135742, "global_step": 138405, "epoch": 1143} {"train_loss": -37.52175521850586, "global_step": 138406, "epoch": 1143} {"train_loss": -38.605525970458984, "global_step": 138407, "epoch": 1143} {"train_loss": -38.04446029663086, "global_step": 138408, "epoch": 1143} {"train_loss": -38.38594436645508, "global_step": 138409, "epoch": 1143} {"train_loss": -38.34623336791992, "global_step": 138410, "epoch": 1143} {"train_loss": -38.87668991088867, "global_step": 138411, "epoch": 1143} {"train_loss": -37.03681945800781, "global_step": 138412, "epoch": 1143} {"train_loss": -39.45781326293945, "global_step": 138413, "epoch": 1143} {"train_loss": -38.0413703918457, "global_step": 138414, "epoch": 1143} {"train_loss": -38.830379486083984, "global_step": 138415, "epoch": 1143} {"train_loss": -38.726722717285156, "global_step": 138416, "epoch": 1143} {"train_loss": -38.95913314819336, "global_step": 138417, "epoch": 1143} {"train_loss": -38.95649337768555, "global_step": 138418, "epoch": 1143} {"train_loss": -39.11384963989258, "global_step": 138419, "epoch": 1143} {"train_loss": -39.258209228515625, "global_step": 138420, "epoch": 1143} {"train_loss": -38.90888214111328, "global_step": 138421, "epoch": 1143} {"train_loss": -40.02166748046875, "global_step": 138422, "epoch": 1143} {"train_loss": -38.42342023613039, "global_step": 138423, "epoch": 1143, "val_loss": 2545922.25} {"train_loss": -40.15687942504883, "global_step": 138424, "epoch": 1144} {"train_loss": -39.61634826660156, "global_step": 138425, "epoch": 1144} {"train_loss": -39.09607696533203, "global_step": 138426, "epoch": 1144} {"train_loss": -39.97491455078125, "global_step": 138427, "epoch": 1144} {"train_loss": -38.8900260925293, "global_step": 138428, "epoch": 1144} {"train_loss": -38.47945785522461, "global_step": 138429, "epoch": 1144} {"train_loss": -39.206119537353516, "global_step": 138430, "epoch": 1144} {"train_loss": -39.53261184692383, "global_step": 138431, "epoch": 1144} {"train_loss": -39.727420806884766, "global_step": 138432, "epoch": 1144} {"train_loss": -39.815555572509766, "global_step": 138433, "epoch": 1144} {"train_loss": -39.83235168457031, "global_step": 138434, "epoch": 1144} {"train_loss": -39.6323356628418, "global_step": 138435, "epoch": 1144} {"train_loss": -39.70775604248047, "global_step": 138436, "epoch": 1144} {"train_loss": -40.842994689941406, "global_step": 138437, "epoch": 1144} {"train_loss": -40.44630813598633, "global_step": 138438, "epoch": 1144} {"train_loss": -39.396759033203125, "global_step": 138439, "epoch": 1144} {"train_loss": -39.79203414916992, "global_step": 138440, "epoch": 1144} {"train_loss": -40.19928741455078, "global_step": 138441, "epoch": 1144} {"train_loss": -39.358455657958984, "global_step": 138442, "epoch": 1144} {"train_loss": -39.37085723876953, "global_step": 138443, "epoch": 1144} {"train_loss": -39.81409454345703, "global_step": 138444, "epoch": 1144} {"train_loss": -39.91749572753906, "global_step": 138445, "epoch": 1144} {"train_loss": -39.75794219970703, "global_step": 138446, "epoch": 1144} {"train_loss": -39.876739501953125, "global_step": 138447, "epoch": 1144} {"train_loss": -40.649593353271484, "global_step": 138448, "epoch": 1144} {"train_loss": -40.235050201416016, "global_step": 138449, "epoch": 1144} {"train_loss": -39.7313232421875, "global_step": 138450, "epoch": 1144} {"train_loss": -39.60242462158203, "global_step": 138451, "epoch": 1144} {"train_loss": -39.511558532714844, "global_step": 138452, "epoch": 1144} {"train_loss": -39.68376541137695, "global_step": 138453, "epoch": 1144} {"train_loss": -39.97701644897461, "global_step": 138454, "epoch": 1144} {"train_loss": -40.587764739990234, "global_step": 138455, "epoch": 1144} {"train_loss": -40.52631378173828, "global_step": 138456, "epoch": 1144} {"train_loss": -39.9904899597168, "global_step": 138457, "epoch": 1144} {"train_loss": -40.332618713378906, "global_step": 138458, "epoch": 1144} {"train_loss": -40.41756057739258, "global_step": 138459, "epoch": 1144} {"train_loss": -41.09663772583008, "global_step": 138460, "epoch": 1144} {"train_loss": -39.11278533935547, "global_step": 138461, "epoch": 1144} {"train_loss": -40.64085006713867, "global_step": 138462, "epoch": 1144} {"train_loss": -40.38246536254883, "global_step": 138463, "epoch": 1144} {"train_loss": -41.0545539855957, "global_step": 138464, "epoch": 1144} {"train_loss": -40.77276611328125, "global_step": 138465, "epoch": 1144} {"train_loss": -40.94339370727539, "global_step": 138466, "epoch": 1144} {"train_loss": -39.69175338745117, "global_step": 138467, "epoch": 1144} {"train_loss": -38.941749572753906, "global_step": 138468, "epoch": 1144} {"train_loss": -38.255287170410156, "global_step": 138469, "epoch": 1144} {"train_loss": -37.91337966918945, "global_step": 138470, "epoch": 1144} {"train_loss": -39.462257385253906, "global_step": 138471, "epoch": 1144} {"train_loss": -39.441986083984375, "global_step": 138472, "epoch": 1144} {"train_loss": -39.80803298950195, "global_step": 138473, "epoch": 1144} {"train_loss": -39.66188430786133, "global_step": 138474, "epoch": 1144} {"train_loss": -39.77860641479492, "global_step": 138475, "epoch": 1144} {"train_loss": -37.94027328491211, "global_step": 138476, "epoch": 1144} {"train_loss": -38.8191032409668, "global_step": 138477, "epoch": 1144} {"train_loss": -39.72832489013672, "global_step": 138478, "epoch": 1144} {"train_loss": -39.52517318725586, "global_step": 138479, "epoch": 1144} {"train_loss": -40.782310485839844, "global_step": 138480, "epoch": 1144} {"train_loss": -39.961910247802734, "global_step": 138481, "epoch": 1144} {"train_loss": -38.44983673095703, "global_step": 138482, "epoch": 1144} {"train_loss": -38.28792953491211, "global_step": 138483, "epoch": 1144} {"train_loss": -37.92280960083008, "global_step": 138484, "epoch": 1144} {"train_loss": -39.45998764038086, "global_step": 138485, "epoch": 1144} {"train_loss": -39.404170989990234, "global_step": 138486, "epoch": 1144} {"train_loss": -36.482425689697266, "global_step": 138487, "epoch": 1144} {"train_loss": -40.52842330932617, "global_step": 138488, "epoch": 1144} {"train_loss": -38.999549865722656, "global_step": 138489, "epoch": 1144} {"train_loss": -37.50163650512695, "global_step": 138490, "epoch": 1144} {"train_loss": -38.020015716552734, "global_step": 138491, "epoch": 1144} {"train_loss": -39.16447067260742, "global_step": 138492, "epoch": 1144} {"train_loss": -40.22066879272461, "global_step": 138493, "epoch": 1144} {"train_loss": -40.12335968017578, "global_step": 138494, "epoch": 1144} {"train_loss": -38.82209396362305, "global_step": 138495, "epoch": 1144} {"train_loss": -40.03749084472656, "global_step": 138496, "epoch": 1144} {"train_loss": -38.60211944580078, "global_step": 138497, "epoch": 1144} {"train_loss": -38.4292106628418, "global_step": 138498, "epoch": 1144} {"train_loss": -40.07804870605469, "global_step": 138499, "epoch": 1144} {"train_loss": -40.44405746459961, "global_step": 138500, "epoch": 1144} {"train_loss": -37.95311737060547, "global_step": 138501, "epoch": 1144} {"train_loss": -39.764892578125, "global_step": 138502, "epoch": 1144} {"train_loss": -39.05916976928711, "global_step": 138503, "epoch": 1144} {"train_loss": -38.7700309753418, "global_step": 138504, "epoch": 1144} {"train_loss": -40.30764389038086, "global_step": 138505, "epoch": 1144} {"train_loss": -39.21406173706055, "global_step": 138506, "epoch": 1144} {"train_loss": -38.57075119018555, "global_step": 138507, "epoch": 1144} {"train_loss": -40.0446662902832, "global_step": 138508, "epoch": 1144} {"train_loss": -39.38589096069336, "global_step": 138509, "epoch": 1144} {"train_loss": -38.08266067504883, "global_step": 138510, "epoch": 1144} {"train_loss": -38.82192611694336, "global_step": 138511, "epoch": 1144} {"train_loss": -39.931739807128906, "global_step": 138512, "epoch": 1144} {"train_loss": -35.9655647277832, "global_step": 138513, "epoch": 1144} {"train_loss": -40.28229904174805, "global_step": 138514, "epoch": 1144} {"train_loss": -37.50631332397461, "global_step": 138515, "epoch": 1144} {"train_loss": -37.9786491394043, "global_step": 138516, "epoch": 1144} {"train_loss": -39.038021087646484, "global_step": 138517, "epoch": 1144} {"train_loss": -37.92499923706055, "global_step": 138518, "epoch": 1144} {"train_loss": -39.00146484375, "global_step": 138519, "epoch": 1144} {"train_loss": -38.314510345458984, "global_step": 138520, "epoch": 1144} {"train_loss": -39.9938850402832, "global_step": 138521, "epoch": 1144} {"train_loss": -39.17107009887695, "global_step": 138522, "epoch": 1144} {"train_loss": -38.65412139892578, "global_step": 138523, "epoch": 1144} {"train_loss": -39.34971237182617, "global_step": 138524, "epoch": 1144} {"train_loss": -39.10750198364258, "global_step": 138525, "epoch": 1144} {"train_loss": -38.236183166503906, "global_step": 138526, "epoch": 1144} {"train_loss": -39.46173095703125, "global_step": 138527, "epoch": 1144} {"train_loss": -39.04549026489258, "global_step": 138528, "epoch": 1144} {"train_loss": -39.08509826660156, "global_step": 138529, "epoch": 1144} {"train_loss": -38.730194091796875, "global_step": 138530, "epoch": 1144} {"train_loss": -39.77800369262695, "global_step": 138531, "epoch": 1144} {"train_loss": -38.91572189331055, "global_step": 138532, "epoch": 1144} {"train_loss": -38.36785888671875, "global_step": 138533, "epoch": 1144} {"train_loss": -38.49650955200195, "global_step": 138534, "epoch": 1144} {"train_loss": -39.5540885925293, "global_step": 138535, "epoch": 1144} {"train_loss": -39.18115234375, "global_step": 138536, "epoch": 1144} {"train_loss": -37.68220138549805, "global_step": 138537, "epoch": 1144} {"train_loss": -38.10786056518555, "global_step": 138538, "epoch": 1144} {"train_loss": -38.34485626220703, "global_step": 138539, "epoch": 1144} {"train_loss": -38.078277587890625, "global_step": 138540, "epoch": 1144} {"train_loss": -39.26937484741211, "global_step": 138541, "epoch": 1144} {"train_loss": -39.533424377441406, "global_step": 138542, "epoch": 1144} {"train_loss": -39.096988677978516, "global_step": 138543, "epoch": 1144} {"train_loss": -39.323470691018855, "global_step": 138544, "epoch": 1144, "val_loss": 2702097.75} {"train_loss": -38.935523986816406, "global_step": 138545, "epoch": 1145} {"train_loss": -39.481422424316406, "global_step": 138546, "epoch": 1145} {"train_loss": -40.0166130065918, "global_step": 138547, "epoch": 1145} {"train_loss": -38.09523391723633, "global_step": 138548, "epoch": 1145} {"train_loss": -39.094661712646484, "global_step": 138549, "epoch": 1145} {"train_loss": -36.87099075317383, "global_step": 138550, "epoch": 1145} {"train_loss": -39.823299407958984, "global_step": 138551, "epoch": 1145} {"train_loss": -38.395545959472656, "global_step": 138552, "epoch": 1145} {"train_loss": -38.79996871948242, "global_step": 138553, "epoch": 1145} {"train_loss": -39.897613525390625, "global_step": 138554, "epoch": 1145} {"train_loss": -38.11893844604492, "global_step": 138555, "epoch": 1145} {"train_loss": -39.26870346069336, "global_step": 138556, "epoch": 1145} {"train_loss": -39.44289779663086, "global_step": 138557, "epoch": 1145} {"train_loss": -39.360530853271484, "global_step": 138558, "epoch": 1145} {"train_loss": -38.46672439575195, "global_step": 138559, "epoch": 1145} {"train_loss": -39.39899826049805, "global_step": 138560, "epoch": 1145} {"train_loss": -39.018428802490234, "global_step": 138561, "epoch": 1145} {"train_loss": -39.32380676269531, "global_step": 138562, "epoch": 1145} {"train_loss": -39.35283660888672, "global_step": 138563, "epoch": 1145} {"train_loss": -38.144691467285156, "global_step": 138564, "epoch": 1145} {"train_loss": -39.05426788330078, "global_step": 138565, "epoch": 1145} {"train_loss": -38.494564056396484, "global_step": 138566, "epoch": 1145} {"train_loss": -40.17714309692383, "global_step": 138567, "epoch": 1145} {"train_loss": -38.005126953125, "global_step": 138568, "epoch": 1145} {"train_loss": -39.664913177490234, "global_step": 138569, "epoch": 1145} {"train_loss": -38.724586486816406, "global_step": 138570, "epoch": 1145} {"train_loss": -39.470611572265625, "global_step": 138571, "epoch": 1145} {"train_loss": -39.953460693359375, "global_step": 138572, "epoch": 1145} {"train_loss": -39.402374267578125, "global_step": 138573, "epoch": 1145} {"train_loss": -40.12064743041992, "global_step": 138574, "epoch": 1145} {"train_loss": -39.89010238647461, "global_step": 138575, "epoch": 1145} {"train_loss": -39.254207611083984, "global_step": 138576, "epoch": 1145} {"train_loss": -39.69049835205078, "global_step": 138577, "epoch": 1145} {"train_loss": -39.335079193115234, "global_step": 138578, "epoch": 1145} {"train_loss": -39.589229583740234, "global_step": 138579, "epoch": 1145} {"train_loss": -40.12995147705078, "global_step": 138580, "epoch": 1145} {"train_loss": -40.54684066772461, "global_step": 138581, "epoch": 1145} {"train_loss": -39.5860710144043, "global_step": 138582, "epoch": 1145} {"train_loss": -40.27116775512695, "global_step": 138583, "epoch": 1145} {"train_loss": -40.21816635131836, "global_step": 138584, "epoch": 1145} {"train_loss": -40.57307052612305, "global_step": 138585, "epoch": 1145} {"train_loss": -39.7355842590332, "global_step": 138586, "epoch": 1145} {"train_loss": -39.89064025878906, "global_step": 138587, "epoch": 1145} {"train_loss": -40.09603500366211, "global_step": 138588, "epoch": 1145} {"train_loss": -39.766334533691406, "global_step": 138589, "epoch": 1145} {"train_loss": -39.8385124206543, "global_step": 138590, "epoch": 1145} {"train_loss": -39.88296890258789, "global_step": 138591, "epoch": 1145} {"train_loss": -40.4801139831543, "global_step": 138592, "epoch": 1145} {"train_loss": -40.5968132019043, "global_step": 138593, "epoch": 1145} {"train_loss": -40.33305740356445, "global_step": 138594, "epoch": 1145} {"train_loss": -40.352169036865234, "global_step": 138595, "epoch": 1145} {"train_loss": -40.318119049072266, "global_step": 138596, "epoch": 1145} {"train_loss": -40.68349075317383, "global_step": 138597, "epoch": 1145} {"train_loss": -39.893733978271484, "global_step": 138598, "epoch": 1145} {"train_loss": -38.55565643310547, "global_step": 138599, "epoch": 1145} {"train_loss": -37.20301055908203, "global_step": 138600, "epoch": 1145} {"train_loss": -38.91266632080078, "global_step": 138601, "epoch": 1145} {"train_loss": -39.96519088745117, "global_step": 138602, "epoch": 1145} {"train_loss": -38.159393310546875, "global_step": 138603, "epoch": 1145} {"train_loss": -39.26768112182617, "global_step": 138604, "epoch": 1145} {"train_loss": -39.256168365478516, "global_step": 138605, "epoch": 1145} {"train_loss": -35.28186798095703, "global_step": 138606, "epoch": 1145} {"train_loss": -39.16730880737305, "global_step": 138607, "epoch": 1145} {"train_loss": -34.040138244628906, "global_step": 138608, "epoch": 1145} {"train_loss": -32.38990783691406, "global_step": 138609, "epoch": 1145} {"train_loss": -26.57700538635254, "global_step": 138610, "epoch": 1145} {"train_loss": -0.39617758989334106, "global_step": 138611, "epoch": 1145} {"train_loss": -24.34166717529297, "global_step": 138612, "epoch": 1145} {"train_loss": -21.062143325805664, "global_step": 138613, "epoch": 1145} {"train_loss": -30.129846572875977, "global_step": 138614, "epoch": 1145} {"train_loss": -20.24159812927246, "global_step": 138615, "epoch": 1145} {"train_loss": -32.10232162475586, "global_step": 138616, "epoch": 1145} {"train_loss": -27.545917510986328, "global_step": 138617, "epoch": 1145} {"train_loss": -26.581592559814453, "global_step": 138618, "epoch": 1145} {"train_loss": -32.154964447021484, "global_step": 138619, "epoch": 1145} {"train_loss": -29.029027938842773, "global_step": 138620, "epoch": 1145} {"train_loss": -30.89723014831543, "global_step": 138621, "epoch": 1145} {"train_loss": -34.091880798339844, "global_step": 138622, "epoch": 1145} {"train_loss": -33.115760803222656, "global_step": 138623, "epoch": 1145} {"train_loss": -32.220062255859375, "global_step": 138624, "epoch": 1145} {"train_loss": -32.89105224609375, "global_step": 138625, "epoch": 1145} {"train_loss": -34.62575912475586, "global_step": 138626, "epoch": 1145} {"train_loss": -33.91926193237305, "global_step": 138627, "epoch": 1145} {"train_loss": -34.36945343017578, "global_step": 138628, "epoch": 1145} {"train_loss": -35.33487319946289, "global_step": 138629, "epoch": 1145} {"train_loss": -35.53353500366211, "global_step": 138630, "epoch": 1145} {"train_loss": -35.565338134765625, "global_step": 138631, "epoch": 1145} {"train_loss": -35.33509826660156, "global_step": 138632, "epoch": 1145} {"train_loss": -35.96364974975586, "global_step": 138633, "epoch": 1145} {"train_loss": -35.58655548095703, "global_step": 138634, "epoch": 1145} {"train_loss": -36.09698486328125, "global_step": 138635, "epoch": 1145} {"train_loss": -36.64315414428711, "global_step": 138636, "epoch": 1145} {"train_loss": -36.01759719848633, "global_step": 138637, "epoch": 1145} {"train_loss": -35.79243850708008, "global_step": 138638, "epoch": 1145} {"train_loss": -36.63535690307617, "global_step": 138639, "epoch": 1145} {"train_loss": -37.35232925415039, "global_step": 138640, "epoch": 1145} {"train_loss": -36.6801643371582, "global_step": 138641, "epoch": 1145} {"train_loss": -36.780391693115234, "global_step": 138642, "epoch": 1145} {"train_loss": -37.236690521240234, "global_step": 138643, "epoch": 1145} {"train_loss": -38.01118087768555, "global_step": 138644, "epoch": 1145} {"train_loss": -37.45248031616211, "global_step": 138645, "epoch": 1145} {"train_loss": -37.80400466918945, "global_step": 138646, "epoch": 1145} {"train_loss": -37.96980667114258, "global_step": 138647, "epoch": 1145} {"train_loss": -38.040855407714844, "global_step": 138648, "epoch": 1145} {"train_loss": -38.20486831665039, "global_step": 138649, "epoch": 1145} {"train_loss": -38.23102951049805, "global_step": 138650, "epoch": 1145} {"train_loss": -38.31404495239258, "global_step": 138651, "epoch": 1145} {"train_loss": -38.68330001831055, "global_step": 138652, "epoch": 1145} {"train_loss": -39.00606918334961, "global_step": 138653, "epoch": 1145} {"train_loss": -38.73686981201172, "global_step": 138654, "epoch": 1145} {"train_loss": -39.42971420288086, "global_step": 138655, "epoch": 1145} {"train_loss": -39.287235260009766, "global_step": 138656, "epoch": 1145} {"train_loss": -39.043800354003906, "global_step": 138657, "epoch": 1145} {"train_loss": -38.93085479736328, "global_step": 138658, "epoch": 1145} {"train_loss": -39.527099609375, "global_step": 138659, "epoch": 1145} {"train_loss": -39.554203033447266, "global_step": 138660, "epoch": 1145} {"train_loss": -39.5998420715332, "global_step": 138661, "epoch": 1145} {"train_loss": -39.58545684814453, "global_step": 138662, "epoch": 1145} {"train_loss": -39.938167572021484, "global_step": 138663, "epoch": 1145} {"train_loss": -40.089046478271484, "global_step": 138664, "epoch": 1145} {"train_loss": -37.025234745061105, "global_step": 138665, "epoch": 1145, "val_loss": 2707234.0} {"train_loss": -39.694644927978516, "global_step": 138666, "epoch": 1146} {"train_loss": -40.61112594604492, "global_step": 138667, "epoch": 1146} {"train_loss": -40.5697135925293, "global_step": 138668, "epoch": 1146} {"train_loss": -40.32326126098633, "global_step": 138669, "epoch": 1146} {"train_loss": -40.20937728881836, "global_step": 138670, "epoch": 1146} {"train_loss": -40.61371612548828, "global_step": 138671, "epoch": 1146} {"train_loss": -40.30257797241211, "global_step": 138672, "epoch": 1146} {"train_loss": -40.68830490112305, "global_step": 138673, "epoch": 1146} {"train_loss": -40.40830993652344, "global_step": 138674, "epoch": 1146} {"train_loss": -40.508338928222656, "global_step": 138675, "epoch": 1146} {"train_loss": -40.878902435302734, "global_step": 138676, "epoch": 1146} {"train_loss": -40.45295333862305, "global_step": 138677, "epoch": 1146} {"train_loss": -40.56694030761719, "global_step": 138678, "epoch": 1146} {"train_loss": -40.88327407836914, "global_step": 138679, "epoch": 1146} {"train_loss": -40.11793899536133, "global_step": 138680, "epoch": 1146} {"train_loss": -40.76459884643555, "global_step": 138681, "epoch": 1146} {"train_loss": -40.48049545288086, "global_step": 138682, "epoch": 1146} {"train_loss": -41.00381088256836, "global_step": 138683, "epoch": 1146} {"train_loss": -41.3250846862793, "global_step": 138684, "epoch": 1146} {"train_loss": -40.37181091308594, "global_step": 138685, "epoch": 1146} {"train_loss": -40.5245246887207, "global_step": 138686, "epoch": 1146} {"train_loss": -40.96421813964844, "global_step": 138687, "epoch": 1146} {"train_loss": -40.33501052856445, "global_step": 138688, "epoch": 1146} {"train_loss": -40.817298889160156, "global_step": 138689, "epoch": 1146} {"train_loss": -40.876991271972656, "global_step": 138690, "epoch": 1146} {"train_loss": -39.887725830078125, "global_step": 138691, "epoch": 1146} {"train_loss": -40.847511291503906, "global_step": 138692, "epoch": 1146} {"train_loss": -40.889686584472656, "global_step": 138693, "epoch": 1146} {"train_loss": -40.50956726074219, "global_step": 138694, "epoch": 1146} {"train_loss": -41.0798454284668, "global_step": 138695, "epoch": 1146} {"train_loss": -40.79056930541992, "global_step": 138696, "epoch": 1146} {"train_loss": -40.97188949584961, "global_step": 138697, "epoch": 1146} {"train_loss": -41.039306640625, "global_step": 138698, "epoch": 1146} {"train_loss": -41.12066650390625, "global_step": 138699, "epoch": 1146} {"train_loss": -39.08907699584961, "global_step": 138700, "epoch": 1146} {"train_loss": -39.444908142089844, "global_step": 138701, "epoch": 1146} {"train_loss": -40.43971633911133, "global_step": 138702, "epoch": 1146} {"train_loss": -39.86150360107422, "global_step": 138703, "epoch": 1146} {"train_loss": -38.94626998901367, "global_step": 138704, "epoch": 1146} {"train_loss": -38.322052001953125, "global_step": 138705, "epoch": 1146} {"train_loss": -39.70591735839844, "global_step": 138706, "epoch": 1146} {"train_loss": -39.18572998046875, "global_step": 138707, "epoch": 1146} {"train_loss": -39.218788146972656, "global_step": 138708, "epoch": 1146} {"train_loss": -38.74699783325195, "global_step": 138709, "epoch": 1146} {"train_loss": -37.911781311035156, "global_step": 138710, "epoch": 1146} {"train_loss": -38.22257995605469, "global_step": 138711, "epoch": 1146} {"train_loss": -38.79496765136719, "global_step": 138712, "epoch": 1146} {"train_loss": -35.36426544189453, "global_step": 138713, "epoch": 1146} {"train_loss": -35.0388069152832, "global_step": 138714, "epoch": 1146} {"train_loss": -39.30112838745117, "global_step": 138715, "epoch": 1146} {"train_loss": -37.06494903564453, "global_step": 138716, "epoch": 1146} {"train_loss": -37.5665397644043, "global_step": 138717, "epoch": 1146} {"train_loss": -38.22480010986328, "global_step": 138718, "epoch": 1146} {"train_loss": -38.28874588012695, "global_step": 138719, "epoch": 1146} {"train_loss": -37.858863830566406, "global_step": 138720, "epoch": 1146} {"train_loss": -37.03591537475586, "global_step": 138721, "epoch": 1146} {"train_loss": -38.965370178222656, "global_step": 138722, "epoch": 1146} {"train_loss": -38.338294982910156, "global_step": 138723, "epoch": 1146} {"train_loss": -39.15887451171875, "global_step": 138724, "epoch": 1146} {"train_loss": -38.68095397949219, "global_step": 138725, "epoch": 1146} {"train_loss": -39.947906494140625, "global_step": 138726, "epoch": 1146} {"train_loss": -39.02421569824219, "global_step": 138727, "epoch": 1146} {"train_loss": -39.247344970703125, "global_step": 138728, "epoch": 1146} {"train_loss": -39.4529914855957, "global_step": 138729, "epoch": 1146} {"train_loss": -38.704769134521484, "global_step": 138730, "epoch": 1146} {"train_loss": -39.77280044555664, "global_step": 138731, "epoch": 1146} {"train_loss": -38.6451530456543, "global_step": 138732, "epoch": 1146} {"train_loss": -39.840553283691406, "global_step": 138733, "epoch": 1146} {"train_loss": -38.86809158325195, "global_step": 138734, "epoch": 1146} {"train_loss": -40.04804229736328, "global_step": 138735, "epoch": 1146} {"train_loss": -39.193504333496094, "global_step": 138736, "epoch": 1146} {"train_loss": -39.98371124267578, "global_step": 138737, "epoch": 1146} {"train_loss": -40.10811233520508, "global_step": 138738, "epoch": 1146} {"train_loss": -39.42750930786133, "global_step": 138739, "epoch": 1146} {"train_loss": -40.34344482421875, "global_step": 138740, "epoch": 1146} {"train_loss": -40.0638427734375, "global_step": 138741, "epoch": 1146} {"train_loss": -39.68779373168945, "global_step": 138742, "epoch": 1146} {"train_loss": -39.94770431518555, "global_step": 138743, "epoch": 1146} {"train_loss": -40.56406784057617, "global_step": 138744, "epoch": 1146} {"train_loss": -40.27222442626953, "global_step": 138745, "epoch": 1146} {"train_loss": -39.98604202270508, "global_step": 138746, "epoch": 1146} {"train_loss": -39.254791259765625, "global_step": 138747, "epoch": 1146} {"train_loss": -39.5757942199707, "global_step": 138748, "epoch": 1146} {"train_loss": -39.74677658081055, "global_step": 138749, "epoch": 1146} {"train_loss": -40.34906768798828, "global_step": 138750, "epoch": 1146} {"train_loss": -40.53616714477539, "global_step": 138751, "epoch": 1146} {"train_loss": -39.931800842285156, "global_step": 138752, "epoch": 1146} {"train_loss": -39.500274658203125, "global_step": 138753, "epoch": 1146} {"train_loss": -38.01877975463867, "global_step": 138754, "epoch": 1146} {"train_loss": -40.017974853515625, "global_step": 138755, "epoch": 1146} {"train_loss": -37.39429473876953, "global_step": 138756, "epoch": 1146} {"train_loss": -39.75806427001953, "global_step": 138757, "epoch": 1146} {"train_loss": -39.63176345825195, "global_step": 138758, "epoch": 1146} {"train_loss": -38.20939636230469, "global_step": 138759, "epoch": 1146} {"train_loss": -40.31123733520508, "global_step": 138760, "epoch": 1146} {"train_loss": -39.920677185058594, "global_step": 138761, "epoch": 1146} {"train_loss": -39.41357421875, "global_step": 138762, "epoch": 1146} {"train_loss": -39.97880172729492, "global_step": 138763, "epoch": 1146} {"train_loss": -39.583168029785156, "global_step": 138764, "epoch": 1146} {"train_loss": -39.3101806640625, "global_step": 138765, "epoch": 1146} {"train_loss": -39.19091796875, "global_step": 138766, "epoch": 1146} {"train_loss": -39.58156967163086, "global_step": 138767, "epoch": 1146} {"train_loss": -39.61098098754883, "global_step": 138768, "epoch": 1146} {"train_loss": -39.07021713256836, "global_step": 138769, "epoch": 1146} {"train_loss": -40.05944061279297, "global_step": 138770, "epoch": 1146} {"train_loss": -39.21702194213867, "global_step": 138771, "epoch": 1146} {"train_loss": -40.40890884399414, "global_step": 138772, "epoch": 1146} {"train_loss": -38.60801315307617, "global_step": 138773, "epoch": 1146} {"train_loss": -38.59245681762695, "global_step": 138774, "epoch": 1146} {"train_loss": -39.85028839111328, "global_step": 138775, "epoch": 1146} {"train_loss": -39.14834213256836, "global_step": 138776, "epoch": 1146} {"train_loss": -39.9830207824707, "global_step": 138777, "epoch": 1146} {"train_loss": -39.885772705078125, "global_step": 138778, "epoch": 1146} {"train_loss": -40.34417724609375, "global_step": 138779, "epoch": 1146} {"train_loss": -40.17385482788086, "global_step": 138780, "epoch": 1146} {"train_loss": -40.155113220214844, "global_step": 138781, "epoch": 1146} {"train_loss": -39.76995849609375, "global_step": 138782, "epoch": 1146} {"train_loss": -40.7462272644043, "global_step": 138783, "epoch": 1146} {"train_loss": -39.3485107421875, "global_step": 138784, "epoch": 1146} {"train_loss": -40.41591262817383, "global_step": 138785, "epoch": 1146} {"train_loss": -39.65800703064469, "global_step": 138786, "epoch": 1146, "val_loss": 2686682.5} {"train_loss": -40.638816833496094, "global_step": 138787, "epoch": 1147} {"train_loss": -40.990196228027344, "global_step": 138788, "epoch": 1147} {"train_loss": -40.42708969116211, "global_step": 138789, "epoch": 1147} {"train_loss": -40.700782775878906, "global_step": 138790, "epoch": 1147} {"train_loss": -40.50612258911133, "global_step": 138791, "epoch": 1147} {"train_loss": -40.669490814208984, "global_step": 138792, "epoch": 1147} {"train_loss": -40.71364974975586, "global_step": 138793, "epoch": 1147} {"train_loss": -40.2225341796875, "global_step": 138794, "epoch": 1147} {"train_loss": -40.007083892822266, "global_step": 138795, "epoch": 1147} {"train_loss": -40.51300811767578, "global_step": 138796, "epoch": 1147} {"train_loss": -40.4724235534668, "global_step": 138797, "epoch": 1147} {"train_loss": -40.585426330566406, "global_step": 138798, "epoch": 1147} {"train_loss": -40.583492279052734, "global_step": 138799, "epoch": 1147} {"train_loss": -40.99774169921875, "global_step": 138800, "epoch": 1147} {"train_loss": -40.73994064331055, "global_step": 138801, "epoch": 1147} {"train_loss": -39.1473503112793, "global_step": 138802, "epoch": 1147} {"train_loss": -40.39466857910156, "global_step": 138803, "epoch": 1147} {"train_loss": -40.69346618652344, "global_step": 138804, "epoch": 1147} {"train_loss": -40.52183151245117, "global_step": 138805, "epoch": 1147} {"train_loss": -39.710514068603516, "global_step": 138806, "epoch": 1147} {"train_loss": -39.92169189453125, "global_step": 138807, "epoch": 1147} {"train_loss": -40.667789459228516, "global_step": 138808, "epoch": 1147} {"train_loss": -41.088050842285156, "global_step": 138809, "epoch": 1147} {"train_loss": -40.89263916015625, "global_step": 138810, "epoch": 1147} {"train_loss": -41.077667236328125, "global_step": 138811, "epoch": 1147} {"train_loss": -41.01630401611328, "global_step": 138812, "epoch": 1147} {"train_loss": -41.440643310546875, "global_step": 138813, "epoch": 1147} {"train_loss": -40.14655685424805, "global_step": 138814, "epoch": 1147} {"train_loss": -40.69601058959961, "global_step": 138815, "epoch": 1147} {"train_loss": -41.0943717956543, "global_step": 138816, "epoch": 1147} {"train_loss": -41.33445358276367, "global_step": 138817, "epoch": 1147} {"train_loss": -40.252071380615234, "global_step": 138818, "epoch": 1147} {"train_loss": -38.989105224609375, "global_step": 138819, "epoch": 1147} {"train_loss": -40.74693298339844, "global_step": 138820, "epoch": 1147} {"train_loss": -41.000732421875, "global_step": 138821, "epoch": 1147} {"train_loss": -41.30159378051758, "global_step": 138822, "epoch": 1147} {"train_loss": -41.15557861328125, "global_step": 138823, "epoch": 1147} {"train_loss": -40.70535659790039, "global_step": 138824, "epoch": 1147} {"train_loss": -41.18545913696289, "global_step": 138825, "epoch": 1147} {"train_loss": -40.24245834350586, "global_step": 138826, "epoch": 1147} {"train_loss": -40.794891357421875, "global_step": 138827, "epoch": 1147} {"train_loss": -39.59809494018555, "global_step": 138828, "epoch": 1147} {"train_loss": -40.05298614501953, "global_step": 138829, "epoch": 1147} {"train_loss": -40.378028869628906, "global_step": 138830, "epoch": 1147} {"train_loss": -40.61066818237305, "global_step": 138831, "epoch": 1147} {"train_loss": -40.279788970947266, "global_step": 138832, "epoch": 1147} {"train_loss": -39.994728088378906, "global_step": 138833, "epoch": 1147} {"train_loss": -40.064151763916016, "global_step": 138834, "epoch": 1147} {"train_loss": -40.67841339111328, "global_step": 138835, "epoch": 1147} {"train_loss": -40.15598678588867, "global_step": 138836, "epoch": 1147} {"train_loss": -39.441184997558594, "global_step": 138837, "epoch": 1147} {"train_loss": -41.157806396484375, "global_step": 138838, "epoch": 1147} {"train_loss": -39.8934211730957, "global_step": 138839, "epoch": 1147} {"train_loss": -39.57285690307617, "global_step": 138840, "epoch": 1147} {"train_loss": -38.09508514404297, "global_step": 138841, "epoch": 1147} {"train_loss": -38.6503791809082, "global_step": 138842, "epoch": 1147} {"train_loss": -38.1464958190918, "global_step": 138843, "epoch": 1147} {"train_loss": -39.57818603515625, "global_step": 138844, "epoch": 1147} {"train_loss": -36.25883102416992, "global_step": 138845, "epoch": 1147} {"train_loss": -38.50678253173828, "global_step": 138846, "epoch": 1147} {"train_loss": -38.99599838256836, "global_step": 138847, "epoch": 1147} {"train_loss": -37.35540771484375, "global_step": 138848, "epoch": 1147} {"train_loss": -40.986045837402344, "global_step": 138849, "epoch": 1147} {"train_loss": -36.721858978271484, "global_step": 138850, "epoch": 1147} {"train_loss": -39.246456146240234, "global_step": 138851, "epoch": 1147} {"train_loss": -34.11985397338867, "global_step": 138852, "epoch": 1147} {"train_loss": -35.6861686706543, "global_step": 138853, "epoch": 1147} {"train_loss": -31.4092960357666, "global_step": 138854, "epoch": 1147} {"train_loss": -14.916354179382324, "global_step": 138855, "epoch": 1147} {"train_loss": -19.267818450927734, "global_step": 138856, "epoch": 1147} {"train_loss": -25.521320343017578, "global_step": 138857, "epoch": 1147} {"train_loss": -25.64346694946289, "global_step": 138858, "epoch": 1147} {"train_loss": -27.090625762939453, "global_step": 138859, "epoch": 1147} {"train_loss": -32.58557891845703, "global_step": 138860, "epoch": 1147} {"train_loss": -30.04566764831543, "global_step": 138861, "epoch": 1147} {"train_loss": -30.220258712768555, "global_step": 138862, "epoch": 1147} {"train_loss": -31.04291343688965, "global_step": 138863, "epoch": 1147} {"train_loss": -32.702999114990234, "global_step": 138864, "epoch": 1147} {"train_loss": -32.367069244384766, "global_step": 138865, "epoch": 1147} {"train_loss": -36.20439147949219, "global_step": 138866, "epoch": 1147} {"train_loss": -33.2799072265625, "global_step": 138867, "epoch": 1147} {"train_loss": -33.9268684387207, "global_step": 138868, "epoch": 1147} {"train_loss": -33.17435836791992, "global_step": 138869, "epoch": 1147} {"train_loss": -36.39872741699219, "global_step": 138870, "epoch": 1147} {"train_loss": -36.90998458862305, "global_step": 138871, "epoch": 1147} {"train_loss": -36.95400619506836, "global_step": 138872, "epoch": 1147} {"train_loss": -36.00972366333008, "global_step": 138873, "epoch": 1147} {"train_loss": -36.03447341918945, "global_step": 138874, "epoch": 1147} {"train_loss": -36.86695098876953, "global_step": 138875, "epoch": 1147} {"train_loss": -37.1373176574707, "global_step": 138876, "epoch": 1147} {"train_loss": -36.73997116088867, "global_step": 138877, "epoch": 1147} {"train_loss": -36.440460205078125, "global_step": 138878, "epoch": 1147} {"train_loss": -37.824745178222656, "global_step": 138879, "epoch": 1147} {"train_loss": -37.2191276550293, "global_step": 138880, "epoch": 1147} {"train_loss": -37.40431213378906, "global_step": 138881, "epoch": 1147} {"train_loss": -38.54057693481445, "global_step": 138882, "epoch": 1147} {"train_loss": -37.58656311035156, "global_step": 138883, "epoch": 1147} {"train_loss": -37.49336624145508, "global_step": 138884, "epoch": 1147} {"train_loss": -38.00703048706055, "global_step": 138885, "epoch": 1147} {"train_loss": -38.3573112487793, "global_step": 138886, "epoch": 1147} {"train_loss": -38.28293991088867, "global_step": 138887, "epoch": 1147} {"train_loss": -38.2952766418457, "global_step": 138888, "epoch": 1147} {"train_loss": -37.59859848022461, "global_step": 138889, "epoch": 1147} {"train_loss": -38.45764923095703, "global_step": 138890, "epoch": 1147} {"train_loss": -38.69602584838867, "global_step": 138891, "epoch": 1147} {"train_loss": -38.59832000732422, "global_step": 138892, "epoch": 1147} {"train_loss": -39.11072540283203, "global_step": 138893, "epoch": 1147} {"train_loss": -38.472686767578125, "global_step": 138894, "epoch": 1147} {"train_loss": -38.92766571044922, "global_step": 138895, "epoch": 1147} {"train_loss": -38.951473236083984, "global_step": 138896, "epoch": 1147} {"train_loss": -39.336063385009766, "global_step": 138897, "epoch": 1147} {"train_loss": -39.18514633178711, "global_step": 138898, "epoch": 1147} {"train_loss": -38.40391159057617, "global_step": 138899, "epoch": 1147} {"train_loss": -39.48274612426758, "global_step": 138900, "epoch": 1147} {"train_loss": -39.60485076904297, "global_step": 138901, "epoch": 1147} {"train_loss": -39.65394973754883, "global_step": 138902, "epoch": 1147} {"train_loss": -39.340667724609375, "global_step": 138903, "epoch": 1147} {"train_loss": -39.49634552001953, "global_step": 138904, "epoch": 1147} {"train_loss": -39.84678268432617, "global_step": 138905, "epoch": 1147} {"train_loss": -39.60313034057617, "global_step": 138906, "epoch": 1147} {"train_loss": -38.014860728555476, "global_step": 138907, "epoch": 1147, "val_loss": 2498794.25} {"train_loss": -39.9088020324707, "global_step": 138908, "epoch": 1148} {"train_loss": -38.816688537597656, "global_step": 138909, "epoch": 1148} {"train_loss": -39.69738006591797, "global_step": 138910, "epoch": 1148} {"train_loss": -39.12405014038086, "global_step": 138911, "epoch": 1148} {"train_loss": -39.778564453125, "global_step": 138912, "epoch": 1148} {"train_loss": -39.46272277832031, "global_step": 138913, "epoch": 1148} {"train_loss": -40.11075973510742, "global_step": 138914, "epoch": 1148} {"train_loss": -39.61844253540039, "global_step": 138915, "epoch": 1148} {"train_loss": -38.67223358154297, "global_step": 138916, "epoch": 1148} {"train_loss": -39.718849182128906, "global_step": 138917, "epoch": 1148} {"train_loss": -40.1700553894043, "global_step": 138918, "epoch": 1148} {"train_loss": -39.745052337646484, "global_step": 138919, "epoch": 1148} {"train_loss": -40.413516998291016, "global_step": 138920, "epoch": 1148} {"train_loss": -40.21334457397461, "global_step": 138921, "epoch": 1148} {"train_loss": -40.31581497192383, "global_step": 138922, "epoch": 1148} {"train_loss": -39.976383209228516, "global_step": 138923, "epoch": 1148} {"train_loss": -40.17023468017578, "global_step": 138924, "epoch": 1148} {"train_loss": -40.01931381225586, "global_step": 138925, "epoch": 1148} {"train_loss": -40.24813461303711, "global_step": 138926, "epoch": 1148} {"train_loss": -40.80378341674805, "global_step": 138927, "epoch": 1148} {"train_loss": -40.06882858276367, "global_step": 138928, "epoch": 1148} {"train_loss": -40.53791046142578, "global_step": 138929, "epoch": 1148} {"train_loss": -40.355342864990234, "global_step": 138930, "epoch": 1148} {"train_loss": -40.591304779052734, "global_step": 138931, "epoch": 1148} {"train_loss": -40.60334396362305, "global_step": 138932, "epoch": 1148} {"train_loss": -40.83934020996094, "global_step": 138933, "epoch": 1148} {"train_loss": -40.74990463256836, "global_step": 138934, "epoch": 1148} {"train_loss": -40.578853607177734, "global_step": 138935, "epoch": 1148} {"train_loss": -40.45473861694336, "global_step": 138936, "epoch": 1148} {"train_loss": -41.11151885986328, "global_step": 138937, "epoch": 1148} {"train_loss": -40.6472282409668, "global_step": 138938, "epoch": 1148} {"train_loss": -40.31553649902344, "global_step": 138939, "epoch": 1148} {"train_loss": -40.94392013549805, "global_step": 138940, "epoch": 1148} {"train_loss": -40.687889099121094, "global_step": 138941, "epoch": 1148} {"train_loss": -40.99636459350586, "global_step": 138942, "epoch": 1148} {"train_loss": -40.292110443115234, "global_step": 138943, "epoch": 1148} {"train_loss": -40.60464096069336, "global_step": 138944, "epoch": 1148} {"train_loss": -41.039363861083984, "global_step": 138945, "epoch": 1148} {"train_loss": -40.9542121887207, "global_step": 138946, "epoch": 1148} {"train_loss": -40.83842849731445, "global_step": 138947, "epoch": 1148} {"train_loss": -40.85625076293945, "global_step": 138948, "epoch": 1148} {"train_loss": -40.989078521728516, "global_step": 138949, "epoch": 1148} {"train_loss": -40.87052536010742, "global_step": 138950, "epoch": 1148} {"train_loss": -40.63947296142578, "global_step": 138951, "epoch": 1148} {"train_loss": -41.022605895996094, "global_step": 138952, "epoch": 1148} {"train_loss": -40.96371841430664, "global_step": 138953, "epoch": 1148} {"train_loss": -40.719093322753906, "global_step": 138954, "epoch": 1148} {"train_loss": -40.85608673095703, "global_step": 138955, "epoch": 1148} {"train_loss": -40.00841522216797, "global_step": 138956, "epoch": 1148} {"train_loss": -37.63796615600586, "global_step": 138957, "epoch": 1148} {"train_loss": -30.4034423828125, "global_step": 138958, "epoch": 1148} {"train_loss": -2.2323174476623535, "global_step": 138959, "epoch": 1148} {"train_loss": 36.3133659362793, "global_step": 138960, "epoch": 1148} {"train_loss": -35.21863555908203, "global_step": 138961, "epoch": 1148} {"train_loss": 27.36054801940918, "global_step": 138962, "epoch": 1148} {"train_loss": 5.570216655731201, "global_step": 138963, "epoch": 1148} {"train_loss": -23.778329849243164, "global_step": 138964, "epoch": 1148} {"train_loss": -24.76783561706543, "global_step": 138965, "epoch": 1148} {"train_loss": -19.227813720703125, "global_step": 138966, "epoch": 1148} {"train_loss": -27.35329246520996, "global_step": 138967, "epoch": 1148} {"train_loss": -18.60418128967285, "global_step": 138968, "epoch": 1148} {"train_loss": -22.068618774414062, "global_step": 138969, "epoch": 1148} {"train_loss": -28.527252197265625, "global_step": 138970, "epoch": 1148} {"train_loss": -25.55781364440918, "global_step": 138971, "epoch": 1148} {"train_loss": -27.63984489440918, "global_step": 138972, "epoch": 1148} {"train_loss": -31.5246524810791, "global_step": 138973, "epoch": 1148} {"train_loss": -30.657384872436523, "global_step": 138974, "epoch": 1148} {"train_loss": -31.49704360961914, "global_step": 138975, "epoch": 1148} {"train_loss": -31.764368057250977, "global_step": 138976, "epoch": 1148} {"train_loss": -33.8974723815918, "global_step": 138977, "epoch": 1148} {"train_loss": -33.6333122253418, "global_step": 138978, "epoch": 1148} {"train_loss": -34.15087890625, "global_step": 138979, "epoch": 1148} {"train_loss": -34.05328369140625, "global_step": 138980, "epoch": 1148} {"train_loss": -34.819091796875, "global_step": 138981, "epoch": 1148} {"train_loss": -35.586387634277344, "global_step": 138982, "epoch": 1148} {"train_loss": -35.210079193115234, "global_step": 138983, "epoch": 1148} {"train_loss": -35.43290710449219, "global_step": 138984, "epoch": 1148} {"train_loss": -35.47776794433594, "global_step": 138985, "epoch": 1148} {"train_loss": -36.194801330566406, "global_step": 138986, "epoch": 1148} {"train_loss": -36.27527618408203, "global_step": 138987, "epoch": 1148} {"train_loss": -36.1678352355957, "global_step": 138988, "epoch": 1148} {"train_loss": -36.74515914916992, "global_step": 138989, "epoch": 1148} {"train_loss": -37.225181579589844, "global_step": 138990, "epoch": 1148} {"train_loss": -37.32686233520508, "global_step": 138991, "epoch": 1148} {"train_loss": -36.937469482421875, "global_step": 138992, "epoch": 1148} {"train_loss": -37.11891174316406, "global_step": 138993, "epoch": 1148} {"train_loss": -37.49182891845703, "global_step": 138994, "epoch": 1148} {"train_loss": -37.4163932800293, "global_step": 138995, "epoch": 1148} {"train_loss": -37.44681930541992, "global_step": 138996, "epoch": 1148} {"train_loss": -37.2970085144043, "global_step": 138997, "epoch": 1148} {"train_loss": -37.38251876831055, "global_step": 138998, "epoch": 1148} {"train_loss": -37.651119232177734, "global_step": 138999, "epoch": 1148} {"train_loss": -37.69953155517578, "global_step": 139000, "epoch": 1148} {"train_loss": -37.852962493896484, "global_step": 139001, "epoch": 1148} {"train_loss": -37.62778854370117, "global_step": 139002, "epoch": 1148} {"train_loss": -37.77243423461914, "global_step": 139003, "epoch": 1148} {"train_loss": -38.0307502746582, "global_step": 139004, "epoch": 1148} {"train_loss": -37.707183837890625, "global_step": 139005, "epoch": 1148} {"train_loss": -37.84772872924805, "global_step": 139006, "epoch": 1148} {"train_loss": -37.85720443725586, "global_step": 139007, "epoch": 1148} {"train_loss": -38.03525924682617, "global_step": 139008, "epoch": 1148} {"train_loss": -38.03742599487305, "global_step": 139009, "epoch": 1148} {"train_loss": -37.95463943481445, "global_step": 139010, "epoch": 1148} {"train_loss": -38.31785202026367, "global_step": 139011, "epoch": 1148} {"train_loss": -38.279170989990234, "global_step": 139012, "epoch": 1148} {"train_loss": -38.35618209838867, "global_step": 139013, "epoch": 1148} {"train_loss": -38.0796012878418, "global_step": 139014, "epoch": 1148} {"train_loss": -38.41509246826172, "global_step": 139015, "epoch": 1148} {"train_loss": -38.52900314331055, "global_step": 139016, "epoch": 1148} {"train_loss": -38.10114669799805, "global_step": 139017, "epoch": 1148} {"train_loss": -38.64885330200195, "global_step": 139018, "epoch": 1148} {"train_loss": -38.635719299316406, "global_step": 139019, "epoch": 1148} {"train_loss": -38.67257308959961, "global_step": 139020, "epoch": 1148} {"train_loss": -38.6087532043457, "global_step": 139021, "epoch": 1148} {"train_loss": -38.822017669677734, "global_step": 139022, "epoch": 1148} {"train_loss": -38.62788009643555, "global_step": 139023, "epoch": 1148} {"train_loss": -38.89049530029297, "global_step": 139024, "epoch": 1148} {"train_loss": -38.94703674316406, "global_step": 139025, "epoch": 1148} {"train_loss": -38.998897552490234, "global_step": 139026, "epoch": 1148} {"train_loss": -39.03129196166992, "global_step": 139027, "epoch": 1148} {"train_loss": -35.52513903625741, "global_step": 139028, "epoch": 1148, "val_loss": 2591041.75} {"train_loss": -39.18815231323242, "global_step": 139029, "epoch": 1149} {"train_loss": -39.22285842895508, "global_step": 139030, "epoch": 1149} {"train_loss": -39.40647888183594, "global_step": 139031, "epoch": 1149} {"train_loss": -39.11114501953125, "global_step": 139032, "epoch": 1149} {"train_loss": -39.298057556152344, "global_step": 139033, "epoch": 1149} {"train_loss": -39.409759521484375, "global_step": 139034, "epoch": 1149} {"train_loss": -39.40888214111328, "global_step": 139035, "epoch": 1149} {"train_loss": -39.30717086791992, "global_step": 139036, "epoch": 1149} {"train_loss": -39.146263122558594, "global_step": 139037, "epoch": 1149} {"train_loss": -39.22869873046875, "global_step": 139038, "epoch": 1149} {"train_loss": -39.645503997802734, "global_step": 139039, "epoch": 1149} {"train_loss": -39.349639892578125, "global_step": 139040, "epoch": 1149} {"train_loss": -39.65986633300781, "global_step": 139041, "epoch": 1149} {"train_loss": -39.516319274902344, "global_step": 139042, "epoch": 1149} {"train_loss": -39.760860443115234, "global_step": 139043, "epoch": 1149} {"train_loss": -39.917579650878906, "global_step": 139044, "epoch": 1149} {"train_loss": -39.557373046875, "global_step": 139045, "epoch": 1149} {"train_loss": -39.81998825073242, "global_step": 139046, "epoch": 1149} {"train_loss": -39.72417068481445, "global_step": 139047, "epoch": 1149} {"train_loss": -40.037208557128906, "global_step": 139048, "epoch": 1149} {"train_loss": -39.881832122802734, "global_step": 139049, "epoch": 1149} {"train_loss": -39.96516036987305, "global_step": 139050, "epoch": 1149} {"train_loss": -40.134368896484375, "global_step": 139051, "epoch": 1149} {"train_loss": -39.98236846923828, "global_step": 139052, "epoch": 1149} {"train_loss": -39.908321380615234, "global_step": 139053, "epoch": 1149} {"train_loss": -40.325496673583984, "global_step": 139054, "epoch": 1149} {"train_loss": -40.259212493896484, "global_step": 139055, "epoch": 1149} {"train_loss": -40.10604476928711, "global_step": 139056, "epoch": 1149} {"train_loss": -40.3731575012207, "global_step": 139057, "epoch": 1149} {"train_loss": -40.081199645996094, "global_step": 139058, "epoch": 1149} {"train_loss": -40.0726318359375, "global_step": 139059, "epoch": 1149} {"train_loss": -40.289939880371094, "global_step": 139060, "epoch": 1149} {"train_loss": -39.987220764160156, "global_step": 139061, "epoch": 1149} {"train_loss": -40.305030822753906, "global_step": 139062, "epoch": 1149} {"train_loss": -40.333984375, "global_step": 139063, "epoch": 1149} {"train_loss": -40.2225456237793, "global_step": 139064, "epoch": 1149} {"train_loss": -40.25740432739258, "global_step": 139065, "epoch": 1149} {"train_loss": -40.393856048583984, "global_step": 139066, "epoch": 1149} {"train_loss": -40.190284729003906, "global_step": 139067, "epoch": 1149} {"train_loss": -40.295074462890625, "global_step": 139068, "epoch": 1149} {"train_loss": -40.356048583984375, "global_step": 139069, "epoch": 1149} {"train_loss": -40.49345016479492, "global_step": 139070, "epoch": 1149} {"train_loss": -40.44482421875, "global_step": 139071, "epoch": 1149} {"train_loss": -40.448638916015625, "global_step": 139072, "epoch": 1149} {"train_loss": -40.84718704223633, "global_step": 139073, "epoch": 1149} {"train_loss": -40.77397537231445, "global_step": 139074, "epoch": 1149} {"train_loss": -40.75658416748047, "global_step": 139075, "epoch": 1149} {"train_loss": -40.747406005859375, "global_step": 139076, "epoch": 1149} {"train_loss": -40.6337890625, "global_step": 139077, "epoch": 1149} {"train_loss": -40.73126983642578, "global_step": 139078, "epoch": 1149} {"train_loss": -40.92034912109375, "global_step": 139079, "epoch": 1149} {"train_loss": -40.6626091003418, "global_step": 139080, "epoch": 1149} {"train_loss": -40.525550842285156, "global_step": 139081, "epoch": 1149} {"train_loss": -40.56173324584961, "global_step": 139082, "epoch": 1149} {"train_loss": -40.66209030151367, "global_step": 139083, "epoch": 1149} {"train_loss": -40.49380111694336, "global_step": 139084, "epoch": 1149} {"train_loss": -40.171966552734375, "global_step": 139085, "epoch": 1149} {"train_loss": -39.4503173828125, "global_step": 139086, "epoch": 1149} {"train_loss": -38.678462982177734, "global_step": 139087, "epoch": 1149} {"train_loss": -36.62617874145508, "global_step": 139088, "epoch": 1149} {"train_loss": -35.68593978881836, "global_step": 139089, "epoch": 1149} {"train_loss": -35.80546188354492, "global_step": 139090, "epoch": 1149} {"train_loss": -39.05064010620117, "global_step": 139091, "epoch": 1149} {"train_loss": -39.86744689941406, "global_step": 139092, "epoch": 1149} {"train_loss": -38.609596252441406, "global_step": 139093, "epoch": 1149} {"train_loss": -38.71029281616211, "global_step": 139094, "epoch": 1149} {"train_loss": -39.999935150146484, "global_step": 139095, "epoch": 1149} {"train_loss": -39.785945892333984, "global_step": 139096, "epoch": 1149} {"train_loss": -39.679561614990234, "global_step": 139097, "epoch": 1149} {"train_loss": -39.730464935302734, "global_step": 139098, "epoch": 1149} {"train_loss": -40.12483596801758, "global_step": 139099, "epoch": 1149} {"train_loss": -40.19590759277344, "global_step": 139100, "epoch": 1149} {"train_loss": -40.20058822631836, "global_step": 139101, "epoch": 1149} {"train_loss": -39.849002838134766, "global_step": 139102, "epoch": 1149} {"train_loss": -40.12517547607422, "global_step": 139103, "epoch": 1149} {"train_loss": -40.38129806518555, "global_step": 139104, "epoch": 1149} {"train_loss": -40.14875030517578, "global_step": 139105, "epoch": 1149} {"train_loss": -40.05586624145508, "global_step": 139106, "epoch": 1149} {"train_loss": -39.642555236816406, "global_step": 139107, "epoch": 1149} {"train_loss": -39.93498992919922, "global_step": 139108, "epoch": 1149} {"train_loss": -39.7535285949707, "global_step": 139109, "epoch": 1149} {"train_loss": -39.6472282409668, "global_step": 139110, "epoch": 1149} {"train_loss": -40.488433837890625, "global_step": 139111, "epoch": 1149} {"train_loss": -40.237884521484375, "global_step": 139112, "epoch": 1149} {"train_loss": -39.634544372558594, "global_step": 139113, "epoch": 1149} {"train_loss": -39.738094329833984, "global_step": 139114, "epoch": 1149} {"train_loss": -39.00624084472656, "global_step": 139115, "epoch": 1149} {"train_loss": -38.82769775390625, "global_step": 139116, "epoch": 1149} {"train_loss": -38.58878707885742, "global_step": 139117, "epoch": 1149} {"train_loss": -38.989070892333984, "global_step": 139118, "epoch": 1149} {"train_loss": -39.724700927734375, "global_step": 139119, "epoch": 1149} {"train_loss": -40.22661209106445, "global_step": 139120, "epoch": 1149} {"train_loss": -39.84741973876953, "global_step": 139121, "epoch": 1149} {"train_loss": -37.42409896850586, "global_step": 139122, "epoch": 1149} {"train_loss": -33.16575241088867, "global_step": 139123, "epoch": 1149} {"train_loss": -30.197107315063477, "global_step": 139124, "epoch": 1149} {"train_loss": -27.850305557250977, "global_step": 139125, "epoch": 1149} {"train_loss": -33.30500411987305, "global_step": 139126, "epoch": 1149} {"train_loss": -38.66880416870117, "global_step": 139127, "epoch": 1149} {"train_loss": -35.78022384643555, "global_step": 139128, "epoch": 1149} {"train_loss": -35.21950149536133, "global_step": 139129, "epoch": 1149} {"train_loss": -38.296112060546875, "global_step": 139130, "epoch": 1149} {"train_loss": -33.725013732910156, "global_step": 139131, "epoch": 1149} {"train_loss": -36.743865966796875, "global_step": 139132, "epoch": 1149} {"train_loss": -37.2951545715332, "global_step": 139133, "epoch": 1149} {"train_loss": -34.7509880065918, "global_step": 139134, "epoch": 1149} {"train_loss": -39.282413482666016, "global_step": 139135, "epoch": 1149} {"train_loss": -36.26394271850586, "global_step": 139136, "epoch": 1149} {"train_loss": -39.875484466552734, "global_step": 139137, "epoch": 1149} {"train_loss": -37.769775390625, "global_step": 139138, "epoch": 1149} {"train_loss": -39.575889587402344, "global_step": 139139, "epoch": 1149} {"train_loss": -38.22944259643555, "global_step": 139140, "epoch": 1149} {"train_loss": -39.34646224975586, "global_step": 139141, "epoch": 1149} {"train_loss": -38.773460388183594, "global_step": 139142, "epoch": 1149} {"train_loss": -38.58620834350586, "global_step": 139143, "epoch": 1149} {"train_loss": -39.56099319458008, "global_step": 139144, "epoch": 1149} {"train_loss": -39.1329345703125, "global_step": 139145, "epoch": 1149} {"train_loss": -39.476749420166016, "global_step": 139146, "epoch": 1149} {"train_loss": -38.86748123168945, "global_step": 139147, "epoch": 1149} {"train_loss": -38.90749740600586, "global_step": 139148, "epoch": 1149} {"train_loss": -39.140167141748854, "global_step": 139149, "epoch": 1149, "val_loss": 2593245.75} {"train_loss": -39.431427001953125, "global_step": 139150, "epoch": 1150} {"train_loss": -39.9498176574707, "global_step": 139151, "epoch": 1150} {"train_loss": -39.59564971923828, "global_step": 139152, "epoch": 1150} {"train_loss": -39.910369873046875, "global_step": 139153, "epoch": 1150} {"train_loss": -39.34489059448242, "global_step": 139154, "epoch": 1150} {"train_loss": -40.232120513916016, "global_step": 139155, "epoch": 1150} {"train_loss": -39.49808120727539, "global_step": 139156, "epoch": 1150} {"train_loss": -40.05390930175781, "global_step": 139157, "epoch": 1150} {"train_loss": -39.65990447998047, "global_step": 139158, "epoch": 1150} {"train_loss": -40.021087646484375, "global_step": 139159, "epoch": 1150} {"train_loss": -40.29119110107422, "global_step": 139160, "epoch": 1150} {"train_loss": -40.40701675415039, "global_step": 139161, "epoch": 1150} {"train_loss": -40.20659637451172, "global_step": 139162, "epoch": 1150} {"train_loss": -40.54484939575195, "global_step": 139163, "epoch": 1150} {"train_loss": -40.6060905456543, "global_step": 139164, "epoch": 1150} {"train_loss": -40.29198455810547, "global_step": 139165, "epoch": 1150} {"train_loss": -40.396358489990234, "global_step": 139166, "epoch": 1150} {"train_loss": -40.36507034301758, "global_step": 139167, "epoch": 1150} {"train_loss": -40.569252014160156, "global_step": 139168, "epoch": 1150} {"train_loss": -40.61477279663086, "global_step": 139169, "epoch": 1150} {"train_loss": -40.23865509033203, "global_step": 139170, "epoch": 1150} {"train_loss": -40.58677291870117, "global_step": 139171, "epoch": 1150} {"train_loss": -40.4986686706543, "global_step": 139172, "epoch": 1150} {"train_loss": -40.57617950439453, "global_step": 139173, "epoch": 1150} {"train_loss": -40.60902786254883, "global_step": 139174, "epoch": 1150} {"train_loss": -40.438968658447266, "global_step": 139175, "epoch": 1150} {"train_loss": -40.77813720703125, "global_step": 139176, "epoch": 1150} {"train_loss": -40.652015686035156, "global_step": 139177, "epoch": 1150} {"train_loss": -40.469024658203125, "global_step": 139178, "epoch": 1150} {"train_loss": -40.863677978515625, "global_step": 139179, "epoch": 1150} {"train_loss": -40.872737884521484, "global_step": 139180, "epoch": 1150} {"train_loss": -40.781837463378906, "global_step": 139181, "epoch": 1150} {"train_loss": -40.35800552368164, "global_step": 139182, "epoch": 1150} {"train_loss": -40.993038177490234, "global_step": 139183, "epoch": 1150} {"train_loss": -41.099857330322266, "global_step": 139184, "epoch": 1150} {"train_loss": -41.030879974365234, "global_step": 139185, "epoch": 1150} {"train_loss": -41.02618408203125, "global_step": 139186, "epoch": 1150} {"train_loss": -41.1909065246582, "global_step": 139187, "epoch": 1150} {"train_loss": -40.95425033569336, "global_step": 139188, "epoch": 1150} {"train_loss": -41.14482116699219, "global_step": 139189, "epoch": 1150} {"train_loss": -41.03607177734375, "global_step": 139190, "epoch": 1150} {"train_loss": -40.90738296508789, "global_step": 139191, "epoch": 1150} {"train_loss": -41.37260055541992, "global_step": 139192, "epoch": 1150} {"train_loss": -41.17694091796875, "global_step": 139193, "epoch": 1150} {"train_loss": -41.02790069580078, "global_step": 139194, "epoch": 1150} {"train_loss": -40.85687255859375, "global_step": 139195, "epoch": 1150} {"train_loss": -40.74654006958008, "global_step": 139196, "epoch": 1150} {"train_loss": -40.93192672729492, "global_step": 139197, "epoch": 1150} {"train_loss": -41.10952377319336, "global_step": 139198, "epoch": 1150} {"train_loss": -41.240150451660156, "global_step": 139199, "epoch": 1150} {"train_loss": -40.98681640625, "global_step": 139200, "epoch": 1150} {"train_loss": -40.9110107421875, "global_step": 139201, "epoch": 1150} {"train_loss": -40.01233673095703, "global_step": 139202, "epoch": 1150} {"train_loss": -39.365901947021484, "global_step": 139203, "epoch": 1150} {"train_loss": -40.42852783203125, "global_step": 139204, "epoch": 1150} {"train_loss": -40.900203704833984, "global_step": 139205, "epoch": 1150} {"train_loss": -40.34735107421875, "global_step": 139206, "epoch": 1150} {"train_loss": -41.0904655456543, "global_step": 139207, "epoch": 1150} {"train_loss": -39.27604293823242, "global_step": 139208, "epoch": 1150} {"train_loss": -40.37429428100586, "global_step": 139209, "epoch": 1150} {"train_loss": -40.70603561401367, "global_step": 139210, "epoch": 1150} {"train_loss": -38.63462448120117, "global_step": 139211, "epoch": 1150} {"train_loss": -41.02320098876953, "global_step": 139212, "epoch": 1150} {"train_loss": -39.57790756225586, "global_step": 139213, "epoch": 1150} {"train_loss": -40.007808685302734, "global_step": 139214, "epoch": 1150} {"train_loss": -40.2782096862793, "global_step": 139215, "epoch": 1150} {"train_loss": -40.06364822387695, "global_step": 139216, "epoch": 1150} {"train_loss": -39.97541046142578, "global_step": 139217, "epoch": 1150} {"train_loss": -39.78178787231445, "global_step": 139218, "epoch": 1150} {"train_loss": -38.75907516479492, "global_step": 139219, "epoch": 1150} {"train_loss": -37.6993408203125, "global_step": 139220, "epoch": 1150} {"train_loss": -37.82566452026367, "global_step": 139221, "epoch": 1150} {"train_loss": -38.94784164428711, "global_step": 139222, "epoch": 1150} {"train_loss": -40.254512786865234, "global_step": 139223, "epoch": 1150} {"train_loss": -38.60551071166992, "global_step": 139224, "epoch": 1150} {"train_loss": -39.11168670654297, "global_step": 139225, "epoch": 1150} {"train_loss": -40.22404098510742, "global_step": 139226, "epoch": 1150} {"train_loss": -39.701961517333984, "global_step": 139227, "epoch": 1150} {"train_loss": -40.11516571044922, "global_step": 139228, "epoch": 1150} {"train_loss": -39.92913818359375, "global_step": 139229, "epoch": 1150} {"train_loss": -40.413734436035156, "global_step": 139230, "epoch": 1150} {"train_loss": -40.87882614135742, "global_step": 139231, "epoch": 1150} {"train_loss": -40.446533203125, "global_step": 139232, "epoch": 1150} {"train_loss": -39.59065628051758, "global_step": 139233, "epoch": 1150} {"train_loss": -40.29564666748047, "global_step": 139234, "epoch": 1150} {"train_loss": -40.00403594970703, "global_step": 139235, "epoch": 1150} {"train_loss": -39.77122497558594, "global_step": 139236, "epoch": 1150} {"train_loss": -40.15034866333008, "global_step": 139237, "epoch": 1150} {"train_loss": -41.25467300415039, "global_step": 139238, "epoch": 1150} {"train_loss": -39.589900970458984, "global_step": 139239, "epoch": 1150} {"train_loss": -40.69002914428711, "global_step": 139240, "epoch": 1150} {"train_loss": -40.513519287109375, "global_step": 139241, "epoch": 1150} {"train_loss": -40.91865158081055, "global_step": 139242, "epoch": 1150} {"train_loss": -40.075260162353516, "global_step": 139243, "epoch": 1150} {"train_loss": -40.731197357177734, "global_step": 139244, "epoch": 1150} {"train_loss": -40.52358627319336, "global_step": 139245, "epoch": 1150} {"train_loss": -39.834434509277344, "global_step": 139246, "epoch": 1150} {"train_loss": -40.9998893737793, "global_step": 139247, "epoch": 1150} {"train_loss": -39.883609771728516, "global_step": 139248, "epoch": 1150} {"train_loss": -40.422786712646484, "global_step": 139249, "epoch": 1150} {"train_loss": -40.544185638427734, "global_step": 139250, "epoch": 1150} {"train_loss": -39.5694465637207, "global_step": 139251, "epoch": 1150} {"train_loss": -40.043270111083984, "global_step": 139252, "epoch": 1150} {"train_loss": -40.24519729614258, "global_step": 139253, "epoch": 1150} {"train_loss": -39.0018196105957, "global_step": 139254, "epoch": 1150} {"train_loss": -38.24882888793945, "global_step": 139255, "epoch": 1150} {"train_loss": -39.3647575378418, "global_step": 139256, "epoch": 1150} {"train_loss": -40.38899612426758, "global_step": 139257, "epoch": 1150} {"train_loss": -39.7985954284668, "global_step": 139258, "epoch": 1150} {"train_loss": -37.84456253051758, "global_step": 139259, "epoch": 1150} {"train_loss": -38.82539749145508, "global_step": 139260, "epoch": 1150} {"train_loss": -39.27473068237305, "global_step": 139261, "epoch": 1150} {"train_loss": -39.59267807006836, "global_step": 139262, "epoch": 1150} {"train_loss": -39.064735412597656, "global_step": 139263, "epoch": 1150} {"train_loss": -38.56789779663086, "global_step": 139264, "epoch": 1150} {"train_loss": -38.829952239990234, "global_step": 139265, "epoch": 1150} {"train_loss": -39.551513671875, "global_step": 139266, "epoch": 1150} {"train_loss": -38.997867584228516, "global_step": 139267, "epoch": 1150} {"train_loss": -37.47854232788086, "global_step": 139268, "epoch": 1150} {"train_loss": -39.0369987487793, "global_step": 139269, "epoch": 1150} {"train_loss": -40.10007243511105, "global_step": 139270, "epoch": 1150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 0.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 2516386.5} {"train_loss": -38.37411880493164, "global_step": 139271, "epoch": 1151} {"train_loss": -39.96599197387695, "global_step": 139272, "epoch": 1151} {"train_loss": -38.22663497924805, "global_step": 139273, "epoch": 1151} {"train_loss": -37.72428512573242, "global_step": 139274, "epoch": 1151} {"train_loss": -38.55721664428711, "global_step": 139275, "epoch": 1151} {"train_loss": -38.544612884521484, "global_step": 139276, "epoch": 1151} {"train_loss": -36.519412994384766, "global_step": 139277, "epoch": 1151} {"train_loss": -33.77360916137695, "global_step": 139278, "epoch": 1151} {"train_loss": -37.38942337036133, "global_step": 139279, "epoch": 1151} {"train_loss": -38.7006950378418, "global_step": 139280, "epoch": 1151} {"train_loss": -32.850460052490234, "global_step": 139281, "epoch": 1151} {"train_loss": -36.240726470947266, "global_step": 139282, "epoch": 1151} {"train_loss": -37.479835510253906, "global_step": 139283, "epoch": 1151} {"train_loss": -38.55683517456055, "global_step": 139284, "epoch": 1151} {"train_loss": -37.74077606201172, "global_step": 139285, "epoch": 1151} {"train_loss": -39.11320114135742, "global_step": 139286, "epoch": 1151} {"train_loss": -36.13618469238281, "global_step": 139287, "epoch": 1151} {"train_loss": -38.287593841552734, "global_step": 139288, "epoch": 1151} {"train_loss": -38.291683197021484, "global_step": 139289, "epoch": 1151} {"train_loss": -37.51618194580078, "global_step": 139290, "epoch": 1151} {"train_loss": -36.63545608520508, "global_step": 139291, "epoch": 1151} {"train_loss": -39.17158508300781, "global_step": 139292, "epoch": 1151} {"train_loss": -37.78339385986328, "global_step": 139293, "epoch": 1151} {"train_loss": -38.988525390625, "global_step": 139294, "epoch": 1151} {"train_loss": -38.662574768066406, "global_step": 139295, "epoch": 1151} {"train_loss": -37.34883499145508, "global_step": 139296, "epoch": 1151} {"train_loss": -37.289485931396484, "global_step": 139297, "epoch": 1151} {"train_loss": -38.458587646484375, "global_step": 139298, "epoch": 1151} {"train_loss": -38.91181564331055, "global_step": 139299, "epoch": 1151} {"train_loss": -37.88190460205078, "global_step": 139300, "epoch": 1151} {"train_loss": -39.05436325073242, "global_step": 139301, "epoch": 1151} {"train_loss": -38.4063835144043, "global_step": 139302, "epoch": 1151} {"train_loss": -39.296241760253906, "global_step": 139303, "epoch": 1151} {"train_loss": -38.63240432739258, "global_step": 139304, "epoch": 1151} {"train_loss": -39.309574127197266, "global_step": 139305, "epoch": 1151} {"train_loss": -38.1347770690918, "global_step": 139306, "epoch": 1151} {"train_loss": -37.27733612060547, "global_step": 139307, "epoch": 1151} {"train_loss": -37.06377410888672, "global_step": 139308, "epoch": 1151} {"train_loss": -39.36030197143555, "global_step": 139309, "epoch": 1151} {"train_loss": -39.13483428955078, "global_step": 139310, "epoch": 1151} {"train_loss": -38.49856185913086, "global_step": 139311, "epoch": 1151} {"train_loss": -39.02425003051758, "global_step": 139312, "epoch": 1151} {"train_loss": -39.16693878173828, "global_step": 139313, "epoch": 1151} {"train_loss": -38.49271774291992, "global_step": 139314, "epoch": 1151} {"train_loss": -39.45935821533203, "global_step": 139315, "epoch": 1151} {"train_loss": -39.4707145690918, "global_step": 139316, "epoch": 1151} {"train_loss": -35.87004470825195, "global_step": 139317, "epoch": 1151} {"train_loss": -39.009342193603516, "global_step": 139318, "epoch": 1151} {"train_loss": -39.25642395019531, "global_step": 139319, "epoch": 1151} {"train_loss": -39.306922912597656, "global_step": 139320, "epoch": 1151} {"train_loss": -38.934017181396484, "global_step": 139321, "epoch": 1151} {"train_loss": -39.12191390991211, "global_step": 139322, "epoch": 1151} {"train_loss": -39.96249008178711, "global_step": 139323, "epoch": 1151} {"train_loss": -39.31241989135742, "global_step": 139324, "epoch": 1151} {"train_loss": -39.31659698486328, "global_step": 139325, "epoch": 1151} {"train_loss": -39.99176788330078, "global_step": 139326, "epoch": 1151} {"train_loss": -40.1585693359375, "global_step": 139327, "epoch": 1151} {"train_loss": -40.119930267333984, "global_step": 139328, "epoch": 1151} {"train_loss": -40.1513786315918, "global_step": 139329, "epoch": 1151} {"train_loss": -39.87244415283203, "global_step": 139330, "epoch": 1151} {"train_loss": -39.390865325927734, "global_step": 139331, "epoch": 1151} {"train_loss": -40.0838737487793, "global_step": 139332, "epoch": 1151} {"train_loss": -38.222469329833984, "global_step": 139333, "epoch": 1151} {"train_loss": -39.82968521118164, "global_step": 139334, "epoch": 1151} {"train_loss": -39.67082214355469, "global_step": 139335, "epoch": 1151} {"train_loss": -39.76291275024414, "global_step": 139336, "epoch": 1151} {"train_loss": -40.30481719970703, "global_step": 139337, "epoch": 1151} {"train_loss": -40.181575775146484, "global_step": 139338, "epoch": 1151} {"train_loss": -40.12630081176758, "global_step": 139339, "epoch": 1151} {"train_loss": -40.494300842285156, "global_step": 139340, "epoch": 1151} {"train_loss": -40.071319580078125, "global_step": 139341, "epoch": 1151} {"train_loss": -40.85200881958008, "global_step": 139342, "epoch": 1151} {"train_loss": -40.39851760864258, "global_step": 139343, "epoch": 1151} {"train_loss": -39.797698974609375, "global_step": 139344, "epoch": 1151} {"train_loss": -39.96997833251953, "global_step": 139345, "epoch": 1151} {"train_loss": -39.81276321411133, "global_step": 139346, "epoch": 1151} {"train_loss": -40.93180847167969, "global_step": 139347, "epoch": 1151} {"train_loss": -40.70489501953125, "global_step": 139348, "epoch": 1151} {"train_loss": -40.05894088745117, "global_step": 139349, "epoch": 1151} {"train_loss": -40.52322769165039, "global_step": 139350, "epoch": 1151} {"train_loss": -40.24931716918945, "global_step": 139351, "epoch": 1151} {"train_loss": -40.8781852722168, "global_step": 139352, "epoch": 1151} {"train_loss": -40.55387878417969, "global_step": 139353, "epoch": 1151} {"train_loss": -40.46202850341797, "global_step": 139354, "epoch": 1151} {"train_loss": -41.07107162475586, "global_step": 139355, "epoch": 1151} {"train_loss": -40.73861312866211, "global_step": 139356, "epoch": 1151} {"train_loss": -40.83527374267578, "global_step": 139357, "epoch": 1151} {"train_loss": -40.66765594482422, "global_step": 139358, "epoch": 1151} {"train_loss": -41.41932678222656, "global_step": 139359, "epoch": 1151} {"train_loss": -40.908267974853516, "global_step": 139360, "epoch": 1151} {"train_loss": -40.20302963256836, "global_step": 139361, "epoch": 1151} {"train_loss": -40.62409210205078, "global_step": 139362, "epoch": 1151} {"train_loss": -41.15779495239258, "global_step": 139363, "epoch": 1151} {"train_loss": -41.14014434814453, "global_step": 139364, "epoch": 1151} {"train_loss": -41.22254943847656, "global_step": 139365, "epoch": 1151} {"train_loss": -40.54157257080078, "global_step": 139366, "epoch": 1151} {"train_loss": -41.4049186706543, "global_step": 139367, "epoch": 1151} {"train_loss": -41.175533294677734, "global_step": 139368, "epoch": 1151} {"train_loss": -40.80303192138672, "global_step": 139369, "epoch": 1151} {"train_loss": -41.64057922363281, "global_step": 139370, "epoch": 1151} {"train_loss": -40.600196838378906, "global_step": 139371, "epoch": 1151} {"train_loss": -40.05537796020508, "global_step": 139372, "epoch": 1151} {"train_loss": -40.83443069458008, "global_step": 139373, "epoch": 1151} {"train_loss": -41.0732421875, "global_step": 139374, "epoch": 1151} {"train_loss": -40.726234436035156, "global_step": 139375, "epoch": 1151} {"train_loss": -40.5952262878418, "global_step": 139376, "epoch": 1151} {"train_loss": -39.69700622558594, "global_step": 139377, "epoch": 1151} {"train_loss": -40.25220489501953, "global_step": 139378, "epoch": 1151} {"train_loss": -40.59172058105469, "global_step": 139379, "epoch": 1151} {"train_loss": -40.8108024597168, "global_step": 139380, "epoch": 1151} {"train_loss": -40.26909637451172, "global_step": 139381, "epoch": 1151} {"train_loss": -38.10537338256836, "global_step": 139382, "epoch": 1151} {"train_loss": -35.21660232543945, "global_step": 139383, "epoch": 1151} {"train_loss": -32.15224075317383, "global_step": 139384, "epoch": 1151} {"train_loss": -33.48247146606445, "global_step": 139385, "epoch": 1151} {"train_loss": -40.18040084838867, "global_step": 139386, "epoch": 1151} {"train_loss": -37.99630355834961, "global_step": 139387, "epoch": 1151} {"train_loss": -34.1580696105957, "global_step": 139388, "epoch": 1151} {"train_loss": -33.24732208251953, "global_step": 139389, "epoch": 1151} {"train_loss": -39.25321578979492, "global_step": 139390, "epoch": 1151} {"train_loss": -39.05278822213165, "global_step": 139391, "epoch": 1151, "val_loss": 2574448.25} {"train_loss": -36.415775299072266, "global_step": 139392, "epoch": 1152} {"train_loss": -39.30501174926758, "global_step": 139393, "epoch": 1152} {"train_loss": -37.53277587890625, "global_step": 139394, "epoch": 1152} {"train_loss": -38.46596145629883, "global_step": 139395, "epoch": 1152} {"train_loss": -39.69900131225586, "global_step": 139396, "epoch": 1152} {"train_loss": -39.181697845458984, "global_step": 139397, "epoch": 1152} {"train_loss": -39.68708419799805, "global_step": 139398, "epoch": 1152} {"train_loss": -39.669464111328125, "global_step": 139399, "epoch": 1152} {"train_loss": -39.213226318359375, "global_step": 139400, "epoch": 1152} {"train_loss": -39.880184173583984, "global_step": 139401, "epoch": 1152} {"train_loss": -39.702125549316406, "global_step": 139402, "epoch": 1152} {"train_loss": -39.23749923706055, "global_step": 139403, "epoch": 1152} {"train_loss": -39.01334762573242, "global_step": 139404, "epoch": 1152} {"train_loss": -39.46733856201172, "global_step": 139405, "epoch": 1152} {"train_loss": -40.192710876464844, "global_step": 139406, "epoch": 1152} {"train_loss": -39.824623107910156, "global_step": 139407, "epoch": 1152} {"train_loss": -39.90336227416992, "global_step": 139408, "epoch": 1152} {"train_loss": -40.13581085205078, "global_step": 139409, "epoch": 1152} {"train_loss": -40.26986312866211, "global_step": 139410, "epoch": 1152} {"train_loss": -40.24871826171875, "global_step": 139411, "epoch": 1152} {"train_loss": -39.336029052734375, "global_step": 139412, "epoch": 1152} {"train_loss": -39.62598419189453, "global_step": 139413, "epoch": 1152} {"train_loss": -40.388389587402344, "global_step": 139414, "epoch": 1152} {"train_loss": -39.9879035949707, "global_step": 139415, "epoch": 1152} {"train_loss": -40.37261962890625, "global_step": 139416, "epoch": 1152} {"train_loss": -40.14390182495117, "global_step": 139417, "epoch": 1152} {"train_loss": -39.32183837890625, "global_step": 139418, "epoch": 1152} {"train_loss": -40.299896240234375, "global_step": 139419, "epoch": 1152} {"train_loss": -39.859825134277344, "global_step": 139420, "epoch": 1152} {"train_loss": -40.18308639526367, "global_step": 139421, "epoch": 1152} {"train_loss": -39.855445861816406, "global_step": 139422, "epoch": 1152} {"train_loss": -40.1255989074707, "global_step": 139423, "epoch": 1152} {"train_loss": -39.59098434448242, "global_step": 139424, "epoch": 1152} {"train_loss": -39.45184326171875, "global_step": 139425, "epoch": 1152} {"train_loss": -40.27818298339844, "global_step": 139426, "epoch": 1152} {"train_loss": -39.4640007019043, "global_step": 139427, "epoch": 1152} {"train_loss": -40.1629524230957, "global_step": 139428, "epoch": 1152} {"train_loss": -40.31077575683594, "global_step": 139429, "epoch": 1152} {"train_loss": -40.58268356323242, "global_step": 139430, "epoch": 1152} {"train_loss": -40.51054000854492, "global_step": 139431, "epoch": 1152} {"train_loss": -40.76125717163086, "global_step": 139432, "epoch": 1152} {"train_loss": -40.389278411865234, "global_step": 139433, "epoch": 1152} {"train_loss": -40.32484817504883, "global_step": 139434, "epoch": 1152} {"train_loss": -40.61180114746094, "global_step": 139435, "epoch": 1152} {"train_loss": -40.7744026184082, "global_step": 139436, "epoch": 1152} {"train_loss": -40.10006332397461, "global_step": 139437, "epoch": 1152} {"train_loss": -40.85477828979492, "global_step": 139438, "epoch": 1152} {"train_loss": -40.46644973754883, "global_step": 139439, "epoch": 1152} {"train_loss": -40.112693786621094, "global_step": 139440, "epoch": 1152} {"train_loss": -40.41840744018555, "global_step": 139441, "epoch": 1152} {"train_loss": -40.228694915771484, "global_step": 139442, "epoch": 1152} {"train_loss": -39.83978271484375, "global_step": 139443, "epoch": 1152} {"train_loss": -41.050289154052734, "global_step": 139444, "epoch": 1152} {"train_loss": -40.458709716796875, "global_step": 139445, "epoch": 1152} {"train_loss": -40.6776123046875, "global_step": 139446, "epoch": 1152} {"train_loss": -40.03766632080078, "global_step": 139447, "epoch": 1152} {"train_loss": -40.88044357299805, "global_step": 139448, "epoch": 1152} {"train_loss": -40.91291046142578, "global_step": 139449, "epoch": 1152} {"train_loss": -40.98870849609375, "global_step": 139450, "epoch": 1152} {"train_loss": -40.59524154663086, "global_step": 139451, "epoch": 1152} {"train_loss": -41.209957122802734, "global_step": 139452, "epoch": 1152} {"train_loss": -40.7981071472168, "global_step": 139453, "epoch": 1152} {"train_loss": -40.43292236328125, "global_step": 139454, "epoch": 1152} {"train_loss": -41.118648529052734, "global_step": 139455, "epoch": 1152} {"train_loss": -41.142478942871094, "global_step": 139456, "epoch": 1152} {"train_loss": -40.765960693359375, "global_step": 139457, "epoch": 1152} {"train_loss": -40.611839294433594, "global_step": 139458, "epoch": 1152} {"train_loss": -40.23431396484375, "global_step": 139459, "epoch": 1152} {"train_loss": -41.013526916503906, "global_step": 139460, "epoch": 1152} {"train_loss": -39.99738693237305, "global_step": 139461, "epoch": 1152} {"train_loss": -40.692325592041016, "global_step": 139462, "epoch": 1152} {"train_loss": -40.507568359375, "global_step": 139463, "epoch": 1152} {"train_loss": -40.996551513671875, "global_step": 139464, "epoch": 1152} {"train_loss": -40.78959274291992, "global_step": 139465, "epoch": 1152} {"train_loss": -40.55068588256836, "global_step": 139466, "epoch": 1152} {"train_loss": -40.67123031616211, "global_step": 139467, "epoch": 1152} {"train_loss": -40.51308822631836, "global_step": 139468, "epoch": 1152} {"train_loss": -40.59233474731445, "global_step": 139469, "epoch": 1152} {"train_loss": -40.757652282714844, "global_step": 139470, "epoch": 1152} {"train_loss": -40.2786750793457, "global_step": 139471, "epoch": 1152} {"train_loss": -40.65440368652344, "global_step": 139472, "epoch": 1152} {"train_loss": -40.52376174926758, "global_step": 139473, "epoch": 1152} {"train_loss": -40.3624153137207, "global_step": 139474, "epoch": 1152} {"train_loss": -40.036251068115234, "global_step": 139475, "epoch": 1152} {"train_loss": -40.32937240600586, "global_step": 139476, "epoch": 1152} {"train_loss": -39.81294631958008, "global_step": 139477, "epoch": 1152} {"train_loss": -40.10624313354492, "global_step": 139478, "epoch": 1152} {"train_loss": -38.529510498046875, "global_step": 139479, "epoch": 1152} {"train_loss": -40.42994689941406, "global_step": 139480, "epoch": 1152} {"train_loss": -39.79392623901367, "global_step": 139481, "epoch": 1152} {"train_loss": -38.01076889038086, "global_step": 139482, "epoch": 1152} {"train_loss": -37.60792541503906, "global_step": 139483, "epoch": 1152} {"train_loss": -39.310726165771484, "global_step": 139484, "epoch": 1152} {"train_loss": -40.02543258666992, "global_step": 139485, "epoch": 1152} {"train_loss": -36.11335372924805, "global_step": 139486, "epoch": 1152} {"train_loss": -38.323204040527344, "global_step": 139487, "epoch": 1152} {"train_loss": -38.69949722290039, "global_step": 139488, "epoch": 1152} {"train_loss": -37.7424430847168, "global_step": 139489, "epoch": 1152} {"train_loss": -37.69124984741211, "global_step": 139490, "epoch": 1152} {"train_loss": -38.157958984375, "global_step": 139491, "epoch": 1152} {"train_loss": -37.989158630371094, "global_step": 139492, "epoch": 1152} {"train_loss": -39.53110885620117, "global_step": 139493, "epoch": 1152} {"train_loss": -36.98332214355469, "global_step": 139494, "epoch": 1152} {"train_loss": -38.64551544189453, "global_step": 139495, "epoch": 1152} {"train_loss": -38.45208740234375, "global_step": 139496, "epoch": 1152} {"train_loss": -37.89662551879883, "global_step": 139497, "epoch": 1152} {"train_loss": -39.56812286376953, "global_step": 139498, "epoch": 1152} {"train_loss": -38.90894317626953, "global_step": 139499, "epoch": 1152} {"train_loss": -35.67441177368164, "global_step": 139500, "epoch": 1152} {"train_loss": -39.744625091552734, "global_step": 139501, "epoch": 1152} {"train_loss": -37.06874084472656, "global_step": 139502, "epoch": 1152} {"train_loss": -38.64359664916992, "global_step": 139503, "epoch": 1152} {"train_loss": -39.39653778076172, "global_step": 139504, "epoch": 1152} {"train_loss": -39.59217071533203, "global_step": 139505, "epoch": 1152} {"train_loss": -39.61403274536133, "global_step": 139506, "epoch": 1152} {"train_loss": -39.452693939208984, "global_step": 139507, "epoch": 1152} {"train_loss": -40.4640998840332, "global_step": 139508, "epoch": 1152} {"train_loss": -38.37697982788086, "global_step": 139509, "epoch": 1152} {"train_loss": -40.27188491821289, "global_step": 139510, "epoch": 1152} {"train_loss": -38.72316360473633, "global_step": 139511, "epoch": 1152} {"train_loss": -39.73467323996804, "global_step": 139512, "epoch": 1152, "val_loss": 2622073.25} {"train_loss": -40.2623176574707, "global_step": 139513, "epoch": 1153} {"train_loss": -39.783607482910156, "global_step": 139514, "epoch": 1153} {"train_loss": -39.812679290771484, "global_step": 139515, "epoch": 1153} {"train_loss": -40.41289138793945, "global_step": 139516, "epoch": 1153} {"train_loss": -40.00435256958008, "global_step": 139517, "epoch": 1153} {"train_loss": -40.180755615234375, "global_step": 139518, "epoch": 1153} {"train_loss": -40.27349853515625, "global_step": 139519, "epoch": 1153} {"train_loss": -39.51990509033203, "global_step": 139520, "epoch": 1153} {"train_loss": -40.450984954833984, "global_step": 139521, "epoch": 1153} {"train_loss": -40.46072006225586, "global_step": 139522, "epoch": 1153} {"train_loss": -40.08436965942383, "global_step": 139523, "epoch": 1153} {"train_loss": -40.24271774291992, "global_step": 139524, "epoch": 1153} {"train_loss": -40.479122161865234, "global_step": 139525, "epoch": 1153} {"train_loss": -39.92499542236328, "global_step": 139526, "epoch": 1153} {"train_loss": -40.42022705078125, "global_step": 139527, "epoch": 1153} {"train_loss": -40.23862838745117, "global_step": 139528, "epoch": 1153} {"train_loss": -40.769805908203125, "global_step": 139529, "epoch": 1153} {"train_loss": -40.70954513549805, "global_step": 139530, "epoch": 1153} {"train_loss": -40.76893615722656, "global_step": 139531, "epoch": 1153} {"train_loss": -39.794090270996094, "global_step": 139532, "epoch": 1153} {"train_loss": -40.62552261352539, "global_step": 139533, "epoch": 1153} {"train_loss": -40.42409133911133, "global_step": 139534, "epoch": 1153} {"train_loss": -40.31255340576172, "global_step": 139535, "epoch": 1153} {"train_loss": -40.56278610229492, "global_step": 139536, "epoch": 1153} {"train_loss": -40.47223663330078, "global_step": 139537, "epoch": 1153} {"train_loss": -40.48103332519531, "global_step": 139538, "epoch": 1153} {"train_loss": -40.72306442260742, "global_step": 139539, "epoch": 1153} {"train_loss": -41.11538314819336, "global_step": 139540, "epoch": 1153} {"train_loss": -40.85429763793945, "global_step": 139541, "epoch": 1153} {"train_loss": -40.24745178222656, "global_step": 139542, "epoch": 1153} {"train_loss": -40.45923614501953, "global_step": 139543, "epoch": 1153} {"train_loss": -40.77816390991211, "global_step": 139544, "epoch": 1153} {"train_loss": -40.3358268737793, "global_step": 139545, "epoch": 1153} {"train_loss": -40.50655746459961, "global_step": 139546, "epoch": 1153} {"train_loss": -40.20815658569336, "global_step": 139547, "epoch": 1153} {"train_loss": -40.567962646484375, "global_step": 139548, "epoch": 1153} {"train_loss": -40.17926788330078, "global_step": 139549, "epoch": 1153} {"train_loss": -40.00788116455078, "global_step": 139550, "epoch": 1153} {"train_loss": -40.98429489135742, "global_step": 139551, "epoch": 1153} {"train_loss": -40.04790496826172, "global_step": 139552, "epoch": 1153} {"train_loss": -40.781063079833984, "global_step": 139553, "epoch": 1153} {"train_loss": -40.78556442260742, "global_step": 139554, "epoch": 1153} {"train_loss": -40.78984832763672, "global_step": 139555, "epoch": 1153} {"train_loss": -41.09070587158203, "global_step": 139556, "epoch": 1153} {"train_loss": -40.7082633972168, "global_step": 139557, "epoch": 1153} {"train_loss": -40.225521087646484, "global_step": 139558, "epoch": 1153} {"train_loss": -41.24149703979492, "global_step": 139559, "epoch": 1153} {"train_loss": -40.384552001953125, "global_step": 139560, "epoch": 1153} {"train_loss": -39.8719596862793, "global_step": 139561, "epoch": 1153} {"train_loss": -41.0377197265625, "global_step": 139562, "epoch": 1153} {"train_loss": -41.1865234375, "global_step": 139563, "epoch": 1153} {"train_loss": -40.647090911865234, "global_step": 139564, "epoch": 1153} {"train_loss": -40.89467239379883, "global_step": 139565, "epoch": 1153} {"train_loss": -40.92650604248047, "global_step": 139566, "epoch": 1153} {"train_loss": -40.80113220214844, "global_step": 139567, "epoch": 1153} {"train_loss": -40.63362503051758, "global_step": 139568, "epoch": 1153} {"train_loss": -40.6104850769043, "global_step": 139569, "epoch": 1153} {"train_loss": -40.62608337402344, "global_step": 139570, "epoch": 1153} {"train_loss": -40.72649383544922, "global_step": 139571, "epoch": 1153} {"train_loss": -39.4510498046875, "global_step": 139572, "epoch": 1153} {"train_loss": -38.93488311767578, "global_step": 139573, "epoch": 1153} {"train_loss": -40.4609260559082, "global_step": 139574, "epoch": 1153} {"train_loss": -36.49874496459961, "global_step": 139575, "epoch": 1153} {"train_loss": -40.32033157348633, "global_step": 139576, "epoch": 1153} {"train_loss": -38.25741195678711, "global_step": 139577, "epoch": 1153} {"train_loss": -39.08193588256836, "global_step": 139578, "epoch": 1153} {"train_loss": -40.042213439941406, "global_step": 139579, "epoch": 1153} {"train_loss": -36.173980712890625, "global_step": 139580, "epoch": 1153} {"train_loss": -33.636863708496094, "global_step": 139581, "epoch": 1153} {"train_loss": -39.361236572265625, "global_step": 139582, "epoch": 1153} {"train_loss": -34.36213684082031, "global_step": 139583, "epoch": 1153} {"train_loss": -35.32855224609375, "global_step": 139584, "epoch": 1153} {"train_loss": -39.050567626953125, "global_step": 139585, "epoch": 1153} {"train_loss": -37.32088851928711, "global_step": 139586, "epoch": 1153} {"train_loss": -38.841400146484375, "global_step": 139587, "epoch": 1153} {"train_loss": -39.40229034423828, "global_step": 139588, "epoch": 1153} {"train_loss": -37.40357208251953, "global_step": 139589, "epoch": 1153} {"train_loss": -38.5449333190918, "global_step": 139590, "epoch": 1153} {"train_loss": -39.84975051879883, "global_step": 139591, "epoch": 1153} {"train_loss": -37.73133087158203, "global_step": 139592, "epoch": 1153} {"train_loss": -36.547054290771484, "global_step": 139593, "epoch": 1153} {"train_loss": -39.24819564819336, "global_step": 139594, "epoch": 1153} {"train_loss": -39.2618408203125, "global_step": 139595, "epoch": 1153} {"train_loss": -38.64620590209961, "global_step": 139596, "epoch": 1153} {"train_loss": -40.338958740234375, "global_step": 139597, "epoch": 1153} {"train_loss": -38.549835205078125, "global_step": 139598, "epoch": 1153} {"train_loss": -38.629249572753906, "global_step": 139599, "epoch": 1153} {"train_loss": -37.82148361206055, "global_step": 139600, "epoch": 1153} {"train_loss": -39.51897430419922, "global_step": 139601, "epoch": 1153} {"train_loss": -33.89506912231445, "global_step": 139602, "epoch": 1153} {"train_loss": -39.842525482177734, "global_step": 139603, "epoch": 1153} {"train_loss": -38.1207389831543, "global_step": 139604, "epoch": 1153} {"train_loss": -34.80835723876953, "global_step": 139605, "epoch": 1153} {"train_loss": -38.7353515625, "global_step": 139606, "epoch": 1153} {"train_loss": -35.97136688232422, "global_step": 139607, "epoch": 1153} {"train_loss": -38.542030334472656, "global_step": 139608, "epoch": 1153} {"train_loss": -38.68383026123047, "global_step": 139609, "epoch": 1153} {"train_loss": -37.82865524291992, "global_step": 139610, "epoch": 1153} {"train_loss": -38.19684600830078, "global_step": 139611, "epoch": 1153} {"train_loss": -37.84189987182617, "global_step": 139612, "epoch": 1153} {"train_loss": -38.65390396118164, "global_step": 139613, "epoch": 1153} {"train_loss": -38.0470085144043, "global_step": 139614, "epoch": 1153} {"train_loss": -39.39992141723633, "global_step": 139615, "epoch": 1153} {"train_loss": -38.5152473449707, "global_step": 139616, "epoch": 1153} {"train_loss": -38.99924850463867, "global_step": 139617, "epoch": 1153} {"train_loss": -38.76884460449219, "global_step": 139618, "epoch": 1153} {"train_loss": -39.47140121459961, "global_step": 139619, "epoch": 1153} {"train_loss": -39.20146560668945, "global_step": 139620, "epoch": 1153} {"train_loss": -39.46112060546875, "global_step": 139621, "epoch": 1153} {"train_loss": -38.70105743408203, "global_step": 139622, "epoch": 1153} {"train_loss": -40.1580924987793, "global_step": 139623, "epoch": 1153} {"train_loss": -39.03413009643555, "global_step": 139624, "epoch": 1153} {"train_loss": -39.0166130065918, "global_step": 139625, "epoch": 1153} {"train_loss": -39.73197555541992, "global_step": 139626, "epoch": 1153} {"train_loss": -39.406097412109375, "global_step": 139627, "epoch": 1153} {"train_loss": -39.73486328125, "global_step": 139628, "epoch": 1153} {"train_loss": -39.664608001708984, "global_step": 139629, "epoch": 1153} {"train_loss": -39.92722702026367, "global_step": 139630, "epoch": 1153} {"train_loss": -39.74094009399414, "global_step": 139631, "epoch": 1153} {"train_loss": -40.2867546081543, "global_step": 139632, "epoch": 1153} {"train_loss": -39.46605108592136, "global_step": 139633, "epoch": 1153, "val_loss": 2594788.5} {"train_loss": -40.27289962768555, "global_step": 139634, "epoch": 1154} {"train_loss": -40.13044357299805, "global_step": 139635, "epoch": 1154} {"train_loss": -40.06277847290039, "global_step": 139636, "epoch": 1154} {"train_loss": -40.345638275146484, "global_step": 139637, "epoch": 1154} {"train_loss": -40.25863265991211, "global_step": 139638, "epoch": 1154} {"train_loss": -39.91559600830078, "global_step": 139639, "epoch": 1154} {"train_loss": -39.921390533447266, "global_step": 139640, "epoch": 1154} {"train_loss": -41.02158737182617, "global_step": 139641, "epoch": 1154} {"train_loss": -40.51594924926758, "global_step": 139642, "epoch": 1154} {"train_loss": -40.36330032348633, "global_step": 139643, "epoch": 1154} {"train_loss": -40.04256820678711, "global_step": 139644, "epoch": 1154} {"train_loss": -40.12226104736328, "global_step": 139645, "epoch": 1154} {"train_loss": -40.83431625366211, "global_step": 139646, "epoch": 1154} {"train_loss": -41.190704345703125, "global_step": 139647, "epoch": 1154} {"train_loss": -40.77554702758789, "global_step": 139648, "epoch": 1154} {"train_loss": -41.081912994384766, "global_step": 139649, "epoch": 1154} {"train_loss": -40.59603500366211, "global_step": 139650, "epoch": 1154} {"train_loss": -40.7944450378418, "global_step": 139651, "epoch": 1154} {"train_loss": -40.3464469909668, "global_step": 139652, "epoch": 1154} {"train_loss": -41.16162109375, "global_step": 139653, "epoch": 1154} {"train_loss": -40.74396514892578, "global_step": 139654, "epoch": 1154} {"train_loss": -41.130577087402344, "global_step": 139655, "epoch": 1154} {"train_loss": -40.79988479614258, "global_step": 139656, "epoch": 1154} {"train_loss": -40.850196838378906, "global_step": 139657, "epoch": 1154} {"train_loss": -40.950416564941406, "global_step": 139658, "epoch": 1154} {"train_loss": -40.58659744262695, "global_step": 139659, "epoch": 1154} {"train_loss": -39.9966926574707, "global_step": 139660, "epoch": 1154} {"train_loss": -41.05445861816406, "global_step": 139661, "epoch": 1154} {"train_loss": -40.865753173828125, "global_step": 139662, "epoch": 1154} {"train_loss": -40.609867095947266, "global_step": 139663, "epoch": 1154} {"train_loss": -41.047515869140625, "global_step": 139664, "epoch": 1154} {"train_loss": -41.1038818359375, "global_step": 139665, "epoch": 1154} {"train_loss": -40.39474868774414, "global_step": 139666, "epoch": 1154} {"train_loss": -41.077239990234375, "global_step": 139667, "epoch": 1154} {"train_loss": -40.109344482421875, "global_step": 139668, "epoch": 1154} {"train_loss": -40.736534118652344, "global_step": 139669, "epoch": 1154} {"train_loss": -39.428524017333984, "global_step": 139670, "epoch": 1154} {"train_loss": -40.003013610839844, "global_step": 139671, "epoch": 1154} {"train_loss": -40.61289978027344, "global_step": 139672, "epoch": 1154} {"train_loss": -40.60206985473633, "global_step": 139673, "epoch": 1154} {"train_loss": -40.890960693359375, "global_step": 139674, "epoch": 1154} {"train_loss": -40.897216796875, "global_step": 139675, "epoch": 1154} {"train_loss": -39.644771575927734, "global_step": 139676, "epoch": 1154} {"train_loss": -39.96291732788086, "global_step": 139677, "epoch": 1154} {"train_loss": -39.63536071777344, "global_step": 139678, "epoch": 1154} {"train_loss": -38.609310150146484, "global_step": 139679, "epoch": 1154} {"train_loss": -36.44742965698242, "global_step": 139680, "epoch": 1154} {"train_loss": -39.59553909301758, "global_step": 139681, "epoch": 1154} {"train_loss": -40.01851272583008, "global_step": 139682, "epoch": 1154} {"train_loss": -40.59285354614258, "global_step": 139683, "epoch": 1154} {"train_loss": -39.8914680480957, "global_step": 139684, "epoch": 1154} {"train_loss": -38.30849075317383, "global_step": 139685, "epoch": 1154} {"train_loss": -35.25041580200195, "global_step": 139686, "epoch": 1154} {"train_loss": -39.42665100097656, "global_step": 139687, "epoch": 1154} {"train_loss": -38.69916534423828, "global_step": 139688, "epoch": 1154} {"train_loss": -36.95315170288086, "global_step": 139689, "epoch": 1154} {"train_loss": -39.17056655883789, "global_step": 139690, "epoch": 1154} {"train_loss": -39.25956344604492, "global_step": 139691, "epoch": 1154} {"train_loss": -39.33644104003906, "global_step": 139692, "epoch": 1154} {"train_loss": -38.0767707824707, "global_step": 139693, "epoch": 1154} {"train_loss": -37.97937774658203, "global_step": 139694, "epoch": 1154} {"train_loss": -39.639163970947266, "global_step": 139695, "epoch": 1154} {"train_loss": -39.37868118286133, "global_step": 139696, "epoch": 1154} {"train_loss": -37.32305908203125, "global_step": 139697, "epoch": 1154} {"train_loss": -38.93416976928711, "global_step": 139698, "epoch": 1154} {"train_loss": -39.83779525756836, "global_step": 139699, "epoch": 1154} {"train_loss": -37.39207077026367, "global_step": 139700, "epoch": 1154} {"train_loss": -37.50490188598633, "global_step": 139701, "epoch": 1154} {"train_loss": -38.97224807739258, "global_step": 139702, "epoch": 1154} {"train_loss": -37.42390060424805, "global_step": 139703, "epoch": 1154} {"train_loss": -39.15730667114258, "global_step": 139704, "epoch": 1154} {"train_loss": -40.0427360534668, "global_step": 139705, "epoch": 1154} {"train_loss": -38.08878707885742, "global_step": 139706, "epoch": 1154} {"train_loss": -39.21675109863281, "global_step": 139707, "epoch": 1154} {"train_loss": -40.04663848876953, "global_step": 139708, "epoch": 1154} {"train_loss": -38.724342346191406, "global_step": 139709, "epoch": 1154} {"train_loss": -39.45796585083008, "global_step": 139710, "epoch": 1154} {"train_loss": -38.666744232177734, "global_step": 139711, "epoch": 1154} {"train_loss": -39.00053024291992, "global_step": 139712, "epoch": 1154} {"train_loss": -39.787288665771484, "global_step": 139713, "epoch": 1154} {"train_loss": -40.397926330566406, "global_step": 139714, "epoch": 1154} {"train_loss": -39.699005126953125, "global_step": 139715, "epoch": 1154} {"train_loss": -40.08491134643555, "global_step": 139716, "epoch": 1154} {"train_loss": -40.25078582763672, "global_step": 139717, "epoch": 1154} {"train_loss": -40.42936706542969, "global_step": 139718, "epoch": 1154} {"train_loss": -40.1734733581543, "global_step": 139719, "epoch": 1154} {"train_loss": -40.455745697021484, "global_step": 139720, "epoch": 1154} {"train_loss": -40.8427619934082, "global_step": 139721, "epoch": 1154} {"train_loss": -40.877559661865234, "global_step": 139722, "epoch": 1154} {"train_loss": -40.42582321166992, "global_step": 139723, "epoch": 1154} {"train_loss": -40.5533447265625, "global_step": 139724, "epoch": 1154} {"train_loss": -40.57469177246094, "global_step": 139725, "epoch": 1154} {"train_loss": -40.34269332885742, "global_step": 139726, "epoch": 1154} {"train_loss": -41.20487594604492, "global_step": 139727, "epoch": 1154} {"train_loss": -40.909725189208984, "global_step": 139728, "epoch": 1154} {"train_loss": -40.46772766113281, "global_step": 139729, "epoch": 1154} {"train_loss": -41.16666793823242, "global_step": 139730, "epoch": 1154} {"train_loss": -41.045204162597656, "global_step": 139731, "epoch": 1154} {"train_loss": -41.05633544921875, "global_step": 139732, "epoch": 1154} {"train_loss": -41.486083984375, "global_step": 139733, "epoch": 1154} {"train_loss": -40.67483139038086, "global_step": 139734, "epoch": 1154} {"train_loss": -40.989566802978516, "global_step": 139735, "epoch": 1154} {"train_loss": -41.089962005615234, "global_step": 139736, "epoch": 1154} {"train_loss": -41.29955291748047, "global_step": 139737, "epoch": 1154} {"train_loss": -41.0151252746582, "global_step": 139738, "epoch": 1154} {"train_loss": -41.4141731262207, "global_step": 139739, "epoch": 1154} {"train_loss": -40.85463333129883, "global_step": 139740, "epoch": 1154} {"train_loss": -41.21956253051758, "global_step": 139741, "epoch": 1154} {"train_loss": -40.68057632446289, "global_step": 139742, "epoch": 1154} {"train_loss": -40.57980728149414, "global_step": 139743, "epoch": 1154} {"train_loss": -41.341670989990234, "global_step": 139744, "epoch": 1154} {"train_loss": -41.030025482177734, "global_step": 139745, "epoch": 1154} {"train_loss": -41.107032775878906, "global_step": 139746, "epoch": 1154} {"train_loss": -40.39167404174805, "global_step": 139747, "epoch": 1154} {"train_loss": -41.16685104370117, "global_step": 139748, "epoch": 1154} {"train_loss": -41.3852653503418, "global_step": 139749, "epoch": 1154} {"train_loss": -41.22259521484375, "global_step": 139750, "epoch": 1154} {"train_loss": -41.252113342285156, "global_step": 139751, "epoch": 1154} {"train_loss": -41.232112884521484, "global_step": 139752, "epoch": 1154} {"train_loss": -40.945594787597656, "global_step": 139753, "epoch": 1154} {"train_loss": -40.11078319076664, "global_step": 139754, "epoch": 1154, "val_loss": 2678258.75} {"train_loss": -40.970279693603516, "global_step": 139755, "epoch": 1155} {"train_loss": -41.80237579345703, "global_step": 139756, "epoch": 1155} {"train_loss": -40.75507736206055, "global_step": 139757, "epoch": 1155} {"train_loss": -40.960174560546875, "global_step": 139758, "epoch": 1155} {"train_loss": -41.43281173706055, "global_step": 139759, "epoch": 1155} {"train_loss": -41.017677307128906, "global_step": 139760, "epoch": 1155} {"train_loss": -39.53181838989258, "global_step": 139761, "epoch": 1155} {"train_loss": -40.05113983154297, "global_step": 139762, "epoch": 1155} {"train_loss": -41.145790100097656, "global_step": 139763, "epoch": 1155} {"train_loss": -40.045162200927734, "global_step": 139764, "epoch": 1155} {"train_loss": -40.334598541259766, "global_step": 139765, "epoch": 1155} {"train_loss": -40.74568557739258, "global_step": 139766, "epoch": 1155} {"train_loss": -40.399169921875, "global_step": 139767, "epoch": 1155} {"train_loss": -40.80604934692383, "global_step": 139768, "epoch": 1155} {"train_loss": -41.04864501953125, "global_step": 139769, "epoch": 1155} {"train_loss": -41.01028060913086, "global_step": 139770, "epoch": 1155} {"train_loss": -41.50465393066406, "global_step": 139771, "epoch": 1155} {"train_loss": -40.61845779418945, "global_step": 139772, "epoch": 1155} {"train_loss": -39.924705505371094, "global_step": 139773, "epoch": 1155} {"train_loss": -40.67275619506836, "global_step": 139774, "epoch": 1155} {"train_loss": -40.65080261230469, "global_step": 139775, "epoch": 1155} {"train_loss": -41.2396354675293, "global_step": 139776, "epoch": 1155} {"train_loss": -40.06562805175781, "global_step": 139777, "epoch": 1155} {"train_loss": -39.2046012878418, "global_step": 139778, "epoch": 1155} {"train_loss": -40.42086410522461, "global_step": 139779, "epoch": 1155} {"train_loss": -40.60832214355469, "global_step": 139780, "epoch": 1155} {"train_loss": -39.030765533447266, "global_step": 139781, "epoch": 1155} {"train_loss": -38.62899398803711, "global_step": 139782, "epoch": 1155} {"train_loss": -39.5899772644043, "global_step": 139783, "epoch": 1155} {"train_loss": -40.5118522644043, "global_step": 139784, "epoch": 1155} {"train_loss": -40.444881439208984, "global_step": 139785, "epoch": 1155} {"train_loss": -38.27766036987305, "global_step": 139786, "epoch": 1155} {"train_loss": -37.06563949584961, "global_step": 139787, "epoch": 1155} {"train_loss": -36.31707763671875, "global_step": 139788, "epoch": 1155} {"train_loss": -36.054317474365234, "global_step": 139789, "epoch": 1155} {"train_loss": -36.28728103637695, "global_step": 139790, "epoch": 1155} {"train_loss": -36.90009689331055, "global_step": 139791, "epoch": 1155} {"train_loss": -34.90849304199219, "global_step": 139792, "epoch": 1155} {"train_loss": -36.14910888671875, "global_step": 139793, "epoch": 1155} {"train_loss": -37.39385986328125, "global_step": 139794, "epoch": 1155} {"train_loss": -38.2214469909668, "global_step": 139795, "epoch": 1155} {"train_loss": -37.44232177734375, "global_step": 139796, "epoch": 1155} {"train_loss": -35.88499069213867, "global_step": 139797, "epoch": 1155} {"train_loss": -39.103878021240234, "global_step": 139798, "epoch": 1155} {"train_loss": -37.30605697631836, "global_step": 139799, "epoch": 1155} {"train_loss": -38.42707061767578, "global_step": 139800, "epoch": 1155} {"train_loss": -38.09320068359375, "global_step": 139801, "epoch": 1155} {"train_loss": -38.602149963378906, "global_step": 139802, "epoch": 1155} {"train_loss": -39.44092559814453, "global_step": 139803, "epoch": 1155} {"train_loss": -37.73862838745117, "global_step": 139804, "epoch": 1155} {"train_loss": -38.01969528198242, "global_step": 139805, "epoch": 1155} {"train_loss": -39.56781005859375, "global_step": 139806, "epoch": 1155} {"train_loss": -37.61326217651367, "global_step": 139807, "epoch": 1155} {"train_loss": -39.866188049316406, "global_step": 139808, "epoch": 1155} {"train_loss": -39.12710189819336, "global_step": 139809, "epoch": 1155} {"train_loss": -39.21639633178711, "global_step": 139810, "epoch": 1155} {"train_loss": -40.38539505004883, "global_step": 139811, "epoch": 1155} {"train_loss": -38.51140213012695, "global_step": 139812, "epoch": 1155} {"train_loss": -39.958160400390625, "global_step": 139813, "epoch": 1155} {"train_loss": -39.076473236083984, "global_step": 139814, "epoch": 1155} {"train_loss": -39.09309005737305, "global_step": 139815, "epoch": 1155} {"train_loss": -40.32603073120117, "global_step": 139816, "epoch": 1155} {"train_loss": -39.77928161621094, "global_step": 139817, "epoch": 1155} {"train_loss": -39.562782287597656, "global_step": 139818, "epoch": 1155} {"train_loss": -40.08740234375, "global_step": 139819, "epoch": 1155} {"train_loss": -38.37607955932617, "global_step": 139820, "epoch": 1155} {"train_loss": -40.416988372802734, "global_step": 139821, "epoch": 1155} {"train_loss": -39.35926055908203, "global_step": 139822, "epoch": 1155} {"train_loss": -40.03889846801758, "global_step": 139823, "epoch": 1155} {"train_loss": -40.03009796142578, "global_step": 139824, "epoch": 1155} {"train_loss": -38.853973388671875, "global_step": 139825, "epoch": 1155} {"train_loss": -40.14617156982422, "global_step": 139826, "epoch": 1155} {"train_loss": -39.15383529663086, "global_step": 139827, "epoch": 1155} {"train_loss": -40.148162841796875, "global_step": 139828, "epoch": 1155} {"train_loss": -39.27554702758789, "global_step": 139829, "epoch": 1155} {"train_loss": -40.30826950073242, "global_step": 139830, "epoch": 1155} {"train_loss": -40.16133499145508, "global_step": 139831, "epoch": 1155} {"train_loss": -40.12187576293945, "global_step": 139832, "epoch": 1155} {"train_loss": -40.608428955078125, "global_step": 139833, "epoch": 1155} {"train_loss": -40.65615463256836, "global_step": 139834, "epoch": 1155} {"train_loss": -40.10740280151367, "global_step": 139835, "epoch": 1155} {"train_loss": -40.24055862426758, "global_step": 139836, "epoch": 1155} {"train_loss": -40.18651580810547, "global_step": 139837, "epoch": 1155} {"train_loss": -40.58204650878906, "global_step": 139838, "epoch": 1155} {"train_loss": -41.194156646728516, "global_step": 139839, "epoch": 1155} {"train_loss": -40.29753112792969, "global_step": 139840, "epoch": 1155} {"train_loss": -40.84424591064453, "global_step": 139841, "epoch": 1155} {"train_loss": -40.45635223388672, "global_step": 139842, "epoch": 1155} {"train_loss": -40.724266052246094, "global_step": 139843, "epoch": 1155} {"train_loss": -40.876487731933594, "global_step": 139844, "epoch": 1155} {"train_loss": -41.3173942565918, "global_step": 139845, "epoch": 1155} {"train_loss": -40.2586555480957, "global_step": 139846, "epoch": 1155} {"train_loss": -40.977935791015625, "global_step": 139847, "epoch": 1155} {"train_loss": -40.64486312866211, "global_step": 139848, "epoch": 1155} {"train_loss": -41.0609016418457, "global_step": 139849, "epoch": 1155} {"train_loss": -40.821224212646484, "global_step": 139850, "epoch": 1155} {"train_loss": -41.22152328491211, "global_step": 139851, "epoch": 1155} {"train_loss": -40.909523010253906, "global_step": 139852, "epoch": 1155} {"train_loss": -40.7787971496582, "global_step": 139853, "epoch": 1155} {"train_loss": -41.15590286254883, "global_step": 139854, "epoch": 1155} {"train_loss": -41.13372039794922, "global_step": 139855, "epoch": 1155} {"train_loss": -40.915687561035156, "global_step": 139856, "epoch": 1155} {"train_loss": -40.98448944091797, "global_step": 139857, "epoch": 1155} {"train_loss": -40.561641693115234, "global_step": 139858, "epoch": 1155} {"train_loss": -41.66001892089844, "global_step": 139859, "epoch": 1155} {"train_loss": -40.78646469116211, "global_step": 139860, "epoch": 1155} {"train_loss": -41.62458419799805, "global_step": 139861, "epoch": 1155} {"train_loss": -41.63362503051758, "global_step": 139862, "epoch": 1155} {"train_loss": -41.65679168701172, "global_step": 139863, "epoch": 1155} {"train_loss": -40.97611618041992, "global_step": 139864, "epoch": 1155} {"train_loss": -41.499935150146484, "global_step": 139865, "epoch": 1155} {"train_loss": -41.358028411865234, "global_step": 139866, "epoch": 1155} {"train_loss": -41.5168571472168, "global_step": 139867, "epoch": 1155} {"train_loss": -41.407447814941406, "global_step": 139868, "epoch": 1155} {"train_loss": -41.429718017578125, "global_step": 139869, "epoch": 1155} {"train_loss": -41.60416793823242, "global_step": 139870, "epoch": 1155} {"train_loss": -41.293209075927734, "global_step": 139871, "epoch": 1155} {"train_loss": -40.9598274230957, "global_step": 139872, "epoch": 1155} {"train_loss": -41.17580795288086, "global_step": 139873, "epoch": 1155} {"train_loss": -41.45937728881836, "global_step": 139874, "epoch": 1155} {"train_loss": -39.954963557976335, "global_step": 139875, "epoch": 1155, "val_loss": 2627188.5} {"train_loss": -41.259376525878906, "global_step": 139876, "epoch": 1156} {"train_loss": -41.0316276550293, "global_step": 139877, "epoch": 1156} {"train_loss": -41.27215576171875, "global_step": 139878, "epoch": 1156} {"train_loss": -41.39601516723633, "global_step": 139879, "epoch": 1156} {"train_loss": -41.61223602294922, "global_step": 139880, "epoch": 1156} {"train_loss": -41.191993713378906, "global_step": 139881, "epoch": 1156} {"train_loss": -41.27901840209961, "global_step": 139882, "epoch": 1156} {"train_loss": -40.161354064941406, "global_step": 139883, "epoch": 1156} {"train_loss": -40.22344207763672, "global_step": 139884, "epoch": 1156} {"train_loss": -39.52050018310547, "global_step": 139885, "epoch": 1156} {"train_loss": -41.60264205932617, "global_step": 139886, "epoch": 1156} {"train_loss": -40.90494918823242, "global_step": 139887, "epoch": 1156} {"train_loss": -39.11063003540039, "global_step": 139888, "epoch": 1156} {"train_loss": -40.257259368896484, "global_step": 139889, "epoch": 1156} {"train_loss": -41.70357894897461, "global_step": 139890, "epoch": 1156} {"train_loss": -40.8386344909668, "global_step": 139891, "epoch": 1156} {"train_loss": -41.12696075439453, "global_step": 139892, "epoch": 1156} {"train_loss": -41.2593994140625, "global_step": 139893, "epoch": 1156} {"train_loss": -41.93910217285156, "global_step": 139894, "epoch": 1156} {"train_loss": -41.253387451171875, "global_step": 139895, "epoch": 1156} {"train_loss": -40.625423431396484, "global_step": 139896, "epoch": 1156} {"train_loss": -41.18464660644531, "global_step": 139897, "epoch": 1156} {"train_loss": -40.016815185546875, "global_step": 139898, "epoch": 1156} {"train_loss": -40.56142044067383, "global_step": 139899, "epoch": 1156} {"train_loss": -41.20775604248047, "global_step": 139900, "epoch": 1156} {"train_loss": -38.73295211791992, "global_step": 139901, "epoch": 1156} {"train_loss": -38.52811050415039, "global_step": 139902, "epoch": 1156} {"train_loss": -39.54068374633789, "global_step": 139903, "epoch": 1156} {"train_loss": -39.27939987182617, "global_step": 139904, "epoch": 1156} {"train_loss": -37.41768264770508, "global_step": 139905, "epoch": 1156} {"train_loss": -37.30255889892578, "global_step": 139906, "epoch": 1156} {"train_loss": -33.284461975097656, "global_step": 139907, "epoch": 1156} {"train_loss": -36.24587631225586, "global_step": 139908, "epoch": 1156} {"train_loss": -40.01243209838867, "global_step": 139909, "epoch": 1156} {"train_loss": -40.566383361816406, "global_step": 139910, "epoch": 1156} {"train_loss": -38.62144088745117, "global_step": 139911, "epoch": 1156} {"train_loss": -39.31362533569336, "global_step": 139912, "epoch": 1156} {"train_loss": -39.67010498046875, "global_step": 139913, "epoch": 1156} {"train_loss": -39.728023529052734, "global_step": 139914, "epoch": 1156} {"train_loss": -38.47356033325195, "global_step": 139915, "epoch": 1156} {"train_loss": -39.44853591918945, "global_step": 139916, "epoch": 1156} {"train_loss": -40.03915786743164, "global_step": 139917, "epoch": 1156} {"train_loss": -38.430599212646484, "global_step": 139918, "epoch": 1156} {"train_loss": -39.05574035644531, "global_step": 139919, "epoch": 1156} {"train_loss": -40.56038284301758, "global_step": 139920, "epoch": 1156} {"train_loss": -39.86248016357422, "global_step": 139921, "epoch": 1156} {"train_loss": -38.08491897583008, "global_step": 139922, "epoch": 1156} {"train_loss": -39.459991455078125, "global_step": 139923, "epoch": 1156} {"train_loss": -40.090354919433594, "global_step": 139924, "epoch": 1156} {"train_loss": -39.115577697753906, "global_step": 139925, "epoch": 1156} {"train_loss": -38.82508850097656, "global_step": 139926, "epoch": 1156} {"train_loss": -39.4228630065918, "global_step": 139927, "epoch": 1156} {"train_loss": -40.36780548095703, "global_step": 139928, "epoch": 1156} {"train_loss": -39.306854248046875, "global_step": 139929, "epoch": 1156} {"train_loss": -38.78876876831055, "global_step": 139930, "epoch": 1156} {"train_loss": -40.389373779296875, "global_step": 139931, "epoch": 1156} {"train_loss": -40.546871185302734, "global_step": 139932, "epoch": 1156} {"train_loss": -40.067317962646484, "global_step": 139933, "epoch": 1156} {"train_loss": -40.36629867553711, "global_step": 139934, "epoch": 1156} {"train_loss": -40.832855224609375, "global_step": 139935, "epoch": 1156} {"train_loss": -39.66633987426758, "global_step": 139936, "epoch": 1156} {"train_loss": -39.72169876098633, "global_step": 139937, "epoch": 1156} {"train_loss": -40.62800979614258, "global_step": 139938, "epoch": 1156} {"train_loss": -40.59054183959961, "global_step": 139939, "epoch": 1156} {"train_loss": -39.60227584838867, "global_step": 139940, "epoch": 1156} {"train_loss": -40.67837142944336, "global_step": 139941, "epoch": 1156} {"train_loss": -40.78414535522461, "global_step": 139942, "epoch": 1156} {"train_loss": -39.67041778564453, "global_step": 139943, "epoch": 1156} {"train_loss": -40.8768424987793, "global_step": 139944, "epoch": 1156} {"train_loss": -39.868587493896484, "global_step": 139945, "epoch": 1156} {"train_loss": -38.736358642578125, "global_step": 139946, "epoch": 1156} {"train_loss": -40.060123443603516, "global_step": 139947, "epoch": 1156} {"train_loss": -40.4558219909668, "global_step": 139948, "epoch": 1156} {"train_loss": -39.69037628173828, "global_step": 139949, "epoch": 1156} {"train_loss": -39.60536575317383, "global_step": 139950, "epoch": 1156} {"train_loss": -40.81382369995117, "global_step": 139951, "epoch": 1156} {"train_loss": -40.31228256225586, "global_step": 139952, "epoch": 1156} {"train_loss": -40.28285598754883, "global_step": 139953, "epoch": 1156} {"train_loss": -40.491249084472656, "global_step": 139954, "epoch": 1156} {"train_loss": -40.53247833251953, "global_step": 139955, "epoch": 1156} {"train_loss": -40.5944938659668, "global_step": 139956, "epoch": 1156} {"train_loss": -40.37467575073242, "global_step": 139957, "epoch": 1156} {"train_loss": -40.870296478271484, "global_step": 139958, "epoch": 1156} {"train_loss": -40.04606246948242, "global_step": 139959, "epoch": 1156} {"train_loss": -40.526763916015625, "global_step": 139960, "epoch": 1156} {"train_loss": -40.49094772338867, "global_step": 139961, "epoch": 1156} {"train_loss": -40.54643249511719, "global_step": 139962, "epoch": 1156} {"train_loss": -40.93080520629883, "global_step": 139963, "epoch": 1156} {"train_loss": -40.90747833251953, "global_step": 139964, "epoch": 1156} {"train_loss": -40.11799240112305, "global_step": 139965, "epoch": 1156} {"train_loss": -40.92008590698242, "global_step": 139966, "epoch": 1156} {"train_loss": -40.936641693115234, "global_step": 139967, "epoch": 1156} {"train_loss": -40.70754623413086, "global_step": 139968, "epoch": 1156} {"train_loss": -40.12529754638672, "global_step": 139969, "epoch": 1156} {"train_loss": -41.42177963256836, "global_step": 139970, "epoch": 1156} {"train_loss": -41.2273063659668, "global_step": 139971, "epoch": 1156} {"train_loss": -40.61420440673828, "global_step": 139972, "epoch": 1156} {"train_loss": -40.65196228027344, "global_step": 139973, "epoch": 1156} {"train_loss": -41.24150085449219, "global_step": 139974, "epoch": 1156} {"train_loss": -41.711483001708984, "global_step": 139975, "epoch": 1156} {"train_loss": -40.969730377197266, "global_step": 139976, "epoch": 1156} {"train_loss": -41.32941436767578, "global_step": 139977, "epoch": 1156} {"train_loss": -41.54966354370117, "global_step": 139978, "epoch": 1156} {"train_loss": -40.620704650878906, "global_step": 139979, "epoch": 1156} {"train_loss": -40.28365707397461, "global_step": 139980, "epoch": 1156} {"train_loss": -41.3972282409668, "global_step": 139981, "epoch": 1156} {"train_loss": -41.23269271850586, "global_step": 139982, "epoch": 1156} {"train_loss": -40.58319854736328, "global_step": 139983, "epoch": 1156} {"train_loss": -40.35126495361328, "global_step": 139984, "epoch": 1156} {"train_loss": -41.34476852416992, "global_step": 139985, "epoch": 1156} {"train_loss": -40.33905792236328, "global_step": 139986, "epoch": 1156} {"train_loss": -40.14726638793945, "global_step": 139987, "epoch": 1156} {"train_loss": -41.3751220703125, "global_step": 139988, "epoch": 1156} {"train_loss": -41.29313278198242, "global_step": 139989, "epoch": 1156} {"train_loss": -40.7578010559082, "global_step": 139990, "epoch": 1156} {"train_loss": -39.14263153076172, "global_step": 139991, "epoch": 1156} {"train_loss": -40.86613845825195, "global_step": 139992, "epoch": 1156} {"train_loss": -40.48649978637695, "global_step": 139993, "epoch": 1156} {"train_loss": -39.81748962402344, "global_step": 139994, "epoch": 1156} {"train_loss": -40.14542770385742, "global_step": 139995, "epoch": 1156} {"train_loss": -40.19482907381925, "global_step": 139996, "epoch": 1156, "val_loss": 2657158.75} {"train_loss": -40.065155029296875, "global_step": 139997, "epoch": 1157} {"train_loss": -38.99042892456055, "global_step": 139998, "epoch": 1157} {"train_loss": -40.342403411865234, "global_step": 139999, "epoch": 1157} {"train_loss": -40.820777893066406, "global_step": 140000, "epoch": 1157} {"train_loss": -40.0105094909668, "global_step": 140001, "epoch": 1157} {"train_loss": -39.28948211669922, "global_step": 140002, "epoch": 1157} {"train_loss": -40.19998550415039, "global_step": 140003, "epoch": 1157} {"train_loss": -37.97922134399414, "global_step": 140004, "epoch": 1157} {"train_loss": -40.69607162475586, "global_step": 140005, "epoch": 1157} {"train_loss": -37.72047424316406, "global_step": 140006, "epoch": 1157} {"train_loss": -36.086421966552734, "global_step": 140007, "epoch": 1157} {"train_loss": -35.5975341796875, "global_step": 140008, "epoch": 1157} {"train_loss": -27.10894203186035, "global_step": 140009, "epoch": 1157} {"train_loss": -36.506690979003906, "global_step": 140010, "epoch": 1157} {"train_loss": -28.957834243774414, "global_step": 140011, "epoch": 1157} {"train_loss": -32.05497360229492, "global_step": 140012, "epoch": 1157} {"train_loss": -32.503353118896484, "global_step": 140013, "epoch": 1157} {"train_loss": -31.699329376220703, "global_step": 140014, "epoch": 1157} {"train_loss": -35.01087951660156, "global_step": 140015, "epoch": 1157} {"train_loss": -34.876060485839844, "global_step": 140016, "epoch": 1157} {"train_loss": -35.1934700012207, "global_step": 140017, "epoch": 1157} {"train_loss": -37.55147933959961, "global_step": 140018, "epoch": 1157} {"train_loss": -38.17616271972656, "global_step": 140019, "epoch": 1157} {"train_loss": -35.6192741394043, "global_step": 140020, "epoch": 1157} {"train_loss": -36.76670455932617, "global_step": 140021, "epoch": 1157} {"train_loss": -36.62124252319336, "global_step": 140022, "epoch": 1157} {"train_loss": -38.79352569580078, "global_step": 140023, "epoch": 1157} {"train_loss": -37.007171630859375, "global_step": 140024, "epoch": 1157} {"train_loss": -38.703590393066406, "global_step": 140025, "epoch": 1157} {"train_loss": -38.06254577636719, "global_step": 140026, "epoch": 1157} {"train_loss": -38.4737548828125, "global_step": 140027, "epoch": 1157} {"train_loss": -39.18947219848633, "global_step": 140028, "epoch": 1157} {"train_loss": -37.78654098510742, "global_step": 140029, "epoch": 1157} {"train_loss": -38.667484283447266, "global_step": 140030, "epoch": 1157} {"train_loss": -39.90774917602539, "global_step": 140031, "epoch": 1157} {"train_loss": -39.235328674316406, "global_step": 140032, "epoch": 1157} {"train_loss": -40.06140899658203, "global_step": 140033, "epoch": 1157} {"train_loss": -38.56938934326172, "global_step": 140034, "epoch": 1157} {"train_loss": -39.478309631347656, "global_step": 140035, "epoch": 1157} {"train_loss": -39.6495361328125, "global_step": 140036, "epoch": 1157} {"train_loss": -40.0719108581543, "global_step": 140037, "epoch": 1157} {"train_loss": -40.460662841796875, "global_step": 140038, "epoch": 1157} {"train_loss": -39.70527267456055, "global_step": 140039, "epoch": 1157} {"train_loss": -39.82479476928711, "global_step": 140040, "epoch": 1157} {"train_loss": -40.05925369262695, "global_step": 140041, "epoch": 1157} {"train_loss": -40.20619583129883, "global_step": 140042, "epoch": 1157} {"train_loss": -40.001487731933594, "global_step": 140043, "epoch": 1157} {"train_loss": -40.26862716674805, "global_step": 140044, "epoch": 1157} {"train_loss": -40.0888671875, "global_step": 140045, "epoch": 1157} {"train_loss": -39.54707336425781, "global_step": 140046, "epoch": 1157} {"train_loss": -39.95886993408203, "global_step": 140047, "epoch": 1157} {"train_loss": -40.822017669677734, "global_step": 140048, "epoch": 1157} {"train_loss": -39.37839889526367, "global_step": 140049, "epoch": 1157} {"train_loss": -40.44160842895508, "global_step": 140050, "epoch": 1157} {"train_loss": -40.273414611816406, "global_step": 140051, "epoch": 1157} {"train_loss": -40.21419143676758, "global_step": 140052, "epoch": 1157} {"train_loss": -40.59856033325195, "global_step": 140053, "epoch": 1157} {"train_loss": -39.467811584472656, "global_step": 140054, "epoch": 1157} {"train_loss": -40.33756637573242, "global_step": 140055, "epoch": 1157} {"train_loss": -40.621826171875, "global_step": 140056, "epoch": 1157} {"train_loss": -40.69993209838867, "global_step": 140057, "epoch": 1157} {"train_loss": -40.4747428894043, "global_step": 140058, "epoch": 1157} {"train_loss": -40.118751525878906, "global_step": 140059, "epoch": 1157} {"train_loss": -40.782859802246094, "global_step": 140060, "epoch": 1157} {"train_loss": -40.5903434753418, "global_step": 140061, "epoch": 1157} {"train_loss": -41.021305084228516, "global_step": 140062, "epoch": 1157} {"train_loss": -40.937191009521484, "global_step": 140063, "epoch": 1157} {"train_loss": -40.41792678833008, "global_step": 140064, "epoch": 1157} {"train_loss": -40.837059020996094, "global_step": 140065, "epoch": 1157} {"train_loss": -40.58514404296875, "global_step": 140066, "epoch": 1157} {"train_loss": -40.58759689331055, "global_step": 140067, "epoch": 1157} {"train_loss": -40.8149528503418, "global_step": 140068, "epoch": 1157} {"train_loss": -41.03984451293945, "global_step": 140069, "epoch": 1157} {"train_loss": -40.78807067871094, "global_step": 140070, "epoch": 1157} {"train_loss": -41.312599182128906, "global_step": 140071, "epoch": 1157} {"train_loss": -40.95880889892578, "global_step": 140072, "epoch": 1157} {"train_loss": -40.67547607421875, "global_step": 140073, "epoch": 1157} {"train_loss": -40.72101974487305, "global_step": 140074, "epoch": 1157} {"train_loss": -41.17008590698242, "global_step": 140075, "epoch": 1157} {"train_loss": -40.74930953979492, "global_step": 140076, "epoch": 1157} {"train_loss": -40.17533493041992, "global_step": 140077, "epoch": 1157} {"train_loss": -41.43644332885742, "global_step": 140078, "epoch": 1157} {"train_loss": -40.61457061767578, "global_step": 140079, "epoch": 1157} {"train_loss": -39.800331115722656, "global_step": 140080, "epoch": 1157} {"train_loss": -40.946048736572266, "global_step": 140081, "epoch": 1157} {"train_loss": -41.122989654541016, "global_step": 140082, "epoch": 1157} {"train_loss": -40.222442626953125, "global_step": 140083, "epoch": 1157} {"train_loss": -39.98356628417969, "global_step": 140084, "epoch": 1157} {"train_loss": -39.86469268798828, "global_step": 140085, "epoch": 1157} {"train_loss": -40.054229736328125, "global_step": 140086, "epoch": 1157} {"train_loss": -39.175514221191406, "global_step": 140087, "epoch": 1157} {"train_loss": -40.66384506225586, "global_step": 140088, "epoch": 1157} {"train_loss": -39.45164108276367, "global_step": 140089, "epoch": 1157} {"train_loss": -40.08705520629883, "global_step": 140090, "epoch": 1157} {"train_loss": -38.541751861572266, "global_step": 140091, "epoch": 1157} {"train_loss": -38.00178909301758, "global_step": 140092, "epoch": 1157} {"train_loss": -39.42338180541992, "global_step": 140093, "epoch": 1157} {"train_loss": -40.74917221069336, "global_step": 140094, "epoch": 1157} {"train_loss": -39.713809967041016, "global_step": 140095, "epoch": 1157} {"train_loss": -38.215484619140625, "global_step": 140096, "epoch": 1157} {"train_loss": -39.018882751464844, "global_step": 140097, "epoch": 1157} {"train_loss": -38.57318878173828, "global_step": 140098, "epoch": 1157} {"train_loss": -37.20125961303711, "global_step": 140099, "epoch": 1157} {"train_loss": -39.45945739746094, "global_step": 140100, "epoch": 1157} {"train_loss": -39.39592361450195, "global_step": 140101, "epoch": 1157} {"train_loss": -37.8619499206543, "global_step": 140102, "epoch": 1157} {"train_loss": -36.65958786010742, "global_step": 140103, "epoch": 1157} {"train_loss": -39.9040641784668, "global_step": 140104, "epoch": 1157} {"train_loss": -38.047569274902344, "global_step": 140105, "epoch": 1157} {"train_loss": -36.92414093017578, "global_step": 140106, "epoch": 1157} {"train_loss": -40.28668212890625, "global_step": 140107, "epoch": 1157} {"train_loss": -37.849063873291016, "global_step": 140108, "epoch": 1157} {"train_loss": -37.502227783203125, "global_step": 140109, "epoch": 1157} {"train_loss": -39.93556213378906, "global_step": 140110, "epoch": 1157} {"train_loss": -39.300697326660156, "global_step": 140111, "epoch": 1157} {"train_loss": -38.978668212890625, "global_step": 140112, "epoch": 1157} {"train_loss": -39.216949462890625, "global_step": 140113, "epoch": 1157} {"train_loss": -39.53993606567383, "global_step": 140114, "epoch": 1157} {"train_loss": -39.4334602355957, "global_step": 140115, "epoch": 1157} {"train_loss": -38.83723831176758, "global_step": 140116, "epoch": 1157} {"train_loss": -39.00173193561144, "global_step": 140117, "epoch": 1157, "val_loss": 2573680.75} {"train_loss": -39.062252044677734, "global_step": 140118, "epoch": 1158} {"train_loss": -39.23371505737305, "global_step": 140119, "epoch": 1158} {"train_loss": -40.01642990112305, "global_step": 140120, "epoch": 1158} {"train_loss": -38.0606803894043, "global_step": 140121, "epoch": 1158} {"train_loss": -40.663734436035156, "global_step": 140122, "epoch": 1158} {"train_loss": -37.51961135864258, "global_step": 140123, "epoch": 1158} {"train_loss": -38.55449676513672, "global_step": 140124, "epoch": 1158} {"train_loss": -37.69426727294922, "global_step": 140125, "epoch": 1158} {"train_loss": -39.2495231628418, "global_step": 140126, "epoch": 1158} {"train_loss": -38.39524459838867, "global_step": 140127, "epoch": 1158} {"train_loss": -39.21284103393555, "global_step": 140128, "epoch": 1158} {"train_loss": -38.7010383605957, "global_step": 140129, "epoch": 1158} {"train_loss": -38.810218811035156, "global_step": 140130, "epoch": 1158} {"train_loss": -39.013526916503906, "global_step": 140131, "epoch": 1158} {"train_loss": -38.94092559814453, "global_step": 140132, "epoch": 1158} {"train_loss": -39.827308654785156, "global_step": 140133, "epoch": 1158} {"train_loss": -39.116798400878906, "global_step": 140134, "epoch": 1158} {"train_loss": -39.11151123046875, "global_step": 140135, "epoch": 1158} {"train_loss": -39.68772888183594, "global_step": 140136, "epoch": 1158} {"train_loss": -37.98069763183594, "global_step": 140137, "epoch": 1158} {"train_loss": -38.93156051635742, "global_step": 140138, "epoch": 1158} {"train_loss": -38.73292541503906, "global_step": 140139, "epoch": 1158} {"train_loss": -38.741737365722656, "global_step": 140140, "epoch": 1158} {"train_loss": -39.52573776245117, "global_step": 140141, "epoch": 1158} {"train_loss": -39.19626235961914, "global_step": 140142, "epoch": 1158} {"train_loss": -39.81907272338867, "global_step": 140143, "epoch": 1158} {"train_loss": -39.30537796020508, "global_step": 140144, "epoch": 1158} {"train_loss": -39.901580810546875, "global_step": 140145, "epoch": 1158} {"train_loss": -38.33449172973633, "global_step": 140146, "epoch": 1158} {"train_loss": -38.358036041259766, "global_step": 140147, "epoch": 1158} {"train_loss": -38.337886810302734, "global_step": 140148, "epoch": 1158} {"train_loss": -39.14084243774414, "global_step": 140149, "epoch": 1158} {"train_loss": -38.455299377441406, "global_step": 140150, "epoch": 1158} {"train_loss": -39.20856475830078, "global_step": 140151, "epoch": 1158} {"train_loss": -38.914466857910156, "global_step": 140152, "epoch": 1158} {"train_loss": -38.191261291503906, "global_step": 140153, "epoch": 1158} {"train_loss": -39.07280349731445, "global_step": 140154, "epoch": 1158} {"train_loss": -39.18586349487305, "global_step": 140155, "epoch": 1158} {"train_loss": -39.13845443725586, "global_step": 140156, "epoch": 1158} {"train_loss": -38.14641571044922, "global_step": 140157, "epoch": 1158} {"train_loss": -40.00631332397461, "global_step": 140158, "epoch": 1158} {"train_loss": -39.37378692626953, "global_step": 140159, "epoch": 1158} {"train_loss": -39.11738204956055, "global_step": 140160, "epoch": 1158} {"train_loss": -39.327938079833984, "global_step": 140161, "epoch": 1158} {"train_loss": -39.75191879272461, "global_step": 140162, "epoch": 1158} {"train_loss": -39.65995407104492, "global_step": 140163, "epoch": 1158} {"train_loss": -40.358863830566406, "global_step": 140164, "epoch": 1158} {"train_loss": -39.79606246948242, "global_step": 140165, "epoch": 1158} {"train_loss": -39.89140701293945, "global_step": 140166, "epoch": 1158} {"train_loss": -40.43741989135742, "global_step": 140167, "epoch": 1158} {"train_loss": -39.86343002319336, "global_step": 140168, "epoch": 1158} {"train_loss": -40.21431350708008, "global_step": 140169, "epoch": 1158} {"train_loss": -40.55708694458008, "global_step": 140170, "epoch": 1158} {"train_loss": -40.60948181152344, "global_step": 140171, "epoch": 1158} {"train_loss": -40.38806915283203, "global_step": 140172, "epoch": 1158} {"train_loss": -40.614471435546875, "global_step": 140173, "epoch": 1158} {"train_loss": -40.648193359375, "global_step": 140174, "epoch": 1158} {"train_loss": -40.99125289916992, "global_step": 140175, "epoch": 1158} {"train_loss": -40.6964225769043, "global_step": 140176, "epoch": 1158} {"train_loss": -41.130367279052734, "global_step": 140177, "epoch": 1158} {"train_loss": -40.72484588623047, "global_step": 140178, "epoch": 1158} {"train_loss": -41.07049560546875, "global_step": 140179, "epoch": 1158} {"train_loss": -40.84764862060547, "global_step": 140180, "epoch": 1158} {"train_loss": -40.863739013671875, "global_step": 140181, "epoch": 1158} {"train_loss": -40.61516189575195, "global_step": 140182, "epoch": 1158} {"train_loss": -40.8366584777832, "global_step": 140183, "epoch": 1158} {"train_loss": -40.94548416137695, "global_step": 140184, "epoch": 1158} {"train_loss": -40.836727142333984, "global_step": 140185, "epoch": 1158} {"train_loss": -41.2411003112793, "global_step": 140186, "epoch": 1158} {"train_loss": -40.65595626831055, "global_step": 140187, "epoch": 1158} {"train_loss": -41.26304244995117, "global_step": 140188, "epoch": 1158} {"train_loss": -41.22159957885742, "global_step": 140189, "epoch": 1158} {"train_loss": -41.42013168334961, "global_step": 140190, "epoch": 1158} {"train_loss": -41.4827995300293, "global_step": 140191, "epoch": 1158} {"train_loss": -41.20315170288086, "global_step": 140192, "epoch": 1158} {"train_loss": -40.8009147644043, "global_step": 140193, "epoch": 1158} {"train_loss": -40.793426513671875, "global_step": 140194, "epoch": 1158} {"train_loss": -41.30488204956055, "global_step": 140195, "epoch": 1158} {"train_loss": -41.60543441772461, "global_step": 140196, "epoch": 1158} {"train_loss": -41.08893585205078, "global_step": 140197, "epoch": 1158} {"train_loss": -39.64556884765625, "global_step": 140198, "epoch": 1158} {"train_loss": -40.24790573120117, "global_step": 140199, "epoch": 1158} {"train_loss": -41.02976608276367, "global_step": 140200, "epoch": 1158} {"train_loss": -41.12039566040039, "global_step": 140201, "epoch": 1158} {"train_loss": -41.36248016357422, "global_step": 140202, "epoch": 1158} {"train_loss": -41.013038635253906, "global_step": 140203, "epoch": 1158} {"train_loss": -40.78666305541992, "global_step": 140204, "epoch": 1158} {"train_loss": -41.28538131713867, "global_step": 140205, "epoch": 1158} {"train_loss": -40.90058517456055, "global_step": 140206, "epoch": 1158} {"train_loss": -41.21957015991211, "global_step": 140207, "epoch": 1158} {"train_loss": -41.41366195678711, "global_step": 140208, "epoch": 1158} {"train_loss": -41.44651794433594, "global_step": 140209, "epoch": 1158} {"train_loss": -41.01374053955078, "global_step": 140210, "epoch": 1158} {"train_loss": -41.020355224609375, "global_step": 140211, "epoch": 1158} {"train_loss": -40.42214584350586, "global_step": 140212, "epoch": 1158} {"train_loss": -40.4912109375, "global_step": 140213, "epoch": 1158} {"train_loss": -41.06977081298828, "global_step": 140214, "epoch": 1158} {"train_loss": -41.0537223815918, "global_step": 140215, "epoch": 1158} {"train_loss": -40.1536865234375, "global_step": 140216, "epoch": 1158} {"train_loss": -37.84895324707031, "global_step": 140217, "epoch": 1158} {"train_loss": -37.751953125, "global_step": 140218, "epoch": 1158} {"train_loss": -39.73524856567383, "global_step": 140219, "epoch": 1158} {"train_loss": -37.64527130126953, "global_step": 140220, "epoch": 1158} {"train_loss": -33.59054183959961, "global_step": 140221, "epoch": 1158} {"train_loss": -35.588497161865234, "global_step": 140222, "epoch": 1158} {"train_loss": -36.32218551635742, "global_step": 140223, "epoch": 1158} {"train_loss": -34.73017501831055, "global_step": 140224, "epoch": 1158} {"train_loss": -34.57078170776367, "global_step": 140225, "epoch": 1158} {"train_loss": -35.063629150390625, "global_step": 140226, "epoch": 1158} {"train_loss": -36.546539306640625, "global_step": 140227, "epoch": 1158} {"train_loss": -35.66706848144531, "global_step": 140228, "epoch": 1158} {"train_loss": -35.285579681396484, "global_step": 140229, "epoch": 1158} {"train_loss": -38.71645736694336, "global_step": 140230, "epoch": 1158} {"train_loss": -35.79402542114258, "global_step": 140231, "epoch": 1158} {"train_loss": -37.856056213378906, "global_step": 140232, "epoch": 1158} {"train_loss": -37.756038665771484, "global_step": 140233, "epoch": 1158} {"train_loss": -38.06209945678711, "global_step": 140234, "epoch": 1158} {"train_loss": -39.21067428588867, "global_step": 140235, "epoch": 1158} {"train_loss": -39.46104049682617, "global_step": 140236, "epoch": 1158} {"train_loss": -39.87711715698242, "global_step": 140237, "epoch": 1158} {"train_loss": -39.46114970435781, "global_step": 140238, "epoch": 1158, "val_loss": 2651493.25} {"train_loss": -38.90184020996094, "global_step": 140239, "epoch": 1159} {"train_loss": -39.3567008972168, "global_step": 140240, "epoch": 1159} {"train_loss": -39.2071533203125, "global_step": 140241, "epoch": 1159} {"train_loss": -38.13155746459961, "global_step": 140242, "epoch": 1159} {"train_loss": -39.3382568359375, "global_step": 140243, "epoch": 1159} {"train_loss": -38.79521560668945, "global_step": 140244, "epoch": 1159} {"train_loss": -37.545291900634766, "global_step": 140245, "epoch": 1159} {"train_loss": -39.321712493896484, "global_step": 140246, "epoch": 1159} {"train_loss": -39.09849166870117, "global_step": 140247, "epoch": 1159} {"train_loss": -37.902645111083984, "global_step": 140248, "epoch": 1159} {"train_loss": -37.59836959838867, "global_step": 140249, "epoch": 1159} {"train_loss": -40.26325988769531, "global_step": 140250, "epoch": 1159} {"train_loss": -38.10358810424805, "global_step": 140251, "epoch": 1159} {"train_loss": -37.68412399291992, "global_step": 140252, "epoch": 1159} {"train_loss": -39.98301315307617, "global_step": 140253, "epoch": 1159} {"train_loss": -38.82168197631836, "global_step": 140254, "epoch": 1159} {"train_loss": -39.51627731323242, "global_step": 140255, "epoch": 1159} {"train_loss": -40.05475997924805, "global_step": 140256, "epoch": 1159} {"train_loss": -39.51170349121094, "global_step": 140257, "epoch": 1159} {"train_loss": -39.893226623535156, "global_step": 140258, "epoch": 1159} {"train_loss": -39.876338958740234, "global_step": 140259, "epoch": 1159} {"train_loss": -39.031429290771484, "global_step": 140260, "epoch": 1159} {"train_loss": -40.17837905883789, "global_step": 140261, "epoch": 1159} {"train_loss": -39.894588470458984, "global_step": 140262, "epoch": 1159} {"train_loss": -38.72955322265625, "global_step": 140263, "epoch": 1159} {"train_loss": -39.8554801940918, "global_step": 140264, "epoch": 1159} {"train_loss": -39.94132614135742, "global_step": 140265, "epoch": 1159} {"train_loss": -40.29301452636719, "global_step": 140266, "epoch": 1159} {"train_loss": -40.38956832885742, "global_step": 140267, "epoch": 1159} {"train_loss": -40.27184295654297, "global_step": 140268, "epoch": 1159} {"train_loss": -40.500545501708984, "global_step": 140269, "epoch": 1159} {"train_loss": -40.22882080078125, "global_step": 140270, "epoch": 1159} {"train_loss": -40.14491653442383, "global_step": 140271, "epoch": 1159} {"train_loss": -40.1094970703125, "global_step": 140272, "epoch": 1159} {"train_loss": -40.07011795043945, "global_step": 140273, "epoch": 1159} {"train_loss": -40.32932662963867, "global_step": 140274, "epoch": 1159} {"train_loss": -40.35770797729492, "global_step": 140275, "epoch": 1159} {"train_loss": -40.558753967285156, "global_step": 140276, "epoch": 1159} {"train_loss": -40.75089645385742, "global_step": 140277, "epoch": 1159} {"train_loss": -41.201087951660156, "global_step": 140278, "epoch": 1159} {"train_loss": -40.786048889160156, "global_step": 140279, "epoch": 1159} {"train_loss": -41.23148727416992, "global_step": 140280, "epoch": 1159} {"train_loss": -40.905513763427734, "global_step": 140281, "epoch": 1159} {"train_loss": -41.41067123413086, "global_step": 140282, "epoch": 1159} {"train_loss": -40.561012268066406, "global_step": 140283, "epoch": 1159} {"train_loss": -41.41962814331055, "global_step": 140284, "epoch": 1159} {"train_loss": -40.95701217651367, "global_step": 140285, "epoch": 1159} {"train_loss": -41.12042999267578, "global_step": 140286, "epoch": 1159} {"train_loss": -41.17433547973633, "global_step": 140287, "epoch": 1159} {"train_loss": -40.72951126098633, "global_step": 140288, "epoch": 1159} {"train_loss": -41.17517852783203, "global_step": 140289, "epoch": 1159} {"train_loss": -41.60099411010742, "global_step": 140290, "epoch": 1159} {"train_loss": -41.47493362426758, "global_step": 140291, "epoch": 1159} {"train_loss": -41.30900955200195, "global_step": 140292, "epoch": 1159} {"train_loss": -41.58918380737305, "global_step": 140293, "epoch": 1159} {"train_loss": -40.52507019042969, "global_step": 140294, "epoch": 1159} {"train_loss": -41.30654525756836, "global_step": 140295, "epoch": 1159} {"train_loss": -41.48431396484375, "global_step": 140296, "epoch": 1159} {"train_loss": -39.92267608642578, "global_step": 140297, "epoch": 1159} {"train_loss": -40.23975372314453, "global_step": 140298, "epoch": 1159} {"train_loss": -41.146446228027344, "global_step": 140299, "epoch": 1159} {"train_loss": -40.111167907714844, "global_step": 140300, "epoch": 1159} {"train_loss": -39.57145690917969, "global_step": 140301, "epoch": 1159} {"train_loss": -41.1412467956543, "global_step": 140302, "epoch": 1159} {"train_loss": -40.91569900512695, "global_step": 140303, "epoch": 1159} {"train_loss": -39.8581428527832, "global_step": 140304, "epoch": 1159} {"train_loss": -40.32229232788086, "global_step": 140305, "epoch": 1159} {"train_loss": -40.56657791137695, "global_step": 140306, "epoch": 1159} {"train_loss": -40.56135177612305, "global_step": 140307, "epoch": 1159} {"train_loss": -40.25959396362305, "global_step": 140308, "epoch": 1159} {"train_loss": -40.50590133666992, "global_step": 140309, "epoch": 1159} {"train_loss": -40.615028381347656, "global_step": 140310, "epoch": 1159} {"train_loss": -41.10874938964844, "global_step": 140311, "epoch": 1159} {"train_loss": -41.06793212890625, "global_step": 140312, "epoch": 1159} {"train_loss": -41.15561294555664, "global_step": 140313, "epoch": 1159} {"train_loss": -40.683624267578125, "global_step": 140314, "epoch": 1159} {"train_loss": -40.3516960144043, "global_step": 140315, "epoch": 1159} {"train_loss": -39.993568420410156, "global_step": 140316, "epoch": 1159} {"train_loss": -39.97662353515625, "global_step": 140317, "epoch": 1159} {"train_loss": -39.98873519897461, "global_step": 140318, "epoch": 1159} {"train_loss": -41.184120178222656, "global_step": 140319, "epoch": 1159} {"train_loss": -40.310455322265625, "global_step": 140320, "epoch": 1159} {"train_loss": -39.47805404663086, "global_step": 140321, "epoch": 1159} {"train_loss": -39.6346435546875, "global_step": 140322, "epoch": 1159} {"train_loss": -40.69542694091797, "global_step": 140323, "epoch": 1159} {"train_loss": -41.22622299194336, "global_step": 140324, "epoch": 1159} {"train_loss": -40.126930236816406, "global_step": 140325, "epoch": 1159} {"train_loss": -40.3291130065918, "global_step": 140326, "epoch": 1159} {"train_loss": -40.67319107055664, "global_step": 140327, "epoch": 1159} {"train_loss": -38.5703239440918, "global_step": 140328, "epoch": 1159} {"train_loss": -40.77592086791992, "global_step": 140329, "epoch": 1159} {"train_loss": -40.9304313659668, "global_step": 140330, "epoch": 1159} {"train_loss": -40.341732025146484, "global_step": 140331, "epoch": 1159} {"train_loss": -40.4449348449707, "global_step": 140332, "epoch": 1159} {"train_loss": -40.99226760864258, "global_step": 140333, "epoch": 1159} {"train_loss": -40.76133346557617, "global_step": 140334, "epoch": 1159} {"train_loss": -40.998992919921875, "global_step": 140335, "epoch": 1159} {"train_loss": -41.39115524291992, "global_step": 140336, "epoch": 1159} {"train_loss": -40.78276062011719, "global_step": 140337, "epoch": 1159} {"train_loss": -40.99298095703125, "global_step": 140338, "epoch": 1159} {"train_loss": -40.5031852722168, "global_step": 140339, "epoch": 1159} {"train_loss": -39.20701599121094, "global_step": 140340, "epoch": 1159} {"train_loss": -39.87386703491211, "global_step": 140341, "epoch": 1159} {"train_loss": -40.48786544799805, "global_step": 140342, "epoch": 1159} {"train_loss": -40.72146224975586, "global_step": 140343, "epoch": 1159} {"train_loss": -40.94462585449219, "global_step": 140344, "epoch": 1159} {"train_loss": -40.426753997802734, "global_step": 140345, "epoch": 1159} {"train_loss": -38.903167724609375, "global_step": 140346, "epoch": 1159} {"train_loss": -39.46554183959961, "global_step": 140347, "epoch": 1159} {"train_loss": -38.543331146240234, "global_step": 140348, "epoch": 1159} {"train_loss": -39.2892951965332, "global_step": 140349, "epoch": 1159} {"train_loss": -41.23054122924805, "global_step": 140350, "epoch": 1159} {"train_loss": -41.04241180419922, "global_step": 140351, "epoch": 1159} {"train_loss": -40.49434280395508, "global_step": 140352, "epoch": 1159} {"train_loss": -39.68259811401367, "global_step": 140353, "epoch": 1159} {"train_loss": -39.78824996948242, "global_step": 140354, "epoch": 1159} {"train_loss": -40.183048248291016, "global_step": 140355, "epoch": 1159} {"train_loss": -35.05356979370117, "global_step": 140356, "epoch": 1159} {"train_loss": -40.3297119140625, "global_step": 140357, "epoch": 1159} {"train_loss": -40.073368072509766, "global_step": 140358, "epoch": 1159} {"train_loss": -40.15050673681842, "global_step": 140359, "epoch": 1159, "val_loss": 3678705.25} {"train_loss": -39.26375961303711, "global_step": 140360, "epoch": 1160} {"train_loss": -38.61004638671875, "global_step": 140361, "epoch": 1160} {"train_loss": -34.86040115356445, "global_step": 140362, "epoch": 1160} {"train_loss": -36.67478561401367, "global_step": 140363, "epoch": 1160} {"train_loss": -37.17123031616211, "global_step": 140364, "epoch": 1160} {"train_loss": -36.28094482421875, "global_step": 140365, "epoch": 1160} {"train_loss": -35.56315231323242, "global_step": 140366, "epoch": 1160} {"train_loss": -39.847938537597656, "global_step": 140367, "epoch": 1160} {"train_loss": -38.1504020690918, "global_step": 140368, "epoch": 1160} {"train_loss": -35.9781379699707, "global_step": 140369, "epoch": 1160} {"train_loss": -36.161834716796875, "global_step": 140370, "epoch": 1160} {"train_loss": -39.023597717285156, "global_step": 140371, "epoch": 1160} {"train_loss": -38.768985748291016, "global_step": 140372, "epoch": 1160} {"train_loss": -36.78279495239258, "global_step": 140373, "epoch": 1160} {"train_loss": -38.03675842285156, "global_step": 140374, "epoch": 1160} {"train_loss": -38.14669418334961, "global_step": 140375, "epoch": 1160} {"train_loss": -40.26816940307617, "global_step": 140376, "epoch": 1160} {"train_loss": -37.43733596801758, "global_step": 140377, "epoch": 1160} {"train_loss": -38.703060150146484, "global_step": 140378, "epoch": 1160} {"train_loss": -38.57680892944336, "global_step": 140379, "epoch": 1160} {"train_loss": -39.631813049316406, "global_step": 140380, "epoch": 1160} {"train_loss": -38.755531311035156, "global_step": 140381, "epoch": 1160} {"train_loss": -39.3395881652832, "global_step": 140382, "epoch": 1160} {"train_loss": -39.480751037597656, "global_step": 140383, "epoch": 1160} {"train_loss": -39.06147384643555, "global_step": 140384, "epoch": 1160} {"train_loss": -39.296730041503906, "global_step": 140385, "epoch": 1160} {"train_loss": -38.07406997680664, "global_step": 140386, "epoch": 1160} {"train_loss": -39.05569076538086, "global_step": 140387, "epoch": 1160} {"train_loss": -39.790626525878906, "global_step": 140388, "epoch": 1160} {"train_loss": -39.73405075073242, "global_step": 140389, "epoch": 1160} {"train_loss": -37.25364303588867, "global_step": 140390, "epoch": 1160} {"train_loss": -38.62361526489258, "global_step": 140391, "epoch": 1160} {"train_loss": -39.86641311645508, "global_step": 140392, "epoch": 1160} {"train_loss": -39.11979293823242, "global_step": 140393, "epoch": 1160} {"train_loss": -38.8663330078125, "global_step": 140394, "epoch": 1160} {"train_loss": -40.38210678100586, "global_step": 140395, "epoch": 1160} {"train_loss": -39.307716369628906, "global_step": 140396, "epoch": 1160} {"train_loss": -40.58660888671875, "global_step": 140397, "epoch": 1160} {"train_loss": -40.12958526611328, "global_step": 140398, "epoch": 1160} {"train_loss": -40.59912872314453, "global_step": 140399, "epoch": 1160} {"train_loss": -39.827388763427734, "global_step": 140400, "epoch": 1160} {"train_loss": -40.831783294677734, "global_step": 140401, "epoch": 1160} {"train_loss": -40.14496994018555, "global_step": 140402, "epoch": 1160} {"train_loss": -39.84066390991211, "global_step": 140403, "epoch": 1160} {"train_loss": -40.543575286865234, "global_step": 140404, "epoch": 1160} {"train_loss": -40.76548385620117, "global_step": 140405, "epoch": 1160} {"train_loss": -40.566131591796875, "global_step": 140406, "epoch": 1160} {"train_loss": -41.13129425048828, "global_step": 140407, "epoch": 1160} {"train_loss": -40.948909759521484, "global_step": 140408, "epoch": 1160} {"train_loss": -40.1246452331543, "global_step": 140409, "epoch": 1160} {"train_loss": -40.48362731933594, "global_step": 140410, "epoch": 1160} {"train_loss": -40.240291595458984, "global_step": 140411, "epoch": 1160} {"train_loss": -40.842132568359375, "global_step": 140412, "epoch": 1160} {"train_loss": -39.85373306274414, "global_step": 140413, "epoch": 1160} {"train_loss": -40.906673431396484, "global_step": 140414, "epoch": 1160} {"train_loss": -40.35380172729492, "global_step": 140415, "epoch": 1160} {"train_loss": -40.771240234375, "global_step": 140416, "epoch": 1160} {"train_loss": -40.0414924621582, "global_step": 140417, "epoch": 1160} {"train_loss": -40.86003875732422, "global_step": 140418, "epoch": 1160} {"train_loss": -40.80440139770508, "global_step": 140419, "epoch": 1160} {"train_loss": -40.5332145690918, "global_step": 140420, "epoch": 1160} {"train_loss": -39.81174087524414, "global_step": 140421, "epoch": 1160} {"train_loss": -39.817108154296875, "global_step": 140422, "epoch": 1160} {"train_loss": -40.19283676147461, "global_step": 140423, "epoch": 1160} {"train_loss": -40.843990325927734, "global_step": 140424, "epoch": 1160} {"train_loss": -39.70736312866211, "global_step": 140425, "epoch": 1160} {"train_loss": -39.45414352416992, "global_step": 140426, "epoch": 1160} {"train_loss": -39.88153839111328, "global_step": 140427, "epoch": 1160} {"train_loss": -38.31265640258789, "global_step": 140428, "epoch": 1160} {"train_loss": -40.8112907409668, "global_step": 140429, "epoch": 1160} {"train_loss": -38.57413864135742, "global_step": 140430, "epoch": 1160} {"train_loss": -40.37667465209961, "global_step": 140431, "epoch": 1160} {"train_loss": -39.1334114074707, "global_step": 140432, "epoch": 1160} {"train_loss": -39.49384689331055, "global_step": 140433, "epoch": 1160} {"train_loss": -40.94685363769531, "global_step": 140434, "epoch": 1160} {"train_loss": -39.84363555908203, "global_step": 140435, "epoch": 1160} {"train_loss": -40.68609619140625, "global_step": 140436, "epoch": 1160} {"train_loss": -40.366371154785156, "global_step": 140437, "epoch": 1160} {"train_loss": -40.5521354675293, "global_step": 140438, "epoch": 1160} {"train_loss": -40.80751419067383, "global_step": 140439, "epoch": 1160} {"train_loss": -39.95895004272461, "global_step": 140440, "epoch": 1160} {"train_loss": -40.66958999633789, "global_step": 140441, "epoch": 1160} {"train_loss": -40.373138427734375, "global_step": 140442, "epoch": 1160} {"train_loss": -40.17002487182617, "global_step": 140443, "epoch": 1160} {"train_loss": -40.258949279785156, "global_step": 140444, "epoch": 1160} {"train_loss": -39.86865997314453, "global_step": 140445, "epoch": 1160} {"train_loss": -39.66888427734375, "global_step": 140446, "epoch": 1160} {"train_loss": -40.843360900878906, "global_step": 140447, "epoch": 1160} {"train_loss": -37.69999313354492, "global_step": 140448, "epoch": 1160} {"train_loss": -39.4437370300293, "global_step": 140449, "epoch": 1160} {"train_loss": -40.4160041809082, "global_step": 140450, "epoch": 1160} {"train_loss": -40.64080810546875, "global_step": 140451, "epoch": 1160} {"train_loss": -40.23704147338867, "global_step": 140452, "epoch": 1160} {"train_loss": -40.153690338134766, "global_step": 140453, "epoch": 1160} {"train_loss": -39.97175979614258, "global_step": 140454, "epoch": 1160} {"train_loss": -40.432064056396484, "global_step": 140455, "epoch": 1160} {"train_loss": -40.822723388671875, "global_step": 140456, "epoch": 1160} {"train_loss": -41.12368392944336, "global_step": 140457, "epoch": 1160} {"train_loss": -41.19782257080078, "global_step": 140458, "epoch": 1160} {"train_loss": -40.52657699584961, "global_step": 140459, "epoch": 1160} {"train_loss": -39.959556579589844, "global_step": 140460, "epoch": 1160} {"train_loss": -40.835487365722656, "global_step": 140461, "epoch": 1160} {"train_loss": -41.27364730834961, "global_step": 140462, "epoch": 1160} {"train_loss": -40.515132904052734, "global_step": 140463, "epoch": 1160} {"train_loss": -39.54733657836914, "global_step": 140464, "epoch": 1160} {"train_loss": -38.485618591308594, "global_step": 140465, "epoch": 1160} {"train_loss": -38.1422004699707, "global_step": 140466, "epoch": 1160} {"train_loss": -38.52315902709961, "global_step": 140467, "epoch": 1160} {"train_loss": -39.87346267700195, "global_step": 140468, "epoch": 1160} {"train_loss": -40.8072624206543, "global_step": 140469, "epoch": 1160} {"train_loss": -40.868202209472656, "global_step": 140470, "epoch": 1160} {"train_loss": -38.0233039855957, "global_step": 140471, "epoch": 1160} {"train_loss": -38.420711517333984, "global_step": 140472, "epoch": 1160} {"train_loss": -39.66236114501953, "global_step": 140473, "epoch": 1160} {"train_loss": -40.084224700927734, "global_step": 140474, "epoch": 1160} {"train_loss": -40.02880859375, "global_step": 140475, "epoch": 1160} {"train_loss": -37.2110710144043, "global_step": 140476, "epoch": 1160} {"train_loss": -37.512996673583984, "global_step": 140477, "epoch": 1160} {"train_loss": -38.26457214355469, "global_step": 140478, "epoch": 1160} {"train_loss": -40.40647506713867, "global_step": 140479, "epoch": 1160} {"train_loss": -39.53004004738548, "global_step": 140480, "epoch": 1160, "val_loss": 2580699.25} {"train_loss": -40.53708267211914, "global_step": 140481, "epoch": 1161} {"train_loss": -39.13518142700195, "global_step": 140482, "epoch": 1161} {"train_loss": -38.033180236816406, "global_step": 140483, "epoch": 1161} {"train_loss": -40.4113655090332, "global_step": 140484, "epoch": 1161} {"train_loss": -38.288978576660156, "global_step": 140485, "epoch": 1161} {"train_loss": -37.5703239440918, "global_step": 140486, "epoch": 1161} {"train_loss": -40.14483642578125, "global_step": 140487, "epoch": 1161} {"train_loss": -38.96220779418945, "global_step": 140488, "epoch": 1161} {"train_loss": -39.72329330444336, "global_step": 140489, "epoch": 1161} {"train_loss": -38.445716857910156, "global_step": 140490, "epoch": 1161} {"train_loss": -39.141448974609375, "global_step": 140491, "epoch": 1161} {"train_loss": -38.61624526977539, "global_step": 140492, "epoch": 1161} {"train_loss": -40.75649642944336, "global_step": 140493, "epoch": 1161} {"train_loss": -39.398353576660156, "global_step": 140494, "epoch": 1161} {"train_loss": -39.22230911254883, "global_step": 140495, "epoch": 1161} {"train_loss": -38.5734748840332, "global_step": 140496, "epoch": 1161} {"train_loss": -38.046653747558594, "global_step": 140497, "epoch": 1161} {"train_loss": -39.27339553833008, "global_step": 140498, "epoch": 1161} {"train_loss": -40.03181457519531, "global_step": 140499, "epoch": 1161} {"train_loss": -39.62689208984375, "global_step": 140500, "epoch": 1161} {"train_loss": -40.1519889831543, "global_step": 140501, "epoch": 1161} {"train_loss": -38.58264923095703, "global_step": 140502, "epoch": 1161} {"train_loss": -38.83437728881836, "global_step": 140503, "epoch": 1161} {"train_loss": -38.45728302001953, "global_step": 140504, "epoch": 1161} {"train_loss": -39.24580001831055, "global_step": 140505, "epoch": 1161} {"train_loss": -37.89291000366211, "global_step": 140506, "epoch": 1161} {"train_loss": -39.83720016479492, "global_step": 140507, "epoch": 1161} {"train_loss": -37.710914611816406, "global_step": 140508, "epoch": 1161} {"train_loss": -38.70355224609375, "global_step": 140509, "epoch": 1161} {"train_loss": -39.09297561645508, "global_step": 140510, "epoch": 1161} {"train_loss": -38.57086181640625, "global_step": 140511, "epoch": 1161} {"train_loss": -38.72734832763672, "global_step": 140512, "epoch": 1161} {"train_loss": -39.894893646240234, "global_step": 140513, "epoch": 1161} {"train_loss": -39.0598030090332, "global_step": 140514, "epoch": 1161} {"train_loss": -38.463623046875, "global_step": 140515, "epoch": 1161} {"train_loss": -40.056190490722656, "global_step": 140516, "epoch": 1161} {"train_loss": -39.164581298828125, "global_step": 140517, "epoch": 1161} {"train_loss": -39.8659782409668, "global_step": 140518, "epoch": 1161} {"train_loss": -40.19504928588867, "global_step": 140519, "epoch": 1161} {"train_loss": -38.936527252197266, "global_step": 140520, "epoch": 1161} {"train_loss": -40.248085021972656, "global_step": 140521, "epoch": 1161} {"train_loss": -40.2030029296875, "global_step": 140522, "epoch": 1161} {"train_loss": -39.97097396850586, "global_step": 140523, "epoch": 1161} {"train_loss": -40.463340759277344, "global_step": 140524, "epoch": 1161} {"train_loss": -40.357872009277344, "global_step": 140525, "epoch": 1161} {"train_loss": -40.710968017578125, "global_step": 140526, "epoch": 1161} {"train_loss": -40.32814407348633, "global_step": 140527, "epoch": 1161} {"train_loss": -40.71955490112305, "global_step": 140528, "epoch": 1161} {"train_loss": -40.37407684326172, "global_step": 140529, "epoch": 1161} {"train_loss": -40.89326095581055, "global_step": 140530, "epoch": 1161} {"train_loss": -40.8953742980957, "global_step": 140531, "epoch": 1161} {"train_loss": -41.4775390625, "global_step": 140532, "epoch": 1161} {"train_loss": -40.566410064697266, "global_step": 140533, "epoch": 1161} {"train_loss": -41.042293548583984, "global_step": 140534, "epoch": 1161} {"train_loss": -41.220428466796875, "global_step": 140535, "epoch": 1161} {"train_loss": -40.580413818359375, "global_step": 140536, "epoch": 1161} {"train_loss": -41.479835510253906, "global_step": 140537, "epoch": 1161} {"train_loss": -41.1819953918457, "global_step": 140538, "epoch": 1161} {"train_loss": -40.76347732543945, "global_step": 140539, "epoch": 1161} {"train_loss": -41.4389762878418, "global_step": 140540, "epoch": 1161} {"train_loss": -41.13621139526367, "global_step": 140541, "epoch": 1161} {"train_loss": -40.9743537902832, "global_step": 140542, "epoch": 1161} {"train_loss": -41.360939025878906, "global_step": 140543, "epoch": 1161} {"train_loss": -40.942298889160156, "global_step": 140544, "epoch": 1161} {"train_loss": -40.70124435424805, "global_step": 140545, "epoch": 1161} {"train_loss": -40.9206428527832, "global_step": 140546, "epoch": 1161} {"train_loss": -41.29554748535156, "global_step": 140547, "epoch": 1161} {"train_loss": -40.90424346923828, "global_step": 140548, "epoch": 1161} {"train_loss": -41.28200912475586, "global_step": 140549, "epoch": 1161} {"train_loss": -41.2437858581543, "global_step": 140550, "epoch": 1161} {"train_loss": -41.11837387084961, "global_step": 140551, "epoch": 1161} {"train_loss": -40.600921630859375, "global_step": 140552, "epoch": 1161} {"train_loss": -41.456661224365234, "global_step": 140553, "epoch": 1161} {"train_loss": -41.18319320678711, "global_step": 140554, "epoch": 1161} {"train_loss": -41.18687057495117, "global_step": 140555, "epoch": 1161} {"train_loss": -41.61428451538086, "global_step": 140556, "epoch": 1161} {"train_loss": -41.20832443237305, "global_step": 140557, "epoch": 1161} {"train_loss": -40.773502349853516, "global_step": 140558, "epoch": 1161} {"train_loss": -40.58228302001953, "global_step": 140559, "epoch": 1161} {"train_loss": -41.29091262817383, "global_step": 140560, "epoch": 1161} {"train_loss": -40.98236083984375, "global_step": 140561, "epoch": 1161} {"train_loss": -40.24860382080078, "global_step": 140562, "epoch": 1161} {"train_loss": -40.89417266845703, "global_step": 140563, "epoch": 1161} {"train_loss": -40.63669967651367, "global_step": 140564, "epoch": 1161} {"train_loss": -39.445011138916016, "global_step": 140565, "epoch": 1161} {"train_loss": -39.68805694580078, "global_step": 140566, "epoch": 1161} {"train_loss": -40.52584457397461, "global_step": 140567, "epoch": 1161} {"train_loss": -39.1050910949707, "global_step": 140568, "epoch": 1161} {"train_loss": -39.43895721435547, "global_step": 140569, "epoch": 1161} {"train_loss": -40.41771697998047, "global_step": 140570, "epoch": 1161} {"train_loss": -39.06916427612305, "global_step": 140571, "epoch": 1161} {"train_loss": -39.2651252746582, "global_step": 140572, "epoch": 1161} {"train_loss": -40.43109130859375, "global_step": 140573, "epoch": 1161} {"train_loss": -39.75865173339844, "global_step": 140574, "epoch": 1161} {"train_loss": -37.75580978393555, "global_step": 140575, "epoch": 1161} {"train_loss": -38.69880294799805, "global_step": 140576, "epoch": 1161} {"train_loss": -39.788246154785156, "global_step": 140577, "epoch": 1161} {"train_loss": -38.57802963256836, "global_step": 140578, "epoch": 1161} {"train_loss": -40.47811508178711, "global_step": 140579, "epoch": 1161} {"train_loss": -39.897430419921875, "global_step": 140580, "epoch": 1161} {"train_loss": -37.526153564453125, "global_step": 140581, "epoch": 1161} {"train_loss": -39.619873046875, "global_step": 140582, "epoch": 1161} {"train_loss": -39.416744232177734, "global_step": 140583, "epoch": 1161} {"train_loss": -39.436458587646484, "global_step": 140584, "epoch": 1161} {"train_loss": -38.586116790771484, "global_step": 140585, "epoch": 1161} {"train_loss": -36.517181396484375, "global_step": 140586, "epoch": 1161} {"train_loss": -40.662513732910156, "global_step": 140587, "epoch": 1161} {"train_loss": -36.47904968261719, "global_step": 140588, "epoch": 1161} {"train_loss": -37.62949752807617, "global_step": 140589, "epoch": 1161} {"train_loss": -38.9720344543457, "global_step": 140590, "epoch": 1161} {"train_loss": -38.655982971191406, "global_step": 140591, "epoch": 1161} {"train_loss": -37.85206604003906, "global_step": 140592, "epoch": 1161} {"train_loss": -39.67262268066406, "global_step": 140593, "epoch": 1161} {"train_loss": -38.88264846801758, "global_step": 140594, "epoch": 1161} {"train_loss": -38.28609085083008, "global_step": 140595, "epoch": 1161} {"train_loss": -40.191131591796875, "global_step": 140596, "epoch": 1161} {"train_loss": -37.49679183959961, "global_step": 140597, "epoch": 1161} {"train_loss": -39.53028106689453, "global_step": 140598, "epoch": 1161} {"train_loss": -37.66288757324219, "global_step": 140599, "epoch": 1161} {"train_loss": -38.8111572265625, "global_step": 140600, "epoch": 1161} {"train_loss": -39.73105451095203, "global_step": 140601, "epoch": 1161, "val_loss": 2398655.25} {"train_loss": -37.9849967956543, "global_step": 140602, "epoch": 1162} {"train_loss": -38.960689544677734, "global_step": 140603, "epoch": 1162} {"train_loss": -39.395484924316406, "global_step": 140604, "epoch": 1162} {"train_loss": -38.56852340698242, "global_step": 140605, "epoch": 1162} {"train_loss": -39.28940963745117, "global_step": 140606, "epoch": 1162} {"train_loss": -39.99093246459961, "global_step": 140607, "epoch": 1162} {"train_loss": -38.860042572021484, "global_step": 140608, "epoch": 1162} {"train_loss": -38.856903076171875, "global_step": 140609, "epoch": 1162} {"train_loss": -38.45576477050781, "global_step": 140610, "epoch": 1162} {"train_loss": -39.37531661987305, "global_step": 140611, "epoch": 1162} {"train_loss": -39.76560592651367, "global_step": 140612, "epoch": 1162} {"train_loss": -40.33898162841797, "global_step": 140613, "epoch": 1162} {"train_loss": -39.67824935913086, "global_step": 140614, "epoch": 1162} {"train_loss": -40.64723587036133, "global_step": 140615, "epoch": 1162} {"train_loss": -39.824161529541016, "global_step": 140616, "epoch": 1162} {"train_loss": -40.996315002441406, "global_step": 140617, "epoch": 1162} {"train_loss": -40.163002014160156, "global_step": 140618, "epoch": 1162} {"train_loss": -39.769954681396484, "global_step": 140619, "epoch": 1162} {"train_loss": -40.51007843017578, "global_step": 140620, "epoch": 1162} {"train_loss": -40.4198112487793, "global_step": 140621, "epoch": 1162} {"train_loss": -40.88819885253906, "global_step": 140622, "epoch": 1162} {"train_loss": -40.41800308227539, "global_step": 140623, "epoch": 1162} {"train_loss": -40.88389205932617, "global_step": 140624, "epoch": 1162} {"train_loss": -40.92715072631836, "global_step": 140625, "epoch": 1162} {"train_loss": -40.98258590698242, "global_step": 140626, "epoch": 1162} {"train_loss": -40.54966735839844, "global_step": 140627, "epoch": 1162} {"train_loss": -40.679527282714844, "global_step": 140628, "epoch": 1162} {"train_loss": -40.58488082885742, "global_step": 140629, "epoch": 1162} {"train_loss": -40.9714241027832, "global_step": 140630, "epoch": 1162} {"train_loss": -40.687652587890625, "global_step": 140631, "epoch": 1162} {"train_loss": -40.727394104003906, "global_step": 140632, "epoch": 1162} {"train_loss": -41.0189323425293, "global_step": 140633, "epoch": 1162} {"train_loss": -40.833805084228516, "global_step": 140634, "epoch": 1162} {"train_loss": -40.3421745300293, "global_step": 140635, "epoch": 1162} {"train_loss": -41.256011962890625, "global_step": 140636, "epoch": 1162} {"train_loss": -40.697174072265625, "global_step": 140637, "epoch": 1162} {"train_loss": -40.73670196533203, "global_step": 140638, "epoch": 1162} {"train_loss": -41.34344482421875, "global_step": 140639, "epoch": 1162} {"train_loss": -41.41215896606445, "global_step": 140640, "epoch": 1162} {"train_loss": -40.34688949584961, "global_step": 140641, "epoch": 1162} {"train_loss": -41.0152587890625, "global_step": 140642, "epoch": 1162} {"train_loss": -41.47576904296875, "global_step": 140643, "epoch": 1162} {"train_loss": -40.870479583740234, "global_step": 140644, "epoch": 1162} {"train_loss": -40.78237533569336, "global_step": 140645, "epoch": 1162} {"train_loss": -40.590576171875, "global_step": 140646, "epoch": 1162} {"train_loss": -41.55263900756836, "global_step": 140647, "epoch": 1162} {"train_loss": -41.02471160888672, "global_step": 140648, "epoch": 1162} {"train_loss": -40.93408203125, "global_step": 140649, "epoch": 1162} {"train_loss": -41.483497619628906, "global_step": 140650, "epoch": 1162} {"train_loss": -41.0789680480957, "global_step": 140651, "epoch": 1162} {"train_loss": -40.136104583740234, "global_step": 140652, "epoch": 1162} {"train_loss": -40.119693756103516, "global_step": 140653, "epoch": 1162} {"train_loss": -40.127967834472656, "global_step": 140654, "epoch": 1162} {"train_loss": -40.49147415161133, "global_step": 140655, "epoch": 1162} {"train_loss": -40.219512939453125, "global_step": 140656, "epoch": 1162} {"train_loss": -40.02157211303711, "global_step": 140657, "epoch": 1162} {"train_loss": -40.87567138671875, "global_step": 140658, "epoch": 1162} {"train_loss": -41.9170036315918, "global_step": 140659, "epoch": 1162} {"train_loss": -40.886898040771484, "global_step": 140660, "epoch": 1162} {"train_loss": -40.827999114990234, "global_step": 140661, "epoch": 1162} {"train_loss": -40.6869010925293, "global_step": 140662, "epoch": 1162} {"train_loss": -40.803524017333984, "global_step": 140663, "epoch": 1162} {"train_loss": -40.66592025756836, "global_step": 140664, "epoch": 1162} {"train_loss": -40.46794509887695, "global_step": 140665, "epoch": 1162} {"train_loss": -40.29775619506836, "global_step": 140666, "epoch": 1162} {"train_loss": -40.120697021484375, "global_step": 140667, "epoch": 1162} {"train_loss": -39.19636917114258, "global_step": 140668, "epoch": 1162} {"train_loss": -38.80704879760742, "global_step": 140669, "epoch": 1162} {"train_loss": -39.874515533447266, "global_step": 140670, "epoch": 1162} {"train_loss": -40.330078125, "global_step": 140671, "epoch": 1162} {"train_loss": -41.107818603515625, "global_step": 140672, "epoch": 1162} {"train_loss": -40.71757125854492, "global_step": 140673, "epoch": 1162} {"train_loss": -39.851966857910156, "global_step": 140674, "epoch": 1162} {"train_loss": -39.55731964111328, "global_step": 140675, "epoch": 1162} {"train_loss": -40.5868034362793, "global_step": 140676, "epoch": 1162} {"train_loss": -39.4339485168457, "global_step": 140677, "epoch": 1162} {"train_loss": -37.6233024597168, "global_step": 140678, "epoch": 1162} {"train_loss": -40.41317367553711, "global_step": 140679, "epoch": 1162} {"train_loss": -41.14847946166992, "global_step": 140680, "epoch": 1162} {"train_loss": -40.19271469116211, "global_step": 140681, "epoch": 1162} {"train_loss": -38.80549240112305, "global_step": 140682, "epoch": 1162} {"train_loss": -40.11662673950195, "global_step": 140683, "epoch": 1162} {"train_loss": -41.007930755615234, "global_step": 140684, "epoch": 1162} {"train_loss": -38.91375732421875, "global_step": 140685, "epoch": 1162} {"train_loss": -39.32846450805664, "global_step": 140686, "epoch": 1162} {"train_loss": -40.597023010253906, "global_step": 140687, "epoch": 1162} {"train_loss": -40.85969161987305, "global_step": 140688, "epoch": 1162} {"train_loss": -41.26618194580078, "global_step": 140689, "epoch": 1162} {"train_loss": -40.927528381347656, "global_step": 140690, "epoch": 1162} {"train_loss": -41.04063034057617, "global_step": 140691, "epoch": 1162} {"train_loss": -41.080657958984375, "global_step": 140692, "epoch": 1162} {"train_loss": -41.1357307434082, "global_step": 140693, "epoch": 1162} {"train_loss": -41.19343185424805, "global_step": 140694, "epoch": 1162} {"train_loss": -40.41056823730469, "global_step": 140695, "epoch": 1162} {"train_loss": -40.925724029541016, "global_step": 140696, "epoch": 1162} {"train_loss": -40.94099426269531, "global_step": 140697, "epoch": 1162} {"train_loss": -40.77950668334961, "global_step": 140698, "epoch": 1162} {"train_loss": -40.4265022277832, "global_step": 140699, "epoch": 1162} {"train_loss": -41.13250732421875, "global_step": 140700, "epoch": 1162} {"train_loss": -38.399112701416016, "global_step": 140701, "epoch": 1162} {"train_loss": -39.806861877441406, "global_step": 140702, "epoch": 1162} {"train_loss": -41.496212005615234, "global_step": 140703, "epoch": 1162} {"train_loss": -37.78386306762695, "global_step": 140704, "epoch": 1162} {"train_loss": -35.78266525268555, "global_step": 140705, "epoch": 1162} {"train_loss": -40.31988525390625, "global_step": 140706, "epoch": 1162} {"train_loss": -37.181365966796875, "global_step": 140707, "epoch": 1162} {"train_loss": -37.643341064453125, "global_step": 140708, "epoch": 1162} {"train_loss": -39.88740921020508, "global_step": 140709, "epoch": 1162} {"train_loss": -35.59425735473633, "global_step": 140710, "epoch": 1162} {"train_loss": -40.41617202758789, "global_step": 140711, "epoch": 1162} {"train_loss": -36.34833526611328, "global_step": 140712, "epoch": 1162} {"train_loss": -37.169490814208984, "global_step": 140713, "epoch": 1162} {"train_loss": -38.00710678100586, "global_step": 140714, "epoch": 1162} {"train_loss": -35.70186233520508, "global_step": 140715, "epoch": 1162} {"train_loss": -39.70284652709961, "global_step": 140716, "epoch": 1162} {"train_loss": -37.23244094848633, "global_step": 140717, "epoch": 1162} {"train_loss": -39.176143646240234, "global_step": 140718, "epoch": 1162} {"train_loss": -39.96162414550781, "global_step": 140719, "epoch": 1162} {"train_loss": -39.41146469116211, "global_step": 140720, "epoch": 1162} {"train_loss": -39.694374084472656, "global_step": 140721, "epoch": 1162} {"train_loss": -40.031560882063935, "global_step": 140722, "epoch": 1162, "val_loss": 2732496.0} {"train_loss": -39.49583053588867, "global_step": 140723, "epoch": 1163} {"train_loss": -40.53745651245117, "global_step": 140724, "epoch": 1163} {"train_loss": -39.75941467285156, "global_step": 140725, "epoch": 1163} {"train_loss": -40.73305892944336, "global_step": 140726, "epoch": 1163} {"train_loss": -39.93697738647461, "global_step": 140727, "epoch": 1163} {"train_loss": -40.31648254394531, "global_step": 140728, "epoch": 1163} {"train_loss": -40.66769027709961, "global_step": 140729, "epoch": 1163} {"train_loss": -39.43773651123047, "global_step": 140730, "epoch": 1163} {"train_loss": -41.11720275878906, "global_step": 140731, "epoch": 1163} {"train_loss": -40.061702728271484, "global_step": 140732, "epoch": 1163} {"train_loss": -40.802894592285156, "global_step": 140733, "epoch": 1163} {"train_loss": -39.94004440307617, "global_step": 140734, "epoch": 1163} {"train_loss": -39.803070068359375, "global_step": 140735, "epoch": 1163} {"train_loss": -39.75338363647461, "global_step": 140736, "epoch": 1163} {"train_loss": -39.748531341552734, "global_step": 140737, "epoch": 1163} {"train_loss": -40.15802001953125, "global_step": 140738, "epoch": 1163} {"train_loss": -40.4822998046875, "global_step": 140739, "epoch": 1163} {"train_loss": -39.247859954833984, "global_step": 140740, "epoch": 1163} {"train_loss": -39.9088020324707, "global_step": 140741, "epoch": 1163} {"train_loss": -40.23550033569336, "global_step": 140742, "epoch": 1163} {"train_loss": -40.430908203125, "global_step": 140743, "epoch": 1163} {"train_loss": -39.493553161621094, "global_step": 140744, "epoch": 1163} {"train_loss": -38.709938049316406, "global_step": 140745, "epoch": 1163} {"train_loss": -40.35515213012695, "global_step": 140746, "epoch": 1163} {"train_loss": -40.2331657409668, "global_step": 140747, "epoch": 1163} {"train_loss": -40.0477180480957, "global_step": 140748, "epoch": 1163} {"train_loss": -40.096282958984375, "global_step": 140749, "epoch": 1163} {"train_loss": -40.70137405395508, "global_step": 140750, "epoch": 1163} {"train_loss": -39.96202850341797, "global_step": 140751, "epoch": 1163} {"train_loss": -40.381103515625, "global_step": 140752, "epoch": 1163} {"train_loss": -40.103885650634766, "global_step": 140753, "epoch": 1163} {"train_loss": -40.67885208129883, "global_step": 140754, "epoch": 1163} {"train_loss": -40.656497955322266, "global_step": 140755, "epoch": 1163} {"train_loss": -40.61582946777344, "global_step": 140756, "epoch": 1163} {"train_loss": -40.36344528198242, "global_step": 140757, "epoch": 1163} {"train_loss": -40.88430404663086, "global_step": 140758, "epoch": 1163} {"train_loss": -40.81003189086914, "global_step": 140759, "epoch": 1163} {"train_loss": -40.567955017089844, "global_step": 140760, "epoch": 1163} {"train_loss": -41.03194808959961, "global_step": 140761, "epoch": 1163} {"train_loss": -40.43770217895508, "global_step": 140762, "epoch": 1163} {"train_loss": -40.625892639160156, "global_step": 140763, "epoch": 1163} {"train_loss": -41.39003372192383, "global_step": 140764, "epoch": 1163} {"train_loss": -41.139400482177734, "global_step": 140765, "epoch": 1163} {"train_loss": -41.138668060302734, "global_step": 140766, "epoch": 1163} {"train_loss": -40.69812774658203, "global_step": 140767, "epoch": 1163} {"train_loss": -41.04420852661133, "global_step": 140768, "epoch": 1163} {"train_loss": -40.63996887207031, "global_step": 140769, "epoch": 1163} {"train_loss": -40.90369415283203, "global_step": 140770, "epoch": 1163} {"train_loss": -40.59705352783203, "global_step": 140771, "epoch": 1163} {"train_loss": -41.00094985961914, "global_step": 140772, "epoch": 1163} {"train_loss": -41.61648178100586, "global_step": 140773, "epoch": 1163} {"train_loss": -41.33028793334961, "global_step": 140774, "epoch": 1163} {"train_loss": -40.19514083862305, "global_step": 140775, "epoch": 1163} {"train_loss": -40.82575988769531, "global_step": 140776, "epoch": 1163} {"train_loss": -41.668373107910156, "global_step": 140777, "epoch": 1163} {"train_loss": -41.32505416870117, "global_step": 140778, "epoch": 1163} {"train_loss": -41.215518951416016, "global_step": 140779, "epoch": 1163} {"train_loss": -40.856197357177734, "global_step": 140780, "epoch": 1163} {"train_loss": -40.432918548583984, "global_step": 140781, "epoch": 1163} {"train_loss": -39.938262939453125, "global_step": 140782, "epoch": 1163} {"train_loss": -40.68739700317383, "global_step": 140783, "epoch": 1163} {"train_loss": -41.24000930786133, "global_step": 140784, "epoch": 1163} {"train_loss": -41.101009368896484, "global_step": 140785, "epoch": 1163} {"train_loss": -40.9962043762207, "global_step": 140786, "epoch": 1163} {"train_loss": -40.60961151123047, "global_step": 140787, "epoch": 1163} {"train_loss": -41.30796432495117, "global_step": 140788, "epoch": 1163} {"train_loss": -41.23347854614258, "global_step": 140789, "epoch": 1163} {"train_loss": -41.343605041503906, "global_step": 140790, "epoch": 1163} {"train_loss": -41.368526458740234, "global_step": 140791, "epoch": 1163} {"train_loss": -41.38376998901367, "global_step": 140792, "epoch": 1163} {"train_loss": -41.042293548583984, "global_step": 140793, "epoch": 1163} {"train_loss": -40.743228912353516, "global_step": 140794, "epoch": 1163} {"train_loss": -39.96067428588867, "global_step": 140795, "epoch": 1163} {"train_loss": -40.330238342285156, "global_step": 140796, "epoch": 1163} {"train_loss": -40.53993225097656, "global_step": 140797, "epoch": 1163} {"train_loss": -40.72376251220703, "global_step": 140798, "epoch": 1163} {"train_loss": -41.80916213989258, "global_step": 140799, "epoch": 1163} {"train_loss": -41.784690856933594, "global_step": 140800, "epoch": 1163} {"train_loss": -40.638885498046875, "global_step": 140801, "epoch": 1163} {"train_loss": -40.40244674682617, "global_step": 140802, "epoch": 1163} {"train_loss": -41.34385681152344, "global_step": 140803, "epoch": 1163} {"train_loss": -41.57598876953125, "global_step": 140804, "epoch": 1163} {"train_loss": -41.58456039428711, "global_step": 140805, "epoch": 1163} {"train_loss": -40.230018615722656, "global_step": 140806, "epoch": 1163} {"train_loss": -39.99951171875, "global_step": 140807, "epoch": 1163} {"train_loss": -41.55989456176758, "global_step": 140808, "epoch": 1163} {"train_loss": -41.703460693359375, "global_step": 140809, "epoch": 1163} {"train_loss": -41.775691986083984, "global_step": 140810, "epoch": 1163} {"train_loss": -41.4254035949707, "global_step": 140811, "epoch": 1163} {"train_loss": -41.14040756225586, "global_step": 140812, "epoch": 1163} {"train_loss": -41.52368927001953, "global_step": 140813, "epoch": 1163} {"train_loss": -41.95369338989258, "global_step": 140814, "epoch": 1163} {"train_loss": -41.572792053222656, "global_step": 140815, "epoch": 1163} {"train_loss": -41.8474006652832, "global_step": 140816, "epoch": 1163} {"train_loss": -42.279109954833984, "global_step": 140817, "epoch": 1163} {"train_loss": -42.0452880859375, "global_step": 140818, "epoch": 1163} {"train_loss": -41.77456283569336, "global_step": 140819, "epoch": 1163} {"train_loss": -41.62992477416992, "global_step": 140820, "epoch": 1163} {"train_loss": -41.84641647338867, "global_step": 140821, "epoch": 1163} {"train_loss": -42.15744400024414, "global_step": 140822, "epoch": 1163} {"train_loss": -41.47895431518555, "global_step": 140823, "epoch": 1163} {"train_loss": -41.17789840698242, "global_step": 140824, "epoch": 1163} {"train_loss": -40.794044494628906, "global_step": 140825, "epoch": 1163} {"train_loss": -40.765602111816406, "global_step": 140826, "epoch": 1163} {"train_loss": -40.59833908081055, "global_step": 140827, "epoch": 1163} {"train_loss": -41.32986068725586, "global_step": 140828, "epoch": 1163} {"train_loss": -41.735107421875, "global_step": 140829, "epoch": 1163} {"train_loss": -41.167724609375, "global_step": 140830, "epoch": 1163} {"train_loss": -39.1121711730957, "global_step": 140831, "epoch": 1163} {"train_loss": -37.135738372802734, "global_step": 140832, "epoch": 1163} {"train_loss": -37.77959060668945, "global_step": 140833, "epoch": 1163} {"train_loss": -40.112789154052734, "global_step": 140834, "epoch": 1163} {"train_loss": -40.03095626831055, "global_step": 140835, "epoch": 1163} {"train_loss": -39.16081619262695, "global_step": 140836, "epoch": 1163} {"train_loss": -38.25059127807617, "global_step": 140837, "epoch": 1163} {"train_loss": -39.44364547729492, "global_step": 140838, "epoch": 1163} {"train_loss": -40.80073165893555, "global_step": 140839, "epoch": 1163} {"train_loss": -39.64883041381836, "global_step": 140840, "epoch": 1163} {"train_loss": -36.12765121459961, "global_step": 140841, "epoch": 1163} {"train_loss": -38.26609802246094, "global_step": 140842, "epoch": 1163} {"train_loss": -40.596766290585855, "global_step": 140843, "epoch": 1163, "val_loss": 2493210.25} {"train_loss": -38.43848419189453, "global_step": 140844, "epoch": 1164} {"train_loss": -37.80810546875, "global_step": 140845, "epoch": 1164} {"train_loss": -37.105812072753906, "global_step": 140846, "epoch": 1164} {"train_loss": -38.1378173828125, "global_step": 140847, "epoch": 1164} {"train_loss": -38.59386444091797, "global_step": 140848, "epoch": 1164} {"train_loss": -36.021846771240234, "global_step": 140849, "epoch": 1164} {"train_loss": -34.70352554321289, "global_step": 140850, "epoch": 1164} {"train_loss": -37.8708610534668, "global_step": 140851, "epoch": 1164} {"train_loss": -36.95502853393555, "global_step": 140852, "epoch": 1164} {"train_loss": -37.68278121948242, "global_step": 140853, "epoch": 1164} {"train_loss": -36.039039611816406, "global_step": 140854, "epoch": 1164} {"train_loss": -37.72534942626953, "global_step": 140855, "epoch": 1164} {"train_loss": -39.06034851074219, "global_step": 140856, "epoch": 1164} {"train_loss": -39.288665771484375, "global_step": 140857, "epoch": 1164} {"train_loss": -38.48380661010742, "global_step": 140858, "epoch": 1164} {"train_loss": -39.023048400878906, "global_step": 140859, "epoch": 1164} {"train_loss": -39.78315353393555, "global_step": 140860, "epoch": 1164} {"train_loss": -39.667049407958984, "global_step": 140861, "epoch": 1164} {"train_loss": -39.67427062988281, "global_step": 140862, "epoch": 1164} {"train_loss": -40.08844757080078, "global_step": 140863, "epoch": 1164} {"train_loss": -39.933773040771484, "global_step": 140864, "epoch": 1164} {"train_loss": -39.9206428527832, "global_step": 140865, "epoch": 1164} {"train_loss": -40.28364944458008, "global_step": 140866, "epoch": 1164} {"train_loss": -40.20643997192383, "global_step": 140867, "epoch": 1164} {"train_loss": -39.901161193847656, "global_step": 140868, "epoch": 1164} {"train_loss": -40.06459426879883, "global_step": 140869, "epoch": 1164} {"train_loss": -39.419952392578125, "global_step": 140870, "epoch": 1164} {"train_loss": -39.86819076538086, "global_step": 140871, "epoch": 1164} {"train_loss": -40.26805877685547, "global_step": 140872, "epoch": 1164} {"train_loss": -40.09790802001953, "global_step": 140873, "epoch": 1164} {"train_loss": -40.48450469970703, "global_step": 140874, "epoch": 1164} {"train_loss": -40.480342864990234, "global_step": 140875, "epoch": 1164} {"train_loss": -40.689247131347656, "global_step": 140876, "epoch": 1164} {"train_loss": -40.03632354736328, "global_step": 140877, "epoch": 1164} {"train_loss": -39.905609130859375, "global_step": 140878, "epoch": 1164} {"train_loss": -40.2905387878418, "global_step": 140879, "epoch": 1164} {"train_loss": -40.73438262939453, "global_step": 140880, "epoch": 1164} {"train_loss": -40.6236686706543, "global_step": 140881, "epoch": 1164} {"train_loss": -40.13295364379883, "global_step": 140882, "epoch": 1164} {"train_loss": -40.48430252075195, "global_step": 140883, "epoch": 1164} {"train_loss": -40.85663986206055, "global_step": 140884, "epoch": 1164} {"train_loss": -40.521968841552734, "global_step": 140885, "epoch": 1164} {"train_loss": -41.49440383911133, "global_step": 140886, "epoch": 1164} {"train_loss": -40.588932037353516, "global_step": 140887, "epoch": 1164} {"train_loss": -41.22392654418945, "global_step": 140888, "epoch": 1164} {"train_loss": -39.6417350769043, "global_step": 140889, "epoch": 1164} {"train_loss": -41.1341552734375, "global_step": 140890, "epoch": 1164} {"train_loss": -41.08510971069336, "global_step": 140891, "epoch": 1164} {"train_loss": -41.29613494873047, "global_step": 140892, "epoch": 1164} {"train_loss": -41.25868606567383, "global_step": 140893, "epoch": 1164} {"train_loss": -40.666168212890625, "global_step": 140894, "epoch": 1164} {"train_loss": -41.0091552734375, "global_step": 140895, "epoch": 1164} {"train_loss": -41.36855697631836, "global_step": 140896, "epoch": 1164} {"train_loss": -40.73289108276367, "global_step": 140897, "epoch": 1164} {"train_loss": -41.22846603393555, "global_step": 140898, "epoch": 1164} {"train_loss": -41.14785385131836, "global_step": 140899, "epoch": 1164} {"train_loss": -39.829322814941406, "global_step": 140900, "epoch": 1164} {"train_loss": -41.510135650634766, "global_step": 140901, "epoch": 1164} {"train_loss": -41.68430709838867, "global_step": 140902, "epoch": 1164} {"train_loss": -41.508907318115234, "global_step": 140903, "epoch": 1164} {"train_loss": -41.10360336303711, "global_step": 140904, "epoch": 1164} {"train_loss": -41.63100814819336, "global_step": 140905, "epoch": 1164} {"train_loss": -40.979339599609375, "global_step": 140906, "epoch": 1164} {"train_loss": -41.44940948486328, "global_step": 140907, "epoch": 1164} {"train_loss": -41.13596725463867, "global_step": 140908, "epoch": 1164} {"train_loss": -41.45082092285156, "global_step": 140909, "epoch": 1164} {"train_loss": -41.20109176635742, "global_step": 140910, "epoch": 1164} {"train_loss": -41.236236572265625, "global_step": 140911, "epoch": 1164} {"train_loss": -41.08961868286133, "global_step": 140912, "epoch": 1164} {"train_loss": -40.884708404541016, "global_step": 140913, "epoch": 1164} {"train_loss": -40.81016159057617, "global_step": 140914, "epoch": 1164} {"train_loss": -40.08669662475586, "global_step": 140915, "epoch": 1164} {"train_loss": -40.67644500732422, "global_step": 140916, "epoch": 1164} {"train_loss": -40.523712158203125, "global_step": 140917, "epoch": 1164} {"train_loss": -40.76309585571289, "global_step": 140918, "epoch": 1164} {"train_loss": -40.77419662475586, "global_step": 140919, "epoch": 1164} {"train_loss": -40.592735290527344, "global_step": 140920, "epoch": 1164} {"train_loss": -41.124576568603516, "global_step": 140921, "epoch": 1164} {"train_loss": -40.082210540771484, "global_step": 140922, "epoch": 1164} {"train_loss": -41.747718811035156, "global_step": 140923, "epoch": 1164} {"train_loss": -41.67299270629883, "global_step": 140924, "epoch": 1164} {"train_loss": -41.317684173583984, "global_step": 140925, "epoch": 1164} {"train_loss": -41.36996078491211, "global_step": 140926, "epoch": 1164} {"train_loss": -41.70344924926758, "global_step": 140927, "epoch": 1164} {"train_loss": -40.83466339111328, "global_step": 140928, "epoch": 1164} {"train_loss": -40.408592224121094, "global_step": 140929, "epoch": 1164} {"train_loss": -41.74552536010742, "global_step": 140930, "epoch": 1164} {"train_loss": -41.92578887939453, "global_step": 140931, "epoch": 1164} {"train_loss": -40.983707427978516, "global_step": 140932, "epoch": 1164} {"train_loss": -39.12345504760742, "global_step": 140933, "epoch": 1164} {"train_loss": -36.626399993896484, "global_step": 140934, "epoch": 1164} {"train_loss": -36.57181930541992, "global_step": 140935, "epoch": 1164} {"train_loss": -29.229354858398438, "global_step": 140936, "epoch": 1164} {"train_loss": -40.466590881347656, "global_step": 140937, "epoch": 1164} {"train_loss": -32.47798538208008, "global_step": 140938, "epoch": 1164} {"train_loss": -34.395259857177734, "global_step": 140939, "epoch": 1164} {"train_loss": -33.71525192260742, "global_step": 140940, "epoch": 1164} {"train_loss": -31.838653564453125, "global_step": 140941, "epoch": 1164} {"train_loss": -27.38553237915039, "global_step": 140942, "epoch": 1164} {"train_loss": -27.432764053344727, "global_step": 140943, "epoch": 1164} {"train_loss": -34.71611404418945, "global_step": 140944, "epoch": 1164} {"train_loss": -32.70789337158203, "global_step": 140945, "epoch": 1164} {"train_loss": -28.099035263061523, "global_step": 140946, "epoch": 1164} {"train_loss": -31.526844024658203, "global_step": 140947, "epoch": 1164} {"train_loss": -30.631885528564453, "global_step": 140948, "epoch": 1164} {"train_loss": -36.5655517578125, "global_step": 140949, "epoch": 1164} {"train_loss": -29.361188888549805, "global_step": 140950, "epoch": 1164} {"train_loss": -29.772201538085938, "global_step": 140951, "epoch": 1164} {"train_loss": -31.88419532775879, "global_step": 140952, "epoch": 1164} {"train_loss": -30.05197525024414, "global_step": 140953, "epoch": 1164} {"train_loss": -33.560970306396484, "global_step": 140954, "epoch": 1164} {"train_loss": -32.510772705078125, "global_step": 140955, "epoch": 1164} {"train_loss": -32.679176330566406, "global_step": 140956, "epoch": 1164} {"train_loss": -33.468482971191406, "global_step": 140957, "epoch": 1164} {"train_loss": -34.831199645996094, "global_step": 140958, "epoch": 1164} {"train_loss": -35.57240676879883, "global_step": 140959, "epoch": 1164} {"train_loss": -37.75482940673828, "global_step": 140960, "epoch": 1164} {"train_loss": -36.62224197387695, "global_step": 140961, "epoch": 1164} {"train_loss": -36.63412857055664, "global_step": 140962, "epoch": 1164} {"train_loss": -35.934993743896484, "global_step": 140963, "epoch": 1164} {"train_loss": -38.40730506329497, "global_step": 140964, "epoch": 1164, "val_loss": 2717080.25} {"train_loss": -37.03725814819336, "global_step": 140965, "epoch": 1165} {"train_loss": -36.99629592895508, "global_step": 140966, "epoch": 1165} {"train_loss": -36.14882278442383, "global_step": 140967, "epoch": 1165} {"train_loss": -37.25090026855469, "global_step": 140968, "epoch": 1165} {"train_loss": -36.928016662597656, "global_step": 140969, "epoch": 1165} {"train_loss": -37.69057846069336, "global_step": 140970, "epoch": 1165} {"train_loss": -37.599544525146484, "global_step": 140971, "epoch": 1165} {"train_loss": -38.54722213745117, "global_step": 140972, "epoch": 1165} {"train_loss": -38.14273452758789, "global_step": 140973, "epoch": 1165} {"train_loss": -37.6566047668457, "global_step": 140974, "epoch": 1165} {"train_loss": -38.759071350097656, "global_step": 140975, "epoch": 1165} {"train_loss": -37.22284698486328, "global_step": 140976, "epoch": 1165} {"train_loss": -38.7767448425293, "global_step": 140977, "epoch": 1165} {"train_loss": -38.3637809753418, "global_step": 140978, "epoch": 1165} {"train_loss": -38.50065231323242, "global_step": 140979, "epoch": 1165} {"train_loss": -38.75038146972656, "global_step": 140980, "epoch": 1165} {"train_loss": -38.69707107543945, "global_step": 140981, "epoch": 1165} {"train_loss": -38.944374084472656, "global_step": 140982, "epoch": 1165} {"train_loss": -38.75965881347656, "global_step": 140983, "epoch": 1165} {"train_loss": -39.3212890625, "global_step": 140984, "epoch": 1165} {"train_loss": -37.99725341796875, "global_step": 140985, "epoch": 1165} {"train_loss": -39.228572845458984, "global_step": 140986, "epoch": 1165} {"train_loss": -39.482967376708984, "global_step": 140987, "epoch": 1165} {"train_loss": -39.495826721191406, "global_step": 140988, "epoch": 1165} {"train_loss": -38.96171188354492, "global_step": 140989, "epoch": 1165} {"train_loss": -39.79668045043945, "global_step": 140990, "epoch": 1165} {"train_loss": -39.60258102416992, "global_step": 140991, "epoch": 1165} {"train_loss": -39.58626937866211, "global_step": 140992, "epoch": 1165} {"train_loss": -40.02503204345703, "global_step": 140993, "epoch": 1165} {"train_loss": -39.37439727783203, "global_step": 140994, "epoch": 1165} {"train_loss": -38.76677322387695, "global_step": 140995, "epoch": 1165} {"train_loss": -39.52024459838867, "global_step": 140996, "epoch": 1165} {"train_loss": -40.008079528808594, "global_step": 140997, "epoch": 1165} {"train_loss": -39.93545913696289, "global_step": 140998, "epoch": 1165} {"train_loss": -40.03864669799805, "global_step": 140999, "epoch": 1165} {"train_loss": -39.77029037475586, "global_step": 141000, "epoch": 1165} {"train_loss": -40.369873046875, "global_step": 141001, "epoch": 1165} {"train_loss": -40.3326530456543, "global_step": 141002, "epoch": 1165} {"train_loss": -39.599395751953125, "global_step": 141003, "epoch": 1165} {"train_loss": -40.63166809082031, "global_step": 141004, "epoch": 1165} {"train_loss": -40.741390228271484, "global_step": 141005, "epoch": 1165} {"train_loss": -40.35831069946289, "global_step": 141006, "epoch": 1165} {"train_loss": -40.40446853637695, "global_step": 141007, "epoch": 1165} {"train_loss": -40.63673782348633, "global_step": 141008, "epoch": 1165} {"train_loss": -40.16778564453125, "global_step": 141009, "epoch": 1165} {"train_loss": -40.603511810302734, "global_step": 141010, "epoch": 1165} {"train_loss": -40.53487777709961, "global_step": 141011, "epoch": 1165} {"train_loss": -40.303035736083984, "global_step": 141012, "epoch": 1165} {"train_loss": -40.106571197509766, "global_step": 141013, "epoch": 1165} {"train_loss": -40.45033645629883, "global_step": 141014, "epoch": 1165} {"train_loss": -40.75809097290039, "global_step": 141015, "epoch": 1165} {"train_loss": -40.25019836425781, "global_step": 141016, "epoch": 1165} {"train_loss": -40.31624221801758, "global_step": 141017, "epoch": 1165} {"train_loss": -41.355018615722656, "global_step": 141018, "epoch": 1165} {"train_loss": -40.422889709472656, "global_step": 141019, "epoch": 1165} {"train_loss": -40.485748291015625, "global_step": 141020, "epoch": 1165} {"train_loss": -40.511592864990234, "global_step": 141021, "epoch": 1165} {"train_loss": -40.13971710205078, "global_step": 141022, "epoch": 1165} {"train_loss": -40.38564682006836, "global_step": 141023, "epoch": 1165} {"train_loss": -40.24833679199219, "global_step": 141024, "epoch": 1165} {"train_loss": -40.58606719970703, "global_step": 141025, "epoch": 1165} {"train_loss": -39.880958557128906, "global_step": 141026, "epoch": 1165} {"train_loss": -37.629817962646484, "global_step": 141027, "epoch": 1165} {"train_loss": -39.129730224609375, "global_step": 141028, "epoch": 1165} {"train_loss": -40.38283157348633, "global_step": 141029, "epoch": 1165} {"train_loss": -38.714599609375, "global_step": 141030, "epoch": 1165} {"train_loss": -38.82082748413086, "global_step": 141031, "epoch": 1165} {"train_loss": -38.8130989074707, "global_step": 141032, "epoch": 1165} {"train_loss": -40.749019622802734, "global_step": 141033, "epoch": 1165} {"train_loss": -40.32833480834961, "global_step": 141034, "epoch": 1165} {"train_loss": -39.415016174316406, "global_step": 141035, "epoch": 1165} {"train_loss": -38.963863372802734, "global_step": 141036, "epoch": 1165} {"train_loss": -40.4512825012207, "global_step": 141037, "epoch": 1165} {"train_loss": -40.05622863769531, "global_step": 141038, "epoch": 1165} {"train_loss": -40.566951751708984, "global_step": 141039, "epoch": 1165} {"train_loss": -40.14344024658203, "global_step": 141040, "epoch": 1165} {"train_loss": -40.59224319458008, "global_step": 141041, "epoch": 1165} {"train_loss": -39.96481704711914, "global_step": 141042, "epoch": 1165} {"train_loss": -39.297271728515625, "global_step": 141043, "epoch": 1165} {"train_loss": -37.02155685424805, "global_step": 141044, "epoch": 1165} {"train_loss": -38.44268798828125, "global_step": 141045, "epoch": 1165} {"train_loss": -38.78355026245117, "global_step": 141046, "epoch": 1165} {"train_loss": -37.22872543334961, "global_step": 141047, "epoch": 1165} {"train_loss": -38.2254753112793, "global_step": 141048, "epoch": 1165} {"train_loss": -40.14506149291992, "global_step": 141049, "epoch": 1165} {"train_loss": -38.79960250854492, "global_step": 141050, "epoch": 1165} {"train_loss": -39.115936279296875, "global_step": 141051, "epoch": 1165} {"train_loss": -38.65121078491211, "global_step": 141052, "epoch": 1165} {"train_loss": -38.1856803894043, "global_step": 141053, "epoch": 1165} {"train_loss": -39.16873550415039, "global_step": 141054, "epoch": 1165} {"train_loss": -40.550350189208984, "global_step": 141055, "epoch": 1165} {"train_loss": -39.51450729370117, "global_step": 141056, "epoch": 1165} {"train_loss": -38.3349494934082, "global_step": 141057, "epoch": 1165} {"train_loss": -40.194313049316406, "global_step": 141058, "epoch": 1165} {"train_loss": -39.86785888671875, "global_step": 141059, "epoch": 1165} {"train_loss": -39.57704544067383, "global_step": 141060, "epoch": 1165} {"train_loss": -40.2396125793457, "global_step": 141061, "epoch": 1165} {"train_loss": -40.085693359375, "global_step": 141062, "epoch": 1165} {"train_loss": -40.54069137573242, "global_step": 141063, "epoch": 1165} {"train_loss": -39.76362991333008, "global_step": 141064, "epoch": 1165} {"train_loss": -39.42829132080078, "global_step": 141065, "epoch": 1165} {"train_loss": -40.01713180541992, "global_step": 141066, "epoch": 1165} {"train_loss": -40.81943893432617, "global_step": 141067, "epoch": 1165} {"train_loss": -40.50429916381836, "global_step": 141068, "epoch": 1165} {"train_loss": -40.38669967651367, "global_step": 141069, "epoch": 1165} {"train_loss": -40.6317253112793, "global_step": 141070, "epoch": 1165} {"train_loss": -40.45125961303711, "global_step": 141071, "epoch": 1165} {"train_loss": -40.42388153076172, "global_step": 141072, "epoch": 1165} {"train_loss": -39.942771911621094, "global_step": 141073, "epoch": 1165} {"train_loss": -40.23429870605469, "global_step": 141074, "epoch": 1165} {"train_loss": -40.358924865722656, "global_step": 141075, "epoch": 1165} {"train_loss": -40.126808166503906, "global_step": 141076, "epoch": 1165} {"train_loss": -40.43181610107422, "global_step": 141077, "epoch": 1165} {"train_loss": -40.52315139770508, "global_step": 141078, "epoch": 1165} {"train_loss": -40.1920166015625, "global_step": 141079, "epoch": 1165} {"train_loss": -41.00132369995117, "global_step": 141080, "epoch": 1165} {"train_loss": -40.347267150878906, "global_step": 141081, "epoch": 1165} {"train_loss": -40.464969635009766, "global_step": 141082, "epoch": 1165} {"train_loss": -40.83107376098633, "global_step": 141083, "epoch": 1165} {"train_loss": -40.44802474975586, "global_step": 141084, "epoch": 1165} {"train_loss": -39.56500048676798, "global_step": 141085, "epoch": 1165, "val_loss": 2812080.0} {"train_loss": -40.6973762512207, "global_step": 141086, "epoch": 1166} {"train_loss": -39.84403991699219, "global_step": 141087, "epoch": 1166} {"train_loss": -39.443817138671875, "global_step": 141088, "epoch": 1166} {"train_loss": -36.803871154785156, "global_step": 141089, "epoch": 1166} {"train_loss": -38.8154182434082, "global_step": 141090, "epoch": 1166} {"train_loss": -40.90135192871094, "global_step": 141091, "epoch": 1166} {"train_loss": -35.78626251220703, "global_step": 141092, "epoch": 1166} {"train_loss": -39.95931625366211, "global_step": 141093, "epoch": 1166} {"train_loss": -34.4440803527832, "global_step": 141094, "epoch": 1166} {"train_loss": -39.00358200073242, "global_step": 141095, "epoch": 1166} {"train_loss": -35.17332077026367, "global_step": 141096, "epoch": 1166} {"train_loss": -35.500160217285156, "global_step": 141097, "epoch": 1166} {"train_loss": -39.536251068115234, "global_step": 141098, "epoch": 1166} {"train_loss": -36.01388168334961, "global_step": 141099, "epoch": 1166} {"train_loss": -39.025146484375, "global_step": 141100, "epoch": 1166} {"train_loss": -35.76831817626953, "global_step": 141101, "epoch": 1166} {"train_loss": -34.64716720581055, "global_step": 141102, "epoch": 1166} {"train_loss": -38.91168975830078, "global_step": 141103, "epoch": 1166} {"train_loss": -34.7674674987793, "global_step": 141104, "epoch": 1166} {"train_loss": -34.46189498901367, "global_step": 141105, "epoch": 1166} {"train_loss": -37.31553268432617, "global_step": 141106, "epoch": 1166} {"train_loss": -36.348506927490234, "global_step": 141107, "epoch": 1166} {"train_loss": -35.84172821044922, "global_step": 141108, "epoch": 1166} {"train_loss": -39.2603874206543, "global_step": 141109, "epoch": 1166} {"train_loss": -36.52766036987305, "global_step": 141110, "epoch": 1166} {"train_loss": -38.39386749267578, "global_step": 141111, "epoch": 1166} {"train_loss": -39.38631820678711, "global_step": 141112, "epoch": 1166} {"train_loss": -36.7961311340332, "global_step": 141113, "epoch": 1166} {"train_loss": -39.60792922973633, "global_step": 141114, "epoch": 1166} {"train_loss": -38.84162139892578, "global_step": 141115, "epoch": 1166} {"train_loss": -38.39542770385742, "global_step": 141116, "epoch": 1166} {"train_loss": -39.89246368408203, "global_step": 141117, "epoch": 1166} {"train_loss": -39.22660446166992, "global_step": 141118, "epoch": 1166} {"train_loss": -39.49967956542969, "global_step": 141119, "epoch": 1166} {"train_loss": -39.968238830566406, "global_step": 141120, "epoch": 1166} {"train_loss": -39.79716110229492, "global_step": 141121, "epoch": 1166} {"train_loss": -39.622764587402344, "global_step": 141122, "epoch": 1166} {"train_loss": -40.04090118408203, "global_step": 141123, "epoch": 1166} {"train_loss": -39.84601974487305, "global_step": 141124, "epoch": 1166} {"train_loss": -39.538475036621094, "global_step": 141125, "epoch": 1166} {"train_loss": -40.08768844604492, "global_step": 141126, "epoch": 1166} {"train_loss": -40.0565185546875, "global_step": 141127, "epoch": 1166} {"train_loss": -40.03441619873047, "global_step": 141128, "epoch": 1166} {"train_loss": -39.23360061645508, "global_step": 141129, "epoch": 1166} {"train_loss": -37.76070785522461, "global_step": 141130, "epoch": 1166} {"train_loss": -37.706031799316406, "global_step": 141131, "epoch": 1166} {"train_loss": -38.25117111206055, "global_step": 141132, "epoch": 1166} {"train_loss": -39.32622146606445, "global_step": 141133, "epoch": 1166} {"train_loss": -39.90695571899414, "global_step": 141134, "epoch": 1166} {"train_loss": -39.676788330078125, "global_step": 141135, "epoch": 1166} {"train_loss": -40.17208480834961, "global_step": 141136, "epoch": 1166} {"train_loss": -39.183990478515625, "global_step": 141137, "epoch": 1166} {"train_loss": -39.32456588745117, "global_step": 141138, "epoch": 1166} {"train_loss": -40.14982986450195, "global_step": 141139, "epoch": 1166} {"train_loss": -39.370033264160156, "global_step": 141140, "epoch": 1166} {"train_loss": -39.04194259643555, "global_step": 141141, "epoch": 1166} {"train_loss": -39.95981979370117, "global_step": 141142, "epoch": 1166} {"train_loss": -40.456417083740234, "global_step": 141143, "epoch": 1166} {"train_loss": -40.380184173583984, "global_step": 141144, "epoch": 1166} {"train_loss": -40.44325256347656, "global_step": 141145, "epoch": 1166} {"train_loss": -40.190940856933594, "global_step": 141146, "epoch": 1166} {"train_loss": -40.724735260009766, "global_step": 141147, "epoch": 1166} {"train_loss": -40.26759719848633, "global_step": 141148, "epoch": 1166} {"train_loss": -40.10738754272461, "global_step": 141149, "epoch": 1166} {"train_loss": -39.965980529785156, "global_step": 141150, "epoch": 1166} {"train_loss": -40.176292419433594, "global_step": 141151, "epoch": 1166} {"train_loss": -40.27484130859375, "global_step": 141152, "epoch": 1166} {"train_loss": -39.92873001098633, "global_step": 141153, "epoch": 1166} {"train_loss": -40.91341781616211, "global_step": 141154, "epoch": 1166} {"train_loss": -39.81301498413086, "global_step": 141155, "epoch": 1166} {"train_loss": -39.41665267944336, "global_step": 141156, "epoch": 1166} {"train_loss": -39.95298385620117, "global_step": 141157, "epoch": 1166} {"train_loss": -39.85988235473633, "global_step": 141158, "epoch": 1166} {"train_loss": -38.18031692504883, "global_step": 141159, "epoch": 1166} {"train_loss": -36.47935104370117, "global_step": 141160, "epoch": 1166} {"train_loss": -38.34744644165039, "global_step": 141161, "epoch": 1166} {"train_loss": -37.8160400390625, "global_step": 141162, "epoch": 1166} {"train_loss": -39.67660140991211, "global_step": 141163, "epoch": 1166} {"train_loss": -39.54940414428711, "global_step": 141164, "epoch": 1166} {"train_loss": -38.25864791870117, "global_step": 141165, "epoch": 1166} {"train_loss": -39.89157485961914, "global_step": 141166, "epoch": 1166} {"train_loss": -39.49409484863281, "global_step": 141167, "epoch": 1166} {"train_loss": -38.2336311340332, "global_step": 141168, "epoch": 1166} {"train_loss": -40.33161544799805, "global_step": 141169, "epoch": 1166} {"train_loss": -40.38125228881836, "global_step": 141170, "epoch": 1166} {"train_loss": -38.02052688598633, "global_step": 141171, "epoch": 1166} {"train_loss": -38.17308044433594, "global_step": 141172, "epoch": 1166} {"train_loss": -40.5238151550293, "global_step": 141173, "epoch": 1166} {"train_loss": -40.78908157348633, "global_step": 141174, "epoch": 1166} {"train_loss": -39.76393508911133, "global_step": 141175, "epoch": 1166} {"train_loss": -40.270137786865234, "global_step": 141176, "epoch": 1166} {"train_loss": -40.69826889038086, "global_step": 141177, "epoch": 1166} {"train_loss": -40.65907669067383, "global_step": 141178, "epoch": 1166} {"train_loss": -40.5139045715332, "global_step": 141179, "epoch": 1166} {"train_loss": -40.749549865722656, "global_step": 141180, "epoch": 1166} {"train_loss": -40.76527786254883, "global_step": 141181, "epoch": 1166} {"train_loss": -40.43192672729492, "global_step": 141182, "epoch": 1166} {"train_loss": -40.237037658691406, "global_step": 141183, "epoch": 1166} {"train_loss": -40.05660629272461, "global_step": 141184, "epoch": 1166} {"train_loss": -39.97661209106445, "global_step": 141185, "epoch": 1166} {"train_loss": -39.501991271972656, "global_step": 141186, "epoch": 1166} {"train_loss": -39.400718688964844, "global_step": 141187, "epoch": 1166} {"train_loss": -40.087646484375, "global_step": 141188, "epoch": 1166} {"train_loss": -40.95145797729492, "global_step": 141189, "epoch": 1166} {"train_loss": -39.809417724609375, "global_step": 141190, "epoch": 1166} {"train_loss": -38.289798736572266, "global_step": 141191, "epoch": 1166} {"train_loss": -39.3946418762207, "global_step": 141192, "epoch": 1166} {"train_loss": -40.83220291137695, "global_step": 141193, "epoch": 1166} {"train_loss": -40.52008819580078, "global_step": 141194, "epoch": 1166} {"train_loss": -39.3763542175293, "global_step": 141195, "epoch": 1166} {"train_loss": -39.901641845703125, "global_step": 141196, "epoch": 1166} {"train_loss": -40.147823333740234, "global_step": 141197, "epoch": 1166} {"train_loss": -39.10638427734375, "global_step": 141198, "epoch": 1166} {"train_loss": -39.70217514038086, "global_step": 141199, "epoch": 1166} {"train_loss": -39.753597259521484, "global_step": 141200, "epoch": 1166} {"train_loss": -40.225494384765625, "global_step": 141201, "epoch": 1166} {"train_loss": -40.336666107177734, "global_step": 141202, "epoch": 1166} {"train_loss": -39.570892333984375, "global_step": 141203, "epoch": 1166} {"train_loss": -39.587379455566406, "global_step": 141204, "epoch": 1166} {"train_loss": -39.64860153198242, "global_step": 141205, "epoch": 1166} {"train_loss": -39.170819589914366, "global_step": 141206, "epoch": 1166, "val_loss": 2685931.75} {"train_loss": -40.34648132324219, "global_step": 141207, "epoch": 1167} {"train_loss": -40.2446403503418, "global_step": 141208, "epoch": 1167} {"train_loss": -39.9932975769043, "global_step": 141209, "epoch": 1167} {"train_loss": -39.757484436035156, "global_step": 141210, "epoch": 1167} {"train_loss": -40.85524368286133, "global_step": 141211, "epoch": 1167} {"train_loss": -39.707759857177734, "global_step": 141212, "epoch": 1167} {"train_loss": -38.584861755371094, "global_step": 141213, "epoch": 1167} {"train_loss": -40.88862228393555, "global_step": 141214, "epoch": 1167} {"train_loss": -39.641029357910156, "global_step": 141215, "epoch": 1167} {"train_loss": -39.156490325927734, "global_step": 141216, "epoch": 1167} {"train_loss": -40.49006271362305, "global_step": 141217, "epoch": 1167} {"train_loss": -40.37294006347656, "global_step": 141218, "epoch": 1167} {"train_loss": -38.23121643066406, "global_step": 141219, "epoch": 1167} {"train_loss": -39.0382194519043, "global_step": 141220, "epoch": 1167} {"train_loss": -38.37838363647461, "global_step": 141221, "epoch": 1167} {"train_loss": -36.55811309814453, "global_step": 141222, "epoch": 1167} {"train_loss": -39.89373779296875, "global_step": 141223, "epoch": 1167} {"train_loss": -39.19672393798828, "global_step": 141224, "epoch": 1167} {"train_loss": -38.12856674194336, "global_step": 141225, "epoch": 1167} {"train_loss": -39.57660675048828, "global_step": 141226, "epoch": 1167} {"train_loss": -39.51320266723633, "global_step": 141227, "epoch": 1167} {"train_loss": -38.18636703491211, "global_step": 141228, "epoch": 1167} {"train_loss": -38.25283432006836, "global_step": 141229, "epoch": 1167} {"train_loss": -39.38611602783203, "global_step": 141230, "epoch": 1167} {"train_loss": -36.940467834472656, "global_step": 141231, "epoch": 1167} {"train_loss": -39.89224624633789, "global_step": 141232, "epoch": 1167} {"train_loss": -37.486785888671875, "global_step": 141233, "epoch": 1167} {"train_loss": -39.2059211730957, "global_step": 141234, "epoch": 1167} {"train_loss": -38.46559524536133, "global_step": 141235, "epoch": 1167} {"train_loss": -39.272762298583984, "global_step": 141236, "epoch": 1167} {"train_loss": -36.845787048339844, "global_step": 141237, "epoch": 1167} {"train_loss": -40.52132797241211, "global_step": 141238, "epoch": 1167} {"train_loss": -35.38298416137695, "global_step": 141239, "epoch": 1167} {"train_loss": -40.49843215942383, "global_step": 141240, "epoch": 1167} {"train_loss": -38.004268646240234, "global_step": 141241, "epoch": 1167} {"train_loss": -37.67367172241211, "global_step": 141242, "epoch": 1167} {"train_loss": -40.40644454956055, "global_step": 141243, "epoch": 1167} {"train_loss": -36.61505889892578, "global_step": 141244, "epoch": 1167} {"train_loss": -38.44088363647461, "global_step": 141245, "epoch": 1167} {"train_loss": -40.089111328125, "global_step": 141246, "epoch": 1167} {"train_loss": -38.069366455078125, "global_step": 141247, "epoch": 1167} {"train_loss": -37.3321533203125, "global_step": 141248, "epoch": 1167} {"train_loss": -40.733306884765625, "global_step": 141249, "epoch": 1167} {"train_loss": -36.85871124267578, "global_step": 141250, "epoch": 1167} {"train_loss": -38.08509826660156, "global_step": 141251, "epoch": 1167} {"train_loss": -40.005775451660156, "global_step": 141252, "epoch": 1167} {"train_loss": -39.299617767333984, "global_step": 141253, "epoch": 1167} {"train_loss": -38.48163986206055, "global_step": 141254, "epoch": 1167} {"train_loss": -37.37944412231445, "global_step": 141255, "epoch": 1167} {"train_loss": -40.08924102783203, "global_step": 141256, "epoch": 1167} {"train_loss": -39.43907928466797, "global_step": 141257, "epoch": 1167} {"train_loss": -39.26231002807617, "global_step": 141258, "epoch": 1167} {"train_loss": -38.883056640625, "global_step": 141259, "epoch": 1167} {"train_loss": -40.5204963684082, "global_step": 141260, "epoch": 1167} {"train_loss": -39.563995361328125, "global_step": 141261, "epoch": 1167} {"train_loss": -40.426815032958984, "global_step": 141262, "epoch": 1167} {"train_loss": -40.13777160644531, "global_step": 141263, "epoch": 1167} {"train_loss": -39.12177276611328, "global_step": 141264, "epoch": 1167} {"train_loss": -40.034034729003906, "global_step": 141265, "epoch": 1167} {"train_loss": -39.778377532958984, "global_step": 141266, "epoch": 1167} {"train_loss": -40.51121139526367, "global_step": 141267, "epoch": 1167} {"train_loss": -40.8235969543457, "global_step": 141268, "epoch": 1167} {"train_loss": -40.1282844543457, "global_step": 141269, "epoch": 1167} {"train_loss": -40.09592819213867, "global_step": 141270, "epoch": 1167} {"train_loss": -40.32088851928711, "global_step": 141271, "epoch": 1167} {"train_loss": -40.50152587890625, "global_step": 141272, "epoch": 1167} {"train_loss": -40.01976013183594, "global_step": 141273, "epoch": 1167} {"train_loss": -40.27539825439453, "global_step": 141274, "epoch": 1167} {"train_loss": -40.713199615478516, "global_step": 141275, "epoch": 1167} {"train_loss": -39.80615234375, "global_step": 141276, "epoch": 1167} {"train_loss": -40.54325485229492, "global_step": 141277, "epoch": 1167} {"train_loss": -40.90155029296875, "global_step": 141278, "epoch": 1167} {"train_loss": -39.163917541503906, "global_step": 141279, "epoch": 1167} {"train_loss": -40.0775260925293, "global_step": 141280, "epoch": 1167} {"train_loss": -40.53282928466797, "global_step": 141281, "epoch": 1167} {"train_loss": -39.79159164428711, "global_step": 141282, "epoch": 1167} {"train_loss": -40.72808837890625, "global_step": 141283, "epoch": 1167} {"train_loss": -40.224361419677734, "global_step": 141284, "epoch": 1167} {"train_loss": -40.08506393432617, "global_step": 141285, "epoch": 1167} {"train_loss": -40.797943115234375, "global_step": 141286, "epoch": 1167} {"train_loss": -39.61137771606445, "global_step": 141287, "epoch": 1167} {"train_loss": -39.641326904296875, "global_step": 141288, "epoch": 1167} {"train_loss": -37.8698844909668, "global_step": 141289, "epoch": 1167} {"train_loss": -38.34751510620117, "global_step": 141290, "epoch": 1167} {"train_loss": -38.8553581237793, "global_step": 141291, "epoch": 1167} {"train_loss": -38.92731857299805, "global_step": 141292, "epoch": 1167} {"train_loss": -40.4444465637207, "global_step": 141293, "epoch": 1167} {"train_loss": -40.61888122558594, "global_step": 141294, "epoch": 1167} {"train_loss": -39.235145568847656, "global_step": 141295, "epoch": 1167} {"train_loss": -39.74936294555664, "global_step": 141296, "epoch": 1167} {"train_loss": -40.76731491088867, "global_step": 141297, "epoch": 1167} {"train_loss": -40.811431884765625, "global_step": 141298, "epoch": 1167} {"train_loss": -40.37392044067383, "global_step": 141299, "epoch": 1167} {"train_loss": -40.91511917114258, "global_step": 141300, "epoch": 1167} {"train_loss": -40.773006439208984, "global_step": 141301, "epoch": 1167} {"train_loss": -41.238555908203125, "global_step": 141302, "epoch": 1167} {"train_loss": -41.21343231201172, "global_step": 141303, "epoch": 1167} {"train_loss": -40.00736999511719, "global_step": 141304, "epoch": 1167} {"train_loss": -40.70859909057617, "global_step": 141305, "epoch": 1167} {"train_loss": -40.6469612121582, "global_step": 141306, "epoch": 1167} {"train_loss": -40.24117660522461, "global_step": 141307, "epoch": 1167} {"train_loss": -41.07546615600586, "global_step": 141308, "epoch": 1167} {"train_loss": -41.153717041015625, "global_step": 141309, "epoch": 1167} {"train_loss": -41.4001350402832, "global_step": 141310, "epoch": 1167} {"train_loss": -41.0506706237793, "global_step": 141311, "epoch": 1167} {"train_loss": -41.38975143432617, "global_step": 141312, "epoch": 1167} {"train_loss": -41.42928695678711, "global_step": 141313, "epoch": 1167} {"train_loss": -40.82521438598633, "global_step": 141314, "epoch": 1167} {"train_loss": -41.12775421142578, "global_step": 141315, "epoch": 1167} {"train_loss": -41.41294479370117, "global_step": 141316, "epoch": 1167} {"train_loss": -41.07352066040039, "global_step": 141317, "epoch": 1167} {"train_loss": -41.5484619140625, "global_step": 141318, "epoch": 1167} {"train_loss": -41.6157341003418, "global_step": 141319, "epoch": 1167} {"train_loss": -41.321434020996094, "global_step": 141320, "epoch": 1167} {"train_loss": -41.28022003173828, "global_step": 141321, "epoch": 1167} {"train_loss": -41.23439407348633, "global_step": 141322, "epoch": 1167} {"train_loss": -41.387237548828125, "global_step": 141323, "epoch": 1167} {"train_loss": -41.246150970458984, "global_step": 141324, "epoch": 1167} {"train_loss": -41.23176574707031, "global_step": 141325, "epoch": 1167} {"train_loss": -41.1151008605957, "global_step": 141326, "epoch": 1167} {"train_loss": -39.79990276620408, "global_step": 141327, "epoch": 1167, "val_loss": 2727833.75} {"train_loss": -40.99760055541992, "global_step": 141328, "epoch": 1168} {"train_loss": -40.76787567138672, "global_step": 141329, "epoch": 1168} {"train_loss": -40.42082595825195, "global_step": 141330, "epoch": 1168} {"train_loss": -40.86082077026367, "global_step": 141331, "epoch": 1168} {"train_loss": -40.91859817504883, "global_step": 141332, "epoch": 1168} {"train_loss": -41.36347579956055, "global_step": 141333, "epoch": 1168} {"train_loss": -41.5798225402832, "global_step": 141334, "epoch": 1168} {"train_loss": -40.93571472167969, "global_step": 141335, "epoch": 1168} {"train_loss": -41.767250061035156, "global_step": 141336, "epoch": 1168} {"train_loss": -41.04152297973633, "global_step": 141337, "epoch": 1168} {"train_loss": -39.904605865478516, "global_step": 141338, "epoch": 1168} {"train_loss": -39.9281120300293, "global_step": 141339, "epoch": 1168} {"train_loss": -38.601619720458984, "global_step": 141340, "epoch": 1168} {"train_loss": -37.45864486694336, "global_step": 141341, "epoch": 1168} {"train_loss": -39.187538146972656, "global_step": 141342, "epoch": 1168} {"train_loss": -40.353267669677734, "global_step": 141343, "epoch": 1168} {"train_loss": -39.69145965576172, "global_step": 141344, "epoch": 1168} {"train_loss": -40.70301055908203, "global_step": 141345, "epoch": 1168} {"train_loss": -40.32969284057617, "global_step": 141346, "epoch": 1168} {"train_loss": -38.084590911865234, "global_step": 141347, "epoch": 1168} {"train_loss": -39.90638732910156, "global_step": 141348, "epoch": 1168} {"train_loss": -40.619606018066406, "global_step": 141349, "epoch": 1168} {"train_loss": -39.74856185913086, "global_step": 141350, "epoch": 1168} {"train_loss": -39.43412399291992, "global_step": 141351, "epoch": 1168} {"train_loss": -38.92840576171875, "global_step": 141352, "epoch": 1168} {"train_loss": -40.88408660888672, "global_step": 141353, "epoch": 1168} {"train_loss": -41.43905258178711, "global_step": 141354, "epoch": 1168} {"train_loss": -40.90816116333008, "global_step": 141355, "epoch": 1168} {"train_loss": -39.856544494628906, "global_step": 141356, "epoch": 1168} {"train_loss": -39.6650505065918, "global_step": 141357, "epoch": 1168} {"train_loss": -40.78727722167969, "global_step": 141358, "epoch": 1168} {"train_loss": -40.10222244262695, "global_step": 141359, "epoch": 1168} {"train_loss": -39.13588333129883, "global_step": 141360, "epoch": 1168} {"train_loss": -40.6413459777832, "global_step": 141361, "epoch": 1168} {"train_loss": -40.29194259643555, "global_step": 141362, "epoch": 1168} {"train_loss": -38.19165802001953, "global_step": 141363, "epoch": 1168} {"train_loss": -39.520263671875, "global_step": 141364, "epoch": 1168} {"train_loss": -39.8338508605957, "global_step": 141365, "epoch": 1168} {"train_loss": -40.00380325317383, "global_step": 141366, "epoch": 1168} {"train_loss": -39.73127746582031, "global_step": 141367, "epoch": 1168} {"train_loss": -39.36259078979492, "global_step": 141368, "epoch": 1168} {"train_loss": -39.49924850463867, "global_step": 141369, "epoch": 1168} {"train_loss": -40.04299545288086, "global_step": 141370, "epoch": 1168} {"train_loss": -39.559600830078125, "global_step": 141371, "epoch": 1168} {"train_loss": -40.109840393066406, "global_step": 141372, "epoch": 1168} {"train_loss": -40.7705192565918, "global_step": 141373, "epoch": 1168} {"train_loss": -39.5847282409668, "global_step": 141374, "epoch": 1168} {"train_loss": -38.86606979370117, "global_step": 141375, "epoch": 1168} {"train_loss": -39.777435302734375, "global_step": 141376, "epoch": 1168} {"train_loss": -39.49910354614258, "global_step": 141377, "epoch": 1168} {"train_loss": -39.27737045288086, "global_step": 141378, "epoch": 1168} {"train_loss": -40.41090774536133, "global_step": 141379, "epoch": 1168} {"train_loss": -40.650978088378906, "global_step": 141380, "epoch": 1168} {"train_loss": -39.85348892211914, "global_step": 141381, "epoch": 1168} {"train_loss": -40.918212890625, "global_step": 141382, "epoch": 1168} {"train_loss": -39.914302825927734, "global_step": 141383, "epoch": 1168} {"train_loss": -39.62834167480469, "global_step": 141384, "epoch": 1168} {"train_loss": -40.3820686340332, "global_step": 141385, "epoch": 1168} {"train_loss": -40.63238525390625, "global_step": 141386, "epoch": 1168} {"train_loss": -40.97880172729492, "global_step": 141387, "epoch": 1168} {"train_loss": -40.15531539916992, "global_step": 141388, "epoch": 1168} {"train_loss": -40.785518646240234, "global_step": 141389, "epoch": 1168} {"train_loss": -40.047332763671875, "global_step": 141390, "epoch": 1168} {"train_loss": -39.27994155883789, "global_step": 141391, "epoch": 1168} {"train_loss": -41.008724212646484, "global_step": 141392, "epoch": 1168} {"train_loss": -40.44765090942383, "global_step": 141393, "epoch": 1168} {"train_loss": -39.45221710205078, "global_step": 141394, "epoch": 1168} {"train_loss": -40.822265625, "global_step": 141395, "epoch": 1168} {"train_loss": -39.343994140625, "global_step": 141396, "epoch": 1168} {"train_loss": -39.221885681152344, "global_step": 141397, "epoch": 1168} {"train_loss": -38.55610656738281, "global_step": 141398, "epoch": 1168} {"train_loss": -38.567169189453125, "global_step": 141399, "epoch": 1168} {"train_loss": -41.03273391723633, "global_step": 141400, "epoch": 1168} {"train_loss": -39.64274978637695, "global_step": 141401, "epoch": 1168} {"train_loss": -39.25394058227539, "global_step": 141402, "epoch": 1168} {"train_loss": -39.82915496826172, "global_step": 141403, "epoch": 1168} {"train_loss": -39.384822845458984, "global_step": 141404, "epoch": 1168} {"train_loss": -40.34679412841797, "global_step": 141405, "epoch": 1168} {"train_loss": -40.043697357177734, "global_step": 141406, "epoch": 1168} {"train_loss": -39.94235610961914, "global_step": 141407, "epoch": 1168} {"train_loss": -41.43764877319336, "global_step": 141408, "epoch": 1168} {"train_loss": -41.038814544677734, "global_step": 141409, "epoch": 1168} {"train_loss": -40.45326614379883, "global_step": 141410, "epoch": 1168} {"train_loss": -39.955657958984375, "global_step": 141411, "epoch": 1168} {"train_loss": -40.18137741088867, "global_step": 141412, "epoch": 1168} {"train_loss": -39.92507553100586, "global_step": 141413, "epoch": 1168} {"train_loss": -39.13076400756836, "global_step": 141414, "epoch": 1168} {"train_loss": -40.944679260253906, "global_step": 141415, "epoch": 1168} {"train_loss": -40.065513610839844, "global_step": 141416, "epoch": 1168} {"train_loss": -40.62080001831055, "global_step": 141417, "epoch": 1168} {"train_loss": -40.49165725708008, "global_step": 141418, "epoch": 1168} {"train_loss": -40.51053237915039, "global_step": 141419, "epoch": 1168} {"train_loss": -40.73621368408203, "global_step": 141420, "epoch": 1168} {"train_loss": -40.14222717285156, "global_step": 141421, "epoch": 1168} {"train_loss": -40.731040954589844, "global_step": 141422, "epoch": 1168} {"train_loss": -40.049766540527344, "global_step": 141423, "epoch": 1168} {"train_loss": -39.758846282958984, "global_step": 141424, "epoch": 1168} {"train_loss": -41.14929962158203, "global_step": 141425, "epoch": 1168} {"train_loss": -40.412635803222656, "global_step": 141426, "epoch": 1168} {"train_loss": -40.512413024902344, "global_step": 141427, "epoch": 1168} {"train_loss": -39.936397552490234, "global_step": 141428, "epoch": 1168} {"train_loss": -40.81536865234375, "global_step": 141429, "epoch": 1168} {"train_loss": -40.47168731689453, "global_step": 141430, "epoch": 1168} {"train_loss": -40.45621109008789, "global_step": 141431, "epoch": 1168} {"train_loss": -40.35898971557617, "global_step": 141432, "epoch": 1168} {"train_loss": -40.75789260864258, "global_step": 141433, "epoch": 1168} {"train_loss": -41.20537185668945, "global_step": 141434, "epoch": 1168} {"train_loss": -39.27352523803711, "global_step": 141435, "epoch": 1168} {"train_loss": -40.03215789794922, "global_step": 141436, "epoch": 1168} {"train_loss": -41.124412536621094, "global_step": 141437, "epoch": 1168} {"train_loss": -40.503875732421875, "global_step": 141438, "epoch": 1168} {"train_loss": -40.0801887512207, "global_step": 141439, "epoch": 1168} {"train_loss": -40.894195556640625, "global_step": 141440, "epoch": 1168} {"train_loss": -40.88835525512695, "global_step": 141441, "epoch": 1168} {"train_loss": -40.57040023803711, "global_step": 141442, "epoch": 1168} {"train_loss": -41.021575927734375, "global_step": 141443, "epoch": 1168} {"train_loss": -40.69422149658203, "global_step": 141444, "epoch": 1168} {"train_loss": -39.63410949707031, "global_step": 141445, "epoch": 1168} {"train_loss": -40.43596267700195, "global_step": 141446, "epoch": 1168} {"train_loss": -40.569091796875, "global_step": 141447, "epoch": 1168} {"train_loss": -40.168383637735666, "global_step": 141448, "epoch": 1168, "val_loss": 2642502.25} {"train_loss": -39.95176315307617, "global_step": 141449, "epoch": 1169} {"train_loss": -41.07554244995117, "global_step": 141450, "epoch": 1169} {"train_loss": -40.76801681518555, "global_step": 141451, "epoch": 1169} {"train_loss": -40.76496124267578, "global_step": 141452, "epoch": 1169} {"train_loss": -40.08441162109375, "global_step": 141453, "epoch": 1169} {"train_loss": -40.019195556640625, "global_step": 141454, "epoch": 1169} {"train_loss": -39.87659454345703, "global_step": 141455, "epoch": 1169} {"train_loss": -40.559383392333984, "global_step": 141456, "epoch": 1169} {"train_loss": -40.6384391784668, "global_step": 141457, "epoch": 1169} {"train_loss": -39.413841247558594, "global_step": 141458, "epoch": 1169} {"train_loss": -38.4994010925293, "global_step": 141459, "epoch": 1169} {"train_loss": -40.00605392456055, "global_step": 141460, "epoch": 1169} {"train_loss": -40.223873138427734, "global_step": 141461, "epoch": 1169} {"train_loss": -40.924171447753906, "global_step": 141462, "epoch": 1169} {"train_loss": -40.54444122314453, "global_step": 141463, "epoch": 1169} {"train_loss": -39.786842346191406, "global_step": 141464, "epoch": 1169} {"train_loss": -41.03120803833008, "global_step": 141465, "epoch": 1169} {"train_loss": -40.938751220703125, "global_step": 141466, "epoch": 1169} {"train_loss": -40.624122619628906, "global_step": 141467, "epoch": 1169} {"train_loss": -39.8144645690918, "global_step": 141468, "epoch": 1169} {"train_loss": -39.78647232055664, "global_step": 141469, "epoch": 1169} {"train_loss": -41.2051887512207, "global_step": 141470, "epoch": 1169} {"train_loss": -41.02238464355469, "global_step": 141471, "epoch": 1169} {"train_loss": -40.1912841796875, "global_step": 141472, "epoch": 1169} {"train_loss": -41.0285758972168, "global_step": 141473, "epoch": 1169} {"train_loss": -41.085060119628906, "global_step": 141474, "epoch": 1169} {"train_loss": -40.761512756347656, "global_step": 141475, "epoch": 1169} {"train_loss": -40.98268508911133, "global_step": 141476, "epoch": 1169} {"train_loss": -41.28483963012695, "global_step": 141477, "epoch": 1169} {"train_loss": -41.19474792480469, "global_step": 141478, "epoch": 1169} {"train_loss": -41.242042541503906, "global_step": 141479, "epoch": 1169} {"train_loss": -40.931819915771484, "global_step": 141480, "epoch": 1169} {"train_loss": -41.33671188354492, "global_step": 141481, "epoch": 1169} {"train_loss": -41.38630294799805, "global_step": 141482, "epoch": 1169} {"train_loss": -41.019325256347656, "global_step": 141483, "epoch": 1169} {"train_loss": -41.378658294677734, "global_step": 141484, "epoch": 1169} {"train_loss": -41.88251495361328, "global_step": 141485, "epoch": 1169} {"train_loss": -40.81229782104492, "global_step": 141486, "epoch": 1169} {"train_loss": -40.87178421020508, "global_step": 141487, "epoch": 1169} {"train_loss": -41.45756149291992, "global_step": 141488, "epoch": 1169} {"train_loss": -41.69401550292969, "global_step": 141489, "epoch": 1169} {"train_loss": -41.229976654052734, "global_step": 141490, "epoch": 1169} {"train_loss": -41.18214416503906, "global_step": 141491, "epoch": 1169} {"train_loss": -40.56531524658203, "global_step": 141492, "epoch": 1169} {"train_loss": -39.47468185424805, "global_step": 141493, "epoch": 1169} {"train_loss": -39.57756042480469, "global_step": 141494, "epoch": 1169} {"train_loss": -38.251564025878906, "global_step": 141495, "epoch": 1169} {"train_loss": -34.77170181274414, "global_step": 141496, "epoch": 1169} {"train_loss": -35.67806625366211, "global_step": 141497, "epoch": 1169} {"train_loss": -35.9560546875, "global_step": 141498, "epoch": 1169} {"train_loss": -36.4056282043457, "global_step": 141499, "epoch": 1169} {"train_loss": -36.50751876831055, "global_step": 141500, "epoch": 1169} {"train_loss": -35.92279052734375, "global_step": 141501, "epoch": 1169} {"train_loss": -36.47568893432617, "global_step": 141502, "epoch": 1169} {"train_loss": -35.531166076660156, "global_step": 141503, "epoch": 1169} {"train_loss": -36.9515495300293, "global_step": 141504, "epoch": 1169} {"train_loss": -37.21269607543945, "global_step": 141505, "epoch": 1169} {"train_loss": -38.77119064331055, "global_step": 141506, "epoch": 1169} {"train_loss": -38.8262939453125, "global_step": 141507, "epoch": 1169} {"train_loss": -39.23889923095703, "global_step": 141508, "epoch": 1169} {"train_loss": -38.584991455078125, "global_step": 141509, "epoch": 1169} {"train_loss": -39.175758361816406, "global_step": 141510, "epoch": 1169} {"train_loss": -38.790985107421875, "global_step": 141511, "epoch": 1169} {"train_loss": -38.93850326538086, "global_step": 141512, "epoch": 1169} {"train_loss": -38.76335144042969, "global_step": 141513, "epoch": 1169} {"train_loss": -40.024330139160156, "global_step": 141514, "epoch": 1169} {"train_loss": -38.48736572265625, "global_step": 141515, "epoch": 1169} {"train_loss": -39.9625244140625, "global_step": 141516, "epoch": 1169} {"train_loss": -38.89071273803711, "global_step": 141517, "epoch": 1169} {"train_loss": -40.10535430908203, "global_step": 141518, "epoch": 1169} {"train_loss": -39.6329460144043, "global_step": 141519, "epoch": 1169} {"train_loss": -39.19936752319336, "global_step": 141520, "epoch": 1169} {"train_loss": -39.39533615112305, "global_step": 141521, "epoch": 1169} {"train_loss": -39.51212692260742, "global_step": 141522, "epoch": 1169} {"train_loss": -40.474849700927734, "global_step": 141523, "epoch": 1169} {"train_loss": -39.3972282409668, "global_step": 141524, "epoch": 1169} {"train_loss": -39.47475051879883, "global_step": 141525, "epoch": 1169} {"train_loss": -39.162601470947266, "global_step": 141526, "epoch": 1169} {"train_loss": -40.567726135253906, "global_step": 141527, "epoch": 1169} {"train_loss": -40.04996871948242, "global_step": 141528, "epoch": 1169} {"train_loss": -39.698753356933594, "global_step": 141529, "epoch": 1169} {"train_loss": -38.94498825073242, "global_step": 141530, "epoch": 1169} {"train_loss": -40.45095443725586, "global_step": 141531, "epoch": 1169} {"train_loss": -40.62152099609375, "global_step": 141532, "epoch": 1169} {"train_loss": -40.3644905090332, "global_step": 141533, "epoch": 1169} {"train_loss": -40.362335205078125, "global_step": 141534, "epoch": 1169} {"train_loss": -40.39420700073242, "global_step": 141535, "epoch": 1169} {"train_loss": -40.9062385559082, "global_step": 141536, "epoch": 1169} {"train_loss": -40.03707504272461, "global_step": 141537, "epoch": 1169} {"train_loss": -40.82737350463867, "global_step": 141538, "epoch": 1169} {"train_loss": -41.255313873291016, "global_step": 141539, "epoch": 1169} {"train_loss": -40.81513214111328, "global_step": 141540, "epoch": 1169} {"train_loss": -41.34907150268555, "global_step": 141541, "epoch": 1169} {"train_loss": -41.45158004760742, "global_step": 141542, "epoch": 1169} {"train_loss": -41.36989212036133, "global_step": 141543, "epoch": 1169} {"train_loss": -41.223548889160156, "global_step": 141544, "epoch": 1169} {"train_loss": -41.27108383178711, "global_step": 141545, "epoch": 1169} {"train_loss": -41.47026062011719, "global_step": 141546, "epoch": 1169} {"train_loss": -41.63946533203125, "global_step": 141547, "epoch": 1169} {"train_loss": -41.30290603637695, "global_step": 141548, "epoch": 1169} {"train_loss": -41.22941970825195, "global_step": 141549, "epoch": 1169} {"train_loss": -40.6575813293457, "global_step": 141550, "epoch": 1169} {"train_loss": -40.17095947265625, "global_step": 141551, "epoch": 1169} {"train_loss": -39.95875930786133, "global_step": 141552, "epoch": 1169} {"train_loss": -41.14386749267578, "global_step": 141553, "epoch": 1169} {"train_loss": -41.45136642456055, "global_step": 141554, "epoch": 1169} {"train_loss": -41.17108154296875, "global_step": 141555, "epoch": 1169} {"train_loss": -40.15339279174805, "global_step": 141556, "epoch": 1169} {"train_loss": -38.95845031738281, "global_step": 141557, "epoch": 1169} {"train_loss": -39.95656204223633, "global_step": 141558, "epoch": 1169} {"train_loss": -40.928585052490234, "global_step": 141559, "epoch": 1169} {"train_loss": -41.15309143066406, "global_step": 141560, "epoch": 1169} {"train_loss": -39.925048828125, "global_step": 141561, "epoch": 1169} {"train_loss": -39.67975997924805, "global_step": 141562, "epoch": 1169} {"train_loss": -39.96659469604492, "global_step": 141563, "epoch": 1169} {"train_loss": -40.39691162109375, "global_step": 141564, "epoch": 1169} {"train_loss": -40.22869873046875, "global_step": 141565, "epoch": 1169} {"train_loss": -39.4519157409668, "global_step": 141566, "epoch": 1169} {"train_loss": -40.10246658325195, "global_step": 141567, "epoch": 1169} {"train_loss": -41.328216552734375, "global_step": 141568, "epoch": 1169} {"train_loss": -39.99654817187096, "global_step": 141569, "epoch": 1169, "val_loss": 2734201.0} {"train_loss": -39.60243606567383, "global_step": 141570, "epoch": 1170} {"train_loss": -40.563148498535156, "global_step": 141571, "epoch": 1170} {"train_loss": -40.930728912353516, "global_step": 141572, "epoch": 1170} {"train_loss": -41.16835021972656, "global_step": 141573, "epoch": 1170} {"train_loss": -41.405181884765625, "global_step": 141574, "epoch": 1170} {"train_loss": -41.288421630859375, "global_step": 141575, "epoch": 1170} {"train_loss": -41.269081115722656, "global_step": 141576, "epoch": 1170} {"train_loss": -41.31368637084961, "global_step": 141577, "epoch": 1170} {"train_loss": -40.082881927490234, "global_step": 141578, "epoch": 1170} {"train_loss": -40.33657455444336, "global_step": 141579, "epoch": 1170} {"train_loss": -40.753753662109375, "global_step": 141580, "epoch": 1170} {"train_loss": -40.31394958496094, "global_step": 141581, "epoch": 1170} {"train_loss": -40.68564987182617, "global_step": 141582, "epoch": 1170} {"train_loss": -41.17585372924805, "global_step": 141583, "epoch": 1170} {"train_loss": -40.38827133178711, "global_step": 141584, "epoch": 1170} {"train_loss": -40.432987213134766, "global_step": 141585, "epoch": 1170} {"train_loss": -39.698299407958984, "global_step": 141586, "epoch": 1170} {"train_loss": -40.720863342285156, "global_step": 141587, "epoch": 1170} {"train_loss": -40.11265563964844, "global_step": 141588, "epoch": 1170} {"train_loss": -39.831573486328125, "global_step": 141589, "epoch": 1170} {"train_loss": -39.480648040771484, "global_step": 141590, "epoch": 1170} {"train_loss": -37.96448516845703, "global_step": 141591, "epoch": 1170} {"train_loss": -38.688594818115234, "global_step": 141592, "epoch": 1170} {"train_loss": -39.30645751953125, "global_step": 141593, "epoch": 1170} {"train_loss": -39.126060485839844, "global_step": 141594, "epoch": 1170} {"train_loss": -39.33583450317383, "global_step": 141595, "epoch": 1170} {"train_loss": -39.92950439453125, "global_step": 141596, "epoch": 1170} {"train_loss": -39.98811721801758, "global_step": 141597, "epoch": 1170} {"train_loss": -39.95964813232422, "global_step": 141598, "epoch": 1170} {"train_loss": -40.15814971923828, "global_step": 141599, "epoch": 1170} {"train_loss": -39.64995193481445, "global_step": 141600, "epoch": 1170} {"train_loss": -39.538909912109375, "global_step": 141601, "epoch": 1170} {"train_loss": -38.765869140625, "global_step": 141602, "epoch": 1170} {"train_loss": -40.41904830932617, "global_step": 141603, "epoch": 1170} {"train_loss": -39.903804779052734, "global_step": 141604, "epoch": 1170} {"train_loss": -38.50104904174805, "global_step": 141605, "epoch": 1170} {"train_loss": -38.94941329956055, "global_step": 141606, "epoch": 1170} {"train_loss": -38.80106735229492, "global_step": 141607, "epoch": 1170} {"train_loss": -36.46510696411133, "global_step": 141608, "epoch": 1170} {"train_loss": -39.03899383544922, "global_step": 141609, "epoch": 1170} {"train_loss": -38.50666046142578, "global_step": 141610, "epoch": 1170} {"train_loss": -38.245277404785156, "global_step": 141611, "epoch": 1170} {"train_loss": -38.6409912109375, "global_step": 141612, "epoch": 1170} {"train_loss": -39.200775146484375, "global_step": 141613, "epoch": 1170} {"train_loss": -38.89779281616211, "global_step": 141614, "epoch": 1170} {"train_loss": -40.7850227355957, "global_step": 141615, "epoch": 1170} {"train_loss": -38.0106201171875, "global_step": 141616, "epoch": 1170} {"train_loss": -40.07133483886719, "global_step": 141617, "epoch": 1170} {"train_loss": -39.68575668334961, "global_step": 141618, "epoch": 1170} {"train_loss": -40.540771484375, "global_step": 141619, "epoch": 1170} {"train_loss": -39.70131301879883, "global_step": 141620, "epoch": 1170} {"train_loss": -39.843719482421875, "global_step": 141621, "epoch": 1170} {"train_loss": -39.799190521240234, "global_step": 141622, "epoch": 1170} {"train_loss": -40.22489547729492, "global_step": 141623, "epoch": 1170} {"train_loss": -39.44221115112305, "global_step": 141624, "epoch": 1170} {"train_loss": -40.61043930053711, "global_step": 141625, "epoch": 1170} {"train_loss": -39.37504196166992, "global_step": 141626, "epoch": 1170} {"train_loss": -39.98080062866211, "global_step": 141627, "epoch": 1170} {"train_loss": -40.28652572631836, "global_step": 141628, "epoch": 1170} {"train_loss": -40.65106964111328, "global_step": 141629, "epoch": 1170} {"train_loss": -40.443817138671875, "global_step": 141630, "epoch": 1170} {"train_loss": -40.59906005859375, "global_step": 141631, "epoch": 1170} {"train_loss": -40.14894104003906, "global_step": 141632, "epoch": 1170} {"train_loss": -40.75533676147461, "global_step": 141633, "epoch": 1170} {"train_loss": -40.79219055175781, "global_step": 141634, "epoch": 1170} {"train_loss": -40.31028366088867, "global_step": 141635, "epoch": 1170} {"train_loss": -40.999603271484375, "global_step": 141636, "epoch": 1170} {"train_loss": -39.766151428222656, "global_step": 141637, "epoch": 1170} {"train_loss": -40.62104797363281, "global_step": 141638, "epoch": 1170} {"train_loss": -40.85933303833008, "global_step": 141639, "epoch": 1170} {"train_loss": -40.483070373535156, "global_step": 141640, "epoch": 1170} {"train_loss": -40.87343215942383, "global_step": 141641, "epoch": 1170} {"train_loss": -40.572418212890625, "global_step": 141642, "epoch": 1170} {"train_loss": -40.91611862182617, "global_step": 141643, "epoch": 1170} {"train_loss": -40.51350784301758, "global_step": 141644, "epoch": 1170} {"train_loss": -40.105140686035156, "global_step": 141645, "epoch": 1170} {"train_loss": -41.228179931640625, "global_step": 141646, "epoch": 1170} {"train_loss": -39.985958099365234, "global_step": 141647, "epoch": 1170} {"train_loss": -41.07957077026367, "global_step": 141648, "epoch": 1170} {"train_loss": -40.93330001831055, "global_step": 141649, "epoch": 1170} {"train_loss": -40.270668029785156, "global_step": 141650, "epoch": 1170} {"train_loss": -41.4548454284668, "global_step": 141651, "epoch": 1170} {"train_loss": -40.25877380371094, "global_step": 141652, "epoch": 1170} {"train_loss": -41.23857498168945, "global_step": 141653, "epoch": 1170} {"train_loss": -41.487403869628906, "global_step": 141654, "epoch": 1170} {"train_loss": -41.29105758666992, "global_step": 141655, "epoch": 1170} {"train_loss": -41.38154983520508, "global_step": 141656, "epoch": 1170} {"train_loss": -41.44718551635742, "global_step": 141657, "epoch": 1170} {"train_loss": -41.58485412597656, "global_step": 141658, "epoch": 1170} {"train_loss": -41.643280029296875, "global_step": 141659, "epoch": 1170} {"train_loss": -40.963008880615234, "global_step": 141660, "epoch": 1170} {"train_loss": -41.53219985961914, "global_step": 141661, "epoch": 1170} {"train_loss": -41.0020637512207, "global_step": 141662, "epoch": 1170} {"train_loss": -41.54918670654297, "global_step": 141663, "epoch": 1170} {"train_loss": -41.707923889160156, "global_step": 141664, "epoch": 1170} {"train_loss": -41.22953414916992, "global_step": 141665, "epoch": 1170} {"train_loss": -41.309444427490234, "global_step": 141666, "epoch": 1170} {"train_loss": -41.7130126953125, "global_step": 141667, "epoch": 1170} {"train_loss": -40.89609146118164, "global_step": 141668, "epoch": 1170} {"train_loss": -40.83274459838867, "global_step": 141669, "epoch": 1170} {"train_loss": -40.56471633911133, "global_step": 141670, "epoch": 1170} {"train_loss": -40.65876007080078, "global_step": 141671, "epoch": 1170} {"train_loss": -41.83843994140625, "global_step": 141672, "epoch": 1170} {"train_loss": -40.2024040222168, "global_step": 141673, "epoch": 1170} {"train_loss": -40.41262435913086, "global_step": 141674, "epoch": 1170} {"train_loss": -41.30270004272461, "global_step": 141675, "epoch": 1170} {"train_loss": -40.39060592651367, "global_step": 141676, "epoch": 1170} {"train_loss": -40.81378173828125, "global_step": 141677, "epoch": 1170} {"train_loss": -40.62470626831055, "global_step": 141678, "epoch": 1170} {"train_loss": -40.78528594970703, "global_step": 141679, "epoch": 1170} {"train_loss": -39.97675704956055, "global_step": 141680, "epoch": 1170} {"train_loss": -39.411224365234375, "global_step": 141681, "epoch": 1170} {"train_loss": -39.51959228515625, "global_step": 141682, "epoch": 1170} {"train_loss": -40.147369384765625, "global_step": 141683, "epoch": 1170} {"train_loss": -41.6078987121582, "global_step": 141684, "epoch": 1170} {"train_loss": -41.48430252075195, "global_step": 141685, "epoch": 1170} {"train_loss": -41.7005729675293, "global_step": 141686, "epoch": 1170} {"train_loss": -40.678558349609375, "global_step": 141687, "epoch": 1170} {"train_loss": -39.0855598449707, "global_step": 141688, "epoch": 1170} {"train_loss": -39.99401092529297, "global_step": 141689, "epoch": 1170} {"train_loss": -40.31120060692149, "global_step": 141690, "epoch": 1170, "val_loss": 2691046.25} {"train_loss": -39.22895050048828, "global_step": 141691, "epoch": 1171} {"train_loss": -39.31319808959961, "global_step": 141692, "epoch": 1171} {"train_loss": -40.66560745239258, "global_step": 141693, "epoch": 1171} {"train_loss": -39.931087493896484, "global_step": 141694, "epoch": 1171} {"train_loss": -40.345523834228516, "global_step": 141695, "epoch": 1171} {"train_loss": -41.70027542114258, "global_step": 141696, "epoch": 1171} {"train_loss": -40.04669189453125, "global_step": 141697, "epoch": 1171} {"train_loss": -38.97678756713867, "global_step": 141698, "epoch": 1171} {"train_loss": -40.70712661743164, "global_step": 141699, "epoch": 1171} {"train_loss": -40.1746940612793, "global_step": 141700, "epoch": 1171} {"train_loss": -38.501434326171875, "global_step": 141701, "epoch": 1171} {"train_loss": -39.396663665771484, "global_step": 141702, "epoch": 1171} {"train_loss": -40.659423828125, "global_step": 141703, "epoch": 1171} {"train_loss": -39.180625915527344, "global_step": 141704, "epoch": 1171} {"train_loss": -38.43999481201172, "global_step": 141705, "epoch": 1171} {"train_loss": -40.81220626831055, "global_step": 141706, "epoch": 1171} {"train_loss": -40.63947677612305, "global_step": 141707, "epoch": 1171} {"train_loss": -39.0721321105957, "global_step": 141708, "epoch": 1171} {"train_loss": -38.195865631103516, "global_step": 141709, "epoch": 1171} {"train_loss": -38.66268539428711, "global_step": 141710, "epoch": 1171} {"train_loss": -41.19564437866211, "global_step": 141711, "epoch": 1171} {"train_loss": -39.52155303955078, "global_step": 141712, "epoch": 1171} {"train_loss": -38.39297103881836, "global_step": 141713, "epoch": 1171} {"train_loss": -41.072364807128906, "global_step": 141714, "epoch": 1171} {"train_loss": -38.7789306640625, "global_step": 141715, "epoch": 1171} {"train_loss": -39.482704162597656, "global_step": 141716, "epoch": 1171} {"train_loss": -39.74074935913086, "global_step": 141717, "epoch": 1171} {"train_loss": -40.95998764038086, "global_step": 141718, "epoch": 1171} {"train_loss": -39.527523040771484, "global_step": 141719, "epoch": 1171} {"train_loss": -39.566246032714844, "global_step": 141720, "epoch": 1171} {"train_loss": -40.76693344116211, "global_step": 141721, "epoch": 1171} {"train_loss": -39.642086029052734, "global_step": 141722, "epoch": 1171} {"train_loss": -38.67036819458008, "global_step": 141723, "epoch": 1171} {"train_loss": -40.53656768798828, "global_step": 141724, "epoch": 1171} {"train_loss": -39.73379135131836, "global_step": 141725, "epoch": 1171} {"train_loss": -38.109283447265625, "global_step": 141726, "epoch": 1171} {"train_loss": -40.343788146972656, "global_step": 141727, "epoch": 1171} {"train_loss": -38.1006965637207, "global_step": 141728, "epoch": 1171} {"train_loss": -39.86644744873047, "global_step": 141729, "epoch": 1171} {"train_loss": -40.85578155517578, "global_step": 141730, "epoch": 1171} {"train_loss": -39.901119232177734, "global_step": 141731, "epoch": 1171} {"train_loss": -40.686031341552734, "global_step": 141732, "epoch": 1171} {"train_loss": -40.202632904052734, "global_step": 141733, "epoch": 1171} {"train_loss": -40.322364807128906, "global_step": 141734, "epoch": 1171} {"train_loss": -40.525272369384766, "global_step": 141735, "epoch": 1171} {"train_loss": -40.4593620300293, "global_step": 141736, "epoch": 1171} {"train_loss": -40.574066162109375, "global_step": 141737, "epoch": 1171} {"train_loss": -40.09761428833008, "global_step": 141738, "epoch": 1171} {"train_loss": -40.45564651489258, "global_step": 141739, "epoch": 1171} {"train_loss": -40.324256896972656, "global_step": 141740, "epoch": 1171} {"train_loss": -39.28601837158203, "global_step": 141741, "epoch": 1171} {"train_loss": -40.0549201965332, "global_step": 141742, "epoch": 1171} {"train_loss": -39.911014556884766, "global_step": 141743, "epoch": 1171} {"train_loss": -39.71419906616211, "global_step": 141744, "epoch": 1171} {"train_loss": -40.63587188720703, "global_step": 141745, "epoch": 1171} {"train_loss": -39.46529769897461, "global_step": 141746, "epoch": 1171} {"train_loss": -40.542964935302734, "global_step": 141747, "epoch": 1171} {"train_loss": -40.252655029296875, "global_step": 141748, "epoch": 1171} {"train_loss": -39.867733001708984, "global_step": 141749, "epoch": 1171} {"train_loss": -39.91312789916992, "global_step": 141750, "epoch": 1171} {"train_loss": -39.148406982421875, "global_step": 141751, "epoch": 1171} {"train_loss": -40.7573356628418, "global_step": 141752, "epoch": 1171} {"train_loss": -39.746734619140625, "global_step": 141753, "epoch": 1171} {"train_loss": -39.97079086303711, "global_step": 141754, "epoch": 1171} {"train_loss": -40.108699798583984, "global_step": 141755, "epoch": 1171} {"train_loss": -40.61874008178711, "global_step": 141756, "epoch": 1171} {"train_loss": -40.143672943115234, "global_step": 141757, "epoch": 1171} {"train_loss": -40.564247131347656, "global_step": 141758, "epoch": 1171} {"train_loss": -40.52301788330078, "global_step": 141759, "epoch": 1171} {"train_loss": -40.106910705566406, "global_step": 141760, "epoch": 1171} {"train_loss": -40.76461410522461, "global_step": 141761, "epoch": 1171} {"train_loss": -40.831905364990234, "global_step": 141762, "epoch": 1171} {"train_loss": -40.3182258605957, "global_step": 141763, "epoch": 1171} {"train_loss": -41.01967239379883, "global_step": 141764, "epoch": 1171} {"train_loss": -41.11472702026367, "global_step": 141765, "epoch": 1171} {"train_loss": -40.099220275878906, "global_step": 141766, "epoch": 1171} {"train_loss": -41.06526565551758, "global_step": 141767, "epoch": 1171} {"train_loss": -40.911251068115234, "global_step": 141768, "epoch": 1171} {"train_loss": -40.19376754760742, "global_step": 141769, "epoch": 1171} {"train_loss": -40.92457962036133, "global_step": 141770, "epoch": 1171} {"train_loss": -40.78304672241211, "global_step": 141771, "epoch": 1171} {"train_loss": -40.68595886230469, "global_step": 141772, "epoch": 1171} {"train_loss": -40.872413635253906, "global_step": 141773, "epoch": 1171} {"train_loss": -40.77082443237305, "global_step": 141774, "epoch": 1171} {"train_loss": -40.735355377197266, "global_step": 141775, "epoch": 1171} {"train_loss": -41.03498077392578, "global_step": 141776, "epoch": 1171} {"train_loss": -40.28201675415039, "global_step": 141777, "epoch": 1171} {"train_loss": -40.712947845458984, "global_step": 141778, "epoch": 1171} {"train_loss": -41.30695724487305, "global_step": 141779, "epoch": 1171} {"train_loss": -41.38711166381836, "global_step": 141780, "epoch": 1171} {"train_loss": -40.76808547973633, "global_step": 141781, "epoch": 1171} {"train_loss": -40.714759826660156, "global_step": 141782, "epoch": 1171} {"train_loss": -41.4942741394043, "global_step": 141783, "epoch": 1171} {"train_loss": -40.46833419799805, "global_step": 141784, "epoch": 1171} {"train_loss": -40.42949295043945, "global_step": 141785, "epoch": 1171} {"train_loss": -41.71575927734375, "global_step": 141786, "epoch": 1171} {"train_loss": -41.02241897583008, "global_step": 141787, "epoch": 1171} {"train_loss": -40.94118118286133, "global_step": 141788, "epoch": 1171} {"train_loss": -40.54786682128906, "global_step": 141789, "epoch": 1171} {"train_loss": -41.24299240112305, "global_step": 141790, "epoch": 1171} {"train_loss": -40.88527297973633, "global_step": 141791, "epoch": 1171} {"train_loss": -40.713409423828125, "global_step": 141792, "epoch": 1171} {"train_loss": -41.3689079284668, "global_step": 141793, "epoch": 1171} {"train_loss": -41.254459381103516, "global_step": 141794, "epoch": 1171} {"train_loss": -40.88362503051758, "global_step": 141795, "epoch": 1171} {"train_loss": -41.25189971923828, "global_step": 141796, "epoch": 1171} {"train_loss": -41.617889404296875, "global_step": 141797, "epoch": 1171} {"train_loss": -40.19198226928711, "global_step": 141798, "epoch": 1171} {"train_loss": -39.88007354736328, "global_step": 141799, "epoch": 1171} {"train_loss": -41.09014892578125, "global_step": 141800, "epoch": 1171} {"train_loss": -41.76020431518555, "global_step": 141801, "epoch": 1171} {"train_loss": -40.63427734375, "global_step": 141802, "epoch": 1171} {"train_loss": -39.59028244018555, "global_step": 141803, "epoch": 1171} {"train_loss": -41.375911712646484, "global_step": 141804, "epoch": 1171} {"train_loss": -40.532447814941406, "global_step": 141805, "epoch": 1171} {"train_loss": -40.2302360534668, "global_step": 141806, "epoch": 1171} {"train_loss": -39.94636535644531, "global_step": 141807, "epoch": 1171} {"train_loss": -41.0472412109375, "global_step": 141808, "epoch": 1171} {"train_loss": -40.967124938964844, "global_step": 141809, "epoch": 1171} {"train_loss": -40.27666091918945, "global_step": 141810, "epoch": 1171} {"train_loss": -40.297725362226, "global_step": 141811, "epoch": 1171, "val_loss": 2764673.75} {"train_loss": -41.51202392578125, "global_step": 141812, "epoch": 1172} {"train_loss": -41.0296745300293, "global_step": 141813, "epoch": 1172} {"train_loss": -40.912841796875, "global_step": 141814, "epoch": 1172} {"train_loss": -40.83152389526367, "global_step": 141815, "epoch": 1172} {"train_loss": -40.9325065612793, "global_step": 141816, "epoch": 1172} {"train_loss": -40.52320098876953, "global_step": 141817, "epoch": 1172} {"train_loss": -41.36740493774414, "global_step": 141818, "epoch": 1172} {"train_loss": -41.22049331665039, "global_step": 141819, "epoch": 1172} {"train_loss": -40.0867805480957, "global_step": 141820, "epoch": 1172} {"train_loss": -39.94644546508789, "global_step": 141821, "epoch": 1172} {"train_loss": -39.180294036865234, "global_step": 141822, "epoch": 1172} {"train_loss": -40.15241622924805, "global_step": 141823, "epoch": 1172} {"train_loss": -39.18939971923828, "global_step": 141824, "epoch": 1172} {"train_loss": -40.51057052612305, "global_step": 141825, "epoch": 1172} {"train_loss": -40.02491760253906, "global_step": 141826, "epoch": 1172} {"train_loss": -40.64910125732422, "global_step": 141827, "epoch": 1172} {"train_loss": -41.40900802612305, "global_step": 141828, "epoch": 1172} {"train_loss": -39.059226989746094, "global_step": 141829, "epoch": 1172} {"train_loss": -39.6871223449707, "global_step": 141830, "epoch": 1172} {"train_loss": -40.333885192871094, "global_step": 141831, "epoch": 1172} {"train_loss": -39.78517532348633, "global_step": 141832, "epoch": 1172} {"train_loss": -40.1115608215332, "global_step": 141833, "epoch": 1172} {"train_loss": -40.86284637451172, "global_step": 141834, "epoch": 1172} {"train_loss": -40.01685333251953, "global_step": 141835, "epoch": 1172} {"train_loss": -40.04705047607422, "global_step": 141836, "epoch": 1172} {"train_loss": -41.24784469604492, "global_step": 141837, "epoch": 1172} {"train_loss": -40.05870819091797, "global_step": 141838, "epoch": 1172} {"train_loss": -39.7562141418457, "global_step": 141839, "epoch": 1172} {"train_loss": -38.15232849121094, "global_step": 141840, "epoch": 1172} {"train_loss": -40.79350280761719, "global_step": 141841, "epoch": 1172} {"train_loss": -39.78068161010742, "global_step": 141842, "epoch": 1172} {"train_loss": -37.784523010253906, "global_step": 141843, "epoch": 1172} {"train_loss": -40.257972717285156, "global_step": 141844, "epoch": 1172} {"train_loss": -40.11713790893555, "global_step": 141845, "epoch": 1172} {"train_loss": -39.36335372924805, "global_step": 141846, "epoch": 1172} {"train_loss": -40.758522033691406, "global_step": 141847, "epoch": 1172} {"train_loss": -39.67138671875, "global_step": 141848, "epoch": 1172} {"train_loss": -38.78681564331055, "global_step": 141849, "epoch": 1172} {"train_loss": -41.40487289428711, "global_step": 141850, "epoch": 1172} {"train_loss": -39.821044921875, "global_step": 141851, "epoch": 1172} {"train_loss": -40.178585052490234, "global_step": 141852, "epoch": 1172} {"train_loss": -40.497352600097656, "global_step": 141853, "epoch": 1172} {"train_loss": -40.48646545410156, "global_step": 141854, "epoch": 1172} {"train_loss": -39.743247985839844, "global_step": 141855, "epoch": 1172} {"train_loss": -41.424598693847656, "global_step": 141856, "epoch": 1172} {"train_loss": -40.19413375854492, "global_step": 141857, "epoch": 1172} {"train_loss": -40.89927291870117, "global_step": 141858, "epoch": 1172} {"train_loss": -40.635337829589844, "global_step": 141859, "epoch": 1172} {"train_loss": -40.58316421508789, "global_step": 141860, "epoch": 1172} {"train_loss": -41.34280014038086, "global_step": 141861, "epoch": 1172} {"train_loss": -40.204498291015625, "global_step": 141862, "epoch": 1172} {"train_loss": -40.7077751159668, "global_step": 141863, "epoch": 1172} {"train_loss": -41.165645599365234, "global_step": 141864, "epoch": 1172} {"train_loss": -40.23360824584961, "global_step": 141865, "epoch": 1172} {"train_loss": -41.30841064453125, "global_step": 141866, "epoch": 1172} {"train_loss": -40.10334777832031, "global_step": 141867, "epoch": 1172} {"train_loss": -40.83018112182617, "global_step": 141868, "epoch": 1172} {"train_loss": -40.62500762939453, "global_step": 141869, "epoch": 1172} {"train_loss": -41.35548400878906, "global_step": 141870, "epoch": 1172} {"train_loss": -40.753047943115234, "global_step": 141871, "epoch": 1172} {"train_loss": -40.09071350097656, "global_step": 141872, "epoch": 1172} {"train_loss": -40.167388916015625, "global_step": 141873, "epoch": 1172} {"train_loss": -41.048702239990234, "global_step": 141874, "epoch": 1172} {"train_loss": -41.64297866821289, "global_step": 141875, "epoch": 1172} {"train_loss": -40.391292572021484, "global_step": 141876, "epoch": 1172} {"train_loss": -40.49017333984375, "global_step": 141877, "epoch": 1172} {"train_loss": -40.262359619140625, "global_step": 141878, "epoch": 1172} {"train_loss": -41.051639556884766, "global_step": 141879, "epoch": 1172} {"train_loss": -40.789344787597656, "global_step": 141880, "epoch": 1172} {"train_loss": -41.33726119995117, "global_step": 141881, "epoch": 1172} {"train_loss": -41.509124755859375, "global_step": 141882, "epoch": 1172} {"train_loss": -41.845218658447266, "global_step": 141883, "epoch": 1172} {"train_loss": -41.831329345703125, "global_step": 141884, "epoch": 1172} {"train_loss": -42.01743698120117, "global_step": 141885, "epoch": 1172} {"train_loss": -41.466278076171875, "global_step": 141886, "epoch": 1172} {"train_loss": -41.41765594482422, "global_step": 141887, "epoch": 1172} {"train_loss": -42.03791427612305, "global_step": 141888, "epoch": 1172} {"train_loss": -41.50468063354492, "global_step": 141889, "epoch": 1172} {"train_loss": -41.25168228149414, "global_step": 141890, "epoch": 1172} {"train_loss": -41.50804901123047, "global_step": 141891, "epoch": 1172} {"train_loss": -41.623626708984375, "global_step": 141892, "epoch": 1172} {"train_loss": -41.113014221191406, "global_step": 141893, "epoch": 1172} {"train_loss": -40.67141342163086, "global_step": 141894, "epoch": 1172} {"train_loss": -40.53557205200195, "global_step": 141895, "epoch": 1172} {"train_loss": -40.124610900878906, "global_step": 141896, "epoch": 1172} {"train_loss": -39.646156311035156, "global_step": 141897, "epoch": 1172} {"train_loss": -37.686058044433594, "global_step": 141898, "epoch": 1172} {"train_loss": -41.39466094970703, "global_step": 141899, "epoch": 1172} {"train_loss": -39.780208587646484, "global_step": 141900, "epoch": 1172} {"train_loss": -38.522003173828125, "global_step": 141901, "epoch": 1172} {"train_loss": -40.670204162597656, "global_step": 141902, "epoch": 1172} {"train_loss": -40.58927917480469, "global_step": 141903, "epoch": 1172} {"train_loss": -39.44293975830078, "global_step": 141904, "epoch": 1172} {"train_loss": -40.587860107421875, "global_step": 141905, "epoch": 1172} {"train_loss": -39.34387969970703, "global_step": 141906, "epoch": 1172} {"train_loss": -38.67815017700195, "global_step": 141907, "epoch": 1172} {"train_loss": -40.017635345458984, "global_step": 141908, "epoch": 1172} {"train_loss": -40.752132415771484, "global_step": 141909, "epoch": 1172} {"train_loss": -39.79793167114258, "global_step": 141910, "epoch": 1172} {"train_loss": -39.8883171081543, "global_step": 141911, "epoch": 1172} {"train_loss": -41.08661651611328, "global_step": 141912, "epoch": 1172} {"train_loss": -40.89235305786133, "global_step": 141913, "epoch": 1172} {"train_loss": -40.323699951171875, "global_step": 141914, "epoch": 1172} {"train_loss": -41.202972412109375, "global_step": 141915, "epoch": 1172} {"train_loss": -39.91828536987305, "global_step": 141916, "epoch": 1172} {"train_loss": -40.09231185913086, "global_step": 141917, "epoch": 1172} {"train_loss": -41.08156967163086, "global_step": 141918, "epoch": 1172} {"train_loss": -40.957157135009766, "global_step": 141919, "epoch": 1172} {"train_loss": -41.80084991455078, "global_step": 141920, "epoch": 1172} {"train_loss": -41.21591567993164, "global_step": 141921, "epoch": 1172} {"train_loss": -41.0130500793457, "global_step": 141922, "epoch": 1172} {"train_loss": -40.56659698486328, "global_step": 141923, "epoch": 1172} {"train_loss": -40.3923454284668, "global_step": 141924, "epoch": 1172} {"train_loss": -37.298282623291016, "global_step": 141925, "epoch": 1172} {"train_loss": -39.131996154785156, "global_step": 141926, "epoch": 1172} {"train_loss": -39.532875061035156, "global_step": 141927, "epoch": 1172} {"train_loss": -39.487789154052734, "global_step": 141928, "epoch": 1172} {"train_loss": -40.50413513183594, "global_step": 141929, "epoch": 1172} {"train_loss": -40.45602035522461, "global_step": 141930, "epoch": 1172} {"train_loss": -40.63767623901367, "global_step": 141931, "epoch": 1172} {"train_loss": -40.42951281208637, "global_step": 141932, "epoch": 1172, "val_loss": 2704256.75} {"train_loss": -40.88467788696289, "global_step": 141933, "epoch": 1173} {"train_loss": -40.00251388549805, "global_step": 141934, "epoch": 1173} {"train_loss": -39.223793029785156, "global_step": 141935, "epoch": 1173} {"train_loss": -40.00936508178711, "global_step": 141936, "epoch": 1173} {"train_loss": -40.23685836791992, "global_step": 141937, "epoch": 1173} {"train_loss": -37.53522491455078, "global_step": 141938, "epoch": 1173} {"train_loss": -38.49332809448242, "global_step": 141939, "epoch": 1173} {"train_loss": -38.468292236328125, "global_step": 141940, "epoch": 1173} {"train_loss": -38.98258590698242, "global_step": 141941, "epoch": 1173} {"train_loss": -38.15279769897461, "global_step": 141942, "epoch": 1173} {"train_loss": -40.18585205078125, "global_step": 141943, "epoch": 1173} {"train_loss": -38.375343322753906, "global_step": 141944, "epoch": 1173} {"train_loss": -37.68142318725586, "global_step": 141945, "epoch": 1173} {"train_loss": -39.6306266784668, "global_step": 141946, "epoch": 1173} {"train_loss": -38.85770797729492, "global_step": 141947, "epoch": 1173} {"train_loss": -38.4399528503418, "global_step": 141948, "epoch": 1173} {"train_loss": -39.362335205078125, "global_step": 141949, "epoch": 1173} {"train_loss": -38.87984848022461, "global_step": 141950, "epoch": 1173} {"train_loss": -39.08174514770508, "global_step": 141951, "epoch": 1173} {"train_loss": -40.075286865234375, "global_step": 141952, "epoch": 1173} {"train_loss": -39.72309112548828, "global_step": 141953, "epoch": 1173} {"train_loss": -40.07636260986328, "global_step": 141954, "epoch": 1173} {"train_loss": -40.07236862182617, "global_step": 141955, "epoch": 1173} {"train_loss": -39.5598258972168, "global_step": 141956, "epoch": 1173} {"train_loss": -40.440731048583984, "global_step": 141957, "epoch": 1173} {"train_loss": -40.14644241333008, "global_step": 141958, "epoch": 1173} {"train_loss": -39.893306732177734, "global_step": 141959, "epoch": 1173} {"train_loss": -40.707611083984375, "global_step": 141960, "epoch": 1173} {"train_loss": -40.55780792236328, "global_step": 141961, "epoch": 1173} {"train_loss": -40.14493942260742, "global_step": 141962, "epoch": 1173} {"train_loss": -41.093231201171875, "global_step": 141963, "epoch": 1173} {"train_loss": -41.0157470703125, "global_step": 141964, "epoch": 1173} {"train_loss": -41.36000442504883, "global_step": 141965, "epoch": 1173} {"train_loss": -41.024105072021484, "global_step": 141966, "epoch": 1173} {"train_loss": -40.95044708251953, "global_step": 141967, "epoch": 1173} {"train_loss": -40.74951934814453, "global_step": 141968, "epoch": 1173} {"train_loss": -41.09629440307617, "global_step": 141969, "epoch": 1173} {"train_loss": -40.66130828857422, "global_step": 141970, "epoch": 1173} {"train_loss": -40.928924560546875, "global_step": 141971, "epoch": 1173} {"train_loss": -40.910980224609375, "global_step": 141972, "epoch": 1173} {"train_loss": -41.11498260498047, "global_step": 141973, "epoch": 1173} {"train_loss": -41.04225158691406, "global_step": 141974, "epoch": 1173} {"train_loss": -41.3433952331543, "global_step": 141975, "epoch": 1173} {"train_loss": -41.2323112487793, "global_step": 141976, "epoch": 1173} {"train_loss": -41.38283920288086, "global_step": 141977, "epoch": 1173} {"train_loss": -41.09698486328125, "global_step": 141978, "epoch": 1173} {"train_loss": -41.43973922729492, "global_step": 141979, "epoch": 1173} {"train_loss": -41.28853988647461, "global_step": 141980, "epoch": 1173} {"train_loss": -41.376373291015625, "global_step": 141981, "epoch": 1173} {"train_loss": -41.03947448730469, "global_step": 141982, "epoch": 1173} {"train_loss": -41.494972229003906, "global_step": 141983, "epoch": 1173} {"train_loss": -41.849056243896484, "global_step": 141984, "epoch": 1173} {"train_loss": -41.37824630737305, "global_step": 141985, "epoch": 1173} {"train_loss": -41.429534912109375, "global_step": 141986, "epoch": 1173} {"train_loss": -42.0022087097168, "global_step": 141987, "epoch": 1173} {"train_loss": -41.03544235229492, "global_step": 141988, "epoch": 1173} {"train_loss": -41.79743576049805, "global_step": 141989, "epoch": 1173} {"train_loss": -41.2404899597168, "global_step": 141990, "epoch": 1173} {"train_loss": -41.91064453125, "global_step": 141991, "epoch": 1173} {"train_loss": -41.47903823852539, "global_step": 141992, "epoch": 1173} {"train_loss": -41.140708923339844, "global_step": 141993, "epoch": 1173} {"train_loss": -40.54542541503906, "global_step": 141994, "epoch": 1173} {"train_loss": -41.63121795654297, "global_step": 141995, "epoch": 1173} {"train_loss": -41.6334342956543, "global_step": 141996, "epoch": 1173} {"train_loss": -41.2689094543457, "global_step": 141997, "epoch": 1173} {"train_loss": -41.22225570678711, "global_step": 141998, "epoch": 1173} {"train_loss": -40.85588455200195, "global_step": 141999, "epoch": 1173} {"train_loss": -40.28712844848633, "global_step": 142000, "epoch": 1173} {"train_loss": -40.85842514038086, "global_step": 142001, "epoch": 1173} {"train_loss": -41.33388900756836, "global_step": 142002, "epoch": 1173} {"train_loss": -41.063594818115234, "global_step": 142003, "epoch": 1173} {"train_loss": -38.75785827636719, "global_step": 142004, "epoch": 1173} {"train_loss": -39.463287353515625, "global_step": 142005, "epoch": 1173} {"train_loss": -39.341163635253906, "global_step": 142006, "epoch": 1173} {"train_loss": -39.96411895751953, "global_step": 142007, "epoch": 1173} {"train_loss": -38.022552490234375, "global_step": 142008, "epoch": 1173} {"train_loss": -38.45957565307617, "global_step": 142009, "epoch": 1173} {"train_loss": -40.5816535949707, "global_step": 142010, "epoch": 1173} {"train_loss": -40.25834274291992, "global_step": 142011, "epoch": 1173} {"train_loss": -40.9304313659668, "global_step": 142012, "epoch": 1173} {"train_loss": -39.8247184753418, "global_step": 142013, "epoch": 1173} {"train_loss": -40.37917709350586, "global_step": 142014, "epoch": 1173} {"train_loss": -39.43212127685547, "global_step": 142015, "epoch": 1173} {"train_loss": -41.45689010620117, "global_step": 142016, "epoch": 1173} {"train_loss": -39.61935043334961, "global_step": 142017, "epoch": 1173} {"train_loss": -39.60992431640625, "global_step": 142018, "epoch": 1173} {"train_loss": -39.3300895690918, "global_step": 142019, "epoch": 1173} {"train_loss": -38.51585006713867, "global_step": 142020, "epoch": 1173} {"train_loss": -37.862857818603516, "global_step": 142021, "epoch": 1173} {"train_loss": -38.6492805480957, "global_step": 142022, "epoch": 1173} {"train_loss": -39.57661437988281, "global_step": 142023, "epoch": 1173} {"train_loss": -37.6193962097168, "global_step": 142024, "epoch": 1173} {"train_loss": -38.20363998413086, "global_step": 142025, "epoch": 1173} {"train_loss": -37.42790603637695, "global_step": 142026, "epoch": 1173} {"train_loss": -39.55104446411133, "global_step": 142027, "epoch": 1173} {"train_loss": -37.963863372802734, "global_step": 142028, "epoch": 1173} {"train_loss": -37.71192169189453, "global_step": 142029, "epoch": 1173} {"train_loss": -40.2940673828125, "global_step": 142030, "epoch": 1173} {"train_loss": -37.49851989746094, "global_step": 142031, "epoch": 1173} {"train_loss": -39.6285285949707, "global_step": 142032, "epoch": 1173} {"train_loss": -39.14059066772461, "global_step": 142033, "epoch": 1173} {"train_loss": -39.11686325073242, "global_step": 142034, "epoch": 1173} {"train_loss": -40.56163024902344, "global_step": 142035, "epoch": 1173} {"train_loss": -40.168758392333984, "global_step": 142036, "epoch": 1173} {"train_loss": -38.977596282958984, "global_step": 142037, "epoch": 1173} {"train_loss": -40.73735427856445, "global_step": 142038, "epoch": 1173} {"train_loss": -39.82884979248047, "global_step": 142039, "epoch": 1173} {"train_loss": -40.657997131347656, "global_step": 142040, "epoch": 1173} {"train_loss": -40.074642181396484, "global_step": 142041, "epoch": 1173} {"train_loss": -39.41347885131836, "global_step": 142042, "epoch": 1173} {"train_loss": -40.07650375366211, "global_step": 142043, "epoch": 1173} {"train_loss": -38.926971435546875, "global_step": 142044, "epoch": 1173} {"train_loss": -37.60773849487305, "global_step": 142045, "epoch": 1173} {"train_loss": -39.5333137512207, "global_step": 142046, "epoch": 1173} {"train_loss": -39.25288009643555, "global_step": 142047, "epoch": 1173} {"train_loss": -38.48832321166992, "global_step": 142048, "epoch": 1173} {"train_loss": -39.923152923583984, "global_step": 142049, "epoch": 1173} {"train_loss": -39.90790939331055, "global_step": 142050, "epoch": 1173} {"train_loss": -39.85427474975586, "global_step": 142051, "epoch": 1173} {"train_loss": -39.14751052856445, "global_step": 142052, "epoch": 1173} {"train_loss": -40.011883223352356, "global_step": 142053, "epoch": 1173, "val_loss": 2711158.25} {"train_loss": -39.6042594909668, "global_step": 142054, "epoch": 1174} {"train_loss": -40.07345962524414, "global_step": 142055, "epoch": 1174} {"train_loss": -39.68160629272461, "global_step": 142056, "epoch": 1174} {"train_loss": -40.58498001098633, "global_step": 142057, "epoch": 1174} {"train_loss": -40.67637252807617, "global_step": 142058, "epoch": 1174} {"train_loss": -40.57131576538086, "global_step": 142059, "epoch": 1174} {"train_loss": -40.707088470458984, "global_step": 142060, "epoch": 1174} {"train_loss": -40.388729095458984, "global_step": 142061, "epoch": 1174} {"train_loss": -40.60215759277344, "global_step": 142062, "epoch": 1174} {"train_loss": -40.81985855102539, "global_step": 142063, "epoch": 1174} {"train_loss": -41.181968688964844, "global_step": 142064, "epoch": 1174} {"train_loss": -40.74070358276367, "global_step": 142065, "epoch": 1174} {"train_loss": -41.05471420288086, "global_step": 142066, "epoch": 1174} {"train_loss": -40.990604400634766, "global_step": 142067, "epoch": 1174} {"train_loss": -40.360145568847656, "global_step": 142068, "epoch": 1174} {"train_loss": -41.288875579833984, "global_step": 142069, "epoch": 1174} {"train_loss": -40.769508361816406, "global_step": 142070, "epoch": 1174} {"train_loss": -40.18140411376953, "global_step": 142071, "epoch": 1174} {"train_loss": -40.76811981201172, "global_step": 142072, "epoch": 1174} {"train_loss": -40.86786651611328, "global_step": 142073, "epoch": 1174} {"train_loss": -40.6288948059082, "global_step": 142074, "epoch": 1174} {"train_loss": -40.5634880065918, "global_step": 142075, "epoch": 1174} {"train_loss": -41.259559631347656, "global_step": 142076, "epoch": 1174} {"train_loss": -40.26350784301758, "global_step": 142077, "epoch": 1174} {"train_loss": -41.276954650878906, "global_step": 142078, "epoch": 1174} {"train_loss": -40.9712028503418, "global_step": 142079, "epoch": 1174} {"train_loss": -40.40928649902344, "global_step": 142080, "epoch": 1174} {"train_loss": -41.10896301269531, "global_step": 142081, "epoch": 1174} {"train_loss": -41.21437072753906, "global_step": 142082, "epoch": 1174} {"train_loss": -41.437679290771484, "global_step": 142083, "epoch": 1174} {"train_loss": -40.36513137817383, "global_step": 142084, "epoch": 1174} {"train_loss": -40.20397186279297, "global_step": 142085, "epoch": 1174} {"train_loss": -40.66846466064453, "global_step": 142086, "epoch": 1174} {"train_loss": -40.133121490478516, "global_step": 142087, "epoch": 1174} {"train_loss": -41.09706497192383, "global_step": 142088, "epoch": 1174} {"train_loss": -40.34294891357422, "global_step": 142089, "epoch": 1174} {"train_loss": -40.696990966796875, "global_step": 142090, "epoch": 1174} {"train_loss": -40.42372131347656, "global_step": 142091, "epoch": 1174} {"train_loss": -40.20904541015625, "global_step": 142092, "epoch": 1174} {"train_loss": -40.18693923950195, "global_step": 142093, "epoch": 1174} {"train_loss": -40.68817138671875, "global_step": 142094, "epoch": 1174} {"train_loss": -40.99631881713867, "global_step": 142095, "epoch": 1174} {"train_loss": -40.65420913696289, "global_step": 142096, "epoch": 1174} {"train_loss": -41.88491439819336, "global_step": 142097, "epoch": 1174} {"train_loss": -41.32410430908203, "global_step": 142098, "epoch": 1174} {"train_loss": -41.59684371948242, "global_step": 142099, "epoch": 1174} {"train_loss": -41.26728439331055, "global_step": 142100, "epoch": 1174} {"train_loss": -41.436004638671875, "global_step": 142101, "epoch": 1174} {"train_loss": -41.03754425048828, "global_step": 142102, "epoch": 1174} {"train_loss": -40.52926254272461, "global_step": 142103, "epoch": 1174} {"train_loss": -40.807586669921875, "global_step": 142104, "epoch": 1174} {"train_loss": -42.09811782836914, "global_step": 142105, "epoch": 1174} {"train_loss": -41.35003662109375, "global_step": 142106, "epoch": 1174} {"train_loss": -41.4664421081543, "global_step": 142107, "epoch": 1174} {"train_loss": -40.93958282470703, "global_step": 142108, "epoch": 1174} {"train_loss": -41.63352584838867, "global_step": 142109, "epoch": 1174} {"train_loss": -41.3370246887207, "global_step": 142110, "epoch": 1174} {"train_loss": -41.21046829223633, "global_step": 142111, "epoch": 1174} {"train_loss": -40.64954376220703, "global_step": 142112, "epoch": 1174} {"train_loss": -40.80039596557617, "global_step": 142113, "epoch": 1174} {"train_loss": -39.933319091796875, "global_step": 142114, "epoch": 1174} {"train_loss": -38.64445877075195, "global_step": 142115, "epoch": 1174} {"train_loss": -38.12651824951172, "global_step": 142116, "epoch": 1174} {"train_loss": -40.14969253540039, "global_step": 142117, "epoch": 1174} {"train_loss": -41.2797737121582, "global_step": 142118, "epoch": 1174} {"train_loss": -36.53938293457031, "global_step": 142119, "epoch": 1174} {"train_loss": -40.66917037963867, "global_step": 142120, "epoch": 1174} {"train_loss": -40.664974212646484, "global_step": 142121, "epoch": 1174} {"train_loss": -39.72724533081055, "global_step": 142122, "epoch": 1174} {"train_loss": -40.812740325927734, "global_step": 142123, "epoch": 1174} {"train_loss": -40.889034271240234, "global_step": 142124, "epoch": 1174} {"train_loss": -38.96866989135742, "global_step": 142125, "epoch": 1174} {"train_loss": -38.511474609375, "global_step": 142126, "epoch": 1174} {"train_loss": -39.47686767578125, "global_step": 142127, "epoch": 1174} {"train_loss": -39.54786682128906, "global_step": 142128, "epoch": 1174} {"train_loss": -39.34976577758789, "global_step": 142129, "epoch": 1174} {"train_loss": -38.745113372802734, "global_step": 142130, "epoch": 1174} {"train_loss": -37.61122512817383, "global_step": 142131, "epoch": 1174} {"train_loss": -40.83457565307617, "global_step": 142132, "epoch": 1174} {"train_loss": -36.61857223510742, "global_step": 142133, "epoch": 1174} {"train_loss": -38.16278076171875, "global_step": 142134, "epoch": 1174} {"train_loss": -35.814151763916016, "global_step": 142135, "epoch": 1174} {"train_loss": -38.58945846557617, "global_step": 142136, "epoch": 1174} {"train_loss": -35.343345642089844, "global_step": 142137, "epoch": 1174} {"train_loss": -36.158668518066406, "global_step": 142138, "epoch": 1174} {"train_loss": -36.682464599609375, "global_step": 142139, "epoch": 1174} {"train_loss": -34.27170944213867, "global_step": 142140, "epoch": 1174} {"train_loss": -36.177730560302734, "global_step": 142141, "epoch": 1174} {"train_loss": -36.81682205200195, "global_step": 142142, "epoch": 1174} {"train_loss": -36.96117401123047, "global_step": 142143, "epoch": 1174} {"train_loss": -39.51551055908203, "global_step": 142144, "epoch": 1174} {"train_loss": -37.71876525878906, "global_step": 142145, "epoch": 1174} {"train_loss": -38.92721176147461, "global_step": 142146, "epoch": 1174} {"train_loss": -39.78253936767578, "global_step": 142147, "epoch": 1174} {"train_loss": -38.08053207397461, "global_step": 142148, "epoch": 1174} {"train_loss": -39.589599609375, "global_step": 142149, "epoch": 1174} {"train_loss": -39.38042068481445, "global_step": 142150, "epoch": 1174} {"train_loss": -39.896881103515625, "global_step": 142151, "epoch": 1174} {"train_loss": -39.00489044189453, "global_step": 142152, "epoch": 1174} {"train_loss": -40.60136413574219, "global_step": 142153, "epoch": 1174} {"train_loss": -38.898155212402344, "global_step": 142154, "epoch": 1174} {"train_loss": -39.56769943237305, "global_step": 142155, "epoch": 1174} {"train_loss": -40.61140441894531, "global_step": 142156, "epoch": 1174} {"train_loss": -39.84562301635742, "global_step": 142157, "epoch": 1174} {"train_loss": -39.91146469116211, "global_step": 142158, "epoch": 1174} {"train_loss": -39.86392593383789, "global_step": 142159, "epoch": 1174} {"train_loss": -40.510169982910156, "global_step": 142160, "epoch": 1174} {"train_loss": -40.3861198425293, "global_step": 142161, "epoch": 1174} {"train_loss": -40.381019592285156, "global_step": 142162, "epoch": 1174} {"train_loss": -40.26409149169922, "global_step": 142163, "epoch": 1174} {"train_loss": -40.6976203918457, "global_step": 142164, "epoch": 1174} {"train_loss": -40.49142074584961, "global_step": 142165, "epoch": 1174} {"train_loss": -40.878902435302734, "global_step": 142166, "epoch": 1174} {"train_loss": -40.71198654174805, "global_step": 142167, "epoch": 1174} {"train_loss": -40.61346435546875, "global_step": 142168, "epoch": 1174} {"train_loss": -40.49367904663086, "global_step": 142169, "epoch": 1174} {"train_loss": -40.424747467041016, "global_step": 142170, "epoch": 1174} {"train_loss": -40.758697509765625, "global_step": 142171, "epoch": 1174} {"train_loss": -40.20121383666992, "global_step": 142172, "epoch": 1174} {"train_loss": -39.86943054199219, "global_step": 142173, "epoch": 1174} {"train_loss": -39.99859720025181, "global_step": 142174, "epoch": 1174, "val_loss": 2568997.75} {"train_loss": -40.23633575439453, "global_step": 142175, "epoch": 1175} {"train_loss": -40.79578399658203, "global_step": 142176, "epoch": 1175} {"train_loss": -40.815555572509766, "global_step": 142177, "epoch": 1175} {"train_loss": -40.471107482910156, "global_step": 142178, "epoch": 1175} {"train_loss": -40.198516845703125, "global_step": 142179, "epoch": 1175} {"train_loss": -41.14961624145508, "global_step": 142180, "epoch": 1175} {"train_loss": -41.259056091308594, "global_step": 142181, "epoch": 1175} {"train_loss": -40.400421142578125, "global_step": 142182, "epoch": 1175} {"train_loss": -41.14752960205078, "global_step": 142183, "epoch": 1175} {"train_loss": -40.98663330078125, "global_step": 142184, "epoch": 1175} {"train_loss": -40.5529899597168, "global_step": 142185, "epoch": 1175} {"train_loss": -40.45470428466797, "global_step": 142186, "epoch": 1175} {"train_loss": -41.20449447631836, "global_step": 142187, "epoch": 1175} {"train_loss": -41.338783264160156, "global_step": 142188, "epoch": 1175} {"train_loss": -41.47195816040039, "global_step": 142189, "epoch": 1175} {"train_loss": -41.64813232421875, "global_step": 142190, "epoch": 1175} {"train_loss": -41.022396087646484, "global_step": 142191, "epoch": 1175} {"train_loss": -41.06052017211914, "global_step": 142192, "epoch": 1175} {"train_loss": -40.75572204589844, "global_step": 142193, "epoch": 1175} {"train_loss": -40.17832565307617, "global_step": 142194, "epoch": 1175} {"train_loss": -40.6771354675293, "global_step": 142195, "epoch": 1175} {"train_loss": -40.31846237182617, "global_step": 142196, "epoch": 1175} {"train_loss": -41.93470001220703, "global_step": 142197, "epoch": 1175} {"train_loss": -40.58617401123047, "global_step": 142198, "epoch": 1175} {"train_loss": -40.93912887573242, "global_step": 142199, "epoch": 1175} {"train_loss": -41.57065963745117, "global_step": 142200, "epoch": 1175} {"train_loss": -41.456024169921875, "global_step": 142201, "epoch": 1175} {"train_loss": -39.810794830322266, "global_step": 142202, "epoch": 1175} {"train_loss": -40.51388931274414, "global_step": 142203, "epoch": 1175} {"train_loss": -41.472511291503906, "global_step": 142204, "epoch": 1175} {"train_loss": -41.86699295043945, "global_step": 142205, "epoch": 1175} {"train_loss": -41.352745056152344, "global_step": 142206, "epoch": 1175} {"train_loss": -40.92070007324219, "global_step": 142207, "epoch": 1175} {"train_loss": -40.71307373046875, "global_step": 142208, "epoch": 1175} {"train_loss": -39.185787200927734, "global_step": 142209, "epoch": 1175} {"train_loss": -40.75072479248047, "global_step": 142210, "epoch": 1175} {"train_loss": -41.33509063720703, "global_step": 142211, "epoch": 1175} {"train_loss": -40.30766677856445, "global_step": 142212, "epoch": 1175} {"train_loss": -40.74747848510742, "global_step": 142213, "epoch": 1175} {"train_loss": -40.31442642211914, "global_step": 142214, "epoch": 1175} {"train_loss": -39.25376510620117, "global_step": 142215, "epoch": 1175} {"train_loss": -37.300289154052734, "global_step": 142216, "epoch": 1175} {"train_loss": -41.41603088378906, "global_step": 142217, "epoch": 1175} {"train_loss": -38.22349166870117, "global_step": 142218, "epoch": 1175} {"train_loss": -38.80463790893555, "global_step": 142219, "epoch": 1175} {"train_loss": -39.7119140625, "global_step": 142220, "epoch": 1175} {"train_loss": -39.16705322265625, "global_step": 142221, "epoch": 1175} {"train_loss": -39.647335052490234, "global_step": 142222, "epoch": 1175} {"train_loss": -38.2198486328125, "global_step": 142223, "epoch": 1175} {"train_loss": -39.378353118896484, "global_step": 142224, "epoch": 1175} {"train_loss": -39.78339767456055, "global_step": 142225, "epoch": 1175} {"train_loss": -38.67245101928711, "global_step": 142226, "epoch": 1175} {"train_loss": -39.509796142578125, "global_step": 142227, "epoch": 1175} {"train_loss": -38.8397216796875, "global_step": 142228, "epoch": 1175} {"train_loss": -38.93132019042969, "global_step": 142229, "epoch": 1175} {"train_loss": -37.4276008605957, "global_step": 142230, "epoch": 1175} {"train_loss": -40.30177307128906, "global_step": 142231, "epoch": 1175} {"train_loss": -39.06390380859375, "global_step": 142232, "epoch": 1175} {"train_loss": -39.52675247192383, "global_step": 142233, "epoch": 1175} {"train_loss": -40.00518798828125, "global_step": 142234, "epoch": 1175} {"train_loss": -37.61439514160156, "global_step": 142235, "epoch": 1175} {"train_loss": -39.31982421875, "global_step": 142236, "epoch": 1175} {"train_loss": -38.97074508666992, "global_step": 142237, "epoch": 1175} {"train_loss": -39.0047721862793, "global_step": 142238, "epoch": 1175} {"train_loss": -37.85464859008789, "global_step": 142239, "epoch": 1175} {"train_loss": -39.3785514831543, "global_step": 142240, "epoch": 1175} {"train_loss": -40.097591400146484, "global_step": 142241, "epoch": 1175} {"train_loss": -39.929656982421875, "global_step": 142242, "epoch": 1175} {"train_loss": -38.24578857421875, "global_step": 142243, "epoch": 1175} {"train_loss": -38.056907653808594, "global_step": 142244, "epoch": 1175} {"train_loss": -40.074928283691406, "global_step": 142245, "epoch": 1175} {"train_loss": -37.63935852050781, "global_step": 142246, "epoch": 1175} {"train_loss": -37.86435317993164, "global_step": 142247, "epoch": 1175} {"train_loss": -38.756927490234375, "global_step": 142248, "epoch": 1175} {"train_loss": -38.38914108276367, "global_step": 142249, "epoch": 1175} {"train_loss": -39.00436019897461, "global_step": 142250, "epoch": 1175} {"train_loss": -38.354698181152344, "global_step": 142251, "epoch": 1175} {"train_loss": -37.95307922363281, "global_step": 142252, "epoch": 1175} {"train_loss": -39.23838424682617, "global_step": 142253, "epoch": 1175} {"train_loss": -38.04530334472656, "global_step": 142254, "epoch": 1175} {"train_loss": -38.985755920410156, "global_step": 142255, "epoch": 1175} {"train_loss": -39.47128677368164, "global_step": 142256, "epoch": 1175} {"train_loss": -39.7020378112793, "global_step": 142257, "epoch": 1175} {"train_loss": -39.327144622802734, "global_step": 142258, "epoch": 1175} {"train_loss": -39.02142333984375, "global_step": 142259, "epoch": 1175} {"train_loss": -39.26908493041992, "global_step": 142260, "epoch": 1175} {"train_loss": -39.170291900634766, "global_step": 142261, "epoch": 1175} {"train_loss": -39.13359069824219, "global_step": 142262, "epoch": 1175} {"train_loss": -39.35746383666992, "global_step": 142263, "epoch": 1175} {"train_loss": -38.969818115234375, "global_step": 142264, "epoch": 1175} {"train_loss": -38.299964904785156, "global_step": 142265, "epoch": 1175} {"train_loss": -39.610389709472656, "global_step": 142266, "epoch": 1175} {"train_loss": -39.174800872802734, "global_step": 142267, "epoch": 1175} {"train_loss": -38.04293441772461, "global_step": 142268, "epoch": 1175} {"train_loss": -39.9276123046875, "global_step": 142269, "epoch": 1175} {"train_loss": -39.62046432495117, "global_step": 142270, "epoch": 1175} {"train_loss": -39.578182220458984, "global_step": 142271, "epoch": 1175} {"train_loss": -39.86967468261719, "global_step": 142272, "epoch": 1175} {"train_loss": -40.0632209777832, "global_step": 142273, "epoch": 1175} {"train_loss": -39.053653717041016, "global_step": 142274, "epoch": 1175} {"train_loss": -40.19810485839844, "global_step": 142275, "epoch": 1175} {"train_loss": -39.204925537109375, "global_step": 142276, "epoch": 1175} {"train_loss": -39.10989761352539, "global_step": 142277, "epoch": 1175} {"train_loss": -39.87294387817383, "global_step": 142278, "epoch": 1175} {"train_loss": -39.59556198120117, "global_step": 142279, "epoch": 1175} {"train_loss": -40.743343353271484, "global_step": 142280, "epoch": 1175} {"train_loss": -39.999732971191406, "global_step": 142281, "epoch": 1175} {"train_loss": -40.10581588745117, "global_step": 142282, "epoch": 1175} {"train_loss": -40.21407699584961, "global_step": 142283, "epoch": 1175} {"train_loss": -40.814971923828125, "global_step": 142284, "epoch": 1175} {"train_loss": -40.97467041015625, "global_step": 142285, "epoch": 1175} {"train_loss": -40.91791915893555, "global_step": 142286, "epoch": 1175} {"train_loss": -40.857051849365234, "global_step": 142287, "epoch": 1175} {"train_loss": -40.317195892333984, "global_step": 142288, "epoch": 1175} {"train_loss": -41.334014892578125, "global_step": 142289, "epoch": 1175} {"train_loss": -40.66270065307617, "global_step": 142290, "epoch": 1175} {"train_loss": -41.133399963378906, "global_step": 142291, "epoch": 1175} {"train_loss": -40.92152786254883, "global_step": 142292, "epoch": 1175} {"train_loss": -41.36025619506836, "global_step": 142293, "epoch": 1175} {"train_loss": -40.48917007446289, "global_step": 142294, "epoch": 1175} {"train_loss": -39.89145931527634, "global_step": 142295, "epoch": 1175, "val_loss": 2468170.25} {"train_loss": -40.27073287963867, "global_step": 142296, "epoch": 1176} {"train_loss": -41.06376647949219, "global_step": 142297, "epoch": 1176} {"train_loss": -41.54612350463867, "global_step": 142298, "epoch": 1176} {"train_loss": -41.5988883972168, "global_step": 142299, "epoch": 1176} {"train_loss": -41.10322952270508, "global_step": 142300, "epoch": 1176} {"train_loss": -41.53582763671875, "global_step": 142301, "epoch": 1176} {"train_loss": -40.97233200073242, "global_step": 142302, "epoch": 1176} {"train_loss": -40.945430755615234, "global_step": 142303, "epoch": 1176} {"train_loss": -41.45505905151367, "global_step": 142304, "epoch": 1176} {"train_loss": -40.8047981262207, "global_step": 142305, "epoch": 1176} {"train_loss": -41.271480560302734, "global_step": 142306, "epoch": 1176} {"train_loss": -40.98130416870117, "global_step": 142307, "epoch": 1176} {"train_loss": -41.11793899536133, "global_step": 142308, "epoch": 1176} {"train_loss": -41.354740142822266, "global_step": 142309, "epoch": 1176} {"train_loss": -41.15839385986328, "global_step": 142310, "epoch": 1176} {"train_loss": -40.9394416809082, "global_step": 142311, "epoch": 1176} {"train_loss": -41.566532135009766, "global_step": 142312, "epoch": 1176} {"train_loss": -41.100406646728516, "global_step": 142313, "epoch": 1176} {"train_loss": -40.747100830078125, "global_step": 142314, "epoch": 1176} {"train_loss": -40.98053741455078, "global_step": 142315, "epoch": 1176} {"train_loss": -40.22658920288086, "global_step": 142316, "epoch": 1176} {"train_loss": -38.489810943603516, "global_step": 142317, "epoch": 1176} {"train_loss": -39.63050079345703, "global_step": 142318, "epoch": 1176} {"train_loss": -39.996639251708984, "global_step": 142319, "epoch": 1176} {"train_loss": -40.84189987182617, "global_step": 142320, "epoch": 1176} {"train_loss": -40.673736572265625, "global_step": 142321, "epoch": 1176} {"train_loss": -41.04581832885742, "global_step": 142322, "epoch": 1176} {"train_loss": -41.01569747924805, "global_step": 142323, "epoch": 1176} {"train_loss": -39.9901008605957, "global_step": 142324, "epoch": 1176} {"train_loss": -40.404541015625, "global_step": 142325, "epoch": 1176} {"train_loss": -38.55051803588867, "global_step": 142326, "epoch": 1176} {"train_loss": -40.82218551635742, "global_step": 142327, "epoch": 1176} {"train_loss": -41.045223236083984, "global_step": 142328, "epoch": 1176} {"train_loss": -41.19362258911133, "global_step": 142329, "epoch": 1176} {"train_loss": -39.57024383544922, "global_step": 142330, "epoch": 1176} {"train_loss": -39.318721771240234, "global_step": 142331, "epoch": 1176} {"train_loss": -39.48442459106445, "global_step": 142332, "epoch": 1176} {"train_loss": -39.97235107421875, "global_step": 142333, "epoch": 1176} {"train_loss": -40.35444259643555, "global_step": 142334, "epoch": 1176} {"train_loss": -39.86640930175781, "global_step": 142335, "epoch": 1176} {"train_loss": -41.14617919921875, "global_step": 142336, "epoch": 1176} {"train_loss": -40.53043746948242, "global_step": 142337, "epoch": 1176} {"train_loss": -41.24884796142578, "global_step": 142338, "epoch": 1176} {"train_loss": -41.25038528442383, "global_step": 142339, "epoch": 1176} {"train_loss": -40.40879440307617, "global_step": 142340, "epoch": 1176} {"train_loss": -40.43149948120117, "global_step": 142341, "epoch": 1176} {"train_loss": -41.24508285522461, "global_step": 142342, "epoch": 1176} {"train_loss": -41.05289840698242, "global_step": 142343, "epoch": 1176} {"train_loss": -41.15715026855469, "global_step": 142344, "epoch": 1176} {"train_loss": -41.03337097167969, "global_step": 142345, "epoch": 1176} {"train_loss": -41.708221435546875, "global_step": 142346, "epoch": 1176} {"train_loss": -41.3940544128418, "global_step": 142347, "epoch": 1176} {"train_loss": -40.807037353515625, "global_step": 142348, "epoch": 1176} {"train_loss": -40.29389953613281, "global_step": 142349, "epoch": 1176} {"train_loss": -41.189937591552734, "global_step": 142350, "epoch": 1176} {"train_loss": -40.68742752075195, "global_step": 142351, "epoch": 1176} {"train_loss": -39.417476654052734, "global_step": 142352, "epoch": 1176} {"train_loss": -41.401763916015625, "global_step": 142353, "epoch": 1176} {"train_loss": -41.20412063598633, "global_step": 142354, "epoch": 1176} {"train_loss": -41.3243293762207, "global_step": 142355, "epoch": 1176} {"train_loss": -40.528839111328125, "global_step": 142356, "epoch": 1176} {"train_loss": -40.71010208129883, "global_step": 142357, "epoch": 1176} {"train_loss": -40.639442443847656, "global_step": 142358, "epoch": 1176} {"train_loss": -40.19552230834961, "global_step": 142359, "epoch": 1176} {"train_loss": -40.38416290283203, "global_step": 142360, "epoch": 1176} {"train_loss": -39.32210922241211, "global_step": 142361, "epoch": 1176} {"train_loss": -40.81069564819336, "global_step": 142362, "epoch": 1176} {"train_loss": -38.39561462402344, "global_step": 142363, "epoch": 1176} {"train_loss": -38.3968620300293, "global_step": 142364, "epoch": 1176} {"train_loss": -40.24703598022461, "global_step": 142365, "epoch": 1176} {"train_loss": -37.67728805541992, "global_step": 142366, "epoch": 1176} {"train_loss": -40.08917236328125, "global_step": 142367, "epoch": 1176} {"train_loss": -37.78068542480469, "global_step": 142368, "epoch": 1176} {"train_loss": -40.541866302490234, "global_step": 142369, "epoch": 1176} {"train_loss": -39.605812072753906, "global_step": 142370, "epoch": 1176} {"train_loss": -40.64604568481445, "global_step": 142371, "epoch": 1176} {"train_loss": -38.42560958862305, "global_step": 142372, "epoch": 1176} {"train_loss": -39.3283576965332, "global_step": 142373, "epoch": 1176} {"train_loss": -40.20479965209961, "global_step": 142374, "epoch": 1176} {"train_loss": -40.4046745300293, "global_step": 142375, "epoch": 1176} {"train_loss": -39.106483459472656, "global_step": 142376, "epoch": 1176} {"train_loss": -40.80509948730469, "global_step": 142377, "epoch": 1176} {"train_loss": -39.84138870239258, "global_step": 142378, "epoch": 1176} {"train_loss": -40.45069122314453, "global_step": 142379, "epoch": 1176} {"train_loss": -39.590179443359375, "global_step": 142380, "epoch": 1176} {"train_loss": -39.571102142333984, "global_step": 142381, "epoch": 1176} {"train_loss": -40.8358268737793, "global_step": 142382, "epoch": 1176} {"train_loss": -40.8953971862793, "global_step": 142383, "epoch": 1176} {"train_loss": -40.59373092651367, "global_step": 142384, "epoch": 1176} {"train_loss": -40.4986572265625, "global_step": 142385, "epoch": 1176} {"train_loss": -40.5031623840332, "global_step": 142386, "epoch": 1176} {"train_loss": -41.3204345703125, "global_step": 142387, "epoch": 1176} {"train_loss": -40.472503662109375, "global_step": 142388, "epoch": 1176} {"train_loss": -40.39162063598633, "global_step": 142389, "epoch": 1176} {"train_loss": -41.10980987548828, "global_step": 142390, "epoch": 1176} {"train_loss": -39.84790802001953, "global_step": 142391, "epoch": 1176} {"train_loss": -40.02622604370117, "global_step": 142392, "epoch": 1176} {"train_loss": -40.872520446777344, "global_step": 142393, "epoch": 1176} {"train_loss": -39.381378173828125, "global_step": 142394, "epoch": 1176} {"train_loss": -39.63531494140625, "global_step": 142395, "epoch": 1176} {"train_loss": -40.73872756958008, "global_step": 142396, "epoch": 1176} {"train_loss": -39.07843780517578, "global_step": 142397, "epoch": 1176} {"train_loss": -40.29091262817383, "global_step": 142398, "epoch": 1176} {"train_loss": -39.68581771850586, "global_step": 142399, "epoch": 1176} {"train_loss": -39.94210433959961, "global_step": 142400, "epoch": 1176} {"train_loss": -40.29610061645508, "global_step": 142401, "epoch": 1176} {"train_loss": -40.5826416015625, "global_step": 142402, "epoch": 1176} {"train_loss": -40.65203094482422, "global_step": 142403, "epoch": 1176} {"train_loss": -40.224151611328125, "global_step": 142404, "epoch": 1176} {"train_loss": -41.155174255371094, "global_step": 142405, "epoch": 1176} {"train_loss": -39.958919525146484, "global_step": 142406, "epoch": 1176} {"train_loss": -40.32754135131836, "global_step": 142407, "epoch": 1176} {"train_loss": -41.09005355834961, "global_step": 142408, "epoch": 1176} {"train_loss": -41.22665023803711, "global_step": 142409, "epoch": 1176} {"train_loss": -40.884735107421875, "global_step": 142410, "epoch": 1176} {"train_loss": -41.24798583984375, "global_step": 142411, "epoch": 1176} {"train_loss": -41.05442428588867, "global_step": 142412, "epoch": 1176} {"train_loss": -40.9483757019043, "global_step": 142413, "epoch": 1176} {"train_loss": -40.56447219848633, "global_step": 142414, "epoch": 1176} {"train_loss": -40.95280075073242, "global_step": 142415, "epoch": 1176} {"train_loss": -40.45603583469864, "global_step": 142416, "epoch": 1176, "val_loss": 2668998.25} {"train_loss": -40.696022033691406, "global_step": 142417, "epoch": 1177} {"train_loss": -41.09992599487305, "global_step": 142418, "epoch": 1177} {"train_loss": -41.10544967651367, "global_step": 142419, "epoch": 1177} {"train_loss": -40.74041748046875, "global_step": 142420, "epoch": 1177} {"train_loss": -41.123897552490234, "global_step": 142421, "epoch": 1177} {"train_loss": -40.40165328979492, "global_step": 142422, "epoch": 1177} {"train_loss": -40.351924896240234, "global_step": 142423, "epoch": 1177} {"train_loss": -40.840301513671875, "global_step": 142424, "epoch": 1177} {"train_loss": -41.28846740722656, "global_step": 142425, "epoch": 1177} {"train_loss": -41.46858215332031, "global_step": 142426, "epoch": 1177} {"train_loss": -40.93488311767578, "global_step": 142427, "epoch": 1177} {"train_loss": -40.922725677490234, "global_step": 142428, "epoch": 1177} {"train_loss": -41.49198532104492, "global_step": 142429, "epoch": 1177} {"train_loss": -39.764278411865234, "global_step": 142430, "epoch": 1177} {"train_loss": -40.44837188720703, "global_step": 142431, "epoch": 1177} {"train_loss": -40.52912139892578, "global_step": 142432, "epoch": 1177} {"train_loss": -38.246337890625, "global_step": 142433, "epoch": 1177} {"train_loss": -36.880889892578125, "global_step": 142434, "epoch": 1177} {"train_loss": -39.2789421081543, "global_step": 142435, "epoch": 1177} {"train_loss": -33.60750198364258, "global_step": 142436, "epoch": 1177} {"train_loss": -24.520265579223633, "global_step": 142437, "epoch": 1177} {"train_loss": -28.674148559570312, "global_step": 142438, "epoch": 1177} {"train_loss": -33.630279541015625, "global_step": 142439, "epoch": 1177} {"train_loss": -32.60691452026367, "global_step": 142440, "epoch": 1177} {"train_loss": -31.07893943786621, "global_step": 142441, "epoch": 1177} {"train_loss": -33.74021530151367, "global_step": 142442, "epoch": 1177} {"train_loss": -32.29902267456055, "global_step": 142443, "epoch": 1177} {"train_loss": -33.10078811645508, "global_step": 142444, "epoch": 1177} {"train_loss": -34.3261833190918, "global_step": 142445, "epoch": 1177} {"train_loss": -33.15985870361328, "global_step": 142446, "epoch": 1177} {"train_loss": -33.872406005859375, "global_step": 142447, "epoch": 1177} {"train_loss": -34.70167922973633, "global_step": 142448, "epoch": 1177} {"train_loss": -33.058528900146484, "global_step": 142449, "epoch": 1177} {"train_loss": -35.287109375, "global_step": 142450, "epoch": 1177} {"train_loss": -34.96168899536133, "global_step": 142451, "epoch": 1177} {"train_loss": -34.29458236694336, "global_step": 142452, "epoch": 1177} {"train_loss": -34.491058349609375, "global_step": 142453, "epoch": 1177} {"train_loss": -35.77791213989258, "global_step": 142454, "epoch": 1177} {"train_loss": -34.716400146484375, "global_step": 142455, "epoch": 1177} {"train_loss": -35.54816818237305, "global_step": 142456, "epoch": 1177} {"train_loss": -35.91572189331055, "global_step": 142457, "epoch": 1177} {"train_loss": -35.36636734008789, "global_step": 142458, "epoch": 1177} {"train_loss": -35.90520477294922, "global_step": 142459, "epoch": 1177} {"train_loss": -35.86375045776367, "global_step": 142460, "epoch": 1177} {"train_loss": -36.40537643432617, "global_step": 142461, "epoch": 1177} {"train_loss": -36.96322250366211, "global_step": 142462, "epoch": 1177} {"train_loss": -35.65766906738281, "global_step": 142463, "epoch": 1177} {"train_loss": -35.06626892089844, "global_step": 142464, "epoch": 1177} {"train_loss": -33.91192626953125, "global_step": 142465, "epoch": 1177} {"train_loss": -32.18721008300781, "global_step": 142466, "epoch": 1177} {"train_loss": -35.114742279052734, "global_step": 142467, "epoch": 1177} {"train_loss": -36.15491485595703, "global_step": 142468, "epoch": 1177} {"train_loss": -33.52423858642578, "global_step": 142469, "epoch": 1177} {"train_loss": -36.448360443115234, "global_step": 142470, "epoch": 1177} {"train_loss": -35.8315544128418, "global_step": 142471, "epoch": 1177} {"train_loss": -35.41081619262695, "global_step": 142472, "epoch": 1177} {"train_loss": -37.15869903564453, "global_step": 142473, "epoch": 1177} {"train_loss": -35.68743896484375, "global_step": 142474, "epoch": 1177} {"train_loss": -37.486263275146484, "global_step": 142475, "epoch": 1177} {"train_loss": -35.90227127075195, "global_step": 142476, "epoch": 1177} {"train_loss": -36.56837463378906, "global_step": 142477, "epoch": 1177} {"train_loss": -36.19485855102539, "global_step": 142478, "epoch": 1177} {"train_loss": -36.690433502197266, "global_step": 142479, "epoch": 1177} {"train_loss": -36.76709747314453, "global_step": 142480, "epoch": 1177} {"train_loss": -36.00360107421875, "global_step": 142481, "epoch": 1177} {"train_loss": -35.94533157348633, "global_step": 142482, "epoch": 1177} {"train_loss": -37.044952392578125, "global_step": 142483, "epoch": 1177} {"train_loss": -37.12522506713867, "global_step": 142484, "epoch": 1177} {"train_loss": -36.81494903564453, "global_step": 142485, "epoch": 1177} {"train_loss": -37.34366989135742, "global_step": 142486, "epoch": 1177} {"train_loss": -36.99176025390625, "global_step": 142487, "epoch": 1177} {"train_loss": -37.35064697265625, "global_step": 142488, "epoch": 1177} {"train_loss": -37.14578628540039, "global_step": 142489, "epoch": 1177} {"train_loss": -37.23849105834961, "global_step": 142490, "epoch": 1177} {"train_loss": -37.24446105957031, "global_step": 142491, "epoch": 1177} {"train_loss": -37.17168426513672, "global_step": 142492, "epoch": 1177} {"train_loss": -37.68148422241211, "global_step": 142493, "epoch": 1177} {"train_loss": -37.07150650024414, "global_step": 142494, "epoch": 1177} {"train_loss": -37.442996978759766, "global_step": 142495, "epoch": 1177} {"train_loss": -37.93735885620117, "global_step": 142496, "epoch": 1177} {"train_loss": -37.76904296875, "global_step": 142497, "epoch": 1177} {"train_loss": -38.16447067260742, "global_step": 142498, "epoch": 1177} {"train_loss": -36.39404296875, "global_step": 142499, "epoch": 1177} {"train_loss": -37.60329055786133, "global_step": 142500, "epoch": 1177} {"train_loss": -37.5002555847168, "global_step": 142501, "epoch": 1177} {"train_loss": -37.71089553833008, "global_step": 142502, "epoch": 1177} {"train_loss": -37.082740783691406, "global_step": 142503, "epoch": 1177} {"train_loss": -34.886444091796875, "global_step": 142504, "epoch": 1177} {"train_loss": -36.616661071777344, "global_step": 142505, "epoch": 1177} {"train_loss": -35.43265914916992, "global_step": 142506, "epoch": 1177} {"train_loss": -35.39588928222656, "global_step": 142507, "epoch": 1177} {"train_loss": -37.46421432495117, "global_step": 142508, "epoch": 1177} {"train_loss": -37.3369255065918, "global_step": 142509, "epoch": 1177} {"train_loss": -37.27399444580078, "global_step": 142510, "epoch": 1177} {"train_loss": -37.464210510253906, "global_step": 142511, "epoch": 1177} {"train_loss": -34.21188735961914, "global_step": 142512, "epoch": 1177} {"train_loss": -35.89023971557617, "global_step": 142513, "epoch": 1177} {"train_loss": -37.67855453491211, "global_step": 142514, "epoch": 1177} {"train_loss": -36.0510368347168, "global_step": 142515, "epoch": 1177} {"train_loss": -36.548336029052734, "global_step": 142516, "epoch": 1177} {"train_loss": -36.169734954833984, "global_step": 142517, "epoch": 1177} {"train_loss": -36.14606857299805, "global_step": 142518, "epoch": 1177} {"train_loss": -35.66053009033203, "global_step": 142519, "epoch": 1177} {"train_loss": -35.77782440185547, "global_step": 142520, "epoch": 1177} {"train_loss": -33.888084411621094, "global_step": 142521, "epoch": 1177} {"train_loss": -34.26458740234375, "global_step": 142522, "epoch": 1177} {"train_loss": -36.52862548828125, "global_step": 142523, "epoch": 1177} {"train_loss": -37.00231170654297, "global_step": 142524, "epoch": 1177} {"train_loss": -35.559322357177734, "global_step": 142525, "epoch": 1177} {"train_loss": -36.192989349365234, "global_step": 142526, "epoch": 1177} {"train_loss": -36.46092987060547, "global_step": 142527, "epoch": 1177} {"train_loss": -36.46949005126953, "global_step": 142528, "epoch": 1177} {"train_loss": -37.191768646240234, "global_step": 142529, "epoch": 1177} {"train_loss": -34.36433029174805, "global_step": 142530, "epoch": 1177} {"train_loss": -36.363494873046875, "global_step": 142531, "epoch": 1177} {"train_loss": -36.27597427368164, "global_step": 142532, "epoch": 1177} {"train_loss": -37.738983154296875, "global_step": 142533, "epoch": 1177} {"train_loss": -37.53668212890625, "global_step": 142534, "epoch": 1177} {"train_loss": -32.98203659057617, "global_step": 142535, "epoch": 1177} {"train_loss": -37.173561096191406, "global_step": 142536, "epoch": 1177} {"train_loss": -36.42554442350529, "global_step": 142537, "epoch": 1177, "val_loss": 2801319.0} {"train_loss": -37.465850830078125, "global_step": 142538, "epoch": 1178} {"train_loss": -35.937252044677734, "global_step": 142539, "epoch": 1178} {"train_loss": -37.035953521728516, "global_step": 142540, "epoch": 1178} {"train_loss": -35.75494384765625, "global_step": 142541, "epoch": 1178} {"train_loss": -35.07166290283203, "global_step": 142542, "epoch": 1178} {"train_loss": -35.27567672729492, "global_step": 142543, "epoch": 1178} {"train_loss": -35.495487213134766, "global_step": 142544, "epoch": 1178} {"train_loss": -34.636436462402344, "global_step": 142545, "epoch": 1178} {"train_loss": -28.212121963500977, "global_step": 142546, "epoch": 1178} {"train_loss": -34.58944320678711, "global_step": 142547, "epoch": 1178} {"train_loss": -33.87441635131836, "global_step": 142548, "epoch": 1178} {"train_loss": -34.57149124145508, "global_step": 142549, "epoch": 1178} {"train_loss": -34.96857452392578, "global_step": 142550, "epoch": 1178} {"train_loss": -35.633758544921875, "global_step": 142551, "epoch": 1178} {"train_loss": -32.41591262817383, "global_step": 142552, "epoch": 1178} {"train_loss": -35.1452751159668, "global_step": 142553, "epoch": 1178} {"train_loss": -35.97036361694336, "global_step": 142554, "epoch": 1178} {"train_loss": -35.7220344543457, "global_step": 142555, "epoch": 1178} {"train_loss": -36.11581039428711, "global_step": 142556, "epoch": 1178} {"train_loss": -35.84846496582031, "global_step": 142557, "epoch": 1178} {"train_loss": -35.8062858581543, "global_step": 142558, "epoch": 1178} {"train_loss": -36.10018539428711, "global_step": 142559, "epoch": 1178} {"train_loss": -34.0789794921875, "global_step": 142560, "epoch": 1178} {"train_loss": -35.2619514465332, "global_step": 142561, "epoch": 1178} {"train_loss": -35.79203414916992, "global_step": 142562, "epoch": 1178} {"train_loss": -33.63539123535156, "global_step": 142563, "epoch": 1178} {"train_loss": -37.344112396240234, "global_step": 142564, "epoch": 1178} {"train_loss": -32.744537353515625, "global_step": 142565, "epoch": 1178} {"train_loss": -36.1307487487793, "global_step": 142566, "epoch": 1178} {"train_loss": -35.33980941772461, "global_step": 142567, "epoch": 1178} {"train_loss": -36.638160705566406, "global_step": 142568, "epoch": 1178} {"train_loss": -36.09273147583008, "global_step": 142569, "epoch": 1178} {"train_loss": -35.88588333129883, "global_step": 142570, "epoch": 1178} {"train_loss": -36.49532699584961, "global_step": 142571, "epoch": 1178} {"train_loss": -36.7570915222168, "global_step": 142572, "epoch": 1178} {"train_loss": -34.844635009765625, "global_step": 142573, "epoch": 1178} {"train_loss": -35.52785110473633, "global_step": 142574, "epoch": 1178} {"train_loss": -37.273895263671875, "global_step": 142575, "epoch": 1178} {"train_loss": -36.46465301513672, "global_step": 142576, "epoch": 1178} {"train_loss": -37.04506301879883, "global_step": 142577, "epoch": 1178} {"train_loss": -36.1666374206543, "global_step": 142578, "epoch": 1178} {"train_loss": -37.40189743041992, "global_step": 142579, "epoch": 1178} {"train_loss": -35.92708206176758, "global_step": 142580, "epoch": 1178} {"train_loss": -37.355140686035156, "global_step": 142581, "epoch": 1178} {"train_loss": -36.93020248413086, "global_step": 142582, "epoch": 1178} {"train_loss": -37.005775451660156, "global_step": 142583, "epoch": 1178} {"train_loss": -36.03245162963867, "global_step": 142584, "epoch": 1178} {"train_loss": -34.74065399169922, "global_step": 142585, "epoch": 1178} {"train_loss": -36.16901397705078, "global_step": 142586, "epoch": 1178} {"train_loss": -36.92018127441406, "global_step": 142587, "epoch": 1178} {"train_loss": -36.99794387817383, "global_step": 142588, "epoch": 1178} {"train_loss": -37.683631896972656, "global_step": 142589, "epoch": 1178} {"train_loss": -37.55537796020508, "global_step": 142590, "epoch": 1178} {"train_loss": -37.72499465942383, "global_step": 142591, "epoch": 1178} {"train_loss": -36.204864501953125, "global_step": 142592, "epoch": 1178} {"train_loss": -37.959163665771484, "global_step": 142593, "epoch": 1178} {"train_loss": -37.69099044799805, "global_step": 142594, "epoch": 1178} {"train_loss": -38.12452697753906, "global_step": 142595, "epoch": 1178} {"train_loss": -37.39326095581055, "global_step": 142596, "epoch": 1178} {"train_loss": -37.60209655761719, "global_step": 142597, "epoch": 1178} {"train_loss": -37.89361572265625, "global_step": 142598, "epoch": 1178} {"train_loss": -37.906612396240234, "global_step": 142599, "epoch": 1178} {"train_loss": -37.092872619628906, "global_step": 142600, "epoch": 1178} {"train_loss": -37.37687683105469, "global_step": 142601, "epoch": 1178} {"train_loss": -37.34021759033203, "global_step": 142602, "epoch": 1178} {"train_loss": -37.894649505615234, "global_step": 142603, "epoch": 1178} {"train_loss": -37.64996337890625, "global_step": 142604, "epoch": 1178} {"train_loss": -37.93271255493164, "global_step": 142605, "epoch": 1178} {"train_loss": -36.91053771972656, "global_step": 142606, "epoch": 1178} {"train_loss": -38.594966888427734, "global_step": 142607, "epoch": 1178} {"train_loss": -35.718299865722656, "global_step": 142608, "epoch": 1178} {"train_loss": -38.5797119140625, "global_step": 142609, "epoch": 1178} {"train_loss": -38.1698112487793, "global_step": 142610, "epoch": 1178} {"train_loss": -37.88067626953125, "global_step": 142611, "epoch": 1178} {"train_loss": -37.91017532348633, "global_step": 142612, "epoch": 1178} {"train_loss": -38.357826232910156, "global_step": 142613, "epoch": 1178} {"train_loss": -37.47593307495117, "global_step": 142614, "epoch": 1178} {"train_loss": -36.80575180053711, "global_step": 142615, "epoch": 1178} {"train_loss": -36.534236907958984, "global_step": 142616, "epoch": 1178} {"train_loss": -35.66383743286133, "global_step": 142617, "epoch": 1178} {"train_loss": -35.52164840698242, "global_step": 142618, "epoch": 1178} {"train_loss": -38.27715301513672, "global_step": 142619, "epoch": 1178} {"train_loss": -36.829158782958984, "global_step": 142620, "epoch": 1178} {"train_loss": -37.3217887878418, "global_step": 142621, "epoch": 1178} {"train_loss": -36.62348175048828, "global_step": 142622, "epoch": 1178} {"train_loss": -37.631980895996094, "global_step": 142623, "epoch": 1178} {"train_loss": -36.98411560058594, "global_step": 142624, "epoch": 1178} {"train_loss": -38.444732666015625, "global_step": 142625, "epoch": 1178} {"train_loss": -37.5058708190918, "global_step": 142626, "epoch": 1178} {"train_loss": -38.26481628417969, "global_step": 142627, "epoch": 1178} {"train_loss": -38.10600662231445, "global_step": 142628, "epoch": 1178} {"train_loss": -38.04054641723633, "global_step": 142629, "epoch": 1178} {"train_loss": -37.60237503051758, "global_step": 142630, "epoch": 1178} {"train_loss": -38.177940368652344, "global_step": 142631, "epoch": 1178} {"train_loss": -38.23008346557617, "global_step": 142632, "epoch": 1178} {"train_loss": -37.501094818115234, "global_step": 142633, "epoch": 1178} {"train_loss": -37.23662567138672, "global_step": 142634, "epoch": 1178} {"train_loss": -37.61725616455078, "global_step": 142635, "epoch": 1178} {"train_loss": -36.75221633911133, "global_step": 142636, "epoch": 1178} {"train_loss": -37.63096237182617, "global_step": 142637, "epoch": 1178} {"train_loss": -38.6395263671875, "global_step": 142638, "epoch": 1178} {"train_loss": -37.98727798461914, "global_step": 142639, "epoch": 1178} {"train_loss": -37.142452239990234, "global_step": 142640, "epoch": 1178} {"train_loss": -38.593544006347656, "global_step": 142641, "epoch": 1178} {"train_loss": -38.21476364135742, "global_step": 142642, "epoch": 1178} {"train_loss": -37.49353790283203, "global_step": 142643, "epoch": 1178} {"train_loss": -38.39896774291992, "global_step": 142644, "epoch": 1178} {"train_loss": -38.59025192260742, "global_step": 142645, "epoch": 1178} {"train_loss": -35.198036193847656, "global_step": 142646, "epoch": 1178} {"train_loss": -38.27163314819336, "global_step": 142647, "epoch": 1178} {"train_loss": -38.4649772644043, "global_step": 142648, "epoch": 1178} {"train_loss": -38.082393646240234, "global_step": 142649, "epoch": 1178} {"train_loss": -38.9306755065918, "global_step": 142650, "epoch": 1178} {"train_loss": -38.50399398803711, "global_step": 142651, "epoch": 1178} {"train_loss": -38.00836944580078, "global_step": 142652, "epoch": 1178} {"train_loss": -37.56635284423828, "global_step": 142653, "epoch": 1178} {"train_loss": -38.21088409423828, "global_step": 142654, "epoch": 1178} {"train_loss": -38.399593353271484, "global_step": 142655, "epoch": 1178} {"train_loss": -38.31508255004883, "global_step": 142656, "epoch": 1178} {"train_loss": -37.6679801940918, "global_step": 142657, "epoch": 1178} {"train_loss": -36.80869950538825, "global_step": 142658, "epoch": 1178, "val_loss": 2550230.25} {"train_loss": -38.032958984375, "global_step": 142659, "epoch": 1179} {"train_loss": -38.288753509521484, "global_step": 142660, "epoch": 1179} {"train_loss": -39.268856048583984, "global_step": 142661, "epoch": 1179} {"train_loss": -37.961280822753906, "global_step": 142662, "epoch": 1179} {"train_loss": -38.41817855834961, "global_step": 142663, "epoch": 1179} {"train_loss": -38.801971435546875, "global_step": 142664, "epoch": 1179} {"train_loss": -36.53498458862305, "global_step": 142665, "epoch": 1179} {"train_loss": -38.58186340332031, "global_step": 142666, "epoch": 1179} {"train_loss": -38.93980407714844, "global_step": 142667, "epoch": 1179} {"train_loss": -38.954559326171875, "global_step": 142668, "epoch": 1179} {"train_loss": -38.39382553100586, "global_step": 142669, "epoch": 1179} {"train_loss": -38.10445785522461, "global_step": 142670, "epoch": 1179} {"train_loss": -38.443782806396484, "global_step": 142671, "epoch": 1179} {"train_loss": -38.14738845825195, "global_step": 142672, "epoch": 1179} {"train_loss": -38.99795150756836, "global_step": 142673, "epoch": 1179} {"train_loss": -38.41026306152344, "global_step": 142674, "epoch": 1179} {"train_loss": -37.85943603515625, "global_step": 142675, "epoch": 1179} {"train_loss": -38.759521484375, "global_step": 142676, "epoch": 1179} {"train_loss": -38.14149475097656, "global_step": 142677, "epoch": 1179} {"train_loss": -37.95856475830078, "global_step": 142678, "epoch": 1179} {"train_loss": -39.375396728515625, "global_step": 142679, "epoch": 1179} {"train_loss": -38.28184127807617, "global_step": 142680, "epoch": 1179} {"train_loss": -38.28681564331055, "global_step": 142681, "epoch": 1179} {"train_loss": -38.691375732421875, "global_step": 142682, "epoch": 1179} {"train_loss": -38.635650634765625, "global_step": 142683, "epoch": 1179} {"train_loss": -38.74230194091797, "global_step": 142684, "epoch": 1179} {"train_loss": -37.74979782104492, "global_step": 142685, "epoch": 1179} {"train_loss": -38.395179748535156, "global_step": 142686, "epoch": 1179} {"train_loss": -38.57455062866211, "global_step": 142687, "epoch": 1179} {"train_loss": -39.20952224731445, "global_step": 142688, "epoch": 1179} {"train_loss": -38.554378509521484, "global_step": 142689, "epoch": 1179} {"train_loss": -39.68372344970703, "global_step": 142690, "epoch": 1179} {"train_loss": -39.003822326660156, "global_step": 142691, "epoch": 1179} {"train_loss": -39.7362060546875, "global_step": 142692, "epoch": 1179} {"train_loss": -39.10060501098633, "global_step": 142693, "epoch": 1179} {"train_loss": -38.98616409301758, "global_step": 142694, "epoch": 1179} {"train_loss": -38.9903564453125, "global_step": 142695, "epoch": 1179} {"train_loss": -37.297706604003906, "global_step": 142696, "epoch": 1179} {"train_loss": -39.19977951049805, "global_step": 142697, "epoch": 1179} {"train_loss": -38.12960433959961, "global_step": 142698, "epoch": 1179} {"train_loss": -37.334197998046875, "global_step": 142699, "epoch": 1179} {"train_loss": -39.07070541381836, "global_step": 142700, "epoch": 1179} {"train_loss": -39.180633544921875, "global_step": 142701, "epoch": 1179} {"train_loss": -38.003658294677734, "global_step": 142702, "epoch": 1179} {"train_loss": -38.6569709777832, "global_step": 142703, "epoch": 1179} {"train_loss": -37.346553802490234, "global_step": 142704, "epoch": 1179} {"train_loss": -37.891441345214844, "global_step": 142705, "epoch": 1179} {"train_loss": -37.84769821166992, "global_step": 142706, "epoch": 1179} {"train_loss": -39.21931076049805, "global_step": 142707, "epoch": 1179} {"train_loss": -38.789222717285156, "global_step": 142708, "epoch": 1179} {"train_loss": -38.47267150878906, "global_step": 142709, "epoch": 1179} {"train_loss": -39.07794952392578, "global_step": 142710, "epoch": 1179} {"train_loss": -39.04258346557617, "global_step": 142711, "epoch": 1179} {"train_loss": -38.324241638183594, "global_step": 142712, "epoch": 1179} {"train_loss": -36.208980560302734, "global_step": 142713, "epoch": 1179} {"train_loss": -32.78080368041992, "global_step": 142714, "epoch": 1179} {"train_loss": -26.908578872680664, "global_step": 142715, "epoch": 1179} {"train_loss": -31.536279678344727, "global_step": 142716, "epoch": 1179} {"train_loss": -37.70427703857422, "global_step": 142717, "epoch": 1179} {"train_loss": -32.89670181274414, "global_step": 142718, "epoch": 1179} {"train_loss": -37.439456939697266, "global_step": 142719, "epoch": 1179} {"train_loss": -32.048885345458984, "global_step": 142720, "epoch": 1179} {"train_loss": -37.45583724975586, "global_step": 142721, "epoch": 1179} {"train_loss": -33.0435905456543, "global_step": 142722, "epoch": 1179} {"train_loss": -38.07767105102539, "global_step": 142723, "epoch": 1179} {"train_loss": -35.024993896484375, "global_step": 142724, "epoch": 1179} {"train_loss": -36.94801330566406, "global_step": 142725, "epoch": 1179} {"train_loss": -33.71156311035156, "global_step": 142726, "epoch": 1179} {"train_loss": -38.16164779663086, "global_step": 142727, "epoch": 1179} {"train_loss": -36.65766906738281, "global_step": 142728, "epoch": 1179} {"train_loss": -36.83659362792969, "global_step": 142729, "epoch": 1179} {"train_loss": -37.74772262573242, "global_step": 142730, "epoch": 1179} {"train_loss": -36.239959716796875, "global_step": 142731, "epoch": 1179} {"train_loss": -37.2537727355957, "global_step": 142732, "epoch": 1179} {"train_loss": -36.8741340637207, "global_step": 142733, "epoch": 1179} {"train_loss": -37.0846061706543, "global_step": 142734, "epoch": 1179} {"train_loss": -38.02827072143555, "global_step": 142735, "epoch": 1179} {"train_loss": -35.74689483642578, "global_step": 142736, "epoch": 1179} {"train_loss": -36.38772201538086, "global_step": 142737, "epoch": 1179} {"train_loss": -32.003597259521484, "global_step": 142738, "epoch": 1179} {"train_loss": -36.85462188720703, "global_step": 142739, "epoch": 1179} {"train_loss": -37.77456283569336, "global_step": 142740, "epoch": 1179} {"train_loss": -38.01176834106445, "global_step": 142741, "epoch": 1179} {"train_loss": -37.450897216796875, "global_step": 142742, "epoch": 1179} {"train_loss": -37.334510803222656, "global_step": 142743, "epoch": 1179} {"train_loss": -37.2830696105957, "global_step": 142744, "epoch": 1179} {"train_loss": -34.83965301513672, "global_step": 142745, "epoch": 1179} {"train_loss": -38.684078216552734, "global_step": 142746, "epoch": 1179} {"train_loss": -37.8255615234375, "global_step": 142747, "epoch": 1179} {"train_loss": -38.28160858154297, "global_step": 142748, "epoch": 1179} {"train_loss": -38.61890411376953, "global_step": 142749, "epoch": 1179} {"train_loss": -37.39274978637695, "global_step": 142750, "epoch": 1179} {"train_loss": -37.56709289550781, "global_step": 142751, "epoch": 1179} {"train_loss": -37.95667266845703, "global_step": 142752, "epoch": 1179} {"train_loss": -37.971378326416016, "global_step": 142753, "epoch": 1179} {"train_loss": -36.43207931518555, "global_step": 142754, "epoch": 1179} {"train_loss": -37.8140983581543, "global_step": 142755, "epoch": 1179} {"train_loss": -38.46550369262695, "global_step": 142756, "epoch": 1179} {"train_loss": -37.865779876708984, "global_step": 142757, "epoch": 1179} {"train_loss": -37.92434310913086, "global_step": 142758, "epoch": 1179} {"train_loss": -36.575775146484375, "global_step": 142759, "epoch": 1179} {"train_loss": -33.63397216796875, "global_step": 142760, "epoch": 1179} {"train_loss": -37.29370880126953, "global_step": 142761, "epoch": 1179} {"train_loss": -38.19025802612305, "global_step": 142762, "epoch": 1179} {"train_loss": -36.74599075317383, "global_step": 142763, "epoch": 1179} {"train_loss": -35.74658966064453, "global_step": 142764, "epoch": 1179} {"train_loss": -36.518455505371094, "global_step": 142765, "epoch": 1179} {"train_loss": -34.8856086730957, "global_step": 142766, "epoch": 1179} {"train_loss": -35.1070671081543, "global_step": 142767, "epoch": 1179} {"train_loss": -36.99689865112305, "global_step": 142768, "epoch": 1179} {"train_loss": -37.9822883605957, "global_step": 142769, "epoch": 1179} {"train_loss": -36.38398742675781, "global_step": 142770, "epoch": 1179} {"train_loss": -33.26370620727539, "global_step": 142771, "epoch": 1179} {"train_loss": -36.93894577026367, "global_step": 142772, "epoch": 1179} {"train_loss": -34.920684814453125, "global_step": 142773, "epoch": 1179} {"train_loss": -36.699806213378906, "global_step": 142774, "epoch": 1179} {"train_loss": -37.729957580566406, "global_step": 142775, "epoch": 1179} {"train_loss": -37.79299545288086, "global_step": 142776, "epoch": 1179} {"train_loss": -35.96186447143555, "global_step": 142777, "epoch": 1179} {"train_loss": -35.712310791015625, "global_step": 142778, "epoch": 1179} {"train_loss": -37.32115362498386, "global_step": 142779, "epoch": 1179, "val_loss": 2669982.25} {"train_loss": -37.51923751831055, "global_step": 142780, "epoch": 1180} {"train_loss": -37.042030334472656, "global_step": 142781, "epoch": 1180} {"train_loss": -34.763893127441406, "global_step": 142782, "epoch": 1180} {"train_loss": -36.54977035522461, "global_step": 142783, "epoch": 1180} {"train_loss": -37.926361083984375, "global_step": 142784, "epoch": 1180} {"train_loss": -38.163848876953125, "global_step": 142785, "epoch": 1180} {"train_loss": -36.8752555847168, "global_step": 142786, "epoch": 1180} {"train_loss": -38.488948822021484, "global_step": 142787, "epoch": 1180} {"train_loss": -38.21347427368164, "global_step": 142788, "epoch": 1180} {"train_loss": -38.67753219604492, "global_step": 142789, "epoch": 1180} {"train_loss": -37.080650329589844, "global_step": 142790, "epoch": 1180} {"train_loss": -36.7478141784668, "global_step": 142791, "epoch": 1180} {"train_loss": -37.107032775878906, "global_step": 142792, "epoch": 1180} {"train_loss": -37.83382034301758, "global_step": 142793, "epoch": 1180} {"train_loss": -38.486328125, "global_step": 142794, "epoch": 1180} {"train_loss": -37.94584274291992, "global_step": 142795, "epoch": 1180} {"train_loss": -37.49154281616211, "global_step": 142796, "epoch": 1180} {"train_loss": -37.94253158569336, "global_step": 142797, "epoch": 1180} {"train_loss": -37.71215057373047, "global_step": 142798, "epoch": 1180} {"train_loss": -37.71147537231445, "global_step": 142799, "epoch": 1180} {"train_loss": -38.4073371887207, "global_step": 142800, "epoch": 1180} {"train_loss": -38.33613204956055, "global_step": 142801, "epoch": 1180} {"train_loss": -38.38533020019531, "global_step": 142802, "epoch": 1180} {"train_loss": -38.11492156982422, "global_step": 142803, "epoch": 1180} {"train_loss": -38.23079299926758, "global_step": 142804, "epoch": 1180} {"train_loss": -38.61419677734375, "global_step": 142805, "epoch": 1180} {"train_loss": -39.29155731201172, "global_step": 142806, "epoch": 1180} {"train_loss": -38.392356872558594, "global_step": 142807, "epoch": 1180} {"train_loss": -38.34200668334961, "global_step": 142808, "epoch": 1180} {"train_loss": -38.923091888427734, "global_step": 142809, "epoch": 1180} {"train_loss": -38.73786544799805, "global_step": 142810, "epoch": 1180} {"train_loss": -39.22315216064453, "global_step": 142811, "epoch": 1180} {"train_loss": -38.81562042236328, "global_step": 142812, "epoch": 1180} {"train_loss": -38.635704040527344, "global_step": 142813, "epoch": 1180} {"train_loss": -38.79511642456055, "global_step": 142814, "epoch": 1180} {"train_loss": -39.09823226928711, "global_step": 142815, "epoch": 1180} {"train_loss": -38.535274505615234, "global_step": 142816, "epoch": 1180} {"train_loss": -38.65060043334961, "global_step": 142817, "epoch": 1180} {"train_loss": -38.50375747680664, "global_step": 142818, "epoch": 1180} {"train_loss": -39.27006149291992, "global_step": 142819, "epoch": 1180} {"train_loss": -39.23316955566406, "global_step": 142820, "epoch": 1180} {"train_loss": -39.34339904785156, "global_step": 142821, "epoch": 1180} {"train_loss": -39.56509017944336, "global_step": 142822, "epoch": 1180} {"train_loss": -38.762855529785156, "global_step": 142823, "epoch": 1180} {"train_loss": -39.42610549926758, "global_step": 142824, "epoch": 1180} {"train_loss": -38.79024124145508, "global_step": 142825, "epoch": 1180} {"train_loss": -38.880558013916016, "global_step": 142826, "epoch": 1180} {"train_loss": -39.41196823120117, "global_step": 142827, "epoch": 1180} {"train_loss": -39.62947463989258, "global_step": 142828, "epoch": 1180} {"train_loss": -38.7814826965332, "global_step": 142829, "epoch": 1180} {"train_loss": -38.45990753173828, "global_step": 142830, "epoch": 1180} {"train_loss": -38.3040657043457, "global_step": 142831, "epoch": 1180} {"train_loss": -39.003082275390625, "global_step": 142832, "epoch": 1180} {"train_loss": -39.19971466064453, "global_step": 142833, "epoch": 1180} {"train_loss": -39.23287582397461, "global_step": 142834, "epoch": 1180} {"train_loss": -38.70896530151367, "global_step": 142835, "epoch": 1180} {"train_loss": -37.60918426513672, "global_step": 142836, "epoch": 1180} {"train_loss": -38.411441802978516, "global_step": 142837, "epoch": 1180} {"train_loss": -36.96534729003906, "global_step": 142838, "epoch": 1180} {"train_loss": -31.015731811523438, "global_step": 142839, "epoch": 1180} {"train_loss": -17.094751358032227, "global_step": 142840, "epoch": 1180} {"train_loss": -22.42469596862793, "global_step": 142841, "epoch": 1180} {"train_loss": -38.56768798828125, "global_step": 142842, "epoch": 1180} {"train_loss": -22.21750831604004, "global_step": 142843, "epoch": 1180} {"train_loss": -35.00411605834961, "global_step": 142844, "epoch": 1180} {"train_loss": -34.607479095458984, "global_step": 142845, "epoch": 1180} {"train_loss": -35.770137786865234, "global_step": 142846, "epoch": 1180} {"train_loss": -34.788692474365234, "global_step": 142847, "epoch": 1180} {"train_loss": -35.32368469238281, "global_step": 142848, "epoch": 1180} {"train_loss": -35.7343635559082, "global_step": 142849, "epoch": 1180} {"train_loss": -36.48393249511719, "global_step": 142850, "epoch": 1180} {"train_loss": -36.15304183959961, "global_step": 142851, "epoch": 1180} {"train_loss": -37.44942092895508, "global_step": 142852, "epoch": 1180} {"train_loss": -36.85476303100586, "global_step": 142853, "epoch": 1180} {"train_loss": -37.679847717285156, "global_step": 142854, "epoch": 1180} {"train_loss": -37.90140914916992, "global_step": 142855, "epoch": 1180} {"train_loss": -37.14812088012695, "global_step": 142856, "epoch": 1180} {"train_loss": -38.0762939453125, "global_step": 142857, "epoch": 1180} {"train_loss": -38.15347671508789, "global_step": 142858, "epoch": 1180} {"train_loss": -38.64304733276367, "global_step": 142859, "epoch": 1180} {"train_loss": -37.906986236572266, "global_step": 142860, "epoch": 1180} {"train_loss": -38.19208908081055, "global_step": 142861, "epoch": 1180} {"train_loss": -38.17803955078125, "global_step": 142862, "epoch": 1180} {"train_loss": -38.11798095703125, "global_step": 142863, "epoch": 1180} {"train_loss": -38.964149475097656, "global_step": 142864, "epoch": 1180} {"train_loss": -39.00265121459961, "global_step": 142865, "epoch": 1180} {"train_loss": -38.496212005615234, "global_step": 142866, "epoch": 1180} {"train_loss": -39.2514762878418, "global_step": 142867, "epoch": 1180} {"train_loss": -39.05813217163086, "global_step": 142868, "epoch": 1180} {"train_loss": -38.83062744140625, "global_step": 142869, "epoch": 1180} {"train_loss": -39.655635833740234, "global_step": 142870, "epoch": 1180} {"train_loss": -38.02546310424805, "global_step": 142871, "epoch": 1180} {"train_loss": -39.3468017578125, "global_step": 142872, "epoch": 1180} {"train_loss": -39.57033157348633, "global_step": 142873, "epoch": 1180} {"train_loss": -39.1478271484375, "global_step": 142874, "epoch": 1180} {"train_loss": -39.0555305480957, "global_step": 142875, "epoch": 1180} {"train_loss": -39.438175201416016, "global_step": 142876, "epoch": 1180} {"train_loss": -39.59651565551758, "global_step": 142877, "epoch": 1180} {"train_loss": -39.0897102355957, "global_step": 142878, "epoch": 1180} {"train_loss": -39.65079879760742, "global_step": 142879, "epoch": 1180} {"train_loss": -39.300270080566406, "global_step": 142880, "epoch": 1180} {"train_loss": -39.72357177734375, "global_step": 142881, "epoch": 1180} {"train_loss": -39.60061264038086, "global_step": 142882, "epoch": 1180} {"train_loss": -39.102813720703125, "global_step": 142883, "epoch": 1180} {"train_loss": -39.517242431640625, "global_step": 142884, "epoch": 1180} {"train_loss": -39.31794738769531, "global_step": 142885, "epoch": 1180} {"train_loss": -39.76039505004883, "global_step": 142886, "epoch": 1180} {"train_loss": -39.17594528198242, "global_step": 142887, "epoch": 1180} {"train_loss": -39.614837646484375, "global_step": 142888, "epoch": 1180} {"train_loss": -39.36545944213867, "global_step": 142889, "epoch": 1180} {"train_loss": -39.44694137573242, "global_step": 142890, "epoch": 1180} {"train_loss": -39.77288818359375, "global_step": 142891, "epoch": 1180} {"train_loss": -40.01607894897461, "global_step": 142892, "epoch": 1180} {"train_loss": -39.8494873046875, "global_step": 142893, "epoch": 1180} {"train_loss": -39.622474670410156, "global_step": 142894, "epoch": 1180} {"train_loss": -39.56327438354492, "global_step": 142895, "epoch": 1180} {"train_loss": -39.998287200927734, "global_step": 142896, "epoch": 1180} {"train_loss": -39.839759826660156, "global_step": 142897, "epoch": 1180} {"train_loss": -40.21519088745117, "global_step": 142898, "epoch": 1180} {"train_loss": -40.35491180419922, "global_step": 142899, "epoch": 1180} {"train_loss": -37.934219785958284, "global_step": 142900, "epoch": 1180, "val_loss": 2641751.75} {"train_loss": -39.85262680053711, "global_step": 142901, "epoch": 1181} {"train_loss": -39.17039108276367, "global_step": 142902, "epoch": 1181} {"train_loss": -40.0933952331543, "global_step": 142903, "epoch": 1181} {"train_loss": -39.62889862060547, "global_step": 142904, "epoch": 1181} {"train_loss": -37.874969482421875, "global_step": 142905, "epoch": 1181} {"train_loss": -39.54228210449219, "global_step": 142906, "epoch": 1181} {"train_loss": -39.92624282836914, "global_step": 142907, "epoch": 1181} {"train_loss": -39.494110107421875, "global_step": 142908, "epoch": 1181} {"train_loss": -40.06365203857422, "global_step": 142909, "epoch": 1181} {"train_loss": -39.1817741394043, "global_step": 142910, "epoch": 1181} {"train_loss": -39.353248596191406, "global_step": 142911, "epoch": 1181} {"train_loss": -40.412841796875, "global_step": 142912, "epoch": 1181} {"train_loss": -40.253150939941406, "global_step": 142913, "epoch": 1181} {"train_loss": -40.03327560424805, "global_step": 142914, "epoch": 1181} {"train_loss": -39.96089553833008, "global_step": 142915, "epoch": 1181} {"train_loss": -40.316932678222656, "global_step": 142916, "epoch": 1181} {"train_loss": -38.9459228515625, "global_step": 142917, "epoch": 1181} {"train_loss": -40.234535217285156, "global_step": 142918, "epoch": 1181} {"train_loss": -40.081539154052734, "global_step": 142919, "epoch": 1181} {"train_loss": -40.30507278442383, "global_step": 142920, "epoch": 1181} {"train_loss": -39.90800857543945, "global_step": 142921, "epoch": 1181} {"train_loss": -39.82734680175781, "global_step": 142922, "epoch": 1181} {"train_loss": -37.01688766479492, "global_step": 142923, "epoch": 1181} {"train_loss": -39.1079216003418, "global_step": 142924, "epoch": 1181} {"train_loss": -37.90822982788086, "global_step": 142925, "epoch": 1181} {"train_loss": -34.465065002441406, "global_step": 142926, "epoch": 1181} {"train_loss": -37.02486038208008, "global_step": 142927, "epoch": 1181} {"train_loss": -37.23807144165039, "global_step": 142928, "epoch": 1181} {"train_loss": -35.21417236328125, "global_step": 142929, "epoch": 1181} {"train_loss": -37.58708572387695, "global_step": 142930, "epoch": 1181} {"train_loss": -36.755157470703125, "global_step": 142931, "epoch": 1181} {"train_loss": -38.23160934448242, "global_step": 142932, "epoch": 1181} {"train_loss": -38.06161117553711, "global_step": 142933, "epoch": 1181} {"train_loss": -35.40289306640625, "global_step": 142934, "epoch": 1181} {"train_loss": -39.325130462646484, "global_step": 142935, "epoch": 1181} {"train_loss": -38.13021469116211, "global_step": 142936, "epoch": 1181} {"train_loss": -36.26445770263672, "global_step": 142937, "epoch": 1181} {"train_loss": -36.72156524658203, "global_step": 142938, "epoch": 1181} {"train_loss": -38.086769104003906, "global_step": 142939, "epoch": 1181} {"train_loss": -37.59980392456055, "global_step": 142940, "epoch": 1181} {"train_loss": -34.83417510986328, "global_step": 142941, "epoch": 1181} {"train_loss": -37.12816619873047, "global_step": 142942, "epoch": 1181} {"train_loss": -33.866695404052734, "global_step": 142943, "epoch": 1181} {"train_loss": -37.78574752807617, "global_step": 142944, "epoch": 1181} {"train_loss": -38.152870178222656, "global_step": 142945, "epoch": 1181} {"train_loss": -33.43502426147461, "global_step": 142946, "epoch": 1181} {"train_loss": -37.727516174316406, "global_step": 142947, "epoch": 1181} {"train_loss": -38.57668685913086, "global_step": 142948, "epoch": 1181} {"train_loss": -36.20497512817383, "global_step": 142949, "epoch": 1181} {"train_loss": -38.13242721557617, "global_step": 142950, "epoch": 1181} {"train_loss": -37.59309768676758, "global_step": 142951, "epoch": 1181} {"train_loss": -34.620521545410156, "global_step": 142952, "epoch": 1181} {"train_loss": -37.96697998046875, "global_step": 142953, "epoch": 1181} {"train_loss": -37.6732177734375, "global_step": 142954, "epoch": 1181} {"train_loss": -35.896324157714844, "global_step": 142955, "epoch": 1181} {"train_loss": -37.511226654052734, "global_step": 142956, "epoch": 1181} {"train_loss": -35.875450134277344, "global_step": 142957, "epoch": 1181} {"train_loss": -38.41218948364258, "global_step": 142958, "epoch": 1181} {"train_loss": -38.222259521484375, "global_step": 142959, "epoch": 1181} {"train_loss": -37.26006317138672, "global_step": 142960, "epoch": 1181} {"train_loss": -36.91904067993164, "global_step": 142961, "epoch": 1181} {"train_loss": -38.27182388305664, "global_step": 142962, "epoch": 1181} {"train_loss": -37.86629867553711, "global_step": 142963, "epoch": 1181} {"train_loss": -37.84183883666992, "global_step": 142964, "epoch": 1181} {"train_loss": -37.39716720581055, "global_step": 142965, "epoch": 1181} {"train_loss": -37.59294128417969, "global_step": 142966, "epoch": 1181} {"train_loss": -38.406105041503906, "global_step": 142967, "epoch": 1181} {"train_loss": -38.446807861328125, "global_step": 142968, "epoch": 1181} {"train_loss": -37.26095199584961, "global_step": 142969, "epoch": 1181} {"train_loss": -37.98287582397461, "global_step": 142970, "epoch": 1181} {"train_loss": -38.40583419799805, "global_step": 142971, "epoch": 1181} {"train_loss": -38.63972091674805, "global_step": 142972, "epoch": 1181} {"train_loss": -37.97957992553711, "global_step": 142973, "epoch": 1181} {"train_loss": -36.339115142822266, "global_step": 142974, "epoch": 1181} {"train_loss": -37.51319885253906, "global_step": 142975, "epoch": 1181} {"train_loss": -36.22865676879883, "global_step": 142976, "epoch": 1181} {"train_loss": -37.1451301574707, "global_step": 142977, "epoch": 1181} {"train_loss": -38.15987014770508, "global_step": 142978, "epoch": 1181} {"train_loss": -38.14847946166992, "global_step": 142979, "epoch": 1181} {"train_loss": -38.61030197143555, "global_step": 142980, "epoch": 1181} {"train_loss": -38.04104232788086, "global_step": 142981, "epoch": 1181} {"train_loss": -38.16276168823242, "global_step": 142982, "epoch": 1181} {"train_loss": -38.35653305053711, "global_step": 142983, "epoch": 1181} {"train_loss": -38.58856201171875, "global_step": 142984, "epoch": 1181} {"train_loss": -38.80430221557617, "global_step": 142985, "epoch": 1181} {"train_loss": -37.29664993286133, "global_step": 142986, "epoch": 1181} {"train_loss": -39.219261169433594, "global_step": 142987, "epoch": 1181} {"train_loss": -38.4355583190918, "global_step": 142988, "epoch": 1181} {"train_loss": -38.78364562988281, "global_step": 142989, "epoch": 1181} {"train_loss": -38.288818359375, "global_step": 142990, "epoch": 1181} {"train_loss": -38.41120910644531, "global_step": 142991, "epoch": 1181} {"train_loss": -39.7032356262207, "global_step": 142992, "epoch": 1181} {"train_loss": -38.765602111816406, "global_step": 142993, "epoch": 1181} {"train_loss": -38.80674743652344, "global_step": 142994, "epoch": 1181} {"train_loss": -39.06238555908203, "global_step": 142995, "epoch": 1181} {"train_loss": -38.37847900390625, "global_step": 142996, "epoch": 1181} {"train_loss": -38.478546142578125, "global_step": 142997, "epoch": 1181} {"train_loss": -37.84756851196289, "global_step": 142998, "epoch": 1181} {"train_loss": -36.99220657348633, "global_step": 142999, "epoch": 1181} {"train_loss": -38.731597900390625, "global_step": 143000, "epoch": 1181} {"train_loss": -39.211463928222656, "global_step": 143001, "epoch": 1181} {"train_loss": -39.187129974365234, "global_step": 143002, "epoch": 1181} {"train_loss": -36.63935089111328, "global_step": 143003, "epoch": 1181} {"train_loss": -37.545860290527344, "global_step": 143004, "epoch": 1181} {"train_loss": -38.887447357177734, "global_step": 143005, "epoch": 1181} {"train_loss": -38.219478607177734, "global_step": 143006, "epoch": 1181} {"train_loss": -38.18368148803711, "global_step": 143007, "epoch": 1181} {"train_loss": -39.062015533447266, "global_step": 143008, "epoch": 1181} {"train_loss": -36.50105667114258, "global_step": 143009, "epoch": 1181} {"train_loss": -37.827850341796875, "global_step": 143010, "epoch": 1181} {"train_loss": -38.96102523803711, "global_step": 143011, "epoch": 1181} {"train_loss": -37.81716537475586, "global_step": 143012, "epoch": 1181} {"train_loss": -37.94659423828125, "global_step": 143013, "epoch": 1181} {"train_loss": -38.95319747924805, "global_step": 143014, "epoch": 1181} {"train_loss": -38.17575454711914, "global_step": 143015, "epoch": 1181} {"train_loss": -38.11819076538086, "global_step": 143016, "epoch": 1181} {"train_loss": -39.79703903198242, "global_step": 143017, "epoch": 1181} {"train_loss": -38.401485443115234, "global_step": 143018, "epoch": 1181} {"train_loss": -38.038448333740234, "global_step": 143019, "epoch": 1181} {"train_loss": -38.89531326293945, "global_step": 143020, "epoch": 1181} {"train_loss": -38.084686878298925, "global_step": 143021, "epoch": 1181, "val_loss": 2667648.0} {"train_loss": -38.918357849121094, "global_step": 143022, "epoch": 1182} {"train_loss": -39.73630905151367, "global_step": 143023, "epoch": 1182} {"train_loss": -39.12042236328125, "global_step": 143024, "epoch": 1182} {"train_loss": -38.78108596801758, "global_step": 143025, "epoch": 1182} {"train_loss": -38.32497024536133, "global_step": 143026, "epoch": 1182} {"train_loss": -39.00520324707031, "global_step": 143027, "epoch": 1182} {"train_loss": -38.65083312988281, "global_step": 143028, "epoch": 1182} {"train_loss": -37.236427307128906, "global_step": 143029, "epoch": 1182} {"train_loss": -37.97966384887695, "global_step": 143030, "epoch": 1182} {"train_loss": -38.53118896484375, "global_step": 143031, "epoch": 1182} {"train_loss": -38.16152572631836, "global_step": 143032, "epoch": 1182} {"train_loss": -38.926334381103516, "global_step": 143033, "epoch": 1182} {"train_loss": -38.36611557006836, "global_step": 143034, "epoch": 1182} {"train_loss": -38.40656661987305, "global_step": 143035, "epoch": 1182} {"train_loss": -38.906471252441406, "global_step": 143036, "epoch": 1182} {"train_loss": -38.558837890625, "global_step": 143037, "epoch": 1182} {"train_loss": -38.46269226074219, "global_step": 143038, "epoch": 1182} {"train_loss": -38.79651641845703, "global_step": 143039, "epoch": 1182} {"train_loss": -37.94367599487305, "global_step": 143040, "epoch": 1182} {"train_loss": -38.09843444824219, "global_step": 143041, "epoch": 1182} {"train_loss": -37.398963928222656, "global_step": 143042, "epoch": 1182} {"train_loss": -38.147396087646484, "global_step": 143043, "epoch": 1182} {"train_loss": -38.98064041137695, "global_step": 143044, "epoch": 1182} {"train_loss": -39.31303024291992, "global_step": 143045, "epoch": 1182} {"train_loss": -38.457313537597656, "global_step": 143046, "epoch": 1182} {"train_loss": -38.72303009033203, "global_step": 143047, "epoch": 1182} {"train_loss": -38.785614013671875, "global_step": 143048, "epoch": 1182} {"train_loss": -39.380855560302734, "global_step": 143049, "epoch": 1182} {"train_loss": -38.18107223510742, "global_step": 143050, "epoch": 1182} {"train_loss": -37.73930740356445, "global_step": 143051, "epoch": 1182} {"train_loss": -37.56257629394531, "global_step": 143052, "epoch": 1182} {"train_loss": -38.69975280761719, "global_step": 143053, "epoch": 1182} {"train_loss": -39.06768798828125, "global_step": 143054, "epoch": 1182} {"train_loss": -36.18378829956055, "global_step": 143055, "epoch": 1182} {"train_loss": -36.32746505737305, "global_step": 143056, "epoch": 1182} {"train_loss": -37.25792694091797, "global_step": 143057, "epoch": 1182} {"train_loss": -36.713924407958984, "global_step": 143058, "epoch": 1182} {"train_loss": -37.8870964050293, "global_step": 143059, "epoch": 1182} {"train_loss": -38.828643798828125, "global_step": 143060, "epoch": 1182} {"train_loss": -37.18619918823242, "global_step": 143061, "epoch": 1182} {"train_loss": -38.47134780883789, "global_step": 143062, "epoch": 1182} {"train_loss": -37.165382385253906, "global_step": 143063, "epoch": 1182} {"train_loss": -37.19259262084961, "global_step": 143064, "epoch": 1182} {"train_loss": -35.69602584838867, "global_step": 143065, "epoch": 1182} {"train_loss": -26.621912002563477, "global_step": 143066, "epoch": 1182} {"train_loss": -36.97564697265625, "global_step": 143067, "epoch": 1182} {"train_loss": -24.30423927307129, "global_step": 143068, "epoch": 1182} {"train_loss": -33.08062744140625, "global_step": 143069, "epoch": 1182} {"train_loss": -32.59815216064453, "global_step": 143070, "epoch": 1182} {"train_loss": -35.38998794555664, "global_step": 143071, "epoch": 1182} {"train_loss": -35.73997116088867, "global_step": 143072, "epoch": 1182} {"train_loss": -29.01607322692871, "global_step": 143073, "epoch": 1182} {"train_loss": -32.517738342285156, "global_step": 143074, "epoch": 1182} {"train_loss": -36.171485900878906, "global_step": 143075, "epoch": 1182} {"train_loss": -32.14439010620117, "global_step": 143076, "epoch": 1182} {"train_loss": -30.46013832092285, "global_step": 143077, "epoch": 1182} {"train_loss": -30.949060440063477, "global_step": 143078, "epoch": 1182} {"train_loss": -32.464168548583984, "global_step": 143079, "epoch": 1182} {"train_loss": -30.19403648376465, "global_step": 143080, "epoch": 1182} {"train_loss": -32.39897155761719, "global_step": 143081, "epoch": 1182} {"train_loss": -33.29104232788086, "global_step": 143082, "epoch": 1182} {"train_loss": -35.893306732177734, "global_step": 143083, "epoch": 1182} {"train_loss": -34.77743148803711, "global_step": 143084, "epoch": 1182} {"train_loss": -31.417835235595703, "global_step": 143085, "epoch": 1182} {"train_loss": -35.02459716796875, "global_step": 143086, "epoch": 1182} {"train_loss": -35.904754638671875, "global_step": 143087, "epoch": 1182} {"train_loss": -35.82253646850586, "global_step": 143088, "epoch": 1182} {"train_loss": -34.86316680908203, "global_step": 143089, "epoch": 1182} {"train_loss": -34.83095932006836, "global_step": 143090, "epoch": 1182} {"train_loss": -35.7162971496582, "global_step": 143091, "epoch": 1182} {"train_loss": -35.904335021972656, "global_step": 143092, "epoch": 1182} {"train_loss": -35.431182861328125, "global_step": 143093, "epoch": 1182} {"train_loss": -35.86058044433594, "global_step": 143094, "epoch": 1182} {"train_loss": -35.48323440551758, "global_step": 143095, "epoch": 1182} {"train_loss": -36.4976806640625, "global_step": 143096, "epoch": 1182} {"train_loss": -34.642578125, "global_step": 143097, "epoch": 1182} {"train_loss": -36.4290885925293, "global_step": 143098, "epoch": 1182} {"train_loss": -36.172401428222656, "global_step": 143099, "epoch": 1182} {"train_loss": -37.14864730834961, "global_step": 143100, "epoch": 1182} {"train_loss": -36.643489837646484, "global_step": 143101, "epoch": 1182} {"train_loss": -36.20442581176758, "global_step": 143102, "epoch": 1182} {"train_loss": -37.15517044067383, "global_step": 143103, "epoch": 1182} {"train_loss": -36.906517028808594, "global_step": 143104, "epoch": 1182} {"train_loss": -36.963321685791016, "global_step": 143105, "epoch": 1182} {"train_loss": -36.52143478393555, "global_step": 143106, "epoch": 1182} {"train_loss": -36.909969329833984, "global_step": 143107, "epoch": 1182} {"train_loss": -36.85382080078125, "global_step": 143108, "epoch": 1182} {"train_loss": -37.559967041015625, "global_step": 143109, "epoch": 1182} {"train_loss": -37.411537170410156, "global_step": 143110, "epoch": 1182} {"train_loss": -36.9994010925293, "global_step": 143111, "epoch": 1182} {"train_loss": -37.318790435791016, "global_step": 143112, "epoch": 1182} {"train_loss": -36.6475830078125, "global_step": 143113, "epoch": 1182} {"train_loss": -37.36201858520508, "global_step": 143114, "epoch": 1182} {"train_loss": -37.22446823120117, "global_step": 143115, "epoch": 1182} {"train_loss": -37.305721282958984, "global_step": 143116, "epoch": 1182} {"train_loss": -37.83612060546875, "global_step": 143117, "epoch": 1182} {"train_loss": -37.15086364746094, "global_step": 143118, "epoch": 1182} {"train_loss": -38.256500244140625, "global_step": 143119, "epoch": 1182} {"train_loss": -37.95339584350586, "global_step": 143120, "epoch": 1182} {"train_loss": -38.04275131225586, "global_step": 143121, "epoch": 1182} {"train_loss": -37.57252883911133, "global_step": 143122, "epoch": 1182} {"train_loss": -37.486080169677734, "global_step": 143123, "epoch": 1182} {"train_loss": -37.94282913208008, "global_step": 143124, "epoch": 1182} {"train_loss": -38.21479034423828, "global_step": 143125, "epoch": 1182} {"train_loss": -38.390621185302734, "global_step": 143126, "epoch": 1182} {"train_loss": -37.7321662902832, "global_step": 143127, "epoch": 1182} {"train_loss": -38.04850387573242, "global_step": 143128, "epoch": 1182} {"train_loss": -37.58937454223633, "global_step": 143129, "epoch": 1182} {"train_loss": -38.427284240722656, "global_step": 143130, "epoch": 1182} {"train_loss": -38.6403923034668, "global_step": 143131, "epoch": 1182} {"train_loss": -38.166351318359375, "global_step": 143132, "epoch": 1182} {"train_loss": -38.49809646606445, "global_step": 143133, "epoch": 1182} {"train_loss": -38.33966827392578, "global_step": 143134, "epoch": 1182} {"train_loss": -38.4947509765625, "global_step": 143135, "epoch": 1182} {"train_loss": -38.028472900390625, "global_step": 143136, "epoch": 1182} {"train_loss": -38.65999221801758, "global_step": 143137, "epoch": 1182} {"train_loss": -38.246368408203125, "global_step": 143138, "epoch": 1182} {"train_loss": -38.7552490234375, "global_step": 143139, "epoch": 1182} {"train_loss": -38.62369918823242, "global_step": 143140, "epoch": 1182} {"train_loss": -38.90982437133789, "global_step": 143141, "epoch": 1182} {"train_loss": -36.75282968568408, "global_step": 143142, "epoch": 1182, "val_loss": 2621143.75} {"train_loss": -38.4365348815918, "global_step": 143143, "epoch": 1183} {"train_loss": -39.0512580871582, "global_step": 143144, "epoch": 1183} {"train_loss": -38.99284744262695, "global_step": 143145, "epoch": 1183} {"train_loss": -39.0423698425293, "global_step": 143146, "epoch": 1183} {"train_loss": -39.0205192565918, "global_step": 143147, "epoch": 1183} {"train_loss": -38.957275390625, "global_step": 143148, "epoch": 1183} {"train_loss": -38.468505859375, "global_step": 143149, "epoch": 1183} {"train_loss": -39.28420639038086, "global_step": 143150, "epoch": 1183} {"train_loss": -39.4777946472168, "global_step": 143151, "epoch": 1183} {"train_loss": -39.21053695678711, "global_step": 143152, "epoch": 1183} {"train_loss": -39.342079162597656, "global_step": 143153, "epoch": 1183} {"train_loss": -39.603607177734375, "global_step": 143154, "epoch": 1183} {"train_loss": -38.73582077026367, "global_step": 143155, "epoch": 1183} {"train_loss": -39.16324996948242, "global_step": 143156, "epoch": 1183} {"train_loss": -39.4543571472168, "global_step": 143157, "epoch": 1183} {"train_loss": -39.16399002075195, "global_step": 143158, "epoch": 1183} {"train_loss": -39.32418441772461, "global_step": 143159, "epoch": 1183} {"train_loss": -39.11793899536133, "global_step": 143160, "epoch": 1183} {"train_loss": -39.44356155395508, "global_step": 143161, "epoch": 1183} {"train_loss": -39.00320053100586, "global_step": 143162, "epoch": 1183} {"train_loss": -39.212093353271484, "global_step": 143163, "epoch": 1183} {"train_loss": -38.90625, "global_step": 143164, "epoch": 1183} {"train_loss": -36.6001091003418, "global_step": 143165, "epoch": 1183} {"train_loss": -31.43108558654785, "global_step": 143166, "epoch": 1183} {"train_loss": -26.466327667236328, "global_step": 143167, "epoch": 1183} {"train_loss": -25.028553009033203, "global_step": 143168, "epoch": 1183} {"train_loss": -37.74566650390625, "global_step": 143169, "epoch": 1183} {"train_loss": -29.97408103942871, "global_step": 143170, "epoch": 1183} {"train_loss": -29.17255973815918, "global_step": 143171, "epoch": 1183} {"train_loss": -32.5363655090332, "global_step": 143172, "epoch": 1183} {"train_loss": -34.66105270385742, "global_step": 143173, "epoch": 1183} {"train_loss": -35.59734344482422, "global_step": 143174, "epoch": 1183} {"train_loss": -33.604454040527344, "global_step": 143175, "epoch": 1183} {"train_loss": -36.84067916870117, "global_step": 143176, "epoch": 1183} {"train_loss": -36.5905876159668, "global_step": 143177, "epoch": 1183} {"train_loss": -35.6228141784668, "global_step": 143178, "epoch": 1183} {"train_loss": -37.85858154296875, "global_step": 143179, "epoch": 1183} {"train_loss": -37.4434928894043, "global_step": 143180, "epoch": 1183} {"train_loss": -37.59650421142578, "global_step": 143181, "epoch": 1183} {"train_loss": -37.272735595703125, "global_step": 143182, "epoch": 1183} {"train_loss": -37.345638275146484, "global_step": 143183, "epoch": 1183} {"train_loss": -38.629512786865234, "global_step": 143184, "epoch": 1183} {"train_loss": -38.33469772338867, "global_step": 143185, "epoch": 1183} {"train_loss": -37.9849967956543, "global_step": 143186, "epoch": 1183} {"train_loss": -38.536468505859375, "global_step": 143187, "epoch": 1183} {"train_loss": -38.08498001098633, "global_step": 143188, "epoch": 1183} {"train_loss": -38.30547332763672, "global_step": 143189, "epoch": 1183} {"train_loss": -38.46814727783203, "global_step": 143190, "epoch": 1183} {"train_loss": -38.61225128173828, "global_step": 143191, "epoch": 1183} {"train_loss": -38.38037109375, "global_step": 143192, "epoch": 1183} {"train_loss": -38.348575592041016, "global_step": 143193, "epoch": 1183} {"train_loss": -38.80331039428711, "global_step": 143194, "epoch": 1183} {"train_loss": -38.62272262573242, "global_step": 143195, "epoch": 1183} {"train_loss": -39.04124450683594, "global_step": 143196, "epoch": 1183} {"train_loss": -38.73187255859375, "global_step": 143197, "epoch": 1183} {"train_loss": -38.625396728515625, "global_step": 143198, "epoch": 1183} {"train_loss": -39.607948303222656, "global_step": 143199, "epoch": 1183} {"train_loss": -38.910194396972656, "global_step": 143200, "epoch": 1183} {"train_loss": -38.78556442260742, "global_step": 143201, "epoch": 1183} {"train_loss": -39.02433395385742, "global_step": 143202, "epoch": 1183} {"train_loss": -38.88777542114258, "global_step": 143203, "epoch": 1183} {"train_loss": -39.23691177368164, "global_step": 143204, "epoch": 1183} {"train_loss": -37.607479095458984, "global_step": 143205, "epoch": 1183} {"train_loss": -39.173885345458984, "global_step": 143206, "epoch": 1183} {"train_loss": -39.47117233276367, "global_step": 143207, "epoch": 1183} {"train_loss": -39.5308837890625, "global_step": 143208, "epoch": 1183} {"train_loss": -39.41766357421875, "global_step": 143209, "epoch": 1183} {"train_loss": -39.566829681396484, "global_step": 143210, "epoch": 1183} {"train_loss": -38.68695831298828, "global_step": 143211, "epoch": 1183} {"train_loss": -39.1806755065918, "global_step": 143212, "epoch": 1183} {"train_loss": -39.3604850769043, "global_step": 143213, "epoch": 1183} {"train_loss": -39.4611930847168, "global_step": 143214, "epoch": 1183} {"train_loss": -39.81242752075195, "global_step": 143215, "epoch": 1183} {"train_loss": -39.43610382080078, "global_step": 143216, "epoch": 1183} {"train_loss": -39.72237777709961, "global_step": 143217, "epoch": 1183} {"train_loss": -39.24376678466797, "global_step": 143218, "epoch": 1183} {"train_loss": -39.72079849243164, "global_step": 143219, "epoch": 1183} {"train_loss": -39.6219367980957, "global_step": 143220, "epoch": 1183} {"train_loss": -39.7276725769043, "global_step": 143221, "epoch": 1183} {"train_loss": -39.79650115966797, "global_step": 143222, "epoch": 1183} {"train_loss": -39.04182052612305, "global_step": 143223, "epoch": 1183} {"train_loss": -39.71211242675781, "global_step": 143224, "epoch": 1183} {"train_loss": -38.80204391479492, "global_step": 143225, "epoch": 1183} {"train_loss": -39.660789489746094, "global_step": 143226, "epoch": 1183} {"train_loss": -40.05898666381836, "global_step": 143227, "epoch": 1183} {"train_loss": -39.584861755371094, "global_step": 143228, "epoch": 1183} {"train_loss": -39.5953483581543, "global_step": 143229, "epoch": 1183} {"train_loss": -38.803924560546875, "global_step": 143230, "epoch": 1183} {"train_loss": -36.89033889770508, "global_step": 143231, "epoch": 1183} {"train_loss": -38.53446578979492, "global_step": 143232, "epoch": 1183} {"train_loss": -36.663414001464844, "global_step": 143233, "epoch": 1183} {"train_loss": -36.8549690246582, "global_step": 143234, "epoch": 1183} {"train_loss": -35.349369049072266, "global_step": 143235, "epoch": 1183} {"train_loss": -38.688228607177734, "global_step": 143236, "epoch": 1183} {"train_loss": -38.72530746459961, "global_step": 143237, "epoch": 1183} {"train_loss": -38.616973876953125, "global_step": 143238, "epoch": 1183} {"train_loss": -39.585174560546875, "global_step": 143239, "epoch": 1183} {"train_loss": -38.66121292114258, "global_step": 143240, "epoch": 1183} {"train_loss": -38.427852630615234, "global_step": 143241, "epoch": 1183} {"train_loss": -38.41701889038086, "global_step": 143242, "epoch": 1183} {"train_loss": -37.35816192626953, "global_step": 143243, "epoch": 1183} {"train_loss": -39.060245513916016, "global_step": 143244, "epoch": 1183} {"train_loss": -38.6963996887207, "global_step": 143245, "epoch": 1183} {"train_loss": -39.09337615966797, "global_step": 143246, "epoch": 1183} {"train_loss": -37.377193450927734, "global_step": 143247, "epoch": 1183} {"train_loss": -38.22518539428711, "global_step": 143248, "epoch": 1183} {"train_loss": -38.79291915893555, "global_step": 143249, "epoch": 1183} {"train_loss": -37.88393783569336, "global_step": 143250, "epoch": 1183} {"train_loss": -38.882354736328125, "global_step": 143251, "epoch": 1183} {"train_loss": -38.369483947753906, "global_step": 143252, "epoch": 1183} {"train_loss": -39.65814208984375, "global_step": 143253, "epoch": 1183} {"train_loss": -38.66594696044922, "global_step": 143254, "epoch": 1183} {"train_loss": -39.175411224365234, "global_step": 143255, "epoch": 1183} {"train_loss": -38.7900505065918, "global_step": 143256, "epoch": 1183} {"train_loss": -39.2431526184082, "global_step": 143257, "epoch": 1183} {"train_loss": -39.079078674316406, "global_step": 143258, "epoch": 1183} {"train_loss": -38.68391036987305, "global_step": 143259, "epoch": 1183} {"train_loss": -39.046939849853516, "global_step": 143260, "epoch": 1183} {"train_loss": -38.8238639831543, "global_step": 143261, "epoch": 1183} {"train_loss": -39.7215690612793, "global_step": 143262, "epoch": 1183} {"train_loss": -38.13474981449852, "global_step": 143263, "epoch": 1183, "val_loss": 2689508.75} {"train_loss": -39.58116912841797, "global_step": 143264, "epoch": 1184} {"train_loss": -39.81358337402344, "global_step": 143265, "epoch": 1184} {"train_loss": -39.334693908691406, "global_step": 143266, "epoch": 1184} {"train_loss": -39.685707092285156, "global_step": 143267, "epoch": 1184} {"train_loss": -38.4506950378418, "global_step": 143268, "epoch": 1184} {"train_loss": -39.65509033203125, "global_step": 143269, "epoch": 1184} {"train_loss": -39.38114547729492, "global_step": 143270, "epoch": 1184} {"train_loss": -39.93281173706055, "global_step": 143271, "epoch": 1184} {"train_loss": -39.98285675048828, "global_step": 143272, "epoch": 1184} {"train_loss": -39.957481384277344, "global_step": 143273, "epoch": 1184} {"train_loss": -39.56414794921875, "global_step": 143274, "epoch": 1184} {"train_loss": -39.595848083496094, "global_step": 143275, "epoch": 1184} {"train_loss": -40.510772705078125, "global_step": 143276, "epoch": 1184} {"train_loss": -40.16364669799805, "global_step": 143277, "epoch": 1184} {"train_loss": -40.020538330078125, "global_step": 143278, "epoch": 1184} {"train_loss": -39.968231201171875, "global_step": 143279, "epoch": 1184} {"train_loss": -40.02740478515625, "global_step": 143280, "epoch": 1184} {"train_loss": -39.95901870727539, "global_step": 143281, "epoch": 1184} {"train_loss": -40.159420013427734, "global_step": 143282, "epoch": 1184} {"train_loss": -39.90236282348633, "global_step": 143283, "epoch": 1184} {"train_loss": -40.056427001953125, "global_step": 143284, "epoch": 1184} {"train_loss": -39.86506652832031, "global_step": 143285, "epoch": 1184} {"train_loss": -40.19755935668945, "global_step": 143286, "epoch": 1184} {"train_loss": -40.0564079284668, "global_step": 143287, "epoch": 1184} {"train_loss": -40.44831848144531, "global_step": 143288, "epoch": 1184} {"train_loss": -39.875465393066406, "global_step": 143289, "epoch": 1184} {"train_loss": -40.0877685546875, "global_step": 143290, "epoch": 1184} {"train_loss": -37.56036376953125, "global_step": 143291, "epoch": 1184} {"train_loss": -37.76469039916992, "global_step": 143292, "epoch": 1184} {"train_loss": -39.47731018066406, "global_step": 143293, "epoch": 1184} {"train_loss": -39.42739486694336, "global_step": 143294, "epoch": 1184} {"train_loss": -39.84502410888672, "global_step": 143295, "epoch": 1184} {"train_loss": -39.941715240478516, "global_step": 143296, "epoch": 1184} {"train_loss": -39.84823226928711, "global_step": 143297, "epoch": 1184} {"train_loss": -39.3038215637207, "global_step": 143298, "epoch": 1184} {"train_loss": -39.45173263549805, "global_step": 143299, "epoch": 1184} {"train_loss": -38.09147262573242, "global_step": 143300, "epoch": 1184} {"train_loss": -37.613338470458984, "global_step": 143301, "epoch": 1184} {"train_loss": -39.67928695678711, "global_step": 143302, "epoch": 1184} {"train_loss": -38.74204635620117, "global_step": 143303, "epoch": 1184} {"train_loss": -40.11381912231445, "global_step": 143304, "epoch": 1184} {"train_loss": -39.976009368896484, "global_step": 143305, "epoch": 1184} {"train_loss": -39.30965042114258, "global_step": 143306, "epoch": 1184} {"train_loss": -37.92622756958008, "global_step": 143307, "epoch": 1184} {"train_loss": -38.17940139770508, "global_step": 143308, "epoch": 1184} {"train_loss": -38.99139404296875, "global_step": 143309, "epoch": 1184} {"train_loss": -39.93008041381836, "global_step": 143310, "epoch": 1184} {"train_loss": -39.13140869140625, "global_step": 143311, "epoch": 1184} {"train_loss": -39.02528381347656, "global_step": 143312, "epoch": 1184} {"train_loss": -38.668331146240234, "global_step": 143313, "epoch": 1184} {"train_loss": -36.44961166381836, "global_step": 143314, "epoch": 1184} {"train_loss": -39.28810501098633, "global_step": 143315, "epoch": 1184} {"train_loss": -39.89235305786133, "global_step": 143316, "epoch": 1184} {"train_loss": -39.3633918762207, "global_step": 143317, "epoch": 1184} {"train_loss": -38.51210403442383, "global_step": 143318, "epoch": 1184} {"train_loss": -38.989051818847656, "global_step": 143319, "epoch": 1184} {"train_loss": -38.325103759765625, "global_step": 143320, "epoch": 1184} {"train_loss": -39.657012939453125, "global_step": 143321, "epoch": 1184} {"train_loss": -39.80738067626953, "global_step": 143322, "epoch": 1184} {"train_loss": -39.0296745300293, "global_step": 143323, "epoch": 1184} {"train_loss": -40.00955581665039, "global_step": 143324, "epoch": 1184} {"train_loss": -38.274757385253906, "global_step": 143325, "epoch": 1184} {"train_loss": -40.19417953491211, "global_step": 143326, "epoch": 1184} {"train_loss": -39.49393844604492, "global_step": 143327, "epoch": 1184} {"train_loss": -39.552711486816406, "global_step": 143328, "epoch": 1184} {"train_loss": -38.93989944458008, "global_step": 143329, "epoch": 1184} {"train_loss": -38.640357971191406, "global_step": 143330, "epoch": 1184} {"train_loss": -38.05381393432617, "global_step": 143331, "epoch": 1184} {"train_loss": -37.72909164428711, "global_step": 143332, "epoch": 1184} {"train_loss": -39.95225143432617, "global_step": 143333, "epoch": 1184} {"train_loss": -39.50422286987305, "global_step": 143334, "epoch": 1184} {"train_loss": -38.83159637451172, "global_step": 143335, "epoch": 1184} {"train_loss": -39.064571380615234, "global_step": 143336, "epoch": 1184} {"train_loss": -38.11103439331055, "global_step": 143337, "epoch": 1184} {"train_loss": -37.52564239501953, "global_step": 143338, "epoch": 1184} {"train_loss": -36.6617546081543, "global_step": 143339, "epoch": 1184} {"train_loss": -37.898433685302734, "global_step": 143340, "epoch": 1184} {"train_loss": -39.5916748046875, "global_step": 143341, "epoch": 1184} {"train_loss": -38.04511260986328, "global_step": 143342, "epoch": 1184} {"train_loss": -38.58216094970703, "global_step": 143343, "epoch": 1184} {"train_loss": -39.21952438354492, "global_step": 143344, "epoch": 1184} {"train_loss": -38.679893493652344, "global_step": 143345, "epoch": 1184} {"train_loss": -39.60678482055664, "global_step": 143346, "epoch": 1184} {"train_loss": -38.566612243652344, "global_step": 143347, "epoch": 1184} {"train_loss": -38.63819885253906, "global_step": 143348, "epoch": 1184} {"train_loss": -35.75612258911133, "global_step": 143349, "epoch": 1184} {"train_loss": -39.634578704833984, "global_step": 143350, "epoch": 1184} {"train_loss": -38.049983978271484, "global_step": 143351, "epoch": 1184} {"train_loss": -39.391395568847656, "global_step": 143352, "epoch": 1184} {"train_loss": -37.590484619140625, "global_step": 143353, "epoch": 1184} {"train_loss": -39.39585494995117, "global_step": 143354, "epoch": 1184} {"train_loss": -38.85969924926758, "global_step": 143355, "epoch": 1184} {"train_loss": -37.94487380981445, "global_step": 143356, "epoch": 1184} {"train_loss": -37.52645492553711, "global_step": 143357, "epoch": 1184} {"train_loss": -37.722835540771484, "global_step": 143358, "epoch": 1184} {"train_loss": -36.406349182128906, "global_step": 143359, "epoch": 1184} {"train_loss": -38.395294189453125, "global_step": 143360, "epoch": 1184} {"train_loss": -38.41301345825195, "global_step": 143361, "epoch": 1184} {"train_loss": -36.82612991333008, "global_step": 143362, "epoch": 1184} {"train_loss": -38.0499153137207, "global_step": 143363, "epoch": 1184} {"train_loss": -36.043025970458984, "global_step": 143364, "epoch": 1184} {"train_loss": -38.04572296142578, "global_step": 143365, "epoch": 1184} {"train_loss": -37.319271087646484, "global_step": 143366, "epoch": 1184} {"train_loss": -37.822227478027344, "global_step": 143367, "epoch": 1184} {"train_loss": -38.518577575683594, "global_step": 143368, "epoch": 1184} {"train_loss": -36.6680793762207, "global_step": 143369, "epoch": 1184} {"train_loss": -38.488216400146484, "global_step": 143370, "epoch": 1184} {"train_loss": -38.23603439331055, "global_step": 143371, "epoch": 1184} {"train_loss": -37.09022521972656, "global_step": 143372, "epoch": 1184} {"train_loss": -37.991172790527344, "global_step": 143373, "epoch": 1184} {"train_loss": -38.03433609008789, "global_step": 143374, "epoch": 1184} {"train_loss": -39.59177780151367, "global_step": 143375, "epoch": 1184} {"train_loss": -38.40678787231445, "global_step": 143376, "epoch": 1184} {"train_loss": -39.07855987548828, "global_step": 143377, "epoch": 1184} {"train_loss": -39.03324508666992, "global_step": 143378, "epoch": 1184} {"train_loss": -37.12456512451172, "global_step": 143379, "epoch": 1184} {"train_loss": -38.31171798706055, "global_step": 143380, "epoch": 1184} {"train_loss": -37.7585563659668, "global_step": 143381, "epoch": 1184} {"train_loss": -38.43843460083008, "global_step": 143382, "epoch": 1184} {"train_loss": -38.63710403442383, "global_step": 143383, "epoch": 1184} {"train_loss": -38.86039475370045, "global_step": 143384, "epoch": 1184, "val_loss": 2667871.0} {"train_loss": -38.28565216064453, "global_step": 143385, "epoch": 1185} {"train_loss": -39.325439453125, "global_step": 143386, "epoch": 1185} {"train_loss": -38.801177978515625, "global_step": 143387, "epoch": 1185} {"train_loss": -38.63998031616211, "global_step": 143388, "epoch": 1185} {"train_loss": -39.27726364135742, "global_step": 143389, "epoch": 1185} {"train_loss": -37.83842468261719, "global_step": 143390, "epoch": 1185} {"train_loss": -37.624542236328125, "global_step": 143391, "epoch": 1185} {"train_loss": -38.661346435546875, "global_step": 143392, "epoch": 1185} {"train_loss": -39.152122497558594, "global_step": 143393, "epoch": 1185} {"train_loss": -37.949642181396484, "global_step": 143394, "epoch": 1185} {"train_loss": -38.27887725830078, "global_step": 143395, "epoch": 1185} {"train_loss": -39.22487258911133, "global_step": 143396, "epoch": 1185} {"train_loss": -38.77201461791992, "global_step": 143397, "epoch": 1185} {"train_loss": -39.49531173706055, "global_step": 143398, "epoch": 1185} {"train_loss": -39.13044738769531, "global_step": 143399, "epoch": 1185} {"train_loss": -38.95349884033203, "global_step": 143400, "epoch": 1185} {"train_loss": -39.0477409362793, "global_step": 143401, "epoch": 1185} {"train_loss": -37.510311126708984, "global_step": 143402, "epoch": 1185} {"train_loss": -39.4861946105957, "global_step": 143403, "epoch": 1185} {"train_loss": -38.76381301879883, "global_step": 143404, "epoch": 1185} {"train_loss": -39.77688980102539, "global_step": 143405, "epoch": 1185} {"train_loss": -39.45171356201172, "global_step": 143406, "epoch": 1185} {"train_loss": -39.64500427246094, "global_step": 143407, "epoch": 1185} {"train_loss": -39.836204528808594, "global_step": 143408, "epoch": 1185} {"train_loss": -39.71135330200195, "global_step": 143409, "epoch": 1185} {"train_loss": -38.59503936767578, "global_step": 143410, "epoch": 1185} {"train_loss": -38.86808395385742, "global_step": 143411, "epoch": 1185} {"train_loss": -38.850189208984375, "global_step": 143412, "epoch": 1185} {"train_loss": -39.68811798095703, "global_step": 143413, "epoch": 1185} {"train_loss": -39.091556549072266, "global_step": 143414, "epoch": 1185} {"train_loss": -39.61123275756836, "global_step": 143415, "epoch": 1185} {"train_loss": -38.003665924072266, "global_step": 143416, "epoch": 1185} {"train_loss": -38.615997314453125, "global_step": 143417, "epoch": 1185} {"train_loss": -38.70371627807617, "global_step": 143418, "epoch": 1185} {"train_loss": -39.37311553955078, "global_step": 143419, "epoch": 1185} {"train_loss": -38.83650588989258, "global_step": 143420, "epoch": 1185} {"train_loss": -39.04616928100586, "global_step": 143421, "epoch": 1185} {"train_loss": -39.693119049072266, "global_step": 143422, "epoch": 1185} {"train_loss": -39.86518478393555, "global_step": 143423, "epoch": 1185} {"train_loss": -39.341732025146484, "global_step": 143424, "epoch": 1185} {"train_loss": -39.86418151855469, "global_step": 143425, "epoch": 1185} {"train_loss": -39.676429748535156, "global_step": 143426, "epoch": 1185} {"train_loss": -39.654762268066406, "global_step": 143427, "epoch": 1185} {"train_loss": -40.06657028198242, "global_step": 143428, "epoch": 1185} {"train_loss": -38.891414642333984, "global_step": 143429, "epoch": 1185} {"train_loss": -38.98701858520508, "global_step": 143430, "epoch": 1185} {"train_loss": -39.048851013183594, "global_step": 143431, "epoch": 1185} {"train_loss": -38.733619689941406, "global_step": 143432, "epoch": 1185} {"train_loss": -38.725318908691406, "global_step": 143433, "epoch": 1185} {"train_loss": -38.580013275146484, "global_step": 143434, "epoch": 1185} {"train_loss": -39.892337799072266, "global_step": 143435, "epoch": 1185} {"train_loss": -38.83457946777344, "global_step": 143436, "epoch": 1185} {"train_loss": -38.62873458862305, "global_step": 143437, "epoch": 1185} {"train_loss": -38.0425910949707, "global_step": 143438, "epoch": 1185} {"train_loss": -36.790069580078125, "global_step": 143439, "epoch": 1185} {"train_loss": -37.72312545776367, "global_step": 143440, "epoch": 1185} {"train_loss": -39.29199981689453, "global_step": 143441, "epoch": 1185} {"train_loss": -37.990028381347656, "global_step": 143442, "epoch": 1185} {"train_loss": -38.41291427612305, "global_step": 143443, "epoch": 1185} {"train_loss": -37.49148178100586, "global_step": 143444, "epoch": 1185} {"train_loss": -38.7491569519043, "global_step": 143445, "epoch": 1185} {"train_loss": -38.04652786254883, "global_step": 143446, "epoch": 1185} {"train_loss": -34.6668815612793, "global_step": 143447, "epoch": 1185} {"train_loss": -38.874141693115234, "global_step": 143448, "epoch": 1185} {"train_loss": -36.79513931274414, "global_step": 143449, "epoch": 1185} {"train_loss": -37.533050537109375, "global_step": 143450, "epoch": 1185} {"train_loss": -37.647377014160156, "global_step": 143451, "epoch": 1185} {"train_loss": -37.60637664794922, "global_step": 143452, "epoch": 1185} {"train_loss": -35.455867767333984, "global_step": 143453, "epoch": 1185} {"train_loss": -38.48441696166992, "global_step": 143454, "epoch": 1185} {"train_loss": -38.57304000854492, "global_step": 143455, "epoch": 1185} {"train_loss": -34.916656494140625, "global_step": 143456, "epoch": 1185} {"train_loss": -39.23579025268555, "global_step": 143457, "epoch": 1185} {"train_loss": -35.8981819152832, "global_step": 143458, "epoch": 1185} {"train_loss": -38.16213607788086, "global_step": 143459, "epoch": 1185} {"train_loss": -37.96303176879883, "global_step": 143460, "epoch": 1185} {"train_loss": -38.14552688598633, "global_step": 143461, "epoch": 1185} {"train_loss": -38.38479232788086, "global_step": 143462, "epoch": 1185} {"train_loss": -37.790706634521484, "global_step": 143463, "epoch": 1185} {"train_loss": -39.20600509643555, "global_step": 143464, "epoch": 1185} {"train_loss": -39.088417053222656, "global_step": 143465, "epoch": 1185} {"train_loss": -38.92751693725586, "global_step": 143466, "epoch": 1185} {"train_loss": -39.5779914855957, "global_step": 143467, "epoch": 1185} {"train_loss": -39.24999237060547, "global_step": 143468, "epoch": 1185} {"train_loss": -39.42835235595703, "global_step": 143469, "epoch": 1185} {"train_loss": -38.31171798706055, "global_step": 143470, "epoch": 1185} {"train_loss": -39.104522705078125, "global_step": 143471, "epoch": 1185} {"train_loss": -40.18172836303711, "global_step": 143472, "epoch": 1185} {"train_loss": -39.07678985595703, "global_step": 143473, "epoch": 1185} {"train_loss": -39.29557418823242, "global_step": 143474, "epoch": 1185} {"train_loss": -39.25335693359375, "global_step": 143475, "epoch": 1185} {"train_loss": -39.24595260620117, "global_step": 143476, "epoch": 1185} {"train_loss": -39.66832733154297, "global_step": 143477, "epoch": 1185} {"train_loss": -39.46913528442383, "global_step": 143478, "epoch": 1185} {"train_loss": -39.9661979675293, "global_step": 143479, "epoch": 1185} {"train_loss": -40.109519958496094, "global_step": 143480, "epoch": 1185} {"train_loss": -39.60324478149414, "global_step": 143481, "epoch": 1185} {"train_loss": -39.4249382019043, "global_step": 143482, "epoch": 1185} {"train_loss": -39.94923400878906, "global_step": 143483, "epoch": 1185} {"train_loss": -39.82676315307617, "global_step": 143484, "epoch": 1185} {"train_loss": -38.539791107177734, "global_step": 143485, "epoch": 1185} {"train_loss": -40.090126037597656, "global_step": 143486, "epoch": 1185} {"train_loss": -38.94303894042969, "global_step": 143487, "epoch": 1185} {"train_loss": -38.83393096923828, "global_step": 143488, "epoch": 1185} {"train_loss": -38.62289047241211, "global_step": 143489, "epoch": 1185} {"train_loss": -38.643089294433594, "global_step": 143490, "epoch": 1185} {"train_loss": -38.97675323486328, "global_step": 143491, "epoch": 1185} {"train_loss": -39.4998664855957, "global_step": 143492, "epoch": 1185} {"train_loss": -38.19326400756836, "global_step": 143493, "epoch": 1185} {"train_loss": -37.632537841796875, "global_step": 143494, "epoch": 1185} {"train_loss": -39.99928665161133, "global_step": 143495, "epoch": 1185} {"train_loss": -39.43245315551758, "global_step": 143496, "epoch": 1185} {"train_loss": -37.44224166870117, "global_step": 143497, "epoch": 1185} {"train_loss": -36.42668151855469, "global_step": 143498, "epoch": 1185} {"train_loss": -35.737335205078125, "global_step": 143499, "epoch": 1185} {"train_loss": -39.297115325927734, "global_step": 143500, "epoch": 1185} {"train_loss": -39.28947448730469, "global_step": 143501, "epoch": 1185} {"train_loss": -37.73994064331055, "global_step": 143502, "epoch": 1185} {"train_loss": -38.4615364074707, "global_step": 143503, "epoch": 1185} {"train_loss": -40.06465530395508, "global_step": 143504, "epoch": 1185} {"train_loss": -38.71243500512494, "global_step": 143505, "epoch": 1185, "val_loss": 2590826.75} {"train_loss": -38.95884323120117, "global_step": 143506, "epoch": 1186} {"train_loss": -38.0876579284668, "global_step": 143507, "epoch": 1186} {"train_loss": -38.702056884765625, "global_step": 143508, "epoch": 1186} {"train_loss": -40.30697250366211, "global_step": 143509, "epoch": 1186} {"train_loss": -38.92802810668945, "global_step": 143510, "epoch": 1186} {"train_loss": -39.809730529785156, "global_step": 143511, "epoch": 1186} {"train_loss": -38.78692626953125, "global_step": 143512, "epoch": 1186} {"train_loss": -37.09376907348633, "global_step": 143513, "epoch": 1186} {"train_loss": -40.2069091796875, "global_step": 143514, "epoch": 1186} {"train_loss": -39.22384262084961, "global_step": 143515, "epoch": 1186} {"train_loss": -39.789642333984375, "global_step": 143516, "epoch": 1186} {"train_loss": -39.43584060668945, "global_step": 143517, "epoch": 1186} {"train_loss": -39.40142059326172, "global_step": 143518, "epoch": 1186} {"train_loss": -39.84617233276367, "global_step": 143519, "epoch": 1186} {"train_loss": -39.46085739135742, "global_step": 143520, "epoch": 1186} {"train_loss": -39.39787292480469, "global_step": 143521, "epoch": 1186} {"train_loss": -40.080196380615234, "global_step": 143522, "epoch": 1186} {"train_loss": -39.661319732666016, "global_step": 143523, "epoch": 1186} {"train_loss": -39.961639404296875, "global_step": 143524, "epoch": 1186} {"train_loss": -40.22879409790039, "global_step": 143525, "epoch": 1186} {"train_loss": -40.27250289916992, "global_step": 143526, "epoch": 1186} {"train_loss": -40.394962310791016, "global_step": 143527, "epoch": 1186} {"train_loss": -39.568275451660156, "global_step": 143528, "epoch": 1186} {"train_loss": -40.127071380615234, "global_step": 143529, "epoch": 1186} {"train_loss": -40.33007049560547, "global_step": 143530, "epoch": 1186} {"train_loss": -39.77952194213867, "global_step": 143531, "epoch": 1186} {"train_loss": -39.77774429321289, "global_step": 143532, "epoch": 1186} {"train_loss": -39.17927932739258, "global_step": 143533, "epoch": 1186} {"train_loss": -40.474754333496094, "global_step": 143534, "epoch": 1186} {"train_loss": -40.78609085083008, "global_step": 143535, "epoch": 1186} {"train_loss": -40.781349182128906, "global_step": 143536, "epoch": 1186} {"train_loss": -40.38829803466797, "global_step": 143537, "epoch": 1186} {"train_loss": -39.89997482299805, "global_step": 143538, "epoch": 1186} {"train_loss": -40.639434814453125, "global_step": 143539, "epoch": 1186} {"train_loss": -39.789119720458984, "global_step": 143540, "epoch": 1186} {"train_loss": -39.86102294921875, "global_step": 143541, "epoch": 1186} {"train_loss": -40.46293258666992, "global_step": 143542, "epoch": 1186} {"train_loss": -39.97943115234375, "global_step": 143543, "epoch": 1186} {"train_loss": -37.62929916381836, "global_step": 143544, "epoch": 1186} {"train_loss": -39.31354904174805, "global_step": 143545, "epoch": 1186} {"train_loss": -39.869712829589844, "global_step": 143546, "epoch": 1186} {"train_loss": -39.99164962768555, "global_step": 143547, "epoch": 1186} {"train_loss": -39.974639892578125, "global_step": 143548, "epoch": 1186} {"train_loss": -38.40625762939453, "global_step": 143549, "epoch": 1186} {"train_loss": -39.107357025146484, "global_step": 143550, "epoch": 1186} {"train_loss": -38.40859603881836, "global_step": 143551, "epoch": 1186} {"train_loss": -38.40548324584961, "global_step": 143552, "epoch": 1186} {"train_loss": -38.00830841064453, "global_step": 143553, "epoch": 1186} {"train_loss": -39.562965393066406, "global_step": 143554, "epoch": 1186} {"train_loss": -39.371620178222656, "global_step": 143555, "epoch": 1186} {"train_loss": -39.32113265991211, "global_step": 143556, "epoch": 1186} {"train_loss": -39.04875564575195, "global_step": 143557, "epoch": 1186} {"train_loss": -37.8218879699707, "global_step": 143558, "epoch": 1186} {"train_loss": -39.964210510253906, "global_step": 143559, "epoch": 1186} {"train_loss": -39.05419921875, "global_step": 143560, "epoch": 1186} {"train_loss": -38.83477020263672, "global_step": 143561, "epoch": 1186} {"train_loss": -35.6212272644043, "global_step": 143562, "epoch": 1186} {"train_loss": -31.09236717224121, "global_step": 143563, "epoch": 1186} {"train_loss": -35.932952880859375, "global_step": 143564, "epoch": 1186} {"train_loss": -38.00037384033203, "global_step": 143565, "epoch": 1186} {"train_loss": -23.246007919311523, "global_step": 143566, "epoch": 1186} {"train_loss": -35.450740814208984, "global_step": 143567, "epoch": 1186} {"train_loss": -38.41939163208008, "global_step": 143568, "epoch": 1186} {"train_loss": -36.90519332885742, "global_step": 143569, "epoch": 1186} {"train_loss": -38.390724182128906, "global_step": 143570, "epoch": 1186} {"train_loss": -35.76259231567383, "global_step": 143571, "epoch": 1186} {"train_loss": -37.978485107421875, "global_step": 143572, "epoch": 1186} {"train_loss": -38.202613830566406, "global_step": 143573, "epoch": 1186} {"train_loss": -37.45389938354492, "global_step": 143574, "epoch": 1186} {"train_loss": -36.84705352783203, "global_step": 143575, "epoch": 1186} {"train_loss": -38.0867919921875, "global_step": 143576, "epoch": 1186} {"train_loss": -38.41996383666992, "global_step": 143577, "epoch": 1186} {"train_loss": -37.7226676940918, "global_step": 143578, "epoch": 1186} {"train_loss": -38.83738327026367, "global_step": 143579, "epoch": 1186} {"train_loss": -38.16781234741211, "global_step": 143580, "epoch": 1186} {"train_loss": -35.718963623046875, "global_step": 143581, "epoch": 1186} {"train_loss": -34.0760498046875, "global_step": 143582, "epoch": 1186} {"train_loss": -38.240352630615234, "global_step": 143583, "epoch": 1186} {"train_loss": -37.698699951171875, "global_step": 143584, "epoch": 1186} {"train_loss": -38.056304931640625, "global_step": 143585, "epoch": 1186} {"train_loss": -37.52324295043945, "global_step": 143586, "epoch": 1186} {"train_loss": -37.501102447509766, "global_step": 143587, "epoch": 1186} {"train_loss": -35.8414306640625, "global_step": 143588, "epoch": 1186} {"train_loss": -36.852020263671875, "global_step": 143589, "epoch": 1186} {"train_loss": -37.08984375, "global_step": 143590, "epoch": 1186} {"train_loss": -34.7879638671875, "global_step": 143591, "epoch": 1186} {"train_loss": -35.424598693847656, "global_step": 143592, "epoch": 1186} {"train_loss": -35.6279182434082, "global_step": 143593, "epoch": 1186} {"train_loss": -37.517642974853516, "global_step": 143594, "epoch": 1186} {"train_loss": -37.49100112915039, "global_step": 143595, "epoch": 1186} {"train_loss": -37.2362060546875, "global_step": 143596, "epoch": 1186} {"train_loss": -38.21131134033203, "global_step": 143597, "epoch": 1186} {"train_loss": -36.66708755493164, "global_step": 143598, "epoch": 1186} {"train_loss": -37.80768585205078, "global_step": 143599, "epoch": 1186} {"train_loss": -35.53389358520508, "global_step": 143600, "epoch": 1186} {"train_loss": -37.88283920288086, "global_step": 143601, "epoch": 1186} {"train_loss": -34.54294967651367, "global_step": 143602, "epoch": 1186} {"train_loss": -37.577274322509766, "global_step": 143603, "epoch": 1186} {"train_loss": -38.552921295166016, "global_step": 143604, "epoch": 1186} {"train_loss": -35.5262565612793, "global_step": 143605, "epoch": 1186} {"train_loss": -38.46140670776367, "global_step": 143606, "epoch": 1186} {"train_loss": -36.58463668823242, "global_step": 143607, "epoch": 1186} {"train_loss": -38.41327667236328, "global_step": 143608, "epoch": 1186} {"train_loss": -37.98263168334961, "global_step": 143609, "epoch": 1186} {"train_loss": -39.01900863647461, "global_step": 143610, "epoch": 1186} {"train_loss": -37.934173583984375, "global_step": 143611, "epoch": 1186} {"train_loss": -38.09527587890625, "global_step": 143612, "epoch": 1186} {"train_loss": -37.413082122802734, "global_step": 143613, "epoch": 1186} {"train_loss": -37.49751663208008, "global_step": 143614, "epoch": 1186} {"train_loss": -39.10797119140625, "global_step": 143615, "epoch": 1186} {"train_loss": -38.97593307495117, "global_step": 143616, "epoch": 1186} {"train_loss": -39.289283752441406, "global_step": 143617, "epoch": 1186} {"train_loss": -38.803565979003906, "global_step": 143618, "epoch": 1186} {"train_loss": -38.90537643432617, "global_step": 143619, "epoch": 1186} {"train_loss": -38.716888427734375, "global_step": 143620, "epoch": 1186} {"train_loss": -38.37807083129883, "global_step": 143621, "epoch": 1186} {"train_loss": -39.10676574707031, "global_step": 143622, "epoch": 1186} {"train_loss": -38.4069709777832, "global_step": 143623, "epoch": 1186} {"train_loss": -39.0875358581543, "global_step": 143624, "epoch": 1186} {"train_loss": -38.893348693847656, "global_step": 143625, "epoch": 1186} {"train_loss": -38.26353388384354, "global_step": 143626, "epoch": 1186, "val_loss": 2542800.75} {"train_loss": -38.513572692871094, "global_step": 143627, "epoch": 1187} {"train_loss": -38.86885452270508, "global_step": 143628, "epoch": 1187} {"train_loss": -37.890804290771484, "global_step": 143629, "epoch": 1187} {"train_loss": -38.85076904296875, "global_step": 143630, "epoch": 1187} {"train_loss": -40.09724807739258, "global_step": 143631, "epoch": 1187} {"train_loss": -39.236305236816406, "global_step": 143632, "epoch": 1187} {"train_loss": -39.51491165161133, "global_step": 143633, "epoch": 1187} {"train_loss": -39.909568786621094, "global_step": 143634, "epoch": 1187} {"train_loss": -39.43476104736328, "global_step": 143635, "epoch": 1187} {"train_loss": -39.769309997558594, "global_step": 143636, "epoch": 1187} {"train_loss": -39.74287033081055, "global_step": 143637, "epoch": 1187} {"train_loss": -39.353633880615234, "global_step": 143638, "epoch": 1187} {"train_loss": -39.69411849975586, "global_step": 143639, "epoch": 1187} {"train_loss": -39.704891204833984, "global_step": 143640, "epoch": 1187} {"train_loss": -39.8026237487793, "global_step": 143641, "epoch": 1187} {"train_loss": -38.794960021972656, "global_step": 143642, "epoch": 1187} {"train_loss": -38.46136474609375, "global_step": 143643, "epoch": 1187} {"train_loss": -39.79868698120117, "global_step": 143644, "epoch": 1187} {"train_loss": -40.15403366088867, "global_step": 143645, "epoch": 1187} {"train_loss": -40.038055419921875, "global_step": 143646, "epoch": 1187} {"train_loss": -40.318843841552734, "global_step": 143647, "epoch": 1187} {"train_loss": -40.27522659301758, "global_step": 143648, "epoch": 1187} {"train_loss": -39.89906311035156, "global_step": 143649, "epoch": 1187} {"train_loss": -39.86348342895508, "global_step": 143650, "epoch": 1187} {"train_loss": -39.843772888183594, "global_step": 143651, "epoch": 1187} {"train_loss": -39.82338333129883, "global_step": 143652, "epoch": 1187} {"train_loss": -38.67631912231445, "global_step": 143653, "epoch": 1187} {"train_loss": -39.79235076904297, "global_step": 143654, "epoch": 1187} {"train_loss": -40.30656814575195, "global_step": 143655, "epoch": 1187} {"train_loss": -40.137794494628906, "global_step": 143656, "epoch": 1187} {"train_loss": -39.91084671020508, "global_step": 143657, "epoch": 1187} {"train_loss": -40.34626007080078, "global_step": 143658, "epoch": 1187} {"train_loss": -39.39066696166992, "global_step": 143659, "epoch": 1187} {"train_loss": -39.0590934753418, "global_step": 143660, "epoch": 1187} {"train_loss": -39.95992660522461, "global_step": 143661, "epoch": 1187} {"train_loss": -39.66066360473633, "global_step": 143662, "epoch": 1187} {"train_loss": -40.260372161865234, "global_step": 143663, "epoch": 1187} {"train_loss": -38.012325286865234, "global_step": 143664, "epoch": 1187} {"train_loss": -38.84368896484375, "global_step": 143665, "epoch": 1187} {"train_loss": -37.09074020385742, "global_step": 143666, "epoch": 1187} {"train_loss": -38.17559814453125, "global_step": 143667, "epoch": 1187} {"train_loss": -39.460968017578125, "global_step": 143668, "epoch": 1187} {"train_loss": -39.22343063354492, "global_step": 143669, "epoch": 1187} {"train_loss": -38.741111755371094, "global_step": 143670, "epoch": 1187} {"train_loss": -37.38669967651367, "global_step": 143671, "epoch": 1187} {"train_loss": -33.70612716674805, "global_step": 143672, "epoch": 1187} {"train_loss": -31.2948055267334, "global_step": 143673, "epoch": 1187} {"train_loss": -33.134159088134766, "global_step": 143674, "epoch": 1187} {"train_loss": -37.36960983276367, "global_step": 143675, "epoch": 1187} {"train_loss": -34.886348724365234, "global_step": 143676, "epoch": 1187} {"train_loss": -33.91804122924805, "global_step": 143677, "epoch": 1187} {"train_loss": -39.10639572143555, "global_step": 143678, "epoch": 1187} {"train_loss": -37.58259963989258, "global_step": 143679, "epoch": 1187} {"train_loss": -38.53813552856445, "global_step": 143680, "epoch": 1187} {"train_loss": -38.595375061035156, "global_step": 143681, "epoch": 1187} {"train_loss": -38.0990104675293, "global_step": 143682, "epoch": 1187} {"train_loss": -40.146236419677734, "global_step": 143683, "epoch": 1187} {"train_loss": -38.137359619140625, "global_step": 143684, "epoch": 1187} {"train_loss": -38.485755920410156, "global_step": 143685, "epoch": 1187} {"train_loss": -38.9874382019043, "global_step": 143686, "epoch": 1187} {"train_loss": -38.51701736450195, "global_step": 143687, "epoch": 1187} {"train_loss": -38.56589889526367, "global_step": 143688, "epoch": 1187} {"train_loss": -36.920814514160156, "global_step": 143689, "epoch": 1187} {"train_loss": -39.126853942871094, "global_step": 143690, "epoch": 1187} {"train_loss": -38.63007736206055, "global_step": 143691, "epoch": 1187} {"train_loss": -38.792415618896484, "global_step": 143692, "epoch": 1187} {"train_loss": -39.74437713623047, "global_step": 143693, "epoch": 1187} {"train_loss": -38.399898529052734, "global_step": 143694, "epoch": 1187} {"train_loss": -38.388572692871094, "global_step": 143695, "epoch": 1187} {"train_loss": -39.116756439208984, "global_step": 143696, "epoch": 1187} {"train_loss": -36.88066482543945, "global_step": 143697, "epoch": 1187} {"train_loss": -39.23359298706055, "global_step": 143698, "epoch": 1187} {"train_loss": -38.56066131591797, "global_step": 143699, "epoch": 1187} {"train_loss": -38.36711502075195, "global_step": 143700, "epoch": 1187} {"train_loss": -39.22679138183594, "global_step": 143701, "epoch": 1187} {"train_loss": -39.123817443847656, "global_step": 143702, "epoch": 1187} {"train_loss": -39.83195877075195, "global_step": 143703, "epoch": 1187} {"train_loss": -39.24641799926758, "global_step": 143704, "epoch": 1187} {"train_loss": -39.41362380981445, "global_step": 143705, "epoch": 1187} {"train_loss": -39.2598991394043, "global_step": 143706, "epoch": 1187} {"train_loss": -39.71204376220703, "global_step": 143707, "epoch": 1187} {"train_loss": -39.75829315185547, "global_step": 143708, "epoch": 1187} {"train_loss": -40.24107360839844, "global_step": 143709, "epoch": 1187} {"train_loss": -40.17201614379883, "global_step": 143710, "epoch": 1187} {"train_loss": -40.00189971923828, "global_step": 143711, "epoch": 1187} {"train_loss": -38.82887649536133, "global_step": 143712, "epoch": 1187} {"train_loss": -40.199337005615234, "global_step": 143713, "epoch": 1187} {"train_loss": -39.67550277709961, "global_step": 143714, "epoch": 1187} {"train_loss": -40.08082580566406, "global_step": 143715, "epoch": 1187} {"train_loss": -40.218238830566406, "global_step": 143716, "epoch": 1187} {"train_loss": -39.894344329833984, "global_step": 143717, "epoch": 1187} {"train_loss": -40.126827239990234, "global_step": 143718, "epoch": 1187} {"train_loss": -40.1289176940918, "global_step": 143719, "epoch": 1187} {"train_loss": -40.23933029174805, "global_step": 143720, "epoch": 1187} {"train_loss": -40.356136322021484, "global_step": 143721, "epoch": 1187} {"train_loss": -40.71274948120117, "global_step": 143722, "epoch": 1187} {"train_loss": -40.50989532470703, "global_step": 143723, "epoch": 1187} {"train_loss": -40.67049789428711, "global_step": 143724, "epoch": 1187} {"train_loss": -40.24374771118164, "global_step": 143725, "epoch": 1187} {"train_loss": -40.50312423706055, "global_step": 143726, "epoch": 1187} {"train_loss": -40.44260787963867, "global_step": 143727, "epoch": 1187} {"train_loss": -40.712066650390625, "global_step": 143728, "epoch": 1187} {"train_loss": -40.870540618896484, "global_step": 143729, "epoch": 1187} {"train_loss": -40.38367462158203, "global_step": 143730, "epoch": 1187} {"train_loss": -40.50346755981445, "global_step": 143731, "epoch": 1187} {"train_loss": -40.95945739746094, "global_step": 143732, "epoch": 1187} {"train_loss": -40.57235336303711, "global_step": 143733, "epoch": 1187} {"train_loss": -41.02162551879883, "global_step": 143734, "epoch": 1187} {"train_loss": -40.6841926574707, "global_step": 143735, "epoch": 1187} {"train_loss": -41.16527557373047, "global_step": 143736, "epoch": 1187} {"train_loss": -40.75320053100586, "global_step": 143737, "epoch": 1187} {"train_loss": -40.71444320678711, "global_step": 143738, "epoch": 1187} {"train_loss": -40.53335189819336, "global_step": 143739, "epoch": 1187} {"train_loss": -39.46678924560547, "global_step": 143740, "epoch": 1187} {"train_loss": -38.4506721496582, "global_step": 143741, "epoch": 1187} {"train_loss": -34.29838180541992, "global_step": 143742, "epoch": 1187} {"train_loss": -27.779693603515625, "global_step": 143743, "epoch": 1187} {"train_loss": -30.4375057220459, "global_step": 143744, "epoch": 1187} {"train_loss": -37.599151611328125, "global_step": 143745, "epoch": 1187} {"train_loss": -40.18290328979492, "global_step": 143746, "epoch": 1187} {"train_loss": -38.969663667284756, "global_step": 143747, "epoch": 1187, "val_loss": 2653806.25} {"train_loss": -37.944366455078125, "global_step": 143748, "epoch": 1188} {"train_loss": -39.50652313232422, "global_step": 143749, "epoch": 1188} {"train_loss": -37.47403335571289, "global_step": 143750, "epoch": 1188} {"train_loss": -40.04289627075195, "global_step": 143751, "epoch": 1188} {"train_loss": -38.5372314453125, "global_step": 143752, "epoch": 1188} {"train_loss": -39.739776611328125, "global_step": 143753, "epoch": 1188} {"train_loss": -38.777130126953125, "global_step": 143754, "epoch": 1188} {"train_loss": -39.16337585449219, "global_step": 143755, "epoch": 1188} {"train_loss": -40.178009033203125, "global_step": 143756, "epoch": 1188} {"train_loss": -39.792232513427734, "global_step": 143757, "epoch": 1188} {"train_loss": -40.26137161254883, "global_step": 143758, "epoch": 1188} {"train_loss": -39.47837448120117, "global_step": 143759, "epoch": 1188} {"train_loss": -40.65180587768555, "global_step": 143760, "epoch": 1188} {"train_loss": -39.46226501464844, "global_step": 143761, "epoch": 1188} {"train_loss": -40.0697135925293, "global_step": 143762, "epoch": 1188} {"train_loss": -39.29938507080078, "global_step": 143763, "epoch": 1188} {"train_loss": -39.90238571166992, "global_step": 143764, "epoch": 1188} {"train_loss": -39.531612396240234, "global_step": 143765, "epoch": 1188} {"train_loss": -40.641109466552734, "global_step": 143766, "epoch": 1188} {"train_loss": -40.04825973510742, "global_step": 143767, "epoch": 1188} {"train_loss": -40.04840850830078, "global_step": 143768, "epoch": 1188} {"train_loss": -40.2738037109375, "global_step": 143769, "epoch": 1188} {"train_loss": -40.603946685791016, "global_step": 143770, "epoch": 1188} {"train_loss": -39.64094161987305, "global_step": 143771, "epoch": 1188} {"train_loss": -40.54828643798828, "global_step": 143772, "epoch": 1188} {"train_loss": -40.09467315673828, "global_step": 143773, "epoch": 1188} {"train_loss": -40.55680847167969, "global_step": 143774, "epoch": 1188} {"train_loss": -40.46963119506836, "global_step": 143775, "epoch": 1188} {"train_loss": -40.33034896850586, "global_step": 143776, "epoch": 1188} {"train_loss": -40.70831298828125, "global_step": 143777, "epoch": 1188} {"train_loss": -40.29767608642578, "global_step": 143778, "epoch": 1188} {"train_loss": -40.627376556396484, "global_step": 143779, "epoch": 1188} {"train_loss": -40.540931701660156, "global_step": 143780, "epoch": 1188} {"train_loss": -40.260379791259766, "global_step": 143781, "epoch": 1188} {"train_loss": -39.64524459838867, "global_step": 143782, "epoch": 1188} {"train_loss": -39.31031036376953, "global_step": 143783, "epoch": 1188} {"train_loss": -39.62742614746094, "global_step": 143784, "epoch": 1188} {"train_loss": -38.24215316772461, "global_step": 143785, "epoch": 1188} {"train_loss": -36.45722198486328, "global_step": 143786, "epoch": 1188} {"train_loss": -37.68406295776367, "global_step": 143787, "epoch": 1188} {"train_loss": -38.463157653808594, "global_step": 143788, "epoch": 1188} {"train_loss": -38.4782600402832, "global_step": 143789, "epoch": 1188} {"train_loss": -36.588134765625, "global_step": 143790, "epoch": 1188} {"train_loss": -38.53705978393555, "global_step": 143791, "epoch": 1188} {"train_loss": -38.80352783203125, "global_step": 143792, "epoch": 1188} {"train_loss": -38.003021240234375, "global_step": 143793, "epoch": 1188} {"train_loss": -38.77537536621094, "global_step": 143794, "epoch": 1188} {"train_loss": -39.23323059082031, "global_step": 143795, "epoch": 1188} {"train_loss": -38.92348861694336, "global_step": 143796, "epoch": 1188} {"train_loss": -39.37127685546875, "global_step": 143797, "epoch": 1188} {"train_loss": -39.218017578125, "global_step": 143798, "epoch": 1188} {"train_loss": -38.527889251708984, "global_step": 143799, "epoch": 1188} {"train_loss": -39.25347900390625, "global_step": 143800, "epoch": 1188} {"train_loss": -40.05825424194336, "global_step": 143801, "epoch": 1188} {"train_loss": -39.83359909057617, "global_step": 143802, "epoch": 1188} {"train_loss": -39.52084732055664, "global_step": 143803, "epoch": 1188} {"train_loss": -40.26975631713867, "global_step": 143804, "epoch": 1188} {"train_loss": -39.78457260131836, "global_step": 143805, "epoch": 1188} {"train_loss": -40.16782760620117, "global_step": 143806, "epoch": 1188} {"train_loss": -40.085716247558594, "global_step": 143807, "epoch": 1188} {"train_loss": -39.707374572753906, "global_step": 143808, "epoch": 1188} {"train_loss": -39.84589385986328, "global_step": 143809, "epoch": 1188} {"train_loss": -39.546730041503906, "global_step": 143810, "epoch": 1188} {"train_loss": -38.564388275146484, "global_step": 143811, "epoch": 1188} {"train_loss": -39.65562057495117, "global_step": 143812, "epoch": 1188} {"train_loss": -40.477352142333984, "global_step": 143813, "epoch": 1188} {"train_loss": -40.358253479003906, "global_step": 143814, "epoch": 1188} {"train_loss": -39.93254470825195, "global_step": 143815, "epoch": 1188} {"train_loss": -39.347267150878906, "global_step": 143816, "epoch": 1188} {"train_loss": -39.99233627319336, "global_step": 143817, "epoch": 1188} {"train_loss": -39.416561126708984, "global_step": 143818, "epoch": 1188} {"train_loss": -39.65092849731445, "global_step": 143819, "epoch": 1188} {"train_loss": -40.21700668334961, "global_step": 143820, "epoch": 1188} {"train_loss": -40.23533248901367, "global_step": 143821, "epoch": 1188} {"train_loss": -40.004798889160156, "global_step": 143822, "epoch": 1188} {"train_loss": -39.54340362548828, "global_step": 143823, "epoch": 1188} {"train_loss": -40.55467987060547, "global_step": 143824, "epoch": 1188} {"train_loss": -38.82772445678711, "global_step": 143825, "epoch": 1188} {"train_loss": -39.430641174316406, "global_step": 143826, "epoch": 1188} {"train_loss": -38.754188537597656, "global_step": 143827, "epoch": 1188} {"train_loss": -38.41087341308594, "global_step": 143828, "epoch": 1188} {"train_loss": -39.082923889160156, "global_step": 143829, "epoch": 1188} {"train_loss": -40.08405303955078, "global_step": 143830, "epoch": 1188} {"train_loss": -37.1335334777832, "global_step": 143831, "epoch": 1188} {"train_loss": -38.539485931396484, "global_step": 143832, "epoch": 1188} {"train_loss": -39.59845733642578, "global_step": 143833, "epoch": 1188} {"train_loss": -39.819332122802734, "global_step": 143834, "epoch": 1188} {"train_loss": -39.24862289428711, "global_step": 143835, "epoch": 1188} {"train_loss": -40.2703971862793, "global_step": 143836, "epoch": 1188} {"train_loss": -40.70845413208008, "global_step": 143837, "epoch": 1188} {"train_loss": -38.5647087097168, "global_step": 143838, "epoch": 1188} {"train_loss": -40.23127365112305, "global_step": 143839, "epoch": 1188} {"train_loss": -39.87034225463867, "global_step": 143840, "epoch": 1188} {"train_loss": -40.21488571166992, "global_step": 143841, "epoch": 1188} {"train_loss": -39.99779510498047, "global_step": 143842, "epoch": 1188} {"train_loss": -40.353694915771484, "global_step": 143843, "epoch": 1188} {"train_loss": -40.311920166015625, "global_step": 143844, "epoch": 1188} {"train_loss": -40.14181900024414, "global_step": 143845, "epoch": 1188} {"train_loss": -40.543701171875, "global_step": 143846, "epoch": 1188} {"train_loss": -39.96267318725586, "global_step": 143847, "epoch": 1188} {"train_loss": -39.68848419189453, "global_step": 143848, "epoch": 1188} {"train_loss": -40.335567474365234, "global_step": 143849, "epoch": 1188} {"train_loss": -39.93936538696289, "global_step": 143850, "epoch": 1188} {"train_loss": -40.1456413269043, "global_step": 143851, "epoch": 1188} {"train_loss": -40.09308624267578, "global_step": 143852, "epoch": 1188} {"train_loss": -40.62053298950195, "global_step": 143853, "epoch": 1188} {"train_loss": -39.974666595458984, "global_step": 143854, "epoch": 1188} {"train_loss": -39.27143096923828, "global_step": 143855, "epoch": 1188} {"train_loss": -40.09164047241211, "global_step": 143856, "epoch": 1188} {"train_loss": -40.59204864501953, "global_step": 143857, "epoch": 1188} {"train_loss": -40.02460479736328, "global_step": 143858, "epoch": 1188} {"train_loss": -40.30607223510742, "global_step": 143859, "epoch": 1188} {"train_loss": -40.85089111328125, "global_step": 143860, "epoch": 1188} {"train_loss": -39.952613830566406, "global_step": 143861, "epoch": 1188} {"train_loss": -39.36042404174805, "global_step": 143862, "epoch": 1188} {"train_loss": -40.58564758300781, "global_step": 143863, "epoch": 1188} {"train_loss": -39.113704681396484, "global_step": 143864, "epoch": 1188} {"train_loss": -39.34729766845703, "global_step": 143865, "epoch": 1188} {"train_loss": -40.26771926879883, "global_step": 143866, "epoch": 1188} {"train_loss": -40.159217834472656, "global_step": 143867, "epoch": 1188} {"train_loss": -39.62971253828569, "global_step": 143868, "epoch": 1188, "val_loss": 2602672.5} {"train_loss": -40.319026947021484, "global_step": 143869, "epoch": 1189} {"train_loss": -39.53778839111328, "global_step": 143870, "epoch": 1189} {"train_loss": -39.883453369140625, "global_step": 143871, "epoch": 1189} {"train_loss": -39.413238525390625, "global_step": 143872, "epoch": 1189} {"train_loss": -39.68935775756836, "global_step": 143873, "epoch": 1189} {"train_loss": -38.9190788269043, "global_step": 143874, "epoch": 1189} {"train_loss": -40.08623123168945, "global_step": 143875, "epoch": 1189} {"train_loss": -38.01698303222656, "global_step": 143876, "epoch": 1189} {"train_loss": -38.22308349609375, "global_step": 143877, "epoch": 1189} {"train_loss": -39.07001876831055, "global_step": 143878, "epoch": 1189} {"train_loss": -39.84469223022461, "global_step": 143879, "epoch": 1189} {"train_loss": -40.4501838684082, "global_step": 143880, "epoch": 1189} {"train_loss": -40.20687484741211, "global_step": 143881, "epoch": 1189} {"train_loss": -40.3411750793457, "global_step": 143882, "epoch": 1189} {"train_loss": -39.71812057495117, "global_step": 143883, "epoch": 1189} {"train_loss": -40.02407455444336, "global_step": 143884, "epoch": 1189} {"train_loss": -38.59428024291992, "global_step": 143885, "epoch": 1189} {"train_loss": -39.21799850463867, "global_step": 143886, "epoch": 1189} {"train_loss": -39.207420349121094, "global_step": 143887, "epoch": 1189} {"train_loss": -39.918182373046875, "global_step": 143888, "epoch": 1189} {"train_loss": -38.61953353881836, "global_step": 143889, "epoch": 1189} {"train_loss": -40.926395416259766, "global_step": 143890, "epoch": 1189} {"train_loss": -40.1890869140625, "global_step": 143891, "epoch": 1189} {"train_loss": -39.76063919067383, "global_step": 143892, "epoch": 1189} {"train_loss": -38.1410026550293, "global_step": 143893, "epoch": 1189} {"train_loss": -35.670265197753906, "global_step": 143894, "epoch": 1189} {"train_loss": -37.16796112060547, "global_step": 143895, "epoch": 1189} {"train_loss": -38.45166015625, "global_step": 143896, "epoch": 1189} {"train_loss": -39.583309173583984, "global_step": 143897, "epoch": 1189} {"train_loss": -36.55361557006836, "global_step": 143898, "epoch": 1189} {"train_loss": -36.28947067260742, "global_step": 143899, "epoch": 1189} {"train_loss": -36.9688835144043, "global_step": 143900, "epoch": 1189} {"train_loss": -40.00593185424805, "global_step": 143901, "epoch": 1189} {"train_loss": -37.67299270629883, "global_step": 143902, "epoch": 1189} {"train_loss": -37.14798355102539, "global_step": 143903, "epoch": 1189} {"train_loss": -39.00565719604492, "global_step": 143904, "epoch": 1189} {"train_loss": -39.6280632019043, "global_step": 143905, "epoch": 1189} {"train_loss": -38.70176315307617, "global_step": 143906, "epoch": 1189} {"train_loss": -39.86955642700195, "global_step": 143907, "epoch": 1189} {"train_loss": -39.50584030151367, "global_step": 143908, "epoch": 1189} {"train_loss": -40.090911865234375, "global_step": 143909, "epoch": 1189} {"train_loss": -39.43362045288086, "global_step": 143910, "epoch": 1189} {"train_loss": -40.006465911865234, "global_step": 143911, "epoch": 1189} {"train_loss": -40.01155471801758, "global_step": 143912, "epoch": 1189} {"train_loss": -37.08852767944336, "global_step": 143913, "epoch": 1189} {"train_loss": -38.175086975097656, "global_step": 143914, "epoch": 1189} {"train_loss": -39.63543701171875, "global_step": 143915, "epoch": 1189} {"train_loss": -39.38051223754883, "global_step": 143916, "epoch": 1189} {"train_loss": -39.541770935058594, "global_step": 143917, "epoch": 1189} {"train_loss": -38.9150276184082, "global_step": 143918, "epoch": 1189} {"train_loss": -39.18659210205078, "global_step": 143919, "epoch": 1189} {"train_loss": -38.63676452636719, "global_step": 143920, "epoch": 1189} {"train_loss": -38.53802490234375, "global_step": 143921, "epoch": 1189} {"train_loss": -39.07835006713867, "global_step": 143922, "epoch": 1189} {"train_loss": -37.817745208740234, "global_step": 143923, "epoch": 1189} {"train_loss": -37.48017501831055, "global_step": 143924, "epoch": 1189} {"train_loss": -38.55057907104492, "global_step": 143925, "epoch": 1189} {"train_loss": -37.60982131958008, "global_step": 143926, "epoch": 1189} {"train_loss": -39.0717887878418, "global_step": 143927, "epoch": 1189} {"train_loss": -39.6663932800293, "global_step": 143928, "epoch": 1189} {"train_loss": -39.65178298950195, "global_step": 143929, "epoch": 1189} {"train_loss": -40.56249237060547, "global_step": 143930, "epoch": 1189} {"train_loss": -35.88423538208008, "global_step": 143931, "epoch": 1189} {"train_loss": -39.94883346557617, "global_step": 143932, "epoch": 1189} {"train_loss": -38.836181640625, "global_step": 143933, "epoch": 1189} {"train_loss": -38.16238021850586, "global_step": 143934, "epoch": 1189} {"train_loss": -38.89384841918945, "global_step": 143935, "epoch": 1189} {"train_loss": -39.532508850097656, "global_step": 143936, "epoch": 1189} {"train_loss": -38.97953414916992, "global_step": 143937, "epoch": 1189} {"train_loss": -39.68245315551758, "global_step": 143938, "epoch": 1189} {"train_loss": -38.35785675048828, "global_step": 143939, "epoch": 1189} {"train_loss": -39.9691276550293, "global_step": 143940, "epoch": 1189} {"train_loss": -39.79066848754883, "global_step": 143941, "epoch": 1189} {"train_loss": -39.10560607910156, "global_step": 143942, "epoch": 1189} {"train_loss": -39.954341888427734, "global_step": 143943, "epoch": 1189} {"train_loss": -40.110260009765625, "global_step": 143944, "epoch": 1189} {"train_loss": -39.894718170166016, "global_step": 143945, "epoch": 1189} {"train_loss": -40.42725372314453, "global_step": 143946, "epoch": 1189} {"train_loss": -38.76828384399414, "global_step": 143947, "epoch": 1189} {"train_loss": -39.24858474731445, "global_step": 143948, "epoch": 1189} {"train_loss": -40.13922119140625, "global_step": 143949, "epoch": 1189} {"train_loss": -40.70867919921875, "global_step": 143950, "epoch": 1189} {"train_loss": -38.66892623901367, "global_step": 143951, "epoch": 1189} {"train_loss": -40.290855407714844, "global_step": 143952, "epoch": 1189} {"train_loss": -39.057804107666016, "global_step": 143953, "epoch": 1189} {"train_loss": -39.35000228881836, "global_step": 143954, "epoch": 1189} {"train_loss": -39.56391525268555, "global_step": 143955, "epoch": 1189} {"train_loss": -39.94194793701172, "global_step": 143956, "epoch": 1189} {"train_loss": -40.26423263549805, "global_step": 143957, "epoch": 1189} {"train_loss": -40.1214485168457, "global_step": 143958, "epoch": 1189} {"train_loss": -39.020023345947266, "global_step": 143959, "epoch": 1189} {"train_loss": -39.01438522338867, "global_step": 143960, "epoch": 1189} {"train_loss": -39.1727409362793, "global_step": 143961, "epoch": 1189} {"train_loss": -40.49059295654297, "global_step": 143962, "epoch": 1189} {"train_loss": -38.599056243896484, "global_step": 143963, "epoch": 1189} {"train_loss": -40.33297348022461, "global_step": 143964, "epoch": 1189} {"train_loss": -40.04990768432617, "global_step": 143965, "epoch": 1189} {"train_loss": -38.996788024902344, "global_step": 143966, "epoch": 1189} {"train_loss": -39.417816162109375, "global_step": 143967, "epoch": 1189} {"train_loss": -38.64252471923828, "global_step": 143968, "epoch": 1189} {"train_loss": -39.68824768066406, "global_step": 143969, "epoch": 1189} {"train_loss": -39.11098861694336, "global_step": 143970, "epoch": 1189} {"train_loss": -40.27408981323242, "global_step": 143971, "epoch": 1189} {"train_loss": -39.233619689941406, "global_step": 143972, "epoch": 1189} {"train_loss": -38.716896057128906, "global_step": 143973, "epoch": 1189} {"train_loss": -39.89335250854492, "global_step": 143974, "epoch": 1189} {"train_loss": -40.07594299316406, "global_step": 143975, "epoch": 1189} {"train_loss": -38.284339904785156, "global_step": 143976, "epoch": 1189} {"train_loss": -36.6235237121582, "global_step": 143977, "epoch": 1189} {"train_loss": -38.196136474609375, "global_step": 143978, "epoch": 1189} {"train_loss": -39.399147033691406, "global_step": 143979, "epoch": 1189} {"train_loss": -36.59123611450195, "global_step": 143980, "epoch": 1189} {"train_loss": -39.662696838378906, "global_step": 143981, "epoch": 1189} {"train_loss": -39.619773864746094, "global_step": 143982, "epoch": 1189} {"train_loss": -38.78874588012695, "global_step": 143983, "epoch": 1189} {"train_loss": -40.39384078979492, "global_step": 143984, "epoch": 1189} {"train_loss": -39.37833786010742, "global_step": 143985, "epoch": 1189} {"train_loss": -39.51707077026367, "global_step": 143986, "epoch": 1189} {"train_loss": -40.41950225830078, "global_step": 143987, "epoch": 1189} {"train_loss": -39.40501022338867, "global_step": 143988, "epoch": 1189} {"train_loss": -39.16672345626453, "global_step": 143989, "epoch": 1189, "val_loss": 2531785.5} {"train_loss": -40.14333724975586, "global_step": 143990, "epoch": 1190} {"train_loss": -39.7398681640625, "global_step": 143991, "epoch": 1190} {"train_loss": -40.8003044128418, "global_step": 143992, "epoch": 1190} {"train_loss": -38.04967498779297, "global_step": 143993, "epoch": 1190} {"train_loss": -39.93592071533203, "global_step": 143994, "epoch": 1190} {"train_loss": -40.13900375366211, "global_step": 143995, "epoch": 1190} {"train_loss": -39.263973236083984, "global_step": 143996, "epoch": 1190} {"train_loss": -40.7922248840332, "global_step": 143997, "epoch": 1190} {"train_loss": -38.89115905761719, "global_step": 143998, "epoch": 1190} {"train_loss": -39.913082122802734, "global_step": 143999, "epoch": 1190} {"train_loss": -40.19480514526367, "global_step": 144000, "epoch": 1190} {"train_loss": -40.79751205444336, "global_step": 144001, "epoch": 1190} {"train_loss": -40.14533233642578, "global_step": 144002, "epoch": 1190} {"train_loss": -40.87327194213867, "global_step": 144003, "epoch": 1190} {"train_loss": -39.734371185302734, "global_step": 144004, "epoch": 1190} {"train_loss": -38.6786003112793, "global_step": 144005, "epoch": 1190} {"train_loss": -39.37277603149414, "global_step": 144006, "epoch": 1190} {"train_loss": -36.3018684387207, "global_step": 144007, "epoch": 1190} {"train_loss": -39.81650161743164, "global_step": 144008, "epoch": 1190} {"train_loss": -38.774173736572266, "global_step": 144009, "epoch": 1190} {"train_loss": -39.76682662963867, "global_step": 144010, "epoch": 1190} {"train_loss": -40.0908317565918, "global_step": 144011, "epoch": 1190} {"train_loss": -40.61738967895508, "global_step": 144012, "epoch": 1190} {"train_loss": -38.93662643432617, "global_step": 144013, "epoch": 1190} {"train_loss": -39.77541732788086, "global_step": 144014, "epoch": 1190} {"train_loss": -39.926692962646484, "global_step": 144015, "epoch": 1190} {"train_loss": -39.74522399902344, "global_step": 144016, "epoch": 1190} {"train_loss": -37.41828155517578, "global_step": 144017, "epoch": 1190} {"train_loss": -40.42542266845703, "global_step": 144018, "epoch": 1190} {"train_loss": -39.539249420166016, "global_step": 144019, "epoch": 1190} {"train_loss": -39.48600387573242, "global_step": 144020, "epoch": 1190} {"train_loss": -38.841651916503906, "global_step": 144021, "epoch": 1190} {"train_loss": -39.45408248901367, "global_step": 144022, "epoch": 1190} {"train_loss": -39.75895309448242, "global_step": 144023, "epoch": 1190} {"train_loss": -39.57746505737305, "global_step": 144024, "epoch": 1190} {"train_loss": -39.25919723510742, "global_step": 144025, "epoch": 1190} {"train_loss": -39.87672805786133, "global_step": 144026, "epoch": 1190} {"train_loss": -39.62993240356445, "global_step": 144027, "epoch": 1190} {"train_loss": -40.12175369262695, "global_step": 144028, "epoch": 1190} {"train_loss": -39.804561614990234, "global_step": 144029, "epoch": 1190} {"train_loss": -39.64919662475586, "global_step": 144030, "epoch": 1190} {"train_loss": -39.5501708984375, "global_step": 144031, "epoch": 1190} {"train_loss": -40.08208465576172, "global_step": 144032, "epoch": 1190} {"train_loss": -39.77163314819336, "global_step": 144033, "epoch": 1190} {"train_loss": -40.14498519897461, "global_step": 144034, "epoch": 1190} {"train_loss": -39.16622543334961, "global_step": 144035, "epoch": 1190} {"train_loss": -40.031253814697266, "global_step": 144036, "epoch": 1190} {"train_loss": -40.14470291137695, "global_step": 144037, "epoch": 1190} {"train_loss": -38.401153564453125, "global_step": 144038, "epoch": 1190} {"train_loss": -37.0949821472168, "global_step": 144039, "epoch": 1190} {"train_loss": -39.1236457824707, "global_step": 144040, "epoch": 1190} {"train_loss": -40.429237365722656, "global_step": 144041, "epoch": 1190} {"train_loss": -40.2545051574707, "global_step": 144042, "epoch": 1190} {"train_loss": -40.02824020385742, "global_step": 144043, "epoch": 1190} {"train_loss": -40.4317626953125, "global_step": 144044, "epoch": 1190} {"train_loss": -39.544288635253906, "global_step": 144045, "epoch": 1190} {"train_loss": -39.373512268066406, "global_step": 144046, "epoch": 1190} {"train_loss": -37.695030212402344, "global_step": 144047, "epoch": 1190} {"train_loss": -38.98196029663086, "global_step": 144048, "epoch": 1190} {"train_loss": -40.17625045776367, "global_step": 144049, "epoch": 1190} {"train_loss": -39.574520111083984, "global_step": 144050, "epoch": 1190} {"train_loss": -38.31779861450195, "global_step": 144051, "epoch": 1190} {"train_loss": -38.75996780395508, "global_step": 144052, "epoch": 1190} {"train_loss": -39.33283615112305, "global_step": 144053, "epoch": 1190} {"train_loss": -40.14040756225586, "global_step": 144054, "epoch": 1190} {"train_loss": -38.491512298583984, "global_step": 144055, "epoch": 1190} {"train_loss": -40.16796112060547, "global_step": 144056, "epoch": 1190} {"train_loss": -39.2943000793457, "global_step": 144057, "epoch": 1190} {"train_loss": -39.60449981689453, "global_step": 144058, "epoch": 1190} {"train_loss": -40.216270446777344, "global_step": 144059, "epoch": 1190} {"train_loss": -40.307796478271484, "global_step": 144060, "epoch": 1190} {"train_loss": -39.525665283203125, "global_step": 144061, "epoch": 1190} {"train_loss": -39.90583419799805, "global_step": 144062, "epoch": 1190} {"train_loss": -40.95960998535156, "global_step": 144063, "epoch": 1190} {"train_loss": -39.644874572753906, "global_step": 144064, "epoch": 1190} {"train_loss": -39.817508697509766, "global_step": 144065, "epoch": 1190} {"train_loss": -40.51958084106445, "global_step": 144066, "epoch": 1190} {"train_loss": -39.44674301147461, "global_step": 144067, "epoch": 1190} {"train_loss": -39.67380905151367, "global_step": 144068, "epoch": 1190} {"train_loss": -40.10380935668945, "global_step": 144069, "epoch": 1190} {"train_loss": -40.39545440673828, "global_step": 144070, "epoch": 1190} {"train_loss": -40.95873260498047, "global_step": 144071, "epoch": 1190} {"train_loss": -37.50008773803711, "global_step": 144072, "epoch": 1190} {"train_loss": -38.990234375, "global_step": 144073, "epoch": 1190} {"train_loss": -38.818206787109375, "global_step": 144074, "epoch": 1190} {"train_loss": -38.0025520324707, "global_step": 144075, "epoch": 1190} {"train_loss": -39.636329650878906, "global_step": 144076, "epoch": 1190} {"train_loss": -38.66868209838867, "global_step": 144077, "epoch": 1190} {"train_loss": -39.818782806396484, "global_step": 144078, "epoch": 1190} {"train_loss": -39.24137496948242, "global_step": 144079, "epoch": 1190} {"train_loss": -39.48368453979492, "global_step": 144080, "epoch": 1190} {"train_loss": -40.13251495361328, "global_step": 144081, "epoch": 1190} {"train_loss": -40.19404220581055, "global_step": 144082, "epoch": 1190} {"train_loss": -39.54479217529297, "global_step": 144083, "epoch": 1190} {"train_loss": -39.900325775146484, "global_step": 144084, "epoch": 1190} {"train_loss": -40.95270919799805, "global_step": 144085, "epoch": 1190} {"train_loss": -40.28938674926758, "global_step": 144086, "epoch": 1190} {"train_loss": -39.42412567138672, "global_step": 144087, "epoch": 1190} {"train_loss": -40.45046615600586, "global_step": 144088, "epoch": 1190} {"train_loss": -40.43465042114258, "global_step": 144089, "epoch": 1190} {"train_loss": -39.79996871948242, "global_step": 144090, "epoch": 1190} {"train_loss": -40.427154541015625, "global_step": 144091, "epoch": 1190} {"train_loss": -38.19016647338867, "global_step": 144092, "epoch": 1190} {"train_loss": -39.853370666503906, "global_step": 144093, "epoch": 1190} {"train_loss": -37.29553985595703, "global_step": 144094, "epoch": 1190} {"train_loss": -39.875240325927734, "global_step": 144095, "epoch": 1190} {"train_loss": -40.68124008178711, "global_step": 144096, "epoch": 1190} {"train_loss": -40.3291015625, "global_step": 144097, "epoch": 1190} {"train_loss": -40.40979766845703, "global_step": 144098, "epoch": 1190} {"train_loss": -39.485897064208984, "global_step": 144099, "epoch": 1190} {"train_loss": -40.315345764160156, "global_step": 144100, "epoch": 1190} {"train_loss": -40.36727523803711, "global_step": 144101, "epoch": 1190} {"train_loss": -41.14506912231445, "global_step": 144102, "epoch": 1190} {"train_loss": -39.63228988647461, "global_step": 144103, "epoch": 1190} {"train_loss": -39.96770095825195, "global_step": 144104, "epoch": 1190} {"train_loss": -40.31154251098633, "global_step": 144105, "epoch": 1190} {"train_loss": -38.38141632080078, "global_step": 144106, "epoch": 1190} {"train_loss": -40.0235595703125, "global_step": 144107, "epoch": 1190} {"train_loss": -39.98067855834961, "global_step": 144108, "epoch": 1190} {"train_loss": -39.92924880981445, "global_step": 144109, "epoch": 1190} {"train_loss": -39.644626365220255, "global_step": 144110, "epoch": 1190, "val_loss": 2706256.0} {"train_loss": -39.92354965209961, "global_step": 144111, "epoch": 1191} {"train_loss": -40.32479476928711, "global_step": 144112, "epoch": 1191} {"train_loss": -39.3286018371582, "global_step": 144113, "epoch": 1191} {"train_loss": -39.924598693847656, "global_step": 144114, "epoch": 1191} {"train_loss": -40.5026969909668, "global_step": 144115, "epoch": 1191} {"train_loss": -40.271175384521484, "global_step": 144116, "epoch": 1191} {"train_loss": -39.612060546875, "global_step": 144117, "epoch": 1191} {"train_loss": -39.70992660522461, "global_step": 144118, "epoch": 1191} {"train_loss": -39.46956253051758, "global_step": 144119, "epoch": 1191} {"train_loss": -39.69245529174805, "global_step": 144120, "epoch": 1191} {"train_loss": -40.35347366333008, "global_step": 144121, "epoch": 1191} {"train_loss": -40.474220275878906, "global_step": 144122, "epoch": 1191} {"train_loss": -39.17660140991211, "global_step": 144123, "epoch": 1191} {"train_loss": -39.560035705566406, "global_step": 144124, "epoch": 1191} {"train_loss": -39.69148635864258, "global_step": 144125, "epoch": 1191} {"train_loss": -40.7667236328125, "global_step": 144126, "epoch": 1191} {"train_loss": -40.628807067871094, "global_step": 144127, "epoch": 1191} {"train_loss": -40.49131393432617, "global_step": 144128, "epoch": 1191} {"train_loss": -40.20707702636719, "global_step": 144129, "epoch": 1191} {"train_loss": -40.542030334472656, "global_step": 144130, "epoch": 1191} {"train_loss": -40.16791915893555, "global_step": 144131, "epoch": 1191} {"train_loss": -40.7938346862793, "global_step": 144132, "epoch": 1191} {"train_loss": -39.891998291015625, "global_step": 144133, "epoch": 1191} {"train_loss": -40.54377365112305, "global_step": 144134, "epoch": 1191} {"train_loss": -40.652809143066406, "global_step": 144135, "epoch": 1191} {"train_loss": -39.752471923828125, "global_step": 144136, "epoch": 1191} {"train_loss": -39.981964111328125, "global_step": 144137, "epoch": 1191} {"train_loss": -39.6818962097168, "global_step": 144138, "epoch": 1191} {"train_loss": -41.16313171386719, "global_step": 144139, "epoch": 1191} {"train_loss": -40.529659271240234, "global_step": 144140, "epoch": 1191} {"train_loss": -40.00170135498047, "global_step": 144141, "epoch": 1191} {"train_loss": -39.05295944213867, "global_step": 144142, "epoch": 1191} {"train_loss": -39.4014778137207, "global_step": 144143, "epoch": 1191} {"train_loss": -40.74494552612305, "global_step": 144144, "epoch": 1191} {"train_loss": -40.509727478027344, "global_step": 144145, "epoch": 1191} {"train_loss": -40.74868392944336, "global_step": 144146, "epoch": 1191} {"train_loss": -40.15726852416992, "global_step": 144147, "epoch": 1191} {"train_loss": -38.94352340698242, "global_step": 144148, "epoch": 1191} {"train_loss": -38.37839889526367, "global_step": 144149, "epoch": 1191} {"train_loss": -37.46702194213867, "global_step": 144150, "epoch": 1191} {"train_loss": -38.795841217041016, "global_step": 144151, "epoch": 1191} {"train_loss": -32.598243713378906, "global_step": 144152, "epoch": 1191} {"train_loss": -37.053592681884766, "global_step": 144153, "epoch": 1191} {"train_loss": -38.41795349121094, "global_step": 144154, "epoch": 1191} {"train_loss": -35.357234954833984, "global_step": 144155, "epoch": 1191} {"train_loss": -39.23930740356445, "global_step": 144156, "epoch": 1191} {"train_loss": -36.032501220703125, "global_step": 144157, "epoch": 1191} {"train_loss": -34.61207962036133, "global_step": 144158, "epoch": 1191} {"train_loss": -38.924903869628906, "global_step": 144159, "epoch": 1191} {"train_loss": -36.45443344116211, "global_step": 144160, "epoch": 1191} {"train_loss": -34.783016204833984, "global_step": 144161, "epoch": 1191} {"train_loss": -38.13859558105469, "global_step": 144162, "epoch": 1191} {"train_loss": -38.6626091003418, "global_step": 144163, "epoch": 1191} {"train_loss": -34.24518585205078, "global_step": 144164, "epoch": 1191} {"train_loss": -39.59165573120117, "global_step": 144165, "epoch": 1191} {"train_loss": -37.19646072387695, "global_step": 144166, "epoch": 1191} {"train_loss": -34.789608001708984, "global_step": 144167, "epoch": 1191} {"train_loss": -26.263822555541992, "global_step": 144168, "epoch": 1191} {"train_loss": -37.56633377075195, "global_step": 144169, "epoch": 1191} {"train_loss": -37.760128021240234, "global_step": 144170, "epoch": 1191} {"train_loss": -37.781551361083984, "global_step": 144171, "epoch": 1191} {"train_loss": -30.983844757080078, "global_step": 144172, "epoch": 1191} {"train_loss": -36.08576965332031, "global_step": 144173, "epoch": 1191} {"train_loss": -32.2767333984375, "global_step": 144174, "epoch": 1191} {"train_loss": -37.7656135559082, "global_step": 144175, "epoch": 1191} {"train_loss": -36.7515869140625, "global_step": 144176, "epoch": 1191} {"train_loss": -36.22562789916992, "global_step": 144177, "epoch": 1191} {"train_loss": -24.374771118164062, "global_step": 144178, "epoch": 1191} {"train_loss": -36.222572326660156, "global_step": 144179, "epoch": 1191} {"train_loss": -34.268165588378906, "global_step": 144180, "epoch": 1191} {"train_loss": -37.094581604003906, "global_step": 144181, "epoch": 1191} {"train_loss": -33.95478057861328, "global_step": 144182, "epoch": 1191} {"train_loss": -35.46806716918945, "global_step": 144183, "epoch": 1191} {"train_loss": -32.47615432739258, "global_step": 144184, "epoch": 1191} {"train_loss": -33.925254821777344, "global_step": 144185, "epoch": 1191} {"train_loss": -25.132802963256836, "global_step": 144186, "epoch": 1191} {"train_loss": -34.74485397338867, "global_step": 144187, "epoch": 1191} {"train_loss": -35.26229476928711, "global_step": 144188, "epoch": 1191} {"train_loss": -34.22659683227539, "global_step": 144189, "epoch": 1191} {"train_loss": -33.691856384277344, "global_step": 144190, "epoch": 1191} {"train_loss": -35.267555236816406, "global_step": 144191, "epoch": 1191} {"train_loss": -35.56770706176758, "global_step": 144192, "epoch": 1191} {"train_loss": -36.5611686706543, "global_step": 144193, "epoch": 1191} {"train_loss": -37.359825134277344, "global_step": 144194, "epoch": 1191} {"train_loss": -37.1096076965332, "global_step": 144195, "epoch": 1191} {"train_loss": -37.44677734375, "global_step": 144196, "epoch": 1191} {"train_loss": -37.129817962646484, "global_step": 144197, "epoch": 1191} {"train_loss": -36.77485275268555, "global_step": 144198, "epoch": 1191} {"train_loss": -36.90180587768555, "global_step": 144199, "epoch": 1191} {"train_loss": -35.91770553588867, "global_step": 144200, "epoch": 1191} {"train_loss": -37.404109954833984, "global_step": 144201, "epoch": 1191} {"train_loss": -36.13029861450195, "global_step": 144202, "epoch": 1191} {"train_loss": -38.22365951538086, "global_step": 144203, "epoch": 1191} {"train_loss": -37.90167236328125, "global_step": 144204, "epoch": 1191} {"train_loss": -37.794002532958984, "global_step": 144205, "epoch": 1191} {"train_loss": -38.41079330444336, "global_step": 144206, "epoch": 1191} {"train_loss": -38.579017639160156, "global_step": 144207, "epoch": 1191} {"train_loss": -37.41762924194336, "global_step": 144208, "epoch": 1191} {"train_loss": -38.076717376708984, "global_step": 144209, "epoch": 1191} {"train_loss": -36.72053146362305, "global_step": 144210, "epoch": 1191} {"train_loss": -37.64285659790039, "global_step": 144211, "epoch": 1191} {"train_loss": -38.07879638671875, "global_step": 144212, "epoch": 1191} {"train_loss": -38.210330963134766, "global_step": 144213, "epoch": 1191} {"train_loss": -38.74769973754883, "global_step": 144214, "epoch": 1191} {"train_loss": -38.37640380859375, "global_step": 144215, "epoch": 1191} {"train_loss": -37.20701217651367, "global_step": 144216, "epoch": 1191} {"train_loss": -36.74225616455078, "global_step": 144217, "epoch": 1191} {"train_loss": -36.69513702392578, "global_step": 144218, "epoch": 1191} {"train_loss": -38.499725341796875, "global_step": 144219, "epoch": 1191} {"train_loss": -37.72175979614258, "global_step": 144220, "epoch": 1191} {"train_loss": -38.40792465209961, "global_step": 144221, "epoch": 1191} {"train_loss": -38.5335807800293, "global_step": 144222, "epoch": 1191} {"train_loss": -38.08669662475586, "global_step": 144223, "epoch": 1191} {"train_loss": -38.35603713989258, "global_step": 144224, "epoch": 1191} {"train_loss": -38.38888168334961, "global_step": 144225, "epoch": 1191} {"train_loss": -39.14089584350586, "global_step": 144226, "epoch": 1191} {"train_loss": -38.37577438354492, "global_step": 144227, "epoch": 1191} {"train_loss": -38.938167572021484, "global_step": 144228, "epoch": 1191} {"train_loss": -38.785491943359375, "global_step": 144229, "epoch": 1191} {"train_loss": -37.839874267578125, "global_step": 144230, "epoch": 1191} {"train_loss": -37.584667111231276, "global_step": 144231, "epoch": 1191, "val_loss": 2635143.0} {"train_loss": -39.15354537963867, "global_step": 144232, "epoch": 1192} {"train_loss": -39.52174758911133, "global_step": 144233, "epoch": 1192} {"train_loss": -39.338050842285156, "global_step": 144234, "epoch": 1192} {"train_loss": -38.359615325927734, "global_step": 144235, "epoch": 1192} {"train_loss": -39.507625579833984, "global_step": 144236, "epoch": 1192} {"train_loss": -38.48459243774414, "global_step": 144237, "epoch": 1192} {"train_loss": -39.150665283203125, "global_step": 144238, "epoch": 1192} {"train_loss": -39.516746520996094, "global_step": 144239, "epoch": 1192} {"train_loss": -39.41868209838867, "global_step": 144240, "epoch": 1192} {"train_loss": -38.99656677246094, "global_step": 144241, "epoch": 1192} {"train_loss": -39.23822021484375, "global_step": 144242, "epoch": 1192} {"train_loss": -39.45919418334961, "global_step": 144243, "epoch": 1192} {"train_loss": -37.86875534057617, "global_step": 144244, "epoch": 1192} {"train_loss": -39.6069450378418, "global_step": 144245, "epoch": 1192} {"train_loss": -39.56563186645508, "global_step": 144246, "epoch": 1192} {"train_loss": -39.642066955566406, "global_step": 144247, "epoch": 1192} {"train_loss": -39.31624221801758, "global_step": 144248, "epoch": 1192} {"train_loss": -40.03109359741211, "global_step": 144249, "epoch": 1192} {"train_loss": -39.64866256713867, "global_step": 144250, "epoch": 1192} {"train_loss": -39.91237258911133, "global_step": 144251, "epoch": 1192} {"train_loss": -39.65230941772461, "global_step": 144252, "epoch": 1192} {"train_loss": -39.91556930541992, "global_step": 144253, "epoch": 1192} {"train_loss": -39.70126724243164, "global_step": 144254, "epoch": 1192} {"train_loss": -39.535255432128906, "global_step": 144255, "epoch": 1192} {"train_loss": -39.485286712646484, "global_step": 144256, "epoch": 1192} {"train_loss": -40.076351165771484, "global_step": 144257, "epoch": 1192} {"train_loss": -39.172725677490234, "global_step": 144258, "epoch": 1192} {"train_loss": -39.61616134643555, "global_step": 144259, "epoch": 1192} {"train_loss": -40.01607131958008, "global_step": 144260, "epoch": 1192} {"train_loss": -40.30534744262695, "global_step": 144261, "epoch": 1192} {"train_loss": -40.048316955566406, "global_step": 144262, "epoch": 1192} {"train_loss": -38.571678161621094, "global_step": 144263, "epoch": 1192} {"train_loss": -40.28020477294922, "global_step": 144264, "epoch": 1192} {"train_loss": -40.055477142333984, "global_step": 144265, "epoch": 1192} {"train_loss": -40.565242767333984, "global_step": 144266, "epoch": 1192} {"train_loss": -39.966121673583984, "global_step": 144267, "epoch": 1192} {"train_loss": -39.62794876098633, "global_step": 144268, "epoch": 1192} {"train_loss": -39.78468322753906, "global_step": 144269, "epoch": 1192} {"train_loss": -40.08382797241211, "global_step": 144270, "epoch": 1192} {"train_loss": -39.89284133911133, "global_step": 144271, "epoch": 1192} {"train_loss": -39.85024642944336, "global_step": 144272, "epoch": 1192} {"train_loss": -40.104408264160156, "global_step": 144273, "epoch": 1192} {"train_loss": -39.75087356567383, "global_step": 144274, "epoch": 1192} {"train_loss": -39.91704177856445, "global_step": 144275, "epoch": 1192} {"train_loss": -39.354854583740234, "global_step": 144276, "epoch": 1192} {"train_loss": -38.72284698486328, "global_step": 144277, "epoch": 1192} {"train_loss": -38.72964859008789, "global_step": 144278, "epoch": 1192} {"train_loss": -37.55748748779297, "global_step": 144279, "epoch": 1192} {"train_loss": -39.25675582885742, "global_step": 144280, "epoch": 1192} {"train_loss": -39.42396545410156, "global_step": 144281, "epoch": 1192} {"train_loss": -38.699459075927734, "global_step": 144282, "epoch": 1192} {"train_loss": -40.07693099975586, "global_step": 144283, "epoch": 1192} {"train_loss": -40.521907806396484, "global_step": 144284, "epoch": 1192} {"train_loss": -39.9307861328125, "global_step": 144285, "epoch": 1192} {"train_loss": -38.96418380737305, "global_step": 144286, "epoch": 1192} {"train_loss": -39.329429626464844, "global_step": 144287, "epoch": 1192} {"train_loss": -39.766754150390625, "global_step": 144288, "epoch": 1192} {"train_loss": -39.82149124145508, "global_step": 144289, "epoch": 1192} {"train_loss": -39.96516036987305, "global_step": 144290, "epoch": 1192} {"train_loss": -40.139644622802734, "global_step": 144291, "epoch": 1192} {"train_loss": -39.144309997558594, "global_step": 144292, "epoch": 1192} {"train_loss": -39.495269775390625, "global_step": 144293, "epoch": 1192} {"train_loss": -40.734039306640625, "global_step": 144294, "epoch": 1192} {"train_loss": -40.234954833984375, "global_step": 144295, "epoch": 1192} {"train_loss": -39.21163558959961, "global_step": 144296, "epoch": 1192} {"train_loss": -40.0461311340332, "global_step": 144297, "epoch": 1192} {"train_loss": -39.5608024597168, "global_step": 144298, "epoch": 1192} {"train_loss": -39.94635009765625, "global_step": 144299, "epoch": 1192} {"train_loss": -38.7894287109375, "global_step": 144300, "epoch": 1192} {"train_loss": -39.0604133605957, "global_step": 144301, "epoch": 1192} {"train_loss": -38.92764663696289, "global_step": 144302, "epoch": 1192} {"train_loss": -39.760467529296875, "global_step": 144303, "epoch": 1192} {"train_loss": -40.338409423828125, "global_step": 144304, "epoch": 1192} {"train_loss": -40.065101623535156, "global_step": 144305, "epoch": 1192} {"train_loss": -39.52860641479492, "global_step": 144306, "epoch": 1192} {"train_loss": -39.497196197509766, "global_step": 144307, "epoch": 1192} {"train_loss": -39.5866813659668, "global_step": 144308, "epoch": 1192} {"train_loss": -39.50867462158203, "global_step": 144309, "epoch": 1192} {"train_loss": -39.110260009765625, "global_step": 144310, "epoch": 1192} {"train_loss": -39.90403366088867, "global_step": 144311, "epoch": 1192} {"train_loss": -40.154842376708984, "global_step": 144312, "epoch": 1192} {"train_loss": -40.26774978637695, "global_step": 144313, "epoch": 1192} {"train_loss": -39.695247650146484, "global_step": 144314, "epoch": 1192} {"train_loss": -39.73683547973633, "global_step": 144315, "epoch": 1192} {"train_loss": -40.2526969909668, "global_step": 144316, "epoch": 1192} {"train_loss": -40.88679885864258, "global_step": 144317, "epoch": 1192} {"train_loss": -40.54787826538086, "global_step": 144318, "epoch": 1192} {"train_loss": -39.148983001708984, "global_step": 144319, "epoch": 1192} {"train_loss": -38.98681640625, "global_step": 144320, "epoch": 1192} {"train_loss": -39.55671310424805, "global_step": 144321, "epoch": 1192} {"train_loss": -36.99653625488281, "global_step": 144322, "epoch": 1192} {"train_loss": -36.57343292236328, "global_step": 144323, "epoch": 1192} {"train_loss": -36.73887252807617, "global_step": 144324, "epoch": 1192} {"train_loss": -39.894283294677734, "global_step": 144325, "epoch": 1192} {"train_loss": -38.08122253417969, "global_step": 144326, "epoch": 1192} {"train_loss": -38.54303741455078, "global_step": 144327, "epoch": 1192} {"train_loss": -36.14979934692383, "global_step": 144328, "epoch": 1192} {"train_loss": -38.3725471496582, "global_step": 144329, "epoch": 1192} {"train_loss": -39.82511520385742, "global_step": 144330, "epoch": 1192} {"train_loss": -39.43671417236328, "global_step": 144331, "epoch": 1192} {"train_loss": -37.81172561645508, "global_step": 144332, "epoch": 1192} {"train_loss": -35.953487396240234, "global_step": 144333, "epoch": 1192} {"train_loss": -35.18479919433594, "global_step": 144334, "epoch": 1192} {"train_loss": -39.0463752746582, "global_step": 144335, "epoch": 1192} {"train_loss": -35.546661376953125, "global_step": 144336, "epoch": 1192} {"train_loss": -33.826072692871094, "global_step": 144337, "epoch": 1192} {"train_loss": -34.926666259765625, "global_step": 144338, "epoch": 1192} {"train_loss": -39.64846420288086, "global_step": 144339, "epoch": 1192} {"train_loss": -33.58763122558594, "global_step": 144340, "epoch": 1192} {"train_loss": -36.96355438232422, "global_step": 144341, "epoch": 1192} {"train_loss": -37.10210037231445, "global_step": 144342, "epoch": 1192} {"train_loss": -37.24888229370117, "global_step": 144343, "epoch": 1192} {"train_loss": -38.29769515991211, "global_step": 144344, "epoch": 1192} {"train_loss": -37.65532302856445, "global_step": 144345, "epoch": 1192} {"train_loss": -37.22408676147461, "global_step": 144346, "epoch": 1192} {"train_loss": -38.84589767456055, "global_step": 144347, "epoch": 1192} {"train_loss": -38.00635528564453, "global_step": 144348, "epoch": 1192} {"train_loss": -39.918182373046875, "global_step": 144349, "epoch": 1192} {"train_loss": -38.49220657348633, "global_step": 144350, "epoch": 1192} {"train_loss": -38.19112014770508, "global_step": 144351, "epoch": 1192} {"train_loss": -39.064113553890515, "global_step": 144352, "epoch": 1192, "val_loss": 2686044.25} {"train_loss": -38.30988693237305, "global_step": 144353, "epoch": 1193} {"train_loss": -39.84076690673828, "global_step": 144354, "epoch": 1193} {"train_loss": -39.01144790649414, "global_step": 144355, "epoch": 1193} {"train_loss": -38.72913360595703, "global_step": 144356, "epoch": 1193} {"train_loss": -39.1331672668457, "global_step": 144357, "epoch": 1193} {"train_loss": -39.31403350830078, "global_step": 144358, "epoch": 1193} {"train_loss": -38.81257247924805, "global_step": 144359, "epoch": 1193} {"train_loss": -39.64215850830078, "global_step": 144360, "epoch": 1193} {"train_loss": -38.98501968383789, "global_step": 144361, "epoch": 1193} {"train_loss": -39.38230514526367, "global_step": 144362, "epoch": 1193} {"train_loss": -39.005760192871094, "global_step": 144363, "epoch": 1193} {"train_loss": -38.6553955078125, "global_step": 144364, "epoch": 1193} {"train_loss": -39.12837600708008, "global_step": 144365, "epoch": 1193} {"train_loss": -38.876319885253906, "global_step": 144366, "epoch": 1193} {"train_loss": -39.64547348022461, "global_step": 144367, "epoch": 1193} {"train_loss": -39.914947509765625, "global_step": 144368, "epoch": 1193} {"train_loss": -39.383506774902344, "global_step": 144369, "epoch": 1193} {"train_loss": -40.129188537597656, "global_step": 144370, "epoch": 1193} {"train_loss": -38.71179962158203, "global_step": 144371, "epoch": 1193} {"train_loss": -39.78173065185547, "global_step": 144372, "epoch": 1193} {"train_loss": -39.717872619628906, "global_step": 144373, "epoch": 1193} {"train_loss": -38.29042053222656, "global_step": 144374, "epoch": 1193} {"train_loss": -39.944698333740234, "global_step": 144375, "epoch": 1193} {"train_loss": -39.956016540527344, "global_step": 144376, "epoch": 1193} {"train_loss": -39.88219451904297, "global_step": 144377, "epoch": 1193} {"train_loss": -39.34723663330078, "global_step": 144378, "epoch": 1193} {"train_loss": -39.82729721069336, "global_step": 144379, "epoch": 1193} {"train_loss": -40.26487350463867, "global_step": 144380, "epoch": 1193} {"train_loss": -40.290584564208984, "global_step": 144381, "epoch": 1193} {"train_loss": -40.028656005859375, "global_step": 144382, "epoch": 1193} {"train_loss": -40.11690902709961, "global_step": 144383, "epoch": 1193} {"train_loss": -39.57734298706055, "global_step": 144384, "epoch": 1193} {"train_loss": -40.48843002319336, "global_step": 144385, "epoch": 1193} {"train_loss": -39.71465301513672, "global_step": 144386, "epoch": 1193} {"train_loss": -37.37726593017578, "global_step": 144387, "epoch": 1193} {"train_loss": -35.00492477416992, "global_step": 144388, "epoch": 1193} {"train_loss": -36.96706008911133, "global_step": 144389, "epoch": 1193} {"train_loss": -37.914756774902344, "global_step": 144390, "epoch": 1193} {"train_loss": -39.546199798583984, "global_step": 144391, "epoch": 1193} {"train_loss": -40.25431442260742, "global_step": 144392, "epoch": 1193} {"train_loss": -38.237281799316406, "global_step": 144393, "epoch": 1193} {"train_loss": -36.7525749206543, "global_step": 144394, "epoch": 1193} {"train_loss": -38.67056655883789, "global_step": 144395, "epoch": 1193} {"train_loss": -40.343353271484375, "global_step": 144396, "epoch": 1193} {"train_loss": -37.713836669921875, "global_step": 144397, "epoch": 1193} {"train_loss": -37.1920051574707, "global_step": 144398, "epoch": 1193} {"train_loss": -40.25358200073242, "global_step": 144399, "epoch": 1193} {"train_loss": -38.52360153198242, "global_step": 144400, "epoch": 1193} {"train_loss": -38.502681732177734, "global_step": 144401, "epoch": 1193} {"train_loss": -39.62710189819336, "global_step": 144402, "epoch": 1193} {"train_loss": -39.101806640625, "global_step": 144403, "epoch": 1193} {"train_loss": -40.0853385925293, "global_step": 144404, "epoch": 1193} {"train_loss": -39.9456787109375, "global_step": 144405, "epoch": 1193} {"train_loss": -40.20307540893555, "global_step": 144406, "epoch": 1193} {"train_loss": -40.066307067871094, "global_step": 144407, "epoch": 1193} {"train_loss": -39.42600631713867, "global_step": 144408, "epoch": 1193} {"train_loss": -40.43348693847656, "global_step": 144409, "epoch": 1193} {"train_loss": -40.04286575317383, "global_step": 144410, "epoch": 1193} {"train_loss": -40.46930694580078, "global_step": 144411, "epoch": 1193} {"train_loss": -40.092323303222656, "global_step": 144412, "epoch": 1193} {"train_loss": -40.39692306518555, "global_step": 144413, "epoch": 1193} {"train_loss": -40.36567687988281, "global_step": 144414, "epoch": 1193} {"train_loss": -40.89388656616211, "global_step": 144415, "epoch": 1193} {"train_loss": -40.41706466674805, "global_step": 144416, "epoch": 1193} {"train_loss": -40.06455612182617, "global_step": 144417, "epoch": 1193} {"train_loss": -40.397247314453125, "global_step": 144418, "epoch": 1193} {"train_loss": -39.87270736694336, "global_step": 144419, "epoch": 1193} {"train_loss": -40.76920700073242, "global_step": 144420, "epoch": 1193} {"train_loss": -40.45460510253906, "global_step": 144421, "epoch": 1193} {"train_loss": -40.73613357543945, "global_step": 144422, "epoch": 1193} {"train_loss": -41.151344299316406, "global_step": 144423, "epoch": 1193} {"train_loss": -40.573524475097656, "global_step": 144424, "epoch": 1193} {"train_loss": -40.483829498291016, "global_step": 144425, "epoch": 1193} {"train_loss": -40.79291915893555, "global_step": 144426, "epoch": 1193} {"train_loss": -40.79975128173828, "global_step": 144427, "epoch": 1193} {"train_loss": -41.236690521240234, "global_step": 144428, "epoch": 1193} {"train_loss": -40.86509704589844, "global_step": 144429, "epoch": 1193} {"train_loss": -41.342506408691406, "global_step": 144430, "epoch": 1193} {"train_loss": -41.11130905151367, "global_step": 144431, "epoch": 1193} {"train_loss": -40.935089111328125, "global_step": 144432, "epoch": 1193} {"train_loss": -41.163761138916016, "global_step": 144433, "epoch": 1193} {"train_loss": -41.29609298706055, "global_step": 144434, "epoch": 1193} {"train_loss": -40.11198425292969, "global_step": 144435, "epoch": 1193} {"train_loss": -40.06246566772461, "global_step": 144436, "epoch": 1193} {"train_loss": -40.47423553466797, "global_step": 144437, "epoch": 1193} {"train_loss": -40.546669006347656, "global_step": 144438, "epoch": 1193} {"train_loss": -41.176761627197266, "global_step": 144439, "epoch": 1193} {"train_loss": -40.92332077026367, "global_step": 144440, "epoch": 1193} {"train_loss": -41.18060302734375, "global_step": 144441, "epoch": 1193} {"train_loss": -41.48604965209961, "global_step": 144442, "epoch": 1193} {"train_loss": -40.981964111328125, "global_step": 144443, "epoch": 1193} {"train_loss": -41.195377349853516, "global_step": 144444, "epoch": 1193} {"train_loss": -40.82725143432617, "global_step": 144445, "epoch": 1193} {"train_loss": -40.97426986694336, "global_step": 144446, "epoch": 1193} {"train_loss": -40.22323226928711, "global_step": 144447, "epoch": 1193} {"train_loss": -39.22367477416992, "global_step": 144448, "epoch": 1193} {"train_loss": -40.00868225097656, "global_step": 144449, "epoch": 1193} {"train_loss": -39.61846160888672, "global_step": 144450, "epoch": 1193} {"train_loss": -39.76094436645508, "global_step": 144451, "epoch": 1193} {"train_loss": -38.20192337036133, "global_step": 144452, "epoch": 1193} {"train_loss": -39.1474609375, "global_step": 144453, "epoch": 1193} {"train_loss": -38.36896514892578, "global_step": 144454, "epoch": 1193} {"train_loss": -36.580841064453125, "global_step": 144455, "epoch": 1193} {"train_loss": -35.607879638671875, "global_step": 144456, "epoch": 1193} {"train_loss": -38.17949295043945, "global_step": 144457, "epoch": 1193} {"train_loss": -38.3358039855957, "global_step": 144458, "epoch": 1193} {"train_loss": -36.562801361083984, "global_step": 144459, "epoch": 1193} {"train_loss": -34.7252311706543, "global_step": 144460, "epoch": 1193} {"train_loss": -32.517486572265625, "global_step": 144461, "epoch": 1193} {"train_loss": -35.853370666503906, "global_step": 144462, "epoch": 1193} {"train_loss": -35.749237060546875, "global_step": 144463, "epoch": 1193} {"train_loss": -35.7490234375, "global_step": 144464, "epoch": 1193} {"train_loss": -37.622066497802734, "global_step": 144465, "epoch": 1193} {"train_loss": -34.790992736816406, "global_step": 144466, "epoch": 1193} {"train_loss": -36.74880599975586, "global_step": 144467, "epoch": 1193} {"train_loss": -37.8808708190918, "global_step": 144468, "epoch": 1193} {"train_loss": -37.104854583740234, "global_step": 144469, "epoch": 1193} {"train_loss": -38.65803146362305, "global_step": 144470, "epoch": 1193} {"train_loss": -37.3591423034668, "global_step": 144471, "epoch": 1193} {"train_loss": -39.64216232299805, "global_step": 144472, "epoch": 1193} {"train_loss": -39.27229561293421, "global_step": 144473, "epoch": 1193, "val_loss": 2672721.75} {"train_loss": -38.55257797241211, "global_step": 144474, "epoch": 1194} {"train_loss": -37.692832946777344, "global_step": 144475, "epoch": 1194} {"train_loss": -38.874568939208984, "global_step": 144476, "epoch": 1194} {"train_loss": -39.1328239440918, "global_step": 144477, "epoch": 1194} {"train_loss": -38.535884857177734, "global_step": 144478, "epoch": 1194} {"train_loss": -39.682098388671875, "global_step": 144479, "epoch": 1194} {"train_loss": -39.15446853637695, "global_step": 144480, "epoch": 1194} {"train_loss": -38.459686279296875, "global_step": 144481, "epoch": 1194} {"train_loss": -39.415283203125, "global_step": 144482, "epoch": 1194} {"train_loss": -39.28723907470703, "global_step": 144483, "epoch": 1194} {"train_loss": -39.76497268676758, "global_step": 144484, "epoch": 1194} {"train_loss": -39.83476638793945, "global_step": 144485, "epoch": 1194} {"train_loss": -39.92669677734375, "global_step": 144486, "epoch": 1194} {"train_loss": -40.228858947753906, "global_step": 144487, "epoch": 1194} {"train_loss": -39.688758850097656, "global_step": 144488, "epoch": 1194} {"train_loss": -39.6534309387207, "global_step": 144489, "epoch": 1194} {"train_loss": -39.90644454956055, "global_step": 144490, "epoch": 1194} {"train_loss": -40.068233489990234, "global_step": 144491, "epoch": 1194} {"train_loss": -40.014404296875, "global_step": 144492, "epoch": 1194} {"train_loss": -39.3250732421875, "global_step": 144493, "epoch": 1194} {"train_loss": -39.7100944519043, "global_step": 144494, "epoch": 1194} {"train_loss": -39.867305755615234, "global_step": 144495, "epoch": 1194} {"train_loss": -40.04664993286133, "global_step": 144496, "epoch": 1194} {"train_loss": -40.577301025390625, "global_step": 144497, "epoch": 1194} {"train_loss": -40.18031311035156, "global_step": 144498, "epoch": 1194} {"train_loss": -40.5701904296875, "global_step": 144499, "epoch": 1194} {"train_loss": -40.3530387878418, "global_step": 144500, "epoch": 1194} {"train_loss": -40.58103942871094, "global_step": 144501, "epoch": 1194} {"train_loss": -40.64229965209961, "global_step": 144502, "epoch": 1194} {"train_loss": -40.786842346191406, "global_step": 144503, "epoch": 1194} {"train_loss": -40.49772262573242, "global_step": 144504, "epoch": 1194} {"train_loss": -39.87309646606445, "global_step": 144505, "epoch": 1194} {"train_loss": -40.4543571472168, "global_step": 144506, "epoch": 1194} {"train_loss": -40.65535354614258, "global_step": 144507, "epoch": 1194} {"train_loss": -40.86941146850586, "global_step": 144508, "epoch": 1194} {"train_loss": -40.21022415161133, "global_step": 144509, "epoch": 1194} {"train_loss": -39.264373779296875, "global_step": 144510, "epoch": 1194} {"train_loss": -40.20783615112305, "global_step": 144511, "epoch": 1194} {"train_loss": -40.6171989440918, "global_step": 144512, "epoch": 1194} {"train_loss": -40.557247161865234, "global_step": 144513, "epoch": 1194} {"train_loss": -40.890438079833984, "global_step": 144514, "epoch": 1194} {"train_loss": -41.05080795288086, "global_step": 144515, "epoch": 1194} {"train_loss": -40.90504455566406, "global_step": 144516, "epoch": 1194} {"train_loss": -40.261409759521484, "global_step": 144517, "epoch": 1194} {"train_loss": -39.32588195800781, "global_step": 144518, "epoch": 1194} {"train_loss": -40.5274772644043, "global_step": 144519, "epoch": 1194} {"train_loss": -41.280208587646484, "global_step": 144520, "epoch": 1194} {"train_loss": -40.6754264831543, "global_step": 144521, "epoch": 1194} {"train_loss": -39.331825256347656, "global_step": 144522, "epoch": 1194} {"train_loss": -40.79390335083008, "global_step": 144523, "epoch": 1194} {"train_loss": -41.11300277709961, "global_step": 144524, "epoch": 1194} {"train_loss": -40.274940490722656, "global_step": 144525, "epoch": 1194} {"train_loss": -40.90240478515625, "global_step": 144526, "epoch": 1194} {"train_loss": -40.810462951660156, "global_step": 144527, "epoch": 1194} {"train_loss": -40.48853302001953, "global_step": 144528, "epoch": 1194} {"train_loss": -38.60514450073242, "global_step": 144529, "epoch": 1194} {"train_loss": -40.45109939575195, "global_step": 144530, "epoch": 1194} {"train_loss": -40.5029411315918, "global_step": 144531, "epoch": 1194} {"train_loss": -40.57307815551758, "global_step": 144532, "epoch": 1194} {"train_loss": -39.69776153564453, "global_step": 144533, "epoch": 1194} {"train_loss": -39.62553024291992, "global_step": 144534, "epoch": 1194} {"train_loss": -38.662654876708984, "global_step": 144535, "epoch": 1194} {"train_loss": -38.407684326171875, "global_step": 144536, "epoch": 1194} {"train_loss": -40.45082092285156, "global_step": 144537, "epoch": 1194} {"train_loss": -40.199119567871094, "global_step": 144538, "epoch": 1194} {"train_loss": -40.471343994140625, "global_step": 144539, "epoch": 1194} {"train_loss": -39.42930221557617, "global_step": 144540, "epoch": 1194} {"train_loss": -35.95443344116211, "global_step": 144541, "epoch": 1194} {"train_loss": -36.62315368652344, "global_step": 144542, "epoch": 1194} {"train_loss": -39.57086944580078, "global_step": 144543, "epoch": 1194} {"train_loss": -40.469085693359375, "global_step": 144544, "epoch": 1194} {"train_loss": -36.256954193115234, "global_step": 144545, "epoch": 1194} {"train_loss": -35.95378494262695, "global_step": 144546, "epoch": 1194} {"train_loss": -35.16873550415039, "global_step": 144547, "epoch": 1194} {"train_loss": -35.70475387573242, "global_step": 144548, "epoch": 1194} {"train_loss": -35.40151596069336, "global_step": 144549, "epoch": 1194} {"train_loss": -39.29039001464844, "global_step": 144550, "epoch": 1194} {"train_loss": -37.612674713134766, "global_step": 144551, "epoch": 1194} {"train_loss": -38.50566864013672, "global_step": 144552, "epoch": 1194} {"train_loss": -38.281795501708984, "global_step": 144553, "epoch": 1194} {"train_loss": -37.06909942626953, "global_step": 144554, "epoch": 1194} {"train_loss": -37.821937561035156, "global_step": 144555, "epoch": 1194} {"train_loss": -38.72108459472656, "global_step": 144556, "epoch": 1194} {"train_loss": -38.404354095458984, "global_step": 144557, "epoch": 1194} {"train_loss": -37.039188385009766, "global_step": 144558, "epoch": 1194} {"train_loss": -37.729366302490234, "global_step": 144559, "epoch": 1194} {"train_loss": -37.0406379699707, "global_step": 144560, "epoch": 1194} {"train_loss": -35.83382034301758, "global_step": 144561, "epoch": 1194} {"train_loss": -38.91349411010742, "global_step": 144562, "epoch": 1194} {"train_loss": -39.44538116455078, "global_step": 144563, "epoch": 1194} {"train_loss": -39.15507125854492, "global_step": 144564, "epoch": 1194} {"train_loss": -38.93832015991211, "global_step": 144565, "epoch": 1194} {"train_loss": -38.7595329284668, "global_step": 144566, "epoch": 1194} {"train_loss": -38.57558059692383, "global_step": 144567, "epoch": 1194} {"train_loss": -39.81161117553711, "global_step": 144568, "epoch": 1194} {"train_loss": -37.74569320678711, "global_step": 144569, "epoch": 1194} {"train_loss": -39.789791107177734, "global_step": 144570, "epoch": 1194} {"train_loss": -39.1185188293457, "global_step": 144571, "epoch": 1194} {"train_loss": -39.44378662109375, "global_step": 144572, "epoch": 1194} {"train_loss": -39.04329299926758, "global_step": 144573, "epoch": 1194} {"train_loss": -39.805870056152344, "global_step": 144574, "epoch": 1194} {"train_loss": -38.574092864990234, "global_step": 144575, "epoch": 1194} {"train_loss": -39.90983200073242, "global_step": 144576, "epoch": 1194} {"train_loss": -40.106971740722656, "global_step": 144577, "epoch": 1194} {"train_loss": -39.34614181518555, "global_step": 144578, "epoch": 1194} {"train_loss": -39.564205169677734, "global_step": 144579, "epoch": 1194} {"train_loss": -40.38685989379883, "global_step": 144580, "epoch": 1194} {"train_loss": -38.675262451171875, "global_step": 144581, "epoch": 1194} {"train_loss": -39.59762191772461, "global_step": 144582, "epoch": 1194} {"train_loss": -39.16522216796875, "global_step": 144583, "epoch": 1194} {"train_loss": -40.4345703125, "global_step": 144584, "epoch": 1194} {"train_loss": -39.98186111450195, "global_step": 144585, "epoch": 1194} {"train_loss": -39.72846603393555, "global_step": 144586, "epoch": 1194} {"train_loss": -39.93097686767578, "global_step": 144587, "epoch": 1194} {"train_loss": -40.531612396240234, "global_step": 144588, "epoch": 1194} {"train_loss": -39.809452056884766, "global_step": 144589, "epoch": 1194} {"train_loss": -40.1991081237793, "global_step": 144590, "epoch": 1194} {"train_loss": -40.29682540893555, "global_step": 144591, "epoch": 1194} {"train_loss": -40.06526565551758, "global_step": 144592, "epoch": 1194} {"train_loss": -39.89379119873047, "global_step": 144593, "epoch": 1194} {"train_loss": -39.41509435984714, "global_step": 144594, "epoch": 1194, "val_loss": 2732238.0} {"train_loss": -39.883155822753906, "global_step": 144595, "epoch": 1195} {"train_loss": -39.833675384521484, "global_step": 144596, "epoch": 1195} {"train_loss": -38.8356819152832, "global_step": 144597, "epoch": 1195} {"train_loss": -37.87826156616211, "global_step": 144598, "epoch": 1195} {"train_loss": -40.02533721923828, "global_step": 144599, "epoch": 1195} {"train_loss": -40.322792053222656, "global_step": 144600, "epoch": 1195} {"train_loss": -38.736751556396484, "global_step": 144601, "epoch": 1195} {"train_loss": -37.515602111816406, "global_step": 144602, "epoch": 1195} {"train_loss": -37.832420349121094, "global_step": 144603, "epoch": 1195} {"train_loss": -40.05654525756836, "global_step": 144604, "epoch": 1195} {"train_loss": -40.257179260253906, "global_step": 144605, "epoch": 1195} {"train_loss": -38.60934066772461, "global_step": 144606, "epoch": 1195} {"train_loss": -40.37986373901367, "global_step": 144607, "epoch": 1195} {"train_loss": -39.14582061767578, "global_step": 144608, "epoch": 1195} {"train_loss": -37.28968048095703, "global_step": 144609, "epoch": 1195} {"train_loss": -38.875885009765625, "global_step": 144610, "epoch": 1195} {"train_loss": -40.30100631713867, "global_step": 144611, "epoch": 1195} {"train_loss": -38.44105529785156, "global_step": 144612, "epoch": 1195} {"train_loss": -39.55765914916992, "global_step": 144613, "epoch": 1195} {"train_loss": -40.39312744140625, "global_step": 144614, "epoch": 1195} {"train_loss": -38.58535385131836, "global_step": 144615, "epoch": 1195} {"train_loss": -39.674251556396484, "global_step": 144616, "epoch": 1195} {"train_loss": -40.883056640625, "global_step": 144617, "epoch": 1195} {"train_loss": -38.85401916503906, "global_step": 144618, "epoch": 1195} {"train_loss": -40.168243408203125, "global_step": 144619, "epoch": 1195} {"train_loss": -40.09840774536133, "global_step": 144620, "epoch": 1195} {"train_loss": -39.223236083984375, "global_step": 144621, "epoch": 1195} {"train_loss": -40.07593536376953, "global_step": 144622, "epoch": 1195} {"train_loss": -39.76068878173828, "global_step": 144623, "epoch": 1195} {"train_loss": -39.275569915771484, "global_step": 144624, "epoch": 1195} {"train_loss": -39.46442794799805, "global_step": 144625, "epoch": 1195} {"train_loss": -40.64332962036133, "global_step": 144626, "epoch": 1195} {"train_loss": -39.18463897705078, "global_step": 144627, "epoch": 1195} {"train_loss": -40.297607421875, "global_step": 144628, "epoch": 1195} {"train_loss": -39.2241096496582, "global_step": 144629, "epoch": 1195} {"train_loss": -40.09563064575195, "global_step": 144630, "epoch": 1195} {"train_loss": -39.206390380859375, "global_step": 144631, "epoch": 1195} {"train_loss": -40.34367752075195, "global_step": 144632, "epoch": 1195} {"train_loss": -39.45172119140625, "global_step": 144633, "epoch": 1195} {"train_loss": -40.201351165771484, "global_step": 144634, "epoch": 1195} {"train_loss": -39.77657699584961, "global_step": 144635, "epoch": 1195} {"train_loss": -39.97918701171875, "global_step": 144636, "epoch": 1195} {"train_loss": -40.15949249267578, "global_step": 144637, "epoch": 1195} {"train_loss": -40.035335540771484, "global_step": 144638, "epoch": 1195} {"train_loss": -40.687835693359375, "global_step": 144639, "epoch": 1195} {"train_loss": -40.072147369384766, "global_step": 144640, "epoch": 1195} {"train_loss": -40.01809310913086, "global_step": 144641, "epoch": 1195} {"train_loss": -40.39898681640625, "global_step": 144642, "epoch": 1195} {"train_loss": -39.902278900146484, "global_step": 144643, "epoch": 1195} {"train_loss": -40.58486557006836, "global_step": 144644, "epoch": 1195} {"train_loss": -40.129146575927734, "global_step": 144645, "epoch": 1195} {"train_loss": -40.89533996582031, "global_step": 144646, "epoch": 1195} {"train_loss": -40.13103103637695, "global_step": 144647, "epoch": 1195} {"train_loss": -41.06604766845703, "global_step": 144648, "epoch": 1195} {"train_loss": -40.49113082885742, "global_step": 144649, "epoch": 1195} {"train_loss": -40.4679069519043, "global_step": 144650, "epoch": 1195} {"train_loss": -40.994842529296875, "global_step": 144651, "epoch": 1195} {"train_loss": -40.946022033691406, "global_step": 144652, "epoch": 1195} {"train_loss": -40.76084899902344, "global_step": 144653, "epoch": 1195} {"train_loss": -40.75308609008789, "global_step": 144654, "epoch": 1195} {"train_loss": -41.0925178527832, "global_step": 144655, "epoch": 1195} {"train_loss": -41.0294189453125, "global_step": 144656, "epoch": 1195} {"train_loss": -41.26865005493164, "global_step": 144657, "epoch": 1195} {"train_loss": -40.217369079589844, "global_step": 144658, "epoch": 1195} {"train_loss": -40.84434127807617, "global_step": 144659, "epoch": 1195} {"train_loss": -40.98926544189453, "global_step": 144660, "epoch": 1195} {"train_loss": -40.58530807495117, "global_step": 144661, "epoch": 1195} {"train_loss": -39.89744186401367, "global_step": 144662, "epoch": 1195} {"train_loss": -40.79169845581055, "global_step": 144663, "epoch": 1195} {"train_loss": -40.51625442504883, "global_step": 144664, "epoch": 1195} {"train_loss": -40.94915771484375, "global_step": 144665, "epoch": 1195} {"train_loss": -40.3422737121582, "global_step": 144666, "epoch": 1195} {"train_loss": -40.59551239013672, "global_step": 144667, "epoch": 1195} {"train_loss": -40.63520812988281, "global_step": 144668, "epoch": 1195} {"train_loss": -40.440765380859375, "global_step": 144669, "epoch": 1195} {"train_loss": -40.46489334106445, "global_step": 144670, "epoch": 1195} {"train_loss": -41.072509765625, "global_step": 144671, "epoch": 1195} {"train_loss": -40.054298400878906, "global_step": 144672, "epoch": 1195} {"train_loss": -40.57619857788086, "global_step": 144673, "epoch": 1195} {"train_loss": -40.596866607666016, "global_step": 144674, "epoch": 1195} {"train_loss": -40.80918502807617, "global_step": 144675, "epoch": 1195} {"train_loss": -39.54275131225586, "global_step": 144676, "epoch": 1195} {"train_loss": -40.23033142089844, "global_step": 144677, "epoch": 1195} {"train_loss": -39.0513916015625, "global_step": 144678, "epoch": 1195} {"train_loss": -38.85988235473633, "global_step": 144679, "epoch": 1195} {"train_loss": -40.8536376953125, "global_step": 144680, "epoch": 1195} {"train_loss": -39.59994125366211, "global_step": 144681, "epoch": 1195} {"train_loss": -39.0091438293457, "global_step": 144682, "epoch": 1195} {"train_loss": -38.01674270629883, "global_step": 144683, "epoch": 1195} {"train_loss": -38.47608947753906, "global_step": 144684, "epoch": 1195} {"train_loss": -40.406837463378906, "global_step": 144685, "epoch": 1195} {"train_loss": -38.87579345703125, "global_step": 144686, "epoch": 1195} {"train_loss": -35.55060577392578, "global_step": 144687, "epoch": 1195} {"train_loss": -35.87038040161133, "global_step": 144688, "epoch": 1195} {"train_loss": -37.04694366455078, "global_step": 144689, "epoch": 1195} {"train_loss": -36.84749984741211, "global_step": 144690, "epoch": 1195} {"train_loss": -39.625579833984375, "global_step": 144691, "epoch": 1195} {"train_loss": -37.9985466003418, "global_step": 144692, "epoch": 1195} {"train_loss": -38.36716842651367, "global_step": 144693, "epoch": 1195} {"train_loss": -39.87367248535156, "global_step": 144694, "epoch": 1195} {"train_loss": -39.816612243652344, "global_step": 144695, "epoch": 1195} {"train_loss": -39.994529724121094, "global_step": 144696, "epoch": 1195} {"train_loss": -39.23994064331055, "global_step": 144697, "epoch": 1195} {"train_loss": -39.89583969116211, "global_step": 144698, "epoch": 1195} {"train_loss": -40.85380935668945, "global_step": 144699, "epoch": 1195} {"train_loss": -39.81974411010742, "global_step": 144700, "epoch": 1195} {"train_loss": -40.408531188964844, "global_step": 144701, "epoch": 1195} {"train_loss": -41.05876541137695, "global_step": 144702, "epoch": 1195} {"train_loss": -40.33614730834961, "global_step": 144703, "epoch": 1195} {"train_loss": -40.371891021728516, "global_step": 144704, "epoch": 1195} {"train_loss": -40.75345230102539, "global_step": 144705, "epoch": 1195} {"train_loss": -40.11800765991211, "global_step": 144706, "epoch": 1195} {"train_loss": -40.05585479736328, "global_step": 144707, "epoch": 1195} {"train_loss": -38.984676361083984, "global_step": 144708, "epoch": 1195} {"train_loss": -40.947391510009766, "global_step": 144709, "epoch": 1195} {"train_loss": -40.37007522583008, "global_step": 144710, "epoch": 1195} {"train_loss": -40.97252655029297, "global_step": 144711, "epoch": 1195} {"train_loss": -40.54047775268555, "global_step": 144712, "epoch": 1195} {"train_loss": -40.32141876220703, "global_step": 144713, "epoch": 1195} {"train_loss": -41.08669662475586, "global_step": 144714, "epoch": 1195} {"train_loss": -39.83906788471317, "global_step": 144715, "epoch": 1195, "val_loss": 2659953.0} {"train_loss": -41.14573287963867, "global_step": 144716, "epoch": 1196} {"train_loss": -40.34502410888672, "global_step": 144717, "epoch": 1196} {"train_loss": -40.291439056396484, "global_step": 144718, "epoch": 1196} {"train_loss": -41.16535186767578, "global_step": 144719, "epoch": 1196} {"train_loss": -40.585975646972656, "global_step": 144720, "epoch": 1196} {"train_loss": -40.5062141418457, "global_step": 144721, "epoch": 1196} {"train_loss": -38.72622299194336, "global_step": 144722, "epoch": 1196} {"train_loss": -40.77645492553711, "global_step": 144723, "epoch": 1196} {"train_loss": -39.48674011230469, "global_step": 144724, "epoch": 1196} {"train_loss": -40.657325744628906, "global_step": 144725, "epoch": 1196} {"train_loss": -40.67188262939453, "global_step": 144726, "epoch": 1196} {"train_loss": -40.68826675415039, "global_step": 144727, "epoch": 1196} {"train_loss": -38.73118209838867, "global_step": 144728, "epoch": 1196} {"train_loss": -40.654300689697266, "global_step": 144729, "epoch": 1196} {"train_loss": -39.177955627441406, "global_step": 144730, "epoch": 1196} {"train_loss": -40.0882682800293, "global_step": 144731, "epoch": 1196} {"train_loss": -38.174659729003906, "global_step": 144732, "epoch": 1196} {"train_loss": -39.462520599365234, "global_step": 144733, "epoch": 1196} {"train_loss": -39.023780822753906, "global_step": 144734, "epoch": 1196} {"train_loss": -37.397361755371094, "global_step": 144735, "epoch": 1196} {"train_loss": -38.33170700073242, "global_step": 144736, "epoch": 1196} {"train_loss": -40.08660125732422, "global_step": 144737, "epoch": 1196} {"train_loss": -40.14518356323242, "global_step": 144738, "epoch": 1196} {"train_loss": -39.53644943237305, "global_step": 144739, "epoch": 1196} {"train_loss": -39.24769973754883, "global_step": 144740, "epoch": 1196} {"train_loss": -39.587711334228516, "global_step": 144741, "epoch": 1196} {"train_loss": -40.313018798828125, "global_step": 144742, "epoch": 1196} {"train_loss": -40.21419143676758, "global_step": 144743, "epoch": 1196} {"train_loss": -40.31599044799805, "global_step": 144744, "epoch": 1196} {"train_loss": -39.979305267333984, "global_step": 144745, "epoch": 1196} {"train_loss": -39.92030715942383, "global_step": 144746, "epoch": 1196} {"train_loss": -40.45132064819336, "global_step": 144747, "epoch": 1196} {"train_loss": -39.56698989868164, "global_step": 144748, "epoch": 1196} {"train_loss": -38.469722747802734, "global_step": 144749, "epoch": 1196} {"train_loss": -38.95634460449219, "global_step": 144750, "epoch": 1196} {"train_loss": -38.247772216796875, "global_step": 144751, "epoch": 1196} {"train_loss": -39.446102142333984, "global_step": 144752, "epoch": 1196} {"train_loss": -39.72622299194336, "global_step": 144753, "epoch": 1196} {"train_loss": -39.980777740478516, "global_step": 144754, "epoch": 1196} {"train_loss": -37.367305755615234, "global_step": 144755, "epoch": 1196} {"train_loss": -38.36968994140625, "global_step": 144756, "epoch": 1196} {"train_loss": -40.00508499145508, "global_step": 144757, "epoch": 1196} {"train_loss": -40.041194915771484, "global_step": 144758, "epoch": 1196} {"train_loss": -37.0744514465332, "global_step": 144759, "epoch": 1196} {"train_loss": -36.095970153808594, "global_step": 144760, "epoch": 1196} {"train_loss": -39.3715934753418, "global_step": 144761, "epoch": 1196} {"train_loss": -39.79661560058594, "global_step": 144762, "epoch": 1196} {"train_loss": -39.6849250793457, "global_step": 144763, "epoch": 1196} {"train_loss": -39.528053283691406, "global_step": 144764, "epoch": 1196} {"train_loss": -39.344825744628906, "global_step": 144765, "epoch": 1196} {"train_loss": -38.784095764160156, "global_step": 144766, "epoch": 1196} {"train_loss": -40.64777374267578, "global_step": 144767, "epoch": 1196} {"train_loss": -39.33486557006836, "global_step": 144768, "epoch": 1196} {"train_loss": -39.877723693847656, "global_step": 144769, "epoch": 1196} {"train_loss": -39.15679931640625, "global_step": 144770, "epoch": 1196} {"train_loss": -39.2454719543457, "global_step": 144771, "epoch": 1196} {"train_loss": -38.522918701171875, "global_step": 144772, "epoch": 1196} {"train_loss": -39.93949508666992, "global_step": 144773, "epoch": 1196} {"train_loss": -39.847564697265625, "global_step": 144774, "epoch": 1196} {"train_loss": -38.786800384521484, "global_step": 144775, "epoch": 1196} {"train_loss": -38.54775619506836, "global_step": 144776, "epoch": 1196} {"train_loss": -39.85468292236328, "global_step": 144777, "epoch": 1196} {"train_loss": -39.88359832763672, "global_step": 144778, "epoch": 1196} {"train_loss": -38.589019775390625, "global_step": 144779, "epoch": 1196} {"train_loss": -38.72892379760742, "global_step": 144780, "epoch": 1196} {"train_loss": -40.044708251953125, "global_step": 144781, "epoch": 1196} {"train_loss": -39.28899002075195, "global_step": 144782, "epoch": 1196} {"train_loss": -39.47523880004883, "global_step": 144783, "epoch": 1196} {"train_loss": -39.0474967956543, "global_step": 144784, "epoch": 1196} {"train_loss": -39.196266174316406, "global_step": 144785, "epoch": 1196} {"train_loss": -40.447444915771484, "global_step": 144786, "epoch": 1196} {"train_loss": -40.23797607421875, "global_step": 144787, "epoch": 1196} {"train_loss": -39.193599700927734, "global_step": 144788, "epoch": 1196} {"train_loss": -40.51400375366211, "global_step": 144789, "epoch": 1196} {"train_loss": -40.440547943115234, "global_step": 144790, "epoch": 1196} {"train_loss": -40.477779388427734, "global_step": 144791, "epoch": 1196} {"train_loss": -39.991912841796875, "global_step": 144792, "epoch": 1196} {"train_loss": -40.34353256225586, "global_step": 144793, "epoch": 1196} {"train_loss": -38.880069732666016, "global_step": 144794, "epoch": 1196} {"train_loss": -40.79179000854492, "global_step": 144795, "epoch": 1196} {"train_loss": -41.02225112915039, "global_step": 144796, "epoch": 1196} {"train_loss": -40.40791702270508, "global_step": 144797, "epoch": 1196} {"train_loss": -40.60834884643555, "global_step": 144798, "epoch": 1196} {"train_loss": -41.0191535949707, "global_step": 144799, "epoch": 1196} {"train_loss": -40.883907318115234, "global_step": 144800, "epoch": 1196} {"train_loss": -40.65761184692383, "global_step": 144801, "epoch": 1196} {"train_loss": -40.1346435546875, "global_step": 144802, "epoch": 1196} {"train_loss": -40.28689193725586, "global_step": 144803, "epoch": 1196} {"train_loss": -40.95568084716797, "global_step": 144804, "epoch": 1196} {"train_loss": -40.81696701049805, "global_step": 144805, "epoch": 1196} {"train_loss": -39.11164855957031, "global_step": 144806, "epoch": 1196} {"train_loss": -41.03673553466797, "global_step": 144807, "epoch": 1196} {"train_loss": -40.74713897705078, "global_step": 144808, "epoch": 1196} {"train_loss": -40.7632942199707, "global_step": 144809, "epoch": 1196} {"train_loss": -39.952693939208984, "global_step": 144810, "epoch": 1196} {"train_loss": -40.154293060302734, "global_step": 144811, "epoch": 1196} {"train_loss": -40.75667190551758, "global_step": 144812, "epoch": 1196} {"train_loss": -41.24785232543945, "global_step": 144813, "epoch": 1196} {"train_loss": -39.49990463256836, "global_step": 144814, "epoch": 1196} {"train_loss": -41.009525299072266, "global_step": 144815, "epoch": 1196} {"train_loss": -40.551265716552734, "global_step": 144816, "epoch": 1196} {"train_loss": -40.20878219604492, "global_step": 144817, "epoch": 1196} {"train_loss": -40.78438949584961, "global_step": 144818, "epoch": 1196} {"train_loss": -41.09798049926758, "global_step": 144819, "epoch": 1196} {"train_loss": -40.92929458618164, "global_step": 144820, "epoch": 1196} {"train_loss": -40.26787185668945, "global_step": 144821, "epoch": 1196} {"train_loss": -36.97675704956055, "global_step": 144822, "epoch": 1196} {"train_loss": -38.84065628051758, "global_step": 144823, "epoch": 1196} {"train_loss": -39.342281341552734, "global_step": 144824, "epoch": 1196} {"train_loss": -41.167232513427734, "global_step": 144825, "epoch": 1196} {"train_loss": -39.10715866088867, "global_step": 144826, "epoch": 1196} {"train_loss": -40.104305267333984, "global_step": 144827, "epoch": 1196} {"train_loss": -39.4629020690918, "global_step": 144828, "epoch": 1196} {"train_loss": -40.400386810302734, "global_step": 144829, "epoch": 1196} {"train_loss": -40.616493225097656, "global_step": 144830, "epoch": 1196} {"train_loss": -39.91753005981445, "global_step": 144831, "epoch": 1196} {"train_loss": -40.29018783569336, "global_step": 144832, "epoch": 1196} {"train_loss": -40.05579376220703, "global_step": 144833, "epoch": 1196} {"train_loss": -40.370479583740234, "global_step": 144834, "epoch": 1196} {"train_loss": -39.9620246887207, "global_step": 144835, "epoch": 1196} {"train_loss": -39.7967259115424, "global_step": 144836, "epoch": 1196, "val_loss": 2945368.0} {"train_loss": -35.546852111816406, "global_step": 144837, "epoch": 1197} {"train_loss": -36.48893356323242, "global_step": 144838, "epoch": 1197} {"train_loss": -39.01461410522461, "global_step": 144839, "epoch": 1197} {"train_loss": -39.84690475463867, "global_step": 144840, "epoch": 1197} {"train_loss": -37.3828125, "global_step": 144841, "epoch": 1197} {"train_loss": -36.11832809448242, "global_step": 144842, "epoch": 1197} {"train_loss": -37.340538024902344, "global_step": 144843, "epoch": 1197} {"train_loss": -36.80405807495117, "global_step": 144844, "epoch": 1197} {"train_loss": -38.633277893066406, "global_step": 144845, "epoch": 1197} {"train_loss": -35.38051986694336, "global_step": 144846, "epoch": 1197} {"train_loss": -36.411529541015625, "global_step": 144847, "epoch": 1197} {"train_loss": -36.74262619018555, "global_step": 144848, "epoch": 1197} {"train_loss": -39.76529312133789, "global_step": 144849, "epoch": 1197} {"train_loss": -32.876705169677734, "global_step": 144850, "epoch": 1197} {"train_loss": -33.16764450073242, "global_step": 144851, "epoch": 1197} {"train_loss": -38.72343826293945, "global_step": 144852, "epoch": 1197} {"train_loss": -36.02995300292969, "global_step": 144853, "epoch": 1197} {"train_loss": -33.883338928222656, "global_step": 144854, "epoch": 1197} {"train_loss": -38.7826042175293, "global_step": 144855, "epoch": 1197} {"train_loss": -35.288551330566406, "global_step": 144856, "epoch": 1197} {"train_loss": -35.72161102294922, "global_step": 144857, "epoch": 1197} {"train_loss": -36.76913070678711, "global_step": 144858, "epoch": 1197} {"train_loss": -37.616729736328125, "global_step": 144859, "epoch": 1197} {"train_loss": -36.09434127807617, "global_step": 144860, "epoch": 1197} {"train_loss": -36.50623321533203, "global_step": 144861, "epoch": 1197} {"train_loss": -37.47675323486328, "global_step": 144862, "epoch": 1197} {"train_loss": -37.39019775390625, "global_step": 144863, "epoch": 1197} {"train_loss": -38.09648132324219, "global_step": 144864, "epoch": 1197} {"train_loss": -38.55001449584961, "global_step": 144865, "epoch": 1197} {"train_loss": -36.29480743408203, "global_step": 144866, "epoch": 1197} {"train_loss": -37.626583099365234, "global_step": 144867, "epoch": 1197} {"train_loss": -38.47887420654297, "global_step": 144868, "epoch": 1197} {"train_loss": -37.76053237915039, "global_step": 144869, "epoch": 1197} {"train_loss": -38.61436080932617, "global_step": 144870, "epoch": 1197} {"train_loss": -37.67732620239258, "global_step": 144871, "epoch": 1197} {"train_loss": -38.4178581237793, "global_step": 144872, "epoch": 1197} {"train_loss": -39.62636947631836, "global_step": 144873, "epoch": 1197} {"train_loss": -38.71619415283203, "global_step": 144874, "epoch": 1197} {"train_loss": -39.64302444458008, "global_step": 144875, "epoch": 1197} {"train_loss": -39.09764099121094, "global_step": 144876, "epoch": 1197} {"train_loss": -40.01252746582031, "global_step": 144877, "epoch": 1197} {"train_loss": -39.23540115356445, "global_step": 144878, "epoch": 1197} {"train_loss": -39.594093322753906, "global_step": 144879, "epoch": 1197} {"train_loss": -39.545589447021484, "global_step": 144880, "epoch": 1197} {"train_loss": -39.928951263427734, "global_step": 144881, "epoch": 1197} {"train_loss": -39.50796127319336, "global_step": 144882, "epoch": 1197} {"train_loss": -39.327857971191406, "global_step": 144883, "epoch": 1197} {"train_loss": -39.56736755371094, "global_step": 144884, "epoch": 1197} {"train_loss": -38.86603546142578, "global_step": 144885, "epoch": 1197} {"train_loss": -39.62844467163086, "global_step": 144886, "epoch": 1197} {"train_loss": -40.123138427734375, "global_step": 144887, "epoch": 1197} {"train_loss": -39.771270751953125, "global_step": 144888, "epoch": 1197} {"train_loss": -39.56489944458008, "global_step": 144889, "epoch": 1197} {"train_loss": -39.87786102294922, "global_step": 144890, "epoch": 1197} {"train_loss": -39.47503662109375, "global_step": 144891, "epoch": 1197} {"train_loss": -39.54066848754883, "global_step": 144892, "epoch": 1197} {"train_loss": -40.312042236328125, "global_step": 144893, "epoch": 1197} {"train_loss": -39.990638732910156, "global_step": 144894, "epoch": 1197} {"train_loss": -39.796321868896484, "global_step": 144895, "epoch": 1197} {"train_loss": -40.15156936645508, "global_step": 144896, "epoch": 1197} {"train_loss": -35.31019973754883, "global_step": 144897, "epoch": 1197} {"train_loss": -40.433345794677734, "global_step": 144898, "epoch": 1197} {"train_loss": -39.86851119995117, "global_step": 144899, "epoch": 1197} {"train_loss": -39.76412582397461, "global_step": 144900, "epoch": 1197} {"train_loss": -39.61970520019531, "global_step": 144901, "epoch": 1197} {"train_loss": -40.441585540771484, "global_step": 144902, "epoch": 1197} {"train_loss": -36.5397834777832, "global_step": 144903, "epoch": 1197} {"train_loss": -40.04619598388672, "global_step": 144904, "epoch": 1197} {"train_loss": -40.5549430847168, "global_step": 144905, "epoch": 1197} {"train_loss": -40.531333923339844, "global_step": 144906, "epoch": 1197} {"train_loss": -40.386566162109375, "global_step": 144907, "epoch": 1197} {"train_loss": -39.0062255859375, "global_step": 144908, "epoch": 1197} {"train_loss": -40.86499786376953, "global_step": 144909, "epoch": 1197} {"train_loss": -40.76533126831055, "global_step": 144910, "epoch": 1197} {"train_loss": -40.776485443115234, "global_step": 144911, "epoch": 1197} {"train_loss": -40.7847900390625, "global_step": 144912, "epoch": 1197} {"train_loss": -41.04143142700195, "global_step": 144913, "epoch": 1197} {"train_loss": -40.27812957763672, "global_step": 144914, "epoch": 1197} {"train_loss": -40.89034652709961, "global_step": 144915, "epoch": 1197} {"train_loss": -41.266841888427734, "global_step": 144916, "epoch": 1197} {"train_loss": -39.97358322143555, "global_step": 144917, "epoch": 1197} {"train_loss": -40.74672317504883, "global_step": 144918, "epoch": 1197} {"train_loss": -40.72060012817383, "global_step": 144919, "epoch": 1197} {"train_loss": -40.41299057006836, "global_step": 144920, "epoch": 1197} {"train_loss": -41.07936477661133, "global_step": 144921, "epoch": 1197} {"train_loss": -40.767269134521484, "global_step": 144922, "epoch": 1197} {"train_loss": -40.867645263671875, "global_step": 144923, "epoch": 1197} {"train_loss": -40.93100357055664, "global_step": 144924, "epoch": 1197} {"train_loss": -40.50034713745117, "global_step": 144925, "epoch": 1197} {"train_loss": -39.61594772338867, "global_step": 144926, "epoch": 1197} {"train_loss": -40.64556121826172, "global_step": 144927, "epoch": 1197} {"train_loss": -41.06581497192383, "global_step": 144928, "epoch": 1197} {"train_loss": -41.06101608276367, "global_step": 144929, "epoch": 1197} {"train_loss": -40.86178207397461, "global_step": 144930, "epoch": 1197} {"train_loss": -40.97869873046875, "global_step": 144931, "epoch": 1197} {"train_loss": -41.092132568359375, "global_step": 144932, "epoch": 1197} {"train_loss": -40.996639251708984, "global_step": 144933, "epoch": 1197} {"train_loss": -41.433746337890625, "global_step": 144934, "epoch": 1197} {"train_loss": -40.37078857421875, "global_step": 144935, "epoch": 1197} {"train_loss": -40.06809616088867, "global_step": 144936, "epoch": 1197} {"train_loss": -41.149261474609375, "global_step": 144937, "epoch": 1197} {"train_loss": -40.80632781982422, "global_step": 144938, "epoch": 1197} {"train_loss": -41.23476791381836, "global_step": 144939, "epoch": 1197} {"train_loss": -41.13711166381836, "global_step": 144940, "epoch": 1197} {"train_loss": -40.73480224609375, "global_step": 144941, "epoch": 1197} {"train_loss": -41.0847282409668, "global_step": 144942, "epoch": 1197} {"train_loss": -41.30184555053711, "global_step": 144943, "epoch": 1197} {"train_loss": -40.15937423706055, "global_step": 144944, "epoch": 1197} {"train_loss": -41.43291091918945, "global_step": 144945, "epoch": 1197} {"train_loss": -40.18580627441406, "global_step": 144946, "epoch": 1197} {"train_loss": -40.79131317138672, "global_step": 144947, "epoch": 1197} {"train_loss": -40.84003829956055, "global_step": 144948, "epoch": 1197} {"train_loss": -40.166778564453125, "global_step": 144949, "epoch": 1197} {"train_loss": -41.07598876953125, "global_step": 144950, "epoch": 1197} {"train_loss": -41.097930908203125, "global_step": 144951, "epoch": 1197} {"train_loss": -41.18403244018555, "global_step": 144952, "epoch": 1197} {"train_loss": -39.430931091308594, "global_step": 144953, "epoch": 1197} {"train_loss": -40.10786056518555, "global_step": 144954, "epoch": 1197} {"train_loss": -40.1642951965332, "global_step": 144955, "epoch": 1197} {"train_loss": -41.12168502807617, "global_step": 144956, "epoch": 1197} {"train_loss": -39.28560540695821, "global_step": 144957, "epoch": 1197, "val_loss": 2779542.75} {"train_loss": -40.659786224365234, "global_step": 144958, "epoch": 1198} {"train_loss": -39.87616729736328, "global_step": 144959, "epoch": 1198} {"train_loss": -40.89068603515625, "global_step": 144960, "epoch": 1198} {"train_loss": -39.21128463745117, "global_step": 144961, "epoch": 1198} {"train_loss": -41.279624938964844, "global_step": 144962, "epoch": 1198} {"train_loss": -40.61427688598633, "global_step": 144963, "epoch": 1198} {"train_loss": -39.90348434448242, "global_step": 144964, "epoch": 1198} {"train_loss": -41.029014587402344, "global_step": 144965, "epoch": 1198} {"train_loss": -39.2048454284668, "global_step": 144966, "epoch": 1198} {"train_loss": -37.55879211425781, "global_step": 144967, "epoch": 1198} {"train_loss": -34.06950759887695, "global_step": 144968, "epoch": 1198} {"train_loss": -23.630779266357422, "global_step": 144969, "epoch": 1198} {"train_loss": -21.95137596130371, "global_step": 144970, "epoch": 1198} {"train_loss": -34.131832122802734, "global_step": 144971, "epoch": 1198} {"train_loss": -35.64687728881836, "global_step": 144972, "epoch": 1198} {"train_loss": -29.849475860595703, "global_step": 144973, "epoch": 1198} {"train_loss": -32.69830322265625, "global_step": 144974, "epoch": 1198} {"train_loss": -37.69165802001953, "global_step": 144975, "epoch": 1198} {"train_loss": -32.3688850402832, "global_step": 144976, "epoch": 1198} {"train_loss": -36.572547912597656, "global_step": 144977, "epoch": 1198} {"train_loss": -32.01188278198242, "global_step": 144978, "epoch": 1198} {"train_loss": -35.515960693359375, "global_step": 144979, "epoch": 1198} {"train_loss": -30.48723793029785, "global_step": 144980, "epoch": 1198} {"train_loss": -36.86751937866211, "global_step": 144981, "epoch": 1198} {"train_loss": -32.1514778137207, "global_step": 144982, "epoch": 1198} {"train_loss": -38.118927001953125, "global_step": 144983, "epoch": 1198} {"train_loss": -36.844112396240234, "global_step": 144984, "epoch": 1198} {"train_loss": -35.823883056640625, "global_step": 144985, "epoch": 1198} {"train_loss": -37.4872932434082, "global_step": 144986, "epoch": 1198} {"train_loss": -37.1606330871582, "global_step": 144987, "epoch": 1198} {"train_loss": -35.25997543334961, "global_step": 144988, "epoch": 1198} {"train_loss": -38.303321838378906, "global_step": 144989, "epoch": 1198} {"train_loss": -35.4232292175293, "global_step": 144990, "epoch": 1198} {"train_loss": -35.82871627807617, "global_step": 144991, "epoch": 1198} {"train_loss": -37.83958053588867, "global_step": 144992, "epoch": 1198} {"train_loss": -37.9326286315918, "global_step": 144993, "epoch": 1198} {"train_loss": -38.878196716308594, "global_step": 144994, "epoch": 1198} {"train_loss": -38.30516815185547, "global_step": 144995, "epoch": 1198} {"train_loss": -38.768646240234375, "global_step": 144996, "epoch": 1198} {"train_loss": -38.47437286376953, "global_step": 144997, "epoch": 1198} {"train_loss": -37.73870849609375, "global_step": 144998, "epoch": 1198} {"train_loss": -38.376121520996094, "global_step": 144999, "epoch": 1198} {"train_loss": -38.671966552734375, "global_step": 145000, "epoch": 1198} {"train_loss": -38.11065673828125, "global_step": 145001, "epoch": 1198} {"train_loss": -38.57405090332031, "global_step": 145002, "epoch": 1198} {"train_loss": -38.83916473388672, "global_step": 145003, "epoch": 1198} {"train_loss": -38.843021392822266, "global_step": 145004, "epoch": 1198} {"train_loss": -38.64381790161133, "global_step": 145005, "epoch": 1198} {"train_loss": -39.08645248413086, "global_step": 145006, "epoch": 1198} {"train_loss": -38.039100646972656, "global_step": 145007, "epoch": 1198} {"train_loss": -39.164283752441406, "global_step": 145008, "epoch": 1198} {"train_loss": -39.60966110229492, "global_step": 145009, "epoch": 1198} {"train_loss": -39.83149337768555, "global_step": 145010, "epoch": 1198} {"train_loss": -39.53949737548828, "global_step": 145011, "epoch": 1198} {"train_loss": -39.593807220458984, "global_step": 145012, "epoch": 1198} {"train_loss": -39.49614334106445, "global_step": 145013, "epoch": 1198} {"train_loss": -39.10565948486328, "global_step": 145014, "epoch": 1198} {"train_loss": -39.50129318237305, "global_step": 145015, "epoch": 1198} {"train_loss": -39.44389343261719, "global_step": 145016, "epoch": 1198} {"train_loss": -39.331153869628906, "global_step": 145017, "epoch": 1198} {"train_loss": -39.88919448852539, "global_step": 145018, "epoch": 1198} {"train_loss": -39.188148498535156, "global_step": 145019, "epoch": 1198} {"train_loss": -39.81846618652344, "global_step": 145020, "epoch": 1198} {"train_loss": -40.267852783203125, "global_step": 145021, "epoch": 1198} {"train_loss": -39.62324142456055, "global_step": 145022, "epoch": 1198} {"train_loss": -38.83541488647461, "global_step": 145023, "epoch": 1198} {"train_loss": -40.1915283203125, "global_step": 145024, "epoch": 1198} {"train_loss": -39.53456497192383, "global_step": 145025, "epoch": 1198} {"train_loss": -39.55936050415039, "global_step": 145026, "epoch": 1198} {"train_loss": -40.10022735595703, "global_step": 145027, "epoch": 1198} {"train_loss": -38.63532638549805, "global_step": 145028, "epoch": 1198} {"train_loss": -40.309532165527344, "global_step": 145029, "epoch": 1198} {"train_loss": -39.487056732177734, "global_step": 145030, "epoch": 1198} {"train_loss": -40.05515670776367, "global_step": 145031, "epoch": 1198} {"train_loss": -40.681182861328125, "global_step": 145032, "epoch": 1198} {"train_loss": -40.120304107666016, "global_step": 145033, "epoch": 1198} {"train_loss": -39.418785095214844, "global_step": 145034, "epoch": 1198} {"train_loss": -39.84161376953125, "global_step": 145035, "epoch": 1198} {"train_loss": -40.16987991333008, "global_step": 145036, "epoch": 1198} {"train_loss": -39.942543029785156, "global_step": 145037, "epoch": 1198} {"train_loss": -40.4218864440918, "global_step": 145038, "epoch": 1198} {"train_loss": -39.914703369140625, "global_step": 145039, "epoch": 1198} {"train_loss": -40.67753982543945, "global_step": 145040, "epoch": 1198} {"train_loss": -40.55070114135742, "global_step": 145041, "epoch": 1198} {"train_loss": -40.51478958129883, "global_step": 145042, "epoch": 1198} {"train_loss": -40.121307373046875, "global_step": 145043, "epoch": 1198} {"train_loss": -40.82850646972656, "global_step": 145044, "epoch": 1198} {"train_loss": -40.54722213745117, "global_step": 145045, "epoch": 1198} {"train_loss": -40.18833541870117, "global_step": 145046, "epoch": 1198} {"train_loss": -40.420955657958984, "global_step": 145047, "epoch": 1198} {"train_loss": -41.062171936035156, "global_step": 145048, "epoch": 1198} {"train_loss": -40.85598373413086, "global_step": 145049, "epoch": 1198} {"train_loss": -39.986473083496094, "global_step": 145050, "epoch": 1198} {"train_loss": -39.92593765258789, "global_step": 145051, "epoch": 1198} {"train_loss": -40.978145599365234, "global_step": 145052, "epoch": 1198} {"train_loss": -40.51530838012695, "global_step": 145053, "epoch": 1198} {"train_loss": -39.795196533203125, "global_step": 145054, "epoch": 1198} {"train_loss": -40.96570587158203, "global_step": 145055, "epoch": 1198} {"train_loss": -40.72824478149414, "global_step": 145056, "epoch": 1198} {"train_loss": -39.623779296875, "global_step": 145057, "epoch": 1198} {"train_loss": -40.773712158203125, "global_step": 145058, "epoch": 1198} {"train_loss": -40.04566192626953, "global_step": 145059, "epoch": 1198} {"train_loss": -36.05803298950195, "global_step": 145060, "epoch": 1198} {"train_loss": -25.372756958007812, "global_step": 145061, "epoch": 1198} {"train_loss": -4.837939739227295, "global_step": 145062, "epoch": 1198} {"train_loss": -18.0190486907959, "global_step": 145063, "epoch": 1198} {"train_loss": -38.2205810546875, "global_step": 145064, "epoch": 1198} {"train_loss": -34.696990966796875, "global_step": 145065, "epoch": 1198} {"train_loss": -38.36601257324219, "global_step": 145066, "epoch": 1198} {"train_loss": -36.95942306518555, "global_step": 145067, "epoch": 1198} {"train_loss": -38.24128341674805, "global_step": 145068, "epoch": 1198} {"train_loss": -38.216983795166016, "global_step": 145069, "epoch": 1198} {"train_loss": -38.539669036865234, "global_step": 145070, "epoch": 1198} {"train_loss": -37.74630355834961, "global_step": 145071, "epoch": 1198} {"train_loss": -38.473690032958984, "global_step": 145072, "epoch": 1198} {"train_loss": -38.32571029663086, "global_step": 145073, "epoch": 1198} {"train_loss": -40.20114517211914, "global_step": 145074, "epoch": 1198} {"train_loss": -38.69588851928711, "global_step": 145075, "epoch": 1198} {"train_loss": -39.869773864746094, "global_step": 145076, "epoch": 1198} {"train_loss": -39.18297576904297, "global_step": 145077, "epoch": 1198} {"train_loss": -37.7717574056515, "global_step": 145078, "epoch": 1198, "val_loss": 2479508.25} {"train_loss": -40.01369857788086, "global_step": 145079, "epoch": 1199} {"train_loss": -39.664085388183594, "global_step": 145080, "epoch": 1199} {"train_loss": -40.049102783203125, "global_step": 145081, "epoch": 1199} {"train_loss": -40.24790573120117, "global_step": 145082, "epoch": 1199} {"train_loss": -39.16263961791992, "global_step": 145083, "epoch": 1199} {"train_loss": -40.447471618652344, "global_step": 145084, "epoch": 1199} {"train_loss": -40.17860412597656, "global_step": 145085, "epoch": 1199} {"train_loss": -39.751258850097656, "global_step": 145086, "epoch": 1199} {"train_loss": -40.08000946044922, "global_step": 145087, "epoch": 1199} {"train_loss": -39.840576171875, "global_step": 145088, "epoch": 1199} {"train_loss": -40.166046142578125, "global_step": 145089, "epoch": 1199} {"train_loss": -40.537384033203125, "global_step": 145090, "epoch": 1199} {"train_loss": -39.59685134887695, "global_step": 145091, "epoch": 1199} {"train_loss": -40.33355712890625, "global_step": 145092, "epoch": 1199} {"train_loss": -40.47774124145508, "global_step": 145093, "epoch": 1199} {"train_loss": -39.60929489135742, "global_step": 145094, "epoch": 1199} {"train_loss": -40.315677642822266, "global_step": 145095, "epoch": 1199} {"train_loss": -40.50568771362305, "global_step": 145096, "epoch": 1199} {"train_loss": -40.11962127685547, "global_step": 145097, "epoch": 1199} {"train_loss": -40.93663787841797, "global_step": 145098, "epoch": 1199} {"train_loss": -40.133846282958984, "global_step": 145099, "epoch": 1199} {"train_loss": -40.97468185424805, "global_step": 145100, "epoch": 1199} {"train_loss": -40.80167770385742, "global_step": 145101, "epoch": 1199} {"train_loss": -40.23894119262695, "global_step": 145102, "epoch": 1199} {"train_loss": -40.456966400146484, "global_step": 145103, "epoch": 1199} {"train_loss": -40.9488410949707, "global_step": 145104, "epoch": 1199} {"train_loss": -40.89284896850586, "global_step": 145105, "epoch": 1199} {"train_loss": -40.7442512512207, "global_step": 145106, "epoch": 1199} {"train_loss": -41.09729766845703, "global_step": 145107, "epoch": 1199} {"train_loss": -41.12616729736328, "global_step": 145108, "epoch": 1199} {"train_loss": -41.40913009643555, "global_step": 145109, "epoch": 1199} {"train_loss": -40.9013671875, "global_step": 145110, "epoch": 1199} {"train_loss": -40.63480758666992, "global_step": 145111, "epoch": 1199} {"train_loss": -40.632469177246094, "global_step": 145112, "epoch": 1199} {"train_loss": -40.53303146362305, "global_step": 145113, "epoch": 1199} {"train_loss": -40.645626068115234, "global_step": 145114, "epoch": 1199} {"train_loss": -40.37349319458008, "global_step": 145115, "epoch": 1199} {"train_loss": -40.09353256225586, "global_step": 145116, "epoch": 1199} {"train_loss": -40.43905258178711, "global_step": 145117, "epoch": 1199} {"train_loss": -40.67975616455078, "global_step": 145118, "epoch": 1199} {"train_loss": -40.44674301147461, "global_step": 145119, "epoch": 1199} {"train_loss": -40.79417037963867, "global_step": 145120, "epoch": 1199} {"train_loss": -39.10321044921875, "global_step": 145121, "epoch": 1199} {"train_loss": -40.64031982421875, "global_step": 145122, "epoch": 1199} {"train_loss": -40.059932708740234, "global_step": 145123, "epoch": 1199} {"train_loss": -40.6738166809082, "global_step": 145124, "epoch": 1199} {"train_loss": -40.550601959228516, "global_step": 145125, "epoch": 1199} {"train_loss": -39.561038970947266, "global_step": 145126, "epoch": 1199} {"train_loss": -40.493309020996094, "global_step": 145127, "epoch": 1199} {"train_loss": -40.799800872802734, "global_step": 145128, "epoch": 1199} {"train_loss": -40.59512710571289, "global_step": 145129, "epoch": 1199} {"train_loss": -40.72710418701172, "global_step": 145130, "epoch": 1199} {"train_loss": -41.15791702270508, "global_step": 145131, "epoch": 1199} {"train_loss": -39.83142852783203, "global_step": 145132, "epoch": 1199} {"train_loss": -40.23012924194336, "global_step": 145133, "epoch": 1199} {"train_loss": -40.81270217895508, "global_step": 145134, "epoch": 1199} {"train_loss": -40.63015365600586, "global_step": 145135, "epoch": 1199} {"train_loss": -39.6705436706543, "global_step": 145136, "epoch": 1199} {"train_loss": -40.406036376953125, "global_step": 145137, "epoch": 1199} {"train_loss": -39.82210922241211, "global_step": 145138, "epoch": 1199} {"train_loss": -39.85942459106445, "global_step": 145139, "epoch": 1199} {"train_loss": -38.60694885253906, "global_step": 145140, "epoch": 1199} {"train_loss": -40.40018844604492, "global_step": 145141, "epoch": 1199} {"train_loss": -40.634124755859375, "global_step": 145142, "epoch": 1199} {"train_loss": -39.839622497558594, "global_step": 145143, "epoch": 1199} {"train_loss": -40.397499084472656, "global_step": 145144, "epoch": 1199} {"train_loss": -39.99436569213867, "global_step": 145145, "epoch": 1199} {"train_loss": -39.89472198486328, "global_step": 145146, "epoch": 1199} {"train_loss": -39.065223693847656, "global_step": 145147, "epoch": 1199} {"train_loss": -37.61894989013672, "global_step": 145148, "epoch": 1199} {"train_loss": -37.374061584472656, "global_step": 145149, "epoch": 1199} {"train_loss": -38.21549606323242, "global_step": 145150, "epoch": 1199} {"train_loss": -40.506385803222656, "global_step": 145151, "epoch": 1199} {"train_loss": -40.053306579589844, "global_step": 145152, "epoch": 1199} {"train_loss": -39.43724822998047, "global_step": 145153, "epoch": 1199} {"train_loss": -39.396942138671875, "global_step": 145154, "epoch": 1199} {"train_loss": -38.419185638427734, "global_step": 145155, "epoch": 1199} {"train_loss": -38.89654541015625, "global_step": 145156, "epoch": 1199} {"train_loss": -38.53388214111328, "global_step": 145157, "epoch": 1199} {"train_loss": -40.11715316772461, "global_step": 145158, "epoch": 1199} {"train_loss": -39.163509368896484, "global_step": 145159, "epoch": 1199} {"train_loss": -39.26313400268555, "global_step": 145160, "epoch": 1199} {"train_loss": -39.93363571166992, "global_step": 145161, "epoch": 1199} {"train_loss": -39.89036178588867, "global_step": 145162, "epoch": 1199} {"train_loss": -38.86702346801758, "global_step": 145163, "epoch": 1199} {"train_loss": -39.2716178894043, "global_step": 145164, "epoch": 1199} {"train_loss": -38.647621154785156, "global_step": 145165, "epoch": 1199} {"train_loss": -38.7738151550293, "global_step": 145166, "epoch": 1199} {"train_loss": -40.614471435546875, "global_step": 145167, "epoch": 1199} {"train_loss": -38.25078582763672, "global_step": 145168, "epoch": 1199} {"train_loss": -39.55826950073242, "global_step": 145169, "epoch": 1199} {"train_loss": -39.07003402709961, "global_step": 145170, "epoch": 1199} {"train_loss": -37.71919250488281, "global_step": 145171, "epoch": 1199} {"train_loss": -37.39350509643555, "global_step": 145172, "epoch": 1199} {"train_loss": -38.53489303588867, "global_step": 145173, "epoch": 1199} {"train_loss": -39.536376953125, "global_step": 145174, "epoch": 1199} {"train_loss": -37.2381706237793, "global_step": 145175, "epoch": 1199} {"train_loss": -39.1176872253418, "global_step": 145176, "epoch": 1199} {"train_loss": -39.302974700927734, "global_step": 145177, "epoch": 1199} {"train_loss": -38.508766174316406, "global_step": 145178, "epoch": 1199} {"train_loss": -39.24139404296875, "global_step": 145179, "epoch": 1199} {"train_loss": -39.62311553955078, "global_step": 145180, "epoch": 1199} {"train_loss": -38.88192367553711, "global_step": 145181, "epoch": 1199} {"train_loss": -37.37000274658203, "global_step": 145182, "epoch": 1199} {"train_loss": -38.34481430053711, "global_step": 145183, "epoch": 1199} {"train_loss": -39.49560546875, "global_step": 145184, "epoch": 1199} {"train_loss": -39.157508850097656, "global_step": 145185, "epoch": 1199} {"train_loss": -37.77460479736328, "global_step": 145186, "epoch": 1199} {"train_loss": -37.9864616394043, "global_step": 145187, "epoch": 1199} {"train_loss": -38.91609573364258, "global_step": 145188, "epoch": 1199} {"train_loss": -35.6409912109375, "global_step": 145189, "epoch": 1199} {"train_loss": -38.18693161010742, "global_step": 145190, "epoch": 1199} {"train_loss": -37.508148193359375, "global_step": 145191, "epoch": 1199} {"train_loss": -36.18111801147461, "global_step": 145192, "epoch": 1199} {"train_loss": -37.07192611694336, "global_step": 145193, "epoch": 1199} {"train_loss": -38.039363861083984, "global_step": 145194, "epoch": 1199} {"train_loss": -37.648189544677734, "global_step": 145195, "epoch": 1199} {"train_loss": -34.201412200927734, "global_step": 145196, "epoch": 1199} {"train_loss": -38.0894660949707, "global_step": 145197, "epoch": 1199} {"train_loss": -35.864410400390625, "global_step": 145198, "epoch": 1199} {"train_loss": -39.511447874967715, "global_step": 145199, "epoch": 1199, "val_loss": 2792199.25} {"train_loss": -39.288841247558594, "global_step": 145200, "epoch": 1200} {"train_loss": -37.2491569519043, "global_step": 145201, "epoch": 1200} {"train_loss": -38.06856918334961, "global_step": 145202, "epoch": 1200} {"train_loss": -36.87852096557617, "global_step": 145203, "epoch": 1200} {"train_loss": -32.606292724609375, "global_step": 145204, "epoch": 1200} {"train_loss": -39.0799446105957, "global_step": 145205, "epoch": 1200} {"train_loss": -35.481327056884766, "global_step": 145206, "epoch": 1200} {"train_loss": -39.09029006958008, "global_step": 145207, "epoch": 1200} {"train_loss": -37.99706268310547, "global_step": 145208, "epoch": 1200} {"train_loss": -37.48945236206055, "global_step": 145209, "epoch": 1200} {"train_loss": -38.377357482910156, "global_step": 145210, "epoch": 1200} {"train_loss": -38.947139739990234, "global_step": 145211, "epoch": 1200} {"train_loss": -37.05176544189453, "global_step": 145212, "epoch": 1200} {"train_loss": -38.73407745361328, "global_step": 145213, "epoch": 1200} {"train_loss": -37.458648681640625, "global_step": 145214, "epoch": 1200} {"train_loss": -37.29125213623047, "global_step": 145215, "epoch": 1200} {"train_loss": -40.0383415222168, "global_step": 145216, "epoch": 1200} {"train_loss": -38.557735443115234, "global_step": 145217, "epoch": 1200} {"train_loss": -39.044551849365234, "global_step": 145218, "epoch": 1200} {"train_loss": -39.59320068359375, "global_step": 145219, "epoch": 1200} {"train_loss": -37.053077697753906, "global_step": 145220, "epoch": 1200} {"train_loss": -37.858558654785156, "global_step": 145221, "epoch": 1200} {"train_loss": -37.924537658691406, "global_step": 145222, "epoch": 1200} {"train_loss": -39.91828536987305, "global_step": 145223, "epoch": 1200} {"train_loss": -38.91395950317383, "global_step": 145224, "epoch": 1200} {"train_loss": -39.589046478271484, "global_step": 145225, "epoch": 1200} {"train_loss": -39.368324279785156, "global_step": 145226, "epoch": 1200} {"train_loss": -37.11299133300781, "global_step": 145227, "epoch": 1200} {"train_loss": -39.2946891784668, "global_step": 145228, "epoch": 1200} {"train_loss": -39.5931510925293, "global_step": 145229, "epoch": 1200} {"train_loss": -37.3526496887207, "global_step": 145230, "epoch": 1200} {"train_loss": -39.00613021850586, "global_step": 145231, "epoch": 1200} {"train_loss": -38.809261322021484, "global_step": 145232, "epoch": 1200} {"train_loss": -39.63291931152344, "global_step": 145233, "epoch": 1200} {"train_loss": -39.32332229614258, "global_step": 145234, "epoch": 1200} {"train_loss": -39.28145217895508, "global_step": 145235, "epoch": 1200} {"train_loss": -38.39559555053711, "global_step": 145236, "epoch": 1200} {"train_loss": -39.13934326171875, "global_step": 145237, "epoch": 1200} {"train_loss": -39.44740676879883, "global_step": 145238, "epoch": 1200} {"train_loss": -36.3914794921875, "global_step": 145239, "epoch": 1200} {"train_loss": -39.45752716064453, "global_step": 145240, "epoch": 1200} {"train_loss": -39.86331558227539, "global_step": 145241, "epoch": 1200} {"train_loss": -39.71070098876953, "global_step": 145242, "epoch": 1200} {"train_loss": -39.409767150878906, "global_step": 145243, "epoch": 1200} {"train_loss": -39.614158630371094, "global_step": 145244, "epoch": 1200} {"train_loss": -36.97438430786133, "global_step": 145245, "epoch": 1200} {"train_loss": -36.749542236328125, "global_step": 145246, "epoch": 1200} {"train_loss": -37.01156234741211, "global_step": 145247, "epoch": 1200} {"train_loss": -39.714263916015625, "global_step": 145248, "epoch": 1200} {"train_loss": -39.56666946411133, "global_step": 145249, "epoch": 1200} {"train_loss": -38.857723236083984, "global_step": 145250, "epoch": 1200} {"train_loss": -38.975955963134766, "global_step": 145251, "epoch": 1200} {"train_loss": -39.33692169189453, "global_step": 145252, "epoch": 1200} {"train_loss": -39.86433029174805, "global_step": 145253, "epoch": 1200} {"train_loss": -37.6729850769043, "global_step": 145254, "epoch": 1200} {"train_loss": -39.76861572265625, "global_step": 145255, "epoch": 1200} {"train_loss": -39.19224166870117, "global_step": 145256, "epoch": 1200} {"train_loss": -39.91981506347656, "global_step": 145257, "epoch": 1200} {"train_loss": -39.469635009765625, "global_step": 145258, "epoch": 1200} {"train_loss": -40.081539154052734, "global_step": 145259, "epoch": 1200} {"train_loss": -38.47528839111328, "global_step": 145260, "epoch": 1200} {"train_loss": -37.92658615112305, "global_step": 145261, "epoch": 1200} {"train_loss": -38.89216232299805, "global_step": 145262, "epoch": 1200} {"train_loss": -39.714412689208984, "global_step": 145263, "epoch": 1200} {"train_loss": -39.485687255859375, "global_step": 145264, "epoch": 1200} {"train_loss": -39.74978256225586, "global_step": 145265, "epoch": 1200} {"train_loss": -40.1946907043457, "global_step": 145266, "epoch": 1200} {"train_loss": -38.94773483276367, "global_step": 145267, "epoch": 1200} {"train_loss": -39.0683479309082, "global_step": 145268, "epoch": 1200} {"train_loss": -39.527984619140625, "global_step": 145269, "epoch": 1200} {"train_loss": -39.68818283081055, "global_step": 145270, "epoch": 1200} {"train_loss": -39.52033615112305, "global_step": 145271, "epoch": 1200} {"train_loss": -38.89390563964844, "global_step": 145272, "epoch": 1200} {"train_loss": -39.077064514160156, "global_step": 145273, "epoch": 1200} {"train_loss": -38.44820785522461, "global_step": 145274, "epoch": 1200} {"train_loss": -38.59697341918945, "global_step": 145275, "epoch": 1200} {"train_loss": -40.16632080078125, "global_step": 145276, "epoch": 1200} {"train_loss": -40.01813888549805, "global_step": 145277, "epoch": 1200} {"train_loss": -39.24480056762695, "global_step": 145278, "epoch": 1200} {"train_loss": -39.689422607421875, "global_step": 145279, "epoch": 1200} {"train_loss": -39.066829681396484, "global_step": 145280, "epoch": 1200} {"train_loss": -39.78010177612305, "global_step": 145281, "epoch": 1200} {"train_loss": -39.39687728881836, "global_step": 145282, "epoch": 1200} {"train_loss": -39.18844223022461, "global_step": 145283, "epoch": 1200} {"train_loss": -39.71598434448242, "global_step": 145284, "epoch": 1200} {"train_loss": -39.921356201171875, "global_step": 145285, "epoch": 1200} {"train_loss": -39.3031005859375, "global_step": 145286, "epoch": 1200} {"train_loss": -38.23551559448242, "global_step": 145287, "epoch": 1200} {"train_loss": -40.77676773071289, "global_step": 145288, "epoch": 1200} {"train_loss": -37.74308776855469, "global_step": 145289, "epoch": 1200} {"train_loss": -40.11107635498047, "global_step": 145290, "epoch": 1200} {"train_loss": -39.83834457397461, "global_step": 145291, "epoch": 1200} {"train_loss": -40.03112030029297, "global_step": 145292, "epoch": 1200} {"train_loss": -39.383453369140625, "global_step": 145293, "epoch": 1200} {"train_loss": -39.241180419921875, "global_step": 145294, "epoch": 1200} {"train_loss": -39.68806076049805, "global_step": 145295, "epoch": 1200} {"train_loss": -39.93928146362305, "global_step": 145296, "epoch": 1200} {"train_loss": -39.93693542480469, "global_step": 145297, "epoch": 1200} {"train_loss": -40.30683135986328, "global_step": 145298, "epoch": 1200} {"train_loss": -39.84741973876953, "global_step": 145299, "epoch": 1200} {"train_loss": -40.4799690246582, "global_step": 145300, "epoch": 1200} {"train_loss": -39.45644760131836, "global_step": 145301, "epoch": 1200} {"train_loss": -40.393943786621094, "global_step": 145302, "epoch": 1200} {"train_loss": -39.638065338134766, "global_step": 145303, "epoch": 1200} {"train_loss": -40.34382247924805, "global_step": 145304, "epoch": 1200} {"train_loss": -39.41413497924805, "global_step": 145305, "epoch": 1200} {"train_loss": -39.91437911987305, "global_step": 145306, "epoch": 1200} {"train_loss": -39.55134201049805, "global_step": 145307, "epoch": 1200} {"train_loss": -39.567237854003906, "global_step": 145308, "epoch": 1200} {"train_loss": -39.766258239746094, "global_step": 145309, "epoch": 1200} {"train_loss": -40.2791748046875, "global_step": 145310, "epoch": 1200} {"train_loss": -39.83318328857422, "global_step": 145311, "epoch": 1200} {"train_loss": -36.76335906982422, "global_step": 145312, "epoch": 1200} {"train_loss": -39.27633285522461, "global_step": 145313, "epoch": 1200} {"train_loss": -39.21017837524414, "global_step": 145314, "epoch": 1200} {"train_loss": -39.81568145751953, "global_step": 145315, "epoch": 1200} {"train_loss": -40.31865310668945, "global_step": 145316, "epoch": 1200} {"train_loss": -38.51393508911133, "global_step": 145317, "epoch": 1200} {"train_loss": -35.31441116333008, "global_step": 145318, "epoch": 1200} {"train_loss": -35.075958251953125, "global_step": 145319, "epoch": 1200} {"train_loss": -38.92392913566148, "global_step": 145320, "epoch": 1200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2582637.0} {"train_loss": -38.29548263549805, "global_step": 145321, "epoch": 1201} {"train_loss": -39.33161544799805, "global_step": 145322, "epoch": 1201} {"train_loss": -37.82404708862305, "global_step": 145323, "epoch": 1201} {"train_loss": -39.511322021484375, "global_step": 145324, "epoch": 1201} {"train_loss": -34.205322265625, "global_step": 145325, "epoch": 1201} {"train_loss": -25.800708770751953, "global_step": 145326, "epoch": 1201} {"train_loss": -31.891544342041016, "global_step": 145327, "epoch": 1201} {"train_loss": -37.1242561340332, "global_step": 145328, "epoch": 1201} {"train_loss": -34.804901123046875, "global_step": 145329, "epoch": 1201} {"train_loss": -38.54530334472656, "global_step": 145330, "epoch": 1201} {"train_loss": -35.73623275756836, "global_step": 145331, "epoch": 1201} {"train_loss": -36.515560150146484, "global_step": 145332, "epoch": 1201} {"train_loss": -37.96578598022461, "global_step": 145333, "epoch": 1201} {"train_loss": -38.61127853393555, "global_step": 145334, "epoch": 1201} {"train_loss": -37.39867401123047, "global_step": 145335, "epoch": 1201} {"train_loss": -38.67613983154297, "global_step": 145336, "epoch": 1201} {"train_loss": -38.04351806640625, "global_step": 145337, "epoch": 1201} {"train_loss": -39.3901252746582, "global_step": 145338, "epoch": 1201} {"train_loss": -38.352291107177734, "global_step": 145339, "epoch": 1201} {"train_loss": -38.7880744934082, "global_step": 145340, "epoch": 1201} {"train_loss": -39.162696838378906, "global_step": 145341, "epoch": 1201} {"train_loss": -38.79938888549805, "global_step": 145342, "epoch": 1201} {"train_loss": -38.47689437866211, "global_step": 145343, "epoch": 1201} {"train_loss": -39.5673942565918, "global_step": 145344, "epoch": 1201} {"train_loss": -39.437496185302734, "global_step": 145345, "epoch": 1201} {"train_loss": -39.77128219604492, "global_step": 145346, "epoch": 1201} {"train_loss": -40.050537109375, "global_step": 145347, "epoch": 1201} {"train_loss": -39.41806411743164, "global_step": 145348, "epoch": 1201} {"train_loss": -39.9898681640625, "global_step": 145349, "epoch": 1201} {"train_loss": -40.09720230102539, "global_step": 145350, "epoch": 1201} {"train_loss": -40.07600021362305, "global_step": 145351, "epoch": 1201} {"train_loss": -39.904354095458984, "global_step": 145352, "epoch": 1201} {"train_loss": -39.658512115478516, "global_step": 145353, "epoch": 1201} {"train_loss": -39.60221481323242, "global_step": 145354, "epoch": 1201} {"train_loss": -40.35926055908203, "global_step": 145355, "epoch": 1201} {"train_loss": -40.44863510131836, "global_step": 145356, "epoch": 1201} {"train_loss": -40.229095458984375, "global_step": 145357, "epoch": 1201} {"train_loss": -40.40427780151367, "global_step": 145358, "epoch": 1201} {"train_loss": -40.576133728027344, "global_step": 145359, "epoch": 1201} {"train_loss": -39.02759552001953, "global_step": 145360, "epoch": 1201} {"train_loss": -40.2469367980957, "global_step": 145361, "epoch": 1201} {"train_loss": -39.4388542175293, "global_step": 145362, "epoch": 1201} {"train_loss": -40.31964111328125, "global_step": 145363, "epoch": 1201} {"train_loss": -40.16945266723633, "global_step": 145364, "epoch": 1201} {"train_loss": -40.36351776123047, "global_step": 145365, "epoch": 1201} {"train_loss": -40.50275421142578, "global_step": 145366, "epoch": 1201} {"train_loss": -40.353118896484375, "global_step": 145367, "epoch": 1201} {"train_loss": -40.50767135620117, "global_step": 145368, "epoch": 1201} {"train_loss": -40.31940841674805, "global_step": 145369, "epoch": 1201} {"train_loss": -40.96221923828125, "global_step": 145370, "epoch": 1201} {"train_loss": -40.73725128173828, "global_step": 145371, "epoch": 1201} {"train_loss": -40.3468132019043, "global_step": 145372, "epoch": 1201} {"train_loss": -40.93421173095703, "global_step": 145373, "epoch": 1201} {"train_loss": -41.21487045288086, "global_step": 145374, "epoch": 1201} {"train_loss": -40.8770637512207, "global_step": 145375, "epoch": 1201} {"train_loss": -40.997066497802734, "global_step": 145376, "epoch": 1201} {"train_loss": -41.041378021240234, "global_step": 145377, "epoch": 1201} {"train_loss": -40.43793869018555, "global_step": 145378, "epoch": 1201} {"train_loss": -40.71073532104492, "global_step": 145379, "epoch": 1201} {"train_loss": -40.70778274536133, "global_step": 145380, "epoch": 1201} {"train_loss": -40.94462203979492, "global_step": 145381, "epoch": 1201} {"train_loss": -40.660396575927734, "global_step": 145382, "epoch": 1201} {"train_loss": -40.94082260131836, "global_step": 145383, "epoch": 1201} {"train_loss": -41.14983367919922, "global_step": 145384, "epoch": 1201} {"train_loss": -40.72593307495117, "global_step": 145385, "epoch": 1201} {"train_loss": -41.09383773803711, "global_step": 145386, "epoch": 1201} {"train_loss": -41.22760772705078, "global_step": 145387, "epoch": 1201} {"train_loss": -40.64284896850586, "global_step": 145388, "epoch": 1201} {"train_loss": -40.777835845947266, "global_step": 145389, "epoch": 1201} {"train_loss": -40.97966384887695, "global_step": 145390, "epoch": 1201} {"train_loss": -40.1764030456543, "global_step": 145391, "epoch": 1201} {"train_loss": -39.4384765625, "global_step": 145392, "epoch": 1201} {"train_loss": -39.09443283081055, "global_step": 145393, "epoch": 1201} {"train_loss": -39.7761344909668, "global_step": 145394, "epoch": 1201} {"train_loss": -41.51131820678711, "global_step": 145395, "epoch": 1201} {"train_loss": -39.35586166381836, "global_step": 145396, "epoch": 1201} {"train_loss": -38.16843795776367, "global_step": 145397, "epoch": 1201} {"train_loss": -38.02653121948242, "global_step": 145398, "epoch": 1201} {"train_loss": -38.01443099975586, "global_step": 145399, "epoch": 1201} {"train_loss": -38.988101959228516, "global_step": 145400, "epoch": 1201} {"train_loss": -40.48588562011719, "global_step": 145401, "epoch": 1201} {"train_loss": -39.713993072509766, "global_step": 145402, "epoch": 1201} {"train_loss": -39.374900817871094, "global_step": 145403, "epoch": 1201} {"train_loss": -40.94961166381836, "global_step": 145404, "epoch": 1201} {"train_loss": -40.128662109375, "global_step": 145405, "epoch": 1201} {"train_loss": -39.35380935668945, "global_step": 145406, "epoch": 1201} {"train_loss": -40.26887893676758, "global_step": 145407, "epoch": 1201} {"train_loss": -40.946128845214844, "global_step": 145408, "epoch": 1201} {"train_loss": -39.40805435180664, "global_step": 145409, "epoch": 1201} {"train_loss": -40.65084457397461, "global_step": 145410, "epoch": 1201} {"train_loss": -39.532691955566406, "global_step": 145411, "epoch": 1201} {"train_loss": -38.57399368286133, "global_step": 145412, "epoch": 1201} {"train_loss": -40.00877380371094, "global_step": 145413, "epoch": 1201} {"train_loss": -40.416866302490234, "global_step": 145414, "epoch": 1201} {"train_loss": -40.61717224121094, "global_step": 145415, "epoch": 1201} {"train_loss": -38.7087287902832, "global_step": 145416, "epoch": 1201} {"train_loss": -40.84798049926758, "global_step": 145417, "epoch": 1201} {"train_loss": -40.6160774230957, "global_step": 145418, "epoch": 1201} {"train_loss": -40.07656478881836, "global_step": 145419, "epoch": 1201} {"train_loss": -40.96548080444336, "global_step": 145420, "epoch": 1201} {"train_loss": -40.76946258544922, "global_step": 145421, "epoch": 1201} {"train_loss": -40.20735549926758, "global_step": 145422, "epoch": 1201} {"train_loss": -40.88103103637695, "global_step": 145423, "epoch": 1201} {"train_loss": -40.9134635925293, "global_step": 145424, "epoch": 1201} {"train_loss": -40.48628616333008, "global_step": 145425, "epoch": 1201} {"train_loss": -40.021400451660156, "global_step": 145426, "epoch": 1201} {"train_loss": -40.2962760925293, "global_step": 145427, "epoch": 1201} {"train_loss": -40.5444221496582, "global_step": 145428, "epoch": 1201} {"train_loss": -39.540645599365234, "global_step": 145429, "epoch": 1201} {"train_loss": -39.8911247253418, "global_step": 145430, "epoch": 1201} {"train_loss": -40.55197525024414, "global_step": 145431, "epoch": 1201} {"train_loss": -40.4434928894043, "global_step": 145432, "epoch": 1201} {"train_loss": -39.032470703125, "global_step": 145433, "epoch": 1201} {"train_loss": -37.525230407714844, "global_step": 145434, "epoch": 1201} {"train_loss": -38.228153228759766, "global_step": 145435, "epoch": 1201} {"train_loss": -36.562774658203125, "global_step": 145436, "epoch": 1201} {"train_loss": -39.3191032409668, "global_step": 145437, "epoch": 1201} {"train_loss": -25.498273849487305, "global_step": 145438, "epoch": 1201} {"train_loss": -26.5932559967041, "global_step": 145439, "epoch": 1201} {"train_loss": 0.10702057182788849, "global_step": 145440, "epoch": 1201} {"train_loss": -38.86620679805594, "global_step": 145441, "epoch": 1201, "val_loss": 2898132.25} {"train_loss": -25.95326805114746, "global_step": 145442, "epoch": 1202} {"train_loss": -27.0439395904541, "global_step": 145443, "epoch": 1202} {"train_loss": -15.089813232421875, "global_step": 145444, "epoch": 1202} {"train_loss": -19.510696411132812, "global_step": 145445, "epoch": 1202} {"train_loss": -22.8819637298584, "global_step": 145446, "epoch": 1202} {"train_loss": -11.412208557128906, "global_step": 145447, "epoch": 1202} {"train_loss": -27.207763671875, "global_step": 145448, "epoch": 1202} {"train_loss": -28.629058837890625, "global_step": 145449, "epoch": 1202} {"train_loss": -16.535123825073242, "global_step": 145450, "epoch": 1202} {"train_loss": -10.874127388000488, "global_step": 145451, "epoch": 1202} {"train_loss": -25.943525314331055, "global_step": 145452, "epoch": 1202} {"train_loss": -24.393348693847656, "global_step": 145453, "epoch": 1202} {"train_loss": -23.91410255432129, "global_step": 145454, "epoch": 1202} {"train_loss": -28.589731216430664, "global_step": 145455, "epoch": 1202} {"train_loss": -29.595922470092773, "global_step": 145456, "epoch": 1202} {"train_loss": -24.33556365966797, "global_step": 145457, "epoch": 1202} {"train_loss": -32.101593017578125, "global_step": 145458, "epoch": 1202} {"train_loss": -29.656103134155273, "global_step": 145459, "epoch": 1202} {"train_loss": -27.69675064086914, "global_step": 145460, "epoch": 1202} {"train_loss": -27.70448112487793, "global_step": 145461, "epoch": 1202} {"train_loss": -30.733274459838867, "global_step": 145462, "epoch": 1202} {"train_loss": -32.07003402709961, "global_step": 145463, "epoch": 1202} {"train_loss": -32.95585250854492, "global_step": 145464, "epoch": 1202} {"train_loss": -31.348663330078125, "global_step": 145465, "epoch": 1202} {"train_loss": -32.66724395751953, "global_step": 145466, "epoch": 1202} {"train_loss": -31.592233657836914, "global_step": 145467, "epoch": 1202} {"train_loss": -32.76030731201172, "global_step": 145468, "epoch": 1202} {"train_loss": -33.55293655395508, "global_step": 145469, "epoch": 1202} {"train_loss": -33.61660385131836, "global_step": 145470, "epoch": 1202} {"train_loss": -34.8423957824707, "global_step": 145471, "epoch": 1202} {"train_loss": -34.03131866455078, "global_step": 145472, "epoch": 1202} {"train_loss": -33.122039794921875, "global_step": 145473, "epoch": 1202} {"train_loss": -33.950130462646484, "global_step": 145474, "epoch": 1202} {"train_loss": -33.710968017578125, "global_step": 145475, "epoch": 1202} {"train_loss": -34.47445297241211, "global_step": 145476, "epoch": 1202} {"train_loss": -34.58667755126953, "global_step": 145477, "epoch": 1202} {"train_loss": -34.705078125, "global_step": 145478, "epoch": 1202} {"train_loss": -35.53688430786133, "global_step": 145479, "epoch": 1202} {"train_loss": -34.4305534362793, "global_step": 145480, "epoch": 1202} {"train_loss": -34.73765182495117, "global_step": 145481, "epoch": 1202} {"train_loss": -34.04458236694336, "global_step": 145482, "epoch": 1202} {"train_loss": -34.761531829833984, "global_step": 145483, "epoch": 1202} {"train_loss": -34.387115478515625, "global_step": 145484, "epoch": 1202} {"train_loss": -35.25586700439453, "global_step": 145485, "epoch": 1202} {"train_loss": -35.52324295043945, "global_step": 145486, "epoch": 1202} {"train_loss": -35.66830062866211, "global_step": 145487, "epoch": 1202} {"train_loss": -35.30024337768555, "global_step": 145488, "epoch": 1202} {"train_loss": -34.620418548583984, "global_step": 145489, "epoch": 1202} {"train_loss": -35.3834342956543, "global_step": 145490, "epoch": 1202} {"train_loss": -35.25152587890625, "global_step": 145491, "epoch": 1202} {"train_loss": -35.4390983581543, "global_step": 145492, "epoch": 1202} {"train_loss": -35.414791107177734, "global_step": 145493, "epoch": 1202} {"train_loss": -35.75246810913086, "global_step": 145494, "epoch": 1202} {"train_loss": -35.93766403198242, "global_step": 145495, "epoch": 1202} {"train_loss": -35.437252044677734, "global_step": 145496, "epoch": 1202} {"train_loss": -35.557212829589844, "global_step": 145497, "epoch": 1202} {"train_loss": -36.375457763671875, "global_step": 145498, "epoch": 1202} {"train_loss": -35.81421661376953, "global_step": 145499, "epoch": 1202} {"train_loss": -35.7596549987793, "global_step": 145500, "epoch": 1202} {"train_loss": -35.95478439331055, "global_step": 145501, "epoch": 1202} {"train_loss": -36.09017562866211, "global_step": 145502, "epoch": 1202} {"train_loss": -36.46491622924805, "global_step": 145503, "epoch": 1202} {"train_loss": -36.090816497802734, "global_step": 145504, "epoch": 1202} {"train_loss": -36.22482681274414, "global_step": 145505, "epoch": 1202} {"train_loss": -36.446346282958984, "global_step": 145506, "epoch": 1202} {"train_loss": -36.720123291015625, "global_step": 145507, "epoch": 1202} {"train_loss": -35.87575912475586, "global_step": 145508, "epoch": 1202} {"train_loss": -36.10104751586914, "global_step": 145509, "epoch": 1202} {"train_loss": -36.307350158691406, "global_step": 145510, "epoch": 1202} {"train_loss": -36.3176383972168, "global_step": 145511, "epoch": 1202} {"train_loss": -36.39315414428711, "global_step": 145512, "epoch": 1202} {"train_loss": -36.32231140136719, "global_step": 145513, "epoch": 1202} {"train_loss": -36.956478118896484, "global_step": 145514, "epoch": 1202} {"train_loss": -36.744232177734375, "global_step": 145515, "epoch": 1202} {"train_loss": -36.93143081665039, "global_step": 145516, "epoch": 1202} {"train_loss": -36.80859375, "global_step": 145517, "epoch": 1202} {"train_loss": -37.01758575439453, "global_step": 145518, "epoch": 1202} {"train_loss": -36.728370666503906, "global_step": 145519, "epoch": 1202} {"train_loss": -37.203369140625, "global_step": 145520, "epoch": 1202} {"train_loss": -36.655189514160156, "global_step": 145521, "epoch": 1202} {"train_loss": -37.18225860595703, "global_step": 145522, "epoch": 1202} {"train_loss": -36.41901397705078, "global_step": 145523, "epoch": 1202} {"train_loss": -37.464927673339844, "global_step": 145524, "epoch": 1202} {"train_loss": -37.36684036254883, "global_step": 145525, "epoch": 1202} {"train_loss": -37.030155181884766, "global_step": 145526, "epoch": 1202} {"train_loss": -37.49824142456055, "global_step": 145527, "epoch": 1202} {"train_loss": -37.817440032958984, "global_step": 145528, "epoch": 1202} {"train_loss": -37.01691436767578, "global_step": 145529, "epoch": 1202} {"train_loss": -37.18147659301758, "global_step": 145530, "epoch": 1202} {"train_loss": -37.00482940673828, "global_step": 145531, "epoch": 1202} {"train_loss": -37.48606872558594, "global_step": 145532, "epoch": 1202} {"train_loss": -37.17281723022461, "global_step": 145533, "epoch": 1202} {"train_loss": -37.737998962402344, "global_step": 145534, "epoch": 1202} {"train_loss": -37.51028060913086, "global_step": 145535, "epoch": 1202} {"train_loss": -36.445369720458984, "global_step": 145536, "epoch": 1202} {"train_loss": -37.91476058959961, "global_step": 145537, "epoch": 1202} {"train_loss": -37.28224563598633, "global_step": 145538, "epoch": 1202} {"train_loss": -37.531471252441406, "global_step": 145539, "epoch": 1202} {"train_loss": -37.36827850341797, "global_step": 145540, "epoch": 1202} {"train_loss": -37.54954147338867, "global_step": 145541, "epoch": 1202} {"train_loss": -37.92753601074219, "global_step": 145542, "epoch": 1202} {"train_loss": -38.046295166015625, "global_step": 145543, "epoch": 1202} {"train_loss": -38.25611114501953, "global_step": 145544, "epoch": 1202} {"train_loss": -37.65437698364258, "global_step": 145545, "epoch": 1202} {"train_loss": -37.81243133544922, "global_step": 145546, "epoch": 1202} {"train_loss": -38.26620864868164, "global_step": 145547, "epoch": 1202} {"train_loss": -37.8912239074707, "global_step": 145548, "epoch": 1202} {"train_loss": -37.85723114013672, "global_step": 145549, "epoch": 1202} {"train_loss": -38.43561935424805, "global_step": 145550, "epoch": 1202} {"train_loss": -37.674922943115234, "global_step": 145551, "epoch": 1202} {"train_loss": -37.684810638427734, "global_step": 145552, "epoch": 1202} {"train_loss": -37.19866180419922, "global_step": 145553, "epoch": 1202} {"train_loss": -37.44121170043945, "global_step": 145554, "epoch": 1202} {"train_loss": -38.44266891479492, "global_step": 145555, "epoch": 1202} {"train_loss": -38.172969818115234, "global_step": 145556, "epoch": 1202} {"train_loss": -38.21294403076172, "global_step": 145557, "epoch": 1202} {"train_loss": -38.47063064575195, "global_step": 145558, "epoch": 1202} {"train_loss": -38.38663864135742, "global_step": 145559, "epoch": 1202} {"train_loss": -38.007110595703125, "global_step": 145560, "epoch": 1202} {"train_loss": -38.53596878051758, "global_step": 145561, "epoch": 1202} {"train_loss": -34.1460309698562, "global_step": 145562, "epoch": 1202, "val_loss": 2734232.75} {"train_loss": -38.47221755981445, "global_step": 145563, "epoch": 1203} {"train_loss": -36.97211837768555, "global_step": 145564, "epoch": 1203} {"train_loss": -38.76861572265625, "global_step": 145565, "epoch": 1203} {"train_loss": -38.22426223754883, "global_step": 145566, "epoch": 1203} {"train_loss": -38.71201705932617, "global_step": 145567, "epoch": 1203} {"train_loss": -38.255977630615234, "global_step": 145568, "epoch": 1203} {"train_loss": -38.951961517333984, "global_step": 145569, "epoch": 1203} {"train_loss": -38.337379455566406, "global_step": 145570, "epoch": 1203} {"train_loss": -38.60138702392578, "global_step": 145571, "epoch": 1203} {"train_loss": -37.549652099609375, "global_step": 145572, "epoch": 1203} {"train_loss": -38.0919303894043, "global_step": 145573, "epoch": 1203} {"train_loss": -38.171443939208984, "global_step": 145574, "epoch": 1203} {"train_loss": -38.78663635253906, "global_step": 145575, "epoch": 1203} {"train_loss": -38.79633712768555, "global_step": 145576, "epoch": 1203} {"train_loss": -38.58397674560547, "global_step": 145577, "epoch": 1203} {"train_loss": -39.02474594116211, "global_step": 145578, "epoch": 1203} {"train_loss": -38.20316696166992, "global_step": 145579, "epoch": 1203} {"train_loss": -38.857513427734375, "global_step": 145580, "epoch": 1203} {"train_loss": -38.99055099487305, "global_step": 145581, "epoch": 1203} {"train_loss": -39.45991516113281, "global_step": 145582, "epoch": 1203} {"train_loss": -39.37929153442383, "global_step": 145583, "epoch": 1203} {"train_loss": -38.82344436645508, "global_step": 145584, "epoch": 1203} {"train_loss": -38.995025634765625, "global_step": 145585, "epoch": 1203} {"train_loss": -38.933135986328125, "global_step": 145586, "epoch": 1203} {"train_loss": -39.262481689453125, "global_step": 145587, "epoch": 1203} {"train_loss": -38.51749801635742, "global_step": 145588, "epoch": 1203} {"train_loss": -38.814842224121094, "global_step": 145589, "epoch": 1203} {"train_loss": -38.75263214111328, "global_step": 145590, "epoch": 1203} {"train_loss": -38.566192626953125, "global_step": 145591, "epoch": 1203} {"train_loss": -38.57068634033203, "global_step": 145592, "epoch": 1203} {"train_loss": -39.36720657348633, "global_step": 145593, "epoch": 1203} {"train_loss": -39.32675552368164, "global_step": 145594, "epoch": 1203} {"train_loss": -39.64461135864258, "global_step": 145595, "epoch": 1203} {"train_loss": -38.936058044433594, "global_step": 145596, "epoch": 1203} {"train_loss": -38.964820861816406, "global_step": 145597, "epoch": 1203} {"train_loss": -39.29584884643555, "global_step": 145598, "epoch": 1203} {"train_loss": -39.21371078491211, "global_step": 145599, "epoch": 1203} {"train_loss": -39.00260925292969, "global_step": 145600, "epoch": 1203} {"train_loss": -39.71724319458008, "global_step": 145601, "epoch": 1203} {"train_loss": -39.62809371948242, "global_step": 145602, "epoch": 1203} {"train_loss": -39.155330657958984, "global_step": 145603, "epoch": 1203} {"train_loss": -39.32402038574219, "global_step": 145604, "epoch": 1203} {"train_loss": -39.537044525146484, "global_step": 145605, "epoch": 1203} {"train_loss": -39.353736877441406, "global_step": 145606, "epoch": 1203} {"train_loss": -39.5624885559082, "global_step": 145607, "epoch": 1203} {"train_loss": -39.292510986328125, "global_step": 145608, "epoch": 1203} {"train_loss": -39.41921615600586, "global_step": 145609, "epoch": 1203} {"train_loss": -39.31001663208008, "global_step": 145610, "epoch": 1203} {"train_loss": -39.65573501586914, "global_step": 145611, "epoch": 1203} {"train_loss": -39.714935302734375, "global_step": 145612, "epoch": 1203} {"train_loss": -39.171016693115234, "global_step": 145613, "epoch": 1203} {"train_loss": -40.14466094970703, "global_step": 145614, "epoch": 1203} {"train_loss": -40.04037857055664, "global_step": 145615, "epoch": 1203} {"train_loss": -39.450923919677734, "global_step": 145616, "epoch": 1203} {"train_loss": -40.174312591552734, "global_step": 145617, "epoch": 1203} {"train_loss": -39.740535736083984, "global_step": 145618, "epoch": 1203} {"train_loss": -39.72990036010742, "global_step": 145619, "epoch": 1203} {"train_loss": -39.72343063354492, "global_step": 145620, "epoch": 1203} {"train_loss": -39.08519744873047, "global_step": 145621, "epoch": 1203} {"train_loss": -39.83058547973633, "global_step": 145622, "epoch": 1203} {"train_loss": -39.98115158081055, "global_step": 145623, "epoch": 1203} {"train_loss": -39.34072494506836, "global_step": 145624, "epoch": 1203} {"train_loss": -39.52912139892578, "global_step": 145625, "epoch": 1203} {"train_loss": -39.773677825927734, "global_step": 145626, "epoch": 1203} {"train_loss": -39.793060302734375, "global_step": 145627, "epoch": 1203} {"train_loss": -40.19769287109375, "global_step": 145628, "epoch": 1203} {"train_loss": -39.080810546875, "global_step": 145629, "epoch": 1203} {"train_loss": -39.83504867553711, "global_step": 145630, "epoch": 1203} {"train_loss": -40.0406494140625, "global_step": 145631, "epoch": 1203} {"train_loss": -39.61267852783203, "global_step": 145632, "epoch": 1203} {"train_loss": -39.77229690551758, "global_step": 145633, "epoch": 1203} {"train_loss": -39.28721237182617, "global_step": 145634, "epoch": 1203} {"train_loss": -39.39281463623047, "global_step": 145635, "epoch": 1203} {"train_loss": -39.70939254760742, "global_step": 145636, "epoch": 1203} {"train_loss": -38.687679290771484, "global_step": 145637, "epoch": 1203} {"train_loss": -40.23963165283203, "global_step": 145638, "epoch": 1203} {"train_loss": -39.47846603393555, "global_step": 145639, "epoch": 1203} {"train_loss": -39.88798904418945, "global_step": 145640, "epoch": 1203} {"train_loss": -39.40028762817383, "global_step": 145641, "epoch": 1203} {"train_loss": -39.894596099853516, "global_step": 145642, "epoch": 1203} {"train_loss": -40.07380676269531, "global_step": 145643, "epoch": 1203} {"train_loss": -39.246150970458984, "global_step": 145644, "epoch": 1203} {"train_loss": -38.470272064208984, "global_step": 145645, "epoch": 1203} {"train_loss": -36.38520050048828, "global_step": 145646, "epoch": 1203} {"train_loss": -38.7088623046875, "global_step": 145647, "epoch": 1203} {"train_loss": -38.780818939208984, "global_step": 145648, "epoch": 1203} {"train_loss": -37.93242263793945, "global_step": 145649, "epoch": 1203} {"train_loss": -38.518592834472656, "global_step": 145650, "epoch": 1203} {"train_loss": -38.89749526977539, "global_step": 145651, "epoch": 1203} {"train_loss": -38.01481628417969, "global_step": 145652, "epoch": 1203} {"train_loss": -38.02241134643555, "global_step": 145653, "epoch": 1203} {"train_loss": -36.729225158691406, "global_step": 145654, "epoch": 1203} {"train_loss": -34.34586715698242, "global_step": 145655, "epoch": 1203} {"train_loss": -37.11549377441406, "global_step": 145656, "epoch": 1203} {"train_loss": -37.21638107299805, "global_step": 145657, "epoch": 1203} {"train_loss": -33.92182922363281, "global_step": 145658, "epoch": 1203} {"train_loss": -32.66722869873047, "global_step": 145659, "epoch": 1203} {"train_loss": -37.788795471191406, "global_step": 145660, "epoch": 1203} {"train_loss": -32.39078140258789, "global_step": 145661, "epoch": 1203} {"train_loss": -32.729427337646484, "global_step": 145662, "epoch": 1203} {"train_loss": -37.01042556762695, "global_step": 145663, "epoch": 1203} {"train_loss": -34.956634521484375, "global_step": 145664, "epoch": 1203} {"train_loss": -34.5672721862793, "global_step": 145665, "epoch": 1203} {"train_loss": -37.519866943359375, "global_step": 145666, "epoch": 1203} {"train_loss": -36.033180236816406, "global_step": 145667, "epoch": 1203} {"train_loss": -37.93120574951172, "global_step": 145668, "epoch": 1203} {"train_loss": -36.081581115722656, "global_step": 145669, "epoch": 1203} {"train_loss": -38.85219955444336, "global_step": 145670, "epoch": 1203} {"train_loss": -36.09214782714844, "global_step": 145671, "epoch": 1203} {"train_loss": -38.63599395751953, "global_step": 145672, "epoch": 1203} {"train_loss": -33.92932891845703, "global_step": 145673, "epoch": 1203} {"train_loss": -38.92696762084961, "global_step": 145674, "epoch": 1203} {"train_loss": -37.03824996948242, "global_step": 145675, "epoch": 1203} {"train_loss": -39.141422271728516, "global_step": 145676, "epoch": 1203} {"train_loss": -37.81135177612305, "global_step": 145677, "epoch": 1203} {"train_loss": -38.889404296875, "global_step": 145678, "epoch": 1203} {"train_loss": -37.8336296081543, "global_step": 145679, "epoch": 1203} {"train_loss": -37.68763732910156, "global_step": 145680, "epoch": 1203} {"train_loss": -38.3104133605957, "global_step": 145681, "epoch": 1203} {"train_loss": -38.246212005615234, "global_step": 145682, "epoch": 1203} {"train_loss": -38.49704200177153, "global_step": 145683, "epoch": 1203, "val_loss": 2776860.75} {"train_loss": -33.34071350097656, "global_step": 145684, "epoch": 1204} {"train_loss": -38.99427795410156, "global_step": 145685, "epoch": 1204} {"train_loss": -39.256935119628906, "global_step": 145686, "epoch": 1204} {"train_loss": -35.83940505981445, "global_step": 145687, "epoch": 1204} {"train_loss": -38.37868881225586, "global_step": 145688, "epoch": 1204} {"train_loss": -39.507476806640625, "global_step": 145689, "epoch": 1204} {"train_loss": -38.31876754760742, "global_step": 145690, "epoch": 1204} {"train_loss": -39.179805755615234, "global_step": 145691, "epoch": 1204} {"train_loss": -38.09041976928711, "global_step": 145692, "epoch": 1204} {"train_loss": -38.5078010559082, "global_step": 145693, "epoch": 1204} {"train_loss": -36.27894973754883, "global_step": 145694, "epoch": 1204} {"train_loss": -38.76888656616211, "global_step": 145695, "epoch": 1204} {"train_loss": -39.58039855957031, "global_step": 145696, "epoch": 1204} {"train_loss": -38.08375930786133, "global_step": 145697, "epoch": 1204} {"train_loss": -38.4226188659668, "global_step": 145698, "epoch": 1204} {"train_loss": -39.60367965698242, "global_step": 145699, "epoch": 1204} {"train_loss": -39.0841064453125, "global_step": 145700, "epoch": 1204} {"train_loss": -38.931915283203125, "global_step": 145701, "epoch": 1204} {"train_loss": -38.70310974121094, "global_step": 145702, "epoch": 1204} {"train_loss": -39.254730224609375, "global_step": 145703, "epoch": 1204} {"train_loss": -39.41830062866211, "global_step": 145704, "epoch": 1204} {"train_loss": -38.8114128112793, "global_step": 145705, "epoch": 1204} {"train_loss": -39.840431213378906, "global_step": 145706, "epoch": 1204} {"train_loss": -39.05519104003906, "global_step": 145707, "epoch": 1204} {"train_loss": -39.311668395996094, "global_step": 145708, "epoch": 1204} {"train_loss": -39.30990219116211, "global_step": 145709, "epoch": 1204} {"train_loss": -39.684791564941406, "global_step": 145710, "epoch": 1204} {"train_loss": -39.750892639160156, "global_step": 145711, "epoch": 1204} {"train_loss": -38.4762077331543, "global_step": 145712, "epoch": 1204} {"train_loss": -39.92387008666992, "global_step": 145713, "epoch": 1204} {"train_loss": -39.260372161865234, "global_step": 145714, "epoch": 1204} {"train_loss": -39.49323272705078, "global_step": 145715, "epoch": 1204} {"train_loss": -39.79160690307617, "global_step": 145716, "epoch": 1204} {"train_loss": -37.499881744384766, "global_step": 145717, "epoch": 1204} {"train_loss": -39.26225662231445, "global_step": 145718, "epoch": 1204} {"train_loss": -39.65175247192383, "global_step": 145719, "epoch": 1204} {"train_loss": -39.73405075073242, "global_step": 145720, "epoch": 1204} {"train_loss": -39.676509857177734, "global_step": 145721, "epoch": 1204} {"train_loss": -39.61479568481445, "global_step": 145722, "epoch": 1204} {"train_loss": -39.130104064941406, "global_step": 145723, "epoch": 1204} {"train_loss": -40.191715240478516, "global_step": 145724, "epoch": 1204} {"train_loss": -39.413448333740234, "global_step": 145725, "epoch": 1204} {"train_loss": -40.06181335449219, "global_step": 145726, "epoch": 1204} {"train_loss": -40.36663818359375, "global_step": 145727, "epoch": 1204} {"train_loss": -39.92206954956055, "global_step": 145728, "epoch": 1204} {"train_loss": -39.673927307128906, "global_step": 145729, "epoch": 1204} {"train_loss": -40.20301055908203, "global_step": 145730, "epoch": 1204} {"train_loss": -39.931312561035156, "global_step": 145731, "epoch": 1204} {"train_loss": -40.31728744506836, "global_step": 145732, "epoch": 1204} {"train_loss": -40.0568962097168, "global_step": 145733, "epoch": 1204} {"train_loss": -40.29616928100586, "global_step": 145734, "epoch": 1204} {"train_loss": -40.328857421875, "global_step": 145735, "epoch": 1204} {"train_loss": -40.093807220458984, "global_step": 145736, "epoch": 1204} {"train_loss": -39.78789138793945, "global_step": 145737, "epoch": 1204} {"train_loss": -39.286842346191406, "global_step": 145738, "epoch": 1204} {"train_loss": -39.3611946105957, "global_step": 145739, "epoch": 1204} {"train_loss": -39.63914489746094, "global_step": 145740, "epoch": 1204} {"train_loss": -40.652400970458984, "global_step": 145741, "epoch": 1204} {"train_loss": -39.22744369506836, "global_step": 145742, "epoch": 1204} {"train_loss": -40.29986572265625, "global_step": 145743, "epoch": 1204} {"train_loss": -38.49947738647461, "global_step": 145744, "epoch": 1204} {"train_loss": -38.980857849121094, "global_step": 145745, "epoch": 1204} {"train_loss": -39.42951202392578, "global_step": 145746, "epoch": 1204} {"train_loss": -39.63032150268555, "global_step": 145747, "epoch": 1204} {"train_loss": -38.38239288330078, "global_step": 145748, "epoch": 1204} {"train_loss": -39.88019561767578, "global_step": 145749, "epoch": 1204} {"train_loss": -39.42194747924805, "global_step": 145750, "epoch": 1204} {"train_loss": -38.34938430786133, "global_step": 145751, "epoch": 1204} {"train_loss": -38.95212936401367, "global_step": 145752, "epoch": 1204} {"train_loss": -38.51056671142578, "global_step": 145753, "epoch": 1204} {"train_loss": -39.78536605834961, "global_step": 145754, "epoch": 1204} {"train_loss": -39.8365364074707, "global_step": 145755, "epoch": 1204} {"train_loss": -40.336971282958984, "global_step": 145756, "epoch": 1204} {"train_loss": -40.21253204345703, "global_step": 145757, "epoch": 1204} {"train_loss": -38.88280487060547, "global_step": 145758, "epoch": 1204} {"train_loss": -38.837547302246094, "global_step": 145759, "epoch": 1204} {"train_loss": -39.5800895690918, "global_step": 145760, "epoch": 1204} {"train_loss": -39.9252815246582, "global_step": 145761, "epoch": 1204} {"train_loss": -39.63535690307617, "global_step": 145762, "epoch": 1204} {"train_loss": -37.66180419921875, "global_step": 145763, "epoch": 1204} {"train_loss": -36.99334716796875, "global_step": 145764, "epoch": 1204} {"train_loss": -39.012943267822266, "global_step": 145765, "epoch": 1204} {"train_loss": -38.933692932128906, "global_step": 145766, "epoch": 1204} {"train_loss": -37.656192779541016, "global_step": 145767, "epoch": 1204} {"train_loss": -37.49176025390625, "global_step": 145768, "epoch": 1204} {"train_loss": -39.9024658203125, "global_step": 145769, "epoch": 1204} {"train_loss": -38.38837814331055, "global_step": 145770, "epoch": 1204} {"train_loss": -38.60606002807617, "global_step": 145771, "epoch": 1204} {"train_loss": -39.4971923828125, "global_step": 145772, "epoch": 1204} {"train_loss": -38.09781265258789, "global_step": 145773, "epoch": 1204} {"train_loss": -37.78070068359375, "global_step": 145774, "epoch": 1204} {"train_loss": -40.287994384765625, "global_step": 145775, "epoch": 1204} {"train_loss": -39.05533218383789, "global_step": 145776, "epoch": 1204} {"train_loss": -39.040130615234375, "global_step": 145777, "epoch": 1204} {"train_loss": -39.7685546875, "global_step": 145778, "epoch": 1204} {"train_loss": -37.74359130859375, "global_step": 145779, "epoch": 1204} {"train_loss": -38.52955627441406, "global_step": 145780, "epoch": 1204} {"train_loss": -39.30082321166992, "global_step": 145781, "epoch": 1204} {"train_loss": -38.6176872253418, "global_step": 145782, "epoch": 1204} {"train_loss": -40.234352111816406, "global_step": 145783, "epoch": 1204} {"train_loss": -39.86358642578125, "global_step": 145784, "epoch": 1204} {"train_loss": -39.16279220581055, "global_step": 145785, "epoch": 1204} {"train_loss": -39.62583541870117, "global_step": 145786, "epoch": 1204} {"train_loss": -39.90985870361328, "global_step": 145787, "epoch": 1204} {"train_loss": -39.46323776245117, "global_step": 145788, "epoch": 1204} {"train_loss": -39.536922454833984, "global_step": 145789, "epoch": 1204} {"train_loss": -39.50107955932617, "global_step": 145790, "epoch": 1204} {"train_loss": -40.24235916137695, "global_step": 145791, "epoch": 1204} {"train_loss": -39.7337760925293, "global_step": 145792, "epoch": 1204} {"train_loss": -40.1500358581543, "global_step": 145793, "epoch": 1204} {"train_loss": -39.803504943847656, "global_step": 145794, "epoch": 1204} {"train_loss": -40.26748275756836, "global_step": 145795, "epoch": 1204} {"train_loss": -38.4863166809082, "global_step": 145796, "epoch": 1204} {"train_loss": -39.929012298583984, "global_step": 145797, "epoch": 1204} {"train_loss": -40.15528106689453, "global_step": 145798, "epoch": 1204} {"train_loss": -39.75131607055664, "global_step": 145799, "epoch": 1204} {"train_loss": -40.05931091308594, "global_step": 145800, "epoch": 1204} {"train_loss": -39.952232360839844, "global_step": 145801, "epoch": 1204} {"train_loss": -40.35539627075195, "global_step": 145802, "epoch": 1204} {"train_loss": -40.742652893066406, "global_step": 145803, "epoch": 1204} {"train_loss": -39.24595865927452, "global_step": 145804, "epoch": 1204, "val_loss": 2696864.75} {"train_loss": -39.17668533325195, "global_step": 145805, "epoch": 1205} {"train_loss": -40.30878829956055, "global_step": 145806, "epoch": 1205} {"train_loss": -39.62540817260742, "global_step": 145807, "epoch": 1205} {"train_loss": -38.64609909057617, "global_step": 145808, "epoch": 1205} {"train_loss": -40.33316421508789, "global_step": 145809, "epoch": 1205} {"train_loss": -39.18801498413086, "global_step": 145810, "epoch": 1205} {"train_loss": -39.40652084350586, "global_step": 145811, "epoch": 1205} {"train_loss": -37.772335052490234, "global_step": 145812, "epoch": 1205} {"train_loss": -39.597042083740234, "global_step": 145813, "epoch": 1205} {"train_loss": -39.9765510559082, "global_step": 145814, "epoch": 1205} {"train_loss": -39.73548889160156, "global_step": 145815, "epoch": 1205} {"train_loss": -40.561458587646484, "global_step": 145816, "epoch": 1205} {"train_loss": -40.28770065307617, "global_step": 145817, "epoch": 1205} {"train_loss": -40.555843353271484, "global_step": 145818, "epoch": 1205} {"train_loss": -40.43442916870117, "global_step": 145819, "epoch": 1205} {"train_loss": -39.98731231689453, "global_step": 145820, "epoch": 1205} {"train_loss": -39.631587982177734, "global_step": 145821, "epoch": 1205} {"train_loss": -39.355445861816406, "global_step": 145822, "epoch": 1205} {"train_loss": -40.316524505615234, "global_step": 145823, "epoch": 1205} {"train_loss": -40.370941162109375, "global_step": 145824, "epoch": 1205} {"train_loss": -38.6512565612793, "global_step": 145825, "epoch": 1205} {"train_loss": -39.59476852416992, "global_step": 145826, "epoch": 1205} {"train_loss": -37.08154296875, "global_step": 145827, "epoch": 1205} {"train_loss": -32.48509216308594, "global_step": 145828, "epoch": 1205} {"train_loss": -30.700239181518555, "global_step": 145829, "epoch": 1205} {"train_loss": -36.999446868896484, "global_step": 145830, "epoch": 1205} {"train_loss": -39.7030143737793, "global_step": 145831, "epoch": 1205} {"train_loss": -37.518226623535156, "global_step": 145832, "epoch": 1205} {"train_loss": -36.894813537597656, "global_step": 145833, "epoch": 1205} {"train_loss": -39.672847747802734, "global_step": 145834, "epoch": 1205} {"train_loss": -39.66096878051758, "global_step": 145835, "epoch": 1205} {"train_loss": -38.552154541015625, "global_step": 145836, "epoch": 1205} {"train_loss": -39.53553009033203, "global_step": 145837, "epoch": 1205} {"train_loss": -39.38462448120117, "global_step": 145838, "epoch": 1205} {"train_loss": -39.379783630371094, "global_step": 145839, "epoch": 1205} {"train_loss": -39.9887809753418, "global_step": 145840, "epoch": 1205} {"train_loss": -39.53691482543945, "global_step": 145841, "epoch": 1205} {"train_loss": -39.76272964477539, "global_step": 145842, "epoch": 1205} {"train_loss": -40.1850471496582, "global_step": 145843, "epoch": 1205} {"train_loss": -39.602874755859375, "global_step": 145844, "epoch": 1205} {"train_loss": -40.217796325683594, "global_step": 145845, "epoch": 1205} {"train_loss": -39.688568115234375, "global_step": 145846, "epoch": 1205} {"train_loss": -39.71535110473633, "global_step": 145847, "epoch": 1205} {"train_loss": -39.422847747802734, "global_step": 145848, "epoch": 1205} {"train_loss": -39.09135818481445, "global_step": 145849, "epoch": 1205} {"train_loss": -40.00466537475586, "global_step": 145850, "epoch": 1205} {"train_loss": -39.847896575927734, "global_step": 145851, "epoch": 1205} {"train_loss": -39.495216369628906, "global_step": 145852, "epoch": 1205} {"train_loss": -40.21864700317383, "global_step": 145853, "epoch": 1205} {"train_loss": -40.451107025146484, "global_step": 145854, "epoch": 1205} {"train_loss": -40.68123245239258, "global_step": 145855, "epoch": 1205} {"train_loss": -40.04624938964844, "global_step": 145856, "epoch": 1205} {"train_loss": -40.621124267578125, "global_step": 145857, "epoch": 1205} {"train_loss": -40.57670211791992, "global_step": 145858, "epoch": 1205} {"train_loss": -40.73662185668945, "global_step": 145859, "epoch": 1205} {"train_loss": -40.265785217285156, "global_step": 145860, "epoch": 1205} {"train_loss": -40.7836799621582, "global_step": 145861, "epoch": 1205} {"train_loss": -39.629638671875, "global_step": 145862, "epoch": 1205} {"train_loss": -40.51587677001953, "global_step": 145863, "epoch": 1205} {"train_loss": -40.351318359375, "global_step": 145864, "epoch": 1205} {"train_loss": -40.874671936035156, "global_step": 145865, "epoch": 1205} {"train_loss": -40.29769515991211, "global_step": 145866, "epoch": 1205} {"train_loss": -41.00436782836914, "global_step": 145867, "epoch": 1205} {"train_loss": -40.95368957519531, "global_step": 145868, "epoch": 1205} {"train_loss": -40.68943405151367, "global_step": 145869, "epoch": 1205} {"train_loss": -40.9852294921875, "global_step": 145870, "epoch": 1205} {"train_loss": -40.355403900146484, "global_step": 145871, "epoch": 1205} {"train_loss": -40.763153076171875, "global_step": 145872, "epoch": 1205} {"train_loss": -40.74398422241211, "global_step": 145873, "epoch": 1205} {"train_loss": -40.453941345214844, "global_step": 145874, "epoch": 1205} {"train_loss": -40.63052749633789, "global_step": 145875, "epoch": 1205} {"train_loss": -40.86814498901367, "global_step": 145876, "epoch": 1205} {"train_loss": -41.2542610168457, "global_step": 145877, "epoch": 1205} {"train_loss": -41.134544372558594, "global_step": 145878, "epoch": 1205} {"train_loss": -41.372314453125, "global_step": 145879, "epoch": 1205} {"train_loss": -40.20683670043945, "global_step": 145880, "epoch": 1205} {"train_loss": -40.678714752197266, "global_step": 145881, "epoch": 1205} {"train_loss": -40.995033264160156, "global_step": 145882, "epoch": 1205} {"train_loss": -40.68392562866211, "global_step": 145883, "epoch": 1205} {"train_loss": -40.834320068359375, "global_step": 145884, "epoch": 1205} {"train_loss": -40.76151657104492, "global_step": 145885, "epoch": 1205} {"train_loss": -41.05762481689453, "global_step": 145886, "epoch": 1205} {"train_loss": -40.95219802856445, "global_step": 145887, "epoch": 1205} {"train_loss": -40.72012710571289, "global_step": 145888, "epoch": 1205} {"train_loss": -40.783687591552734, "global_step": 145889, "epoch": 1205} {"train_loss": -40.62706756591797, "global_step": 145890, "epoch": 1205} {"train_loss": -36.87246322631836, "global_step": 145891, "epoch": 1205} {"train_loss": -33.011863708496094, "global_step": 145892, "epoch": 1205} {"train_loss": -26.2149658203125, "global_step": 145893, "epoch": 1205} {"train_loss": -28.864294052124023, "global_step": 145894, "epoch": 1205} {"train_loss": -38.14954376220703, "global_step": 145895, "epoch": 1205} {"train_loss": -32.4889030456543, "global_step": 145896, "epoch": 1205} {"train_loss": -28.406713485717773, "global_step": 145897, "epoch": 1205} {"train_loss": -36.43866729736328, "global_step": 145898, "epoch": 1205} {"train_loss": -36.6038932800293, "global_step": 145899, "epoch": 1205} {"train_loss": -34.91794967651367, "global_step": 145900, "epoch": 1205} {"train_loss": -37.94912338256836, "global_step": 145901, "epoch": 1205} {"train_loss": -35.69308090209961, "global_step": 145902, "epoch": 1205} {"train_loss": -38.59929656982422, "global_step": 145903, "epoch": 1205} {"train_loss": -35.95124435424805, "global_step": 145904, "epoch": 1205} {"train_loss": -39.39252853393555, "global_step": 145905, "epoch": 1205} {"train_loss": -37.58488082885742, "global_step": 145906, "epoch": 1205} {"train_loss": -39.33870315551758, "global_step": 145907, "epoch": 1205} {"train_loss": -37.65267562866211, "global_step": 145908, "epoch": 1205} {"train_loss": -38.342750549316406, "global_step": 145909, "epoch": 1205} {"train_loss": -39.85314178466797, "global_step": 145910, "epoch": 1205} {"train_loss": -38.50887680053711, "global_step": 145911, "epoch": 1205} {"train_loss": -39.055667877197266, "global_step": 145912, "epoch": 1205} {"train_loss": -38.74922561645508, "global_step": 145913, "epoch": 1205} {"train_loss": -39.18728256225586, "global_step": 145914, "epoch": 1205} {"train_loss": -39.024105072021484, "global_step": 145915, "epoch": 1205} {"train_loss": -38.021968841552734, "global_step": 145916, "epoch": 1205} {"train_loss": -39.918277740478516, "global_step": 145917, "epoch": 1205} {"train_loss": -38.2057991027832, "global_step": 145918, "epoch": 1205} {"train_loss": -39.694881439208984, "global_step": 145919, "epoch": 1205} {"train_loss": -39.6252555847168, "global_step": 145920, "epoch": 1205} {"train_loss": -38.701171875, "global_step": 145921, "epoch": 1205} {"train_loss": -40.280372619628906, "global_step": 145922, "epoch": 1205} {"train_loss": -39.45164489746094, "global_step": 145923, "epoch": 1205} {"train_loss": -39.870201110839844, "global_step": 145924, "epoch": 1205} {"train_loss": -39.0365449416736, "global_step": 145925, "epoch": 1205, "val_loss": 2886467.0} {"train_loss": -39.53232955932617, "global_step": 145926, "epoch": 1206} {"train_loss": -39.84112548828125, "global_step": 145927, "epoch": 1206} {"train_loss": -39.3760986328125, "global_step": 145928, "epoch": 1206} {"train_loss": -38.66402816772461, "global_step": 145929, "epoch": 1206} {"train_loss": -37.461612701416016, "global_step": 145930, "epoch": 1206} {"train_loss": -39.51145935058594, "global_step": 145931, "epoch": 1206} {"train_loss": -40.51078796386719, "global_step": 145932, "epoch": 1206} {"train_loss": -39.64091110229492, "global_step": 145933, "epoch": 1206} {"train_loss": -40.02389144897461, "global_step": 145934, "epoch": 1206} {"train_loss": -40.57709503173828, "global_step": 145935, "epoch": 1206} {"train_loss": -39.9194221496582, "global_step": 145936, "epoch": 1206} {"train_loss": -39.65775680541992, "global_step": 145937, "epoch": 1206} {"train_loss": -39.42679977416992, "global_step": 145938, "epoch": 1206} {"train_loss": -39.30373764038086, "global_step": 145939, "epoch": 1206} {"train_loss": -40.38546371459961, "global_step": 145940, "epoch": 1206} {"train_loss": -39.23979949951172, "global_step": 145941, "epoch": 1206} {"train_loss": -39.905635833740234, "global_step": 145942, "epoch": 1206} {"train_loss": -39.324745178222656, "global_step": 145943, "epoch": 1206} {"train_loss": -40.18427276611328, "global_step": 145944, "epoch": 1206} {"train_loss": -40.453857421875, "global_step": 145945, "epoch": 1206} {"train_loss": -40.092464447021484, "global_step": 145946, "epoch": 1206} {"train_loss": -40.14198303222656, "global_step": 145947, "epoch": 1206} {"train_loss": -40.48530960083008, "global_step": 145948, "epoch": 1206} {"train_loss": -40.639564514160156, "global_step": 145949, "epoch": 1206} {"train_loss": -40.343238830566406, "global_step": 145950, "epoch": 1206} {"train_loss": -40.94059371948242, "global_step": 145951, "epoch": 1206} {"train_loss": -40.385353088378906, "global_step": 145952, "epoch": 1206} {"train_loss": -39.93189239501953, "global_step": 145953, "epoch": 1206} {"train_loss": -40.91530227661133, "global_step": 145954, "epoch": 1206} {"train_loss": -40.943050384521484, "global_step": 145955, "epoch": 1206} {"train_loss": -40.2855339050293, "global_step": 145956, "epoch": 1206} {"train_loss": -40.48284912109375, "global_step": 145957, "epoch": 1206} {"train_loss": -40.39698028564453, "global_step": 145958, "epoch": 1206} {"train_loss": -40.25381088256836, "global_step": 145959, "epoch": 1206} {"train_loss": -41.00661849975586, "global_step": 145960, "epoch": 1206} {"train_loss": -40.50773239135742, "global_step": 145961, "epoch": 1206} {"train_loss": -40.47045135498047, "global_step": 145962, "epoch": 1206} {"train_loss": -40.29520797729492, "global_step": 145963, "epoch": 1206} {"train_loss": -40.53709030151367, "global_step": 145964, "epoch": 1206} {"train_loss": -40.50275421142578, "global_step": 145965, "epoch": 1206} {"train_loss": -40.557491302490234, "global_step": 145966, "epoch": 1206} {"train_loss": -40.5979118347168, "global_step": 145967, "epoch": 1206} {"train_loss": -40.87804412841797, "global_step": 145968, "epoch": 1206} {"train_loss": -41.09837341308594, "global_step": 145969, "epoch": 1206} {"train_loss": -40.83348846435547, "global_step": 145970, "epoch": 1206} {"train_loss": -40.5798225402832, "global_step": 145971, "epoch": 1206} {"train_loss": -40.38017654418945, "global_step": 145972, "epoch": 1206} {"train_loss": -40.3565788269043, "global_step": 145973, "epoch": 1206} {"train_loss": -39.30439376831055, "global_step": 145974, "epoch": 1206} {"train_loss": -40.4592399597168, "global_step": 145975, "epoch": 1206} {"train_loss": -40.261451721191406, "global_step": 145976, "epoch": 1206} {"train_loss": -40.97904968261719, "global_step": 145977, "epoch": 1206} {"train_loss": -40.92049789428711, "global_step": 145978, "epoch": 1206} {"train_loss": -40.8216667175293, "global_step": 145979, "epoch": 1206} {"train_loss": -41.63334274291992, "global_step": 145980, "epoch": 1206} {"train_loss": -41.16880798339844, "global_step": 145981, "epoch": 1206} {"train_loss": -40.37389373779297, "global_step": 145982, "epoch": 1206} {"train_loss": -38.271705627441406, "global_step": 145983, "epoch": 1206} {"train_loss": -38.22040939331055, "global_step": 145984, "epoch": 1206} {"train_loss": -39.425716400146484, "global_step": 145985, "epoch": 1206} {"train_loss": -39.07590866088867, "global_step": 145986, "epoch": 1206} {"train_loss": -38.33622741699219, "global_step": 145987, "epoch": 1206} {"train_loss": -38.30311584472656, "global_step": 145988, "epoch": 1206} {"train_loss": -38.71833801269531, "global_step": 145989, "epoch": 1206} {"train_loss": -40.7064323425293, "global_step": 145990, "epoch": 1206} {"train_loss": -41.060298919677734, "global_step": 145991, "epoch": 1206} {"train_loss": -40.05927276611328, "global_step": 145992, "epoch": 1206} {"train_loss": -40.772701263427734, "global_step": 145993, "epoch": 1206} {"train_loss": -40.117000579833984, "global_step": 145994, "epoch": 1206} {"train_loss": -40.40390396118164, "global_step": 145995, "epoch": 1206} {"train_loss": -39.891475677490234, "global_step": 145996, "epoch": 1206} {"train_loss": -39.532222747802734, "global_step": 145997, "epoch": 1206} {"train_loss": -40.57511520385742, "global_step": 145998, "epoch": 1206} {"train_loss": -38.906768798828125, "global_step": 145999, "epoch": 1206} {"train_loss": -35.98112869262695, "global_step": 146000, "epoch": 1206} {"train_loss": -38.07155227661133, "global_step": 146001, "epoch": 1206} {"train_loss": -39.4711799621582, "global_step": 146002, "epoch": 1206} {"train_loss": -38.719791412353516, "global_step": 146003, "epoch": 1206} {"train_loss": -36.4548454284668, "global_step": 146004, "epoch": 1206} {"train_loss": -39.66254425048828, "global_step": 146005, "epoch": 1206} {"train_loss": -37.933013916015625, "global_step": 146006, "epoch": 1206} {"train_loss": -37.68671417236328, "global_step": 146007, "epoch": 1206} {"train_loss": -39.36454391479492, "global_step": 146008, "epoch": 1206} {"train_loss": -39.54444122314453, "global_step": 146009, "epoch": 1206} {"train_loss": -39.53237533569336, "global_step": 146010, "epoch": 1206} {"train_loss": -37.670013427734375, "global_step": 146011, "epoch": 1206} {"train_loss": -40.06886672973633, "global_step": 146012, "epoch": 1206} {"train_loss": -39.594207763671875, "global_step": 146013, "epoch": 1206} {"train_loss": -38.45756530761719, "global_step": 146014, "epoch": 1206} {"train_loss": -39.20680618286133, "global_step": 146015, "epoch": 1206} {"train_loss": -38.35295104980469, "global_step": 146016, "epoch": 1206} {"train_loss": -39.28487777709961, "global_step": 146017, "epoch": 1206} {"train_loss": -38.20671844482422, "global_step": 146018, "epoch": 1206} {"train_loss": -38.91439437866211, "global_step": 146019, "epoch": 1206} {"train_loss": -39.563716888427734, "global_step": 146020, "epoch": 1206} {"train_loss": -38.68851852416992, "global_step": 146021, "epoch": 1206} {"train_loss": -39.96590042114258, "global_step": 146022, "epoch": 1206} {"train_loss": -39.86605453491211, "global_step": 146023, "epoch": 1206} {"train_loss": -39.928279876708984, "global_step": 146024, "epoch": 1206} {"train_loss": -39.772830963134766, "global_step": 146025, "epoch": 1206} {"train_loss": -40.048744201660156, "global_step": 146026, "epoch": 1206} {"train_loss": -40.18098068237305, "global_step": 146027, "epoch": 1206} {"train_loss": -39.72831344604492, "global_step": 146028, "epoch": 1206} {"train_loss": -38.52578353881836, "global_step": 146029, "epoch": 1206} {"train_loss": -40.1855583190918, "global_step": 146030, "epoch": 1206} {"train_loss": -38.533931732177734, "global_step": 146031, "epoch": 1206} {"train_loss": -39.769996643066406, "global_step": 146032, "epoch": 1206} {"train_loss": -38.04490280151367, "global_step": 146033, "epoch": 1206} {"train_loss": -39.91616439819336, "global_step": 146034, "epoch": 1206} {"train_loss": -31.8552303314209, "global_step": 146035, "epoch": 1206} {"train_loss": -32.91462326049805, "global_step": 146036, "epoch": 1206} {"train_loss": -37.18263244628906, "global_step": 146037, "epoch": 1206} {"train_loss": -33.45703887939453, "global_step": 146038, "epoch": 1206} {"train_loss": -38.436309814453125, "global_step": 146039, "epoch": 1206} {"train_loss": -38.446407318115234, "global_step": 146040, "epoch": 1206} {"train_loss": -37.55809020996094, "global_step": 146041, "epoch": 1206} {"train_loss": -37.81730270385742, "global_step": 146042, "epoch": 1206} {"train_loss": -36.52566146850586, "global_step": 146043, "epoch": 1206} {"train_loss": -37.99332046508789, "global_step": 146044, "epoch": 1206} {"train_loss": -35.21430587768555, "global_step": 146045, "epoch": 1206} {"train_loss": -39.394452260545464, "global_step": 146046, "epoch": 1206, "val_loss": 2741498.0} {"train_loss": -38.4880485534668, "global_step": 146047, "epoch": 1207} {"train_loss": -38.3785400390625, "global_step": 146048, "epoch": 1207} {"train_loss": -36.782958984375, "global_step": 146049, "epoch": 1207} {"train_loss": -37.38539123535156, "global_step": 146050, "epoch": 1207} {"train_loss": -35.430877685546875, "global_step": 146051, "epoch": 1207} {"train_loss": -38.5562744140625, "global_step": 146052, "epoch": 1207} {"train_loss": -33.142616271972656, "global_step": 146053, "epoch": 1207} {"train_loss": -37.60873031616211, "global_step": 146054, "epoch": 1207} {"train_loss": -37.06341552734375, "global_step": 146055, "epoch": 1207} {"train_loss": -37.93590545654297, "global_step": 146056, "epoch": 1207} {"train_loss": -39.35780715942383, "global_step": 146057, "epoch": 1207} {"train_loss": -38.41605758666992, "global_step": 146058, "epoch": 1207} {"train_loss": -38.09697723388672, "global_step": 146059, "epoch": 1207} {"train_loss": -36.72554016113281, "global_step": 146060, "epoch": 1207} {"train_loss": -38.11505889892578, "global_step": 146061, "epoch": 1207} {"train_loss": -38.33625030517578, "global_step": 146062, "epoch": 1207} {"train_loss": -39.16828536987305, "global_step": 146063, "epoch": 1207} {"train_loss": -39.2388916015625, "global_step": 146064, "epoch": 1207} {"train_loss": -38.69707107543945, "global_step": 146065, "epoch": 1207} {"train_loss": -39.050384521484375, "global_step": 146066, "epoch": 1207} {"train_loss": -38.133541107177734, "global_step": 146067, "epoch": 1207} {"train_loss": -39.43698501586914, "global_step": 146068, "epoch": 1207} {"train_loss": -38.521934509277344, "global_step": 146069, "epoch": 1207} {"train_loss": -39.376380920410156, "global_step": 146070, "epoch": 1207} {"train_loss": -39.096981048583984, "global_step": 146071, "epoch": 1207} {"train_loss": -39.844642639160156, "global_step": 146072, "epoch": 1207} {"train_loss": -40.279205322265625, "global_step": 146073, "epoch": 1207} {"train_loss": -38.99283981323242, "global_step": 146074, "epoch": 1207} {"train_loss": -39.23178482055664, "global_step": 146075, "epoch": 1207} {"train_loss": -39.625606536865234, "global_step": 146076, "epoch": 1207} {"train_loss": -39.5329475402832, "global_step": 146077, "epoch": 1207} {"train_loss": -39.53215789794922, "global_step": 146078, "epoch": 1207} {"train_loss": -39.54238510131836, "global_step": 146079, "epoch": 1207} {"train_loss": -39.82826232910156, "global_step": 146080, "epoch": 1207} {"train_loss": -39.463897705078125, "global_step": 146081, "epoch": 1207} {"train_loss": -39.29112243652344, "global_step": 146082, "epoch": 1207} {"train_loss": -39.52206039428711, "global_step": 146083, "epoch": 1207} {"train_loss": -40.245811462402344, "global_step": 146084, "epoch": 1207} {"train_loss": -40.462890625, "global_step": 146085, "epoch": 1207} {"train_loss": -39.27222442626953, "global_step": 146086, "epoch": 1207} {"train_loss": -39.144813537597656, "global_step": 146087, "epoch": 1207} {"train_loss": -39.95516586303711, "global_step": 146088, "epoch": 1207} {"train_loss": -39.35205078125, "global_step": 146089, "epoch": 1207} {"train_loss": -39.336708068847656, "global_step": 146090, "epoch": 1207} {"train_loss": -39.8612174987793, "global_step": 146091, "epoch": 1207} {"train_loss": -39.51078414916992, "global_step": 146092, "epoch": 1207} {"train_loss": -39.849037170410156, "global_step": 146093, "epoch": 1207} {"train_loss": -39.00065994262695, "global_step": 146094, "epoch": 1207} {"train_loss": -38.95307159423828, "global_step": 146095, "epoch": 1207} {"train_loss": -40.363521575927734, "global_step": 146096, "epoch": 1207} {"train_loss": -40.383033752441406, "global_step": 146097, "epoch": 1207} {"train_loss": -40.58317947387695, "global_step": 146098, "epoch": 1207} {"train_loss": -39.04585647583008, "global_step": 146099, "epoch": 1207} {"train_loss": -39.805049896240234, "global_step": 146100, "epoch": 1207} {"train_loss": -40.34193801879883, "global_step": 146101, "epoch": 1207} {"train_loss": -40.07417297363281, "global_step": 146102, "epoch": 1207} {"train_loss": -39.451839447021484, "global_step": 146103, "epoch": 1207} {"train_loss": -40.58957290649414, "global_step": 146104, "epoch": 1207} {"train_loss": -39.33004379272461, "global_step": 146105, "epoch": 1207} {"train_loss": -39.256874084472656, "global_step": 146106, "epoch": 1207} {"train_loss": -38.51367950439453, "global_step": 146107, "epoch": 1207} {"train_loss": -39.47109603881836, "global_step": 146108, "epoch": 1207} {"train_loss": -40.248348236083984, "global_step": 146109, "epoch": 1207} {"train_loss": -39.29000473022461, "global_step": 146110, "epoch": 1207} {"train_loss": -38.623043060302734, "global_step": 146111, "epoch": 1207} {"train_loss": -37.50506591796875, "global_step": 146112, "epoch": 1207} {"train_loss": -37.1180419921875, "global_step": 146113, "epoch": 1207} {"train_loss": -38.448402404785156, "global_step": 146114, "epoch": 1207} {"train_loss": -38.972103118896484, "global_step": 146115, "epoch": 1207} {"train_loss": -40.5899772644043, "global_step": 146116, "epoch": 1207} {"train_loss": -37.06163024902344, "global_step": 146117, "epoch": 1207} {"train_loss": -28.570117950439453, "global_step": 146118, "epoch": 1207} {"train_loss": -29.42535972595215, "global_step": 146119, "epoch": 1207} {"train_loss": -39.54437255859375, "global_step": 146120, "epoch": 1207} {"train_loss": -31.74323081970215, "global_step": 146121, "epoch": 1207} {"train_loss": -30.480976104736328, "global_step": 146122, "epoch": 1207} {"train_loss": -38.752498626708984, "global_step": 146123, "epoch": 1207} {"train_loss": -35.43806457519531, "global_step": 146124, "epoch": 1207} {"train_loss": -33.162715911865234, "global_step": 146125, "epoch": 1207} {"train_loss": -38.65709686279297, "global_step": 146126, "epoch": 1207} {"train_loss": -35.1599235534668, "global_step": 146127, "epoch": 1207} {"train_loss": -39.034584045410156, "global_step": 146128, "epoch": 1207} {"train_loss": -36.2002067565918, "global_step": 146129, "epoch": 1207} {"train_loss": -39.67104721069336, "global_step": 146130, "epoch": 1207} {"train_loss": -38.08465576171875, "global_step": 146131, "epoch": 1207} {"train_loss": -40.03142547607422, "global_step": 146132, "epoch": 1207} {"train_loss": -37.556941986083984, "global_step": 146133, "epoch": 1207} {"train_loss": -39.6946907043457, "global_step": 146134, "epoch": 1207} {"train_loss": -38.40134811401367, "global_step": 146135, "epoch": 1207} {"train_loss": -39.59882736206055, "global_step": 146136, "epoch": 1207} {"train_loss": -38.93198776245117, "global_step": 146137, "epoch": 1207} {"train_loss": -39.091796875, "global_step": 146138, "epoch": 1207} {"train_loss": -39.67570114135742, "global_step": 146139, "epoch": 1207} {"train_loss": -39.031654357910156, "global_step": 146140, "epoch": 1207} {"train_loss": -39.75010299682617, "global_step": 146141, "epoch": 1207} {"train_loss": -39.78940963745117, "global_step": 146142, "epoch": 1207} {"train_loss": -39.62495422363281, "global_step": 146143, "epoch": 1207} {"train_loss": -39.551666259765625, "global_step": 146144, "epoch": 1207} {"train_loss": -39.37273406982422, "global_step": 146145, "epoch": 1207} {"train_loss": -40.392730712890625, "global_step": 146146, "epoch": 1207} {"train_loss": -39.67142868041992, "global_step": 146147, "epoch": 1207} {"train_loss": -40.24728012084961, "global_step": 146148, "epoch": 1207} {"train_loss": -39.829708099365234, "global_step": 146149, "epoch": 1207} {"train_loss": -40.345001220703125, "global_step": 146150, "epoch": 1207} {"train_loss": -39.81467819213867, "global_step": 146151, "epoch": 1207} {"train_loss": -39.95869827270508, "global_step": 146152, "epoch": 1207} {"train_loss": -40.51556396484375, "global_step": 146153, "epoch": 1207} {"train_loss": -40.58429718017578, "global_step": 146154, "epoch": 1207} {"train_loss": -39.94704818725586, "global_step": 146155, "epoch": 1207} {"train_loss": -40.0417366027832, "global_step": 146156, "epoch": 1207} {"train_loss": -40.44246292114258, "global_step": 146157, "epoch": 1207} {"train_loss": -40.731075286865234, "global_step": 146158, "epoch": 1207} {"train_loss": -40.40058517456055, "global_step": 146159, "epoch": 1207} {"train_loss": -40.81653594970703, "global_step": 146160, "epoch": 1207} {"train_loss": -40.38311767578125, "global_step": 146161, "epoch": 1207} {"train_loss": -40.4388542175293, "global_step": 146162, "epoch": 1207} {"train_loss": -40.30256271362305, "global_step": 146163, "epoch": 1207} {"train_loss": -40.15877914428711, "global_step": 146164, "epoch": 1207} {"train_loss": -40.11348342895508, "global_step": 146165, "epoch": 1207} {"train_loss": -40.2285270690918, "global_step": 146166, "epoch": 1207} {"train_loss": -38.80138198600328, "global_step": 146167, "epoch": 1207, "val_loss": 2773517.0} {"train_loss": -39.34070587158203, "global_step": 146168, "epoch": 1208} {"train_loss": -40.01417922973633, "global_step": 146169, "epoch": 1208} {"train_loss": -39.97807693481445, "global_step": 146170, "epoch": 1208} {"train_loss": -38.86087417602539, "global_step": 146171, "epoch": 1208} {"train_loss": -38.81820297241211, "global_step": 146172, "epoch": 1208} {"train_loss": -39.134925842285156, "global_step": 146173, "epoch": 1208} {"train_loss": -40.34498977661133, "global_step": 146174, "epoch": 1208} {"train_loss": -39.48579406738281, "global_step": 146175, "epoch": 1208} {"train_loss": -39.18946075439453, "global_step": 146176, "epoch": 1208} {"train_loss": -40.745391845703125, "global_step": 146177, "epoch": 1208} {"train_loss": -38.92918014526367, "global_step": 146178, "epoch": 1208} {"train_loss": -39.4260139465332, "global_step": 146179, "epoch": 1208} {"train_loss": -40.15763473510742, "global_step": 146180, "epoch": 1208} {"train_loss": -40.179412841796875, "global_step": 146181, "epoch": 1208} {"train_loss": -38.29777145385742, "global_step": 146182, "epoch": 1208} {"train_loss": -39.882232666015625, "global_step": 146183, "epoch": 1208} {"train_loss": -40.594818115234375, "global_step": 146184, "epoch": 1208} {"train_loss": -39.44630813598633, "global_step": 146185, "epoch": 1208} {"train_loss": -40.365570068359375, "global_step": 146186, "epoch": 1208} {"train_loss": -40.73502731323242, "global_step": 146187, "epoch": 1208} {"train_loss": -39.57625961303711, "global_step": 146188, "epoch": 1208} {"train_loss": -40.624183654785156, "global_step": 146189, "epoch": 1208} {"train_loss": -40.696285247802734, "global_step": 146190, "epoch": 1208} {"train_loss": -39.57658386230469, "global_step": 146191, "epoch": 1208} {"train_loss": -41.384986877441406, "global_step": 146192, "epoch": 1208} {"train_loss": -39.95388412475586, "global_step": 146193, "epoch": 1208} {"train_loss": -39.91600036621094, "global_step": 146194, "epoch": 1208} {"train_loss": -40.47191619873047, "global_step": 146195, "epoch": 1208} {"train_loss": -40.5158576965332, "global_step": 146196, "epoch": 1208} {"train_loss": -40.474708557128906, "global_step": 146197, "epoch": 1208} {"train_loss": -41.08797836303711, "global_step": 146198, "epoch": 1208} {"train_loss": -40.431819915771484, "global_step": 146199, "epoch": 1208} {"train_loss": -40.70192337036133, "global_step": 146200, "epoch": 1208} {"train_loss": -40.91079330444336, "global_step": 146201, "epoch": 1208} {"train_loss": -41.00922775268555, "global_step": 146202, "epoch": 1208} {"train_loss": -41.03737258911133, "global_step": 146203, "epoch": 1208} {"train_loss": -41.0655632019043, "global_step": 146204, "epoch": 1208} {"train_loss": -41.15791320800781, "global_step": 146205, "epoch": 1208} {"train_loss": -41.08108139038086, "global_step": 146206, "epoch": 1208} {"train_loss": -41.2252311706543, "global_step": 146207, "epoch": 1208} {"train_loss": -40.88740921020508, "global_step": 146208, "epoch": 1208} {"train_loss": -41.11470413208008, "global_step": 146209, "epoch": 1208} {"train_loss": -40.90702438354492, "global_step": 146210, "epoch": 1208} {"train_loss": -40.60959243774414, "global_step": 146211, "epoch": 1208} {"train_loss": -39.71675491333008, "global_step": 146212, "epoch": 1208} {"train_loss": -39.60643768310547, "global_step": 146213, "epoch": 1208} {"train_loss": -39.87356185913086, "global_step": 146214, "epoch": 1208} {"train_loss": -39.98222732543945, "global_step": 146215, "epoch": 1208} {"train_loss": -40.58648681640625, "global_step": 146216, "epoch": 1208} {"train_loss": -40.933895111083984, "global_step": 146217, "epoch": 1208} {"train_loss": -40.18988800048828, "global_step": 146218, "epoch": 1208} {"train_loss": -39.39023971557617, "global_step": 146219, "epoch": 1208} {"train_loss": -38.61027145385742, "global_step": 146220, "epoch": 1208} {"train_loss": -38.70096206665039, "global_step": 146221, "epoch": 1208} {"train_loss": -38.70041275024414, "global_step": 146222, "epoch": 1208} {"train_loss": -39.98261642456055, "global_step": 146223, "epoch": 1208} {"train_loss": -40.483516693115234, "global_step": 146224, "epoch": 1208} {"train_loss": -39.954002380371094, "global_step": 146225, "epoch": 1208} {"train_loss": -37.7629508972168, "global_step": 146226, "epoch": 1208} {"train_loss": -38.77088165283203, "global_step": 146227, "epoch": 1208} {"train_loss": -39.769561767578125, "global_step": 146228, "epoch": 1208} {"train_loss": -40.09577941894531, "global_step": 146229, "epoch": 1208} {"train_loss": -39.59108352661133, "global_step": 146230, "epoch": 1208} {"train_loss": -40.536346435546875, "global_step": 146231, "epoch": 1208} {"train_loss": -39.867591857910156, "global_step": 146232, "epoch": 1208} {"train_loss": -40.24143600463867, "global_step": 146233, "epoch": 1208} {"train_loss": -39.636024475097656, "global_step": 146234, "epoch": 1208} {"train_loss": -39.7847785949707, "global_step": 146235, "epoch": 1208} {"train_loss": -39.931785583496094, "global_step": 146236, "epoch": 1208} {"train_loss": -40.545894622802734, "global_step": 146237, "epoch": 1208} {"train_loss": -39.51394271850586, "global_step": 146238, "epoch": 1208} {"train_loss": -39.7470703125, "global_step": 146239, "epoch": 1208} {"train_loss": -40.31713104248047, "global_step": 146240, "epoch": 1208} {"train_loss": -40.11091232299805, "global_step": 146241, "epoch": 1208} {"train_loss": -40.21809005737305, "global_step": 146242, "epoch": 1208} {"train_loss": -40.0856819152832, "global_step": 146243, "epoch": 1208} {"train_loss": -40.459014892578125, "global_step": 146244, "epoch": 1208} {"train_loss": -40.17190170288086, "global_step": 146245, "epoch": 1208} {"train_loss": -40.42852783203125, "global_step": 146246, "epoch": 1208} {"train_loss": -40.84517288208008, "global_step": 146247, "epoch": 1208} {"train_loss": -39.957237243652344, "global_step": 146248, "epoch": 1208} {"train_loss": -40.63025665283203, "global_step": 146249, "epoch": 1208} {"train_loss": -39.85955047607422, "global_step": 146250, "epoch": 1208} {"train_loss": -39.991390228271484, "global_step": 146251, "epoch": 1208} {"train_loss": -39.3408317565918, "global_step": 146252, "epoch": 1208} {"train_loss": -38.91608810424805, "global_step": 146253, "epoch": 1208} {"train_loss": -38.65797805786133, "global_step": 146254, "epoch": 1208} {"train_loss": -39.654876708984375, "global_step": 146255, "epoch": 1208} {"train_loss": -40.13924026489258, "global_step": 146256, "epoch": 1208} {"train_loss": -40.935298919677734, "global_step": 146257, "epoch": 1208} {"train_loss": -40.62972640991211, "global_step": 146258, "epoch": 1208} {"train_loss": -40.776851654052734, "global_step": 146259, "epoch": 1208} {"train_loss": -40.18014144897461, "global_step": 146260, "epoch": 1208} {"train_loss": -40.55874252319336, "global_step": 146261, "epoch": 1208} {"train_loss": -40.96169662475586, "global_step": 146262, "epoch": 1208} {"train_loss": -40.72038269042969, "global_step": 146263, "epoch": 1208} {"train_loss": -40.72602462768555, "global_step": 146264, "epoch": 1208} {"train_loss": -40.88579177856445, "global_step": 146265, "epoch": 1208} {"train_loss": -41.01096725463867, "global_step": 146266, "epoch": 1208} {"train_loss": -41.14681625366211, "global_step": 146267, "epoch": 1208} {"train_loss": -40.53817367553711, "global_step": 146268, "epoch": 1208} {"train_loss": -39.62092208862305, "global_step": 146269, "epoch": 1208} {"train_loss": -39.70781326293945, "global_step": 146270, "epoch": 1208} {"train_loss": -41.0009651184082, "global_step": 146271, "epoch": 1208} {"train_loss": -40.85476303100586, "global_step": 146272, "epoch": 1208} {"train_loss": -40.95852279663086, "global_step": 146273, "epoch": 1208} {"train_loss": -40.97685623168945, "global_step": 146274, "epoch": 1208} {"train_loss": -40.609195709228516, "global_step": 146275, "epoch": 1208} {"train_loss": -40.07564926147461, "global_step": 146276, "epoch": 1208} {"train_loss": -40.119258880615234, "global_step": 146277, "epoch": 1208} {"train_loss": -40.54021072387695, "global_step": 146278, "epoch": 1208} {"train_loss": -40.122676849365234, "global_step": 146279, "epoch": 1208} {"train_loss": -39.30398941040039, "global_step": 146280, "epoch": 1208} {"train_loss": -39.910888671875, "global_step": 146281, "epoch": 1208} {"train_loss": -39.33506774902344, "global_step": 146282, "epoch": 1208} {"train_loss": -38.50570297241211, "global_step": 146283, "epoch": 1208} {"train_loss": -40.23706817626953, "global_step": 146284, "epoch": 1208} {"train_loss": -40.470455169677734, "global_step": 146285, "epoch": 1208} {"train_loss": -37.696502685546875, "global_step": 146286, "epoch": 1208} {"train_loss": -40.2146110534668, "global_step": 146287, "epoch": 1208} {"train_loss": -40.085791753343315, "global_step": 146288, "epoch": 1208, "val_loss": 2892122.0} {"train_loss": -37.32064437866211, "global_step": 146289, "epoch": 1209} {"train_loss": -37.664520263671875, "global_step": 146290, "epoch": 1209} {"train_loss": -36.11859893798828, "global_step": 146291, "epoch": 1209} {"train_loss": -39.03641891479492, "global_step": 146292, "epoch": 1209} {"train_loss": -38.457454681396484, "global_step": 146293, "epoch": 1209} {"train_loss": -38.249202728271484, "global_step": 146294, "epoch": 1209} {"train_loss": -38.71168899536133, "global_step": 146295, "epoch": 1209} {"train_loss": -38.57969284057617, "global_step": 146296, "epoch": 1209} {"train_loss": -37.12360763549805, "global_step": 146297, "epoch": 1209} {"train_loss": -38.58487319946289, "global_step": 146298, "epoch": 1209} {"train_loss": -40.2444953918457, "global_step": 146299, "epoch": 1209} {"train_loss": -38.68848419189453, "global_step": 146300, "epoch": 1209} {"train_loss": -39.42098617553711, "global_step": 146301, "epoch": 1209} {"train_loss": -39.746131896972656, "global_step": 146302, "epoch": 1209} {"train_loss": -39.187557220458984, "global_step": 146303, "epoch": 1209} {"train_loss": -39.698455810546875, "global_step": 146304, "epoch": 1209} {"train_loss": -39.17281723022461, "global_step": 146305, "epoch": 1209} {"train_loss": -36.70771408081055, "global_step": 146306, "epoch": 1209} {"train_loss": -39.57422637939453, "global_step": 146307, "epoch": 1209} {"train_loss": -39.9404182434082, "global_step": 146308, "epoch": 1209} {"train_loss": -38.64716720581055, "global_step": 146309, "epoch": 1209} {"train_loss": -39.788997650146484, "global_step": 146310, "epoch": 1209} {"train_loss": -39.931182861328125, "global_step": 146311, "epoch": 1209} {"train_loss": -39.88624954223633, "global_step": 146312, "epoch": 1209} {"train_loss": -40.00330352783203, "global_step": 146313, "epoch": 1209} {"train_loss": -39.733497619628906, "global_step": 146314, "epoch": 1209} {"train_loss": -39.26817321777344, "global_step": 146315, "epoch": 1209} {"train_loss": -40.481075286865234, "global_step": 146316, "epoch": 1209} {"train_loss": -39.437835693359375, "global_step": 146317, "epoch": 1209} {"train_loss": -40.33736801147461, "global_step": 146318, "epoch": 1209} {"train_loss": -40.1959342956543, "global_step": 146319, "epoch": 1209} {"train_loss": -40.371212005615234, "global_step": 146320, "epoch": 1209} {"train_loss": -40.33058166503906, "global_step": 146321, "epoch": 1209} {"train_loss": -40.43777847290039, "global_step": 146322, "epoch": 1209} {"train_loss": -40.105472564697266, "global_step": 146323, "epoch": 1209} {"train_loss": -40.25334548950195, "global_step": 146324, "epoch": 1209} {"train_loss": -40.681800842285156, "global_step": 146325, "epoch": 1209} {"train_loss": -40.613502502441406, "global_step": 146326, "epoch": 1209} {"train_loss": -40.3830451965332, "global_step": 146327, "epoch": 1209} {"train_loss": -40.544647216796875, "global_step": 146328, "epoch": 1209} {"train_loss": -40.887874603271484, "global_step": 146329, "epoch": 1209} {"train_loss": -40.49395751953125, "global_step": 146330, "epoch": 1209} {"train_loss": -40.4710807800293, "global_step": 146331, "epoch": 1209} {"train_loss": -40.90913009643555, "global_step": 146332, "epoch": 1209} {"train_loss": -40.59946060180664, "global_step": 146333, "epoch": 1209} {"train_loss": -40.692115783691406, "global_step": 146334, "epoch": 1209} {"train_loss": -40.7049674987793, "global_step": 146335, "epoch": 1209} {"train_loss": -40.87601852416992, "global_step": 146336, "epoch": 1209} {"train_loss": -40.64262008666992, "global_step": 146337, "epoch": 1209} {"train_loss": -40.90955352783203, "global_step": 146338, "epoch": 1209} {"train_loss": -39.948944091796875, "global_step": 146339, "epoch": 1209} {"train_loss": -40.99430465698242, "global_step": 146340, "epoch": 1209} {"train_loss": -41.077938079833984, "global_step": 146341, "epoch": 1209} {"train_loss": -41.313907623291016, "global_step": 146342, "epoch": 1209} {"train_loss": -40.790382385253906, "global_step": 146343, "epoch": 1209} {"train_loss": -41.03004455566406, "global_step": 146344, "epoch": 1209} {"train_loss": -41.44702911376953, "global_step": 146345, "epoch": 1209} {"train_loss": -41.23461151123047, "global_step": 146346, "epoch": 1209} {"train_loss": -41.7005500793457, "global_step": 146347, "epoch": 1209} {"train_loss": -41.335994720458984, "global_step": 146348, "epoch": 1209} {"train_loss": -41.34244918823242, "global_step": 146349, "epoch": 1209} {"train_loss": -41.210182189941406, "global_step": 146350, "epoch": 1209} {"train_loss": -41.55231857299805, "global_step": 146351, "epoch": 1209} {"train_loss": -41.09635543823242, "global_step": 146352, "epoch": 1209} {"train_loss": -41.49860382080078, "global_step": 146353, "epoch": 1209} {"train_loss": -41.48210906982422, "global_step": 146354, "epoch": 1209} {"train_loss": -41.443634033203125, "global_step": 146355, "epoch": 1209} {"train_loss": -41.65126419067383, "global_step": 146356, "epoch": 1209} {"train_loss": -41.27232360839844, "global_step": 146357, "epoch": 1209} {"train_loss": -41.823646545410156, "global_step": 146358, "epoch": 1209} {"train_loss": -40.79945755004883, "global_step": 146359, "epoch": 1209} {"train_loss": -41.824703216552734, "global_step": 146360, "epoch": 1209} {"train_loss": -40.87679672241211, "global_step": 146361, "epoch": 1209} {"train_loss": -40.91928482055664, "global_step": 146362, "epoch": 1209} {"train_loss": -40.528564453125, "global_step": 146363, "epoch": 1209} {"train_loss": -40.91826629638672, "global_step": 146364, "epoch": 1209} {"train_loss": -40.8900032043457, "global_step": 146365, "epoch": 1209} {"train_loss": -40.87739944458008, "global_step": 146366, "epoch": 1209} {"train_loss": -41.30974578857422, "global_step": 146367, "epoch": 1209} {"train_loss": -40.44511032104492, "global_step": 146368, "epoch": 1209} {"train_loss": -40.198585510253906, "global_step": 146369, "epoch": 1209} {"train_loss": -40.77239227294922, "global_step": 146370, "epoch": 1209} {"train_loss": -39.62596893310547, "global_step": 146371, "epoch": 1209} {"train_loss": -37.932472229003906, "global_step": 146372, "epoch": 1209} {"train_loss": -39.666988372802734, "global_step": 146373, "epoch": 1209} {"train_loss": -38.0699462890625, "global_step": 146374, "epoch": 1209} {"train_loss": -37.45600128173828, "global_step": 146375, "epoch": 1209} {"train_loss": -39.5915412902832, "global_step": 146376, "epoch": 1209} {"train_loss": -37.82756423950195, "global_step": 146377, "epoch": 1209} {"train_loss": -39.699703216552734, "global_step": 146378, "epoch": 1209} {"train_loss": -40.205902099609375, "global_step": 146379, "epoch": 1209} {"train_loss": -39.4444694519043, "global_step": 146380, "epoch": 1209} {"train_loss": -39.779876708984375, "global_step": 146381, "epoch": 1209} {"train_loss": -38.030479431152344, "global_step": 146382, "epoch": 1209} {"train_loss": -37.75788497924805, "global_step": 146383, "epoch": 1209} {"train_loss": -37.84469223022461, "global_step": 146384, "epoch": 1209} {"train_loss": -40.049072265625, "global_step": 146385, "epoch": 1209} {"train_loss": -40.34425354003906, "global_step": 146386, "epoch": 1209} {"train_loss": -37.186092376708984, "global_step": 146387, "epoch": 1209} {"train_loss": -36.8196907043457, "global_step": 146388, "epoch": 1209} {"train_loss": -39.34716796875, "global_step": 146389, "epoch": 1209} {"train_loss": -40.82014846801758, "global_step": 146390, "epoch": 1209} {"train_loss": -38.762149810791016, "global_step": 146391, "epoch": 1209} {"train_loss": -38.133052825927734, "global_step": 146392, "epoch": 1209} {"train_loss": -40.45707321166992, "global_step": 146393, "epoch": 1209} {"train_loss": -39.94894027709961, "global_step": 146394, "epoch": 1209} {"train_loss": -39.265174865722656, "global_step": 146395, "epoch": 1209} {"train_loss": -40.56303024291992, "global_step": 146396, "epoch": 1209} {"train_loss": -39.073421478271484, "global_step": 146397, "epoch": 1209} {"train_loss": -40.243465423583984, "global_step": 146398, "epoch": 1209} {"train_loss": -40.280269622802734, "global_step": 146399, "epoch": 1209} {"train_loss": -39.385337829589844, "global_step": 146400, "epoch": 1209} {"train_loss": -40.8677978515625, "global_step": 146401, "epoch": 1209} {"train_loss": -40.73635482788086, "global_step": 146402, "epoch": 1209} {"train_loss": -39.76409912109375, "global_step": 146403, "epoch": 1209} {"train_loss": -39.549007415771484, "global_step": 146404, "epoch": 1209} {"train_loss": -40.27722930908203, "global_step": 146405, "epoch": 1209} {"train_loss": -40.35866928100586, "global_step": 146406, "epoch": 1209} {"train_loss": -41.05617904663086, "global_step": 146407, "epoch": 1209} {"train_loss": -40.32121276855469, "global_step": 146408, "epoch": 1209} {"train_loss": -39.939936488127906, "global_step": 146409, "epoch": 1209, "val_loss": 2852502.75} {"train_loss": -41.18619918823242, "global_step": 146410, "epoch": 1210} {"train_loss": -39.65287399291992, "global_step": 146411, "epoch": 1210} {"train_loss": -40.66209030151367, "global_step": 146412, "epoch": 1210} {"train_loss": -39.52839279174805, "global_step": 146413, "epoch": 1210} {"train_loss": -40.57080841064453, "global_step": 146414, "epoch": 1210} {"train_loss": -40.66682052612305, "global_step": 146415, "epoch": 1210} {"train_loss": -40.75431442260742, "global_step": 146416, "epoch": 1210} {"train_loss": -40.988826751708984, "global_step": 146417, "epoch": 1210} {"train_loss": -40.535675048828125, "global_step": 146418, "epoch": 1210} {"train_loss": -41.36848068237305, "global_step": 146419, "epoch": 1210} {"train_loss": -41.035701751708984, "global_step": 146420, "epoch": 1210} {"train_loss": -40.676612854003906, "global_step": 146421, "epoch": 1210} {"train_loss": -40.839534759521484, "global_step": 146422, "epoch": 1210} {"train_loss": -40.160221099853516, "global_step": 146423, "epoch": 1210} {"train_loss": -38.269256591796875, "global_step": 146424, "epoch": 1210} {"train_loss": -42.092041015625, "global_step": 146425, "epoch": 1210} {"train_loss": -40.65911865234375, "global_step": 146426, "epoch": 1210} {"train_loss": -41.05953598022461, "global_step": 146427, "epoch": 1210} {"train_loss": -40.2917594909668, "global_step": 146428, "epoch": 1210} {"train_loss": -40.251834869384766, "global_step": 146429, "epoch": 1210} {"train_loss": -38.9421501159668, "global_step": 146430, "epoch": 1210} {"train_loss": -39.57371520996094, "global_step": 146431, "epoch": 1210} {"train_loss": -38.386009216308594, "global_step": 146432, "epoch": 1210} {"train_loss": -38.5513801574707, "global_step": 146433, "epoch": 1210} {"train_loss": -39.5023307800293, "global_step": 146434, "epoch": 1210} {"train_loss": -41.116065979003906, "global_step": 146435, "epoch": 1210} {"train_loss": -40.75373840332031, "global_step": 146436, "epoch": 1210} {"train_loss": -39.39597702026367, "global_step": 146437, "epoch": 1210} {"train_loss": -40.161739349365234, "global_step": 146438, "epoch": 1210} {"train_loss": -39.738983154296875, "global_step": 146439, "epoch": 1210} {"train_loss": -39.93048095703125, "global_step": 146440, "epoch": 1210} {"train_loss": -39.77981185913086, "global_step": 146441, "epoch": 1210} {"train_loss": -41.0853157043457, "global_step": 146442, "epoch": 1210} {"train_loss": -40.20491409301758, "global_step": 146443, "epoch": 1210} {"train_loss": -39.817108154296875, "global_step": 146444, "epoch": 1210} {"train_loss": -40.310665130615234, "global_step": 146445, "epoch": 1210} {"train_loss": -40.6635627746582, "global_step": 146446, "epoch": 1210} {"train_loss": -40.28988265991211, "global_step": 146447, "epoch": 1210} {"train_loss": -40.520668029785156, "global_step": 146448, "epoch": 1210} {"train_loss": -39.813838958740234, "global_step": 146449, "epoch": 1210} {"train_loss": -40.12531661987305, "global_step": 146450, "epoch": 1210} {"train_loss": -38.351497650146484, "global_step": 146451, "epoch": 1210} {"train_loss": -40.18477249145508, "global_step": 146452, "epoch": 1210} {"train_loss": -41.183773040771484, "global_step": 146453, "epoch": 1210} {"train_loss": -39.34224319458008, "global_step": 146454, "epoch": 1210} {"train_loss": -40.11328125, "global_step": 146455, "epoch": 1210} {"train_loss": -40.739845275878906, "global_step": 146456, "epoch": 1210} {"train_loss": -40.681312561035156, "global_step": 146457, "epoch": 1210} {"train_loss": -38.798240661621094, "global_step": 146458, "epoch": 1210} {"train_loss": -39.073394775390625, "global_step": 146459, "epoch": 1210} {"train_loss": -40.83891677856445, "global_step": 146460, "epoch": 1210} {"train_loss": -40.30476379394531, "global_step": 146461, "epoch": 1210} {"train_loss": -38.85207748413086, "global_step": 146462, "epoch": 1210} {"train_loss": -39.06732177734375, "global_step": 146463, "epoch": 1210} {"train_loss": -40.696754455566406, "global_step": 146464, "epoch": 1210} {"train_loss": -40.10325241088867, "global_step": 146465, "epoch": 1210} {"train_loss": -39.88154602050781, "global_step": 146466, "epoch": 1210} {"train_loss": -39.9033088684082, "global_step": 146467, "epoch": 1210} {"train_loss": -41.4124641418457, "global_step": 146468, "epoch": 1210} {"train_loss": -40.06352615356445, "global_step": 146469, "epoch": 1210} {"train_loss": -39.96451950073242, "global_step": 146470, "epoch": 1210} {"train_loss": -40.964962005615234, "global_step": 146471, "epoch": 1210} {"train_loss": -39.35915756225586, "global_step": 146472, "epoch": 1210} {"train_loss": -39.624000549316406, "global_step": 146473, "epoch": 1210} {"train_loss": -40.70219802856445, "global_step": 146474, "epoch": 1210} {"train_loss": -41.01816177368164, "global_step": 146475, "epoch": 1210} {"train_loss": -39.89773178100586, "global_step": 146476, "epoch": 1210} {"train_loss": -40.071346282958984, "global_step": 146477, "epoch": 1210} {"train_loss": -39.9503059387207, "global_step": 146478, "epoch": 1210} {"train_loss": -41.43721389770508, "global_step": 146479, "epoch": 1210} {"train_loss": -40.55714797973633, "global_step": 146480, "epoch": 1210} {"train_loss": -40.66437911987305, "global_step": 146481, "epoch": 1210} {"train_loss": -41.309967041015625, "global_step": 146482, "epoch": 1210} {"train_loss": -40.851375579833984, "global_step": 146483, "epoch": 1210} {"train_loss": -40.98102951049805, "global_step": 146484, "epoch": 1210} {"train_loss": -41.039337158203125, "global_step": 146485, "epoch": 1210} {"train_loss": -40.59365463256836, "global_step": 146486, "epoch": 1210} {"train_loss": -41.389007568359375, "global_step": 146487, "epoch": 1210} {"train_loss": -40.911617279052734, "global_step": 146488, "epoch": 1210} {"train_loss": -39.80230712890625, "global_step": 146489, "epoch": 1210} {"train_loss": -39.96963119506836, "global_step": 146490, "epoch": 1210} {"train_loss": -41.29014205932617, "global_step": 146491, "epoch": 1210} {"train_loss": -40.73223876953125, "global_step": 146492, "epoch": 1210} {"train_loss": -40.312416076660156, "global_step": 146493, "epoch": 1210} {"train_loss": -40.181427001953125, "global_step": 146494, "epoch": 1210} {"train_loss": -39.73299026489258, "global_step": 146495, "epoch": 1210} {"train_loss": -40.34275817871094, "global_step": 146496, "epoch": 1210} {"train_loss": -40.9050407409668, "global_step": 146497, "epoch": 1210} {"train_loss": -41.13263702392578, "global_step": 146498, "epoch": 1210} {"train_loss": -41.05727767944336, "global_step": 146499, "epoch": 1210} {"train_loss": -39.5147705078125, "global_step": 146500, "epoch": 1210} {"train_loss": -40.564571380615234, "global_step": 146501, "epoch": 1210} {"train_loss": -40.61530303955078, "global_step": 146502, "epoch": 1210} {"train_loss": -40.9560432434082, "global_step": 146503, "epoch": 1210} {"train_loss": -41.10451889038086, "global_step": 146504, "epoch": 1210} {"train_loss": -40.87861251831055, "global_step": 146505, "epoch": 1210} {"train_loss": -41.29351806640625, "global_step": 146506, "epoch": 1210} {"train_loss": -41.3062744140625, "global_step": 146507, "epoch": 1210} {"train_loss": -40.821022033691406, "global_step": 146508, "epoch": 1210} {"train_loss": -41.402099609375, "global_step": 146509, "epoch": 1210} {"train_loss": -41.42136001586914, "global_step": 146510, "epoch": 1210} {"train_loss": -41.27029037475586, "global_step": 146511, "epoch": 1210} {"train_loss": -40.36479568481445, "global_step": 146512, "epoch": 1210} {"train_loss": -41.42563247680664, "global_step": 146513, "epoch": 1210} {"train_loss": -39.800716400146484, "global_step": 146514, "epoch": 1210} {"train_loss": -39.6928825378418, "global_step": 146515, "epoch": 1210} {"train_loss": -39.90183639526367, "global_step": 146516, "epoch": 1210} {"train_loss": -40.200706481933594, "global_step": 146517, "epoch": 1210} {"train_loss": -40.23382568359375, "global_step": 146518, "epoch": 1210} {"train_loss": -38.89322280883789, "global_step": 146519, "epoch": 1210} {"train_loss": -38.08064651489258, "global_step": 146520, "epoch": 1210} {"train_loss": -34.77759552001953, "global_step": 146521, "epoch": 1210} {"train_loss": -38.84000778198242, "global_step": 146522, "epoch": 1210} {"train_loss": -41.01772689819336, "global_step": 146523, "epoch": 1210} {"train_loss": -38.76481246948242, "global_step": 146524, "epoch": 1210} {"train_loss": -38.4537353515625, "global_step": 146525, "epoch": 1210} {"train_loss": -39.12213897705078, "global_step": 146526, "epoch": 1210} {"train_loss": -30.12737464904785, "global_step": 146527, "epoch": 1210} {"train_loss": -36.61786651611328, "global_step": 146528, "epoch": 1210} {"train_loss": -38.56172561645508, "global_step": 146529, "epoch": 1210} {"train_loss": -40.0997334472404, "global_step": 146530, "epoch": 1210, "val_loss": 2770804.25} {"train_loss": -36.85322189331055, "global_step": 146531, "epoch": 1211} {"train_loss": -39.87959289550781, "global_step": 146532, "epoch": 1211} {"train_loss": -38.23417282104492, "global_step": 146533, "epoch": 1211} {"train_loss": -39.2447395324707, "global_step": 146534, "epoch": 1211} {"train_loss": -34.00187301635742, "global_step": 146535, "epoch": 1211} {"train_loss": -38.59554672241211, "global_step": 146536, "epoch": 1211} {"train_loss": -38.35917282104492, "global_step": 146537, "epoch": 1211} {"train_loss": -37.94125747680664, "global_step": 146538, "epoch": 1211} {"train_loss": -38.58835983276367, "global_step": 146539, "epoch": 1211} {"train_loss": -39.341793060302734, "global_step": 146540, "epoch": 1211} {"train_loss": -36.519081115722656, "global_step": 146541, "epoch": 1211} {"train_loss": -37.99011993408203, "global_step": 146542, "epoch": 1211} {"train_loss": -38.77082443237305, "global_step": 146543, "epoch": 1211} {"train_loss": -38.727508544921875, "global_step": 146544, "epoch": 1211} {"train_loss": -38.42509078979492, "global_step": 146545, "epoch": 1211} {"train_loss": -38.02216339111328, "global_step": 146546, "epoch": 1211} {"train_loss": -38.011810302734375, "global_step": 146547, "epoch": 1211} {"train_loss": -39.628231048583984, "global_step": 146548, "epoch": 1211} {"train_loss": -38.45761489868164, "global_step": 146549, "epoch": 1211} {"train_loss": -35.958343505859375, "global_step": 146550, "epoch": 1211} {"train_loss": -39.39374923706055, "global_step": 146551, "epoch": 1211} {"train_loss": -38.16428756713867, "global_step": 146552, "epoch": 1211} {"train_loss": -38.733150482177734, "global_step": 146553, "epoch": 1211} {"train_loss": -38.14748001098633, "global_step": 146554, "epoch": 1211} {"train_loss": -38.58217239379883, "global_step": 146555, "epoch": 1211} {"train_loss": -37.30528259277344, "global_step": 146556, "epoch": 1211} {"train_loss": -37.019134521484375, "global_step": 146557, "epoch": 1211} {"train_loss": -38.13597106933594, "global_step": 146558, "epoch": 1211} {"train_loss": -36.94447326660156, "global_step": 146559, "epoch": 1211} {"train_loss": -36.241424560546875, "global_step": 146560, "epoch": 1211} {"train_loss": -36.11436080932617, "global_step": 146561, "epoch": 1211} {"train_loss": -34.42038345336914, "global_step": 146562, "epoch": 1211} {"train_loss": -38.944087982177734, "global_step": 146563, "epoch": 1211} {"train_loss": -37.75806427001953, "global_step": 146564, "epoch": 1211} {"train_loss": -38.43778991699219, "global_step": 146565, "epoch": 1211} {"train_loss": -37.673274993896484, "global_step": 146566, "epoch": 1211} {"train_loss": -39.331905364990234, "global_step": 146567, "epoch": 1211} {"train_loss": -38.93324661254883, "global_step": 146568, "epoch": 1211} {"train_loss": -38.524654388427734, "global_step": 146569, "epoch": 1211} {"train_loss": -36.34804153442383, "global_step": 146570, "epoch": 1211} {"train_loss": -36.23763656616211, "global_step": 146571, "epoch": 1211} {"train_loss": -38.235206604003906, "global_step": 146572, "epoch": 1211} {"train_loss": -38.22507858276367, "global_step": 146573, "epoch": 1211} {"train_loss": -33.965843200683594, "global_step": 146574, "epoch": 1211} {"train_loss": -36.51686477661133, "global_step": 146575, "epoch": 1211} {"train_loss": -38.158721923828125, "global_step": 146576, "epoch": 1211} {"train_loss": -37.90004348754883, "global_step": 146577, "epoch": 1211} {"train_loss": -38.91838073730469, "global_step": 146578, "epoch": 1211} {"train_loss": -38.0474967956543, "global_step": 146579, "epoch": 1211} {"train_loss": -38.66679000854492, "global_step": 146580, "epoch": 1211} {"train_loss": -36.70527267456055, "global_step": 146581, "epoch": 1211} {"train_loss": -39.43620300292969, "global_step": 146582, "epoch": 1211} {"train_loss": -39.05595016479492, "global_step": 146583, "epoch": 1211} {"train_loss": -39.671241760253906, "global_step": 146584, "epoch": 1211} {"train_loss": -37.80144119262695, "global_step": 146585, "epoch": 1211} {"train_loss": -39.077152252197266, "global_step": 146586, "epoch": 1211} {"train_loss": -34.838035583496094, "global_step": 146587, "epoch": 1211} {"train_loss": -38.776588439941406, "global_step": 146588, "epoch": 1211} {"train_loss": -37.9287223815918, "global_step": 146589, "epoch": 1211} {"train_loss": -38.74314498901367, "global_step": 146590, "epoch": 1211} {"train_loss": -37.391075134277344, "global_step": 146591, "epoch": 1211} {"train_loss": -36.00848388671875, "global_step": 146592, "epoch": 1211} {"train_loss": -36.2562370300293, "global_step": 146593, "epoch": 1211} {"train_loss": -37.949676513671875, "global_step": 146594, "epoch": 1211} {"train_loss": -37.661197662353516, "global_step": 146595, "epoch": 1211} {"train_loss": -36.750022888183594, "global_step": 146596, "epoch": 1211} {"train_loss": -36.19727325439453, "global_step": 146597, "epoch": 1211} {"train_loss": -37.718807220458984, "global_step": 146598, "epoch": 1211} {"train_loss": -23.422550201416016, "global_step": 146599, "epoch": 1211} {"train_loss": -37.763309478759766, "global_step": 146600, "epoch": 1211} {"train_loss": -36.985816955566406, "global_step": 146601, "epoch": 1211} {"train_loss": -36.696903228759766, "global_step": 146602, "epoch": 1211} {"train_loss": -32.60602951049805, "global_step": 146603, "epoch": 1211} {"train_loss": -37.716583251953125, "global_step": 146604, "epoch": 1211} {"train_loss": -36.42206954956055, "global_step": 146605, "epoch": 1211} {"train_loss": -38.22333526611328, "global_step": 146606, "epoch": 1211} {"train_loss": -35.93760681152344, "global_step": 146607, "epoch": 1211} {"train_loss": -37.60218048095703, "global_step": 146608, "epoch": 1211} {"train_loss": -35.95559310913086, "global_step": 146609, "epoch": 1211} {"train_loss": -35.748653411865234, "global_step": 146610, "epoch": 1211} {"train_loss": -37.09370803833008, "global_step": 146611, "epoch": 1211} {"train_loss": -37.38928985595703, "global_step": 146612, "epoch": 1211} {"train_loss": -36.003047943115234, "global_step": 146613, "epoch": 1211} {"train_loss": -39.17291259765625, "global_step": 146614, "epoch": 1211} {"train_loss": -38.7167854309082, "global_step": 146615, "epoch": 1211} {"train_loss": -37.109779357910156, "global_step": 146616, "epoch": 1211} {"train_loss": -38.21271514892578, "global_step": 146617, "epoch": 1211} {"train_loss": -37.18081283569336, "global_step": 146618, "epoch": 1211} {"train_loss": -36.420658111572266, "global_step": 146619, "epoch": 1211} {"train_loss": -37.51249313354492, "global_step": 146620, "epoch": 1211} {"train_loss": -38.51874923706055, "global_step": 146621, "epoch": 1211} {"train_loss": -37.50897979736328, "global_step": 146622, "epoch": 1211} {"train_loss": -34.53474044799805, "global_step": 146623, "epoch": 1211} {"train_loss": -36.6251106262207, "global_step": 146624, "epoch": 1211} {"train_loss": -37.92441177368164, "global_step": 146625, "epoch": 1211} {"train_loss": -37.700904846191406, "global_step": 146626, "epoch": 1211} {"train_loss": -37.347747802734375, "global_step": 146627, "epoch": 1211} {"train_loss": -37.977325439453125, "global_step": 146628, "epoch": 1211} {"train_loss": -37.66146469116211, "global_step": 146629, "epoch": 1211} {"train_loss": -37.80970001220703, "global_step": 146630, "epoch": 1211} {"train_loss": -37.77534484863281, "global_step": 146631, "epoch": 1211} {"train_loss": -38.869258880615234, "global_step": 146632, "epoch": 1211} {"train_loss": -39.01911544799805, "global_step": 146633, "epoch": 1211} {"train_loss": -38.56869888305664, "global_step": 146634, "epoch": 1211} {"train_loss": -38.88843536376953, "global_step": 146635, "epoch": 1211} {"train_loss": -38.589046478271484, "global_step": 146636, "epoch": 1211} {"train_loss": -38.81216049194336, "global_step": 146637, "epoch": 1211} {"train_loss": -37.478946685791016, "global_step": 146638, "epoch": 1211} {"train_loss": -37.961116790771484, "global_step": 146639, "epoch": 1211} {"train_loss": -38.59376907348633, "global_step": 146640, "epoch": 1211} {"train_loss": -38.26786422729492, "global_step": 146641, "epoch": 1211} {"train_loss": -38.54551315307617, "global_step": 146642, "epoch": 1211} {"train_loss": -34.19832992553711, "global_step": 146643, "epoch": 1211} {"train_loss": -38.36526870727539, "global_step": 146644, "epoch": 1211} {"train_loss": -38.92413330078125, "global_step": 146645, "epoch": 1211} {"train_loss": -38.91477584838867, "global_step": 146646, "epoch": 1211} {"train_loss": -37.963157653808594, "global_step": 146647, "epoch": 1211} {"train_loss": -34.012107849121094, "global_step": 146648, "epoch": 1211} {"train_loss": -30.473356246948242, "global_step": 146649, "epoch": 1211} {"train_loss": -37.89411544799805, "global_step": 146650, "epoch": 1211} {"train_loss": -37.451688041371746, "global_step": 146651, "epoch": 1211, "val_loss": 3856207.25} {"train_loss": -37.19082260131836, "global_step": 146652, "epoch": 1212} {"train_loss": 24.439550399780273, "global_step": 146653, "epoch": 1212} {"train_loss": -35.19379806518555, "global_step": 146654, "epoch": 1212} {"train_loss": -35.02451705932617, "global_step": 146655, "epoch": 1212} {"train_loss": -31.3584041595459, "global_step": 146656, "epoch": 1212} {"train_loss": -23.961565017700195, "global_step": 146657, "epoch": 1212} {"train_loss": 11.086389541625977, "global_step": 146658, "epoch": 1212} {"train_loss": -35.50168991088867, "global_step": 146659, "epoch": 1212} {"train_loss": -33.56571578979492, "global_step": 146660, "epoch": 1212} {"train_loss": -21.441579818725586, "global_step": 146661, "epoch": 1212} {"train_loss": -26.448810577392578, "global_step": 146662, "epoch": 1212} {"train_loss": -27.652002334594727, "global_step": 146663, "epoch": 1212} {"train_loss": -29.08856773376465, "global_step": 146664, "epoch": 1212} {"train_loss": -29.258108139038086, "global_step": 146665, "epoch": 1212} {"train_loss": -30.065107345581055, "global_step": 146666, "epoch": 1212} {"train_loss": -31.074514389038086, "global_step": 146667, "epoch": 1212} {"train_loss": -33.98857498168945, "global_step": 146668, "epoch": 1212} {"train_loss": -28.633337020874023, "global_step": 146669, "epoch": 1212} {"train_loss": -32.7369270324707, "global_step": 146670, "epoch": 1212} {"train_loss": -30.99851417541504, "global_step": 146671, "epoch": 1212} {"train_loss": -32.55241012573242, "global_step": 146672, "epoch": 1212} {"train_loss": -32.46197509765625, "global_step": 146673, "epoch": 1212} {"train_loss": -33.40401077270508, "global_step": 146674, "epoch": 1212} {"train_loss": -31.06829261779785, "global_step": 146675, "epoch": 1212} {"train_loss": -34.23207473754883, "global_step": 146676, "epoch": 1212} {"train_loss": -33.81083297729492, "global_step": 146677, "epoch": 1212} {"train_loss": -34.98981857299805, "global_step": 146678, "epoch": 1212} {"train_loss": -34.14054489135742, "global_step": 146679, "epoch": 1212} {"train_loss": -33.63959884643555, "global_step": 146680, "epoch": 1212} {"train_loss": -34.33006286621094, "global_step": 146681, "epoch": 1212} {"train_loss": -34.60421371459961, "global_step": 146682, "epoch": 1212} {"train_loss": -35.1157112121582, "global_step": 146683, "epoch": 1212} {"train_loss": -34.5536003112793, "global_step": 146684, "epoch": 1212} {"train_loss": -35.33286666870117, "global_step": 146685, "epoch": 1212} {"train_loss": -35.2420768737793, "global_step": 146686, "epoch": 1212} {"train_loss": -36.18584060668945, "global_step": 146687, "epoch": 1212} {"train_loss": -34.94196319580078, "global_step": 146688, "epoch": 1212} {"train_loss": -35.267005920410156, "global_step": 146689, "epoch": 1212} {"train_loss": -35.40530014038086, "global_step": 146690, "epoch": 1212} {"train_loss": -35.384429931640625, "global_step": 146691, "epoch": 1212} {"train_loss": -36.31449508666992, "global_step": 146692, "epoch": 1212} {"train_loss": -35.39908981323242, "global_step": 146693, "epoch": 1212} {"train_loss": -35.53501510620117, "global_step": 146694, "epoch": 1212} {"train_loss": -35.836421966552734, "global_step": 146695, "epoch": 1212} {"train_loss": -35.75053787231445, "global_step": 146696, "epoch": 1212} {"train_loss": -35.021575927734375, "global_step": 146697, "epoch": 1212} {"train_loss": -35.4969596862793, "global_step": 146698, "epoch": 1212} {"train_loss": -35.42475509643555, "global_step": 146699, "epoch": 1212} {"train_loss": -35.41608428955078, "global_step": 146700, "epoch": 1212} {"train_loss": -35.90837478637695, "global_step": 146701, "epoch": 1212} {"train_loss": -35.888336181640625, "global_step": 146702, "epoch": 1212} {"train_loss": -35.333702087402344, "global_step": 146703, "epoch": 1212} {"train_loss": -35.40866470336914, "global_step": 146704, "epoch": 1212} {"train_loss": -36.418182373046875, "global_step": 146705, "epoch": 1212} {"train_loss": -35.56478500366211, "global_step": 146706, "epoch": 1212} {"train_loss": -35.88943099975586, "global_step": 146707, "epoch": 1212} {"train_loss": -36.408790588378906, "global_step": 146708, "epoch": 1212} {"train_loss": -36.38483810424805, "global_step": 146709, "epoch": 1212} {"train_loss": -37.043174743652344, "global_step": 146710, "epoch": 1212} {"train_loss": -36.5828971862793, "global_step": 146711, "epoch": 1212} {"train_loss": -36.807552337646484, "global_step": 146712, "epoch": 1212} {"train_loss": -35.390689849853516, "global_step": 146713, "epoch": 1212} {"train_loss": -36.752105712890625, "global_step": 146714, "epoch": 1212} {"train_loss": -36.81891632080078, "global_step": 146715, "epoch": 1212} {"train_loss": -36.893226623535156, "global_step": 146716, "epoch": 1212} {"train_loss": -36.14453125, "global_step": 146717, "epoch": 1212} {"train_loss": -36.82740020751953, "global_step": 146718, "epoch": 1212} {"train_loss": -36.90498733520508, "global_step": 146719, "epoch": 1212} {"train_loss": -37.03361892700195, "global_step": 146720, "epoch": 1212} {"train_loss": -36.45289993286133, "global_step": 146721, "epoch": 1212} {"train_loss": -37.775299072265625, "global_step": 146722, "epoch": 1212} {"train_loss": -37.331172943115234, "global_step": 146723, "epoch": 1212} {"train_loss": -36.80064392089844, "global_step": 146724, "epoch": 1212} {"train_loss": -37.03761291503906, "global_step": 146725, "epoch": 1212} {"train_loss": -37.562103271484375, "global_step": 146726, "epoch": 1212} {"train_loss": -36.75525665283203, "global_step": 146727, "epoch": 1212} {"train_loss": -37.62607955932617, "global_step": 146728, "epoch": 1212} {"train_loss": -37.009944915771484, "global_step": 146729, "epoch": 1212} {"train_loss": -38.13939666748047, "global_step": 146730, "epoch": 1212} {"train_loss": -37.68598175048828, "global_step": 146731, "epoch": 1212} {"train_loss": -37.87649154663086, "global_step": 146732, "epoch": 1212} {"train_loss": -37.38082504272461, "global_step": 146733, "epoch": 1212} {"train_loss": -37.63100051879883, "global_step": 146734, "epoch": 1212} {"train_loss": -37.61664962768555, "global_step": 146735, "epoch": 1212} {"train_loss": -38.433345794677734, "global_step": 146736, "epoch": 1212} {"train_loss": -37.588722229003906, "global_step": 146737, "epoch": 1212} {"train_loss": -36.9721794128418, "global_step": 146738, "epoch": 1212} {"train_loss": -37.0438346862793, "global_step": 146739, "epoch": 1212} {"train_loss": -37.43110275268555, "global_step": 146740, "epoch": 1212} {"train_loss": -37.915443420410156, "global_step": 146741, "epoch": 1212} {"train_loss": -38.4295539855957, "global_step": 146742, "epoch": 1212} {"train_loss": -38.172691345214844, "global_step": 146743, "epoch": 1212} {"train_loss": -37.730281829833984, "global_step": 146744, "epoch": 1212} {"train_loss": -37.53413009643555, "global_step": 146745, "epoch": 1212} {"train_loss": -38.02578353881836, "global_step": 146746, "epoch": 1212} {"train_loss": -37.72766876220703, "global_step": 146747, "epoch": 1212} {"train_loss": -38.2366828918457, "global_step": 146748, "epoch": 1212} {"train_loss": -38.96757125854492, "global_step": 146749, "epoch": 1212} {"train_loss": -38.219581604003906, "global_step": 146750, "epoch": 1212} {"train_loss": -37.7366828918457, "global_step": 146751, "epoch": 1212} {"train_loss": -38.01328659057617, "global_step": 146752, "epoch": 1212} {"train_loss": -37.5920524597168, "global_step": 146753, "epoch": 1212} {"train_loss": -37.759666442871094, "global_step": 146754, "epoch": 1212} {"train_loss": -38.39176559448242, "global_step": 146755, "epoch": 1212} {"train_loss": -38.96307373046875, "global_step": 146756, "epoch": 1212} {"train_loss": -38.449459075927734, "global_step": 146757, "epoch": 1212} {"train_loss": -38.50914001464844, "global_step": 146758, "epoch": 1212} {"train_loss": -38.61422348022461, "global_step": 146759, "epoch": 1212} {"train_loss": -38.60647201538086, "global_step": 146760, "epoch": 1212} {"train_loss": -37.782798767089844, "global_step": 146761, "epoch": 1212} {"train_loss": -38.500057220458984, "global_step": 146762, "epoch": 1212} {"train_loss": -38.72113800048828, "global_step": 146763, "epoch": 1212} {"train_loss": -38.48902130126953, "global_step": 146764, "epoch": 1212} {"train_loss": -37.53672409057617, "global_step": 146765, "epoch": 1212} {"train_loss": -38.360530853271484, "global_step": 146766, "epoch": 1212} {"train_loss": -37.30424118041992, "global_step": 146767, "epoch": 1212} {"train_loss": -39.26908874511719, "global_step": 146768, "epoch": 1212} {"train_loss": -39.376808166503906, "global_step": 146769, "epoch": 1212} {"train_loss": -38.9101676940918, "global_step": 146770, "epoch": 1212} {"train_loss": -38.551273345947266, "global_step": 146771, "epoch": 1212} {"train_loss": -34.90448860294563, "global_step": 146772, "epoch": 1212, "val_loss": 2582466.0} {"train_loss": -38.577796936035156, "global_step": 146773, "epoch": 1213} {"train_loss": -39.06513595581055, "global_step": 146774, "epoch": 1213} {"train_loss": -38.67745590209961, "global_step": 146775, "epoch": 1213} {"train_loss": -38.8557243347168, "global_step": 146776, "epoch": 1213} {"train_loss": -37.633941650390625, "global_step": 146777, "epoch": 1213} {"train_loss": -39.366943359375, "global_step": 146778, "epoch": 1213} {"train_loss": -39.409881591796875, "global_step": 146779, "epoch": 1213} {"train_loss": -38.74038314819336, "global_step": 146780, "epoch": 1213} {"train_loss": -39.574188232421875, "global_step": 146781, "epoch": 1213} {"train_loss": -39.37992858886719, "global_step": 146782, "epoch": 1213} {"train_loss": -39.7905158996582, "global_step": 146783, "epoch": 1213} {"train_loss": -38.70417404174805, "global_step": 146784, "epoch": 1213} {"train_loss": -39.74725341796875, "global_step": 146785, "epoch": 1213} {"train_loss": -38.48556137084961, "global_step": 146786, "epoch": 1213} {"train_loss": -39.79466247558594, "global_step": 146787, "epoch": 1213} {"train_loss": -37.266666412353516, "global_step": 146788, "epoch": 1213} {"train_loss": -39.42974853515625, "global_step": 146789, "epoch": 1213} {"train_loss": -38.99605941772461, "global_step": 146790, "epoch": 1213} {"train_loss": -38.91203689575195, "global_step": 146791, "epoch": 1213} {"train_loss": -39.65420150756836, "global_step": 146792, "epoch": 1213} {"train_loss": -39.502845764160156, "global_step": 146793, "epoch": 1213} {"train_loss": -39.21835708618164, "global_step": 146794, "epoch": 1213} {"train_loss": -39.59194564819336, "global_step": 146795, "epoch": 1213} {"train_loss": -39.21821212768555, "global_step": 146796, "epoch": 1213} {"train_loss": -39.3625602722168, "global_step": 146797, "epoch": 1213} {"train_loss": -39.57575225830078, "global_step": 146798, "epoch": 1213} {"train_loss": -38.441802978515625, "global_step": 146799, "epoch": 1213} {"train_loss": -38.874298095703125, "global_step": 146800, "epoch": 1213} {"train_loss": -39.024574279785156, "global_step": 146801, "epoch": 1213} {"train_loss": -38.79338455200195, "global_step": 146802, "epoch": 1213} {"train_loss": -39.42506408691406, "global_step": 146803, "epoch": 1213} {"train_loss": -37.47359848022461, "global_step": 146804, "epoch": 1213} {"train_loss": -35.2711181640625, "global_step": 146805, "epoch": 1213} {"train_loss": -37.583675384521484, "global_step": 146806, "epoch": 1213} {"train_loss": -39.15449905395508, "global_step": 146807, "epoch": 1213} {"train_loss": -36.45319747924805, "global_step": 146808, "epoch": 1213} {"train_loss": -29.893598556518555, "global_step": 146809, "epoch": 1213} {"train_loss": -29.81182289123535, "global_step": 146810, "epoch": 1213} {"train_loss": -34.74909591674805, "global_step": 146811, "epoch": 1213} {"train_loss": -38.543758392333984, "global_step": 146812, "epoch": 1213} {"train_loss": -36.70640182495117, "global_step": 146813, "epoch": 1213} {"train_loss": -37.29508590698242, "global_step": 146814, "epoch": 1213} {"train_loss": -37.81160354614258, "global_step": 146815, "epoch": 1213} {"train_loss": -37.75996780395508, "global_step": 146816, "epoch": 1213} {"train_loss": -38.75347900390625, "global_step": 146817, "epoch": 1213} {"train_loss": -38.57369613647461, "global_step": 146818, "epoch": 1213} {"train_loss": -38.360816955566406, "global_step": 146819, "epoch": 1213} {"train_loss": -38.3646354675293, "global_step": 146820, "epoch": 1213} {"train_loss": -37.80324935913086, "global_step": 146821, "epoch": 1213} {"train_loss": -39.031005859375, "global_step": 146822, "epoch": 1213} {"train_loss": -37.93461227416992, "global_step": 146823, "epoch": 1213} {"train_loss": -39.347320556640625, "global_step": 146824, "epoch": 1213} {"train_loss": -39.04336166381836, "global_step": 146825, "epoch": 1213} {"train_loss": -39.00498580932617, "global_step": 146826, "epoch": 1213} {"train_loss": -39.308170318603516, "global_step": 146827, "epoch": 1213} {"train_loss": -40.21140670776367, "global_step": 146828, "epoch": 1213} {"train_loss": -39.919490814208984, "global_step": 146829, "epoch": 1213} {"train_loss": -38.84035110473633, "global_step": 146830, "epoch": 1213} {"train_loss": -39.14530563354492, "global_step": 146831, "epoch": 1213} {"train_loss": -39.61334991455078, "global_step": 146832, "epoch": 1213} {"train_loss": -39.66130065917969, "global_step": 146833, "epoch": 1213} {"train_loss": -39.304622650146484, "global_step": 146834, "epoch": 1213} {"train_loss": -39.239036560058594, "global_step": 146835, "epoch": 1213} {"train_loss": -39.3017463684082, "global_step": 146836, "epoch": 1213} {"train_loss": -39.198238372802734, "global_step": 146837, "epoch": 1213} {"train_loss": -39.923614501953125, "global_step": 146838, "epoch": 1213} {"train_loss": -39.34351348876953, "global_step": 146839, "epoch": 1213} {"train_loss": -39.916866302490234, "global_step": 146840, "epoch": 1213} {"train_loss": -39.178741455078125, "global_step": 146841, "epoch": 1213} {"train_loss": -38.33502197265625, "global_step": 146842, "epoch": 1213} {"train_loss": -39.620269775390625, "global_step": 146843, "epoch": 1213} {"train_loss": -38.6094970703125, "global_step": 146844, "epoch": 1213} {"train_loss": -39.47444534301758, "global_step": 146845, "epoch": 1213} {"train_loss": -39.31425094604492, "global_step": 146846, "epoch": 1213} {"train_loss": -39.00564956665039, "global_step": 146847, "epoch": 1213} {"train_loss": -39.478946685791016, "global_step": 146848, "epoch": 1213} {"train_loss": -39.499603271484375, "global_step": 146849, "epoch": 1213} {"train_loss": -38.510894775390625, "global_step": 146850, "epoch": 1213} {"train_loss": -40.17402267456055, "global_step": 146851, "epoch": 1213} {"train_loss": -38.882930755615234, "global_step": 146852, "epoch": 1213} {"train_loss": -39.1944580078125, "global_step": 146853, "epoch": 1213} {"train_loss": -39.62595748901367, "global_step": 146854, "epoch": 1213} {"train_loss": -40.07868576049805, "global_step": 146855, "epoch": 1213} {"train_loss": -39.135284423828125, "global_step": 146856, "epoch": 1213} {"train_loss": -39.90401840209961, "global_step": 146857, "epoch": 1213} {"train_loss": -38.750213623046875, "global_step": 146858, "epoch": 1213} {"train_loss": -39.16791534423828, "global_step": 146859, "epoch": 1213} {"train_loss": -39.857826232910156, "global_step": 146860, "epoch": 1213} {"train_loss": -38.98125457763672, "global_step": 146861, "epoch": 1213} {"train_loss": -39.26872253417969, "global_step": 146862, "epoch": 1213} {"train_loss": -39.91693878173828, "global_step": 146863, "epoch": 1213} {"train_loss": -39.991920471191406, "global_step": 146864, "epoch": 1213} {"train_loss": -40.220340728759766, "global_step": 146865, "epoch": 1213} {"train_loss": -38.889801025390625, "global_step": 146866, "epoch": 1213} {"train_loss": -37.54169845581055, "global_step": 146867, "epoch": 1213} {"train_loss": -37.853675842285156, "global_step": 146868, "epoch": 1213} {"train_loss": -39.65128707885742, "global_step": 146869, "epoch": 1213} {"train_loss": -40.05207061767578, "global_step": 146870, "epoch": 1213} {"train_loss": -39.87416458129883, "global_step": 146871, "epoch": 1213} {"train_loss": -39.61227798461914, "global_step": 146872, "epoch": 1213} {"train_loss": -39.861000061035156, "global_step": 146873, "epoch": 1213} {"train_loss": -39.16252517700195, "global_step": 146874, "epoch": 1213} {"train_loss": -38.08252716064453, "global_step": 146875, "epoch": 1213} {"train_loss": -35.693538665771484, "global_step": 146876, "epoch": 1213} {"train_loss": -33.8374137878418, "global_step": 146877, "epoch": 1213} {"train_loss": -34.59017562866211, "global_step": 146878, "epoch": 1213} {"train_loss": -36.842594146728516, "global_step": 146879, "epoch": 1213} {"train_loss": -39.50701904296875, "global_step": 146880, "epoch": 1213} {"train_loss": -39.29660415649414, "global_step": 146881, "epoch": 1213} {"train_loss": -37.7061882019043, "global_step": 146882, "epoch": 1213} {"train_loss": -37.35527420043945, "global_step": 146883, "epoch": 1213} {"train_loss": -40.14512252807617, "global_step": 146884, "epoch": 1213} {"train_loss": -38.41535568237305, "global_step": 146885, "epoch": 1213} {"train_loss": -39.63290786743164, "global_step": 146886, "epoch": 1213} {"train_loss": -39.71947479248047, "global_step": 146887, "epoch": 1213} {"train_loss": -38.311241149902344, "global_step": 146888, "epoch": 1213} {"train_loss": -39.69441223144531, "global_step": 146889, "epoch": 1213} {"train_loss": -39.06531524658203, "global_step": 146890, "epoch": 1213} {"train_loss": -39.138648986816406, "global_step": 146891, "epoch": 1213} {"train_loss": -40.79561233520508, "global_step": 146892, "epoch": 1213} {"train_loss": -38.69368917291815, "global_step": 146893, "epoch": 1213, "val_loss": 2567980.25} {"train_loss": -40.03358840942383, "global_step": 146894, "epoch": 1214} {"train_loss": -39.532806396484375, "global_step": 146895, "epoch": 1214} {"train_loss": -39.40483093261719, "global_step": 146896, "epoch": 1214} {"train_loss": -39.890846252441406, "global_step": 146897, "epoch": 1214} {"train_loss": -39.80683135986328, "global_step": 146898, "epoch": 1214} {"train_loss": -39.57832717895508, "global_step": 146899, "epoch": 1214} {"train_loss": -39.698665618896484, "global_step": 146900, "epoch": 1214} {"train_loss": -40.24262237548828, "global_step": 146901, "epoch": 1214} {"train_loss": -39.792808532714844, "global_step": 146902, "epoch": 1214} {"train_loss": -40.283138275146484, "global_step": 146903, "epoch": 1214} {"train_loss": -40.39776611328125, "global_step": 146904, "epoch": 1214} {"train_loss": -40.490989685058594, "global_step": 146905, "epoch": 1214} {"train_loss": -40.315364837646484, "global_step": 146906, "epoch": 1214} {"train_loss": -40.50455093383789, "global_step": 146907, "epoch": 1214} {"train_loss": -40.5504264831543, "global_step": 146908, "epoch": 1214} {"train_loss": -40.017127990722656, "global_step": 146909, "epoch": 1214} {"train_loss": -40.822513580322266, "global_step": 146910, "epoch": 1214} {"train_loss": -40.89670181274414, "global_step": 146911, "epoch": 1214} {"train_loss": -40.15532302856445, "global_step": 146912, "epoch": 1214} {"train_loss": -39.944435119628906, "global_step": 146913, "epoch": 1214} {"train_loss": -40.759456634521484, "global_step": 146914, "epoch": 1214} {"train_loss": -40.408164978027344, "global_step": 146915, "epoch": 1214} {"train_loss": -40.15067672729492, "global_step": 146916, "epoch": 1214} {"train_loss": -40.55997848510742, "global_step": 146917, "epoch": 1214} {"train_loss": -38.88813400268555, "global_step": 146918, "epoch": 1214} {"train_loss": -40.73065948486328, "global_step": 146919, "epoch": 1214} {"train_loss": -38.81106185913086, "global_step": 146920, "epoch": 1214} {"train_loss": -40.30609130859375, "global_step": 146921, "epoch": 1214} {"train_loss": -40.2396125793457, "global_step": 146922, "epoch": 1214} {"train_loss": -39.69642639160156, "global_step": 146923, "epoch": 1214} {"train_loss": -39.846195220947266, "global_step": 146924, "epoch": 1214} {"train_loss": -40.52864456176758, "global_step": 146925, "epoch": 1214} {"train_loss": -39.937252044677734, "global_step": 146926, "epoch": 1214} {"train_loss": -39.19147491455078, "global_step": 146927, "epoch": 1214} {"train_loss": -40.26033020019531, "global_step": 146928, "epoch": 1214} {"train_loss": -39.71493911743164, "global_step": 146929, "epoch": 1214} {"train_loss": -39.48052978515625, "global_step": 146930, "epoch": 1214} {"train_loss": -40.186981201171875, "global_step": 146931, "epoch": 1214} {"train_loss": -39.65241241455078, "global_step": 146932, "epoch": 1214} {"train_loss": -39.01459503173828, "global_step": 146933, "epoch": 1214} {"train_loss": -38.58565902709961, "global_step": 146934, "epoch": 1214} {"train_loss": -37.78212356567383, "global_step": 146935, "epoch": 1214} {"train_loss": -39.675960540771484, "global_step": 146936, "epoch": 1214} {"train_loss": -39.84978485107422, "global_step": 146937, "epoch": 1214} {"train_loss": -39.21952438354492, "global_step": 146938, "epoch": 1214} {"train_loss": -37.324317932128906, "global_step": 146939, "epoch": 1214} {"train_loss": -37.723934173583984, "global_step": 146940, "epoch": 1214} {"train_loss": -36.0719108581543, "global_step": 146941, "epoch": 1214} {"train_loss": -37.488441467285156, "global_step": 146942, "epoch": 1214} {"train_loss": -38.449623107910156, "global_step": 146943, "epoch": 1214} {"train_loss": -39.13432312011719, "global_step": 146944, "epoch": 1214} {"train_loss": -39.92932891845703, "global_step": 146945, "epoch": 1214} {"train_loss": -39.34320831298828, "global_step": 146946, "epoch": 1214} {"train_loss": -39.30915451049805, "global_step": 146947, "epoch": 1214} {"train_loss": -40.12139892578125, "global_step": 146948, "epoch": 1214} {"train_loss": -38.59824752807617, "global_step": 146949, "epoch": 1214} {"train_loss": -39.15147399902344, "global_step": 146950, "epoch": 1214} {"train_loss": -39.953670501708984, "global_step": 146951, "epoch": 1214} {"train_loss": -39.93190383911133, "global_step": 146952, "epoch": 1214} {"train_loss": -38.732906341552734, "global_step": 146953, "epoch": 1214} {"train_loss": -39.60694122314453, "global_step": 146954, "epoch": 1214} {"train_loss": -39.91068649291992, "global_step": 146955, "epoch": 1214} {"train_loss": -39.54436111450195, "global_step": 146956, "epoch": 1214} {"train_loss": -39.77847671508789, "global_step": 146957, "epoch": 1214} {"train_loss": -40.20233917236328, "global_step": 146958, "epoch": 1214} {"train_loss": -40.27933883666992, "global_step": 146959, "epoch": 1214} {"train_loss": -39.8761100769043, "global_step": 146960, "epoch": 1214} {"train_loss": -39.625892639160156, "global_step": 146961, "epoch": 1214} {"train_loss": -39.85493850708008, "global_step": 146962, "epoch": 1214} {"train_loss": -40.68447494506836, "global_step": 146963, "epoch": 1214} {"train_loss": -40.089229583740234, "global_step": 146964, "epoch": 1214} {"train_loss": -40.26182174682617, "global_step": 146965, "epoch": 1214} {"train_loss": -40.62427520751953, "global_step": 146966, "epoch": 1214} {"train_loss": -40.04628372192383, "global_step": 146967, "epoch": 1214} {"train_loss": -40.31425094604492, "global_step": 146968, "epoch": 1214} {"train_loss": -40.57711410522461, "global_step": 146969, "epoch": 1214} {"train_loss": -40.18715286254883, "global_step": 146970, "epoch": 1214} {"train_loss": -40.592552185058594, "global_step": 146971, "epoch": 1214} {"train_loss": -41.037193298339844, "global_step": 146972, "epoch": 1214} {"train_loss": -40.9694709777832, "global_step": 146973, "epoch": 1214} {"train_loss": -40.91123962402344, "global_step": 146974, "epoch": 1214} {"train_loss": -40.71368408203125, "global_step": 146975, "epoch": 1214} {"train_loss": -40.385738372802734, "global_step": 146976, "epoch": 1214} {"train_loss": -40.41650390625, "global_step": 146977, "epoch": 1214} {"train_loss": -40.05828094482422, "global_step": 146978, "epoch": 1214} {"train_loss": -40.49172592163086, "global_step": 146979, "epoch": 1214} {"train_loss": -40.284690856933594, "global_step": 146980, "epoch": 1214} {"train_loss": -40.77002716064453, "global_step": 146981, "epoch": 1214} {"train_loss": -41.09812545776367, "global_step": 146982, "epoch": 1214} {"train_loss": -40.81101608276367, "global_step": 146983, "epoch": 1214} {"train_loss": -41.177398681640625, "global_step": 146984, "epoch": 1214} {"train_loss": -40.57267379760742, "global_step": 146985, "epoch": 1214} {"train_loss": -40.641639709472656, "global_step": 146986, "epoch": 1214} {"train_loss": -40.40793991088867, "global_step": 146987, "epoch": 1214} {"train_loss": -40.56415939331055, "global_step": 146988, "epoch": 1214} {"train_loss": -40.858497619628906, "global_step": 146989, "epoch": 1214} {"train_loss": -40.0624885559082, "global_step": 146990, "epoch": 1214} {"train_loss": -40.92279815673828, "global_step": 146991, "epoch": 1214} {"train_loss": -40.65421676635742, "global_step": 146992, "epoch": 1214} {"train_loss": -40.65610885620117, "global_step": 146993, "epoch": 1214} {"train_loss": -40.568397521972656, "global_step": 146994, "epoch": 1214} {"train_loss": -40.455230712890625, "global_step": 146995, "epoch": 1214} {"train_loss": -40.44200134277344, "global_step": 146996, "epoch": 1214} {"train_loss": -40.39493942260742, "global_step": 146997, "epoch": 1214} {"train_loss": -40.819801330566406, "global_step": 146998, "epoch": 1214} {"train_loss": -39.93175506591797, "global_step": 146999, "epoch": 1214} {"train_loss": -39.09474563598633, "global_step": 147000, "epoch": 1214} {"train_loss": -40.71731948852539, "global_step": 147001, "epoch": 1214} {"train_loss": -39.17426681518555, "global_step": 147002, "epoch": 1214} {"train_loss": -40.522281646728516, "global_step": 147003, "epoch": 1214} {"train_loss": -40.56223678588867, "global_step": 147004, "epoch": 1214} {"train_loss": -38.78311538696289, "global_step": 147005, "epoch": 1214} {"train_loss": -37.84382247924805, "global_step": 147006, "epoch": 1214} {"train_loss": -38.766475677490234, "global_step": 147007, "epoch": 1214} {"train_loss": -39.09600830078125, "global_step": 147008, "epoch": 1214} {"train_loss": -40.15769958496094, "global_step": 147009, "epoch": 1214} {"train_loss": -40.07183837890625, "global_step": 147010, "epoch": 1214} {"train_loss": -38.39575958251953, "global_step": 147011, "epoch": 1214} {"train_loss": -38.9166374206543, "global_step": 147012, "epoch": 1214} {"train_loss": -40.60868453979492, "global_step": 147013, "epoch": 1214} {"train_loss": -39.90357886070062, "global_step": 147014, "epoch": 1214, "val_loss": 2607808.75} {"train_loss": -39.82121276855469, "global_step": 147015, "epoch": 1215} {"train_loss": -39.77959442138672, "global_step": 147016, "epoch": 1215} {"train_loss": -40.219146728515625, "global_step": 147017, "epoch": 1215} {"train_loss": -40.146427154541016, "global_step": 147018, "epoch": 1215} {"train_loss": -38.96962356567383, "global_step": 147019, "epoch": 1215} {"train_loss": -38.85367965698242, "global_step": 147020, "epoch": 1215} {"train_loss": -39.287452697753906, "global_step": 147021, "epoch": 1215} {"train_loss": -40.548954010009766, "global_step": 147022, "epoch": 1215} {"train_loss": -39.99799346923828, "global_step": 147023, "epoch": 1215} {"train_loss": -38.943111419677734, "global_step": 147024, "epoch": 1215} {"train_loss": -37.9880256652832, "global_step": 147025, "epoch": 1215} {"train_loss": -39.5786247253418, "global_step": 147026, "epoch": 1215} {"train_loss": -40.658531188964844, "global_step": 147027, "epoch": 1215} {"train_loss": -39.44221878051758, "global_step": 147028, "epoch": 1215} {"train_loss": -38.16923141479492, "global_step": 147029, "epoch": 1215} {"train_loss": -38.42296600341797, "global_step": 147030, "epoch": 1215} {"train_loss": -39.6831169128418, "global_step": 147031, "epoch": 1215} {"train_loss": -39.56509017944336, "global_step": 147032, "epoch": 1215} {"train_loss": -36.91132736206055, "global_step": 147033, "epoch": 1215} {"train_loss": -37.89736557006836, "global_step": 147034, "epoch": 1215} {"train_loss": -38.8918571472168, "global_step": 147035, "epoch": 1215} {"train_loss": -39.4443359375, "global_step": 147036, "epoch": 1215} {"train_loss": -39.6373291015625, "global_step": 147037, "epoch": 1215} {"train_loss": -37.59328842163086, "global_step": 147038, "epoch": 1215} {"train_loss": -38.014766693115234, "global_step": 147039, "epoch": 1215} {"train_loss": -39.20669937133789, "global_step": 147040, "epoch": 1215} {"train_loss": -35.3627815246582, "global_step": 147041, "epoch": 1215} {"train_loss": -37.62370300292969, "global_step": 147042, "epoch": 1215} {"train_loss": -38.35879135131836, "global_step": 147043, "epoch": 1215} {"train_loss": -38.420711517333984, "global_step": 147044, "epoch": 1215} {"train_loss": -37.81594467163086, "global_step": 147045, "epoch": 1215} {"train_loss": -38.91356658935547, "global_step": 147046, "epoch": 1215} {"train_loss": -39.35891342163086, "global_step": 147047, "epoch": 1215} {"train_loss": -36.577510833740234, "global_step": 147048, "epoch": 1215} {"train_loss": -38.97705078125, "global_step": 147049, "epoch": 1215} {"train_loss": -39.45512771606445, "global_step": 147050, "epoch": 1215} {"train_loss": -39.178489685058594, "global_step": 147051, "epoch": 1215} {"train_loss": -36.0095329284668, "global_step": 147052, "epoch": 1215} {"train_loss": -38.0343017578125, "global_step": 147053, "epoch": 1215} {"train_loss": -38.25862503051758, "global_step": 147054, "epoch": 1215} {"train_loss": -39.1724967956543, "global_step": 147055, "epoch": 1215} {"train_loss": -38.4765739440918, "global_step": 147056, "epoch": 1215} {"train_loss": -38.6173210144043, "global_step": 147057, "epoch": 1215} {"train_loss": -38.25615310668945, "global_step": 147058, "epoch": 1215} {"train_loss": -39.21161651611328, "global_step": 147059, "epoch": 1215} {"train_loss": -39.161800384521484, "global_step": 147060, "epoch": 1215} {"train_loss": -38.497413635253906, "global_step": 147061, "epoch": 1215} {"train_loss": -39.625640869140625, "global_step": 147062, "epoch": 1215} {"train_loss": -39.48201370239258, "global_step": 147063, "epoch": 1215} {"train_loss": -37.9199333190918, "global_step": 147064, "epoch": 1215} {"train_loss": -38.13237380981445, "global_step": 147065, "epoch": 1215} {"train_loss": -38.872467041015625, "global_step": 147066, "epoch": 1215} {"train_loss": -38.106361389160156, "global_step": 147067, "epoch": 1215} {"train_loss": -30.896682739257812, "global_step": 147068, "epoch": 1215} {"train_loss": -36.0386962890625, "global_step": 147069, "epoch": 1215} {"train_loss": -37.273868560791016, "global_step": 147070, "epoch": 1215} {"train_loss": -37.69984817504883, "global_step": 147071, "epoch": 1215} {"train_loss": -38.82589340209961, "global_step": 147072, "epoch": 1215} {"train_loss": -37.82509994506836, "global_step": 147073, "epoch": 1215} {"train_loss": -37.82405471801758, "global_step": 147074, "epoch": 1215} {"train_loss": -38.22597885131836, "global_step": 147075, "epoch": 1215} {"train_loss": -37.21086502075195, "global_step": 147076, "epoch": 1215} {"train_loss": -38.92301559448242, "global_step": 147077, "epoch": 1215} {"train_loss": -39.023128509521484, "global_step": 147078, "epoch": 1215} {"train_loss": -35.89537048339844, "global_step": 147079, "epoch": 1215} {"train_loss": -38.48615264892578, "global_step": 147080, "epoch": 1215} {"train_loss": -37.17131423950195, "global_step": 147081, "epoch": 1215} {"train_loss": -39.38500213623047, "global_step": 147082, "epoch": 1215} {"train_loss": -38.822120666503906, "global_step": 147083, "epoch": 1215} {"train_loss": -39.504547119140625, "global_step": 147084, "epoch": 1215} {"train_loss": -39.318458557128906, "global_step": 147085, "epoch": 1215} {"train_loss": -39.72968673706055, "global_step": 147086, "epoch": 1215} {"train_loss": -39.61531448364258, "global_step": 147087, "epoch": 1215} {"train_loss": -39.91304016113281, "global_step": 147088, "epoch": 1215} {"train_loss": -39.94765853881836, "global_step": 147089, "epoch": 1215} {"train_loss": -39.74489212036133, "global_step": 147090, "epoch": 1215} {"train_loss": -40.05036544799805, "global_step": 147091, "epoch": 1215} {"train_loss": -39.61652755737305, "global_step": 147092, "epoch": 1215} {"train_loss": -38.75026321411133, "global_step": 147093, "epoch": 1215} {"train_loss": -39.36867904663086, "global_step": 147094, "epoch": 1215} {"train_loss": -39.98201370239258, "global_step": 147095, "epoch": 1215} {"train_loss": -39.7689094543457, "global_step": 147096, "epoch": 1215} {"train_loss": -40.03633499145508, "global_step": 147097, "epoch": 1215} {"train_loss": -40.10992431640625, "global_step": 147098, "epoch": 1215} {"train_loss": -37.4954833984375, "global_step": 147099, "epoch": 1215} {"train_loss": -40.05323028564453, "global_step": 147100, "epoch": 1215} {"train_loss": -40.04741287231445, "global_step": 147101, "epoch": 1215} {"train_loss": -39.591148376464844, "global_step": 147102, "epoch": 1215} {"train_loss": -39.37108612060547, "global_step": 147103, "epoch": 1215} {"train_loss": -39.707454681396484, "global_step": 147104, "epoch": 1215} {"train_loss": -39.247413635253906, "global_step": 147105, "epoch": 1215} {"train_loss": -37.03168869018555, "global_step": 147106, "epoch": 1215} {"train_loss": -40.298583984375, "global_step": 147107, "epoch": 1215} {"train_loss": -40.40278244018555, "global_step": 147108, "epoch": 1215} {"train_loss": -36.1602897644043, "global_step": 147109, "epoch": 1215} {"train_loss": -39.861854553222656, "global_step": 147110, "epoch": 1215} {"train_loss": -40.49294662475586, "global_step": 147111, "epoch": 1215} {"train_loss": -36.99580764770508, "global_step": 147112, "epoch": 1215} {"train_loss": -37.45650863647461, "global_step": 147113, "epoch": 1215} {"train_loss": -40.56143569946289, "global_step": 147114, "epoch": 1215} {"train_loss": -39.26571273803711, "global_step": 147115, "epoch": 1215} {"train_loss": -38.932342529296875, "global_step": 147116, "epoch": 1215} {"train_loss": -40.1748161315918, "global_step": 147117, "epoch": 1215} {"train_loss": -39.061893463134766, "global_step": 147118, "epoch": 1215} {"train_loss": -37.59840774536133, "global_step": 147119, "epoch": 1215} {"train_loss": -38.223854064941406, "global_step": 147120, "epoch": 1215} {"train_loss": -35.201499938964844, "global_step": 147121, "epoch": 1215} {"train_loss": -35.91706466674805, "global_step": 147122, "epoch": 1215} {"train_loss": -37.80896759033203, "global_step": 147123, "epoch": 1215} {"train_loss": -39.32094192504883, "global_step": 147124, "epoch": 1215} {"train_loss": -38.263771057128906, "global_step": 147125, "epoch": 1215} {"train_loss": -38.83332061767578, "global_step": 147126, "epoch": 1215} {"train_loss": -39.83449172973633, "global_step": 147127, "epoch": 1215} {"train_loss": -39.2323112487793, "global_step": 147128, "epoch": 1215} {"train_loss": -39.7348747253418, "global_step": 147129, "epoch": 1215} {"train_loss": -38.73933029174805, "global_step": 147130, "epoch": 1215} {"train_loss": -37.245704650878906, "global_step": 147131, "epoch": 1215} {"train_loss": -38.9145393371582, "global_step": 147132, "epoch": 1215} {"train_loss": -39.91746139526367, "global_step": 147133, "epoch": 1215} {"train_loss": -39.178733825683594, "global_step": 147134, "epoch": 1215} {"train_loss": -38.70066732611538, "global_step": 147135, "epoch": 1215, "val_loss": 2599181.75} {"train_loss": -38.965641021728516, "global_step": 147136, "epoch": 1216} {"train_loss": -38.43781661987305, "global_step": 147137, "epoch": 1216} {"train_loss": -38.573204040527344, "global_step": 147138, "epoch": 1216} {"train_loss": -39.95077133178711, "global_step": 147139, "epoch": 1216} {"train_loss": -38.51387023925781, "global_step": 147140, "epoch": 1216} {"train_loss": -38.54689407348633, "global_step": 147141, "epoch": 1216} {"train_loss": -39.78082275390625, "global_step": 147142, "epoch": 1216} {"train_loss": -39.55327224731445, "global_step": 147143, "epoch": 1216} {"train_loss": -38.316139221191406, "global_step": 147144, "epoch": 1216} {"train_loss": -39.05678939819336, "global_step": 147145, "epoch": 1216} {"train_loss": -38.769832611083984, "global_step": 147146, "epoch": 1216} {"train_loss": -39.037391662597656, "global_step": 147147, "epoch": 1216} {"train_loss": -37.70439529418945, "global_step": 147148, "epoch": 1216} {"train_loss": -38.65274429321289, "global_step": 147149, "epoch": 1216} {"train_loss": -38.89583969116211, "global_step": 147150, "epoch": 1216} {"train_loss": -38.43223190307617, "global_step": 147151, "epoch": 1216} {"train_loss": -38.12900924682617, "global_step": 147152, "epoch": 1216} {"train_loss": -38.97425079345703, "global_step": 147153, "epoch": 1216} {"train_loss": -39.704097747802734, "global_step": 147154, "epoch": 1216} {"train_loss": -39.123870849609375, "global_step": 147155, "epoch": 1216} {"train_loss": -39.192909240722656, "global_step": 147156, "epoch": 1216} {"train_loss": -39.73492431640625, "global_step": 147157, "epoch": 1216} {"train_loss": -39.576419830322266, "global_step": 147158, "epoch": 1216} {"train_loss": -37.91977310180664, "global_step": 147159, "epoch": 1216} {"train_loss": -39.42829132080078, "global_step": 147160, "epoch": 1216} {"train_loss": -39.982574462890625, "global_step": 147161, "epoch": 1216} {"train_loss": -38.48533248901367, "global_step": 147162, "epoch": 1216} {"train_loss": -40.08258819580078, "global_step": 147163, "epoch": 1216} {"train_loss": -39.831787109375, "global_step": 147164, "epoch": 1216} {"train_loss": -39.69416427612305, "global_step": 147165, "epoch": 1216} {"train_loss": -39.6733283996582, "global_step": 147166, "epoch": 1216} {"train_loss": -40.00728988647461, "global_step": 147167, "epoch": 1216} {"train_loss": -39.7802619934082, "global_step": 147168, "epoch": 1216} {"train_loss": -39.2165641784668, "global_step": 147169, "epoch": 1216} {"train_loss": -39.85282897949219, "global_step": 147170, "epoch": 1216} {"train_loss": -38.526973724365234, "global_step": 147171, "epoch": 1216} {"train_loss": -39.0745849609375, "global_step": 147172, "epoch": 1216} {"train_loss": -39.398250579833984, "global_step": 147173, "epoch": 1216} {"train_loss": -38.81632614135742, "global_step": 147174, "epoch": 1216} {"train_loss": -39.14996337890625, "global_step": 147175, "epoch": 1216} {"train_loss": -38.85812759399414, "global_step": 147176, "epoch": 1216} {"train_loss": -39.640560150146484, "global_step": 147177, "epoch": 1216} {"train_loss": -37.84333038330078, "global_step": 147178, "epoch": 1216} {"train_loss": -39.76204299926758, "global_step": 147179, "epoch": 1216} {"train_loss": -39.05959701538086, "global_step": 147180, "epoch": 1216} {"train_loss": -40.08661651611328, "global_step": 147181, "epoch": 1216} {"train_loss": -39.13513946533203, "global_step": 147182, "epoch": 1216} {"train_loss": -39.4661979675293, "global_step": 147183, "epoch": 1216} {"train_loss": -38.744140625, "global_step": 147184, "epoch": 1216} {"train_loss": -38.9520149230957, "global_step": 147185, "epoch": 1216} {"train_loss": -38.74833679199219, "global_step": 147186, "epoch": 1216} {"train_loss": -40.76335525512695, "global_step": 147187, "epoch": 1216} {"train_loss": -39.64498519897461, "global_step": 147188, "epoch": 1216} {"train_loss": -38.24172592163086, "global_step": 147189, "epoch": 1216} {"train_loss": -39.87016296386719, "global_step": 147190, "epoch": 1216} {"train_loss": -38.17302703857422, "global_step": 147191, "epoch": 1216} {"train_loss": -40.03007888793945, "global_step": 147192, "epoch": 1216} {"train_loss": -39.080020904541016, "global_step": 147193, "epoch": 1216} {"train_loss": -40.50661849975586, "global_step": 147194, "epoch": 1216} {"train_loss": -39.33041000366211, "global_step": 147195, "epoch": 1216} {"train_loss": -39.682769775390625, "global_step": 147196, "epoch": 1216} {"train_loss": -38.36668014526367, "global_step": 147197, "epoch": 1216} {"train_loss": -39.83339309692383, "global_step": 147198, "epoch": 1216} {"train_loss": -40.118953704833984, "global_step": 147199, "epoch": 1216} {"train_loss": -39.15165328979492, "global_step": 147200, "epoch": 1216} {"train_loss": -36.582550048828125, "global_step": 147201, "epoch": 1216} {"train_loss": -37.31589889526367, "global_step": 147202, "epoch": 1216} {"train_loss": -38.280426025390625, "global_step": 147203, "epoch": 1216} {"train_loss": -39.988460540771484, "global_step": 147204, "epoch": 1216} {"train_loss": -39.710811614990234, "global_step": 147205, "epoch": 1216} {"train_loss": -38.249324798583984, "global_step": 147206, "epoch": 1216} {"train_loss": -39.01935577392578, "global_step": 147207, "epoch": 1216} {"train_loss": -38.96247863769531, "global_step": 147208, "epoch": 1216} {"train_loss": -39.70612335205078, "global_step": 147209, "epoch": 1216} {"train_loss": -40.310184478759766, "global_step": 147210, "epoch": 1216} {"train_loss": -38.94247055053711, "global_step": 147211, "epoch": 1216} {"train_loss": -37.371803283691406, "global_step": 147212, "epoch": 1216} {"train_loss": -35.08888244628906, "global_step": 147213, "epoch": 1216} {"train_loss": -39.6632194519043, "global_step": 147214, "epoch": 1216} {"train_loss": -38.077877044677734, "global_step": 147215, "epoch": 1216} {"train_loss": -36.122047424316406, "global_step": 147216, "epoch": 1216} {"train_loss": -39.92473220825195, "global_step": 147217, "epoch": 1216} {"train_loss": -37.2495002746582, "global_step": 147218, "epoch": 1216} {"train_loss": -36.72188186645508, "global_step": 147219, "epoch": 1216} {"train_loss": -39.4227409362793, "global_step": 147220, "epoch": 1216} {"train_loss": -39.67637634277344, "global_step": 147221, "epoch": 1216} {"train_loss": -38.81193542480469, "global_step": 147222, "epoch": 1216} {"train_loss": -39.8058967590332, "global_step": 147223, "epoch": 1216} {"train_loss": -40.08456802368164, "global_step": 147224, "epoch": 1216} {"train_loss": -39.86177444458008, "global_step": 147225, "epoch": 1216} {"train_loss": -39.748226165771484, "global_step": 147226, "epoch": 1216} {"train_loss": -40.42742919921875, "global_step": 147227, "epoch": 1216} {"train_loss": -40.01129913330078, "global_step": 147228, "epoch": 1216} {"train_loss": -39.667144775390625, "global_step": 147229, "epoch": 1216} {"train_loss": -39.4930305480957, "global_step": 147230, "epoch": 1216} {"train_loss": -39.66726303100586, "global_step": 147231, "epoch": 1216} {"train_loss": -39.86695098876953, "global_step": 147232, "epoch": 1216} {"train_loss": -39.782020568847656, "global_step": 147233, "epoch": 1216} {"train_loss": -39.890438079833984, "global_step": 147234, "epoch": 1216} {"train_loss": -40.51874542236328, "global_step": 147235, "epoch": 1216} {"train_loss": -40.1430549621582, "global_step": 147236, "epoch": 1216} {"train_loss": -40.05061340332031, "global_step": 147237, "epoch": 1216} {"train_loss": -40.48586654663086, "global_step": 147238, "epoch": 1216} {"train_loss": -40.28654861450195, "global_step": 147239, "epoch": 1216} {"train_loss": -39.8051643371582, "global_step": 147240, "epoch": 1216} {"train_loss": -40.28957748413086, "global_step": 147241, "epoch": 1216} {"train_loss": -40.137367248535156, "global_step": 147242, "epoch": 1216} {"train_loss": -40.534122467041016, "global_step": 147243, "epoch": 1216} {"train_loss": -39.05553436279297, "global_step": 147244, "epoch": 1216} {"train_loss": -40.50674057006836, "global_step": 147245, "epoch": 1216} {"train_loss": -40.40174102783203, "global_step": 147246, "epoch": 1216} {"train_loss": -40.762210845947266, "global_step": 147247, "epoch": 1216} {"train_loss": -40.88593673706055, "global_step": 147248, "epoch": 1216} {"train_loss": -40.6271858215332, "global_step": 147249, "epoch": 1216} {"train_loss": -40.62034225463867, "global_step": 147250, "epoch": 1216} {"train_loss": -40.016334533691406, "global_step": 147251, "epoch": 1216} {"train_loss": -40.23934555053711, "global_step": 147252, "epoch": 1216} {"train_loss": -40.10103988647461, "global_step": 147253, "epoch": 1216} {"train_loss": -40.8968391418457, "global_step": 147254, "epoch": 1216} {"train_loss": -40.17362594604492, "global_step": 147255, "epoch": 1216} {"train_loss": -39.320583879455064, "global_step": 147256, "epoch": 1216, "val_loss": 2646625.25} {"train_loss": -39.79161834716797, "global_step": 147257, "epoch": 1217} {"train_loss": -41.14400863647461, "global_step": 147258, "epoch": 1217} {"train_loss": -40.005916595458984, "global_step": 147259, "epoch": 1217} {"train_loss": -40.4159049987793, "global_step": 147260, "epoch": 1217} {"train_loss": -40.422607421875, "global_step": 147261, "epoch": 1217} {"train_loss": -40.38572311401367, "global_step": 147262, "epoch": 1217} {"train_loss": -40.77676010131836, "global_step": 147263, "epoch": 1217} {"train_loss": -40.58160400390625, "global_step": 147264, "epoch": 1217} {"train_loss": -40.245689392089844, "global_step": 147265, "epoch": 1217} {"train_loss": -40.74798583984375, "global_step": 147266, "epoch": 1217} {"train_loss": -40.7338752746582, "global_step": 147267, "epoch": 1217} {"train_loss": -40.6822395324707, "global_step": 147268, "epoch": 1217} {"train_loss": -41.39002227783203, "global_step": 147269, "epoch": 1217} {"train_loss": -40.5244140625, "global_step": 147270, "epoch": 1217} {"train_loss": -40.74833679199219, "global_step": 147271, "epoch": 1217} {"train_loss": -40.82049560546875, "global_step": 147272, "epoch": 1217} {"train_loss": -40.87940216064453, "global_step": 147273, "epoch": 1217} {"train_loss": -40.52912139892578, "global_step": 147274, "epoch": 1217} {"train_loss": -40.95302200317383, "global_step": 147275, "epoch": 1217} {"train_loss": -41.08749008178711, "global_step": 147276, "epoch": 1217} {"train_loss": -40.95547103881836, "global_step": 147277, "epoch": 1217} {"train_loss": -41.0377311706543, "global_step": 147278, "epoch": 1217} {"train_loss": -40.39352035522461, "global_step": 147279, "epoch": 1217} {"train_loss": -40.96001052856445, "global_step": 147280, "epoch": 1217} {"train_loss": -39.947174072265625, "global_step": 147281, "epoch": 1217} {"train_loss": -39.065277099609375, "global_step": 147282, "epoch": 1217} {"train_loss": -38.15678024291992, "global_step": 147283, "epoch": 1217} {"train_loss": -30.694372177124023, "global_step": 147284, "epoch": 1217} {"train_loss": -18.540620803833008, "global_step": 147285, "epoch": 1217} {"train_loss": -12.9677734375, "global_step": 147286, "epoch": 1217} {"train_loss": -33.351356506347656, "global_step": 147287, "epoch": 1217} {"train_loss": -38.21189498901367, "global_step": 147288, "epoch": 1217} {"train_loss": -28.578784942626953, "global_step": 147289, "epoch": 1217} {"train_loss": -40.077674865722656, "global_step": 147290, "epoch": 1217} {"train_loss": -31.106054306030273, "global_step": 147291, "epoch": 1217} {"train_loss": -35.60498809814453, "global_step": 147292, "epoch": 1217} {"train_loss": -32.52878189086914, "global_step": 147293, "epoch": 1217} {"train_loss": -32.72920608520508, "global_step": 147294, "epoch": 1217} {"train_loss": -35.24452590942383, "global_step": 147295, "epoch": 1217} {"train_loss": -37.571285247802734, "global_step": 147296, "epoch": 1217} {"train_loss": -36.760467529296875, "global_step": 147297, "epoch": 1217} {"train_loss": -39.419551849365234, "global_step": 147298, "epoch": 1217} {"train_loss": -36.91742706298828, "global_step": 147299, "epoch": 1217} {"train_loss": -38.49352264404297, "global_step": 147300, "epoch": 1217} {"train_loss": -38.92584228515625, "global_step": 147301, "epoch": 1217} {"train_loss": -36.637908935546875, "global_step": 147302, "epoch": 1217} {"train_loss": -39.096126556396484, "global_step": 147303, "epoch": 1217} {"train_loss": -38.4583740234375, "global_step": 147304, "epoch": 1217} {"train_loss": -38.952247619628906, "global_step": 147305, "epoch": 1217} {"train_loss": -39.5623893737793, "global_step": 147306, "epoch": 1217} {"train_loss": -39.999420166015625, "global_step": 147307, "epoch": 1217} {"train_loss": -39.22769546508789, "global_step": 147308, "epoch": 1217} {"train_loss": -39.557369232177734, "global_step": 147309, "epoch": 1217} {"train_loss": -39.385494232177734, "global_step": 147310, "epoch": 1217} {"train_loss": -38.80815124511719, "global_step": 147311, "epoch": 1217} {"train_loss": -39.90402603149414, "global_step": 147312, "epoch": 1217} {"train_loss": -39.65658187866211, "global_step": 147313, "epoch": 1217} {"train_loss": -40.218257904052734, "global_step": 147314, "epoch": 1217} {"train_loss": -40.08294677734375, "global_step": 147315, "epoch": 1217} {"train_loss": -40.1762809753418, "global_step": 147316, "epoch": 1217} {"train_loss": -39.75464630126953, "global_step": 147317, "epoch": 1217} {"train_loss": -39.384918212890625, "global_step": 147318, "epoch": 1217} {"train_loss": -40.123409271240234, "global_step": 147319, "epoch": 1217} {"train_loss": -39.852882385253906, "global_step": 147320, "epoch": 1217} {"train_loss": -40.630271911621094, "global_step": 147321, "epoch": 1217} {"train_loss": -40.231353759765625, "global_step": 147322, "epoch": 1217} {"train_loss": -40.25556564331055, "global_step": 147323, "epoch": 1217} {"train_loss": -40.163822174072266, "global_step": 147324, "epoch": 1217} {"train_loss": -40.327789306640625, "global_step": 147325, "epoch": 1217} {"train_loss": -39.951446533203125, "global_step": 147326, "epoch": 1217} {"train_loss": -40.39735794067383, "global_step": 147327, "epoch": 1217} {"train_loss": -40.61650466918945, "global_step": 147328, "epoch": 1217} {"train_loss": -40.55045700073242, "global_step": 147329, "epoch": 1217} {"train_loss": -39.915950775146484, "global_step": 147330, "epoch": 1217} {"train_loss": -40.64182662963867, "global_step": 147331, "epoch": 1217} {"train_loss": -40.326263427734375, "global_step": 147332, "epoch": 1217} {"train_loss": -40.07413101196289, "global_step": 147333, "epoch": 1217} {"train_loss": -40.47182846069336, "global_step": 147334, "epoch": 1217} {"train_loss": -40.524227142333984, "global_step": 147335, "epoch": 1217} {"train_loss": -40.81791305541992, "global_step": 147336, "epoch": 1217} {"train_loss": -40.162837982177734, "global_step": 147337, "epoch": 1217} {"train_loss": -40.72297668457031, "global_step": 147338, "epoch": 1217} {"train_loss": -40.80281448364258, "global_step": 147339, "epoch": 1217} {"train_loss": -40.65560531616211, "global_step": 147340, "epoch": 1217} {"train_loss": -40.60538864135742, "global_step": 147341, "epoch": 1217} {"train_loss": -40.89878845214844, "global_step": 147342, "epoch": 1217} {"train_loss": -41.1554069519043, "global_step": 147343, "epoch": 1217} {"train_loss": -40.9759407043457, "global_step": 147344, "epoch": 1217} {"train_loss": -41.12948226928711, "global_step": 147345, "epoch": 1217} {"train_loss": -40.70762252807617, "global_step": 147346, "epoch": 1217} {"train_loss": -41.02008819580078, "global_step": 147347, "epoch": 1217} {"train_loss": -40.97857666015625, "global_step": 147348, "epoch": 1217} {"train_loss": -40.79876708984375, "global_step": 147349, "epoch": 1217} {"train_loss": -41.201595306396484, "global_step": 147350, "epoch": 1217} {"train_loss": -40.706172943115234, "global_step": 147351, "epoch": 1217} {"train_loss": -40.899757385253906, "global_step": 147352, "epoch": 1217} {"train_loss": -40.761592864990234, "global_step": 147353, "epoch": 1217} {"train_loss": -40.56257629394531, "global_step": 147354, "epoch": 1217} {"train_loss": -41.36260223388672, "global_step": 147355, "epoch": 1217} {"train_loss": -41.393394470214844, "global_step": 147356, "epoch": 1217} {"train_loss": -41.373809814453125, "global_step": 147357, "epoch": 1217} {"train_loss": -40.964298248291016, "global_step": 147358, "epoch": 1217} {"train_loss": -41.3072624206543, "global_step": 147359, "epoch": 1217} {"train_loss": -41.298095703125, "global_step": 147360, "epoch": 1217} {"train_loss": -41.401458740234375, "global_step": 147361, "epoch": 1217} {"train_loss": -40.8375244140625, "global_step": 147362, "epoch": 1217} {"train_loss": -40.7782096862793, "global_step": 147363, "epoch": 1217} {"train_loss": -41.11014175415039, "global_step": 147364, "epoch": 1217} {"train_loss": -40.59708786010742, "global_step": 147365, "epoch": 1217} {"train_loss": -40.34243392944336, "global_step": 147366, "epoch": 1217} {"train_loss": -39.951759338378906, "global_step": 147367, "epoch": 1217} {"train_loss": -39.94841384887695, "global_step": 147368, "epoch": 1217} {"train_loss": -40.056846618652344, "global_step": 147369, "epoch": 1217} {"train_loss": -40.81709671020508, "global_step": 147370, "epoch": 1217} {"train_loss": -40.943992614746094, "global_step": 147371, "epoch": 1217} {"train_loss": -40.965206146240234, "global_step": 147372, "epoch": 1217} {"train_loss": -40.57978057861328, "global_step": 147373, "epoch": 1217} {"train_loss": -40.08887481689453, "global_step": 147374, "epoch": 1217} {"train_loss": -39.72004318237305, "global_step": 147375, "epoch": 1217} {"train_loss": -37.390769958496094, "global_step": 147376, "epoch": 1217} {"train_loss": -39.209458169858316, "global_step": 147377, "epoch": 1217, "val_loss": 2602675.25} {"train_loss": -19.290775299072266, "global_step": 147378, "epoch": 1218} {"train_loss": -20.281375885009766, "global_step": 147379, "epoch": 1218} {"train_loss": -36.25692367553711, "global_step": 147380, "epoch": 1218} {"train_loss": -35.10123825073242, "global_step": 147381, "epoch": 1218} {"train_loss": -28.696043014526367, "global_step": 147382, "epoch": 1218} {"train_loss": -31.400836944580078, "global_step": 147383, "epoch": 1218} {"train_loss": -35.42332077026367, "global_step": 147384, "epoch": 1218} {"train_loss": -34.803199768066406, "global_step": 147385, "epoch": 1218} {"train_loss": -36.385066986083984, "global_step": 147386, "epoch": 1218} {"train_loss": -35.97480392456055, "global_step": 147387, "epoch": 1218} {"train_loss": -36.971923828125, "global_step": 147388, "epoch": 1218} {"train_loss": -37.7957763671875, "global_step": 147389, "epoch": 1218} {"train_loss": -37.8734016418457, "global_step": 147390, "epoch": 1218} {"train_loss": -37.94134521484375, "global_step": 147391, "epoch": 1218} {"train_loss": -36.953304290771484, "global_step": 147392, "epoch": 1218} {"train_loss": -37.9676513671875, "global_step": 147393, "epoch": 1218} {"train_loss": -37.71639633178711, "global_step": 147394, "epoch": 1218} {"train_loss": -37.87583541870117, "global_step": 147395, "epoch": 1218} {"train_loss": -38.21633529663086, "global_step": 147396, "epoch": 1218} {"train_loss": -39.268192291259766, "global_step": 147397, "epoch": 1218} {"train_loss": -37.79418182373047, "global_step": 147398, "epoch": 1218} {"train_loss": -38.6115608215332, "global_step": 147399, "epoch": 1218} {"train_loss": -37.8133430480957, "global_step": 147400, "epoch": 1218} {"train_loss": -38.667972564697266, "global_step": 147401, "epoch": 1218} {"train_loss": -37.602813720703125, "global_step": 147402, "epoch": 1218} {"train_loss": -39.34193801879883, "global_step": 147403, "epoch": 1218} {"train_loss": -39.0616340637207, "global_step": 147404, "epoch": 1218} {"train_loss": -37.02778244018555, "global_step": 147405, "epoch": 1218} {"train_loss": -38.6258430480957, "global_step": 147406, "epoch": 1218} {"train_loss": -39.552188873291016, "global_step": 147407, "epoch": 1218} {"train_loss": -38.50886154174805, "global_step": 147408, "epoch": 1218} {"train_loss": -39.52565002441406, "global_step": 147409, "epoch": 1218} {"train_loss": -38.73567581176758, "global_step": 147410, "epoch": 1218} {"train_loss": -39.443603515625, "global_step": 147411, "epoch": 1218} {"train_loss": -38.99612045288086, "global_step": 147412, "epoch": 1218} {"train_loss": -38.9543571472168, "global_step": 147413, "epoch": 1218} {"train_loss": -39.5687255859375, "global_step": 147414, "epoch": 1218} {"train_loss": -38.99696350097656, "global_step": 147415, "epoch": 1218} {"train_loss": -39.41910934448242, "global_step": 147416, "epoch": 1218} {"train_loss": -39.73508071899414, "global_step": 147417, "epoch": 1218} {"train_loss": -39.92829513549805, "global_step": 147418, "epoch": 1218} {"train_loss": -39.396728515625, "global_step": 147419, "epoch": 1218} {"train_loss": -40.18653106689453, "global_step": 147420, "epoch": 1218} {"train_loss": -39.07341384887695, "global_step": 147421, "epoch": 1218} {"train_loss": -39.88776779174805, "global_step": 147422, "epoch": 1218} {"train_loss": -39.84651565551758, "global_step": 147423, "epoch": 1218} {"train_loss": -39.724246978759766, "global_step": 147424, "epoch": 1218} {"train_loss": -39.35345458984375, "global_step": 147425, "epoch": 1218} {"train_loss": -39.4161491394043, "global_step": 147426, "epoch": 1218} {"train_loss": -39.638153076171875, "global_step": 147427, "epoch": 1218} {"train_loss": -38.297550201416016, "global_step": 147428, "epoch": 1218} {"train_loss": -39.23102569580078, "global_step": 147429, "epoch": 1218} {"train_loss": -39.94358444213867, "global_step": 147430, "epoch": 1218} {"train_loss": -39.791908264160156, "global_step": 147431, "epoch": 1218} {"train_loss": -40.38042068481445, "global_step": 147432, "epoch": 1218} {"train_loss": -40.06997299194336, "global_step": 147433, "epoch": 1218} {"train_loss": -40.735633850097656, "global_step": 147434, "epoch": 1218} {"train_loss": -39.82956314086914, "global_step": 147435, "epoch": 1218} {"train_loss": -40.07341384887695, "global_step": 147436, "epoch": 1218} {"train_loss": -39.83769607543945, "global_step": 147437, "epoch": 1218} {"train_loss": -40.50082778930664, "global_step": 147438, "epoch": 1218} {"train_loss": -40.75594711303711, "global_step": 147439, "epoch": 1218} {"train_loss": -40.41827392578125, "global_step": 147440, "epoch": 1218} {"train_loss": -39.91426467895508, "global_step": 147441, "epoch": 1218} {"train_loss": -40.366756439208984, "global_step": 147442, "epoch": 1218} {"train_loss": -41.16117858886719, "global_step": 147443, "epoch": 1218} {"train_loss": -39.87562942504883, "global_step": 147444, "epoch": 1218} {"train_loss": -40.52688217163086, "global_step": 147445, "epoch": 1218} {"train_loss": -40.42207717895508, "global_step": 147446, "epoch": 1218} {"train_loss": -40.600494384765625, "global_step": 147447, "epoch": 1218} {"train_loss": -40.69376754760742, "global_step": 147448, "epoch": 1218} {"train_loss": -39.91671371459961, "global_step": 147449, "epoch": 1218} {"train_loss": -40.773677825927734, "global_step": 147450, "epoch": 1218} {"train_loss": -40.88672637939453, "global_step": 147451, "epoch": 1218} {"train_loss": -40.73043441772461, "global_step": 147452, "epoch": 1218} {"train_loss": -40.848907470703125, "global_step": 147453, "epoch": 1218} {"train_loss": -40.984004974365234, "global_step": 147454, "epoch": 1218} {"train_loss": -41.0142936706543, "global_step": 147455, "epoch": 1218} {"train_loss": -40.69545364379883, "global_step": 147456, "epoch": 1218} {"train_loss": -39.53519058227539, "global_step": 147457, "epoch": 1218} {"train_loss": -40.902381896972656, "global_step": 147458, "epoch": 1218} {"train_loss": -41.0888786315918, "global_step": 147459, "epoch": 1218} {"train_loss": -40.95398712158203, "global_step": 147460, "epoch": 1218} {"train_loss": -40.806209564208984, "global_step": 147461, "epoch": 1218} {"train_loss": -40.936702728271484, "global_step": 147462, "epoch": 1218} {"train_loss": -41.50456619262695, "global_step": 147463, "epoch": 1218} {"train_loss": -40.8973503112793, "global_step": 147464, "epoch": 1218} {"train_loss": -40.885555267333984, "global_step": 147465, "epoch": 1218} {"train_loss": -41.34318161010742, "global_step": 147466, "epoch": 1218} {"train_loss": -40.75634765625, "global_step": 147467, "epoch": 1218} {"train_loss": -41.49605941772461, "global_step": 147468, "epoch": 1218} {"train_loss": -41.170047760009766, "global_step": 147469, "epoch": 1218} {"train_loss": -40.923587799072266, "global_step": 147470, "epoch": 1218} {"train_loss": -41.08320999145508, "global_step": 147471, "epoch": 1218} {"train_loss": -41.3863410949707, "global_step": 147472, "epoch": 1218} {"train_loss": -41.3028564453125, "global_step": 147473, "epoch": 1218} {"train_loss": -40.50551986694336, "global_step": 147474, "epoch": 1218} {"train_loss": -40.09737014770508, "global_step": 147475, "epoch": 1218} {"train_loss": -40.235713958740234, "global_step": 147476, "epoch": 1218} {"train_loss": -40.47520065307617, "global_step": 147477, "epoch": 1218} {"train_loss": -40.74300765991211, "global_step": 147478, "epoch": 1218} {"train_loss": -40.831661224365234, "global_step": 147479, "epoch": 1218} {"train_loss": -41.14109420776367, "global_step": 147480, "epoch": 1218} {"train_loss": -40.970882415771484, "global_step": 147481, "epoch": 1218} {"train_loss": -39.217803955078125, "global_step": 147482, "epoch": 1218} {"train_loss": -40.697235107421875, "global_step": 147483, "epoch": 1218} {"train_loss": -39.682735443115234, "global_step": 147484, "epoch": 1218} {"train_loss": -40.25138473510742, "global_step": 147485, "epoch": 1218} {"train_loss": -40.260433197021484, "global_step": 147486, "epoch": 1218} {"train_loss": -39.704193115234375, "global_step": 147487, "epoch": 1218} {"train_loss": -39.29401779174805, "global_step": 147488, "epoch": 1218} {"train_loss": -40.133026123046875, "global_step": 147489, "epoch": 1218} {"train_loss": -40.15188217163086, "global_step": 147490, "epoch": 1218} {"train_loss": -40.18960189819336, "global_step": 147491, "epoch": 1218} {"train_loss": -40.26759338378906, "global_step": 147492, "epoch": 1218} {"train_loss": -40.78518295288086, "global_step": 147493, "epoch": 1218} {"train_loss": -40.12103271484375, "global_step": 147494, "epoch": 1218} {"train_loss": -40.05713653564453, "global_step": 147495, "epoch": 1218} {"train_loss": -38.712074279785156, "global_step": 147496, "epoch": 1218} {"train_loss": -38.341033935546875, "global_step": 147497, "epoch": 1218} {"train_loss": -39.129946606218326, "global_step": 147498, "epoch": 1218, "val_loss": 2575090.0} {"train_loss": -38.84370803833008, "global_step": 147499, "epoch": 1219} {"train_loss": -40.093502044677734, "global_step": 147500, "epoch": 1219} {"train_loss": -40.32332992553711, "global_step": 147501, "epoch": 1219} {"train_loss": -39.89023971557617, "global_step": 147502, "epoch": 1219} {"train_loss": -40.56466293334961, "global_step": 147503, "epoch": 1219} {"train_loss": -40.72722244262695, "global_step": 147504, "epoch": 1219} {"train_loss": -39.53439712524414, "global_step": 147505, "epoch": 1219} {"train_loss": -38.40779495239258, "global_step": 147506, "epoch": 1219} {"train_loss": -39.5515251159668, "global_step": 147507, "epoch": 1219} {"train_loss": -38.469905853271484, "global_step": 147508, "epoch": 1219} {"train_loss": -36.2060661315918, "global_step": 147509, "epoch": 1219} {"train_loss": -40.58705520629883, "global_step": 147510, "epoch": 1219} {"train_loss": -37.4863395690918, "global_step": 147511, "epoch": 1219} {"train_loss": -40.172935485839844, "global_step": 147512, "epoch": 1219} {"train_loss": -35.621273040771484, "global_step": 147513, "epoch": 1219} {"train_loss": -38.44171905517578, "global_step": 147514, "epoch": 1219} {"train_loss": -36.346649169921875, "global_step": 147515, "epoch": 1219} {"train_loss": -36.651424407958984, "global_step": 147516, "epoch": 1219} {"train_loss": -39.222286224365234, "global_step": 147517, "epoch": 1219} {"train_loss": -38.6952018737793, "global_step": 147518, "epoch": 1219} {"train_loss": -37.27882385253906, "global_step": 147519, "epoch": 1219} {"train_loss": -38.09203338623047, "global_step": 147520, "epoch": 1219} {"train_loss": -38.065155029296875, "global_step": 147521, "epoch": 1219} {"train_loss": -39.47892379760742, "global_step": 147522, "epoch": 1219} {"train_loss": -38.759124755859375, "global_step": 147523, "epoch": 1219} {"train_loss": -37.89399337768555, "global_step": 147524, "epoch": 1219} {"train_loss": -39.27387237548828, "global_step": 147525, "epoch": 1219} {"train_loss": -39.376136779785156, "global_step": 147526, "epoch": 1219} {"train_loss": -38.94002914428711, "global_step": 147527, "epoch": 1219} {"train_loss": -36.87384796142578, "global_step": 147528, "epoch": 1219} {"train_loss": -36.89267349243164, "global_step": 147529, "epoch": 1219} {"train_loss": -39.777992248535156, "global_step": 147530, "epoch": 1219} {"train_loss": -35.79197311401367, "global_step": 147531, "epoch": 1219} {"train_loss": -27.760557174682617, "global_step": 147532, "epoch": 1219} {"train_loss": -36.04417037963867, "global_step": 147533, "epoch": 1219} {"train_loss": -39.37004852294922, "global_step": 147534, "epoch": 1219} {"train_loss": -34.33176803588867, "global_step": 147535, "epoch": 1219} {"train_loss": -38.16600036621094, "global_step": 147536, "epoch": 1219} {"train_loss": -38.01588821411133, "global_step": 147537, "epoch": 1219} {"train_loss": -38.15714645385742, "global_step": 147538, "epoch": 1219} {"train_loss": -39.31858444213867, "global_step": 147539, "epoch": 1219} {"train_loss": -38.4367561340332, "global_step": 147540, "epoch": 1219} {"train_loss": -39.98031234741211, "global_step": 147541, "epoch": 1219} {"train_loss": -39.49766159057617, "global_step": 147542, "epoch": 1219} {"train_loss": -39.943450927734375, "global_step": 147543, "epoch": 1219} {"train_loss": -39.54490280151367, "global_step": 147544, "epoch": 1219} {"train_loss": -39.97135543823242, "global_step": 147545, "epoch": 1219} {"train_loss": -40.39680099487305, "global_step": 147546, "epoch": 1219} {"train_loss": -40.21174621582031, "global_step": 147547, "epoch": 1219} {"train_loss": -40.170654296875, "global_step": 147548, "epoch": 1219} {"train_loss": -40.195621490478516, "global_step": 147549, "epoch": 1219} {"train_loss": -39.71334457397461, "global_step": 147550, "epoch": 1219} {"train_loss": -40.72076416015625, "global_step": 147551, "epoch": 1219} {"train_loss": -39.81688690185547, "global_step": 147552, "epoch": 1219} {"train_loss": -40.27010726928711, "global_step": 147553, "epoch": 1219} {"train_loss": -40.69265365600586, "global_step": 147554, "epoch": 1219} {"train_loss": -40.887474060058594, "global_step": 147555, "epoch": 1219} {"train_loss": -39.791908264160156, "global_step": 147556, "epoch": 1219} {"train_loss": -40.48112869262695, "global_step": 147557, "epoch": 1219} {"train_loss": -40.27546310424805, "global_step": 147558, "epoch": 1219} {"train_loss": -40.47239685058594, "global_step": 147559, "epoch": 1219} {"train_loss": -40.60673904418945, "global_step": 147560, "epoch": 1219} {"train_loss": -40.439022064208984, "global_step": 147561, "epoch": 1219} {"train_loss": -41.03828048706055, "global_step": 147562, "epoch": 1219} {"train_loss": -40.865753173828125, "global_step": 147563, "epoch": 1219} {"train_loss": -40.50666046142578, "global_step": 147564, "epoch": 1219} {"train_loss": -40.15874481201172, "global_step": 147565, "epoch": 1219} {"train_loss": -40.552547454833984, "global_step": 147566, "epoch": 1219} {"train_loss": -40.51597213745117, "global_step": 147567, "epoch": 1219} {"train_loss": -40.02980422973633, "global_step": 147568, "epoch": 1219} {"train_loss": -41.03795623779297, "global_step": 147569, "epoch": 1219} {"train_loss": -40.38703536987305, "global_step": 147570, "epoch": 1219} {"train_loss": -40.8572998046875, "global_step": 147571, "epoch": 1219} {"train_loss": -40.953556060791016, "global_step": 147572, "epoch": 1219} {"train_loss": -40.42845916748047, "global_step": 147573, "epoch": 1219} {"train_loss": -40.96072006225586, "global_step": 147574, "epoch": 1219} {"train_loss": -40.413516998291016, "global_step": 147575, "epoch": 1219} {"train_loss": -40.97095489501953, "global_step": 147576, "epoch": 1219} {"train_loss": -40.230106353759766, "global_step": 147577, "epoch": 1219} {"train_loss": -40.636173248291016, "global_step": 147578, "epoch": 1219} {"train_loss": -40.746368408203125, "global_step": 147579, "epoch": 1219} {"train_loss": -40.503822326660156, "global_step": 147580, "epoch": 1219} {"train_loss": -40.963558197021484, "global_step": 147581, "epoch": 1219} {"train_loss": -39.94013214111328, "global_step": 147582, "epoch": 1219} {"train_loss": -40.998046875, "global_step": 147583, "epoch": 1219} {"train_loss": -40.814884185791016, "global_step": 147584, "epoch": 1219} {"train_loss": -40.61381149291992, "global_step": 147585, "epoch": 1219} {"train_loss": -40.68803024291992, "global_step": 147586, "epoch": 1219} {"train_loss": -40.548805236816406, "global_step": 147587, "epoch": 1219} {"train_loss": -40.57258987426758, "global_step": 147588, "epoch": 1219} {"train_loss": -41.38962173461914, "global_step": 147589, "epoch": 1219} {"train_loss": -39.98008728027344, "global_step": 147590, "epoch": 1219} {"train_loss": -40.39521026611328, "global_step": 147591, "epoch": 1219} {"train_loss": -41.12486267089844, "global_step": 147592, "epoch": 1219} {"train_loss": -40.66006088256836, "global_step": 147593, "epoch": 1219} {"train_loss": -40.86196517944336, "global_step": 147594, "epoch": 1219} {"train_loss": -40.14377975463867, "global_step": 147595, "epoch": 1219} {"train_loss": -40.382442474365234, "global_step": 147596, "epoch": 1219} {"train_loss": -40.844173431396484, "global_step": 147597, "epoch": 1219} {"train_loss": -40.64728927612305, "global_step": 147598, "epoch": 1219} {"train_loss": -38.84544372558594, "global_step": 147599, "epoch": 1219} {"train_loss": -40.33687210083008, "global_step": 147600, "epoch": 1219} {"train_loss": -40.4052734375, "global_step": 147601, "epoch": 1219} {"train_loss": -40.64298629760742, "global_step": 147602, "epoch": 1219} {"train_loss": -39.81924057006836, "global_step": 147603, "epoch": 1219} {"train_loss": -39.31086730957031, "global_step": 147604, "epoch": 1219} {"train_loss": -38.8558349609375, "global_step": 147605, "epoch": 1219} {"train_loss": -39.81406021118164, "global_step": 147606, "epoch": 1219} {"train_loss": -39.448699951171875, "global_step": 147607, "epoch": 1219} {"train_loss": -39.155086517333984, "global_step": 147608, "epoch": 1219} {"train_loss": -38.755245208740234, "global_step": 147609, "epoch": 1219} {"train_loss": -39.617767333984375, "global_step": 147610, "epoch": 1219} {"train_loss": -39.6834716796875, "global_step": 147611, "epoch": 1219} {"train_loss": -38.917152404785156, "global_step": 147612, "epoch": 1219} {"train_loss": -37.5267333984375, "global_step": 147613, "epoch": 1219} {"train_loss": -35.40937042236328, "global_step": 147614, "epoch": 1219} {"train_loss": -33.27332305908203, "global_step": 147615, "epoch": 1219} {"train_loss": -33.712066650390625, "global_step": 147616, "epoch": 1219} {"train_loss": -36.3642463684082, "global_step": 147617, "epoch": 1219} {"train_loss": -33.939632415771484, "global_step": 147618, "epoch": 1219} {"train_loss": -39.25509011449893, "global_step": 147619, "epoch": 1219, "val_loss": 2843784.25} {"train_loss": -38.01057052612305, "global_step": 147620, "epoch": 1220} {"train_loss": -36.46470260620117, "global_step": 147621, "epoch": 1220} {"train_loss": -34.182472229003906, "global_step": 147622, "epoch": 1220} {"train_loss": -35.77736282348633, "global_step": 147623, "epoch": 1220} {"train_loss": -37.69041061401367, "global_step": 147624, "epoch": 1220} {"train_loss": -36.63531494140625, "global_step": 147625, "epoch": 1220} {"train_loss": -35.993080139160156, "global_step": 147626, "epoch": 1220} {"train_loss": -36.00046920776367, "global_step": 147627, "epoch": 1220} {"train_loss": -35.608001708984375, "global_step": 147628, "epoch": 1220} {"train_loss": -35.60638427734375, "global_step": 147629, "epoch": 1220} {"train_loss": -38.1873893737793, "global_step": 147630, "epoch": 1220} {"train_loss": -36.888885498046875, "global_step": 147631, "epoch": 1220} {"train_loss": -32.86417770385742, "global_step": 147632, "epoch": 1220} {"train_loss": -39.177833557128906, "global_step": 147633, "epoch": 1220} {"train_loss": -36.6436882019043, "global_step": 147634, "epoch": 1220} {"train_loss": -37.08675765991211, "global_step": 147635, "epoch": 1220} {"train_loss": -38.425758361816406, "global_step": 147636, "epoch": 1220} {"train_loss": -38.37677001953125, "global_step": 147637, "epoch": 1220} {"train_loss": -36.693580627441406, "global_step": 147638, "epoch": 1220} {"train_loss": -37.21165084838867, "global_step": 147639, "epoch": 1220} {"train_loss": -38.84677505493164, "global_step": 147640, "epoch": 1220} {"train_loss": -34.356746673583984, "global_step": 147641, "epoch": 1220} {"train_loss": -36.51007080078125, "global_step": 147642, "epoch": 1220} {"train_loss": -39.120826721191406, "global_step": 147643, "epoch": 1220} {"train_loss": -39.08061599731445, "global_step": 147644, "epoch": 1220} {"train_loss": -39.12761306762695, "global_step": 147645, "epoch": 1220} {"train_loss": -38.54628372192383, "global_step": 147646, "epoch": 1220} {"train_loss": -37.1612663269043, "global_step": 147647, "epoch": 1220} {"train_loss": -37.9322395324707, "global_step": 147648, "epoch": 1220} {"train_loss": -38.2490348815918, "global_step": 147649, "epoch": 1220} {"train_loss": -38.62668991088867, "global_step": 147650, "epoch": 1220} {"train_loss": -39.61780548095703, "global_step": 147651, "epoch": 1220} {"train_loss": -38.512054443359375, "global_step": 147652, "epoch": 1220} {"train_loss": -38.23271560668945, "global_step": 147653, "epoch": 1220} {"train_loss": -38.498294830322266, "global_step": 147654, "epoch": 1220} {"train_loss": -39.22657012939453, "global_step": 147655, "epoch": 1220} {"train_loss": -39.22161865234375, "global_step": 147656, "epoch": 1220} {"train_loss": -39.240203857421875, "global_step": 147657, "epoch": 1220} {"train_loss": -39.77996063232422, "global_step": 147658, "epoch": 1220} {"train_loss": -38.244529724121094, "global_step": 147659, "epoch": 1220} {"train_loss": -39.72624969482422, "global_step": 147660, "epoch": 1220} {"train_loss": -39.515743255615234, "global_step": 147661, "epoch": 1220} {"train_loss": -38.270469665527344, "global_step": 147662, "epoch": 1220} {"train_loss": -38.8881950378418, "global_step": 147663, "epoch": 1220} {"train_loss": -39.65012741088867, "global_step": 147664, "epoch": 1220} {"train_loss": -38.05573654174805, "global_step": 147665, "epoch": 1220} {"train_loss": -38.56938171386719, "global_step": 147666, "epoch": 1220} {"train_loss": -39.48676681518555, "global_step": 147667, "epoch": 1220} {"train_loss": -37.525596618652344, "global_step": 147668, "epoch": 1220} {"train_loss": -39.57123565673828, "global_step": 147669, "epoch": 1220} {"train_loss": -39.92488479614258, "global_step": 147670, "epoch": 1220} {"train_loss": -39.388526916503906, "global_step": 147671, "epoch": 1220} {"train_loss": -39.777549743652344, "global_step": 147672, "epoch": 1220} {"train_loss": -39.06877899169922, "global_step": 147673, "epoch": 1220} {"train_loss": -40.046424865722656, "global_step": 147674, "epoch": 1220} {"train_loss": -40.06953430175781, "global_step": 147675, "epoch": 1220} {"train_loss": -39.81037902832031, "global_step": 147676, "epoch": 1220} {"train_loss": -40.18795394897461, "global_step": 147677, "epoch": 1220} {"train_loss": -39.36323928833008, "global_step": 147678, "epoch": 1220} {"train_loss": -40.325050354003906, "global_step": 147679, "epoch": 1220} {"train_loss": -39.27250289916992, "global_step": 147680, "epoch": 1220} {"train_loss": -40.1866569519043, "global_step": 147681, "epoch": 1220} {"train_loss": -40.562042236328125, "global_step": 147682, "epoch": 1220} {"train_loss": -39.74971008300781, "global_step": 147683, "epoch": 1220} {"train_loss": -40.21659469604492, "global_step": 147684, "epoch": 1220} {"train_loss": -40.375152587890625, "global_step": 147685, "epoch": 1220} {"train_loss": -39.028377532958984, "global_step": 147686, "epoch": 1220} {"train_loss": -40.50458908081055, "global_step": 147687, "epoch": 1220} {"train_loss": -40.280174255371094, "global_step": 147688, "epoch": 1220} {"train_loss": -40.136688232421875, "global_step": 147689, "epoch": 1220} {"train_loss": -39.46120071411133, "global_step": 147690, "epoch": 1220} {"train_loss": -40.16651153564453, "global_step": 147691, "epoch": 1220} {"train_loss": -40.570648193359375, "global_step": 147692, "epoch": 1220} {"train_loss": -40.13398361206055, "global_step": 147693, "epoch": 1220} {"train_loss": -40.41569137573242, "global_step": 147694, "epoch": 1220} {"train_loss": -40.63666915893555, "global_step": 147695, "epoch": 1220} {"train_loss": -40.559852600097656, "global_step": 147696, "epoch": 1220} {"train_loss": -40.69880294799805, "global_step": 147697, "epoch": 1220} {"train_loss": -40.83308792114258, "global_step": 147698, "epoch": 1220} {"train_loss": -40.84414291381836, "global_step": 147699, "epoch": 1220} {"train_loss": -39.89726257324219, "global_step": 147700, "epoch": 1220} {"train_loss": -40.232906341552734, "global_step": 147701, "epoch": 1220} {"train_loss": -40.876678466796875, "global_step": 147702, "epoch": 1220} {"train_loss": -41.16262435913086, "global_step": 147703, "epoch": 1220} {"train_loss": -39.80678939819336, "global_step": 147704, "epoch": 1220} {"train_loss": -40.699256896972656, "global_step": 147705, "epoch": 1220} {"train_loss": -40.97442626953125, "global_step": 147706, "epoch": 1220} {"train_loss": -41.11008834838867, "global_step": 147707, "epoch": 1220} {"train_loss": -40.81720733642578, "global_step": 147708, "epoch": 1220} {"train_loss": -40.002986907958984, "global_step": 147709, "epoch": 1220} {"train_loss": -40.83008575439453, "global_step": 147710, "epoch": 1220} {"train_loss": -41.28742980957031, "global_step": 147711, "epoch": 1220} {"train_loss": -39.7346076965332, "global_step": 147712, "epoch": 1220} {"train_loss": -41.0643196105957, "global_step": 147713, "epoch": 1220} {"train_loss": -40.751583099365234, "global_step": 147714, "epoch": 1220} {"train_loss": -41.06262969970703, "global_step": 147715, "epoch": 1220} {"train_loss": -39.371559143066406, "global_step": 147716, "epoch": 1220} {"train_loss": -40.66273880004883, "global_step": 147717, "epoch": 1220} {"train_loss": -40.572322845458984, "global_step": 147718, "epoch": 1220} {"train_loss": -40.0190315246582, "global_step": 147719, "epoch": 1220} {"train_loss": -40.198604583740234, "global_step": 147720, "epoch": 1220} {"train_loss": -40.761653900146484, "global_step": 147721, "epoch": 1220} {"train_loss": -40.55445098876953, "global_step": 147722, "epoch": 1220} {"train_loss": -39.653297424316406, "global_step": 147723, "epoch": 1220} {"train_loss": -40.977352142333984, "global_step": 147724, "epoch": 1220} {"train_loss": -41.28192138671875, "global_step": 147725, "epoch": 1220} {"train_loss": -40.47198486328125, "global_step": 147726, "epoch": 1220} {"train_loss": -39.8006706237793, "global_step": 147727, "epoch": 1220} {"train_loss": -39.26540756225586, "global_step": 147728, "epoch": 1220} {"train_loss": -36.52643585205078, "global_step": 147729, "epoch": 1220} {"train_loss": -33.9059944152832, "global_step": 147730, "epoch": 1220} {"train_loss": -31.63081169128418, "global_step": 147731, "epoch": 1220} {"train_loss": -26.684354782104492, "global_step": 147732, "epoch": 1220} {"train_loss": -30.1385440826416, "global_step": 147733, "epoch": 1220} {"train_loss": -38.77903747558594, "global_step": 147734, "epoch": 1220} {"train_loss": -37.48139190673828, "global_step": 147735, "epoch": 1220} {"train_loss": -34.03681945800781, "global_step": 147736, "epoch": 1220} {"train_loss": -38.94871139526367, "global_step": 147737, "epoch": 1220} {"train_loss": -36.115291595458984, "global_step": 147738, "epoch": 1220} {"train_loss": -32.602272033691406, "global_step": 147739, "epoch": 1220} {"train_loss": -38.70043593792876, "global_step": 147740, "epoch": 1220, "val_loss": 2467755.25} {"train_loss": -35.907894134521484, "global_step": 147741, "epoch": 1221} {"train_loss": -39.41668701171875, "global_step": 147742, "epoch": 1221} {"train_loss": -36.902809143066406, "global_step": 147743, "epoch": 1221} {"train_loss": -39.16096496582031, "global_step": 147744, "epoch": 1221} {"train_loss": -38.08250045776367, "global_step": 147745, "epoch": 1221} {"train_loss": -39.26044464111328, "global_step": 147746, "epoch": 1221} {"train_loss": -37.807430267333984, "global_step": 147747, "epoch": 1221} {"train_loss": -38.77747344970703, "global_step": 147748, "epoch": 1221} {"train_loss": -38.783321380615234, "global_step": 147749, "epoch": 1221} {"train_loss": -37.13174057006836, "global_step": 147750, "epoch": 1221} {"train_loss": -38.75810623168945, "global_step": 147751, "epoch": 1221} {"train_loss": -38.15472412109375, "global_step": 147752, "epoch": 1221} {"train_loss": -32.73933029174805, "global_step": 147753, "epoch": 1221} {"train_loss": -38.66035842895508, "global_step": 147754, "epoch": 1221} {"train_loss": -37.79326248168945, "global_step": 147755, "epoch": 1221} {"train_loss": -37.517635345458984, "global_step": 147756, "epoch": 1221} {"train_loss": -39.665157318115234, "global_step": 147757, "epoch": 1221} {"train_loss": -35.63895034790039, "global_step": 147758, "epoch": 1221} {"train_loss": -39.11771774291992, "global_step": 147759, "epoch": 1221} {"train_loss": -38.67433166503906, "global_step": 147760, "epoch": 1221} {"train_loss": -38.31972122192383, "global_step": 147761, "epoch": 1221} {"train_loss": -37.41255569458008, "global_step": 147762, "epoch": 1221} {"train_loss": -39.26467514038086, "global_step": 147763, "epoch": 1221} {"train_loss": -39.176307678222656, "global_step": 147764, "epoch": 1221} {"train_loss": -38.18878173828125, "global_step": 147765, "epoch": 1221} {"train_loss": -39.008575439453125, "global_step": 147766, "epoch": 1221} {"train_loss": -38.8856086730957, "global_step": 147767, "epoch": 1221} {"train_loss": -35.5276985168457, "global_step": 147768, "epoch": 1221} {"train_loss": -38.650325775146484, "global_step": 147769, "epoch": 1221} {"train_loss": -38.1072883605957, "global_step": 147770, "epoch": 1221} {"train_loss": -37.704524993896484, "global_step": 147771, "epoch": 1221} {"train_loss": -38.73127365112305, "global_step": 147772, "epoch": 1221} {"train_loss": -39.156246185302734, "global_step": 147773, "epoch": 1221} {"train_loss": -38.82095718383789, "global_step": 147774, "epoch": 1221} {"train_loss": -39.984920501708984, "global_step": 147775, "epoch": 1221} {"train_loss": -37.354156494140625, "global_step": 147776, "epoch": 1221} {"train_loss": -39.171783447265625, "global_step": 147777, "epoch": 1221} {"train_loss": -39.46156311035156, "global_step": 147778, "epoch": 1221} {"train_loss": -39.78914260864258, "global_step": 147779, "epoch": 1221} {"train_loss": -39.73139572143555, "global_step": 147780, "epoch": 1221} {"train_loss": -39.234554290771484, "global_step": 147781, "epoch": 1221} {"train_loss": -39.98391342163086, "global_step": 147782, "epoch": 1221} {"train_loss": -39.93475341796875, "global_step": 147783, "epoch": 1221} {"train_loss": -38.19368362426758, "global_step": 147784, "epoch": 1221} {"train_loss": -39.243690490722656, "global_step": 147785, "epoch": 1221} {"train_loss": -39.06349563598633, "global_step": 147786, "epoch": 1221} {"train_loss": -39.19033432006836, "global_step": 147787, "epoch": 1221} {"train_loss": -39.66976547241211, "global_step": 147788, "epoch": 1221} {"train_loss": -39.56043243408203, "global_step": 147789, "epoch": 1221} {"train_loss": -38.249507904052734, "global_step": 147790, "epoch": 1221} {"train_loss": -40.1628532409668, "global_step": 147791, "epoch": 1221} {"train_loss": -39.67631912231445, "global_step": 147792, "epoch": 1221} {"train_loss": -39.932106018066406, "global_step": 147793, "epoch": 1221} {"train_loss": -40.300838470458984, "global_step": 147794, "epoch": 1221} {"train_loss": -36.02800750732422, "global_step": 147795, "epoch": 1221} {"train_loss": -39.920440673828125, "global_step": 147796, "epoch": 1221} {"train_loss": -39.66973876953125, "global_step": 147797, "epoch": 1221} {"train_loss": -40.352294921875, "global_step": 147798, "epoch": 1221} {"train_loss": -39.77136993408203, "global_step": 147799, "epoch": 1221} {"train_loss": -38.4262809753418, "global_step": 147800, "epoch": 1221} {"train_loss": -40.36985397338867, "global_step": 147801, "epoch": 1221} {"train_loss": -38.727813720703125, "global_step": 147802, "epoch": 1221} {"train_loss": -40.00477981567383, "global_step": 147803, "epoch": 1221} {"train_loss": -40.40202713012695, "global_step": 147804, "epoch": 1221} {"train_loss": -40.210018157958984, "global_step": 147805, "epoch": 1221} {"train_loss": -38.680213928222656, "global_step": 147806, "epoch": 1221} {"train_loss": -39.55841827392578, "global_step": 147807, "epoch": 1221} {"train_loss": -40.01142120361328, "global_step": 147808, "epoch": 1221} {"train_loss": -40.335018157958984, "global_step": 147809, "epoch": 1221} {"train_loss": -39.41969680786133, "global_step": 147810, "epoch": 1221} {"train_loss": -39.38169860839844, "global_step": 147811, "epoch": 1221} {"train_loss": -39.35183334350586, "global_step": 147812, "epoch": 1221} {"train_loss": -39.88682174682617, "global_step": 147813, "epoch": 1221} {"train_loss": -39.7581672668457, "global_step": 147814, "epoch": 1221} {"train_loss": -40.48334503173828, "global_step": 147815, "epoch": 1221} {"train_loss": -40.181575775146484, "global_step": 147816, "epoch": 1221} {"train_loss": -40.275970458984375, "global_step": 147817, "epoch": 1221} {"train_loss": -40.8886604309082, "global_step": 147818, "epoch": 1221} {"train_loss": -40.20461654663086, "global_step": 147819, "epoch": 1221} {"train_loss": -39.989288330078125, "global_step": 147820, "epoch": 1221} {"train_loss": -40.205318450927734, "global_step": 147821, "epoch": 1221} {"train_loss": -39.68342971801758, "global_step": 147822, "epoch": 1221} {"train_loss": -34.317020416259766, "global_step": 147823, "epoch": 1221} {"train_loss": -39.61126708984375, "global_step": 147824, "epoch": 1221} {"train_loss": -40.14700698852539, "global_step": 147825, "epoch": 1221} {"train_loss": -39.56752014160156, "global_step": 147826, "epoch": 1221} {"train_loss": -40.34296798706055, "global_step": 147827, "epoch": 1221} {"train_loss": -40.073848724365234, "global_step": 147828, "epoch": 1221} {"train_loss": -39.56406784057617, "global_step": 147829, "epoch": 1221} {"train_loss": -40.384700775146484, "global_step": 147830, "epoch": 1221} {"train_loss": -40.312931060791016, "global_step": 147831, "epoch": 1221} {"train_loss": -40.21311950683594, "global_step": 147832, "epoch": 1221} {"train_loss": -37.68871307373047, "global_step": 147833, "epoch": 1221} {"train_loss": -38.75947189331055, "global_step": 147834, "epoch": 1221} {"train_loss": -38.96892166137695, "global_step": 147835, "epoch": 1221} {"train_loss": -33.497127532958984, "global_step": 147836, "epoch": 1221} {"train_loss": -39.346534729003906, "global_step": 147837, "epoch": 1221} {"train_loss": -36.97284698486328, "global_step": 147838, "epoch": 1221} {"train_loss": -39.02987289428711, "global_step": 147839, "epoch": 1221} {"train_loss": -38.08667755126953, "global_step": 147840, "epoch": 1221} {"train_loss": -39.689239501953125, "global_step": 147841, "epoch": 1221} {"train_loss": -38.347808837890625, "global_step": 147842, "epoch": 1221} {"train_loss": -34.1312370300293, "global_step": 147843, "epoch": 1221} {"train_loss": -34.82355499267578, "global_step": 147844, "epoch": 1221} {"train_loss": -37.75315475463867, "global_step": 147845, "epoch": 1221} {"train_loss": -38.82733917236328, "global_step": 147846, "epoch": 1221} {"train_loss": -38.53469467163086, "global_step": 147847, "epoch": 1221} {"train_loss": -34.63374710083008, "global_step": 147848, "epoch": 1221} {"train_loss": -36.45588302612305, "global_step": 147849, "epoch": 1221} {"train_loss": -32.619537353515625, "global_step": 147850, "epoch": 1221} {"train_loss": -32.37309646606445, "global_step": 147851, "epoch": 1221} {"train_loss": -35.48370361328125, "global_step": 147852, "epoch": 1221} {"train_loss": -36.89316177368164, "global_step": 147853, "epoch": 1221} {"train_loss": -32.82194900512695, "global_step": 147854, "epoch": 1221} {"train_loss": -38.29533004760742, "global_step": 147855, "epoch": 1221} {"train_loss": -28.45077896118164, "global_step": 147856, "epoch": 1221} {"train_loss": -33.784942626953125, "global_step": 147857, "epoch": 1221} {"train_loss": -37.961021423339844, "global_step": 147858, "epoch": 1221} {"train_loss": -32.093849182128906, "global_step": 147859, "epoch": 1221} {"train_loss": -34.0771369934082, "global_step": 147860, "epoch": 1221} {"train_loss": -38.2941990371578, "global_step": 147861, "epoch": 1221, "val_loss": 2626505.25} {"train_loss": -35.703407287597656, "global_step": 147862, "epoch": 1222} {"train_loss": -35.84239196777344, "global_step": 147863, "epoch": 1222} {"train_loss": -36.97429275512695, "global_step": 147864, "epoch": 1222} {"train_loss": -36.71247482299805, "global_step": 147865, "epoch": 1222} {"train_loss": -36.52437973022461, "global_step": 147866, "epoch": 1222} {"train_loss": -37.599945068359375, "global_step": 147867, "epoch": 1222} {"train_loss": -38.2889518737793, "global_step": 147868, "epoch": 1222} {"train_loss": -36.5026741027832, "global_step": 147869, "epoch": 1222} {"train_loss": -36.92009353637695, "global_step": 147870, "epoch": 1222} {"train_loss": -36.79520797729492, "global_step": 147871, "epoch": 1222} {"train_loss": -38.05350875854492, "global_step": 147872, "epoch": 1222} {"train_loss": -37.084285736083984, "global_step": 147873, "epoch": 1222} {"train_loss": -37.21287155151367, "global_step": 147874, "epoch": 1222} {"train_loss": -37.97544860839844, "global_step": 147875, "epoch": 1222} {"train_loss": -37.81954574584961, "global_step": 147876, "epoch": 1222} {"train_loss": -37.08644485473633, "global_step": 147877, "epoch": 1222} {"train_loss": -38.1916389465332, "global_step": 147878, "epoch": 1222} {"train_loss": -38.32087326049805, "global_step": 147879, "epoch": 1222} {"train_loss": -37.93040466308594, "global_step": 147880, "epoch": 1222} {"train_loss": -39.0541877746582, "global_step": 147881, "epoch": 1222} {"train_loss": -38.990474700927734, "global_step": 147882, "epoch": 1222} {"train_loss": -38.542083740234375, "global_step": 147883, "epoch": 1222} {"train_loss": -38.6484489440918, "global_step": 147884, "epoch": 1222} {"train_loss": -39.16383743286133, "global_step": 147885, "epoch": 1222} {"train_loss": -39.18013381958008, "global_step": 147886, "epoch": 1222} {"train_loss": -39.51287841796875, "global_step": 147887, "epoch": 1222} {"train_loss": -39.50814437866211, "global_step": 147888, "epoch": 1222} {"train_loss": -38.99651336669922, "global_step": 147889, "epoch": 1222} {"train_loss": -39.60825729370117, "global_step": 147890, "epoch": 1222} {"train_loss": -39.27231979370117, "global_step": 147891, "epoch": 1222} {"train_loss": -39.301727294921875, "global_step": 147892, "epoch": 1222} {"train_loss": -38.95804214477539, "global_step": 147893, "epoch": 1222} {"train_loss": -39.49134063720703, "global_step": 147894, "epoch": 1222} {"train_loss": -39.490230560302734, "global_step": 147895, "epoch": 1222} {"train_loss": -39.31910705566406, "global_step": 147896, "epoch": 1222} {"train_loss": -38.73659896850586, "global_step": 147897, "epoch": 1222} {"train_loss": -39.82063674926758, "global_step": 147898, "epoch": 1222} {"train_loss": -40.11301803588867, "global_step": 147899, "epoch": 1222} {"train_loss": -39.50590896606445, "global_step": 147900, "epoch": 1222} {"train_loss": -40.1470947265625, "global_step": 147901, "epoch": 1222} {"train_loss": -40.02620315551758, "global_step": 147902, "epoch": 1222} {"train_loss": -39.63680648803711, "global_step": 147903, "epoch": 1222} {"train_loss": -39.96160888671875, "global_step": 147904, "epoch": 1222} {"train_loss": -40.10615539550781, "global_step": 147905, "epoch": 1222} {"train_loss": -40.022396087646484, "global_step": 147906, "epoch": 1222} {"train_loss": -40.14072799682617, "global_step": 147907, "epoch": 1222} {"train_loss": -40.187408447265625, "global_step": 147908, "epoch": 1222} {"train_loss": -39.98177719116211, "global_step": 147909, "epoch": 1222} {"train_loss": -40.409420013427734, "global_step": 147910, "epoch": 1222} {"train_loss": -39.75077819824219, "global_step": 147911, "epoch": 1222} {"train_loss": -40.48881912231445, "global_step": 147912, "epoch": 1222} {"train_loss": -40.224971771240234, "global_step": 147913, "epoch": 1222} {"train_loss": -39.64237976074219, "global_step": 147914, "epoch": 1222} {"train_loss": -39.905174255371094, "global_step": 147915, "epoch": 1222} {"train_loss": -40.00717544555664, "global_step": 147916, "epoch": 1222} {"train_loss": -40.425872802734375, "global_step": 147917, "epoch": 1222} {"train_loss": -40.13113021850586, "global_step": 147918, "epoch": 1222} {"train_loss": -40.70990753173828, "global_step": 147919, "epoch": 1222} {"train_loss": -40.27891159057617, "global_step": 147920, "epoch": 1222} {"train_loss": -39.82763671875, "global_step": 147921, "epoch": 1222} {"train_loss": -39.68406677246094, "global_step": 147922, "epoch": 1222} {"train_loss": -40.25697708129883, "global_step": 147923, "epoch": 1222} {"train_loss": -40.671592712402344, "global_step": 147924, "epoch": 1222} {"train_loss": -40.067474365234375, "global_step": 147925, "epoch": 1222} {"train_loss": -39.6302375793457, "global_step": 147926, "epoch": 1222} {"train_loss": -39.004798889160156, "global_step": 147927, "epoch": 1222} {"train_loss": -40.028743743896484, "global_step": 147928, "epoch": 1222} {"train_loss": -40.322750091552734, "global_step": 147929, "epoch": 1222} {"train_loss": -39.86079406738281, "global_step": 147930, "epoch": 1222} {"train_loss": -39.87855911254883, "global_step": 147931, "epoch": 1222} {"train_loss": -38.54730224609375, "global_step": 147932, "epoch": 1222} {"train_loss": -39.455360412597656, "global_step": 147933, "epoch": 1222} {"train_loss": -39.35905075073242, "global_step": 147934, "epoch": 1222} {"train_loss": -40.052093505859375, "global_step": 147935, "epoch": 1222} {"train_loss": -39.88704299926758, "global_step": 147936, "epoch": 1222} {"train_loss": -37.84989547729492, "global_step": 147937, "epoch": 1222} {"train_loss": -35.52223205566406, "global_step": 147938, "epoch": 1222} {"train_loss": -36.942108154296875, "global_step": 147939, "epoch": 1222} {"train_loss": -38.820430755615234, "global_step": 147940, "epoch": 1222} {"train_loss": -40.15372848510742, "global_step": 147941, "epoch": 1222} {"train_loss": -40.73889923095703, "global_step": 147942, "epoch": 1222} {"train_loss": -40.83216094970703, "global_step": 147943, "epoch": 1222} {"train_loss": -40.602596282958984, "global_step": 147944, "epoch": 1222} {"train_loss": -40.64552307128906, "global_step": 147945, "epoch": 1222} {"train_loss": -39.55332946777344, "global_step": 147946, "epoch": 1222} {"train_loss": -40.34272384643555, "global_step": 147947, "epoch": 1222} {"train_loss": -41.149391174316406, "global_step": 147948, "epoch": 1222} {"train_loss": -40.29277420043945, "global_step": 147949, "epoch": 1222} {"train_loss": -40.121360778808594, "global_step": 147950, "epoch": 1222} {"train_loss": -40.255767822265625, "global_step": 147951, "epoch": 1222} {"train_loss": -40.656158447265625, "global_step": 147952, "epoch": 1222} {"train_loss": -40.45641326904297, "global_step": 147953, "epoch": 1222} {"train_loss": -39.60902786254883, "global_step": 147954, "epoch": 1222} {"train_loss": -40.41025924682617, "global_step": 147955, "epoch": 1222} {"train_loss": -40.558624267578125, "global_step": 147956, "epoch": 1222} {"train_loss": -40.480770111083984, "global_step": 147957, "epoch": 1222} {"train_loss": -40.56034469604492, "global_step": 147958, "epoch": 1222} {"train_loss": -41.055885314941406, "global_step": 147959, "epoch": 1222} {"train_loss": -41.11532211303711, "global_step": 147960, "epoch": 1222} {"train_loss": -40.33688735961914, "global_step": 147961, "epoch": 1222} {"train_loss": -40.65790939331055, "global_step": 147962, "epoch": 1222} {"train_loss": -40.98960494995117, "global_step": 147963, "epoch": 1222} {"train_loss": -41.031192779541016, "global_step": 147964, "epoch": 1222} {"train_loss": -40.2028694152832, "global_step": 147965, "epoch": 1222} {"train_loss": -40.134761810302734, "global_step": 147966, "epoch": 1222} {"train_loss": -40.29640197753906, "global_step": 147967, "epoch": 1222} {"train_loss": -40.95270538330078, "global_step": 147968, "epoch": 1222} {"train_loss": -40.84187698364258, "global_step": 147969, "epoch": 1222} {"train_loss": -40.944828033447266, "global_step": 147970, "epoch": 1222} {"train_loss": -40.86491012573242, "global_step": 147971, "epoch": 1222} {"train_loss": -40.9476432800293, "global_step": 147972, "epoch": 1222} {"train_loss": -41.05924606323242, "global_step": 147973, "epoch": 1222} {"train_loss": -40.71076202392578, "global_step": 147974, "epoch": 1222} {"train_loss": -40.708099365234375, "global_step": 147975, "epoch": 1222} {"train_loss": -39.98868942260742, "global_step": 147976, "epoch": 1222} {"train_loss": -40.151363372802734, "global_step": 147977, "epoch": 1222} {"train_loss": -38.31858444213867, "global_step": 147978, "epoch": 1222} {"train_loss": -36.9537239074707, "global_step": 147979, "epoch": 1222} {"train_loss": -38.518798828125, "global_step": 147980, "epoch": 1222} {"train_loss": -40.40825271606445, "global_step": 147981, "epoch": 1222} {"train_loss": -39.4621647290947, "global_step": 147982, "epoch": 1222, "val_loss": 2716737.75} {"train_loss": -38.577980041503906, "global_step": 147983, "epoch": 1223} {"train_loss": -37.592613220214844, "global_step": 147984, "epoch": 1223} {"train_loss": -35.96437454223633, "global_step": 147985, "epoch": 1223} {"train_loss": -37.151397705078125, "global_step": 147986, "epoch": 1223} {"train_loss": -40.23686599731445, "global_step": 147987, "epoch": 1223} {"train_loss": -38.27254867553711, "global_step": 147988, "epoch": 1223} {"train_loss": -38.710296630859375, "global_step": 147989, "epoch": 1223} {"train_loss": -40.04279708862305, "global_step": 147990, "epoch": 1223} {"train_loss": -37.92625045776367, "global_step": 147991, "epoch": 1223} {"train_loss": -38.634883880615234, "global_step": 147992, "epoch": 1223} {"train_loss": -36.887901306152344, "global_step": 147993, "epoch": 1223} {"train_loss": -35.335994720458984, "global_step": 147994, "epoch": 1223} {"train_loss": -37.80999755859375, "global_step": 147995, "epoch": 1223} {"train_loss": -39.55784225463867, "global_step": 147996, "epoch": 1223} {"train_loss": -39.46052169799805, "global_step": 147997, "epoch": 1223} {"train_loss": -38.554420471191406, "global_step": 147998, "epoch": 1223} {"train_loss": -40.0863037109375, "global_step": 147999, "epoch": 1223} {"train_loss": -39.08565139770508, "global_step": 148000, "epoch": 1223} {"train_loss": -38.90155792236328, "global_step": 148001, "epoch": 1223} {"train_loss": -40.03562545776367, "global_step": 148002, "epoch": 1223} {"train_loss": -38.75541305541992, "global_step": 148003, "epoch": 1223} {"train_loss": -39.2379264831543, "global_step": 148004, "epoch": 1223} {"train_loss": -39.385677337646484, "global_step": 148005, "epoch": 1223} {"train_loss": -38.84931182861328, "global_step": 148006, "epoch": 1223} {"train_loss": -40.08614730834961, "global_step": 148007, "epoch": 1223} {"train_loss": -39.200172424316406, "global_step": 148008, "epoch": 1223} {"train_loss": -39.870689392089844, "global_step": 148009, "epoch": 1223} {"train_loss": -38.64681625366211, "global_step": 148010, "epoch": 1223} {"train_loss": -39.33839797973633, "global_step": 148011, "epoch": 1223} {"train_loss": -39.566829681396484, "global_step": 148012, "epoch": 1223} {"train_loss": -40.3194694519043, "global_step": 148013, "epoch": 1223} {"train_loss": -38.7705078125, "global_step": 148014, "epoch": 1223} {"train_loss": -40.054500579833984, "global_step": 148015, "epoch": 1223} {"train_loss": -39.33597946166992, "global_step": 148016, "epoch": 1223} {"train_loss": -39.338600158691406, "global_step": 148017, "epoch": 1223} {"train_loss": -40.028900146484375, "global_step": 148018, "epoch": 1223} {"train_loss": -39.34794235229492, "global_step": 148019, "epoch": 1223} {"train_loss": -39.65390396118164, "global_step": 148020, "epoch": 1223} {"train_loss": -39.661224365234375, "global_step": 148021, "epoch": 1223} {"train_loss": -39.56290817260742, "global_step": 148022, "epoch": 1223} {"train_loss": -40.20233917236328, "global_step": 148023, "epoch": 1223} {"train_loss": -39.05315017700195, "global_step": 148024, "epoch": 1223} {"train_loss": -40.611427307128906, "global_step": 148025, "epoch": 1223} {"train_loss": -39.799678802490234, "global_step": 148026, "epoch": 1223} {"train_loss": -40.0626106262207, "global_step": 148027, "epoch": 1223} {"train_loss": -40.574867248535156, "global_step": 148028, "epoch": 1223} {"train_loss": -39.977783203125, "global_step": 148029, "epoch": 1223} {"train_loss": -40.3170166015625, "global_step": 148030, "epoch": 1223} {"train_loss": -34.837501525878906, "global_step": 148031, "epoch": 1223} {"train_loss": -39.916473388671875, "global_step": 148032, "epoch": 1223} {"train_loss": -40.44697189331055, "global_step": 148033, "epoch": 1223} {"train_loss": -40.0415153503418, "global_step": 148034, "epoch": 1223} {"train_loss": -40.175148010253906, "global_step": 148035, "epoch": 1223} {"train_loss": -40.38764572143555, "global_step": 148036, "epoch": 1223} {"train_loss": -40.53533172607422, "global_step": 148037, "epoch": 1223} {"train_loss": -40.45624923706055, "global_step": 148038, "epoch": 1223} {"train_loss": -40.52178192138672, "global_step": 148039, "epoch": 1223} {"train_loss": -41.0533447265625, "global_step": 148040, "epoch": 1223} {"train_loss": -39.1719970703125, "global_step": 148041, "epoch": 1223} {"train_loss": -40.28950500488281, "global_step": 148042, "epoch": 1223} {"train_loss": -39.67268753051758, "global_step": 148043, "epoch": 1223} {"train_loss": -40.41582107543945, "global_step": 148044, "epoch": 1223} {"train_loss": -41.246028900146484, "global_step": 148045, "epoch": 1223} {"train_loss": -40.620662689208984, "global_step": 148046, "epoch": 1223} {"train_loss": -40.55265808105469, "global_step": 148047, "epoch": 1223} {"train_loss": -40.52981185913086, "global_step": 148048, "epoch": 1223} {"train_loss": -37.533111572265625, "global_step": 148049, "epoch": 1223} {"train_loss": -40.18486022949219, "global_step": 148050, "epoch": 1223} {"train_loss": -40.76966094970703, "global_step": 148051, "epoch": 1223} {"train_loss": -40.39957046508789, "global_step": 148052, "epoch": 1223} {"train_loss": -40.783241271972656, "global_step": 148053, "epoch": 1223} {"train_loss": -40.27553176879883, "global_step": 148054, "epoch": 1223} {"train_loss": -38.36454772949219, "global_step": 148055, "epoch": 1223} {"train_loss": -38.8751220703125, "global_step": 148056, "epoch": 1223} {"train_loss": -39.58089065551758, "global_step": 148057, "epoch": 1223} {"train_loss": -39.42240524291992, "global_step": 148058, "epoch": 1223} {"train_loss": -40.58283996582031, "global_step": 148059, "epoch": 1223} {"train_loss": -40.58726119995117, "global_step": 148060, "epoch": 1223} {"train_loss": -40.905982971191406, "global_step": 148061, "epoch": 1223} {"train_loss": -39.44070816040039, "global_step": 148062, "epoch": 1223} {"train_loss": -40.68473434448242, "global_step": 148063, "epoch": 1223} {"train_loss": -41.41743850708008, "global_step": 148064, "epoch": 1223} {"train_loss": -40.68125915527344, "global_step": 148065, "epoch": 1223} {"train_loss": -40.4024543762207, "global_step": 148066, "epoch": 1223} {"train_loss": -40.84082794189453, "global_step": 148067, "epoch": 1223} {"train_loss": -40.889217376708984, "global_step": 148068, "epoch": 1223} {"train_loss": -40.46949005126953, "global_step": 148069, "epoch": 1223} {"train_loss": -40.69630432128906, "global_step": 148070, "epoch": 1223} {"train_loss": -40.90437698364258, "global_step": 148071, "epoch": 1223} {"train_loss": -38.289669036865234, "global_step": 148072, "epoch": 1223} {"train_loss": -40.647804260253906, "global_step": 148073, "epoch": 1223} {"train_loss": -38.48153305053711, "global_step": 148074, "epoch": 1223} {"train_loss": -40.612117767333984, "global_step": 148075, "epoch": 1223} {"train_loss": -40.11945343017578, "global_step": 148076, "epoch": 1223} {"train_loss": -40.302005767822266, "global_step": 148077, "epoch": 1223} {"train_loss": -40.332454681396484, "global_step": 148078, "epoch": 1223} {"train_loss": -36.68770217895508, "global_step": 148079, "epoch": 1223} {"train_loss": -40.37995529174805, "global_step": 148080, "epoch": 1223} {"train_loss": -39.39997482299805, "global_step": 148081, "epoch": 1223} {"train_loss": -39.84677505493164, "global_step": 148082, "epoch": 1223} {"train_loss": -39.81551742553711, "global_step": 148083, "epoch": 1223} {"train_loss": -38.99788284301758, "global_step": 148084, "epoch": 1223} {"train_loss": -36.32355880737305, "global_step": 148085, "epoch": 1223} {"train_loss": -38.26324462890625, "global_step": 148086, "epoch": 1223} {"train_loss": -38.4291877746582, "global_step": 148087, "epoch": 1223} {"train_loss": -40.0191764831543, "global_step": 148088, "epoch": 1223} {"train_loss": -38.54859161376953, "global_step": 148089, "epoch": 1223} {"train_loss": -37.64850997924805, "global_step": 148090, "epoch": 1223} {"train_loss": -36.79667282104492, "global_step": 148091, "epoch": 1223} {"train_loss": -27.14755630493164, "global_step": 148092, "epoch": 1223} {"train_loss": -40.24014663696289, "global_step": 148093, "epoch": 1223} {"train_loss": -38.93613815307617, "global_step": 148094, "epoch": 1223} {"train_loss": -39.54529571533203, "global_step": 148095, "epoch": 1223} {"train_loss": -39.186458587646484, "global_step": 148096, "epoch": 1223} {"train_loss": -39.11436080932617, "global_step": 148097, "epoch": 1223} {"train_loss": -38.913963317871094, "global_step": 148098, "epoch": 1223} {"train_loss": -38.13715744018555, "global_step": 148099, "epoch": 1223} {"train_loss": -38.14674758911133, "global_step": 148100, "epoch": 1223} {"train_loss": -38.64720916748047, "global_step": 148101, "epoch": 1223} {"train_loss": -38.80440139770508, "global_step": 148102, "epoch": 1223} {"train_loss": -39.30195305564187, "global_step": 148103, "epoch": 1223, "val_loss": 2479993.5} {"train_loss": -37.512176513671875, "global_step": 148104, "epoch": 1224} {"train_loss": -37.90302276611328, "global_step": 148105, "epoch": 1224} {"train_loss": -35.443843841552734, "global_step": 148106, "epoch": 1224} {"train_loss": -35.48862838745117, "global_step": 148107, "epoch": 1224} {"train_loss": -31.786584854125977, "global_step": 148108, "epoch": 1224} {"train_loss": -34.898616790771484, "global_step": 148109, "epoch": 1224} {"train_loss": -24.801828384399414, "global_step": 148110, "epoch": 1224} {"train_loss": -30.875661849975586, "global_step": 148111, "epoch": 1224} {"train_loss": -28.80389404296875, "global_step": 148112, "epoch": 1224} {"train_loss": -32.210113525390625, "global_step": 148113, "epoch": 1224} {"train_loss": -29.947301864624023, "global_step": 148114, "epoch": 1224} {"train_loss": -36.82191467285156, "global_step": 148115, "epoch": 1224} {"train_loss": -35.5423583984375, "global_step": 148116, "epoch": 1224} {"train_loss": -36.66781997680664, "global_step": 148117, "epoch": 1224} {"train_loss": -30.522846221923828, "global_step": 148118, "epoch": 1224} {"train_loss": -32.41145706176758, "global_step": 148119, "epoch": 1224} {"train_loss": -34.22642135620117, "global_step": 148120, "epoch": 1224} {"train_loss": -34.34499740600586, "global_step": 148121, "epoch": 1224} {"train_loss": -35.3952522277832, "global_step": 148122, "epoch": 1224} {"train_loss": -33.351505279541016, "global_step": 148123, "epoch": 1224} {"train_loss": -32.994720458984375, "global_step": 148124, "epoch": 1224} {"train_loss": -33.27077865600586, "global_step": 148125, "epoch": 1224} {"train_loss": -31.630701065063477, "global_step": 148126, "epoch": 1224} {"train_loss": -35.65251922607422, "global_step": 148127, "epoch": 1224} {"train_loss": -33.54270553588867, "global_step": 148128, "epoch": 1224} {"train_loss": -34.64324951171875, "global_step": 148129, "epoch": 1224} {"train_loss": -35.6013298034668, "global_step": 148130, "epoch": 1224} {"train_loss": -31.146656036376953, "global_step": 148131, "epoch": 1224} {"train_loss": -37.74898147583008, "global_step": 148132, "epoch": 1224} {"train_loss": -37.08420944213867, "global_step": 148133, "epoch": 1224} {"train_loss": -36.26987838745117, "global_step": 148134, "epoch": 1224} {"train_loss": -35.7752799987793, "global_step": 148135, "epoch": 1224} {"train_loss": -34.62064743041992, "global_step": 148136, "epoch": 1224} {"train_loss": -36.75675582885742, "global_step": 148137, "epoch": 1224} {"train_loss": -34.52729034423828, "global_step": 148138, "epoch": 1224} {"train_loss": -36.287261962890625, "global_step": 148139, "epoch": 1224} {"train_loss": -37.6908073425293, "global_step": 148140, "epoch": 1224} {"train_loss": -37.190223693847656, "global_step": 148141, "epoch": 1224} {"train_loss": -35.726722717285156, "global_step": 148142, "epoch": 1224} {"train_loss": -37.60361862182617, "global_step": 148143, "epoch": 1224} {"train_loss": -37.31610870361328, "global_step": 148144, "epoch": 1224} {"train_loss": -38.04417037963867, "global_step": 148145, "epoch": 1224} {"train_loss": -38.31582260131836, "global_step": 148146, "epoch": 1224} {"train_loss": -38.1251106262207, "global_step": 148147, "epoch": 1224} {"train_loss": -37.605899810791016, "global_step": 148148, "epoch": 1224} {"train_loss": -37.47430419921875, "global_step": 148149, "epoch": 1224} {"train_loss": -37.54735565185547, "global_step": 148150, "epoch": 1224} {"train_loss": -38.46112823486328, "global_step": 148151, "epoch": 1224} {"train_loss": -38.177268981933594, "global_step": 148152, "epoch": 1224} {"train_loss": -37.4372673034668, "global_step": 148153, "epoch": 1224} {"train_loss": -38.08018112182617, "global_step": 148154, "epoch": 1224} {"train_loss": -38.32740783691406, "global_step": 148155, "epoch": 1224} {"train_loss": -37.869991302490234, "global_step": 148156, "epoch": 1224} {"train_loss": -38.26705551147461, "global_step": 148157, "epoch": 1224} {"train_loss": -38.49021530151367, "global_step": 148158, "epoch": 1224} {"train_loss": -38.17133712768555, "global_step": 148159, "epoch": 1224} {"train_loss": -38.32538604736328, "global_step": 148160, "epoch": 1224} {"train_loss": -38.370826721191406, "global_step": 148161, "epoch": 1224} {"train_loss": -38.34941482543945, "global_step": 148162, "epoch": 1224} {"train_loss": -38.429805755615234, "global_step": 148163, "epoch": 1224} {"train_loss": -38.23704147338867, "global_step": 148164, "epoch": 1224} {"train_loss": -38.86727523803711, "global_step": 148165, "epoch": 1224} {"train_loss": -39.073486328125, "global_step": 148166, "epoch": 1224} {"train_loss": -39.0282096862793, "global_step": 148167, "epoch": 1224} {"train_loss": -38.90485382080078, "global_step": 148168, "epoch": 1224} {"train_loss": -39.0141716003418, "global_step": 148169, "epoch": 1224} {"train_loss": -38.48586654663086, "global_step": 148170, "epoch": 1224} {"train_loss": -36.869136810302734, "global_step": 148171, "epoch": 1224} {"train_loss": -38.91880416870117, "global_step": 148172, "epoch": 1224} {"train_loss": -39.081520080566406, "global_step": 148173, "epoch": 1224} {"train_loss": -38.921878814697266, "global_step": 148174, "epoch": 1224} {"train_loss": -38.90694808959961, "global_step": 148175, "epoch": 1224} {"train_loss": -38.89119338989258, "global_step": 148176, "epoch": 1224} {"train_loss": -38.76904296875, "global_step": 148177, "epoch": 1224} {"train_loss": -38.61945724487305, "global_step": 148178, "epoch": 1224} {"train_loss": -39.254329681396484, "global_step": 148179, "epoch": 1224} {"train_loss": -39.742671966552734, "global_step": 148180, "epoch": 1224} {"train_loss": -39.56614303588867, "global_step": 148181, "epoch": 1224} {"train_loss": -39.38658905029297, "global_step": 148182, "epoch": 1224} {"train_loss": -39.122493743896484, "global_step": 148183, "epoch": 1224} {"train_loss": -39.71809005737305, "global_step": 148184, "epoch": 1224} {"train_loss": -39.76572036743164, "global_step": 148185, "epoch": 1224} {"train_loss": -39.624267578125, "global_step": 148186, "epoch": 1224} {"train_loss": -39.57892608642578, "global_step": 148187, "epoch": 1224} {"train_loss": -39.18355941772461, "global_step": 148188, "epoch": 1224} {"train_loss": -38.08185958862305, "global_step": 148189, "epoch": 1224} {"train_loss": -39.82501220703125, "global_step": 148190, "epoch": 1224} {"train_loss": -39.13220977783203, "global_step": 148191, "epoch": 1224} {"train_loss": -39.4522819519043, "global_step": 148192, "epoch": 1224} {"train_loss": -39.75141525268555, "global_step": 148193, "epoch": 1224} {"train_loss": -39.37495422363281, "global_step": 148194, "epoch": 1224} {"train_loss": -39.63880157470703, "global_step": 148195, "epoch": 1224} {"train_loss": -39.6208610534668, "global_step": 148196, "epoch": 1224} {"train_loss": -39.757537841796875, "global_step": 148197, "epoch": 1224} {"train_loss": -39.492671966552734, "global_step": 148198, "epoch": 1224} {"train_loss": -39.663368225097656, "global_step": 148199, "epoch": 1224} {"train_loss": -40.135009765625, "global_step": 148200, "epoch": 1224} {"train_loss": -39.791500091552734, "global_step": 148201, "epoch": 1224} {"train_loss": -39.7142219543457, "global_step": 148202, "epoch": 1224} {"train_loss": -40.09024429321289, "global_step": 148203, "epoch": 1224} {"train_loss": -39.91699981689453, "global_step": 148204, "epoch": 1224} {"train_loss": -38.89352035522461, "global_step": 148205, "epoch": 1224} {"train_loss": -40.024696350097656, "global_step": 148206, "epoch": 1224} {"train_loss": -40.03358840942383, "global_step": 148207, "epoch": 1224} {"train_loss": -39.71825408935547, "global_step": 148208, "epoch": 1224} {"train_loss": -40.20692825317383, "global_step": 148209, "epoch": 1224} {"train_loss": -39.93499755859375, "global_step": 148210, "epoch": 1224} {"train_loss": -40.06013107299805, "global_step": 148211, "epoch": 1224} {"train_loss": -38.881465911865234, "global_step": 148212, "epoch": 1224} {"train_loss": -40.19915008544922, "global_step": 148213, "epoch": 1224} {"train_loss": -39.8541259765625, "global_step": 148214, "epoch": 1224} {"train_loss": -40.03995895385742, "global_step": 148215, "epoch": 1224} {"train_loss": -39.988033294677734, "global_step": 148216, "epoch": 1224} {"train_loss": -39.725502014160156, "global_step": 148217, "epoch": 1224} {"train_loss": -40.30823516845703, "global_step": 148218, "epoch": 1224} {"train_loss": -40.427947998046875, "global_step": 148219, "epoch": 1224} {"train_loss": -40.488338470458984, "global_step": 148220, "epoch": 1224} {"train_loss": -40.05854797363281, "global_step": 148221, "epoch": 1224} {"train_loss": -40.181156158447266, "global_step": 148222, "epoch": 1224} {"train_loss": -39.82137680053711, "global_step": 148223, "epoch": 1224} {"train_loss": -37.55355615852293, "global_step": 148224, "epoch": 1224, "val_loss": 2591724.0} {"train_loss": -40.43253707885742, "global_step": 148225, "epoch": 1225} {"train_loss": -40.1128044128418, "global_step": 148226, "epoch": 1225} {"train_loss": -40.78321075439453, "global_step": 148227, "epoch": 1225} {"train_loss": -40.0899772644043, "global_step": 148228, "epoch": 1225} {"train_loss": -40.315711975097656, "global_step": 148229, "epoch": 1225} {"train_loss": -40.230525970458984, "global_step": 148230, "epoch": 1225} {"train_loss": -40.61086654663086, "global_step": 148231, "epoch": 1225} {"train_loss": -40.76862716674805, "global_step": 148232, "epoch": 1225} {"train_loss": -40.042484283447266, "global_step": 148233, "epoch": 1225} {"train_loss": -40.573787689208984, "global_step": 148234, "epoch": 1225} {"train_loss": -41.0350341796875, "global_step": 148235, "epoch": 1225} {"train_loss": -40.38532257080078, "global_step": 148236, "epoch": 1225} {"train_loss": -40.2064323425293, "global_step": 148237, "epoch": 1225} {"train_loss": -39.81952667236328, "global_step": 148238, "epoch": 1225} {"train_loss": -40.845069885253906, "global_step": 148239, "epoch": 1225} {"train_loss": -39.94757843017578, "global_step": 148240, "epoch": 1225} {"train_loss": -40.388729095458984, "global_step": 148241, "epoch": 1225} {"train_loss": -40.32609939575195, "global_step": 148242, "epoch": 1225} {"train_loss": -39.48505783081055, "global_step": 148243, "epoch": 1225} {"train_loss": -39.009986877441406, "global_step": 148244, "epoch": 1225} {"train_loss": -39.11480712890625, "global_step": 148245, "epoch": 1225} {"train_loss": -40.20820617675781, "global_step": 148246, "epoch": 1225} {"train_loss": -38.24843978881836, "global_step": 148247, "epoch": 1225} {"train_loss": -37.660430908203125, "global_step": 148248, "epoch": 1225} {"train_loss": -34.50779342651367, "global_step": 148249, "epoch": 1225} {"train_loss": -32.909088134765625, "global_step": 148250, "epoch": 1225} {"train_loss": -34.41329574584961, "global_step": 148251, "epoch": 1225} {"train_loss": -38.82062911987305, "global_step": 148252, "epoch": 1225} {"train_loss": -38.28999710083008, "global_step": 148253, "epoch": 1225} {"train_loss": -36.26747131347656, "global_step": 148254, "epoch": 1225} {"train_loss": -36.31740188598633, "global_step": 148255, "epoch": 1225} {"train_loss": -39.784725189208984, "global_step": 148256, "epoch": 1225} {"train_loss": -38.00946044921875, "global_step": 148257, "epoch": 1225} {"train_loss": -37.387943267822266, "global_step": 148258, "epoch": 1225} {"train_loss": -40.21102523803711, "global_step": 148259, "epoch": 1225} {"train_loss": -37.801395416259766, "global_step": 148260, "epoch": 1225} {"train_loss": -40.07703399658203, "global_step": 148261, "epoch": 1225} {"train_loss": -38.67119598388672, "global_step": 148262, "epoch": 1225} {"train_loss": -38.318599700927734, "global_step": 148263, "epoch": 1225} {"train_loss": -40.09468078613281, "global_step": 148264, "epoch": 1225} {"train_loss": -37.54878616333008, "global_step": 148265, "epoch": 1225} {"train_loss": -39.515377044677734, "global_step": 148266, "epoch": 1225} {"train_loss": -38.34744644165039, "global_step": 148267, "epoch": 1225} {"train_loss": -40.20344924926758, "global_step": 148268, "epoch": 1225} {"train_loss": -38.38779830932617, "global_step": 148269, "epoch": 1225} {"train_loss": -39.67876434326172, "global_step": 148270, "epoch": 1225} {"train_loss": -39.05835723876953, "global_step": 148271, "epoch": 1225} {"train_loss": -39.82865524291992, "global_step": 148272, "epoch": 1225} {"train_loss": -39.08686065673828, "global_step": 148273, "epoch": 1225} {"train_loss": -39.3283576965332, "global_step": 148274, "epoch": 1225} {"train_loss": -39.279998779296875, "global_step": 148275, "epoch": 1225} {"train_loss": -40.48041534423828, "global_step": 148276, "epoch": 1225} {"train_loss": -39.973873138427734, "global_step": 148277, "epoch": 1225} {"train_loss": -39.89509582519531, "global_step": 148278, "epoch": 1225} {"train_loss": -39.30002212524414, "global_step": 148279, "epoch": 1225} {"train_loss": -39.523529052734375, "global_step": 148280, "epoch": 1225} {"train_loss": -38.558746337890625, "global_step": 148281, "epoch": 1225} {"train_loss": -36.69819259643555, "global_step": 148282, "epoch": 1225} {"train_loss": -38.75577926635742, "global_step": 148283, "epoch": 1225} {"train_loss": -38.451114654541016, "global_step": 148284, "epoch": 1225} {"train_loss": -39.288570404052734, "global_step": 148285, "epoch": 1225} {"train_loss": -39.73714828491211, "global_step": 148286, "epoch": 1225} {"train_loss": -39.38884735107422, "global_step": 148287, "epoch": 1225} {"train_loss": -40.222694396972656, "global_step": 148288, "epoch": 1225} {"train_loss": -38.0233268737793, "global_step": 148289, "epoch": 1225} {"train_loss": -39.98524475097656, "global_step": 148290, "epoch": 1225} {"train_loss": -39.354854583740234, "global_step": 148291, "epoch": 1225} {"train_loss": -39.57978439331055, "global_step": 148292, "epoch": 1225} {"train_loss": -39.6124153137207, "global_step": 148293, "epoch": 1225} {"train_loss": -39.63656234741211, "global_step": 148294, "epoch": 1225} {"train_loss": -39.4524040222168, "global_step": 148295, "epoch": 1225} {"train_loss": -39.17758560180664, "global_step": 148296, "epoch": 1225} {"train_loss": -40.63116455078125, "global_step": 148297, "epoch": 1225} {"train_loss": -40.10981369018555, "global_step": 148298, "epoch": 1225} {"train_loss": -40.22617721557617, "global_step": 148299, "epoch": 1225} {"train_loss": -40.29903030395508, "global_step": 148300, "epoch": 1225} {"train_loss": -40.0478401184082, "global_step": 148301, "epoch": 1225} {"train_loss": -40.30316925048828, "global_step": 148302, "epoch": 1225} {"train_loss": -40.01011276245117, "global_step": 148303, "epoch": 1225} {"train_loss": -40.21528244018555, "global_step": 148304, "epoch": 1225} {"train_loss": -40.34021759033203, "global_step": 148305, "epoch": 1225} {"train_loss": -39.91019821166992, "global_step": 148306, "epoch": 1225} {"train_loss": -40.460182189941406, "global_step": 148307, "epoch": 1225} {"train_loss": -40.023372650146484, "global_step": 148308, "epoch": 1225} {"train_loss": -40.406124114990234, "global_step": 148309, "epoch": 1225} {"train_loss": -40.028076171875, "global_step": 148310, "epoch": 1225} {"train_loss": -40.196102142333984, "global_step": 148311, "epoch": 1225} {"train_loss": -39.25547409057617, "global_step": 148312, "epoch": 1225} {"train_loss": -40.53290939331055, "global_step": 148313, "epoch": 1225} {"train_loss": -40.41677474975586, "global_step": 148314, "epoch": 1225} {"train_loss": -40.035884857177734, "global_step": 148315, "epoch": 1225} {"train_loss": -39.75871658325195, "global_step": 148316, "epoch": 1225} {"train_loss": -40.5268669128418, "global_step": 148317, "epoch": 1225} {"train_loss": -40.812068939208984, "global_step": 148318, "epoch": 1225} {"train_loss": -40.727935791015625, "global_step": 148319, "epoch": 1225} {"train_loss": -38.99715042114258, "global_step": 148320, "epoch": 1225} {"train_loss": -40.545692443847656, "global_step": 148321, "epoch": 1225} {"train_loss": -40.7235221862793, "global_step": 148322, "epoch": 1225} {"train_loss": -40.25722885131836, "global_step": 148323, "epoch": 1225} {"train_loss": -40.21818161010742, "global_step": 148324, "epoch": 1225} {"train_loss": -39.9449348449707, "global_step": 148325, "epoch": 1225} {"train_loss": -40.92576217651367, "global_step": 148326, "epoch": 1225} {"train_loss": -40.894996643066406, "global_step": 148327, "epoch": 1225} {"train_loss": -40.713050842285156, "global_step": 148328, "epoch": 1225} {"train_loss": -39.582454681396484, "global_step": 148329, "epoch": 1225} {"train_loss": -40.97454071044922, "global_step": 148330, "epoch": 1225} {"train_loss": -40.66957473754883, "global_step": 148331, "epoch": 1225} {"train_loss": -41.151851654052734, "global_step": 148332, "epoch": 1225} {"train_loss": -39.90822219848633, "global_step": 148333, "epoch": 1225} {"train_loss": -40.854549407958984, "global_step": 148334, "epoch": 1225} {"train_loss": -40.463130950927734, "global_step": 148335, "epoch": 1225} {"train_loss": -40.4198112487793, "global_step": 148336, "epoch": 1225} {"train_loss": -40.09748458862305, "global_step": 148337, "epoch": 1225} {"train_loss": -41.044837951660156, "global_step": 148338, "epoch": 1225} {"train_loss": -40.018157958984375, "global_step": 148339, "epoch": 1225} {"train_loss": -41.10100173950195, "global_step": 148340, "epoch": 1225} {"train_loss": -40.27959060668945, "global_step": 148341, "epoch": 1225} {"train_loss": -41.3670768737793, "global_step": 148342, "epoch": 1225} {"train_loss": -40.30679702758789, "global_step": 148343, "epoch": 1225} {"train_loss": -39.96184158325195, "global_step": 148344, "epoch": 1225} {"train_loss": -39.62501819074647, "global_step": 148345, "epoch": 1225, "val_loss": 2380634.75} {"train_loss": -39.173484802246094, "global_step": 148346, "epoch": 1226} {"train_loss": -39.876766204833984, "global_step": 148347, "epoch": 1226} {"train_loss": -39.06620788574219, "global_step": 148348, "epoch": 1226} {"train_loss": -36.742034912109375, "global_step": 148349, "epoch": 1226} {"train_loss": -38.86812210083008, "global_step": 148350, "epoch": 1226} {"train_loss": -40.71038818359375, "global_step": 148351, "epoch": 1226} {"train_loss": -41.19953536987305, "global_step": 148352, "epoch": 1226} {"train_loss": -38.88849639892578, "global_step": 148353, "epoch": 1226} {"train_loss": -38.165523529052734, "global_step": 148354, "epoch": 1226} {"train_loss": -39.00062942504883, "global_step": 148355, "epoch": 1226} {"train_loss": -40.78916549682617, "global_step": 148356, "epoch": 1226} {"train_loss": -39.266170501708984, "global_step": 148357, "epoch": 1226} {"train_loss": -38.843666076660156, "global_step": 148358, "epoch": 1226} {"train_loss": -39.898311614990234, "global_step": 148359, "epoch": 1226} {"train_loss": -40.73552322387695, "global_step": 148360, "epoch": 1226} {"train_loss": -37.173309326171875, "global_step": 148361, "epoch": 1226} {"train_loss": -38.19157409667969, "global_step": 148362, "epoch": 1226} {"train_loss": -38.8400993347168, "global_step": 148363, "epoch": 1226} {"train_loss": -39.395668029785156, "global_step": 148364, "epoch": 1226} {"train_loss": -38.98814010620117, "global_step": 148365, "epoch": 1226} {"train_loss": -39.82802200317383, "global_step": 148366, "epoch": 1226} {"train_loss": -40.28205490112305, "global_step": 148367, "epoch": 1226} {"train_loss": -37.98576354980469, "global_step": 148368, "epoch": 1226} {"train_loss": -38.64284896850586, "global_step": 148369, "epoch": 1226} {"train_loss": -38.64823532104492, "global_step": 148370, "epoch": 1226} {"train_loss": -39.87783432006836, "global_step": 148371, "epoch": 1226} {"train_loss": -39.396968841552734, "global_step": 148372, "epoch": 1226} {"train_loss": -40.58221435546875, "global_step": 148373, "epoch": 1226} {"train_loss": -40.45686721801758, "global_step": 148374, "epoch": 1226} {"train_loss": -39.18330764770508, "global_step": 148375, "epoch": 1226} {"train_loss": -41.19010543823242, "global_step": 148376, "epoch": 1226} {"train_loss": -40.481502532958984, "global_step": 148377, "epoch": 1226} {"train_loss": -40.14017868041992, "global_step": 148378, "epoch": 1226} {"train_loss": -40.79012680053711, "global_step": 148379, "epoch": 1226} {"train_loss": -40.20174789428711, "global_step": 148380, "epoch": 1226} {"train_loss": -40.2883415222168, "global_step": 148381, "epoch": 1226} {"train_loss": -39.87659454345703, "global_step": 148382, "epoch": 1226} {"train_loss": -40.14593505859375, "global_step": 148383, "epoch": 1226} {"train_loss": -40.85004806518555, "global_step": 148384, "epoch": 1226} {"train_loss": -39.56071090698242, "global_step": 148385, "epoch": 1226} {"train_loss": -39.599632263183594, "global_step": 148386, "epoch": 1226} {"train_loss": -40.361572265625, "global_step": 148387, "epoch": 1226} {"train_loss": -40.24241256713867, "global_step": 148388, "epoch": 1226} {"train_loss": -38.067466735839844, "global_step": 148389, "epoch": 1226} {"train_loss": -39.65704345703125, "global_step": 148390, "epoch": 1226} {"train_loss": -41.33810806274414, "global_step": 148391, "epoch": 1226} {"train_loss": -39.82960510253906, "global_step": 148392, "epoch": 1226} {"train_loss": -40.2789306640625, "global_step": 148393, "epoch": 1226} {"train_loss": -41.18341827392578, "global_step": 148394, "epoch": 1226} {"train_loss": -40.8464241027832, "global_step": 148395, "epoch": 1226} {"train_loss": -40.21233367919922, "global_step": 148396, "epoch": 1226} {"train_loss": -40.78902816772461, "global_step": 148397, "epoch": 1226} {"train_loss": -40.65694046020508, "global_step": 148398, "epoch": 1226} {"train_loss": -39.572364807128906, "global_step": 148399, "epoch": 1226} {"train_loss": -39.99164962768555, "global_step": 148400, "epoch": 1226} {"train_loss": -39.99644088745117, "global_step": 148401, "epoch": 1226} {"train_loss": -40.694435119628906, "global_step": 148402, "epoch": 1226} {"train_loss": -39.247554779052734, "global_step": 148403, "epoch": 1226} {"train_loss": -39.05225372314453, "global_step": 148404, "epoch": 1226} {"train_loss": -41.02301025390625, "global_step": 148405, "epoch": 1226} {"train_loss": -39.423553466796875, "global_step": 148406, "epoch": 1226} {"train_loss": -39.226016998291016, "global_step": 148407, "epoch": 1226} {"train_loss": -40.138832092285156, "global_step": 148408, "epoch": 1226} {"train_loss": -39.96355056762695, "global_step": 148409, "epoch": 1226} {"train_loss": -38.27022933959961, "global_step": 148410, "epoch": 1226} {"train_loss": -37.02095413208008, "global_step": 148411, "epoch": 1226} {"train_loss": -40.323486328125, "global_step": 148412, "epoch": 1226} {"train_loss": -39.40277099609375, "global_step": 148413, "epoch": 1226} {"train_loss": -39.29970169067383, "global_step": 148414, "epoch": 1226} {"train_loss": -39.591705322265625, "global_step": 148415, "epoch": 1226} {"train_loss": -40.069454193115234, "global_step": 148416, "epoch": 1226} {"train_loss": -39.4169921875, "global_step": 148417, "epoch": 1226} {"train_loss": -39.56056594848633, "global_step": 148418, "epoch": 1226} {"train_loss": -40.49920654296875, "global_step": 148419, "epoch": 1226} {"train_loss": -39.23236083984375, "global_step": 148420, "epoch": 1226} {"train_loss": -39.72909164428711, "global_step": 148421, "epoch": 1226} {"train_loss": -39.95686721801758, "global_step": 148422, "epoch": 1226} {"train_loss": -39.22443389892578, "global_step": 148423, "epoch": 1226} {"train_loss": -40.23286056518555, "global_step": 148424, "epoch": 1226} {"train_loss": -39.67399215698242, "global_step": 148425, "epoch": 1226} {"train_loss": -40.46168899536133, "global_step": 148426, "epoch": 1226} {"train_loss": -40.220802307128906, "global_step": 148427, "epoch": 1226} {"train_loss": -39.205230712890625, "global_step": 148428, "epoch": 1226} {"train_loss": -40.137081146240234, "global_step": 148429, "epoch": 1226} {"train_loss": -40.90359115600586, "global_step": 148430, "epoch": 1226} {"train_loss": -39.65298843383789, "global_step": 148431, "epoch": 1226} {"train_loss": -40.366004943847656, "global_step": 148432, "epoch": 1226} {"train_loss": -40.25330352783203, "global_step": 148433, "epoch": 1226} {"train_loss": -40.95431137084961, "global_step": 148434, "epoch": 1226} {"train_loss": -40.11613845825195, "global_step": 148435, "epoch": 1226} {"train_loss": -39.972312927246094, "global_step": 148436, "epoch": 1226} {"train_loss": -40.04120635986328, "global_step": 148437, "epoch": 1226} {"train_loss": -40.546443939208984, "global_step": 148438, "epoch": 1226} {"train_loss": -40.987884521484375, "global_step": 148439, "epoch": 1226} {"train_loss": -40.34054183959961, "global_step": 148440, "epoch": 1226} {"train_loss": -40.11235809326172, "global_step": 148441, "epoch": 1226} {"train_loss": -39.67311477661133, "global_step": 148442, "epoch": 1226} {"train_loss": -41.00818634033203, "global_step": 148443, "epoch": 1226} {"train_loss": -40.18268966674805, "global_step": 148444, "epoch": 1226} {"train_loss": -40.71253204345703, "global_step": 148445, "epoch": 1226} {"train_loss": -39.894683837890625, "global_step": 148446, "epoch": 1226} {"train_loss": -40.66633224487305, "global_step": 148447, "epoch": 1226} {"train_loss": -40.91614532470703, "global_step": 148448, "epoch": 1226} {"train_loss": -40.996856689453125, "global_step": 148449, "epoch": 1226} {"train_loss": -40.73960494995117, "global_step": 148450, "epoch": 1226} {"train_loss": -41.32879638671875, "global_step": 148451, "epoch": 1226} {"train_loss": -40.73830795288086, "global_step": 148452, "epoch": 1226} {"train_loss": -40.30250930786133, "global_step": 148453, "epoch": 1226} {"train_loss": -41.25152587890625, "global_step": 148454, "epoch": 1226} {"train_loss": -41.173702239990234, "global_step": 148455, "epoch": 1226} {"train_loss": -37.88017654418945, "global_step": 148456, "epoch": 1226} {"train_loss": -40.18196487426758, "global_step": 148457, "epoch": 1226} {"train_loss": -40.81988525390625, "global_step": 148458, "epoch": 1226} {"train_loss": -40.71206283569336, "global_step": 148459, "epoch": 1226} {"train_loss": -40.62575912475586, "global_step": 148460, "epoch": 1226} {"train_loss": -40.44859313964844, "global_step": 148461, "epoch": 1226} {"train_loss": -40.81684494018555, "global_step": 148462, "epoch": 1226} {"train_loss": -40.61771774291992, "global_step": 148463, "epoch": 1226} {"train_loss": -41.16743469238281, "global_step": 148464, "epoch": 1226} {"train_loss": -40.8255729675293, "global_step": 148465, "epoch": 1226} {"train_loss": -39.94755163271565, "global_step": 148466, "epoch": 1226, "val_loss": 2489655.75} {"train_loss": -40.74821472167969, "global_step": 148467, "epoch": 1227} {"train_loss": -39.86359786987305, "global_step": 148468, "epoch": 1227} {"train_loss": -40.899959564208984, "global_step": 148469, "epoch": 1227} {"train_loss": -40.40265655517578, "global_step": 148470, "epoch": 1227} {"train_loss": -40.077301025390625, "global_step": 148471, "epoch": 1227} {"train_loss": -39.624267578125, "global_step": 148472, "epoch": 1227} {"train_loss": -39.839195251464844, "global_step": 148473, "epoch": 1227} {"train_loss": -40.01482009887695, "global_step": 148474, "epoch": 1227} {"train_loss": -40.20147705078125, "global_step": 148475, "epoch": 1227} {"train_loss": -40.98443603515625, "global_step": 148476, "epoch": 1227} {"train_loss": -41.07159423828125, "global_step": 148477, "epoch": 1227} {"train_loss": -39.05326461791992, "global_step": 148478, "epoch": 1227} {"train_loss": -36.476985931396484, "global_step": 148479, "epoch": 1227} {"train_loss": -36.5283317565918, "global_step": 148480, "epoch": 1227} {"train_loss": -38.40645217895508, "global_step": 148481, "epoch": 1227} {"train_loss": -38.85769271850586, "global_step": 148482, "epoch": 1227} {"train_loss": -40.70562744140625, "global_step": 148483, "epoch": 1227} {"train_loss": -40.97953796386719, "global_step": 148484, "epoch": 1227} {"train_loss": -40.02732849121094, "global_step": 148485, "epoch": 1227} {"train_loss": -40.4690055847168, "global_step": 148486, "epoch": 1227} {"train_loss": -41.47832107543945, "global_step": 148487, "epoch": 1227} {"train_loss": -40.635955810546875, "global_step": 148488, "epoch": 1227} {"train_loss": -40.28450012207031, "global_step": 148489, "epoch": 1227} {"train_loss": -40.70643997192383, "global_step": 148490, "epoch": 1227} {"train_loss": -40.49339294433594, "global_step": 148491, "epoch": 1227} {"train_loss": -40.4205436706543, "global_step": 148492, "epoch": 1227} {"train_loss": -40.423133850097656, "global_step": 148493, "epoch": 1227} {"train_loss": -38.57887268066406, "global_step": 148494, "epoch": 1227} {"train_loss": -39.311580657958984, "global_step": 148495, "epoch": 1227} {"train_loss": -40.468257904052734, "global_step": 148496, "epoch": 1227} {"train_loss": -40.50643539428711, "global_step": 148497, "epoch": 1227} {"train_loss": -39.47897720336914, "global_step": 148498, "epoch": 1227} {"train_loss": -39.659393310546875, "global_step": 148499, "epoch": 1227} {"train_loss": -40.35258865356445, "global_step": 148500, "epoch": 1227} {"train_loss": -40.75003433227539, "global_step": 148501, "epoch": 1227} {"train_loss": -40.87925338745117, "global_step": 148502, "epoch": 1227} {"train_loss": -40.31309127807617, "global_step": 148503, "epoch": 1227} {"train_loss": -39.51372146606445, "global_step": 148504, "epoch": 1227} {"train_loss": -39.32981872558594, "global_step": 148505, "epoch": 1227} {"train_loss": -40.40953826904297, "global_step": 148506, "epoch": 1227} {"train_loss": -39.755775451660156, "global_step": 148507, "epoch": 1227} {"train_loss": -39.9929084777832, "global_step": 148508, "epoch": 1227} {"train_loss": -38.29890441894531, "global_step": 148509, "epoch": 1227} {"train_loss": -40.621395111083984, "global_step": 148510, "epoch": 1227} {"train_loss": -40.78643798828125, "global_step": 148511, "epoch": 1227} {"train_loss": -40.02768325805664, "global_step": 148512, "epoch": 1227} {"train_loss": -38.48566436767578, "global_step": 148513, "epoch": 1227} {"train_loss": -40.83566665649414, "global_step": 148514, "epoch": 1227} {"train_loss": -39.3797721862793, "global_step": 148515, "epoch": 1227} {"train_loss": -37.51249313354492, "global_step": 148516, "epoch": 1227} {"train_loss": -38.4016227722168, "global_step": 148517, "epoch": 1227} {"train_loss": -38.843509674072266, "global_step": 148518, "epoch": 1227} {"train_loss": -39.70107650756836, "global_step": 148519, "epoch": 1227} {"train_loss": -38.96631622314453, "global_step": 148520, "epoch": 1227} {"train_loss": -37.44628143310547, "global_step": 148521, "epoch": 1227} {"train_loss": -38.92441940307617, "global_step": 148522, "epoch": 1227} {"train_loss": -38.92267990112305, "global_step": 148523, "epoch": 1227} {"train_loss": -27.449949264526367, "global_step": 148524, "epoch": 1227} {"train_loss": -36.91231918334961, "global_step": 148525, "epoch": 1227} {"train_loss": -37.94968795776367, "global_step": 148526, "epoch": 1227} {"train_loss": -32.9680061340332, "global_step": 148527, "epoch": 1227} {"train_loss": -38.136539459228516, "global_step": 148528, "epoch": 1227} {"train_loss": -32.91652297973633, "global_step": 148529, "epoch": 1227} {"train_loss": -37.2174186706543, "global_step": 148530, "epoch": 1227} {"train_loss": -37.802947998046875, "global_step": 148531, "epoch": 1227} {"train_loss": -32.49724578857422, "global_step": 148532, "epoch": 1227} {"train_loss": -33.82816696166992, "global_step": 148533, "epoch": 1227} {"train_loss": -36.84048843383789, "global_step": 148534, "epoch": 1227} {"train_loss": -31.35348892211914, "global_step": 148535, "epoch": 1227} {"train_loss": -37.631134033203125, "global_step": 148536, "epoch": 1227} {"train_loss": -30.765567779541016, "global_step": 148537, "epoch": 1227} {"train_loss": -37.7148551940918, "global_step": 148538, "epoch": 1227} {"train_loss": -34.85598373413086, "global_step": 148539, "epoch": 1227} {"train_loss": -32.88936233520508, "global_step": 148540, "epoch": 1227} {"train_loss": -35.200687408447266, "global_step": 148541, "epoch": 1227} {"train_loss": -35.3376350402832, "global_step": 148542, "epoch": 1227} {"train_loss": -35.67800521850586, "global_step": 148543, "epoch": 1227} {"train_loss": -37.481231689453125, "global_step": 148544, "epoch": 1227} {"train_loss": -35.80823516845703, "global_step": 148545, "epoch": 1227} {"train_loss": -35.746734619140625, "global_step": 148546, "epoch": 1227} {"train_loss": -34.66221618652344, "global_step": 148547, "epoch": 1227} {"train_loss": -35.28084182739258, "global_step": 148548, "epoch": 1227} {"train_loss": -34.81826400756836, "global_step": 148549, "epoch": 1227} {"train_loss": -30.2696590423584, "global_step": 148550, "epoch": 1227} {"train_loss": -35.25916290283203, "global_step": 148551, "epoch": 1227} {"train_loss": -36.46552276611328, "global_step": 148552, "epoch": 1227} {"train_loss": -36.896297454833984, "global_step": 148553, "epoch": 1227} {"train_loss": -31.8673152923584, "global_step": 148554, "epoch": 1227} {"train_loss": -33.717529296875, "global_step": 148555, "epoch": 1227} {"train_loss": -32.92012405395508, "global_step": 148556, "epoch": 1227} {"train_loss": -36.28773880004883, "global_step": 148557, "epoch": 1227} {"train_loss": -36.98546600341797, "global_step": 148558, "epoch": 1227} {"train_loss": -35.716041564941406, "global_step": 148559, "epoch": 1227} {"train_loss": -37.638389587402344, "global_step": 148560, "epoch": 1227} {"train_loss": -37.193782806396484, "global_step": 148561, "epoch": 1227} {"train_loss": -35.966304779052734, "global_step": 148562, "epoch": 1227} {"train_loss": -35.85554885864258, "global_step": 148563, "epoch": 1227} {"train_loss": -35.57131576538086, "global_step": 148564, "epoch": 1227} {"train_loss": -37.53940963745117, "global_step": 148565, "epoch": 1227} {"train_loss": -36.83597946166992, "global_step": 148566, "epoch": 1227} {"train_loss": -34.58474349975586, "global_step": 148567, "epoch": 1227} {"train_loss": -38.107337951660156, "global_step": 148568, "epoch": 1227} {"train_loss": -36.124141693115234, "global_step": 148569, "epoch": 1227} {"train_loss": -35.94524383544922, "global_step": 148570, "epoch": 1227} {"train_loss": -37.016395568847656, "global_step": 148571, "epoch": 1227} {"train_loss": -36.82536697387695, "global_step": 148572, "epoch": 1227} {"train_loss": -36.3514289855957, "global_step": 148573, "epoch": 1227} {"train_loss": -37.62804412841797, "global_step": 148574, "epoch": 1227} {"train_loss": -37.076637268066406, "global_step": 148575, "epoch": 1227} {"train_loss": -37.98118591308594, "global_step": 148576, "epoch": 1227} {"train_loss": -35.53731155395508, "global_step": 148577, "epoch": 1227} {"train_loss": -38.09310531616211, "global_step": 148578, "epoch": 1227} {"train_loss": -31.632394790649414, "global_step": 148579, "epoch": 1227} {"train_loss": -38.427818298339844, "global_step": 148580, "epoch": 1227} {"train_loss": -37.18880081176758, "global_step": 148581, "epoch": 1227} {"train_loss": -37.72724151611328, "global_step": 148582, "epoch": 1227} {"train_loss": -37.8470458984375, "global_step": 148583, "epoch": 1227} {"train_loss": -37.8868408203125, "global_step": 148584, "epoch": 1227} {"train_loss": -32.018226623535156, "global_step": 148585, "epoch": 1227} {"train_loss": -36.7745475769043, "global_step": 148586, "epoch": 1227} {"train_loss": -37.580604963066165, "global_step": 148587, "epoch": 1227, "val_loss": 2565572.0} {"train_loss": -37.76963424682617, "global_step": 148588, "epoch": 1228} {"train_loss": -38.12360382080078, "global_step": 148589, "epoch": 1228} {"train_loss": -35.92220687866211, "global_step": 148590, "epoch": 1228} {"train_loss": -38.20259475708008, "global_step": 148591, "epoch": 1228} {"train_loss": -37.88035202026367, "global_step": 148592, "epoch": 1228} {"train_loss": -36.41898727416992, "global_step": 148593, "epoch": 1228} {"train_loss": -38.49714660644531, "global_step": 148594, "epoch": 1228} {"train_loss": -37.76786804199219, "global_step": 148595, "epoch": 1228} {"train_loss": -32.07986831665039, "global_step": 148596, "epoch": 1228} {"train_loss": -35.802120208740234, "global_step": 148597, "epoch": 1228} {"train_loss": -37.725685119628906, "global_step": 148598, "epoch": 1228} {"train_loss": -35.24351119995117, "global_step": 148599, "epoch": 1228} {"train_loss": -37.0223274230957, "global_step": 148600, "epoch": 1228} {"train_loss": -37.659881591796875, "global_step": 148601, "epoch": 1228} {"train_loss": -37.74106979370117, "global_step": 148602, "epoch": 1228} {"train_loss": -37.96527099609375, "global_step": 148603, "epoch": 1228} {"train_loss": -37.39073944091797, "global_step": 148604, "epoch": 1228} {"train_loss": -37.46530532836914, "global_step": 148605, "epoch": 1228} {"train_loss": -37.56986618041992, "global_step": 148606, "epoch": 1228} {"train_loss": -37.3789176940918, "global_step": 148607, "epoch": 1228} {"train_loss": -38.12995529174805, "global_step": 148608, "epoch": 1228} {"train_loss": -38.502838134765625, "global_step": 148609, "epoch": 1228} {"train_loss": -37.91278839111328, "global_step": 148610, "epoch": 1228} {"train_loss": -37.720306396484375, "global_step": 148611, "epoch": 1228} {"train_loss": -38.40871810913086, "global_step": 148612, "epoch": 1228} {"train_loss": -37.76237869262695, "global_step": 148613, "epoch": 1228} {"train_loss": -37.6169548034668, "global_step": 148614, "epoch": 1228} {"train_loss": -38.05304718017578, "global_step": 148615, "epoch": 1228} {"train_loss": -38.64068603515625, "global_step": 148616, "epoch": 1228} {"train_loss": -38.16286087036133, "global_step": 148617, "epoch": 1228} {"train_loss": -38.185604095458984, "global_step": 148618, "epoch": 1228} {"train_loss": -38.29359436035156, "global_step": 148619, "epoch": 1228} {"train_loss": -38.46944046020508, "global_step": 148620, "epoch": 1228} {"train_loss": -38.412811279296875, "global_step": 148621, "epoch": 1228} {"train_loss": -38.28236770629883, "global_step": 148622, "epoch": 1228} {"train_loss": -38.49016571044922, "global_step": 148623, "epoch": 1228} {"train_loss": -38.66645431518555, "global_step": 148624, "epoch": 1228} {"train_loss": -37.699951171875, "global_step": 148625, "epoch": 1228} {"train_loss": -38.747894287109375, "global_step": 148626, "epoch": 1228} {"train_loss": -38.37873458862305, "global_step": 148627, "epoch": 1228} {"train_loss": -39.378448486328125, "global_step": 148628, "epoch": 1228} {"train_loss": -39.086456298828125, "global_step": 148629, "epoch": 1228} {"train_loss": -39.648773193359375, "global_step": 148630, "epoch": 1228} {"train_loss": -39.13765335083008, "global_step": 148631, "epoch": 1228} {"train_loss": -38.95223617553711, "global_step": 148632, "epoch": 1228} {"train_loss": -39.31454849243164, "global_step": 148633, "epoch": 1228} {"train_loss": -39.15133285522461, "global_step": 148634, "epoch": 1228} {"train_loss": -39.42867660522461, "global_step": 148635, "epoch": 1228} {"train_loss": -39.37704086303711, "global_step": 148636, "epoch": 1228} {"train_loss": -39.35410690307617, "global_step": 148637, "epoch": 1228} {"train_loss": -39.13118362426758, "global_step": 148638, "epoch": 1228} {"train_loss": -38.913387298583984, "global_step": 148639, "epoch": 1228} {"train_loss": -39.3419189453125, "global_step": 148640, "epoch": 1228} {"train_loss": -39.54790115356445, "global_step": 148641, "epoch": 1228} {"train_loss": -39.49733352661133, "global_step": 148642, "epoch": 1228} {"train_loss": -39.135398864746094, "global_step": 148643, "epoch": 1228} {"train_loss": -39.862579345703125, "global_step": 148644, "epoch": 1228} {"train_loss": -39.54358673095703, "global_step": 148645, "epoch": 1228} {"train_loss": -39.15985107421875, "global_step": 148646, "epoch": 1228} {"train_loss": -39.710323333740234, "global_step": 148647, "epoch": 1228} {"train_loss": -39.72306442260742, "global_step": 148648, "epoch": 1228} {"train_loss": -39.81110763549805, "global_step": 148649, "epoch": 1228} {"train_loss": -39.79439926147461, "global_step": 148650, "epoch": 1228} {"train_loss": -40.04158401489258, "global_step": 148651, "epoch": 1228} {"train_loss": -39.52772903442383, "global_step": 148652, "epoch": 1228} {"train_loss": -39.46173095703125, "global_step": 148653, "epoch": 1228} {"train_loss": -39.2395133972168, "global_step": 148654, "epoch": 1228} {"train_loss": -39.42158508300781, "global_step": 148655, "epoch": 1228} {"train_loss": -40.04539108276367, "global_step": 148656, "epoch": 1228} {"train_loss": -40.0536003112793, "global_step": 148657, "epoch": 1228} {"train_loss": -40.17945861816406, "global_step": 148658, "epoch": 1228} {"train_loss": -40.0596923828125, "global_step": 148659, "epoch": 1228} {"train_loss": -40.48984909057617, "global_step": 148660, "epoch": 1228} {"train_loss": -40.273189544677734, "global_step": 148661, "epoch": 1228} {"train_loss": -40.13138961791992, "global_step": 148662, "epoch": 1228} {"train_loss": -40.19263458251953, "global_step": 148663, "epoch": 1228} {"train_loss": -40.11417007446289, "global_step": 148664, "epoch": 1228} {"train_loss": -40.504032135009766, "global_step": 148665, "epoch": 1228} {"train_loss": -40.3260383605957, "global_step": 148666, "epoch": 1228} {"train_loss": -40.15717697143555, "global_step": 148667, "epoch": 1228} {"train_loss": -40.3118782043457, "global_step": 148668, "epoch": 1228} {"train_loss": -40.33415603637695, "global_step": 148669, "epoch": 1228} {"train_loss": -39.23106002807617, "global_step": 148670, "epoch": 1228} {"train_loss": -39.956764221191406, "global_step": 148671, "epoch": 1228} {"train_loss": -39.84670639038086, "global_step": 148672, "epoch": 1228} {"train_loss": -40.66606140136719, "global_step": 148673, "epoch": 1228} {"train_loss": -40.519962310791016, "global_step": 148674, "epoch": 1228} {"train_loss": -40.445919036865234, "global_step": 148675, "epoch": 1228} {"train_loss": -40.15861892700195, "global_step": 148676, "epoch": 1228} {"train_loss": -39.61848449707031, "global_step": 148677, "epoch": 1228} {"train_loss": -40.442420959472656, "global_step": 148678, "epoch": 1228} {"train_loss": -40.53837203979492, "global_step": 148679, "epoch": 1228} {"train_loss": -40.03547286987305, "global_step": 148680, "epoch": 1228} {"train_loss": -39.692039489746094, "global_step": 148681, "epoch": 1228} {"train_loss": -40.3707160949707, "global_step": 148682, "epoch": 1228} {"train_loss": -40.73740005493164, "global_step": 148683, "epoch": 1228} {"train_loss": -39.98533248901367, "global_step": 148684, "epoch": 1228} {"train_loss": -40.59641647338867, "global_step": 148685, "epoch": 1228} {"train_loss": -40.46744918823242, "global_step": 148686, "epoch": 1228} {"train_loss": -40.68079376220703, "global_step": 148687, "epoch": 1228} {"train_loss": -40.23794937133789, "global_step": 148688, "epoch": 1228} {"train_loss": -40.2425651550293, "global_step": 148689, "epoch": 1228} {"train_loss": -39.79417419433594, "global_step": 148690, "epoch": 1228} {"train_loss": -40.71696090698242, "global_step": 148691, "epoch": 1228} {"train_loss": -40.6103630065918, "global_step": 148692, "epoch": 1228} {"train_loss": -40.45964813232422, "global_step": 148693, "epoch": 1228} {"train_loss": -40.63056564331055, "global_step": 148694, "epoch": 1228} {"train_loss": -40.27109909057617, "global_step": 148695, "epoch": 1228} {"train_loss": -40.085079193115234, "global_step": 148696, "epoch": 1228} {"train_loss": -40.08048629760742, "global_step": 148697, "epoch": 1228} {"train_loss": -40.0998420715332, "global_step": 148698, "epoch": 1228} {"train_loss": -40.29051971435547, "global_step": 148699, "epoch": 1228} {"train_loss": -39.11106491088867, "global_step": 148700, "epoch": 1228} {"train_loss": -39.0558967590332, "global_step": 148701, "epoch": 1228} {"train_loss": -36.82841873168945, "global_step": 148702, "epoch": 1228} {"train_loss": -36.9578742980957, "global_step": 148703, "epoch": 1228} {"train_loss": -36.6919059753418, "global_step": 148704, "epoch": 1228} {"train_loss": -36.2519645690918, "global_step": 148705, "epoch": 1228} {"train_loss": -35.99601364135742, "global_step": 148706, "epoch": 1228} {"train_loss": -37.489627838134766, "global_step": 148707, "epoch": 1228} {"train_loss": -39.00021595600223, "global_step": 148708, "epoch": 1228, "val_loss": 2635470.25} {"train_loss": -37.71677780151367, "global_step": 148709, "epoch": 1229} {"train_loss": -34.763065338134766, "global_step": 148710, "epoch": 1229} {"train_loss": -36.72285079956055, "global_step": 148711, "epoch": 1229} {"train_loss": -38.859371185302734, "global_step": 148712, "epoch": 1229} {"train_loss": -37.633522033691406, "global_step": 148713, "epoch": 1229} {"train_loss": -36.8215446472168, "global_step": 148714, "epoch": 1229} {"train_loss": -35.372806549072266, "global_step": 148715, "epoch": 1229} {"train_loss": -38.7215690612793, "global_step": 148716, "epoch": 1229} {"train_loss": -33.388301849365234, "global_step": 148717, "epoch": 1229} {"train_loss": -36.57440948486328, "global_step": 148718, "epoch": 1229} {"train_loss": -32.71962356567383, "global_step": 148719, "epoch": 1229} {"train_loss": -37.5734977722168, "global_step": 148720, "epoch": 1229} {"train_loss": -34.62067413330078, "global_step": 148721, "epoch": 1229} {"train_loss": -36.03460693359375, "global_step": 148722, "epoch": 1229} {"train_loss": -37.25539016723633, "global_step": 148723, "epoch": 1229} {"train_loss": -36.65269088745117, "global_step": 148724, "epoch": 1229} {"train_loss": -38.72534942626953, "global_step": 148725, "epoch": 1229} {"train_loss": -36.79501724243164, "global_step": 148726, "epoch": 1229} {"train_loss": -37.65433883666992, "global_step": 148727, "epoch": 1229} {"train_loss": -38.79995346069336, "global_step": 148728, "epoch": 1229} {"train_loss": -37.46364974975586, "global_step": 148729, "epoch": 1229} {"train_loss": -38.980712890625, "global_step": 148730, "epoch": 1229} {"train_loss": -37.303768157958984, "global_step": 148731, "epoch": 1229} {"train_loss": -37.647884368896484, "global_step": 148732, "epoch": 1229} {"train_loss": -38.90711975097656, "global_step": 148733, "epoch": 1229} {"train_loss": -38.212890625, "global_step": 148734, "epoch": 1229} {"train_loss": -38.99080276489258, "global_step": 148735, "epoch": 1229} {"train_loss": -38.145423889160156, "global_step": 148736, "epoch": 1229} {"train_loss": -37.88593673706055, "global_step": 148737, "epoch": 1229} {"train_loss": -39.35084915161133, "global_step": 148738, "epoch": 1229} {"train_loss": -39.195858001708984, "global_step": 148739, "epoch": 1229} {"train_loss": -39.27079391479492, "global_step": 148740, "epoch": 1229} {"train_loss": -39.579444885253906, "global_step": 148741, "epoch": 1229} {"train_loss": -39.06728744506836, "global_step": 148742, "epoch": 1229} {"train_loss": -39.226600646972656, "global_step": 148743, "epoch": 1229} {"train_loss": -39.79233932495117, "global_step": 148744, "epoch": 1229} {"train_loss": -39.61750030517578, "global_step": 148745, "epoch": 1229} {"train_loss": -39.90358352661133, "global_step": 148746, "epoch": 1229} {"train_loss": -39.89567947387695, "global_step": 148747, "epoch": 1229} {"train_loss": -40.145118713378906, "global_step": 148748, "epoch": 1229} {"train_loss": -40.05910873413086, "global_step": 148749, "epoch": 1229} {"train_loss": -39.88054275512695, "global_step": 148750, "epoch": 1229} {"train_loss": -40.19940185546875, "global_step": 148751, "epoch": 1229} {"train_loss": -40.21028518676758, "global_step": 148752, "epoch": 1229} {"train_loss": -39.972713470458984, "global_step": 148753, "epoch": 1229} {"train_loss": -40.43337631225586, "global_step": 148754, "epoch": 1229} {"train_loss": -40.59843063354492, "global_step": 148755, "epoch": 1229} {"train_loss": -40.106441497802734, "global_step": 148756, "epoch": 1229} {"train_loss": -40.69855880737305, "global_step": 148757, "epoch": 1229} {"train_loss": -40.06178665161133, "global_step": 148758, "epoch": 1229} {"train_loss": -39.952964782714844, "global_step": 148759, "epoch": 1229} {"train_loss": -39.95722579956055, "global_step": 148760, "epoch": 1229} {"train_loss": -40.53464889526367, "global_step": 148761, "epoch": 1229} {"train_loss": -40.581817626953125, "global_step": 148762, "epoch": 1229} {"train_loss": -40.54316329956055, "global_step": 148763, "epoch": 1229} {"train_loss": -40.59865951538086, "global_step": 148764, "epoch": 1229} {"train_loss": -40.884883880615234, "global_step": 148765, "epoch": 1229} {"train_loss": -40.254146575927734, "global_step": 148766, "epoch": 1229} {"train_loss": -40.287574768066406, "global_step": 148767, "epoch": 1229} {"train_loss": -40.85378646850586, "global_step": 148768, "epoch": 1229} {"train_loss": -40.47439193725586, "global_step": 148769, "epoch": 1229} {"train_loss": -40.888763427734375, "global_step": 148770, "epoch": 1229} {"train_loss": -40.26810836791992, "global_step": 148771, "epoch": 1229} {"train_loss": -40.15399169921875, "global_step": 148772, "epoch": 1229} {"train_loss": -40.9912223815918, "global_step": 148773, "epoch": 1229} {"train_loss": -40.768402099609375, "global_step": 148774, "epoch": 1229} {"train_loss": -40.56969451904297, "global_step": 148775, "epoch": 1229} {"train_loss": -40.29453659057617, "global_step": 148776, "epoch": 1229} {"train_loss": -40.750343322753906, "global_step": 148777, "epoch": 1229} {"train_loss": -40.188758850097656, "global_step": 148778, "epoch": 1229} {"train_loss": -39.9173698425293, "global_step": 148779, "epoch": 1229} {"train_loss": -40.851165771484375, "global_step": 148780, "epoch": 1229} {"train_loss": -40.20424270629883, "global_step": 148781, "epoch": 1229} {"train_loss": -40.54542922973633, "global_step": 148782, "epoch": 1229} {"train_loss": -40.70578384399414, "global_step": 148783, "epoch": 1229} {"train_loss": -40.56052780151367, "global_step": 148784, "epoch": 1229} {"train_loss": -41.34781265258789, "global_step": 148785, "epoch": 1229} {"train_loss": -40.72442626953125, "global_step": 148786, "epoch": 1229} {"train_loss": -40.786251068115234, "global_step": 148787, "epoch": 1229} {"train_loss": -40.62058639526367, "global_step": 148788, "epoch": 1229} {"train_loss": -41.21115493774414, "global_step": 148789, "epoch": 1229} {"train_loss": -40.557247161865234, "global_step": 148790, "epoch": 1229} {"train_loss": -40.76079177856445, "global_step": 148791, "epoch": 1229} {"train_loss": -41.059967041015625, "global_step": 148792, "epoch": 1229} {"train_loss": -40.594703674316406, "global_step": 148793, "epoch": 1229} {"train_loss": -41.001617431640625, "global_step": 148794, "epoch": 1229} {"train_loss": -40.86574935913086, "global_step": 148795, "epoch": 1229} {"train_loss": -41.1100959777832, "global_step": 148796, "epoch": 1229} {"train_loss": -40.50298309326172, "global_step": 148797, "epoch": 1229} {"train_loss": -39.08445358276367, "global_step": 148798, "epoch": 1229} {"train_loss": -40.75461959838867, "global_step": 148799, "epoch": 1229} {"train_loss": -39.974365234375, "global_step": 148800, "epoch": 1229} {"train_loss": -39.5681266784668, "global_step": 148801, "epoch": 1229} {"train_loss": -39.22139358520508, "global_step": 148802, "epoch": 1229} {"train_loss": -38.703399658203125, "global_step": 148803, "epoch": 1229} {"train_loss": -38.88399887084961, "global_step": 148804, "epoch": 1229} {"train_loss": -37.9655876159668, "global_step": 148805, "epoch": 1229} {"train_loss": -35.862525939941406, "global_step": 148806, "epoch": 1229} {"train_loss": -35.39265060424805, "global_step": 148807, "epoch": 1229} {"train_loss": -37.26211166381836, "global_step": 148808, "epoch": 1229} {"train_loss": -37.68745803833008, "global_step": 148809, "epoch": 1229} {"train_loss": -39.918399810791016, "global_step": 148810, "epoch": 1229} {"train_loss": -39.70004653930664, "global_step": 148811, "epoch": 1229} {"train_loss": -39.4517822265625, "global_step": 148812, "epoch": 1229} {"train_loss": -39.23826599121094, "global_step": 148813, "epoch": 1229} {"train_loss": -40.05660629272461, "global_step": 148814, "epoch": 1229} {"train_loss": -40.05141830444336, "global_step": 148815, "epoch": 1229} {"train_loss": -40.000850677490234, "global_step": 148816, "epoch": 1229} {"train_loss": -40.06367492675781, "global_step": 148817, "epoch": 1229} {"train_loss": -39.29781723022461, "global_step": 148818, "epoch": 1229} {"train_loss": -38.49542999267578, "global_step": 148819, "epoch": 1229} {"train_loss": -39.340938568115234, "global_step": 148820, "epoch": 1229} {"train_loss": -40.117950439453125, "global_step": 148821, "epoch": 1229} {"train_loss": -39.53567886352539, "global_step": 148822, "epoch": 1229} {"train_loss": -40.16980743408203, "global_step": 148823, "epoch": 1229} {"train_loss": -39.60630416870117, "global_step": 148824, "epoch": 1229} {"train_loss": -38.76400375366211, "global_step": 148825, "epoch": 1229} {"train_loss": -39.29291534423828, "global_step": 148826, "epoch": 1229} {"train_loss": -40.25444030761719, "global_step": 148827, "epoch": 1229} {"train_loss": -40.8710823059082, "global_step": 148828, "epoch": 1229} {"train_loss": -39.27893167290806, "global_step": 148829, "epoch": 1229, "val_loss": 2593627.25} {"train_loss": -40.16787338256836, "global_step": 148830, "epoch": 1230} {"train_loss": -40.2313117980957, "global_step": 148831, "epoch": 1230} {"train_loss": -37.85078048706055, "global_step": 148832, "epoch": 1230} {"train_loss": -40.58697509765625, "global_step": 148833, "epoch": 1230} {"train_loss": -40.01304626464844, "global_step": 148834, "epoch": 1230} {"train_loss": -39.74174118041992, "global_step": 148835, "epoch": 1230} {"train_loss": -39.878963470458984, "global_step": 148836, "epoch": 1230} {"train_loss": -40.40104293823242, "global_step": 148837, "epoch": 1230} {"train_loss": -36.67649841308594, "global_step": 148838, "epoch": 1230} {"train_loss": -40.0969352722168, "global_step": 148839, "epoch": 1230} {"train_loss": -40.986541748046875, "global_step": 148840, "epoch": 1230} {"train_loss": -39.67904281616211, "global_step": 148841, "epoch": 1230} {"train_loss": -41.0773811340332, "global_step": 148842, "epoch": 1230} {"train_loss": -40.704402923583984, "global_step": 148843, "epoch": 1230} {"train_loss": -40.45616149902344, "global_step": 148844, "epoch": 1230} {"train_loss": -39.795867919921875, "global_step": 148845, "epoch": 1230} {"train_loss": -40.39246368408203, "global_step": 148846, "epoch": 1230} {"train_loss": -40.83913040161133, "global_step": 148847, "epoch": 1230} {"train_loss": -40.209590911865234, "global_step": 148848, "epoch": 1230} {"train_loss": -40.7801513671875, "global_step": 148849, "epoch": 1230} {"train_loss": -40.458797454833984, "global_step": 148850, "epoch": 1230} {"train_loss": -39.634132385253906, "global_step": 148851, "epoch": 1230} {"train_loss": -40.29526901245117, "global_step": 148852, "epoch": 1230} {"train_loss": -40.76803207397461, "global_step": 148853, "epoch": 1230} {"train_loss": -39.487640380859375, "global_step": 148854, "epoch": 1230} {"train_loss": -39.288047790527344, "global_step": 148855, "epoch": 1230} {"train_loss": -39.39210891723633, "global_step": 148856, "epoch": 1230} {"train_loss": -41.0679931640625, "global_step": 148857, "epoch": 1230} {"train_loss": -39.499244689941406, "global_step": 148858, "epoch": 1230} {"train_loss": -40.4765739440918, "global_step": 148859, "epoch": 1230} {"train_loss": -39.55770492553711, "global_step": 148860, "epoch": 1230} {"train_loss": -39.672637939453125, "global_step": 148861, "epoch": 1230} {"train_loss": -41.08747482299805, "global_step": 148862, "epoch": 1230} {"train_loss": -40.7238655090332, "global_step": 148863, "epoch": 1230} {"train_loss": -39.55217361450195, "global_step": 148864, "epoch": 1230} {"train_loss": -39.53770065307617, "global_step": 148865, "epoch": 1230} {"train_loss": -40.8177490234375, "global_step": 148866, "epoch": 1230} {"train_loss": -40.9038200378418, "global_step": 148867, "epoch": 1230} {"train_loss": -40.249671936035156, "global_step": 148868, "epoch": 1230} {"train_loss": -40.34539031982422, "global_step": 148869, "epoch": 1230} {"train_loss": -39.294918060302734, "global_step": 148870, "epoch": 1230} {"train_loss": -38.9589729309082, "global_step": 148871, "epoch": 1230} {"train_loss": -39.930885314941406, "global_step": 148872, "epoch": 1230} {"train_loss": -40.72031784057617, "global_step": 148873, "epoch": 1230} {"train_loss": -41.09967041015625, "global_step": 148874, "epoch": 1230} {"train_loss": -39.83484649658203, "global_step": 148875, "epoch": 1230} {"train_loss": -39.38021469116211, "global_step": 148876, "epoch": 1230} {"train_loss": -38.7148551940918, "global_step": 148877, "epoch": 1230} {"train_loss": -39.600399017333984, "global_step": 148878, "epoch": 1230} {"train_loss": -40.584938049316406, "global_step": 148879, "epoch": 1230} {"train_loss": -40.42853927612305, "global_step": 148880, "epoch": 1230} {"train_loss": -39.98329544067383, "global_step": 148881, "epoch": 1230} {"train_loss": -40.915191650390625, "global_step": 148882, "epoch": 1230} {"train_loss": -40.49810791015625, "global_step": 148883, "epoch": 1230} {"train_loss": -40.5104866027832, "global_step": 148884, "epoch": 1230} {"train_loss": -40.50579071044922, "global_step": 148885, "epoch": 1230} {"train_loss": -40.56301498413086, "global_step": 148886, "epoch": 1230} {"train_loss": -40.20583724975586, "global_step": 148887, "epoch": 1230} {"train_loss": -40.69514846801758, "global_step": 148888, "epoch": 1230} {"train_loss": -36.49473190307617, "global_step": 148889, "epoch": 1230} {"train_loss": -39.6289176940918, "global_step": 148890, "epoch": 1230} {"train_loss": -40.39011764526367, "global_step": 148891, "epoch": 1230} {"train_loss": -40.670284271240234, "global_step": 148892, "epoch": 1230} {"train_loss": -40.56699752807617, "global_step": 148893, "epoch": 1230} {"train_loss": -38.88318634033203, "global_step": 148894, "epoch": 1230} {"train_loss": -40.09199142456055, "global_step": 148895, "epoch": 1230} {"train_loss": -40.07551193237305, "global_step": 148896, "epoch": 1230} {"train_loss": -40.27497100830078, "global_step": 148897, "epoch": 1230} {"train_loss": -39.90873718261719, "global_step": 148898, "epoch": 1230} {"train_loss": -39.68440628051758, "global_step": 148899, "epoch": 1230} {"train_loss": -38.574806213378906, "global_step": 148900, "epoch": 1230} {"train_loss": -37.78955078125, "global_step": 148901, "epoch": 1230} {"train_loss": -37.180816650390625, "global_step": 148902, "epoch": 1230} {"train_loss": -39.98821258544922, "global_step": 148903, "epoch": 1230} {"train_loss": -36.88962936401367, "global_step": 148904, "epoch": 1230} {"train_loss": -33.33585739135742, "global_step": 148905, "epoch": 1230} {"train_loss": -33.18115234375, "global_step": 148906, "epoch": 1230} {"train_loss": -37.98635482788086, "global_step": 148907, "epoch": 1230} {"train_loss": -37.787635803222656, "global_step": 148908, "epoch": 1230} {"train_loss": -35.24649429321289, "global_step": 148909, "epoch": 1230} {"train_loss": -36.34174728393555, "global_step": 148910, "epoch": 1230} {"train_loss": -38.32695388793945, "global_step": 148911, "epoch": 1230} {"train_loss": -38.1485595703125, "global_step": 148912, "epoch": 1230} {"train_loss": -38.02412414550781, "global_step": 148913, "epoch": 1230} {"train_loss": -39.10028076171875, "global_step": 148914, "epoch": 1230} {"train_loss": -37.569000244140625, "global_step": 148915, "epoch": 1230} {"train_loss": -38.42320251464844, "global_step": 148916, "epoch": 1230} {"train_loss": -39.12013626098633, "global_step": 148917, "epoch": 1230} {"train_loss": -36.833431243896484, "global_step": 148918, "epoch": 1230} {"train_loss": -37.952232360839844, "global_step": 148919, "epoch": 1230} {"train_loss": -34.46002960205078, "global_step": 148920, "epoch": 1230} {"train_loss": -38.1859245300293, "global_step": 148921, "epoch": 1230} {"train_loss": -36.51681900024414, "global_step": 148922, "epoch": 1230} {"train_loss": -38.32777786254883, "global_step": 148923, "epoch": 1230} {"train_loss": -37.859100341796875, "global_step": 148924, "epoch": 1230} {"train_loss": -39.772613525390625, "global_step": 148925, "epoch": 1230} {"train_loss": -38.46537399291992, "global_step": 148926, "epoch": 1230} {"train_loss": -39.649078369140625, "global_step": 148927, "epoch": 1230} {"train_loss": -39.18446350097656, "global_step": 148928, "epoch": 1230} {"train_loss": -39.710758209228516, "global_step": 148929, "epoch": 1230} {"train_loss": -39.38271713256836, "global_step": 148930, "epoch": 1230} {"train_loss": -39.25315475463867, "global_step": 148931, "epoch": 1230} {"train_loss": -39.92800521850586, "global_step": 148932, "epoch": 1230} {"train_loss": -38.96387481689453, "global_step": 148933, "epoch": 1230} {"train_loss": -39.52366256713867, "global_step": 148934, "epoch": 1230} {"train_loss": -39.64011764526367, "global_step": 148935, "epoch": 1230} {"train_loss": -40.78475570678711, "global_step": 148936, "epoch": 1230} {"train_loss": -39.37212371826172, "global_step": 148937, "epoch": 1230} {"train_loss": -40.555233001708984, "global_step": 148938, "epoch": 1230} {"train_loss": -40.44431686401367, "global_step": 148939, "epoch": 1230} {"train_loss": -39.48579025268555, "global_step": 148940, "epoch": 1230} {"train_loss": -40.064483642578125, "global_step": 148941, "epoch": 1230} {"train_loss": -40.37136459350586, "global_step": 148942, "epoch": 1230} {"train_loss": -40.525089263916016, "global_step": 148943, "epoch": 1230} {"train_loss": -39.73686599731445, "global_step": 148944, "epoch": 1230} {"train_loss": -41.07627487182617, "global_step": 148945, "epoch": 1230} {"train_loss": -39.80644607543945, "global_step": 148946, "epoch": 1230} {"train_loss": -40.626007080078125, "global_step": 148947, "epoch": 1230} {"train_loss": -40.61868667602539, "global_step": 148948, "epoch": 1230} {"train_loss": -40.38814163208008, "global_step": 148949, "epoch": 1230} {"train_loss": -39.43346411334581, "global_step": 148950, "epoch": 1230, "val_loss": 2429499.75} {"train_loss": -40.270626068115234, "global_step": 148951, "epoch": 1231} {"train_loss": -40.300716400146484, "global_step": 148952, "epoch": 1231} {"train_loss": -40.503684997558594, "global_step": 148953, "epoch": 1231} {"train_loss": -40.76445007324219, "global_step": 148954, "epoch": 1231} {"train_loss": -40.673744201660156, "global_step": 148955, "epoch": 1231} {"train_loss": -40.78529357910156, "global_step": 148956, "epoch": 1231} {"train_loss": -40.555389404296875, "global_step": 148957, "epoch": 1231} {"train_loss": -40.88663864135742, "global_step": 148958, "epoch": 1231} {"train_loss": -40.84500503540039, "global_step": 148959, "epoch": 1231} {"train_loss": -40.11140823364258, "global_step": 148960, "epoch": 1231} {"train_loss": -41.238250732421875, "global_step": 148961, "epoch": 1231} {"train_loss": -40.79583740234375, "global_step": 148962, "epoch": 1231} {"train_loss": -40.72884750366211, "global_step": 148963, "epoch": 1231} {"train_loss": -40.641510009765625, "global_step": 148964, "epoch": 1231} {"train_loss": -40.882080078125, "global_step": 148965, "epoch": 1231} {"train_loss": -40.65330505371094, "global_step": 148966, "epoch": 1231} {"train_loss": -40.94770050048828, "global_step": 148967, "epoch": 1231} {"train_loss": -40.94538116455078, "global_step": 148968, "epoch": 1231} {"train_loss": -40.7323112487793, "global_step": 148969, "epoch": 1231} {"train_loss": -40.218040466308594, "global_step": 148970, "epoch": 1231} {"train_loss": -41.0280876159668, "global_step": 148971, "epoch": 1231} {"train_loss": -41.20005798339844, "global_step": 148972, "epoch": 1231} {"train_loss": -40.799129486083984, "global_step": 148973, "epoch": 1231} {"train_loss": -40.98503494262695, "global_step": 148974, "epoch": 1231} {"train_loss": -40.719146728515625, "global_step": 148975, "epoch": 1231} {"train_loss": -36.07126998901367, "global_step": 148976, "epoch": 1231} {"train_loss": -40.742919921875, "global_step": 148977, "epoch": 1231} {"train_loss": -39.26471710205078, "global_step": 148978, "epoch": 1231} {"train_loss": -40.59286117553711, "global_step": 148979, "epoch": 1231} {"train_loss": -40.47893524169922, "global_step": 148980, "epoch": 1231} {"train_loss": -40.35749435424805, "global_step": 148981, "epoch": 1231} {"train_loss": -37.71668243408203, "global_step": 148982, "epoch": 1231} {"train_loss": -40.64256286621094, "global_step": 148983, "epoch": 1231} {"train_loss": -40.82139205932617, "global_step": 148984, "epoch": 1231} {"train_loss": -39.78217315673828, "global_step": 148985, "epoch": 1231} {"train_loss": -38.20956039428711, "global_step": 148986, "epoch": 1231} {"train_loss": -39.69051742553711, "global_step": 148987, "epoch": 1231} {"train_loss": -31.464696884155273, "global_step": 148988, "epoch": 1231} {"train_loss": -37.30315399169922, "global_step": 148989, "epoch": 1231} {"train_loss": -37.73906326293945, "global_step": 148990, "epoch": 1231} {"train_loss": -38.38456726074219, "global_step": 148991, "epoch": 1231} {"train_loss": -39.54294967651367, "global_step": 148992, "epoch": 1231} {"train_loss": -39.24267578125, "global_step": 148993, "epoch": 1231} {"train_loss": -35.803802490234375, "global_step": 148994, "epoch": 1231} {"train_loss": -34.66947555541992, "global_step": 148995, "epoch": 1231} {"train_loss": -39.098567962646484, "global_step": 148996, "epoch": 1231} {"train_loss": -39.43225860595703, "global_step": 148997, "epoch": 1231} {"train_loss": -37.791507720947266, "global_step": 148998, "epoch": 1231} {"train_loss": -39.65159225463867, "global_step": 148999, "epoch": 1231} {"train_loss": -39.84711456298828, "global_step": 149000, "epoch": 1231} {"train_loss": -39.52286911010742, "global_step": 149001, "epoch": 1231} {"train_loss": -39.02732467651367, "global_step": 149002, "epoch": 1231} {"train_loss": -38.69044494628906, "global_step": 149003, "epoch": 1231} {"train_loss": -40.224082946777344, "global_step": 149004, "epoch": 1231} {"train_loss": -39.617462158203125, "global_step": 149005, "epoch": 1231} {"train_loss": -39.51431655883789, "global_step": 149006, "epoch": 1231} {"train_loss": -38.246150970458984, "global_step": 149007, "epoch": 1231} {"train_loss": -40.232330322265625, "global_step": 149008, "epoch": 1231} {"train_loss": -40.101341247558594, "global_step": 149009, "epoch": 1231} {"train_loss": -39.91355514526367, "global_step": 149010, "epoch": 1231} {"train_loss": -40.148799896240234, "global_step": 149011, "epoch": 1231} {"train_loss": -39.78973388671875, "global_step": 149012, "epoch": 1231} {"train_loss": -40.481082916259766, "global_step": 149013, "epoch": 1231} {"train_loss": -40.0023307800293, "global_step": 149014, "epoch": 1231} {"train_loss": -40.105987548828125, "global_step": 149015, "epoch": 1231} {"train_loss": -41.06112289428711, "global_step": 149016, "epoch": 1231} {"train_loss": -38.1521110534668, "global_step": 149017, "epoch": 1231} {"train_loss": -37.71997833251953, "global_step": 149018, "epoch": 1231} {"train_loss": -39.69297409057617, "global_step": 149019, "epoch": 1231} {"train_loss": -36.73335647583008, "global_step": 149020, "epoch": 1231} {"train_loss": -39.722076416015625, "global_step": 149021, "epoch": 1231} {"train_loss": -38.29067611694336, "global_step": 149022, "epoch": 1231} {"train_loss": -39.29499053955078, "global_step": 149023, "epoch": 1231} {"train_loss": -38.98650360107422, "global_step": 149024, "epoch": 1231} {"train_loss": -38.845191955566406, "global_step": 149025, "epoch": 1231} {"train_loss": -39.644309997558594, "global_step": 149026, "epoch": 1231} {"train_loss": -39.8426628112793, "global_step": 149027, "epoch": 1231} {"train_loss": -40.17057418823242, "global_step": 149028, "epoch": 1231} {"train_loss": -39.8532829284668, "global_step": 149029, "epoch": 1231} {"train_loss": -39.359031677246094, "global_step": 149030, "epoch": 1231} {"train_loss": -40.63671875, "global_step": 149031, "epoch": 1231} {"train_loss": -39.90531539916992, "global_step": 149032, "epoch": 1231} {"train_loss": -40.5982666015625, "global_step": 149033, "epoch": 1231} {"train_loss": -39.688899993896484, "global_step": 149034, "epoch": 1231} {"train_loss": -40.76264572143555, "global_step": 149035, "epoch": 1231} {"train_loss": -39.71427917480469, "global_step": 149036, "epoch": 1231} {"train_loss": -40.41379928588867, "global_step": 149037, "epoch": 1231} {"train_loss": -40.724361419677734, "global_step": 149038, "epoch": 1231} {"train_loss": -40.85693359375, "global_step": 149039, "epoch": 1231} {"train_loss": -40.925323486328125, "global_step": 149040, "epoch": 1231} {"train_loss": -39.751075744628906, "global_step": 149041, "epoch": 1231} {"train_loss": -40.76887130737305, "global_step": 149042, "epoch": 1231} {"train_loss": -39.84752655029297, "global_step": 149043, "epoch": 1231} {"train_loss": -40.15894317626953, "global_step": 149044, "epoch": 1231} {"train_loss": -40.395076751708984, "global_step": 149045, "epoch": 1231} {"train_loss": -41.15264892578125, "global_step": 149046, "epoch": 1231} {"train_loss": -40.76491928100586, "global_step": 149047, "epoch": 1231} {"train_loss": -39.863670349121094, "global_step": 149048, "epoch": 1231} {"train_loss": -40.37349319458008, "global_step": 149049, "epoch": 1231} {"train_loss": -39.76853942871094, "global_step": 149050, "epoch": 1231} {"train_loss": -40.909053802490234, "global_step": 149051, "epoch": 1231} {"train_loss": -40.67008590698242, "global_step": 149052, "epoch": 1231} {"train_loss": -40.523956298828125, "global_step": 149053, "epoch": 1231} {"train_loss": -40.3851203918457, "global_step": 149054, "epoch": 1231} {"train_loss": -40.648338317871094, "global_step": 149055, "epoch": 1231} {"train_loss": -40.25092697143555, "global_step": 149056, "epoch": 1231} {"train_loss": -40.606040954589844, "global_step": 149057, "epoch": 1231} {"train_loss": -40.31697082519531, "global_step": 149058, "epoch": 1231} {"train_loss": -40.51976013183594, "global_step": 149059, "epoch": 1231} {"train_loss": -40.726280212402344, "global_step": 149060, "epoch": 1231} {"train_loss": -41.008148193359375, "global_step": 149061, "epoch": 1231} {"train_loss": -40.35157012939453, "global_step": 149062, "epoch": 1231} {"train_loss": -40.51231002807617, "global_step": 149063, "epoch": 1231} {"train_loss": -40.896053314208984, "global_step": 149064, "epoch": 1231} {"train_loss": -40.5286865234375, "global_step": 149065, "epoch": 1231} {"train_loss": -40.29782485961914, "global_step": 149066, "epoch": 1231} {"train_loss": -40.69219970703125, "global_step": 149067, "epoch": 1231} {"train_loss": -40.292755126953125, "global_step": 149068, "epoch": 1231} {"train_loss": -40.47590255737305, "global_step": 149069, "epoch": 1231} {"train_loss": -41.20685577392578, "global_step": 149070, "epoch": 1231} {"train_loss": -39.88262051984298, "global_step": 149071, "epoch": 1231, "val_loss": 2743384.25} {"train_loss": -39.666316986083984, "global_step": 149072, "epoch": 1232} {"train_loss": -39.90478515625, "global_step": 149073, "epoch": 1232} {"train_loss": -41.238739013671875, "global_step": 149074, "epoch": 1232} {"train_loss": -40.451988220214844, "global_step": 149075, "epoch": 1232} {"train_loss": -41.20636749267578, "global_step": 149076, "epoch": 1232} {"train_loss": -41.583343505859375, "global_step": 149077, "epoch": 1232} {"train_loss": -41.31313705444336, "global_step": 149078, "epoch": 1232} {"train_loss": -40.595088958740234, "global_step": 149079, "epoch": 1232} {"train_loss": -40.380489349365234, "global_step": 149080, "epoch": 1232} {"train_loss": -41.17793655395508, "global_step": 149081, "epoch": 1232} {"train_loss": -41.07381820678711, "global_step": 149082, "epoch": 1232} {"train_loss": -40.86265182495117, "global_step": 149083, "epoch": 1232} {"train_loss": -41.445709228515625, "global_step": 149084, "epoch": 1232} {"train_loss": -41.40250778198242, "global_step": 149085, "epoch": 1232} {"train_loss": -40.3768196105957, "global_step": 149086, "epoch": 1232} {"train_loss": -40.24177932739258, "global_step": 149087, "epoch": 1232} {"train_loss": -40.39746856689453, "global_step": 149088, "epoch": 1232} {"train_loss": -41.11140823364258, "global_step": 149089, "epoch": 1232} {"train_loss": -40.04605484008789, "global_step": 149090, "epoch": 1232} {"train_loss": -40.74468231201172, "global_step": 149091, "epoch": 1232} {"train_loss": -40.10163497924805, "global_step": 149092, "epoch": 1232} {"train_loss": -41.083160400390625, "global_step": 149093, "epoch": 1232} {"train_loss": -41.223934173583984, "global_step": 149094, "epoch": 1232} {"train_loss": -40.026100158691406, "global_step": 149095, "epoch": 1232} {"train_loss": -40.862491607666016, "global_step": 149096, "epoch": 1232} {"train_loss": -41.17665481567383, "global_step": 149097, "epoch": 1232} {"train_loss": -40.88214874267578, "global_step": 149098, "epoch": 1232} {"train_loss": -40.554134368896484, "global_step": 149099, "epoch": 1232} {"train_loss": -40.62040328979492, "global_step": 149100, "epoch": 1232} {"train_loss": -40.251434326171875, "global_step": 149101, "epoch": 1232} {"train_loss": -41.10735321044922, "global_step": 149102, "epoch": 1232} {"train_loss": -41.03856658935547, "global_step": 149103, "epoch": 1232} {"train_loss": -40.8088493347168, "global_step": 149104, "epoch": 1232} {"train_loss": -40.93494415283203, "global_step": 149105, "epoch": 1232} {"train_loss": -40.680763244628906, "global_step": 149106, "epoch": 1232} {"train_loss": -40.37101364135742, "global_step": 149107, "epoch": 1232} {"train_loss": -40.01017379760742, "global_step": 149108, "epoch": 1232} {"train_loss": -40.161434173583984, "global_step": 149109, "epoch": 1232} {"train_loss": -40.001129150390625, "global_step": 149110, "epoch": 1232} {"train_loss": -37.89889907836914, "global_step": 149111, "epoch": 1232} {"train_loss": -38.20026779174805, "global_step": 149112, "epoch": 1232} {"train_loss": -37.16554641723633, "global_step": 149113, "epoch": 1232} {"train_loss": -38.03513717651367, "global_step": 149114, "epoch": 1232} {"train_loss": -37.0897102355957, "global_step": 149115, "epoch": 1232} {"train_loss": -38.998443603515625, "global_step": 149116, "epoch": 1232} {"train_loss": -39.791481018066406, "global_step": 149117, "epoch": 1232} {"train_loss": -40.59493637084961, "global_step": 149118, "epoch": 1232} {"train_loss": -37.46208572387695, "global_step": 149119, "epoch": 1232} {"train_loss": -37.70652389526367, "global_step": 149120, "epoch": 1232} {"train_loss": -36.2177848815918, "global_step": 149121, "epoch": 1232} {"train_loss": -35.3892707824707, "global_step": 149122, "epoch": 1232} {"train_loss": -39.359954833984375, "global_step": 149123, "epoch": 1232} {"train_loss": -37.984371185302734, "global_step": 149124, "epoch": 1232} {"train_loss": -34.36062240600586, "global_step": 149125, "epoch": 1232} {"train_loss": -38.09746170043945, "global_step": 149126, "epoch": 1232} {"train_loss": -36.95955276489258, "global_step": 149127, "epoch": 1232} {"train_loss": -37.58083724975586, "global_step": 149128, "epoch": 1232} {"train_loss": -37.72343063354492, "global_step": 149129, "epoch": 1232} {"train_loss": -38.330875396728516, "global_step": 149130, "epoch": 1232} {"train_loss": -38.720829010009766, "global_step": 149131, "epoch": 1232} {"train_loss": -37.346923828125, "global_step": 149132, "epoch": 1232} {"train_loss": -38.256412506103516, "global_step": 149133, "epoch": 1232} {"train_loss": -38.286190032958984, "global_step": 149134, "epoch": 1232} {"train_loss": -39.9891471862793, "global_step": 149135, "epoch": 1232} {"train_loss": -38.0684928894043, "global_step": 149136, "epoch": 1232} {"train_loss": -36.49862289428711, "global_step": 149137, "epoch": 1232} {"train_loss": -39.82337188720703, "global_step": 149138, "epoch": 1232} {"train_loss": -38.550537109375, "global_step": 149139, "epoch": 1232} {"train_loss": -38.4802360534668, "global_step": 149140, "epoch": 1232} {"train_loss": -39.708282470703125, "global_step": 149141, "epoch": 1232} {"train_loss": -38.3336181640625, "global_step": 149142, "epoch": 1232} {"train_loss": -40.48093032836914, "global_step": 149143, "epoch": 1232} {"train_loss": -40.117366790771484, "global_step": 149144, "epoch": 1232} {"train_loss": -38.91880416870117, "global_step": 149145, "epoch": 1232} {"train_loss": -40.320838928222656, "global_step": 149146, "epoch": 1232} {"train_loss": -40.0706787109375, "global_step": 149147, "epoch": 1232} {"train_loss": -39.93992233276367, "global_step": 149148, "epoch": 1232} {"train_loss": -40.11272048950195, "global_step": 149149, "epoch": 1232} {"train_loss": -40.544795989990234, "global_step": 149150, "epoch": 1232} {"train_loss": -40.323081970214844, "global_step": 149151, "epoch": 1232} {"train_loss": -39.98207473754883, "global_step": 149152, "epoch": 1232} {"train_loss": -40.92963409423828, "global_step": 149153, "epoch": 1232} {"train_loss": -39.997310638427734, "global_step": 149154, "epoch": 1232} {"train_loss": -39.860774993896484, "global_step": 149155, "epoch": 1232} {"train_loss": -41.17702865600586, "global_step": 149156, "epoch": 1232} {"train_loss": -39.88420867919922, "global_step": 149157, "epoch": 1232} {"train_loss": -40.66471481323242, "global_step": 149158, "epoch": 1232} {"train_loss": -40.650230407714844, "global_step": 149159, "epoch": 1232} {"train_loss": -40.42934799194336, "global_step": 149160, "epoch": 1232} {"train_loss": -40.65853500366211, "global_step": 149161, "epoch": 1232} {"train_loss": -40.42848587036133, "global_step": 149162, "epoch": 1232} {"train_loss": -40.57746887207031, "global_step": 149163, "epoch": 1232} {"train_loss": -40.7092170715332, "global_step": 149164, "epoch": 1232} {"train_loss": -40.745399475097656, "global_step": 149165, "epoch": 1232} {"train_loss": -40.37457275390625, "global_step": 149166, "epoch": 1232} {"train_loss": -40.84906768798828, "global_step": 149167, "epoch": 1232} {"train_loss": -40.65285110473633, "global_step": 149168, "epoch": 1232} {"train_loss": -39.991851806640625, "global_step": 149169, "epoch": 1232} {"train_loss": -40.5236701965332, "global_step": 149170, "epoch": 1232} {"train_loss": -41.35859298706055, "global_step": 149171, "epoch": 1232} {"train_loss": -41.03751754760742, "global_step": 149172, "epoch": 1232} {"train_loss": -40.469207763671875, "global_step": 149173, "epoch": 1232} {"train_loss": -40.45003128051758, "global_step": 149174, "epoch": 1232} {"train_loss": -40.8543815612793, "global_step": 149175, "epoch": 1232} {"train_loss": -40.1506462097168, "global_step": 149176, "epoch": 1232} {"train_loss": -40.361690521240234, "global_step": 149177, "epoch": 1232} {"train_loss": -41.18996810913086, "global_step": 149178, "epoch": 1232} {"train_loss": -40.54482650756836, "global_step": 149179, "epoch": 1232} {"train_loss": -40.89541244506836, "global_step": 149180, "epoch": 1232} {"train_loss": -41.0179557800293, "global_step": 149181, "epoch": 1232} {"train_loss": -40.6798095703125, "global_step": 149182, "epoch": 1232} {"train_loss": -40.5880012512207, "global_step": 149183, "epoch": 1232} {"train_loss": -40.81404495239258, "global_step": 149184, "epoch": 1232} {"train_loss": -40.98786163330078, "global_step": 149185, "epoch": 1232} {"train_loss": -41.337791442871094, "global_step": 149186, "epoch": 1232} {"train_loss": -41.01288986206055, "global_step": 149187, "epoch": 1232} {"train_loss": -40.900142669677734, "global_step": 149188, "epoch": 1232} {"train_loss": -41.11726760864258, "global_step": 149189, "epoch": 1232} {"train_loss": -40.69191360473633, "global_step": 149190, "epoch": 1232} {"train_loss": -40.55239486694336, "global_step": 149191, "epoch": 1232} {"train_loss": -39.93465108319747, "global_step": 149192, "epoch": 1232, "val_loss": 2628938.75} {"train_loss": -41.2812385559082, "global_step": 149193, "epoch": 1233} {"train_loss": -41.064327239990234, "global_step": 149194, "epoch": 1233} {"train_loss": -40.67654037475586, "global_step": 149195, "epoch": 1233} {"train_loss": -39.51084518432617, "global_step": 149196, "epoch": 1233} {"train_loss": -40.17530822753906, "global_step": 149197, "epoch": 1233} {"train_loss": -39.86533737182617, "global_step": 149198, "epoch": 1233} {"train_loss": -39.45716094970703, "global_step": 149199, "epoch": 1233} {"train_loss": -40.353607177734375, "global_step": 149200, "epoch": 1233} {"train_loss": -40.81726837158203, "global_step": 149201, "epoch": 1233} {"train_loss": -40.88106155395508, "global_step": 149202, "epoch": 1233} {"train_loss": -41.2119255065918, "global_step": 149203, "epoch": 1233} {"train_loss": -40.497432708740234, "global_step": 149204, "epoch": 1233} {"train_loss": -40.058929443359375, "global_step": 149205, "epoch": 1233} {"train_loss": -41.36486053466797, "global_step": 149206, "epoch": 1233} {"train_loss": -39.971065521240234, "global_step": 149207, "epoch": 1233} {"train_loss": -38.82957458496094, "global_step": 149208, "epoch": 1233} {"train_loss": -38.49618911743164, "global_step": 149209, "epoch": 1233} {"train_loss": -38.03615188598633, "global_step": 149210, "epoch": 1233} {"train_loss": -37.783607482910156, "global_step": 149211, "epoch": 1233} {"train_loss": -38.41301345825195, "global_step": 149212, "epoch": 1233} {"train_loss": -39.19993209838867, "global_step": 149213, "epoch": 1233} {"train_loss": -38.46547317504883, "global_step": 149214, "epoch": 1233} {"train_loss": -39.813053131103516, "global_step": 149215, "epoch": 1233} {"train_loss": -41.18001174926758, "global_step": 149216, "epoch": 1233} {"train_loss": -39.108070373535156, "global_step": 149217, "epoch": 1233} {"train_loss": -38.16738510131836, "global_step": 149218, "epoch": 1233} {"train_loss": -39.76157760620117, "global_step": 149219, "epoch": 1233} {"train_loss": -39.411617279052734, "global_step": 149220, "epoch": 1233} {"train_loss": -37.93001174926758, "global_step": 149221, "epoch": 1233} {"train_loss": -39.36906051635742, "global_step": 149222, "epoch": 1233} {"train_loss": -40.637847900390625, "global_step": 149223, "epoch": 1233} {"train_loss": -39.98351287841797, "global_step": 149224, "epoch": 1233} {"train_loss": -39.57062911987305, "global_step": 149225, "epoch": 1233} {"train_loss": -40.886409759521484, "global_step": 149226, "epoch": 1233} {"train_loss": -40.438358306884766, "global_step": 149227, "epoch": 1233} {"train_loss": -40.020408630371094, "global_step": 149228, "epoch": 1233} {"train_loss": -41.158321380615234, "global_step": 149229, "epoch": 1233} {"train_loss": -40.199920654296875, "global_step": 149230, "epoch": 1233} {"train_loss": -40.525081634521484, "global_step": 149231, "epoch": 1233} {"train_loss": -40.7105827331543, "global_step": 149232, "epoch": 1233} {"train_loss": -40.74333572387695, "global_step": 149233, "epoch": 1233} {"train_loss": -40.78875732421875, "global_step": 149234, "epoch": 1233} {"train_loss": -40.895320892333984, "global_step": 149235, "epoch": 1233} {"train_loss": -40.61201858520508, "global_step": 149236, "epoch": 1233} {"train_loss": -41.576385498046875, "global_step": 149237, "epoch": 1233} {"train_loss": -40.95386505126953, "global_step": 149238, "epoch": 1233} {"train_loss": -41.04684829711914, "global_step": 149239, "epoch": 1233} {"train_loss": -41.47365951538086, "global_step": 149240, "epoch": 1233} {"train_loss": -41.200618743896484, "global_step": 149241, "epoch": 1233} {"train_loss": -41.507659912109375, "global_step": 149242, "epoch": 1233} {"train_loss": -41.014530181884766, "global_step": 149243, "epoch": 1233} {"train_loss": -41.09196472167969, "global_step": 149244, "epoch": 1233} {"train_loss": -40.27812576293945, "global_step": 149245, "epoch": 1233} {"train_loss": -41.34960174560547, "global_step": 149246, "epoch": 1233} {"train_loss": -41.542564392089844, "global_step": 149247, "epoch": 1233} {"train_loss": -40.59719467163086, "global_step": 149248, "epoch": 1233} {"train_loss": -40.283172607421875, "global_step": 149249, "epoch": 1233} {"train_loss": -40.28988265991211, "global_step": 149250, "epoch": 1233} {"train_loss": -41.086036682128906, "global_step": 149251, "epoch": 1233} {"train_loss": -40.61355209350586, "global_step": 149252, "epoch": 1233} {"train_loss": -41.2322998046875, "global_step": 149253, "epoch": 1233} {"train_loss": -40.511531829833984, "global_step": 149254, "epoch": 1233} {"train_loss": -40.15296173095703, "global_step": 149255, "epoch": 1233} {"train_loss": -41.1346321105957, "global_step": 149256, "epoch": 1233} {"train_loss": -40.582183837890625, "global_step": 149257, "epoch": 1233} {"train_loss": -40.992286682128906, "global_step": 149258, "epoch": 1233} {"train_loss": -41.171634674072266, "global_step": 149259, "epoch": 1233} {"train_loss": -40.0478515625, "global_step": 149260, "epoch": 1233} {"train_loss": -38.44122314453125, "global_step": 149261, "epoch": 1233} {"train_loss": -36.650428771972656, "global_step": 149262, "epoch": 1233} {"train_loss": -40.67001724243164, "global_step": 149263, "epoch": 1233} {"train_loss": -40.02754592895508, "global_step": 149264, "epoch": 1233} {"train_loss": -35.80994415283203, "global_step": 149265, "epoch": 1233} {"train_loss": -37.206825256347656, "global_step": 149266, "epoch": 1233} {"train_loss": -39.417640686035156, "global_step": 149267, "epoch": 1233} {"train_loss": -40.353858947753906, "global_step": 149268, "epoch": 1233} {"train_loss": -39.402889251708984, "global_step": 149269, "epoch": 1233} {"train_loss": -39.3978157043457, "global_step": 149270, "epoch": 1233} {"train_loss": -40.51949691772461, "global_step": 149271, "epoch": 1233} {"train_loss": -39.580482482910156, "global_step": 149272, "epoch": 1233} {"train_loss": -38.24858856201172, "global_step": 149273, "epoch": 1233} {"train_loss": -40.4130859375, "global_step": 149274, "epoch": 1233} {"train_loss": -39.64499282836914, "global_step": 149275, "epoch": 1233} {"train_loss": -39.37557601928711, "global_step": 149276, "epoch": 1233} {"train_loss": -40.75596237182617, "global_step": 149277, "epoch": 1233} {"train_loss": -39.85676193237305, "global_step": 149278, "epoch": 1233} {"train_loss": -40.46519088745117, "global_step": 149279, "epoch": 1233} {"train_loss": -40.776790618896484, "global_step": 149280, "epoch": 1233} {"train_loss": -40.33955764770508, "global_step": 149281, "epoch": 1233} {"train_loss": -41.12754440307617, "global_step": 149282, "epoch": 1233} {"train_loss": -40.56655502319336, "global_step": 149283, "epoch": 1233} {"train_loss": -40.279205322265625, "global_step": 149284, "epoch": 1233} {"train_loss": -41.12807846069336, "global_step": 149285, "epoch": 1233} {"train_loss": -40.49785232543945, "global_step": 149286, "epoch": 1233} {"train_loss": -41.15424728393555, "global_step": 149287, "epoch": 1233} {"train_loss": -41.085655212402344, "global_step": 149288, "epoch": 1233} {"train_loss": -40.72230911254883, "global_step": 149289, "epoch": 1233} {"train_loss": -40.89250564575195, "global_step": 149290, "epoch": 1233} {"train_loss": -41.441314697265625, "global_step": 149291, "epoch": 1233} {"train_loss": -41.17411422729492, "global_step": 149292, "epoch": 1233} {"train_loss": -41.00242233276367, "global_step": 149293, "epoch": 1233} {"train_loss": -41.13420104980469, "global_step": 149294, "epoch": 1233} {"train_loss": -40.869049072265625, "global_step": 149295, "epoch": 1233} {"train_loss": -40.32981491088867, "global_step": 149296, "epoch": 1233} {"train_loss": -41.256256103515625, "global_step": 149297, "epoch": 1233} {"train_loss": -41.163673400878906, "global_step": 149298, "epoch": 1233} {"train_loss": -40.514888763427734, "global_step": 149299, "epoch": 1233} {"train_loss": -40.3414421081543, "global_step": 149300, "epoch": 1233} {"train_loss": -40.775699615478516, "global_step": 149301, "epoch": 1233} {"train_loss": -40.7185173034668, "global_step": 149302, "epoch": 1233} {"train_loss": -40.2169189453125, "global_step": 149303, "epoch": 1233} {"train_loss": -41.5230712890625, "global_step": 149304, "epoch": 1233} {"train_loss": -41.25166320800781, "global_step": 149305, "epoch": 1233} {"train_loss": -41.21446228027344, "global_step": 149306, "epoch": 1233} {"train_loss": -41.06859588623047, "global_step": 149307, "epoch": 1233} {"train_loss": -41.56099319458008, "global_step": 149308, "epoch": 1233} {"train_loss": -40.846317291259766, "global_step": 149309, "epoch": 1233} {"train_loss": -40.819488525390625, "global_step": 149310, "epoch": 1233} {"train_loss": -40.8219108581543, "global_step": 149311, "epoch": 1233} {"train_loss": -41.12797164916992, "global_step": 149312, "epoch": 1233} {"train_loss": -40.304157887608554, "global_step": 149313, "epoch": 1233, "val_loss": 2644462.75} {"train_loss": -41.26009750366211, "global_step": 149314, "epoch": 1234} {"train_loss": -40.67997360229492, "global_step": 149315, "epoch": 1234} {"train_loss": -41.72200393676758, "global_step": 149316, "epoch": 1234} {"train_loss": -41.15008544921875, "global_step": 149317, "epoch": 1234} {"train_loss": -39.607749938964844, "global_step": 149318, "epoch": 1234} {"train_loss": -39.09531021118164, "global_step": 149319, "epoch": 1234} {"train_loss": -39.54453659057617, "global_step": 149320, "epoch": 1234} {"train_loss": -41.1063117980957, "global_step": 149321, "epoch": 1234} {"train_loss": -40.90680694580078, "global_step": 149322, "epoch": 1234} {"train_loss": -40.46955490112305, "global_step": 149323, "epoch": 1234} {"train_loss": -40.42079544067383, "global_step": 149324, "epoch": 1234} {"train_loss": -41.22968292236328, "global_step": 149325, "epoch": 1234} {"train_loss": -40.582942962646484, "global_step": 149326, "epoch": 1234} {"train_loss": -40.32854461669922, "global_step": 149327, "epoch": 1234} {"train_loss": -41.20427322387695, "global_step": 149328, "epoch": 1234} {"train_loss": -40.73525619506836, "global_step": 149329, "epoch": 1234} {"train_loss": -40.837982177734375, "global_step": 149330, "epoch": 1234} {"train_loss": -41.39635467529297, "global_step": 149331, "epoch": 1234} {"train_loss": -40.469905853271484, "global_step": 149332, "epoch": 1234} {"train_loss": -41.42686080932617, "global_step": 149333, "epoch": 1234} {"train_loss": -41.3223762512207, "global_step": 149334, "epoch": 1234} {"train_loss": -40.68559646606445, "global_step": 149335, "epoch": 1234} {"train_loss": -41.7222785949707, "global_step": 149336, "epoch": 1234} {"train_loss": -40.825599670410156, "global_step": 149337, "epoch": 1234} {"train_loss": -40.39173889160156, "global_step": 149338, "epoch": 1234} {"train_loss": -40.733150482177734, "global_step": 149339, "epoch": 1234} {"train_loss": -40.5029296875, "global_step": 149340, "epoch": 1234} {"train_loss": -40.664066314697266, "global_step": 149341, "epoch": 1234} {"train_loss": -41.097023010253906, "global_step": 149342, "epoch": 1234} {"train_loss": -40.93928909301758, "global_step": 149343, "epoch": 1234} {"train_loss": -41.23440170288086, "global_step": 149344, "epoch": 1234} {"train_loss": -41.43376922607422, "global_step": 149345, "epoch": 1234} {"train_loss": -41.09305953979492, "global_step": 149346, "epoch": 1234} {"train_loss": -40.40497970581055, "global_step": 149347, "epoch": 1234} {"train_loss": -40.751953125, "global_step": 149348, "epoch": 1234} {"train_loss": -40.511749267578125, "global_step": 149349, "epoch": 1234} {"train_loss": -39.71706771850586, "global_step": 149350, "epoch": 1234} {"train_loss": -40.33552169799805, "global_step": 149351, "epoch": 1234} {"train_loss": -40.17416000366211, "global_step": 149352, "epoch": 1234} {"train_loss": -40.333614349365234, "global_step": 149353, "epoch": 1234} {"train_loss": -40.776519775390625, "global_step": 149354, "epoch": 1234} {"train_loss": -41.305152893066406, "global_step": 149355, "epoch": 1234} {"train_loss": -41.1750373840332, "global_step": 149356, "epoch": 1234} {"train_loss": -41.27907943725586, "global_step": 149357, "epoch": 1234} {"train_loss": -41.083858489990234, "global_step": 149358, "epoch": 1234} {"train_loss": -40.73476791381836, "global_step": 149359, "epoch": 1234} {"train_loss": -41.399288177490234, "global_step": 149360, "epoch": 1234} {"train_loss": -41.065425872802734, "global_step": 149361, "epoch": 1234} {"train_loss": -41.53524398803711, "global_step": 149362, "epoch": 1234} {"train_loss": -40.845115661621094, "global_step": 149363, "epoch": 1234} {"train_loss": -39.37295150756836, "global_step": 149364, "epoch": 1234} {"train_loss": -40.29557418823242, "global_step": 149365, "epoch": 1234} {"train_loss": -40.18276596069336, "global_step": 149366, "epoch": 1234} {"train_loss": -40.97493362426758, "global_step": 149367, "epoch": 1234} {"train_loss": -40.80139923095703, "global_step": 149368, "epoch": 1234} {"train_loss": -41.05880355834961, "global_step": 149369, "epoch": 1234} {"train_loss": -41.04345703125, "global_step": 149370, "epoch": 1234} {"train_loss": -40.968257904052734, "global_step": 149371, "epoch": 1234} {"train_loss": -40.81107711791992, "global_step": 149372, "epoch": 1234} {"train_loss": -39.56118392944336, "global_step": 149373, "epoch": 1234} {"train_loss": -39.24589157104492, "global_step": 149374, "epoch": 1234} {"train_loss": -36.31040954589844, "global_step": 149375, "epoch": 1234} {"train_loss": -38.88639831542969, "global_step": 149376, "epoch": 1234} {"train_loss": -39.6246452331543, "global_step": 149377, "epoch": 1234} {"train_loss": -40.6302375793457, "global_step": 149378, "epoch": 1234} {"train_loss": -39.17291259765625, "global_step": 149379, "epoch": 1234} {"train_loss": -36.313228607177734, "global_step": 149380, "epoch": 1234} {"train_loss": -30.65926170349121, "global_step": 149381, "epoch": 1234} {"train_loss": -23.82077980041504, "global_step": 149382, "epoch": 1234} {"train_loss": -20.486661911010742, "global_step": 149383, "epoch": 1234} {"train_loss": -30.607019424438477, "global_step": 149384, "epoch": 1234} {"train_loss": -38.60609817504883, "global_step": 149385, "epoch": 1234} {"train_loss": -33.055538177490234, "global_step": 149386, "epoch": 1234} {"train_loss": -28.325475692749023, "global_step": 149387, "epoch": 1234} {"train_loss": -38.93451690673828, "global_step": 149388, "epoch": 1234} {"train_loss": -35.37004089355469, "global_step": 149389, "epoch": 1234} {"train_loss": -34.23215866088867, "global_step": 149390, "epoch": 1234} {"train_loss": -38.3208122253418, "global_step": 149391, "epoch": 1234} {"train_loss": -36.89570999145508, "global_step": 149392, "epoch": 1234} {"train_loss": -38.54531478881836, "global_step": 149393, "epoch": 1234} {"train_loss": -37.40192413330078, "global_step": 149394, "epoch": 1234} {"train_loss": -39.5798454284668, "global_step": 149395, "epoch": 1234} {"train_loss": -37.59149932861328, "global_step": 149396, "epoch": 1234} {"train_loss": -39.8563232421875, "global_step": 149397, "epoch": 1234} {"train_loss": -36.69023895263672, "global_step": 149398, "epoch": 1234} {"train_loss": -39.7570686340332, "global_step": 149399, "epoch": 1234} {"train_loss": -38.0924072265625, "global_step": 149400, "epoch": 1234} {"train_loss": -39.519569396972656, "global_step": 149401, "epoch": 1234} {"train_loss": -38.78352355957031, "global_step": 149402, "epoch": 1234} {"train_loss": -39.81637954711914, "global_step": 149403, "epoch": 1234} {"train_loss": -39.107154846191406, "global_step": 149404, "epoch": 1234} {"train_loss": -39.27217483520508, "global_step": 149405, "epoch": 1234} {"train_loss": -39.70032501220703, "global_step": 149406, "epoch": 1234} {"train_loss": -40.08784866333008, "global_step": 149407, "epoch": 1234} {"train_loss": -39.73655319213867, "global_step": 149408, "epoch": 1234} {"train_loss": -40.295806884765625, "global_step": 149409, "epoch": 1234} {"train_loss": -40.001155853271484, "global_step": 149410, "epoch": 1234} {"train_loss": -40.046043395996094, "global_step": 149411, "epoch": 1234} {"train_loss": -40.38015365600586, "global_step": 149412, "epoch": 1234} {"train_loss": -39.94016647338867, "global_step": 149413, "epoch": 1234} {"train_loss": -40.09687423706055, "global_step": 149414, "epoch": 1234} {"train_loss": -40.15638732910156, "global_step": 149415, "epoch": 1234} {"train_loss": -40.416908264160156, "global_step": 149416, "epoch": 1234} {"train_loss": -40.679378509521484, "global_step": 149417, "epoch": 1234} {"train_loss": -40.28811264038086, "global_step": 149418, "epoch": 1234} {"train_loss": -40.8256950378418, "global_step": 149419, "epoch": 1234} {"train_loss": -40.55622100830078, "global_step": 149420, "epoch": 1234} {"train_loss": -40.660125732421875, "global_step": 149421, "epoch": 1234} {"train_loss": -40.63132858276367, "global_step": 149422, "epoch": 1234} {"train_loss": -40.6981315612793, "global_step": 149423, "epoch": 1234} {"train_loss": -40.46845626831055, "global_step": 149424, "epoch": 1234} {"train_loss": -40.8144416809082, "global_step": 149425, "epoch": 1234} {"train_loss": -40.70454788208008, "global_step": 149426, "epoch": 1234} {"train_loss": -40.77094268798828, "global_step": 149427, "epoch": 1234} {"train_loss": -40.69587326049805, "global_step": 149428, "epoch": 1234} {"train_loss": -40.48249053955078, "global_step": 149429, "epoch": 1234} {"train_loss": -40.7508659362793, "global_step": 149430, "epoch": 1234} {"train_loss": -40.60905075073242, "global_step": 149431, "epoch": 1234} {"train_loss": -41.08713912963867, "global_step": 149432, "epoch": 1234} {"train_loss": -40.792152404785156, "global_step": 149433, "epoch": 1234} {"train_loss": -39.52423916966462, "global_step": 149434, "epoch": 1234, "val_loss": 2614875.25} {"train_loss": -41.09486389160156, "global_step": 149435, "epoch": 1235} {"train_loss": -41.251556396484375, "global_step": 149436, "epoch": 1235} {"train_loss": -41.55613327026367, "global_step": 149437, "epoch": 1235} {"train_loss": -41.11894607543945, "global_step": 149438, "epoch": 1235} {"train_loss": -41.47622299194336, "global_step": 149439, "epoch": 1235} {"train_loss": -40.8558235168457, "global_step": 149440, "epoch": 1235} {"train_loss": -41.6268196105957, "global_step": 149441, "epoch": 1235} {"train_loss": -41.40902328491211, "global_step": 149442, "epoch": 1235} {"train_loss": -41.27460861206055, "global_step": 149443, "epoch": 1235} {"train_loss": -41.2718620300293, "global_step": 149444, "epoch": 1235} {"train_loss": -41.37348556518555, "global_step": 149445, "epoch": 1235} {"train_loss": -41.25709915161133, "global_step": 149446, "epoch": 1235} {"train_loss": -41.540184020996094, "global_step": 149447, "epoch": 1235} {"train_loss": -41.47471237182617, "global_step": 149448, "epoch": 1235} {"train_loss": -41.46719741821289, "global_step": 149449, "epoch": 1235} {"train_loss": -41.572174072265625, "global_step": 149450, "epoch": 1235} {"train_loss": -41.660274505615234, "global_step": 149451, "epoch": 1235} {"train_loss": -41.65546417236328, "global_step": 149452, "epoch": 1235} {"train_loss": -41.76003646850586, "global_step": 149453, "epoch": 1235} {"train_loss": -41.707759857177734, "global_step": 149454, "epoch": 1235} {"train_loss": -41.81903839111328, "global_step": 149455, "epoch": 1235} {"train_loss": -41.562164306640625, "global_step": 149456, "epoch": 1235} {"train_loss": -41.96736526489258, "global_step": 149457, "epoch": 1235} {"train_loss": -41.6874885559082, "global_step": 149458, "epoch": 1235} {"train_loss": -41.62805938720703, "global_step": 149459, "epoch": 1235} {"train_loss": -41.441375732421875, "global_step": 149460, "epoch": 1235} {"train_loss": -41.952056884765625, "global_step": 149461, "epoch": 1235} {"train_loss": -41.31563186645508, "global_step": 149462, "epoch": 1235} {"train_loss": -41.96622848510742, "global_step": 149463, "epoch": 1235} {"train_loss": -41.66292190551758, "global_step": 149464, "epoch": 1235} {"train_loss": -41.91939926147461, "global_step": 149465, "epoch": 1235} {"train_loss": -41.30597686767578, "global_step": 149466, "epoch": 1235} {"train_loss": -41.61597442626953, "global_step": 149467, "epoch": 1235} {"train_loss": -41.66840362548828, "global_step": 149468, "epoch": 1235} {"train_loss": -41.641170501708984, "global_step": 149469, "epoch": 1235} {"train_loss": -41.3929443359375, "global_step": 149470, "epoch": 1235} {"train_loss": -41.34926223754883, "global_step": 149471, "epoch": 1235} {"train_loss": -41.27900314331055, "global_step": 149472, "epoch": 1235} {"train_loss": -41.63761520385742, "global_step": 149473, "epoch": 1235} {"train_loss": -42.202537536621094, "global_step": 149474, "epoch": 1235} {"train_loss": -41.446754455566406, "global_step": 149475, "epoch": 1235} {"train_loss": -41.798583984375, "global_step": 149476, "epoch": 1235} {"train_loss": -41.308876037597656, "global_step": 149477, "epoch": 1235} {"train_loss": -40.243656158447266, "global_step": 149478, "epoch": 1235} {"train_loss": -38.276424407958984, "global_step": 149479, "epoch": 1235} {"train_loss": -38.930633544921875, "global_step": 149480, "epoch": 1235} {"train_loss": -40.084373474121094, "global_step": 149481, "epoch": 1235} {"train_loss": -40.38483810424805, "global_step": 149482, "epoch": 1235} {"train_loss": -40.5661735534668, "global_step": 149483, "epoch": 1235} {"train_loss": -40.58195877075195, "global_step": 149484, "epoch": 1235} {"train_loss": -40.02656555175781, "global_step": 149485, "epoch": 1235} {"train_loss": -38.779048919677734, "global_step": 149486, "epoch": 1235} {"train_loss": -40.699222564697266, "global_step": 149487, "epoch": 1235} {"train_loss": -39.91023635864258, "global_step": 149488, "epoch": 1235} {"train_loss": -40.628822326660156, "global_step": 149489, "epoch": 1235} {"train_loss": -41.059261322021484, "global_step": 149490, "epoch": 1235} {"train_loss": -40.008750915527344, "global_step": 149491, "epoch": 1235} {"train_loss": -40.47169876098633, "global_step": 149492, "epoch": 1235} {"train_loss": -41.11859130859375, "global_step": 149493, "epoch": 1235} {"train_loss": -38.51845932006836, "global_step": 149494, "epoch": 1235} {"train_loss": -40.814697265625, "global_step": 149495, "epoch": 1235} {"train_loss": -40.949378967285156, "global_step": 149496, "epoch": 1235} {"train_loss": -41.1732292175293, "global_step": 149497, "epoch": 1235} {"train_loss": -40.41349792480469, "global_step": 149498, "epoch": 1235} {"train_loss": -41.02193832397461, "global_step": 149499, "epoch": 1235} {"train_loss": -40.67646408081055, "global_step": 149500, "epoch": 1235} {"train_loss": -40.203941345214844, "global_step": 149501, "epoch": 1235} {"train_loss": -40.925079345703125, "global_step": 149502, "epoch": 1235} {"train_loss": -41.26604080200195, "global_step": 149503, "epoch": 1235} {"train_loss": -41.375343322753906, "global_step": 149504, "epoch": 1235} {"train_loss": -40.80170440673828, "global_step": 149505, "epoch": 1235} {"train_loss": -41.0529670715332, "global_step": 149506, "epoch": 1235} {"train_loss": -41.21491241455078, "global_step": 149507, "epoch": 1235} {"train_loss": -40.08903503417969, "global_step": 149508, "epoch": 1235} {"train_loss": -41.059452056884766, "global_step": 149509, "epoch": 1235} {"train_loss": -39.07493209838867, "global_step": 149510, "epoch": 1235} {"train_loss": -39.8347282409668, "global_step": 149511, "epoch": 1235} {"train_loss": -38.892738342285156, "global_step": 149512, "epoch": 1235} {"train_loss": -40.499847412109375, "global_step": 149513, "epoch": 1235} {"train_loss": -40.2115364074707, "global_step": 149514, "epoch": 1235} {"train_loss": -39.446102142333984, "global_step": 149515, "epoch": 1235} {"train_loss": -38.665138244628906, "global_step": 149516, "epoch": 1235} {"train_loss": -37.877140045166016, "global_step": 149517, "epoch": 1235} {"train_loss": -38.02736282348633, "global_step": 149518, "epoch": 1235} {"train_loss": -38.552268981933594, "global_step": 149519, "epoch": 1235} {"train_loss": -40.02926254272461, "global_step": 149520, "epoch": 1235} {"train_loss": -39.7834358215332, "global_step": 149521, "epoch": 1235} {"train_loss": -39.28950119018555, "global_step": 149522, "epoch": 1235} {"train_loss": -39.829158782958984, "global_step": 149523, "epoch": 1235} {"train_loss": -40.5421142578125, "global_step": 149524, "epoch": 1235} {"train_loss": -40.55180740356445, "global_step": 149525, "epoch": 1235} {"train_loss": -39.673274993896484, "global_step": 149526, "epoch": 1235} {"train_loss": -40.67226791381836, "global_step": 149527, "epoch": 1235} {"train_loss": -40.89311599731445, "global_step": 149528, "epoch": 1235} {"train_loss": -39.90367889404297, "global_step": 149529, "epoch": 1235} {"train_loss": -40.3831901550293, "global_step": 149530, "epoch": 1235} {"train_loss": -39.981014251708984, "global_step": 149531, "epoch": 1235} {"train_loss": -41.013484954833984, "global_step": 149532, "epoch": 1235} {"train_loss": -40.74898910522461, "global_step": 149533, "epoch": 1235} {"train_loss": -39.286354064941406, "global_step": 149534, "epoch": 1235} {"train_loss": -40.514400482177734, "global_step": 149535, "epoch": 1235} {"train_loss": -40.42436599731445, "global_step": 149536, "epoch": 1235} {"train_loss": -40.912078857421875, "global_step": 149537, "epoch": 1235} {"train_loss": -40.477569580078125, "global_step": 149538, "epoch": 1235} {"train_loss": -41.10795211791992, "global_step": 149539, "epoch": 1235} {"train_loss": -40.89626693725586, "global_step": 149540, "epoch": 1235} {"train_loss": -38.69514083862305, "global_step": 149541, "epoch": 1235} {"train_loss": -39.87879943847656, "global_step": 149542, "epoch": 1235} {"train_loss": -41.133052825927734, "global_step": 149543, "epoch": 1235} {"train_loss": -40.359596252441406, "global_step": 149544, "epoch": 1235} {"train_loss": -40.571353912353516, "global_step": 149545, "epoch": 1235} {"train_loss": -41.30124282836914, "global_step": 149546, "epoch": 1235} {"train_loss": -40.600929260253906, "global_step": 149547, "epoch": 1235} {"train_loss": -40.6052131652832, "global_step": 149548, "epoch": 1235} {"train_loss": -41.378822326660156, "global_step": 149549, "epoch": 1235} {"train_loss": -40.83317184448242, "global_step": 149550, "epoch": 1235} {"train_loss": -40.14064407348633, "global_step": 149551, "epoch": 1235} {"train_loss": -41.3554801940918, "global_step": 149552, "epoch": 1235} {"train_loss": -41.422943115234375, "global_step": 149553, "epoch": 1235} {"train_loss": -40.80781173706055, "global_step": 149554, "epoch": 1235} {"train_loss": -40.72047597711737, "global_step": 149555, "epoch": 1235, "val_loss": 2654232.75} {"train_loss": -40.77838897705078, "global_step": 149556, "epoch": 1236} {"train_loss": -40.493221282958984, "global_step": 149557, "epoch": 1236} {"train_loss": -41.3317985534668, "global_step": 149558, "epoch": 1236} {"train_loss": -40.05289840698242, "global_step": 149559, "epoch": 1236} {"train_loss": -40.23923873901367, "global_step": 149560, "epoch": 1236} {"train_loss": -41.20426559448242, "global_step": 149561, "epoch": 1236} {"train_loss": -41.399017333984375, "global_step": 149562, "epoch": 1236} {"train_loss": -40.80574035644531, "global_step": 149563, "epoch": 1236} {"train_loss": -39.90193557739258, "global_step": 149564, "epoch": 1236} {"train_loss": -40.48307418823242, "global_step": 149565, "epoch": 1236} {"train_loss": -41.249732971191406, "global_step": 149566, "epoch": 1236} {"train_loss": -41.0852165222168, "global_step": 149567, "epoch": 1236} {"train_loss": -39.7487678527832, "global_step": 149568, "epoch": 1236} {"train_loss": -40.50766372680664, "global_step": 149569, "epoch": 1236} {"train_loss": -40.68182373046875, "global_step": 149570, "epoch": 1236} {"train_loss": -40.15971755981445, "global_step": 149571, "epoch": 1236} {"train_loss": -39.13751983642578, "global_step": 149572, "epoch": 1236} {"train_loss": -40.03289794921875, "global_step": 149573, "epoch": 1236} {"train_loss": -40.470638275146484, "global_step": 149574, "epoch": 1236} {"train_loss": -40.78764724731445, "global_step": 149575, "epoch": 1236} {"train_loss": -40.71803665161133, "global_step": 149576, "epoch": 1236} {"train_loss": -40.70524215698242, "global_step": 149577, "epoch": 1236} {"train_loss": -41.35512924194336, "global_step": 149578, "epoch": 1236} {"train_loss": -39.689998626708984, "global_step": 149579, "epoch": 1236} {"train_loss": -39.09665298461914, "global_step": 149580, "epoch": 1236} {"train_loss": -40.5803337097168, "global_step": 149581, "epoch": 1236} {"train_loss": -40.083168029785156, "global_step": 149582, "epoch": 1236} {"train_loss": -39.2921028137207, "global_step": 149583, "epoch": 1236} {"train_loss": -40.26543045043945, "global_step": 149584, "epoch": 1236} {"train_loss": -41.447078704833984, "global_step": 149585, "epoch": 1236} {"train_loss": -39.58796691894531, "global_step": 149586, "epoch": 1236} {"train_loss": -40.47883605957031, "global_step": 149587, "epoch": 1236} {"train_loss": -41.20796203613281, "global_step": 149588, "epoch": 1236} {"train_loss": -40.3327751159668, "global_step": 149589, "epoch": 1236} {"train_loss": -41.006282806396484, "global_step": 149590, "epoch": 1236} {"train_loss": -40.32725143432617, "global_step": 149591, "epoch": 1236} {"train_loss": -40.421852111816406, "global_step": 149592, "epoch": 1236} {"train_loss": -40.68547439575195, "global_step": 149593, "epoch": 1236} {"train_loss": -39.96097946166992, "global_step": 149594, "epoch": 1236} {"train_loss": -40.749080657958984, "global_step": 149595, "epoch": 1236} {"train_loss": -41.36204528808594, "global_step": 149596, "epoch": 1236} {"train_loss": -40.5077018737793, "global_step": 149597, "epoch": 1236} {"train_loss": -40.45728302001953, "global_step": 149598, "epoch": 1236} {"train_loss": -40.3654670715332, "global_step": 149599, "epoch": 1236} {"train_loss": -40.68193817138672, "global_step": 149600, "epoch": 1236} {"train_loss": -39.160518646240234, "global_step": 149601, "epoch": 1236} {"train_loss": -39.635475158691406, "global_step": 149602, "epoch": 1236} {"train_loss": -39.31980895996094, "global_step": 149603, "epoch": 1236} {"train_loss": -39.65291976928711, "global_step": 149604, "epoch": 1236} {"train_loss": -39.66618728637695, "global_step": 149605, "epoch": 1236} {"train_loss": -39.8692741394043, "global_step": 149606, "epoch": 1236} {"train_loss": -39.878570556640625, "global_step": 149607, "epoch": 1236} {"train_loss": -39.4878044128418, "global_step": 149608, "epoch": 1236} {"train_loss": -39.01475143432617, "global_step": 149609, "epoch": 1236} {"train_loss": -40.542823791503906, "global_step": 149610, "epoch": 1236} {"train_loss": -39.73614501953125, "global_step": 149611, "epoch": 1236} {"train_loss": -39.46089553833008, "global_step": 149612, "epoch": 1236} {"train_loss": -39.442134857177734, "global_step": 149613, "epoch": 1236} {"train_loss": -40.89069747924805, "global_step": 149614, "epoch": 1236} {"train_loss": -39.7837028503418, "global_step": 149615, "epoch": 1236} {"train_loss": -38.85703659057617, "global_step": 149616, "epoch": 1236} {"train_loss": -40.61348342895508, "global_step": 149617, "epoch": 1236} {"train_loss": -37.37606430053711, "global_step": 149618, "epoch": 1236} {"train_loss": -37.34694290161133, "global_step": 149619, "epoch": 1236} {"train_loss": -40.27299499511719, "global_step": 149620, "epoch": 1236} {"train_loss": -36.80732727050781, "global_step": 149621, "epoch": 1236} {"train_loss": -39.0616569519043, "global_step": 149622, "epoch": 1236} {"train_loss": -38.83887481689453, "global_step": 149623, "epoch": 1236} {"train_loss": -37.03532028198242, "global_step": 149624, "epoch": 1236} {"train_loss": -40.02640151977539, "global_step": 149625, "epoch": 1236} {"train_loss": -37.19404220581055, "global_step": 149626, "epoch": 1236} {"train_loss": -39.47410202026367, "global_step": 149627, "epoch": 1236} {"train_loss": -38.56020736694336, "global_step": 149628, "epoch": 1236} {"train_loss": -40.25856399536133, "global_step": 149629, "epoch": 1236} {"train_loss": -40.20855712890625, "global_step": 149630, "epoch": 1236} {"train_loss": -39.48269271850586, "global_step": 149631, "epoch": 1236} {"train_loss": -40.84280014038086, "global_step": 149632, "epoch": 1236} {"train_loss": -38.795772552490234, "global_step": 149633, "epoch": 1236} {"train_loss": -39.9586296081543, "global_step": 149634, "epoch": 1236} {"train_loss": -40.04170608520508, "global_step": 149635, "epoch": 1236} {"train_loss": -40.5809440612793, "global_step": 149636, "epoch": 1236} {"train_loss": -40.115203857421875, "global_step": 149637, "epoch": 1236} {"train_loss": -40.7097282409668, "global_step": 149638, "epoch": 1236} {"train_loss": -40.497901916503906, "global_step": 149639, "epoch": 1236} {"train_loss": -41.20698547363281, "global_step": 149640, "epoch": 1236} {"train_loss": -41.157135009765625, "global_step": 149641, "epoch": 1236} {"train_loss": -40.368072509765625, "global_step": 149642, "epoch": 1236} {"train_loss": -40.78208541870117, "global_step": 149643, "epoch": 1236} {"train_loss": -40.9650993347168, "global_step": 149644, "epoch": 1236} {"train_loss": -41.01900863647461, "global_step": 149645, "epoch": 1236} {"train_loss": -41.263214111328125, "global_step": 149646, "epoch": 1236} {"train_loss": -40.87233352661133, "global_step": 149647, "epoch": 1236} {"train_loss": -41.09754943847656, "global_step": 149648, "epoch": 1236} {"train_loss": -41.14767074584961, "global_step": 149649, "epoch": 1236} {"train_loss": -41.45801544189453, "global_step": 149650, "epoch": 1236} {"train_loss": -41.56053161621094, "global_step": 149651, "epoch": 1236} {"train_loss": -41.187843322753906, "global_step": 149652, "epoch": 1236} {"train_loss": -41.63600540161133, "global_step": 149653, "epoch": 1236} {"train_loss": -41.63930892944336, "global_step": 149654, "epoch": 1236} {"train_loss": -41.74967575073242, "global_step": 149655, "epoch": 1236} {"train_loss": -41.461910247802734, "global_step": 149656, "epoch": 1236} {"train_loss": -41.87102127075195, "global_step": 149657, "epoch": 1236} {"train_loss": -41.54065704345703, "global_step": 149658, "epoch": 1236} {"train_loss": -41.261104583740234, "global_step": 149659, "epoch": 1236} {"train_loss": -41.65181350708008, "global_step": 149660, "epoch": 1236} {"train_loss": -41.66489791870117, "global_step": 149661, "epoch": 1236} {"train_loss": -41.69580078125, "global_step": 149662, "epoch": 1236} {"train_loss": -41.88532638549805, "global_step": 149663, "epoch": 1236} {"train_loss": -41.369503021240234, "global_step": 149664, "epoch": 1236} {"train_loss": -41.8609504699707, "global_step": 149665, "epoch": 1236} {"train_loss": -41.7841911315918, "global_step": 149666, "epoch": 1236} {"train_loss": -41.36153030395508, "global_step": 149667, "epoch": 1236} {"train_loss": -41.401058197021484, "global_step": 149668, "epoch": 1236} {"train_loss": -41.58525848388672, "global_step": 149669, "epoch": 1236} {"train_loss": -40.78062057495117, "global_step": 149670, "epoch": 1236} {"train_loss": -41.83836364746094, "global_step": 149671, "epoch": 1236} {"train_loss": -42.00576400756836, "global_step": 149672, "epoch": 1236} {"train_loss": -42.179039001464844, "global_step": 149673, "epoch": 1236} {"train_loss": -40.8585319519043, "global_step": 149674, "epoch": 1236} {"train_loss": -41.47100830078125, "global_step": 149675, "epoch": 1236} {"train_loss": -40.436401304134655, "global_step": 149676, "epoch": 1236, "val_loss": 2636641.5} {"train_loss": -41.9570426940918, "global_step": 149677, "epoch": 1237} {"train_loss": -41.72539138793945, "global_step": 149678, "epoch": 1237} {"train_loss": -41.87943649291992, "global_step": 149679, "epoch": 1237} {"train_loss": -41.51121520996094, "global_step": 149680, "epoch": 1237} {"train_loss": -41.901344299316406, "global_step": 149681, "epoch": 1237} {"train_loss": -41.903602600097656, "global_step": 149682, "epoch": 1237} {"train_loss": -40.505218505859375, "global_step": 149683, "epoch": 1237} {"train_loss": -41.030311584472656, "global_step": 149684, "epoch": 1237} {"train_loss": -41.456573486328125, "global_step": 149685, "epoch": 1237} {"train_loss": -41.445064544677734, "global_step": 149686, "epoch": 1237} {"train_loss": -42.00665283203125, "global_step": 149687, "epoch": 1237} {"train_loss": -41.1146240234375, "global_step": 149688, "epoch": 1237} {"train_loss": -39.58993148803711, "global_step": 149689, "epoch": 1237} {"train_loss": -41.734981536865234, "global_step": 149690, "epoch": 1237} {"train_loss": -41.20306396484375, "global_step": 149691, "epoch": 1237} {"train_loss": -39.251991271972656, "global_step": 149692, "epoch": 1237} {"train_loss": -36.90576934814453, "global_step": 149693, "epoch": 1237} {"train_loss": -37.181121826171875, "global_step": 149694, "epoch": 1237} {"train_loss": -36.80315017700195, "global_step": 149695, "epoch": 1237} {"train_loss": -37.467010498046875, "global_step": 149696, "epoch": 1237} {"train_loss": -39.029109954833984, "global_step": 149697, "epoch": 1237} {"train_loss": -33.64988327026367, "global_step": 149698, "epoch": 1237} {"train_loss": -39.45682907104492, "global_step": 149699, "epoch": 1237} {"train_loss": -31.45466423034668, "global_step": 149700, "epoch": 1237} {"train_loss": -36.972877502441406, "global_step": 149701, "epoch": 1237} {"train_loss": -37.99109649658203, "global_step": 149702, "epoch": 1237} {"train_loss": -34.79757308959961, "global_step": 149703, "epoch": 1237} {"train_loss": -38.675148010253906, "global_step": 149704, "epoch": 1237} {"train_loss": -35.69086456298828, "global_step": 149705, "epoch": 1237} {"train_loss": -38.18319320678711, "global_step": 149706, "epoch": 1237} {"train_loss": -36.518192291259766, "global_step": 149707, "epoch": 1237} {"train_loss": -37.85419845581055, "global_step": 149708, "epoch": 1237} {"train_loss": -38.03352355957031, "global_step": 149709, "epoch": 1237} {"train_loss": -37.3537483215332, "global_step": 149710, "epoch": 1237} {"train_loss": -37.8663444519043, "global_step": 149711, "epoch": 1237} {"train_loss": -38.54181671142578, "global_step": 149712, "epoch": 1237} {"train_loss": -38.46393966674805, "global_step": 149713, "epoch": 1237} {"train_loss": -39.740394592285156, "global_step": 149714, "epoch": 1237} {"train_loss": -38.93552780151367, "global_step": 149715, "epoch": 1237} {"train_loss": -39.15702438354492, "global_step": 149716, "epoch": 1237} {"train_loss": -39.51503372192383, "global_step": 149717, "epoch": 1237} {"train_loss": -39.78707504272461, "global_step": 149718, "epoch": 1237} {"train_loss": -40.266807556152344, "global_step": 149719, "epoch": 1237} {"train_loss": -39.487850189208984, "global_step": 149720, "epoch": 1237} {"train_loss": -39.96321105957031, "global_step": 149721, "epoch": 1237} {"train_loss": -39.81093978881836, "global_step": 149722, "epoch": 1237} {"train_loss": -40.32761764526367, "global_step": 149723, "epoch": 1237} {"train_loss": -40.57693099975586, "global_step": 149724, "epoch": 1237} {"train_loss": -40.00306701660156, "global_step": 149725, "epoch": 1237} {"train_loss": -40.647396087646484, "global_step": 149726, "epoch": 1237} {"train_loss": -40.01081466674805, "global_step": 149727, "epoch": 1237} {"train_loss": -40.657684326171875, "global_step": 149728, "epoch": 1237} {"train_loss": -40.84901428222656, "global_step": 149729, "epoch": 1237} {"train_loss": -40.889244079589844, "global_step": 149730, "epoch": 1237} {"train_loss": -40.96155548095703, "global_step": 149731, "epoch": 1237} {"train_loss": -41.19321823120117, "global_step": 149732, "epoch": 1237} {"train_loss": -40.556636810302734, "global_step": 149733, "epoch": 1237} {"train_loss": -40.666805267333984, "global_step": 149734, "epoch": 1237} {"train_loss": -40.86246109008789, "global_step": 149735, "epoch": 1237} {"train_loss": -40.73820114135742, "global_step": 149736, "epoch": 1237} {"train_loss": -40.81894302368164, "global_step": 149737, "epoch": 1237} {"train_loss": -41.10993576049805, "global_step": 149738, "epoch": 1237} {"train_loss": -40.53230285644531, "global_step": 149739, "epoch": 1237} {"train_loss": -40.61611557006836, "global_step": 149740, "epoch": 1237} {"train_loss": -40.964962005615234, "global_step": 149741, "epoch": 1237} {"train_loss": -41.45082473754883, "global_step": 149742, "epoch": 1237} {"train_loss": -40.979427337646484, "global_step": 149743, "epoch": 1237} {"train_loss": -41.07083511352539, "global_step": 149744, "epoch": 1237} {"train_loss": -40.885860443115234, "global_step": 149745, "epoch": 1237} {"train_loss": -41.160133361816406, "global_step": 149746, "epoch": 1237} {"train_loss": -40.979637145996094, "global_step": 149747, "epoch": 1237} {"train_loss": -40.60783386230469, "global_step": 149748, "epoch": 1237} {"train_loss": -41.34273147583008, "global_step": 149749, "epoch": 1237} {"train_loss": -40.96232223510742, "global_step": 149750, "epoch": 1237} {"train_loss": -40.852149963378906, "global_step": 149751, "epoch": 1237} {"train_loss": -41.32437515258789, "global_step": 149752, "epoch": 1237} {"train_loss": -41.06574630737305, "global_step": 149753, "epoch": 1237} {"train_loss": -41.41267776489258, "global_step": 149754, "epoch": 1237} {"train_loss": -40.04557800292969, "global_step": 149755, "epoch": 1237} {"train_loss": -41.183284759521484, "global_step": 149756, "epoch": 1237} {"train_loss": -40.386024475097656, "global_step": 149757, "epoch": 1237} {"train_loss": -41.5988655090332, "global_step": 149758, "epoch": 1237} {"train_loss": -39.93684768676758, "global_step": 149759, "epoch": 1237} {"train_loss": -41.2279052734375, "global_step": 149760, "epoch": 1237} {"train_loss": -40.000606536865234, "global_step": 149761, "epoch": 1237} {"train_loss": -40.77968978881836, "global_step": 149762, "epoch": 1237} {"train_loss": -39.497371673583984, "global_step": 149763, "epoch": 1237} {"train_loss": -40.59688186645508, "global_step": 149764, "epoch": 1237} {"train_loss": -38.612274169921875, "global_step": 149765, "epoch": 1237} {"train_loss": -40.347496032714844, "global_step": 149766, "epoch": 1237} {"train_loss": -40.29092788696289, "global_step": 149767, "epoch": 1237} {"train_loss": -40.57755661010742, "global_step": 149768, "epoch": 1237} {"train_loss": -40.528995513916016, "global_step": 149769, "epoch": 1237} {"train_loss": -38.50996780395508, "global_step": 149770, "epoch": 1237} {"train_loss": -41.11503982543945, "global_step": 149771, "epoch": 1237} {"train_loss": -39.45600128173828, "global_step": 149772, "epoch": 1237} {"train_loss": -40.31562805175781, "global_step": 149773, "epoch": 1237} {"train_loss": -39.384395599365234, "global_step": 149774, "epoch": 1237} {"train_loss": -40.04126739501953, "global_step": 149775, "epoch": 1237} {"train_loss": -40.48244857788086, "global_step": 149776, "epoch": 1237} {"train_loss": -39.9161491394043, "global_step": 149777, "epoch": 1237} {"train_loss": -39.368831634521484, "global_step": 149778, "epoch": 1237} {"train_loss": -39.727333068847656, "global_step": 149779, "epoch": 1237} {"train_loss": -41.59638595581055, "global_step": 149780, "epoch": 1237} {"train_loss": -40.56390380859375, "global_step": 149781, "epoch": 1237} {"train_loss": -41.1031379699707, "global_step": 149782, "epoch": 1237} {"train_loss": -41.13906478881836, "global_step": 149783, "epoch": 1237} {"train_loss": -40.558197021484375, "global_step": 149784, "epoch": 1237} {"train_loss": -41.6394157409668, "global_step": 149785, "epoch": 1237} {"train_loss": -40.930213928222656, "global_step": 149786, "epoch": 1237} {"train_loss": -40.78285598754883, "global_step": 149787, "epoch": 1237} {"train_loss": -41.620601654052734, "global_step": 149788, "epoch": 1237} {"train_loss": -40.38193893432617, "global_step": 149789, "epoch": 1237} {"train_loss": -40.54616165161133, "global_step": 149790, "epoch": 1237} {"train_loss": -41.56650924682617, "global_step": 149791, "epoch": 1237} {"train_loss": -40.1480712890625, "global_step": 149792, "epoch": 1237} {"train_loss": -40.245697021484375, "global_step": 149793, "epoch": 1237} {"train_loss": -41.44839859008789, "global_step": 149794, "epoch": 1237} {"train_loss": -38.51500701904297, "global_step": 149795, "epoch": 1237} {"train_loss": -40.645912170410156, "global_step": 149796, "epoch": 1237} {"train_loss": -40.00193261706139, "global_step": 149797, "epoch": 1237, "val_loss": 2651733.75} {"train_loss": -39.103450775146484, "global_step": 149798, "epoch": 1238} {"train_loss": -40.13432693481445, "global_step": 149799, "epoch": 1238} {"train_loss": -40.420326232910156, "global_step": 149800, "epoch": 1238} {"train_loss": -41.50431823730469, "global_step": 149801, "epoch": 1238} {"train_loss": -41.15309143066406, "global_step": 149802, "epoch": 1238} {"train_loss": -41.5306510925293, "global_step": 149803, "epoch": 1238} {"train_loss": -39.60665512084961, "global_step": 149804, "epoch": 1238} {"train_loss": -41.166072845458984, "global_step": 149805, "epoch": 1238} {"train_loss": -41.0815315246582, "global_step": 149806, "epoch": 1238} {"train_loss": -40.04365921020508, "global_step": 149807, "epoch": 1238} {"train_loss": -40.77398681640625, "global_step": 149808, "epoch": 1238} {"train_loss": -40.27345657348633, "global_step": 149809, "epoch": 1238} {"train_loss": -40.64944076538086, "global_step": 149810, "epoch": 1238} {"train_loss": -41.1087760925293, "global_step": 149811, "epoch": 1238} {"train_loss": -40.194252014160156, "global_step": 149812, "epoch": 1238} {"train_loss": -41.05669403076172, "global_step": 149813, "epoch": 1238} {"train_loss": -35.010311126708984, "global_step": 149814, "epoch": 1238} {"train_loss": -41.29669952392578, "global_step": 149815, "epoch": 1238} {"train_loss": -41.238155364990234, "global_step": 149816, "epoch": 1238} {"train_loss": -41.12820053100586, "global_step": 149817, "epoch": 1238} {"train_loss": -39.12211608886719, "global_step": 149818, "epoch": 1238} {"train_loss": -40.76121139526367, "global_step": 149819, "epoch": 1238} {"train_loss": -39.7420539855957, "global_step": 149820, "epoch": 1238} {"train_loss": -41.76407241821289, "global_step": 149821, "epoch": 1238} {"train_loss": -40.631072998046875, "global_step": 149822, "epoch": 1238} {"train_loss": -41.141876220703125, "global_step": 149823, "epoch": 1238} {"train_loss": -39.916255950927734, "global_step": 149824, "epoch": 1238} {"train_loss": -39.78303146362305, "global_step": 149825, "epoch": 1238} {"train_loss": -39.2700080871582, "global_step": 149826, "epoch": 1238} {"train_loss": -38.59080123901367, "global_step": 149827, "epoch": 1238} {"train_loss": -40.795223236083984, "global_step": 149828, "epoch": 1238} {"train_loss": -40.88384246826172, "global_step": 149829, "epoch": 1238} {"train_loss": -39.91271209716797, "global_step": 149830, "epoch": 1238} {"train_loss": -40.05518341064453, "global_step": 149831, "epoch": 1238} {"train_loss": -39.58799362182617, "global_step": 149832, "epoch": 1238} {"train_loss": -40.92254638671875, "global_step": 149833, "epoch": 1238} {"train_loss": -40.22066116333008, "global_step": 149834, "epoch": 1238} {"train_loss": -39.440948486328125, "global_step": 149835, "epoch": 1238} {"train_loss": -37.77667236328125, "global_step": 149836, "epoch": 1238} {"train_loss": -39.34916305541992, "global_step": 149837, "epoch": 1238} {"train_loss": -40.10200119018555, "global_step": 149838, "epoch": 1238} {"train_loss": -40.24550247192383, "global_step": 149839, "epoch": 1238} {"train_loss": -40.41986846923828, "global_step": 149840, "epoch": 1238} {"train_loss": -39.53739547729492, "global_step": 149841, "epoch": 1238} {"train_loss": -39.124080657958984, "global_step": 149842, "epoch": 1238} {"train_loss": -35.17942428588867, "global_step": 149843, "epoch": 1238} {"train_loss": -38.87038040161133, "global_step": 149844, "epoch": 1238} {"train_loss": -35.08063888549805, "global_step": 149845, "epoch": 1238} {"train_loss": -39.956329345703125, "global_step": 149846, "epoch": 1238} {"train_loss": -38.4864387512207, "global_step": 149847, "epoch": 1238} {"train_loss": -38.66892623901367, "global_step": 149848, "epoch": 1238} {"train_loss": -37.6287956237793, "global_step": 149849, "epoch": 1238} {"train_loss": -30.94162940979004, "global_step": 149850, "epoch": 1238} {"train_loss": -28.461700439453125, "global_step": 149851, "epoch": 1238} {"train_loss": -38.19279861450195, "global_step": 149852, "epoch": 1238} {"train_loss": -38.804847717285156, "global_step": 149853, "epoch": 1238} {"train_loss": -35.966552734375, "global_step": 149854, "epoch": 1238} {"train_loss": -37.53022384643555, "global_step": 149855, "epoch": 1238} {"train_loss": -34.90058135986328, "global_step": 149856, "epoch": 1238} {"train_loss": -37.477203369140625, "global_step": 149857, "epoch": 1238} {"train_loss": -36.562129974365234, "global_step": 149858, "epoch": 1238} {"train_loss": -36.077972412109375, "global_step": 149859, "epoch": 1238} {"train_loss": -37.1598014831543, "global_step": 149860, "epoch": 1238} {"train_loss": -37.86469650268555, "global_step": 149861, "epoch": 1238} {"train_loss": -38.187530517578125, "global_step": 149862, "epoch": 1238} {"train_loss": -37.88840103149414, "global_step": 149863, "epoch": 1238} {"train_loss": -38.868438720703125, "global_step": 149864, "epoch": 1238} {"train_loss": -38.884490966796875, "global_step": 149865, "epoch": 1238} {"train_loss": -37.03169250488281, "global_step": 149866, "epoch": 1238} {"train_loss": -37.114341735839844, "global_step": 149867, "epoch": 1238} {"train_loss": -37.937583923339844, "global_step": 149868, "epoch": 1238} {"train_loss": -39.12773895263672, "global_step": 149869, "epoch": 1238} {"train_loss": -39.373435974121094, "global_step": 149870, "epoch": 1238} {"train_loss": -39.50666427612305, "global_step": 149871, "epoch": 1238} {"train_loss": -38.8818473815918, "global_step": 149872, "epoch": 1238} {"train_loss": -39.2304801940918, "global_step": 149873, "epoch": 1238} {"train_loss": -38.60905838012695, "global_step": 149874, "epoch": 1238} {"train_loss": -38.5842170715332, "global_step": 149875, "epoch": 1238} {"train_loss": -38.08028793334961, "global_step": 149876, "epoch": 1238} {"train_loss": -39.49897384643555, "global_step": 149877, "epoch": 1238} {"train_loss": -39.55902099609375, "global_step": 149878, "epoch": 1238} {"train_loss": -39.60187530517578, "global_step": 149879, "epoch": 1238} {"train_loss": -40.16229248046875, "global_step": 149880, "epoch": 1238} {"train_loss": -40.23311996459961, "global_step": 149881, "epoch": 1238} {"train_loss": -39.66549301147461, "global_step": 149882, "epoch": 1238} {"train_loss": -40.44951248168945, "global_step": 149883, "epoch": 1238} {"train_loss": -40.019256591796875, "global_step": 149884, "epoch": 1238} {"train_loss": -40.32417297363281, "global_step": 149885, "epoch": 1238} {"train_loss": -39.97488021850586, "global_step": 149886, "epoch": 1238} {"train_loss": -40.567909240722656, "global_step": 149887, "epoch": 1238} {"train_loss": -40.17843246459961, "global_step": 149888, "epoch": 1238} {"train_loss": -40.70450973510742, "global_step": 149889, "epoch": 1238} {"train_loss": -40.513221740722656, "global_step": 149890, "epoch": 1238} {"train_loss": -40.19939422607422, "global_step": 149891, "epoch": 1238} {"train_loss": -40.314666748046875, "global_step": 149892, "epoch": 1238} {"train_loss": -41.011898040771484, "global_step": 149893, "epoch": 1238} {"train_loss": -40.15566635131836, "global_step": 149894, "epoch": 1238} {"train_loss": -40.32766342163086, "global_step": 149895, "epoch": 1238} {"train_loss": -40.786888122558594, "global_step": 149896, "epoch": 1238} {"train_loss": -40.544837951660156, "global_step": 149897, "epoch": 1238} {"train_loss": -41.02286911010742, "global_step": 149898, "epoch": 1238} {"train_loss": -40.71128845214844, "global_step": 149899, "epoch": 1238} {"train_loss": -40.387821197509766, "global_step": 149900, "epoch": 1238} {"train_loss": -40.04273223876953, "global_step": 149901, "epoch": 1238} {"train_loss": -39.946102142333984, "global_step": 149902, "epoch": 1238} {"train_loss": -39.912452697753906, "global_step": 149903, "epoch": 1238} {"train_loss": -40.65581512451172, "global_step": 149904, "epoch": 1238} {"train_loss": -40.27854537963867, "global_step": 149905, "epoch": 1238} {"train_loss": -38.19515609741211, "global_step": 149906, "epoch": 1238} {"train_loss": -40.124114990234375, "global_step": 149907, "epoch": 1238} {"train_loss": -40.93691635131836, "global_step": 149908, "epoch": 1238} {"train_loss": -39.087215423583984, "global_step": 149909, "epoch": 1238} {"train_loss": -38.066715240478516, "global_step": 149910, "epoch": 1238} {"train_loss": -40.1940803527832, "global_step": 149911, "epoch": 1238} {"train_loss": -40.27645492553711, "global_step": 149912, "epoch": 1238} {"train_loss": -39.57949447631836, "global_step": 149913, "epoch": 1238} {"train_loss": -40.20534896850586, "global_step": 149914, "epoch": 1238} {"train_loss": -39.53118896484375, "global_step": 149915, "epoch": 1238} {"train_loss": -40.131046295166016, "global_step": 149916, "epoch": 1238} {"train_loss": -40.698097229003906, "global_step": 149917, "epoch": 1238} {"train_loss": -39.360313147552745, "global_step": 149918, "epoch": 1238, "val_loss": 2786970.0} {"train_loss": -40.29207992553711, "global_step": 149919, "epoch": 1239} {"train_loss": -40.32246017456055, "global_step": 149920, "epoch": 1239} {"train_loss": -40.09540557861328, "global_step": 149921, "epoch": 1239} {"train_loss": -40.44236373901367, "global_step": 149922, "epoch": 1239} {"train_loss": -40.70627975463867, "global_step": 149923, "epoch": 1239} {"train_loss": -40.54777526855469, "global_step": 149924, "epoch": 1239} {"train_loss": -40.76847457885742, "global_step": 149925, "epoch": 1239} {"train_loss": -41.20623779296875, "global_step": 149926, "epoch": 1239} {"train_loss": -40.75916290283203, "global_step": 149927, "epoch": 1239} {"train_loss": -41.13249206542969, "global_step": 149928, "epoch": 1239} {"train_loss": -41.4371223449707, "global_step": 149929, "epoch": 1239} {"train_loss": -40.70907211303711, "global_step": 149930, "epoch": 1239} {"train_loss": -40.50458908081055, "global_step": 149931, "epoch": 1239} {"train_loss": -40.47187805175781, "global_step": 149932, "epoch": 1239} {"train_loss": -40.724849700927734, "global_step": 149933, "epoch": 1239} {"train_loss": -39.685054779052734, "global_step": 149934, "epoch": 1239} {"train_loss": -40.688899993896484, "global_step": 149935, "epoch": 1239} {"train_loss": -40.97541427612305, "global_step": 149936, "epoch": 1239} {"train_loss": -41.18955612182617, "global_step": 149937, "epoch": 1239} {"train_loss": -40.7308349609375, "global_step": 149938, "epoch": 1239} {"train_loss": -40.80296325683594, "global_step": 149939, "epoch": 1239} {"train_loss": -40.512413024902344, "global_step": 149940, "epoch": 1239} {"train_loss": -41.00395202636719, "global_step": 149941, "epoch": 1239} {"train_loss": -39.72565841674805, "global_step": 149942, "epoch": 1239} {"train_loss": -39.1779670715332, "global_step": 149943, "epoch": 1239} {"train_loss": -39.63118362426758, "global_step": 149944, "epoch": 1239} {"train_loss": -40.500465393066406, "global_step": 149945, "epoch": 1239} {"train_loss": -41.279930114746094, "global_step": 149946, "epoch": 1239} {"train_loss": -40.89994430541992, "global_step": 149947, "epoch": 1239} {"train_loss": -39.84322738647461, "global_step": 149948, "epoch": 1239} {"train_loss": -39.90421676635742, "global_step": 149949, "epoch": 1239} {"train_loss": -40.305458068847656, "global_step": 149950, "epoch": 1239} {"train_loss": -40.792144775390625, "global_step": 149951, "epoch": 1239} {"train_loss": -40.97145462036133, "global_step": 149952, "epoch": 1239} {"train_loss": -41.29989242553711, "global_step": 149953, "epoch": 1239} {"train_loss": -40.82444381713867, "global_step": 149954, "epoch": 1239} {"train_loss": -41.096778869628906, "global_step": 149955, "epoch": 1239} {"train_loss": -41.27930450439453, "global_step": 149956, "epoch": 1239} {"train_loss": -41.36821365356445, "global_step": 149957, "epoch": 1239} {"train_loss": -41.026912689208984, "global_step": 149958, "epoch": 1239} {"train_loss": -39.689144134521484, "global_step": 149959, "epoch": 1239} {"train_loss": -39.5131950378418, "global_step": 149960, "epoch": 1239} {"train_loss": -39.52689743041992, "global_step": 149961, "epoch": 1239} {"train_loss": -40.027950286865234, "global_step": 149962, "epoch": 1239} {"train_loss": -40.6452522277832, "global_step": 149963, "epoch": 1239} {"train_loss": -41.20996856689453, "global_step": 149964, "epoch": 1239} {"train_loss": -41.29914474487305, "global_step": 149965, "epoch": 1239} {"train_loss": -40.47841262817383, "global_step": 149966, "epoch": 1239} {"train_loss": -40.696475982666016, "global_step": 149967, "epoch": 1239} {"train_loss": -40.135372161865234, "global_step": 149968, "epoch": 1239} {"train_loss": -40.63833236694336, "global_step": 149969, "epoch": 1239} {"train_loss": -40.49973678588867, "global_step": 149970, "epoch": 1239} {"train_loss": -40.95154571533203, "global_step": 149971, "epoch": 1239} {"train_loss": -41.08784103393555, "global_step": 149972, "epoch": 1239} {"train_loss": -41.09957504272461, "global_step": 149973, "epoch": 1239} {"train_loss": -39.773921966552734, "global_step": 149974, "epoch": 1239} {"train_loss": -40.52576446533203, "global_step": 149975, "epoch": 1239} {"train_loss": -40.29375457763672, "global_step": 149976, "epoch": 1239} {"train_loss": -39.1411018371582, "global_step": 149977, "epoch": 1239} {"train_loss": -38.928016662597656, "global_step": 149978, "epoch": 1239} {"train_loss": -40.22233200073242, "global_step": 149979, "epoch": 1239} {"train_loss": -40.44313430786133, "global_step": 149980, "epoch": 1239} {"train_loss": -40.3023681640625, "global_step": 149981, "epoch": 1239} {"train_loss": -37.683284759521484, "global_step": 149982, "epoch": 1239} {"train_loss": -38.23649215698242, "global_step": 149983, "epoch": 1239} {"train_loss": -41.05101013183594, "global_step": 149984, "epoch": 1239} {"train_loss": -40.41286087036133, "global_step": 149985, "epoch": 1239} {"train_loss": -38.42170333862305, "global_step": 149986, "epoch": 1239} {"train_loss": -38.06624984741211, "global_step": 149987, "epoch": 1239} {"train_loss": -40.36017990112305, "global_step": 149988, "epoch": 1239} {"train_loss": -37.49781036376953, "global_step": 149989, "epoch": 1239} {"train_loss": -38.49013900756836, "global_step": 149990, "epoch": 1239} {"train_loss": -40.394287109375, "global_step": 149991, "epoch": 1239} {"train_loss": -39.72156524658203, "global_step": 149992, "epoch": 1239} {"train_loss": -39.921993255615234, "global_step": 149993, "epoch": 1239} {"train_loss": -40.860347747802734, "global_step": 149994, "epoch": 1239} {"train_loss": -40.018619537353516, "global_step": 149995, "epoch": 1239} {"train_loss": -40.6366081237793, "global_step": 149996, "epoch": 1239} {"train_loss": -40.87158966064453, "global_step": 149997, "epoch": 1239} {"train_loss": -40.50087356567383, "global_step": 149998, "epoch": 1239} {"train_loss": -41.23093795776367, "global_step": 149999, "epoch": 1239} {"train_loss": -39.88217544555664, "global_step": 150000, "epoch": 1239} {"train_loss": -40.06102752685547, "global_step": 150001, "epoch": 1239} {"train_loss": -40.93795394897461, "global_step": 150002, "epoch": 1239} {"train_loss": -40.70219802856445, "global_step": 150003, "epoch": 1239} {"train_loss": -40.14064025878906, "global_step": 150004, "epoch": 1239} {"train_loss": -40.471717834472656, "global_step": 150005, "epoch": 1239} {"train_loss": -40.89535140991211, "global_step": 150006, "epoch": 1239} {"train_loss": -41.044891357421875, "global_step": 150007, "epoch": 1239} {"train_loss": -39.988040924072266, "global_step": 150008, "epoch": 1239} {"train_loss": -40.66699981689453, "global_step": 150009, "epoch": 1239} {"train_loss": -40.605140686035156, "global_step": 150010, "epoch": 1239} {"train_loss": -41.16352462768555, "global_step": 150011, "epoch": 1239} {"train_loss": -40.56184005737305, "global_step": 150012, "epoch": 1239} {"train_loss": -40.671348571777344, "global_step": 150013, "epoch": 1239} {"train_loss": -40.67512512207031, "global_step": 150014, "epoch": 1239} {"train_loss": -41.29168701171875, "global_step": 150015, "epoch": 1239} {"train_loss": -41.3312873840332, "global_step": 150016, "epoch": 1239} {"train_loss": -41.188053131103516, "global_step": 150017, "epoch": 1239} {"train_loss": -41.66184997558594, "global_step": 150018, "epoch": 1239} {"train_loss": -41.0828857421875, "global_step": 150019, "epoch": 1239} {"train_loss": -40.135311126708984, "global_step": 150020, "epoch": 1239} {"train_loss": -40.56907272338867, "global_step": 150021, "epoch": 1239} {"train_loss": -40.533935546875, "global_step": 150022, "epoch": 1239} {"train_loss": -40.766075134277344, "global_step": 150023, "epoch": 1239} {"train_loss": -41.267822265625, "global_step": 150024, "epoch": 1239} {"train_loss": -40.23605728149414, "global_step": 150025, "epoch": 1239} {"train_loss": -40.638858795166016, "global_step": 150026, "epoch": 1239} {"train_loss": -40.0401725769043, "global_step": 150027, "epoch": 1239} {"train_loss": -40.27555847167969, "global_step": 150028, "epoch": 1239} {"train_loss": -39.6531867980957, "global_step": 150029, "epoch": 1239} {"train_loss": -37.81208419799805, "global_step": 150030, "epoch": 1239} {"train_loss": -38.90191650390625, "global_step": 150031, "epoch": 1239} {"train_loss": -39.94902420043945, "global_step": 150032, "epoch": 1239} {"train_loss": -40.1367073059082, "global_step": 150033, "epoch": 1239} {"train_loss": -39.463863372802734, "global_step": 150034, "epoch": 1239} {"train_loss": -39.99420166015625, "global_step": 150035, "epoch": 1239} {"train_loss": -38.363311767578125, "global_step": 150036, "epoch": 1239} {"train_loss": -39.87088394165039, "global_step": 150037, "epoch": 1239} {"train_loss": -40.1671257019043, "global_step": 150038, "epoch": 1239} {"train_loss": -40.334343776229986, "global_step": 150039, "epoch": 1239, "val_loss": 2710927.5} {"train_loss": -39.3022575378418, "global_step": 150040, "epoch": 1240} {"train_loss": -40.50693893432617, "global_step": 150041, "epoch": 1240} {"train_loss": -39.39347457885742, "global_step": 150042, "epoch": 1240} {"train_loss": -39.89876174926758, "global_step": 150043, "epoch": 1240} {"train_loss": -39.177547454833984, "global_step": 150044, "epoch": 1240} {"train_loss": -40.26546859741211, "global_step": 150045, "epoch": 1240} {"train_loss": -40.328582763671875, "global_step": 150046, "epoch": 1240} {"train_loss": -40.16990661621094, "global_step": 150047, "epoch": 1240} {"train_loss": -39.71059799194336, "global_step": 150048, "epoch": 1240} {"train_loss": -40.58503723144531, "global_step": 150049, "epoch": 1240} {"train_loss": -41.09333038330078, "global_step": 150050, "epoch": 1240} {"train_loss": -40.811744689941406, "global_step": 150051, "epoch": 1240} {"train_loss": -39.76190185546875, "global_step": 150052, "epoch": 1240} {"train_loss": -40.58274459838867, "global_step": 150053, "epoch": 1240} {"train_loss": -40.31838607788086, "global_step": 150054, "epoch": 1240} {"train_loss": -41.179115295410156, "global_step": 150055, "epoch": 1240} {"train_loss": -40.51827621459961, "global_step": 150056, "epoch": 1240} {"train_loss": -40.5760612487793, "global_step": 150057, "epoch": 1240} {"train_loss": -40.87102127075195, "global_step": 150058, "epoch": 1240} {"train_loss": -40.675331115722656, "global_step": 150059, "epoch": 1240} {"train_loss": -40.03469467163086, "global_step": 150060, "epoch": 1240} {"train_loss": -41.47929000854492, "global_step": 150061, "epoch": 1240} {"train_loss": -40.52736282348633, "global_step": 150062, "epoch": 1240} {"train_loss": -41.15134048461914, "global_step": 150063, "epoch": 1240} {"train_loss": -41.154212951660156, "global_step": 150064, "epoch": 1240} {"train_loss": -39.97007369995117, "global_step": 150065, "epoch": 1240} {"train_loss": -40.59611892700195, "global_step": 150066, "epoch": 1240} {"train_loss": -40.5264778137207, "global_step": 150067, "epoch": 1240} {"train_loss": -40.890899658203125, "global_step": 150068, "epoch": 1240} {"train_loss": -40.60898208618164, "global_step": 150069, "epoch": 1240} {"train_loss": -41.05356979370117, "global_step": 150070, "epoch": 1240} {"train_loss": -41.6487922668457, "global_step": 150071, "epoch": 1240} {"train_loss": -41.19761276245117, "global_step": 150072, "epoch": 1240} {"train_loss": -40.88045120239258, "global_step": 150073, "epoch": 1240} {"train_loss": -41.853614807128906, "global_step": 150074, "epoch": 1240} {"train_loss": -41.12619400024414, "global_step": 150075, "epoch": 1240} {"train_loss": -40.525474548339844, "global_step": 150076, "epoch": 1240} {"train_loss": -40.86323165893555, "global_step": 150077, "epoch": 1240} {"train_loss": -41.03683090209961, "global_step": 150078, "epoch": 1240} {"train_loss": -40.273468017578125, "global_step": 150079, "epoch": 1240} {"train_loss": -41.034523010253906, "global_step": 150080, "epoch": 1240} {"train_loss": -41.07788848876953, "global_step": 150081, "epoch": 1240} {"train_loss": -40.735530853271484, "global_step": 150082, "epoch": 1240} {"train_loss": -40.021785736083984, "global_step": 150083, "epoch": 1240} {"train_loss": -40.83204650878906, "global_step": 150084, "epoch": 1240} {"train_loss": -40.96705627441406, "global_step": 150085, "epoch": 1240} {"train_loss": -41.35223388671875, "global_step": 150086, "epoch": 1240} {"train_loss": -39.81706619262695, "global_step": 150087, "epoch": 1240} {"train_loss": -38.42625427246094, "global_step": 150088, "epoch": 1240} {"train_loss": -40.883544921875, "global_step": 150089, "epoch": 1240} {"train_loss": -41.36963653564453, "global_step": 150090, "epoch": 1240} {"train_loss": -40.87744903564453, "global_step": 150091, "epoch": 1240} {"train_loss": -41.142757415771484, "global_step": 150092, "epoch": 1240} {"train_loss": -41.57053756713867, "global_step": 150093, "epoch": 1240} {"train_loss": -41.01221466064453, "global_step": 150094, "epoch": 1240} {"train_loss": -39.65766525268555, "global_step": 150095, "epoch": 1240} {"train_loss": -40.05424499511719, "global_step": 150096, "epoch": 1240} {"train_loss": -41.38169479370117, "global_step": 150097, "epoch": 1240} {"train_loss": -41.30887985229492, "global_step": 150098, "epoch": 1240} {"train_loss": -40.45646667480469, "global_step": 150099, "epoch": 1240} {"train_loss": -41.05999755859375, "global_step": 150100, "epoch": 1240} {"train_loss": -41.12910842895508, "global_step": 150101, "epoch": 1240} {"train_loss": -40.981136322021484, "global_step": 150102, "epoch": 1240} {"train_loss": -40.34187698364258, "global_step": 150103, "epoch": 1240} {"train_loss": -39.42558670043945, "global_step": 150104, "epoch": 1240} {"train_loss": -41.162841796875, "global_step": 150105, "epoch": 1240} {"train_loss": -40.70283889770508, "global_step": 150106, "epoch": 1240} {"train_loss": -38.998817443847656, "global_step": 150107, "epoch": 1240} {"train_loss": -40.8887825012207, "global_step": 150108, "epoch": 1240} {"train_loss": -41.34571075439453, "global_step": 150109, "epoch": 1240} {"train_loss": -39.25019454956055, "global_step": 150110, "epoch": 1240} {"train_loss": -41.103267669677734, "global_step": 150111, "epoch": 1240} {"train_loss": -40.88294219970703, "global_step": 150112, "epoch": 1240} {"train_loss": -38.8342399597168, "global_step": 150113, "epoch": 1240} {"train_loss": -40.235591888427734, "global_step": 150114, "epoch": 1240} {"train_loss": -40.98795700073242, "global_step": 150115, "epoch": 1240} {"train_loss": -38.904754638671875, "global_step": 150116, "epoch": 1240} {"train_loss": -40.50929641723633, "global_step": 150117, "epoch": 1240} {"train_loss": -40.88518142700195, "global_step": 150118, "epoch": 1240} {"train_loss": -40.6215934753418, "global_step": 150119, "epoch": 1240} {"train_loss": -40.236083984375, "global_step": 150120, "epoch": 1240} {"train_loss": -41.239078521728516, "global_step": 150121, "epoch": 1240} {"train_loss": -39.52476119995117, "global_step": 150122, "epoch": 1240} {"train_loss": -40.40593338012695, "global_step": 150123, "epoch": 1240} {"train_loss": -39.756866455078125, "global_step": 150124, "epoch": 1240} {"train_loss": -40.0699348449707, "global_step": 150125, "epoch": 1240} {"train_loss": -40.21554946899414, "global_step": 150126, "epoch": 1240} {"train_loss": -39.66046142578125, "global_step": 150127, "epoch": 1240} {"train_loss": -40.04453659057617, "global_step": 150128, "epoch": 1240} {"train_loss": -40.223323822021484, "global_step": 150129, "epoch": 1240} {"train_loss": -38.37966537475586, "global_step": 150130, "epoch": 1240} {"train_loss": -39.73194122314453, "global_step": 150131, "epoch": 1240} {"train_loss": -39.87872314453125, "global_step": 150132, "epoch": 1240} {"train_loss": -39.92169189453125, "global_step": 150133, "epoch": 1240} {"train_loss": -38.526222229003906, "global_step": 150134, "epoch": 1240} {"train_loss": -38.73963928222656, "global_step": 150135, "epoch": 1240} {"train_loss": -36.650367736816406, "global_step": 150136, "epoch": 1240} {"train_loss": -38.252254486083984, "global_step": 150137, "epoch": 1240} {"train_loss": -39.7845573425293, "global_step": 150138, "epoch": 1240} {"train_loss": -38.43890380859375, "global_step": 150139, "epoch": 1240} {"train_loss": -38.2019157409668, "global_step": 150140, "epoch": 1240} {"train_loss": -40.094215393066406, "global_step": 150141, "epoch": 1240} {"train_loss": -40.476470947265625, "global_step": 150142, "epoch": 1240} {"train_loss": -40.33313751220703, "global_step": 150143, "epoch": 1240} {"train_loss": -38.358367919921875, "global_step": 150144, "epoch": 1240} {"train_loss": -38.294288635253906, "global_step": 150145, "epoch": 1240} {"train_loss": -40.44129180908203, "global_step": 150146, "epoch": 1240} {"train_loss": -40.106658935546875, "global_step": 150147, "epoch": 1240} {"train_loss": -39.1436882019043, "global_step": 150148, "epoch": 1240} {"train_loss": -40.095149993896484, "global_step": 150149, "epoch": 1240} {"train_loss": -40.632747650146484, "global_step": 150150, "epoch": 1240} {"train_loss": -39.69131851196289, "global_step": 150151, "epoch": 1240} {"train_loss": -40.158382415771484, "global_step": 150152, "epoch": 1240} {"train_loss": -40.17984390258789, "global_step": 150153, "epoch": 1240} {"train_loss": -40.21025466918945, "global_step": 150154, "epoch": 1240} {"train_loss": -40.04785919189453, "global_step": 150155, "epoch": 1240} {"train_loss": -40.39765167236328, "global_step": 150156, "epoch": 1240} {"train_loss": -40.0936279296875, "global_step": 150157, "epoch": 1240} {"train_loss": -40.61179733276367, "global_step": 150158, "epoch": 1240} {"train_loss": -39.87870407104492, "global_step": 150159, "epoch": 1240} {"train_loss": -40.273405090836455, "global_step": 150160, "epoch": 1240, "val_loss": 2652694.25} {"train_loss": -40.85258483886719, "global_step": 150161, "epoch": 1241} {"train_loss": -40.20736312866211, "global_step": 150162, "epoch": 1241} {"train_loss": -40.99211502075195, "global_step": 150163, "epoch": 1241} {"train_loss": -40.564632415771484, "global_step": 150164, "epoch": 1241} {"train_loss": -40.93574142456055, "global_step": 150165, "epoch": 1241} {"train_loss": -40.59146499633789, "global_step": 150166, "epoch": 1241} {"train_loss": -40.617919921875, "global_step": 150167, "epoch": 1241} {"train_loss": -41.20603561401367, "global_step": 150168, "epoch": 1241} {"train_loss": -40.25654602050781, "global_step": 150169, "epoch": 1241} {"train_loss": -40.96683120727539, "global_step": 150170, "epoch": 1241} {"train_loss": -41.12229919433594, "global_step": 150171, "epoch": 1241} {"train_loss": -41.0893669128418, "global_step": 150172, "epoch": 1241} {"train_loss": -41.28757095336914, "global_step": 150173, "epoch": 1241} {"train_loss": -40.69696807861328, "global_step": 150174, "epoch": 1241} {"train_loss": -41.44091796875, "global_step": 150175, "epoch": 1241} {"train_loss": -40.161468505859375, "global_step": 150176, "epoch": 1241} {"train_loss": -41.12007522583008, "global_step": 150177, "epoch": 1241} {"train_loss": -40.27857208251953, "global_step": 150178, "epoch": 1241} {"train_loss": -40.64297866821289, "global_step": 150179, "epoch": 1241} {"train_loss": -39.72870635986328, "global_step": 150180, "epoch": 1241} {"train_loss": -36.96904373168945, "global_step": 150181, "epoch": 1241} {"train_loss": -39.46382141113281, "global_step": 150182, "epoch": 1241} {"train_loss": -40.529754638671875, "global_step": 150183, "epoch": 1241} {"train_loss": -39.978878021240234, "global_step": 150184, "epoch": 1241} {"train_loss": -39.5773811340332, "global_step": 150185, "epoch": 1241} {"train_loss": -41.61141586303711, "global_step": 150186, "epoch": 1241} {"train_loss": -39.96148681640625, "global_step": 150187, "epoch": 1241} {"train_loss": -40.119686126708984, "global_step": 150188, "epoch": 1241} {"train_loss": -41.07051467895508, "global_step": 150189, "epoch": 1241} {"train_loss": -40.14305877685547, "global_step": 150190, "epoch": 1241} {"train_loss": -40.46277618408203, "global_step": 150191, "epoch": 1241} {"train_loss": -40.850746154785156, "global_step": 150192, "epoch": 1241} {"train_loss": -40.15699005126953, "global_step": 150193, "epoch": 1241} {"train_loss": -40.06064987182617, "global_step": 150194, "epoch": 1241} {"train_loss": -41.147918701171875, "global_step": 150195, "epoch": 1241} {"train_loss": -40.09259033203125, "global_step": 150196, "epoch": 1241} {"train_loss": -41.21856689453125, "global_step": 150197, "epoch": 1241} {"train_loss": -38.755489349365234, "global_step": 150198, "epoch": 1241} {"train_loss": -40.11463928222656, "global_step": 150199, "epoch": 1241} {"train_loss": -39.796104431152344, "global_step": 150200, "epoch": 1241} {"train_loss": -38.91779708862305, "global_step": 150201, "epoch": 1241} {"train_loss": -38.97385787963867, "global_step": 150202, "epoch": 1241} {"train_loss": -39.535152435302734, "global_step": 150203, "epoch": 1241} {"train_loss": -39.20075225830078, "global_step": 150204, "epoch": 1241} {"train_loss": -39.808013916015625, "global_step": 150205, "epoch": 1241} {"train_loss": -39.92106246948242, "global_step": 150206, "epoch": 1241} {"train_loss": -39.117034912109375, "global_step": 150207, "epoch": 1241} {"train_loss": -40.616065979003906, "global_step": 150208, "epoch": 1241} {"train_loss": -40.586822509765625, "global_step": 150209, "epoch": 1241} {"train_loss": -39.33737564086914, "global_step": 150210, "epoch": 1241} {"train_loss": -41.378456115722656, "global_step": 150211, "epoch": 1241} {"train_loss": -40.221824645996094, "global_step": 150212, "epoch": 1241} {"train_loss": -40.60317611694336, "global_step": 150213, "epoch": 1241} {"train_loss": -40.84542465209961, "global_step": 150214, "epoch": 1241} {"train_loss": -40.98564147949219, "global_step": 150215, "epoch": 1241} {"train_loss": -40.701961517333984, "global_step": 150216, "epoch": 1241} {"train_loss": -40.762447357177734, "global_step": 150217, "epoch": 1241} {"train_loss": -40.71046829223633, "global_step": 150218, "epoch": 1241} {"train_loss": -41.0554084777832, "global_step": 150219, "epoch": 1241} {"train_loss": -40.50795364379883, "global_step": 150220, "epoch": 1241} {"train_loss": -41.222267150878906, "global_step": 150221, "epoch": 1241} {"train_loss": -40.78152847290039, "global_step": 150222, "epoch": 1241} {"train_loss": -41.128936767578125, "global_step": 150223, "epoch": 1241} {"train_loss": -41.097930908203125, "global_step": 150224, "epoch": 1241} {"train_loss": -40.78607940673828, "global_step": 150225, "epoch": 1241} {"train_loss": -40.54182052612305, "global_step": 150226, "epoch": 1241} {"train_loss": -41.24262237548828, "global_step": 150227, "epoch": 1241} {"train_loss": -41.34836959838867, "global_step": 150228, "epoch": 1241} {"train_loss": -41.24141311645508, "global_step": 150229, "epoch": 1241} {"train_loss": -41.36394500732422, "global_step": 150230, "epoch": 1241} {"train_loss": -40.7802848815918, "global_step": 150231, "epoch": 1241} {"train_loss": -41.1213493347168, "global_step": 150232, "epoch": 1241} {"train_loss": -41.3120231628418, "global_step": 150233, "epoch": 1241} {"train_loss": -41.56975173950195, "global_step": 150234, "epoch": 1241} {"train_loss": -41.00330352783203, "global_step": 150235, "epoch": 1241} {"train_loss": -41.07094955444336, "global_step": 150236, "epoch": 1241} {"train_loss": -41.01737594604492, "global_step": 150237, "epoch": 1241} {"train_loss": -42.02684020996094, "global_step": 150238, "epoch": 1241} {"train_loss": -41.722633361816406, "global_step": 150239, "epoch": 1241} {"train_loss": -41.350250244140625, "global_step": 150240, "epoch": 1241} {"train_loss": -40.99471664428711, "global_step": 150241, "epoch": 1241} {"train_loss": -39.586463928222656, "global_step": 150242, "epoch": 1241} {"train_loss": -37.0135498046875, "global_step": 150243, "epoch": 1241} {"train_loss": -38.76993942260742, "global_step": 150244, "epoch": 1241} {"train_loss": -39.8807487487793, "global_step": 150245, "epoch": 1241} {"train_loss": -41.64534378051758, "global_step": 150246, "epoch": 1241} {"train_loss": -39.983699798583984, "global_step": 150247, "epoch": 1241} {"train_loss": -36.9197998046875, "global_step": 150248, "epoch": 1241} {"train_loss": -38.393314361572266, "global_step": 150249, "epoch": 1241} {"train_loss": -40.86932373046875, "global_step": 150250, "epoch": 1241} {"train_loss": -40.64866256713867, "global_step": 150251, "epoch": 1241} {"train_loss": -39.33486557006836, "global_step": 150252, "epoch": 1241} {"train_loss": -40.855751037597656, "global_step": 150253, "epoch": 1241} {"train_loss": -41.30940628051758, "global_step": 150254, "epoch": 1241} {"train_loss": -39.46427536010742, "global_step": 150255, "epoch": 1241} {"train_loss": -38.69486618041992, "global_step": 150256, "epoch": 1241} {"train_loss": -41.294795989990234, "global_step": 150257, "epoch": 1241} {"train_loss": -40.45682907104492, "global_step": 150258, "epoch": 1241} {"train_loss": -40.99640655517578, "global_step": 150259, "epoch": 1241} {"train_loss": -41.41250991821289, "global_step": 150260, "epoch": 1241} {"train_loss": -40.37607955932617, "global_step": 150261, "epoch": 1241} {"train_loss": -41.240352630615234, "global_step": 150262, "epoch": 1241} {"train_loss": -41.168128967285156, "global_step": 150263, "epoch": 1241} {"train_loss": -40.94253921508789, "global_step": 150264, "epoch": 1241} {"train_loss": -41.246498107910156, "global_step": 150265, "epoch": 1241} {"train_loss": -41.15811538696289, "global_step": 150266, "epoch": 1241} {"train_loss": -41.66917037963867, "global_step": 150267, "epoch": 1241} {"train_loss": -40.14385986328125, "global_step": 150268, "epoch": 1241} {"train_loss": -40.94978713989258, "global_step": 150269, "epoch": 1241} {"train_loss": -40.75235366821289, "global_step": 150270, "epoch": 1241} {"train_loss": -40.53512191772461, "global_step": 150271, "epoch": 1241} {"train_loss": -41.15470504760742, "global_step": 150272, "epoch": 1241} {"train_loss": -40.70866012573242, "global_step": 150273, "epoch": 1241} {"train_loss": -41.284847259521484, "global_step": 150274, "epoch": 1241} {"train_loss": -40.99616622924805, "global_step": 150275, "epoch": 1241} {"train_loss": -37.85649108886719, "global_step": 150276, "epoch": 1241} {"train_loss": -37.89829635620117, "global_step": 150277, "epoch": 1241} {"train_loss": -39.36408233642578, "global_step": 150278, "epoch": 1241} {"train_loss": -39.10703659057617, "global_step": 150279, "epoch": 1241} {"train_loss": -37.44012451171875, "global_step": 150280, "epoch": 1241} {"train_loss": -40.399908743614006, "global_step": 150281, "epoch": 1241, "val_loss": 2505420.5} {"train_loss": -37.19882583618164, "global_step": 150282, "epoch": 1242} {"train_loss": -33.33803939819336, "global_step": 150283, "epoch": 1242} {"train_loss": -35.85157012939453, "global_step": 150284, "epoch": 1242} {"train_loss": -32.09528350830078, "global_step": 150285, "epoch": 1242} {"train_loss": -35.38489532470703, "global_step": 150286, "epoch": 1242} {"train_loss": -36.21010971069336, "global_step": 150287, "epoch": 1242} {"train_loss": -35.98893356323242, "global_step": 150288, "epoch": 1242} {"train_loss": -34.94380569458008, "global_step": 150289, "epoch": 1242} {"train_loss": -36.90102005004883, "global_step": 150290, "epoch": 1242} {"train_loss": -36.81422424316406, "global_step": 150291, "epoch": 1242} {"train_loss": -38.395957946777344, "global_step": 150292, "epoch": 1242} {"train_loss": -39.088558197021484, "global_step": 150293, "epoch": 1242} {"train_loss": -38.1620979309082, "global_step": 150294, "epoch": 1242} {"train_loss": -39.8183708190918, "global_step": 150295, "epoch": 1242} {"train_loss": -38.13119125366211, "global_step": 150296, "epoch": 1242} {"train_loss": -38.82728958129883, "global_step": 150297, "epoch": 1242} {"train_loss": -39.617645263671875, "global_step": 150298, "epoch": 1242} {"train_loss": -39.61420822143555, "global_step": 150299, "epoch": 1242} {"train_loss": -39.972354888916016, "global_step": 150300, "epoch": 1242} {"train_loss": -37.344940185546875, "global_step": 150301, "epoch": 1242} {"train_loss": -38.670562744140625, "global_step": 150302, "epoch": 1242} {"train_loss": -39.17311477661133, "global_step": 150303, "epoch": 1242} {"train_loss": -40.1946907043457, "global_step": 150304, "epoch": 1242} {"train_loss": -39.64289093017578, "global_step": 150305, "epoch": 1242} {"train_loss": -39.27506637573242, "global_step": 150306, "epoch": 1242} {"train_loss": -40.52549362182617, "global_step": 150307, "epoch": 1242} {"train_loss": -37.687007904052734, "global_step": 150308, "epoch": 1242} {"train_loss": -39.23735809326172, "global_step": 150309, "epoch": 1242} {"train_loss": -40.7082633972168, "global_step": 150310, "epoch": 1242} {"train_loss": -39.813026428222656, "global_step": 150311, "epoch": 1242} {"train_loss": -39.57207107543945, "global_step": 150312, "epoch": 1242} {"train_loss": -40.20038986206055, "global_step": 150313, "epoch": 1242} {"train_loss": -40.756629943847656, "global_step": 150314, "epoch": 1242} {"train_loss": -39.85333251953125, "global_step": 150315, "epoch": 1242} {"train_loss": -40.428165435791016, "global_step": 150316, "epoch": 1242} {"train_loss": -40.641841888427734, "global_step": 150317, "epoch": 1242} {"train_loss": -40.23649215698242, "global_step": 150318, "epoch": 1242} {"train_loss": -39.59736633300781, "global_step": 150319, "epoch": 1242} {"train_loss": -40.54018783569336, "global_step": 150320, "epoch": 1242} {"train_loss": -40.21039962768555, "global_step": 150321, "epoch": 1242} {"train_loss": -38.42145919799805, "global_step": 150322, "epoch": 1242} {"train_loss": -40.95349884033203, "global_step": 150323, "epoch": 1242} {"train_loss": -40.47795486450195, "global_step": 150324, "epoch": 1242} {"train_loss": -38.58794021606445, "global_step": 150325, "epoch": 1242} {"train_loss": -38.974056243896484, "global_step": 150326, "epoch": 1242} {"train_loss": -40.78109359741211, "global_step": 150327, "epoch": 1242} {"train_loss": -40.1740608215332, "global_step": 150328, "epoch": 1242} {"train_loss": -39.91435623168945, "global_step": 150329, "epoch": 1242} {"train_loss": -38.88511276245117, "global_step": 150330, "epoch": 1242} {"train_loss": -40.25808334350586, "global_step": 150331, "epoch": 1242} {"train_loss": -38.454505920410156, "global_step": 150332, "epoch": 1242} {"train_loss": -39.476741790771484, "global_step": 150333, "epoch": 1242} {"train_loss": -39.387996673583984, "global_step": 150334, "epoch": 1242} {"train_loss": -37.20769119262695, "global_step": 150335, "epoch": 1242} {"train_loss": -40.36420822143555, "global_step": 150336, "epoch": 1242} {"train_loss": -37.545928955078125, "global_step": 150337, "epoch": 1242} {"train_loss": -40.215545654296875, "global_step": 150338, "epoch": 1242} {"train_loss": -38.311851501464844, "global_step": 150339, "epoch": 1242} {"train_loss": -39.829139709472656, "global_step": 150340, "epoch": 1242} {"train_loss": -39.01282501220703, "global_step": 150341, "epoch": 1242} {"train_loss": -39.92850875854492, "global_step": 150342, "epoch": 1242} {"train_loss": -40.42293167114258, "global_step": 150343, "epoch": 1242} {"train_loss": -39.6744499206543, "global_step": 150344, "epoch": 1242} {"train_loss": -40.951942443847656, "global_step": 150345, "epoch": 1242} {"train_loss": -38.77506637573242, "global_step": 150346, "epoch": 1242} {"train_loss": -40.665897369384766, "global_step": 150347, "epoch": 1242} {"train_loss": -40.60824203491211, "global_step": 150348, "epoch": 1242} {"train_loss": -40.43734359741211, "global_step": 150349, "epoch": 1242} {"train_loss": -40.68154525756836, "global_step": 150350, "epoch": 1242} {"train_loss": -41.060516357421875, "global_step": 150351, "epoch": 1242} {"train_loss": -39.806915283203125, "global_step": 150352, "epoch": 1242} {"train_loss": -40.72007369995117, "global_step": 150353, "epoch": 1242} {"train_loss": -40.67776870727539, "global_step": 150354, "epoch": 1242} {"train_loss": -40.46516036987305, "global_step": 150355, "epoch": 1242} {"train_loss": -40.858646392822266, "global_step": 150356, "epoch": 1242} {"train_loss": -40.66318893432617, "global_step": 150357, "epoch": 1242} {"train_loss": -40.808067321777344, "global_step": 150358, "epoch": 1242} {"train_loss": -40.26057434082031, "global_step": 150359, "epoch": 1242} {"train_loss": -40.86442184448242, "global_step": 150360, "epoch": 1242} {"train_loss": -40.54664993286133, "global_step": 150361, "epoch": 1242} {"train_loss": -40.23417282104492, "global_step": 150362, "epoch": 1242} {"train_loss": -40.2187385559082, "global_step": 150363, "epoch": 1242} {"train_loss": -40.50957489013672, "global_step": 150364, "epoch": 1242} {"train_loss": -40.37367630004883, "global_step": 150365, "epoch": 1242} {"train_loss": -40.65631866455078, "global_step": 150366, "epoch": 1242} {"train_loss": -40.3940544128418, "global_step": 150367, "epoch": 1242} {"train_loss": -39.273983001708984, "global_step": 150368, "epoch": 1242} {"train_loss": -40.675392150878906, "global_step": 150369, "epoch": 1242} {"train_loss": -40.545745849609375, "global_step": 150370, "epoch": 1242} {"train_loss": -40.51032638549805, "global_step": 150371, "epoch": 1242} {"train_loss": -40.68185043334961, "global_step": 150372, "epoch": 1242} {"train_loss": -40.497535705566406, "global_step": 150373, "epoch": 1242} {"train_loss": -41.07086181640625, "global_step": 150374, "epoch": 1242} {"train_loss": -40.75172805786133, "global_step": 150375, "epoch": 1242} {"train_loss": -40.666748046875, "global_step": 150376, "epoch": 1242} {"train_loss": -41.1864128112793, "global_step": 150377, "epoch": 1242} {"train_loss": -41.06826400756836, "global_step": 150378, "epoch": 1242} {"train_loss": -41.09847640991211, "global_step": 150379, "epoch": 1242} {"train_loss": -41.512943267822266, "global_step": 150380, "epoch": 1242} {"train_loss": -41.564632415771484, "global_step": 150381, "epoch": 1242} {"train_loss": -40.97545623779297, "global_step": 150382, "epoch": 1242} {"train_loss": -41.30685043334961, "global_step": 150383, "epoch": 1242} {"train_loss": -41.2574348449707, "global_step": 150384, "epoch": 1242} {"train_loss": -41.234901428222656, "global_step": 150385, "epoch": 1242} {"train_loss": -41.309295654296875, "global_step": 150386, "epoch": 1242} {"train_loss": -41.56551742553711, "global_step": 150387, "epoch": 1242} {"train_loss": -41.32004928588867, "global_step": 150388, "epoch": 1242} {"train_loss": -41.87236785888672, "global_step": 150389, "epoch": 1242} {"train_loss": -41.19846725463867, "global_step": 150390, "epoch": 1242} {"train_loss": -41.57064437866211, "global_step": 150391, "epoch": 1242} {"train_loss": -40.9422721862793, "global_step": 150392, "epoch": 1242} {"train_loss": -41.748104095458984, "global_step": 150393, "epoch": 1242} {"train_loss": -41.366065979003906, "global_step": 150394, "epoch": 1242} {"train_loss": -41.49803161621094, "global_step": 150395, "epoch": 1242} {"train_loss": -41.742286682128906, "global_step": 150396, "epoch": 1242} {"train_loss": -41.7347526550293, "global_step": 150397, "epoch": 1242} {"train_loss": -40.95783233642578, "global_step": 150398, "epoch": 1242} {"train_loss": -41.42055892944336, "global_step": 150399, "epoch": 1242} {"train_loss": -41.680057525634766, "global_step": 150400, "epoch": 1242} {"train_loss": -41.842735290527344, "global_step": 150401, "epoch": 1242} {"train_loss": -39.836203519963036, "global_step": 150402, "epoch": 1242, "val_loss": 2608580.75} {"train_loss": -41.02980041503906, "global_step": 150403, "epoch": 1243} {"train_loss": -41.78058624267578, "global_step": 150404, "epoch": 1243} {"train_loss": -41.739166259765625, "global_step": 150405, "epoch": 1243} {"train_loss": -41.711605072021484, "global_step": 150406, "epoch": 1243} {"train_loss": -41.8486213684082, "global_step": 150407, "epoch": 1243} {"train_loss": -41.77479934692383, "global_step": 150408, "epoch": 1243} {"train_loss": -41.845916748046875, "global_step": 150409, "epoch": 1243} {"train_loss": -41.84882736206055, "global_step": 150410, "epoch": 1243} {"train_loss": -40.457977294921875, "global_step": 150411, "epoch": 1243} {"train_loss": -41.40253829956055, "global_step": 150412, "epoch": 1243} {"train_loss": -40.75946044921875, "global_step": 150413, "epoch": 1243} {"train_loss": -40.81327438354492, "global_step": 150414, "epoch": 1243} {"train_loss": -41.09592819213867, "global_step": 150415, "epoch": 1243} {"train_loss": -40.78001403808594, "global_step": 150416, "epoch": 1243} {"train_loss": -41.24375534057617, "global_step": 150417, "epoch": 1243} {"train_loss": -39.99264144897461, "global_step": 150418, "epoch": 1243} {"train_loss": -42.084110260009766, "global_step": 150419, "epoch": 1243} {"train_loss": -41.933631896972656, "global_step": 150420, "epoch": 1243} {"train_loss": -40.19514083862305, "global_step": 150421, "epoch": 1243} {"train_loss": -40.2723388671875, "global_step": 150422, "epoch": 1243} {"train_loss": -38.70117950439453, "global_step": 150423, "epoch": 1243} {"train_loss": -38.95677185058594, "global_step": 150424, "epoch": 1243} {"train_loss": -41.539283752441406, "global_step": 150425, "epoch": 1243} {"train_loss": -41.58552169799805, "global_step": 150426, "epoch": 1243} {"train_loss": -41.46718215942383, "global_step": 150427, "epoch": 1243} {"train_loss": -41.52854919433594, "global_step": 150428, "epoch": 1243} {"train_loss": -41.26469421386719, "global_step": 150429, "epoch": 1243} {"train_loss": -40.434261322021484, "global_step": 150430, "epoch": 1243} {"train_loss": -41.40456008911133, "global_step": 150431, "epoch": 1243} {"train_loss": -41.11776351928711, "global_step": 150432, "epoch": 1243} {"train_loss": -38.899600982666016, "global_step": 150433, "epoch": 1243} {"train_loss": -41.24039840698242, "global_step": 150434, "epoch": 1243} {"train_loss": -41.131229400634766, "global_step": 150435, "epoch": 1243} {"train_loss": -40.25804138183594, "global_step": 150436, "epoch": 1243} {"train_loss": -40.06868362426758, "global_step": 150437, "epoch": 1243} {"train_loss": -39.97581100463867, "global_step": 150438, "epoch": 1243} {"train_loss": -38.937007904052734, "global_step": 150439, "epoch": 1243} {"train_loss": -38.34893798828125, "global_step": 150440, "epoch": 1243} {"train_loss": -41.3779182434082, "global_step": 150441, "epoch": 1243} {"train_loss": -39.82148361206055, "global_step": 150442, "epoch": 1243} {"train_loss": -39.100807189941406, "global_step": 150443, "epoch": 1243} {"train_loss": -39.999359130859375, "global_step": 150444, "epoch": 1243} {"train_loss": -39.99420166015625, "global_step": 150445, "epoch": 1243} {"train_loss": -39.67373275756836, "global_step": 150446, "epoch": 1243} {"train_loss": -39.29059982299805, "global_step": 150447, "epoch": 1243} {"train_loss": -40.381919860839844, "global_step": 150448, "epoch": 1243} {"train_loss": -39.583648681640625, "global_step": 150449, "epoch": 1243} {"train_loss": -39.63597869873047, "global_step": 150450, "epoch": 1243} {"train_loss": -41.18051528930664, "global_step": 150451, "epoch": 1243} {"train_loss": -39.456886291503906, "global_step": 150452, "epoch": 1243} {"train_loss": -40.044769287109375, "global_step": 150453, "epoch": 1243} {"train_loss": -40.75246810913086, "global_step": 150454, "epoch": 1243} {"train_loss": -40.09295654296875, "global_step": 150455, "epoch": 1243} {"train_loss": -41.13224792480469, "global_step": 150456, "epoch": 1243} {"train_loss": -39.684112548828125, "global_step": 150457, "epoch": 1243} {"train_loss": -40.89512252807617, "global_step": 150458, "epoch": 1243} {"train_loss": -41.015380859375, "global_step": 150459, "epoch": 1243} {"train_loss": -40.12808609008789, "global_step": 150460, "epoch": 1243} {"train_loss": -40.42179489135742, "global_step": 150461, "epoch": 1243} {"train_loss": -39.319541931152344, "global_step": 150462, "epoch": 1243} {"train_loss": -40.917842864990234, "global_step": 150463, "epoch": 1243} {"train_loss": -40.57012939453125, "global_step": 150464, "epoch": 1243} {"train_loss": -39.626224517822266, "global_step": 150465, "epoch": 1243} {"train_loss": -39.5871696472168, "global_step": 150466, "epoch": 1243} {"train_loss": -35.86696243286133, "global_step": 150467, "epoch": 1243} {"train_loss": -38.269508361816406, "global_step": 150468, "epoch": 1243} {"train_loss": -39.17351150512695, "global_step": 150469, "epoch": 1243} {"train_loss": -37.49696731567383, "global_step": 150470, "epoch": 1243} {"train_loss": -40.05889892578125, "global_step": 150471, "epoch": 1243} {"train_loss": -35.75537109375, "global_step": 150472, "epoch": 1243} {"train_loss": -35.150543212890625, "global_step": 150473, "epoch": 1243} {"train_loss": -36.709842681884766, "global_step": 150474, "epoch": 1243} {"train_loss": -37.123016357421875, "global_step": 150475, "epoch": 1243} {"train_loss": -32.83405685424805, "global_step": 150476, "epoch": 1243} {"train_loss": -37.11664581298828, "global_step": 150477, "epoch": 1243} {"train_loss": -36.442134857177734, "global_step": 150478, "epoch": 1243} {"train_loss": -36.86660385131836, "global_step": 150479, "epoch": 1243} {"train_loss": -39.601314544677734, "global_step": 150480, "epoch": 1243} {"train_loss": -36.4141960144043, "global_step": 150481, "epoch": 1243} {"train_loss": -39.85764694213867, "global_step": 150482, "epoch": 1243} {"train_loss": -36.676090240478516, "global_step": 150483, "epoch": 1243} {"train_loss": -36.887176513671875, "global_step": 150484, "epoch": 1243} {"train_loss": -39.37824630737305, "global_step": 150485, "epoch": 1243} {"train_loss": -38.23316192626953, "global_step": 150486, "epoch": 1243} {"train_loss": -37.93131637573242, "global_step": 150487, "epoch": 1243} {"train_loss": -39.14273452758789, "global_step": 150488, "epoch": 1243} {"train_loss": -39.977046966552734, "global_step": 150489, "epoch": 1243} {"train_loss": -38.736698150634766, "global_step": 150490, "epoch": 1243} {"train_loss": -39.36571502685547, "global_step": 150491, "epoch": 1243} {"train_loss": -39.00106430053711, "global_step": 150492, "epoch": 1243} {"train_loss": -39.67943572998047, "global_step": 150493, "epoch": 1243} {"train_loss": -40.28231430053711, "global_step": 150494, "epoch": 1243} {"train_loss": -40.044464111328125, "global_step": 150495, "epoch": 1243} {"train_loss": -39.545230865478516, "global_step": 150496, "epoch": 1243} {"train_loss": -40.192657470703125, "global_step": 150497, "epoch": 1243} {"train_loss": -39.965614318847656, "global_step": 150498, "epoch": 1243} {"train_loss": -40.069610595703125, "global_step": 150499, "epoch": 1243} {"train_loss": -40.371761322021484, "global_step": 150500, "epoch": 1243} {"train_loss": -40.370182037353516, "global_step": 150501, "epoch": 1243} {"train_loss": -39.72159194946289, "global_step": 150502, "epoch": 1243} {"train_loss": -41.169063568115234, "global_step": 150503, "epoch": 1243} {"train_loss": -39.95587158203125, "global_step": 150504, "epoch": 1243} {"train_loss": -40.15464401245117, "global_step": 150505, "epoch": 1243} {"train_loss": -41.0770263671875, "global_step": 150506, "epoch": 1243} {"train_loss": -40.246456146240234, "global_step": 150507, "epoch": 1243} {"train_loss": -40.86128234863281, "global_step": 150508, "epoch": 1243} {"train_loss": -40.275794982910156, "global_step": 150509, "epoch": 1243} {"train_loss": -40.52480697631836, "global_step": 150510, "epoch": 1243} {"train_loss": -41.00445556640625, "global_step": 150511, "epoch": 1243} {"train_loss": -41.234222412109375, "global_step": 150512, "epoch": 1243} {"train_loss": -40.923500061035156, "global_step": 150513, "epoch": 1243} {"train_loss": -41.4235954284668, "global_step": 150514, "epoch": 1243} {"train_loss": -41.166900634765625, "global_step": 150515, "epoch": 1243} {"train_loss": -40.386051177978516, "global_step": 150516, "epoch": 1243} {"train_loss": -41.285194396972656, "global_step": 150517, "epoch": 1243} {"train_loss": -40.73402786254883, "global_step": 150518, "epoch": 1243} {"train_loss": -40.75886917114258, "global_step": 150519, "epoch": 1243} {"train_loss": -39.02744674682617, "global_step": 150520, "epoch": 1243} {"train_loss": -41.52466583251953, "global_step": 150521, "epoch": 1243} {"train_loss": -41.075801849365234, "global_step": 150522, "epoch": 1243} {"train_loss": -39.92293044161205, "global_step": 150523, "epoch": 1243, "val_loss": 2660738.75} {"train_loss": -41.58925247192383, "global_step": 150524, "epoch": 1244} {"train_loss": -41.32759475708008, "global_step": 150525, "epoch": 1244} {"train_loss": -41.390647888183594, "global_step": 150526, "epoch": 1244} {"train_loss": -41.77321243286133, "global_step": 150527, "epoch": 1244} {"train_loss": -41.84259796142578, "global_step": 150528, "epoch": 1244} {"train_loss": -41.06880569458008, "global_step": 150529, "epoch": 1244} {"train_loss": -39.53800582885742, "global_step": 150530, "epoch": 1244} {"train_loss": -41.04055404663086, "global_step": 150531, "epoch": 1244} {"train_loss": -40.42249298095703, "global_step": 150532, "epoch": 1244} {"train_loss": -40.475772857666016, "global_step": 150533, "epoch": 1244} {"train_loss": -39.656429290771484, "global_step": 150534, "epoch": 1244} {"train_loss": -40.0995979309082, "global_step": 150535, "epoch": 1244} {"train_loss": -41.02006912231445, "global_step": 150536, "epoch": 1244} {"train_loss": -39.86294174194336, "global_step": 150537, "epoch": 1244} {"train_loss": -38.54785919189453, "global_step": 150538, "epoch": 1244} {"train_loss": -41.12220001220703, "global_step": 150539, "epoch": 1244} {"train_loss": -41.06781005859375, "global_step": 150540, "epoch": 1244} {"train_loss": -41.22272872924805, "global_step": 150541, "epoch": 1244} {"train_loss": -40.05194854736328, "global_step": 150542, "epoch": 1244} {"train_loss": -40.57396697998047, "global_step": 150543, "epoch": 1244} {"train_loss": -41.27493667602539, "global_step": 150544, "epoch": 1244} {"train_loss": -38.584720611572266, "global_step": 150545, "epoch": 1244} {"train_loss": -39.37233352661133, "global_step": 150546, "epoch": 1244} {"train_loss": -38.72768020629883, "global_step": 150547, "epoch": 1244} {"train_loss": -38.83695983886719, "global_step": 150548, "epoch": 1244} {"train_loss": -37.45222854614258, "global_step": 150549, "epoch": 1244} {"train_loss": -39.43520736694336, "global_step": 150550, "epoch": 1244} {"train_loss": -38.684288024902344, "global_step": 150551, "epoch": 1244} {"train_loss": -40.29582595825195, "global_step": 150552, "epoch": 1244} {"train_loss": -40.53803253173828, "global_step": 150553, "epoch": 1244} {"train_loss": -40.63358688354492, "global_step": 150554, "epoch": 1244} {"train_loss": -40.20377731323242, "global_step": 150555, "epoch": 1244} {"train_loss": -39.38664627075195, "global_step": 150556, "epoch": 1244} {"train_loss": -39.83042526245117, "global_step": 150557, "epoch": 1244} {"train_loss": -39.86855697631836, "global_step": 150558, "epoch": 1244} {"train_loss": -40.0594367980957, "global_step": 150559, "epoch": 1244} {"train_loss": -38.8070182800293, "global_step": 150560, "epoch": 1244} {"train_loss": -39.62033462524414, "global_step": 150561, "epoch": 1244} {"train_loss": -39.43336868286133, "global_step": 150562, "epoch": 1244} {"train_loss": -40.90939712524414, "global_step": 150563, "epoch": 1244} {"train_loss": -40.068946838378906, "global_step": 150564, "epoch": 1244} {"train_loss": -40.535545349121094, "global_step": 150565, "epoch": 1244} {"train_loss": -41.05696487426758, "global_step": 150566, "epoch": 1244} {"train_loss": -40.918609619140625, "global_step": 150567, "epoch": 1244} {"train_loss": -41.18013000488281, "global_step": 150568, "epoch": 1244} {"train_loss": -41.07432174682617, "global_step": 150569, "epoch": 1244} {"train_loss": -41.03010559082031, "global_step": 150570, "epoch": 1244} {"train_loss": -40.75400924682617, "global_step": 150571, "epoch": 1244} {"train_loss": -40.443084716796875, "global_step": 150572, "epoch": 1244} {"train_loss": -40.680179595947266, "global_step": 150573, "epoch": 1244} {"train_loss": -40.137752532958984, "global_step": 150574, "epoch": 1244} {"train_loss": -40.80264663696289, "global_step": 150575, "epoch": 1244} {"train_loss": -39.83894729614258, "global_step": 150576, "epoch": 1244} {"train_loss": -39.75452423095703, "global_step": 150577, "epoch": 1244} {"train_loss": -41.16132354736328, "global_step": 150578, "epoch": 1244} {"train_loss": -39.65552520751953, "global_step": 150579, "epoch": 1244} {"train_loss": -40.52608108520508, "global_step": 150580, "epoch": 1244} {"train_loss": -41.09412384033203, "global_step": 150581, "epoch": 1244} {"train_loss": -40.621639251708984, "global_step": 150582, "epoch": 1244} {"train_loss": -40.88871383666992, "global_step": 150583, "epoch": 1244} {"train_loss": -41.25355911254883, "global_step": 150584, "epoch": 1244} {"train_loss": -41.075584411621094, "global_step": 150585, "epoch": 1244} {"train_loss": -41.29050827026367, "global_step": 150586, "epoch": 1244} {"train_loss": -41.040283203125, "global_step": 150587, "epoch": 1244} {"train_loss": -41.12152862548828, "global_step": 150588, "epoch": 1244} {"train_loss": -41.2131233215332, "global_step": 150589, "epoch": 1244} {"train_loss": -41.502864837646484, "global_step": 150590, "epoch": 1244} {"train_loss": -41.89665603637695, "global_step": 150591, "epoch": 1244} {"train_loss": -41.804725646972656, "global_step": 150592, "epoch": 1244} {"train_loss": -41.50163650512695, "global_step": 150593, "epoch": 1244} {"train_loss": -41.62992477416992, "global_step": 150594, "epoch": 1244} {"train_loss": -41.43119430541992, "global_step": 150595, "epoch": 1244} {"train_loss": -41.440277099609375, "global_step": 150596, "epoch": 1244} {"train_loss": -41.1871452331543, "global_step": 150597, "epoch": 1244} {"train_loss": -41.19111251831055, "global_step": 150598, "epoch": 1244} {"train_loss": -41.08042526245117, "global_step": 150599, "epoch": 1244} {"train_loss": -41.498050689697266, "global_step": 150600, "epoch": 1244} {"train_loss": -40.81138229370117, "global_step": 150601, "epoch": 1244} {"train_loss": -40.82389450073242, "global_step": 150602, "epoch": 1244} {"train_loss": -40.177059173583984, "global_step": 150603, "epoch": 1244} {"train_loss": -39.87427520751953, "global_step": 150604, "epoch": 1244} {"train_loss": -41.523738861083984, "global_step": 150605, "epoch": 1244} {"train_loss": -40.64583969116211, "global_step": 150606, "epoch": 1244} {"train_loss": -40.13910675048828, "global_step": 150607, "epoch": 1244} {"train_loss": -40.570308685302734, "global_step": 150608, "epoch": 1244} {"train_loss": -41.264549255371094, "global_step": 150609, "epoch": 1244} {"train_loss": -39.60657501220703, "global_step": 150610, "epoch": 1244} {"train_loss": -35.191650390625, "global_step": 150611, "epoch": 1244} {"train_loss": -36.774497985839844, "global_step": 150612, "epoch": 1244} {"train_loss": -33.32052230834961, "global_step": 150613, "epoch": 1244} {"train_loss": -10.835713386535645, "global_step": 150614, "epoch": 1244} {"train_loss": -2.9026057720184326, "global_step": 150615, "epoch": 1244} {"train_loss": -16.520370483398438, "global_step": 150616, "epoch": 1244} {"train_loss": -20.89377784729004, "global_step": 150617, "epoch": 1244} {"train_loss": -16.13149070739746, "global_step": 150618, "epoch": 1244} {"train_loss": -24.05430030822754, "global_step": 150619, "epoch": 1244} {"train_loss": -25.468244552612305, "global_step": 150620, "epoch": 1244} {"train_loss": -23.081140518188477, "global_step": 150621, "epoch": 1244} {"train_loss": -27.1373291015625, "global_step": 150622, "epoch": 1244} {"train_loss": -29.66409683227539, "global_step": 150623, "epoch": 1244} {"train_loss": -29.462173461914062, "global_step": 150624, "epoch": 1244} {"train_loss": -25.35048484802246, "global_step": 150625, "epoch": 1244} {"train_loss": -29.863027572631836, "global_step": 150626, "epoch": 1244} {"train_loss": -32.80721664428711, "global_step": 150627, "epoch": 1244} {"train_loss": -30.9569091796875, "global_step": 150628, "epoch": 1244} {"train_loss": -30.139745712280273, "global_step": 150629, "epoch": 1244} {"train_loss": -31.285886764526367, "global_step": 150630, "epoch": 1244} {"train_loss": -32.12916946411133, "global_step": 150631, "epoch": 1244} {"train_loss": -33.02173614501953, "global_step": 150632, "epoch": 1244} {"train_loss": -32.24522018432617, "global_step": 150633, "epoch": 1244} {"train_loss": -31.640348434448242, "global_step": 150634, "epoch": 1244} {"train_loss": -34.00507736206055, "global_step": 150635, "epoch": 1244} {"train_loss": -34.39390182495117, "global_step": 150636, "epoch": 1244} {"train_loss": -35.14720916748047, "global_step": 150637, "epoch": 1244} {"train_loss": -34.21927261352539, "global_step": 150638, "epoch": 1244} {"train_loss": -33.7425651550293, "global_step": 150639, "epoch": 1244} {"train_loss": -34.090431213378906, "global_step": 150640, "epoch": 1244} {"train_loss": -34.305458068847656, "global_step": 150641, "epoch": 1244} {"train_loss": -35.37476348876953, "global_step": 150642, "epoch": 1244} {"train_loss": -35.17612838745117, "global_step": 150643, "epoch": 1244} {"train_loss": -37.29406274645782, "global_step": 150644, "epoch": 1244, "val_loss": 2661924.75} {"train_loss": -34.50324630737305, "global_step": 150645, "epoch": 1245} {"train_loss": -35.34658432006836, "global_step": 150646, "epoch": 1245} {"train_loss": -35.40468978881836, "global_step": 150647, "epoch": 1245} {"train_loss": -35.42580032348633, "global_step": 150648, "epoch": 1245} {"train_loss": -35.11758041381836, "global_step": 150649, "epoch": 1245} {"train_loss": -35.690574645996094, "global_step": 150650, "epoch": 1245} {"train_loss": -35.924842834472656, "global_step": 150651, "epoch": 1245} {"train_loss": -35.47550582885742, "global_step": 150652, "epoch": 1245} {"train_loss": -35.696292877197266, "global_step": 150653, "epoch": 1245} {"train_loss": -36.03404998779297, "global_step": 150654, "epoch": 1245} {"train_loss": -36.41701889038086, "global_step": 150655, "epoch": 1245} {"train_loss": -36.1175422668457, "global_step": 150656, "epoch": 1245} {"train_loss": -36.510799407958984, "global_step": 150657, "epoch": 1245} {"train_loss": -36.7634162902832, "global_step": 150658, "epoch": 1245} {"train_loss": -35.9738883972168, "global_step": 150659, "epoch": 1245} {"train_loss": -36.41356658935547, "global_step": 150660, "epoch": 1245} {"train_loss": -36.55234909057617, "global_step": 150661, "epoch": 1245} {"train_loss": -36.88630676269531, "global_step": 150662, "epoch": 1245} {"train_loss": -36.383460998535156, "global_step": 150663, "epoch": 1245} {"train_loss": -37.229488372802734, "global_step": 150664, "epoch": 1245} {"train_loss": -36.540077209472656, "global_step": 150665, "epoch": 1245} {"train_loss": -36.68282699584961, "global_step": 150666, "epoch": 1245} {"train_loss": -37.1480712890625, "global_step": 150667, "epoch": 1245} {"train_loss": -36.44482421875, "global_step": 150668, "epoch": 1245} {"train_loss": -37.74372482299805, "global_step": 150669, "epoch": 1245} {"train_loss": -36.47309112548828, "global_step": 150670, "epoch": 1245} {"train_loss": -37.52614974975586, "global_step": 150671, "epoch": 1245} {"train_loss": -37.61050033569336, "global_step": 150672, "epoch": 1245} {"train_loss": -38.115325927734375, "global_step": 150673, "epoch": 1245} {"train_loss": -37.582401275634766, "global_step": 150674, "epoch": 1245} {"train_loss": -37.87888717651367, "global_step": 150675, "epoch": 1245} {"train_loss": -37.92767333984375, "global_step": 150676, "epoch": 1245} {"train_loss": -37.34248352050781, "global_step": 150677, "epoch": 1245} {"train_loss": -36.698890686035156, "global_step": 150678, "epoch": 1245} {"train_loss": -37.65144729614258, "global_step": 150679, "epoch": 1245} {"train_loss": -37.5896110534668, "global_step": 150680, "epoch": 1245} {"train_loss": -37.69253158569336, "global_step": 150681, "epoch": 1245} {"train_loss": -37.56470489501953, "global_step": 150682, "epoch": 1245} {"train_loss": -37.7416877746582, "global_step": 150683, "epoch": 1245} {"train_loss": -36.99592208862305, "global_step": 150684, "epoch": 1245} {"train_loss": -35.84170150756836, "global_step": 150685, "epoch": 1245} {"train_loss": -37.81464767456055, "global_step": 150686, "epoch": 1245} {"train_loss": -38.238014221191406, "global_step": 150687, "epoch": 1245} {"train_loss": -37.2952995300293, "global_step": 150688, "epoch": 1245} {"train_loss": -38.827789306640625, "global_step": 150689, "epoch": 1245} {"train_loss": -37.74687576293945, "global_step": 150690, "epoch": 1245} {"train_loss": -38.74065017700195, "global_step": 150691, "epoch": 1245} {"train_loss": -38.69981002807617, "global_step": 150692, "epoch": 1245} {"train_loss": -38.645320892333984, "global_step": 150693, "epoch": 1245} {"train_loss": -38.46391677856445, "global_step": 150694, "epoch": 1245} {"train_loss": -38.00693893432617, "global_step": 150695, "epoch": 1245} {"train_loss": -38.705806732177734, "global_step": 150696, "epoch": 1245} {"train_loss": -38.66310501098633, "global_step": 150697, "epoch": 1245} {"train_loss": -38.30843734741211, "global_step": 150698, "epoch": 1245} {"train_loss": -38.8164176940918, "global_step": 150699, "epoch": 1245} {"train_loss": -39.35142135620117, "global_step": 150700, "epoch": 1245} {"train_loss": -38.917171478271484, "global_step": 150701, "epoch": 1245} {"train_loss": -38.947078704833984, "global_step": 150702, "epoch": 1245} {"train_loss": -39.01308059692383, "global_step": 150703, "epoch": 1245} {"train_loss": -38.25556564331055, "global_step": 150704, "epoch": 1245} {"train_loss": -37.527191162109375, "global_step": 150705, "epoch": 1245} {"train_loss": -38.292236328125, "global_step": 150706, "epoch": 1245} {"train_loss": -39.32963180541992, "global_step": 150707, "epoch": 1245} {"train_loss": -38.006954193115234, "global_step": 150708, "epoch": 1245} {"train_loss": -38.73945999145508, "global_step": 150709, "epoch": 1245} {"train_loss": -38.6056022644043, "global_step": 150710, "epoch": 1245} {"train_loss": -39.086605072021484, "global_step": 150711, "epoch": 1245} {"train_loss": -38.54087448120117, "global_step": 150712, "epoch": 1245} {"train_loss": -39.12519454956055, "global_step": 150713, "epoch": 1245} {"train_loss": -39.113548278808594, "global_step": 150714, "epoch": 1245} {"train_loss": -38.602474212646484, "global_step": 150715, "epoch": 1245} {"train_loss": -38.596656799316406, "global_step": 150716, "epoch": 1245} {"train_loss": -39.24777603149414, "global_step": 150717, "epoch": 1245} {"train_loss": -38.781829833984375, "global_step": 150718, "epoch": 1245} {"train_loss": -38.9736442565918, "global_step": 150719, "epoch": 1245} {"train_loss": -38.85099411010742, "global_step": 150720, "epoch": 1245} {"train_loss": -39.857791900634766, "global_step": 150721, "epoch": 1245} {"train_loss": -38.876888275146484, "global_step": 150722, "epoch": 1245} {"train_loss": -39.8764762878418, "global_step": 150723, "epoch": 1245} {"train_loss": -40.155677795410156, "global_step": 150724, "epoch": 1245} {"train_loss": -40.139217376708984, "global_step": 150725, "epoch": 1245} {"train_loss": -40.00934982299805, "global_step": 150726, "epoch": 1245} {"train_loss": -40.3053092956543, "global_step": 150727, "epoch": 1245} {"train_loss": -39.983760833740234, "global_step": 150728, "epoch": 1245} {"train_loss": -40.41616439819336, "global_step": 150729, "epoch": 1245} {"train_loss": -40.287384033203125, "global_step": 150730, "epoch": 1245} {"train_loss": -40.51543045043945, "global_step": 150731, "epoch": 1245} {"train_loss": -40.47496032714844, "global_step": 150732, "epoch": 1245} {"train_loss": -40.75733184814453, "global_step": 150733, "epoch": 1245} {"train_loss": -40.3475341796875, "global_step": 150734, "epoch": 1245} {"train_loss": -40.6728630065918, "global_step": 150735, "epoch": 1245} {"train_loss": -40.14252853393555, "global_step": 150736, "epoch": 1245} {"train_loss": -40.749202728271484, "global_step": 150737, "epoch": 1245} {"train_loss": -40.295318603515625, "global_step": 150738, "epoch": 1245} {"train_loss": -40.58454513549805, "global_step": 150739, "epoch": 1245} {"train_loss": -41.217708587646484, "global_step": 150740, "epoch": 1245} {"train_loss": -40.316505432128906, "global_step": 150741, "epoch": 1245} {"train_loss": -40.3352165222168, "global_step": 150742, "epoch": 1245} {"train_loss": -41.01514434814453, "global_step": 150743, "epoch": 1245} {"train_loss": -40.338008880615234, "global_step": 150744, "epoch": 1245} {"train_loss": -40.86880111694336, "global_step": 150745, "epoch": 1245} {"train_loss": -41.2634391784668, "global_step": 150746, "epoch": 1245} {"train_loss": -40.85758590698242, "global_step": 150747, "epoch": 1245} {"train_loss": -40.8228874206543, "global_step": 150748, "epoch": 1245} {"train_loss": -41.63786697387695, "global_step": 150749, "epoch": 1245} {"train_loss": -41.398555755615234, "global_step": 150750, "epoch": 1245} {"train_loss": -40.837799072265625, "global_step": 150751, "epoch": 1245} {"train_loss": -40.91526412963867, "global_step": 150752, "epoch": 1245} {"train_loss": -41.195045471191406, "global_step": 150753, "epoch": 1245} {"train_loss": -40.48164749145508, "global_step": 150754, "epoch": 1245} {"train_loss": -41.42246627807617, "global_step": 150755, "epoch": 1245} {"train_loss": -39.8715705871582, "global_step": 150756, "epoch": 1245} {"train_loss": -40.61562728881836, "global_step": 150757, "epoch": 1245} {"train_loss": -40.98531723022461, "global_step": 150758, "epoch": 1245} {"train_loss": -40.341285705566406, "global_step": 150759, "epoch": 1245} {"train_loss": -41.16561508178711, "global_step": 150760, "epoch": 1245} {"train_loss": -40.16578674316406, "global_step": 150761, "epoch": 1245} {"train_loss": -40.31046676635742, "global_step": 150762, "epoch": 1245} {"train_loss": -40.696205139160156, "global_step": 150763, "epoch": 1245} {"train_loss": -40.27640914916992, "global_step": 150764, "epoch": 1245} {"train_loss": -38.664399895786254, "global_step": 150765, "epoch": 1245, "val_loss": 2622680.75} {"train_loss": -40.875885009765625, "global_step": 150766, "epoch": 1246} {"train_loss": -40.50544357299805, "global_step": 150767, "epoch": 1246} {"train_loss": -40.55729293823242, "global_step": 150768, "epoch": 1246} {"train_loss": -40.82392120361328, "global_step": 150769, "epoch": 1246} {"train_loss": -40.105140686035156, "global_step": 150770, "epoch": 1246} {"train_loss": -40.84595489501953, "global_step": 150771, "epoch": 1246} {"train_loss": -41.48844528198242, "global_step": 150772, "epoch": 1246} {"train_loss": -41.177913665771484, "global_step": 150773, "epoch": 1246} {"train_loss": -39.925655364990234, "global_step": 150774, "epoch": 1246} {"train_loss": -39.53965377807617, "global_step": 150775, "epoch": 1246} {"train_loss": -41.55988311767578, "global_step": 150776, "epoch": 1246} {"train_loss": -40.54487228393555, "global_step": 150777, "epoch": 1246} {"train_loss": -39.56155014038086, "global_step": 150778, "epoch": 1246} {"train_loss": -41.237552642822266, "global_step": 150779, "epoch": 1246} {"train_loss": -39.88271713256836, "global_step": 150780, "epoch": 1246} {"train_loss": -40.34354782104492, "global_step": 150781, "epoch": 1246} {"train_loss": -39.64032745361328, "global_step": 150782, "epoch": 1246} {"train_loss": -40.605186462402344, "global_step": 150783, "epoch": 1246} {"train_loss": -40.49165725708008, "global_step": 150784, "epoch": 1246} {"train_loss": -40.209041595458984, "global_step": 150785, "epoch": 1246} {"train_loss": -39.545711517333984, "global_step": 150786, "epoch": 1246} {"train_loss": -37.240596771240234, "global_step": 150787, "epoch": 1246} {"train_loss": -40.96315383911133, "global_step": 150788, "epoch": 1246} {"train_loss": -37.783447265625, "global_step": 150789, "epoch": 1246} {"train_loss": -38.305641174316406, "global_step": 150790, "epoch": 1246} {"train_loss": -25.402816772460938, "global_step": 150791, "epoch": 1246} {"train_loss": -24.19879722595215, "global_step": 150792, "epoch": 1246} {"train_loss": -26.09303092956543, "global_step": 150793, "epoch": 1246} {"train_loss": -30.14737892150879, "global_step": 150794, "epoch": 1246} {"train_loss": -34.72182846069336, "global_step": 150795, "epoch": 1246} {"train_loss": -33.82489776611328, "global_step": 150796, "epoch": 1246} {"train_loss": -33.41244125366211, "global_step": 150797, "epoch": 1246} {"train_loss": -34.932106018066406, "global_step": 150798, "epoch": 1246} {"train_loss": -35.83053970336914, "global_step": 150799, "epoch": 1246} {"train_loss": -37.18992233276367, "global_step": 150800, "epoch": 1246} {"train_loss": -36.78231430053711, "global_step": 150801, "epoch": 1246} {"train_loss": -37.80260467529297, "global_step": 150802, "epoch": 1246} {"train_loss": -37.15476608276367, "global_step": 150803, "epoch": 1246} {"train_loss": -37.497169494628906, "global_step": 150804, "epoch": 1246} {"train_loss": -37.18809509277344, "global_step": 150805, "epoch": 1246} {"train_loss": -38.24848556518555, "global_step": 150806, "epoch": 1246} {"train_loss": -38.3023681640625, "global_step": 150807, "epoch": 1246} {"train_loss": -38.274417877197266, "global_step": 150808, "epoch": 1246} {"train_loss": -39.292579650878906, "global_step": 150809, "epoch": 1246} {"train_loss": -37.70334243774414, "global_step": 150810, "epoch": 1246} {"train_loss": -39.5579833984375, "global_step": 150811, "epoch": 1246} {"train_loss": -38.695220947265625, "global_step": 150812, "epoch": 1246} {"train_loss": -39.71276092529297, "global_step": 150813, "epoch": 1246} {"train_loss": -38.84049606323242, "global_step": 150814, "epoch": 1246} {"train_loss": -39.800323486328125, "global_step": 150815, "epoch": 1246} {"train_loss": -39.548988342285156, "global_step": 150816, "epoch": 1246} {"train_loss": -39.99580764770508, "global_step": 150817, "epoch": 1246} {"train_loss": -39.732872009277344, "global_step": 150818, "epoch": 1246} {"train_loss": -40.01424026489258, "global_step": 150819, "epoch": 1246} {"train_loss": -39.6953239440918, "global_step": 150820, "epoch": 1246} {"train_loss": -38.86782455444336, "global_step": 150821, "epoch": 1246} {"train_loss": -39.741668701171875, "global_step": 150822, "epoch": 1246} {"train_loss": -39.744529724121094, "global_step": 150823, "epoch": 1246} {"train_loss": -39.93885803222656, "global_step": 150824, "epoch": 1246} {"train_loss": -39.7669792175293, "global_step": 150825, "epoch": 1246} {"train_loss": -39.98043441772461, "global_step": 150826, "epoch": 1246} {"train_loss": -38.82880783081055, "global_step": 150827, "epoch": 1246} {"train_loss": -40.36503219604492, "global_step": 150828, "epoch": 1246} {"train_loss": -40.37975311279297, "global_step": 150829, "epoch": 1246} {"train_loss": -40.43935775756836, "global_step": 150830, "epoch": 1246} {"train_loss": -40.2312126159668, "global_step": 150831, "epoch": 1246} {"train_loss": -40.50068283081055, "global_step": 150832, "epoch": 1246} {"train_loss": -40.68366622924805, "global_step": 150833, "epoch": 1246} {"train_loss": -40.45526123046875, "global_step": 150834, "epoch": 1246} {"train_loss": -39.19672775268555, "global_step": 150835, "epoch": 1246} {"train_loss": -40.3322868347168, "global_step": 150836, "epoch": 1246} {"train_loss": -39.429290771484375, "global_step": 150837, "epoch": 1246} {"train_loss": -38.79031753540039, "global_step": 150838, "epoch": 1246} {"train_loss": -40.593692779541016, "global_step": 150839, "epoch": 1246} {"train_loss": -40.636837005615234, "global_step": 150840, "epoch": 1246} {"train_loss": -40.58201217651367, "global_step": 150841, "epoch": 1246} {"train_loss": -39.969749450683594, "global_step": 150842, "epoch": 1246} {"train_loss": -40.64704132080078, "global_step": 150843, "epoch": 1246} {"train_loss": -39.896278381347656, "global_step": 150844, "epoch": 1246} {"train_loss": -39.71583557128906, "global_step": 150845, "epoch": 1246} {"train_loss": -40.65615463256836, "global_step": 150846, "epoch": 1246} {"train_loss": -40.614627838134766, "global_step": 150847, "epoch": 1246} {"train_loss": -37.944549560546875, "global_step": 150848, "epoch": 1246} {"train_loss": -39.62772750854492, "global_step": 150849, "epoch": 1246} {"train_loss": -40.57075119018555, "global_step": 150850, "epoch": 1246} {"train_loss": -40.420257568359375, "global_step": 150851, "epoch": 1246} {"train_loss": -38.47339630126953, "global_step": 150852, "epoch": 1246} {"train_loss": -40.78544235229492, "global_step": 150853, "epoch": 1246} {"train_loss": -40.490108489990234, "global_step": 150854, "epoch": 1246} {"train_loss": -41.10490417480469, "global_step": 150855, "epoch": 1246} {"train_loss": -40.590309143066406, "global_step": 150856, "epoch": 1246} {"train_loss": -40.43070602416992, "global_step": 150857, "epoch": 1246} {"train_loss": -40.93642044067383, "global_step": 150858, "epoch": 1246} {"train_loss": -41.021888732910156, "global_step": 150859, "epoch": 1246} {"train_loss": -41.09196472167969, "global_step": 150860, "epoch": 1246} {"train_loss": -37.40372848510742, "global_step": 150861, "epoch": 1246} {"train_loss": -40.744667053222656, "global_step": 150862, "epoch": 1246} {"train_loss": -40.742671966552734, "global_step": 150863, "epoch": 1246} {"train_loss": -40.4937858581543, "global_step": 150864, "epoch": 1246} {"train_loss": -40.838600158691406, "global_step": 150865, "epoch": 1246} {"train_loss": -40.83850860595703, "global_step": 150866, "epoch": 1246} {"train_loss": -41.14946365356445, "global_step": 150867, "epoch": 1246} {"train_loss": -39.33233642578125, "global_step": 150868, "epoch": 1246} {"train_loss": -40.79658126831055, "global_step": 150869, "epoch": 1246} {"train_loss": -41.437469482421875, "global_step": 150870, "epoch": 1246} {"train_loss": -40.656490325927734, "global_step": 150871, "epoch": 1246} {"train_loss": -41.45259094238281, "global_step": 150872, "epoch": 1246} {"train_loss": -40.682613372802734, "global_step": 150873, "epoch": 1246} {"train_loss": -40.07720947265625, "global_step": 150874, "epoch": 1246} {"train_loss": -39.20768356323242, "global_step": 150875, "epoch": 1246} {"train_loss": -40.18355178833008, "global_step": 150876, "epoch": 1246} {"train_loss": -39.177886962890625, "global_step": 150877, "epoch": 1246} {"train_loss": -41.23064422607422, "global_step": 150878, "epoch": 1246} {"train_loss": -39.73869705200195, "global_step": 150879, "epoch": 1246} {"train_loss": -38.7070198059082, "global_step": 150880, "epoch": 1246} {"train_loss": -39.75602340698242, "global_step": 150881, "epoch": 1246} {"train_loss": -36.76656723022461, "global_step": 150882, "epoch": 1246} {"train_loss": -40.30495071411133, "global_step": 150883, "epoch": 1246} {"train_loss": -35.8350944519043, "global_step": 150884, "epoch": 1246} {"train_loss": -40.15516662597656, "global_step": 150885, "epoch": 1246} {"train_loss": -39.119113433459574, "global_step": 150886, "epoch": 1246, "val_loss": 4005539.75} {"train_loss": -36.20296859741211, "global_step": 150887, "epoch": 1247} {"train_loss": -27.99360466003418, "global_step": 150888, "epoch": 1247} {"train_loss": -37.35747146606445, "global_step": 150889, "epoch": 1247} {"train_loss": -37.05531311035156, "global_step": 150890, "epoch": 1247} {"train_loss": -34.00553512573242, "global_step": 150891, "epoch": 1247} {"train_loss": -33.330116271972656, "global_step": 150892, "epoch": 1247} {"train_loss": -31.215696334838867, "global_step": 150893, "epoch": 1247} {"train_loss": -34.75812911987305, "global_step": 150894, "epoch": 1247} {"train_loss": -34.375953674316406, "global_step": 150895, "epoch": 1247} {"train_loss": -33.473506927490234, "global_step": 150896, "epoch": 1247} {"train_loss": -27.097126007080078, "global_step": 150897, "epoch": 1247} {"train_loss": -32.364906311035156, "global_step": 150898, "epoch": 1247} {"train_loss": -32.573822021484375, "global_step": 150899, "epoch": 1247} {"train_loss": -35.58413314819336, "global_step": 150900, "epoch": 1247} {"train_loss": -37.375728607177734, "global_step": 150901, "epoch": 1247} {"train_loss": -31.296125411987305, "global_step": 150902, "epoch": 1247} {"train_loss": -36.016700744628906, "global_step": 150903, "epoch": 1247} {"train_loss": -30.775543212890625, "global_step": 150904, "epoch": 1247} {"train_loss": -28.128698348999023, "global_step": 150905, "epoch": 1247} {"train_loss": -34.78581619262695, "global_step": 150906, "epoch": 1247} {"train_loss": -29.325632095336914, "global_step": 150907, "epoch": 1247} {"train_loss": -31.322546005249023, "global_step": 150908, "epoch": 1247} {"train_loss": -32.533363342285156, "global_step": 150909, "epoch": 1247} {"train_loss": -34.517494201660156, "global_step": 150910, "epoch": 1247} {"train_loss": -34.91878890991211, "global_step": 150911, "epoch": 1247} {"train_loss": -36.21932601928711, "global_step": 150912, "epoch": 1247} {"train_loss": -33.29114532470703, "global_step": 150913, "epoch": 1247} {"train_loss": -36.91046905517578, "global_step": 150914, "epoch": 1247} {"train_loss": -35.95905685424805, "global_step": 150915, "epoch": 1247} {"train_loss": -36.6685905456543, "global_step": 150916, "epoch": 1247} {"train_loss": -36.9043083190918, "global_step": 150917, "epoch": 1247} {"train_loss": -36.709197998046875, "global_step": 150918, "epoch": 1247} {"train_loss": -36.89082336425781, "global_step": 150919, "epoch": 1247} {"train_loss": -36.58674240112305, "global_step": 150920, "epoch": 1247} {"train_loss": -37.02884292602539, "global_step": 150921, "epoch": 1247} {"train_loss": -38.36396026611328, "global_step": 150922, "epoch": 1247} {"train_loss": -37.27928161621094, "global_step": 150923, "epoch": 1247} {"train_loss": -36.78569412231445, "global_step": 150924, "epoch": 1247} {"train_loss": -38.262786865234375, "global_step": 150925, "epoch": 1247} {"train_loss": -37.64933776855469, "global_step": 150926, "epoch": 1247} {"train_loss": -38.713138580322266, "global_step": 150927, "epoch": 1247} {"train_loss": -38.13545227050781, "global_step": 150928, "epoch": 1247} {"train_loss": -38.96171188354492, "global_step": 150929, "epoch": 1247} {"train_loss": -38.316280364990234, "global_step": 150930, "epoch": 1247} {"train_loss": -38.77067184448242, "global_step": 150931, "epoch": 1247} {"train_loss": -37.50916290283203, "global_step": 150932, "epoch": 1247} {"train_loss": -38.97299575805664, "global_step": 150933, "epoch": 1247} {"train_loss": -38.62684631347656, "global_step": 150934, "epoch": 1247} {"train_loss": -38.19348907470703, "global_step": 150935, "epoch": 1247} {"train_loss": -38.8872184753418, "global_step": 150936, "epoch": 1247} {"train_loss": -38.57424545288086, "global_step": 150937, "epoch": 1247} {"train_loss": -38.73056411743164, "global_step": 150938, "epoch": 1247} {"train_loss": -38.251869201660156, "global_step": 150939, "epoch": 1247} {"train_loss": -39.062931060791016, "global_step": 150940, "epoch": 1247} {"train_loss": -39.30101013183594, "global_step": 150941, "epoch": 1247} {"train_loss": -38.88039779663086, "global_step": 150942, "epoch": 1247} {"train_loss": -38.85165023803711, "global_step": 150943, "epoch": 1247} {"train_loss": -38.90108108520508, "global_step": 150944, "epoch": 1247} {"train_loss": -39.55792999267578, "global_step": 150945, "epoch": 1247} {"train_loss": -38.76088333129883, "global_step": 150946, "epoch": 1247} {"train_loss": -39.2730598449707, "global_step": 150947, "epoch": 1247} {"train_loss": -38.91250228881836, "global_step": 150948, "epoch": 1247} {"train_loss": -39.84722900390625, "global_step": 150949, "epoch": 1247} {"train_loss": -39.54269027709961, "global_step": 150950, "epoch": 1247} {"train_loss": -39.45718002319336, "global_step": 150951, "epoch": 1247} {"train_loss": -39.67258834838867, "global_step": 150952, "epoch": 1247} {"train_loss": -39.72251510620117, "global_step": 150953, "epoch": 1247} {"train_loss": -39.68734359741211, "global_step": 150954, "epoch": 1247} {"train_loss": -39.764461517333984, "global_step": 150955, "epoch": 1247} {"train_loss": -39.67130661010742, "global_step": 150956, "epoch": 1247} {"train_loss": -39.972774505615234, "global_step": 150957, "epoch": 1247} {"train_loss": -39.98484420776367, "global_step": 150958, "epoch": 1247} {"train_loss": -39.92184066772461, "global_step": 150959, "epoch": 1247} {"train_loss": -39.89973831176758, "global_step": 150960, "epoch": 1247} {"train_loss": -39.40631866455078, "global_step": 150961, "epoch": 1247} {"train_loss": -40.26694869995117, "global_step": 150962, "epoch": 1247} {"train_loss": -40.0646858215332, "global_step": 150963, "epoch": 1247} {"train_loss": -40.08061599731445, "global_step": 150964, "epoch": 1247} {"train_loss": -40.03965377807617, "global_step": 150965, "epoch": 1247} {"train_loss": -40.00562286376953, "global_step": 150966, "epoch": 1247} {"train_loss": -40.19214630126953, "global_step": 150967, "epoch": 1247} {"train_loss": -40.14826965332031, "global_step": 150968, "epoch": 1247} {"train_loss": -40.61712646484375, "global_step": 150969, "epoch": 1247} {"train_loss": -40.23259353637695, "global_step": 150970, "epoch": 1247} {"train_loss": -40.46834945678711, "global_step": 150971, "epoch": 1247} {"train_loss": -40.87262725830078, "global_step": 150972, "epoch": 1247} {"train_loss": -40.280941009521484, "global_step": 150973, "epoch": 1247} {"train_loss": -40.653236389160156, "global_step": 150974, "epoch": 1247} {"train_loss": -40.19991683959961, "global_step": 150975, "epoch": 1247} {"train_loss": -40.98263931274414, "global_step": 150976, "epoch": 1247} {"train_loss": -40.38042449951172, "global_step": 150977, "epoch": 1247} {"train_loss": -40.4456901550293, "global_step": 150978, "epoch": 1247} {"train_loss": -40.808956146240234, "global_step": 150979, "epoch": 1247} {"train_loss": -40.50634002685547, "global_step": 150980, "epoch": 1247} {"train_loss": -41.19224548339844, "global_step": 150981, "epoch": 1247} {"train_loss": -40.5150032043457, "global_step": 150982, "epoch": 1247} {"train_loss": -40.85813522338867, "global_step": 150983, "epoch": 1247} {"train_loss": -40.840816497802734, "global_step": 150984, "epoch": 1247} {"train_loss": -41.01884078979492, "global_step": 150985, "epoch": 1247} {"train_loss": -40.724365234375, "global_step": 150986, "epoch": 1247} {"train_loss": -41.02840042114258, "global_step": 150987, "epoch": 1247} {"train_loss": -41.038265228271484, "global_step": 150988, "epoch": 1247} {"train_loss": -41.540130615234375, "global_step": 150989, "epoch": 1247} {"train_loss": -41.03322219848633, "global_step": 150990, "epoch": 1247} {"train_loss": -41.13430404663086, "global_step": 150991, "epoch": 1247} {"train_loss": -41.092506408691406, "global_step": 150992, "epoch": 1247} {"train_loss": -41.07242965698242, "global_step": 150993, "epoch": 1247} {"train_loss": -41.082862854003906, "global_step": 150994, "epoch": 1247} {"train_loss": -41.143070220947266, "global_step": 150995, "epoch": 1247} {"train_loss": -40.873008728027344, "global_step": 150996, "epoch": 1247} {"train_loss": -41.1546745300293, "global_step": 150997, "epoch": 1247} {"train_loss": -41.227962493896484, "global_step": 150998, "epoch": 1247} {"train_loss": -40.70943832397461, "global_step": 150999, "epoch": 1247} {"train_loss": -40.75849914550781, "global_step": 151000, "epoch": 1247} {"train_loss": -40.18876266479492, "global_step": 151001, "epoch": 1247} {"train_loss": -36.2718620300293, "global_step": 151002, "epoch": 1247} {"train_loss": -41.59077072143555, "global_step": 151003, "epoch": 1247} {"train_loss": -36.37944793701172, "global_step": 151004, "epoch": 1247} {"train_loss": -39.326271057128906, "global_step": 151005, "epoch": 1247} {"train_loss": -35.0394172668457, "global_step": 151006, "epoch": 1247} {"train_loss": -38.01391024628946, "global_step": 151007, "epoch": 1247, "val_loss": 2727148.5} {"train_loss": -35.14036178588867, "global_step": 151008, "epoch": 1248} {"train_loss": -35.43682861328125, "global_step": 151009, "epoch": 1248} {"train_loss": -35.51704788208008, "global_step": 151010, "epoch": 1248} {"train_loss": -35.14611053466797, "global_step": 151011, "epoch": 1248} {"train_loss": -35.465084075927734, "global_step": 151012, "epoch": 1248} {"train_loss": -35.260501861572266, "global_step": 151013, "epoch": 1248} {"train_loss": -35.734230041503906, "global_step": 151014, "epoch": 1248} {"train_loss": -35.46352005004883, "global_step": 151015, "epoch": 1248} {"train_loss": -36.097808837890625, "global_step": 151016, "epoch": 1248} {"train_loss": -35.63315963745117, "global_step": 151017, "epoch": 1248} {"train_loss": -36.104522705078125, "global_step": 151018, "epoch": 1248} {"train_loss": -36.1179084777832, "global_step": 151019, "epoch": 1248} {"train_loss": -34.70801544189453, "global_step": 151020, "epoch": 1248} {"train_loss": -36.4875373840332, "global_step": 151021, "epoch": 1248} {"train_loss": -36.21148681640625, "global_step": 151022, "epoch": 1248} {"train_loss": -35.417808532714844, "global_step": 151023, "epoch": 1248} {"train_loss": -35.342193603515625, "global_step": 151024, "epoch": 1248} {"train_loss": -36.1965446472168, "global_step": 151025, "epoch": 1248} {"train_loss": -35.81324005126953, "global_step": 151026, "epoch": 1248} {"train_loss": -36.06719207763672, "global_step": 151027, "epoch": 1248} {"train_loss": -35.390846252441406, "global_step": 151028, "epoch": 1248} {"train_loss": -34.440425872802734, "global_step": 151029, "epoch": 1248} {"train_loss": -29.229724884033203, "global_step": 151030, "epoch": 1248} {"train_loss": -28.56125259399414, "global_step": 151031, "epoch": 1248} {"train_loss": -35.730316162109375, "global_step": 151032, "epoch": 1248} {"train_loss": -31.1541748046875, "global_step": 151033, "epoch": 1248} {"train_loss": -36.134857177734375, "global_step": 151034, "epoch": 1248} {"train_loss": -31.89849281311035, "global_step": 151035, "epoch": 1248} {"train_loss": -35.622127532958984, "global_step": 151036, "epoch": 1248} {"train_loss": -33.1859016418457, "global_step": 151037, "epoch": 1248} {"train_loss": -36.61613082885742, "global_step": 151038, "epoch": 1248} {"train_loss": -33.31791687011719, "global_step": 151039, "epoch": 1248} {"train_loss": -36.359336853027344, "global_step": 151040, "epoch": 1248} {"train_loss": -33.98995590209961, "global_step": 151041, "epoch": 1248} {"train_loss": -35.619903564453125, "global_step": 151042, "epoch": 1248} {"train_loss": -35.20547866821289, "global_step": 151043, "epoch": 1248} {"train_loss": -34.97246170043945, "global_step": 151044, "epoch": 1248} {"train_loss": -36.977569580078125, "global_step": 151045, "epoch": 1248} {"train_loss": -35.83778762817383, "global_step": 151046, "epoch": 1248} {"train_loss": -35.23334884643555, "global_step": 151047, "epoch": 1248} {"train_loss": -35.93349838256836, "global_step": 151048, "epoch": 1248} {"train_loss": -35.9925422668457, "global_step": 151049, "epoch": 1248} {"train_loss": -35.902034759521484, "global_step": 151050, "epoch": 1248} {"train_loss": -36.433143615722656, "global_step": 151051, "epoch": 1248} {"train_loss": -36.569271087646484, "global_step": 151052, "epoch": 1248} {"train_loss": -36.40262222290039, "global_step": 151053, "epoch": 1248} {"train_loss": -36.50482940673828, "global_step": 151054, "epoch": 1248} {"train_loss": -36.67500686645508, "global_step": 151055, "epoch": 1248} {"train_loss": -36.79386520385742, "global_step": 151056, "epoch": 1248} {"train_loss": -37.284969329833984, "global_step": 151057, "epoch": 1248} {"train_loss": -36.51081848144531, "global_step": 151058, "epoch": 1248} {"train_loss": -36.65031051635742, "global_step": 151059, "epoch": 1248} {"train_loss": -37.360164642333984, "global_step": 151060, "epoch": 1248} {"train_loss": -37.429107666015625, "global_step": 151061, "epoch": 1248} {"train_loss": -37.28319549560547, "global_step": 151062, "epoch": 1248} {"train_loss": -37.746761322021484, "global_step": 151063, "epoch": 1248} {"train_loss": -37.6956672668457, "global_step": 151064, "epoch": 1248} {"train_loss": -37.89817428588867, "global_step": 151065, "epoch": 1248} {"train_loss": -37.79819107055664, "global_step": 151066, "epoch": 1248} {"train_loss": -37.99471664428711, "global_step": 151067, "epoch": 1248} {"train_loss": -37.80870056152344, "global_step": 151068, "epoch": 1248} {"train_loss": -38.062984466552734, "global_step": 151069, "epoch": 1248} {"train_loss": -38.18000411987305, "global_step": 151070, "epoch": 1248} {"train_loss": -37.58108139038086, "global_step": 151071, "epoch": 1248} {"train_loss": -37.73360061645508, "global_step": 151072, "epoch": 1248} {"train_loss": -38.129146575927734, "global_step": 151073, "epoch": 1248} {"train_loss": -37.88037109375, "global_step": 151074, "epoch": 1248} {"train_loss": -38.364253997802734, "global_step": 151075, "epoch": 1248} {"train_loss": -37.94074249267578, "global_step": 151076, "epoch": 1248} {"train_loss": -38.30985641479492, "global_step": 151077, "epoch": 1248} {"train_loss": -37.76871109008789, "global_step": 151078, "epoch": 1248} {"train_loss": -38.790557861328125, "global_step": 151079, "epoch": 1248} {"train_loss": -38.45896530151367, "global_step": 151080, "epoch": 1248} {"train_loss": -38.15884017944336, "global_step": 151081, "epoch": 1248} {"train_loss": -38.76145553588867, "global_step": 151082, "epoch": 1248} {"train_loss": -38.275657653808594, "global_step": 151083, "epoch": 1248} {"train_loss": -37.91187286376953, "global_step": 151084, "epoch": 1248} {"train_loss": -38.461082458496094, "global_step": 151085, "epoch": 1248} {"train_loss": -38.86907958984375, "global_step": 151086, "epoch": 1248} {"train_loss": -38.99940872192383, "global_step": 151087, "epoch": 1248} {"train_loss": -38.526100158691406, "global_step": 151088, "epoch": 1248} {"train_loss": -38.26081466674805, "global_step": 151089, "epoch": 1248} {"train_loss": -38.8131217956543, "global_step": 151090, "epoch": 1248} {"train_loss": -38.5175666809082, "global_step": 151091, "epoch": 1248} {"train_loss": -38.501197814941406, "global_step": 151092, "epoch": 1248} {"train_loss": -39.082637786865234, "global_step": 151093, "epoch": 1248} {"train_loss": -38.8243408203125, "global_step": 151094, "epoch": 1248} {"train_loss": -38.44649887084961, "global_step": 151095, "epoch": 1248} {"train_loss": -38.45082473754883, "global_step": 151096, "epoch": 1248} {"train_loss": -38.886287689208984, "global_step": 151097, "epoch": 1248} {"train_loss": -38.865875244140625, "global_step": 151098, "epoch": 1248} {"train_loss": -39.328853607177734, "global_step": 151099, "epoch": 1248} {"train_loss": -39.37076187133789, "global_step": 151100, "epoch": 1248} {"train_loss": -38.993343353271484, "global_step": 151101, "epoch": 1248} {"train_loss": -39.57485580444336, "global_step": 151102, "epoch": 1248} {"train_loss": -39.08307647705078, "global_step": 151103, "epoch": 1248} {"train_loss": -39.10695266723633, "global_step": 151104, "epoch": 1248} {"train_loss": -38.931495666503906, "global_step": 151105, "epoch": 1248} {"train_loss": -39.536705017089844, "global_step": 151106, "epoch": 1248} {"train_loss": -38.33246994018555, "global_step": 151107, "epoch": 1248} {"train_loss": -39.89571762084961, "global_step": 151108, "epoch": 1248} {"train_loss": -39.71855545043945, "global_step": 151109, "epoch": 1248} {"train_loss": -38.60786056518555, "global_step": 151110, "epoch": 1248} {"train_loss": -39.589263916015625, "global_step": 151111, "epoch": 1248} {"train_loss": -39.43117141723633, "global_step": 151112, "epoch": 1248} {"train_loss": -39.32232666015625, "global_step": 151113, "epoch": 1248} {"train_loss": -38.438480377197266, "global_step": 151114, "epoch": 1248} {"train_loss": -38.95976638793945, "global_step": 151115, "epoch": 1248} {"train_loss": -39.136253356933594, "global_step": 151116, "epoch": 1248} {"train_loss": -39.44607925415039, "global_step": 151117, "epoch": 1248} {"train_loss": -39.287044525146484, "global_step": 151118, "epoch": 1248} {"train_loss": -39.527137756347656, "global_step": 151119, "epoch": 1248} {"train_loss": -38.27151107788086, "global_step": 151120, "epoch": 1248} {"train_loss": -39.50767135620117, "global_step": 151121, "epoch": 1248} {"train_loss": -39.43541717529297, "global_step": 151122, "epoch": 1248} {"train_loss": -39.12856674194336, "global_step": 151123, "epoch": 1248} {"train_loss": -39.50991439819336, "global_step": 151124, "epoch": 1248} {"train_loss": -38.56229782104492, "global_step": 151125, "epoch": 1248} {"train_loss": -38.709739685058594, "global_step": 151126, "epoch": 1248} {"train_loss": -39.6680908203125, "global_step": 151127, "epoch": 1248} {"train_loss": -37.21725859523805, "global_step": 151128, "epoch": 1248, "val_loss": 2628016.25} {"train_loss": -38.9549446105957, "global_step": 151129, "epoch": 1249} {"train_loss": -38.399085998535156, "global_step": 151130, "epoch": 1249} {"train_loss": -39.08219528198242, "global_step": 151131, "epoch": 1249} {"train_loss": -39.66732406616211, "global_step": 151132, "epoch": 1249} {"train_loss": -38.56428909301758, "global_step": 151133, "epoch": 1249} {"train_loss": -39.8429069519043, "global_step": 151134, "epoch": 1249} {"train_loss": -39.49799346923828, "global_step": 151135, "epoch": 1249} {"train_loss": -39.12623977661133, "global_step": 151136, "epoch": 1249} {"train_loss": -39.64226150512695, "global_step": 151137, "epoch": 1249} {"train_loss": -39.978431701660156, "global_step": 151138, "epoch": 1249} {"train_loss": -39.7122917175293, "global_step": 151139, "epoch": 1249} {"train_loss": -39.78137969970703, "global_step": 151140, "epoch": 1249} {"train_loss": -39.43195343017578, "global_step": 151141, "epoch": 1249} {"train_loss": -38.18290328979492, "global_step": 151142, "epoch": 1249} {"train_loss": -39.85880661010742, "global_step": 151143, "epoch": 1249} {"train_loss": -39.1922492980957, "global_step": 151144, "epoch": 1249} {"train_loss": -39.447265625, "global_step": 151145, "epoch": 1249} {"train_loss": -40.12406539916992, "global_step": 151146, "epoch": 1249} {"train_loss": -39.738338470458984, "global_step": 151147, "epoch": 1249} {"train_loss": -39.18119430541992, "global_step": 151148, "epoch": 1249} {"train_loss": -39.36806106567383, "global_step": 151149, "epoch": 1249} {"train_loss": -39.092323303222656, "global_step": 151150, "epoch": 1249} {"train_loss": -39.57345199584961, "global_step": 151151, "epoch": 1249} {"train_loss": -38.99937057495117, "global_step": 151152, "epoch": 1249} {"train_loss": -38.775447845458984, "global_step": 151153, "epoch": 1249} {"train_loss": -39.30502700805664, "global_step": 151154, "epoch": 1249} {"train_loss": -38.41911697387695, "global_step": 151155, "epoch": 1249} {"train_loss": -38.72550582885742, "global_step": 151156, "epoch": 1249} {"train_loss": -38.317588806152344, "global_step": 151157, "epoch": 1249} {"train_loss": -37.48064422607422, "global_step": 151158, "epoch": 1249} {"train_loss": -38.09939193725586, "global_step": 151159, "epoch": 1249} {"train_loss": -38.87370681762695, "global_step": 151160, "epoch": 1249} {"train_loss": -36.716064453125, "global_step": 151161, "epoch": 1249} {"train_loss": -37.98652267456055, "global_step": 151162, "epoch": 1249} {"train_loss": -39.060394287109375, "global_step": 151163, "epoch": 1249} {"train_loss": -35.88157272338867, "global_step": 151164, "epoch": 1249} {"train_loss": -36.764862060546875, "global_step": 151165, "epoch": 1249} {"train_loss": -37.78456115722656, "global_step": 151166, "epoch": 1249} {"train_loss": -38.940338134765625, "global_step": 151167, "epoch": 1249} {"train_loss": -38.57786178588867, "global_step": 151168, "epoch": 1249} {"train_loss": -37.452301025390625, "global_step": 151169, "epoch": 1249} {"train_loss": -38.14932632446289, "global_step": 151170, "epoch": 1249} {"train_loss": -39.162532806396484, "global_step": 151171, "epoch": 1249} {"train_loss": -36.95444107055664, "global_step": 151172, "epoch": 1249} {"train_loss": -35.91632080078125, "global_step": 151173, "epoch": 1249} {"train_loss": -39.18315124511719, "global_step": 151174, "epoch": 1249} {"train_loss": -39.02994918823242, "global_step": 151175, "epoch": 1249} {"train_loss": -38.04850387573242, "global_step": 151176, "epoch": 1249} {"train_loss": -38.02985763549805, "global_step": 151177, "epoch": 1249} {"train_loss": -38.492164611816406, "global_step": 151178, "epoch": 1249} {"train_loss": -38.5621337890625, "global_step": 151179, "epoch": 1249} {"train_loss": -37.61269760131836, "global_step": 151180, "epoch": 1249} {"train_loss": -36.757938385009766, "global_step": 151181, "epoch": 1249} {"train_loss": -38.93379211425781, "global_step": 151182, "epoch": 1249} {"train_loss": -39.089656829833984, "global_step": 151183, "epoch": 1249} {"train_loss": -38.173057556152344, "global_step": 151184, "epoch": 1249} {"train_loss": -38.04943084716797, "global_step": 151185, "epoch": 1249} {"train_loss": -39.147151947021484, "global_step": 151186, "epoch": 1249} {"train_loss": -39.000396728515625, "global_step": 151187, "epoch": 1249} {"train_loss": -37.92577362060547, "global_step": 151188, "epoch": 1249} {"train_loss": -38.47005844116211, "global_step": 151189, "epoch": 1249} {"train_loss": -38.2121696472168, "global_step": 151190, "epoch": 1249} {"train_loss": -38.57576370239258, "global_step": 151191, "epoch": 1249} {"train_loss": -39.13134765625, "global_step": 151192, "epoch": 1249} {"train_loss": -38.9463996887207, "global_step": 151193, "epoch": 1249} {"train_loss": -39.54586410522461, "global_step": 151194, "epoch": 1249} {"train_loss": -37.71284103393555, "global_step": 151195, "epoch": 1249} {"train_loss": -38.867610931396484, "global_step": 151196, "epoch": 1249} {"train_loss": -38.683128356933594, "global_step": 151197, "epoch": 1249} {"train_loss": -39.13496780395508, "global_step": 151198, "epoch": 1249} {"train_loss": -38.83362579345703, "global_step": 151199, "epoch": 1249} {"train_loss": -39.27276611328125, "global_step": 151200, "epoch": 1249} {"train_loss": -38.196998596191406, "global_step": 151201, "epoch": 1249} {"train_loss": -38.94477462768555, "global_step": 151202, "epoch": 1249} {"train_loss": -39.15739059448242, "global_step": 151203, "epoch": 1249} {"train_loss": -39.07786560058594, "global_step": 151204, "epoch": 1249} {"train_loss": -39.19537353515625, "global_step": 151205, "epoch": 1249} {"train_loss": -38.72996520996094, "global_step": 151206, "epoch": 1249} {"train_loss": -38.33073043823242, "global_step": 151207, "epoch": 1249} {"train_loss": -38.89039993286133, "global_step": 151208, "epoch": 1249} {"train_loss": -38.65601348876953, "global_step": 151209, "epoch": 1249} {"train_loss": -38.752994537353516, "global_step": 151210, "epoch": 1249} {"train_loss": -39.56516647338867, "global_step": 151211, "epoch": 1249} {"train_loss": -38.60696029663086, "global_step": 151212, "epoch": 1249} {"train_loss": -38.497493743896484, "global_step": 151213, "epoch": 1249} {"train_loss": -39.38227844238281, "global_step": 151214, "epoch": 1249} {"train_loss": -38.38948440551758, "global_step": 151215, "epoch": 1249} {"train_loss": -38.37405014038086, "global_step": 151216, "epoch": 1249} {"train_loss": -39.57058334350586, "global_step": 151217, "epoch": 1249} {"train_loss": -38.613685607910156, "global_step": 151218, "epoch": 1249} {"train_loss": -39.72715377807617, "global_step": 151219, "epoch": 1249} {"train_loss": -39.58951950073242, "global_step": 151220, "epoch": 1249} {"train_loss": -38.149940490722656, "global_step": 151221, "epoch": 1249} {"train_loss": -36.82108688354492, "global_step": 151222, "epoch": 1249} {"train_loss": -37.031978607177734, "global_step": 151223, "epoch": 1249} {"train_loss": -39.206974029541016, "global_step": 151224, "epoch": 1249} {"train_loss": -39.86326217651367, "global_step": 151225, "epoch": 1249} {"train_loss": -39.04574203491211, "global_step": 151226, "epoch": 1249} {"train_loss": -39.09690475463867, "global_step": 151227, "epoch": 1249} {"train_loss": -39.33443069458008, "global_step": 151228, "epoch": 1249} {"train_loss": -39.718441009521484, "global_step": 151229, "epoch": 1249} {"train_loss": -39.231201171875, "global_step": 151230, "epoch": 1249} {"train_loss": -39.39592361450195, "global_step": 151231, "epoch": 1249} {"train_loss": -39.423641204833984, "global_step": 151232, "epoch": 1249} {"train_loss": -38.24917221069336, "global_step": 151233, "epoch": 1249} {"train_loss": -37.7638053894043, "global_step": 151234, "epoch": 1249} {"train_loss": -39.87689208984375, "global_step": 151235, "epoch": 1249} {"train_loss": -39.19199752807617, "global_step": 151236, "epoch": 1249} {"train_loss": -39.3071403503418, "global_step": 151237, "epoch": 1249} {"train_loss": -40.04838180541992, "global_step": 151238, "epoch": 1249} {"train_loss": -38.63212966918945, "global_step": 151239, "epoch": 1249} {"train_loss": -38.231971740722656, "global_step": 151240, "epoch": 1249} {"train_loss": -37.045101165771484, "global_step": 151241, "epoch": 1249} {"train_loss": -37.21925354003906, "global_step": 151242, "epoch": 1249} {"train_loss": -38.436824798583984, "global_step": 151243, "epoch": 1249} {"train_loss": -38.45588302612305, "global_step": 151244, "epoch": 1249} {"train_loss": -39.46845245361328, "global_step": 151245, "epoch": 1249} {"train_loss": -38.366641998291016, "global_step": 151246, "epoch": 1249} {"train_loss": -38.99737548828125, "global_step": 151247, "epoch": 1249} {"train_loss": -36.920040130615234, "global_step": 151248, "epoch": 1249} {"train_loss": -38.69041133912142, "global_step": 151249, "epoch": 1249, "val_loss": 2501045.0} {"train_loss": -37.89064407348633, "global_step": 151250, "epoch": 1250} {"train_loss": -36.430999755859375, "global_step": 151251, "epoch": 1250} {"train_loss": -39.043434143066406, "global_step": 151252, "epoch": 1250} {"train_loss": -39.62504577636719, "global_step": 151253, "epoch": 1250} {"train_loss": -37.531673431396484, "global_step": 151254, "epoch": 1250} {"train_loss": -37.19785690307617, "global_step": 151255, "epoch": 1250} {"train_loss": -38.61588668823242, "global_step": 151256, "epoch": 1250} {"train_loss": -38.1900749206543, "global_step": 151257, "epoch": 1250} {"train_loss": -38.65126419067383, "global_step": 151258, "epoch": 1250} {"train_loss": -37.340702056884766, "global_step": 151259, "epoch": 1250} {"train_loss": -38.49692916870117, "global_step": 151260, "epoch": 1250} {"train_loss": -37.771297454833984, "global_step": 151261, "epoch": 1250} {"train_loss": -37.96876907348633, "global_step": 151262, "epoch": 1250} {"train_loss": -36.837032318115234, "global_step": 151263, "epoch": 1250} {"train_loss": -36.708595275878906, "global_step": 151264, "epoch": 1250} {"train_loss": -38.047637939453125, "global_step": 151265, "epoch": 1250} {"train_loss": -37.51968002319336, "global_step": 151266, "epoch": 1250} {"train_loss": -37.28654098510742, "global_step": 151267, "epoch": 1250} {"train_loss": -37.879638671875, "global_step": 151268, "epoch": 1250} {"train_loss": -38.100311279296875, "global_step": 151269, "epoch": 1250} {"train_loss": -38.54465866088867, "global_step": 151270, "epoch": 1250} {"train_loss": -39.2534294128418, "global_step": 151271, "epoch": 1250} {"train_loss": -38.62789535522461, "global_step": 151272, "epoch": 1250} {"train_loss": -37.79046630859375, "global_step": 151273, "epoch": 1250} {"train_loss": -38.092655181884766, "global_step": 151274, "epoch": 1250} {"train_loss": -36.859703063964844, "global_step": 151275, "epoch": 1250} {"train_loss": -38.501075744628906, "global_step": 151276, "epoch": 1250} {"train_loss": -39.459571838378906, "global_step": 151277, "epoch": 1250} {"train_loss": -37.7818717956543, "global_step": 151278, "epoch": 1250} {"train_loss": -37.14753341674805, "global_step": 151279, "epoch": 1250} {"train_loss": -37.92849349975586, "global_step": 151280, "epoch": 1250} {"train_loss": -38.17240524291992, "global_step": 151281, "epoch": 1250} {"train_loss": -37.90704345703125, "global_step": 151282, "epoch": 1250} {"train_loss": -39.0058479309082, "global_step": 151283, "epoch": 1250} {"train_loss": -36.23059844970703, "global_step": 151284, "epoch": 1250} {"train_loss": -38.959678649902344, "global_step": 151285, "epoch": 1250} {"train_loss": -38.17323303222656, "global_step": 151286, "epoch": 1250} {"train_loss": -38.469017028808594, "global_step": 151287, "epoch": 1250} {"train_loss": -37.16782760620117, "global_step": 151288, "epoch": 1250} {"train_loss": -38.04742431640625, "global_step": 151289, "epoch": 1250} {"train_loss": -37.354427337646484, "global_step": 151290, "epoch": 1250} {"train_loss": -38.00535202026367, "global_step": 151291, "epoch": 1250} {"train_loss": -39.11436080932617, "global_step": 151292, "epoch": 1250} {"train_loss": -36.33427047729492, "global_step": 151293, "epoch": 1250} {"train_loss": -37.53005599975586, "global_step": 151294, "epoch": 1250} {"train_loss": -36.89598083496094, "global_step": 151295, "epoch": 1250} {"train_loss": -39.04650115966797, "global_step": 151296, "epoch": 1250} {"train_loss": -36.6002311706543, "global_step": 151297, "epoch": 1250} {"train_loss": -37.971832275390625, "global_step": 151298, "epoch": 1250} {"train_loss": -37.3931884765625, "global_step": 151299, "epoch": 1250} {"train_loss": -36.112884521484375, "global_step": 151300, "epoch": 1250} {"train_loss": -37.93856430053711, "global_step": 151301, "epoch": 1250} {"train_loss": -38.23924255371094, "global_step": 151302, "epoch": 1250} {"train_loss": -37.11444091796875, "global_step": 151303, "epoch": 1250} {"train_loss": -35.63987350463867, "global_step": 151304, "epoch": 1250} {"train_loss": -36.22043991088867, "global_step": 151305, "epoch": 1250} {"train_loss": -37.19145584106445, "global_step": 151306, "epoch": 1250} {"train_loss": -37.590065002441406, "global_step": 151307, "epoch": 1250} {"train_loss": -36.52735137939453, "global_step": 151308, "epoch": 1250} {"train_loss": -37.73019027709961, "global_step": 151309, "epoch": 1250} {"train_loss": -37.17167282104492, "global_step": 151310, "epoch": 1250} {"train_loss": -33.91661834716797, "global_step": 151311, "epoch": 1250} {"train_loss": -37.04488754272461, "global_step": 151312, "epoch": 1250} {"train_loss": -35.3595085144043, "global_step": 151313, "epoch": 1250} {"train_loss": -38.32938766479492, "global_step": 151314, "epoch": 1250} {"train_loss": -36.768409729003906, "global_step": 151315, "epoch": 1250} {"train_loss": -37.8647346496582, "global_step": 151316, "epoch": 1250} {"train_loss": -35.08035659790039, "global_step": 151317, "epoch": 1250} {"train_loss": -37.77341842651367, "global_step": 151318, "epoch": 1250} {"train_loss": -35.44906997680664, "global_step": 151319, "epoch": 1250} {"train_loss": -36.053192138671875, "global_step": 151320, "epoch": 1250} {"train_loss": -34.2394905090332, "global_step": 151321, "epoch": 1250} {"train_loss": -37.5179328918457, "global_step": 151322, "epoch": 1250} {"train_loss": -35.21544647216797, "global_step": 151323, "epoch": 1250} {"train_loss": -36.99095153808594, "global_step": 151324, "epoch": 1250} {"train_loss": -36.484676361083984, "global_step": 151325, "epoch": 1250} {"train_loss": -37.39421463012695, "global_step": 151326, "epoch": 1250} {"train_loss": -35.63323974609375, "global_step": 151327, "epoch": 1250} {"train_loss": -37.968238830566406, "global_step": 151328, "epoch": 1250} {"train_loss": -35.28974533081055, "global_step": 151329, "epoch": 1250} {"train_loss": -37.12179183959961, "global_step": 151330, "epoch": 1250} {"train_loss": -36.05469512939453, "global_step": 151331, "epoch": 1250} {"train_loss": -36.86138916015625, "global_step": 151332, "epoch": 1250} {"train_loss": -35.51960372924805, "global_step": 151333, "epoch": 1250} {"train_loss": -37.286346435546875, "global_step": 151334, "epoch": 1250} {"train_loss": -36.4944953918457, "global_step": 151335, "epoch": 1250} {"train_loss": -37.2385368347168, "global_step": 151336, "epoch": 1250} {"train_loss": -38.2142333984375, "global_step": 151337, "epoch": 1250} {"train_loss": -37.57123565673828, "global_step": 151338, "epoch": 1250} {"train_loss": -36.43777084350586, "global_step": 151339, "epoch": 1250} {"train_loss": -35.67656326293945, "global_step": 151340, "epoch": 1250} {"train_loss": -37.80498123168945, "global_step": 151341, "epoch": 1250} {"train_loss": -35.651458740234375, "global_step": 151342, "epoch": 1250} {"train_loss": -36.32121658325195, "global_step": 151343, "epoch": 1250} {"train_loss": -38.191219329833984, "global_step": 151344, "epoch": 1250} {"train_loss": -37.54222869873047, "global_step": 151345, "epoch": 1250} {"train_loss": -36.9259147644043, "global_step": 151346, "epoch": 1250} {"train_loss": -37.524837493896484, "global_step": 151347, "epoch": 1250} {"train_loss": -36.75065612792969, "global_step": 151348, "epoch": 1250} {"train_loss": -37.7180290222168, "global_step": 151349, "epoch": 1250} {"train_loss": -38.05404281616211, "global_step": 151350, "epoch": 1250} {"train_loss": -37.067440032958984, "global_step": 151351, "epoch": 1250} {"train_loss": -37.876922607421875, "global_step": 151352, "epoch": 1250} {"train_loss": -38.1793098449707, "global_step": 151353, "epoch": 1250} {"train_loss": -37.6134147644043, "global_step": 151354, "epoch": 1250} {"train_loss": -37.066646575927734, "global_step": 151355, "epoch": 1250} {"train_loss": -38.11119842529297, "global_step": 151356, "epoch": 1250} {"train_loss": -38.406982421875, "global_step": 151357, "epoch": 1250} {"train_loss": -38.80064010620117, "global_step": 151358, "epoch": 1250} {"train_loss": -38.851890563964844, "global_step": 151359, "epoch": 1250} {"train_loss": -37.21628952026367, "global_step": 151360, "epoch": 1250} {"train_loss": -38.7592887878418, "global_step": 151361, "epoch": 1250} {"train_loss": -38.37360763549805, "global_step": 151362, "epoch": 1250} {"train_loss": -38.18781280517578, "global_step": 151363, "epoch": 1250} {"train_loss": -38.35829544067383, "global_step": 151364, "epoch": 1250} {"train_loss": -38.095149993896484, "global_step": 151365, "epoch": 1250} {"train_loss": -38.3194465637207, "global_step": 151366, "epoch": 1250} {"train_loss": -38.47024154663086, "global_step": 151367, "epoch": 1250} {"train_loss": -38.2009391784668, "global_step": 151368, "epoch": 1250} {"train_loss": -38.33501434326172, "global_step": 151369, "epoch": 1250} {"train_loss": -37.45910345030225, "global_step": 151370, "epoch": 1250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 0.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 2573524.75} {"train_loss": -38.57639694213867, "global_step": 151371, "epoch": 1251} {"train_loss": -38.76803207397461, "global_step": 151372, "epoch": 1251} {"train_loss": -38.5715217590332, "global_step": 151373, "epoch": 1251} {"train_loss": -39.077266693115234, "global_step": 151374, "epoch": 1251} {"train_loss": -38.776649475097656, "global_step": 151375, "epoch": 1251} {"train_loss": -38.86343002319336, "global_step": 151376, "epoch": 1251} {"train_loss": -38.84223556518555, "global_step": 151377, "epoch": 1251} {"train_loss": -39.02758026123047, "global_step": 151378, "epoch": 1251} {"train_loss": -37.96213150024414, "global_step": 151379, "epoch": 1251} {"train_loss": -37.532039642333984, "global_step": 151380, "epoch": 1251} {"train_loss": -36.14425277709961, "global_step": 151381, "epoch": 1251} {"train_loss": -35.4327507019043, "global_step": 151382, "epoch": 1251} {"train_loss": -36.86560821533203, "global_step": 151383, "epoch": 1251} {"train_loss": -38.536678314208984, "global_step": 151384, "epoch": 1251} {"train_loss": -39.210262298583984, "global_step": 151385, "epoch": 1251} {"train_loss": -36.94346237182617, "global_step": 151386, "epoch": 1251} {"train_loss": -38.34163284301758, "global_step": 151387, "epoch": 1251} {"train_loss": -38.92666244506836, "global_step": 151388, "epoch": 1251} {"train_loss": -37.59591293334961, "global_step": 151389, "epoch": 1251} {"train_loss": -37.10000228881836, "global_step": 151390, "epoch": 1251} {"train_loss": -39.070594787597656, "global_step": 151391, "epoch": 1251} {"train_loss": -38.09835433959961, "global_step": 151392, "epoch": 1251} {"train_loss": -38.887447357177734, "global_step": 151393, "epoch": 1251} {"train_loss": -38.393856048583984, "global_step": 151394, "epoch": 1251} {"train_loss": -38.516510009765625, "global_step": 151395, "epoch": 1251} {"train_loss": -38.57140350341797, "global_step": 151396, "epoch": 1251} {"train_loss": -35.13564682006836, "global_step": 151397, "epoch": 1251} {"train_loss": -38.5384635925293, "global_step": 151398, "epoch": 1251} {"train_loss": -38.082069396972656, "global_step": 151399, "epoch": 1251} {"train_loss": -37.869747161865234, "global_step": 151400, "epoch": 1251} {"train_loss": -38.283470153808594, "global_step": 151401, "epoch": 1251} {"train_loss": -38.42741775512695, "global_step": 151402, "epoch": 1251} {"train_loss": -39.1781120300293, "global_step": 151403, "epoch": 1251} {"train_loss": -38.342105865478516, "global_step": 151404, "epoch": 1251} {"train_loss": -36.35620880126953, "global_step": 151405, "epoch": 1251} {"train_loss": -39.07463073730469, "global_step": 151406, "epoch": 1251} {"train_loss": -35.27474594116211, "global_step": 151407, "epoch": 1251} {"train_loss": -38.75834274291992, "global_step": 151408, "epoch": 1251} {"train_loss": -38.47162628173828, "global_step": 151409, "epoch": 1251} {"train_loss": -35.938899993896484, "global_step": 151410, "epoch": 1251} {"train_loss": -39.1036376953125, "global_step": 151411, "epoch": 1251} {"train_loss": -37.06876754760742, "global_step": 151412, "epoch": 1251} {"train_loss": -38.9871826171875, "global_step": 151413, "epoch": 1251} {"train_loss": -39.083797454833984, "global_step": 151414, "epoch": 1251} {"train_loss": -39.47761154174805, "global_step": 151415, "epoch": 1251} {"train_loss": -38.99287033081055, "global_step": 151416, "epoch": 1251} {"train_loss": -39.0789909362793, "global_step": 151417, "epoch": 1251} {"train_loss": -36.67521286010742, "global_step": 151418, "epoch": 1251} {"train_loss": -38.50959777832031, "global_step": 151419, "epoch": 1251} {"train_loss": -39.04879379272461, "global_step": 151420, "epoch": 1251} {"train_loss": -37.06864929199219, "global_step": 151421, "epoch": 1251} {"train_loss": -38.78498077392578, "global_step": 151422, "epoch": 1251} {"train_loss": -38.05220031738281, "global_step": 151423, "epoch": 1251} {"train_loss": -38.45932388305664, "global_step": 151424, "epoch": 1251} {"train_loss": -36.537349700927734, "global_step": 151425, "epoch": 1251} {"train_loss": -38.87335205078125, "global_step": 151426, "epoch": 1251} {"train_loss": -38.45968246459961, "global_step": 151427, "epoch": 1251} {"train_loss": -37.96030807495117, "global_step": 151428, "epoch": 1251} {"train_loss": -37.52871322631836, "global_step": 151429, "epoch": 1251} {"train_loss": -38.649898529052734, "global_step": 151430, "epoch": 1251} {"train_loss": -38.6582145690918, "global_step": 151431, "epoch": 1251} {"train_loss": -37.020301818847656, "global_step": 151432, "epoch": 1251} {"train_loss": -37.93197250366211, "global_step": 151433, "epoch": 1251} {"train_loss": -38.12133026123047, "global_step": 151434, "epoch": 1251} {"train_loss": -37.882320404052734, "global_step": 151435, "epoch": 1251} {"train_loss": -38.27753448486328, "global_step": 151436, "epoch": 1251} {"train_loss": -36.801876068115234, "global_step": 151437, "epoch": 1251} {"train_loss": -37.407772064208984, "global_step": 151438, "epoch": 1251} {"train_loss": -34.23086929321289, "global_step": 151439, "epoch": 1251} {"train_loss": -39.454681396484375, "global_step": 151440, "epoch": 1251} {"train_loss": -38.492698669433594, "global_step": 151441, "epoch": 1251} {"train_loss": -38.88391876220703, "global_step": 151442, "epoch": 1251} {"train_loss": -38.99421691894531, "global_step": 151443, "epoch": 1251} {"train_loss": -38.55449295043945, "global_step": 151444, "epoch": 1251} {"train_loss": -38.72098159790039, "global_step": 151445, "epoch": 1251} {"train_loss": -38.090389251708984, "global_step": 151446, "epoch": 1251} {"train_loss": -37.49106979370117, "global_step": 151447, "epoch": 1251} {"train_loss": -38.86872482299805, "global_step": 151448, "epoch": 1251} {"train_loss": -39.49055099487305, "global_step": 151449, "epoch": 1251} {"train_loss": -39.2542610168457, "global_step": 151450, "epoch": 1251} {"train_loss": -38.70614242553711, "global_step": 151451, "epoch": 1251} {"train_loss": -39.401920318603516, "global_step": 151452, "epoch": 1251} {"train_loss": -37.96626663208008, "global_step": 151453, "epoch": 1251} {"train_loss": -38.895965576171875, "global_step": 151454, "epoch": 1251} {"train_loss": -38.594390869140625, "global_step": 151455, "epoch": 1251} {"train_loss": -39.335845947265625, "global_step": 151456, "epoch": 1251} {"train_loss": -38.54788589477539, "global_step": 151457, "epoch": 1251} {"train_loss": -38.84922790527344, "global_step": 151458, "epoch": 1251} {"train_loss": -38.543697357177734, "global_step": 151459, "epoch": 1251} {"train_loss": -39.10957336425781, "global_step": 151460, "epoch": 1251} {"train_loss": -38.75930404663086, "global_step": 151461, "epoch": 1251} {"train_loss": -38.238311767578125, "global_step": 151462, "epoch": 1251} {"train_loss": -39.33860397338867, "global_step": 151463, "epoch": 1251} {"train_loss": -39.0740852355957, "global_step": 151464, "epoch": 1251} {"train_loss": -38.53400421142578, "global_step": 151465, "epoch": 1251} {"train_loss": -38.38357162475586, "global_step": 151466, "epoch": 1251} {"train_loss": -39.07463836669922, "global_step": 151467, "epoch": 1251} {"train_loss": -38.68662643432617, "global_step": 151468, "epoch": 1251} {"train_loss": -39.21906280517578, "global_step": 151469, "epoch": 1251} {"train_loss": -39.24796676635742, "global_step": 151470, "epoch": 1251} {"train_loss": -39.206050872802734, "global_step": 151471, "epoch": 1251} {"train_loss": -39.81930160522461, "global_step": 151472, "epoch": 1251} {"train_loss": -39.7656364440918, "global_step": 151473, "epoch": 1251} {"train_loss": -39.20686340332031, "global_step": 151474, "epoch": 1251} {"train_loss": -39.10627365112305, "global_step": 151475, "epoch": 1251} {"train_loss": -39.40230178833008, "global_step": 151476, "epoch": 1251} {"train_loss": -40.11103820800781, "global_step": 151477, "epoch": 1251} {"train_loss": -39.83149337768555, "global_step": 151478, "epoch": 1251} {"train_loss": -38.99260330200195, "global_step": 151479, "epoch": 1251} {"train_loss": -39.964229583740234, "global_step": 151480, "epoch": 1251} {"train_loss": -39.62874221801758, "global_step": 151481, "epoch": 1251} {"train_loss": -39.965152740478516, "global_step": 151482, "epoch": 1251} {"train_loss": -39.340919494628906, "global_step": 151483, "epoch": 1251} {"train_loss": -40.16852569580078, "global_step": 151484, "epoch": 1251} {"train_loss": -40.28736114501953, "global_step": 151485, "epoch": 1251} {"train_loss": -39.664825439453125, "global_step": 151486, "epoch": 1251} {"train_loss": -39.48628616333008, "global_step": 151487, "epoch": 1251} {"train_loss": -37.45746994018555, "global_step": 151488, "epoch": 1251} {"train_loss": -35.8663330078125, "global_step": 151489, "epoch": 1251} {"train_loss": -36.404903411865234, "global_step": 151490, "epoch": 1251} {"train_loss": -38.428572757184995, "global_step": 151491, "epoch": 1251, "val_loss": 2612907.75} {"train_loss": -38.92707061767578, "global_step": 151492, "epoch": 1252} {"train_loss": -37.14234161376953, "global_step": 151493, "epoch": 1252} {"train_loss": -39.18413162231445, "global_step": 151494, "epoch": 1252} {"train_loss": -39.68687057495117, "global_step": 151495, "epoch": 1252} {"train_loss": -37.64370346069336, "global_step": 151496, "epoch": 1252} {"train_loss": -39.1786994934082, "global_step": 151497, "epoch": 1252} {"train_loss": -39.74747848510742, "global_step": 151498, "epoch": 1252} {"train_loss": -38.91707229614258, "global_step": 151499, "epoch": 1252} {"train_loss": -40.057579040527344, "global_step": 151500, "epoch": 1252} {"train_loss": -38.49896240234375, "global_step": 151501, "epoch": 1252} {"train_loss": -39.68321228027344, "global_step": 151502, "epoch": 1252} {"train_loss": -39.17806625366211, "global_step": 151503, "epoch": 1252} {"train_loss": -39.1219596862793, "global_step": 151504, "epoch": 1252} {"train_loss": -39.52903747558594, "global_step": 151505, "epoch": 1252} {"train_loss": -39.35617446899414, "global_step": 151506, "epoch": 1252} {"train_loss": -39.65202331542969, "global_step": 151507, "epoch": 1252} {"train_loss": -39.768978118896484, "global_step": 151508, "epoch": 1252} {"train_loss": -39.15760040283203, "global_step": 151509, "epoch": 1252} {"train_loss": -39.1100959777832, "global_step": 151510, "epoch": 1252} {"train_loss": -39.85151290893555, "global_step": 151511, "epoch": 1252} {"train_loss": -39.85700988769531, "global_step": 151512, "epoch": 1252} {"train_loss": -39.51778030395508, "global_step": 151513, "epoch": 1252} {"train_loss": -39.75071334838867, "global_step": 151514, "epoch": 1252} {"train_loss": -39.989688873291016, "global_step": 151515, "epoch": 1252} {"train_loss": -40.200958251953125, "global_step": 151516, "epoch": 1252} {"train_loss": -40.11402130126953, "global_step": 151517, "epoch": 1252} {"train_loss": -39.7816047668457, "global_step": 151518, "epoch": 1252} {"train_loss": -40.1557731628418, "global_step": 151519, "epoch": 1252} {"train_loss": -40.05070114135742, "global_step": 151520, "epoch": 1252} {"train_loss": -38.99812316894531, "global_step": 151521, "epoch": 1252} {"train_loss": -37.72121047973633, "global_step": 151522, "epoch": 1252} {"train_loss": -39.94111251831055, "global_step": 151523, "epoch": 1252} {"train_loss": -39.72878646850586, "global_step": 151524, "epoch": 1252} {"train_loss": -40.019737243652344, "global_step": 151525, "epoch": 1252} {"train_loss": -40.4128532409668, "global_step": 151526, "epoch": 1252} {"train_loss": -40.15018081665039, "global_step": 151527, "epoch": 1252} {"train_loss": -38.666297912597656, "global_step": 151528, "epoch": 1252} {"train_loss": -37.057674407958984, "global_step": 151529, "epoch": 1252} {"train_loss": -33.75291061401367, "global_step": 151530, "epoch": 1252} {"train_loss": -29.167266845703125, "global_step": 151531, "epoch": 1252} {"train_loss": -31.45206069946289, "global_step": 151532, "epoch": 1252} {"train_loss": -38.32771301269531, "global_step": 151533, "epoch": 1252} {"train_loss": -37.29319381713867, "global_step": 151534, "epoch": 1252} {"train_loss": -37.52019500732422, "global_step": 151535, "epoch": 1252} {"train_loss": -39.45595169067383, "global_step": 151536, "epoch": 1252} {"train_loss": -36.99028396606445, "global_step": 151537, "epoch": 1252} {"train_loss": -38.92979049682617, "global_step": 151538, "epoch": 1252} {"train_loss": -39.34869384765625, "global_step": 151539, "epoch": 1252} {"train_loss": -38.28825378417969, "global_step": 151540, "epoch": 1252} {"train_loss": -39.24259567260742, "global_step": 151541, "epoch": 1252} {"train_loss": -39.00434112548828, "global_step": 151542, "epoch": 1252} {"train_loss": -39.70391845703125, "global_step": 151543, "epoch": 1252} {"train_loss": -38.055938720703125, "global_step": 151544, "epoch": 1252} {"train_loss": -39.69807052612305, "global_step": 151545, "epoch": 1252} {"train_loss": -38.01225662231445, "global_step": 151546, "epoch": 1252} {"train_loss": -38.041778564453125, "global_step": 151547, "epoch": 1252} {"train_loss": -38.594940185546875, "global_step": 151548, "epoch": 1252} {"train_loss": -39.53762435913086, "global_step": 151549, "epoch": 1252} {"train_loss": -37.54334259033203, "global_step": 151550, "epoch": 1252} {"train_loss": -38.993408203125, "global_step": 151551, "epoch": 1252} {"train_loss": -38.55597686767578, "global_step": 151552, "epoch": 1252} {"train_loss": -37.26255798339844, "global_step": 151553, "epoch": 1252} {"train_loss": -38.80863571166992, "global_step": 151554, "epoch": 1252} {"train_loss": -39.16273880004883, "global_step": 151555, "epoch": 1252} {"train_loss": -39.05540466308594, "global_step": 151556, "epoch": 1252} {"train_loss": -38.15838623046875, "global_step": 151557, "epoch": 1252} {"train_loss": -37.31626510620117, "global_step": 151558, "epoch": 1252} {"train_loss": -37.79604721069336, "global_step": 151559, "epoch": 1252} {"train_loss": -39.02692794799805, "global_step": 151560, "epoch": 1252} {"train_loss": -39.25925064086914, "global_step": 151561, "epoch": 1252} {"train_loss": -37.925331115722656, "global_step": 151562, "epoch": 1252} {"train_loss": -35.72944259643555, "global_step": 151563, "epoch": 1252} {"train_loss": -36.71858596801758, "global_step": 151564, "epoch": 1252} {"train_loss": -36.37017059326172, "global_step": 151565, "epoch": 1252} {"train_loss": -28.276676177978516, "global_step": 151566, "epoch": 1252} {"train_loss": -29.9576416015625, "global_step": 151567, "epoch": 1252} {"train_loss": -35.620357513427734, "global_step": 151568, "epoch": 1252} {"train_loss": -22.295774459838867, "global_step": 151569, "epoch": 1252} {"train_loss": -33.52863693237305, "global_step": 151570, "epoch": 1252} {"train_loss": -25.529491424560547, "global_step": 151571, "epoch": 1252} {"train_loss": -15.278635025024414, "global_step": 151572, "epoch": 1252} {"train_loss": -35.328426361083984, "global_step": 151573, "epoch": 1252} {"train_loss": -35.5186882019043, "global_step": 151574, "epoch": 1252} {"train_loss": -14.423033714294434, "global_step": 151575, "epoch": 1252} {"train_loss": -22.383920669555664, "global_step": 151576, "epoch": 1252} {"train_loss": -27.48838233947754, "global_step": 151577, "epoch": 1252} {"train_loss": -31.248571395874023, "global_step": 151578, "epoch": 1252} {"train_loss": -30.222036361694336, "global_step": 151579, "epoch": 1252} {"train_loss": -29.314844131469727, "global_step": 151580, "epoch": 1252} {"train_loss": -26.9172306060791, "global_step": 151581, "epoch": 1252} {"train_loss": -31.2265625, "global_step": 151582, "epoch": 1252} {"train_loss": -27.922727584838867, "global_step": 151583, "epoch": 1252} {"train_loss": -34.5803337097168, "global_step": 151584, "epoch": 1252} {"train_loss": -30.080350875854492, "global_step": 151585, "epoch": 1252} {"train_loss": -32.192874908447266, "global_step": 151586, "epoch": 1252} {"train_loss": -31.878549575805664, "global_step": 151587, "epoch": 1252} {"train_loss": -30.908246994018555, "global_step": 151588, "epoch": 1252} {"train_loss": -32.765281677246094, "global_step": 151589, "epoch": 1252} {"train_loss": -30.3102970123291, "global_step": 151590, "epoch": 1252} {"train_loss": -32.98096466064453, "global_step": 151591, "epoch": 1252} {"train_loss": -34.18305206298828, "global_step": 151592, "epoch": 1252} {"train_loss": -34.67057418823242, "global_step": 151593, "epoch": 1252} {"train_loss": -34.58774948120117, "global_step": 151594, "epoch": 1252} {"train_loss": -34.98789596557617, "global_step": 151595, "epoch": 1252} {"train_loss": -35.660179138183594, "global_step": 151596, "epoch": 1252} {"train_loss": -33.450927734375, "global_step": 151597, "epoch": 1252} {"train_loss": -34.09432601928711, "global_step": 151598, "epoch": 1252} {"train_loss": -34.7916145324707, "global_step": 151599, "epoch": 1252} {"train_loss": -35.387996673583984, "global_step": 151600, "epoch": 1252} {"train_loss": -35.32072830200195, "global_step": 151601, "epoch": 1252} {"train_loss": -36.14501953125, "global_step": 151602, "epoch": 1252} {"train_loss": -35.7067756652832, "global_step": 151603, "epoch": 1252} {"train_loss": -35.601715087890625, "global_step": 151604, "epoch": 1252} {"train_loss": -35.43513107299805, "global_step": 151605, "epoch": 1252} {"train_loss": -34.903263092041016, "global_step": 151606, "epoch": 1252} {"train_loss": -36.09479904174805, "global_step": 151607, "epoch": 1252} {"train_loss": -35.71312713623047, "global_step": 151608, "epoch": 1252} {"train_loss": -36.285640716552734, "global_step": 151609, "epoch": 1252} {"train_loss": -35.42530059814453, "global_step": 151610, "epoch": 1252} {"train_loss": -36.665565490722656, "global_step": 151611, "epoch": 1252} {"train_loss": -35.980177453726775, "global_step": 151612, "epoch": 1252, "val_loss": 2656157.0} {"train_loss": -36.544532775878906, "global_step": 151613, "epoch": 1253} {"train_loss": -36.39588928222656, "global_step": 151614, "epoch": 1253} {"train_loss": -36.80350875854492, "global_step": 151615, "epoch": 1253} {"train_loss": -35.477455139160156, "global_step": 151616, "epoch": 1253} {"train_loss": -36.356441497802734, "global_step": 151617, "epoch": 1253} {"train_loss": -35.977256774902344, "global_step": 151618, "epoch": 1253} {"train_loss": -36.2835578918457, "global_step": 151619, "epoch": 1253} {"train_loss": -36.38533401489258, "global_step": 151620, "epoch": 1253} {"train_loss": -36.415531158447266, "global_step": 151621, "epoch": 1253} {"train_loss": -36.67581558227539, "global_step": 151622, "epoch": 1253} {"train_loss": -36.88633728027344, "global_step": 151623, "epoch": 1253} {"train_loss": -36.85932159423828, "global_step": 151624, "epoch": 1253} {"train_loss": -36.07526397705078, "global_step": 151625, "epoch": 1253} {"train_loss": -36.771141052246094, "global_step": 151626, "epoch": 1253} {"train_loss": -37.1391487121582, "global_step": 151627, "epoch": 1253} {"train_loss": -37.15947723388672, "global_step": 151628, "epoch": 1253} {"train_loss": -37.08173370361328, "global_step": 151629, "epoch": 1253} {"train_loss": -36.92625045776367, "global_step": 151630, "epoch": 1253} {"train_loss": -36.91872787475586, "global_step": 151631, "epoch": 1253} {"train_loss": -37.128902435302734, "global_step": 151632, "epoch": 1253} {"train_loss": -37.31528091430664, "global_step": 151633, "epoch": 1253} {"train_loss": -37.303070068359375, "global_step": 151634, "epoch": 1253} {"train_loss": -37.779048919677734, "global_step": 151635, "epoch": 1253} {"train_loss": -38.078975677490234, "global_step": 151636, "epoch": 1253} {"train_loss": -37.10781478881836, "global_step": 151637, "epoch": 1253} {"train_loss": -37.827056884765625, "global_step": 151638, "epoch": 1253} {"train_loss": -37.532527923583984, "global_step": 151639, "epoch": 1253} {"train_loss": -37.53379440307617, "global_step": 151640, "epoch": 1253} {"train_loss": -37.69450759887695, "global_step": 151641, "epoch": 1253} {"train_loss": -37.69140625, "global_step": 151642, "epoch": 1253} {"train_loss": -37.64553451538086, "global_step": 151643, "epoch": 1253} {"train_loss": -37.63438034057617, "global_step": 151644, "epoch": 1253} {"train_loss": -37.330352783203125, "global_step": 151645, "epoch": 1253} {"train_loss": -38.01278305053711, "global_step": 151646, "epoch": 1253} {"train_loss": -37.91852569580078, "global_step": 151647, "epoch": 1253} {"train_loss": -37.94403839111328, "global_step": 151648, "epoch": 1253} {"train_loss": -38.21588134765625, "global_step": 151649, "epoch": 1253} {"train_loss": -37.64631271362305, "global_step": 151650, "epoch": 1253} {"train_loss": -37.78290939331055, "global_step": 151651, "epoch": 1253} {"train_loss": -38.49482727050781, "global_step": 151652, "epoch": 1253} {"train_loss": -37.90156173706055, "global_step": 151653, "epoch": 1253} {"train_loss": -38.41273880004883, "global_step": 151654, "epoch": 1253} {"train_loss": -38.74242401123047, "global_step": 151655, "epoch": 1253} {"train_loss": -38.305999755859375, "global_step": 151656, "epoch": 1253} {"train_loss": -37.95918655395508, "global_step": 151657, "epoch": 1253} {"train_loss": -38.19720458984375, "global_step": 151658, "epoch": 1253} {"train_loss": -38.59487533569336, "global_step": 151659, "epoch": 1253} {"train_loss": -38.486392974853516, "global_step": 151660, "epoch": 1253} {"train_loss": -38.440155029296875, "global_step": 151661, "epoch": 1253} {"train_loss": -38.65983200073242, "global_step": 151662, "epoch": 1253} {"train_loss": -38.04753112792969, "global_step": 151663, "epoch": 1253} {"train_loss": -38.44386291503906, "global_step": 151664, "epoch": 1253} {"train_loss": -38.705810546875, "global_step": 151665, "epoch": 1253} {"train_loss": -38.56239318847656, "global_step": 151666, "epoch": 1253} {"train_loss": -38.69404983520508, "global_step": 151667, "epoch": 1253} {"train_loss": -38.79276657104492, "global_step": 151668, "epoch": 1253} {"train_loss": -38.5671501159668, "global_step": 151669, "epoch": 1253} {"train_loss": -38.91534423828125, "global_step": 151670, "epoch": 1253} {"train_loss": -38.667457580566406, "global_step": 151671, "epoch": 1253} {"train_loss": -38.50136184692383, "global_step": 151672, "epoch": 1253} {"train_loss": -39.150936126708984, "global_step": 151673, "epoch": 1253} {"train_loss": -38.53751754760742, "global_step": 151674, "epoch": 1253} {"train_loss": -38.622737884521484, "global_step": 151675, "epoch": 1253} {"train_loss": -39.00033187866211, "global_step": 151676, "epoch": 1253} {"train_loss": -38.97399139404297, "global_step": 151677, "epoch": 1253} {"train_loss": -38.890655517578125, "global_step": 151678, "epoch": 1253} {"train_loss": -39.139869689941406, "global_step": 151679, "epoch": 1253} {"train_loss": -39.17433547973633, "global_step": 151680, "epoch": 1253} {"train_loss": -38.76729965209961, "global_step": 151681, "epoch": 1253} {"train_loss": -38.52964401245117, "global_step": 151682, "epoch": 1253} {"train_loss": -39.27943801879883, "global_step": 151683, "epoch": 1253} {"train_loss": -39.0009651184082, "global_step": 151684, "epoch": 1253} {"train_loss": -38.56645965576172, "global_step": 151685, "epoch": 1253} {"train_loss": -39.14377975463867, "global_step": 151686, "epoch": 1253} {"train_loss": -38.60452651977539, "global_step": 151687, "epoch": 1253} {"train_loss": -39.71896743774414, "global_step": 151688, "epoch": 1253} {"train_loss": -38.87040328979492, "global_step": 151689, "epoch": 1253} {"train_loss": -38.85051345825195, "global_step": 151690, "epoch": 1253} {"train_loss": -39.10333251953125, "global_step": 151691, "epoch": 1253} {"train_loss": -39.029354095458984, "global_step": 151692, "epoch": 1253} {"train_loss": -39.053070068359375, "global_step": 151693, "epoch": 1253} {"train_loss": -39.1179313659668, "global_step": 151694, "epoch": 1253} {"train_loss": -38.87388229370117, "global_step": 151695, "epoch": 1253} {"train_loss": -38.84577941894531, "global_step": 151696, "epoch": 1253} {"train_loss": -38.81868362426758, "global_step": 151697, "epoch": 1253} {"train_loss": -39.42268753051758, "global_step": 151698, "epoch": 1253} {"train_loss": -38.56474685668945, "global_step": 151699, "epoch": 1253} {"train_loss": -38.96222686767578, "global_step": 151700, "epoch": 1253} {"train_loss": -38.705806732177734, "global_step": 151701, "epoch": 1253} {"train_loss": -38.40932846069336, "global_step": 151702, "epoch": 1253} {"train_loss": -34.907283782958984, "global_step": 151703, "epoch": 1253} {"train_loss": -32.34055709838867, "global_step": 151704, "epoch": 1253} {"train_loss": -29.3184757232666, "global_step": 151705, "epoch": 1253} {"train_loss": -31.0565128326416, "global_step": 151706, "epoch": 1253} {"train_loss": -37.58264923095703, "global_step": 151707, "epoch": 1253} {"train_loss": -37.144927978515625, "global_step": 151708, "epoch": 1253} {"train_loss": -34.30836868286133, "global_step": 151709, "epoch": 1253} {"train_loss": -36.81926345825195, "global_step": 151710, "epoch": 1253} {"train_loss": -35.415184020996094, "global_step": 151711, "epoch": 1253} {"train_loss": -34.67551803588867, "global_step": 151712, "epoch": 1253} {"train_loss": -37.3643913269043, "global_step": 151713, "epoch": 1253} {"train_loss": -33.04916000366211, "global_step": 151714, "epoch": 1253} {"train_loss": -38.888336181640625, "global_step": 151715, "epoch": 1253} {"train_loss": -35.2023811340332, "global_step": 151716, "epoch": 1253} {"train_loss": -38.21189498901367, "global_step": 151717, "epoch": 1253} {"train_loss": -36.10276794433594, "global_step": 151718, "epoch": 1253} {"train_loss": -38.20268249511719, "global_step": 151719, "epoch": 1253} {"train_loss": -37.6954345703125, "global_step": 151720, "epoch": 1253} {"train_loss": -38.953407287597656, "global_step": 151721, "epoch": 1253} {"train_loss": -37.55912399291992, "global_step": 151722, "epoch": 1253} {"train_loss": -37.316429138183594, "global_step": 151723, "epoch": 1253} {"train_loss": -37.57283401489258, "global_step": 151724, "epoch": 1253} {"train_loss": -38.633758544921875, "global_step": 151725, "epoch": 1253} {"train_loss": -38.940711975097656, "global_step": 151726, "epoch": 1253} {"train_loss": -38.72703552246094, "global_step": 151727, "epoch": 1253} {"train_loss": -39.13747024536133, "global_step": 151728, "epoch": 1253} {"train_loss": -38.39313888549805, "global_step": 151729, "epoch": 1253} {"train_loss": -39.196693420410156, "global_step": 151730, "epoch": 1253} {"train_loss": -39.11450958251953, "global_step": 151731, "epoch": 1253} {"train_loss": -38.93668746948242, "global_step": 151732, "epoch": 1253} {"train_loss": -37.71999885622135, "global_step": 151733, "epoch": 1253, "val_loss": 2756438.0} {"train_loss": -38.952606201171875, "global_step": 151734, "epoch": 1254} {"train_loss": -39.284366607666016, "global_step": 151735, "epoch": 1254} {"train_loss": -38.99440383911133, "global_step": 151736, "epoch": 1254} {"train_loss": -39.24623489379883, "global_step": 151737, "epoch": 1254} {"train_loss": -39.5859489440918, "global_step": 151738, "epoch": 1254} {"train_loss": -39.019866943359375, "global_step": 151739, "epoch": 1254} {"train_loss": -39.32871627807617, "global_step": 151740, "epoch": 1254} {"train_loss": -39.50083541870117, "global_step": 151741, "epoch": 1254} {"train_loss": -39.007904052734375, "global_step": 151742, "epoch": 1254} {"train_loss": -39.232425689697266, "global_step": 151743, "epoch": 1254} {"train_loss": -39.235809326171875, "global_step": 151744, "epoch": 1254} {"train_loss": -39.45185470581055, "global_step": 151745, "epoch": 1254} {"train_loss": -39.9435920715332, "global_step": 151746, "epoch": 1254} {"train_loss": -39.94444274902344, "global_step": 151747, "epoch": 1254} {"train_loss": -39.687652587890625, "global_step": 151748, "epoch": 1254} {"train_loss": -39.91474533081055, "global_step": 151749, "epoch": 1254} {"train_loss": -39.796512603759766, "global_step": 151750, "epoch": 1254} {"train_loss": -39.680145263671875, "global_step": 151751, "epoch": 1254} {"train_loss": -40.0490837097168, "global_step": 151752, "epoch": 1254} {"train_loss": -39.573516845703125, "global_step": 151753, "epoch": 1254} {"train_loss": -39.7542839050293, "global_step": 151754, "epoch": 1254} {"train_loss": -39.9023551940918, "global_step": 151755, "epoch": 1254} {"train_loss": -39.79183578491211, "global_step": 151756, "epoch": 1254} {"train_loss": -40.18461990356445, "global_step": 151757, "epoch": 1254} {"train_loss": -39.62914276123047, "global_step": 151758, "epoch": 1254} {"train_loss": -39.808956146240234, "global_step": 151759, "epoch": 1254} {"train_loss": -39.67087936401367, "global_step": 151760, "epoch": 1254} {"train_loss": -39.833091735839844, "global_step": 151761, "epoch": 1254} {"train_loss": -40.22557067871094, "global_step": 151762, "epoch": 1254} {"train_loss": -39.53302764892578, "global_step": 151763, "epoch": 1254} {"train_loss": -40.09051513671875, "global_step": 151764, "epoch": 1254} {"train_loss": -39.98328399658203, "global_step": 151765, "epoch": 1254} {"train_loss": -40.099761962890625, "global_step": 151766, "epoch": 1254} {"train_loss": -39.65571212768555, "global_step": 151767, "epoch": 1254} {"train_loss": -38.982398986816406, "global_step": 151768, "epoch": 1254} {"train_loss": -39.618812561035156, "global_step": 151769, "epoch": 1254} {"train_loss": -39.72111892700195, "global_step": 151770, "epoch": 1254} {"train_loss": -39.350948333740234, "global_step": 151771, "epoch": 1254} {"train_loss": -39.7130012512207, "global_step": 151772, "epoch": 1254} {"train_loss": -39.79291534423828, "global_step": 151773, "epoch": 1254} {"train_loss": -39.126399993896484, "global_step": 151774, "epoch": 1254} {"train_loss": -39.34469223022461, "global_step": 151775, "epoch": 1254} {"train_loss": -39.85207748413086, "global_step": 151776, "epoch": 1254} {"train_loss": -38.196720123291016, "global_step": 151777, "epoch": 1254} {"train_loss": -36.2978630065918, "global_step": 151778, "epoch": 1254} {"train_loss": -38.33120346069336, "global_step": 151779, "epoch": 1254} {"train_loss": -39.93818664550781, "global_step": 151780, "epoch": 1254} {"train_loss": -39.79592514038086, "global_step": 151781, "epoch": 1254} {"train_loss": -40.135372161865234, "global_step": 151782, "epoch": 1254} {"train_loss": -39.27405548095703, "global_step": 151783, "epoch": 1254} {"train_loss": -39.65788650512695, "global_step": 151784, "epoch": 1254} {"train_loss": -39.05836868286133, "global_step": 151785, "epoch": 1254} {"train_loss": -39.09342956542969, "global_step": 151786, "epoch": 1254} {"train_loss": -39.67477035522461, "global_step": 151787, "epoch": 1254} {"train_loss": -40.469635009765625, "global_step": 151788, "epoch": 1254} {"train_loss": -39.88914108276367, "global_step": 151789, "epoch": 1254} {"train_loss": -40.06842041015625, "global_step": 151790, "epoch": 1254} {"train_loss": -37.9588737487793, "global_step": 151791, "epoch": 1254} {"train_loss": -36.87725830078125, "global_step": 151792, "epoch": 1254} {"train_loss": -33.858150482177734, "global_step": 151793, "epoch": 1254} {"train_loss": -35.62702941894531, "global_step": 151794, "epoch": 1254} {"train_loss": -40.100807189941406, "global_step": 151795, "epoch": 1254} {"train_loss": -37.54813766479492, "global_step": 151796, "epoch": 1254} {"train_loss": -37.84709930419922, "global_step": 151797, "epoch": 1254} {"train_loss": -40.045162200927734, "global_step": 151798, "epoch": 1254} {"train_loss": -39.2758903503418, "global_step": 151799, "epoch": 1254} {"train_loss": -38.4375, "global_step": 151800, "epoch": 1254} {"train_loss": -39.67055892944336, "global_step": 151801, "epoch": 1254} {"train_loss": -38.63856506347656, "global_step": 151802, "epoch": 1254} {"train_loss": -38.136199951171875, "global_step": 151803, "epoch": 1254} {"train_loss": -39.215614318847656, "global_step": 151804, "epoch": 1254} {"train_loss": -39.39789962768555, "global_step": 151805, "epoch": 1254} {"train_loss": -38.497840881347656, "global_step": 151806, "epoch": 1254} {"train_loss": -38.7050666809082, "global_step": 151807, "epoch": 1254} {"train_loss": -38.31929397583008, "global_step": 151808, "epoch": 1254} {"train_loss": -39.89796447753906, "global_step": 151809, "epoch": 1254} {"train_loss": -37.17987823486328, "global_step": 151810, "epoch": 1254} {"train_loss": -37.09943771362305, "global_step": 151811, "epoch": 1254} {"train_loss": -36.512081146240234, "global_step": 151812, "epoch": 1254} {"train_loss": -38.08661651611328, "global_step": 151813, "epoch": 1254} {"train_loss": -38.26072692871094, "global_step": 151814, "epoch": 1254} {"train_loss": -38.4991569519043, "global_step": 151815, "epoch": 1254} {"train_loss": -33.76253890991211, "global_step": 151816, "epoch": 1254} {"train_loss": -38.00986862182617, "global_step": 151817, "epoch": 1254} {"train_loss": -38.126922607421875, "global_step": 151818, "epoch": 1254} {"train_loss": -36.44480895996094, "global_step": 151819, "epoch": 1254} {"train_loss": -37.682098388671875, "global_step": 151820, "epoch": 1254} {"train_loss": -38.75623321533203, "global_step": 151821, "epoch": 1254} {"train_loss": -38.346107482910156, "global_step": 151822, "epoch": 1254} {"train_loss": -37.67791748046875, "global_step": 151823, "epoch": 1254} {"train_loss": -39.07826614379883, "global_step": 151824, "epoch": 1254} {"train_loss": -38.989627838134766, "global_step": 151825, "epoch": 1254} {"train_loss": -37.86037063598633, "global_step": 151826, "epoch": 1254} {"train_loss": -39.89500045776367, "global_step": 151827, "epoch": 1254} {"train_loss": -39.27370071411133, "global_step": 151828, "epoch": 1254} {"train_loss": -39.25864028930664, "global_step": 151829, "epoch": 1254} {"train_loss": -39.98270797729492, "global_step": 151830, "epoch": 1254} {"train_loss": -39.0109748840332, "global_step": 151831, "epoch": 1254} {"train_loss": -39.9034538269043, "global_step": 151832, "epoch": 1254} {"train_loss": -38.891841888427734, "global_step": 151833, "epoch": 1254} {"train_loss": -39.69429397583008, "global_step": 151834, "epoch": 1254} {"train_loss": -38.727210998535156, "global_step": 151835, "epoch": 1254} {"train_loss": -39.48957443237305, "global_step": 151836, "epoch": 1254} {"train_loss": -38.7474250793457, "global_step": 151837, "epoch": 1254} {"train_loss": -39.5799560546875, "global_step": 151838, "epoch": 1254} {"train_loss": -38.56809616088867, "global_step": 151839, "epoch": 1254} {"train_loss": -39.97148513793945, "global_step": 151840, "epoch": 1254} {"train_loss": -38.88644027709961, "global_step": 151841, "epoch": 1254} {"train_loss": -40.225746154785156, "global_step": 151842, "epoch": 1254} {"train_loss": -39.28554916381836, "global_step": 151843, "epoch": 1254} {"train_loss": -40.1064567565918, "global_step": 151844, "epoch": 1254} {"train_loss": -39.44165802001953, "global_step": 151845, "epoch": 1254} {"train_loss": -40.01487731933594, "global_step": 151846, "epoch": 1254} {"train_loss": -39.630428314208984, "global_step": 151847, "epoch": 1254} {"train_loss": -39.94153594970703, "global_step": 151848, "epoch": 1254} {"train_loss": -39.58484649658203, "global_step": 151849, "epoch": 1254} {"train_loss": -39.90724563598633, "global_step": 151850, "epoch": 1254} {"train_loss": -40.00242233276367, "global_step": 151851, "epoch": 1254} {"train_loss": -40.10455322265625, "global_step": 151852, "epoch": 1254} {"train_loss": -39.70486068725586, "global_step": 151853, "epoch": 1254} {"train_loss": -39.08859022786795, "global_step": 151854, "epoch": 1254, "val_loss": 2630458.75} {"train_loss": -39.579402923583984, "global_step": 151855, "epoch": 1255} {"train_loss": -40.30558776855469, "global_step": 151856, "epoch": 1255} {"train_loss": -40.037906646728516, "global_step": 151857, "epoch": 1255} {"train_loss": -40.61402893066406, "global_step": 151858, "epoch": 1255} {"train_loss": -40.59267044067383, "global_step": 151859, "epoch": 1255} {"train_loss": -40.256370544433594, "global_step": 151860, "epoch": 1255} {"train_loss": -40.49894714355469, "global_step": 151861, "epoch": 1255} {"train_loss": -41.009765625, "global_step": 151862, "epoch": 1255} {"train_loss": -40.23080062866211, "global_step": 151863, "epoch": 1255} {"train_loss": -40.66791915893555, "global_step": 151864, "epoch": 1255} {"train_loss": -40.47394943237305, "global_step": 151865, "epoch": 1255} {"train_loss": -40.94242477416992, "global_step": 151866, "epoch": 1255} {"train_loss": -40.65117263793945, "global_step": 151867, "epoch": 1255} {"train_loss": -40.366634368896484, "global_step": 151868, "epoch": 1255} {"train_loss": -40.590248107910156, "global_step": 151869, "epoch": 1255} {"train_loss": -40.4036865234375, "global_step": 151870, "epoch": 1255} {"train_loss": -40.7001953125, "global_step": 151871, "epoch": 1255} {"train_loss": -40.669918060302734, "global_step": 151872, "epoch": 1255} {"train_loss": -40.83966064453125, "global_step": 151873, "epoch": 1255} {"train_loss": -41.055877685546875, "global_step": 151874, "epoch": 1255} {"train_loss": -40.39104080200195, "global_step": 151875, "epoch": 1255} {"train_loss": -40.87910842895508, "global_step": 151876, "epoch": 1255} {"train_loss": -40.586181640625, "global_step": 151877, "epoch": 1255} {"train_loss": -39.156917572021484, "global_step": 151878, "epoch": 1255} {"train_loss": -39.540401458740234, "global_step": 151879, "epoch": 1255} {"train_loss": -40.5742073059082, "global_step": 151880, "epoch": 1255} {"train_loss": -40.531124114990234, "global_step": 151881, "epoch": 1255} {"train_loss": -40.36786651611328, "global_step": 151882, "epoch": 1255} {"train_loss": -40.51762771606445, "global_step": 151883, "epoch": 1255} {"train_loss": -40.82597732543945, "global_step": 151884, "epoch": 1255} {"train_loss": -40.70412826538086, "global_step": 151885, "epoch": 1255} {"train_loss": -41.0797233581543, "global_step": 151886, "epoch": 1255} {"train_loss": -40.970149993896484, "global_step": 151887, "epoch": 1255} {"train_loss": -41.01272201538086, "global_step": 151888, "epoch": 1255} {"train_loss": -40.56724166870117, "global_step": 151889, "epoch": 1255} {"train_loss": -40.20815658569336, "global_step": 151890, "epoch": 1255} {"train_loss": -39.59298324584961, "global_step": 151891, "epoch": 1255} {"train_loss": -38.49787902832031, "global_step": 151892, "epoch": 1255} {"train_loss": -36.58108901977539, "global_step": 151893, "epoch": 1255} {"train_loss": -36.176448822021484, "global_step": 151894, "epoch": 1255} {"train_loss": -38.27199935913086, "global_step": 151895, "epoch": 1255} {"train_loss": -38.20024490356445, "global_step": 151896, "epoch": 1255} {"train_loss": -36.161739349365234, "global_step": 151897, "epoch": 1255} {"train_loss": -38.114437103271484, "global_step": 151898, "epoch": 1255} {"train_loss": -39.73027420043945, "global_step": 151899, "epoch": 1255} {"train_loss": -39.0434455871582, "global_step": 151900, "epoch": 1255} {"train_loss": -38.28220748901367, "global_step": 151901, "epoch": 1255} {"train_loss": -39.376800537109375, "global_step": 151902, "epoch": 1255} {"train_loss": -40.2353515625, "global_step": 151903, "epoch": 1255} {"train_loss": -38.858680725097656, "global_step": 151904, "epoch": 1255} {"train_loss": -39.47518539428711, "global_step": 151905, "epoch": 1255} {"train_loss": -39.36537551879883, "global_step": 151906, "epoch": 1255} {"train_loss": -39.70601272583008, "global_step": 151907, "epoch": 1255} {"train_loss": -39.59230041503906, "global_step": 151908, "epoch": 1255} {"train_loss": -39.318233489990234, "global_step": 151909, "epoch": 1255} {"train_loss": -38.43391036987305, "global_step": 151910, "epoch": 1255} {"train_loss": -40.32314682006836, "global_step": 151911, "epoch": 1255} {"train_loss": -38.412532806396484, "global_step": 151912, "epoch": 1255} {"train_loss": -37.647193908691406, "global_step": 151913, "epoch": 1255} {"train_loss": -38.821014404296875, "global_step": 151914, "epoch": 1255} {"train_loss": -38.9031982421875, "global_step": 151915, "epoch": 1255} {"train_loss": -38.82967758178711, "global_step": 151916, "epoch": 1255} {"train_loss": -38.23226547241211, "global_step": 151917, "epoch": 1255} {"train_loss": -39.09104537963867, "global_step": 151918, "epoch": 1255} {"train_loss": -39.787227630615234, "global_step": 151919, "epoch": 1255} {"train_loss": -39.933319091796875, "global_step": 151920, "epoch": 1255} {"train_loss": -39.139896392822266, "global_step": 151921, "epoch": 1255} {"train_loss": -39.23829650878906, "global_step": 151922, "epoch": 1255} {"train_loss": -38.911495208740234, "global_step": 151923, "epoch": 1255} {"train_loss": -39.04805374145508, "global_step": 151924, "epoch": 1255} {"train_loss": -39.779518127441406, "global_step": 151925, "epoch": 1255} {"train_loss": -39.53056335449219, "global_step": 151926, "epoch": 1255} {"train_loss": -39.582305908203125, "global_step": 151927, "epoch": 1255} {"train_loss": -39.807159423828125, "global_step": 151928, "epoch": 1255} {"train_loss": -39.90800094604492, "global_step": 151929, "epoch": 1255} {"train_loss": -40.4227180480957, "global_step": 151930, "epoch": 1255} {"train_loss": -39.78978729248047, "global_step": 151931, "epoch": 1255} {"train_loss": -40.65707015991211, "global_step": 151932, "epoch": 1255} {"train_loss": -39.79008865356445, "global_step": 151933, "epoch": 1255} {"train_loss": -40.76847839355469, "global_step": 151934, "epoch": 1255} {"train_loss": -40.35905075073242, "global_step": 151935, "epoch": 1255} {"train_loss": -39.72520065307617, "global_step": 151936, "epoch": 1255} {"train_loss": -40.463172912597656, "global_step": 151937, "epoch": 1255} {"train_loss": -39.964595794677734, "global_step": 151938, "epoch": 1255} {"train_loss": -40.8611946105957, "global_step": 151939, "epoch": 1255} {"train_loss": -40.46514892578125, "global_step": 151940, "epoch": 1255} {"train_loss": -41.06867218017578, "global_step": 151941, "epoch": 1255} {"train_loss": -40.951332092285156, "global_step": 151942, "epoch": 1255} {"train_loss": -40.61463165283203, "global_step": 151943, "epoch": 1255} {"train_loss": -40.54951858520508, "global_step": 151944, "epoch": 1255} {"train_loss": -41.23857116699219, "global_step": 151945, "epoch": 1255} {"train_loss": -40.80726623535156, "global_step": 151946, "epoch": 1255} {"train_loss": -40.25173568725586, "global_step": 151947, "epoch": 1255} {"train_loss": -38.27444076538086, "global_step": 151948, "epoch": 1255} {"train_loss": -40.78426742553711, "global_step": 151949, "epoch": 1255} {"train_loss": -39.58148956298828, "global_step": 151950, "epoch": 1255} {"train_loss": -39.93840408325195, "global_step": 151951, "epoch": 1255} {"train_loss": -40.22980880737305, "global_step": 151952, "epoch": 1255} {"train_loss": -39.45681381225586, "global_step": 151953, "epoch": 1255} {"train_loss": -39.30947494506836, "global_step": 151954, "epoch": 1255} {"train_loss": -40.04911422729492, "global_step": 151955, "epoch": 1255} {"train_loss": -40.052398681640625, "global_step": 151956, "epoch": 1255} {"train_loss": -38.862300872802734, "global_step": 151957, "epoch": 1255} {"train_loss": -40.681190490722656, "global_step": 151958, "epoch": 1255} {"train_loss": -39.699398040771484, "global_step": 151959, "epoch": 1255} {"train_loss": -39.74193572998047, "global_step": 151960, "epoch": 1255} {"train_loss": -39.345794677734375, "global_step": 151961, "epoch": 1255} {"train_loss": -37.5399055480957, "global_step": 151962, "epoch": 1255} {"train_loss": -39.035606384277344, "global_step": 151963, "epoch": 1255} {"train_loss": -38.269039154052734, "global_step": 151964, "epoch": 1255} {"train_loss": -36.75812911987305, "global_step": 151965, "epoch": 1255} {"train_loss": -35.6177864074707, "global_step": 151966, "epoch": 1255} {"train_loss": -36.5031852722168, "global_step": 151967, "epoch": 1255} {"train_loss": -36.52378463745117, "global_step": 151968, "epoch": 1255} {"train_loss": -38.446502685546875, "global_step": 151969, "epoch": 1255} {"train_loss": -39.51353073120117, "global_step": 151970, "epoch": 1255} {"train_loss": -39.869388580322266, "global_step": 151971, "epoch": 1255} {"train_loss": -39.513153076171875, "global_step": 151972, "epoch": 1255} {"train_loss": -39.86884689331055, "global_step": 151973, "epoch": 1255} {"train_loss": -39.66189193725586, "global_step": 151974, "epoch": 1255} {"train_loss": -39.64417613636363, "global_step": 151975, "epoch": 1255, "val_loss": 2744834.75} {"train_loss": -39.72602462768555, "global_step": 151976, "epoch": 1256} {"train_loss": -40.03003692626953, "global_step": 151977, "epoch": 1256} {"train_loss": -39.91831588745117, "global_step": 151978, "epoch": 1256} {"train_loss": -39.4869384765625, "global_step": 151979, "epoch": 1256} {"train_loss": -39.17183303833008, "global_step": 151980, "epoch": 1256} {"train_loss": -40.0064582824707, "global_step": 151981, "epoch": 1256} {"train_loss": -39.753658294677734, "global_step": 151982, "epoch": 1256} {"train_loss": -38.647823333740234, "global_step": 151983, "epoch": 1256} {"train_loss": -39.83476638793945, "global_step": 151984, "epoch": 1256} {"train_loss": -40.197628021240234, "global_step": 151985, "epoch": 1256} {"train_loss": -40.06726837158203, "global_step": 151986, "epoch": 1256} {"train_loss": -40.37729263305664, "global_step": 151987, "epoch": 1256} {"train_loss": -40.4749755859375, "global_step": 151988, "epoch": 1256} {"train_loss": -40.129268646240234, "global_step": 151989, "epoch": 1256} {"train_loss": -40.35460662841797, "global_step": 151990, "epoch": 1256} {"train_loss": -39.39541244506836, "global_step": 151991, "epoch": 1256} {"train_loss": -40.54981231689453, "global_step": 151992, "epoch": 1256} {"train_loss": -40.10329818725586, "global_step": 151993, "epoch": 1256} {"train_loss": -40.24306869506836, "global_step": 151994, "epoch": 1256} {"train_loss": -40.37374496459961, "global_step": 151995, "epoch": 1256} {"train_loss": -40.051090240478516, "global_step": 151996, "epoch": 1256} {"train_loss": -40.69881820678711, "global_step": 151997, "epoch": 1256} {"train_loss": -40.865272521972656, "global_step": 151998, "epoch": 1256} {"train_loss": -40.35236740112305, "global_step": 151999, "epoch": 1256} {"train_loss": -40.97042465209961, "global_step": 152000, "epoch": 1256} {"train_loss": -40.80501174926758, "global_step": 152001, "epoch": 1256} {"train_loss": -40.63386535644531, "global_step": 152002, "epoch": 1256} {"train_loss": -41.00328826904297, "global_step": 152003, "epoch": 1256} {"train_loss": -40.06537628173828, "global_step": 152004, "epoch": 1256} {"train_loss": -41.221004486083984, "global_step": 152005, "epoch": 1256} {"train_loss": -41.21794891357422, "global_step": 152006, "epoch": 1256} {"train_loss": -41.06851577758789, "global_step": 152007, "epoch": 1256} {"train_loss": -41.02926254272461, "global_step": 152008, "epoch": 1256} {"train_loss": -39.8267822265625, "global_step": 152009, "epoch": 1256} {"train_loss": -41.365211486816406, "global_step": 152010, "epoch": 1256} {"train_loss": -40.71018600463867, "global_step": 152011, "epoch": 1256} {"train_loss": -39.92203903198242, "global_step": 152012, "epoch": 1256} {"train_loss": -40.23093795776367, "global_step": 152013, "epoch": 1256} {"train_loss": -40.150814056396484, "global_step": 152014, "epoch": 1256} {"train_loss": -40.8271598815918, "global_step": 152015, "epoch": 1256} {"train_loss": -40.46358871459961, "global_step": 152016, "epoch": 1256} {"train_loss": -40.39894485473633, "global_step": 152017, "epoch": 1256} {"train_loss": -40.342159271240234, "global_step": 152018, "epoch": 1256} {"train_loss": -40.29600143432617, "global_step": 152019, "epoch": 1256} {"train_loss": -40.85074234008789, "global_step": 152020, "epoch": 1256} {"train_loss": -39.5966682434082, "global_step": 152021, "epoch": 1256} {"train_loss": -38.47954177856445, "global_step": 152022, "epoch": 1256} {"train_loss": -37.7492790222168, "global_step": 152023, "epoch": 1256} {"train_loss": -38.65862274169922, "global_step": 152024, "epoch": 1256} {"train_loss": -40.35142135620117, "global_step": 152025, "epoch": 1256} {"train_loss": -40.13542938232422, "global_step": 152026, "epoch": 1256} {"train_loss": -40.072628021240234, "global_step": 152027, "epoch": 1256} {"train_loss": -34.84082794189453, "global_step": 152028, "epoch": 1256} {"train_loss": -39.29610824584961, "global_step": 152029, "epoch": 1256} {"train_loss": -40.09187698364258, "global_step": 152030, "epoch": 1256} {"train_loss": -39.09238815307617, "global_step": 152031, "epoch": 1256} {"train_loss": -37.99971008300781, "global_step": 152032, "epoch": 1256} {"train_loss": -38.53965377807617, "global_step": 152033, "epoch": 1256} {"train_loss": -38.11126708984375, "global_step": 152034, "epoch": 1256} {"train_loss": -35.12189483642578, "global_step": 152035, "epoch": 1256} {"train_loss": -39.815650939941406, "global_step": 152036, "epoch": 1256} {"train_loss": -36.85814666748047, "global_step": 152037, "epoch": 1256} {"train_loss": -38.71293258666992, "global_step": 152038, "epoch": 1256} {"train_loss": -38.79579544067383, "global_step": 152039, "epoch": 1256} {"train_loss": -39.22257614135742, "global_step": 152040, "epoch": 1256} {"train_loss": -39.701934814453125, "global_step": 152041, "epoch": 1256} {"train_loss": -39.10051345825195, "global_step": 152042, "epoch": 1256} {"train_loss": -40.07033157348633, "global_step": 152043, "epoch": 1256} {"train_loss": -39.25993728637695, "global_step": 152044, "epoch": 1256} {"train_loss": -39.68941879272461, "global_step": 152045, "epoch": 1256} {"train_loss": -39.76027297973633, "global_step": 152046, "epoch": 1256} {"train_loss": -40.12617492675781, "global_step": 152047, "epoch": 1256} {"train_loss": -39.2982063293457, "global_step": 152048, "epoch": 1256} {"train_loss": -40.18315887451172, "global_step": 152049, "epoch": 1256} {"train_loss": -40.09879684448242, "global_step": 152050, "epoch": 1256} {"train_loss": -39.511226654052734, "global_step": 152051, "epoch": 1256} {"train_loss": -39.6243782043457, "global_step": 152052, "epoch": 1256} {"train_loss": -39.48040771484375, "global_step": 152053, "epoch": 1256} {"train_loss": -40.207916259765625, "global_step": 152054, "epoch": 1256} {"train_loss": -39.151737213134766, "global_step": 152055, "epoch": 1256} {"train_loss": -38.79670333862305, "global_step": 152056, "epoch": 1256} {"train_loss": -39.31605911254883, "global_step": 152057, "epoch": 1256} {"train_loss": -38.989356994628906, "global_step": 152058, "epoch": 1256} {"train_loss": -40.25555419921875, "global_step": 152059, "epoch": 1256} {"train_loss": -38.30159378051758, "global_step": 152060, "epoch": 1256} {"train_loss": -38.16300582885742, "global_step": 152061, "epoch": 1256} {"train_loss": -40.415340423583984, "global_step": 152062, "epoch": 1256} {"train_loss": -39.72713088989258, "global_step": 152063, "epoch": 1256} {"train_loss": -40.371089935302734, "global_step": 152064, "epoch": 1256} {"train_loss": -40.32612609863281, "global_step": 152065, "epoch": 1256} {"train_loss": -38.327388763427734, "global_step": 152066, "epoch": 1256} {"train_loss": -39.71895217895508, "global_step": 152067, "epoch": 1256} {"train_loss": -40.205848693847656, "global_step": 152068, "epoch": 1256} {"train_loss": -38.87876510620117, "global_step": 152069, "epoch": 1256} {"train_loss": -39.863285064697266, "global_step": 152070, "epoch": 1256} {"train_loss": -40.053951263427734, "global_step": 152071, "epoch": 1256} {"train_loss": -39.63779830932617, "global_step": 152072, "epoch": 1256} {"train_loss": -38.882080078125, "global_step": 152073, "epoch": 1256} {"train_loss": -40.166725158691406, "global_step": 152074, "epoch": 1256} {"train_loss": -39.130245208740234, "global_step": 152075, "epoch": 1256} {"train_loss": -40.333858489990234, "global_step": 152076, "epoch": 1256} {"train_loss": -39.251068115234375, "global_step": 152077, "epoch": 1256} {"train_loss": -40.252254486083984, "global_step": 152078, "epoch": 1256} {"train_loss": -39.92509841918945, "global_step": 152079, "epoch": 1256} {"train_loss": -40.00697326660156, "global_step": 152080, "epoch": 1256} {"train_loss": -39.682369232177734, "global_step": 152081, "epoch": 1256} {"train_loss": -39.32980728149414, "global_step": 152082, "epoch": 1256} {"train_loss": -39.501800537109375, "global_step": 152083, "epoch": 1256} {"train_loss": -39.80642318725586, "global_step": 152084, "epoch": 1256} {"train_loss": -40.19219970703125, "global_step": 152085, "epoch": 1256} {"train_loss": -40.38831329345703, "global_step": 152086, "epoch": 1256} {"train_loss": -39.440670013427734, "global_step": 152087, "epoch": 1256} {"train_loss": -40.27386474609375, "global_step": 152088, "epoch": 1256} {"train_loss": -39.241790771484375, "global_step": 152089, "epoch": 1256} {"train_loss": -39.90156173706055, "global_step": 152090, "epoch": 1256} {"train_loss": -40.24593734741211, "global_step": 152091, "epoch": 1256} {"train_loss": -40.119483947753906, "global_step": 152092, "epoch": 1256} {"train_loss": -40.339359283447266, "global_step": 152093, "epoch": 1256} {"train_loss": -39.523799896240234, "global_step": 152094, "epoch": 1256} {"train_loss": -37.852020263671875, "global_step": 152095, "epoch": 1256} {"train_loss": -39.719689802689985, "global_step": 152096, "epoch": 1256, "val_loss": 2956062.0} {"train_loss": -40.128360748291016, "global_step": 152097, "epoch": 1257} {"train_loss": -40.30756759643555, "global_step": 152098, "epoch": 1257} {"train_loss": -40.18931198120117, "global_step": 152099, "epoch": 1257} {"train_loss": -38.40067672729492, "global_step": 152100, "epoch": 1257} {"train_loss": -38.64212417602539, "global_step": 152101, "epoch": 1257} {"train_loss": -40.054351806640625, "global_step": 152102, "epoch": 1257} {"train_loss": -39.40780258178711, "global_step": 152103, "epoch": 1257} {"train_loss": -40.2606315612793, "global_step": 152104, "epoch": 1257} {"train_loss": -39.97687530517578, "global_step": 152105, "epoch": 1257} {"train_loss": -39.46944808959961, "global_step": 152106, "epoch": 1257} {"train_loss": -40.001914978027344, "global_step": 152107, "epoch": 1257} {"train_loss": -39.327972412109375, "global_step": 152108, "epoch": 1257} {"train_loss": -40.74665069580078, "global_step": 152109, "epoch": 1257} {"train_loss": -38.97101974487305, "global_step": 152110, "epoch": 1257} {"train_loss": -38.463069915771484, "global_step": 152111, "epoch": 1257} {"train_loss": -39.07725143432617, "global_step": 152112, "epoch": 1257} {"train_loss": -38.76699447631836, "global_step": 152113, "epoch": 1257} {"train_loss": -37.727622985839844, "global_step": 152114, "epoch": 1257} {"train_loss": -39.76341247558594, "global_step": 152115, "epoch": 1257} {"train_loss": -38.8648796081543, "global_step": 152116, "epoch": 1257} {"train_loss": -39.903968811035156, "global_step": 152117, "epoch": 1257} {"train_loss": -38.01816940307617, "global_step": 152118, "epoch": 1257} {"train_loss": -36.83634567260742, "global_step": 152119, "epoch": 1257} {"train_loss": -39.19210433959961, "global_step": 152120, "epoch": 1257} {"train_loss": -39.16254425048828, "global_step": 152121, "epoch": 1257} {"train_loss": -33.41626739501953, "global_step": 152122, "epoch": 1257} {"train_loss": -37.544986724853516, "global_step": 152123, "epoch": 1257} {"train_loss": -39.3002815246582, "global_step": 152124, "epoch": 1257} {"train_loss": -37.615333557128906, "global_step": 152125, "epoch": 1257} {"train_loss": -36.064388275146484, "global_step": 152126, "epoch": 1257} {"train_loss": -37.52548599243164, "global_step": 152127, "epoch": 1257} {"train_loss": -37.91537094116211, "global_step": 152128, "epoch": 1257} {"train_loss": -39.1235466003418, "global_step": 152129, "epoch": 1257} {"train_loss": -38.874481201171875, "global_step": 152130, "epoch": 1257} {"train_loss": -39.33070755004883, "global_step": 152131, "epoch": 1257} {"train_loss": -37.93061447143555, "global_step": 152132, "epoch": 1257} {"train_loss": -38.82855987548828, "global_step": 152133, "epoch": 1257} {"train_loss": -39.42161178588867, "global_step": 152134, "epoch": 1257} {"train_loss": -39.342308044433594, "global_step": 152135, "epoch": 1257} {"train_loss": -34.274871826171875, "global_step": 152136, "epoch": 1257} {"train_loss": -38.54140853881836, "global_step": 152137, "epoch": 1257} {"train_loss": -39.557891845703125, "global_step": 152138, "epoch": 1257} {"train_loss": -38.16926956176758, "global_step": 152139, "epoch": 1257} {"train_loss": -38.83173751831055, "global_step": 152140, "epoch": 1257} {"train_loss": -38.37474060058594, "global_step": 152141, "epoch": 1257} {"train_loss": -39.799190521240234, "global_step": 152142, "epoch": 1257} {"train_loss": -38.24213790893555, "global_step": 152143, "epoch": 1257} {"train_loss": -38.93696212768555, "global_step": 152144, "epoch": 1257} {"train_loss": -38.05331039428711, "global_step": 152145, "epoch": 1257} {"train_loss": -38.213897705078125, "global_step": 152146, "epoch": 1257} {"train_loss": -38.545440673828125, "global_step": 152147, "epoch": 1257} {"train_loss": -39.03127670288086, "global_step": 152148, "epoch": 1257} {"train_loss": -39.46198654174805, "global_step": 152149, "epoch": 1257} {"train_loss": -39.67176055908203, "global_step": 152150, "epoch": 1257} {"train_loss": -39.82170867919922, "global_step": 152151, "epoch": 1257} {"train_loss": -38.776702880859375, "global_step": 152152, "epoch": 1257} {"train_loss": -39.97146987915039, "global_step": 152153, "epoch": 1257} {"train_loss": -39.115516662597656, "global_step": 152154, "epoch": 1257} {"train_loss": -39.43711471557617, "global_step": 152155, "epoch": 1257} {"train_loss": -39.46517562866211, "global_step": 152156, "epoch": 1257} {"train_loss": -39.93035888671875, "global_step": 152157, "epoch": 1257} {"train_loss": -39.42148208618164, "global_step": 152158, "epoch": 1257} {"train_loss": -39.93352508544922, "global_step": 152159, "epoch": 1257} {"train_loss": -40.41559600830078, "global_step": 152160, "epoch": 1257} {"train_loss": -39.516841888427734, "global_step": 152161, "epoch": 1257} {"train_loss": -40.19044494628906, "global_step": 152162, "epoch": 1257} {"train_loss": -40.18355941772461, "global_step": 152163, "epoch": 1257} {"train_loss": -39.30683517456055, "global_step": 152164, "epoch": 1257} {"train_loss": -39.45390319824219, "global_step": 152165, "epoch": 1257} {"train_loss": -39.3126335144043, "global_step": 152166, "epoch": 1257} {"train_loss": -39.464515686035156, "global_step": 152167, "epoch": 1257} {"train_loss": -40.10601806640625, "global_step": 152168, "epoch": 1257} {"train_loss": -40.39889144897461, "global_step": 152169, "epoch": 1257} {"train_loss": -40.4610710144043, "global_step": 152170, "epoch": 1257} {"train_loss": -39.965553283691406, "global_step": 152171, "epoch": 1257} {"train_loss": -40.3068962097168, "global_step": 152172, "epoch": 1257} {"train_loss": -40.23041915893555, "global_step": 152173, "epoch": 1257} {"train_loss": -40.1370964050293, "global_step": 152174, "epoch": 1257} {"train_loss": -40.21832275390625, "global_step": 152175, "epoch": 1257} {"train_loss": -40.58258819580078, "global_step": 152176, "epoch": 1257} {"train_loss": -39.131282806396484, "global_step": 152177, "epoch": 1257} {"train_loss": -37.44856643676758, "global_step": 152178, "epoch": 1257} {"train_loss": -33.420021057128906, "global_step": 152179, "epoch": 1257} {"train_loss": -33.801204681396484, "global_step": 152180, "epoch": 1257} {"train_loss": -37.263301849365234, "global_step": 152181, "epoch": 1257} {"train_loss": -38.133033752441406, "global_step": 152182, "epoch": 1257} {"train_loss": -35.952178955078125, "global_step": 152183, "epoch": 1257} {"train_loss": -37.420745849609375, "global_step": 152184, "epoch": 1257} {"train_loss": -40.52714157104492, "global_step": 152185, "epoch": 1257} {"train_loss": -38.34184646606445, "global_step": 152186, "epoch": 1257} {"train_loss": -37.227210998535156, "global_step": 152187, "epoch": 1257} {"train_loss": -37.04863357543945, "global_step": 152188, "epoch": 1257} {"train_loss": -39.72990798950195, "global_step": 152189, "epoch": 1257} {"train_loss": -38.85470199584961, "global_step": 152190, "epoch": 1257} {"train_loss": -37.25434494018555, "global_step": 152191, "epoch": 1257} {"train_loss": -38.39693832397461, "global_step": 152192, "epoch": 1257} {"train_loss": -40.12567901611328, "global_step": 152193, "epoch": 1257} {"train_loss": -38.93124008178711, "global_step": 152194, "epoch": 1257} {"train_loss": -39.36349105834961, "global_step": 152195, "epoch": 1257} {"train_loss": -39.50779342651367, "global_step": 152196, "epoch": 1257} {"train_loss": -39.95463180541992, "global_step": 152197, "epoch": 1257} {"train_loss": -39.476505279541016, "global_step": 152198, "epoch": 1257} {"train_loss": -37.540740966796875, "global_step": 152199, "epoch": 1257} {"train_loss": -39.78852462768555, "global_step": 152200, "epoch": 1257} {"train_loss": -38.682594299316406, "global_step": 152201, "epoch": 1257} {"train_loss": -39.59088134765625, "global_step": 152202, "epoch": 1257} {"train_loss": -39.929595947265625, "global_step": 152203, "epoch": 1257} {"train_loss": -39.697383880615234, "global_step": 152204, "epoch": 1257} {"train_loss": -40.691593170166016, "global_step": 152205, "epoch": 1257} {"train_loss": -40.260929107666016, "global_step": 152206, "epoch": 1257} {"train_loss": -40.66041946411133, "global_step": 152207, "epoch": 1257} {"train_loss": -39.762203216552734, "global_step": 152208, "epoch": 1257} {"train_loss": -40.71623611450195, "global_step": 152209, "epoch": 1257} {"train_loss": -39.520423889160156, "global_step": 152210, "epoch": 1257} {"train_loss": -40.64836883544922, "global_step": 152211, "epoch": 1257} {"train_loss": -40.287933349609375, "global_step": 152212, "epoch": 1257} {"train_loss": -40.471797943115234, "global_step": 152213, "epoch": 1257} {"train_loss": -39.931148529052734, "global_step": 152214, "epoch": 1257} {"train_loss": -38.921424865722656, "global_step": 152215, "epoch": 1257} {"train_loss": -40.127906799316406, "global_step": 152216, "epoch": 1257} {"train_loss": -39.01566188591571, "global_step": 152217, "epoch": 1257, "val_loss": 2700167.25} {"train_loss": -40.169281005859375, "global_step": 152218, "epoch": 1258} {"train_loss": -40.1347541809082, "global_step": 152219, "epoch": 1258} {"train_loss": -40.4354362487793, "global_step": 152220, "epoch": 1258} {"train_loss": -38.92366409301758, "global_step": 152221, "epoch": 1258} {"train_loss": -40.436702728271484, "global_step": 152222, "epoch": 1258} {"train_loss": -40.26146697998047, "global_step": 152223, "epoch": 1258} {"train_loss": -40.42728805541992, "global_step": 152224, "epoch": 1258} {"train_loss": -39.409088134765625, "global_step": 152225, "epoch": 1258} {"train_loss": -41.011451721191406, "global_step": 152226, "epoch": 1258} {"train_loss": -40.581268310546875, "global_step": 152227, "epoch": 1258} {"train_loss": -40.54445266723633, "global_step": 152228, "epoch": 1258} {"train_loss": -40.77558517456055, "global_step": 152229, "epoch": 1258} {"train_loss": -40.09634017944336, "global_step": 152230, "epoch": 1258} {"train_loss": -38.70000076293945, "global_step": 152231, "epoch": 1258} {"train_loss": -38.83002853393555, "global_step": 152232, "epoch": 1258} {"train_loss": -38.38163375854492, "global_step": 152233, "epoch": 1258} {"train_loss": -38.829803466796875, "global_step": 152234, "epoch": 1258} {"train_loss": -40.028079986572266, "global_step": 152235, "epoch": 1258} {"train_loss": -40.10169982910156, "global_step": 152236, "epoch": 1258} {"train_loss": -40.338890075683594, "global_step": 152237, "epoch": 1258} {"train_loss": -40.340641021728516, "global_step": 152238, "epoch": 1258} {"train_loss": -40.48065185546875, "global_step": 152239, "epoch": 1258} {"train_loss": -40.45487594604492, "global_step": 152240, "epoch": 1258} {"train_loss": -39.47254180908203, "global_step": 152241, "epoch": 1258} {"train_loss": -40.04606246948242, "global_step": 152242, "epoch": 1258} {"train_loss": -40.505104064941406, "global_step": 152243, "epoch": 1258} {"train_loss": -40.42380905151367, "global_step": 152244, "epoch": 1258} {"train_loss": -40.07424545288086, "global_step": 152245, "epoch": 1258} {"train_loss": -40.81642532348633, "global_step": 152246, "epoch": 1258} {"train_loss": -40.51447296142578, "global_step": 152247, "epoch": 1258} {"train_loss": -40.42879867553711, "global_step": 152248, "epoch": 1258} {"train_loss": -40.33711624145508, "global_step": 152249, "epoch": 1258} {"train_loss": -40.815093994140625, "global_step": 152250, "epoch": 1258} {"train_loss": -40.54731369018555, "global_step": 152251, "epoch": 1258} {"train_loss": -40.73734664916992, "global_step": 152252, "epoch": 1258} {"train_loss": -40.05210494995117, "global_step": 152253, "epoch": 1258} {"train_loss": -40.96358108520508, "global_step": 152254, "epoch": 1258} {"train_loss": -40.04254150390625, "global_step": 152255, "epoch": 1258} {"train_loss": -39.65544891357422, "global_step": 152256, "epoch": 1258} {"train_loss": -40.23969268798828, "global_step": 152257, "epoch": 1258} {"train_loss": -39.539730072021484, "global_step": 152258, "epoch": 1258} {"train_loss": -39.97762680053711, "global_step": 152259, "epoch": 1258} {"train_loss": -39.7940673828125, "global_step": 152260, "epoch": 1258} {"train_loss": -39.88532638549805, "global_step": 152261, "epoch": 1258} {"train_loss": -40.821205139160156, "global_step": 152262, "epoch": 1258} {"train_loss": -39.376983642578125, "global_step": 152263, "epoch": 1258} {"train_loss": -40.9383659362793, "global_step": 152264, "epoch": 1258} {"train_loss": -40.245967864990234, "global_step": 152265, "epoch": 1258} {"train_loss": -39.344966888427734, "global_step": 152266, "epoch": 1258} {"train_loss": -38.118934631347656, "global_step": 152267, "epoch": 1258} {"train_loss": -37.84811019897461, "global_step": 152268, "epoch": 1258} {"train_loss": -38.20294189453125, "global_step": 152269, "epoch": 1258} {"train_loss": -39.57989501953125, "global_step": 152270, "epoch": 1258} {"train_loss": -39.955718994140625, "global_step": 152271, "epoch": 1258} {"train_loss": -39.14435958862305, "global_step": 152272, "epoch": 1258} {"train_loss": -39.74879455566406, "global_step": 152273, "epoch": 1258} {"train_loss": -39.082855224609375, "global_step": 152274, "epoch": 1258} {"train_loss": -39.9488525390625, "global_step": 152275, "epoch": 1258} {"train_loss": -38.687007904052734, "global_step": 152276, "epoch": 1258} {"train_loss": -40.0540771484375, "global_step": 152277, "epoch": 1258} {"train_loss": -37.76646041870117, "global_step": 152278, "epoch": 1258} {"train_loss": -38.3946647644043, "global_step": 152279, "epoch": 1258} {"train_loss": -39.998470306396484, "global_step": 152280, "epoch": 1258} {"train_loss": -40.622413635253906, "global_step": 152281, "epoch": 1258} {"train_loss": -38.66307830810547, "global_step": 152282, "epoch": 1258} {"train_loss": -40.60346603393555, "global_step": 152283, "epoch": 1258} {"train_loss": -39.65845489501953, "global_step": 152284, "epoch": 1258} {"train_loss": -36.096168518066406, "global_step": 152285, "epoch": 1258} {"train_loss": -38.76622009277344, "global_step": 152286, "epoch": 1258} {"train_loss": -39.46529769897461, "global_step": 152287, "epoch": 1258} {"train_loss": -38.983280181884766, "global_step": 152288, "epoch": 1258} {"train_loss": -37.77642059326172, "global_step": 152289, "epoch": 1258} {"train_loss": -36.658321380615234, "global_step": 152290, "epoch": 1258} {"train_loss": -39.239601135253906, "global_step": 152291, "epoch": 1258} {"train_loss": -38.23681640625, "global_step": 152292, "epoch": 1258} {"train_loss": -31.935855865478516, "global_step": 152293, "epoch": 1258} {"train_loss": -37.508522033691406, "global_step": 152294, "epoch": 1258} {"train_loss": -39.928035736083984, "global_step": 152295, "epoch": 1258} {"train_loss": -37.796688079833984, "global_step": 152296, "epoch": 1258} {"train_loss": -37.16004180908203, "global_step": 152297, "epoch": 1258} {"train_loss": -35.51716995239258, "global_step": 152298, "epoch": 1258} {"train_loss": -30.82500648498535, "global_step": 152299, "epoch": 1258} {"train_loss": -34.936920166015625, "global_step": 152300, "epoch": 1258} {"train_loss": -38.181575775146484, "global_step": 152301, "epoch": 1258} {"train_loss": -33.38736343383789, "global_step": 152302, "epoch": 1258} {"train_loss": -36.670711517333984, "global_step": 152303, "epoch": 1258} {"train_loss": -33.875484466552734, "global_step": 152304, "epoch": 1258} {"train_loss": -33.09669876098633, "global_step": 152305, "epoch": 1258} {"train_loss": -36.21479034423828, "global_step": 152306, "epoch": 1258} {"train_loss": -33.11104965209961, "global_step": 152307, "epoch": 1258} {"train_loss": -35.40388107299805, "global_step": 152308, "epoch": 1258} {"train_loss": -37.18050003051758, "global_step": 152309, "epoch": 1258} {"train_loss": -34.7955436706543, "global_step": 152310, "epoch": 1258} {"train_loss": -36.05258560180664, "global_step": 152311, "epoch": 1258} {"train_loss": -37.08401107788086, "global_step": 152312, "epoch": 1258} {"train_loss": -36.391902923583984, "global_step": 152313, "epoch": 1258} {"train_loss": -37.36326217651367, "global_step": 152314, "epoch": 1258} {"train_loss": -36.092403411865234, "global_step": 152315, "epoch": 1258} {"train_loss": -34.306060791015625, "global_step": 152316, "epoch": 1258} {"train_loss": -33.35517501831055, "global_step": 152317, "epoch": 1258} {"train_loss": -35.2144775390625, "global_step": 152318, "epoch": 1258} {"train_loss": -37.876556396484375, "global_step": 152319, "epoch": 1258} {"train_loss": -35.20355224609375, "global_step": 152320, "epoch": 1258} {"train_loss": -36.42771911621094, "global_step": 152321, "epoch": 1258} {"train_loss": -36.94641876220703, "global_step": 152322, "epoch": 1258} {"train_loss": -34.104591369628906, "global_step": 152323, "epoch": 1258} {"train_loss": -37.64985275268555, "global_step": 152324, "epoch": 1258} {"train_loss": -37.12322998046875, "global_step": 152325, "epoch": 1258} {"train_loss": -34.90889358520508, "global_step": 152326, "epoch": 1258} {"train_loss": -37.42633056640625, "global_step": 152327, "epoch": 1258} {"train_loss": -38.64922332763672, "global_step": 152328, "epoch": 1258} {"train_loss": -37.97390365600586, "global_step": 152329, "epoch": 1258} {"train_loss": -37.68496322631836, "global_step": 152330, "epoch": 1258} {"train_loss": -36.56584930419922, "global_step": 152331, "epoch": 1258} {"train_loss": -38.693077087402344, "global_step": 152332, "epoch": 1258} {"train_loss": -38.69131088256836, "global_step": 152333, "epoch": 1258} {"train_loss": -37.6741828918457, "global_step": 152334, "epoch": 1258} {"train_loss": -37.22884750366211, "global_step": 152335, "epoch": 1258} {"train_loss": -37.8582763671875, "global_step": 152336, "epoch": 1258} {"train_loss": -38.66032409667969, "global_step": 152337, "epoch": 1258} {"train_loss": -38.39469775680668, "global_step": 152338, "epoch": 1258, "val_loss": 2578704.25} {"train_loss": -35.944183349609375, "global_step": 152339, "epoch": 1259} {"train_loss": -38.88980484008789, "global_step": 152340, "epoch": 1259} {"train_loss": -38.32155990600586, "global_step": 152341, "epoch": 1259} {"train_loss": -38.03026580810547, "global_step": 152342, "epoch": 1259} {"train_loss": -38.659549713134766, "global_step": 152343, "epoch": 1259} {"train_loss": -38.46065902709961, "global_step": 152344, "epoch": 1259} {"train_loss": -38.18792724609375, "global_step": 152345, "epoch": 1259} {"train_loss": -38.30939865112305, "global_step": 152346, "epoch": 1259} {"train_loss": -39.43056869506836, "global_step": 152347, "epoch": 1259} {"train_loss": -39.05397415161133, "global_step": 152348, "epoch": 1259} {"train_loss": -38.86467361450195, "global_step": 152349, "epoch": 1259} {"train_loss": -38.70156478881836, "global_step": 152350, "epoch": 1259} {"train_loss": -39.1437873840332, "global_step": 152351, "epoch": 1259} {"train_loss": -39.39048385620117, "global_step": 152352, "epoch": 1259} {"train_loss": -38.865047454833984, "global_step": 152353, "epoch": 1259} {"train_loss": -39.39188766479492, "global_step": 152354, "epoch": 1259} {"train_loss": -39.04188919067383, "global_step": 152355, "epoch": 1259} {"train_loss": -38.116485595703125, "global_step": 152356, "epoch": 1259} {"train_loss": -39.239192962646484, "global_step": 152357, "epoch": 1259} {"train_loss": -38.97500991821289, "global_step": 152358, "epoch": 1259} {"train_loss": -39.75399398803711, "global_step": 152359, "epoch": 1259} {"train_loss": -39.17616653442383, "global_step": 152360, "epoch": 1259} {"train_loss": -37.99116134643555, "global_step": 152361, "epoch": 1259} {"train_loss": -39.47160720825195, "global_step": 152362, "epoch": 1259} {"train_loss": -38.89739990234375, "global_step": 152363, "epoch": 1259} {"train_loss": -39.5229606628418, "global_step": 152364, "epoch": 1259} {"train_loss": -39.31746292114258, "global_step": 152365, "epoch": 1259} {"train_loss": -38.909461975097656, "global_step": 152366, "epoch": 1259} {"train_loss": -39.68870162963867, "global_step": 152367, "epoch": 1259} {"train_loss": -39.72210693359375, "global_step": 152368, "epoch": 1259} {"train_loss": -39.230560302734375, "global_step": 152369, "epoch": 1259} {"train_loss": -39.971771240234375, "global_step": 152370, "epoch": 1259} {"train_loss": -39.62429428100586, "global_step": 152371, "epoch": 1259} {"train_loss": -39.26854705810547, "global_step": 152372, "epoch": 1259} {"train_loss": -39.77097702026367, "global_step": 152373, "epoch": 1259} {"train_loss": -39.62052536010742, "global_step": 152374, "epoch": 1259} {"train_loss": -40.08999252319336, "global_step": 152375, "epoch": 1259} {"train_loss": -39.73151779174805, "global_step": 152376, "epoch": 1259} {"train_loss": -39.776302337646484, "global_step": 152377, "epoch": 1259} {"train_loss": -40.09865188598633, "global_step": 152378, "epoch": 1259} {"train_loss": -39.29353332519531, "global_step": 152379, "epoch": 1259} {"train_loss": -39.516944885253906, "global_step": 152380, "epoch": 1259} {"train_loss": -38.930355072021484, "global_step": 152381, "epoch": 1259} {"train_loss": -39.39347839355469, "global_step": 152382, "epoch": 1259} {"train_loss": -39.08543014526367, "global_step": 152383, "epoch": 1259} {"train_loss": -38.715972900390625, "global_step": 152384, "epoch": 1259} {"train_loss": -39.608009338378906, "global_step": 152385, "epoch": 1259} {"train_loss": -38.848690032958984, "global_step": 152386, "epoch": 1259} {"train_loss": -38.885677337646484, "global_step": 152387, "epoch": 1259} {"train_loss": -39.64138412475586, "global_step": 152388, "epoch": 1259} {"train_loss": -38.64544677734375, "global_step": 152389, "epoch": 1259} {"train_loss": -37.16929244995117, "global_step": 152390, "epoch": 1259} {"train_loss": -37.73051834106445, "global_step": 152391, "epoch": 1259} {"train_loss": -38.59896469116211, "global_step": 152392, "epoch": 1259} {"train_loss": -40.214439392089844, "global_step": 152393, "epoch": 1259} {"train_loss": -39.11505889892578, "global_step": 152394, "epoch": 1259} {"train_loss": -36.893856048583984, "global_step": 152395, "epoch": 1259} {"train_loss": -34.42946243286133, "global_step": 152396, "epoch": 1259} {"train_loss": -31.614294052124023, "global_step": 152397, "epoch": 1259} {"train_loss": -33.66276168823242, "global_step": 152398, "epoch": 1259} {"train_loss": -31.75681495666504, "global_step": 152399, "epoch": 1259} {"train_loss": -28.222570419311523, "global_step": 152400, "epoch": 1259} {"train_loss": -19.17616844177246, "global_step": 152401, "epoch": 1259} {"train_loss": -22.264163970947266, "global_step": 152402, "epoch": 1259} {"train_loss": -39.468719482421875, "global_step": 152403, "epoch": 1259} {"train_loss": -22.636045455932617, "global_step": 152404, "epoch": 1259} {"train_loss": -37.079994201660156, "global_step": 152405, "epoch": 1259} {"train_loss": -32.31306076049805, "global_step": 152406, "epoch": 1259} {"train_loss": -36.35209274291992, "global_step": 152407, "epoch": 1259} {"train_loss": -32.78933334350586, "global_step": 152408, "epoch": 1259} {"train_loss": -36.39931106567383, "global_step": 152409, "epoch": 1259} {"train_loss": -34.41992950439453, "global_step": 152410, "epoch": 1259} {"train_loss": -38.39286804199219, "global_step": 152411, "epoch": 1259} {"train_loss": -34.766807556152344, "global_step": 152412, "epoch": 1259} {"train_loss": -37.623451232910156, "global_step": 152413, "epoch": 1259} {"train_loss": -37.85708999633789, "global_step": 152414, "epoch": 1259} {"train_loss": -37.00146484375, "global_step": 152415, "epoch": 1259} {"train_loss": -38.81435775756836, "global_step": 152416, "epoch": 1259} {"train_loss": -36.726688385009766, "global_step": 152417, "epoch": 1259} {"train_loss": -37.87835693359375, "global_step": 152418, "epoch": 1259} {"train_loss": -38.12437057495117, "global_step": 152419, "epoch": 1259} {"train_loss": -38.084632873535156, "global_step": 152420, "epoch": 1259} {"train_loss": -38.607051849365234, "global_step": 152421, "epoch": 1259} {"train_loss": -38.40570068359375, "global_step": 152422, "epoch": 1259} {"train_loss": -38.54604721069336, "global_step": 152423, "epoch": 1259} {"train_loss": -37.981292724609375, "global_step": 152424, "epoch": 1259} {"train_loss": -38.85188293457031, "global_step": 152425, "epoch": 1259} {"train_loss": -38.73802947998047, "global_step": 152426, "epoch": 1259} {"train_loss": -39.342830657958984, "global_step": 152427, "epoch": 1259} {"train_loss": -38.58666229248047, "global_step": 152428, "epoch": 1259} {"train_loss": -39.1054801940918, "global_step": 152429, "epoch": 1259} {"train_loss": -38.525054931640625, "global_step": 152430, "epoch": 1259} {"train_loss": -38.711944580078125, "global_step": 152431, "epoch": 1259} {"train_loss": -38.568241119384766, "global_step": 152432, "epoch": 1259} {"train_loss": -39.08299255371094, "global_step": 152433, "epoch": 1259} {"train_loss": -39.292388916015625, "global_step": 152434, "epoch": 1259} {"train_loss": -39.2624397277832, "global_step": 152435, "epoch": 1259} {"train_loss": -38.53036117553711, "global_step": 152436, "epoch": 1259} {"train_loss": -39.28235626220703, "global_step": 152437, "epoch": 1259} {"train_loss": -39.401302337646484, "global_step": 152438, "epoch": 1259} {"train_loss": -39.30017852783203, "global_step": 152439, "epoch": 1259} {"train_loss": -39.4084587097168, "global_step": 152440, "epoch": 1259} {"train_loss": -39.46426010131836, "global_step": 152441, "epoch": 1259} {"train_loss": -39.592586517333984, "global_step": 152442, "epoch": 1259} {"train_loss": -39.78606414794922, "global_step": 152443, "epoch": 1259} {"train_loss": -39.659278869628906, "global_step": 152444, "epoch": 1259} {"train_loss": -39.41453170776367, "global_step": 152445, "epoch": 1259} {"train_loss": -39.4006233215332, "global_step": 152446, "epoch": 1259} {"train_loss": -39.4218864440918, "global_step": 152447, "epoch": 1259} {"train_loss": -39.95553207397461, "global_step": 152448, "epoch": 1259} {"train_loss": -39.969871520996094, "global_step": 152449, "epoch": 1259} {"train_loss": -39.61387634277344, "global_step": 152450, "epoch": 1259} {"train_loss": -39.66262435913086, "global_step": 152451, "epoch": 1259} {"train_loss": -39.76035690307617, "global_step": 152452, "epoch": 1259} {"train_loss": -39.71748733520508, "global_step": 152453, "epoch": 1259} {"train_loss": -39.8173828125, "global_step": 152454, "epoch": 1259} {"train_loss": -40.179786682128906, "global_step": 152455, "epoch": 1259} {"train_loss": -39.859981536865234, "global_step": 152456, "epoch": 1259} {"train_loss": -39.57441329956055, "global_step": 152457, "epoch": 1259} {"train_loss": -39.82118225097656, "global_step": 152458, "epoch": 1259} {"train_loss": -38.04019888570486, "global_step": 152459, "epoch": 1259, "val_loss": 2661935.0} {"train_loss": -40.392723083496094, "global_step": 152460, "epoch": 1260} {"train_loss": -40.35422897338867, "global_step": 152461, "epoch": 1260} {"train_loss": -40.52639389038086, "global_step": 152462, "epoch": 1260} {"train_loss": -40.226654052734375, "global_step": 152463, "epoch": 1260} {"train_loss": -40.51820755004883, "global_step": 152464, "epoch": 1260} {"train_loss": -40.027278900146484, "global_step": 152465, "epoch": 1260} {"train_loss": -40.311134338378906, "global_step": 152466, "epoch": 1260} {"train_loss": -40.4716682434082, "global_step": 152467, "epoch": 1260} {"train_loss": -40.263702392578125, "global_step": 152468, "epoch": 1260} {"train_loss": -40.178951263427734, "global_step": 152469, "epoch": 1260} {"train_loss": -40.61194610595703, "global_step": 152470, "epoch": 1260} {"train_loss": -40.19468688964844, "global_step": 152471, "epoch": 1260} {"train_loss": -39.828739166259766, "global_step": 152472, "epoch": 1260} {"train_loss": -40.5946044921875, "global_step": 152473, "epoch": 1260} {"train_loss": -40.428096771240234, "global_step": 152474, "epoch": 1260} {"train_loss": -40.51823806762695, "global_step": 152475, "epoch": 1260} {"train_loss": -40.802913665771484, "global_step": 152476, "epoch": 1260} {"train_loss": -40.63037872314453, "global_step": 152477, "epoch": 1260} {"train_loss": -40.867774963378906, "global_step": 152478, "epoch": 1260} {"train_loss": -40.579444885253906, "global_step": 152479, "epoch": 1260} {"train_loss": -40.8492546081543, "global_step": 152480, "epoch": 1260} {"train_loss": -40.57835006713867, "global_step": 152481, "epoch": 1260} {"train_loss": -40.51283645629883, "global_step": 152482, "epoch": 1260} {"train_loss": -40.54301071166992, "global_step": 152483, "epoch": 1260} {"train_loss": -40.79158020019531, "global_step": 152484, "epoch": 1260} {"train_loss": -40.34698486328125, "global_step": 152485, "epoch": 1260} {"train_loss": -40.767608642578125, "global_step": 152486, "epoch": 1260} {"train_loss": -40.13529586791992, "global_step": 152487, "epoch": 1260} {"train_loss": -41.0404167175293, "global_step": 152488, "epoch": 1260} {"train_loss": -40.443641662597656, "global_step": 152489, "epoch": 1260} {"train_loss": -40.554256439208984, "global_step": 152490, "epoch": 1260} {"train_loss": -40.615169525146484, "global_step": 152491, "epoch": 1260} {"train_loss": -41.07310104370117, "global_step": 152492, "epoch": 1260} {"train_loss": -40.26377487182617, "global_step": 152493, "epoch": 1260} {"train_loss": -40.77001953125, "global_step": 152494, "epoch": 1260} {"train_loss": -41.070884704589844, "global_step": 152495, "epoch": 1260} {"train_loss": -41.01385498046875, "global_step": 152496, "epoch": 1260} {"train_loss": -41.06848907470703, "global_step": 152497, "epoch": 1260} {"train_loss": -40.80434036254883, "global_step": 152498, "epoch": 1260} {"train_loss": -40.86703109741211, "global_step": 152499, "epoch": 1260} {"train_loss": -39.975215911865234, "global_step": 152500, "epoch": 1260} {"train_loss": -40.58763122558594, "global_step": 152501, "epoch": 1260} {"train_loss": -38.21739959716797, "global_step": 152502, "epoch": 1260} {"train_loss": -33.441078186035156, "global_step": 152503, "epoch": 1260} {"train_loss": -27.430023193359375, "global_step": 152504, "epoch": 1260} {"train_loss": -23.19112205505371, "global_step": 152505, "epoch": 1260} {"train_loss": -29.852664947509766, "global_step": 152506, "epoch": 1260} {"train_loss": -40.35020065307617, "global_step": 152507, "epoch": 1260} {"train_loss": -31.527149200439453, "global_step": 152508, "epoch": 1260} {"train_loss": -28.770063400268555, "global_step": 152509, "epoch": 1260} {"train_loss": -39.333343505859375, "global_step": 152510, "epoch": 1260} {"train_loss": -30.127960205078125, "global_step": 152511, "epoch": 1260} {"train_loss": -38.51933288574219, "global_step": 152512, "epoch": 1260} {"train_loss": -30.808828353881836, "global_step": 152513, "epoch": 1260} {"train_loss": -39.11083221435547, "global_step": 152514, "epoch": 1260} {"train_loss": -31.29837989807129, "global_step": 152515, "epoch": 1260} {"train_loss": -38.781463623046875, "global_step": 152516, "epoch": 1260} {"train_loss": -36.531158447265625, "global_step": 152517, "epoch": 1260} {"train_loss": -35.46294403076172, "global_step": 152518, "epoch": 1260} {"train_loss": -38.44669723510742, "global_step": 152519, "epoch": 1260} {"train_loss": -37.090938568115234, "global_step": 152520, "epoch": 1260} {"train_loss": -36.96067810058594, "global_step": 152521, "epoch": 1260} {"train_loss": -38.657711029052734, "global_step": 152522, "epoch": 1260} {"train_loss": -38.86586380004883, "global_step": 152523, "epoch": 1260} {"train_loss": -37.9103889465332, "global_step": 152524, "epoch": 1260} {"train_loss": -38.4995231628418, "global_step": 152525, "epoch": 1260} {"train_loss": -39.58789825439453, "global_step": 152526, "epoch": 1260} {"train_loss": -39.86554718017578, "global_step": 152527, "epoch": 1260} {"train_loss": -38.70270919799805, "global_step": 152528, "epoch": 1260} {"train_loss": -39.21236801147461, "global_step": 152529, "epoch": 1260} {"train_loss": -39.469635009765625, "global_step": 152530, "epoch": 1260} {"train_loss": -39.64558029174805, "global_step": 152531, "epoch": 1260} {"train_loss": -39.49870300292969, "global_step": 152532, "epoch": 1260} {"train_loss": -38.556678771972656, "global_step": 152533, "epoch": 1260} {"train_loss": -40.05607223510742, "global_step": 152534, "epoch": 1260} {"train_loss": -39.87332534790039, "global_step": 152535, "epoch": 1260} {"train_loss": -39.63273239135742, "global_step": 152536, "epoch": 1260} {"train_loss": -39.25893020629883, "global_step": 152537, "epoch": 1260} {"train_loss": -39.95930862426758, "global_step": 152538, "epoch": 1260} {"train_loss": -40.256439208984375, "global_step": 152539, "epoch": 1260} {"train_loss": -40.344966888427734, "global_step": 152540, "epoch": 1260} {"train_loss": -40.52417755126953, "global_step": 152541, "epoch": 1260} {"train_loss": -39.75682830810547, "global_step": 152542, "epoch": 1260} {"train_loss": -40.139564514160156, "global_step": 152543, "epoch": 1260} {"train_loss": -40.425323486328125, "global_step": 152544, "epoch": 1260} {"train_loss": -39.73590850830078, "global_step": 152545, "epoch": 1260} {"train_loss": -40.03355026245117, "global_step": 152546, "epoch": 1260} {"train_loss": -40.64698028564453, "global_step": 152547, "epoch": 1260} {"train_loss": -40.313411712646484, "global_step": 152548, "epoch": 1260} {"train_loss": -40.76996612548828, "global_step": 152549, "epoch": 1260} {"train_loss": -40.11188888549805, "global_step": 152550, "epoch": 1260} {"train_loss": -40.65015411376953, "global_step": 152551, "epoch": 1260} {"train_loss": -40.664283752441406, "global_step": 152552, "epoch": 1260} {"train_loss": -40.61891555786133, "global_step": 152553, "epoch": 1260} {"train_loss": -40.594398498535156, "global_step": 152554, "epoch": 1260} {"train_loss": -40.469390869140625, "global_step": 152555, "epoch": 1260} {"train_loss": -40.313262939453125, "global_step": 152556, "epoch": 1260} {"train_loss": -40.16050338745117, "global_step": 152557, "epoch": 1260} {"train_loss": -40.651222229003906, "global_step": 152558, "epoch": 1260} {"train_loss": -40.498130798339844, "global_step": 152559, "epoch": 1260} {"train_loss": -40.68880081176758, "global_step": 152560, "epoch": 1260} {"train_loss": -40.568077087402344, "global_step": 152561, "epoch": 1260} {"train_loss": -40.50240707397461, "global_step": 152562, "epoch": 1260} {"train_loss": -40.83094024658203, "global_step": 152563, "epoch": 1260} {"train_loss": -40.50361251831055, "global_step": 152564, "epoch": 1260} {"train_loss": -40.65571212768555, "global_step": 152565, "epoch": 1260} {"train_loss": -40.827579498291016, "global_step": 152566, "epoch": 1260} {"train_loss": -41.14950180053711, "global_step": 152567, "epoch": 1260} {"train_loss": -40.267982482910156, "global_step": 152568, "epoch": 1260} {"train_loss": -40.68687057495117, "global_step": 152569, "epoch": 1260} {"train_loss": -40.585567474365234, "global_step": 152570, "epoch": 1260} {"train_loss": -40.946163177490234, "global_step": 152571, "epoch": 1260} {"train_loss": -40.9603157043457, "global_step": 152572, "epoch": 1260} {"train_loss": -41.2718391418457, "global_step": 152573, "epoch": 1260} {"train_loss": -40.7502555847168, "global_step": 152574, "epoch": 1260} {"train_loss": -40.176666259765625, "global_step": 152575, "epoch": 1260} {"train_loss": -40.6819953918457, "global_step": 152576, "epoch": 1260} {"train_loss": -40.30226516723633, "global_step": 152577, "epoch": 1260} {"train_loss": -39.736488342285156, "global_step": 152578, "epoch": 1260} {"train_loss": -38.558753967285156, "global_step": 152579, "epoch": 1260} {"train_loss": -39.27056664080659, "global_step": 152580, "epoch": 1260, "val_loss": 2686813.25} {"train_loss": -39.45512008666992, "global_step": 152581, "epoch": 1261} {"train_loss": -38.678260803222656, "global_step": 152582, "epoch": 1261} {"train_loss": -36.545230865478516, "global_step": 152583, "epoch": 1261} {"train_loss": -34.26979064941406, "global_step": 152584, "epoch": 1261} {"train_loss": -36.59273910522461, "global_step": 152585, "epoch": 1261} {"train_loss": -40.02555847167969, "global_step": 152586, "epoch": 1261} {"train_loss": -40.16425323486328, "global_step": 152587, "epoch": 1261} {"train_loss": -39.86689758300781, "global_step": 152588, "epoch": 1261} {"train_loss": -39.786651611328125, "global_step": 152589, "epoch": 1261} {"train_loss": -39.17977523803711, "global_step": 152590, "epoch": 1261} {"train_loss": -40.034461975097656, "global_step": 152591, "epoch": 1261} {"train_loss": -40.4686164855957, "global_step": 152592, "epoch": 1261} {"train_loss": -37.92932891845703, "global_step": 152593, "epoch": 1261} {"train_loss": -39.59855270385742, "global_step": 152594, "epoch": 1261} {"train_loss": -39.408077239990234, "global_step": 152595, "epoch": 1261} {"train_loss": -40.160888671875, "global_step": 152596, "epoch": 1261} {"train_loss": -40.519229888916016, "global_step": 152597, "epoch": 1261} {"train_loss": -40.450050354003906, "global_step": 152598, "epoch": 1261} {"train_loss": -40.440616607666016, "global_step": 152599, "epoch": 1261} {"train_loss": -39.733497619628906, "global_step": 152600, "epoch": 1261} {"train_loss": -40.509803771972656, "global_step": 152601, "epoch": 1261} {"train_loss": -40.198394775390625, "global_step": 152602, "epoch": 1261} {"train_loss": -40.96790313720703, "global_step": 152603, "epoch": 1261} {"train_loss": -39.92192459106445, "global_step": 152604, "epoch": 1261} {"train_loss": -40.322689056396484, "global_step": 152605, "epoch": 1261} {"train_loss": -40.30979919433594, "global_step": 152606, "epoch": 1261} {"train_loss": -40.604888916015625, "global_step": 152607, "epoch": 1261} {"train_loss": -40.572200775146484, "global_step": 152608, "epoch": 1261} {"train_loss": -41.03394317626953, "global_step": 152609, "epoch": 1261} {"train_loss": -40.94077682495117, "global_step": 152610, "epoch": 1261} {"train_loss": -40.813655853271484, "global_step": 152611, "epoch": 1261} {"train_loss": -40.01528549194336, "global_step": 152612, "epoch": 1261} {"train_loss": -40.64000701904297, "global_step": 152613, "epoch": 1261} {"train_loss": -40.823238372802734, "global_step": 152614, "epoch": 1261} {"train_loss": -41.110595703125, "global_step": 152615, "epoch": 1261} {"train_loss": -41.199073791503906, "global_step": 152616, "epoch": 1261} {"train_loss": -40.54037857055664, "global_step": 152617, "epoch": 1261} {"train_loss": -40.022674560546875, "global_step": 152618, "epoch": 1261} {"train_loss": -40.880916595458984, "global_step": 152619, "epoch": 1261} {"train_loss": -40.817684173583984, "global_step": 152620, "epoch": 1261} {"train_loss": -40.28046417236328, "global_step": 152621, "epoch": 1261} {"train_loss": -40.26768112182617, "global_step": 152622, "epoch": 1261} {"train_loss": -40.5744743347168, "global_step": 152623, "epoch": 1261} {"train_loss": -39.69977569580078, "global_step": 152624, "epoch": 1261} {"train_loss": -39.6723518371582, "global_step": 152625, "epoch": 1261} {"train_loss": -39.736793518066406, "global_step": 152626, "epoch": 1261} {"train_loss": -39.69089889526367, "global_step": 152627, "epoch": 1261} {"train_loss": -40.31696701049805, "global_step": 152628, "epoch": 1261} {"train_loss": -38.896148681640625, "global_step": 152629, "epoch": 1261} {"train_loss": -39.1626091003418, "global_step": 152630, "epoch": 1261} {"train_loss": -38.77815628051758, "global_step": 152631, "epoch": 1261} {"train_loss": -40.124488830566406, "global_step": 152632, "epoch": 1261} {"train_loss": -37.62953567504883, "global_step": 152633, "epoch": 1261} {"train_loss": -38.71920394897461, "global_step": 152634, "epoch": 1261} {"train_loss": -39.31515121459961, "global_step": 152635, "epoch": 1261} {"train_loss": -39.121803283691406, "global_step": 152636, "epoch": 1261} {"train_loss": -39.88698196411133, "global_step": 152637, "epoch": 1261} {"train_loss": -39.43050765991211, "global_step": 152638, "epoch": 1261} {"train_loss": -38.73011016845703, "global_step": 152639, "epoch": 1261} {"train_loss": -39.72896957397461, "global_step": 152640, "epoch": 1261} {"train_loss": -38.95134353637695, "global_step": 152641, "epoch": 1261} {"train_loss": -38.457637786865234, "global_step": 152642, "epoch": 1261} {"train_loss": -39.302154541015625, "global_step": 152643, "epoch": 1261} {"train_loss": -38.567073822021484, "global_step": 152644, "epoch": 1261} {"train_loss": -39.06782150268555, "global_step": 152645, "epoch": 1261} {"train_loss": -37.5515022277832, "global_step": 152646, "epoch": 1261} {"train_loss": -38.39223098754883, "global_step": 152647, "epoch": 1261} {"train_loss": -38.138492584228516, "global_step": 152648, "epoch": 1261} {"train_loss": -39.486289978027344, "global_step": 152649, "epoch": 1261} {"train_loss": -38.36431121826172, "global_step": 152650, "epoch": 1261} {"train_loss": -38.89084243774414, "global_step": 152651, "epoch": 1261} {"train_loss": -39.450294494628906, "global_step": 152652, "epoch": 1261} {"train_loss": -40.1807975769043, "global_step": 152653, "epoch": 1261} {"train_loss": -37.96982192993164, "global_step": 152654, "epoch": 1261} {"train_loss": -39.04621505737305, "global_step": 152655, "epoch": 1261} {"train_loss": -38.099456787109375, "global_step": 152656, "epoch": 1261} {"train_loss": -39.342647552490234, "global_step": 152657, "epoch": 1261} {"train_loss": -38.5722541809082, "global_step": 152658, "epoch": 1261} {"train_loss": -39.80954360961914, "global_step": 152659, "epoch": 1261} {"train_loss": -39.11579513549805, "global_step": 152660, "epoch": 1261} {"train_loss": -37.273536682128906, "global_step": 152661, "epoch": 1261} {"train_loss": -38.51334762573242, "global_step": 152662, "epoch": 1261} {"train_loss": -40.03902053833008, "global_step": 152663, "epoch": 1261} {"train_loss": -38.94969177246094, "global_step": 152664, "epoch": 1261} {"train_loss": -39.39490509033203, "global_step": 152665, "epoch": 1261} {"train_loss": -40.168338775634766, "global_step": 152666, "epoch": 1261} {"train_loss": -40.222572326660156, "global_step": 152667, "epoch": 1261} {"train_loss": -39.823944091796875, "global_step": 152668, "epoch": 1261} {"train_loss": -40.206085205078125, "global_step": 152669, "epoch": 1261} {"train_loss": -38.212947845458984, "global_step": 152670, "epoch": 1261} {"train_loss": -35.237789154052734, "global_step": 152671, "epoch": 1261} {"train_loss": -31.58603858947754, "global_step": 152672, "epoch": 1261} {"train_loss": -36.31418228149414, "global_step": 152673, "epoch": 1261} {"train_loss": -39.15614700317383, "global_step": 152674, "epoch": 1261} {"train_loss": -38.921531677246094, "global_step": 152675, "epoch": 1261} {"train_loss": -36.071712493896484, "global_step": 152676, "epoch": 1261} {"train_loss": -37.07218551635742, "global_step": 152677, "epoch": 1261} {"train_loss": -36.282386779785156, "global_step": 152678, "epoch": 1261} {"train_loss": -38.738624572753906, "global_step": 152679, "epoch": 1261} {"train_loss": -38.23466110229492, "global_step": 152680, "epoch": 1261} {"train_loss": -37.10355758666992, "global_step": 152681, "epoch": 1261} {"train_loss": -38.76101303100586, "global_step": 152682, "epoch": 1261} {"train_loss": -35.13098907470703, "global_step": 152683, "epoch": 1261} {"train_loss": -37.992244720458984, "global_step": 152684, "epoch": 1261} {"train_loss": -34.40940475463867, "global_step": 152685, "epoch": 1261} {"train_loss": -37.51081085205078, "global_step": 152686, "epoch": 1261} {"train_loss": -38.402313232421875, "global_step": 152687, "epoch": 1261} {"train_loss": -36.0156135559082, "global_step": 152688, "epoch": 1261} {"train_loss": -33.78278732299805, "global_step": 152689, "epoch": 1261} {"train_loss": -38.23775863647461, "global_step": 152690, "epoch": 1261} {"train_loss": -34.35807418823242, "global_step": 152691, "epoch": 1261} {"train_loss": -30.384052276611328, "global_step": 152692, "epoch": 1261} {"train_loss": -37.43355178833008, "global_step": 152693, "epoch": 1261} {"train_loss": -36.7623176574707, "global_step": 152694, "epoch": 1261} {"train_loss": -36.997650146484375, "global_step": 152695, "epoch": 1261} {"train_loss": -38.73542785644531, "global_step": 152696, "epoch": 1261} {"train_loss": -34.628082275390625, "global_step": 152697, "epoch": 1261} {"train_loss": -35.024452209472656, "global_step": 152698, "epoch": 1261} {"train_loss": -36.3573112487793, "global_step": 152699, "epoch": 1261} {"train_loss": -37.52643966674805, "global_step": 152700, "epoch": 1261} {"train_loss": -38.68706636980546, "global_step": 152701, "epoch": 1261, "val_loss": 2635700.75} {"train_loss": -37.01639175415039, "global_step": 152702, "epoch": 1262} {"train_loss": -38.874603271484375, "global_step": 152703, "epoch": 1262} {"train_loss": -36.43130874633789, "global_step": 152704, "epoch": 1262} {"train_loss": -37.876834869384766, "global_step": 152705, "epoch": 1262} {"train_loss": -35.76190185546875, "global_step": 152706, "epoch": 1262} {"train_loss": -37.4621696472168, "global_step": 152707, "epoch": 1262} {"train_loss": -37.07622528076172, "global_step": 152708, "epoch": 1262} {"train_loss": -34.94688415527344, "global_step": 152709, "epoch": 1262} {"train_loss": -35.90238571166992, "global_step": 152710, "epoch": 1262} {"train_loss": -36.055599212646484, "global_step": 152711, "epoch": 1262} {"train_loss": -38.27927780151367, "global_step": 152712, "epoch": 1262} {"train_loss": -38.691829681396484, "global_step": 152713, "epoch": 1262} {"train_loss": -38.11833572387695, "global_step": 152714, "epoch": 1262} {"train_loss": -35.26865005493164, "global_step": 152715, "epoch": 1262} {"train_loss": -38.29256057739258, "global_step": 152716, "epoch": 1262} {"train_loss": -37.0413818359375, "global_step": 152717, "epoch": 1262} {"train_loss": -39.39838790893555, "global_step": 152718, "epoch": 1262} {"train_loss": -37.99961471557617, "global_step": 152719, "epoch": 1262} {"train_loss": -36.206207275390625, "global_step": 152720, "epoch": 1262} {"train_loss": -38.7036018371582, "global_step": 152721, "epoch": 1262} {"train_loss": -38.35065460205078, "global_step": 152722, "epoch": 1262} {"train_loss": -38.695186614990234, "global_step": 152723, "epoch": 1262} {"train_loss": -37.37396240234375, "global_step": 152724, "epoch": 1262} {"train_loss": -37.42525863647461, "global_step": 152725, "epoch": 1262} {"train_loss": -39.29010772705078, "global_step": 152726, "epoch": 1262} {"train_loss": -39.02458572387695, "global_step": 152727, "epoch": 1262} {"train_loss": -37.652896881103516, "global_step": 152728, "epoch": 1262} {"train_loss": -39.51304244995117, "global_step": 152729, "epoch": 1262} {"train_loss": -39.205955505371094, "global_step": 152730, "epoch": 1262} {"train_loss": -38.95920944213867, "global_step": 152731, "epoch": 1262} {"train_loss": -39.494606018066406, "global_step": 152732, "epoch": 1262} {"train_loss": -38.95389938354492, "global_step": 152733, "epoch": 1262} {"train_loss": -39.56402587890625, "global_step": 152734, "epoch": 1262} {"train_loss": -39.7647705078125, "global_step": 152735, "epoch": 1262} {"train_loss": -39.456382751464844, "global_step": 152736, "epoch": 1262} {"train_loss": -39.33502197265625, "global_step": 152737, "epoch": 1262} {"train_loss": -39.31277847290039, "global_step": 152738, "epoch": 1262} {"train_loss": -39.057090759277344, "global_step": 152739, "epoch": 1262} {"train_loss": -38.06715774536133, "global_step": 152740, "epoch": 1262} {"train_loss": -39.72811508178711, "global_step": 152741, "epoch": 1262} {"train_loss": -38.75539779663086, "global_step": 152742, "epoch": 1262} {"train_loss": -39.09058380126953, "global_step": 152743, "epoch": 1262} {"train_loss": -39.5925407409668, "global_step": 152744, "epoch": 1262} {"train_loss": -39.942840576171875, "global_step": 152745, "epoch": 1262} {"train_loss": -38.040531158447266, "global_step": 152746, "epoch": 1262} {"train_loss": -39.56494140625, "global_step": 152747, "epoch": 1262} {"train_loss": -38.90902328491211, "global_step": 152748, "epoch": 1262} {"train_loss": -39.08065414428711, "global_step": 152749, "epoch": 1262} {"train_loss": -39.62270736694336, "global_step": 152750, "epoch": 1262} {"train_loss": -38.91240692138672, "global_step": 152751, "epoch": 1262} {"train_loss": -39.02790451049805, "global_step": 152752, "epoch": 1262} {"train_loss": -39.168701171875, "global_step": 152753, "epoch": 1262} {"train_loss": -40.01682662963867, "global_step": 152754, "epoch": 1262} {"train_loss": -39.23320007324219, "global_step": 152755, "epoch": 1262} {"train_loss": -40.414031982421875, "global_step": 152756, "epoch": 1262} {"train_loss": -39.64786911010742, "global_step": 152757, "epoch": 1262} {"train_loss": -40.16962814331055, "global_step": 152758, "epoch": 1262} {"train_loss": -40.17536544799805, "global_step": 152759, "epoch": 1262} {"train_loss": -39.98868942260742, "global_step": 152760, "epoch": 1262} {"train_loss": -40.13004684448242, "global_step": 152761, "epoch": 1262} {"train_loss": -40.242469787597656, "global_step": 152762, "epoch": 1262} {"train_loss": -39.9566764831543, "global_step": 152763, "epoch": 1262} {"train_loss": -39.2682991027832, "global_step": 152764, "epoch": 1262} {"train_loss": -40.03719711303711, "global_step": 152765, "epoch": 1262} {"train_loss": -40.11018753051758, "global_step": 152766, "epoch": 1262} {"train_loss": -40.280426025390625, "global_step": 152767, "epoch": 1262} {"train_loss": -39.980064392089844, "global_step": 152768, "epoch": 1262} {"train_loss": -40.596622467041016, "global_step": 152769, "epoch": 1262} {"train_loss": -40.19010543823242, "global_step": 152770, "epoch": 1262} {"train_loss": -40.238983154296875, "global_step": 152771, "epoch": 1262} {"train_loss": -39.852142333984375, "global_step": 152772, "epoch": 1262} {"train_loss": -40.47939682006836, "global_step": 152773, "epoch": 1262} {"train_loss": -40.42219543457031, "global_step": 152774, "epoch": 1262} {"train_loss": -40.24277877807617, "global_step": 152775, "epoch": 1262} {"train_loss": -40.54673385620117, "global_step": 152776, "epoch": 1262} {"train_loss": -38.44150924682617, "global_step": 152777, "epoch": 1262} {"train_loss": -40.00149917602539, "global_step": 152778, "epoch": 1262} {"train_loss": -39.962730407714844, "global_step": 152779, "epoch": 1262} {"train_loss": -40.81404113769531, "global_step": 152780, "epoch": 1262} {"train_loss": -40.0594367980957, "global_step": 152781, "epoch": 1262} {"train_loss": -40.611019134521484, "global_step": 152782, "epoch": 1262} {"train_loss": -39.84756088256836, "global_step": 152783, "epoch": 1262} {"train_loss": -39.81675338745117, "global_step": 152784, "epoch": 1262} {"train_loss": -40.45955276489258, "global_step": 152785, "epoch": 1262} {"train_loss": -40.2119255065918, "global_step": 152786, "epoch": 1262} {"train_loss": -40.571319580078125, "global_step": 152787, "epoch": 1262} {"train_loss": -40.94014358520508, "global_step": 152788, "epoch": 1262} {"train_loss": -40.06912612915039, "global_step": 152789, "epoch": 1262} {"train_loss": -40.093482971191406, "global_step": 152790, "epoch": 1262} {"train_loss": -41.13916015625, "global_step": 152791, "epoch": 1262} {"train_loss": -40.2300910949707, "global_step": 152792, "epoch": 1262} {"train_loss": -40.43303298950195, "global_step": 152793, "epoch": 1262} {"train_loss": -40.51466369628906, "global_step": 152794, "epoch": 1262} {"train_loss": -40.057403564453125, "global_step": 152795, "epoch": 1262} {"train_loss": -40.59264373779297, "global_step": 152796, "epoch": 1262} {"train_loss": -40.588226318359375, "global_step": 152797, "epoch": 1262} {"train_loss": -40.057796478271484, "global_step": 152798, "epoch": 1262} {"train_loss": -39.493202209472656, "global_step": 152799, "epoch": 1262} {"train_loss": -40.1357307434082, "global_step": 152800, "epoch": 1262} {"train_loss": -38.672935485839844, "global_step": 152801, "epoch": 1262} {"train_loss": -39.16188430786133, "global_step": 152802, "epoch": 1262} {"train_loss": -38.56325149536133, "global_step": 152803, "epoch": 1262} {"train_loss": -38.01948547363281, "global_step": 152804, "epoch": 1262} {"train_loss": -37.155635833740234, "global_step": 152805, "epoch": 1262} {"train_loss": -37.378997802734375, "global_step": 152806, "epoch": 1262} {"train_loss": -39.09407424926758, "global_step": 152807, "epoch": 1262} {"train_loss": -37.8558464050293, "global_step": 152808, "epoch": 1262} {"train_loss": -37.9888801574707, "global_step": 152809, "epoch": 1262} {"train_loss": -34.08054733276367, "global_step": 152810, "epoch": 1262} {"train_loss": -38.27333450317383, "global_step": 152811, "epoch": 1262} {"train_loss": -35.444580078125, "global_step": 152812, "epoch": 1262} {"train_loss": -40.13961410522461, "global_step": 152813, "epoch": 1262} {"train_loss": -38.41725540161133, "global_step": 152814, "epoch": 1262} {"train_loss": -39.45249557495117, "global_step": 152815, "epoch": 1262} {"train_loss": -38.372650146484375, "global_step": 152816, "epoch": 1262} {"train_loss": -39.59910202026367, "global_step": 152817, "epoch": 1262} {"train_loss": -39.664546966552734, "global_step": 152818, "epoch": 1262} {"train_loss": -39.509300231933594, "global_step": 152819, "epoch": 1262} {"train_loss": -38.941707611083984, "global_step": 152820, "epoch": 1262} {"train_loss": -39.32526779174805, "global_step": 152821, "epoch": 1262} {"train_loss": -39.052267878508765, "global_step": 152822, "epoch": 1262, "val_loss": 2694821.0} {"train_loss": -39.314308166503906, "global_step": 152823, "epoch": 1263} {"train_loss": -39.9876708984375, "global_step": 152824, "epoch": 1263} {"train_loss": -39.231876373291016, "global_step": 152825, "epoch": 1263} {"train_loss": -40.254371643066406, "global_step": 152826, "epoch": 1263} {"train_loss": -39.847469329833984, "global_step": 152827, "epoch": 1263} {"train_loss": -40.5764274597168, "global_step": 152828, "epoch": 1263} {"train_loss": -40.38056945800781, "global_step": 152829, "epoch": 1263} {"train_loss": -39.93768310546875, "global_step": 152830, "epoch": 1263} {"train_loss": -39.36530303955078, "global_step": 152831, "epoch": 1263} {"train_loss": -39.332794189453125, "global_step": 152832, "epoch": 1263} {"train_loss": -39.37423324584961, "global_step": 152833, "epoch": 1263} {"train_loss": -39.15129089355469, "global_step": 152834, "epoch": 1263} {"train_loss": -38.749263763427734, "global_step": 152835, "epoch": 1263} {"train_loss": -39.2140007019043, "global_step": 152836, "epoch": 1263} {"train_loss": -39.989501953125, "global_step": 152837, "epoch": 1263} {"train_loss": -40.415035247802734, "global_step": 152838, "epoch": 1263} {"train_loss": -40.23656463623047, "global_step": 152839, "epoch": 1263} {"train_loss": -38.690731048583984, "global_step": 152840, "epoch": 1263} {"train_loss": -38.911376953125, "global_step": 152841, "epoch": 1263} {"train_loss": -39.02861022949219, "global_step": 152842, "epoch": 1263} {"train_loss": -39.39081573486328, "global_step": 152843, "epoch": 1263} {"train_loss": -40.9804573059082, "global_step": 152844, "epoch": 1263} {"train_loss": -39.6125373840332, "global_step": 152845, "epoch": 1263} {"train_loss": -40.29879379272461, "global_step": 152846, "epoch": 1263} {"train_loss": -40.3187141418457, "global_step": 152847, "epoch": 1263} {"train_loss": -40.36750030517578, "global_step": 152848, "epoch": 1263} {"train_loss": -39.78961181640625, "global_step": 152849, "epoch": 1263} {"train_loss": -39.5816764831543, "global_step": 152850, "epoch": 1263} {"train_loss": -37.57389450073242, "global_step": 152851, "epoch": 1263} {"train_loss": -40.51726150512695, "global_step": 152852, "epoch": 1263} {"train_loss": -40.455013275146484, "global_step": 152853, "epoch": 1263} {"train_loss": -39.777618408203125, "global_step": 152854, "epoch": 1263} {"train_loss": -39.573486328125, "global_step": 152855, "epoch": 1263} {"train_loss": -39.807491302490234, "global_step": 152856, "epoch": 1263} {"train_loss": -41.028656005859375, "global_step": 152857, "epoch": 1263} {"train_loss": -39.98335266113281, "global_step": 152858, "epoch": 1263} {"train_loss": -40.28361892700195, "global_step": 152859, "epoch": 1263} {"train_loss": -40.1640625, "global_step": 152860, "epoch": 1263} {"train_loss": -40.10767364501953, "global_step": 152861, "epoch": 1263} {"train_loss": -41.13252639770508, "global_step": 152862, "epoch": 1263} {"train_loss": -40.78081130981445, "global_step": 152863, "epoch": 1263} {"train_loss": -40.0571403503418, "global_step": 152864, "epoch": 1263} {"train_loss": -40.290138244628906, "global_step": 152865, "epoch": 1263} {"train_loss": -40.59275436401367, "global_step": 152866, "epoch": 1263} {"train_loss": -40.429359436035156, "global_step": 152867, "epoch": 1263} {"train_loss": -40.23515701293945, "global_step": 152868, "epoch": 1263} {"train_loss": -41.12548828125, "global_step": 152869, "epoch": 1263} {"train_loss": -41.06119155883789, "global_step": 152870, "epoch": 1263} {"train_loss": -40.59518051147461, "global_step": 152871, "epoch": 1263} {"train_loss": -40.58793258666992, "global_step": 152872, "epoch": 1263} {"train_loss": -41.10696029663086, "global_step": 152873, "epoch": 1263} {"train_loss": -40.77999496459961, "global_step": 152874, "epoch": 1263} {"train_loss": -40.077903747558594, "global_step": 152875, "epoch": 1263} {"train_loss": -40.35544967651367, "global_step": 152876, "epoch": 1263} {"train_loss": -40.85074996948242, "global_step": 152877, "epoch": 1263} {"train_loss": -41.050201416015625, "global_step": 152878, "epoch": 1263} {"train_loss": -39.6870002746582, "global_step": 152879, "epoch": 1263} {"train_loss": -40.0103874206543, "global_step": 152880, "epoch": 1263} {"train_loss": -39.010311126708984, "global_step": 152881, "epoch": 1263} {"train_loss": -39.360755920410156, "global_step": 152882, "epoch": 1263} {"train_loss": -40.38729476928711, "global_step": 152883, "epoch": 1263} {"train_loss": -39.964263916015625, "global_step": 152884, "epoch": 1263} {"train_loss": -40.22044372558594, "global_step": 152885, "epoch": 1263} {"train_loss": -38.751766204833984, "global_step": 152886, "epoch": 1263} {"train_loss": -38.282527923583984, "global_step": 152887, "epoch": 1263} {"train_loss": -39.997596740722656, "global_step": 152888, "epoch": 1263} {"train_loss": -40.43775177001953, "global_step": 152889, "epoch": 1263} {"train_loss": -40.40387725830078, "global_step": 152890, "epoch": 1263} {"train_loss": -40.3029670715332, "global_step": 152891, "epoch": 1263} {"train_loss": -40.45243453979492, "global_step": 152892, "epoch": 1263} {"train_loss": -40.415706634521484, "global_step": 152893, "epoch": 1263} {"train_loss": -40.511226654052734, "global_step": 152894, "epoch": 1263} {"train_loss": -40.37781524658203, "global_step": 152895, "epoch": 1263} {"train_loss": -40.33404541015625, "global_step": 152896, "epoch": 1263} {"train_loss": -39.3701057434082, "global_step": 152897, "epoch": 1263} {"train_loss": -41.01313018798828, "global_step": 152898, "epoch": 1263} {"train_loss": -40.87007522583008, "global_step": 152899, "epoch": 1263} {"train_loss": -40.547645568847656, "global_step": 152900, "epoch": 1263} {"train_loss": -40.97999954223633, "global_step": 152901, "epoch": 1263} {"train_loss": -40.38323211669922, "global_step": 152902, "epoch": 1263} {"train_loss": -40.047096252441406, "global_step": 152903, "epoch": 1263} {"train_loss": -40.361419677734375, "global_step": 152904, "epoch": 1263} {"train_loss": -40.502113342285156, "global_step": 152905, "epoch": 1263} {"train_loss": -39.65239715576172, "global_step": 152906, "epoch": 1263} {"train_loss": -39.50290298461914, "global_step": 152907, "epoch": 1263} {"train_loss": -41.2375602722168, "global_step": 152908, "epoch": 1263} {"train_loss": -39.5039176940918, "global_step": 152909, "epoch": 1263} {"train_loss": -40.04585266113281, "global_step": 152910, "epoch": 1263} {"train_loss": -38.2613525390625, "global_step": 152911, "epoch": 1263} {"train_loss": -38.58620071411133, "global_step": 152912, "epoch": 1263} {"train_loss": -39.071109771728516, "global_step": 152913, "epoch": 1263} {"train_loss": -39.311065673828125, "global_step": 152914, "epoch": 1263} {"train_loss": -38.89181137084961, "global_step": 152915, "epoch": 1263} {"train_loss": -35.9041862487793, "global_step": 152916, "epoch": 1263} {"train_loss": -36.05678176879883, "global_step": 152917, "epoch": 1263} {"train_loss": -35.961238861083984, "global_step": 152918, "epoch": 1263} {"train_loss": -36.1936149597168, "global_step": 152919, "epoch": 1263} {"train_loss": -39.00099563598633, "global_step": 152920, "epoch": 1263} {"train_loss": -38.1324577331543, "global_step": 152921, "epoch": 1263} {"train_loss": -38.83475875854492, "global_step": 152922, "epoch": 1263} {"train_loss": -39.38126754760742, "global_step": 152923, "epoch": 1263} {"train_loss": -38.645973205566406, "global_step": 152924, "epoch": 1263} {"train_loss": -39.679359436035156, "global_step": 152925, "epoch": 1263} {"train_loss": -38.61371994018555, "global_step": 152926, "epoch": 1263} {"train_loss": -38.112796783447266, "global_step": 152927, "epoch": 1263} {"train_loss": -39.714317321777344, "global_step": 152928, "epoch": 1263} {"train_loss": -36.40900421142578, "global_step": 152929, "epoch": 1263} {"train_loss": -39.840023040771484, "global_step": 152930, "epoch": 1263} {"train_loss": -39.3862419128418, "global_step": 152931, "epoch": 1263} {"train_loss": -37.29830551147461, "global_step": 152932, "epoch": 1263} {"train_loss": -39.13519287109375, "global_step": 152933, "epoch": 1263} {"train_loss": -39.04413986206055, "global_step": 152934, "epoch": 1263} {"train_loss": -37.746402740478516, "global_step": 152935, "epoch": 1263} {"train_loss": -38.3095703125, "global_step": 152936, "epoch": 1263} {"train_loss": -40.256282806396484, "global_step": 152937, "epoch": 1263} {"train_loss": -39.09489822387695, "global_step": 152938, "epoch": 1263} {"train_loss": -38.980552673339844, "global_step": 152939, "epoch": 1263} {"train_loss": -39.965824127197266, "global_step": 152940, "epoch": 1263} {"train_loss": -39.59340286254883, "global_step": 152941, "epoch": 1263} {"train_loss": -40.4659309387207, "global_step": 152942, "epoch": 1263} {"train_loss": -39.66711142043437, "global_step": 152943, "epoch": 1263, "val_loss": 2681286.75} {"train_loss": -39.12199401855469, "global_step": 152944, "epoch": 1264} {"train_loss": -40.06916427612305, "global_step": 152945, "epoch": 1264} {"train_loss": -40.252925872802734, "global_step": 152946, "epoch": 1264} {"train_loss": -40.33629608154297, "global_step": 152947, "epoch": 1264} {"train_loss": -40.53050231933594, "global_step": 152948, "epoch": 1264} {"train_loss": -40.37881088256836, "global_step": 152949, "epoch": 1264} {"train_loss": -40.44685363769531, "global_step": 152950, "epoch": 1264} {"train_loss": -39.908992767333984, "global_step": 152951, "epoch": 1264} {"train_loss": -40.54189682006836, "global_step": 152952, "epoch": 1264} {"train_loss": -40.300636291503906, "global_step": 152953, "epoch": 1264} {"train_loss": -40.54795837402344, "global_step": 152954, "epoch": 1264} {"train_loss": -40.418907165527344, "global_step": 152955, "epoch": 1264} {"train_loss": -40.926513671875, "global_step": 152956, "epoch": 1264} {"train_loss": -40.86906814575195, "global_step": 152957, "epoch": 1264} {"train_loss": -40.0233154296875, "global_step": 152958, "epoch": 1264} {"train_loss": -39.13811111450195, "global_step": 152959, "epoch": 1264} {"train_loss": -39.38892364501953, "global_step": 152960, "epoch": 1264} {"train_loss": -40.484222412109375, "global_step": 152961, "epoch": 1264} {"train_loss": -38.415138244628906, "global_step": 152962, "epoch": 1264} {"train_loss": -39.60740280151367, "global_step": 152963, "epoch": 1264} {"train_loss": -35.464290618896484, "global_step": 152964, "epoch": 1264} {"train_loss": -40.21818161010742, "global_step": 152965, "epoch": 1264} {"train_loss": -36.42079544067383, "global_step": 152966, "epoch": 1264} {"train_loss": -39.15974044799805, "global_step": 152967, "epoch": 1264} {"train_loss": -37.75067901611328, "global_step": 152968, "epoch": 1264} {"train_loss": -39.8712043762207, "global_step": 152969, "epoch": 1264} {"train_loss": -39.32869338989258, "global_step": 152970, "epoch": 1264} {"train_loss": -38.80323791503906, "global_step": 152971, "epoch": 1264} {"train_loss": -39.339935302734375, "global_step": 152972, "epoch": 1264} {"train_loss": -38.185813903808594, "global_step": 152973, "epoch": 1264} {"train_loss": -35.546119689941406, "global_step": 152974, "epoch": 1264} {"train_loss": -38.29948043823242, "global_step": 152975, "epoch": 1264} {"train_loss": -36.025299072265625, "global_step": 152976, "epoch": 1264} {"train_loss": -38.81986618041992, "global_step": 152977, "epoch": 1264} {"train_loss": -39.44633865356445, "global_step": 152978, "epoch": 1264} {"train_loss": -39.297035217285156, "global_step": 152979, "epoch": 1264} {"train_loss": -39.39553451538086, "global_step": 152980, "epoch": 1264} {"train_loss": -38.36299514770508, "global_step": 152981, "epoch": 1264} {"train_loss": -39.817996978759766, "global_step": 152982, "epoch": 1264} {"train_loss": -38.22126388549805, "global_step": 152983, "epoch": 1264} {"train_loss": -37.833370208740234, "global_step": 152984, "epoch": 1264} {"train_loss": -37.8676872253418, "global_step": 152985, "epoch": 1264} {"train_loss": -39.66707992553711, "global_step": 152986, "epoch": 1264} {"train_loss": -38.0707893371582, "global_step": 152987, "epoch": 1264} {"train_loss": -39.40361785888672, "global_step": 152988, "epoch": 1264} {"train_loss": -38.95996856689453, "global_step": 152989, "epoch": 1264} {"train_loss": -37.0255126953125, "global_step": 152990, "epoch": 1264} {"train_loss": -39.50716781616211, "global_step": 152991, "epoch": 1264} {"train_loss": -39.812164306640625, "global_step": 152992, "epoch": 1264} {"train_loss": -38.0990104675293, "global_step": 152993, "epoch": 1264} {"train_loss": -37.8642578125, "global_step": 152994, "epoch": 1264} {"train_loss": -38.34339904785156, "global_step": 152995, "epoch": 1264} {"train_loss": -33.1603889465332, "global_step": 152996, "epoch": 1264} {"train_loss": -38.26870346069336, "global_step": 152997, "epoch": 1264} {"train_loss": -39.013858795166016, "global_step": 152998, "epoch": 1264} {"train_loss": -36.46372604370117, "global_step": 152999, "epoch": 1264} {"train_loss": -36.45022964477539, "global_step": 153000, "epoch": 1264} {"train_loss": -37.36296463012695, "global_step": 153001, "epoch": 1264} {"train_loss": -37.661476135253906, "global_step": 153002, "epoch": 1264} {"train_loss": -39.433937072753906, "global_step": 153003, "epoch": 1264} {"train_loss": -39.05421447753906, "global_step": 153004, "epoch": 1264} {"train_loss": -39.42220687866211, "global_step": 153005, "epoch": 1264} {"train_loss": -37.174827575683594, "global_step": 153006, "epoch": 1264} {"train_loss": -38.90053939819336, "global_step": 153007, "epoch": 1264} {"train_loss": -37.90363311767578, "global_step": 153008, "epoch": 1264} {"train_loss": -38.98993682861328, "global_step": 153009, "epoch": 1264} {"train_loss": -37.36214828491211, "global_step": 153010, "epoch": 1264} {"train_loss": -39.64657211303711, "global_step": 153011, "epoch": 1264} {"train_loss": -38.43376159667969, "global_step": 153012, "epoch": 1264} {"train_loss": -37.16990280151367, "global_step": 153013, "epoch": 1264} {"train_loss": -39.93050003051758, "global_step": 153014, "epoch": 1264} {"train_loss": -39.455501556396484, "global_step": 153015, "epoch": 1264} {"train_loss": -38.328670501708984, "global_step": 153016, "epoch": 1264} {"train_loss": -39.28398132324219, "global_step": 153017, "epoch": 1264} {"train_loss": -39.37775421142578, "global_step": 153018, "epoch": 1264} {"train_loss": -39.290279388427734, "global_step": 153019, "epoch": 1264} {"train_loss": -38.08726119995117, "global_step": 153020, "epoch": 1264} {"train_loss": -37.50883102416992, "global_step": 153021, "epoch": 1264} {"train_loss": -38.39554214477539, "global_step": 153022, "epoch": 1264} {"train_loss": -39.50675582885742, "global_step": 153023, "epoch": 1264} {"train_loss": -39.19403839111328, "global_step": 153024, "epoch": 1264} {"train_loss": -37.86225509643555, "global_step": 153025, "epoch": 1264} {"train_loss": -39.3316535949707, "global_step": 153026, "epoch": 1264} {"train_loss": -39.493377685546875, "global_step": 153027, "epoch": 1264} {"train_loss": -36.03072738647461, "global_step": 153028, "epoch": 1264} {"train_loss": -36.150146484375, "global_step": 153029, "epoch": 1264} {"train_loss": -37.31081771850586, "global_step": 153030, "epoch": 1264} {"train_loss": -39.58815002441406, "global_step": 153031, "epoch": 1264} {"train_loss": -37.75486755371094, "global_step": 153032, "epoch": 1264} {"train_loss": -38.37247848510742, "global_step": 153033, "epoch": 1264} {"train_loss": -37.76841735839844, "global_step": 153034, "epoch": 1264} {"train_loss": -35.953243255615234, "global_step": 153035, "epoch": 1264} {"train_loss": -39.606781005859375, "global_step": 153036, "epoch": 1264} {"train_loss": -39.148040771484375, "global_step": 153037, "epoch": 1264} {"train_loss": -39.85761642456055, "global_step": 153038, "epoch": 1264} {"train_loss": -39.83573532104492, "global_step": 153039, "epoch": 1264} {"train_loss": -38.81313705444336, "global_step": 153040, "epoch": 1264} {"train_loss": -39.56981658935547, "global_step": 153041, "epoch": 1264} {"train_loss": -40.193843841552734, "global_step": 153042, "epoch": 1264} {"train_loss": -39.65195846557617, "global_step": 153043, "epoch": 1264} {"train_loss": -39.752525329589844, "global_step": 153044, "epoch": 1264} {"train_loss": -39.911678314208984, "global_step": 153045, "epoch": 1264} {"train_loss": -39.69456100463867, "global_step": 153046, "epoch": 1264} {"train_loss": -38.32795333862305, "global_step": 153047, "epoch": 1264} {"train_loss": -40.1645393371582, "global_step": 153048, "epoch": 1264} {"train_loss": -39.91685104370117, "global_step": 153049, "epoch": 1264} {"train_loss": -39.752986907958984, "global_step": 153050, "epoch": 1264} {"train_loss": -39.747310638427734, "global_step": 153051, "epoch": 1264} {"train_loss": -40.07241439819336, "global_step": 153052, "epoch": 1264} {"train_loss": -39.31441879272461, "global_step": 153053, "epoch": 1264} {"train_loss": -40.018455505371094, "global_step": 153054, "epoch": 1264} {"train_loss": -40.39126205444336, "global_step": 153055, "epoch": 1264} {"train_loss": -38.9625244140625, "global_step": 153056, "epoch": 1264} {"train_loss": -39.396751403808594, "global_step": 153057, "epoch": 1264} {"train_loss": -40.10447692871094, "global_step": 153058, "epoch": 1264} {"train_loss": -40.691463470458984, "global_step": 153059, "epoch": 1264} {"train_loss": -40.02299880981445, "global_step": 153060, "epoch": 1264} {"train_loss": -39.92609405517578, "global_step": 153061, "epoch": 1264} {"train_loss": -40.23106002807617, "global_step": 153062, "epoch": 1264} {"train_loss": -40.24213790893555, "global_step": 153063, "epoch": 1264} {"train_loss": -38.942201062667465, "global_step": 153064, "epoch": 1264, "val_loss": 2513224.0} {"train_loss": -40.68484115600586, "global_step": 153065, "epoch": 1265} {"train_loss": -39.69899368286133, "global_step": 153066, "epoch": 1265} {"train_loss": -40.674110412597656, "global_step": 153067, "epoch": 1265} {"train_loss": -40.42649459838867, "global_step": 153068, "epoch": 1265} {"train_loss": -40.296173095703125, "global_step": 153069, "epoch": 1265} {"train_loss": -38.901832580566406, "global_step": 153070, "epoch": 1265} {"train_loss": -39.758644104003906, "global_step": 153071, "epoch": 1265} {"train_loss": -39.64185333251953, "global_step": 153072, "epoch": 1265} {"train_loss": -40.54669952392578, "global_step": 153073, "epoch": 1265} {"train_loss": -40.01420211791992, "global_step": 153074, "epoch": 1265} {"train_loss": -40.60390853881836, "global_step": 153075, "epoch": 1265} {"train_loss": -40.31527328491211, "global_step": 153076, "epoch": 1265} {"train_loss": -40.359981536865234, "global_step": 153077, "epoch": 1265} {"train_loss": -40.52614212036133, "global_step": 153078, "epoch": 1265} {"train_loss": -39.93941879272461, "global_step": 153079, "epoch": 1265} {"train_loss": -36.087684631347656, "global_step": 153080, "epoch": 1265} {"train_loss": -40.06284713745117, "global_step": 153081, "epoch": 1265} {"train_loss": -39.527523040771484, "global_step": 153082, "epoch": 1265} {"train_loss": -35.33481979370117, "global_step": 153083, "epoch": 1265} {"train_loss": -23.958351135253906, "global_step": 153084, "epoch": 1265} {"train_loss": -9.634333610534668, "global_step": 153085, "epoch": 1265} {"train_loss": -4.693070888519287, "global_step": 153086, "epoch": 1265} {"train_loss": -37.15431594848633, "global_step": 153087, "epoch": 1265} {"train_loss": -18.635231018066406, "global_step": 153088, "epoch": 1265} {"train_loss": -24.910449981689453, "global_step": 153089, "epoch": 1265} {"train_loss": -35.97367858886719, "global_step": 153090, "epoch": 1265} {"train_loss": -25.791675567626953, "global_step": 153091, "epoch": 1265} {"train_loss": -37.481712341308594, "global_step": 153092, "epoch": 1265} {"train_loss": -28.14103126525879, "global_step": 153093, "epoch": 1265} {"train_loss": -35.04048538208008, "global_step": 153094, "epoch": 1265} {"train_loss": -32.294647216796875, "global_step": 153095, "epoch": 1265} {"train_loss": -30.751544952392578, "global_step": 153096, "epoch": 1265} {"train_loss": -37.12236404418945, "global_step": 153097, "epoch": 1265} {"train_loss": -29.676380157470703, "global_step": 153098, "epoch": 1265} {"train_loss": -37.57878112792969, "global_step": 153099, "epoch": 1265} {"train_loss": -35.38865661621094, "global_step": 153100, "epoch": 1265} {"train_loss": -36.1593132019043, "global_step": 153101, "epoch": 1265} {"train_loss": -37.30331039428711, "global_step": 153102, "epoch": 1265} {"train_loss": -37.614967346191406, "global_step": 153103, "epoch": 1265} {"train_loss": -35.494258880615234, "global_step": 153104, "epoch": 1265} {"train_loss": -36.98396682739258, "global_step": 153105, "epoch": 1265} {"train_loss": -36.76974868774414, "global_step": 153106, "epoch": 1265} {"train_loss": -37.54948043823242, "global_step": 153107, "epoch": 1265} {"train_loss": -37.68606185913086, "global_step": 153108, "epoch": 1265} {"train_loss": -37.463623046875, "global_step": 153109, "epoch": 1265} {"train_loss": -38.12166976928711, "global_step": 153110, "epoch": 1265} {"train_loss": -37.85398483276367, "global_step": 153111, "epoch": 1265} {"train_loss": -37.15464782714844, "global_step": 153112, "epoch": 1265} {"train_loss": -38.4813346862793, "global_step": 153113, "epoch": 1265} {"train_loss": -38.2299919128418, "global_step": 153114, "epoch": 1265} {"train_loss": -38.367652893066406, "global_step": 153115, "epoch": 1265} {"train_loss": -37.940834045410156, "global_step": 153116, "epoch": 1265} {"train_loss": -38.525909423828125, "global_step": 153117, "epoch": 1265} {"train_loss": -38.09324264526367, "global_step": 153118, "epoch": 1265} {"train_loss": -38.18927764892578, "global_step": 153119, "epoch": 1265} {"train_loss": -38.7876091003418, "global_step": 153120, "epoch": 1265} {"train_loss": -38.724220275878906, "global_step": 153121, "epoch": 1265} {"train_loss": -38.686309814453125, "global_step": 153122, "epoch": 1265} {"train_loss": -39.112831115722656, "global_step": 153123, "epoch": 1265} {"train_loss": -38.76918029785156, "global_step": 153124, "epoch": 1265} {"train_loss": -38.830013275146484, "global_step": 153125, "epoch": 1265} {"train_loss": -38.55864334106445, "global_step": 153126, "epoch": 1265} {"train_loss": -39.09116744995117, "global_step": 153127, "epoch": 1265} {"train_loss": -39.04896926879883, "global_step": 153128, "epoch": 1265} {"train_loss": -38.79508590698242, "global_step": 153129, "epoch": 1265} {"train_loss": -39.044166564941406, "global_step": 153130, "epoch": 1265} {"train_loss": -39.296810150146484, "global_step": 153131, "epoch": 1265} {"train_loss": -39.01221466064453, "global_step": 153132, "epoch": 1265} {"train_loss": -39.501712799072266, "global_step": 153133, "epoch": 1265} {"train_loss": -39.56614303588867, "global_step": 153134, "epoch": 1265} {"train_loss": -39.640785217285156, "global_step": 153135, "epoch": 1265} {"train_loss": -39.64221954345703, "global_step": 153136, "epoch": 1265} {"train_loss": -39.93922424316406, "global_step": 153137, "epoch": 1265} {"train_loss": -39.605621337890625, "global_step": 153138, "epoch": 1265} {"train_loss": -39.37057113647461, "global_step": 153139, "epoch": 1265} {"train_loss": -39.4603385925293, "global_step": 153140, "epoch": 1265} {"train_loss": -39.01320266723633, "global_step": 153141, "epoch": 1265} {"train_loss": -39.997501373291016, "global_step": 153142, "epoch": 1265} {"train_loss": -39.50397872924805, "global_step": 153143, "epoch": 1265} {"train_loss": -39.674346923828125, "global_step": 153144, "epoch": 1265} {"train_loss": -38.5952262878418, "global_step": 153145, "epoch": 1265} {"train_loss": -39.41181564331055, "global_step": 153146, "epoch": 1265} {"train_loss": -39.828678131103516, "global_step": 153147, "epoch": 1265} {"train_loss": -40.35989761352539, "global_step": 153148, "epoch": 1265} {"train_loss": -40.13031768798828, "global_step": 153149, "epoch": 1265} {"train_loss": -39.94698715209961, "global_step": 153150, "epoch": 1265} {"train_loss": -40.14902877807617, "global_step": 153151, "epoch": 1265} {"train_loss": -40.23136520385742, "global_step": 153152, "epoch": 1265} {"train_loss": -39.976558685302734, "global_step": 153153, "epoch": 1265} {"train_loss": -40.180110931396484, "global_step": 153154, "epoch": 1265} {"train_loss": -40.48227310180664, "global_step": 153155, "epoch": 1265} {"train_loss": -39.9123420715332, "global_step": 153156, "epoch": 1265} {"train_loss": -39.76711654663086, "global_step": 153157, "epoch": 1265} {"train_loss": -40.13709259033203, "global_step": 153158, "epoch": 1265} {"train_loss": -40.16633224487305, "global_step": 153159, "epoch": 1265} {"train_loss": -39.85335159301758, "global_step": 153160, "epoch": 1265} {"train_loss": -40.19540023803711, "global_step": 153161, "epoch": 1265} {"train_loss": -39.994258880615234, "global_step": 153162, "epoch": 1265} {"train_loss": -40.226280212402344, "global_step": 153163, "epoch": 1265} {"train_loss": -40.573707580566406, "global_step": 153164, "epoch": 1265} {"train_loss": -40.30990219116211, "global_step": 153165, "epoch": 1265} {"train_loss": -40.475440979003906, "global_step": 153166, "epoch": 1265} {"train_loss": -40.364681243896484, "global_step": 153167, "epoch": 1265} {"train_loss": -40.64866256713867, "global_step": 153168, "epoch": 1265} {"train_loss": -40.163692474365234, "global_step": 153169, "epoch": 1265} {"train_loss": -40.586421966552734, "global_step": 153170, "epoch": 1265} {"train_loss": -40.741973876953125, "global_step": 153171, "epoch": 1265} {"train_loss": -40.73419952392578, "global_step": 153172, "epoch": 1265} {"train_loss": -40.64329147338867, "global_step": 153173, "epoch": 1265} {"train_loss": -40.28904342651367, "global_step": 153174, "epoch": 1265} {"train_loss": -40.15366744995117, "global_step": 153175, "epoch": 1265} {"train_loss": -40.649742126464844, "global_step": 153176, "epoch": 1265} {"train_loss": -40.48015213012695, "global_step": 153177, "epoch": 1265} {"train_loss": -40.223899841308594, "global_step": 153178, "epoch": 1265} {"train_loss": -40.91731643676758, "global_step": 153179, "epoch": 1265} {"train_loss": -40.903480529785156, "global_step": 153180, "epoch": 1265} {"train_loss": -40.29288864135742, "global_step": 153181, "epoch": 1265} {"train_loss": -40.81827926635742, "global_step": 153182, "epoch": 1265} {"train_loss": -40.73359298706055, "global_step": 153183, "epoch": 1265} {"train_loss": -40.75919723510742, "global_step": 153184, "epoch": 1265} {"train_loss": -37.88212644167183, "global_step": 153185, "epoch": 1265, "val_loss": 2600789.75} {"train_loss": -40.703460693359375, "global_step": 153186, "epoch": 1266} {"train_loss": -40.1947135925293, "global_step": 153187, "epoch": 1266} {"train_loss": -40.28098678588867, "global_step": 153188, "epoch": 1266} {"train_loss": -40.390716552734375, "global_step": 153189, "epoch": 1266} {"train_loss": -39.669471740722656, "global_step": 153190, "epoch": 1266} {"train_loss": -39.114688873291016, "global_step": 153191, "epoch": 1266} {"train_loss": -39.46739959716797, "global_step": 153192, "epoch": 1266} {"train_loss": -39.79347610473633, "global_step": 153193, "epoch": 1266} {"train_loss": -40.47540283203125, "global_step": 153194, "epoch": 1266} {"train_loss": -39.59198760986328, "global_step": 153195, "epoch": 1266} {"train_loss": -40.651458740234375, "global_step": 153196, "epoch": 1266} {"train_loss": -40.64427185058594, "global_step": 153197, "epoch": 1266} {"train_loss": -40.25183868408203, "global_step": 153198, "epoch": 1266} {"train_loss": -38.51394271850586, "global_step": 153199, "epoch": 1266} {"train_loss": -36.092140197753906, "global_step": 153200, "epoch": 1266} {"train_loss": -32.15861129760742, "global_step": 153201, "epoch": 1266} {"train_loss": -31.5263614654541, "global_step": 153202, "epoch": 1266} {"train_loss": -37.46335220336914, "global_step": 153203, "epoch": 1266} {"train_loss": -40.76272201538086, "global_step": 153204, "epoch": 1266} {"train_loss": -38.65540313720703, "global_step": 153205, "epoch": 1266} {"train_loss": -38.15871047973633, "global_step": 153206, "epoch": 1266} {"train_loss": -40.263057708740234, "global_step": 153207, "epoch": 1266} {"train_loss": -38.929351806640625, "global_step": 153208, "epoch": 1266} {"train_loss": -39.56775665283203, "global_step": 153209, "epoch": 1266} {"train_loss": -39.984657287597656, "global_step": 153210, "epoch": 1266} {"train_loss": -38.740325927734375, "global_step": 153211, "epoch": 1266} {"train_loss": -39.85191345214844, "global_step": 153212, "epoch": 1266} {"train_loss": -39.28091812133789, "global_step": 153213, "epoch": 1266} {"train_loss": -39.31250762939453, "global_step": 153214, "epoch": 1266} {"train_loss": -40.5716667175293, "global_step": 153215, "epoch": 1266} {"train_loss": -39.93783187866211, "global_step": 153216, "epoch": 1266} {"train_loss": -40.089908599853516, "global_step": 153217, "epoch": 1266} {"train_loss": -40.30526351928711, "global_step": 153218, "epoch": 1266} {"train_loss": -40.73194885253906, "global_step": 153219, "epoch": 1266} {"train_loss": -40.328243255615234, "global_step": 153220, "epoch": 1266} {"train_loss": -40.280921936035156, "global_step": 153221, "epoch": 1266} {"train_loss": -40.6827507019043, "global_step": 153222, "epoch": 1266} {"train_loss": -40.63404083251953, "global_step": 153223, "epoch": 1266} {"train_loss": -39.76481246948242, "global_step": 153224, "epoch": 1266} {"train_loss": -39.64909744262695, "global_step": 153225, "epoch": 1266} {"train_loss": -39.81996154785156, "global_step": 153226, "epoch": 1266} {"train_loss": -40.74958419799805, "global_step": 153227, "epoch": 1266} {"train_loss": -40.45420455932617, "global_step": 153228, "epoch": 1266} {"train_loss": -40.0683479309082, "global_step": 153229, "epoch": 1266} {"train_loss": -40.43581771850586, "global_step": 153230, "epoch": 1266} {"train_loss": -41.15138244628906, "global_step": 153231, "epoch": 1266} {"train_loss": -40.05267333984375, "global_step": 153232, "epoch": 1266} {"train_loss": -40.4466552734375, "global_step": 153233, "epoch": 1266} {"train_loss": -40.67238235473633, "global_step": 153234, "epoch": 1266} {"train_loss": -40.09624099731445, "global_step": 153235, "epoch": 1266} {"train_loss": -39.96177291870117, "global_step": 153236, "epoch": 1266} {"train_loss": -40.75323486328125, "global_step": 153237, "epoch": 1266} {"train_loss": -39.78913879394531, "global_step": 153238, "epoch": 1266} {"train_loss": -40.382205963134766, "global_step": 153239, "epoch": 1266} {"train_loss": -40.3428840637207, "global_step": 153240, "epoch": 1266} {"train_loss": -40.41468048095703, "global_step": 153241, "epoch": 1266} {"train_loss": -39.984535217285156, "global_step": 153242, "epoch": 1266} {"train_loss": -40.069698333740234, "global_step": 153243, "epoch": 1266} {"train_loss": -40.609375, "global_step": 153244, "epoch": 1266} {"train_loss": -40.682823181152344, "global_step": 153245, "epoch": 1266} {"train_loss": -40.99407958984375, "global_step": 153246, "epoch": 1266} {"train_loss": -40.624237060546875, "global_step": 153247, "epoch": 1266} {"train_loss": -40.72122573852539, "global_step": 153248, "epoch": 1266} {"train_loss": -40.39065170288086, "global_step": 153249, "epoch": 1266} {"train_loss": -40.48662185668945, "global_step": 153250, "epoch": 1266} {"train_loss": -39.97038269042969, "global_step": 153251, "epoch": 1266} {"train_loss": -40.17007827758789, "global_step": 153252, "epoch": 1266} {"train_loss": -40.52573776245117, "global_step": 153253, "epoch": 1266} {"train_loss": -38.81757736206055, "global_step": 153254, "epoch": 1266} {"train_loss": -40.5750617980957, "global_step": 153255, "epoch": 1266} {"train_loss": -39.95804977416992, "global_step": 153256, "epoch": 1266} {"train_loss": -40.00175476074219, "global_step": 153257, "epoch": 1266} {"train_loss": -40.52067947387695, "global_step": 153258, "epoch": 1266} {"train_loss": -40.535152435302734, "global_step": 153259, "epoch": 1266} {"train_loss": -40.05051803588867, "global_step": 153260, "epoch": 1266} {"train_loss": -40.95993423461914, "global_step": 153261, "epoch": 1266} {"train_loss": -40.26985549926758, "global_step": 153262, "epoch": 1266} {"train_loss": -40.805458068847656, "global_step": 153263, "epoch": 1266} {"train_loss": -40.47991943359375, "global_step": 153264, "epoch": 1266} {"train_loss": -41.03142166137695, "global_step": 153265, "epoch": 1266} {"train_loss": -40.4200439453125, "global_step": 153266, "epoch": 1266} {"train_loss": -39.5157585144043, "global_step": 153267, "epoch": 1266} {"train_loss": -40.566036224365234, "global_step": 153268, "epoch": 1266} {"train_loss": -39.696956634521484, "global_step": 153269, "epoch": 1266} {"train_loss": -40.42936325073242, "global_step": 153270, "epoch": 1266} {"train_loss": -40.08529281616211, "global_step": 153271, "epoch": 1266} {"train_loss": -40.27964401245117, "global_step": 153272, "epoch": 1266} {"train_loss": -40.74644470214844, "global_step": 153273, "epoch": 1266} {"train_loss": -40.69282150268555, "global_step": 153274, "epoch": 1266} {"train_loss": -40.18368148803711, "global_step": 153275, "epoch": 1266} {"train_loss": -39.72910690307617, "global_step": 153276, "epoch": 1266} {"train_loss": -40.22959518432617, "global_step": 153277, "epoch": 1266} {"train_loss": -40.36362838745117, "global_step": 153278, "epoch": 1266} {"train_loss": -39.41565704345703, "global_step": 153279, "epoch": 1266} {"train_loss": -39.371646881103516, "global_step": 153280, "epoch": 1266} {"train_loss": -38.83408737182617, "global_step": 153281, "epoch": 1266} {"train_loss": -37.727439880371094, "global_step": 153282, "epoch": 1266} {"train_loss": -39.63872146606445, "global_step": 153283, "epoch": 1266} {"train_loss": -40.06635665893555, "global_step": 153284, "epoch": 1266} {"train_loss": -40.80226516723633, "global_step": 153285, "epoch": 1266} {"train_loss": -39.82065200805664, "global_step": 153286, "epoch": 1266} {"train_loss": -39.650047302246094, "global_step": 153287, "epoch": 1266} {"train_loss": -39.925846099853516, "global_step": 153288, "epoch": 1266} {"train_loss": -40.240020751953125, "global_step": 153289, "epoch": 1266} {"train_loss": -39.20395278930664, "global_step": 153290, "epoch": 1266} {"train_loss": -40.5899543762207, "global_step": 153291, "epoch": 1266} {"train_loss": -39.52338790893555, "global_step": 153292, "epoch": 1266} {"train_loss": -40.7061767578125, "global_step": 153293, "epoch": 1266} {"train_loss": -39.97626876831055, "global_step": 153294, "epoch": 1266} {"train_loss": -37.6326904296875, "global_step": 153295, "epoch": 1266} {"train_loss": -39.32417678833008, "global_step": 153296, "epoch": 1266} {"train_loss": -40.03384017944336, "global_step": 153297, "epoch": 1266} {"train_loss": -38.413055419921875, "global_step": 153298, "epoch": 1266} {"train_loss": -38.30632400512695, "global_step": 153299, "epoch": 1266} {"train_loss": -39.25299072265625, "global_step": 153300, "epoch": 1266} {"train_loss": -38.864383697509766, "global_step": 153301, "epoch": 1266} {"train_loss": -38.346736907958984, "global_step": 153302, "epoch": 1266} {"train_loss": -39.88389587402344, "global_step": 153303, "epoch": 1266} {"train_loss": -39.744789123535156, "global_step": 153304, "epoch": 1266} {"train_loss": -39.43463897705078, "global_step": 153305, "epoch": 1266} {"train_loss": -39.79947080690999, "global_step": 153306, "epoch": 1266, "val_loss": 2735767.75} {"train_loss": -37.85775375366211, "global_step": 153307, "epoch": 1267} {"train_loss": -39.56521224975586, "global_step": 153308, "epoch": 1267} {"train_loss": -37.14205551147461, "global_step": 153309, "epoch": 1267} {"train_loss": -38.61777114868164, "global_step": 153310, "epoch": 1267} {"train_loss": -38.67920684814453, "global_step": 153311, "epoch": 1267} {"train_loss": -37.3449821472168, "global_step": 153312, "epoch": 1267} {"train_loss": -34.52450180053711, "global_step": 153313, "epoch": 1267} {"train_loss": -31.89246940612793, "global_step": 153314, "epoch": 1267} {"train_loss": -34.25034713745117, "global_step": 153315, "epoch": 1267} {"train_loss": -33.94936752319336, "global_step": 153316, "epoch": 1267} {"train_loss": -37.84300231933594, "global_step": 153317, "epoch": 1267} {"train_loss": -36.54165267944336, "global_step": 153318, "epoch": 1267} {"train_loss": -34.8106689453125, "global_step": 153319, "epoch": 1267} {"train_loss": -37.691646575927734, "global_step": 153320, "epoch": 1267} {"train_loss": -35.30464553833008, "global_step": 153321, "epoch": 1267} {"train_loss": -27.90500831604004, "global_step": 153322, "epoch": 1267} {"train_loss": -35.78178787231445, "global_step": 153323, "epoch": 1267} {"train_loss": -34.9354362487793, "global_step": 153324, "epoch": 1267} {"train_loss": -28.169397354125977, "global_step": 153325, "epoch": 1267} {"train_loss": -35.76788330078125, "global_step": 153326, "epoch": 1267} {"train_loss": -35.228553771972656, "global_step": 153327, "epoch": 1267} {"train_loss": -36.51711654663086, "global_step": 153328, "epoch": 1267} {"train_loss": -29.816137313842773, "global_step": 153329, "epoch": 1267} {"train_loss": -34.83244705200195, "global_step": 153330, "epoch": 1267} {"train_loss": -33.39105987548828, "global_step": 153331, "epoch": 1267} {"train_loss": -32.01460647583008, "global_step": 153332, "epoch": 1267} {"train_loss": -31.4637508392334, "global_step": 153333, "epoch": 1267} {"train_loss": -36.41358184814453, "global_step": 153334, "epoch": 1267} {"train_loss": -37.32434844970703, "global_step": 153335, "epoch": 1267} {"train_loss": -36.64080047607422, "global_step": 153336, "epoch": 1267} {"train_loss": -35.73133087158203, "global_step": 153337, "epoch": 1267} {"train_loss": -36.5028076171875, "global_step": 153338, "epoch": 1267} {"train_loss": -36.465919494628906, "global_step": 153339, "epoch": 1267} {"train_loss": -37.16154098510742, "global_step": 153340, "epoch": 1267} {"train_loss": -36.702362060546875, "global_step": 153341, "epoch": 1267} {"train_loss": -37.13492965698242, "global_step": 153342, "epoch": 1267} {"train_loss": -36.93518829345703, "global_step": 153343, "epoch": 1267} {"train_loss": -36.55241775512695, "global_step": 153344, "epoch": 1267} {"train_loss": -37.38800048828125, "global_step": 153345, "epoch": 1267} {"train_loss": -38.03886795043945, "global_step": 153346, "epoch": 1267} {"train_loss": -37.18069076538086, "global_step": 153347, "epoch": 1267} {"train_loss": -38.28841781616211, "global_step": 153348, "epoch": 1267} {"train_loss": -37.011940002441406, "global_step": 153349, "epoch": 1267} {"train_loss": -38.492042541503906, "global_step": 153350, "epoch": 1267} {"train_loss": -36.30744934082031, "global_step": 153351, "epoch": 1267} {"train_loss": -37.7395133972168, "global_step": 153352, "epoch": 1267} {"train_loss": -37.995277404785156, "global_step": 153353, "epoch": 1267} {"train_loss": -38.6214714050293, "global_step": 153354, "epoch": 1267} {"train_loss": -38.016822814941406, "global_step": 153355, "epoch": 1267} {"train_loss": -38.74202346801758, "global_step": 153356, "epoch": 1267} {"train_loss": -37.899288177490234, "global_step": 153357, "epoch": 1267} {"train_loss": -38.02484893798828, "global_step": 153358, "epoch": 1267} {"train_loss": -38.030487060546875, "global_step": 153359, "epoch": 1267} {"train_loss": -38.50602340698242, "global_step": 153360, "epoch": 1267} {"train_loss": -38.599945068359375, "global_step": 153361, "epoch": 1267} {"train_loss": -38.92970275878906, "global_step": 153362, "epoch": 1267} {"train_loss": -39.31570053100586, "global_step": 153363, "epoch": 1267} {"train_loss": -38.70920944213867, "global_step": 153364, "epoch": 1267} {"train_loss": -38.44570541381836, "global_step": 153365, "epoch": 1267} {"train_loss": -38.35054397583008, "global_step": 153366, "epoch": 1267} {"train_loss": -39.476985931396484, "global_step": 153367, "epoch": 1267} {"train_loss": -39.12434005737305, "global_step": 153368, "epoch": 1267} {"train_loss": -39.220088958740234, "global_step": 153369, "epoch": 1267} {"train_loss": -39.210391998291016, "global_step": 153370, "epoch": 1267} {"train_loss": -38.5260124206543, "global_step": 153371, "epoch": 1267} {"train_loss": -39.5927848815918, "global_step": 153372, "epoch": 1267} {"train_loss": -39.415462493896484, "global_step": 153373, "epoch": 1267} {"train_loss": -39.826717376708984, "global_step": 153374, "epoch": 1267} {"train_loss": -39.28065872192383, "global_step": 153375, "epoch": 1267} {"train_loss": -39.07610321044922, "global_step": 153376, "epoch": 1267} {"train_loss": -39.77638626098633, "global_step": 153377, "epoch": 1267} {"train_loss": -39.76279067993164, "global_step": 153378, "epoch": 1267} {"train_loss": -39.66975402832031, "global_step": 153379, "epoch": 1267} {"train_loss": -38.81407928466797, "global_step": 153380, "epoch": 1267} {"train_loss": -38.645511627197266, "global_step": 153381, "epoch": 1267} {"train_loss": -38.86479949951172, "global_step": 153382, "epoch": 1267} {"train_loss": -40.06272888183594, "global_step": 153383, "epoch": 1267} {"train_loss": -38.310699462890625, "global_step": 153384, "epoch": 1267} {"train_loss": -39.348785400390625, "global_step": 153385, "epoch": 1267} {"train_loss": -39.953582763671875, "global_step": 153386, "epoch": 1267} {"train_loss": -40.058021545410156, "global_step": 153387, "epoch": 1267} {"train_loss": -39.79853439331055, "global_step": 153388, "epoch": 1267} {"train_loss": -39.65654373168945, "global_step": 153389, "epoch": 1267} {"train_loss": -39.466529846191406, "global_step": 153390, "epoch": 1267} {"train_loss": -39.73721694946289, "global_step": 153391, "epoch": 1267} {"train_loss": -39.9468994140625, "global_step": 153392, "epoch": 1267} {"train_loss": -39.65934371948242, "global_step": 153393, "epoch": 1267} {"train_loss": -39.824825286865234, "global_step": 153394, "epoch": 1267} {"train_loss": -39.7067985534668, "global_step": 153395, "epoch": 1267} {"train_loss": -40.25996017456055, "global_step": 153396, "epoch": 1267} {"train_loss": -38.960052490234375, "global_step": 153397, "epoch": 1267} {"train_loss": -39.55684280395508, "global_step": 153398, "epoch": 1267} {"train_loss": -40.48710250854492, "global_step": 153399, "epoch": 1267} {"train_loss": -39.95641326904297, "global_step": 153400, "epoch": 1267} {"train_loss": -40.288055419921875, "global_step": 153401, "epoch": 1267} {"train_loss": -39.70390701293945, "global_step": 153402, "epoch": 1267} {"train_loss": -39.894126892089844, "global_step": 153403, "epoch": 1267} {"train_loss": -40.182804107666016, "global_step": 153404, "epoch": 1267} {"train_loss": -40.39068603515625, "global_step": 153405, "epoch": 1267} {"train_loss": -40.1410026550293, "global_step": 153406, "epoch": 1267} {"train_loss": -40.1575927734375, "global_step": 153407, "epoch": 1267} {"train_loss": -40.276302337646484, "global_step": 153408, "epoch": 1267} {"train_loss": -40.655731201171875, "global_step": 153409, "epoch": 1267} {"train_loss": -39.95198440551758, "global_step": 153410, "epoch": 1267} {"train_loss": -40.31820297241211, "global_step": 153411, "epoch": 1267} {"train_loss": -40.224281311035156, "global_step": 153412, "epoch": 1267} {"train_loss": -39.91835403442383, "global_step": 153413, "epoch": 1267} {"train_loss": -39.24032211303711, "global_step": 153414, "epoch": 1267} {"train_loss": -40.169830322265625, "global_step": 153415, "epoch": 1267} {"train_loss": -40.32551956176758, "global_step": 153416, "epoch": 1267} {"train_loss": -40.4856071472168, "global_step": 153417, "epoch": 1267} {"train_loss": -39.91998291015625, "global_step": 153418, "epoch": 1267} {"train_loss": -40.59524154663086, "global_step": 153419, "epoch": 1267} {"train_loss": -40.63814926147461, "global_step": 153420, "epoch": 1267} {"train_loss": -40.39329147338867, "global_step": 153421, "epoch": 1267} {"train_loss": -41.01179885864258, "global_step": 153422, "epoch": 1267} {"train_loss": -40.50876998901367, "global_step": 153423, "epoch": 1267} {"train_loss": -40.49322509765625, "global_step": 153424, "epoch": 1267} {"train_loss": -40.40027618408203, "global_step": 153425, "epoch": 1267} {"train_loss": -41.07835388183594, "global_step": 153426, "epoch": 1267} {"train_loss": -38.143121246464, "global_step": 153427, "epoch": 1267, "val_loss": 2761382.0} {"train_loss": -40.56521224975586, "global_step": 153428, "epoch": 1268} {"train_loss": -40.603111267089844, "global_step": 153429, "epoch": 1268} {"train_loss": -41.147762298583984, "global_step": 153430, "epoch": 1268} {"train_loss": -40.443756103515625, "global_step": 153431, "epoch": 1268} {"train_loss": -40.47315979003906, "global_step": 153432, "epoch": 1268} {"train_loss": -40.58573913574219, "global_step": 153433, "epoch": 1268} {"train_loss": -40.67417526245117, "global_step": 153434, "epoch": 1268} {"train_loss": -40.943355560302734, "global_step": 153435, "epoch": 1268} {"train_loss": -40.52727508544922, "global_step": 153436, "epoch": 1268} {"train_loss": -41.062477111816406, "global_step": 153437, "epoch": 1268} {"train_loss": -41.2751579284668, "global_step": 153438, "epoch": 1268} {"train_loss": -41.586334228515625, "global_step": 153439, "epoch": 1268} {"train_loss": -40.835731506347656, "global_step": 153440, "epoch": 1268} {"train_loss": -41.01272201538086, "global_step": 153441, "epoch": 1268} {"train_loss": -40.70609664916992, "global_step": 153442, "epoch": 1268} {"train_loss": -40.99832534790039, "global_step": 153443, "epoch": 1268} {"train_loss": -40.636260986328125, "global_step": 153444, "epoch": 1268} {"train_loss": -40.28255081176758, "global_step": 153445, "epoch": 1268} {"train_loss": -40.75517654418945, "global_step": 153446, "epoch": 1268} {"train_loss": -39.675655364990234, "global_step": 153447, "epoch": 1268} {"train_loss": -40.64551544189453, "global_step": 153448, "epoch": 1268} {"train_loss": -40.34599685668945, "global_step": 153449, "epoch": 1268} {"train_loss": -41.21079635620117, "global_step": 153450, "epoch": 1268} {"train_loss": -40.37998962402344, "global_step": 153451, "epoch": 1268} {"train_loss": -41.287200927734375, "global_step": 153452, "epoch": 1268} {"train_loss": -40.683895111083984, "global_step": 153453, "epoch": 1268} {"train_loss": -40.088829040527344, "global_step": 153454, "epoch": 1268} {"train_loss": -40.4058952331543, "global_step": 153455, "epoch": 1268} {"train_loss": -38.25165557861328, "global_step": 153456, "epoch": 1268} {"train_loss": -38.40543746948242, "global_step": 153457, "epoch": 1268} {"train_loss": -39.245540618896484, "global_step": 153458, "epoch": 1268} {"train_loss": -38.8426628112793, "global_step": 153459, "epoch": 1268} {"train_loss": -34.56783676147461, "global_step": 153460, "epoch": 1268} {"train_loss": -37.34370040893555, "global_step": 153461, "epoch": 1268} {"train_loss": -32.83903121948242, "global_step": 153462, "epoch": 1268} {"train_loss": -27.969345092773438, "global_step": 153463, "epoch": 1268} {"train_loss": -35.29627227783203, "global_step": 153464, "epoch": 1268} {"train_loss": -38.35224914550781, "global_step": 153465, "epoch": 1268} {"train_loss": -35.540748596191406, "global_step": 153466, "epoch": 1268} {"train_loss": -36.52094650268555, "global_step": 153467, "epoch": 1268} {"train_loss": -34.03001403808594, "global_step": 153468, "epoch": 1268} {"train_loss": -36.477542877197266, "global_step": 153469, "epoch": 1268} {"train_loss": -36.800514221191406, "global_step": 153470, "epoch": 1268} {"train_loss": -34.830055236816406, "global_step": 153471, "epoch": 1268} {"train_loss": -32.77350997924805, "global_step": 153472, "epoch": 1268} {"train_loss": -37.10879135131836, "global_step": 153473, "epoch": 1268} {"train_loss": -36.22692108154297, "global_step": 153474, "epoch": 1268} {"train_loss": -33.81918716430664, "global_step": 153475, "epoch": 1268} {"train_loss": -39.0679931640625, "global_step": 153476, "epoch": 1268} {"train_loss": -34.36758041381836, "global_step": 153477, "epoch": 1268} {"train_loss": -36.92560958862305, "global_step": 153478, "epoch": 1268} {"train_loss": -37.90370559692383, "global_step": 153479, "epoch": 1268} {"train_loss": -36.35162353515625, "global_step": 153480, "epoch": 1268} {"train_loss": -39.00056838989258, "global_step": 153481, "epoch": 1268} {"train_loss": -37.81403732299805, "global_step": 153482, "epoch": 1268} {"train_loss": -38.60352325439453, "global_step": 153483, "epoch": 1268} {"train_loss": -36.803199768066406, "global_step": 153484, "epoch": 1268} {"train_loss": -38.26644515991211, "global_step": 153485, "epoch": 1268} {"train_loss": -37.2454833984375, "global_step": 153486, "epoch": 1268} {"train_loss": -38.9277458190918, "global_step": 153487, "epoch": 1268} {"train_loss": -38.3657341003418, "global_step": 153488, "epoch": 1268} {"train_loss": -39.460975646972656, "global_step": 153489, "epoch": 1268} {"train_loss": -37.414363861083984, "global_step": 153490, "epoch": 1268} {"train_loss": -38.84502410888672, "global_step": 153491, "epoch": 1268} {"train_loss": -39.58821487426758, "global_step": 153492, "epoch": 1268} {"train_loss": -39.078590393066406, "global_step": 153493, "epoch": 1268} {"train_loss": -38.87664794921875, "global_step": 153494, "epoch": 1268} {"train_loss": -38.60892105102539, "global_step": 153495, "epoch": 1268} {"train_loss": -38.87208557128906, "global_step": 153496, "epoch": 1268} {"train_loss": -39.347320556640625, "global_step": 153497, "epoch": 1268} {"train_loss": -39.391380310058594, "global_step": 153498, "epoch": 1268} {"train_loss": -39.78242111206055, "global_step": 153499, "epoch": 1268} {"train_loss": -39.15681838989258, "global_step": 153500, "epoch": 1268} {"train_loss": -39.618896484375, "global_step": 153501, "epoch": 1268} {"train_loss": -38.9691047668457, "global_step": 153502, "epoch": 1268} {"train_loss": -39.82536697387695, "global_step": 153503, "epoch": 1268} {"train_loss": -38.64698028564453, "global_step": 153504, "epoch": 1268} {"train_loss": -39.662635803222656, "global_step": 153505, "epoch": 1268} {"train_loss": -40.4085807800293, "global_step": 153506, "epoch": 1268} {"train_loss": -39.176082611083984, "global_step": 153507, "epoch": 1268} {"train_loss": -40.23948287963867, "global_step": 153508, "epoch": 1268} {"train_loss": -39.70685958862305, "global_step": 153509, "epoch": 1268} {"train_loss": -40.0105094909668, "global_step": 153510, "epoch": 1268} {"train_loss": -39.2518310546875, "global_step": 153511, "epoch": 1268} {"train_loss": -39.9510498046875, "global_step": 153512, "epoch": 1268} {"train_loss": -40.093414306640625, "global_step": 153513, "epoch": 1268} {"train_loss": -39.56769561767578, "global_step": 153514, "epoch": 1268} {"train_loss": -40.302242279052734, "global_step": 153515, "epoch": 1268} {"train_loss": -40.065608978271484, "global_step": 153516, "epoch": 1268} {"train_loss": -40.379737854003906, "global_step": 153517, "epoch": 1268} {"train_loss": -40.50391387939453, "global_step": 153518, "epoch": 1268} {"train_loss": -40.377044677734375, "global_step": 153519, "epoch": 1268} {"train_loss": -40.353485107421875, "global_step": 153520, "epoch": 1268} {"train_loss": -40.17377853393555, "global_step": 153521, "epoch": 1268} {"train_loss": -40.16752624511719, "global_step": 153522, "epoch": 1268} {"train_loss": -41.04655075073242, "global_step": 153523, "epoch": 1268} {"train_loss": -40.31711196899414, "global_step": 153524, "epoch": 1268} {"train_loss": -40.6842155456543, "global_step": 153525, "epoch": 1268} {"train_loss": -40.56843185424805, "global_step": 153526, "epoch": 1268} {"train_loss": -40.52910232543945, "global_step": 153527, "epoch": 1268} {"train_loss": -40.88920211791992, "global_step": 153528, "epoch": 1268} {"train_loss": -40.940975189208984, "global_step": 153529, "epoch": 1268} {"train_loss": -39.41888427734375, "global_step": 153530, "epoch": 1268} {"train_loss": -40.676937103271484, "global_step": 153531, "epoch": 1268} {"train_loss": -40.53450012207031, "global_step": 153532, "epoch": 1268} {"train_loss": -40.61626052856445, "global_step": 153533, "epoch": 1268} {"train_loss": -38.670379638671875, "global_step": 153534, "epoch": 1268} {"train_loss": -40.9072151184082, "global_step": 153535, "epoch": 1268} {"train_loss": -40.98778533935547, "global_step": 153536, "epoch": 1268} {"train_loss": -40.72239303588867, "global_step": 153537, "epoch": 1268} {"train_loss": -40.64600372314453, "global_step": 153538, "epoch": 1268} {"train_loss": -40.92695999145508, "global_step": 153539, "epoch": 1268} {"train_loss": -40.375030517578125, "global_step": 153540, "epoch": 1268} {"train_loss": -40.95244216918945, "global_step": 153541, "epoch": 1268} {"train_loss": -40.61606979370117, "global_step": 153542, "epoch": 1268} {"train_loss": -40.885807037353516, "global_step": 153543, "epoch": 1268} {"train_loss": -41.3841667175293, "global_step": 153544, "epoch": 1268} {"train_loss": -40.84675216674805, "global_step": 153545, "epoch": 1268} {"train_loss": -40.873321533203125, "global_step": 153546, "epoch": 1268} {"train_loss": -41.15269088745117, "global_step": 153547, "epoch": 1268} {"train_loss": -39.240470035017026, "global_step": 153548, "epoch": 1268, "val_loss": 2727340.5} {"train_loss": -40.38541793823242, "global_step": 153549, "epoch": 1269} {"train_loss": -41.031288146972656, "global_step": 153550, "epoch": 1269} {"train_loss": -41.08578109741211, "global_step": 153551, "epoch": 1269} {"train_loss": -41.41933059692383, "global_step": 153552, "epoch": 1269} {"train_loss": -40.859928131103516, "global_step": 153553, "epoch": 1269} {"train_loss": -41.420406341552734, "global_step": 153554, "epoch": 1269} {"train_loss": -41.5385856628418, "global_step": 153555, "epoch": 1269} {"train_loss": -41.545387268066406, "global_step": 153556, "epoch": 1269} {"train_loss": -40.93196487426758, "global_step": 153557, "epoch": 1269} {"train_loss": -41.487728118896484, "global_step": 153558, "epoch": 1269} {"train_loss": -41.84254837036133, "global_step": 153559, "epoch": 1269} {"train_loss": -40.95999526977539, "global_step": 153560, "epoch": 1269} {"train_loss": -41.64802932739258, "global_step": 153561, "epoch": 1269} {"train_loss": -41.4796142578125, "global_step": 153562, "epoch": 1269} {"train_loss": -39.8017692565918, "global_step": 153563, "epoch": 1269} {"train_loss": -41.110862731933594, "global_step": 153564, "epoch": 1269} {"train_loss": -41.62771224975586, "global_step": 153565, "epoch": 1269} {"train_loss": -40.37102508544922, "global_step": 153566, "epoch": 1269} {"train_loss": -41.126983642578125, "global_step": 153567, "epoch": 1269} {"train_loss": -41.64069747924805, "global_step": 153568, "epoch": 1269} {"train_loss": -41.62418746948242, "global_step": 153569, "epoch": 1269} {"train_loss": -41.06008529663086, "global_step": 153570, "epoch": 1269} {"train_loss": -41.42991256713867, "global_step": 153571, "epoch": 1269} {"train_loss": -41.44955062866211, "global_step": 153572, "epoch": 1269} {"train_loss": -41.28194046020508, "global_step": 153573, "epoch": 1269} {"train_loss": -39.6922492980957, "global_step": 153574, "epoch": 1269} {"train_loss": -41.13691329956055, "global_step": 153575, "epoch": 1269} {"train_loss": -38.867401123046875, "global_step": 153576, "epoch": 1269} {"train_loss": -41.35409164428711, "global_step": 153577, "epoch": 1269} {"train_loss": -41.742408752441406, "global_step": 153578, "epoch": 1269} {"train_loss": -41.25332260131836, "global_step": 153579, "epoch": 1269} {"train_loss": -41.15678405761719, "global_step": 153580, "epoch": 1269} {"train_loss": -41.26483917236328, "global_step": 153581, "epoch": 1269} {"train_loss": -40.67528533935547, "global_step": 153582, "epoch": 1269} {"train_loss": -40.19326400756836, "global_step": 153583, "epoch": 1269} {"train_loss": -39.84503173828125, "global_step": 153584, "epoch": 1269} {"train_loss": -38.86488723754883, "global_step": 153585, "epoch": 1269} {"train_loss": -35.75399398803711, "global_step": 153586, "epoch": 1269} {"train_loss": -33.6894645690918, "global_step": 153587, "epoch": 1269} {"train_loss": -29.813018798828125, "global_step": 153588, "epoch": 1269} {"train_loss": -34.86296463012695, "global_step": 153589, "epoch": 1269} {"train_loss": -40.39054489135742, "global_step": 153590, "epoch": 1269} {"train_loss": -36.51591110229492, "global_step": 153591, "epoch": 1269} {"train_loss": -38.429622650146484, "global_step": 153592, "epoch": 1269} {"train_loss": -40.6051139831543, "global_step": 153593, "epoch": 1269} {"train_loss": -38.50605392456055, "global_step": 153594, "epoch": 1269} {"train_loss": -39.13595199584961, "global_step": 153595, "epoch": 1269} {"train_loss": -40.427616119384766, "global_step": 153596, "epoch": 1269} {"train_loss": -39.39492416381836, "global_step": 153597, "epoch": 1269} {"train_loss": -40.809043884277344, "global_step": 153598, "epoch": 1269} {"train_loss": -40.33930969238281, "global_step": 153599, "epoch": 1269} {"train_loss": -40.555171966552734, "global_step": 153600, "epoch": 1269} {"train_loss": -39.3638916015625, "global_step": 153601, "epoch": 1269} {"train_loss": -40.42733383178711, "global_step": 153602, "epoch": 1269} {"train_loss": -40.18153381347656, "global_step": 153603, "epoch": 1269} {"train_loss": -40.411834716796875, "global_step": 153604, "epoch": 1269} {"train_loss": -38.54794692993164, "global_step": 153605, "epoch": 1269} {"train_loss": -40.55214309692383, "global_step": 153606, "epoch": 1269} {"train_loss": -40.82283401489258, "global_step": 153607, "epoch": 1269} {"train_loss": -40.17753982543945, "global_step": 153608, "epoch": 1269} {"train_loss": -40.77677536010742, "global_step": 153609, "epoch": 1269} {"train_loss": -40.894073486328125, "global_step": 153610, "epoch": 1269} {"train_loss": -40.56342697143555, "global_step": 153611, "epoch": 1269} {"train_loss": -40.45571517944336, "global_step": 153612, "epoch": 1269} {"train_loss": -40.100257873535156, "global_step": 153613, "epoch": 1269} {"train_loss": -40.9603157043457, "global_step": 153614, "epoch": 1269} {"train_loss": -39.785160064697266, "global_step": 153615, "epoch": 1269} {"train_loss": -40.26640319824219, "global_step": 153616, "epoch": 1269} {"train_loss": -40.95241165161133, "global_step": 153617, "epoch": 1269} {"train_loss": -41.072669982910156, "global_step": 153618, "epoch": 1269} {"train_loss": -40.15970993041992, "global_step": 153619, "epoch": 1269} {"train_loss": -40.38444137573242, "global_step": 153620, "epoch": 1269} {"train_loss": -39.961421966552734, "global_step": 153621, "epoch": 1269} {"train_loss": -40.954833984375, "global_step": 153622, "epoch": 1269} {"train_loss": -39.91996765136719, "global_step": 153623, "epoch": 1269} {"train_loss": -40.57151412963867, "global_step": 153624, "epoch": 1269} {"train_loss": -40.44233322143555, "global_step": 153625, "epoch": 1269} {"train_loss": -40.44424819946289, "global_step": 153626, "epoch": 1269} {"train_loss": -40.41597366333008, "global_step": 153627, "epoch": 1269} {"train_loss": -40.68421173095703, "global_step": 153628, "epoch": 1269} {"train_loss": -40.532962799072266, "global_step": 153629, "epoch": 1269} {"train_loss": -40.19770050048828, "global_step": 153630, "epoch": 1269} {"train_loss": -40.562862396240234, "global_step": 153631, "epoch": 1269} {"train_loss": -40.044715881347656, "global_step": 153632, "epoch": 1269} {"train_loss": -39.44391632080078, "global_step": 153633, "epoch": 1269} {"train_loss": -39.58200454711914, "global_step": 153634, "epoch": 1269} {"train_loss": -40.31256866455078, "global_step": 153635, "epoch": 1269} {"train_loss": -40.57854080200195, "global_step": 153636, "epoch": 1269} {"train_loss": -40.63425827026367, "global_step": 153637, "epoch": 1269} {"train_loss": -39.70490264892578, "global_step": 153638, "epoch": 1269} {"train_loss": -38.74821090698242, "global_step": 153639, "epoch": 1269} {"train_loss": -39.19648361206055, "global_step": 153640, "epoch": 1269} {"train_loss": -38.6795539855957, "global_step": 153641, "epoch": 1269} {"train_loss": -40.51141357421875, "global_step": 153642, "epoch": 1269} {"train_loss": -38.910091400146484, "global_step": 153643, "epoch": 1269} {"train_loss": -39.55828857421875, "global_step": 153644, "epoch": 1269} {"train_loss": -38.941707611083984, "global_step": 153645, "epoch": 1269} {"train_loss": -39.23592758178711, "global_step": 153646, "epoch": 1269} {"train_loss": -40.725433349609375, "global_step": 153647, "epoch": 1269} {"train_loss": -40.592220306396484, "global_step": 153648, "epoch": 1269} {"train_loss": -40.08209991455078, "global_step": 153649, "epoch": 1269} {"train_loss": -40.16931915283203, "global_step": 153650, "epoch": 1269} {"train_loss": -40.26716613769531, "global_step": 153651, "epoch": 1269} {"train_loss": -39.513607025146484, "global_step": 153652, "epoch": 1269} {"train_loss": -39.5643196105957, "global_step": 153653, "epoch": 1269} {"train_loss": -40.49031448364258, "global_step": 153654, "epoch": 1269} {"train_loss": -39.58488464355469, "global_step": 153655, "epoch": 1269} {"train_loss": -39.76681137084961, "global_step": 153656, "epoch": 1269} {"train_loss": -39.115478515625, "global_step": 153657, "epoch": 1269} {"train_loss": -39.37022018432617, "global_step": 153658, "epoch": 1269} {"train_loss": -39.311309814453125, "global_step": 153659, "epoch": 1269} {"train_loss": -40.08642578125, "global_step": 153660, "epoch": 1269} {"train_loss": -40.5751953125, "global_step": 153661, "epoch": 1269} {"train_loss": -40.39020919799805, "global_step": 153662, "epoch": 1269} {"train_loss": -40.62675857543945, "global_step": 153663, "epoch": 1269} {"train_loss": -40.5165901184082, "global_step": 153664, "epoch": 1269} {"train_loss": -40.44447326660156, "global_step": 153665, "epoch": 1269} {"train_loss": -40.997867584228516, "global_step": 153666, "epoch": 1269} {"train_loss": -40.560333251953125, "global_step": 153667, "epoch": 1269} {"train_loss": -39.89683151245117, "global_step": 153668, "epoch": 1269} {"train_loss": -40.12199162254649, "global_step": 153669, "epoch": 1269, "val_loss": 2658797.75} {"train_loss": -41.128719329833984, "global_step": 153670, "epoch": 1270} {"train_loss": -40.8198127746582, "global_step": 153671, "epoch": 1270} {"train_loss": -40.13430404663086, "global_step": 153672, "epoch": 1270} {"train_loss": -40.96099853515625, "global_step": 153673, "epoch": 1270} {"train_loss": -40.933162689208984, "global_step": 153674, "epoch": 1270} {"train_loss": -39.90877914428711, "global_step": 153675, "epoch": 1270} {"train_loss": -39.834991455078125, "global_step": 153676, "epoch": 1270} {"train_loss": -38.63570785522461, "global_step": 153677, "epoch": 1270} {"train_loss": -40.28219985961914, "global_step": 153678, "epoch": 1270} {"train_loss": -40.90972900390625, "global_step": 153679, "epoch": 1270} {"train_loss": -40.69569778442383, "global_step": 153680, "epoch": 1270} {"train_loss": -40.59458923339844, "global_step": 153681, "epoch": 1270} {"train_loss": -39.55770492553711, "global_step": 153682, "epoch": 1270} {"train_loss": -39.81443405151367, "global_step": 153683, "epoch": 1270} {"train_loss": -40.17486572265625, "global_step": 153684, "epoch": 1270} {"train_loss": -41.06564712524414, "global_step": 153685, "epoch": 1270} {"train_loss": -39.59748458862305, "global_step": 153686, "epoch": 1270} {"train_loss": -39.7711296081543, "global_step": 153687, "epoch": 1270} {"train_loss": -38.93975830078125, "global_step": 153688, "epoch": 1270} {"train_loss": -36.724979400634766, "global_step": 153689, "epoch": 1270} {"train_loss": -38.603248596191406, "global_step": 153690, "epoch": 1270} {"train_loss": -40.013301849365234, "global_step": 153691, "epoch": 1270} {"train_loss": -38.671627044677734, "global_step": 153692, "epoch": 1270} {"train_loss": -39.33894729614258, "global_step": 153693, "epoch": 1270} {"train_loss": -38.68520736694336, "global_step": 153694, "epoch": 1270} {"train_loss": -38.891841888427734, "global_step": 153695, "epoch": 1270} {"train_loss": -39.858760833740234, "global_step": 153696, "epoch": 1270} {"train_loss": -38.80489730834961, "global_step": 153697, "epoch": 1270} {"train_loss": -34.77641296386719, "global_step": 153698, "epoch": 1270} {"train_loss": -36.2801399230957, "global_step": 153699, "epoch": 1270} {"train_loss": -38.9023323059082, "global_step": 153700, "epoch": 1270} {"train_loss": -37.97031784057617, "global_step": 153701, "epoch": 1270} {"train_loss": -38.69328689575195, "global_step": 153702, "epoch": 1270} {"train_loss": -37.7644157409668, "global_step": 153703, "epoch": 1270} {"train_loss": -40.29610061645508, "global_step": 153704, "epoch": 1270} {"train_loss": -40.19716262817383, "global_step": 153705, "epoch": 1270} {"train_loss": -40.16714096069336, "global_step": 153706, "epoch": 1270} {"train_loss": -38.72658157348633, "global_step": 153707, "epoch": 1270} {"train_loss": -37.1162223815918, "global_step": 153708, "epoch": 1270} {"train_loss": -39.04585647583008, "global_step": 153709, "epoch": 1270} {"train_loss": -40.059059143066406, "global_step": 153710, "epoch": 1270} {"train_loss": -38.542999267578125, "global_step": 153711, "epoch": 1270} {"train_loss": -35.01017761230469, "global_step": 153712, "epoch": 1270} {"train_loss": -37.29192352294922, "global_step": 153713, "epoch": 1270} {"train_loss": -37.88867950439453, "global_step": 153714, "epoch": 1270} {"train_loss": -37.72990036010742, "global_step": 153715, "epoch": 1270} {"train_loss": -30.57025718688965, "global_step": 153716, "epoch": 1270} {"train_loss": -36.98707962036133, "global_step": 153717, "epoch": 1270} {"train_loss": -37.08363342285156, "global_step": 153718, "epoch": 1270} {"train_loss": -37.54041290283203, "global_step": 153719, "epoch": 1270} {"train_loss": -37.70577621459961, "global_step": 153720, "epoch": 1270} {"train_loss": -38.7241325378418, "global_step": 153721, "epoch": 1270} {"train_loss": -38.753875732421875, "global_step": 153722, "epoch": 1270} {"train_loss": -39.169525146484375, "global_step": 153723, "epoch": 1270} {"train_loss": -39.25533676147461, "global_step": 153724, "epoch": 1270} {"train_loss": -37.800758361816406, "global_step": 153725, "epoch": 1270} {"train_loss": -39.04592514038086, "global_step": 153726, "epoch": 1270} {"train_loss": -34.68007278442383, "global_step": 153727, "epoch": 1270} {"train_loss": -36.84938430786133, "global_step": 153728, "epoch": 1270} {"train_loss": -37.43319320678711, "global_step": 153729, "epoch": 1270} {"train_loss": -36.68825149536133, "global_step": 153730, "epoch": 1270} {"train_loss": -39.306068420410156, "global_step": 153731, "epoch": 1270} {"train_loss": -39.92107009887695, "global_step": 153732, "epoch": 1270} {"train_loss": -37.89038848876953, "global_step": 153733, "epoch": 1270} {"train_loss": -39.75535202026367, "global_step": 153734, "epoch": 1270} {"train_loss": -38.99962615966797, "global_step": 153735, "epoch": 1270} {"train_loss": -37.85763168334961, "global_step": 153736, "epoch": 1270} {"train_loss": -39.325782775878906, "global_step": 153737, "epoch": 1270} {"train_loss": -39.185909271240234, "global_step": 153738, "epoch": 1270} {"train_loss": -39.5574951171875, "global_step": 153739, "epoch": 1270} {"train_loss": -38.6114616394043, "global_step": 153740, "epoch": 1270} {"train_loss": -36.74638748168945, "global_step": 153741, "epoch": 1270} {"train_loss": -37.74909591674805, "global_step": 153742, "epoch": 1270} {"train_loss": -38.96065902709961, "global_step": 153743, "epoch": 1270} {"train_loss": -39.27534484863281, "global_step": 153744, "epoch": 1270} {"train_loss": -38.754085540771484, "global_step": 153745, "epoch": 1270} {"train_loss": -38.5283088684082, "global_step": 153746, "epoch": 1270} {"train_loss": -39.176456451416016, "global_step": 153747, "epoch": 1270} {"train_loss": -38.28445053100586, "global_step": 153748, "epoch": 1270} {"train_loss": -39.74140167236328, "global_step": 153749, "epoch": 1270} {"train_loss": -40.02664566040039, "global_step": 153750, "epoch": 1270} {"train_loss": -39.92705535888672, "global_step": 153751, "epoch": 1270} {"train_loss": -39.271507263183594, "global_step": 153752, "epoch": 1270} {"train_loss": -38.94224548339844, "global_step": 153753, "epoch": 1270} {"train_loss": -39.63676834106445, "global_step": 153754, "epoch": 1270} {"train_loss": -37.448829650878906, "global_step": 153755, "epoch": 1270} {"train_loss": -39.63680648803711, "global_step": 153756, "epoch": 1270} {"train_loss": -38.856475830078125, "global_step": 153757, "epoch": 1270} {"train_loss": -38.99042510986328, "global_step": 153758, "epoch": 1270} {"train_loss": -38.913265228271484, "global_step": 153759, "epoch": 1270} {"train_loss": -39.79253005981445, "global_step": 153760, "epoch": 1270} {"train_loss": -39.331024169921875, "global_step": 153761, "epoch": 1270} {"train_loss": -40.1899528503418, "global_step": 153762, "epoch": 1270} {"train_loss": -39.772762298583984, "global_step": 153763, "epoch": 1270} {"train_loss": -40.41007614135742, "global_step": 153764, "epoch": 1270} {"train_loss": -40.25833511352539, "global_step": 153765, "epoch": 1270} {"train_loss": -39.2133674621582, "global_step": 153766, "epoch": 1270} {"train_loss": -40.047218322753906, "global_step": 153767, "epoch": 1270} {"train_loss": -39.99351501464844, "global_step": 153768, "epoch": 1270} {"train_loss": -40.06165313720703, "global_step": 153769, "epoch": 1270} {"train_loss": -40.464210510253906, "global_step": 153770, "epoch": 1270} {"train_loss": -40.52384567260742, "global_step": 153771, "epoch": 1270} {"train_loss": -40.04608917236328, "global_step": 153772, "epoch": 1270} {"train_loss": -40.85411071777344, "global_step": 153773, "epoch": 1270} {"train_loss": -40.13753890991211, "global_step": 153774, "epoch": 1270} {"train_loss": -40.42564010620117, "global_step": 153775, "epoch": 1270} {"train_loss": -40.76456832885742, "global_step": 153776, "epoch": 1270} {"train_loss": -39.0692253112793, "global_step": 153777, "epoch": 1270} {"train_loss": -40.730587005615234, "global_step": 153778, "epoch": 1270} {"train_loss": -40.81997299194336, "global_step": 153779, "epoch": 1270} {"train_loss": -39.463661193847656, "global_step": 153780, "epoch": 1270} {"train_loss": -40.15188217163086, "global_step": 153781, "epoch": 1270} {"train_loss": -40.35013961791992, "global_step": 153782, "epoch": 1270} {"train_loss": -40.65229034423828, "global_step": 153783, "epoch": 1270} {"train_loss": -40.67808151245117, "global_step": 153784, "epoch": 1270} {"train_loss": -40.2844123840332, "global_step": 153785, "epoch": 1270} {"train_loss": -40.73487854003906, "global_step": 153786, "epoch": 1270} {"train_loss": -40.76909637451172, "global_step": 153787, "epoch": 1270} {"train_loss": -41.214263916015625, "global_step": 153788, "epoch": 1270} {"train_loss": -41.00733184814453, "global_step": 153789, "epoch": 1270} {"train_loss": -39.14573639483491, "global_step": 153790, "epoch": 1270, "val_loss": 2595272.25} {"train_loss": -40.94277572631836, "global_step": 153791, "epoch": 1271} {"train_loss": -39.962013244628906, "global_step": 153792, "epoch": 1271} {"train_loss": -41.12923812866211, "global_step": 153793, "epoch": 1271} {"train_loss": -40.88508224487305, "global_step": 153794, "epoch": 1271} {"train_loss": -40.446624755859375, "global_step": 153795, "epoch": 1271} {"train_loss": -40.40745162963867, "global_step": 153796, "epoch": 1271} {"train_loss": -41.45719528198242, "global_step": 153797, "epoch": 1271} {"train_loss": -40.40924835205078, "global_step": 153798, "epoch": 1271} {"train_loss": -40.6639404296875, "global_step": 153799, "epoch": 1271} {"train_loss": -41.2625846862793, "global_step": 153800, "epoch": 1271} {"train_loss": -40.59282684326172, "global_step": 153801, "epoch": 1271} {"train_loss": -41.23333740234375, "global_step": 153802, "epoch": 1271} {"train_loss": -41.0849609375, "global_step": 153803, "epoch": 1271} {"train_loss": -41.27872848510742, "global_step": 153804, "epoch": 1271} {"train_loss": -41.20232391357422, "global_step": 153805, "epoch": 1271} {"train_loss": -41.241554260253906, "global_step": 153806, "epoch": 1271} {"train_loss": -41.23490524291992, "global_step": 153807, "epoch": 1271} {"train_loss": -41.5015983581543, "global_step": 153808, "epoch": 1271} {"train_loss": -41.030311584472656, "global_step": 153809, "epoch": 1271} {"train_loss": -41.35543441772461, "global_step": 153810, "epoch": 1271} {"train_loss": -40.24396514892578, "global_step": 153811, "epoch": 1271} {"train_loss": -40.98588943481445, "global_step": 153812, "epoch": 1271} {"train_loss": -41.55366897583008, "global_step": 153813, "epoch": 1271} {"train_loss": -40.28036117553711, "global_step": 153814, "epoch": 1271} {"train_loss": -40.52539825439453, "global_step": 153815, "epoch": 1271} {"train_loss": -40.55351257324219, "global_step": 153816, "epoch": 1271} {"train_loss": -39.78725051879883, "global_step": 153817, "epoch": 1271} {"train_loss": -38.04305648803711, "global_step": 153818, "epoch": 1271} {"train_loss": -33.83679962158203, "global_step": 153819, "epoch": 1271} {"train_loss": -21.6630916595459, "global_step": 153820, "epoch": 1271} {"train_loss": -16.629261016845703, "global_step": 153821, "epoch": 1271} {"train_loss": -32.75223922729492, "global_step": 153822, "epoch": 1271} {"train_loss": -39.26854705810547, "global_step": 153823, "epoch": 1271} {"train_loss": -33.03628158569336, "global_step": 153824, "epoch": 1271} {"train_loss": -37.48933029174805, "global_step": 153825, "epoch": 1271} {"train_loss": -38.83476257324219, "global_step": 153826, "epoch": 1271} {"train_loss": -37.31303024291992, "global_step": 153827, "epoch": 1271} {"train_loss": -39.198307037353516, "global_step": 153828, "epoch": 1271} {"train_loss": -35.91004180908203, "global_step": 153829, "epoch": 1271} {"train_loss": -38.863746643066406, "global_step": 153830, "epoch": 1271} {"train_loss": -39.196285247802734, "global_step": 153831, "epoch": 1271} {"train_loss": -37.65681076049805, "global_step": 153832, "epoch": 1271} {"train_loss": -38.566280364990234, "global_step": 153833, "epoch": 1271} {"train_loss": -39.191768646240234, "global_step": 153834, "epoch": 1271} {"train_loss": -37.100502014160156, "global_step": 153835, "epoch": 1271} {"train_loss": -39.486488342285156, "global_step": 153836, "epoch": 1271} {"train_loss": -38.00518798828125, "global_step": 153837, "epoch": 1271} {"train_loss": -39.07832336425781, "global_step": 153838, "epoch": 1271} {"train_loss": -38.30158233642578, "global_step": 153839, "epoch": 1271} {"train_loss": -40.10600662231445, "global_step": 153840, "epoch": 1271} {"train_loss": -38.25347137451172, "global_step": 153841, "epoch": 1271} {"train_loss": -39.16219711303711, "global_step": 153842, "epoch": 1271} {"train_loss": -39.841426849365234, "global_step": 153843, "epoch": 1271} {"train_loss": -38.93857955932617, "global_step": 153844, "epoch": 1271} {"train_loss": -39.49055862426758, "global_step": 153845, "epoch": 1271} {"train_loss": -39.173519134521484, "global_step": 153846, "epoch": 1271} {"train_loss": -39.38256072998047, "global_step": 153847, "epoch": 1271} {"train_loss": -35.48262405395508, "global_step": 153848, "epoch": 1271} {"train_loss": -36.84381103515625, "global_step": 153849, "epoch": 1271} {"train_loss": -37.19829559326172, "global_step": 153850, "epoch": 1271} {"train_loss": -38.89579391479492, "global_step": 153851, "epoch": 1271} {"train_loss": -38.87818145751953, "global_step": 153852, "epoch": 1271} {"train_loss": -39.2154655456543, "global_step": 153853, "epoch": 1271} {"train_loss": -38.732357025146484, "global_step": 153854, "epoch": 1271} {"train_loss": -36.7740592956543, "global_step": 153855, "epoch": 1271} {"train_loss": -36.33081817626953, "global_step": 153856, "epoch": 1271} {"train_loss": -38.522823333740234, "global_step": 153857, "epoch": 1271} {"train_loss": -39.90375900268555, "global_step": 153858, "epoch": 1271} {"train_loss": -37.0497932434082, "global_step": 153859, "epoch": 1271} {"train_loss": -39.2114372253418, "global_step": 153860, "epoch": 1271} {"train_loss": -38.50258255004883, "global_step": 153861, "epoch": 1271} {"train_loss": -38.74626159667969, "global_step": 153862, "epoch": 1271} {"train_loss": -39.61605453491211, "global_step": 153863, "epoch": 1271} {"train_loss": -39.292884826660156, "global_step": 153864, "epoch": 1271} {"train_loss": -35.76234817504883, "global_step": 153865, "epoch": 1271} {"train_loss": -39.00250244140625, "global_step": 153866, "epoch": 1271} {"train_loss": -39.43052291870117, "global_step": 153867, "epoch": 1271} {"train_loss": -37.3192024230957, "global_step": 153868, "epoch": 1271} {"train_loss": -36.0263671875, "global_step": 153869, "epoch": 1271} {"train_loss": -38.39516830444336, "global_step": 153870, "epoch": 1271} {"train_loss": -38.87392807006836, "global_step": 153871, "epoch": 1271} {"train_loss": -38.22524642944336, "global_step": 153872, "epoch": 1271} {"train_loss": -39.235286712646484, "global_step": 153873, "epoch": 1271} {"train_loss": -38.778812408447266, "global_step": 153874, "epoch": 1271} {"train_loss": -39.524051666259766, "global_step": 153875, "epoch": 1271} {"train_loss": -38.48702621459961, "global_step": 153876, "epoch": 1271} {"train_loss": -38.35604476928711, "global_step": 153877, "epoch": 1271} {"train_loss": -39.5120735168457, "global_step": 153878, "epoch": 1271} {"train_loss": -40.06633377075195, "global_step": 153879, "epoch": 1271} {"train_loss": -39.08921432495117, "global_step": 153880, "epoch": 1271} {"train_loss": -38.82883834838867, "global_step": 153881, "epoch": 1271} {"train_loss": -39.5804443359375, "global_step": 153882, "epoch": 1271} {"train_loss": -37.80849838256836, "global_step": 153883, "epoch": 1271} {"train_loss": -39.797821044921875, "global_step": 153884, "epoch": 1271} {"train_loss": -39.977378845214844, "global_step": 153885, "epoch": 1271} {"train_loss": -38.756710052490234, "global_step": 153886, "epoch": 1271} {"train_loss": -39.814144134521484, "global_step": 153887, "epoch": 1271} {"train_loss": -40.035762786865234, "global_step": 153888, "epoch": 1271} {"train_loss": -39.099632263183594, "global_step": 153889, "epoch": 1271} {"train_loss": -39.81428146362305, "global_step": 153890, "epoch": 1271} {"train_loss": -39.688385009765625, "global_step": 153891, "epoch": 1271} {"train_loss": -39.21962356567383, "global_step": 153892, "epoch": 1271} {"train_loss": -39.2628173828125, "global_step": 153893, "epoch": 1271} {"train_loss": -40.563140869140625, "global_step": 153894, "epoch": 1271} {"train_loss": -39.75422286987305, "global_step": 153895, "epoch": 1271} {"train_loss": -39.92450714111328, "global_step": 153896, "epoch": 1271} {"train_loss": -39.18355941772461, "global_step": 153897, "epoch": 1271} {"train_loss": -38.50123977661133, "global_step": 153898, "epoch": 1271} {"train_loss": -38.740108489990234, "global_step": 153899, "epoch": 1271} {"train_loss": -40.40572738647461, "global_step": 153900, "epoch": 1271} {"train_loss": -40.2016487121582, "global_step": 153901, "epoch": 1271} {"train_loss": -40.30218505859375, "global_step": 153902, "epoch": 1271} {"train_loss": -39.40226364135742, "global_step": 153903, "epoch": 1271} {"train_loss": -39.94126510620117, "global_step": 153904, "epoch": 1271} {"train_loss": -38.85081100463867, "global_step": 153905, "epoch": 1271} {"train_loss": -39.94193649291992, "global_step": 153906, "epoch": 1271} {"train_loss": -40.0047492980957, "global_step": 153907, "epoch": 1271} {"train_loss": -38.42875289916992, "global_step": 153908, "epoch": 1271} {"train_loss": -40.3063850402832, "global_step": 153909, "epoch": 1271} {"train_loss": -39.56845474243164, "global_step": 153910, "epoch": 1271} {"train_loss": -38.82290994628402, "global_step": 153911, "epoch": 1271, "val_loss": 2638753.0} {"train_loss": -40.43301010131836, "global_step": 153912, "epoch": 1272} {"train_loss": -39.282440185546875, "global_step": 153913, "epoch": 1272} {"train_loss": -39.961727142333984, "global_step": 153914, "epoch": 1272} {"train_loss": -40.73334884643555, "global_step": 153915, "epoch": 1272} {"train_loss": -39.49864959716797, "global_step": 153916, "epoch": 1272} {"train_loss": -40.327972412109375, "global_step": 153917, "epoch": 1272} {"train_loss": -40.42234420776367, "global_step": 153918, "epoch": 1272} {"train_loss": -38.488380432128906, "global_step": 153919, "epoch": 1272} {"train_loss": -39.83698654174805, "global_step": 153920, "epoch": 1272} {"train_loss": -39.86418914794922, "global_step": 153921, "epoch": 1272} {"train_loss": -40.245948791503906, "global_step": 153922, "epoch": 1272} {"train_loss": -40.77067565917969, "global_step": 153923, "epoch": 1272} {"train_loss": -40.79189682006836, "global_step": 153924, "epoch": 1272} {"train_loss": -40.716949462890625, "global_step": 153925, "epoch": 1272} {"train_loss": -40.59171676635742, "global_step": 153926, "epoch": 1272} {"train_loss": -37.42446517944336, "global_step": 153927, "epoch": 1272} {"train_loss": -40.75055694580078, "global_step": 153928, "epoch": 1272} {"train_loss": -37.99542236328125, "global_step": 153929, "epoch": 1272} {"train_loss": -40.81006622314453, "global_step": 153930, "epoch": 1272} {"train_loss": -40.38529586791992, "global_step": 153931, "epoch": 1272} {"train_loss": -41.032527923583984, "global_step": 153932, "epoch": 1272} {"train_loss": -34.98015594482422, "global_step": 153933, "epoch": 1272} {"train_loss": -40.00556564331055, "global_step": 153934, "epoch": 1272} {"train_loss": -40.30460739135742, "global_step": 153935, "epoch": 1272} {"train_loss": -34.38041687011719, "global_step": 153936, "epoch": 1272} {"train_loss": -38.99066162109375, "global_step": 153937, "epoch": 1272} {"train_loss": -39.4150505065918, "global_step": 153938, "epoch": 1272} {"train_loss": -39.165992736816406, "global_step": 153939, "epoch": 1272} {"train_loss": -39.24470138549805, "global_step": 153940, "epoch": 1272} {"train_loss": -40.9440803527832, "global_step": 153941, "epoch": 1272} {"train_loss": -32.27009201049805, "global_step": 153942, "epoch": 1272} {"train_loss": -39.7652702331543, "global_step": 153943, "epoch": 1272} {"train_loss": -36.898433685302734, "global_step": 153944, "epoch": 1272} {"train_loss": -40.019954681396484, "global_step": 153945, "epoch": 1272} {"train_loss": -39.8382682800293, "global_step": 153946, "epoch": 1272} {"train_loss": -39.23221969604492, "global_step": 153947, "epoch": 1272} {"train_loss": -39.86216354370117, "global_step": 153948, "epoch": 1272} {"train_loss": -38.724491119384766, "global_step": 153949, "epoch": 1272} {"train_loss": -38.664466857910156, "global_step": 153950, "epoch": 1272} {"train_loss": -39.516357421875, "global_step": 153951, "epoch": 1272} {"train_loss": -39.68478012084961, "global_step": 153952, "epoch": 1272} {"train_loss": -39.33014678955078, "global_step": 153953, "epoch": 1272} {"train_loss": -38.282073974609375, "global_step": 153954, "epoch": 1272} {"train_loss": -37.55534362792969, "global_step": 153955, "epoch": 1272} {"train_loss": -35.09766387939453, "global_step": 153956, "epoch": 1272} {"train_loss": -37.59818649291992, "global_step": 153957, "epoch": 1272} {"train_loss": -37.355342864990234, "global_step": 153958, "epoch": 1272} {"train_loss": -37.98098373413086, "global_step": 153959, "epoch": 1272} {"train_loss": -38.31016159057617, "global_step": 153960, "epoch": 1272} {"train_loss": -39.88409423828125, "global_step": 153961, "epoch": 1272} {"train_loss": -35.645259857177734, "global_step": 153962, "epoch": 1272} {"train_loss": -38.085060119628906, "global_step": 153963, "epoch": 1272} {"train_loss": -38.60880661010742, "global_step": 153964, "epoch": 1272} {"train_loss": -38.07733917236328, "global_step": 153965, "epoch": 1272} {"train_loss": -38.4320182800293, "global_step": 153966, "epoch": 1272} {"train_loss": -39.27877426147461, "global_step": 153967, "epoch": 1272} {"train_loss": -39.119197845458984, "global_step": 153968, "epoch": 1272} {"train_loss": -38.03095245361328, "global_step": 153969, "epoch": 1272} {"train_loss": -39.66616439819336, "global_step": 153970, "epoch": 1272} {"train_loss": -40.00645065307617, "global_step": 153971, "epoch": 1272} {"train_loss": -39.90336227416992, "global_step": 153972, "epoch": 1272} {"train_loss": -37.68703842163086, "global_step": 153973, "epoch": 1272} {"train_loss": -39.22842025756836, "global_step": 153974, "epoch": 1272} {"train_loss": -39.992855072021484, "global_step": 153975, "epoch": 1272} {"train_loss": -39.48040771484375, "global_step": 153976, "epoch": 1272} {"train_loss": -39.381385803222656, "global_step": 153977, "epoch": 1272} {"train_loss": -40.03530502319336, "global_step": 153978, "epoch": 1272} {"train_loss": -39.62627029418945, "global_step": 153979, "epoch": 1272} {"train_loss": -38.80256652832031, "global_step": 153980, "epoch": 1272} {"train_loss": -39.96240997314453, "global_step": 153981, "epoch": 1272} {"train_loss": -39.213966369628906, "global_step": 153982, "epoch": 1272} {"train_loss": -39.06294631958008, "global_step": 153983, "epoch": 1272} {"train_loss": -40.429298400878906, "global_step": 153984, "epoch": 1272} {"train_loss": -39.5557746887207, "global_step": 153985, "epoch": 1272} {"train_loss": -37.27547073364258, "global_step": 153986, "epoch": 1272} {"train_loss": -38.967437744140625, "global_step": 153987, "epoch": 1272} {"train_loss": -40.14746856689453, "global_step": 153988, "epoch": 1272} {"train_loss": -38.015438079833984, "global_step": 153989, "epoch": 1272} {"train_loss": -39.70977783203125, "global_step": 153990, "epoch": 1272} {"train_loss": -40.750003814697266, "global_step": 153991, "epoch": 1272} {"train_loss": -39.357398986816406, "global_step": 153992, "epoch": 1272} {"train_loss": -39.7594108581543, "global_step": 153993, "epoch": 1272} {"train_loss": -40.16958236694336, "global_step": 153994, "epoch": 1272} {"train_loss": -39.3895263671875, "global_step": 153995, "epoch": 1272} {"train_loss": -39.43526077270508, "global_step": 153996, "epoch": 1272} {"train_loss": -40.27760696411133, "global_step": 153997, "epoch": 1272} {"train_loss": -39.75032043457031, "global_step": 153998, "epoch": 1272} {"train_loss": -40.69577407836914, "global_step": 153999, "epoch": 1272} {"train_loss": -40.123592376708984, "global_step": 154000, "epoch": 1272} {"train_loss": -40.51304244995117, "global_step": 154001, "epoch": 1272} {"train_loss": -39.72150802612305, "global_step": 154002, "epoch": 1272} {"train_loss": -40.104156494140625, "global_step": 154003, "epoch": 1272} {"train_loss": -40.219703674316406, "global_step": 154004, "epoch": 1272} {"train_loss": -39.6478385925293, "global_step": 154005, "epoch": 1272} {"train_loss": -40.20505142211914, "global_step": 154006, "epoch": 1272} {"train_loss": -40.39462661743164, "global_step": 154007, "epoch": 1272} {"train_loss": -39.97800827026367, "global_step": 154008, "epoch": 1272} {"train_loss": -39.005157470703125, "global_step": 154009, "epoch": 1272} {"train_loss": -40.28484344482422, "global_step": 154010, "epoch": 1272} {"train_loss": -38.553524017333984, "global_step": 154011, "epoch": 1272} {"train_loss": -39.54255294799805, "global_step": 154012, "epoch": 1272} {"train_loss": -38.719600677490234, "global_step": 154013, "epoch": 1272} {"train_loss": -40.31942367553711, "global_step": 154014, "epoch": 1272} {"train_loss": -39.1896858215332, "global_step": 154015, "epoch": 1272} {"train_loss": -38.07987594604492, "global_step": 154016, "epoch": 1272} {"train_loss": -39.77218246459961, "global_step": 154017, "epoch": 1272} {"train_loss": -38.83136749267578, "global_step": 154018, "epoch": 1272} {"train_loss": -40.02394485473633, "global_step": 154019, "epoch": 1272} {"train_loss": -38.50589370727539, "global_step": 154020, "epoch": 1272} {"train_loss": -38.72004318237305, "global_step": 154021, "epoch": 1272} {"train_loss": -38.33827590942383, "global_step": 154022, "epoch": 1272} {"train_loss": -37.59121322631836, "global_step": 154023, "epoch": 1272} {"train_loss": -38.459312438964844, "global_step": 154024, "epoch": 1272} {"train_loss": -40.531768798828125, "global_step": 154025, "epoch": 1272} {"train_loss": -35.8958625793457, "global_step": 154026, "epoch": 1272} {"train_loss": -34.39433288574219, "global_step": 154027, "epoch": 1272} {"train_loss": -36.77949142456055, "global_step": 154028, "epoch": 1272} {"train_loss": -39.12933349609375, "global_step": 154029, "epoch": 1272} {"train_loss": -36.09103012084961, "global_step": 154030, "epoch": 1272} {"train_loss": -33.999305725097656, "global_step": 154031, "epoch": 1272} {"train_loss": -39.05957813105307, "global_step": 154032, "epoch": 1272, "val_loss": 2654203.0} {"train_loss": -36.884437561035156, "global_step": 154033, "epoch": 1273} {"train_loss": -35.42085647583008, "global_step": 154034, "epoch": 1273} {"train_loss": -39.64590072631836, "global_step": 154035, "epoch": 1273} {"train_loss": -36.59831619262695, "global_step": 154036, "epoch": 1273} {"train_loss": -37.33838653564453, "global_step": 154037, "epoch": 1273} {"train_loss": -38.66172409057617, "global_step": 154038, "epoch": 1273} {"train_loss": -37.03254318237305, "global_step": 154039, "epoch": 1273} {"train_loss": -39.12067413330078, "global_step": 154040, "epoch": 1273} {"train_loss": -36.9430046081543, "global_step": 154041, "epoch": 1273} {"train_loss": -39.589263916015625, "global_step": 154042, "epoch": 1273} {"train_loss": -38.5500602722168, "global_step": 154043, "epoch": 1273} {"train_loss": -38.895442962646484, "global_step": 154044, "epoch": 1273} {"train_loss": -38.43925857543945, "global_step": 154045, "epoch": 1273} {"train_loss": -39.72356033325195, "global_step": 154046, "epoch": 1273} {"train_loss": -38.9974479675293, "global_step": 154047, "epoch": 1273} {"train_loss": -38.781829833984375, "global_step": 154048, "epoch": 1273} {"train_loss": -39.09893798828125, "global_step": 154049, "epoch": 1273} {"train_loss": -38.952571868896484, "global_step": 154050, "epoch": 1273} {"train_loss": -40.464019775390625, "global_step": 154051, "epoch": 1273} {"train_loss": -39.73919677734375, "global_step": 154052, "epoch": 1273} {"train_loss": -40.295284271240234, "global_step": 154053, "epoch": 1273} {"train_loss": -40.190773010253906, "global_step": 154054, "epoch": 1273} {"train_loss": -39.89907455444336, "global_step": 154055, "epoch": 1273} {"train_loss": -40.570777893066406, "global_step": 154056, "epoch": 1273} {"train_loss": -39.06766891479492, "global_step": 154057, "epoch": 1273} {"train_loss": -40.124515533447266, "global_step": 154058, "epoch": 1273} {"train_loss": -39.7880744934082, "global_step": 154059, "epoch": 1273} {"train_loss": -39.752662658691406, "global_step": 154060, "epoch": 1273} {"train_loss": -39.90948486328125, "global_step": 154061, "epoch": 1273} {"train_loss": -40.31511306762695, "global_step": 154062, "epoch": 1273} {"train_loss": -40.11204147338867, "global_step": 154063, "epoch": 1273} {"train_loss": -38.26504898071289, "global_step": 154064, "epoch": 1273} {"train_loss": -40.482852935791016, "global_step": 154065, "epoch": 1273} {"train_loss": -40.534423828125, "global_step": 154066, "epoch": 1273} {"train_loss": -40.53150177001953, "global_step": 154067, "epoch": 1273} {"train_loss": -40.395442962646484, "global_step": 154068, "epoch": 1273} {"train_loss": -39.487403869628906, "global_step": 154069, "epoch": 1273} {"train_loss": -40.17621994018555, "global_step": 154070, "epoch": 1273} {"train_loss": -41.100067138671875, "global_step": 154071, "epoch": 1273} {"train_loss": -40.96336364746094, "global_step": 154072, "epoch": 1273} {"train_loss": -40.788421630859375, "global_step": 154073, "epoch": 1273} {"train_loss": -40.3973503112793, "global_step": 154074, "epoch": 1273} {"train_loss": -40.35663604736328, "global_step": 154075, "epoch": 1273} {"train_loss": -40.6313362121582, "global_step": 154076, "epoch": 1273} {"train_loss": -40.7839469909668, "global_step": 154077, "epoch": 1273} {"train_loss": -40.29789352416992, "global_step": 154078, "epoch": 1273} {"train_loss": -39.3502197265625, "global_step": 154079, "epoch": 1273} {"train_loss": -39.626976013183594, "global_step": 154080, "epoch": 1273} {"train_loss": -41.13515090942383, "global_step": 154081, "epoch": 1273} {"train_loss": -40.97738265991211, "global_step": 154082, "epoch": 1273} {"train_loss": -40.56260299682617, "global_step": 154083, "epoch": 1273} {"train_loss": -40.18292999267578, "global_step": 154084, "epoch": 1273} {"train_loss": -41.29039001464844, "global_step": 154085, "epoch": 1273} {"train_loss": -40.392433166503906, "global_step": 154086, "epoch": 1273} {"train_loss": -41.114994049072266, "global_step": 154087, "epoch": 1273} {"train_loss": -40.970703125, "global_step": 154088, "epoch": 1273} {"train_loss": -40.97928237915039, "global_step": 154089, "epoch": 1273} {"train_loss": -41.13776397705078, "global_step": 154090, "epoch": 1273} {"train_loss": -41.21783447265625, "global_step": 154091, "epoch": 1273} {"train_loss": -41.18141555786133, "global_step": 154092, "epoch": 1273} {"train_loss": -40.6739501953125, "global_step": 154093, "epoch": 1273} {"train_loss": -40.91648483276367, "global_step": 154094, "epoch": 1273} {"train_loss": -40.40342712402344, "global_step": 154095, "epoch": 1273} {"train_loss": -41.45354080200195, "global_step": 154096, "epoch": 1273} {"train_loss": -41.23097610473633, "global_step": 154097, "epoch": 1273} {"train_loss": -41.19875717163086, "global_step": 154098, "epoch": 1273} {"train_loss": -41.12592315673828, "global_step": 154099, "epoch": 1273} {"train_loss": -40.211151123046875, "global_step": 154100, "epoch": 1273} {"train_loss": -41.031097412109375, "global_step": 154101, "epoch": 1273} {"train_loss": -40.9593391418457, "global_step": 154102, "epoch": 1273} {"train_loss": -40.70765686035156, "global_step": 154103, "epoch": 1273} {"train_loss": -38.802955627441406, "global_step": 154104, "epoch": 1273} {"train_loss": -39.325130462646484, "global_step": 154105, "epoch": 1273} {"train_loss": -38.008583068847656, "global_step": 154106, "epoch": 1273} {"train_loss": -36.41508865356445, "global_step": 154107, "epoch": 1273} {"train_loss": -30.292566299438477, "global_step": 154108, "epoch": 1273} {"train_loss": -17.91342544555664, "global_step": 154109, "epoch": 1273} {"train_loss": -19.006357192993164, "global_step": 154110, "epoch": 1273} {"train_loss": -36.07268142700195, "global_step": 154111, "epoch": 1273} {"train_loss": -31.538135528564453, "global_step": 154112, "epoch": 1273} {"train_loss": -28.381174087524414, "global_step": 154113, "epoch": 1273} {"train_loss": -38.69863510131836, "global_step": 154114, "epoch": 1273} {"train_loss": -34.65804672241211, "global_step": 154115, "epoch": 1273} {"train_loss": -36.77059555053711, "global_step": 154116, "epoch": 1273} {"train_loss": -36.2720947265625, "global_step": 154117, "epoch": 1273} {"train_loss": -38.15003204345703, "global_step": 154118, "epoch": 1273} {"train_loss": -36.47723388671875, "global_step": 154119, "epoch": 1273} {"train_loss": -38.36714553833008, "global_step": 154120, "epoch": 1273} {"train_loss": -38.17576217651367, "global_step": 154121, "epoch": 1273} {"train_loss": -38.326148986816406, "global_step": 154122, "epoch": 1273} {"train_loss": -39.994789123535156, "global_step": 154123, "epoch": 1273} {"train_loss": -35.90668869018555, "global_step": 154124, "epoch": 1273} {"train_loss": -39.61375045776367, "global_step": 154125, "epoch": 1273} {"train_loss": -39.26224136352539, "global_step": 154126, "epoch": 1273} {"train_loss": -39.53609085083008, "global_step": 154127, "epoch": 1273} {"train_loss": -38.800453186035156, "global_step": 154128, "epoch": 1273} {"train_loss": -39.45831298828125, "global_step": 154129, "epoch": 1273} {"train_loss": -39.4062614440918, "global_step": 154130, "epoch": 1273} {"train_loss": -39.343505859375, "global_step": 154131, "epoch": 1273} {"train_loss": -39.768367767333984, "global_step": 154132, "epoch": 1273} {"train_loss": -39.53260803222656, "global_step": 154133, "epoch": 1273} {"train_loss": -39.995361328125, "global_step": 154134, "epoch": 1273} {"train_loss": -40.052547454833984, "global_step": 154135, "epoch": 1273} {"train_loss": -39.54756164550781, "global_step": 154136, "epoch": 1273} {"train_loss": -39.56576156616211, "global_step": 154137, "epoch": 1273} {"train_loss": -40.520076751708984, "global_step": 154138, "epoch": 1273} {"train_loss": -39.26633834838867, "global_step": 154139, "epoch": 1273} {"train_loss": -40.10810852050781, "global_step": 154140, "epoch": 1273} {"train_loss": -39.765960693359375, "global_step": 154141, "epoch": 1273} {"train_loss": -39.55983352661133, "global_step": 154142, "epoch": 1273} {"train_loss": -40.18667221069336, "global_step": 154143, "epoch": 1273} {"train_loss": -39.64385223388672, "global_step": 154144, "epoch": 1273} {"train_loss": -40.142333984375, "global_step": 154145, "epoch": 1273} {"train_loss": -40.712196350097656, "global_step": 154146, "epoch": 1273} {"train_loss": -40.095252990722656, "global_step": 154147, "epoch": 1273} {"train_loss": -40.452728271484375, "global_step": 154148, "epoch": 1273} {"train_loss": -39.60203170776367, "global_step": 154149, "epoch": 1273} {"train_loss": -40.388607025146484, "global_step": 154150, "epoch": 1273} {"train_loss": -40.56525421142578, "global_step": 154151, "epoch": 1273} {"train_loss": -40.225799560546875, "global_step": 154152, "epoch": 1273} {"train_loss": -38.98625660730787, "global_step": 154153, "epoch": 1273, "val_loss": 2712621.75} {"train_loss": -40.66347885131836, "global_step": 154154, "epoch": 1274} {"train_loss": -40.869205474853516, "global_step": 154155, "epoch": 1274} {"train_loss": -40.58812713623047, "global_step": 154156, "epoch": 1274} {"train_loss": -40.62565994262695, "global_step": 154157, "epoch": 1274} {"train_loss": -41.18037033081055, "global_step": 154158, "epoch": 1274} {"train_loss": -40.97001266479492, "global_step": 154159, "epoch": 1274} {"train_loss": -40.9072265625, "global_step": 154160, "epoch": 1274} {"train_loss": -40.78126907348633, "global_step": 154161, "epoch": 1274} {"train_loss": -41.094749450683594, "global_step": 154162, "epoch": 1274} {"train_loss": -40.19373321533203, "global_step": 154163, "epoch": 1274} {"train_loss": -41.29999923706055, "global_step": 154164, "epoch": 1274} {"train_loss": -41.038814544677734, "global_step": 154165, "epoch": 1274} {"train_loss": -41.10386276245117, "global_step": 154166, "epoch": 1274} {"train_loss": -40.79793930053711, "global_step": 154167, "epoch": 1274} {"train_loss": -41.08112716674805, "global_step": 154168, "epoch": 1274} {"train_loss": -40.82079315185547, "global_step": 154169, "epoch": 1274} {"train_loss": -41.03779220581055, "global_step": 154170, "epoch": 1274} {"train_loss": -41.00697708129883, "global_step": 154171, "epoch": 1274} {"train_loss": -40.565895080566406, "global_step": 154172, "epoch": 1274} {"train_loss": -40.983951568603516, "global_step": 154173, "epoch": 1274} {"train_loss": -41.19301986694336, "global_step": 154174, "epoch": 1274} {"train_loss": -40.929500579833984, "global_step": 154175, "epoch": 1274} {"train_loss": -40.910011291503906, "global_step": 154176, "epoch": 1274} {"train_loss": -40.99169158935547, "global_step": 154177, "epoch": 1274} {"train_loss": -41.033206939697266, "global_step": 154178, "epoch": 1274} {"train_loss": -40.996543884277344, "global_step": 154179, "epoch": 1274} {"train_loss": -41.474525451660156, "global_step": 154180, "epoch": 1274} {"train_loss": -40.90009689331055, "global_step": 154181, "epoch": 1274} {"train_loss": -41.01798629760742, "global_step": 154182, "epoch": 1274} {"train_loss": -41.2005729675293, "global_step": 154183, "epoch": 1274} {"train_loss": -41.17369079589844, "global_step": 154184, "epoch": 1274} {"train_loss": -40.89575958251953, "global_step": 154185, "epoch": 1274} {"train_loss": -41.597110748291016, "global_step": 154186, "epoch": 1274} {"train_loss": -40.925270080566406, "global_step": 154187, "epoch": 1274} {"train_loss": -41.35157775878906, "global_step": 154188, "epoch": 1274} {"train_loss": -41.1525993347168, "global_step": 154189, "epoch": 1274} {"train_loss": -41.28812789916992, "global_step": 154190, "epoch": 1274} {"train_loss": -41.44837188720703, "global_step": 154191, "epoch": 1274} {"train_loss": -40.3000373840332, "global_step": 154192, "epoch": 1274} {"train_loss": -41.842098236083984, "global_step": 154193, "epoch": 1274} {"train_loss": -41.162567138671875, "global_step": 154194, "epoch": 1274} {"train_loss": -41.33775329589844, "global_step": 154195, "epoch": 1274} {"train_loss": -41.26443099975586, "global_step": 154196, "epoch": 1274} {"train_loss": -41.573463439941406, "global_step": 154197, "epoch": 1274} {"train_loss": -40.66828536987305, "global_step": 154198, "epoch": 1274} {"train_loss": -41.34751892089844, "global_step": 154199, "epoch": 1274} {"train_loss": -40.87274932861328, "global_step": 154200, "epoch": 1274} {"train_loss": -41.102447509765625, "global_step": 154201, "epoch": 1274} {"train_loss": -40.66129684448242, "global_step": 154202, "epoch": 1274} {"train_loss": -41.439109802246094, "global_step": 154203, "epoch": 1274} {"train_loss": -41.058162689208984, "global_step": 154204, "epoch": 1274} {"train_loss": -40.81081771850586, "global_step": 154205, "epoch": 1274} {"train_loss": -41.29118728637695, "global_step": 154206, "epoch": 1274} {"train_loss": -41.157020568847656, "global_step": 154207, "epoch": 1274} {"train_loss": -41.40596008300781, "global_step": 154208, "epoch": 1274} {"train_loss": -40.643157958984375, "global_step": 154209, "epoch": 1274} {"train_loss": -40.00497055053711, "global_step": 154210, "epoch": 1274} {"train_loss": -40.42584228515625, "global_step": 154211, "epoch": 1274} {"train_loss": -40.8289909362793, "global_step": 154212, "epoch": 1274} {"train_loss": -41.12467575073242, "global_step": 154213, "epoch": 1274} {"train_loss": -40.077735900878906, "global_step": 154214, "epoch": 1274} {"train_loss": -37.3082275390625, "global_step": 154215, "epoch": 1274} {"train_loss": -38.54830551147461, "global_step": 154216, "epoch": 1274} {"train_loss": -37.646888732910156, "global_step": 154217, "epoch": 1274} {"train_loss": -39.12667465209961, "global_step": 154218, "epoch": 1274} {"train_loss": -38.63975143432617, "global_step": 154219, "epoch": 1274} {"train_loss": -38.365882873535156, "global_step": 154220, "epoch": 1274} {"train_loss": -39.894840240478516, "global_step": 154221, "epoch": 1274} {"train_loss": -39.43042755126953, "global_step": 154222, "epoch": 1274} {"train_loss": -37.93506622314453, "global_step": 154223, "epoch": 1274} {"train_loss": -37.48649215698242, "global_step": 154224, "epoch": 1274} {"train_loss": -39.3179817199707, "global_step": 154225, "epoch": 1274} {"train_loss": -32.17509460449219, "global_step": 154226, "epoch": 1274} {"train_loss": -38.92750549316406, "global_step": 154227, "epoch": 1274} {"train_loss": -39.665157318115234, "global_step": 154228, "epoch": 1274} {"train_loss": -37.81568145751953, "global_step": 154229, "epoch": 1274} {"train_loss": -37.2363395690918, "global_step": 154230, "epoch": 1274} {"train_loss": -38.86909103393555, "global_step": 154231, "epoch": 1274} {"train_loss": -39.651824951171875, "global_step": 154232, "epoch": 1274} {"train_loss": -39.90418243408203, "global_step": 154233, "epoch": 1274} {"train_loss": -38.45970153808594, "global_step": 154234, "epoch": 1274} {"train_loss": -39.82075881958008, "global_step": 154235, "epoch": 1274} {"train_loss": -37.650001525878906, "global_step": 154236, "epoch": 1274} {"train_loss": -40.2083625793457, "global_step": 154237, "epoch": 1274} {"train_loss": -37.662933349609375, "global_step": 154238, "epoch": 1274} {"train_loss": -39.427574157714844, "global_step": 154239, "epoch": 1274} {"train_loss": -39.978790283203125, "global_step": 154240, "epoch": 1274} {"train_loss": -39.2109375, "global_step": 154241, "epoch": 1274} {"train_loss": -39.99405288696289, "global_step": 154242, "epoch": 1274} {"train_loss": -39.689083099365234, "global_step": 154243, "epoch": 1274} {"train_loss": -39.179264068603516, "global_step": 154244, "epoch": 1274} {"train_loss": -38.473175048828125, "global_step": 154245, "epoch": 1274} {"train_loss": -39.35634231567383, "global_step": 154246, "epoch": 1274} {"train_loss": -39.31370162963867, "global_step": 154247, "epoch": 1274} {"train_loss": -39.67759704589844, "global_step": 154248, "epoch": 1274} {"train_loss": -37.73114776611328, "global_step": 154249, "epoch": 1274} {"train_loss": -38.082881927490234, "global_step": 154250, "epoch": 1274} {"train_loss": -40.031829833984375, "global_step": 154251, "epoch": 1274} {"train_loss": -39.76823425292969, "global_step": 154252, "epoch": 1274} {"train_loss": -39.49116897583008, "global_step": 154253, "epoch": 1274} {"train_loss": -39.73860549926758, "global_step": 154254, "epoch": 1274} {"train_loss": -39.94193649291992, "global_step": 154255, "epoch": 1274} {"train_loss": -38.675106048583984, "global_step": 154256, "epoch": 1274} {"train_loss": -39.90751647949219, "global_step": 154257, "epoch": 1274} {"train_loss": -40.30510330200195, "global_step": 154258, "epoch": 1274} {"train_loss": -40.0847053527832, "global_step": 154259, "epoch": 1274} {"train_loss": -40.324790954589844, "global_step": 154260, "epoch": 1274} {"train_loss": -39.97776412963867, "global_step": 154261, "epoch": 1274} {"train_loss": -39.8056640625, "global_step": 154262, "epoch": 1274} {"train_loss": -38.73999786376953, "global_step": 154263, "epoch": 1274} {"train_loss": -39.680110931396484, "global_step": 154264, "epoch": 1274} {"train_loss": -40.100555419921875, "global_step": 154265, "epoch": 1274} {"train_loss": -40.10399627685547, "global_step": 154266, "epoch": 1274} {"train_loss": -38.767478942871094, "global_step": 154267, "epoch": 1274} {"train_loss": -39.923927307128906, "global_step": 154268, "epoch": 1274} {"train_loss": -39.50861358642578, "global_step": 154269, "epoch": 1274} {"train_loss": -39.518306732177734, "global_step": 154270, "epoch": 1274} {"train_loss": -39.54890441894531, "global_step": 154271, "epoch": 1274} {"train_loss": -39.139007568359375, "global_step": 154272, "epoch": 1274} {"train_loss": -39.222320556640625, "global_step": 154273, "epoch": 1274} {"train_loss": -40.036009607236245, "global_step": 154274, "epoch": 1274, "val_loss": 2755341.0} {"train_loss": -39.38041687011719, "global_step": 154275, "epoch": 1275} {"train_loss": -39.993629455566406, "global_step": 154276, "epoch": 1275} {"train_loss": -39.27659225463867, "global_step": 154277, "epoch": 1275} {"train_loss": -40.437252044677734, "global_step": 154278, "epoch": 1275} {"train_loss": -39.719966888427734, "global_step": 154279, "epoch": 1275} {"train_loss": -40.15102767944336, "global_step": 154280, "epoch": 1275} {"train_loss": -40.1564826965332, "global_step": 154281, "epoch": 1275} {"train_loss": -40.4303092956543, "global_step": 154282, "epoch": 1275} {"train_loss": -39.80324935913086, "global_step": 154283, "epoch": 1275} {"train_loss": -40.55753707885742, "global_step": 154284, "epoch": 1275} {"train_loss": -39.9714469909668, "global_step": 154285, "epoch": 1275} {"train_loss": -40.3135986328125, "global_step": 154286, "epoch": 1275} {"train_loss": -39.50222396850586, "global_step": 154287, "epoch": 1275} {"train_loss": -40.33011245727539, "global_step": 154288, "epoch": 1275} {"train_loss": -40.42661666870117, "global_step": 154289, "epoch": 1275} {"train_loss": -40.8087272644043, "global_step": 154290, "epoch": 1275} {"train_loss": -40.26577377319336, "global_step": 154291, "epoch": 1275} {"train_loss": -40.52302551269531, "global_step": 154292, "epoch": 1275} {"train_loss": -41.06576156616211, "global_step": 154293, "epoch": 1275} {"train_loss": -40.87615966796875, "global_step": 154294, "epoch": 1275} {"train_loss": -40.97314453125, "global_step": 154295, "epoch": 1275} {"train_loss": -40.90693283081055, "global_step": 154296, "epoch": 1275} {"train_loss": -40.18048095703125, "global_step": 154297, "epoch": 1275} {"train_loss": -40.28121566772461, "global_step": 154298, "epoch": 1275} {"train_loss": -41.152435302734375, "global_step": 154299, "epoch": 1275} {"train_loss": -40.3133659362793, "global_step": 154300, "epoch": 1275} {"train_loss": -40.5307502746582, "global_step": 154301, "epoch": 1275} {"train_loss": -41.143951416015625, "global_step": 154302, "epoch": 1275} {"train_loss": -40.463722229003906, "global_step": 154303, "epoch": 1275} {"train_loss": -40.724281311035156, "global_step": 154304, "epoch": 1275} {"train_loss": -40.55258560180664, "global_step": 154305, "epoch": 1275} {"train_loss": -40.94325256347656, "global_step": 154306, "epoch": 1275} {"train_loss": -40.778892517089844, "global_step": 154307, "epoch": 1275} {"train_loss": -40.1981086730957, "global_step": 154308, "epoch": 1275} {"train_loss": -40.91349411010742, "global_step": 154309, "epoch": 1275} {"train_loss": -38.90021514892578, "global_step": 154310, "epoch": 1275} {"train_loss": -40.458404541015625, "global_step": 154311, "epoch": 1275} {"train_loss": -40.32279586791992, "global_step": 154312, "epoch": 1275} {"train_loss": -41.43105697631836, "global_step": 154313, "epoch": 1275} {"train_loss": -38.770660400390625, "global_step": 154314, "epoch": 1275} {"train_loss": -39.16714859008789, "global_step": 154315, "epoch": 1275} {"train_loss": -40.41356658935547, "global_step": 154316, "epoch": 1275} {"train_loss": -40.30237579345703, "global_step": 154317, "epoch": 1275} {"train_loss": -40.2579460144043, "global_step": 154318, "epoch": 1275} {"train_loss": -35.2362174987793, "global_step": 154319, "epoch": 1275} {"train_loss": -39.71925735473633, "global_step": 154320, "epoch": 1275} {"train_loss": -41.1850700378418, "global_step": 154321, "epoch": 1275} {"train_loss": -39.48167419433594, "global_step": 154322, "epoch": 1275} {"train_loss": -39.11404037475586, "global_step": 154323, "epoch": 1275} {"train_loss": -40.73952102661133, "global_step": 154324, "epoch": 1275} {"train_loss": -40.47696304321289, "global_step": 154325, "epoch": 1275} {"train_loss": -40.1681022644043, "global_step": 154326, "epoch": 1275} {"train_loss": -41.19511795043945, "global_step": 154327, "epoch": 1275} {"train_loss": -40.61674880981445, "global_step": 154328, "epoch": 1275} {"train_loss": -40.434757232666016, "global_step": 154329, "epoch": 1275} {"train_loss": -40.570892333984375, "global_step": 154330, "epoch": 1275} {"train_loss": -41.2019157409668, "global_step": 154331, "epoch": 1275} {"train_loss": -38.731929779052734, "global_step": 154332, "epoch": 1275} {"train_loss": -40.54998779296875, "global_step": 154333, "epoch": 1275} {"train_loss": -40.90480422973633, "global_step": 154334, "epoch": 1275} {"train_loss": -40.38241195678711, "global_step": 154335, "epoch": 1275} {"train_loss": -40.884857177734375, "global_step": 154336, "epoch": 1275} {"train_loss": -40.20011520385742, "global_step": 154337, "epoch": 1275} {"train_loss": -40.76148223876953, "global_step": 154338, "epoch": 1275} {"train_loss": -40.74294662475586, "global_step": 154339, "epoch": 1275} {"train_loss": -40.896400451660156, "global_step": 154340, "epoch": 1275} {"train_loss": -40.43979263305664, "global_step": 154341, "epoch": 1275} {"train_loss": -38.784637451171875, "global_step": 154342, "epoch": 1275} {"train_loss": -41.09453582763672, "global_step": 154343, "epoch": 1275} {"train_loss": -36.87965774536133, "global_step": 154344, "epoch": 1275} {"train_loss": -38.019569396972656, "global_step": 154345, "epoch": 1275} {"train_loss": -37.48630905151367, "global_step": 154346, "epoch": 1275} {"train_loss": -39.994747161865234, "global_step": 154347, "epoch": 1275} {"train_loss": -39.25809860229492, "global_step": 154348, "epoch": 1275} {"train_loss": -39.455535888671875, "global_step": 154349, "epoch": 1275} {"train_loss": -34.162086486816406, "global_step": 154350, "epoch": 1275} {"train_loss": -39.38249969482422, "global_step": 154351, "epoch": 1275} {"train_loss": -40.419647216796875, "global_step": 154352, "epoch": 1275} {"train_loss": -40.0287971496582, "global_step": 154353, "epoch": 1275} {"train_loss": -38.42310333251953, "global_step": 154354, "epoch": 1275} {"train_loss": -40.201351165771484, "global_step": 154355, "epoch": 1275} {"train_loss": -39.811500549316406, "global_step": 154356, "epoch": 1275} {"train_loss": -38.987972259521484, "global_step": 154357, "epoch": 1275} {"train_loss": -39.48259353637695, "global_step": 154358, "epoch": 1275} {"train_loss": -39.734779357910156, "global_step": 154359, "epoch": 1275} {"train_loss": -39.37022018432617, "global_step": 154360, "epoch": 1275} {"train_loss": -39.256649017333984, "global_step": 154361, "epoch": 1275} {"train_loss": -37.295188903808594, "global_step": 154362, "epoch": 1275} {"train_loss": -39.88092803955078, "global_step": 154363, "epoch": 1275} {"train_loss": -38.19289016723633, "global_step": 154364, "epoch": 1275} {"train_loss": -40.36893081665039, "global_step": 154365, "epoch": 1275} {"train_loss": -38.41730499267578, "global_step": 154366, "epoch": 1275} {"train_loss": -39.17493438720703, "global_step": 154367, "epoch": 1275} {"train_loss": -40.196468353271484, "global_step": 154368, "epoch": 1275} {"train_loss": -40.601905822753906, "global_step": 154369, "epoch": 1275} {"train_loss": -36.408058166503906, "global_step": 154370, "epoch": 1275} {"train_loss": -37.83778762817383, "global_step": 154371, "epoch": 1275} {"train_loss": -39.064937591552734, "global_step": 154372, "epoch": 1275} {"train_loss": -37.80352020263672, "global_step": 154373, "epoch": 1275} {"train_loss": -37.63266372680664, "global_step": 154374, "epoch": 1275} {"train_loss": -40.02345657348633, "global_step": 154375, "epoch": 1275} {"train_loss": -39.42656326293945, "global_step": 154376, "epoch": 1275} {"train_loss": -39.45763397216797, "global_step": 154377, "epoch": 1275} {"train_loss": -40.14775466918945, "global_step": 154378, "epoch": 1275} {"train_loss": -39.990272521972656, "global_step": 154379, "epoch": 1275} {"train_loss": -35.2369499206543, "global_step": 154380, "epoch": 1275} {"train_loss": -39.55350875854492, "global_step": 154381, "epoch": 1275} {"train_loss": -40.74396514892578, "global_step": 154382, "epoch": 1275} {"train_loss": -40.11848068237305, "global_step": 154383, "epoch": 1275} {"train_loss": -39.10620880126953, "global_step": 154384, "epoch": 1275} {"train_loss": -38.599613189697266, "global_step": 154385, "epoch": 1275} {"train_loss": -40.499996185302734, "global_step": 154386, "epoch": 1275} {"train_loss": -39.88799285888672, "global_step": 154387, "epoch": 1275} {"train_loss": -39.850852966308594, "global_step": 154388, "epoch": 1275} {"train_loss": -40.16963577270508, "global_step": 154389, "epoch": 1275} {"train_loss": -39.93754577636719, "global_step": 154390, "epoch": 1275} {"train_loss": -39.33232498168945, "global_step": 154391, "epoch": 1275} {"train_loss": -40.42318344116211, "global_step": 154392, "epoch": 1275} {"train_loss": -36.66518783569336, "global_step": 154393, "epoch": 1275} {"train_loss": -40.036865234375, "global_step": 154394, "epoch": 1275} {"train_loss": -39.75313968500815, "global_step": 154395, "epoch": 1275, "val_loss": 2814549.75} {"train_loss": -40.442745208740234, "global_step": 154396, "epoch": 1276} {"train_loss": -37.936012268066406, "global_step": 154397, "epoch": 1276} {"train_loss": -40.23974609375, "global_step": 154398, "epoch": 1276} {"train_loss": -40.33756637573242, "global_step": 154399, "epoch": 1276} {"train_loss": -40.695640563964844, "global_step": 154400, "epoch": 1276} {"train_loss": -38.53079605102539, "global_step": 154401, "epoch": 1276} {"train_loss": -38.12028121948242, "global_step": 154402, "epoch": 1276} {"train_loss": -34.73366165161133, "global_step": 154403, "epoch": 1276} {"train_loss": -35.739280700683594, "global_step": 154404, "epoch": 1276} {"train_loss": -39.455318450927734, "global_step": 154405, "epoch": 1276} {"train_loss": -39.124794006347656, "global_step": 154406, "epoch": 1276} {"train_loss": -38.264923095703125, "global_step": 154407, "epoch": 1276} {"train_loss": -37.49506378173828, "global_step": 154408, "epoch": 1276} {"train_loss": -36.53985595703125, "global_step": 154409, "epoch": 1276} {"train_loss": -38.37898635864258, "global_step": 154410, "epoch": 1276} {"train_loss": -37.83634567260742, "global_step": 154411, "epoch": 1276} {"train_loss": -36.169227600097656, "global_step": 154412, "epoch": 1276} {"train_loss": -40.00129318237305, "global_step": 154413, "epoch": 1276} {"train_loss": -39.44219970703125, "global_step": 154414, "epoch": 1276} {"train_loss": -38.6259880065918, "global_step": 154415, "epoch": 1276} {"train_loss": -38.590736389160156, "global_step": 154416, "epoch": 1276} {"train_loss": -29.614614486694336, "global_step": 154417, "epoch": 1276} {"train_loss": -40.02236557006836, "global_step": 154418, "epoch": 1276} {"train_loss": -37.581939697265625, "global_step": 154419, "epoch": 1276} {"train_loss": -38.24421310424805, "global_step": 154420, "epoch": 1276} {"train_loss": -39.47718048095703, "global_step": 154421, "epoch": 1276} {"train_loss": -39.10230255126953, "global_step": 154422, "epoch": 1276} {"train_loss": -39.69608688354492, "global_step": 154423, "epoch": 1276} {"train_loss": -38.267372131347656, "global_step": 154424, "epoch": 1276} {"train_loss": -39.253170013427734, "global_step": 154425, "epoch": 1276} {"train_loss": -36.473812103271484, "global_step": 154426, "epoch": 1276} {"train_loss": -39.36711120605469, "global_step": 154427, "epoch": 1276} {"train_loss": -38.27859878540039, "global_step": 154428, "epoch": 1276} {"train_loss": -39.146263122558594, "global_step": 154429, "epoch": 1276} {"train_loss": -39.31298828125, "global_step": 154430, "epoch": 1276} {"train_loss": -39.199432373046875, "global_step": 154431, "epoch": 1276} {"train_loss": -38.95260238647461, "global_step": 154432, "epoch": 1276} {"train_loss": -38.91310501098633, "global_step": 154433, "epoch": 1276} {"train_loss": -40.20113754272461, "global_step": 154434, "epoch": 1276} {"train_loss": -39.55280685424805, "global_step": 154435, "epoch": 1276} {"train_loss": -39.31055450439453, "global_step": 154436, "epoch": 1276} {"train_loss": -39.67283248901367, "global_step": 154437, "epoch": 1276} {"train_loss": -39.58449935913086, "global_step": 154438, "epoch": 1276} {"train_loss": -38.23701095581055, "global_step": 154439, "epoch": 1276} {"train_loss": -40.22005844116211, "global_step": 154440, "epoch": 1276} {"train_loss": -35.95863723754883, "global_step": 154441, "epoch": 1276} {"train_loss": -40.4865837097168, "global_step": 154442, "epoch": 1276} {"train_loss": -37.38466262817383, "global_step": 154443, "epoch": 1276} {"train_loss": -40.34286117553711, "global_step": 154444, "epoch": 1276} {"train_loss": -38.775962829589844, "global_step": 154445, "epoch": 1276} {"train_loss": -39.31023025512695, "global_step": 154446, "epoch": 1276} {"train_loss": -38.29249572753906, "global_step": 154447, "epoch": 1276} {"train_loss": -38.84579849243164, "global_step": 154448, "epoch": 1276} {"train_loss": -39.13118362426758, "global_step": 154449, "epoch": 1276} {"train_loss": -37.78632354736328, "global_step": 154450, "epoch": 1276} {"train_loss": -38.73582458496094, "global_step": 154451, "epoch": 1276} {"train_loss": -39.273048400878906, "global_step": 154452, "epoch": 1276} {"train_loss": -39.59333419799805, "global_step": 154453, "epoch": 1276} {"train_loss": -38.573341369628906, "global_step": 154454, "epoch": 1276} {"train_loss": -39.06535720825195, "global_step": 154455, "epoch": 1276} {"train_loss": -37.10947036743164, "global_step": 154456, "epoch": 1276} {"train_loss": -39.6300048828125, "global_step": 154457, "epoch": 1276} {"train_loss": -38.52871322631836, "global_step": 154458, "epoch": 1276} {"train_loss": -38.08633041381836, "global_step": 154459, "epoch": 1276} {"train_loss": -40.2463493347168, "global_step": 154460, "epoch": 1276} {"train_loss": -39.00704574584961, "global_step": 154461, "epoch": 1276} {"train_loss": -39.5842170715332, "global_step": 154462, "epoch": 1276} {"train_loss": -39.758480072021484, "global_step": 154463, "epoch": 1276} {"train_loss": -40.47321701049805, "global_step": 154464, "epoch": 1276} {"train_loss": -39.8529167175293, "global_step": 154465, "epoch": 1276} {"train_loss": -40.47663497924805, "global_step": 154466, "epoch": 1276} {"train_loss": -40.39453125, "global_step": 154467, "epoch": 1276} {"train_loss": -38.08039093017578, "global_step": 154468, "epoch": 1276} {"train_loss": -39.7303466796875, "global_step": 154469, "epoch": 1276} {"train_loss": -39.92106628417969, "global_step": 154470, "epoch": 1276} {"train_loss": -40.38865661621094, "global_step": 154471, "epoch": 1276} {"train_loss": -38.15339660644531, "global_step": 154472, "epoch": 1276} {"train_loss": -38.30437088012695, "global_step": 154473, "epoch": 1276} {"train_loss": -39.48652267456055, "global_step": 154474, "epoch": 1276} {"train_loss": -39.636837005615234, "global_step": 154475, "epoch": 1276} {"train_loss": -39.66899108886719, "global_step": 154476, "epoch": 1276} {"train_loss": -38.18178176879883, "global_step": 154477, "epoch": 1276} {"train_loss": -40.158729553222656, "global_step": 154478, "epoch": 1276} {"train_loss": -38.33749771118164, "global_step": 154479, "epoch": 1276} {"train_loss": -39.21844482421875, "global_step": 154480, "epoch": 1276} {"train_loss": -39.409027099609375, "global_step": 154481, "epoch": 1276} {"train_loss": -39.77610397338867, "global_step": 154482, "epoch": 1276} {"train_loss": -39.47538757324219, "global_step": 154483, "epoch": 1276} {"train_loss": -39.294307708740234, "global_step": 154484, "epoch": 1276} {"train_loss": -39.53377914428711, "global_step": 154485, "epoch": 1276} {"train_loss": -40.15000534057617, "global_step": 154486, "epoch": 1276} {"train_loss": -39.4127197265625, "global_step": 154487, "epoch": 1276} {"train_loss": -40.246944427490234, "global_step": 154488, "epoch": 1276} {"train_loss": -39.74409866333008, "global_step": 154489, "epoch": 1276} {"train_loss": -40.64910125732422, "global_step": 154490, "epoch": 1276} {"train_loss": -39.43561935424805, "global_step": 154491, "epoch": 1276} {"train_loss": -39.472293853759766, "global_step": 154492, "epoch": 1276} {"train_loss": -38.13730239868164, "global_step": 154493, "epoch": 1276} {"train_loss": -40.124000549316406, "global_step": 154494, "epoch": 1276} {"train_loss": -38.846797943115234, "global_step": 154495, "epoch": 1276} {"train_loss": -39.94797897338867, "global_step": 154496, "epoch": 1276} {"train_loss": -39.75757598876953, "global_step": 154497, "epoch": 1276} {"train_loss": -39.87226104736328, "global_step": 154498, "epoch": 1276} {"train_loss": -40.4944953918457, "global_step": 154499, "epoch": 1276} {"train_loss": -40.07057571411133, "global_step": 154500, "epoch": 1276} {"train_loss": -38.930877685546875, "global_step": 154501, "epoch": 1276} {"train_loss": -39.62013626098633, "global_step": 154502, "epoch": 1276} {"train_loss": -39.93620681762695, "global_step": 154503, "epoch": 1276} {"train_loss": -39.344966888427734, "global_step": 154504, "epoch": 1276} {"train_loss": -40.56462860107422, "global_step": 154505, "epoch": 1276} {"train_loss": -40.80978012084961, "global_step": 154506, "epoch": 1276} {"train_loss": -40.59109115600586, "global_step": 154507, "epoch": 1276} {"train_loss": -39.32303237915039, "global_step": 154508, "epoch": 1276} {"train_loss": -39.97407150268555, "global_step": 154509, "epoch": 1276} {"train_loss": -40.708465576171875, "global_step": 154510, "epoch": 1276} {"train_loss": -40.48918914794922, "global_step": 154511, "epoch": 1276} {"train_loss": -40.274009704589844, "global_step": 154512, "epoch": 1276} {"train_loss": -39.416805267333984, "global_step": 154513, "epoch": 1276} {"train_loss": -39.994895935058594, "global_step": 154514, "epoch": 1276} {"train_loss": -40.925052642822266, "global_step": 154515, "epoch": 1276} {"train_loss": -39.12419297084335, "global_step": 154516, "epoch": 1276, "val_loss": 2660058.0} {"train_loss": -40.09342575073242, "global_step": 154517, "epoch": 1277} {"train_loss": -38.83710861206055, "global_step": 154518, "epoch": 1277} {"train_loss": -38.804683685302734, "global_step": 154519, "epoch": 1277} {"train_loss": -39.08143997192383, "global_step": 154520, "epoch": 1277} {"train_loss": -39.6103630065918, "global_step": 154521, "epoch": 1277} {"train_loss": -38.935035705566406, "global_step": 154522, "epoch": 1277} {"train_loss": -38.63719177246094, "global_step": 154523, "epoch": 1277} {"train_loss": -39.367530822753906, "global_step": 154524, "epoch": 1277} {"train_loss": -40.52524948120117, "global_step": 154525, "epoch": 1277} {"train_loss": -39.740291595458984, "global_step": 154526, "epoch": 1277} {"train_loss": -38.20366287231445, "global_step": 154527, "epoch": 1277} {"train_loss": -35.00312423706055, "global_step": 154528, "epoch": 1277} {"train_loss": -35.24493408203125, "global_step": 154529, "epoch": 1277} {"train_loss": -37.704124450683594, "global_step": 154530, "epoch": 1277} {"train_loss": -40.08790969848633, "global_step": 154531, "epoch": 1277} {"train_loss": -38.18221664428711, "global_step": 154532, "epoch": 1277} {"train_loss": -37.239295959472656, "global_step": 154533, "epoch": 1277} {"train_loss": -37.809505462646484, "global_step": 154534, "epoch": 1277} {"train_loss": -32.415462493896484, "global_step": 154535, "epoch": 1277} {"train_loss": -40.05884552001953, "global_step": 154536, "epoch": 1277} {"train_loss": -39.421119689941406, "global_step": 154537, "epoch": 1277} {"train_loss": -39.99203109741211, "global_step": 154538, "epoch": 1277} {"train_loss": -40.35173034667969, "global_step": 154539, "epoch": 1277} {"train_loss": -39.08386993408203, "global_step": 154540, "epoch": 1277} {"train_loss": -40.076934814453125, "global_step": 154541, "epoch": 1277} {"train_loss": -40.01605987548828, "global_step": 154542, "epoch": 1277} {"train_loss": -39.81415939331055, "global_step": 154543, "epoch": 1277} {"train_loss": -40.20109558105469, "global_step": 154544, "epoch": 1277} {"train_loss": -38.668800354003906, "global_step": 154545, "epoch": 1277} {"train_loss": -39.737545013427734, "global_step": 154546, "epoch": 1277} {"train_loss": -40.24656295776367, "global_step": 154547, "epoch": 1277} {"train_loss": -39.524810791015625, "global_step": 154548, "epoch": 1277} {"train_loss": -40.63613510131836, "global_step": 154549, "epoch": 1277} {"train_loss": -40.412899017333984, "global_step": 154550, "epoch": 1277} {"train_loss": -40.30241012573242, "global_step": 154551, "epoch": 1277} {"train_loss": -40.065032958984375, "global_step": 154552, "epoch": 1277} {"train_loss": -39.16229248046875, "global_step": 154553, "epoch": 1277} {"train_loss": -40.78373718261719, "global_step": 154554, "epoch": 1277} {"train_loss": -40.63405990600586, "global_step": 154555, "epoch": 1277} {"train_loss": -40.392696380615234, "global_step": 154556, "epoch": 1277} {"train_loss": -40.108272552490234, "global_step": 154557, "epoch": 1277} {"train_loss": -40.53567123413086, "global_step": 154558, "epoch": 1277} {"train_loss": -40.442420959472656, "global_step": 154559, "epoch": 1277} {"train_loss": -40.051490783691406, "global_step": 154560, "epoch": 1277} {"train_loss": -39.350101470947266, "global_step": 154561, "epoch": 1277} {"train_loss": -40.93207931518555, "global_step": 154562, "epoch": 1277} {"train_loss": -40.70803451538086, "global_step": 154563, "epoch": 1277} {"train_loss": -40.547210693359375, "global_step": 154564, "epoch": 1277} {"train_loss": -40.674560546875, "global_step": 154565, "epoch": 1277} {"train_loss": -38.538509368896484, "global_step": 154566, "epoch": 1277} {"train_loss": -40.53939437866211, "global_step": 154567, "epoch": 1277} {"train_loss": -40.42972946166992, "global_step": 154568, "epoch": 1277} {"train_loss": -40.654964447021484, "global_step": 154569, "epoch": 1277} {"train_loss": -40.3431282043457, "global_step": 154570, "epoch": 1277} {"train_loss": -41.12879180908203, "global_step": 154571, "epoch": 1277} {"train_loss": -40.5709228515625, "global_step": 154572, "epoch": 1277} {"train_loss": -41.09125900268555, "global_step": 154573, "epoch": 1277} {"train_loss": -40.39539337158203, "global_step": 154574, "epoch": 1277} {"train_loss": -41.057655334472656, "global_step": 154575, "epoch": 1277} {"train_loss": -41.030311584472656, "global_step": 154576, "epoch": 1277} {"train_loss": -39.64608383178711, "global_step": 154577, "epoch": 1277} {"train_loss": -40.9168586730957, "global_step": 154578, "epoch": 1277} {"train_loss": -40.11537551879883, "global_step": 154579, "epoch": 1277} {"train_loss": -41.00320053100586, "global_step": 154580, "epoch": 1277} {"train_loss": -40.48264694213867, "global_step": 154581, "epoch": 1277} {"train_loss": -41.01551055908203, "global_step": 154582, "epoch": 1277} {"train_loss": -40.939876556396484, "global_step": 154583, "epoch": 1277} {"train_loss": -40.176170349121094, "global_step": 154584, "epoch": 1277} {"train_loss": -40.99857711791992, "global_step": 154585, "epoch": 1277} {"train_loss": -39.80160140991211, "global_step": 154586, "epoch": 1277} {"train_loss": -40.81491470336914, "global_step": 154587, "epoch": 1277} {"train_loss": -40.580806732177734, "global_step": 154588, "epoch": 1277} {"train_loss": -40.64468002319336, "global_step": 154589, "epoch": 1277} {"train_loss": -40.6525764465332, "global_step": 154590, "epoch": 1277} {"train_loss": -40.756614685058594, "global_step": 154591, "epoch": 1277} {"train_loss": -40.96875762939453, "global_step": 154592, "epoch": 1277} {"train_loss": -40.69557571411133, "global_step": 154593, "epoch": 1277} {"train_loss": -40.346595764160156, "global_step": 154594, "epoch": 1277} {"train_loss": -38.975765228271484, "global_step": 154595, "epoch": 1277} {"train_loss": -38.5285758972168, "global_step": 154596, "epoch": 1277} {"train_loss": -38.814002990722656, "global_step": 154597, "epoch": 1277} {"train_loss": -40.575958251953125, "global_step": 154598, "epoch": 1277} {"train_loss": -40.22764205932617, "global_step": 154599, "epoch": 1277} {"train_loss": -39.857940673828125, "global_step": 154600, "epoch": 1277} {"train_loss": -40.20445251464844, "global_step": 154601, "epoch": 1277} {"train_loss": -41.684505462646484, "global_step": 154602, "epoch": 1277} {"train_loss": -40.29195022583008, "global_step": 154603, "epoch": 1277} {"train_loss": -40.46151351928711, "global_step": 154604, "epoch": 1277} {"train_loss": -40.47801971435547, "global_step": 154605, "epoch": 1277} {"train_loss": -40.84861373901367, "global_step": 154606, "epoch": 1277} {"train_loss": -40.74772262573242, "global_step": 154607, "epoch": 1277} {"train_loss": -40.70124435424805, "global_step": 154608, "epoch": 1277} {"train_loss": -41.55615234375, "global_step": 154609, "epoch": 1277} {"train_loss": -41.2691650390625, "global_step": 154610, "epoch": 1277} {"train_loss": -40.52126693725586, "global_step": 154611, "epoch": 1277} {"train_loss": -40.44609069824219, "global_step": 154612, "epoch": 1277} {"train_loss": -41.90412902832031, "global_step": 154613, "epoch": 1277} {"train_loss": -41.143367767333984, "global_step": 154614, "epoch": 1277} {"train_loss": -41.35318374633789, "global_step": 154615, "epoch": 1277} {"train_loss": -40.41365051269531, "global_step": 154616, "epoch": 1277} {"train_loss": -40.03343963623047, "global_step": 154617, "epoch": 1277} {"train_loss": -41.16635513305664, "global_step": 154618, "epoch": 1277} {"train_loss": -41.3832893371582, "global_step": 154619, "epoch": 1277} {"train_loss": -40.760162353515625, "global_step": 154620, "epoch": 1277} {"train_loss": -41.15808868408203, "global_step": 154621, "epoch": 1277} {"train_loss": -41.49169921875, "global_step": 154622, "epoch": 1277} {"train_loss": -41.046424865722656, "global_step": 154623, "epoch": 1277} {"train_loss": -41.226898193359375, "global_step": 154624, "epoch": 1277} {"train_loss": -40.19819259643555, "global_step": 154625, "epoch": 1277} {"train_loss": -41.52353286743164, "global_step": 154626, "epoch": 1277} {"train_loss": -41.319976806640625, "global_step": 154627, "epoch": 1277} {"train_loss": -40.63796615600586, "global_step": 154628, "epoch": 1277} {"train_loss": -40.97797393798828, "global_step": 154629, "epoch": 1277} {"train_loss": -41.124794006347656, "global_step": 154630, "epoch": 1277} {"train_loss": -40.89203643798828, "global_step": 154631, "epoch": 1277} {"train_loss": -41.16978073120117, "global_step": 154632, "epoch": 1277} {"train_loss": -40.74080276489258, "global_step": 154633, "epoch": 1277} {"train_loss": -39.78951644897461, "global_step": 154634, "epoch": 1277} {"train_loss": -41.52971649169922, "global_step": 154635, "epoch": 1277} {"train_loss": -40.931541442871094, "global_step": 154636, "epoch": 1277} {"train_loss": -40.13607829070288, "global_step": 154637, "epoch": 1277, "val_loss": 2743749.0} {"train_loss": -40.89921188354492, "global_step": 154638, "epoch": 1278} {"train_loss": -40.40092468261719, "global_step": 154639, "epoch": 1278} {"train_loss": -39.82917022705078, "global_step": 154640, "epoch": 1278} {"train_loss": -39.70271682739258, "global_step": 154641, "epoch": 1278} {"train_loss": -39.972808837890625, "global_step": 154642, "epoch": 1278} {"train_loss": -40.4669189453125, "global_step": 154643, "epoch": 1278} {"train_loss": -41.06819534301758, "global_step": 154644, "epoch": 1278} {"train_loss": -40.57344055175781, "global_step": 154645, "epoch": 1278} {"train_loss": -39.158329010009766, "global_step": 154646, "epoch": 1278} {"train_loss": -39.851478576660156, "global_step": 154647, "epoch": 1278} {"train_loss": -36.63178634643555, "global_step": 154648, "epoch": 1278} {"train_loss": -38.497562408447266, "global_step": 154649, "epoch": 1278} {"train_loss": -38.869197845458984, "global_step": 154650, "epoch": 1278} {"train_loss": -39.02832794189453, "global_step": 154651, "epoch": 1278} {"train_loss": -37.98436737060547, "global_step": 154652, "epoch": 1278} {"train_loss": -36.672096252441406, "global_step": 154653, "epoch": 1278} {"train_loss": -38.655303955078125, "global_step": 154654, "epoch": 1278} {"train_loss": -38.442047119140625, "global_step": 154655, "epoch": 1278} {"train_loss": -38.820884704589844, "global_step": 154656, "epoch": 1278} {"train_loss": -39.184383392333984, "global_step": 154657, "epoch": 1278} {"train_loss": -39.49514389038086, "global_step": 154658, "epoch": 1278} {"train_loss": -37.239986419677734, "global_step": 154659, "epoch": 1278} {"train_loss": -37.827999114990234, "global_step": 154660, "epoch": 1278} {"train_loss": -38.80939483642578, "global_step": 154661, "epoch": 1278} {"train_loss": -39.96019744873047, "global_step": 154662, "epoch": 1278} {"train_loss": -40.13458251953125, "global_step": 154663, "epoch": 1278} {"train_loss": -38.72101974487305, "global_step": 154664, "epoch": 1278} {"train_loss": -40.18741989135742, "global_step": 154665, "epoch": 1278} {"train_loss": -39.07094192504883, "global_step": 154666, "epoch": 1278} {"train_loss": -39.438411712646484, "global_step": 154667, "epoch": 1278} {"train_loss": -39.5299186706543, "global_step": 154668, "epoch": 1278} {"train_loss": -40.455841064453125, "global_step": 154669, "epoch": 1278} {"train_loss": -40.622093200683594, "global_step": 154670, "epoch": 1278} {"train_loss": -40.41524124145508, "global_step": 154671, "epoch": 1278} {"train_loss": -40.698028564453125, "global_step": 154672, "epoch": 1278} {"train_loss": -40.05149459838867, "global_step": 154673, "epoch": 1278} {"train_loss": -40.43219757080078, "global_step": 154674, "epoch": 1278} {"train_loss": -40.363399505615234, "global_step": 154675, "epoch": 1278} {"train_loss": -40.4163818359375, "global_step": 154676, "epoch": 1278} {"train_loss": -40.19552230834961, "global_step": 154677, "epoch": 1278} {"train_loss": -40.333953857421875, "global_step": 154678, "epoch": 1278} {"train_loss": -39.55949020385742, "global_step": 154679, "epoch": 1278} {"train_loss": -40.401878356933594, "global_step": 154680, "epoch": 1278} {"train_loss": -40.257720947265625, "global_step": 154681, "epoch": 1278} {"train_loss": -40.39736557006836, "global_step": 154682, "epoch": 1278} {"train_loss": -39.855224609375, "global_step": 154683, "epoch": 1278} {"train_loss": -40.77669906616211, "global_step": 154684, "epoch": 1278} {"train_loss": -38.94570541381836, "global_step": 154685, "epoch": 1278} {"train_loss": -41.23041534423828, "global_step": 154686, "epoch": 1278} {"train_loss": -40.668663024902344, "global_step": 154687, "epoch": 1278} {"train_loss": -40.53350067138672, "global_step": 154688, "epoch": 1278} {"train_loss": -39.91722869873047, "global_step": 154689, "epoch": 1278} {"train_loss": -41.14357376098633, "global_step": 154690, "epoch": 1278} {"train_loss": -39.25201416015625, "global_step": 154691, "epoch": 1278} {"train_loss": -39.681907653808594, "global_step": 154692, "epoch": 1278} {"train_loss": -41.18396759033203, "global_step": 154693, "epoch": 1278} {"train_loss": -40.686134338378906, "global_step": 154694, "epoch": 1278} {"train_loss": -39.74018478393555, "global_step": 154695, "epoch": 1278} {"train_loss": -39.8654670715332, "global_step": 154696, "epoch": 1278} {"train_loss": -40.87958908081055, "global_step": 154697, "epoch": 1278} {"train_loss": -39.84603500366211, "global_step": 154698, "epoch": 1278} {"train_loss": -40.967525482177734, "global_step": 154699, "epoch": 1278} {"train_loss": -40.601619720458984, "global_step": 154700, "epoch": 1278} {"train_loss": -40.1998176574707, "global_step": 154701, "epoch": 1278} {"train_loss": -40.33004379272461, "global_step": 154702, "epoch": 1278} {"train_loss": -40.88358688354492, "global_step": 154703, "epoch": 1278} {"train_loss": -40.6469612121582, "global_step": 154704, "epoch": 1278} {"train_loss": -40.25110626220703, "global_step": 154705, "epoch": 1278} {"train_loss": -40.927947998046875, "global_step": 154706, "epoch": 1278} {"train_loss": -41.154354095458984, "global_step": 154707, "epoch": 1278} {"train_loss": -41.22077941894531, "global_step": 154708, "epoch": 1278} {"train_loss": -40.84754180908203, "global_step": 154709, "epoch": 1278} {"train_loss": -40.6754264831543, "global_step": 154710, "epoch": 1278} {"train_loss": -41.58952331542969, "global_step": 154711, "epoch": 1278} {"train_loss": -40.94055938720703, "global_step": 154712, "epoch": 1278} {"train_loss": -41.1846809387207, "global_step": 154713, "epoch": 1278} {"train_loss": -41.53605270385742, "global_step": 154714, "epoch": 1278} {"train_loss": -41.034183502197266, "global_step": 154715, "epoch": 1278} {"train_loss": -40.35254669189453, "global_step": 154716, "epoch": 1278} {"train_loss": -40.82698059082031, "global_step": 154717, "epoch": 1278} {"train_loss": -41.40676498413086, "global_step": 154718, "epoch": 1278} {"train_loss": -41.04203414916992, "global_step": 154719, "epoch": 1278} {"train_loss": -41.60127258300781, "global_step": 154720, "epoch": 1278} {"train_loss": -41.07755661010742, "global_step": 154721, "epoch": 1278} {"train_loss": -41.0175666809082, "global_step": 154722, "epoch": 1278} {"train_loss": -41.29164123535156, "global_step": 154723, "epoch": 1278} {"train_loss": -39.95780563354492, "global_step": 154724, "epoch": 1278} {"train_loss": -41.09835433959961, "global_step": 154725, "epoch": 1278} {"train_loss": -40.3883056640625, "global_step": 154726, "epoch": 1278} {"train_loss": -40.712337493896484, "global_step": 154727, "epoch": 1278} {"train_loss": -39.573822021484375, "global_step": 154728, "epoch": 1278} {"train_loss": -41.07786178588867, "global_step": 154729, "epoch": 1278} {"train_loss": -40.523658752441406, "global_step": 154730, "epoch": 1278} {"train_loss": -40.2166633605957, "global_step": 154731, "epoch": 1278} {"train_loss": -40.87540817260742, "global_step": 154732, "epoch": 1278} {"train_loss": -40.09928512573242, "global_step": 154733, "epoch": 1278} {"train_loss": -39.76877975463867, "global_step": 154734, "epoch": 1278} {"train_loss": -40.36674880981445, "global_step": 154735, "epoch": 1278} {"train_loss": -39.708587646484375, "global_step": 154736, "epoch": 1278} {"train_loss": -40.9161262512207, "global_step": 154737, "epoch": 1278} {"train_loss": -41.282569885253906, "global_step": 154738, "epoch": 1278} {"train_loss": -40.35893630981445, "global_step": 154739, "epoch": 1278} {"train_loss": -41.2602653503418, "global_step": 154740, "epoch": 1278} {"train_loss": -40.633941650390625, "global_step": 154741, "epoch": 1278} {"train_loss": -40.853546142578125, "global_step": 154742, "epoch": 1278} {"train_loss": -40.637874603271484, "global_step": 154743, "epoch": 1278} {"train_loss": -40.68825149536133, "global_step": 154744, "epoch": 1278} {"train_loss": -40.65460205078125, "global_step": 154745, "epoch": 1278} {"train_loss": -41.24797821044922, "global_step": 154746, "epoch": 1278} {"train_loss": -41.30347442626953, "global_step": 154747, "epoch": 1278} {"train_loss": -41.0781364440918, "global_step": 154748, "epoch": 1278} {"train_loss": -40.28816604614258, "global_step": 154749, "epoch": 1278} {"train_loss": -41.391822814941406, "global_step": 154750, "epoch": 1278} {"train_loss": -40.295738220214844, "global_step": 154751, "epoch": 1278} {"train_loss": -39.35752487182617, "global_step": 154752, "epoch": 1278} {"train_loss": -40.360984802246094, "global_step": 154753, "epoch": 1278} {"train_loss": -40.68849563598633, "global_step": 154754, "epoch": 1278} {"train_loss": -40.96199417114258, "global_step": 154755, "epoch": 1278} {"train_loss": -40.872806549072266, "global_step": 154756, "epoch": 1278} {"train_loss": -40.684600830078125, "global_step": 154757, "epoch": 1278} {"train_loss": -40.23631702769887, "global_step": 154758, "epoch": 1278, "val_loss": 2655037.5} {"train_loss": -38.77223205566406, "global_step": 154759, "epoch": 1279} {"train_loss": -38.10126876831055, "global_step": 154760, "epoch": 1279} {"train_loss": -37.65131378173828, "global_step": 154761, "epoch": 1279} {"train_loss": -34.58478546142578, "global_step": 154762, "epoch": 1279} {"train_loss": -36.828922271728516, "global_step": 154763, "epoch": 1279} {"train_loss": -38.733131408691406, "global_step": 154764, "epoch": 1279} {"train_loss": -40.79010772705078, "global_step": 154765, "epoch": 1279} {"train_loss": -39.206756591796875, "global_step": 154766, "epoch": 1279} {"train_loss": -38.27519607543945, "global_step": 154767, "epoch": 1279} {"train_loss": -36.62022018432617, "global_step": 154768, "epoch": 1279} {"train_loss": -38.2357063293457, "global_step": 154769, "epoch": 1279} {"train_loss": -37.10641098022461, "global_step": 154770, "epoch": 1279} {"train_loss": -34.366920471191406, "global_step": 154771, "epoch": 1279} {"train_loss": -36.53845977783203, "global_step": 154772, "epoch": 1279} {"train_loss": -39.40546798706055, "global_step": 154773, "epoch": 1279} {"train_loss": -37.105865478515625, "global_step": 154774, "epoch": 1279} {"train_loss": -36.24821853637695, "global_step": 154775, "epoch": 1279} {"train_loss": -39.29111862182617, "global_step": 154776, "epoch": 1279} {"train_loss": -39.43253707885742, "global_step": 154777, "epoch": 1279} {"train_loss": -38.69643783569336, "global_step": 154778, "epoch": 1279} {"train_loss": -39.13865661621094, "global_step": 154779, "epoch": 1279} {"train_loss": -38.75304412841797, "global_step": 154780, "epoch": 1279} {"train_loss": -39.190425872802734, "global_step": 154781, "epoch": 1279} {"train_loss": -38.764556884765625, "global_step": 154782, "epoch": 1279} {"train_loss": -35.511390686035156, "global_step": 154783, "epoch": 1279} {"train_loss": -39.65535354614258, "global_step": 154784, "epoch": 1279} {"train_loss": -39.65053939819336, "global_step": 154785, "epoch": 1279} {"train_loss": -38.52641677856445, "global_step": 154786, "epoch": 1279} {"train_loss": -40.656700134277344, "global_step": 154787, "epoch": 1279} {"train_loss": -40.08832931518555, "global_step": 154788, "epoch": 1279} {"train_loss": -40.131446838378906, "global_step": 154789, "epoch": 1279} {"train_loss": -39.230289459228516, "global_step": 154790, "epoch": 1279} {"train_loss": -39.29567337036133, "global_step": 154791, "epoch": 1279} {"train_loss": -40.34208297729492, "global_step": 154792, "epoch": 1279} {"train_loss": -39.712799072265625, "global_step": 154793, "epoch": 1279} {"train_loss": -39.90969467163086, "global_step": 154794, "epoch": 1279} {"train_loss": -40.142208099365234, "global_step": 154795, "epoch": 1279} {"train_loss": -40.07711410522461, "global_step": 154796, "epoch": 1279} {"train_loss": -40.11375045776367, "global_step": 154797, "epoch": 1279} {"train_loss": -40.01811218261719, "global_step": 154798, "epoch": 1279} {"train_loss": -40.266170501708984, "global_step": 154799, "epoch": 1279} {"train_loss": -39.56343078613281, "global_step": 154800, "epoch": 1279} {"train_loss": -39.32719421386719, "global_step": 154801, "epoch": 1279} {"train_loss": -40.148250579833984, "global_step": 154802, "epoch": 1279} {"train_loss": -40.23052978515625, "global_step": 154803, "epoch": 1279} {"train_loss": -40.66544723510742, "global_step": 154804, "epoch": 1279} {"train_loss": -40.1445426940918, "global_step": 154805, "epoch": 1279} {"train_loss": -40.048519134521484, "global_step": 154806, "epoch": 1279} {"train_loss": -40.28851318359375, "global_step": 154807, "epoch": 1279} {"train_loss": -40.49591064453125, "global_step": 154808, "epoch": 1279} {"train_loss": -40.56760787963867, "global_step": 154809, "epoch": 1279} {"train_loss": -40.67287063598633, "global_step": 154810, "epoch": 1279} {"train_loss": -40.65541458129883, "global_step": 154811, "epoch": 1279} {"train_loss": -40.4517936706543, "global_step": 154812, "epoch": 1279} {"train_loss": -40.619476318359375, "global_step": 154813, "epoch": 1279} {"train_loss": -40.45668029785156, "global_step": 154814, "epoch": 1279} {"train_loss": -40.21281814575195, "global_step": 154815, "epoch": 1279} {"train_loss": -41.538063049316406, "global_step": 154816, "epoch": 1279} {"train_loss": -40.476478576660156, "global_step": 154817, "epoch": 1279} {"train_loss": -41.002506256103516, "global_step": 154818, "epoch": 1279} {"train_loss": -40.48847579956055, "global_step": 154819, "epoch": 1279} {"train_loss": -40.761253356933594, "global_step": 154820, "epoch": 1279} {"train_loss": -40.86406707763672, "global_step": 154821, "epoch": 1279} {"train_loss": -41.64431381225586, "global_step": 154822, "epoch": 1279} {"train_loss": -40.62274169921875, "global_step": 154823, "epoch": 1279} {"train_loss": -40.81142044067383, "global_step": 154824, "epoch": 1279} {"train_loss": -40.49528884887695, "global_step": 154825, "epoch": 1279} {"train_loss": -41.041080474853516, "global_step": 154826, "epoch": 1279} {"train_loss": -41.16316604614258, "global_step": 154827, "epoch": 1279} {"train_loss": -40.99863815307617, "global_step": 154828, "epoch": 1279} {"train_loss": -41.09022903442383, "global_step": 154829, "epoch": 1279} {"train_loss": -40.64847946166992, "global_step": 154830, "epoch": 1279} {"train_loss": -41.46967697143555, "global_step": 154831, "epoch": 1279} {"train_loss": -41.00273513793945, "global_step": 154832, "epoch": 1279} {"train_loss": -40.92902755737305, "global_step": 154833, "epoch": 1279} {"train_loss": -41.01618194580078, "global_step": 154834, "epoch": 1279} {"train_loss": -40.592201232910156, "global_step": 154835, "epoch": 1279} {"train_loss": -40.64262390136719, "global_step": 154836, "epoch": 1279} {"train_loss": -39.78206253051758, "global_step": 154837, "epoch": 1279} {"train_loss": -39.952754974365234, "global_step": 154838, "epoch": 1279} {"train_loss": -38.593990325927734, "global_step": 154839, "epoch": 1279} {"train_loss": -40.64971923828125, "global_step": 154840, "epoch": 1279} {"train_loss": -40.270118713378906, "global_step": 154841, "epoch": 1279} {"train_loss": -38.2501335144043, "global_step": 154842, "epoch": 1279} {"train_loss": -38.913299560546875, "global_step": 154843, "epoch": 1279} {"train_loss": -40.641387939453125, "global_step": 154844, "epoch": 1279} {"train_loss": -39.677978515625, "global_step": 154845, "epoch": 1279} {"train_loss": -39.35111618041992, "global_step": 154846, "epoch": 1279} {"train_loss": -40.263465881347656, "global_step": 154847, "epoch": 1279} {"train_loss": -39.37014389038086, "global_step": 154848, "epoch": 1279} {"train_loss": -39.87062454223633, "global_step": 154849, "epoch": 1279} {"train_loss": -41.04618453979492, "global_step": 154850, "epoch": 1279} {"train_loss": -38.16807556152344, "global_step": 154851, "epoch": 1279} {"train_loss": -40.09564208984375, "global_step": 154852, "epoch": 1279} {"train_loss": -39.984649658203125, "global_step": 154853, "epoch": 1279} {"train_loss": -41.027095794677734, "global_step": 154854, "epoch": 1279} {"train_loss": -39.55869674682617, "global_step": 154855, "epoch": 1279} {"train_loss": -40.111751556396484, "global_step": 154856, "epoch": 1279} {"train_loss": -40.30741500854492, "global_step": 154857, "epoch": 1279} {"train_loss": -39.55104446411133, "global_step": 154858, "epoch": 1279} {"train_loss": -40.439605712890625, "global_step": 154859, "epoch": 1279} {"train_loss": -40.03572463989258, "global_step": 154860, "epoch": 1279} {"train_loss": -37.89081954956055, "global_step": 154861, "epoch": 1279} {"train_loss": -40.580501556396484, "global_step": 154862, "epoch": 1279} {"train_loss": -39.368743896484375, "global_step": 154863, "epoch": 1279} {"train_loss": -39.33485794067383, "global_step": 154864, "epoch": 1279} {"train_loss": -40.42226791381836, "global_step": 154865, "epoch": 1279} {"train_loss": -38.60871124267578, "global_step": 154866, "epoch": 1279} {"train_loss": -39.193050384521484, "global_step": 154867, "epoch": 1279} {"train_loss": -39.18617248535156, "global_step": 154868, "epoch": 1279} {"train_loss": -39.51780319213867, "global_step": 154869, "epoch": 1279} {"train_loss": -40.39164733886719, "global_step": 154870, "epoch": 1279} {"train_loss": -40.111385345458984, "global_step": 154871, "epoch": 1279} {"train_loss": -39.38222885131836, "global_step": 154872, "epoch": 1279} {"train_loss": -40.193965911865234, "global_step": 154873, "epoch": 1279} {"train_loss": -40.22819137573242, "global_step": 154874, "epoch": 1279} {"train_loss": -40.160926818847656, "global_step": 154875, "epoch": 1279} {"train_loss": -39.9709587097168, "global_step": 154876, "epoch": 1279} {"train_loss": -40.36025619506836, "global_step": 154877, "epoch": 1279} {"train_loss": -40.150386810302734, "global_step": 154878, "epoch": 1279} {"train_loss": -39.6653920953924, "global_step": 154879, "epoch": 1279, "val_loss": 2789867.0} {"train_loss": -40.248775482177734, "global_step": 154880, "epoch": 1280} {"train_loss": -39.29670333862305, "global_step": 154881, "epoch": 1280} {"train_loss": -38.91400909423828, "global_step": 154882, "epoch": 1280} {"train_loss": -39.7354850769043, "global_step": 154883, "epoch": 1280} {"train_loss": -40.02336502075195, "global_step": 154884, "epoch": 1280} {"train_loss": -38.853187561035156, "global_step": 154885, "epoch": 1280} {"train_loss": -31.407245635986328, "global_step": 154886, "epoch": 1280} {"train_loss": -39.92904281616211, "global_step": 154887, "epoch": 1280} {"train_loss": -39.31077194213867, "global_step": 154888, "epoch": 1280} {"train_loss": -38.81063461303711, "global_step": 154889, "epoch": 1280} {"train_loss": -35.98570251464844, "global_step": 154890, "epoch": 1280} {"train_loss": -30.04115867614746, "global_step": 154891, "epoch": 1280} {"train_loss": -38.12636947631836, "global_step": 154892, "epoch": 1280} {"train_loss": -37.50368118286133, "global_step": 154893, "epoch": 1280} {"train_loss": -29.624059677124023, "global_step": 154894, "epoch": 1280} {"train_loss": -35.95354080200195, "global_step": 154895, "epoch": 1280} {"train_loss": -34.27937698364258, "global_step": 154896, "epoch": 1280} {"train_loss": -33.48812484741211, "global_step": 154897, "epoch": 1280} {"train_loss": -35.83146286010742, "global_step": 154898, "epoch": 1280} {"train_loss": -35.360809326171875, "global_step": 154899, "epoch": 1280} {"train_loss": -26.749948501586914, "global_step": 154900, "epoch": 1280} {"train_loss": -35.044857025146484, "global_step": 154901, "epoch": 1280} {"train_loss": -34.67518615722656, "global_step": 154902, "epoch": 1280} {"train_loss": -30.476720809936523, "global_step": 154903, "epoch": 1280} {"train_loss": -25.428869247436523, "global_step": 154904, "epoch": 1280} {"train_loss": -35.207611083984375, "global_step": 154905, "epoch": 1280} {"train_loss": -33.819820404052734, "global_step": 154906, "epoch": 1280} {"train_loss": -32.909706115722656, "global_step": 154907, "epoch": 1280} {"train_loss": -32.51563262939453, "global_step": 154908, "epoch": 1280} {"train_loss": -34.12040328979492, "global_step": 154909, "epoch": 1280} {"train_loss": -31.40132713317871, "global_step": 154910, "epoch": 1280} {"train_loss": -34.82916259765625, "global_step": 154911, "epoch": 1280} {"train_loss": -30.680002212524414, "global_step": 154912, "epoch": 1280} {"train_loss": -35.01973342895508, "global_step": 154913, "epoch": 1280} {"train_loss": -34.01112365722656, "global_step": 154914, "epoch": 1280} {"train_loss": -35.22466278076172, "global_step": 154915, "epoch": 1280} {"train_loss": -35.06104278564453, "global_step": 154916, "epoch": 1280} {"train_loss": -35.64211654663086, "global_step": 154917, "epoch": 1280} {"train_loss": -34.85825729370117, "global_step": 154918, "epoch": 1280} {"train_loss": -36.78158187866211, "global_step": 154919, "epoch": 1280} {"train_loss": -36.05343246459961, "global_step": 154920, "epoch": 1280} {"train_loss": -36.47512435913086, "global_step": 154921, "epoch": 1280} {"train_loss": -36.49787139892578, "global_step": 154922, "epoch": 1280} {"train_loss": -36.9080924987793, "global_step": 154923, "epoch": 1280} {"train_loss": -36.98203659057617, "global_step": 154924, "epoch": 1280} {"train_loss": -37.219032287597656, "global_step": 154925, "epoch": 1280} {"train_loss": -37.098018646240234, "global_step": 154926, "epoch": 1280} {"train_loss": -37.48353958129883, "global_step": 154927, "epoch": 1280} {"train_loss": -37.334293365478516, "global_step": 154928, "epoch": 1280} {"train_loss": -37.83875274658203, "global_step": 154929, "epoch": 1280} {"train_loss": -38.1236686706543, "global_step": 154930, "epoch": 1280} {"train_loss": -37.35113525390625, "global_step": 154931, "epoch": 1280} {"train_loss": -37.979061126708984, "global_step": 154932, "epoch": 1280} {"train_loss": -37.117923736572266, "global_step": 154933, "epoch": 1280} {"train_loss": -37.53408432006836, "global_step": 154934, "epoch": 1280} {"train_loss": -37.29677200317383, "global_step": 154935, "epoch": 1280} {"train_loss": -38.10247039794922, "global_step": 154936, "epoch": 1280} {"train_loss": -38.10628128051758, "global_step": 154937, "epoch": 1280} {"train_loss": -37.76607894897461, "global_step": 154938, "epoch": 1280} {"train_loss": -38.69193649291992, "global_step": 154939, "epoch": 1280} {"train_loss": -38.515010833740234, "global_step": 154940, "epoch": 1280} {"train_loss": -38.52439498901367, "global_step": 154941, "epoch": 1280} {"train_loss": -38.002464294433594, "global_step": 154942, "epoch": 1280} {"train_loss": -38.470306396484375, "global_step": 154943, "epoch": 1280} {"train_loss": -37.97282791137695, "global_step": 154944, "epoch": 1280} {"train_loss": -38.59778594970703, "global_step": 154945, "epoch": 1280} {"train_loss": -38.425167083740234, "global_step": 154946, "epoch": 1280} {"train_loss": -38.4616813659668, "global_step": 154947, "epoch": 1280} {"train_loss": -38.60234451293945, "global_step": 154948, "epoch": 1280} {"train_loss": -38.47757339477539, "global_step": 154949, "epoch": 1280} {"train_loss": -38.226646423339844, "global_step": 154950, "epoch": 1280} {"train_loss": -38.40460205078125, "global_step": 154951, "epoch": 1280} {"train_loss": -39.29275131225586, "global_step": 154952, "epoch": 1280} {"train_loss": -39.2090950012207, "global_step": 154953, "epoch": 1280} {"train_loss": -39.364410400390625, "global_step": 154954, "epoch": 1280} {"train_loss": -38.79111099243164, "global_step": 154955, "epoch": 1280} {"train_loss": -38.61964797973633, "global_step": 154956, "epoch": 1280} {"train_loss": -39.17739486694336, "global_step": 154957, "epoch": 1280} {"train_loss": -39.273963928222656, "global_step": 154958, "epoch": 1280} {"train_loss": -39.18849563598633, "global_step": 154959, "epoch": 1280} {"train_loss": -39.41004180908203, "global_step": 154960, "epoch": 1280} {"train_loss": -38.91212463378906, "global_step": 154961, "epoch": 1280} {"train_loss": -39.133419036865234, "global_step": 154962, "epoch": 1280} {"train_loss": -39.63373565673828, "global_step": 154963, "epoch": 1280} {"train_loss": -39.57912063598633, "global_step": 154964, "epoch": 1280} {"train_loss": -38.908782958984375, "global_step": 154965, "epoch": 1280} {"train_loss": -39.62399673461914, "global_step": 154966, "epoch": 1280} {"train_loss": -39.72526931762695, "global_step": 154967, "epoch": 1280} {"train_loss": -39.63557052612305, "global_step": 154968, "epoch": 1280} {"train_loss": -39.533687591552734, "global_step": 154969, "epoch": 1280} {"train_loss": -39.49332809448242, "global_step": 154970, "epoch": 1280} {"train_loss": -40.26709747314453, "global_step": 154971, "epoch": 1280} {"train_loss": -39.8211784362793, "global_step": 154972, "epoch": 1280} {"train_loss": -39.98786163330078, "global_step": 154973, "epoch": 1280} {"train_loss": -39.891990661621094, "global_step": 154974, "epoch": 1280} {"train_loss": -39.85982131958008, "global_step": 154975, "epoch": 1280} {"train_loss": -40.10139846801758, "global_step": 154976, "epoch": 1280} {"train_loss": -40.20885467529297, "global_step": 154977, "epoch": 1280} {"train_loss": -39.844818115234375, "global_step": 154978, "epoch": 1280} {"train_loss": -40.27054214477539, "global_step": 154979, "epoch": 1280} {"train_loss": -39.78023910522461, "global_step": 154980, "epoch": 1280} {"train_loss": -40.35380172729492, "global_step": 154981, "epoch": 1280} {"train_loss": -40.56241989135742, "global_step": 154982, "epoch": 1280} {"train_loss": -40.460609436035156, "global_step": 154983, "epoch": 1280} {"train_loss": -39.92657470703125, "global_step": 154984, "epoch": 1280} {"train_loss": -40.15146255493164, "global_step": 154985, "epoch": 1280} {"train_loss": -40.26309585571289, "global_step": 154986, "epoch": 1280} {"train_loss": -39.757625579833984, "global_step": 154987, "epoch": 1280} {"train_loss": -40.38851547241211, "global_step": 154988, "epoch": 1280} {"train_loss": -40.4404411315918, "global_step": 154989, "epoch": 1280} {"train_loss": -39.62971878051758, "global_step": 154990, "epoch": 1280} {"train_loss": -40.426856994628906, "global_step": 154991, "epoch": 1280} {"train_loss": -40.8464469909668, "global_step": 154992, "epoch": 1280} {"train_loss": -40.88804626464844, "global_step": 154993, "epoch": 1280} {"train_loss": -40.26372146606445, "global_step": 154994, "epoch": 1280} {"train_loss": -40.691650390625, "global_step": 154995, "epoch": 1280} {"train_loss": -40.333892822265625, "global_step": 154996, "epoch": 1280} {"train_loss": -40.48861312866211, "global_step": 154997, "epoch": 1280} {"train_loss": -40.38349151611328, "global_step": 154998, "epoch": 1280} {"train_loss": -40.41992950439453, "global_step": 154999, "epoch": 1280} {"train_loss": -37.67754513764184, "global_step": 155000, "epoch": 1280, "val_loss": 2642620.25} {"train_loss": -40.9342041015625, "global_step": 155001, "epoch": 1281} {"train_loss": -40.98981857299805, "global_step": 155002, "epoch": 1281} {"train_loss": -40.57124710083008, "global_step": 155003, "epoch": 1281} {"train_loss": -40.928558349609375, "global_step": 155004, "epoch": 1281} {"train_loss": -39.84930419921875, "global_step": 155005, "epoch": 1281} {"train_loss": -41.31854248046875, "global_step": 155006, "epoch": 1281} {"train_loss": -40.94138717651367, "global_step": 155007, "epoch": 1281} {"train_loss": -40.94533157348633, "global_step": 155008, "epoch": 1281} {"train_loss": -40.250118255615234, "global_step": 155009, "epoch": 1281} {"train_loss": -40.75161361694336, "global_step": 155010, "epoch": 1281} {"train_loss": -40.388763427734375, "global_step": 155011, "epoch": 1281} {"train_loss": -40.57008743286133, "global_step": 155012, "epoch": 1281} {"train_loss": -40.19097900390625, "global_step": 155013, "epoch": 1281} {"train_loss": -37.800689697265625, "global_step": 155014, "epoch": 1281} {"train_loss": -31.28101921081543, "global_step": 155015, "epoch": 1281} {"train_loss": -23.12312126159668, "global_step": 155016, "epoch": 1281} {"train_loss": -17.983646392822266, "global_step": 155017, "epoch": 1281} {"train_loss": -25.544952392578125, "global_step": 155018, "epoch": 1281} {"train_loss": -37.33306884765625, "global_step": 155019, "epoch": 1281} {"train_loss": -36.82340621948242, "global_step": 155020, "epoch": 1281} {"train_loss": -34.91985321044922, "global_step": 155021, "epoch": 1281} {"train_loss": -38.75210952758789, "global_step": 155022, "epoch": 1281} {"train_loss": -34.69031524658203, "global_step": 155023, "epoch": 1281} {"train_loss": -36.906124114990234, "global_step": 155024, "epoch": 1281} {"train_loss": -36.795833587646484, "global_step": 155025, "epoch": 1281} {"train_loss": -36.5897331237793, "global_step": 155026, "epoch": 1281} {"train_loss": -38.91714096069336, "global_step": 155027, "epoch": 1281} {"train_loss": -35.37180709838867, "global_step": 155028, "epoch": 1281} {"train_loss": -36.73415756225586, "global_step": 155029, "epoch": 1281} {"train_loss": -39.48480987548828, "global_step": 155030, "epoch": 1281} {"train_loss": -36.47878646850586, "global_step": 155031, "epoch": 1281} {"train_loss": -39.453819274902344, "global_step": 155032, "epoch": 1281} {"train_loss": -37.17092514038086, "global_step": 155033, "epoch": 1281} {"train_loss": -38.845149993896484, "global_step": 155034, "epoch": 1281} {"train_loss": -38.6684684753418, "global_step": 155035, "epoch": 1281} {"train_loss": -38.40034866333008, "global_step": 155036, "epoch": 1281} {"train_loss": -39.461143493652344, "global_step": 155037, "epoch": 1281} {"train_loss": -38.85380935668945, "global_step": 155038, "epoch": 1281} {"train_loss": -39.15010452270508, "global_step": 155039, "epoch": 1281} {"train_loss": -39.25742721557617, "global_step": 155040, "epoch": 1281} {"train_loss": -38.63704299926758, "global_step": 155041, "epoch": 1281} {"train_loss": -39.33503341674805, "global_step": 155042, "epoch": 1281} {"train_loss": -39.346439361572266, "global_step": 155043, "epoch": 1281} {"train_loss": -39.260833740234375, "global_step": 155044, "epoch": 1281} {"train_loss": -39.9068603515625, "global_step": 155045, "epoch": 1281} {"train_loss": -39.59111022949219, "global_step": 155046, "epoch": 1281} {"train_loss": -39.48993682861328, "global_step": 155047, "epoch": 1281} {"train_loss": -39.922080993652344, "global_step": 155048, "epoch": 1281} {"train_loss": -39.897125244140625, "global_step": 155049, "epoch": 1281} {"train_loss": -39.62162399291992, "global_step": 155050, "epoch": 1281} {"train_loss": -40.02763748168945, "global_step": 155051, "epoch": 1281} {"train_loss": -39.71263122558594, "global_step": 155052, "epoch": 1281} {"train_loss": -39.74540710449219, "global_step": 155053, "epoch": 1281} {"train_loss": -39.72216796875, "global_step": 155054, "epoch": 1281} {"train_loss": -40.46692657470703, "global_step": 155055, "epoch": 1281} {"train_loss": -40.01081085205078, "global_step": 155056, "epoch": 1281} {"train_loss": -40.46042251586914, "global_step": 155057, "epoch": 1281} {"train_loss": -39.45341110229492, "global_step": 155058, "epoch": 1281} {"train_loss": -39.89702224731445, "global_step": 155059, "epoch": 1281} {"train_loss": -40.08205795288086, "global_step": 155060, "epoch": 1281} {"train_loss": -40.30815505981445, "global_step": 155061, "epoch": 1281} {"train_loss": -40.24467849731445, "global_step": 155062, "epoch": 1281} {"train_loss": -40.860450744628906, "global_step": 155063, "epoch": 1281} {"train_loss": -40.0455436706543, "global_step": 155064, "epoch": 1281} {"train_loss": -40.21048355102539, "global_step": 155065, "epoch": 1281} {"train_loss": -40.21330642700195, "global_step": 155066, "epoch": 1281} {"train_loss": -40.663814544677734, "global_step": 155067, "epoch": 1281} {"train_loss": -40.19759750366211, "global_step": 155068, "epoch": 1281} {"train_loss": -40.44939041137695, "global_step": 155069, "epoch": 1281} {"train_loss": -39.82202911376953, "global_step": 155070, "epoch": 1281} {"train_loss": -40.68015670776367, "global_step": 155071, "epoch": 1281} {"train_loss": -40.89487838745117, "global_step": 155072, "epoch": 1281} {"train_loss": -40.28733444213867, "global_step": 155073, "epoch": 1281} {"train_loss": -40.60085678100586, "global_step": 155074, "epoch": 1281} {"train_loss": -40.67633819580078, "global_step": 155075, "epoch": 1281} {"train_loss": -40.89566421508789, "global_step": 155076, "epoch": 1281} {"train_loss": -40.46037292480469, "global_step": 155077, "epoch": 1281} {"train_loss": -40.81793212890625, "global_step": 155078, "epoch": 1281} {"train_loss": -40.79049301147461, "global_step": 155079, "epoch": 1281} {"train_loss": -40.577880859375, "global_step": 155080, "epoch": 1281} {"train_loss": -40.949031829833984, "global_step": 155081, "epoch": 1281} {"train_loss": -40.66982650756836, "global_step": 155082, "epoch": 1281} {"train_loss": -38.52737045288086, "global_step": 155083, "epoch": 1281} {"train_loss": -40.75689697265625, "global_step": 155084, "epoch": 1281} {"train_loss": -40.872901916503906, "global_step": 155085, "epoch": 1281} {"train_loss": -41.22504806518555, "global_step": 155086, "epoch": 1281} {"train_loss": -40.805049896240234, "global_step": 155087, "epoch": 1281} {"train_loss": -40.77476119995117, "global_step": 155088, "epoch": 1281} {"train_loss": -41.16543960571289, "global_step": 155089, "epoch": 1281} {"train_loss": -41.00492477416992, "global_step": 155090, "epoch": 1281} {"train_loss": -41.32821273803711, "global_step": 155091, "epoch": 1281} {"train_loss": -41.319580078125, "global_step": 155092, "epoch": 1281} {"train_loss": -41.262142181396484, "global_step": 155093, "epoch": 1281} {"train_loss": -41.59619903564453, "global_step": 155094, "epoch": 1281} {"train_loss": -40.9731559753418, "global_step": 155095, "epoch": 1281} {"train_loss": -41.321510314941406, "global_step": 155096, "epoch": 1281} {"train_loss": -41.60125732421875, "global_step": 155097, "epoch": 1281} {"train_loss": -40.587135314941406, "global_step": 155098, "epoch": 1281} {"train_loss": -41.19853973388672, "global_step": 155099, "epoch": 1281} {"train_loss": -41.2581901550293, "global_step": 155100, "epoch": 1281} {"train_loss": -40.243221282958984, "global_step": 155101, "epoch": 1281} {"train_loss": -41.038917541503906, "global_step": 155102, "epoch": 1281} {"train_loss": -41.12550735473633, "global_step": 155103, "epoch": 1281} {"train_loss": -40.643043518066406, "global_step": 155104, "epoch": 1281} {"train_loss": -40.44221115112305, "global_step": 155105, "epoch": 1281} {"train_loss": -40.17904281616211, "global_step": 155106, "epoch": 1281} {"train_loss": -40.81159210205078, "global_step": 155107, "epoch": 1281} {"train_loss": -41.045589447021484, "global_step": 155108, "epoch": 1281} {"train_loss": -41.7293586730957, "global_step": 155109, "epoch": 1281} {"train_loss": -39.5426025390625, "global_step": 155110, "epoch": 1281} {"train_loss": -36.804622650146484, "global_step": 155111, "epoch": 1281} {"train_loss": -39.64938735961914, "global_step": 155112, "epoch": 1281} {"train_loss": -41.407379150390625, "global_step": 155113, "epoch": 1281} {"train_loss": -40.04060745239258, "global_step": 155114, "epoch": 1281} {"train_loss": -39.41278839111328, "global_step": 155115, "epoch": 1281} {"train_loss": -39.95083236694336, "global_step": 155116, "epoch": 1281} {"train_loss": -39.47509765625, "global_step": 155117, "epoch": 1281} {"train_loss": -39.8062858581543, "global_step": 155118, "epoch": 1281} {"train_loss": -40.776065826416016, "global_step": 155119, "epoch": 1281} {"train_loss": -40.8885383605957, "global_step": 155120, "epoch": 1281} {"train_loss": -39.35332583592943, "global_step": 155121, "epoch": 1281, "val_loss": 2634972.75} {"train_loss": -39.26925277709961, "global_step": 155122, "epoch": 1282} {"train_loss": -38.551979064941406, "global_step": 155123, "epoch": 1282} {"train_loss": -38.671932220458984, "global_step": 155124, "epoch": 1282} {"train_loss": -39.70539474487305, "global_step": 155125, "epoch": 1282} {"train_loss": -37.786598205566406, "global_step": 155126, "epoch": 1282} {"train_loss": -39.665340423583984, "global_step": 155127, "epoch": 1282} {"train_loss": -40.136444091796875, "global_step": 155128, "epoch": 1282} {"train_loss": -39.065738677978516, "global_step": 155129, "epoch": 1282} {"train_loss": -39.433349609375, "global_step": 155130, "epoch": 1282} {"train_loss": -39.3972282409668, "global_step": 155131, "epoch": 1282} {"train_loss": -39.21701431274414, "global_step": 155132, "epoch": 1282} {"train_loss": -39.99114990234375, "global_step": 155133, "epoch": 1282} {"train_loss": -37.946319580078125, "global_step": 155134, "epoch": 1282} {"train_loss": -38.238197326660156, "global_step": 155135, "epoch": 1282} {"train_loss": -40.9830436706543, "global_step": 155136, "epoch": 1282} {"train_loss": -39.153926849365234, "global_step": 155137, "epoch": 1282} {"train_loss": -39.29336166381836, "global_step": 155138, "epoch": 1282} {"train_loss": -40.426204681396484, "global_step": 155139, "epoch": 1282} {"train_loss": -40.19663619995117, "global_step": 155140, "epoch": 1282} {"train_loss": -40.29008865356445, "global_step": 155141, "epoch": 1282} {"train_loss": -40.22343826293945, "global_step": 155142, "epoch": 1282} {"train_loss": -40.28281784057617, "global_step": 155143, "epoch": 1282} {"train_loss": -39.5019645690918, "global_step": 155144, "epoch": 1282} {"train_loss": -39.810699462890625, "global_step": 155145, "epoch": 1282} {"train_loss": -40.69810104370117, "global_step": 155146, "epoch": 1282} {"train_loss": -38.9900016784668, "global_step": 155147, "epoch": 1282} {"train_loss": -40.180908203125, "global_step": 155148, "epoch": 1282} {"train_loss": -39.761016845703125, "global_step": 155149, "epoch": 1282} {"train_loss": -40.18697738647461, "global_step": 155150, "epoch": 1282} {"train_loss": -40.040374755859375, "global_step": 155151, "epoch": 1282} {"train_loss": -35.662452697753906, "global_step": 155152, "epoch": 1282} {"train_loss": -39.37858200073242, "global_step": 155153, "epoch": 1282} {"train_loss": -40.484222412109375, "global_step": 155154, "epoch": 1282} {"train_loss": -40.337589263916016, "global_step": 155155, "epoch": 1282} {"train_loss": -40.86681365966797, "global_step": 155156, "epoch": 1282} {"train_loss": -39.15243148803711, "global_step": 155157, "epoch": 1282} {"train_loss": -39.08694076538086, "global_step": 155158, "epoch": 1282} {"train_loss": -40.35422897338867, "global_step": 155159, "epoch": 1282} {"train_loss": -40.00770950317383, "global_step": 155160, "epoch": 1282} {"train_loss": -39.67218780517578, "global_step": 155161, "epoch": 1282} {"train_loss": -40.16965866088867, "global_step": 155162, "epoch": 1282} {"train_loss": -39.747413635253906, "global_step": 155163, "epoch": 1282} {"train_loss": -40.734310150146484, "global_step": 155164, "epoch": 1282} {"train_loss": -40.50056076049805, "global_step": 155165, "epoch": 1282} {"train_loss": -40.06828308105469, "global_step": 155166, "epoch": 1282} {"train_loss": -40.7526969909668, "global_step": 155167, "epoch": 1282} {"train_loss": -39.651123046875, "global_step": 155168, "epoch": 1282} {"train_loss": -40.23407745361328, "global_step": 155169, "epoch": 1282} {"train_loss": -40.42182159423828, "global_step": 155170, "epoch": 1282} {"train_loss": -40.981319427490234, "global_step": 155171, "epoch": 1282} {"train_loss": -36.79014587402344, "global_step": 155172, "epoch": 1282} {"train_loss": -41.078243255615234, "global_step": 155173, "epoch": 1282} {"train_loss": -40.75497817993164, "global_step": 155174, "epoch": 1282} {"train_loss": -40.70998001098633, "global_step": 155175, "epoch": 1282} {"train_loss": -40.967647552490234, "global_step": 155176, "epoch": 1282} {"train_loss": -40.641029357910156, "global_step": 155177, "epoch": 1282} {"train_loss": -40.72963333129883, "global_step": 155178, "epoch": 1282} {"train_loss": -40.66950988769531, "global_step": 155179, "epoch": 1282} {"train_loss": -40.75074005126953, "global_step": 155180, "epoch": 1282} {"train_loss": -37.627071380615234, "global_step": 155181, "epoch": 1282} {"train_loss": -40.395118713378906, "global_step": 155182, "epoch": 1282} {"train_loss": -40.76350021362305, "global_step": 155183, "epoch": 1282} {"train_loss": -40.888710021972656, "global_step": 155184, "epoch": 1282} {"train_loss": -40.673702239990234, "global_step": 155185, "epoch": 1282} {"train_loss": -40.75002670288086, "global_step": 155186, "epoch": 1282} {"train_loss": -40.82750701904297, "global_step": 155187, "epoch": 1282} {"train_loss": -41.179931640625, "global_step": 155188, "epoch": 1282} {"train_loss": -40.56339645385742, "global_step": 155189, "epoch": 1282} {"train_loss": -40.065521240234375, "global_step": 155190, "epoch": 1282} {"train_loss": -41.184234619140625, "global_step": 155191, "epoch": 1282} {"train_loss": -40.63306427001953, "global_step": 155192, "epoch": 1282} {"train_loss": -40.761226654052734, "global_step": 155193, "epoch": 1282} {"train_loss": -40.48698043823242, "global_step": 155194, "epoch": 1282} {"train_loss": -41.079654693603516, "global_step": 155195, "epoch": 1282} {"train_loss": -40.52260208129883, "global_step": 155196, "epoch": 1282} {"train_loss": -40.41653060913086, "global_step": 155197, "epoch": 1282} {"train_loss": -39.48032760620117, "global_step": 155198, "epoch": 1282} {"train_loss": -39.70380783081055, "global_step": 155199, "epoch": 1282} {"train_loss": -39.07155227661133, "global_step": 155200, "epoch": 1282} {"train_loss": -38.35744857788086, "global_step": 155201, "epoch": 1282} {"train_loss": -37.589534759521484, "global_step": 155202, "epoch": 1282} {"train_loss": -40.34100341796875, "global_step": 155203, "epoch": 1282} {"train_loss": -40.39215087890625, "global_step": 155204, "epoch": 1282} {"train_loss": -39.22243118286133, "global_step": 155205, "epoch": 1282} {"train_loss": -38.26398849487305, "global_step": 155206, "epoch": 1282} {"train_loss": -35.6030387878418, "global_step": 155207, "epoch": 1282} {"train_loss": -35.925559997558594, "global_step": 155208, "epoch": 1282} {"train_loss": -35.67006301879883, "global_step": 155209, "epoch": 1282} {"train_loss": -38.91480255126953, "global_step": 155210, "epoch": 1282} {"train_loss": -39.24451446533203, "global_step": 155211, "epoch": 1282} {"train_loss": -39.59370422363281, "global_step": 155212, "epoch": 1282} {"train_loss": -38.54791259765625, "global_step": 155213, "epoch": 1282} {"train_loss": -39.20568084716797, "global_step": 155214, "epoch": 1282} {"train_loss": -40.2968864440918, "global_step": 155215, "epoch": 1282} {"train_loss": -37.424285888671875, "global_step": 155216, "epoch": 1282} {"train_loss": -39.72843933105469, "global_step": 155217, "epoch": 1282} {"train_loss": -37.929725646972656, "global_step": 155218, "epoch": 1282} {"train_loss": -38.04586410522461, "global_step": 155219, "epoch": 1282} {"train_loss": -40.14524459838867, "global_step": 155220, "epoch": 1282} {"train_loss": -37.84278869628906, "global_step": 155221, "epoch": 1282} {"train_loss": -40.68339157104492, "global_step": 155222, "epoch": 1282} {"train_loss": -37.68798828125, "global_step": 155223, "epoch": 1282} {"train_loss": -39.389984130859375, "global_step": 155224, "epoch": 1282} {"train_loss": -40.220890045166016, "global_step": 155225, "epoch": 1282} {"train_loss": -39.41456985473633, "global_step": 155226, "epoch": 1282} {"train_loss": -40.04219436645508, "global_step": 155227, "epoch": 1282} {"train_loss": -39.4285888671875, "global_step": 155228, "epoch": 1282} {"train_loss": -39.62819290161133, "global_step": 155229, "epoch": 1282} {"train_loss": -38.83796310424805, "global_step": 155230, "epoch": 1282} {"train_loss": -39.06241989135742, "global_step": 155231, "epoch": 1282} {"train_loss": -39.91889572143555, "global_step": 155232, "epoch": 1282} {"train_loss": -40.66281509399414, "global_step": 155233, "epoch": 1282} {"train_loss": -39.86184310913086, "global_step": 155234, "epoch": 1282} {"train_loss": -40.96875, "global_step": 155235, "epoch": 1282} {"train_loss": -40.1241569519043, "global_step": 155236, "epoch": 1282} {"train_loss": -40.672420501708984, "global_step": 155237, "epoch": 1282} {"train_loss": -40.36412048339844, "global_step": 155238, "epoch": 1282} {"train_loss": -40.251888275146484, "global_step": 155239, "epoch": 1282} {"train_loss": -40.11013412475586, "global_step": 155240, "epoch": 1282} {"train_loss": -40.44692611694336, "global_step": 155241, "epoch": 1282} {"train_loss": -39.687430957132136, "global_step": 155242, "epoch": 1282, "val_loss": 2595553.0} {"train_loss": -40.6419792175293, "global_step": 155243, "epoch": 1283} {"train_loss": -41.150306701660156, "global_step": 155244, "epoch": 1283} {"train_loss": -40.62640380859375, "global_step": 155245, "epoch": 1283} {"train_loss": -40.64900588989258, "global_step": 155246, "epoch": 1283} {"train_loss": -40.58384323120117, "global_step": 155247, "epoch": 1283} {"train_loss": -41.0144157409668, "global_step": 155248, "epoch": 1283} {"train_loss": -40.9603271484375, "global_step": 155249, "epoch": 1283} {"train_loss": -40.9100456237793, "global_step": 155250, "epoch": 1283} {"train_loss": -39.74773025512695, "global_step": 155251, "epoch": 1283} {"train_loss": -41.19349670410156, "global_step": 155252, "epoch": 1283} {"train_loss": -40.20881271362305, "global_step": 155253, "epoch": 1283} {"train_loss": -41.06509017944336, "global_step": 155254, "epoch": 1283} {"train_loss": -39.54244613647461, "global_step": 155255, "epoch": 1283} {"train_loss": -39.36310958862305, "global_step": 155256, "epoch": 1283} {"train_loss": -40.82914733886719, "global_step": 155257, "epoch": 1283} {"train_loss": -40.899898529052734, "global_step": 155258, "epoch": 1283} {"train_loss": -38.688167572021484, "global_step": 155259, "epoch": 1283} {"train_loss": -40.3101806640625, "global_step": 155260, "epoch": 1283} {"train_loss": -37.234920501708984, "global_step": 155261, "epoch": 1283} {"train_loss": -40.529884338378906, "global_step": 155262, "epoch": 1283} {"train_loss": -39.07912826538086, "global_step": 155263, "epoch": 1283} {"train_loss": -32.41635513305664, "global_step": 155264, "epoch": 1283} {"train_loss": -38.86500549316406, "global_step": 155265, "epoch": 1283} {"train_loss": -40.579978942871094, "global_step": 155266, "epoch": 1283} {"train_loss": -38.39945602416992, "global_step": 155267, "epoch": 1283} {"train_loss": -36.96721267700195, "global_step": 155268, "epoch": 1283} {"train_loss": -38.85073471069336, "global_step": 155269, "epoch": 1283} {"train_loss": -38.195068359375, "global_step": 155270, "epoch": 1283} {"train_loss": -37.8504524230957, "global_step": 155271, "epoch": 1283} {"train_loss": -37.14423751831055, "global_step": 155272, "epoch": 1283} {"train_loss": -36.39252471923828, "global_step": 155273, "epoch": 1283} {"train_loss": -35.90625762939453, "global_step": 155274, "epoch": 1283} {"train_loss": -36.75899887084961, "global_step": 155275, "epoch": 1283} {"train_loss": -37.56768798828125, "global_step": 155276, "epoch": 1283} {"train_loss": -34.75395202636719, "global_step": 155277, "epoch": 1283} {"train_loss": -36.97136688232422, "global_step": 155278, "epoch": 1283} {"train_loss": -37.620391845703125, "global_step": 155279, "epoch": 1283} {"train_loss": -39.20903396606445, "global_step": 155280, "epoch": 1283} {"train_loss": -29.377531051635742, "global_step": 155281, "epoch": 1283} {"train_loss": -37.21486282348633, "global_step": 155282, "epoch": 1283} {"train_loss": -36.4420051574707, "global_step": 155283, "epoch": 1283} {"train_loss": -34.0968017578125, "global_step": 155284, "epoch": 1283} {"train_loss": -31.98322868347168, "global_step": 155285, "epoch": 1283} {"train_loss": -34.258663177490234, "global_step": 155286, "epoch": 1283} {"train_loss": -35.942440032958984, "global_step": 155287, "epoch": 1283} {"train_loss": -38.69363021850586, "global_step": 155288, "epoch": 1283} {"train_loss": -36.4044075012207, "global_step": 155289, "epoch": 1283} {"train_loss": -32.755943298339844, "global_step": 155290, "epoch": 1283} {"train_loss": -37.268592834472656, "global_step": 155291, "epoch": 1283} {"train_loss": -37.91429138183594, "global_step": 155292, "epoch": 1283} {"train_loss": -37.95351028442383, "global_step": 155293, "epoch": 1283} {"train_loss": -36.471923828125, "global_step": 155294, "epoch": 1283} {"train_loss": -37.45786666870117, "global_step": 155295, "epoch": 1283} {"train_loss": -37.78248977661133, "global_step": 155296, "epoch": 1283} {"train_loss": -36.12581253051758, "global_step": 155297, "epoch": 1283} {"train_loss": -36.49979782104492, "global_step": 155298, "epoch": 1283} {"train_loss": -38.25297164916992, "global_step": 155299, "epoch": 1283} {"train_loss": -37.71310043334961, "global_step": 155300, "epoch": 1283} {"train_loss": -36.483917236328125, "global_step": 155301, "epoch": 1283} {"train_loss": -36.9501838684082, "global_step": 155302, "epoch": 1283} {"train_loss": -38.16913604736328, "global_step": 155303, "epoch": 1283} {"train_loss": -38.764190673828125, "global_step": 155304, "epoch": 1283} {"train_loss": -37.42120361328125, "global_step": 155305, "epoch": 1283} {"train_loss": -37.06426239013672, "global_step": 155306, "epoch": 1283} {"train_loss": -37.64710235595703, "global_step": 155307, "epoch": 1283} {"train_loss": -36.56767654418945, "global_step": 155308, "epoch": 1283} {"train_loss": -38.09124755859375, "global_step": 155309, "epoch": 1283} {"train_loss": -38.94907760620117, "global_step": 155310, "epoch": 1283} {"train_loss": -38.49976348876953, "global_step": 155311, "epoch": 1283} {"train_loss": -38.1118278503418, "global_step": 155312, "epoch": 1283} {"train_loss": -39.41941452026367, "global_step": 155313, "epoch": 1283} {"train_loss": -39.05353546142578, "global_step": 155314, "epoch": 1283} {"train_loss": -37.79863357543945, "global_step": 155315, "epoch": 1283} {"train_loss": -38.64582443237305, "global_step": 155316, "epoch": 1283} {"train_loss": -38.302345275878906, "global_step": 155317, "epoch": 1283} {"train_loss": -38.97758102416992, "global_step": 155318, "epoch": 1283} {"train_loss": -38.80452346801758, "global_step": 155319, "epoch": 1283} {"train_loss": -38.6331901550293, "global_step": 155320, "epoch": 1283} {"train_loss": -38.825653076171875, "global_step": 155321, "epoch": 1283} {"train_loss": -39.27893829345703, "global_step": 155322, "epoch": 1283} {"train_loss": -39.1392822265625, "global_step": 155323, "epoch": 1283} {"train_loss": -38.8142204284668, "global_step": 155324, "epoch": 1283} {"train_loss": -38.98121643066406, "global_step": 155325, "epoch": 1283} {"train_loss": -39.64478302001953, "global_step": 155326, "epoch": 1283} {"train_loss": -38.97353744506836, "global_step": 155327, "epoch": 1283} {"train_loss": -38.1950569152832, "global_step": 155328, "epoch": 1283} {"train_loss": -39.08466720581055, "global_step": 155329, "epoch": 1283} {"train_loss": -38.31252670288086, "global_step": 155330, "epoch": 1283} {"train_loss": -39.48408889770508, "global_step": 155331, "epoch": 1283} {"train_loss": -39.5737190246582, "global_step": 155332, "epoch": 1283} {"train_loss": -39.27185821533203, "global_step": 155333, "epoch": 1283} {"train_loss": -39.606475830078125, "global_step": 155334, "epoch": 1283} {"train_loss": -39.574520111083984, "global_step": 155335, "epoch": 1283} {"train_loss": -39.697113037109375, "global_step": 155336, "epoch": 1283} {"train_loss": -39.67815017700195, "global_step": 155337, "epoch": 1283} {"train_loss": -39.272369384765625, "global_step": 155338, "epoch": 1283} {"train_loss": -38.98629379272461, "global_step": 155339, "epoch": 1283} {"train_loss": -39.98456954956055, "global_step": 155340, "epoch": 1283} {"train_loss": -39.10044479370117, "global_step": 155341, "epoch": 1283} {"train_loss": -39.81936264038086, "global_step": 155342, "epoch": 1283} {"train_loss": -39.96125030517578, "global_step": 155343, "epoch": 1283} {"train_loss": -39.85764694213867, "global_step": 155344, "epoch": 1283} {"train_loss": -39.99811553955078, "global_step": 155345, "epoch": 1283} {"train_loss": -39.388938903808594, "global_step": 155346, "epoch": 1283} {"train_loss": -40.29024887084961, "global_step": 155347, "epoch": 1283} {"train_loss": -39.509647369384766, "global_step": 155348, "epoch": 1283} {"train_loss": -39.791988372802734, "global_step": 155349, "epoch": 1283} {"train_loss": -38.99885177612305, "global_step": 155350, "epoch": 1283} {"train_loss": -40.33005142211914, "global_step": 155351, "epoch": 1283} {"train_loss": -39.679908752441406, "global_step": 155352, "epoch": 1283} {"train_loss": -40.29561233520508, "global_step": 155353, "epoch": 1283} {"train_loss": -40.28099822998047, "global_step": 155354, "epoch": 1283} {"train_loss": -40.2529296875, "global_step": 155355, "epoch": 1283} {"train_loss": -40.22338104248047, "global_step": 155356, "epoch": 1283} {"train_loss": -39.78753662109375, "global_step": 155357, "epoch": 1283} {"train_loss": -39.51996612548828, "global_step": 155358, "epoch": 1283} {"train_loss": -39.92703628540039, "global_step": 155359, "epoch": 1283} {"train_loss": -40.58732986450195, "global_step": 155360, "epoch": 1283} {"train_loss": -40.52009201049805, "global_step": 155361, "epoch": 1283} {"train_loss": -40.6525993347168, "global_step": 155362, "epoch": 1283} {"train_loss": -38.56700263535681, "global_step": 155363, "epoch": 1283, "val_loss": 2669300.25} {"train_loss": -40.32477569580078, "global_step": 155364, "epoch": 1284} {"train_loss": -40.686527252197266, "global_step": 155365, "epoch": 1284} {"train_loss": -40.18446731567383, "global_step": 155366, "epoch": 1284} {"train_loss": -40.80049133300781, "global_step": 155367, "epoch": 1284} {"train_loss": -40.31328201293945, "global_step": 155368, "epoch": 1284} {"train_loss": -40.4995231628418, "global_step": 155369, "epoch": 1284} {"train_loss": -40.67151641845703, "global_step": 155370, "epoch": 1284} {"train_loss": -40.411380767822266, "global_step": 155371, "epoch": 1284} {"train_loss": -40.72721862792969, "global_step": 155372, "epoch": 1284} {"train_loss": -40.288970947265625, "global_step": 155373, "epoch": 1284} {"train_loss": -40.67751693725586, "global_step": 155374, "epoch": 1284} {"train_loss": -41.0268669128418, "global_step": 155375, "epoch": 1284} {"train_loss": -40.76072311401367, "global_step": 155376, "epoch": 1284} {"train_loss": -41.07442855834961, "global_step": 155377, "epoch": 1284} {"train_loss": -40.28054428100586, "global_step": 155378, "epoch": 1284} {"train_loss": -40.67148971557617, "global_step": 155379, "epoch": 1284} {"train_loss": -40.32624435424805, "global_step": 155380, "epoch": 1284} {"train_loss": -40.426448822021484, "global_step": 155381, "epoch": 1284} {"train_loss": -40.03043746948242, "global_step": 155382, "epoch": 1284} {"train_loss": -39.899837493896484, "global_step": 155383, "epoch": 1284} {"train_loss": -39.790740966796875, "global_step": 155384, "epoch": 1284} {"train_loss": -40.276573181152344, "global_step": 155385, "epoch": 1284} {"train_loss": -40.10408401489258, "global_step": 155386, "epoch": 1284} {"train_loss": -38.307308197021484, "global_step": 155387, "epoch": 1284} {"train_loss": -37.275455474853516, "global_step": 155388, "epoch": 1284} {"train_loss": -38.401912689208984, "global_step": 155389, "epoch": 1284} {"train_loss": -40.01837921142578, "global_step": 155390, "epoch": 1284} {"train_loss": -41.08863067626953, "global_step": 155391, "epoch": 1284} {"train_loss": -40.06034469604492, "global_step": 155392, "epoch": 1284} {"train_loss": -39.40140151977539, "global_step": 155393, "epoch": 1284} {"train_loss": -38.9508171081543, "global_step": 155394, "epoch": 1284} {"train_loss": -39.10301971435547, "global_step": 155395, "epoch": 1284} {"train_loss": -38.940677642822266, "global_step": 155396, "epoch": 1284} {"train_loss": -39.538875579833984, "global_step": 155397, "epoch": 1284} {"train_loss": -40.41763687133789, "global_step": 155398, "epoch": 1284} {"train_loss": -40.00755310058594, "global_step": 155399, "epoch": 1284} {"train_loss": -40.4096565246582, "global_step": 155400, "epoch": 1284} {"train_loss": -40.0072135925293, "global_step": 155401, "epoch": 1284} {"train_loss": -39.53764343261719, "global_step": 155402, "epoch": 1284} {"train_loss": -39.20808029174805, "global_step": 155403, "epoch": 1284} {"train_loss": -39.28406524658203, "global_step": 155404, "epoch": 1284} {"train_loss": -39.84797286987305, "global_step": 155405, "epoch": 1284} {"train_loss": -40.334571838378906, "global_step": 155406, "epoch": 1284} {"train_loss": -40.70973205566406, "global_step": 155407, "epoch": 1284} {"train_loss": -38.48229217529297, "global_step": 155408, "epoch": 1284} {"train_loss": -39.6151237487793, "global_step": 155409, "epoch": 1284} {"train_loss": -35.846561431884766, "global_step": 155410, "epoch": 1284} {"train_loss": -35.167083740234375, "global_step": 155411, "epoch": 1284} {"train_loss": -35.001380920410156, "global_step": 155412, "epoch": 1284} {"train_loss": -28.34620475769043, "global_step": 155413, "epoch": 1284} {"train_loss": -35.27664566040039, "global_step": 155414, "epoch": 1284} {"train_loss": -31.725446701049805, "global_step": 155415, "epoch": 1284} {"train_loss": -36.65385055541992, "global_step": 155416, "epoch": 1284} {"train_loss": -32.879417419433594, "global_step": 155417, "epoch": 1284} {"train_loss": -36.94196701049805, "global_step": 155418, "epoch": 1284} {"train_loss": -36.92426681518555, "global_step": 155419, "epoch": 1284} {"train_loss": -36.37268829345703, "global_step": 155420, "epoch": 1284} {"train_loss": -37.1826286315918, "global_step": 155421, "epoch": 1284} {"train_loss": -38.07135009765625, "global_step": 155422, "epoch": 1284} {"train_loss": -37.37345504760742, "global_step": 155423, "epoch": 1284} {"train_loss": -38.809173583984375, "global_step": 155424, "epoch": 1284} {"train_loss": -39.79233932495117, "global_step": 155425, "epoch": 1284} {"train_loss": -37.8966178894043, "global_step": 155426, "epoch": 1284} {"train_loss": -39.40296173095703, "global_step": 155427, "epoch": 1284} {"train_loss": -39.291080474853516, "global_step": 155428, "epoch": 1284} {"train_loss": -39.239662170410156, "global_step": 155429, "epoch": 1284} {"train_loss": -37.842655181884766, "global_step": 155430, "epoch": 1284} {"train_loss": -40.250972747802734, "global_step": 155431, "epoch": 1284} {"train_loss": -39.229957580566406, "global_step": 155432, "epoch": 1284} {"train_loss": -39.58445358276367, "global_step": 155433, "epoch": 1284} {"train_loss": -38.76365280151367, "global_step": 155434, "epoch": 1284} {"train_loss": -39.9932861328125, "global_step": 155435, "epoch": 1284} {"train_loss": -39.52281951904297, "global_step": 155436, "epoch": 1284} {"train_loss": -39.083091735839844, "global_step": 155437, "epoch": 1284} {"train_loss": -38.69051742553711, "global_step": 155438, "epoch": 1284} {"train_loss": -39.27244186401367, "global_step": 155439, "epoch": 1284} {"train_loss": -39.82956314086914, "global_step": 155440, "epoch": 1284} {"train_loss": -38.94684982299805, "global_step": 155441, "epoch": 1284} {"train_loss": -39.47275924682617, "global_step": 155442, "epoch": 1284} {"train_loss": -40.45661544799805, "global_step": 155443, "epoch": 1284} {"train_loss": -40.600013732910156, "global_step": 155444, "epoch": 1284} {"train_loss": -40.46181869506836, "global_step": 155445, "epoch": 1284} {"train_loss": -40.10165023803711, "global_step": 155446, "epoch": 1284} {"train_loss": -40.34132766723633, "global_step": 155447, "epoch": 1284} {"train_loss": -40.201629638671875, "global_step": 155448, "epoch": 1284} {"train_loss": -39.062232971191406, "global_step": 155449, "epoch": 1284} {"train_loss": -40.039485931396484, "global_step": 155450, "epoch": 1284} {"train_loss": -39.44255447387695, "global_step": 155451, "epoch": 1284} {"train_loss": -39.920196533203125, "global_step": 155452, "epoch": 1284} {"train_loss": -40.289520263671875, "global_step": 155453, "epoch": 1284} {"train_loss": -40.830074310302734, "global_step": 155454, "epoch": 1284} {"train_loss": -40.364646911621094, "global_step": 155455, "epoch": 1284} {"train_loss": -40.1863899230957, "global_step": 155456, "epoch": 1284} {"train_loss": -40.11220932006836, "global_step": 155457, "epoch": 1284} {"train_loss": -40.60860061645508, "global_step": 155458, "epoch": 1284} {"train_loss": -40.7774772644043, "global_step": 155459, "epoch": 1284} {"train_loss": -40.36661911010742, "global_step": 155460, "epoch": 1284} {"train_loss": -40.56657028198242, "global_step": 155461, "epoch": 1284} {"train_loss": -41.037349700927734, "global_step": 155462, "epoch": 1284} {"train_loss": -41.024295806884766, "global_step": 155463, "epoch": 1284} {"train_loss": -38.90796661376953, "global_step": 155464, "epoch": 1284} {"train_loss": -39.70719909667969, "global_step": 155465, "epoch": 1284} {"train_loss": -40.4752197265625, "global_step": 155466, "epoch": 1284} {"train_loss": -40.77704620361328, "global_step": 155467, "epoch": 1284} {"train_loss": -40.10093688964844, "global_step": 155468, "epoch": 1284} {"train_loss": -40.16564178466797, "global_step": 155469, "epoch": 1284} {"train_loss": -41.07297897338867, "global_step": 155470, "epoch": 1284} {"train_loss": -40.80801010131836, "global_step": 155471, "epoch": 1284} {"train_loss": -40.79976272583008, "global_step": 155472, "epoch": 1284} {"train_loss": -40.46610641479492, "global_step": 155473, "epoch": 1284} {"train_loss": -40.4246711730957, "global_step": 155474, "epoch": 1284} {"train_loss": -41.132232666015625, "global_step": 155475, "epoch": 1284} {"train_loss": -39.81440353393555, "global_step": 155476, "epoch": 1284} {"train_loss": -39.136741638183594, "global_step": 155477, "epoch": 1284} {"train_loss": -40.81882858276367, "global_step": 155478, "epoch": 1284} {"train_loss": -40.37126541137695, "global_step": 155479, "epoch": 1284} {"train_loss": -40.93756103515625, "global_step": 155480, "epoch": 1284} {"train_loss": -41.22004318237305, "global_step": 155481, "epoch": 1284} {"train_loss": -39.99870300292969, "global_step": 155482, "epoch": 1284} {"train_loss": -40.45052719116211, "global_step": 155483, "epoch": 1284} {"train_loss": -39.45182204443561, "global_step": 155484, "epoch": 1284, "val_loss": 2695240.75} {"train_loss": -38.99080276489258, "global_step": 155485, "epoch": 1285} {"train_loss": -40.878292083740234, "global_step": 155486, "epoch": 1285} {"train_loss": -40.617950439453125, "global_step": 155487, "epoch": 1285} {"train_loss": -40.76583480834961, "global_step": 155488, "epoch": 1285} {"train_loss": -40.1749382019043, "global_step": 155489, "epoch": 1285} {"train_loss": -40.53255844116211, "global_step": 155490, "epoch": 1285} {"train_loss": -40.68558883666992, "global_step": 155491, "epoch": 1285} {"train_loss": -41.46092987060547, "global_step": 155492, "epoch": 1285} {"train_loss": -40.921573638916016, "global_step": 155493, "epoch": 1285} {"train_loss": -40.88193130493164, "global_step": 155494, "epoch": 1285} {"train_loss": -41.2495231628418, "global_step": 155495, "epoch": 1285} {"train_loss": -39.46009063720703, "global_step": 155496, "epoch": 1285} {"train_loss": -41.21127700805664, "global_step": 155497, "epoch": 1285} {"train_loss": -40.9296989440918, "global_step": 155498, "epoch": 1285} {"train_loss": -40.55403137207031, "global_step": 155499, "epoch": 1285} {"train_loss": -41.172157287597656, "global_step": 155500, "epoch": 1285} {"train_loss": -40.02677536010742, "global_step": 155501, "epoch": 1285} {"train_loss": -40.060890197753906, "global_step": 155502, "epoch": 1285} {"train_loss": -37.474910736083984, "global_step": 155503, "epoch": 1285} {"train_loss": -36.300533294677734, "global_step": 155504, "epoch": 1285} {"train_loss": -36.34196090698242, "global_step": 155505, "epoch": 1285} {"train_loss": -37.0623779296875, "global_step": 155506, "epoch": 1285} {"train_loss": -39.06037139892578, "global_step": 155507, "epoch": 1285} {"train_loss": -37.55449295043945, "global_step": 155508, "epoch": 1285} {"train_loss": -34.11620330810547, "global_step": 155509, "epoch": 1285} {"train_loss": -34.0201530456543, "global_step": 155510, "epoch": 1285} {"train_loss": -39.49030685424805, "global_step": 155511, "epoch": 1285} {"train_loss": -37.7320556640625, "global_step": 155512, "epoch": 1285} {"train_loss": -36.544246673583984, "global_step": 155513, "epoch": 1285} {"train_loss": -39.4891471862793, "global_step": 155514, "epoch": 1285} {"train_loss": -34.437076568603516, "global_step": 155515, "epoch": 1285} {"train_loss": -32.807735443115234, "global_step": 155516, "epoch": 1285} {"train_loss": -39.56002426147461, "global_step": 155517, "epoch": 1285} {"train_loss": -33.304256439208984, "global_step": 155518, "epoch": 1285} {"train_loss": -37.039608001708984, "global_step": 155519, "epoch": 1285} {"train_loss": -37.089019775390625, "global_step": 155520, "epoch": 1285} {"train_loss": -37.1500358581543, "global_step": 155521, "epoch": 1285} {"train_loss": -36.468788146972656, "global_step": 155522, "epoch": 1285} {"train_loss": -32.4175910949707, "global_step": 155523, "epoch": 1285} {"train_loss": -37.896724700927734, "global_step": 155524, "epoch": 1285} {"train_loss": -38.5160026550293, "global_step": 155525, "epoch": 1285} {"train_loss": -39.02106857299805, "global_step": 155526, "epoch": 1285} {"train_loss": -34.69258499145508, "global_step": 155527, "epoch": 1285} {"train_loss": -35.85883331298828, "global_step": 155528, "epoch": 1285} {"train_loss": -38.11785125732422, "global_step": 155529, "epoch": 1285} {"train_loss": -37.45998764038086, "global_step": 155530, "epoch": 1285} {"train_loss": -38.312923431396484, "global_step": 155531, "epoch": 1285} {"train_loss": -39.25655746459961, "global_step": 155532, "epoch": 1285} {"train_loss": -37.54282760620117, "global_step": 155533, "epoch": 1285} {"train_loss": -37.510250091552734, "global_step": 155534, "epoch": 1285} {"train_loss": -37.86353302001953, "global_step": 155535, "epoch": 1285} {"train_loss": -38.10896682739258, "global_step": 155536, "epoch": 1285} {"train_loss": -38.57632064819336, "global_step": 155537, "epoch": 1285} {"train_loss": -38.38074493408203, "global_step": 155538, "epoch": 1285} {"train_loss": -39.905242919921875, "global_step": 155539, "epoch": 1285} {"train_loss": -38.362728118896484, "global_step": 155540, "epoch": 1285} {"train_loss": -39.429378509521484, "global_step": 155541, "epoch": 1285} {"train_loss": -40.22589874267578, "global_step": 155542, "epoch": 1285} {"train_loss": -36.163330078125, "global_step": 155543, "epoch": 1285} {"train_loss": -39.2786750793457, "global_step": 155544, "epoch": 1285} {"train_loss": -36.10421371459961, "global_step": 155545, "epoch": 1285} {"train_loss": -39.19234085083008, "global_step": 155546, "epoch": 1285} {"train_loss": -39.67478942871094, "global_step": 155547, "epoch": 1285} {"train_loss": -37.59519577026367, "global_step": 155548, "epoch": 1285} {"train_loss": -37.090171813964844, "global_step": 155549, "epoch": 1285} {"train_loss": -38.60042953491211, "global_step": 155550, "epoch": 1285} {"train_loss": -37.92430114746094, "global_step": 155551, "epoch": 1285} {"train_loss": -38.420867919921875, "global_step": 155552, "epoch": 1285} {"train_loss": -35.205101013183594, "global_step": 155553, "epoch": 1285} {"train_loss": -39.96443176269531, "global_step": 155554, "epoch": 1285} {"train_loss": -38.71836471557617, "global_step": 155555, "epoch": 1285} {"train_loss": -39.34407424926758, "global_step": 155556, "epoch": 1285} {"train_loss": -39.453182220458984, "global_step": 155557, "epoch": 1285} {"train_loss": -39.52909851074219, "global_step": 155558, "epoch": 1285} {"train_loss": -38.6561164855957, "global_step": 155559, "epoch": 1285} {"train_loss": -38.62651062011719, "global_step": 155560, "epoch": 1285} {"train_loss": -39.55195236206055, "global_step": 155561, "epoch": 1285} {"train_loss": -38.3418083190918, "global_step": 155562, "epoch": 1285} {"train_loss": -38.72651290893555, "global_step": 155563, "epoch": 1285} {"train_loss": -37.58338165283203, "global_step": 155564, "epoch": 1285} {"train_loss": -39.062835693359375, "global_step": 155565, "epoch": 1285} {"train_loss": -40.27423095703125, "global_step": 155566, "epoch": 1285} {"train_loss": -38.4129753112793, "global_step": 155567, "epoch": 1285} {"train_loss": -40.10900115966797, "global_step": 155568, "epoch": 1285} {"train_loss": -39.5018310546875, "global_step": 155569, "epoch": 1285} {"train_loss": -38.5562858581543, "global_step": 155570, "epoch": 1285} {"train_loss": -39.68710708618164, "global_step": 155571, "epoch": 1285} {"train_loss": -39.02915573120117, "global_step": 155572, "epoch": 1285} {"train_loss": -38.624141693115234, "global_step": 155573, "epoch": 1285} {"train_loss": -37.76243209838867, "global_step": 155574, "epoch": 1285} {"train_loss": -39.894893646240234, "global_step": 155575, "epoch": 1285} {"train_loss": -39.37165451049805, "global_step": 155576, "epoch": 1285} {"train_loss": -38.9757194519043, "global_step": 155577, "epoch": 1285} {"train_loss": -39.69493865966797, "global_step": 155578, "epoch": 1285} {"train_loss": -39.5879020690918, "global_step": 155579, "epoch": 1285} {"train_loss": -39.61904525756836, "global_step": 155580, "epoch": 1285} {"train_loss": -39.38199234008789, "global_step": 155581, "epoch": 1285} {"train_loss": -39.89173126220703, "global_step": 155582, "epoch": 1285} {"train_loss": -40.452484130859375, "global_step": 155583, "epoch": 1285} {"train_loss": -39.956520080566406, "global_step": 155584, "epoch": 1285} {"train_loss": -39.17267990112305, "global_step": 155585, "epoch": 1285} {"train_loss": -39.350791931152344, "global_step": 155586, "epoch": 1285} {"train_loss": -40.08153533935547, "global_step": 155587, "epoch": 1285} {"train_loss": -39.60279846191406, "global_step": 155588, "epoch": 1285} {"train_loss": -40.343013763427734, "global_step": 155589, "epoch": 1285} {"train_loss": -39.690589904785156, "global_step": 155590, "epoch": 1285} {"train_loss": -40.25522994995117, "global_step": 155591, "epoch": 1285} {"train_loss": -40.475345611572266, "global_step": 155592, "epoch": 1285} {"train_loss": -40.08028793334961, "global_step": 155593, "epoch": 1285} {"train_loss": -40.58864974975586, "global_step": 155594, "epoch": 1285} {"train_loss": -40.65496826171875, "global_step": 155595, "epoch": 1285} {"train_loss": -40.49376678466797, "global_step": 155596, "epoch": 1285} {"train_loss": -39.85930252075195, "global_step": 155597, "epoch": 1285} {"train_loss": -40.093746185302734, "global_step": 155598, "epoch": 1285} {"train_loss": -40.630287170410156, "global_step": 155599, "epoch": 1285} {"train_loss": -40.31182098388672, "global_step": 155600, "epoch": 1285} {"train_loss": -39.97431564331055, "global_step": 155601, "epoch": 1285} {"train_loss": -40.09726333618164, "global_step": 155602, "epoch": 1285} {"train_loss": -40.20549392700195, "global_step": 155603, "epoch": 1285} {"train_loss": -40.710121154785156, "global_step": 155604, "epoch": 1285} {"train_loss": -38.80581463269951, "global_step": 155605, "epoch": 1285, "val_loss": 2489672.25} {"train_loss": -40.5988883972168, "global_step": 155606, "epoch": 1286} {"train_loss": -40.02550506591797, "global_step": 155607, "epoch": 1286} {"train_loss": -40.525634765625, "global_step": 155608, "epoch": 1286} {"train_loss": -41.28057098388672, "global_step": 155609, "epoch": 1286} {"train_loss": -41.33056640625, "global_step": 155610, "epoch": 1286} {"train_loss": -41.26399612426758, "global_step": 155611, "epoch": 1286} {"train_loss": -40.54001998901367, "global_step": 155612, "epoch": 1286} {"train_loss": -41.3381462097168, "global_step": 155613, "epoch": 1286} {"train_loss": -41.1091423034668, "global_step": 155614, "epoch": 1286} {"train_loss": -41.21432113647461, "global_step": 155615, "epoch": 1286} {"train_loss": -41.211483001708984, "global_step": 155616, "epoch": 1286} {"train_loss": -40.570125579833984, "global_step": 155617, "epoch": 1286} {"train_loss": -40.351924896240234, "global_step": 155618, "epoch": 1286} {"train_loss": -40.09147262573242, "global_step": 155619, "epoch": 1286} {"train_loss": -40.01218795776367, "global_step": 155620, "epoch": 1286} {"train_loss": -40.25392532348633, "global_step": 155621, "epoch": 1286} {"train_loss": -38.83831787109375, "global_step": 155622, "epoch": 1286} {"train_loss": -37.602203369140625, "global_step": 155623, "epoch": 1286} {"train_loss": -36.67421340942383, "global_step": 155624, "epoch": 1286} {"train_loss": -37.60002517700195, "global_step": 155625, "epoch": 1286} {"train_loss": -40.273258209228516, "global_step": 155626, "epoch": 1286} {"train_loss": -40.027347564697266, "global_step": 155627, "epoch": 1286} {"train_loss": -39.8477897644043, "global_step": 155628, "epoch": 1286} {"train_loss": -37.53447723388672, "global_step": 155629, "epoch": 1286} {"train_loss": -37.718788146972656, "global_step": 155630, "epoch": 1286} {"train_loss": -40.274837493896484, "global_step": 155631, "epoch": 1286} {"train_loss": -38.854591369628906, "global_step": 155632, "epoch": 1286} {"train_loss": -37.470577239990234, "global_step": 155633, "epoch": 1286} {"train_loss": -39.05389404296875, "global_step": 155634, "epoch": 1286} {"train_loss": -39.42558670043945, "global_step": 155635, "epoch": 1286} {"train_loss": -39.00382614135742, "global_step": 155636, "epoch": 1286} {"train_loss": -39.388145446777344, "global_step": 155637, "epoch": 1286} {"train_loss": -40.3406867980957, "global_step": 155638, "epoch": 1286} {"train_loss": -40.39455032348633, "global_step": 155639, "epoch": 1286} {"train_loss": -40.10529327392578, "global_step": 155640, "epoch": 1286} {"train_loss": -40.62641906738281, "global_step": 155641, "epoch": 1286} {"train_loss": -40.10151290893555, "global_step": 155642, "epoch": 1286} {"train_loss": -39.81040573120117, "global_step": 155643, "epoch": 1286} {"train_loss": -40.38030242919922, "global_step": 155644, "epoch": 1286} {"train_loss": -40.35190200805664, "global_step": 155645, "epoch": 1286} {"train_loss": -40.03971862792969, "global_step": 155646, "epoch": 1286} {"train_loss": -40.96754837036133, "global_step": 155647, "epoch": 1286} {"train_loss": -40.45441436767578, "global_step": 155648, "epoch": 1286} {"train_loss": -39.2662467956543, "global_step": 155649, "epoch": 1286} {"train_loss": -40.4832878112793, "global_step": 155650, "epoch": 1286} {"train_loss": -40.65958786010742, "global_step": 155651, "epoch": 1286} {"train_loss": -40.321624755859375, "global_step": 155652, "epoch": 1286} {"train_loss": -39.434444427490234, "global_step": 155653, "epoch": 1286} {"train_loss": -39.91396713256836, "global_step": 155654, "epoch": 1286} {"train_loss": -40.98817825317383, "global_step": 155655, "epoch": 1286} {"train_loss": -38.9601936340332, "global_step": 155656, "epoch": 1286} {"train_loss": -37.705047607421875, "global_step": 155657, "epoch": 1286} {"train_loss": -40.078121185302734, "global_step": 155658, "epoch": 1286} {"train_loss": -40.4876823425293, "global_step": 155659, "epoch": 1286} {"train_loss": -39.90057373046875, "global_step": 155660, "epoch": 1286} {"train_loss": -40.070640563964844, "global_step": 155661, "epoch": 1286} {"train_loss": -37.27606964111328, "global_step": 155662, "epoch": 1286} {"train_loss": -34.81781005859375, "global_step": 155663, "epoch": 1286} {"train_loss": -35.198463439941406, "global_step": 155664, "epoch": 1286} {"train_loss": -36.02546310424805, "global_step": 155665, "epoch": 1286} {"train_loss": -40.60600662231445, "global_step": 155666, "epoch": 1286} {"train_loss": -38.21464157104492, "global_step": 155667, "epoch": 1286} {"train_loss": -39.63859176635742, "global_step": 155668, "epoch": 1286} {"train_loss": -40.537593841552734, "global_step": 155669, "epoch": 1286} {"train_loss": -39.91626739501953, "global_step": 155670, "epoch": 1286} {"train_loss": -40.70402908325195, "global_step": 155671, "epoch": 1286} {"train_loss": -40.59275436401367, "global_step": 155672, "epoch": 1286} {"train_loss": -40.48298263549805, "global_step": 155673, "epoch": 1286} {"train_loss": -40.74617385864258, "global_step": 155674, "epoch": 1286} {"train_loss": -40.71028137207031, "global_step": 155675, "epoch": 1286} {"train_loss": -39.8927001953125, "global_step": 155676, "epoch": 1286} {"train_loss": -40.64655685424805, "global_step": 155677, "epoch": 1286} {"train_loss": -40.442176818847656, "global_step": 155678, "epoch": 1286} {"train_loss": -40.79947280883789, "global_step": 155679, "epoch": 1286} {"train_loss": -39.897605895996094, "global_step": 155680, "epoch": 1286} {"train_loss": -40.77183151245117, "global_step": 155681, "epoch": 1286} {"train_loss": -39.392181396484375, "global_step": 155682, "epoch": 1286} {"train_loss": -41.14411544799805, "global_step": 155683, "epoch": 1286} {"train_loss": -41.0013542175293, "global_step": 155684, "epoch": 1286} {"train_loss": -41.218387603759766, "global_step": 155685, "epoch": 1286} {"train_loss": -40.218788146972656, "global_step": 155686, "epoch": 1286} {"train_loss": -40.80315017700195, "global_step": 155687, "epoch": 1286} {"train_loss": -41.293025970458984, "global_step": 155688, "epoch": 1286} {"train_loss": -40.9138298034668, "global_step": 155689, "epoch": 1286} {"train_loss": -40.70697784423828, "global_step": 155690, "epoch": 1286} {"train_loss": -40.99933624267578, "global_step": 155691, "epoch": 1286} {"train_loss": -41.13243103027344, "global_step": 155692, "epoch": 1286} {"train_loss": -40.431793212890625, "global_step": 155693, "epoch": 1286} {"train_loss": -40.420570373535156, "global_step": 155694, "epoch": 1286} {"train_loss": -40.86920928955078, "global_step": 155695, "epoch": 1286} {"train_loss": -40.58784103393555, "global_step": 155696, "epoch": 1286} {"train_loss": -40.51788330078125, "global_step": 155697, "epoch": 1286} {"train_loss": -40.45711898803711, "global_step": 155698, "epoch": 1286} {"train_loss": -36.8140754699707, "global_step": 155699, "epoch": 1286} {"train_loss": -40.40291213989258, "global_step": 155700, "epoch": 1286} {"train_loss": -36.92497253417969, "global_step": 155701, "epoch": 1286} {"train_loss": -37.52458190917969, "global_step": 155702, "epoch": 1286} {"train_loss": -39.45660400390625, "global_step": 155703, "epoch": 1286} {"train_loss": -40.31978988647461, "global_step": 155704, "epoch": 1286} {"train_loss": -39.4923095703125, "global_step": 155705, "epoch": 1286} {"train_loss": -40.46501541137695, "global_step": 155706, "epoch": 1286} {"train_loss": -40.59456253051758, "global_step": 155707, "epoch": 1286} {"train_loss": -40.090721130371094, "global_step": 155708, "epoch": 1286} {"train_loss": -39.208740234375, "global_step": 155709, "epoch": 1286} {"train_loss": -38.771427154541016, "global_step": 155710, "epoch": 1286} {"train_loss": -39.94849395751953, "global_step": 155711, "epoch": 1286} {"train_loss": -38.74708938598633, "global_step": 155712, "epoch": 1286} {"train_loss": -38.21434783935547, "global_step": 155713, "epoch": 1286} {"train_loss": -40.47561264038086, "global_step": 155714, "epoch": 1286} {"train_loss": -40.92668533325195, "global_step": 155715, "epoch": 1286} {"train_loss": -40.917171478271484, "global_step": 155716, "epoch": 1286} {"train_loss": -40.53243637084961, "global_step": 155717, "epoch": 1286} {"train_loss": -40.59757614135742, "global_step": 155718, "epoch": 1286} {"train_loss": -40.65737533569336, "global_step": 155719, "epoch": 1286} {"train_loss": -39.3521842956543, "global_step": 155720, "epoch": 1286} {"train_loss": -40.7010498046875, "global_step": 155721, "epoch": 1286} {"train_loss": -40.297279357910156, "global_step": 155722, "epoch": 1286} {"train_loss": -40.437129974365234, "global_step": 155723, "epoch": 1286} {"train_loss": -41.02642059326172, "global_step": 155724, "epoch": 1286} {"train_loss": -37.747047424316406, "global_step": 155725, "epoch": 1286} {"train_loss": -39.858804497837035, "global_step": 155726, "epoch": 1286, "val_loss": 2644229.0} {"train_loss": -37.69036865234375, "global_step": 155727, "epoch": 1287} {"train_loss": -40.0208740234375, "global_step": 155728, "epoch": 1287} {"train_loss": -40.09138488769531, "global_step": 155729, "epoch": 1287} {"train_loss": -40.58220672607422, "global_step": 155730, "epoch": 1287} {"train_loss": -40.340091705322266, "global_step": 155731, "epoch": 1287} {"train_loss": -40.7403450012207, "global_step": 155732, "epoch": 1287} {"train_loss": -38.87827682495117, "global_step": 155733, "epoch": 1287} {"train_loss": -41.156089782714844, "global_step": 155734, "epoch": 1287} {"train_loss": -39.60201644897461, "global_step": 155735, "epoch": 1287} {"train_loss": -34.39211654663086, "global_step": 155736, "epoch": 1287} {"train_loss": -38.95011520385742, "global_step": 155737, "epoch": 1287} {"train_loss": -39.10251998901367, "global_step": 155738, "epoch": 1287} {"train_loss": -38.83854293823242, "global_step": 155739, "epoch": 1287} {"train_loss": -39.77958297729492, "global_step": 155740, "epoch": 1287} {"train_loss": -40.411983489990234, "global_step": 155741, "epoch": 1287} {"train_loss": -39.823158264160156, "global_step": 155742, "epoch": 1287} {"train_loss": -38.55230712890625, "global_step": 155743, "epoch": 1287} {"train_loss": -39.91522979736328, "global_step": 155744, "epoch": 1287} {"train_loss": -39.96586990356445, "global_step": 155745, "epoch": 1287} {"train_loss": -39.73565673828125, "global_step": 155746, "epoch": 1287} {"train_loss": -39.48125076293945, "global_step": 155747, "epoch": 1287} {"train_loss": -39.032249450683594, "global_step": 155748, "epoch": 1287} {"train_loss": -36.79512405395508, "global_step": 155749, "epoch": 1287} {"train_loss": -37.56863784790039, "global_step": 155750, "epoch": 1287} {"train_loss": -36.80534744262695, "global_step": 155751, "epoch": 1287} {"train_loss": -36.83567810058594, "global_step": 155752, "epoch": 1287} {"train_loss": -39.17277908325195, "global_step": 155753, "epoch": 1287} {"train_loss": -37.59459686279297, "global_step": 155754, "epoch": 1287} {"train_loss": -39.4033203125, "global_step": 155755, "epoch": 1287} {"train_loss": -38.69742202758789, "global_step": 155756, "epoch": 1287} {"train_loss": -37.3509521484375, "global_step": 155757, "epoch": 1287} {"train_loss": -37.09025192260742, "global_step": 155758, "epoch": 1287} {"train_loss": -39.40970993041992, "global_step": 155759, "epoch": 1287} {"train_loss": -38.513519287109375, "global_step": 155760, "epoch": 1287} {"train_loss": -33.4766845703125, "global_step": 155761, "epoch": 1287} {"train_loss": -39.04395294189453, "global_step": 155762, "epoch": 1287} {"train_loss": -36.0331916809082, "global_step": 155763, "epoch": 1287} {"train_loss": -37.06922912597656, "global_step": 155764, "epoch": 1287} {"train_loss": -37.989009857177734, "global_step": 155765, "epoch": 1287} {"train_loss": -38.45280075073242, "global_step": 155766, "epoch": 1287} {"train_loss": -34.959083557128906, "global_step": 155767, "epoch": 1287} {"train_loss": -38.26537322998047, "global_step": 155768, "epoch": 1287} {"train_loss": -38.81812286376953, "global_step": 155769, "epoch": 1287} {"train_loss": -38.10770797729492, "global_step": 155770, "epoch": 1287} {"train_loss": -38.1148796081543, "global_step": 155771, "epoch": 1287} {"train_loss": -37.26786422729492, "global_step": 155772, "epoch": 1287} {"train_loss": -38.411170959472656, "global_step": 155773, "epoch": 1287} {"train_loss": -37.10901641845703, "global_step": 155774, "epoch": 1287} {"train_loss": -38.974029541015625, "global_step": 155775, "epoch": 1287} {"train_loss": -38.694549560546875, "global_step": 155776, "epoch": 1287} {"train_loss": -37.4176025390625, "global_step": 155777, "epoch": 1287} {"train_loss": -39.43659210205078, "global_step": 155778, "epoch": 1287} {"train_loss": -39.36085510253906, "global_step": 155779, "epoch": 1287} {"train_loss": -39.36385726928711, "global_step": 155780, "epoch": 1287} {"train_loss": -38.56581497192383, "global_step": 155781, "epoch": 1287} {"train_loss": -38.669490814208984, "global_step": 155782, "epoch": 1287} {"train_loss": -38.87977981567383, "global_step": 155783, "epoch": 1287} {"train_loss": -39.58476638793945, "global_step": 155784, "epoch": 1287} {"train_loss": -38.08961486816406, "global_step": 155785, "epoch": 1287} {"train_loss": -39.531951904296875, "global_step": 155786, "epoch": 1287} {"train_loss": -39.24861526489258, "global_step": 155787, "epoch": 1287} {"train_loss": -39.93098068237305, "global_step": 155788, "epoch": 1287} {"train_loss": -39.848731994628906, "global_step": 155789, "epoch": 1287} {"train_loss": -38.02431106567383, "global_step": 155790, "epoch": 1287} {"train_loss": -39.53882598876953, "global_step": 155791, "epoch": 1287} {"train_loss": -39.86233139038086, "global_step": 155792, "epoch": 1287} {"train_loss": -39.30397415161133, "global_step": 155793, "epoch": 1287} {"train_loss": -39.30622482299805, "global_step": 155794, "epoch": 1287} {"train_loss": -39.670467376708984, "global_step": 155795, "epoch": 1287} {"train_loss": -39.72195816040039, "global_step": 155796, "epoch": 1287} {"train_loss": -39.3339958190918, "global_step": 155797, "epoch": 1287} {"train_loss": -40.7569580078125, "global_step": 155798, "epoch": 1287} {"train_loss": -40.09783935546875, "global_step": 155799, "epoch": 1287} {"train_loss": -39.26746368408203, "global_step": 155800, "epoch": 1287} {"train_loss": -39.36826705932617, "global_step": 155801, "epoch": 1287} {"train_loss": -39.546852111816406, "global_step": 155802, "epoch": 1287} {"train_loss": -40.199676513671875, "global_step": 155803, "epoch": 1287} {"train_loss": -38.12691116333008, "global_step": 155804, "epoch": 1287} {"train_loss": -38.24332809448242, "global_step": 155805, "epoch": 1287} {"train_loss": -39.73427963256836, "global_step": 155806, "epoch": 1287} {"train_loss": -40.047298431396484, "global_step": 155807, "epoch": 1287} {"train_loss": -37.95808792114258, "global_step": 155808, "epoch": 1287} {"train_loss": -39.770790100097656, "global_step": 155809, "epoch": 1287} {"train_loss": -38.75776290893555, "global_step": 155810, "epoch": 1287} {"train_loss": -40.467952728271484, "global_step": 155811, "epoch": 1287} {"train_loss": -39.65494918823242, "global_step": 155812, "epoch": 1287} {"train_loss": -36.29645538330078, "global_step": 155813, "epoch": 1287} {"train_loss": -40.165985107421875, "global_step": 155814, "epoch": 1287} {"train_loss": -39.185855865478516, "global_step": 155815, "epoch": 1287} {"train_loss": -39.80284118652344, "global_step": 155816, "epoch": 1287} {"train_loss": -39.93941879272461, "global_step": 155817, "epoch": 1287} {"train_loss": -39.775508880615234, "global_step": 155818, "epoch": 1287} {"train_loss": -40.5186653137207, "global_step": 155819, "epoch": 1287} {"train_loss": -40.33077621459961, "global_step": 155820, "epoch": 1287} {"train_loss": -39.67830276489258, "global_step": 155821, "epoch": 1287} {"train_loss": -40.38471603393555, "global_step": 155822, "epoch": 1287} {"train_loss": -40.42133712768555, "global_step": 155823, "epoch": 1287} {"train_loss": -40.51865005493164, "global_step": 155824, "epoch": 1287} {"train_loss": -40.24485397338867, "global_step": 155825, "epoch": 1287} {"train_loss": -40.24528884887695, "global_step": 155826, "epoch": 1287} {"train_loss": -40.01755905151367, "global_step": 155827, "epoch": 1287} {"train_loss": -38.5340576171875, "global_step": 155828, "epoch": 1287} {"train_loss": -39.777748107910156, "global_step": 155829, "epoch": 1287} {"train_loss": -40.609466552734375, "global_step": 155830, "epoch": 1287} {"train_loss": -37.190608978271484, "global_step": 155831, "epoch": 1287} {"train_loss": -39.7562370300293, "global_step": 155832, "epoch": 1287} {"train_loss": -37.74299240112305, "global_step": 155833, "epoch": 1287} {"train_loss": -38.79822540283203, "global_step": 155834, "epoch": 1287} {"train_loss": -40.21944808959961, "global_step": 155835, "epoch": 1287} {"train_loss": -37.84074020385742, "global_step": 155836, "epoch": 1287} {"train_loss": -39.88701248168945, "global_step": 155837, "epoch": 1287} {"train_loss": -39.71940612792969, "global_step": 155838, "epoch": 1287} {"train_loss": -40.0389404296875, "global_step": 155839, "epoch": 1287} {"train_loss": -40.74467849731445, "global_step": 155840, "epoch": 1287} {"train_loss": -39.73857116699219, "global_step": 155841, "epoch": 1287} {"train_loss": -39.52494812011719, "global_step": 155842, "epoch": 1287} {"train_loss": -40.051971435546875, "global_step": 155843, "epoch": 1287} {"train_loss": -40.1474723815918, "global_step": 155844, "epoch": 1287} {"train_loss": -41.01487350463867, "global_step": 155845, "epoch": 1287} {"train_loss": -39.80290603637695, "global_step": 155846, "epoch": 1287} {"train_loss": -39.064318002748095, "global_step": 155847, "epoch": 1287, "val_loss": 2709075.25} {"train_loss": -40.410308837890625, "global_step": 155848, "epoch": 1288} {"train_loss": -40.54172134399414, "global_step": 155849, "epoch": 1288} {"train_loss": -41.0355110168457, "global_step": 155850, "epoch": 1288} {"train_loss": -40.21134567260742, "global_step": 155851, "epoch": 1288} {"train_loss": -40.28766632080078, "global_step": 155852, "epoch": 1288} {"train_loss": -40.522029876708984, "global_step": 155853, "epoch": 1288} {"train_loss": -40.25833511352539, "global_step": 155854, "epoch": 1288} {"train_loss": -40.5831298828125, "global_step": 155855, "epoch": 1288} {"train_loss": -40.81803512573242, "global_step": 155856, "epoch": 1288} {"train_loss": -40.419857025146484, "global_step": 155857, "epoch": 1288} {"train_loss": -40.59516525268555, "global_step": 155858, "epoch": 1288} {"train_loss": -41.07545852661133, "global_step": 155859, "epoch": 1288} {"train_loss": -40.30828094482422, "global_step": 155860, "epoch": 1288} {"train_loss": -40.29197311401367, "global_step": 155861, "epoch": 1288} {"train_loss": -39.560516357421875, "global_step": 155862, "epoch": 1288} {"train_loss": -37.913055419921875, "global_step": 155863, "epoch": 1288} {"train_loss": -37.277645111083984, "global_step": 155864, "epoch": 1288} {"train_loss": -38.385894775390625, "global_step": 155865, "epoch": 1288} {"train_loss": -39.848445892333984, "global_step": 155866, "epoch": 1288} {"train_loss": -40.7342414855957, "global_step": 155867, "epoch": 1288} {"train_loss": -39.5975341796875, "global_step": 155868, "epoch": 1288} {"train_loss": -38.32509994506836, "global_step": 155869, "epoch": 1288} {"train_loss": -32.994686126708984, "global_step": 155870, "epoch": 1288} {"train_loss": -26.983489990234375, "global_step": 155871, "epoch": 1288} {"train_loss": -33.6261100769043, "global_step": 155872, "epoch": 1288} {"train_loss": -39.2048454284668, "global_step": 155873, "epoch": 1288} {"train_loss": -36.08675765991211, "global_step": 155874, "epoch": 1288} {"train_loss": -36.933876037597656, "global_step": 155875, "epoch": 1288} {"train_loss": -38.66486740112305, "global_step": 155876, "epoch": 1288} {"train_loss": -38.19841384887695, "global_step": 155877, "epoch": 1288} {"train_loss": -39.054412841796875, "global_step": 155878, "epoch": 1288} {"train_loss": -38.42158508300781, "global_step": 155879, "epoch": 1288} {"train_loss": -38.93690872192383, "global_step": 155880, "epoch": 1288} {"train_loss": -39.5213508605957, "global_step": 155881, "epoch": 1288} {"train_loss": -38.71391677856445, "global_step": 155882, "epoch": 1288} {"train_loss": -40.65291976928711, "global_step": 155883, "epoch": 1288} {"train_loss": -38.7302360534668, "global_step": 155884, "epoch": 1288} {"train_loss": -40.24782943725586, "global_step": 155885, "epoch": 1288} {"train_loss": -39.355140686035156, "global_step": 155886, "epoch": 1288} {"train_loss": -39.87331008911133, "global_step": 155887, "epoch": 1288} {"train_loss": -40.337764739990234, "global_step": 155888, "epoch": 1288} {"train_loss": -39.96953582763672, "global_step": 155889, "epoch": 1288} {"train_loss": -39.872901916503906, "global_step": 155890, "epoch": 1288} {"train_loss": -40.56105422973633, "global_step": 155891, "epoch": 1288} {"train_loss": -40.08009719848633, "global_step": 155892, "epoch": 1288} {"train_loss": -40.28457260131836, "global_step": 155893, "epoch": 1288} {"train_loss": -40.55803298950195, "global_step": 155894, "epoch": 1288} {"train_loss": -40.57541275024414, "global_step": 155895, "epoch": 1288} {"train_loss": -40.90317916870117, "global_step": 155896, "epoch": 1288} {"train_loss": -40.80414962768555, "global_step": 155897, "epoch": 1288} {"train_loss": -40.30794143676758, "global_step": 155898, "epoch": 1288} {"train_loss": -40.2215461730957, "global_step": 155899, "epoch": 1288} {"train_loss": -40.441139221191406, "global_step": 155900, "epoch": 1288} {"train_loss": -41.2009162902832, "global_step": 155901, "epoch": 1288} {"train_loss": -40.99075698852539, "global_step": 155902, "epoch": 1288} {"train_loss": -40.75009536743164, "global_step": 155903, "epoch": 1288} {"train_loss": -41.02546310424805, "global_step": 155904, "epoch": 1288} {"train_loss": -40.72822189331055, "global_step": 155905, "epoch": 1288} {"train_loss": -41.187843322753906, "global_step": 155906, "epoch": 1288} {"train_loss": -41.16685104370117, "global_step": 155907, "epoch": 1288} {"train_loss": -41.02204132080078, "global_step": 155908, "epoch": 1288} {"train_loss": -41.112403869628906, "global_step": 155909, "epoch": 1288} {"train_loss": -41.182979583740234, "global_step": 155910, "epoch": 1288} {"train_loss": -41.0255241394043, "global_step": 155911, "epoch": 1288} {"train_loss": -41.450313568115234, "global_step": 155912, "epoch": 1288} {"train_loss": -41.330711364746094, "global_step": 155913, "epoch": 1288} {"train_loss": -41.676143646240234, "global_step": 155914, "epoch": 1288} {"train_loss": -41.39943313598633, "global_step": 155915, "epoch": 1288} {"train_loss": -41.37733459472656, "global_step": 155916, "epoch": 1288} {"train_loss": -40.243438720703125, "global_step": 155917, "epoch": 1288} {"train_loss": -41.3052978515625, "global_step": 155918, "epoch": 1288} {"train_loss": -41.470760345458984, "global_step": 155919, "epoch": 1288} {"train_loss": -40.64992141723633, "global_step": 155920, "epoch": 1288} {"train_loss": -40.58596420288086, "global_step": 155921, "epoch": 1288} {"train_loss": -41.7169189453125, "global_step": 155922, "epoch": 1288} {"train_loss": -41.477264404296875, "global_step": 155923, "epoch": 1288} {"train_loss": -41.64297103881836, "global_step": 155924, "epoch": 1288} {"train_loss": -41.7125358581543, "global_step": 155925, "epoch": 1288} {"train_loss": -41.804134368896484, "global_step": 155926, "epoch": 1288} {"train_loss": -41.76338577270508, "global_step": 155927, "epoch": 1288} {"train_loss": -41.9157600402832, "global_step": 155928, "epoch": 1288} {"train_loss": -41.36529541015625, "global_step": 155929, "epoch": 1288} {"train_loss": -41.066261291503906, "global_step": 155930, "epoch": 1288} {"train_loss": -41.05854034423828, "global_step": 155931, "epoch": 1288} {"train_loss": -40.581687927246094, "global_step": 155932, "epoch": 1288} {"train_loss": -39.989742279052734, "global_step": 155933, "epoch": 1288} {"train_loss": -38.7752799987793, "global_step": 155934, "epoch": 1288} {"train_loss": -38.05443572998047, "global_step": 155935, "epoch": 1288} {"train_loss": -39.13959503173828, "global_step": 155936, "epoch": 1288} {"train_loss": -39.6102180480957, "global_step": 155937, "epoch": 1288} {"train_loss": -41.383880615234375, "global_step": 155938, "epoch": 1288} {"train_loss": -41.07881546020508, "global_step": 155939, "epoch": 1288} {"train_loss": -39.87115478515625, "global_step": 155940, "epoch": 1288} {"train_loss": -39.22319412231445, "global_step": 155941, "epoch": 1288} {"train_loss": -39.58846664428711, "global_step": 155942, "epoch": 1288} {"train_loss": -41.13032531738281, "global_step": 155943, "epoch": 1288} {"train_loss": -39.65247344970703, "global_step": 155944, "epoch": 1288} {"train_loss": -39.290618896484375, "global_step": 155945, "epoch": 1288} {"train_loss": -39.82428741455078, "global_step": 155946, "epoch": 1288} {"train_loss": -40.2387809753418, "global_step": 155947, "epoch": 1288} {"train_loss": -39.376495361328125, "global_step": 155948, "epoch": 1288} {"train_loss": -38.80106735229492, "global_step": 155949, "epoch": 1288} {"train_loss": -39.85691452026367, "global_step": 155950, "epoch": 1288} {"train_loss": -40.6812858581543, "global_step": 155951, "epoch": 1288} {"train_loss": -40.322330474853516, "global_step": 155952, "epoch": 1288} {"train_loss": -39.859092712402344, "global_step": 155953, "epoch": 1288} {"train_loss": -40.667640686035156, "global_step": 155954, "epoch": 1288} {"train_loss": -40.370052337646484, "global_step": 155955, "epoch": 1288} {"train_loss": -39.7393913269043, "global_step": 155956, "epoch": 1288} {"train_loss": -40.438262939453125, "global_step": 155957, "epoch": 1288} {"train_loss": -39.536903381347656, "global_step": 155958, "epoch": 1288} {"train_loss": -41.034603118896484, "global_step": 155959, "epoch": 1288} {"train_loss": -40.42463302612305, "global_step": 155960, "epoch": 1288} {"train_loss": -39.59843063354492, "global_step": 155961, "epoch": 1288} {"train_loss": -40.016109466552734, "global_step": 155962, "epoch": 1288} {"train_loss": -28.92745018005371, "global_step": 155963, "epoch": 1288} {"train_loss": -40.474571228027344, "global_step": 155964, "epoch": 1288} {"train_loss": -38.92991256713867, "global_step": 155965, "epoch": 1288} {"train_loss": -38.373836517333984, "global_step": 155966, "epoch": 1288} {"train_loss": -39.19948959350586, "global_step": 155967, "epoch": 1288} {"train_loss": -39.852674925622864, "global_step": 155968, "epoch": 1288, "val_loss": 2682027.25} {"train_loss": -39.83004379272461, "global_step": 155969, "epoch": 1289} {"train_loss": -37.832855224609375, "global_step": 155970, "epoch": 1289} {"train_loss": -36.970176696777344, "global_step": 155971, "epoch": 1289} {"train_loss": -39.41476821899414, "global_step": 155972, "epoch": 1289} {"train_loss": -39.972679138183594, "global_step": 155973, "epoch": 1289} {"train_loss": -37.60944366455078, "global_step": 155974, "epoch": 1289} {"train_loss": -37.158748626708984, "global_step": 155975, "epoch": 1289} {"train_loss": -39.69822692871094, "global_step": 155976, "epoch": 1289} {"train_loss": -38.18256378173828, "global_step": 155977, "epoch": 1289} {"train_loss": -37.43366622924805, "global_step": 155978, "epoch": 1289} {"train_loss": -39.80072784423828, "global_step": 155979, "epoch": 1289} {"train_loss": -37.69907760620117, "global_step": 155980, "epoch": 1289} {"train_loss": -35.88578414916992, "global_step": 155981, "epoch": 1289} {"train_loss": -40.507442474365234, "global_step": 155982, "epoch": 1289} {"train_loss": -37.98374938964844, "global_step": 155983, "epoch": 1289} {"train_loss": -37.99698257446289, "global_step": 155984, "epoch": 1289} {"train_loss": -39.43208312988281, "global_step": 155985, "epoch": 1289} {"train_loss": -38.96786117553711, "global_step": 155986, "epoch": 1289} {"train_loss": -39.93511962890625, "global_step": 155987, "epoch": 1289} {"train_loss": -37.842132568359375, "global_step": 155988, "epoch": 1289} {"train_loss": -40.15493392944336, "global_step": 155989, "epoch": 1289} {"train_loss": -38.851627349853516, "global_step": 155990, "epoch": 1289} {"train_loss": -39.39512252807617, "global_step": 155991, "epoch": 1289} {"train_loss": -40.39724349975586, "global_step": 155992, "epoch": 1289} {"train_loss": -39.70998001098633, "global_step": 155993, "epoch": 1289} {"train_loss": -39.77836990356445, "global_step": 155994, "epoch": 1289} {"train_loss": -39.73681640625, "global_step": 155995, "epoch": 1289} {"train_loss": -39.78821563720703, "global_step": 155996, "epoch": 1289} {"train_loss": -40.3372917175293, "global_step": 155997, "epoch": 1289} {"train_loss": -39.91423797607422, "global_step": 155998, "epoch": 1289} {"train_loss": -40.10478973388672, "global_step": 155999, "epoch": 1289} {"train_loss": -40.01667022705078, "global_step": 156000, "epoch": 1289} {"train_loss": -40.273441314697266, "global_step": 156001, "epoch": 1289} {"train_loss": -40.33701705932617, "global_step": 156002, "epoch": 1289} {"train_loss": -40.16786575317383, "global_step": 156003, "epoch": 1289} {"train_loss": -40.46751022338867, "global_step": 156004, "epoch": 1289} {"train_loss": -39.450984954833984, "global_step": 156005, "epoch": 1289} {"train_loss": -39.48103332519531, "global_step": 156006, "epoch": 1289} {"train_loss": -40.481021881103516, "global_step": 156007, "epoch": 1289} {"train_loss": -40.18780517578125, "global_step": 156008, "epoch": 1289} {"train_loss": -40.53950500488281, "global_step": 156009, "epoch": 1289} {"train_loss": -40.35636520385742, "global_step": 156010, "epoch": 1289} {"train_loss": -40.9671745300293, "global_step": 156011, "epoch": 1289} {"train_loss": -40.133567810058594, "global_step": 156012, "epoch": 1289} {"train_loss": -40.704158782958984, "global_step": 156013, "epoch": 1289} {"train_loss": -38.462608337402344, "global_step": 156014, "epoch": 1289} {"train_loss": -40.774227142333984, "global_step": 156015, "epoch": 1289} {"train_loss": -40.52435302734375, "global_step": 156016, "epoch": 1289} {"train_loss": -40.396602630615234, "global_step": 156017, "epoch": 1289} {"train_loss": -40.715003967285156, "global_step": 156018, "epoch": 1289} {"train_loss": -41.38916015625, "global_step": 156019, "epoch": 1289} {"train_loss": -39.12548828125, "global_step": 156020, "epoch": 1289} {"train_loss": -41.36893844604492, "global_step": 156021, "epoch": 1289} {"train_loss": -40.89463424682617, "global_step": 156022, "epoch": 1289} {"train_loss": -41.237586975097656, "global_step": 156023, "epoch": 1289} {"train_loss": -40.72492218017578, "global_step": 156024, "epoch": 1289} {"train_loss": -39.86195755004883, "global_step": 156025, "epoch": 1289} {"train_loss": -40.20284652709961, "global_step": 156026, "epoch": 1289} {"train_loss": -40.88755798339844, "global_step": 156027, "epoch": 1289} {"train_loss": -40.82847213745117, "global_step": 156028, "epoch": 1289} {"train_loss": -41.21560287475586, "global_step": 156029, "epoch": 1289} {"train_loss": -40.935638427734375, "global_step": 156030, "epoch": 1289} {"train_loss": -41.42372512817383, "global_step": 156031, "epoch": 1289} {"train_loss": -41.285987854003906, "global_step": 156032, "epoch": 1289} {"train_loss": -40.08830642700195, "global_step": 156033, "epoch": 1289} {"train_loss": -40.81791687011719, "global_step": 156034, "epoch": 1289} {"train_loss": -41.3028678894043, "global_step": 156035, "epoch": 1289} {"train_loss": -41.105350494384766, "global_step": 156036, "epoch": 1289} {"train_loss": -40.416221618652344, "global_step": 156037, "epoch": 1289} {"train_loss": -41.030555725097656, "global_step": 156038, "epoch": 1289} {"train_loss": -41.10637283325195, "global_step": 156039, "epoch": 1289} {"train_loss": -40.869171142578125, "global_step": 156040, "epoch": 1289} {"train_loss": -40.29734420776367, "global_step": 156041, "epoch": 1289} {"train_loss": -41.131656646728516, "global_step": 156042, "epoch": 1289} {"train_loss": -41.229793548583984, "global_step": 156043, "epoch": 1289} {"train_loss": -40.2686882019043, "global_step": 156044, "epoch": 1289} {"train_loss": -41.58687210083008, "global_step": 156045, "epoch": 1289} {"train_loss": -40.793758392333984, "global_step": 156046, "epoch": 1289} {"train_loss": -40.233272552490234, "global_step": 156047, "epoch": 1289} {"train_loss": -41.13029479980469, "global_step": 156048, "epoch": 1289} {"train_loss": -40.76835250854492, "global_step": 156049, "epoch": 1289} {"train_loss": -40.92625045776367, "global_step": 156050, "epoch": 1289} {"train_loss": -41.44806671142578, "global_step": 156051, "epoch": 1289} {"train_loss": -40.8228874206543, "global_step": 156052, "epoch": 1289} {"train_loss": -40.11375045776367, "global_step": 156053, "epoch": 1289} {"train_loss": -41.175697326660156, "global_step": 156054, "epoch": 1289} {"train_loss": -41.29899978637695, "global_step": 156055, "epoch": 1289} {"train_loss": -40.655311584472656, "global_step": 156056, "epoch": 1289} {"train_loss": -40.27564239501953, "global_step": 156057, "epoch": 1289} {"train_loss": -40.504066467285156, "global_step": 156058, "epoch": 1289} {"train_loss": -40.864540100097656, "global_step": 156059, "epoch": 1289} {"train_loss": -40.85017776489258, "global_step": 156060, "epoch": 1289} {"train_loss": -40.271080017089844, "global_step": 156061, "epoch": 1289} {"train_loss": -41.042022705078125, "global_step": 156062, "epoch": 1289} {"train_loss": -40.893775939941406, "global_step": 156063, "epoch": 1289} {"train_loss": -41.92680358886719, "global_step": 156064, "epoch": 1289} {"train_loss": -41.681434631347656, "global_step": 156065, "epoch": 1289} {"train_loss": -41.23957443237305, "global_step": 156066, "epoch": 1289} {"train_loss": -41.42667007446289, "global_step": 156067, "epoch": 1289} {"train_loss": -41.50582504272461, "global_step": 156068, "epoch": 1289} {"train_loss": -40.863433837890625, "global_step": 156069, "epoch": 1289} {"train_loss": -41.24410629272461, "global_step": 156070, "epoch": 1289} {"train_loss": -41.543331146240234, "global_step": 156071, "epoch": 1289} {"train_loss": -36.0295524597168, "global_step": 156072, "epoch": 1289} {"train_loss": -40.964111328125, "global_step": 156073, "epoch": 1289} {"train_loss": -41.18154525756836, "global_step": 156074, "epoch": 1289} {"train_loss": -41.60572814941406, "global_step": 156075, "epoch": 1289} {"train_loss": -40.26052474975586, "global_step": 156076, "epoch": 1289} {"train_loss": -40.39976119995117, "global_step": 156077, "epoch": 1289} {"train_loss": -40.781002044677734, "global_step": 156078, "epoch": 1289} {"train_loss": -39.75636291503906, "global_step": 156079, "epoch": 1289} {"train_loss": -40.3618278503418, "global_step": 156080, "epoch": 1289} {"train_loss": -40.708526611328125, "global_step": 156081, "epoch": 1289} {"train_loss": -40.67844772338867, "global_step": 156082, "epoch": 1289} {"train_loss": -39.51809310913086, "global_step": 156083, "epoch": 1289} {"train_loss": -39.612979888916016, "global_step": 156084, "epoch": 1289} {"train_loss": -38.961891174316406, "global_step": 156085, "epoch": 1289} {"train_loss": -39.790103912353516, "global_step": 156086, "epoch": 1289} {"train_loss": -40.53799057006836, "global_step": 156087, "epoch": 1289} {"train_loss": -40.60932922363281, "global_step": 156088, "epoch": 1289} {"train_loss": -40.19915185092894, "global_step": 156089, "epoch": 1289, "val_loss": 2563705.0} {"train_loss": -40.845497131347656, "global_step": 156090, "epoch": 1290} {"train_loss": -37.51961898803711, "global_step": 156091, "epoch": 1290} {"train_loss": -40.66762924194336, "global_step": 156092, "epoch": 1290} {"train_loss": -39.87412643432617, "global_step": 156093, "epoch": 1290} {"train_loss": -38.786895751953125, "global_step": 156094, "epoch": 1290} {"train_loss": -38.747406005859375, "global_step": 156095, "epoch": 1290} {"train_loss": -39.8336181640625, "global_step": 156096, "epoch": 1290} {"train_loss": -41.43431854248047, "global_step": 156097, "epoch": 1290} {"train_loss": -40.89993667602539, "global_step": 156098, "epoch": 1290} {"train_loss": -40.1048583984375, "global_step": 156099, "epoch": 1290} {"train_loss": -40.5622673034668, "global_step": 156100, "epoch": 1290} {"train_loss": -41.572662353515625, "global_step": 156101, "epoch": 1290} {"train_loss": -40.305294036865234, "global_step": 156102, "epoch": 1290} {"train_loss": -41.065059661865234, "global_step": 156103, "epoch": 1290} {"train_loss": -40.679439544677734, "global_step": 156104, "epoch": 1290} {"train_loss": -40.951229095458984, "global_step": 156105, "epoch": 1290} {"train_loss": -41.15268325805664, "global_step": 156106, "epoch": 1290} {"train_loss": -40.859771728515625, "global_step": 156107, "epoch": 1290} {"train_loss": -40.943077087402344, "global_step": 156108, "epoch": 1290} {"train_loss": -41.40946960449219, "global_step": 156109, "epoch": 1290} {"train_loss": -41.601600646972656, "global_step": 156110, "epoch": 1290} {"train_loss": -41.02754592895508, "global_step": 156111, "epoch": 1290} {"train_loss": -41.23466873168945, "global_step": 156112, "epoch": 1290} {"train_loss": -41.0025520324707, "global_step": 156113, "epoch": 1290} {"train_loss": -41.261878967285156, "global_step": 156114, "epoch": 1290} {"train_loss": -36.88745880126953, "global_step": 156115, "epoch": 1290} {"train_loss": -41.334739685058594, "global_step": 156116, "epoch": 1290} {"train_loss": -40.4407844543457, "global_step": 156117, "epoch": 1290} {"train_loss": -41.10542678833008, "global_step": 156118, "epoch": 1290} {"train_loss": -40.9339599609375, "global_step": 156119, "epoch": 1290} {"train_loss": -40.443599700927734, "global_step": 156120, "epoch": 1290} {"train_loss": -39.58042526245117, "global_step": 156121, "epoch": 1290} {"train_loss": -41.35456466674805, "global_step": 156122, "epoch": 1290} {"train_loss": -40.43682861328125, "global_step": 156123, "epoch": 1290} {"train_loss": -38.81810760498047, "global_step": 156124, "epoch": 1290} {"train_loss": -41.34193420410156, "global_step": 156125, "epoch": 1290} {"train_loss": -40.68760299682617, "global_step": 156126, "epoch": 1290} {"train_loss": -37.81044387817383, "global_step": 156127, "epoch": 1290} {"train_loss": -38.52082061767578, "global_step": 156128, "epoch": 1290} {"train_loss": -37.73712158203125, "global_step": 156129, "epoch": 1290} {"train_loss": -40.822654724121094, "global_step": 156130, "epoch": 1290} {"train_loss": -38.867218017578125, "global_step": 156131, "epoch": 1290} {"train_loss": -39.16830062866211, "global_step": 156132, "epoch": 1290} {"train_loss": -39.95919418334961, "global_step": 156133, "epoch": 1290} {"train_loss": -40.31391525268555, "global_step": 156134, "epoch": 1290} {"train_loss": -39.35909652709961, "global_step": 156135, "epoch": 1290} {"train_loss": -38.25764846801758, "global_step": 156136, "epoch": 1290} {"train_loss": -39.829322814941406, "global_step": 156137, "epoch": 1290} {"train_loss": -40.230316162109375, "global_step": 156138, "epoch": 1290} {"train_loss": -40.041534423828125, "global_step": 156139, "epoch": 1290} {"train_loss": -40.41349411010742, "global_step": 156140, "epoch": 1290} {"train_loss": -40.43900680541992, "global_step": 156141, "epoch": 1290} {"train_loss": -40.34993362426758, "global_step": 156142, "epoch": 1290} {"train_loss": -40.91994094848633, "global_step": 156143, "epoch": 1290} {"train_loss": -41.278076171875, "global_step": 156144, "epoch": 1290} {"train_loss": -40.79238510131836, "global_step": 156145, "epoch": 1290} {"train_loss": -41.18494415283203, "global_step": 156146, "epoch": 1290} {"train_loss": -40.92905807495117, "global_step": 156147, "epoch": 1290} {"train_loss": -40.216888427734375, "global_step": 156148, "epoch": 1290} {"train_loss": -40.940277099609375, "global_step": 156149, "epoch": 1290} {"train_loss": -40.91646957397461, "global_step": 156150, "epoch": 1290} {"train_loss": -40.9393424987793, "global_step": 156151, "epoch": 1290} {"train_loss": -41.33995056152344, "global_step": 156152, "epoch": 1290} {"train_loss": -40.354305267333984, "global_step": 156153, "epoch": 1290} {"train_loss": -37.55549621582031, "global_step": 156154, "epoch": 1290} {"train_loss": -40.80241394042969, "global_step": 156155, "epoch": 1290} {"train_loss": -41.029903411865234, "global_step": 156156, "epoch": 1290} {"train_loss": -40.85519027709961, "global_step": 156157, "epoch": 1290} {"train_loss": -39.75882339477539, "global_step": 156158, "epoch": 1290} {"train_loss": -40.97748565673828, "global_step": 156159, "epoch": 1290} {"train_loss": -39.116058349609375, "global_step": 156160, "epoch": 1290} {"train_loss": -40.737300872802734, "global_step": 156161, "epoch": 1290} {"train_loss": -37.78774642944336, "global_step": 156162, "epoch": 1290} {"train_loss": -40.2862663269043, "global_step": 156163, "epoch": 1290} {"train_loss": -39.01986312866211, "global_step": 156164, "epoch": 1290} {"train_loss": -36.19364929199219, "global_step": 156165, "epoch": 1290} {"train_loss": -39.222286224365234, "global_step": 156166, "epoch": 1290} {"train_loss": -38.18534469604492, "global_step": 156167, "epoch": 1290} {"train_loss": -39.33201217651367, "global_step": 156168, "epoch": 1290} {"train_loss": -39.852657318115234, "global_step": 156169, "epoch": 1290} {"train_loss": -39.29621505737305, "global_step": 156170, "epoch": 1290} {"train_loss": -36.65404510498047, "global_step": 156171, "epoch": 1290} {"train_loss": -37.4700927734375, "global_step": 156172, "epoch": 1290} {"train_loss": -35.70660400390625, "global_step": 156173, "epoch": 1290} {"train_loss": -38.49207305908203, "global_step": 156174, "epoch": 1290} {"train_loss": -38.514835357666016, "global_step": 156175, "epoch": 1290} {"train_loss": -39.12422561645508, "global_step": 156176, "epoch": 1290} {"train_loss": -37.76212692260742, "global_step": 156177, "epoch": 1290} {"train_loss": -39.06477737426758, "global_step": 156178, "epoch": 1290} {"train_loss": -38.18470764160156, "global_step": 156179, "epoch": 1290} {"train_loss": -38.70264434814453, "global_step": 156180, "epoch": 1290} {"train_loss": -39.93833541870117, "global_step": 156181, "epoch": 1290} {"train_loss": -38.02235794067383, "global_step": 156182, "epoch": 1290} {"train_loss": -37.52901840209961, "global_step": 156183, "epoch": 1290} {"train_loss": -38.628639221191406, "global_step": 156184, "epoch": 1290} {"train_loss": -37.68584442138672, "global_step": 156185, "epoch": 1290} {"train_loss": -39.069488525390625, "global_step": 156186, "epoch": 1290} {"train_loss": -39.00358963012695, "global_step": 156187, "epoch": 1290} {"train_loss": -39.375179290771484, "global_step": 156188, "epoch": 1290} {"train_loss": -38.15104675292969, "global_step": 156189, "epoch": 1290} {"train_loss": -38.61017608642578, "global_step": 156190, "epoch": 1290} {"train_loss": -39.13502883911133, "global_step": 156191, "epoch": 1290} {"train_loss": -38.81539535522461, "global_step": 156192, "epoch": 1290} {"train_loss": -39.17214584350586, "global_step": 156193, "epoch": 1290} {"train_loss": -37.78786849975586, "global_step": 156194, "epoch": 1290} {"train_loss": -39.34397506713867, "global_step": 156195, "epoch": 1290} {"train_loss": -40.281063079833984, "global_step": 156196, "epoch": 1290} {"train_loss": -38.981441497802734, "global_step": 156197, "epoch": 1290} {"train_loss": -38.769187927246094, "global_step": 156198, "epoch": 1290} {"train_loss": -40.45038604736328, "global_step": 156199, "epoch": 1290} {"train_loss": -39.17788314819336, "global_step": 156200, "epoch": 1290} {"train_loss": -40.115779876708984, "global_step": 156201, "epoch": 1290} {"train_loss": -39.13384246826172, "global_step": 156202, "epoch": 1290} {"train_loss": -40.2884635925293, "global_step": 156203, "epoch": 1290} {"train_loss": -39.34330368041992, "global_step": 156204, "epoch": 1290} {"train_loss": -39.817195892333984, "global_step": 156205, "epoch": 1290} {"train_loss": -40.521461486816406, "global_step": 156206, "epoch": 1290} {"train_loss": -39.24870300292969, "global_step": 156207, "epoch": 1290} {"train_loss": -39.56726837158203, "global_step": 156208, "epoch": 1290} {"train_loss": -40.52836990356445, "global_step": 156209, "epoch": 1290} {"train_loss": -39.715695814652875, "global_step": 156210, "epoch": 1290, "val_loss": 2665148.25} {"train_loss": -40.55070114135742, "global_step": 156211, "epoch": 1291} {"train_loss": -39.583126068115234, "global_step": 156212, "epoch": 1291} {"train_loss": -39.267494201660156, "global_step": 156213, "epoch": 1291} {"train_loss": -39.92744064331055, "global_step": 156214, "epoch": 1291} {"train_loss": -39.43996810913086, "global_step": 156215, "epoch": 1291} {"train_loss": -40.715057373046875, "global_step": 156216, "epoch": 1291} {"train_loss": -39.72003936767578, "global_step": 156217, "epoch": 1291} {"train_loss": -40.2871208190918, "global_step": 156218, "epoch": 1291} {"train_loss": -40.200416564941406, "global_step": 156219, "epoch": 1291} {"train_loss": -40.6248779296875, "global_step": 156220, "epoch": 1291} {"train_loss": -41.19929122924805, "global_step": 156221, "epoch": 1291} {"train_loss": -39.731197357177734, "global_step": 156222, "epoch": 1291} {"train_loss": -40.19208526611328, "global_step": 156223, "epoch": 1291} {"train_loss": -39.49747848510742, "global_step": 156224, "epoch": 1291} {"train_loss": -40.82522201538086, "global_step": 156225, "epoch": 1291} {"train_loss": -41.05146408081055, "global_step": 156226, "epoch": 1291} {"train_loss": -41.02761459350586, "global_step": 156227, "epoch": 1291} {"train_loss": -40.06864547729492, "global_step": 156228, "epoch": 1291} {"train_loss": -40.98981475830078, "global_step": 156229, "epoch": 1291} {"train_loss": -40.194000244140625, "global_step": 156230, "epoch": 1291} {"train_loss": -40.99818801879883, "global_step": 156231, "epoch": 1291} {"train_loss": -40.193031311035156, "global_step": 156232, "epoch": 1291} {"train_loss": -39.8853645324707, "global_step": 156233, "epoch": 1291} {"train_loss": -39.009212493896484, "global_step": 156234, "epoch": 1291} {"train_loss": -40.66619873046875, "global_step": 156235, "epoch": 1291} {"train_loss": -41.25657653808594, "global_step": 156236, "epoch": 1291} {"train_loss": -41.50705337524414, "global_step": 156237, "epoch": 1291} {"train_loss": -40.92808532714844, "global_step": 156238, "epoch": 1291} {"train_loss": -40.6844596862793, "global_step": 156239, "epoch": 1291} {"train_loss": -40.98701477050781, "global_step": 156240, "epoch": 1291} {"train_loss": -40.41014862060547, "global_step": 156241, "epoch": 1291} {"train_loss": -41.014434814453125, "global_step": 156242, "epoch": 1291} {"train_loss": -40.190345764160156, "global_step": 156243, "epoch": 1291} {"train_loss": -41.432525634765625, "global_step": 156244, "epoch": 1291} {"train_loss": -40.791255950927734, "global_step": 156245, "epoch": 1291} {"train_loss": -41.473934173583984, "global_step": 156246, "epoch": 1291} {"train_loss": -41.14766311645508, "global_step": 156247, "epoch": 1291} {"train_loss": -40.9970588684082, "global_step": 156248, "epoch": 1291} {"train_loss": -41.73261642456055, "global_step": 156249, "epoch": 1291} {"train_loss": -41.02054977416992, "global_step": 156250, "epoch": 1291} {"train_loss": -40.827423095703125, "global_step": 156251, "epoch": 1291} {"train_loss": -40.92612838745117, "global_step": 156252, "epoch": 1291} {"train_loss": -41.22835159301758, "global_step": 156253, "epoch": 1291} {"train_loss": -40.67911911010742, "global_step": 156254, "epoch": 1291} {"train_loss": -41.19744873046875, "global_step": 156255, "epoch": 1291} {"train_loss": -41.1467170715332, "global_step": 156256, "epoch": 1291} {"train_loss": -40.905147552490234, "global_step": 156257, "epoch": 1291} {"train_loss": -40.50490951538086, "global_step": 156258, "epoch": 1291} {"train_loss": -41.07855987548828, "global_step": 156259, "epoch": 1291} {"train_loss": -41.47829055786133, "global_step": 156260, "epoch": 1291} {"train_loss": -40.34788131713867, "global_step": 156261, "epoch": 1291} {"train_loss": -40.44223403930664, "global_step": 156262, "epoch": 1291} {"train_loss": -40.99038314819336, "global_step": 156263, "epoch": 1291} {"train_loss": -41.18939208984375, "global_step": 156264, "epoch": 1291} {"train_loss": -41.037841796875, "global_step": 156265, "epoch": 1291} {"train_loss": -40.331172943115234, "global_step": 156266, "epoch": 1291} {"train_loss": -40.939327239990234, "global_step": 156267, "epoch": 1291} {"train_loss": -41.16506576538086, "global_step": 156268, "epoch": 1291} {"train_loss": -41.10819625854492, "global_step": 156269, "epoch": 1291} {"train_loss": -41.56226348876953, "global_step": 156270, "epoch": 1291} {"train_loss": -39.813262939453125, "global_step": 156271, "epoch": 1291} {"train_loss": -39.2774772644043, "global_step": 156272, "epoch": 1291} {"train_loss": -38.588348388671875, "global_step": 156273, "epoch": 1291} {"train_loss": -37.353370666503906, "global_step": 156274, "epoch": 1291} {"train_loss": -36.71564865112305, "global_step": 156275, "epoch": 1291} {"train_loss": -37.43172073364258, "global_step": 156276, "epoch": 1291} {"train_loss": -40.25798416137695, "global_step": 156277, "epoch": 1291} {"train_loss": -41.2332878112793, "global_step": 156278, "epoch": 1291} {"train_loss": -38.05178451538086, "global_step": 156279, "epoch": 1291} {"train_loss": -38.70518112182617, "global_step": 156280, "epoch": 1291} {"train_loss": -39.8009147644043, "global_step": 156281, "epoch": 1291} {"train_loss": -40.999568939208984, "global_step": 156282, "epoch": 1291} {"train_loss": -40.067012786865234, "global_step": 156283, "epoch": 1291} {"train_loss": -39.0262565612793, "global_step": 156284, "epoch": 1291} {"train_loss": -38.86776351928711, "global_step": 156285, "epoch": 1291} {"train_loss": -38.680904388427734, "global_step": 156286, "epoch": 1291} {"train_loss": -39.72134017944336, "global_step": 156287, "epoch": 1291} {"train_loss": -41.002559661865234, "global_step": 156288, "epoch": 1291} {"train_loss": -40.83390426635742, "global_step": 156289, "epoch": 1291} {"train_loss": -37.38918685913086, "global_step": 156290, "epoch": 1291} {"train_loss": -40.00919723510742, "global_step": 156291, "epoch": 1291} {"train_loss": -40.26951599121094, "global_step": 156292, "epoch": 1291} {"train_loss": -39.342041015625, "global_step": 156293, "epoch": 1291} {"train_loss": -41.21026611328125, "global_step": 156294, "epoch": 1291} {"train_loss": -39.72563552856445, "global_step": 156295, "epoch": 1291} {"train_loss": -39.73751449584961, "global_step": 156296, "epoch": 1291} {"train_loss": -40.926700592041016, "global_step": 156297, "epoch": 1291} {"train_loss": -40.45233917236328, "global_step": 156298, "epoch": 1291} {"train_loss": -39.62624740600586, "global_step": 156299, "epoch": 1291} {"train_loss": -40.17641067504883, "global_step": 156300, "epoch": 1291} {"train_loss": -38.85480499267578, "global_step": 156301, "epoch": 1291} {"train_loss": -40.01198959350586, "global_step": 156302, "epoch": 1291} {"train_loss": -40.408382415771484, "global_step": 156303, "epoch": 1291} {"train_loss": -39.421356201171875, "global_step": 156304, "epoch": 1291} {"train_loss": -39.8729133605957, "global_step": 156305, "epoch": 1291} {"train_loss": -38.396549224853516, "global_step": 156306, "epoch": 1291} {"train_loss": -39.65054702758789, "global_step": 156307, "epoch": 1291} {"train_loss": -38.586151123046875, "global_step": 156308, "epoch": 1291} {"train_loss": -39.26495361328125, "global_step": 156309, "epoch": 1291} {"train_loss": -39.46235275268555, "global_step": 156310, "epoch": 1291} {"train_loss": -40.41919708251953, "global_step": 156311, "epoch": 1291} {"train_loss": -39.614322662353516, "global_step": 156312, "epoch": 1291} {"train_loss": -38.333465576171875, "global_step": 156313, "epoch": 1291} {"train_loss": -39.046566009521484, "global_step": 156314, "epoch": 1291} {"train_loss": -38.8316650390625, "global_step": 156315, "epoch": 1291} {"train_loss": -40.032283782958984, "global_step": 156316, "epoch": 1291} {"train_loss": -38.06966018676758, "global_step": 156317, "epoch": 1291} {"train_loss": -40.12302780151367, "global_step": 156318, "epoch": 1291} {"train_loss": -40.30406188964844, "global_step": 156319, "epoch": 1291} {"train_loss": -39.82639694213867, "global_step": 156320, "epoch": 1291} {"train_loss": -40.639461517333984, "global_step": 156321, "epoch": 1291} {"train_loss": -40.18729782104492, "global_step": 156322, "epoch": 1291} {"train_loss": -40.1263427734375, "global_step": 156323, "epoch": 1291} {"train_loss": -40.73749923706055, "global_step": 156324, "epoch": 1291} {"train_loss": -39.62678146362305, "global_step": 156325, "epoch": 1291} {"train_loss": -39.796226501464844, "global_step": 156326, "epoch": 1291} {"train_loss": -39.60205078125, "global_step": 156327, "epoch": 1291} {"train_loss": -40.03093338012695, "global_step": 156328, "epoch": 1291} {"train_loss": -40.64152145385742, "global_step": 156329, "epoch": 1291} {"train_loss": -41.015602111816406, "global_step": 156330, "epoch": 1291} {"train_loss": -40.133937362797006, "global_step": 156331, "epoch": 1291, "val_loss": 2798814.0} {"train_loss": -40.972572326660156, "global_step": 156332, "epoch": 1292} {"train_loss": -41.2562141418457, "global_step": 156333, "epoch": 1292} {"train_loss": -41.16944122314453, "global_step": 156334, "epoch": 1292} {"train_loss": -40.19254684448242, "global_step": 156335, "epoch": 1292} {"train_loss": -40.4793586730957, "global_step": 156336, "epoch": 1292} {"train_loss": -38.640377044677734, "global_step": 156337, "epoch": 1292} {"train_loss": -40.279293060302734, "global_step": 156338, "epoch": 1292} {"train_loss": -41.89730453491211, "global_step": 156339, "epoch": 1292} {"train_loss": -40.01752853393555, "global_step": 156340, "epoch": 1292} {"train_loss": -41.3308219909668, "global_step": 156341, "epoch": 1292} {"train_loss": -40.680301666259766, "global_step": 156342, "epoch": 1292} {"train_loss": -41.2354621887207, "global_step": 156343, "epoch": 1292} {"train_loss": -41.51709747314453, "global_step": 156344, "epoch": 1292} {"train_loss": -41.31589889526367, "global_step": 156345, "epoch": 1292} {"train_loss": -40.70884704589844, "global_step": 156346, "epoch": 1292} {"train_loss": -39.89130401611328, "global_step": 156347, "epoch": 1292} {"train_loss": -39.80097198486328, "global_step": 156348, "epoch": 1292} {"train_loss": -41.126007080078125, "global_step": 156349, "epoch": 1292} {"train_loss": -40.73762893676758, "global_step": 156350, "epoch": 1292} {"train_loss": -40.94517135620117, "global_step": 156351, "epoch": 1292} {"train_loss": -40.85271072387695, "global_step": 156352, "epoch": 1292} {"train_loss": -41.5523796081543, "global_step": 156353, "epoch": 1292} {"train_loss": -41.296669006347656, "global_step": 156354, "epoch": 1292} {"train_loss": -41.56820297241211, "global_step": 156355, "epoch": 1292} {"train_loss": -41.69444274902344, "global_step": 156356, "epoch": 1292} {"train_loss": -40.621009826660156, "global_step": 156357, "epoch": 1292} {"train_loss": -39.69843292236328, "global_step": 156358, "epoch": 1292} {"train_loss": -41.43850326538086, "global_step": 156359, "epoch": 1292} {"train_loss": -40.382625579833984, "global_step": 156360, "epoch": 1292} {"train_loss": -38.62454605102539, "global_step": 156361, "epoch": 1292} {"train_loss": -39.323455810546875, "global_step": 156362, "epoch": 1292} {"train_loss": -41.049861907958984, "global_step": 156363, "epoch": 1292} {"train_loss": -40.783058166503906, "global_step": 156364, "epoch": 1292} {"train_loss": -39.99020004272461, "global_step": 156365, "epoch": 1292} {"train_loss": -40.876121520996094, "global_step": 156366, "epoch": 1292} {"train_loss": -40.8154411315918, "global_step": 156367, "epoch": 1292} {"train_loss": -41.23603439331055, "global_step": 156368, "epoch": 1292} {"train_loss": -40.04482650756836, "global_step": 156369, "epoch": 1292} {"train_loss": -40.48041915893555, "global_step": 156370, "epoch": 1292} {"train_loss": -39.94041061401367, "global_step": 156371, "epoch": 1292} {"train_loss": -41.591064453125, "global_step": 156372, "epoch": 1292} {"train_loss": -40.963043212890625, "global_step": 156373, "epoch": 1292} {"train_loss": -40.46035385131836, "global_step": 156374, "epoch": 1292} {"train_loss": -41.347633361816406, "global_step": 156375, "epoch": 1292} {"train_loss": -40.84904098510742, "global_step": 156376, "epoch": 1292} {"train_loss": -41.64870834350586, "global_step": 156377, "epoch": 1292} {"train_loss": -40.49713134765625, "global_step": 156378, "epoch": 1292} {"train_loss": -39.33338165283203, "global_step": 156379, "epoch": 1292} {"train_loss": -40.46223068237305, "global_step": 156380, "epoch": 1292} {"train_loss": -40.46039962768555, "global_step": 156381, "epoch": 1292} {"train_loss": -37.39182662963867, "global_step": 156382, "epoch": 1292} {"train_loss": -40.516395568847656, "global_step": 156383, "epoch": 1292} {"train_loss": -40.807395935058594, "global_step": 156384, "epoch": 1292} {"train_loss": -39.1607780456543, "global_step": 156385, "epoch": 1292} {"train_loss": -39.67106246948242, "global_step": 156386, "epoch": 1292} {"train_loss": -39.33655548095703, "global_step": 156387, "epoch": 1292} {"train_loss": -40.29386520385742, "global_step": 156388, "epoch": 1292} {"train_loss": -40.79209899902344, "global_step": 156389, "epoch": 1292} {"train_loss": -40.55173873901367, "global_step": 156390, "epoch": 1292} {"train_loss": -40.22275924682617, "global_step": 156391, "epoch": 1292} {"train_loss": -39.98969650268555, "global_step": 156392, "epoch": 1292} {"train_loss": -40.884151458740234, "global_step": 156393, "epoch": 1292} {"train_loss": -40.883602142333984, "global_step": 156394, "epoch": 1292} {"train_loss": -41.71006393432617, "global_step": 156395, "epoch": 1292} {"train_loss": -41.0707893371582, "global_step": 156396, "epoch": 1292} {"train_loss": -40.94410705566406, "global_step": 156397, "epoch": 1292} {"train_loss": -40.971527099609375, "global_step": 156398, "epoch": 1292} {"train_loss": -39.93544006347656, "global_step": 156399, "epoch": 1292} {"train_loss": -39.45241928100586, "global_step": 156400, "epoch": 1292} {"train_loss": -41.465091705322266, "global_step": 156401, "epoch": 1292} {"train_loss": -40.365291595458984, "global_step": 156402, "epoch": 1292} {"train_loss": -41.42770004272461, "global_step": 156403, "epoch": 1292} {"train_loss": -40.56272506713867, "global_step": 156404, "epoch": 1292} {"train_loss": -39.895877838134766, "global_step": 156405, "epoch": 1292} {"train_loss": -41.44606399536133, "global_step": 156406, "epoch": 1292} {"train_loss": -40.72858428955078, "global_step": 156407, "epoch": 1292} {"train_loss": -39.88213348388672, "global_step": 156408, "epoch": 1292} {"train_loss": -39.81351852416992, "global_step": 156409, "epoch": 1292} {"train_loss": -40.58415222167969, "global_step": 156410, "epoch": 1292} {"train_loss": -40.01375961303711, "global_step": 156411, "epoch": 1292} {"train_loss": -39.97951889038086, "global_step": 156412, "epoch": 1292} {"train_loss": -39.41610336303711, "global_step": 156413, "epoch": 1292} {"train_loss": -39.48036575317383, "global_step": 156414, "epoch": 1292} {"train_loss": -40.35920715332031, "global_step": 156415, "epoch": 1292} {"train_loss": -37.35746765136719, "global_step": 156416, "epoch": 1292} {"train_loss": -39.09649658203125, "global_step": 156417, "epoch": 1292} {"train_loss": -39.155609130859375, "global_step": 156418, "epoch": 1292} {"train_loss": -39.474884033203125, "global_step": 156419, "epoch": 1292} {"train_loss": -34.48493194580078, "global_step": 156420, "epoch": 1292} {"train_loss": -39.36689376831055, "global_step": 156421, "epoch": 1292} {"train_loss": -37.31975173950195, "global_step": 156422, "epoch": 1292} {"train_loss": -37.7779541015625, "global_step": 156423, "epoch": 1292} {"train_loss": -38.52408218383789, "global_step": 156424, "epoch": 1292} {"train_loss": -32.57352828979492, "global_step": 156425, "epoch": 1292} {"train_loss": -31.248071670532227, "global_step": 156426, "epoch": 1292} {"train_loss": -40.0433464050293, "global_step": 156427, "epoch": 1292} {"train_loss": -34.044734954833984, "global_step": 156428, "epoch": 1292} {"train_loss": -38.899375915527344, "global_step": 156429, "epoch": 1292} {"train_loss": -35.8870964050293, "global_step": 156430, "epoch": 1292} {"train_loss": -35.931976318359375, "global_step": 156431, "epoch": 1292} {"train_loss": -29.17578125, "global_step": 156432, "epoch": 1292} {"train_loss": -30.4239501953125, "global_step": 156433, "epoch": 1292} {"train_loss": -36.959529876708984, "global_step": 156434, "epoch": 1292} {"train_loss": -35.688880920410156, "global_step": 156435, "epoch": 1292} {"train_loss": -37.007259368896484, "global_step": 156436, "epoch": 1292} {"train_loss": -37.8596076965332, "global_step": 156437, "epoch": 1292} {"train_loss": -37.657798767089844, "global_step": 156438, "epoch": 1292} {"train_loss": -33.86790084838867, "global_step": 156439, "epoch": 1292} {"train_loss": -31.768224716186523, "global_step": 156440, "epoch": 1292} {"train_loss": -35.48537826538086, "global_step": 156441, "epoch": 1292} {"train_loss": -38.42087936401367, "global_step": 156442, "epoch": 1292} {"train_loss": -36.67135238647461, "global_step": 156443, "epoch": 1292} {"train_loss": -38.132389068603516, "global_step": 156444, "epoch": 1292} {"train_loss": -36.52093505859375, "global_step": 156445, "epoch": 1292} {"train_loss": -35.18547821044922, "global_step": 156446, "epoch": 1292} {"train_loss": -38.66134262084961, "global_step": 156447, "epoch": 1292} {"train_loss": -37.60706329345703, "global_step": 156448, "epoch": 1292} {"train_loss": -38.559139251708984, "global_step": 156449, "epoch": 1292} {"train_loss": -39.3889274597168, "global_step": 156450, "epoch": 1292} {"train_loss": -38.00054931640625, "global_step": 156451, "epoch": 1292} {"train_loss": -39.30231721736183, "global_step": 156452, "epoch": 1292, "val_loss": 2620518.25} {"train_loss": -38.378597259521484, "global_step": 156453, "epoch": 1293} {"train_loss": -36.931480407714844, "global_step": 156454, "epoch": 1293} {"train_loss": -37.655982971191406, "global_step": 156455, "epoch": 1293} {"train_loss": -38.78410720825195, "global_step": 156456, "epoch": 1293} {"train_loss": -38.620296478271484, "global_step": 156457, "epoch": 1293} {"train_loss": -36.04800796508789, "global_step": 156458, "epoch": 1293} {"train_loss": -39.526466369628906, "global_step": 156459, "epoch": 1293} {"train_loss": -37.65129089355469, "global_step": 156460, "epoch": 1293} {"train_loss": -37.74388885498047, "global_step": 156461, "epoch": 1293} {"train_loss": -39.25810623168945, "global_step": 156462, "epoch": 1293} {"train_loss": -38.9747314453125, "global_step": 156463, "epoch": 1293} {"train_loss": -38.16560363769531, "global_step": 156464, "epoch": 1293} {"train_loss": -39.40470886230469, "global_step": 156465, "epoch": 1293} {"train_loss": -39.809295654296875, "global_step": 156466, "epoch": 1293} {"train_loss": -39.21564483642578, "global_step": 156467, "epoch": 1293} {"train_loss": -38.691192626953125, "global_step": 156468, "epoch": 1293} {"train_loss": -38.631282806396484, "global_step": 156469, "epoch": 1293} {"train_loss": -39.45554733276367, "global_step": 156470, "epoch": 1293} {"train_loss": -39.51321029663086, "global_step": 156471, "epoch": 1293} {"train_loss": -39.16958236694336, "global_step": 156472, "epoch": 1293} {"train_loss": -39.17190933227539, "global_step": 156473, "epoch": 1293} {"train_loss": -39.63418197631836, "global_step": 156474, "epoch": 1293} {"train_loss": -36.7220573425293, "global_step": 156475, "epoch": 1293} {"train_loss": -39.90102767944336, "global_step": 156476, "epoch": 1293} {"train_loss": -38.681278228759766, "global_step": 156477, "epoch": 1293} {"train_loss": -39.7747802734375, "global_step": 156478, "epoch": 1293} {"train_loss": -39.89077377319336, "global_step": 156479, "epoch": 1293} {"train_loss": -39.89906692504883, "global_step": 156480, "epoch": 1293} {"train_loss": -39.86798858642578, "global_step": 156481, "epoch": 1293} {"train_loss": -39.51700973510742, "global_step": 156482, "epoch": 1293} {"train_loss": -39.01714324951172, "global_step": 156483, "epoch": 1293} {"train_loss": -39.45113754272461, "global_step": 156484, "epoch": 1293} {"train_loss": -40.216278076171875, "global_step": 156485, "epoch": 1293} {"train_loss": -40.09370803833008, "global_step": 156486, "epoch": 1293} {"train_loss": -36.604610443115234, "global_step": 156487, "epoch": 1293} {"train_loss": -39.89530563354492, "global_step": 156488, "epoch": 1293} {"train_loss": -40.23732376098633, "global_step": 156489, "epoch": 1293} {"train_loss": -40.19739532470703, "global_step": 156490, "epoch": 1293} {"train_loss": -39.76390075683594, "global_step": 156491, "epoch": 1293} {"train_loss": -36.21923828125, "global_step": 156492, "epoch": 1293} {"train_loss": -40.42298889160156, "global_step": 156493, "epoch": 1293} {"train_loss": -39.93144607543945, "global_step": 156494, "epoch": 1293} {"train_loss": -39.649593353271484, "global_step": 156495, "epoch": 1293} {"train_loss": -39.51397705078125, "global_step": 156496, "epoch": 1293} {"train_loss": -38.90000534057617, "global_step": 156497, "epoch": 1293} {"train_loss": -40.523719787597656, "global_step": 156498, "epoch": 1293} {"train_loss": -39.93740463256836, "global_step": 156499, "epoch": 1293} {"train_loss": -40.41011047363281, "global_step": 156500, "epoch": 1293} {"train_loss": -40.11964797973633, "global_step": 156501, "epoch": 1293} {"train_loss": -38.63082504272461, "global_step": 156502, "epoch": 1293} {"train_loss": -39.824703216552734, "global_step": 156503, "epoch": 1293} {"train_loss": -40.52065658569336, "global_step": 156504, "epoch": 1293} {"train_loss": -40.634857177734375, "global_step": 156505, "epoch": 1293} {"train_loss": -39.47807693481445, "global_step": 156506, "epoch": 1293} {"train_loss": -40.83728790283203, "global_step": 156507, "epoch": 1293} {"train_loss": -40.792633056640625, "global_step": 156508, "epoch": 1293} {"train_loss": -40.43927001953125, "global_step": 156509, "epoch": 1293} {"train_loss": -39.343482971191406, "global_step": 156510, "epoch": 1293} {"train_loss": -40.82912826538086, "global_step": 156511, "epoch": 1293} {"train_loss": -40.73305892944336, "global_step": 156512, "epoch": 1293} {"train_loss": -41.22127914428711, "global_step": 156513, "epoch": 1293} {"train_loss": -40.53984451293945, "global_step": 156514, "epoch": 1293} {"train_loss": -39.628517150878906, "global_step": 156515, "epoch": 1293} {"train_loss": -39.94478988647461, "global_step": 156516, "epoch": 1293} {"train_loss": -40.14979934692383, "global_step": 156517, "epoch": 1293} {"train_loss": -39.99581527709961, "global_step": 156518, "epoch": 1293} {"train_loss": -40.94116973876953, "global_step": 156519, "epoch": 1293} {"train_loss": -41.12541961669922, "global_step": 156520, "epoch": 1293} {"train_loss": -40.984954833984375, "global_step": 156521, "epoch": 1293} {"train_loss": -40.54391098022461, "global_step": 156522, "epoch": 1293} {"train_loss": -40.57417678833008, "global_step": 156523, "epoch": 1293} {"train_loss": -40.75112533569336, "global_step": 156524, "epoch": 1293} {"train_loss": -40.628849029541016, "global_step": 156525, "epoch": 1293} {"train_loss": -41.33856964111328, "global_step": 156526, "epoch": 1293} {"train_loss": -40.90816879272461, "global_step": 156527, "epoch": 1293} {"train_loss": -40.445533752441406, "global_step": 156528, "epoch": 1293} {"train_loss": -41.33616256713867, "global_step": 156529, "epoch": 1293} {"train_loss": -41.112274169921875, "global_step": 156530, "epoch": 1293} {"train_loss": -40.612300872802734, "global_step": 156531, "epoch": 1293} {"train_loss": -40.24440383911133, "global_step": 156532, "epoch": 1293} {"train_loss": -40.55849075317383, "global_step": 156533, "epoch": 1293} {"train_loss": -40.748870849609375, "global_step": 156534, "epoch": 1293} {"train_loss": -39.66855239868164, "global_step": 156535, "epoch": 1293} {"train_loss": -41.060691833496094, "global_step": 156536, "epoch": 1293} {"train_loss": -41.56543731689453, "global_step": 156537, "epoch": 1293} {"train_loss": -41.238136291503906, "global_step": 156538, "epoch": 1293} {"train_loss": -40.30226516723633, "global_step": 156539, "epoch": 1293} {"train_loss": -40.89715576171875, "global_step": 156540, "epoch": 1293} {"train_loss": -39.60226058959961, "global_step": 156541, "epoch": 1293} {"train_loss": -40.375083923339844, "global_step": 156542, "epoch": 1293} {"train_loss": -40.19928741455078, "global_step": 156543, "epoch": 1293} {"train_loss": -39.82001876831055, "global_step": 156544, "epoch": 1293} {"train_loss": -40.479949951171875, "global_step": 156545, "epoch": 1293} {"train_loss": -40.14580535888672, "global_step": 156546, "epoch": 1293} {"train_loss": -40.58302688598633, "global_step": 156547, "epoch": 1293} {"train_loss": -39.44008255004883, "global_step": 156548, "epoch": 1293} {"train_loss": -36.78738784790039, "global_step": 156549, "epoch": 1293} {"train_loss": -39.467525482177734, "global_step": 156550, "epoch": 1293} {"train_loss": -40.80845260620117, "global_step": 156551, "epoch": 1293} {"train_loss": -38.80208969116211, "global_step": 156552, "epoch": 1293} {"train_loss": -38.19611358642578, "global_step": 156553, "epoch": 1293} {"train_loss": -37.91781997680664, "global_step": 156554, "epoch": 1293} {"train_loss": -39.367706298828125, "global_step": 156555, "epoch": 1293} {"train_loss": -40.7735595703125, "global_step": 156556, "epoch": 1293} {"train_loss": -38.90755081176758, "global_step": 156557, "epoch": 1293} {"train_loss": -38.77680206298828, "global_step": 156558, "epoch": 1293} {"train_loss": -38.16274642944336, "global_step": 156559, "epoch": 1293} {"train_loss": -39.3562126159668, "global_step": 156560, "epoch": 1293} {"train_loss": -37.21132278442383, "global_step": 156561, "epoch": 1293} {"train_loss": -39.30388259887695, "global_step": 156562, "epoch": 1293} {"train_loss": -40.36886215209961, "global_step": 156563, "epoch": 1293} {"train_loss": -40.11091613769531, "global_step": 156564, "epoch": 1293} {"train_loss": -39.29148483276367, "global_step": 156565, "epoch": 1293} {"train_loss": -39.17200469970703, "global_step": 156566, "epoch": 1293} {"train_loss": -40.113189697265625, "global_step": 156567, "epoch": 1293} {"train_loss": -39.41371536254883, "global_step": 156568, "epoch": 1293} {"train_loss": -37.6209831237793, "global_step": 156569, "epoch": 1293} {"train_loss": -38.07963562011719, "global_step": 156570, "epoch": 1293} {"train_loss": -40.686973571777344, "global_step": 156571, "epoch": 1293} {"train_loss": -37.63801574707031, "global_step": 156572, "epoch": 1293} {"train_loss": -39.61414475874467, "global_step": 156573, "epoch": 1293, "val_loss": 2662453.25} {"train_loss": -39.39986801147461, "global_step": 156574, "epoch": 1294} {"train_loss": -39.65717315673828, "global_step": 156575, "epoch": 1294} {"train_loss": -40.697322845458984, "global_step": 156576, "epoch": 1294} {"train_loss": -40.107887268066406, "global_step": 156577, "epoch": 1294} {"train_loss": -39.75999069213867, "global_step": 156578, "epoch": 1294} {"train_loss": -39.70154571533203, "global_step": 156579, "epoch": 1294} {"train_loss": -39.447872161865234, "global_step": 156580, "epoch": 1294} {"train_loss": -40.378814697265625, "global_step": 156581, "epoch": 1294} {"train_loss": -40.40308380126953, "global_step": 156582, "epoch": 1294} {"train_loss": -40.50898361206055, "global_step": 156583, "epoch": 1294} {"train_loss": -40.461944580078125, "global_step": 156584, "epoch": 1294} {"train_loss": -40.36348342895508, "global_step": 156585, "epoch": 1294} {"train_loss": -41.253421783447266, "global_step": 156586, "epoch": 1294} {"train_loss": -40.62868881225586, "global_step": 156587, "epoch": 1294} {"train_loss": -40.62473678588867, "global_step": 156588, "epoch": 1294} {"train_loss": -41.032325744628906, "global_step": 156589, "epoch": 1294} {"train_loss": -41.170284271240234, "global_step": 156590, "epoch": 1294} {"train_loss": -40.867496490478516, "global_step": 156591, "epoch": 1294} {"train_loss": -40.484676361083984, "global_step": 156592, "epoch": 1294} {"train_loss": -41.08705139160156, "global_step": 156593, "epoch": 1294} {"train_loss": -41.28626251220703, "global_step": 156594, "epoch": 1294} {"train_loss": -40.66960906982422, "global_step": 156595, "epoch": 1294} {"train_loss": -40.440364837646484, "global_step": 156596, "epoch": 1294} {"train_loss": -40.8168830871582, "global_step": 156597, "epoch": 1294} {"train_loss": -40.48273849487305, "global_step": 156598, "epoch": 1294} {"train_loss": -41.01522445678711, "global_step": 156599, "epoch": 1294} {"train_loss": -41.21476745605469, "global_step": 156600, "epoch": 1294} {"train_loss": -40.53495407104492, "global_step": 156601, "epoch": 1294} {"train_loss": -40.92259979248047, "global_step": 156602, "epoch": 1294} {"train_loss": -40.473201751708984, "global_step": 156603, "epoch": 1294} {"train_loss": -40.789424896240234, "global_step": 156604, "epoch": 1294} {"train_loss": -39.50489807128906, "global_step": 156605, "epoch": 1294} {"train_loss": -39.81466293334961, "global_step": 156606, "epoch": 1294} {"train_loss": -39.742958068847656, "global_step": 156607, "epoch": 1294} {"train_loss": -39.835975646972656, "global_step": 156608, "epoch": 1294} {"train_loss": -39.42015075683594, "global_step": 156609, "epoch": 1294} {"train_loss": -40.27312088012695, "global_step": 156610, "epoch": 1294} {"train_loss": -38.8353157043457, "global_step": 156611, "epoch": 1294} {"train_loss": -38.486053466796875, "global_step": 156612, "epoch": 1294} {"train_loss": -40.136531829833984, "global_step": 156613, "epoch": 1294} {"train_loss": -40.3792610168457, "global_step": 156614, "epoch": 1294} {"train_loss": -39.9493408203125, "global_step": 156615, "epoch": 1294} {"train_loss": -39.404052734375, "global_step": 156616, "epoch": 1294} {"train_loss": -39.52009582519531, "global_step": 156617, "epoch": 1294} {"train_loss": -40.18967819213867, "global_step": 156618, "epoch": 1294} {"train_loss": -39.831539154052734, "global_step": 156619, "epoch": 1294} {"train_loss": -40.44989776611328, "global_step": 156620, "epoch": 1294} {"train_loss": -39.912086486816406, "global_step": 156621, "epoch": 1294} {"train_loss": -39.24563217163086, "global_step": 156622, "epoch": 1294} {"train_loss": -39.58228302001953, "global_step": 156623, "epoch": 1294} {"train_loss": -39.970848083496094, "global_step": 156624, "epoch": 1294} {"train_loss": -40.44401168823242, "global_step": 156625, "epoch": 1294} {"train_loss": -39.82677459716797, "global_step": 156626, "epoch": 1294} {"train_loss": -40.207862854003906, "global_step": 156627, "epoch": 1294} {"train_loss": -39.83062744140625, "global_step": 156628, "epoch": 1294} {"train_loss": -40.27712631225586, "global_step": 156629, "epoch": 1294} {"train_loss": -39.71044921875, "global_step": 156630, "epoch": 1294} {"train_loss": -40.14574432373047, "global_step": 156631, "epoch": 1294} {"train_loss": -40.18342208862305, "global_step": 156632, "epoch": 1294} {"train_loss": -37.35411834716797, "global_step": 156633, "epoch": 1294} {"train_loss": -40.27559280395508, "global_step": 156634, "epoch": 1294} {"train_loss": -40.02128219604492, "global_step": 156635, "epoch": 1294} {"train_loss": -39.92843246459961, "global_step": 156636, "epoch": 1294} {"train_loss": -39.97268295288086, "global_step": 156637, "epoch": 1294} {"train_loss": -40.279972076416016, "global_step": 156638, "epoch": 1294} {"train_loss": -41.009273529052734, "global_step": 156639, "epoch": 1294} {"train_loss": -39.62038803100586, "global_step": 156640, "epoch": 1294} {"train_loss": -40.298152923583984, "global_step": 156641, "epoch": 1294} {"train_loss": -40.52447509765625, "global_step": 156642, "epoch": 1294} {"train_loss": -40.63957977294922, "global_step": 156643, "epoch": 1294} {"train_loss": -40.590084075927734, "global_step": 156644, "epoch": 1294} {"train_loss": -40.700496673583984, "global_step": 156645, "epoch": 1294} {"train_loss": -39.591552734375, "global_step": 156646, "epoch": 1294} {"train_loss": -40.15047836303711, "global_step": 156647, "epoch": 1294} {"train_loss": -40.91044235229492, "global_step": 156648, "epoch": 1294} {"train_loss": -40.42778396606445, "global_step": 156649, "epoch": 1294} {"train_loss": -40.10475540161133, "global_step": 156650, "epoch": 1294} {"train_loss": -40.62672805786133, "global_step": 156651, "epoch": 1294} {"train_loss": -40.88981246948242, "global_step": 156652, "epoch": 1294} {"train_loss": -40.969459533691406, "global_step": 156653, "epoch": 1294} {"train_loss": -40.49485397338867, "global_step": 156654, "epoch": 1294} {"train_loss": -40.57249069213867, "global_step": 156655, "epoch": 1294} {"train_loss": -39.839813232421875, "global_step": 156656, "epoch": 1294} {"train_loss": -40.89207077026367, "global_step": 156657, "epoch": 1294} {"train_loss": -40.32100296020508, "global_step": 156658, "epoch": 1294} {"train_loss": -40.56321716308594, "global_step": 156659, "epoch": 1294} {"train_loss": -39.54173278808594, "global_step": 156660, "epoch": 1294} {"train_loss": -39.280269622802734, "global_step": 156661, "epoch": 1294} {"train_loss": -39.28137969970703, "global_step": 156662, "epoch": 1294} {"train_loss": -39.2834587097168, "global_step": 156663, "epoch": 1294} {"train_loss": -37.63753890991211, "global_step": 156664, "epoch": 1294} {"train_loss": -37.0064697265625, "global_step": 156665, "epoch": 1294} {"train_loss": -35.18595504760742, "global_step": 156666, "epoch": 1294} {"train_loss": -38.394622802734375, "global_step": 156667, "epoch": 1294} {"train_loss": -37.9614143371582, "global_step": 156668, "epoch": 1294} {"train_loss": -35.7253303527832, "global_step": 156669, "epoch": 1294} {"train_loss": -34.2315673828125, "global_step": 156670, "epoch": 1294} {"train_loss": -38.61146545410156, "global_step": 156671, "epoch": 1294} {"train_loss": -33.10017013549805, "global_step": 156672, "epoch": 1294} {"train_loss": -34.28928756713867, "global_step": 156673, "epoch": 1294} {"train_loss": -34.753501892089844, "global_step": 156674, "epoch": 1294} {"train_loss": -36.4739990234375, "global_step": 156675, "epoch": 1294} {"train_loss": -33.972450256347656, "global_step": 156676, "epoch": 1294} {"train_loss": -38.47827911376953, "global_step": 156677, "epoch": 1294} {"train_loss": -37.244014739990234, "global_step": 156678, "epoch": 1294} {"train_loss": -37.28178024291992, "global_step": 156679, "epoch": 1294} {"train_loss": -37.0074577331543, "global_step": 156680, "epoch": 1294} {"train_loss": -36.620849609375, "global_step": 156681, "epoch": 1294} {"train_loss": -38.80513381958008, "global_step": 156682, "epoch": 1294} {"train_loss": -32.57084274291992, "global_step": 156683, "epoch": 1294} {"train_loss": -34.1059684753418, "global_step": 156684, "epoch": 1294} {"train_loss": -34.1693000793457, "global_step": 156685, "epoch": 1294} {"train_loss": -37.96599197387695, "global_step": 156686, "epoch": 1294} {"train_loss": -37.139442443847656, "global_step": 156687, "epoch": 1294} {"train_loss": -35.53669357299805, "global_step": 156688, "epoch": 1294} {"train_loss": -36.955318450927734, "global_step": 156689, "epoch": 1294} {"train_loss": -35.121707916259766, "global_step": 156690, "epoch": 1294} {"train_loss": -39.06812286376953, "global_step": 156691, "epoch": 1294} {"train_loss": -36.59882736206055, "global_step": 156692, "epoch": 1294} {"train_loss": -32.493629455566406, "global_step": 156693, "epoch": 1294} {"train_loss": -39.13097116769838, "global_step": 156694, "epoch": 1294, "val_loss": 2494361.0} {"train_loss": -35.27373123168945, "global_step": 156695, "epoch": 1295} {"train_loss": -36.035545349121094, "global_step": 156696, "epoch": 1295} {"train_loss": -32.456661224365234, "global_step": 156697, "epoch": 1295} {"train_loss": -35.160743713378906, "global_step": 156698, "epoch": 1295} {"train_loss": -35.6353645324707, "global_step": 156699, "epoch": 1295} {"train_loss": -36.68716049194336, "global_step": 156700, "epoch": 1295} {"train_loss": -35.66357421875, "global_step": 156701, "epoch": 1295} {"train_loss": -29.813241958618164, "global_step": 156702, "epoch": 1295} {"train_loss": -36.39948654174805, "global_step": 156703, "epoch": 1295} {"train_loss": -31.379196166992188, "global_step": 156704, "epoch": 1295} {"train_loss": -38.07689666748047, "global_step": 156705, "epoch": 1295} {"train_loss": -34.015045166015625, "global_step": 156706, "epoch": 1295} {"train_loss": -37.243709564208984, "global_step": 156707, "epoch": 1295} {"train_loss": -36.9781494140625, "global_step": 156708, "epoch": 1295} {"train_loss": -35.31901168823242, "global_step": 156709, "epoch": 1295} {"train_loss": -37.54653549194336, "global_step": 156710, "epoch": 1295} {"train_loss": -37.02627182006836, "global_step": 156711, "epoch": 1295} {"train_loss": -37.97813034057617, "global_step": 156712, "epoch": 1295} {"train_loss": -37.75782012939453, "global_step": 156713, "epoch": 1295} {"train_loss": -38.49488067626953, "global_step": 156714, "epoch": 1295} {"train_loss": -37.7923583984375, "global_step": 156715, "epoch": 1295} {"train_loss": -38.25648880004883, "global_step": 156716, "epoch": 1295} {"train_loss": -38.614051818847656, "global_step": 156717, "epoch": 1295} {"train_loss": -38.764373779296875, "global_step": 156718, "epoch": 1295} {"train_loss": -38.11686325073242, "global_step": 156719, "epoch": 1295} {"train_loss": -38.78812026977539, "global_step": 156720, "epoch": 1295} {"train_loss": -38.39345932006836, "global_step": 156721, "epoch": 1295} {"train_loss": -39.00492477416992, "global_step": 156722, "epoch": 1295} {"train_loss": -38.7711181640625, "global_step": 156723, "epoch": 1295} {"train_loss": -38.87508773803711, "global_step": 156724, "epoch": 1295} {"train_loss": -39.02777099609375, "global_step": 156725, "epoch": 1295} {"train_loss": -39.20536422729492, "global_step": 156726, "epoch": 1295} {"train_loss": -38.49082565307617, "global_step": 156727, "epoch": 1295} {"train_loss": -39.26680374145508, "global_step": 156728, "epoch": 1295} {"train_loss": -39.284400939941406, "global_step": 156729, "epoch": 1295} {"train_loss": -39.23984146118164, "global_step": 156730, "epoch": 1295} {"train_loss": -38.92433166503906, "global_step": 156731, "epoch": 1295} {"train_loss": -39.58049392700195, "global_step": 156732, "epoch": 1295} {"train_loss": -39.57512283325195, "global_step": 156733, "epoch": 1295} {"train_loss": -39.538719177246094, "global_step": 156734, "epoch": 1295} {"train_loss": -39.303653717041016, "global_step": 156735, "epoch": 1295} {"train_loss": -38.952606201171875, "global_step": 156736, "epoch": 1295} {"train_loss": -39.58186721801758, "global_step": 156737, "epoch": 1295} {"train_loss": -39.7636833190918, "global_step": 156738, "epoch": 1295} {"train_loss": -39.311988830566406, "global_step": 156739, "epoch": 1295} {"train_loss": -34.710384368896484, "global_step": 156740, "epoch": 1295} {"train_loss": -39.90391159057617, "global_step": 156741, "epoch": 1295} {"train_loss": -39.88657760620117, "global_step": 156742, "epoch": 1295} {"train_loss": -39.6888313293457, "global_step": 156743, "epoch": 1295} {"train_loss": -39.90354537963867, "global_step": 156744, "epoch": 1295} {"train_loss": -39.478546142578125, "global_step": 156745, "epoch": 1295} {"train_loss": -39.7337532043457, "global_step": 156746, "epoch": 1295} {"train_loss": -39.49732971191406, "global_step": 156747, "epoch": 1295} {"train_loss": -39.15517044067383, "global_step": 156748, "epoch": 1295} {"train_loss": -39.93229675292969, "global_step": 156749, "epoch": 1295} {"train_loss": -39.06972885131836, "global_step": 156750, "epoch": 1295} {"train_loss": -39.567901611328125, "global_step": 156751, "epoch": 1295} {"train_loss": -39.71113967895508, "global_step": 156752, "epoch": 1295} {"train_loss": -39.631385803222656, "global_step": 156753, "epoch": 1295} {"train_loss": -39.86977767944336, "global_step": 156754, "epoch": 1295} {"train_loss": -39.68533706665039, "global_step": 156755, "epoch": 1295} {"train_loss": -40.220008850097656, "global_step": 156756, "epoch": 1295} {"train_loss": -40.109710693359375, "global_step": 156757, "epoch": 1295} {"train_loss": -39.805171966552734, "global_step": 156758, "epoch": 1295} {"train_loss": -39.96958923339844, "global_step": 156759, "epoch": 1295} {"train_loss": -40.0908088684082, "global_step": 156760, "epoch": 1295} {"train_loss": -39.88212203979492, "global_step": 156761, "epoch": 1295} {"train_loss": -39.902381896972656, "global_step": 156762, "epoch": 1295} {"train_loss": -39.39778518676758, "global_step": 156763, "epoch": 1295} {"train_loss": -40.66550827026367, "global_step": 156764, "epoch": 1295} {"train_loss": -40.53227615356445, "global_step": 156765, "epoch": 1295} {"train_loss": -40.41587829589844, "global_step": 156766, "epoch": 1295} {"train_loss": -39.72441482543945, "global_step": 156767, "epoch": 1295} {"train_loss": -40.51469802856445, "global_step": 156768, "epoch": 1295} {"train_loss": -40.73763656616211, "global_step": 156769, "epoch": 1295} {"train_loss": -40.38796615600586, "global_step": 156770, "epoch": 1295} {"train_loss": -40.44203567504883, "global_step": 156771, "epoch": 1295} {"train_loss": -40.52758026123047, "global_step": 156772, "epoch": 1295} {"train_loss": -39.982765197753906, "global_step": 156773, "epoch": 1295} {"train_loss": -40.275325775146484, "global_step": 156774, "epoch": 1295} {"train_loss": -40.67759323120117, "global_step": 156775, "epoch": 1295} {"train_loss": -40.78147506713867, "global_step": 156776, "epoch": 1295} {"train_loss": -40.81084060668945, "global_step": 156777, "epoch": 1295} {"train_loss": -39.92402267456055, "global_step": 156778, "epoch": 1295} {"train_loss": -39.95524215698242, "global_step": 156779, "epoch": 1295} {"train_loss": -40.3898811340332, "global_step": 156780, "epoch": 1295} {"train_loss": -40.91362380981445, "global_step": 156781, "epoch": 1295} {"train_loss": -40.77704620361328, "global_step": 156782, "epoch": 1295} {"train_loss": -40.76000213623047, "global_step": 156783, "epoch": 1295} {"train_loss": -41.0710563659668, "global_step": 156784, "epoch": 1295} {"train_loss": -40.60148239135742, "global_step": 156785, "epoch": 1295} {"train_loss": -41.12746047973633, "global_step": 156786, "epoch": 1295} {"train_loss": -40.440914154052734, "global_step": 156787, "epoch": 1295} {"train_loss": -41.2041130065918, "global_step": 156788, "epoch": 1295} {"train_loss": -40.97269821166992, "global_step": 156789, "epoch": 1295} {"train_loss": -40.706390380859375, "global_step": 156790, "epoch": 1295} {"train_loss": -40.340126037597656, "global_step": 156791, "epoch": 1295} {"train_loss": -40.291534423828125, "global_step": 156792, "epoch": 1295} {"train_loss": -38.061073303222656, "global_step": 156793, "epoch": 1295} {"train_loss": -37.537353515625, "global_step": 156794, "epoch": 1295} {"train_loss": -37.786354064941406, "global_step": 156795, "epoch": 1295} {"train_loss": -38.4365234375, "global_step": 156796, "epoch": 1295} {"train_loss": -41.259586334228516, "global_step": 156797, "epoch": 1295} {"train_loss": -40.389339447021484, "global_step": 156798, "epoch": 1295} {"train_loss": -40.59886932373047, "global_step": 156799, "epoch": 1295} {"train_loss": -40.07843780517578, "global_step": 156800, "epoch": 1295} {"train_loss": -40.03401565551758, "global_step": 156801, "epoch": 1295} {"train_loss": -39.06635284423828, "global_step": 156802, "epoch": 1295} {"train_loss": -38.5384635925293, "global_step": 156803, "epoch": 1295} {"train_loss": -38.87770080566406, "global_step": 156804, "epoch": 1295} {"train_loss": -39.67226791381836, "global_step": 156805, "epoch": 1295} {"train_loss": -40.97147750854492, "global_step": 156806, "epoch": 1295} {"train_loss": -41.01389694213867, "global_step": 156807, "epoch": 1295} {"train_loss": -40.89288330078125, "global_step": 156808, "epoch": 1295} {"train_loss": -40.18952560424805, "global_step": 156809, "epoch": 1295} {"train_loss": -40.958309173583984, "global_step": 156810, "epoch": 1295} {"train_loss": -40.28524398803711, "global_step": 156811, "epoch": 1295} {"train_loss": -40.03994369506836, "global_step": 156812, "epoch": 1295} {"train_loss": -39.56600570678711, "global_step": 156813, "epoch": 1295} {"train_loss": -40.40632629394531, "global_step": 156814, "epoch": 1295} {"train_loss": -39.08794776664293, "global_step": 156815, "epoch": 1295, "val_loss": 2634719.25} {"train_loss": -40.66804122924805, "global_step": 156816, "epoch": 1296} {"train_loss": -39.98105239868164, "global_step": 156817, "epoch": 1296} {"train_loss": -40.14801025390625, "global_step": 156818, "epoch": 1296} {"train_loss": -40.94807815551758, "global_step": 156819, "epoch": 1296} {"train_loss": -41.10895919799805, "global_step": 156820, "epoch": 1296} {"train_loss": -40.33465576171875, "global_step": 156821, "epoch": 1296} {"train_loss": -40.21744918823242, "global_step": 156822, "epoch": 1296} {"train_loss": -39.57419204711914, "global_step": 156823, "epoch": 1296} {"train_loss": -39.397090911865234, "global_step": 156824, "epoch": 1296} {"train_loss": -40.34147262573242, "global_step": 156825, "epoch": 1296} {"train_loss": -39.476165771484375, "global_step": 156826, "epoch": 1296} {"train_loss": -40.10173416137695, "global_step": 156827, "epoch": 1296} {"train_loss": -40.1620979309082, "global_step": 156828, "epoch": 1296} {"train_loss": -40.446990966796875, "global_step": 156829, "epoch": 1296} {"train_loss": -37.83858108520508, "global_step": 156830, "epoch": 1296} {"train_loss": -40.92971420288086, "global_step": 156831, "epoch": 1296} {"train_loss": -38.28316879272461, "global_step": 156832, "epoch": 1296} {"train_loss": -40.104461669921875, "global_step": 156833, "epoch": 1296} {"train_loss": -39.20532989501953, "global_step": 156834, "epoch": 1296} {"train_loss": -40.293880462646484, "global_step": 156835, "epoch": 1296} {"train_loss": -40.82294845581055, "global_step": 156836, "epoch": 1296} {"train_loss": -40.01112747192383, "global_step": 156837, "epoch": 1296} {"train_loss": -39.05647659301758, "global_step": 156838, "epoch": 1296} {"train_loss": -40.29952621459961, "global_step": 156839, "epoch": 1296} {"train_loss": -39.755104064941406, "global_step": 156840, "epoch": 1296} {"train_loss": -39.818634033203125, "global_step": 156841, "epoch": 1296} {"train_loss": -40.5419921875, "global_step": 156842, "epoch": 1296} {"train_loss": -40.736541748046875, "global_step": 156843, "epoch": 1296} {"train_loss": -40.77695846557617, "global_step": 156844, "epoch": 1296} {"train_loss": -40.347564697265625, "global_step": 156845, "epoch": 1296} {"train_loss": -40.760292053222656, "global_step": 156846, "epoch": 1296} {"train_loss": -40.57761764526367, "global_step": 156847, "epoch": 1296} {"train_loss": -40.52417755126953, "global_step": 156848, "epoch": 1296} {"train_loss": -40.003841400146484, "global_step": 156849, "epoch": 1296} {"train_loss": -40.29203796386719, "global_step": 156850, "epoch": 1296} {"train_loss": -40.912288665771484, "global_step": 156851, "epoch": 1296} {"train_loss": -39.40183639526367, "global_step": 156852, "epoch": 1296} {"train_loss": -39.45841598510742, "global_step": 156853, "epoch": 1296} {"train_loss": -39.87795639038086, "global_step": 156854, "epoch": 1296} {"train_loss": -40.0, "global_step": 156855, "epoch": 1296} {"train_loss": -39.980987548828125, "global_step": 156856, "epoch": 1296} {"train_loss": -38.47508239746094, "global_step": 156857, "epoch": 1296} {"train_loss": -38.83012008666992, "global_step": 156858, "epoch": 1296} {"train_loss": -39.53861618041992, "global_step": 156859, "epoch": 1296} {"train_loss": -39.971412658691406, "global_step": 156860, "epoch": 1296} {"train_loss": -40.62051773071289, "global_step": 156861, "epoch": 1296} {"train_loss": -38.8272819519043, "global_step": 156862, "epoch": 1296} {"train_loss": -39.82516098022461, "global_step": 156863, "epoch": 1296} {"train_loss": -41.12324523925781, "global_step": 156864, "epoch": 1296} {"train_loss": -40.09892654418945, "global_step": 156865, "epoch": 1296} {"train_loss": -40.754390716552734, "global_step": 156866, "epoch": 1296} {"train_loss": -40.641719818115234, "global_step": 156867, "epoch": 1296} {"train_loss": -39.498470306396484, "global_step": 156868, "epoch": 1296} {"train_loss": -40.5372428894043, "global_step": 156869, "epoch": 1296} {"train_loss": -40.502742767333984, "global_step": 156870, "epoch": 1296} {"train_loss": -39.895320892333984, "global_step": 156871, "epoch": 1296} {"train_loss": -39.88535690307617, "global_step": 156872, "epoch": 1296} {"train_loss": -39.78593063354492, "global_step": 156873, "epoch": 1296} {"train_loss": -39.69742965698242, "global_step": 156874, "epoch": 1296} {"train_loss": -40.63947677612305, "global_step": 156875, "epoch": 1296} {"train_loss": -39.697750091552734, "global_step": 156876, "epoch": 1296} {"train_loss": -40.41557693481445, "global_step": 156877, "epoch": 1296} {"train_loss": -39.212257385253906, "global_step": 156878, "epoch": 1296} {"train_loss": -38.80718994140625, "global_step": 156879, "epoch": 1296} {"train_loss": -41.07382583618164, "global_step": 156880, "epoch": 1296} {"train_loss": -39.50517272949219, "global_step": 156881, "epoch": 1296} {"train_loss": -30.104772567749023, "global_step": 156882, "epoch": 1296} {"train_loss": -38.53994369506836, "global_step": 156883, "epoch": 1296} {"train_loss": -40.49522399902344, "global_step": 156884, "epoch": 1296} {"train_loss": -38.51859664916992, "global_step": 156885, "epoch": 1296} {"train_loss": -37.211185455322266, "global_step": 156886, "epoch": 1296} {"train_loss": -37.23714065551758, "global_step": 156887, "epoch": 1296} {"train_loss": -37.19319152832031, "global_step": 156888, "epoch": 1296} {"train_loss": -35.66815185546875, "global_step": 156889, "epoch": 1296} {"train_loss": -39.72343063354492, "global_step": 156890, "epoch": 1296} {"train_loss": -37.64949417114258, "global_step": 156891, "epoch": 1296} {"train_loss": -35.67824172973633, "global_step": 156892, "epoch": 1296} {"train_loss": -37.94483947753906, "global_step": 156893, "epoch": 1296} {"train_loss": -37.93262481689453, "global_step": 156894, "epoch": 1296} {"train_loss": -35.32501220703125, "global_step": 156895, "epoch": 1296} {"train_loss": -38.23653793334961, "global_step": 156896, "epoch": 1296} {"train_loss": -39.20478439331055, "global_step": 156897, "epoch": 1296} {"train_loss": -38.09550857543945, "global_step": 156898, "epoch": 1296} {"train_loss": -36.91170883178711, "global_step": 156899, "epoch": 1296} {"train_loss": -37.3864631652832, "global_step": 156900, "epoch": 1296} {"train_loss": -37.095184326171875, "global_step": 156901, "epoch": 1296} {"train_loss": -39.25649642944336, "global_step": 156902, "epoch": 1296} {"train_loss": -38.1920280456543, "global_step": 156903, "epoch": 1296} {"train_loss": -37.96821212768555, "global_step": 156904, "epoch": 1296} {"train_loss": -38.283287048339844, "global_step": 156905, "epoch": 1296} {"train_loss": -38.9658317565918, "global_step": 156906, "epoch": 1296} {"train_loss": -38.0011100769043, "global_step": 156907, "epoch": 1296} {"train_loss": -39.183441162109375, "global_step": 156908, "epoch": 1296} {"train_loss": -35.536041259765625, "global_step": 156909, "epoch": 1296} {"train_loss": -35.43084716796875, "global_step": 156910, "epoch": 1296} {"train_loss": -37.601531982421875, "global_step": 156911, "epoch": 1296} {"train_loss": -39.14203643798828, "global_step": 156912, "epoch": 1296} {"train_loss": -38.301513671875, "global_step": 156913, "epoch": 1296} {"train_loss": -38.448055267333984, "global_step": 156914, "epoch": 1296} {"train_loss": -37.03456497192383, "global_step": 156915, "epoch": 1296} {"train_loss": -37.315425872802734, "global_step": 156916, "epoch": 1296} {"train_loss": -39.36314010620117, "global_step": 156917, "epoch": 1296} {"train_loss": -38.68877029418945, "global_step": 156918, "epoch": 1296} {"train_loss": -39.189598083496094, "global_step": 156919, "epoch": 1296} {"train_loss": -39.856056213378906, "global_step": 156920, "epoch": 1296} {"train_loss": -38.66688537597656, "global_step": 156921, "epoch": 1296} {"train_loss": -37.2944221496582, "global_step": 156922, "epoch": 1296} {"train_loss": -39.51594924926758, "global_step": 156923, "epoch": 1296} {"train_loss": -38.10466384887695, "global_step": 156924, "epoch": 1296} {"train_loss": -39.24644470214844, "global_step": 156925, "epoch": 1296} {"train_loss": -38.73482131958008, "global_step": 156926, "epoch": 1296} {"train_loss": -39.00055694580078, "global_step": 156927, "epoch": 1296} {"train_loss": -38.83736801147461, "global_step": 156928, "epoch": 1296} {"train_loss": -38.94868850708008, "global_step": 156929, "epoch": 1296} {"train_loss": -38.757530212402344, "global_step": 156930, "epoch": 1296} {"train_loss": -39.282875061035156, "global_step": 156931, "epoch": 1296} {"train_loss": -39.33380889892578, "global_step": 156932, "epoch": 1296} {"train_loss": -38.497676849365234, "global_step": 156933, "epoch": 1296} {"train_loss": -39.30296325683594, "global_step": 156934, "epoch": 1296} {"train_loss": -39.252105712890625, "global_step": 156935, "epoch": 1296} {"train_loss": -39.137696715425854, "global_step": 156936, "epoch": 1296, "val_loss": 2613407.0} {"train_loss": -36.780452728271484, "global_step": 156937, "epoch": 1297} {"train_loss": -39.41526412963867, "global_step": 156938, "epoch": 1297} {"train_loss": -39.12800598144531, "global_step": 156939, "epoch": 1297} {"train_loss": -39.41904830932617, "global_step": 156940, "epoch": 1297} {"train_loss": -38.045772552490234, "global_step": 156941, "epoch": 1297} {"train_loss": -39.463863372802734, "global_step": 156942, "epoch": 1297} {"train_loss": -40.688655853271484, "global_step": 156943, "epoch": 1297} {"train_loss": -39.527706146240234, "global_step": 156944, "epoch": 1297} {"train_loss": -38.976436614990234, "global_step": 156945, "epoch": 1297} {"train_loss": -39.136043548583984, "global_step": 156946, "epoch": 1297} {"train_loss": -39.7067756652832, "global_step": 156947, "epoch": 1297} {"train_loss": -39.77979278564453, "global_step": 156948, "epoch": 1297} {"train_loss": -38.63761520385742, "global_step": 156949, "epoch": 1297} {"train_loss": -40.03963851928711, "global_step": 156950, "epoch": 1297} {"train_loss": -40.12461471557617, "global_step": 156951, "epoch": 1297} {"train_loss": -39.297725677490234, "global_step": 156952, "epoch": 1297} {"train_loss": -40.167572021484375, "global_step": 156953, "epoch": 1297} {"train_loss": -40.1191520690918, "global_step": 156954, "epoch": 1297} {"train_loss": -40.259368896484375, "global_step": 156955, "epoch": 1297} {"train_loss": -39.935367584228516, "global_step": 156956, "epoch": 1297} {"train_loss": -39.63801193237305, "global_step": 156957, "epoch": 1297} {"train_loss": -38.06034469604492, "global_step": 156958, "epoch": 1297} {"train_loss": -40.19725036621094, "global_step": 156959, "epoch": 1297} {"train_loss": -40.725345611572266, "global_step": 156960, "epoch": 1297} {"train_loss": -40.141624450683594, "global_step": 156961, "epoch": 1297} {"train_loss": -40.65705490112305, "global_step": 156962, "epoch": 1297} {"train_loss": -39.68034362792969, "global_step": 156963, "epoch": 1297} {"train_loss": -40.311065673828125, "global_step": 156964, "epoch": 1297} {"train_loss": -39.926429748535156, "global_step": 156965, "epoch": 1297} {"train_loss": -40.47435760498047, "global_step": 156966, "epoch": 1297} {"train_loss": -39.07597351074219, "global_step": 156967, "epoch": 1297} {"train_loss": -39.66233444213867, "global_step": 156968, "epoch": 1297} {"train_loss": -40.03399658203125, "global_step": 156969, "epoch": 1297} {"train_loss": -40.02805709838867, "global_step": 156970, "epoch": 1297} {"train_loss": -39.76696014404297, "global_step": 156971, "epoch": 1297} {"train_loss": -38.31383514404297, "global_step": 156972, "epoch": 1297} {"train_loss": -39.38010787963867, "global_step": 156973, "epoch": 1297} {"train_loss": -40.1346549987793, "global_step": 156974, "epoch": 1297} {"train_loss": -39.720516204833984, "global_step": 156975, "epoch": 1297} {"train_loss": -39.768287658691406, "global_step": 156976, "epoch": 1297} {"train_loss": -39.911407470703125, "global_step": 156977, "epoch": 1297} {"train_loss": -40.28533172607422, "global_step": 156978, "epoch": 1297} {"train_loss": -40.29397201538086, "global_step": 156979, "epoch": 1297} {"train_loss": -40.05965042114258, "global_step": 156980, "epoch": 1297} {"train_loss": -40.609344482421875, "global_step": 156981, "epoch": 1297} {"train_loss": -38.49567794799805, "global_step": 156982, "epoch": 1297} {"train_loss": -40.164127349853516, "global_step": 156983, "epoch": 1297} {"train_loss": -39.4339714050293, "global_step": 156984, "epoch": 1297} {"train_loss": -40.05921173095703, "global_step": 156985, "epoch": 1297} {"train_loss": -39.93562698364258, "global_step": 156986, "epoch": 1297} {"train_loss": -40.577728271484375, "global_step": 156987, "epoch": 1297} {"train_loss": -40.44089889526367, "global_step": 156988, "epoch": 1297} {"train_loss": -37.44734573364258, "global_step": 156989, "epoch": 1297} {"train_loss": -40.114192962646484, "global_step": 156990, "epoch": 1297} {"train_loss": -38.37443923950195, "global_step": 156991, "epoch": 1297} {"train_loss": -40.105377197265625, "global_step": 156992, "epoch": 1297} {"train_loss": -39.202239990234375, "global_step": 156993, "epoch": 1297} {"train_loss": -37.615509033203125, "global_step": 156994, "epoch": 1297} {"train_loss": -38.16604995727539, "global_step": 156995, "epoch": 1297} {"train_loss": -39.73845672607422, "global_step": 156996, "epoch": 1297} {"train_loss": -40.63690185546875, "global_step": 156997, "epoch": 1297} {"train_loss": -39.7574462890625, "global_step": 156998, "epoch": 1297} {"train_loss": -39.46529769897461, "global_step": 156999, "epoch": 1297} {"train_loss": -39.7723503112793, "global_step": 157000, "epoch": 1297} {"train_loss": -40.3409423828125, "global_step": 157001, "epoch": 1297} {"train_loss": -40.50136184692383, "global_step": 157002, "epoch": 1297} {"train_loss": -39.7497444152832, "global_step": 157003, "epoch": 1297} {"train_loss": -40.033355712890625, "global_step": 157004, "epoch": 1297} {"train_loss": -39.38364791870117, "global_step": 157005, "epoch": 1297} {"train_loss": -39.507320404052734, "global_step": 157006, "epoch": 1297} {"train_loss": -38.51749038696289, "global_step": 157007, "epoch": 1297} {"train_loss": -39.529972076416016, "global_step": 157008, "epoch": 1297} {"train_loss": -40.10236358642578, "global_step": 157009, "epoch": 1297} {"train_loss": -39.377235412597656, "global_step": 157010, "epoch": 1297} {"train_loss": -39.033382415771484, "global_step": 157011, "epoch": 1297} {"train_loss": -38.09558868408203, "global_step": 157012, "epoch": 1297} {"train_loss": -39.58425521850586, "global_step": 157013, "epoch": 1297} {"train_loss": -39.11928939819336, "global_step": 157014, "epoch": 1297} {"train_loss": -39.83274841308594, "global_step": 157015, "epoch": 1297} {"train_loss": -39.779029846191406, "global_step": 157016, "epoch": 1297} {"train_loss": -39.9459114074707, "global_step": 157017, "epoch": 1297} {"train_loss": -39.95060348510742, "global_step": 157018, "epoch": 1297} {"train_loss": -40.35006332397461, "global_step": 157019, "epoch": 1297} {"train_loss": -40.54551696777344, "global_step": 157020, "epoch": 1297} {"train_loss": -41.29265213012695, "global_step": 157021, "epoch": 1297} {"train_loss": -40.95355987548828, "global_step": 157022, "epoch": 1297} {"train_loss": -39.48683547973633, "global_step": 157023, "epoch": 1297} {"train_loss": -39.6036491394043, "global_step": 157024, "epoch": 1297} {"train_loss": -40.3623161315918, "global_step": 157025, "epoch": 1297} {"train_loss": -40.17483901977539, "global_step": 157026, "epoch": 1297} {"train_loss": -40.4276123046875, "global_step": 157027, "epoch": 1297} {"train_loss": -40.79549789428711, "global_step": 157028, "epoch": 1297} {"train_loss": -40.902931213378906, "global_step": 157029, "epoch": 1297} {"train_loss": -40.33704376220703, "global_step": 157030, "epoch": 1297} {"train_loss": -40.53437805175781, "global_step": 157031, "epoch": 1297} {"train_loss": -40.77703857421875, "global_step": 157032, "epoch": 1297} {"train_loss": -41.048587799072266, "global_step": 157033, "epoch": 1297} {"train_loss": -40.71816635131836, "global_step": 157034, "epoch": 1297} {"train_loss": -39.665340423583984, "global_step": 157035, "epoch": 1297} {"train_loss": -39.39039993286133, "global_step": 157036, "epoch": 1297} {"train_loss": -38.359310150146484, "global_step": 157037, "epoch": 1297} {"train_loss": -38.2229118347168, "global_step": 157038, "epoch": 1297} {"train_loss": -39.21787643432617, "global_step": 157039, "epoch": 1297} {"train_loss": -39.825660705566406, "global_step": 157040, "epoch": 1297} {"train_loss": -39.869041442871094, "global_step": 157041, "epoch": 1297} {"train_loss": -40.53615951538086, "global_step": 157042, "epoch": 1297} {"train_loss": -40.60529708862305, "global_step": 157043, "epoch": 1297} {"train_loss": -40.602935791015625, "global_step": 157044, "epoch": 1297} {"train_loss": -40.62537384033203, "global_step": 157045, "epoch": 1297} {"train_loss": -40.625091552734375, "global_step": 157046, "epoch": 1297} {"train_loss": -40.5923957824707, "global_step": 157047, "epoch": 1297} {"train_loss": -40.56493377685547, "global_step": 157048, "epoch": 1297} {"train_loss": -40.88033676147461, "global_step": 157049, "epoch": 1297} {"train_loss": -40.8175048828125, "global_step": 157050, "epoch": 1297} {"train_loss": -40.9703483581543, "global_step": 157051, "epoch": 1297} {"train_loss": -39.64304733276367, "global_step": 157052, "epoch": 1297} {"train_loss": -39.5963134765625, "global_step": 157053, "epoch": 1297} {"train_loss": -39.886348724365234, "global_step": 157054, "epoch": 1297} {"train_loss": -39.96621322631836, "global_step": 157055, "epoch": 1297} {"train_loss": -39.6983528137207, "global_step": 157056, "epoch": 1297} {"train_loss": -39.78989798175402, "global_step": 157057, "epoch": 1297, "val_loss": 2633865.75} {"train_loss": -40.278480529785156, "global_step": 157058, "epoch": 1298} {"train_loss": -40.08439254760742, "global_step": 157059, "epoch": 1298} {"train_loss": -39.64326095581055, "global_step": 157060, "epoch": 1298} {"train_loss": -41.198394775390625, "global_step": 157061, "epoch": 1298} {"train_loss": -39.03837966918945, "global_step": 157062, "epoch": 1298} {"train_loss": -39.53390121459961, "global_step": 157063, "epoch": 1298} {"train_loss": -40.6475715637207, "global_step": 157064, "epoch": 1298} {"train_loss": -40.21273422241211, "global_step": 157065, "epoch": 1298} {"train_loss": -40.37428665161133, "global_step": 157066, "epoch": 1298} {"train_loss": -41.19609451293945, "global_step": 157067, "epoch": 1298} {"train_loss": -40.33150863647461, "global_step": 157068, "epoch": 1298} {"train_loss": -41.125118255615234, "global_step": 157069, "epoch": 1298} {"train_loss": -40.96048355102539, "global_step": 157070, "epoch": 1298} {"train_loss": -39.939178466796875, "global_step": 157071, "epoch": 1298} {"train_loss": -40.56562423706055, "global_step": 157072, "epoch": 1298} {"train_loss": -40.99808883666992, "global_step": 157073, "epoch": 1298} {"train_loss": -39.73371887207031, "global_step": 157074, "epoch": 1298} {"train_loss": -40.86573028564453, "global_step": 157075, "epoch": 1298} {"train_loss": -39.56267166137695, "global_step": 157076, "epoch": 1298} {"train_loss": -39.352569580078125, "global_step": 157077, "epoch": 1298} {"train_loss": -41.12730026245117, "global_step": 157078, "epoch": 1298} {"train_loss": -40.01877975463867, "global_step": 157079, "epoch": 1298} {"train_loss": -40.93183135986328, "global_step": 157080, "epoch": 1298} {"train_loss": -40.839149475097656, "global_step": 157081, "epoch": 1298} {"train_loss": -41.175323486328125, "global_step": 157082, "epoch": 1298} {"train_loss": -41.175533294677734, "global_step": 157083, "epoch": 1298} {"train_loss": -40.12580490112305, "global_step": 157084, "epoch": 1298} {"train_loss": -39.63813018798828, "global_step": 157085, "epoch": 1298} {"train_loss": -41.36642074584961, "global_step": 157086, "epoch": 1298} {"train_loss": -40.15897750854492, "global_step": 157087, "epoch": 1298} {"train_loss": -40.587398529052734, "global_step": 157088, "epoch": 1298} {"train_loss": -40.53422164916992, "global_step": 157089, "epoch": 1298} {"train_loss": -41.32025146484375, "global_step": 157090, "epoch": 1298} {"train_loss": -40.67435073852539, "global_step": 157091, "epoch": 1298} {"train_loss": -40.089332580566406, "global_step": 157092, "epoch": 1298} {"train_loss": -39.53070831298828, "global_step": 157093, "epoch": 1298} {"train_loss": -40.88711166381836, "global_step": 157094, "epoch": 1298} {"train_loss": -40.03826904296875, "global_step": 157095, "epoch": 1298} {"train_loss": -39.2413444519043, "global_step": 157096, "epoch": 1298} {"train_loss": -40.97587203979492, "global_step": 157097, "epoch": 1298} {"train_loss": -39.039737701416016, "global_step": 157098, "epoch": 1298} {"train_loss": -39.29163360595703, "global_step": 157099, "epoch": 1298} {"train_loss": -39.00204086303711, "global_step": 157100, "epoch": 1298} {"train_loss": -41.068851470947266, "global_step": 157101, "epoch": 1298} {"train_loss": -32.65195846557617, "global_step": 157102, "epoch": 1298} {"train_loss": -41.41624069213867, "global_step": 157103, "epoch": 1298} {"train_loss": -40.290340423583984, "global_step": 157104, "epoch": 1298} {"train_loss": -39.84798049926758, "global_step": 157105, "epoch": 1298} {"train_loss": -38.216468811035156, "global_step": 157106, "epoch": 1298} {"train_loss": -38.974117279052734, "global_step": 157107, "epoch": 1298} {"train_loss": -37.833351135253906, "global_step": 157108, "epoch": 1298} {"train_loss": -38.2250862121582, "global_step": 157109, "epoch": 1298} {"train_loss": -35.717323303222656, "global_step": 157110, "epoch": 1298} {"train_loss": -37.94442367553711, "global_step": 157111, "epoch": 1298} {"train_loss": -38.292423248291016, "global_step": 157112, "epoch": 1298} {"train_loss": -40.463172912597656, "global_step": 157113, "epoch": 1298} {"train_loss": -40.098548889160156, "global_step": 157114, "epoch": 1298} {"train_loss": -39.68888473510742, "global_step": 157115, "epoch": 1298} {"train_loss": -36.54291915893555, "global_step": 157116, "epoch": 1298} {"train_loss": -37.198585510253906, "global_step": 157117, "epoch": 1298} {"train_loss": -39.61860275268555, "global_step": 157118, "epoch": 1298} {"train_loss": -39.5200309753418, "global_step": 157119, "epoch": 1298} {"train_loss": -35.89207077026367, "global_step": 157120, "epoch": 1298} {"train_loss": -38.790748596191406, "global_step": 157121, "epoch": 1298} {"train_loss": -38.097145080566406, "global_step": 157122, "epoch": 1298} {"train_loss": -37.96549606323242, "global_step": 157123, "epoch": 1298} {"train_loss": -39.52394104003906, "global_step": 157124, "epoch": 1298} {"train_loss": -38.93402099609375, "global_step": 157125, "epoch": 1298} {"train_loss": -39.356929779052734, "global_step": 157126, "epoch": 1298} {"train_loss": -40.291290283203125, "global_step": 157127, "epoch": 1298} {"train_loss": -37.42133331298828, "global_step": 157128, "epoch": 1298} {"train_loss": -36.46100997924805, "global_step": 157129, "epoch": 1298} {"train_loss": -39.57509994506836, "global_step": 157130, "epoch": 1298} {"train_loss": -39.44514846801758, "global_step": 157131, "epoch": 1298} {"train_loss": -39.98128128051758, "global_step": 157132, "epoch": 1298} {"train_loss": -39.70475387573242, "global_step": 157133, "epoch": 1298} {"train_loss": -40.70869064331055, "global_step": 157134, "epoch": 1298} {"train_loss": -39.29120635986328, "global_step": 157135, "epoch": 1298} {"train_loss": -37.03350830078125, "global_step": 157136, "epoch": 1298} {"train_loss": -40.091915130615234, "global_step": 157137, "epoch": 1298} {"train_loss": -39.438880920410156, "global_step": 157138, "epoch": 1298} {"train_loss": -39.208377838134766, "global_step": 157139, "epoch": 1298} {"train_loss": -39.858680725097656, "global_step": 157140, "epoch": 1298} {"train_loss": -39.011749267578125, "global_step": 157141, "epoch": 1298} {"train_loss": -39.59442901611328, "global_step": 157142, "epoch": 1298} {"train_loss": -39.37535858154297, "global_step": 157143, "epoch": 1298} {"train_loss": -38.1406364440918, "global_step": 157144, "epoch": 1298} {"train_loss": -39.28244400024414, "global_step": 157145, "epoch": 1298} {"train_loss": -39.17686080932617, "global_step": 157146, "epoch": 1298} {"train_loss": -39.31814193725586, "global_step": 157147, "epoch": 1298} {"train_loss": -39.657752990722656, "global_step": 157148, "epoch": 1298} {"train_loss": -38.672821044921875, "global_step": 157149, "epoch": 1298} {"train_loss": -39.416542053222656, "global_step": 157150, "epoch": 1298} {"train_loss": -40.6347541809082, "global_step": 157151, "epoch": 1298} {"train_loss": -40.00254440307617, "global_step": 157152, "epoch": 1298} {"train_loss": -38.90480422973633, "global_step": 157153, "epoch": 1298} {"train_loss": -39.02211380004883, "global_step": 157154, "epoch": 1298} {"train_loss": -40.59687042236328, "global_step": 157155, "epoch": 1298} {"train_loss": -40.38236618041992, "global_step": 157156, "epoch": 1298} {"train_loss": -39.34574508666992, "global_step": 157157, "epoch": 1298} {"train_loss": -40.16672897338867, "global_step": 157158, "epoch": 1298} {"train_loss": -41.065582275390625, "global_step": 157159, "epoch": 1298} {"train_loss": -40.756107330322266, "global_step": 157160, "epoch": 1298} {"train_loss": -40.10713577270508, "global_step": 157161, "epoch": 1298} {"train_loss": -40.496185302734375, "global_step": 157162, "epoch": 1298} {"train_loss": -39.80875778198242, "global_step": 157163, "epoch": 1298} {"train_loss": -40.38683319091797, "global_step": 157164, "epoch": 1298} {"train_loss": -40.225746154785156, "global_step": 157165, "epoch": 1298} {"train_loss": -40.67867660522461, "global_step": 157166, "epoch": 1298} {"train_loss": -40.63943862915039, "global_step": 157167, "epoch": 1298} {"train_loss": -38.92511749267578, "global_step": 157168, "epoch": 1298} {"train_loss": -41.06612777709961, "global_step": 157169, "epoch": 1298} {"train_loss": -41.09746170043945, "global_step": 157170, "epoch": 1298} {"train_loss": -40.53721237182617, "global_step": 157171, "epoch": 1298} {"train_loss": -40.30146408081055, "global_step": 157172, "epoch": 1298} {"train_loss": -41.035213470458984, "global_step": 157173, "epoch": 1298} {"train_loss": -40.806373596191406, "global_step": 157174, "epoch": 1298} {"train_loss": -40.6800651550293, "global_step": 157175, "epoch": 1298} {"train_loss": -41.18376922607422, "global_step": 157176, "epoch": 1298} {"train_loss": -40.79131317138672, "global_step": 157177, "epoch": 1298} {"train_loss": -39.713362165719026, "global_step": 157178, "epoch": 1298, "val_loss": 2492113.5} {"train_loss": -39.93726348876953, "global_step": 157179, "epoch": 1299} {"train_loss": -39.90406036376953, "global_step": 157180, "epoch": 1299} {"train_loss": -40.85795211791992, "global_step": 157181, "epoch": 1299} {"train_loss": -39.72817611694336, "global_step": 157182, "epoch": 1299} {"train_loss": -39.78567123413086, "global_step": 157183, "epoch": 1299} {"train_loss": -40.634803771972656, "global_step": 157184, "epoch": 1299} {"train_loss": -39.979644775390625, "global_step": 157185, "epoch": 1299} {"train_loss": -38.925575256347656, "global_step": 157186, "epoch": 1299} {"train_loss": -40.565425872802734, "global_step": 157187, "epoch": 1299} {"train_loss": -41.10419464111328, "global_step": 157188, "epoch": 1299} {"train_loss": -40.0566291809082, "global_step": 157189, "epoch": 1299} {"train_loss": -40.344722747802734, "global_step": 157190, "epoch": 1299} {"train_loss": -40.32291793823242, "global_step": 157191, "epoch": 1299} {"train_loss": -39.870262145996094, "global_step": 157192, "epoch": 1299} {"train_loss": -39.99099349975586, "global_step": 157193, "epoch": 1299} {"train_loss": -40.10184097290039, "global_step": 157194, "epoch": 1299} {"train_loss": -40.13688278198242, "global_step": 157195, "epoch": 1299} {"train_loss": -39.62303161621094, "global_step": 157196, "epoch": 1299} {"train_loss": -40.140724182128906, "global_step": 157197, "epoch": 1299} {"train_loss": -40.735389709472656, "global_step": 157198, "epoch": 1299} {"train_loss": -39.8748893737793, "global_step": 157199, "epoch": 1299} {"train_loss": -40.35343551635742, "global_step": 157200, "epoch": 1299} {"train_loss": -40.46535110473633, "global_step": 157201, "epoch": 1299} {"train_loss": -41.142547607421875, "global_step": 157202, "epoch": 1299} {"train_loss": -39.76821517944336, "global_step": 157203, "epoch": 1299} {"train_loss": -38.617000579833984, "global_step": 157204, "epoch": 1299} {"train_loss": -39.80009841918945, "global_step": 157205, "epoch": 1299} {"train_loss": -36.241615295410156, "global_step": 157206, "epoch": 1299} {"train_loss": -38.595619201660156, "global_step": 157207, "epoch": 1299} {"train_loss": -39.614994049072266, "global_step": 157208, "epoch": 1299} {"train_loss": -39.1429328918457, "global_step": 157209, "epoch": 1299} {"train_loss": -37.302825927734375, "global_step": 157210, "epoch": 1299} {"train_loss": -36.3091926574707, "global_step": 157211, "epoch": 1299} {"train_loss": -36.12226104736328, "global_step": 157212, "epoch": 1299} {"train_loss": -39.32759094238281, "global_step": 157213, "epoch": 1299} {"train_loss": -38.69912338256836, "global_step": 157214, "epoch": 1299} {"train_loss": -38.289031982421875, "global_step": 157215, "epoch": 1299} {"train_loss": -38.7152214050293, "global_step": 157216, "epoch": 1299} {"train_loss": -39.381553649902344, "global_step": 157217, "epoch": 1299} {"train_loss": -39.53217697143555, "global_step": 157218, "epoch": 1299} {"train_loss": -39.191505432128906, "global_step": 157219, "epoch": 1299} {"train_loss": -40.016334533691406, "global_step": 157220, "epoch": 1299} {"train_loss": -38.6158447265625, "global_step": 157221, "epoch": 1299} {"train_loss": -39.70984649658203, "global_step": 157222, "epoch": 1299} {"train_loss": -40.61505126953125, "global_step": 157223, "epoch": 1299} {"train_loss": -40.30654525756836, "global_step": 157224, "epoch": 1299} {"train_loss": -38.92995071411133, "global_step": 157225, "epoch": 1299} {"train_loss": -40.82188034057617, "global_step": 157226, "epoch": 1299} {"train_loss": -40.80195999145508, "global_step": 157227, "epoch": 1299} {"train_loss": -39.58637619018555, "global_step": 157228, "epoch": 1299} {"train_loss": -39.65134811401367, "global_step": 157229, "epoch": 1299} {"train_loss": -40.07894515991211, "global_step": 157230, "epoch": 1299} {"train_loss": -40.50067138671875, "global_step": 157231, "epoch": 1299} {"train_loss": -39.790008544921875, "global_step": 157232, "epoch": 1299} {"train_loss": -40.508033752441406, "global_step": 157233, "epoch": 1299} {"train_loss": -39.875850677490234, "global_step": 157234, "epoch": 1299} {"train_loss": -40.54301071166992, "global_step": 157235, "epoch": 1299} {"train_loss": -40.30202102661133, "global_step": 157236, "epoch": 1299} {"train_loss": -40.12051010131836, "global_step": 157237, "epoch": 1299} {"train_loss": -40.5110969543457, "global_step": 157238, "epoch": 1299} {"train_loss": -38.86173629760742, "global_step": 157239, "epoch": 1299} {"train_loss": -39.92160415649414, "global_step": 157240, "epoch": 1299} {"train_loss": -40.38727951049805, "global_step": 157241, "epoch": 1299} {"train_loss": -40.243656158447266, "global_step": 157242, "epoch": 1299} {"train_loss": -40.670372009277344, "global_step": 157243, "epoch": 1299} {"train_loss": -40.284183502197266, "global_step": 157244, "epoch": 1299} {"train_loss": -39.63680648803711, "global_step": 157245, "epoch": 1299} {"train_loss": -39.765872955322266, "global_step": 157246, "epoch": 1299} {"train_loss": -40.357765197753906, "global_step": 157247, "epoch": 1299} {"train_loss": -40.6832275390625, "global_step": 157248, "epoch": 1299} {"train_loss": -39.73192596435547, "global_step": 157249, "epoch": 1299} {"train_loss": -40.86619567871094, "global_step": 157250, "epoch": 1299} {"train_loss": -40.7462158203125, "global_step": 157251, "epoch": 1299} {"train_loss": -40.177635192871094, "global_step": 157252, "epoch": 1299} {"train_loss": -40.903289794921875, "global_step": 157253, "epoch": 1299} {"train_loss": -39.84291458129883, "global_step": 157254, "epoch": 1299} {"train_loss": -40.01022720336914, "global_step": 157255, "epoch": 1299} {"train_loss": -40.24575424194336, "global_step": 157256, "epoch": 1299} {"train_loss": -40.53126907348633, "global_step": 157257, "epoch": 1299} {"train_loss": -40.91728973388672, "global_step": 157258, "epoch": 1299} {"train_loss": -40.36616516113281, "global_step": 157259, "epoch": 1299} {"train_loss": -40.39595413208008, "global_step": 157260, "epoch": 1299} {"train_loss": -40.77693176269531, "global_step": 157261, "epoch": 1299} {"train_loss": -40.53902816772461, "global_step": 157262, "epoch": 1299} {"train_loss": -40.92060089111328, "global_step": 157263, "epoch": 1299} {"train_loss": -40.704750061035156, "global_step": 157264, "epoch": 1299} {"train_loss": -40.8402099609375, "global_step": 157265, "epoch": 1299} {"train_loss": -39.63505554199219, "global_step": 157266, "epoch": 1299} {"train_loss": -39.26624298095703, "global_step": 157267, "epoch": 1299} {"train_loss": -39.65842056274414, "global_step": 157268, "epoch": 1299} {"train_loss": -40.165687561035156, "global_step": 157269, "epoch": 1299} {"train_loss": -39.590362548828125, "global_step": 157270, "epoch": 1299} {"train_loss": -40.67009353637695, "global_step": 157271, "epoch": 1299} {"train_loss": -39.85671615600586, "global_step": 157272, "epoch": 1299} {"train_loss": -39.268001556396484, "global_step": 157273, "epoch": 1299} {"train_loss": -38.54265213012695, "global_step": 157274, "epoch": 1299} {"train_loss": -40.75725555419922, "global_step": 157275, "epoch": 1299} {"train_loss": -39.78539276123047, "global_step": 157276, "epoch": 1299} {"train_loss": -40.089908599853516, "global_step": 157277, "epoch": 1299} {"train_loss": -40.54452133178711, "global_step": 157278, "epoch": 1299} {"train_loss": -39.7614631652832, "global_step": 157279, "epoch": 1299} {"train_loss": -40.509090423583984, "global_step": 157280, "epoch": 1299} {"train_loss": -40.6019172668457, "global_step": 157281, "epoch": 1299} {"train_loss": -38.829933166503906, "global_step": 157282, "epoch": 1299} {"train_loss": -40.29600143432617, "global_step": 157283, "epoch": 1299} {"train_loss": -40.478271484375, "global_step": 157284, "epoch": 1299} {"train_loss": -40.883453369140625, "global_step": 157285, "epoch": 1299} {"train_loss": -40.01847457885742, "global_step": 157286, "epoch": 1299} {"train_loss": -39.13745880126953, "global_step": 157287, "epoch": 1299} {"train_loss": -40.986488342285156, "global_step": 157288, "epoch": 1299} {"train_loss": -40.690242767333984, "global_step": 157289, "epoch": 1299} {"train_loss": -40.73015594482422, "global_step": 157290, "epoch": 1299} {"train_loss": -39.57779312133789, "global_step": 157291, "epoch": 1299} {"train_loss": -40.277137756347656, "global_step": 157292, "epoch": 1299} {"train_loss": -40.30060958862305, "global_step": 157293, "epoch": 1299} {"train_loss": -39.88713455200195, "global_step": 157294, "epoch": 1299} {"train_loss": -40.5942497253418, "global_step": 157295, "epoch": 1299} {"train_loss": -41.189083099365234, "global_step": 157296, "epoch": 1299} {"train_loss": -40.47876739501953, "global_step": 157297, "epoch": 1299} {"train_loss": -41.40985870361328, "global_step": 157298, "epoch": 1299} {"train_loss": -39.956142866907044, "global_step": 157299, "epoch": 1299, "val_loss": 2534439.5} {"train_loss": -41.574745178222656, "global_step": 157300, "epoch": 1300} {"train_loss": -41.05934143066406, "global_step": 157301, "epoch": 1300} {"train_loss": -41.301055908203125, "global_step": 157302, "epoch": 1300} {"train_loss": -41.757625579833984, "global_step": 157303, "epoch": 1300} {"train_loss": -41.12105941772461, "global_step": 157304, "epoch": 1300} {"train_loss": -41.518428802490234, "global_step": 157305, "epoch": 1300} {"train_loss": -41.1048698425293, "global_step": 157306, "epoch": 1300} {"train_loss": -41.447898864746094, "global_step": 157307, "epoch": 1300} {"train_loss": -41.6607551574707, "global_step": 157308, "epoch": 1300} {"train_loss": -41.644500732421875, "global_step": 157309, "epoch": 1300} {"train_loss": -41.6665153503418, "global_step": 157310, "epoch": 1300} {"train_loss": -41.46064376831055, "global_step": 157311, "epoch": 1300} {"train_loss": -41.41349411010742, "global_step": 157312, "epoch": 1300} {"train_loss": -41.9095458984375, "global_step": 157313, "epoch": 1300} {"train_loss": -41.982975006103516, "global_step": 157314, "epoch": 1300} {"train_loss": -41.598793029785156, "global_step": 157315, "epoch": 1300} {"train_loss": -41.055816650390625, "global_step": 157316, "epoch": 1300} {"train_loss": -41.68870162963867, "global_step": 157317, "epoch": 1300} {"train_loss": -41.48566818237305, "global_step": 157318, "epoch": 1300} {"train_loss": -41.1081657409668, "global_step": 157319, "epoch": 1300} {"train_loss": -39.62620162963867, "global_step": 157320, "epoch": 1300} {"train_loss": -37.95870590209961, "global_step": 157321, "epoch": 1300} {"train_loss": -30.200733184814453, "global_step": 157322, "epoch": 1300} {"train_loss": -21.256088256835938, "global_step": 157323, "epoch": 1300} {"train_loss": -16.057621002197266, "global_step": 157324, "epoch": 1300} {"train_loss": -16.196521759033203, "global_step": 157325, "epoch": 1300} {"train_loss": -36.257904052734375, "global_step": 157326, "epoch": 1300} {"train_loss": -30.66204261779785, "global_step": 157327, "epoch": 1300} {"train_loss": -32.39664077758789, "global_step": 157328, "epoch": 1300} {"train_loss": -37.452003479003906, "global_step": 157329, "epoch": 1300} {"train_loss": -35.9705810546875, "global_step": 157330, "epoch": 1300} {"train_loss": -38.609397888183594, "global_step": 157331, "epoch": 1300} {"train_loss": -36.7459831237793, "global_step": 157332, "epoch": 1300} {"train_loss": -39.10134506225586, "global_step": 157333, "epoch": 1300} {"train_loss": -38.5014533996582, "global_step": 157334, "epoch": 1300} {"train_loss": -39.15910339355469, "global_step": 157335, "epoch": 1300} {"train_loss": -39.90349197387695, "global_step": 157336, "epoch": 1300} {"train_loss": -40.11714172363281, "global_step": 157337, "epoch": 1300} {"train_loss": -39.70905685424805, "global_step": 157338, "epoch": 1300} {"train_loss": -40.256893157958984, "global_step": 157339, "epoch": 1300} {"train_loss": -39.33447265625, "global_step": 157340, "epoch": 1300} {"train_loss": -39.82514190673828, "global_step": 157341, "epoch": 1300} {"train_loss": -39.36980438232422, "global_step": 157342, "epoch": 1300} {"train_loss": -40.476348876953125, "global_step": 157343, "epoch": 1300} {"train_loss": -39.95564651489258, "global_step": 157344, "epoch": 1300} {"train_loss": -40.2608757019043, "global_step": 157345, "epoch": 1300} {"train_loss": -40.73072052001953, "global_step": 157346, "epoch": 1300} {"train_loss": -40.19816589355469, "global_step": 157347, "epoch": 1300} {"train_loss": -40.4870719909668, "global_step": 157348, "epoch": 1300} {"train_loss": -39.13771438598633, "global_step": 157349, "epoch": 1300} {"train_loss": -40.43967819213867, "global_step": 157350, "epoch": 1300} {"train_loss": -40.67241287231445, "global_step": 157351, "epoch": 1300} {"train_loss": -40.2977409362793, "global_step": 157352, "epoch": 1300} {"train_loss": -40.52295684814453, "global_step": 157353, "epoch": 1300} {"train_loss": -40.309730529785156, "global_step": 157354, "epoch": 1300} {"train_loss": -40.69153594970703, "global_step": 157355, "epoch": 1300} {"train_loss": -40.21846389770508, "global_step": 157356, "epoch": 1300} {"train_loss": -40.06679916381836, "global_step": 157357, "epoch": 1300} {"train_loss": -39.759124755859375, "global_step": 157358, "epoch": 1300} {"train_loss": -40.31315231323242, "global_step": 157359, "epoch": 1300} {"train_loss": -39.21925735473633, "global_step": 157360, "epoch": 1300} {"train_loss": -40.76154327392578, "global_step": 157361, "epoch": 1300} {"train_loss": -39.78371810913086, "global_step": 157362, "epoch": 1300} {"train_loss": -40.3656005859375, "global_step": 157363, "epoch": 1300} {"train_loss": -39.790218353271484, "global_step": 157364, "epoch": 1300} {"train_loss": -41.1584358215332, "global_step": 157365, "epoch": 1300} {"train_loss": -40.81794357299805, "global_step": 157366, "epoch": 1300} {"train_loss": -40.5042724609375, "global_step": 157367, "epoch": 1300} {"train_loss": -40.981807708740234, "global_step": 157368, "epoch": 1300} {"train_loss": -41.15739822387695, "global_step": 157369, "epoch": 1300} {"train_loss": -41.14251708984375, "global_step": 157370, "epoch": 1300} {"train_loss": -40.257667541503906, "global_step": 157371, "epoch": 1300} {"train_loss": -40.82661819458008, "global_step": 157372, "epoch": 1300} {"train_loss": -40.66387939453125, "global_step": 157373, "epoch": 1300} {"train_loss": -40.93021774291992, "global_step": 157374, "epoch": 1300} {"train_loss": -41.156036376953125, "global_step": 157375, "epoch": 1300} {"train_loss": -40.98995590209961, "global_step": 157376, "epoch": 1300} {"train_loss": -41.015220642089844, "global_step": 157377, "epoch": 1300} {"train_loss": -41.08501052856445, "global_step": 157378, "epoch": 1300} {"train_loss": -41.13198471069336, "global_step": 157379, "epoch": 1300} {"train_loss": -40.70063400268555, "global_step": 157380, "epoch": 1300} {"train_loss": -41.10419464111328, "global_step": 157381, "epoch": 1300} {"train_loss": -41.5035285949707, "global_step": 157382, "epoch": 1300} {"train_loss": -41.382991790771484, "global_step": 157383, "epoch": 1300} {"train_loss": -41.047603607177734, "global_step": 157384, "epoch": 1300} {"train_loss": -41.733001708984375, "global_step": 157385, "epoch": 1300} {"train_loss": -41.17182540893555, "global_step": 157386, "epoch": 1300} {"train_loss": -40.66378402709961, "global_step": 157387, "epoch": 1300} {"train_loss": -41.14193344116211, "global_step": 157388, "epoch": 1300} {"train_loss": -41.015472412109375, "global_step": 157389, "epoch": 1300} {"train_loss": -41.53659439086914, "global_step": 157390, "epoch": 1300} {"train_loss": -41.574058532714844, "global_step": 157391, "epoch": 1300} {"train_loss": -40.861671447753906, "global_step": 157392, "epoch": 1300} {"train_loss": -41.17584228515625, "global_step": 157393, "epoch": 1300} {"train_loss": -37.38621520996094, "global_step": 157394, "epoch": 1300} {"train_loss": -40.39384841918945, "global_step": 157395, "epoch": 1300} {"train_loss": -38.30845260620117, "global_step": 157396, "epoch": 1300} {"train_loss": -39.22115707397461, "global_step": 157397, "epoch": 1300} {"train_loss": -40.21940994262695, "global_step": 157398, "epoch": 1300} {"train_loss": -40.48696517944336, "global_step": 157399, "epoch": 1300} {"train_loss": -38.77763366699219, "global_step": 157400, "epoch": 1300} {"train_loss": -37.80961608886719, "global_step": 157401, "epoch": 1300} {"train_loss": -39.635250091552734, "global_step": 157402, "epoch": 1300} {"train_loss": -37.893856048583984, "global_step": 157403, "epoch": 1300} {"train_loss": -38.223777770996094, "global_step": 157404, "epoch": 1300} {"train_loss": -39.01676559448242, "global_step": 157405, "epoch": 1300} {"train_loss": -38.901031494140625, "global_step": 157406, "epoch": 1300} {"train_loss": -37.5648078918457, "global_step": 157407, "epoch": 1300} {"train_loss": -39.442562103271484, "global_step": 157408, "epoch": 1300} {"train_loss": -39.86692428588867, "global_step": 157409, "epoch": 1300} {"train_loss": -38.52781677246094, "global_step": 157410, "epoch": 1300} {"train_loss": -38.765113830566406, "global_step": 157411, "epoch": 1300} {"train_loss": -40.28515625, "global_step": 157412, "epoch": 1300} {"train_loss": -39.66511917114258, "global_step": 157413, "epoch": 1300} {"train_loss": -39.53919982910156, "global_step": 157414, "epoch": 1300} {"train_loss": -39.396053314208984, "global_step": 157415, "epoch": 1300} {"train_loss": -38.53724670410156, "global_step": 157416, "epoch": 1300} {"train_loss": -38.53171920776367, "global_step": 157417, "epoch": 1300} {"train_loss": -39.237117767333984, "global_step": 157418, "epoch": 1300} {"train_loss": -39.615142822265625, "global_step": 157419, "epoch": 1300} {"train_loss": -39.36735646586773, "global_step": 157420, "epoch": 1300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2677305.25} {"train_loss": -41.00334548950195, "global_step": 157421, "epoch": 1301} {"train_loss": -39.6069221496582, "global_step": 157422, "epoch": 1301} {"train_loss": -40.30690383911133, "global_step": 157423, "epoch": 1301} {"train_loss": -39.086181640625, "global_step": 157424, "epoch": 1301} {"train_loss": -39.52581024169922, "global_step": 157425, "epoch": 1301} {"train_loss": -40.167842864990234, "global_step": 157426, "epoch": 1301} {"train_loss": -38.87764358520508, "global_step": 157427, "epoch": 1301} {"train_loss": -40.102718353271484, "global_step": 157428, "epoch": 1301} {"train_loss": -40.993770599365234, "global_step": 157429, "epoch": 1301} {"train_loss": -40.20283889770508, "global_step": 157430, "epoch": 1301} {"train_loss": -40.405303955078125, "global_step": 157431, "epoch": 1301} {"train_loss": -40.7480354309082, "global_step": 157432, "epoch": 1301} {"train_loss": -40.95161056518555, "global_step": 157433, "epoch": 1301} {"train_loss": -40.507015228271484, "global_step": 157434, "epoch": 1301} {"train_loss": -37.78290557861328, "global_step": 157435, "epoch": 1301} {"train_loss": -41.00957489013672, "global_step": 157436, "epoch": 1301} {"train_loss": -40.51543045043945, "global_step": 157437, "epoch": 1301} {"train_loss": -39.84169006347656, "global_step": 157438, "epoch": 1301} {"train_loss": -40.33794021606445, "global_step": 157439, "epoch": 1301} {"train_loss": -40.717201232910156, "global_step": 157440, "epoch": 1301} {"train_loss": -39.91463851928711, "global_step": 157441, "epoch": 1301} {"train_loss": -40.782291412353516, "global_step": 157442, "epoch": 1301} {"train_loss": -40.673583984375, "global_step": 157443, "epoch": 1301} {"train_loss": -40.9004020690918, "global_step": 157444, "epoch": 1301} {"train_loss": -40.49359893798828, "global_step": 157445, "epoch": 1301} {"train_loss": -40.718326568603516, "global_step": 157446, "epoch": 1301} {"train_loss": -40.481849670410156, "global_step": 157447, "epoch": 1301} {"train_loss": -41.342567443847656, "global_step": 157448, "epoch": 1301} {"train_loss": -39.99587631225586, "global_step": 157449, "epoch": 1301} {"train_loss": -40.065670013427734, "global_step": 157450, "epoch": 1301} {"train_loss": -39.68537521362305, "global_step": 157451, "epoch": 1301} {"train_loss": -39.744171142578125, "global_step": 157452, "epoch": 1301} {"train_loss": -40.6727294921875, "global_step": 157453, "epoch": 1301} {"train_loss": -41.376461029052734, "global_step": 157454, "epoch": 1301} {"train_loss": -39.98539733886719, "global_step": 157455, "epoch": 1301} {"train_loss": -39.7747917175293, "global_step": 157456, "epoch": 1301} {"train_loss": -41.54029846191406, "global_step": 157457, "epoch": 1301} {"train_loss": -39.58942794799805, "global_step": 157458, "epoch": 1301} {"train_loss": -40.296852111816406, "global_step": 157459, "epoch": 1301} {"train_loss": -41.324337005615234, "global_step": 157460, "epoch": 1301} {"train_loss": -41.623023986816406, "global_step": 157461, "epoch": 1301} {"train_loss": -40.88808822631836, "global_step": 157462, "epoch": 1301} {"train_loss": -41.17116165161133, "global_step": 157463, "epoch": 1301} {"train_loss": -40.88503646850586, "global_step": 157464, "epoch": 1301} {"train_loss": -41.05107498168945, "global_step": 157465, "epoch": 1301} {"train_loss": -41.21033477783203, "global_step": 157466, "epoch": 1301} {"train_loss": -40.59473419189453, "global_step": 157467, "epoch": 1301} {"train_loss": -40.1322135925293, "global_step": 157468, "epoch": 1301} {"train_loss": -41.14507293701172, "global_step": 157469, "epoch": 1301} {"train_loss": -40.714969635009766, "global_step": 157470, "epoch": 1301} {"train_loss": -41.05038070678711, "global_step": 157471, "epoch": 1301} {"train_loss": -40.74687576293945, "global_step": 157472, "epoch": 1301} {"train_loss": -39.676551818847656, "global_step": 157473, "epoch": 1301} {"train_loss": -40.87053298950195, "global_step": 157474, "epoch": 1301} {"train_loss": -40.227359771728516, "global_step": 157475, "epoch": 1301} {"train_loss": -41.213558197021484, "global_step": 157476, "epoch": 1301} {"train_loss": -39.34299087524414, "global_step": 157477, "epoch": 1301} {"train_loss": -39.906795501708984, "global_step": 157478, "epoch": 1301} {"train_loss": -40.01152038574219, "global_step": 157479, "epoch": 1301} {"train_loss": -40.643436431884766, "global_step": 157480, "epoch": 1301} {"train_loss": -38.949520111083984, "global_step": 157481, "epoch": 1301} {"train_loss": -39.90595626831055, "global_step": 157482, "epoch": 1301} {"train_loss": -39.77701950073242, "global_step": 157483, "epoch": 1301} {"train_loss": -40.309120178222656, "global_step": 157484, "epoch": 1301} {"train_loss": -39.38041305541992, "global_step": 157485, "epoch": 1301} {"train_loss": -40.32879638671875, "global_step": 157486, "epoch": 1301} {"train_loss": -39.92466354370117, "global_step": 157487, "epoch": 1301} {"train_loss": -40.41682815551758, "global_step": 157488, "epoch": 1301} {"train_loss": -39.70589828491211, "global_step": 157489, "epoch": 1301} {"train_loss": -39.6610107421875, "global_step": 157490, "epoch": 1301} {"train_loss": -40.46342849731445, "global_step": 157491, "epoch": 1301} {"train_loss": -39.01387023925781, "global_step": 157492, "epoch": 1301} {"train_loss": -40.33683395385742, "global_step": 157493, "epoch": 1301} {"train_loss": -39.91134262084961, "global_step": 157494, "epoch": 1301} {"train_loss": -40.670318603515625, "global_step": 157495, "epoch": 1301} {"train_loss": -39.61582565307617, "global_step": 157496, "epoch": 1301} {"train_loss": -39.80332946777344, "global_step": 157497, "epoch": 1301} {"train_loss": -37.636878967285156, "global_step": 157498, "epoch": 1301} {"train_loss": -40.64537811279297, "global_step": 157499, "epoch": 1301} {"train_loss": -39.409175872802734, "global_step": 157500, "epoch": 1301} {"train_loss": -39.52463912963867, "global_step": 157501, "epoch": 1301} {"train_loss": -33.47001266479492, "global_step": 157502, "epoch": 1301} {"train_loss": -39.41828918457031, "global_step": 157503, "epoch": 1301} {"train_loss": -40.42987060546875, "global_step": 157504, "epoch": 1301} {"train_loss": -38.28981018066406, "global_step": 157505, "epoch": 1301} {"train_loss": -36.505672454833984, "global_step": 157506, "epoch": 1301} {"train_loss": -28.71795654296875, "global_step": 157507, "epoch": 1301} {"train_loss": -40.327938079833984, "global_step": 157508, "epoch": 1301} {"train_loss": -37.902381896972656, "global_step": 157509, "epoch": 1301} {"train_loss": -36.70231246948242, "global_step": 157510, "epoch": 1301} {"train_loss": -35.16845703125, "global_step": 157511, "epoch": 1301} {"train_loss": -33.873565673828125, "global_step": 157512, "epoch": 1301} {"train_loss": -35.347774505615234, "global_step": 157513, "epoch": 1301} {"train_loss": -36.79677963256836, "global_step": 157514, "epoch": 1301} {"train_loss": -35.264892578125, "global_step": 157515, "epoch": 1301} {"train_loss": -18.53560447692871, "global_step": 157516, "epoch": 1301} {"train_loss": -29.448135375976562, "global_step": 157517, "epoch": 1301} {"train_loss": -38.313228607177734, "global_step": 157518, "epoch": 1301} {"train_loss": -33.317626953125, "global_step": 157519, "epoch": 1301} {"train_loss": -35.043251037597656, "global_step": 157520, "epoch": 1301} {"train_loss": -35.53153610229492, "global_step": 157521, "epoch": 1301} {"train_loss": -36.263668060302734, "global_step": 157522, "epoch": 1301} {"train_loss": -32.90031814575195, "global_step": 157523, "epoch": 1301} {"train_loss": -33.82290267944336, "global_step": 157524, "epoch": 1301} {"train_loss": -36.43654251098633, "global_step": 157525, "epoch": 1301} {"train_loss": -36.64230728149414, "global_step": 157526, "epoch": 1301} {"train_loss": -33.804908752441406, "global_step": 157527, "epoch": 1301} {"train_loss": -36.15317916870117, "global_step": 157528, "epoch": 1301} {"train_loss": -36.45382308959961, "global_step": 157529, "epoch": 1301} {"train_loss": -34.79389953613281, "global_step": 157530, "epoch": 1301} {"train_loss": -37.649375915527344, "global_step": 157531, "epoch": 1301} {"train_loss": -33.18803024291992, "global_step": 157532, "epoch": 1301} {"train_loss": -32.95644760131836, "global_step": 157533, "epoch": 1301} {"train_loss": -36.27141189575195, "global_step": 157534, "epoch": 1301} {"train_loss": -37.090980529785156, "global_step": 157535, "epoch": 1301} {"train_loss": -36.467750549316406, "global_step": 157536, "epoch": 1301} {"train_loss": -37.46187210083008, "global_step": 157537, "epoch": 1301} {"train_loss": -35.50774002075195, "global_step": 157538, "epoch": 1301} {"train_loss": -37.0097770690918, "global_step": 157539, "epoch": 1301} {"train_loss": -38.42799377441406, "global_step": 157540, "epoch": 1301} {"train_loss": -38.64499766767518, "global_step": 157541, "epoch": 1301, "val_loss": 2495267.0} {"train_loss": -34.862281799316406, "global_step": 157542, "epoch": 1302} {"train_loss": -38.110347747802734, "global_step": 157543, "epoch": 1302} {"train_loss": -38.11004638671875, "global_step": 157544, "epoch": 1302} {"train_loss": -36.92839431762695, "global_step": 157545, "epoch": 1302} {"train_loss": -38.18528366088867, "global_step": 157546, "epoch": 1302} {"train_loss": -37.42897033691406, "global_step": 157547, "epoch": 1302} {"train_loss": -38.01542282104492, "global_step": 157548, "epoch": 1302} {"train_loss": -37.48398208618164, "global_step": 157549, "epoch": 1302} {"train_loss": -38.257728576660156, "global_step": 157550, "epoch": 1302} {"train_loss": -38.468875885009766, "global_step": 157551, "epoch": 1302} {"train_loss": -38.79085922241211, "global_step": 157552, "epoch": 1302} {"train_loss": -38.157474517822266, "global_step": 157553, "epoch": 1302} {"train_loss": -37.91101837158203, "global_step": 157554, "epoch": 1302} {"train_loss": -38.69295883178711, "global_step": 157555, "epoch": 1302} {"train_loss": -39.18341064453125, "global_step": 157556, "epoch": 1302} {"train_loss": -39.21052169799805, "global_step": 157557, "epoch": 1302} {"train_loss": -38.975765228271484, "global_step": 157558, "epoch": 1302} {"train_loss": -39.39871597290039, "global_step": 157559, "epoch": 1302} {"train_loss": -39.29133987426758, "global_step": 157560, "epoch": 1302} {"train_loss": -38.9931526184082, "global_step": 157561, "epoch": 1302} {"train_loss": -38.6008415222168, "global_step": 157562, "epoch": 1302} {"train_loss": -39.25320053100586, "global_step": 157563, "epoch": 1302} {"train_loss": -39.296329498291016, "global_step": 157564, "epoch": 1302} {"train_loss": -39.0534553527832, "global_step": 157565, "epoch": 1302} {"train_loss": -39.00461196899414, "global_step": 157566, "epoch": 1302} {"train_loss": -39.751155853271484, "global_step": 157567, "epoch": 1302} {"train_loss": -39.05731964111328, "global_step": 157568, "epoch": 1302} {"train_loss": -39.06756591796875, "global_step": 157569, "epoch": 1302} {"train_loss": -39.15745162963867, "global_step": 157570, "epoch": 1302} {"train_loss": -38.67567825317383, "global_step": 157571, "epoch": 1302} {"train_loss": -39.56608200073242, "global_step": 157572, "epoch": 1302} {"train_loss": -39.650672912597656, "global_step": 157573, "epoch": 1302} {"train_loss": -39.746517181396484, "global_step": 157574, "epoch": 1302} {"train_loss": -39.57735061645508, "global_step": 157575, "epoch": 1302} {"train_loss": -38.99676513671875, "global_step": 157576, "epoch": 1302} {"train_loss": -40.34961700439453, "global_step": 157577, "epoch": 1302} {"train_loss": -39.57254409790039, "global_step": 157578, "epoch": 1302} {"train_loss": -39.57453155517578, "global_step": 157579, "epoch": 1302} {"train_loss": -39.858394622802734, "global_step": 157580, "epoch": 1302} {"train_loss": -39.70835876464844, "global_step": 157581, "epoch": 1302} {"train_loss": -39.46580505371094, "global_step": 157582, "epoch": 1302} {"train_loss": -39.976016998291016, "global_step": 157583, "epoch": 1302} {"train_loss": -40.19940185546875, "global_step": 157584, "epoch": 1302} {"train_loss": -40.14925003051758, "global_step": 157585, "epoch": 1302} {"train_loss": -39.95212936401367, "global_step": 157586, "epoch": 1302} {"train_loss": -40.0291748046875, "global_step": 157587, "epoch": 1302} {"train_loss": -40.28221130371094, "global_step": 157588, "epoch": 1302} {"train_loss": -39.822959899902344, "global_step": 157589, "epoch": 1302} {"train_loss": -39.32856750488281, "global_step": 157590, "epoch": 1302} {"train_loss": -40.219112396240234, "global_step": 157591, "epoch": 1302} {"train_loss": -40.6077880859375, "global_step": 157592, "epoch": 1302} {"train_loss": -40.18889236450195, "global_step": 157593, "epoch": 1302} {"train_loss": -40.21009063720703, "global_step": 157594, "epoch": 1302} {"train_loss": -40.46874237060547, "global_step": 157595, "epoch": 1302} {"train_loss": -39.13728713989258, "global_step": 157596, "epoch": 1302} {"train_loss": -40.510108947753906, "global_step": 157597, "epoch": 1302} {"train_loss": -39.4140739440918, "global_step": 157598, "epoch": 1302} {"train_loss": -40.10703659057617, "global_step": 157599, "epoch": 1302} {"train_loss": -39.98249435424805, "global_step": 157600, "epoch": 1302} {"train_loss": -40.79145812988281, "global_step": 157601, "epoch": 1302} {"train_loss": -40.19118881225586, "global_step": 157602, "epoch": 1302} {"train_loss": -40.31058883666992, "global_step": 157603, "epoch": 1302} {"train_loss": -40.332557678222656, "global_step": 157604, "epoch": 1302} {"train_loss": -40.4345817565918, "global_step": 157605, "epoch": 1302} {"train_loss": -40.31742477416992, "global_step": 157606, "epoch": 1302} {"train_loss": -40.40558624267578, "global_step": 157607, "epoch": 1302} {"train_loss": -40.19508361816406, "global_step": 157608, "epoch": 1302} {"train_loss": -40.499019622802734, "global_step": 157609, "epoch": 1302} {"train_loss": -40.42391586303711, "global_step": 157610, "epoch": 1302} {"train_loss": -39.9387092590332, "global_step": 157611, "epoch": 1302} {"train_loss": -40.57383728027344, "global_step": 157612, "epoch": 1302} {"train_loss": -40.43109130859375, "global_step": 157613, "epoch": 1302} {"train_loss": -40.80947494506836, "global_step": 157614, "epoch": 1302} {"train_loss": -40.34476852416992, "global_step": 157615, "epoch": 1302} {"train_loss": -40.8447380065918, "global_step": 157616, "epoch": 1302} {"train_loss": -40.57065963745117, "global_step": 157617, "epoch": 1302} {"train_loss": -40.34185791015625, "global_step": 157618, "epoch": 1302} {"train_loss": -41.11488723754883, "global_step": 157619, "epoch": 1302} {"train_loss": -40.113468170166016, "global_step": 157620, "epoch": 1302} {"train_loss": -40.33408737182617, "global_step": 157621, "epoch": 1302} {"train_loss": -40.89484405517578, "global_step": 157622, "epoch": 1302} {"train_loss": -40.212154388427734, "global_step": 157623, "epoch": 1302} {"train_loss": -40.89352798461914, "global_step": 157624, "epoch": 1302} {"train_loss": -40.758941650390625, "global_step": 157625, "epoch": 1302} {"train_loss": -40.623291015625, "global_step": 157626, "epoch": 1302} {"train_loss": -40.518104553222656, "global_step": 157627, "epoch": 1302} {"train_loss": -40.82882308959961, "global_step": 157628, "epoch": 1302} {"train_loss": -40.94329833984375, "global_step": 157629, "epoch": 1302} {"train_loss": -40.79564666748047, "global_step": 157630, "epoch": 1302} {"train_loss": -40.404571533203125, "global_step": 157631, "epoch": 1302} {"train_loss": -40.98318099975586, "global_step": 157632, "epoch": 1302} {"train_loss": -40.64405059814453, "global_step": 157633, "epoch": 1302} {"train_loss": -40.01565170288086, "global_step": 157634, "epoch": 1302} {"train_loss": -40.84560775756836, "global_step": 157635, "epoch": 1302} {"train_loss": -40.6317024230957, "global_step": 157636, "epoch": 1302} {"train_loss": -41.194435119628906, "global_step": 157637, "epoch": 1302} {"train_loss": -40.29921340942383, "global_step": 157638, "epoch": 1302} {"train_loss": -40.27912521362305, "global_step": 157639, "epoch": 1302} {"train_loss": -40.45602798461914, "global_step": 157640, "epoch": 1302} {"train_loss": -39.95100021362305, "global_step": 157641, "epoch": 1302} {"train_loss": -37.484153747558594, "global_step": 157642, "epoch": 1302} {"train_loss": -32.87424850463867, "global_step": 157643, "epoch": 1302} {"train_loss": -32.9729118347168, "global_step": 157644, "epoch": 1302} {"train_loss": -37.756752014160156, "global_step": 157645, "epoch": 1302} {"train_loss": -40.387386322021484, "global_step": 157646, "epoch": 1302} {"train_loss": -40.52305221557617, "global_step": 157647, "epoch": 1302} {"train_loss": -39.586605072021484, "global_step": 157648, "epoch": 1302} {"train_loss": -40.4744987487793, "global_step": 157649, "epoch": 1302} {"train_loss": -40.63603591918945, "global_step": 157650, "epoch": 1302} {"train_loss": -38.966373443603516, "global_step": 157651, "epoch": 1302} {"train_loss": -36.798702239990234, "global_step": 157652, "epoch": 1302} {"train_loss": -39.00034713745117, "global_step": 157653, "epoch": 1302} {"train_loss": -39.269344329833984, "global_step": 157654, "epoch": 1302} {"train_loss": -37.66411209106445, "global_step": 157655, "epoch": 1302} {"train_loss": -38.1359977722168, "global_step": 157656, "epoch": 1302} {"train_loss": -39.283050537109375, "global_step": 157657, "epoch": 1302} {"train_loss": -38.419639587402344, "global_step": 157658, "epoch": 1302} {"train_loss": -39.13287353515625, "global_step": 157659, "epoch": 1302} {"train_loss": -38.32853317260742, "global_step": 157660, "epoch": 1302} {"train_loss": -39.838314056396484, "global_step": 157661, "epoch": 1302} {"train_loss": -39.505825673253085, "global_step": 157662, "epoch": 1302, "val_loss": 2542256.75} {"train_loss": -37.33553695678711, "global_step": 157663, "epoch": 1303} {"train_loss": -39.3785400390625, "global_step": 157664, "epoch": 1303} {"train_loss": -38.948707580566406, "global_step": 157665, "epoch": 1303} {"train_loss": -37.59530258178711, "global_step": 157666, "epoch": 1303} {"train_loss": -37.973487854003906, "global_step": 157667, "epoch": 1303} {"train_loss": -38.96509552001953, "global_step": 157668, "epoch": 1303} {"train_loss": -38.74470138549805, "global_step": 157669, "epoch": 1303} {"train_loss": -40.17547607421875, "global_step": 157670, "epoch": 1303} {"train_loss": -39.55202865600586, "global_step": 157671, "epoch": 1303} {"train_loss": -40.2327995300293, "global_step": 157672, "epoch": 1303} {"train_loss": -39.64697265625, "global_step": 157673, "epoch": 1303} {"train_loss": -39.890167236328125, "global_step": 157674, "epoch": 1303} {"train_loss": -40.17887496948242, "global_step": 157675, "epoch": 1303} {"train_loss": -39.92087173461914, "global_step": 157676, "epoch": 1303} {"train_loss": -40.02324295043945, "global_step": 157677, "epoch": 1303} {"train_loss": -39.956878662109375, "global_step": 157678, "epoch": 1303} {"train_loss": -40.99575424194336, "global_step": 157679, "epoch": 1303} {"train_loss": -39.89645004272461, "global_step": 157680, "epoch": 1303} {"train_loss": -40.690582275390625, "global_step": 157681, "epoch": 1303} {"train_loss": -40.59666061401367, "global_step": 157682, "epoch": 1303} {"train_loss": -40.09886169433594, "global_step": 157683, "epoch": 1303} {"train_loss": -40.83063507080078, "global_step": 157684, "epoch": 1303} {"train_loss": -40.191158294677734, "global_step": 157685, "epoch": 1303} {"train_loss": -41.101417541503906, "global_step": 157686, "epoch": 1303} {"train_loss": -40.143123626708984, "global_step": 157687, "epoch": 1303} {"train_loss": -40.69614791870117, "global_step": 157688, "epoch": 1303} {"train_loss": -40.95054244995117, "global_step": 157689, "epoch": 1303} {"train_loss": -40.109230041503906, "global_step": 157690, "epoch": 1303} {"train_loss": -41.092281341552734, "global_step": 157691, "epoch": 1303} {"train_loss": -40.464962005615234, "global_step": 157692, "epoch": 1303} {"train_loss": -40.261959075927734, "global_step": 157693, "epoch": 1303} {"train_loss": -40.685733795166016, "global_step": 157694, "epoch": 1303} {"train_loss": -40.117549896240234, "global_step": 157695, "epoch": 1303} {"train_loss": -40.474063873291016, "global_step": 157696, "epoch": 1303} {"train_loss": -40.905941009521484, "global_step": 157697, "epoch": 1303} {"train_loss": -40.50688934326172, "global_step": 157698, "epoch": 1303} {"train_loss": -40.28361129760742, "global_step": 157699, "epoch": 1303} {"train_loss": -40.899986267089844, "global_step": 157700, "epoch": 1303} {"train_loss": -40.250816345214844, "global_step": 157701, "epoch": 1303} {"train_loss": -40.29904556274414, "global_step": 157702, "epoch": 1303} {"train_loss": -41.16666793823242, "global_step": 157703, "epoch": 1303} {"train_loss": -40.51506805419922, "global_step": 157704, "epoch": 1303} {"train_loss": -40.9145622253418, "global_step": 157705, "epoch": 1303} {"train_loss": -40.6897087097168, "global_step": 157706, "epoch": 1303} {"train_loss": -41.01317596435547, "global_step": 157707, "epoch": 1303} {"train_loss": -41.0346565246582, "global_step": 157708, "epoch": 1303} {"train_loss": -40.53084182739258, "global_step": 157709, "epoch": 1303} {"train_loss": -39.55472946166992, "global_step": 157710, "epoch": 1303} {"train_loss": -40.73798370361328, "global_step": 157711, "epoch": 1303} {"train_loss": -41.24916458129883, "global_step": 157712, "epoch": 1303} {"train_loss": -41.00618362426758, "global_step": 157713, "epoch": 1303} {"train_loss": -41.025203704833984, "global_step": 157714, "epoch": 1303} {"train_loss": -41.211124420166016, "global_step": 157715, "epoch": 1303} {"train_loss": -40.7808837890625, "global_step": 157716, "epoch": 1303} {"train_loss": -40.24729537963867, "global_step": 157717, "epoch": 1303} {"train_loss": -41.04429244995117, "global_step": 157718, "epoch": 1303} {"train_loss": -41.19955825805664, "global_step": 157719, "epoch": 1303} {"train_loss": -39.15713119506836, "global_step": 157720, "epoch": 1303} {"train_loss": -40.55807113647461, "global_step": 157721, "epoch": 1303} {"train_loss": -40.39019775390625, "global_step": 157722, "epoch": 1303} {"train_loss": -39.45040512084961, "global_step": 157723, "epoch": 1303} {"train_loss": -40.5782470703125, "global_step": 157724, "epoch": 1303} {"train_loss": -40.28740692138672, "global_step": 157725, "epoch": 1303} {"train_loss": -40.330535888671875, "global_step": 157726, "epoch": 1303} {"train_loss": -41.23225021362305, "global_step": 157727, "epoch": 1303} {"train_loss": -40.08457565307617, "global_step": 157728, "epoch": 1303} {"train_loss": -40.33460235595703, "global_step": 157729, "epoch": 1303} {"train_loss": -39.26120376586914, "global_step": 157730, "epoch": 1303} {"train_loss": -36.53521728515625, "global_step": 157731, "epoch": 1303} {"train_loss": -39.93938064575195, "global_step": 157732, "epoch": 1303} {"train_loss": -40.61689376831055, "global_step": 157733, "epoch": 1303} {"train_loss": -40.26267623901367, "global_step": 157734, "epoch": 1303} {"train_loss": -38.03998947143555, "global_step": 157735, "epoch": 1303} {"train_loss": -38.358760833740234, "global_step": 157736, "epoch": 1303} {"train_loss": -39.21232986450195, "global_step": 157737, "epoch": 1303} {"train_loss": -39.45871353149414, "global_step": 157738, "epoch": 1303} {"train_loss": -39.818965911865234, "global_step": 157739, "epoch": 1303} {"train_loss": -40.2140007019043, "global_step": 157740, "epoch": 1303} {"train_loss": -39.02005386352539, "global_step": 157741, "epoch": 1303} {"train_loss": -40.152915954589844, "global_step": 157742, "epoch": 1303} {"train_loss": -40.91366195678711, "global_step": 157743, "epoch": 1303} {"train_loss": -39.20733642578125, "global_step": 157744, "epoch": 1303} {"train_loss": -39.604278564453125, "global_step": 157745, "epoch": 1303} {"train_loss": -40.88167190551758, "global_step": 157746, "epoch": 1303} {"train_loss": -37.0255241394043, "global_step": 157747, "epoch": 1303} {"train_loss": -40.206207275390625, "global_step": 157748, "epoch": 1303} {"train_loss": -36.94329833984375, "global_step": 157749, "epoch": 1303} {"train_loss": -39.79548645019531, "global_step": 157750, "epoch": 1303} {"train_loss": -39.68647766113281, "global_step": 157751, "epoch": 1303} {"train_loss": -41.20280075073242, "global_step": 157752, "epoch": 1303} {"train_loss": -39.762794494628906, "global_step": 157753, "epoch": 1303} {"train_loss": -38.88169479370117, "global_step": 157754, "epoch": 1303} {"train_loss": -38.64936447143555, "global_step": 157755, "epoch": 1303} {"train_loss": -39.5777702331543, "global_step": 157756, "epoch": 1303} {"train_loss": -40.7379150390625, "global_step": 157757, "epoch": 1303} {"train_loss": -40.024234771728516, "global_step": 157758, "epoch": 1303} {"train_loss": -40.298248291015625, "global_step": 157759, "epoch": 1303} {"train_loss": -37.021331787109375, "global_step": 157760, "epoch": 1303} {"train_loss": -32.83123779296875, "global_step": 157761, "epoch": 1303} {"train_loss": -38.71908187866211, "global_step": 157762, "epoch": 1303} {"train_loss": -40.39866256713867, "global_step": 157763, "epoch": 1303} {"train_loss": -40.221534729003906, "global_step": 157764, "epoch": 1303} {"train_loss": -37.09245300292969, "global_step": 157765, "epoch": 1303} {"train_loss": -39.57526779174805, "global_step": 157766, "epoch": 1303} {"train_loss": -39.37480926513672, "global_step": 157767, "epoch": 1303} {"train_loss": -40.188289642333984, "global_step": 157768, "epoch": 1303} {"train_loss": -39.321746826171875, "global_step": 157769, "epoch": 1303} {"train_loss": -40.53208923339844, "global_step": 157770, "epoch": 1303} {"train_loss": -38.40744400024414, "global_step": 157771, "epoch": 1303} {"train_loss": -39.18952178955078, "global_step": 157772, "epoch": 1303} {"train_loss": -40.2750358581543, "global_step": 157773, "epoch": 1303} {"train_loss": -40.569393157958984, "global_step": 157774, "epoch": 1303} {"train_loss": -39.84689712524414, "global_step": 157775, "epoch": 1303} {"train_loss": -39.027095794677734, "global_step": 157776, "epoch": 1303} {"train_loss": -39.16521072387695, "global_step": 157777, "epoch": 1303} {"train_loss": -40.52743148803711, "global_step": 157778, "epoch": 1303} {"train_loss": -40.2421875, "global_step": 157779, "epoch": 1303} {"train_loss": -39.639766693115234, "global_step": 157780, "epoch": 1303} {"train_loss": -40.64225387573242, "global_step": 157781, "epoch": 1303} {"train_loss": -40.98728942871094, "global_step": 157782, "epoch": 1303} {"train_loss": -39.87905543303687, "global_step": 157783, "epoch": 1303, "val_loss": 2465728.0} {"train_loss": -39.27370834350586, "global_step": 157784, "epoch": 1304} {"train_loss": -40.7952880859375, "global_step": 157785, "epoch": 1304} {"train_loss": -39.2199592590332, "global_step": 157786, "epoch": 1304} {"train_loss": -39.815589904785156, "global_step": 157787, "epoch": 1304} {"train_loss": -39.77802276611328, "global_step": 157788, "epoch": 1304} {"train_loss": -40.00957489013672, "global_step": 157789, "epoch": 1304} {"train_loss": -40.1712646484375, "global_step": 157790, "epoch": 1304} {"train_loss": -38.272518157958984, "global_step": 157791, "epoch": 1304} {"train_loss": -39.83950424194336, "global_step": 157792, "epoch": 1304} {"train_loss": -40.64223861694336, "global_step": 157793, "epoch": 1304} {"train_loss": -40.569366455078125, "global_step": 157794, "epoch": 1304} {"train_loss": -40.76413345336914, "global_step": 157795, "epoch": 1304} {"train_loss": -39.631771087646484, "global_step": 157796, "epoch": 1304} {"train_loss": -40.66921615600586, "global_step": 157797, "epoch": 1304} {"train_loss": -38.77348327636719, "global_step": 157798, "epoch": 1304} {"train_loss": -39.214012145996094, "global_step": 157799, "epoch": 1304} {"train_loss": -39.17142868041992, "global_step": 157800, "epoch": 1304} {"train_loss": -38.93146514892578, "global_step": 157801, "epoch": 1304} {"train_loss": -38.74653244018555, "global_step": 157802, "epoch": 1304} {"train_loss": -39.33231735229492, "global_step": 157803, "epoch": 1304} {"train_loss": -34.375667572021484, "global_step": 157804, "epoch": 1304} {"train_loss": -39.41326141357422, "global_step": 157805, "epoch": 1304} {"train_loss": -38.04623794555664, "global_step": 157806, "epoch": 1304} {"train_loss": -38.86799240112305, "global_step": 157807, "epoch": 1304} {"train_loss": -38.353050231933594, "global_step": 157808, "epoch": 1304} {"train_loss": -39.56498336791992, "global_step": 157809, "epoch": 1304} {"train_loss": -39.51998519897461, "global_step": 157810, "epoch": 1304} {"train_loss": -38.660926818847656, "global_step": 157811, "epoch": 1304} {"train_loss": -39.489620208740234, "global_step": 157812, "epoch": 1304} {"train_loss": -40.14498519897461, "global_step": 157813, "epoch": 1304} {"train_loss": -36.0184211730957, "global_step": 157814, "epoch": 1304} {"train_loss": -39.39447021484375, "global_step": 157815, "epoch": 1304} {"train_loss": -37.86751174926758, "global_step": 157816, "epoch": 1304} {"train_loss": -36.928749084472656, "global_step": 157817, "epoch": 1304} {"train_loss": -36.62714767456055, "global_step": 157818, "epoch": 1304} {"train_loss": -35.1107063293457, "global_step": 157819, "epoch": 1304} {"train_loss": -36.720455169677734, "global_step": 157820, "epoch": 1304} {"train_loss": -36.69940185546875, "global_step": 157821, "epoch": 1304} {"train_loss": -33.1260871887207, "global_step": 157822, "epoch": 1304} {"train_loss": -34.214019775390625, "global_step": 157823, "epoch": 1304} {"train_loss": -33.49691390991211, "global_step": 157824, "epoch": 1304} {"train_loss": -38.98542404174805, "global_step": 157825, "epoch": 1304} {"train_loss": -34.608829498291016, "global_step": 157826, "epoch": 1304} {"train_loss": -36.2816047668457, "global_step": 157827, "epoch": 1304} {"train_loss": -37.55166244506836, "global_step": 157828, "epoch": 1304} {"train_loss": -33.67137145996094, "global_step": 157829, "epoch": 1304} {"train_loss": -37.642513275146484, "global_step": 157830, "epoch": 1304} {"train_loss": -37.61991500854492, "global_step": 157831, "epoch": 1304} {"train_loss": -38.28086471557617, "global_step": 157832, "epoch": 1304} {"train_loss": -38.41109848022461, "global_step": 157833, "epoch": 1304} {"train_loss": -38.11532974243164, "global_step": 157834, "epoch": 1304} {"train_loss": -38.552181243896484, "global_step": 157835, "epoch": 1304} {"train_loss": -37.712581634521484, "global_step": 157836, "epoch": 1304} {"train_loss": -38.08089065551758, "global_step": 157837, "epoch": 1304} {"train_loss": -37.388771057128906, "global_step": 157838, "epoch": 1304} {"train_loss": -37.88883972167969, "global_step": 157839, "epoch": 1304} {"train_loss": -36.89944076538086, "global_step": 157840, "epoch": 1304} {"train_loss": -37.42158126831055, "global_step": 157841, "epoch": 1304} {"train_loss": -37.21439743041992, "global_step": 157842, "epoch": 1304} {"train_loss": -38.303897857666016, "global_step": 157843, "epoch": 1304} {"train_loss": -37.804683685302734, "global_step": 157844, "epoch": 1304} {"train_loss": -37.671443939208984, "global_step": 157845, "epoch": 1304} {"train_loss": -39.29361343383789, "global_step": 157846, "epoch": 1304} {"train_loss": -39.15909957885742, "global_step": 157847, "epoch": 1304} {"train_loss": -38.47419357299805, "global_step": 157848, "epoch": 1304} {"train_loss": -39.479000091552734, "global_step": 157849, "epoch": 1304} {"train_loss": -38.6377067565918, "global_step": 157850, "epoch": 1304} {"train_loss": -38.59307861328125, "global_step": 157851, "epoch": 1304} {"train_loss": -38.690704345703125, "global_step": 157852, "epoch": 1304} {"train_loss": -39.850101470947266, "global_step": 157853, "epoch": 1304} {"train_loss": -36.97432327270508, "global_step": 157854, "epoch": 1304} {"train_loss": -39.20743942260742, "global_step": 157855, "epoch": 1304} {"train_loss": -39.53116989135742, "global_step": 157856, "epoch": 1304} {"train_loss": -38.59467315673828, "global_step": 157857, "epoch": 1304} {"train_loss": -39.10385513305664, "global_step": 157858, "epoch": 1304} {"train_loss": -39.78825759887695, "global_step": 157859, "epoch": 1304} {"train_loss": -38.24953842163086, "global_step": 157860, "epoch": 1304} {"train_loss": -38.61005401611328, "global_step": 157861, "epoch": 1304} {"train_loss": -40.20859909057617, "global_step": 157862, "epoch": 1304} {"train_loss": -39.48167037963867, "global_step": 157863, "epoch": 1304} {"train_loss": -38.48329544067383, "global_step": 157864, "epoch": 1304} {"train_loss": -39.388423919677734, "global_step": 157865, "epoch": 1304} {"train_loss": -39.5705680847168, "global_step": 157866, "epoch": 1304} {"train_loss": -38.158016204833984, "global_step": 157867, "epoch": 1304} {"train_loss": -40.092201232910156, "global_step": 157868, "epoch": 1304} {"train_loss": -40.28806686401367, "global_step": 157869, "epoch": 1304} {"train_loss": -40.17367172241211, "global_step": 157870, "epoch": 1304} {"train_loss": -39.27999496459961, "global_step": 157871, "epoch": 1304} {"train_loss": -40.31732940673828, "global_step": 157872, "epoch": 1304} {"train_loss": -39.304359436035156, "global_step": 157873, "epoch": 1304} {"train_loss": -39.77574920654297, "global_step": 157874, "epoch": 1304} {"train_loss": -40.692535400390625, "global_step": 157875, "epoch": 1304} {"train_loss": -38.359291076660156, "global_step": 157876, "epoch": 1304} {"train_loss": -39.926979064941406, "global_step": 157877, "epoch": 1304} {"train_loss": -40.467899322509766, "global_step": 157878, "epoch": 1304} {"train_loss": -39.62619400024414, "global_step": 157879, "epoch": 1304} {"train_loss": -40.22341537475586, "global_step": 157880, "epoch": 1304} {"train_loss": -40.42424011230469, "global_step": 157881, "epoch": 1304} {"train_loss": -40.0587043762207, "global_step": 157882, "epoch": 1304} {"train_loss": -39.97220993041992, "global_step": 157883, "epoch": 1304} {"train_loss": -40.87925720214844, "global_step": 157884, "epoch": 1304} {"train_loss": -40.13265609741211, "global_step": 157885, "epoch": 1304} {"train_loss": -36.96925735473633, "global_step": 157886, "epoch": 1304} {"train_loss": -40.41128158569336, "global_step": 157887, "epoch": 1304} {"train_loss": -40.27534866333008, "global_step": 157888, "epoch": 1304} {"train_loss": -40.061458587646484, "global_step": 157889, "epoch": 1304} {"train_loss": -40.530757904052734, "global_step": 157890, "epoch": 1304} {"train_loss": -40.92802810668945, "global_step": 157891, "epoch": 1304} {"train_loss": -39.47357177734375, "global_step": 157892, "epoch": 1304} {"train_loss": -38.992584228515625, "global_step": 157893, "epoch": 1304} {"train_loss": -40.581851959228516, "global_step": 157894, "epoch": 1304} {"train_loss": -40.3804817199707, "global_step": 157895, "epoch": 1304} {"train_loss": -38.97209548950195, "global_step": 157896, "epoch": 1304} {"train_loss": -39.80936050415039, "global_step": 157897, "epoch": 1304} {"train_loss": -39.448604583740234, "global_step": 157898, "epoch": 1304} {"train_loss": -39.66526412963867, "global_step": 157899, "epoch": 1304} {"train_loss": -40.670719146728516, "global_step": 157900, "epoch": 1304} {"train_loss": -40.17916488647461, "global_step": 157901, "epoch": 1304} {"train_loss": -40.1142692565918, "global_step": 157902, "epoch": 1304} {"train_loss": -40.392879486083984, "global_step": 157903, "epoch": 1304} {"train_loss": -38.830590082594185, "global_step": 157904, "epoch": 1304, "val_loss": 2568039.75} {"train_loss": -38.983619689941406, "global_step": 157905, "epoch": 1305} {"train_loss": -37.93584060668945, "global_step": 157906, "epoch": 1305} {"train_loss": -37.56854248046875, "global_step": 157907, "epoch": 1305} {"train_loss": -40.375423431396484, "global_step": 157908, "epoch": 1305} {"train_loss": -40.31061935424805, "global_step": 157909, "epoch": 1305} {"train_loss": -37.813594818115234, "global_step": 157910, "epoch": 1305} {"train_loss": -39.60489273071289, "global_step": 157911, "epoch": 1305} {"train_loss": -40.52574920654297, "global_step": 157912, "epoch": 1305} {"train_loss": -40.06217575073242, "global_step": 157913, "epoch": 1305} {"train_loss": -40.02711868286133, "global_step": 157914, "epoch": 1305} {"train_loss": -40.79150390625, "global_step": 157915, "epoch": 1305} {"train_loss": -39.40436553955078, "global_step": 157916, "epoch": 1305} {"train_loss": -39.88123321533203, "global_step": 157917, "epoch": 1305} {"train_loss": -40.06960678100586, "global_step": 157918, "epoch": 1305} {"train_loss": -39.73183822631836, "global_step": 157919, "epoch": 1305} {"train_loss": -38.63031768798828, "global_step": 157920, "epoch": 1305} {"train_loss": -39.00310134887695, "global_step": 157921, "epoch": 1305} {"train_loss": -40.60659408569336, "global_step": 157922, "epoch": 1305} {"train_loss": -40.40800094604492, "global_step": 157923, "epoch": 1305} {"train_loss": -40.87861251831055, "global_step": 157924, "epoch": 1305} {"train_loss": -40.16453170776367, "global_step": 157925, "epoch": 1305} {"train_loss": -38.7690544128418, "global_step": 157926, "epoch": 1305} {"train_loss": -39.92695236206055, "global_step": 157927, "epoch": 1305} {"train_loss": -41.15373611450195, "global_step": 157928, "epoch": 1305} {"train_loss": -39.85642623901367, "global_step": 157929, "epoch": 1305} {"train_loss": -40.384334564208984, "global_step": 157930, "epoch": 1305} {"train_loss": -41.35946273803711, "global_step": 157931, "epoch": 1305} {"train_loss": -40.574337005615234, "global_step": 157932, "epoch": 1305} {"train_loss": -40.054744720458984, "global_step": 157933, "epoch": 1305} {"train_loss": -40.3285026550293, "global_step": 157934, "epoch": 1305} {"train_loss": -40.93361282348633, "global_step": 157935, "epoch": 1305} {"train_loss": -40.76538848876953, "global_step": 157936, "epoch": 1305} {"train_loss": -40.18748474121094, "global_step": 157937, "epoch": 1305} {"train_loss": -39.891357421875, "global_step": 157938, "epoch": 1305} {"train_loss": -41.00428009033203, "global_step": 157939, "epoch": 1305} {"train_loss": -41.3572883605957, "global_step": 157940, "epoch": 1305} {"train_loss": -40.576507568359375, "global_step": 157941, "epoch": 1305} {"train_loss": -41.020233154296875, "global_step": 157942, "epoch": 1305} {"train_loss": -40.433773040771484, "global_step": 157943, "epoch": 1305} {"train_loss": -41.063087463378906, "global_step": 157944, "epoch": 1305} {"train_loss": -41.09406661987305, "global_step": 157945, "epoch": 1305} {"train_loss": -40.8802604675293, "global_step": 157946, "epoch": 1305} {"train_loss": -40.98543167114258, "global_step": 157947, "epoch": 1305} {"train_loss": -41.30213928222656, "global_step": 157948, "epoch": 1305} {"train_loss": -39.611366271972656, "global_step": 157949, "epoch": 1305} {"train_loss": -40.16013717651367, "global_step": 157950, "epoch": 1305} {"train_loss": -40.2339973449707, "global_step": 157951, "epoch": 1305} {"train_loss": -40.5280876159668, "global_step": 157952, "epoch": 1305} {"train_loss": -41.02409362792969, "global_step": 157953, "epoch": 1305} {"train_loss": -41.50211715698242, "global_step": 157954, "epoch": 1305} {"train_loss": -41.092159271240234, "global_step": 157955, "epoch": 1305} {"train_loss": -40.89285659790039, "global_step": 157956, "epoch": 1305} {"train_loss": -40.820037841796875, "global_step": 157957, "epoch": 1305} {"train_loss": -41.51205062866211, "global_step": 157958, "epoch": 1305} {"train_loss": -41.36212921142578, "global_step": 157959, "epoch": 1305} {"train_loss": -41.37550354003906, "global_step": 157960, "epoch": 1305} {"train_loss": -41.32607650756836, "global_step": 157961, "epoch": 1305} {"train_loss": -41.07155990600586, "global_step": 157962, "epoch": 1305} {"train_loss": -41.77297592163086, "global_step": 157963, "epoch": 1305} {"train_loss": -41.280975341796875, "global_step": 157964, "epoch": 1305} {"train_loss": -41.4614372253418, "global_step": 157965, "epoch": 1305} {"train_loss": -41.22894287109375, "global_step": 157966, "epoch": 1305} {"train_loss": -41.37847900390625, "global_step": 157967, "epoch": 1305} {"train_loss": -41.180320739746094, "global_step": 157968, "epoch": 1305} {"train_loss": -40.693275451660156, "global_step": 157969, "epoch": 1305} {"train_loss": -39.858001708984375, "global_step": 157970, "epoch": 1305} {"train_loss": -40.066341400146484, "global_step": 157971, "epoch": 1305} {"train_loss": -37.24953079223633, "global_step": 157972, "epoch": 1305} {"train_loss": -36.391544342041016, "global_step": 157973, "epoch": 1305} {"train_loss": -38.87662124633789, "global_step": 157974, "epoch": 1305} {"train_loss": -37.6644287109375, "global_step": 157975, "epoch": 1305} {"train_loss": -40.00487518310547, "global_step": 157976, "epoch": 1305} {"train_loss": -39.27262496948242, "global_step": 157977, "epoch": 1305} {"train_loss": -36.75983810424805, "global_step": 157978, "epoch": 1305} {"train_loss": -38.90228271484375, "global_step": 157979, "epoch": 1305} {"train_loss": -39.15696334838867, "global_step": 157980, "epoch": 1305} {"train_loss": -40.0448112487793, "global_step": 157981, "epoch": 1305} {"train_loss": -38.903934478759766, "global_step": 157982, "epoch": 1305} {"train_loss": -38.41595458984375, "global_step": 157983, "epoch": 1305} {"train_loss": -40.0640754699707, "global_step": 157984, "epoch": 1305} {"train_loss": -38.73381423950195, "global_step": 157985, "epoch": 1305} {"train_loss": -38.54045486450195, "global_step": 157986, "epoch": 1305} {"train_loss": -40.381465911865234, "global_step": 157987, "epoch": 1305} {"train_loss": -34.253456115722656, "global_step": 157988, "epoch": 1305} {"train_loss": -39.806297302246094, "global_step": 157989, "epoch": 1305} {"train_loss": -39.509002685546875, "global_step": 157990, "epoch": 1305} {"train_loss": -38.29502487182617, "global_step": 157991, "epoch": 1305} {"train_loss": -40.001808166503906, "global_step": 157992, "epoch": 1305} {"train_loss": -37.72594451904297, "global_step": 157993, "epoch": 1305} {"train_loss": -33.023162841796875, "global_step": 157994, "epoch": 1305} {"train_loss": -38.41279220581055, "global_step": 157995, "epoch": 1305} {"train_loss": -37.31783676147461, "global_step": 157996, "epoch": 1305} {"train_loss": -36.8630256652832, "global_step": 157997, "epoch": 1305} {"train_loss": -37.2486457824707, "global_step": 157998, "epoch": 1305} {"train_loss": -34.39097213745117, "global_step": 157999, "epoch": 1305} {"train_loss": -37.922054290771484, "global_step": 158000, "epoch": 1305} {"train_loss": -38.767642974853516, "global_step": 158001, "epoch": 1305} {"train_loss": -39.5916748046875, "global_step": 158002, "epoch": 1305} {"train_loss": -37.132938385009766, "global_step": 158003, "epoch": 1305} {"train_loss": -15.980917930603027, "global_step": 158004, "epoch": 1305} {"train_loss": -37.870723724365234, "global_step": 158005, "epoch": 1305} {"train_loss": -36.83198165893555, "global_step": 158006, "epoch": 1305} {"train_loss": -37.7065315246582, "global_step": 158007, "epoch": 1305} {"train_loss": -15.73016357421875, "global_step": 158008, "epoch": 1305} {"train_loss": -36.03474044799805, "global_step": 158009, "epoch": 1305} {"train_loss": -32.722076416015625, "global_step": 158010, "epoch": 1305} {"train_loss": -34.594425201416016, "global_step": 158011, "epoch": 1305} {"train_loss": -36.147891998291016, "global_step": 158012, "epoch": 1305} {"train_loss": -33.17719650268555, "global_step": 158013, "epoch": 1305} {"train_loss": -30.617456436157227, "global_step": 158014, "epoch": 1305} {"train_loss": -37.84764862060547, "global_step": 158015, "epoch": 1305} {"train_loss": -36.297847747802734, "global_step": 158016, "epoch": 1305} {"train_loss": -35.39959716796875, "global_step": 158017, "epoch": 1305} {"train_loss": -36.30730438232422, "global_step": 158018, "epoch": 1305} {"train_loss": -34.77224349975586, "global_step": 158019, "epoch": 1305} {"train_loss": -34.74568176269531, "global_step": 158020, "epoch": 1305} {"train_loss": -37.55533218383789, "global_step": 158021, "epoch": 1305} {"train_loss": -31.457300186157227, "global_step": 158022, "epoch": 1305} {"train_loss": -34.643489837646484, "global_step": 158023, "epoch": 1305} {"train_loss": -37.709991455078125, "global_step": 158024, "epoch": 1305} {"train_loss": -38.59021692039553, "global_step": 158025, "epoch": 1305, "val_loss": 2834614.0} {"train_loss": -34.03705978393555, "global_step": 158026, "epoch": 1306} {"train_loss": -37.601444244384766, "global_step": 158027, "epoch": 1306} {"train_loss": -34.69676208496094, "global_step": 158028, "epoch": 1306} {"train_loss": -37.80747604370117, "global_step": 158029, "epoch": 1306} {"train_loss": -38.4195556640625, "global_step": 158030, "epoch": 1306} {"train_loss": -37.882118225097656, "global_step": 158031, "epoch": 1306} {"train_loss": -39.184932708740234, "global_step": 158032, "epoch": 1306} {"train_loss": -33.04627227783203, "global_step": 158033, "epoch": 1306} {"train_loss": -37.1008186340332, "global_step": 158034, "epoch": 1306} {"train_loss": -38.482147216796875, "global_step": 158035, "epoch": 1306} {"train_loss": -37.880470275878906, "global_step": 158036, "epoch": 1306} {"train_loss": -38.96467208862305, "global_step": 158037, "epoch": 1306} {"train_loss": -37.584686279296875, "global_step": 158038, "epoch": 1306} {"train_loss": -37.15678787231445, "global_step": 158039, "epoch": 1306} {"train_loss": -37.15975570678711, "global_step": 158040, "epoch": 1306} {"train_loss": -38.32609558105469, "global_step": 158041, "epoch": 1306} {"train_loss": -37.329498291015625, "global_step": 158042, "epoch": 1306} {"train_loss": -37.401851654052734, "global_step": 158043, "epoch": 1306} {"train_loss": -38.22286605834961, "global_step": 158044, "epoch": 1306} {"train_loss": -37.616943359375, "global_step": 158045, "epoch": 1306} {"train_loss": -38.18178176879883, "global_step": 158046, "epoch": 1306} {"train_loss": -39.07343673706055, "global_step": 158047, "epoch": 1306} {"train_loss": -38.62173843383789, "global_step": 158048, "epoch": 1306} {"train_loss": -37.81155014038086, "global_step": 158049, "epoch": 1306} {"train_loss": -38.852783203125, "global_step": 158050, "epoch": 1306} {"train_loss": -38.87500762939453, "global_step": 158051, "epoch": 1306} {"train_loss": -39.31790542602539, "global_step": 158052, "epoch": 1306} {"train_loss": -38.59517288208008, "global_step": 158053, "epoch": 1306} {"train_loss": -37.99981689453125, "global_step": 158054, "epoch": 1306} {"train_loss": -38.13051986694336, "global_step": 158055, "epoch": 1306} {"train_loss": -38.88093185424805, "global_step": 158056, "epoch": 1306} {"train_loss": -38.21293258666992, "global_step": 158057, "epoch": 1306} {"train_loss": -38.6148567199707, "global_step": 158058, "epoch": 1306} {"train_loss": -38.190284729003906, "global_step": 158059, "epoch": 1306} {"train_loss": -39.11354064941406, "global_step": 158060, "epoch": 1306} {"train_loss": -38.76504135131836, "global_step": 158061, "epoch": 1306} {"train_loss": -39.476478576660156, "global_step": 158062, "epoch": 1306} {"train_loss": -39.45820236206055, "global_step": 158063, "epoch": 1306} {"train_loss": -39.75153732299805, "global_step": 158064, "epoch": 1306} {"train_loss": -38.495235443115234, "global_step": 158065, "epoch": 1306} {"train_loss": -39.36605453491211, "global_step": 158066, "epoch": 1306} {"train_loss": -39.49855041503906, "global_step": 158067, "epoch": 1306} {"train_loss": -39.448646545410156, "global_step": 158068, "epoch": 1306} {"train_loss": -39.97487258911133, "global_step": 158069, "epoch": 1306} {"train_loss": -39.45391845703125, "global_step": 158070, "epoch": 1306} {"train_loss": -39.96419906616211, "global_step": 158071, "epoch": 1306} {"train_loss": -40.058956146240234, "global_step": 158072, "epoch": 1306} {"train_loss": -39.915679931640625, "global_step": 158073, "epoch": 1306} {"train_loss": -39.98861312866211, "global_step": 158074, "epoch": 1306} {"train_loss": -39.9362678527832, "global_step": 158075, "epoch": 1306} {"train_loss": -40.3929443359375, "global_step": 158076, "epoch": 1306} {"train_loss": -39.80060958862305, "global_step": 158077, "epoch": 1306} {"train_loss": -40.01622009277344, "global_step": 158078, "epoch": 1306} {"train_loss": -39.97645950317383, "global_step": 158079, "epoch": 1306} {"train_loss": -40.221309661865234, "global_step": 158080, "epoch": 1306} {"train_loss": -40.04326629638672, "global_step": 158081, "epoch": 1306} {"train_loss": -39.89808654785156, "global_step": 158082, "epoch": 1306} {"train_loss": -40.44511795043945, "global_step": 158083, "epoch": 1306} {"train_loss": -40.35908126831055, "global_step": 158084, "epoch": 1306} {"train_loss": -38.688934326171875, "global_step": 158085, "epoch": 1306} {"train_loss": -40.30253601074219, "global_step": 158086, "epoch": 1306} {"train_loss": -39.11941146850586, "global_step": 158087, "epoch": 1306} {"train_loss": -38.78879165649414, "global_step": 158088, "epoch": 1306} {"train_loss": -40.43558120727539, "global_step": 158089, "epoch": 1306} {"train_loss": -40.50639343261719, "global_step": 158090, "epoch": 1306} {"train_loss": -39.5046501159668, "global_step": 158091, "epoch": 1306} {"train_loss": -40.1752815246582, "global_step": 158092, "epoch": 1306} {"train_loss": -40.11587142944336, "global_step": 158093, "epoch": 1306} {"train_loss": -40.23288345336914, "global_step": 158094, "epoch": 1306} {"train_loss": -40.075660705566406, "global_step": 158095, "epoch": 1306} {"train_loss": -40.30326843261719, "global_step": 158096, "epoch": 1306} {"train_loss": -40.465240478515625, "global_step": 158097, "epoch": 1306} {"train_loss": -39.84442901611328, "global_step": 158098, "epoch": 1306} {"train_loss": -40.6612663269043, "global_step": 158099, "epoch": 1306} {"train_loss": -40.209930419921875, "global_step": 158100, "epoch": 1306} {"train_loss": -39.96776580810547, "global_step": 158101, "epoch": 1306} {"train_loss": -40.23664474487305, "global_step": 158102, "epoch": 1306} {"train_loss": -40.218082427978516, "global_step": 158103, "epoch": 1306} {"train_loss": -39.606849670410156, "global_step": 158104, "epoch": 1306} {"train_loss": -40.451576232910156, "global_step": 158105, "epoch": 1306} {"train_loss": -40.75403594970703, "global_step": 158106, "epoch": 1306} {"train_loss": -40.35294723510742, "global_step": 158107, "epoch": 1306} {"train_loss": -40.4073371887207, "global_step": 158108, "epoch": 1306} {"train_loss": -40.13833999633789, "global_step": 158109, "epoch": 1306} {"train_loss": -40.532535552978516, "global_step": 158110, "epoch": 1306} {"train_loss": -40.523162841796875, "global_step": 158111, "epoch": 1306} {"train_loss": -41.037654876708984, "global_step": 158112, "epoch": 1306} {"train_loss": -40.734375, "global_step": 158113, "epoch": 1306} {"train_loss": -40.55876922607422, "global_step": 158114, "epoch": 1306} {"train_loss": -39.59859085083008, "global_step": 158115, "epoch": 1306} {"train_loss": -40.518184661865234, "global_step": 158116, "epoch": 1306} {"train_loss": -39.673248291015625, "global_step": 158117, "epoch": 1306} {"train_loss": -39.71883010864258, "global_step": 158118, "epoch": 1306} {"train_loss": -38.623592376708984, "global_step": 158119, "epoch": 1306} {"train_loss": -37.85748291015625, "global_step": 158120, "epoch": 1306} {"train_loss": -37.961910247802734, "global_step": 158121, "epoch": 1306} {"train_loss": -40.320281982421875, "global_step": 158122, "epoch": 1306} {"train_loss": -36.806209564208984, "global_step": 158123, "epoch": 1306} {"train_loss": -36.60417556762695, "global_step": 158124, "epoch": 1306} {"train_loss": -31.659778594970703, "global_step": 158125, "epoch": 1306} {"train_loss": -28.9130859375, "global_step": 158126, "epoch": 1306} {"train_loss": -30.9326171875, "global_step": 158127, "epoch": 1306} {"train_loss": -35.30836486816406, "global_step": 158128, "epoch": 1306} {"train_loss": -39.531463623046875, "global_step": 158129, "epoch": 1306} {"train_loss": -36.826385498046875, "global_step": 158130, "epoch": 1306} {"train_loss": -38.34973907470703, "global_step": 158131, "epoch": 1306} {"train_loss": -37.50471115112305, "global_step": 158132, "epoch": 1306} {"train_loss": -39.17060470581055, "global_step": 158133, "epoch": 1306} {"train_loss": -39.86668014526367, "global_step": 158134, "epoch": 1306} {"train_loss": -38.29072189331055, "global_step": 158135, "epoch": 1306} {"train_loss": -40.2291374206543, "global_step": 158136, "epoch": 1306} {"train_loss": -38.89591598510742, "global_step": 158137, "epoch": 1306} {"train_loss": -39.82346725463867, "global_step": 158138, "epoch": 1306} {"train_loss": -38.61043167114258, "global_step": 158139, "epoch": 1306} {"train_loss": -39.629180908203125, "global_step": 158140, "epoch": 1306} {"train_loss": -39.92007064819336, "global_step": 158141, "epoch": 1306} {"train_loss": -40.263267517089844, "global_step": 158142, "epoch": 1306} {"train_loss": -39.97910690307617, "global_step": 158143, "epoch": 1306} {"train_loss": -40.336238861083984, "global_step": 158144, "epoch": 1306} {"train_loss": -39.11804962158203, "global_step": 158145, "epoch": 1306} {"train_loss": -38.88120285538602, "global_step": 158146, "epoch": 1306, "val_loss": 2594236.0} {"train_loss": -40.6052131652832, "global_step": 158147, "epoch": 1307} {"train_loss": -40.584651947021484, "global_step": 158148, "epoch": 1307} {"train_loss": -40.598846435546875, "global_step": 158149, "epoch": 1307} {"train_loss": -40.30559539794922, "global_step": 158150, "epoch": 1307} {"train_loss": -40.17840576171875, "global_step": 158151, "epoch": 1307} {"train_loss": -39.166297912597656, "global_step": 158152, "epoch": 1307} {"train_loss": -40.766090393066406, "global_step": 158153, "epoch": 1307} {"train_loss": -40.79610824584961, "global_step": 158154, "epoch": 1307} {"train_loss": -40.61045455932617, "global_step": 158155, "epoch": 1307} {"train_loss": -40.68935012817383, "global_step": 158156, "epoch": 1307} {"train_loss": -40.13599395751953, "global_step": 158157, "epoch": 1307} {"train_loss": -40.972259521484375, "global_step": 158158, "epoch": 1307} {"train_loss": -40.15217208862305, "global_step": 158159, "epoch": 1307} {"train_loss": -40.17030715942383, "global_step": 158160, "epoch": 1307} {"train_loss": -40.72113037109375, "global_step": 158161, "epoch": 1307} {"train_loss": -40.768795013427734, "global_step": 158162, "epoch": 1307} {"train_loss": -41.06919860839844, "global_step": 158163, "epoch": 1307} {"train_loss": -40.36603546142578, "global_step": 158164, "epoch": 1307} {"train_loss": -40.873504638671875, "global_step": 158165, "epoch": 1307} {"train_loss": -40.474525451660156, "global_step": 158166, "epoch": 1307} {"train_loss": -40.478736877441406, "global_step": 158167, "epoch": 1307} {"train_loss": -40.70909118652344, "global_step": 158168, "epoch": 1307} {"train_loss": -40.518680572509766, "global_step": 158169, "epoch": 1307} {"train_loss": -39.958858489990234, "global_step": 158170, "epoch": 1307} {"train_loss": -40.75384521484375, "global_step": 158171, "epoch": 1307} {"train_loss": -41.16497802734375, "global_step": 158172, "epoch": 1307} {"train_loss": -40.61582946777344, "global_step": 158173, "epoch": 1307} {"train_loss": -41.14178466796875, "global_step": 158174, "epoch": 1307} {"train_loss": -41.400978088378906, "global_step": 158175, "epoch": 1307} {"train_loss": -40.8369140625, "global_step": 158176, "epoch": 1307} {"train_loss": -40.89973068237305, "global_step": 158177, "epoch": 1307} {"train_loss": -40.89129638671875, "global_step": 158178, "epoch": 1307} {"train_loss": -40.563899993896484, "global_step": 158179, "epoch": 1307} {"train_loss": -40.8734245300293, "global_step": 158180, "epoch": 1307} {"train_loss": -40.95455551147461, "global_step": 158181, "epoch": 1307} {"train_loss": -41.192813873291016, "global_step": 158182, "epoch": 1307} {"train_loss": -40.7639274597168, "global_step": 158183, "epoch": 1307} {"train_loss": -40.410865783691406, "global_step": 158184, "epoch": 1307} {"train_loss": -40.54021453857422, "global_step": 158185, "epoch": 1307} {"train_loss": -41.61795425415039, "global_step": 158186, "epoch": 1307} {"train_loss": -40.286094665527344, "global_step": 158187, "epoch": 1307} {"train_loss": -37.930274963378906, "global_step": 158188, "epoch": 1307} {"train_loss": -33.65934371948242, "global_step": 158189, "epoch": 1307} {"train_loss": -35.35367965698242, "global_step": 158190, "epoch": 1307} {"train_loss": -33.70842361450195, "global_step": 158191, "epoch": 1307} {"train_loss": -27.3868465423584, "global_step": 158192, "epoch": 1307} {"train_loss": -33.621707916259766, "global_step": 158193, "epoch": 1307} {"train_loss": -37.57937240600586, "global_step": 158194, "epoch": 1307} {"train_loss": -33.60470199584961, "global_step": 158195, "epoch": 1307} {"train_loss": -33.6619758605957, "global_step": 158196, "epoch": 1307} {"train_loss": -36.6153678894043, "global_step": 158197, "epoch": 1307} {"train_loss": -33.8930549621582, "global_step": 158198, "epoch": 1307} {"train_loss": -38.034400939941406, "global_step": 158199, "epoch": 1307} {"train_loss": -35.74212646484375, "global_step": 158200, "epoch": 1307} {"train_loss": -37.4757080078125, "global_step": 158201, "epoch": 1307} {"train_loss": -37.944759368896484, "global_step": 158202, "epoch": 1307} {"train_loss": -39.06991195678711, "global_step": 158203, "epoch": 1307} {"train_loss": -37.31193923950195, "global_step": 158204, "epoch": 1307} {"train_loss": -38.085350036621094, "global_step": 158205, "epoch": 1307} {"train_loss": -38.101253509521484, "global_step": 158206, "epoch": 1307} {"train_loss": -38.41819381713867, "global_step": 158207, "epoch": 1307} {"train_loss": -38.57063674926758, "global_step": 158208, "epoch": 1307} {"train_loss": -38.10850524902344, "global_step": 158209, "epoch": 1307} {"train_loss": -39.46163558959961, "global_step": 158210, "epoch": 1307} {"train_loss": -38.196754455566406, "global_step": 158211, "epoch": 1307} {"train_loss": -39.49973678588867, "global_step": 158212, "epoch": 1307} {"train_loss": -38.306861877441406, "global_step": 158213, "epoch": 1307} {"train_loss": -39.25927734375, "global_step": 158214, "epoch": 1307} {"train_loss": -39.252079010009766, "global_step": 158215, "epoch": 1307} {"train_loss": -39.328224182128906, "global_step": 158216, "epoch": 1307} {"train_loss": -38.801856994628906, "global_step": 158217, "epoch": 1307} {"train_loss": -40.11232376098633, "global_step": 158218, "epoch": 1307} {"train_loss": -39.383079528808594, "global_step": 158219, "epoch": 1307} {"train_loss": -39.2480354309082, "global_step": 158220, "epoch": 1307} {"train_loss": -40.012813568115234, "global_step": 158221, "epoch": 1307} {"train_loss": -39.525360107421875, "global_step": 158222, "epoch": 1307} {"train_loss": -39.62998580932617, "global_step": 158223, "epoch": 1307} {"train_loss": -39.06773376464844, "global_step": 158224, "epoch": 1307} {"train_loss": -40.04293441772461, "global_step": 158225, "epoch": 1307} {"train_loss": -40.15304946899414, "global_step": 158226, "epoch": 1307} {"train_loss": -39.36410140991211, "global_step": 158227, "epoch": 1307} {"train_loss": -39.63576126098633, "global_step": 158228, "epoch": 1307} {"train_loss": -39.30268859863281, "global_step": 158229, "epoch": 1307} {"train_loss": -39.437740325927734, "global_step": 158230, "epoch": 1307} {"train_loss": -39.63383865356445, "global_step": 158231, "epoch": 1307} {"train_loss": -40.16371536254883, "global_step": 158232, "epoch": 1307} {"train_loss": -39.77264404296875, "global_step": 158233, "epoch": 1307} {"train_loss": -40.12733840942383, "global_step": 158234, "epoch": 1307} {"train_loss": -39.727657318115234, "global_step": 158235, "epoch": 1307} {"train_loss": -40.5157585144043, "global_step": 158236, "epoch": 1307} {"train_loss": -40.04910659790039, "global_step": 158237, "epoch": 1307} {"train_loss": -40.18245315551758, "global_step": 158238, "epoch": 1307} {"train_loss": -40.602630615234375, "global_step": 158239, "epoch": 1307} {"train_loss": -38.96090316772461, "global_step": 158240, "epoch": 1307} {"train_loss": -40.5343132019043, "global_step": 158241, "epoch": 1307} {"train_loss": -39.94625473022461, "global_step": 158242, "epoch": 1307} {"train_loss": -40.7780647277832, "global_step": 158243, "epoch": 1307} {"train_loss": -40.29525375366211, "global_step": 158244, "epoch": 1307} {"train_loss": -40.36869430541992, "global_step": 158245, "epoch": 1307} {"train_loss": -40.38784408569336, "global_step": 158246, "epoch": 1307} {"train_loss": -40.50589370727539, "global_step": 158247, "epoch": 1307} {"train_loss": -40.7176399230957, "global_step": 158248, "epoch": 1307} {"train_loss": -38.160011291503906, "global_step": 158249, "epoch": 1307} {"train_loss": -40.91195297241211, "global_step": 158250, "epoch": 1307} {"train_loss": -40.77760696411133, "global_step": 158251, "epoch": 1307} {"train_loss": -40.623592376708984, "global_step": 158252, "epoch": 1307} {"train_loss": -40.24514389038086, "global_step": 158253, "epoch": 1307} {"train_loss": -40.796180725097656, "global_step": 158254, "epoch": 1307} {"train_loss": -40.83055877685547, "global_step": 158255, "epoch": 1307} {"train_loss": -40.74055099487305, "global_step": 158256, "epoch": 1307} {"train_loss": -40.68251419067383, "global_step": 158257, "epoch": 1307} {"train_loss": -40.790245056152344, "global_step": 158258, "epoch": 1307} {"train_loss": -39.276546478271484, "global_step": 158259, "epoch": 1307} {"train_loss": -40.46595001220703, "global_step": 158260, "epoch": 1307} {"train_loss": -40.825294494628906, "global_step": 158261, "epoch": 1307} {"train_loss": -40.6803092956543, "global_step": 158262, "epoch": 1307} {"train_loss": -39.42220687866211, "global_step": 158263, "epoch": 1307} {"train_loss": -41.33799743652344, "global_step": 158264, "epoch": 1307} {"train_loss": -41.15739059448242, "global_step": 158265, "epoch": 1307} {"train_loss": -41.0488166809082, "global_step": 158266, "epoch": 1307} {"train_loss": -39.50702725560212, "global_step": 158267, "epoch": 1307, "val_loss": 2529442.25} {"train_loss": -41.22848129272461, "global_step": 158268, "epoch": 1308} {"train_loss": -39.06311798095703, "global_step": 158269, "epoch": 1308} {"train_loss": -41.24250411987305, "global_step": 158270, "epoch": 1308} {"train_loss": -41.30323028564453, "global_step": 158271, "epoch": 1308} {"train_loss": -41.030677795410156, "global_step": 158272, "epoch": 1308} {"train_loss": -40.642967224121094, "global_step": 158273, "epoch": 1308} {"train_loss": -41.289306640625, "global_step": 158274, "epoch": 1308} {"train_loss": -40.25189208984375, "global_step": 158275, "epoch": 1308} {"train_loss": -41.430389404296875, "global_step": 158276, "epoch": 1308} {"train_loss": -41.00666427612305, "global_step": 158277, "epoch": 1308} {"train_loss": -39.94684982299805, "global_step": 158278, "epoch": 1308} {"train_loss": -39.95726013183594, "global_step": 158279, "epoch": 1308} {"train_loss": -41.14585494995117, "global_step": 158280, "epoch": 1308} {"train_loss": -38.86642837524414, "global_step": 158281, "epoch": 1308} {"train_loss": -41.03520965576172, "global_step": 158282, "epoch": 1308} {"train_loss": -40.82139587402344, "global_step": 158283, "epoch": 1308} {"train_loss": -41.08270263671875, "global_step": 158284, "epoch": 1308} {"train_loss": -41.0623779296875, "global_step": 158285, "epoch": 1308} {"train_loss": -41.31467819213867, "global_step": 158286, "epoch": 1308} {"train_loss": -39.297969818115234, "global_step": 158287, "epoch": 1308} {"train_loss": -40.3171501159668, "global_step": 158288, "epoch": 1308} {"train_loss": -41.255470275878906, "global_step": 158289, "epoch": 1308} {"train_loss": -41.09232711791992, "global_step": 158290, "epoch": 1308} {"train_loss": -39.041114807128906, "global_step": 158291, "epoch": 1308} {"train_loss": -41.02744674682617, "global_step": 158292, "epoch": 1308} {"train_loss": -40.91276168823242, "global_step": 158293, "epoch": 1308} {"train_loss": -41.0200309753418, "global_step": 158294, "epoch": 1308} {"train_loss": -40.8831787109375, "global_step": 158295, "epoch": 1308} {"train_loss": -39.083831787109375, "global_step": 158296, "epoch": 1308} {"train_loss": -41.02907943725586, "global_step": 158297, "epoch": 1308} {"train_loss": -41.13581466674805, "global_step": 158298, "epoch": 1308} {"train_loss": -40.845367431640625, "global_step": 158299, "epoch": 1308} {"train_loss": -38.4488525390625, "global_step": 158300, "epoch": 1308} {"train_loss": -39.7362060546875, "global_step": 158301, "epoch": 1308} {"train_loss": -40.75779342651367, "global_step": 158302, "epoch": 1308} {"train_loss": -40.577293395996094, "global_step": 158303, "epoch": 1308} {"train_loss": -39.8996696472168, "global_step": 158304, "epoch": 1308} {"train_loss": -39.61283493041992, "global_step": 158305, "epoch": 1308} {"train_loss": -40.678611755371094, "global_step": 158306, "epoch": 1308} {"train_loss": -37.240238189697266, "global_step": 158307, "epoch": 1308} {"train_loss": -39.53355026245117, "global_step": 158308, "epoch": 1308} {"train_loss": -40.40287399291992, "global_step": 158309, "epoch": 1308} {"train_loss": -39.97349166870117, "global_step": 158310, "epoch": 1308} {"train_loss": -38.0031623840332, "global_step": 158311, "epoch": 1308} {"train_loss": -40.75395584106445, "global_step": 158312, "epoch": 1308} {"train_loss": -39.8166618347168, "global_step": 158313, "epoch": 1308} {"train_loss": -40.127525329589844, "global_step": 158314, "epoch": 1308} {"train_loss": -39.538818359375, "global_step": 158315, "epoch": 1308} {"train_loss": -39.42214584350586, "global_step": 158316, "epoch": 1308} {"train_loss": -40.56063461303711, "global_step": 158317, "epoch": 1308} {"train_loss": -41.10175704956055, "global_step": 158318, "epoch": 1308} {"train_loss": -39.27492904663086, "global_step": 158319, "epoch": 1308} {"train_loss": -36.95606231689453, "global_step": 158320, "epoch": 1308} {"train_loss": -39.961666107177734, "global_step": 158321, "epoch": 1308} {"train_loss": -36.97091293334961, "global_step": 158322, "epoch": 1308} {"train_loss": -33.50424575805664, "global_step": 158323, "epoch": 1308} {"train_loss": -37.511985778808594, "global_step": 158324, "epoch": 1308} {"train_loss": -37.9742317199707, "global_step": 158325, "epoch": 1308} {"train_loss": -37.60246658325195, "global_step": 158326, "epoch": 1308} {"train_loss": -38.142738342285156, "global_step": 158327, "epoch": 1308} {"train_loss": -36.65697479248047, "global_step": 158328, "epoch": 1308} {"train_loss": -30.926977157592773, "global_step": 158329, "epoch": 1308} {"train_loss": -37.39915084838867, "global_step": 158330, "epoch": 1308} {"train_loss": -37.06928634643555, "global_step": 158331, "epoch": 1308} {"train_loss": -31.085142135620117, "global_step": 158332, "epoch": 1308} {"train_loss": -27.91834831237793, "global_step": 158333, "epoch": 1308} {"train_loss": -38.4698600769043, "global_step": 158334, "epoch": 1308} {"train_loss": -35.63286209106445, "global_step": 158335, "epoch": 1308} {"train_loss": -38.67783737182617, "global_step": 158336, "epoch": 1308} {"train_loss": -35.530967712402344, "global_step": 158337, "epoch": 1308} {"train_loss": -34.06867599487305, "global_step": 158338, "epoch": 1308} {"train_loss": -35.93345260620117, "global_step": 158339, "epoch": 1308} {"train_loss": -36.9572639465332, "global_step": 158340, "epoch": 1308} {"train_loss": -35.90814971923828, "global_step": 158341, "epoch": 1308} {"train_loss": -38.84696578979492, "global_step": 158342, "epoch": 1308} {"train_loss": -37.98879623413086, "global_step": 158343, "epoch": 1308} {"train_loss": -35.715179443359375, "global_step": 158344, "epoch": 1308} {"train_loss": -38.279396057128906, "global_step": 158345, "epoch": 1308} {"train_loss": -31.756933212280273, "global_step": 158346, "epoch": 1308} {"train_loss": -37.96238327026367, "global_step": 158347, "epoch": 1308} {"train_loss": -35.5181999206543, "global_step": 158348, "epoch": 1308} {"train_loss": -37.560585021972656, "global_step": 158349, "epoch": 1308} {"train_loss": -37.75224685668945, "global_step": 158350, "epoch": 1308} {"train_loss": -37.72010040283203, "global_step": 158351, "epoch": 1308} {"train_loss": -32.38771438598633, "global_step": 158352, "epoch": 1308} {"train_loss": -38.693359375, "global_step": 158353, "epoch": 1308} {"train_loss": -38.105987548828125, "global_step": 158354, "epoch": 1308} {"train_loss": -38.660430908203125, "global_step": 158355, "epoch": 1308} {"train_loss": -37.885196685791016, "global_step": 158356, "epoch": 1308} {"train_loss": -38.45266342163086, "global_step": 158357, "epoch": 1308} {"train_loss": -37.770362854003906, "global_step": 158358, "epoch": 1308} {"train_loss": -38.7728385925293, "global_step": 158359, "epoch": 1308} {"train_loss": -38.92173385620117, "global_step": 158360, "epoch": 1308} {"train_loss": -38.3543815612793, "global_step": 158361, "epoch": 1308} {"train_loss": -39.1539306640625, "global_step": 158362, "epoch": 1308} {"train_loss": -38.83816146850586, "global_step": 158363, "epoch": 1308} {"train_loss": -38.8878288269043, "global_step": 158364, "epoch": 1308} {"train_loss": -39.0606803894043, "global_step": 158365, "epoch": 1308} {"train_loss": -38.58526611328125, "global_step": 158366, "epoch": 1308} {"train_loss": -39.340843200683594, "global_step": 158367, "epoch": 1308} {"train_loss": -38.75562286376953, "global_step": 158368, "epoch": 1308} {"train_loss": -38.59295654296875, "global_step": 158369, "epoch": 1308} {"train_loss": -39.72292709350586, "global_step": 158370, "epoch": 1308} {"train_loss": -39.16212844848633, "global_step": 158371, "epoch": 1308} {"train_loss": -38.611228942871094, "global_step": 158372, "epoch": 1308} {"train_loss": -39.29682540893555, "global_step": 158373, "epoch": 1308} {"train_loss": -39.637664794921875, "global_step": 158374, "epoch": 1308} {"train_loss": -36.8299560546875, "global_step": 158375, "epoch": 1308} {"train_loss": -38.746089935302734, "global_step": 158376, "epoch": 1308} {"train_loss": -36.59269332885742, "global_step": 158377, "epoch": 1308} {"train_loss": -39.3458366394043, "global_step": 158378, "epoch": 1308} {"train_loss": -39.30509567260742, "global_step": 158379, "epoch": 1308} {"train_loss": -38.74903106689453, "global_step": 158380, "epoch": 1308} {"train_loss": -39.87300491333008, "global_step": 158381, "epoch": 1308} {"train_loss": -39.10590362548828, "global_step": 158382, "epoch": 1308} {"train_loss": -39.290443420410156, "global_step": 158383, "epoch": 1308} {"train_loss": -39.31390380859375, "global_step": 158384, "epoch": 1308} {"train_loss": -40.105140686035156, "global_step": 158385, "epoch": 1308} {"train_loss": -39.45152282714844, "global_step": 158386, "epoch": 1308} {"train_loss": -39.555694580078125, "global_step": 158387, "epoch": 1308} {"train_loss": -38.74666885502082, "global_step": 158388, "epoch": 1308, "val_loss": 2680441.0} {"train_loss": -39.83500671386719, "global_step": 158389, "epoch": 1309} {"train_loss": -40.14213943481445, "global_step": 158390, "epoch": 1309} {"train_loss": -40.1482048034668, "global_step": 158391, "epoch": 1309} {"train_loss": -39.8734130859375, "global_step": 158392, "epoch": 1309} {"train_loss": -38.359649658203125, "global_step": 158393, "epoch": 1309} {"train_loss": -39.24127960205078, "global_step": 158394, "epoch": 1309} {"train_loss": -39.91261672973633, "global_step": 158395, "epoch": 1309} {"train_loss": -40.18986129760742, "global_step": 158396, "epoch": 1309} {"train_loss": -40.22314453125, "global_step": 158397, "epoch": 1309} {"train_loss": -39.57277297973633, "global_step": 158398, "epoch": 1309} {"train_loss": -40.232234954833984, "global_step": 158399, "epoch": 1309} {"train_loss": -38.87374496459961, "global_step": 158400, "epoch": 1309} {"train_loss": -40.39521789550781, "global_step": 158401, "epoch": 1309} {"train_loss": -40.1427116394043, "global_step": 158402, "epoch": 1309} {"train_loss": -40.423641204833984, "global_step": 158403, "epoch": 1309} {"train_loss": -40.186336517333984, "global_step": 158404, "epoch": 1309} {"train_loss": -40.326297760009766, "global_step": 158405, "epoch": 1309} {"train_loss": -38.54326248168945, "global_step": 158406, "epoch": 1309} {"train_loss": -40.329647064208984, "global_step": 158407, "epoch": 1309} {"train_loss": -38.7933464050293, "global_step": 158408, "epoch": 1309} {"train_loss": -39.52483367919922, "global_step": 158409, "epoch": 1309} {"train_loss": -40.33720397949219, "global_step": 158410, "epoch": 1309} {"train_loss": -40.16844940185547, "global_step": 158411, "epoch": 1309} {"train_loss": -38.54668045043945, "global_step": 158412, "epoch": 1309} {"train_loss": -40.4399528503418, "global_step": 158413, "epoch": 1309} {"train_loss": -40.14125442504883, "global_step": 158414, "epoch": 1309} {"train_loss": -39.41640090942383, "global_step": 158415, "epoch": 1309} {"train_loss": -40.87346267700195, "global_step": 158416, "epoch": 1309} {"train_loss": -38.3580322265625, "global_step": 158417, "epoch": 1309} {"train_loss": -38.45358657836914, "global_step": 158418, "epoch": 1309} {"train_loss": -40.7835693359375, "global_step": 158419, "epoch": 1309} {"train_loss": -40.052215576171875, "global_step": 158420, "epoch": 1309} {"train_loss": -39.12158203125, "global_step": 158421, "epoch": 1309} {"train_loss": -40.529762268066406, "global_step": 158422, "epoch": 1309} {"train_loss": -40.299556732177734, "global_step": 158423, "epoch": 1309} {"train_loss": -40.11880111694336, "global_step": 158424, "epoch": 1309} {"train_loss": -40.736549377441406, "global_step": 158425, "epoch": 1309} {"train_loss": -40.41858673095703, "global_step": 158426, "epoch": 1309} {"train_loss": -40.348114013671875, "global_step": 158427, "epoch": 1309} {"train_loss": -40.549896240234375, "global_step": 158428, "epoch": 1309} {"train_loss": -39.62702560424805, "global_step": 158429, "epoch": 1309} {"train_loss": -40.71295928955078, "global_step": 158430, "epoch": 1309} {"train_loss": -40.529788970947266, "global_step": 158431, "epoch": 1309} {"train_loss": -40.79452133178711, "global_step": 158432, "epoch": 1309} {"train_loss": -40.32221603393555, "global_step": 158433, "epoch": 1309} {"train_loss": -40.559505462646484, "global_step": 158434, "epoch": 1309} {"train_loss": -40.15385055541992, "global_step": 158435, "epoch": 1309} {"train_loss": -39.087032318115234, "global_step": 158436, "epoch": 1309} {"train_loss": -40.564483642578125, "global_step": 158437, "epoch": 1309} {"train_loss": -40.78765106201172, "global_step": 158438, "epoch": 1309} {"train_loss": -38.909149169921875, "global_step": 158439, "epoch": 1309} {"train_loss": -40.22429656982422, "global_step": 158440, "epoch": 1309} {"train_loss": -40.24524688720703, "global_step": 158441, "epoch": 1309} {"train_loss": -41.0528678894043, "global_step": 158442, "epoch": 1309} {"train_loss": -40.00828170776367, "global_step": 158443, "epoch": 1309} {"train_loss": -40.770179748535156, "global_step": 158444, "epoch": 1309} {"train_loss": -40.64558029174805, "global_step": 158445, "epoch": 1309} {"train_loss": -40.459503173828125, "global_step": 158446, "epoch": 1309} {"train_loss": -40.23106002807617, "global_step": 158447, "epoch": 1309} {"train_loss": -40.33374786376953, "global_step": 158448, "epoch": 1309} {"train_loss": -40.9769401550293, "global_step": 158449, "epoch": 1309} {"train_loss": -40.8316650390625, "global_step": 158450, "epoch": 1309} {"train_loss": -40.406917572021484, "global_step": 158451, "epoch": 1309} {"train_loss": -38.70756912231445, "global_step": 158452, "epoch": 1309} {"train_loss": -35.509700775146484, "global_step": 158453, "epoch": 1309} {"train_loss": -34.992767333984375, "global_step": 158454, "epoch": 1309} {"train_loss": -34.51694869995117, "global_step": 158455, "epoch": 1309} {"train_loss": -40.01736068725586, "global_step": 158456, "epoch": 1309} {"train_loss": -36.996612548828125, "global_step": 158457, "epoch": 1309} {"train_loss": -33.669185638427734, "global_step": 158458, "epoch": 1309} {"train_loss": -38.8853645324707, "global_step": 158459, "epoch": 1309} {"train_loss": -38.98624801635742, "global_step": 158460, "epoch": 1309} {"train_loss": -36.6234016418457, "global_step": 158461, "epoch": 1309} {"train_loss": -39.2591552734375, "global_step": 158462, "epoch": 1309} {"train_loss": -39.050689697265625, "global_step": 158463, "epoch": 1309} {"train_loss": -39.05352783203125, "global_step": 158464, "epoch": 1309} {"train_loss": -39.794715881347656, "global_step": 158465, "epoch": 1309} {"train_loss": -37.95475387573242, "global_step": 158466, "epoch": 1309} {"train_loss": -38.285152435302734, "global_step": 158467, "epoch": 1309} {"train_loss": -39.66523361206055, "global_step": 158468, "epoch": 1309} {"train_loss": -39.238311767578125, "global_step": 158469, "epoch": 1309} {"train_loss": -39.43070983886719, "global_step": 158470, "epoch": 1309} {"train_loss": -39.920658111572266, "global_step": 158471, "epoch": 1309} {"train_loss": -39.46846389770508, "global_step": 158472, "epoch": 1309} {"train_loss": -39.56867599487305, "global_step": 158473, "epoch": 1309} {"train_loss": -40.160072326660156, "global_step": 158474, "epoch": 1309} {"train_loss": -40.431095123291016, "global_step": 158475, "epoch": 1309} {"train_loss": -39.41133499145508, "global_step": 158476, "epoch": 1309} {"train_loss": -39.896907806396484, "global_step": 158477, "epoch": 1309} {"train_loss": -39.117549896240234, "global_step": 158478, "epoch": 1309} {"train_loss": -40.81473922729492, "global_step": 158479, "epoch": 1309} {"train_loss": -40.32627487182617, "global_step": 158480, "epoch": 1309} {"train_loss": -37.869903564453125, "global_step": 158481, "epoch": 1309} {"train_loss": -39.55659866333008, "global_step": 158482, "epoch": 1309} {"train_loss": -40.180076599121094, "global_step": 158483, "epoch": 1309} {"train_loss": -40.163814544677734, "global_step": 158484, "epoch": 1309} {"train_loss": -39.87136459350586, "global_step": 158485, "epoch": 1309} {"train_loss": -40.21846389770508, "global_step": 158486, "epoch": 1309} {"train_loss": -40.44294357299805, "global_step": 158487, "epoch": 1309} {"train_loss": -39.903465270996094, "global_step": 158488, "epoch": 1309} {"train_loss": -40.52418518066406, "global_step": 158489, "epoch": 1309} {"train_loss": -40.19550323486328, "global_step": 158490, "epoch": 1309} {"train_loss": -39.821205139160156, "global_step": 158491, "epoch": 1309} {"train_loss": -40.12657928466797, "global_step": 158492, "epoch": 1309} {"train_loss": -40.19322967529297, "global_step": 158493, "epoch": 1309} {"train_loss": -39.89744186401367, "global_step": 158494, "epoch": 1309} {"train_loss": -40.49116897583008, "global_step": 158495, "epoch": 1309} {"train_loss": -40.31113815307617, "global_step": 158496, "epoch": 1309} {"train_loss": -40.069759368896484, "global_step": 158497, "epoch": 1309} {"train_loss": -40.779998779296875, "global_step": 158498, "epoch": 1309} {"train_loss": -40.838111877441406, "global_step": 158499, "epoch": 1309} {"train_loss": -40.57802963256836, "global_step": 158500, "epoch": 1309} {"train_loss": -40.717628479003906, "global_step": 158501, "epoch": 1309} {"train_loss": -40.314510345458984, "global_step": 158502, "epoch": 1309} {"train_loss": -40.604766845703125, "global_step": 158503, "epoch": 1309} {"train_loss": -38.22807312011719, "global_step": 158504, "epoch": 1309} {"train_loss": -40.75982666015625, "global_step": 158505, "epoch": 1309} {"train_loss": -40.7203483581543, "global_step": 158506, "epoch": 1309} {"train_loss": -40.147457122802734, "global_step": 158507, "epoch": 1309} {"train_loss": -39.798519134521484, "global_step": 158508, "epoch": 1309} {"train_loss": -39.720123890017675, "global_step": 158509, "epoch": 1309, "val_loss": 2602589.25} {"train_loss": -40.73980712890625, "global_step": 158510, "epoch": 1310} {"train_loss": -40.6104850769043, "global_step": 158511, "epoch": 1310} {"train_loss": -40.46078109741211, "global_step": 158512, "epoch": 1310} {"train_loss": -40.72140884399414, "global_step": 158513, "epoch": 1310} {"train_loss": -39.8274040222168, "global_step": 158514, "epoch": 1310} {"train_loss": -40.768436431884766, "global_step": 158515, "epoch": 1310} {"train_loss": -40.59772872924805, "global_step": 158516, "epoch": 1310} {"train_loss": -40.32550048828125, "global_step": 158517, "epoch": 1310} {"train_loss": -40.870670318603516, "global_step": 158518, "epoch": 1310} {"train_loss": -41.26020050048828, "global_step": 158519, "epoch": 1310} {"train_loss": -41.16018295288086, "global_step": 158520, "epoch": 1310} {"train_loss": -41.14799880981445, "global_step": 158521, "epoch": 1310} {"train_loss": -40.45164108276367, "global_step": 158522, "epoch": 1310} {"train_loss": -39.30546188354492, "global_step": 158523, "epoch": 1310} {"train_loss": -40.76832962036133, "global_step": 158524, "epoch": 1310} {"train_loss": -41.12644577026367, "global_step": 158525, "epoch": 1310} {"train_loss": -41.421958923339844, "global_step": 158526, "epoch": 1310} {"train_loss": -40.854026794433594, "global_step": 158527, "epoch": 1310} {"train_loss": -40.96076965332031, "global_step": 158528, "epoch": 1310} {"train_loss": -41.34333038330078, "global_step": 158529, "epoch": 1310} {"train_loss": -40.398075103759766, "global_step": 158530, "epoch": 1310} {"train_loss": -41.324951171875, "global_step": 158531, "epoch": 1310} {"train_loss": -41.66762924194336, "global_step": 158532, "epoch": 1310} {"train_loss": -41.23316192626953, "global_step": 158533, "epoch": 1310} {"train_loss": -40.94038772583008, "global_step": 158534, "epoch": 1310} {"train_loss": -40.66909408569336, "global_step": 158535, "epoch": 1310} {"train_loss": -38.594642639160156, "global_step": 158536, "epoch": 1310} {"train_loss": -35.04034423828125, "global_step": 158537, "epoch": 1310} {"train_loss": -29.982593536376953, "global_step": 158538, "epoch": 1310} {"train_loss": -17.941389083862305, "global_step": 158539, "epoch": 1310} {"train_loss": -26.588598251342773, "global_step": 158540, "epoch": 1310} {"train_loss": -40.62052917480469, "global_step": 158541, "epoch": 1310} {"train_loss": -31.675439834594727, "global_step": 158542, "epoch": 1310} {"train_loss": -30.96900749206543, "global_step": 158543, "epoch": 1310} {"train_loss": -38.70927810668945, "global_step": 158544, "epoch": 1310} {"train_loss": -34.8999137878418, "global_step": 158545, "epoch": 1310} {"train_loss": -37.09123992919922, "global_step": 158546, "epoch": 1310} {"train_loss": -39.04350662231445, "global_step": 158547, "epoch": 1310} {"train_loss": -38.248443603515625, "global_step": 158548, "epoch": 1310} {"train_loss": -39.36914825439453, "global_step": 158549, "epoch": 1310} {"train_loss": -39.10862350463867, "global_step": 158550, "epoch": 1310} {"train_loss": -39.23124313354492, "global_step": 158551, "epoch": 1310} {"train_loss": -38.83374786376953, "global_step": 158552, "epoch": 1310} {"train_loss": -40.58677291870117, "global_step": 158553, "epoch": 1310} {"train_loss": -39.82994079589844, "global_step": 158554, "epoch": 1310} {"train_loss": -39.5096321105957, "global_step": 158555, "epoch": 1310} {"train_loss": -40.21702194213867, "global_step": 158556, "epoch": 1310} {"train_loss": -39.81836700439453, "global_step": 158557, "epoch": 1310} {"train_loss": -40.07041549682617, "global_step": 158558, "epoch": 1310} {"train_loss": -39.80044174194336, "global_step": 158559, "epoch": 1310} {"train_loss": -40.58590316772461, "global_step": 158560, "epoch": 1310} {"train_loss": -40.23043441772461, "global_step": 158561, "epoch": 1310} {"train_loss": -39.9674072265625, "global_step": 158562, "epoch": 1310} {"train_loss": -39.85696029663086, "global_step": 158563, "epoch": 1310} {"train_loss": -39.23405838012695, "global_step": 158564, "epoch": 1310} {"train_loss": -40.352821350097656, "global_step": 158565, "epoch": 1310} {"train_loss": -40.7929801940918, "global_step": 158566, "epoch": 1310} {"train_loss": -37.123374938964844, "global_step": 158567, "epoch": 1310} {"train_loss": -40.9111442565918, "global_step": 158568, "epoch": 1310} {"train_loss": -40.87602615356445, "global_step": 158569, "epoch": 1310} {"train_loss": -39.60372543334961, "global_step": 158570, "epoch": 1310} {"train_loss": -40.94246292114258, "global_step": 158571, "epoch": 1310} {"train_loss": -40.59245681762695, "global_step": 158572, "epoch": 1310} {"train_loss": -40.775428771972656, "global_step": 158573, "epoch": 1310} {"train_loss": -40.41927719116211, "global_step": 158574, "epoch": 1310} {"train_loss": -40.833717346191406, "global_step": 158575, "epoch": 1310} {"train_loss": -40.2218017578125, "global_step": 158576, "epoch": 1310} {"train_loss": -39.173728942871094, "global_step": 158577, "epoch": 1310} {"train_loss": -40.5141716003418, "global_step": 158578, "epoch": 1310} {"train_loss": -40.79856872558594, "global_step": 158579, "epoch": 1310} {"train_loss": -40.25944137573242, "global_step": 158580, "epoch": 1310} {"train_loss": -40.483699798583984, "global_step": 158581, "epoch": 1310} {"train_loss": -39.65651321411133, "global_step": 158582, "epoch": 1310} {"train_loss": -40.086219787597656, "global_step": 158583, "epoch": 1310} {"train_loss": -39.9884033203125, "global_step": 158584, "epoch": 1310} {"train_loss": -40.462059020996094, "global_step": 158585, "epoch": 1310} {"train_loss": -39.94181442260742, "global_step": 158586, "epoch": 1310} {"train_loss": -39.67989730834961, "global_step": 158587, "epoch": 1310} {"train_loss": -40.995113372802734, "global_step": 158588, "epoch": 1310} {"train_loss": -40.72517776489258, "global_step": 158589, "epoch": 1310} {"train_loss": -39.27397155761719, "global_step": 158590, "epoch": 1310} {"train_loss": -40.86356735229492, "global_step": 158591, "epoch": 1310} {"train_loss": -40.22713851928711, "global_step": 158592, "epoch": 1310} {"train_loss": -40.29216384887695, "global_step": 158593, "epoch": 1310} {"train_loss": -40.34027099609375, "global_step": 158594, "epoch": 1310} {"train_loss": -40.59890365600586, "global_step": 158595, "epoch": 1310} {"train_loss": -39.46799850463867, "global_step": 158596, "epoch": 1310} {"train_loss": -40.61897659301758, "global_step": 158597, "epoch": 1310} {"train_loss": -41.04752731323242, "global_step": 158598, "epoch": 1310} {"train_loss": -40.41936111450195, "global_step": 158599, "epoch": 1310} {"train_loss": -40.579742431640625, "global_step": 158600, "epoch": 1310} {"train_loss": -40.26910400390625, "global_step": 158601, "epoch": 1310} {"train_loss": -40.56351852416992, "global_step": 158602, "epoch": 1310} {"train_loss": -41.45296859741211, "global_step": 158603, "epoch": 1310} {"train_loss": -38.803497314453125, "global_step": 158604, "epoch": 1310} {"train_loss": -40.976654052734375, "global_step": 158605, "epoch": 1310} {"train_loss": -40.30253219604492, "global_step": 158606, "epoch": 1310} {"train_loss": -40.97526168823242, "global_step": 158607, "epoch": 1310} {"train_loss": -41.136375427246094, "global_step": 158608, "epoch": 1310} {"train_loss": -40.92499923706055, "global_step": 158609, "epoch": 1310} {"train_loss": -40.62717819213867, "global_step": 158610, "epoch": 1310} {"train_loss": -40.781166076660156, "global_step": 158611, "epoch": 1310} {"train_loss": -39.27815628051758, "global_step": 158612, "epoch": 1310} {"train_loss": -40.232704162597656, "global_step": 158613, "epoch": 1310} {"train_loss": -41.3651008605957, "global_step": 158614, "epoch": 1310} {"train_loss": -40.37144088745117, "global_step": 158615, "epoch": 1310} {"train_loss": -40.8385009765625, "global_step": 158616, "epoch": 1310} {"train_loss": -40.86575698852539, "global_step": 158617, "epoch": 1310} {"train_loss": -40.52486801147461, "global_step": 158618, "epoch": 1310} {"train_loss": -40.86830139160156, "global_step": 158619, "epoch": 1310} {"train_loss": -39.29706954956055, "global_step": 158620, "epoch": 1310} {"train_loss": -39.87970733642578, "global_step": 158621, "epoch": 1310} {"train_loss": -40.67306137084961, "global_step": 158622, "epoch": 1310} {"train_loss": -38.71638870239258, "global_step": 158623, "epoch": 1310} {"train_loss": -40.0185432434082, "global_step": 158624, "epoch": 1310} {"train_loss": -39.54954528808594, "global_step": 158625, "epoch": 1310} {"train_loss": -36.28179931640625, "global_step": 158626, "epoch": 1310} {"train_loss": -37.903404235839844, "global_step": 158627, "epoch": 1310} {"train_loss": -38.60456848144531, "global_step": 158628, "epoch": 1310} {"train_loss": -40.79996871948242, "global_step": 158629, "epoch": 1310} {"train_loss": -39.51236857264495, "global_step": 158630, "epoch": 1310, "val_loss": 2690835.75} {"train_loss": -40.125423431396484, "global_step": 158631, "epoch": 1311} {"train_loss": -38.616912841796875, "global_step": 158632, "epoch": 1311} {"train_loss": -33.96155548095703, "global_step": 158633, "epoch": 1311} {"train_loss": -28.530363082885742, "global_step": 158634, "epoch": 1311} {"train_loss": -34.24980545043945, "global_step": 158635, "epoch": 1311} {"train_loss": -35.63957977294922, "global_step": 158636, "epoch": 1311} {"train_loss": -31.595203399658203, "global_step": 158637, "epoch": 1311} {"train_loss": -31.026884078979492, "global_step": 158638, "epoch": 1311} {"train_loss": -26.13260841369629, "global_step": 158639, "epoch": 1311} {"train_loss": -29.59438133239746, "global_step": 158640, "epoch": 1311} {"train_loss": -31.154455184936523, "global_step": 158641, "epoch": 1311} {"train_loss": -32.2547492980957, "global_step": 158642, "epoch": 1311} {"train_loss": -33.59429931640625, "global_step": 158643, "epoch": 1311} {"train_loss": -29.862396240234375, "global_step": 158644, "epoch": 1311} {"train_loss": -28.148578643798828, "global_step": 158645, "epoch": 1311} {"train_loss": -33.28464889526367, "global_step": 158646, "epoch": 1311} {"train_loss": -34.150638580322266, "global_step": 158647, "epoch": 1311} {"train_loss": -35.58980941772461, "global_step": 158648, "epoch": 1311} {"train_loss": -34.9328727722168, "global_step": 158649, "epoch": 1311} {"train_loss": -35.50773620605469, "global_step": 158650, "epoch": 1311} {"train_loss": -35.894107818603516, "global_step": 158651, "epoch": 1311} {"train_loss": -36.216068267822266, "global_step": 158652, "epoch": 1311} {"train_loss": -36.60335922241211, "global_step": 158653, "epoch": 1311} {"train_loss": -36.77717971801758, "global_step": 158654, "epoch": 1311} {"train_loss": -36.39946746826172, "global_step": 158655, "epoch": 1311} {"train_loss": -37.6612548828125, "global_step": 158656, "epoch": 1311} {"train_loss": -35.353389739990234, "global_step": 158657, "epoch": 1311} {"train_loss": -34.763301849365234, "global_step": 158658, "epoch": 1311} {"train_loss": -33.6128044128418, "global_step": 158659, "epoch": 1311} {"train_loss": -36.46706771850586, "global_step": 158660, "epoch": 1311} {"train_loss": -36.13444900512695, "global_step": 158661, "epoch": 1311} {"train_loss": -37.10883331298828, "global_step": 158662, "epoch": 1311} {"train_loss": -37.596168518066406, "global_step": 158663, "epoch": 1311} {"train_loss": -37.184539794921875, "global_step": 158664, "epoch": 1311} {"train_loss": -37.56910705566406, "global_step": 158665, "epoch": 1311} {"train_loss": -37.056514739990234, "global_step": 158666, "epoch": 1311} {"train_loss": -37.26766586303711, "global_step": 158667, "epoch": 1311} {"train_loss": -37.58194351196289, "global_step": 158668, "epoch": 1311} {"train_loss": -37.35251998901367, "global_step": 158669, "epoch": 1311} {"train_loss": -37.463470458984375, "global_step": 158670, "epoch": 1311} {"train_loss": -36.62970733642578, "global_step": 158671, "epoch": 1311} {"train_loss": -37.30715560913086, "global_step": 158672, "epoch": 1311} {"train_loss": -38.187103271484375, "global_step": 158673, "epoch": 1311} {"train_loss": -37.8092155456543, "global_step": 158674, "epoch": 1311} {"train_loss": -38.21760559082031, "global_step": 158675, "epoch": 1311} {"train_loss": -38.01068115234375, "global_step": 158676, "epoch": 1311} {"train_loss": -38.798683166503906, "global_step": 158677, "epoch": 1311} {"train_loss": -37.97223663330078, "global_step": 158678, "epoch": 1311} {"train_loss": -38.435142517089844, "global_step": 158679, "epoch": 1311} {"train_loss": -39.2996711730957, "global_step": 158680, "epoch": 1311} {"train_loss": -38.098201751708984, "global_step": 158681, "epoch": 1311} {"train_loss": -38.329139709472656, "global_step": 158682, "epoch": 1311} {"train_loss": -38.48922348022461, "global_step": 158683, "epoch": 1311} {"train_loss": -38.70428466796875, "global_step": 158684, "epoch": 1311} {"train_loss": -38.239444732666016, "global_step": 158685, "epoch": 1311} {"train_loss": -38.77129364013672, "global_step": 158686, "epoch": 1311} {"train_loss": -38.189125061035156, "global_step": 158687, "epoch": 1311} {"train_loss": -39.08272933959961, "global_step": 158688, "epoch": 1311} {"train_loss": -38.92219924926758, "global_step": 158689, "epoch": 1311} {"train_loss": -39.20247268676758, "global_step": 158690, "epoch": 1311} {"train_loss": -38.7804069519043, "global_step": 158691, "epoch": 1311} {"train_loss": -38.34251022338867, "global_step": 158692, "epoch": 1311} {"train_loss": -39.18164825439453, "global_step": 158693, "epoch": 1311} {"train_loss": -38.58225631713867, "global_step": 158694, "epoch": 1311} {"train_loss": -39.439937591552734, "global_step": 158695, "epoch": 1311} {"train_loss": -39.27754592895508, "global_step": 158696, "epoch": 1311} {"train_loss": -38.53004455566406, "global_step": 158697, "epoch": 1311} {"train_loss": -39.191619873046875, "global_step": 158698, "epoch": 1311} {"train_loss": -38.845558166503906, "global_step": 158699, "epoch": 1311} {"train_loss": -38.75690460205078, "global_step": 158700, "epoch": 1311} {"train_loss": -39.07352828979492, "global_step": 158701, "epoch": 1311} {"train_loss": -38.56667709350586, "global_step": 158702, "epoch": 1311} {"train_loss": -38.419952392578125, "global_step": 158703, "epoch": 1311} {"train_loss": -40.13953399658203, "global_step": 158704, "epoch": 1311} {"train_loss": -39.58531951904297, "global_step": 158705, "epoch": 1311} {"train_loss": -39.641136169433594, "global_step": 158706, "epoch": 1311} {"train_loss": -38.97908401489258, "global_step": 158707, "epoch": 1311} {"train_loss": -39.86360549926758, "global_step": 158708, "epoch": 1311} {"train_loss": -40.068077087402344, "global_step": 158709, "epoch": 1311} {"train_loss": -39.13435363769531, "global_step": 158710, "epoch": 1311} {"train_loss": -39.482391357421875, "global_step": 158711, "epoch": 1311} {"train_loss": -39.78730010986328, "global_step": 158712, "epoch": 1311} {"train_loss": -38.82212829589844, "global_step": 158713, "epoch": 1311} {"train_loss": -40.275733947753906, "global_step": 158714, "epoch": 1311} {"train_loss": -40.03120040893555, "global_step": 158715, "epoch": 1311} {"train_loss": -39.61264419555664, "global_step": 158716, "epoch": 1311} {"train_loss": -40.0376091003418, "global_step": 158717, "epoch": 1311} {"train_loss": -40.10116195678711, "global_step": 158718, "epoch": 1311} {"train_loss": -39.86471939086914, "global_step": 158719, "epoch": 1311} {"train_loss": -40.1414794921875, "global_step": 158720, "epoch": 1311} {"train_loss": -39.99507522583008, "global_step": 158721, "epoch": 1311} {"train_loss": -39.923439025878906, "global_step": 158722, "epoch": 1311} {"train_loss": -40.563087463378906, "global_step": 158723, "epoch": 1311} {"train_loss": -40.41985321044922, "global_step": 158724, "epoch": 1311} {"train_loss": -40.26505661010742, "global_step": 158725, "epoch": 1311} {"train_loss": -40.107051849365234, "global_step": 158726, "epoch": 1311} {"train_loss": -40.457000732421875, "global_step": 158727, "epoch": 1311} {"train_loss": -40.242706298828125, "global_step": 158728, "epoch": 1311} {"train_loss": -40.18442916870117, "global_step": 158729, "epoch": 1311} {"train_loss": -40.017425537109375, "global_step": 158730, "epoch": 1311} {"train_loss": -39.65309524536133, "global_step": 158731, "epoch": 1311} {"train_loss": -40.790191650390625, "global_step": 158732, "epoch": 1311} {"train_loss": -40.463111877441406, "global_step": 158733, "epoch": 1311} {"train_loss": -40.023677825927734, "global_step": 158734, "epoch": 1311} {"train_loss": -40.23615264892578, "global_step": 158735, "epoch": 1311} {"train_loss": -39.38283920288086, "global_step": 158736, "epoch": 1311} {"train_loss": -39.3968391418457, "global_step": 158737, "epoch": 1311} {"train_loss": -40.6729850769043, "global_step": 158738, "epoch": 1311} {"train_loss": -40.61455154418945, "global_step": 158739, "epoch": 1311} {"train_loss": -40.10044479370117, "global_step": 158740, "epoch": 1311} {"train_loss": -39.1634635925293, "global_step": 158741, "epoch": 1311} {"train_loss": -40.2469367980957, "global_step": 158742, "epoch": 1311} {"train_loss": -39.66340255737305, "global_step": 158743, "epoch": 1311} {"train_loss": -39.74987030029297, "global_step": 158744, "epoch": 1311} {"train_loss": -39.56909942626953, "global_step": 158745, "epoch": 1311} {"train_loss": -39.065589904785156, "global_step": 158746, "epoch": 1311} {"train_loss": -38.6518669128418, "global_step": 158747, "epoch": 1311} {"train_loss": -39.486427307128906, "global_step": 158748, "epoch": 1311} {"train_loss": -39.29490280151367, "global_step": 158749, "epoch": 1311} {"train_loss": -38.84748458862305, "global_step": 158750, "epoch": 1311} {"train_loss": -37.79694651769213, "global_step": 158751, "epoch": 1311, "val_loss": 2731057.0} {"train_loss": -38.5439453125, "global_step": 158752, "epoch": 1312} {"train_loss": -39.57816696166992, "global_step": 158753, "epoch": 1312} {"train_loss": -38.15523910522461, "global_step": 158754, "epoch": 1312} {"train_loss": -37.88262939453125, "global_step": 158755, "epoch": 1312} {"train_loss": -37.97394561767578, "global_step": 158756, "epoch": 1312} {"train_loss": -39.880645751953125, "global_step": 158757, "epoch": 1312} {"train_loss": -36.7688102722168, "global_step": 158758, "epoch": 1312} {"train_loss": -39.106502532958984, "global_step": 158759, "epoch": 1312} {"train_loss": -38.822601318359375, "global_step": 158760, "epoch": 1312} {"train_loss": -39.79690170288086, "global_step": 158761, "epoch": 1312} {"train_loss": -39.61083984375, "global_step": 158762, "epoch": 1312} {"train_loss": -39.09387969970703, "global_step": 158763, "epoch": 1312} {"train_loss": -39.6304931640625, "global_step": 158764, "epoch": 1312} {"train_loss": -39.66850662231445, "global_step": 158765, "epoch": 1312} {"train_loss": -39.74565887451172, "global_step": 158766, "epoch": 1312} {"train_loss": -38.95441818237305, "global_step": 158767, "epoch": 1312} {"train_loss": -39.82665252685547, "global_step": 158768, "epoch": 1312} {"train_loss": -39.09222412109375, "global_step": 158769, "epoch": 1312} {"train_loss": -38.593414306640625, "global_step": 158770, "epoch": 1312} {"train_loss": -39.45890426635742, "global_step": 158771, "epoch": 1312} {"train_loss": -39.7225341796875, "global_step": 158772, "epoch": 1312} {"train_loss": -39.3106575012207, "global_step": 158773, "epoch": 1312} {"train_loss": -38.51931381225586, "global_step": 158774, "epoch": 1312} {"train_loss": -38.705440521240234, "global_step": 158775, "epoch": 1312} {"train_loss": -40.21980667114258, "global_step": 158776, "epoch": 1312} {"train_loss": -36.54124069213867, "global_step": 158777, "epoch": 1312} {"train_loss": -37.6002082824707, "global_step": 158778, "epoch": 1312} {"train_loss": -39.23484420776367, "global_step": 158779, "epoch": 1312} {"train_loss": -37.73099899291992, "global_step": 158780, "epoch": 1312} {"train_loss": -38.60721969604492, "global_step": 158781, "epoch": 1312} {"train_loss": -40.00660705566406, "global_step": 158782, "epoch": 1312} {"train_loss": -38.15273666381836, "global_step": 158783, "epoch": 1312} {"train_loss": -38.44343185424805, "global_step": 158784, "epoch": 1312} {"train_loss": -39.736576080322266, "global_step": 158785, "epoch": 1312} {"train_loss": -37.79161834716797, "global_step": 158786, "epoch": 1312} {"train_loss": -40.08893966674805, "global_step": 158787, "epoch": 1312} {"train_loss": -38.2501106262207, "global_step": 158788, "epoch": 1312} {"train_loss": -39.37777328491211, "global_step": 158789, "epoch": 1312} {"train_loss": -39.1837043762207, "global_step": 158790, "epoch": 1312} {"train_loss": -39.6225700378418, "global_step": 158791, "epoch": 1312} {"train_loss": -39.4556999206543, "global_step": 158792, "epoch": 1312} {"train_loss": -39.027889251708984, "global_step": 158793, "epoch": 1312} {"train_loss": -38.674842834472656, "global_step": 158794, "epoch": 1312} {"train_loss": -40.072059631347656, "global_step": 158795, "epoch": 1312} {"train_loss": -39.5433235168457, "global_step": 158796, "epoch": 1312} {"train_loss": -38.14240264892578, "global_step": 158797, "epoch": 1312} {"train_loss": -40.94244384765625, "global_step": 158798, "epoch": 1312} {"train_loss": -40.21792984008789, "global_step": 158799, "epoch": 1312} {"train_loss": -40.2669563293457, "global_step": 158800, "epoch": 1312} {"train_loss": -40.17127227783203, "global_step": 158801, "epoch": 1312} {"train_loss": -39.062705993652344, "global_step": 158802, "epoch": 1312} {"train_loss": -40.138668060302734, "global_step": 158803, "epoch": 1312} {"train_loss": -41.3628044128418, "global_step": 158804, "epoch": 1312} {"train_loss": -40.20638656616211, "global_step": 158805, "epoch": 1312} {"train_loss": -39.628021240234375, "global_step": 158806, "epoch": 1312} {"train_loss": -40.29543685913086, "global_step": 158807, "epoch": 1312} {"train_loss": -40.135498046875, "global_step": 158808, "epoch": 1312} {"train_loss": -39.29787826538086, "global_step": 158809, "epoch": 1312} {"train_loss": -39.55854415893555, "global_step": 158810, "epoch": 1312} {"train_loss": -40.235713958740234, "global_step": 158811, "epoch": 1312} {"train_loss": -39.96586227416992, "global_step": 158812, "epoch": 1312} {"train_loss": -40.750274658203125, "global_step": 158813, "epoch": 1312} {"train_loss": -40.755897521972656, "global_step": 158814, "epoch": 1312} {"train_loss": -40.65149688720703, "global_step": 158815, "epoch": 1312} {"train_loss": -41.449466705322266, "global_step": 158816, "epoch": 1312} {"train_loss": -40.32352828979492, "global_step": 158817, "epoch": 1312} {"train_loss": -40.75156784057617, "global_step": 158818, "epoch": 1312} {"train_loss": -40.9869384765625, "global_step": 158819, "epoch": 1312} {"train_loss": -40.999855041503906, "global_step": 158820, "epoch": 1312} {"train_loss": -40.962764739990234, "global_step": 158821, "epoch": 1312} {"train_loss": -40.98848342895508, "global_step": 158822, "epoch": 1312} {"train_loss": -41.258846282958984, "global_step": 158823, "epoch": 1312} {"train_loss": -40.865570068359375, "global_step": 158824, "epoch": 1312} {"train_loss": -41.00880432128906, "global_step": 158825, "epoch": 1312} {"train_loss": -41.18665313720703, "global_step": 158826, "epoch": 1312} {"train_loss": -41.505523681640625, "global_step": 158827, "epoch": 1312} {"train_loss": -40.52294921875, "global_step": 158828, "epoch": 1312} {"train_loss": -41.330596923828125, "global_step": 158829, "epoch": 1312} {"train_loss": -41.289981842041016, "global_step": 158830, "epoch": 1312} {"train_loss": -40.262020111083984, "global_step": 158831, "epoch": 1312} {"train_loss": -40.545127868652344, "global_step": 158832, "epoch": 1312} {"train_loss": -40.40583038330078, "global_step": 158833, "epoch": 1312} {"train_loss": -39.59867858886719, "global_step": 158834, "epoch": 1312} {"train_loss": -40.598594665527344, "global_step": 158835, "epoch": 1312} {"train_loss": -39.970672607421875, "global_step": 158836, "epoch": 1312} {"train_loss": -40.37501907348633, "global_step": 158837, "epoch": 1312} {"train_loss": -40.726558685302734, "global_step": 158838, "epoch": 1312} {"train_loss": -40.547576904296875, "global_step": 158839, "epoch": 1312} {"train_loss": -40.413692474365234, "global_step": 158840, "epoch": 1312} {"train_loss": -39.998958587646484, "global_step": 158841, "epoch": 1312} {"train_loss": -39.288387298583984, "global_step": 158842, "epoch": 1312} {"train_loss": -40.63291549682617, "global_step": 158843, "epoch": 1312} {"train_loss": -40.10511016845703, "global_step": 158844, "epoch": 1312} {"train_loss": -40.586116790771484, "global_step": 158845, "epoch": 1312} {"train_loss": -40.47168731689453, "global_step": 158846, "epoch": 1312} {"train_loss": -39.74752426147461, "global_step": 158847, "epoch": 1312} {"train_loss": -40.435054779052734, "global_step": 158848, "epoch": 1312} {"train_loss": -39.60246658325195, "global_step": 158849, "epoch": 1312} {"train_loss": -40.599365234375, "global_step": 158850, "epoch": 1312} {"train_loss": -40.60609436035156, "global_step": 158851, "epoch": 1312} {"train_loss": -40.15760803222656, "global_step": 158852, "epoch": 1312} {"train_loss": -39.8486213684082, "global_step": 158853, "epoch": 1312} {"train_loss": -40.84977340698242, "global_step": 158854, "epoch": 1312} {"train_loss": -40.241859436035156, "global_step": 158855, "epoch": 1312} {"train_loss": -39.693641662597656, "global_step": 158856, "epoch": 1312} {"train_loss": -40.32099533081055, "global_step": 158857, "epoch": 1312} {"train_loss": -39.70182418823242, "global_step": 158858, "epoch": 1312} {"train_loss": -40.45844650268555, "global_step": 158859, "epoch": 1312} {"train_loss": -40.11518859863281, "global_step": 158860, "epoch": 1312} {"train_loss": -40.54816818237305, "global_step": 158861, "epoch": 1312} {"train_loss": -40.12192916870117, "global_step": 158862, "epoch": 1312} {"train_loss": -39.9243278503418, "global_step": 158863, "epoch": 1312} {"train_loss": -37.1089973449707, "global_step": 158864, "epoch": 1312} {"train_loss": -33.51365280151367, "global_step": 158865, "epoch": 1312} {"train_loss": -31.938678741455078, "global_step": 158866, "epoch": 1312} {"train_loss": -34.65375900268555, "global_step": 158867, "epoch": 1312} {"train_loss": -40.7855339050293, "global_step": 158868, "epoch": 1312} {"train_loss": -37.93639373779297, "global_step": 158869, "epoch": 1312} {"train_loss": -37.502197265625, "global_step": 158870, "epoch": 1312} {"train_loss": -38.89593505859375, "global_step": 158871, "epoch": 1312} {"train_loss": -39.583071180611604, "global_step": 158872, "epoch": 1312, "val_loss": 2627360.75} {"train_loss": -37.38705062866211, "global_step": 158873, "epoch": 1313} {"train_loss": -38.22092819213867, "global_step": 158874, "epoch": 1313} {"train_loss": -40.321022033691406, "global_step": 158875, "epoch": 1313} {"train_loss": -39.083656311035156, "global_step": 158876, "epoch": 1313} {"train_loss": -39.718284606933594, "global_step": 158877, "epoch": 1313} {"train_loss": -39.82706069946289, "global_step": 158878, "epoch": 1313} {"train_loss": -39.590576171875, "global_step": 158879, "epoch": 1313} {"train_loss": -39.96107864379883, "global_step": 158880, "epoch": 1313} {"train_loss": -39.555023193359375, "global_step": 158881, "epoch": 1313} {"train_loss": -39.77408218383789, "global_step": 158882, "epoch": 1313} {"train_loss": -40.4771728515625, "global_step": 158883, "epoch": 1313} {"train_loss": -39.83009719848633, "global_step": 158884, "epoch": 1313} {"train_loss": -39.915313720703125, "global_step": 158885, "epoch": 1313} {"train_loss": -39.19639587402344, "global_step": 158886, "epoch": 1313} {"train_loss": -39.5662841796875, "global_step": 158887, "epoch": 1313} {"train_loss": -39.99172592163086, "global_step": 158888, "epoch": 1313} {"train_loss": -40.07227325439453, "global_step": 158889, "epoch": 1313} {"train_loss": -40.611488342285156, "global_step": 158890, "epoch": 1313} {"train_loss": -39.94050216674805, "global_step": 158891, "epoch": 1313} {"train_loss": -40.1899299621582, "global_step": 158892, "epoch": 1313} {"train_loss": -39.37321090698242, "global_step": 158893, "epoch": 1313} {"train_loss": -40.42329025268555, "global_step": 158894, "epoch": 1313} {"train_loss": -40.564266204833984, "global_step": 158895, "epoch": 1313} {"train_loss": -40.68658447265625, "global_step": 158896, "epoch": 1313} {"train_loss": -40.87031173706055, "global_step": 158897, "epoch": 1313} {"train_loss": -40.94826126098633, "global_step": 158898, "epoch": 1313} {"train_loss": -40.49018478393555, "global_step": 158899, "epoch": 1313} {"train_loss": -41.01302719116211, "global_step": 158900, "epoch": 1313} {"train_loss": -40.72746658325195, "global_step": 158901, "epoch": 1313} {"train_loss": -41.06806564331055, "global_step": 158902, "epoch": 1313} {"train_loss": -40.52102279663086, "global_step": 158903, "epoch": 1313} {"train_loss": -40.80573654174805, "global_step": 158904, "epoch": 1313} {"train_loss": -40.17715835571289, "global_step": 158905, "epoch": 1313} {"train_loss": -41.22195053100586, "global_step": 158906, "epoch": 1313} {"train_loss": -40.868507385253906, "global_step": 158907, "epoch": 1313} {"train_loss": -40.63450622558594, "global_step": 158908, "epoch": 1313} {"train_loss": -40.277618408203125, "global_step": 158909, "epoch": 1313} {"train_loss": -41.01030731201172, "global_step": 158910, "epoch": 1313} {"train_loss": -40.9366569519043, "global_step": 158911, "epoch": 1313} {"train_loss": -41.1057014465332, "global_step": 158912, "epoch": 1313} {"train_loss": -40.43189239501953, "global_step": 158913, "epoch": 1313} {"train_loss": -40.58842086791992, "global_step": 158914, "epoch": 1313} {"train_loss": -41.3361930847168, "global_step": 158915, "epoch": 1313} {"train_loss": -40.985958099365234, "global_step": 158916, "epoch": 1313} {"train_loss": -40.81055450439453, "global_step": 158917, "epoch": 1313} {"train_loss": -41.3045539855957, "global_step": 158918, "epoch": 1313} {"train_loss": -41.318965911865234, "global_step": 158919, "epoch": 1313} {"train_loss": -40.96192169189453, "global_step": 158920, "epoch": 1313} {"train_loss": -40.592926025390625, "global_step": 158921, "epoch": 1313} {"train_loss": -41.431453704833984, "global_step": 158922, "epoch": 1313} {"train_loss": -41.05720520019531, "global_step": 158923, "epoch": 1313} {"train_loss": -41.22219467163086, "global_step": 158924, "epoch": 1313} {"train_loss": -41.557769775390625, "global_step": 158925, "epoch": 1313} {"train_loss": -41.023738861083984, "global_step": 158926, "epoch": 1313} {"train_loss": -41.4847526550293, "global_step": 158927, "epoch": 1313} {"train_loss": -41.10667037963867, "global_step": 158928, "epoch": 1313} {"train_loss": -41.3221321105957, "global_step": 158929, "epoch": 1313} {"train_loss": -41.03102493286133, "global_step": 158930, "epoch": 1313} {"train_loss": -41.68871307373047, "global_step": 158931, "epoch": 1313} {"train_loss": -41.493690490722656, "global_step": 158932, "epoch": 1313} {"train_loss": -41.24052429199219, "global_step": 158933, "epoch": 1313} {"train_loss": -41.03731918334961, "global_step": 158934, "epoch": 1313} {"train_loss": -40.977256774902344, "global_step": 158935, "epoch": 1313} {"train_loss": -40.175838470458984, "global_step": 158936, "epoch": 1313} {"train_loss": -39.900081634521484, "global_step": 158937, "epoch": 1313} {"train_loss": -39.571807861328125, "global_step": 158938, "epoch": 1313} {"train_loss": -39.1922721862793, "global_step": 158939, "epoch": 1313} {"train_loss": -40.30257797241211, "global_step": 158940, "epoch": 1313} {"train_loss": -41.15283966064453, "global_step": 158941, "epoch": 1313} {"train_loss": -41.26432800292969, "global_step": 158942, "epoch": 1313} {"train_loss": -38.04627227783203, "global_step": 158943, "epoch": 1313} {"train_loss": -35.966346740722656, "global_step": 158944, "epoch": 1313} {"train_loss": -36.7176628112793, "global_step": 158945, "epoch": 1313} {"train_loss": -41.089447021484375, "global_step": 158946, "epoch": 1313} {"train_loss": -40.09734344482422, "global_step": 158947, "epoch": 1313} {"train_loss": -38.810096740722656, "global_step": 158948, "epoch": 1313} {"train_loss": -37.294551849365234, "global_step": 158949, "epoch": 1313} {"train_loss": -37.1893196105957, "global_step": 158950, "epoch": 1313} {"train_loss": -35.659950256347656, "global_step": 158951, "epoch": 1313} {"train_loss": -40.27595520019531, "global_step": 158952, "epoch": 1313} {"train_loss": -38.59752655029297, "global_step": 158953, "epoch": 1313} {"train_loss": -34.055965423583984, "global_step": 158954, "epoch": 1313} {"train_loss": -37.929779052734375, "global_step": 158955, "epoch": 1313} {"train_loss": -39.315608978271484, "global_step": 158956, "epoch": 1313} {"train_loss": -37.308536529541016, "global_step": 158957, "epoch": 1313} {"train_loss": -39.33706283569336, "global_step": 158958, "epoch": 1313} {"train_loss": -38.7829704284668, "global_step": 158959, "epoch": 1313} {"train_loss": -37.723106384277344, "global_step": 158960, "epoch": 1313} {"train_loss": -39.88679885864258, "global_step": 158961, "epoch": 1313} {"train_loss": -37.521846771240234, "global_step": 158962, "epoch": 1313} {"train_loss": -39.561004638671875, "global_step": 158963, "epoch": 1313} {"train_loss": -37.54214096069336, "global_step": 158964, "epoch": 1313} {"train_loss": -38.66317367553711, "global_step": 158965, "epoch": 1313} {"train_loss": -38.512855529785156, "global_step": 158966, "epoch": 1313} {"train_loss": -39.527854919433594, "global_step": 158967, "epoch": 1313} {"train_loss": -39.45932388305664, "global_step": 158968, "epoch": 1313} {"train_loss": -39.62801742553711, "global_step": 158969, "epoch": 1313} {"train_loss": -38.87630844116211, "global_step": 158970, "epoch": 1313} {"train_loss": -39.219417572021484, "global_step": 158971, "epoch": 1313} {"train_loss": -39.134090423583984, "global_step": 158972, "epoch": 1313} {"train_loss": -39.43502426147461, "global_step": 158973, "epoch": 1313} {"train_loss": -39.472652435302734, "global_step": 158974, "epoch": 1313} {"train_loss": -38.16364669799805, "global_step": 158975, "epoch": 1313} {"train_loss": -38.35830307006836, "global_step": 158976, "epoch": 1313} {"train_loss": -40.19572448730469, "global_step": 158977, "epoch": 1313} {"train_loss": -38.86605453491211, "global_step": 158978, "epoch": 1313} {"train_loss": -40.100555419921875, "global_step": 158979, "epoch": 1313} {"train_loss": -39.69710922241211, "global_step": 158980, "epoch": 1313} {"train_loss": -37.29401779174805, "global_step": 158981, "epoch": 1313} {"train_loss": -39.758766174316406, "global_step": 158982, "epoch": 1313} {"train_loss": -36.82310485839844, "global_step": 158983, "epoch": 1313} {"train_loss": -40.640411376953125, "global_step": 158984, "epoch": 1313} {"train_loss": -38.358333587646484, "global_step": 158985, "epoch": 1313} {"train_loss": -39.578094482421875, "global_step": 158986, "epoch": 1313} {"train_loss": -40.314327239990234, "global_step": 158987, "epoch": 1313} {"train_loss": -38.8039665222168, "global_step": 158988, "epoch": 1313} {"train_loss": -39.74894332885742, "global_step": 158989, "epoch": 1313} {"train_loss": -41.02173614501953, "global_step": 158990, "epoch": 1313} {"train_loss": -38.494056701660156, "global_step": 158991, "epoch": 1313} {"train_loss": -40.71443176269531, "global_step": 158992, "epoch": 1313} {"train_loss": -39.76989251128898, "global_step": 158993, "epoch": 1313, "val_loss": 2669652.75} {"train_loss": -40.223812103271484, "global_step": 158994, "epoch": 1314} {"train_loss": -40.15875244140625, "global_step": 158995, "epoch": 1314} {"train_loss": -40.689022064208984, "global_step": 158996, "epoch": 1314} {"train_loss": -40.56466293334961, "global_step": 158997, "epoch": 1314} {"train_loss": -39.954071044921875, "global_step": 158998, "epoch": 1314} {"train_loss": -40.268218994140625, "global_step": 158999, "epoch": 1314} {"train_loss": -40.62904357910156, "global_step": 159000, "epoch": 1314} {"train_loss": -40.85482406616211, "global_step": 159001, "epoch": 1314} {"train_loss": -40.426815032958984, "global_step": 159002, "epoch": 1314} {"train_loss": -38.83452224731445, "global_step": 159003, "epoch": 1314} {"train_loss": -39.505821228027344, "global_step": 159004, "epoch": 1314} {"train_loss": -36.514251708984375, "global_step": 159005, "epoch": 1314} {"train_loss": -35.1512336730957, "global_step": 159006, "epoch": 1314} {"train_loss": -40.296138763427734, "global_step": 159007, "epoch": 1314} {"train_loss": -39.41413497924805, "global_step": 159008, "epoch": 1314} {"train_loss": -39.391414642333984, "global_step": 159009, "epoch": 1314} {"train_loss": -31.5492000579834, "global_step": 159010, "epoch": 1314} {"train_loss": -30.41849708557129, "global_step": 159011, "epoch": 1314} {"train_loss": -37.1586799621582, "global_step": 159012, "epoch": 1314} {"train_loss": -39.22930145263672, "global_step": 159013, "epoch": 1314} {"train_loss": -34.56752014160156, "global_step": 159014, "epoch": 1314} {"train_loss": -36.50136947631836, "global_step": 159015, "epoch": 1314} {"train_loss": -37.71383285522461, "global_step": 159016, "epoch": 1314} {"train_loss": -27.7419376373291, "global_step": 159017, "epoch": 1314} {"train_loss": -34.86356735229492, "global_step": 159018, "epoch": 1314} {"train_loss": -37.06290817260742, "global_step": 159019, "epoch": 1314} {"train_loss": -36.8101921081543, "global_step": 159020, "epoch": 1314} {"train_loss": -31.007537841796875, "global_step": 159021, "epoch": 1314} {"train_loss": -36.56837844848633, "global_step": 159022, "epoch": 1314} {"train_loss": -31.02088737487793, "global_step": 159023, "epoch": 1314} {"train_loss": -36.11894607543945, "global_step": 159024, "epoch": 1314} {"train_loss": -37.50910186767578, "global_step": 159025, "epoch": 1314} {"train_loss": -38.1950569152832, "global_step": 159026, "epoch": 1314} {"train_loss": -37.92770004272461, "global_step": 159027, "epoch": 1314} {"train_loss": -35.173004150390625, "global_step": 159028, "epoch": 1314} {"train_loss": -35.49375534057617, "global_step": 159029, "epoch": 1314} {"train_loss": -35.58655548095703, "global_step": 159030, "epoch": 1314} {"train_loss": -37.492584228515625, "global_step": 159031, "epoch": 1314} {"train_loss": -37.49773025512695, "global_step": 159032, "epoch": 1314} {"train_loss": -29.867460250854492, "global_step": 159033, "epoch": 1314} {"train_loss": -34.758235931396484, "global_step": 159034, "epoch": 1314} {"train_loss": -36.699607849121094, "global_step": 159035, "epoch": 1314} {"train_loss": -35.495704650878906, "global_step": 159036, "epoch": 1314} {"train_loss": -35.844825744628906, "global_step": 159037, "epoch": 1314} {"train_loss": -36.39323043823242, "global_step": 159038, "epoch": 1314} {"train_loss": -36.693904876708984, "global_step": 159039, "epoch": 1314} {"train_loss": -37.45469665527344, "global_step": 159040, "epoch": 1314} {"train_loss": -38.66353988647461, "global_step": 159041, "epoch": 1314} {"train_loss": -38.58071517944336, "global_step": 159042, "epoch": 1314} {"train_loss": -38.39109420776367, "global_step": 159043, "epoch": 1314} {"train_loss": -38.29997634887695, "global_step": 159044, "epoch": 1314} {"train_loss": -37.73165512084961, "global_step": 159045, "epoch": 1314} {"train_loss": -39.00539779663086, "global_step": 159046, "epoch": 1314} {"train_loss": -38.546546936035156, "global_step": 159047, "epoch": 1314} {"train_loss": -38.22160720825195, "global_step": 159048, "epoch": 1314} {"train_loss": -38.76235580444336, "global_step": 159049, "epoch": 1314} {"train_loss": -38.80851745605469, "global_step": 159050, "epoch": 1314} {"train_loss": -38.293758392333984, "global_step": 159051, "epoch": 1314} {"train_loss": -38.920135498046875, "global_step": 159052, "epoch": 1314} {"train_loss": -38.757720947265625, "global_step": 159053, "epoch": 1314} {"train_loss": -36.70866775512695, "global_step": 159054, "epoch": 1314} {"train_loss": -37.48173904418945, "global_step": 159055, "epoch": 1314} {"train_loss": -39.415401458740234, "global_step": 159056, "epoch": 1314} {"train_loss": -38.077369689941406, "global_step": 159057, "epoch": 1314} {"train_loss": -37.943172454833984, "global_step": 159058, "epoch": 1314} {"train_loss": -38.97479248046875, "global_step": 159059, "epoch": 1314} {"train_loss": -39.799041748046875, "global_step": 159060, "epoch": 1314} {"train_loss": -38.94673538208008, "global_step": 159061, "epoch": 1314} {"train_loss": -39.380706787109375, "global_step": 159062, "epoch": 1314} {"train_loss": -38.54768753051758, "global_step": 159063, "epoch": 1314} {"train_loss": -39.433589935302734, "global_step": 159064, "epoch": 1314} {"train_loss": -39.09543991088867, "global_step": 159065, "epoch": 1314} {"train_loss": -39.35984802246094, "global_step": 159066, "epoch": 1314} {"train_loss": -40.05043029785156, "global_step": 159067, "epoch": 1314} {"train_loss": -37.977027893066406, "global_step": 159068, "epoch": 1314} {"train_loss": -40.01978302001953, "global_step": 159069, "epoch": 1314} {"train_loss": -40.14552688598633, "global_step": 159070, "epoch": 1314} {"train_loss": -39.88013458251953, "global_step": 159071, "epoch": 1314} {"train_loss": -38.75174331665039, "global_step": 159072, "epoch": 1314} {"train_loss": -39.27989959716797, "global_step": 159073, "epoch": 1314} {"train_loss": -39.81230163574219, "global_step": 159074, "epoch": 1314} {"train_loss": -38.8431282043457, "global_step": 159075, "epoch": 1314} {"train_loss": -39.78386306762695, "global_step": 159076, "epoch": 1314} {"train_loss": -40.33170700073242, "global_step": 159077, "epoch": 1314} {"train_loss": -39.83112716674805, "global_step": 159078, "epoch": 1314} {"train_loss": -40.472530364990234, "global_step": 159079, "epoch": 1314} {"train_loss": -39.90261459350586, "global_step": 159080, "epoch": 1314} {"train_loss": -40.39676284790039, "global_step": 159081, "epoch": 1314} {"train_loss": -40.04458999633789, "global_step": 159082, "epoch": 1314} {"train_loss": -40.38145065307617, "global_step": 159083, "epoch": 1314} {"train_loss": -38.87972640991211, "global_step": 159084, "epoch": 1314} {"train_loss": -40.16203689575195, "global_step": 159085, "epoch": 1314} {"train_loss": -40.07039260864258, "global_step": 159086, "epoch": 1314} {"train_loss": -40.35708236694336, "global_step": 159087, "epoch": 1314} {"train_loss": -40.018524169921875, "global_step": 159088, "epoch": 1314} {"train_loss": -40.55868911743164, "global_step": 159089, "epoch": 1314} {"train_loss": -40.2193603515625, "global_step": 159090, "epoch": 1314} {"train_loss": -40.15023422241211, "global_step": 159091, "epoch": 1314} {"train_loss": -40.61843490600586, "global_step": 159092, "epoch": 1314} {"train_loss": -40.50202941894531, "global_step": 159093, "epoch": 1314} {"train_loss": -40.47541427612305, "global_step": 159094, "epoch": 1314} {"train_loss": -40.64174270629883, "global_step": 159095, "epoch": 1314} {"train_loss": -40.654205322265625, "global_step": 159096, "epoch": 1314} {"train_loss": -39.89093780517578, "global_step": 159097, "epoch": 1314} {"train_loss": -40.6551513671875, "global_step": 159098, "epoch": 1314} {"train_loss": -40.028114318847656, "global_step": 159099, "epoch": 1314} {"train_loss": -40.764034271240234, "global_step": 159100, "epoch": 1314} {"train_loss": -40.53163146972656, "global_step": 159101, "epoch": 1314} {"train_loss": -40.58784866333008, "global_step": 159102, "epoch": 1314} {"train_loss": -40.78544235229492, "global_step": 159103, "epoch": 1314} {"train_loss": -40.181270599365234, "global_step": 159104, "epoch": 1314} {"train_loss": -40.487648010253906, "global_step": 159105, "epoch": 1314} {"train_loss": -40.64952087402344, "global_step": 159106, "epoch": 1314} {"train_loss": -40.86627960205078, "global_step": 159107, "epoch": 1314} {"train_loss": -40.73167037963867, "global_step": 159108, "epoch": 1314} {"train_loss": -39.90805435180664, "global_step": 159109, "epoch": 1314} {"train_loss": -40.18788528442383, "global_step": 159110, "epoch": 1314} {"train_loss": -38.67660140991211, "global_step": 159111, "epoch": 1314} {"train_loss": -37.11906051635742, "global_step": 159112, "epoch": 1314} {"train_loss": -38.10722732543945, "global_step": 159113, "epoch": 1314} {"train_loss": -38.44107672005646, "global_step": 159114, "epoch": 1314, "val_loss": 2696692.25} {"train_loss": -38.20798873901367, "global_step": 159115, "epoch": 1315} {"train_loss": -40.41098403930664, "global_step": 159116, "epoch": 1315} {"train_loss": -40.241920471191406, "global_step": 159117, "epoch": 1315} {"train_loss": -39.78517532348633, "global_step": 159118, "epoch": 1315} {"train_loss": -40.3353385925293, "global_step": 159119, "epoch": 1315} {"train_loss": -39.903568267822266, "global_step": 159120, "epoch": 1315} {"train_loss": -37.3151969909668, "global_step": 159121, "epoch": 1315} {"train_loss": -37.77456283569336, "global_step": 159122, "epoch": 1315} {"train_loss": -39.62253189086914, "global_step": 159123, "epoch": 1315} {"train_loss": -38.0610466003418, "global_step": 159124, "epoch": 1315} {"train_loss": -36.70923614501953, "global_step": 159125, "epoch": 1315} {"train_loss": -36.34585952758789, "global_step": 159126, "epoch": 1315} {"train_loss": -39.56562423706055, "global_step": 159127, "epoch": 1315} {"train_loss": -37.287330627441406, "global_step": 159128, "epoch": 1315} {"train_loss": -37.64607620239258, "global_step": 159129, "epoch": 1315} {"train_loss": -39.81374740600586, "global_step": 159130, "epoch": 1315} {"train_loss": -39.08220291137695, "global_step": 159131, "epoch": 1315} {"train_loss": -38.68726348876953, "global_step": 159132, "epoch": 1315} {"train_loss": -39.98344802856445, "global_step": 159133, "epoch": 1315} {"train_loss": -39.391117095947266, "global_step": 159134, "epoch": 1315} {"train_loss": -40.058475494384766, "global_step": 159135, "epoch": 1315} {"train_loss": -39.677101135253906, "global_step": 159136, "epoch": 1315} {"train_loss": -39.84112548828125, "global_step": 159137, "epoch": 1315} {"train_loss": -40.035308837890625, "global_step": 159138, "epoch": 1315} {"train_loss": -40.0839729309082, "global_step": 159139, "epoch": 1315} {"train_loss": -40.32084655761719, "global_step": 159140, "epoch": 1315} {"train_loss": -39.107948303222656, "global_step": 159141, "epoch": 1315} {"train_loss": -40.434906005859375, "global_step": 159142, "epoch": 1315} {"train_loss": -39.16792678833008, "global_step": 159143, "epoch": 1315} {"train_loss": -40.0617790222168, "global_step": 159144, "epoch": 1315} {"train_loss": -38.37330627441406, "global_step": 159145, "epoch": 1315} {"train_loss": -40.505897521972656, "global_step": 159146, "epoch": 1315} {"train_loss": -40.12324142456055, "global_step": 159147, "epoch": 1315} {"train_loss": -40.215919494628906, "global_step": 159148, "epoch": 1315} {"train_loss": -40.65156936645508, "global_step": 159149, "epoch": 1315} {"train_loss": -40.191619873046875, "global_step": 159150, "epoch": 1315} {"train_loss": -40.227108001708984, "global_step": 159151, "epoch": 1315} {"train_loss": -40.47758102416992, "global_step": 159152, "epoch": 1315} {"train_loss": -40.76609802246094, "global_step": 159153, "epoch": 1315} {"train_loss": -40.43656539916992, "global_step": 159154, "epoch": 1315} {"train_loss": -39.85456466674805, "global_step": 159155, "epoch": 1315} {"train_loss": -40.482208251953125, "global_step": 159156, "epoch": 1315} {"train_loss": -40.47916793823242, "global_step": 159157, "epoch": 1315} {"train_loss": -39.89784622192383, "global_step": 159158, "epoch": 1315} {"train_loss": -36.82294464111328, "global_step": 159159, "epoch": 1315} {"train_loss": -33.723968505859375, "global_step": 159160, "epoch": 1315} {"train_loss": -27.098651885986328, "global_step": 159161, "epoch": 1315} {"train_loss": -23.57577896118164, "global_step": 159162, "epoch": 1315} {"train_loss": -27.3917236328125, "global_step": 159163, "epoch": 1315} {"train_loss": -38.338706970214844, "global_step": 159164, "epoch": 1315} {"train_loss": -21.024301528930664, "global_step": 159165, "epoch": 1315} {"train_loss": -28.275033950805664, "global_step": 159166, "epoch": 1315} {"train_loss": -6.397677898406982, "global_step": 159167, "epoch": 1315} {"train_loss": -35.22307205200195, "global_step": 159168, "epoch": 1315} {"train_loss": -0.04873504862189293, "global_step": 159169, "epoch": 1315} {"train_loss": -36.473609924316406, "global_step": 159170, "epoch": 1315} {"train_loss": -13.397006034851074, "global_step": 159171, "epoch": 1315} {"train_loss": -36.548095703125, "global_step": 159172, "epoch": 1315} {"train_loss": -23.884113311767578, "global_step": 159173, "epoch": 1315} {"train_loss": -28.390308380126953, "global_step": 159174, "epoch": 1315} {"train_loss": -37.544036865234375, "global_step": 159175, "epoch": 1315} {"train_loss": -27.902021408081055, "global_step": 159176, "epoch": 1315} {"train_loss": -31.5129337310791, "global_step": 159177, "epoch": 1315} {"train_loss": -36.50432205200195, "global_step": 159178, "epoch": 1315} {"train_loss": -33.05401611328125, "global_step": 159179, "epoch": 1315} {"train_loss": -31.61419677734375, "global_step": 159180, "epoch": 1315} {"train_loss": -37.551513671875, "global_step": 159181, "epoch": 1315} {"train_loss": -37.4135856628418, "global_step": 159182, "epoch": 1315} {"train_loss": -34.48920440673828, "global_step": 159183, "epoch": 1315} {"train_loss": -35.1866569519043, "global_step": 159184, "epoch": 1315} {"train_loss": -37.90415573120117, "global_step": 159185, "epoch": 1315} {"train_loss": -37.52033233642578, "global_step": 159186, "epoch": 1315} {"train_loss": -36.794979095458984, "global_step": 159187, "epoch": 1315} {"train_loss": -36.18094253540039, "global_step": 159188, "epoch": 1315} {"train_loss": -37.339454650878906, "global_step": 159189, "epoch": 1315} {"train_loss": -36.95064163208008, "global_step": 159190, "epoch": 1315} {"train_loss": -37.559051513671875, "global_step": 159191, "epoch": 1315} {"train_loss": -36.85076904296875, "global_step": 159192, "epoch": 1315} {"train_loss": -37.58591842651367, "global_step": 159193, "epoch": 1315} {"train_loss": -38.40565490722656, "global_step": 159194, "epoch": 1315} {"train_loss": -38.6384391784668, "global_step": 159195, "epoch": 1315} {"train_loss": -37.7535400390625, "global_step": 159196, "epoch": 1315} {"train_loss": -38.2440185546875, "global_step": 159197, "epoch": 1315} {"train_loss": -37.978843688964844, "global_step": 159198, "epoch": 1315} {"train_loss": -38.550994873046875, "global_step": 159199, "epoch": 1315} {"train_loss": -38.69271469116211, "global_step": 159200, "epoch": 1315} {"train_loss": -38.68351364135742, "global_step": 159201, "epoch": 1315} {"train_loss": -38.700042724609375, "global_step": 159202, "epoch": 1315} {"train_loss": -38.373626708984375, "global_step": 159203, "epoch": 1315} {"train_loss": -38.81339645385742, "global_step": 159204, "epoch": 1315} {"train_loss": -38.46786117553711, "global_step": 159205, "epoch": 1315} {"train_loss": -38.424861907958984, "global_step": 159206, "epoch": 1315} {"train_loss": -38.93337631225586, "global_step": 159207, "epoch": 1315} {"train_loss": -38.696651458740234, "global_step": 159208, "epoch": 1315} {"train_loss": -39.0925178527832, "global_step": 159209, "epoch": 1315} {"train_loss": -38.86983108520508, "global_step": 159210, "epoch": 1315} {"train_loss": -39.30648422241211, "global_step": 159211, "epoch": 1315} {"train_loss": -39.36288833618164, "global_step": 159212, "epoch": 1315} {"train_loss": -39.040462493896484, "global_step": 159213, "epoch": 1315} {"train_loss": -39.16328430175781, "global_step": 159214, "epoch": 1315} {"train_loss": -39.53430938720703, "global_step": 159215, "epoch": 1315} {"train_loss": -39.73982620239258, "global_step": 159216, "epoch": 1315} {"train_loss": -39.497493743896484, "global_step": 159217, "epoch": 1315} {"train_loss": -39.26149368286133, "global_step": 159218, "epoch": 1315} {"train_loss": -38.965694427490234, "global_step": 159219, "epoch": 1315} {"train_loss": -39.66630172729492, "global_step": 159220, "epoch": 1315} {"train_loss": -39.80808639526367, "global_step": 159221, "epoch": 1315} {"train_loss": -39.702430725097656, "global_step": 159222, "epoch": 1315} {"train_loss": -39.748077392578125, "global_step": 159223, "epoch": 1315} {"train_loss": -40.096778869628906, "global_step": 159224, "epoch": 1315} {"train_loss": -39.606563568115234, "global_step": 159225, "epoch": 1315} {"train_loss": -39.5980110168457, "global_step": 159226, "epoch": 1315} {"train_loss": -39.278839111328125, "global_step": 159227, "epoch": 1315} {"train_loss": -39.8570442199707, "global_step": 159228, "epoch": 1315} {"train_loss": -39.89710235595703, "global_step": 159229, "epoch": 1315} {"train_loss": -39.84546661376953, "global_step": 159230, "epoch": 1315} {"train_loss": -40.1094970703125, "global_step": 159231, "epoch": 1315} {"train_loss": -40.151371002197266, "global_step": 159232, "epoch": 1315} {"train_loss": -40.15519332885742, "global_step": 159233, "epoch": 1315} {"train_loss": -39.3122444152832, "global_step": 159234, "epoch": 1315} {"train_loss": -37.00234068643825, "global_step": 159235, "epoch": 1315, "val_loss": 2579772.75} {"train_loss": -39.88698196411133, "global_step": 159236, "epoch": 1316} {"train_loss": -40.16841506958008, "global_step": 159237, "epoch": 1316} {"train_loss": -40.410518646240234, "global_step": 159238, "epoch": 1316} {"train_loss": -40.2425651550293, "global_step": 159239, "epoch": 1316} {"train_loss": -40.27916717529297, "global_step": 159240, "epoch": 1316} {"train_loss": -40.3759765625, "global_step": 159241, "epoch": 1316} {"train_loss": -40.259761810302734, "global_step": 159242, "epoch": 1316} {"train_loss": -40.16476058959961, "global_step": 159243, "epoch": 1316} {"train_loss": -40.5888557434082, "global_step": 159244, "epoch": 1316} {"train_loss": -40.36579513549805, "global_step": 159245, "epoch": 1316} {"train_loss": -40.693511962890625, "global_step": 159246, "epoch": 1316} {"train_loss": -39.72312545776367, "global_step": 159247, "epoch": 1316} {"train_loss": -40.85871505737305, "global_step": 159248, "epoch": 1316} {"train_loss": -39.963619232177734, "global_step": 159249, "epoch": 1316} {"train_loss": -40.58344650268555, "global_step": 159250, "epoch": 1316} {"train_loss": -40.25860595703125, "global_step": 159251, "epoch": 1316} {"train_loss": -40.521636962890625, "global_step": 159252, "epoch": 1316} {"train_loss": -40.758827209472656, "global_step": 159253, "epoch": 1316} {"train_loss": -40.35586929321289, "global_step": 159254, "epoch": 1316} {"train_loss": -40.92281723022461, "global_step": 159255, "epoch": 1316} {"train_loss": -41.03383255004883, "global_step": 159256, "epoch": 1316} {"train_loss": -40.868099212646484, "global_step": 159257, "epoch": 1316} {"train_loss": -40.9710578918457, "global_step": 159258, "epoch": 1316} {"train_loss": -40.7203483581543, "global_step": 159259, "epoch": 1316} {"train_loss": -40.417415618896484, "global_step": 159260, "epoch": 1316} {"train_loss": -40.92621612548828, "global_step": 159261, "epoch": 1316} {"train_loss": -41.13618087768555, "global_step": 159262, "epoch": 1316} {"train_loss": -40.97846221923828, "global_step": 159263, "epoch": 1316} {"train_loss": -41.33956527709961, "global_step": 159264, "epoch": 1316} {"train_loss": -39.75145721435547, "global_step": 159265, "epoch": 1316} {"train_loss": -40.814170837402344, "global_step": 159266, "epoch": 1316} {"train_loss": -40.86468505859375, "global_step": 159267, "epoch": 1316} {"train_loss": -40.760128021240234, "global_step": 159268, "epoch": 1316} {"train_loss": -40.69357681274414, "global_step": 159269, "epoch": 1316} {"train_loss": -40.87630081176758, "global_step": 159270, "epoch": 1316} {"train_loss": -40.928749084472656, "global_step": 159271, "epoch": 1316} {"train_loss": -40.79698944091797, "global_step": 159272, "epoch": 1316} {"train_loss": -40.806251525878906, "global_step": 159273, "epoch": 1316} {"train_loss": -41.11444091796875, "global_step": 159274, "epoch": 1316} {"train_loss": -40.65346908569336, "global_step": 159275, "epoch": 1316} {"train_loss": -40.67148971557617, "global_step": 159276, "epoch": 1316} {"train_loss": -41.210262298583984, "global_step": 159277, "epoch": 1316} {"train_loss": -41.13922882080078, "global_step": 159278, "epoch": 1316} {"train_loss": -40.885311126708984, "global_step": 159279, "epoch": 1316} {"train_loss": -41.1124382019043, "global_step": 159280, "epoch": 1316} {"train_loss": -39.742713928222656, "global_step": 159281, "epoch": 1316} {"train_loss": -40.38972854614258, "global_step": 159282, "epoch": 1316} {"train_loss": -39.999237060546875, "global_step": 159283, "epoch": 1316} {"train_loss": -40.421302795410156, "global_step": 159284, "epoch": 1316} {"train_loss": -40.896541595458984, "global_step": 159285, "epoch": 1316} {"train_loss": -40.80770492553711, "global_step": 159286, "epoch": 1316} {"train_loss": -40.475521087646484, "global_step": 159287, "epoch": 1316} {"train_loss": -40.10027313232422, "global_step": 159288, "epoch": 1316} {"train_loss": -40.1290283203125, "global_step": 159289, "epoch": 1316} {"train_loss": -40.47282028198242, "global_step": 159290, "epoch": 1316} {"train_loss": -40.165992736816406, "global_step": 159291, "epoch": 1316} {"train_loss": -40.169307708740234, "global_step": 159292, "epoch": 1316} {"train_loss": -40.97160720825195, "global_step": 159293, "epoch": 1316} {"train_loss": -40.143585205078125, "global_step": 159294, "epoch": 1316} {"train_loss": -40.50014877319336, "global_step": 159295, "epoch": 1316} {"train_loss": -40.659767150878906, "global_step": 159296, "epoch": 1316} {"train_loss": -40.61270523071289, "global_step": 159297, "epoch": 1316} {"train_loss": -40.52946090698242, "global_step": 159298, "epoch": 1316} {"train_loss": -40.43387985229492, "global_step": 159299, "epoch": 1316} {"train_loss": -40.96310043334961, "global_step": 159300, "epoch": 1316} {"train_loss": -40.818756103515625, "global_step": 159301, "epoch": 1316} {"train_loss": -40.49717330932617, "global_step": 159302, "epoch": 1316} {"train_loss": -39.4012451171875, "global_step": 159303, "epoch": 1316} {"train_loss": -39.93933868408203, "global_step": 159304, "epoch": 1316} {"train_loss": -38.9385986328125, "global_step": 159305, "epoch": 1316} {"train_loss": -40.56974411010742, "global_step": 159306, "epoch": 1316} {"train_loss": -39.8564338684082, "global_step": 159307, "epoch": 1316} {"train_loss": -40.22688674926758, "global_step": 159308, "epoch": 1316} {"train_loss": -40.460601806640625, "global_step": 159309, "epoch": 1316} {"train_loss": -39.54458236694336, "global_step": 159310, "epoch": 1316} {"train_loss": -39.633174896240234, "global_step": 159311, "epoch": 1316} {"train_loss": -40.345787048339844, "global_step": 159312, "epoch": 1316} {"train_loss": -40.6812629699707, "global_step": 159313, "epoch": 1316} {"train_loss": -39.957977294921875, "global_step": 159314, "epoch": 1316} {"train_loss": -40.09431076049805, "global_step": 159315, "epoch": 1316} {"train_loss": -39.834266662597656, "global_step": 159316, "epoch": 1316} {"train_loss": -38.12347412109375, "global_step": 159317, "epoch": 1316} {"train_loss": -40.62598419189453, "global_step": 159318, "epoch": 1316} {"train_loss": -40.37998580932617, "global_step": 159319, "epoch": 1316} {"train_loss": -39.75760269165039, "global_step": 159320, "epoch": 1316} {"train_loss": -36.66781234741211, "global_step": 159321, "epoch": 1316} {"train_loss": -37.68466567993164, "global_step": 159322, "epoch": 1316} {"train_loss": -36.90861511230469, "global_step": 159323, "epoch": 1316} {"train_loss": -39.2810173034668, "global_step": 159324, "epoch": 1316} {"train_loss": -35.4478759765625, "global_step": 159325, "epoch": 1316} {"train_loss": -34.74971008300781, "global_step": 159326, "epoch": 1316} {"train_loss": -38.453128814697266, "global_step": 159327, "epoch": 1316} {"train_loss": -35.75026321411133, "global_step": 159328, "epoch": 1316} {"train_loss": -37.758819580078125, "global_step": 159329, "epoch": 1316} {"train_loss": -36.14314651489258, "global_step": 159330, "epoch": 1316} {"train_loss": -37.11812973022461, "global_step": 159331, "epoch": 1316} {"train_loss": -35.61848068237305, "global_step": 159332, "epoch": 1316} {"train_loss": -36.60084915161133, "global_step": 159333, "epoch": 1316} {"train_loss": -37.24007034301758, "global_step": 159334, "epoch": 1316} {"train_loss": -33.39829635620117, "global_step": 159335, "epoch": 1316} {"train_loss": -36.95821762084961, "global_step": 159336, "epoch": 1316} {"train_loss": -38.56171417236328, "global_step": 159337, "epoch": 1316} {"train_loss": -37.90855407714844, "global_step": 159338, "epoch": 1316} {"train_loss": -35.74991989135742, "global_step": 159339, "epoch": 1316} {"train_loss": -37.871334075927734, "global_step": 159340, "epoch": 1316} {"train_loss": -37.9774284362793, "global_step": 159341, "epoch": 1316} {"train_loss": -35.790855407714844, "global_step": 159342, "epoch": 1316} {"train_loss": -38.404449462890625, "global_step": 159343, "epoch": 1316} {"train_loss": -35.87958526611328, "global_step": 159344, "epoch": 1316} {"train_loss": -38.5575065612793, "global_step": 159345, "epoch": 1316} {"train_loss": -39.387542724609375, "global_step": 159346, "epoch": 1316} {"train_loss": -37.6245231628418, "global_step": 159347, "epoch": 1316} {"train_loss": -39.1076545715332, "global_step": 159348, "epoch": 1316} {"train_loss": -36.9064826965332, "global_step": 159349, "epoch": 1316} {"train_loss": -37.772666931152344, "global_step": 159350, "epoch": 1316} {"train_loss": -35.439083099365234, "global_step": 159351, "epoch": 1316} {"train_loss": -38.2205924987793, "global_step": 159352, "epoch": 1316} {"train_loss": -38.216156005859375, "global_step": 159353, "epoch": 1316} {"train_loss": -37.838531494140625, "global_step": 159354, "epoch": 1316} {"train_loss": -36.7766227722168, "global_step": 159355, "epoch": 1316} {"train_loss": -39.47913647486158, "global_step": 159356, "epoch": 1316, "val_loss": 2697607.5} {"train_loss": -39.40178680419922, "global_step": 159357, "epoch": 1317} {"train_loss": -39.37702178955078, "global_step": 159358, "epoch": 1317} {"train_loss": -40.039241790771484, "global_step": 159359, "epoch": 1317} {"train_loss": -38.09572219848633, "global_step": 159360, "epoch": 1317} {"train_loss": -39.2203369140625, "global_step": 159361, "epoch": 1317} {"train_loss": -39.49259567260742, "global_step": 159362, "epoch": 1317} {"train_loss": -39.39376449584961, "global_step": 159363, "epoch": 1317} {"train_loss": -39.543731689453125, "global_step": 159364, "epoch": 1317} {"train_loss": -39.92632293701172, "global_step": 159365, "epoch": 1317} {"train_loss": -39.838619232177734, "global_step": 159366, "epoch": 1317} {"train_loss": -39.965450286865234, "global_step": 159367, "epoch": 1317} {"train_loss": -39.7242317199707, "global_step": 159368, "epoch": 1317} {"train_loss": -38.70846939086914, "global_step": 159369, "epoch": 1317} {"train_loss": -39.44793701171875, "global_step": 159370, "epoch": 1317} {"train_loss": -38.18474197387695, "global_step": 159371, "epoch": 1317} {"train_loss": -39.77385330200195, "global_step": 159372, "epoch": 1317} {"train_loss": -39.46021270751953, "global_step": 159373, "epoch": 1317} {"train_loss": -38.09504318237305, "global_step": 159374, "epoch": 1317} {"train_loss": -39.55879592895508, "global_step": 159375, "epoch": 1317} {"train_loss": -39.98238754272461, "global_step": 159376, "epoch": 1317} {"train_loss": -39.53269577026367, "global_step": 159377, "epoch": 1317} {"train_loss": -40.16901779174805, "global_step": 159378, "epoch": 1317} {"train_loss": -39.4575309753418, "global_step": 159379, "epoch": 1317} {"train_loss": -40.06623458862305, "global_step": 159380, "epoch": 1317} {"train_loss": -37.75185775756836, "global_step": 159381, "epoch": 1317} {"train_loss": -40.018646240234375, "global_step": 159382, "epoch": 1317} {"train_loss": -39.08719253540039, "global_step": 159383, "epoch": 1317} {"train_loss": -40.484676361083984, "global_step": 159384, "epoch": 1317} {"train_loss": -39.86558151245117, "global_step": 159385, "epoch": 1317} {"train_loss": -39.839290618896484, "global_step": 159386, "epoch": 1317} {"train_loss": -40.37614059448242, "global_step": 159387, "epoch": 1317} {"train_loss": -40.01917266845703, "global_step": 159388, "epoch": 1317} {"train_loss": -40.54859161376953, "global_step": 159389, "epoch": 1317} {"train_loss": -40.67144775390625, "global_step": 159390, "epoch": 1317} {"train_loss": -39.535484313964844, "global_step": 159391, "epoch": 1317} {"train_loss": -38.17231369018555, "global_step": 159392, "epoch": 1317} {"train_loss": -40.06473922729492, "global_step": 159393, "epoch": 1317} {"train_loss": -37.24709701538086, "global_step": 159394, "epoch": 1317} {"train_loss": -39.93937683105469, "global_step": 159395, "epoch": 1317} {"train_loss": -40.71202087402344, "global_step": 159396, "epoch": 1317} {"train_loss": -40.4052619934082, "global_step": 159397, "epoch": 1317} {"train_loss": -40.329681396484375, "global_step": 159398, "epoch": 1317} {"train_loss": -39.42298126220703, "global_step": 159399, "epoch": 1317} {"train_loss": -39.752532958984375, "global_step": 159400, "epoch": 1317} {"train_loss": -40.261085510253906, "global_step": 159401, "epoch": 1317} {"train_loss": -40.17393112182617, "global_step": 159402, "epoch": 1317} {"train_loss": -40.718544006347656, "global_step": 159403, "epoch": 1317} {"train_loss": -39.607173919677734, "global_step": 159404, "epoch": 1317} {"train_loss": -39.87564468383789, "global_step": 159405, "epoch": 1317} {"train_loss": -39.10659408569336, "global_step": 159406, "epoch": 1317} {"train_loss": -40.66605758666992, "global_step": 159407, "epoch": 1317} {"train_loss": -39.70405960083008, "global_step": 159408, "epoch": 1317} {"train_loss": -40.80224609375, "global_step": 159409, "epoch": 1317} {"train_loss": -40.2932243347168, "global_step": 159410, "epoch": 1317} {"train_loss": -40.20493698120117, "global_step": 159411, "epoch": 1317} {"train_loss": -40.63131332397461, "global_step": 159412, "epoch": 1317} {"train_loss": -40.39694595336914, "global_step": 159413, "epoch": 1317} {"train_loss": -40.59138870239258, "global_step": 159414, "epoch": 1317} {"train_loss": -40.47555160522461, "global_step": 159415, "epoch": 1317} {"train_loss": -40.69246292114258, "global_step": 159416, "epoch": 1317} {"train_loss": -40.03696823120117, "global_step": 159417, "epoch": 1317} {"train_loss": -40.40971755981445, "global_step": 159418, "epoch": 1317} {"train_loss": -39.547359466552734, "global_step": 159419, "epoch": 1317} {"train_loss": -40.437721252441406, "global_step": 159420, "epoch": 1317} {"train_loss": -40.2703971862793, "global_step": 159421, "epoch": 1317} {"train_loss": -38.31873321533203, "global_step": 159422, "epoch": 1317} {"train_loss": -40.59187698364258, "global_step": 159423, "epoch": 1317} {"train_loss": -40.388675689697266, "global_step": 159424, "epoch": 1317} {"train_loss": -39.31000900268555, "global_step": 159425, "epoch": 1317} {"train_loss": -39.772132873535156, "global_step": 159426, "epoch": 1317} {"train_loss": -40.053924560546875, "global_step": 159427, "epoch": 1317} {"train_loss": -40.71710968017578, "global_step": 159428, "epoch": 1317} {"train_loss": -40.01051712036133, "global_step": 159429, "epoch": 1317} {"train_loss": -39.693851470947266, "global_step": 159430, "epoch": 1317} {"train_loss": -39.9791374206543, "global_step": 159431, "epoch": 1317} {"train_loss": -40.474586486816406, "global_step": 159432, "epoch": 1317} {"train_loss": -40.40968704223633, "global_step": 159433, "epoch": 1317} {"train_loss": -39.110382080078125, "global_step": 159434, "epoch": 1317} {"train_loss": -39.469818115234375, "global_step": 159435, "epoch": 1317} {"train_loss": -39.15207290649414, "global_step": 159436, "epoch": 1317} {"train_loss": -39.04490280151367, "global_step": 159437, "epoch": 1317} {"train_loss": -38.997039794921875, "global_step": 159438, "epoch": 1317} {"train_loss": -38.12287139892578, "global_step": 159439, "epoch": 1317} {"train_loss": -39.457340240478516, "global_step": 159440, "epoch": 1317} {"train_loss": -40.32087707519531, "global_step": 159441, "epoch": 1317} {"train_loss": -40.56396484375, "global_step": 159442, "epoch": 1317} {"train_loss": -38.9090576171875, "global_step": 159443, "epoch": 1317} {"train_loss": -36.71657180786133, "global_step": 159444, "epoch": 1317} {"train_loss": -34.403480529785156, "global_step": 159445, "epoch": 1317} {"train_loss": -35.70198440551758, "global_step": 159446, "epoch": 1317} {"train_loss": -38.08146286010742, "global_step": 159447, "epoch": 1317} {"train_loss": -38.4882926940918, "global_step": 159448, "epoch": 1317} {"train_loss": -40.23028564453125, "global_step": 159449, "epoch": 1317} {"train_loss": -39.68244552612305, "global_step": 159450, "epoch": 1317} {"train_loss": -38.08848571777344, "global_step": 159451, "epoch": 1317} {"train_loss": -38.970001220703125, "global_step": 159452, "epoch": 1317} {"train_loss": -39.74454879760742, "global_step": 159453, "epoch": 1317} {"train_loss": -40.41714096069336, "global_step": 159454, "epoch": 1317} {"train_loss": -39.8538818359375, "global_step": 159455, "epoch": 1317} {"train_loss": -40.0904655456543, "global_step": 159456, "epoch": 1317} {"train_loss": -40.48771286010742, "global_step": 159457, "epoch": 1317} {"train_loss": -39.42155838012695, "global_step": 159458, "epoch": 1317} {"train_loss": -40.751678466796875, "global_step": 159459, "epoch": 1317} {"train_loss": -40.190284729003906, "global_step": 159460, "epoch": 1317} {"train_loss": -40.32841491699219, "global_step": 159461, "epoch": 1317} {"train_loss": -39.78788375854492, "global_step": 159462, "epoch": 1317} {"train_loss": -38.02997970581055, "global_step": 159463, "epoch": 1317} {"train_loss": -39.669647216796875, "global_step": 159464, "epoch": 1317} {"train_loss": -39.38185501098633, "global_step": 159465, "epoch": 1317} {"train_loss": -38.474945068359375, "global_step": 159466, "epoch": 1317} {"train_loss": -40.10910415649414, "global_step": 159467, "epoch": 1317} {"train_loss": -37.67097854614258, "global_step": 159468, "epoch": 1317} {"train_loss": -40.05472946166992, "global_step": 159469, "epoch": 1317} {"train_loss": -38.91615676879883, "global_step": 159470, "epoch": 1317} {"train_loss": -39.373043060302734, "global_step": 159471, "epoch": 1317} {"train_loss": -39.71787643432617, "global_step": 159472, "epoch": 1317} {"train_loss": -39.42238235473633, "global_step": 159473, "epoch": 1317} {"train_loss": -40.622283935546875, "global_step": 159474, "epoch": 1317} {"train_loss": -38.77666473388672, "global_step": 159475, "epoch": 1317} {"train_loss": -40.37763595581055, "global_step": 159476, "epoch": 1317} {"train_loss": -39.586792023713926, "global_step": 159477, "epoch": 1317, "val_loss": 2526525.0} {"train_loss": -40.317134857177734, "global_step": 159478, "epoch": 1318} {"train_loss": -40.53648376464844, "global_step": 159479, "epoch": 1318} {"train_loss": -39.62519454956055, "global_step": 159480, "epoch": 1318} {"train_loss": -40.76081466674805, "global_step": 159481, "epoch": 1318} {"train_loss": -40.90982437133789, "global_step": 159482, "epoch": 1318} {"train_loss": -40.870906829833984, "global_step": 159483, "epoch": 1318} {"train_loss": -41.152374267578125, "global_step": 159484, "epoch": 1318} {"train_loss": -40.677364349365234, "global_step": 159485, "epoch": 1318} {"train_loss": -40.649818420410156, "global_step": 159486, "epoch": 1318} {"train_loss": -40.91091537475586, "global_step": 159487, "epoch": 1318} {"train_loss": -40.483882904052734, "global_step": 159488, "epoch": 1318} {"train_loss": -40.088775634765625, "global_step": 159489, "epoch": 1318} {"train_loss": -40.56069564819336, "global_step": 159490, "epoch": 1318} {"train_loss": -40.5092887878418, "global_step": 159491, "epoch": 1318} {"train_loss": -41.116878509521484, "global_step": 159492, "epoch": 1318} {"train_loss": -40.698001861572266, "global_step": 159493, "epoch": 1318} {"train_loss": -41.19301986694336, "global_step": 159494, "epoch": 1318} {"train_loss": -41.0257682800293, "global_step": 159495, "epoch": 1318} {"train_loss": -40.89980697631836, "global_step": 159496, "epoch": 1318} {"train_loss": -41.32818603515625, "global_step": 159497, "epoch": 1318} {"train_loss": -40.95968246459961, "global_step": 159498, "epoch": 1318} {"train_loss": -40.99451446533203, "global_step": 159499, "epoch": 1318} {"train_loss": -41.49615478515625, "global_step": 159500, "epoch": 1318} {"train_loss": -41.28093719482422, "global_step": 159501, "epoch": 1318} {"train_loss": -41.29032516479492, "global_step": 159502, "epoch": 1318} {"train_loss": -41.4320068359375, "global_step": 159503, "epoch": 1318} {"train_loss": -41.35541534423828, "global_step": 159504, "epoch": 1318} {"train_loss": -41.268062591552734, "global_step": 159505, "epoch": 1318} {"train_loss": -41.441463470458984, "global_step": 159506, "epoch": 1318} {"train_loss": -38.46499252319336, "global_step": 159507, "epoch": 1318} {"train_loss": -41.485504150390625, "global_step": 159508, "epoch": 1318} {"train_loss": -41.687591552734375, "global_step": 159509, "epoch": 1318} {"train_loss": -39.875308990478516, "global_step": 159510, "epoch": 1318} {"train_loss": -40.84821319580078, "global_step": 159511, "epoch": 1318} {"train_loss": -40.7088508605957, "global_step": 159512, "epoch": 1318} {"train_loss": -41.287044525146484, "global_step": 159513, "epoch": 1318} {"train_loss": -41.0544319152832, "global_step": 159514, "epoch": 1318} {"train_loss": -40.363922119140625, "global_step": 159515, "epoch": 1318} {"train_loss": -41.03907012939453, "global_step": 159516, "epoch": 1318} {"train_loss": -39.8099250793457, "global_step": 159517, "epoch": 1318} {"train_loss": -40.941200256347656, "global_step": 159518, "epoch": 1318} {"train_loss": -40.910484313964844, "global_step": 159519, "epoch": 1318} {"train_loss": -40.85602951049805, "global_step": 159520, "epoch": 1318} {"train_loss": -39.506622314453125, "global_step": 159521, "epoch": 1318} {"train_loss": -40.55652618408203, "global_step": 159522, "epoch": 1318} {"train_loss": -40.15285873413086, "global_step": 159523, "epoch": 1318} {"train_loss": -40.30139923095703, "global_step": 159524, "epoch": 1318} {"train_loss": -40.221702575683594, "global_step": 159525, "epoch": 1318} {"train_loss": -39.780982971191406, "global_step": 159526, "epoch": 1318} {"train_loss": -40.54395294189453, "global_step": 159527, "epoch": 1318} {"train_loss": -36.71401596069336, "global_step": 159528, "epoch": 1318} {"train_loss": -40.50358200073242, "global_step": 159529, "epoch": 1318} {"train_loss": -38.96841049194336, "global_step": 159530, "epoch": 1318} {"train_loss": -38.63264083862305, "global_step": 159531, "epoch": 1318} {"train_loss": -35.5295295715332, "global_step": 159532, "epoch": 1318} {"train_loss": -29.0037841796875, "global_step": 159533, "epoch": 1318} {"train_loss": -29.31035804748535, "global_step": 159534, "epoch": 1318} {"train_loss": -39.57322311401367, "global_step": 159535, "epoch": 1318} {"train_loss": -36.974849700927734, "global_step": 159536, "epoch": 1318} {"train_loss": -33.41108322143555, "global_step": 159537, "epoch": 1318} {"train_loss": -33.790618896484375, "global_step": 159538, "epoch": 1318} {"train_loss": -39.569820404052734, "global_step": 159539, "epoch": 1318} {"train_loss": -37.4509391784668, "global_step": 159540, "epoch": 1318} {"train_loss": -36.59938430786133, "global_step": 159541, "epoch": 1318} {"train_loss": -39.74922561645508, "global_step": 159542, "epoch": 1318} {"train_loss": -37.15560531616211, "global_step": 159543, "epoch": 1318} {"train_loss": -40.151363372802734, "global_step": 159544, "epoch": 1318} {"train_loss": -38.77350997924805, "global_step": 159545, "epoch": 1318} {"train_loss": -40.08808135986328, "global_step": 159546, "epoch": 1318} {"train_loss": -39.813899993896484, "global_step": 159547, "epoch": 1318} {"train_loss": -39.7027473449707, "global_step": 159548, "epoch": 1318} {"train_loss": -39.860965728759766, "global_step": 159549, "epoch": 1318} {"train_loss": -40.202423095703125, "global_step": 159550, "epoch": 1318} {"train_loss": -39.817901611328125, "global_step": 159551, "epoch": 1318} {"train_loss": -39.92771530151367, "global_step": 159552, "epoch": 1318} {"train_loss": -39.37726593017578, "global_step": 159553, "epoch": 1318} {"train_loss": -40.508758544921875, "global_step": 159554, "epoch": 1318} {"train_loss": -40.1938362121582, "global_step": 159555, "epoch": 1318} {"train_loss": -39.94378662109375, "global_step": 159556, "epoch": 1318} {"train_loss": -40.403316497802734, "global_step": 159557, "epoch": 1318} {"train_loss": -40.32841873168945, "global_step": 159558, "epoch": 1318} {"train_loss": -40.33769989013672, "global_step": 159559, "epoch": 1318} {"train_loss": -40.04032516479492, "global_step": 159560, "epoch": 1318} {"train_loss": -39.59035873413086, "global_step": 159561, "epoch": 1318} {"train_loss": -39.98193359375, "global_step": 159562, "epoch": 1318} {"train_loss": -40.34621810913086, "global_step": 159563, "epoch": 1318} {"train_loss": -40.46255111694336, "global_step": 159564, "epoch": 1318} {"train_loss": -41.02448272705078, "global_step": 159565, "epoch": 1318} {"train_loss": -40.77327346801758, "global_step": 159566, "epoch": 1318} {"train_loss": -40.71848678588867, "global_step": 159567, "epoch": 1318} {"train_loss": -40.8952522277832, "global_step": 159568, "epoch": 1318} {"train_loss": -41.15708541870117, "global_step": 159569, "epoch": 1318} {"train_loss": -40.91292953491211, "global_step": 159570, "epoch": 1318} {"train_loss": -41.08647537231445, "global_step": 159571, "epoch": 1318} {"train_loss": -40.58199691772461, "global_step": 159572, "epoch": 1318} {"train_loss": -40.77401351928711, "global_step": 159573, "epoch": 1318} {"train_loss": -40.571632385253906, "global_step": 159574, "epoch": 1318} {"train_loss": -38.944393157958984, "global_step": 159575, "epoch": 1318} {"train_loss": -40.50403594970703, "global_step": 159576, "epoch": 1318} {"train_loss": -41.01032638549805, "global_step": 159577, "epoch": 1318} {"train_loss": -41.28788375854492, "global_step": 159578, "epoch": 1318} {"train_loss": -40.357208251953125, "global_step": 159579, "epoch": 1318} {"train_loss": -38.71345138549805, "global_step": 159580, "epoch": 1318} {"train_loss": -38.00999069213867, "global_step": 159581, "epoch": 1318} {"train_loss": -38.46141052246094, "global_step": 159582, "epoch": 1318} {"train_loss": -38.513832092285156, "global_step": 159583, "epoch": 1318} {"train_loss": -40.29865646362305, "global_step": 159584, "epoch": 1318} {"train_loss": -40.6483268737793, "global_step": 159585, "epoch": 1318} {"train_loss": -39.37508010864258, "global_step": 159586, "epoch": 1318} {"train_loss": -38.05218505859375, "global_step": 159587, "epoch": 1318} {"train_loss": -38.56413269042969, "global_step": 159588, "epoch": 1318} {"train_loss": -32.91489791870117, "global_step": 159589, "epoch": 1318} {"train_loss": -37.49371337890625, "global_step": 159590, "epoch": 1318} {"train_loss": -39.247398376464844, "global_step": 159591, "epoch": 1318} {"train_loss": -39.0087776184082, "global_step": 159592, "epoch": 1318} {"train_loss": -38.53621292114258, "global_step": 159593, "epoch": 1318} {"train_loss": -39.28136444091797, "global_step": 159594, "epoch": 1318} {"train_loss": -38.71211242675781, "global_step": 159595, "epoch": 1318} {"train_loss": -39.987789154052734, "global_step": 159596, "epoch": 1318} {"train_loss": -38.200313568115234, "global_step": 159597, "epoch": 1318} {"train_loss": -39.69280077406197, "global_step": 159598, "epoch": 1318, "val_loss": 2668038.75} {"train_loss": -38.31226348876953, "global_step": 159599, "epoch": 1319} {"train_loss": -37.22351837158203, "global_step": 159600, "epoch": 1319} {"train_loss": -40.357479095458984, "global_step": 159601, "epoch": 1319} {"train_loss": -40.50958251953125, "global_step": 159602, "epoch": 1319} {"train_loss": -40.41899490356445, "global_step": 159603, "epoch": 1319} {"train_loss": -39.591609954833984, "global_step": 159604, "epoch": 1319} {"train_loss": -40.84992599487305, "global_step": 159605, "epoch": 1319} {"train_loss": -39.466644287109375, "global_step": 159606, "epoch": 1319} {"train_loss": -40.33243942260742, "global_step": 159607, "epoch": 1319} {"train_loss": -40.59627914428711, "global_step": 159608, "epoch": 1319} {"train_loss": -40.21929931640625, "global_step": 159609, "epoch": 1319} {"train_loss": -40.22465133666992, "global_step": 159610, "epoch": 1319} {"train_loss": -40.37971496582031, "global_step": 159611, "epoch": 1319} {"train_loss": -39.847476959228516, "global_step": 159612, "epoch": 1319} {"train_loss": -38.4571533203125, "global_step": 159613, "epoch": 1319} {"train_loss": -39.98090744018555, "global_step": 159614, "epoch": 1319} {"train_loss": -40.62648391723633, "global_step": 159615, "epoch": 1319} {"train_loss": -38.317909240722656, "global_step": 159616, "epoch": 1319} {"train_loss": -39.42146301269531, "global_step": 159617, "epoch": 1319} {"train_loss": -40.28152084350586, "global_step": 159618, "epoch": 1319} {"train_loss": -39.9123420715332, "global_step": 159619, "epoch": 1319} {"train_loss": -40.66053009033203, "global_step": 159620, "epoch": 1319} {"train_loss": -39.2132568359375, "global_step": 159621, "epoch": 1319} {"train_loss": -39.922149658203125, "global_step": 159622, "epoch": 1319} {"train_loss": -38.84511947631836, "global_step": 159623, "epoch": 1319} {"train_loss": -40.11593246459961, "global_step": 159624, "epoch": 1319} {"train_loss": -40.23627471923828, "global_step": 159625, "epoch": 1319} {"train_loss": -39.69377899169922, "global_step": 159626, "epoch": 1319} {"train_loss": -39.457740783691406, "global_step": 159627, "epoch": 1319} {"train_loss": -38.30647277832031, "global_step": 159628, "epoch": 1319} {"train_loss": -40.08418655395508, "global_step": 159629, "epoch": 1319} {"train_loss": -39.56464767456055, "global_step": 159630, "epoch": 1319} {"train_loss": -38.57339096069336, "global_step": 159631, "epoch": 1319} {"train_loss": -40.078590393066406, "global_step": 159632, "epoch": 1319} {"train_loss": -38.61857223510742, "global_step": 159633, "epoch": 1319} {"train_loss": -40.201290130615234, "global_step": 159634, "epoch": 1319} {"train_loss": -39.44826889038086, "global_step": 159635, "epoch": 1319} {"train_loss": -40.21090316772461, "global_step": 159636, "epoch": 1319} {"train_loss": -39.23910140991211, "global_step": 159637, "epoch": 1319} {"train_loss": -39.58710861206055, "global_step": 159638, "epoch": 1319} {"train_loss": -39.002254486083984, "global_step": 159639, "epoch": 1319} {"train_loss": -39.69504928588867, "global_step": 159640, "epoch": 1319} {"train_loss": -39.08907699584961, "global_step": 159641, "epoch": 1319} {"train_loss": -40.2015495300293, "global_step": 159642, "epoch": 1319} {"train_loss": -38.40986251831055, "global_step": 159643, "epoch": 1319} {"train_loss": -39.65212631225586, "global_step": 159644, "epoch": 1319} {"train_loss": -39.813472747802734, "global_step": 159645, "epoch": 1319} {"train_loss": -39.1357536315918, "global_step": 159646, "epoch": 1319} {"train_loss": -38.41200637817383, "global_step": 159647, "epoch": 1319} {"train_loss": -39.855812072753906, "global_step": 159648, "epoch": 1319} {"train_loss": -38.98529815673828, "global_step": 159649, "epoch": 1319} {"train_loss": -39.44260787963867, "global_step": 159650, "epoch": 1319} {"train_loss": -39.6091423034668, "global_step": 159651, "epoch": 1319} {"train_loss": -39.77482223510742, "global_step": 159652, "epoch": 1319} {"train_loss": -37.1219367980957, "global_step": 159653, "epoch": 1319} {"train_loss": -34.85577392578125, "global_step": 159654, "epoch": 1319} {"train_loss": -36.97566604614258, "global_step": 159655, "epoch": 1319} {"train_loss": -39.39278030395508, "global_step": 159656, "epoch": 1319} {"train_loss": -31.47149658203125, "global_step": 159657, "epoch": 1319} {"train_loss": -38.294395446777344, "global_step": 159658, "epoch": 1319} {"train_loss": -36.65302658081055, "global_step": 159659, "epoch": 1319} {"train_loss": -32.28267288208008, "global_step": 159660, "epoch": 1319} {"train_loss": -37.548946380615234, "global_step": 159661, "epoch": 1319} {"train_loss": -36.693355560302734, "global_step": 159662, "epoch": 1319} {"train_loss": -37.763092041015625, "global_step": 159663, "epoch": 1319} {"train_loss": -39.5555305480957, "global_step": 159664, "epoch": 1319} {"train_loss": -37.758724212646484, "global_step": 159665, "epoch": 1319} {"train_loss": -38.47732925415039, "global_step": 159666, "epoch": 1319} {"train_loss": -36.53620529174805, "global_step": 159667, "epoch": 1319} {"train_loss": -39.83795928955078, "global_step": 159668, "epoch": 1319} {"train_loss": -38.260597229003906, "global_step": 159669, "epoch": 1319} {"train_loss": -39.13174819946289, "global_step": 159670, "epoch": 1319} {"train_loss": -38.8692741394043, "global_step": 159671, "epoch": 1319} {"train_loss": -39.829856872558594, "global_step": 159672, "epoch": 1319} {"train_loss": -39.32200241088867, "global_step": 159673, "epoch": 1319} {"train_loss": -39.92850875854492, "global_step": 159674, "epoch": 1319} {"train_loss": -39.86940383911133, "global_step": 159675, "epoch": 1319} {"train_loss": -39.380611419677734, "global_step": 159676, "epoch": 1319} {"train_loss": -39.93251037597656, "global_step": 159677, "epoch": 1319} {"train_loss": -39.75651550292969, "global_step": 159678, "epoch": 1319} {"train_loss": -39.03757858276367, "global_step": 159679, "epoch": 1319} {"train_loss": -39.737754821777344, "global_step": 159680, "epoch": 1319} {"train_loss": -40.384830474853516, "global_step": 159681, "epoch": 1319} {"train_loss": -40.36537170410156, "global_step": 159682, "epoch": 1319} {"train_loss": -39.4890251159668, "global_step": 159683, "epoch": 1319} {"train_loss": -39.34025192260742, "global_step": 159684, "epoch": 1319} {"train_loss": -40.23159408569336, "global_step": 159685, "epoch": 1319} {"train_loss": -40.39670944213867, "global_step": 159686, "epoch": 1319} {"train_loss": -40.27311706542969, "global_step": 159687, "epoch": 1319} {"train_loss": -40.11587142944336, "global_step": 159688, "epoch": 1319} {"train_loss": -40.10606002807617, "global_step": 159689, "epoch": 1319} {"train_loss": -40.37125015258789, "global_step": 159690, "epoch": 1319} {"train_loss": -40.0320930480957, "global_step": 159691, "epoch": 1319} {"train_loss": -40.19362258911133, "global_step": 159692, "epoch": 1319} {"train_loss": -39.59553146362305, "global_step": 159693, "epoch": 1319} {"train_loss": -39.9976921081543, "global_step": 159694, "epoch": 1319} {"train_loss": -38.582637786865234, "global_step": 159695, "epoch": 1319} {"train_loss": -40.586448669433594, "global_step": 159696, "epoch": 1319} {"train_loss": -39.706268310546875, "global_step": 159697, "epoch": 1319} {"train_loss": -40.73073959350586, "global_step": 159698, "epoch": 1319} {"train_loss": -40.26123809814453, "global_step": 159699, "epoch": 1319} {"train_loss": -40.74716567993164, "global_step": 159700, "epoch": 1319} {"train_loss": -40.527278900146484, "global_step": 159701, "epoch": 1319} {"train_loss": -40.59804916381836, "global_step": 159702, "epoch": 1319} {"train_loss": -40.682281494140625, "global_step": 159703, "epoch": 1319} {"train_loss": -40.6829833984375, "global_step": 159704, "epoch": 1319} {"train_loss": -41.00919723510742, "global_step": 159705, "epoch": 1319} {"train_loss": -41.17350769042969, "global_step": 159706, "epoch": 1319} {"train_loss": -41.08970260620117, "global_step": 159707, "epoch": 1319} {"train_loss": -41.22502899169922, "global_step": 159708, "epoch": 1319} {"train_loss": -40.96642303466797, "global_step": 159709, "epoch": 1319} {"train_loss": -40.93349075317383, "global_step": 159710, "epoch": 1319} {"train_loss": -40.91243362426758, "global_step": 159711, "epoch": 1319} {"train_loss": -41.401119232177734, "global_step": 159712, "epoch": 1319} {"train_loss": -41.089141845703125, "global_step": 159713, "epoch": 1319} {"train_loss": -41.14617919921875, "global_step": 159714, "epoch": 1319} {"train_loss": -41.059200286865234, "global_step": 159715, "epoch": 1319} {"train_loss": -41.427467346191406, "global_step": 159716, "epoch": 1319} {"train_loss": -41.14947509765625, "global_step": 159717, "epoch": 1319} {"train_loss": -41.06870651245117, "global_step": 159718, "epoch": 1319} {"train_loss": -39.5333902973774, "global_step": 159719, "epoch": 1319, "val_loss": 2433349.75} {"train_loss": -41.59080123901367, "global_step": 159720, "epoch": 1320} {"train_loss": -41.40169143676758, "global_step": 159721, "epoch": 1320} {"train_loss": -41.554534912109375, "global_step": 159722, "epoch": 1320} {"train_loss": -40.917232513427734, "global_step": 159723, "epoch": 1320} {"train_loss": -41.8624382019043, "global_step": 159724, "epoch": 1320} {"train_loss": -41.66842269897461, "global_step": 159725, "epoch": 1320} {"train_loss": -41.48530960083008, "global_step": 159726, "epoch": 1320} {"train_loss": -41.28852462768555, "global_step": 159727, "epoch": 1320} {"train_loss": -41.7986946105957, "global_step": 159728, "epoch": 1320} {"train_loss": -41.576759338378906, "global_step": 159729, "epoch": 1320} {"train_loss": -41.505775451660156, "global_step": 159730, "epoch": 1320} {"train_loss": -41.56609344482422, "global_step": 159731, "epoch": 1320} {"train_loss": -41.43913650512695, "global_step": 159732, "epoch": 1320} {"train_loss": -41.551021575927734, "global_step": 159733, "epoch": 1320} {"train_loss": -41.53409957885742, "global_step": 159734, "epoch": 1320} {"train_loss": -41.61748123168945, "global_step": 159735, "epoch": 1320} {"train_loss": -41.80669021606445, "global_step": 159736, "epoch": 1320} {"train_loss": -41.7596549987793, "global_step": 159737, "epoch": 1320} {"train_loss": -41.869625091552734, "global_step": 159738, "epoch": 1320} {"train_loss": -41.85100173950195, "global_step": 159739, "epoch": 1320} {"train_loss": -41.57711410522461, "global_step": 159740, "epoch": 1320} {"train_loss": -42.21966552734375, "global_step": 159741, "epoch": 1320} {"train_loss": -41.68793487548828, "global_step": 159742, "epoch": 1320} {"train_loss": -41.19804000854492, "global_step": 159743, "epoch": 1320} {"train_loss": -41.53422164916992, "global_step": 159744, "epoch": 1320} {"train_loss": -41.73551559448242, "global_step": 159745, "epoch": 1320} {"train_loss": -41.94744110107422, "global_step": 159746, "epoch": 1320} {"train_loss": -42.1113395690918, "global_step": 159747, "epoch": 1320} {"train_loss": -41.960018157958984, "global_step": 159748, "epoch": 1320} {"train_loss": -41.36507034301758, "global_step": 159749, "epoch": 1320} {"train_loss": -41.90066146850586, "global_step": 159750, "epoch": 1320} {"train_loss": -41.22209548950195, "global_step": 159751, "epoch": 1320} {"train_loss": -41.77992630004883, "global_step": 159752, "epoch": 1320} {"train_loss": -41.5128173828125, "global_step": 159753, "epoch": 1320} {"train_loss": -41.80979537963867, "global_step": 159754, "epoch": 1320} {"train_loss": -40.06673812866211, "global_step": 159755, "epoch": 1320} {"train_loss": -41.084720611572266, "global_step": 159756, "epoch": 1320} {"train_loss": -40.98812484741211, "global_step": 159757, "epoch": 1320} {"train_loss": -39.796974182128906, "global_step": 159758, "epoch": 1320} {"train_loss": -38.61452865600586, "global_step": 159759, "epoch": 1320} {"train_loss": -37.76629638671875, "global_step": 159760, "epoch": 1320} {"train_loss": -34.530879974365234, "global_step": 159761, "epoch": 1320} {"train_loss": -29.239154815673828, "global_step": 159762, "epoch": 1320} {"train_loss": -24.750911712646484, "global_step": 159763, "epoch": 1320} {"train_loss": -12.243008613586426, "global_step": 159764, "epoch": 1320} {"train_loss": -24.18667984008789, "global_step": 159765, "epoch": 1320} {"train_loss": -38.223445892333984, "global_step": 159766, "epoch": 1320} {"train_loss": -31.638452529907227, "global_step": 159767, "epoch": 1320} {"train_loss": -29.366455078125, "global_step": 159768, "epoch": 1320} {"train_loss": -35.981468200683594, "global_step": 159769, "epoch": 1320} {"train_loss": -31.4774112701416, "global_step": 159770, "epoch": 1320} {"train_loss": -34.58253479003906, "global_step": 159771, "epoch": 1320} {"train_loss": -32.78879928588867, "global_step": 159772, "epoch": 1320} {"train_loss": -38.0748176574707, "global_step": 159773, "epoch": 1320} {"train_loss": -35.31715774536133, "global_step": 159774, "epoch": 1320} {"train_loss": -37.577239990234375, "global_step": 159775, "epoch": 1320} {"train_loss": -38.10160827636719, "global_step": 159776, "epoch": 1320} {"train_loss": -36.76065444946289, "global_step": 159777, "epoch": 1320} {"train_loss": -36.56269454956055, "global_step": 159778, "epoch": 1320} {"train_loss": -37.693302154541016, "global_step": 159779, "epoch": 1320} {"train_loss": -37.53306579589844, "global_step": 159780, "epoch": 1320} {"train_loss": -38.63963317871094, "global_step": 159781, "epoch": 1320} {"train_loss": -37.24957275390625, "global_step": 159782, "epoch": 1320} {"train_loss": -39.20534896850586, "global_step": 159783, "epoch": 1320} {"train_loss": -37.90020751953125, "global_step": 159784, "epoch": 1320} {"train_loss": -38.47785568237305, "global_step": 159785, "epoch": 1320} {"train_loss": -38.66927719116211, "global_step": 159786, "epoch": 1320} {"train_loss": -37.84282302856445, "global_step": 159787, "epoch": 1320} {"train_loss": -39.48283004760742, "global_step": 159788, "epoch": 1320} {"train_loss": -39.207740783691406, "global_step": 159789, "epoch": 1320} {"train_loss": -39.377681732177734, "global_step": 159790, "epoch": 1320} {"train_loss": -38.907379150390625, "global_step": 159791, "epoch": 1320} {"train_loss": -39.08079147338867, "global_step": 159792, "epoch": 1320} {"train_loss": -39.29026794433594, "global_step": 159793, "epoch": 1320} {"train_loss": -39.1480712890625, "global_step": 159794, "epoch": 1320} {"train_loss": -39.648414611816406, "global_step": 159795, "epoch": 1320} {"train_loss": -39.925689697265625, "global_step": 159796, "epoch": 1320} {"train_loss": -38.7477912902832, "global_step": 159797, "epoch": 1320} {"train_loss": -39.18797302246094, "global_step": 159798, "epoch": 1320} {"train_loss": -39.649044036865234, "global_step": 159799, "epoch": 1320} {"train_loss": -39.993892669677734, "global_step": 159800, "epoch": 1320} {"train_loss": -38.623294830322266, "global_step": 159801, "epoch": 1320} {"train_loss": -40.03803634643555, "global_step": 159802, "epoch": 1320} {"train_loss": -40.24186325073242, "global_step": 159803, "epoch": 1320} {"train_loss": -40.055931091308594, "global_step": 159804, "epoch": 1320} {"train_loss": -40.256229400634766, "global_step": 159805, "epoch": 1320} {"train_loss": -39.140193939208984, "global_step": 159806, "epoch": 1320} {"train_loss": -40.004024505615234, "global_step": 159807, "epoch": 1320} {"train_loss": -40.43876266479492, "global_step": 159808, "epoch": 1320} {"train_loss": -39.44805145263672, "global_step": 159809, "epoch": 1320} {"train_loss": -39.824981689453125, "global_step": 159810, "epoch": 1320} {"train_loss": -40.52285385131836, "global_step": 159811, "epoch": 1320} {"train_loss": -40.74342346191406, "global_step": 159812, "epoch": 1320} {"train_loss": -40.56708908081055, "global_step": 159813, "epoch": 1320} {"train_loss": -40.73065185546875, "global_step": 159814, "epoch": 1320} {"train_loss": -40.50264358520508, "global_step": 159815, "epoch": 1320} {"train_loss": -40.86430740356445, "global_step": 159816, "epoch": 1320} {"train_loss": -40.77097702026367, "global_step": 159817, "epoch": 1320} {"train_loss": -40.40426254272461, "global_step": 159818, "epoch": 1320} {"train_loss": -40.57325744628906, "global_step": 159819, "epoch": 1320} {"train_loss": -40.736045837402344, "global_step": 159820, "epoch": 1320} {"train_loss": -40.49290084838867, "global_step": 159821, "epoch": 1320} {"train_loss": -40.546119689941406, "global_step": 159822, "epoch": 1320} {"train_loss": -40.353309631347656, "global_step": 159823, "epoch": 1320} {"train_loss": -40.31309127807617, "global_step": 159824, "epoch": 1320} {"train_loss": -41.056148529052734, "global_step": 159825, "epoch": 1320} {"train_loss": -40.823246002197266, "global_step": 159826, "epoch": 1320} {"train_loss": -40.755615234375, "global_step": 159827, "epoch": 1320} {"train_loss": -40.447391510009766, "global_step": 159828, "epoch": 1320} {"train_loss": -40.927452087402344, "global_step": 159829, "epoch": 1320} {"train_loss": -40.82741928100586, "global_step": 159830, "epoch": 1320} {"train_loss": -40.94623947143555, "global_step": 159831, "epoch": 1320} {"train_loss": -41.39127731323242, "global_step": 159832, "epoch": 1320} {"train_loss": -39.564552307128906, "global_step": 159833, "epoch": 1320} {"train_loss": -40.76858139038086, "global_step": 159834, "epoch": 1320} {"train_loss": -40.920433044433594, "global_step": 159835, "epoch": 1320} {"train_loss": -40.829280853271484, "global_step": 159836, "epoch": 1320} {"train_loss": -40.42207717895508, "global_step": 159837, "epoch": 1320} {"train_loss": -40.61324691772461, "global_step": 159838, "epoch": 1320} {"train_loss": -40.91844177246094, "global_step": 159839, "epoch": 1320} {"train_loss": -39.258132059712054, "global_step": 159840, "epoch": 1320, "val_loss": 2556480.75} {"train_loss": -41.0557861328125, "global_step": 159841, "epoch": 1321} {"train_loss": -40.958309173583984, "global_step": 159842, "epoch": 1321} {"train_loss": -40.9433708190918, "global_step": 159843, "epoch": 1321} {"train_loss": -41.40217208862305, "global_step": 159844, "epoch": 1321} {"train_loss": -41.14570236206055, "global_step": 159845, "epoch": 1321} {"train_loss": -41.340248107910156, "global_step": 159846, "epoch": 1321} {"train_loss": -40.98499298095703, "global_step": 159847, "epoch": 1321} {"train_loss": -41.4671516418457, "global_step": 159848, "epoch": 1321} {"train_loss": -41.15884017944336, "global_step": 159849, "epoch": 1321} {"train_loss": -41.20591354370117, "global_step": 159850, "epoch": 1321} {"train_loss": -41.51426315307617, "global_step": 159851, "epoch": 1321} {"train_loss": -40.736724853515625, "global_step": 159852, "epoch": 1321} {"train_loss": -41.179622650146484, "global_step": 159853, "epoch": 1321} {"train_loss": -40.94132614135742, "global_step": 159854, "epoch": 1321} {"train_loss": -41.75771713256836, "global_step": 159855, "epoch": 1321} {"train_loss": -40.923133850097656, "global_step": 159856, "epoch": 1321} {"train_loss": -41.01434326171875, "global_step": 159857, "epoch": 1321} {"train_loss": -41.915077209472656, "global_step": 159858, "epoch": 1321} {"train_loss": -41.04848098754883, "global_step": 159859, "epoch": 1321} {"train_loss": -40.962120056152344, "global_step": 159860, "epoch": 1321} {"train_loss": -41.560340881347656, "global_step": 159861, "epoch": 1321} {"train_loss": -40.97929000854492, "global_step": 159862, "epoch": 1321} {"train_loss": -40.47823715209961, "global_step": 159863, "epoch": 1321} {"train_loss": -40.75816345214844, "global_step": 159864, "epoch": 1321} {"train_loss": -39.39425277709961, "global_step": 159865, "epoch": 1321} {"train_loss": -39.04793930053711, "global_step": 159866, "epoch": 1321} {"train_loss": -39.81595230102539, "global_step": 159867, "epoch": 1321} {"train_loss": -41.55326461791992, "global_step": 159868, "epoch": 1321} {"train_loss": -40.59745407104492, "global_step": 159869, "epoch": 1321} {"train_loss": -37.5745964050293, "global_step": 159870, "epoch": 1321} {"train_loss": -40.63324737548828, "global_step": 159871, "epoch": 1321} {"train_loss": -40.45671463012695, "global_step": 159872, "epoch": 1321} {"train_loss": -37.396949768066406, "global_step": 159873, "epoch": 1321} {"train_loss": -39.322784423828125, "global_step": 159874, "epoch": 1321} {"train_loss": -39.652095794677734, "global_step": 159875, "epoch": 1321} {"train_loss": -39.6502799987793, "global_step": 159876, "epoch": 1321} {"train_loss": -39.345664978027344, "global_step": 159877, "epoch": 1321} {"train_loss": -40.916316986083984, "global_step": 159878, "epoch": 1321} {"train_loss": -40.88062286376953, "global_step": 159879, "epoch": 1321} {"train_loss": -39.628360748291016, "global_step": 159880, "epoch": 1321} {"train_loss": -39.90988540649414, "global_step": 159881, "epoch": 1321} {"train_loss": -38.52208709716797, "global_step": 159882, "epoch": 1321} {"train_loss": -40.061302185058594, "global_step": 159883, "epoch": 1321} {"train_loss": -40.587890625, "global_step": 159884, "epoch": 1321} {"train_loss": -39.177581787109375, "global_step": 159885, "epoch": 1321} {"train_loss": -39.82335662841797, "global_step": 159886, "epoch": 1321} {"train_loss": -40.92246627807617, "global_step": 159887, "epoch": 1321} {"train_loss": -39.82277297973633, "global_step": 159888, "epoch": 1321} {"train_loss": -41.19293975830078, "global_step": 159889, "epoch": 1321} {"train_loss": -39.5713005065918, "global_step": 159890, "epoch": 1321} {"train_loss": -40.32091522216797, "global_step": 159891, "epoch": 1321} {"train_loss": -39.954254150390625, "global_step": 159892, "epoch": 1321} {"train_loss": -40.83389663696289, "global_step": 159893, "epoch": 1321} {"train_loss": -40.10464096069336, "global_step": 159894, "epoch": 1321} {"train_loss": -40.074642181396484, "global_step": 159895, "epoch": 1321} {"train_loss": -40.202308654785156, "global_step": 159896, "epoch": 1321} {"train_loss": -40.592769622802734, "global_step": 159897, "epoch": 1321} {"train_loss": -40.24385452270508, "global_step": 159898, "epoch": 1321} {"train_loss": -39.98393249511719, "global_step": 159899, "epoch": 1321} {"train_loss": -40.45137023925781, "global_step": 159900, "epoch": 1321} {"train_loss": -39.92759704589844, "global_step": 159901, "epoch": 1321} {"train_loss": -40.5139274597168, "global_step": 159902, "epoch": 1321} {"train_loss": -39.8674430847168, "global_step": 159903, "epoch": 1321} {"train_loss": -41.1990852355957, "global_step": 159904, "epoch": 1321} {"train_loss": -39.98052215576172, "global_step": 159905, "epoch": 1321} {"train_loss": -40.93491744995117, "global_step": 159906, "epoch": 1321} {"train_loss": -39.96657180786133, "global_step": 159907, "epoch": 1321} {"train_loss": -40.27415466308594, "global_step": 159908, "epoch": 1321} {"train_loss": -40.06696319580078, "global_step": 159909, "epoch": 1321} {"train_loss": -39.11882019042969, "global_step": 159910, "epoch": 1321} {"train_loss": -39.32661056518555, "global_step": 159911, "epoch": 1321} {"train_loss": -40.68407440185547, "global_step": 159912, "epoch": 1321} {"train_loss": -40.058223724365234, "global_step": 159913, "epoch": 1321} {"train_loss": -40.84511947631836, "global_step": 159914, "epoch": 1321} {"train_loss": -41.149532318115234, "global_step": 159915, "epoch": 1321} {"train_loss": -39.94742202758789, "global_step": 159916, "epoch": 1321} {"train_loss": -40.755733489990234, "global_step": 159917, "epoch": 1321} {"train_loss": -40.76817321777344, "global_step": 159918, "epoch": 1321} {"train_loss": -40.442176818847656, "global_step": 159919, "epoch": 1321} {"train_loss": -41.18593215942383, "global_step": 159920, "epoch": 1321} {"train_loss": -40.46525573730469, "global_step": 159921, "epoch": 1321} {"train_loss": -40.5684928894043, "global_step": 159922, "epoch": 1321} {"train_loss": -40.62346649169922, "global_step": 159923, "epoch": 1321} {"train_loss": -40.299922943115234, "global_step": 159924, "epoch": 1321} {"train_loss": -40.43518829345703, "global_step": 159925, "epoch": 1321} {"train_loss": -41.19270324707031, "global_step": 159926, "epoch": 1321} {"train_loss": -40.266300201416016, "global_step": 159927, "epoch": 1321} {"train_loss": -40.89901351928711, "global_step": 159928, "epoch": 1321} {"train_loss": -40.897945404052734, "global_step": 159929, "epoch": 1321} {"train_loss": -37.0774040222168, "global_step": 159930, "epoch": 1321} {"train_loss": -40.98789596557617, "global_step": 159931, "epoch": 1321} {"train_loss": -38.95396041870117, "global_step": 159932, "epoch": 1321} {"train_loss": -40.02156066894531, "global_step": 159933, "epoch": 1321} {"train_loss": -41.36788558959961, "global_step": 159934, "epoch": 1321} {"train_loss": -40.76046371459961, "global_step": 159935, "epoch": 1321} {"train_loss": -40.530113220214844, "global_step": 159936, "epoch": 1321} {"train_loss": -40.25883865356445, "global_step": 159937, "epoch": 1321} {"train_loss": -38.93429183959961, "global_step": 159938, "epoch": 1321} {"train_loss": -41.3003044128418, "global_step": 159939, "epoch": 1321} {"train_loss": -40.586753845214844, "global_step": 159940, "epoch": 1321} {"train_loss": -40.37905502319336, "global_step": 159941, "epoch": 1321} {"train_loss": -40.480247497558594, "global_step": 159942, "epoch": 1321} {"train_loss": -40.87672424316406, "global_step": 159943, "epoch": 1321} {"train_loss": -34.81764221191406, "global_step": 159944, "epoch": 1321} {"train_loss": -38.28348159790039, "global_step": 159945, "epoch": 1321} {"train_loss": -39.83979034423828, "global_step": 159946, "epoch": 1321} {"train_loss": -39.84897994995117, "global_step": 159947, "epoch": 1321} {"train_loss": -38.850440979003906, "global_step": 159948, "epoch": 1321} {"train_loss": -40.8037109375, "global_step": 159949, "epoch": 1321} {"train_loss": -37.77061462402344, "global_step": 159950, "epoch": 1321} {"train_loss": -37.0926399230957, "global_step": 159951, "epoch": 1321} {"train_loss": -39.927852630615234, "global_step": 159952, "epoch": 1321} {"train_loss": -39.15001678466797, "global_step": 159953, "epoch": 1321} {"train_loss": -39.800537109375, "global_step": 159954, "epoch": 1321} {"train_loss": -39.4650993347168, "global_step": 159955, "epoch": 1321} {"train_loss": -38.38447570800781, "global_step": 159956, "epoch": 1321} {"train_loss": -38.92910385131836, "global_step": 159957, "epoch": 1321} {"train_loss": -40.178062438964844, "global_step": 159958, "epoch": 1321} {"train_loss": -39.4287223815918, "global_step": 159959, "epoch": 1321} {"train_loss": -40.3386116027832, "global_step": 159960, "epoch": 1321} {"train_loss": -40.19079492111837, "global_step": 159961, "epoch": 1321, "val_loss": 3537353.25} {"train_loss": -40.039302825927734, "global_step": 159962, "epoch": 1322} {"train_loss": -39.850929260253906, "global_step": 159963, "epoch": 1322} {"train_loss": -39.25680160522461, "global_step": 159964, "epoch": 1322} {"train_loss": -37.013614654541016, "global_step": 159965, "epoch": 1322} {"train_loss": -39.809669494628906, "global_step": 159966, "epoch": 1322} {"train_loss": -40.44866180419922, "global_step": 159967, "epoch": 1322} {"train_loss": -40.436500549316406, "global_step": 159968, "epoch": 1322} {"train_loss": -39.65366744995117, "global_step": 159969, "epoch": 1322} {"train_loss": -39.95656967163086, "global_step": 159970, "epoch": 1322} {"train_loss": -38.84477233886719, "global_step": 159971, "epoch": 1322} {"train_loss": -40.353607177734375, "global_step": 159972, "epoch": 1322} {"train_loss": -39.32512664794922, "global_step": 159973, "epoch": 1322} {"train_loss": -40.37784194946289, "global_step": 159974, "epoch": 1322} {"train_loss": -39.29752731323242, "global_step": 159975, "epoch": 1322} {"train_loss": -39.76445388793945, "global_step": 159976, "epoch": 1322} {"train_loss": -40.00871276855469, "global_step": 159977, "epoch": 1322} {"train_loss": -41.12070846557617, "global_step": 159978, "epoch": 1322} {"train_loss": -38.15287399291992, "global_step": 159979, "epoch": 1322} {"train_loss": -39.36395263671875, "global_step": 159980, "epoch": 1322} {"train_loss": -39.680213928222656, "global_step": 159981, "epoch": 1322} {"train_loss": -39.45457458496094, "global_step": 159982, "epoch": 1322} {"train_loss": -40.105098724365234, "global_step": 159983, "epoch": 1322} {"train_loss": -41.153133392333984, "global_step": 159984, "epoch": 1322} {"train_loss": -40.11309814453125, "global_step": 159985, "epoch": 1322} {"train_loss": -40.67866897583008, "global_step": 159986, "epoch": 1322} {"train_loss": -38.914764404296875, "global_step": 159987, "epoch": 1322} {"train_loss": -39.53004837036133, "global_step": 159988, "epoch": 1322} {"train_loss": -40.05656051635742, "global_step": 159989, "epoch": 1322} {"train_loss": -40.182159423828125, "global_step": 159990, "epoch": 1322} {"train_loss": -40.45751953125, "global_step": 159991, "epoch": 1322} {"train_loss": -40.186798095703125, "global_step": 159992, "epoch": 1322} {"train_loss": -40.317752838134766, "global_step": 159993, "epoch": 1322} {"train_loss": -40.319454193115234, "global_step": 159994, "epoch": 1322} {"train_loss": -41.237762451171875, "global_step": 159995, "epoch": 1322} {"train_loss": -40.58968734741211, "global_step": 159996, "epoch": 1322} {"train_loss": -40.92922592163086, "global_step": 159997, "epoch": 1322} {"train_loss": -41.01310729980469, "global_step": 159998, "epoch": 1322} {"train_loss": -41.027442932128906, "global_step": 159999, "epoch": 1322} {"train_loss": -40.73476791381836, "global_step": 160000, "epoch": 1322} {"train_loss": -40.31551742553711, "global_step": 160001, "epoch": 1322} {"train_loss": -40.51128387451172, "global_step": 160002, "epoch": 1322} {"train_loss": -40.78285598754883, "global_step": 160003, "epoch": 1322} {"train_loss": -40.67728805541992, "global_step": 160004, "epoch": 1322} {"train_loss": -40.94451141357422, "global_step": 160005, "epoch": 1322} {"train_loss": -40.96024703979492, "global_step": 160006, "epoch": 1322} {"train_loss": -41.10456848144531, "global_step": 160007, "epoch": 1322} {"train_loss": -40.53017044067383, "global_step": 160008, "epoch": 1322} {"train_loss": -41.44095993041992, "global_step": 160009, "epoch": 1322} {"train_loss": -40.13645553588867, "global_step": 160010, "epoch": 1322} {"train_loss": -41.305946350097656, "global_step": 160011, "epoch": 1322} {"train_loss": -40.97011947631836, "global_step": 160012, "epoch": 1322} {"train_loss": -40.86602783203125, "global_step": 160013, "epoch": 1322} {"train_loss": -41.74473190307617, "global_step": 160014, "epoch": 1322} {"train_loss": -41.3089714050293, "global_step": 160015, "epoch": 1322} {"train_loss": -41.80050277709961, "global_step": 160016, "epoch": 1322} {"train_loss": -41.04931640625, "global_step": 160017, "epoch": 1322} {"train_loss": -41.400146484375, "global_step": 160018, "epoch": 1322} {"train_loss": -41.525550842285156, "global_step": 160019, "epoch": 1322} {"train_loss": -40.057411193847656, "global_step": 160020, "epoch": 1322} {"train_loss": -41.02449417114258, "global_step": 160021, "epoch": 1322} {"train_loss": -40.3961296081543, "global_step": 160022, "epoch": 1322} {"train_loss": -41.14137649536133, "global_step": 160023, "epoch": 1322} {"train_loss": -41.10586929321289, "global_step": 160024, "epoch": 1322} {"train_loss": -41.126495361328125, "global_step": 160025, "epoch": 1322} {"train_loss": -41.11710739135742, "global_step": 160026, "epoch": 1322} {"train_loss": -40.8134765625, "global_step": 160027, "epoch": 1322} {"train_loss": -41.3841667175293, "global_step": 160028, "epoch": 1322} {"train_loss": -41.06016159057617, "global_step": 160029, "epoch": 1322} {"train_loss": -40.94099807739258, "global_step": 160030, "epoch": 1322} {"train_loss": -39.90285110473633, "global_step": 160031, "epoch": 1322} {"train_loss": -40.7225456237793, "global_step": 160032, "epoch": 1322} {"train_loss": -40.366004943847656, "global_step": 160033, "epoch": 1322} {"train_loss": -40.07292175292969, "global_step": 160034, "epoch": 1322} {"train_loss": -40.6504020690918, "global_step": 160035, "epoch": 1322} {"train_loss": -39.267921447753906, "global_step": 160036, "epoch": 1322} {"train_loss": -40.03139877319336, "global_step": 160037, "epoch": 1322} {"train_loss": -41.543373107910156, "global_step": 160038, "epoch": 1322} {"train_loss": -39.97003936767578, "global_step": 160039, "epoch": 1322} {"train_loss": -40.01216506958008, "global_step": 160040, "epoch": 1322} {"train_loss": -40.07548141479492, "global_step": 160041, "epoch": 1322} {"train_loss": -41.35703659057617, "global_step": 160042, "epoch": 1322} {"train_loss": -40.01721954345703, "global_step": 160043, "epoch": 1322} {"train_loss": -40.252933502197266, "global_step": 160044, "epoch": 1322} {"train_loss": -40.158199310302734, "global_step": 160045, "epoch": 1322} {"train_loss": -40.895301818847656, "global_step": 160046, "epoch": 1322} {"train_loss": -39.2664909362793, "global_step": 160047, "epoch": 1322} {"train_loss": -39.0291633605957, "global_step": 160048, "epoch": 1322} {"train_loss": -38.21684646606445, "global_step": 160049, "epoch": 1322} {"train_loss": -41.04741668701172, "global_step": 160050, "epoch": 1322} {"train_loss": -40.41423034667969, "global_step": 160051, "epoch": 1322} {"train_loss": -38.57432174682617, "global_step": 160052, "epoch": 1322} {"train_loss": -39.33047103881836, "global_step": 160053, "epoch": 1322} {"train_loss": -40.618133544921875, "global_step": 160054, "epoch": 1322} {"train_loss": -41.098487854003906, "global_step": 160055, "epoch": 1322} {"train_loss": -40.31644058227539, "global_step": 160056, "epoch": 1322} {"train_loss": -38.85934829711914, "global_step": 160057, "epoch": 1322} {"train_loss": -41.51802444458008, "global_step": 160058, "epoch": 1322} {"train_loss": -41.11381149291992, "global_step": 160059, "epoch": 1322} {"train_loss": -39.9791374206543, "global_step": 160060, "epoch": 1322} {"train_loss": -38.354713439941406, "global_step": 160061, "epoch": 1322} {"train_loss": -40.00373077392578, "global_step": 160062, "epoch": 1322} {"train_loss": -40.13068389892578, "global_step": 160063, "epoch": 1322} {"train_loss": -39.832061767578125, "global_step": 160064, "epoch": 1322} {"train_loss": -40.618743896484375, "global_step": 160065, "epoch": 1322} {"train_loss": -40.483272552490234, "global_step": 160066, "epoch": 1322} {"train_loss": -39.8829460144043, "global_step": 160067, "epoch": 1322} {"train_loss": -38.02289962768555, "global_step": 160068, "epoch": 1322} {"train_loss": -41.385189056396484, "global_step": 160069, "epoch": 1322} {"train_loss": -39.748287200927734, "global_step": 160070, "epoch": 1322} {"train_loss": -37.9098014831543, "global_step": 160071, "epoch": 1322} {"train_loss": -37.988372802734375, "global_step": 160072, "epoch": 1322} {"train_loss": -40.678951263427734, "global_step": 160073, "epoch": 1322} {"train_loss": -37.2381591796875, "global_step": 160074, "epoch": 1322} {"train_loss": -39.946022033691406, "global_step": 160075, "epoch": 1322} {"train_loss": -39.96586990356445, "global_step": 160076, "epoch": 1322} {"train_loss": -39.917686462402344, "global_step": 160077, "epoch": 1322} {"train_loss": -38.99309539794922, "global_step": 160078, "epoch": 1322} {"train_loss": -39.50558090209961, "global_step": 160079, "epoch": 1322} {"train_loss": -39.42290115356445, "global_step": 160080, "epoch": 1322} {"train_loss": -39.60142517089844, "global_step": 160081, "epoch": 1322} {"train_loss": -40.1964381509576, "global_step": 160082, "epoch": 1322, "val_loss": 2427999.75} {"train_loss": -40.796085357666016, "global_step": 160083, "epoch": 1323} {"train_loss": -39.05735397338867, "global_step": 160084, "epoch": 1323} {"train_loss": -39.66473388671875, "global_step": 160085, "epoch": 1323} {"train_loss": -40.19775390625, "global_step": 160086, "epoch": 1323} {"train_loss": -39.31361389160156, "global_step": 160087, "epoch": 1323} {"train_loss": -40.5449333190918, "global_step": 160088, "epoch": 1323} {"train_loss": -40.665748596191406, "global_step": 160089, "epoch": 1323} {"train_loss": -39.314300537109375, "global_step": 160090, "epoch": 1323} {"train_loss": -38.170650482177734, "global_step": 160091, "epoch": 1323} {"train_loss": -38.69496536254883, "global_step": 160092, "epoch": 1323} {"train_loss": -37.03239822387695, "global_step": 160093, "epoch": 1323} {"train_loss": -35.341670989990234, "global_step": 160094, "epoch": 1323} {"train_loss": -38.557674407958984, "global_step": 160095, "epoch": 1323} {"train_loss": -36.6646614074707, "global_step": 160096, "epoch": 1323} {"train_loss": -36.792171478271484, "global_step": 160097, "epoch": 1323} {"train_loss": -36.75130844116211, "global_step": 160098, "epoch": 1323} {"train_loss": -39.289710998535156, "global_step": 160099, "epoch": 1323} {"train_loss": -37.54622268676758, "global_step": 160100, "epoch": 1323} {"train_loss": -38.79206085205078, "global_step": 160101, "epoch": 1323} {"train_loss": -40.01167678833008, "global_step": 160102, "epoch": 1323} {"train_loss": -39.81696701049805, "global_step": 160103, "epoch": 1323} {"train_loss": -39.26628875732422, "global_step": 160104, "epoch": 1323} {"train_loss": -39.577816009521484, "global_step": 160105, "epoch": 1323} {"train_loss": -40.54685974121094, "global_step": 160106, "epoch": 1323} {"train_loss": -40.4650764465332, "global_step": 160107, "epoch": 1323} {"train_loss": -40.00840377807617, "global_step": 160108, "epoch": 1323} {"train_loss": -40.66776657104492, "global_step": 160109, "epoch": 1323} {"train_loss": -39.92119216918945, "global_step": 160110, "epoch": 1323} {"train_loss": -40.85720443725586, "global_step": 160111, "epoch": 1323} {"train_loss": -40.91996383666992, "global_step": 160112, "epoch": 1323} {"train_loss": -40.26295852661133, "global_step": 160113, "epoch": 1323} {"train_loss": -40.997459411621094, "global_step": 160114, "epoch": 1323} {"train_loss": -40.86910629272461, "global_step": 160115, "epoch": 1323} {"train_loss": -40.63948440551758, "global_step": 160116, "epoch": 1323} {"train_loss": -41.13657760620117, "global_step": 160117, "epoch": 1323} {"train_loss": -40.0379753112793, "global_step": 160118, "epoch": 1323} {"train_loss": -40.58730697631836, "global_step": 160119, "epoch": 1323} {"train_loss": -40.735408782958984, "global_step": 160120, "epoch": 1323} {"train_loss": -41.023799896240234, "global_step": 160121, "epoch": 1323} {"train_loss": -40.62670135498047, "global_step": 160122, "epoch": 1323} {"train_loss": -41.398101806640625, "global_step": 160123, "epoch": 1323} {"train_loss": -40.73843002319336, "global_step": 160124, "epoch": 1323} {"train_loss": -41.60181427001953, "global_step": 160125, "epoch": 1323} {"train_loss": -40.97983169555664, "global_step": 160126, "epoch": 1323} {"train_loss": -41.09267807006836, "global_step": 160127, "epoch": 1323} {"train_loss": -41.36211013793945, "global_step": 160128, "epoch": 1323} {"train_loss": -41.58279037475586, "global_step": 160129, "epoch": 1323} {"train_loss": -41.406944274902344, "global_step": 160130, "epoch": 1323} {"train_loss": -40.93428039550781, "global_step": 160131, "epoch": 1323} {"train_loss": -41.60128402709961, "global_step": 160132, "epoch": 1323} {"train_loss": -40.78834915161133, "global_step": 160133, "epoch": 1323} {"train_loss": -41.78084182739258, "global_step": 160134, "epoch": 1323} {"train_loss": -41.43374252319336, "global_step": 160135, "epoch": 1323} {"train_loss": -41.17399597167969, "global_step": 160136, "epoch": 1323} {"train_loss": -40.94025802612305, "global_step": 160137, "epoch": 1323} {"train_loss": -41.91026306152344, "global_step": 160138, "epoch": 1323} {"train_loss": -41.395408630371094, "global_step": 160139, "epoch": 1323} {"train_loss": -41.63079833984375, "global_step": 160140, "epoch": 1323} {"train_loss": -41.48800277709961, "global_step": 160141, "epoch": 1323} {"train_loss": -41.40450668334961, "global_step": 160142, "epoch": 1323} {"train_loss": -41.5971565246582, "global_step": 160143, "epoch": 1323} {"train_loss": -41.760345458984375, "global_step": 160144, "epoch": 1323} {"train_loss": -41.89901351928711, "global_step": 160145, "epoch": 1323} {"train_loss": -41.731449127197266, "global_step": 160146, "epoch": 1323} {"train_loss": -41.766292572021484, "global_step": 160147, "epoch": 1323} {"train_loss": -39.17446517944336, "global_step": 160148, "epoch": 1323} {"train_loss": -41.675567626953125, "global_step": 160149, "epoch": 1323} {"train_loss": -41.86365509033203, "global_step": 160150, "epoch": 1323} {"train_loss": -42.14373779296875, "global_step": 160151, "epoch": 1323} {"train_loss": -41.273860931396484, "global_step": 160152, "epoch": 1323} {"train_loss": -40.24972152709961, "global_step": 160153, "epoch": 1323} {"train_loss": -41.54275894165039, "global_step": 160154, "epoch": 1323} {"train_loss": -41.6417350769043, "global_step": 160155, "epoch": 1323} {"train_loss": -40.590301513671875, "global_step": 160156, "epoch": 1323} {"train_loss": -38.904239654541016, "global_step": 160157, "epoch": 1323} {"train_loss": -38.719276428222656, "global_step": 160158, "epoch": 1323} {"train_loss": -40.54975891113281, "global_step": 160159, "epoch": 1323} {"train_loss": -41.98884963989258, "global_step": 160160, "epoch": 1323} {"train_loss": -40.48269271850586, "global_step": 160161, "epoch": 1323} {"train_loss": -40.72762680053711, "global_step": 160162, "epoch": 1323} {"train_loss": -40.652339935302734, "global_step": 160163, "epoch": 1323} {"train_loss": -41.795833587646484, "global_step": 160164, "epoch": 1323} {"train_loss": -40.480690002441406, "global_step": 160165, "epoch": 1323} {"train_loss": -41.23902130126953, "global_step": 160166, "epoch": 1323} {"train_loss": -40.745849609375, "global_step": 160167, "epoch": 1323} {"train_loss": -39.8277587890625, "global_step": 160168, "epoch": 1323} {"train_loss": -40.671630859375, "global_step": 160169, "epoch": 1323} {"train_loss": -40.910221099853516, "global_step": 160170, "epoch": 1323} {"train_loss": -39.98069763183594, "global_step": 160171, "epoch": 1323} {"train_loss": -41.51958084106445, "global_step": 160172, "epoch": 1323} {"train_loss": -41.20315933227539, "global_step": 160173, "epoch": 1323} {"train_loss": -41.24898910522461, "global_step": 160174, "epoch": 1323} {"train_loss": -41.618141174316406, "global_step": 160175, "epoch": 1323} {"train_loss": -42.00611114501953, "global_step": 160176, "epoch": 1323} {"train_loss": -41.62284469604492, "global_step": 160177, "epoch": 1323} {"train_loss": -41.68846893310547, "global_step": 160178, "epoch": 1323} {"train_loss": -41.859859466552734, "global_step": 160179, "epoch": 1323} {"train_loss": -41.581024169921875, "global_step": 160180, "epoch": 1323} {"train_loss": -41.63924789428711, "global_step": 160181, "epoch": 1323} {"train_loss": -40.966583251953125, "global_step": 160182, "epoch": 1323} {"train_loss": -39.6364631652832, "global_step": 160183, "epoch": 1323} {"train_loss": -34.602352142333984, "global_step": 160184, "epoch": 1323} {"train_loss": -38.3709716796875, "global_step": 160185, "epoch": 1323} {"train_loss": -37.61006546020508, "global_step": 160186, "epoch": 1323} {"train_loss": -39.7334098815918, "global_step": 160187, "epoch": 1323} {"train_loss": -39.581138610839844, "global_step": 160188, "epoch": 1323} {"train_loss": -37.39736557006836, "global_step": 160189, "epoch": 1323} {"train_loss": -14.89365291595459, "global_step": 160190, "epoch": 1323} {"train_loss": -37.634033203125, "global_step": 160191, "epoch": 1323} {"train_loss": -29.48414421081543, "global_step": 160192, "epoch": 1323} {"train_loss": 5.897027492523193, "global_step": 160193, "epoch": 1323} {"train_loss": -7.7826762199401855, "global_step": 160194, "epoch": 1323} {"train_loss": -33.40185546875, "global_step": 160195, "epoch": 1323} {"train_loss": -34.24526596069336, "global_step": 160196, "epoch": 1323} {"train_loss": -22.553173065185547, "global_step": 160197, "epoch": 1323} {"train_loss": -27.472837448120117, "global_step": 160198, "epoch": 1323} {"train_loss": -29.483570098876953, "global_step": 160199, "epoch": 1323} {"train_loss": -31.600055694580078, "global_step": 160200, "epoch": 1323} {"train_loss": -35.2147331237793, "global_step": 160201, "epoch": 1323} {"train_loss": -32.6895866394043, "global_step": 160202, "epoch": 1323} {"train_loss": -38.70616097095584, "global_step": 160203, "epoch": 1323, "val_loss": 2465109.5} {"train_loss": -34.260135650634766, "global_step": 160204, "epoch": 1324} {"train_loss": -33.297454833984375, "global_step": 160205, "epoch": 1324} {"train_loss": -33.906612396240234, "global_step": 160206, "epoch": 1324} {"train_loss": -30.11561393737793, "global_step": 160207, "epoch": 1324} {"train_loss": -34.384803771972656, "global_step": 160208, "epoch": 1324} {"train_loss": -34.27923583984375, "global_step": 160209, "epoch": 1324} {"train_loss": -33.86452865600586, "global_step": 160210, "epoch": 1324} {"train_loss": -35.63958740234375, "global_step": 160211, "epoch": 1324} {"train_loss": -35.85628890991211, "global_step": 160212, "epoch": 1324} {"train_loss": -37.19525146484375, "global_step": 160213, "epoch": 1324} {"train_loss": -37.21973419189453, "global_step": 160214, "epoch": 1324} {"train_loss": -36.18464279174805, "global_step": 160215, "epoch": 1324} {"train_loss": -36.805667877197266, "global_step": 160216, "epoch": 1324} {"train_loss": -36.19509506225586, "global_step": 160217, "epoch": 1324} {"train_loss": -36.233455657958984, "global_step": 160218, "epoch": 1324} {"train_loss": -36.5601806640625, "global_step": 160219, "epoch": 1324} {"train_loss": -34.754905700683594, "global_step": 160220, "epoch": 1324} {"train_loss": -36.19961166381836, "global_step": 160221, "epoch": 1324} {"train_loss": -36.6109619140625, "global_step": 160222, "epoch": 1324} {"train_loss": -36.939247131347656, "global_step": 160223, "epoch": 1324} {"train_loss": -36.08510971069336, "global_step": 160224, "epoch": 1324} {"train_loss": -36.52753448486328, "global_step": 160225, "epoch": 1324} {"train_loss": -38.06842803955078, "global_step": 160226, "epoch": 1324} {"train_loss": -37.46348571777344, "global_step": 160227, "epoch": 1324} {"train_loss": -37.12674331665039, "global_step": 160228, "epoch": 1324} {"train_loss": -37.695125579833984, "global_step": 160229, "epoch": 1324} {"train_loss": -37.40126419067383, "global_step": 160230, "epoch": 1324} {"train_loss": -37.94700241088867, "global_step": 160231, "epoch": 1324} {"train_loss": -37.10538864135742, "global_step": 160232, "epoch": 1324} {"train_loss": -37.828800201416016, "global_step": 160233, "epoch": 1324} {"train_loss": -35.93035125732422, "global_step": 160234, "epoch": 1324} {"train_loss": -38.02470779418945, "global_step": 160235, "epoch": 1324} {"train_loss": -38.4979133605957, "global_step": 160236, "epoch": 1324} {"train_loss": -37.9657096862793, "global_step": 160237, "epoch": 1324} {"train_loss": -37.650264739990234, "global_step": 160238, "epoch": 1324} {"train_loss": -38.54854965209961, "global_step": 160239, "epoch": 1324} {"train_loss": -37.708091735839844, "global_step": 160240, "epoch": 1324} {"train_loss": -38.49079132080078, "global_step": 160241, "epoch": 1324} {"train_loss": -37.93403244018555, "global_step": 160242, "epoch": 1324} {"train_loss": -37.59300994873047, "global_step": 160243, "epoch": 1324} {"train_loss": -38.5380744934082, "global_step": 160244, "epoch": 1324} {"train_loss": -39.13442611694336, "global_step": 160245, "epoch": 1324} {"train_loss": -38.26910400390625, "global_step": 160246, "epoch": 1324} {"train_loss": -38.98604202270508, "global_step": 160247, "epoch": 1324} {"train_loss": -38.89463806152344, "global_step": 160248, "epoch": 1324} {"train_loss": -36.7480583190918, "global_step": 160249, "epoch": 1324} {"train_loss": -38.057857513427734, "global_step": 160250, "epoch": 1324} {"train_loss": -38.86164474487305, "global_step": 160251, "epoch": 1324} {"train_loss": -39.34638977050781, "global_step": 160252, "epoch": 1324} {"train_loss": -38.64118957519531, "global_step": 160253, "epoch": 1324} {"train_loss": -38.79643630981445, "global_step": 160254, "epoch": 1324} {"train_loss": -39.1367073059082, "global_step": 160255, "epoch": 1324} {"train_loss": -38.7343864440918, "global_step": 160256, "epoch": 1324} {"train_loss": -39.29454803466797, "global_step": 160257, "epoch": 1324} {"train_loss": -38.609737396240234, "global_step": 160258, "epoch": 1324} {"train_loss": -39.388484954833984, "global_step": 160259, "epoch": 1324} {"train_loss": -39.49126052856445, "global_step": 160260, "epoch": 1324} {"train_loss": -39.00161361694336, "global_step": 160261, "epoch": 1324} {"train_loss": -38.90971374511719, "global_step": 160262, "epoch": 1324} {"train_loss": -39.2674446105957, "global_step": 160263, "epoch": 1324} {"train_loss": -38.65205764770508, "global_step": 160264, "epoch": 1324} {"train_loss": -38.60519027709961, "global_step": 160265, "epoch": 1324} {"train_loss": -39.327186584472656, "global_step": 160266, "epoch": 1324} {"train_loss": -39.25175857543945, "global_step": 160267, "epoch": 1324} {"train_loss": -40.1422119140625, "global_step": 160268, "epoch": 1324} {"train_loss": -39.946998596191406, "global_step": 160269, "epoch": 1324} {"train_loss": -39.11268615722656, "global_step": 160270, "epoch": 1324} {"train_loss": -38.85885238647461, "global_step": 160271, "epoch": 1324} {"train_loss": -39.8050537109375, "global_step": 160272, "epoch": 1324} {"train_loss": -39.22981643676758, "global_step": 160273, "epoch": 1324} {"train_loss": -38.97239685058594, "global_step": 160274, "epoch": 1324} {"train_loss": -39.56134033203125, "global_step": 160275, "epoch": 1324} {"train_loss": -40.444461822509766, "global_step": 160276, "epoch": 1324} {"train_loss": -39.92888641357422, "global_step": 160277, "epoch": 1324} {"train_loss": -40.41474914550781, "global_step": 160278, "epoch": 1324} {"train_loss": -39.42085647583008, "global_step": 160279, "epoch": 1324} {"train_loss": -39.54737854003906, "global_step": 160280, "epoch": 1324} {"train_loss": -39.78160095214844, "global_step": 160281, "epoch": 1324} {"train_loss": -39.890872955322266, "global_step": 160282, "epoch": 1324} {"train_loss": -40.4147834777832, "global_step": 160283, "epoch": 1324} {"train_loss": -40.58418655395508, "global_step": 160284, "epoch": 1324} {"train_loss": -39.75440216064453, "global_step": 160285, "epoch": 1324} {"train_loss": -39.55361557006836, "global_step": 160286, "epoch": 1324} {"train_loss": -40.341827392578125, "global_step": 160287, "epoch": 1324} {"train_loss": -40.600685119628906, "global_step": 160288, "epoch": 1324} {"train_loss": -40.13080596923828, "global_step": 160289, "epoch": 1324} {"train_loss": -39.93579864501953, "global_step": 160290, "epoch": 1324} {"train_loss": -40.54218673706055, "global_step": 160291, "epoch": 1324} {"train_loss": -39.93280792236328, "global_step": 160292, "epoch": 1324} {"train_loss": -39.950157165527344, "global_step": 160293, "epoch": 1324} {"train_loss": -40.494544982910156, "global_step": 160294, "epoch": 1324} {"train_loss": -40.33857345581055, "global_step": 160295, "epoch": 1324} {"train_loss": -40.3807487487793, "global_step": 160296, "epoch": 1324} {"train_loss": -40.68193054199219, "global_step": 160297, "epoch": 1324} {"train_loss": -40.70540237426758, "global_step": 160298, "epoch": 1324} {"train_loss": -39.66830062866211, "global_step": 160299, "epoch": 1324} {"train_loss": -40.23670959472656, "global_step": 160300, "epoch": 1324} {"train_loss": -40.599571228027344, "global_step": 160301, "epoch": 1324} {"train_loss": -40.288780212402344, "global_step": 160302, "epoch": 1324} {"train_loss": -40.9428825378418, "global_step": 160303, "epoch": 1324} {"train_loss": -41.070560455322266, "global_step": 160304, "epoch": 1324} {"train_loss": -40.377052307128906, "global_step": 160305, "epoch": 1324} {"train_loss": -40.85393142700195, "global_step": 160306, "epoch": 1324} {"train_loss": -40.56756591796875, "global_step": 160307, "epoch": 1324} {"train_loss": -40.63996505737305, "global_step": 160308, "epoch": 1324} {"train_loss": -41.68621826171875, "global_step": 160309, "epoch": 1324} {"train_loss": -40.06002426147461, "global_step": 160310, "epoch": 1324} {"train_loss": -40.74625778198242, "global_step": 160311, "epoch": 1324} {"train_loss": -39.930145263671875, "global_step": 160312, "epoch": 1324} {"train_loss": -39.67118453979492, "global_step": 160313, "epoch": 1324} {"train_loss": -40.877811431884766, "global_step": 160314, "epoch": 1324} {"train_loss": -40.33695602416992, "global_step": 160315, "epoch": 1324} {"train_loss": -40.0219841003418, "global_step": 160316, "epoch": 1324} {"train_loss": -39.39279556274414, "global_step": 160317, "epoch": 1324} {"train_loss": -40.864959716796875, "global_step": 160318, "epoch": 1324} {"train_loss": -40.05657958984375, "global_step": 160319, "epoch": 1324} {"train_loss": -40.47373580932617, "global_step": 160320, "epoch": 1324} {"train_loss": -40.96955490112305, "global_step": 160321, "epoch": 1324} {"train_loss": -39.15950393676758, "global_step": 160322, "epoch": 1324} {"train_loss": -39.41329574584961, "global_step": 160323, "epoch": 1324} {"train_loss": -38.67189550793861, "global_step": 160324, "epoch": 1324, "val_loss": 2466628.5} {"train_loss": -39.897705078125, "global_step": 160325, "epoch": 1325} {"train_loss": -39.124507904052734, "global_step": 160326, "epoch": 1325} {"train_loss": -40.71974182128906, "global_step": 160327, "epoch": 1325} {"train_loss": -39.955875396728516, "global_step": 160328, "epoch": 1325} {"train_loss": -40.6676025390625, "global_step": 160329, "epoch": 1325} {"train_loss": -39.62265396118164, "global_step": 160330, "epoch": 1325} {"train_loss": -40.06313705444336, "global_step": 160331, "epoch": 1325} {"train_loss": -40.70342254638672, "global_step": 160332, "epoch": 1325} {"train_loss": -39.1584358215332, "global_step": 160333, "epoch": 1325} {"train_loss": -40.3092155456543, "global_step": 160334, "epoch": 1325} {"train_loss": -39.261653900146484, "global_step": 160335, "epoch": 1325} {"train_loss": -39.8147087097168, "global_step": 160336, "epoch": 1325} {"train_loss": -39.75694274902344, "global_step": 160337, "epoch": 1325} {"train_loss": -40.527809143066406, "global_step": 160338, "epoch": 1325} {"train_loss": -39.789459228515625, "global_step": 160339, "epoch": 1325} {"train_loss": -40.56904220581055, "global_step": 160340, "epoch": 1325} {"train_loss": -39.40981674194336, "global_step": 160341, "epoch": 1325} {"train_loss": -40.61776351928711, "global_step": 160342, "epoch": 1325} {"train_loss": -40.588287353515625, "global_step": 160343, "epoch": 1325} {"train_loss": -40.72235107421875, "global_step": 160344, "epoch": 1325} {"train_loss": -40.426822662353516, "global_step": 160345, "epoch": 1325} {"train_loss": -40.598419189453125, "global_step": 160346, "epoch": 1325} {"train_loss": -40.739723205566406, "global_step": 160347, "epoch": 1325} {"train_loss": -40.001285552978516, "global_step": 160348, "epoch": 1325} {"train_loss": -40.2706298828125, "global_step": 160349, "epoch": 1325} {"train_loss": -40.05884552001953, "global_step": 160350, "epoch": 1325} {"train_loss": -38.983455657958984, "global_step": 160351, "epoch": 1325} {"train_loss": -38.521968841552734, "global_step": 160352, "epoch": 1325} {"train_loss": -41.234954833984375, "global_step": 160353, "epoch": 1325} {"train_loss": -40.541259765625, "global_step": 160354, "epoch": 1325} {"train_loss": -39.556087493896484, "global_step": 160355, "epoch": 1325} {"train_loss": -38.01939392089844, "global_step": 160356, "epoch": 1325} {"train_loss": -38.66524124145508, "global_step": 160357, "epoch": 1325} {"train_loss": -39.84990310668945, "global_step": 160358, "epoch": 1325} {"train_loss": -40.420814514160156, "global_step": 160359, "epoch": 1325} {"train_loss": -40.080501556396484, "global_step": 160360, "epoch": 1325} {"train_loss": -40.42896270751953, "global_step": 160361, "epoch": 1325} {"train_loss": -40.513668060302734, "global_step": 160362, "epoch": 1325} {"train_loss": -40.52036666870117, "global_step": 160363, "epoch": 1325} {"train_loss": -41.021095275878906, "global_step": 160364, "epoch": 1325} {"train_loss": -40.6776123046875, "global_step": 160365, "epoch": 1325} {"train_loss": -40.88404083251953, "global_step": 160366, "epoch": 1325} {"train_loss": -39.80984115600586, "global_step": 160367, "epoch": 1325} {"train_loss": -40.55330276489258, "global_step": 160368, "epoch": 1325} {"train_loss": -40.434974670410156, "global_step": 160369, "epoch": 1325} {"train_loss": -39.7542724609375, "global_step": 160370, "epoch": 1325} {"train_loss": -40.42954635620117, "global_step": 160371, "epoch": 1325} {"train_loss": -40.76514434814453, "global_step": 160372, "epoch": 1325} {"train_loss": -40.26019287109375, "global_step": 160373, "epoch": 1325} {"train_loss": -37.46194076538086, "global_step": 160374, "epoch": 1325} {"train_loss": -37.112972259521484, "global_step": 160375, "epoch": 1325} {"train_loss": -37.309364318847656, "global_step": 160376, "epoch": 1325} {"train_loss": -39.59833526611328, "global_step": 160377, "epoch": 1325} {"train_loss": -39.53900146484375, "global_step": 160378, "epoch": 1325} {"train_loss": -39.0695915222168, "global_step": 160379, "epoch": 1325} {"train_loss": -36.583106994628906, "global_step": 160380, "epoch": 1325} {"train_loss": -36.38698959350586, "global_step": 160381, "epoch": 1325} {"train_loss": -38.28373336791992, "global_step": 160382, "epoch": 1325} {"train_loss": -38.01923370361328, "global_step": 160383, "epoch": 1325} {"train_loss": -35.73115921020508, "global_step": 160384, "epoch": 1325} {"train_loss": -36.043209075927734, "global_step": 160385, "epoch": 1325} {"train_loss": -38.35749435424805, "global_step": 160386, "epoch": 1325} {"train_loss": -35.271728515625, "global_step": 160387, "epoch": 1325} {"train_loss": -34.799076080322266, "global_step": 160388, "epoch": 1325} {"train_loss": -37.93941879272461, "global_step": 160389, "epoch": 1325} {"train_loss": -38.49863815307617, "global_step": 160390, "epoch": 1325} {"train_loss": -38.205501556396484, "global_step": 160391, "epoch": 1325} {"train_loss": -38.49481201171875, "global_step": 160392, "epoch": 1325} {"train_loss": -39.343631744384766, "global_step": 160393, "epoch": 1325} {"train_loss": -37.2325553894043, "global_step": 160394, "epoch": 1325} {"train_loss": -37.43941116333008, "global_step": 160395, "epoch": 1325} {"train_loss": -39.84725570678711, "global_step": 160396, "epoch": 1325} {"train_loss": -38.6575927734375, "global_step": 160397, "epoch": 1325} {"train_loss": -38.88399124145508, "global_step": 160398, "epoch": 1325} {"train_loss": -39.43108367919922, "global_step": 160399, "epoch": 1325} {"train_loss": -37.995201110839844, "global_step": 160400, "epoch": 1325} {"train_loss": -38.69838333129883, "global_step": 160401, "epoch": 1325} {"train_loss": -39.157344818115234, "global_step": 160402, "epoch": 1325} {"train_loss": -39.10773468017578, "global_step": 160403, "epoch": 1325} {"train_loss": -39.38778305053711, "global_step": 160404, "epoch": 1325} {"train_loss": -39.62063217163086, "global_step": 160405, "epoch": 1325} {"train_loss": -40.13532638549805, "global_step": 160406, "epoch": 1325} {"train_loss": -37.815467834472656, "global_step": 160407, "epoch": 1325} {"train_loss": -39.556396484375, "global_step": 160408, "epoch": 1325} {"train_loss": -40.24503707885742, "global_step": 160409, "epoch": 1325} {"train_loss": -39.26700973510742, "global_step": 160410, "epoch": 1325} {"train_loss": -40.0815544128418, "global_step": 160411, "epoch": 1325} {"train_loss": -40.97309112548828, "global_step": 160412, "epoch": 1325} {"train_loss": -40.15625762939453, "global_step": 160413, "epoch": 1325} {"train_loss": -40.611141204833984, "global_step": 160414, "epoch": 1325} {"train_loss": -40.14139938354492, "global_step": 160415, "epoch": 1325} {"train_loss": -40.4494743347168, "global_step": 160416, "epoch": 1325} {"train_loss": -39.459320068359375, "global_step": 160417, "epoch": 1325} {"train_loss": -40.37832260131836, "global_step": 160418, "epoch": 1325} {"train_loss": -40.43341827392578, "global_step": 160419, "epoch": 1325} {"train_loss": -39.89472198486328, "global_step": 160420, "epoch": 1325} {"train_loss": -40.0152702331543, "global_step": 160421, "epoch": 1325} {"train_loss": -40.39944076538086, "global_step": 160422, "epoch": 1325} {"train_loss": -40.225685119628906, "global_step": 160423, "epoch": 1325} {"train_loss": -40.62154006958008, "global_step": 160424, "epoch": 1325} {"train_loss": -40.6215934753418, "global_step": 160425, "epoch": 1325} {"train_loss": -40.69015121459961, "global_step": 160426, "epoch": 1325} {"train_loss": -40.54021072387695, "global_step": 160427, "epoch": 1325} {"train_loss": -40.57646942138672, "global_step": 160428, "epoch": 1325} {"train_loss": -40.96595001220703, "global_step": 160429, "epoch": 1325} {"train_loss": -40.99253463745117, "global_step": 160430, "epoch": 1325} {"train_loss": -40.976837158203125, "global_step": 160431, "epoch": 1325} {"train_loss": -41.06289291381836, "global_step": 160432, "epoch": 1325} {"train_loss": -41.19162368774414, "global_step": 160433, "epoch": 1325} {"train_loss": -41.08675765991211, "global_step": 160434, "epoch": 1325} {"train_loss": -41.227413177490234, "global_step": 160435, "epoch": 1325} {"train_loss": -41.03635787963867, "global_step": 160436, "epoch": 1325} {"train_loss": -40.99424362182617, "global_step": 160437, "epoch": 1325} {"train_loss": -41.27786636352539, "global_step": 160438, "epoch": 1325} {"train_loss": -41.063453674316406, "global_step": 160439, "epoch": 1325} {"train_loss": -41.581443786621094, "global_step": 160440, "epoch": 1325} {"train_loss": -41.45990753173828, "global_step": 160441, "epoch": 1325} {"train_loss": -41.597572326660156, "global_step": 160442, "epoch": 1325} {"train_loss": -41.29832077026367, "global_step": 160443, "epoch": 1325} {"train_loss": -40.98978805541992, "global_step": 160444, "epoch": 1325} {"train_loss": -39.7167237967499, "global_step": 160445, "epoch": 1325, "val_loss": 2464535.75} {"train_loss": -41.10038375854492, "global_step": 160446, "epoch": 1326} {"train_loss": -41.100406646728516, "global_step": 160447, "epoch": 1326} {"train_loss": -41.283748626708984, "global_step": 160448, "epoch": 1326} {"train_loss": -40.63178634643555, "global_step": 160449, "epoch": 1326} {"train_loss": -39.141387939453125, "global_step": 160450, "epoch": 1326} {"train_loss": -39.239959716796875, "global_step": 160451, "epoch": 1326} {"train_loss": -40.521881103515625, "global_step": 160452, "epoch": 1326} {"train_loss": -40.68534469604492, "global_step": 160453, "epoch": 1326} {"train_loss": -39.29273223876953, "global_step": 160454, "epoch": 1326} {"train_loss": -40.43767166137695, "global_step": 160455, "epoch": 1326} {"train_loss": -40.22676467895508, "global_step": 160456, "epoch": 1326} {"train_loss": -40.883480072021484, "global_step": 160457, "epoch": 1326} {"train_loss": -40.0307731628418, "global_step": 160458, "epoch": 1326} {"train_loss": -40.556793212890625, "global_step": 160459, "epoch": 1326} {"train_loss": -39.957855224609375, "global_step": 160460, "epoch": 1326} {"train_loss": -40.0264778137207, "global_step": 160461, "epoch": 1326} {"train_loss": -39.80316925048828, "global_step": 160462, "epoch": 1326} {"train_loss": -40.28353500366211, "global_step": 160463, "epoch": 1326} {"train_loss": -39.33470153808594, "global_step": 160464, "epoch": 1326} {"train_loss": -39.800960540771484, "global_step": 160465, "epoch": 1326} {"train_loss": -39.97003173828125, "global_step": 160466, "epoch": 1326} {"train_loss": -38.07241439819336, "global_step": 160467, "epoch": 1326} {"train_loss": -38.95235061645508, "global_step": 160468, "epoch": 1326} {"train_loss": -39.2727165222168, "global_step": 160469, "epoch": 1326} {"train_loss": -40.42739486694336, "global_step": 160470, "epoch": 1326} {"train_loss": -40.097900390625, "global_step": 160471, "epoch": 1326} {"train_loss": -37.07070541381836, "global_step": 160472, "epoch": 1326} {"train_loss": -37.52547073364258, "global_step": 160473, "epoch": 1326} {"train_loss": -39.03609848022461, "global_step": 160474, "epoch": 1326} {"train_loss": -39.018375396728516, "global_step": 160475, "epoch": 1326} {"train_loss": -41.01853561401367, "global_step": 160476, "epoch": 1326} {"train_loss": -37.38209915161133, "global_step": 160477, "epoch": 1326} {"train_loss": -38.10926055908203, "global_step": 160478, "epoch": 1326} {"train_loss": -39.9918327331543, "global_step": 160479, "epoch": 1326} {"train_loss": -37.40102005004883, "global_step": 160480, "epoch": 1326} {"train_loss": -39.212459564208984, "global_step": 160481, "epoch": 1326} {"train_loss": -39.50889205932617, "global_step": 160482, "epoch": 1326} {"train_loss": -37.49250411987305, "global_step": 160483, "epoch": 1326} {"train_loss": -40.05703353881836, "global_step": 160484, "epoch": 1326} {"train_loss": -37.90254592895508, "global_step": 160485, "epoch": 1326} {"train_loss": -40.73691940307617, "global_step": 160486, "epoch": 1326} {"train_loss": -38.99069595336914, "global_step": 160487, "epoch": 1326} {"train_loss": -36.68123245239258, "global_step": 160488, "epoch": 1326} {"train_loss": -38.56291580200195, "global_step": 160489, "epoch": 1326} {"train_loss": -37.7517204284668, "global_step": 160490, "epoch": 1326} {"train_loss": -40.09879684448242, "global_step": 160491, "epoch": 1326} {"train_loss": -36.657711029052734, "global_step": 160492, "epoch": 1326} {"train_loss": -36.6976203918457, "global_step": 160493, "epoch": 1326} {"train_loss": -39.83718490600586, "global_step": 160494, "epoch": 1326} {"train_loss": -38.01626205444336, "global_step": 160495, "epoch": 1326} {"train_loss": -38.30218505859375, "global_step": 160496, "epoch": 1326} {"train_loss": -39.156715393066406, "global_step": 160497, "epoch": 1326} {"train_loss": -39.11225509643555, "global_step": 160498, "epoch": 1326} {"train_loss": -38.09104537963867, "global_step": 160499, "epoch": 1326} {"train_loss": -40.105018615722656, "global_step": 160500, "epoch": 1326} {"train_loss": -38.306060791015625, "global_step": 160501, "epoch": 1326} {"train_loss": -40.55892562866211, "global_step": 160502, "epoch": 1326} {"train_loss": -38.15525817871094, "global_step": 160503, "epoch": 1326} {"train_loss": -38.9314079284668, "global_step": 160504, "epoch": 1326} {"train_loss": -40.175655364990234, "global_step": 160505, "epoch": 1326} {"train_loss": -39.141571044921875, "global_step": 160506, "epoch": 1326} {"train_loss": -39.97747802734375, "global_step": 160507, "epoch": 1326} {"train_loss": -39.635231018066406, "global_step": 160508, "epoch": 1326} {"train_loss": -38.72134017944336, "global_step": 160509, "epoch": 1326} {"train_loss": -40.774139404296875, "global_step": 160510, "epoch": 1326} {"train_loss": -39.10181427001953, "global_step": 160511, "epoch": 1326} {"train_loss": -40.283634185791016, "global_step": 160512, "epoch": 1326} {"train_loss": -38.259857177734375, "global_step": 160513, "epoch": 1326} {"train_loss": -40.352230072021484, "global_step": 160514, "epoch": 1326} {"train_loss": -39.6268196105957, "global_step": 160515, "epoch": 1326} {"train_loss": -40.04853439331055, "global_step": 160516, "epoch": 1326} {"train_loss": -40.05881118774414, "global_step": 160517, "epoch": 1326} {"train_loss": -40.234500885009766, "global_step": 160518, "epoch": 1326} {"train_loss": -40.64348220825195, "global_step": 160519, "epoch": 1326} {"train_loss": -39.711944580078125, "global_step": 160520, "epoch": 1326} {"train_loss": -39.580238342285156, "global_step": 160521, "epoch": 1326} {"train_loss": -39.72652053833008, "global_step": 160522, "epoch": 1326} {"train_loss": -39.663429260253906, "global_step": 160523, "epoch": 1326} {"train_loss": -40.29707717895508, "global_step": 160524, "epoch": 1326} {"train_loss": -39.16677474975586, "global_step": 160525, "epoch": 1326} {"train_loss": -40.60723876953125, "global_step": 160526, "epoch": 1326} {"train_loss": -40.067447662353516, "global_step": 160527, "epoch": 1326} {"train_loss": -39.30242919921875, "global_step": 160528, "epoch": 1326} {"train_loss": -40.42378234863281, "global_step": 160529, "epoch": 1326} {"train_loss": -39.29150390625, "global_step": 160530, "epoch": 1326} {"train_loss": -40.037654876708984, "global_step": 160531, "epoch": 1326} {"train_loss": -40.31218338012695, "global_step": 160532, "epoch": 1326} {"train_loss": -40.29315185546875, "global_step": 160533, "epoch": 1326} {"train_loss": -40.35633087158203, "global_step": 160534, "epoch": 1326} {"train_loss": -40.05752182006836, "global_step": 160535, "epoch": 1326} {"train_loss": -40.74188995361328, "global_step": 160536, "epoch": 1326} {"train_loss": -40.70302963256836, "global_step": 160537, "epoch": 1326} {"train_loss": -40.69758987426758, "global_step": 160538, "epoch": 1326} {"train_loss": -40.931182861328125, "global_step": 160539, "epoch": 1326} {"train_loss": -40.64292526245117, "global_step": 160540, "epoch": 1326} {"train_loss": -41.02748489379883, "global_step": 160541, "epoch": 1326} {"train_loss": -41.0976448059082, "global_step": 160542, "epoch": 1326} {"train_loss": -40.983154296875, "global_step": 160543, "epoch": 1326} {"train_loss": -41.120296478271484, "global_step": 160544, "epoch": 1326} {"train_loss": -41.58565902709961, "global_step": 160545, "epoch": 1326} {"train_loss": -41.086181640625, "global_step": 160546, "epoch": 1326} {"train_loss": -40.67707061767578, "global_step": 160547, "epoch": 1326} {"train_loss": -41.179603576660156, "global_step": 160548, "epoch": 1326} {"train_loss": -41.37775802612305, "global_step": 160549, "epoch": 1326} {"train_loss": -41.150081634521484, "global_step": 160550, "epoch": 1326} {"train_loss": -41.24015426635742, "global_step": 160551, "epoch": 1326} {"train_loss": -41.34767532348633, "global_step": 160552, "epoch": 1326} {"train_loss": -41.2249755859375, "global_step": 160553, "epoch": 1326} {"train_loss": -41.715576171875, "global_step": 160554, "epoch": 1326} {"train_loss": -41.514862060546875, "global_step": 160555, "epoch": 1326} {"train_loss": -41.358394622802734, "global_step": 160556, "epoch": 1326} {"train_loss": -41.80975341796875, "global_step": 160557, "epoch": 1326} {"train_loss": -41.3383674621582, "global_step": 160558, "epoch": 1326} {"train_loss": -41.03508377075195, "global_step": 160559, "epoch": 1326} {"train_loss": -41.306697845458984, "global_step": 160560, "epoch": 1326} {"train_loss": -41.01463317871094, "global_step": 160561, "epoch": 1326} {"train_loss": -41.71049499511719, "global_step": 160562, "epoch": 1326} {"train_loss": -41.350589752197266, "global_step": 160563, "epoch": 1326} {"train_loss": -40.8046875, "global_step": 160564, "epoch": 1326} {"train_loss": -40.76266098022461, "global_step": 160565, "epoch": 1326} {"train_loss": -39.90391543679986, "global_step": 160566, "epoch": 1326, "val_loss": 2494954.0} {"train_loss": -41.44783401489258, "global_step": 160567, "epoch": 1327} {"train_loss": -41.372406005859375, "global_step": 160568, "epoch": 1327} {"train_loss": -41.36887741088867, "global_step": 160569, "epoch": 1327} {"train_loss": -40.68705368041992, "global_step": 160570, "epoch": 1327} {"train_loss": -42.18391418457031, "global_step": 160571, "epoch": 1327} {"train_loss": -41.78329086303711, "global_step": 160572, "epoch": 1327} {"train_loss": -41.051063537597656, "global_step": 160573, "epoch": 1327} {"train_loss": -41.324337005615234, "global_step": 160574, "epoch": 1327} {"train_loss": -41.552490234375, "global_step": 160575, "epoch": 1327} {"train_loss": -41.8695182800293, "global_step": 160576, "epoch": 1327} {"train_loss": -41.70917892456055, "global_step": 160577, "epoch": 1327} {"train_loss": -41.1352424621582, "global_step": 160578, "epoch": 1327} {"train_loss": -41.6099739074707, "global_step": 160579, "epoch": 1327} {"train_loss": -40.892303466796875, "global_step": 160580, "epoch": 1327} {"train_loss": -40.59735107421875, "global_step": 160581, "epoch": 1327} {"train_loss": -40.781429290771484, "global_step": 160582, "epoch": 1327} {"train_loss": -41.04677963256836, "global_step": 160583, "epoch": 1327} {"train_loss": -40.331783294677734, "global_step": 160584, "epoch": 1327} {"train_loss": -40.8624267578125, "global_step": 160585, "epoch": 1327} {"train_loss": -39.70159149169922, "global_step": 160586, "epoch": 1327} {"train_loss": -40.6413688659668, "global_step": 160587, "epoch": 1327} {"train_loss": -40.451229095458984, "global_step": 160588, "epoch": 1327} {"train_loss": -40.139156341552734, "global_step": 160589, "epoch": 1327} {"train_loss": -41.326717376708984, "global_step": 160590, "epoch": 1327} {"train_loss": -41.06161117553711, "global_step": 160591, "epoch": 1327} {"train_loss": -40.00156784057617, "global_step": 160592, "epoch": 1327} {"train_loss": -40.89860153198242, "global_step": 160593, "epoch": 1327} {"train_loss": -36.5224723815918, "global_step": 160594, "epoch": 1327} {"train_loss": -39.458316802978516, "global_step": 160595, "epoch": 1327} {"train_loss": -38.829166412353516, "global_step": 160596, "epoch": 1327} {"train_loss": -38.620216369628906, "global_step": 160597, "epoch": 1327} {"train_loss": -40.046539306640625, "global_step": 160598, "epoch": 1327} {"train_loss": -39.280635833740234, "global_step": 160599, "epoch": 1327} {"train_loss": -40.932586669921875, "global_step": 160600, "epoch": 1327} {"train_loss": -38.9911994934082, "global_step": 160601, "epoch": 1327} {"train_loss": -40.00156784057617, "global_step": 160602, "epoch": 1327} {"train_loss": -38.32052230834961, "global_step": 160603, "epoch": 1327} {"train_loss": -39.012359619140625, "global_step": 160604, "epoch": 1327} {"train_loss": -40.75850296020508, "global_step": 160605, "epoch": 1327} {"train_loss": -38.184303283691406, "global_step": 160606, "epoch": 1327} {"train_loss": -40.07719802856445, "global_step": 160607, "epoch": 1327} {"train_loss": -40.32622146606445, "global_step": 160608, "epoch": 1327} {"train_loss": -39.59016036987305, "global_step": 160609, "epoch": 1327} {"train_loss": -40.197357177734375, "global_step": 160610, "epoch": 1327} {"train_loss": -39.94260787963867, "global_step": 160611, "epoch": 1327} {"train_loss": -40.090633392333984, "global_step": 160612, "epoch": 1327} {"train_loss": -39.84836959838867, "global_step": 160613, "epoch": 1327} {"train_loss": -39.359344482421875, "global_step": 160614, "epoch": 1327} {"train_loss": -40.75110626220703, "global_step": 160615, "epoch": 1327} {"train_loss": -41.2051887512207, "global_step": 160616, "epoch": 1327} {"train_loss": -40.44319534301758, "global_step": 160617, "epoch": 1327} {"train_loss": -41.039710998535156, "global_step": 160618, "epoch": 1327} {"train_loss": -39.95771789550781, "global_step": 160619, "epoch": 1327} {"train_loss": -40.68684005737305, "global_step": 160620, "epoch": 1327} {"train_loss": -40.80963897705078, "global_step": 160621, "epoch": 1327} {"train_loss": -40.56367111206055, "global_step": 160622, "epoch": 1327} {"train_loss": -40.952754974365234, "global_step": 160623, "epoch": 1327} {"train_loss": -40.1878776550293, "global_step": 160624, "epoch": 1327} {"train_loss": -39.50366973876953, "global_step": 160625, "epoch": 1327} {"train_loss": -40.88887023925781, "global_step": 160626, "epoch": 1327} {"train_loss": -39.7371940612793, "global_step": 160627, "epoch": 1327} {"train_loss": -40.82427978515625, "global_step": 160628, "epoch": 1327} {"train_loss": -40.85288619995117, "global_step": 160629, "epoch": 1327} {"train_loss": -41.14152145385742, "global_step": 160630, "epoch": 1327} {"train_loss": -40.56374740600586, "global_step": 160631, "epoch": 1327} {"train_loss": -40.02976989746094, "global_step": 160632, "epoch": 1327} {"train_loss": -40.902870178222656, "global_step": 160633, "epoch": 1327} {"train_loss": -41.02384948730469, "global_step": 160634, "epoch": 1327} {"train_loss": -40.65726852416992, "global_step": 160635, "epoch": 1327} {"train_loss": -41.03336715698242, "global_step": 160636, "epoch": 1327} {"train_loss": -41.39995574951172, "global_step": 160637, "epoch": 1327} {"train_loss": -40.49650955200195, "global_step": 160638, "epoch": 1327} {"train_loss": -41.064117431640625, "global_step": 160639, "epoch": 1327} {"train_loss": -41.68434143066406, "global_step": 160640, "epoch": 1327} {"train_loss": -40.57855224609375, "global_step": 160641, "epoch": 1327} {"train_loss": -39.994224548339844, "global_step": 160642, "epoch": 1327} {"train_loss": -39.620845794677734, "global_step": 160643, "epoch": 1327} {"train_loss": -40.6502685546875, "global_step": 160644, "epoch": 1327} {"train_loss": -40.77309799194336, "global_step": 160645, "epoch": 1327} {"train_loss": -39.912227630615234, "global_step": 160646, "epoch": 1327} {"train_loss": -39.875186920166016, "global_step": 160647, "epoch": 1327} {"train_loss": -39.90837478637695, "global_step": 160648, "epoch": 1327} {"train_loss": -39.43808364868164, "global_step": 160649, "epoch": 1327} {"train_loss": -40.862552642822266, "global_step": 160650, "epoch": 1327} {"train_loss": -40.96352767944336, "global_step": 160651, "epoch": 1327} {"train_loss": -40.726253509521484, "global_step": 160652, "epoch": 1327} {"train_loss": -40.98691940307617, "global_step": 160653, "epoch": 1327} {"train_loss": -41.56598663330078, "global_step": 160654, "epoch": 1327} {"train_loss": -40.69208908081055, "global_step": 160655, "epoch": 1327} {"train_loss": -41.23069381713867, "global_step": 160656, "epoch": 1327} {"train_loss": -41.57966995239258, "global_step": 160657, "epoch": 1327} {"train_loss": -40.712890625, "global_step": 160658, "epoch": 1327} {"train_loss": -40.94184112548828, "global_step": 160659, "epoch": 1327} {"train_loss": -41.262996673583984, "global_step": 160660, "epoch": 1327} {"train_loss": -41.69217300415039, "global_step": 160661, "epoch": 1327} {"train_loss": -41.876895904541016, "global_step": 160662, "epoch": 1327} {"train_loss": -41.472389221191406, "global_step": 160663, "epoch": 1327} {"train_loss": -41.575069427490234, "global_step": 160664, "epoch": 1327} {"train_loss": -41.86735916137695, "global_step": 160665, "epoch": 1327} {"train_loss": -41.464534759521484, "global_step": 160666, "epoch": 1327} {"train_loss": -41.28091049194336, "global_step": 160667, "epoch": 1327} {"train_loss": -42.01654815673828, "global_step": 160668, "epoch": 1327} {"train_loss": -41.488075256347656, "global_step": 160669, "epoch": 1327} {"train_loss": -41.46494674682617, "global_step": 160670, "epoch": 1327} {"train_loss": -41.591102600097656, "global_step": 160671, "epoch": 1327} {"train_loss": -41.47848892211914, "global_step": 160672, "epoch": 1327} {"train_loss": -41.4664192199707, "global_step": 160673, "epoch": 1327} {"train_loss": -41.56748580932617, "global_step": 160674, "epoch": 1327} {"train_loss": -41.86183547973633, "global_step": 160675, "epoch": 1327} {"train_loss": -40.6824951171875, "global_step": 160676, "epoch": 1327} {"train_loss": -41.27884292602539, "global_step": 160677, "epoch": 1327} {"train_loss": -41.81113052368164, "global_step": 160678, "epoch": 1327} {"train_loss": -41.202613830566406, "global_step": 160679, "epoch": 1327} {"train_loss": -38.41221237182617, "global_step": 160680, "epoch": 1327} {"train_loss": -38.160579681396484, "global_step": 160681, "epoch": 1327} {"train_loss": -40.19672775268555, "global_step": 160682, "epoch": 1327} {"train_loss": -41.2760124206543, "global_step": 160683, "epoch": 1327} {"train_loss": -40.93024826049805, "global_step": 160684, "epoch": 1327} {"train_loss": -39.87157440185547, "global_step": 160685, "epoch": 1327} {"train_loss": -40.32243728637695, "global_step": 160686, "epoch": 1327} {"train_loss": -40.629936848790194, "global_step": 160687, "epoch": 1327, "val_loss": 2409006.0} {"train_loss": -38.657501220703125, "global_step": 160688, "epoch": 1328} {"train_loss": -39.2183723449707, "global_step": 160689, "epoch": 1328} {"train_loss": -41.07509994506836, "global_step": 160690, "epoch": 1328} {"train_loss": -41.47572708129883, "global_step": 160691, "epoch": 1328} {"train_loss": -39.73183059692383, "global_step": 160692, "epoch": 1328} {"train_loss": -40.125099182128906, "global_step": 160693, "epoch": 1328} {"train_loss": -41.37281799316406, "global_step": 160694, "epoch": 1328} {"train_loss": -39.587501525878906, "global_step": 160695, "epoch": 1328} {"train_loss": -38.04641342163086, "global_step": 160696, "epoch": 1328} {"train_loss": -40.05303955078125, "global_step": 160697, "epoch": 1328} {"train_loss": -40.15595245361328, "global_step": 160698, "epoch": 1328} {"train_loss": -40.17985534667969, "global_step": 160699, "epoch": 1328} {"train_loss": -39.070899963378906, "global_step": 160700, "epoch": 1328} {"train_loss": -34.803688049316406, "global_step": 160701, "epoch": 1328} {"train_loss": -30.088476181030273, "global_step": 160702, "epoch": 1328} {"train_loss": -30.372039794921875, "global_step": 160703, "epoch": 1328} {"train_loss": -34.02931594848633, "global_step": 160704, "epoch": 1328} {"train_loss": -40.24260330200195, "global_step": 160705, "epoch": 1328} {"train_loss": -39.322853088378906, "global_step": 160706, "epoch": 1328} {"train_loss": -38.35239791870117, "global_step": 160707, "epoch": 1328} {"train_loss": -40.65328598022461, "global_step": 160708, "epoch": 1328} {"train_loss": -38.1330680847168, "global_step": 160709, "epoch": 1328} {"train_loss": -39.30195236206055, "global_step": 160710, "epoch": 1328} {"train_loss": -39.82355880737305, "global_step": 160711, "epoch": 1328} {"train_loss": -37.9626350402832, "global_step": 160712, "epoch": 1328} {"train_loss": -39.48401641845703, "global_step": 160713, "epoch": 1328} {"train_loss": -37.14316940307617, "global_step": 160714, "epoch": 1328} {"train_loss": -40.69512939453125, "global_step": 160715, "epoch": 1328} {"train_loss": -36.779293060302734, "global_step": 160716, "epoch": 1328} {"train_loss": -39.55424880981445, "global_step": 160717, "epoch": 1328} {"train_loss": -39.170475006103516, "global_step": 160718, "epoch": 1328} {"train_loss": -38.868186950683594, "global_step": 160719, "epoch": 1328} {"train_loss": -38.90299987792969, "global_step": 160720, "epoch": 1328} {"train_loss": -38.84881591796875, "global_step": 160721, "epoch": 1328} {"train_loss": -38.07606887817383, "global_step": 160722, "epoch": 1328} {"train_loss": -39.893035888671875, "global_step": 160723, "epoch": 1328} {"train_loss": -39.53137969970703, "global_step": 160724, "epoch": 1328} {"train_loss": -40.4547233581543, "global_step": 160725, "epoch": 1328} {"train_loss": -39.108856201171875, "global_step": 160726, "epoch": 1328} {"train_loss": -40.63213348388672, "global_step": 160727, "epoch": 1328} {"train_loss": -38.60256576538086, "global_step": 160728, "epoch": 1328} {"train_loss": -40.298431396484375, "global_step": 160729, "epoch": 1328} {"train_loss": -39.45795822143555, "global_step": 160730, "epoch": 1328} {"train_loss": -39.75344467163086, "global_step": 160731, "epoch": 1328} {"train_loss": -40.15322494506836, "global_step": 160732, "epoch": 1328} {"train_loss": -39.97759246826172, "global_step": 160733, "epoch": 1328} {"train_loss": -40.92356491088867, "global_step": 160734, "epoch": 1328} {"train_loss": -40.997493743896484, "global_step": 160735, "epoch": 1328} {"train_loss": -40.546661376953125, "global_step": 160736, "epoch": 1328} {"train_loss": -40.491817474365234, "global_step": 160737, "epoch": 1328} {"train_loss": -40.460628509521484, "global_step": 160738, "epoch": 1328} {"train_loss": -41.1876106262207, "global_step": 160739, "epoch": 1328} {"train_loss": -40.96128463745117, "global_step": 160740, "epoch": 1328} {"train_loss": -41.30048751831055, "global_step": 160741, "epoch": 1328} {"train_loss": -41.47597885131836, "global_step": 160742, "epoch": 1328} {"train_loss": -40.70536422729492, "global_step": 160743, "epoch": 1328} {"train_loss": -41.25588607788086, "global_step": 160744, "epoch": 1328} {"train_loss": -41.266788482666016, "global_step": 160745, "epoch": 1328} {"train_loss": -41.36901092529297, "global_step": 160746, "epoch": 1328} {"train_loss": -41.23843765258789, "global_step": 160747, "epoch": 1328} {"train_loss": -41.94255828857422, "global_step": 160748, "epoch": 1328} {"train_loss": -41.201904296875, "global_step": 160749, "epoch": 1328} {"train_loss": -41.224239349365234, "global_step": 160750, "epoch": 1328} {"train_loss": -41.41099166870117, "global_step": 160751, "epoch": 1328} {"train_loss": -41.44503402709961, "global_step": 160752, "epoch": 1328} {"train_loss": -41.4058952331543, "global_step": 160753, "epoch": 1328} {"train_loss": -41.97585678100586, "global_step": 160754, "epoch": 1328} {"train_loss": -41.22414016723633, "global_step": 160755, "epoch": 1328} {"train_loss": -41.653621673583984, "global_step": 160756, "epoch": 1328} {"train_loss": -41.35334777832031, "global_step": 160757, "epoch": 1328} {"train_loss": -41.309810638427734, "global_step": 160758, "epoch": 1328} {"train_loss": -41.62173080444336, "global_step": 160759, "epoch": 1328} {"train_loss": -41.74037551879883, "global_step": 160760, "epoch": 1328} {"train_loss": -41.748565673828125, "global_step": 160761, "epoch": 1328} {"train_loss": -41.19352340698242, "global_step": 160762, "epoch": 1328} {"train_loss": -41.55546951293945, "global_step": 160763, "epoch": 1328} {"train_loss": -42.0551872253418, "global_step": 160764, "epoch": 1328} {"train_loss": -41.31877517700195, "global_step": 160765, "epoch": 1328} {"train_loss": -41.487300872802734, "global_step": 160766, "epoch": 1328} {"train_loss": -42.07282638549805, "global_step": 160767, "epoch": 1328} {"train_loss": -41.857303619384766, "global_step": 160768, "epoch": 1328} {"train_loss": -41.73031234741211, "global_step": 160769, "epoch": 1328} {"train_loss": -41.76975631713867, "global_step": 160770, "epoch": 1328} {"train_loss": -41.90421676635742, "global_step": 160771, "epoch": 1328} {"train_loss": -41.41984176635742, "global_step": 160772, "epoch": 1328} {"train_loss": -41.37544631958008, "global_step": 160773, "epoch": 1328} {"train_loss": -41.202144622802734, "global_step": 160774, "epoch": 1328} {"train_loss": -41.216583251953125, "global_step": 160775, "epoch": 1328} {"train_loss": -41.178218841552734, "global_step": 160776, "epoch": 1328} {"train_loss": -42.235713958740234, "global_step": 160777, "epoch": 1328} {"train_loss": -41.725067138671875, "global_step": 160778, "epoch": 1328} {"train_loss": -41.38509750366211, "global_step": 160779, "epoch": 1328} {"train_loss": -41.61940383911133, "global_step": 160780, "epoch": 1328} {"train_loss": -40.70327377319336, "global_step": 160781, "epoch": 1328} {"train_loss": -40.83927536010742, "global_step": 160782, "epoch": 1328} {"train_loss": -41.13984298706055, "global_step": 160783, "epoch": 1328} {"train_loss": -41.5145378112793, "global_step": 160784, "epoch": 1328} {"train_loss": -41.42243957519531, "global_step": 160785, "epoch": 1328} {"train_loss": -39.97005844116211, "global_step": 160786, "epoch": 1328} {"train_loss": -38.76234817504883, "global_step": 160787, "epoch": 1328} {"train_loss": -37.2830696105957, "global_step": 160788, "epoch": 1328} {"train_loss": -38.67208480834961, "global_step": 160789, "epoch": 1328} {"train_loss": -41.02796173095703, "global_step": 160790, "epoch": 1328} {"train_loss": -40.24747848510742, "global_step": 160791, "epoch": 1328} {"train_loss": -36.67643356323242, "global_step": 160792, "epoch": 1328} {"train_loss": -38.677703857421875, "global_step": 160793, "epoch": 1328} {"train_loss": -40.5766716003418, "global_step": 160794, "epoch": 1328} {"train_loss": -38.303768157958984, "global_step": 160795, "epoch": 1328} {"train_loss": -39.89484786987305, "global_step": 160796, "epoch": 1328} {"train_loss": -39.876808166503906, "global_step": 160797, "epoch": 1328} {"train_loss": -38.919822692871094, "global_step": 160798, "epoch": 1328} {"train_loss": -37.590938568115234, "global_step": 160799, "epoch": 1328} {"train_loss": -39.76278305053711, "global_step": 160800, "epoch": 1328} {"train_loss": -38.920284271240234, "global_step": 160801, "epoch": 1328} {"train_loss": -38.3864631652832, "global_step": 160802, "epoch": 1328} {"train_loss": -40.008514404296875, "global_step": 160803, "epoch": 1328} {"train_loss": -37.658607482910156, "global_step": 160804, "epoch": 1328} {"train_loss": -40.12200927734375, "global_step": 160805, "epoch": 1328} {"train_loss": -38.3828125, "global_step": 160806, "epoch": 1328} {"train_loss": -40.47158432006836, "global_step": 160807, "epoch": 1328} {"train_loss": -39.98374436118386, "global_step": 160808, "epoch": 1328, "val_loss": 2382099.25} {"train_loss": -39.75516891479492, "global_step": 160809, "epoch": 1329} {"train_loss": -40.25141143798828, "global_step": 160810, "epoch": 1329} {"train_loss": -39.235408782958984, "global_step": 160811, "epoch": 1329} {"train_loss": -41.16021728515625, "global_step": 160812, "epoch": 1329} {"train_loss": -39.16231918334961, "global_step": 160813, "epoch": 1329} {"train_loss": -40.832454681396484, "global_step": 160814, "epoch": 1329} {"train_loss": -39.027626037597656, "global_step": 160815, "epoch": 1329} {"train_loss": -40.39406967163086, "global_step": 160816, "epoch": 1329} {"train_loss": -38.046051025390625, "global_step": 160817, "epoch": 1329} {"train_loss": -25.77093505859375, "global_step": 160818, "epoch": 1329} {"train_loss": -33.631378173828125, "global_step": 160819, "epoch": 1329} {"train_loss": -39.67367935180664, "global_step": 160820, "epoch": 1329} {"train_loss": -33.44422149658203, "global_step": 160821, "epoch": 1329} {"train_loss": -34.47677230834961, "global_step": 160822, "epoch": 1329} {"train_loss": -18.430038452148438, "global_step": 160823, "epoch": 1329} {"train_loss": -29.388471603393555, "global_step": 160824, "epoch": 1329} {"train_loss": -30.37991714477539, "global_step": 160825, "epoch": 1329} {"train_loss": -31.44113540649414, "global_step": 160826, "epoch": 1329} {"train_loss": -22.560270309448242, "global_step": 160827, "epoch": 1329} {"train_loss": -31.820371627807617, "global_step": 160828, "epoch": 1329} {"train_loss": -30.9847469329834, "global_step": 160829, "epoch": 1329} {"train_loss": -22.872861862182617, "global_step": 160830, "epoch": 1329} {"train_loss": -23.288257598876953, "global_step": 160831, "epoch": 1329} {"train_loss": -20.241735458374023, "global_step": 160832, "epoch": 1329} {"train_loss": -33.86023712158203, "global_step": 160833, "epoch": 1329} {"train_loss": -33.417476654052734, "global_step": 160834, "epoch": 1329} {"train_loss": -29.923431396484375, "global_step": 160835, "epoch": 1329} {"train_loss": -25.800561904907227, "global_step": 160836, "epoch": 1329} {"train_loss": -30.015668869018555, "global_step": 160837, "epoch": 1329} {"train_loss": -30.14092445373535, "global_step": 160838, "epoch": 1329} {"train_loss": -31.8659610748291, "global_step": 160839, "epoch": 1329} {"train_loss": -28.59144401550293, "global_step": 160840, "epoch": 1329} {"train_loss": -31.931842803955078, "global_step": 160841, "epoch": 1329} {"train_loss": -34.563045501708984, "global_step": 160842, "epoch": 1329} {"train_loss": -35.7540168762207, "global_step": 160843, "epoch": 1329} {"train_loss": -31.999059677124023, "global_step": 160844, "epoch": 1329} {"train_loss": -32.92008972167969, "global_step": 160845, "epoch": 1329} {"train_loss": -34.59885787963867, "global_step": 160846, "epoch": 1329} {"train_loss": -33.340450286865234, "global_step": 160847, "epoch": 1329} {"train_loss": -36.619136810302734, "global_step": 160848, "epoch": 1329} {"train_loss": -35.289573669433594, "global_step": 160849, "epoch": 1329} {"train_loss": -32.47140121459961, "global_step": 160850, "epoch": 1329} {"train_loss": -35.06056213378906, "global_step": 160851, "epoch": 1329} {"train_loss": -34.09186935424805, "global_step": 160852, "epoch": 1329} {"train_loss": -34.70697021484375, "global_step": 160853, "epoch": 1329} {"train_loss": -34.98639678955078, "global_step": 160854, "epoch": 1329} {"train_loss": -35.98537826538086, "global_step": 160855, "epoch": 1329} {"train_loss": -36.41133499145508, "global_step": 160856, "epoch": 1329} {"train_loss": -32.97237014770508, "global_step": 160857, "epoch": 1329} {"train_loss": -35.94623947143555, "global_step": 160858, "epoch": 1329} {"train_loss": -37.29170608520508, "global_step": 160859, "epoch": 1329} {"train_loss": -35.864253997802734, "global_step": 160860, "epoch": 1329} {"train_loss": -35.98054122924805, "global_step": 160861, "epoch": 1329} {"train_loss": -36.526153564453125, "global_step": 160862, "epoch": 1329} {"train_loss": -36.50412368774414, "global_step": 160863, "epoch": 1329} {"train_loss": -36.713539123535156, "global_step": 160864, "epoch": 1329} {"train_loss": -36.0471305847168, "global_step": 160865, "epoch": 1329} {"train_loss": -37.136714935302734, "global_step": 160866, "epoch": 1329} {"train_loss": -37.2661247253418, "global_step": 160867, "epoch": 1329} {"train_loss": -35.778533935546875, "global_step": 160868, "epoch": 1329} {"train_loss": -36.46688461303711, "global_step": 160869, "epoch": 1329} {"train_loss": -36.80430603027344, "global_step": 160870, "epoch": 1329} {"train_loss": -37.2252197265625, "global_step": 160871, "epoch": 1329} {"train_loss": -37.48049545288086, "global_step": 160872, "epoch": 1329} {"train_loss": -37.591426849365234, "global_step": 160873, "epoch": 1329} {"train_loss": -37.3829460144043, "global_step": 160874, "epoch": 1329} {"train_loss": -37.55374526977539, "global_step": 160875, "epoch": 1329} {"train_loss": -38.07094955444336, "global_step": 160876, "epoch": 1329} {"train_loss": -36.81282424926758, "global_step": 160877, "epoch": 1329} {"train_loss": -37.64828109741211, "global_step": 160878, "epoch": 1329} {"train_loss": -37.49286651611328, "global_step": 160879, "epoch": 1329} {"train_loss": -37.74728012084961, "global_step": 160880, "epoch": 1329} {"train_loss": -37.60837173461914, "global_step": 160881, "epoch": 1329} {"train_loss": -37.87329864501953, "global_step": 160882, "epoch": 1329} {"train_loss": -36.94525909423828, "global_step": 160883, "epoch": 1329} {"train_loss": -38.38246154785156, "global_step": 160884, "epoch": 1329} {"train_loss": -37.80111312866211, "global_step": 160885, "epoch": 1329} {"train_loss": -38.10793685913086, "global_step": 160886, "epoch": 1329} {"train_loss": -37.93572998046875, "global_step": 160887, "epoch": 1329} {"train_loss": -37.835872650146484, "global_step": 160888, "epoch": 1329} {"train_loss": -37.776092529296875, "global_step": 160889, "epoch": 1329} {"train_loss": -38.39402389526367, "global_step": 160890, "epoch": 1329} {"train_loss": -38.0865478515625, "global_step": 160891, "epoch": 1329} {"train_loss": -38.14655685424805, "global_step": 160892, "epoch": 1329} {"train_loss": -38.33883285522461, "global_step": 160893, "epoch": 1329} {"train_loss": -38.32209777832031, "global_step": 160894, "epoch": 1329} {"train_loss": -38.220977783203125, "global_step": 160895, "epoch": 1329} {"train_loss": -38.83664321899414, "global_step": 160896, "epoch": 1329} {"train_loss": -38.571136474609375, "global_step": 160897, "epoch": 1329} {"train_loss": -38.51459884643555, "global_step": 160898, "epoch": 1329} {"train_loss": -38.54813766479492, "global_step": 160899, "epoch": 1329} {"train_loss": -38.6008415222168, "global_step": 160900, "epoch": 1329} {"train_loss": -38.887237548828125, "global_step": 160901, "epoch": 1329} {"train_loss": -38.64379119873047, "global_step": 160902, "epoch": 1329} {"train_loss": -37.782344818115234, "global_step": 160903, "epoch": 1329} {"train_loss": -37.88227462768555, "global_step": 160904, "epoch": 1329} {"train_loss": -39.21271514892578, "global_step": 160905, "epoch": 1329} {"train_loss": -38.66766357421875, "global_step": 160906, "epoch": 1329} {"train_loss": -39.29441452026367, "global_step": 160907, "epoch": 1329} {"train_loss": -39.39870834350586, "global_step": 160908, "epoch": 1329} {"train_loss": -38.97378158569336, "global_step": 160909, "epoch": 1329} {"train_loss": -38.99043273925781, "global_step": 160910, "epoch": 1329} {"train_loss": -39.15473175048828, "global_step": 160911, "epoch": 1329} {"train_loss": -39.34843826293945, "global_step": 160912, "epoch": 1329} {"train_loss": -39.51552963256836, "global_step": 160913, "epoch": 1329} {"train_loss": -38.90579605102539, "global_step": 160914, "epoch": 1329} {"train_loss": -39.02842712402344, "global_step": 160915, "epoch": 1329} {"train_loss": -39.29936599731445, "global_step": 160916, "epoch": 1329} {"train_loss": -38.76570510864258, "global_step": 160917, "epoch": 1329} {"train_loss": -39.64306640625, "global_step": 160918, "epoch": 1329} {"train_loss": -39.437129974365234, "global_step": 160919, "epoch": 1329} {"train_loss": -39.81498718261719, "global_step": 160920, "epoch": 1329} {"train_loss": -38.92330551147461, "global_step": 160921, "epoch": 1329} {"train_loss": -39.49346923828125, "global_step": 160922, "epoch": 1329} {"train_loss": -39.02418899536133, "global_step": 160923, "epoch": 1329} {"train_loss": -39.160152435302734, "global_step": 160924, "epoch": 1329} {"train_loss": -39.62876510620117, "global_step": 160925, "epoch": 1329} {"train_loss": -39.57086944580078, "global_step": 160926, "epoch": 1329} {"train_loss": -39.79984664916992, "global_step": 160927, "epoch": 1329} {"train_loss": -40.05253219604492, "global_step": 160928, "epoch": 1329} {"train_loss": -36.051104648054135, "global_step": 160929, "epoch": 1329, "val_loss": 2410999.0} {"train_loss": -39.472564697265625, "global_step": 160930, "epoch": 1330} {"train_loss": -39.762935638427734, "global_step": 160931, "epoch": 1330} {"train_loss": -39.6591911315918, "global_step": 160932, "epoch": 1330} {"train_loss": -40.53578567504883, "global_step": 160933, "epoch": 1330} {"train_loss": -40.05531692504883, "global_step": 160934, "epoch": 1330} {"train_loss": -39.76528549194336, "global_step": 160935, "epoch": 1330} {"train_loss": -40.00407028198242, "global_step": 160936, "epoch": 1330} {"train_loss": -40.331947326660156, "global_step": 160937, "epoch": 1330} {"train_loss": -39.72846221923828, "global_step": 160938, "epoch": 1330} {"train_loss": -40.408546447753906, "global_step": 160939, "epoch": 1330} {"train_loss": -40.01816940307617, "global_step": 160940, "epoch": 1330} {"train_loss": -40.23418426513672, "global_step": 160941, "epoch": 1330} {"train_loss": -39.842769622802734, "global_step": 160942, "epoch": 1330} {"train_loss": -40.12582015991211, "global_step": 160943, "epoch": 1330} {"train_loss": -40.184608459472656, "global_step": 160944, "epoch": 1330} {"train_loss": -40.66508102416992, "global_step": 160945, "epoch": 1330} {"train_loss": -40.24580001831055, "global_step": 160946, "epoch": 1330} {"train_loss": -39.927711486816406, "global_step": 160947, "epoch": 1330} {"train_loss": -40.39634704589844, "global_step": 160948, "epoch": 1330} {"train_loss": -39.951568603515625, "global_step": 160949, "epoch": 1330} {"train_loss": -40.248199462890625, "global_step": 160950, "epoch": 1330} {"train_loss": -40.498023986816406, "global_step": 160951, "epoch": 1330} {"train_loss": -40.58904266357422, "global_step": 160952, "epoch": 1330} {"train_loss": -40.0939826965332, "global_step": 160953, "epoch": 1330} {"train_loss": -40.562904357910156, "global_step": 160954, "epoch": 1330} {"train_loss": -40.53506088256836, "global_step": 160955, "epoch": 1330} {"train_loss": -40.45664596557617, "global_step": 160956, "epoch": 1330} {"train_loss": -39.70506286621094, "global_step": 160957, "epoch": 1330} {"train_loss": -40.821922302246094, "global_step": 160958, "epoch": 1330} {"train_loss": -39.949066162109375, "global_step": 160959, "epoch": 1330} {"train_loss": -40.45644760131836, "global_step": 160960, "epoch": 1330} {"train_loss": -40.56309127807617, "global_step": 160961, "epoch": 1330} {"train_loss": -40.36543273925781, "global_step": 160962, "epoch": 1330} {"train_loss": -40.834354400634766, "global_step": 160963, "epoch": 1330} {"train_loss": -40.60490036010742, "global_step": 160964, "epoch": 1330} {"train_loss": -40.64085388183594, "global_step": 160965, "epoch": 1330} {"train_loss": -39.555660247802734, "global_step": 160966, "epoch": 1330} {"train_loss": -40.689666748046875, "global_step": 160967, "epoch": 1330} {"train_loss": -40.808528900146484, "global_step": 160968, "epoch": 1330} {"train_loss": -40.77482223510742, "global_step": 160969, "epoch": 1330} {"train_loss": -40.40812301635742, "global_step": 160970, "epoch": 1330} {"train_loss": -40.74864196777344, "global_step": 160971, "epoch": 1330} {"train_loss": -40.24073791503906, "global_step": 160972, "epoch": 1330} {"train_loss": -40.446041107177734, "global_step": 160973, "epoch": 1330} {"train_loss": -40.86234664916992, "global_step": 160974, "epoch": 1330} {"train_loss": -39.790435791015625, "global_step": 160975, "epoch": 1330} {"train_loss": -40.86016845703125, "global_step": 160976, "epoch": 1330} {"train_loss": -40.40642166137695, "global_step": 160977, "epoch": 1330} {"train_loss": -40.50627517700195, "global_step": 160978, "epoch": 1330} {"train_loss": -40.6876335144043, "global_step": 160979, "epoch": 1330} {"train_loss": -40.76565170288086, "global_step": 160980, "epoch": 1330} {"train_loss": -40.514068603515625, "global_step": 160981, "epoch": 1330} {"train_loss": -40.62199783325195, "global_step": 160982, "epoch": 1330} {"train_loss": -40.3051643371582, "global_step": 160983, "epoch": 1330} {"train_loss": -40.166015625, "global_step": 160984, "epoch": 1330} {"train_loss": -38.87607955932617, "global_step": 160985, "epoch": 1330} {"train_loss": -40.74925994873047, "global_step": 160986, "epoch": 1330} {"train_loss": -40.66620635986328, "global_step": 160987, "epoch": 1330} {"train_loss": -39.735504150390625, "global_step": 160988, "epoch": 1330} {"train_loss": -40.58126449584961, "global_step": 160989, "epoch": 1330} {"train_loss": -40.9205207824707, "global_step": 160990, "epoch": 1330} {"train_loss": -40.27372360229492, "global_step": 160991, "epoch": 1330} {"train_loss": -40.34884262084961, "global_step": 160992, "epoch": 1330} {"train_loss": -39.157142639160156, "global_step": 160993, "epoch": 1330} {"train_loss": -40.868045806884766, "global_step": 160994, "epoch": 1330} {"train_loss": -40.08606719970703, "global_step": 160995, "epoch": 1330} {"train_loss": -38.79813766479492, "global_step": 160996, "epoch": 1330} {"train_loss": -38.708980560302734, "global_step": 160997, "epoch": 1330} {"train_loss": -39.766807556152344, "global_step": 160998, "epoch": 1330} {"train_loss": -39.40668487548828, "global_step": 160999, "epoch": 1330} {"train_loss": -37.8008918762207, "global_step": 161000, "epoch": 1330} {"train_loss": -37.10324478149414, "global_step": 161001, "epoch": 1330} {"train_loss": -37.13520050048828, "global_step": 161002, "epoch": 1330} {"train_loss": -38.32719802856445, "global_step": 161003, "epoch": 1330} {"train_loss": -39.15045166015625, "global_step": 161004, "epoch": 1330} {"train_loss": -37.66878128051758, "global_step": 161005, "epoch": 1330} {"train_loss": -36.88290023803711, "global_step": 161006, "epoch": 1330} {"train_loss": -37.0323486328125, "global_step": 161007, "epoch": 1330} {"train_loss": -38.87020492553711, "global_step": 161008, "epoch": 1330} {"train_loss": -35.87272262573242, "global_step": 161009, "epoch": 1330} {"train_loss": -37.16522979736328, "global_step": 161010, "epoch": 1330} {"train_loss": -38.68598937988281, "global_step": 161011, "epoch": 1330} {"train_loss": -38.06458282470703, "global_step": 161012, "epoch": 1330} {"train_loss": -35.6878776550293, "global_step": 161013, "epoch": 1330} {"train_loss": -39.19406509399414, "global_step": 161014, "epoch": 1330} {"train_loss": -38.62260055541992, "global_step": 161015, "epoch": 1330} {"train_loss": -36.2045783996582, "global_step": 161016, "epoch": 1330} {"train_loss": -38.999603271484375, "global_step": 161017, "epoch": 1330} {"train_loss": -38.09722900390625, "global_step": 161018, "epoch": 1330} {"train_loss": -38.44868087768555, "global_step": 161019, "epoch": 1330} {"train_loss": -39.29885482788086, "global_step": 161020, "epoch": 1330} {"train_loss": -38.72062301635742, "global_step": 161021, "epoch": 1330} {"train_loss": -38.28907775878906, "global_step": 161022, "epoch": 1330} {"train_loss": -38.23017501831055, "global_step": 161023, "epoch": 1330} {"train_loss": -38.94099044799805, "global_step": 161024, "epoch": 1330} {"train_loss": -39.856117248535156, "global_step": 161025, "epoch": 1330} {"train_loss": -38.5347785949707, "global_step": 161026, "epoch": 1330} {"train_loss": -39.25093460083008, "global_step": 161027, "epoch": 1330} {"train_loss": -39.365150451660156, "global_step": 161028, "epoch": 1330} {"train_loss": -38.72794723510742, "global_step": 161029, "epoch": 1330} {"train_loss": -38.47005844116211, "global_step": 161030, "epoch": 1330} {"train_loss": -39.97434616088867, "global_step": 161031, "epoch": 1330} {"train_loss": -38.12116241455078, "global_step": 161032, "epoch": 1330} {"train_loss": -38.513484954833984, "global_step": 161033, "epoch": 1330} {"train_loss": -40.14735412597656, "global_step": 161034, "epoch": 1330} {"train_loss": -38.49935531616211, "global_step": 161035, "epoch": 1330} {"train_loss": -38.1573600769043, "global_step": 161036, "epoch": 1330} {"train_loss": -39.5146598815918, "global_step": 161037, "epoch": 1330} {"train_loss": -40.076576232910156, "global_step": 161038, "epoch": 1330} {"train_loss": -39.655548095703125, "global_step": 161039, "epoch": 1330} {"train_loss": -40.2210807800293, "global_step": 161040, "epoch": 1330} {"train_loss": -40.05375289916992, "global_step": 161041, "epoch": 1330} {"train_loss": -40.09646224975586, "global_step": 161042, "epoch": 1330} {"train_loss": -39.69108200073242, "global_step": 161043, "epoch": 1330} {"train_loss": -39.92387008666992, "global_step": 161044, "epoch": 1330} {"train_loss": -40.973873138427734, "global_step": 161045, "epoch": 1330} {"train_loss": -39.96099853515625, "global_step": 161046, "epoch": 1330} {"train_loss": -40.732051849365234, "global_step": 161047, "epoch": 1330} {"train_loss": -40.529659271240234, "global_step": 161048, "epoch": 1330} {"train_loss": -40.118770599365234, "global_step": 161049, "epoch": 1330} {"train_loss": -39.62857068274632, "global_step": 161050, "epoch": 1330, "val_loss": 2389708.0} {"train_loss": -40.11088180541992, "global_step": 161051, "epoch": 1331} {"train_loss": -40.797637939453125, "global_step": 161052, "epoch": 1331} {"train_loss": -40.824462890625, "global_step": 161053, "epoch": 1331} {"train_loss": -40.83850860595703, "global_step": 161054, "epoch": 1331} {"train_loss": -40.4581413269043, "global_step": 161055, "epoch": 1331} {"train_loss": -40.734867095947266, "global_step": 161056, "epoch": 1331} {"train_loss": -40.9710807800293, "global_step": 161057, "epoch": 1331} {"train_loss": -40.55198287963867, "global_step": 161058, "epoch": 1331} {"train_loss": -40.967830657958984, "global_step": 161059, "epoch": 1331} {"train_loss": -40.94769287109375, "global_step": 161060, "epoch": 1331} {"train_loss": -40.87099075317383, "global_step": 161061, "epoch": 1331} {"train_loss": -40.574188232421875, "global_step": 161062, "epoch": 1331} {"train_loss": -40.96358108520508, "global_step": 161063, "epoch": 1331} {"train_loss": -40.74391174316406, "global_step": 161064, "epoch": 1331} {"train_loss": -40.9435920715332, "global_step": 161065, "epoch": 1331} {"train_loss": -41.003841400146484, "global_step": 161066, "epoch": 1331} {"train_loss": -40.98997116088867, "global_step": 161067, "epoch": 1331} {"train_loss": -41.11790084838867, "global_step": 161068, "epoch": 1331} {"train_loss": -40.77119064331055, "global_step": 161069, "epoch": 1331} {"train_loss": -41.249568939208984, "global_step": 161070, "epoch": 1331} {"train_loss": -41.5915641784668, "global_step": 161071, "epoch": 1331} {"train_loss": -41.060726165771484, "global_step": 161072, "epoch": 1331} {"train_loss": -40.84615707397461, "global_step": 161073, "epoch": 1331} {"train_loss": -40.63319396972656, "global_step": 161074, "epoch": 1331} {"train_loss": -41.2227897644043, "global_step": 161075, "epoch": 1331} {"train_loss": -41.05846405029297, "global_step": 161076, "epoch": 1331} {"train_loss": -41.70048904418945, "global_step": 161077, "epoch": 1331} {"train_loss": -41.36171340942383, "global_step": 161078, "epoch": 1331} {"train_loss": -41.668495178222656, "global_step": 161079, "epoch": 1331} {"train_loss": -41.62656784057617, "global_step": 161080, "epoch": 1331} {"train_loss": -40.681640625, "global_step": 161081, "epoch": 1331} {"train_loss": -41.4551887512207, "global_step": 161082, "epoch": 1331} {"train_loss": -41.55449676513672, "global_step": 161083, "epoch": 1331} {"train_loss": -41.06425094604492, "global_step": 161084, "epoch": 1331} {"train_loss": -41.443363189697266, "global_step": 161085, "epoch": 1331} {"train_loss": -41.3514289855957, "global_step": 161086, "epoch": 1331} {"train_loss": -41.811248779296875, "global_step": 161087, "epoch": 1331} {"train_loss": -41.43210983276367, "global_step": 161088, "epoch": 1331} {"train_loss": -41.73051071166992, "global_step": 161089, "epoch": 1331} {"train_loss": -41.4322624206543, "global_step": 161090, "epoch": 1331} {"train_loss": -41.68824768066406, "global_step": 161091, "epoch": 1331} {"train_loss": -41.3800163269043, "global_step": 161092, "epoch": 1331} {"train_loss": -41.62301254272461, "global_step": 161093, "epoch": 1331} {"train_loss": -41.658653259277344, "global_step": 161094, "epoch": 1331} {"train_loss": -41.58798599243164, "global_step": 161095, "epoch": 1331} {"train_loss": -41.488826751708984, "global_step": 161096, "epoch": 1331} {"train_loss": -41.433189392089844, "global_step": 161097, "epoch": 1331} {"train_loss": -41.26520919799805, "global_step": 161098, "epoch": 1331} {"train_loss": -41.0809440612793, "global_step": 161099, "epoch": 1331} {"train_loss": -40.81612014770508, "global_step": 161100, "epoch": 1331} {"train_loss": -40.897640228271484, "global_step": 161101, "epoch": 1331} {"train_loss": -41.99067306518555, "global_step": 161102, "epoch": 1331} {"train_loss": -41.03144073486328, "global_step": 161103, "epoch": 1331} {"train_loss": -40.92351531982422, "global_step": 161104, "epoch": 1331} {"train_loss": -40.77189636230469, "global_step": 161105, "epoch": 1331} {"train_loss": -39.99061965942383, "global_step": 161106, "epoch": 1331} {"train_loss": -40.49022674560547, "global_step": 161107, "epoch": 1331} {"train_loss": -40.25190353393555, "global_step": 161108, "epoch": 1331} {"train_loss": -41.072261810302734, "global_step": 161109, "epoch": 1331} {"train_loss": -40.94384765625, "global_step": 161110, "epoch": 1331} {"train_loss": -41.03144073486328, "global_step": 161111, "epoch": 1331} {"train_loss": -41.31673049926758, "global_step": 161112, "epoch": 1331} {"train_loss": -41.310543060302734, "global_step": 161113, "epoch": 1331} {"train_loss": -41.19497299194336, "global_step": 161114, "epoch": 1331} {"train_loss": -40.130611419677734, "global_step": 161115, "epoch": 1331} {"train_loss": -39.072906494140625, "global_step": 161116, "epoch": 1331} {"train_loss": -36.75586700439453, "global_step": 161117, "epoch": 1331} {"train_loss": -31.440744400024414, "global_step": 161118, "epoch": 1331} {"train_loss": -24.239852905273438, "global_step": 161119, "epoch": 1331} {"train_loss": -32.853477478027344, "global_step": 161120, "epoch": 1331} {"train_loss": -39.528175354003906, "global_step": 161121, "epoch": 1331} {"train_loss": -39.13633728027344, "global_step": 161122, "epoch": 1331} {"train_loss": -37.1768798828125, "global_step": 161123, "epoch": 1331} {"train_loss": -39.01924514770508, "global_step": 161124, "epoch": 1331} {"train_loss": -38.51206588745117, "global_step": 161125, "epoch": 1331} {"train_loss": -38.821956634521484, "global_step": 161126, "epoch": 1331} {"train_loss": -39.66328048706055, "global_step": 161127, "epoch": 1331} {"train_loss": -38.763858795166016, "global_step": 161128, "epoch": 1331} {"train_loss": -39.21915817260742, "global_step": 161129, "epoch": 1331} {"train_loss": -40.68608474731445, "global_step": 161130, "epoch": 1331} {"train_loss": -37.49859619140625, "global_step": 161131, "epoch": 1331} {"train_loss": -40.294586181640625, "global_step": 161132, "epoch": 1331} {"train_loss": -39.24250411987305, "global_step": 161133, "epoch": 1331} {"train_loss": -38.50093078613281, "global_step": 161134, "epoch": 1331} {"train_loss": -40.173030853271484, "global_step": 161135, "epoch": 1331} {"train_loss": -38.884395599365234, "global_step": 161136, "epoch": 1331} {"train_loss": -39.58878707885742, "global_step": 161137, "epoch": 1331} {"train_loss": -39.147762298583984, "global_step": 161138, "epoch": 1331} {"train_loss": -39.9943962097168, "global_step": 161139, "epoch": 1331} {"train_loss": -40.53155517578125, "global_step": 161140, "epoch": 1331} {"train_loss": -40.42562484741211, "global_step": 161141, "epoch": 1331} {"train_loss": -40.60768508911133, "global_step": 161142, "epoch": 1331} {"train_loss": -40.29866409301758, "global_step": 161143, "epoch": 1331} {"train_loss": -40.63498306274414, "global_step": 161144, "epoch": 1331} {"train_loss": -40.65339279174805, "global_step": 161145, "epoch": 1331} {"train_loss": -40.50944137573242, "global_step": 161146, "epoch": 1331} {"train_loss": -40.74387741088867, "global_step": 161147, "epoch": 1331} {"train_loss": -40.59595489501953, "global_step": 161148, "epoch": 1331} {"train_loss": -39.95050048828125, "global_step": 161149, "epoch": 1331} {"train_loss": -40.922767639160156, "global_step": 161150, "epoch": 1331} {"train_loss": -40.26392364501953, "global_step": 161151, "epoch": 1331} {"train_loss": -40.81599807739258, "global_step": 161152, "epoch": 1331} {"train_loss": -41.07175827026367, "global_step": 161153, "epoch": 1331} {"train_loss": -41.145477294921875, "global_step": 161154, "epoch": 1331} {"train_loss": -40.923828125, "global_step": 161155, "epoch": 1331} {"train_loss": -40.81520462036133, "global_step": 161156, "epoch": 1331} {"train_loss": -40.721168518066406, "global_step": 161157, "epoch": 1331} {"train_loss": -40.67937088012695, "global_step": 161158, "epoch": 1331} {"train_loss": -40.57799530029297, "global_step": 161159, "epoch": 1331} {"train_loss": -41.32001495361328, "global_step": 161160, "epoch": 1331} {"train_loss": -40.95097732543945, "global_step": 161161, "epoch": 1331} {"train_loss": -39.90363693237305, "global_step": 161162, "epoch": 1331} {"train_loss": -41.26893997192383, "global_step": 161163, "epoch": 1331} {"train_loss": -40.22061538696289, "global_step": 161164, "epoch": 1331} {"train_loss": -41.20107650756836, "global_step": 161165, "epoch": 1331} {"train_loss": -41.205684661865234, "global_step": 161166, "epoch": 1331} {"train_loss": -40.78969192504883, "global_step": 161167, "epoch": 1331} {"train_loss": -40.575950622558594, "global_step": 161168, "epoch": 1331} {"train_loss": -40.68695068359375, "global_step": 161169, "epoch": 1331} {"train_loss": -41.25191116333008, "global_step": 161170, "epoch": 1331} {"train_loss": -40.339272286281115, "global_step": 161171, "epoch": 1331, "val_loss": 2395253.25} {"train_loss": -40.483192443847656, "global_step": 161172, "epoch": 1332} {"train_loss": -41.1811637878418, "global_step": 161173, "epoch": 1332} {"train_loss": -40.098854064941406, "global_step": 161174, "epoch": 1332} {"train_loss": -40.9814567565918, "global_step": 161175, "epoch": 1332} {"train_loss": -40.75274658203125, "global_step": 161176, "epoch": 1332} {"train_loss": -40.94617462158203, "global_step": 161177, "epoch": 1332} {"train_loss": -40.98509216308594, "global_step": 161178, "epoch": 1332} {"train_loss": -41.56060791015625, "global_step": 161179, "epoch": 1332} {"train_loss": -41.1879768371582, "global_step": 161180, "epoch": 1332} {"train_loss": -40.966941833496094, "global_step": 161181, "epoch": 1332} {"train_loss": -41.21137237548828, "global_step": 161182, "epoch": 1332} {"train_loss": -41.18819808959961, "global_step": 161183, "epoch": 1332} {"train_loss": -40.8817024230957, "global_step": 161184, "epoch": 1332} {"train_loss": -41.171661376953125, "global_step": 161185, "epoch": 1332} {"train_loss": -41.24545669555664, "global_step": 161186, "epoch": 1332} {"train_loss": -40.78953170776367, "global_step": 161187, "epoch": 1332} {"train_loss": -40.308162689208984, "global_step": 161188, "epoch": 1332} {"train_loss": -40.674713134765625, "global_step": 161189, "epoch": 1332} {"train_loss": -41.3121337890625, "global_step": 161190, "epoch": 1332} {"train_loss": -41.055416107177734, "global_step": 161191, "epoch": 1332} {"train_loss": -40.522682189941406, "global_step": 161192, "epoch": 1332} {"train_loss": -41.27024459838867, "global_step": 161193, "epoch": 1332} {"train_loss": -40.76885986328125, "global_step": 161194, "epoch": 1332} {"train_loss": -40.66326904296875, "global_step": 161195, "epoch": 1332} {"train_loss": -41.372127532958984, "global_step": 161196, "epoch": 1332} {"train_loss": -40.26760482788086, "global_step": 161197, "epoch": 1332} {"train_loss": -40.82678985595703, "global_step": 161198, "epoch": 1332} {"train_loss": -41.4460334777832, "global_step": 161199, "epoch": 1332} {"train_loss": -40.48512268066406, "global_step": 161200, "epoch": 1332} {"train_loss": -41.102821350097656, "global_step": 161201, "epoch": 1332} {"train_loss": -40.577110290527344, "global_step": 161202, "epoch": 1332} {"train_loss": -41.18397903442383, "global_step": 161203, "epoch": 1332} {"train_loss": -41.66690444946289, "global_step": 161204, "epoch": 1332} {"train_loss": -40.03231430053711, "global_step": 161205, "epoch": 1332} {"train_loss": -40.39023208618164, "global_step": 161206, "epoch": 1332} {"train_loss": -41.726890563964844, "global_step": 161207, "epoch": 1332} {"train_loss": -40.727577209472656, "global_step": 161208, "epoch": 1332} {"train_loss": -39.72107696533203, "global_step": 161209, "epoch": 1332} {"train_loss": -39.491798400878906, "global_step": 161210, "epoch": 1332} {"train_loss": -39.99905014038086, "global_step": 161211, "epoch": 1332} {"train_loss": -40.78483963012695, "global_step": 161212, "epoch": 1332} {"train_loss": -40.42793655395508, "global_step": 161213, "epoch": 1332} {"train_loss": -40.290496826171875, "global_step": 161214, "epoch": 1332} {"train_loss": -41.358211517333984, "global_step": 161215, "epoch": 1332} {"train_loss": -40.35546875, "global_step": 161216, "epoch": 1332} {"train_loss": -39.64005661010742, "global_step": 161217, "epoch": 1332} {"train_loss": -39.99030303955078, "global_step": 161218, "epoch": 1332} {"train_loss": -40.59539794921875, "global_step": 161219, "epoch": 1332} {"train_loss": -41.07612991333008, "global_step": 161220, "epoch": 1332} {"train_loss": -40.75983810424805, "global_step": 161221, "epoch": 1332} {"train_loss": -41.1195182800293, "global_step": 161222, "epoch": 1332} {"train_loss": -41.31258773803711, "global_step": 161223, "epoch": 1332} {"train_loss": -40.57338333129883, "global_step": 161224, "epoch": 1332} {"train_loss": -40.611419677734375, "global_step": 161225, "epoch": 1332} {"train_loss": -41.23394775390625, "global_step": 161226, "epoch": 1332} {"train_loss": -39.504417419433594, "global_step": 161227, "epoch": 1332} {"train_loss": -36.74739456176758, "global_step": 161228, "epoch": 1332} {"train_loss": -38.96552276611328, "global_step": 161229, "epoch": 1332} {"train_loss": -40.67914962768555, "global_step": 161230, "epoch": 1332} {"train_loss": -40.97237014770508, "global_step": 161231, "epoch": 1332} {"train_loss": -40.5865592956543, "global_step": 161232, "epoch": 1332} {"train_loss": -40.20038986206055, "global_step": 161233, "epoch": 1332} {"train_loss": -40.30814743041992, "global_step": 161234, "epoch": 1332} {"train_loss": -40.67275619506836, "global_step": 161235, "epoch": 1332} {"train_loss": -40.87259292602539, "global_step": 161236, "epoch": 1332} {"train_loss": -39.451881408691406, "global_step": 161237, "epoch": 1332} {"train_loss": -40.65991973876953, "global_step": 161238, "epoch": 1332} {"train_loss": -40.70853805541992, "global_step": 161239, "epoch": 1332} {"train_loss": -40.53574752807617, "global_step": 161240, "epoch": 1332} {"train_loss": -41.44397735595703, "global_step": 161241, "epoch": 1332} {"train_loss": -40.14706039428711, "global_step": 161242, "epoch": 1332} {"train_loss": -40.84408187866211, "global_step": 161243, "epoch": 1332} {"train_loss": -41.00922775268555, "global_step": 161244, "epoch": 1332} {"train_loss": -41.253265380859375, "global_step": 161245, "epoch": 1332} {"train_loss": -39.79514694213867, "global_step": 161246, "epoch": 1332} {"train_loss": -39.929054260253906, "global_step": 161247, "epoch": 1332} {"train_loss": -41.76762008666992, "global_step": 161248, "epoch": 1332} {"train_loss": -39.66868209838867, "global_step": 161249, "epoch": 1332} {"train_loss": -41.08306884765625, "global_step": 161250, "epoch": 1332} {"train_loss": -40.97182083129883, "global_step": 161251, "epoch": 1332} {"train_loss": -40.187679290771484, "global_step": 161252, "epoch": 1332} {"train_loss": -41.06052780151367, "global_step": 161253, "epoch": 1332} {"train_loss": -41.149776458740234, "global_step": 161254, "epoch": 1332} {"train_loss": -40.64887237548828, "global_step": 161255, "epoch": 1332} {"train_loss": -40.44341278076172, "global_step": 161256, "epoch": 1332} {"train_loss": -41.72467041015625, "global_step": 161257, "epoch": 1332} {"train_loss": -40.72909927368164, "global_step": 161258, "epoch": 1332} {"train_loss": -40.24689865112305, "global_step": 161259, "epoch": 1332} {"train_loss": -41.373775482177734, "global_step": 161260, "epoch": 1332} {"train_loss": -40.509456634521484, "global_step": 161261, "epoch": 1332} {"train_loss": -39.9721565246582, "global_step": 161262, "epoch": 1332} {"train_loss": -40.266746520996094, "global_step": 161263, "epoch": 1332} {"train_loss": -40.597225189208984, "global_step": 161264, "epoch": 1332} {"train_loss": -40.34632110595703, "global_step": 161265, "epoch": 1332} {"train_loss": -41.19159698486328, "global_step": 161266, "epoch": 1332} {"train_loss": -40.67698669433594, "global_step": 161267, "epoch": 1332} {"train_loss": -41.204097747802734, "global_step": 161268, "epoch": 1332} {"train_loss": -41.35005569458008, "global_step": 161269, "epoch": 1332} {"train_loss": -40.910423278808594, "global_step": 161270, "epoch": 1332} {"train_loss": -41.328704833984375, "global_step": 161271, "epoch": 1332} {"train_loss": -41.12091827392578, "global_step": 161272, "epoch": 1332} {"train_loss": -40.118221282958984, "global_step": 161273, "epoch": 1332} {"train_loss": -40.951210021972656, "global_step": 161274, "epoch": 1332} {"train_loss": -41.54435729980469, "global_step": 161275, "epoch": 1332} {"train_loss": -40.6349983215332, "global_step": 161276, "epoch": 1332} {"train_loss": -41.27391052246094, "global_step": 161277, "epoch": 1332} {"train_loss": -41.33634567260742, "global_step": 161278, "epoch": 1332} {"train_loss": -41.11953353881836, "global_step": 161279, "epoch": 1332} {"train_loss": -41.873817443847656, "global_step": 161280, "epoch": 1332} {"train_loss": -41.82875442504883, "global_step": 161281, "epoch": 1332} {"train_loss": -40.54446029663086, "global_step": 161282, "epoch": 1332} {"train_loss": -41.52750778198242, "global_step": 161283, "epoch": 1332} {"train_loss": -41.018245697021484, "global_step": 161284, "epoch": 1332} {"train_loss": -40.76345443725586, "global_step": 161285, "epoch": 1332} {"train_loss": -41.01143264770508, "global_step": 161286, "epoch": 1332} {"train_loss": -40.826995849609375, "global_step": 161287, "epoch": 1332} {"train_loss": -39.85856246948242, "global_step": 161288, "epoch": 1332} {"train_loss": -41.224056243896484, "global_step": 161289, "epoch": 1332} {"train_loss": -39.939796447753906, "global_step": 161290, "epoch": 1332} {"train_loss": -40.43972396850586, "global_step": 161291, "epoch": 1332} {"train_loss": -40.719626276946265, "global_step": 161292, "epoch": 1332, "val_loss": 2396497.25} {"train_loss": -40.99665069580078, "global_step": 161293, "epoch": 1333} {"train_loss": -39.19670104980469, "global_step": 161294, "epoch": 1333} {"train_loss": -39.12775802612305, "global_step": 161295, "epoch": 1333} {"train_loss": -39.73330307006836, "global_step": 161296, "epoch": 1333} {"train_loss": -39.22299575805664, "global_step": 161297, "epoch": 1333} {"train_loss": -39.90533447265625, "global_step": 161298, "epoch": 1333} {"train_loss": -40.36336898803711, "global_step": 161299, "epoch": 1333} {"train_loss": -39.65952682495117, "global_step": 161300, "epoch": 1333} {"train_loss": -41.223541259765625, "global_step": 161301, "epoch": 1333} {"train_loss": -40.31355667114258, "global_step": 161302, "epoch": 1333} {"train_loss": -40.88814163208008, "global_step": 161303, "epoch": 1333} {"train_loss": -40.238189697265625, "global_step": 161304, "epoch": 1333} {"train_loss": -41.23550033569336, "global_step": 161305, "epoch": 1333} {"train_loss": -41.162506103515625, "global_step": 161306, "epoch": 1333} {"train_loss": -39.923946380615234, "global_step": 161307, "epoch": 1333} {"train_loss": -40.853267669677734, "global_step": 161308, "epoch": 1333} {"train_loss": -40.54939651489258, "global_step": 161309, "epoch": 1333} {"train_loss": -39.50828170776367, "global_step": 161310, "epoch": 1333} {"train_loss": -40.528263092041016, "global_step": 161311, "epoch": 1333} {"train_loss": -41.04290771484375, "global_step": 161312, "epoch": 1333} {"train_loss": -40.05915069580078, "global_step": 161313, "epoch": 1333} {"train_loss": -39.546634674072266, "global_step": 161314, "epoch": 1333} {"train_loss": -41.49557113647461, "global_step": 161315, "epoch": 1333} {"train_loss": -40.35040283203125, "global_step": 161316, "epoch": 1333} {"train_loss": -39.92109680175781, "global_step": 161317, "epoch": 1333} {"train_loss": -40.57540512084961, "global_step": 161318, "epoch": 1333} {"train_loss": -41.314186096191406, "global_step": 161319, "epoch": 1333} {"train_loss": -39.66756057739258, "global_step": 161320, "epoch": 1333} {"train_loss": -40.205230712890625, "global_step": 161321, "epoch": 1333} {"train_loss": -41.65157699584961, "global_step": 161322, "epoch": 1333} {"train_loss": -40.7808952331543, "global_step": 161323, "epoch": 1333} {"train_loss": -40.7674446105957, "global_step": 161324, "epoch": 1333} {"train_loss": -41.584999084472656, "global_step": 161325, "epoch": 1333} {"train_loss": -40.74711608886719, "global_step": 161326, "epoch": 1333} {"train_loss": -41.49934005737305, "global_step": 161327, "epoch": 1333} {"train_loss": -40.89274215698242, "global_step": 161328, "epoch": 1333} {"train_loss": -41.36779022216797, "global_step": 161329, "epoch": 1333} {"train_loss": -41.08356857299805, "global_step": 161330, "epoch": 1333} {"train_loss": -41.019569396972656, "global_step": 161331, "epoch": 1333} {"train_loss": -40.86501693725586, "global_step": 161332, "epoch": 1333} {"train_loss": -41.11072540283203, "global_step": 161333, "epoch": 1333} {"train_loss": -41.537200927734375, "global_step": 161334, "epoch": 1333} {"train_loss": -40.72553634643555, "global_step": 161335, "epoch": 1333} {"train_loss": -41.34689712524414, "global_step": 161336, "epoch": 1333} {"train_loss": -41.20333480834961, "global_step": 161337, "epoch": 1333} {"train_loss": -40.852813720703125, "global_step": 161338, "epoch": 1333} {"train_loss": -40.539939880371094, "global_step": 161339, "epoch": 1333} {"train_loss": -41.013336181640625, "global_step": 161340, "epoch": 1333} {"train_loss": -41.515411376953125, "global_step": 161341, "epoch": 1333} {"train_loss": -41.17854309082031, "global_step": 161342, "epoch": 1333} {"train_loss": -41.68079376220703, "global_step": 161343, "epoch": 1333} {"train_loss": -41.112972259521484, "global_step": 161344, "epoch": 1333} {"train_loss": -40.94793701171875, "global_step": 161345, "epoch": 1333} {"train_loss": -41.773658752441406, "global_step": 161346, "epoch": 1333} {"train_loss": -41.74432373046875, "global_step": 161347, "epoch": 1333} {"train_loss": -41.975830078125, "global_step": 161348, "epoch": 1333} {"train_loss": -41.94913864135742, "global_step": 161349, "epoch": 1333} {"train_loss": -41.8442497253418, "global_step": 161350, "epoch": 1333} {"train_loss": -42.26433181762695, "global_step": 161351, "epoch": 1333} {"train_loss": -41.84944534301758, "global_step": 161352, "epoch": 1333} {"train_loss": -41.588287353515625, "global_step": 161353, "epoch": 1333} {"train_loss": -41.50641632080078, "global_step": 161354, "epoch": 1333} {"train_loss": -42.00103759765625, "global_step": 161355, "epoch": 1333} {"train_loss": -41.65108108520508, "global_step": 161356, "epoch": 1333} {"train_loss": -40.37288284301758, "global_step": 161357, "epoch": 1333} {"train_loss": -39.76115798950195, "global_step": 161358, "epoch": 1333} {"train_loss": -39.042144775390625, "global_step": 161359, "epoch": 1333} {"train_loss": -38.950340270996094, "global_step": 161360, "epoch": 1333} {"train_loss": -38.7432975769043, "global_step": 161361, "epoch": 1333} {"train_loss": -39.2922248840332, "global_step": 161362, "epoch": 1333} {"train_loss": -39.36760711669922, "global_step": 161363, "epoch": 1333} {"train_loss": -40.521846771240234, "global_step": 161364, "epoch": 1333} {"train_loss": -39.36800765991211, "global_step": 161365, "epoch": 1333} {"train_loss": -39.75010299682617, "global_step": 161366, "epoch": 1333} {"train_loss": -40.311744689941406, "global_step": 161367, "epoch": 1333} {"train_loss": -40.75048828125, "global_step": 161368, "epoch": 1333} {"train_loss": -39.77836990356445, "global_step": 161369, "epoch": 1333} {"train_loss": -39.1162109375, "global_step": 161370, "epoch": 1333} {"train_loss": -40.8470573425293, "global_step": 161371, "epoch": 1333} {"train_loss": -40.78741455078125, "global_step": 161372, "epoch": 1333} {"train_loss": -39.55364990234375, "global_step": 161373, "epoch": 1333} {"train_loss": -39.77595138549805, "global_step": 161374, "epoch": 1333} {"train_loss": -41.499969482421875, "global_step": 161375, "epoch": 1333} {"train_loss": -39.72401428222656, "global_step": 161376, "epoch": 1333} {"train_loss": -38.655067443847656, "global_step": 161377, "epoch": 1333} {"train_loss": -40.682777404785156, "global_step": 161378, "epoch": 1333} {"train_loss": -40.282196044921875, "global_step": 161379, "epoch": 1333} {"train_loss": -40.629005432128906, "global_step": 161380, "epoch": 1333} {"train_loss": -41.137062072753906, "global_step": 161381, "epoch": 1333} {"train_loss": -40.352020263671875, "global_step": 161382, "epoch": 1333} {"train_loss": -41.129737854003906, "global_step": 161383, "epoch": 1333} {"train_loss": -40.930267333984375, "global_step": 161384, "epoch": 1333} {"train_loss": -40.554508209228516, "global_step": 161385, "epoch": 1333} {"train_loss": -41.03044891357422, "global_step": 161386, "epoch": 1333} {"train_loss": -40.05141067504883, "global_step": 161387, "epoch": 1333} {"train_loss": -40.86521530151367, "global_step": 161388, "epoch": 1333} {"train_loss": -41.319786071777344, "global_step": 161389, "epoch": 1333} {"train_loss": -40.22794723510742, "global_step": 161390, "epoch": 1333} {"train_loss": -40.836910247802734, "global_step": 161391, "epoch": 1333} {"train_loss": -40.78062057495117, "global_step": 161392, "epoch": 1333} {"train_loss": -40.80363464355469, "global_step": 161393, "epoch": 1333} {"train_loss": -40.25244903564453, "global_step": 161394, "epoch": 1333} {"train_loss": -41.10729217529297, "global_step": 161395, "epoch": 1333} {"train_loss": -40.28253173828125, "global_step": 161396, "epoch": 1333} {"train_loss": -41.27911376953125, "global_step": 161397, "epoch": 1333} {"train_loss": -40.85047912597656, "global_step": 161398, "epoch": 1333} {"train_loss": -38.8577766418457, "global_step": 161399, "epoch": 1333} {"train_loss": -41.47867965698242, "global_step": 161400, "epoch": 1333} {"train_loss": -40.85557174682617, "global_step": 161401, "epoch": 1333} {"train_loss": -38.99115753173828, "global_step": 161402, "epoch": 1333} {"train_loss": -38.991294860839844, "global_step": 161403, "epoch": 1333} {"train_loss": -39.705345153808594, "global_step": 161404, "epoch": 1333} {"train_loss": -39.94625473022461, "global_step": 161405, "epoch": 1333} {"train_loss": -40.58185958862305, "global_step": 161406, "epoch": 1333} {"train_loss": -38.12894821166992, "global_step": 161407, "epoch": 1333} {"train_loss": -40.87052536010742, "global_step": 161408, "epoch": 1333} {"train_loss": -40.121150970458984, "global_step": 161409, "epoch": 1333} {"train_loss": -39.48735427856445, "global_step": 161410, "epoch": 1333} {"train_loss": -40.51993179321289, "global_step": 161411, "epoch": 1333} {"train_loss": -39.993587493896484, "global_step": 161412, "epoch": 1333} {"train_loss": -40.551636309663124, "global_step": 161413, "epoch": 1333, "val_loss": 2418642.75} {"train_loss": -39.891517639160156, "global_step": 161414, "epoch": 1334} {"train_loss": -39.64939880371094, "global_step": 161415, "epoch": 1334} {"train_loss": -40.347938537597656, "global_step": 161416, "epoch": 1334} {"train_loss": -40.33039474487305, "global_step": 161417, "epoch": 1334} {"train_loss": -41.0378532409668, "global_step": 161418, "epoch": 1334} {"train_loss": -40.47561264038086, "global_step": 161419, "epoch": 1334} {"train_loss": -40.4272575378418, "global_step": 161420, "epoch": 1334} {"train_loss": -41.19105529785156, "global_step": 161421, "epoch": 1334} {"train_loss": -40.091339111328125, "global_step": 161422, "epoch": 1334} {"train_loss": -41.07337188720703, "global_step": 161423, "epoch": 1334} {"train_loss": -40.97123336791992, "global_step": 161424, "epoch": 1334} {"train_loss": -41.030879974365234, "global_step": 161425, "epoch": 1334} {"train_loss": -40.52263259887695, "global_step": 161426, "epoch": 1334} {"train_loss": -40.788265228271484, "global_step": 161427, "epoch": 1334} {"train_loss": -41.51323699951172, "global_step": 161428, "epoch": 1334} {"train_loss": -41.329376220703125, "global_step": 161429, "epoch": 1334} {"train_loss": -40.838172912597656, "global_step": 161430, "epoch": 1334} {"train_loss": -41.06232833862305, "global_step": 161431, "epoch": 1334} {"train_loss": -41.537715911865234, "global_step": 161432, "epoch": 1334} {"train_loss": -40.53553771972656, "global_step": 161433, "epoch": 1334} {"train_loss": -40.520416259765625, "global_step": 161434, "epoch": 1334} {"train_loss": -40.90019989013672, "global_step": 161435, "epoch": 1334} {"train_loss": -40.81787109375, "global_step": 161436, "epoch": 1334} {"train_loss": -39.99973678588867, "global_step": 161437, "epoch": 1334} {"train_loss": -41.55172348022461, "global_step": 161438, "epoch": 1334} {"train_loss": -39.718563079833984, "global_step": 161439, "epoch": 1334} {"train_loss": -41.34530258178711, "global_step": 161440, "epoch": 1334} {"train_loss": -40.731021881103516, "global_step": 161441, "epoch": 1334} {"train_loss": -39.92219161987305, "global_step": 161442, "epoch": 1334} {"train_loss": -40.113914489746094, "global_step": 161443, "epoch": 1334} {"train_loss": -39.217403411865234, "global_step": 161444, "epoch": 1334} {"train_loss": -39.00333786010742, "global_step": 161445, "epoch": 1334} {"train_loss": -40.317596435546875, "global_step": 161446, "epoch": 1334} {"train_loss": -40.3121337890625, "global_step": 161447, "epoch": 1334} {"train_loss": -40.94011306762695, "global_step": 161448, "epoch": 1334} {"train_loss": -39.200660705566406, "global_step": 161449, "epoch": 1334} {"train_loss": -39.2123908996582, "global_step": 161450, "epoch": 1334} {"train_loss": -40.603309631347656, "global_step": 161451, "epoch": 1334} {"train_loss": -40.34369659423828, "global_step": 161452, "epoch": 1334} {"train_loss": -40.035648345947266, "global_step": 161453, "epoch": 1334} {"train_loss": -39.776248931884766, "global_step": 161454, "epoch": 1334} {"train_loss": -40.19580078125, "global_step": 161455, "epoch": 1334} {"train_loss": -40.84382247924805, "global_step": 161456, "epoch": 1334} {"train_loss": -40.33195114135742, "global_step": 161457, "epoch": 1334} {"train_loss": -39.3486328125, "global_step": 161458, "epoch": 1334} {"train_loss": -40.756011962890625, "global_step": 161459, "epoch": 1334} {"train_loss": -40.98735427856445, "global_step": 161460, "epoch": 1334} {"train_loss": -40.871925354003906, "global_step": 161461, "epoch": 1334} {"train_loss": -40.83541488647461, "global_step": 161462, "epoch": 1334} {"train_loss": -40.943485260009766, "global_step": 161463, "epoch": 1334} {"train_loss": -41.52783966064453, "global_step": 161464, "epoch": 1334} {"train_loss": -39.5921516418457, "global_step": 161465, "epoch": 1334} {"train_loss": -41.989768981933594, "global_step": 161466, "epoch": 1334} {"train_loss": -39.914794921875, "global_step": 161467, "epoch": 1334} {"train_loss": -39.96773910522461, "global_step": 161468, "epoch": 1334} {"train_loss": -41.05988693237305, "global_step": 161469, "epoch": 1334} {"train_loss": -41.07965087890625, "global_step": 161470, "epoch": 1334} {"train_loss": -40.564144134521484, "global_step": 161471, "epoch": 1334} {"train_loss": -40.220699310302734, "global_step": 161472, "epoch": 1334} {"train_loss": -41.863067626953125, "global_step": 161473, "epoch": 1334} {"train_loss": -40.83411407470703, "global_step": 161474, "epoch": 1334} {"train_loss": -40.940696716308594, "global_step": 161475, "epoch": 1334} {"train_loss": -40.98686599731445, "global_step": 161476, "epoch": 1334} {"train_loss": -40.92523193359375, "global_step": 161477, "epoch": 1334} {"train_loss": -41.34711837768555, "global_step": 161478, "epoch": 1334} {"train_loss": -41.39651107788086, "global_step": 161479, "epoch": 1334} {"train_loss": -41.30363082885742, "global_step": 161480, "epoch": 1334} {"train_loss": -40.63907241821289, "global_step": 161481, "epoch": 1334} {"train_loss": -41.208675384521484, "global_step": 161482, "epoch": 1334} {"train_loss": -41.36016845703125, "global_step": 161483, "epoch": 1334} {"train_loss": -41.06637191772461, "global_step": 161484, "epoch": 1334} {"train_loss": -41.071353912353516, "global_step": 161485, "epoch": 1334} {"train_loss": -40.83987045288086, "global_step": 161486, "epoch": 1334} {"train_loss": -41.540828704833984, "global_step": 161487, "epoch": 1334} {"train_loss": -41.128631591796875, "global_step": 161488, "epoch": 1334} {"train_loss": -39.7398796081543, "global_step": 161489, "epoch": 1334} {"train_loss": -39.58778762817383, "global_step": 161490, "epoch": 1334} {"train_loss": -41.18081283569336, "global_step": 161491, "epoch": 1334} {"train_loss": -39.819759368896484, "global_step": 161492, "epoch": 1334} {"train_loss": -39.707027435302734, "global_step": 161493, "epoch": 1334} {"train_loss": -41.38272476196289, "global_step": 161494, "epoch": 1334} {"train_loss": -41.18354034423828, "global_step": 161495, "epoch": 1334} {"train_loss": -40.978736877441406, "global_step": 161496, "epoch": 1334} {"train_loss": -41.36201858520508, "global_step": 161497, "epoch": 1334} {"train_loss": -41.22319412231445, "global_step": 161498, "epoch": 1334} {"train_loss": -40.89511489868164, "global_step": 161499, "epoch": 1334} {"train_loss": -41.59416580200195, "global_step": 161500, "epoch": 1334} {"train_loss": -41.474464416503906, "global_step": 161501, "epoch": 1334} {"train_loss": -41.941402435302734, "global_step": 161502, "epoch": 1334} {"train_loss": -42.014869689941406, "global_step": 161503, "epoch": 1334} {"train_loss": -41.34519577026367, "global_step": 161504, "epoch": 1334} {"train_loss": -41.59281539916992, "global_step": 161505, "epoch": 1334} {"train_loss": -41.816062927246094, "global_step": 161506, "epoch": 1334} {"train_loss": -41.825050354003906, "global_step": 161507, "epoch": 1334} {"train_loss": -42.17535400390625, "global_step": 161508, "epoch": 1334} {"train_loss": -42.02912902832031, "global_step": 161509, "epoch": 1334} {"train_loss": -42.33382034301758, "global_step": 161510, "epoch": 1334} {"train_loss": -42.20040512084961, "global_step": 161511, "epoch": 1334} {"train_loss": -41.81515121459961, "global_step": 161512, "epoch": 1334} {"train_loss": -42.049415588378906, "global_step": 161513, "epoch": 1334} {"train_loss": -42.39084243774414, "global_step": 161514, "epoch": 1334} {"train_loss": -41.89793014526367, "global_step": 161515, "epoch": 1334} {"train_loss": -42.111785888671875, "global_step": 161516, "epoch": 1334} {"train_loss": -42.409080505371094, "global_step": 161517, "epoch": 1334} {"train_loss": -42.30007553100586, "global_step": 161518, "epoch": 1334} {"train_loss": -41.904293060302734, "global_step": 161519, "epoch": 1334} {"train_loss": -42.25453567504883, "global_step": 161520, "epoch": 1334} {"train_loss": -41.9732551574707, "global_step": 161521, "epoch": 1334} {"train_loss": -42.17666244506836, "global_step": 161522, "epoch": 1334} {"train_loss": -42.504722595214844, "global_step": 161523, "epoch": 1334} {"train_loss": -41.22263717651367, "global_step": 161524, "epoch": 1334} {"train_loss": -41.96331024169922, "global_step": 161525, "epoch": 1334} {"train_loss": -42.04557418823242, "global_step": 161526, "epoch": 1334} {"train_loss": -42.251853942871094, "global_step": 161527, "epoch": 1334} {"train_loss": -42.1190299987793, "global_step": 161528, "epoch": 1334} {"train_loss": -42.029937744140625, "global_step": 161529, "epoch": 1334} {"train_loss": -42.09849166870117, "global_step": 161530, "epoch": 1334} {"train_loss": -42.024959564208984, "global_step": 161531, "epoch": 1334} {"train_loss": -42.295562744140625, "global_step": 161532, "epoch": 1334} {"train_loss": -42.04558563232422, "global_step": 161533, "epoch": 1334} {"train_loss": -41.03897797765811, "global_step": 161534, "epoch": 1334, "val_loss": 2465277.5} {"train_loss": -40.87898635864258, "global_step": 161535, "epoch": 1335} {"train_loss": -40.78372573852539, "global_step": 161536, "epoch": 1335} {"train_loss": -41.7307243347168, "global_step": 161537, "epoch": 1335} {"train_loss": -40.65256881713867, "global_step": 161538, "epoch": 1335} {"train_loss": -40.34144973754883, "global_step": 161539, "epoch": 1335} {"train_loss": -39.82874298095703, "global_step": 161540, "epoch": 1335} {"train_loss": -37.96993637084961, "global_step": 161541, "epoch": 1335} {"train_loss": -34.621219635009766, "global_step": 161542, "epoch": 1335} {"train_loss": -31.939727783203125, "global_step": 161543, "epoch": 1335} {"train_loss": -23.926700592041016, "global_step": 161544, "epoch": 1335} {"train_loss": -24.879817962646484, "global_step": 161545, "epoch": 1335} {"train_loss": -37.50580978393555, "global_step": 161546, "epoch": 1335} {"train_loss": -28.981210708618164, "global_step": 161547, "epoch": 1335} {"train_loss": -23.109201431274414, "global_step": 161548, "epoch": 1335} {"train_loss": -34.77698516845703, "global_step": 161549, "epoch": 1335} {"train_loss": -30.52020263671875, "global_step": 161550, "epoch": 1335} {"train_loss": -35.05546951293945, "global_step": 161551, "epoch": 1335} {"train_loss": -27.819721221923828, "global_step": 161552, "epoch": 1335} {"train_loss": -36.636207580566406, "global_step": 161553, "epoch": 1335} {"train_loss": -29.970239639282227, "global_step": 161554, "epoch": 1335} {"train_loss": -36.35273361206055, "global_step": 161555, "epoch": 1335} {"train_loss": -32.626708984375, "global_step": 161556, "epoch": 1335} {"train_loss": -38.55345916748047, "global_step": 161557, "epoch": 1335} {"train_loss": -31.836261749267578, "global_step": 161558, "epoch": 1335} {"train_loss": -37.4445686340332, "global_step": 161559, "epoch": 1335} {"train_loss": -36.12921142578125, "global_step": 161560, "epoch": 1335} {"train_loss": -35.74687194824219, "global_step": 161561, "epoch": 1335} {"train_loss": -38.390621185302734, "global_step": 161562, "epoch": 1335} {"train_loss": -36.78163528442383, "global_step": 161563, "epoch": 1335} {"train_loss": -37.37411117553711, "global_step": 161564, "epoch": 1335} {"train_loss": -38.07487487792969, "global_step": 161565, "epoch": 1335} {"train_loss": -38.506591796875, "global_step": 161566, "epoch": 1335} {"train_loss": -38.21283721923828, "global_step": 161567, "epoch": 1335} {"train_loss": -39.31915283203125, "global_step": 161568, "epoch": 1335} {"train_loss": -38.129154205322266, "global_step": 161569, "epoch": 1335} {"train_loss": -39.47922897338867, "global_step": 161570, "epoch": 1335} {"train_loss": -38.58187484741211, "global_step": 161571, "epoch": 1335} {"train_loss": -39.284305572509766, "global_step": 161572, "epoch": 1335} {"train_loss": -39.35802459716797, "global_step": 161573, "epoch": 1335} {"train_loss": -38.95075988769531, "global_step": 161574, "epoch": 1335} {"train_loss": -39.2181510925293, "global_step": 161575, "epoch": 1335} {"train_loss": -39.34571838378906, "global_step": 161576, "epoch": 1335} {"train_loss": -39.36776351928711, "global_step": 161577, "epoch": 1335} {"train_loss": -39.99856185913086, "global_step": 161578, "epoch": 1335} {"train_loss": -39.959022521972656, "global_step": 161579, "epoch": 1335} {"train_loss": -40.049800872802734, "global_step": 161580, "epoch": 1335} {"train_loss": -39.54753494262695, "global_step": 161581, "epoch": 1335} {"train_loss": -39.9399528503418, "global_step": 161582, "epoch": 1335} {"train_loss": -39.86438751220703, "global_step": 161583, "epoch": 1335} {"train_loss": -40.15647506713867, "global_step": 161584, "epoch": 1335} {"train_loss": -40.350852966308594, "global_step": 161585, "epoch": 1335} {"train_loss": -40.27132797241211, "global_step": 161586, "epoch": 1335} {"train_loss": -40.49542236328125, "global_step": 161587, "epoch": 1335} {"train_loss": -40.48445510864258, "global_step": 161588, "epoch": 1335} {"train_loss": -40.31018829345703, "global_step": 161589, "epoch": 1335} {"train_loss": -40.25510787963867, "global_step": 161590, "epoch": 1335} {"train_loss": -40.57038497924805, "global_step": 161591, "epoch": 1335} {"train_loss": -40.731483459472656, "global_step": 161592, "epoch": 1335} {"train_loss": -40.53878402709961, "global_step": 161593, "epoch": 1335} {"train_loss": -40.74483871459961, "global_step": 161594, "epoch": 1335} {"train_loss": -40.53844451904297, "global_step": 161595, "epoch": 1335} {"train_loss": -40.93722152709961, "global_step": 161596, "epoch": 1335} {"train_loss": -41.27256393432617, "global_step": 161597, "epoch": 1335} {"train_loss": -40.909576416015625, "global_step": 161598, "epoch": 1335} {"train_loss": -41.039058685302734, "global_step": 161599, "epoch": 1335} {"train_loss": -40.96015167236328, "global_step": 161600, "epoch": 1335} {"train_loss": -40.80773162841797, "global_step": 161601, "epoch": 1335} {"train_loss": -41.22577667236328, "global_step": 161602, "epoch": 1335} {"train_loss": -41.050594329833984, "global_step": 161603, "epoch": 1335} {"train_loss": -41.122493743896484, "global_step": 161604, "epoch": 1335} {"train_loss": -41.1938591003418, "global_step": 161605, "epoch": 1335} {"train_loss": -41.44428634643555, "global_step": 161606, "epoch": 1335} {"train_loss": -41.26555252075195, "global_step": 161607, "epoch": 1335} {"train_loss": -41.289588928222656, "global_step": 161608, "epoch": 1335} {"train_loss": -41.52272415161133, "global_step": 161609, "epoch": 1335} {"train_loss": -41.216590881347656, "global_step": 161610, "epoch": 1335} {"train_loss": -41.57977294921875, "global_step": 161611, "epoch": 1335} {"train_loss": -41.35857009887695, "global_step": 161612, "epoch": 1335} {"train_loss": -41.80967330932617, "global_step": 161613, "epoch": 1335} {"train_loss": -41.20406723022461, "global_step": 161614, "epoch": 1335} {"train_loss": -41.54314041137695, "global_step": 161615, "epoch": 1335} {"train_loss": -41.57538604736328, "global_step": 161616, "epoch": 1335} {"train_loss": -41.3074836730957, "global_step": 161617, "epoch": 1335} {"train_loss": -41.44376754760742, "global_step": 161618, "epoch": 1335} {"train_loss": -41.55233383178711, "global_step": 161619, "epoch": 1335} {"train_loss": -41.99721908569336, "global_step": 161620, "epoch": 1335} {"train_loss": -41.45200729370117, "global_step": 161621, "epoch": 1335} {"train_loss": -41.78899002075195, "global_step": 161622, "epoch": 1335} {"train_loss": -41.64920425415039, "global_step": 161623, "epoch": 1335} {"train_loss": -42.066322326660156, "global_step": 161624, "epoch": 1335} {"train_loss": -42.08278274536133, "global_step": 161625, "epoch": 1335} {"train_loss": -41.51031494140625, "global_step": 161626, "epoch": 1335} {"train_loss": -42.3231201171875, "global_step": 161627, "epoch": 1335} {"train_loss": -42.02920913696289, "global_step": 161628, "epoch": 1335} {"train_loss": -41.97414779663086, "global_step": 161629, "epoch": 1335} {"train_loss": -42.16673278808594, "global_step": 161630, "epoch": 1335} {"train_loss": -41.95764923095703, "global_step": 161631, "epoch": 1335} {"train_loss": -42.289424896240234, "global_step": 161632, "epoch": 1335} {"train_loss": -41.9696159362793, "global_step": 161633, "epoch": 1335} {"train_loss": -41.93150329589844, "global_step": 161634, "epoch": 1335} {"train_loss": -42.19730758666992, "global_step": 161635, "epoch": 1335} {"train_loss": -42.03020095825195, "global_step": 161636, "epoch": 1335} {"train_loss": -42.30857467651367, "global_step": 161637, "epoch": 1335} {"train_loss": -41.92767333984375, "global_step": 161638, "epoch": 1335} {"train_loss": -41.96809768676758, "global_step": 161639, "epoch": 1335} {"train_loss": -42.052486419677734, "global_step": 161640, "epoch": 1335} {"train_loss": -42.04408645629883, "global_step": 161641, "epoch": 1335} {"train_loss": -42.43891143798828, "global_step": 161642, "epoch": 1335} {"train_loss": -42.451045989990234, "global_step": 161643, "epoch": 1335} {"train_loss": -42.43540573120117, "global_step": 161644, "epoch": 1335} {"train_loss": -42.41217041015625, "global_step": 161645, "epoch": 1335} {"train_loss": -42.531646728515625, "global_step": 161646, "epoch": 1335} {"train_loss": -42.11736297607422, "global_step": 161647, "epoch": 1335} {"train_loss": -42.45750045776367, "global_step": 161648, "epoch": 1335} {"train_loss": -42.29620361328125, "global_step": 161649, "epoch": 1335} {"train_loss": -42.35920333862305, "global_step": 161650, "epoch": 1335} {"train_loss": -42.76920700073242, "global_step": 161651, "epoch": 1335} {"train_loss": -42.573848724365234, "global_step": 161652, "epoch": 1335} {"train_loss": -42.79522705078125, "global_step": 161653, "epoch": 1335} {"train_loss": -42.316036224365234, "global_step": 161654, "epoch": 1335} {"train_loss": -39.52085171849274, "global_step": 161655, "epoch": 1335, "val_loss": 2462280.25} {"train_loss": -41.500125885009766, "global_step": 161656, "epoch": 1336} {"train_loss": -42.16941452026367, "global_step": 161657, "epoch": 1336} {"train_loss": -42.077491760253906, "global_step": 161658, "epoch": 1336} {"train_loss": -41.9099235534668, "global_step": 161659, "epoch": 1336} {"train_loss": -42.56031036376953, "global_step": 161660, "epoch": 1336} {"train_loss": -42.43959426879883, "global_step": 161661, "epoch": 1336} {"train_loss": -42.11806106567383, "global_step": 161662, "epoch": 1336} {"train_loss": -41.62916564941406, "global_step": 161663, "epoch": 1336} {"train_loss": -41.6325798034668, "global_step": 161664, "epoch": 1336} {"train_loss": -40.9830436706543, "global_step": 161665, "epoch": 1336} {"train_loss": -39.324462890625, "global_step": 161666, "epoch": 1336} {"train_loss": -36.6277961730957, "global_step": 161667, "epoch": 1336} {"train_loss": -35.47182083129883, "global_step": 161668, "epoch": 1336} {"train_loss": -30.54957389831543, "global_step": 161669, "epoch": 1336} {"train_loss": -23.93397331237793, "global_step": 161670, "epoch": 1336} {"train_loss": -26.8577938079834, "global_step": 161671, "epoch": 1336} {"train_loss": -35.37547302246094, "global_step": 161672, "epoch": 1336} {"train_loss": -35.56191635131836, "global_step": 161673, "epoch": 1336} {"train_loss": -31.8460693359375, "global_step": 161674, "epoch": 1336} {"train_loss": -40.20146560668945, "global_step": 161675, "epoch": 1336} {"train_loss": -34.49757766723633, "global_step": 161676, "epoch": 1336} {"train_loss": -39.198341369628906, "global_step": 161677, "epoch": 1336} {"train_loss": -36.65318298339844, "global_step": 161678, "epoch": 1336} {"train_loss": -36.46364974975586, "global_step": 161679, "epoch": 1336} {"train_loss": -38.48310852050781, "global_step": 161680, "epoch": 1336} {"train_loss": -38.3094367980957, "global_step": 161681, "epoch": 1336} {"train_loss": -38.58918762207031, "global_step": 161682, "epoch": 1336} {"train_loss": -38.9903564453125, "global_step": 161683, "epoch": 1336} {"train_loss": -38.37263107299805, "global_step": 161684, "epoch": 1336} {"train_loss": -40.23960876464844, "global_step": 161685, "epoch": 1336} {"train_loss": -38.06730270385742, "global_step": 161686, "epoch": 1336} {"train_loss": -39.80736541748047, "global_step": 161687, "epoch": 1336} {"train_loss": -38.308773040771484, "global_step": 161688, "epoch": 1336} {"train_loss": -40.351680755615234, "global_step": 161689, "epoch": 1336} {"train_loss": -39.4450798034668, "global_step": 161690, "epoch": 1336} {"train_loss": -40.31667709350586, "global_step": 161691, "epoch": 1336} {"train_loss": -39.653133392333984, "global_step": 161692, "epoch": 1336} {"train_loss": -39.65039825439453, "global_step": 161693, "epoch": 1336} {"train_loss": -40.425174713134766, "global_step": 161694, "epoch": 1336} {"train_loss": -39.9700927734375, "global_step": 161695, "epoch": 1336} {"train_loss": -40.84490966796875, "global_step": 161696, "epoch": 1336} {"train_loss": -39.65212631225586, "global_step": 161697, "epoch": 1336} {"train_loss": -41.07902145385742, "global_step": 161698, "epoch": 1336} {"train_loss": -40.84819412231445, "global_step": 161699, "epoch": 1336} {"train_loss": -40.88872528076172, "global_step": 161700, "epoch": 1336} {"train_loss": -40.73270034790039, "global_step": 161701, "epoch": 1336} {"train_loss": -40.92564010620117, "global_step": 161702, "epoch": 1336} {"train_loss": -40.5306282043457, "global_step": 161703, "epoch": 1336} {"train_loss": -41.00223159790039, "global_step": 161704, "epoch": 1336} {"train_loss": -40.84779357910156, "global_step": 161705, "epoch": 1336} {"train_loss": -40.985145568847656, "global_step": 161706, "epoch": 1336} {"train_loss": -41.36408615112305, "global_step": 161707, "epoch": 1336} {"train_loss": -41.19633483886719, "global_step": 161708, "epoch": 1336} {"train_loss": -40.78943634033203, "global_step": 161709, "epoch": 1336} {"train_loss": -41.2327766418457, "global_step": 161710, "epoch": 1336} {"train_loss": -41.41047286987305, "global_step": 161711, "epoch": 1336} {"train_loss": -41.3564453125, "global_step": 161712, "epoch": 1336} {"train_loss": -41.17335510253906, "global_step": 161713, "epoch": 1336} {"train_loss": -41.286346435546875, "global_step": 161714, "epoch": 1336} {"train_loss": -41.38969039916992, "global_step": 161715, "epoch": 1336} {"train_loss": -41.70014572143555, "global_step": 161716, "epoch": 1336} {"train_loss": -41.78743362426758, "global_step": 161717, "epoch": 1336} {"train_loss": -41.523250579833984, "global_step": 161718, "epoch": 1336} {"train_loss": -41.76995849609375, "global_step": 161719, "epoch": 1336} {"train_loss": -41.60911178588867, "global_step": 161720, "epoch": 1336} {"train_loss": -41.5737190246582, "global_step": 161721, "epoch": 1336} {"train_loss": -41.58213424682617, "global_step": 161722, "epoch": 1336} {"train_loss": -41.95621871948242, "global_step": 161723, "epoch": 1336} {"train_loss": -41.38308334350586, "global_step": 161724, "epoch": 1336} {"train_loss": -41.97956848144531, "global_step": 161725, "epoch": 1336} {"train_loss": -41.33709716796875, "global_step": 161726, "epoch": 1336} {"train_loss": -41.62606430053711, "global_step": 161727, "epoch": 1336} {"train_loss": -41.68320846557617, "global_step": 161728, "epoch": 1336} {"train_loss": -42.10288619995117, "global_step": 161729, "epoch": 1336} {"train_loss": -41.976318359375, "global_step": 161730, "epoch": 1336} {"train_loss": -41.41109848022461, "global_step": 161731, "epoch": 1336} {"train_loss": -41.874061584472656, "global_step": 161732, "epoch": 1336} {"train_loss": -41.92447280883789, "global_step": 161733, "epoch": 1336} {"train_loss": -41.67213821411133, "global_step": 161734, "epoch": 1336} {"train_loss": -41.74772262573242, "global_step": 161735, "epoch": 1336} {"train_loss": -42.14187240600586, "global_step": 161736, "epoch": 1336} {"train_loss": -42.495121002197266, "global_step": 161737, "epoch": 1336} {"train_loss": -42.2397575378418, "global_step": 161738, "epoch": 1336} {"train_loss": -42.26251220703125, "global_step": 161739, "epoch": 1336} {"train_loss": -42.26247024536133, "global_step": 161740, "epoch": 1336} {"train_loss": -41.75303649902344, "global_step": 161741, "epoch": 1336} {"train_loss": -41.997886657714844, "global_step": 161742, "epoch": 1336} {"train_loss": -41.59661102294922, "global_step": 161743, "epoch": 1336} {"train_loss": -42.067344665527344, "global_step": 161744, "epoch": 1336} {"train_loss": -41.75008010864258, "global_step": 161745, "epoch": 1336} {"train_loss": -40.4675178527832, "global_step": 161746, "epoch": 1336} {"train_loss": -39.65676498413086, "global_step": 161747, "epoch": 1336} {"train_loss": -39.67984390258789, "global_step": 161748, "epoch": 1336} {"train_loss": -41.453914642333984, "global_step": 161749, "epoch": 1336} {"train_loss": -42.12605285644531, "global_step": 161750, "epoch": 1336} {"train_loss": -39.9553108215332, "global_step": 161751, "epoch": 1336} {"train_loss": -38.78189468383789, "global_step": 161752, "epoch": 1336} {"train_loss": -40.242855072021484, "global_step": 161753, "epoch": 1336} {"train_loss": -41.02643585205078, "global_step": 161754, "epoch": 1336} {"train_loss": -41.52479934692383, "global_step": 161755, "epoch": 1336} {"train_loss": -40.66964340209961, "global_step": 161756, "epoch": 1336} {"train_loss": -41.944793701171875, "global_step": 161757, "epoch": 1336} {"train_loss": -41.4694938659668, "global_step": 161758, "epoch": 1336} {"train_loss": -41.748531341552734, "global_step": 161759, "epoch": 1336} {"train_loss": -41.30428695678711, "global_step": 161760, "epoch": 1336} {"train_loss": -41.975440979003906, "global_step": 161761, "epoch": 1336} {"train_loss": -41.032588958740234, "global_step": 161762, "epoch": 1336} {"train_loss": -41.32247543334961, "global_step": 161763, "epoch": 1336} {"train_loss": -41.645050048828125, "global_step": 161764, "epoch": 1336} {"train_loss": -41.65114974975586, "global_step": 161765, "epoch": 1336} {"train_loss": -41.279823303222656, "global_step": 161766, "epoch": 1336} {"train_loss": -41.77790832519531, "global_step": 161767, "epoch": 1336} {"train_loss": -40.93246078491211, "global_step": 161768, "epoch": 1336} {"train_loss": -41.737361907958984, "global_step": 161769, "epoch": 1336} {"train_loss": -41.44788360595703, "global_step": 161770, "epoch": 1336} {"train_loss": -41.81600570678711, "global_step": 161771, "epoch": 1336} {"train_loss": -41.6939582824707, "global_step": 161772, "epoch": 1336} {"train_loss": -41.25889205932617, "global_step": 161773, "epoch": 1336} {"train_loss": -41.5418815612793, "global_step": 161774, "epoch": 1336} {"train_loss": -41.41583251953125, "global_step": 161775, "epoch": 1336} {"train_loss": -40.33596046699965, "global_step": 161776, "epoch": 1336, "val_loss": 2497670.25} {"train_loss": -41.679222106933594, "global_step": 161777, "epoch": 1337} {"train_loss": -41.836299896240234, "global_step": 161778, "epoch": 1337} {"train_loss": -41.57683181762695, "global_step": 161779, "epoch": 1337} {"train_loss": -42.32688522338867, "global_step": 161780, "epoch": 1337} {"train_loss": -41.83840560913086, "global_step": 161781, "epoch": 1337} {"train_loss": -41.97837448120117, "global_step": 161782, "epoch": 1337} {"train_loss": -41.76420211791992, "global_step": 161783, "epoch": 1337} {"train_loss": -42.25703811645508, "global_step": 161784, "epoch": 1337} {"train_loss": -41.98417282104492, "global_step": 161785, "epoch": 1337} {"train_loss": -42.07159423828125, "global_step": 161786, "epoch": 1337} {"train_loss": -41.68203353881836, "global_step": 161787, "epoch": 1337} {"train_loss": -41.31907272338867, "global_step": 161788, "epoch": 1337} {"train_loss": -42.43610763549805, "global_step": 161789, "epoch": 1337} {"train_loss": -42.064998626708984, "global_step": 161790, "epoch": 1337} {"train_loss": -41.92958450317383, "global_step": 161791, "epoch": 1337} {"train_loss": -42.04092025756836, "global_step": 161792, "epoch": 1337} {"train_loss": -41.96219253540039, "global_step": 161793, "epoch": 1337} {"train_loss": -42.02643966674805, "global_step": 161794, "epoch": 1337} {"train_loss": -42.084110260009766, "global_step": 161795, "epoch": 1337} {"train_loss": -42.086341857910156, "global_step": 161796, "epoch": 1337} {"train_loss": -42.31251907348633, "global_step": 161797, "epoch": 1337} {"train_loss": -42.05177688598633, "global_step": 161798, "epoch": 1337} {"train_loss": -41.64811325073242, "global_step": 161799, "epoch": 1337} {"train_loss": -41.69169235229492, "global_step": 161800, "epoch": 1337} {"train_loss": -39.14385223388672, "global_step": 161801, "epoch": 1337} {"train_loss": -37.51143264770508, "global_step": 161802, "epoch": 1337} {"train_loss": -34.129756927490234, "global_step": 161803, "epoch": 1337} {"train_loss": -23.201208114624023, "global_step": 161804, "epoch": 1337} {"train_loss": -24.827335357666016, "global_step": 161805, "epoch": 1337} {"train_loss": -34.5927619934082, "global_step": 161806, "epoch": 1337} {"train_loss": -19.706090927124023, "global_step": 161807, "epoch": 1337} {"train_loss": -32.71797561645508, "global_step": 161808, "epoch": 1337} {"train_loss": -36.388755798339844, "global_step": 161809, "epoch": 1337} {"train_loss": -30.856042861938477, "global_step": 161810, "epoch": 1337} {"train_loss": -32.947078704833984, "global_step": 161811, "epoch": 1337} {"train_loss": -36.25107955932617, "global_step": 161812, "epoch": 1337} {"train_loss": -35.004730224609375, "global_step": 161813, "epoch": 1337} {"train_loss": -38.75971221923828, "global_step": 161814, "epoch": 1337} {"train_loss": -35.6576042175293, "global_step": 161815, "epoch": 1337} {"train_loss": -38.1434211730957, "global_step": 161816, "epoch": 1337} {"train_loss": -36.93952178955078, "global_step": 161817, "epoch": 1337} {"train_loss": -38.54621124267578, "global_step": 161818, "epoch": 1337} {"train_loss": -39.199974060058594, "global_step": 161819, "epoch": 1337} {"train_loss": -39.420413970947266, "global_step": 161820, "epoch": 1337} {"train_loss": -39.12071990966797, "global_step": 161821, "epoch": 1337} {"train_loss": -38.07133865356445, "global_step": 161822, "epoch": 1337} {"train_loss": -38.601871490478516, "global_step": 161823, "epoch": 1337} {"train_loss": -38.9247932434082, "global_step": 161824, "epoch": 1337} {"train_loss": -39.137451171875, "global_step": 161825, "epoch": 1337} {"train_loss": -39.94868087768555, "global_step": 161826, "epoch": 1337} {"train_loss": -39.642730712890625, "global_step": 161827, "epoch": 1337} {"train_loss": -39.826690673828125, "global_step": 161828, "epoch": 1337} {"train_loss": -40.54669952392578, "global_step": 161829, "epoch": 1337} {"train_loss": -40.24043655395508, "global_step": 161830, "epoch": 1337} {"train_loss": -39.84039306640625, "global_step": 161831, "epoch": 1337} {"train_loss": -40.12832260131836, "global_step": 161832, "epoch": 1337} {"train_loss": -40.1245231628418, "global_step": 161833, "epoch": 1337} {"train_loss": -40.48752975463867, "global_step": 161834, "epoch": 1337} {"train_loss": -40.81132888793945, "global_step": 161835, "epoch": 1337} {"train_loss": -40.3230094909668, "global_step": 161836, "epoch": 1337} {"train_loss": -40.80477523803711, "global_step": 161837, "epoch": 1337} {"train_loss": -40.559444427490234, "global_step": 161838, "epoch": 1337} {"train_loss": -40.45529556274414, "global_step": 161839, "epoch": 1337} {"train_loss": -40.64040756225586, "global_step": 161840, "epoch": 1337} {"train_loss": -40.94025421142578, "global_step": 161841, "epoch": 1337} {"train_loss": -40.686126708984375, "global_step": 161842, "epoch": 1337} {"train_loss": -40.68843460083008, "global_step": 161843, "epoch": 1337} {"train_loss": -40.94258499145508, "global_step": 161844, "epoch": 1337} {"train_loss": -40.94831085205078, "global_step": 161845, "epoch": 1337} {"train_loss": -41.06145477294922, "global_step": 161846, "epoch": 1337} {"train_loss": -41.013153076171875, "global_step": 161847, "epoch": 1337} {"train_loss": -41.047096252441406, "global_step": 161848, "epoch": 1337} {"train_loss": -41.13874435424805, "global_step": 161849, "epoch": 1337} {"train_loss": -40.90314483642578, "global_step": 161850, "epoch": 1337} {"train_loss": -41.032005310058594, "global_step": 161851, "epoch": 1337} {"train_loss": -41.26072311401367, "global_step": 161852, "epoch": 1337} {"train_loss": -41.29265213012695, "global_step": 161853, "epoch": 1337} {"train_loss": -41.35376739501953, "global_step": 161854, "epoch": 1337} {"train_loss": -41.432491302490234, "global_step": 161855, "epoch": 1337} {"train_loss": -41.650848388671875, "global_step": 161856, "epoch": 1337} {"train_loss": -41.60293197631836, "global_step": 161857, "epoch": 1337} {"train_loss": -41.106666564941406, "global_step": 161858, "epoch": 1337} {"train_loss": -41.54665756225586, "global_step": 161859, "epoch": 1337} {"train_loss": -41.639137268066406, "global_step": 161860, "epoch": 1337} {"train_loss": -41.2677001953125, "global_step": 161861, "epoch": 1337} {"train_loss": -41.726619720458984, "global_step": 161862, "epoch": 1337} {"train_loss": -41.716800689697266, "global_step": 161863, "epoch": 1337} {"train_loss": -41.77018737792969, "global_step": 161864, "epoch": 1337} {"train_loss": -41.6400146484375, "global_step": 161865, "epoch": 1337} {"train_loss": -41.717098236083984, "global_step": 161866, "epoch": 1337} {"train_loss": -41.75224685668945, "global_step": 161867, "epoch": 1337} {"train_loss": -41.44050216674805, "global_step": 161868, "epoch": 1337} {"train_loss": -41.709896087646484, "global_step": 161869, "epoch": 1337} {"train_loss": -41.62425231933594, "global_step": 161870, "epoch": 1337} {"train_loss": -41.96332931518555, "global_step": 161871, "epoch": 1337} {"train_loss": -41.53434371948242, "global_step": 161872, "epoch": 1337} {"train_loss": -41.309600830078125, "global_step": 161873, "epoch": 1337} {"train_loss": -41.5494384765625, "global_step": 161874, "epoch": 1337} {"train_loss": -41.38100814819336, "global_step": 161875, "epoch": 1337} {"train_loss": -41.490997314453125, "global_step": 161876, "epoch": 1337} {"train_loss": -41.53925704956055, "global_step": 161877, "epoch": 1337} {"train_loss": -41.52967071533203, "global_step": 161878, "epoch": 1337} {"train_loss": -42.15496826171875, "global_step": 161879, "epoch": 1337} {"train_loss": -41.61663818359375, "global_step": 161880, "epoch": 1337} {"train_loss": -41.30460739135742, "global_step": 161881, "epoch": 1337} {"train_loss": -41.18996810913086, "global_step": 161882, "epoch": 1337} {"train_loss": -41.368507385253906, "global_step": 161883, "epoch": 1337} {"train_loss": -41.311424255371094, "global_step": 161884, "epoch": 1337} {"train_loss": -41.943458557128906, "global_step": 161885, "epoch": 1337} {"train_loss": -41.37154006958008, "global_step": 161886, "epoch": 1337} {"train_loss": -41.5770378112793, "global_step": 161887, "epoch": 1337} {"train_loss": -41.83333969116211, "global_step": 161888, "epoch": 1337} {"train_loss": -41.46601867675781, "global_step": 161889, "epoch": 1337} {"train_loss": -41.4973030090332, "global_step": 161890, "epoch": 1337} {"train_loss": -41.862953186035156, "global_step": 161891, "epoch": 1337} {"train_loss": -41.07488250732422, "global_step": 161892, "epoch": 1337} {"train_loss": -41.80988693237305, "global_step": 161893, "epoch": 1337} {"train_loss": -42.07191848754883, "global_step": 161894, "epoch": 1337} {"train_loss": -42.218109130859375, "global_step": 161895, "epoch": 1337} {"train_loss": -42.53532028198242, "global_step": 161896, "epoch": 1337} {"train_loss": -40.10479110528615, "global_step": 161897, "epoch": 1337, "val_loss": 2586757.25} {"train_loss": -42.2956428527832, "global_step": 161898, "epoch": 1338} {"train_loss": -42.167999267578125, "global_step": 161899, "epoch": 1338} {"train_loss": -41.99153518676758, "global_step": 161900, "epoch": 1338} {"train_loss": -42.19790267944336, "global_step": 161901, "epoch": 1338} {"train_loss": -42.050270080566406, "global_step": 161902, "epoch": 1338} {"train_loss": -41.85674285888672, "global_step": 161903, "epoch": 1338} {"train_loss": -42.14862060546875, "global_step": 161904, "epoch": 1338} {"train_loss": -42.45904541015625, "global_step": 161905, "epoch": 1338} {"train_loss": -42.454036712646484, "global_step": 161906, "epoch": 1338} {"train_loss": -41.989044189453125, "global_step": 161907, "epoch": 1338} {"train_loss": -42.20124435424805, "global_step": 161908, "epoch": 1338} {"train_loss": -41.821441650390625, "global_step": 161909, "epoch": 1338} {"train_loss": -42.006343841552734, "global_step": 161910, "epoch": 1338} {"train_loss": -42.15903854370117, "global_step": 161911, "epoch": 1338} {"train_loss": -41.048194885253906, "global_step": 161912, "epoch": 1338} {"train_loss": -42.45417404174805, "global_step": 161913, "epoch": 1338} {"train_loss": -41.99787139892578, "global_step": 161914, "epoch": 1338} {"train_loss": -41.793426513671875, "global_step": 161915, "epoch": 1338} {"train_loss": -41.12336349487305, "global_step": 161916, "epoch": 1338} {"train_loss": -41.69645690917969, "global_step": 161917, "epoch": 1338} {"train_loss": -40.95964431762695, "global_step": 161918, "epoch": 1338} {"train_loss": -41.657413482666016, "global_step": 161919, "epoch": 1338} {"train_loss": -42.0675048828125, "global_step": 161920, "epoch": 1338} {"train_loss": -41.72589111328125, "global_step": 161921, "epoch": 1338} {"train_loss": -41.45386505126953, "global_step": 161922, "epoch": 1338} {"train_loss": -41.8744010925293, "global_step": 161923, "epoch": 1338} {"train_loss": -42.16592788696289, "global_step": 161924, "epoch": 1338} {"train_loss": -42.145992279052734, "global_step": 161925, "epoch": 1338} {"train_loss": -42.116302490234375, "global_step": 161926, "epoch": 1338} {"train_loss": -42.1006965637207, "global_step": 161927, "epoch": 1338} {"train_loss": -42.21220016479492, "global_step": 161928, "epoch": 1338} {"train_loss": -42.67998504638672, "global_step": 161929, "epoch": 1338} {"train_loss": -42.290225982666016, "global_step": 161930, "epoch": 1338} {"train_loss": -41.33212661743164, "global_step": 161931, "epoch": 1338} {"train_loss": -41.79127883911133, "global_step": 161932, "epoch": 1338} {"train_loss": -41.619529724121094, "global_step": 161933, "epoch": 1338} {"train_loss": -40.902488708496094, "global_step": 161934, "epoch": 1338} {"train_loss": -40.088680267333984, "global_step": 161935, "epoch": 1338} {"train_loss": -39.8192253112793, "global_step": 161936, "epoch": 1338} {"train_loss": -39.032222747802734, "global_step": 161937, "epoch": 1338} {"train_loss": -40.91731262207031, "global_step": 161938, "epoch": 1338} {"train_loss": -40.84220504760742, "global_step": 161939, "epoch": 1338} {"train_loss": -40.68062973022461, "global_step": 161940, "epoch": 1338} {"train_loss": -41.302955627441406, "global_step": 161941, "epoch": 1338} {"train_loss": -40.641475677490234, "global_step": 161942, "epoch": 1338} {"train_loss": -39.90218734741211, "global_step": 161943, "epoch": 1338} {"train_loss": -38.84290313720703, "global_step": 161944, "epoch": 1338} {"train_loss": -37.9658203125, "global_step": 161945, "epoch": 1338} {"train_loss": -37.48529815673828, "global_step": 161946, "epoch": 1338} {"train_loss": -39.058467864990234, "global_step": 161947, "epoch": 1338} {"train_loss": -41.788753509521484, "global_step": 161948, "epoch": 1338} {"train_loss": -41.396968841552734, "global_step": 161949, "epoch": 1338} {"train_loss": -40.75859451293945, "global_step": 161950, "epoch": 1338} {"train_loss": -41.22964096069336, "global_step": 161951, "epoch": 1338} {"train_loss": -40.98440170288086, "global_step": 161952, "epoch": 1338} {"train_loss": -40.49238204956055, "global_step": 161953, "epoch": 1338} {"train_loss": -40.15433120727539, "global_step": 161954, "epoch": 1338} {"train_loss": -40.254920959472656, "global_step": 161955, "epoch": 1338} {"train_loss": -40.21802520751953, "global_step": 161956, "epoch": 1338} {"train_loss": -41.56003952026367, "global_step": 161957, "epoch": 1338} {"train_loss": -38.55814743041992, "global_step": 161958, "epoch": 1338} {"train_loss": -40.358436584472656, "global_step": 161959, "epoch": 1338} {"train_loss": -39.4546012878418, "global_step": 161960, "epoch": 1338} {"train_loss": -40.92094421386719, "global_step": 161961, "epoch": 1338} {"train_loss": -41.279815673828125, "global_step": 161962, "epoch": 1338} {"train_loss": -39.65230178833008, "global_step": 161963, "epoch": 1338} {"train_loss": -38.7469596862793, "global_step": 161964, "epoch": 1338} {"train_loss": -39.2725944519043, "global_step": 161965, "epoch": 1338} {"train_loss": -41.276405334472656, "global_step": 161966, "epoch": 1338} {"train_loss": -40.990325927734375, "global_step": 161967, "epoch": 1338} {"train_loss": -39.24578094482422, "global_step": 161968, "epoch": 1338} {"train_loss": -40.44520950317383, "global_step": 161969, "epoch": 1338} {"train_loss": -40.65517807006836, "global_step": 161970, "epoch": 1338} {"train_loss": -38.63669967651367, "global_step": 161971, "epoch": 1338} {"train_loss": -35.6465950012207, "global_step": 161972, "epoch": 1338} {"train_loss": -38.93922424316406, "global_step": 161973, "epoch": 1338} {"train_loss": -38.33190155029297, "global_step": 161974, "epoch": 1338} {"train_loss": -37.236637115478516, "global_step": 161975, "epoch": 1338} {"train_loss": -40.002113342285156, "global_step": 161976, "epoch": 1338} {"train_loss": -38.10865020751953, "global_step": 161977, "epoch": 1338} {"train_loss": -41.04545974731445, "global_step": 161978, "epoch": 1338} {"train_loss": -39.164459228515625, "global_step": 161979, "epoch": 1338} {"train_loss": -39.3848991394043, "global_step": 161980, "epoch": 1338} {"train_loss": -40.60763168334961, "global_step": 161981, "epoch": 1338} {"train_loss": -41.188045501708984, "global_step": 161982, "epoch": 1338} {"train_loss": -40.67332458496094, "global_step": 161983, "epoch": 1338} {"train_loss": -40.80570602416992, "global_step": 161984, "epoch": 1338} {"train_loss": -41.261146545410156, "global_step": 161985, "epoch": 1338} {"train_loss": -41.00901412963867, "global_step": 161986, "epoch": 1338} {"train_loss": -41.52460861206055, "global_step": 161987, "epoch": 1338} {"train_loss": -41.3900032043457, "global_step": 161988, "epoch": 1338} {"train_loss": -41.22312927246094, "global_step": 161989, "epoch": 1338} {"train_loss": -41.37929153442383, "global_step": 161990, "epoch": 1338} {"train_loss": -41.410404205322266, "global_step": 161991, "epoch": 1338} {"train_loss": -41.058162689208984, "global_step": 161992, "epoch": 1338} {"train_loss": -41.59328079223633, "global_step": 161993, "epoch": 1338} {"train_loss": -41.277313232421875, "global_step": 161994, "epoch": 1338} {"train_loss": -41.337032318115234, "global_step": 161995, "epoch": 1338} {"train_loss": -41.79693603515625, "global_step": 161996, "epoch": 1338} {"train_loss": -41.046234130859375, "global_step": 161997, "epoch": 1338} {"train_loss": -40.596920013427734, "global_step": 161998, "epoch": 1338} {"train_loss": -41.416908264160156, "global_step": 161999, "epoch": 1338} {"train_loss": -41.574859619140625, "global_step": 162000, "epoch": 1338} {"train_loss": -41.60482406616211, "global_step": 162001, "epoch": 1338} {"train_loss": -41.27882385253906, "global_step": 162002, "epoch": 1338} {"train_loss": -42.102333068847656, "global_step": 162003, "epoch": 1338} {"train_loss": -41.67116165161133, "global_step": 162004, "epoch": 1338} {"train_loss": -41.319000244140625, "global_step": 162005, "epoch": 1338} {"train_loss": -41.5229606628418, "global_step": 162006, "epoch": 1338} {"train_loss": -41.84382247924805, "global_step": 162007, "epoch": 1338} {"train_loss": -41.439205169677734, "global_step": 162008, "epoch": 1338} {"train_loss": -41.74774932861328, "global_step": 162009, "epoch": 1338} {"train_loss": -41.919883728027344, "global_step": 162010, "epoch": 1338} {"train_loss": -41.694087982177734, "global_step": 162011, "epoch": 1338} {"train_loss": -41.98988723754883, "global_step": 162012, "epoch": 1338} {"train_loss": -41.7323112487793, "global_step": 162013, "epoch": 1338} {"train_loss": -42.189178466796875, "global_step": 162014, "epoch": 1338} {"train_loss": -41.952186584472656, "global_step": 162015, "epoch": 1338} {"train_loss": -42.04755401611328, "global_step": 162016, "epoch": 1338} {"train_loss": -42.33302688598633, "global_step": 162017, "epoch": 1338} {"train_loss": -40.998369390314274, "global_step": 162018, "epoch": 1338, "val_loss": 2554058.0} {"train_loss": -41.93510818481445, "global_step": 162019, "epoch": 1339} {"train_loss": -42.369686126708984, "global_step": 162020, "epoch": 1339} {"train_loss": -42.200618743896484, "global_step": 162021, "epoch": 1339} {"train_loss": -42.35072708129883, "global_step": 162022, "epoch": 1339} {"train_loss": -42.06635665893555, "global_step": 162023, "epoch": 1339} {"train_loss": -42.10601806640625, "global_step": 162024, "epoch": 1339} {"train_loss": -42.013729095458984, "global_step": 162025, "epoch": 1339} {"train_loss": -42.4250373840332, "global_step": 162026, "epoch": 1339} {"train_loss": -41.77516555786133, "global_step": 162027, "epoch": 1339} {"train_loss": -42.08089828491211, "global_step": 162028, "epoch": 1339} {"train_loss": -42.15920639038086, "global_step": 162029, "epoch": 1339} {"train_loss": -41.84688186645508, "global_step": 162030, "epoch": 1339} {"train_loss": -42.10071563720703, "global_step": 162031, "epoch": 1339} {"train_loss": -41.7230339050293, "global_step": 162032, "epoch": 1339} {"train_loss": -41.66231155395508, "global_step": 162033, "epoch": 1339} {"train_loss": -42.48030471801758, "global_step": 162034, "epoch": 1339} {"train_loss": -41.58366012573242, "global_step": 162035, "epoch": 1339} {"train_loss": -41.92985916137695, "global_step": 162036, "epoch": 1339} {"train_loss": -41.631404876708984, "global_step": 162037, "epoch": 1339} {"train_loss": -41.608795166015625, "global_step": 162038, "epoch": 1339} {"train_loss": -41.64281463623047, "global_step": 162039, "epoch": 1339} {"train_loss": -42.12594223022461, "global_step": 162040, "epoch": 1339} {"train_loss": -41.991905212402344, "global_step": 162041, "epoch": 1339} {"train_loss": -41.887908935546875, "global_step": 162042, "epoch": 1339} {"train_loss": -41.007022857666016, "global_step": 162043, "epoch": 1339} {"train_loss": -41.90052032470703, "global_step": 162044, "epoch": 1339} {"train_loss": -42.423492431640625, "global_step": 162045, "epoch": 1339} {"train_loss": -41.96025085449219, "global_step": 162046, "epoch": 1339} {"train_loss": -41.9453239440918, "global_step": 162047, "epoch": 1339} {"train_loss": -41.93266677856445, "global_step": 162048, "epoch": 1339} {"train_loss": -41.5712890625, "global_step": 162049, "epoch": 1339} {"train_loss": -40.7679443359375, "global_step": 162050, "epoch": 1339} {"train_loss": -41.121009826660156, "global_step": 162051, "epoch": 1339} {"train_loss": -40.000919342041016, "global_step": 162052, "epoch": 1339} {"train_loss": -39.86947250366211, "global_step": 162053, "epoch": 1339} {"train_loss": -41.31205368041992, "global_step": 162054, "epoch": 1339} {"train_loss": -40.500244140625, "global_step": 162055, "epoch": 1339} {"train_loss": -38.19843673706055, "global_step": 162056, "epoch": 1339} {"train_loss": -39.33683395385742, "global_step": 162057, "epoch": 1339} {"train_loss": -41.13025665283203, "global_step": 162058, "epoch": 1339} {"train_loss": -39.84505081176758, "global_step": 162059, "epoch": 1339} {"train_loss": -39.27741622924805, "global_step": 162060, "epoch": 1339} {"train_loss": -41.96089553833008, "global_step": 162061, "epoch": 1339} {"train_loss": -39.58411407470703, "global_step": 162062, "epoch": 1339} {"train_loss": -38.01842498779297, "global_step": 162063, "epoch": 1339} {"train_loss": -38.96062088012695, "global_step": 162064, "epoch": 1339} {"train_loss": -39.87592315673828, "global_step": 162065, "epoch": 1339} {"train_loss": -40.04835891723633, "global_step": 162066, "epoch": 1339} {"train_loss": -39.199134826660156, "global_step": 162067, "epoch": 1339} {"train_loss": -41.12651443481445, "global_step": 162068, "epoch": 1339} {"train_loss": -40.07320022583008, "global_step": 162069, "epoch": 1339} {"train_loss": -39.908050537109375, "global_step": 162070, "epoch": 1339} {"train_loss": -39.755863189697266, "global_step": 162071, "epoch": 1339} {"train_loss": -39.877193450927734, "global_step": 162072, "epoch": 1339} {"train_loss": -41.089988708496094, "global_step": 162073, "epoch": 1339} {"train_loss": -40.88029098510742, "global_step": 162074, "epoch": 1339} {"train_loss": -40.37116241455078, "global_step": 162075, "epoch": 1339} {"train_loss": -40.969703674316406, "global_step": 162076, "epoch": 1339} {"train_loss": -40.25657272338867, "global_step": 162077, "epoch": 1339} {"train_loss": -40.13436508178711, "global_step": 162078, "epoch": 1339} {"train_loss": -39.73834991455078, "global_step": 162079, "epoch": 1339} {"train_loss": -38.803340911865234, "global_step": 162080, "epoch": 1339} {"train_loss": -39.0808219909668, "global_step": 162081, "epoch": 1339} {"train_loss": -41.0254020690918, "global_step": 162082, "epoch": 1339} {"train_loss": -40.50435256958008, "global_step": 162083, "epoch": 1339} {"train_loss": -40.107582092285156, "global_step": 162084, "epoch": 1339} {"train_loss": -41.1358757019043, "global_step": 162085, "epoch": 1339} {"train_loss": -41.8780403137207, "global_step": 162086, "epoch": 1339} {"train_loss": -41.341957092285156, "global_step": 162087, "epoch": 1339} {"train_loss": -40.95746612548828, "global_step": 162088, "epoch": 1339} {"train_loss": -40.18153762817383, "global_step": 162089, "epoch": 1339} {"train_loss": -39.53092575073242, "global_step": 162090, "epoch": 1339} {"train_loss": -41.33311080932617, "global_step": 162091, "epoch": 1339} {"train_loss": -41.197479248046875, "global_step": 162092, "epoch": 1339} {"train_loss": -41.051170349121094, "global_step": 162093, "epoch": 1339} {"train_loss": -40.3642692565918, "global_step": 162094, "epoch": 1339} {"train_loss": -41.719058990478516, "global_step": 162095, "epoch": 1339} {"train_loss": -41.2928581237793, "global_step": 162096, "epoch": 1339} {"train_loss": -40.4818229675293, "global_step": 162097, "epoch": 1339} {"train_loss": -40.10872268676758, "global_step": 162098, "epoch": 1339} {"train_loss": -38.27804946899414, "global_step": 162099, "epoch": 1339} {"train_loss": -40.83789825439453, "global_step": 162100, "epoch": 1339} {"train_loss": -39.48769760131836, "global_step": 162101, "epoch": 1339} {"train_loss": -39.01772689819336, "global_step": 162102, "epoch": 1339} {"train_loss": -41.556575775146484, "global_step": 162103, "epoch": 1339} {"train_loss": -39.07966232299805, "global_step": 162104, "epoch": 1339} {"train_loss": -40.2569465637207, "global_step": 162105, "epoch": 1339} {"train_loss": -40.30780792236328, "global_step": 162106, "epoch": 1339} {"train_loss": -38.9974250793457, "global_step": 162107, "epoch": 1339} {"train_loss": -41.12066650390625, "global_step": 162108, "epoch": 1339} {"train_loss": -39.3603515625, "global_step": 162109, "epoch": 1339} {"train_loss": -40.115325927734375, "global_step": 162110, "epoch": 1339} {"train_loss": -41.7330436706543, "global_step": 162111, "epoch": 1339} {"train_loss": -40.7432861328125, "global_step": 162112, "epoch": 1339} {"train_loss": -41.41593933105469, "global_step": 162113, "epoch": 1339} {"train_loss": -41.27934265136719, "global_step": 162114, "epoch": 1339} {"train_loss": -40.627052307128906, "global_step": 162115, "epoch": 1339} {"train_loss": -41.32564926147461, "global_step": 162116, "epoch": 1339} {"train_loss": -41.6723747253418, "global_step": 162117, "epoch": 1339} {"train_loss": -36.59586715698242, "global_step": 162118, "epoch": 1339} {"train_loss": -40.520992279052734, "global_step": 162119, "epoch": 1339} {"train_loss": -40.23087692260742, "global_step": 162120, "epoch": 1339} {"train_loss": -40.543922424316406, "global_step": 162121, "epoch": 1339} {"train_loss": -40.90237808227539, "global_step": 162122, "epoch": 1339} {"train_loss": -40.299842834472656, "global_step": 162123, "epoch": 1339} {"train_loss": -40.615394592285156, "global_step": 162124, "epoch": 1339} {"train_loss": -41.07842254638672, "global_step": 162125, "epoch": 1339} {"train_loss": -41.07649230957031, "global_step": 162126, "epoch": 1339} {"train_loss": -40.920135498046875, "global_step": 162127, "epoch": 1339} {"train_loss": -41.044952392578125, "global_step": 162128, "epoch": 1339} {"train_loss": -41.30613327026367, "global_step": 162129, "epoch": 1339} {"train_loss": -40.464637756347656, "global_step": 162130, "epoch": 1339} {"train_loss": -38.462947845458984, "global_step": 162131, "epoch": 1339} {"train_loss": -41.27909469604492, "global_step": 162132, "epoch": 1339} {"train_loss": -40.244041442871094, "global_step": 162133, "epoch": 1339} {"train_loss": -39.721431732177734, "global_step": 162134, "epoch": 1339} {"train_loss": -38.38216018676758, "global_step": 162135, "epoch": 1339} {"train_loss": -40.57938003540039, "global_step": 162136, "epoch": 1339} {"train_loss": -40.83114242553711, "global_step": 162137, "epoch": 1339} {"train_loss": -41.27668762207031, "global_step": 162138, "epoch": 1339} {"train_loss": -40.71705829210518, "global_step": 162139, "epoch": 1339, "val_loss": 2765474.75} {"train_loss": -41.30794143676758, "global_step": 162140, "epoch": 1340} {"train_loss": -41.05488586425781, "global_step": 162141, "epoch": 1340} {"train_loss": -40.0914192199707, "global_step": 162142, "epoch": 1340} {"train_loss": -37.433650970458984, "global_step": 162143, "epoch": 1340} {"train_loss": -37.90048599243164, "global_step": 162144, "epoch": 1340} {"train_loss": -34.9920539855957, "global_step": 162145, "epoch": 1340} {"train_loss": -39.22929382324219, "global_step": 162146, "epoch": 1340} {"train_loss": -40.83769607543945, "global_step": 162147, "epoch": 1340} {"train_loss": -41.35280990600586, "global_step": 162148, "epoch": 1340} {"train_loss": -39.83037567138672, "global_step": 162149, "epoch": 1340} {"train_loss": -39.54203796386719, "global_step": 162150, "epoch": 1340} {"train_loss": -37.07520294189453, "global_step": 162151, "epoch": 1340} {"train_loss": -38.99837875366211, "global_step": 162152, "epoch": 1340} {"train_loss": -40.158935546875, "global_step": 162153, "epoch": 1340} {"train_loss": -38.87516403198242, "global_step": 162154, "epoch": 1340} {"train_loss": -40.13329315185547, "global_step": 162155, "epoch": 1340} {"train_loss": -39.93935775756836, "global_step": 162156, "epoch": 1340} {"train_loss": -40.35384750366211, "global_step": 162157, "epoch": 1340} {"train_loss": -39.01435470581055, "global_step": 162158, "epoch": 1340} {"train_loss": -38.45832443237305, "global_step": 162159, "epoch": 1340} {"train_loss": -40.56390380859375, "global_step": 162160, "epoch": 1340} {"train_loss": -40.284461975097656, "global_step": 162161, "epoch": 1340} {"train_loss": -40.73690414428711, "global_step": 162162, "epoch": 1340} {"train_loss": -40.220394134521484, "global_step": 162163, "epoch": 1340} {"train_loss": -40.29059982299805, "global_step": 162164, "epoch": 1340} {"train_loss": -40.16680908203125, "global_step": 162165, "epoch": 1340} {"train_loss": -39.773590087890625, "global_step": 162166, "epoch": 1340} {"train_loss": -41.1807975769043, "global_step": 162167, "epoch": 1340} {"train_loss": -40.1528434753418, "global_step": 162168, "epoch": 1340} {"train_loss": -39.17295455932617, "global_step": 162169, "epoch": 1340} {"train_loss": -41.08577346801758, "global_step": 162170, "epoch": 1340} {"train_loss": -41.1231689453125, "global_step": 162171, "epoch": 1340} {"train_loss": -40.77704620361328, "global_step": 162172, "epoch": 1340} {"train_loss": -40.751564025878906, "global_step": 162173, "epoch": 1340} {"train_loss": -40.591644287109375, "global_step": 162174, "epoch": 1340} {"train_loss": -39.87636947631836, "global_step": 162175, "epoch": 1340} {"train_loss": -40.63351058959961, "global_step": 162176, "epoch": 1340} {"train_loss": -40.86525344848633, "global_step": 162177, "epoch": 1340} {"train_loss": -40.101924896240234, "global_step": 162178, "epoch": 1340} {"train_loss": -41.17741012573242, "global_step": 162179, "epoch": 1340} {"train_loss": -41.03037643432617, "global_step": 162180, "epoch": 1340} {"train_loss": -36.328582763671875, "global_step": 162181, "epoch": 1340} {"train_loss": -41.540523529052734, "global_step": 162182, "epoch": 1340} {"train_loss": -39.74578857421875, "global_step": 162183, "epoch": 1340} {"train_loss": -40.99973678588867, "global_step": 162184, "epoch": 1340} {"train_loss": -39.1143798828125, "global_step": 162185, "epoch": 1340} {"train_loss": -40.32733154296875, "global_step": 162186, "epoch": 1340} {"train_loss": -39.7092399597168, "global_step": 162187, "epoch": 1340} {"train_loss": -41.41957473754883, "global_step": 162188, "epoch": 1340} {"train_loss": -39.654319763183594, "global_step": 162189, "epoch": 1340} {"train_loss": -39.45909118652344, "global_step": 162190, "epoch": 1340} {"train_loss": -39.424007415771484, "global_step": 162191, "epoch": 1340} {"train_loss": -40.06410598754883, "global_step": 162192, "epoch": 1340} {"train_loss": -41.676795959472656, "global_step": 162193, "epoch": 1340} {"train_loss": -41.266998291015625, "global_step": 162194, "epoch": 1340} {"train_loss": -39.21017074584961, "global_step": 162195, "epoch": 1340} {"train_loss": -41.559017181396484, "global_step": 162196, "epoch": 1340} {"train_loss": -41.155330657958984, "global_step": 162197, "epoch": 1340} {"train_loss": -40.98603439331055, "global_step": 162198, "epoch": 1340} {"train_loss": -41.660011291503906, "global_step": 162199, "epoch": 1340} {"train_loss": -40.370235443115234, "global_step": 162200, "epoch": 1340} {"train_loss": -41.18638229370117, "global_step": 162201, "epoch": 1340} {"train_loss": -40.631561279296875, "global_step": 162202, "epoch": 1340} {"train_loss": -40.61568832397461, "global_step": 162203, "epoch": 1340} {"train_loss": -41.60918045043945, "global_step": 162204, "epoch": 1340} {"train_loss": -41.197410583496094, "global_step": 162205, "epoch": 1340} {"train_loss": -40.63112258911133, "global_step": 162206, "epoch": 1340} {"train_loss": -39.892242431640625, "global_step": 162207, "epoch": 1340} {"train_loss": -41.494266510009766, "global_step": 162208, "epoch": 1340} {"train_loss": -40.629859924316406, "global_step": 162209, "epoch": 1340} {"train_loss": -40.64875030517578, "global_step": 162210, "epoch": 1340} {"train_loss": -40.25648880004883, "global_step": 162211, "epoch": 1340} {"train_loss": -40.24264144897461, "global_step": 162212, "epoch": 1340} {"train_loss": -40.345645904541016, "global_step": 162213, "epoch": 1340} {"train_loss": -39.84870910644531, "global_step": 162214, "epoch": 1340} {"train_loss": -41.568294525146484, "global_step": 162215, "epoch": 1340} {"train_loss": -38.55702590942383, "global_step": 162216, "epoch": 1340} {"train_loss": -37.90615463256836, "global_step": 162217, "epoch": 1340} {"train_loss": -37.90497589111328, "global_step": 162218, "epoch": 1340} {"train_loss": -39.7523193359375, "global_step": 162219, "epoch": 1340} {"train_loss": -40.74131393432617, "global_step": 162220, "epoch": 1340} {"train_loss": -39.93659591674805, "global_step": 162221, "epoch": 1340} {"train_loss": -39.76053237915039, "global_step": 162222, "epoch": 1340} {"train_loss": -40.97819900512695, "global_step": 162223, "epoch": 1340} {"train_loss": -40.636287689208984, "global_step": 162224, "epoch": 1340} {"train_loss": -40.26219940185547, "global_step": 162225, "epoch": 1340} {"train_loss": -40.963783264160156, "global_step": 162226, "epoch": 1340} {"train_loss": -41.36759948730469, "global_step": 162227, "epoch": 1340} {"train_loss": -40.887447357177734, "global_step": 162228, "epoch": 1340} {"train_loss": -40.08087158203125, "global_step": 162229, "epoch": 1340} {"train_loss": -40.5211181640625, "global_step": 162230, "epoch": 1340} {"train_loss": -41.174171447753906, "global_step": 162231, "epoch": 1340} {"train_loss": -40.669742584228516, "global_step": 162232, "epoch": 1340} {"train_loss": -41.391502380371094, "global_step": 162233, "epoch": 1340} {"train_loss": -40.99565124511719, "global_step": 162234, "epoch": 1340} {"train_loss": -41.18693161010742, "global_step": 162235, "epoch": 1340} {"train_loss": -40.718326568603516, "global_step": 162236, "epoch": 1340} {"train_loss": -41.21212387084961, "global_step": 162237, "epoch": 1340} {"train_loss": -40.52657699584961, "global_step": 162238, "epoch": 1340} {"train_loss": -40.33173370361328, "global_step": 162239, "epoch": 1340} {"train_loss": -41.649192810058594, "global_step": 162240, "epoch": 1340} {"train_loss": -41.314579010009766, "global_step": 162241, "epoch": 1340} {"train_loss": -40.881919860839844, "global_step": 162242, "epoch": 1340} {"train_loss": -40.75130081176758, "global_step": 162243, "epoch": 1340} {"train_loss": -40.847694396972656, "global_step": 162244, "epoch": 1340} {"train_loss": -41.788787841796875, "global_step": 162245, "epoch": 1340} {"train_loss": -39.81608581542969, "global_step": 162246, "epoch": 1340} {"train_loss": -41.885738372802734, "global_step": 162247, "epoch": 1340} {"train_loss": -40.8843879699707, "global_step": 162248, "epoch": 1340} {"train_loss": -38.70330810546875, "global_step": 162249, "epoch": 1340} {"train_loss": -38.994300842285156, "global_step": 162250, "epoch": 1340} {"train_loss": -40.6517448425293, "global_step": 162251, "epoch": 1340} {"train_loss": -41.179832458496094, "global_step": 162252, "epoch": 1340} {"train_loss": -40.27350616455078, "global_step": 162253, "epoch": 1340} {"train_loss": -40.239654541015625, "global_step": 162254, "epoch": 1340} {"train_loss": -41.177223205566406, "global_step": 162255, "epoch": 1340} {"train_loss": -41.72493362426758, "global_step": 162256, "epoch": 1340} {"train_loss": -40.2336540222168, "global_step": 162257, "epoch": 1340} {"train_loss": -41.11323165893555, "global_step": 162258, "epoch": 1340} {"train_loss": -41.30328369140625, "global_step": 162259, "epoch": 1340} {"train_loss": -40.31391657679534, "global_step": 162260, "epoch": 1340, "val_loss": 2583706.75} {"train_loss": -41.75507354736328, "global_step": 162261, "epoch": 1341} {"train_loss": -41.806419372558594, "global_step": 162262, "epoch": 1341} {"train_loss": -41.41999435424805, "global_step": 162263, "epoch": 1341} {"train_loss": -41.58681106567383, "global_step": 162264, "epoch": 1341} {"train_loss": -41.56257247924805, "global_step": 162265, "epoch": 1341} {"train_loss": -41.62972640991211, "global_step": 162266, "epoch": 1341} {"train_loss": -41.80801773071289, "global_step": 162267, "epoch": 1341} {"train_loss": -41.79541015625, "global_step": 162268, "epoch": 1341} {"train_loss": -41.96492385864258, "global_step": 162269, "epoch": 1341} {"train_loss": -41.52710723876953, "global_step": 162270, "epoch": 1341} {"train_loss": -42.02345657348633, "global_step": 162271, "epoch": 1341} {"train_loss": -41.904422760009766, "global_step": 162272, "epoch": 1341} {"train_loss": -41.229427337646484, "global_step": 162273, "epoch": 1341} {"train_loss": -40.999542236328125, "global_step": 162274, "epoch": 1341} {"train_loss": -41.7501335144043, "global_step": 162275, "epoch": 1341} {"train_loss": -42.073699951171875, "global_step": 162276, "epoch": 1341} {"train_loss": -41.0762939453125, "global_step": 162277, "epoch": 1341} {"train_loss": -41.6518669128418, "global_step": 162278, "epoch": 1341} {"train_loss": -41.3376350402832, "global_step": 162279, "epoch": 1341} {"train_loss": -41.35334014892578, "global_step": 162280, "epoch": 1341} {"train_loss": -40.83842849731445, "global_step": 162281, "epoch": 1341} {"train_loss": -40.99755859375, "global_step": 162282, "epoch": 1341} {"train_loss": -41.6691780090332, "global_step": 162283, "epoch": 1341} {"train_loss": -40.9714469909668, "global_step": 162284, "epoch": 1341} {"train_loss": -41.157325744628906, "global_step": 162285, "epoch": 1341} {"train_loss": -40.40506362915039, "global_step": 162286, "epoch": 1341} {"train_loss": -40.612091064453125, "global_step": 162287, "epoch": 1341} {"train_loss": -39.992977142333984, "global_step": 162288, "epoch": 1341} {"train_loss": -38.66347885131836, "global_step": 162289, "epoch": 1341} {"train_loss": -36.94584274291992, "global_step": 162290, "epoch": 1341} {"train_loss": -38.07816696166992, "global_step": 162291, "epoch": 1341} {"train_loss": -40.640220642089844, "global_step": 162292, "epoch": 1341} {"train_loss": -40.7527961730957, "global_step": 162293, "epoch": 1341} {"train_loss": -37.4228401184082, "global_step": 162294, "epoch": 1341} {"train_loss": -38.105220794677734, "global_step": 162295, "epoch": 1341} {"train_loss": -41.1952018737793, "global_step": 162296, "epoch": 1341} {"train_loss": -39.588348388671875, "global_step": 162297, "epoch": 1341} {"train_loss": -38.67338562011719, "global_step": 162298, "epoch": 1341} {"train_loss": -40.92544937133789, "global_step": 162299, "epoch": 1341} {"train_loss": -40.89803695678711, "global_step": 162300, "epoch": 1341} {"train_loss": -37.00358963012695, "global_step": 162301, "epoch": 1341} {"train_loss": -38.7617301940918, "global_step": 162302, "epoch": 1341} {"train_loss": -40.387489318847656, "global_step": 162303, "epoch": 1341} {"train_loss": -38.451393127441406, "global_step": 162304, "epoch": 1341} {"train_loss": -37.25834274291992, "global_step": 162305, "epoch": 1341} {"train_loss": -40.33320999145508, "global_step": 162306, "epoch": 1341} {"train_loss": -37.538570404052734, "global_step": 162307, "epoch": 1341} {"train_loss": -39.727134704589844, "global_step": 162308, "epoch": 1341} {"train_loss": -39.49026107788086, "global_step": 162309, "epoch": 1341} {"train_loss": -39.395931243896484, "global_step": 162310, "epoch": 1341} {"train_loss": -40.50858688354492, "global_step": 162311, "epoch": 1341} {"train_loss": -40.065486907958984, "global_step": 162312, "epoch": 1341} {"train_loss": -40.02909469604492, "global_step": 162313, "epoch": 1341} {"train_loss": -39.844627380371094, "global_step": 162314, "epoch": 1341} {"train_loss": -40.362030029296875, "global_step": 162315, "epoch": 1341} {"train_loss": -40.31182861328125, "global_step": 162316, "epoch": 1341} {"train_loss": -40.0519905090332, "global_step": 162317, "epoch": 1341} {"train_loss": -40.36602020263672, "global_step": 162318, "epoch": 1341} {"train_loss": -40.831451416015625, "global_step": 162319, "epoch": 1341} {"train_loss": -40.5150260925293, "global_step": 162320, "epoch": 1341} {"train_loss": -40.969696044921875, "global_step": 162321, "epoch": 1341} {"train_loss": -40.77129364013672, "global_step": 162322, "epoch": 1341} {"train_loss": -40.4085578918457, "global_step": 162323, "epoch": 1341} {"train_loss": -40.19259262084961, "global_step": 162324, "epoch": 1341} {"train_loss": -39.97446823120117, "global_step": 162325, "epoch": 1341} {"train_loss": -41.36623764038086, "global_step": 162326, "epoch": 1341} {"train_loss": -40.93742370605469, "global_step": 162327, "epoch": 1341} {"train_loss": -40.153404235839844, "global_step": 162328, "epoch": 1341} {"train_loss": -41.436981201171875, "global_step": 162329, "epoch": 1341} {"train_loss": -40.4088020324707, "global_step": 162330, "epoch": 1341} {"train_loss": -40.72639083862305, "global_step": 162331, "epoch": 1341} {"train_loss": -40.67343521118164, "global_step": 162332, "epoch": 1341} {"train_loss": -39.46723175048828, "global_step": 162333, "epoch": 1341} {"train_loss": -40.6453971862793, "global_step": 162334, "epoch": 1341} {"train_loss": -40.065155029296875, "global_step": 162335, "epoch": 1341} {"train_loss": -41.10354995727539, "global_step": 162336, "epoch": 1341} {"train_loss": -40.004066467285156, "global_step": 162337, "epoch": 1341} {"train_loss": -40.978450775146484, "global_step": 162338, "epoch": 1341} {"train_loss": -39.451416015625, "global_step": 162339, "epoch": 1341} {"train_loss": -41.15443801879883, "global_step": 162340, "epoch": 1341} {"train_loss": -41.099586486816406, "global_step": 162341, "epoch": 1341} {"train_loss": -40.58211898803711, "global_step": 162342, "epoch": 1341} {"train_loss": -41.143653869628906, "global_step": 162343, "epoch": 1341} {"train_loss": -40.67070388793945, "global_step": 162344, "epoch": 1341} {"train_loss": -41.68268585205078, "global_step": 162345, "epoch": 1341} {"train_loss": -40.13267135620117, "global_step": 162346, "epoch": 1341} {"train_loss": -41.54160690307617, "global_step": 162347, "epoch": 1341} {"train_loss": -40.9904670715332, "global_step": 162348, "epoch": 1341} {"train_loss": -40.8914909362793, "global_step": 162349, "epoch": 1341} {"train_loss": -40.5703010559082, "global_step": 162350, "epoch": 1341} {"train_loss": -41.68732833862305, "global_step": 162351, "epoch": 1341} {"train_loss": -40.915069580078125, "global_step": 162352, "epoch": 1341} {"train_loss": -41.06308364868164, "global_step": 162353, "epoch": 1341} {"train_loss": -40.984962463378906, "global_step": 162354, "epoch": 1341} {"train_loss": -40.1530647277832, "global_step": 162355, "epoch": 1341} {"train_loss": -40.169795989990234, "global_step": 162356, "epoch": 1341} {"train_loss": -41.06267166137695, "global_step": 162357, "epoch": 1341} {"train_loss": -39.95233917236328, "global_step": 162358, "epoch": 1341} {"train_loss": -40.46857833862305, "global_step": 162359, "epoch": 1341} {"train_loss": -40.699073791503906, "global_step": 162360, "epoch": 1341} {"train_loss": -40.77530288696289, "global_step": 162361, "epoch": 1341} {"train_loss": -41.04703140258789, "global_step": 162362, "epoch": 1341} {"train_loss": -41.661319732666016, "global_step": 162363, "epoch": 1341} {"train_loss": -40.35397720336914, "global_step": 162364, "epoch": 1341} {"train_loss": -39.88228225708008, "global_step": 162365, "epoch": 1341} {"train_loss": -40.9193229675293, "global_step": 162366, "epoch": 1341} {"train_loss": -40.38296127319336, "global_step": 162367, "epoch": 1341} {"train_loss": -41.033599853515625, "global_step": 162368, "epoch": 1341} {"train_loss": -41.83382034301758, "global_step": 162369, "epoch": 1341} {"train_loss": -41.113990783691406, "global_step": 162370, "epoch": 1341} {"train_loss": -41.52383041381836, "global_step": 162371, "epoch": 1341} {"train_loss": -41.26496887207031, "global_step": 162372, "epoch": 1341} {"train_loss": -41.465511322021484, "global_step": 162373, "epoch": 1341} {"train_loss": -41.181427001953125, "global_step": 162374, "epoch": 1341} {"train_loss": -41.31728744506836, "global_step": 162375, "epoch": 1341} {"train_loss": -41.602291107177734, "global_step": 162376, "epoch": 1341} {"train_loss": -41.74335479736328, "global_step": 162377, "epoch": 1341} {"train_loss": -41.003761291503906, "global_step": 162378, "epoch": 1341} {"train_loss": -42.07772445678711, "global_step": 162379, "epoch": 1341} {"train_loss": -41.074459075927734, "global_step": 162380, "epoch": 1341} {"train_loss": -40.61203759563856, "global_step": 162381, "epoch": 1341, "val_loss": 2621288.75} {"train_loss": -41.29718780517578, "global_step": 162382, "epoch": 1342} {"train_loss": -41.77622604370117, "global_step": 162383, "epoch": 1342} {"train_loss": -41.8909912109375, "global_step": 162384, "epoch": 1342} {"train_loss": -40.88685607910156, "global_step": 162385, "epoch": 1342} {"train_loss": -40.98183822631836, "global_step": 162386, "epoch": 1342} {"train_loss": -40.91012191772461, "global_step": 162387, "epoch": 1342} {"train_loss": -40.36139678955078, "global_step": 162388, "epoch": 1342} {"train_loss": -40.66954803466797, "global_step": 162389, "epoch": 1342} {"train_loss": -41.135929107666016, "global_step": 162390, "epoch": 1342} {"train_loss": -41.95168685913086, "global_step": 162391, "epoch": 1342} {"train_loss": -39.01598358154297, "global_step": 162392, "epoch": 1342} {"train_loss": -37.79151153564453, "global_step": 162393, "epoch": 1342} {"train_loss": -39.33903121948242, "global_step": 162394, "epoch": 1342} {"train_loss": -38.54909133911133, "global_step": 162395, "epoch": 1342} {"train_loss": -40.74536895751953, "global_step": 162396, "epoch": 1342} {"train_loss": -41.9539794921875, "global_step": 162397, "epoch": 1342} {"train_loss": -41.1455192565918, "global_step": 162398, "epoch": 1342} {"train_loss": -41.47336196899414, "global_step": 162399, "epoch": 1342} {"train_loss": -41.41738510131836, "global_step": 162400, "epoch": 1342} {"train_loss": -40.74557113647461, "global_step": 162401, "epoch": 1342} {"train_loss": -40.15218734741211, "global_step": 162402, "epoch": 1342} {"train_loss": -41.2530632019043, "global_step": 162403, "epoch": 1342} {"train_loss": -41.7343635559082, "global_step": 162404, "epoch": 1342} {"train_loss": -40.369598388671875, "global_step": 162405, "epoch": 1342} {"train_loss": -41.09904479980469, "global_step": 162406, "epoch": 1342} {"train_loss": -41.79157638549805, "global_step": 162407, "epoch": 1342} {"train_loss": -38.8940315246582, "global_step": 162408, "epoch": 1342} {"train_loss": -40.620357513427734, "global_step": 162409, "epoch": 1342} {"train_loss": -41.22415542602539, "global_step": 162410, "epoch": 1342} {"train_loss": -40.69062423706055, "global_step": 162411, "epoch": 1342} {"train_loss": -41.6043701171875, "global_step": 162412, "epoch": 1342} {"train_loss": -40.935062408447266, "global_step": 162413, "epoch": 1342} {"train_loss": -41.11030197143555, "global_step": 162414, "epoch": 1342} {"train_loss": -42.04987716674805, "global_step": 162415, "epoch": 1342} {"train_loss": -41.80342102050781, "global_step": 162416, "epoch": 1342} {"train_loss": -41.4743766784668, "global_step": 162417, "epoch": 1342} {"train_loss": -41.56327819824219, "global_step": 162418, "epoch": 1342} {"train_loss": -40.732276916503906, "global_step": 162419, "epoch": 1342} {"train_loss": -41.81276321411133, "global_step": 162420, "epoch": 1342} {"train_loss": -41.63497543334961, "global_step": 162421, "epoch": 1342} {"train_loss": -40.29460525512695, "global_step": 162422, "epoch": 1342} {"train_loss": -37.83833694458008, "global_step": 162423, "epoch": 1342} {"train_loss": -39.554378509521484, "global_step": 162424, "epoch": 1342} {"train_loss": -41.110923767089844, "global_step": 162425, "epoch": 1342} {"train_loss": -41.533409118652344, "global_step": 162426, "epoch": 1342} {"train_loss": -41.376800537109375, "global_step": 162427, "epoch": 1342} {"train_loss": -40.57125473022461, "global_step": 162428, "epoch": 1342} {"train_loss": -41.2131233215332, "global_step": 162429, "epoch": 1342} {"train_loss": -42.21503829956055, "global_step": 162430, "epoch": 1342} {"train_loss": -41.04345703125, "global_step": 162431, "epoch": 1342} {"train_loss": -40.45917892456055, "global_step": 162432, "epoch": 1342} {"train_loss": -41.11457061767578, "global_step": 162433, "epoch": 1342} {"train_loss": -40.98219680786133, "global_step": 162434, "epoch": 1342} {"train_loss": -41.008052825927734, "global_step": 162435, "epoch": 1342} {"train_loss": -39.29790115356445, "global_step": 162436, "epoch": 1342} {"train_loss": -38.72888946533203, "global_step": 162437, "epoch": 1342} {"train_loss": -37.10749435424805, "global_step": 162438, "epoch": 1342} {"train_loss": -38.2943229675293, "global_step": 162439, "epoch": 1342} {"train_loss": -41.56510543823242, "global_step": 162440, "epoch": 1342} {"train_loss": -39.02748489379883, "global_step": 162441, "epoch": 1342} {"train_loss": -40.54160690307617, "global_step": 162442, "epoch": 1342} {"train_loss": -41.42982864379883, "global_step": 162443, "epoch": 1342} {"train_loss": -40.34986114501953, "global_step": 162444, "epoch": 1342} {"train_loss": -39.8689079284668, "global_step": 162445, "epoch": 1342} {"train_loss": -41.496585845947266, "global_step": 162446, "epoch": 1342} {"train_loss": -40.87629318237305, "global_step": 162447, "epoch": 1342} {"train_loss": -40.657806396484375, "global_step": 162448, "epoch": 1342} {"train_loss": -40.158504486083984, "global_step": 162449, "epoch": 1342} {"train_loss": -40.639949798583984, "global_step": 162450, "epoch": 1342} {"train_loss": -41.59763717651367, "global_step": 162451, "epoch": 1342} {"train_loss": -41.518524169921875, "global_step": 162452, "epoch": 1342} {"train_loss": -40.48596954345703, "global_step": 162453, "epoch": 1342} {"train_loss": -41.34351348876953, "global_step": 162454, "epoch": 1342} {"train_loss": -42.27274703979492, "global_step": 162455, "epoch": 1342} {"train_loss": -41.52756881713867, "global_step": 162456, "epoch": 1342} {"train_loss": -42.08677673339844, "global_step": 162457, "epoch": 1342} {"train_loss": -40.5766716003418, "global_step": 162458, "epoch": 1342} {"train_loss": -41.82149887084961, "global_step": 162459, "epoch": 1342} {"train_loss": -41.83407211303711, "global_step": 162460, "epoch": 1342} {"train_loss": -41.80349349975586, "global_step": 162461, "epoch": 1342} {"train_loss": -41.67090606689453, "global_step": 162462, "epoch": 1342} {"train_loss": -41.830650329589844, "global_step": 162463, "epoch": 1342} {"train_loss": -41.8179817199707, "global_step": 162464, "epoch": 1342} {"train_loss": -42.1192741394043, "global_step": 162465, "epoch": 1342} {"train_loss": -41.54679489135742, "global_step": 162466, "epoch": 1342} {"train_loss": -41.77726364135742, "global_step": 162467, "epoch": 1342} {"train_loss": -42.3383903503418, "global_step": 162468, "epoch": 1342} {"train_loss": -42.24046325683594, "global_step": 162469, "epoch": 1342} {"train_loss": -42.22241973876953, "global_step": 162470, "epoch": 1342} {"train_loss": -42.53831100463867, "global_step": 162471, "epoch": 1342} {"train_loss": -42.285091400146484, "global_step": 162472, "epoch": 1342} {"train_loss": -42.35752487182617, "global_step": 162473, "epoch": 1342} {"train_loss": -42.410377502441406, "global_step": 162474, "epoch": 1342} {"train_loss": -41.996315002441406, "global_step": 162475, "epoch": 1342} {"train_loss": -40.98488235473633, "global_step": 162476, "epoch": 1342} {"train_loss": -37.75655746459961, "global_step": 162477, "epoch": 1342} {"train_loss": -36.413631439208984, "global_step": 162478, "epoch": 1342} {"train_loss": -38.286109924316406, "global_step": 162479, "epoch": 1342} {"train_loss": -40.75934982299805, "global_step": 162480, "epoch": 1342} {"train_loss": -37.4243049621582, "global_step": 162481, "epoch": 1342} {"train_loss": -38.24654006958008, "global_step": 162482, "epoch": 1342} {"train_loss": -41.08376693725586, "global_step": 162483, "epoch": 1342} {"train_loss": -40.303768157958984, "global_step": 162484, "epoch": 1342} {"train_loss": -41.12799835205078, "global_step": 162485, "epoch": 1342} {"train_loss": -41.280757904052734, "global_step": 162486, "epoch": 1342} {"train_loss": -40.795494079589844, "global_step": 162487, "epoch": 1342} {"train_loss": -40.502532958984375, "global_step": 162488, "epoch": 1342} {"train_loss": -40.82332992553711, "global_step": 162489, "epoch": 1342} {"train_loss": -40.87413787841797, "global_step": 162490, "epoch": 1342} {"train_loss": -41.14569091796875, "global_step": 162491, "epoch": 1342} {"train_loss": -41.361671447753906, "global_step": 162492, "epoch": 1342} {"train_loss": -41.50112533569336, "global_step": 162493, "epoch": 1342} {"train_loss": -40.69108963012695, "global_step": 162494, "epoch": 1342} {"train_loss": -40.80165481567383, "global_step": 162495, "epoch": 1342} {"train_loss": -41.16597366333008, "global_step": 162496, "epoch": 1342} {"train_loss": -40.572242736816406, "global_step": 162497, "epoch": 1342} {"train_loss": -41.017906188964844, "global_step": 162498, "epoch": 1342} {"train_loss": -41.219688415527344, "global_step": 162499, "epoch": 1342} {"train_loss": -41.26553726196289, "global_step": 162500, "epoch": 1342} {"train_loss": -40.523658752441406, "global_step": 162501, "epoch": 1342} {"train_loss": -40.832763135925795, "global_step": 162502, "epoch": 1342, "val_loss": 2579961.75} {"train_loss": -41.12208938598633, "global_step": 162503, "epoch": 1343} {"train_loss": -40.43196105957031, "global_step": 162504, "epoch": 1343} {"train_loss": -40.59844970703125, "global_step": 162505, "epoch": 1343} {"train_loss": -41.94256591796875, "global_step": 162506, "epoch": 1343} {"train_loss": -40.64813995361328, "global_step": 162507, "epoch": 1343} {"train_loss": -39.28664016723633, "global_step": 162508, "epoch": 1343} {"train_loss": -40.86085510253906, "global_step": 162509, "epoch": 1343} {"train_loss": -41.40761184692383, "global_step": 162510, "epoch": 1343} {"train_loss": -41.07546615600586, "global_step": 162511, "epoch": 1343} {"train_loss": -40.408111572265625, "global_step": 162512, "epoch": 1343} {"train_loss": -40.703487396240234, "global_step": 162513, "epoch": 1343} {"train_loss": -41.771846771240234, "global_step": 162514, "epoch": 1343} {"train_loss": -40.12343215942383, "global_step": 162515, "epoch": 1343} {"train_loss": -40.06589889526367, "global_step": 162516, "epoch": 1343} {"train_loss": -40.81546401977539, "global_step": 162517, "epoch": 1343} {"train_loss": -40.83305740356445, "global_step": 162518, "epoch": 1343} {"train_loss": -40.81819534301758, "global_step": 162519, "epoch": 1343} {"train_loss": -40.685279846191406, "global_step": 162520, "epoch": 1343} {"train_loss": -41.112789154052734, "global_step": 162521, "epoch": 1343} {"train_loss": -40.493595123291016, "global_step": 162522, "epoch": 1343} {"train_loss": -40.94054412841797, "global_step": 162523, "epoch": 1343} {"train_loss": -41.02991485595703, "global_step": 162524, "epoch": 1343} {"train_loss": -40.742069244384766, "global_step": 162525, "epoch": 1343} {"train_loss": -40.684974670410156, "global_step": 162526, "epoch": 1343} {"train_loss": -40.63448715209961, "global_step": 162527, "epoch": 1343} {"train_loss": -40.96635055541992, "global_step": 162528, "epoch": 1343} {"train_loss": -40.537841796875, "global_step": 162529, "epoch": 1343} {"train_loss": -41.139739990234375, "global_step": 162530, "epoch": 1343} {"train_loss": -41.35756301879883, "global_step": 162531, "epoch": 1343} {"train_loss": -39.09674072265625, "global_step": 162532, "epoch": 1343} {"train_loss": -41.725738525390625, "global_step": 162533, "epoch": 1343} {"train_loss": -39.762271881103516, "global_step": 162534, "epoch": 1343} {"train_loss": -39.018463134765625, "global_step": 162535, "epoch": 1343} {"train_loss": -40.40825653076172, "global_step": 162536, "epoch": 1343} {"train_loss": -39.89617919921875, "global_step": 162537, "epoch": 1343} {"train_loss": -40.10239791870117, "global_step": 162538, "epoch": 1343} {"train_loss": -40.48347091674805, "global_step": 162539, "epoch": 1343} {"train_loss": -40.41856002807617, "global_step": 162540, "epoch": 1343} {"train_loss": -40.644065856933594, "global_step": 162541, "epoch": 1343} {"train_loss": -40.85929489135742, "global_step": 162542, "epoch": 1343} {"train_loss": -39.92915725708008, "global_step": 162543, "epoch": 1343} {"train_loss": -41.042022705078125, "global_step": 162544, "epoch": 1343} {"train_loss": -41.48685836791992, "global_step": 162545, "epoch": 1343} {"train_loss": -39.74237060546875, "global_step": 162546, "epoch": 1343} {"train_loss": -40.77657699584961, "global_step": 162547, "epoch": 1343} {"train_loss": -41.106117248535156, "global_step": 162548, "epoch": 1343} {"train_loss": -40.88190460205078, "global_step": 162549, "epoch": 1343} {"train_loss": -40.64075469970703, "global_step": 162550, "epoch": 1343} {"train_loss": -41.409828186035156, "global_step": 162551, "epoch": 1343} {"train_loss": -41.04513168334961, "global_step": 162552, "epoch": 1343} {"train_loss": -40.8048095703125, "global_step": 162553, "epoch": 1343} {"train_loss": -40.622432708740234, "global_step": 162554, "epoch": 1343} {"train_loss": -41.05385208129883, "global_step": 162555, "epoch": 1343} {"train_loss": -40.97251892089844, "global_step": 162556, "epoch": 1343} {"train_loss": -41.92857360839844, "global_step": 162557, "epoch": 1343} {"train_loss": -41.35941696166992, "global_step": 162558, "epoch": 1343} {"train_loss": -41.60901641845703, "global_step": 162559, "epoch": 1343} {"train_loss": -40.95930099487305, "global_step": 162560, "epoch": 1343} {"train_loss": -41.12373733520508, "global_step": 162561, "epoch": 1343} {"train_loss": -41.95206832885742, "global_step": 162562, "epoch": 1343} {"train_loss": -41.44936752319336, "global_step": 162563, "epoch": 1343} {"train_loss": -41.17275619506836, "global_step": 162564, "epoch": 1343} {"train_loss": -41.50075912475586, "global_step": 162565, "epoch": 1343} {"train_loss": -41.468868255615234, "global_step": 162566, "epoch": 1343} {"train_loss": -41.333858489990234, "global_step": 162567, "epoch": 1343} {"train_loss": -41.54180908203125, "global_step": 162568, "epoch": 1343} {"train_loss": -41.6071662902832, "global_step": 162569, "epoch": 1343} {"train_loss": -41.723384857177734, "global_step": 162570, "epoch": 1343} {"train_loss": -41.155029296875, "global_step": 162571, "epoch": 1343} {"train_loss": -41.61814498901367, "global_step": 162572, "epoch": 1343} {"train_loss": -41.92558670043945, "global_step": 162573, "epoch": 1343} {"train_loss": -41.884918212890625, "global_step": 162574, "epoch": 1343} {"train_loss": -41.64955520629883, "global_step": 162575, "epoch": 1343} {"train_loss": -41.484710693359375, "global_step": 162576, "epoch": 1343} {"train_loss": -41.867103576660156, "global_step": 162577, "epoch": 1343} {"train_loss": -41.75887680053711, "global_step": 162578, "epoch": 1343} {"train_loss": -40.749786376953125, "global_step": 162579, "epoch": 1343} {"train_loss": -41.75673294067383, "global_step": 162580, "epoch": 1343} {"train_loss": -41.860591888427734, "global_step": 162581, "epoch": 1343} {"train_loss": -42.41661834716797, "global_step": 162582, "epoch": 1343} {"train_loss": -42.14158630371094, "global_step": 162583, "epoch": 1343} {"train_loss": -42.147132873535156, "global_step": 162584, "epoch": 1343} {"train_loss": -41.079166412353516, "global_step": 162585, "epoch": 1343} {"train_loss": -41.425899505615234, "global_step": 162586, "epoch": 1343} {"train_loss": -41.37761306762695, "global_step": 162587, "epoch": 1343} {"train_loss": -41.16135787963867, "global_step": 162588, "epoch": 1343} {"train_loss": -42.10455322265625, "global_step": 162589, "epoch": 1343} {"train_loss": -42.131595611572266, "global_step": 162590, "epoch": 1343} {"train_loss": -41.922908782958984, "global_step": 162591, "epoch": 1343} {"train_loss": -41.9577751159668, "global_step": 162592, "epoch": 1343} {"train_loss": -42.413448333740234, "global_step": 162593, "epoch": 1343} {"train_loss": -41.84634017944336, "global_step": 162594, "epoch": 1343} {"train_loss": -40.761898040771484, "global_step": 162595, "epoch": 1343} {"train_loss": -38.93952178955078, "global_step": 162596, "epoch": 1343} {"train_loss": -39.98849105834961, "global_step": 162597, "epoch": 1343} {"train_loss": -41.923458099365234, "global_step": 162598, "epoch": 1343} {"train_loss": -42.18354415893555, "global_step": 162599, "epoch": 1343} {"train_loss": -40.86279296875, "global_step": 162600, "epoch": 1343} {"train_loss": -41.716373443603516, "global_step": 162601, "epoch": 1343} {"train_loss": -41.9528923034668, "global_step": 162602, "epoch": 1343} {"train_loss": -40.945831298828125, "global_step": 162603, "epoch": 1343} {"train_loss": -38.800289154052734, "global_step": 162604, "epoch": 1343} {"train_loss": -40.4388542175293, "global_step": 162605, "epoch": 1343} {"train_loss": -41.46166229248047, "global_step": 162606, "epoch": 1343} {"train_loss": -40.63361740112305, "global_step": 162607, "epoch": 1343} {"train_loss": -41.93600082397461, "global_step": 162608, "epoch": 1343} {"train_loss": -41.572872161865234, "global_step": 162609, "epoch": 1343} {"train_loss": -41.96910095214844, "global_step": 162610, "epoch": 1343} {"train_loss": -41.43874740600586, "global_step": 162611, "epoch": 1343} {"train_loss": -41.75566482543945, "global_step": 162612, "epoch": 1343} {"train_loss": -42.0206298828125, "global_step": 162613, "epoch": 1343} {"train_loss": -42.22320556640625, "global_step": 162614, "epoch": 1343} {"train_loss": -41.53754806518555, "global_step": 162615, "epoch": 1343} {"train_loss": -41.75565719604492, "global_step": 162616, "epoch": 1343} {"train_loss": -41.53173065185547, "global_step": 162617, "epoch": 1343} {"train_loss": -41.87752151489258, "global_step": 162618, "epoch": 1343} {"train_loss": -41.477813720703125, "global_step": 162619, "epoch": 1343} {"train_loss": -42.061649322509766, "global_step": 162620, "epoch": 1343} {"train_loss": -41.545318603515625, "global_step": 162621, "epoch": 1343} {"train_loss": -41.18695831298828, "global_step": 162622, "epoch": 1343} {"train_loss": -41.137773655662855, "global_step": 162623, "epoch": 1343, "val_loss": 2590666.0} {"train_loss": -39.67850875854492, "global_step": 162624, "epoch": 1344} {"train_loss": -33.34803771972656, "global_step": 162625, "epoch": 1344} {"train_loss": -40.285926818847656, "global_step": 162626, "epoch": 1344} {"train_loss": -29.995813369750977, "global_step": 162627, "epoch": 1344} {"train_loss": -36.029117584228516, "global_step": 162628, "epoch": 1344} {"train_loss": -36.05060958862305, "global_step": 162629, "epoch": 1344} {"train_loss": -29.596113204956055, "global_step": 162630, "epoch": 1344} {"train_loss": -31.810693740844727, "global_step": 162631, "epoch": 1344} {"train_loss": -36.06559371948242, "global_step": 162632, "epoch": 1344} {"train_loss": -39.059539794921875, "global_step": 162633, "epoch": 1344} {"train_loss": -38.87753677368164, "global_step": 162634, "epoch": 1344} {"train_loss": -39.6999626159668, "global_step": 162635, "epoch": 1344} {"train_loss": -39.30902862548828, "global_step": 162636, "epoch": 1344} {"train_loss": -39.71497344970703, "global_step": 162637, "epoch": 1344} {"train_loss": -38.94245910644531, "global_step": 162638, "epoch": 1344} {"train_loss": -39.46310043334961, "global_step": 162639, "epoch": 1344} {"train_loss": -40.0754508972168, "global_step": 162640, "epoch": 1344} {"train_loss": -40.05681228637695, "global_step": 162641, "epoch": 1344} {"train_loss": -40.2448616027832, "global_step": 162642, "epoch": 1344} {"train_loss": -39.80244064331055, "global_step": 162643, "epoch": 1344} {"train_loss": -40.55629348754883, "global_step": 162644, "epoch": 1344} {"train_loss": -39.2990837097168, "global_step": 162645, "epoch": 1344} {"train_loss": -40.458614349365234, "global_step": 162646, "epoch": 1344} {"train_loss": -39.398685455322266, "global_step": 162647, "epoch": 1344} {"train_loss": -40.540523529052734, "global_step": 162648, "epoch": 1344} {"train_loss": -38.5634880065918, "global_step": 162649, "epoch": 1344} {"train_loss": -40.556678771972656, "global_step": 162650, "epoch": 1344} {"train_loss": -39.59199905395508, "global_step": 162651, "epoch": 1344} {"train_loss": -40.626983642578125, "global_step": 162652, "epoch": 1344} {"train_loss": -39.615169525146484, "global_step": 162653, "epoch": 1344} {"train_loss": -40.530147552490234, "global_step": 162654, "epoch": 1344} {"train_loss": -39.46042251586914, "global_step": 162655, "epoch": 1344} {"train_loss": -40.97915267944336, "global_step": 162656, "epoch": 1344} {"train_loss": -40.46498489379883, "global_step": 162657, "epoch": 1344} {"train_loss": -41.014678955078125, "global_step": 162658, "epoch": 1344} {"train_loss": -40.83698654174805, "global_step": 162659, "epoch": 1344} {"train_loss": -40.48519515991211, "global_step": 162660, "epoch": 1344} {"train_loss": -40.78207778930664, "global_step": 162661, "epoch": 1344} {"train_loss": -41.2853889465332, "global_step": 162662, "epoch": 1344} {"train_loss": -40.891075134277344, "global_step": 162663, "epoch": 1344} {"train_loss": -40.294918060302734, "global_step": 162664, "epoch": 1344} {"train_loss": -40.73226547241211, "global_step": 162665, "epoch": 1344} {"train_loss": -40.975608825683594, "global_step": 162666, "epoch": 1344} {"train_loss": -41.16294860839844, "global_step": 162667, "epoch": 1344} {"train_loss": -40.54596710205078, "global_step": 162668, "epoch": 1344} {"train_loss": -41.9366455078125, "global_step": 162669, "epoch": 1344} {"train_loss": -40.515262603759766, "global_step": 162670, "epoch": 1344} {"train_loss": -41.78949737548828, "global_step": 162671, "epoch": 1344} {"train_loss": -41.45118713378906, "global_step": 162672, "epoch": 1344} {"train_loss": -41.11660385131836, "global_step": 162673, "epoch": 1344} {"train_loss": -41.2678108215332, "global_step": 162674, "epoch": 1344} {"train_loss": -41.698448181152344, "global_step": 162675, "epoch": 1344} {"train_loss": -41.24210739135742, "global_step": 162676, "epoch": 1344} {"train_loss": -41.68390655517578, "global_step": 162677, "epoch": 1344} {"train_loss": -41.25457000732422, "global_step": 162678, "epoch": 1344} {"train_loss": -41.59730529785156, "global_step": 162679, "epoch": 1344} {"train_loss": -41.03776168823242, "global_step": 162680, "epoch": 1344} {"train_loss": -41.94536590576172, "global_step": 162681, "epoch": 1344} {"train_loss": -41.8772087097168, "global_step": 162682, "epoch": 1344} {"train_loss": -40.09751892089844, "global_step": 162683, "epoch": 1344} {"train_loss": -41.69734191894531, "global_step": 162684, "epoch": 1344} {"train_loss": -41.049251556396484, "global_step": 162685, "epoch": 1344} {"train_loss": -41.72823715209961, "global_step": 162686, "epoch": 1344} {"train_loss": -41.66999053955078, "global_step": 162687, "epoch": 1344} {"train_loss": -40.31888961791992, "global_step": 162688, "epoch": 1344} {"train_loss": -41.64101791381836, "global_step": 162689, "epoch": 1344} {"train_loss": -41.77589797973633, "global_step": 162690, "epoch": 1344} {"train_loss": -41.15857696533203, "global_step": 162691, "epoch": 1344} {"train_loss": -41.21890640258789, "global_step": 162692, "epoch": 1344} {"train_loss": -42.0557746887207, "global_step": 162693, "epoch": 1344} {"train_loss": -40.119178771972656, "global_step": 162694, "epoch": 1344} {"train_loss": -41.85892868041992, "global_step": 162695, "epoch": 1344} {"train_loss": -41.504520416259766, "global_step": 162696, "epoch": 1344} {"train_loss": -41.28215026855469, "global_step": 162697, "epoch": 1344} {"train_loss": -41.3087043762207, "global_step": 162698, "epoch": 1344} {"train_loss": -41.568946838378906, "global_step": 162699, "epoch": 1344} {"train_loss": -40.62569046020508, "global_step": 162700, "epoch": 1344} {"train_loss": -41.6986198425293, "global_step": 162701, "epoch": 1344} {"train_loss": -41.2595100402832, "global_step": 162702, "epoch": 1344} {"train_loss": -40.8275146484375, "global_step": 162703, "epoch": 1344} {"train_loss": -41.16875457763672, "global_step": 162704, "epoch": 1344} {"train_loss": -40.81325912475586, "global_step": 162705, "epoch": 1344} {"train_loss": -39.97203826904297, "global_step": 162706, "epoch": 1344} {"train_loss": -41.295135498046875, "global_step": 162707, "epoch": 1344} {"train_loss": -41.2738151550293, "global_step": 162708, "epoch": 1344} {"train_loss": -41.12300491333008, "global_step": 162709, "epoch": 1344} {"train_loss": -41.389217376708984, "global_step": 162710, "epoch": 1344} {"train_loss": -41.58827209472656, "global_step": 162711, "epoch": 1344} {"train_loss": -41.5940055847168, "global_step": 162712, "epoch": 1344} {"train_loss": -41.39116668701172, "global_step": 162713, "epoch": 1344} {"train_loss": -40.869876861572266, "global_step": 162714, "epoch": 1344} {"train_loss": -41.68401336669922, "global_step": 162715, "epoch": 1344} {"train_loss": -41.986419677734375, "global_step": 162716, "epoch": 1344} {"train_loss": -41.877105712890625, "global_step": 162717, "epoch": 1344} {"train_loss": -41.52936553955078, "global_step": 162718, "epoch": 1344} {"train_loss": -40.71455001831055, "global_step": 162719, "epoch": 1344} {"train_loss": -41.791015625, "global_step": 162720, "epoch": 1344} {"train_loss": -41.57014465332031, "global_step": 162721, "epoch": 1344} {"train_loss": -41.408538818359375, "global_step": 162722, "epoch": 1344} {"train_loss": -40.59351348876953, "global_step": 162723, "epoch": 1344} {"train_loss": -41.12659454345703, "global_step": 162724, "epoch": 1344} {"train_loss": -40.749324798583984, "global_step": 162725, "epoch": 1344} {"train_loss": -41.510833740234375, "global_step": 162726, "epoch": 1344} {"train_loss": -41.67511749267578, "global_step": 162727, "epoch": 1344} {"train_loss": -40.72378158569336, "global_step": 162728, "epoch": 1344} {"train_loss": -41.65616989135742, "global_step": 162729, "epoch": 1344} {"train_loss": -41.245357513427734, "global_step": 162730, "epoch": 1344} {"train_loss": -41.7507438659668, "global_step": 162731, "epoch": 1344} {"train_loss": -42.267391204833984, "global_step": 162732, "epoch": 1344} {"train_loss": -41.64289474487305, "global_step": 162733, "epoch": 1344} {"train_loss": -41.90987777709961, "global_step": 162734, "epoch": 1344} {"train_loss": -41.02628707885742, "global_step": 162735, "epoch": 1344} {"train_loss": -41.375762939453125, "global_step": 162736, "epoch": 1344} {"train_loss": -41.07035446166992, "global_step": 162737, "epoch": 1344} {"train_loss": -40.45540237426758, "global_step": 162738, "epoch": 1344} {"train_loss": -40.76935958862305, "global_step": 162739, "epoch": 1344} {"train_loss": -41.68136978149414, "global_step": 162740, "epoch": 1344} {"train_loss": -41.283565521240234, "global_step": 162741, "epoch": 1344} {"train_loss": -41.12520980834961, "global_step": 162742, "epoch": 1344} {"train_loss": -38.83864212036133, "global_step": 162743, "epoch": 1344} {"train_loss": -40.36763257428634, "global_step": 162744, "epoch": 1344, "val_loss": 2564195.75} {"train_loss": -35.67939376831055, "global_step": 162745, "epoch": 1345} {"train_loss": -30.24384117126465, "global_step": 162746, "epoch": 1345} {"train_loss": -33.771759033203125, "global_step": 162747, "epoch": 1345} {"train_loss": -35.94001388549805, "global_step": 162748, "epoch": 1345} {"train_loss": -31.30855369567871, "global_step": 162749, "epoch": 1345} {"train_loss": -31.46575355529785, "global_step": 162750, "epoch": 1345} {"train_loss": -36.73202133178711, "global_step": 162751, "epoch": 1345} {"train_loss": -34.649173736572266, "global_step": 162752, "epoch": 1345} {"train_loss": -36.72703170776367, "global_step": 162753, "epoch": 1345} {"train_loss": -31.689584732055664, "global_step": 162754, "epoch": 1345} {"train_loss": -27.148090362548828, "global_step": 162755, "epoch": 1345} {"train_loss": -32.934844970703125, "global_step": 162756, "epoch": 1345} {"train_loss": -36.54411697387695, "global_step": 162757, "epoch": 1345} {"train_loss": -34.6058235168457, "global_step": 162758, "epoch": 1345} {"train_loss": -36.59550857543945, "global_step": 162759, "epoch": 1345} {"train_loss": -37.047786712646484, "global_step": 162760, "epoch": 1345} {"train_loss": -34.993865966796875, "global_step": 162761, "epoch": 1345} {"train_loss": -37.2109489440918, "global_step": 162762, "epoch": 1345} {"train_loss": -36.0048713684082, "global_step": 162763, "epoch": 1345} {"train_loss": -35.42841720581055, "global_step": 162764, "epoch": 1345} {"train_loss": -34.103675842285156, "global_step": 162765, "epoch": 1345} {"train_loss": -36.99351119995117, "global_step": 162766, "epoch": 1345} {"train_loss": -36.785743713378906, "global_step": 162767, "epoch": 1345} {"train_loss": -38.64739227294922, "global_step": 162768, "epoch": 1345} {"train_loss": -38.032894134521484, "global_step": 162769, "epoch": 1345} {"train_loss": -37.95693588256836, "global_step": 162770, "epoch": 1345} {"train_loss": -38.64103317260742, "global_step": 162771, "epoch": 1345} {"train_loss": -39.36436080932617, "global_step": 162772, "epoch": 1345} {"train_loss": -38.883174896240234, "global_step": 162773, "epoch": 1345} {"train_loss": -39.03876876831055, "global_step": 162774, "epoch": 1345} {"train_loss": -38.86384201049805, "global_step": 162775, "epoch": 1345} {"train_loss": -38.232704162597656, "global_step": 162776, "epoch": 1345} {"train_loss": -38.43141555786133, "global_step": 162777, "epoch": 1345} {"train_loss": -39.452972412109375, "global_step": 162778, "epoch": 1345} {"train_loss": -38.82691192626953, "global_step": 162779, "epoch": 1345} {"train_loss": -39.30246353149414, "global_step": 162780, "epoch": 1345} {"train_loss": -39.27264404296875, "global_step": 162781, "epoch": 1345} {"train_loss": -39.797664642333984, "global_step": 162782, "epoch": 1345} {"train_loss": -40.052886962890625, "global_step": 162783, "epoch": 1345} {"train_loss": -39.51266098022461, "global_step": 162784, "epoch": 1345} {"train_loss": -39.78562545776367, "global_step": 162785, "epoch": 1345} {"train_loss": -38.90529251098633, "global_step": 162786, "epoch": 1345} {"train_loss": -40.07990264892578, "global_step": 162787, "epoch": 1345} {"train_loss": -40.24380111694336, "global_step": 162788, "epoch": 1345} {"train_loss": -39.926185607910156, "global_step": 162789, "epoch": 1345} {"train_loss": -40.59733200073242, "global_step": 162790, "epoch": 1345} {"train_loss": -40.01015853881836, "global_step": 162791, "epoch": 1345} {"train_loss": -39.7783203125, "global_step": 162792, "epoch": 1345} {"train_loss": -40.61263656616211, "global_step": 162793, "epoch": 1345} {"train_loss": -39.278785705566406, "global_step": 162794, "epoch": 1345} {"train_loss": -39.86967086791992, "global_step": 162795, "epoch": 1345} {"train_loss": -40.20931625366211, "global_step": 162796, "epoch": 1345} {"train_loss": -39.95596694946289, "global_step": 162797, "epoch": 1345} {"train_loss": -39.866207122802734, "global_step": 162798, "epoch": 1345} {"train_loss": -40.40607833862305, "global_step": 162799, "epoch": 1345} {"train_loss": -40.359352111816406, "global_step": 162800, "epoch": 1345} {"train_loss": -40.714229583740234, "global_step": 162801, "epoch": 1345} {"train_loss": -40.2335205078125, "global_step": 162802, "epoch": 1345} {"train_loss": -39.77939987182617, "global_step": 162803, "epoch": 1345} {"train_loss": -40.702266693115234, "global_step": 162804, "epoch": 1345} {"train_loss": -40.70575714111328, "global_step": 162805, "epoch": 1345} {"train_loss": -40.71165084838867, "global_step": 162806, "epoch": 1345} {"train_loss": -40.30560302734375, "global_step": 162807, "epoch": 1345} {"train_loss": -40.96112060546875, "global_step": 162808, "epoch": 1345} {"train_loss": -40.26117706298828, "global_step": 162809, "epoch": 1345} {"train_loss": -40.47654342651367, "global_step": 162810, "epoch": 1345} {"train_loss": -41.06162643432617, "global_step": 162811, "epoch": 1345} {"train_loss": -40.89850616455078, "global_step": 162812, "epoch": 1345} {"train_loss": -41.012996673583984, "global_step": 162813, "epoch": 1345} {"train_loss": -40.633338928222656, "global_step": 162814, "epoch": 1345} {"train_loss": -40.771087646484375, "global_step": 162815, "epoch": 1345} {"train_loss": -41.04160690307617, "global_step": 162816, "epoch": 1345} {"train_loss": -40.749778747558594, "global_step": 162817, "epoch": 1345} {"train_loss": -41.16279220581055, "global_step": 162818, "epoch": 1345} {"train_loss": -41.11184310913086, "global_step": 162819, "epoch": 1345} {"train_loss": -40.87860107421875, "global_step": 162820, "epoch": 1345} {"train_loss": -41.09767532348633, "global_step": 162821, "epoch": 1345} {"train_loss": -40.8089485168457, "global_step": 162822, "epoch": 1345} {"train_loss": -41.128440856933594, "global_step": 162823, "epoch": 1345} {"train_loss": -40.9779052734375, "global_step": 162824, "epoch": 1345} {"train_loss": -41.41526794433594, "global_step": 162825, "epoch": 1345} {"train_loss": -41.16231155395508, "global_step": 162826, "epoch": 1345} {"train_loss": -41.695308685302734, "global_step": 162827, "epoch": 1345} {"train_loss": -41.47632598876953, "global_step": 162828, "epoch": 1345} {"train_loss": -41.59942626953125, "global_step": 162829, "epoch": 1345} {"train_loss": -40.74599838256836, "global_step": 162830, "epoch": 1345} {"train_loss": -41.724727630615234, "global_step": 162831, "epoch": 1345} {"train_loss": -41.50807571411133, "global_step": 162832, "epoch": 1345} {"train_loss": -41.470970153808594, "global_step": 162833, "epoch": 1345} {"train_loss": -41.40656661987305, "global_step": 162834, "epoch": 1345} {"train_loss": -41.21926498413086, "global_step": 162835, "epoch": 1345} {"train_loss": -41.52052688598633, "global_step": 162836, "epoch": 1345} {"train_loss": -41.35041427612305, "global_step": 162837, "epoch": 1345} {"train_loss": -41.81064987182617, "global_step": 162838, "epoch": 1345} {"train_loss": -41.80216598510742, "global_step": 162839, "epoch": 1345} {"train_loss": -41.4971923828125, "global_step": 162840, "epoch": 1345} {"train_loss": -41.35081100463867, "global_step": 162841, "epoch": 1345} {"train_loss": -41.35271072387695, "global_step": 162842, "epoch": 1345} {"train_loss": -41.21023178100586, "global_step": 162843, "epoch": 1345} {"train_loss": -41.17171859741211, "global_step": 162844, "epoch": 1345} {"train_loss": -40.609657287597656, "global_step": 162845, "epoch": 1345} {"train_loss": -41.52359390258789, "global_step": 162846, "epoch": 1345} {"train_loss": -40.85982131958008, "global_step": 162847, "epoch": 1345} {"train_loss": -39.94985580444336, "global_step": 162848, "epoch": 1345} {"train_loss": -41.414276123046875, "global_step": 162849, "epoch": 1345} {"train_loss": -40.35944366455078, "global_step": 162850, "epoch": 1345} {"train_loss": -40.0645866394043, "global_step": 162851, "epoch": 1345} {"train_loss": -41.288204193115234, "global_step": 162852, "epoch": 1345} {"train_loss": -39.09304428100586, "global_step": 162853, "epoch": 1345} {"train_loss": -39.24398422241211, "global_step": 162854, "epoch": 1345} {"train_loss": -40.744083404541016, "global_step": 162855, "epoch": 1345} {"train_loss": -40.080169677734375, "global_step": 162856, "epoch": 1345} {"train_loss": -41.12678909301758, "global_step": 162857, "epoch": 1345} {"train_loss": -40.54842758178711, "global_step": 162858, "epoch": 1345} {"train_loss": -39.57075119018555, "global_step": 162859, "epoch": 1345} {"train_loss": -33.15766906738281, "global_step": 162860, "epoch": 1345} {"train_loss": -40.372100830078125, "global_step": 162861, "epoch": 1345} {"train_loss": -39.999359130859375, "global_step": 162862, "epoch": 1345} {"train_loss": -40.0157470703125, "global_step": 162863, "epoch": 1345} {"train_loss": -40.89870834350586, "global_step": 162864, "epoch": 1345} {"train_loss": -39.2029921476506, "global_step": 162865, "epoch": 1345, "val_loss": 2898855.25} {"train_loss": -40.15545654296875, "global_step": 162866, "epoch": 1346} {"train_loss": -39.29446029663086, "global_step": 162867, "epoch": 1346} {"train_loss": -39.22334289550781, "global_step": 162868, "epoch": 1346} {"train_loss": -40.444698333740234, "global_step": 162869, "epoch": 1346} {"train_loss": -40.60055160522461, "global_step": 162870, "epoch": 1346} {"train_loss": -38.94765853881836, "global_step": 162871, "epoch": 1346} {"train_loss": -33.9963493347168, "global_step": 162872, "epoch": 1346} {"train_loss": -38.891456604003906, "global_step": 162873, "epoch": 1346} {"train_loss": -39.38538360595703, "global_step": 162874, "epoch": 1346} {"train_loss": -39.93833923339844, "global_step": 162875, "epoch": 1346} {"train_loss": -39.545379638671875, "global_step": 162876, "epoch": 1346} {"train_loss": -32.304691314697266, "global_step": 162877, "epoch": 1346} {"train_loss": -38.35297775268555, "global_step": 162878, "epoch": 1346} {"train_loss": -38.9205436706543, "global_step": 162879, "epoch": 1346} {"train_loss": -40.50444412231445, "global_step": 162880, "epoch": 1346} {"train_loss": -37.91242599487305, "global_step": 162881, "epoch": 1346} {"train_loss": -40.46619415283203, "global_step": 162882, "epoch": 1346} {"train_loss": -30.701374053955078, "global_step": 162883, "epoch": 1346} {"train_loss": -39.861934661865234, "global_step": 162884, "epoch": 1346} {"train_loss": -37.35270690917969, "global_step": 162885, "epoch": 1346} {"train_loss": -38.79643630981445, "global_step": 162886, "epoch": 1346} {"train_loss": -37.37396240234375, "global_step": 162887, "epoch": 1346} {"train_loss": -39.00081253051758, "global_step": 162888, "epoch": 1346} {"train_loss": -35.45793151855469, "global_step": 162889, "epoch": 1346} {"train_loss": -39.366634368896484, "global_step": 162890, "epoch": 1346} {"train_loss": -37.07257843017578, "global_step": 162891, "epoch": 1346} {"train_loss": -35.10145950317383, "global_step": 162892, "epoch": 1346} {"train_loss": -37.59587478637695, "global_step": 162893, "epoch": 1346} {"train_loss": -38.90450668334961, "global_step": 162894, "epoch": 1346} {"train_loss": -35.93115997314453, "global_step": 162895, "epoch": 1346} {"train_loss": -38.14094161987305, "global_step": 162896, "epoch": 1346} {"train_loss": -38.81831741333008, "global_step": 162897, "epoch": 1346} {"train_loss": -36.34922409057617, "global_step": 162898, "epoch": 1346} {"train_loss": -38.14105987548828, "global_step": 162899, "epoch": 1346} {"train_loss": -38.070281982421875, "global_step": 162900, "epoch": 1346} {"train_loss": -38.54912185668945, "global_step": 162901, "epoch": 1346} {"train_loss": -38.89291763305664, "global_step": 162902, "epoch": 1346} {"train_loss": -39.07979202270508, "global_step": 162903, "epoch": 1346} {"train_loss": -39.51742935180664, "global_step": 162904, "epoch": 1346} {"train_loss": -37.64741134643555, "global_step": 162905, "epoch": 1346} {"train_loss": -39.25852584838867, "global_step": 162906, "epoch": 1346} {"train_loss": -39.775638580322266, "global_step": 162907, "epoch": 1346} {"train_loss": -37.59043502807617, "global_step": 162908, "epoch": 1346} {"train_loss": -39.640316009521484, "global_step": 162909, "epoch": 1346} {"train_loss": -38.378108978271484, "global_step": 162910, "epoch": 1346} {"train_loss": -40.08784103393555, "global_step": 162911, "epoch": 1346} {"train_loss": -38.516876220703125, "global_step": 162912, "epoch": 1346} {"train_loss": -39.09920883178711, "global_step": 162913, "epoch": 1346} {"train_loss": -39.35720443725586, "global_step": 162914, "epoch": 1346} {"train_loss": -40.1795539855957, "global_step": 162915, "epoch": 1346} {"train_loss": -39.998687744140625, "global_step": 162916, "epoch": 1346} {"train_loss": -40.11155700683594, "global_step": 162917, "epoch": 1346} {"train_loss": -40.039119720458984, "global_step": 162918, "epoch": 1346} {"train_loss": -39.406795501708984, "global_step": 162919, "epoch": 1346} {"train_loss": -40.7240104675293, "global_step": 162920, "epoch": 1346} {"train_loss": -39.707340240478516, "global_step": 162921, "epoch": 1346} {"train_loss": -39.74221420288086, "global_step": 162922, "epoch": 1346} {"train_loss": -40.38130569458008, "global_step": 162923, "epoch": 1346} {"train_loss": -40.171138763427734, "global_step": 162924, "epoch": 1346} {"train_loss": -39.38987350463867, "global_step": 162925, "epoch": 1346} {"train_loss": -40.519771575927734, "global_step": 162926, "epoch": 1346} {"train_loss": -40.021175384521484, "global_step": 162927, "epoch": 1346} {"train_loss": -40.79993438720703, "global_step": 162928, "epoch": 1346} {"train_loss": -40.36226272583008, "global_step": 162929, "epoch": 1346} {"train_loss": -40.52839279174805, "global_step": 162930, "epoch": 1346} {"train_loss": -40.46706008911133, "global_step": 162931, "epoch": 1346} {"train_loss": -40.239105224609375, "global_step": 162932, "epoch": 1346} {"train_loss": -40.929664611816406, "global_step": 162933, "epoch": 1346} {"train_loss": -40.04347229003906, "global_step": 162934, "epoch": 1346} {"train_loss": -40.85032272338867, "global_step": 162935, "epoch": 1346} {"train_loss": -41.26774978637695, "global_step": 162936, "epoch": 1346} {"train_loss": -41.34477996826172, "global_step": 162937, "epoch": 1346} {"train_loss": -40.98817443847656, "global_step": 162938, "epoch": 1346} {"train_loss": -40.998348236083984, "global_step": 162939, "epoch": 1346} {"train_loss": -40.72163009643555, "global_step": 162940, "epoch": 1346} {"train_loss": -40.88100051879883, "global_step": 162941, "epoch": 1346} {"train_loss": -40.750885009765625, "global_step": 162942, "epoch": 1346} {"train_loss": -41.144771575927734, "global_step": 162943, "epoch": 1346} {"train_loss": -41.60350036621094, "global_step": 162944, "epoch": 1346} {"train_loss": -41.3198127746582, "global_step": 162945, "epoch": 1346} {"train_loss": -39.98712921142578, "global_step": 162946, "epoch": 1346} {"train_loss": -41.34225082397461, "global_step": 162947, "epoch": 1346} {"train_loss": -40.84371566772461, "global_step": 162948, "epoch": 1346} {"train_loss": -41.534637451171875, "global_step": 162949, "epoch": 1346} {"train_loss": -41.520755767822266, "global_step": 162950, "epoch": 1346} {"train_loss": -41.0465202331543, "global_step": 162951, "epoch": 1346} {"train_loss": -41.10459518432617, "global_step": 162952, "epoch": 1346} {"train_loss": -41.5906867980957, "global_step": 162953, "epoch": 1346} {"train_loss": -41.433834075927734, "global_step": 162954, "epoch": 1346} {"train_loss": -40.713661193847656, "global_step": 162955, "epoch": 1346} {"train_loss": -40.44919967651367, "global_step": 162956, "epoch": 1346} {"train_loss": -39.88824462890625, "global_step": 162957, "epoch": 1346} {"train_loss": -40.091209411621094, "global_step": 162958, "epoch": 1346} {"train_loss": -40.364654541015625, "global_step": 162959, "epoch": 1346} {"train_loss": -40.20720291137695, "global_step": 162960, "epoch": 1346} {"train_loss": -38.89577865600586, "global_step": 162961, "epoch": 1346} {"train_loss": -40.261138916015625, "global_step": 162962, "epoch": 1346} {"train_loss": -41.11689376831055, "global_step": 162963, "epoch": 1346} {"train_loss": -41.69733428955078, "global_step": 162964, "epoch": 1346} {"train_loss": -41.20799255371094, "global_step": 162965, "epoch": 1346} {"train_loss": -40.59208297729492, "global_step": 162966, "epoch": 1346} {"train_loss": -40.524593353271484, "global_step": 162967, "epoch": 1346} {"train_loss": -40.8715934753418, "global_step": 162968, "epoch": 1346} {"train_loss": -40.78437042236328, "global_step": 162969, "epoch": 1346} {"train_loss": -40.67673873901367, "global_step": 162970, "epoch": 1346} {"train_loss": -41.00483322143555, "global_step": 162971, "epoch": 1346} {"train_loss": -41.860652923583984, "global_step": 162972, "epoch": 1346} {"train_loss": -40.7738037109375, "global_step": 162973, "epoch": 1346} {"train_loss": -40.75828552246094, "global_step": 162974, "epoch": 1346} {"train_loss": -41.166194915771484, "global_step": 162975, "epoch": 1346} {"train_loss": -42.15177536010742, "global_step": 162976, "epoch": 1346} {"train_loss": -41.052303314208984, "global_step": 162977, "epoch": 1346} {"train_loss": -40.71538162231445, "global_step": 162978, "epoch": 1346} {"train_loss": -39.94706726074219, "global_step": 162979, "epoch": 1346} {"train_loss": -39.65046310424805, "global_step": 162980, "epoch": 1346} {"train_loss": -40.82882308959961, "global_step": 162981, "epoch": 1346} {"train_loss": -41.486968994140625, "global_step": 162982, "epoch": 1346} {"train_loss": -40.179344177246094, "global_step": 162983, "epoch": 1346} {"train_loss": -40.38633346557617, "global_step": 162984, "epoch": 1346} {"train_loss": -39.426265716552734, "global_step": 162985, "epoch": 1346} {"train_loss": -39.697981337870445, "global_step": 162986, "epoch": 1346, "val_loss": 2557150.75} {"train_loss": -39.80079650878906, "global_step": 162987, "epoch": 1347} {"train_loss": -39.14265823364258, "global_step": 162988, "epoch": 1347} {"train_loss": -41.25794219970703, "global_step": 162989, "epoch": 1347} {"train_loss": -39.5466423034668, "global_step": 162990, "epoch": 1347} {"train_loss": -37.64282989501953, "global_step": 162991, "epoch": 1347} {"train_loss": -38.47218704223633, "global_step": 162992, "epoch": 1347} {"train_loss": -39.65071487426758, "global_step": 162993, "epoch": 1347} {"train_loss": -39.030784606933594, "global_step": 162994, "epoch": 1347} {"train_loss": -38.56581497192383, "global_step": 162995, "epoch": 1347} {"train_loss": -38.33635330200195, "global_step": 162996, "epoch": 1347} {"train_loss": -38.08175277709961, "global_step": 162997, "epoch": 1347} {"train_loss": -40.56734848022461, "global_step": 162998, "epoch": 1347} {"train_loss": -39.989845275878906, "global_step": 162999, "epoch": 1347} {"train_loss": -39.134124755859375, "global_step": 163000, "epoch": 1347} {"train_loss": -39.71904373168945, "global_step": 163001, "epoch": 1347} {"train_loss": -38.870094299316406, "global_step": 163002, "epoch": 1347} {"train_loss": -40.62778091430664, "global_step": 163003, "epoch": 1347} {"train_loss": -39.85157012939453, "global_step": 163004, "epoch": 1347} {"train_loss": -38.636024475097656, "global_step": 163005, "epoch": 1347} {"train_loss": -39.78081130981445, "global_step": 163006, "epoch": 1347} {"train_loss": -39.91236114501953, "global_step": 163007, "epoch": 1347} {"train_loss": -39.67378616333008, "global_step": 163008, "epoch": 1347} {"train_loss": -38.727821350097656, "global_step": 163009, "epoch": 1347} {"train_loss": -39.78532409667969, "global_step": 163010, "epoch": 1347} {"train_loss": -40.73299789428711, "global_step": 163011, "epoch": 1347} {"train_loss": -39.68695831298828, "global_step": 163012, "epoch": 1347} {"train_loss": -38.990447998046875, "global_step": 163013, "epoch": 1347} {"train_loss": -39.39168167114258, "global_step": 163014, "epoch": 1347} {"train_loss": -39.709449768066406, "global_step": 163015, "epoch": 1347} {"train_loss": -40.58827590942383, "global_step": 163016, "epoch": 1347} {"train_loss": -38.94327926635742, "global_step": 163017, "epoch": 1347} {"train_loss": -38.7443962097168, "global_step": 163018, "epoch": 1347} {"train_loss": -41.07621383666992, "global_step": 163019, "epoch": 1347} {"train_loss": -40.489593505859375, "global_step": 163020, "epoch": 1347} {"train_loss": -39.913856506347656, "global_step": 163021, "epoch": 1347} {"train_loss": -41.2177734375, "global_step": 163022, "epoch": 1347} {"train_loss": -40.897247314453125, "global_step": 163023, "epoch": 1347} {"train_loss": -40.62101364135742, "global_step": 163024, "epoch": 1347} {"train_loss": -40.95988082885742, "global_step": 163025, "epoch": 1347} {"train_loss": -40.35626220703125, "global_step": 163026, "epoch": 1347} {"train_loss": -40.307254791259766, "global_step": 163027, "epoch": 1347} {"train_loss": -41.36408615112305, "global_step": 163028, "epoch": 1347} {"train_loss": -40.54493713378906, "global_step": 163029, "epoch": 1347} {"train_loss": -40.90287399291992, "global_step": 163030, "epoch": 1347} {"train_loss": -41.54694366455078, "global_step": 163031, "epoch": 1347} {"train_loss": -39.57985305786133, "global_step": 163032, "epoch": 1347} {"train_loss": -40.53817367553711, "global_step": 163033, "epoch": 1347} {"train_loss": -41.509403228759766, "global_step": 163034, "epoch": 1347} {"train_loss": -40.90819549560547, "global_step": 163035, "epoch": 1347} {"train_loss": -41.25263214111328, "global_step": 163036, "epoch": 1347} {"train_loss": -41.307926177978516, "global_step": 163037, "epoch": 1347} {"train_loss": -41.357078552246094, "global_step": 163038, "epoch": 1347} {"train_loss": -41.49088668823242, "global_step": 163039, "epoch": 1347} {"train_loss": -41.14894485473633, "global_step": 163040, "epoch": 1347} {"train_loss": -41.26838684082031, "global_step": 163041, "epoch": 1347} {"train_loss": -41.17987060546875, "global_step": 163042, "epoch": 1347} {"train_loss": -40.79048538208008, "global_step": 163043, "epoch": 1347} {"train_loss": -41.30959701538086, "global_step": 163044, "epoch": 1347} {"train_loss": -41.14152526855469, "global_step": 163045, "epoch": 1347} {"train_loss": -41.51517868041992, "global_step": 163046, "epoch": 1347} {"train_loss": -41.09561538696289, "global_step": 163047, "epoch": 1347} {"train_loss": -40.873294830322266, "global_step": 163048, "epoch": 1347} {"train_loss": -41.260353088378906, "global_step": 163049, "epoch": 1347} {"train_loss": -40.57148361206055, "global_step": 163050, "epoch": 1347} {"train_loss": -40.44804763793945, "global_step": 163051, "epoch": 1347} {"train_loss": -41.670692443847656, "global_step": 163052, "epoch": 1347} {"train_loss": -40.434146881103516, "global_step": 163053, "epoch": 1347} {"train_loss": -41.405086517333984, "global_step": 163054, "epoch": 1347} {"train_loss": -41.08095932006836, "global_step": 163055, "epoch": 1347} {"train_loss": -41.677703857421875, "global_step": 163056, "epoch": 1347} {"train_loss": -41.5594482421875, "global_step": 163057, "epoch": 1347} {"train_loss": -41.155982971191406, "global_step": 163058, "epoch": 1347} {"train_loss": -41.19978713989258, "global_step": 163059, "epoch": 1347} {"train_loss": -40.935218811035156, "global_step": 163060, "epoch": 1347} {"train_loss": -41.608863830566406, "global_step": 163061, "epoch": 1347} {"train_loss": -40.931636810302734, "global_step": 163062, "epoch": 1347} {"train_loss": -41.49951171875, "global_step": 163063, "epoch": 1347} {"train_loss": -41.645782470703125, "global_step": 163064, "epoch": 1347} {"train_loss": -41.42348861694336, "global_step": 163065, "epoch": 1347} {"train_loss": -41.321990966796875, "global_step": 163066, "epoch": 1347} {"train_loss": -41.24579620361328, "global_step": 163067, "epoch": 1347} {"train_loss": -41.642723083496094, "global_step": 163068, "epoch": 1347} {"train_loss": -40.91700744628906, "global_step": 163069, "epoch": 1347} {"train_loss": -41.127471923828125, "global_step": 163070, "epoch": 1347} {"train_loss": -41.65205764770508, "global_step": 163071, "epoch": 1347} {"train_loss": -41.41107940673828, "global_step": 163072, "epoch": 1347} {"train_loss": -40.4991569519043, "global_step": 163073, "epoch": 1347} {"train_loss": -39.06283187866211, "global_step": 163074, "epoch": 1347} {"train_loss": -40.91826248168945, "global_step": 163075, "epoch": 1347} {"train_loss": -40.7423210144043, "global_step": 163076, "epoch": 1347} {"train_loss": -39.824676513671875, "global_step": 163077, "epoch": 1347} {"train_loss": -39.49765396118164, "global_step": 163078, "epoch": 1347} {"train_loss": -40.45029830932617, "global_step": 163079, "epoch": 1347} {"train_loss": -39.85081100463867, "global_step": 163080, "epoch": 1347} {"train_loss": -39.99033737182617, "global_step": 163081, "epoch": 1347} {"train_loss": -41.39201354980469, "global_step": 163082, "epoch": 1347} {"train_loss": -39.59048080444336, "global_step": 163083, "epoch": 1347} {"train_loss": -38.7379264831543, "global_step": 163084, "epoch": 1347} {"train_loss": -41.538265228271484, "global_step": 163085, "epoch": 1347} {"train_loss": -39.554298400878906, "global_step": 163086, "epoch": 1347} {"train_loss": -38.78117752075195, "global_step": 163087, "epoch": 1347} {"train_loss": -41.0539436340332, "global_step": 163088, "epoch": 1347} {"train_loss": -40.680477142333984, "global_step": 163089, "epoch": 1347} {"train_loss": -41.12727355957031, "global_step": 163090, "epoch": 1347} {"train_loss": -40.69274139404297, "global_step": 163091, "epoch": 1347} {"train_loss": -40.980865478515625, "global_step": 163092, "epoch": 1347} {"train_loss": -40.37514114379883, "global_step": 163093, "epoch": 1347} {"train_loss": -41.05925369262695, "global_step": 163094, "epoch": 1347} {"train_loss": -41.06473922729492, "global_step": 163095, "epoch": 1347} {"train_loss": -40.816253662109375, "global_step": 163096, "epoch": 1347} {"train_loss": -40.096187591552734, "global_step": 163097, "epoch": 1347} {"train_loss": -40.57763671875, "global_step": 163098, "epoch": 1347} {"train_loss": -41.357810974121094, "global_step": 163099, "epoch": 1347} {"train_loss": -40.864051818847656, "global_step": 163100, "epoch": 1347} {"train_loss": -41.038604736328125, "global_step": 163101, "epoch": 1347} {"train_loss": -40.85279846191406, "global_step": 163102, "epoch": 1347} {"train_loss": -40.15241241455078, "global_step": 163103, "epoch": 1347} {"train_loss": -41.0467414855957, "global_step": 163104, "epoch": 1347} {"train_loss": -40.9422721862793, "global_step": 163105, "epoch": 1347} {"train_loss": -41.10274124145508, "global_step": 163106, "epoch": 1347} {"train_loss": -40.466102221780574, "global_step": 163107, "epoch": 1347, "val_loss": 2475226.25} {"train_loss": -41.08895492553711, "global_step": 163108, "epoch": 1348} {"train_loss": -41.209407806396484, "global_step": 163109, "epoch": 1348} {"train_loss": -40.83911895751953, "global_step": 163110, "epoch": 1348} {"train_loss": -41.10165023803711, "global_step": 163111, "epoch": 1348} {"train_loss": -40.86648178100586, "global_step": 163112, "epoch": 1348} {"train_loss": -40.86986541748047, "global_step": 163113, "epoch": 1348} {"train_loss": -41.50210189819336, "global_step": 163114, "epoch": 1348} {"train_loss": -41.120948791503906, "global_step": 163115, "epoch": 1348} {"train_loss": -41.76060485839844, "global_step": 163116, "epoch": 1348} {"train_loss": -41.90451431274414, "global_step": 163117, "epoch": 1348} {"train_loss": -41.85840606689453, "global_step": 163118, "epoch": 1348} {"train_loss": -40.767642974853516, "global_step": 163119, "epoch": 1348} {"train_loss": -41.18464279174805, "global_step": 163120, "epoch": 1348} {"train_loss": -41.58565902709961, "global_step": 163121, "epoch": 1348} {"train_loss": -41.6315803527832, "global_step": 163122, "epoch": 1348} {"train_loss": -41.46995162963867, "global_step": 163123, "epoch": 1348} {"train_loss": -40.74876403808594, "global_step": 163124, "epoch": 1348} {"train_loss": -41.6892204284668, "global_step": 163125, "epoch": 1348} {"train_loss": -41.77822494506836, "global_step": 163126, "epoch": 1348} {"train_loss": -40.1585578918457, "global_step": 163127, "epoch": 1348} {"train_loss": -40.9134635925293, "global_step": 163128, "epoch": 1348} {"train_loss": -42.000816345214844, "global_step": 163129, "epoch": 1348} {"train_loss": -41.46208190917969, "global_step": 163130, "epoch": 1348} {"train_loss": -41.78376770019531, "global_step": 163131, "epoch": 1348} {"train_loss": -41.86493682861328, "global_step": 163132, "epoch": 1348} {"train_loss": -41.614959716796875, "global_step": 163133, "epoch": 1348} {"train_loss": -41.13618087768555, "global_step": 163134, "epoch": 1348} {"train_loss": -41.21103286743164, "global_step": 163135, "epoch": 1348} {"train_loss": -41.91933822631836, "global_step": 163136, "epoch": 1348} {"train_loss": -40.74964141845703, "global_step": 163137, "epoch": 1348} {"train_loss": -40.90908432006836, "global_step": 163138, "epoch": 1348} {"train_loss": -41.77081298828125, "global_step": 163139, "epoch": 1348} {"train_loss": -40.69715118408203, "global_step": 163140, "epoch": 1348} {"train_loss": -40.06616973876953, "global_step": 163141, "epoch": 1348} {"train_loss": -39.178619384765625, "global_step": 163142, "epoch": 1348} {"train_loss": -40.59720230102539, "global_step": 163143, "epoch": 1348} {"train_loss": -42.189002990722656, "global_step": 163144, "epoch": 1348} {"train_loss": -41.4039421081543, "global_step": 163145, "epoch": 1348} {"train_loss": -41.56238555908203, "global_step": 163146, "epoch": 1348} {"train_loss": -40.99397659301758, "global_step": 163147, "epoch": 1348} {"train_loss": -40.56145095825195, "global_step": 163148, "epoch": 1348} {"train_loss": -40.199893951416016, "global_step": 163149, "epoch": 1348} {"train_loss": -40.904563903808594, "global_step": 163150, "epoch": 1348} {"train_loss": -41.12383270263672, "global_step": 163151, "epoch": 1348} {"train_loss": -40.41600036621094, "global_step": 163152, "epoch": 1348} {"train_loss": -40.90291213989258, "global_step": 163153, "epoch": 1348} {"train_loss": -41.54971694946289, "global_step": 163154, "epoch": 1348} {"train_loss": -41.28559112548828, "global_step": 163155, "epoch": 1348} {"train_loss": -41.08116149902344, "global_step": 163156, "epoch": 1348} {"train_loss": -40.74443435668945, "global_step": 163157, "epoch": 1348} {"train_loss": -41.55597686767578, "global_step": 163158, "epoch": 1348} {"train_loss": -40.82571029663086, "global_step": 163159, "epoch": 1348} {"train_loss": -40.376991271972656, "global_step": 163160, "epoch": 1348} {"train_loss": -41.53593444824219, "global_step": 163161, "epoch": 1348} {"train_loss": -41.55524826049805, "global_step": 163162, "epoch": 1348} {"train_loss": -40.74467849731445, "global_step": 163163, "epoch": 1348} {"train_loss": -40.95124435424805, "global_step": 163164, "epoch": 1348} {"train_loss": -41.77585983276367, "global_step": 163165, "epoch": 1348} {"train_loss": -41.6357421875, "global_step": 163166, "epoch": 1348} {"train_loss": -41.55662155151367, "global_step": 163167, "epoch": 1348} {"train_loss": -40.990447998046875, "global_step": 163168, "epoch": 1348} {"train_loss": -41.03731155395508, "global_step": 163169, "epoch": 1348} {"train_loss": -41.63922882080078, "global_step": 163170, "epoch": 1348} {"train_loss": -41.3978157043457, "global_step": 163171, "epoch": 1348} {"train_loss": -40.24970626831055, "global_step": 163172, "epoch": 1348} {"train_loss": -37.337242126464844, "global_step": 163173, "epoch": 1348} {"train_loss": -39.187255859375, "global_step": 163174, "epoch": 1348} {"train_loss": -41.61091232299805, "global_step": 163175, "epoch": 1348} {"train_loss": -41.6187744140625, "global_step": 163176, "epoch": 1348} {"train_loss": -40.72994613647461, "global_step": 163177, "epoch": 1348} {"train_loss": -40.882293701171875, "global_step": 163178, "epoch": 1348} {"train_loss": -41.12299728393555, "global_step": 163179, "epoch": 1348} {"train_loss": -39.30004119873047, "global_step": 163180, "epoch": 1348} {"train_loss": -38.92615509033203, "global_step": 163181, "epoch": 1348} {"train_loss": -41.4125862121582, "global_step": 163182, "epoch": 1348} {"train_loss": -39.625057220458984, "global_step": 163183, "epoch": 1348} {"train_loss": -39.086830139160156, "global_step": 163184, "epoch": 1348} {"train_loss": -41.48039245605469, "global_step": 163185, "epoch": 1348} {"train_loss": -38.197200775146484, "global_step": 163186, "epoch": 1348} {"train_loss": -38.06294631958008, "global_step": 163187, "epoch": 1348} {"train_loss": -41.41408920288086, "global_step": 163188, "epoch": 1348} {"train_loss": -37.59733581542969, "global_step": 163189, "epoch": 1348} {"train_loss": -39.07088851928711, "global_step": 163190, "epoch": 1348} {"train_loss": -40.41761779785156, "global_step": 163191, "epoch": 1348} {"train_loss": -38.8249397277832, "global_step": 163192, "epoch": 1348} {"train_loss": -40.538455963134766, "global_step": 163193, "epoch": 1348} {"train_loss": -38.754390716552734, "global_step": 163194, "epoch": 1348} {"train_loss": -40.8503532409668, "global_step": 163195, "epoch": 1348} {"train_loss": -39.2655143737793, "global_step": 163196, "epoch": 1348} {"train_loss": -39.098140716552734, "global_step": 163197, "epoch": 1348} {"train_loss": -39.041656494140625, "global_step": 163198, "epoch": 1348} {"train_loss": -38.54825973510742, "global_step": 163199, "epoch": 1348} {"train_loss": -40.485137939453125, "global_step": 163200, "epoch": 1348} {"train_loss": -40.02492904663086, "global_step": 163201, "epoch": 1348} {"train_loss": -39.398956298828125, "global_step": 163202, "epoch": 1348} {"train_loss": -37.9986457824707, "global_step": 163203, "epoch": 1348} {"train_loss": -36.24897766113281, "global_step": 163204, "epoch": 1348} {"train_loss": -38.61322021484375, "global_step": 163205, "epoch": 1348} {"train_loss": -40.39509201049805, "global_step": 163206, "epoch": 1348} {"train_loss": -39.417396545410156, "global_step": 163207, "epoch": 1348} {"train_loss": -38.61481475830078, "global_step": 163208, "epoch": 1348} {"train_loss": -40.903533935546875, "global_step": 163209, "epoch": 1348} {"train_loss": -39.61707305908203, "global_step": 163210, "epoch": 1348} {"train_loss": -41.20753479003906, "global_step": 163211, "epoch": 1348} {"train_loss": -40.76988983154297, "global_step": 163212, "epoch": 1348} {"train_loss": -41.1611328125, "global_step": 163213, "epoch": 1348} {"train_loss": -40.69443893432617, "global_step": 163214, "epoch": 1348} {"train_loss": -41.43384552001953, "global_step": 163215, "epoch": 1348} {"train_loss": -40.90176010131836, "global_step": 163216, "epoch": 1348} {"train_loss": -40.84456253051758, "global_step": 163217, "epoch": 1348} {"train_loss": -41.161346435546875, "global_step": 163218, "epoch": 1348} {"train_loss": -40.8305778503418, "global_step": 163219, "epoch": 1348} {"train_loss": -40.956233978271484, "global_step": 163220, "epoch": 1348} {"train_loss": -41.59182357788086, "global_step": 163221, "epoch": 1348} {"train_loss": -40.777652740478516, "global_step": 163222, "epoch": 1348} {"train_loss": -41.373931884765625, "global_step": 163223, "epoch": 1348} {"train_loss": -41.31536865234375, "global_step": 163224, "epoch": 1348} {"train_loss": -41.3249397277832, "global_step": 163225, "epoch": 1348} {"train_loss": -40.520076751708984, "global_step": 163226, "epoch": 1348} {"train_loss": -41.62541580200195, "global_step": 163227, "epoch": 1348} {"train_loss": -40.651743991315854, "global_step": 163228, "epoch": 1348, "val_loss": 2514383.25} {"train_loss": -40.98281478881836, "global_step": 163229, "epoch": 1349} {"train_loss": -41.647254943847656, "global_step": 163230, "epoch": 1349} {"train_loss": -40.618648529052734, "global_step": 163231, "epoch": 1349} {"train_loss": -40.96510314941406, "global_step": 163232, "epoch": 1349} {"train_loss": -41.68319320678711, "global_step": 163233, "epoch": 1349} {"train_loss": -41.26748275756836, "global_step": 163234, "epoch": 1349} {"train_loss": -40.49801254272461, "global_step": 163235, "epoch": 1349} {"train_loss": -40.76081466674805, "global_step": 163236, "epoch": 1349} {"train_loss": -41.67707061767578, "global_step": 163237, "epoch": 1349} {"train_loss": -41.5874137878418, "global_step": 163238, "epoch": 1349} {"train_loss": -41.51444625854492, "global_step": 163239, "epoch": 1349} {"train_loss": -41.598968505859375, "global_step": 163240, "epoch": 1349} {"train_loss": -41.33432388305664, "global_step": 163241, "epoch": 1349} {"train_loss": -41.03815460205078, "global_step": 163242, "epoch": 1349} {"train_loss": -41.539390563964844, "global_step": 163243, "epoch": 1349} {"train_loss": -41.51998519897461, "global_step": 163244, "epoch": 1349} {"train_loss": -41.225032806396484, "global_step": 163245, "epoch": 1349} {"train_loss": -41.11517333984375, "global_step": 163246, "epoch": 1349} {"train_loss": -40.707427978515625, "global_step": 163247, "epoch": 1349} {"train_loss": -40.780757904052734, "global_step": 163248, "epoch": 1349} {"train_loss": -41.43212890625, "global_step": 163249, "epoch": 1349} {"train_loss": -40.6233024597168, "global_step": 163250, "epoch": 1349} {"train_loss": -40.94172286987305, "global_step": 163251, "epoch": 1349} {"train_loss": -41.54399108886719, "global_step": 163252, "epoch": 1349} {"train_loss": -41.38295364379883, "global_step": 163253, "epoch": 1349} {"train_loss": -41.452693939208984, "global_step": 163254, "epoch": 1349} {"train_loss": -41.90102767944336, "global_step": 163255, "epoch": 1349} {"train_loss": -41.90263748168945, "global_step": 163256, "epoch": 1349} {"train_loss": -41.5269775390625, "global_step": 163257, "epoch": 1349} {"train_loss": -41.077972412109375, "global_step": 163258, "epoch": 1349} {"train_loss": -41.108558654785156, "global_step": 163259, "epoch": 1349} {"train_loss": -41.38644027709961, "global_step": 163260, "epoch": 1349} {"train_loss": -41.82999801635742, "global_step": 163261, "epoch": 1349} {"train_loss": -40.89219284057617, "global_step": 163262, "epoch": 1349} {"train_loss": -41.704769134521484, "global_step": 163263, "epoch": 1349} {"train_loss": -41.45439529418945, "global_step": 163264, "epoch": 1349} {"train_loss": -41.19782638549805, "global_step": 163265, "epoch": 1349} {"train_loss": -40.89801025390625, "global_step": 163266, "epoch": 1349} {"train_loss": -41.789581298828125, "global_step": 163267, "epoch": 1349} {"train_loss": -41.83643341064453, "global_step": 163268, "epoch": 1349} {"train_loss": -41.454200744628906, "global_step": 163269, "epoch": 1349} {"train_loss": -41.15653610229492, "global_step": 163270, "epoch": 1349} {"train_loss": -41.21463394165039, "global_step": 163271, "epoch": 1349} {"train_loss": -42.058773040771484, "global_step": 163272, "epoch": 1349} {"train_loss": -41.077938079833984, "global_step": 163273, "epoch": 1349} {"train_loss": -41.662315368652344, "global_step": 163274, "epoch": 1349} {"train_loss": -41.499874114990234, "global_step": 163275, "epoch": 1349} {"train_loss": -42.038551330566406, "global_step": 163276, "epoch": 1349} {"train_loss": -40.50307846069336, "global_step": 163277, "epoch": 1349} {"train_loss": -38.22698974609375, "global_step": 163278, "epoch": 1349} {"train_loss": -39.0616340637207, "global_step": 163279, "epoch": 1349} {"train_loss": -41.91775894165039, "global_step": 163280, "epoch": 1349} {"train_loss": -39.26734161376953, "global_step": 163281, "epoch": 1349} {"train_loss": -39.90078353881836, "global_step": 163282, "epoch": 1349} {"train_loss": -39.552982330322266, "global_step": 163283, "epoch": 1349} {"train_loss": -39.55278396606445, "global_step": 163284, "epoch": 1349} {"train_loss": -39.799232482910156, "global_step": 163285, "epoch": 1349} {"train_loss": -41.28337478637695, "global_step": 163286, "epoch": 1349} {"train_loss": -41.30257797241211, "global_step": 163287, "epoch": 1349} {"train_loss": -40.090999603271484, "global_step": 163288, "epoch": 1349} {"train_loss": -40.68639373779297, "global_step": 163289, "epoch": 1349} {"train_loss": -41.27186965942383, "global_step": 163290, "epoch": 1349} {"train_loss": -40.731746673583984, "global_step": 163291, "epoch": 1349} {"train_loss": -40.59797668457031, "global_step": 163292, "epoch": 1349} {"train_loss": -41.121673583984375, "global_step": 163293, "epoch": 1349} {"train_loss": -40.08610534667969, "global_step": 163294, "epoch": 1349} {"train_loss": -40.967628479003906, "global_step": 163295, "epoch": 1349} {"train_loss": -40.97182846069336, "global_step": 163296, "epoch": 1349} {"train_loss": -40.316505432128906, "global_step": 163297, "epoch": 1349} {"train_loss": -41.027008056640625, "global_step": 163298, "epoch": 1349} {"train_loss": -40.885189056396484, "global_step": 163299, "epoch": 1349} {"train_loss": -40.04773712158203, "global_step": 163300, "epoch": 1349} {"train_loss": -41.28399658203125, "global_step": 163301, "epoch": 1349} {"train_loss": -39.659332275390625, "global_step": 163302, "epoch": 1349} {"train_loss": -40.056312561035156, "global_step": 163303, "epoch": 1349} {"train_loss": -40.737728118896484, "global_step": 163304, "epoch": 1349} {"train_loss": -38.98065948486328, "global_step": 163305, "epoch": 1349} {"train_loss": -41.2384147644043, "global_step": 163306, "epoch": 1349} {"train_loss": -38.314056396484375, "global_step": 163307, "epoch": 1349} {"train_loss": -39.77972412109375, "global_step": 163308, "epoch": 1349} {"train_loss": -39.89024353027344, "global_step": 163309, "epoch": 1349} {"train_loss": -39.03096389770508, "global_step": 163310, "epoch": 1349} {"train_loss": -41.02309799194336, "global_step": 163311, "epoch": 1349} {"train_loss": -39.66279602050781, "global_step": 163312, "epoch": 1349} {"train_loss": -41.32670211791992, "global_step": 163313, "epoch": 1349} {"train_loss": -39.31903076171875, "global_step": 163314, "epoch": 1349} {"train_loss": -41.267005920410156, "global_step": 163315, "epoch": 1349} {"train_loss": -40.624813079833984, "global_step": 163316, "epoch": 1349} {"train_loss": -39.57285690307617, "global_step": 163317, "epoch": 1349} {"train_loss": -40.59010314941406, "global_step": 163318, "epoch": 1349} {"train_loss": -40.90610885620117, "global_step": 163319, "epoch": 1349} {"train_loss": -40.55130386352539, "global_step": 163320, "epoch": 1349} {"train_loss": -40.738033294677734, "global_step": 163321, "epoch": 1349} {"train_loss": -41.178741455078125, "global_step": 163322, "epoch": 1349} {"train_loss": -41.18136215209961, "global_step": 163323, "epoch": 1349} {"train_loss": -40.8804817199707, "global_step": 163324, "epoch": 1349} {"train_loss": -40.03606033325195, "global_step": 163325, "epoch": 1349} {"train_loss": -40.79096603393555, "global_step": 163326, "epoch": 1349} {"train_loss": -41.49578857421875, "global_step": 163327, "epoch": 1349} {"train_loss": -40.40780258178711, "global_step": 163328, "epoch": 1349} {"train_loss": -39.71731185913086, "global_step": 163329, "epoch": 1349} {"train_loss": -39.179683685302734, "global_step": 163330, "epoch": 1349} {"train_loss": -39.46615219116211, "global_step": 163331, "epoch": 1349} {"train_loss": -40.7936897277832, "global_step": 163332, "epoch": 1349} {"train_loss": -40.9068603515625, "global_step": 163333, "epoch": 1349} {"train_loss": -39.95730209350586, "global_step": 163334, "epoch": 1349} {"train_loss": -39.153411865234375, "global_step": 163335, "epoch": 1349} {"train_loss": -40.54046630859375, "global_step": 163336, "epoch": 1349} {"train_loss": -40.1218147277832, "global_step": 163337, "epoch": 1349} {"train_loss": -40.032588958740234, "global_step": 163338, "epoch": 1349} {"train_loss": -38.61726760864258, "global_step": 163339, "epoch": 1349} {"train_loss": -40.97223663330078, "global_step": 163340, "epoch": 1349} {"train_loss": -40.31060791015625, "global_step": 163341, "epoch": 1349} {"train_loss": -40.67353820800781, "global_step": 163342, "epoch": 1349} {"train_loss": -41.06713104248047, "global_step": 163343, "epoch": 1349} {"train_loss": -40.28243637084961, "global_step": 163344, "epoch": 1349} {"train_loss": -39.70626449584961, "global_step": 163345, "epoch": 1349} {"train_loss": -41.2432746887207, "global_step": 163346, "epoch": 1349} {"train_loss": -40.39216232299805, "global_step": 163347, "epoch": 1349} {"train_loss": -40.382137298583984, "global_step": 163348, "epoch": 1349} {"train_loss": -40.714859292526874, "global_step": 163349, "epoch": 1349, "val_loss": 2530137.75} {"train_loss": -40.369102478027344, "global_step": 163350, "epoch": 1350} {"train_loss": -39.79767990112305, "global_step": 163351, "epoch": 1350} {"train_loss": -40.557373046875, "global_step": 163352, "epoch": 1350} {"train_loss": -40.385807037353516, "global_step": 163353, "epoch": 1350} {"train_loss": -41.04920196533203, "global_step": 163354, "epoch": 1350} {"train_loss": -40.625179290771484, "global_step": 163355, "epoch": 1350} {"train_loss": -41.19830322265625, "global_step": 163356, "epoch": 1350} {"train_loss": -41.26893997192383, "global_step": 163357, "epoch": 1350} {"train_loss": -39.695194244384766, "global_step": 163358, "epoch": 1350} {"train_loss": -40.557350158691406, "global_step": 163359, "epoch": 1350} {"train_loss": -39.87177658081055, "global_step": 163360, "epoch": 1350} {"train_loss": -40.59462356567383, "global_step": 163361, "epoch": 1350} {"train_loss": -41.035762786865234, "global_step": 163362, "epoch": 1350} {"train_loss": -39.80028533935547, "global_step": 163363, "epoch": 1350} {"train_loss": -39.606788635253906, "global_step": 163364, "epoch": 1350} {"train_loss": -39.032779693603516, "global_step": 163365, "epoch": 1350} {"train_loss": -39.8111457824707, "global_step": 163366, "epoch": 1350} {"train_loss": -40.3414306640625, "global_step": 163367, "epoch": 1350} {"train_loss": -39.90058135986328, "global_step": 163368, "epoch": 1350} {"train_loss": -40.58466339111328, "global_step": 163369, "epoch": 1350} {"train_loss": -41.250850677490234, "global_step": 163370, "epoch": 1350} {"train_loss": -40.185585021972656, "global_step": 163371, "epoch": 1350} {"train_loss": -40.1630744934082, "global_step": 163372, "epoch": 1350} {"train_loss": -39.88924789428711, "global_step": 163373, "epoch": 1350} {"train_loss": -41.47010040283203, "global_step": 163374, "epoch": 1350} {"train_loss": -39.89634323120117, "global_step": 163375, "epoch": 1350} {"train_loss": -39.91158676147461, "global_step": 163376, "epoch": 1350} {"train_loss": -41.15443801879883, "global_step": 163377, "epoch": 1350} {"train_loss": -40.985809326171875, "global_step": 163378, "epoch": 1350} {"train_loss": -41.2978401184082, "global_step": 163379, "epoch": 1350} {"train_loss": -41.49222183227539, "global_step": 163380, "epoch": 1350} {"train_loss": -41.35126495361328, "global_step": 163381, "epoch": 1350} {"train_loss": -41.60530471801758, "global_step": 163382, "epoch": 1350} {"train_loss": -41.58935546875, "global_step": 163383, "epoch": 1350} {"train_loss": -41.02930450439453, "global_step": 163384, "epoch": 1350} {"train_loss": -41.83740234375, "global_step": 163385, "epoch": 1350} {"train_loss": -40.93386459350586, "global_step": 163386, "epoch": 1350} {"train_loss": -41.65951156616211, "global_step": 163387, "epoch": 1350} {"train_loss": -41.46012496948242, "global_step": 163388, "epoch": 1350} {"train_loss": -41.04502487182617, "global_step": 163389, "epoch": 1350} {"train_loss": -40.82473373413086, "global_step": 163390, "epoch": 1350} {"train_loss": -40.986183166503906, "global_step": 163391, "epoch": 1350} {"train_loss": -41.273189544677734, "global_step": 163392, "epoch": 1350} {"train_loss": -40.66072463989258, "global_step": 163393, "epoch": 1350} {"train_loss": -41.5560417175293, "global_step": 163394, "epoch": 1350} {"train_loss": -41.25442123413086, "global_step": 163395, "epoch": 1350} {"train_loss": -41.9604377746582, "global_step": 163396, "epoch": 1350} {"train_loss": -40.374114990234375, "global_step": 163397, "epoch": 1350} {"train_loss": -41.89542770385742, "global_step": 163398, "epoch": 1350} {"train_loss": -40.876155853271484, "global_step": 163399, "epoch": 1350} {"train_loss": -41.564674377441406, "global_step": 163400, "epoch": 1350} {"train_loss": -41.55646514892578, "global_step": 163401, "epoch": 1350} {"train_loss": -41.330257415771484, "global_step": 163402, "epoch": 1350} {"train_loss": -41.07194519042969, "global_step": 163403, "epoch": 1350} {"train_loss": -41.276737213134766, "global_step": 163404, "epoch": 1350} {"train_loss": -41.88578414916992, "global_step": 163405, "epoch": 1350} {"train_loss": -41.81890869140625, "global_step": 163406, "epoch": 1350} {"train_loss": -42.309932708740234, "global_step": 163407, "epoch": 1350} {"train_loss": -41.53859329223633, "global_step": 163408, "epoch": 1350} {"train_loss": -41.6048583984375, "global_step": 163409, "epoch": 1350} {"train_loss": -39.46781921386719, "global_step": 163410, "epoch": 1350} {"train_loss": -41.82740020751953, "global_step": 163411, "epoch": 1350} {"train_loss": -40.969051361083984, "global_step": 163412, "epoch": 1350} {"train_loss": -40.237457275390625, "global_step": 163413, "epoch": 1350} {"train_loss": -40.48650360107422, "global_step": 163414, "epoch": 1350} {"train_loss": -41.36050033569336, "global_step": 163415, "epoch": 1350} {"train_loss": -40.89360427856445, "global_step": 163416, "epoch": 1350} {"train_loss": -40.662940979003906, "global_step": 163417, "epoch": 1350} {"train_loss": -39.16323471069336, "global_step": 163418, "epoch": 1350} {"train_loss": -38.89625930786133, "global_step": 163419, "epoch": 1350} {"train_loss": -39.278724670410156, "global_step": 163420, "epoch": 1350} {"train_loss": -41.72987365722656, "global_step": 163421, "epoch": 1350} {"train_loss": -39.90517807006836, "global_step": 163422, "epoch": 1350} {"train_loss": -39.8022346496582, "global_step": 163423, "epoch": 1350} {"train_loss": -41.34498596191406, "global_step": 163424, "epoch": 1350} {"train_loss": -41.4779167175293, "global_step": 163425, "epoch": 1350} {"train_loss": -40.561012268066406, "global_step": 163426, "epoch": 1350} {"train_loss": -41.24399948120117, "global_step": 163427, "epoch": 1350} {"train_loss": -41.99017333984375, "global_step": 163428, "epoch": 1350} {"train_loss": -41.24496078491211, "global_step": 163429, "epoch": 1350} {"train_loss": -41.61152267456055, "global_step": 163430, "epoch": 1350} {"train_loss": -41.760189056396484, "global_step": 163431, "epoch": 1350} {"train_loss": -41.07905960083008, "global_step": 163432, "epoch": 1350} {"train_loss": -40.395118713378906, "global_step": 163433, "epoch": 1350} {"train_loss": -42.071205139160156, "global_step": 163434, "epoch": 1350} {"train_loss": -41.403106689453125, "global_step": 163435, "epoch": 1350} {"train_loss": -40.7188835144043, "global_step": 163436, "epoch": 1350} {"train_loss": -41.104061126708984, "global_step": 163437, "epoch": 1350} {"train_loss": -41.90218734741211, "global_step": 163438, "epoch": 1350} {"train_loss": -41.09403610229492, "global_step": 163439, "epoch": 1350} {"train_loss": -41.310394287109375, "global_step": 163440, "epoch": 1350} {"train_loss": -41.171939849853516, "global_step": 163441, "epoch": 1350} {"train_loss": -41.750038146972656, "global_step": 163442, "epoch": 1350} {"train_loss": -40.68598937988281, "global_step": 163443, "epoch": 1350} {"train_loss": -41.02101516723633, "global_step": 163444, "epoch": 1350} {"train_loss": -41.65965270996094, "global_step": 163445, "epoch": 1350} {"train_loss": -41.36725997924805, "global_step": 163446, "epoch": 1350} {"train_loss": -40.60823059082031, "global_step": 163447, "epoch": 1350} {"train_loss": -41.757835388183594, "global_step": 163448, "epoch": 1350} {"train_loss": -41.57687759399414, "global_step": 163449, "epoch": 1350} {"train_loss": -41.5436897277832, "global_step": 163450, "epoch": 1350} {"train_loss": -41.95745849609375, "global_step": 163451, "epoch": 1350} {"train_loss": -41.83720016479492, "global_step": 163452, "epoch": 1350} {"train_loss": -39.844573974609375, "global_step": 163453, "epoch": 1350} {"train_loss": -39.10956573486328, "global_step": 163454, "epoch": 1350} {"train_loss": -39.63994598388672, "global_step": 163455, "epoch": 1350} {"train_loss": -40.41415023803711, "global_step": 163456, "epoch": 1350} {"train_loss": -40.56679153442383, "global_step": 163457, "epoch": 1350} {"train_loss": -40.70969772338867, "global_step": 163458, "epoch": 1350} {"train_loss": -41.16195297241211, "global_step": 163459, "epoch": 1350} {"train_loss": -40.29890060424805, "global_step": 163460, "epoch": 1350} {"train_loss": -40.19575500488281, "global_step": 163461, "epoch": 1350} {"train_loss": -40.96375274658203, "global_step": 163462, "epoch": 1350} {"train_loss": -40.31326675415039, "global_step": 163463, "epoch": 1350} {"train_loss": -40.99981689453125, "global_step": 163464, "epoch": 1350} {"train_loss": -40.6827392578125, "global_step": 163465, "epoch": 1350} {"train_loss": -40.41782760620117, "global_step": 163466, "epoch": 1350} {"train_loss": -38.37258529663086, "global_step": 163467, "epoch": 1350} {"train_loss": -37.59558868408203, "global_step": 163468, "epoch": 1350} {"train_loss": -40.843711853027344, "global_step": 163469, "epoch": 1350} {"train_loss": -40.82326857511662, "global_step": 163470, "epoch": 1350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2532076.25} {"train_loss": -38.861175537109375, "global_step": 163471, "epoch": 1351} {"train_loss": -40.2237434387207, "global_step": 163472, "epoch": 1351} {"train_loss": -40.37577438354492, "global_step": 163473, "epoch": 1351} {"train_loss": -36.672977447509766, "global_step": 163474, "epoch": 1351} {"train_loss": -39.67774963378906, "global_step": 163475, "epoch": 1351} {"train_loss": -39.508235931396484, "global_step": 163476, "epoch": 1351} {"train_loss": -37.94036102294922, "global_step": 163477, "epoch": 1351} {"train_loss": -37.921871185302734, "global_step": 163478, "epoch": 1351} {"train_loss": -39.35911178588867, "global_step": 163479, "epoch": 1351} {"train_loss": -40.38556671142578, "global_step": 163480, "epoch": 1351} {"train_loss": -36.98102951049805, "global_step": 163481, "epoch": 1351} {"train_loss": -38.50651168823242, "global_step": 163482, "epoch": 1351} {"train_loss": -40.1204948425293, "global_step": 163483, "epoch": 1351} {"train_loss": -36.023372650146484, "global_step": 163484, "epoch": 1351} {"train_loss": -37.7320556640625, "global_step": 163485, "epoch": 1351} {"train_loss": -39.55209732055664, "global_step": 163486, "epoch": 1351} {"train_loss": -35.58332443237305, "global_step": 163487, "epoch": 1351} {"train_loss": -39.638916015625, "global_step": 163488, "epoch": 1351} {"train_loss": -37.2572021484375, "global_step": 163489, "epoch": 1351} {"train_loss": -38.532955169677734, "global_step": 163490, "epoch": 1351} {"train_loss": -38.05024337768555, "global_step": 163491, "epoch": 1351} {"train_loss": -39.44870376586914, "global_step": 163492, "epoch": 1351} {"train_loss": -39.27524948120117, "global_step": 163493, "epoch": 1351} {"train_loss": -39.35585403442383, "global_step": 163494, "epoch": 1351} {"train_loss": -39.92794418334961, "global_step": 163495, "epoch": 1351} {"train_loss": -40.540252685546875, "global_step": 163496, "epoch": 1351} {"train_loss": -40.3931884765625, "global_step": 163497, "epoch": 1351} {"train_loss": -39.2618522644043, "global_step": 163498, "epoch": 1351} {"train_loss": -41.29409408569336, "global_step": 163499, "epoch": 1351} {"train_loss": -40.055274963378906, "global_step": 163500, "epoch": 1351} {"train_loss": -40.54507064819336, "global_step": 163501, "epoch": 1351} {"train_loss": -40.808773040771484, "global_step": 163502, "epoch": 1351} {"train_loss": -40.158782958984375, "global_step": 163503, "epoch": 1351} {"train_loss": -40.68626403808594, "global_step": 163504, "epoch": 1351} {"train_loss": -40.536033630371094, "global_step": 163505, "epoch": 1351} {"train_loss": -40.594058990478516, "global_step": 163506, "epoch": 1351} {"train_loss": -40.847145080566406, "global_step": 163507, "epoch": 1351} {"train_loss": -40.155067443847656, "global_step": 163508, "epoch": 1351} {"train_loss": -40.36336135864258, "global_step": 163509, "epoch": 1351} {"train_loss": -39.89301681518555, "global_step": 163510, "epoch": 1351} {"train_loss": -40.399715423583984, "global_step": 163511, "epoch": 1351} {"train_loss": -39.84503936767578, "global_step": 163512, "epoch": 1351} {"train_loss": -39.714298248291016, "global_step": 163513, "epoch": 1351} {"train_loss": -40.609188079833984, "global_step": 163514, "epoch": 1351} {"train_loss": -39.808876037597656, "global_step": 163515, "epoch": 1351} {"train_loss": -40.91604995727539, "global_step": 163516, "epoch": 1351} {"train_loss": -38.79671096801758, "global_step": 163517, "epoch": 1351} {"train_loss": -40.35175323486328, "global_step": 163518, "epoch": 1351} {"train_loss": -39.96905517578125, "global_step": 163519, "epoch": 1351} {"train_loss": -40.98834991455078, "global_step": 163520, "epoch": 1351} {"train_loss": -38.03060531616211, "global_step": 163521, "epoch": 1351} {"train_loss": -39.76509094238281, "global_step": 163522, "epoch": 1351} {"train_loss": -41.22452926635742, "global_step": 163523, "epoch": 1351} {"train_loss": -40.76824188232422, "global_step": 163524, "epoch": 1351} {"train_loss": -40.66057205200195, "global_step": 163525, "epoch": 1351} {"train_loss": -40.853267669677734, "global_step": 163526, "epoch": 1351} {"train_loss": -40.590511322021484, "global_step": 163527, "epoch": 1351} {"train_loss": -41.13247299194336, "global_step": 163528, "epoch": 1351} {"train_loss": -40.82284164428711, "global_step": 163529, "epoch": 1351} {"train_loss": -42.00065231323242, "global_step": 163530, "epoch": 1351} {"train_loss": -40.68769073486328, "global_step": 163531, "epoch": 1351} {"train_loss": -41.08565902709961, "global_step": 163532, "epoch": 1351} {"train_loss": -41.48154830932617, "global_step": 163533, "epoch": 1351} {"train_loss": -40.347599029541016, "global_step": 163534, "epoch": 1351} {"train_loss": -41.877132415771484, "global_step": 163535, "epoch": 1351} {"train_loss": -41.328880310058594, "global_step": 163536, "epoch": 1351} {"train_loss": -41.03065490722656, "global_step": 163537, "epoch": 1351} {"train_loss": -41.53288650512695, "global_step": 163538, "epoch": 1351} {"train_loss": -41.91865158081055, "global_step": 163539, "epoch": 1351} {"train_loss": -41.5550537109375, "global_step": 163540, "epoch": 1351} {"train_loss": -41.465538024902344, "global_step": 163541, "epoch": 1351} {"train_loss": -41.471405029296875, "global_step": 163542, "epoch": 1351} {"train_loss": -41.54959487915039, "global_step": 163543, "epoch": 1351} {"train_loss": -41.791175842285156, "global_step": 163544, "epoch": 1351} {"train_loss": -41.30808639526367, "global_step": 163545, "epoch": 1351} {"train_loss": -42.35328674316406, "global_step": 163546, "epoch": 1351} {"train_loss": -41.65793991088867, "global_step": 163547, "epoch": 1351} {"train_loss": -41.59968185424805, "global_step": 163548, "epoch": 1351} {"train_loss": -42.178890228271484, "global_step": 163549, "epoch": 1351} {"train_loss": -41.99893569946289, "global_step": 163550, "epoch": 1351} {"train_loss": -41.58045196533203, "global_step": 163551, "epoch": 1351} {"train_loss": -41.61615753173828, "global_step": 163552, "epoch": 1351} {"train_loss": -41.85823440551758, "global_step": 163553, "epoch": 1351} {"train_loss": -41.98250198364258, "global_step": 163554, "epoch": 1351} {"train_loss": -41.09568786621094, "global_step": 163555, "epoch": 1351} {"train_loss": -41.4390983581543, "global_step": 163556, "epoch": 1351} {"train_loss": -40.87846755981445, "global_step": 163557, "epoch": 1351} {"train_loss": -39.46235275268555, "global_step": 163558, "epoch": 1351} {"train_loss": -38.097103118896484, "global_step": 163559, "epoch": 1351} {"train_loss": -38.196624755859375, "global_step": 163560, "epoch": 1351} {"train_loss": -39.56216049194336, "global_step": 163561, "epoch": 1351} {"train_loss": -40.95223617553711, "global_step": 163562, "epoch": 1351} {"train_loss": -42.301082611083984, "global_step": 163563, "epoch": 1351} {"train_loss": -41.0391731262207, "global_step": 163564, "epoch": 1351} {"train_loss": -39.43519973754883, "global_step": 163565, "epoch": 1351} {"train_loss": -41.510765075683594, "global_step": 163566, "epoch": 1351} {"train_loss": -40.50091552734375, "global_step": 163567, "epoch": 1351} {"train_loss": -38.149147033691406, "global_step": 163568, "epoch": 1351} {"train_loss": -38.532508850097656, "global_step": 163569, "epoch": 1351} {"train_loss": -40.783416748046875, "global_step": 163570, "epoch": 1351} {"train_loss": -41.1334114074707, "global_step": 163571, "epoch": 1351} {"train_loss": -40.68319320678711, "global_step": 163572, "epoch": 1351} {"train_loss": -41.00221633911133, "global_step": 163573, "epoch": 1351} {"train_loss": -41.15557861328125, "global_step": 163574, "epoch": 1351} {"train_loss": -40.97030258178711, "global_step": 163575, "epoch": 1351} {"train_loss": -40.5013542175293, "global_step": 163576, "epoch": 1351} {"train_loss": -41.352420806884766, "global_step": 163577, "epoch": 1351} {"train_loss": -40.90658950805664, "global_step": 163578, "epoch": 1351} {"train_loss": -40.13033676147461, "global_step": 163579, "epoch": 1351} {"train_loss": -40.19226837158203, "global_step": 163580, "epoch": 1351} {"train_loss": -41.54924011230469, "global_step": 163581, "epoch": 1351} {"train_loss": -41.21903991699219, "global_step": 163582, "epoch": 1351} {"train_loss": -41.313507080078125, "global_step": 163583, "epoch": 1351} {"train_loss": -41.40288162231445, "global_step": 163584, "epoch": 1351} {"train_loss": -41.527584075927734, "global_step": 163585, "epoch": 1351} {"train_loss": -41.92164611816406, "global_step": 163586, "epoch": 1351} {"train_loss": -41.011146545410156, "global_step": 163587, "epoch": 1351} {"train_loss": -41.364501953125, "global_step": 163588, "epoch": 1351} {"train_loss": -41.790496826171875, "global_step": 163589, "epoch": 1351} {"train_loss": -41.748226165771484, "global_step": 163590, "epoch": 1351} {"train_loss": -40.36412451878067, "global_step": 163591, "epoch": 1351, "val_loss": 2556241.5} {"train_loss": -41.25654602050781, "global_step": 163592, "epoch": 1352} {"train_loss": -41.35808181762695, "global_step": 163593, "epoch": 1352} {"train_loss": -40.468807220458984, "global_step": 163594, "epoch": 1352} {"train_loss": -41.160640716552734, "global_step": 163595, "epoch": 1352} {"train_loss": -36.99855422973633, "global_step": 163596, "epoch": 1352} {"train_loss": -38.688968658447266, "global_step": 163597, "epoch": 1352} {"train_loss": -39.00259017944336, "global_step": 163598, "epoch": 1352} {"train_loss": -40.644325256347656, "global_step": 163599, "epoch": 1352} {"train_loss": -41.9383659362793, "global_step": 163600, "epoch": 1352} {"train_loss": -40.04212188720703, "global_step": 163601, "epoch": 1352} {"train_loss": -38.99581527709961, "global_step": 163602, "epoch": 1352} {"train_loss": -39.81382369995117, "global_step": 163603, "epoch": 1352} {"train_loss": -39.54587936401367, "global_step": 163604, "epoch": 1352} {"train_loss": -36.72349166870117, "global_step": 163605, "epoch": 1352} {"train_loss": -41.7132682800293, "global_step": 163606, "epoch": 1352} {"train_loss": -40.88380813598633, "global_step": 163607, "epoch": 1352} {"train_loss": -41.48236846923828, "global_step": 163608, "epoch": 1352} {"train_loss": -41.60698699951172, "global_step": 163609, "epoch": 1352} {"train_loss": -41.63129425048828, "global_step": 163610, "epoch": 1352} {"train_loss": -41.66999053955078, "global_step": 163611, "epoch": 1352} {"train_loss": -41.610538482666016, "global_step": 163612, "epoch": 1352} {"train_loss": -41.80147171020508, "global_step": 163613, "epoch": 1352} {"train_loss": -40.81573486328125, "global_step": 163614, "epoch": 1352} {"train_loss": -40.69026565551758, "global_step": 163615, "epoch": 1352} {"train_loss": -41.823699951171875, "global_step": 163616, "epoch": 1352} {"train_loss": -41.2364616394043, "global_step": 163617, "epoch": 1352} {"train_loss": -41.4141845703125, "global_step": 163618, "epoch": 1352} {"train_loss": -41.31990432739258, "global_step": 163619, "epoch": 1352} {"train_loss": -41.36433792114258, "global_step": 163620, "epoch": 1352} {"train_loss": -41.52946472167969, "global_step": 163621, "epoch": 1352} {"train_loss": -41.695865631103516, "global_step": 163622, "epoch": 1352} {"train_loss": -40.99253463745117, "global_step": 163623, "epoch": 1352} {"train_loss": -42.0431022644043, "global_step": 163624, "epoch": 1352} {"train_loss": -41.40774154663086, "global_step": 163625, "epoch": 1352} {"train_loss": -41.381587982177734, "global_step": 163626, "epoch": 1352} {"train_loss": -41.246517181396484, "global_step": 163627, "epoch": 1352} {"train_loss": -40.5468864440918, "global_step": 163628, "epoch": 1352} {"train_loss": -41.730506896972656, "global_step": 163629, "epoch": 1352} {"train_loss": -41.351192474365234, "global_step": 163630, "epoch": 1352} {"train_loss": -40.59782791137695, "global_step": 163631, "epoch": 1352} {"train_loss": -41.35367965698242, "global_step": 163632, "epoch": 1352} {"train_loss": -40.7410774230957, "global_step": 163633, "epoch": 1352} {"train_loss": -41.6140022277832, "global_step": 163634, "epoch": 1352} {"train_loss": -41.508480072021484, "global_step": 163635, "epoch": 1352} {"train_loss": -41.50973892211914, "global_step": 163636, "epoch": 1352} {"train_loss": -41.7451286315918, "global_step": 163637, "epoch": 1352} {"train_loss": -41.08606719970703, "global_step": 163638, "epoch": 1352} {"train_loss": -40.73177719116211, "global_step": 163639, "epoch": 1352} {"train_loss": -41.48188400268555, "global_step": 163640, "epoch": 1352} {"train_loss": -41.47097396850586, "global_step": 163641, "epoch": 1352} {"train_loss": -40.96621322631836, "global_step": 163642, "epoch": 1352} {"train_loss": -40.9638786315918, "global_step": 163643, "epoch": 1352} {"train_loss": -41.211673736572266, "global_step": 163644, "epoch": 1352} {"train_loss": -41.61214065551758, "global_step": 163645, "epoch": 1352} {"train_loss": -40.14165496826172, "global_step": 163646, "epoch": 1352} {"train_loss": -41.40475082397461, "global_step": 163647, "epoch": 1352} {"train_loss": -41.40678787231445, "global_step": 163648, "epoch": 1352} {"train_loss": -39.744789123535156, "global_step": 163649, "epoch": 1352} {"train_loss": -40.833213806152344, "global_step": 163650, "epoch": 1352} {"train_loss": -41.30465316772461, "global_step": 163651, "epoch": 1352} {"train_loss": -39.89316940307617, "global_step": 163652, "epoch": 1352} {"train_loss": -39.49703598022461, "global_step": 163653, "epoch": 1352} {"train_loss": -40.890071868896484, "global_step": 163654, "epoch": 1352} {"train_loss": -41.43858337402344, "global_step": 163655, "epoch": 1352} {"train_loss": -41.24079513549805, "global_step": 163656, "epoch": 1352} {"train_loss": -41.70786666870117, "global_step": 163657, "epoch": 1352} {"train_loss": -41.31708526611328, "global_step": 163658, "epoch": 1352} {"train_loss": -40.12458038330078, "global_step": 163659, "epoch": 1352} {"train_loss": -41.87384796142578, "global_step": 163660, "epoch": 1352} {"train_loss": -41.021484375, "global_step": 163661, "epoch": 1352} {"train_loss": -40.57560348510742, "global_step": 163662, "epoch": 1352} {"train_loss": -41.004512786865234, "global_step": 163663, "epoch": 1352} {"train_loss": -40.72064971923828, "global_step": 163664, "epoch": 1352} {"train_loss": -40.27124786376953, "global_step": 163665, "epoch": 1352} {"train_loss": -39.6727409362793, "global_step": 163666, "epoch": 1352} {"train_loss": -37.98386764526367, "global_step": 163667, "epoch": 1352} {"train_loss": -38.30326461791992, "global_step": 163668, "epoch": 1352} {"train_loss": -39.49599075317383, "global_step": 163669, "epoch": 1352} {"train_loss": -41.03608322143555, "global_step": 163670, "epoch": 1352} {"train_loss": -39.54600143432617, "global_step": 163671, "epoch": 1352} {"train_loss": -39.37929916381836, "global_step": 163672, "epoch": 1352} {"train_loss": -41.49284744262695, "global_step": 163673, "epoch": 1352} {"train_loss": -40.94263458251953, "global_step": 163674, "epoch": 1352} {"train_loss": -40.46686553955078, "global_step": 163675, "epoch": 1352} {"train_loss": -40.89504623413086, "global_step": 163676, "epoch": 1352} {"train_loss": -40.2186279296875, "global_step": 163677, "epoch": 1352} {"train_loss": -40.1552848815918, "global_step": 163678, "epoch": 1352} {"train_loss": -40.735198974609375, "global_step": 163679, "epoch": 1352} {"train_loss": -41.031982421875, "global_step": 163680, "epoch": 1352} {"train_loss": -41.4305305480957, "global_step": 163681, "epoch": 1352} {"train_loss": -41.48849868774414, "global_step": 163682, "epoch": 1352} {"train_loss": -42.33528518676758, "global_step": 163683, "epoch": 1352} {"train_loss": -40.727699279785156, "global_step": 163684, "epoch": 1352} {"train_loss": -39.57255172729492, "global_step": 163685, "epoch": 1352} {"train_loss": -41.20476150512695, "global_step": 163686, "epoch": 1352} {"train_loss": -41.537357330322266, "global_step": 163687, "epoch": 1352} {"train_loss": -38.611446380615234, "global_step": 163688, "epoch": 1352} {"train_loss": -41.70792770385742, "global_step": 163689, "epoch": 1352} {"train_loss": -40.058868408203125, "global_step": 163690, "epoch": 1352} {"train_loss": -40.32776641845703, "global_step": 163691, "epoch": 1352} {"train_loss": -41.156166076660156, "global_step": 163692, "epoch": 1352} {"train_loss": -40.77513122558594, "global_step": 163693, "epoch": 1352} {"train_loss": -40.91884994506836, "global_step": 163694, "epoch": 1352} {"train_loss": -40.7564697265625, "global_step": 163695, "epoch": 1352} {"train_loss": -41.54458236694336, "global_step": 163696, "epoch": 1352} {"train_loss": -40.81797409057617, "global_step": 163697, "epoch": 1352} {"train_loss": -40.96733856201172, "global_step": 163698, "epoch": 1352} {"train_loss": -41.74546432495117, "global_step": 163699, "epoch": 1352} {"train_loss": -41.60833740234375, "global_step": 163700, "epoch": 1352} {"train_loss": -40.92471694946289, "global_step": 163701, "epoch": 1352} {"train_loss": -41.76898956298828, "global_step": 163702, "epoch": 1352} {"train_loss": -41.70588684082031, "global_step": 163703, "epoch": 1352} {"train_loss": -40.69480514526367, "global_step": 163704, "epoch": 1352} {"train_loss": -40.509700775146484, "global_step": 163705, "epoch": 1352} {"train_loss": -41.10764694213867, "global_step": 163706, "epoch": 1352} {"train_loss": -41.45299530029297, "global_step": 163707, "epoch": 1352} {"train_loss": -41.6357307434082, "global_step": 163708, "epoch": 1352} {"train_loss": -41.491912841796875, "global_step": 163709, "epoch": 1352} {"train_loss": -41.8464241027832, "global_step": 163710, "epoch": 1352} {"train_loss": -41.56478500366211, "global_step": 163711, "epoch": 1352} {"train_loss": -40.855180913751774, "global_step": 163712, "epoch": 1352, "val_loss": 2636650.75} {"train_loss": -42.40349578857422, "global_step": 163713, "epoch": 1353} {"train_loss": -42.28205490112305, "global_step": 163714, "epoch": 1353} {"train_loss": -41.98908233642578, "global_step": 163715, "epoch": 1353} {"train_loss": -41.56917953491211, "global_step": 163716, "epoch": 1353} {"train_loss": -41.74553298950195, "global_step": 163717, "epoch": 1353} {"train_loss": -41.55632400512695, "global_step": 163718, "epoch": 1353} {"train_loss": -42.33022689819336, "global_step": 163719, "epoch": 1353} {"train_loss": -42.15135192871094, "global_step": 163720, "epoch": 1353} {"train_loss": -42.267940521240234, "global_step": 163721, "epoch": 1353} {"train_loss": -41.788753509521484, "global_step": 163722, "epoch": 1353} {"train_loss": -42.15496063232422, "global_step": 163723, "epoch": 1353} {"train_loss": -41.41675567626953, "global_step": 163724, "epoch": 1353} {"train_loss": -41.46810531616211, "global_step": 163725, "epoch": 1353} {"train_loss": -41.75130844116211, "global_step": 163726, "epoch": 1353} {"train_loss": -40.843013763427734, "global_step": 163727, "epoch": 1353} {"train_loss": -41.99544906616211, "global_step": 163728, "epoch": 1353} {"train_loss": -41.791500091552734, "global_step": 163729, "epoch": 1353} {"train_loss": -38.84987258911133, "global_step": 163730, "epoch": 1353} {"train_loss": -41.22212600708008, "global_step": 163731, "epoch": 1353} {"train_loss": -41.69662094116211, "global_step": 163732, "epoch": 1353} {"train_loss": -40.934539794921875, "global_step": 163733, "epoch": 1353} {"train_loss": -41.60789108276367, "global_step": 163734, "epoch": 1353} {"train_loss": -41.86418151855469, "global_step": 163735, "epoch": 1353} {"train_loss": -41.19144821166992, "global_step": 163736, "epoch": 1353} {"train_loss": -42.19895553588867, "global_step": 163737, "epoch": 1353} {"train_loss": -41.564613342285156, "global_step": 163738, "epoch": 1353} {"train_loss": -41.083980560302734, "global_step": 163739, "epoch": 1353} {"train_loss": -41.24746322631836, "global_step": 163740, "epoch": 1353} {"train_loss": -42.23434066772461, "global_step": 163741, "epoch": 1353} {"train_loss": -37.199031829833984, "global_step": 163742, "epoch": 1353} {"train_loss": -41.483795166015625, "global_step": 163743, "epoch": 1353} {"train_loss": -41.80013656616211, "global_step": 163744, "epoch": 1353} {"train_loss": -41.653263092041016, "global_step": 163745, "epoch": 1353} {"train_loss": -40.97913360595703, "global_step": 163746, "epoch": 1353} {"train_loss": -38.45802688598633, "global_step": 163747, "epoch": 1353} {"train_loss": -41.73991012573242, "global_step": 163748, "epoch": 1353} {"train_loss": -41.761837005615234, "global_step": 163749, "epoch": 1353} {"train_loss": -41.2500114440918, "global_step": 163750, "epoch": 1353} {"train_loss": -41.25038528442383, "global_step": 163751, "epoch": 1353} {"train_loss": -40.50999450683594, "global_step": 163752, "epoch": 1353} {"train_loss": -41.50238037109375, "global_step": 163753, "epoch": 1353} {"train_loss": -39.55301284790039, "global_step": 163754, "epoch": 1353} {"train_loss": -41.09112548828125, "global_step": 163755, "epoch": 1353} {"train_loss": -41.331520080566406, "global_step": 163756, "epoch": 1353} {"train_loss": -41.55485153198242, "global_step": 163757, "epoch": 1353} {"train_loss": -40.5620231628418, "global_step": 163758, "epoch": 1353} {"train_loss": -39.99518966674805, "global_step": 163759, "epoch": 1353} {"train_loss": -40.844512939453125, "global_step": 163760, "epoch": 1353} {"train_loss": -40.33197784423828, "global_step": 163761, "epoch": 1353} {"train_loss": -36.778480529785156, "global_step": 163762, "epoch": 1353} {"train_loss": -39.144432067871094, "global_step": 163763, "epoch": 1353} {"train_loss": -37.58176803588867, "global_step": 163764, "epoch": 1353} {"train_loss": -34.8357048034668, "global_step": 163765, "epoch": 1353} {"train_loss": -35.87312316894531, "global_step": 163766, "epoch": 1353} {"train_loss": -35.74416732788086, "global_step": 163767, "epoch": 1353} {"train_loss": -36.058509826660156, "global_step": 163768, "epoch": 1353} {"train_loss": -38.536128997802734, "global_step": 163769, "epoch": 1353} {"train_loss": -40.59392166137695, "global_step": 163770, "epoch": 1353} {"train_loss": -38.406829833984375, "global_step": 163771, "epoch": 1353} {"train_loss": -38.523597717285156, "global_step": 163772, "epoch": 1353} {"train_loss": -40.401519775390625, "global_step": 163773, "epoch": 1353} {"train_loss": -39.938419342041016, "global_step": 163774, "epoch": 1353} {"train_loss": -38.52257537841797, "global_step": 163775, "epoch": 1353} {"train_loss": -38.5304069519043, "global_step": 163776, "epoch": 1353} {"train_loss": -40.9514274597168, "global_step": 163777, "epoch": 1353} {"train_loss": -39.13275909423828, "global_step": 163778, "epoch": 1353} {"train_loss": -40.648311614990234, "global_step": 163779, "epoch": 1353} {"train_loss": -39.3068733215332, "global_step": 163780, "epoch": 1353} {"train_loss": -39.70386505126953, "global_step": 163781, "epoch": 1353} {"train_loss": -40.92249298095703, "global_step": 163782, "epoch": 1353} {"train_loss": -39.86420440673828, "global_step": 163783, "epoch": 1353} {"train_loss": -40.496437072753906, "global_step": 163784, "epoch": 1353} {"train_loss": -40.372596740722656, "global_step": 163785, "epoch": 1353} {"train_loss": -41.19927215576172, "global_step": 163786, "epoch": 1353} {"train_loss": -41.468990325927734, "global_step": 163787, "epoch": 1353} {"train_loss": -40.40983581542969, "global_step": 163788, "epoch": 1353} {"train_loss": -41.56148147583008, "global_step": 163789, "epoch": 1353} {"train_loss": -40.96529769897461, "global_step": 163790, "epoch": 1353} {"train_loss": -41.60464096069336, "global_step": 163791, "epoch": 1353} {"train_loss": -41.1629638671875, "global_step": 163792, "epoch": 1353} {"train_loss": -42.084712982177734, "global_step": 163793, "epoch": 1353} {"train_loss": -40.5161018371582, "global_step": 163794, "epoch": 1353} {"train_loss": -41.41633987426758, "global_step": 163795, "epoch": 1353} {"train_loss": -41.2125358581543, "global_step": 163796, "epoch": 1353} {"train_loss": -41.88178634643555, "global_step": 163797, "epoch": 1353} {"train_loss": -41.62923812866211, "global_step": 163798, "epoch": 1353} {"train_loss": -40.89063262939453, "global_step": 163799, "epoch": 1353} {"train_loss": -40.5300407409668, "global_step": 163800, "epoch": 1353} {"train_loss": -41.392086029052734, "global_step": 163801, "epoch": 1353} {"train_loss": -41.88199996948242, "global_step": 163802, "epoch": 1353} {"train_loss": -40.52117156982422, "global_step": 163803, "epoch": 1353} {"train_loss": -40.251075744628906, "global_step": 163804, "epoch": 1353} {"train_loss": -41.30607223510742, "global_step": 163805, "epoch": 1353} {"train_loss": -40.73637008666992, "global_step": 163806, "epoch": 1353} {"train_loss": -41.552398681640625, "global_step": 163807, "epoch": 1353} {"train_loss": -40.865379333496094, "global_step": 163808, "epoch": 1353} {"train_loss": -41.00283432006836, "global_step": 163809, "epoch": 1353} {"train_loss": -41.09043502807617, "global_step": 163810, "epoch": 1353} {"train_loss": -38.88471603393555, "global_step": 163811, "epoch": 1353} {"train_loss": -40.79458236694336, "global_step": 163812, "epoch": 1353} {"train_loss": -38.8382682800293, "global_step": 163813, "epoch": 1353} {"train_loss": -40.7119026184082, "global_step": 163814, "epoch": 1353} {"train_loss": -41.48167037963867, "global_step": 163815, "epoch": 1353} {"train_loss": -40.40286636352539, "global_step": 163816, "epoch": 1353} {"train_loss": -40.17517852783203, "global_step": 163817, "epoch": 1353} {"train_loss": -38.967262268066406, "global_step": 163818, "epoch": 1353} {"train_loss": -39.65336227416992, "global_step": 163819, "epoch": 1353} {"train_loss": -38.81459426879883, "global_step": 163820, "epoch": 1353} {"train_loss": -40.869667053222656, "global_step": 163821, "epoch": 1353} {"train_loss": -40.51987838745117, "global_step": 163822, "epoch": 1353} {"train_loss": -37.39841079711914, "global_step": 163823, "epoch": 1353} {"train_loss": -38.704193115234375, "global_step": 163824, "epoch": 1353} {"train_loss": -40.67618942260742, "global_step": 163825, "epoch": 1353} {"train_loss": -38.01288986206055, "global_step": 163826, "epoch": 1353} {"train_loss": -38.086814880371094, "global_step": 163827, "epoch": 1353} {"train_loss": -38.846527099609375, "global_step": 163828, "epoch": 1353} {"train_loss": -40.78257369995117, "global_step": 163829, "epoch": 1353} {"train_loss": -40.001190185546875, "global_step": 163830, "epoch": 1353} {"train_loss": -39.95317840576172, "global_step": 163831, "epoch": 1353} {"train_loss": -40.87929916381836, "global_step": 163832, "epoch": 1353} {"train_loss": -40.46790089883095, "global_step": 163833, "epoch": 1353, "val_loss": 2614092.25} {"train_loss": -41.087318420410156, "global_step": 163834, "epoch": 1354} {"train_loss": -41.16716003417969, "global_step": 163835, "epoch": 1354} {"train_loss": -39.61977767944336, "global_step": 163836, "epoch": 1354} {"train_loss": -38.497528076171875, "global_step": 163837, "epoch": 1354} {"train_loss": -41.102210998535156, "global_step": 163838, "epoch": 1354} {"train_loss": -36.59652328491211, "global_step": 163839, "epoch": 1354} {"train_loss": -40.95115280151367, "global_step": 163840, "epoch": 1354} {"train_loss": -38.42314529418945, "global_step": 163841, "epoch": 1354} {"train_loss": -39.71928787231445, "global_step": 163842, "epoch": 1354} {"train_loss": -40.021820068359375, "global_step": 163843, "epoch": 1354} {"train_loss": -39.08845138549805, "global_step": 163844, "epoch": 1354} {"train_loss": -38.63240432739258, "global_step": 163845, "epoch": 1354} {"train_loss": -40.6256103515625, "global_step": 163846, "epoch": 1354} {"train_loss": -39.463226318359375, "global_step": 163847, "epoch": 1354} {"train_loss": -39.69829177856445, "global_step": 163848, "epoch": 1354} {"train_loss": -40.306068420410156, "global_step": 163849, "epoch": 1354} {"train_loss": -38.7230224609375, "global_step": 163850, "epoch": 1354} {"train_loss": -39.71229934692383, "global_step": 163851, "epoch": 1354} {"train_loss": -39.61412048339844, "global_step": 163852, "epoch": 1354} {"train_loss": -40.331947326660156, "global_step": 163853, "epoch": 1354} {"train_loss": -40.02389144897461, "global_step": 163854, "epoch": 1354} {"train_loss": -39.809017181396484, "global_step": 163855, "epoch": 1354} {"train_loss": -40.2150993347168, "global_step": 163856, "epoch": 1354} {"train_loss": -39.966548919677734, "global_step": 163857, "epoch": 1354} {"train_loss": -40.01337814331055, "global_step": 163858, "epoch": 1354} {"train_loss": -41.17855453491211, "global_step": 163859, "epoch": 1354} {"train_loss": -41.006649017333984, "global_step": 163860, "epoch": 1354} {"train_loss": -41.243709564208984, "global_step": 163861, "epoch": 1354} {"train_loss": -40.55836486816406, "global_step": 163862, "epoch": 1354} {"train_loss": -41.50837707519531, "global_step": 163863, "epoch": 1354} {"train_loss": -41.07578659057617, "global_step": 163864, "epoch": 1354} {"train_loss": -41.541568756103516, "global_step": 163865, "epoch": 1354} {"train_loss": -41.426475524902344, "global_step": 163866, "epoch": 1354} {"train_loss": -41.28486633300781, "global_step": 163867, "epoch": 1354} {"train_loss": -40.977779388427734, "global_step": 163868, "epoch": 1354} {"train_loss": -40.776145935058594, "global_step": 163869, "epoch": 1354} {"train_loss": -41.54718780517578, "global_step": 163870, "epoch": 1354} {"train_loss": -41.26033401489258, "global_step": 163871, "epoch": 1354} {"train_loss": -41.4129524230957, "global_step": 163872, "epoch": 1354} {"train_loss": -41.760467529296875, "global_step": 163873, "epoch": 1354} {"train_loss": -41.44077682495117, "global_step": 163874, "epoch": 1354} {"train_loss": -41.86368942260742, "global_step": 163875, "epoch": 1354} {"train_loss": -41.686553955078125, "global_step": 163876, "epoch": 1354} {"train_loss": -42.0252685546875, "global_step": 163877, "epoch": 1354} {"train_loss": -41.77692413330078, "global_step": 163878, "epoch": 1354} {"train_loss": -41.07034683227539, "global_step": 163879, "epoch": 1354} {"train_loss": -41.89394760131836, "global_step": 163880, "epoch": 1354} {"train_loss": -41.87184143066406, "global_step": 163881, "epoch": 1354} {"train_loss": -41.71709060668945, "global_step": 163882, "epoch": 1354} {"train_loss": -41.900054931640625, "global_step": 163883, "epoch": 1354} {"train_loss": -41.93764114379883, "global_step": 163884, "epoch": 1354} {"train_loss": -42.26438522338867, "global_step": 163885, "epoch": 1354} {"train_loss": -41.589393615722656, "global_step": 163886, "epoch": 1354} {"train_loss": -41.843868255615234, "global_step": 163887, "epoch": 1354} {"train_loss": -42.121700286865234, "global_step": 163888, "epoch": 1354} {"train_loss": -42.02777862548828, "global_step": 163889, "epoch": 1354} {"train_loss": -41.815650939941406, "global_step": 163890, "epoch": 1354} {"train_loss": -41.85345458984375, "global_step": 163891, "epoch": 1354} {"train_loss": -41.91172409057617, "global_step": 163892, "epoch": 1354} {"train_loss": -42.02953338623047, "global_step": 163893, "epoch": 1354} {"train_loss": -41.633705139160156, "global_step": 163894, "epoch": 1354} {"train_loss": -41.90389633178711, "global_step": 163895, "epoch": 1354} {"train_loss": -41.33282470703125, "global_step": 163896, "epoch": 1354} {"train_loss": -41.85732650756836, "global_step": 163897, "epoch": 1354} {"train_loss": -42.01472473144531, "global_step": 163898, "epoch": 1354} {"train_loss": -42.474674224853516, "global_step": 163899, "epoch": 1354} {"train_loss": -41.79459762573242, "global_step": 163900, "epoch": 1354} {"train_loss": -42.02677536010742, "global_step": 163901, "epoch": 1354} {"train_loss": -41.52021408081055, "global_step": 163902, "epoch": 1354} {"train_loss": -42.27572250366211, "global_step": 163903, "epoch": 1354} {"train_loss": -41.687557220458984, "global_step": 163904, "epoch": 1354} {"train_loss": -41.7611198425293, "global_step": 163905, "epoch": 1354} {"train_loss": -41.905391693115234, "global_step": 163906, "epoch": 1354} {"train_loss": -41.378822326660156, "global_step": 163907, "epoch": 1354} {"train_loss": -39.440853118896484, "global_step": 163908, "epoch": 1354} {"train_loss": -40.530311584472656, "global_step": 163909, "epoch": 1354} {"train_loss": -41.35332107543945, "global_step": 163910, "epoch": 1354} {"train_loss": -38.81111526489258, "global_step": 163911, "epoch": 1354} {"train_loss": -39.91401672363281, "global_step": 163912, "epoch": 1354} {"train_loss": -38.28752517700195, "global_step": 163913, "epoch": 1354} {"train_loss": -37.129417419433594, "global_step": 163914, "epoch": 1354} {"train_loss": -37.8121223449707, "global_step": 163915, "epoch": 1354} {"train_loss": -27.830774307250977, "global_step": 163916, "epoch": 1354} {"train_loss": -39.86652755737305, "global_step": 163917, "epoch": 1354} {"train_loss": -32.12893295288086, "global_step": 163918, "epoch": 1354} {"train_loss": -39.403873443603516, "global_step": 163919, "epoch": 1354} {"train_loss": -37.76612091064453, "global_step": 163920, "epoch": 1354} {"train_loss": -33.4414176940918, "global_step": 163921, "epoch": 1354} {"train_loss": -41.06539535522461, "global_step": 163922, "epoch": 1354} {"train_loss": -35.32176208496094, "global_step": 163923, "epoch": 1354} {"train_loss": -37.37801742553711, "global_step": 163924, "epoch": 1354} {"train_loss": -41.20820236206055, "global_step": 163925, "epoch": 1354} {"train_loss": -37.361751556396484, "global_step": 163926, "epoch": 1354} {"train_loss": -36.368221282958984, "global_step": 163927, "epoch": 1354} {"train_loss": -40.19890213012695, "global_step": 163928, "epoch": 1354} {"train_loss": -38.80183410644531, "global_step": 163929, "epoch": 1354} {"train_loss": -37.788063049316406, "global_step": 163930, "epoch": 1354} {"train_loss": -40.768096923828125, "global_step": 163931, "epoch": 1354} {"train_loss": -39.267452239990234, "global_step": 163932, "epoch": 1354} {"train_loss": -40.64145278930664, "global_step": 163933, "epoch": 1354} {"train_loss": -38.6953125, "global_step": 163934, "epoch": 1354} {"train_loss": -39.266231536865234, "global_step": 163935, "epoch": 1354} {"train_loss": -40.839927673339844, "global_step": 163936, "epoch": 1354} {"train_loss": -39.329036712646484, "global_step": 163937, "epoch": 1354} {"train_loss": -40.4337043762207, "global_step": 163938, "epoch": 1354} {"train_loss": -38.158546447753906, "global_step": 163939, "epoch": 1354} {"train_loss": -41.021400451660156, "global_step": 163940, "epoch": 1354} {"train_loss": -41.15909957885742, "global_step": 163941, "epoch": 1354} {"train_loss": -39.89231491088867, "global_step": 163942, "epoch": 1354} {"train_loss": -40.52532196044922, "global_step": 163943, "epoch": 1354} {"train_loss": -40.40168762207031, "global_step": 163944, "epoch": 1354} {"train_loss": -41.62094497680664, "global_step": 163945, "epoch": 1354} {"train_loss": -40.907936096191406, "global_step": 163946, "epoch": 1354} {"train_loss": -41.02773666381836, "global_step": 163947, "epoch": 1354} {"train_loss": -41.14767074584961, "global_step": 163948, "epoch": 1354} {"train_loss": -41.60749435424805, "global_step": 163949, "epoch": 1354} {"train_loss": -41.13999557495117, "global_step": 163950, "epoch": 1354} {"train_loss": -41.1757698059082, "global_step": 163951, "epoch": 1354} {"train_loss": -41.18740463256836, "global_step": 163952, "epoch": 1354} {"train_loss": -40.72957992553711, "global_step": 163953, "epoch": 1354} {"train_loss": -40.29538498240069, "global_step": 163954, "epoch": 1354, "val_loss": 2456200.5} {"train_loss": -40.930294036865234, "global_step": 163955, "epoch": 1355} {"train_loss": -40.98427963256836, "global_step": 163956, "epoch": 1355} {"train_loss": -41.70901107788086, "global_step": 163957, "epoch": 1355} {"train_loss": -41.22426986694336, "global_step": 163958, "epoch": 1355} {"train_loss": -41.60382843017578, "global_step": 163959, "epoch": 1355} {"train_loss": -41.207366943359375, "global_step": 163960, "epoch": 1355} {"train_loss": -41.41486740112305, "global_step": 163961, "epoch": 1355} {"train_loss": -41.076271057128906, "global_step": 163962, "epoch": 1355} {"train_loss": -41.18685531616211, "global_step": 163963, "epoch": 1355} {"train_loss": -40.71090316772461, "global_step": 163964, "epoch": 1355} {"train_loss": -41.74001693725586, "global_step": 163965, "epoch": 1355} {"train_loss": -40.94001388549805, "global_step": 163966, "epoch": 1355} {"train_loss": -41.5130615234375, "global_step": 163967, "epoch": 1355} {"train_loss": -41.916412353515625, "global_step": 163968, "epoch": 1355} {"train_loss": -40.87423324584961, "global_step": 163969, "epoch": 1355} {"train_loss": -39.96077346801758, "global_step": 163970, "epoch": 1355} {"train_loss": -40.09712600708008, "global_step": 163971, "epoch": 1355} {"train_loss": -40.0048828125, "global_step": 163972, "epoch": 1355} {"train_loss": -40.721580505371094, "global_step": 163973, "epoch": 1355} {"train_loss": -42.02323532104492, "global_step": 163974, "epoch": 1355} {"train_loss": -41.79903030395508, "global_step": 163975, "epoch": 1355} {"train_loss": -41.5965576171875, "global_step": 163976, "epoch": 1355} {"train_loss": -42.18781661987305, "global_step": 163977, "epoch": 1355} {"train_loss": -41.903804779052734, "global_step": 163978, "epoch": 1355} {"train_loss": -42.3729133605957, "global_step": 163979, "epoch": 1355} {"train_loss": -41.888771057128906, "global_step": 163980, "epoch": 1355} {"train_loss": -42.037071228027344, "global_step": 163981, "epoch": 1355} {"train_loss": -41.77265548706055, "global_step": 163982, "epoch": 1355} {"train_loss": -41.999881744384766, "global_step": 163983, "epoch": 1355} {"train_loss": -42.47483825683594, "global_step": 163984, "epoch": 1355} {"train_loss": -41.82314682006836, "global_step": 163985, "epoch": 1355} {"train_loss": -41.431640625, "global_step": 163986, "epoch": 1355} {"train_loss": -42.180233001708984, "global_step": 163987, "epoch": 1355} {"train_loss": -41.9393196105957, "global_step": 163988, "epoch": 1355} {"train_loss": -42.02481460571289, "global_step": 163989, "epoch": 1355} {"train_loss": -42.16415023803711, "global_step": 163990, "epoch": 1355} {"train_loss": -42.402034759521484, "global_step": 163991, "epoch": 1355} {"train_loss": -42.34089660644531, "global_step": 163992, "epoch": 1355} {"train_loss": -40.19377899169922, "global_step": 163993, "epoch": 1355} {"train_loss": -39.683631896972656, "global_step": 163994, "epoch": 1355} {"train_loss": -41.59182357788086, "global_step": 163995, "epoch": 1355} {"train_loss": -41.961856842041016, "global_step": 163996, "epoch": 1355} {"train_loss": -41.1283073425293, "global_step": 163997, "epoch": 1355} {"train_loss": -40.68843460083008, "global_step": 163998, "epoch": 1355} {"train_loss": -40.21809768676758, "global_step": 163999, "epoch": 1355} {"train_loss": -39.10331726074219, "global_step": 164000, "epoch": 1355} {"train_loss": -37.18073272705078, "global_step": 164001, "epoch": 1355} {"train_loss": -38.19855880737305, "global_step": 164002, "epoch": 1355} {"train_loss": -37.1218147277832, "global_step": 164003, "epoch": 1355} {"train_loss": -38.62873458862305, "global_step": 164004, "epoch": 1355} {"train_loss": -40.95602035522461, "global_step": 164005, "epoch": 1355} {"train_loss": -41.66748809814453, "global_step": 164006, "epoch": 1355} {"train_loss": -40.497928619384766, "global_step": 164007, "epoch": 1355} {"train_loss": -39.302799224853516, "global_step": 164008, "epoch": 1355} {"train_loss": -40.10541534423828, "global_step": 164009, "epoch": 1355} {"train_loss": -41.10567092895508, "global_step": 164010, "epoch": 1355} {"train_loss": -40.23215866088867, "global_step": 164011, "epoch": 1355} {"train_loss": -38.4586296081543, "global_step": 164012, "epoch": 1355} {"train_loss": -39.69663619995117, "global_step": 164013, "epoch": 1355} {"train_loss": -41.2515983581543, "global_step": 164014, "epoch": 1355} {"train_loss": -39.82461166381836, "global_step": 164015, "epoch": 1355} {"train_loss": -37.00003433227539, "global_step": 164016, "epoch": 1355} {"train_loss": -39.24906921386719, "global_step": 164017, "epoch": 1355} {"train_loss": -41.03729248046875, "global_step": 164018, "epoch": 1355} {"train_loss": -35.276100158691406, "global_step": 164019, "epoch": 1355} {"train_loss": -41.10422897338867, "global_step": 164020, "epoch": 1355} {"train_loss": -39.6300163269043, "global_step": 164021, "epoch": 1355} {"train_loss": -38.51484298706055, "global_step": 164022, "epoch": 1355} {"train_loss": -41.62223434448242, "global_step": 164023, "epoch": 1355} {"train_loss": -38.80524444580078, "global_step": 164024, "epoch": 1355} {"train_loss": -40.10756301879883, "global_step": 164025, "epoch": 1355} {"train_loss": -40.98112869262695, "global_step": 164026, "epoch": 1355} {"train_loss": -39.6695671081543, "global_step": 164027, "epoch": 1355} {"train_loss": -40.58112716674805, "global_step": 164028, "epoch": 1355} {"train_loss": -40.08555221557617, "global_step": 164029, "epoch": 1355} {"train_loss": -41.32540512084961, "global_step": 164030, "epoch": 1355} {"train_loss": -40.593299865722656, "global_step": 164031, "epoch": 1355} {"train_loss": -41.56611251831055, "global_step": 164032, "epoch": 1355} {"train_loss": -40.54783248901367, "global_step": 164033, "epoch": 1355} {"train_loss": -41.61970138549805, "global_step": 164034, "epoch": 1355} {"train_loss": -41.257118225097656, "global_step": 164035, "epoch": 1355} {"train_loss": -40.843650817871094, "global_step": 164036, "epoch": 1355} {"train_loss": -40.83844757080078, "global_step": 164037, "epoch": 1355} {"train_loss": -40.46185302734375, "global_step": 164038, "epoch": 1355} {"train_loss": -41.32509994506836, "global_step": 164039, "epoch": 1355} {"train_loss": -40.867061614990234, "global_step": 164040, "epoch": 1355} {"train_loss": -41.86437225341797, "global_step": 164041, "epoch": 1355} {"train_loss": -40.41569137573242, "global_step": 164042, "epoch": 1355} {"train_loss": -41.77571105957031, "global_step": 164043, "epoch": 1355} {"train_loss": -41.098602294921875, "global_step": 164044, "epoch": 1355} {"train_loss": -41.77578353881836, "global_step": 164045, "epoch": 1355} {"train_loss": -41.6876335144043, "global_step": 164046, "epoch": 1355} {"train_loss": -41.49729537963867, "global_step": 164047, "epoch": 1355} {"train_loss": -39.642547607421875, "global_step": 164048, "epoch": 1355} {"train_loss": -39.18377685546875, "global_step": 164049, "epoch": 1355} {"train_loss": -38.367733001708984, "global_step": 164050, "epoch": 1355} {"train_loss": -35.83015823364258, "global_step": 164051, "epoch": 1355} {"train_loss": -31.4344482421875, "global_step": 164052, "epoch": 1355} {"train_loss": -34.88692092895508, "global_step": 164053, "epoch": 1355} {"train_loss": -3.3803048133850098, "global_step": 164054, "epoch": 1355} {"train_loss": -30.882526397705078, "global_step": 164055, "epoch": 1355} {"train_loss": -33.69098663330078, "global_step": 164056, "epoch": 1355} {"train_loss": -32.1326789855957, "global_step": 164057, "epoch": 1355} {"train_loss": -31.91505241394043, "global_step": 164058, "epoch": 1355} {"train_loss": -32.798500061035156, "global_step": 164059, "epoch": 1355} {"train_loss": -35.743141174316406, "global_step": 164060, "epoch": 1355} {"train_loss": -35.185184478759766, "global_step": 164061, "epoch": 1355} {"train_loss": -38.506507873535156, "global_step": 164062, "epoch": 1355} {"train_loss": -37.60138702392578, "global_step": 164063, "epoch": 1355} {"train_loss": -38.503021240234375, "global_step": 164064, "epoch": 1355} {"train_loss": -36.66702651977539, "global_step": 164065, "epoch": 1355} {"train_loss": -37.7772331237793, "global_step": 164066, "epoch": 1355} {"train_loss": -36.38917922973633, "global_step": 164067, "epoch": 1355} {"train_loss": -38.50230026245117, "global_step": 164068, "epoch": 1355} {"train_loss": -38.2326774597168, "global_step": 164069, "epoch": 1355} {"train_loss": -38.38344955444336, "global_step": 164070, "epoch": 1355} {"train_loss": -39.39547348022461, "global_step": 164071, "epoch": 1355} {"train_loss": -38.15985107421875, "global_step": 164072, "epoch": 1355} {"train_loss": -38.6319694519043, "global_step": 164073, "epoch": 1355} {"train_loss": -38.5438232421875, "global_step": 164074, "epoch": 1355} {"train_loss": -39.517819400661246, "global_step": 164075, "epoch": 1355, "val_loss": 2516512.0} {"train_loss": -39.73076248168945, "global_step": 164076, "epoch": 1356} {"train_loss": -39.39911651611328, "global_step": 164077, "epoch": 1356} {"train_loss": -39.87419891357422, "global_step": 164078, "epoch": 1356} {"train_loss": -39.30074691772461, "global_step": 164079, "epoch": 1356} {"train_loss": -40.318580627441406, "global_step": 164080, "epoch": 1356} {"train_loss": -39.5911979675293, "global_step": 164081, "epoch": 1356} {"train_loss": -39.981624603271484, "global_step": 164082, "epoch": 1356} {"train_loss": -40.18787384033203, "global_step": 164083, "epoch": 1356} {"train_loss": -40.40485763549805, "global_step": 164084, "epoch": 1356} {"train_loss": -40.546634674072266, "global_step": 164085, "epoch": 1356} {"train_loss": -40.65375900268555, "global_step": 164086, "epoch": 1356} {"train_loss": -39.8326530456543, "global_step": 164087, "epoch": 1356} {"train_loss": -40.2744026184082, "global_step": 164088, "epoch": 1356} {"train_loss": -40.30982971191406, "global_step": 164089, "epoch": 1356} {"train_loss": -40.661766052246094, "global_step": 164090, "epoch": 1356} {"train_loss": -41.010955810546875, "global_step": 164091, "epoch": 1356} {"train_loss": -40.97588348388672, "global_step": 164092, "epoch": 1356} {"train_loss": -40.52753829956055, "global_step": 164093, "epoch": 1356} {"train_loss": -40.73041915893555, "global_step": 164094, "epoch": 1356} {"train_loss": -40.94166946411133, "global_step": 164095, "epoch": 1356} {"train_loss": -40.66042709350586, "global_step": 164096, "epoch": 1356} {"train_loss": -41.12112808227539, "global_step": 164097, "epoch": 1356} {"train_loss": -40.99188232421875, "global_step": 164098, "epoch": 1356} {"train_loss": -41.05672836303711, "global_step": 164099, "epoch": 1356} {"train_loss": -41.09728240966797, "global_step": 164100, "epoch": 1356} {"train_loss": -41.363773345947266, "global_step": 164101, "epoch": 1356} {"train_loss": -41.41515350341797, "global_step": 164102, "epoch": 1356} {"train_loss": -41.421871185302734, "global_step": 164103, "epoch": 1356} {"train_loss": -40.90052032470703, "global_step": 164104, "epoch": 1356} {"train_loss": -41.421817779541016, "global_step": 164105, "epoch": 1356} {"train_loss": -41.52061080932617, "global_step": 164106, "epoch": 1356} {"train_loss": -41.08321762084961, "global_step": 164107, "epoch": 1356} {"train_loss": -41.1092414855957, "global_step": 164108, "epoch": 1356} {"train_loss": -41.7492561340332, "global_step": 164109, "epoch": 1356} {"train_loss": -41.11839294433594, "global_step": 164110, "epoch": 1356} {"train_loss": -41.8805046081543, "global_step": 164111, "epoch": 1356} {"train_loss": -41.24711227416992, "global_step": 164112, "epoch": 1356} {"train_loss": -41.26116943359375, "global_step": 164113, "epoch": 1356} {"train_loss": -41.592308044433594, "global_step": 164114, "epoch": 1356} {"train_loss": -41.72272491455078, "global_step": 164115, "epoch": 1356} {"train_loss": -41.45989990234375, "global_step": 164116, "epoch": 1356} {"train_loss": -41.712303161621094, "global_step": 164117, "epoch": 1356} {"train_loss": -41.74595260620117, "global_step": 164118, "epoch": 1356} {"train_loss": -42.029518127441406, "global_step": 164119, "epoch": 1356} {"train_loss": -41.385597229003906, "global_step": 164120, "epoch": 1356} {"train_loss": -42.081520080566406, "global_step": 164121, "epoch": 1356} {"train_loss": -41.76740264892578, "global_step": 164122, "epoch": 1356} {"train_loss": -41.770355224609375, "global_step": 164123, "epoch": 1356} {"train_loss": -42.39287185668945, "global_step": 164124, "epoch": 1356} {"train_loss": -42.2001838684082, "global_step": 164125, "epoch": 1356} {"train_loss": -42.103694915771484, "global_step": 164126, "epoch": 1356} {"train_loss": -42.258453369140625, "global_step": 164127, "epoch": 1356} {"train_loss": -41.861026763916016, "global_step": 164128, "epoch": 1356} {"train_loss": -41.97719955444336, "global_step": 164129, "epoch": 1356} {"train_loss": -42.32960891723633, "global_step": 164130, "epoch": 1356} {"train_loss": -42.172603607177734, "global_step": 164131, "epoch": 1356} {"train_loss": -42.389076232910156, "global_step": 164132, "epoch": 1356} {"train_loss": -42.47780990600586, "global_step": 164133, "epoch": 1356} {"train_loss": -41.96015167236328, "global_step": 164134, "epoch": 1356} {"train_loss": -42.450252532958984, "global_step": 164135, "epoch": 1356} {"train_loss": -42.34259796142578, "global_step": 164136, "epoch": 1356} {"train_loss": -42.5109748840332, "global_step": 164137, "epoch": 1356} {"train_loss": -41.846649169921875, "global_step": 164138, "epoch": 1356} {"train_loss": -42.33188247680664, "global_step": 164139, "epoch": 1356} {"train_loss": -42.49704360961914, "global_step": 164140, "epoch": 1356} {"train_loss": -42.509578704833984, "global_step": 164141, "epoch": 1356} {"train_loss": -42.44533920288086, "global_step": 164142, "epoch": 1356} {"train_loss": -42.156612396240234, "global_step": 164143, "epoch": 1356} {"train_loss": -42.18840408325195, "global_step": 164144, "epoch": 1356} {"train_loss": -42.1413688659668, "global_step": 164145, "epoch": 1356} {"train_loss": -41.953704833984375, "global_step": 164146, "epoch": 1356} {"train_loss": -41.75468063354492, "global_step": 164147, "epoch": 1356} {"train_loss": -42.6133918762207, "global_step": 164148, "epoch": 1356} {"train_loss": -41.61286544799805, "global_step": 164149, "epoch": 1356} {"train_loss": -39.4484748840332, "global_step": 164150, "epoch": 1356} {"train_loss": -38.055965423583984, "global_step": 164151, "epoch": 1356} {"train_loss": -39.51555252075195, "global_step": 164152, "epoch": 1356} {"train_loss": -40.49334716796875, "global_step": 164153, "epoch": 1356} {"train_loss": -38.266639709472656, "global_step": 164154, "epoch": 1356} {"train_loss": -39.12063217163086, "global_step": 164155, "epoch": 1356} {"train_loss": -39.77535629272461, "global_step": 164156, "epoch": 1356} {"train_loss": -35.96125411987305, "global_step": 164157, "epoch": 1356} {"train_loss": -34.01986312866211, "global_step": 164158, "epoch": 1356} {"train_loss": -32.673118591308594, "global_step": 164159, "epoch": 1356} {"train_loss": -35.059715270996094, "global_step": 164160, "epoch": 1356} {"train_loss": -34.652366638183594, "global_step": 164161, "epoch": 1356} {"train_loss": -36.35023880004883, "global_step": 164162, "epoch": 1356} {"train_loss": -35.995479583740234, "global_step": 164163, "epoch": 1356} {"train_loss": -35.4441032409668, "global_step": 164164, "epoch": 1356} {"train_loss": -39.841678619384766, "global_step": 164165, "epoch": 1356} {"train_loss": -36.69862747192383, "global_step": 164166, "epoch": 1356} {"train_loss": -38.7407341003418, "global_step": 164167, "epoch": 1356} {"train_loss": -37.868560791015625, "global_step": 164168, "epoch": 1356} {"train_loss": -37.40388107299805, "global_step": 164169, "epoch": 1356} {"train_loss": -39.88074493408203, "global_step": 164170, "epoch": 1356} {"train_loss": -38.635841369628906, "global_step": 164171, "epoch": 1356} {"train_loss": -40.07716751098633, "global_step": 164172, "epoch": 1356} {"train_loss": -39.45180130004883, "global_step": 164173, "epoch": 1356} {"train_loss": -37.903663635253906, "global_step": 164174, "epoch": 1356} {"train_loss": -41.070064544677734, "global_step": 164175, "epoch": 1356} {"train_loss": -38.69016647338867, "global_step": 164176, "epoch": 1356} {"train_loss": -39.61861038208008, "global_step": 164177, "epoch": 1356} {"train_loss": -40.120914459228516, "global_step": 164178, "epoch": 1356} {"train_loss": -40.41061019897461, "global_step": 164179, "epoch": 1356} {"train_loss": -39.777706146240234, "global_step": 164180, "epoch": 1356} {"train_loss": -40.14042282104492, "global_step": 164181, "epoch": 1356} {"train_loss": -40.99044418334961, "global_step": 164182, "epoch": 1356} {"train_loss": -39.847900390625, "global_step": 164183, "epoch": 1356} {"train_loss": -41.00522994995117, "global_step": 164184, "epoch": 1356} {"train_loss": -40.6909294128418, "global_step": 164185, "epoch": 1356} {"train_loss": -40.89260482788086, "global_step": 164186, "epoch": 1356} {"train_loss": -41.202877044677734, "global_step": 164187, "epoch": 1356} {"train_loss": -41.30678176879883, "global_step": 164188, "epoch": 1356} {"train_loss": -40.93632888793945, "global_step": 164189, "epoch": 1356} {"train_loss": -41.45576095581055, "global_step": 164190, "epoch": 1356} {"train_loss": -41.073055267333984, "global_step": 164191, "epoch": 1356} {"train_loss": -41.512725830078125, "global_step": 164192, "epoch": 1356} {"train_loss": -40.75269317626953, "global_step": 164193, "epoch": 1356} {"train_loss": -40.72878646850586, "global_step": 164194, "epoch": 1356} {"train_loss": -40.75349807739258, "global_step": 164195, "epoch": 1356} {"train_loss": -40.47584653491816, "global_step": 164196, "epoch": 1356, "val_loss": 2626063.75} {"train_loss": -41.0003662109375, "global_step": 164197, "epoch": 1357} {"train_loss": -41.24346160888672, "global_step": 164198, "epoch": 1357} {"train_loss": -41.0758171081543, "global_step": 164199, "epoch": 1357} {"train_loss": -41.84217071533203, "global_step": 164200, "epoch": 1357} {"train_loss": -41.0542106628418, "global_step": 164201, "epoch": 1357} {"train_loss": -41.54618835449219, "global_step": 164202, "epoch": 1357} {"train_loss": -41.679080963134766, "global_step": 164203, "epoch": 1357} {"train_loss": -41.2576789855957, "global_step": 164204, "epoch": 1357} {"train_loss": -41.710548400878906, "global_step": 164205, "epoch": 1357} {"train_loss": -41.608272552490234, "global_step": 164206, "epoch": 1357} {"train_loss": -41.40092086791992, "global_step": 164207, "epoch": 1357} {"train_loss": -42.00026321411133, "global_step": 164208, "epoch": 1357} {"train_loss": -41.943477630615234, "global_step": 164209, "epoch": 1357} {"train_loss": -41.87101364135742, "global_step": 164210, "epoch": 1357} {"train_loss": -40.52094650268555, "global_step": 164211, "epoch": 1357} {"train_loss": -42.13288497924805, "global_step": 164212, "epoch": 1357} {"train_loss": -41.789512634277344, "global_step": 164213, "epoch": 1357} {"train_loss": -41.899166107177734, "global_step": 164214, "epoch": 1357} {"train_loss": -42.1132926940918, "global_step": 164215, "epoch": 1357} {"train_loss": -41.734432220458984, "global_step": 164216, "epoch": 1357} {"train_loss": -42.094940185546875, "global_step": 164217, "epoch": 1357} {"train_loss": -42.30179977416992, "global_step": 164218, "epoch": 1357} {"train_loss": -42.08589553833008, "global_step": 164219, "epoch": 1357} {"train_loss": -42.474578857421875, "global_step": 164220, "epoch": 1357} {"train_loss": -42.25311279296875, "global_step": 164221, "epoch": 1357} {"train_loss": -41.94948196411133, "global_step": 164222, "epoch": 1357} {"train_loss": -41.67692947387695, "global_step": 164223, "epoch": 1357} {"train_loss": -41.06922149658203, "global_step": 164224, "epoch": 1357} {"train_loss": -42.42281723022461, "global_step": 164225, "epoch": 1357} {"train_loss": -41.86772537231445, "global_step": 164226, "epoch": 1357} {"train_loss": -41.2192268371582, "global_step": 164227, "epoch": 1357} {"train_loss": -41.826087951660156, "global_step": 164228, "epoch": 1357} {"train_loss": -41.7105827331543, "global_step": 164229, "epoch": 1357} {"train_loss": -42.2249755859375, "global_step": 164230, "epoch": 1357} {"train_loss": -42.42481231689453, "global_step": 164231, "epoch": 1357} {"train_loss": -41.64204788208008, "global_step": 164232, "epoch": 1357} {"train_loss": -42.23167037963867, "global_step": 164233, "epoch": 1357} {"train_loss": -41.693050384521484, "global_step": 164234, "epoch": 1357} {"train_loss": -41.20319747924805, "global_step": 164235, "epoch": 1357} {"train_loss": -41.8983268737793, "global_step": 164236, "epoch": 1357} {"train_loss": -41.77485656738281, "global_step": 164237, "epoch": 1357} {"train_loss": -42.01852798461914, "global_step": 164238, "epoch": 1357} {"train_loss": -41.619564056396484, "global_step": 164239, "epoch": 1357} {"train_loss": -41.42041015625, "global_step": 164240, "epoch": 1357} {"train_loss": -41.820919036865234, "global_step": 164241, "epoch": 1357} {"train_loss": -41.68839645385742, "global_step": 164242, "epoch": 1357} {"train_loss": -42.2326545715332, "global_step": 164243, "epoch": 1357} {"train_loss": -41.91246032714844, "global_step": 164244, "epoch": 1357} {"train_loss": -41.498504638671875, "global_step": 164245, "epoch": 1357} {"train_loss": -42.065975189208984, "global_step": 164246, "epoch": 1357} {"train_loss": -42.21901321411133, "global_step": 164247, "epoch": 1357} {"train_loss": -42.305294036865234, "global_step": 164248, "epoch": 1357} {"train_loss": -42.215179443359375, "global_step": 164249, "epoch": 1357} {"train_loss": -41.85701370239258, "global_step": 164250, "epoch": 1357} {"train_loss": -42.54305648803711, "global_step": 164251, "epoch": 1357} {"train_loss": -41.41333770751953, "global_step": 164252, "epoch": 1357} {"train_loss": -42.275726318359375, "global_step": 164253, "epoch": 1357} {"train_loss": -42.0262451171875, "global_step": 164254, "epoch": 1357} {"train_loss": -41.434730529785156, "global_step": 164255, "epoch": 1357} {"train_loss": -42.14229202270508, "global_step": 164256, "epoch": 1357} {"train_loss": -42.705047607421875, "global_step": 164257, "epoch": 1357} {"train_loss": -41.95376205444336, "global_step": 164258, "epoch": 1357} {"train_loss": -41.945743560791016, "global_step": 164259, "epoch": 1357} {"train_loss": -41.250091552734375, "global_step": 164260, "epoch": 1357} {"train_loss": -41.68477249145508, "global_step": 164261, "epoch": 1357} {"train_loss": -39.087642669677734, "global_step": 164262, "epoch": 1357} {"train_loss": -38.1775016784668, "global_step": 164263, "epoch": 1357} {"train_loss": -36.490020751953125, "global_step": 164264, "epoch": 1357} {"train_loss": -33.118099212646484, "global_step": 164265, "epoch": 1357} {"train_loss": -36.9354248046875, "global_step": 164266, "epoch": 1357} {"train_loss": -36.118648529052734, "global_step": 164267, "epoch": 1357} {"train_loss": -39.1793327331543, "global_step": 164268, "epoch": 1357} {"train_loss": -38.78913497924805, "global_step": 164269, "epoch": 1357} {"train_loss": -35.94974899291992, "global_step": 164270, "epoch": 1357} {"train_loss": -34.72874069213867, "global_step": 164271, "epoch": 1357} {"train_loss": -39.88689422607422, "global_step": 164272, "epoch": 1357} {"train_loss": -32.18215560913086, "global_step": 164273, "epoch": 1357} {"train_loss": -39.82763671875, "global_step": 164274, "epoch": 1357} {"train_loss": -36.44502639770508, "global_step": 164275, "epoch": 1357} {"train_loss": -37.505096435546875, "global_step": 164276, "epoch": 1357} {"train_loss": -40.18098068237305, "global_step": 164277, "epoch": 1357} {"train_loss": -38.192237854003906, "global_step": 164278, "epoch": 1357} {"train_loss": -40.576656341552734, "global_step": 164279, "epoch": 1357} {"train_loss": -37.78380584716797, "global_step": 164280, "epoch": 1357} {"train_loss": -40.36143112182617, "global_step": 164281, "epoch": 1357} {"train_loss": -40.19054412841797, "global_step": 164282, "epoch": 1357} {"train_loss": -39.920997619628906, "global_step": 164283, "epoch": 1357} {"train_loss": -40.334102630615234, "global_step": 164284, "epoch": 1357} {"train_loss": -39.61784362792969, "global_step": 164285, "epoch": 1357} {"train_loss": -40.418983459472656, "global_step": 164286, "epoch": 1357} {"train_loss": -39.77350616455078, "global_step": 164287, "epoch": 1357} {"train_loss": -41.09023666381836, "global_step": 164288, "epoch": 1357} {"train_loss": -40.637908935546875, "global_step": 164289, "epoch": 1357} {"train_loss": -40.806217193603516, "global_step": 164290, "epoch": 1357} {"train_loss": -40.00019454956055, "global_step": 164291, "epoch": 1357} {"train_loss": -40.365753173828125, "global_step": 164292, "epoch": 1357} {"train_loss": -41.1953239440918, "global_step": 164293, "epoch": 1357} {"train_loss": -39.76206588745117, "global_step": 164294, "epoch": 1357} {"train_loss": -40.769935607910156, "global_step": 164295, "epoch": 1357} {"train_loss": -40.54937744140625, "global_step": 164296, "epoch": 1357} {"train_loss": -39.439388275146484, "global_step": 164297, "epoch": 1357} {"train_loss": -40.63262176513672, "global_step": 164298, "epoch": 1357} {"train_loss": -41.090389251708984, "global_step": 164299, "epoch": 1357} {"train_loss": -39.48597717285156, "global_step": 164300, "epoch": 1357} {"train_loss": -41.6017951965332, "global_step": 164301, "epoch": 1357} {"train_loss": -39.87543869018555, "global_step": 164302, "epoch": 1357} {"train_loss": -40.56343078613281, "global_step": 164303, "epoch": 1357} {"train_loss": -40.48635482788086, "global_step": 164304, "epoch": 1357} {"train_loss": -40.2721061706543, "global_step": 164305, "epoch": 1357} {"train_loss": -40.81808853149414, "global_step": 164306, "epoch": 1357} {"train_loss": -40.72395324707031, "global_step": 164307, "epoch": 1357} {"train_loss": -41.04750442504883, "global_step": 164308, "epoch": 1357} {"train_loss": -40.76670455932617, "global_step": 164309, "epoch": 1357} {"train_loss": -40.777259826660156, "global_step": 164310, "epoch": 1357} {"train_loss": -40.94826126098633, "global_step": 164311, "epoch": 1357} {"train_loss": -41.084529876708984, "global_step": 164312, "epoch": 1357} {"train_loss": -41.612648010253906, "global_step": 164313, "epoch": 1357} {"train_loss": -41.66791915893555, "global_step": 164314, "epoch": 1357} {"train_loss": -40.910247802734375, "global_step": 164315, "epoch": 1357} {"train_loss": -42.00896072387695, "global_step": 164316, "epoch": 1357} {"train_loss": -40.75818744375686, "global_step": 164317, "epoch": 1357, "val_loss": 2573258.25} {"train_loss": -41.2000846862793, "global_step": 164318, "epoch": 1358} {"train_loss": -41.59739303588867, "global_step": 164319, "epoch": 1358} {"train_loss": -41.25593566894531, "global_step": 164320, "epoch": 1358} {"train_loss": -41.3131103515625, "global_step": 164321, "epoch": 1358} {"train_loss": -42.154117584228516, "global_step": 164322, "epoch": 1358} {"train_loss": -41.15373611450195, "global_step": 164323, "epoch": 1358} {"train_loss": -41.73675537109375, "global_step": 164324, "epoch": 1358} {"train_loss": -42.257110595703125, "global_step": 164325, "epoch": 1358} {"train_loss": -41.66278076171875, "global_step": 164326, "epoch": 1358} {"train_loss": -41.70305252075195, "global_step": 164327, "epoch": 1358} {"train_loss": -41.8328742980957, "global_step": 164328, "epoch": 1358} {"train_loss": -41.98358154296875, "global_step": 164329, "epoch": 1358} {"train_loss": -42.27961730957031, "global_step": 164330, "epoch": 1358} {"train_loss": -42.03628158569336, "global_step": 164331, "epoch": 1358} {"train_loss": -42.151893615722656, "global_step": 164332, "epoch": 1358} {"train_loss": -42.22079086303711, "global_step": 164333, "epoch": 1358} {"train_loss": -42.1434440612793, "global_step": 164334, "epoch": 1358} {"train_loss": -42.133148193359375, "global_step": 164335, "epoch": 1358} {"train_loss": -42.24093246459961, "global_step": 164336, "epoch": 1358} {"train_loss": -42.4853401184082, "global_step": 164337, "epoch": 1358} {"train_loss": -42.30283737182617, "global_step": 164338, "epoch": 1358} {"train_loss": -41.92826461791992, "global_step": 164339, "epoch": 1358} {"train_loss": -41.74751281738281, "global_step": 164340, "epoch": 1358} {"train_loss": -42.19857406616211, "global_step": 164341, "epoch": 1358} {"train_loss": -42.1898193359375, "global_step": 164342, "epoch": 1358} {"train_loss": -42.489192962646484, "global_step": 164343, "epoch": 1358} {"train_loss": -42.51488494873047, "global_step": 164344, "epoch": 1358} {"train_loss": -41.84882354736328, "global_step": 164345, "epoch": 1358} {"train_loss": -41.959163665771484, "global_step": 164346, "epoch": 1358} {"train_loss": -41.86067581176758, "global_step": 164347, "epoch": 1358} {"train_loss": -41.61565017700195, "global_step": 164348, "epoch": 1358} {"train_loss": -42.62249755859375, "global_step": 164349, "epoch": 1358} {"train_loss": -42.55607604980469, "global_step": 164350, "epoch": 1358} {"train_loss": -42.35628890991211, "global_step": 164351, "epoch": 1358} {"train_loss": -42.44215774536133, "global_step": 164352, "epoch": 1358} {"train_loss": -42.520042419433594, "global_step": 164353, "epoch": 1358} {"train_loss": -42.71604537963867, "global_step": 164354, "epoch": 1358} {"train_loss": -41.96053695678711, "global_step": 164355, "epoch": 1358} {"train_loss": -41.60836410522461, "global_step": 164356, "epoch": 1358} {"train_loss": -42.025516510009766, "global_step": 164357, "epoch": 1358} {"train_loss": -41.90940856933594, "global_step": 164358, "epoch": 1358} {"train_loss": -41.45949172973633, "global_step": 164359, "epoch": 1358} {"train_loss": -39.55146408081055, "global_step": 164360, "epoch": 1358} {"train_loss": -39.09566879272461, "global_step": 164361, "epoch": 1358} {"train_loss": -38.824947357177734, "global_step": 164362, "epoch": 1358} {"train_loss": -40.339698791503906, "global_step": 164363, "epoch": 1358} {"train_loss": -41.56138229370117, "global_step": 164364, "epoch": 1358} {"train_loss": -41.9095344543457, "global_step": 164365, "epoch": 1358} {"train_loss": -42.20235061645508, "global_step": 164366, "epoch": 1358} {"train_loss": -42.040828704833984, "global_step": 164367, "epoch": 1358} {"train_loss": -41.07627487182617, "global_step": 164368, "epoch": 1358} {"train_loss": -41.36479187011719, "global_step": 164369, "epoch": 1358} {"train_loss": -41.75290298461914, "global_step": 164370, "epoch": 1358} {"train_loss": -41.28404235839844, "global_step": 164371, "epoch": 1358} {"train_loss": -37.87675094604492, "global_step": 164372, "epoch": 1358} {"train_loss": -38.120967864990234, "global_step": 164373, "epoch": 1358} {"train_loss": -41.216896057128906, "global_step": 164374, "epoch": 1358} {"train_loss": -42.1939697265625, "global_step": 164375, "epoch": 1358} {"train_loss": -39.223854064941406, "global_step": 164376, "epoch": 1358} {"train_loss": -38.05695724487305, "global_step": 164377, "epoch": 1358} {"train_loss": -39.89436721801758, "global_step": 164378, "epoch": 1358} {"train_loss": -41.96967315673828, "global_step": 164379, "epoch": 1358} {"train_loss": -40.59071350097656, "global_step": 164380, "epoch": 1358} {"train_loss": -39.00428009033203, "global_step": 164381, "epoch": 1358} {"train_loss": -39.32792282104492, "global_step": 164382, "epoch": 1358} {"train_loss": -41.584102630615234, "global_step": 164383, "epoch": 1358} {"train_loss": -39.824337005615234, "global_step": 164384, "epoch": 1358} {"train_loss": -40.652584075927734, "global_step": 164385, "epoch": 1358} {"train_loss": -41.27265167236328, "global_step": 164386, "epoch": 1358} {"train_loss": -40.69707489013672, "global_step": 164387, "epoch": 1358} {"train_loss": -40.728782653808594, "global_step": 164388, "epoch": 1358} {"train_loss": -40.14594268798828, "global_step": 164389, "epoch": 1358} {"train_loss": -38.63629150390625, "global_step": 164390, "epoch": 1358} {"train_loss": -40.5557746887207, "global_step": 164391, "epoch": 1358} {"train_loss": -39.45858383178711, "global_step": 164392, "epoch": 1358} {"train_loss": -39.55965805053711, "global_step": 164393, "epoch": 1358} {"train_loss": -40.49519348144531, "global_step": 164394, "epoch": 1358} {"train_loss": -38.509071350097656, "global_step": 164395, "epoch": 1358} {"train_loss": -36.10506820678711, "global_step": 164396, "epoch": 1358} {"train_loss": -38.2534065246582, "global_step": 164397, "epoch": 1358} {"train_loss": -38.26371383666992, "global_step": 164398, "epoch": 1358} {"train_loss": -37.3680534362793, "global_step": 164399, "epoch": 1358} {"train_loss": -38.16244125366211, "global_step": 164400, "epoch": 1358} {"train_loss": -38.77099609375, "global_step": 164401, "epoch": 1358} {"train_loss": -37.74445724487305, "global_step": 164402, "epoch": 1358} {"train_loss": -40.094478607177734, "global_step": 164403, "epoch": 1358} {"train_loss": -37.46924591064453, "global_step": 164404, "epoch": 1358} {"train_loss": -38.980995178222656, "global_step": 164405, "epoch": 1358} {"train_loss": -38.69013214111328, "global_step": 164406, "epoch": 1358} {"train_loss": -39.25458908081055, "global_step": 164407, "epoch": 1358} {"train_loss": -38.814659118652344, "global_step": 164408, "epoch": 1358} {"train_loss": -40.0448112487793, "global_step": 164409, "epoch": 1358} {"train_loss": -37.90462875366211, "global_step": 164410, "epoch": 1358} {"train_loss": -40.628597259521484, "global_step": 164411, "epoch": 1358} {"train_loss": -33.635013580322266, "global_step": 164412, "epoch": 1358} {"train_loss": -37.65178680419922, "global_step": 164413, "epoch": 1358} {"train_loss": -39.318878173828125, "global_step": 164414, "epoch": 1358} {"train_loss": -35.32723617553711, "global_step": 164415, "epoch": 1358} {"train_loss": -35.46348190307617, "global_step": 164416, "epoch": 1358} {"train_loss": -38.35004425048828, "global_step": 164417, "epoch": 1358} {"train_loss": -36.57518768310547, "global_step": 164418, "epoch": 1358} {"train_loss": -36.54780197143555, "global_step": 164419, "epoch": 1358} {"train_loss": -35.895790100097656, "global_step": 164420, "epoch": 1358} {"train_loss": -39.792606353759766, "global_step": 164421, "epoch": 1358} {"train_loss": -38.51970291137695, "global_step": 164422, "epoch": 1358} {"train_loss": -39.53190994262695, "global_step": 164423, "epoch": 1358} {"train_loss": -38.73980712890625, "global_step": 164424, "epoch": 1358} {"train_loss": -37.207576751708984, "global_step": 164425, "epoch": 1358} {"train_loss": -38.89994430541992, "global_step": 164426, "epoch": 1358} {"train_loss": -39.076412200927734, "global_step": 164427, "epoch": 1358} {"train_loss": -37.33850860595703, "global_step": 164428, "epoch": 1358} {"train_loss": -39.93455123901367, "global_step": 164429, "epoch": 1358} {"train_loss": -38.621856689453125, "global_step": 164430, "epoch": 1358} {"train_loss": -40.05775833129883, "global_step": 164431, "epoch": 1358} {"train_loss": -38.33647537231445, "global_step": 164432, "epoch": 1358} {"train_loss": -40.362335205078125, "global_step": 164433, "epoch": 1358} {"train_loss": -40.06735610961914, "global_step": 164434, "epoch": 1358} {"train_loss": -39.313228607177734, "global_step": 164435, "epoch": 1358} {"train_loss": -39.54807662963867, "global_step": 164436, "epoch": 1358} {"train_loss": -40.22237777709961, "global_step": 164437, "epoch": 1358} {"train_loss": -40.210510979013996, "global_step": 164438, "epoch": 1358, "val_loss": 2558463.25} {"train_loss": -40.73052978515625, "global_step": 164439, "epoch": 1359} {"train_loss": -40.22383117675781, "global_step": 164440, "epoch": 1359} {"train_loss": -39.732025146484375, "global_step": 164441, "epoch": 1359} {"train_loss": -39.828826904296875, "global_step": 164442, "epoch": 1359} {"train_loss": -40.325435638427734, "global_step": 164443, "epoch": 1359} {"train_loss": -40.47439956665039, "global_step": 164444, "epoch": 1359} {"train_loss": -40.8055305480957, "global_step": 164445, "epoch": 1359} {"train_loss": -40.6121711730957, "global_step": 164446, "epoch": 1359} {"train_loss": -41.02923583984375, "global_step": 164447, "epoch": 1359} {"train_loss": -40.541770935058594, "global_step": 164448, "epoch": 1359} {"train_loss": -41.004234313964844, "global_step": 164449, "epoch": 1359} {"train_loss": -40.81867599487305, "global_step": 164450, "epoch": 1359} {"train_loss": -40.846797943115234, "global_step": 164451, "epoch": 1359} {"train_loss": -40.791961669921875, "global_step": 164452, "epoch": 1359} {"train_loss": -40.149749755859375, "global_step": 164453, "epoch": 1359} {"train_loss": -40.17852783203125, "global_step": 164454, "epoch": 1359} {"train_loss": -41.04513168334961, "global_step": 164455, "epoch": 1359} {"train_loss": -41.51413345336914, "global_step": 164456, "epoch": 1359} {"train_loss": -40.4526481628418, "global_step": 164457, "epoch": 1359} {"train_loss": -41.71018600463867, "global_step": 164458, "epoch": 1359} {"train_loss": -41.44941329956055, "global_step": 164459, "epoch": 1359} {"train_loss": -41.4809455871582, "global_step": 164460, "epoch": 1359} {"train_loss": -41.18870162963867, "global_step": 164461, "epoch": 1359} {"train_loss": -41.41228485107422, "global_step": 164462, "epoch": 1359} {"train_loss": -41.3830680847168, "global_step": 164463, "epoch": 1359} {"train_loss": -41.2857666015625, "global_step": 164464, "epoch": 1359} {"train_loss": -41.68400192260742, "global_step": 164465, "epoch": 1359} {"train_loss": -41.31849670410156, "global_step": 164466, "epoch": 1359} {"train_loss": -41.64093780517578, "global_step": 164467, "epoch": 1359} {"train_loss": -41.59892654418945, "global_step": 164468, "epoch": 1359} {"train_loss": -41.53298568725586, "global_step": 164469, "epoch": 1359} {"train_loss": -41.024776458740234, "global_step": 164470, "epoch": 1359} {"train_loss": -41.260128021240234, "global_step": 164471, "epoch": 1359} {"train_loss": -41.73333740234375, "global_step": 164472, "epoch": 1359} {"train_loss": -41.73606491088867, "global_step": 164473, "epoch": 1359} {"train_loss": -41.79924392700195, "global_step": 164474, "epoch": 1359} {"train_loss": -41.23654556274414, "global_step": 164475, "epoch": 1359} {"train_loss": -41.91759490966797, "global_step": 164476, "epoch": 1359} {"train_loss": -42.25151062011719, "global_step": 164477, "epoch": 1359} {"train_loss": -41.45322036743164, "global_step": 164478, "epoch": 1359} {"train_loss": -41.408809661865234, "global_step": 164479, "epoch": 1359} {"train_loss": -41.88990783691406, "global_step": 164480, "epoch": 1359} {"train_loss": -41.57188034057617, "global_step": 164481, "epoch": 1359} {"train_loss": -41.8189582824707, "global_step": 164482, "epoch": 1359} {"train_loss": -41.05891418457031, "global_step": 164483, "epoch": 1359} {"train_loss": -42.14976119995117, "global_step": 164484, "epoch": 1359} {"train_loss": -40.91529083251953, "global_step": 164485, "epoch": 1359} {"train_loss": -42.27909469604492, "global_step": 164486, "epoch": 1359} {"train_loss": -41.839534759521484, "global_step": 164487, "epoch": 1359} {"train_loss": -42.1711540222168, "global_step": 164488, "epoch": 1359} {"train_loss": -41.50634765625, "global_step": 164489, "epoch": 1359} {"train_loss": -42.41523361206055, "global_step": 164490, "epoch": 1359} {"train_loss": -41.43899154663086, "global_step": 164491, "epoch": 1359} {"train_loss": -41.79798126220703, "global_step": 164492, "epoch": 1359} {"train_loss": -42.10001754760742, "global_step": 164493, "epoch": 1359} {"train_loss": -41.60248947143555, "global_step": 164494, "epoch": 1359} {"train_loss": -40.97638702392578, "global_step": 164495, "epoch": 1359} {"train_loss": -40.55065155029297, "global_step": 164496, "epoch": 1359} {"train_loss": -42.26975631713867, "global_step": 164497, "epoch": 1359} {"train_loss": -41.453651428222656, "global_step": 164498, "epoch": 1359} {"train_loss": -42.20698928833008, "global_step": 164499, "epoch": 1359} {"train_loss": -41.431365966796875, "global_step": 164500, "epoch": 1359} {"train_loss": -42.32744216918945, "global_step": 164501, "epoch": 1359} {"train_loss": -41.97382736206055, "global_step": 164502, "epoch": 1359} {"train_loss": -41.64455795288086, "global_step": 164503, "epoch": 1359} {"train_loss": -41.842037200927734, "global_step": 164504, "epoch": 1359} {"train_loss": -42.358917236328125, "global_step": 164505, "epoch": 1359} {"train_loss": -41.95510482788086, "global_step": 164506, "epoch": 1359} {"train_loss": -42.164546966552734, "global_step": 164507, "epoch": 1359} {"train_loss": -41.7659797668457, "global_step": 164508, "epoch": 1359} {"train_loss": -42.019012451171875, "global_step": 164509, "epoch": 1359} {"train_loss": -42.32412338256836, "global_step": 164510, "epoch": 1359} {"train_loss": -41.88596725463867, "global_step": 164511, "epoch": 1359} {"train_loss": -41.02118682861328, "global_step": 164512, "epoch": 1359} {"train_loss": -40.25965118408203, "global_step": 164513, "epoch": 1359} {"train_loss": -37.67637252807617, "global_step": 164514, "epoch": 1359} {"train_loss": -41.49116516113281, "global_step": 164515, "epoch": 1359} {"train_loss": -40.8355712890625, "global_step": 164516, "epoch": 1359} {"train_loss": -37.13112258911133, "global_step": 164517, "epoch": 1359} {"train_loss": -40.160682678222656, "global_step": 164518, "epoch": 1359} {"train_loss": -41.22509765625, "global_step": 164519, "epoch": 1359} {"train_loss": -41.70840835571289, "global_step": 164520, "epoch": 1359} {"train_loss": -39.774505615234375, "global_step": 164521, "epoch": 1359} {"train_loss": -37.09021759033203, "global_step": 164522, "epoch": 1359} {"train_loss": -39.79255294799805, "global_step": 164523, "epoch": 1359} {"train_loss": -37.685489654541016, "global_step": 164524, "epoch": 1359} {"train_loss": -40.585670471191406, "global_step": 164525, "epoch": 1359} {"train_loss": -39.540287017822266, "global_step": 164526, "epoch": 1359} {"train_loss": -36.54996109008789, "global_step": 164527, "epoch": 1359} {"train_loss": -38.89854049682617, "global_step": 164528, "epoch": 1359} {"train_loss": -38.194427490234375, "global_step": 164529, "epoch": 1359} {"train_loss": -39.576473236083984, "global_step": 164530, "epoch": 1359} {"train_loss": -38.540794372558594, "global_step": 164531, "epoch": 1359} {"train_loss": -38.03968811035156, "global_step": 164532, "epoch": 1359} {"train_loss": -41.249755859375, "global_step": 164533, "epoch": 1359} {"train_loss": -39.687744140625, "global_step": 164534, "epoch": 1359} {"train_loss": -41.185184478759766, "global_step": 164535, "epoch": 1359} {"train_loss": -39.27219772338867, "global_step": 164536, "epoch": 1359} {"train_loss": -39.3189811706543, "global_step": 164537, "epoch": 1359} {"train_loss": -39.743499755859375, "global_step": 164538, "epoch": 1359} {"train_loss": -39.95056915283203, "global_step": 164539, "epoch": 1359} {"train_loss": -38.39717102050781, "global_step": 164540, "epoch": 1359} {"train_loss": -40.3405876159668, "global_step": 164541, "epoch": 1359} {"train_loss": -36.7354850769043, "global_step": 164542, "epoch": 1359} {"train_loss": -39.526397705078125, "global_step": 164543, "epoch": 1359} {"train_loss": -40.25283432006836, "global_step": 164544, "epoch": 1359} {"train_loss": -38.24268341064453, "global_step": 164545, "epoch": 1359} {"train_loss": -40.32729721069336, "global_step": 164546, "epoch": 1359} {"train_loss": -39.65382766723633, "global_step": 164547, "epoch": 1359} {"train_loss": -39.490699768066406, "global_step": 164548, "epoch": 1359} {"train_loss": -40.34920120239258, "global_step": 164549, "epoch": 1359} {"train_loss": -39.93050003051758, "global_step": 164550, "epoch": 1359} {"train_loss": -38.92405700683594, "global_step": 164551, "epoch": 1359} {"train_loss": -40.93442916870117, "global_step": 164552, "epoch": 1359} {"train_loss": -38.38886642456055, "global_step": 164553, "epoch": 1359} {"train_loss": -40.645721435546875, "global_step": 164554, "epoch": 1359} {"train_loss": -39.86261749267578, "global_step": 164555, "epoch": 1359} {"train_loss": -40.13320541381836, "global_step": 164556, "epoch": 1359} {"train_loss": -39.81294631958008, "global_step": 164557, "epoch": 1359} {"train_loss": -40.82961654663086, "global_step": 164558, "epoch": 1359} {"train_loss": -40.6741116736546, "global_step": 164559, "epoch": 1359, "val_loss": 2455628.0} {"train_loss": -40.29496383666992, "global_step": 164560, "epoch": 1360} {"train_loss": -40.60506820678711, "global_step": 164561, "epoch": 1360} {"train_loss": -41.20439529418945, "global_step": 164562, "epoch": 1360} {"train_loss": -40.29631805419922, "global_step": 164563, "epoch": 1360} {"train_loss": -40.714839935302734, "global_step": 164564, "epoch": 1360} {"train_loss": -41.120662689208984, "global_step": 164565, "epoch": 1360} {"train_loss": -41.01008224487305, "global_step": 164566, "epoch": 1360} {"train_loss": -40.80271530151367, "global_step": 164567, "epoch": 1360} {"train_loss": -41.59348678588867, "global_step": 164568, "epoch": 1360} {"train_loss": -41.10640335083008, "global_step": 164569, "epoch": 1360} {"train_loss": -41.0675163269043, "global_step": 164570, "epoch": 1360} {"train_loss": -41.03074645996094, "global_step": 164571, "epoch": 1360} {"train_loss": -41.81572341918945, "global_step": 164572, "epoch": 1360} {"train_loss": -41.5579948425293, "global_step": 164573, "epoch": 1360} {"train_loss": -41.27408218383789, "global_step": 164574, "epoch": 1360} {"train_loss": -41.589237213134766, "global_step": 164575, "epoch": 1360} {"train_loss": -41.7097053527832, "global_step": 164576, "epoch": 1360} {"train_loss": -41.75367736816406, "global_step": 164577, "epoch": 1360} {"train_loss": -41.2466926574707, "global_step": 164578, "epoch": 1360} {"train_loss": -41.13237762451172, "global_step": 164579, "epoch": 1360} {"train_loss": -41.9495849609375, "global_step": 164580, "epoch": 1360} {"train_loss": -42.055171966552734, "global_step": 164581, "epoch": 1360} {"train_loss": -42.05007553100586, "global_step": 164582, "epoch": 1360} {"train_loss": -41.902320861816406, "global_step": 164583, "epoch": 1360} {"train_loss": -41.63917922973633, "global_step": 164584, "epoch": 1360} {"train_loss": -41.85192108154297, "global_step": 164585, "epoch": 1360} {"train_loss": -41.5110969543457, "global_step": 164586, "epoch": 1360} {"train_loss": -42.05876922607422, "global_step": 164587, "epoch": 1360} {"train_loss": -42.057281494140625, "global_step": 164588, "epoch": 1360} {"train_loss": -42.198909759521484, "global_step": 164589, "epoch": 1360} {"train_loss": -41.781185150146484, "global_step": 164590, "epoch": 1360} {"train_loss": -42.16168212890625, "global_step": 164591, "epoch": 1360} {"train_loss": -41.96778106689453, "global_step": 164592, "epoch": 1360} {"train_loss": -41.96112060546875, "global_step": 164593, "epoch": 1360} {"train_loss": -42.109619140625, "global_step": 164594, "epoch": 1360} {"train_loss": -42.13093185424805, "global_step": 164595, "epoch": 1360} {"train_loss": -42.45156478881836, "global_step": 164596, "epoch": 1360} {"train_loss": -42.2346076965332, "global_step": 164597, "epoch": 1360} {"train_loss": -41.80111312866211, "global_step": 164598, "epoch": 1360} {"train_loss": -42.1452522277832, "global_step": 164599, "epoch": 1360} {"train_loss": -41.87207794189453, "global_step": 164600, "epoch": 1360} {"train_loss": -42.45423126220703, "global_step": 164601, "epoch": 1360} {"train_loss": -42.42962646484375, "global_step": 164602, "epoch": 1360} {"train_loss": -42.02344512939453, "global_step": 164603, "epoch": 1360} {"train_loss": -41.56669998168945, "global_step": 164604, "epoch": 1360} {"train_loss": -41.82196044921875, "global_step": 164605, "epoch": 1360} {"train_loss": -41.36506652832031, "global_step": 164606, "epoch": 1360} {"train_loss": -41.89438247680664, "global_step": 164607, "epoch": 1360} {"train_loss": -41.766822814941406, "global_step": 164608, "epoch": 1360} {"train_loss": -42.54081344604492, "global_step": 164609, "epoch": 1360} {"train_loss": -42.1995964050293, "global_step": 164610, "epoch": 1360} {"train_loss": -41.390411376953125, "global_step": 164611, "epoch": 1360} {"train_loss": -39.81580352783203, "global_step": 164612, "epoch": 1360} {"train_loss": -36.063838958740234, "global_step": 164613, "epoch": 1360} {"train_loss": -38.12800216674805, "global_step": 164614, "epoch": 1360} {"train_loss": -38.22901153564453, "global_step": 164615, "epoch": 1360} {"train_loss": -40.03380584716797, "global_step": 164616, "epoch": 1360} {"train_loss": -37.79291534423828, "global_step": 164617, "epoch": 1360} {"train_loss": -38.17499923706055, "global_step": 164618, "epoch": 1360} {"train_loss": -35.62040710449219, "global_step": 164619, "epoch": 1360} {"train_loss": -39.835601806640625, "global_step": 164620, "epoch": 1360} {"train_loss": -41.441917419433594, "global_step": 164621, "epoch": 1360} {"train_loss": -39.03152084350586, "global_step": 164622, "epoch": 1360} {"train_loss": -39.791229248046875, "global_step": 164623, "epoch": 1360} {"train_loss": -41.57558059692383, "global_step": 164624, "epoch": 1360} {"train_loss": -41.18867111206055, "global_step": 164625, "epoch": 1360} {"train_loss": -41.11112976074219, "global_step": 164626, "epoch": 1360} {"train_loss": -41.29823684692383, "global_step": 164627, "epoch": 1360} {"train_loss": -40.93122482299805, "global_step": 164628, "epoch": 1360} {"train_loss": -41.465579986572266, "global_step": 164629, "epoch": 1360} {"train_loss": -40.79964828491211, "global_step": 164630, "epoch": 1360} {"train_loss": -41.05537033081055, "global_step": 164631, "epoch": 1360} {"train_loss": -41.19045639038086, "global_step": 164632, "epoch": 1360} {"train_loss": -40.995853424072266, "global_step": 164633, "epoch": 1360} {"train_loss": -40.87914276123047, "global_step": 164634, "epoch": 1360} {"train_loss": -41.68645095825195, "global_step": 164635, "epoch": 1360} {"train_loss": -41.29600524902344, "global_step": 164636, "epoch": 1360} {"train_loss": -41.572174072265625, "global_step": 164637, "epoch": 1360} {"train_loss": -41.06394577026367, "global_step": 164638, "epoch": 1360} {"train_loss": -40.9499626159668, "global_step": 164639, "epoch": 1360} {"train_loss": -41.67448043823242, "global_step": 164640, "epoch": 1360} {"train_loss": -41.00482940673828, "global_step": 164641, "epoch": 1360} {"train_loss": -41.10885238647461, "global_step": 164642, "epoch": 1360} {"train_loss": -40.227760314941406, "global_step": 164643, "epoch": 1360} {"train_loss": -41.05523681640625, "global_step": 164644, "epoch": 1360} {"train_loss": -41.17667770385742, "global_step": 164645, "epoch": 1360} {"train_loss": -41.18172073364258, "global_step": 164646, "epoch": 1360} {"train_loss": -41.206443786621094, "global_step": 164647, "epoch": 1360} {"train_loss": -42.03593444824219, "global_step": 164648, "epoch": 1360} {"train_loss": -41.95305633544922, "global_step": 164649, "epoch": 1360} {"train_loss": -41.50518798828125, "global_step": 164650, "epoch": 1360} {"train_loss": -41.42768859863281, "global_step": 164651, "epoch": 1360} {"train_loss": -42.313865661621094, "global_step": 164652, "epoch": 1360} {"train_loss": -42.144412994384766, "global_step": 164653, "epoch": 1360} {"train_loss": -41.8687858581543, "global_step": 164654, "epoch": 1360} {"train_loss": -41.88105773925781, "global_step": 164655, "epoch": 1360} {"train_loss": -41.97584915161133, "global_step": 164656, "epoch": 1360} {"train_loss": -41.229156494140625, "global_step": 164657, "epoch": 1360} {"train_loss": -42.012271881103516, "global_step": 164658, "epoch": 1360} {"train_loss": -41.76438522338867, "global_step": 164659, "epoch": 1360} {"train_loss": -41.548919677734375, "global_step": 164660, "epoch": 1360} {"train_loss": -41.02006912231445, "global_step": 164661, "epoch": 1360} {"train_loss": -41.45481872558594, "global_step": 164662, "epoch": 1360} {"train_loss": -41.91130065917969, "global_step": 164663, "epoch": 1360} {"train_loss": -41.96942901611328, "global_step": 164664, "epoch": 1360} {"train_loss": -41.594242095947266, "global_step": 164665, "epoch": 1360} {"train_loss": -42.17889404296875, "global_step": 164666, "epoch": 1360} {"train_loss": -41.85263442993164, "global_step": 164667, "epoch": 1360} {"train_loss": -40.74242401123047, "global_step": 164668, "epoch": 1360} {"train_loss": -41.7363395690918, "global_step": 164669, "epoch": 1360} {"train_loss": -41.60476303100586, "global_step": 164670, "epoch": 1360} {"train_loss": -39.8486328125, "global_step": 164671, "epoch": 1360} {"train_loss": -38.89194869995117, "global_step": 164672, "epoch": 1360} {"train_loss": -40.00954055786133, "global_step": 164673, "epoch": 1360} {"train_loss": -42.24121856689453, "global_step": 164674, "epoch": 1360} {"train_loss": -41.31008529663086, "global_step": 164675, "epoch": 1360} {"train_loss": -40.287940979003906, "global_step": 164676, "epoch": 1360} {"train_loss": -41.562347412109375, "global_step": 164677, "epoch": 1360} {"train_loss": -42.172210693359375, "global_step": 164678, "epoch": 1360} {"train_loss": -42.0129280090332, "global_step": 164679, "epoch": 1360} {"train_loss": -41.22736714891166, "global_step": 164680, "epoch": 1360, "val_loss": 2510899.5} {"train_loss": -42.28763198852539, "global_step": 164681, "epoch": 1361} {"train_loss": -42.05398178100586, "global_step": 164682, "epoch": 1361} {"train_loss": -41.99984359741211, "global_step": 164683, "epoch": 1361} {"train_loss": -42.19664764404297, "global_step": 164684, "epoch": 1361} {"train_loss": -41.746212005615234, "global_step": 164685, "epoch": 1361} {"train_loss": -42.3275032043457, "global_step": 164686, "epoch": 1361} {"train_loss": -42.05484390258789, "global_step": 164687, "epoch": 1361} {"train_loss": -41.509456634521484, "global_step": 164688, "epoch": 1361} {"train_loss": -41.84359359741211, "global_step": 164689, "epoch": 1361} {"train_loss": -42.04431915283203, "global_step": 164690, "epoch": 1361} {"train_loss": -41.94993591308594, "global_step": 164691, "epoch": 1361} {"train_loss": -41.63581085205078, "global_step": 164692, "epoch": 1361} {"train_loss": -42.10911178588867, "global_step": 164693, "epoch": 1361} {"train_loss": -42.00632095336914, "global_step": 164694, "epoch": 1361} {"train_loss": -41.868587493896484, "global_step": 164695, "epoch": 1361} {"train_loss": -42.33045196533203, "global_step": 164696, "epoch": 1361} {"train_loss": -41.878108978271484, "global_step": 164697, "epoch": 1361} {"train_loss": -42.26514434814453, "global_step": 164698, "epoch": 1361} {"train_loss": -41.193397521972656, "global_step": 164699, "epoch": 1361} {"train_loss": -41.72865676879883, "global_step": 164700, "epoch": 1361} {"train_loss": -42.534854888916016, "global_step": 164701, "epoch": 1361} {"train_loss": -40.99024200439453, "global_step": 164702, "epoch": 1361} {"train_loss": -41.462493896484375, "global_step": 164703, "epoch": 1361} {"train_loss": -42.591426849365234, "global_step": 164704, "epoch": 1361} {"train_loss": -41.52976608276367, "global_step": 164705, "epoch": 1361} {"train_loss": -41.74498748779297, "global_step": 164706, "epoch": 1361} {"train_loss": -41.768550872802734, "global_step": 164707, "epoch": 1361} {"train_loss": -42.047882080078125, "global_step": 164708, "epoch": 1361} {"train_loss": -41.77721405029297, "global_step": 164709, "epoch": 1361} {"train_loss": -40.81550598144531, "global_step": 164710, "epoch": 1361} {"train_loss": -40.766544342041016, "global_step": 164711, "epoch": 1361} {"train_loss": -41.57299041748047, "global_step": 164712, "epoch": 1361} {"train_loss": -42.05097579956055, "global_step": 164713, "epoch": 1361} {"train_loss": -42.12992477416992, "global_step": 164714, "epoch": 1361} {"train_loss": -41.27605056762695, "global_step": 164715, "epoch": 1361} {"train_loss": -38.2951774597168, "global_step": 164716, "epoch": 1361} {"train_loss": -38.49982833862305, "global_step": 164717, "epoch": 1361} {"train_loss": -41.499908447265625, "global_step": 164718, "epoch": 1361} {"train_loss": -39.97783279418945, "global_step": 164719, "epoch": 1361} {"train_loss": -37.230342864990234, "global_step": 164720, "epoch": 1361} {"train_loss": -41.29372787475586, "global_step": 164721, "epoch": 1361} {"train_loss": -37.084625244140625, "global_step": 164722, "epoch": 1361} {"train_loss": -36.0123176574707, "global_step": 164723, "epoch": 1361} {"train_loss": -41.62858200073242, "global_step": 164724, "epoch": 1361} {"train_loss": -36.08855056762695, "global_step": 164725, "epoch": 1361} {"train_loss": -40.90730667114258, "global_step": 164726, "epoch": 1361} {"train_loss": -35.94537353515625, "global_step": 164727, "epoch": 1361} {"train_loss": -37.81818389892578, "global_step": 164728, "epoch": 1361} {"train_loss": -38.168704986572266, "global_step": 164729, "epoch": 1361} {"train_loss": -37.0458869934082, "global_step": 164730, "epoch": 1361} {"train_loss": -39.77703094482422, "global_step": 164731, "epoch": 1361} {"train_loss": -37.2734489440918, "global_step": 164732, "epoch": 1361} {"train_loss": -38.44209289550781, "global_step": 164733, "epoch": 1361} {"train_loss": -38.792213439941406, "global_step": 164734, "epoch": 1361} {"train_loss": -36.5300407409668, "global_step": 164735, "epoch": 1361} {"train_loss": -39.09175491333008, "global_step": 164736, "epoch": 1361} {"train_loss": -38.235565185546875, "global_step": 164737, "epoch": 1361} {"train_loss": -38.93937301635742, "global_step": 164738, "epoch": 1361} {"train_loss": -38.72099304199219, "global_step": 164739, "epoch": 1361} {"train_loss": -39.52817916870117, "global_step": 164740, "epoch": 1361} {"train_loss": -39.28985595703125, "global_step": 164741, "epoch": 1361} {"train_loss": -40.072383880615234, "global_step": 164742, "epoch": 1361} {"train_loss": -38.769107818603516, "global_step": 164743, "epoch": 1361} {"train_loss": -38.915645599365234, "global_step": 164744, "epoch": 1361} {"train_loss": -40.26953887939453, "global_step": 164745, "epoch": 1361} {"train_loss": -38.86086654663086, "global_step": 164746, "epoch": 1361} {"train_loss": -40.72532272338867, "global_step": 164747, "epoch": 1361} {"train_loss": -39.663177490234375, "global_step": 164748, "epoch": 1361} {"train_loss": -40.899906158447266, "global_step": 164749, "epoch": 1361} {"train_loss": -40.99735641479492, "global_step": 164750, "epoch": 1361} {"train_loss": -40.62846755981445, "global_step": 164751, "epoch": 1361} {"train_loss": -41.33600997924805, "global_step": 164752, "epoch": 1361} {"train_loss": -40.266170501708984, "global_step": 164753, "epoch": 1361} {"train_loss": -41.084312438964844, "global_step": 164754, "epoch": 1361} {"train_loss": -40.29630661010742, "global_step": 164755, "epoch": 1361} {"train_loss": -41.729644775390625, "global_step": 164756, "epoch": 1361} {"train_loss": -40.57756805419922, "global_step": 164757, "epoch": 1361} {"train_loss": -40.9241828918457, "global_step": 164758, "epoch": 1361} {"train_loss": -41.12740707397461, "global_step": 164759, "epoch": 1361} {"train_loss": -40.751914978027344, "global_step": 164760, "epoch": 1361} {"train_loss": -41.614498138427734, "global_step": 164761, "epoch": 1361} {"train_loss": -40.71274948120117, "global_step": 164762, "epoch": 1361} {"train_loss": -41.88596725463867, "global_step": 164763, "epoch": 1361} {"train_loss": -41.44233322143555, "global_step": 164764, "epoch": 1361} {"train_loss": -41.64658737182617, "global_step": 164765, "epoch": 1361} {"train_loss": -41.78310775756836, "global_step": 164766, "epoch": 1361} {"train_loss": -41.93889236450195, "global_step": 164767, "epoch": 1361} {"train_loss": -42.23551559448242, "global_step": 164768, "epoch": 1361} {"train_loss": -41.52207946777344, "global_step": 164769, "epoch": 1361} {"train_loss": -41.87221908569336, "global_step": 164770, "epoch": 1361} {"train_loss": -41.28805160522461, "global_step": 164771, "epoch": 1361} {"train_loss": -41.52423095703125, "global_step": 164772, "epoch": 1361} {"train_loss": -41.649715423583984, "global_step": 164773, "epoch": 1361} {"train_loss": -41.660728454589844, "global_step": 164774, "epoch": 1361} {"train_loss": -42.118896484375, "global_step": 164775, "epoch": 1361} {"train_loss": -42.29015350341797, "global_step": 164776, "epoch": 1361} {"train_loss": -42.07075500488281, "global_step": 164777, "epoch": 1361} {"train_loss": -42.09423828125, "global_step": 164778, "epoch": 1361} {"train_loss": -42.26079177856445, "global_step": 164779, "epoch": 1361} {"train_loss": -42.68095779418945, "global_step": 164780, "epoch": 1361} {"train_loss": -42.63234329223633, "global_step": 164781, "epoch": 1361} {"train_loss": -42.08430099487305, "global_step": 164782, "epoch": 1361} {"train_loss": -42.42498779296875, "global_step": 164783, "epoch": 1361} {"train_loss": -42.11031723022461, "global_step": 164784, "epoch": 1361} {"train_loss": -42.46232223510742, "global_step": 164785, "epoch": 1361} {"train_loss": -42.356300354003906, "global_step": 164786, "epoch": 1361} {"train_loss": -42.00815963745117, "global_step": 164787, "epoch": 1361} {"train_loss": -42.32850646972656, "global_step": 164788, "epoch": 1361} {"train_loss": -42.5405158996582, "global_step": 164789, "epoch": 1361} {"train_loss": -42.2886962890625, "global_step": 164790, "epoch": 1361} {"train_loss": -42.603328704833984, "global_step": 164791, "epoch": 1361} {"train_loss": -41.86507797241211, "global_step": 164792, "epoch": 1361} {"train_loss": -41.03730010986328, "global_step": 164793, "epoch": 1361} {"train_loss": -41.99592208862305, "global_step": 164794, "epoch": 1361} {"train_loss": -41.18811798095703, "global_step": 164795, "epoch": 1361} {"train_loss": -39.84949493408203, "global_step": 164796, "epoch": 1361} {"train_loss": -38.05287551879883, "global_step": 164797, "epoch": 1361} {"train_loss": -39.38911056518555, "global_step": 164798, "epoch": 1361} {"train_loss": -40.88411331176758, "global_step": 164799, "epoch": 1361} {"train_loss": -41.392303466796875, "global_step": 164800, "epoch": 1361} {"train_loss": -40.85085706474367, "global_step": 164801, "epoch": 1361, "val_loss": 2533193.0} {"train_loss": -41.2385368347168, "global_step": 164802, "epoch": 1362} {"train_loss": -39.77402877807617, "global_step": 164803, "epoch": 1362} {"train_loss": -35.09381866455078, "global_step": 164804, "epoch": 1362} {"train_loss": -34.436126708984375, "global_step": 164805, "epoch": 1362} {"train_loss": -39.73024368286133, "global_step": 164806, "epoch": 1362} {"train_loss": -39.862449645996094, "global_step": 164807, "epoch": 1362} {"train_loss": -40.03232955932617, "global_step": 164808, "epoch": 1362} {"train_loss": -40.44981002807617, "global_step": 164809, "epoch": 1362} {"train_loss": -40.171630859375, "global_step": 164810, "epoch": 1362} {"train_loss": -41.3075065612793, "global_step": 164811, "epoch": 1362} {"train_loss": -39.694549560546875, "global_step": 164812, "epoch": 1362} {"train_loss": -39.47560119628906, "global_step": 164813, "epoch": 1362} {"train_loss": -41.242923736572266, "global_step": 164814, "epoch": 1362} {"train_loss": -38.507530212402344, "global_step": 164815, "epoch": 1362} {"train_loss": -39.789283752441406, "global_step": 164816, "epoch": 1362} {"train_loss": -40.65690994262695, "global_step": 164817, "epoch": 1362} {"train_loss": -37.75482940673828, "global_step": 164818, "epoch": 1362} {"train_loss": -40.224178314208984, "global_step": 164819, "epoch": 1362} {"train_loss": -40.40860366821289, "global_step": 164820, "epoch": 1362} {"train_loss": -36.05619430541992, "global_step": 164821, "epoch": 1362} {"train_loss": -40.14085388183594, "global_step": 164822, "epoch": 1362} {"train_loss": -38.692726135253906, "global_step": 164823, "epoch": 1362} {"train_loss": -37.67704391479492, "global_step": 164824, "epoch": 1362} {"train_loss": -41.1306266784668, "global_step": 164825, "epoch": 1362} {"train_loss": -39.43256378173828, "global_step": 164826, "epoch": 1362} {"train_loss": -41.15656280517578, "global_step": 164827, "epoch": 1362} {"train_loss": -38.91688919067383, "global_step": 164828, "epoch": 1362} {"train_loss": -41.12050247192383, "global_step": 164829, "epoch": 1362} {"train_loss": -39.516597747802734, "global_step": 164830, "epoch": 1362} {"train_loss": -41.46524429321289, "global_step": 164831, "epoch": 1362} {"train_loss": -40.101600646972656, "global_step": 164832, "epoch": 1362} {"train_loss": -41.39065170288086, "global_step": 164833, "epoch": 1362} {"train_loss": -40.6861572265625, "global_step": 164834, "epoch": 1362} {"train_loss": -41.08831787109375, "global_step": 164835, "epoch": 1362} {"train_loss": -39.20930862426758, "global_step": 164836, "epoch": 1362} {"train_loss": -41.77268600463867, "global_step": 164837, "epoch": 1362} {"train_loss": -39.47420883178711, "global_step": 164838, "epoch": 1362} {"train_loss": -40.16943359375, "global_step": 164839, "epoch": 1362} {"train_loss": -40.25247573852539, "global_step": 164840, "epoch": 1362} {"train_loss": -41.0191650390625, "global_step": 164841, "epoch": 1362} {"train_loss": -40.95980453491211, "global_step": 164842, "epoch": 1362} {"train_loss": -40.97896957397461, "global_step": 164843, "epoch": 1362} {"train_loss": -41.59768295288086, "global_step": 164844, "epoch": 1362} {"train_loss": -40.860591888427734, "global_step": 164845, "epoch": 1362} {"train_loss": -41.46458435058594, "global_step": 164846, "epoch": 1362} {"train_loss": -41.05384063720703, "global_step": 164847, "epoch": 1362} {"train_loss": -41.66858673095703, "global_step": 164848, "epoch": 1362} {"train_loss": -41.3426513671875, "global_step": 164849, "epoch": 1362} {"train_loss": -41.3698844909668, "global_step": 164850, "epoch": 1362} {"train_loss": -41.0262336730957, "global_step": 164851, "epoch": 1362} {"train_loss": -41.55294418334961, "global_step": 164852, "epoch": 1362} {"train_loss": -41.14588165283203, "global_step": 164853, "epoch": 1362} {"train_loss": -41.76529312133789, "global_step": 164854, "epoch": 1362} {"train_loss": -41.74160385131836, "global_step": 164855, "epoch": 1362} {"train_loss": -41.66799545288086, "global_step": 164856, "epoch": 1362} {"train_loss": -41.7523307800293, "global_step": 164857, "epoch": 1362} {"train_loss": -41.41218185424805, "global_step": 164858, "epoch": 1362} {"train_loss": -41.57271194458008, "global_step": 164859, "epoch": 1362} {"train_loss": -41.35190963745117, "global_step": 164860, "epoch": 1362} {"train_loss": -42.406463623046875, "global_step": 164861, "epoch": 1362} {"train_loss": -41.21736526489258, "global_step": 164862, "epoch": 1362} {"train_loss": -42.32737350463867, "global_step": 164863, "epoch": 1362} {"train_loss": -41.65193176269531, "global_step": 164864, "epoch": 1362} {"train_loss": -41.776466369628906, "global_step": 164865, "epoch": 1362} {"train_loss": -41.91105651855469, "global_step": 164866, "epoch": 1362} {"train_loss": -41.60122299194336, "global_step": 164867, "epoch": 1362} {"train_loss": -40.846336364746094, "global_step": 164868, "epoch": 1362} {"train_loss": -41.4737663269043, "global_step": 164869, "epoch": 1362} {"train_loss": -41.730918884277344, "global_step": 164870, "epoch": 1362} {"train_loss": -41.98810577392578, "global_step": 164871, "epoch": 1362} {"train_loss": -41.39155578613281, "global_step": 164872, "epoch": 1362} {"train_loss": -40.92201614379883, "global_step": 164873, "epoch": 1362} {"train_loss": -41.92384719848633, "global_step": 164874, "epoch": 1362} {"train_loss": -42.07530975341797, "global_step": 164875, "epoch": 1362} {"train_loss": -41.87032699584961, "global_step": 164876, "epoch": 1362} {"train_loss": -42.221466064453125, "global_step": 164877, "epoch": 1362} {"train_loss": -42.171058654785156, "global_step": 164878, "epoch": 1362} {"train_loss": -42.01068115234375, "global_step": 164879, "epoch": 1362} {"train_loss": -41.97782516479492, "global_step": 164880, "epoch": 1362} {"train_loss": -42.02653121948242, "global_step": 164881, "epoch": 1362} {"train_loss": -41.57252883911133, "global_step": 164882, "epoch": 1362} {"train_loss": -41.903533935546875, "global_step": 164883, "epoch": 1362} {"train_loss": -42.02445602416992, "global_step": 164884, "epoch": 1362} {"train_loss": -41.74312973022461, "global_step": 164885, "epoch": 1362} {"train_loss": -41.973724365234375, "global_step": 164886, "epoch": 1362} {"train_loss": -42.52505111694336, "global_step": 164887, "epoch": 1362} {"train_loss": -42.29145812988281, "global_step": 164888, "epoch": 1362} {"train_loss": -42.03813552856445, "global_step": 164889, "epoch": 1362} {"train_loss": -42.737178802490234, "global_step": 164890, "epoch": 1362} {"train_loss": -42.479122161865234, "global_step": 164891, "epoch": 1362} {"train_loss": -42.10729217529297, "global_step": 164892, "epoch": 1362} {"train_loss": -42.26144027709961, "global_step": 164893, "epoch": 1362} {"train_loss": -41.41128158569336, "global_step": 164894, "epoch": 1362} {"train_loss": -41.712223052978516, "global_step": 164895, "epoch": 1362} {"train_loss": -42.129276275634766, "global_step": 164896, "epoch": 1362} {"train_loss": -41.838966369628906, "global_step": 164897, "epoch": 1362} {"train_loss": -41.78811264038086, "global_step": 164898, "epoch": 1362} {"train_loss": -41.64042282104492, "global_step": 164899, "epoch": 1362} {"train_loss": -42.064491271972656, "global_step": 164900, "epoch": 1362} {"train_loss": -41.56074142456055, "global_step": 164901, "epoch": 1362} {"train_loss": -42.340187072753906, "global_step": 164902, "epoch": 1362} {"train_loss": -42.19564437866211, "global_step": 164903, "epoch": 1362} {"train_loss": -40.67179489135742, "global_step": 164904, "epoch": 1362} {"train_loss": -40.17608642578125, "global_step": 164905, "epoch": 1362} {"train_loss": -38.9577751159668, "global_step": 164906, "epoch": 1362} {"train_loss": -39.28633499145508, "global_step": 164907, "epoch": 1362} {"train_loss": -39.79240417480469, "global_step": 164908, "epoch": 1362} {"train_loss": -40.67193603515625, "global_step": 164909, "epoch": 1362} {"train_loss": -41.61106491088867, "global_step": 164910, "epoch": 1362} {"train_loss": -41.95988845825195, "global_step": 164911, "epoch": 1362} {"train_loss": -40.783653259277344, "global_step": 164912, "epoch": 1362} {"train_loss": -39.70815658569336, "global_step": 164913, "epoch": 1362} {"train_loss": -40.57424545288086, "global_step": 164914, "epoch": 1362} {"train_loss": -40.891639709472656, "global_step": 164915, "epoch": 1362} {"train_loss": -40.45093536376953, "global_step": 164916, "epoch": 1362} {"train_loss": -40.135223388671875, "global_step": 164917, "epoch": 1362} {"train_loss": -36.95759963989258, "global_step": 164918, "epoch": 1362} {"train_loss": -38.55622100830078, "global_step": 164919, "epoch": 1362} {"train_loss": -40.441017150878906, "global_step": 164920, "epoch": 1362} {"train_loss": -37.640342712402344, "global_step": 164921, "epoch": 1362} {"train_loss": -40.761809199309546, "global_step": 164922, "epoch": 1362, "val_loss": 2515376.0} {"train_loss": -41.33606719970703, "global_step": 164923, "epoch": 1363} {"train_loss": -35.2032470703125, "global_step": 164924, "epoch": 1363} {"train_loss": -40.172271728515625, "global_step": 164925, "epoch": 1363} {"train_loss": -38.16032791137695, "global_step": 164926, "epoch": 1363} {"train_loss": -38.1551628112793, "global_step": 164927, "epoch": 1363} {"train_loss": -40.4980354309082, "global_step": 164928, "epoch": 1363} {"train_loss": -37.942138671875, "global_step": 164929, "epoch": 1363} {"train_loss": -40.17316436767578, "global_step": 164930, "epoch": 1363} {"train_loss": -37.34699249267578, "global_step": 164931, "epoch": 1363} {"train_loss": -39.373390197753906, "global_step": 164932, "epoch": 1363} {"train_loss": -39.80764389038086, "global_step": 164933, "epoch": 1363} {"train_loss": -39.35982894897461, "global_step": 164934, "epoch": 1363} {"train_loss": -39.98366928100586, "global_step": 164935, "epoch": 1363} {"train_loss": -40.099830627441406, "global_step": 164936, "epoch": 1363} {"train_loss": -40.57678985595703, "global_step": 164937, "epoch": 1363} {"train_loss": -39.87784194946289, "global_step": 164938, "epoch": 1363} {"train_loss": -40.6634407043457, "global_step": 164939, "epoch": 1363} {"train_loss": -40.55958938598633, "global_step": 164940, "epoch": 1363} {"train_loss": -40.91938400268555, "global_step": 164941, "epoch": 1363} {"train_loss": -40.1770133972168, "global_step": 164942, "epoch": 1363} {"train_loss": -40.92477035522461, "global_step": 164943, "epoch": 1363} {"train_loss": -39.7998161315918, "global_step": 164944, "epoch": 1363} {"train_loss": -40.7594108581543, "global_step": 164945, "epoch": 1363} {"train_loss": -41.2443962097168, "global_step": 164946, "epoch": 1363} {"train_loss": -40.696075439453125, "global_step": 164947, "epoch": 1363} {"train_loss": -41.264190673828125, "global_step": 164948, "epoch": 1363} {"train_loss": -40.77259063720703, "global_step": 164949, "epoch": 1363} {"train_loss": -41.91333770751953, "global_step": 164950, "epoch": 1363} {"train_loss": -40.858497619628906, "global_step": 164951, "epoch": 1363} {"train_loss": -41.54624557495117, "global_step": 164952, "epoch": 1363} {"train_loss": -41.67548751831055, "global_step": 164953, "epoch": 1363} {"train_loss": -42.27764892578125, "global_step": 164954, "epoch": 1363} {"train_loss": -41.5787353515625, "global_step": 164955, "epoch": 1363} {"train_loss": -41.574440002441406, "global_step": 164956, "epoch": 1363} {"train_loss": -41.70899200439453, "global_step": 164957, "epoch": 1363} {"train_loss": -42.14292526245117, "global_step": 164958, "epoch": 1363} {"train_loss": -41.819374084472656, "global_step": 164959, "epoch": 1363} {"train_loss": -41.95974349975586, "global_step": 164960, "epoch": 1363} {"train_loss": -41.41175079345703, "global_step": 164961, "epoch": 1363} {"train_loss": -41.93812942504883, "global_step": 164962, "epoch": 1363} {"train_loss": -41.43972396850586, "global_step": 164963, "epoch": 1363} {"train_loss": -40.7649040222168, "global_step": 164964, "epoch": 1363} {"train_loss": -41.37156295776367, "global_step": 164965, "epoch": 1363} {"train_loss": -41.55270004272461, "global_step": 164966, "epoch": 1363} {"train_loss": -41.82101821899414, "global_step": 164967, "epoch": 1363} {"train_loss": -41.701263427734375, "global_step": 164968, "epoch": 1363} {"train_loss": -41.4205322265625, "global_step": 164969, "epoch": 1363} {"train_loss": -41.07100296020508, "global_step": 164970, "epoch": 1363} {"train_loss": -42.036067962646484, "global_step": 164971, "epoch": 1363} {"train_loss": -41.947113037109375, "global_step": 164972, "epoch": 1363} {"train_loss": -42.18157958984375, "global_step": 164973, "epoch": 1363} {"train_loss": -41.40983200073242, "global_step": 164974, "epoch": 1363} {"train_loss": -41.719879150390625, "global_step": 164975, "epoch": 1363} {"train_loss": -41.217647552490234, "global_step": 164976, "epoch": 1363} {"train_loss": -42.43215560913086, "global_step": 164977, "epoch": 1363} {"train_loss": -41.90792465209961, "global_step": 164978, "epoch": 1363} {"train_loss": -41.99383544921875, "global_step": 164979, "epoch": 1363} {"train_loss": -42.065731048583984, "global_step": 164980, "epoch": 1363} {"train_loss": -42.00324249267578, "global_step": 164981, "epoch": 1363} {"train_loss": -42.17871856689453, "global_step": 164982, "epoch": 1363} {"train_loss": -40.75905990600586, "global_step": 164983, "epoch": 1363} {"train_loss": -40.77804946899414, "global_step": 164984, "epoch": 1363} {"train_loss": -40.72698974609375, "global_step": 164985, "epoch": 1363} {"train_loss": -42.25827407836914, "global_step": 164986, "epoch": 1363} {"train_loss": -41.8574104309082, "global_step": 164987, "epoch": 1363} {"train_loss": -40.75700378417969, "global_step": 164988, "epoch": 1363} {"train_loss": -40.6056022644043, "global_step": 164989, "epoch": 1363} {"train_loss": -41.82624053955078, "global_step": 164990, "epoch": 1363} {"train_loss": -42.56675720214844, "global_step": 164991, "epoch": 1363} {"train_loss": -42.4794921875, "global_step": 164992, "epoch": 1363} {"train_loss": -42.2666015625, "global_step": 164993, "epoch": 1363} {"train_loss": -42.733890533447266, "global_step": 164994, "epoch": 1363} {"train_loss": -42.62825393676758, "global_step": 164995, "epoch": 1363} {"train_loss": -42.421756744384766, "global_step": 164996, "epoch": 1363} {"train_loss": -42.672950744628906, "global_step": 164997, "epoch": 1363} {"train_loss": -42.14137649536133, "global_step": 164998, "epoch": 1363} {"train_loss": -42.2491569519043, "global_step": 164999, "epoch": 1363} {"train_loss": -42.22710037231445, "global_step": 165000, "epoch": 1363} {"train_loss": -42.34459686279297, "global_step": 165001, "epoch": 1363} {"train_loss": -41.75649642944336, "global_step": 165002, "epoch": 1363} {"train_loss": -42.445152282714844, "global_step": 165003, "epoch": 1363} {"train_loss": -42.744686126708984, "global_step": 165004, "epoch": 1363} {"train_loss": -42.8139762878418, "global_step": 165005, "epoch": 1363} {"train_loss": -42.33207321166992, "global_step": 165006, "epoch": 1363} {"train_loss": -42.33795928955078, "global_step": 165007, "epoch": 1363} {"train_loss": -42.49697494506836, "global_step": 165008, "epoch": 1363} {"train_loss": -42.31768798828125, "global_step": 165009, "epoch": 1363} {"train_loss": -42.06321334838867, "global_step": 165010, "epoch": 1363} {"train_loss": -40.98762130737305, "global_step": 165011, "epoch": 1363} {"train_loss": -41.2355842590332, "global_step": 165012, "epoch": 1363} {"train_loss": -41.587947845458984, "global_step": 165013, "epoch": 1363} {"train_loss": -41.194580078125, "global_step": 165014, "epoch": 1363} {"train_loss": -40.80778884887695, "global_step": 165015, "epoch": 1363} {"train_loss": -42.46397018432617, "global_step": 165016, "epoch": 1363} {"train_loss": -41.99654769897461, "global_step": 165017, "epoch": 1363} {"train_loss": -41.45552444458008, "global_step": 165018, "epoch": 1363} {"train_loss": -39.47576904296875, "global_step": 165019, "epoch": 1363} {"train_loss": -38.32426452636719, "global_step": 165020, "epoch": 1363} {"train_loss": -41.143898010253906, "global_step": 165021, "epoch": 1363} {"train_loss": -39.9709587097168, "global_step": 165022, "epoch": 1363} {"train_loss": -37.146575927734375, "global_step": 165023, "epoch": 1363} {"train_loss": -39.43726348876953, "global_step": 165024, "epoch": 1363} {"train_loss": -41.28671646118164, "global_step": 165025, "epoch": 1363} {"train_loss": -38.6485710144043, "global_step": 165026, "epoch": 1363} {"train_loss": -37.797847747802734, "global_step": 165027, "epoch": 1363} {"train_loss": -41.732460021972656, "global_step": 165028, "epoch": 1363} {"train_loss": -39.52284622192383, "global_step": 165029, "epoch": 1363} {"train_loss": -38.29375076293945, "global_step": 165030, "epoch": 1363} {"train_loss": -41.66221237182617, "global_step": 165031, "epoch": 1363} {"train_loss": -38.223228454589844, "global_step": 165032, "epoch": 1363} {"train_loss": -39.285255432128906, "global_step": 165033, "epoch": 1363} {"train_loss": -41.20172882080078, "global_step": 165034, "epoch": 1363} {"train_loss": -39.329402923583984, "global_step": 165035, "epoch": 1363} {"train_loss": -40.1778450012207, "global_step": 165036, "epoch": 1363} {"train_loss": -41.15627670288086, "global_step": 165037, "epoch": 1363} {"train_loss": -38.46648025512695, "global_step": 165038, "epoch": 1363} {"train_loss": -41.134552001953125, "global_step": 165039, "epoch": 1363} {"train_loss": -40.50128173828125, "global_step": 165040, "epoch": 1363} {"train_loss": -40.265987396240234, "global_step": 165041, "epoch": 1363} {"train_loss": -41.31940841674805, "global_step": 165042, "epoch": 1363} {"train_loss": -40.97540623688501, "global_step": 165043, "epoch": 1363, "val_loss": 2502821.25} {"train_loss": -40.79093551635742, "global_step": 165044, "epoch": 1364} {"train_loss": -41.68116760253906, "global_step": 165045, "epoch": 1364} {"train_loss": -41.744873046875, "global_step": 165046, "epoch": 1364} {"train_loss": -41.5029296875, "global_step": 165047, "epoch": 1364} {"train_loss": -41.56848907470703, "global_step": 165048, "epoch": 1364} {"train_loss": -41.157535552978516, "global_step": 165049, "epoch": 1364} {"train_loss": -41.79771041870117, "global_step": 165050, "epoch": 1364} {"train_loss": -41.26914596557617, "global_step": 165051, "epoch": 1364} {"train_loss": -41.507568359375, "global_step": 165052, "epoch": 1364} {"train_loss": -41.371803283691406, "global_step": 165053, "epoch": 1364} {"train_loss": -41.73737716674805, "global_step": 165054, "epoch": 1364} {"train_loss": -42.0023078918457, "global_step": 165055, "epoch": 1364} {"train_loss": -41.749794006347656, "global_step": 165056, "epoch": 1364} {"train_loss": -41.95402145385742, "global_step": 165057, "epoch": 1364} {"train_loss": -42.134517669677734, "global_step": 165058, "epoch": 1364} {"train_loss": -41.70083236694336, "global_step": 165059, "epoch": 1364} {"train_loss": -42.07503128051758, "global_step": 165060, "epoch": 1364} {"train_loss": -41.526458740234375, "global_step": 165061, "epoch": 1364} {"train_loss": -41.6583366394043, "global_step": 165062, "epoch": 1364} {"train_loss": -41.99090576171875, "global_step": 165063, "epoch": 1364} {"train_loss": -42.32172775268555, "global_step": 165064, "epoch": 1364} {"train_loss": -42.17082595825195, "global_step": 165065, "epoch": 1364} {"train_loss": -42.25960922241211, "global_step": 165066, "epoch": 1364} {"train_loss": -42.00224685668945, "global_step": 165067, "epoch": 1364} {"train_loss": -42.667236328125, "global_step": 165068, "epoch": 1364} {"train_loss": -42.249671936035156, "global_step": 165069, "epoch": 1364} {"train_loss": -42.09505844116211, "global_step": 165070, "epoch": 1364} {"train_loss": -42.38227081298828, "global_step": 165071, "epoch": 1364} {"train_loss": -41.8970947265625, "global_step": 165072, "epoch": 1364} {"train_loss": -42.2719612121582, "global_step": 165073, "epoch": 1364} {"train_loss": -42.78776550292969, "global_step": 165074, "epoch": 1364} {"train_loss": -42.0684700012207, "global_step": 165075, "epoch": 1364} {"train_loss": -41.41930389404297, "global_step": 165076, "epoch": 1364} {"train_loss": -41.00776672363281, "global_step": 165077, "epoch": 1364} {"train_loss": -41.067787170410156, "global_step": 165078, "epoch": 1364} {"train_loss": -40.196346282958984, "global_step": 165079, "epoch": 1364} {"train_loss": -40.05881118774414, "global_step": 165080, "epoch": 1364} {"train_loss": -41.4119873046875, "global_step": 165081, "epoch": 1364} {"train_loss": -42.2624397277832, "global_step": 165082, "epoch": 1364} {"train_loss": -42.650447845458984, "global_step": 165083, "epoch": 1364} {"train_loss": -42.18950271606445, "global_step": 165084, "epoch": 1364} {"train_loss": -41.03713607788086, "global_step": 165085, "epoch": 1364} {"train_loss": -39.399139404296875, "global_step": 165086, "epoch": 1364} {"train_loss": -39.59416961669922, "global_step": 165087, "epoch": 1364} {"train_loss": -40.85245895385742, "global_step": 165088, "epoch": 1364} {"train_loss": -41.481319427490234, "global_step": 165089, "epoch": 1364} {"train_loss": -41.41841506958008, "global_step": 165090, "epoch": 1364} {"train_loss": -40.61262130737305, "global_step": 165091, "epoch": 1364} {"train_loss": -39.99264144897461, "global_step": 165092, "epoch": 1364} {"train_loss": -40.137237548828125, "global_step": 165093, "epoch": 1364} {"train_loss": -40.534969329833984, "global_step": 165094, "epoch": 1364} {"train_loss": -41.35783004760742, "global_step": 165095, "epoch": 1364} {"train_loss": -36.81708908081055, "global_step": 165096, "epoch": 1364} {"train_loss": -40.048439025878906, "global_step": 165097, "epoch": 1364} {"train_loss": -40.644805908203125, "global_step": 165098, "epoch": 1364} {"train_loss": -37.951377868652344, "global_step": 165099, "epoch": 1364} {"train_loss": -36.43439865112305, "global_step": 165100, "epoch": 1364} {"train_loss": -37.07798385620117, "global_step": 165101, "epoch": 1364} {"train_loss": -37.68841552734375, "global_step": 165102, "epoch": 1364} {"train_loss": -39.9646110534668, "global_step": 165103, "epoch": 1364} {"train_loss": -39.513160705566406, "global_step": 165104, "epoch": 1364} {"train_loss": -36.45991897583008, "global_step": 165105, "epoch": 1364} {"train_loss": -20.44666862487793, "global_step": 165106, "epoch": 1364} {"train_loss": -37.22106170654297, "global_step": 165107, "epoch": 1364} {"train_loss": -38.766014099121094, "global_step": 165108, "epoch": 1364} {"train_loss": -33.95793151855469, "global_step": 165109, "epoch": 1364} {"train_loss": -38.89398956298828, "global_step": 165110, "epoch": 1364} {"train_loss": -35.505062103271484, "global_step": 165111, "epoch": 1364} {"train_loss": -24.435810089111328, "global_step": 165112, "epoch": 1364} {"train_loss": -35.11845397949219, "global_step": 165113, "epoch": 1364} {"train_loss": -28.612340927124023, "global_step": 165114, "epoch": 1364} {"train_loss": -36.346107482910156, "global_step": 165115, "epoch": 1364} {"train_loss": -35.924896240234375, "global_step": 165116, "epoch": 1364} {"train_loss": -32.44297790527344, "global_step": 165117, "epoch": 1364} {"train_loss": -34.803768157958984, "global_step": 165118, "epoch": 1364} {"train_loss": -31.072988510131836, "global_step": 165119, "epoch": 1364} {"train_loss": -33.57149124145508, "global_step": 165120, "epoch": 1364} {"train_loss": -35.717803955078125, "global_step": 165121, "epoch": 1364} {"train_loss": -34.38420486450195, "global_step": 165122, "epoch": 1364} {"train_loss": -32.02584457397461, "global_step": 165123, "epoch": 1364} {"train_loss": -34.199790954589844, "global_step": 165124, "epoch": 1364} {"train_loss": -36.714595794677734, "global_step": 165125, "epoch": 1364} {"train_loss": -33.07308578491211, "global_step": 165126, "epoch": 1364} {"train_loss": -36.61943435668945, "global_step": 165127, "epoch": 1364} {"train_loss": -34.39422607421875, "global_step": 165128, "epoch": 1364} {"train_loss": -37.827606201171875, "global_step": 165129, "epoch": 1364} {"train_loss": -36.46620559692383, "global_step": 165130, "epoch": 1364} {"train_loss": -37.64190673828125, "global_step": 165131, "epoch": 1364} {"train_loss": -36.937782287597656, "global_step": 165132, "epoch": 1364} {"train_loss": -37.655757904052734, "global_step": 165133, "epoch": 1364} {"train_loss": -37.62939453125, "global_step": 165134, "epoch": 1364} {"train_loss": -38.57656478881836, "global_step": 165135, "epoch": 1364} {"train_loss": -39.234615325927734, "global_step": 165136, "epoch": 1364} {"train_loss": -38.98655700683594, "global_step": 165137, "epoch": 1364} {"train_loss": -39.590431213378906, "global_step": 165138, "epoch": 1364} {"train_loss": -39.59281539916992, "global_step": 165139, "epoch": 1364} {"train_loss": -39.7117805480957, "global_step": 165140, "epoch": 1364} {"train_loss": -39.062232971191406, "global_step": 165141, "epoch": 1364} {"train_loss": -39.503509521484375, "global_step": 165142, "epoch": 1364} {"train_loss": -38.979949951171875, "global_step": 165143, "epoch": 1364} {"train_loss": -39.71578598022461, "global_step": 165144, "epoch": 1364} {"train_loss": -39.91233825683594, "global_step": 165145, "epoch": 1364} {"train_loss": -39.900184631347656, "global_step": 165146, "epoch": 1364} {"train_loss": -40.14666748046875, "global_step": 165147, "epoch": 1364} {"train_loss": -39.70711898803711, "global_step": 165148, "epoch": 1364} {"train_loss": -39.59145736694336, "global_step": 165149, "epoch": 1364} {"train_loss": -40.01945877075195, "global_step": 165150, "epoch": 1364} {"train_loss": -40.15913009643555, "global_step": 165151, "epoch": 1364} {"train_loss": -39.92951965332031, "global_step": 165152, "epoch": 1364} {"train_loss": -40.14870071411133, "global_step": 165153, "epoch": 1364} {"train_loss": -39.778011322021484, "global_step": 165154, "epoch": 1364} {"train_loss": -40.7591438293457, "global_step": 165155, "epoch": 1364} {"train_loss": -39.12919235229492, "global_step": 165156, "epoch": 1364} {"train_loss": -40.042171478271484, "global_step": 165157, "epoch": 1364} {"train_loss": -40.45111846923828, "global_step": 165158, "epoch": 1364} {"train_loss": -41.086429595947266, "global_step": 165159, "epoch": 1364} {"train_loss": -40.78385925292969, "global_step": 165160, "epoch": 1364} {"train_loss": -40.657958984375, "global_step": 165161, "epoch": 1364} {"train_loss": -39.882694244384766, "global_step": 165162, "epoch": 1364} {"train_loss": -40.61341857910156, "global_step": 165163, "epoch": 1364} {"train_loss": -39.139151817510935, "global_step": 165164, "epoch": 1364, "val_loss": 2566911.0} {"train_loss": -40.390445709228516, "global_step": 165165, "epoch": 1365} {"train_loss": -40.078304290771484, "global_step": 165166, "epoch": 1365} {"train_loss": -40.55242919921875, "global_step": 165167, "epoch": 1365} {"train_loss": -40.47444534301758, "global_step": 165168, "epoch": 1365} {"train_loss": -40.819698333740234, "global_step": 165169, "epoch": 1365} {"train_loss": -40.715415954589844, "global_step": 165170, "epoch": 1365} {"train_loss": -40.51094436645508, "global_step": 165171, "epoch": 1365} {"train_loss": -41.22060012817383, "global_step": 165172, "epoch": 1365} {"train_loss": -40.98209762573242, "global_step": 165173, "epoch": 1365} {"train_loss": -41.27656936645508, "global_step": 165174, "epoch": 1365} {"train_loss": -40.83425521850586, "global_step": 165175, "epoch": 1365} {"train_loss": -39.84148025512695, "global_step": 165176, "epoch": 1365} {"train_loss": -40.862300872802734, "global_step": 165177, "epoch": 1365} {"train_loss": -41.23833084106445, "global_step": 165178, "epoch": 1365} {"train_loss": -42.022972106933594, "global_step": 165179, "epoch": 1365} {"train_loss": -41.59429168701172, "global_step": 165180, "epoch": 1365} {"train_loss": -41.734886169433594, "global_step": 165181, "epoch": 1365} {"train_loss": -41.295936584472656, "global_step": 165182, "epoch": 1365} {"train_loss": -40.95512771606445, "global_step": 165183, "epoch": 1365} {"train_loss": -41.46453094482422, "global_step": 165184, "epoch": 1365} {"train_loss": -41.687530517578125, "global_step": 165185, "epoch": 1365} {"train_loss": -40.945892333984375, "global_step": 165186, "epoch": 1365} {"train_loss": -41.629390716552734, "global_step": 165187, "epoch": 1365} {"train_loss": -41.251251220703125, "global_step": 165188, "epoch": 1365} {"train_loss": -41.46623992919922, "global_step": 165189, "epoch": 1365} {"train_loss": -41.83720397949219, "global_step": 165190, "epoch": 1365} {"train_loss": -41.73942947387695, "global_step": 165191, "epoch": 1365} {"train_loss": -41.767913818359375, "global_step": 165192, "epoch": 1365} {"train_loss": -41.1302375793457, "global_step": 165193, "epoch": 1365} {"train_loss": -41.35288619995117, "global_step": 165194, "epoch": 1365} {"train_loss": -41.81449508666992, "global_step": 165195, "epoch": 1365} {"train_loss": -41.880062103271484, "global_step": 165196, "epoch": 1365} {"train_loss": -42.10724639892578, "global_step": 165197, "epoch": 1365} {"train_loss": -41.74778366088867, "global_step": 165198, "epoch": 1365} {"train_loss": -41.00313949584961, "global_step": 165199, "epoch": 1365} {"train_loss": -41.48856735229492, "global_step": 165200, "epoch": 1365} {"train_loss": -42.43169021606445, "global_step": 165201, "epoch": 1365} {"train_loss": -41.928646087646484, "global_step": 165202, "epoch": 1365} {"train_loss": -41.197235107421875, "global_step": 165203, "epoch": 1365} {"train_loss": -41.323116302490234, "global_step": 165204, "epoch": 1365} {"train_loss": -41.24556350708008, "global_step": 165205, "epoch": 1365} {"train_loss": -41.92526626586914, "global_step": 165206, "epoch": 1365} {"train_loss": -40.63441848754883, "global_step": 165207, "epoch": 1365} {"train_loss": -40.084388732910156, "global_step": 165208, "epoch": 1365} {"train_loss": -39.674861907958984, "global_step": 165209, "epoch": 1365} {"train_loss": -36.090911865234375, "global_step": 165210, "epoch": 1365} {"train_loss": -39.7570686340332, "global_step": 165211, "epoch": 1365} {"train_loss": -41.75238800048828, "global_step": 165212, "epoch": 1365} {"train_loss": -42.20575714111328, "global_step": 165213, "epoch": 1365} {"train_loss": -40.500274658203125, "global_step": 165214, "epoch": 1365} {"train_loss": -39.99673080444336, "global_step": 165215, "epoch": 1365} {"train_loss": -40.7325553894043, "global_step": 165216, "epoch": 1365} {"train_loss": -41.53899383544922, "global_step": 165217, "epoch": 1365} {"train_loss": -40.3051643371582, "global_step": 165218, "epoch": 1365} {"train_loss": -39.35897445678711, "global_step": 165219, "epoch": 1365} {"train_loss": -38.56620407104492, "global_step": 165220, "epoch": 1365} {"train_loss": -41.13118362426758, "global_step": 165221, "epoch": 1365} {"train_loss": -38.61210250854492, "global_step": 165222, "epoch": 1365} {"train_loss": -40.11911392211914, "global_step": 165223, "epoch": 1365} {"train_loss": -40.61301803588867, "global_step": 165224, "epoch": 1365} {"train_loss": -40.14310836791992, "global_step": 165225, "epoch": 1365} {"train_loss": -39.00790023803711, "global_step": 165226, "epoch": 1365} {"train_loss": -39.828365325927734, "global_step": 165227, "epoch": 1365} {"train_loss": -40.85206985473633, "global_step": 165228, "epoch": 1365} {"train_loss": -40.48221969604492, "global_step": 165229, "epoch": 1365} {"train_loss": -40.65886688232422, "global_step": 165230, "epoch": 1365} {"train_loss": -40.933380126953125, "global_step": 165231, "epoch": 1365} {"train_loss": -41.524959564208984, "global_step": 165232, "epoch": 1365} {"train_loss": -41.54060745239258, "global_step": 165233, "epoch": 1365} {"train_loss": -40.52952575683594, "global_step": 165234, "epoch": 1365} {"train_loss": -41.38134765625, "global_step": 165235, "epoch": 1365} {"train_loss": -41.62799072265625, "global_step": 165236, "epoch": 1365} {"train_loss": -40.66535949707031, "global_step": 165237, "epoch": 1365} {"train_loss": -40.89145278930664, "global_step": 165238, "epoch": 1365} {"train_loss": -40.75175094604492, "global_step": 165239, "epoch": 1365} {"train_loss": -41.06894302368164, "global_step": 165240, "epoch": 1365} {"train_loss": -39.785465240478516, "global_step": 165241, "epoch": 1365} {"train_loss": -38.9981803894043, "global_step": 165242, "epoch": 1365} {"train_loss": -41.080596923828125, "global_step": 165243, "epoch": 1365} {"train_loss": -41.0228271484375, "global_step": 165244, "epoch": 1365} {"train_loss": -39.91677474975586, "global_step": 165245, "epoch": 1365} {"train_loss": -40.3806037902832, "global_step": 165246, "epoch": 1365} {"train_loss": -40.947784423828125, "global_step": 165247, "epoch": 1365} {"train_loss": -41.534725189208984, "global_step": 165248, "epoch": 1365} {"train_loss": -41.553306579589844, "global_step": 165249, "epoch": 1365} {"train_loss": -41.230224609375, "global_step": 165250, "epoch": 1365} {"train_loss": -41.41862106323242, "global_step": 165251, "epoch": 1365} {"train_loss": -41.10233688354492, "global_step": 165252, "epoch": 1365} {"train_loss": -41.313446044921875, "global_step": 165253, "epoch": 1365} {"train_loss": -41.05510330200195, "global_step": 165254, "epoch": 1365} {"train_loss": -41.13603210449219, "global_step": 165255, "epoch": 1365} {"train_loss": -41.0140495300293, "global_step": 165256, "epoch": 1365} {"train_loss": -41.49911880493164, "global_step": 165257, "epoch": 1365} {"train_loss": -41.17192459106445, "global_step": 165258, "epoch": 1365} {"train_loss": -40.81044006347656, "global_step": 165259, "epoch": 1365} {"train_loss": -40.631526947021484, "global_step": 165260, "epoch": 1365} {"train_loss": -41.320648193359375, "global_step": 165261, "epoch": 1365} {"train_loss": -41.47068786621094, "global_step": 165262, "epoch": 1365} {"train_loss": -41.31683349609375, "global_step": 165263, "epoch": 1365} {"train_loss": -40.272972106933594, "global_step": 165264, "epoch": 1365} {"train_loss": -41.177059173583984, "global_step": 165265, "epoch": 1365} {"train_loss": -41.474918365478516, "global_step": 165266, "epoch": 1365} {"train_loss": -41.43654251098633, "global_step": 165267, "epoch": 1365} {"train_loss": -40.79316329956055, "global_step": 165268, "epoch": 1365} {"train_loss": -41.22501754760742, "global_step": 165269, "epoch": 1365} {"train_loss": -41.12691879272461, "global_step": 165270, "epoch": 1365} {"train_loss": -40.6548957824707, "global_step": 165271, "epoch": 1365} {"train_loss": -41.11555862426758, "global_step": 165272, "epoch": 1365} {"train_loss": -40.41890335083008, "global_step": 165273, "epoch": 1365} {"train_loss": -40.910491943359375, "global_step": 165274, "epoch": 1365} {"train_loss": -41.27810287475586, "global_step": 165275, "epoch": 1365} {"train_loss": -40.44526290893555, "global_step": 165276, "epoch": 1365} {"train_loss": -40.57784652709961, "global_step": 165277, "epoch": 1365} {"train_loss": -40.25861358642578, "global_step": 165278, "epoch": 1365} {"train_loss": -41.0135498046875, "global_step": 165279, "epoch": 1365} {"train_loss": -40.82310104370117, "global_step": 165280, "epoch": 1365} {"train_loss": -40.37649154663086, "global_step": 165281, "epoch": 1365} {"train_loss": -40.52546310424805, "global_step": 165282, "epoch": 1365} {"train_loss": -41.23415756225586, "global_step": 165283, "epoch": 1365} {"train_loss": -40.06620788574219, "global_step": 165284, "epoch": 1365} {"train_loss": -40.87685879794034, "global_step": 165285, "epoch": 1365, "val_loss": 2520549.5} {"train_loss": -40.84383773803711, "global_step": 165286, "epoch": 1366} {"train_loss": -41.81828308105469, "global_step": 165287, "epoch": 1366} {"train_loss": -40.633548736572266, "global_step": 165288, "epoch": 1366} {"train_loss": -40.79747009277344, "global_step": 165289, "epoch": 1366} {"train_loss": -41.40336990356445, "global_step": 165290, "epoch": 1366} {"train_loss": -41.676666259765625, "global_step": 165291, "epoch": 1366} {"train_loss": -40.76405715942383, "global_step": 165292, "epoch": 1366} {"train_loss": -41.606597900390625, "global_step": 165293, "epoch": 1366} {"train_loss": -41.4974479675293, "global_step": 165294, "epoch": 1366} {"train_loss": -41.277034759521484, "global_step": 165295, "epoch": 1366} {"train_loss": -41.49357604980469, "global_step": 165296, "epoch": 1366} {"train_loss": -39.39146041870117, "global_step": 165297, "epoch": 1366} {"train_loss": -41.339515686035156, "global_step": 165298, "epoch": 1366} {"train_loss": -41.41816711425781, "global_step": 165299, "epoch": 1366} {"train_loss": -38.79581832885742, "global_step": 165300, "epoch": 1366} {"train_loss": -41.22489929199219, "global_step": 165301, "epoch": 1366} {"train_loss": -41.297115325927734, "global_step": 165302, "epoch": 1366} {"train_loss": -39.96017074584961, "global_step": 165303, "epoch": 1366} {"train_loss": -41.29020309448242, "global_step": 165304, "epoch": 1366} {"train_loss": -39.77907180786133, "global_step": 165305, "epoch": 1366} {"train_loss": -40.11857986450195, "global_step": 165306, "epoch": 1366} {"train_loss": -39.36467361450195, "global_step": 165307, "epoch": 1366} {"train_loss": -37.20370101928711, "global_step": 165308, "epoch": 1366} {"train_loss": -39.18227005004883, "global_step": 165309, "epoch": 1366} {"train_loss": -40.8730354309082, "global_step": 165310, "epoch": 1366} {"train_loss": -39.6931037902832, "global_step": 165311, "epoch": 1366} {"train_loss": -39.2586784362793, "global_step": 165312, "epoch": 1366} {"train_loss": -40.92986297607422, "global_step": 165313, "epoch": 1366} {"train_loss": -39.6707878112793, "global_step": 165314, "epoch": 1366} {"train_loss": -39.34284591674805, "global_step": 165315, "epoch": 1366} {"train_loss": -40.10476303100586, "global_step": 165316, "epoch": 1366} {"train_loss": -40.82236862182617, "global_step": 165317, "epoch": 1366} {"train_loss": -41.83761978149414, "global_step": 165318, "epoch": 1366} {"train_loss": -40.758026123046875, "global_step": 165319, "epoch": 1366} {"train_loss": -41.12141036987305, "global_step": 165320, "epoch": 1366} {"train_loss": -40.77449417114258, "global_step": 165321, "epoch": 1366} {"train_loss": -41.10123062133789, "global_step": 165322, "epoch": 1366} {"train_loss": -40.94293975830078, "global_step": 165323, "epoch": 1366} {"train_loss": -40.55656051635742, "global_step": 165324, "epoch": 1366} {"train_loss": -41.56013870239258, "global_step": 165325, "epoch": 1366} {"train_loss": -40.81574249267578, "global_step": 165326, "epoch": 1366} {"train_loss": -41.44469451904297, "global_step": 165327, "epoch": 1366} {"train_loss": -40.96924591064453, "global_step": 165328, "epoch": 1366} {"train_loss": -41.20173263549805, "global_step": 165329, "epoch": 1366} {"train_loss": -40.841129302978516, "global_step": 165330, "epoch": 1366} {"train_loss": -41.330379486083984, "global_step": 165331, "epoch": 1366} {"train_loss": -41.30230712890625, "global_step": 165332, "epoch": 1366} {"train_loss": -41.15928649902344, "global_step": 165333, "epoch": 1366} {"train_loss": -40.99125289916992, "global_step": 165334, "epoch": 1366} {"train_loss": -41.539642333984375, "global_step": 165335, "epoch": 1366} {"train_loss": -41.143829345703125, "global_step": 165336, "epoch": 1366} {"train_loss": -41.33283615112305, "global_step": 165337, "epoch": 1366} {"train_loss": -41.956825256347656, "global_step": 165338, "epoch": 1366} {"train_loss": -42.13584518432617, "global_step": 165339, "epoch": 1366} {"train_loss": -41.22431182861328, "global_step": 165340, "epoch": 1366} {"train_loss": -41.7561149597168, "global_step": 165341, "epoch": 1366} {"train_loss": -42.0990104675293, "global_step": 165342, "epoch": 1366} {"train_loss": -41.95207595825195, "global_step": 165343, "epoch": 1366} {"train_loss": -41.81382751464844, "global_step": 165344, "epoch": 1366} {"train_loss": -40.862579345703125, "global_step": 165345, "epoch": 1366} {"train_loss": -41.065303802490234, "global_step": 165346, "epoch": 1366} {"train_loss": -41.32106399536133, "global_step": 165347, "epoch": 1366} {"train_loss": -40.86941146850586, "global_step": 165348, "epoch": 1366} {"train_loss": -41.51739501953125, "global_step": 165349, "epoch": 1366} {"train_loss": -41.39823913574219, "global_step": 165350, "epoch": 1366} {"train_loss": -41.898738861083984, "global_step": 165351, "epoch": 1366} {"train_loss": -41.46784973144531, "global_step": 165352, "epoch": 1366} {"train_loss": -42.062782287597656, "global_step": 165353, "epoch": 1366} {"train_loss": -41.853214263916016, "global_step": 165354, "epoch": 1366} {"train_loss": -41.316158294677734, "global_step": 165355, "epoch": 1366} {"train_loss": -40.9697151184082, "global_step": 165356, "epoch": 1366} {"train_loss": -39.92866516113281, "global_step": 165357, "epoch": 1366} {"train_loss": -38.322425842285156, "global_step": 165358, "epoch": 1366} {"train_loss": -39.90264129638672, "global_step": 165359, "epoch": 1366} {"train_loss": -41.44348907470703, "global_step": 165360, "epoch": 1366} {"train_loss": -41.541221618652344, "global_step": 165361, "epoch": 1366} {"train_loss": -40.53890609741211, "global_step": 165362, "epoch": 1366} {"train_loss": -38.180599212646484, "global_step": 165363, "epoch": 1366} {"train_loss": -37.77252960205078, "global_step": 165364, "epoch": 1366} {"train_loss": -38.67564392089844, "global_step": 165365, "epoch": 1366} {"train_loss": -40.58625411987305, "global_step": 165366, "epoch": 1366} {"train_loss": -41.84879684448242, "global_step": 165367, "epoch": 1366} {"train_loss": -41.14022445678711, "global_step": 165368, "epoch": 1366} {"train_loss": -40.63326644897461, "global_step": 165369, "epoch": 1366} {"train_loss": -41.48895263671875, "global_step": 165370, "epoch": 1366} {"train_loss": -41.438270568847656, "global_step": 165371, "epoch": 1366} {"train_loss": -40.298072814941406, "global_step": 165372, "epoch": 1366} {"train_loss": -41.31624984741211, "global_step": 165373, "epoch": 1366} {"train_loss": -41.843849182128906, "global_step": 165374, "epoch": 1366} {"train_loss": -41.23223876953125, "global_step": 165375, "epoch": 1366} {"train_loss": -41.17512512207031, "global_step": 165376, "epoch": 1366} {"train_loss": -41.468421936035156, "global_step": 165377, "epoch": 1366} {"train_loss": -41.731807708740234, "global_step": 165378, "epoch": 1366} {"train_loss": -40.7991828918457, "global_step": 165379, "epoch": 1366} {"train_loss": -42.112056732177734, "global_step": 165380, "epoch": 1366} {"train_loss": -41.590126037597656, "global_step": 165381, "epoch": 1366} {"train_loss": -40.19868087768555, "global_step": 165382, "epoch": 1366} {"train_loss": -42.00358581542969, "global_step": 165383, "epoch": 1366} {"train_loss": -41.345298767089844, "global_step": 165384, "epoch": 1366} {"train_loss": -40.745697021484375, "global_step": 165385, "epoch": 1366} {"train_loss": -41.92396926879883, "global_step": 165386, "epoch": 1366} {"train_loss": -41.740211486816406, "global_step": 165387, "epoch": 1366} {"train_loss": -41.20703887939453, "global_step": 165388, "epoch": 1366} {"train_loss": -41.51667022705078, "global_step": 165389, "epoch": 1366} {"train_loss": -41.33721923828125, "global_step": 165390, "epoch": 1366} {"train_loss": -41.97697830200195, "global_step": 165391, "epoch": 1366} {"train_loss": -40.749969482421875, "global_step": 165392, "epoch": 1366} {"train_loss": -39.568294525146484, "global_step": 165393, "epoch": 1366} {"train_loss": -40.23079299926758, "global_step": 165394, "epoch": 1366} {"train_loss": -40.47199630737305, "global_step": 165395, "epoch": 1366} {"train_loss": -40.35799789428711, "global_step": 165396, "epoch": 1366} {"train_loss": -41.32180404663086, "global_step": 165397, "epoch": 1366} {"train_loss": -41.46274185180664, "global_step": 165398, "epoch": 1366} {"train_loss": -39.83440399169922, "global_step": 165399, "epoch": 1366} {"train_loss": -40.862483978271484, "global_step": 165400, "epoch": 1366} {"train_loss": -40.2857551574707, "global_step": 165401, "epoch": 1366} {"train_loss": -40.532684326171875, "global_step": 165402, "epoch": 1366} {"train_loss": -40.90867614746094, "global_step": 165403, "epoch": 1366} {"train_loss": -40.73830032348633, "global_step": 165404, "epoch": 1366} {"train_loss": -41.79644775390625, "global_step": 165405, "epoch": 1366} {"train_loss": -40.89624997603992, "global_step": 165406, "epoch": 1366, "val_loss": 2466987.75} {"train_loss": -41.854671478271484, "global_step": 165407, "epoch": 1367} {"train_loss": -42.03791046142578, "global_step": 165408, "epoch": 1367} {"train_loss": -41.60584259033203, "global_step": 165409, "epoch": 1367} {"train_loss": -41.636051177978516, "global_step": 165410, "epoch": 1367} {"train_loss": -41.5432243347168, "global_step": 165411, "epoch": 1367} {"train_loss": -41.37095260620117, "global_step": 165412, "epoch": 1367} {"train_loss": -40.55953598022461, "global_step": 165413, "epoch": 1367} {"train_loss": -41.07695770263672, "global_step": 165414, "epoch": 1367} {"train_loss": -41.69831466674805, "global_step": 165415, "epoch": 1367} {"train_loss": -41.55274200439453, "global_step": 165416, "epoch": 1367} {"train_loss": -40.606807708740234, "global_step": 165417, "epoch": 1367} {"train_loss": -41.235355377197266, "global_step": 165418, "epoch": 1367} {"train_loss": -41.55742263793945, "global_step": 165419, "epoch": 1367} {"train_loss": -41.996070861816406, "global_step": 165420, "epoch": 1367} {"train_loss": -40.57579803466797, "global_step": 165421, "epoch": 1367} {"train_loss": -41.09373474121094, "global_step": 165422, "epoch": 1367} {"train_loss": -40.69970703125, "global_step": 165423, "epoch": 1367} {"train_loss": -40.45479202270508, "global_step": 165424, "epoch": 1367} {"train_loss": -38.716365814208984, "global_step": 165425, "epoch": 1367} {"train_loss": -40.01361846923828, "global_step": 165426, "epoch": 1367} {"train_loss": -42.0026969909668, "global_step": 165427, "epoch": 1367} {"train_loss": -39.807613372802734, "global_step": 165428, "epoch": 1367} {"train_loss": -40.50396728515625, "global_step": 165429, "epoch": 1367} {"train_loss": -41.943382263183594, "global_step": 165430, "epoch": 1367} {"train_loss": -41.354557037353516, "global_step": 165431, "epoch": 1367} {"train_loss": -40.8737907409668, "global_step": 165432, "epoch": 1367} {"train_loss": -42.19866943359375, "global_step": 165433, "epoch": 1367} {"train_loss": -41.84253692626953, "global_step": 165434, "epoch": 1367} {"train_loss": -41.26832580566406, "global_step": 165435, "epoch": 1367} {"train_loss": -41.824256896972656, "global_step": 165436, "epoch": 1367} {"train_loss": -41.58633041381836, "global_step": 165437, "epoch": 1367} {"train_loss": -41.82352828979492, "global_step": 165438, "epoch": 1367} {"train_loss": -41.846824645996094, "global_step": 165439, "epoch": 1367} {"train_loss": -42.22864532470703, "global_step": 165440, "epoch": 1367} {"train_loss": -41.52239227294922, "global_step": 165441, "epoch": 1367} {"train_loss": -42.048282623291016, "global_step": 165442, "epoch": 1367} {"train_loss": -42.080745697021484, "global_step": 165443, "epoch": 1367} {"train_loss": -41.96083450317383, "global_step": 165444, "epoch": 1367} {"train_loss": -41.97590637207031, "global_step": 165445, "epoch": 1367} {"train_loss": -40.975337982177734, "global_step": 165446, "epoch": 1367} {"train_loss": -41.96901321411133, "global_step": 165447, "epoch": 1367} {"train_loss": -41.52418899536133, "global_step": 165448, "epoch": 1367} {"train_loss": -39.836463928222656, "global_step": 165449, "epoch": 1367} {"train_loss": -42.025508880615234, "global_step": 165450, "epoch": 1367} {"train_loss": -40.36897659301758, "global_step": 165451, "epoch": 1367} {"train_loss": -38.404415130615234, "global_step": 165452, "epoch": 1367} {"train_loss": -38.260498046875, "global_step": 165453, "epoch": 1367} {"train_loss": -37.621726989746094, "global_step": 165454, "epoch": 1367} {"train_loss": -36.02889633178711, "global_step": 165455, "epoch": 1367} {"train_loss": -40.90382766723633, "global_step": 165456, "epoch": 1367} {"train_loss": -38.99900817871094, "global_step": 165457, "epoch": 1367} {"train_loss": -36.828121185302734, "global_step": 165458, "epoch": 1367} {"train_loss": -40.88796615600586, "global_step": 165459, "epoch": 1367} {"train_loss": -36.845741271972656, "global_step": 165460, "epoch": 1367} {"train_loss": -38.22945022583008, "global_step": 165461, "epoch": 1367} {"train_loss": -38.58588790893555, "global_step": 165462, "epoch": 1367} {"train_loss": -39.83839797973633, "global_step": 165463, "epoch": 1367} {"train_loss": -37.265594482421875, "global_step": 165464, "epoch": 1367} {"train_loss": -40.55253219604492, "global_step": 165465, "epoch": 1367} {"train_loss": -38.231178283691406, "global_step": 165466, "epoch": 1367} {"train_loss": -40.367942810058594, "global_step": 165467, "epoch": 1367} {"train_loss": -38.81246566772461, "global_step": 165468, "epoch": 1367} {"train_loss": -40.2230339050293, "global_step": 165469, "epoch": 1367} {"train_loss": -39.585628509521484, "global_step": 165470, "epoch": 1367} {"train_loss": -40.53867721557617, "global_step": 165471, "epoch": 1367} {"train_loss": -39.8215217590332, "global_step": 165472, "epoch": 1367} {"train_loss": -40.34635543823242, "global_step": 165473, "epoch": 1367} {"train_loss": -37.8903923034668, "global_step": 165474, "epoch": 1367} {"train_loss": -40.66311264038086, "global_step": 165475, "epoch": 1367} {"train_loss": -40.276817321777344, "global_step": 165476, "epoch": 1367} {"train_loss": -38.890010833740234, "global_step": 165477, "epoch": 1367} {"train_loss": -39.7071533203125, "global_step": 165478, "epoch": 1367} {"train_loss": -40.26021957397461, "global_step": 165479, "epoch": 1367} {"train_loss": -41.3350944519043, "global_step": 165480, "epoch": 1367} {"train_loss": -39.42660903930664, "global_step": 165481, "epoch": 1367} {"train_loss": -40.49473571777344, "global_step": 165482, "epoch": 1367} {"train_loss": -41.3245964050293, "global_step": 165483, "epoch": 1367} {"train_loss": -40.63288116455078, "global_step": 165484, "epoch": 1367} {"train_loss": -40.896785736083984, "global_step": 165485, "epoch": 1367} {"train_loss": -40.92817306518555, "global_step": 165486, "epoch": 1367} {"train_loss": -40.865474700927734, "global_step": 165487, "epoch": 1367} {"train_loss": -41.22113800048828, "global_step": 165488, "epoch": 1367} {"train_loss": -40.49636459350586, "global_step": 165489, "epoch": 1367} {"train_loss": -40.58152770996094, "global_step": 165490, "epoch": 1367} {"train_loss": -41.08901596069336, "global_step": 165491, "epoch": 1367} {"train_loss": -40.81316375732422, "global_step": 165492, "epoch": 1367} {"train_loss": -41.776336669921875, "global_step": 165493, "epoch": 1367} {"train_loss": -41.153480529785156, "global_step": 165494, "epoch": 1367} {"train_loss": -41.2459831237793, "global_step": 165495, "epoch": 1367} {"train_loss": -41.22572708129883, "global_step": 165496, "epoch": 1367} {"train_loss": -41.1854248046875, "global_step": 165497, "epoch": 1367} {"train_loss": -41.17072677612305, "global_step": 165498, "epoch": 1367} {"train_loss": -40.07577133178711, "global_step": 165499, "epoch": 1367} {"train_loss": -41.29446029663086, "global_step": 165500, "epoch": 1367} {"train_loss": -41.871395111083984, "global_step": 165501, "epoch": 1367} {"train_loss": -41.5333137512207, "global_step": 165502, "epoch": 1367} {"train_loss": -41.25800704956055, "global_step": 165503, "epoch": 1367} {"train_loss": -41.44937515258789, "global_step": 165504, "epoch": 1367} {"train_loss": -41.16620635986328, "global_step": 165505, "epoch": 1367} {"train_loss": -41.731239318847656, "global_step": 165506, "epoch": 1367} {"train_loss": -41.66758346557617, "global_step": 165507, "epoch": 1367} {"train_loss": -41.3265380859375, "global_step": 165508, "epoch": 1367} {"train_loss": -40.47274398803711, "global_step": 165509, "epoch": 1367} {"train_loss": -41.32736587524414, "global_step": 165510, "epoch": 1367} {"train_loss": -41.331298828125, "global_step": 165511, "epoch": 1367} {"train_loss": -41.2884521484375, "global_step": 165512, "epoch": 1367} {"train_loss": -40.01960754394531, "global_step": 165513, "epoch": 1367} {"train_loss": -41.023048400878906, "global_step": 165514, "epoch": 1367} {"train_loss": -41.910274505615234, "global_step": 165515, "epoch": 1367} {"train_loss": -41.235774993896484, "global_step": 165516, "epoch": 1367} {"train_loss": -41.42399978637695, "global_step": 165517, "epoch": 1367} {"train_loss": -41.538330078125, "global_step": 165518, "epoch": 1367} {"train_loss": -41.78310775756836, "global_step": 165519, "epoch": 1367} {"train_loss": -41.636051177978516, "global_step": 165520, "epoch": 1367} {"train_loss": -41.881771087646484, "global_step": 165521, "epoch": 1367} {"train_loss": -41.57898712158203, "global_step": 165522, "epoch": 1367} {"train_loss": -42.016353607177734, "global_step": 165523, "epoch": 1367} {"train_loss": -41.24293518066406, "global_step": 165524, "epoch": 1367} {"train_loss": -41.205535888671875, "global_step": 165525, "epoch": 1367} {"train_loss": -41.790802001953125, "global_step": 165526, "epoch": 1367} {"train_loss": -40.760725068651944, "global_step": 165527, "epoch": 1367, "val_loss": 2513638.25} {"train_loss": -41.94951629638672, "global_step": 165528, "epoch": 1368} {"train_loss": -41.723690032958984, "global_step": 165529, "epoch": 1368} {"train_loss": -41.40178298950195, "global_step": 165530, "epoch": 1368} {"train_loss": -42.3270378112793, "global_step": 165531, "epoch": 1368} {"train_loss": -41.99453353881836, "global_step": 165532, "epoch": 1368} {"train_loss": -40.85581588745117, "global_step": 165533, "epoch": 1368} {"train_loss": -41.09015655517578, "global_step": 165534, "epoch": 1368} {"train_loss": -41.48696517944336, "global_step": 165535, "epoch": 1368} {"train_loss": -42.13804244995117, "global_step": 165536, "epoch": 1368} {"train_loss": -41.61959457397461, "global_step": 165537, "epoch": 1368} {"train_loss": -41.9019889831543, "global_step": 165538, "epoch": 1368} {"train_loss": -42.02973175048828, "global_step": 165539, "epoch": 1368} {"train_loss": -41.804542541503906, "global_step": 165540, "epoch": 1368} {"train_loss": -41.73836898803711, "global_step": 165541, "epoch": 1368} {"train_loss": -42.16291046142578, "global_step": 165542, "epoch": 1368} {"train_loss": -41.42518997192383, "global_step": 165543, "epoch": 1368} {"train_loss": -41.02109909057617, "global_step": 165544, "epoch": 1368} {"train_loss": -40.72927474975586, "global_step": 165545, "epoch": 1368} {"train_loss": -42.40171432495117, "global_step": 165546, "epoch": 1368} {"train_loss": -40.77652359008789, "global_step": 165547, "epoch": 1368} {"train_loss": -39.20476531982422, "global_step": 165548, "epoch": 1368} {"train_loss": -41.23122024536133, "global_step": 165549, "epoch": 1368} {"train_loss": -41.653953552246094, "global_step": 165550, "epoch": 1368} {"train_loss": -40.48173904418945, "global_step": 165551, "epoch": 1368} {"train_loss": -40.52669906616211, "global_step": 165552, "epoch": 1368} {"train_loss": -41.17265701293945, "global_step": 165553, "epoch": 1368} {"train_loss": -40.432769775390625, "global_step": 165554, "epoch": 1368} {"train_loss": -40.41447830200195, "global_step": 165555, "epoch": 1368} {"train_loss": -41.107391357421875, "global_step": 165556, "epoch": 1368} {"train_loss": -41.104652404785156, "global_step": 165557, "epoch": 1368} {"train_loss": -40.62791061401367, "global_step": 165558, "epoch": 1368} {"train_loss": -39.59272003173828, "global_step": 165559, "epoch": 1368} {"train_loss": -41.34589385986328, "global_step": 165560, "epoch": 1368} {"train_loss": -40.51561737060547, "global_step": 165561, "epoch": 1368} {"train_loss": -39.562957763671875, "global_step": 165562, "epoch": 1368} {"train_loss": -40.87133026123047, "global_step": 165563, "epoch": 1368} {"train_loss": -41.33781814575195, "global_step": 165564, "epoch": 1368} {"train_loss": -41.249977111816406, "global_step": 165565, "epoch": 1368} {"train_loss": -41.14644241333008, "global_step": 165566, "epoch": 1368} {"train_loss": -40.85492706298828, "global_step": 165567, "epoch": 1368} {"train_loss": -41.55979537963867, "global_step": 165568, "epoch": 1368} {"train_loss": -41.73723220825195, "global_step": 165569, "epoch": 1368} {"train_loss": -41.90998458862305, "global_step": 165570, "epoch": 1368} {"train_loss": -42.08212661743164, "global_step": 165571, "epoch": 1368} {"train_loss": -41.15275192260742, "global_step": 165572, "epoch": 1368} {"train_loss": -41.846500396728516, "global_step": 165573, "epoch": 1368} {"train_loss": -41.621002197265625, "global_step": 165574, "epoch": 1368} {"train_loss": -41.5025634765625, "global_step": 165575, "epoch": 1368} {"train_loss": -41.87862777709961, "global_step": 165576, "epoch": 1368} {"train_loss": -41.407588958740234, "global_step": 165577, "epoch": 1368} {"train_loss": -42.10550308227539, "global_step": 165578, "epoch": 1368} {"train_loss": -41.73942565917969, "global_step": 165579, "epoch": 1368} {"train_loss": -42.01524353027344, "global_step": 165580, "epoch": 1368} {"train_loss": -41.97506332397461, "global_step": 165581, "epoch": 1368} {"train_loss": -41.51040267944336, "global_step": 165582, "epoch": 1368} {"train_loss": -41.39314651489258, "global_step": 165583, "epoch": 1368} {"train_loss": -41.96210479736328, "global_step": 165584, "epoch": 1368} {"train_loss": -41.77839279174805, "global_step": 165585, "epoch": 1368} {"train_loss": -41.82859420776367, "global_step": 165586, "epoch": 1368} {"train_loss": -42.23786163330078, "global_step": 165587, "epoch": 1368} {"train_loss": -41.801239013671875, "global_step": 165588, "epoch": 1368} {"train_loss": -41.65302658081055, "global_step": 165589, "epoch": 1368} {"train_loss": -41.73878479003906, "global_step": 165590, "epoch": 1368} {"train_loss": -41.30096435546875, "global_step": 165591, "epoch": 1368} {"train_loss": -41.5001335144043, "global_step": 165592, "epoch": 1368} {"train_loss": -41.39524841308594, "global_step": 165593, "epoch": 1368} {"train_loss": -41.63107681274414, "global_step": 165594, "epoch": 1368} {"train_loss": -42.338478088378906, "global_step": 165595, "epoch": 1368} {"train_loss": -42.02384948730469, "global_step": 165596, "epoch": 1368} {"train_loss": -42.179542541503906, "global_step": 165597, "epoch": 1368} {"train_loss": -42.43499755859375, "global_step": 165598, "epoch": 1368} {"train_loss": -41.77729034423828, "global_step": 165599, "epoch": 1368} {"train_loss": -41.10546875, "global_step": 165600, "epoch": 1368} {"train_loss": -40.53365707397461, "global_step": 165601, "epoch": 1368} {"train_loss": -41.4417839050293, "global_step": 165602, "epoch": 1368} {"train_loss": -42.290706634521484, "global_step": 165603, "epoch": 1368} {"train_loss": -41.10169219970703, "global_step": 165604, "epoch": 1368} {"train_loss": -38.933773040771484, "global_step": 165605, "epoch": 1368} {"train_loss": -38.20734786987305, "global_step": 165606, "epoch": 1368} {"train_loss": -40.669525146484375, "global_step": 165607, "epoch": 1368} {"train_loss": -41.399471282958984, "global_step": 165608, "epoch": 1368} {"train_loss": -40.72353744506836, "global_step": 165609, "epoch": 1368} {"train_loss": -39.464332580566406, "global_step": 165610, "epoch": 1368} {"train_loss": -40.64046096801758, "global_step": 165611, "epoch": 1368} {"train_loss": -41.568336486816406, "global_step": 165612, "epoch": 1368} {"train_loss": -40.79099655151367, "global_step": 165613, "epoch": 1368} {"train_loss": -40.13496398925781, "global_step": 165614, "epoch": 1368} {"train_loss": -40.54324722290039, "global_step": 165615, "epoch": 1368} {"train_loss": -40.6577262878418, "global_step": 165616, "epoch": 1368} {"train_loss": -39.770992279052734, "global_step": 165617, "epoch": 1368} {"train_loss": -39.5214958190918, "global_step": 165618, "epoch": 1368} {"train_loss": -41.520545959472656, "global_step": 165619, "epoch": 1368} {"train_loss": -40.07106399536133, "global_step": 165620, "epoch": 1368} {"train_loss": -41.19902801513672, "global_step": 165621, "epoch": 1368} {"train_loss": -40.6556510925293, "global_step": 165622, "epoch": 1368} {"train_loss": -39.898014068603516, "global_step": 165623, "epoch": 1368} {"train_loss": -42.00979232788086, "global_step": 165624, "epoch": 1368} {"train_loss": -38.75703048706055, "global_step": 165625, "epoch": 1368} {"train_loss": -38.056182861328125, "global_step": 165626, "epoch": 1368} {"train_loss": -41.185203552246094, "global_step": 165627, "epoch": 1368} {"train_loss": -40.51134490966797, "global_step": 165628, "epoch": 1368} {"train_loss": -39.167537689208984, "global_step": 165629, "epoch": 1368} {"train_loss": -40.839603424072266, "global_step": 165630, "epoch": 1368} {"train_loss": -38.19423294067383, "global_step": 165631, "epoch": 1368} {"train_loss": -39.75787353515625, "global_step": 165632, "epoch": 1368} {"train_loss": -40.18252944946289, "global_step": 165633, "epoch": 1368} {"train_loss": -38.133827209472656, "global_step": 165634, "epoch": 1368} {"train_loss": -39.84618377685547, "global_step": 165635, "epoch": 1368} {"train_loss": -39.05378341674805, "global_step": 165636, "epoch": 1368} {"train_loss": -39.22468185424805, "global_step": 165637, "epoch": 1368} {"train_loss": -40.7064208984375, "global_step": 165638, "epoch": 1368} {"train_loss": -38.9262809753418, "global_step": 165639, "epoch": 1368} {"train_loss": -39.39152908325195, "global_step": 165640, "epoch": 1368} {"train_loss": -40.51203536987305, "global_step": 165641, "epoch": 1368} {"train_loss": -38.717620849609375, "global_step": 165642, "epoch": 1368} {"train_loss": -40.840030670166016, "global_step": 165643, "epoch": 1368} {"train_loss": -39.8285026550293, "global_step": 165644, "epoch": 1368} {"train_loss": -40.51665115356445, "global_step": 165645, "epoch": 1368} {"train_loss": -40.779449462890625, "global_step": 165646, "epoch": 1368} {"train_loss": -40.121089935302734, "global_step": 165647, "epoch": 1368} {"train_loss": -40.92908947526916, "global_step": 165648, "epoch": 1368, "val_loss": 2523309.25} {"train_loss": -38.62321853637695, "global_step": 165649, "epoch": 1369} {"train_loss": -40.770511627197266, "global_step": 165650, "epoch": 1369} {"train_loss": -39.35590744018555, "global_step": 165651, "epoch": 1369} {"train_loss": -40.06983184814453, "global_step": 165652, "epoch": 1369} {"train_loss": -39.86592102050781, "global_step": 165653, "epoch": 1369} {"train_loss": -40.064598083496094, "global_step": 165654, "epoch": 1369} {"train_loss": -39.99654006958008, "global_step": 165655, "epoch": 1369} {"train_loss": -39.5400505065918, "global_step": 165656, "epoch": 1369} {"train_loss": -39.689727783203125, "global_step": 165657, "epoch": 1369} {"train_loss": -39.40341567993164, "global_step": 165658, "epoch": 1369} {"train_loss": -40.1650505065918, "global_step": 165659, "epoch": 1369} {"train_loss": -40.90129470825195, "global_step": 165660, "epoch": 1369} {"train_loss": -40.21397399902344, "global_step": 165661, "epoch": 1369} {"train_loss": -40.166385650634766, "global_step": 165662, "epoch": 1369} {"train_loss": -40.690589904785156, "global_step": 165663, "epoch": 1369} {"train_loss": -40.3675651550293, "global_step": 165664, "epoch": 1369} {"train_loss": -40.86418533325195, "global_step": 165665, "epoch": 1369} {"train_loss": -40.952232360839844, "global_step": 165666, "epoch": 1369} {"train_loss": -40.9599494934082, "global_step": 165667, "epoch": 1369} {"train_loss": -40.94246292114258, "global_step": 165668, "epoch": 1369} {"train_loss": -41.00251388549805, "global_step": 165669, "epoch": 1369} {"train_loss": -41.58650588989258, "global_step": 165670, "epoch": 1369} {"train_loss": -41.37202835083008, "global_step": 165671, "epoch": 1369} {"train_loss": -41.5141487121582, "global_step": 165672, "epoch": 1369} {"train_loss": -41.379146575927734, "global_step": 165673, "epoch": 1369} {"train_loss": -41.78184509277344, "global_step": 165674, "epoch": 1369} {"train_loss": -41.379215240478516, "global_step": 165675, "epoch": 1369} {"train_loss": -41.27356719970703, "global_step": 165676, "epoch": 1369} {"train_loss": -41.70675277709961, "global_step": 165677, "epoch": 1369} {"train_loss": -41.32334518432617, "global_step": 165678, "epoch": 1369} {"train_loss": -41.97262191772461, "global_step": 165679, "epoch": 1369} {"train_loss": -41.8466796875, "global_step": 165680, "epoch": 1369} {"train_loss": -41.65493392944336, "global_step": 165681, "epoch": 1369} {"train_loss": -42.03944396972656, "global_step": 165682, "epoch": 1369} {"train_loss": -41.7067985534668, "global_step": 165683, "epoch": 1369} {"train_loss": -41.35396957397461, "global_step": 165684, "epoch": 1369} {"train_loss": -41.78070831298828, "global_step": 165685, "epoch": 1369} {"train_loss": -41.974388122558594, "global_step": 165686, "epoch": 1369} {"train_loss": -42.12064743041992, "global_step": 165687, "epoch": 1369} {"train_loss": -41.69926071166992, "global_step": 165688, "epoch": 1369} {"train_loss": -42.05656051635742, "global_step": 165689, "epoch": 1369} {"train_loss": -41.25295639038086, "global_step": 165690, "epoch": 1369} {"train_loss": -42.01819610595703, "global_step": 165691, "epoch": 1369} {"train_loss": -41.189876556396484, "global_step": 165692, "epoch": 1369} {"train_loss": -42.148345947265625, "global_step": 165693, "epoch": 1369} {"train_loss": -41.733821868896484, "global_step": 165694, "epoch": 1369} {"train_loss": -42.12543869018555, "global_step": 165695, "epoch": 1369} {"train_loss": -42.047786712646484, "global_step": 165696, "epoch": 1369} {"train_loss": -41.99462890625, "global_step": 165697, "epoch": 1369} {"train_loss": -42.29958724975586, "global_step": 165698, "epoch": 1369} {"train_loss": -42.74724197387695, "global_step": 165699, "epoch": 1369} {"train_loss": -42.22105026245117, "global_step": 165700, "epoch": 1369} {"train_loss": -42.26638412475586, "global_step": 165701, "epoch": 1369} {"train_loss": -42.46516036987305, "global_step": 165702, "epoch": 1369} {"train_loss": -42.486183166503906, "global_step": 165703, "epoch": 1369} {"train_loss": -42.1037483215332, "global_step": 165704, "epoch": 1369} {"train_loss": -42.15049362182617, "global_step": 165705, "epoch": 1369} {"train_loss": -40.815086364746094, "global_step": 165706, "epoch": 1369} {"train_loss": -41.71413803100586, "global_step": 165707, "epoch": 1369} {"train_loss": -42.6788444519043, "global_step": 165708, "epoch": 1369} {"train_loss": -41.95685958862305, "global_step": 165709, "epoch": 1369} {"train_loss": -41.34511947631836, "global_step": 165710, "epoch": 1369} {"train_loss": -40.524471282958984, "global_step": 165711, "epoch": 1369} {"train_loss": -36.48303985595703, "global_step": 165712, "epoch": 1369} {"train_loss": -33.71578598022461, "global_step": 165713, "epoch": 1369} {"train_loss": -30.07172203063965, "global_step": 165714, "epoch": 1369} {"train_loss": -28.031097412109375, "global_step": 165715, "epoch": 1369} {"train_loss": -26.57977867126465, "global_step": 165716, "epoch": 1369} {"train_loss": -30.751256942749023, "global_step": 165717, "epoch": 1369} {"train_loss": -27.463010787963867, "global_step": 165718, "epoch": 1369} {"train_loss": -32.99824523925781, "global_step": 165719, "epoch": 1369} {"train_loss": -28.20308494567871, "global_step": 165720, "epoch": 1369} {"train_loss": -31.227102279663086, "global_step": 165721, "epoch": 1369} {"train_loss": -32.54041290283203, "global_step": 165722, "epoch": 1369} {"train_loss": -32.55564880371094, "global_step": 165723, "epoch": 1369} {"train_loss": -31.240936279296875, "global_step": 165724, "epoch": 1369} {"train_loss": -33.69984817504883, "global_step": 165725, "epoch": 1369} {"train_loss": -31.37689781188965, "global_step": 165726, "epoch": 1369} {"train_loss": -31.74362564086914, "global_step": 165727, "epoch": 1369} {"train_loss": -32.28339385986328, "global_step": 165728, "epoch": 1369} {"train_loss": -32.9235725402832, "global_step": 165729, "epoch": 1369} {"train_loss": -34.183815002441406, "global_step": 165730, "epoch": 1369} {"train_loss": -33.28074264526367, "global_step": 165731, "epoch": 1369} {"train_loss": -32.94657516479492, "global_step": 165732, "epoch": 1369} {"train_loss": -34.01770782470703, "global_step": 165733, "epoch": 1369} {"train_loss": -34.640167236328125, "global_step": 165734, "epoch": 1369} {"train_loss": -34.43781661987305, "global_step": 165735, "epoch": 1369} {"train_loss": -34.43769454956055, "global_step": 165736, "epoch": 1369} {"train_loss": -35.20681381225586, "global_step": 165737, "epoch": 1369} {"train_loss": -34.79753494262695, "global_step": 165738, "epoch": 1369} {"train_loss": -34.72590255737305, "global_step": 165739, "epoch": 1369} {"train_loss": -34.65040969848633, "global_step": 165740, "epoch": 1369} {"train_loss": -33.75702667236328, "global_step": 165741, "epoch": 1369} {"train_loss": -34.47578811645508, "global_step": 165742, "epoch": 1369} {"train_loss": -34.83761215209961, "global_step": 165743, "epoch": 1369} {"train_loss": -34.405330657958984, "global_step": 165744, "epoch": 1369} {"train_loss": -35.16030502319336, "global_step": 165745, "epoch": 1369} {"train_loss": -35.63560104370117, "global_step": 165746, "epoch": 1369} {"train_loss": -35.44536590576172, "global_step": 165747, "epoch": 1369} {"train_loss": -35.854896545410156, "global_step": 165748, "epoch": 1369} {"train_loss": -34.945960998535156, "global_step": 165749, "epoch": 1369} {"train_loss": -36.50780487060547, "global_step": 165750, "epoch": 1369} {"train_loss": -35.77388381958008, "global_step": 165751, "epoch": 1369} {"train_loss": -35.60630798339844, "global_step": 165752, "epoch": 1369} {"train_loss": -35.951412200927734, "global_step": 165753, "epoch": 1369} {"train_loss": -36.24760437011719, "global_step": 165754, "epoch": 1369} {"train_loss": -36.148983001708984, "global_step": 165755, "epoch": 1369} {"train_loss": -37.11241149902344, "global_step": 165756, "epoch": 1369} {"train_loss": -36.156044006347656, "global_step": 165757, "epoch": 1369} {"train_loss": -36.5834846496582, "global_step": 165758, "epoch": 1369} {"train_loss": -37.172733306884766, "global_step": 165759, "epoch": 1369} {"train_loss": -36.79168701171875, "global_step": 165760, "epoch": 1369} {"train_loss": -37.7627067565918, "global_step": 165761, "epoch": 1369} {"train_loss": -36.18400192260742, "global_step": 165762, "epoch": 1369} {"train_loss": -36.90141296386719, "global_step": 165763, "epoch": 1369} {"train_loss": -37.59918975830078, "global_step": 165764, "epoch": 1369} {"train_loss": -36.84954833984375, "global_step": 165765, "epoch": 1369} {"train_loss": -37.598384857177734, "global_step": 165766, "epoch": 1369} {"train_loss": -36.86587142944336, "global_step": 165767, "epoch": 1369} {"train_loss": -37.501220703125, "global_step": 165768, "epoch": 1369} {"train_loss": -37.93802051701822, "global_step": 165769, "epoch": 1369, "val_loss": 2506618.25} {"train_loss": -36.426918029785156, "global_step": 165770, "epoch": 1370} {"train_loss": -36.882816314697266, "global_step": 165771, "epoch": 1370} {"train_loss": -37.38922119140625, "global_step": 165772, "epoch": 1370} {"train_loss": -38.1338005065918, "global_step": 165773, "epoch": 1370} {"train_loss": -36.8609733581543, "global_step": 165774, "epoch": 1370} {"train_loss": -37.74839401245117, "global_step": 165775, "epoch": 1370} {"train_loss": -36.63693618774414, "global_step": 165776, "epoch": 1370} {"train_loss": -38.15070343017578, "global_step": 165777, "epoch": 1370} {"train_loss": -37.98749923706055, "global_step": 165778, "epoch": 1370} {"train_loss": -37.47200393676758, "global_step": 165779, "epoch": 1370} {"train_loss": -36.91740036010742, "global_step": 165780, "epoch": 1370} {"train_loss": -37.95663833618164, "global_step": 165781, "epoch": 1370} {"train_loss": -37.75584030151367, "global_step": 165782, "epoch": 1370} {"train_loss": -38.03204345703125, "global_step": 165783, "epoch": 1370} {"train_loss": -38.65282440185547, "global_step": 165784, "epoch": 1370} {"train_loss": -39.216243743896484, "global_step": 165785, "epoch": 1370} {"train_loss": -38.98191452026367, "global_step": 165786, "epoch": 1370} {"train_loss": -38.624725341796875, "global_step": 165787, "epoch": 1370} {"train_loss": -38.50022506713867, "global_step": 165788, "epoch": 1370} {"train_loss": -38.4874153137207, "global_step": 165789, "epoch": 1370} {"train_loss": -38.880462646484375, "global_step": 165790, "epoch": 1370} {"train_loss": -38.50571823120117, "global_step": 165791, "epoch": 1370} {"train_loss": -38.58169174194336, "global_step": 165792, "epoch": 1370} {"train_loss": -38.25404739379883, "global_step": 165793, "epoch": 1370} {"train_loss": -36.796566009521484, "global_step": 165794, "epoch": 1370} {"train_loss": -39.276519775390625, "global_step": 165795, "epoch": 1370} {"train_loss": -38.32131576538086, "global_step": 165796, "epoch": 1370} {"train_loss": -36.053985595703125, "global_step": 165797, "epoch": 1370} {"train_loss": -38.19033432006836, "global_step": 165798, "epoch": 1370} {"train_loss": -38.30595016479492, "global_step": 165799, "epoch": 1370} {"train_loss": -38.497962951660156, "global_step": 165800, "epoch": 1370} {"train_loss": -38.85348892211914, "global_step": 165801, "epoch": 1370} {"train_loss": -38.7758674621582, "global_step": 165802, "epoch": 1370} {"train_loss": -38.73146438598633, "global_step": 165803, "epoch": 1370} {"train_loss": -37.80113220214844, "global_step": 165804, "epoch": 1370} {"train_loss": -39.37667465209961, "global_step": 165805, "epoch": 1370} {"train_loss": -38.63007736206055, "global_step": 165806, "epoch": 1370} {"train_loss": -39.49949264526367, "global_step": 165807, "epoch": 1370} {"train_loss": -38.182373046875, "global_step": 165808, "epoch": 1370} {"train_loss": -39.42447280883789, "global_step": 165809, "epoch": 1370} {"train_loss": -38.51095199584961, "global_step": 165810, "epoch": 1370} {"train_loss": -39.23391342163086, "global_step": 165811, "epoch": 1370} {"train_loss": -35.62610626220703, "global_step": 165812, "epoch": 1370} {"train_loss": -39.351200103759766, "global_step": 165813, "epoch": 1370} {"train_loss": -34.8814811706543, "global_step": 165814, "epoch": 1370} {"train_loss": -37.67094802856445, "global_step": 165815, "epoch": 1370} {"train_loss": -35.38123321533203, "global_step": 165816, "epoch": 1370} {"train_loss": -38.40853500366211, "global_step": 165817, "epoch": 1370} {"train_loss": -32.761905670166016, "global_step": 165818, "epoch": 1370} {"train_loss": -38.96984100341797, "global_step": 165819, "epoch": 1370} {"train_loss": -36.02183151245117, "global_step": 165820, "epoch": 1370} {"train_loss": -39.14921951293945, "global_step": 165821, "epoch": 1370} {"train_loss": -38.691566467285156, "global_step": 165822, "epoch": 1370} {"train_loss": -38.21920394897461, "global_step": 165823, "epoch": 1370} {"train_loss": -38.85161209106445, "global_step": 165824, "epoch": 1370} {"train_loss": -38.448974609375, "global_step": 165825, "epoch": 1370} {"train_loss": -37.68572235107422, "global_step": 165826, "epoch": 1370} {"train_loss": -38.64562225341797, "global_step": 165827, "epoch": 1370} {"train_loss": -38.10689926147461, "global_step": 165828, "epoch": 1370} {"train_loss": -39.657447814941406, "global_step": 165829, "epoch": 1370} {"train_loss": -39.31095504760742, "global_step": 165830, "epoch": 1370} {"train_loss": -38.53530502319336, "global_step": 165831, "epoch": 1370} {"train_loss": -38.400123596191406, "global_step": 165832, "epoch": 1370} {"train_loss": -38.73490524291992, "global_step": 165833, "epoch": 1370} {"train_loss": -39.061370849609375, "global_step": 165834, "epoch": 1370} {"train_loss": -38.34401321411133, "global_step": 165835, "epoch": 1370} {"train_loss": -38.86128616333008, "global_step": 165836, "epoch": 1370} {"train_loss": -38.14951705932617, "global_step": 165837, "epoch": 1370} {"train_loss": -37.35796356201172, "global_step": 165838, "epoch": 1370} {"train_loss": -39.05141067504883, "global_step": 165839, "epoch": 1370} {"train_loss": -38.8072624206543, "global_step": 165840, "epoch": 1370} {"train_loss": -37.89052200317383, "global_step": 165841, "epoch": 1370} {"train_loss": -39.263668060302734, "global_step": 165842, "epoch": 1370} {"train_loss": -39.36501693725586, "global_step": 165843, "epoch": 1370} {"train_loss": -39.30808639526367, "global_step": 165844, "epoch": 1370} {"train_loss": -39.334041595458984, "global_step": 165845, "epoch": 1370} {"train_loss": -39.49966049194336, "global_step": 165846, "epoch": 1370} {"train_loss": -39.95209503173828, "global_step": 165847, "epoch": 1370} {"train_loss": -40.01988220214844, "global_step": 165848, "epoch": 1370} {"train_loss": -40.3099479675293, "global_step": 165849, "epoch": 1370} {"train_loss": -39.91716384887695, "global_step": 165850, "epoch": 1370} {"train_loss": -39.37750244140625, "global_step": 165851, "epoch": 1370} {"train_loss": -37.61752700805664, "global_step": 165852, "epoch": 1370} {"train_loss": -39.84830856323242, "global_step": 165853, "epoch": 1370} {"train_loss": -39.72450256347656, "global_step": 165854, "epoch": 1370} {"train_loss": -40.40501022338867, "global_step": 165855, "epoch": 1370} {"train_loss": -38.1172981262207, "global_step": 165856, "epoch": 1370} {"train_loss": -38.68996047973633, "global_step": 165857, "epoch": 1370} {"train_loss": -38.99293518066406, "global_step": 165858, "epoch": 1370} {"train_loss": -40.70732498168945, "global_step": 165859, "epoch": 1370} {"train_loss": -39.63225173950195, "global_step": 165860, "epoch": 1370} {"train_loss": -39.593135833740234, "global_step": 165861, "epoch": 1370} {"train_loss": -39.631038665771484, "global_step": 165862, "epoch": 1370} {"train_loss": -39.11445999145508, "global_step": 165863, "epoch": 1370} {"train_loss": -39.301998138427734, "global_step": 165864, "epoch": 1370} {"train_loss": -39.50001907348633, "global_step": 165865, "epoch": 1370} {"train_loss": -39.66022872924805, "global_step": 165866, "epoch": 1370} {"train_loss": -39.47732162475586, "global_step": 165867, "epoch": 1370} {"train_loss": -40.12395095825195, "global_step": 165868, "epoch": 1370} {"train_loss": -39.16535949707031, "global_step": 165869, "epoch": 1370} {"train_loss": -39.49577713012695, "global_step": 165870, "epoch": 1370} {"train_loss": -38.42217254638672, "global_step": 165871, "epoch": 1370} {"train_loss": -39.8969841003418, "global_step": 165872, "epoch": 1370} {"train_loss": -39.50094223022461, "global_step": 165873, "epoch": 1370} {"train_loss": -40.41526794433594, "global_step": 165874, "epoch": 1370} {"train_loss": -39.201351165771484, "global_step": 165875, "epoch": 1370} {"train_loss": -40.20341873168945, "global_step": 165876, "epoch": 1370} {"train_loss": -39.76825714111328, "global_step": 165877, "epoch": 1370} {"train_loss": -39.984371185302734, "global_step": 165878, "epoch": 1370} {"train_loss": -40.57304382324219, "global_step": 165879, "epoch": 1370} {"train_loss": -36.65032958984375, "global_step": 165880, "epoch": 1370} {"train_loss": -39.87299346923828, "global_step": 165881, "epoch": 1370} {"train_loss": -39.41585922241211, "global_step": 165882, "epoch": 1370} {"train_loss": -38.63740539550781, "global_step": 165883, "epoch": 1370} {"train_loss": -38.6526985168457, "global_step": 165884, "epoch": 1370} {"train_loss": -40.2502555847168, "global_step": 165885, "epoch": 1370} {"train_loss": -40.02558517456055, "global_step": 165886, "epoch": 1370} {"train_loss": -39.548744201660156, "global_step": 165887, "epoch": 1370} {"train_loss": -39.21342849731445, "global_step": 165888, "epoch": 1370} {"train_loss": -37.46295166015625, "global_step": 165889, "epoch": 1370} {"train_loss": -38.629607366136284, "global_step": 165890, "epoch": 1370, "val_loss": 2628725.5} {"train_loss": -38.07758331298828, "global_step": 165891, "epoch": 1371} {"train_loss": -40.1100959777832, "global_step": 165892, "epoch": 1371} {"train_loss": -36.103233337402344, "global_step": 165893, "epoch": 1371} {"train_loss": -40.340003967285156, "global_step": 165894, "epoch": 1371} {"train_loss": -37.90303421020508, "global_step": 165895, "epoch": 1371} {"train_loss": -39.87040328979492, "global_step": 165896, "epoch": 1371} {"train_loss": -38.817665100097656, "global_step": 165897, "epoch": 1371} {"train_loss": -32.432674407958984, "global_step": 165898, "epoch": 1371} {"train_loss": -40.086158752441406, "global_step": 165899, "epoch": 1371} {"train_loss": -37.12532424926758, "global_step": 165900, "epoch": 1371} {"train_loss": -36.11024856567383, "global_step": 165901, "epoch": 1371} {"train_loss": -35.49363327026367, "global_step": 165902, "epoch": 1371} {"train_loss": -38.02504348754883, "global_step": 165903, "epoch": 1371} {"train_loss": -36.449485778808594, "global_step": 165904, "epoch": 1371} {"train_loss": -37.91597366333008, "global_step": 165905, "epoch": 1371} {"train_loss": -37.61809158325195, "global_step": 165906, "epoch": 1371} {"train_loss": -35.661617279052734, "global_step": 165907, "epoch": 1371} {"train_loss": -34.35675811767578, "global_step": 165908, "epoch": 1371} {"train_loss": -38.03811264038086, "global_step": 165909, "epoch": 1371} {"train_loss": -38.0235481262207, "global_step": 165910, "epoch": 1371} {"train_loss": -36.3218879699707, "global_step": 165911, "epoch": 1371} {"train_loss": -37.56035232543945, "global_step": 165912, "epoch": 1371} {"train_loss": -30.5305233001709, "global_step": 165913, "epoch": 1371} {"train_loss": -32.95208740234375, "global_step": 165914, "epoch": 1371} {"train_loss": -34.253211975097656, "global_step": 165915, "epoch": 1371} {"train_loss": -31.463459014892578, "global_step": 165916, "epoch": 1371} {"train_loss": -34.81231689453125, "global_step": 165917, "epoch": 1371} {"train_loss": -32.822723388671875, "global_step": 165918, "epoch": 1371} {"train_loss": -36.90177536010742, "global_step": 165919, "epoch": 1371} {"train_loss": -36.25368118286133, "global_step": 165920, "epoch": 1371} {"train_loss": -33.1147575378418, "global_step": 165921, "epoch": 1371} {"train_loss": -34.17754364013672, "global_step": 165922, "epoch": 1371} {"train_loss": -34.107608795166016, "global_step": 165923, "epoch": 1371} {"train_loss": -33.825286865234375, "global_step": 165924, "epoch": 1371} {"train_loss": -36.58217239379883, "global_step": 165925, "epoch": 1371} {"train_loss": -34.031410217285156, "global_step": 165926, "epoch": 1371} {"train_loss": -35.23126983642578, "global_step": 165927, "epoch": 1371} {"train_loss": -37.15134811401367, "global_step": 165928, "epoch": 1371} {"train_loss": -36.73495864868164, "global_step": 165929, "epoch": 1371} {"train_loss": -36.482723236083984, "global_step": 165930, "epoch": 1371} {"train_loss": -37.5697135925293, "global_step": 165931, "epoch": 1371} {"train_loss": -36.054386138916016, "global_step": 165932, "epoch": 1371} {"train_loss": -38.047237396240234, "global_step": 165933, "epoch": 1371} {"train_loss": -36.81049346923828, "global_step": 165934, "epoch": 1371} {"train_loss": -37.44778060913086, "global_step": 165935, "epoch": 1371} {"train_loss": -38.36860275268555, "global_step": 165936, "epoch": 1371} {"train_loss": -36.99229049682617, "global_step": 165937, "epoch": 1371} {"train_loss": -38.4592399597168, "global_step": 165938, "epoch": 1371} {"train_loss": -38.8699951171875, "global_step": 165939, "epoch": 1371} {"train_loss": -38.52152633666992, "global_step": 165940, "epoch": 1371} {"train_loss": -39.47396469116211, "global_step": 165941, "epoch": 1371} {"train_loss": -35.92333984375, "global_step": 165942, "epoch": 1371} {"train_loss": -38.16365051269531, "global_step": 165943, "epoch": 1371} {"train_loss": -38.71122360229492, "global_step": 165944, "epoch": 1371} {"train_loss": -39.31793975830078, "global_step": 165945, "epoch": 1371} {"train_loss": -38.92341232299805, "global_step": 165946, "epoch": 1371} {"train_loss": -38.552852630615234, "global_step": 165947, "epoch": 1371} {"train_loss": -39.26688003540039, "global_step": 165948, "epoch": 1371} {"train_loss": -38.92503356933594, "global_step": 165949, "epoch": 1371} {"train_loss": -39.24357223510742, "global_step": 165950, "epoch": 1371} {"train_loss": -39.56504440307617, "global_step": 165951, "epoch": 1371} {"train_loss": -39.68056869506836, "global_step": 165952, "epoch": 1371} {"train_loss": -39.15183639526367, "global_step": 165953, "epoch": 1371} {"train_loss": -39.797237396240234, "global_step": 165954, "epoch": 1371} {"train_loss": -38.89728546142578, "global_step": 165955, "epoch": 1371} {"train_loss": -39.539947509765625, "global_step": 165956, "epoch": 1371} {"train_loss": -39.819732666015625, "global_step": 165957, "epoch": 1371} {"train_loss": -39.552120208740234, "global_step": 165958, "epoch": 1371} {"train_loss": -39.99935531616211, "global_step": 165959, "epoch": 1371} {"train_loss": -39.4283447265625, "global_step": 165960, "epoch": 1371} {"train_loss": -39.57063674926758, "global_step": 165961, "epoch": 1371} {"train_loss": -38.99833297729492, "global_step": 165962, "epoch": 1371} {"train_loss": -40.18427658081055, "global_step": 165963, "epoch": 1371} {"train_loss": -38.95713424682617, "global_step": 165964, "epoch": 1371} {"train_loss": -40.29811096191406, "global_step": 165965, "epoch": 1371} {"train_loss": -39.20431137084961, "global_step": 165966, "epoch": 1371} {"train_loss": -39.621944427490234, "global_step": 165967, "epoch": 1371} {"train_loss": -40.25129318237305, "global_step": 165968, "epoch": 1371} {"train_loss": -39.849056243896484, "global_step": 165969, "epoch": 1371} {"train_loss": -40.05603790283203, "global_step": 165970, "epoch": 1371} {"train_loss": -40.1875114440918, "global_step": 165971, "epoch": 1371} {"train_loss": -40.58718490600586, "global_step": 165972, "epoch": 1371} {"train_loss": -40.63843536376953, "global_step": 165973, "epoch": 1371} {"train_loss": -40.3509635925293, "global_step": 165974, "epoch": 1371} {"train_loss": -40.96743392944336, "global_step": 165975, "epoch": 1371} {"train_loss": -40.72543716430664, "global_step": 165976, "epoch": 1371} {"train_loss": -41.20736312866211, "global_step": 165977, "epoch": 1371} {"train_loss": -40.989051818847656, "global_step": 165978, "epoch": 1371} {"train_loss": -40.8377799987793, "global_step": 165979, "epoch": 1371} {"train_loss": -40.8731803894043, "global_step": 165980, "epoch": 1371} {"train_loss": -40.48417282104492, "global_step": 165981, "epoch": 1371} {"train_loss": -41.295108795166016, "global_step": 165982, "epoch": 1371} {"train_loss": -41.001216888427734, "global_step": 165983, "epoch": 1371} {"train_loss": -41.29059600830078, "global_step": 165984, "epoch": 1371} {"train_loss": -40.930843353271484, "global_step": 165985, "epoch": 1371} {"train_loss": -40.79158401489258, "global_step": 165986, "epoch": 1371} {"train_loss": -40.98940658569336, "global_step": 165987, "epoch": 1371} {"train_loss": -40.558204650878906, "global_step": 165988, "epoch": 1371} {"train_loss": -41.46491241455078, "global_step": 165989, "epoch": 1371} {"train_loss": -41.1544075012207, "global_step": 165990, "epoch": 1371} {"train_loss": -41.296688079833984, "global_step": 165991, "epoch": 1371} {"train_loss": -41.48253631591797, "global_step": 165992, "epoch": 1371} {"train_loss": -41.43526840209961, "global_step": 165993, "epoch": 1371} {"train_loss": -41.33500289916992, "global_step": 165994, "epoch": 1371} {"train_loss": -42.05292510986328, "global_step": 165995, "epoch": 1371} {"train_loss": -41.08144760131836, "global_step": 165996, "epoch": 1371} {"train_loss": -41.30491256713867, "global_step": 165997, "epoch": 1371} {"train_loss": -41.34756088256836, "global_step": 165998, "epoch": 1371} {"train_loss": -41.88731002807617, "global_step": 165999, "epoch": 1371} {"train_loss": -41.66845703125, "global_step": 166000, "epoch": 1371} {"train_loss": -41.059261322021484, "global_step": 166001, "epoch": 1371} {"train_loss": -41.445556640625, "global_step": 166002, "epoch": 1371} {"train_loss": -41.606964111328125, "global_step": 166003, "epoch": 1371} {"train_loss": -41.239925384521484, "global_step": 166004, "epoch": 1371} {"train_loss": -41.72871017456055, "global_step": 166005, "epoch": 1371} {"train_loss": -41.3995361328125, "global_step": 166006, "epoch": 1371} {"train_loss": -41.594905853271484, "global_step": 166007, "epoch": 1371} {"train_loss": -41.735164642333984, "global_step": 166008, "epoch": 1371} {"train_loss": -41.932430267333984, "global_step": 166009, "epoch": 1371} {"train_loss": -41.90786361694336, "global_step": 166010, "epoch": 1371} {"train_loss": -38.7429907459858, "global_step": 166011, "epoch": 1371, "val_loss": 2564719.5} {"train_loss": -39.79579544067383, "global_step": 166012, "epoch": 1372} {"train_loss": -41.36384963989258, "global_step": 166013, "epoch": 1372} {"train_loss": -42.0683708190918, "global_step": 166014, "epoch": 1372} {"train_loss": -42.39583969116211, "global_step": 166015, "epoch": 1372} {"train_loss": -41.599998474121094, "global_step": 166016, "epoch": 1372} {"train_loss": -41.21249008178711, "global_step": 166017, "epoch": 1372} {"train_loss": -40.57843017578125, "global_step": 166018, "epoch": 1372} {"train_loss": -40.31470489501953, "global_step": 166019, "epoch": 1372} {"train_loss": -42.08864212036133, "global_step": 166020, "epoch": 1372} {"train_loss": -39.48354721069336, "global_step": 166021, "epoch": 1372} {"train_loss": -40.704708099365234, "global_step": 166022, "epoch": 1372} {"train_loss": -41.32252883911133, "global_step": 166023, "epoch": 1372} {"train_loss": -39.589664459228516, "global_step": 166024, "epoch": 1372} {"train_loss": -41.38563919067383, "global_step": 166025, "epoch": 1372} {"train_loss": -40.85424041748047, "global_step": 166026, "epoch": 1372} {"train_loss": -40.329586029052734, "global_step": 166027, "epoch": 1372} {"train_loss": -40.72636032104492, "global_step": 166028, "epoch": 1372} {"train_loss": -41.647789001464844, "global_step": 166029, "epoch": 1372} {"train_loss": -39.718299865722656, "global_step": 166030, "epoch": 1372} {"train_loss": -40.872596740722656, "global_step": 166031, "epoch": 1372} {"train_loss": -41.75026321411133, "global_step": 166032, "epoch": 1372} {"train_loss": -39.95502853393555, "global_step": 166033, "epoch": 1372} {"train_loss": -40.30308532714844, "global_step": 166034, "epoch": 1372} {"train_loss": -40.99797439575195, "global_step": 166035, "epoch": 1372} {"train_loss": -41.03567123413086, "global_step": 166036, "epoch": 1372} {"train_loss": -40.646514892578125, "global_step": 166037, "epoch": 1372} {"train_loss": -39.2863655090332, "global_step": 166038, "epoch": 1372} {"train_loss": -40.909847259521484, "global_step": 166039, "epoch": 1372} {"train_loss": -40.46162033081055, "global_step": 166040, "epoch": 1372} {"train_loss": -39.519771575927734, "global_step": 166041, "epoch": 1372} {"train_loss": -41.67924118041992, "global_step": 166042, "epoch": 1372} {"train_loss": -40.276344299316406, "global_step": 166043, "epoch": 1372} {"train_loss": -41.0847053527832, "global_step": 166044, "epoch": 1372} {"train_loss": -40.40191650390625, "global_step": 166045, "epoch": 1372} {"train_loss": -39.59491729736328, "global_step": 166046, "epoch": 1372} {"train_loss": -40.975643157958984, "global_step": 166047, "epoch": 1372} {"train_loss": -39.95292282104492, "global_step": 166048, "epoch": 1372} {"train_loss": -40.76705551147461, "global_step": 166049, "epoch": 1372} {"train_loss": -38.616249084472656, "global_step": 166050, "epoch": 1372} {"train_loss": -41.42110824584961, "global_step": 166051, "epoch": 1372} {"train_loss": -39.655818939208984, "global_step": 166052, "epoch": 1372} {"train_loss": -40.87824249267578, "global_step": 166053, "epoch": 1372} {"train_loss": -41.0335807800293, "global_step": 166054, "epoch": 1372} {"train_loss": -40.526546478271484, "global_step": 166055, "epoch": 1372} {"train_loss": -40.397335052490234, "global_step": 166056, "epoch": 1372} {"train_loss": -40.86505126953125, "global_step": 166057, "epoch": 1372} {"train_loss": -39.67226028442383, "global_step": 166058, "epoch": 1372} {"train_loss": -41.20952224731445, "global_step": 166059, "epoch": 1372} {"train_loss": -41.33063507080078, "global_step": 166060, "epoch": 1372} {"train_loss": -40.1207389831543, "global_step": 166061, "epoch": 1372} {"train_loss": -40.297550201416016, "global_step": 166062, "epoch": 1372} {"train_loss": -40.54140853881836, "global_step": 166063, "epoch": 1372} {"train_loss": -39.57395553588867, "global_step": 166064, "epoch": 1372} {"train_loss": -40.3663215637207, "global_step": 166065, "epoch": 1372} {"train_loss": -40.408199310302734, "global_step": 166066, "epoch": 1372} {"train_loss": -39.93952560424805, "global_step": 166067, "epoch": 1372} {"train_loss": -40.93331527709961, "global_step": 166068, "epoch": 1372} {"train_loss": -38.95421600341797, "global_step": 166069, "epoch": 1372} {"train_loss": -40.580928802490234, "global_step": 166070, "epoch": 1372} {"train_loss": -40.26334762573242, "global_step": 166071, "epoch": 1372} {"train_loss": -40.3065299987793, "global_step": 166072, "epoch": 1372} {"train_loss": -40.377601623535156, "global_step": 166073, "epoch": 1372} {"train_loss": -40.288421630859375, "global_step": 166074, "epoch": 1372} {"train_loss": -40.906246185302734, "global_step": 166075, "epoch": 1372} {"train_loss": -40.04155731201172, "global_step": 166076, "epoch": 1372} {"train_loss": -41.36954879760742, "global_step": 166077, "epoch": 1372} {"train_loss": -40.15468215942383, "global_step": 166078, "epoch": 1372} {"train_loss": -40.51421356201172, "global_step": 166079, "epoch": 1372} {"train_loss": -40.65087890625, "global_step": 166080, "epoch": 1372} {"train_loss": -40.00461959838867, "global_step": 166081, "epoch": 1372} {"train_loss": -40.03449630737305, "global_step": 166082, "epoch": 1372} {"train_loss": -41.734466552734375, "global_step": 166083, "epoch": 1372} {"train_loss": -39.851234436035156, "global_step": 166084, "epoch": 1372} {"train_loss": -40.92774200439453, "global_step": 166085, "epoch": 1372} {"train_loss": -40.86016082763672, "global_step": 166086, "epoch": 1372} {"train_loss": -40.67684555053711, "global_step": 166087, "epoch": 1372} {"train_loss": -40.762386322021484, "global_step": 166088, "epoch": 1372} {"train_loss": -40.7503776550293, "global_step": 166089, "epoch": 1372} {"train_loss": -40.496150970458984, "global_step": 166090, "epoch": 1372} {"train_loss": -40.16990280151367, "global_step": 166091, "epoch": 1372} {"train_loss": -41.15256881713867, "global_step": 166092, "epoch": 1372} {"train_loss": -41.2396240234375, "global_step": 166093, "epoch": 1372} {"train_loss": -40.90250778198242, "global_step": 166094, "epoch": 1372} {"train_loss": -40.550636291503906, "global_step": 166095, "epoch": 1372} {"train_loss": -40.53641128540039, "global_step": 166096, "epoch": 1372} {"train_loss": -40.18783187866211, "global_step": 166097, "epoch": 1372} {"train_loss": -40.326759338378906, "global_step": 166098, "epoch": 1372} {"train_loss": -39.38554763793945, "global_step": 166099, "epoch": 1372} {"train_loss": -39.417640686035156, "global_step": 166100, "epoch": 1372} {"train_loss": -40.867958068847656, "global_step": 166101, "epoch": 1372} {"train_loss": -39.36820602416992, "global_step": 166102, "epoch": 1372} {"train_loss": -39.650047302246094, "global_step": 166103, "epoch": 1372} {"train_loss": -39.51569366455078, "global_step": 166104, "epoch": 1372} {"train_loss": -41.01497268676758, "global_step": 166105, "epoch": 1372} {"train_loss": -39.8449592590332, "global_step": 166106, "epoch": 1372} {"train_loss": -40.31463623046875, "global_step": 166107, "epoch": 1372} {"train_loss": -40.51346969604492, "global_step": 166108, "epoch": 1372} {"train_loss": -40.451839447021484, "global_step": 166109, "epoch": 1372} {"train_loss": -41.60293197631836, "global_step": 166110, "epoch": 1372} {"train_loss": -41.26150894165039, "global_step": 166111, "epoch": 1372} {"train_loss": -39.912147521972656, "global_step": 166112, "epoch": 1372} {"train_loss": -40.484657287597656, "global_step": 166113, "epoch": 1372} {"train_loss": -39.70481491088867, "global_step": 166114, "epoch": 1372} {"train_loss": -40.23166275024414, "global_step": 166115, "epoch": 1372} {"train_loss": -38.77286911010742, "global_step": 166116, "epoch": 1372} {"train_loss": -40.8011360168457, "global_step": 166117, "epoch": 1372} {"train_loss": -39.18413543701172, "global_step": 166118, "epoch": 1372} {"train_loss": -40.00007629394531, "global_step": 166119, "epoch": 1372} {"train_loss": -39.25539779663086, "global_step": 166120, "epoch": 1372} {"train_loss": -39.83559799194336, "global_step": 166121, "epoch": 1372} {"train_loss": -38.90690231323242, "global_step": 166122, "epoch": 1372} {"train_loss": -38.81022644042969, "global_step": 166123, "epoch": 1372} {"train_loss": -40.49813461303711, "global_step": 166124, "epoch": 1372} {"train_loss": -39.50584030151367, "global_step": 166125, "epoch": 1372} {"train_loss": -40.70068359375, "global_step": 166126, "epoch": 1372} {"train_loss": -39.5374755859375, "global_step": 166127, "epoch": 1372} {"train_loss": -40.923274993896484, "global_step": 166128, "epoch": 1372} {"train_loss": -39.56694793701172, "global_step": 166129, "epoch": 1372} {"train_loss": -41.458526611328125, "global_step": 166130, "epoch": 1372} {"train_loss": -40.068363189697266, "global_step": 166131, "epoch": 1372} {"train_loss": -40.43807961329941, "global_step": 166132, "epoch": 1372, "val_loss": 2633347.25} {"train_loss": -39.18080520629883, "global_step": 166133, "epoch": 1373} {"train_loss": -39.317684173583984, "global_step": 166134, "epoch": 1373} {"train_loss": -40.053585052490234, "global_step": 166135, "epoch": 1373} {"train_loss": -41.18737030029297, "global_step": 166136, "epoch": 1373} {"train_loss": -41.1308479309082, "global_step": 166137, "epoch": 1373} {"train_loss": -40.82655715942383, "global_step": 166138, "epoch": 1373} {"train_loss": -39.58132553100586, "global_step": 166139, "epoch": 1373} {"train_loss": -39.556312561035156, "global_step": 166140, "epoch": 1373} {"train_loss": -40.22967529296875, "global_step": 166141, "epoch": 1373} {"train_loss": -41.112545013427734, "global_step": 166142, "epoch": 1373} {"train_loss": -41.322792053222656, "global_step": 166143, "epoch": 1373} {"train_loss": -41.568626403808594, "global_step": 166144, "epoch": 1373} {"train_loss": -41.28181076049805, "global_step": 166145, "epoch": 1373} {"train_loss": -40.62757110595703, "global_step": 166146, "epoch": 1373} {"train_loss": -41.024898529052734, "global_step": 166147, "epoch": 1373} {"train_loss": -41.620452880859375, "global_step": 166148, "epoch": 1373} {"train_loss": -41.6995849609375, "global_step": 166149, "epoch": 1373} {"train_loss": -41.31583786010742, "global_step": 166150, "epoch": 1373} {"train_loss": -40.4146728515625, "global_step": 166151, "epoch": 1373} {"train_loss": -41.87173080444336, "global_step": 166152, "epoch": 1373} {"train_loss": -41.91394805908203, "global_step": 166153, "epoch": 1373} {"train_loss": -40.76136016845703, "global_step": 166154, "epoch": 1373} {"train_loss": -41.20640182495117, "global_step": 166155, "epoch": 1373} {"train_loss": -41.71659469604492, "global_step": 166156, "epoch": 1373} {"train_loss": -42.05216598510742, "global_step": 166157, "epoch": 1373} {"train_loss": -41.15960693359375, "global_step": 166158, "epoch": 1373} {"train_loss": -40.94731140136719, "global_step": 166159, "epoch": 1373} {"train_loss": -41.76118087768555, "global_step": 166160, "epoch": 1373} {"train_loss": -41.89784622192383, "global_step": 166161, "epoch": 1373} {"train_loss": -42.147071838378906, "global_step": 166162, "epoch": 1373} {"train_loss": -41.44327926635742, "global_step": 166163, "epoch": 1373} {"train_loss": -41.33144760131836, "global_step": 166164, "epoch": 1373} {"train_loss": -41.05072784423828, "global_step": 166165, "epoch": 1373} {"train_loss": -41.125667572021484, "global_step": 166166, "epoch": 1373} {"train_loss": -40.86350631713867, "global_step": 166167, "epoch": 1373} {"train_loss": -40.78239059448242, "global_step": 166168, "epoch": 1373} {"train_loss": -39.032752990722656, "global_step": 166169, "epoch": 1373} {"train_loss": -40.64616775512695, "global_step": 166170, "epoch": 1373} {"train_loss": -40.75460433959961, "global_step": 166171, "epoch": 1373} {"train_loss": -40.68378448486328, "global_step": 166172, "epoch": 1373} {"train_loss": -39.997554779052734, "global_step": 166173, "epoch": 1373} {"train_loss": -39.67031478881836, "global_step": 166174, "epoch": 1373} {"train_loss": -40.78881072998047, "global_step": 166175, "epoch": 1373} {"train_loss": -38.59332275390625, "global_step": 166176, "epoch": 1373} {"train_loss": -41.805625915527344, "global_step": 166177, "epoch": 1373} {"train_loss": -40.36257553100586, "global_step": 166178, "epoch": 1373} {"train_loss": -37.768394470214844, "global_step": 166179, "epoch": 1373} {"train_loss": -37.901344299316406, "global_step": 166180, "epoch": 1373} {"train_loss": -39.153804779052734, "global_step": 166181, "epoch": 1373} {"train_loss": -38.421180725097656, "global_step": 166182, "epoch": 1373} {"train_loss": -38.145259857177734, "global_step": 166183, "epoch": 1373} {"train_loss": -39.4101676940918, "global_step": 166184, "epoch": 1373} {"train_loss": -39.000328063964844, "global_step": 166185, "epoch": 1373} {"train_loss": -39.49300765991211, "global_step": 166186, "epoch": 1373} {"train_loss": -39.584564208984375, "global_step": 166187, "epoch": 1373} {"train_loss": -39.582801818847656, "global_step": 166188, "epoch": 1373} {"train_loss": -39.69278335571289, "global_step": 166189, "epoch": 1373} {"train_loss": -40.1676139831543, "global_step": 166190, "epoch": 1373} {"train_loss": -39.74515151977539, "global_step": 166191, "epoch": 1373} {"train_loss": -40.877742767333984, "global_step": 166192, "epoch": 1373} {"train_loss": -40.32338333129883, "global_step": 166193, "epoch": 1373} {"train_loss": -39.9165153503418, "global_step": 166194, "epoch": 1373} {"train_loss": -41.04145431518555, "global_step": 166195, "epoch": 1373} {"train_loss": -39.97883224487305, "global_step": 166196, "epoch": 1373} {"train_loss": -39.911659240722656, "global_step": 166197, "epoch": 1373} {"train_loss": -40.9196891784668, "global_step": 166198, "epoch": 1373} {"train_loss": -40.359928131103516, "global_step": 166199, "epoch": 1373} {"train_loss": -41.334686279296875, "global_step": 166200, "epoch": 1373} {"train_loss": -41.115875244140625, "global_step": 166201, "epoch": 1373} {"train_loss": -40.83726119995117, "global_step": 166202, "epoch": 1373} {"train_loss": -41.33395004272461, "global_step": 166203, "epoch": 1373} {"train_loss": -41.041194915771484, "global_step": 166204, "epoch": 1373} {"train_loss": -41.30078125, "global_step": 166205, "epoch": 1373} {"train_loss": -40.887359619140625, "global_step": 166206, "epoch": 1373} {"train_loss": -41.58195877075195, "global_step": 166207, "epoch": 1373} {"train_loss": -41.24931716918945, "global_step": 166208, "epoch": 1373} {"train_loss": -41.80055618286133, "global_step": 166209, "epoch": 1373} {"train_loss": -41.71689987182617, "global_step": 166210, "epoch": 1373} {"train_loss": -41.063079833984375, "global_step": 166211, "epoch": 1373} {"train_loss": -41.284706115722656, "global_step": 166212, "epoch": 1373} {"train_loss": -40.57228088378906, "global_step": 166213, "epoch": 1373} {"train_loss": -40.29884338378906, "global_step": 166214, "epoch": 1373} {"train_loss": -41.27330780029297, "global_step": 166215, "epoch": 1373} {"train_loss": -41.87196350097656, "global_step": 166216, "epoch": 1373} {"train_loss": -41.0733642578125, "global_step": 166217, "epoch": 1373} {"train_loss": -41.6097526550293, "global_step": 166218, "epoch": 1373} {"train_loss": -41.299964904785156, "global_step": 166219, "epoch": 1373} {"train_loss": -41.3351936340332, "global_step": 166220, "epoch": 1373} {"train_loss": -41.7408332824707, "global_step": 166221, "epoch": 1373} {"train_loss": -41.17350387573242, "global_step": 166222, "epoch": 1373} {"train_loss": -41.04384231567383, "global_step": 166223, "epoch": 1373} {"train_loss": -41.73625946044922, "global_step": 166224, "epoch": 1373} {"train_loss": -41.38654708862305, "global_step": 166225, "epoch": 1373} {"train_loss": -41.534847259521484, "global_step": 166226, "epoch": 1373} {"train_loss": -41.4312744140625, "global_step": 166227, "epoch": 1373} {"train_loss": -41.57935333251953, "global_step": 166228, "epoch": 1373} {"train_loss": -41.2978401184082, "global_step": 166229, "epoch": 1373} {"train_loss": -41.6442756652832, "global_step": 166230, "epoch": 1373} {"train_loss": -41.95942687988281, "global_step": 166231, "epoch": 1373} {"train_loss": -41.962581634521484, "global_step": 166232, "epoch": 1373} {"train_loss": -41.43994903564453, "global_step": 166233, "epoch": 1373} {"train_loss": -41.332584381103516, "global_step": 166234, "epoch": 1373} {"train_loss": -40.94889450073242, "global_step": 166235, "epoch": 1373} {"train_loss": -40.67140579223633, "global_step": 166236, "epoch": 1373} {"train_loss": -40.00172805786133, "global_step": 166237, "epoch": 1373} {"train_loss": -41.8828010559082, "global_step": 166238, "epoch": 1373} {"train_loss": -41.5596923828125, "global_step": 166239, "epoch": 1373} {"train_loss": -40.95701217651367, "global_step": 166240, "epoch": 1373} {"train_loss": -40.13042449951172, "global_step": 166241, "epoch": 1373} {"train_loss": -41.1962776184082, "global_step": 166242, "epoch": 1373} {"train_loss": -40.90102767944336, "global_step": 166243, "epoch": 1373} {"train_loss": -39.738826751708984, "global_step": 166244, "epoch": 1373} {"train_loss": -41.75947952270508, "global_step": 166245, "epoch": 1373} {"train_loss": -41.255828857421875, "global_step": 166246, "epoch": 1373} {"train_loss": -40.18401336669922, "global_step": 166247, "epoch": 1373} {"train_loss": -41.5791130065918, "global_step": 166248, "epoch": 1373} {"train_loss": -41.38014602661133, "global_step": 166249, "epoch": 1373} {"train_loss": -40.29071044921875, "global_step": 166250, "epoch": 1373} {"train_loss": -41.281707763671875, "global_step": 166251, "epoch": 1373} {"train_loss": -39.7181510925293, "global_step": 166252, "epoch": 1373} {"train_loss": -40.778358175734844, "global_step": 166253, "epoch": 1373, "val_loss": 2571081.75} {"train_loss": -41.222206115722656, "global_step": 166254, "epoch": 1374} {"train_loss": -40.834110260009766, "global_step": 166255, "epoch": 1374} {"train_loss": -41.18516159057617, "global_step": 166256, "epoch": 1374} {"train_loss": -41.43994903564453, "global_step": 166257, "epoch": 1374} {"train_loss": -41.08951950073242, "global_step": 166258, "epoch": 1374} {"train_loss": -40.84954833984375, "global_step": 166259, "epoch": 1374} {"train_loss": -40.81968307495117, "global_step": 166260, "epoch": 1374} {"train_loss": -41.696746826171875, "global_step": 166261, "epoch": 1374} {"train_loss": -41.73125076293945, "global_step": 166262, "epoch": 1374} {"train_loss": -41.15886688232422, "global_step": 166263, "epoch": 1374} {"train_loss": -41.994361877441406, "global_step": 166264, "epoch": 1374} {"train_loss": -41.68684768676758, "global_step": 166265, "epoch": 1374} {"train_loss": -41.81699752807617, "global_step": 166266, "epoch": 1374} {"train_loss": -41.98221206665039, "global_step": 166267, "epoch": 1374} {"train_loss": -41.73802185058594, "global_step": 166268, "epoch": 1374} {"train_loss": -41.7684211730957, "global_step": 166269, "epoch": 1374} {"train_loss": -41.9515495300293, "global_step": 166270, "epoch": 1374} {"train_loss": -42.24943542480469, "global_step": 166271, "epoch": 1374} {"train_loss": -40.03419876098633, "global_step": 166272, "epoch": 1374} {"train_loss": -41.273353576660156, "global_step": 166273, "epoch": 1374} {"train_loss": -41.421478271484375, "global_step": 166274, "epoch": 1374} {"train_loss": -41.193206787109375, "global_step": 166275, "epoch": 1374} {"train_loss": -39.95941162109375, "global_step": 166276, "epoch": 1374} {"train_loss": -41.000667572021484, "global_step": 166277, "epoch": 1374} {"train_loss": -40.3383903503418, "global_step": 166278, "epoch": 1374} {"train_loss": -40.26476287841797, "global_step": 166279, "epoch": 1374} {"train_loss": -39.818416595458984, "global_step": 166280, "epoch": 1374} {"train_loss": -41.281715393066406, "global_step": 166281, "epoch": 1374} {"train_loss": -41.173683166503906, "global_step": 166282, "epoch": 1374} {"train_loss": -41.11280059814453, "global_step": 166283, "epoch": 1374} {"train_loss": -40.764522552490234, "global_step": 166284, "epoch": 1374} {"train_loss": -36.25662612915039, "global_step": 166285, "epoch": 1374} {"train_loss": -40.95293045043945, "global_step": 166286, "epoch": 1374} {"train_loss": -39.54148483276367, "global_step": 166287, "epoch": 1374} {"train_loss": -39.05891418457031, "global_step": 166288, "epoch": 1374} {"train_loss": -39.07243728637695, "global_step": 166289, "epoch": 1374} {"train_loss": -39.8723258972168, "global_step": 166290, "epoch": 1374} {"train_loss": -39.6779670715332, "global_step": 166291, "epoch": 1374} {"train_loss": -37.45021438598633, "global_step": 166292, "epoch": 1374} {"train_loss": -39.5344123840332, "global_step": 166293, "epoch": 1374} {"train_loss": -39.42795944213867, "global_step": 166294, "epoch": 1374} {"train_loss": -39.70844650268555, "global_step": 166295, "epoch": 1374} {"train_loss": -37.97735595703125, "global_step": 166296, "epoch": 1374} {"train_loss": -40.24164581298828, "global_step": 166297, "epoch": 1374} {"train_loss": -38.483123779296875, "global_step": 166298, "epoch": 1374} {"train_loss": -39.107818603515625, "global_step": 166299, "epoch": 1374} {"train_loss": -35.90932846069336, "global_step": 166300, "epoch": 1374} {"train_loss": -39.63422393798828, "global_step": 166301, "epoch": 1374} {"train_loss": -35.31976318359375, "global_step": 166302, "epoch": 1374} {"train_loss": -38.17106246948242, "global_step": 166303, "epoch": 1374} {"train_loss": -37.317169189453125, "global_step": 166304, "epoch": 1374} {"train_loss": -38.03876495361328, "global_step": 166305, "epoch": 1374} {"train_loss": -38.99524688720703, "global_step": 166306, "epoch": 1374} {"train_loss": -39.34455108642578, "global_step": 166307, "epoch": 1374} {"train_loss": -39.6906852722168, "global_step": 166308, "epoch": 1374} {"train_loss": -34.05103302001953, "global_step": 166309, "epoch": 1374} {"train_loss": -39.349422454833984, "global_step": 166310, "epoch": 1374} {"train_loss": -39.91534423828125, "global_step": 166311, "epoch": 1374} {"train_loss": -40.34634017944336, "global_step": 166312, "epoch": 1374} {"train_loss": -39.85874557495117, "global_step": 166313, "epoch": 1374} {"train_loss": -39.98719024658203, "global_step": 166314, "epoch": 1374} {"train_loss": -40.19783020019531, "global_step": 166315, "epoch": 1374} {"train_loss": -40.90974044799805, "global_step": 166316, "epoch": 1374} {"train_loss": -39.02217483520508, "global_step": 166317, "epoch": 1374} {"train_loss": -40.81064987182617, "global_step": 166318, "epoch": 1374} {"train_loss": -40.20290756225586, "global_step": 166319, "epoch": 1374} {"train_loss": -41.242095947265625, "global_step": 166320, "epoch": 1374} {"train_loss": -40.2477912902832, "global_step": 166321, "epoch": 1374} {"train_loss": -40.89311599731445, "global_step": 166322, "epoch": 1374} {"train_loss": -41.188316345214844, "global_step": 166323, "epoch": 1374} {"train_loss": -41.18573760986328, "global_step": 166324, "epoch": 1374} {"train_loss": -41.093204498291016, "global_step": 166325, "epoch": 1374} {"train_loss": -40.3341064453125, "global_step": 166326, "epoch": 1374} {"train_loss": -41.55302047729492, "global_step": 166327, "epoch": 1374} {"train_loss": -40.58495330810547, "global_step": 166328, "epoch": 1374} {"train_loss": -40.78681564331055, "global_step": 166329, "epoch": 1374} {"train_loss": -40.073974609375, "global_step": 166330, "epoch": 1374} {"train_loss": -41.023719787597656, "global_step": 166331, "epoch": 1374} {"train_loss": -41.25456237792969, "global_step": 166332, "epoch": 1374} {"train_loss": -40.964134216308594, "global_step": 166333, "epoch": 1374} {"train_loss": -41.08955001831055, "global_step": 166334, "epoch": 1374} {"train_loss": -41.94972229003906, "global_step": 166335, "epoch": 1374} {"train_loss": -41.00582504272461, "global_step": 166336, "epoch": 1374} {"train_loss": -41.60640335083008, "global_step": 166337, "epoch": 1374} {"train_loss": -41.36753463745117, "global_step": 166338, "epoch": 1374} {"train_loss": -41.72528076171875, "global_step": 166339, "epoch": 1374} {"train_loss": -42.0290412902832, "global_step": 166340, "epoch": 1374} {"train_loss": -41.07307815551758, "global_step": 166341, "epoch": 1374} {"train_loss": -40.2987174987793, "global_step": 166342, "epoch": 1374} {"train_loss": -40.7662353515625, "global_step": 166343, "epoch": 1374} {"train_loss": -41.796630859375, "global_step": 166344, "epoch": 1374} {"train_loss": -40.884639739990234, "global_step": 166345, "epoch": 1374} {"train_loss": -40.055885314941406, "global_step": 166346, "epoch": 1374} {"train_loss": -39.17251205444336, "global_step": 166347, "epoch": 1374} {"train_loss": -40.36865997314453, "global_step": 166348, "epoch": 1374} {"train_loss": -41.34133529663086, "global_step": 166349, "epoch": 1374} {"train_loss": -41.08675003051758, "global_step": 166350, "epoch": 1374} {"train_loss": -39.50141525268555, "global_step": 166351, "epoch": 1374} {"train_loss": -39.11344528198242, "global_step": 166352, "epoch": 1374} {"train_loss": -40.5854377746582, "global_step": 166353, "epoch": 1374} {"train_loss": -41.088661193847656, "global_step": 166354, "epoch": 1374} {"train_loss": -39.102760314941406, "global_step": 166355, "epoch": 1374} {"train_loss": -41.13530349731445, "global_step": 166356, "epoch": 1374} {"train_loss": -40.55813980102539, "global_step": 166357, "epoch": 1374} {"train_loss": -40.18217849731445, "global_step": 166358, "epoch": 1374} {"train_loss": -41.189449310302734, "global_step": 166359, "epoch": 1374} {"train_loss": -41.54834747314453, "global_step": 166360, "epoch": 1374} {"train_loss": -41.6811637878418, "global_step": 166361, "epoch": 1374} {"train_loss": -41.350799560546875, "global_step": 166362, "epoch": 1374} {"train_loss": -41.810401916503906, "global_step": 166363, "epoch": 1374} {"train_loss": -41.273372650146484, "global_step": 166364, "epoch": 1374} {"train_loss": -40.04999542236328, "global_step": 166365, "epoch": 1374} {"train_loss": -40.765052795410156, "global_step": 166366, "epoch": 1374} {"train_loss": -39.91029739379883, "global_step": 166367, "epoch": 1374} {"train_loss": -40.706478118896484, "global_step": 166368, "epoch": 1374} {"train_loss": -41.52976608276367, "global_step": 166369, "epoch": 1374} {"train_loss": -40.714935302734375, "global_step": 166370, "epoch": 1374} {"train_loss": -39.91743850708008, "global_step": 166371, "epoch": 1374} {"train_loss": -39.267730712890625, "global_step": 166372, "epoch": 1374} {"train_loss": -40.74274826049805, "global_step": 166373, "epoch": 1374} {"train_loss": -40.373569646157506, "global_step": 166374, "epoch": 1374, "val_loss": 2623910.0} {"train_loss": -39.310550689697266, "global_step": 166375, "epoch": 1375} {"train_loss": -40.10673904418945, "global_step": 166376, "epoch": 1375} {"train_loss": -40.665374755859375, "global_step": 166377, "epoch": 1375} {"train_loss": -39.21857833862305, "global_step": 166378, "epoch": 1375} {"train_loss": -41.221046447753906, "global_step": 166379, "epoch": 1375} {"train_loss": -40.18821334838867, "global_step": 166380, "epoch": 1375} {"train_loss": -40.76968002319336, "global_step": 166381, "epoch": 1375} {"train_loss": -41.017147064208984, "global_step": 166382, "epoch": 1375} {"train_loss": -40.32754135131836, "global_step": 166383, "epoch": 1375} {"train_loss": -41.5213508605957, "global_step": 166384, "epoch": 1375} {"train_loss": -41.1213493347168, "global_step": 166385, "epoch": 1375} {"train_loss": -40.747928619384766, "global_step": 166386, "epoch": 1375} {"train_loss": -40.57255554199219, "global_step": 166387, "epoch": 1375} {"train_loss": -40.6366081237793, "global_step": 166388, "epoch": 1375} {"train_loss": -40.650386810302734, "global_step": 166389, "epoch": 1375} {"train_loss": -41.46017074584961, "global_step": 166390, "epoch": 1375} {"train_loss": -40.76234817504883, "global_step": 166391, "epoch": 1375} {"train_loss": -41.11243438720703, "global_step": 166392, "epoch": 1375} {"train_loss": -42.04104995727539, "global_step": 166393, "epoch": 1375} {"train_loss": -41.47300338745117, "global_step": 166394, "epoch": 1375} {"train_loss": -41.52451705932617, "global_step": 166395, "epoch": 1375} {"train_loss": -41.610565185546875, "global_step": 166396, "epoch": 1375} {"train_loss": -41.553890228271484, "global_step": 166397, "epoch": 1375} {"train_loss": -41.72617721557617, "global_step": 166398, "epoch": 1375} {"train_loss": -41.64476776123047, "global_step": 166399, "epoch": 1375} {"train_loss": -41.32737350463867, "global_step": 166400, "epoch": 1375} {"train_loss": -41.284061431884766, "global_step": 166401, "epoch": 1375} {"train_loss": -41.60713577270508, "global_step": 166402, "epoch": 1375} {"train_loss": -41.77630615234375, "global_step": 166403, "epoch": 1375} {"train_loss": -41.61589431762695, "global_step": 166404, "epoch": 1375} {"train_loss": -41.92104721069336, "global_step": 166405, "epoch": 1375} {"train_loss": -40.84821701049805, "global_step": 166406, "epoch": 1375} {"train_loss": -41.6572380065918, "global_step": 166407, "epoch": 1375} {"train_loss": -41.02000045776367, "global_step": 166408, "epoch": 1375} {"train_loss": -41.39443588256836, "global_step": 166409, "epoch": 1375} {"train_loss": -42.15774154663086, "global_step": 166410, "epoch": 1375} {"train_loss": -41.23141860961914, "global_step": 166411, "epoch": 1375} {"train_loss": -41.416996002197266, "global_step": 166412, "epoch": 1375} {"train_loss": -41.9989128112793, "global_step": 166413, "epoch": 1375} {"train_loss": -42.13886642456055, "global_step": 166414, "epoch": 1375} {"train_loss": -41.458675384521484, "global_step": 166415, "epoch": 1375} {"train_loss": -41.00767135620117, "global_step": 166416, "epoch": 1375} {"train_loss": -41.62104797363281, "global_step": 166417, "epoch": 1375} {"train_loss": -41.089595794677734, "global_step": 166418, "epoch": 1375} {"train_loss": -41.57955551147461, "global_step": 166419, "epoch": 1375} {"train_loss": -41.6630859375, "global_step": 166420, "epoch": 1375} {"train_loss": -42.04203414916992, "global_step": 166421, "epoch": 1375} {"train_loss": -41.56233215332031, "global_step": 166422, "epoch": 1375} {"train_loss": -40.870845794677734, "global_step": 166423, "epoch": 1375} {"train_loss": -40.63637924194336, "global_step": 166424, "epoch": 1375} {"train_loss": -41.145606994628906, "global_step": 166425, "epoch": 1375} {"train_loss": -42.58222198486328, "global_step": 166426, "epoch": 1375} {"train_loss": -40.41213607788086, "global_step": 166427, "epoch": 1375} {"train_loss": -39.126991271972656, "global_step": 166428, "epoch": 1375} {"train_loss": -41.84893798828125, "global_step": 166429, "epoch": 1375} {"train_loss": -36.58750915527344, "global_step": 166430, "epoch": 1375} {"train_loss": -36.429073333740234, "global_step": 166431, "epoch": 1375} {"train_loss": -33.32177734375, "global_step": 166432, "epoch": 1375} {"train_loss": -35.76060485839844, "global_step": 166433, "epoch": 1375} {"train_loss": -34.0426139831543, "global_step": 166434, "epoch": 1375} {"train_loss": -39.650482177734375, "global_step": 166435, "epoch": 1375} {"train_loss": -35.74222946166992, "global_step": 166436, "epoch": 1375} {"train_loss": -33.742366790771484, "global_step": 166437, "epoch": 1375} {"train_loss": -31.802978515625, "global_step": 166438, "epoch": 1375} {"train_loss": -29.541528701782227, "global_step": 166439, "epoch": 1375} {"train_loss": -37.660491943359375, "global_step": 166440, "epoch": 1375} {"train_loss": -37.79885482788086, "global_step": 166441, "epoch": 1375} {"train_loss": -35.905616760253906, "global_step": 166442, "epoch": 1375} {"train_loss": -37.301734924316406, "global_step": 166443, "epoch": 1375} {"train_loss": -36.33734893798828, "global_step": 166444, "epoch": 1375} {"train_loss": -35.1773796081543, "global_step": 166445, "epoch": 1375} {"train_loss": -35.21773910522461, "global_step": 166446, "epoch": 1375} {"train_loss": -35.82819747924805, "global_step": 166447, "epoch": 1375} {"train_loss": -37.668331146240234, "global_step": 166448, "epoch": 1375} {"train_loss": -37.83953094482422, "global_step": 166449, "epoch": 1375} {"train_loss": -35.23219680786133, "global_step": 166450, "epoch": 1375} {"train_loss": -38.19479751586914, "global_step": 166451, "epoch": 1375} {"train_loss": -37.18507385253906, "global_step": 166452, "epoch": 1375} {"train_loss": -38.01215362548828, "global_step": 166453, "epoch": 1375} {"train_loss": -38.89604568481445, "global_step": 166454, "epoch": 1375} {"train_loss": -39.12141799926758, "global_step": 166455, "epoch": 1375} {"train_loss": -39.19071578979492, "global_step": 166456, "epoch": 1375} {"train_loss": -38.7971305847168, "global_step": 166457, "epoch": 1375} {"train_loss": -40.76019287109375, "global_step": 166458, "epoch": 1375} {"train_loss": -39.665794372558594, "global_step": 166459, "epoch": 1375} {"train_loss": -40.278926849365234, "global_step": 166460, "epoch": 1375} {"train_loss": -38.79885482788086, "global_step": 166461, "epoch": 1375} {"train_loss": -40.692138671875, "global_step": 166462, "epoch": 1375} {"train_loss": -39.48612976074219, "global_step": 166463, "epoch": 1375} {"train_loss": -40.80252456665039, "global_step": 166464, "epoch": 1375} {"train_loss": -40.44190979003906, "global_step": 166465, "epoch": 1375} {"train_loss": -40.40465545654297, "global_step": 166466, "epoch": 1375} {"train_loss": -41.01340866088867, "global_step": 166467, "epoch": 1375} {"train_loss": -40.61555099487305, "global_step": 166468, "epoch": 1375} {"train_loss": -41.19682693481445, "global_step": 166469, "epoch": 1375} {"train_loss": -40.589447021484375, "global_step": 166470, "epoch": 1375} {"train_loss": -41.07872009277344, "global_step": 166471, "epoch": 1375} {"train_loss": -40.819488525390625, "global_step": 166472, "epoch": 1375} {"train_loss": -40.9964485168457, "global_step": 166473, "epoch": 1375} {"train_loss": -40.95695114135742, "global_step": 166474, "epoch": 1375} {"train_loss": -41.22089385986328, "global_step": 166475, "epoch": 1375} {"train_loss": -41.27048873901367, "global_step": 166476, "epoch": 1375} {"train_loss": -41.14948654174805, "global_step": 166477, "epoch": 1375} {"train_loss": -41.78813552856445, "global_step": 166478, "epoch": 1375} {"train_loss": -41.032997131347656, "global_step": 166479, "epoch": 1375} {"train_loss": -41.5903205871582, "global_step": 166480, "epoch": 1375} {"train_loss": -41.25130844116211, "global_step": 166481, "epoch": 1375} {"train_loss": -41.34862518310547, "global_step": 166482, "epoch": 1375} {"train_loss": -41.6860466003418, "global_step": 166483, "epoch": 1375} {"train_loss": -41.12452697753906, "global_step": 166484, "epoch": 1375} {"train_loss": -41.8475227355957, "global_step": 166485, "epoch": 1375} {"train_loss": -41.3944206237793, "global_step": 166486, "epoch": 1375} {"train_loss": -41.56820297241211, "global_step": 166487, "epoch": 1375} {"train_loss": -41.69074630737305, "global_step": 166488, "epoch": 1375} {"train_loss": -41.75162887573242, "global_step": 166489, "epoch": 1375} {"train_loss": -41.50445556640625, "global_step": 166490, "epoch": 1375} {"train_loss": -41.87310791015625, "global_step": 166491, "epoch": 1375} {"train_loss": -41.75370407104492, "global_step": 166492, "epoch": 1375} {"train_loss": -41.87722396850586, "global_step": 166493, "epoch": 1375} {"train_loss": -42.21415328979492, "global_step": 166494, "epoch": 1375} {"train_loss": -40.03537871620872, "global_step": 166495, "epoch": 1375, "val_loss": 2551011.5} {"train_loss": -41.75910186767578, "global_step": 166496, "epoch": 1376} {"train_loss": -41.98590850830078, "global_step": 166497, "epoch": 1376} {"train_loss": -42.09370803833008, "global_step": 166498, "epoch": 1376} {"train_loss": -41.431434631347656, "global_step": 166499, "epoch": 1376} {"train_loss": -41.05271530151367, "global_step": 166500, "epoch": 1376} {"train_loss": -40.880367279052734, "global_step": 166501, "epoch": 1376} {"train_loss": -42.17765426635742, "global_step": 166502, "epoch": 1376} {"train_loss": -41.61194610595703, "global_step": 166503, "epoch": 1376} {"train_loss": -40.5413932800293, "global_step": 166504, "epoch": 1376} {"train_loss": -40.80605697631836, "global_step": 166505, "epoch": 1376} {"train_loss": -41.728126525878906, "global_step": 166506, "epoch": 1376} {"train_loss": -41.34225082397461, "global_step": 166507, "epoch": 1376} {"train_loss": -41.028072357177734, "global_step": 166508, "epoch": 1376} {"train_loss": -40.986572265625, "global_step": 166509, "epoch": 1376} {"train_loss": -42.0740852355957, "global_step": 166510, "epoch": 1376} {"train_loss": -41.5057373046875, "global_step": 166511, "epoch": 1376} {"train_loss": -40.91938781738281, "global_step": 166512, "epoch": 1376} {"train_loss": -41.01599884033203, "global_step": 166513, "epoch": 1376} {"train_loss": -40.165462493896484, "global_step": 166514, "epoch": 1376} {"train_loss": -40.90922164916992, "global_step": 166515, "epoch": 1376} {"train_loss": -42.30595779418945, "global_step": 166516, "epoch": 1376} {"train_loss": -41.69963836669922, "global_step": 166517, "epoch": 1376} {"train_loss": -40.5166130065918, "global_step": 166518, "epoch": 1376} {"train_loss": -41.188541412353516, "global_step": 166519, "epoch": 1376} {"train_loss": -41.71455764770508, "global_step": 166520, "epoch": 1376} {"train_loss": -42.09577178955078, "global_step": 166521, "epoch": 1376} {"train_loss": -41.977935791015625, "global_step": 166522, "epoch": 1376} {"train_loss": -41.78791427612305, "global_step": 166523, "epoch": 1376} {"train_loss": -42.00042724609375, "global_step": 166524, "epoch": 1376} {"train_loss": -41.86445236206055, "global_step": 166525, "epoch": 1376} {"train_loss": -42.17463684082031, "global_step": 166526, "epoch": 1376} {"train_loss": -42.07180404663086, "global_step": 166527, "epoch": 1376} {"train_loss": -41.65541076660156, "global_step": 166528, "epoch": 1376} {"train_loss": -42.160621643066406, "global_step": 166529, "epoch": 1376} {"train_loss": -42.48331832885742, "global_step": 166530, "epoch": 1376} {"train_loss": -41.68979263305664, "global_step": 166531, "epoch": 1376} {"train_loss": -42.10264205932617, "global_step": 166532, "epoch": 1376} {"train_loss": -42.262699127197266, "global_step": 166533, "epoch": 1376} {"train_loss": -42.36149597167969, "global_step": 166534, "epoch": 1376} {"train_loss": -42.076908111572266, "global_step": 166535, "epoch": 1376} {"train_loss": -42.587432861328125, "global_step": 166536, "epoch": 1376} {"train_loss": -42.50094223022461, "global_step": 166537, "epoch": 1376} {"train_loss": -42.118804931640625, "global_step": 166538, "epoch": 1376} {"train_loss": -41.783790588378906, "global_step": 166539, "epoch": 1376} {"train_loss": -41.64387893676758, "global_step": 166540, "epoch": 1376} {"train_loss": -41.20671463012695, "global_step": 166541, "epoch": 1376} {"train_loss": -42.57831573486328, "global_step": 166542, "epoch": 1376} {"train_loss": -42.33416748046875, "global_step": 166543, "epoch": 1376} {"train_loss": -41.84892272949219, "global_step": 166544, "epoch": 1376} {"train_loss": -42.33998489379883, "global_step": 166545, "epoch": 1376} {"train_loss": -42.00545883178711, "global_step": 166546, "epoch": 1376} {"train_loss": -42.102901458740234, "global_step": 166547, "epoch": 1376} {"train_loss": -41.69306182861328, "global_step": 166548, "epoch": 1376} {"train_loss": -42.14432907104492, "global_step": 166549, "epoch": 1376} {"train_loss": -40.6669921875, "global_step": 166550, "epoch": 1376} {"train_loss": -39.596046447753906, "global_step": 166551, "epoch": 1376} {"train_loss": -41.18331527709961, "global_step": 166552, "epoch": 1376} {"train_loss": -41.65717315673828, "global_step": 166553, "epoch": 1376} {"train_loss": -41.188697814941406, "global_step": 166554, "epoch": 1376} {"train_loss": -41.353851318359375, "global_step": 166555, "epoch": 1376} {"train_loss": -41.45337677001953, "global_step": 166556, "epoch": 1376} {"train_loss": -41.9599494934082, "global_step": 166557, "epoch": 1376} {"train_loss": -41.990718841552734, "global_step": 166558, "epoch": 1376} {"train_loss": -41.50819778442383, "global_step": 166559, "epoch": 1376} {"train_loss": -41.52351379394531, "global_step": 166560, "epoch": 1376} {"train_loss": -42.22332763671875, "global_step": 166561, "epoch": 1376} {"train_loss": -41.317867279052734, "global_step": 166562, "epoch": 1376} {"train_loss": -40.52335739135742, "global_step": 166563, "epoch": 1376} {"train_loss": -41.36568069458008, "global_step": 166564, "epoch": 1376} {"train_loss": -40.65874481201172, "global_step": 166565, "epoch": 1376} {"train_loss": -41.97133255004883, "global_step": 166566, "epoch": 1376} {"train_loss": -41.7504997253418, "global_step": 166567, "epoch": 1376} {"train_loss": -40.69405746459961, "global_step": 166568, "epoch": 1376} {"train_loss": -38.90019607543945, "global_step": 166569, "epoch": 1376} {"train_loss": -40.72115707397461, "global_step": 166570, "epoch": 1376} {"train_loss": -41.28290939331055, "global_step": 166571, "epoch": 1376} {"train_loss": -40.97677230834961, "global_step": 166572, "epoch": 1376} {"train_loss": -40.99052429199219, "global_step": 166573, "epoch": 1376} {"train_loss": -40.8947639465332, "global_step": 166574, "epoch": 1376} {"train_loss": -40.46041488647461, "global_step": 166575, "epoch": 1376} {"train_loss": -40.81972885131836, "global_step": 166576, "epoch": 1376} {"train_loss": -40.24079513549805, "global_step": 166577, "epoch": 1376} {"train_loss": -41.08503341674805, "global_step": 166578, "epoch": 1376} {"train_loss": -41.005332946777344, "global_step": 166579, "epoch": 1376} {"train_loss": -41.87919235229492, "global_step": 166580, "epoch": 1376} {"train_loss": -41.5603141784668, "global_step": 166581, "epoch": 1376} {"train_loss": -40.967369079589844, "global_step": 166582, "epoch": 1376} {"train_loss": -41.17753982543945, "global_step": 166583, "epoch": 1376} {"train_loss": -39.377254486083984, "global_step": 166584, "epoch": 1376} {"train_loss": -41.651611328125, "global_step": 166585, "epoch": 1376} {"train_loss": -39.31996536254883, "global_step": 166586, "epoch": 1376} {"train_loss": -41.490447998046875, "global_step": 166587, "epoch": 1376} {"train_loss": -40.34426498413086, "global_step": 166588, "epoch": 1376} {"train_loss": -41.626583099365234, "global_step": 166589, "epoch": 1376} {"train_loss": -40.944068908691406, "global_step": 166590, "epoch": 1376} {"train_loss": -40.84965515136719, "global_step": 166591, "epoch": 1376} {"train_loss": -41.69236373901367, "global_step": 166592, "epoch": 1376} {"train_loss": -40.489803314208984, "global_step": 166593, "epoch": 1376} {"train_loss": -41.065528869628906, "global_step": 166594, "epoch": 1376} {"train_loss": -40.99060821533203, "global_step": 166595, "epoch": 1376} {"train_loss": -40.49504852294922, "global_step": 166596, "epoch": 1376} {"train_loss": -41.66020965576172, "global_step": 166597, "epoch": 1376} {"train_loss": -41.56147384643555, "global_step": 166598, "epoch": 1376} {"train_loss": -40.44589614868164, "global_step": 166599, "epoch": 1376} {"train_loss": -41.4857063293457, "global_step": 166600, "epoch": 1376} {"train_loss": -41.349342346191406, "global_step": 166601, "epoch": 1376} {"train_loss": -40.70330810546875, "global_step": 166602, "epoch": 1376} {"train_loss": -41.326351165771484, "global_step": 166603, "epoch": 1376} {"train_loss": -40.01540756225586, "global_step": 166604, "epoch": 1376} {"train_loss": -41.11416244506836, "global_step": 166605, "epoch": 1376} {"train_loss": -39.967281341552734, "global_step": 166606, "epoch": 1376} {"train_loss": -41.28837966918945, "global_step": 166607, "epoch": 1376} {"train_loss": -41.06122589111328, "global_step": 166608, "epoch": 1376} {"train_loss": -38.053443908691406, "global_step": 166609, "epoch": 1376} {"train_loss": -40.60072326660156, "global_step": 166610, "epoch": 1376} {"train_loss": -40.13622283935547, "global_step": 166611, "epoch": 1376} {"train_loss": -40.9855842590332, "global_step": 166612, "epoch": 1376} {"train_loss": -41.09682083129883, "global_step": 166613, "epoch": 1376} {"train_loss": -39.59596633911133, "global_step": 166614, "epoch": 1376} {"train_loss": -40.51209259033203, "global_step": 166615, "epoch": 1376} {"train_loss": -41.26776690522501, "global_step": 166616, "epoch": 1376, "val_loss": 2527464.75} {"train_loss": -41.79928207397461, "global_step": 166617, "epoch": 1377} {"train_loss": -39.24171829223633, "global_step": 166618, "epoch": 1377} {"train_loss": -40.765159606933594, "global_step": 166619, "epoch": 1377} {"train_loss": -39.5174674987793, "global_step": 166620, "epoch": 1377} {"train_loss": -39.31930160522461, "global_step": 166621, "epoch": 1377} {"train_loss": -39.09894943237305, "global_step": 166622, "epoch": 1377} {"train_loss": -39.99131393432617, "global_step": 166623, "epoch": 1377} {"train_loss": -40.045082092285156, "global_step": 166624, "epoch": 1377} {"train_loss": -38.828853607177734, "global_step": 166625, "epoch": 1377} {"train_loss": -41.74042892456055, "global_step": 166626, "epoch": 1377} {"train_loss": -40.35737991333008, "global_step": 166627, "epoch": 1377} {"train_loss": -39.86129379272461, "global_step": 166628, "epoch": 1377} {"train_loss": -39.776039123535156, "global_step": 166629, "epoch": 1377} {"train_loss": -40.88087463378906, "global_step": 166630, "epoch": 1377} {"train_loss": -41.462059020996094, "global_step": 166631, "epoch": 1377} {"train_loss": -41.49099349975586, "global_step": 166632, "epoch": 1377} {"train_loss": -40.76585388183594, "global_step": 166633, "epoch": 1377} {"train_loss": -40.52388381958008, "global_step": 166634, "epoch": 1377} {"train_loss": -40.82904815673828, "global_step": 166635, "epoch": 1377} {"train_loss": -40.76591491699219, "global_step": 166636, "epoch": 1377} {"train_loss": -41.948978424072266, "global_step": 166637, "epoch": 1377} {"train_loss": -41.56817626953125, "global_step": 166638, "epoch": 1377} {"train_loss": -41.85852813720703, "global_step": 166639, "epoch": 1377} {"train_loss": -41.986690521240234, "global_step": 166640, "epoch": 1377} {"train_loss": -41.80067443847656, "global_step": 166641, "epoch": 1377} {"train_loss": -41.85158920288086, "global_step": 166642, "epoch": 1377} {"train_loss": -42.4427375793457, "global_step": 166643, "epoch": 1377} {"train_loss": -41.2135009765625, "global_step": 166644, "epoch": 1377} {"train_loss": -42.344417572021484, "global_step": 166645, "epoch": 1377} {"train_loss": -41.97175979614258, "global_step": 166646, "epoch": 1377} {"train_loss": -42.27315139770508, "global_step": 166647, "epoch": 1377} {"train_loss": -42.12654495239258, "global_step": 166648, "epoch": 1377} {"train_loss": -42.16634750366211, "global_step": 166649, "epoch": 1377} {"train_loss": -42.2961540222168, "global_step": 166650, "epoch": 1377} {"train_loss": -42.1304817199707, "global_step": 166651, "epoch": 1377} {"train_loss": -41.75562286376953, "global_step": 166652, "epoch": 1377} {"train_loss": -41.812591552734375, "global_step": 166653, "epoch": 1377} {"train_loss": -41.68708419799805, "global_step": 166654, "epoch": 1377} {"train_loss": -41.416378021240234, "global_step": 166655, "epoch": 1377} {"train_loss": -41.570064544677734, "global_step": 166656, "epoch": 1377} {"train_loss": -42.47990417480469, "global_step": 166657, "epoch": 1377} {"train_loss": -41.753414154052734, "global_step": 166658, "epoch": 1377} {"train_loss": -42.297576904296875, "global_step": 166659, "epoch": 1377} {"train_loss": -41.874107360839844, "global_step": 166660, "epoch": 1377} {"train_loss": -42.48346710205078, "global_step": 166661, "epoch": 1377} {"train_loss": -42.444129943847656, "global_step": 166662, "epoch": 1377} {"train_loss": -42.60764694213867, "global_step": 166663, "epoch": 1377} {"train_loss": -42.39672088623047, "global_step": 166664, "epoch": 1377} {"train_loss": -42.190460205078125, "global_step": 166665, "epoch": 1377} {"train_loss": -41.373104095458984, "global_step": 166666, "epoch": 1377} {"train_loss": -41.269466400146484, "global_step": 166667, "epoch": 1377} {"train_loss": -41.2995719909668, "global_step": 166668, "epoch": 1377} {"train_loss": -40.682647705078125, "global_step": 166669, "epoch": 1377} {"train_loss": -37.14664840698242, "global_step": 166670, "epoch": 1377} {"train_loss": -41.05921173095703, "global_step": 166671, "epoch": 1377} {"train_loss": -37.08287811279297, "global_step": 166672, "epoch": 1377} {"train_loss": -41.041343688964844, "global_step": 166673, "epoch": 1377} {"train_loss": -38.55815887451172, "global_step": 166674, "epoch": 1377} {"train_loss": -40.10398483276367, "global_step": 166675, "epoch": 1377} {"train_loss": -40.3007698059082, "global_step": 166676, "epoch": 1377} {"train_loss": -39.529544830322266, "global_step": 166677, "epoch": 1377} {"train_loss": -40.948123931884766, "global_step": 166678, "epoch": 1377} {"train_loss": -40.28471374511719, "global_step": 166679, "epoch": 1377} {"train_loss": -40.514137268066406, "global_step": 166680, "epoch": 1377} {"train_loss": -38.313045501708984, "global_step": 166681, "epoch": 1377} {"train_loss": -40.38776779174805, "global_step": 166682, "epoch": 1377} {"train_loss": -39.698387145996094, "global_step": 166683, "epoch": 1377} {"train_loss": -38.96384811401367, "global_step": 166684, "epoch": 1377} {"train_loss": -41.25547409057617, "global_step": 166685, "epoch": 1377} {"train_loss": -39.17869186401367, "global_step": 166686, "epoch": 1377} {"train_loss": -41.07358932495117, "global_step": 166687, "epoch": 1377} {"train_loss": -37.73621368408203, "global_step": 166688, "epoch": 1377} {"train_loss": -37.69438171386719, "global_step": 166689, "epoch": 1377} {"train_loss": -40.5904655456543, "global_step": 166690, "epoch": 1377} {"train_loss": -35.64262008666992, "global_step": 166691, "epoch": 1377} {"train_loss": -37.400447845458984, "global_step": 166692, "epoch": 1377} {"train_loss": -39.08295822143555, "global_step": 166693, "epoch": 1377} {"train_loss": -37.99068832397461, "global_step": 166694, "epoch": 1377} {"train_loss": -40.059959411621094, "global_step": 166695, "epoch": 1377} {"train_loss": -39.64202880859375, "global_step": 166696, "epoch": 1377} {"train_loss": -38.97411346435547, "global_step": 166697, "epoch": 1377} {"train_loss": -38.30878829956055, "global_step": 166698, "epoch": 1377} {"train_loss": -38.755348205566406, "global_step": 166699, "epoch": 1377} {"train_loss": -40.4196662902832, "global_step": 166700, "epoch": 1377} {"train_loss": -39.82453155517578, "global_step": 166701, "epoch": 1377} {"train_loss": -39.45649337768555, "global_step": 166702, "epoch": 1377} {"train_loss": -40.061397552490234, "global_step": 166703, "epoch": 1377} {"train_loss": -40.55471420288086, "global_step": 166704, "epoch": 1377} {"train_loss": -37.643985748291016, "global_step": 166705, "epoch": 1377} {"train_loss": -39.79545211791992, "global_step": 166706, "epoch": 1377} {"train_loss": -39.86182403564453, "global_step": 166707, "epoch": 1377} {"train_loss": -39.79522705078125, "global_step": 166708, "epoch": 1377} {"train_loss": -40.049381256103516, "global_step": 166709, "epoch": 1377} {"train_loss": -40.5513916015625, "global_step": 166710, "epoch": 1377} {"train_loss": -40.791664123535156, "global_step": 166711, "epoch": 1377} {"train_loss": -40.402217864990234, "global_step": 166712, "epoch": 1377} {"train_loss": -41.17478561401367, "global_step": 166713, "epoch": 1377} {"train_loss": -40.12087631225586, "global_step": 166714, "epoch": 1377} {"train_loss": -40.87089920043945, "global_step": 166715, "epoch": 1377} {"train_loss": -41.37983703613281, "global_step": 166716, "epoch": 1377} {"train_loss": -40.701995849609375, "global_step": 166717, "epoch": 1377} {"train_loss": -40.77362060546875, "global_step": 166718, "epoch": 1377} {"train_loss": -41.10409164428711, "global_step": 166719, "epoch": 1377} {"train_loss": -40.9193229675293, "global_step": 166720, "epoch": 1377} {"train_loss": -41.669403076171875, "global_step": 166721, "epoch": 1377} {"train_loss": -40.75788497924805, "global_step": 166722, "epoch": 1377} {"train_loss": -41.15864944458008, "global_step": 166723, "epoch": 1377} {"train_loss": -41.38932418823242, "global_step": 166724, "epoch": 1377} {"train_loss": -41.29136276245117, "global_step": 166725, "epoch": 1377} {"train_loss": -41.035274505615234, "global_step": 166726, "epoch": 1377} {"train_loss": -40.95577621459961, "global_step": 166727, "epoch": 1377} {"train_loss": -41.36959457397461, "global_step": 166728, "epoch": 1377} {"train_loss": -41.84741973876953, "global_step": 166729, "epoch": 1377} {"train_loss": -40.110713958740234, "global_step": 166730, "epoch": 1377} {"train_loss": -42.0090217590332, "global_step": 166731, "epoch": 1377} {"train_loss": -40.99821472167969, "global_step": 166732, "epoch": 1377} {"train_loss": -41.33686065673828, "global_step": 166733, "epoch": 1377} {"train_loss": -41.78350830078125, "global_step": 166734, "epoch": 1377} {"train_loss": -41.722896575927734, "global_step": 166735, "epoch": 1377} {"train_loss": -41.946632385253906, "global_step": 166736, "epoch": 1377} {"train_loss": -40.637772457658755, "global_step": 166737, "epoch": 1377, "val_loss": 2612226.75} {"train_loss": -40.662227630615234, "global_step": 166738, "epoch": 1378} {"train_loss": -41.23952865600586, "global_step": 166739, "epoch": 1378} {"train_loss": -41.83205032348633, "global_step": 166740, "epoch": 1378} {"train_loss": -42.311065673828125, "global_step": 166741, "epoch": 1378} {"train_loss": -41.67960739135742, "global_step": 166742, "epoch": 1378} {"train_loss": -41.91548156738281, "global_step": 166743, "epoch": 1378} {"train_loss": -41.996578216552734, "global_step": 166744, "epoch": 1378} {"train_loss": -42.2484245300293, "global_step": 166745, "epoch": 1378} {"train_loss": -42.182945251464844, "global_step": 166746, "epoch": 1378} {"train_loss": -42.533042907714844, "global_step": 166747, "epoch": 1378} {"train_loss": -42.03971481323242, "global_step": 166748, "epoch": 1378} {"train_loss": -41.92219161987305, "global_step": 166749, "epoch": 1378} {"train_loss": -41.54502487182617, "global_step": 166750, "epoch": 1378} {"train_loss": -41.91810607910156, "global_step": 166751, "epoch": 1378} {"train_loss": -41.53493881225586, "global_step": 166752, "epoch": 1378} {"train_loss": -41.63385772705078, "global_step": 166753, "epoch": 1378} {"train_loss": -41.87109375, "global_step": 166754, "epoch": 1378} {"train_loss": -41.89601135253906, "global_step": 166755, "epoch": 1378} {"train_loss": -42.33295822143555, "global_step": 166756, "epoch": 1378} {"train_loss": -41.900081634521484, "global_step": 166757, "epoch": 1378} {"train_loss": -41.86196517944336, "global_step": 166758, "epoch": 1378} {"train_loss": -41.76913833618164, "global_step": 166759, "epoch": 1378} {"train_loss": -41.8177604675293, "global_step": 166760, "epoch": 1378} {"train_loss": -42.13044357299805, "global_step": 166761, "epoch": 1378} {"train_loss": -42.26435470581055, "global_step": 166762, "epoch": 1378} {"train_loss": -42.33639144897461, "global_step": 166763, "epoch": 1378} {"train_loss": -42.00687789916992, "global_step": 166764, "epoch": 1378} {"train_loss": -42.29098129272461, "global_step": 166765, "epoch": 1378} {"train_loss": -42.26581954956055, "global_step": 166766, "epoch": 1378} {"train_loss": -41.9193115234375, "global_step": 166767, "epoch": 1378} {"train_loss": -41.93852996826172, "global_step": 166768, "epoch": 1378} {"train_loss": -42.18259811401367, "global_step": 166769, "epoch": 1378} {"train_loss": -42.28816223144531, "global_step": 166770, "epoch": 1378} {"train_loss": -42.9312744140625, "global_step": 166771, "epoch": 1378} {"train_loss": -41.69596481323242, "global_step": 166772, "epoch": 1378} {"train_loss": -42.293087005615234, "global_step": 166773, "epoch": 1378} {"train_loss": -41.62553024291992, "global_step": 166774, "epoch": 1378} {"train_loss": -41.23844528198242, "global_step": 166775, "epoch": 1378} {"train_loss": -41.784542083740234, "global_step": 166776, "epoch": 1378} {"train_loss": -42.03934860229492, "global_step": 166777, "epoch": 1378} {"train_loss": -41.37346267700195, "global_step": 166778, "epoch": 1378} {"train_loss": -42.569210052490234, "global_step": 166779, "epoch": 1378} {"train_loss": -41.75310134887695, "global_step": 166780, "epoch": 1378} {"train_loss": -41.18896484375, "global_step": 166781, "epoch": 1378} {"train_loss": -42.34745407104492, "global_step": 166782, "epoch": 1378} {"train_loss": -41.912899017333984, "global_step": 166783, "epoch": 1378} {"train_loss": -38.30064010620117, "global_step": 166784, "epoch": 1378} {"train_loss": -41.38676834106445, "global_step": 166785, "epoch": 1378} {"train_loss": -42.06391143798828, "global_step": 166786, "epoch": 1378} {"train_loss": -41.51674270629883, "global_step": 166787, "epoch": 1378} {"train_loss": -41.740543365478516, "global_step": 166788, "epoch": 1378} {"train_loss": -41.21418380737305, "global_step": 166789, "epoch": 1378} {"train_loss": -40.16328048706055, "global_step": 166790, "epoch": 1378} {"train_loss": -40.03815841674805, "global_step": 166791, "epoch": 1378} {"train_loss": -39.91259765625, "global_step": 166792, "epoch": 1378} {"train_loss": -39.04082107543945, "global_step": 166793, "epoch": 1378} {"train_loss": -40.207271575927734, "global_step": 166794, "epoch": 1378} {"train_loss": -40.11393356323242, "global_step": 166795, "epoch": 1378} {"train_loss": -39.964622497558594, "global_step": 166796, "epoch": 1378} {"train_loss": -40.889381408691406, "global_step": 166797, "epoch": 1378} {"train_loss": -39.90636444091797, "global_step": 166798, "epoch": 1378} {"train_loss": -41.13186264038086, "global_step": 166799, "epoch": 1378} {"train_loss": -40.32464599609375, "global_step": 166800, "epoch": 1378} {"train_loss": -40.046775817871094, "global_step": 166801, "epoch": 1378} {"train_loss": -40.91962432861328, "global_step": 166802, "epoch": 1378} {"train_loss": -40.746490478515625, "global_step": 166803, "epoch": 1378} {"train_loss": -40.09185791015625, "global_step": 166804, "epoch": 1378} {"train_loss": -40.627723693847656, "global_step": 166805, "epoch": 1378} {"train_loss": -40.63958740234375, "global_step": 166806, "epoch": 1378} {"train_loss": -40.467689514160156, "global_step": 166807, "epoch": 1378} {"train_loss": -36.584877014160156, "global_step": 166808, "epoch": 1378} {"train_loss": -40.88998031616211, "global_step": 166809, "epoch": 1378} {"train_loss": -38.93027877807617, "global_step": 166810, "epoch": 1378} {"train_loss": -39.219539642333984, "global_step": 166811, "epoch": 1378} {"train_loss": -39.923973083496094, "global_step": 166812, "epoch": 1378} {"train_loss": -39.59553146362305, "global_step": 166813, "epoch": 1378} {"train_loss": -41.07725143432617, "global_step": 166814, "epoch": 1378} {"train_loss": -39.55772399902344, "global_step": 166815, "epoch": 1378} {"train_loss": -39.66209030151367, "global_step": 166816, "epoch": 1378} {"train_loss": -40.48977279663086, "global_step": 166817, "epoch": 1378} {"train_loss": -40.365631103515625, "global_step": 166818, "epoch": 1378} {"train_loss": -40.52728271484375, "global_step": 166819, "epoch": 1378} {"train_loss": -39.15113067626953, "global_step": 166820, "epoch": 1378} {"train_loss": -40.13017654418945, "global_step": 166821, "epoch": 1378} {"train_loss": -39.918643951416016, "global_step": 166822, "epoch": 1378} {"train_loss": -41.09283447265625, "global_step": 166823, "epoch": 1378} {"train_loss": -40.39213943481445, "global_step": 166824, "epoch": 1378} {"train_loss": -40.515132904052734, "global_step": 166825, "epoch": 1378} {"train_loss": -40.87409591674805, "global_step": 166826, "epoch": 1378} {"train_loss": -40.672542572021484, "global_step": 166827, "epoch": 1378} {"train_loss": -40.16908645629883, "global_step": 166828, "epoch": 1378} {"train_loss": -41.352901458740234, "global_step": 166829, "epoch": 1378} {"train_loss": -40.563072204589844, "global_step": 166830, "epoch": 1378} {"train_loss": -40.134254455566406, "global_step": 166831, "epoch": 1378} {"train_loss": -40.88276290893555, "global_step": 166832, "epoch": 1378} {"train_loss": -40.085365295410156, "global_step": 166833, "epoch": 1378} {"train_loss": -40.481632232666016, "global_step": 166834, "epoch": 1378} {"train_loss": -41.259159088134766, "global_step": 166835, "epoch": 1378} {"train_loss": -41.01747512817383, "global_step": 166836, "epoch": 1378} {"train_loss": -40.476585388183594, "global_step": 166837, "epoch": 1378} {"train_loss": -41.31608963012695, "global_step": 166838, "epoch": 1378} {"train_loss": -41.725868225097656, "global_step": 166839, "epoch": 1378} {"train_loss": -41.004695892333984, "global_step": 166840, "epoch": 1378} {"train_loss": -41.500553131103516, "global_step": 166841, "epoch": 1378} {"train_loss": -40.88715744018555, "global_step": 166842, "epoch": 1378} {"train_loss": -41.250640869140625, "global_step": 166843, "epoch": 1378} {"train_loss": -40.102935791015625, "global_step": 166844, "epoch": 1378} {"train_loss": -41.86521530151367, "global_step": 166845, "epoch": 1378} {"train_loss": -39.93204879760742, "global_step": 166846, "epoch": 1378} {"train_loss": -39.98392105102539, "global_step": 166847, "epoch": 1378} {"train_loss": -41.344764709472656, "global_step": 166848, "epoch": 1378} {"train_loss": -41.22332763671875, "global_step": 166849, "epoch": 1378} {"train_loss": -41.288818359375, "global_step": 166850, "epoch": 1378} {"train_loss": -41.81581497192383, "global_step": 166851, "epoch": 1378} {"train_loss": -41.84290313720703, "global_step": 166852, "epoch": 1378} {"train_loss": -41.97763442993164, "global_step": 166853, "epoch": 1378} {"train_loss": -41.87226486206055, "global_step": 166854, "epoch": 1378} {"train_loss": -41.45327377319336, "global_step": 166855, "epoch": 1378} {"train_loss": -42.123165130615234, "global_step": 166856, "epoch": 1378} {"train_loss": -41.52534866333008, "global_step": 166857, "epoch": 1378} {"train_loss": -41.1099026892796, "global_step": 166858, "epoch": 1378, "val_loss": 2564050.25} {"train_loss": -42.080810546875, "global_step": 166859, "epoch": 1379} {"train_loss": -41.30379104614258, "global_step": 166860, "epoch": 1379} {"train_loss": -41.67210006713867, "global_step": 166861, "epoch": 1379} {"train_loss": -41.96616744995117, "global_step": 166862, "epoch": 1379} {"train_loss": -40.8404655456543, "global_step": 166863, "epoch": 1379} {"train_loss": -41.80156326293945, "global_step": 166864, "epoch": 1379} {"train_loss": -41.80464172363281, "global_step": 166865, "epoch": 1379} {"train_loss": -41.92927932739258, "global_step": 166866, "epoch": 1379} {"train_loss": -41.07676315307617, "global_step": 166867, "epoch": 1379} {"train_loss": -40.928043365478516, "global_step": 166868, "epoch": 1379} {"train_loss": -40.95705032348633, "global_step": 166869, "epoch": 1379} {"train_loss": -41.3343391418457, "global_step": 166870, "epoch": 1379} {"train_loss": -41.236358642578125, "global_step": 166871, "epoch": 1379} {"train_loss": -39.686885833740234, "global_step": 166872, "epoch": 1379} {"train_loss": -40.93817138671875, "global_step": 166873, "epoch": 1379} {"train_loss": -41.5876350402832, "global_step": 166874, "epoch": 1379} {"train_loss": -40.88365173339844, "global_step": 166875, "epoch": 1379} {"train_loss": -40.40522766113281, "global_step": 166876, "epoch": 1379} {"train_loss": -41.42576599121094, "global_step": 166877, "epoch": 1379} {"train_loss": -41.57844924926758, "global_step": 166878, "epoch": 1379} {"train_loss": -41.13275146484375, "global_step": 166879, "epoch": 1379} {"train_loss": -39.545955657958984, "global_step": 166880, "epoch": 1379} {"train_loss": -41.823646545410156, "global_step": 166881, "epoch": 1379} {"train_loss": -41.25063705444336, "global_step": 166882, "epoch": 1379} {"train_loss": -41.27764892578125, "global_step": 166883, "epoch": 1379} {"train_loss": -41.23878479003906, "global_step": 166884, "epoch": 1379} {"train_loss": -41.92417526245117, "global_step": 166885, "epoch": 1379} {"train_loss": -41.5580940246582, "global_step": 166886, "epoch": 1379} {"train_loss": -40.43898391723633, "global_step": 166887, "epoch": 1379} {"train_loss": -39.761016845703125, "global_step": 166888, "epoch": 1379} {"train_loss": -41.14866256713867, "global_step": 166889, "epoch": 1379} {"train_loss": -41.66797637939453, "global_step": 166890, "epoch": 1379} {"train_loss": -41.462120056152344, "global_step": 166891, "epoch": 1379} {"train_loss": -41.248199462890625, "global_step": 166892, "epoch": 1379} {"train_loss": -40.71515655517578, "global_step": 166893, "epoch": 1379} {"train_loss": -38.667232513427734, "global_step": 166894, "epoch": 1379} {"train_loss": -40.512027740478516, "global_step": 166895, "epoch": 1379} {"train_loss": -38.68745040893555, "global_step": 166896, "epoch": 1379} {"train_loss": -41.1388053894043, "global_step": 166897, "epoch": 1379} {"train_loss": -40.67489242553711, "global_step": 166898, "epoch": 1379} {"train_loss": -41.25640106201172, "global_step": 166899, "epoch": 1379} {"train_loss": -41.47465133666992, "global_step": 166900, "epoch": 1379} {"train_loss": -40.922359466552734, "global_step": 166901, "epoch": 1379} {"train_loss": -41.92074966430664, "global_step": 166902, "epoch": 1379} {"train_loss": -40.77825164794922, "global_step": 166903, "epoch": 1379} {"train_loss": -41.0361328125, "global_step": 166904, "epoch": 1379} {"train_loss": -40.575950622558594, "global_step": 166905, "epoch": 1379} {"train_loss": -40.6098518371582, "global_step": 166906, "epoch": 1379} {"train_loss": -41.49224090576172, "global_step": 166907, "epoch": 1379} {"train_loss": -41.03548812866211, "global_step": 166908, "epoch": 1379} {"train_loss": -41.587913513183594, "global_step": 166909, "epoch": 1379} {"train_loss": -41.132659912109375, "global_step": 166910, "epoch": 1379} {"train_loss": -40.86176300048828, "global_step": 166911, "epoch": 1379} {"train_loss": -42.030574798583984, "global_step": 166912, "epoch": 1379} {"train_loss": -41.73773956298828, "global_step": 166913, "epoch": 1379} {"train_loss": -40.86077117919922, "global_step": 166914, "epoch": 1379} {"train_loss": -40.760921478271484, "global_step": 166915, "epoch": 1379} {"train_loss": -41.888668060302734, "global_step": 166916, "epoch": 1379} {"train_loss": -41.50625991821289, "global_step": 166917, "epoch": 1379} {"train_loss": -40.103668212890625, "global_step": 166918, "epoch": 1379} {"train_loss": -42.3514404296875, "global_step": 166919, "epoch": 1379} {"train_loss": -41.27677536010742, "global_step": 166920, "epoch": 1379} {"train_loss": -41.63066864013672, "global_step": 166921, "epoch": 1379} {"train_loss": -40.56760787963867, "global_step": 166922, "epoch": 1379} {"train_loss": -39.7309684753418, "global_step": 166923, "epoch": 1379} {"train_loss": -40.826473236083984, "global_step": 166924, "epoch": 1379} {"train_loss": -40.469825744628906, "global_step": 166925, "epoch": 1379} {"train_loss": -41.341163635253906, "global_step": 166926, "epoch": 1379} {"train_loss": -40.92183303833008, "global_step": 166927, "epoch": 1379} {"train_loss": -37.43336868286133, "global_step": 166928, "epoch": 1379} {"train_loss": -40.86130905151367, "global_step": 166929, "epoch": 1379} {"train_loss": -35.74424362182617, "global_step": 166930, "epoch": 1379} {"train_loss": -35.18976974487305, "global_step": 166931, "epoch": 1379} {"train_loss": -31.404510498046875, "global_step": 166932, "epoch": 1379} {"train_loss": -33.6073112487793, "global_step": 166933, "epoch": 1379} {"train_loss": -36.234066009521484, "global_step": 166934, "epoch": 1379} {"train_loss": -34.658756256103516, "global_step": 166935, "epoch": 1379} {"train_loss": -35.85469055175781, "global_step": 166936, "epoch": 1379} {"train_loss": -33.92595291137695, "global_step": 166937, "epoch": 1379} {"train_loss": -34.769649505615234, "global_step": 166938, "epoch": 1379} {"train_loss": -36.46994400024414, "global_step": 166939, "epoch": 1379} {"train_loss": -35.21660614013672, "global_step": 166940, "epoch": 1379} {"train_loss": -36.30892562866211, "global_step": 166941, "epoch": 1379} {"train_loss": -35.7237663269043, "global_step": 166942, "epoch": 1379} {"train_loss": -36.435909271240234, "global_step": 166943, "epoch": 1379} {"train_loss": -35.85251998901367, "global_step": 166944, "epoch": 1379} {"train_loss": -36.43848419189453, "global_step": 166945, "epoch": 1379} {"train_loss": -36.17646789550781, "global_step": 166946, "epoch": 1379} {"train_loss": -36.97760772705078, "global_step": 166947, "epoch": 1379} {"train_loss": -36.74331283569336, "global_step": 166948, "epoch": 1379} {"train_loss": -36.33602523803711, "global_step": 166949, "epoch": 1379} {"train_loss": -36.9096794128418, "global_step": 166950, "epoch": 1379} {"train_loss": -37.55863571166992, "global_step": 166951, "epoch": 1379} {"train_loss": -36.66086959838867, "global_step": 166952, "epoch": 1379} {"train_loss": -37.111934661865234, "global_step": 166953, "epoch": 1379} {"train_loss": -37.0384521484375, "global_step": 166954, "epoch": 1379} {"train_loss": -35.35528564453125, "global_step": 166955, "epoch": 1379} {"train_loss": -37.43734359741211, "global_step": 166956, "epoch": 1379} {"train_loss": -37.29453659057617, "global_step": 166957, "epoch": 1379} {"train_loss": -37.25727081298828, "global_step": 166958, "epoch": 1379} {"train_loss": -37.098697662353516, "global_step": 166959, "epoch": 1379} {"train_loss": -36.770790100097656, "global_step": 166960, "epoch": 1379} {"train_loss": -36.31619644165039, "global_step": 166961, "epoch": 1379} {"train_loss": -34.4813117980957, "global_step": 166962, "epoch": 1379} {"train_loss": -36.373897552490234, "global_step": 166963, "epoch": 1379} {"train_loss": -37.22630310058594, "global_step": 166964, "epoch": 1379} {"train_loss": -38.119503021240234, "global_step": 166965, "epoch": 1379} {"train_loss": -37.67435836791992, "global_step": 166966, "epoch": 1379} {"train_loss": -36.927833557128906, "global_step": 166967, "epoch": 1379} {"train_loss": -37.754451751708984, "global_step": 166968, "epoch": 1379} {"train_loss": -37.8569450378418, "global_step": 166969, "epoch": 1379} {"train_loss": -37.979736328125, "global_step": 166970, "epoch": 1379} {"train_loss": -37.66791915893555, "global_step": 166971, "epoch": 1379} {"train_loss": -38.33665084838867, "global_step": 166972, "epoch": 1379} {"train_loss": -38.316741943359375, "global_step": 166973, "epoch": 1379} {"train_loss": -38.66392135620117, "global_step": 166974, "epoch": 1379} {"train_loss": -38.23550033569336, "global_step": 166975, "epoch": 1379} {"train_loss": -38.78873825073242, "global_step": 166976, "epoch": 1379} {"train_loss": -38.136444091796875, "global_step": 166977, "epoch": 1379} {"train_loss": -36.91569137573242, "global_step": 166978, "epoch": 1379} {"train_loss": -39.177868992829126, "global_step": 166979, "epoch": 1379, "val_loss": 2652067.75} {"train_loss": -35.86404800415039, "global_step": 166980, "epoch": 1380} {"train_loss": -38.36491394042969, "global_step": 166981, "epoch": 1380} {"train_loss": -37.939247131347656, "global_step": 166982, "epoch": 1380} {"train_loss": -36.977996826171875, "global_step": 166983, "epoch": 1380} {"train_loss": -39.111183166503906, "global_step": 166984, "epoch": 1380} {"train_loss": -37.62087631225586, "global_step": 166985, "epoch": 1380} {"train_loss": -38.279762268066406, "global_step": 166986, "epoch": 1380} {"train_loss": -38.550880432128906, "global_step": 166987, "epoch": 1380} {"train_loss": -38.41164016723633, "global_step": 166988, "epoch": 1380} {"train_loss": -39.244991302490234, "global_step": 166989, "epoch": 1380} {"train_loss": -39.083717346191406, "global_step": 166990, "epoch": 1380} {"train_loss": -39.375396728515625, "global_step": 166991, "epoch": 1380} {"train_loss": -37.791507720947266, "global_step": 166992, "epoch": 1380} {"train_loss": -38.8375358581543, "global_step": 166993, "epoch": 1380} {"train_loss": -39.361976623535156, "global_step": 166994, "epoch": 1380} {"train_loss": -38.70066452026367, "global_step": 166995, "epoch": 1380} {"train_loss": -37.746700286865234, "global_step": 166996, "epoch": 1380} {"train_loss": -35.83879470825195, "global_step": 166997, "epoch": 1380} {"train_loss": -37.23388671875, "global_step": 166998, "epoch": 1380} {"train_loss": -38.163063049316406, "global_step": 166999, "epoch": 1380} {"train_loss": -35.648590087890625, "global_step": 167000, "epoch": 1380} {"train_loss": -37.39973068237305, "global_step": 167001, "epoch": 1380} {"train_loss": -39.073909759521484, "global_step": 167002, "epoch": 1380} {"train_loss": -36.93071365356445, "global_step": 167003, "epoch": 1380} {"train_loss": -39.602779388427734, "global_step": 167004, "epoch": 1380} {"train_loss": -38.382320404052734, "global_step": 167005, "epoch": 1380} {"train_loss": -39.890419006347656, "global_step": 167006, "epoch": 1380} {"train_loss": -38.672786712646484, "global_step": 167007, "epoch": 1380} {"train_loss": -39.7041130065918, "global_step": 167008, "epoch": 1380} {"train_loss": -38.46128463745117, "global_step": 167009, "epoch": 1380} {"train_loss": -39.76519775390625, "global_step": 167010, "epoch": 1380} {"train_loss": -39.751155853271484, "global_step": 167011, "epoch": 1380} {"train_loss": -39.84810256958008, "global_step": 167012, "epoch": 1380} {"train_loss": -40.13656997680664, "global_step": 167013, "epoch": 1380} {"train_loss": -39.09308624267578, "global_step": 167014, "epoch": 1380} {"train_loss": -39.691253662109375, "global_step": 167015, "epoch": 1380} {"train_loss": -39.07789993286133, "global_step": 167016, "epoch": 1380} {"train_loss": -37.43890380859375, "global_step": 167017, "epoch": 1380} {"train_loss": -36.28164291381836, "global_step": 167018, "epoch": 1380} {"train_loss": -37.51444625854492, "global_step": 167019, "epoch": 1380} {"train_loss": -38.525482177734375, "global_step": 167020, "epoch": 1380} {"train_loss": -36.92023849487305, "global_step": 167021, "epoch": 1380} {"train_loss": -39.60928726196289, "global_step": 167022, "epoch": 1380} {"train_loss": -38.787940979003906, "global_step": 167023, "epoch": 1380} {"train_loss": -39.23393630981445, "global_step": 167024, "epoch": 1380} {"train_loss": -38.839988708496094, "global_step": 167025, "epoch": 1380} {"train_loss": -38.64443588256836, "global_step": 167026, "epoch": 1380} {"train_loss": -38.420249938964844, "global_step": 167027, "epoch": 1380} {"train_loss": -36.73280715942383, "global_step": 167028, "epoch": 1380} {"train_loss": -39.63543701171875, "global_step": 167029, "epoch": 1380} {"train_loss": -39.549957275390625, "global_step": 167030, "epoch": 1380} {"train_loss": -39.251094818115234, "global_step": 167031, "epoch": 1380} {"train_loss": -39.94643020629883, "global_step": 167032, "epoch": 1380} {"train_loss": -39.12593460083008, "global_step": 167033, "epoch": 1380} {"train_loss": -38.842552185058594, "global_step": 167034, "epoch": 1380} {"train_loss": -39.22089385986328, "global_step": 167035, "epoch": 1380} {"train_loss": -40.408809661865234, "global_step": 167036, "epoch": 1380} {"train_loss": -39.062381744384766, "global_step": 167037, "epoch": 1380} {"train_loss": -39.81360626220703, "global_step": 167038, "epoch": 1380} {"train_loss": -40.09213638305664, "global_step": 167039, "epoch": 1380} {"train_loss": -39.845523834228516, "global_step": 167040, "epoch": 1380} {"train_loss": -39.92539596557617, "global_step": 167041, "epoch": 1380} {"train_loss": -39.93313217163086, "global_step": 167042, "epoch": 1380} {"train_loss": -39.211669921875, "global_step": 167043, "epoch": 1380} {"train_loss": -38.50614547729492, "global_step": 167044, "epoch": 1380} {"train_loss": -39.522945404052734, "global_step": 167045, "epoch": 1380} {"train_loss": -38.27702331542969, "global_step": 167046, "epoch": 1380} {"train_loss": -37.689720153808594, "global_step": 167047, "epoch": 1380} {"train_loss": -38.51417922973633, "global_step": 167048, "epoch": 1380} {"train_loss": -39.80927276611328, "global_step": 167049, "epoch": 1380} {"train_loss": -39.54430389404297, "global_step": 167050, "epoch": 1380} {"train_loss": -38.226226806640625, "global_step": 167051, "epoch": 1380} {"train_loss": -38.21696090698242, "global_step": 167052, "epoch": 1380} {"train_loss": -38.050453186035156, "global_step": 167053, "epoch": 1380} {"train_loss": -37.71036148071289, "global_step": 167054, "epoch": 1380} {"train_loss": -37.44943618774414, "global_step": 167055, "epoch": 1380} {"train_loss": -39.00429916381836, "global_step": 167056, "epoch": 1380} {"train_loss": -38.83927536010742, "global_step": 167057, "epoch": 1380} {"train_loss": -34.05006790161133, "global_step": 167058, "epoch": 1380} {"train_loss": -38.59910202026367, "global_step": 167059, "epoch": 1380} {"train_loss": -39.0584602355957, "global_step": 167060, "epoch": 1380} {"train_loss": -39.274600982666016, "global_step": 167061, "epoch": 1380} {"train_loss": -39.69468307495117, "global_step": 167062, "epoch": 1380} {"train_loss": -39.38759231567383, "global_step": 167063, "epoch": 1380} {"train_loss": -38.240264892578125, "global_step": 167064, "epoch": 1380} {"train_loss": -39.112918853759766, "global_step": 167065, "epoch": 1380} {"train_loss": -38.8980712890625, "global_step": 167066, "epoch": 1380} {"train_loss": -39.412899017333984, "global_step": 167067, "epoch": 1380} {"train_loss": -39.25629806518555, "global_step": 167068, "epoch": 1380} {"train_loss": -37.97755813598633, "global_step": 167069, "epoch": 1380} {"train_loss": -38.09518814086914, "global_step": 167070, "epoch": 1380} {"train_loss": -39.82304763793945, "global_step": 167071, "epoch": 1380} {"train_loss": -39.14840316772461, "global_step": 167072, "epoch": 1380} {"train_loss": -39.40342330932617, "global_step": 167073, "epoch": 1380} {"train_loss": -39.904842376708984, "global_step": 167074, "epoch": 1380} {"train_loss": -39.26622009277344, "global_step": 167075, "epoch": 1380} {"train_loss": -39.7425422668457, "global_step": 167076, "epoch": 1380} {"train_loss": -39.1633186340332, "global_step": 167077, "epoch": 1380} {"train_loss": -38.92866516113281, "global_step": 167078, "epoch": 1380} {"train_loss": -38.35091018676758, "global_step": 167079, "epoch": 1380} {"train_loss": -38.72317123413086, "global_step": 167080, "epoch": 1380} {"train_loss": -39.17164993286133, "global_step": 167081, "epoch": 1380} {"train_loss": -38.6002197265625, "global_step": 167082, "epoch": 1380} {"train_loss": -37.10612869262695, "global_step": 167083, "epoch": 1380} {"train_loss": -38.89255905151367, "global_step": 167084, "epoch": 1380} {"train_loss": -38.38747787475586, "global_step": 167085, "epoch": 1380} {"train_loss": -36.01434326171875, "global_step": 167086, "epoch": 1380} {"train_loss": -38.8894157409668, "global_step": 167087, "epoch": 1380} {"train_loss": -38.83828353881836, "global_step": 167088, "epoch": 1380} {"train_loss": -36.99323272705078, "global_step": 167089, "epoch": 1380} {"train_loss": -36.38154983520508, "global_step": 167090, "epoch": 1380} {"train_loss": -35.14856719970703, "global_step": 167091, "epoch": 1380} {"train_loss": -33.1150016784668, "global_step": 167092, "epoch": 1380} {"train_loss": -32.95063400268555, "global_step": 167093, "epoch": 1380} {"train_loss": -25.008148193359375, "global_step": 167094, "epoch": 1380} {"train_loss": -27.360584259033203, "global_step": 167095, "epoch": 1380} {"train_loss": -33.75700759887695, "global_step": 167096, "epoch": 1380} {"train_loss": -29.5091552734375, "global_step": 167097, "epoch": 1380} {"train_loss": -36.03633499145508, "global_step": 167098, "epoch": 1380} {"train_loss": -28.062332153320312, "global_step": 167099, "epoch": 1380} {"train_loss": -38.01695169496142, "global_step": 167100, "epoch": 1380, "val_loss": 2994460.25} {"train_loss": -33.11911392211914, "global_step": 167101, "epoch": 1381} {"train_loss": -37.540740966796875, "global_step": 167102, "epoch": 1381} {"train_loss": -32.713680267333984, "global_step": 167103, "epoch": 1381} {"train_loss": -32.11039733886719, "global_step": 167104, "epoch": 1381} {"train_loss": -33.800636291503906, "global_step": 167105, "epoch": 1381} {"train_loss": -34.600830078125, "global_step": 167106, "epoch": 1381} {"train_loss": -33.560054779052734, "global_step": 167107, "epoch": 1381} {"train_loss": -33.14441680908203, "global_step": 167108, "epoch": 1381} {"train_loss": -34.93419647216797, "global_step": 167109, "epoch": 1381} {"train_loss": -35.779579162597656, "global_step": 167110, "epoch": 1381} {"train_loss": -33.8014030456543, "global_step": 167111, "epoch": 1381} {"train_loss": -34.1202278137207, "global_step": 167112, "epoch": 1381} {"train_loss": -36.590667724609375, "global_step": 167113, "epoch": 1381} {"train_loss": -36.170989990234375, "global_step": 167114, "epoch": 1381} {"train_loss": -37.61287307739258, "global_step": 167115, "epoch": 1381} {"train_loss": -32.49214553833008, "global_step": 167116, "epoch": 1381} {"train_loss": -31.859058380126953, "global_step": 167117, "epoch": 1381} {"train_loss": -31.259906768798828, "global_step": 167118, "epoch": 1381} {"train_loss": -34.665279388427734, "global_step": 167119, "epoch": 1381} {"train_loss": -34.8446044921875, "global_step": 167120, "epoch": 1381} {"train_loss": -34.845245361328125, "global_step": 167121, "epoch": 1381} {"train_loss": -35.48258972167969, "global_step": 167122, "epoch": 1381} {"train_loss": -34.27043151855469, "global_step": 167123, "epoch": 1381} {"train_loss": -34.06570053100586, "global_step": 167124, "epoch": 1381} {"train_loss": -30.158422470092773, "global_step": 167125, "epoch": 1381} {"train_loss": -35.516754150390625, "global_step": 167126, "epoch": 1381} {"train_loss": -33.3044548034668, "global_step": 167127, "epoch": 1381} {"train_loss": -35.78316879272461, "global_step": 167128, "epoch": 1381} {"train_loss": -36.1302604675293, "global_step": 167129, "epoch": 1381} {"train_loss": -34.468929290771484, "global_step": 167130, "epoch": 1381} {"train_loss": -34.67824935913086, "global_step": 167131, "epoch": 1381} {"train_loss": -34.63850021362305, "global_step": 167132, "epoch": 1381} {"train_loss": -34.20576095581055, "global_step": 167133, "epoch": 1381} {"train_loss": -36.490413665771484, "global_step": 167134, "epoch": 1381} {"train_loss": -31.754058837890625, "global_step": 167135, "epoch": 1381} {"train_loss": -34.248382568359375, "global_step": 167136, "epoch": 1381} {"train_loss": -36.61392593383789, "global_step": 167137, "epoch": 1381} {"train_loss": -35.78437042236328, "global_step": 167138, "epoch": 1381} {"train_loss": -33.08258056640625, "global_step": 167139, "epoch": 1381} {"train_loss": -36.46925354003906, "global_step": 167140, "epoch": 1381} {"train_loss": -35.394649505615234, "global_step": 167141, "epoch": 1381} {"train_loss": -36.3397331237793, "global_step": 167142, "epoch": 1381} {"train_loss": -35.61399459838867, "global_step": 167143, "epoch": 1381} {"train_loss": -36.62289047241211, "global_step": 167144, "epoch": 1381} {"train_loss": -36.53507614135742, "global_step": 167145, "epoch": 1381} {"train_loss": -37.14697265625, "global_step": 167146, "epoch": 1381} {"train_loss": -37.047584533691406, "global_step": 167147, "epoch": 1381} {"train_loss": -36.582916259765625, "global_step": 167148, "epoch": 1381} {"train_loss": -36.7483024597168, "global_step": 167149, "epoch": 1381} {"train_loss": -36.68085861206055, "global_step": 167150, "epoch": 1381} {"train_loss": -37.003536224365234, "global_step": 167151, "epoch": 1381} {"train_loss": -37.194400787353516, "global_step": 167152, "epoch": 1381} {"train_loss": -36.99496078491211, "global_step": 167153, "epoch": 1381} {"train_loss": -37.125850677490234, "global_step": 167154, "epoch": 1381} {"train_loss": -36.761085510253906, "global_step": 167155, "epoch": 1381} {"train_loss": -36.27360916137695, "global_step": 167156, "epoch": 1381} {"train_loss": -36.835567474365234, "global_step": 167157, "epoch": 1381} {"train_loss": -37.454898834228516, "global_step": 167158, "epoch": 1381} {"train_loss": -37.421234130859375, "global_step": 167159, "epoch": 1381} {"train_loss": -37.286556243896484, "global_step": 167160, "epoch": 1381} {"train_loss": -37.41994857788086, "global_step": 167161, "epoch": 1381} {"train_loss": -37.4576301574707, "global_step": 167162, "epoch": 1381} {"train_loss": -37.31759262084961, "global_step": 167163, "epoch": 1381} {"train_loss": -37.747432708740234, "global_step": 167164, "epoch": 1381} {"train_loss": -37.391395568847656, "global_step": 167165, "epoch": 1381} {"train_loss": -38.182491302490234, "global_step": 167166, "epoch": 1381} {"train_loss": -37.476524353027344, "global_step": 167167, "epoch": 1381} {"train_loss": -38.1575813293457, "global_step": 167168, "epoch": 1381} {"train_loss": -38.054412841796875, "global_step": 167169, "epoch": 1381} {"train_loss": -38.163631439208984, "global_step": 167170, "epoch": 1381} {"train_loss": -38.073001861572266, "global_step": 167171, "epoch": 1381} {"train_loss": -38.48554611206055, "global_step": 167172, "epoch": 1381} {"train_loss": -38.11727523803711, "global_step": 167173, "epoch": 1381} {"train_loss": -37.74137496948242, "global_step": 167174, "epoch": 1381} {"train_loss": -37.7562255859375, "global_step": 167175, "epoch": 1381} {"train_loss": -38.12553405761719, "global_step": 167176, "epoch": 1381} {"train_loss": -38.50177764892578, "global_step": 167177, "epoch": 1381} {"train_loss": -38.03166961669922, "global_step": 167178, "epoch": 1381} {"train_loss": -38.4847526550293, "global_step": 167179, "epoch": 1381} {"train_loss": -38.33942794799805, "global_step": 167180, "epoch": 1381} {"train_loss": -38.3689079284668, "global_step": 167181, "epoch": 1381} {"train_loss": -38.48592758178711, "global_step": 167182, "epoch": 1381} {"train_loss": -38.40664291381836, "global_step": 167183, "epoch": 1381} {"train_loss": -38.577518463134766, "global_step": 167184, "epoch": 1381} {"train_loss": -38.81836700439453, "global_step": 167185, "epoch": 1381} {"train_loss": -38.28911209106445, "global_step": 167186, "epoch": 1381} {"train_loss": -37.538551330566406, "global_step": 167187, "epoch": 1381} {"train_loss": -36.61872482299805, "global_step": 167188, "epoch": 1381} {"train_loss": -35.83563232421875, "global_step": 167189, "epoch": 1381} {"train_loss": -36.062076568603516, "global_step": 167190, "epoch": 1381} {"train_loss": -37.074989318847656, "global_step": 167191, "epoch": 1381} {"train_loss": -38.19217300415039, "global_step": 167192, "epoch": 1381} {"train_loss": -39.127498626708984, "global_step": 167193, "epoch": 1381} {"train_loss": -38.194271087646484, "global_step": 167194, "epoch": 1381} {"train_loss": -38.80206298828125, "global_step": 167195, "epoch": 1381} {"train_loss": -38.83136749267578, "global_step": 167196, "epoch": 1381} {"train_loss": -38.62089920043945, "global_step": 167197, "epoch": 1381} {"train_loss": -39.19160461425781, "global_step": 167198, "epoch": 1381} {"train_loss": -39.08646774291992, "global_step": 167199, "epoch": 1381} {"train_loss": -38.8232536315918, "global_step": 167200, "epoch": 1381} {"train_loss": -39.2219352722168, "global_step": 167201, "epoch": 1381} {"train_loss": -39.12495040893555, "global_step": 167202, "epoch": 1381} {"train_loss": -38.19868087768555, "global_step": 167203, "epoch": 1381} {"train_loss": -38.962379455566406, "global_step": 167204, "epoch": 1381} {"train_loss": -38.93656539916992, "global_step": 167205, "epoch": 1381} {"train_loss": -39.32927703857422, "global_step": 167206, "epoch": 1381} {"train_loss": -38.99270248413086, "global_step": 167207, "epoch": 1381} {"train_loss": -39.38542556762695, "global_step": 167208, "epoch": 1381} {"train_loss": -39.56167221069336, "global_step": 167209, "epoch": 1381} {"train_loss": -39.209651947021484, "global_step": 167210, "epoch": 1381} {"train_loss": -38.82375717163086, "global_step": 167211, "epoch": 1381} {"train_loss": -39.039947509765625, "global_step": 167212, "epoch": 1381} {"train_loss": -39.27131271362305, "global_step": 167213, "epoch": 1381} {"train_loss": -39.64773178100586, "global_step": 167214, "epoch": 1381} {"train_loss": -38.36373519897461, "global_step": 167215, "epoch": 1381} {"train_loss": -39.662742614746094, "global_step": 167216, "epoch": 1381} {"train_loss": -39.06590270996094, "global_step": 167217, "epoch": 1381} {"train_loss": -39.24967575073242, "global_step": 167218, "epoch": 1381} {"train_loss": -39.42562484741211, "global_step": 167219, "epoch": 1381} {"train_loss": -40.01549530029297, "global_step": 167220, "epoch": 1381} {"train_loss": -36.83533794623761, "global_step": 167221, "epoch": 1381, "val_loss": 2573591.25} {"train_loss": -39.38637161254883, "global_step": 167222, "epoch": 1382} {"train_loss": -39.96209716796875, "global_step": 167223, "epoch": 1382} {"train_loss": -39.05811309814453, "global_step": 167224, "epoch": 1382} {"train_loss": -39.417362213134766, "global_step": 167225, "epoch": 1382} {"train_loss": -39.497562408447266, "global_step": 167226, "epoch": 1382} {"train_loss": -38.9949836730957, "global_step": 167227, "epoch": 1382} {"train_loss": -39.312931060791016, "global_step": 167228, "epoch": 1382} {"train_loss": -39.421321868896484, "global_step": 167229, "epoch": 1382} {"train_loss": -39.42389678955078, "global_step": 167230, "epoch": 1382} {"train_loss": -39.78596115112305, "global_step": 167231, "epoch": 1382} {"train_loss": -39.88906478881836, "global_step": 167232, "epoch": 1382} {"train_loss": -39.35697555541992, "global_step": 167233, "epoch": 1382} {"train_loss": -38.87465286254883, "global_step": 167234, "epoch": 1382} {"train_loss": -39.183624267578125, "global_step": 167235, "epoch": 1382} {"train_loss": -39.61483383178711, "global_step": 167236, "epoch": 1382} {"train_loss": -40.02625274658203, "global_step": 167237, "epoch": 1382} {"train_loss": -40.106388092041016, "global_step": 167238, "epoch": 1382} {"train_loss": -39.37773513793945, "global_step": 167239, "epoch": 1382} {"train_loss": -38.86708450317383, "global_step": 167240, "epoch": 1382} {"train_loss": -38.660499572753906, "global_step": 167241, "epoch": 1382} {"train_loss": -39.08695602416992, "global_step": 167242, "epoch": 1382} {"train_loss": -37.53466033935547, "global_step": 167243, "epoch": 1382} {"train_loss": -36.95292282104492, "global_step": 167244, "epoch": 1382} {"train_loss": -37.64569854736328, "global_step": 167245, "epoch": 1382} {"train_loss": -38.476348876953125, "global_step": 167246, "epoch": 1382} {"train_loss": -39.555381774902344, "global_step": 167247, "epoch": 1382} {"train_loss": -38.76765060424805, "global_step": 167248, "epoch": 1382} {"train_loss": -38.722442626953125, "global_step": 167249, "epoch": 1382} {"train_loss": -39.1525764465332, "global_step": 167250, "epoch": 1382} {"train_loss": -38.63332748413086, "global_step": 167251, "epoch": 1382} {"train_loss": -39.700538635253906, "global_step": 167252, "epoch": 1382} {"train_loss": -38.321773529052734, "global_step": 167253, "epoch": 1382} {"train_loss": -38.564945220947266, "global_step": 167254, "epoch": 1382} {"train_loss": -38.76447677612305, "global_step": 167255, "epoch": 1382} {"train_loss": -38.946311950683594, "global_step": 167256, "epoch": 1382} {"train_loss": -38.09033203125, "global_step": 167257, "epoch": 1382} {"train_loss": -38.87822341918945, "global_step": 167258, "epoch": 1382} {"train_loss": -39.24785232543945, "global_step": 167259, "epoch": 1382} {"train_loss": -39.19267654418945, "global_step": 167260, "epoch": 1382} {"train_loss": -39.895442962646484, "global_step": 167261, "epoch": 1382} {"train_loss": -37.9630126953125, "global_step": 167262, "epoch": 1382} {"train_loss": -39.61586380004883, "global_step": 167263, "epoch": 1382} {"train_loss": -38.918365478515625, "global_step": 167264, "epoch": 1382} {"train_loss": -39.743892669677734, "global_step": 167265, "epoch": 1382} {"train_loss": -37.547393798828125, "global_step": 167266, "epoch": 1382} {"train_loss": -40.26133346557617, "global_step": 167267, "epoch": 1382} {"train_loss": -39.703426361083984, "global_step": 167268, "epoch": 1382} {"train_loss": -39.365928649902344, "global_step": 167269, "epoch": 1382} {"train_loss": -40.14771270751953, "global_step": 167270, "epoch": 1382} {"train_loss": -39.51392364501953, "global_step": 167271, "epoch": 1382} {"train_loss": -38.30440902709961, "global_step": 167272, "epoch": 1382} {"train_loss": -39.74067306518555, "global_step": 167273, "epoch": 1382} {"train_loss": -40.536773681640625, "global_step": 167274, "epoch": 1382} {"train_loss": -38.7614631652832, "global_step": 167275, "epoch": 1382} {"train_loss": -40.093017578125, "global_step": 167276, "epoch": 1382} {"train_loss": -40.03685760498047, "global_step": 167277, "epoch": 1382} {"train_loss": -39.69749450683594, "global_step": 167278, "epoch": 1382} {"train_loss": -39.529029846191406, "global_step": 167279, "epoch": 1382} {"train_loss": -39.086116790771484, "global_step": 167280, "epoch": 1382} {"train_loss": -39.165809631347656, "global_step": 167281, "epoch": 1382} {"train_loss": -39.71751022338867, "global_step": 167282, "epoch": 1382} {"train_loss": -39.397377014160156, "global_step": 167283, "epoch": 1382} {"train_loss": -39.04194259643555, "global_step": 167284, "epoch": 1382} {"train_loss": -39.346527099609375, "global_step": 167285, "epoch": 1382} {"train_loss": -40.10442352294922, "global_step": 167286, "epoch": 1382} {"train_loss": -39.5164794921875, "global_step": 167287, "epoch": 1382} {"train_loss": -39.901832580566406, "global_step": 167288, "epoch": 1382} {"train_loss": -39.92091369628906, "global_step": 167289, "epoch": 1382} {"train_loss": -39.599971771240234, "global_step": 167290, "epoch": 1382} {"train_loss": -40.25191116333008, "global_step": 167291, "epoch": 1382} {"train_loss": -39.81907272338867, "global_step": 167292, "epoch": 1382} {"train_loss": -40.00823211669922, "global_step": 167293, "epoch": 1382} {"train_loss": -40.36060333251953, "global_step": 167294, "epoch": 1382} {"train_loss": -40.065635681152344, "global_step": 167295, "epoch": 1382} {"train_loss": -40.114315032958984, "global_step": 167296, "epoch": 1382} {"train_loss": -40.598506927490234, "global_step": 167297, "epoch": 1382} {"train_loss": -40.0731315612793, "global_step": 167298, "epoch": 1382} {"train_loss": -39.19953155517578, "global_step": 167299, "epoch": 1382} {"train_loss": -40.166046142578125, "global_step": 167300, "epoch": 1382} {"train_loss": -39.34245300292969, "global_step": 167301, "epoch": 1382} {"train_loss": -34.825660705566406, "global_step": 167302, "epoch": 1382} {"train_loss": -39.3447380065918, "global_step": 167303, "epoch": 1382} {"train_loss": -37.16611862182617, "global_step": 167304, "epoch": 1382} {"train_loss": -37.98812484741211, "global_step": 167305, "epoch": 1382} {"train_loss": -38.63100814819336, "global_step": 167306, "epoch": 1382} {"train_loss": -39.05813217163086, "global_step": 167307, "epoch": 1382} {"train_loss": -37.78276443481445, "global_step": 167308, "epoch": 1382} {"train_loss": -39.27117919921875, "global_step": 167309, "epoch": 1382} {"train_loss": -40.50136184692383, "global_step": 167310, "epoch": 1382} {"train_loss": -39.14783477783203, "global_step": 167311, "epoch": 1382} {"train_loss": -37.759456634521484, "global_step": 167312, "epoch": 1382} {"train_loss": -40.07741165161133, "global_step": 167313, "epoch": 1382} {"train_loss": -38.39405059814453, "global_step": 167314, "epoch": 1382} {"train_loss": -39.238826751708984, "global_step": 167315, "epoch": 1382} {"train_loss": -40.187801361083984, "global_step": 167316, "epoch": 1382} {"train_loss": -38.77131271362305, "global_step": 167317, "epoch": 1382} {"train_loss": -39.63693618774414, "global_step": 167318, "epoch": 1382} {"train_loss": -39.43016052246094, "global_step": 167319, "epoch": 1382} {"train_loss": -40.43094253540039, "global_step": 167320, "epoch": 1382} {"train_loss": -39.306880950927734, "global_step": 167321, "epoch": 1382} {"train_loss": -37.98897933959961, "global_step": 167322, "epoch": 1382} {"train_loss": -39.3329963684082, "global_step": 167323, "epoch": 1382} {"train_loss": -38.83953857421875, "global_step": 167324, "epoch": 1382} {"train_loss": -40.68498229980469, "global_step": 167325, "epoch": 1382} {"train_loss": -40.30535888671875, "global_step": 167326, "epoch": 1382} {"train_loss": -40.007686614990234, "global_step": 167327, "epoch": 1382} {"train_loss": -40.225746154785156, "global_step": 167328, "epoch": 1382} {"train_loss": -39.635128021240234, "global_step": 167329, "epoch": 1382} {"train_loss": -39.98147201538086, "global_step": 167330, "epoch": 1382} {"train_loss": -40.70920944213867, "global_step": 167331, "epoch": 1382} {"train_loss": -38.20273208618164, "global_step": 167332, "epoch": 1382} {"train_loss": -38.94456100463867, "global_step": 167333, "epoch": 1382} {"train_loss": -38.099239349365234, "global_step": 167334, "epoch": 1382} {"train_loss": -38.6152229309082, "global_step": 167335, "epoch": 1382} {"train_loss": -39.59716796875, "global_step": 167336, "epoch": 1382} {"train_loss": -38.92359161376953, "global_step": 167337, "epoch": 1382} {"train_loss": -40.25498962402344, "global_step": 167338, "epoch": 1382} {"train_loss": -38.99897003173828, "global_step": 167339, "epoch": 1382} {"train_loss": -39.66709518432617, "global_step": 167340, "epoch": 1382} {"train_loss": -39.446937561035156, "global_step": 167341, "epoch": 1382} {"train_loss": -39.26918783266682, "global_step": 167342, "epoch": 1382, "val_loss": 2648157.25} {"train_loss": -38.636566162109375, "global_step": 167343, "epoch": 1383} {"train_loss": -40.287818908691406, "global_step": 167344, "epoch": 1383} {"train_loss": -39.62102508544922, "global_step": 167345, "epoch": 1383} {"train_loss": -40.22233200073242, "global_step": 167346, "epoch": 1383} {"train_loss": -39.9711799621582, "global_step": 167347, "epoch": 1383} {"train_loss": -40.338314056396484, "global_step": 167348, "epoch": 1383} {"train_loss": -37.79546356201172, "global_step": 167349, "epoch": 1383} {"train_loss": -39.989227294921875, "global_step": 167350, "epoch": 1383} {"train_loss": -40.0808219909668, "global_step": 167351, "epoch": 1383} {"train_loss": -38.54768753051758, "global_step": 167352, "epoch": 1383} {"train_loss": -39.504249572753906, "global_step": 167353, "epoch": 1383} {"train_loss": -39.02309799194336, "global_step": 167354, "epoch": 1383} {"train_loss": -39.74399948120117, "global_step": 167355, "epoch": 1383} {"train_loss": -30.032150268554688, "global_step": 167356, "epoch": 1383} {"train_loss": -37.73017501831055, "global_step": 167357, "epoch": 1383} {"train_loss": -36.87489700317383, "global_step": 167358, "epoch": 1383} {"train_loss": -36.24813461303711, "global_step": 167359, "epoch": 1383} {"train_loss": -39.60922622680664, "global_step": 167360, "epoch": 1383} {"train_loss": -39.51749801635742, "global_step": 167361, "epoch": 1383} {"train_loss": -36.875465393066406, "global_step": 167362, "epoch": 1383} {"train_loss": -38.1426887512207, "global_step": 167363, "epoch": 1383} {"train_loss": -38.08462142944336, "global_step": 167364, "epoch": 1383} {"train_loss": -39.39751052856445, "global_step": 167365, "epoch": 1383} {"train_loss": -39.59649658203125, "global_step": 167366, "epoch": 1383} {"train_loss": -38.39088821411133, "global_step": 167367, "epoch": 1383} {"train_loss": -36.03489303588867, "global_step": 167368, "epoch": 1383} {"train_loss": -35.906673431396484, "global_step": 167369, "epoch": 1383} {"train_loss": -37.900726318359375, "global_step": 167370, "epoch": 1383} {"train_loss": -39.545440673828125, "global_step": 167371, "epoch": 1383} {"train_loss": -36.73428726196289, "global_step": 167372, "epoch": 1383} {"train_loss": -38.49040222167969, "global_step": 167373, "epoch": 1383} {"train_loss": -38.00393295288086, "global_step": 167374, "epoch": 1383} {"train_loss": -37.101234436035156, "global_step": 167375, "epoch": 1383} {"train_loss": -33.8944206237793, "global_step": 167376, "epoch": 1383} {"train_loss": -36.254268646240234, "global_step": 167377, "epoch": 1383} {"train_loss": -36.18268966674805, "global_step": 167378, "epoch": 1383} {"train_loss": -31.309326171875, "global_step": 167379, "epoch": 1383} {"train_loss": -34.49806594848633, "global_step": 167380, "epoch": 1383} {"train_loss": -38.14282989501953, "global_step": 167381, "epoch": 1383} {"train_loss": -38.086483001708984, "global_step": 167382, "epoch": 1383} {"train_loss": -35.53070831298828, "global_step": 167383, "epoch": 1383} {"train_loss": -34.61726379394531, "global_step": 167384, "epoch": 1383} {"train_loss": -31.883031845092773, "global_step": 167385, "epoch": 1383} {"train_loss": -35.50958251953125, "global_step": 167386, "epoch": 1383} {"train_loss": -36.77274703979492, "global_step": 167387, "epoch": 1383} {"train_loss": -37.995601654052734, "global_step": 167388, "epoch": 1383} {"train_loss": -34.754127502441406, "global_step": 167389, "epoch": 1383} {"train_loss": -37.69511032104492, "global_step": 167390, "epoch": 1383} {"train_loss": -37.79679489135742, "global_step": 167391, "epoch": 1383} {"train_loss": -36.00251388549805, "global_step": 167392, "epoch": 1383} {"train_loss": -37.83450698852539, "global_step": 167393, "epoch": 1383} {"train_loss": -39.07136154174805, "global_step": 167394, "epoch": 1383} {"train_loss": -38.125301361083984, "global_step": 167395, "epoch": 1383} {"train_loss": -38.497589111328125, "global_step": 167396, "epoch": 1383} {"train_loss": -37.713600158691406, "global_step": 167397, "epoch": 1383} {"train_loss": -31.608190536499023, "global_step": 167398, "epoch": 1383} {"train_loss": -37.253395080566406, "global_step": 167399, "epoch": 1383} {"train_loss": -38.118499755859375, "global_step": 167400, "epoch": 1383} {"train_loss": -37.61151123046875, "global_step": 167401, "epoch": 1383} {"train_loss": -36.81240463256836, "global_step": 167402, "epoch": 1383} {"train_loss": -37.83974075317383, "global_step": 167403, "epoch": 1383} {"train_loss": -37.79470443725586, "global_step": 167404, "epoch": 1383} {"train_loss": -37.957584381103516, "global_step": 167405, "epoch": 1383} {"train_loss": -37.03125762939453, "global_step": 167406, "epoch": 1383} {"train_loss": -38.42033004760742, "global_step": 167407, "epoch": 1383} {"train_loss": -35.768917083740234, "global_step": 167408, "epoch": 1383} {"train_loss": -36.62297439575195, "global_step": 167409, "epoch": 1383} {"train_loss": -38.20969009399414, "global_step": 167410, "epoch": 1383} {"train_loss": -37.71128463745117, "global_step": 167411, "epoch": 1383} {"train_loss": -37.57746887207031, "global_step": 167412, "epoch": 1383} {"train_loss": -38.976383209228516, "global_step": 167413, "epoch": 1383} {"train_loss": -38.032955169677734, "global_step": 167414, "epoch": 1383} {"train_loss": -36.291358947753906, "global_step": 167415, "epoch": 1383} {"train_loss": -38.52218246459961, "global_step": 167416, "epoch": 1383} {"train_loss": -38.67380905151367, "global_step": 167417, "epoch": 1383} {"train_loss": -38.682498931884766, "global_step": 167418, "epoch": 1383} {"train_loss": -38.33071517944336, "global_step": 167419, "epoch": 1383} {"train_loss": -38.95534133911133, "global_step": 167420, "epoch": 1383} {"train_loss": -38.69655990600586, "global_step": 167421, "epoch": 1383} {"train_loss": -39.15256881713867, "global_step": 167422, "epoch": 1383} {"train_loss": -38.743141174316406, "global_step": 167423, "epoch": 1383} {"train_loss": -37.951168060302734, "global_step": 167424, "epoch": 1383} {"train_loss": -38.69196319580078, "global_step": 167425, "epoch": 1383} {"train_loss": -38.61731719970703, "global_step": 167426, "epoch": 1383} {"train_loss": -38.92397689819336, "global_step": 167427, "epoch": 1383} {"train_loss": -39.26165771484375, "global_step": 167428, "epoch": 1383} {"train_loss": -39.55218505859375, "global_step": 167429, "epoch": 1383} {"train_loss": -39.532344818115234, "global_step": 167430, "epoch": 1383} {"train_loss": -39.5311279296875, "global_step": 167431, "epoch": 1383} {"train_loss": -39.29254150390625, "global_step": 167432, "epoch": 1383} {"train_loss": -39.41426086425781, "global_step": 167433, "epoch": 1383} {"train_loss": -39.292659759521484, "global_step": 167434, "epoch": 1383} {"train_loss": -38.759517669677734, "global_step": 167435, "epoch": 1383} {"train_loss": -39.084049224853516, "global_step": 167436, "epoch": 1383} {"train_loss": -38.67924118041992, "global_step": 167437, "epoch": 1383} {"train_loss": -38.94451904296875, "global_step": 167438, "epoch": 1383} {"train_loss": -39.455867767333984, "global_step": 167439, "epoch": 1383} {"train_loss": -39.27616500854492, "global_step": 167440, "epoch": 1383} {"train_loss": -39.383216857910156, "global_step": 167441, "epoch": 1383} {"train_loss": -39.32957077026367, "global_step": 167442, "epoch": 1383} {"train_loss": -39.32828903198242, "global_step": 167443, "epoch": 1383} {"train_loss": -38.629940032958984, "global_step": 167444, "epoch": 1383} {"train_loss": -39.058773040771484, "global_step": 167445, "epoch": 1383} {"train_loss": -38.28438186645508, "global_step": 167446, "epoch": 1383} {"train_loss": -39.78432846069336, "global_step": 167447, "epoch": 1383} {"train_loss": -39.45315170288086, "global_step": 167448, "epoch": 1383} {"train_loss": -40.15318298339844, "global_step": 167449, "epoch": 1383} {"train_loss": -39.02473068237305, "global_step": 167450, "epoch": 1383} {"train_loss": -39.81765365600586, "global_step": 167451, "epoch": 1383} {"train_loss": -39.578731536865234, "global_step": 167452, "epoch": 1383} {"train_loss": -39.2223014831543, "global_step": 167453, "epoch": 1383} {"train_loss": -39.32062530517578, "global_step": 167454, "epoch": 1383} {"train_loss": -39.8358154296875, "global_step": 167455, "epoch": 1383} {"train_loss": -40.199764251708984, "global_step": 167456, "epoch": 1383} {"train_loss": -39.9229850769043, "global_step": 167457, "epoch": 1383} {"train_loss": -39.61758804321289, "global_step": 167458, "epoch": 1383} {"train_loss": -39.898677825927734, "global_step": 167459, "epoch": 1383} {"train_loss": -40.32990646362305, "global_step": 167460, "epoch": 1383} {"train_loss": -39.965980529785156, "global_step": 167461, "epoch": 1383} {"train_loss": -39.96681594848633, "global_step": 167462, "epoch": 1383} {"train_loss": -38.14597298488144, "global_step": 167463, "epoch": 1383, "val_loss": 2646027.25} {"train_loss": -39.30049133300781, "global_step": 167464, "epoch": 1384} {"train_loss": -40.21842956542969, "global_step": 167465, "epoch": 1384} {"train_loss": -40.548797607421875, "global_step": 167466, "epoch": 1384} {"train_loss": -40.16361999511719, "global_step": 167467, "epoch": 1384} {"train_loss": -39.95893478393555, "global_step": 167468, "epoch": 1384} {"train_loss": -39.77877426147461, "global_step": 167469, "epoch": 1384} {"train_loss": -39.406822204589844, "global_step": 167470, "epoch": 1384} {"train_loss": -40.09507751464844, "global_step": 167471, "epoch": 1384} {"train_loss": -40.335872650146484, "global_step": 167472, "epoch": 1384} {"train_loss": -39.583152770996094, "global_step": 167473, "epoch": 1384} {"train_loss": -40.53764724731445, "global_step": 167474, "epoch": 1384} {"train_loss": -40.01131820678711, "global_step": 167475, "epoch": 1384} {"train_loss": -40.61711120605469, "global_step": 167476, "epoch": 1384} {"train_loss": -40.02092361450195, "global_step": 167477, "epoch": 1384} {"train_loss": -39.84821319580078, "global_step": 167478, "epoch": 1384} {"train_loss": -38.75062561035156, "global_step": 167479, "epoch": 1384} {"train_loss": -33.9998893737793, "global_step": 167480, "epoch": 1384} {"train_loss": -23.015296936035156, "global_step": 167481, "epoch": 1384} {"train_loss": -26.025609970092773, "global_step": 167482, "epoch": 1384} {"train_loss": -39.621681213378906, "global_step": 167483, "epoch": 1384} {"train_loss": -33.610103607177734, "global_step": 167484, "epoch": 1384} {"train_loss": -32.373043060302734, "global_step": 167485, "epoch": 1384} {"train_loss": -38.378509521484375, "global_step": 167486, "epoch": 1384} {"train_loss": -32.837074279785156, "global_step": 167487, "epoch": 1384} {"train_loss": -38.79425811767578, "global_step": 167488, "epoch": 1384} {"train_loss": -34.240169525146484, "global_step": 167489, "epoch": 1384} {"train_loss": -39.15732955932617, "global_step": 167490, "epoch": 1384} {"train_loss": -35.995914459228516, "global_step": 167491, "epoch": 1384} {"train_loss": -39.0009765625, "global_step": 167492, "epoch": 1384} {"train_loss": -37.31669235229492, "global_step": 167493, "epoch": 1384} {"train_loss": -39.42141342163086, "global_step": 167494, "epoch": 1384} {"train_loss": -37.20851516723633, "global_step": 167495, "epoch": 1384} {"train_loss": -39.83200454711914, "global_step": 167496, "epoch": 1384} {"train_loss": -38.67694854736328, "global_step": 167497, "epoch": 1384} {"train_loss": -39.507137298583984, "global_step": 167498, "epoch": 1384} {"train_loss": -37.912017822265625, "global_step": 167499, "epoch": 1384} {"train_loss": -36.82806396484375, "global_step": 167500, "epoch": 1384} {"train_loss": -38.52128982543945, "global_step": 167501, "epoch": 1384} {"train_loss": -36.138275146484375, "global_step": 167502, "epoch": 1384} {"train_loss": -38.505157470703125, "global_step": 167503, "epoch": 1384} {"train_loss": -36.520660400390625, "global_step": 167504, "epoch": 1384} {"train_loss": -39.05858612060547, "global_step": 167505, "epoch": 1384} {"train_loss": -37.36341094970703, "global_step": 167506, "epoch": 1384} {"train_loss": -38.98092269897461, "global_step": 167507, "epoch": 1384} {"train_loss": -38.85272979736328, "global_step": 167508, "epoch": 1384} {"train_loss": -38.09835433959961, "global_step": 167509, "epoch": 1384} {"train_loss": -39.66295623779297, "global_step": 167510, "epoch": 1384} {"train_loss": -39.286685943603516, "global_step": 167511, "epoch": 1384} {"train_loss": -38.098976135253906, "global_step": 167512, "epoch": 1384} {"train_loss": -39.92843246459961, "global_step": 167513, "epoch": 1384} {"train_loss": -38.36277389526367, "global_step": 167514, "epoch": 1384} {"train_loss": -39.173458099365234, "global_step": 167515, "epoch": 1384} {"train_loss": -39.64359664916992, "global_step": 167516, "epoch": 1384} {"train_loss": -38.92879867553711, "global_step": 167517, "epoch": 1384} {"train_loss": -40.00164794921875, "global_step": 167518, "epoch": 1384} {"train_loss": -39.582122802734375, "global_step": 167519, "epoch": 1384} {"train_loss": -40.02106857299805, "global_step": 167520, "epoch": 1384} {"train_loss": -40.55948257446289, "global_step": 167521, "epoch": 1384} {"train_loss": -38.95143508911133, "global_step": 167522, "epoch": 1384} {"train_loss": -39.969520568847656, "global_step": 167523, "epoch": 1384} {"train_loss": -40.021358489990234, "global_step": 167524, "epoch": 1384} {"train_loss": -39.716697692871094, "global_step": 167525, "epoch": 1384} {"train_loss": -39.5830192565918, "global_step": 167526, "epoch": 1384} {"train_loss": -37.56501007080078, "global_step": 167527, "epoch": 1384} {"train_loss": -39.84162521362305, "global_step": 167528, "epoch": 1384} {"train_loss": -39.01740264892578, "global_step": 167529, "epoch": 1384} {"train_loss": -39.23875427246094, "global_step": 167530, "epoch": 1384} {"train_loss": -39.05934524536133, "global_step": 167531, "epoch": 1384} {"train_loss": -37.71493148803711, "global_step": 167532, "epoch": 1384} {"train_loss": -36.34185791015625, "global_step": 167533, "epoch": 1384} {"train_loss": -38.792320251464844, "global_step": 167534, "epoch": 1384} {"train_loss": -39.070587158203125, "global_step": 167535, "epoch": 1384} {"train_loss": -39.91899108886719, "global_step": 167536, "epoch": 1384} {"train_loss": -38.76321792602539, "global_step": 167537, "epoch": 1384} {"train_loss": -37.8735237121582, "global_step": 167538, "epoch": 1384} {"train_loss": -38.62415313720703, "global_step": 167539, "epoch": 1384} {"train_loss": -38.768428802490234, "global_step": 167540, "epoch": 1384} {"train_loss": -38.97291564941406, "global_step": 167541, "epoch": 1384} {"train_loss": -38.98662567138672, "global_step": 167542, "epoch": 1384} {"train_loss": -39.6103515625, "global_step": 167543, "epoch": 1384} {"train_loss": -39.5649299621582, "global_step": 167544, "epoch": 1384} {"train_loss": -38.60148239135742, "global_step": 167545, "epoch": 1384} {"train_loss": -35.00417709350586, "global_step": 167546, "epoch": 1384} {"train_loss": -37.71939468383789, "global_step": 167547, "epoch": 1384} {"train_loss": -39.30994415283203, "global_step": 167548, "epoch": 1384} {"train_loss": -37.08190155029297, "global_step": 167549, "epoch": 1384} {"train_loss": -37.3114128112793, "global_step": 167550, "epoch": 1384} {"train_loss": -37.57495880126953, "global_step": 167551, "epoch": 1384} {"train_loss": -37.13630676269531, "global_step": 167552, "epoch": 1384} {"train_loss": -35.102294921875, "global_step": 167553, "epoch": 1384} {"train_loss": -37.651119232177734, "global_step": 167554, "epoch": 1384} {"train_loss": -36.74551773071289, "global_step": 167555, "epoch": 1384} {"train_loss": -37.05360412597656, "global_step": 167556, "epoch": 1384} {"train_loss": -37.01144027709961, "global_step": 167557, "epoch": 1384} {"train_loss": -33.85004806518555, "global_step": 167558, "epoch": 1384} {"train_loss": -37.22775650024414, "global_step": 167559, "epoch": 1384} {"train_loss": -35.799354553222656, "global_step": 167560, "epoch": 1384} {"train_loss": -33.87102508544922, "global_step": 167561, "epoch": 1384} {"train_loss": -37.65310287475586, "global_step": 167562, "epoch": 1384} {"train_loss": -36.454681396484375, "global_step": 167563, "epoch": 1384} {"train_loss": -37.00322723388672, "global_step": 167564, "epoch": 1384} {"train_loss": -38.37273406982422, "global_step": 167565, "epoch": 1384} {"train_loss": -37.62366485595703, "global_step": 167566, "epoch": 1384} {"train_loss": -37.73979568481445, "global_step": 167567, "epoch": 1384} {"train_loss": -37.654571533203125, "global_step": 167568, "epoch": 1384} {"train_loss": -35.8687744140625, "global_step": 167569, "epoch": 1384} {"train_loss": -36.108856201171875, "global_step": 167570, "epoch": 1384} {"train_loss": -38.7086181640625, "global_step": 167571, "epoch": 1384} {"train_loss": -38.453094482421875, "global_step": 167572, "epoch": 1384} {"train_loss": -38.18210220336914, "global_step": 167573, "epoch": 1384} {"train_loss": -37.15803909301758, "global_step": 167574, "epoch": 1384} {"train_loss": -33.91469192504883, "global_step": 167575, "epoch": 1384} {"train_loss": -38.318992614746094, "global_step": 167576, "epoch": 1384} {"train_loss": -35.9687614440918, "global_step": 167577, "epoch": 1384} {"train_loss": -38.22359085083008, "global_step": 167578, "epoch": 1384} {"train_loss": -38.546688079833984, "global_step": 167579, "epoch": 1384} {"train_loss": -33.16815185546875, "global_step": 167580, "epoch": 1384} {"train_loss": -36.46145248413086, "global_step": 167581, "epoch": 1384} {"train_loss": -37.85144805908203, "global_step": 167582, "epoch": 1384} {"train_loss": -38.20631790161133, "global_step": 167583, "epoch": 1384} {"train_loss": -37.869547016364486, "global_step": 167584, "epoch": 1384, "val_loss": 2711797.75} {"train_loss": -36.23580551147461, "global_step": 167585, "epoch": 1385} {"train_loss": -35.19892883300781, "global_step": 167586, "epoch": 1385} {"train_loss": -36.245849609375, "global_step": 167587, "epoch": 1385} {"train_loss": -36.83150100708008, "global_step": 167588, "epoch": 1385} {"train_loss": -37.58186721801758, "global_step": 167589, "epoch": 1385} {"train_loss": -38.31489181518555, "global_step": 167590, "epoch": 1385} {"train_loss": -37.6351318359375, "global_step": 167591, "epoch": 1385} {"train_loss": -36.5269775390625, "global_step": 167592, "epoch": 1385} {"train_loss": -37.096927642822266, "global_step": 167593, "epoch": 1385} {"train_loss": -35.87403869628906, "global_step": 167594, "epoch": 1385} {"train_loss": -35.05347442626953, "global_step": 167595, "epoch": 1385} {"train_loss": -37.25665283203125, "global_step": 167596, "epoch": 1385} {"train_loss": -37.47054672241211, "global_step": 167597, "epoch": 1385} {"train_loss": -37.74879837036133, "global_step": 167598, "epoch": 1385} {"train_loss": -37.742591857910156, "global_step": 167599, "epoch": 1385} {"train_loss": -38.46181869506836, "global_step": 167600, "epoch": 1385} {"train_loss": -38.600582122802734, "global_step": 167601, "epoch": 1385} {"train_loss": -37.80638122558594, "global_step": 167602, "epoch": 1385} {"train_loss": -35.84795379638672, "global_step": 167603, "epoch": 1385} {"train_loss": -38.42129135131836, "global_step": 167604, "epoch": 1385} {"train_loss": -39.329341888427734, "global_step": 167605, "epoch": 1385} {"train_loss": -37.858154296875, "global_step": 167606, "epoch": 1385} {"train_loss": -38.081050872802734, "global_step": 167607, "epoch": 1385} {"train_loss": -37.323646545410156, "global_step": 167608, "epoch": 1385} {"train_loss": -38.69832229614258, "global_step": 167609, "epoch": 1385} {"train_loss": -39.0312614440918, "global_step": 167610, "epoch": 1385} {"train_loss": -39.19432067871094, "global_step": 167611, "epoch": 1385} {"train_loss": -38.90867233276367, "global_step": 167612, "epoch": 1385} {"train_loss": -39.07253646850586, "global_step": 167613, "epoch": 1385} {"train_loss": -38.85995101928711, "global_step": 167614, "epoch": 1385} {"train_loss": -39.167293548583984, "global_step": 167615, "epoch": 1385} {"train_loss": -38.740135192871094, "global_step": 167616, "epoch": 1385} {"train_loss": -39.22309112548828, "global_step": 167617, "epoch": 1385} {"train_loss": -38.2359504699707, "global_step": 167618, "epoch": 1385} {"train_loss": -39.079795837402344, "global_step": 167619, "epoch": 1385} {"train_loss": -39.52484893798828, "global_step": 167620, "epoch": 1385} {"train_loss": -39.06934356689453, "global_step": 167621, "epoch": 1385} {"train_loss": -39.12102508544922, "global_step": 167622, "epoch": 1385} {"train_loss": -39.29728698730469, "global_step": 167623, "epoch": 1385} {"train_loss": -39.2818489074707, "global_step": 167624, "epoch": 1385} {"train_loss": -39.349945068359375, "global_step": 167625, "epoch": 1385} {"train_loss": -38.48535919189453, "global_step": 167626, "epoch": 1385} {"train_loss": -39.00051498413086, "global_step": 167627, "epoch": 1385} {"train_loss": -39.01001739501953, "global_step": 167628, "epoch": 1385} {"train_loss": -38.9365348815918, "global_step": 167629, "epoch": 1385} {"train_loss": -39.83897018432617, "global_step": 167630, "epoch": 1385} {"train_loss": -39.49480056762695, "global_step": 167631, "epoch": 1385} {"train_loss": -38.579437255859375, "global_step": 167632, "epoch": 1385} {"train_loss": -39.5704345703125, "global_step": 167633, "epoch": 1385} {"train_loss": -39.40071487426758, "global_step": 167634, "epoch": 1385} {"train_loss": -39.27024841308594, "global_step": 167635, "epoch": 1385} {"train_loss": -39.5509147644043, "global_step": 167636, "epoch": 1385} {"train_loss": -39.45502853393555, "global_step": 167637, "epoch": 1385} {"train_loss": -39.90336227416992, "global_step": 167638, "epoch": 1385} {"train_loss": -39.48963928222656, "global_step": 167639, "epoch": 1385} {"train_loss": -39.4080924987793, "global_step": 167640, "epoch": 1385} {"train_loss": -40.06657028198242, "global_step": 167641, "epoch": 1385} {"train_loss": -39.558380126953125, "global_step": 167642, "epoch": 1385} {"train_loss": -39.96021270751953, "global_step": 167643, "epoch": 1385} {"train_loss": -40.1622200012207, "global_step": 167644, "epoch": 1385} {"train_loss": -40.01762771606445, "global_step": 167645, "epoch": 1385} {"train_loss": -40.23210906982422, "global_step": 167646, "epoch": 1385} {"train_loss": -40.26967239379883, "global_step": 167647, "epoch": 1385} {"train_loss": -40.08809280395508, "global_step": 167648, "epoch": 1385} {"train_loss": -40.28347396850586, "global_step": 167649, "epoch": 1385} {"train_loss": -40.006221771240234, "global_step": 167650, "epoch": 1385} {"train_loss": -40.3345947265625, "global_step": 167651, "epoch": 1385} {"train_loss": -40.26193618774414, "global_step": 167652, "epoch": 1385} {"train_loss": -40.05170822143555, "global_step": 167653, "epoch": 1385} {"train_loss": -40.05779266357422, "global_step": 167654, "epoch": 1385} {"train_loss": -40.31843566894531, "global_step": 167655, "epoch": 1385} {"train_loss": -40.25271224975586, "global_step": 167656, "epoch": 1385} {"train_loss": -40.19636535644531, "global_step": 167657, "epoch": 1385} {"train_loss": -40.28742218017578, "global_step": 167658, "epoch": 1385} {"train_loss": -40.40555953979492, "global_step": 167659, "epoch": 1385} {"train_loss": -40.3167839050293, "global_step": 167660, "epoch": 1385} {"train_loss": -40.22673416137695, "global_step": 167661, "epoch": 1385} {"train_loss": -40.21188735961914, "global_step": 167662, "epoch": 1385} {"train_loss": -40.53791809082031, "global_step": 167663, "epoch": 1385} {"train_loss": -39.98094177246094, "global_step": 167664, "epoch": 1385} {"train_loss": -40.18159866333008, "global_step": 167665, "epoch": 1385} {"train_loss": -40.1559944152832, "global_step": 167666, "epoch": 1385} {"train_loss": -39.78619384765625, "global_step": 167667, "epoch": 1385} {"train_loss": -37.73868942260742, "global_step": 167668, "epoch": 1385} {"train_loss": -35.96592712402344, "global_step": 167669, "epoch": 1385} {"train_loss": -36.899078369140625, "global_step": 167670, "epoch": 1385} {"train_loss": -39.30799102783203, "global_step": 167671, "epoch": 1385} {"train_loss": -40.03211975097656, "global_step": 167672, "epoch": 1385} {"train_loss": -40.01179122924805, "global_step": 167673, "epoch": 1385} {"train_loss": -38.777767181396484, "global_step": 167674, "epoch": 1385} {"train_loss": -39.969173431396484, "global_step": 167675, "epoch": 1385} {"train_loss": -40.29149627685547, "global_step": 167676, "epoch": 1385} {"train_loss": -40.0400505065918, "global_step": 167677, "epoch": 1385} {"train_loss": -40.761287689208984, "global_step": 167678, "epoch": 1385} {"train_loss": -40.678192138671875, "global_step": 167679, "epoch": 1385} {"train_loss": -40.71443557739258, "global_step": 167680, "epoch": 1385} {"train_loss": -40.77498245239258, "global_step": 167681, "epoch": 1385} {"train_loss": -40.711021423339844, "global_step": 167682, "epoch": 1385} {"train_loss": -40.556549072265625, "global_step": 167683, "epoch": 1385} {"train_loss": -40.808101654052734, "global_step": 167684, "epoch": 1385} {"train_loss": -40.56757354736328, "global_step": 167685, "epoch": 1385} {"train_loss": -40.76936340332031, "global_step": 167686, "epoch": 1385} {"train_loss": -40.65078353881836, "global_step": 167687, "epoch": 1385} {"train_loss": -40.047725677490234, "global_step": 167688, "epoch": 1385} {"train_loss": -39.414947509765625, "global_step": 167689, "epoch": 1385} {"train_loss": -37.34257125854492, "global_step": 167690, "epoch": 1385} {"train_loss": -28.885150909423828, "global_step": 167691, "epoch": 1385} {"train_loss": -11.483569145202637, "global_step": 167692, "epoch": 1385} {"train_loss": -25.84975242614746, "global_step": 167693, "epoch": 1385} {"train_loss": -39.504695892333984, "global_step": 167694, "epoch": 1385} {"train_loss": -30.140411376953125, "global_step": 167695, "epoch": 1385} {"train_loss": -37.42304229736328, "global_step": 167696, "epoch": 1385} {"train_loss": -33.11310577392578, "global_step": 167697, "epoch": 1385} {"train_loss": -36.500038146972656, "global_step": 167698, "epoch": 1385} {"train_loss": -31.9002628326416, "global_step": 167699, "epoch": 1385} {"train_loss": -37.244319915771484, "global_step": 167700, "epoch": 1385} {"train_loss": -35.95167922973633, "global_step": 167701, "epoch": 1385} {"train_loss": -38.574459075927734, "global_step": 167702, "epoch": 1385} {"train_loss": -36.1823844909668, "global_step": 167703, "epoch": 1385} {"train_loss": -39.11104202270508, "global_step": 167704, "epoch": 1385} {"train_loss": -38.37725845053176, "global_step": 167705, "epoch": 1385, "val_loss": 2662854.0} {"train_loss": -39.24117660522461, "global_step": 167706, "epoch": 1386} {"train_loss": -39.152313232421875, "global_step": 167707, "epoch": 1386} {"train_loss": -38.76585388183594, "global_step": 167708, "epoch": 1386} {"train_loss": -40.106239318847656, "global_step": 167709, "epoch": 1386} {"train_loss": -38.612789154052734, "global_step": 167710, "epoch": 1386} {"train_loss": -39.66605758666992, "global_step": 167711, "epoch": 1386} {"train_loss": -39.509979248046875, "global_step": 167712, "epoch": 1386} {"train_loss": -39.64146041870117, "global_step": 167713, "epoch": 1386} {"train_loss": -39.91762924194336, "global_step": 167714, "epoch": 1386} {"train_loss": -39.93949508666992, "global_step": 167715, "epoch": 1386} {"train_loss": -40.41230392456055, "global_step": 167716, "epoch": 1386} {"train_loss": -39.56606674194336, "global_step": 167717, "epoch": 1386} {"train_loss": -40.25527572631836, "global_step": 167718, "epoch": 1386} {"train_loss": -40.23910140991211, "global_step": 167719, "epoch": 1386} {"train_loss": -40.28522872924805, "global_step": 167720, "epoch": 1386} {"train_loss": -40.195465087890625, "global_step": 167721, "epoch": 1386} {"train_loss": -39.73757553100586, "global_step": 167722, "epoch": 1386} {"train_loss": -40.4520378112793, "global_step": 167723, "epoch": 1386} {"train_loss": -40.372047424316406, "global_step": 167724, "epoch": 1386} {"train_loss": -40.41450881958008, "global_step": 167725, "epoch": 1386} {"train_loss": -40.30012893676758, "global_step": 167726, "epoch": 1386} {"train_loss": -40.66187286376953, "global_step": 167727, "epoch": 1386} {"train_loss": -40.76266860961914, "global_step": 167728, "epoch": 1386} {"train_loss": -40.80568313598633, "global_step": 167729, "epoch": 1386} {"train_loss": -40.82221221923828, "global_step": 167730, "epoch": 1386} {"train_loss": -40.353904724121094, "global_step": 167731, "epoch": 1386} {"train_loss": -40.89793014526367, "global_step": 167732, "epoch": 1386} {"train_loss": -40.82438659667969, "global_step": 167733, "epoch": 1386} {"train_loss": -41.22406768798828, "global_step": 167734, "epoch": 1386} {"train_loss": -40.80364227294922, "global_step": 167735, "epoch": 1386} {"train_loss": -41.214839935302734, "global_step": 167736, "epoch": 1386} {"train_loss": -40.87537384033203, "global_step": 167737, "epoch": 1386} {"train_loss": -41.220943450927734, "global_step": 167738, "epoch": 1386} {"train_loss": -41.13618850708008, "global_step": 167739, "epoch": 1386} {"train_loss": -40.74102783203125, "global_step": 167740, "epoch": 1386} {"train_loss": -41.03717803955078, "global_step": 167741, "epoch": 1386} {"train_loss": -41.51865768432617, "global_step": 167742, "epoch": 1386} {"train_loss": -41.52449417114258, "global_step": 167743, "epoch": 1386} {"train_loss": -40.73727035522461, "global_step": 167744, "epoch": 1386} {"train_loss": -40.90082931518555, "global_step": 167745, "epoch": 1386} {"train_loss": -41.25414276123047, "global_step": 167746, "epoch": 1386} {"train_loss": -40.43231964111328, "global_step": 167747, "epoch": 1386} {"train_loss": -41.238887786865234, "global_step": 167748, "epoch": 1386} {"train_loss": -41.10630416870117, "global_step": 167749, "epoch": 1386} {"train_loss": -40.8835563659668, "global_step": 167750, "epoch": 1386} {"train_loss": -40.875770568847656, "global_step": 167751, "epoch": 1386} {"train_loss": -40.78790283203125, "global_step": 167752, "epoch": 1386} {"train_loss": -40.98340606689453, "global_step": 167753, "epoch": 1386} {"train_loss": -41.2618293762207, "global_step": 167754, "epoch": 1386} {"train_loss": -41.67387008666992, "global_step": 167755, "epoch": 1386} {"train_loss": -40.86393356323242, "global_step": 167756, "epoch": 1386} {"train_loss": -41.09098434448242, "global_step": 167757, "epoch": 1386} {"train_loss": -40.9176025390625, "global_step": 167758, "epoch": 1386} {"train_loss": -41.7033805847168, "global_step": 167759, "epoch": 1386} {"train_loss": -40.93142318725586, "global_step": 167760, "epoch": 1386} {"train_loss": -39.88288497924805, "global_step": 167761, "epoch": 1386} {"train_loss": -39.86537551879883, "global_step": 167762, "epoch": 1386} {"train_loss": -39.44724655151367, "global_step": 167763, "epoch": 1386} {"train_loss": -40.32322692871094, "global_step": 167764, "epoch": 1386} {"train_loss": -40.99669647216797, "global_step": 167765, "epoch": 1386} {"train_loss": -39.28697204589844, "global_step": 167766, "epoch": 1386} {"train_loss": -39.789302825927734, "global_step": 167767, "epoch": 1386} {"train_loss": -40.67636489868164, "global_step": 167768, "epoch": 1386} {"train_loss": -41.12286376953125, "global_step": 167769, "epoch": 1386} {"train_loss": -40.98875045776367, "global_step": 167770, "epoch": 1386} {"train_loss": -40.80442428588867, "global_step": 167771, "epoch": 1386} {"train_loss": -41.53843307495117, "global_step": 167772, "epoch": 1386} {"train_loss": -41.00883102416992, "global_step": 167773, "epoch": 1386} {"train_loss": -40.917083740234375, "global_step": 167774, "epoch": 1386} {"train_loss": -40.21855545043945, "global_step": 167775, "epoch": 1386} {"train_loss": -36.732913970947266, "global_step": 167776, "epoch": 1386} {"train_loss": -23.97901725769043, "global_step": 167777, "epoch": 1386} {"train_loss": -9.091593742370605, "global_step": 167778, "epoch": 1386} {"train_loss": -29.27680015563965, "global_step": 167779, "epoch": 1386} {"train_loss": -37.78303146362305, "global_step": 167780, "epoch": 1386} {"train_loss": -26.16412925720215, "global_step": 167781, "epoch": 1386} {"train_loss": -38.8460578918457, "global_step": 167782, "epoch": 1386} {"train_loss": -26.10987663269043, "global_step": 167783, "epoch": 1386} {"train_loss": -37.058204650878906, "global_step": 167784, "epoch": 1386} {"train_loss": -31.142160415649414, "global_step": 167785, "epoch": 1386} {"train_loss": -37.849002838134766, "global_step": 167786, "epoch": 1386} {"train_loss": -33.186546325683594, "global_step": 167787, "epoch": 1386} {"train_loss": -38.98020553588867, "global_step": 167788, "epoch": 1386} {"train_loss": -34.86823272705078, "global_step": 167789, "epoch": 1386} {"train_loss": -38.9642333984375, "global_step": 167790, "epoch": 1386} {"train_loss": -35.43156814575195, "global_step": 167791, "epoch": 1386} {"train_loss": -37.25035095214844, "global_step": 167792, "epoch": 1386} {"train_loss": -38.51117706298828, "global_step": 167793, "epoch": 1386} {"train_loss": -37.34894943237305, "global_step": 167794, "epoch": 1386} {"train_loss": -38.889801025390625, "global_step": 167795, "epoch": 1386} {"train_loss": -36.91498565673828, "global_step": 167796, "epoch": 1386} {"train_loss": -38.43403244018555, "global_step": 167797, "epoch": 1386} {"train_loss": -38.260536193847656, "global_step": 167798, "epoch": 1386} {"train_loss": -37.83797836303711, "global_step": 167799, "epoch": 1386} {"train_loss": -38.27717971801758, "global_step": 167800, "epoch": 1386} {"train_loss": -38.7828483581543, "global_step": 167801, "epoch": 1386} {"train_loss": -37.229652404785156, "global_step": 167802, "epoch": 1386} {"train_loss": -38.73991775512695, "global_step": 167803, "epoch": 1386} {"train_loss": -39.4074821472168, "global_step": 167804, "epoch": 1386} {"train_loss": -38.580318450927734, "global_step": 167805, "epoch": 1386} {"train_loss": -38.939613342285156, "global_step": 167806, "epoch": 1386} {"train_loss": -39.463191986083984, "global_step": 167807, "epoch": 1386} {"train_loss": -39.410152435302734, "global_step": 167808, "epoch": 1386} {"train_loss": -38.42681884765625, "global_step": 167809, "epoch": 1386} {"train_loss": -39.62604904174805, "global_step": 167810, "epoch": 1386} {"train_loss": -38.592899322509766, "global_step": 167811, "epoch": 1386} {"train_loss": -38.81754684448242, "global_step": 167812, "epoch": 1386} {"train_loss": -39.26373291015625, "global_step": 167813, "epoch": 1386} {"train_loss": -39.26314926147461, "global_step": 167814, "epoch": 1386} {"train_loss": -39.32794189453125, "global_step": 167815, "epoch": 1386} {"train_loss": -40.19789123535156, "global_step": 167816, "epoch": 1386} {"train_loss": -38.42161178588867, "global_step": 167817, "epoch": 1386} {"train_loss": -39.945674896240234, "global_step": 167818, "epoch": 1386} {"train_loss": -39.128936767578125, "global_step": 167819, "epoch": 1386} {"train_loss": -40.06062698364258, "global_step": 167820, "epoch": 1386} {"train_loss": -39.79865646362305, "global_step": 167821, "epoch": 1386} {"train_loss": -40.08184814453125, "global_step": 167822, "epoch": 1386} {"train_loss": -40.16122055053711, "global_step": 167823, "epoch": 1386} {"train_loss": -40.23796844482422, "global_step": 167824, "epoch": 1386} {"train_loss": -39.70954513549805, "global_step": 167825, "epoch": 1386} {"train_loss": -38.97276218666518, "global_step": 167826, "epoch": 1386, "val_loss": 2604956.25} {"train_loss": -40.1168327331543, "global_step": 167827, "epoch": 1387} {"train_loss": -40.4916877746582, "global_step": 167828, "epoch": 1387} {"train_loss": -39.95923614501953, "global_step": 167829, "epoch": 1387} {"train_loss": -39.868751525878906, "global_step": 167830, "epoch": 1387} {"train_loss": -40.15853500366211, "global_step": 167831, "epoch": 1387} {"train_loss": -40.13299560546875, "global_step": 167832, "epoch": 1387} {"train_loss": -40.257057189941406, "global_step": 167833, "epoch": 1387} {"train_loss": -40.508575439453125, "global_step": 167834, "epoch": 1387} {"train_loss": -40.116397857666016, "global_step": 167835, "epoch": 1387} {"train_loss": -40.66189193725586, "global_step": 167836, "epoch": 1387} {"train_loss": -40.08661651611328, "global_step": 167837, "epoch": 1387} {"train_loss": -40.901729583740234, "global_step": 167838, "epoch": 1387} {"train_loss": -40.7780876159668, "global_step": 167839, "epoch": 1387} {"train_loss": -39.808589935302734, "global_step": 167840, "epoch": 1387} {"train_loss": -40.96509552001953, "global_step": 167841, "epoch": 1387} {"train_loss": -40.8153190612793, "global_step": 167842, "epoch": 1387} {"train_loss": -40.974300384521484, "global_step": 167843, "epoch": 1387} {"train_loss": -37.97968673706055, "global_step": 167844, "epoch": 1387} {"train_loss": -40.40892791748047, "global_step": 167845, "epoch": 1387} {"train_loss": -40.63296127319336, "global_step": 167846, "epoch": 1387} {"train_loss": -33.28603744506836, "global_step": 167847, "epoch": 1387} {"train_loss": -38.91614532470703, "global_step": 167848, "epoch": 1387} {"train_loss": -38.90149688720703, "global_step": 167849, "epoch": 1387} {"train_loss": -39.62386703491211, "global_step": 167850, "epoch": 1387} {"train_loss": -40.72314453125, "global_step": 167851, "epoch": 1387} {"train_loss": -39.88557815551758, "global_step": 167852, "epoch": 1387} {"train_loss": -39.660274505615234, "global_step": 167853, "epoch": 1387} {"train_loss": -40.501014709472656, "global_step": 167854, "epoch": 1387} {"train_loss": -40.226173400878906, "global_step": 167855, "epoch": 1387} {"train_loss": -40.53753662109375, "global_step": 167856, "epoch": 1387} {"train_loss": -40.12651824951172, "global_step": 167857, "epoch": 1387} {"train_loss": -35.90478515625, "global_step": 167858, "epoch": 1387} {"train_loss": -38.614013671875, "global_step": 167859, "epoch": 1387} {"train_loss": -39.424007415771484, "global_step": 167860, "epoch": 1387} {"train_loss": -39.906333923339844, "global_step": 167861, "epoch": 1387} {"train_loss": -39.17351150512695, "global_step": 167862, "epoch": 1387} {"train_loss": -38.894371032714844, "global_step": 167863, "epoch": 1387} {"train_loss": -40.637733459472656, "global_step": 167864, "epoch": 1387} {"train_loss": -40.002201080322266, "global_step": 167865, "epoch": 1387} {"train_loss": -39.17555618286133, "global_step": 167866, "epoch": 1387} {"train_loss": -38.798980712890625, "global_step": 167867, "epoch": 1387} {"train_loss": -37.771732330322266, "global_step": 167868, "epoch": 1387} {"train_loss": -38.94913864135742, "global_step": 167869, "epoch": 1387} {"train_loss": -39.67267608642578, "global_step": 167870, "epoch": 1387} {"train_loss": -37.38317108154297, "global_step": 167871, "epoch": 1387} {"train_loss": -38.16508102416992, "global_step": 167872, "epoch": 1387} {"train_loss": -38.5432243347168, "global_step": 167873, "epoch": 1387} {"train_loss": -40.576927185058594, "global_step": 167874, "epoch": 1387} {"train_loss": -39.556182861328125, "global_step": 167875, "epoch": 1387} {"train_loss": -36.28046417236328, "global_step": 167876, "epoch": 1387} {"train_loss": -38.33182907104492, "global_step": 167877, "epoch": 1387} {"train_loss": -37.45878219604492, "global_step": 167878, "epoch": 1387} {"train_loss": -37.18429183959961, "global_step": 167879, "epoch": 1387} {"train_loss": -38.584781646728516, "global_step": 167880, "epoch": 1387} {"train_loss": -36.74209213256836, "global_step": 167881, "epoch": 1387} {"train_loss": -37.49003219604492, "global_step": 167882, "epoch": 1387} {"train_loss": -36.963226318359375, "global_step": 167883, "epoch": 1387} {"train_loss": -37.438899993896484, "global_step": 167884, "epoch": 1387} {"train_loss": -35.94443893432617, "global_step": 167885, "epoch": 1387} {"train_loss": -37.66679763793945, "global_step": 167886, "epoch": 1387} {"train_loss": -35.03544235229492, "global_step": 167887, "epoch": 1387} {"train_loss": -38.20854568481445, "global_step": 167888, "epoch": 1387} {"train_loss": -37.317604064941406, "global_step": 167889, "epoch": 1387} {"train_loss": -38.85859298706055, "global_step": 167890, "epoch": 1387} {"train_loss": -36.084041595458984, "global_step": 167891, "epoch": 1387} {"train_loss": -35.25522994995117, "global_step": 167892, "epoch": 1387} {"train_loss": -38.7081413269043, "global_step": 167893, "epoch": 1387} {"train_loss": -39.440589904785156, "global_step": 167894, "epoch": 1387} {"train_loss": -37.11591720581055, "global_step": 167895, "epoch": 1387} {"train_loss": -36.01578140258789, "global_step": 167896, "epoch": 1387} {"train_loss": -36.658809661865234, "global_step": 167897, "epoch": 1387} {"train_loss": -34.15736770629883, "global_step": 167898, "epoch": 1387} {"train_loss": -38.99092483520508, "global_step": 167899, "epoch": 1387} {"train_loss": -37.49428939819336, "global_step": 167900, "epoch": 1387} {"train_loss": -38.48379135131836, "global_step": 167901, "epoch": 1387} {"train_loss": -36.618831634521484, "global_step": 167902, "epoch": 1387} {"train_loss": -38.29580307006836, "global_step": 167903, "epoch": 1387} {"train_loss": -37.65955352783203, "global_step": 167904, "epoch": 1387} {"train_loss": -38.70960998535156, "global_step": 167905, "epoch": 1387} {"train_loss": -39.216949462890625, "global_step": 167906, "epoch": 1387} {"train_loss": -38.25449752807617, "global_step": 167907, "epoch": 1387} {"train_loss": -38.36732864379883, "global_step": 167908, "epoch": 1387} {"train_loss": -37.819583892822266, "global_step": 167909, "epoch": 1387} {"train_loss": -39.33681106567383, "global_step": 167910, "epoch": 1387} {"train_loss": -38.488948822021484, "global_step": 167911, "epoch": 1387} {"train_loss": -36.37593460083008, "global_step": 167912, "epoch": 1387} {"train_loss": -38.386085510253906, "global_step": 167913, "epoch": 1387} {"train_loss": -38.15951919555664, "global_step": 167914, "epoch": 1387} {"train_loss": -38.897377014160156, "global_step": 167915, "epoch": 1387} {"train_loss": -37.45740509033203, "global_step": 167916, "epoch": 1387} {"train_loss": -38.96140670776367, "global_step": 167917, "epoch": 1387} {"train_loss": -39.49943542480469, "global_step": 167918, "epoch": 1387} {"train_loss": -38.73586654663086, "global_step": 167919, "epoch": 1387} {"train_loss": -39.174591064453125, "global_step": 167920, "epoch": 1387} {"train_loss": -39.31184768676758, "global_step": 167921, "epoch": 1387} {"train_loss": -39.28586959838867, "global_step": 167922, "epoch": 1387} {"train_loss": -39.24709701538086, "global_step": 167923, "epoch": 1387} {"train_loss": -39.0064811706543, "global_step": 167924, "epoch": 1387} {"train_loss": -37.41180419921875, "global_step": 167925, "epoch": 1387} {"train_loss": -39.62577438354492, "global_step": 167926, "epoch": 1387} {"train_loss": -39.32866287231445, "global_step": 167927, "epoch": 1387} {"train_loss": -40.071250915527344, "global_step": 167928, "epoch": 1387} {"train_loss": -39.6152458190918, "global_step": 167929, "epoch": 1387} {"train_loss": -39.35764694213867, "global_step": 167930, "epoch": 1387} {"train_loss": -39.740779876708984, "global_step": 167931, "epoch": 1387} {"train_loss": -38.55734634399414, "global_step": 167932, "epoch": 1387} {"train_loss": -38.702911376953125, "global_step": 167933, "epoch": 1387} {"train_loss": -38.91612243652344, "global_step": 167934, "epoch": 1387} {"train_loss": -38.77449417114258, "global_step": 167935, "epoch": 1387} {"train_loss": -39.76152420043945, "global_step": 167936, "epoch": 1387} {"train_loss": -37.65139389038086, "global_step": 167937, "epoch": 1387} {"train_loss": -39.17060470581055, "global_step": 167938, "epoch": 1387} {"train_loss": -39.42802047729492, "global_step": 167939, "epoch": 1387} {"train_loss": -39.00640869140625, "global_step": 167940, "epoch": 1387} {"train_loss": -39.41815948486328, "global_step": 167941, "epoch": 1387} {"train_loss": -39.63288497924805, "global_step": 167942, "epoch": 1387} {"train_loss": -39.99618148803711, "global_step": 167943, "epoch": 1387} {"train_loss": -37.48615264892578, "global_step": 167944, "epoch": 1387} {"train_loss": -39.907955169677734, "global_step": 167945, "epoch": 1387} {"train_loss": -39.494991302490234, "global_step": 167946, "epoch": 1387} {"train_loss": -38.78060998207282, "global_step": 167947, "epoch": 1387, "val_loss": 2724574.0} {"train_loss": -39.37546920776367, "global_step": 167948, "epoch": 1388} {"train_loss": -39.598793029785156, "global_step": 167949, "epoch": 1388} {"train_loss": -39.14712142944336, "global_step": 167950, "epoch": 1388} {"train_loss": -39.44733428955078, "global_step": 167951, "epoch": 1388} {"train_loss": -39.085426330566406, "global_step": 167952, "epoch": 1388} {"train_loss": -39.4320182800293, "global_step": 167953, "epoch": 1388} {"train_loss": -38.620033264160156, "global_step": 167954, "epoch": 1388} {"train_loss": -39.33436965942383, "global_step": 167955, "epoch": 1388} {"train_loss": -39.67321014404297, "global_step": 167956, "epoch": 1388} {"train_loss": -39.1417121887207, "global_step": 167957, "epoch": 1388} {"train_loss": -38.62372970581055, "global_step": 167958, "epoch": 1388} {"train_loss": -39.73091506958008, "global_step": 167959, "epoch": 1388} {"train_loss": -39.86759948730469, "global_step": 167960, "epoch": 1388} {"train_loss": -39.38454055786133, "global_step": 167961, "epoch": 1388} {"train_loss": -39.47998809814453, "global_step": 167962, "epoch": 1388} {"train_loss": -39.96938705444336, "global_step": 167963, "epoch": 1388} {"train_loss": -39.266910552978516, "global_step": 167964, "epoch": 1388} {"train_loss": -38.795650482177734, "global_step": 167965, "epoch": 1388} {"train_loss": -40.08134841918945, "global_step": 167966, "epoch": 1388} {"train_loss": -40.309993743896484, "global_step": 167967, "epoch": 1388} {"train_loss": -39.631507873535156, "global_step": 167968, "epoch": 1388} {"train_loss": -40.67634201049805, "global_step": 167969, "epoch": 1388} {"train_loss": -39.67292404174805, "global_step": 167970, "epoch": 1388} {"train_loss": -40.23447799682617, "global_step": 167971, "epoch": 1388} {"train_loss": -39.81610870361328, "global_step": 167972, "epoch": 1388} {"train_loss": -39.7814826965332, "global_step": 167973, "epoch": 1388} {"train_loss": -40.46516799926758, "global_step": 167974, "epoch": 1388} {"train_loss": -40.44829177856445, "global_step": 167975, "epoch": 1388} {"train_loss": -38.55134201049805, "global_step": 167976, "epoch": 1388} {"train_loss": -40.30792999267578, "global_step": 167977, "epoch": 1388} {"train_loss": -39.385597229003906, "global_step": 167978, "epoch": 1388} {"train_loss": -40.070526123046875, "global_step": 167979, "epoch": 1388} {"train_loss": -40.343841552734375, "global_step": 167980, "epoch": 1388} {"train_loss": -39.915218353271484, "global_step": 167981, "epoch": 1388} {"train_loss": -40.52256774902344, "global_step": 167982, "epoch": 1388} {"train_loss": -39.6088981628418, "global_step": 167983, "epoch": 1388} {"train_loss": -39.76578903198242, "global_step": 167984, "epoch": 1388} {"train_loss": -38.66638946533203, "global_step": 167985, "epoch": 1388} {"train_loss": -38.62421417236328, "global_step": 167986, "epoch": 1388} {"train_loss": -40.00041961669922, "global_step": 167987, "epoch": 1388} {"train_loss": -40.642147064208984, "global_step": 167988, "epoch": 1388} {"train_loss": -39.74407958984375, "global_step": 167989, "epoch": 1388} {"train_loss": -38.8214225769043, "global_step": 167990, "epoch": 1388} {"train_loss": -36.848445892333984, "global_step": 167991, "epoch": 1388} {"train_loss": -36.55196762084961, "global_step": 167992, "epoch": 1388} {"train_loss": -40.25942611694336, "global_step": 167993, "epoch": 1388} {"train_loss": -37.647308349609375, "global_step": 167994, "epoch": 1388} {"train_loss": -32.5930290222168, "global_step": 167995, "epoch": 1388} {"train_loss": -36.197872161865234, "global_step": 167996, "epoch": 1388} {"train_loss": -39.60694122314453, "global_step": 167997, "epoch": 1388} {"train_loss": -35.185604095458984, "global_step": 167998, "epoch": 1388} {"train_loss": -35.5026969909668, "global_step": 167999, "epoch": 1388} {"train_loss": -39.621089935302734, "global_step": 168000, "epoch": 1388} {"train_loss": -37.02618408203125, "global_step": 168001, "epoch": 1388} {"train_loss": -37.0271110534668, "global_step": 168002, "epoch": 1388} {"train_loss": -38.7968635559082, "global_step": 168003, "epoch": 1388} {"train_loss": -35.54420852661133, "global_step": 168004, "epoch": 1388} {"train_loss": -38.997371673583984, "global_step": 168005, "epoch": 1388} {"train_loss": -39.124942779541016, "global_step": 168006, "epoch": 1388} {"train_loss": -38.01617431640625, "global_step": 168007, "epoch": 1388} {"train_loss": -40.47100067138672, "global_step": 168008, "epoch": 1388} {"train_loss": -37.65606689453125, "global_step": 168009, "epoch": 1388} {"train_loss": -40.196510314941406, "global_step": 168010, "epoch": 1388} {"train_loss": -38.14521026611328, "global_step": 168011, "epoch": 1388} {"train_loss": -38.82364273071289, "global_step": 168012, "epoch": 1388} {"train_loss": -37.60234832763672, "global_step": 168013, "epoch": 1388} {"train_loss": -39.959136962890625, "global_step": 168014, "epoch": 1388} {"train_loss": -38.63292694091797, "global_step": 168015, "epoch": 1388} {"train_loss": -39.713287353515625, "global_step": 168016, "epoch": 1388} {"train_loss": -38.776832580566406, "global_step": 168017, "epoch": 1388} {"train_loss": -40.63352584838867, "global_step": 168018, "epoch": 1388} {"train_loss": -38.63838577270508, "global_step": 168019, "epoch": 1388} {"train_loss": -39.45796585083008, "global_step": 168020, "epoch": 1388} {"train_loss": -38.25209426879883, "global_step": 168021, "epoch": 1388} {"train_loss": -40.227989196777344, "global_step": 168022, "epoch": 1388} {"train_loss": -39.7719841003418, "global_step": 168023, "epoch": 1388} {"train_loss": -40.25874710083008, "global_step": 168024, "epoch": 1388} {"train_loss": -39.60095977783203, "global_step": 168025, "epoch": 1388} {"train_loss": -40.211544036865234, "global_step": 168026, "epoch": 1388} {"train_loss": -39.95260238647461, "global_step": 168027, "epoch": 1388} {"train_loss": -40.288307189941406, "global_step": 168028, "epoch": 1388} {"train_loss": -40.55054473876953, "global_step": 168029, "epoch": 1388} {"train_loss": -39.981319427490234, "global_step": 168030, "epoch": 1388} {"train_loss": -40.40895080566406, "global_step": 168031, "epoch": 1388} {"train_loss": -40.51081085205078, "global_step": 168032, "epoch": 1388} {"train_loss": -40.44008255004883, "global_step": 168033, "epoch": 1388} {"train_loss": -40.59482192993164, "global_step": 168034, "epoch": 1388} {"train_loss": -40.72057342529297, "global_step": 168035, "epoch": 1388} {"train_loss": -39.23073196411133, "global_step": 168036, "epoch": 1388} {"train_loss": -40.64813232421875, "global_step": 168037, "epoch": 1388} {"train_loss": -40.65229034423828, "global_step": 168038, "epoch": 1388} {"train_loss": -39.53049850463867, "global_step": 168039, "epoch": 1388} {"train_loss": -40.811744689941406, "global_step": 168040, "epoch": 1388} {"train_loss": -41.01176834106445, "global_step": 168041, "epoch": 1388} {"train_loss": -40.44415283203125, "global_step": 168042, "epoch": 1388} {"train_loss": -40.129581451416016, "global_step": 168043, "epoch": 1388} {"train_loss": -41.061256408691406, "global_step": 168044, "epoch": 1388} {"train_loss": -40.558067321777344, "global_step": 168045, "epoch": 1388} {"train_loss": -40.46300506591797, "global_step": 168046, "epoch": 1388} {"train_loss": -40.76191711425781, "global_step": 168047, "epoch": 1388} {"train_loss": -40.16495895385742, "global_step": 168048, "epoch": 1388} {"train_loss": -40.64826583862305, "global_step": 168049, "epoch": 1388} {"train_loss": -40.28316879272461, "global_step": 168050, "epoch": 1388} {"train_loss": -41.35251235961914, "global_step": 168051, "epoch": 1388} {"train_loss": -40.34172439575195, "global_step": 168052, "epoch": 1388} {"train_loss": -41.1303825378418, "global_step": 168053, "epoch": 1388} {"train_loss": -39.901187896728516, "global_step": 168054, "epoch": 1388} {"train_loss": -40.17544174194336, "global_step": 168055, "epoch": 1388} {"train_loss": -40.64303970336914, "global_step": 168056, "epoch": 1388} {"train_loss": -40.23105239868164, "global_step": 168057, "epoch": 1388} {"train_loss": -40.983394622802734, "global_step": 168058, "epoch": 1388} {"train_loss": -38.871421813964844, "global_step": 168059, "epoch": 1388} {"train_loss": -39.26947021484375, "global_step": 168060, "epoch": 1388} {"train_loss": -39.51921463012695, "global_step": 168061, "epoch": 1388} {"train_loss": -40.67829132080078, "global_step": 168062, "epoch": 1388} {"train_loss": -39.79441452026367, "global_step": 168063, "epoch": 1388} {"train_loss": -41.09431838989258, "global_step": 168064, "epoch": 1388} {"train_loss": -37.81770324707031, "global_step": 168065, "epoch": 1388} {"train_loss": -40.78867721557617, "global_step": 168066, "epoch": 1388} {"train_loss": -37.31562042236328, "global_step": 168067, "epoch": 1388} {"train_loss": -39.46739493125726, "global_step": 168068, "epoch": 1388, "val_loss": 2608102.75} {"train_loss": -39.28695297241211, "global_step": 168069, "epoch": 1389} {"train_loss": -40.12128829956055, "global_step": 168070, "epoch": 1389} {"train_loss": -36.64780807495117, "global_step": 168071, "epoch": 1389} {"train_loss": -38.10587692260742, "global_step": 168072, "epoch": 1389} {"train_loss": -39.660003662109375, "global_step": 168073, "epoch": 1389} {"train_loss": -36.95222854614258, "global_step": 168074, "epoch": 1389} {"train_loss": -40.45350646972656, "global_step": 168075, "epoch": 1389} {"train_loss": -38.770530700683594, "global_step": 168076, "epoch": 1389} {"train_loss": -39.1916389465332, "global_step": 168077, "epoch": 1389} {"train_loss": -39.64622116088867, "global_step": 168078, "epoch": 1389} {"train_loss": -38.69782257080078, "global_step": 168079, "epoch": 1389} {"train_loss": -39.296504974365234, "global_step": 168080, "epoch": 1389} {"train_loss": -39.34664535522461, "global_step": 168081, "epoch": 1389} {"train_loss": -39.63059616088867, "global_step": 168082, "epoch": 1389} {"train_loss": -39.83230209350586, "global_step": 168083, "epoch": 1389} {"train_loss": -40.4636344909668, "global_step": 168084, "epoch": 1389} {"train_loss": -39.91959762573242, "global_step": 168085, "epoch": 1389} {"train_loss": -40.14921951293945, "global_step": 168086, "epoch": 1389} {"train_loss": -39.693382263183594, "global_step": 168087, "epoch": 1389} {"train_loss": -39.16170883178711, "global_step": 168088, "epoch": 1389} {"train_loss": -40.27084732055664, "global_step": 168089, "epoch": 1389} {"train_loss": -40.10519027709961, "global_step": 168090, "epoch": 1389} {"train_loss": -36.373268127441406, "global_step": 168091, "epoch": 1389} {"train_loss": -39.12801742553711, "global_step": 168092, "epoch": 1389} {"train_loss": -40.24868392944336, "global_step": 168093, "epoch": 1389} {"train_loss": -40.0990104675293, "global_step": 168094, "epoch": 1389} {"train_loss": -40.20781707763672, "global_step": 168095, "epoch": 1389} {"train_loss": -40.61180114746094, "global_step": 168096, "epoch": 1389} {"train_loss": -40.555416107177734, "global_step": 168097, "epoch": 1389} {"train_loss": -38.287410736083984, "global_step": 168098, "epoch": 1389} {"train_loss": -40.487640380859375, "global_step": 168099, "epoch": 1389} {"train_loss": -40.1580696105957, "global_step": 168100, "epoch": 1389} {"train_loss": -40.08977127075195, "global_step": 168101, "epoch": 1389} {"train_loss": -39.836055755615234, "global_step": 168102, "epoch": 1389} {"train_loss": -40.25364303588867, "global_step": 168103, "epoch": 1389} {"train_loss": -40.93113708496094, "global_step": 168104, "epoch": 1389} {"train_loss": -38.951351165771484, "global_step": 168105, "epoch": 1389} {"train_loss": -39.666831970214844, "global_step": 168106, "epoch": 1389} {"train_loss": -40.531982421875, "global_step": 168107, "epoch": 1389} {"train_loss": -40.066585540771484, "global_step": 168108, "epoch": 1389} {"train_loss": -39.645721435546875, "global_step": 168109, "epoch": 1389} {"train_loss": -38.8515625, "global_step": 168110, "epoch": 1389} {"train_loss": -39.94696807861328, "global_step": 168111, "epoch": 1389} {"train_loss": -39.51520538330078, "global_step": 168112, "epoch": 1389} {"train_loss": -39.21278762817383, "global_step": 168113, "epoch": 1389} {"train_loss": -40.79939651489258, "global_step": 168114, "epoch": 1389} {"train_loss": -40.57680130004883, "global_step": 168115, "epoch": 1389} {"train_loss": -41.303409576416016, "global_step": 168116, "epoch": 1389} {"train_loss": -41.09029006958008, "global_step": 168117, "epoch": 1389} {"train_loss": -39.71718215942383, "global_step": 168118, "epoch": 1389} {"train_loss": -40.33829879760742, "global_step": 168119, "epoch": 1389} {"train_loss": -39.94166946411133, "global_step": 168120, "epoch": 1389} {"train_loss": -40.80768585205078, "global_step": 168121, "epoch": 1389} {"train_loss": -40.4089469909668, "global_step": 168122, "epoch": 1389} {"train_loss": -38.7033805847168, "global_step": 168123, "epoch": 1389} {"train_loss": -36.13954162597656, "global_step": 168124, "epoch": 1389} {"train_loss": -37.49020004272461, "global_step": 168125, "epoch": 1389} {"train_loss": -36.3901252746582, "global_step": 168126, "epoch": 1389} {"train_loss": -39.64952087402344, "global_step": 168127, "epoch": 1389} {"train_loss": -38.5753173828125, "global_step": 168128, "epoch": 1389} {"train_loss": -40.29701614379883, "global_step": 168129, "epoch": 1389} {"train_loss": -39.85696792602539, "global_step": 168130, "epoch": 1389} {"train_loss": -39.573280334472656, "global_step": 168131, "epoch": 1389} {"train_loss": -39.58169937133789, "global_step": 168132, "epoch": 1389} {"train_loss": -37.1548957824707, "global_step": 168133, "epoch": 1389} {"train_loss": -37.89413070678711, "global_step": 168134, "epoch": 1389} {"train_loss": -38.664608001708984, "global_step": 168135, "epoch": 1389} {"train_loss": -37.161224365234375, "global_step": 168136, "epoch": 1389} {"train_loss": -36.831207275390625, "global_step": 168137, "epoch": 1389} {"train_loss": -40.924530029296875, "global_step": 168138, "epoch": 1389} {"train_loss": -39.86418914794922, "global_step": 168139, "epoch": 1389} {"train_loss": -39.18875503540039, "global_step": 168140, "epoch": 1389} {"train_loss": -40.03512954711914, "global_step": 168141, "epoch": 1389} {"train_loss": -40.03330612182617, "global_step": 168142, "epoch": 1389} {"train_loss": -40.56763458251953, "global_step": 168143, "epoch": 1389} {"train_loss": -39.89656066894531, "global_step": 168144, "epoch": 1389} {"train_loss": -40.06220245361328, "global_step": 168145, "epoch": 1389} {"train_loss": -39.66105270385742, "global_step": 168146, "epoch": 1389} {"train_loss": -38.21565628051758, "global_step": 168147, "epoch": 1389} {"train_loss": -40.33869552612305, "global_step": 168148, "epoch": 1389} {"train_loss": -40.49908447265625, "global_step": 168149, "epoch": 1389} {"train_loss": -39.53617858886719, "global_step": 168150, "epoch": 1389} {"train_loss": -38.619911193847656, "global_step": 168151, "epoch": 1389} {"train_loss": -39.86921310424805, "global_step": 168152, "epoch": 1389} {"train_loss": -38.25983428955078, "global_step": 168153, "epoch": 1389} {"train_loss": -39.666046142578125, "global_step": 168154, "epoch": 1389} {"train_loss": -39.96260452270508, "global_step": 168155, "epoch": 1389} {"train_loss": -40.56234359741211, "global_step": 168156, "epoch": 1389} {"train_loss": -40.09596252441406, "global_step": 168157, "epoch": 1389} {"train_loss": -40.52164077758789, "global_step": 168158, "epoch": 1389} {"train_loss": -41.0467643737793, "global_step": 168159, "epoch": 1389} {"train_loss": -39.67189407348633, "global_step": 168160, "epoch": 1389} {"train_loss": -38.5760498046875, "global_step": 168161, "epoch": 1389} {"train_loss": -40.42504119873047, "global_step": 168162, "epoch": 1389} {"train_loss": -40.064430236816406, "global_step": 168163, "epoch": 1389} {"train_loss": -41.07467269897461, "global_step": 168164, "epoch": 1389} {"train_loss": -38.245243072509766, "global_step": 168165, "epoch": 1389} {"train_loss": -40.858970642089844, "global_step": 168166, "epoch": 1389} {"train_loss": -40.555110931396484, "global_step": 168167, "epoch": 1389} {"train_loss": -37.890892028808594, "global_step": 168168, "epoch": 1389} {"train_loss": -39.1329460144043, "global_step": 168169, "epoch": 1389} {"train_loss": -40.454368591308594, "global_step": 168170, "epoch": 1389} {"train_loss": -40.52216720581055, "global_step": 168171, "epoch": 1389} {"train_loss": -39.265541076660156, "global_step": 168172, "epoch": 1389} {"train_loss": -40.77627182006836, "global_step": 168173, "epoch": 1389} {"train_loss": -40.375404357910156, "global_step": 168174, "epoch": 1389} {"train_loss": -41.28691864013672, "global_step": 168175, "epoch": 1389} {"train_loss": -41.195762634277344, "global_step": 168176, "epoch": 1389} {"train_loss": -41.085636138916016, "global_step": 168177, "epoch": 1389} {"train_loss": -40.9171257019043, "global_step": 168178, "epoch": 1389} {"train_loss": -40.50119400024414, "global_step": 168179, "epoch": 1389} {"train_loss": -39.420040130615234, "global_step": 168180, "epoch": 1389} {"train_loss": -40.09735870361328, "global_step": 168181, "epoch": 1389} {"train_loss": -39.52033615112305, "global_step": 168182, "epoch": 1389} {"train_loss": -40.42573165893555, "global_step": 168183, "epoch": 1389} {"train_loss": -40.374202728271484, "global_step": 168184, "epoch": 1389} {"train_loss": -40.011714935302734, "global_step": 168185, "epoch": 1389} {"train_loss": -38.35575485229492, "global_step": 168186, "epoch": 1389} {"train_loss": -40.72136306762695, "global_step": 168187, "epoch": 1389} {"train_loss": -40.6384391784668, "global_step": 168188, "epoch": 1389} {"train_loss": -39.65543315036238, "global_step": 168189, "epoch": 1389, "val_loss": 2655825.75} {"train_loss": -39.76192855834961, "global_step": 168190, "epoch": 1390} {"train_loss": -40.37218475341797, "global_step": 168191, "epoch": 1390} {"train_loss": -39.27241516113281, "global_step": 168192, "epoch": 1390} {"train_loss": -40.8323974609375, "global_step": 168193, "epoch": 1390} {"train_loss": -40.22380065917969, "global_step": 168194, "epoch": 1390} {"train_loss": -41.045249938964844, "global_step": 168195, "epoch": 1390} {"train_loss": -39.78451156616211, "global_step": 168196, "epoch": 1390} {"train_loss": -37.81501007080078, "global_step": 168197, "epoch": 1390} {"train_loss": -40.44194793701172, "global_step": 168198, "epoch": 1390} {"train_loss": -40.38582229614258, "global_step": 168199, "epoch": 1390} {"train_loss": -38.43817138671875, "global_step": 168200, "epoch": 1390} {"train_loss": -38.57159423828125, "global_step": 168201, "epoch": 1390} {"train_loss": -40.37336349487305, "global_step": 168202, "epoch": 1390} {"train_loss": -39.402061462402344, "global_step": 168203, "epoch": 1390} {"train_loss": -40.10282516479492, "global_step": 168204, "epoch": 1390} {"train_loss": -40.7943000793457, "global_step": 168205, "epoch": 1390} {"train_loss": -40.332515716552734, "global_step": 168206, "epoch": 1390} {"train_loss": -38.299903869628906, "global_step": 168207, "epoch": 1390} {"train_loss": -37.69854736328125, "global_step": 168208, "epoch": 1390} {"train_loss": -38.70677947998047, "global_step": 168209, "epoch": 1390} {"train_loss": -39.84540939331055, "global_step": 168210, "epoch": 1390} {"train_loss": -39.42374801635742, "global_step": 168211, "epoch": 1390} {"train_loss": -36.821285247802734, "global_step": 168212, "epoch": 1390} {"train_loss": -38.40046310424805, "global_step": 168213, "epoch": 1390} {"train_loss": -40.5989990234375, "global_step": 168214, "epoch": 1390} {"train_loss": -38.05537033081055, "global_step": 168215, "epoch": 1390} {"train_loss": -38.098934173583984, "global_step": 168216, "epoch": 1390} {"train_loss": -39.483211517333984, "global_step": 168217, "epoch": 1390} {"train_loss": -39.876983642578125, "global_step": 168218, "epoch": 1390} {"train_loss": -39.084388732910156, "global_step": 168219, "epoch": 1390} {"train_loss": -38.429134368896484, "global_step": 168220, "epoch": 1390} {"train_loss": -40.261531829833984, "global_step": 168221, "epoch": 1390} {"train_loss": -39.09370422363281, "global_step": 168222, "epoch": 1390} {"train_loss": -40.04313278198242, "global_step": 168223, "epoch": 1390} {"train_loss": -41.15044021606445, "global_step": 168224, "epoch": 1390} {"train_loss": -38.67634963989258, "global_step": 168225, "epoch": 1390} {"train_loss": -39.679012298583984, "global_step": 168226, "epoch": 1390} {"train_loss": -40.38508224487305, "global_step": 168227, "epoch": 1390} {"train_loss": -38.1519889831543, "global_step": 168228, "epoch": 1390} {"train_loss": -39.79708480834961, "global_step": 168229, "epoch": 1390} {"train_loss": -40.781551361083984, "global_step": 168230, "epoch": 1390} {"train_loss": -39.89786148071289, "global_step": 168231, "epoch": 1390} {"train_loss": -40.435760498046875, "global_step": 168232, "epoch": 1390} {"train_loss": -39.1341667175293, "global_step": 168233, "epoch": 1390} {"train_loss": -40.653709411621094, "global_step": 168234, "epoch": 1390} {"train_loss": -40.7909049987793, "global_step": 168235, "epoch": 1390} {"train_loss": -40.169334411621094, "global_step": 168236, "epoch": 1390} {"train_loss": -39.79402160644531, "global_step": 168237, "epoch": 1390} {"train_loss": -40.505210876464844, "global_step": 168238, "epoch": 1390} {"train_loss": -40.2923469543457, "global_step": 168239, "epoch": 1390} {"train_loss": -39.499671936035156, "global_step": 168240, "epoch": 1390} {"train_loss": -40.29499053955078, "global_step": 168241, "epoch": 1390} {"train_loss": -40.252166748046875, "global_step": 168242, "epoch": 1390} {"train_loss": -41.28703689575195, "global_step": 168243, "epoch": 1390} {"train_loss": -40.50414276123047, "global_step": 168244, "epoch": 1390} {"train_loss": -41.181495666503906, "global_step": 168245, "epoch": 1390} {"train_loss": -40.786048889160156, "global_step": 168246, "epoch": 1390} {"train_loss": -41.164241790771484, "global_step": 168247, "epoch": 1390} {"train_loss": -40.769317626953125, "global_step": 168248, "epoch": 1390} {"train_loss": -41.01887512207031, "global_step": 168249, "epoch": 1390} {"train_loss": -40.99016189575195, "global_step": 168250, "epoch": 1390} {"train_loss": -40.80157470703125, "global_step": 168251, "epoch": 1390} {"train_loss": -39.9923095703125, "global_step": 168252, "epoch": 1390} {"train_loss": -40.72841262817383, "global_step": 168253, "epoch": 1390} {"train_loss": -40.4623908996582, "global_step": 168254, "epoch": 1390} {"train_loss": -41.4926872253418, "global_step": 168255, "epoch": 1390} {"train_loss": -40.882408142089844, "global_step": 168256, "epoch": 1390} {"train_loss": -40.62063217163086, "global_step": 168257, "epoch": 1390} {"train_loss": -40.9422721862793, "global_step": 168258, "epoch": 1390} {"train_loss": -41.0391960144043, "global_step": 168259, "epoch": 1390} {"train_loss": -40.789886474609375, "global_step": 168260, "epoch": 1390} {"train_loss": -40.17194747924805, "global_step": 168261, "epoch": 1390} {"train_loss": -40.09790802001953, "global_step": 168262, "epoch": 1390} {"train_loss": -40.98568344116211, "global_step": 168263, "epoch": 1390} {"train_loss": -40.981956481933594, "global_step": 168264, "epoch": 1390} {"train_loss": -39.98176956176758, "global_step": 168265, "epoch": 1390} {"train_loss": -33.59153366088867, "global_step": 168266, "epoch": 1390} {"train_loss": -39.48618698120117, "global_step": 168267, "epoch": 1390} {"train_loss": -40.68197250366211, "global_step": 168268, "epoch": 1390} {"train_loss": -38.088470458984375, "global_step": 168269, "epoch": 1390} {"train_loss": -37.02898025512695, "global_step": 168270, "epoch": 1390} {"train_loss": -40.51972961425781, "global_step": 168271, "epoch": 1390} {"train_loss": -40.70514678955078, "global_step": 168272, "epoch": 1390} {"train_loss": -39.09199142456055, "global_step": 168273, "epoch": 1390} {"train_loss": -40.311824798583984, "global_step": 168274, "epoch": 1390} {"train_loss": -40.88856506347656, "global_step": 168275, "epoch": 1390} {"train_loss": -40.48347091674805, "global_step": 168276, "epoch": 1390} {"train_loss": -38.56842041015625, "global_step": 168277, "epoch": 1390} {"train_loss": -40.89663314819336, "global_step": 168278, "epoch": 1390} {"train_loss": -40.52001953125, "global_step": 168279, "epoch": 1390} {"train_loss": -40.37993240356445, "global_step": 168280, "epoch": 1390} {"train_loss": -41.064144134521484, "global_step": 168281, "epoch": 1390} {"train_loss": -40.950714111328125, "global_step": 168282, "epoch": 1390} {"train_loss": -40.834659576416016, "global_step": 168283, "epoch": 1390} {"train_loss": -39.21784591674805, "global_step": 168284, "epoch": 1390} {"train_loss": -41.127437591552734, "global_step": 168285, "epoch": 1390} {"train_loss": -41.14936828613281, "global_step": 168286, "epoch": 1390} {"train_loss": -40.337188720703125, "global_step": 168287, "epoch": 1390} {"train_loss": -40.60032272338867, "global_step": 168288, "epoch": 1390} {"train_loss": -39.631526947021484, "global_step": 168289, "epoch": 1390} {"train_loss": -41.203426361083984, "global_step": 168290, "epoch": 1390} {"train_loss": -39.052547454833984, "global_step": 168291, "epoch": 1390} {"train_loss": -40.33744430541992, "global_step": 168292, "epoch": 1390} {"train_loss": -40.612640380859375, "global_step": 168293, "epoch": 1390} {"train_loss": -40.36003494262695, "global_step": 168294, "epoch": 1390} {"train_loss": -39.60930633544922, "global_step": 168295, "epoch": 1390} {"train_loss": -40.54171371459961, "global_step": 168296, "epoch": 1390} {"train_loss": -36.41611099243164, "global_step": 168297, "epoch": 1390} {"train_loss": -39.84437942504883, "global_step": 168298, "epoch": 1390} {"train_loss": -39.5556755065918, "global_step": 168299, "epoch": 1390} {"train_loss": -40.92486572265625, "global_step": 168300, "epoch": 1390} {"train_loss": -39.96784591674805, "global_step": 168301, "epoch": 1390} {"train_loss": -40.96825408935547, "global_step": 168302, "epoch": 1390} {"train_loss": -38.90078353881836, "global_step": 168303, "epoch": 1390} {"train_loss": -40.616416931152344, "global_step": 168304, "epoch": 1390} {"train_loss": -40.000282287597656, "global_step": 168305, "epoch": 1390} {"train_loss": -40.91838836669922, "global_step": 168306, "epoch": 1390} {"train_loss": -40.21658706665039, "global_step": 168307, "epoch": 1390} {"train_loss": -39.773231506347656, "global_step": 168308, "epoch": 1390} {"train_loss": -41.19502639770508, "global_step": 168309, "epoch": 1390} {"train_loss": -39.97279846569723, "global_step": 168310, "epoch": 1390, "val_loss": 2744085.75} {"train_loss": -40.971946716308594, "global_step": 168311, "epoch": 1391} {"train_loss": -41.32612228393555, "global_step": 168312, "epoch": 1391} {"train_loss": -40.363277435302734, "global_step": 168313, "epoch": 1391} {"train_loss": -40.994239807128906, "global_step": 168314, "epoch": 1391} {"train_loss": -38.8145637512207, "global_step": 168315, "epoch": 1391} {"train_loss": -39.288124084472656, "global_step": 168316, "epoch": 1391} {"train_loss": -40.13247299194336, "global_step": 168317, "epoch": 1391} {"train_loss": -38.58834457397461, "global_step": 168318, "epoch": 1391} {"train_loss": -40.181671142578125, "global_step": 168319, "epoch": 1391} {"train_loss": -38.13357925415039, "global_step": 168320, "epoch": 1391} {"train_loss": -40.534156799316406, "global_step": 168321, "epoch": 1391} {"train_loss": -39.4050178527832, "global_step": 168322, "epoch": 1391} {"train_loss": -38.95803451538086, "global_step": 168323, "epoch": 1391} {"train_loss": -41.258758544921875, "global_step": 168324, "epoch": 1391} {"train_loss": -40.54362106323242, "global_step": 168325, "epoch": 1391} {"train_loss": -39.8096923828125, "global_step": 168326, "epoch": 1391} {"train_loss": -41.0274543762207, "global_step": 168327, "epoch": 1391} {"train_loss": -40.66407012939453, "global_step": 168328, "epoch": 1391} {"train_loss": -40.31949996948242, "global_step": 168329, "epoch": 1391} {"train_loss": -39.70649337768555, "global_step": 168330, "epoch": 1391} {"train_loss": -39.87788009643555, "global_step": 168331, "epoch": 1391} {"train_loss": -39.64085006713867, "global_step": 168332, "epoch": 1391} {"train_loss": -41.212364196777344, "global_step": 168333, "epoch": 1391} {"train_loss": -40.71251678466797, "global_step": 168334, "epoch": 1391} {"train_loss": -37.598079681396484, "global_step": 168335, "epoch": 1391} {"train_loss": -40.64753341674805, "global_step": 168336, "epoch": 1391} {"train_loss": -41.21155548095703, "global_step": 168337, "epoch": 1391} {"train_loss": -40.528839111328125, "global_step": 168338, "epoch": 1391} {"train_loss": -40.8901481628418, "global_step": 168339, "epoch": 1391} {"train_loss": -40.91978073120117, "global_step": 168340, "epoch": 1391} {"train_loss": -40.47015380859375, "global_step": 168341, "epoch": 1391} {"train_loss": -40.69302749633789, "global_step": 168342, "epoch": 1391} {"train_loss": -40.82114791870117, "global_step": 168343, "epoch": 1391} {"train_loss": -38.79682922363281, "global_step": 168344, "epoch": 1391} {"train_loss": -38.37343978881836, "global_step": 168345, "epoch": 1391} {"train_loss": -41.71675109863281, "global_step": 168346, "epoch": 1391} {"train_loss": -40.9179801940918, "global_step": 168347, "epoch": 1391} {"train_loss": -39.54730224609375, "global_step": 168348, "epoch": 1391} {"train_loss": -40.110633850097656, "global_step": 168349, "epoch": 1391} {"train_loss": -40.97675704956055, "global_step": 168350, "epoch": 1391} {"train_loss": -40.969573974609375, "global_step": 168351, "epoch": 1391} {"train_loss": -41.328216552734375, "global_step": 168352, "epoch": 1391} {"train_loss": -40.91450881958008, "global_step": 168353, "epoch": 1391} {"train_loss": -41.93598556518555, "global_step": 168354, "epoch": 1391} {"train_loss": -39.6404914855957, "global_step": 168355, "epoch": 1391} {"train_loss": -40.428138732910156, "global_step": 168356, "epoch": 1391} {"train_loss": -41.01836395263672, "global_step": 168357, "epoch": 1391} {"train_loss": -40.52775192260742, "global_step": 168358, "epoch": 1391} {"train_loss": -40.67429733276367, "global_step": 168359, "epoch": 1391} {"train_loss": -41.2319221496582, "global_step": 168360, "epoch": 1391} {"train_loss": -41.44660186767578, "global_step": 168361, "epoch": 1391} {"train_loss": -41.54962158203125, "global_step": 168362, "epoch": 1391} {"train_loss": -41.221405029296875, "global_step": 168363, "epoch": 1391} {"train_loss": -41.30415725708008, "global_step": 168364, "epoch": 1391} {"train_loss": -40.92533874511719, "global_step": 168365, "epoch": 1391} {"train_loss": -41.078914642333984, "global_step": 168366, "epoch": 1391} {"train_loss": -39.626564025878906, "global_step": 168367, "epoch": 1391} {"train_loss": -40.7318115234375, "global_step": 168368, "epoch": 1391} {"train_loss": -40.11796188354492, "global_step": 168369, "epoch": 1391} {"train_loss": -39.81965637207031, "global_step": 168370, "epoch": 1391} {"train_loss": -37.85437774658203, "global_step": 168371, "epoch": 1391} {"train_loss": -40.50542449951172, "global_step": 168372, "epoch": 1391} {"train_loss": -40.25033187866211, "global_step": 168373, "epoch": 1391} {"train_loss": -39.89254379272461, "global_step": 168374, "epoch": 1391} {"train_loss": -39.80842971801758, "global_step": 168375, "epoch": 1391} {"train_loss": -34.7850341796875, "global_step": 168376, "epoch": 1391} {"train_loss": -37.345550537109375, "global_step": 168377, "epoch": 1391} {"train_loss": -39.8167724609375, "global_step": 168378, "epoch": 1391} {"train_loss": -40.84477615356445, "global_step": 168379, "epoch": 1391} {"train_loss": -34.58102035522461, "global_step": 168380, "epoch": 1391} {"train_loss": -31.141098022460938, "global_step": 168381, "epoch": 1391} {"train_loss": -39.22989273071289, "global_step": 168382, "epoch": 1391} {"train_loss": -39.59217071533203, "global_step": 168383, "epoch": 1391} {"train_loss": -38.705322265625, "global_step": 168384, "epoch": 1391} {"train_loss": -39.018531799316406, "global_step": 168385, "epoch": 1391} {"train_loss": -38.04571533203125, "global_step": 168386, "epoch": 1391} {"train_loss": -38.38069534301758, "global_step": 168387, "epoch": 1391} {"train_loss": -38.454742431640625, "global_step": 168388, "epoch": 1391} {"train_loss": -26.77332878112793, "global_step": 168389, "epoch": 1391} {"train_loss": -34.82532501220703, "global_step": 168390, "epoch": 1391} {"train_loss": -32.24390411376953, "global_step": 168391, "epoch": 1391} {"train_loss": -31.7213191986084, "global_step": 168392, "epoch": 1391} {"train_loss": -35.56584548950195, "global_step": 168393, "epoch": 1391} {"train_loss": -4.126758575439453, "global_step": 168394, "epoch": 1391} {"train_loss": -29.194692611694336, "global_step": 168395, "epoch": 1391} {"train_loss": -25.0139217376709, "global_step": 168396, "epoch": 1391} {"train_loss": -33.36809158325195, "global_step": 168397, "epoch": 1391} {"train_loss": -24.39872169494629, "global_step": 168398, "epoch": 1391} {"train_loss": -31.140256881713867, "global_step": 168399, "epoch": 1391} {"train_loss": -26.423282623291016, "global_step": 168400, "epoch": 1391} {"train_loss": -27.9331111907959, "global_step": 168401, "epoch": 1391} {"train_loss": -34.17075729370117, "global_step": 168402, "epoch": 1391} {"train_loss": -29.4891300201416, "global_step": 168403, "epoch": 1391} {"train_loss": -26.30271339416504, "global_step": 168404, "epoch": 1391} {"train_loss": -28.88165283203125, "global_step": 168405, "epoch": 1391} {"train_loss": -34.539302825927734, "global_step": 168406, "epoch": 1391} {"train_loss": -32.44837188720703, "global_step": 168407, "epoch": 1391} {"train_loss": -30.980697631835938, "global_step": 168408, "epoch": 1391} {"train_loss": -32.49125289916992, "global_step": 168409, "epoch": 1391} {"train_loss": -33.52119827270508, "global_step": 168410, "epoch": 1391} {"train_loss": -33.989112854003906, "global_step": 168411, "epoch": 1391} {"train_loss": -35.77431106567383, "global_step": 168412, "epoch": 1391} {"train_loss": -35.92958450317383, "global_step": 168413, "epoch": 1391} {"train_loss": -35.53301239013672, "global_step": 168414, "epoch": 1391} {"train_loss": -35.24361801147461, "global_step": 168415, "epoch": 1391} {"train_loss": -34.17594909667969, "global_step": 168416, "epoch": 1391} {"train_loss": -35.21546173095703, "global_step": 168417, "epoch": 1391} {"train_loss": -35.554588317871094, "global_step": 168418, "epoch": 1391} {"train_loss": -35.150238037109375, "global_step": 168419, "epoch": 1391} {"train_loss": -36.402347564697266, "global_step": 168420, "epoch": 1391} {"train_loss": -36.85298538208008, "global_step": 168421, "epoch": 1391} {"train_loss": -36.336238861083984, "global_step": 168422, "epoch": 1391} {"train_loss": -36.051212310791016, "global_step": 168423, "epoch": 1391} {"train_loss": -34.50332260131836, "global_step": 168424, "epoch": 1391} {"train_loss": -35.50286865234375, "global_step": 168425, "epoch": 1391} {"train_loss": -36.01470184326172, "global_step": 168426, "epoch": 1391} {"train_loss": -37.64336013793945, "global_step": 168427, "epoch": 1391} {"train_loss": -36.92350769042969, "global_step": 168428, "epoch": 1391} {"train_loss": -36.70915603637695, "global_step": 168429, "epoch": 1391} {"train_loss": -37.2859001159668, "global_step": 168430, "epoch": 1391} {"train_loss": -37.278080317599716, "global_step": 168431, "epoch": 1391, "val_loss": 2692279.0} {"train_loss": -36.839569091796875, "global_step": 168432, "epoch": 1392} {"train_loss": -36.78139114379883, "global_step": 168433, "epoch": 1392} {"train_loss": -37.96560287475586, "global_step": 168434, "epoch": 1392} {"train_loss": -37.449195861816406, "global_step": 168435, "epoch": 1392} {"train_loss": -37.025264739990234, "global_step": 168436, "epoch": 1392} {"train_loss": -36.49195861816406, "global_step": 168437, "epoch": 1392} {"train_loss": -37.558021545410156, "global_step": 168438, "epoch": 1392} {"train_loss": -37.01418685913086, "global_step": 168439, "epoch": 1392} {"train_loss": -37.02391052246094, "global_step": 168440, "epoch": 1392} {"train_loss": -37.30286407470703, "global_step": 168441, "epoch": 1392} {"train_loss": -38.015621185302734, "global_step": 168442, "epoch": 1392} {"train_loss": -37.17365646362305, "global_step": 168443, "epoch": 1392} {"train_loss": -38.00533676147461, "global_step": 168444, "epoch": 1392} {"train_loss": -38.00446319580078, "global_step": 168445, "epoch": 1392} {"train_loss": -37.931636810302734, "global_step": 168446, "epoch": 1392} {"train_loss": -38.1224479675293, "global_step": 168447, "epoch": 1392} {"train_loss": -37.92340087890625, "global_step": 168448, "epoch": 1392} {"train_loss": -38.227806091308594, "global_step": 168449, "epoch": 1392} {"train_loss": -38.0468635559082, "global_step": 168450, "epoch": 1392} {"train_loss": -38.11182403564453, "global_step": 168451, "epoch": 1392} {"train_loss": -38.227210998535156, "global_step": 168452, "epoch": 1392} {"train_loss": -38.01423263549805, "global_step": 168453, "epoch": 1392} {"train_loss": -38.064022064208984, "global_step": 168454, "epoch": 1392} {"train_loss": -38.7364387512207, "global_step": 168455, "epoch": 1392} {"train_loss": -38.228118896484375, "global_step": 168456, "epoch": 1392} {"train_loss": -38.36872482299805, "global_step": 168457, "epoch": 1392} {"train_loss": -37.980796813964844, "global_step": 168458, "epoch": 1392} {"train_loss": -38.11078643798828, "global_step": 168459, "epoch": 1392} {"train_loss": -38.68440628051758, "global_step": 168460, "epoch": 1392} {"train_loss": -38.82379913330078, "global_step": 168461, "epoch": 1392} {"train_loss": -38.79759979248047, "global_step": 168462, "epoch": 1392} {"train_loss": -38.66730880737305, "global_step": 168463, "epoch": 1392} {"train_loss": -39.002323150634766, "global_step": 168464, "epoch": 1392} {"train_loss": -39.1212158203125, "global_step": 168465, "epoch": 1392} {"train_loss": -37.906795501708984, "global_step": 168466, "epoch": 1392} {"train_loss": -39.141414642333984, "global_step": 168467, "epoch": 1392} {"train_loss": -38.23577880859375, "global_step": 168468, "epoch": 1392} {"train_loss": -38.87465286254883, "global_step": 168469, "epoch": 1392} {"train_loss": -38.31673812866211, "global_step": 168470, "epoch": 1392} {"train_loss": -39.142250061035156, "global_step": 168471, "epoch": 1392} {"train_loss": -38.74587631225586, "global_step": 168472, "epoch": 1392} {"train_loss": -37.9555778503418, "global_step": 168473, "epoch": 1392} {"train_loss": -38.17373275756836, "global_step": 168474, "epoch": 1392} {"train_loss": -39.3049430847168, "global_step": 168475, "epoch": 1392} {"train_loss": -38.64236068725586, "global_step": 168476, "epoch": 1392} {"train_loss": -39.14604187011719, "global_step": 168477, "epoch": 1392} {"train_loss": -39.42203903198242, "global_step": 168478, "epoch": 1392} {"train_loss": -39.51029586791992, "global_step": 168479, "epoch": 1392} {"train_loss": -38.753475189208984, "global_step": 168480, "epoch": 1392} {"train_loss": -38.65255355834961, "global_step": 168481, "epoch": 1392} {"train_loss": -39.37174987792969, "global_step": 168482, "epoch": 1392} {"train_loss": -39.31659698486328, "global_step": 168483, "epoch": 1392} {"train_loss": -39.55521011352539, "global_step": 168484, "epoch": 1392} {"train_loss": -39.40810775756836, "global_step": 168485, "epoch": 1392} {"train_loss": -39.350830078125, "global_step": 168486, "epoch": 1392} {"train_loss": -39.10606002807617, "global_step": 168487, "epoch": 1392} {"train_loss": -38.78078842163086, "global_step": 168488, "epoch": 1392} {"train_loss": -39.51987075805664, "global_step": 168489, "epoch": 1392} {"train_loss": -39.55841827392578, "global_step": 168490, "epoch": 1392} {"train_loss": -39.218448638916016, "global_step": 168491, "epoch": 1392} {"train_loss": -39.759456634521484, "global_step": 168492, "epoch": 1392} {"train_loss": -39.583492279052734, "global_step": 168493, "epoch": 1392} {"train_loss": -39.31260299682617, "global_step": 168494, "epoch": 1392} {"train_loss": -40.458919525146484, "global_step": 168495, "epoch": 1392} {"train_loss": -39.98004913330078, "global_step": 168496, "epoch": 1392} {"train_loss": -39.858394622802734, "global_step": 168497, "epoch": 1392} {"train_loss": -39.958251953125, "global_step": 168498, "epoch": 1392} {"train_loss": -39.98725128173828, "global_step": 168499, "epoch": 1392} {"train_loss": -39.43741226196289, "global_step": 168500, "epoch": 1392} {"train_loss": -39.580421447753906, "global_step": 168501, "epoch": 1392} {"train_loss": -40.204742431640625, "global_step": 168502, "epoch": 1392} {"train_loss": -39.51261901855469, "global_step": 168503, "epoch": 1392} {"train_loss": -39.78831100463867, "global_step": 168504, "epoch": 1392} {"train_loss": -40.1756477355957, "global_step": 168505, "epoch": 1392} {"train_loss": -40.307716369628906, "global_step": 168506, "epoch": 1392} {"train_loss": -39.72732925415039, "global_step": 168507, "epoch": 1392} {"train_loss": -39.604713439941406, "global_step": 168508, "epoch": 1392} {"train_loss": -39.248836517333984, "global_step": 168509, "epoch": 1392} {"train_loss": -39.85736083984375, "global_step": 168510, "epoch": 1392} {"train_loss": -40.273921966552734, "global_step": 168511, "epoch": 1392} {"train_loss": -39.85018539428711, "global_step": 168512, "epoch": 1392} {"train_loss": -40.32418441772461, "global_step": 168513, "epoch": 1392} {"train_loss": -40.08136749267578, "global_step": 168514, "epoch": 1392} {"train_loss": -39.81667709350586, "global_step": 168515, "epoch": 1392} {"train_loss": -39.25828170776367, "global_step": 168516, "epoch": 1392} {"train_loss": -39.01448440551758, "global_step": 168517, "epoch": 1392} {"train_loss": -39.33675765991211, "global_step": 168518, "epoch": 1392} {"train_loss": -40.693424224853516, "global_step": 168519, "epoch": 1392} {"train_loss": -38.97590255737305, "global_step": 168520, "epoch": 1392} {"train_loss": -39.50611114501953, "global_step": 168521, "epoch": 1392} {"train_loss": -39.90342330932617, "global_step": 168522, "epoch": 1392} {"train_loss": -39.52564239501953, "global_step": 168523, "epoch": 1392} {"train_loss": -39.245094299316406, "global_step": 168524, "epoch": 1392} {"train_loss": -38.87214279174805, "global_step": 168525, "epoch": 1392} {"train_loss": -40.37202453613281, "global_step": 168526, "epoch": 1392} {"train_loss": -39.567691802978516, "global_step": 168527, "epoch": 1392} {"train_loss": -39.463253021240234, "global_step": 168528, "epoch": 1392} {"train_loss": -40.139156341552734, "global_step": 168529, "epoch": 1392} {"train_loss": -39.787574768066406, "global_step": 168530, "epoch": 1392} {"train_loss": -39.22587966918945, "global_step": 168531, "epoch": 1392} {"train_loss": -39.20685577392578, "global_step": 168532, "epoch": 1392} {"train_loss": -39.80256271362305, "global_step": 168533, "epoch": 1392} {"train_loss": -38.048213958740234, "global_step": 168534, "epoch": 1392} {"train_loss": -37.29093551635742, "global_step": 168535, "epoch": 1392} {"train_loss": -39.90531921386719, "global_step": 168536, "epoch": 1392} {"train_loss": -39.568092346191406, "global_step": 168537, "epoch": 1392} {"train_loss": -37.11528396606445, "global_step": 168538, "epoch": 1392} {"train_loss": -39.82177734375, "global_step": 168539, "epoch": 1392} {"train_loss": -38.24519348144531, "global_step": 168540, "epoch": 1392} {"train_loss": -37.99493408203125, "global_step": 168541, "epoch": 1392} {"train_loss": -39.099178314208984, "global_step": 168542, "epoch": 1392} {"train_loss": -37.64872360229492, "global_step": 168543, "epoch": 1392} {"train_loss": -38.04714584350586, "global_step": 168544, "epoch": 1392} {"train_loss": -38.801509857177734, "global_step": 168545, "epoch": 1392} {"train_loss": -37.548133850097656, "global_step": 168546, "epoch": 1392} {"train_loss": -39.220523834228516, "global_step": 168547, "epoch": 1392} {"train_loss": -38.55438995361328, "global_step": 168548, "epoch": 1392} {"train_loss": -38.748085021972656, "global_step": 168549, "epoch": 1392} {"train_loss": -39.85286331176758, "global_step": 168550, "epoch": 1392} {"train_loss": -39.37785720825195, "global_step": 168551, "epoch": 1392} {"train_loss": -38.88723228391537, "global_step": 168552, "epoch": 1392, "val_loss": 2644135.25} {"train_loss": -39.710060119628906, "global_step": 168553, "epoch": 1393} {"train_loss": -40.24270248413086, "global_step": 168554, "epoch": 1393} {"train_loss": -38.759490966796875, "global_step": 168555, "epoch": 1393} {"train_loss": -40.26772689819336, "global_step": 168556, "epoch": 1393} {"train_loss": -39.94614791870117, "global_step": 168557, "epoch": 1393} {"train_loss": -38.27387619018555, "global_step": 168558, "epoch": 1393} {"train_loss": -40.3975715637207, "global_step": 168559, "epoch": 1393} {"train_loss": -38.44427490234375, "global_step": 168560, "epoch": 1393} {"train_loss": -39.438385009765625, "global_step": 168561, "epoch": 1393} {"train_loss": -40.14680480957031, "global_step": 168562, "epoch": 1393} {"train_loss": -39.1509895324707, "global_step": 168563, "epoch": 1393} {"train_loss": -40.14002990722656, "global_step": 168564, "epoch": 1393} {"train_loss": -40.413265228271484, "global_step": 168565, "epoch": 1393} {"train_loss": -39.62346267700195, "global_step": 168566, "epoch": 1393} {"train_loss": -38.90597152709961, "global_step": 168567, "epoch": 1393} {"train_loss": -40.33549118041992, "global_step": 168568, "epoch": 1393} {"train_loss": -39.90475082397461, "global_step": 168569, "epoch": 1393} {"train_loss": -40.11646270751953, "global_step": 168570, "epoch": 1393} {"train_loss": -40.52988815307617, "global_step": 168571, "epoch": 1393} {"train_loss": -40.655303955078125, "global_step": 168572, "epoch": 1393} {"train_loss": -39.98701095581055, "global_step": 168573, "epoch": 1393} {"train_loss": -39.69670486450195, "global_step": 168574, "epoch": 1393} {"train_loss": -40.43993377685547, "global_step": 168575, "epoch": 1393} {"train_loss": -40.535762786865234, "global_step": 168576, "epoch": 1393} {"train_loss": -39.93964385986328, "global_step": 168577, "epoch": 1393} {"train_loss": -40.71430206298828, "global_step": 168578, "epoch": 1393} {"train_loss": -39.787559509277344, "global_step": 168579, "epoch": 1393} {"train_loss": -39.151729583740234, "global_step": 168580, "epoch": 1393} {"train_loss": -38.97945785522461, "global_step": 168581, "epoch": 1393} {"train_loss": -40.147071838378906, "global_step": 168582, "epoch": 1393} {"train_loss": -39.42072677612305, "global_step": 168583, "epoch": 1393} {"train_loss": -39.628753662109375, "global_step": 168584, "epoch": 1393} {"train_loss": -39.63538360595703, "global_step": 168585, "epoch": 1393} {"train_loss": -40.382240295410156, "global_step": 168586, "epoch": 1393} {"train_loss": -39.875701904296875, "global_step": 168587, "epoch": 1393} {"train_loss": -39.570980072021484, "global_step": 168588, "epoch": 1393} {"train_loss": -39.5346794128418, "global_step": 168589, "epoch": 1393} {"train_loss": -39.923370361328125, "global_step": 168590, "epoch": 1393} {"train_loss": -40.0466194152832, "global_step": 168591, "epoch": 1393} {"train_loss": -40.89004135131836, "global_step": 168592, "epoch": 1393} {"train_loss": -40.076210021972656, "global_step": 168593, "epoch": 1393} {"train_loss": -40.639156341552734, "global_step": 168594, "epoch": 1393} {"train_loss": -40.53568649291992, "global_step": 168595, "epoch": 1393} {"train_loss": -40.82697677612305, "global_step": 168596, "epoch": 1393} {"train_loss": -40.420467376708984, "global_step": 168597, "epoch": 1393} {"train_loss": -40.69218826293945, "global_step": 168598, "epoch": 1393} {"train_loss": -40.85956573486328, "global_step": 168599, "epoch": 1393} {"train_loss": -40.17783737182617, "global_step": 168600, "epoch": 1393} {"train_loss": -40.7545280456543, "global_step": 168601, "epoch": 1393} {"train_loss": -40.13303756713867, "global_step": 168602, "epoch": 1393} {"train_loss": -40.386287689208984, "global_step": 168603, "epoch": 1393} {"train_loss": -40.80595016479492, "global_step": 168604, "epoch": 1393} {"train_loss": -38.730403900146484, "global_step": 168605, "epoch": 1393} {"train_loss": -40.835304260253906, "global_step": 168606, "epoch": 1393} {"train_loss": -40.178955078125, "global_step": 168607, "epoch": 1393} {"train_loss": -39.80573654174805, "global_step": 168608, "epoch": 1393} {"train_loss": -41.484375, "global_step": 168609, "epoch": 1393} {"train_loss": -40.05900192260742, "global_step": 168610, "epoch": 1393} {"train_loss": -38.381370544433594, "global_step": 168611, "epoch": 1393} {"train_loss": -39.9991455078125, "global_step": 168612, "epoch": 1393} {"train_loss": -39.23128890991211, "global_step": 168613, "epoch": 1393} {"train_loss": -40.341346740722656, "global_step": 168614, "epoch": 1393} {"train_loss": -39.2663459777832, "global_step": 168615, "epoch": 1393} {"train_loss": -40.078556060791016, "global_step": 168616, "epoch": 1393} {"train_loss": -38.8182487487793, "global_step": 168617, "epoch": 1393} {"train_loss": -37.37966537475586, "global_step": 168618, "epoch": 1393} {"train_loss": -39.9731330871582, "global_step": 168619, "epoch": 1393} {"train_loss": -39.411407470703125, "global_step": 168620, "epoch": 1393} {"train_loss": -41.024593353271484, "global_step": 168621, "epoch": 1393} {"train_loss": -39.25600051879883, "global_step": 168622, "epoch": 1393} {"train_loss": -39.77671432495117, "global_step": 168623, "epoch": 1393} {"train_loss": -39.56019973754883, "global_step": 168624, "epoch": 1393} {"train_loss": -39.33887481689453, "global_step": 168625, "epoch": 1393} {"train_loss": -38.49639892578125, "global_step": 168626, "epoch": 1393} {"train_loss": -39.839168548583984, "global_step": 168627, "epoch": 1393} {"train_loss": -40.10724639892578, "global_step": 168628, "epoch": 1393} {"train_loss": -39.27870178222656, "global_step": 168629, "epoch": 1393} {"train_loss": -40.54338455200195, "global_step": 168630, "epoch": 1393} {"train_loss": -40.2598991394043, "global_step": 168631, "epoch": 1393} {"train_loss": -39.62623977661133, "global_step": 168632, "epoch": 1393} {"train_loss": -40.29018020629883, "global_step": 168633, "epoch": 1393} {"train_loss": -38.822303771972656, "global_step": 168634, "epoch": 1393} {"train_loss": -40.86697006225586, "global_step": 168635, "epoch": 1393} {"train_loss": -40.19027328491211, "global_step": 168636, "epoch": 1393} {"train_loss": -40.82035446166992, "global_step": 168637, "epoch": 1393} {"train_loss": -40.251243591308594, "global_step": 168638, "epoch": 1393} {"train_loss": -40.74817657470703, "global_step": 168639, "epoch": 1393} {"train_loss": -38.750732421875, "global_step": 168640, "epoch": 1393} {"train_loss": -40.42848205566406, "global_step": 168641, "epoch": 1393} {"train_loss": -39.65235137939453, "global_step": 168642, "epoch": 1393} {"train_loss": -40.09228515625, "global_step": 168643, "epoch": 1393} {"train_loss": -38.50321960449219, "global_step": 168644, "epoch": 1393} {"train_loss": -39.89915466308594, "global_step": 168645, "epoch": 1393} {"train_loss": -39.8924674987793, "global_step": 168646, "epoch": 1393} {"train_loss": -39.61316680908203, "global_step": 168647, "epoch": 1393} {"train_loss": -39.5078010559082, "global_step": 168648, "epoch": 1393} {"train_loss": -39.19462203979492, "global_step": 168649, "epoch": 1393} {"train_loss": -38.01267623901367, "global_step": 168650, "epoch": 1393} {"train_loss": -35.754119873046875, "global_step": 168651, "epoch": 1393} {"train_loss": -37.950782775878906, "global_step": 168652, "epoch": 1393} {"train_loss": -33.918739318847656, "global_step": 168653, "epoch": 1393} {"train_loss": -39.059600830078125, "global_step": 168654, "epoch": 1393} {"train_loss": -37.42532730102539, "global_step": 168655, "epoch": 1393} {"train_loss": -37.46425247192383, "global_step": 168656, "epoch": 1393} {"train_loss": -37.09981155395508, "global_step": 168657, "epoch": 1393} {"train_loss": -39.8131217956543, "global_step": 168658, "epoch": 1393} {"train_loss": -38.0208625793457, "global_step": 168659, "epoch": 1393} {"train_loss": -38.40531921386719, "global_step": 168660, "epoch": 1393} {"train_loss": -40.35579299926758, "global_step": 168661, "epoch": 1393} {"train_loss": -38.969635009765625, "global_step": 168662, "epoch": 1393} {"train_loss": -38.737545013427734, "global_step": 168663, "epoch": 1393} {"train_loss": -39.770179748535156, "global_step": 168664, "epoch": 1393} {"train_loss": -39.68379592895508, "global_step": 168665, "epoch": 1393} {"train_loss": -39.5748176574707, "global_step": 168666, "epoch": 1393} {"train_loss": -38.074981689453125, "global_step": 168667, "epoch": 1393} {"train_loss": -39.593318939208984, "global_step": 168668, "epoch": 1393} {"train_loss": -39.422584533691406, "global_step": 168669, "epoch": 1393} {"train_loss": -40.26291275024414, "global_step": 168670, "epoch": 1393} {"train_loss": -39.48738479614258, "global_step": 168671, "epoch": 1393} {"train_loss": -40.356204986572266, "global_step": 168672, "epoch": 1393} {"train_loss": -39.62899067776262, "global_step": 168673, "epoch": 1393, "val_loss": 2648485.0} {"train_loss": -39.314361572265625, "global_step": 168674, "epoch": 1394} {"train_loss": -40.0223503112793, "global_step": 168675, "epoch": 1394} {"train_loss": -39.250091552734375, "global_step": 168676, "epoch": 1394} {"train_loss": -40.03703689575195, "global_step": 168677, "epoch": 1394} {"train_loss": -39.84180450439453, "global_step": 168678, "epoch": 1394} {"train_loss": -39.95017623901367, "global_step": 168679, "epoch": 1394} {"train_loss": -39.255489349365234, "global_step": 168680, "epoch": 1394} {"train_loss": -38.06421661376953, "global_step": 168681, "epoch": 1394} {"train_loss": -37.70220947265625, "global_step": 168682, "epoch": 1394} {"train_loss": -39.72461700439453, "global_step": 168683, "epoch": 1394} {"train_loss": -37.963802337646484, "global_step": 168684, "epoch": 1394} {"train_loss": -40.02532196044922, "global_step": 168685, "epoch": 1394} {"train_loss": -36.689064025878906, "global_step": 168686, "epoch": 1394} {"train_loss": -39.917293548583984, "global_step": 168687, "epoch": 1394} {"train_loss": -38.16770553588867, "global_step": 168688, "epoch": 1394} {"train_loss": -39.567840576171875, "global_step": 168689, "epoch": 1394} {"train_loss": -38.995758056640625, "global_step": 168690, "epoch": 1394} {"train_loss": -40.06235885620117, "global_step": 168691, "epoch": 1394} {"train_loss": -39.16416549682617, "global_step": 168692, "epoch": 1394} {"train_loss": -40.2818489074707, "global_step": 168693, "epoch": 1394} {"train_loss": -36.373268127441406, "global_step": 168694, "epoch": 1394} {"train_loss": -39.2287712097168, "global_step": 168695, "epoch": 1394} {"train_loss": -40.262569427490234, "global_step": 168696, "epoch": 1394} {"train_loss": -39.77324676513672, "global_step": 168697, "epoch": 1394} {"train_loss": -39.8773078918457, "global_step": 168698, "epoch": 1394} {"train_loss": -39.86896896362305, "global_step": 168699, "epoch": 1394} {"train_loss": -40.1834831237793, "global_step": 168700, "epoch": 1394} {"train_loss": -40.344383239746094, "global_step": 168701, "epoch": 1394} {"train_loss": -40.14748001098633, "global_step": 168702, "epoch": 1394} {"train_loss": -40.61848068237305, "global_step": 168703, "epoch": 1394} {"train_loss": -40.552120208740234, "global_step": 168704, "epoch": 1394} {"train_loss": -40.3419303894043, "global_step": 168705, "epoch": 1394} {"train_loss": -39.22922897338867, "global_step": 168706, "epoch": 1394} {"train_loss": -40.75825119018555, "global_step": 168707, "epoch": 1394} {"train_loss": -39.55793380737305, "global_step": 168708, "epoch": 1394} {"train_loss": -40.0860595703125, "global_step": 168709, "epoch": 1394} {"train_loss": -39.55575180053711, "global_step": 168710, "epoch": 1394} {"train_loss": -33.5274772644043, "global_step": 168711, "epoch": 1394} {"train_loss": -39.315364837646484, "global_step": 168712, "epoch": 1394} {"train_loss": -39.58143997192383, "global_step": 168713, "epoch": 1394} {"train_loss": -37.314292907714844, "global_step": 168714, "epoch": 1394} {"train_loss": -39.94975662231445, "global_step": 168715, "epoch": 1394} {"train_loss": -38.99453353881836, "global_step": 168716, "epoch": 1394} {"train_loss": -33.13813018798828, "global_step": 168717, "epoch": 1394} {"train_loss": -38.3865852355957, "global_step": 168718, "epoch": 1394} {"train_loss": -32.71881866455078, "global_step": 168719, "epoch": 1394} {"train_loss": -35.60362243652344, "global_step": 168720, "epoch": 1394} {"train_loss": -37.203582763671875, "global_step": 168721, "epoch": 1394} {"train_loss": -37.86166763305664, "global_step": 168722, "epoch": 1394} {"train_loss": -37.27910614013672, "global_step": 168723, "epoch": 1394} {"train_loss": -36.36298751831055, "global_step": 168724, "epoch": 1394} {"train_loss": -34.8720588684082, "global_step": 168725, "epoch": 1394} {"train_loss": -35.88810729980469, "global_step": 168726, "epoch": 1394} {"train_loss": -36.70145797729492, "global_step": 168727, "epoch": 1394} {"train_loss": -36.23978805541992, "global_step": 168728, "epoch": 1394} {"train_loss": -37.91069030761719, "global_step": 168729, "epoch": 1394} {"train_loss": -37.082088470458984, "global_step": 168730, "epoch": 1394} {"train_loss": -35.628761291503906, "global_step": 168731, "epoch": 1394} {"train_loss": -36.79377365112305, "global_step": 168732, "epoch": 1394} {"train_loss": -35.13840866088867, "global_step": 168733, "epoch": 1394} {"train_loss": -37.355770111083984, "global_step": 168734, "epoch": 1394} {"train_loss": -36.821388244628906, "global_step": 168735, "epoch": 1394} {"train_loss": -37.28466796875, "global_step": 168736, "epoch": 1394} {"train_loss": -37.247100830078125, "global_step": 168737, "epoch": 1394} {"train_loss": -37.59217071533203, "global_step": 168738, "epoch": 1394} {"train_loss": -35.74770736694336, "global_step": 168739, "epoch": 1394} {"train_loss": -36.82007598876953, "global_step": 168740, "epoch": 1394} {"train_loss": -35.33625793457031, "global_step": 168741, "epoch": 1394} {"train_loss": -37.688045501708984, "global_step": 168742, "epoch": 1394} {"train_loss": -37.373653411865234, "global_step": 168743, "epoch": 1394} {"train_loss": -37.38724899291992, "global_step": 168744, "epoch": 1394} {"train_loss": -35.428462982177734, "global_step": 168745, "epoch": 1394} {"train_loss": -38.18854904174805, "global_step": 168746, "epoch": 1394} {"train_loss": -36.86907196044922, "global_step": 168747, "epoch": 1394} {"train_loss": -38.2665901184082, "global_step": 168748, "epoch": 1394} {"train_loss": -36.915557861328125, "global_step": 168749, "epoch": 1394} {"train_loss": -38.908538818359375, "global_step": 168750, "epoch": 1394} {"train_loss": -38.3444938659668, "global_step": 168751, "epoch": 1394} {"train_loss": -38.0767707824707, "global_step": 168752, "epoch": 1394} {"train_loss": -36.93422317504883, "global_step": 168753, "epoch": 1394} {"train_loss": -37.41270065307617, "global_step": 168754, "epoch": 1394} {"train_loss": -38.82062530517578, "global_step": 168755, "epoch": 1394} {"train_loss": -39.252498626708984, "global_step": 168756, "epoch": 1394} {"train_loss": -38.525604248046875, "global_step": 168757, "epoch": 1394} {"train_loss": -37.72584915161133, "global_step": 168758, "epoch": 1394} {"train_loss": -38.28519821166992, "global_step": 168759, "epoch": 1394} {"train_loss": -37.94009780883789, "global_step": 168760, "epoch": 1394} {"train_loss": -38.58124923706055, "global_step": 168761, "epoch": 1394} {"train_loss": -38.627662658691406, "global_step": 168762, "epoch": 1394} {"train_loss": -39.558135986328125, "global_step": 168763, "epoch": 1394} {"train_loss": -38.54771041870117, "global_step": 168764, "epoch": 1394} {"train_loss": -38.67818832397461, "global_step": 168765, "epoch": 1394} {"train_loss": -37.34768295288086, "global_step": 168766, "epoch": 1394} {"train_loss": -39.0280876159668, "global_step": 168767, "epoch": 1394} {"train_loss": -39.12131881713867, "global_step": 168768, "epoch": 1394} {"train_loss": -39.76740264892578, "global_step": 168769, "epoch": 1394} {"train_loss": -39.120399475097656, "global_step": 168770, "epoch": 1394} {"train_loss": -39.34356689453125, "global_step": 168771, "epoch": 1394} {"train_loss": -38.04297637939453, "global_step": 168772, "epoch": 1394} {"train_loss": -39.8789176940918, "global_step": 168773, "epoch": 1394} {"train_loss": -39.99785232543945, "global_step": 168774, "epoch": 1394} {"train_loss": -39.57281494140625, "global_step": 168775, "epoch": 1394} {"train_loss": -39.70675277709961, "global_step": 168776, "epoch": 1394} {"train_loss": -39.260833740234375, "global_step": 168777, "epoch": 1394} {"train_loss": -39.52144241333008, "global_step": 168778, "epoch": 1394} {"train_loss": -38.599605560302734, "global_step": 168779, "epoch": 1394} {"train_loss": -39.569129943847656, "global_step": 168780, "epoch": 1394} {"train_loss": -39.34431457519531, "global_step": 168781, "epoch": 1394} {"train_loss": -38.595848083496094, "global_step": 168782, "epoch": 1394} {"train_loss": -38.922298431396484, "global_step": 168783, "epoch": 1394} {"train_loss": -39.55808639526367, "global_step": 168784, "epoch": 1394} {"train_loss": -39.67850875854492, "global_step": 168785, "epoch": 1394} {"train_loss": -40.26569747924805, "global_step": 168786, "epoch": 1394} {"train_loss": -39.57404708862305, "global_step": 168787, "epoch": 1394} {"train_loss": -40.16864013671875, "global_step": 168788, "epoch": 1394} {"train_loss": -39.82551574707031, "global_step": 168789, "epoch": 1394} {"train_loss": -39.98769760131836, "global_step": 168790, "epoch": 1394} {"train_loss": -39.52229690551758, "global_step": 168791, "epoch": 1394} {"train_loss": -40.45383834838867, "global_step": 168792, "epoch": 1394} {"train_loss": -39.91749572753906, "global_step": 168793, "epoch": 1394} {"train_loss": -38.46851241687113, "global_step": 168794, "epoch": 1394, "val_loss": 2746175.0} {"train_loss": -39.94259262084961, "global_step": 168795, "epoch": 1395} {"train_loss": -40.03190231323242, "global_step": 168796, "epoch": 1395} {"train_loss": -40.72236633300781, "global_step": 168797, "epoch": 1395} {"train_loss": -40.1173210144043, "global_step": 168798, "epoch": 1395} {"train_loss": -40.01076126098633, "global_step": 168799, "epoch": 1395} {"train_loss": -40.28643035888672, "global_step": 168800, "epoch": 1395} {"train_loss": -40.326263427734375, "global_step": 168801, "epoch": 1395} {"train_loss": -40.26162338256836, "global_step": 168802, "epoch": 1395} {"train_loss": -40.46275329589844, "global_step": 168803, "epoch": 1395} {"train_loss": -40.869720458984375, "global_step": 168804, "epoch": 1395} {"train_loss": -39.911128997802734, "global_step": 168805, "epoch": 1395} {"train_loss": -39.74860763549805, "global_step": 168806, "epoch": 1395} {"train_loss": -40.165042877197266, "global_step": 168807, "epoch": 1395} {"train_loss": -40.093666076660156, "global_step": 168808, "epoch": 1395} {"train_loss": -40.268131256103516, "global_step": 168809, "epoch": 1395} {"train_loss": -39.80984878540039, "global_step": 168810, "epoch": 1395} {"train_loss": -39.876426696777344, "global_step": 168811, "epoch": 1395} {"train_loss": -40.62859344482422, "global_step": 168812, "epoch": 1395} {"train_loss": -39.52243423461914, "global_step": 168813, "epoch": 1395} {"train_loss": -40.231502532958984, "global_step": 168814, "epoch": 1395} {"train_loss": -41.14704513549805, "global_step": 168815, "epoch": 1395} {"train_loss": -40.596046447753906, "global_step": 168816, "epoch": 1395} {"train_loss": -40.494014739990234, "global_step": 168817, "epoch": 1395} {"train_loss": -40.5462646484375, "global_step": 168818, "epoch": 1395} {"train_loss": -40.983856201171875, "global_step": 168819, "epoch": 1395} {"train_loss": -40.53656005859375, "global_step": 168820, "epoch": 1395} {"train_loss": -41.201934814453125, "global_step": 168821, "epoch": 1395} {"train_loss": -40.41600799560547, "global_step": 168822, "epoch": 1395} {"train_loss": -40.076961517333984, "global_step": 168823, "epoch": 1395} {"train_loss": -40.50401306152344, "global_step": 168824, "epoch": 1395} {"train_loss": -40.36513900756836, "global_step": 168825, "epoch": 1395} {"train_loss": -40.97761535644531, "global_step": 168826, "epoch": 1395} {"train_loss": -40.00379180908203, "global_step": 168827, "epoch": 1395} {"train_loss": -40.412818908691406, "global_step": 168828, "epoch": 1395} {"train_loss": -40.4976806640625, "global_step": 168829, "epoch": 1395} {"train_loss": -38.842323303222656, "global_step": 168830, "epoch": 1395} {"train_loss": -40.53183364868164, "global_step": 168831, "epoch": 1395} {"train_loss": -40.82232666015625, "global_step": 168832, "epoch": 1395} {"train_loss": -41.24676513671875, "global_step": 168833, "epoch": 1395} {"train_loss": -40.4105339050293, "global_step": 168834, "epoch": 1395} {"train_loss": -40.33099365234375, "global_step": 168835, "epoch": 1395} {"train_loss": -39.1728630065918, "global_step": 168836, "epoch": 1395} {"train_loss": -40.03773498535156, "global_step": 168837, "epoch": 1395} {"train_loss": -39.674949645996094, "global_step": 168838, "epoch": 1395} {"train_loss": -39.4800910949707, "global_step": 168839, "epoch": 1395} {"train_loss": -40.11912155151367, "global_step": 168840, "epoch": 1395} {"train_loss": -39.61880111694336, "global_step": 168841, "epoch": 1395} {"train_loss": -40.25787353515625, "global_step": 168842, "epoch": 1395} {"train_loss": -40.29246139526367, "global_step": 168843, "epoch": 1395} {"train_loss": -40.06290817260742, "global_step": 168844, "epoch": 1395} {"train_loss": -39.82405471801758, "global_step": 168845, "epoch": 1395} {"train_loss": -39.31128692626953, "global_step": 168846, "epoch": 1395} {"train_loss": -39.59999084472656, "global_step": 168847, "epoch": 1395} {"train_loss": -39.91677474975586, "global_step": 168848, "epoch": 1395} {"train_loss": -38.73487091064453, "global_step": 168849, "epoch": 1395} {"train_loss": -39.713069915771484, "global_step": 168850, "epoch": 1395} {"train_loss": -38.84207534790039, "global_step": 168851, "epoch": 1395} {"train_loss": -38.958919525146484, "global_step": 168852, "epoch": 1395} {"train_loss": -40.24040222167969, "global_step": 168853, "epoch": 1395} {"train_loss": -39.32655715942383, "global_step": 168854, "epoch": 1395} {"train_loss": -39.68827819824219, "global_step": 168855, "epoch": 1395} {"train_loss": -39.374446868896484, "global_step": 168856, "epoch": 1395} {"train_loss": -39.34912109375, "global_step": 168857, "epoch": 1395} {"train_loss": -40.0288200378418, "global_step": 168858, "epoch": 1395} {"train_loss": -39.22760009765625, "global_step": 168859, "epoch": 1395} {"train_loss": -39.07734680175781, "global_step": 168860, "epoch": 1395} {"train_loss": -39.911014556884766, "global_step": 168861, "epoch": 1395} {"train_loss": -39.932308197021484, "global_step": 168862, "epoch": 1395} {"train_loss": -40.006256103515625, "global_step": 168863, "epoch": 1395} {"train_loss": -39.716758728027344, "global_step": 168864, "epoch": 1395} {"train_loss": -39.6046028137207, "global_step": 168865, "epoch": 1395} {"train_loss": -41.212467193603516, "global_step": 168866, "epoch": 1395} {"train_loss": -40.428321838378906, "global_step": 168867, "epoch": 1395} {"train_loss": -40.18930435180664, "global_step": 168868, "epoch": 1395} {"train_loss": -39.85129165649414, "global_step": 168869, "epoch": 1395} {"train_loss": -39.74703598022461, "global_step": 168870, "epoch": 1395} {"train_loss": -39.80411911010742, "global_step": 168871, "epoch": 1395} {"train_loss": -40.756038665771484, "global_step": 168872, "epoch": 1395} {"train_loss": -40.35938262939453, "global_step": 168873, "epoch": 1395} {"train_loss": -40.183326721191406, "global_step": 168874, "epoch": 1395} {"train_loss": -40.49490737915039, "global_step": 168875, "epoch": 1395} {"train_loss": -41.036800384521484, "global_step": 168876, "epoch": 1395} {"train_loss": -40.48332595825195, "global_step": 168877, "epoch": 1395} {"train_loss": -40.51811981201172, "global_step": 168878, "epoch": 1395} {"train_loss": -40.04037094116211, "global_step": 168879, "epoch": 1395} {"train_loss": -40.24148178100586, "global_step": 168880, "epoch": 1395} {"train_loss": -40.279903411865234, "global_step": 168881, "epoch": 1395} {"train_loss": -38.40314865112305, "global_step": 168882, "epoch": 1395} {"train_loss": -39.31913375854492, "global_step": 168883, "epoch": 1395} {"train_loss": -39.505516052246094, "global_step": 168884, "epoch": 1395} {"train_loss": -39.951107025146484, "global_step": 168885, "epoch": 1395} {"train_loss": -39.9542236328125, "global_step": 168886, "epoch": 1395} {"train_loss": -40.21506881713867, "global_step": 168887, "epoch": 1395} {"train_loss": -40.19598388671875, "global_step": 168888, "epoch": 1395} {"train_loss": -39.9611930847168, "global_step": 168889, "epoch": 1395} {"train_loss": -39.83659744262695, "global_step": 168890, "epoch": 1395} {"train_loss": -40.49046325683594, "global_step": 168891, "epoch": 1395} {"train_loss": -39.761474609375, "global_step": 168892, "epoch": 1395} {"train_loss": -40.15989685058594, "global_step": 168893, "epoch": 1395} {"train_loss": -41.00765609741211, "global_step": 168894, "epoch": 1395} {"train_loss": -40.29893493652344, "global_step": 168895, "epoch": 1395} {"train_loss": -40.7103271484375, "global_step": 168896, "epoch": 1395} {"train_loss": -40.470863342285156, "global_step": 168897, "epoch": 1395} {"train_loss": -39.47589111328125, "global_step": 168898, "epoch": 1395} {"train_loss": -38.69989776611328, "global_step": 168899, "epoch": 1395} {"train_loss": -37.17266845703125, "global_step": 168900, "epoch": 1395} {"train_loss": -34.68947982788086, "global_step": 168901, "epoch": 1395} {"train_loss": -34.773956298828125, "global_step": 168902, "epoch": 1395} {"train_loss": -38.37139892578125, "global_step": 168903, "epoch": 1395} {"train_loss": -39.821937561035156, "global_step": 168904, "epoch": 1395} {"train_loss": -37.47282028198242, "global_step": 168905, "epoch": 1395} {"train_loss": -37.552730560302734, "global_step": 168906, "epoch": 1395} {"train_loss": -38.10627746582031, "global_step": 168907, "epoch": 1395} {"train_loss": -39.7962646484375, "global_step": 168908, "epoch": 1395} {"train_loss": -39.686248779296875, "global_step": 168909, "epoch": 1395} {"train_loss": -37.11491012573242, "global_step": 168910, "epoch": 1395} {"train_loss": -37.35307693481445, "global_step": 168911, "epoch": 1395} {"train_loss": -39.50437545776367, "global_step": 168912, "epoch": 1395} {"train_loss": -39.83854293823242, "global_step": 168913, "epoch": 1395} {"train_loss": -39.9224739074707, "global_step": 168914, "epoch": 1395} {"train_loss": -39.82681882874039, "global_step": 168915, "epoch": 1395, "val_loss": 2716913.5} {"train_loss": -39.958702087402344, "global_step": 168916, "epoch": 1396} {"train_loss": -40.73992919921875, "global_step": 168917, "epoch": 1396} {"train_loss": -40.40331268310547, "global_step": 168918, "epoch": 1396} {"train_loss": -40.826171875, "global_step": 168919, "epoch": 1396} {"train_loss": -40.77752685546875, "global_step": 168920, "epoch": 1396} {"train_loss": -41.0512580871582, "global_step": 168921, "epoch": 1396} {"train_loss": -41.23781204223633, "global_step": 168922, "epoch": 1396} {"train_loss": -40.219276428222656, "global_step": 168923, "epoch": 1396} {"train_loss": -40.9831428527832, "global_step": 168924, "epoch": 1396} {"train_loss": -41.43796157836914, "global_step": 168925, "epoch": 1396} {"train_loss": -40.76380920410156, "global_step": 168926, "epoch": 1396} {"train_loss": -40.83051681518555, "global_step": 168927, "epoch": 1396} {"train_loss": -41.33222198486328, "global_step": 168928, "epoch": 1396} {"train_loss": -40.756622314453125, "global_step": 168929, "epoch": 1396} {"train_loss": -40.805908203125, "global_step": 168930, "epoch": 1396} {"train_loss": -41.08445358276367, "global_step": 168931, "epoch": 1396} {"train_loss": -40.76027297973633, "global_step": 168932, "epoch": 1396} {"train_loss": -40.59763717651367, "global_step": 168933, "epoch": 1396} {"train_loss": -40.053741455078125, "global_step": 168934, "epoch": 1396} {"train_loss": -40.753028869628906, "global_step": 168935, "epoch": 1396} {"train_loss": -40.73542022705078, "global_step": 168936, "epoch": 1396} {"train_loss": -41.32950973510742, "global_step": 168937, "epoch": 1396} {"train_loss": -40.6931266784668, "global_step": 168938, "epoch": 1396} {"train_loss": -39.58938217163086, "global_step": 168939, "epoch": 1396} {"train_loss": -40.26705551147461, "global_step": 168940, "epoch": 1396} {"train_loss": -40.44828414916992, "global_step": 168941, "epoch": 1396} {"train_loss": -39.8175048828125, "global_step": 168942, "epoch": 1396} {"train_loss": -40.51363754272461, "global_step": 168943, "epoch": 1396} {"train_loss": -40.94346237182617, "global_step": 168944, "epoch": 1396} {"train_loss": -40.855342864990234, "global_step": 168945, "epoch": 1396} {"train_loss": -41.024452209472656, "global_step": 168946, "epoch": 1396} {"train_loss": -40.24198532104492, "global_step": 168947, "epoch": 1396} {"train_loss": -40.590248107910156, "global_step": 168948, "epoch": 1396} {"train_loss": -40.199241638183594, "global_step": 168949, "epoch": 1396} {"train_loss": -41.21637725830078, "global_step": 168950, "epoch": 1396} {"train_loss": -40.4001350402832, "global_step": 168951, "epoch": 1396} {"train_loss": -40.870361328125, "global_step": 168952, "epoch": 1396} {"train_loss": -40.415443420410156, "global_step": 168953, "epoch": 1396} {"train_loss": -41.545833587646484, "global_step": 168954, "epoch": 1396} {"train_loss": -41.08735656738281, "global_step": 168955, "epoch": 1396} {"train_loss": -40.7259407043457, "global_step": 168956, "epoch": 1396} {"train_loss": -41.537261962890625, "global_step": 168957, "epoch": 1396} {"train_loss": -40.64289093017578, "global_step": 168958, "epoch": 1396} {"train_loss": -40.80141830444336, "global_step": 168959, "epoch": 1396} {"train_loss": -41.0737419128418, "global_step": 168960, "epoch": 1396} {"train_loss": -40.622894287109375, "global_step": 168961, "epoch": 1396} {"train_loss": -41.034732818603516, "global_step": 168962, "epoch": 1396} {"train_loss": -41.1488151550293, "global_step": 168963, "epoch": 1396} {"train_loss": -41.10187530517578, "global_step": 168964, "epoch": 1396} {"train_loss": -40.60331344604492, "global_step": 168965, "epoch": 1396} {"train_loss": -41.44361877441406, "global_step": 168966, "epoch": 1396} {"train_loss": -41.50001525878906, "global_step": 168967, "epoch": 1396} {"train_loss": -41.01856231689453, "global_step": 168968, "epoch": 1396} {"train_loss": -40.5129508972168, "global_step": 168969, "epoch": 1396} {"train_loss": -40.55011749267578, "global_step": 168970, "epoch": 1396} {"train_loss": -39.220462799072266, "global_step": 168971, "epoch": 1396} {"train_loss": -40.24675369262695, "global_step": 168972, "epoch": 1396} {"train_loss": -37.5620002746582, "global_step": 168973, "epoch": 1396} {"train_loss": -39.2064323425293, "global_step": 168974, "epoch": 1396} {"train_loss": -40.81624984741211, "global_step": 168975, "epoch": 1396} {"train_loss": -40.12599563598633, "global_step": 168976, "epoch": 1396} {"train_loss": -38.824859619140625, "global_step": 168977, "epoch": 1396} {"train_loss": -39.51665115356445, "global_step": 168978, "epoch": 1396} {"train_loss": -39.7271842956543, "global_step": 168979, "epoch": 1396} {"train_loss": -38.323570251464844, "global_step": 168980, "epoch": 1396} {"train_loss": -38.69692611694336, "global_step": 168981, "epoch": 1396} {"train_loss": -39.8958854675293, "global_step": 168982, "epoch": 1396} {"train_loss": -38.825557708740234, "global_step": 168983, "epoch": 1396} {"train_loss": -39.60382843017578, "global_step": 168984, "epoch": 1396} {"train_loss": -40.77392578125, "global_step": 168985, "epoch": 1396} {"train_loss": -40.46369552612305, "global_step": 168986, "epoch": 1396} {"train_loss": -40.74018096923828, "global_step": 168987, "epoch": 1396} {"train_loss": -39.90304946899414, "global_step": 168988, "epoch": 1396} {"train_loss": -40.93933868408203, "global_step": 168989, "epoch": 1396} {"train_loss": -39.99385070800781, "global_step": 168990, "epoch": 1396} {"train_loss": -39.35633087158203, "global_step": 168991, "epoch": 1396} {"train_loss": -39.7901725769043, "global_step": 168992, "epoch": 1396} {"train_loss": -39.96580123901367, "global_step": 168993, "epoch": 1396} {"train_loss": -39.545894622802734, "global_step": 168994, "epoch": 1396} {"train_loss": -38.75413513183594, "global_step": 168995, "epoch": 1396} {"train_loss": -39.706085205078125, "global_step": 168996, "epoch": 1396} {"train_loss": -39.16358947753906, "global_step": 168997, "epoch": 1396} {"train_loss": -38.81765365600586, "global_step": 168998, "epoch": 1396} {"train_loss": -40.398719787597656, "global_step": 168999, "epoch": 1396} {"train_loss": -39.705745697021484, "global_step": 169000, "epoch": 1396} {"train_loss": -40.00079345703125, "global_step": 169001, "epoch": 1396} {"train_loss": -39.85724639892578, "global_step": 169002, "epoch": 1396} {"train_loss": -38.54963684082031, "global_step": 169003, "epoch": 1396} {"train_loss": -40.11577224731445, "global_step": 169004, "epoch": 1396} {"train_loss": -40.5732307434082, "global_step": 169005, "epoch": 1396} {"train_loss": -40.9375, "global_step": 169006, "epoch": 1396} {"train_loss": -39.636573791503906, "global_step": 169007, "epoch": 1396} {"train_loss": -40.02651596069336, "global_step": 169008, "epoch": 1396} {"train_loss": -39.28412628173828, "global_step": 169009, "epoch": 1396} {"train_loss": -40.34929275512695, "global_step": 169010, "epoch": 1396} {"train_loss": -40.309913635253906, "global_step": 169011, "epoch": 1396} {"train_loss": -39.19196701049805, "global_step": 169012, "epoch": 1396} {"train_loss": -39.84946823120117, "global_step": 169013, "epoch": 1396} {"train_loss": -39.81028747558594, "global_step": 169014, "epoch": 1396} {"train_loss": -39.68869400024414, "global_step": 169015, "epoch": 1396} {"train_loss": -40.64529037475586, "global_step": 169016, "epoch": 1396} {"train_loss": -40.5908088684082, "global_step": 169017, "epoch": 1396} {"train_loss": -40.20790481567383, "global_step": 169018, "epoch": 1396} {"train_loss": -40.951934814453125, "global_step": 169019, "epoch": 1396} {"train_loss": -39.5554313659668, "global_step": 169020, "epoch": 1396} {"train_loss": -40.96318435668945, "global_step": 169021, "epoch": 1396} {"train_loss": -40.57133865356445, "global_step": 169022, "epoch": 1396} {"train_loss": -40.44789505004883, "global_step": 169023, "epoch": 1396} {"train_loss": -41.0582275390625, "global_step": 169024, "epoch": 1396} {"train_loss": -40.60805892944336, "global_step": 169025, "epoch": 1396} {"train_loss": -41.37073516845703, "global_step": 169026, "epoch": 1396} {"train_loss": -40.94670486450195, "global_step": 169027, "epoch": 1396} {"train_loss": -40.872711181640625, "global_step": 169028, "epoch": 1396} {"train_loss": -41.022945404052734, "global_step": 169029, "epoch": 1396} {"train_loss": -40.880714416503906, "global_step": 169030, "epoch": 1396} {"train_loss": -40.56713104248047, "global_step": 169031, "epoch": 1396} {"train_loss": -41.22659683227539, "global_step": 169032, "epoch": 1396} {"train_loss": -41.375125885009766, "global_step": 169033, "epoch": 1396} {"train_loss": -41.57833480834961, "global_step": 169034, "epoch": 1396} {"train_loss": -41.37854766845703, "global_step": 169035, "epoch": 1396} {"train_loss": -40.39218571560442, "global_step": 169036, "epoch": 1396, "val_loss": 2659487.25} {"train_loss": -41.11846923828125, "global_step": 169037, "epoch": 1397} {"train_loss": -40.81348419189453, "global_step": 169038, "epoch": 1397} {"train_loss": -41.829471588134766, "global_step": 169039, "epoch": 1397} {"train_loss": -40.684814453125, "global_step": 169040, "epoch": 1397} {"train_loss": -40.23488235473633, "global_step": 169041, "epoch": 1397} {"train_loss": -40.48609161376953, "global_step": 169042, "epoch": 1397} {"train_loss": -41.56926345825195, "global_step": 169043, "epoch": 1397} {"train_loss": -40.44873809814453, "global_step": 169044, "epoch": 1397} {"train_loss": -38.85268783569336, "global_step": 169045, "epoch": 1397} {"train_loss": -40.67203903198242, "global_step": 169046, "epoch": 1397} {"train_loss": -40.14115905761719, "global_step": 169047, "epoch": 1397} {"train_loss": -39.88509750366211, "global_step": 169048, "epoch": 1397} {"train_loss": -39.7061882019043, "global_step": 169049, "epoch": 1397} {"train_loss": -40.965877532958984, "global_step": 169050, "epoch": 1397} {"train_loss": -40.99924850463867, "global_step": 169051, "epoch": 1397} {"train_loss": -39.53430938720703, "global_step": 169052, "epoch": 1397} {"train_loss": -39.243221282958984, "global_step": 169053, "epoch": 1397} {"train_loss": -39.275875091552734, "global_step": 169054, "epoch": 1397} {"train_loss": -40.0802001953125, "global_step": 169055, "epoch": 1397} {"train_loss": -40.93280029296875, "global_step": 169056, "epoch": 1397} {"train_loss": -39.61624526977539, "global_step": 169057, "epoch": 1397} {"train_loss": -39.17116165161133, "global_step": 169058, "epoch": 1397} {"train_loss": -39.51363754272461, "global_step": 169059, "epoch": 1397} {"train_loss": -39.967227935791016, "global_step": 169060, "epoch": 1397} {"train_loss": -40.684242248535156, "global_step": 169061, "epoch": 1397} {"train_loss": -40.480751037597656, "global_step": 169062, "epoch": 1397} {"train_loss": -39.95780563354492, "global_step": 169063, "epoch": 1397} {"train_loss": -39.67423629760742, "global_step": 169064, "epoch": 1397} {"train_loss": -40.99772262573242, "global_step": 169065, "epoch": 1397} {"train_loss": -40.92548370361328, "global_step": 169066, "epoch": 1397} {"train_loss": -40.619110107421875, "global_step": 169067, "epoch": 1397} {"train_loss": -41.344966888427734, "global_step": 169068, "epoch": 1397} {"train_loss": -41.08015060424805, "global_step": 169069, "epoch": 1397} {"train_loss": -41.30549621582031, "global_step": 169070, "epoch": 1397} {"train_loss": -40.8200798034668, "global_step": 169071, "epoch": 1397} {"train_loss": -40.78976058959961, "global_step": 169072, "epoch": 1397} {"train_loss": -40.95186233520508, "global_step": 169073, "epoch": 1397} {"train_loss": -41.51530838012695, "global_step": 169074, "epoch": 1397} {"train_loss": -39.95576858520508, "global_step": 169075, "epoch": 1397} {"train_loss": -40.292022705078125, "global_step": 169076, "epoch": 1397} {"train_loss": -41.05023956298828, "global_step": 169077, "epoch": 1397} {"train_loss": -39.62702178955078, "global_step": 169078, "epoch": 1397} {"train_loss": -39.65645980834961, "global_step": 169079, "epoch": 1397} {"train_loss": -40.551910400390625, "global_step": 169080, "epoch": 1397} {"train_loss": -40.5706787109375, "global_step": 169081, "epoch": 1397} {"train_loss": -39.850093841552734, "global_step": 169082, "epoch": 1397} {"train_loss": -39.306819915771484, "global_step": 169083, "epoch": 1397} {"train_loss": -36.04160690307617, "global_step": 169084, "epoch": 1397} {"train_loss": -38.714332580566406, "global_step": 169085, "epoch": 1397} {"train_loss": -40.898311614990234, "global_step": 169086, "epoch": 1397} {"train_loss": -39.841896057128906, "global_step": 169087, "epoch": 1397} {"train_loss": -39.91167449951172, "global_step": 169088, "epoch": 1397} {"train_loss": -40.19570541381836, "global_step": 169089, "epoch": 1397} {"train_loss": -37.892494201660156, "global_step": 169090, "epoch": 1397} {"train_loss": -38.77994918823242, "global_step": 169091, "epoch": 1397} {"train_loss": -37.41141128540039, "global_step": 169092, "epoch": 1397} {"train_loss": -40.077301025390625, "global_step": 169093, "epoch": 1397} {"train_loss": -38.231868743896484, "global_step": 169094, "epoch": 1397} {"train_loss": -39.80405807495117, "global_step": 169095, "epoch": 1397} {"train_loss": -39.6545524597168, "global_step": 169096, "epoch": 1397} {"train_loss": -38.64657211303711, "global_step": 169097, "epoch": 1397} {"train_loss": -38.69631576538086, "global_step": 169098, "epoch": 1397} {"train_loss": -30.791955947875977, "global_step": 169099, "epoch": 1397} {"train_loss": -37.020931243896484, "global_step": 169100, "epoch": 1397} {"train_loss": -36.434505462646484, "global_step": 169101, "epoch": 1397} {"train_loss": -40.69704055786133, "global_step": 169102, "epoch": 1397} {"train_loss": -38.6049919128418, "global_step": 169103, "epoch": 1397} {"train_loss": -40.16721725463867, "global_step": 169104, "epoch": 1397} {"train_loss": -30.3326358795166, "global_step": 169105, "epoch": 1397} {"train_loss": -33.7202033996582, "global_step": 169106, "epoch": 1397} {"train_loss": -37.06257629394531, "global_step": 169107, "epoch": 1397} {"train_loss": -33.577308654785156, "global_step": 169108, "epoch": 1397} {"train_loss": -39.179683685302734, "global_step": 169109, "epoch": 1397} {"train_loss": -37.554351806640625, "global_step": 169110, "epoch": 1397} {"train_loss": -37.54178237915039, "global_step": 169111, "epoch": 1397} {"train_loss": -36.464725494384766, "global_step": 169112, "epoch": 1397} {"train_loss": -38.13389205932617, "global_step": 169113, "epoch": 1397} {"train_loss": -37.2374382019043, "global_step": 169114, "epoch": 1397} {"train_loss": -38.030860900878906, "global_step": 169115, "epoch": 1397} {"train_loss": -35.531917572021484, "global_step": 169116, "epoch": 1397} {"train_loss": -38.02033615112305, "global_step": 169117, "epoch": 1397} {"train_loss": -37.50919723510742, "global_step": 169118, "epoch": 1397} {"train_loss": -37.26026153564453, "global_step": 169119, "epoch": 1397} {"train_loss": -36.8306999206543, "global_step": 169120, "epoch": 1397} {"train_loss": -39.31742858886719, "global_step": 169121, "epoch": 1397} {"train_loss": -29.544025421142578, "global_step": 169122, "epoch": 1397} {"train_loss": -38.481895446777344, "global_step": 169123, "epoch": 1397} {"train_loss": -30.28912353515625, "global_step": 169124, "epoch": 1397} {"train_loss": -36.523468017578125, "global_step": 169125, "epoch": 1397} {"train_loss": -39.82612991333008, "global_step": 169126, "epoch": 1397} {"train_loss": -35.176124572753906, "global_step": 169127, "epoch": 1397} {"train_loss": -37.56454086303711, "global_step": 169128, "epoch": 1397} {"train_loss": -38.3475456237793, "global_step": 169129, "epoch": 1397} {"train_loss": -39.04396438598633, "global_step": 169130, "epoch": 1397} {"train_loss": -38.09100341796875, "global_step": 169131, "epoch": 1397} {"train_loss": -35.832332611083984, "global_step": 169132, "epoch": 1397} {"train_loss": -37.63003158569336, "global_step": 169133, "epoch": 1397} {"train_loss": -37.824092864990234, "global_step": 169134, "epoch": 1397} {"train_loss": -38.00743865966797, "global_step": 169135, "epoch": 1397} {"train_loss": -37.75526809692383, "global_step": 169136, "epoch": 1397} {"train_loss": -36.398799896240234, "global_step": 169137, "epoch": 1397} {"train_loss": -37.006465911865234, "global_step": 169138, "epoch": 1397} {"train_loss": -37.27546310424805, "global_step": 169139, "epoch": 1397} {"train_loss": -37.98945999145508, "global_step": 169140, "epoch": 1397} {"train_loss": -39.47907638549805, "global_step": 169141, "epoch": 1397} {"train_loss": -38.86550521850586, "global_step": 169142, "epoch": 1397} {"train_loss": -39.15084457397461, "global_step": 169143, "epoch": 1397} {"train_loss": -39.09731674194336, "global_step": 169144, "epoch": 1397} {"train_loss": -37.43431854248047, "global_step": 169145, "epoch": 1397} {"train_loss": -39.216773986816406, "global_step": 169146, "epoch": 1397} {"train_loss": -39.72113037109375, "global_step": 169147, "epoch": 1397} {"train_loss": -39.247982025146484, "global_step": 169148, "epoch": 1397} {"train_loss": -39.3670654296875, "global_step": 169149, "epoch": 1397} {"train_loss": -39.617828369140625, "global_step": 169150, "epoch": 1397} {"train_loss": -39.28622055053711, "global_step": 169151, "epoch": 1397} {"train_loss": -39.244136810302734, "global_step": 169152, "epoch": 1397} {"train_loss": -39.86542892456055, "global_step": 169153, "epoch": 1397} {"train_loss": -39.70685958862305, "global_step": 169154, "epoch": 1397} {"train_loss": -37.42720413208008, "global_step": 169155, "epoch": 1397} {"train_loss": -40.202571868896484, "global_step": 169156, "epoch": 1397} {"train_loss": -38.80059943711462, "global_step": 169157, "epoch": 1397, "val_loss": 2571171.25} {"train_loss": -39.71714401245117, "global_step": 169158, "epoch": 1398} {"train_loss": -38.436485290527344, "global_step": 169159, "epoch": 1398} {"train_loss": -40.09931564331055, "global_step": 169160, "epoch": 1398} {"train_loss": -40.27378463745117, "global_step": 169161, "epoch": 1398} {"train_loss": -39.65095138549805, "global_step": 169162, "epoch": 1398} {"train_loss": -40.02065658569336, "global_step": 169163, "epoch": 1398} {"train_loss": -40.12165451049805, "global_step": 169164, "epoch": 1398} {"train_loss": -40.26264572143555, "global_step": 169165, "epoch": 1398} {"train_loss": -39.47163009643555, "global_step": 169166, "epoch": 1398} {"train_loss": -40.88106155395508, "global_step": 169167, "epoch": 1398} {"train_loss": -38.98362350463867, "global_step": 169168, "epoch": 1398} {"train_loss": -39.5994758605957, "global_step": 169169, "epoch": 1398} {"train_loss": -40.22208786010742, "global_step": 169170, "epoch": 1398} {"train_loss": -39.31209182739258, "global_step": 169171, "epoch": 1398} {"train_loss": -38.892860412597656, "global_step": 169172, "epoch": 1398} {"train_loss": -40.34000778198242, "global_step": 169173, "epoch": 1398} {"train_loss": -39.522377014160156, "global_step": 169174, "epoch": 1398} {"train_loss": -39.79779052734375, "global_step": 169175, "epoch": 1398} {"train_loss": -40.256202697753906, "global_step": 169176, "epoch": 1398} {"train_loss": -38.903724670410156, "global_step": 169177, "epoch": 1398} {"train_loss": -41.17292404174805, "global_step": 169178, "epoch": 1398} {"train_loss": -40.245147705078125, "global_step": 169179, "epoch": 1398} {"train_loss": -40.283077239990234, "global_step": 169180, "epoch": 1398} {"train_loss": -39.91622543334961, "global_step": 169181, "epoch": 1398} {"train_loss": -40.774288177490234, "global_step": 169182, "epoch": 1398} {"train_loss": -40.12201690673828, "global_step": 169183, "epoch": 1398} {"train_loss": -40.33468246459961, "global_step": 169184, "epoch": 1398} {"train_loss": -40.19211959838867, "global_step": 169185, "epoch": 1398} {"train_loss": -40.42950439453125, "global_step": 169186, "epoch": 1398} {"train_loss": -39.4584846496582, "global_step": 169187, "epoch": 1398} {"train_loss": -40.85319137573242, "global_step": 169188, "epoch": 1398} {"train_loss": -40.70156478881836, "global_step": 169189, "epoch": 1398} {"train_loss": -40.42068099975586, "global_step": 169190, "epoch": 1398} {"train_loss": -40.117671966552734, "global_step": 169191, "epoch": 1398} {"train_loss": -39.458560943603516, "global_step": 169192, "epoch": 1398} {"train_loss": -40.52711868286133, "global_step": 169193, "epoch": 1398} {"train_loss": -40.53471755981445, "global_step": 169194, "epoch": 1398} {"train_loss": -40.47941207885742, "global_step": 169195, "epoch": 1398} {"train_loss": -40.99309158325195, "global_step": 169196, "epoch": 1398} {"train_loss": -40.59583282470703, "global_step": 169197, "epoch": 1398} {"train_loss": -40.62839889526367, "global_step": 169198, "epoch": 1398} {"train_loss": -40.3333625793457, "global_step": 169199, "epoch": 1398} {"train_loss": -40.075557708740234, "global_step": 169200, "epoch": 1398} {"train_loss": -39.9121208190918, "global_step": 169201, "epoch": 1398} {"train_loss": -40.42153549194336, "global_step": 169202, "epoch": 1398} {"train_loss": -40.0026741027832, "global_step": 169203, "epoch": 1398} {"train_loss": -41.04390335083008, "global_step": 169204, "epoch": 1398} {"train_loss": -41.00105667114258, "global_step": 169205, "epoch": 1398} {"train_loss": -40.00840377807617, "global_step": 169206, "epoch": 1398} {"train_loss": -39.29254150390625, "global_step": 169207, "epoch": 1398} {"train_loss": -39.525489807128906, "global_step": 169208, "epoch": 1398} {"train_loss": -39.45026397705078, "global_step": 169209, "epoch": 1398} {"train_loss": -41.04813766479492, "global_step": 169210, "epoch": 1398} {"train_loss": -40.715240478515625, "global_step": 169211, "epoch": 1398} {"train_loss": -39.9549674987793, "global_step": 169212, "epoch": 1398} {"train_loss": -38.712890625, "global_step": 169213, "epoch": 1398} {"train_loss": -40.77360153198242, "global_step": 169214, "epoch": 1398} {"train_loss": -40.31757354736328, "global_step": 169215, "epoch": 1398} {"train_loss": -40.228431701660156, "global_step": 169216, "epoch": 1398} {"train_loss": -38.62327575683594, "global_step": 169217, "epoch": 1398} {"train_loss": -39.682010650634766, "global_step": 169218, "epoch": 1398} {"train_loss": -41.09490966796875, "global_step": 169219, "epoch": 1398} {"train_loss": -39.54138946533203, "global_step": 169220, "epoch": 1398} {"train_loss": -37.0579948425293, "global_step": 169221, "epoch": 1398} {"train_loss": -38.48989486694336, "global_step": 169222, "epoch": 1398} {"train_loss": -38.889095306396484, "global_step": 169223, "epoch": 1398} {"train_loss": -41.13070297241211, "global_step": 169224, "epoch": 1398} {"train_loss": -40.01172637939453, "global_step": 169225, "epoch": 1398} {"train_loss": -38.414424896240234, "global_step": 169226, "epoch": 1398} {"train_loss": -34.89364242553711, "global_step": 169227, "epoch": 1398} {"train_loss": -37.8270378112793, "global_step": 169228, "epoch": 1398} {"train_loss": -40.5394287109375, "global_step": 169229, "epoch": 1398} {"train_loss": -38.681251525878906, "global_step": 169230, "epoch": 1398} {"train_loss": -38.493587493896484, "global_step": 169231, "epoch": 1398} {"train_loss": -40.530792236328125, "global_step": 169232, "epoch": 1398} {"train_loss": -39.00008773803711, "global_step": 169233, "epoch": 1398} {"train_loss": -37.09955978393555, "global_step": 169234, "epoch": 1398} {"train_loss": -38.973297119140625, "global_step": 169235, "epoch": 1398} {"train_loss": -38.699073791503906, "global_step": 169236, "epoch": 1398} {"train_loss": -39.26183319091797, "global_step": 169237, "epoch": 1398} {"train_loss": -39.30552291870117, "global_step": 169238, "epoch": 1398} {"train_loss": -38.09595489501953, "global_step": 169239, "epoch": 1398} {"train_loss": -40.99981689453125, "global_step": 169240, "epoch": 1398} {"train_loss": -38.78022003173828, "global_step": 169241, "epoch": 1398} {"train_loss": -37.491214752197266, "global_step": 169242, "epoch": 1398} {"train_loss": -40.003021240234375, "global_step": 169243, "epoch": 1398} {"train_loss": -38.54060745239258, "global_step": 169244, "epoch": 1398} {"train_loss": -39.2069206237793, "global_step": 169245, "epoch": 1398} {"train_loss": -39.36231994628906, "global_step": 169246, "epoch": 1398} {"train_loss": -39.85932540893555, "global_step": 169247, "epoch": 1398} {"train_loss": -38.92776107788086, "global_step": 169248, "epoch": 1398} {"train_loss": -41.047462463378906, "global_step": 169249, "epoch": 1398} {"train_loss": -39.920738220214844, "global_step": 169250, "epoch": 1398} {"train_loss": -40.28092575073242, "global_step": 169251, "epoch": 1398} {"train_loss": -39.747440338134766, "global_step": 169252, "epoch": 1398} {"train_loss": -40.537540435791016, "global_step": 169253, "epoch": 1398} {"train_loss": -40.5749397277832, "global_step": 169254, "epoch": 1398} {"train_loss": -40.17292022705078, "global_step": 169255, "epoch": 1398} {"train_loss": -40.387489318847656, "global_step": 169256, "epoch": 1398} {"train_loss": -39.804718017578125, "global_step": 169257, "epoch": 1398} {"train_loss": -39.214378356933594, "global_step": 169258, "epoch": 1398} {"train_loss": -40.1175422668457, "global_step": 169259, "epoch": 1398} {"train_loss": -39.99764633178711, "global_step": 169260, "epoch": 1398} {"train_loss": -40.222896575927734, "global_step": 169261, "epoch": 1398} {"train_loss": -39.943477630615234, "global_step": 169262, "epoch": 1398} {"train_loss": -40.40614700317383, "global_step": 169263, "epoch": 1398} {"train_loss": -40.81489944458008, "global_step": 169264, "epoch": 1398} {"train_loss": -40.3884391784668, "global_step": 169265, "epoch": 1398} {"train_loss": -40.59478759765625, "global_step": 169266, "epoch": 1398} {"train_loss": -39.87298583984375, "global_step": 169267, "epoch": 1398} {"train_loss": -40.437007904052734, "global_step": 169268, "epoch": 1398} {"train_loss": -39.27729034423828, "global_step": 169269, "epoch": 1398} {"train_loss": -40.490264892578125, "global_step": 169270, "epoch": 1398} {"train_loss": -40.568904876708984, "global_step": 169271, "epoch": 1398} {"train_loss": -40.801029205322266, "global_step": 169272, "epoch": 1398} {"train_loss": -39.672996520996094, "global_step": 169273, "epoch": 1398} {"train_loss": -40.5843391418457, "global_step": 169274, "epoch": 1398} {"train_loss": -41.05642318725586, "global_step": 169275, "epoch": 1398} {"train_loss": -40.66862869262695, "global_step": 169276, "epoch": 1398} {"train_loss": -40.6814079284668, "global_step": 169277, "epoch": 1398} {"train_loss": -39.84955310033373, "global_step": 169278, "epoch": 1398, "val_loss": 2725606.0} {"train_loss": -41.26217269897461, "global_step": 169279, "epoch": 1399} {"train_loss": -41.27356719970703, "global_step": 169280, "epoch": 1399} {"train_loss": -40.86686325073242, "global_step": 169281, "epoch": 1399} {"train_loss": -41.13283920288086, "global_step": 169282, "epoch": 1399} {"train_loss": -40.53436279296875, "global_step": 169283, "epoch": 1399} {"train_loss": -40.038002014160156, "global_step": 169284, "epoch": 1399} {"train_loss": -40.205360412597656, "global_step": 169285, "epoch": 1399} {"train_loss": -40.67641067504883, "global_step": 169286, "epoch": 1399} {"train_loss": -40.85321044921875, "global_step": 169287, "epoch": 1399} {"train_loss": -40.774078369140625, "global_step": 169288, "epoch": 1399} {"train_loss": -38.92938995361328, "global_step": 169289, "epoch": 1399} {"train_loss": -41.07255554199219, "global_step": 169290, "epoch": 1399} {"train_loss": -40.59086227416992, "global_step": 169291, "epoch": 1399} {"train_loss": -40.16878128051758, "global_step": 169292, "epoch": 1399} {"train_loss": -40.609413146972656, "global_step": 169293, "epoch": 1399} {"train_loss": -40.792545318603516, "global_step": 169294, "epoch": 1399} {"train_loss": -40.236568450927734, "global_step": 169295, "epoch": 1399} {"train_loss": -41.47216796875, "global_step": 169296, "epoch": 1399} {"train_loss": -40.20586395263672, "global_step": 169297, "epoch": 1399} {"train_loss": -40.815940856933594, "global_step": 169298, "epoch": 1399} {"train_loss": -41.168067932128906, "global_step": 169299, "epoch": 1399} {"train_loss": -40.811614990234375, "global_step": 169300, "epoch": 1399} {"train_loss": -41.194427490234375, "global_step": 169301, "epoch": 1399} {"train_loss": -41.02939987182617, "global_step": 169302, "epoch": 1399} {"train_loss": -40.64603042602539, "global_step": 169303, "epoch": 1399} {"train_loss": -41.27886199951172, "global_step": 169304, "epoch": 1399} {"train_loss": -41.022369384765625, "global_step": 169305, "epoch": 1399} {"train_loss": -40.85017013549805, "global_step": 169306, "epoch": 1399} {"train_loss": -40.805294036865234, "global_step": 169307, "epoch": 1399} {"train_loss": -40.58167266845703, "global_step": 169308, "epoch": 1399} {"train_loss": -41.48185348510742, "global_step": 169309, "epoch": 1399} {"train_loss": -41.274112701416016, "global_step": 169310, "epoch": 1399} {"train_loss": -40.60120391845703, "global_step": 169311, "epoch": 1399} {"train_loss": -40.425994873046875, "global_step": 169312, "epoch": 1399} {"train_loss": -41.693077087402344, "global_step": 169313, "epoch": 1399} {"train_loss": -39.9631462097168, "global_step": 169314, "epoch": 1399} {"train_loss": -40.87971115112305, "global_step": 169315, "epoch": 1399} {"train_loss": -41.12101364135742, "global_step": 169316, "epoch": 1399} {"train_loss": -41.51682662963867, "global_step": 169317, "epoch": 1399} {"train_loss": -41.310054779052734, "global_step": 169318, "epoch": 1399} {"train_loss": -40.725830078125, "global_step": 169319, "epoch": 1399} {"train_loss": -40.607398986816406, "global_step": 169320, "epoch": 1399} {"train_loss": -40.52349853515625, "global_step": 169321, "epoch": 1399} {"train_loss": -40.88039779663086, "global_step": 169322, "epoch": 1399} {"train_loss": -41.09842300415039, "global_step": 169323, "epoch": 1399} {"train_loss": -40.60154342651367, "global_step": 169324, "epoch": 1399} {"train_loss": -40.6067008972168, "global_step": 169325, "epoch": 1399} {"train_loss": -41.54702377319336, "global_step": 169326, "epoch": 1399} {"train_loss": -39.886104583740234, "global_step": 169327, "epoch": 1399} {"train_loss": -38.49378967285156, "global_step": 169328, "epoch": 1399} {"train_loss": -38.444908142089844, "global_step": 169329, "epoch": 1399} {"train_loss": -37.485469818115234, "global_step": 169330, "epoch": 1399} {"train_loss": -38.19852066040039, "global_step": 169331, "epoch": 1399} {"train_loss": -41.217803955078125, "global_step": 169332, "epoch": 1399} {"train_loss": -40.428890228271484, "global_step": 169333, "epoch": 1399} {"train_loss": -39.08085250854492, "global_step": 169334, "epoch": 1399} {"train_loss": -39.4672737121582, "global_step": 169335, "epoch": 1399} {"train_loss": -40.77126693725586, "global_step": 169336, "epoch": 1399} {"train_loss": -38.213680267333984, "global_step": 169337, "epoch": 1399} {"train_loss": -36.890174865722656, "global_step": 169338, "epoch": 1399} {"train_loss": -40.08735275268555, "global_step": 169339, "epoch": 1399} {"train_loss": -41.221954345703125, "global_step": 169340, "epoch": 1399} {"train_loss": -40.701602935791016, "global_step": 169341, "epoch": 1399} {"train_loss": -40.450538635253906, "global_step": 169342, "epoch": 1399} {"train_loss": -39.79169845581055, "global_step": 169343, "epoch": 1399} {"train_loss": -40.74740219116211, "global_step": 169344, "epoch": 1399} {"train_loss": -40.08807373046875, "global_step": 169345, "epoch": 1399} {"train_loss": -40.713436126708984, "global_step": 169346, "epoch": 1399} {"train_loss": -40.29983901977539, "global_step": 169347, "epoch": 1399} {"train_loss": -39.97286605834961, "global_step": 169348, "epoch": 1399} {"train_loss": -38.85184860229492, "global_step": 169349, "epoch": 1399} {"train_loss": -39.97394943237305, "global_step": 169350, "epoch": 1399} {"train_loss": -40.132686614990234, "global_step": 169351, "epoch": 1399} {"train_loss": -40.00379943847656, "global_step": 169352, "epoch": 1399} {"train_loss": -38.74195098876953, "global_step": 169353, "epoch": 1399} {"train_loss": -39.76975631713867, "global_step": 169354, "epoch": 1399} {"train_loss": -41.164825439453125, "global_step": 169355, "epoch": 1399} {"train_loss": -40.193965911865234, "global_step": 169356, "epoch": 1399} {"train_loss": -38.584205627441406, "global_step": 169357, "epoch": 1399} {"train_loss": -39.90754699707031, "global_step": 169358, "epoch": 1399} {"train_loss": -40.585811614990234, "global_step": 169359, "epoch": 1399} {"train_loss": -40.07294845581055, "global_step": 169360, "epoch": 1399} {"train_loss": -40.52022933959961, "global_step": 169361, "epoch": 1399} {"train_loss": -41.4564323425293, "global_step": 169362, "epoch": 1399} {"train_loss": -40.13656234741211, "global_step": 169363, "epoch": 1399} {"train_loss": -40.079776763916016, "global_step": 169364, "epoch": 1399} {"train_loss": -41.04126739501953, "global_step": 169365, "epoch": 1399} {"train_loss": -40.430416107177734, "global_step": 169366, "epoch": 1399} {"train_loss": -40.66571044921875, "global_step": 169367, "epoch": 1399} {"train_loss": -40.899559020996094, "global_step": 169368, "epoch": 1399} {"train_loss": -39.728519439697266, "global_step": 169369, "epoch": 1399} {"train_loss": -40.65586471557617, "global_step": 169370, "epoch": 1399} {"train_loss": -40.31678009033203, "global_step": 169371, "epoch": 1399} {"train_loss": -39.70744323730469, "global_step": 169372, "epoch": 1399} {"train_loss": -40.53289794921875, "global_step": 169373, "epoch": 1399} {"train_loss": -39.97394943237305, "global_step": 169374, "epoch": 1399} {"train_loss": -40.482906341552734, "global_step": 169375, "epoch": 1399} {"train_loss": -40.6911506652832, "global_step": 169376, "epoch": 1399} {"train_loss": -40.561805725097656, "global_step": 169377, "epoch": 1399} {"train_loss": -40.656005859375, "global_step": 169378, "epoch": 1399} {"train_loss": -40.651729583740234, "global_step": 169379, "epoch": 1399} {"train_loss": -39.464752197265625, "global_step": 169380, "epoch": 1399} {"train_loss": -40.47090530395508, "global_step": 169381, "epoch": 1399} {"train_loss": -40.383880615234375, "global_step": 169382, "epoch": 1399} {"train_loss": -39.07874298095703, "global_step": 169383, "epoch": 1399} {"train_loss": -40.766143798828125, "global_step": 169384, "epoch": 1399} {"train_loss": -40.23466491699219, "global_step": 169385, "epoch": 1399} {"train_loss": -39.76215744018555, "global_step": 169386, "epoch": 1399} {"train_loss": -40.98379898071289, "global_step": 169387, "epoch": 1399} {"train_loss": -40.59343338012695, "global_step": 169388, "epoch": 1399} {"train_loss": -40.21370315551758, "global_step": 169389, "epoch": 1399} {"train_loss": -40.305267333984375, "global_step": 169390, "epoch": 1399} {"train_loss": -40.366207122802734, "global_step": 169391, "epoch": 1399} {"train_loss": -40.92198944091797, "global_step": 169392, "epoch": 1399} {"train_loss": -40.724647521972656, "global_step": 169393, "epoch": 1399} {"train_loss": -41.501407623291016, "global_step": 169394, "epoch": 1399} {"train_loss": -41.456764221191406, "global_step": 169395, "epoch": 1399} {"train_loss": -40.35874938964844, "global_step": 169396, "epoch": 1399} {"train_loss": -41.558624267578125, "global_step": 169397, "epoch": 1399} {"train_loss": -39.78007507324219, "global_step": 169398, "epoch": 1399} {"train_loss": -40.39241049900528, "global_step": 169399, "epoch": 1399, "val_loss": 2703426.0} {"train_loss": -41.39921569824219, "global_step": 169400, "epoch": 1400} {"train_loss": -40.93073654174805, "global_step": 169401, "epoch": 1400} {"train_loss": -41.993385314941406, "global_step": 169402, "epoch": 1400} {"train_loss": -41.198299407958984, "global_step": 169403, "epoch": 1400} {"train_loss": -41.73659133911133, "global_step": 169404, "epoch": 1400} {"train_loss": -40.90537643432617, "global_step": 169405, "epoch": 1400} {"train_loss": -40.32395935058594, "global_step": 169406, "epoch": 1400} {"train_loss": -41.02082061767578, "global_step": 169407, "epoch": 1400} {"train_loss": -40.21792221069336, "global_step": 169408, "epoch": 1400} {"train_loss": -41.14760971069336, "global_step": 169409, "epoch": 1400} {"train_loss": -41.6794319152832, "global_step": 169410, "epoch": 1400} {"train_loss": -39.42952346801758, "global_step": 169411, "epoch": 1400} {"train_loss": -41.018218994140625, "global_step": 169412, "epoch": 1400} {"train_loss": -40.966976165771484, "global_step": 169413, "epoch": 1400} {"train_loss": -41.257354736328125, "global_step": 169414, "epoch": 1400} {"train_loss": -40.37339401245117, "global_step": 169415, "epoch": 1400} {"train_loss": -41.2665901184082, "global_step": 169416, "epoch": 1400} {"train_loss": -41.655372619628906, "global_step": 169417, "epoch": 1400} {"train_loss": -41.286190032958984, "global_step": 169418, "epoch": 1400} {"train_loss": -40.928741455078125, "global_step": 169419, "epoch": 1400} {"train_loss": -40.27260971069336, "global_step": 169420, "epoch": 1400} {"train_loss": -41.62533187866211, "global_step": 169421, "epoch": 1400} {"train_loss": -41.162899017333984, "global_step": 169422, "epoch": 1400} {"train_loss": -40.821834564208984, "global_step": 169423, "epoch": 1400} {"train_loss": -41.08138656616211, "global_step": 169424, "epoch": 1400} {"train_loss": -41.14982604980469, "global_step": 169425, "epoch": 1400} {"train_loss": -40.527400970458984, "global_step": 169426, "epoch": 1400} {"train_loss": -41.37501907348633, "global_step": 169427, "epoch": 1400} {"train_loss": -41.20789337158203, "global_step": 169428, "epoch": 1400} {"train_loss": -39.65232467651367, "global_step": 169429, "epoch": 1400} {"train_loss": -37.850250244140625, "global_step": 169430, "epoch": 1400} {"train_loss": -33.88249588012695, "global_step": 169431, "epoch": 1400} {"train_loss": -31.98967933654785, "global_step": 169432, "epoch": 1400} {"train_loss": -32.190399169921875, "global_step": 169433, "epoch": 1400} {"train_loss": -33.793514251708984, "global_step": 169434, "epoch": 1400} {"train_loss": -36.71732711791992, "global_step": 169435, "epoch": 1400} {"train_loss": -40.71992492675781, "global_step": 169436, "epoch": 1400} {"train_loss": -39.193843841552734, "global_step": 169437, "epoch": 1400} {"train_loss": -39.404144287109375, "global_step": 169438, "epoch": 1400} {"train_loss": -39.98612976074219, "global_step": 169439, "epoch": 1400} {"train_loss": -40.338863372802734, "global_step": 169440, "epoch": 1400} {"train_loss": -40.552764892578125, "global_step": 169441, "epoch": 1400} {"train_loss": -39.80104064941406, "global_step": 169442, "epoch": 1400} {"train_loss": -41.12069320678711, "global_step": 169443, "epoch": 1400} {"train_loss": -40.970699310302734, "global_step": 169444, "epoch": 1400} {"train_loss": -40.92661666870117, "global_step": 169445, "epoch": 1400} {"train_loss": -41.1423454284668, "global_step": 169446, "epoch": 1400} {"train_loss": -40.311317443847656, "global_step": 169447, "epoch": 1400} {"train_loss": -41.16199493408203, "global_step": 169448, "epoch": 1400} {"train_loss": -41.53782272338867, "global_step": 169449, "epoch": 1400} {"train_loss": -40.77096176147461, "global_step": 169450, "epoch": 1400} {"train_loss": -41.52265548706055, "global_step": 169451, "epoch": 1400} {"train_loss": -41.19270706176758, "global_step": 169452, "epoch": 1400} {"train_loss": -41.09391403198242, "global_step": 169453, "epoch": 1400} {"train_loss": -41.50092697143555, "global_step": 169454, "epoch": 1400} {"train_loss": -41.27988815307617, "global_step": 169455, "epoch": 1400} {"train_loss": -41.20719528198242, "global_step": 169456, "epoch": 1400} {"train_loss": -41.7194938659668, "global_step": 169457, "epoch": 1400} {"train_loss": -41.29902648925781, "global_step": 169458, "epoch": 1400} {"train_loss": -40.99060821533203, "global_step": 169459, "epoch": 1400} {"train_loss": -41.63120651245117, "global_step": 169460, "epoch": 1400} {"train_loss": -41.12852096557617, "global_step": 169461, "epoch": 1400} {"train_loss": -41.50456619262695, "global_step": 169462, "epoch": 1400} {"train_loss": -41.527374267578125, "global_step": 169463, "epoch": 1400} {"train_loss": -41.51192855834961, "global_step": 169464, "epoch": 1400} {"train_loss": -41.51093292236328, "global_step": 169465, "epoch": 1400} {"train_loss": -41.41730499267578, "global_step": 169466, "epoch": 1400} {"train_loss": -40.2148551940918, "global_step": 169467, "epoch": 1400} {"train_loss": -38.37693405151367, "global_step": 169468, "epoch": 1400} {"train_loss": -41.43878936767578, "global_step": 169469, "epoch": 1400} {"train_loss": -40.90712356567383, "global_step": 169470, "epoch": 1400} {"train_loss": -39.758201599121094, "global_step": 169471, "epoch": 1400} {"train_loss": -40.469635009765625, "global_step": 169472, "epoch": 1400} {"train_loss": -41.05596923828125, "global_step": 169473, "epoch": 1400} {"train_loss": -38.706581115722656, "global_step": 169474, "epoch": 1400} {"train_loss": -38.57327651977539, "global_step": 169475, "epoch": 1400} {"train_loss": -41.05605697631836, "global_step": 169476, "epoch": 1400} {"train_loss": -40.58881759643555, "global_step": 169477, "epoch": 1400} {"train_loss": -39.72406768798828, "global_step": 169478, "epoch": 1400} {"train_loss": -41.17778778076172, "global_step": 169479, "epoch": 1400} {"train_loss": -39.14094924926758, "global_step": 169480, "epoch": 1400} {"train_loss": -40.042259216308594, "global_step": 169481, "epoch": 1400} {"train_loss": -38.80677795410156, "global_step": 169482, "epoch": 1400} {"train_loss": -38.90699005126953, "global_step": 169483, "epoch": 1400} {"train_loss": -40.350643157958984, "global_step": 169484, "epoch": 1400} {"train_loss": -38.74653625488281, "global_step": 169485, "epoch": 1400} {"train_loss": -40.14629364013672, "global_step": 169486, "epoch": 1400} {"train_loss": -40.1809196472168, "global_step": 169487, "epoch": 1400} {"train_loss": -39.31249237060547, "global_step": 169488, "epoch": 1400} {"train_loss": -38.79193115234375, "global_step": 169489, "epoch": 1400} {"train_loss": -40.17418670654297, "global_step": 169490, "epoch": 1400} {"train_loss": -37.413997650146484, "global_step": 169491, "epoch": 1400} {"train_loss": -40.63721466064453, "global_step": 169492, "epoch": 1400} {"train_loss": -39.3748893737793, "global_step": 169493, "epoch": 1400} {"train_loss": -40.30708694458008, "global_step": 169494, "epoch": 1400} {"train_loss": -39.83333969116211, "global_step": 169495, "epoch": 1400} {"train_loss": -39.0951042175293, "global_step": 169496, "epoch": 1400} {"train_loss": -39.84220886230469, "global_step": 169497, "epoch": 1400} {"train_loss": -38.27796173095703, "global_step": 169498, "epoch": 1400} {"train_loss": -40.55385208129883, "global_step": 169499, "epoch": 1400} {"train_loss": -38.70707321166992, "global_step": 169500, "epoch": 1400} {"train_loss": -39.68153762817383, "global_step": 169501, "epoch": 1400} {"train_loss": -38.33165740966797, "global_step": 169502, "epoch": 1400} {"train_loss": -39.788536071777344, "global_step": 169503, "epoch": 1400} {"train_loss": -38.270790100097656, "global_step": 169504, "epoch": 1400} {"train_loss": -40.7886962890625, "global_step": 169505, "epoch": 1400} {"train_loss": -39.929962158203125, "global_step": 169506, "epoch": 1400} {"train_loss": -39.88078689575195, "global_step": 169507, "epoch": 1400} {"train_loss": -40.04471969604492, "global_step": 169508, "epoch": 1400} {"train_loss": -40.04698181152344, "global_step": 169509, "epoch": 1400} {"train_loss": -40.025882720947266, "global_step": 169510, "epoch": 1400} {"train_loss": -41.13078308105469, "global_step": 169511, "epoch": 1400} {"train_loss": -40.44842529296875, "global_step": 169512, "epoch": 1400} {"train_loss": -40.72190475463867, "global_step": 169513, "epoch": 1400} {"train_loss": -40.07463836669922, "global_step": 169514, "epoch": 1400} {"train_loss": -40.315670013427734, "global_step": 169515, "epoch": 1400} {"train_loss": -40.97939682006836, "global_step": 169516, "epoch": 1400} {"train_loss": -41.08466339111328, "global_step": 169517, "epoch": 1400} {"train_loss": -40.21369171142578, "global_step": 169518, "epoch": 1400} {"train_loss": -40.700130462646484, "global_step": 169519, "epoch": 1400} {"train_loss": -40.15979071688061, "global_step": 169520, "epoch": 1400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2789746.0} {"train_loss": -40.321163177490234, "global_step": 169521, "epoch": 1401} {"train_loss": -40.48154830932617, "global_step": 169522, "epoch": 1401} {"train_loss": -38.206939697265625, "global_step": 169523, "epoch": 1401} {"train_loss": -38.469512939453125, "global_step": 169524, "epoch": 1401} {"train_loss": -39.905311584472656, "global_step": 169525, "epoch": 1401} {"train_loss": -40.123294830322266, "global_step": 169526, "epoch": 1401} {"train_loss": -39.20785903930664, "global_step": 169527, "epoch": 1401} {"train_loss": -38.589149475097656, "global_step": 169528, "epoch": 1401} {"train_loss": -39.80473709106445, "global_step": 169529, "epoch": 1401} {"train_loss": -39.818267822265625, "global_step": 169530, "epoch": 1401} {"train_loss": -38.24073028564453, "global_step": 169531, "epoch": 1401} {"train_loss": -35.15044021606445, "global_step": 169532, "epoch": 1401} {"train_loss": -39.32585525512695, "global_step": 169533, "epoch": 1401} {"train_loss": -38.02330780029297, "global_step": 169534, "epoch": 1401} {"train_loss": -39.83237838745117, "global_step": 169535, "epoch": 1401} {"train_loss": -38.80562973022461, "global_step": 169536, "epoch": 1401} {"train_loss": -40.05493927001953, "global_step": 169537, "epoch": 1401} {"train_loss": -40.58942794799805, "global_step": 169538, "epoch": 1401} {"train_loss": -40.110408782958984, "global_step": 169539, "epoch": 1401} {"train_loss": -40.56050491333008, "global_step": 169540, "epoch": 1401} {"train_loss": -40.07500076293945, "global_step": 169541, "epoch": 1401} {"train_loss": -39.60883712768555, "global_step": 169542, "epoch": 1401} {"train_loss": -38.76813888549805, "global_step": 169543, "epoch": 1401} {"train_loss": -40.71413040161133, "global_step": 169544, "epoch": 1401} {"train_loss": -40.16963577270508, "global_step": 169545, "epoch": 1401} {"train_loss": -32.47535705566406, "global_step": 169546, "epoch": 1401} {"train_loss": -39.41925811767578, "global_step": 169547, "epoch": 1401} {"train_loss": -39.9642448425293, "global_step": 169548, "epoch": 1401} {"train_loss": -38.17975616455078, "global_step": 169549, "epoch": 1401} {"train_loss": -37.22978591918945, "global_step": 169550, "epoch": 1401} {"train_loss": -39.56661605834961, "global_step": 169551, "epoch": 1401} {"train_loss": -40.47126388549805, "global_step": 169552, "epoch": 1401} {"train_loss": -39.6136589050293, "global_step": 169553, "epoch": 1401} {"train_loss": -40.03904724121094, "global_step": 169554, "epoch": 1401} {"train_loss": -39.988372802734375, "global_step": 169555, "epoch": 1401} {"train_loss": -38.772682189941406, "global_step": 169556, "epoch": 1401} {"train_loss": -39.894264221191406, "global_step": 169557, "epoch": 1401} {"train_loss": -38.760799407958984, "global_step": 169558, "epoch": 1401} {"train_loss": -40.45087432861328, "global_step": 169559, "epoch": 1401} {"train_loss": -39.975013732910156, "global_step": 169560, "epoch": 1401} {"train_loss": -39.67832565307617, "global_step": 169561, "epoch": 1401} {"train_loss": -40.13433837890625, "global_step": 169562, "epoch": 1401} {"train_loss": -39.26457595825195, "global_step": 169563, "epoch": 1401} {"train_loss": -37.96421432495117, "global_step": 169564, "epoch": 1401} {"train_loss": -39.70622634887695, "global_step": 169565, "epoch": 1401} {"train_loss": -39.383155822753906, "global_step": 169566, "epoch": 1401} {"train_loss": -36.71512985229492, "global_step": 169567, "epoch": 1401} {"train_loss": -37.71555709838867, "global_step": 169568, "epoch": 1401} {"train_loss": -39.67634201049805, "global_step": 169569, "epoch": 1401} {"train_loss": -38.85247802734375, "global_step": 169570, "epoch": 1401} {"train_loss": -38.908634185791016, "global_step": 169571, "epoch": 1401} {"train_loss": -39.87704086303711, "global_step": 169572, "epoch": 1401} {"train_loss": -39.493553161621094, "global_step": 169573, "epoch": 1401} {"train_loss": -39.68209457397461, "global_step": 169574, "epoch": 1401} {"train_loss": -40.73727035522461, "global_step": 169575, "epoch": 1401} {"train_loss": -38.88362121582031, "global_step": 169576, "epoch": 1401} {"train_loss": -39.07071304321289, "global_step": 169577, "epoch": 1401} {"train_loss": -39.06758499145508, "global_step": 169578, "epoch": 1401} {"train_loss": -39.59988021850586, "global_step": 169579, "epoch": 1401} {"train_loss": -39.42966842651367, "global_step": 169580, "epoch": 1401} {"train_loss": -39.748382568359375, "global_step": 169581, "epoch": 1401} {"train_loss": -37.76609420776367, "global_step": 169582, "epoch": 1401} {"train_loss": -39.0007438659668, "global_step": 169583, "epoch": 1401} {"train_loss": -40.03828811645508, "global_step": 169584, "epoch": 1401} {"train_loss": -40.1507453918457, "global_step": 169585, "epoch": 1401} {"train_loss": -39.4470329284668, "global_step": 169586, "epoch": 1401} {"train_loss": -40.248023986816406, "global_step": 169587, "epoch": 1401} {"train_loss": -38.66332244873047, "global_step": 169588, "epoch": 1401} {"train_loss": -39.7227897644043, "global_step": 169589, "epoch": 1401} {"train_loss": -39.812129974365234, "global_step": 169590, "epoch": 1401} {"train_loss": -39.58107376098633, "global_step": 169591, "epoch": 1401} {"train_loss": -38.416297912597656, "global_step": 169592, "epoch": 1401} {"train_loss": -39.711605072021484, "global_step": 169593, "epoch": 1401} {"train_loss": -38.82611083984375, "global_step": 169594, "epoch": 1401} {"train_loss": -38.46670913696289, "global_step": 169595, "epoch": 1401} {"train_loss": -38.62516403198242, "global_step": 169596, "epoch": 1401} {"train_loss": -39.09613800048828, "global_step": 169597, "epoch": 1401} {"train_loss": -38.23850631713867, "global_step": 169598, "epoch": 1401} {"train_loss": -39.27272415161133, "global_step": 169599, "epoch": 1401} {"train_loss": -39.44883728027344, "global_step": 169600, "epoch": 1401} {"train_loss": -38.797462463378906, "global_step": 169601, "epoch": 1401} {"train_loss": -39.35182571411133, "global_step": 169602, "epoch": 1401} {"train_loss": -39.00769805908203, "global_step": 169603, "epoch": 1401} {"train_loss": -39.33127212524414, "global_step": 169604, "epoch": 1401} {"train_loss": -39.152618408203125, "global_step": 169605, "epoch": 1401} {"train_loss": -39.96647262573242, "global_step": 169606, "epoch": 1401} {"train_loss": -40.29057312011719, "global_step": 169607, "epoch": 1401} {"train_loss": -40.14594650268555, "global_step": 169608, "epoch": 1401} {"train_loss": -39.298641204833984, "global_step": 169609, "epoch": 1401} {"train_loss": -39.9609260559082, "global_step": 169610, "epoch": 1401} {"train_loss": -39.86503219604492, "global_step": 169611, "epoch": 1401} {"train_loss": -40.065120697021484, "global_step": 169612, "epoch": 1401} {"train_loss": -38.46224594116211, "global_step": 169613, "epoch": 1401} {"train_loss": -40.178070068359375, "global_step": 169614, "epoch": 1401} {"train_loss": -40.12939453125, "global_step": 169615, "epoch": 1401} {"train_loss": -40.03658676147461, "global_step": 169616, "epoch": 1401} {"train_loss": -38.360897064208984, "global_step": 169617, "epoch": 1401} {"train_loss": -39.628265380859375, "global_step": 169618, "epoch": 1401} {"train_loss": -40.30353927612305, "global_step": 169619, "epoch": 1401} {"train_loss": -38.709449768066406, "global_step": 169620, "epoch": 1401} {"train_loss": -40.51914596557617, "global_step": 169621, "epoch": 1401} {"train_loss": -39.91291427612305, "global_step": 169622, "epoch": 1401} {"train_loss": -40.00896072387695, "global_step": 169623, "epoch": 1401} {"train_loss": -40.017127990722656, "global_step": 169624, "epoch": 1401} {"train_loss": -40.432857513427734, "global_step": 169625, "epoch": 1401} {"train_loss": -40.159278869628906, "global_step": 169626, "epoch": 1401} {"train_loss": -40.28895950317383, "global_step": 169627, "epoch": 1401} {"train_loss": -40.234779357910156, "global_step": 169628, "epoch": 1401} {"train_loss": -40.2805290222168, "global_step": 169629, "epoch": 1401} {"train_loss": -40.94462203979492, "global_step": 169630, "epoch": 1401} {"train_loss": -40.86078643798828, "global_step": 169631, "epoch": 1401} {"train_loss": -40.32174301147461, "global_step": 169632, "epoch": 1401} {"train_loss": -41.2007942199707, "global_step": 169633, "epoch": 1401} {"train_loss": -40.91791915893555, "global_step": 169634, "epoch": 1401} {"train_loss": -40.992401123046875, "global_step": 169635, "epoch": 1401} {"train_loss": -41.05986022949219, "global_step": 169636, "epoch": 1401} {"train_loss": -40.33945846557617, "global_step": 169637, "epoch": 1401} {"train_loss": -40.71821212768555, "global_step": 169638, "epoch": 1401} {"train_loss": -40.707088470458984, "global_step": 169639, "epoch": 1401} {"train_loss": -40.641170501708984, "global_step": 169640, "epoch": 1401} {"train_loss": -39.50352604133038, "global_step": 169641, "epoch": 1401, "val_loss": 2640056.75} {"train_loss": -41.302494049072266, "global_step": 169642, "epoch": 1402} {"train_loss": -40.73860549926758, "global_step": 169643, "epoch": 1402} {"train_loss": -41.27167510986328, "global_step": 169644, "epoch": 1402} {"train_loss": -40.80526351928711, "global_step": 169645, "epoch": 1402} {"train_loss": -41.1638069152832, "global_step": 169646, "epoch": 1402} {"train_loss": -41.15509033203125, "global_step": 169647, "epoch": 1402} {"train_loss": -40.7791633605957, "global_step": 169648, "epoch": 1402} {"train_loss": -41.18793869018555, "global_step": 169649, "epoch": 1402} {"train_loss": -40.59246063232422, "global_step": 169650, "epoch": 1402} {"train_loss": -41.02692794799805, "global_step": 169651, "epoch": 1402} {"train_loss": -40.67637634277344, "global_step": 169652, "epoch": 1402} {"train_loss": -40.772682189941406, "global_step": 169653, "epoch": 1402} {"train_loss": -38.2927131652832, "global_step": 169654, "epoch": 1402} {"train_loss": -41.16373062133789, "global_step": 169655, "epoch": 1402} {"train_loss": -39.62617111206055, "global_step": 169656, "epoch": 1402} {"train_loss": -41.322242736816406, "global_step": 169657, "epoch": 1402} {"train_loss": -39.94032669067383, "global_step": 169658, "epoch": 1402} {"train_loss": -40.79513168334961, "global_step": 169659, "epoch": 1402} {"train_loss": -39.7479362487793, "global_step": 169660, "epoch": 1402} {"train_loss": -38.82551574707031, "global_step": 169661, "epoch": 1402} {"train_loss": -35.01729965209961, "global_step": 169662, "epoch": 1402} {"train_loss": -33.06827926635742, "global_step": 169663, "epoch": 1402} {"train_loss": -35.55644607543945, "global_step": 169664, "epoch": 1402} {"train_loss": -39.45558547973633, "global_step": 169665, "epoch": 1402} {"train_loss": -38.662784576416016, "global_step": 169666, "epoch": 1402} {"train_loss": -38.71366882324219, "global_step": 169667, "epoch": 1402} {"train_loss": -38.507083892822266, "global_step": 169668, "epoch": 1402} {"train_loss": -39.0286750793457, "global_step": 169669, "epoch": 1402} {"train_loss": -39.15573501586914, "global_step": 169670, "epoch": 1402} {"train_loss": -40.269344329833984, "global_step": 169671, "epoch": 1402} {"train_loss": -39.74536895751953, "global_step": 169672, "epoch": 1402} {"train_loss": -39.04042434692383, "global_step": 169673, "epoch": 1402} {"train_loss": -39.39165115356445, "global_step": 169674, "epoch": 1402} {"train_loss": -40.84209060668945, "global_step": 169675, "epoch": 1402} {"train_loss": -38.56721878051758, "global_step": 169676, "epoch": 1402} {"train_loss": -40.036659240722656, "global_step": 169677, "epoch": 1402} {"train_loss": -39.58295822143555, "global_step": 169678, "epoch": 1402} {"train_loss": -38.88545608520508, "global_step": 169679, "epoch": 1402} {"train_loss": -39.89046859741211, "global_step": 169680, "epoch": 1402} {"train_loss": -39.847023010253906, "global_step": 169681, "epoch": 1402} {"train_loss": -40.301448822021484, "global_step": 169682, "epoch": 1402} {"train_loss": -39.62605667114258, "global_step": 169683, "epoch": 1402} {"train_loss": -38.84242630004883, "global_step": 169684, "epoch": 1402} {"train_loss": -40.534114837646484, "global_step": 169685, "epoch": 1402} {"train_loss": -40.21533966064453, "global_step": 169686, "epoch": 1402} {"train_loss": -39.36651611328125, "global_step": 169687, "epoch": 1402} {"train_loss": -38.10982894897461, "global_step": 169688, "epoch": 1402} {"train_loss": -39.128089904785156, "global_step": 169689, "epoch": 1402} {"train_loss": -40.000667572021484, "global_step": 169690, "epoch": 1402} {"train_loss": -38.318878173828125, "global_step": 169691, "epoch": 1402} {"train_loss": -40.007606506347656, "global_step": 169692, "epoch": 1402} {"train_loss": -39.859718322753906, "global_step": 169693, "epoch": 1402} {"train_loss": -36.84650802612305, "global_step": 169694, "epoch": 1402} {"train_loss": -38.81023025512695, "global_step": 169695, "epoch": 1402} {"train_loss": -38.02459716796875, "global_step": 169696, "epoch": 1402} {"train_loss": -38.049556732177734, "global_step": 169697, "epoch": 1402} {"train_loss": -39.30949401855469, "global_step": 169698, "epoch": 1402} {"train_loss": -38.443023681640625, "global_step": 169699, "epoch": 1402} {"train_loss": -38.42649841308594, "global_step": 169700, "epoch": 1402} {"train_loss": -39.70307159423828, "global_step": 169701, "epoch": 1402} {"train_loss": -38.82173538208008, "global_step": 169702, "epoch": 1402} {"train_loss": -33.92475509643555, "global_step": 169703, "epoch": 1402} {"train_loss": -40.418514251708984, "global_step": 169704, "epoch": 1402} {"train_loss": -37.41895294189453, "global_step": 169705, "epoch": 1402} {"train_loss": -39.12400436401367, "global_step": 169706, "epoch": 1402} {"train_loss": -39.077083587646484, "global_step": 169707, "epoch": 1402} {"train_loss": -38.39365768432617, "global_step": 169708, "epoch": 1402} {"train_loss": -38.7815055847168, "global_step": 169709, "epoch": 1402} {"train_loss": -38.5920524597168, "global_step": 169710, "epoch": 1402} {"train_loss": -39.39332962036133, "global_step": 169711, "epoch": 1402} {"train_loss": -38.863075256347656, "global_step": 169712, "epoch": 1402} {"train_loss": -36.7258415222168, "global_step": 169713, "epoch": 1402} {"train_loss": -39.60598373413086, "global_step": 169714, "epoch": 1402} {"train_loss": -38.329158782958984, "global_step": 169715, "epoch": 1402} {"train_loss": -39.11880111694336, "global_step": 169716, "epoch": 1402} {"train_loss": -39.455631256103516, "global_step": 169717, "epoch": 1402} {"train_loss": -39.499385833740234, "global_step": 169718, "epoch": 1402} {"train_loss": -39.520530700683594, "global_step": 169719, "epoch": 1402} {"train_loss": -39.393707275390625, "global_step": 169720, "epoch": 1402} {"train_loss": -40.32438278198242, "global_step": 169721, "epoch": 1402} {"train_loss": -39.43180847167969, "global_step": 169722, "epoch": 1402} {"train_loss": -39.57941818237305, "global_step": 169723, "epoch": 1402} {"train_loss": -40.56354522705078, "global_step": 169724, "epoch": 1402} {"train_loss": -38.98297882080078, "global_step": 169725, "epoch": 1402} {"train_loss": -39.785850524902344, "global_step": 169726, "epoch": 1402} {"train_loss": -40.27500534057617, "global_step": 169727, "epoch": 1402} {"train_loss": -39.22200012207031, "global_step": 169728, "epoch": 1402} {"train_loss": -38.8842887878418, "global_step": 169729, "epoch": 1402} {"train_loss": -38.1823844909668, "global_step": 169730, "epoch": 1402} {"train_loss": -38.34333038330078, "global_step": 169731, "epoch": 1402} {"train_loss": -39.41228485107422, "global_step": 169732, "epoch": 1402} {"train_loss": -40.5858039855957, "global_step": 169733, "epoch": 1402} {"train_loss": -38.9801025390625, "global_step": 169734, "epoch": 1402} {"train_loss": -39.41459274291992, "global_step": 169735, "epoch": 1402} {"train_loss": -39.62660598754883, "global_step": 169736, "epoch": 1402} {"train_loss": -40.438568115234375, "global_step": 169737, "epoch": 1402} {"train_loss": -39.1690673828125, "global_step": 169738, "epoch": 1402} {"train_loss": -40.67013168334961, "global_step": 169739, "epoch": 1402} {"train_loss": -40.13690185546875, "global_step": 169740, "epoch": 1402} {"train_loss": -40.326107025146484, "global_step": 169741, "epoch": 1402} {"train_loss": -40.783077239990234, "global_step": 169742, "epoch": 1402} {"train_loss": -40.042720794677734, "global_step": 169743, "epoch": 1402} {"train_loss": -40.37732696533203, "global_step": 169744, "epoch": 1402} {"train_loss": -40.005218505859375, "global_step": 169745, "epoch": 1402} {"train_loss": -40.39710998535156, "global_step": 169746, "epoch": 1402} {"train_loss": -40.43380355834961, "global_step": 169747, "epoch": 1402} {"train_loss": -40.28078842163086, "global_step": 169748, "epoch": 1402} {"train_loss": -40.6755256652832, "global_step": 169749, "epoch": 1402} {"train_loss": -40.5035514831543, "global_step": 169750, "epoch": 1402} {"train_loss": -41.07343292236328, "global_step": 169751, "epoch": 1402} {"train_loss": -40.52595520019531, "global_step": 169752, "epoch": 1402} {"train_loss": -41.153438568115234, "global_step": 169753, "epoch": 1402} {"train_loss": -41.075050354003906, "global_step": 169754, "epoch": 1402} {"train_loss": -40.9583854675293, "global_step": 169755, "epoch": 1402} {"train_loss": -40.99652862548828, "global_step": 169756, "epoch": 1402} {"train_loss": -41.18513107299805, "global_step": 169757, "epoch": 1402} {"train_loss": -39.304969787597656, "global_step": 169758, "epoch": 1402} {"train_loss": -41.16146469116211, "global_step": 169759, "epoch": 1402} {"train_loss": -40.973724365234375, "global_step": 169760, "epoch": 1402} {"train_loss": -39.585811614990234, "global_step": 169761, "epoch": 1402} {"train_loss": -39.55119787168897, "global_step": 169762, "epoch": 1402, "val_loss": 2762575.25} {"train_loss": -41.33949279785156, "global_step": 169763, "epoch": 1403} {"train_loss": -40.769168853759766, "global_step": 169764, "epoch": 1403} {"train_loss": -40.23188018798828, "global_step": 169765, "epoch": 1403} {"train_loss": -41.08112335205078, "global_step": 169766, "epoch": 1403} {"train_loss": -41.4483528137207, "global_step": 169767, "epoch": 1403} {"train_loss": -41.194034576416016, "global_step": 169768, "epoch": 1403} {"train_loss": -41.19114685058594, "global_step": 169769, "epoch": 1403} {"train_loss": -41.117713928222656, "global_step": 169770, "epoch": 1403} {"train_loss": -41.50928497314453, "global_step": 169771, "epoch": 1403} {"train_loss": -41.44120407104492, "global_step": 169772, "epoch": 1403} {"train_loss": -41.26241683959961, "global_step": 169773, "epoch": 1403} {"train_loss": -41.302608489990234, "global_step": 169774, "epoch": 1403} {"train_loss": -41.47045135498047, "global_step": 169775, "epoch": 1403} {"train_loss": -41.6213264465332, "global_step": 169776, "epoch": 1403} {"train_loss": -41.03701400756836, "global_step": 169777, "epoch": 1403} {"train_loss": -40.61865997314453, "global_step": 169778, "epoch": 1403} {"train_loss": -40.60316467285156, "global_step": 169779, "epoch": 1403} {"train_loss": -41.04865646362305, "global_step": 169780, "epoch": 1403} {"train_loss": -41.50346755981445, "global_step": 169781, "epoch": 1403} {"train_loss": -41.57257080078125, "global_step": 169782, "epoch": 1403} {"train_loss": -41.477081298828125, "global_step": 169783, "epoch": 1403} {"train_loss": -41.49628829956055, "global_step": 169784, "epoch": 1403} {"train_loss": -41.804622650146484, "global_step": 169785, "epoch": 1403} {"train_loss": -41.6734619140625, "global_step": 169786, "epoch": 1403} {"train_loss": -41.04916000366211, "global_step": 169787, "epoch": 1403} {"train_loss": -40.36562728881836, "global_step": 169788, "epoch": 1403} {"train_loss": -40.05402374267578, "global_step": 169789, "epoch": 1403} {"train_loss": -41.48760986328125, "global_step": 169790, "epoch": 1403} {"train_loss": -41.60549545288086, "global_step": 169791, "epoch": 1403} {"train_loss": -40.80894088745117, "global_step": 169792, "epoch": 1403} {"train_loss": -40.499813079833984, "global_step": 169793, "epoch": 1403} {"train_loss": -40.79221725463867, "global_step": 169794, "epoch": 1403} {"train_loss": -40.993873596191406, "global_step": 169795, "epoch": 1403} {"train_loss": -41.23009490966797, "global_step": 169796, "epoch": 1403} {"train_loss": -41.433319091796875, "global_step": 169797, "epoch": 1403} {"train_loss": -40.988792419433594, "global_step": 169798, "epoch": 1403} {"train_loss": -40.00932312011719, "global_step": 169799, "epoch": 1403} {"train_loss": -40.19606399536133, "global_step": 169800, "epoch": 1403} {"train_loss": -40.67145919799805, "global_step": 169801, "epoch": 1403} {"train_loss": -41.0964469909668, "global_step": 169802, "epoch": 1403} {"train_loss": -40.8565559387207, "global_step": 169803, "epoch": 1403} {"train_loss": -41.28805160522461, "global_step": 169804, "epoch": 1403} {"train_loss": -40.93813705444336, "global_step": 169805, "epoch": 1403} {"train_loss": -41.089508056640625, "global_step": 169806, "epoch": 1403} {"train_loss": -41.142391204833984, "global_step": 169807, "epoch": 1403} {"train_loss": -40.71889877319336, "global_step": 169808, "epoch": 1403} {"train_loss": -40.55723190307617, "global_step": 169809, "epoch": 1403} {"train_loss": -40.879058837890625, "global_step": 169810, "epoch": 1403} {"train_loss": -41.170677185058594, "global_step": 169811, "epoch": 1403} {"train_loss": -40.023101806640625, "global_step": 169812, "epoch": 1403} {"train_loss": -36.61788558959961, "global_step": 169813, "epoch": 1403} {"train_loss": -38.01764678955078, "global_step": 169814, "epoch": 1403} {"train_loss": -40.16254806518555, "global_step": 169815, "epoch": 1403} {"train_loss": -40.1369743347168, "global_step": 169816, "epoch": 1403} {"train_loss": -38.76811599731445, "global_step": 169817, "epoch": 1403} {"train_loss": -39.96859359741211, "global_step": 169818, "epoch": 1403} {"train_loss": -40.153316497802734, "global_step": 169819, "epoch": 1403} {"train_loss": -40.996429443359375, "global_step": 169820, "epoch": 1403} {"train_loss": -39.13372802734375, "global_step": 169821, "epoch": 1403} {"train_loss": -39.15983200073242, "global_step": 169822, "epoch": 1403} {"train_loss": -39.777137756347656, "global_step": 169823, "epoch": 1403} {"train_loss": -40.311702728271484, "global_step": 169824, "epoch": 1403} {"train_loss": -39.77252960205078, "global_step": 169825, "epoch": 1403} {"train_loss": -39.740234375, "global_step": 169826, "epoch": 1403} {"train_loss": -39.19158935546875, "global_step": 169827, "epoch": 1403} {"train_loss": -40.604957580566406, "global_step": 169828, "epoch": 1403} {"train_loss": -39.5518913269043, "global_step": 169829, "epoch": 1403} {"train_loss": -38.8525505065918, "global_step": 169830, "epoch": 1403} {"train_loss": -38.950679779052734, "global_step": 169831, "epoch": 1403} {"train_loss": -40.643070220947266, "global_step": 169832, "epoch": 1403} {"train_loss": -34.94846725463867, "global_step": 169833, "epoch": 1403} {"train_loss": -37.498722076416016, "global_step": 169834, "epoch": 1403} {"train_loss": -40.05305099487305, "global_step": 169835, "epoch": 1403} {"train_loss": -37.98200988769531, "global_step": 169836, "epoch": 1403} {"train_loss": -36.34647750854492, "global_step": 169837, "epoch": 1403} {"train_loss": -39.04736328125, "global_step": 169838, "epoch": 1403} {"train_loss": -38.8597526550293, "global_step": 169839, "epoch": 1403} {"train_loss": -38.183589935302734, "global_step": 169840, "epoch": 1403} {"train_loss": -37.6281852722168, "global_step": 169841, "epoch": 1403} {"train_loss": -37.08845901489258, "global_step": 169842, "epoch": 1403} {"train_loss": -37.37205505371094, "global_step": 169843, "epoch": 1403} {"train_loss": -39.61460494995117, "global_step": 169844, "epoch": 1403} {"train_loss": -35.46828842163086, "global_step": 169845, "epoch": 1403} {"train_loss": -39.6921272277832, "global_step": 169846, "epoch": 1403} {"train_loss": -38.3181266784668, "global_step": 169847, "epoch": 1403} {"train_loss": -37.942569732666016, "global_step": 169848, "epoch": 1403} {"train_loss": -38.27114486694336, "global_step": 169849, "epoch": 1403} {"train_loss": -37.88774108886719, "global_step": 169850, "epoch": 1403} {"train_loss": -39.60791778564453, "global_step": 169851, "epoch": 1403} {"train_loss": -37.63901901245117, "global_step": 169852, "epoch": 1403} {"train_loss": -40.3870849609375, "global_step": 169853, "epoch": 1403} {"train_loss": -38.62217712402344, "global_step": 169854, "epoch": 1403} {"train_loss": -39.87028884887695, "global_step": 169855, "epoch": 1403} {"train_loss": -36.45307540893555, "global_step": 169856, "epoch": 1403} {"train_loss": -39.879364013671875, "global_step": 169857, "epoch": 1403} {"train_loss": -37.162513732910156, "global_step": 169858, "epoch": 1403} {"train_loss": -40.392696380615234, "global_step": 169859, "epoch": 1403} {"train_loss": -38.09444808959961, "global_step": 169860, "epoch": 1403} {"train_loss": -38.48225021362305, "global_step": 169861, "epoch": 1403} {"train_loss": -38.2390251159668, "global_step": 169862, "epoch": 1403} {"train_loss": -39.64435958862305, "global_step": 169863, "epoch": 1403} {"train_loss": -38.931278228759766, "global_step": 169864, "epoch": 1403} {"train_loss": -40.15118408203125, "global_step": 169865, "epoch": 1403} {"train_loss": -39.658599853515625, "global_step": 169866, "epoch": 1403} {"train_loss": -34.145362854003906, "global_step": 169867, "epoch": 1403} {"train_loss": -39.26688766479492, "global_step": 169868, "epoch": 1403} {"train_loss": -36.918697357177734, "global_step": 169869, "epoch": 1403} {"train_loss": -33.811920166015625, "global_step": 169870, "epoch": 1403} {"train_loss": -21.458425521850586, "global_step": 169871, "epoch": 1403} {"train_loss": -39.44088363647461, "global_step": 169872, "epoch": 1403} {"train_loss": -34.90408706665039, "global_step": 169873, "epoch": 1403} {"train_loss": -32.231727600097656, "global_step": 169874, "epoch": 1403} {"train_loss": -21.96820640563965, "global_step": 169875, "epoch": 1403} {"train_loss": -34.968143463134766, "global_step": 169876, "epoch": 1403} {"train_loss": -36.31058883666992, "global_step": 169877, "epoch": 1403} {"train_loss": -37.03620147705078, "global_step": 169878, "epoch": 1403} {"train_loss": -26.88812828063965, "global_step": 169879, "epoch": 1403} {"train_loss": -28.938827514648438, "global_step": 169880, "epoch": 1403} {"train_loss": -30.105512619018555, "global_step": 169881, "epoch": 1403} {"train_loss": -35.05742645263672, "global_step": 169882, "epoch": 1403} {"train_loss": -38.9073994849339, "global_step": 169883, "epoch": 1403, "val_loss": 2707530.75} {"train_loss": -32.638912200927734, "global_step": 169884, "epoch": 1404} {"train_loss": -34.3030891418457, "global_step": 169885, "epoch": 1404} {"train_loss": -32.253387451171875, "global_step": 169886, "epoch": 1404} {"train_loss": -35.37983322143555, "global_step": 169887, "epoch": 1404} {"train_loss": -36.38425064086914, "global_step": 169888, "epoch": 1404} {"train_loss": -32.135650634765625, "global_step": 169889, "epoch": 1404} {"train_loss": -35.07685089111328, "global_step": 169890, "epoch": 1404} {"train_loss": -36.0547981262207, "global_step": 169891, "epoch": 1404} {"train_loss": -36.04771041870117, "global_step": 169892, "epoch": 1404} {"train_loss": -36.923194885253906, "global_step": 169893, "epoch": 1404} {"train_loss": -36.88070297241211, "global_step": 169894, "epoch": 1404} {"train_loss": -36.79658126831055, "global_step": 169895, "epoch": 1404} {"train_loss": -37.2369384765625, "global_step": 169896, "epoch": 1404} {"train_loss": -37.59182357788086, "global_step": 169897, "epoch": 1404} {"train_loss": -38.264251708984375, "global_step": 169898, "epoch": 1404} {"train_loss": -37.04988479614258, "global_step": 169899, "epoch": 1404} {"train_loss": -36.47578811645508, "global_step": 169900, "epoch": 1404} {"train_loss": -37.08171463012695, "global_step": 169901, "epoch": 1404} {"train_loss": -38.013057708740234, "global_step": 169902, "epoch": 1404} {"train_loss": -37.699012756347656, "global_step": 169903, "epoch": 1404} {"train_loss": -37.871334075927734, "global_step": 169904, "epoch": 1404} {"train_loss": -37.9834098815918, "global_step": 169905, "epoch": 1404} {"train_loss": -38.370452880859375, "global_step": 169906, "epoch": 1404} {"train_loss": -37.48512268066406, "global_step": 169907, "epoch": 1404} {"train_loss": -36.10139083862305, "global_step": 169908, "epoch": 1404} {"train_loss": -37.80276107788086, "global_step": 169909, "epoch": 1404} {"train_loss": -38.18931198120117, "global_step": 169910, "epoch": 1404} {"train_loss": -37.97296905517578, "global_step": 169911, "epoch": 1404} {"train_loss": -38.25712966918945, "global_step": 169912, "epoch": 1404} {"train_loss": -38.49756622314453, "global_step": 169913, "epoch": 1404} {"train_loss": -38.350433349609375, "global_step": 169914, "epoch": 1404} {"train_loss": -38.0613899230957, "global_step": 169915, "epoch": 1404} {"train_loss": -38.31342697143555, "global_step": 169916, "epoch": 1404} {"train_loss": -38.176456451416016, "global_step": 169917, "epoch": 1404} {"train_loss": -38.8340950012207, "global_step": 169918, "epoch": 1404} {"train_loss": -38.26333236694336, "global_step": 169919, "epoch": 1404} {"train_loss": -38.727882385253906, "global_step": 169920, "epoch": 1404} {"train_loss": -38.66043472290039, "global_step": 169921, "epoch": 1404} {"train_loss": -38.9245491027832, "global_step": 169922, "epoch": 1404} {"train_loss": -38.59175491333008, "global_step": 169923, "epoch": 1404} {"train_loss": -39.55917739868164, "global_step": 169924, "epoch": 1404} {"train_loss": -39.5043830871582, "global_step": 169925, "epoch": 1404} {"train_loss": -38.64337158203125, "global_step": 169926, "epoch": 1404} {"train_loss": -38.912872314453125, "global_step": 169927, "epoch": 1404} {"train_loss": -38.90395736694336, "global_step": 169928, "epoch": 1404} {"train_loss": -38.622535705566406, "global_step": 169929, "epoch": 1404} {"train_loss": -37.50129318237305, "global_step": 169930, "epoch": 1404} {"train_loss": -38.801673889160156, "global_step": 169931, "epoch": 1404} {"train_loss": -39.91166305541992, "global_step": 169932, "epoch": 1404} {"train_loss": -39.82442092895508, "global_step": 169933, "epoch": 1404} {"train_loss": -39.08417510986328, "global_step": 169934, "epoch": 1404} {"train_loss": -39.68207931518555, "global_step": 169935, "epoch": 1404} {"train_loss": -39.13185119628906, "global_step": 169936, "epoch": 1404} {"train_loss": -39.19093322753906, "global_step": 169937, "epoch": 1404} {"train_loss": -39.43852996826172, "global_step": 169938, "epoch": 1404} {"train_loss": -39.8525276184082, "global_step": 169939, "epoch": 1404} {"train_loss": -39.72488021850586, "global_step": 169940, "epoch": 1404} {"train_loss": -39.26874923706055, "global_step": 169941, "epoch": 1404} {"train_loss": -39.67641830444336, "global_step": 169942, "epoch": 1404} {"train_loss": -39.855342864990234, "global_step": 169943, "epoch": 1404} {"train_loss": -39.31916427612305, "global_step": 169944, "epoch": 1404} {"train_loss": -39.81522750854492, "global_step": 169945, "epoch": 1404} {"train_loss": -40.15620803833008, "global_step": 169946, "epoch": 1404} {"train_loss": -40.46230697631836, "global_step": 169947, "epoch": 1404} {"train_loss": -39.83921813964844, "global_step": 169948, "epoch": 1404} {"train_loss": -39.71217346191406, "global_step": 169949, "epoch": 1404} {"train_loss": -40.469058990478516, "global_step": 169950, "epoch": 1404} {"train_loss": -39.13081741333008, "global_step": 169951, "epoch": 1404} {"train_loss": -40.16874313354492, "global_step": 169952, "epoch": 1404} {"train_loss": -39.61806106567383, "global_step": 169953, "epoch": 1404} {"train_loss": -39.75177001953125, "global_step": 169954, "epoch": 1404} {"train_loss": -40.30071258544922, "global_step": 169955, "epoch": 1404} {"train_loss": -40.201229095458984, "global_step": 169956, "epoch": 1404} {"train_loss": -39.248802185058594, "global_step": 169957, "epoch": 1404} {"train_loss": -40.14492416381836, "global_step": 169958, "epoch": 1404} {"train_loss": -39.68502426147461, "global_step": 169959, "epoch": 1404} {"train_loss": -39.971527099609375, "global_step": 169960, "epoch": 1404} {"train_loss": -40.166568756103516, "global_step": 169961, "epoch": 1404} {"train_loss": -39.973567962646484, "global_step": 169962, "epoch": 1404} {"train_loss": -39.9524040222168, "global_step": 169963, "epoch": 1404} {"train_loss": -39.92853927612305, "global_step": 169964, "epoch": 1404} {"train_loss": -40.14966583251953, "global_step": 169965, "epoch": 1404} {"train_loss": -40.436100006103516, "global_step": 169966, "epoch": 1404} {"train_loss": -40.26948165893555, "global_step": 169967, "epoch": 1404} {"train_loss": -39.9414176940918, "global_step": 169968, "epoch": 1404} {"train_loss": -40.81428909301758, "global_step": 169969, "epoch": 1404} {"train_loss": -39.69089126586914, "global_step": 169970, "epoch": 1404} {"train_loss": -39.5406379699707, "global_step": 169971, "epoch": 1404} {"train_loss": -39.75762939453125, "global_step": 169972, "epoch": 1404} {"train_loss": -40.26813507080078, "global_step": 169973, "epoch": 1404} {"train_loss": -40.681339263916016, "global_step": 169974, "epoch": 1404} {"train_loss": -40.40690231323242, "global_step": 169975, "epoch": 1404} {"train_loss": -40.438575744628906, "global_step": 169976, "epoch": 1404} {"train_loss": -40.40155792236328, "global_step": 169977, "epoch": 1404} {"train_loss": -40.815147399902344, "global_step": 169978, "epoch": 1404} {"train_loss": -40.35592269897461, "global_step": 169979, "epoch": 1404} {"train_loss": -40.02656173706055, "global_step": 169980, "epoch": 1404} {"train_loss": -40.539344787597656, "global_step": 169981, "epoch": 1404} {"train_loss": -40.95518112182617, "global_step": 169982, "epoch": 1404} {"train_loss": -39.51538848876953, "global_step": 169983, "epoch": 1404} {"train_loss": -41.29838562011719, "global_step": 169984, "epoch": 1404} {"train_loss": -40.21452331542969, "global_step": 169985, "epoch": 1404} {"train_loss": -40.799983978271484, "global_step": 169986, "epoch": 1404} {"train_loss": -39.97711181640625, "global_step": 169987, "epoch": 1404} {"train_loss": -40.22144317626953, "global_step": 169988, "epoch": 1404} {"train_loss": -40.400997161865234, "global_step": 169989, "epoch": 1404} {"train_loss": -40.521305084228516, "global_step": 169990, "epoch": 1404} {"train_loss": -40.20565414428711, "global_step": 169991, "epoch": 1404} {"train_loss": -41.1010627746582, "global_step": 169992, "epoch": 1404} {"train_loss": -40.45827865600586, "global_step": 169993, "epoch": 1404} {"train_loss": -40.75605010986328, "global_step": 169994, "epoch": 1404} {"train_loss": -40.24616622924805, "global_step": 169995, "epoch": 1404} {"train_loss": -41.48114776611328, "global_step": 169996, "epoch": 1404} {"train_loss": -40.0919075012207, "global_step": 169997, "epoch": 1404} {"train_loss": -40.155338287353516, "global_step": 169998, "epoch": 1404} {"train_loss": -40.81217575073242, "global_step": 169999, "epoch": 1404} {"train_loss": -41.14993667602539, "global_step": 170000, "epoch": 1404} {"train_loss": -40.3773193359375, "global_step": 170001, "epoch": 1404} {"train_loss": -40.853004455566406, "global_step": 170002, "epoch": 1404} {"train_loss": -40.825355529785156, "global_step": 170003, "epoch": 1404} {"train_loss": -39.04395908954715, "global_step": 170004, "epoch": 1404, "val_loss": 2807702.75} {"train_loss": -41.11167907714844, "global_step": 170005, "epoch": 1405} {"train_loss": -41.00341796875, "global_step": 170006, "epoch": 1405} {"train_loss": -40.47671890258789, "global_step": 170007, "epoch": 1405} {"train_loss": -40.268157958984375, "global_step": 170008, "epoch": 1405} {"train_loss": -40.1578483581543, "global_step": 170009, "epoch": 1405} {"train_loss": -39.4100227355957, "global_step": 170010, "epoch": 1405} {"train_loss": -39.671531677246094, "global_step": 170011, "epoch": 1405} {"train_loss": -39.711124420166016, "global_step": 170012, "epoch": 1405} {"train_loss": -39.78975296020508, "global_step": 170013, "epoch": 1405} {"train_loss": -41.121978759765625, "global_step": 170014, "epoch": 1405} {"train_loss": -41.2069206237793, "global_step": 170015, "epoch": 1405} {"train_loss": -40.29767990112305, "global_step": 170016, "epoch": 1405} {"train_loss": -39.633541107177734, "global_step": 170017, "epoch": 1405} {"train_loss": -38.8181037902832, "global_step": 170018, "epoch": 1405} {"train_loss": -37.94252014160156, "global_step": 170019, "epoch": 1405} {"train_loss": -36.776363372802734, "global_step": 170020, "epoch": 1405} {"train_loss": -34.75364685058594, "global_step": 170021, "epoch": 1405} {"train_loss": -36.627227783203125, "global_step": 170022, "epoch": 1405} {"train_loss": -39.80330276489258, "global_step": 170023, "epoch": 1405} {"train_loss": -39.859954833984375, "global_step": 170024, "epoch": 1405} {"train_loss": -34.913692474365234, "global_step": 170025, "epoch": 1405} {"train_loss": -33.48786544799805, "global_step": 170026, "epoch": 1405} {"train_loss": -40.37913131713867, "global_step": 170027, "epoch": 1405} {"train_loss": -38.65850830078125, "global_step": 170028, "epoch": 1405} {"train_loss": -37.1748161315918, "global_step": 170029, "epoch": 1405} {"train_loss": -40.336299896240234, "global_step": 170030, "epoch": 1405} {"train_loss": -37.6125373840332, "global_step": 170031, "epoch": 1405} {"train_loss": -39.952476501464844, "global_step": 170032, "epoch": 1405} {"train_loss": -38.44188690185547, "global_step": 170033, "epoch": 1405} {"train_loss": -38.2700309753418, "global_step": 170034, "epoch": 1405} {"train_loss": -40.3038330078125, "global_step": 170035, "epoch": 1405} {"train_loss": -37.90925216674805, "global_step": 170036, "epoch": 1405} {"train_loss": -40.495155334472656, "global_step": 170037, "epoch": 1405} {"train_loss": -38.956329345703125, "global_step": 170038, "epoch": 1405} {"train_loss": -38.383522033691406, "global_step": 170039, "epoch": 1405} {"train_loss": -39.08384323120117, "global_step": 170040, "epoch": 1405} {"train_loss": -39.26873779296875, "global_step": 170041, "epoch": 1405} {"train_loss": -39.693275451660156, "global_step": 170042, "epoch": 1405} {"train_loss": -40.20728302001953, "global_step": 170043, "epoch": 1405} {"train_loss": -37.1474494934082, "global_step": 170044, "epoch": 1405} {"train_loss": -39.22201156616211, "global_step": 170045, "epoch": 1405} {"train_loss": -38.13636016845703, "global_step": 170046, "epoch": 1405} {"train_loss": -39.78913497924805, "global_step": 170047, "epoch": 1405} {"train_loss": -39.10024642944336, "global_step": 170048, "epoch": 1405} {"train_loss": -39.98649978637695, "global_step": 170049, "epoch": 1405} {"train_loss": -39.271263122558594, "global_step": 170050, "epoch": 1405} {"train_loss": -39.6152458190918, "global_step": 170051, "epoch": 1405} {"train_loss": -37.74032211303711, "global_step": 170052, "epoch": 1405} {"train_loss": -39.53276824951172, "global_step": 170053, "epoch": 1405} {"train_loss": -37.73537063598633, "global_step": 170054, "epoch": 1405} {"train_loss": -39.287715911865234, "global_step": 170055, "epoch": 1405} {"train_loss": -38.50934982299805, "global_step": 170056, "epoch": 1405} {"train_loss": -38.590511322021484, "global_step": 170057, "epoch": 1405} {"train_loss": -39.11387252807617, "global_step": 170058, "epoch": 1405} {"train_loss": -38.71491622924805, "global_step": 170059, "epoch": 1405} {"train_loss": -39.49835968017578, "global_step": 170060, "epoch": 1405} {"train_loss": -39.158016204833984, "global_step": 170061, "epoch": 1405} {"train_loss": -38.780677795410156, "global_step": 170062, "epoch": 1405} {"train_loss": -40.89599609375, "global_step": 170063, "epoch": 1405} {"train_loss": -39.48714065551758, "global_step": 170064, "epoch": 1405} {"train_loss": -38.802284240722656, "global_step": 170065, "epoch": 1405} {"train_loss": -39.67203903198242, "global_step": 170066, "epoch": 1405} {"train_loss": -40.40815353393555, "global_step": 170067, "epoch": 1405} {"train_loss": -38.714988708496094, "global_step": 170068, "epoch": 1405} {"train_loss": -40.80769729614258, "global_step": 170069, "epoch": 1405} {"train_loss": -39.62272262573242, "global_step": 170070, "epoch": 1405} {"train_loss": -39.87748336791992, "global_step": 170071, "epoch": 1405} {"train_loss": -39.737060546875, "global_step": 170072, "epoch": 1405} {"train_loss": -40.74909210205078, "global_step": 170073, "epoch": 1405} {"train_loss": -39.36615753173828, "global_step": 170074, "epoch": 1405} {"train_loss": -40.11056137084961, "global_step": 170075, "epoch": 1405} {"train_loss": -40.675907135009766, "global_step": 170076, "epoch": 1405} {"train_loss": -40.318992614746094, "global_step": 170077, "epoch": 1405} {"train_loss": -39.96368408203125, "global_step": 170078, "epoch": 1405} {"train_loss": -39.664161682128906, "global_step": 170079, "epoch": 1405} {"train_loss": -39.822505950927734, "global_step": 170080, "epoch": 1405} {"train_loss": -40.1348762512207, "global_step": 170081, "epoch": 1405} {"train_loss": -38.898860931396484, "global_step": 170082, "epoch": 1405} {"train_loss": -40.84110641479492, "global_step": 170083, "epoch": 1405} {"train_loss": -39.95062255859375, "global_step": 170084, "epoch": 1405} {"train_loss": -39.193519592285156, "global_step": 170085, "epoch": 1405} {"train_loss": -40.222900390625, "global_step": 170086, "epoch": 1405} {"train_loss": -40.51102066040039, "global_step": 170087, "epoch": 1405} {"train_loss": -41.02656936645508, "global_step": 170088, "epoch": 1405} {"train_loss": -40.36223602294922, "global_step": 170089, "epoch": 1405} {"train_loss": -40.788856506347656, "global_step": 170090, "epoch": 1405} {"train_loss": -40.45559310913086, "global_step": 170091, "epoch": 1405} {"train_loss": -40.652103424072266, "global_step": 170092, "epoch": 1405} {"train_loss": -40.885860443115234, "global_step": 170093, "epoch": 1405} {"train_loss": -40.51152420043945, "global_step": 170094, "epoch": 1405} {"train_loss": -40.29779052734375, "global_step": 170095, "epoch": 1405} {"train_loss": -40.807247161865234, "global_step": 170096, "epoch": 1405} {"train_loss": -40.24490737915039, "global_step": 170097, "epoch": 1405} {"train_loss": -41.233642578125, "global_step": 170098, "epoch": 1405} {"train_loss": -40.8308219909668, "global_step": 170099, "epoch": 1405} {"train_loss": -41.13022994995117, "global_step": 170100, "epoch": 1405} {"train_loss": -40.732906341552734, "global_step": 170101, "epoch": 1405} {"train_loss": -41.028743743896484, "global_step": 170102, "epoch": 1405} {"train_loss": -40.162452697753906, "global_step": 170103, "epoch": 1405} {"train_loss": -40.95655059814453, "global_step": 170104, "epoch": 1405} {"train_loss": -41.28585433959961, "global_step": 170105, "epoch": 1405} {"train_loss": -41.57789611816406, "global_step": 170106, "epoch": 1405} {"train_loss": -40.11019515991211, "global_step": 170107, "epoch": 1405} {"train_loss": -41.56386947631836, "global_step": 170108, "epoch": 1405} {"train_loss": -41.56666946411133, "global_step": 170109, "epoch": 1405} {"train_loss": -41.438995361328125, "global_step": 170110, "epoch": 1405} {"train_loss": -41.18391799926758, "global_step": 170111, "epoch": 1405} {"train_loss": -40.15034103393555, "global_step": 170112, "epoch": 1405} {"train_loss": -40.346290588378906, "global_step": 170113, "epoch": 1405} {"train_loss": -41.24430847167969, "global_step": 170114, "epoch": 1405} {"train_loss": -41.395851135253906, "global_step": 170115, "epoch": 1405} {"train_loss": -41.315284729003906, "global_step": 170116, "epoch": 1405} {"train_loss": -41.65676498413086, "global_step": 170117, "epoch": 1405} {"train_loss": -41.230804443359375, "global_step": 170118, "epoch": 1405} {"train_loss": -40.64838790893555, "global_step": 170119, "epoch": 1405} {"train_loss": -41.310890197753906, "global_step": 170120, "epoch": 1405} {"train_loss": -40.65768051147461, "global_step": 170121, "epoch": 1405} {"train_loss": -40.80302047729492, "global_step": 170122, "epoch": 1405} {"train_loss": -39.56978988647461, "global_step": 170123, "epoch": 1405} {"train_loss": -40.924659729003906, "global_step": 170124, "epoch": 1405} {"train_loss": -39.769887404008344, "global_step": 170125, "epoch": 1405, "val_loss": 2753871.75} {"train_loss": -41.5301628112793, "global_step": 170126, "epoch": 1406} {"train_loss": -40.8664436340332, "global_step": 170127, "epoch": 1406} {"train_loss": -41.464412689208984, "global_step": 170128, "epoch": 1406} {"train_loss": -41.04392623901367, "global_step": 170129, "epoch": 1406} {"train_loss": -41.39124298095703, "global_step": 170130, "epoch": 1406} {"train_loss": -41.1751823425293, "global_step": 170131, "epoch": 1406} {"train_loss": -42.021827697753906, "global_step": 170132, "epoch": 1406} {"train_loss": -41.52726364135742, "global_step": 170133, "epoch": 1406} {"train_loss": -40.40422058105469, "global_step": 170134, "epoch": 1406} {"train_loss": -40.441017150878906, "global_step": 170135, "epoch": 1406} {"train_loss": -39.9159049987793, "global_step": 170136, "epoch": 1406} {"train_loss": -38.27663040161133, "global_step": 170137, "epoch": 1406} {"train_loss": -33.318267822265625, "global_step": 170138, "epoch": 1406} {"train_loss": -18.426687240600586, "global_step": 170139, "epoch": 1406} {"train_loss": -17.965497970581055, "global_step": 170140, "epoch": 1406} {"train_loss": -32.861812591552734, "global_step": 170141, "epoch": 1406} {"train_loss": -33.30816650390625, "global_step": 170142, "epoch": 1406} {"train_loss": -26.192214965820312, "global_step": 170143, "epoch": 1406} {"train_loss": -34.457244873046875, "global_step": 170144, "epoch": 1406} {"train_loss": -30.376941680908203, "global_step": 170145, "epoch": 1406} {"train_loss": -27.878925323486328, "global_step": 170146, "epoch": 1406} {"train_loss": -38.87528991699219, "global_step": 170147, "epoch": 1406} {"train_loss": -32.278770446777344, "global_step": 170148, "epoch": 1406} {"train_loss": -37.94229507446289, "global_step": 170149, "epoch": 1406} {"train_loss": -33.9150505065918, "global_step": 170150, "epoch": 1406} {"train_loss": -37.08083724975586, "global_step": 170151, "epoch": 1406} {"train_loss": -37.12112045288086, "global_step": 170152, "epoch": 1406} {"train_loss": -35.22597885131836, "global_step": 170153, "epoch": 1406} {"train_loss": -39.06262969970703, "global_step": 170154, "epoch": 1406} {"train_loss": -36.032875061035156, "global_step": 170155, "epoch": 1406} {"train_loss": -39.103878021240234, "global_step": 170156, "epoch": 1406} {"train_loss": -37.622798919677734, "global_step": 170157, "epoch": 1406} {"train_loss": -39.08918380737305, "global_step": 170158, "epoch": 1406} {"train_loss": -37.52710723876953, "global_step": 170159, "epoch": 1406} {"train_loss": -38.724769592285156, "global_step": 170160, "epoch": 1406} {"train_loss": -38.13640213012695, "global_step": 170161, "epoch": 1406} {"train_loss": -38.3077507019043, "global_step": 170162, "epoch": 1406} {"train_loss": -39.16133499145508, "global_step": 170163, "epoch": 1406} {"train_loss": -38.87516403198242, "global_step": 170164, "epoch": 1406} {"train_loss": -39.12746047973633, "global_step": 170165, "epoch": 1406} {"train_loss": -38.812171936035156, "global_step": 170166, "epoch": 1406} {"train_loss": -40.09461212158203, "global_step": 170167, "epoch": 1406} {"train_loss": -38.97504806518555, "global_step": 170168, "epoch": 1406} {"train_loss": -39.32079315185547, "global_step": 170169, "epoch": 1406} {"train_loss": -39.17879104614258, "global_step": 170170, "epoch": 1406} {"train_loss": -39.32892608642578, "global_step": 170171, "epoch": 1406} {"train_loss": -39.9318962097168, "global_step": 170172, "epoch": 1406} {"train_loss": -39.39628219604492, "global_step": 170173, "epoch": 1406} {"train_loss": -40.267669677734375, "global_step": 170174, "epoch": 1406} {"train_loss": -39.06721496582031, "global_step": 170175, "epoch": 1406} {"train_loss": -39.6967658996582, "global_step": 170176, "epoch": 1406} {"train_loss": -39.99589157104492, "global_step": 170177, "epoch": 1406} {"train_loss": -39.162452697753906, "global_step": 170178, "epoch": 1406} {"train_loss": -40.165523529052734, "global_step": 170179, "epoch": 1406} {"train_loss": -40.171852111816406, "global_step": 170180, "epoch": 1406} {"train_loss": -39.97965621948242, "global_step": 170181, "epoch": 1406} {"train_loss": -40.093971252441406, "global_step": 170182, "epoch": 1406} {"train_loss": -40.53514099121094, "global_step": 170183, "epoch": 1406} {"train_loss": -40.027130126953125, "global_step": 170184, "epoch": 1406} {"train_loss": -40.03540802001953, "global_step": 170185, "epoch": 1406} {"train_loss": -40.518733978271484, "global_step": 170186, "epoch": 1406} {"train_loss": -40.176475524902344, "global_step": 170187, "epoch": 1406} {"train_loss": -40.8249397277832, "global_step": 170188, "epoch": 1406} {"train_loss": -40.37180709838867, "global_step": 170189, "epoch": 1406} {"train_loss": -39.08576583862305, "global_step": 170190, "epoch": 1406} {"train_loss": -39.86683654785156, "global_step": 170191, "epoch": 1406} {"train_loss": -40.45913314819336, "global_step": 170192, "epoch": 1406} {"train_loss": -40.86715316772461, "global_step": 170193, "epoch": 1406} {"train_loss": -40.77402877807617, "global_step": 170194, "epoch": 1406} {"train_loss": -40.29661178588867, "global_step": 170195, "epoch": 1406} {"train_loss": -41.15769577026367, "global_step": 170196, "epoch": 1406} {"train_loss": -40.80171585083008, "global_step": 170197, "epoch": 1406} {"train_loss": -40.867279052734375, "global_step": 170198, "epoch": 1406} {"train_loss": -40.83047866821289, "global_step": 170199, "epoch": 1406} {"train_loss": -40.9665641784668, "global_step": 170200, "epoch": 1406} {"train_loss": -41.0183219909668, "global_step": 170201, "epoch": 1406} {"train_loss": -39.82659149169922, "global_step": 170202, "epoch": 1406} {"train_loss": -41.1347770690918, "global_step": 170203, "epoch": 1406} {"train_loss": -40.7419548034668, "global_step": 170204, "epoch": 1406} {"train_loss": -41.07187271118164, "global_step": 170205, "epoch": 1406} {"train_loss": -40.507110595703125, "global_step": 170206, "epoch": 1406} {"train_loss": -40.10221481323242, "global_step": 170207, "epoch": 1406} {"train_loss": -37.477996826171875, "global_step": 170208, "epoch": 1406} {"train_loss": -40.76190185546875, "global_step": 170209, "epoch": 1406} {"train_loss": -41.62565231323242, "global_step": 170210, "epoch": 1406} {"train_loss": -41.1793327331543, "global_step": 170211, "epoch": 1406} {"train_loss": -40.0442008972168, "global_step": 170212, "epoch": 1406} {"train_loss": -40.92033004760742, "global_step": 170213, "epoch": 1406} {"train_loss": -41.40557861328125, "global_step": 170214, "epoch": 1406} {"train_loss": -40.99007797241211, "global_step": 170215, "epoch": 1406} {"train_loss": -40.76877212524414, "global_step": 170216, "epoch": 1406} {"train_loss": -39.69696044921875, "global_step": 170217, "epoch": 1406} {"train_loss": -41.031005859375, "global_step": 170218, "epoch": 1406} {"train_loss": -40.343441009521484, "global_step": 170219, "epoch": 1406} {"train_loss": -40.198486328125, "global_step": 170220, "epoch": 1406} {"train_loss": -39.376441955566406, "global_step": 170221, "epoch": 1406} {"train_loss": -40.67582321166992, "global_step": 170222, "epoch": 1406} {"train_loss": -41.01414489746094, "global_step": 170223, "epoch": 1406} {"train_loss": -40.29196548461914, "global_step": 170224, "epoch": 1406} {"train_loss": -38.500038146972656, "global_step": 170225, "epoch": 1406} {"train_loss": -40.91855239868164, "global_step": 170226, "epoch": 1406} {"train_loss": -39.9713020324707, "global_step": 170227, "epoch": 1406} {"train_loss": -39.59334182739258, "global_step": 170228, "epoch": 1406} {"train_loss": -40.43019485473633, "global_step": 170229, "epoch": 1406} {"train_loss": -41.07094955444336, "global_step": 170230, "epoch": 1406} {"train_loss": -36.907470703125, "global_step": 170231, "epoch": 1406} {"train_loss": -40.748104095458984, "global_step": 170232, "epoch": 1406} {"train_loss": -39.190670013427734, "global_step": 170233, "epoch": 1406} {"train_loss": -35.8018913269043, "global_step": 170234, "epoch": 1406} {"train_loss": -39.0214958190918, "global_step": 170235, "epoch": 1406} {"train_loss": -40.2031364440918, "global_step": 170236, "epoch": 1406} {"train_loss": -39.38591384887695, "global_step": 170237, "epoch": 1406} {"train_loss": -38.989601135253906, "global_step": 170238, "epoch": 1406} {"train_loss": -38.8668212890625, "global_step": 170239, "epoch": 1406} {"train_loss": -34.9433708190918, "global_step": 170240, "epoch": 1406} {"train_loss": -39.88679122924805, "global_step": 170241, "epoch": 1406} {"train_loss": -37.499752044677734, "global_step": 170242, "epoch": 1406} {"train_loss": -35.801387786865234, "global_step": 170243, "epoch": 1406} {"train_loss": -39.02912139892578, "global_step": 170244, "epoch": 1406} {"train_loss": -39.03069305419922, "global_step": 170245, "epoch": 1406} {"train_loss": -38.734768449767564, "global_step": 170246, "epoch": 1406, "val_loss": 2819106.75} {"train_loss": -38.10437774658203, "global_step": 170247, "epoch": 1407} {"train_loss": -36.798274993896484, "global_step": 170248, "epoch": 1407} {"train_loss": -35.287689208984375, "global_step": 170249, "epoch": 1407} {"train_loss": -37.263511657714844, "global_step": 170250, "epoch": 1407} {"train_loss": -35.6446418762207, "global_step": 170251, "epoch": 1407} {"train_loss": -37.18842315673828, "global_step": 170252, "epoch": 1407} {"train_loss": -37.18852615356445, "global_step": 170253, "epoch": 1407} {"train_loss": -38.39512252807617, "global_step": 170254, "epoch": 1407} {"train_loss": -38.09273147583008, "global_step": 170255, "epoch": 1407} {"train_loss": -37.103389739990234, "global_step": 170256, "epoch": 1407} {"train_loss": -37.7620964050293, "global_step": 170257, "epoch": 1407} {"train_loss": -38.53229904174805, "global_step": 170258, "epoch": 1407} {"train_loss": -37.87725830078125, "global_step": 170259, "epoch": 1407} {"train_loss": -37.42498779296875, "global_step": 170260, "epoch": 1407} {"train_loss": -34.690582275390625, "global_step": 170261, "epoch": 1407} {"train_loss": -38.71596908569336, "global_step": 170262, "epoch": 1407} {"train_loss": -37.95550537109375, "global_step": 170263, "epoch": 1407} {"train_loss": -38.39715576171875, "global_step": 170264, "epoch": 1407} {"train_loss": -38.258644104003906, "global_step": 170265, "epoch": 1407} {"train_loss": -36.217315673828125, "global_step": 170266, "epoch": 1407} {"train_loss": -38.589080810546875, "global_step": 170267, "epoch": 1407} {"train_loss": -33.18553924560547, "global_step": 170268, "epoch": 1407} {"train_loss": -36.63609313964844, "global_step": 170269, "epoch": 1407} {"train_loss": -37.30925369262695, "global_step": 170270, "epoch": 1407} {"train_loss": -35.85732650756836, "global_step": 170271, "epoch": 1407} {"train_loss": -39.30045700073242, "global_step": 170272, "epoch": 1407} {"train_loss": -39.1585807800293, "global_step": 170273, "epoch": 1407} {"train_loss": -38.68317794799805, "global_step": 170274, "epoch": 1407} {"train_loss": -38.02334213256836, "global_step": 170275, "epoch": 1407} {"train_loss": -36.83857727050781, "global_step": 170276, "epoch": 1407} {"train_loss": -38.905982971191406, "global_step": 170277, "epoch": 1407} {"train_loss": -37.85663604736328, "global_step": 170278, "epoch": 1407} {"train_loss": -37.61476516723633, "global_step": 170279, "epoch": 1407} {"train_loss": -36.791595458984375, "global_step": 170280, "epoch": 1407} {"train_loss": -35.38840103149414, "global_step": 170281, "epoch": 1407} {"train_loss": -39.4982795715332, "global_step": 170282, "epoch": 1407} {"train_loss": -38.17152404785156, "global_step": 170283, "epoch": 1407} {"train_loss": -38.29752731323242, "global_step": 170284, "epoch": 1407} {"train_loss": -38.37075424194336, "global_step": 170285, "epoch": 1407} {"train_loss": -38.019744873046875, "global_step": 170286, "epoch": 1407} {"train_loss": -37.87424850463867, "global_step": 170287, "epoch": 1407} {"train_loss": -38.317726135253906, "global_step": 170288, "epoch": 1407} {"train_loss": -38.57984924316406, "global_step": 170289, "epoch": 1407} {"train_loss": -39.337982177734375, "global_step": 170290, "epoch": 1407} {"train_loss": -39.615516662597656, "global_step": 170291, "epoch": 1407} {"train_loss": -38.22815704345703, "global_step": 170292, "epoch": 1407} {"train_loss": -38.73311233520508, "global_step": 170293, "epoch": 1407} {"train_loss": -39.090972900390625, "global_step": 170294, "epoch": 1407} {"train_loss": -38.79191970825195, "global_step": 170295, "epoch": 1407} {"train_loss": -38.9722785949707, "global_step": 170296, "epoch": 1407} {"train_loss": -37.9947509765625, "global_step": 170297, "epoch": 1407} {"train_loss": -38.70899200439453, "global_step": 170298, "epoch": 1407} {"train_loss": -39.953426361083984, "global_step": 170299, "epoch": 1407} {"train_loss": -39.48893356323242, "global_step": 170300, "epoch": 1407} {"train_loss": -39.99702835083008, "global_step": 170301, "epoch": 1407} {"train_loss": -39.39910888671875, "global_step": 170302, "epoch": 1407} {"train_loss": -38.84489059448242, "global_step": 170303, "epoch": 1407} {"train_loss": -40.42277526855469, "global_step": 170304, "epoch": 1407} {"train_loss": -39.67108917236328, "global_step": 170305, "epoch": 1407} {"train_loss": -39.86848068237305, "global_step": 170306, "epoch": 1407} {"train_loss": -40.32674789428711, "global_step": 170307, "epoch": 1407} {"train_loss": -39.4110221862793, "global_step": 170308, "epoch": 1407} {"train_loss": -40.83699417114258, "global_step": 170309, "epoch": 1407} {"train_loss": -39.84760284423828, "global_step": 170310, "epoch": 1407} {"train_loss": -40.39820098876953, "global_step": 170311, "epoch": 1407} {"train_loss": -40.0897331237793, "global_step": 170312, "epoch": 1407} {"train_loss": -40.30251693725586, "global_step": 170313, "epoch": 1407} {"train_loss": -40.214717864990234, "global_step": 170314, "epoch": 1407} {"train_loss": -40.1856575012207, "global_step": 170315, "epoch": 1407} {"train_loss": -40.85870361328125, "global_step": 170316, "epoch": 1407} {"train_loss": -40.25408935546875, "global_step": 170317, "epoch": 1407} {"train_loss": -40.50749206542969, "global_step": 170318, "epoch": 1407} {"train_loss": -40.093833923339844, "global_step": 170319, "epoch": 1407} {"train_loss": -40.81201171875, "global_step": 170320, "epoch": 1407} {"train_loss": -40.74961471557617, "global_step": 170321, "epoch": 1407} {"train_loss": -40.99094772338867, "global_step": 170322, "epoch": 1407} {"train_loss": -40.95488739013672, "global_step": 170323, "epoch": 1407} {"train_loss": -40.35576629638672, "global_step": 170324, "epoch": 1407} {"train_loss": -40.3575553894043, "global_step": 170325, "epoch": 1407} {"train_loss": -41.120086669921875, "global_step": 170326, "epoch": 1407} {"train_loss": -40.29594039916992, "global_step": 170327, "epoch": 1407} {"train_loss": -40.04419708251953, "global_step": 170328, "epoch": 1407} {"train_loss": -40.48578643798828, "global_step": 170329, "epoch": 1407} {"train_loss": -41.182533264160156, "global_step": 170330, "epoch": 1407} {"train_loss": -40.469154357910156, "global_step": 170331, "epoch": 1407} {"train_loss": -40.077911376953125, "global_step": 170332, "epoch": 1407} {"train_loss": -40.00625228881836, "global_step": 170333, "epoch": 1407} {"train_loss": -40.1492919921875, "global_step": 170334, "epoch": 1407} {"train_loss": -39.77296447753906, "global_step": 170335, "epoch": 1407} {"train_loss": -40.24688720703125, "global_step": 170336, "epoch": 1407} {"train_loss": -40.721282958984375, "global_step": 170337, "epoch": 1407} {"train_loss": -40.76020050048828, "global_step": 170338, "epoch": 1407} {"train_loss": -40.33529281616211, "global_step": 170339, "epoch": 1407} {"train_loss": -41.00822067260742, "global_step": 170340, "epoch": 1407} {"train_loss": -41.17677688598633, "global_step": 170341, "epoch": 1407} {"train_loss": -40.04840087890625, "global_step": 170342, "epoch": 1407} {"train_loss": -40.750022888183594, "global_step": 170343, "epoch": 1407} {"train_loss": -39.8122444152832, "global_step": 170344, "epoch": 1407} {"train_loss": -41.35032653808594, "global_step": 170345, "epoch": 1407} {"train_loss": -41.226112365722656, "global_step": 170346, "epoch": 1407} {"train_loss": -41.32509994506836, "global_step": 170347, "epoch": 1407} {"train_loss": -40.91508102416992, "global_step": 170348, "epoch": 1407} {"train_loss": -40.32487487792969, "global_step": 170349, "epoch": 1407} {"train_loss": -38.28532028198242, "global_step": 170350, "epoch": 1407} {"train_loss": -37.26848220825195, "global_step": 170351, "epoch": 1407} {"train_loss": -36.5018424987793, "global_step": 170352, "epoch": 1407} {"train_loss": -34.10758590698242, "global_step": 170353, "epoch": 1407} {"train_loss": -37.37336349487305, "global_step": 170354, "epoch": 1407} {"train_loss": -37.779876708984375, "global_step": 170355, "epoch": 1407} {"train_loss": -39.49787902832031, "global_step": 170356, "epoch": 1407} {"train_loss": -38.58806228637695, "global_step": 170357, "epoch": 1407} {"train_loss": -40.5687370300293, "global_step": 170358, "epoch": 1407} {"train_loss": -39.800106048583984, "global_step": 170359, "epoch": 1407} {"train_loss": -40.35432815551758, "global_step": 170360, "epoch": 1407} {"train_loss": -40.54081344604492, "global_step": 170361, "epoch": 1407} {"train_loss": -40.634151458740234, "global_step": 170362, "epoch": 1407} {"train_loss": -39.56958770751953, "global_step": 170363, "epoch": 1407} {"train_loss": -40.12177276611328, "global_step": 170364, "epoch": 1407} {"train_loss": -39.996734619140625, "global_step": 170365, "epoch": 1407} {"train_loss": -40.52238845825195, "global_step": 170366, "epoch": 1407} {"train_loss": -39.04013751952116, "global_step": 170367, "epoch": 1407, "val_loss": 2791579.75} {"train_loss": -40.623870849609375, "global_step": 170368, "epoch": 1408} {"train_loss": -39.9169921875, "global_step": 170369, "epoch": 1408} {"train_loss": -39.602108001708984, "global_step": 170370, "epoch": 1408} {"train_loss": -40.05500411987305, "global_step": 170371, "epoch": 1408} {"train_loss": -39.465702056884766, "global_step": 170372, "epoch": 1408} {"train_loss": -40.137691497802734, "global_step": 170373, "epoch": 1408} {"train_loss": -39.8803825378418, "global_step": 170374, "epoch": 1408} {"train_loss": -41.0420036315918, "global_step": 170375, "epoch": 1408} {"train_loss": -39.51555252075195, "global_step": 170376, "epoch": 1408} {"train_loss": -40.44457244873047, "global_step": 170377, "epoch": 1408} {"train_loss": -40.2406120300293, "global_step": 170378, "epoch": 1408} {"train_loss": -40.13824462890625, "global_step": 170379, "epoch": 1408} {"train_loss": -40.031044006347656, "global_step": 170380, "epoch": 1408} {"train_loss": -40.56061553955078, "global_step": 170381, "epoch": 1408} {"train_loss": -41.007415771484375, "global_step": 170382, "epoch": 1408} {"train_loss": -40.62166213989258, "global_step": 170383, "epoch": 1408} {"train_loss": -40.80853271484375, "global_step": 170384, "epoch": 1408} {"train_loss": -41.14408493041992, "global_step": 170385, "epoch": 1408} {"train_loss": -39.5489501953125, "global_step": 170386, "epoch": 1408} {"train_loss": -39.57166290283203, "global_step": 170387, "epoch": 1408} {"train_loss": -39.3104248046875, "global_step": 170388, "epoch": 1408} {"train_loss": -40.379817962646484, "global_step": 170389, "epoch": 1408} {"train_loss": -41.17002487182617, "global_step": 170390, "epoch": 1408} {"train_loss": -40.386871337890625, "global_step": 170391, "epoch": 1408} {"train_loss": -40.113948822021484, "global_step": 170392, "epoch": 1408} {"train_loss": -41.31597900390625, "global_step": 170393, "epoch": 1408} {"train_loss": -40.14829635620117, "global_step": 170394, "epoch": 1408} {"train_loss": -40.5737190246582, "global_step": 170395, "epoch": 1408} {"train_loss": -40.7587890625, "global_step": 170396, "epoch": 1408} {"train_loss": -41.17695236206055, "global_step": 170397, "epoch": 1408} {"train_loss": -41.09531784057617, "global_step": 170398, "epoch": 1408} {"train_loss": -40.68494415283203, "global_step": 170399, "epoch": 1408} {"train_loss": -41.313323974609375, "global_step": 170400, "epoch": 1408} {"train_loss": -40.12681579589844, "global_step": 170401, "epoch": 1408} {"train_loss": -41.253700256347656, "global_step": 170402, "epoch": 1408} {"train_loss": -40.840187072753906, "global_step": 170403, "epoch": 1408} {"train_loss": -41.37498092651367, "global_step": 170404, "epoch": 1408} {"train_loss": -40.436988830566406, "global_step": 170405, "epoch": 1408} {"train_loss": -40.890316009521484, "global_step": 170406, "epoch": 1408} {"train_loss": -40.81671905517578, "global_step": 170407, "epoch": 1408} {"train_loss": -40.84316635131836, "global_step": 170408, "epoch": 1408} {"train_loss": -40.458919525146484, "global_step": 170409, "epoch": 1408} {"train_loss": -40.584930419921875, "global_step": 170410, "epoch": 1408} {"train_loss": -40.01007843017578, "global_step": 170411, "epoch": 1408} {"train_loss": -40.23634719848633, "global_step": 170412, "epoch": 1408} {"train_loss": -40.05796432495117, "global_step": 170413, "epoch": 1408} {"train_loss": -38.71199417114258, "global_step": 170414, "epoch": 1408} {"train_loss": -40.082942962646484, "global_step": 170415, "epoch": 1408} {"train_loss": -39.57393264770508, "global_step": 170416, "epoch": 1408} {"train_loss": -40.53983688354492, "global_step": 170417, "epoch": 1408} {"train_loss": -40.20991897583008, "global_step": 170418, "epoch": 1408} {"train_loss": -38.45559310913086, "global_step": 170419, "epoch": 1408} {"train_loss": -39.94374465942383, "global_step": 170420, "epoch": 1408} {"train_loss": -40.283817291259766, "global_step": 170421, "epoch": 1408} {"train_loss": -39.21552658081055, "global_step": 170422, "epoch": 1408} {"train_loss": -40.76755142211914, "global_step": 170423, "epoch": 1408} {"train_loss": -38.37797164916992, "global_step": 170424, "epoch": 1408} {"train_loss": -39.96639633178711, "global_step": 170425, "epoch": 1408} {"train_loss": -40.8349494934082, "global_step": 170426, "epoch": 1408} {"train_loss": -39.33820724487305, "global_step": 170427, "epoch": 1408} {"train_loss": -38.73359298706055, "global_step": 170428, "epoch": 1408} {"train_loss": -39.0775146484375, "global_step": 170429, "epoch": 1408} {"train_loss": -40.699607849121094, "global_step": 170430, "epoch": 1408} {"train_loss": -39.46379470825195, "global_step": 170431, "epoch": 1408} {"train_loss": -36.08530044555664, "global_step": 170432, "epoch": 1408} {"train_loss": -40.104488372802734, "global_step": 170433, "epoch": 1408} {"train_loss": -38.555824279785156, "global_step": 170434, "epoch": 1408} {"train_loss": -38.71416091918945, "global_step": 170435, "epoch": 1408} {"train_loss": -39.913639068603516, "global_step": 170436, "epoch": 1408} {"train_loss": -39.404544830322266, "global_step": 170437, "epoch": 1408} {"train_loss": -39.756099700927734, "global_step": 170438, "epoch": 1408} {"train_loss": -39.65253448486328, "global_step": 170439, "epoch": 1408} {"train_loss": -39.94287872314453, "global_step": 170440, "epoch": 1408} {"train_loss": -40.2424430847168, "global_step": 170441, "epoch": 1408} {"train_loss": -39.25873947143555, "global_step": 170442, "epoch": 1408} {"train_loss": -40.53651809692383, "global_step": 170443, "epoch": 1408} {"train_loss": -40.72050476074219, "global_step": 170444, "epoch": 1408} {"train_loss": -39.39742660522461, "global_step": 170445, "epoch": 1408} {"train_loss": -40.530452728271484, "global_step": 170446, "epoch": 1408} {"train_loss": -39.87013244628906, "global_step": 170447, "epoch": 1408} {"train_loss": -39.93837356567383, "global_step": 170448, "epoch": 1408} {"train_loss": -40.14803695678711, "global_step": 170449, "epoch": 1408} {"train_loss": -40.685340881347656, "global_step": 170450, "epoch": 1408} {"train_loss": -38.93837356567383, "global_step": 170451, "epoch": 1408} {"train_loss": -41.02870178222656, "global_step": 170452, "epoch": 1408} {"train_loss": -39.98533248901367, "global_step": 170453, "epoch": 1408} {"train_loss": -41.22696304321289, "global_step": 170454, "epoch": 1408} {"train_loss": -40.20899963378906, "global_step": 170455, "epoch": 1408} {"train_loss": -40.82461929321289, "global_step": 170456, "epoch": 1408} {"train_loss": -40.816200256347656, "global_step": 170457, "epoch": 1408} {"train_loss": -40.18709182739258, "global_step": 170458, "epoch": 1408} {"train_loss": -40.3194465637207, "global_step": 170459, "epoch": 1408} {"train_loss": -41.202552795410156, "global_step": 170460, "epoch": 1408} {"train_loss": -39.73728561401367, "global_step": 170461, "epoch": 1408} {"train_loss": -40.228729248046875, "global_step": 170462, "epoch": 1408} {"train_loss": -40.51226806640625, "global_step": 170463, "epoch": 1408} {"train_loss": -40.08182907104492, "global_step": 170464, "epoch": 1408} {"train_loss": -41.15324401855469, "global_step": 170465, "epoch": 1408} {"train_loss": -40.5396728515625, "global_step": 170466, "epoch": 1408} {"train_loss": -40.53031921386719, "global_step": 170467, "epoch": 1408} {"train_loss": -40.73259353637695, "global_step": 170468, "epoch": 1408} {"train_loss": -40.868587493896484, "global_step": 170469, "epoch": 1408} {"train_loss": -40.942378997802734, "global_step": 170470, "epoch": 1408} {"train_loss": -41.46950912475586, "global_step": 170471, "epoch": 1408} {"train_loss": -36.14817810058594, "global_step": 170472, "epoch": 1408} {"train_loss": -41.14654541015625, "global_step": 170473, "epoch": 1408} {"train_loss": -38.951324462890625, "global_step": 170474, "epoch": 1408} {"train_loss": -41.29692459106445, "global_step": 170475, "epoch": 1408} {"train_loss": -41.571075439453125, "global_step": 170476, "epoch": 1408} {"train_loss": -40.39666748046875, "global_step": 170477, "epoch": 1408} {"train_loss": -41.32379913330078, "global_step": 170478, "epoch": 1408} {"train_loss": -41.21014404296875, "global_step": 170479, "epoch": 1408} {"train_loss": -41.03656768798828, "global_step": 170480, "epoch": 1408} {"train_loss": -40.025508880615234, "global_step": 170481, "epoch": 1408} {"train_loss": -41.47473907470703, "global_step": 170482, "epoch": 1408} {"train_loss": -40.757545471191406, "global_step": 170483, "epoch": 1408} {"train_loss": -41.514556884765625, "global_step": 170484, "epoch": 1408} {"train_loss": -39.96380615234375, "global_step": 170485, "epoch": 1408} {"train_loss": -40.70699691772461, "global_step": 170486, "epoch": 1408} {"train_loss": -41.36323165893555, "global_step": 170487, "epoch": 1408} {"train_loss": -40.24052753921383, "global_step": 170488, "epoch": 1408, "val_loss": 2792525.0} {"train_loss": -41.23592758178711, "global_step": 170489, "epoch": 1409} {"train_loss": -41.269775390625, "global_step": 170490, "epoch": 1409} {"train_loss": -40.15364456176758, "global_step": 170491, "epoch": 1409} {"train_loss": -36.9531135559082, "global_step": 170492, "epoch": 1409} {"train_loss": -40.121795654296875, "global_step": 170493, "epoch": 1409} {"train_loss": -40.0489616394043, "global_step": 170494, "epoch": 1409} {"train_loss": -40.98225021362305, "global_step": 170495, "epoch": 1409} {"train_loss": -38.94814682006836, "global_step": 170496, "epoch": 1409} {"train_loss": -41.31266784667969, "global_step": 170497, "epoch": 1409} {"train_loss": -40.01272201538086, "global_step": 170498, "epoch": 1409} {"train_loss": -39.372196197509766, "global_step": 170499, "epoch": 1409} {"train_loss": -41.49018478393555, "global_step": 170500, "epoch": 1409} {"train_loss": -37.6243782043457, "global_step": 170501, "epoch": 1409} {"train_loss": -40.20530319213867, "global_step": 170502, "epoch": 1409} {"train_loss": -37.13133239746094, "global_step": 170503, "epoch": 1409} {"train_loss": -38.11604690551758, "global_step": 170504, "epoch": 1409} {"train_loss": -40.51601028442383, "global_step": 170505, "epoch": 1409} {"train_loss": -37.184932708740234, "global_step": 170506, "epoch": 1409} {"train_loss": -37.74945068359375, "global_step": 170507, "epoch": 1409} {"train_loss": -38.242061614990234, "global_step": 170508, "epoch": 1409} {"train_loss": -39.83774185180664, "global_step": 170509, "epoch": 1409} {"train_loss": -32.25885009765625, "global_step": 170510, "epoch": 1409} {"train_loss": -39.88552474975586, "global_step": 170511, "epoch": 1409} {"train_loss": -38.96952819824219, "global_step": 170512, "epoch": 1409} {"train_loss": -38.97905349731445, "global_step": 170513, "epoch": 1409} {"train_loss": -39.8858528137207, "global_step": 170514, "epoch": 1409} {"train_loss": -37.997650146484375, "global_step": 170515, "epoch": 1409} {"train_loss": -36.705379486083984, "global_step": 170516, "epoch": 1409} {"train_loss": -35.48586654663086, "global_step": 170517, "epoch": 1409} {"train_loss": -36.94575500488281, "global_step": 170518, "epoch": 1409} {"train_loss": -35.770057678222656, "global_step": 170519, "epoch": 1409} {"train_loss": -37.342315673828125, "global_step": 170520, "epoch": 1409} {"train_loss": -37.88210678100586, "global_step": 170521, "epoch": 1409} {"train_loss": -38.2990608215332, "global_step": 170522, "epoch": 1409} {"train_loss": -39.582061767578125, "global_step": 170523, "epoch": 1409} {"train_loss": -38.12370681762695, "global_step": 170524, "epoch": 1409} {"train_loss": -39.63606643676758, "global_step": 170525, "epoch": 1409} {"train_loss": -38.84944534301758, "global_step": 170526, "epoch": 1409} {"train_loss": -39.87382888793945, "global_step": 170527, "epoch": 1409} {"train_loss": -39.26414108276367, "global_step": 170528, "epoch": 1409} {"train_loss": -40.28960037231445, "global_step": 170529, "epoch": 1409} {"train_loss": -40.267547607421875, "global_step": 170530, "epoch": 1409} {"train_loss": -40.020442962646484, "global_step": 170531, "epoch": 1409} {"train_loss": -40.209083557128906, "global_step": 170532, "epoch": 1409} {"train_loss": -39.910179138183594, "global_step": 170533, "epoch": 1409} {"train_loss": -39.93042755126953, "global_step": 170534, "epoch": 1409} {"train_loss": -40.02394104003906, "global_step": 170535, "epoch": 1409} {"train_loss": -40.59660720825195, "global_step": 170536, "epoch": 1409} {"train_loss": -40.32598114013672, "global_step": 170537, "epoch": 1409} {"train_loss": -40.608036041259766, "global_step": 170538, "epoch": 1409} {"train_loss": -40.358131408691406, "global_step": 170539, "epoch": 1409} {"train_loss": -40.70262145996094, "global_step": 170540, "epoch": 1409} {"train_loss": -40.2039909362793, "global_step": 170541, "epoch": 1409} {"train_loss": -40.371150970458984, "global_step": 170542, "epoch": 1409} {"train_loss": -40.59493637084961, "global_step": 170543, "epoch": 1409} {"train_loss": -40.968196868896484, "global_step": 170544, "epoch": 1409} {"train_loss": -39.38100814819336, "global_step": 170545, "epoch": 1409} {"train_loss": -40.577430725097656, "global_step": 170546, "epoch": 1409} {"train_loss": -40.805667877197266, "global_step": 170547, "epoch": 1409} {"train_loss": -40.29630661010742, "global_step": 170548, "epoch": 1409} {"train_loss": -40.825599670410156, "global_step": 170549, "epoch": 1409} {"train_loss": -40.917476654052734, "global_step": 170550, "epoch": 1409} {"train_loss": -41.02579879760742, "global_step": 170551, "epoch": 1409} {"train_loss": -41.32468795776367, "global_step": 170552, "epoch": 1409} {"train_loss": -39.89802932739258, "global_step": 170553, "epoch": 1409} {"train_loss": -40.78501892089844, "global_step": 170554, "epoch": 1409} {"train_loss": -41.18986129760742, "global_step": 170555, "epoch": 1409} {"train_loss": -40.964324951171875, "global_step": 170556, "epoch": 1409} {"train_loss": -41.02136993408203, "global_step": 170557, "epoch": 1409} {"train_loss": -41.02743148803711, "global_step": 170558, "epoch": 1409} {"train_loss": -38.76359176635742, "global_step": 170559, "epoch": 1409} {"train_loss": -39.61145782470703, "global_step": 170560, "epoch": 1409} {"train_loss": -41.13186264038086, "global_step": 170561, "epoch": 1409} {"train_loss": -40.0650634765625, "global_step": 170562, "epoch": 1409} {"train_loss": -41.1912841796875, "global_step": 170563, "epoch": 1409} {"train_loss": -41.18918991088867, "global_step": 170564, "epoch": 1409} {"train_loss": -40.84405517578125, "global_step": 170565, "epoch": 1409} {"train_loss": -39.97822952270508, "global_step": 170566, "epoch": 1409} {"train_loss": -40.48878479003906, "global_step": 170567, "epoch": 1409} {"train_loss": -40.65103530883789, "global_step": 170568, "epoch": 1409} {"train_loss": -41.4836311340332, "global_step": 170569, "epoch": 1409} {"train_loss": -41.6190299987793, "global_step": 170570, "epoch": 1409} {"train_loss": -38.992149353027344, "global_step": 170571, "epoch": 1409} {"train_loss": -40.8411865234375, "global_step": 170572, "epoch": 1409} {"train_loss": -39.97294235229492, "global_step": 170573, "epoch": 1409} {"train_loss": -41.26717758178711, "global_step": 170574, "epoch": 1409} {"train_loss": -40.858455657958984, "global_step": 170575, "epoch": 1409} {"train_loss": -41.27401351928711, "global_step": 170576, "epoch": 1409} {"train_loss": -40.40338897705078, "global_step": 170577, "epoch": 1409} {"train_loss": -41.31501770019531, "global_step": 170578, "epoch": 1409} {"train_loss": -39.343135833740234, "global_step": 170579, "epoch": 1409} {"train_loss": -38.5267448425293, "global_step": 170580, "epoch": 1409} {"train_loss": -40.61876678466797, "global_step": 170581, "epoch": 1409} {"train_loss": -41.0905647277832, "global_step": 170582, "epoch": 1409} {"train_loss": -38.33332061767578, "global_step": 170583, "epoch": 1409} {"train_loss": -36.0691032409668, "global_step": 170584, "epoch": 1409} {"train_loss": -39.96337890625, "global_step": 170585, "epoch": 1409} {"train_loss": -40.34951400756836, "global_step": 170586, "epoch": 1409} {"train_loss": -39.46926498413086, "global_step": 170587, "epoch": 1409} {"train_loss": -40.43159103393555, "global_step": 170588, "epoch": 1409} {"train_loss": -38.819766998291016, "global_step": 170589, "epoch": 1409} {"train_loss": -40.736602783203125, "global_step": 170590, "epoch": 1409} {"train_loss": -39.977413177490234, "global_step": 170591, "epoch": 1409} {"train_loss": -34.6793327331543, "global_step": 170592, "epoch": 1409} {"train_loss": -38.46895980834961, "global_step": 170593, "epoch": 1409} {"train_loss": -40.090248107910156, "global_step": 170594, "epoch": 1409} {"train_loss": -38.72144317626953, "global_step": 170595, "epoch": 1409} {"train_loss": -38.60567855834961, "global_step": 170596, "epoch": 1409} {"train_loss": -35.589717864990234, "global_step": 170597, "epoch": 1409} {"train_loss": -37.97517013549805, "global_step": 170598, "epoch": 1409} {"train_loss": -38.28059768676758, "global_step": 170599, "epoch": 1409} {"train_loss": -40.19965362548828, "global_step": 170600, "epoch": 1409} {"train_loss": -37.96735382080078, "global_step": 170601, "epoch": 1409} {"train_loss": -40.507083892822266, "global_step": 170602, "epoch": 1409} {"train_loss": -38.51567459106445, "global_step": 170603, "epoch": 1409} {"train_loss": -40.1112174987793, "global_step": 170604, "epoch": 1409} {"train_loss": -36.12789535522461, "global_step": 170605, "epoch": 1409} {"train_loss": -38.947418212890625, "global_step": 170606, "epoch": 1409} {"train_loss": -39.61801528930664, "global_step": 170607, "epoch": 1409} {"train_loss": -36.96430206298828, "global_step": 170608, "epoch": 1409} {"train_loss": -39.50390839379681, "global_step": 170609, "epoch": 1409, "val_loss": 2915302.0} {"train_loss": -39.76051712036133, "global_step": 170610, "epoch": 1410} {"train_loss": -36.61979293823242, "global_step": 170611, "epoch": 1410} {"train_loss": -38.51712417602539, "global_step": 170612, "epoch": 1410} {"train_loss": -39.27518844604492, "global_step": 170613, "epoch": 1410} {"train_loss": -38.824317932128906, "global_step": 170614, "epoch": 1410} {"train_loss": -35.44306945800781, "global_step": 170615, "epoch": 1410} {"train_loss": -37.80955123901367, "global_step": 170616, "epoch": 1410} {"train_loss": -39.09162139892578, "global_step": 170617, "epoch": 1410} {"train_loss": -37.86005401611328, "global_step": 170618, "epoch": 1410} {"train_loss": -35.5712776184082, "global_step": 170619, "epoch": 1410} {"train_loss": -39.3658447265625, "global_step": 170620, "epoch": 1410} {"train_loss": -38.59695053100586, "global_step": 170621, "epoch": 1410} {"train_loss": -37.842315673828125, "global_step": 170622, "epoch": 1410} {"train_loss": -38.633663177490234, "global_step": 170623, "epoch": 1410} {"train_loss": -39.68308639526367, "global_step": 170624, "epoch": 1410} {"train_loss": -39.313785552978516, "global_step": 170625, "epoch": 1410} {"train_loss": -37.921993255615234, "global_step": 170626, "epoch": 1410} {"train_loss": -39.23115921020508, "global_step": 170627, "epoch": 1410} {"train_loss": -39.09406280517578, "global_step": 170628, "epoch": 1410} {"train_loss": -40.238243103027344, "global_step": 170629, "epoch": 1410} {"train_loss": -39.95819091796875, "global_step": 170630, "epoch": 1410} {"train_loss": -39.794673919677734, "global_step": 170631, "epoch": 1410} {"train_loss": -36.19728469848633, "global_step": 170632, "epoch": 1410} {"train_loss": -39.02656173706055, "global_step": 170633, "epoch": 1410} {"train_loss": -39.85152816772461, "global_step": 170634, "epoch": 1410} {"train_loss": -39.59726333618164, "global_step": 170635, "epoch": 1410} {"train_loss": -36.97690200805664, "global_step": 170636, "epoch": 1410} {"train_loss": -39.25852966308594, "global_step": 170637, "epoch": 1410} {"train_loss": -39.37184524536133, "global_step": 170638, "epoch": 1410} {"train_loss": -40.551124572753906, "global_step": 170639, "epoch": 1410} {"train_loss": -39.875770568847656, "global_step": 170640, "epoch": 1410} {"train_loss": -40.25008010864258, "global_step": 170641, "epoch": 1410} {"train_loss": -39.3382682800293, "global_step": 170642, "epoch": 1410} {"train_loss": -37.98012924194336, "global_step": 170643, "epoch": 1410} {"train_loss": -38.886268615722656, "global_step": 170644, "epoch": 1410} {"train_loss": -40.60890579223633, "global_step": 170645, "epoch": 1410} {"train_loss": -40.429420471191406, "global_step": 170646, "epoch": 1410} {"train_loss": -39.28306198120117, "global_step": 170647, "epoch": 1410} {"train_loss": -39.961082458496094, "global_step": 170648, "epoch": 1410} {"train_loss": -40.78239059448242, "global_step": 170649, "epoch": 1410} {"train_loss": -39.9660758972168, "global_step": 170650, "epoch": 1410} {"train_loss": -39.93596267700195, "global_step": 170651, "epoch": 1410} {"train_loss": -38.7523307800293, "global_step": 170652, "epoch": 1410} {"train_loss": -39.6947021484375, "global_step": 170653, "epoch": 1410} {"train_loss": -32.912750244140625, "global_step": 170654, "epoch": 1410} {"train_loss": -37.39274978637695, "global_step": 170655, "epoch": 1410} {"train_loss": -39.634376525878906, "global_step": 170656, "epoch": 1410} {"train_loss": -40.078556060791016, "global_step": 170657, "epoch": 1410} {"train_loss": -39.80941390991211, "global_step": 170658, "epoch": 1410} {"train_loss": -39.79780197143555, "global_step": 170659, "epoch": 1410} {"train_loss": -39.36031723022461, "global_step": 170660, "epoch": 1410} {"train_loss": -38.94159698486328, "global_step": 170661, "epoch": 1410} {"train_loss": -38.06892776489258, "global_step": 170662, "epoch": 1410} {"train_loss": -39.45661544799805, "global_step": 170663, "epoch": 1410} {"train_loss": -38.75687026977539, "global_step": 170664, "epoch": 1410} {"train_loss": -38.1197509765625, "global_step": 170665, "epoch": 1410} {"train_loss": -39.15149688720703, "global_step": 170666, "epoch": 1410} {"train_loss": -39.4326286315918, "global_step": 170667, "epoch": 1410} {"train_loss": -39.63339614868164, "global_step": 170668, "epoch": 1410} {"train_loss": -39.700870513916016, "global_step": 170669, "epoch": 1410} {"train_loss": -39.92311096191406, "global_step": 170670, "epoch": 1410} {"train_loss": -40.505775451660156, "global_step": 170671, "epoch": 1410} {"train_loss": -39.94826889038086, "global_step": 170672, "epoch": 1410} {"train_loss": -40.43391036987305, "global_step": 170673, "epoch": 1410} {"train_loss": -40.1451416015625, "global_step": 170674, "epoch": 1410} {"train_loss": -40.32640838623047, "global_step": 170675, "epoch": 1410} {"train_loss": -39.86181640625, "global_step": 170676, "epoch": 1410} {"train_loss": -39.65918731689453, "global_step": 170677, "epoch": 1410} {"train_loss": -39.2432975769043, "global_step": 170678, "epoch": 1410} {"train_loss": -40.633056640625, "global_step": 170679, "epoch": 1410} {"train_loss": -40.405765533447266, "global_step": 170680, "epoch": 1410} {"train_loss": -39.98679733276367, "global_step": 170681, "epoch": 1410} {"train_loss": -40.439449310302734, "global_step": 170682, "epoch": 1410} {"train_loss": -40.53479766845703, "global_step": 170683, "epoch": 1410} {"train_loss": -39.700042724609375, "global_step": 170684, "epoch": 1410} {"train_loss": -40.82089614868164, "global_step": 170685, "epoch": 1410} {"train_loss": -40.37946319580078, "global_step": 170686, "epoch": 1410} {"train_loss": -40.43556213378906, "global_step": 170687, "epoch": 1410} {"train_loss": -40.2506217956543, "global_step": 170688, "epoch": 1410} {"train_loss": -40.138240814208984, "global_step": 170689, "epoch": 1410} {"train_loss": -40.2058219909668, "global_step": 170690, "epoch": 1410} {"train_loss": -40.86381912231445, "global_step": 170691, "epoch": 1410} {"train_loss": -40.48748016357422, "global_step": 170692, "epoch": 1410} {"train_loss": -40.60367965698242, "global_step": 170693, "epoch": 1410} {"train_loss": -40.771183013916016, "global_step": 170694, "epoch": 1410} {"train_loss": -40.789180755615234, "global_step": 170695, "epoch": 1410} {"train_loss": -40.99403762817383, "global_step": 170696, "epoch": 1410} {"train_loss": -40.38239669799805, "global_step": 170697, "epoch": 1410} {"train_loss": -40.86896896362305, "global_step": 170698, "epoch": 1410} {"train_loss": -40.63711166381836, "global_step": 170699, "epoch": 1410} {"train_loss": -40.90226364135742, "global_step": 170700, "epoch": 1410} {"train_loss": -40.46638107299805, "global_step": 170701, "epoch": 1410} {"train_loss": -41.09912109375, "global_step": 170702, "epoch": 1410} {"train_loss": -40.72551727294922, "global_step": 170703, "epoch": 1410} {"train_loss": -41.02378463745117, "global_step": 170704, "epoch": 1410} {"train_loss": -40.74660110473633, "global_step": 170705, "epoch": 1410} {"train_loss": -40.55188751220703, "global_step": 170706, "epoch": 1410} {"train_loss": -41.333675384521484, "global_step": 170707, "epoch": 1410} {"train_loss": -40.96015930175781, "global_step": 170708, "epoch": 1410} {"train_loss": -40.0009765625, "global_step": 170709, "epoch": 1410} {"train_loss": -40.56269836425781, "global_step": 170710, "epoch": 1410} {"train_loss": -41.01314163208008, "global_step": 170711, "epoch": 1410} {"train_loss": -41.03718948364258, "global_step": 170712, "epoch": 1410} {"train_loss": -40.82258987426758, "global_step": 170713, "epoch": 1410} {"train_loss": -40.09473419189453, "global_step": 170714, "epoch": 1410} {"train_loss": -40.72511672973633, "global_step": 170715, "epoch": 1410} {"train_loss": -39.55560302734375, "global_step": 170716, "epoch": 1410} {"train_loss": -40.52998733520508, "global_step": 170717, "epoch": 1410} {"train_loss": -39.7809944152832, "global_step": 170718, "epoch": 1410} {"train_loss": -41.502044677734375, "global_step": 170719, "epoch": 1410} {"train_loss": -40.36332321166992, "global_step": 170720, "epoch": 1410} {"train_loss": -39.38163375854492, "global_step": 170721, "epoch": 1410} {"train_loss": -38.66619873046875, "global_step": 170722, "epoch": 1410} {"train_loss": -35.74739074707031, "global_step": 170723, "epoch": 1410} {"train_loss": -32.717403411865234, "global_step": 170724, "epoch": 1410} {"train_loss": -32.17584991455078, "global_step": 170725, "epoch": 1410} {"train_loss": -39.28744125366211, "global_step": 170726, "epoch": 1410} {"train_loss": -39.748695373535156, "global_step": 170727, "epoch": 1410} {"train_loss": -35.18618392944336, "global_step": 170728, "epoch": 1410} {"train_loss": -34.519771575927734, "global_step": 170729, "epoch": 1410} {"train_loss": -39.38597034422819, "global_step": 170730, "epoch": 1410, "val_loss": 2679173.0} {"train_loss": -37.5461540222168, "global_step": 170731, "epoch": 1411} {"train_loss": -38.46458053588867, "global_step": 170732, "epoch": 1411} {"train_loss": -39.61408615112305, "global_step": 170733, "epoch": 1411} {"train_loss": -39.792152404785156, "global_step": 170734, "epoch": 1411} {"train_loss": -38.270965576171875, "global_step": 170735, "epoch": 1411} {"train_loss": -38.373443603515625, "global_step": 170736, "epoch": 1411} {"train_loss": -39.47417068481445, "global_step": 170737, "epoch": 1411} {"train_loss": -40.35905838012695, "global_step": 170738, "epoch": 1411} {"train_loss": -39.94659423828125, "global_step": 170739, "epoch": 1411} {"train_loss": -39.54399490356445, "global_step": 170740, "epoch": 1411} {"train_loss": -40.673091888427734, "global_step": 170741, "epoch": 1411} {"train_loss": -39.86539840698242, "global_step": 170742, "epoch": 1411} {"train_loss": -40.771236419677734, "global_step": 170743, "epoch": 1411} {"train_loss": -39.77908706665039, "global_step": 170744, "epoch": 1411} {"train_loss": -38.99549865722656, "global_step": 170745, "epoch": 1411} {"train_loss": -39.33323669433594, "global_step": 170746, "epoch": 1411} {"train_loss": -39.830543518066406, "global_step": 170747, "epoch": 1411} {"train_loss": -39.76068878173828, "global_step": 170748, "epoch": 1411} {"train_loss": -40.33022689819336, "global_step": 170749, "epoch": 1411} {"train_loss": -39.85689926147461, "global_step": 170750, "epoch": 1411} {"train_loss": -39.9394645690918, "global_step": 170751, "epoch": 1411} {"train_loss": -40.052528381347656, "global_step": 170752, "epoch": 1411} {"train_loss": -39.02968978881836, "global_step": 170753, "epoch": 1411} {"train_loss": -40.487525939941406, "global_step": 170754, "epoch": 1411} {"train_loss": -39.456275939941406, "global_step": 170755, "epoch": 1411} {"train_loss": -39.905670166015625, "global_step": 170756, "epoch": 1411} {"train_loss": -39.77589797973633, "global_step": 170757, "epoch": 1411} {"train_loss": -39.966224670410156, "global_step": 170758, "epoch": 1411} {"train_loss": -38.01162338256836, "global_step": 170759, "epoch": 1411} {"train_loss": -39.92947006225586, "global_step": 170760, "epoch": 1411} {"train_loss": -39.86177444458008, "global_step": 170761, "epoch": 1411} {"train_loss": -40.23180389404297, "global_step": 170762, "epoch": 1411} {"train_loss": -40.81217575073242, "global_step": 170763, "epoch": 1411} {"train_loss": -39.45591735839844, "global_step": 170764, "epoch": 1411} {"train_loss": -40.106605529785156, "global_step": 170765, "epoch": 1411} {"train_loss": -40.30265426635742, "global_step": 170766, "epoch": 1411} {"train_loss": -40.15703201293945, "global_step": 170767, "epoch": 1411} {"train_loss": -40.85602951049805, "global_step": 170768, "epoch": 1411} {"train_loss": -40.660762786865234, "global_step": 170769, "epoch": 1411} {"train_loss": -40.79707336425781, "global_step": 170770, "epoch": 1411} {"train_loss": -39.93827438354492, "global_step": 170771, "epoch": 1411} {"train_loss": -40.23989486694336, "global_step": 170772, "epoch": 1411} {"train_loss": -40.77922821044922, "global_step": 170773, "epoch": 1411} {"train_loss": -39.81612014770508, "global_step": 170774, "epoch": 1411} {"train_loss": -40.49216842651367, "global_step": 170775, "epoch": 1411} {"train_loss": -40.989898681640625, "global_step": 170776, "epoch": 1411} {"train_loss": -40.2708854675293, "global_step": 170777, "epoch": 1411} {"train_loss": -41.11054229736328, "global_step": 170778, "epoch": 1411} {"train_loss": -40.67781066894531, "global_step": 170779, "epoch": 1411} {"train_loss": -41.52698516845703, "global_step": 170780, "epoch": 1411} {"train_loss": -40.96548080444336, "global_step": 170781, "epoch": 1411} {"train_loss": -40.44953918457031, "global_step": 170782, "epoch": 1411} {"train_loss": -41.39107894897461, "global_step": 170783, "epoch": 1411} {"train_loss": -41.026363372802734, "global_step": 170784, "epoch": 1411} {"train_loss": -40.52602005004883, "global_step": 170785, "epoch": 1411} {"train_loss": -41.21437454223633, "global_step": 170786, "epoch": 1411} {"train_loss": -40.98902130126953, "global_step": 170787, "epoch": 1411} {"train_loss": -41.44529342651367, "global_step": 170788, "epoch": 1411} {"train_loss": -40.946834564208984, "global_step": 170789, "epoch": 1411} {"train_loss": -41.13275909423828, "global_step": 170790, "epoch": 1411} {"train_loss": -41.255584716796875, "global_step": 170791, "epoch": 1411} {"train_loss": -41.01408004760742, "global_step": 170792, "epoch": 1411} {"train_loss": -41.08218002319336, "global_step": 170793, "epoch": 1411} {"train_loss": -40.73419952392578, "global_step": 170794, "epoch": 1411} {"train_loss": -41.2641487121582, "global_step": 170795, "epoch": 1411} {"train_loss": -41.70015335083008, "global_step": 170796, "epoch": 1411} {"train_loss": -41.517940521240234, "global_step": 170797, "epoch": 1411} {"train_loss": -41.0941276550293, "global_step": 170798, "epoch": 1411} {"train_loss": -41.5776252746582, "global_step": 170799, "epoch": 1411} {"train_loss": -39.86090850830078, "global_step": 170800, "epoch": 1411} {"train_loss": -41.17924880981445, "global_step": 170801, "epoch": 1411} {"train_loss": -41.27396774291992, "global_step": 170802, "epoch": 1411} {"train_loss": -41.573177337646484, "global_step": 170803, "epoch": 1411} {"train_loss": -41.28998947143555, "global_step": 170804, "epoch": 1411} {"train_loss": -41.6265754699707, "global_step": 170805, "epoch": 1411} {"train_loss": -41.370819091796875, "global_step": 170806, "epoch": 1411} {"train_loss": -41.42422866821289, "global_step": 170807, "epoch": 1411} {"train_loss": -41.10614776611328, "global_step": 170808, "epoch": 1411} {"train_loss": -41.2413444519043, "global_step": 170809, "epoch": 1411} {"train_loss": -41.764442443847656, "global_step": 170810, "epoch": 1411} {"train_loss": -41.47237777709961, "global_step": 170811, "epoch": 1411} {"train_loss": -40.76443099975586, "global_step": 170812, "epoch": 1411} {"train_loss": -40.85776901245117, "global_step": 170813, "epoch": 1411} {"train_loss": -41.961402893066406, "global_step": 170814, "epoch": 1411} {"train_loss": -41.8565788269043, "global_step": 170815, "epoch": 1411} {"train_loss": -41.04994583129883, "global_step": 170816, "epoch": 1411} {"train_loss": -40.55207061767578, "global_step": 170817, "epoch": 1411} {"train_loss": -40.697181701660156, "global_step": 170818, "epoch": 1411} {"train_loss": -40.64640426635742, "global_step": 170819, "epoch": 1411} {"train_loss": -39.4120979309082, "global_step": 170820, "epoch": 1411} {"train_loss": -38.811397552490234, "global_step": 170821, "epoch": 1411} {"train_loss": -39.235809326171875, "global_step": 170822, "epoch": 1411} {"train_loss": -39.36628341674805, "global_step": 170823, "epoch": 1411} {"train_loss": -41.0767822265625, "global_step": 170824, "epoch": 1411} {"train_loss": -41.67851257324219, "global_step": 170825, "epoch": 1411} {"train_loss": -39.607784271240234, "global_step": 170826, "epoch": 1411} {"train_loss": -41.121337890625, "global_step": 170827, "epoch": 1411} {"train_loss": -41.138702392578125, "global_step": 170828, "epoch": 1411} {"train_loss": -40.68644332885742, "global_step": 170829, "epoch": 1411} {"train_loss": -41.48230743408203, "global_step": 170830, "epoch": 1411} {"train_loss": -41.485347747802734, "global_step": 170831, "epoch": 1411} {"train_loss": -40.27411651611328, "global_step": 170832, "epoch": 1411} {"train_loss": -39.982093811035156, "global_step": 170833, "epoch": 1411} {"train_loss": -41.429847717285156, "global_step": 170834, "epoch": 1411} {"train_loss": -40.34383010864258, "global_step": 170835, "epoch": 1411} {"train_loss": -39.25711441040039, "global_step": 170836, "epoch": 1411} {"train_loss": -41.48939895629883, "global_step": 170837, "epoch": 1411} {"train_loss": -41.49528884887695, "global_step": 170838, "epoch": 1411} {"train_loss": -39.97921371459961, "global_step": 170839, "epoch": 1411} {"train_loss": -41.41472244262695, "global_step": 170840, "epoch": 1411} {"train_loss": -41.15585708618164, "global_step": 170841, "epoch": 1411} {"train_loss": -40.80397415161133, "global_step": 170842, "epoch": 1411} {"train_loss": -41.22211456298828, "global_step": 170843, "epoch": 1411} {"train_loss": -41.46476364135742, "global_step": 170844, "epoch": 1411} {"train_loss": -41.42477035522461, "global_step": 170845, "epoch": 1411} {"train_loss": -41.38112258911133, "global_step": 170846, "epoch": 1411} {"train_loss": -41.36880111694336, "global_step": 170847, "epoch": 1411} {"train_loss": -41.31196975708008, "global_step": 170848, "epoch": 1411} {"train_loss": -41.250667572021484, "global_step": 170849, "epoch": 1411} {"train_loss": -40.459110260009766, "global_step": 170850, "epoch": 1411} {"train_loss": -40.53531845344985, "global_step": 170851, "epoch": 1411, "val_loss": 2842811.0} {"train_loss": -40.539188385009766, "global_step": 170852, "epoch": 1412} {"train_loss": -40.35452651977539, "global_step": 170853, "epoch": 1412} {"train_loss": -40.92731857299805, "global_step": 170854, "epoch": 1412} {"train_loss": -41.76777267456055, "global_step": 170855, "epoch": 1412} {"train_loss": -40.9468994140625, "global_step": 170856, "epoch": 1412} {"train_loss": -40.913387298583984, "global_step": 170857, "epoch": 1412} {"train_loss": -40.7201042175293, "global_step": 170858, "epoch": 1412} {"train_loss": -38.68915557861328, "global_step": 170859, "epoch": 1412} {"train_loss": -38.227691650390625, "global_step": 170860, "epoch": 1412} {"train_loss": -39.223182678222656, "global_step": 170861, "epoch": 1412} {"train_loss": -40.38576889038086, "global_step": 170862, "epoch": 1412} {"train_loss": -40.699676513671875, "global_step": 170863, "epoch": 1412} {"train_loss": -40.29106140136719, "global_step": 170864, "epoch": 1412} {"train_loss": -37.9890022277832, "global_step": 170865, "epoch": 1412} {"train_loss": -39.14534378051758, "global_step": 170866, "epoch": 1412} {"train_loss": -39.33217239379883, "global_step": 170867, "epoch": 1412} {"train_loss": -40.37376022338867, "global_step": 170868, "epoch": 1412} {"train_loss": -40.3824577331543, "global_step": 170869, "epoch": 1412} {"train_loss": -38.922916412353516, "global_step": 170870, "epoch": 1412} {"train_loss": -40.635467529296875, "global_step": 170871, "epoch": 1412} {"train_loss": -41.767799377441406, "global_step": 170872, "epoch": 1412} {"train_loss": -39.734893798828125, "global_step": 170873, "epoch": 1412} {"train_loss": -39.858306884765625, "global_step": 170874, "epoch": 1412} {"train_loss": -40.726051330566406, "global_step": 170875, "epoch": 1412} {"train_loss": -40.47150421142578, "global_step": 170876, "epoch": 1412} {"train_loss": -40.397945404052734, "global_step": 170877, "epoch": 1412} {"train_loss": -40.39874267578125, "global_step": 170878, "epoch": 1412} {"train_loss": -40.60028839111328, "global_step": 170879, "epoch": 1412} {"train_loss": -40.20182418823242, "global_step": 170880, "epoch": 1412} {"train_loss": -40.74580001831055, "global_step": 170881, "epoch": 1412} {"train_loss": -41.298397064208984, "global_step": 170882, "epoch": 1412} {"train_loss": -39.890926361083984, "global_step": 170883, "epoch": 1412} {"train_loss": -41.023433685302734, "global_step": 170884, "epoch": 1412} {"train_loss": -40.7291145324707, "global_step": 170885, "epoch": 1412} {"train_loss": -41.33192443847656, "global_step": 170886, "epoch": 1412} {"train_loss": -40.875343322753906, "global_step": 170887, "epoch": 1412} {"train_loss": -40.76801300048828, "global_step": 170888, "epoch": 1412} {"train_loss": -40.602657318115234, "global_step": 170889, "epoch": 1412} {"train_loss": -41.208736419677734, "global_step": 170890, "epoch": 1412} {"train_loss": -41.063228607177734, "global_step": 170891, "epoch": 1412} {"train_loss": -41.43134307861328, "global_step": 170892, "epoch": 1412} {"train_loss": -40.81550979614258, "global_step": 170893, "epoch": 1412} {"train_loss": -41.597537994384766, "global_step": 170894, "epoch": 1412} {"train_loss": -40.85844802856445, "global_step": 170895, "epoch": 1412} {"train_loss": -41.678260803222656, "global_step": 170896, "epoch": 1412} {"train_loss": -41.65627670288086, "global_step": 170897, "epoch": 1412} {"train_loss": -41.42135238647461, "global_step": 170898, "epoch": 1412} {"train_loss": -41.17838668823242, "global_step": 170899, "epoch": 1412} {"train_loss": -41.480865478515625, "global_step": 170900, "epoch": 1412} {"train_loss": -40.918880462646484, "global_step": 170901, "epoch": 1412} {"train_loss": -40.82184982299805, "global_step": 170902, "epoch": 1412} {"train_loss": -41.39841842651367, "global_step": 170903, "epoch": 1412} {"train_loss": -41.704254150390625, "global_step": 170904, "epoch": 1412} {"train_loss": -41.32905960083008, "global_step": 170905, "epoch": 1412} {"train_loss": -41.0368537902832, "global_step": 170906, "epoch": 1412} {"train_loss": -41.58659362792969, "global_step": 170907, "epoch": 1412} {"train_loss": -41.05952072143555, "global_step": 170908, "epoch": 1412} {"train_loss": -41.306846618652344, "global_step": 170909, "epoch": 1412} {"train_loss": -41.35988998413086, "global_step": 170910, "epoch": 1412} {"train_loss": -41.45327377319336, "global_step": 170911, "epoch": 1412} {"train_loss": -41.4748420715332, "global_step": 170912, "epoch": 1412} {"train_loss": -41.638946533203125, "global_step": 170913, "epoch": 1412} {"train_loss": -40.60213088989258, "global_step": 170914, "epoch": 1412} {"train_loss": -41.349979400634766, "global_step": 170915, "epoch": 1412} {"train_loss": -41.17853927612305, "global_step": 170916, "epoch": 1412} {"train_loss": -40.799198150634766, "global_step": 170917, "epoch": 1412} {"train_loss": -39.91501998901367, "global_step": 170918, "epoch": 1412} {"train_loss": -40.93703079223633, "global_step": 170919, "epoch": 1412} {"train_loss": -40.063175201416016, "global_step": 170920, "epoch": 1412} {"train_loss": -37.976837158203125, "global_step": 170921, "epoch": 1412} {"train_loss": -38.62482833862305, "global_step": 170922, "epoch": 1412} {"train_loss": -38.42091751098633, "global_step": 170923, "epoch": 1412} {"train_loss": -40.28025436401367, "global_step": 170924, "epoch": 1412} {"train_loss": -35.6855583190918, "global_step": 170925, "epoch": 1412} {"train_loss": -38.12360763549805, "global_step": 170926, "epoch": 1412} {"train_loss": -38.20609664916992, "global_step": 170927, "epoch": 1412} {"train_loss": -38.13643264770508, "global_step": 170928, "epoch": 1412} {"train_loss": -38.10660934448242, "global_step": 170929, "epoch": 1412} {"train_loss": -37.9830322265625, "global_step": 170930, "epoch": 1412} {"train_loss": -40.180816650390625, "global_step": 170931, "epoch": 1412} {"train_loss": -34.581336975097656, "global_step": 170932, "epoch": 1412} {"train_loss": -36.4270133972168, "global_step": 170933, "epoch": 1412} {"train_loss": -37.2712287902832, "global_step": 170934, "epoch": 1412} {"train_loss": -37.89492416381836, "global_step": 170935, "epoch": 1412} {"train_loss": -35.196678161621094, "global_step": 170936, "epoch": 1412} {"train_loss": -39.596500396728516, "global_step": 170937, "epoch": 1412} {"train_loss": -37.538761138916016, "global_step": 170938, "epoch": 1412} {"train_loss": -38.60721969604492, "global_step": 170939, "epoch": 1412} {"train_loss": -37.9762077331543, "global_step": 170940, "epoch": 1412} {"train_loss": -39.848323822021484, "global_step": 170941, "epoch": 1412} {"train_loss": -38.962432861328125, "global_step": 170942, "epoch": 1412} {"train_loss": -40.28578567504883, "global_step": 170943, "epoch": 1412} {"train_loss": -38.67512130737305, "global_step": 170944, "epoch": 1412} {"train_loss": -38.8157958984375, "global_step": 170945, "epoch": 1412} {"train_loss": -40.443397521972656, "global_step": 170946, "epoch": 1412} {"train_loss": -40.530330657958984, "global_step": 170947, "epoch": 1412} {"train_loss": -39.5697135925293, "global_step": 170948, "epoch": 1412} {"train_loss": -40.75001525878906, "global_step": 170949, "epoch": 1412} {"train_loss": -39.5598258972168, "global_step": 170950, "epoch": 1412} {"train_loss": -40.2472038269043, "global_step": 170951, "epoch": 1412} {"train_loss": -38.67280197143555, "global_step": 170952, "epoch": 1412} {"train_loss": -39.8466911315918, "global_step": 170953, "epoch": 1412} {"train_loss": -40.70248031616211, "global_step": 170954, "epoch": 1412} {"train_loss": -40.52439498901367, "global_step": 170955, "epoch": 1412} {"train_loss": -38.3577766418457, "global_step": 170956, "epoch": 1412} {"train_loss": -40.58698272705078, "global_step": 170957, "epoch": 1412} {"train_loss": -39.61637496948242, "global_step": 170958, "epoch": 1412} {"train_loss": -40.3484001159668, "global_step": 170959, "epoch": 1412} {"train_loss": -40.90440368652344, "global_step": 170960, "epoch": 1412} {"train_loss": -39.08575439453125, "global_step": 170961, "epoch": 1412} {"train_loss": -40.511898040771484, "global_step": 170962, "epoch": 1412} {"train_loss": -40.47053146362305, "global_step": 170963, "epoch": 1412} {"train_loss": -40.40639877319336, "global_step": 170964, "epoch": 1412} {"train_loss": -40.2059440612793, "global_step": 170965, "epoch": 1412} {"train_loss": -41.51040267944336, "global_step": 170966, "epoch": 1412} {"train_loss": -40.33149337768555, "global_step": 170967, "epoch": 1412} {"train_loss": -40.84435272216797, "global_step": 170968, "epoch": 1412} {"train_loss": -40.738704681396484, "global_step": 170969, "epoch": 1412} {"train_loss": -39.67424774169922, "global_step": 170970, "epoch": 1412} {"train_loss": -40.98091506958008, "global_step": 170971, "epoch": 1412} {"train_loss": -40.06650685081797, "global_step": 170972, "epoch": 1412, "val_loss": 2897897.75} {"train_loss": -40.946659088134766, "global_step": 170973, "epoch": 1413} {"train_loss": -41.14921188354492, "global_step": 170974, "epoch": 1413} {"train_loss": -41.759159088134766, "global_step": 170975, "epoch": 1413} {"train_loss": -40.11886215209961, "global_step": 170976, "epoch": 1413} {"train_loss": -40.70108413696289, "global_step": 170977, "epoch": 1413} {"train_loss": -40.9984245300293, "global_step": 170978, "epoch": 1413} {"train_loss": -40.86257553100586, "global_step": 170979, "epoch": 1413} {"train_loss": -39.80131149291992, "global_step": 170980, "epoch": 1413} {"train_loss": -40.1407585144043, "global_step": 170981, "epoch": 1413} {"train_loss": -41.26445770263672, "global_step": 170982, "epoch": 1413} {"train_loss": -40.9356575012207, "global_step": 170983, "epoch": 1413} {"train_loss": -41.263221740722656, "global_step": 170984, "epoch": 1413} {"train_loss": -40.78851318359375, "global_step": 170985, "epoch": 1413} {"train_loss": -40.52024841308594, "global_step": 170986, "epoch": 1413} {"train_loss": -41.343502044677734, "global_step": 170987, "epoch": 1413} {"train_loss": -40.31977462768555, "global_step": 170988, "epoch": 1413} {"train_loss": -40.89272689819336, "global_step": 170989, "epoch": 1413} {"train_loss": -40.98659133911133, "global_step": 170990, "epoch": 1413} {"train_loss": -40.938594818115234, "global_step": 170991, "epoch": 1413} {"train_loss": -41.32830047607422, "global_step": 170992, "epoch": 1413} {"train_loss": -41.49154281616211, "global_step": 170993, "epoch": 1413} {"train_loss": -41.23720932006836, "global_step": 170994, "epoch": 1413} {"train_loss": -41.9462776184082, "global_step": 170995, "epoch": 1413} {"train_loss": -40.90574264526367, "global_step": 170996, "epoch": 1413} {"train_loss": -41.09370803833008, "global_step": 170997, "epoch": 1413} {"train_loss": -41.75743103027344, "global_step": 170998, "epoch": 1413} {"train_loss": -40.90574264526367, "global_step": 170999, "epoch": 1413} {"train_loss": -40.90216064453125, "global_step": 171000, "epoch": 1413} {"train_loss": -41.030303955078125, "global_step": 171001, "epoch": 1413} {"train_loss": -39.89875030517578, "global_step": 171002, "epoch": 1413} {"train_loss": -39.97202682495117, "global_step": 171003, "epoch": 1413} {"train_loss": -40.911659240722656, "global_step": 171004, "epoch": 1413} {"train_loss": -41.48978805541992, "global_step": 171005, "epoch": 1413} {"train_loss": -41.08858871459961, "global_step": 171006, "epoch": 1413} {"train_loss": -40.48321533203125, "global_step": 171007, "epoch": 1413} {"train_loss": -40.48384094238281, "global_step": 171008, "epoch": 1413} {"train_loss": -40.835487365722656, "global_step": 171009, "epoch": 1413} {"train_loss": -41.17483139038086, "global_step": 171010, "epoch": 1413} {"train_loss": -39.925960540771484, "global_step": 171011, "epoch": 1413} {"train_loss": -39.169769287109375, "global_step": 171012, "epoch": 1413} {"train_loss": -40.563018798828125, "global_step": 171013, "epoch": 1413} {"train_loss": -41.73310470581055, "global_step": 171014, "epoch": 1413} {"train_loss": -40.56306838989258, "global_step": 171015, "epoch": 1413} {"train_loss": -39.538185119628906, "global_step": 171016, "epoch": 1413} {"train_loss": -39.504844665527344, "global_step": 171017, "epoch": 1413} {"train_loss": -40.71002197265625, "global_step": 171018, "epoch": 1413} {"train_loss": -41.05454635620117, "global_step": 171019, "epoch": 1413} {"train_loss": -40.02998352050781, "global_step": 171020, "epoch": 1413} {"train_loss": -40.80624008178711, "global_step": 171021, "epoch": 1413} {"train_loss": -41.111289978027344, "global_step": 171022, "epoch": 1413} {"train_loss": -40.95089340209961, "global_step": 171023, "epoch": 1413} {"train_loss": -41.25354766845703, "global_step": 171024, "epoch": 1413} {"train_loss": -41.62905502319336, "global_step": 171025, "epoch": 1413} {"train_loss": -41.40577697753906, "global_step": 171026, "epoch": 1413} {"train_loss": -40.25141525268555, "global_step": 171027, "epoch": 1413} {"train_loss": -40.76210021972656, "global_step": 171028, "epoch": 1413} {"train_loss": -40.472755432128906, "global_step": 171029, "epoch": 1413} {"train_loss": -39.42564010620117, "global_step": 171030, "epoch": 1413} {"train_loss": -40.12959289550781, "global_step": 171031, "epoch": 1413} {"train_loss": -39.499080657958984, "global_step": 171032, "epoch": 1413} {"train_loss": -39.71383285522461, "global_step": 171033, "epoch": 1413} {"train_loss": -41.11688995361328, "global_step": 171034, "epoch": 1413} {"train_loss": -40.49628829956055, "global_step": 171035, "epoch": 1413} {"train_loss": -39.582088470458984, "global_step": 171036, "epoch": 1413} {"train_loss": -39.81473922729492, "global_step": 171037, "epoch": 1413} {"train_loss": -40.33338165283203, "global_step": 171038, "epoch": 1413} {"train_loss": -39.38800811767578, "global_step": 171039, "epoch": 1413} {"train_loss": -41.12538146972656, "global_step": 171040, "epoch": 1413} {"train_loss": -39.93748092651367, "global_step": 171041, "epoch": 1413} {"train_loss": -40.80348587036133, "global_step": 171042, "epoch": 1413} {"train_loss": -40.6717529296875, "global_step": 171043, "epoch": 1413} {"train_loss": -40.228065490722656, "global_step": 171044, "epoch": 1413} {"train_loss": -40.37081527709961, "global_step": 171045, "epoch": 1413} {"train_loss": -39.973175048828125, "global_step": 171046, "epoch": 1413} {"train_loss": -41.30805969238281, "global_step": 171047, "epoch": 1413} {"train_loss": -39.6575927734375, "global_step": 171048, "epoch": 1413} {"train_loss": -40.17042922973633, "global_step": 171049, "epoch": 1413} {"train_loss": -41.3311653137207, "global_step": 171050, "epoch": 1413} {"train_loss": -39.344764709472656, "global_step": 171051, "epoch": 1413} {"train_loss": -40.33736801147461, "global_step": 171052, "epoch": 1413} {"train_loss": -40.898799896240234, "global_step": 171053, "epoch": 1413} {"train_loss": -40.30522537231445, "global_step": 171054, "epoch": 1413} {"train_loss": -40.98961639404297, "global_step": 171055, "epoch": 1413} {"train_loss": -41.50617218017578, "global_step": 171056, "epoch": 1413} {"train_loss": -40.380855560302734, "global_step": 171057, "epoch": 1413} {"train_loss": -41.24143600463867, "global_step": 171058, "epoch": 1413} {"train_loss": -41.577674865722656, "global_step": 171059, "epoch": 1413} {"train_loss": -41.19424057006836, "global_step": 171060, "epoch": 1413} {"train_loss": -40.60099792480469, "global_step": 171061, "epoch": 1413} {"train_loss": -40.692352294921875, "global_step": 171062, "epoch": 1413} {"train_loss": -41.2333984375, "global_step": 171063, "epoch": 1413} {"train_loss": -40.68074417114258, "global_step": 171064, "epoch": 1413} {"train_loss": -41.22625732421875, "global_step": 171065, "epoch": 1413} {"train_loss": -40.796112060546875, "global_step": 171066, "epoch": 1413} {"train_loss": -39.5586051940918, "global_step": 171067, "epoch": 1413} {"train_loss": -41.486419677734375, "global_step": 171068, "epoch": 1413} {"train_loss": -41.8385009765625, "global_step": 171069, "epoch": 1413} {"train_loss": -41.63627243041992, "global_step": 171070, "epoch": 1413} {"train_loss": -41.82221221923828, "global_step": 171071, "epoch": 1413} {"train_loss": -41.84683609008789, "global_step": 171072, "epoch": 1413} {"train_loss": -41.77447509765625, "global_step": 171073, "epoch": 1413} {"train_loss": -41.51858139038086, "global_step": 171074, "epoch": 1413} {"train_loss": -40.79634475708008, "global_step": 171075, "epoch": 1413} {"train_loss": -41.9121208190918, "global_step": 171076, "epoch": 1413} {"train_loss": -41.533241271972656, "global_step": 171077, "epoch": 1413} {"train_loss": -40.89926528930664, "global_step": 171078, "epoch": 1413} {"train_loss": -41.652992248535156, "global_step": 171079, "epoch": 1413} {"train_loss": -41.28848648071289, "global_step": 171080, "epoch": 1413} {"train_loss": -39.1232795715332, "global_step": 171081, "epoch": 1413} {"train_loss": -38.34669876098633, "global_step": 171082, "epoch": 1413} {"train_loss": -40.09088134765625, "global_step": 171083, "epoch": 1413} {"train_loss": -41.534820556640625, "global_step": 171084, "epoch": 1413} {"train_loss": -38.03049850463867, "global_step": 171085, "epoch": 1413} {"train_loss": -37.68525314331055, "global_step": 171086, "epoch": 1413} {"train_loss": -39.23112487792969, "global_step": 171087, "epoch": 1413} {"train_loss": -39.08177185058594, "global_step": 171088, "epoch": 1413} {"train_loss": -40.07326126098633, "global_step": 171089, "epoch": 1413} {"train_loss": -40.95912551879883, "global_step": 171090, "epoch": 1413} {"train_loss": -41.03597640991211, "global_step": 171091, "epoch": 1413} {"train_loss": -39.9185676574707, "global_step": 171092, "epoch": 1413} {"train_loss": -40.660753959466604, "global_step": 171093, "epoch": 1413, "val_loss": 2740307.0} {"train_loss": -41.32772445678711, "global_step": 171094, "epoch": 1414} {"train_loss": -41.52684020996094, "global_step": 171095, "epoch": 1414} {"train_loss": -41.067169189453125, "global_step": 171096, "epoch": 1414} {"train_loss": -41.24872589111328, "global_step": 171097, "epoch": 1414} {"train_loss": -41.48688888549805, "global_step": 171098, "epoch": 1414} {"train_loss": -40.438232421875, "global_step": 171099, "epoch": 1414} {"train_loss": -41.64727020263672, "global_step": 171100, "epoch": 1414} {"train_loss": -41.65443801879883, "global_step": 171101, "epoch": 1414} {"train_loss": -41.61357498168945, "global_step": 171102, "epoch": 1414} {"train_loss": -41.544490814208984, "global_step": 171103, "epoch": 1414} {"train_loss": -40.71604919433594, "global_step": 171104, "epoch": 1414} {"train_loss": -41.728309631347656, "global_step": 171105, "epoch": 1414} {"train_loss": -41.914710998535156, "global_step": 171106, "epoch": 1414} {"train_loss": -41.7239875793457, "global_step": 171107, "epoch": 1414} {"train_loss": -41.55706787109375, "global_step": 171108, "epoch": 1414} {"train_loss": -40.80702590942383, "global_step": 171109, "epoch": 1414} {"train_loss": -40.51466751098633, "global_step": 171110, "epoch": 1414} {"train_loss": -41.605098724365234, "global_step": 171111, "epoch": 1414} {"train_loss": -41.29586410522461, "global_step": 171112, "epoch": 1414} {"train_loss": -41.24233627319336, "global_step": 171113, "epoch": 1414} {"train_loss": -41.76967239379883, "global_step": 171114, "epoch": 1414} {"train_loss": -41.474491119384766, "global_step": 171115, "epoch": 1414} {"train_loss": -41.22886276245117, "global_step": 171116, "epoch": 1414} {"train_loss": -41.919551849365234, "global_step": 171117, "epoch": 1414} {"train_loss": -41.43337631225586, "global_step": 171118, "epoch": 1414} {"train_loss": -41.6005973815918, "global_step": 171119, "epoch": 1414} {"train_loss": -41.01760482788086, "global_step": 171120, "epoch": 1414} {"train_loss": -41.47511672973633, "global_step": 171121, "epoch": 1414} {"train_loss": -40.265235900878906, "global_step": 171122, "epoch": 1414} {"train_loss": -39.80837631225586, "global_step": 171123, "epoch": 1414} {"train_loss": -39.10107421875, "global_step": 171124, "epoch": 1414} {"train_loss": -38.49347686767578, "global_step": 171125, "epoch": 1414} {"train_loss": -35.530757904052734, "global_step": 171126, "epoch": 1414} {"train_loss": -34.70326614379883, "global_step": 171127, "epoch": 1414} {"train_loss": -39.4295768737793, "global_step": 171128, "epoch": 1414} {"train_loss": -37.300899505615234, "global_step": 171129, "epoch": 1414} {"train_loss": -32.91083526611328, "global_step": 171130, "epoch": 1414} {"train_loss": -38.3549919128418, "global_step": 171131, "epoch": 1414} {"train_loss": -37.636417388916016, "global_step": 171132, "epoch": 1414} {"train_loss": -33.99014663696289, "global_step": 171133, "epoch": 1414} {"train_loss": -38.0856819152832, "global_step": 171134, "epoch": 1414} {"train_loss": -37.273738861083984, "global_step": 171135, "epoch": 1414} {"train_loss": -38.373291015625, "global_step": 171136, "epoch": 1414} {"train_loss": -37.43378829956055, "global_step": 171137, "epoch": 1414} {"train_loss": -36.723304748535156, "global_step": 171138, "epoch": 1414} {"train_loss": -39.10980224609375, "global_step": 171139, "epoch": 1414} {"train_loss": -40.18317794799805, "global_step": 171140, "epoch": 1414} {"train_loss": -38.42830276489258, "global_step": 171141, "epoch": 1414} {"train_loss": -40.187828063964844, "global_step": 171142, "epoch": 1414} {"train_loss": -39.82842254638672, "global_step": 171143, "epoch": 1414} {"train_loss": -40.44914627075195, "global_step": 171144, "epoch": 1414} {"train_loss": -38.781150817871094, "global_step": 171145, "epoch": 1414} {"train_loss": -40.433685302734375, "global_step": 171146, "epoch": 1414} {"train_loss": -38.72016143798828, "global_step": 171147, "epoch": 1414} {"train_loss": -41.39558029174805, "global_step": 171148, "epoch": 1414} {"train_loss": -38.877986907958984, "global_step": 171149, "epoch": 1414} {"train_loss": -39.94635009765625, "global_step": 171150, "epoch": 1414} {"train_loss": -40.9040641784668, "global_step": 171151, "epoch": 1414} {"train_loss": -40.3372688293457, "global_step": 171152, "epoch": 1414} {"train_loss": -40.638404846191406, "global_step": 171153, "epoch": 1414} {"train_loss": -41.17827606201172, "global_step": 171154, "epoch": 1414} {"train_loss": -40.70053482055664, "global_step": 171155, "epoch": 1414} {"train_loss": -40.47147750854492, "global_step": 171156, "epoch": 1414} {"train_loss": -41.28474807739258, "global_step": 171157, "epoch": 1414} {"train_loss": -41.0804443359375, "global_step": 171158, "epoch": 1414} {"train_loss": -41.114288330078125, "global_step": 171159, "epoch": 1414} {"train_loss": -41.13622283935547, "global_step": 171160, "epoch": 1414} {"train_loss": -41.44458770751953, "global_step": 171161, "epoch": 1414} {"train_loss": -41.36902618408203, "global_step": 171162, "epoch": 1414} {"train_loss": -41.59096908569336, "global_step": 171163, "epoch": 1414} {"train_loss": -41.457969665527344, "global_step": 171164, "epoch": 1414} {"train_loss": -41.442840576171875, "global_step": 171165, "epoch": 1414} {"train_loss": -41.38615798950195, "global_step": 171166, "epoch": 1414} {"train_loss": -41.848140716552734, "global_step": 171167, "epoch": 1414} {"train_loss": -41.14886474609375, "global_step": 171168, "epoch": 1414} {"train_loss": -41.24514389038086, "global_step": 171169, "epoch": 1414} {"train_loss": -41.25770950317383, "global_step": 171170, "epoch": 1414} {"train_loss": -41.8922119140625, "global_step": 171171, "epoch": 1414} {"train_loss": -41.63035202026367, "global_step": 171172, "epoch": 1414} {"train_loss": -41.52785873413086, "global_step": 171173, "epoch": 1414} {"train_loss": -42.029781341552734, "global_step": 171174, "epoch": 1414} {"train_loss": -41.30373764038086, "global_step": 171175, "epoch": 1414} {"train_loss": -41.6851921081543, "global_step": 171176, "epoch": 1414} {"train_loss": -41.694480895996094, "global_step": 171177, "epoch": 1414} {"train_loss": -41.90189743041992, "global_step": 171178, "epoch": 1414} {"train_loss": -41.597068786621094, "global_step": 171179, "epoch": 1414} {"train_loss": -41.65560531616211, "global_step": 171180, "epoch": 1414} {"train_loss": -41.22391891479492, "global_step": 171181, "epoch": 1414} {"train_loss": -41.876461029052734, "global_step": 171182, "epoch": 1414} {"train_loss": -41.82008361816406, "global_step": 171183, "epoch": 1414} {"train_loss": -41.5551872253418, "global_step": 171184, "epoch": 1414} {"train_loss": -42.067535400390625, "global_step": 171185, "epoch": 1414} {"train_loss": -42.138587951660156, "global_step": 171186, "epoch": 1414} {"train_loss": -40.53120040893555, "global_step": 171187, "epoch": 1414} {"train_loss": -41.55654525756836, "global_step": 171188, "epoch": 1414} {"train_loss": -42.016170501708984, "global_step": 171189, "epoch": 1414} {"train_loss": -41.74357223510742, "global_step": 171190, "epoch": 1414} {"train_loss": -41.1072883605957, "global_step": 171191, "epoch": 1414} {"train_loss": -39.79995346069336, "global_step": 171192, "epoch": 1414} {"train_loss": -39.9235954284668, "global_step": 171193, "epoch": 1414} {"train_loss": -39.18571090698242, "global_step": 171194, "epoch": 1414} {"train_loss": -40.886871337890625, "global_step": 171195, "epoch": 1414} {"train_loss": -39.18486785888672, "global_step": 171196, "epoch": 1414} {"train_loss": -36.18777847290039, "global_step": 171197, "epoch": 1414} {"train_loss": -36.551265716552734, "global_step": 171198, "epoch": 1414} {"train_loss": -37.36052322387695, "global_step": 171199, "epoch": 1414} {"train_loss": -36.55160140991211, "global_step": 171200, "epoch": 1414} {"train_loss": -37.57650375366211, "global_step": 171201, "epoch": 1414} {"train_loss": -37.726356506347656, "global_step": 171202, "epoch": 1414} {"train_loss": -37.80615234375, "global_step": 171203, "epoch": 1414} {"train_loss": -39.413997650146484, "global_step": 171204, "epoch": 1414} {"train_loss": -37.63801956176758, "global_step": 171205, "epoch": 1414} {"train_loss": -36.90597152709961, "global_step": 171206, "epoch": 1414} {"train_loss": -38.894283294677734, "global_step": 171207, "epoch": 1414} {"train_loss": -40.76132583618164, "global_step": 171208, "epoch": 1414} {"train_loss": -39.103248596191406, "global_step": 171209, "epoch": 1414} {"train_loss": -39.48164749145508, "global_step": 171210, "epoch": 1414} {"train_loss": -40.3726692199707, "global_step": 171211, "epoch": 1414} {"train_loss": -38.537052154541016, "global_step": 171212, "epoch": 1414} {"train_loss": -39.62405776977539, "global_step": 171213, "epoch": 1414} {"train_loss": -40.09810436658623, "global_step": 171214, "epoch": 1414, "val_loss": 2875019.25} {"train_loss": -39.312255859375, "global_step": 171215, "epoch": 1415} {"train_loss": -40.357147216796875, "global_step": 171216, "epoch": 1415} {"train_loss": -37.42897415161133, "global_step": 171217, "epoch": 1415} {"train_loss": -40.26845932006836, "global_step": 171218, "epoch": 1415} {"train_loss": -36.53353500366211, "global_step": 171219, "epoch": 1415} {"train_loss": -39.5822868347168, "global_step": 171220, "epoch": 1415} {"train_loss": -30.3012752532959, "global_step": 171221, "epoch": 1415} {"train_loss": -39.65464401245117, "global_step": 171222, "epoch": 1415} {"train_loss": -39.840301513671875, "global_step": 171223, "epoch": 1415} {"train_loss": -36.940372467041016, "global_step": 171224, "epoch": 1415} {"train_loss": -34.26504898071289, "global_step": 171225, "epoch": 1415} {"train_loss": -30.646787643432617, "global_step": 171226, "epoch": 1415} {"train_loss": -7.0835700035095215, "global_step": 171227, "epoch": 1415} {"train_loss": -32.38619613647461, "global_step": 171228, "epoch": 1415} {"train_loss": -31.480077743530273, "global_step": 171229, "epoch": 1415} {"train_loss": -32.4370231628418, "global_step": 171230, "epoch": 1415} {"train_loss": -31.0780029296875, "global_step": 171231, "epoch": 1415} {"train_loss": -30.2910213470459, "global_step": 171232, "epoch": 1415} {"train_loss": -27.524078369140625, "global_step": 171233, "epoch": 1415} {"train_loss": -22.635467529296875, "global_step": 171234, "epoch": 1415} {"train_loss": -31.777862548828125, "global_step": 171235, "epoch": 1415} {"train_loss": -35.27067947387695, "global_step": 171236, "epoch": 1415} {"train_loss": -29.771093368530273, "global_step": 171237, "epoch": 1415} {"train_loss": -29.2076473236084, "global_step": 171238, "epoch": 1415} {"train_loss": -32.016536712646484, "global_step": 171239, "epoch": 1415} {"train_loss": -31.47412109375, "global_step": 171240, "epoch": 1415} {"train_loss": -33.2055549621582, "global_step": 171241, "epoch": 1415} {"train_loss": -36.221256256103516, "global_step": 171242, "epoch": 1415} {"train_loss": -36.00027847290039, "global_step": 171243, "epoch": 1415} {"train_loss": -35.768402099609375, "global_step": 171244, "epoch": 1415} {"train_loss": -37.522762298583984, "global_step": 171245, "epoch": 1415} {"train_loss": -36.709007263183594, "global_step": 171246, "epoch": 1415} {"train_loss": -33.535675048828125, "global_step": 171247, "epoch": 1415} {"train_loss": -35.61833190917969, "global_step": 171248, "epoch": 1415} {"train_loss": -35.199554443359375, "global_step": 171249, "epoch": 1415} {"train_loss": -31.90216636657715, "global_step": 171250, "epoch": 1415} {"train_loss": -35.486690521240234, "global_step": 171251, "epoch": 1415} {"train_loss": -37.02756118774414, "global_step": 171252, "epoch": 1415} {"train_loss": -36.63080596923828, "global_step": 171253, "epoch": 1415} {"train_loss": -37.49540328979492, "global_step": 171254, "epoch": 1415} {"train_loss": -37.325706481933594, "global_step": 171255, "epoch": 1415} {"train_loss": -37.61933517456055, "global_step": 171256, "epoch": 1415} {"train_loss": -37.53225326538086, "global_step": 171257, "epoch": 1415} {"train_loss": -35.703277587890625, "global_step": 171258, "epoch": 1415} {"train_loss": -37.76394271850586, "global_step": 171259, "epoch": 1415} {"train_loss": -36.90080642700195, "global_step": 171260, "epoch": 1415} {"train_loss": -37.11008834838867, "global_step": 171261, "epoch": 1415} {"train_loss": -38.05127716064453, "global_step": 171262, "epoch": 1415} {"train_loss": -37.49177169799805, "global_step": 171263, "epoch": 1415} {"train_loss": -37.77272033691406, "global_step": 171264, "epoch": 1415} {"train_loss": -38.2713737487793, "global_step": 171265, "epoch": 1415} {"train_loss": -38.22677230834961, "global_step": 171266, "epoch": 1415} {"train_loss": -37.47504806518555, "global_step": 171267, "epoch": 1415} {"train_loss": -37.78986740112305, "global_step": 171268, "epoch": 1415} {"train_loss": -36.85111999511719, "global_step": 171269, "epoch": 1415} {"train_loss": -38.0041389465332, "global_step": 171270, "epoch": 1415} {"train_loss": -38.011512756347656, "global_step": 171271, "epoch": 1415} {"train_loss": -37.88637161254883, "global_step": 171272, "epoch": 1415} {"train_loss": -38.15544128417969, "global_step": 171273, "epoch": 1415} {"train_loss": -38.28461837768555, "global_step": 171274, "epoch": 1415} {"train_loss": -37.461280822753906, "global_step": 171275, "epoch": 1415} {"train_loss": -38.796817779541016, "global_step": 171276, "epoch": 1415} {"train_loss": -37.769649505615234, "global_step": 171277, "epoch": 1415} {"train_loss": -38.4703483581543, "global_step": 171278, "epoch": 1415} {"train_loss": -38.9351692199707, "global_step": 171279, "epoch": 1415} {"train_loss": -38.33389663696289, "global_step": 171280, "epoch": 1415} {"train_loss": -39.137718200683594, "global_step": 171281, "epoch": 1415} {"train_loss": -38.96946334838867, "global_step": 171282, "epoch": 1415} {"train_loss": -38.37507247924805, "global_step": 171283, "epoch": 1415} {"train_loss": -39.25395965576172, "global_step": 171284, "epoch": 1415} {"train_loss": -38.180606842041016, "global_step": 171285, "epoch": 1415} {"train_loss": -38.92836380004883, "global_step": 171286, "epoch": 1415} {"train_loss": -38.75698471069336, "global_step": 171287, "epoch": 1415} {"train_loss": -38.84700012207031, "global_step": 171288, "epoch": 1415} {"train_loss": -38.34315872192383, "global_step": 171289, "epoch": 1415} {"train_loss": -39.373435974121094, "global_step": 171290, "epoch": 1415} {"train_loss": -38.79895782470703, "global_step": 171291, "epoch": 1415} {"train_loss": -39.598670959472656, "global_step": 171292, "epoch": 1415} {"train_loss": -39.57564926147461, "global_step": 171293, "epoch": 1415} {"train_loss": -39.430870056152344, "global_step": 171294, "epoch": 1415} {"train_loss": -39.14824676513672, "global_step": 171295, "epoch": 1415} {"train_loss": -39.481903076171875, "global_step": 171296, "epoch": 1415} {"train_loss": -39.80308151245117, "global_step": 171297, "epoch": 1415} {"train_loss": -39.00806427001953, "global_step": 171298, "epoch": 1415} {"train_loss": -39.235511779785156, "global_step": 171299, "epoch": 1415} {"train_loss": -39.396358489990234, "global_step": 171300, "epoch": 1415} {"train_loss": -39.708961486816406, "global_step": 171301, "epoch": 1415} {"train_loss": -39.80939865112305, "global_step": 171302, "epoch": 1415} {"train_loss": -39.87255096435547, "global_step": 171303, "epoch": 1415} {"train_loss": -39.23166275024414, "global_step": 171304, "epoch": 1415} {"train_loss": -39.93777084350586, "global_step": 171305, "epoch": 1415} {"train_loss": -38.69218063354492, "global_step": 171306, "epoch": 1415} {"train_loss": -39.689273834228516, "global_step": 171307, "epoch": 1415} {"train_loss": -39.489540100097656, "global_step": 171308, "epoch": 1415} {"train_loss": -39.70580291748047, "global_step": 171309, "epoch": 1415} {"train_loss": -40.06819152832031, "global_step": 171310, "epoch": 1415} {"train_loss": -39.717464447021484, "global_step": 171311, "epoch": 1415} {"train_loss": -39.75431442260742, "global_step": 171312, "epoch": 1415} {"train_loss": -40.01913070678711, "global_step": 171313, "epoch": 1415} {"train_loss": -39.91376495361328, "global_step": 171314, "epoch": 1415} {"train_loss": -40.10723876953125, "global_step": 171315, "epoch": 1415} {"train_loss": -39.82456588745117, "global_step": 171316, "epoch": 1415} {"train_loss": -40.21187973022461, "global_step": 171317, "epoch": 1415} {"train_loss": -40.3568229675293, "global_step": 171318, "epoch": 1415} {"train_loss": -40.1885871887207, "global_step": 171319, "epoch": 1415} {"train_loss": -40.10476303100586, "global_step": 171320, "epoch": 1415} {"train_loss": -40.20668029785156, "global_step": 171321, "epoch": 1415} {"train_loss": -40.08286666870117, "global_step": 171322, "epoch": 1415} {"train_loss": -39.92674255371094, "global_step": 171323, "epoch": 1415} {"train_loss": -40.489986419677734, "global_step": 171324, "epoch": 1415} {"train_loss": -40.526641845703125, "global_step": 171325, "epoch": 1415} {"train_loss": -40.61106491088867, "global_step": 171326, "epoch": 1415} {"train_loss": -39.62270736694336, "global_step": 171327, "epoch": 1415} {"train_loss": -40.26068115234375, "global_step": 171328, "epoch": 1415} {"train_loss": -40.717491149902344, "global_step": 171329, "epoch": 1415} {"train_loss": -40.6309700012207, "global_step": 171330, "epoch": 1415} {"train_loss": -39.47788619995117, "global_step": 171331, "epoch": 1415} {"train_loss": -40.68095016479492, "global_step": 171332, "epoch": 1415} {"train_loss": -40.4905891418457, "global_step": 171333, "epoch": 1415} {"train_loss": -40.35970687866211, "global_step": 171334, "epoch": 1415} {"train_loss": -37.2923870204894, "global_step": 171335, "epoch": 1415, "val_loss": 2875914.75} {"train_loss": -40.41340255737305, "global_step": 171336, "epoch": 1416} {"train_loss": -40.374759674072266, "global_step": 171337, "epoch": 1416} {"train_loss": -40.388465881347656, "global_step": 171338, "epoch": 1416} {"train_loss": -40.65065383911133, "global_step": 171339, "epoch": 1416} {"train_loss": -40.72880172729492, "global_step": 171340, "epoch": 1416} {"train_loss": -40.88704299926758, "global_step": 171341, "epoch": 1416} {"train_loss": -40.44899368286133, "global_step": 171342, "epoch": 1416} {"train_loss": -40.52081298828125, "global_step": 171343, "epoch": 1416} {"train_loss": -40.9379768371582, "global_step": 171344, "epoch": 1416} {"train_loss": -41.064449310302734, "global_step": 171345, "epoch": 1416} {"train_loss": -41.02846908569336, "global_step": 171346, "epoch": 1416} {"train_loss": -40.702518463134766, "global_step": 171347, "epoch": 1416} {"train_loss": -40.710060119628906, "global_step": 171348, "epoch": 1416} {"train_loss": -40.512939453125, "global_step": 171349, "epoch": 1416} {"train_loss": -40.97768783569336, "global_step": 171350, "epoch": 1416} {"train_loss": -41.075653076171875, "global_step": 171351, "epoch": 1416} {"train_loss": -40.88303756713867, "global_step": 171352, "epoch": 1416} {"train_loss": -40.83161544799805, "global_step": 171353, "epoch": 1416} {"train_loss": -41.10700607299805, "global_step": 171354, "epoch": 1416} {"train_loss": -40.62388229370117, "global_step": 171355, "epoch": 1416} {"train_loss": -41.108009338378906, "global_step": 171356, "epoch": 1416} {"train_loss": -40.95173645019531, "global_step": 171357, "epoch": 1416} {"train_loss": -40.75434494018555, "global_step": 171358, "epoch": 1416} {"train_loss": -39.78384017944336, "global_step": 171359, "epoch": 1416} {"train_loss": -40.88897705078125, "global_step": 171360, "epoch": 1416} {"train_loss": -41.047725677490234, "global_step": 171361, "epoch": 1416} {"train_loss": -41.376319885253906, "global_step": 171362, "epoch": 1416} {"train_loss": -40.7470817565918, "global_step": 171363, "epoch": 1416} {"train_loss": -41.30070877075195, "global_step": 171364, "epoch": 1416} {"train_loss": -41.12494659423828, "global_step": 171365, "epoch": 1416} {"train_loss": -41.652156829833984, "global_step": 171366, "epoch": 1416} {"train_loss": -41.017738342285156, "global_step": 171367, "epoch": 1416} {"train_loss": -40.704124450683594, "global_step": 171368, "epoch": 1416} {"train_loss": -40.26810836791992, "global_step": 171369, "epoch": 1416} {"train_loss": -40.904510498046875, "global_step": 171370, "epoch": 1416} {"train_loss": -41.499488830566406, "global_step": 171371, "epoch": 1416} {"train_loss": -40.758522033691406, "global_step": 171372, "epoch": 1416} {"train_loss": -41.37492752075195, "global_step": 171373, "epoch": 1416} {"train_loss": -41.20528030395508, "global_step": 171374, "epoch": 1416} {"train_loss": -40.6303825378418, "global_step": 171375, "epoch": 1416} {"train_loss": -41.120758056640625, "global_step": 171376, "epoch": 1416} {"train_loss": -41.536739349365234, "global_step": 171377, "epoch": 1416} {"train_loss": -41.18880081176758, "global_step": 171378, "epoch": 1416} {"train_loss": -41.00476837158203, "global_step": 171379, "epoch": 1416} {"train_loss": -40.92699432373047, "global_step": 171380, "epoch": 1416} {"train_loss": -41.45396041870117, "global_step": 171381, "epoch": 1416} {"train_loss": -41.09341049194336, "global_step": 171382, "epoch": 1416} {"train_loss": -40.79487609863281, "global_step": 171383, "epoch": 1416} {"train_loss": -41.515594482421875, "global_step": 171384, "epoch": 1416} {"train_loss": -40.44194030761719, "global_step": 171385, "epoch": 1416} {"train_loss": -38.33169174194336, "global_step": 171386, "epoch": 1416} {"train_loss": -36.8901481628418, "global_step": 171387, "epoch": 1416} {"train_loss": -34.91719055175781, "global_step": 171388, "epoch": 1416} {"train_loss": -32.36583709716797, "global_step": 171389, "epoch": 1416} {"train_loss": -34.109375, "global_step": 171390, "epoch": 1416} {"train_loss": -33.410682678222656, "global_step": 171391, "epoch": 1416} {"train_loss": -24.79279899597168, "global_step": 171392, "epoch": 1416} {"train_loss": -27.608673095703125, "global_step": 171393, "epoch": 1416} {"train_loss": -36.363922119140625, "global_step": 171394, "epoch": 1416} {"train_loss": -38.78230667114258, "global_step": 171395, "epoch": 1416} {"train_loss": -34.19266891479492, "global_step": 171396, "epoch": 1416} {"train_loss": -37.69175338745117, "global_step": 171397, "epoch": 1416} {"train_loss": -33.424739837646484, "global_step": 171398, "epoch": 1416} {"train_loss": -35.062034606933594, "global_step": 171399, "epoch": 1416} {"train_loss": -37.11373519897461, "global_step": 171400, "epoch": 1416} {"train_loss": -33.72370529174805, "global_step": 171401, "epoch": 1416} {"train_loss": -38.75174331665039, "global_step": 171402, "epoch": 1416} {"train_loss": -34.76180648803711, "global_step": 171403, "epoch": 1416} {"train_loss": -38.69379425048828, "global_step": 171404, "epoch": 1416} {"train_loss": -37.22529220581055, "global_step": 171405, "epoch": 1416} {"train_loss": -39.04248809814453, "global_step": 171406, "epoch": 1416} {"train_loss": -37.436790466308594, "global_step": 171407, "epoch": 1416} {"train_loss": -39.58711242675781, "global_step": 171408, "epoch": 1416} {"train_loss": -36.73458480834961, "global_step": 171409, "epoch": 1416} {"train_loss": -39.755558013916016, "global_step": 171410, "epoch": 1416} {"train_loss": -38.458980560302734, "global_step": 171411, "epoch": 1416} {"train_loss": -39.550411224365234, "global_step": 171412, "epoch": 1416} {"train_loss": -38.69268798828125, "global_step": 171413, "epoch": 1416} {"train_loss": -38.46812057495117, "global_step": 171414, "epoch": 1416} {"train_loss": -39.42228698730469, "global_step": 171415, "epoch": 1416} {"train_loss": -38.381954193115234, "global_step": 171416, "epoch": 1416} {"train_loss": -39.88764190673828, "global_step": 171417, "epoch": 1416} {"train_loss": -39.68411636352539, "global_step": 171418, "epoch": 1416} {"train_loss": -39.42574691772461, "global_step": 171419, "epoch": 1416} {"train_loss": -40.230072021484375, "global_step": 171420, "epoch": 1416} {"train_loss": -39.6221809387207, "global_step": 171421, "epoch": 1416} {"train_loss": -39.87397766113281, "global_step": 171422, "epoch": 1416} {"train_loss": -39.64036178588867, "global_step": 171423, "epoch": 1416} {"train_loss": -39.702720642089844, "global_step": 171424, "epoch": 1416} {"train_loss": -39.379722595214844, "global_step": 171425, "epoch": 1416} {"train_loss": -40.108219146728516, "global_step": 171426, "epoch": 1416} {"train_loss": -40.53951644897461, "global_step": 171427, "epoch": 1416} {"train_loss": -40.06586456298828, "global_step": 171428, "epoch": 1416} {"train_loss": -40.71322250366211, "global_step": 171429, "epoch": 1416} {"train_loss": -40.33586502075195, "global_step": 171430, "epoch": 1416} {"train_loss": -40.093990325927734, "global_step": 171431, "epoch": 1416} {"train_loss": -40.52560043334961, "global_step": 171432, "epoch": 1416} {"train_loss": -40.75899887084961, "global_step": 171433, "epoch": 1416} {"train_loss": -40.01397705078125, "global_step": 171434, "epoch": 1416} {"train_loss": -40.484798431396484, "global_step": 171435, "epoch": 1416} {"train_loss": -40.68951416015625, "global_step": 171436, "epoch": 1416} {"train_loss": -39.58637619018555, "global_step": 171437, "epoch": 1416} {"train_loss": -40.6199836730957, "global_step": 171438, "epoch": 1416} {"train_loss": -40.25556945800781, "global_step": 171439, "epoch": 1416} {"train_loss": -40.49260330200195, "global_step": 171440, "epoch": 1416} {"train_loss": -40.65419387817383, "global_step": 171441, "epoch": 1416} {"train_loss": -40.83159255981445, "global_step": 171442, "epoch": 1416} {"train_loss": -40.794586181640625, "global_step": 171443, "epoch": 1416} {"train_loss": -40.73757553100586, "global_step": 171444, "epoch": 1416} {"train_loss": -41.013580322265625, "global_step": 171445, "epoch": 1416} {"train_loss": -40.3070182800293, "global_step": 171446, "epoch": 1416} {"train_loss": -40.842586517333984, "global_step": 171447, "epoch": 1416} {"train_loss": -40.53324508666992, "global_step": 171448, "epoch": 1416} {"train_loss": -40.61758041381836, "global_step": 171449, "epoch": 1416} {"train_loss": -40.55177688598633, "global_step": 171450, "epoch": 1416} {"train_loss": -40.963531494140625, "global_step": 171451, "epoch": 1416} {"train_loss": -41.049617767333984, "global_step": 171452, "epoch": 1416} {"train_loss": -40.70597457885742, "global_step": 171453, "epoch": 1416} {"train_loss": -40.983585357666016, "global_step": 171454, "epoch": 1416} {"train_loss": -41.10481643676758, "global_step": 171455, "epoch": 1416} {"train_loss": -39.541618741248264, "global_step": 171456, "epoch": 1416, "val_loss": 2737280.5} {"train_loss": -41.17805480957031, "global_step": 171457, "epoch": 1417} {"train_loss": -40.9534797668457, "global_step": 171458, "epoch": 1417} {"train_loss": -41.353309631347656, "global_step": 171459, "epoch": 1417} {"train_loss": -41.13777542114258, "global_step": 171460, "epoch": 1417} {"train_loss": -41.13043975830078, "global_step": 171461, "epoch": 1417} {"train_loss": -41.18687057495117, "global_step": 171462, "epoch": 1417} {"train_loss": -41.078125, "global_step": 171463, "epoch": 1417} {"train_loss": -40.7567024230957, "global_step": 171464, "epoch": 1417} {"train_loss": -41.41534423828125, "global_step": 171465, "epoch": 1417} {"train_loss": -40.88047409057617, "global_step": 171466, "epoch": 1417} {"train_loss": -41.281124114990234, "global_step": 171467, "epoch": 1417} {"train_loss": -41.50033950805664, "global_step": 171468, "epoch": 1417} {"train_loss": -41.44550704956055, "global_step": 171469, "epoch": 1417} {"train_loss": -41.27817916870117, "global_step": 171470, "epoch": 1417} {"train_loss": -41.12483596801758, "global_step": 171471, "epoch": 1417} {"train_loss": -41.83135986328125, "global_step": 171472, "epoch": 1417} {"train_loss": -41.620635986328125, "global_step": 171473, "epoch": 1417} {"train_loss": -41.203086853027344, "global_step": 171474, "epoch": 1417} {"train_loss": -41.771114349365234, "global_step": 171475, "epoch": 1417} {"train_loss": -41.203914642333984, "global_step": 171476, "epoch": 1417} {"train_loss": -41.24464797973633, "global_step": 171477, "epoch": 1417} {"train_loss": -41.457489013671875, "global_step": 171478, "epoch": 1417} {"train_loss": -41.0960578918457, "global_step": 171479, "epoch": 1417} {"train_loss": -41.87295150756836, "global_step": 171480, "epoch": 1417} {"train_loss": -41.69138717651367, "global_step": 171481, "epoch": 1417} {"train_loss": -41.673213958740234, "global_step": 171482, "epoch": 1417} {"train_loss": -41.26131820678711, "global_step": 171483, "epoch": 1417} {"train_loss": -41.29569625854492, "global_step": 171484, "epoch": 1417} {"train_loss": -39.4537353515625, "global_step": 171485, "epoch": 1417} {"train_loss": -40.0485725402832, "global_step": 171486, "epoch": 1417} {"train_loss": -40.45880889892578, "global_step": 171487, "epoch": 1417} {"train_loss": -40.388221740722656, "global_step": 171488, "epoch": 1417} {"train_loss": -41.59980392456055, "global_step": 171489, "epoch": 1417} {"train_loss": -41.55574417114258, "global_step": 171490, "epoch": 1417} {"train_loss": -39.953548431396484, "global_step": 171491, "epoch": 1417} {"train_loss": -39.09237289428711, "global_step": 171492, "epoch": 1417} {"train_loss": -41.19075393676758, "global_step": 171493, "epoch": 1417} {"train_loss": -41.70969772338867, "global_step": 171494, "epoch": 1417} {"train_loss": -40.71793746948242, "global_step": 171495, "epoch": 1417} {"train_loss": -41.16077423095703, "global_step": 171496, "epoch": 1417} {"train_loss": -40.72388458251953, "global_step": 171497, "epoch": 1417} {"train_loss": -40.45929718017578, "global_step": 171498, "epoch": 1417} {"train_loss": -40.86341094970703, "global_step": 171499, "epoch": 1417} {"train_loss": -41.504180908203125, "global_step": 171500, "epoch": 1417} {"train_loss": -41.08969497680664, "global_step": 171501, "epoch": 1417} {"train_loss": -40.90031433105469, "global_step": 171502, "epoch": 1417} {"train_loss": -42.14324951171875, "global_step": 171503, "epoch": 1417} {"train_loss": -41.09922409057617, "global_step": 171504, "epoch": 1417} {"train_loss": -41.17085647583008, "global_step": 171505, "epoch": 1417} {"train_loss": -41.77558517456055, "global_step": 171506, "epoch": 1417} {"train_loss": -40.69829177856445, "global_step": 171507, "epoch": 1417} {"train_loss": -39.51279830932617, "global_step": 171508, "epoch": 1417} {"train_loss": -39.478057861328125, "global_step": 171509, "epoch": 1417} {"train_loss": -41.10062789916992, "global_step": 171510, "epoch": 1417} {"train_loss": -40.488189697265625, "global_step": 171511, "epoch": 1417} {"train_loss": -41.27687454223633, "global_step": 171512, "epoch": 1417} {"train_loss": -41.85887145996094, "global_step": 171513, "epoch": 1417} {"train_loss": -40.842918395996094, "global_step": 171514, "epoch": 1417} {"train_loss": -40.7390022277832, "global_step": 171515, "epoch": 1417} {"train_loss": -40.235652923583984, "global_step": 171516, "epoch": 1417} {"train_loss": -40.456703186035156, "global_step": 171517, "epoch": 1417} {"train_loss": -41.629920959472656, "global_step": 171518, "epoch": 1417} {"train_loss": -40.34937286376953, "global_step": 171519, "epoch": 1417} {"train_loss": -39.9703254699707, "global_step": 171520, "epoch": 1417} {"train_loss": -40.56254577636719, "global_step": 171521, "epoch": 1417} {"train_loss": -41.44474411010742, "global_step": 171522, "epoch": 1417} {"train_loss": -41.690914154052734, "global_step": 171523, "epoch": 1417} {"train_loss": -40.640541076660156, "global_step": 171524, "epoch": 1417} {"train_loss": -39.818599700927734, "global_step": 171525, "epoch": 1417} {"train_loss": -40.1220703125, "global_step": 171526, "epoch": 1417} {"train_loss": -41.4070930480957, "global_step": 171527, "epoch": 1417} {"train_loss": -40.789852142333984, "global_step": 171528, "epoch": 1417} {"train_loss": -39.6571044921875, "global_step": 171529, "epoch": 1417} {"train_loss": -41.12907791137695, "global_step": 171530, "epoch": 1417} {"train_loss": -41.09248733520508, "global_step": 171531, "epoch": 1417} {"train_loss": -41.05527877807617, "global_step": 171532, "epoch": 1417} {"train_loss": -40.845699310302734, "global_step": 171533, "epoch": 1417} {"train_loss": -41.0205078125, "global_step": 171534, "epoch": 1417} {"train_loss": -39.88911437988281, "global_step": 171535, "epoch": 1417} {"train_loss": -41.000675201416016, "global_step": 171536, "epoch": 1417} {"train_loss": -40.89044952392578, "global_step": 171537, "epoch": 1417} {"train_loss": -41.14501953125, "global_step": 171538, "epoch": 1417} {"train_loss": -41.441402435302734, "global_step": 171539, "epoch": 1417} {"train_loss": -40.840065002441406, "global_step": 171540, "epoch": 1417} {"train_loss": -40.27906036376953, "global_step": 171541, "epoch": 1417} {"train_loss": -40.228538513183594, "global_step": 171542, "epoch": 1417} {"train_loss": -39.469642639160156, "global_step": 171543, "epoch": 1417} {"train_loss": -39.58982467651367, "global_step": 171544, "epoch": 1417} {"train_loss": -40.04157257080078, "global_step": 171545, "epoch": 1417} {"train_loss": -41.0986442565918, "global_step": 171546, "epoch": 1417} {"train_loss": -41.06265640258789, "global_step": 171547, "epoch": 1417} {"train_loss": -40.43850326538086, "global_step": 171548, "epoch": 1417} {"train_loss": -40.34522247314453, "global_step": 171549, "epoch": 1417} {"train_loss": -40.79096603393555, "global_step": 171550, "epoch": 1417} {"train_loss": -39.70170211791992, "global_step": 171551, "epoch": 1417} {"train_loss": -40.48600387573242, "global_step": 171552, "epoch": 1417} {"train_loss": -40.27407455444336, "global_step": 171553, "epoch": 1417} {"train_loss": -41.149024963378906, "global_step": 171554, "epoch": 1417} {"train_loss": -39.59130859375, "global_step": 171555, "epoch": 1417} {"train_loss": -38.723934173583984, "global_step": 171556, "epoch": 1417} {"train_loss": -41.822994232177734, "global_step": 171557, "epoch": 1417} {"train_loss": -39.21369171142578, "global_step": 171558, "epoch": 1417} {"train_loss": -40.47806930541992, "global_step": 171559, "epoch": 1417} {"train_loss": -41.39083480834961, "global_step": 171560, "epoch": 1417} {"train_loss": -39.24675369262695, "global_step": 171561, "epoch": 1417} {"train_loss": -35.421504974365234, "global_step": 171562, "epoch": 1417} {"train_loss": -32.178714752197266, "global_step": 171563, "epoch": 1417} {"train_loss": -38.44230651855469, "global_step": 171564, "epoch": 1417} {"train_loss": -39.41697311401367, "global_step": 171565, "epoch": 1417} {"train_loss": -35.212215423583984, "global_step": 171566, "epoch": 1417} {"train_loss": -34.44960403442383, "global_step": 171567, "epoch": 1417} {"train_loss": -29.5364933013916, "global_step": 171568, "epoch": 1417} {"train_loss": -22.290237426757812, "global_step": 171569, "epoch": 1417} {"train_loss": -34.522483825683594, "global_step": 171570, "epoch": 1417} {"train_loss": -34.83865737915039, "global_step": 171571, "epoch": 1417} {"train_loss": -36.84006881713867, "global_step": 171572, "epoch": 1417} {"train_loss": -35.00472640991211, "global_step": 171573, "epoch": 1417} {"train_loss": -38.02223587036133, "global_step": 171574, "epoch": 1417} {"train_loss": -32.25666046142578, "global_step": 171575, "epoch": 1417} {"train_loss": -36.150814056396484, "global_step": 171576, "epoch": 1417} {"train_loss": -39.9738407450274, "global_step": 171577, "epoch": 1417, "val_loss": 2902110.25} {"train_loss": -34.683021545410156, "global_step": 171578, "epoch": 1418} {"train_loss": -36.01258850097656, "global_step": 171579, "epoch": 1418} {"train_loss": -35.06119918823242, "global_step": 171580, "epoch": 1418} {"train_loss": -35.94038391113281, "global_step": 171581, "epoch": 1418} {"train_loss": -36.74137496948242, "global_step": 171582, "epoch": 1418} {"train_loss": -32.91925048828125, "global_step": 171583, "epoch": 1418} {"train_loss": -25.477296829223633, "global_step": 171584, "epoch": 1418} {"train_loss": -35.052589416503906, "global_step": 171585, "epoch": 1418} {"train_loss": -36.953651428222656, "global_step": 171586, "epoch": 1418} {"train_loss": -37.6065673828125, "global_step": 171587, "epoch": 1418} {"train_loss": -36.88966751098633, "global_step": 171588, "epoch": 1418} {"train_loss": -37.54656982421875, "global_step": 171589, "epoch": 1418} {"train_loss": -37.14448165893555, "global_step": 171590, "epoch": 1418} {"train_loss": -38.317813873291016, "global_step": 171591, "epoch": 1418} {"train_loss": -36.85988235473633, "global_step": 171592, "epoch": 1418} {"train_loss": -37.094032287597656, "global_step": 171593, "epoch": 1418} {"train_loss": -36.45740509033203, "global_step": 171594, "epoch": 1418} {"train_loss": -36.1983757019043, "global_step": 171595, "epoch": 1418} {"train_loss": -38.53133773803711, "global_step": 171596, "epoch": 1418} {"train_loss": -38.258113861083984, "global_step": 171597, "epoch": 1418} {"train_loss": -37.94973373413086, "global_step": 171598, "epoch": 1418} {"train_loss": -33.424591064453125, "global_step": 171599, "epoch": 1418} {"train_loss": -37.93662643432617, "global_step": 171600, "epoch": 1418} {"train_loss": -38.7542610168457, "global_step": 171601, "epoch": 1418} {"train_loss": -38.55806350708008, "global_step": 171602, "epoch": 1418} {"train_loss": -38.074344635009766, "global_step": 171603, "epoch": 1418} {"train_loss": -38.065162658691406, "global_step": 171604, "epoch": 1418} {"train_loss": -37.552528381347656, "global_step": 171605, "epoch": 1418} {"train_loss": -37.48186111450195, "global_step": 171606, "epoch": 1418} {"train_loss": -38.356319427490234, "global_step": 171607, "epoch": 1418} {"train_loss": -37.92878341674805, "global_step": 171608, "epoch": 1418} {"train_loss": -38.875850677490234, "global_step": 171609, "epoch": 1418} {"train_loss": -38.55181884765625, "global_step": 171610, "epoch": 1418} {"train_loss": -38.911983489990234, "global_step": 171611, "epoch": 1418} {"train_loss": -37.30706787109375, "global_step": 171612, "epoch": 1418} {"train_loss": -38.35329818725586, "global_step": 171613, "epoch": 1418} {"train_loss": -38.84822463989258, "global_step": 171614, "epoch": 1418} {"train_loss": -38.98427963256836, "global_step": 171615, "epoch": 1418} {"train_loss": -38.744476318359375, "global_step": 171616, "epoch": 1418} {"train_loss": -38.38092041015625, "global_step": 171617, "epoch": 1418} {"train_loss": -39.21985626220703, "global_step": 171618, "epoch": 1418} {"train_loss": -37.947113037109375, "global_step": 171619, "epoch": 1418} {"train_loss": -39.452816009521484, "global_step": 171620, "epoch": 1418} {"train_loss": -38.75815963745117, "global_step": 171621, "epoch": 1418} {"train_loss": -39.01060104370117, "global_step": 171622, "epoch": 1418} {"train_loss": -38.78034591674805, "global_step": 171623, "epoch": 1418} {"train_loss": -38.9920539855957, "global_step": 171624, "epoch": 1418} {"train_loss": -39.02801513671875, "global_step": 171625, "epoch": 1418} {"train_loss": -39.33003616333008, "global_step": 171626, "epoch": 1418} {"train_loss": -39.675445556640625, "global_step": 171627, "epoch": 1418} {"train_loss": -39.57037353515625, "global_step": 171628, "epoch": 1418} {"train_loss": -39.87577438354492, "global_step": 171629, "epoch": 1418} {"train_loss": -39.8464469909668, "global_step": 171630, "epoch": 1418} {"train_loss": -39.95316696166992, "global_step": 171631, "epoch": 1418} {"train_loss": -40.105865478515625, "global_step": 171632, "epoch": 1418} {"train_loss": -40.235809326171875, "global_step": 171633, "epoch": 1418} {"train_loss": -39.79842758178711, "global_step": 171634, "epoch": 1418} {"train_loss": -39.11396408081055, "global_step": 171635, "epoch": 1418} {"train_loss": -39.53525924682617, "global_step": 171636, "epoch": 1418} {"train_loss": -40.29130172729492, "global_step": 171637, "epoch": 1418} {"train_loss": -39.41414260864258, "global_step": 171638, "epoch": 1418} {"train_loss": -39.80318832397461, "global_step": 171639, "epoch": 1418} {"train_loss": -39.583438873291016, "global_step": 171640, "epoch": 1418} {"train_loss": -39.61763381958008, "global_step": 171641, "epoch": 1418} {"train_loss": -39.873497009277344, "global_step": 171642, "epoch": 1418} {"train_loss": -40.0001335144043, "global_step": 171643, "epoch": 1418} {"train_loss": -40.03220748901367, "global_step": 171644, "epoch": 1418} {"train_loss": -40.29469299316406, "global_step": 171645, "epoch": 1418} {"train_loss": -40.807552337646484, "global_step": 171646, "epoch": 1418} {"train_loss": -40.662841796875, "global_step": 171647, "epoch": 1418} {"train_loss": -40.37598419189453, "global_step": 171648, "epoch": 1418} {"train_loss": -39.22930908203125, "global_step": 171649, "epoch": 1418} {"train_loss": -40.450279235839844, "global_step": 171650, "epoch": 1418} {"train_loss": -40.70886993408203, "global_step": 171651, "epoch": 1418} {"train_loss": -40.742698669433594, "global_step": 171652, "epoch": 1418} {"train_loss": -40.57497024536133, "global_step": 171653, "epoch": 1418} {"train_loss": -40.813079833984375, "global_step": 171654, "epoch": 1418} {"train_loss": -40.64643096923828, "global_step": 171655, "epoch": 1418} {"train_loss": -40.58485794067383, "global_step": 171656, "epoch": 1418} {"train_loss": -40.7687873840332, "global_step": 171657, "epoch": 1418} {"train_loss": -40.742671966552734, "global_step": 171658, "epoch": 1418} {"train_loss": -40.83455276489258, "global_step": 171659, "epoch": 1418} {"train_loss": -40.916053771972656, "global_step": 171660, "epoch": 1418} {"train_loss": -40.77753829956055, "global_step": 171661, "epoch": 1418} {"train_loss": -39.3935432434082, "global_step": 171662, "epoch": 1418} {"train_loss": -40.5069580078125, "global_step": 171663, "epoch": 1418} {"train_loss": -39.64020919799805, "global_step": 171664, "epoch": 1418} {"train_loss": -40.85866928100586, "global_step": 171665, "epoch": 1418} {"train_loss": -40.74520492553711, "global_step": 171666, "epoch": 1418} {"train_loss": -41.06797790527344, "global_step": 171667, "epoch": 1418} {"train_loss": -40.79502487182617, "global_step": 171668, "epoch": 1418} {"train_loss": -41.28184127807617, "global_step": 171669, "epoch": 1418} {"train_loss": -40.78330612182617, "global_step": 171670, "epoch": 1418} {"train_loss": -40.719581604003906, "global_step": 171671, "epoch": 1418} {"train_loss": -41.141021728515625, "global_step": 171672, "epoch": 1418} {"train_loss": -40.94411849975586, "global_step": 171673, "epoch": 1418} {"train_loss": -40.88446044921875, "global_step": 171674, "epoch": 1418} {"train_loss": -40.80695724487305, "global_step": 171675, "epoch": 1418} {"train_loss": -41.3319091796875, "global_step": 171676, "epoch": 1418} {"train_loss": -41.306373596191406, "global_step": 171677, "epoch": 1418} {"train_loss": -40.78009033203125, "global_step": 171678, "epoch": 1418} {"train_loss": -40.59157943725586, "global_step": 171679, "epoch": 1418} {"train_loss": -39.5279655456543, "global_step": 171680, "epoch": 1418} {"train_loss": -40.96920394897461, "global_step": 171681, "epoch": 1418} {"train_loss": -41.20412063598633, "global_step": 171682, "epoch": 1418} {"train_loss": -41.18404769897461, "global_step": 171683, "epoch": 1418} {"train_loss": -40.56010055541992, "global_step": 171684, "epoch": 1418} {"train_loss": -40.818904876708984, "global_step": 171685, "epoch": 1418} {"train_loss": -41.2525520324707, "global_step": 171686, "epoch": 1418} {"train_loss": -41.40966033935547, "global_step": 171687, "epoch": 1418} {"train_loss": -40.59745407104492, "global_step": 171688, "epoch": 1418} {"train_loss": -40.21452713012695, "global_step": 171689, "epoch": 1418} {"train_loss": -40.93121337890625, "global_step": 171690, "epoch": 1418} {"train_loss": -40.641693115234375, "global_step": 171691, "epoch": 1418} {"train_loss": -40.5513916015625, "global_step": 171692, "epoch": 1418} {"train_loss": -40.95978927612305, "global_step": 171693, "epoch": 1418} {"train_loss": -40.915645599365234, "global_step": 171694, "epoch": 1418} {"train_loss": -40.857154846191406, "global_step": 171695, "epoch": 1418} {"train_loss": -41.21647644042969, "global_step": 171696, "epoch": 1418} {"train_loss": -41.16175079345703, "global_step": 171697, "epoch": 1418} {"train_loss": -39.23430915706414, "global_step": 171698, "epoch": 1418, "val_loss": 2839311.0} {"train_loss": -41.22509765625, "global_step": 171699, "epoch": 1419} {"train_loss": -40.275306701660156, "global_step": 171700, "epoch": 1419} {"train_loss": -40.82674789428711, "global_step": 171701, "epoch": 1419} {"train_loss": -40.18213653564453, "global_step": 171702, "epoch": 1419} {"train_loss": -39.394622802734375, "global_step": 171703, "epoch": 1419} {"train_loss": -38.179664611816406, "global_step": 171704, "epoch": 1419} {"train_loss": -35.91725158691406, "global_step": 171705, "epoch": 1419} {"train_loss": -29.864154815673828, "global_step": 171706, "epoch": 1419} {"train_loss": -21.97677993774414, "global_step": 171707, "epoch": 1419} {"train_loss": -19.034334182739258, "global_step": 171708, "epoch": 1419} {"train_loss": -36.37357711791992, "global_step": 171709, "epoch": 1419} {"train_loss": -29.514190673828125, "global_step": 171710, "epoch": 1419} {"train_loss": -25.420862197875977, "global_step": 171711, "epoch": 1419} {"train_loss": -39.92205810546875, "global_step": 171712, "epoch": 1419} {"train_loss": -26.176483154296875, "global_step": 171713, "epoch": 1419} {"train_loss": -38.4139518737793, "global_step": 171714, "epoch": 1419} {"train_loss": -32.39923858642578, "global_step": 171715, "epoch": 1419} {"train_loss": -38.19461441040039, "global_step": 171716, "epoch": 1419} {"train_loss": -31.361364364624023, "global_step": 171717, "epoch": 1419} {"train_loss": -38.3321647644043, "global_step": 171718, "epoch": 1419} {"train_loss": -32.601497650146484, "global_step": 171719, "epoch": 1419} {"train_loss": -36.1513786315918, "global_step": 171720, "epoch": 1419} {"train_loss": -35.44861602783203, "global_step": 171721, "epoch": 1419} {"train_loss": -33.72407150268555, "global_step": 171722, "epoch": 1419} {"train_loss": -37.63179397583008, "global_step": 171723, "epoch": 1419} {"train_loss": -37.48759460449219, "global_step": 171724, "epoch": 1419} {"train_loss": -36.88499450683594, "global_step": 171725, "epoch": 1419} {"train_loss": -39.07495880126953, "global_step": 171726, "epoch": 1419} {"train_loss": -37.54731369018555, "global_step": 171727, "epoch": 1419} {"train_loss": -37.73417663574219, "global_step": 171728, "epoch": 1419} {"train_loss": -38.19873046875, "global_step": 171729, "epoch": 1419} {"train_loss": -37.74568557739258, "global_step": 171730, "epoch": 1419} {"train_loss": -38.027523040771484, "global_step": 171731, "epoch": 1419} {"train_loss": -39.41368103027344, "global_step": 171732, "epoch": 1419} {"train_loss": -38.515907287597656, "global_step": 171733, "epoch": 1419} {"train_loss": -38.57289505004883, "global_step": 171734, "epoch": 1419} {"train_loss": -38.761131286621094, "global_step": 171735, "epoch": 1419} {"train_loss": -39.0145149230957, "global_step": 171736, "epoch": 1419} {"train_loss": -36.140560150146484, "global_step": 171737, "epoch": 1419} {"train_loss": -37.21343994140625, "global_step": 171738, "epoch": 1419} {"train_loss": -38.41915512084961, "global_step": 171739, "epoch": 1419} {"train_loss": -39.157997131347656, "global_step": 171740, "epoch": 1419} {"train_loss": -39.06150436401367, "global_step": 171741, "epoch": 1419} {"train_loss": -39.762508392333984, "global_step": 171742, "epoch": 1419} {"train_loss": -39.495094299316406, "global_step": 171743, "epoch": 1419} {"train_loss": -39.503414154052734, "global_step": 171744, "epoch": 1419} {"train_loss": -39.875484466552734, "global_step": 171745, "epoch": 1419} {"train_loss": -39.85418701171875, "global_step": 171746, "epoch": 1419} {"train_loss": -39.91102981567383, "global_step": 171747, "epoch": 1419} {"train_loss": -39.72602844238281, "global_step": 171748, "epoch": 1419} {"train_loss": -40.18638229370117, "global_step": 171749, "epoch": 1419} {"train_loss": -40.19319152832031, "global_step": 171750, "epoch": 1419} {"train_loss": -39.931800842285156, "global_step": 171751, "epoch": 1419} {"train_loss": -40.367794036865234, "global_step": 171752, "epoch": 1419} {"train_loss": -40.17900085449219, "global_step": 171753, "epoch": 1419} {"train_loss": -40.1834716796875, "global_step": 171754, "epoch": 1419} {"train_loss": -40.327423095703125, "global_step": 171755, "epoch": 1419} {"train_loss": -40.37849044799805, "global_step": 171756, "epoch": 1419} {"train_loss": -39.891780853271484, "global_step": 171757, "epoch": 1419} {"train_loss": -40.20132064819336, "global_step": 171758, "epoch": 1419} {"train_loss": -40.56282424926758, "global_step": 171759, "epoch": 1419} {"train_loss": -40.6097526550293, "global_step": 171760, "epoch": 1419} {"train_loss": -40.5120964050293, "global_step": 171761, "epoch": 1419} {"train_loss": -40.602943420410156, "global_step": 171762, "epoch": 1419} {"train_loss": -40.72672653198242, "global_step": 171763, "epoch": 1419} {"train_loss": -40.47602081298828, "global_step": 171764, "epoch": 1419} {"train_loss": -40.602108001708984, "global_step": 171765, "epoch": 1419} {"train_loss": -40.58469772338867, "global_step": 171766, "epoch": 1419} {"train_loss": -40.580841064453125, "global_step": 171767, "epoch": 1419} {"train_loss": -40.73189163208008, "global_step": 171768, "epoch": 1419} {"train_loss": -41.15255355834961, "global_step": 171769, "epoch": 1419} {"train_loss": -40.871856689453125, "global_step": 171770, "epoch": 1419} {"train_loss": -41.03768539428711, "global_step": 171771, "epoch": 1419} {"train_loss": -40.9832763671875, "global_step": 171772, "epoch": 1419} {"train_loss": -41.06967544555664, "global_step": 171773, "epoch": 1419} {"train_loss": -40.865962982177734, "global_step": 171774, "epoch": 1419} {"train_loss": -40.99544906616211, "global_step": 171775, "epoch": 1419} {"train_loss": -41.21428298950195, "global_step": 171776, "epoch": 1419} {"train_loss": -41.18186569213867, "global_step": 171777, "epoch": 1419} {"train_loss": -41.208221435546875, "global_step": 171778, "epoch": 1419} {"train_loss": -41.45558547973633, "global_step": 171779, "epoch": 1419} {"train_loss": -41.360050201416016, "global_step": 171780, "epoch": 1419} {"train_loss": -41.15068435668945, "global_step": 171781, "epoch": 1419} {"train_loss": -40.834529876708984, "global_step": 171782, "epoch": 1419} {"train_loss": -41.49508285522461, "global_step": 171783, "epoch": 1419} {"train_loss": -40.91086959838867, "global_step": 171784, "epoch": 1419} {"train_loss": -40.959651947021484, "global_step": 171785, "epoch": 1419} {"train_loss": -41.06699752807617, "global_step": 171786, "epoch": 1419} {"train_loss": -40.90528106689453, "global_step": 171787, "epoch": 1419} {"train_loss": -40.26278305053711, "global_step": 171788, "epoch": 1419} {"train_loss": -41.04560089111328, "global_step": 171789, "epoch": 1419} {"train_loss": -40.88468551635742, "global_step": 171790, "epoch": 1419} {"train_loss": -40.445838928222656, "global_step": 171791, "epoch": 1419} {"train_loss": -41.35085678100586, "global_step": 171792, "epoch": 1419} {"train_loss": -41.168487548828125, "global_step": 171793, "epoch": 1419} {"train_loss": -40.57548904418945, "global_step": 171794, "epoch": 1419} {"train_loss": -41.5317268371582, "global_step": 171795, "epoch": 1419} {"train_loss": -41.289493560791016, "global_step": 171796, "epoch": 1419} {"train_loss": -40.62846374511719, "global_step": 171797, "epoch": 1419} {"train_loss": -41.19401168823242, "global_step": 171798, "epoch": 1419} {"train_loss": -41.55573654174805, "global_step": 171799, "epoch": 1419} {"train_loss": -41.26062774658203, "global_step": 171800, "epoch": 1419} {"train_loss": -41.17820358276367, "global_step": 171801, "epoch": 1419} {"train_loss": -40.860450744628906, "global_step": 171802, "epoch": 1419} {"train_loss": -41.0598258972168, "global_step": 171803, "epoch": 1419} {"train_loss": -41.328704833984375, "global_step": 171804, "epoch": 1419} {"train_loss": -41.240989685058594, "global_step": 171805, "epoch": 1419} {"train_loss": -40.932525634765625, "global_step": 171806, "epoch": 1419} {"train_loss": -41.2398567199707, "global_step": 171807, "epoch": 1419} {"train_loss": -40.653072357177734, "global_step": 171808, "epoch": 1419} {"train_loss": -40.0328254699707, "global_step": 171809, "epoch": 1419} {"train_loss": -40.947837829589844, "global_step": 171810, "epoch": 1419} {"train_loss": -41.651485443115234, "global_step": 171811, "epoch": 1419} {"train_loss": -41.591426849365234, "global_step": 171812, "epoch": 1419} {"train_loss": -40.3726921081543, "global_step": 171813, "epoch": 1419} {"train_loss": -40.21615219116211, "global_step": 171814, "epoch": 1419} {"train_loss": -39.86438751220703, "global_step": 171815, "epoch": 1419} {"train_loss": -39.06278991699219, "global_step": 171816, "epoch": 1419} {"train_loss": -41.08174133300781, "global_step": 171817, "epoch": 1419} {"train_loss": -40.930118560791016, "global_step": 171818, "epoch": 1419} {"train_loss": -39.014389621324774, "global_step": 171819, "epoch": 1419, "val_loss": 2775460.25} {"train_loss": -40.00967025756836, "global_step": 171820, "epoch": 1420} {"train_loss": -40.066436767578125, "global_step": 171821, "epoch": 1420} {"train_loss": -40.654510498046875, "global_step": 171822, "epoch": 1420} {"train_loss": -40.71091842651367, "global_step": 171823, "epoch": 1420} {"train_loss": -40.34470748901367, "global_step": 171824, "epoch": 1420} {"train_loss": -40.801292419433594, "global_step": 171825, "epoch": 1420} {"train_loss": -40.027462005615234, "global_step": 171826, "epoch": 1420} {"train_loss": -39.718379974365234, "global_step": 171827, "epoch": 1420} {"train_loss": -39.36220932006836, "global_step": 171828, "epoch": 1420} {"train_loss": -39.928497314453125, "global_step": 171829, "epoch": 1420} {"train_loss": -40.32590866088867, "global_step": 171830, "epoch": 1420} {"train_loss": -40.79403305053711, "global_step": 171831, "epoch": 1420} {"train_loss": -40.17923355102539, "global_step": 171832, "epoch": 1420} {"train_loss": -40.21895217895508, "global_step": 171833, "epoch": 1420} {"train_loss": -40.46559143066406, "global_step": 171834, "epoch": 1420} {"train_loss": -39.4875373840332, "global_step": 171835, "epoch": 1420} {"train_loss": -38.49699020385742, "global_step": 171836, "epoch": 1420} {"train_loss": -41.050697326660156, "global_step": 171837, "epoch": 1420} {"train_loss": -38.028480529785156, "global_step": 171838, "epoch": 1420} {"train_loss": -37.68624496459961, "global_step": 171839, "epoch": 1420} {"train_loss": -40.573463439941406, "global_step": 171840, "epoch": 1420} {"train_loss": -39.20328903198242, "global_step": 171841, "epoch": 1420} {"train_loss": -39.084896087646484, "global_step": 171842, "epoch": 1420} {"train_loss": -38.91158676147461, "global_step": 171843, "epoch": 1420} {"train_loss": -40.10688018798828, "global_step": 171844, "epoch": 1420} {"train_loss": -39.07143020629883, "global_step": 171845, "epoch": 1420} {"train_loss": -38.9346923828125, "global_step": 171846, "epoch": 1420} {"train_loss": -40.01757049560547, "global_step": 171847, "epoch": 1420} {"train_loss": -39.32056427001953, "global_step": 171848, "epoch": 1420} {"train_loss": -40.21090316772461, "global_step": 171849, "epoch": 1420} {"train_loss": -38.84286117553711, "global_step": 171850, "epoch": 1420} {"train_loss": -38.94504928588867, "global_step": 171851, "epoch": 1420} {"train_loss": -40.58654022216797, "global_step": 171852, "epoch": 1420} {"train_loss": -40.57285690307617, "global_step": 171853, "epoch": 1420} {"train_loss": -39.10418701171875, "global_step": 171854, "epoch": 1420} {"train_loss": -39.78955078125, "global_step": 171855, "epoch": 1420} {"train_loss": -40.68626022338867, "global_step": 171856, "epoch": 1420} {"train_loss": -40.30532455444336, "global_step": 171857, "epoch": 1420} {"train_loss": -39.93740463256836, "global_step": 171858, "epoch": 1420} {"train_loss": -40.6930046081543, "global_step": 171859, "epoch": 1420} {"train_loss": -40.884437561035156, "global_step": 171860, "epoch": 1420} {"train_loss": -40.4563102722168, "global_step": 171861, "epoch": 1420} {"train_loss": -40.62845230102539, "global_step": 171862, "epoch": 1420} {"train_loss": -41.23554992675781, "global_step": 171863, "epoch": 1420} {"train_loss": -40.786346435546875, "global_step": 171864, "epoch": 1420} {"train_loss": -41.26754379272461, "global_step": 171865, "epoch": 1420} {"train_loss": -40.48517608642578, "global_step": 171866, "epoch": 1420} {"train_loss": -40.61394119262695, "global_step": 171867, "epoch": 1420} {"train_loss": -41.597381591796875, "global_step": 171868, "epoch": 1420} {"train_loss": -40.744686126708984, "global_step": 171869, "epoch": 1420} {"train_loss": -41.2821159362793, "global_step": 171870, "epoch": 1420} {"train_loss": -40.71381378173828, "global_step": 171871, "epoch": 1420} {"train_loss": -41.05581283569336, "global_step": 171872, "epoch": 1420} {"train_loss": -41.28144454956055, "global_step": 171873, "epoch": 1420} {"train_loss": -40.496307373046875, "global_step": 171874, "epoch": 1420} {"train_loss": -40.787841796875, "global_step": 171875, "epoch": 1420} {"train_loss": -41.332763671875, "global_step": 171876, "epoch": 1420} {"train_loss": -41.47532272338867, "global_step": 171877, "epoch": 1420} {"train_loss": -41.2866325378418, "global_step": 171878, "epoch": 1420} {"train_loss": -41.22055435180664, "global_step": 171879, "epoch": 1420} {"train_loss": -41.32827377319336, "global_step": 171880, "epoch": 1420} {"train_loss": -40.84455490112305, "global_step": 171881, "epoch": 1420} {"train_loss": -41.28028106689453, "global_step": 171882, "epoch": 1420} {"train_loss": -41.577186584472656, "global_step": 171883, "epoch": 1420} {"train_loss": -40.892852783203125, "global_step": 171884, "epoch": 1420} {"train_loss": -41.049476623535156, "global_step": 171885, "epoch": 1420} {"train_loss": -41.572845458984375, "global_step": 171886, "epoch": 1420} {"train_loss": -41.35916519165039, "global_step": 171887, "epoch": 1420} {"train_loss": -41.47209930419922, "global_step": 171888, "epoch": 1420} {"train_loss": -41.50947952270508, "global_step": 171889, "epoch": 1420} {"train_loss": -41.815582275390625, "global_step": 171890, "epoch": 1420} {"train_loss": -41.494354248046875, "global_step": 171891, "epoch": 1420} {"train_loss": -41.849945068359375, "global_step": 171892, "epoch": 1420} {"train_loss": -41.77008819580078, "global_step": 171893, "epoch": 1420} {"train_loss": -41.70277786254883, "global_step": 171894, "epoch": 1420} {"train_loss": -41.72018051147461, "global_step": 171895, "epoch": 1420} {"train_loss": -41.66250228881836, "global_step": 171896, "epoch": 1420} {"train_loss": -41.5518798828125, "global_step": 171897, "epoch": 1420} {"train_loss": -41.82623291015625, "global_step": 171898, "epoch": 1420} {"train_loss": -42.00759506225586, "global_step": 171899, "epoch": 1420} {"train_loss": -41.52128982543945, "global_step": 171900, "epoch": 1420} {"train_loss": -41.2535514831543, "global_step": 171901, "epoch": 1420} {"train_loss": -41.966548919677734, "global_step": 171902, "epoch": 1420} {"train_loss": -41.85818862915039, "global_step": 171903, "epoch": 1420} {"train_loss": -41.56330108642578, "global_step": 171904, "epoch": 1420} {"train_loss": -40.48592758178711, "global_step": 171905, "epoch": 1420} {"train_loss": -40.379878997802734, "global_step": 171906, "epoch": 1420} {"train_loss": -41.678749084472656, "global_step": 171907, "epoch": 1420} {"train_loss": -41.80833053588867, "global_step": 171908, "epoch": 1420} {"train_loss": -41.1137809753418, "global_step": 171909, "epoch": 1420} {"train_loss": -39.94641876220703, "global_step": 171910, "epoch": 1420} {"train_loss": -40.51158142089844, "global_step": 171911, "epoch": 1420} {"train_loss": -40.98371124267578, "global_step": 171912, "epoch": 1420} {"train_loss": -41.76858901977539, "global_step": 171913, "epoch": 1420} {"train_loss": -41.58112335205078, "global_step": 171914, "epoch": 1420} {"train_loss": -41.241939544677734, "global_step": 171915, "epoch": 1420} {"train_loss": -41.47431564331055, "global_step": 171916, "epoch": 1420} {"train_loss": -41.55801773071289, "global_step": 171917, "epoch": 1420} {"train_loss": -41.52943801879883, "global_step": 171918, "epoch": 1420} {"train_loss": -41.23797607421875, "global_step": 171919, "epoch": 1420} {"train_loss": -41.252315521240234, "global_step": 171920, "epoch": 1420} {"train_loss": -41.42086410522461, "global_step": 171921, "epoch": 1420} {"train_loss": -41.97051239013672, "global_step": 171922, "epoch": 1420} {"train_loss": -40.86727523803711, "global_step": 171923, "epoch": 1420} {"train_loss": -40.90279006958008, "global_step": 171924, "epoch": 1420} {"train_loss": -39.31754684448242, "global_step": 171925, "epoch": 1420} {"train_loss": -40.59510040283203, "global_step": 171926, "epoch": 1420} {"train_loss": -40.45873260498047, "global_step": 171927, "epoch": 1420} {"train_loss": -38.77994918823242, "global_step": 171928, "epoch": 1420} {"train_loss": -38.2044792175293, "global_step": 171929, "epoch": 1420} {"train_loss": -39.20832443237305, "global_step": 171930, "epoch": 1420} {"train_loss": -40.05617141723633, "global_step": 171931, "epoch": 1420} {"train_loss": -38.56692123413086, "global_step": 171932, "epoch": 1420} {"train_loss": -29.973190307617188, "global_step": 171933, "epoch": 1420} {"train_loss": -33.52332305908203, "global_step": 171934, "epoch": 1420} {"train_loss": -35.119728088378906, "global_step": 171935, "epoch": 1420} {"train_loss": -39.295745849609375, "global_step": 171936, "epoch": 1420} {"train_loss": -36.010921478271484, "global_step": 171937, "epoch": 1420} {"train_loss": -35.9844856262207, "global_step": 171938, "epoch": 1420} {"train_loss": -35.181304931640625, "global_step": 171939, "epoch": 1420} {"train_loss": -40.261913709404055, "global_step": 171940, "epoch": 1420, "val_loss": 2494352.25} {"train_loss": -35.40574264526367, "global_step": 171941, "epoch": 1421} {"train_loss": -31.615997314453125, "global_step": 171942, "epoch": 1421} {"train_loss": -38.20429229736328, "global_step": 171943, "epoch": 1421} {"train_loss": -36.57540512084961, "global_step": 171944, "epoch": 1421} {"train_loss": -34.18830108642578, "global_step": 171945, "epoch": 1421} {"train_loss": -35.559600830078125, "global_step": 171946, "epoch": 1421} {"train_loss": -33.585994720458984, "global_step": 171947, "epoch": 1421} {"train_loss": -35.985164642333984, "global_step": 171948, "epoch": 1421} {"train_loss": -34.8657341003418, "global_step": 171949, "epoch": 1421} {"train_loss": -35.7000846862793, "global_step": 171950, "epoch": 1421} {"train_loss": -38.64814376831055, "global_step": 171951, "epoch": 1421} {"train_loss": -35.326541900634766, "global_step": 171952, "epoch": 1421} {"train_loss": -35.969146728515625, "global_step": 171953, "epoch": 1421} {"train_loss": -34.50975036621094, "global_step": 171954, "epoch": 1421} {"train_loss": -35.802555084228516, "global_step": 171955, "epoch": 1421} {"train_loss": -35.30302047729492, "global_step": 171956, "epoch": 1421} {"train_loss": -36.23506546020508, "global_step": 171957, "epoch": 1421} {"train_loss": -35.734249114990234, "global_step": 171958, "epoch": 1421} {"train_loss": -36.2137565612793, "global_step": 171959, "epoch": 1421} {"train_loss": -37.56875228881836, "global_step": 171960, "epoch": 1421} {"train_loss": -35.34507369995117, "global_step": 171961, "epoch": 1421} {"train_loss": -37.76496505737305, "global_step": 171962, "epoch": 1421} {"train_loss": -36.29677963256836, "global_step": 171963, "epoch": 1421} {"train_loss": -33.74309158325195, "global_step": 171964, "epoch": 1421} {"train_loss": -37.65141677856445, "global_step": 171965, "epoch": 1421} {"train_loss": -34.885536193847656, "global_step": 171966, "epoch": 1421} {"train_loss": -37.08369827270508, "global_step": 171967, "epoch": 1421} {"train_loss": -37.069881439208984, "global_step": 171968, "epoch": 1421} {"train_loss": -38.48890686035156, "global_step": 171969, "epoch": 1421} {"train_loss": -38.112545013427734, "global_step": 171970, "epoch": 1421} {"train_loss": -37.0088005065918, "global_step": 171971, "epoch": 1421} {"train_loss": -36.36408233642578, "global_step": 171972, "epoch": 1421} {"train_loss": -36.49634552001953, "global_step": 171973, "epoch": 1421} {"train_loss": -36.82105255126953, "global_step": 171974, "epoch": 1421} {"train_loss": -36.16414260864258, "global_step": 171975, "epoch": 1421} {"train_loss": -37.81410598754883, "global_step": 171976, "epoch": 1421} {"train_loss": -37.32109451293945, "global_step": 171977, "epoch": 1421} {"train_loss": -37.1431770324707, "global_step": 171978, "epoch": 1421} {"train_loss": -37.0242919921875, "global_step": 171979, "epoch": 1421} {"train_loss": -38.978153228759766, "global_step": 171980, "epoch": 1421} {"train_loss": -37.3306999206543, "global_step": 171981, "epoch": 1421} {"train_loss": -39.02722930908203, "global_step": 171982, "epoch": 1421} {"train_loss": -37.4073486328125, "global_step": 171983, "epoch": 1421} {"train_loss": -38.0197868347168, "global_step": 171984, "epoch": 1421} {"train_loss": -38.40778350830078, "global_step": 171985, "epoch": 1421} {"train_loss": -37.929603576660156, "global_step": 171986, "epoch": 1421} {"train_loss": -36.689605712890625, "global_step": 171987, "epoch": 1421} {"train_loss": -38.5084114074707, "global_step": 171988, "epoch": 1421} {"train_loss": -38.58355712890625, "global_step": 171989, "epoch": 1421} {"train_loss": -38.754390716552734, "global_step": 171990, "epoch": 1421} {"train_loss": -38.68998336791992, "global_step": 171991, "epoch": 1421} {"train_loss": -38.92245101928711, "global_step": 171992, "epoch": 1421} {"train_loss": -38.7642822265625, "global_step": 171993, "epoch": 1421} {"train_loss": -39.07719039916992, "global_step": 171994, "epoch": 1421} {"train_loss": -39.81037521362305, "global_step": 171995, "epoch": 1421} {"train_loss": -38.7088737487793, "global_step": 171996, "epoch": 1421} {"train_loss": -39.18280029296875, "global_step": 171997, "epoch": 1421} {"train_loss": -39.423805236816406, "global_step": 171998, "epoch": 1421} {"train_loss": -39.05143356323242, "global_step": 171999, "epoch": 1421} {"train_loss": -38.5593376159668, "global_step": 172000, "epoch": 1421} {"train_loss": -39.06525421142578, "global_step": 172001, "epoch": 1421} {"train_loss": -38.336177825927734, "global_step": 172002, "epoch": 1421} {"train_loss": -39.33814239501953, "global_step": 172003, "epoch": 1421} {"train_loss": -39.779083251953125, "global_step": 172004, "epoch": 1421} {"train_loss": -39.96737289428711, "global_step": 172005, "epoch": 1421} {"train_loss": -39.52764892578125, "global_step": 172006, "epoch": 1421} {"train_loss": -39.71559143066406, "global_step": 172007, "epoch": 1421} {"train_loss": -39.165321350097656, "global_step": 172008, "epoch": 1421} {"train_loss": -39.75248336791992, "global_step": 172009, "epoch": 1421} {"train_loss": -39.83077621459961, "global_step": 172010, "epoch": 1421} {"train_loss": -39.616737365722656, "global_step": 172011, "epoch": 1421} {"train_loss": -39.481040954589844, "global_step": 172012, "epoch": 1421} {"train_loss": -39.92648696899414, "global_step": 172013, "epoch": 1421} {"train_loss": -39.3747673034668, "global_step": 172014, "epoch": 1421} {"train_loss": -40.22483444213867, "global_step": 172015, "epoch": 1421} {"train_loss": -40.264244079589844, "global_step": 172016, "epoch": 1421} {"train_loss": -39.710548400878906, "global_step": 172017, "epoch": 1421} {"train_loss": -39.8208122253418, "global_step": 172018, "epoch": 1421} {"train_loss": -40.06318283081055, "global_step": 172019, "epoch": 1421} {"train_loss": -39.81415939331055, "global_step": 172020, "epoch": 1421} {"train_loss": -39.99325942993164, "global_step": 172021, "epoch": 1421} {"train_loss": -40.18141555786133, "global_step": 172022, "epoch": 1421} {"train_loss": -40.03998565673828, "global_step": 172023, "epoch": 1421} {"train_loss": -40.40609359741211, "global_step": 172024, "epoch": 1421} {"train_loss": -40.50946044921875, "global_step": 172025, "epoch": 1421} {"train_loss": -40.73488235473633, "global_step": 172026, "epoch": 1421} {"train_loss": -40.03058624267578, "global_step": 172027, "epoch": 1421} {"train_loss": -40.17705535888672, "global_step": 172028, "epoch": 1421} {"train_loss": -40.611080169677734, "global_step": 172029, "epoch": 1421} {"train_loss": -40.40424728393555, "global_step": 172030, "epoch": 1421} {"train_loss": -40.32171630859375, "global_step": 172031, "epoch": 1421} {"train_loss": -40.55753707885742, "global_step": 172032, "epoch": 1421} {"train_loss": -40.350067138671875, "global_step": 172033, "epoch": 1421} {"train_loss": -40.139427185058594, "global_step": 172034, "epoch": 1421} {"train_loss": -40.451717376708984, "global_step": 172035, "epoch": 1421} {"train_loss": -41.00257110595703, "global_step": 172036, "epoch": 1421} {"train_loss": -40.34224319458008, "global_step": 172037, "epoch": 1421} {"train_loss": -40.5899543762207, "global_step": 172038, "epoch": 1421} {"train_loss": -40.25335693359375, "global_step": 172039, "epoch": 1421} {"train_loss": -40.753822326660156, "global_step": 172040, "epoch": 1421} {"train_loss": -41.14794158935547, "global_step": 172041, "epoch": 1421} {"train_loss": -40.43812561035156, "global_step": 172042, "epoch": 1421} {"train_loss": -40.83201217651367, "global_step": 172043, "epoch": 1421} {"train_loss": -41.329986572265625, "global_step": 172044, "epoch": 1421} {"train_loss": -40.9048957824707, "global_step": 172045, "epoch": 1421} {"train_loss": -40.916927337646484, "global_step": 172046, "epoch": 1421} {"train_loss": -41.16650390625, "global_step": 172047, "epoch": 1421} {"train_loss": -41.27375411987305, "global_step": 172048, "epoch": 1421} {"train_loss": -41.35416793823242, "global_step": 172049, "epoch": 1421} {"train_loss": -40.17495346069336, "global_step": 172050, "epoch": 1421} {"train_loss": -41.19577407836914, "global_step": 172051, "epoch": 1421} {"train_loss": -41.44157028198242, "global_step": 172052, "epoch": 1421} {"train_loss": -41.133087158203125, "global_step": 172053, "epoch": 1421} {"train_loss": -41.28182601928711, "global_step": 172054, "epoch": 1421} {"train_loss": -40.977962493896484, "global_step": 172055, "epoch": 1421} {"train_loss": -41.18891906738281, "global_step": 172056, "epoch": 1421} {"train_loss": -40.92387771606445, "global_step": 172057, "epoch": 1421} {"train_loss": -41.44266891479492, "global_step": 172058, "epoch": 1421} {"train_loss": -41.33712387084961, "global_step": 172059, "epoch": 1421} {"train_loss": -41.022151947021484, "global_step": 172060, "epoch": 1421} {"train_loss": -38.71721854091676, "global_step": 172061, "epoch": 1421, "val_loss": 2738567.25} {"train_loss": -41.51717758178711, "global_step": 172062, "epoch": 1422} {"train_loss": -40.829429626464844, "global_step": 172063, "epoch": 1422} {"train_loss": -40.335872650146484, "global_step": 172064, "epoch": 1422} {"train_loss": -40.638668060302734, "global_step": 172065, "epoch": 1422} {"train_loss": -41.63127899169922, "global_step": 172066, "epoch": 1422} {"train_loss": -41.81209945678711, "global_step": 172067, "epoch": 1422} {"train_loss": -40.70259475708008, "global_step": 172068, "epoch": 1422} {"train_loss": -40.141902923583984, "global_step": 172069, "epoch": 1422} {"train_loss": -38.70445251464844, "global_step": 172070, "epoch": 1422} {"train_loss": -40.2796745300293, "global_step": 172071, "epoch": 1422} {"train_loss": -40.65481185913086, "global_step": 172072, "epoch": 1422} {"train_loss": -40.419307708740234, "global_step": 172073, "epoch": 1422} {"train_loss": -39.134986877441406, "global_step": 172074, "epoch": 1422} {"train_loss": -37.412200927734375, "global_step": 172075, "epoch": 1422} {"train_loss": -34.18178176879883, "global_step": 172076, "epoch": 1422} {"train_loss": -37.73609161376953, "global_step": 172077, "epoch": 1422} {"train_loss": -40.5895881652832, "global_step": 172078, "epoch": 1422} {"train_loss": -35.84914779663086, "global_step": 172079, "epoch": 1422} {"train_loss": -34.551361083984375, "global_step": 172080, "epoch": 1422} {"train_loss": -39.79436492919922, "global_step": 172081, "epoch": 1422} {"train_loss": -39.24748611450195, "global_step": 172082, "epoch": 1422} {"train_loss": -36.535709381103516, "global_step": 172083, "epoch": 1422} {"train_loss": -40.65035629272461, "global_step": 172084, "epoch": 1422} {"train_loss": -37.7843017578125, "global_step": 172085, "epoch": 1422} {"train_loss": -38.02777099609375, "global_step": 172086, "epoch": 1422} {"train_loss": -38.9672737121582, "global_step": 172087, "epoch": 1422} {"train_loss": -39.150787353515625, "global_step": 172088, "epoch": 1422} {"train_loss": -40.95570755004883, "global_step": 172089, "epoch": 1422} {"train_loss": -39.452938079833984, "global_step": 172090, "epoch": 1422} {"train_loss": -40.48249435424805, "global_step": 172091, "epoch": 1422} {"train_loss": -40.167938232421875, "global_step": 172092, "epoch": 1422} {"train_loss": -40.032405853271484, "global_step": 172093, "epoch": 1422} {"train_loss": -40.19588851928711, "global_step": 172094, "epoch": 1422} {"train_loss": -40.378395080566406, "global_step": 172095, "epoch": 1422} {"train_loss": -39.28693771362305, "global_step": 172096, "epoch": 1422} {"train_loss": -40.30160140991211, "global_step": 172097, "epoch": 1422} {"train_loss": -40.03333282470703, "global_step": 172098, "epoch": 1422} {"train_loss": -40.6877326965332, "global_step": 172099, "epoch": 1422} {"train_loss": -40.816139221191406, "global_step": 172100, "epoch": 1422} {"train_loss": -39.530067443847656, "global_step": 172101, "epoch": 1422} {"train_loss": -40.93550491333008, "global_step": 172102, "epoch": 1422} {"train_loss": -40.95961380004883, "global_step": 172103, "epoch": 1422} {"train_loss": -40.862586975097656, "global_step": 172104, "epoch": 1422} {"train_loss": -40.43390655517578, "global_step": 172105, "epoch": 1422} {"train_loss": -40.942596435546875, "global_step": 172106, "epoch": 1422} {"train_loss": -41.221370697021484, "global_step": 172107, "epoch": 1422} {"train_loss": -40.978878021240234, "global_step": 172108, "epoch": 1422} {"train_loss": -40.555389404296875, "global_step": 172109, "epoch": 1422} {"train_loss": -40.111751556396484, "global_step": 172110, "epoch": 1422} {"train_loss": -41.45708084106445, "global_step": 172111, "epoch": 1422} {"train_loss": -40.524810791015625, "global_step": 172112, "epoch": 1422} {"train_loss": -41.267059326171875, "global_step": 172113, "epoch": 1422} {"train_loss": -40.122344970703125, "global_step": 172114, "epoch": 1422} {"train_loss": -40.63105392456055, "global_step": 172115, "epoch": 1422} {"train_loss": -40.13163757324219, "global_step": 172116, "epoch": 1422} {"train_loss": -40.07556915283203, "global_step": 172117, "epoch": 1422} {"train_loss": -41.184913635253906, "global_step": 172118, "epoch": 1422} {"train_loss": -41.5507698059082, "global_step": 172119, "epoch": 1422} {"train_loss": -41.373661041259766, "global_step": 172120, "epoch": 1422} {"train_loss": -40.97966384887695, "global_step": 172121, "epoch": 1422} {"train_loss": -41.0700798034668, "global_step": 172122, "epoch": 1422} {"train_loss": -41.13677215576172, "global_step": 172123, "epoch": 1422} {"train_loss": -40.94903564453125, "global_step": 172124, "epoch": 1422} {"train_loss": -41.289642333984375, "global_step": 172125, "epoch": 1422} {"train_loss": -41.292266845703125, "global_step": 172126, "epoch": 1422} {"train_loss": -41.190155029296875, "global_step": 172127, "epoch": 1422} {"train_loss": -41.2666130065918, "global_step": 172128, "epoch": 1422} {"train_loss": -40.72334671020508, "global_step": 172129, "epoch": 1422} {"train_loss": -41.818023681640625, "global_step": 172130, "epoch": 1422} {"train_loss": -41.35946273803711, "global_step": 172131, "epoch": 1422} {"train_loss": -41.090797424316406, "global_step": 172132, "epoch": 1422} {"train_loss": -41.45253372192383, "global_step": 172133, "epoch": 1422} {"train_loss": -41.04480743408203, "global_step": 172134, "epoch": 1422} {"train_loss": -41.629329681396484, "global_step": 172135, "epoch": 1422} {"train_loss": -40.85882568359375, "global_step": 172136, "epoch": 1422} {"train_loss": -41.77216720581055, "global_step": 172137, "epoch": 1422} {"train_loss": -41.81562805175781, "global_step": 172138, "epoch": 1422} {"train_loss": -41.14531707763672, "global_step": 172139, "epoch": 1422} {"train_loss": -39.96070861816406, "global_step": 172140, "epoch": 1422} {"train_loss": -40.92763137817383, "global_step": 172141, "epoch": 1422} {"train_loss": -39.49262237548828, "global_step": 172142, "epoch": 1422} {"train_loss": -40.90303421020508, "global_step": 172143, "epoch": 1422} {"train_loss": -40.8076286315918, "global_step": 172144, "epoch": 1422} {"train_loss": -40.98929977416992, "global_step": 172145, "epoch": 1422} {"train_loss": -40.80814743041992, "global_step": 172146, "epoch": 1422} {"train_loss": -40.72789764404297, "global_step": 172147, "epoch": 1422} {"train_loss": -40.624385833740234, "global_step": 172148, "epoch": 1422} {"train_loss": -39.40348815917969, "global_step": 172149, "epoch": 1422} {"train_loss": -40.08955001831055, "global_step": 172150, "epoch": 1422} {"train_loss": -40.840484619140625, "global_step": 172151, "epoch": 1422} {"train_loss": -41.09992599487305, "global_step": 172152, "epoch": 1422} {"train_loss": -41.38815689086914, "global_step": 172153, "epoch": 1422} {"train_loss": -39.25148010253906, "global_step": 172154, "epoch": 1422} {"train_loss": -38.42926025390625, "global_step": 172155, "epoch": 1422} {"train_loss": -40.38368606567383, "global_step": 172156, "epoch": 1422} {"train_loss": -39.47395706176758, "global_step": 172157, "epoch": 1422} {"train_loss": -40.677581787109375, "global_step": 172158, "epoch": 1422} {"train_loss": -38.92306137084961, "global_step": 172159, "epoch": 1422} {"train_loss": -36.58244705200195, "global_step": 172160, "epoch": 1422} {"train_loss": -36.72309494018555, "global_step": 172161, "epoch": 1422} {"train_loss": -35.649200439453125, "global_step": 172162, "epoch": 1422} {"train_loss": -35.58585739135742, "global_step": 172163, "epoch": 1422} {"train_loss": -36.73103332519531, "global_step": 172164, "epoch": 1422} {"train_loss": -36.55355453491211, "global_step": 172165, "epoch": 1422} {"train_loss": -39.84039306640625, "global_step": 172166, "epoch": 1422} {"train_loss": -38.9469108581543, "global_step": 172167, "epoch": 1422} {"train_loss": -38.003353118896484, "global_step": 172168, "epoch": 1422} {"train_loss": -39.173038482666016, "global_step": 172169, "epoch": 1422} {"train_loss": -39.55721664428711, "global_step": 172170, "epoch": 1422} {"train_loss": -38.29679489135742, "global_step": 172171, "epoch": 1422} {"train_loss": -38.453006744384766, "global_step": 172172, "epoch": 1422} {"train_loss": -38.6251335144043, "global_step": 172173, "epoch": 1422} {"train_loss": -40.05633544921875, "global_step": 172174, "epoch": 1422} {"train_loss": -39.399139404296875, "global_step": 172175, "epoch": 1422} {"train_loss": -39.410396575927734, "global_step": 172176, "epoch": 1422} {"train_loss": -40.10505294799805, "global_step": 172177, "epoch": 1422} {"train_loss": -39.417720794677734, "global_step": 172178, "epoch": 1422} {"train_loss": -39.742916107177734, "global_step": 172179, "epoch": 1422} {"train_loss": -39.966644287109375, "global_step": 172180, "epoch": 1422} {"train_loss": -40.467098236083984, "global_step": 172181, "epoch": 1422} {"train_loss": -39.9230573669938, "global_step": 172182, "epoch": 1422, "val_loss": 2756949.0} {"train_loss": -39.7938232421875, "global_step": 172183, "epoch": 1423} {"train_loss": -38.89182662963867, "global_step": 172184, "epoch": 1423} {"train_loss": -41.13682174682617, "global_step": 172185, "epoch": 1423} {"train_loss": -39.075809478759766, "global_step": 172186, "epoch": 1423} {"train_loss": -40.35126876831055, "global_step": 172187, "epoch": 1423} {"train_loss": -40.31764602661133, "global_step": 172188, "epoch": 1423} {"train_loss": -39.918270111083984, "global_step": 172189, "epoch": 1423} {"train_loss": -39.16206741333008, "global_step": 172190, "epoch": 1423} {"train_loss": -39.052040100097656, "global_step": 172191, "epoch": 1423} {"train_loss": -39.53583908081055, "global_step": 172192, "epoch": 1423} {"train_loss": -39.600399017333984, "global_step": 172193, "epoch": 1423} {"train_loss": -41.02426528930664, "global_step": 172194, "epoch": 1423} {"train_loss": -40.018531799316406, "global_step": 172195, "epoch": 1423} {"train_loss": -40.70216751098633, "global_step": 172196, "epoch": 1423} {"train_loss": -40.54045486450195, "global_step": 172197, "epoch": 1423} {"train_loss": -40.489662170410156, "global_step": 172198, "epoch": 1423} {"train_loss": -40.687984466552734, "global_step": 172199, "epoch": 1423} {"train_loss": -40.13385009765625, "global_step": 172200, "epoch": 1423} {"train_loss": -40.69517135620117, "global_step": 172201, "epoch": 1423} {"train_loss": -40.4017448425293, "global_step": 172202, "epoch": 1423} {"train_loss": -40.70361328125, "global_step": 172203, "epoch": 1423} {"train_loss": -40.26900863647461, "global_step": 172204, "epoch": 1423} {"train_loss": -40.607723236083984, "global_step": 172205, "epoch": 1423} {"train_loss": -41.27268600463867, "global_step": 172206, "epoch": 1423} {"train_loss": -41.02458572387695, "global_step": 172207, "epoch": 1423} {"train_loss": -41.06318283081055, "global_step": 172208, "epoch": 1423} {"train_loss": -41.17457962036133, "global_step": 172209, "epoch": 1423} {"train_loss": -40.860740661621094, "global_step": 172210, "epoch": 1423} {"train_loss": -40.41945266723633, "global_step": 172211, "epoch": 1423} {"train_loss": -39.911094665527344, "global_step": 172212, "epoch": 1423} {"train_loss": -41.39363098144531, "global_step": 172213, "epoch": 1423} {"train_loss": -41.590980529785156, "global_step": 172214, "epoch": 1423} {"train_loss": -40.36180114746094, "global_step": 172215, "epoch": 1423} {"train_loss": -41.04917526245117, "global_step": 172216, "epoch": 1423} {"train_loss": -41.29828643798828, "global_step": 172217, "epoch": 1423} {"train_loss": -41.4363899230957, "global_step": 172218, "epoch": 1423} {"train_loss": -41.41702651977539, "global_step": 172219, "epoch": 1423} {"train_loss": -38.91750717163086, "global_step": 172220, "epoch": 1423} {"train_loss": -41.00453567504883, "global_step": 172221, "epoch": 1423} {"train_loss": -41.668975830078125, "global_step": 172222, "epoch": 1423} {"train_loss": -41.50823974609375, "global_step": 172223, "epoch": 1423} {"train_loss": -41.46479797363281, "global_step": 172224, "epoch": 1423} {"train_loss": -41.48768997192383, "global_step": 172225, "epoch": 1423} {"train_loss": -39.44536590576172, "global_step": 172226, "epoch": 1423} {"train_loss": -41.28950881958008, "global_step": 172227, "epoch": 1423} {"train_loss": -41.343482971191406, "global_step": 172228, "epoch": 1423} {"train_loss": -41.737037658691406, "global_step": 172229, "epoch": 1423} {"train_loss": -41.56150436401367, "global_step": 172230, "epoch": 1423} {"train_loss": -41.29656982421875, "global_step": 172231, "epoch": 1423} {"train_loss": -41.53164291381836, "global_step": 172232, "epoch": 1423} {"train_loss": -41.47443771362305, "global_step": 172233, "epoch": 1423} {"train_loss": -41.61594772338867, "global_step": 172234, "epoch": 1423} {"train_loss": -41.309295654296875, "global_step": 172235, "epoch": 1423} {"train_loss": -41.724788665771484, "global_step": 172236, "epoch": 1423} {"train_loss": -41.359371185302734, "global_step": 172237, "epoch": 1423} {"train_loss": -41.93699645996094, "global_step": 172238, "epoch": 1423} {"train_loss": -41.72896194458008, "global_step": 172239, "epoch": 1423} {"train_loss": -41.811370849609375, "global_step": 172240, "epoch": 1423} {"train_loss": -41.90403366088867, "global_step": 172241, "epoch": 1423} {"train_loss": -41.059200286865234, "global_step": 172242, "epoch": 1423} {"train_loss": -41.54248046875, "global_step": 172243, "epoch": 1423} {"train_loss": -41.38163375854492, "global_step": 172244, "epoch": 1423} {"train_loss": -40.22536849975586, "global_step": 172245, "epoch": 1423} {"train_loss": -38.55772018432617, "global_step": 172246, "epoch": 1423} {"train_loss": -41.11542892456055, "global_step": 172247, "epoch": 1423} {"train_loss": -40.084434509277344, "global_step": 172248, "epoch": 1423} {"train_loss": -41.1959228515625, "global_step": 172249, "epoch": 1423} {"train_loss": -40.32977294921875, "global_step": 172250, "epoch": 1423} {"train_loss": -38.284942626953125, "global_step": 172251, "epoch": 1423} {"train_loss": -40.70448684692383, "global_step": 172252, "epoch": 1423} {"train_loss": -38.17953109741211, "global_step": 172253, "epoch": 1423} {"train_loss": -38.547462463378906, "global_step": 172254, "epoch": 1423} {"train_loss": -40.39430236816406, "global_step": 172255, "epoch": 1423} {"train_loss": -39.97275924682617, "global_step": 172256, "epoch": 1423} {"train_loss": -40.258243560791016, "global_step": 172257, "epoch": 1423} {"train_loss": -39.6607666015625, "global_step": 172258, "epoch": 1423} {"train_loss": -39.616519927978516, "global_step": 172259, "epoch": 1423} {"train_loss": -41.01513671875, "global_step": 172260, "epoch": 1423} {"train_loss": -39.88479232788086, "global_step": 172261, "epoch": 1423} {"train_loss": -38.82890701293945, "global_step": 172262, "epoch": 1423} {"train_loss": -38.81743621826172, "global_step": 172263, "epoch": 1423} {"train_loss": -40.11117172241211, "global_step": 172264, "epoch": 1423} {"train_loss": -40.4713249206543, "global_step": 172265, "epoch": 1423} {"train_loss": -39.56290817260742, "global_step": 172266, "epoch": 1423} {"train_loss": -40.444297790527344, "global_step": 172267, "epoch": 1423} {"train_loss": -38.94013214111328, "global_step": 172268, "epoch": 1423} {"train_loss": -37.40248489379883, "global_step": 172269, "epoch": 1423} {"train_loss": -40.57451248168945, "global_step": 172270, "epoch": 1423} {"train_loss": -39.8795166015625, "global_step": 172271, "epoch": 1423} {"train_loss": -39.29815673828125, "global_step": 172272, "epoch": 1423} {"train_loss": -39.776737213134766, "global_step": 172273, "epoch": 1423} {"train_loss": -39.63124465942383, "global_step": 172274, "epoch": 1423} {"train_loss": -40.139888763427734, "global_step": 172275, "epoch": 1423} {"train_loss": -40.813114166259766, "global_step": 172276, "epoch": 1423} {"train_loss": -40.86591339111328, "global_step": 172277, "epoch": 1423} {"train_loss": -40.50595474243164, "global_step": 172278, "epoch": 1423} {"train_loss": -39.26258087158203, "global_step": 172279, "epoch": 1423} {"train_loss": -39.61434555053711, "global_step": 172280, "epoch": 1423} {"train_loss": -40.1787109375, "global_step": 172281, "epoch": 1423} {"train_loss": -40.995506286621094, "global_step": 172282, "epoch": 1423} {"train_loss": -40.67265701293945, "global_step": 172283, "epoch": 1423} {"train_loss": -40.68379592895508, "global_step": 172284, "epoch": 1423} {"train_loss": -39.3863410949707, "global_step": 172285, "epoch": 1423} {"train_loss": -40.293575286865234, "global_step": 172286, "epoch": 1423} {"train_loss": -40.276824951171875, "global_step": 172287, "epoch": 1423} {"train_loss": -40.161170959472656, "global_step": 172288, "epoch": 1423} {"train_loss": -40.685516357421875, "global_step": 172289, "epoch": 1423} {"train_loss": -39.8734245300293, "global_step": 172290, "epoch": 1423} {"train_loss": -39.92312240600586, "global_step": 172291, "epoch": 1423} {"train_loss": -40.32084274291992, "global_step": 172292, "epoch": 1423} {"train_loss": -39.92196273803711, "global_step": 172293, "epoch": 1423} {"train_loss": -39.48230743408203, "global_step": 172294, "epoch": 1423} {"train_loss": -40.629878997802734, "global_step": 172295, "epoch": 1423} {"train_loss": -41.08441925048828, "global_step": 172296, "epoch": 1423} {"train_loss": -40.899635314941406, "global_step": 172297, "epoch": 1423} {"train_loss": -40.978206634521484, "global_step": 172298, "epoch": 1423} {"train_loss": -39.02755355834961, "global_step": 172299, "epoch": 1423} {"train_loss": -40.57529067993164, "global_step": 172300, "epoch": 1423} {"train_loss": -38.58043670654297, "global_step": 172301, "epoch": 1423} {"train_loss": -40.15199279785156, "global_step": 172302, "epoch": 1423} {"train_loss": -40.400316033481566, "global_step": 172303, "epoch": 1423, "val_loss": 2758558.5} {"train_loss": -37.629638671875, "global_step": 172304, "epoch": 1424} {"train_loss": -40.23038864135742, "global_step": 172305, "epoch": 1424} {"train_loss": -40.59932327270508, "global_step": 172306, "epoch": 1424} {"train_loss": -40.79877853393555, "global_step": 172307, "epoch": 1424} {"train_loss": -32.847862243652344, "global_step": 172308, "epoch": 1424} {"train_loss": -39.143314361572266, "global_step": 172309, "epoch": 1424} {"train_loss": -39.6239128112793, "global_step": 172310, "epoch": 1424} {"train_loss": -40.390830993652344, "global_step": 172311, "epoch": 1424} {"train_loss": -40.5750617980957, "global_step": 172312, "epoch": 1424} {"train_loss": -38.82063674926758, "global_step": 172313, "epoch": 1424} {"train_loss": -38.97378158569336, "global_step": 172314, "epoch": 1424} {"train_loss": -41.000221252441406, "global_step": 172315, "epoch": 1424} {"train_loss": -37.7532958984375, "global_step": 172316, "epoch": 1424} {"train_loss": -38.17084884643555, "global_step": 172317, "epoch": 1424} {"train_loss": -40.277626037597656, "global_step": 172318, "epoch": 1424} {"train_loss": -40.13511276245117, "global_step": 172319, "epoch": 1424} {"train_loss": -39.05355453491211, "global_step": 172320, "epoch": 1424} {"train_loss": -39.262542724609375, "global_step": 172321, "epoch": 1424} {"train_loss": -39.276126861572266, "global_step": 172322, "epoch": 1424} {"train_loss": -38.75631332397461, "global_step": 172323, "epoch": 1424} {"train_loss": -40.75528335571289, "global_step": 172324, "epoch": 1424} {"train_loss": -39.221954345703125, "global_step": 172325, "epoch": 1424} {"train_loss": -38.42244338989258, "global_step": 172326, "epoch": 1424} {"train_loss": -40.125274658203125, "global_step": 172327, "epoch": 1424} {"train_loss": -37.742427825927734, "global_step": 172328, "epoch": 1424} {"train_loss": -40.02861404418945, "global_step": 172329, "epoch": 1424} {"train_loss": -40.2004508972168, "global_step": 172330, "epoch": 1424} {"train_loss": -40.37510299682617, "global_step": 172331, "epoch": 1424} {"train_loss": -39.6292839050293, "global_step": 172332, "epoch": 1424} {"train_loss": -40.031768798828125, "global_step": 172333, "epoch": 1424} {"train_loss": -38.132423400878906, "global_step": 172334, "epoch": 1424} {"train_loss": -38.34330368041992, "global_step": 172335, "epoch": 1424} {"train_loss": -40.44108200073242, "global_step": 172336, "epoch": 1424} {"train_loss": -40.53803253173828, "global_step": 172337, "epoch": 1424} {"train_loss": -40.137752532958984, "global_step": 172338, "epoch": 1424} {"train_loss": -39.44551467895508, "global_step": 172339, "epoch": 1424} {"train_loss": -39.840850830078125, "global_step": 172340, "epoch": 1424} {"train_loss": -40.637813568115234, "global_step": 172341, "epoch": 1424} {"train_loss": -41.01534652709961, "global_step": 172342, "epoch": 1424} {"train_loss": -39.78003692626953, "global_step": 172343, "epoch": 1424} {"train_loss": -41.17524337768555, "global_step": 172344, "epoch": 1424} {"train_loss": -39.74737548828125, "global_step": 172345, "epoch": 1424} {"train_loss": -40.37862014770508, "global_step": 172346, "epoch": 1424} {"train_loss": -39.975399017333984, "global_step": 172347, "epoch": 1424} {"train_loss": -39.78679275512695, "global_step": 172348, "epoch": 1424} {"train_loss": -40.32789611816406, "global_step": 172349, "epoch": 1424} {"train_loss": -41.02961349487305, "global_step": 172350, "epoch": 1424} {"train_loss": -40.206275939941406, "global_step": 172351, "epoch": 1424} {"train_loss": -37.18084716796875, "global_step": 172352, "epoch": 1424} {"train_loss": -40.75483322143555, "global_step": 172353, "epoch": 1424} {"train_loss": -40.209564208984375, "global_step": 172354, "epoch": 1424} {"train_loss": -38.86533737182617, "global_step": 172355, "epoch": 1424} {"train_loss": -39.18584060668945, "global_step": 172356, "epoch": 1424} {"train_loss": -38.422786712646484, "global_step": 172357, "epoch": 1424} {"train_loss": -38.546783447265625, "global_step": 172358, "epoch": 1424} {"train_loss": -40.554603576660156, "global_step": 172359, "epoch": 1424} {"train_loss": -37.1881217956543, "global_step": 172360, "epoch": 1424} {"train_loss": -37.280338287353516, "global_step": 172361, "epoch": 1424} {"train_loss": -38.71978759765625, "global_step": 172362, "epoch": 1424} {"train_loss": -37.210018157958984, "global_step": 172363, "epoch": 1424} {"train_loss": -38.911373138427734, "global_step": 172364, "epoch": 1424} {"train_loss": -38.49143981933594, "global_step": 172365, "epoch": 1424} {"train_loss": -36.9484748840332, "global_step": 172366, "epoch": 1424} {"train_loss": -40.689903259277344, "global_step": 172367, "epoch": 1424} {"train_loss": -39.11222839355469, "global_step": 172368, "epoch": 1424} {"train_loss": -39.781307220458984, "global_step": 172369, "epoch": 1424} {"train_loss": -39.25170135498047, "global_step": 172370, "epoch": 1424} {"train_loss": -37.403717041015625, "global_step": 172371, "epoch": 1424} {"train_loss": -37.89418411254883, "global_step": 172372, "epoch": 1424} {"train_loss": -38.75598907470703, "global_step": 172373, "epoch": 1424} {"train_loss": -38.39803695678711, "global_step": 172374, "epoch": 1424} {"train_loss": -40.1331787109375, "global_step": 172375, "epoch": 1424} {"train_loss": -39.429073333740234, "global_step": 172376, "epoch": 1424} {"train_loss": -39.838645935058594, "global_step": 172377, "epoch": 1424} {"train_loss": -40.32160186767578, "global_step": 172378, "epoch": 1424} {"train_loss": -39.40087127685547, "global_step": 172379, "epoch": 1424} {"train_loss": -38.79206085205078, "global_step": 172380, "epoch": 1424} {"train_loss": -40.31301498413086, "global_step": 172381, "epoch": 1424} {"train_loss": -40.13805389404297, "global_step": 172382, "epoch": 1424} {"train_loss": -40.78622055053711, "global_step": 172383, "epoch": 1424} {"train_loss": -38.75556564331055, "global_step": 172384, "epoch": 1424} {"train_loss": -37.1522216796875, "global_step": 172385, "epoch": 1424} {"train_loss": -39.812740325927734, "global_step": 172386, "epoch": 1424} {"train_loss": -39.598175048828125, "global_step": 172387, "epoch": 1424} {"train_loss": -39.676998138427734, "global_step": 172388, "epoch": 1424} {"train_loss": -40.08401870727539, "global_step": 172389, "epoch": 1424} {"train_loss": -40.235530853271484, "global_step": 172390, "epoch": 1424} {"train_loss": -38.94388961791992, "global_step": 172391, "epoch": 1424} {"train_loss": -40.36788558959961, "global_step": 172392, "epoch": 1424} {"train_loss": -40.31087875366211, "global_step": 172393, "epoch": 1424} {"train_loss": -39.3174934387207, "global_step": 172394, "epoch": 1424} {"train_loss": -40.33513641357422, "global_step": 172395, "epoch": 1424} {"train_loss": -40.58523941040039, "global_step": 172396, "epoch": 1424} {"train_loss": -40.53208541870117, "global_step": 172397, "epoch": 1424} {"train_loss": -39.87697982788086, "global_step": 172398, "epoch": 1424} {"train_loss": -40.40932083129883, "global_step": 172399, "epoch": 1424} {"train_loss": -40.324432373046875, "global_step": 172400, "epoch": 1424} {"train_loss": -40.2079963684082, "global_step": 172401, "epoch": 1424} {"train_loss": -41.1461296081543, "global_step": 172402, "epoch": 1424} {"train_loss": -39.49809646606445, "global_step": 172403, "epoch": 1424} {"train_loss": -40.56850814819336, "global_step": 172404, "epoch": 1424} {"train_loss": -41.20392990112305, "global_step": 172405, "epoch": 1424} {"train_loss": -40.708614349365234, "global_step": 172406, "epoch": 1424} {"train_loss": -39.67600631713867, "global_step": 172407, "epoch": 1424} {"train_loss": -40.97761154174805, "global_step": 172408, "epoch": 1424} {"train_loss": -39.87577438354492, "global_step": 172409, "epoch": 1424} {"train_loss": -40.7273063659668, "global_step": 172410, "epoch": 1424} {"train_loss": -40.99394607543945, "global_step": 172411, "epoch": 1424} {"train_loss": -40.052974700927734, "global_step": 172412, "epoch": 1424} {"train_loss": -40.81277084350586, "global_step": 172413, "epoch": 1424} {"train_loss": -39.344905853271484, "global_step": 172414, "epoch": 1424} {"train_loss": -40.5103645324707, "global_step": 172415, "epoch": 1424} {"train_loss": -41.10516357421875, "global_step": 172416, "epoch": 1424} {"train_loss": -40.532283782958984, "global_step": 172417, "epoch": 1424} {"train_loss": -40.56955337524414, "global_step": 172418, "epoch": 1424} {"train_loss": -41.27058410644531, "global_step": 172419, "epoch": 1424} {"train_loss": -40.47035217285156, "global_step": 172420, "epoch": 1424} {"train_loss": -40.6976203918457, "global_step": 172421, "epoch": 1424} {"train_loss": -40.6636962890625, "global_step": 172422, "epoch": 1424} {"train_loss": -41.0450553894043, "global_step": 172423, "epoch": 1424} {"train_loss": -39.66343865512816, "global_step": 172424, "epoch": 1424, "val_loss": 2787585.5} {"train_loss": -41.53349685668945, "global_step": 172425, "epoch": 1425} {"train_loss": -41.24599075317383, "global_step": 172426, "epoch": 1425} {"train_loss": -41.176368713378906, "global_step": 172427, "epoch": 1425} {"train_loss": -40.84622573852539, "global_step": 172428, "epoch": 1425} {"train_loss": -41.13934326171875, "global_step": 172429, "epoch": 1425} {"train_loss": -39.96732711791992, "global_step": 172430, "epoch": 1425} {"train_loss": -40.578369140625, "global_step": 172431, "epoch": 1425} {"train_loss": -39.16160202026367, "global_step": 172432, "epoch": 1425} {"train_loss": -36.5036506652832, "global_step": 172433, "epoch": 1425} {"train_loss": -34.656532287597656, "global_step": 172434, "epoch": 1425} {"train_loss": -35.32431411743164, "global_step": 172435, "epoch": 1425} {"train_loss": -38.614864349365234, "global_step": 172436, "epoch": 1425} {"train_loss": -40.34471893310547, "global_step": 172437, "epoch": 1425} {"train_loss": -39.3902473449707, "global_step": 172438, "epoch": 1425} {"train_loss": -37.23647689819336, "global_step": 172439, "epoch": 1425} {"train_loss": -39.3072509765625, "global_step": 172440, "epoch": 1425} {"train_loss": -41.23554992675781, "global_step": 172441, "epoch": 1425} {"train_loss": -39.63962936401367, "global_step": 172442, "epoch": 1425} {"train_loss": -38.513057708740234, "global_step": 172443, "epoch": 1425} {"train_loss": -40.90363311767578, "global_step": 172444, "epoch": 1425} {"train_loss": -37.90153503417969, "global_step": 172445, "epoch": 1425} {"train_loss": -39.55219650268555, "global_step": 172446, "epoch": 1425} {"train_loss": -40.55901336669922, "global_step": 172447, "epoch": 1425} {"train_loss": -40.67797088623047, "global_step": 172448, "epoch": 1425} {"train_loss": -39.74058151245117, "global_step": 172449, "epoch": 1425} {"train_loss": -39.98700714111328, "global_step": 172450, "epoch": 1425} {"train_loss": -39.75201416015625, "global_step": 172451, "epoch": 1425} {"train_loss": -40.01176071166992, "global_step": 172452, "epoch": 1425} {"train_loss": -39.59053421020508, "global_step": 172453, "epoch": 1425} {"train_loss": -39.192169189453125, "global_step": 172454, "epoch": 1425} {"train_loss": -40.796897888183594, "global_step": 172455, "epoch": 1425} {"train_loss": -40.19456100463867, "global_step": 172456, "epoch": 1425} {"train_loss": -39.82924270629883, "global_step": 172457, "epoch": 1425} {"train_loss": -39.712406158447266, "global_step": 172458, "epoch": 1425} {"train_loss": -40.67429733276367, "global_step": 172459, "epoch": 1425} {"train_loss": -40.00962448120117, "global_step": 172460, "epoch": 1425} {"train_loss": -40.81270980834961, "global_step": 172461, "epoch": 1425} {"train_loss": -39.738094329833984, "global_step": 172462, "epoch": 1425} {"train_loss": -39.52471923828125, "global_step": 172463, "epoch": 1425} {"train_loss": -39.91953659057617, "global_step": 172464, "epoch": 1425} {"train_loss": -40.405921936035156, "global_step": 172465, "epoch": 1425} {"train_loss": -40.32114791870117, "global_step": 172466, "epoch": 1425} {"train_loss": -40.37639236450195, "global_step": 172467, "epoch": 1425} {"train_loss": -40.92271041870117, "global_step": 172468, "epoch": 1425} {"train_loss": -38.19204330444336, "global_step": 172469, "epoch": 1425} {"train_loss": -39.959686279296875, "global_step": 172470, "epoch": 1425} {"train_loss": -40.78585433959961, "global_step": 172471, "epoch": 1425} {"train_loss": -38.4477653503418, "global_step": 172472, "epoch": 1425} {"train_loss": -40.10884475708008, "global_step": 172473, "epoch": 1425} {"train_loss": -40.705299377441406, "global_step": 172474, "epoch": 1425} {"train_loss": -40.33289337158203, "global_step": 172475, "epoch": 1425} {"train_loss": -39.774688720703125, "global_step": 172476, "epoch": 1425} {"train_loss": -39.587074279785156, "global_step": 172477, "epoch": 1425} {"train_loss": -39.85496139526367, "global_step": 172478, "epoch": 1425} {"train_loss": -40.167720794677734, "global_step": 172479, "epoch": 1425} {"train_loss": -38.813961029052734, "global_step": 172480, "epoch": 1425} {"train_loss": -40.5970458984375, "global_step": 172481, "epoch": 1425} {"train_loss": -39.88357162475586, "global_step": 172482, "epoch": 1425} {"train_loss": -39.7153205871582, "global_step": 172483, "epoch": 1425} {"train_loss": -40.906673431396484, "global_step": 172484, "epoch": 1425} {"train_loss": -40.34701156616211, "global_step": 172485, "epoch": 1425} {"train_loss": -40.636695861816406, "global_step": 172486, "epoch": 1425} {"train_loss": -41.20441818237305, "global_step": 172487, "epoch": 1425} {"train_loss": -40.85693359375, "global_step": 172488, "epoch": 1425} {"train_loss": -40.4250373840332, "global_step": 172489, "epoch": 1425} {"train_loss": -40.66396713256836, "global_step": 172490, "epoch": 1425} {"train_loss": -40.72837829589844, "global_step": 172491, "epoch": 1425} {"train_loss": -41.02420425415039, "global_step": 172492, "epoch": 1425} {"train_loss": -41.01040267944336, "global_step": 172493, "epoch": 1425} {"train_loss": -40.31986618041992, "global_step": 172494, "epoch": 1425} {"train_loss": -41.57025909423828, "global_step": 172495, "epoch": 1425} {"train_loss": -40.459842681884766, "global_step": 172496, "epoch": 1425} {"train_loss": -41.045196533203125, "global_step": 172497, "epoch": 1425} {"train_loss": -41.032997131347656, "global_step": 172498, "epoch": 1425} {"train_loss": -41.18368148803711, "global_step": 172499, "epoch": 1425} {"train_loss": -40.751258850097656, "global_step": 172500, "epoch": 1425} {"train_loss": -40.96845245361328, "global_step": 172501, "epoch": 1425} {"train_loss": -40.95754623413086, "global_step": 172502, "epoch": 1425} {"train_loss": -40.84870529174805, "global_step": 172503, "epoch": 1425} {"train_loss": -41.44955062866211, "global_step": 172504, "epoch": 1425} {"train_loss": -41.32625961303711, "global_step": 172505, "epoch": 1425} {"train_loss": -40.5334587097168, "global_step": 172506, "epoch": 1425} {"train_loss": -40.78925323486328, "global_step": 172507, "epoch": 1425} {"train_loss": -41.41352081298828, "global_step": 172508, "epoch": 1425} {"train_loss": -41.109256744384766, "global_step": 172509, "epoch": 1425} {"train_loss": -41.234031677246094, "global_step": 172510, "epoch": 1425} {"train_loss": -41.526275634765625, "global_step": 172511, "epoch": 1425} {"train_loss": -41.0054931640625, "global_step": 172512, "epoch": 1425} {"train_loss": -40.597137451171875, "global_step": 172513, "epoch": 1425} {"train_loss": -41.376583099365234, "global_step": 172514, "epoch": 1425} {"train_loss": -41.48775100708008, "global_step": 172515, "epoch": 1425} {"train_loss": -41.13151550292969, "global_step": 172516, "epoch": 1425} {"train_loss": -40.580135345458984, "global_step": 172517, "epoch": 1425} {"train_loss": -41.268898010253906, "global_step": 172518, "epoch": 1425} {"train_loss": -41.30488967895508, "global_step": 172519, "epoch": 1425} {"train_loss": -39.963050842285156, "global_step": 172520, "epoch": 1425} {"train_loss": -40.572425842285156, "global_step": 172521, "epoch": 1425} {"train_loss": -40.925437927246094, "global_step": 172522, "epoch": 1425} {"train_loss": -42.0058708190918, "global_step": 172523, "epoch": 1425} {"train_loss": -41.557891845703125, "global_step": 172524, "epoch": 1425} {"train_loss": -41.57454299926758, "global_step": 172525, "epoch": 1425} {"train_loss": -41.21589279174805, "global_step": 172526, "epoch": 1425} {"train_loss": -42.096099853515625, "global_step": 172527, "epoch": 1425} {"train_loss": -41.57917785644531, "global_step": 172528, "epoch": 1425} {"train_loss": -41.33258819580078, "global_step": 172529, "epoch": 1425} {"train_loss": -41.15385055541992, "global_step": 172530, "epoch": 1425} {"train_loss": -40.93695831298828, "global_step": 172531, "epoch": 1425} {"train_loss": -41.443660736083984, "global_step": 172532, "epoch": 1425} {"train_loss": -41.33600616455078, "global_step": 172533, "epoch": 1425} {"train_loss": -41.459957122802734, "global_step": 172534, "epoch": 1425} {"train_loss": -40.25505447387695, "global_step": 172535, "epoch": 1425} {"train_loss": -40.49454116821289, "global_step": 172536, "epoch": 1425} {"train_loss": -41.58290100097656, "global_step": 172537, "epoch": 1425} {"train_loss": -41.284786224365234, "global_step": 172538, "epoch": 1425} {"train_loss": -41.136688232421875, "global_step": 172539, "epoch": 1425} {"train_loss": -40.29018783569336, "global_step": 172540, "epoch": 1425} {"train_loss": -40.778079986572266, "global_step": 172541, "epoch": 1425} {"train_loss": -41.72468185424805, "global_step": 172542, "epoch": 1425} {"train_loss": -41.59590530395508, "global_step": 172543, "epoch": 1425} {"train_loss": -40.82231521606445, "global_step": 172544, "epoch": 1425} {"train_loss": -40.41091074037158, "global_step": 172545, "epoch": 1425, "val_loss": 2690519.0} {"train_loss": -41.7806510925293, "global_step": 172546, "epoch": 1426} {"train_loss": -41.682308197021484, "global_step": 172547, "epoch": 1426} {"train_loss": -40.79433822631836, "global_step": 172548, "epoch": 1426} {"train_loss": -40.82006072998047, "global_step": 172549, "epoch": 1426} {"train_loss": -40.720947265625, "global_step": 172550, "epoch": 1426} {"train_loss": -41.05703353881836, "global_step": 172551, "epoch": 1426} {"train_loss": -41.76322555541992, "global_step": 172552, "epoch": 1426} {"train_loss": -40.85956954956055, "global_step": 172553, "epoch": 1426} {"train_loss": -39.76670455932617, "global_step": 172554, "epoch": 1426} {"train_loss": -41.752464294433594, "global_step": 172555, "epoch": 1426} {"train_loss": -41.3192253112793, "global_step": 172556, "epoch": 1426} {"train_loss": -40.668270111083984, "global_step": 172557, "epoch": 1426} {"train_loss": -41.27831268310547, "global_step": 172558, "epoch": 1426} {"train_loss": -41.3937873840332, "global_step": 172559, "epoch": 1426} {"train_loss": -39.753761291503906, "global_step": 172560, "epoch": 1426} {"train_loss": -39.508914947509766, "global_step": 172561, "epoch": 1426} {"train_loss": -40.45246505737305, "global_step": 172562, "epoch": 1426} {"train_loss": -40.697078704833984, "global_step": 172563, "epoch": 1426} {"train_loss": -40.01833724975586, "global_step": 172564, "epoch": 1426} {"train_loss": -39.34603500366211, "global_step": 172565, "epoch": 1426} {"train_loss": -38.56794357299805, "global_step": 172566, "epoch": 1426} {"train_loss": -40.07943344116211, "global_step": 172567, "epoch": 1426} {"train_loss": -40.118690490722656, "global_step": 172568, "epoch": 1426} {"train_loss": -40.062862396240234, "global_step": 172569, "epoch": 1426} {"train_loss": -40.321468353271484, "global_step": 172570, "epoch": 1426} {"train_loss": -40.6288948059082, "global_step": 172571, "epoch": 1426} {"train_loss": -40.78588104248047, "global_step": 172572, "epoch": 1426} {"train_loss": -41.01151657104492, "global_step": 172573, "epoch": 1426} {"train_loss": -40.737361907958984, "global_step": 172574, "epoch": 1426} {"train_loss": -39.841312408447266, "global_step": 172575, "epoch": 1426} {"train_loss": -40.590606689453125, "global_step": 172576, "epoch": 1426} {"train_loss": -39.2909049987793, "global_step": 172577, "epoch": 1426} {"train_loss": -39.060665130615234, "global_step": 172578, "epoch": 1426} {"train_loss": -39.65565490722656, "global_step": 172579, "epoch": 1426} {"train_loss": -39.292476654052734, "global_step": 172580, "epoch": 1426} {"train_loss": -38.08669662475586, "global_step": 172581, "epoch": 1426} {"train_loss": -40.00105667114258, "global_step": 172582, "epoch": 1426} {"train_loss": -37.18778991699219, "global_step": 172583, "epoch": 1426} {"train_loss": -39.49759292602539, "global_step": 172584, "epoch": 1426} {"train_loss": -38.99477767944336, "global_step": 172585, "epoch": 1426} {"train_loss": -38.25122833251953, "global_step": 172586, "epoch": 1426} {"train_loss": -39.661094665527344, "global_step": 172587, "epoch": 1426} {"train_loss": -39.6403694152832, "global_step": 172588, "epoch": 1426} {"train_loss": -40.67946243286133, "global_step": 172589, "epoch": 1426} {"train_loss": -40.24143600463867, "global_step": 172590, "epoch": 1426} {"train_loss": -39.74006271362305, "global_step": 172591, "epoch": 1426} {"train_loss": -40.017940521240234, "global_step": 172592, "epoch": 1426} {"train_loss": -40.58689498901367, "global_step": 172593, "epoch": 1426} {"train_loss": -40.9175910949707, "global_step": 172594, "epoch": 1426} {"train_loss": -40.58707809448242, "global_step": 172595, "epoch": 1426} {"train_loss": -40.688533782958984, "global_step": 172596, "epoch": 1426} {"train_loss": -39.42567443847656, "global_step": 172597, "epoch": 1426} {"train_loss": -39.414031982421875, "global_step": 172598, "epoch": 1426} {"train_loss": -40.14651870727539, "global_step": 172599, "epoch": 1426} {"train_loss": -41.09008026123047, "global_step": 172600, "epoch": 1426} {"train_loss": -40.04923629760742, "global_step": 172601, "epoch": 1426} {"train_loss": -40.65436935424805, "global_step": 172602, "epoch": 1426} {"train_loss": -40.9417839050293, "global_step": 172603, "epoch": 1426} {"train_loss": -41.0417594909668, "global_step": 172604, "epoch": 1426} {"train_loss": -40.76616287231445, "global_step": 172605, "epoch": 1426} {"train_loss": -40.220558166503906, "global_step": 172606, "epoch": 1426} {"train_loss": -40.4833984375, "global_step": 172607, "epoch": 1426} {"train_loss": -40.15531921386719, "global_step": 172608, "epoch": 1426} {"train_loss": -41.010433197021484, "global_step": 172609, "epoch": 1426} {"train_loss": -40.87479782104492, "global_step": 172610, "epoch": 1426} {"train_loss": -40.54976272583008, "global_step": 172611, "epoch": 1426} {"train_loss": -41.28004455566406, "global_step": 172612, "epoch": 1426} {"train_loss": -41.03654098510742, "global_step": 172613, "epoch": 1426} {"train_loss": -41.16865921020508, "global_step": 172614, "epoch": 1426} {"train_loss": -41.20038986206055, "global_step": 172615, "epoch": 1426} {"train_loss": -41.70858383178711, "global_step": 172616, "epoch": 1426} {"train_loss": -41.3047981262207, "global_step": 172617, "epoch": 1426} {"train_loss": -41.338958740234375, "global_step": 172618, "epoch": 1426} {"train_loss": -41.55392074584961, "global_step": 172619, "epoch": 1426} {"train_loss": -41.73105239868164, "global_step": 172620, "epoch": 1426} {"train_loss": -41.371246337890625, "global_step": 172621, "epoch": 1426} {"train_loss": -40.74005126953125, "global_step": 172622, "epoch": 1426} {"train_loss": -41.14707946777344, "global_step": 172623, "epoch": 1426} {"train_loss": -41.680419921875, "global_step": 172624, "epoch": 1426} {"train_loss": -40.98685836791992, "global_step": 172625, "epoch": 1426} {"train_loss": -40.63471221923828, "global_step": 172626, "epoch": 1426} {"train_loss": -41.65790939331055, "global_step": 172627, "epoch": 1426} {"train_loss": -41.788272857666016, "global_step": 172628, "epoch": 1426} {"train_loss": -41.27089309692383, "global_step": 172629, "epoch": 1426} {"train_loss": -41.29472732543945, "global_step": 172630, "epoch": 1426} {"train_loss": -41.748138427734375, "global_step": 172631, "epoch": 1426} {"train_loss": -41.465065002441406, "global_step": 172632, "epoch": 1426} {"train_loss": -41.36323165893555, "global_step": 172633, "epoch": 1426} {"train_loss": -42.01029586791992, "global_step": 172634, "epoch": 1426} {"train_loss": -41.85122299194336, "global_step": 172635, "epoch": 1426} {"train_loss": -41.87422561645508, "global_step": 172636, "epoch": 1426} {"train_loss": -42.04833984375, "global_step": 172637, "epoch": 1426} {"train_loss": -41.42262649536133, "global_step": 172638, "epoch": 1426} {"train_loss": -42.09435272216797, "global_step": 172639, "epoch": 1426} {"train_loss": -39.319942474365234, "global_step": 172640, "epoch": 1426} {"train_loss": -41.34474563598633, "global_step": 172641, "epoch": 1426} {"train_loss": -41.65631866455078, "global_step": 172642, "epoch": 1426} {"train_loss": -41.5186882019043, "global_step": 172643, "epoch": 1426} {"train_loss": -41.049171447753906, "global_step": 172644, "epoch": 1426} {"train_loss": -41.540130615234375, "global_step": 172645, "epoch": 1426} {"train_loss": -41.42031478881836, "global_step": 172646, "epoch": 1426} {"train_loss": -41.665096282958984, "global_step": 172647, "epoch": 1426} {"train_loss": -41.42019271850586, "global_step": 172648, "epoch": 1426} {"train_loss": -41.41096878051758, "global_step": 172649, "epoch": 1426} {"train_loss": -41.64917755126953, "global_step": 172650, "epoch": 1426} {"train_loss": -40.96645736694336, "global_step": 172651, "epoch": 1426} {"train_loss": -41.81842803955078, "global_step": 172652, "epoch": 1426} {"train_loss": -41.400577545166016, "global_step": 172653, "epoch": 1426} {"train_loss": -40.534423828125, "global_step": 172654, "epoch": 1426} {"train_loss": -39.377906799316406, "global_step": 172655, "epoch": 1426} {"train_loss": -40.030086517333984, "global_step": 172656, "epoch": 1426} {"train_loss": -40.16401290893555, "global_step": 172657, "epoch": 1426} {"train_loss": -38.79603958129883, "global_step": 172658, "epoch": 1426} {"train_loss": -39.380401611328125, "global_step": 172659, "epoch": 1426} {"train_loss": -41.199642181396484, "global_step": 172660, "epoch": 1426} {"train_loss": -40.88661193847656, "global_step": 172661, "epoch": 1426} {"train_loss": -38.74941635131836, "global_step": 172662, "epoch": 1426} {"train_loss": -38.10067367553711, "global_step": 172663, "epoch": 1426} {"train_loss": -38.67628479003906, "global_step": 172664, "epoch": 1426} {"train_loss": -39.70952224731445, "global_step": 172665, "epoch": 1426} {"train_loss": -40.55770959144782, "global_step": 172666, "epoch": 1426, "val_loss": 2732134.75} {"train_loss": -34.65315628051758, "global_step": 172667, "epoch": 1427} {"train_loss": -39.89969253540039, "global_step": 172668, "epoch": 1427} {"train_loss": -39.018768310546875, "global_step": 172669, "epoch": 1427} {"train_loss": -35.59712600708008, "global_step": 172670, "epoch": 1427} {"train_loss": -41.010318756103516, "global_step": 172671, "epoch": 1427} {"train_loss": -37.854896545410156, "global_step": 172672, "epoch": 1427} {"train_loss": -35.7928581237793, "global_step": 172673, "epoch": 1427} {"train_loss": -37.170711517333984, "global_step": 172674, "epoch": 1427} {"train_loss": -39.28889465332031, "global_step": 172675, "epoch": 1427} {"train_loss": -36.89306640625, "global_step": 172676, "epoch": 1427} {"train_loss": -39.906089782714844, "global_step": 172677, "epoch": 1427} {"train_loss": -37.89457321166992, "global_step": 172678, "epoch": 1427} {"train_loss": -39.83219528198242, "global_step": 172679, "epoch": 1427} {"train_loss": -38.83332443237305, "global_step": 172680, "epoch": 1427} {"train_loss": -39.811519622802734, "global_step": 172681, "epoch": 1427} {"train_loss": -38.233882904052734, "global_step": 172682, "epoch": 1427} {"train_loss": -40.06433868408203, "global_step": 172683, "epoch": 1427} {"train_loss": -38.34257125854492, "global_step": 172684, "epoch": 1427} {"train_loss": -40.54199981689453, "global_step": 172685, "epoch": 1427} {"train_loss": -38.725215911865234, "global_step": 172686, "epoch": 1427} {"train_loss": -40.52956771850586, "global_step": 172687, "epoch": 1427} {"train_loss": -40.67299270629883, "global_step": 172688, "epoch": 1427} {"train_loss": -40.217193603515625, "global_step": 172689, "epoch": 1427} {"train_loss": -40.90228271484375, "global_step": 172690, "epoch": 1427} {"train_loss": -40.73435592651367, "global_step": 172691, "epoch": 1427} {"train_loss": -41.24367141723633, "global_step": 172692, "epoch": 1427} {"train_loss": -40.26408767700195, "global_step": 172693, "epoch": 1427} {"train_loss": -41.19020080566406, "global_step": 172694, "epoch": 1427} {"train_loss": -40.85783004760742, "global_step": 172695, "epoch": 1427} {"train_loss": -41.72622299194336, "global_step": 172696, "epoch": 1427} {"train_loss": -40.993865966796875, "global_step": 172697, "epoch": 1427} {"train_loss": -41.61066818237305, "global_step": 172698, "epoch": 1427} {"train_loss": -41.252410888671875, "global_step": 172699, "epoch": 1427} {"train_loss": -41.28102493286133, "global_step": 172700, "epoch": 1427} {"train_loss": -41.25678253173828, "global_step": 172701, "epoch": 1427} {"train_loss": -41.3751220703125, "global_step": 172702, "epoch": 1427} {"train_loss": -41.1068000793457, "global_step": 172703, "epoch": 1427} {"train_loss": -41.61293411254883, "global_step": 172704, "epoch": 1427} {"train_loss": -41.59889221191406, "global_step": 172705, "epoch": 1427} {"train_loss": -41.389015197753906, "global_step": 172706, "epoch": 1427} {"train_loss": -41.47334671020508, "global_step": 172707, "epoch": 1427} {"train_loss": -41.391700744628906, "global_step": 172708, "epoch": 1427} {"train_loss": -41.3338623046875, "global_step": 172709, "epoch": 1427} {"train_loss": -41.613189697265625, "global_step": 172710, "epoch": 1427} {"train_loss": -41.816768646240234, "global_step": 172711, "epoch": 1427} {"train_loss": -41.051544189453125, "global_step": 172712, "epoch": 1427} {"train_loss": -41.562469482421875, "global_step": 172713, "epoch": 1427} {"train_loss": -41.745296478271484, "global_step": 172714, "epoch": 1427} {"train_loss": -41.60284423828125, "global_step": 172715, "epoch": 1427} {"train_loss": -42.27558517456055, "global_step": 172716, "epoch": 1427} {"train_loss": -41.37192916870117, "global_step": 172717, "epoch": 1427} {"train_loss": -41.749629974365234, "global_step": 172718, "epoch": 1427} {"train_loss": -41.39008712768555, "global_step": 172719, "epoch": 1427} {"train_loss": -41.65324020385742, "global_step": 172720, "epoch": 1427} {"train_loss": -41.654842376708984, "global_step": 172721, "epoch": 1427} {"train_loss": -41.74895095825195, "global_step": 172722, "epoch": 1427} {"train_loss": -41.658668518066406, "global_step": 172723, "epoch": 1427} {"train_loss": -41.468048095703125, "global_step": 172724, "epoch": 1427} {"train_loss": -41.02165603637695, "global_step": 172725, "epoch": 1427} {"train_loss": -40.54570388793945, "global_step": 172726, "epoch": 1427} {"train_loss": -41.166259765625, "global_step": 172727, "epoch": 1427} {"train_loss": -41.49717712402344, "global_step": 172728, "epoch": 1427} {"train_loss": -41.56648254394531, "global_step": 172729, "epoch": 1427} {"train_loss": -41.72795867919922, "global_step": 172730, "epoch": 1427} {"train_loss": -41.78295135498047, "global_step": 172731, "epoch": 1427} {"train_loss": -41.9160270690918, "global_step": 172732, "epoch": 1427} {"train_loss": -41.67951202392578, "global_step": 172733, "epoch": 1427} {"train_loss": -41.55415725708008, "global_step": 172734, "epoch": 1427} {"train_loss": -41.01858139038086, "global_step": 172735, "epoch": 1427} {"train_loss": -41.745216369628906, "global_step": 172736, "epoch": 1427} {"train_loss": -41.50472640991211, "global_step": 172737, "epoch": 1427} {"train_loss": -41.58294677734375, "global_step": 172738, "epoch": 1427} {"train_loss": -41.42911148071289, "global_step": 172739, "epoch": 1427} {"train_loss": -41.89324951171875, "global_step": 172740, "epoch": 1427} {"train_loss": -41.5304069519043, "global_step": 172741, "epoch": 1427} {"train_loss": -41.42909622192383, "global_step": 172742, "epoch": 1427} {"train_loss": -41.57859802246094, "global_step": 172743, "epoch": 1427} {"train_loss": -41.915462493896484, "global_step": 172744, "epoch": 1427} {"train_loss": -39.633853912353516, "global_step": 172745, "epoch": 1427} {"train_loss": -37.753326416015625, "global_step": 172746, "epoch": 1427} {"train_loss": -38.12269592285156, "global_step": 172747, "epoch": 1427} {"train_loss": -40.386741638183594, "global_step": 172748, "epoch": 1427} {"train_loss": -37.58000946044922, "global_step": 172749, "epoch": 1427} {"train_loss": -39.22932815551758, "global_step": 172750, "epoch": 1427} {"train_loss": -37.706581115722656, "global_step": 172751, "epoch": 1427} {"train_loss": -37.85292434692383, "global_step": 172752, "epoch": 1427} {"train_loss": -40.02302169799805, "global_step": 172753, "epoch": 1427} {"train_loss": -39.9566535949707, "global_step": 172754, "epoch": 1427} {"train_loss": -37.205448150634766, "global_step": 172755, "epoch": 1427} {"train_loss": -40.01313018798828, "global_step": 172756, "epoch": 1427} {"train_loss": -35.90523910522461, "global_step": 172757, "epoch": 1427} {"train_loss": -37.09202194213867, "global_step": 172758, "epoch": 1427} {"train_loss": -38.4793815612793, "global_step": 172759, "epoch": 1427} {"train_loss": -37.06464767456055, "global_step": 172760, "epoch": 1427} {"train_loss": -38.498207092285156, "global_step": 172761, "epoch": 1427} {"train_loss": -38.808502197265625, "global_step": 172762, "epoch": 1427} {"train_loss": -36.442718505859375, "global_step": 172763, "epoch": 1427} {"train_loss": -39.47068405151367, "global_step": 172764, "epoch": 1427} {"train_loss": -39.77986526489258, "global_step": 172765, "epoch": 1427} {"train_loss": -39.098079681396484, "global_step": 172766, "epoch": 1427} {"train_loss": -39.09848403930664, "global_step": 172767, "epoch": 1427} {"train_loss": -39.921730041503906, "global_step": 172768, "epoch": 1427} {"train_loss": -40.3045654296875, "global_step": 172769, "epoch": 1427} {"train_loss": -40.22880172729492, "global_step": 172770, "epoch": 1427} {"train_loss": -40.405242919921875, "global_step": 172771, "epoch": 1427} {"train_loss": -40.39744186401367, "global_step": 172772, "epoch": 1427} {"train_loss": -40.765846252441406, "global_step": 172773, "epoch": 1427} {"train_loss": -40.5455322265625, "global_step": 172774, "epoch": 1427} {"train_loss": -40.59066390991211, "global_step": 172775, "epoch": 1427} {"train_loss": -40.20835494995117, "global_step": 172776, "epoch": 1427} {"train_loss": -40.89080810546875, "global_step": 172777, "epoch": 1427} {"train_loss": -41.00344467163086, "global_step": 172778, "epoch": 1427} {"train_loss": -40.35093688964844, "global_step": 172779, "epoch": 1427} {"train_loss": -41.21940994262695, "global_step": 172780, "epoch": 1427} {"train_loss": -41.139034271240234, "global_step": 172781, "epoch": 1427} {"train_loss": -40.824337005615234, "global_step": 172782, "epoch": 1427} {"train_loss": -41.4350700378418, "global_step": 172783, "epoch": 1427} {"train_loss": -41.531166076660156, "global_step": 172784, "epoch": 1427} {"train_loss": -41.375152587890625, "global_step": 172785, "epoch": 1427} {"train_loss": -41.6649169921875, "global_step": 172786, "epoch": 1427} {"train_loss": -40.257218289966424, "global_step": 172787, "epoch": 1427, "val_loss": 2741204.0} {"train_loss": -41.53343963623047, "global_step": 172788, "epoch": 1428} {"train_loss": -41.152748107910156, "global_step": 172789, "epoch": 1428} {"train_loss": -41.744747161865234, "global_step": 172790, "epoch": 1428} {"train_loss": -41.766456604003906, "global_step": 172791, "epoch": 1428} {"train_loss": -41.66877365112305, "global_step": 172792, "epoch": 1428} {"train_loss": -40.9701042175293, "global_step": 172793, "epoch": 1428} {"train_loss": -41.74345016479492, "global_step": 172794, "epoch": 1428} {"train_loss": -41.32465744018555, "global_step": 172795, "epoch": 1428} {"train_loss": -41.16719436645508, "global_step": 172796, "epoch": 1428} {"train_loss": -41.77442169189453, "global_step": 172797, "epoch": 1428} {"train_loss": -42.02401351928711, "global_step": 172798, "epoch": 1428} {"train_loss": -41.78971481323242, "global_step": 172799, "epoch": 1428} {"train_loss": -41.86468505859375, "global_step": 172800, "epoch": 1428} {"train_loss": -42.00482940673828, "global_step": 172801, "epoch": 1428} {"train_loss": -42.297752380371094, "global_step": 172802, "epoch": 1428} {"train_loss": -42.095027923583984, "global_step": 172803, "epoch": 1428} {"train_loss": -41.71978759765625, "global_step": 172804, "epoch": 1428} {"train_loss": -42.052734375, "global_step": 172805, "epoch": 1428} {"train_loss": -41.563289642333984, "global_step": 172806, "epoch": 1428} {"train_loss": -42.1467399597168, "global_step": 172807, "epoch": 1428} {"train_loss": -41.842689514160156, "global_step": 172808, "epoch": 1428} {"train_loss": -41.74741744995117, "global_step": 172809, "epoch": 1428} {"train_loss": -42.22198486328125, "global_step": 172810, "epoch": 1428} {"train_loss": -41.867679595947266, "global_step": 172811, "epoch": 1428} {"train_loss": -41.42686080932617, "global_step": 172812, "epoch": 1428} {"train_loss": -41.8596305847168, "global_step": 172813, "epoch": 1428} {"train_loss": -42.00004196166992, "global_step": 172814, "epoch": 1428} {"train_loss": -41.94712448120117, "global_step": 172815, "epoch": 1428} {"train_loss": -42.52061080932617, "global_step": 172816, "epoch": 1428} {"train_loss": -41.66435623168945, "global_step": 172817, "epoch": 1428} {"train_loss": -42.5324821472168, "global_step": 172818, "epoch": 1428} {"train_loss": -42.25666427612305, "global_step": 172819, "epoch": 1428} {"train_loss": -41.98844909667969, "global_step": 172820, "epoch": 1428} {"train_loss": -42.22047805786133, "global_step": 172821, "epoch": 1428} {"train_loss": -42.15195846557617, "global_step": 172822, "epoch": 1428} {"train_loss": -42.01819610595703, "global_step": 172823, "epoch": 1428} {"train_loss": -42.43842697143555, "global_step": 172824, "epoch": 1428} {"train_loss": -42.655921936035156, "global_step": 172825, "epoch": 1428} {"train_loss": -42.56305694580078, "global_step": 172826, "epoch": 1428} {"train_loss": -42.674476623535156, "global_step": 172827, "epoch": 1428} {"train_loss": -42.09809875488281, "global_step": 172828, "epoch": 1428} {"train_loss": -41.30189514160156, "global_step": 172829, "epoch": 1428} {"train_loss": -40.00808334350586, "global_step": 172830, "epoch": 1428} {"train_loss": -38.442474365234375, "global_step": 172831, "epoch": 1428} {"train_loss": -36.50132369995117, "global_step": 172832, "epoch": 1428} {"train_loss": -38.92204284667969, "global_step": 172833, "epoch": 1428} {"train_loss": -41.66008377075195, "global_step": 172834, "epoch": 1428} {"train_loss": -41.9896354675293, "global_step": 172835, "epoch": 1428} {"train_loss": -41.139503479003906, "global_step": 172836, "epoch": 1428} {"train_loss": -40.8695068359375, "global_step": 172837, "epoch": 1428} {"train_loss": -40.17682647705078, "global_step": 172838, "epoch": 1428} {"train_loss": -40.93647384643555, "global_step": 172839, "epoch": 1428} {"train_loss": -40.68194580078125, "global_step": 172840, "epoch": 1428} {"train_loss": -39.327980041503906, "global_step": 172841, "epoch": 1428} {"train_loss": -39.021705627441406, "global_step": 172842, "epoch": 1428} {"train_loss": -40.26363754272461, "global_step": 172843, "epoch": 1428} {"train_loss": -40.67854690551758, "global_step": 172844, "epoch": 1428} {"train_loss": -40.237159729003906, "global_step": 172845, "epoch": 1428} {"train_loss": -39.61567306518555, "global_step": 172846, "epoch": 1428} {"train_loss": -39.058956146240234, "global_step": 172847, "epoch": 1428} {"train_loss": -39.05164337158203, "global_step": 172848, "epoch": 1428} {"train_loss": -40.642086029052734, "global_step": 172849, "epoch": 1428} {"train_loss": -40.877864837646484, "global_step": 172850, "epoch": 1428} {"train_loss": -39.283477783203125, "global_step": 172851, "epoch": 1428} {"train_loss": -40.78672409057617, "global_step": 172852, "epoch": 1428} {"train_loss": -41.38801193237305, "global_step": 172853, "epoch": 1428} {"train_loss": -39.334747314453125, "global_step": 172854, "epoch": 1428} {"train_loss": -39.8134765625, "global_step": 172855, "epoch": 1428} {"train_loss": -41.47807693481445, "global_step": 172856, "epoch": 1428} {"train_loss": -40.828311920166016, "global_step": 172857, "epoch": 1428} {"train_loss": -40.97746658325195, "global_step": 172858, "epoch": 1428} {"train_loss": -41.388031005859375, "global_step": 172859, "epoch": 1428} {"train_loss": -41.20591354370117, "global_step": 172860, "epoch": 1428} {"train_loss": -41.15583419799805, "global_step": 172861, "epoch": 1428} {"train_loss": -41.41276168823242, "global_step": 172862, "epoch": 1428} {"train_loss": -41.735408782958984, "global_step": 172863, "epoch": 1428} {"train_loss": -41.58372116088867, "global_step": 172864, "epoch": 1428} {"train_loss": -41.751319885253906, "global_step": 172865, "epoch": 1428} {"train_loss": -41.65435791015625, "global_step": 172866, "epoch": 1428} {"train_loss": -41.17307662963867, "global_step": 172867, "epoch": 1428} {"train_loss": -41.72788619995117, "global_step": 172868, "epoch": 1428} {"train_loss": -41.63543701171875, "global_step": 172869, "epoch": 1428} {"train_loss": -41.3212776184082, "global_step": 172870, "epoch": 1428} {"train_loss": -40.64052200317383, "global_step": 172871, "epoch": 1428} {"train_loss": -38.786529541015625, "global_step": 172872, "epoch": 1428} {"train_loss": -38.99916458129883, "global_step": 172873, "epoch": 1428} {"train_loss": -41.03782653808594, "global_step": 172874, "epoch": 1428} {"train_loss": -40.70677185058594, "global_step": 172875, "epoch": 1428} {"train_loss": -39.64399337768555, "global_step": 172876, "epoch": 1428} {"train_loss": -39.4678955078125, "global_step": 172877, "epoch": 1428} {"train_loss": -40.00593948364258, "global_step": 172878, "epoch": 1428} {"train_loss": -40.015377044677734, "global_step": 172879, "epoch": 1428} {"train_loss": -39.94322204589844, "global_step": 172880, "epoch": 1428} {"train_loss": -40.974666595458984, "global_step": 172881, "epoch": 1428} {"train_loss": -40.64964294433594, "global_step": 172882, "epoch": 1428} {"train_loss": -40.90281295776367, "global_step": 172883, "epoch": 1428} {"train_loss": -39.87374496459961, "global_step": 172884, "epoch": 1428} {"train_loss": -40.4140510559082, "global_step": 172885, "epoch": 1428} {"train_loss": -41.088802337646484, "global_step": 172886, "epoch": 1428} {"train_loss": -41.25779342651367, "global_step": 172887, "epoch": 1428} {"train_loss": -40.985679626464844, "global_step": 172888, "epoch": 1428} {"train_loss": -40.94130325317383, "global_step": 172889, "epoch": 1428} {"train_loss": -40.0187873840332, "global_step": 172890, "epoch": 1428} {"train_loss": -42.05399703979492, "global_step": 172891, "epoch": 1428} {"train_loss": -40.7523193359375, "global_step": 172892, "epoch": 1428} {"train_loss": -41.42618942260742, "global_step": 172893, "epoch": 1428} {"train_loss": -41.69733428955078, "global_step": 172894, "epoch": 1428} {"train_loss": -40.3700065612793, "global_step": 172895, "epoch": 1428} {"train_loss": -41.871009826660156, "global_step": 172896, "epoch": 1428} {"train_loss": -40.48331069946289, "global_step": 172897, "epoch": 1428} {"train_loss": -41.86294937133789, "global_step": 172898, "epoch": 1428} {"train_loss": -41.07404708862305, "global_step": 172899, "epoch": 1428} {"train_loss": -41.64924240112305, "global_step": 172900, "epoch": 1428} {"train_loss": -42.067501068115234, "global_step": 172901, "epoch": 1428} {"train_loss": -41.77771759033203, "global_step": 172902, "epoch": 1428} {"train_loss": -41.711666107177734, "global_step": 172903, "epoch": 1428} {"train_loss": -41.39888000488281, "global_step": 172904, "epoch": 1428} {"train_loss": -41.88002395629883, "global_step": 172905, "epoch": 1428} {"train_loss": -41.600181579589844, "global_step": 172906, "epoch": 1428} {"train_loss": -41.748069763183594, "global_step": 172907, "epoch": 1428} {"train_loss": -41.12099349597269, "global_step": 172908, "epoch": 1428, "val_loss": 2734776.25} {"train_loss": -41.595088958740234, "global_step": 172909, "epoch": 1429} {"train_loss": -42.02334213256836, "global_step": 172910, "epoch": 1429} {"train_loss": -42.24001693725586, "global_step": 172911, "epoch": 1429} {"train_loss": -42.426979064941406, "global_step": 172912, "epoch": 1429} {"train_loss": -41.929054260253906, "global_step": 172913, "epoch": 1429} {"train_loss": -41.67580795288086, "global_step": 172914, "epoch": 1429} {"train_loss": -42.61164855957031, "global_step": 172915, "epoch": 1429} {"train_loss": -41.57299041748047, "global_step": 172916, "epoch": 1429} {"train_loss": -41.96458053588867, "global_step": 172917, "epoch": 1429} {"train_loss": -42.075828552246094, "global_step": 172918, "epoch": 1429} {"train_loss": -41.750144958496094, "global_step": 172919, "epoch": 1429} {"train_loss": -41.41312789916992, "global_step": 172920, "epoch": 1429} {"train_loss": -41.2519416809082, "global_step": 172921, "epoch": 1429} {"train_loss": -41.950538635253906, "global_step": 172922, "epoch": 1429} {"train_loss": -42.43988800048828, "global_step": 172923, "epoch": 1429} {"train_loss": -41.92892074584961, "global_step": 172924, "epoch": 1429} {"train_loss": -42.27665710449219, "global_step": 172925, "epoch": 1429} {"train_loss": -42.33499526977539, "global_step": 172926, "epoch": 1429} {"train_loss": -42.14176559448242, "global_step": 172927, "epoch": 1429} {"train_loss": -41.61775588989258, "global_step": 172928, "epoch": 1429} {"train_loss": -41.57664108276367, "global_step": 172929, "epoch": 1429} {"train_loss": -42.54392623901367, "global_step": 172930, "epoch": 1429} {"train_loss": -41.39485168457031, "global_step": 172931, "epoch": 1429} {"train_loss": -40.15122604370117, "global_step": 172932, "epoch": 1429} {"train_loss": -39.94882583618164, "global_step": 172933, "epoch": 1429} {"train_loss": -41.61394119262695, "global_step": 172934, "epoch": 1429} {"train_loss": -42.16677474975586, "global_step": 172935, "epoch": 1429} {"train_loss": -40.562286376953125, "global_step": 172936, "epoch": 1429} {"train_loss": -39.67158508300781, "global_step": 172937, "epoch": 1429} {"train_loss": -40.05255126953125, "global_step": 172938, "epoch": 1429} {"train_loss": -41.87964630126953, "global_step": 172939, "epoch": 1429} {"train_loss": -39.591705322265625, "global_step": 172940, "epoch": 1429} {"train_loss": -39.68864822387695, "global_step": 172941, "epoch": 1429} {"train_loss": -40.911407470703125, "global_step": 172942, "epoch": 1429} {"train_loss": -39.785491943359375, "global_step": 172943, "epoch": 1429} {"train_loss": -39.5770263671875, "global_step": 172944, "epoch": 1429} {"train_loss": -39.885894775390625, "global_step": 172945, "epoch": 1429} {"train_loss": -40.27253341674805, "global_step": 172946, "epoch": 1429} {"train_loss": -41.02022933959961, "global_step": 172947, "epoch": 1429} {"train_loss": -39.52734375, "global_step": 172948, "epoch": 1429} {"train_loss": -41.106807708740234, "global_step": 172949, "epoch": 1429} {"train_loss": -41.360713958740234, "global_step": 172950, "epoch": 1429} {"train_loss": -40.530670166015625, "global_step": 172951, "epoch": 1429} {"train_loss": -41.150211334228516, "global_step": 172952, "epoch": 1429} {"train_loss": -41.16132354736328, "global_step": 172953, "epoch": 1429} {"train_loss": -41.09406661987305, "global_step": 172954, "epoch": 1429} {"train_loss": -41.852813720703125, "global_step": 172955, "epoch": 1429} {"train_loss": -40.99357986450195, "global_step": 172956, "epoch": 1429} {"train_loss": -40.078861236572266, "global_step": 172957, "epoch": 1429} {"train_loss": -40.4986572265625, "global_step": 172958, "epoch": 1429} {"train_loss": -41.97901153564453, "global_step": 172959, "epoch": 1429} {"train_loss": -40.880184173583984, "global_step": 172960, "epoch": 1429} {"train_loss": -39.45786666870117, "global_step": 172961, "epoch": 1429} {"train_loss": -39.50917434692383, "global_step": 172962, "epoch": 1429} {"train_loss": -39.313270568847656, "global_step": 172963, "epoch": 1429} {"train_loss": -38.005184173583984, "global_step": 172964, "epoch": 1429} {"train_loss": -41.26428985595703, "global_step": 172965, "epoch": 1429} {"train_loss": -40.75691604614258, "global_step": 172966, "epoch": 1429} {"train_loss": -40.2713737487793, "global_step": 172967, "epoch": 1429} {"train_loss": -40.02419662475586, "global_step": 172968, "epoch": 1429} {"train_loss": -40.974918365478516, "global_step": 172969, "epoch": 1429} {"train_loss": -38.82120895385742, "global_step": 172970, "epoch": 1429} {"train_loss": -38.23264694213867, "global_step": 172971, "epoch": 1429} {"train_loss": -38.673316955566406, "global_step": 172972, "epoch": 1429} {"train_loss": -39.44316482543945, "global_step": 172973, "epoch": 1429} {"train_loss": -39.702247619628906, "global_step": 172974, "epoch": 1429} {"train_loss": -38.04460144042969, "global_step": 172975, "epoch": 1429} {"train_loss": -38.267906188964844, "global_step": 172976, "epoch": 1429} {"train_loss": -39.73664093017578, "global_step": 172977, "epoch": 1429} {"train_loss": -38.12339401245117, "global_step": 172978, "epoch": 1429} {"train_loss": -36.87818908691406, "global_step": 172979, "epoch": 1429} {"train_loss": -39.67930221557617, "global_step": 172980, "epoch": 1429} {"train_loss": -39.598323822021484, "global_step": 172981, "epoch": 1429} {"train_loss": -39.212013244628906, "global_step": 172982, "epoch": 1429} {"train_loss": -38.46943664550781, "global_step": 172983, "epoch": 1429} {"train_loss": -39.739871978759766, "global_step": 172984, "epoch": 1429} {"train_loss": -40.505462646484375, "global_step": 172985, "epoch": 1429} {"train_loss": -39.335811614990234, "global_step": 172986, "epoch": 1429} {"train_loss": -40.247344970703125, "global_step": 172987, "epoch": 1429} {"train_loss": -41.07587814331055, "global_step": 172988, "epoch": 1429} {"train_loss": -40.431148529052734, "global_step": 172989, "epoch": 1429} {"train_loss": -40.942806243896484, "global_step": 172990, "epoch": 1429} {"train_loss": -40.30765914916992, "global_step": 172991, "epoch": 1429} {"train_loss": -40.65871047973633, "global_step": 172992, "epoch": 1429} {"train_loss": -40.786312103271484, "global_step": 172993, "epoch": 1429} {"train_loss": -40.902191162109375, "global_step": 172994, "epoch": 1429} {"train_loss": -41.7507438659668, "global_step": 172995, "epoch": 1429} {"train_loss": -40.86528778076172, "global_step": 172996, "epoch": 1429} {"train_loss": -41.278724670410156, "global_step": 172997, "epoch": 1429} {"train_loss": -41.039215087890625, "global_step": 172998, "epoch": 1429} {"train_loss": -41.07389450073242, "global_step": 172999, "epoch": 1429} {"train_loss": -41.52410125732422, "global_step": 173000, "epoch": 1429} {"train_loss": -40.657588958740234, "global_step": 173001, "epoch": 1429} {"train_loss": -41.72080612182617, "global_step": 173002, "epoch": 1429} {"train_loss": -41.45655059814453, "global_step": 173003, "epoch": 1429} {"train_loss": -41.55117416381836, "global_step": 173004, "epoch": 1429} {"train_loss": -41.3664436340332, "global_step": 173005, "epoch": 1429} {"train_loss": -41.30533981323242, "global_step": 173006, "epoch": 1429} {"train_loss": -41.27480697631836, "global_step": 173007, "epoch": 1429} {"train_loss": -41.34843444824219, "global_step": 173008, "epoch": 1429} {"train_loss": -41.44234848022461, "global_step": 173009, "epoch": 1429} {"train_loss": -41.12592315673828, "global_step": 173010, "epoch": 1429} {"train_loss": -41.17817306518555, "global_step": 173011, "epoch": 1429} {"train_loss": -42.14231491088867, "global_step": 173012, "epoch": 1429} {"train_loss": -41.296566009521484, "global_step": 173013, "epoch": 1429} {"train_loss": -42.0313835144043, "global_step": 173014, "epoch": 1429} {"train_loss": -41.572628021240234, "global_step": 173015, "epoch": 1429} {"train_loss": -41.66807174682617, "global_step": 173016, "epoch": 1429} {"train_loss": -41.77849197387695, "global_step": 173017, "epoch": 1429} {"train_loss": -42.28609085083008, "global_step": 173018, "epoch": 1429} {"train_loss": -41.637813568115234, "global_step": 173019, "epoch": 1429} {"train_loss": -41.704280853271484, "global_step": 173020, "epoch": 1429} {"train_loss": -41.935848236083984, "global_step": 173021, "epoch": 1429} {"train_loss": -42.236270904541016, "global_step": 173022, "epoch": 1429} {"train_loss": -42.07444381713867, "global_step": 173023, "epoch": 1429} {"train_loss": -42.332401275634766, "global_step": 173024, "epoch": 1429} {"train_loss": -42.29843521118164, "global_step": 173025, "epoch": 1429} {"train_loss": -42.270240783691406, "global_step": 173026, "epoch": 1429} {"train_loss": -42.305938720703125, "global_step": 173027, "epoch": 1429} {"train_loss": -42.132957458496094, "global_step": 173028, "epoch": 1429} {"train_loss": -40.90546158719654, "global_step": 173029, "epoch": 1429, "val_loss": 2649164.75} {"train_loss": -42.28096389770508, "global_step": 173030, "epoch": 1430} {"train_loss": -42.22153854370117, "global_step": 173031, "epoch": 1430} {"train_loss": -42.65520095825195, "global_step": 173032, "epoch": 1430} {"train_loss": -41.74959945678711, "global_step": 173033, "epoch": 1430} {"train_loss": -42.07028579711914, "global_step": 173034, "epoch": 1430} {"train_loss": -42.407501220703125, "global_step": 173035, "epoch": 1430} {"train_loss": -42.0880241394043, "global_step": 173036, "epoch": 1430} {"train_loss": -42.41093063354492, "global_step": 173037, "epoch": 1430} {"train_loss": -41.680084228515625, "global_step": 173038, "epoch": 1430} {"train_loss": -42.26137924194336, "global_step": 173039, "epoch": 1430} {"train_loss": -42.177154541015625, "global_step": 173040, "epoch": 1430} {"train_loss": -41.2270622253418, "global_step": 173041, "epoch": 1430} {"train_loss": -41.94221115112305, "global_step": 173042, "epoch": 1430} {"train_loss": -40.46898651123047, "global_step": 173043, "epoch": 1430} {"train_loss": -39.86184310913086, "global_step": 173044, "epoch": 1430} {"train_loss": -40.648921966552734, "global_step": 173045, "epoch": 1430} {"train_loss": -39.88611602783203, "global_step": 173046, "epoch": 1430} {"train_loss": -41.34122848510742, "global_step": 173047, "epoch": 1430} {"train_loss": -42.28987503051758, "global_step": 173048, "epoch": 1430} {"train_loss": -41.307891845703125, "global_step": 173049, "epoch": 1430} {"train_loss": -40.701263427734375, "global_step": 173050, "epoch": 1430} {"train_loss": -42.09254455566406, "global_step": 173051, "epoch": 1430} {"train_loss": -39.416229248046875, "global_step": 173052, "epoch": 1430} {"train_loss": -39.9395751953125, "global_step": 173053, "epoch": 1430} {"train_loss": -40.29658126831055, "global_step": 173054, "epoch": 1430} {"train_loss": -38.00366973876953, "global_step": 173055, "epoch": 1430} {"train_loss": -39.98540115356445, "global_step": 173056, "epoch": 1430} {"train_loss": -34.61820602416992, "global_step": 173057, "epoch": 1430} {"train_loss": -35.99918746948242, "global_step": 173058, "epoch": 1430} {"train_loss": -36.66459274291992, "global_step": 173059, "epoch": 1430} {"train_loss": -37.8568115234375, "global_step": 173060, "epoch": 1430} {"train_loss": -36.7461051940918, "global_step": 173061, "epoch": 1430} {"train_loss": -37.04598617553711, "global_step": 173062, "epoch": 1430} {"train_loss": -37.873680114746094, "global_step": 173063, "epoch": 1430} {"train_loss": -36.2338981628418, "global_step": 173064, "epoch": 1430} {"train_loss": -37.990718841552734, "global_step": 173065, "epoch": 1430} {"train_loss": -40.07388687133789, "global_step": 173066, "epoch": 1430} {"train_loss": -39.2184944152832, "global_step": 173067, "epoch": 1430} {"train_loss": -38.61355209350586, "global_step": 173068, "epoch": 1430} {"train_loss": -38.990943908691406, "global_step": 173069, "epoch": 1430} {"train_loss": -40.23904800415039, "global_step": 173070, "epoch": 1430} {"train_loss": -40.23208999633789, "global_step": 173071, "epoch": 1430} {"train_loss": -38.7077522277832, "global_step": 173072, "epoch": 1430} {"train_loss": -41.405879974365234, "global_step": 173073, "epoch": 1430} {"train_loss": -39.871604919433594, "global_step": 173074, "epoch": 1430} {"train_loss": -39.29792022705078, "global_step": 173075, "epoch": 1430} {"train_loss": -39.38114929199219, "global_step": 173076, "epoch": 1430} {"train_loss": -40.974666595458984, "global_step": 173077, "epoch": 1430} {"train_loss": -39.8554801940918, "global_step": 173078, "epoch": 1430} {"train_loss": -39.22882080078125, "global_step": 173079, "epoch": 1430} {"train_loss": -40.64976119995117, "global_step": 173080, "epoch": 1430} {"train_loss": -40.70769119262695, "global_step": 173081, "epoch": 1430} {"train_loss": -40.534114837646484, "global_step": 173082, "epoch": 1430} {"train_loss": -41.33356857299805, "global_step": 173083, "epoch": 1430} {"train_loss": -40.22092819213867, "global_step": 173084, "epoch": 1430} {"train_loss": -39.87706756591797, "global_step": 173085, "epoch": 1430} {"train_loss": -41.9515380859375, "global_step": 173086, "epoch": 1430} {"train_loss": -40.064754486083984, "global_step": 173087, "epoch": 1430} {"train_loss": -40.062618255615234, "global_step": 173088, "epoch": 1430} {"train_loss": -41.23040771484375, "global_step": 173089, "epoch": 1430} {"train_loss": -39.77114486694336, "global_step": 173090, "epoch": 1430} {"train_loss": -41.38512420654297, "global_step": 173091, "epoch": 1430} {"train_loss": -40.87665939331055, "global_step": 173092, "epoch": 1430} {"train_loss": -40.573822021484375, "global_step": 173093, "epoch": 1430} {"train_loss": -41.31555938720703, "global_step": 173094, "epoch": 1430} {"train_loss": -40.941078186035156, "global_step": 173095, "epoch": 1430} {"train_loss": -41.454689025878906, "global_step": 173096, "epoch": 1430} {"train_loss": -41.8609733581543, "global_step": 173097, "epoch": 1430} {"train_loss": -41.407161712646484, "global_step": 173098, "epoch": 1430} {"train_loss": -41.843597412109375, "global_step": 173099, "epoch": 1430} {"train_loss": -41.7545051574707, "global_step": 173100, "epoch": 1430} {"train_loss": -41.099300384521484, "global_step": 173101, "epoch": 1430} {"train_loss": -41.886924743652344, "global_step": 173102, "epoch": 1430} {"train_loss": -41.97081756591797, "global_step": 173103, "epoch": 1430} {"train_loss": -41.833763122558594, "global_step": 173104, "epoch": 1430} {"train_loss": -42.21992874145508, "global_step": 173105, "epoch": 1430} {"train_loss": -41.519046783447266, "global_step": 173106, "epoch": 1430} {"train_loss": -41.76933670043945, "global_step": 173107, "epoch": 1430} {"train_loss": -41.829097747802734, "global_step": 173108, "epoch": 1430} {"train_loss": -42.15597152709961, "global_step": 173109, "epoch": 1430} {"train_loss": -42.31370162963867, "global_step": 173110, "epoch": 1430} {"train_loss": -42.17087936401367, "global_step": 173111, "epoch": 1430} {"train_loss": -41.743587493896484, "global_step": 173112, "epoch": 1430} {"train_loss": -42.47453308105469, "global_step": 173113, "epoch": 1430} {"train_loss": -42.49257278442383, "global_step": 173114, "epoch": 1430} {"train_loss": -42.59593200683594, "global_step": 173115, "epoch": 1430} {"train_loss": -42.275787353515625, "global_step": 173116, "epoch": 1430} {"train_loss": -42.542049407958984, "global_step": 173117, "epoch": 1430} {"train_loss": -42.02546691894531, "global_step": 173118, "epoch": 1430} {"train_loss": -42.28812789916992, "global_step": 173119, "epoch": 1430} {"train_loss": -42.269195556640625, "global_step": 173120, "epoch": 1430} {"train_loss": -41.98517608642578, "global_step": 173121, "epoch": 1430} {"train_loss": -41.14048385620117, "global_step": 173122, "epoch": 1430} {"train_loss": -42.063602447509766, "global_step": 173123, "epoch": 1430} {"train_loss": -41.80280685424805, "global_step": 173124, "epoch": 1430} {"train_loss": -41.9373664855957, "global_step": 173125, "epoch": 1430} {"train_loss": -42.41865921020508, "global_step": 173126, "epoch": 1430} {"train_loss": -42.66453170776367, "global_step": 173127, "epoch": 1430} {"train_loss": -41.94314956665039, "global_step": 173128, "epoch": 1430} {"train_loss": -41.736961364746094, "global_step": 173129, "epoch": 1430} {"train_loss": -41.64176559448242, "global_step": 173130, "epoch": 1430} {"train_loss": -42.62895584106445, "global_step": 173131, "epoch": 1430} {"train_loss": -40.08637619018555, "global_step": 173132, "epoch": 1430} {"train_loss": -39.43367385864258, "global_step": 173133, "epoch": 1430} {"train_loss": -40.2130012512207, "global_step": 173134, "epoch": 1430} {"train_loss": -41.623939514160156, "global_step": 173135, "epoch": 1430} {"train_loss": -41.13218688964844, "global_step": 173136, "epoch": 1430} {"train_loss": -39.58770751953125, "global_step": 173137, "epoch": 1430} {"train_loss": -42.2704963684082, "global_step": 173138, "epoch": 1430} {"train_loss": -40.509796142578125, "global_step": 173139, "epoch": 1430} {"train_loss": -39.418548583984375, "global_step": 173140, "epoch": 1430} {"train_loss": -41.196861267089844, "global_step": 173141, "epoch": 1430} {"train_loss": -41.14455795288086, "global_step": 173142, "epoch": 1430} {"train_loss": -40.61393356323242, "global_step": 173143, "epoch": 1430} {"train_loss": -41.388790130615234, "global_step": 173144, "epoch": 1430} {"train_loss": -41.867305755615234, "global_step": 173145, "epoch": 1430} {"train_loss": -40.236873626708984, "global_step": 173146, "epoch": 1430} {"train_loss": -41.725826263427734, "global_step": 173147, "epoch": 1430} {"train_loss": -41.314571380615234, "global_step": 173148, "epoch": 1430} {"train_loss": -41.35083770751953, "global_step": 173149, "epoch": 1430} {"train_loss": -40.829789878908265, "global_step": 173150, "epoch": 1430, "val_loss": 2784042.0} {"train_loss": -41.6906623840332, "global_step": 173151, "epoch": 1431} {"train_loss": -41.742218017578125, "global_step": 173152, "epoch": 1431} {"train_loss": -41.344852447509766, "global_step": 173153, "epoch": 1431} {"train_loss": -41.35993194580078, "global_step": 173154, "epoch": 1431} {"train_loss": -40.577754974365234, "global_step": 173155, "epoch": 1431} {"train_loss": -41.11063766479492, "global_step": 173156, "epoch": 1431} {"train_loss": -41.806758880615234, "global_step": 173157, "epoch": 1431} {"train_loss": -42.72695541381836, "global_step": 173158, "epoch": 1431} {"train_loss": -40.5128288269043, "global_step": 173159, "epoch": 1431} {"train_loss": -34.353858947753906, "global_step": 173160, "epoch": 1431} {"train_loss": -30.989477157592773, "global_step": 173161, "epoch": 1431} {"train_loss": -33.71979522705078, "global_step": 173162, "epoch": 1431} {"train_loss": -41.369300842285156, "global_step": 173163, "epoch": 1431} {"train_loss": -36.455352783203125, "global_step": 173164, "epoch": 1431} {"train_loss": -36.563270568847656, "global_step": 173165, "epoch": 1431} {"train_loss": -38.59018325805664, "global_step": 173166, "epoch": 1431} {"train_loss": -36.96760940551758, "global_step": 173167, "epoch": 1431} {"train_loss": -41.385108947753906, "global_step": 173168, "epoch": 1431} {"train_loss": -38.57633972167969, "global_step": 173169, "epoch": 1431} {"train_loss": -41.390594482421875, "global_step": 173170, "epoch": 1431} {"train_loss": -38.96523666381836, "global_step": 173171, "epoch": 1431} {"train_loss": -40.20769500732422, "global_step": 173172, "epoch": 1431} {"train_loss": -39.88314437866211, "global_step": 173173, "epoch": 1431} {"train_loss": -40.85566711425781, "global_step": 173174, "epoch": 1431} {"train_loss": -36.948909759521484, "global_step": 173175, "epoch": 1431} {"train_loss": -40.79143142700195, "global_step": 173176, "epoch": 1431} {"train_loss": -39.588844299316406, "global_step": 173177, "epoch": 1431} {"train_loss": -40.68589401245117, "global_step": 173178, "epoch": 1431} {"train_loss": -38.04642868041992, "global_step": 173179, "epoch": 1431} {"train_loss": -39.74492263793945, "global_step": 173180, "epoch": 1431} {"train_loss": -40.4327392578125, "global_step": 173181, "epoch": 1431} {"train_loss": -40.60756301879883, "global_step": 173182, "epoch": 1431} {"train_loss": -40.091007232666016, "global_step": 173183, "epoch": 1431} {"train_loss": -41.030574798583984, "global_step": 173184, "epoch": 1431} {"train_loss": -41.50617599487305, "global_step": 173185, "epoch": 1431} {"train_loss": -41.0771369934082, "global_step": 173186, "epoch": 1431} {"train_loss": -37.98374557495117, "global_step": 173187, "epoch": 1431} {"train_loss": -40.5986213684082, "global_step": 173188, "epoch": 1431} {"train_loss": -39.520870208740234, "global_step": 173189, "epoch": 1431} {"train_loss": -40.48598861694336, "global_step": 173190, "epoch": 1431} {"train_loss": -41.162960052490234, "global_step": 173191, "epoch": 1431} {"train_loss": -40.8714714050293, "global_step": 173192, "epoch": 1431} {"train_loss": -40.22927474975586, "global_step": 173193, "epoch": 1431} {"train_loss": -40.275394439697266, "global_step": 173194, "epoch": 1431} {"train_loss": -41.078094482421875, "global_step": 173195, "epoch": 1431} {"train_loss": -41.03690719604492, "global_step": 173196, "epoch": 1431} {"train_loss": -41.24011993408203, "global_step": 173197, "epoch": 1431} {"train_loss": -40.98402404785156, "global_step": 173198, "epoch": 1431} {"train_loss": -40.35322189331055, "global_step": 173199, "epoch": 1431} {"train_loss": -38.01719665527344, "global_step": 173200, "epoch": 1431} {"train_loss": -41.20743942260742, "global_step": 173201, "epoch": 1431} {"train_loss": -41.00589370727539, "global_step": 173202, "epoch": 1431} {"train_loss": -38.3818244934082, "global_step": 173203, "epoch": 1431} {"train_loss": -39.79069519042969, "global_step": 173204, "epoch": 1431} {"train_loss": -41.04924392700195, "global_step": 173205, "epoch": 1431} {"train_loss": -38.892616271972656, "global_step": 173206, "epoch": 1431} {"train_loss": -36.56663131713867, "global_step": 173207, "epoch": 1431} {"train_loss": -33.824214935302734, "global_step": 173208, "epoch": 1431} {"train_loss": -32.861236572265625, "global_step": 173209, "epoch": 1431} {"train_loss": -38.12654113769531, "global_step": 173210, "epoch": 1431} {"train_loss": -36.643245697021484, "global_step": 173211, "epoch": 1431} {"train_loss": -21.155433654785156, "global_step": 173212, "epoch": 1431} {"train_loss": -38.92735290527344, "global_step": 173213, "epoch": 1431} {"train_loss": -39.4544792175293, "global_step": 173214, "epoch": 1431} {"train_loss": -31.68804359436035, "global_step": 173215, "epoch": 1431} {"train_loss": -37.598907470703125, "global_step": 173216, "epoch": 1431} {"train_loss": -18.67507553100586, "global_step": 173217, "epoch": 1431} {"train_loss": -34.833251953125, "global_step": 173218, "epoch": 1431} {"train_loss": -32.8846549987793, "global_step": 173219, "epoch": 1431} {"train_loss": -37.99116897583008, "global_step": 173220, "epoch": 1431} {"train_loss": -37.06059646606445, "global_step": 173221, "epoch": 1431} {"train_loss": -32.06356430053711, "global_step": 173222, "epoch": 1431} {"train_loss": -33.336631774902344, "global_step": 173223, "epoch": 1431} {"train_loss": -29.591001510620117, "global_step": 173224, "epoch": 1431} {"train_loss": -35.56989669799805, "global_step": 173225, "epoch": 1431} {"train_loss": -27.02984619140625, "global_step": 173226, "epoch": 1431} {"train_loss": -34.02558135986328, "global_step": 173227, "epoch": 1431} {"train_loss": -36.96532440185547, "global_step": 173228, "epoch": 1431} {"train_loss": -34.836971282958984, "global_step": 173229, "epoch": 1431} {"train_loss": -36.40816879272461, "global_step": 173230, "epoch": 1431} {"train_loss": -36.132747650146484, "global_step": 173231, "epoch": 1431} {"train_loss": -35.45719909667969, "global_step": 173232, "epoch": 1431} {"train_loss": -35.371185302734375, "global_step": 173233, "epoch": 1431} {"train_loss": -37.86699295043945, "global_step": 173234, "epoch": 1431} {"train_loss": -35.19831466674805, "global_step": 173235, "epoch": 1431} {"train_loss": -36.081695556640625, "global_step": 173236, "epoch": 1431} {"train_loss": -35.088619232177734, "global_step": 173237, "epoch": 1431} {"train_loss": -35.166847229003906, "global_step": 173238, "epoch": 1431} {"train_loss": -36.8870849609375, "global_step": 173239, "epoch": 1431} {"train_loss": -36.450923919677734, "global_step": 173240, "epoch": 1431} {"train_loss": -35.702659606933594, "global_step": 173241, "epoch": 1431} {"train_loss": -36.12272262573242, "global_step": 173242, "epoch": 1431} {"train_loss": -35.8953742980957, "global_step": 173243, "epoch": 1431} {"train_loss": -36.89840316772461, "global_step": 173244, "epoch": 1431} {"train_loss": -36.33005905151367, "global_step": 173245, "epoch": 1431} {"train_loss": -35.950069427490234, "global_step": 173246, "epoch": 1431} {"train_loss": -36.97719192504883, "global_step": 173247, "epoch": 1431} {"train_loss": -36.640079498291016, "global_step": 173248, "epoch": 1431} {"train_loss": -37.65342330932617, "global_step": 173249, "epoch": 1431} {"train_loss": -38.2744255065918, "global_step": 173250, "epoch": 1431} {"train_loss": -38.985679626464844, "global_step": 173251, "epoch": 1431} {"train_loss": -37.489356994628906, "global_step": 173252, "epoch": 1431} {"train_loss": -36.819759368896484, "global_step": 173253, "epoch": 1431} {"train_loss": -38.05998611450195, "global_step": 173254, "epoch": 1431} {"train_loss": -37.56613540649414, "global_step": 173255, "epoch": 1431} {"train_loss": -37.146053314208984, "global_step": 173256, "epoch": 1431} {"train_loss": -38.175392150878906, "global_step": 173257, "epoch": 1431} {"train_loss": -38.222572326660156, "global_step": 173258, "epoch": 1431} {"train_loss": -39.0671501159668, "global_step": 173259, "epoch": 1431} {"train_loss": -38.37193298339844, "global_step": 173260, "epoch": 1431} {"train_loss": -37.983734130859375, "global_step": 173261, "epoch": 1431} {"train_loss": -38.06757736206055, "global_step": 173262, "epoch": 1431} {"train_loss": -39.25032424926758, "global_step": 173263, "epoch": 1431} {"train_loss": -38.009674072265625, "global_step": 173264, "epoch": 1431} {"train_loss": -38.32413864135742, "global_step": 173265, "epoch": 1431} {"train_loss": -39.0255241394043, "global_step": 173266, "epoch": 1431} {"train_loss": -38.85536193847656, "global_step": 173267, "epoch": 1431} {"train_loss": -39.44533157348633, "global_step": 173268, "epoch": 1431} {"train_loss": -38.88828659057617, "global_step": 173269, "epoch": 1431} {"train_loss": -39.2181396484375, "global_step": 173270, "epoch": 1431} {"train_loss": -37.7569995438757, "global_step": 173271, "epoch": 1431, "val_loss": 2734381.75} {"train_loss": -39.24351119995117, "global_step": 173272, "epoch": 1432} {"train_loss": -39.46220016479492, "global_step": 173273, "epoch": 1432} {"train_loss": -39.02910614013672, "global_step": 173274, "epoch": 1432} {"train_loss": -39.514564514160156, "global_step": 173275, "epoch": 1432} {"train_loss": -39.03571701049805, "global_step": 173276, "epoch": 1432} {"train_loss": -38.99348068237305, "global_step": 173277, "epoch": 1432} {"train_loss": -39.793067932128906, "global_step": 173278, "epoch": 1432} {"train_loss": -39.397552490234375, "global_step": 173279, "epoch": 1432} {"train_loss": -39.56770324707031, "global_step": 173280, "epoch": 1432} {"train_loss": -39.47526931762695, "global_step": 173281, "epoch": 1432} {"train_loss": -39.59397506713867, "global_step": 173282, "epoch": 1432} {"train_loss": -39.912818908691406, "global_step": 173283, "epoch": 1432} {"train_loss": -39.153446197509766, "global_step": 173284, "epoch": 1432} {"train_loss": -39.988319396972656, "global_step": 173285, "epoch": 1432} {"train_loss": -40.02700424194336, "global_step": 173286, "epoch": 1432} {"train_loss": -40.12522506713867, "global_step": 173287, "epoch": 1432} {"train_loss": -39.84067916870117, "global_step": 173288, "epoch": 1432} {"train_loss": -40.13666534423828, "global_step": 173289, "epoch": 1432} {"train_loss": -39.69769287109375, "global_step": 173290, "epoch": 1432} {"train_loss": -40.199867248535156, "global_step": 173291, "epoch": 1432} {"train_loss": -40.1618766784668, "global_step": 173292, "epoch": 1432} {"train_loss": -39.77347946166992, "global_step": 173293, "epoch": 1432} {"train_loss": -40.3856315612793, "global_step": 173294, "epoch": 1432} {"train_loss": -40.33759307861328, "global_step": 173295, "epoch": 1432} {"train_loss": -39.78718185424805, "global_step": 173296, "epoch": 1432} {"train_loss": -39.948909759521484, "global_step": 173297, "epoch": 1432} {"train_loss": -40.663902282714844, "global_step": 173298, "epoch": 1432} {"train_loss": -40.38093185424805, "global_step": 173299, "epoch": 1432} {"train_loss": -40.47736740112305, "global_step": 173300, "epoch": 1432} {"train_loss": -40.43807601928711, "global_step": 173301, "epoch": 1432} {"train_loss": -40.019676208496094, "global_step": 173302, "epoch": 1432} {"train_loss": -40.40190505981445, "global_step": 173303, "epoch": 1432} {"train_loss": -40.86995315551758, "global_step": 173304, "epoch": 1432} {"train_loss": -39.924720764160156, "global_step": 173305, "epoch": 1432} {"train_loss": -40.4775505065918, "global_step": 173306, "epoch": 1432} {"train_loss": -40.68293380737305, "global_step": 173307, "epoch": 1432} {"train_loss": -40.11017990112305, "global_step": 173308, "epoch": 1432} {"train_loss": -40.879058837890625, "global_step": 173309, "epoch": 1432} {"train_loss": -40.58656311035156, "global_step": 173310, "epoch": 1432} {"train_loss": -41.04746627807617, "global_step": 173311, "epoch": 1432} {"train_loss": -40.39369583129883, "global_step": 173312, "epoch": 1432} {"train_loss": -40.77350616455078, "global_step": 173313, "epoch": 1432} {"train_loss": -40.68672180175781, "global_step": 173314, "epoch": 1432} {"train_loss": -40.06885528564453, "global_step": 173315, "epoch": 1432} {"train_loss": -41.41572952270508, "global_step": 173316, "epoch": 1432} {"train_loss": -40.33673858642578, "global_step": 173317, "epoch": 1432} {"train_loss": -40.91358947753906, "global_step": 173318, "epoch": 1432} {"train_loss": -41.140838623046875, "global_step": 173319, "epoch": 1432} {"train_loss": -39.80925369262695, "global_step": 173320, "epoch": 1432} {"train_loss": -40.76510238647461, "global_step": 173321, "epoch": 1432} {"train_loss": -40.659732818603516, "global_step": 173322, "epoch": 1432} {"train_loss": -40.69135665893555, "global_step": 173323, "epoch": 1432} {"train_loss": -39.425682067871094, "global_step": 173324, "epoch": 1432} {"train_loss": -40.953975677490234, "global_step": 173325, "epoch": 1432} {"train_loss": -39.703914642333984, "global_step": 173326, "epoch": 1432} {"train_loss": -40.75285720825195, "global_step": 173327, "epoch": 1432} {"train_loss": -41.006038665771484, "global_step": 173328, "epoch": 1432} {"train_loss": -41.00974655151367, "global_step": 173329, "epoch": 1432} {"train_loss": -39.050716400146484, "global_step": 173330, "epoch": 1432} {"train_loss": -40.547393798828125, "global_step": 173331, "epoch": 1432} {"train_loss": -41.12127685546875, "global_step": 173332, "epoch": 1432} {"train_loss": -40.45000076293945, "global_step": 173333, "epoch": 1432} {"train_loss": -40.73627853393555, "global_step": 173334, "epoch": 1432} {"train_loss": -40.652095794677734, "global_step": 173335, "epoch": 1432} {"train_loss": -40.27450180053711, "global_step": 173336, "epoch": 1432} {"train_loss": -40.506710052490234, "global_step": 173337, "epoch": 1432} {"train_loss": -40.596981048583984, "global_step": 173338, "epoch": 1432} {"train_loss": -40.21128463745117, "global_step": 173339, "epoch": 1432} {"train_loss": -41.10912322998047, "global_step": 173340, "epoch": 1432} {"train_loss": -40.152740478515625, "global_step": 173341, "epoch": 1432} {"train_loss": -40.508567810058594, "global_step": 173342, "epoch": 1432} {"train_loss": -41.05997085571289, "global_step": 173343, "epoch": 1432} {"train_loss": -40.85505294799805, "global_step": 173344, "epoch": 1432} {"train_loss": -41.13985061645508, "global_step": 173345, "epoch": 1432} {"train_loss": -39.48695755004883, "global_step": 173346, "epoch": 1432} {"train_loss": -40.90966796875, "global_step": 173347, "epoch": 1432} {"train_loss": -41.2713623046875, "global_step": 173348, "epoch": 1432} {"train_loss": -40.65614700317383, "global_step": 173349, "epoch": 1432} {"train_loss": -41.181396484375, "global_step": 173350, "epoch": 1432} {"train_loss": -41.03295135498047, "global_step": 173351, "epoch": 1432} {"train_loss": -40.564788818359375, "global_step": 173352, "epoch": 1432} {"train_loss": -39.882659912109375, "global_step": 173353, "epoch": 1432} {"train_loss": -40.00425338745117, "global_step": 173354, "epoch": 1432} {"train_loss": -37.833404541015625, "global_step": 173355, "epoch": 1432} {"train_loss": -38.66485595703125, "global_step": 173356, "epoch": 1432} {"train_loss": -38.890316009521484, "global_step": 173357, "epoch": 1432} {"train_loss": -41.0105094909668, "global_step": 173358, "epoch": 1432} {"train_loss": -38.2017936706543, "global_step": 173359, "epoch": 1432} {"train_loss": -40.259613037109375, "global_step": 173360, "epoch": 1432} {"train_loss": -38.50355911254883, "global_step": 173361, "epoch": 1432} {"train_loss": -37.98704147338867, "global_step": 173362, "epoch": 1432} {"train_loss": -37.12260055541992, "global_step": 173363, "epoch": 1432} {"train_loss": -38.35268783569336, "global_step": 173364, "epoch": 1432} {"train_loss": -39.472469329833984, "global_step": 173365, "epoch": 1432} {"train_loss": -40.727603912353516, "global_step": 173366, "epoch": 1432} {"train_loss": -39.341339111328125, "global_step": 173367, "epoch": 1432} {"train_loss": -36.7646598815918, "global_step": 173368, "epoch": 1432} {"train_loss": -39.07100296020508, "global_step": 173369, "epoch": 1432} {"train_loss": -40.87028121948242, "global_step": 173370, "epoch": 1432} {"train_loss": -39.20706558227539, "global_step": 173371, "epoch": 1432} {"train_loss": -39.49641036987305, "global_step": 173372, "epoch": 1432} {"train_loss": -39.33551788330078, "global_step": 173373, "epoch": 1432} {"train_loss": -39.79069900512695, "global_step": 173374, "epoch": 1432} {"train_loss": -40.11207962036133, "global_step": 173375, "epoch": 1432} {"train_loss": -41.30078125, "global_step": 173376, "epoch": 1432} {"train_loss": -40.18075180053711, "global_step": 173377, "epoch": 1432} {"train_loss": -39.811012268066406, "global_step": 173378, "epoch": 1432} {"train_loss": -41.445133209228516, "global_step": 173379, "epoch": 1432} {"train_loss": -40.81852340698242, "global_step": 173380, "epoch": 1432} {"train_loss": -40.49394607543945, "global_step": 173381, "epoch": 1432} {"train_loss": -40.85429763793945, "global_step": 173382, "epoch": 1432} {"train_loss": -40.5833854675293, "global_step": 173383, "epoch": 1432} {"train_loss": -40.641265869140625, "global_step": 173384, "epoch": 1432} {"train_loss": -40.51580810546875, "global_step": 173385, "epoch": 1432} {"train_loss": -39.95687484741211, "global_step": 173386, "epoch": 1432} {"train_loss": -40.904354095458984, "global_step": 173387, "epoch": 1432} {"train_loss": -40.37107467651367, "global_step": 173388, "epoch": 1432} {"train_loss": -41.58291244506836, "global_step": 173389, "epoch": 1432} {"train_loss": -41.1671028137207, "global_step": 173390, "epoch": 1432} {"train_loss": -41.179542541503906, "global_step": 173391, "epoch": 1432} {"train_loss": -40.136130782198315, "global_step": 173392, "epoch": 1432, "val_loss": 2665568.25} {"train_loss": -41.08759307861328, "global_step": 173393, "epoch": 1433} {"train_loss": -41.7771110534668, "global_step": 173394, "epoch": 1433} {"train_loss": -40.80818557739258, "global_step": 173395, "epoch": 1433} {"train_loss": -41.33481979370117, "global_step": 173396, "epoch": 1433} {"train_loss": -41.42324447631836, "global_step": 173397, "epoch": 1433} {"train_loss": -41.07685089111328, "global_step": 173398, "epoch": 1433} {"train_loss": -40.87479782104492, "global_step": 173399, "epoch": 1433} {"train_loss": -41.4047737121582, "global_step": 173400, "epoch": 1433} {"train_loss": -41.0086784362793, "global_step": 173401, "epoch": 1433} {"train_loss": -41.27097702026367, "global_step": 173402, "epoch": 1433} {"train_loss": -40.8776969909668, "global_step": 173403, "epoch": 1433} {"train_loss": -40.38873291015625, "global_step": 173404, "epoch": 1433} {"train_loss": -40.7558708190918, "global_step": 173405, "epoch": 1433} {"train_loss": -40.46253204345703, "global_step": 173406, "epoch": 1433} {"train_loss": -40.78862380981445, "global_step": 173407, "epoch": 1433} {"train_loss": -40.967079162597656, "global_step": 173408, "epoch": 1433} {"train_loss": -40.915191650390625, "global_step": 173409, "epoch": 1433} {"train_loss": -41.154823303222656, "global_step": 173410, "epoch": 1433} {"train_loss": -40.92381286621094, "global_step": 173411, "epoch": 1433} {"train_loss": -40.268218994140625, "global_step": 173412, "epoch": 1433} {"train_loss": -39.359642028808594, "global_step": 173413, "epoch": 1433} {"train_loss": -38.927330017089844, "global_step": 173414, "epoch": 1433} {"train_loss": -39.776527404785156, "global_step": 173415, "epoch": 1433} {"train_loss": -41.72926330566406, "global_step": 173416, "epoch": 1433} {"train_loss": -40.875694274902344, "global_step": 173417, "epoch": 1433} {"train_loss": -40.80875015258789, "global_step": 173418, "epoch": 1433} {"train_loss": -40.61677169799805, "global_step": 173419, "epoch": 1433} {"train_loss": -41.399085998535156, "global_step": 173420, "epoch": 1433} {"train_loss": -40.779354095458984, "global_step": 173421, "epoch": 1433} {"train_loss": -39.27056884765625, "global_step": 173422, "epoch": 1433} {"train_loss": -38.921085357666016, "global_step": 173423, "epoch": 1433} {"train_loss": -40.662776947021484, "global_step": 173424, "epoch": 1433} {"train_loss": -41.186622619628906, "global_step": 173425, "epoch": 1433} {"train_loss": -40.73600387573242, "global_step": 173426, "epoch": 1433} {"train_loss": -40.07091522216797, "global_step": 173427, "epoch": 1433} {"train_loss": -40.678916931152344, "global_step": 173428, "epoch": 1433} {"train_loss": -41.02333450317383, "global_step": 173429, "epoch": 1433} {"train_loss": -41.66754913330078, "global_step": 173430, "epoch": 1433} {"train_loss": -40.23614501953125, "global_step": 173431, "epoch": 1433} {"train_loss": -41.479278564453125, "global_step": 173432, "epoch": 1433} {"train_loss": -40.34952926635742, "global_step": 173433, "epoch": 1433} {"train_loss": -40.07639694213867, "global_step": 173434, "epoch": 1433} {"train_loss": -41.40021896362305, "global_step": 173435, "epoch": 1433} {"train_loss": -41.58039093017578, "global_step": 173436, "epoch": 1433} {"train_loss": -40.7815055847168, "global_step": 173437, "epoch": 1433} {"train_loss": -40.17508316040039, "global_step": 173438, "epoch": 1433} {"train_loss": -41.071067810058594, "global_step": 173439, "epoch": 1433} {"train_loss": -40.65122604370117, "global_step": 173440, "epoch": 1433} {"train_loss": -40.62610626220703, "global_step": 173441, "epoch": 1433} {"train_loss": -40.9304313659668, "global_step": 173442, "epoch": 1433} {"train_loss": -40.96913528442383, "global_step": 173443, "epoch": 1433} {"train_loss": -41.53072738647461, "global_step": 173444, "epoch": 1433} {"train_loss": -41.89524459838867, "global_step": 173445, "epoch": 1433} {"train_loss": -41.864715576171875, "global_step": 173446, "epoch": 1433} {"train_loss": -41.52028274536133, "global_step": 173447, "epoch": 1433} {"train_loss": -41.382503509521484, "global_step": 173448, "epoch": 1433} {"train_loss": -42.09767150878906, "global_step": 173449, "epoch": 1433} {"train_loss": -41.294036865234375, "global_step": 173450, "epoch": 1433} {"train_loss": -41.324432373046875, "global_step": 173451, "epoch": 1433} {"train_loss": -41.44157028198242, "global_step": 173452, "epoch": 1433} {"train_loss": -41.21533203125, "global_step": 173453, "epoch": 1433} {"train_loss": -40.8868522644043, "global_step": 173454, "epoch": 1433} {"train_loss": -41.86879348754883, "global_step": 173455, "epoch": 1433} {"train_loss": -41.67571258544922, "global_step": 173456, "epoch": 1433} {"train_loss": -40.983482360839844, "global_step": 173457, "epoch": 1433} {"train_loss": -40.76780319213867, "global_step": 173458, "epoch": 1433} {"train_loss": -42.25879669189453, "global_step": 173459, "epoch": 1433} {"train_loss": -41.407283782958984, "global_step": 173460, "epoch": 1433} {"train_loss": -39.66115951538086, "global_step": 173461, "epoch": 1433} {"train_loss": -41.10095977783203, "global_step": 173462, "epoch": 1433} {"train_loss": -41.06924057006836, "global_step": 173463, "epoch": 1433} {"train_loss": -41.80524444580078, "global_step": 173464, "epoch": 1433} {"train_loss": -40.77616500854492, "global_step": 173465, "epoch": 1433} {"train_loss": -42.140377044677734, "global_step": 173466, "epoch": 1433} {"train_loss": -41.14493942260742, "global_step": 173467, "epoch": 1433} {"train_loss": -40.86245346069336, "global_step": 173468, "epoch": 1433} {"train_loss": -41.33669662475586, "global_step": 173469, "epoch": 1433} {"train_loss": -41.34735107421875, "global_step": 173470, "epoch": 1433} {"train_loss": -41.12057876586914, "global_step": 173471, "epoch": 1433} {"train_loss": -40.784786224365234, "global_step": 173472, "epoch": 1433} {"train_loss": -40.26239776611328, "global_step": 173473, "epoch": 1433} {"train_loss": -40.22883605957031, "global_step": 173474, "epoch": 1433} {"train_loss": -40.76053237915039, "global_step": 173475, "epoch": 1433} {"train_loss": -40.209896087646484, "global_step": 173476, "epoch": 1433} {"train_loss": -40.245819091796875, "global_step": 173477, "epoch": 1433} {"train_loss": -39.90781784057617, "global_step": 173478, "epoch": 1433} {"train_loss": -40.193359375, "global_step": 173479, "epoch": 1433} {"train_loss": -39.38629913330078, "global_step": 173480, "epoch": 1433} {"train_loss": -37.363094329833984, "global_step": 173481, "epoch": 1433} {"train_loss": -31.300622940063477, "global_step": 173482, "epoch": 1433} {"train_loss": -33.308006286621094, "global_step": 173483, "epoch": 1433} {"train_loss": -37.82051086425781, "global_step": 173484, "epoch": 1433} {"train_loss": -33.7183952331543, "global_step": 173485, "epoch": 1433} {"train_loss": -37.42791748046875, "global_step": 173486, "epoch": 1433} {"train_loss": -37.112728118896484, "global_step": 173487, "epoch": 1433} {"train_loss": -40.32571029663086, "global_step": 173488, "epoch": 1433} {"train_loss": -37.635108947753906, "global_step": 173489, "epoch": 1433} {"train_loss": -39.749549865722656, "global_step": 173490, "epoch": 1433} {"train_loss": -38.28523635864258, "global_step": 173491, "epoch": 1433} {"train_loss": -38.07825469970703, "global_step": 173492, "epoch": 1433} {"train_loss": -40.06460189819336, "global_step": 173493, "epoch": 1433} {"train_loss": -38.242759704589844, "global_step": 173494, "epoch": 1433} {"train_loss": -39.65658187866211, "global_step": 173495, "epoch": 1433} {"train_loss": -38.582122802734375, "global_step": 173496, "epoch": 1433} {"train_loss": -39.44121170043945, "global_step": 173497, "epoch": 1433} {"train_loss": -39.71625900268555, "global_step": 173498, "epoch": 1433} {"train_loss": -40.21921920776367, "global_step": 173499, "epoch": 1433} {"train_loss": -40.394283294677734, "global_step": 173500, "epoch": 1433} {"train_loss": -40.647186279296875, "global_step": 173501, "epoch": 1433} {"train_loss": -40.4675407409668, "global_step": 173502, "epoch": 1433} {"train_loss": -40.78530502319336, "global_step": 173503, "epoch": 1433} {"train_loss": -40.78131103515625, "global_step": 173504, "epoch": 1433} {"train_loss": -41.00124740600586, "global_step": 173505, "epoch": 1433} {"train_loss": -41.07264709472656, "global_step": 173506, "epoch": 1433} {"train_loss": -40.738853454589844, "global_step": 173507, "epoch": 1433} {"train_loss": -40.9913444519043, "global_step": 173508, "epoch": 1433} {"train_loss": -41.174842834472656, "global_step": 173509, "epoch": 1433} {"train_loss": -41.4517936706543, "global_step": 173510, "epoch": 1433} {"train_loss": -41.358489990234375, "global_step": 173511, "epoch": 1433} {"train_loss": -41.213233947753906, "global_step": 173512, "epoch": 1433} {"train_loss": -40.405499812985255, "global_step": 173513, "epoch": 1433, "val_loss": 2801547.25} {"train_loss": -41.58400344848633, "global_step": 173514, "epoch": 1434} {"train_loss": -41.0930290222168, "global_step": 173515, "epoch": 1434} {"train_loss": -41.606327056884766, "global_step": 173516, "epoch": 1434} {"train_loss": -41.12112045288086, "global_step": 173517, "epoch": 1434} {"train_loss": -41.049983978271484, "global_step": 173518, "epoch": 1434} {"train_loss": -41.06388473510742, "global_step": 173519, "epoch": 1434} {"train_loss": -41.45222854614258, "global_step": 173520, "epoch": 1434} {"train_loss": -41.57339859008789, "global_step": 173521, "epoch": 1434} {"train_loss": -41.634334564208984, "global_step": 173522, "epoch": 1434} {"train_loss": -41.461544036865234, "global_step": 173523, "epoch": 1434} {"train_loss": -41.95134353637695, "global_step": 173524, "epoch": 1434} {"train_loss": -41.26356506347656, "global_step": 173525, "epoch": 1434} {"train_loss": -41.66871643066406, "global_step": 173526, "epoch": 1434} {"train_loss": -42.00473403930664, "global_step": 173527, "epoch": 1434} {"train_loss": -41.5863037109375, "global_step": 173528, "epoch": 1434} {"train_loss": -41.35831832885742, "global_step": 173529, "epoch": 1434} {"train_loss": -41.5025520324707, "global_step": 173530, "epoch": 1434} {"train_loss": -41.71260452270508, "global_step": 173531, "epoch": 1434} {"train_loss": -41.98672103881836, "global_step": 173532, "epoch": 1434} {"train_loss": -41.41653060913086, "global_step": 173533, "epoch": 1434} {"train_loss": -41.48209762573242, "global_step": 173534, "epoch": 1434} {"train_loss": -42.28196334838867, "global_step": 173535, "epoch": 1434} {"train_loss": -42.06981658935547, "global_step": 173536, "epoch": 1434} {"train_loss": -42.093299865722656, "global_step": 173537, "epoch": 1434} {"train_loss": -41.818424224853516, "global_step": 173538, "epoch": 1434} {"train_loss": -41.26932144165039, "global_step": 173539, "epoch": 1434} {"train_loss": -42.096092224121094, "global_step": 173540, "epoch": 1434} {"train_loss": -41.887054443359375, "global_step": 173541, "epoch": 1434} {"train_loss": -41.90497970581055, "global_step": 173542, "epoch": 1434} {"train_loss": -41.509559631347656, "global_step": 173543, "epoch": 1434} {"train_loss": -42.18113708496094, "global_step": 173544, "epoch": 1434} {"train_loss": -41.64544677734375, "global_step": 173545, "epoch": 1434} {"train_loss": -41.13876724243164, "global_step": 173546, "epoch": 1434} {"train_loss": -41.32110595703125, "global_step": 173547, "epoch": 1434} {"train_loss": -41.437957763671875, "global_step": 173548, "epoch": 1434} {"train_loss": -41.81793975830078, "global_step": 173549, "epoch": 1434} {"train_loss": -41.2808952331543, "global_step": 173550, "epoch": 1434} {"train_loss": -40.639339447021484, "global_step": 173551, "epoch": 1434} {"train_loss": -41.41302490234375, "global_step": 173552, "epoch": 1434} {"train_loss": -41.89461898803711, "global_step": 173553, "epoch": 1434} {"train_loss": -41.2421760559082, "global_step": 173554, "epoch": 1434} {"train_loss": -41.23179244995117, "global_step": 173555, "epoch": 1434} {"train_loss": -40.98439025878906, "global_step": 173556, "epoch": 1434} {"train_loss": -42.0380973815918, "global_step": 173557, "epoch": 1434} {"train_loss": -41.69277572631836, "global_step": 173558, "epoch": 1434} {"train_loss": -41.41765213012695, "global_step": 173559, "epoch": 1434} {"train_loss": -41.83832931518555, "global_step": 173560, "epoch": 1434} {"train_loss": -41.5989875793457, "global_step": 173561, "epoch": 1434} {"train_loss": -41.56864547729492, "global_step": 173562, "epoch": 1434} {"train_loss": -42.04142379760742, "global_step": 173563, "epoch": 1434} {"train_loss": -41.65962600708008, "global_step": 173564, "epoch": 1434} {"train_loss": -41.66108322143555, "global_step": 173565, "epoch": 1434} {"train_loss": -40.983192443847656, "global_step": 173566, "epoch": 1434} {"train_loss": -40.6749153137207, "global_step": 173567, "epoch": 1434} {"train_loss": -41.523807525634766, "global_step": 173568, "epoch": 1434} {"train_loss": -41.59043884277344, "global_step": 173569, "epoch": 1434} {"train_loss": -39.92434310913086, "global_step": 173570, "epoch": 1434} {"train_loss": -40.16048812866211, "global_step": 173571, "epoch": 1434} {"train_loss": -41.77705001831055, "global_step": 173572, "epoch": 1434} {"train_loss": -40.862762451171875, "global_step": 173573, "epoch": 1434} {"train_loss": -40.84111785888672, "global_step": 173574, "epoch": 1434} {"train_loss": -39.962459564208984, "global_step": 173575, "epoch": 1434} {"train_loss": -40.22307205200195, "global_step": 173576, "epoch": 1434} {"train_loss": -40.36817169189453, "global_step": 173577, "epoch": 1434} {"train_loss": -40.837196350097656, "global_step": 173578, "epoch": 1434} {"train_loss": -41.53931427001953, "global_step": 173579, "epoch": 1434} {"train_loss": -39.106201171875, "global_step": 173580, "epoch": 1434} {"train_loss": -40.92742156982422, "global_step": 173581, "epoch": 1434} {"train_loss": -41.771907806396484, "global_step": 173582, "epoch": 1434} {"train_loss": -40.368919372558594, "global_step": 173583, "epoch": 1434} {"train_loss": -40.8922233581543, "global_step": 173584, "epoch": 1434} {"train_loss": -40.822059631347656, "global_step": 173585, "epoch": 1434} {"train_loss": -41.13978958129883, "global_step": 173586, "epoch": 1434} {"train_loss": -41.58061981201172, "global_step": 173587, "epoch": 1434} {"train_loss": -40.032535552978516, "global_step": 173588, "epoch": 1434} {"train_loss": -40.6262092590332, "global_step": 173589, "epoch": 1434} {"train_loss": -41.92512512207031, "global_step": 173590, "epoch": 1434} {"train_loss": -40.1414680480957, "global_step": 173591, "epoch": 1434} {"train_loss": -40.74927520751953, "global_step": 173592, "epoch": 1434} {"train_loss": -41.3216552734375, "global_step": 173593, "epoch": 1434} {"train_loss": -41.274715423583984, "global_step": 173594, "epoch": 1434} {"train_loss": -39.837093353271484, "global_step": 173595, "epoch": 1434} {"train_loss": -39.191795349121094, "global_step": 173596, "epoch": 1434} {"train_loss": -41.33760452270508, "global_step": 173597, "epoch": 1434} {"train_loss": -41.2658576965332, "global_step": 173598, "epoch": 1434} {"train_loss": -41.425941467285156, "global_step": 173599, "epoch": 1434} {"train_loss": -41.87201690673828, "global_step": 173600, "epoch": 1434} {"train_loss": -40.47062301635742, "global_step": 173601, "epoch": 1434} {"train_loss": -41.379661560058594, "global_step": 173602, "epoch": 1434} {"train_loss": -39.28493881225586, "global_step": 173603, "epoch": 1434} {"train_loss": -41.07950973510742, "global_step": 173604, "epoch": 1434} {"train_loss": -40.50959777832031, "global_step": 173605, "epoch": 1434} {"train_loss": -40.3714714050293, "global_step": 173606, "epoch": 1434} {"train_loss": -40.83015441894531, "global_step": 173607, "epoch": 1434} {"train_loss": -39.688533782958984, "global_step": 173608, "epoch": 1434} {"train_loss": -40.504608154296875, "global_step": 173609, "epoch": 1434} {"train_loss": -41.166107177734375, "global_step": 173610, "epoch": 1434} {"train_loss": -40.47011947631836, "global_step": 173611, "epoch": 1434} {"train_loss": -39.611328125, "global_step": 173612, "epoch": 1434} {"train_loss": -39.92596435546875, "global_step": 173613, "epoch": 1434} {"train_loss": -40.65958023071289, "global_step": 173614, "epoch": 1434} {"train_loss": -39.733978271484375, "global_step": 173615, "epoch": 1434} {"train_loss": -40.91767883300781, "global_step": 173616, "epoch": 1434} {"train_loss": -40.73480224609375, "global_step": 173617, "epoch": 1434} {"train_loss": -40.46696853637695, "global_step": 173618, "epoch": 1434} {"train_loss": -39.384315490722656, "global_step": 173619, "epoch": 1434} {"train_loss": -38.11372756958008, "global_step": 173620, "epoch": 1434} {"train_loss": -39.48233413696289, "global_step": 173621, "epoch": 1434} {"train_loss": -40.47428512573242, "global_step": 173622, "epoch": 1434} {"train_loss": -41.14626693725586, "global_step": 173623, "epoch": 1434} {"train_loss": -40.64264678955078, "global_step": 173624, "epoch": 1434} {"train_loss": -38.88310623168945, "global_step": 173625, "epoch": 1434} {"train_loss": -40.70691680908203, "global_step": 173626, "epoch": 1434} {"train_loss": -40.59029769897461, "global_step": 173627, "epoch": 1434} {"train_loss": -41.20473098754883, "global_step": 173628, "epoch": 1434} {"train_loss": -40.053314208984375, "global_step": 173629, "epoch": 1434} {"train_loss": -40.14506149291992, "global_step": 173630, "epoch": 1434} {"train_loss": -40.63427734375, "global_step": 173631, "epoch": 1434} {"train_loss": -41.366817474365234, "global_step": 173632, "epoch": 1434} {"train_loss": -39.61880111694336, "global_step": 173633, "epoch": 1434} {"train_loss": -41.00131559766029, "global_step": 173634, "epoch": 1434, "val_loss": 2680225.75} {"train_loss": -39.451210021972656, "global_step": 173635, "epoch": 1435} {"train_loss": -39.365936279296875, "global_step": 173636, "epoch": 1435} {"train_loss": -39.830867767333984, "global_step": 173637, "epoch": 1435} {"train_loss": -39.59245681762695, "global_step": 173638, "epoch": 1435} {"train_loss": -39.484920501708984, "global_step": 173639, "epoch": 1435} {"train_loss": -40.983314514160156, "global_step": 173640, "epoch": 1435} {"train_loss": -39.991851806640625, "global_step": 173641, "epoch": 1435} {"train_loss": -41.02467727661133, "global_step": 173642, "epoch": 1435} {"train_loss": -40.65458297729492, "global_step": 173643, "epoch": 1435} {"train_loss": -38.038612365722656, "global_step": 173644, "epoch": 1435} {"train_loss": -36.56380081176758, "global_step": 173645, "epoch": 1435} {"train_loss": -40.26344680786133, "global_step": 173646, "epoch": 1435} {"train_loss": -40.24457931518555, "global_step": 173647, "epoch": 1435} {"train_loss": -40.25898361206055, "global_step": 173648, "epoch": 1435} {"train_loss": -40.942626953125, "global_step": 173649, "epoch": 1435} {"train_loss": -40.95783233642578, "global_step": 173650, "epoch": 1435} {"train_loss": -40.317352294921875, "global_step": 173651, "epoch": 1435} {"train_loss": -39.13467025756836, "global_step": 173652, "epoch": 1435} {"train_loss": -39.713287353515625, "global_step": 173653, "epoch": 1435} {"train_loss": -38.67012405395508, "global_step": 173654, "epoch": 1435} {"train_loss": -24.646821975708008, "global_step": 173655, "epoch": 1435} {"train_loss": -35.91652297973633, "global_step": 173656, "epoch": 1435} {"train_loss": -34.12238693237305, "global_step": 173657, "epoch": 1435} {"train_loss": -39.23482894897461, "global_step": 173658, "epoch": 1435} {"train_loss": -38.66703414916992, "global_step": 173659, "epoch": 1435} {"train_loss": -34.42184066772461, "global_step": 173660, "epoch": 1435} {"train_loss": -35.95798873901367, "global_step": 173661, "epoch": 1435} {"train_loss": -39.94223403930664, "global_step": 173662, "epoch": 1435} {"train_loss": -35.50448226928711, "global_step": 173663, "epoch": 1435} {"train_loss": -35.68404769897461, "global_step": 173664, "epoch": 1435} {"train_loss": -31.138330459594727, "global_step": 173665, "epoch": 1435} {"train_loss": -38.75674057006836, "global_step": 173666, "epoch": 1435} {"train_loss": -39.56734848022461, "global_step": 173667, "epoch": 1435} {"train_loss": -37.8397102355957, "global_step": 173668, "epoch": 1435} {"train_loss": -38.25285339355469, "global_step": 173669, "epoch": 1435} {"train_loss": -34.87110900878906, "global_step": 173670, "epoch": 1435} {"train_loss": -38.9140739440918, "global_step": 173671, "epoch": 1435} {"train_loss": -36.59607696533203, "global_step": 173672, "epoch": 1435} {"train_loss": -36.439334869384766, "global_step": 173673, "epoch": 1435} {"train_loss": -29.281726837158203, "global_step": 173674, "epoch": 1435} {"train_loss": -33.51587677001953, "global_step": 173675, "epoch": 1435} {"train_loss": -34.668060302734375, "global_step": 173676, "epoch": 1435} {"train_loss": -32.38649368286133, "global_step": 173677, "epoch": 1435} {"train_loss": -36.920249938964844, "global_step": 173678, "epoch": 1435} {"train_loss": -36.062355041503906, "global_step": 173679, "epoch": 1435} {"train_loss": -37.80839157104492, "global_step": 173680, "epoch": 1435} {"train_loss": -37.20209884643555, "global_step": 173681, "epoch": 1435} {"train_loss": -35.9262809753418, "global_step": 173682, "epoch": 1435} {"train_loss": -36.536922454833984, "global_step": 173683, "epoch": 1435} {"train_loss": -36.4553337097168, "global_step": 173684, "epoch": 1435} {"train_loss": -37.60332107543945, "global_step": 173685, "epoch": 1435} {"train_loss": -38.23829650878906, "global_step": 173686, "epoch": 1435} {"train_loss": -37.35720443725586, "global_step": 173687, "epoch": 1435} {"train_loss": -38.92489242553711, "global_step": 173688, "epoch": 1435} {"train_loss": -38.735652923583984, "global_step": 173689, "epoch": 1435} {"train_loss": -39.494834899902344, "global_step": 173690, "epoch": 1435} {"train_loss": -38.984676361083984, "global_step": 173691, "epoch": 1435} {"train_loss": -37.61893844604492, "global_step": 173692, "epoch": 1435} {"train_loss": -39.021671295166016, "global_step": 173693, "epoch": 1435} {"train_loss": -38.635536193847656, "global_step": 173694, "epoch": 1435} {"train_loss": -38.9697380065918, "global_step": 173695, "epoch": 1435} {"train_loss": -38.97135543823242, "global_step": 173696, "epoch": 1435} {"train_loss": -39.34406661987305, "global_step": 173697, "epoch": 1435} {"train_loss": -39.61859893798828, "global_step": 173698, "epoch": 1435} {"train_loss": -39.59083557128906, "global_step": 173699, "epoch": 1435} {"train_loss": -38.26935577392578, "global_step": 173700, "epoch": 1435} {"train_loss": -38.831790924072266, "global_step": 173701, "epoch": 1435} {"train_loss": -39.24097442626953, "global_step": 173702, "epoch": 1435} {"train_loss": -37.45880889892578, "global_step": 173703, "epoch": 1435} {"train_loss": -38.448829650878906, "global_step": 173704, "epoch": 1435} {"train_loss": -38.24542236328125, "global_step": 173705, "epoch": 1435} {"train_loss": -39.37134552001953, "global_step": 173706, "epoch": 1435} {"train_loss": -39.068336486816406, "global_step": 173707, "epoch": 1435} {"train_loss": -39.39076614379883, "global_step": 173708, "epoch": 1435} {"train_loss": -39.91532516479492, "global_step": 173709, "epoch": 1435} {"train_loss": -38.950740814208984, "global_step": 173710, "epoch": 1435} {"train_loss": -40.062477111816406, "global_step": 173711, "epoch": 1435} {"train_loss": -40.01344680786133, "global_step": 173712, "epoch": 1435} {"train_loss": -40.28091049194336, "global_step": 173713, "epoch": 1435} {"train_loss": -38.101985931396484, "global_step": 173714, "epoch": 1435} {"train_loss": -39.930519104003906, "global_step": 173715, "epoch": 1435} {"train_loss": -40.24159622192383, "global_step": 173716, "epoch": 1435} {"train_loss": -39.296669006347656, "global_step": 173717, "epoch": 1435} {"train_loss": -40.23152160644531, "global_step": 173718, "epoch": 1435} {"train_loss": -39.23977279663086, "global_step": 173719, "epoch": 1435} {"train_loss": -39.73952865600586, "global_step": 173720, "epoch": 1435} {"train_loss": -40.9144172668457, "global_step": 173721, "epoch": 1435} {"train_loss": -40.85197067260742, "global_step": 173722, "epoch": 1435} {"train_loss": -40.510189056396484, "global_step": 173723, "epoch": 1435} {"train_loss": -40.28492736816406, "global_step": 173724, "epoch": 1435} {"train_loss": -40.621681213378906, "global_step": 173725, "epoch": 1435} {"train_loss": -39.40963363647461, "global_step": 173726, "epoch": 1435} {"train_loss": -40.73287582397461, "global_step": 173727, "epoch": 1435} {"train_loss": -40.457061767578125, "global_step": 173728, "epoch": 1435} {"train_loss": -40.280269622802734, "global_step": 173729, "epoch": 1435} {"train_loss": -41.24027633666992, "global_step": 173730, "epoch": 1435} {"train_loss": -40.45296859741211, "global_step": 173731, "epoch": 1435} {"train_loss": -40.46843338012695, "global_step": 173732, "epoch": 1435} {"train_loss": -40.34606170654297, "global_step": 173733, "epoch": 1435} {"train_loss": -40.150146484375, "global_step": 173734, "epoch": 1435} {"train_loss": -40.76224899291992, "global_step": 173735, "epoch": 1435} {"train_loss": -40.24613571166992, "global_step": 173736, "epoch": 1435} {"train_loss": -40.8475227355957, "global_step": 173737, "epoch": 1435} {"train_loss": -41.24998092651367, "global_step": 173738, "epoch": 1435} {"train_loss": -40.30445098876953, "global_step": 173739, "epoch": 1435} {"train_loss": -40.76243209838867, "global_step": 173740, "epoch": 1435} {"train_loss": -40.480865478515625, "global_step": 173741, "epoch": 1435} {"train_loss": -40.29125213623047, "global_step": 173742, "epoch": 1435} {"train_loss": -40.90234375, "global_step": 173743, "epoch": 1435} {"train_loss": -39.70891189575195, "global_step": 173744, "epoch": 1435} {"train_loss": -41.2783317565918, "global_step": 173745, "epoch": 1435} {"train_loss": -41.0621452331543, "global_step": 173746, "epoch": 1435} {"train_loss": -40.986751556396484, "global_step": 173747, "epoch": 1435} {"train_loss": -41.261470794677734, "global_step": 173748, "epoch": 1435} {"train_loss": -41.2327766418457, "global_step": 173749, "epoch": 1435} {"train_loss": -41.331539154052734, "global_step": 173750, "epoch": 1435} {"train_loss": -39.859310150146484, "global_step": 173751, "epoch": 1435} {"train_loss": -41.56321334838867, "global_step": 173752, "epoch": 1435} {"train_loss": -39.89799499511719, "global_step": 173753, "epoch": 1435} {"train_loss": -40.782989501953125, "global_step": 173754, "epoch": 1435} {"train_loss": -38.80696187925733, "global_step": 173755, "epoch": 1435, "val_loss": 2686661.25} {"train_loss": -41.35704040527344, "global_step": 173756, "epoch": 1436} {"train_loss": -40.955108642578125, "global_step": 173757, "epoch": 1436} {"train_loss": -41.54103469848633, "global_step": 173758, "epoch": 1436} {"train_loss": -40.68634796142578, "global_step": 173759, "epoch": 1436} {"train_loss": -40.9857177734375, "global_step": 173760, "epoch": 1436} {"train_loss": -40.81412887573242, "global_step": 173761, "epoch": 1436} {"train_loss": -41.290855407714844, "global_step": 173762, "epoch": 1436} {"train_loss": -41.43394470214844, "global_step": 173763, "epoch": 1436} {"train_loss": -39.795143127441406, "global_step": 173764, "epoch": 1436} {"train_loss": -40.512237548828125, "global_step": 173765, "epoch": 1436} {"train_loss": -42.037105560302734, "global_step": 173766, "epoch": 1436} {"train_loss": -41.031063079833984, "global_step": 173767, "epoch": 1436} {"train_loss": -40.5635871887207, "global_step": 173768, "epoch": 1436} {"train_loss": -39.47515106201172, "global_step": 173769, "epoch": 1436} {"train_loss": -40.708595275878906, "global_step": 173770, "epoch": 1436} {"train_loss": -41.15830612182617, "global_step": 173771, "epoch": 1436} {"train_loss": -41.61592483520508, "global_step": 173772, "epoch": 1436} {"train_loss": -40.66572189331055, "global_step": 173773, "epoch": 1436} {"train_loss": -39.672908782958984, "global_step": 173774, "epoch": 1436} {"train_loss": -41.38348388671875, "global_step": 173775, "epoch": 1436} {"train_loss": -41.127349853515625, "global_step": 173776, "epoch": 1436} {"train_loss": -40.67679214477539, "global_step": 173777, "epoch": 1436} {"train_loss": -39.89384841918945, "global_step": 173778, "epoch": 1436} {"train_loss": -40.06107711791992, "global_step": 173779, "epoch": 1436} {"train_loss": -40.790706634521484, "global_step": 173780, "epoch": 1436} {"train_loss": -40.156150817871094, "global_step": 173781, "epoch": 1436} {"train_loss": -41.14536666870117, "global_step": 173782, "epoch": 1436} {"train_loss": -40.38066482543945, "global_step": 173783, "epoch": 1436} {"train_loss": -40.69552230834961, "global_step": 173784, "epoch": 1436} {"train_loss": -41.605552673339844, "global_step": 173785, "epoch": 1436} {"train_loss": -41.25741195678711, "global_step": 173786, "epoch": 1436} {"train_loss": -40.882537841796875, "global_step": 173787, "epoch": 1436} {"train_loss": -41.45987319946289, "global_step": 173788, "epoch": 1436} {"train_loss": -40.750545501708984, "global_step": 173789, "epoch": 1436} {"train_loss": -39.381568908691406, "global_step": 173790, "epoch": 1436} {"train_loss": -41.136863708496094, "global_step": 173791, "epoch": 1436} {"train_loss": -41.2900505065918, "global_step": 173792, "epoch": 1436} {"train_loss": -39.733577728271484, "global_step": 173793, "epoch": 1436} {"train_loss": -41.52314376831055, "global_step": 173794, "epoch": 1436} {"train_loss": -41.45861053466797, "global_step": 173795, "epoch": 1436} {"train_loss": -40.85531234741211, "global_step": 173796, "epoch": 1436} {"train_loss": -41.23740768432617, "global_step": 173797, "epoch": 1436} {"train_loss": -41.461307525634766, "global_step": 173798, "epoch": 1436} {"train_loss": -39.058345794677734, "global_step": 173799, "epoch": 1436} {"train_loss": -39.23019027709961, "global_step": 173800, "epoch": 1436} {"train_loss": -41.09245681762695, "global_step": 173801, "epoch": 1436} {"train_loss": -37.912593841552734, "global_step": 173802, "epoch": 1436} {"train_loss": -39.725860595703125, "global_step": 173803, "epoch": 1436} {"train_loss": -42.040252685546875, "global_step": 173804, "epoch": 1436} {"train_loss": -40.65421676635742, "global_step": 173805, "epoch": 1436} {"train_loss": -40.670082092285156, "global_step": 173806, "epoch": 1436} {"train_loss": -41.95396041870117, "global_step": 173807, "epoch": 1436} {"train_loss": -40.16758346557617, "global_step": 173808, "epoch": 1436} {"train_loss": -40.376800537109375, "global_step": 173809, "epoch": 1436} {"train_loss": -40.30430221557617, "global_step": 173810, "epoch": 1436} {"train_loss": -40.65037155151367, "global_step": 173811, "epoch": 1436} {"train_loss": -39.6682243347168, "global_step": 173812, "epoch": 1436} {"train_loss": -39.51054382324219, "global_step": 173813, "epoch": 1436} {"train_loss": -38.381935119628906, "global_step": 173814, "epoch": 1436} {"train_loss": -38.39059066772461, "global_step": 173815, "epoch": 1436} {"train_loss": -39.84932327270508, "global_step": 173816, "epoch": 1436} {"train_loss": -40.81436538696289, "global_step": 173817, "epoch": 1436} {"train_loss": -38.65571594238281, "global_step": 173818, "epoch": 1436} {"train_loss": -39.58225631713867, "global_step": 173819, "epoch": 1436} {"train_loss": -39.28168869018555, "global_step": 173820, "epoch": 1436} {"train_loss": -39.99567794799805, "global_step": 173821, "epoch": 1436} {"train_loss": -38.36211013793945, "global_step": 173822, "epoch": 1436} {"train_loss": -37.58162307739258, "global_step": 173823, "epoch": 1436} {"train_loss": -35.98435592651367, "global_step": 173824, "epoch": 1436} {"train_loss": -37.594482421875, "global_step": 173825, "epoch": 1436} {"train_loss": -40.81279373168945, "global_step": 173826, "epoch": 1436} {"train_loss": -39.64370346069336, "global_step": 173827, "epoch": 1436} {"train_loss": -38.28794479370117, "global_step": 173828, "epoch": 1436} {"train_loss": -39.15583419799805, "global_step": 173829, "epoch": 1436} {"train_loss": -37.27705383300781, "global_step": 173830, "epoch": 1436} {"train_loss": -36.413631439208984, "global_step": 173831, "epoch": 1436} {"train_loss": -34.033966064453125, "global_step": 173832, "epoch": 1436} {"train_loss": -37.9110107421875, "global_step": 173833, "epoch": 1436} {"train_loss": -38.93513870239258, "global_step": 173834, "epoch": 1436} {"train_loss": -38.371070861816406, "global_step": 173835, "epoch": 1436} {"train_loss": -40.22563171386719, "global_step": 173836, "epoch": 1436} {"train_loss": -38.40230178833008, "global_step": 173837, "epoch": 1436} {"train_loss": -39.08395004272461, "global_step": 173838, "epoch": 1436} {"train_loss": -36.855342864990234, "global_step": 173839, "epoch": 1436} {"train_loss": -32.790748596191406, "global_step": 173840, "epoch": 1436} {"train_loss": -34.59926223754883, "global_step": 173841, "epoch": 1436} {"train_loss": -32.91172790527344, "global_step": 173842, "epoch": 1436} {"train_loss": -38.5222053527832, "global_step": 173843, "epoch": 1436} {"train_loss": -37.7669563293457, "global_step": 173844, "epoch": 1436} {"train_loss": -39.709896087646484, "global_step": 173845, "epoch": 1436} {"train_loss": -39.125911712646484, "global_step": 173846, "epoch": 1436} {"train_loss": -38.218685150146484, "global_step": 173847, "epoch": 1436} {"train_loss": -36.13383483886719, "global_step": 173848, "epoch": 1436} {"train_loss": -38.80010223388672, "global_step": 173849, "epoch": 1436} {"train_loss": -37.5639762878418, "global_step": 173850, "epoch": 1436} {"train_loss": -38.83013153076172, "global_step": 173851, "epoch": 1436} {"train_loss": -39.4807243347168, "global_step": 173852, "epoch": 1436} {"train_loss": -38.91778564453125, "global_step": 173853, "epoch": 1436} {"train_loss": -39.224609375, "global_step": 173854, "epoch": 1436} {"train_loss": -39.0382194519043, "global_step": 173855, "epoch": 1436} {"train_loss": -39.18803024291992, "global_step": 173856, "epoch": 1436} {"train_loss": -36.635982513427734, "global_step": 173857, "epoch": 1436} {"train_loss": -40.0794677734375, "global_step": 173858, "epoch": 1436} {"train_loss": -39.50264358520508, "global_step": 173859, "epoch": 1436} {"train_loss": -40.9879035949707, "global_step": 173860, "epoch": 1436} {"train_loss": -39.102935791015625, "global_step": 173861, "epoch": 1436} {"train_loss": -40.222373962402344, "global_step": 173862, "epoch": 1436} {"train_loss": -40.5583610534668, "global_step": 173863, "epoch": 1436} {"train_loss": -39.79905700683594, "global_step": 173864, "epoch": 1436} {"train_loss": -40.29435729980469, "global_step": 173865, "epoch": 1436} {"train_loss": -39.75970458984375, "global_step": 173866, "epoch": 1436} {"train_loss": -39.863525390625, "global_step": 173867, "epoch": 1436} {"train_loss": -40.53647232055664, "global_step": 173868, "epoch": 1436} {"train_loss": -40.29313278198242, "global_step": 173869, "epoch": 1436} {"train_loss": -39.064693450927734, "global_step": 173870, "epoch": 1436} {"train_loss": -39.06781768798828, "global_step": 173871, "epoch": 1436} {"train_loss": -40.14933395385742, "global_step": 173872, "epoch": 1436} {"train_loss": -40.22563171386719, "global_step": 173873, "epoch": 1436} {"train_loss": -40.524574279785156, "global_step": 173874, "epoch": 1436} {"train_loss": -39.82316207885742, "global_step": 173875, "epoch": 1436} {"train_loss": -39.65124410834194, "global_step": 173876, "epoch": 1436, "val_loss": 2602021.75} {"train_loss": -40.51469802856445, "global_step": 173877, "epoch": 1437} {"train_loss": -40.91648864746094, "global_step": 173878, "epoch": 1437} {"train_loss": -41.02488327026367, "global_step": 173879, "epoch": 1437} {"train_loss": -40.01210021972656, "global_step": 173880, "epoch": 1437} {"train_loss": -39.74174118041992, "global_step": 173881, "epoch": 1437} {"train_loss": -40.63761520385742, "global_step": 173882, "epoch": 1437} {"train_loss": -40.394996643066406, "global_step": 173883, "epoch": 1437} {"train_loss": -40.55945587158203, "global_step": 173884, "epoch": 1437} {"train_loss": -41.248512268066406, "global_step": 173885, "epoch": 1437} {"train_loss": -41.32593536376953, "global_step": 173886, "epoch": 1437} {"train_loss": -39.995731353759766, "global_step": 173887, "epoch": 1437} {"train_loss": -41.3162956237793, "global_step": 173888, "epoch": 1437} {"train_loss": -41.215633392333984, "global_step": 173889, "epoch": 1437} {"train_loss": -38.766075134277344, "global_step": 173890, "epoch": 1437} {"train_loss": -40.89191436767578, "global_step": 173891, "epoch": 1437} {"train_loss": -41.025062561035156, "global_step": 173892, "epoch": 1437} {"train_loss": -37.75295639038086, "global_step": 173893, "epoch": 1437} {"train_loss": -40.75736618041992, "global_step": 173894, "epoch": 1437} {"train_loss": -41.08894729614258, "global_step": 173895, "epoch": 1437} {"train_loss": -40.51449203491211, "global_step": 173896, "epoch": 1437} {"train_loss": -39.718177795410156, "global_step": 173897, "epoch": 1437} {"train_loss": -40.157142639160156, "global_step": 173898, "epoch": 1437} {"train_loss": -40.8946647644043, "global_step": 173899, "epoch": 1437} {"train_loss": -39.58378219604492, "global_step": 173900, "epoch": 1437} {"train_loss": -39.046749114990234, "global_step": 173901, "epoch": 1437} {"train_loss": -40.06617736816406, "global_step": 173902, "epoch": 1437} {"train_loss": -40.79429626464844, "global_step": 173903, "epoch": 1437} {"train_loss": -40.7413330078125, "global_step": 173904, "epoch": 1437} {"train_loss": -40.645477294921875, "global_step": 173905, "epoch": 1437} {"train_loss": -39.728111267089844, "global_step": 173906, "epoch": 1437} {"train_loss": -39.89030456542969, "global_step": 173907, "epoch": 1437} {"train_loss": -41.11452865600586, "global_step": 173908, "epoch": 1437} {"train_loss": -37.69582748413086, "global_step": 173909, "epoch": 1437} {"train_loss": -41.11452102661133, "global_step": 173910, "epoch": 1437} {"train_loss": -40.71046829223633, "global_step": 173911, "epoch": 1437} {"train_loss": -40.73842239379883, "global_step": 173912, "epoch": 1437} {"train_loss": -40.45103073120117, "global_step": 173913, "epoch": 1437} {"train_loss": -40.856693267822266, "global_step": 173914, "epoch": 1437} {"train_loss": -40.9646110534668, "global_step": 173915, "epoch": 1437} {"train_loss": -41.238582611083984, "global_step": 173916, "epoch": 1437} {"train_loss": -40.94285202026367, "global_step": 173917, "epoch": 1437} {"train_loss": -39.952144622802734, "global_step": 173918, "epoch": 1437} {"train_loss": -41.34906005859375, "global_step": 173919, "epoch": 1437} {"train_loss": -41.1010856628418, "global_step": 173920, "epoch": 1437} {"train_loss": -41.24740219116211, "global_step": 173921, "epoch": 1437} {"train_loss": -39.30161666870117, "global_step": 173922, "epoch": 1437} {"train_loss": -40.98025131225586, "global_step": 173923, "epoch": 1437} {"train_loss": -40.29282760620117, "global_step": 173924, "epoch": 1437} {"train_loss": -40.53242111206055, "global_step": 173925, "epoch": 1437} {"train_loss": -41.31135559082031, "global_step": 173926, "epoch": 1437} {"train_loss": -40.20066452026367, "global_step": 173927, "epoch": 1437} {"train_loss": -40.750247955322266, "global_step": 173928, "epoch": 1437} {"train_loss": -40.817134857177734, "global_step": 173929, "epoch": 1437} {"train_loss": -41.5999870300293, "global_step": 173930, "epoch": 1437} {"train_loss": -40.9317626953125, "global_step": 173931, "epoch": 1437} {"train_loss": -41.14778518676758, "global_step": 173932, "epoch": 1437} {"train_loss": -41.301849365234375, "global_step": 173933, "epoch": 1437} {"train_loss": -41.017311096191406, "global_step": 173934, "epoch": 1437} {"train_loss": -40.32246398925781, "global_step": 173935, "epoch": 1437} {"train_loss": -38.50593566894531, "global_step": 173936, "epoch": 1437} {"train_loss": -36.362693786621094, "global_step": 173937, "epoch": 1437} {"train_loss": -39.56428146362305, "global_step": 173938, "epoch": 1437} {"train_loss": -39.91514205932617, "global_step": 173939, "epoch": 1437} {"train_loss": -40.66722106933594, "global_step": 173940, "epoch": 1437} {"train_loss": -40.76742172241211, "global_step": 173941, "epoch": 1437} {"train_loss": -39.869728088378906, "global_step": 173942, "epoch": 1437} {"train_loss": -39.34904098510742, "global_step": 173943, "epoch": 1437} {"train_loss": -37.5883674621582, "global_step": 173944, "epoch": 1437} {"train_loss": -39.95328903198242, "global_step": 173945, "epoch": 1437} {"train_loss": -39.42457580566406, "global_step": 173946, "epoch": 1437} {"train_loss": -40.43587875366211, "global_step": 173947, "epoch": 1437} {"train_loss": -39.81995391845703, "global_step": 173948, "epoch": 1437} {"train_loss": -38.84973907470703, "global_step": 173949, "epoch": 1437} {"train_loss": -40.25407028198242, "global_step": 173950, "epoch": 1437} {"train_loss": -39.56809997558594, "global_step": 173951, "epoch": 1437} {"train_loss": -40.229000091552734, "global_step": 173952, "epoch": 1437} {"train_loss": -38.891117095947266, "global_step": 173953, "epoch": 1437} {"train_loss": -41.171504974365234, "global_step": 173954, "epoch": 1437} {"train_loss": -40.38059616088867, "global_step": 173955, "epoch": 1437} {"train_loss": -39.78944778442383, "global_step": 173956, "epoch": 1437} {"train_loss": -40.33378219604492, "global_step": 173957, "epoch": 1437} {"train_loss": -41.01887893676758, "global_step": 173958, "epoch": 1437} {"train_loss": -39.484169006347656, "global_step": 173959, "epoch": 1437} {"train_loss": -40.36153030395508, "global_step": 173960, "epoch": 1437} {"train_loss": -40.13491439819336, "global_step": 173961, "epoch": 1437} {"train_loss": -40.271297454833984, "global_step": 173962, "epoch": 1437} {"train_loss": -41.27006530761719, "global_step": 173963, "epoch": 1437} {"train_loss": -40.91588592529297, "global_step": 173964, "epoch": 1437} {"train_loss": -41.43505859375, "global_step": 173965, "epoch": 1437} {"train_loss": -41.39303207397461, "global_step": 173966, "epoch": 1437} {"train_loss": -40.25923538208008, "global_step": 173967, "epoch": 1437} {"train_loss": -40.8656120300293, "global_step": 173968, "epoch": 1437} {"train_loss": -40.6581916809082, "global_step": 173969, "epoch": 1437} {"train_loss": -40.295833587646484, "global_step": 173970, "epoch": 1437} {"train_loss": -40.58991241455078, "global_step": 173971, "epoch": 1437} {"train_loss": -40.761775970458984, "global_step": 173972, "epoch": 1437} {"train_loss": -39.852718353271484, "global_step": 173973, "epoch": 1437} {"train_loss": -40.92713165283203, "global_step": 173974, "epoch": 1437} {"train_loss": -40.744667053222656, "global_step": 173975, "epoch": 1437} {"train_loss": -40.8830451965332, "global_step": 173976, "epoch": 1437} {"train_loss": -40.559879302978516, "global_step": 173977, "epoch": 1437} {"train_loss": -41.16286849975586, "global_step": 173978, "epoch": 1437} {"train_loss": -41.78036880493164, "global_step": 173979, "epoch": 1437} {"train_loss": -40.46623611450195, "global_step": 173980, "epoch": 1437} {"train_loss": -40.66203689575195, "global_step": 173981, "epoch": 1437} {"train_loss": -41.10572052001953, "global_step": 173982, "epoch": 1437} {"train_loss": -40.93572998046875, "global_step": 173983, "epoch": 1437} {"train_loss": -41.172237396240234, "global_step": 173984, "epoch": 1437} {"train_loss": -40.923851013183594, "global_step": 173985, "epoch": 1437} {"train_loss": -41.21540451049805, "global_step": 173986, "epoch": 1437} {"train_loss": -40.81527328491211, "global_step": 173987, "epoch": 1437} {"train_loss": -41.1243896484375, "global_step": 173988, "epoch": 1437} {"train_loss": -41.284603118896484, "global_step": 173989, "epoch": 1437} {"train_loss": -41.64461135864258, "global_step": 173990, "epoch": 1437} {"train_loss": -41.83124923706055, "global_step": 173991, "epoch": 1437} {"train_loss": -41.413028717041016, "global_step": 173992, "epoch": 1437} {"train_loss": -41.12211227416992, "global_step": 173993, "epoch": 1437} {"train_loss": -41.5023307800293, "global_step": 173994, "epoch": 1437} {"train_loss": -41.6768913269043, "global_step": 173995, "epoch": 1437} {"train_loss": -41.96194839477539, "global_step": 173996, "epoch": 1437} {"train_loss": -40.49982720367179, "global_step": 173997, "epoch": 1437, "val_loss": 2571998.25} {"train_loss": -42.08600616455078, "global_step": 173998, "epoch": 1438} {"train_loss": -40.682132720947266, "global_step": 173999, "epoch": 1438} {"train_loss": -41.477561950683594, "global_step": 174000, "epoch": 1438} {"train_loss": -41.33217239379883, "global_step": 174001, "epoch": 1438} {"train_loss": -40.75728988647461, "global_step": 174002, "epoch": 1438} {"train_loss": -39.12021255493164, "global_step": 174003, "epoch": 1438} {"train_loss": -41.28855895996094, "global_step": 174004, "epoch": 1438} {"train_loss": -40.83929443359375, "global_step": 174005, "epoch": 1438} {"train_loss": -40.79157257080078, "global_step": 174006, "epoch": 1438} {"train_loss": -41.44150161743164, "global_step": 174007, "epoch": 1438} {"train_loss": -41.80385971069336, "global_step": 174008, "epoch": 1438} {"train_loss": -41.785701751708984, "global_step": 174009, "epoch": 1438} {"train_loss": -41.45270919799805, "global_step": 174010, "epoch": 1438} {"train_loss": -41.974151611328125, "global_step": 174011, "epoch": 1438} {"train_loss": -41.411197662353516, "global_step": 174012, "epoch": 1438} {"train_loss": -41.66130447387695, "global_step": 174013, "epoch": 1438} {"train_loss": -41.69123458862305, "global_step": 174014, "epoch": 1438} {"train_loss": -41.89418029785156, "global_step": 174015, "epoch": 1438} {"train_loss": -41.88865280151367, "global_step": 174016, "epoch": 1438} {"train_loss": -41.77064895629883, "global_step": 174017, "epoch": 1438} {"train_loss": -41.95109176635742, "global_step": 174018, "epoch": 1438} {"train_loss": -42.218379974365234, "global_step": 174019, "epoch": 1438} {"train_loss": -41.36564254760742, "global_step": 174020, "epoch": 1438} {"train_loss": -41.64619827270508, "global_step": 174021, "epoch": 1438} {"train_loss": -40.46071243286133, "global_step": 174022, "epoch": 1438} {"train_loss": -39.67005157470703, "global_step": 174023, "epoch": 1438} {"train_loss": -39.40209197998047, "global_step": 174024, "epoch": 1438} {"train_loss": -37.87889862060547, "global_step": 174025, "epoch": 1438} {"train_loss": -33.538726806640625, "global_step": 174026, "epoch": 1438} {"train_loss": -24.715404510498047, "global_step": 174027, "epoch": 1438} {"train_loss": -22.969375610351562, "global_step": 174028, "epoch": 1438} {"train_loss": -30.61689567565918, "global_step": 174029, "epoch": 1438} {"train_loss": -38.54435729980469, "global_step": 174030, "epoch": 1438} {"train_loss": -26.962743759155273, "global_step": 174031, "epoch": 1438} {"train_loss": -31.978559494018555, "global_step": 174032, "epoch": 1438} {"train_loss": -39.24720764160156, "global_step": 174033, "epoch": 1438} {"train_loss": -28.606826782226562, "global_step": 174034, "epoch": 1438} {"train_loss": -38.18720245361328, "global_step": 174035, "epoch": 1438} {"train_loss": -32.60609817504883, "global_step": 174036, "epoch": 1438} {"train_loss": -39.12672805786133, "global_step": 174037, "epoch": 1438} {"train_loss": -34.81246566772461, "global_step": 174038, "epoch": 1438} {"train_loss": -38.59011459350586, "global_step": 174039, "epoch": 1438} {"train_loss": -37.69948196411133, "global_step": 174040, "epoch": 1438} {"train_loss": -36.9288444519043, "global_step": 174041, "epoch": 1438} {"train_loss": -38.82612228393555, "global_step": 174042, "epoch": 1438} {"train_loss": -36.79949951171875, "global_step": 174043, "epoch": 1438} {"train_loss": -39.04035949707031, "global_step": 174044, "epoch": 1438} {"train_loss": -39.34312057495117, "global_step": 174045, "epoch": 1438} {"train_loss": -39.22499465942383, "global_step": 174046, "epoch": 1438} {"train_loss": -38.880149841308594, "global_step": 174047, "epoch": 1438} {"train_loss": -38.94655990600586, "global_step": 174048, "epoch": 1438} {"train_loss": -39.825782775878906, "global_step": 174049, "epoch": 1438} {"train_loss": -38.769256591796875, "global_step": 174050, "epoch": 1438} {"train_loss": -40.459999084472656, "global_step": 174051, "epoch": 1438} {"train_loss": -38.56827926635742, "global_step": 174052, "epoch": 1438} {"train_loss": -39.49076461791992, "global_step": 174053, "epoch": 1438} {"train_loss": -39.60736083984375, "global_step": 174054, "epoch": 1438} {"train_loss": -39.19419479370117, "global_step": 174055, "epoch": 1438} {"train_loss": -40.30031204223633, "global_step": 174056, "epoch": 1438} {"train_loss": -39.702980041503906, "global_step": 174057, "epoch": 1438} {"train_loss": -39.480220794677734, "global_step": 174058, "epoch": 1438} {"train_loss": -39.6405029296875, "global_step": 174059, "epoch": 1438} {"train_loss": -39.994197845458984, "global_step": 174060, "epoch": 1438} {"train_loss": -40.1386833190918, "global_step": 174061, "epoch": 1438} {"train_loss": -39.98860549926758, "global_step": 174062, "epoch": 1438} {"train_loss": -40.25514602661133, "global_step": 174063, "epoch": 1438} {"train_loss": -40.2598876953125, "global_step": 174064, "epoch": 1438} {"train_loss": -40.50751495361328, "global_step": 174065, "epoch": 1438} {"train_loss": -40.60128402709961, "global_step": 174066, "epoch": 1438} {"train_loss": -40.86117172241211, "global_step": 174067, "epoch": 1438} {"train_loss": -40.613014221191406, "global_step": 174068, "epoch": 1438} {"train_loss": -40.239532470703125, "global_step": 174069, "epoch": 1438} {"train_loss": -40.84579086303711, "global_step": 174070, "epoch": 1438} {"train_loss": -40.74776840209961, "global_step": 174071, "epoch": 1438} {"train_loss": -41.40961837768555, "global_step": 174072, "epoch": 1438} {"train_loss": -40.97312545776367, "global_step": 174073, "epoch": 1438} {"train_loss": -41.35319137573242, "global_step": 174074, "epoch": 1438} {"train_loss": -40.7746696472168, "global_step": 174075, "epoch": 1438} {"train_loss": -41.207374572753906, "global_step": 174076, "epoch": 1438} {"train_loss": -40.859291076660156, "global_step": 174077, "epoch": 1438} {"train_loss": -41.014278411865234, "global_step": 174078, "epoch": 1438} {"train_loss": -41.23508834838867, "global_step": 174079, "epoch": 1438} {"train_loss": -40.70315170288086, "global_step": 174080, "epoch": 1438} {"train_loss": -40.429630279541016, "global_step": 174081, "epoch": 1438} {"train_loss": -40.60756301879883, "global_step": 174082, "epoch": 1438} {"train_loss": -40.96723556518555, "global_step": 174083, "epoch": 1438} {"train_loss": -41.27628707885742, "global_step": 174084, "epoch": 1438} {"train_loss": -41.26202392578125, "global_step": 174085, "epoch": 1438} {"train_loss": -41.288265228271484, "global_step": 174086, "epoch": 1438} {"train_loss": -41.0605583190918, "global_step": 174087, "epoch": 1438} {"train_loss": -41.35276412963867, "global_step": 174088, "epoch": 1438} {"train_loss": -41.41864013671875, "global_step": 174089, "epoch": 1438} {"train_loss": -41.400569915771484, "global_step": 174090, "epoch": 1438} {"train_loss": -41.538475036621094, "global_step": 174091, "epoch": 1438} {"train_loss": -41.30479049682617, "global_step": 174092, "epoch": 1438} {"train_loss": -40.86342239379883, "global_step": 174093, "epoch": 1438} {"train_loss": -41.52399826049805, "global_step": 174094, "epoch": 1438} {"train_loss": -41.715694427490234, "global_step": 174095, "epoch": 1438} {"train_loss": -41.608333587646484, "global_step": 174096, "epoch": 1438} {"train_loss": -42.117088317871094, "global_step": 174097, "epoch": 1438} {"train_loss": -42.120086669921875, "global_step": 174098, "epoch": 1438} {"train_loss": -42.25725173950195, "global_step": 174099, "epoch": 1438} {"train_loss": -41.993011474609375, "global_step": 174100, "epoch": 1438} {"train_loss": -42.00471878051758, "global_step": 174101, "epoch": 1438} {"train_loss": -42.17243576049805, "global_step": 174102, "epoch": 1438} {"train_loss": -42.270748138427734, "global_step": 174103, "epoch": 1438} {"train_loss": -41.52500534057617, "global_step": 174104, "epoch": 1438} {"train_loss": -41.97970962524414, "global_step": 174105, "epoch": 1438} {"train_loss": -42.03887939453125, "global_step": 174106, "epoch": 1438} {"train_loss": -41.90510559082031, "global_step": 174107, "epoch": 1438} {"train_loss": -42.00082015991211, "global_step": 174108, "epoch": 1438} {"train_loss": -42.156982421875, "global_step": 174109, "epoch": 1438} {"train_loss": -42.14321517944336, "global_step": 174110, "epoch": 1438} {"train_loss": -42.250728607177734, "global_step": 174111, "epoch": 1438} {"train_loss": -42.15238571166992, "global_step": 174112, "epoch": 1438} {"train_loss": -42.06742477416992, "global_step": 174113, "epoch": 1438} {"train_loss": -42.30070877075195, "global_step": 174114, "epoch": 1438} {"train_loss": -42.560245513916016, "global_step": 174115, "epoch": 1438} {"train_loss": -42.07606506347656, "global_step": 174116, "epoch": 1438} {"train_loss": -42.08316421508789, "global_step": 174117, "epoch": 1438} {"train_loss": -39.94802602657602, "global_step": 174118, "epoch": 1438, "val_loss": 2502718.75} {"train_loss": -42.16945266723633, "global_step": 174119, "epoch": 1439} {"train_loss": -42.48601150512695, "global_step": 174120, "epoch": 1439} {"train_loss": -42.43941879272461, "global_step": 174121, "epoch": 1439} {"train_loss": -41.89799118041992, "global_step": 174122, "epoch": 1439} {"train_loss": -40.726016998291016, "global_step": 174123, "epoch": 1439} {"train_loss": -38.92252731323242, "global_step": 174124, "epoch": 1439} {"train_loss": -34.962886810302734, "global_step": 174125, "epoch": 1439} {"train_loss": -27.042652130126953, "global_step": 174126, "epoch": 1439} {"train_loss": -27.408252716064453, "global_step": 174127, "epoch": 1439} {"train_loss": -35.91580581665039, "global_step": 174128, "epoch": 1439} {"train_loss": -39.30510330200195, "global_step": 174129, "epoch": 1439} {"train_loss": -36.524085998535156, "global_step": 174130, "epoch": 1439} {"train_loss": -40.58769226074219, "global_step": 174131, "epoch": 1439} {"train_loss": -36.587005615234375, "global_step": 174132, "epoch": 1439} {"train_loss": -36.00210189819336, "global_step": 174133, "epoch": 1439} {"train_loss": -38.33451843261719, "global_step": 174134, "epoch": 1439} {"train_loss": -39.125030517578125, "global_step": 174135, "epoch": 1439} {"train_loss": -38.53623580932617, "global_step": 174136, "epoch": 1439} {"train_loss": -39.789974212646484, "global_step": 174137, "epoch": 1439} {"train_loss": -38.76357650756836, "global_step": 174138, "epoch": 1439} {"train_loss": -40.62192916870117, "global_step": 174139, "epoch": 1439} {"train_loss": -39.648616790771484, "global_step": 174140, "epoch": 1439} {"train_loss": -39.5700798034668, "global_step": 174141, "epoch": 1439} {"train_loss": -38.39638137817383, "global_step": 174142, "epoch": 1439} {"train_loss": -40.1706428527832, "global_step": 174143, "epoch": 1439} {"train_loss": -39.14358139038086, "global_step": 174144, "epoch": 1439} {"train_loss": -40.15314483642578, "global_step": 174145, "epoch": 1439} {"train_loss": -40.19309616088867, "global_step": 174146, "epoch": 1439} {"train_loss": -40.24238586425781, "global_step": 174147, "epoch": 1439} {"train_loss": -39.77647018432617, "global_step": 174148, "epoch": 1439} {"train_loss": -40.055904388427734, "global_step": 174149, "epoch": 1439} {"train_loss": -39.81040954589844, "global_step": 174150, "epoch": 1439} {"train_loss": -39.98585510253906, "global_step": 174151, "epoch": 1439} {"train_loss": -39.71302032470703, "global_step": 174152, "epoch": 1439} {"train_loss": -40.610042572021484, "global_step": 174153, "epoch": 1439} {"train_loss": -39.635963439941406, "global_step": 174154, "epoch": 1439} {"train_loss": -41.02593231201172, "global_step": 174155, "epoch": 1439} {"train_loss": -40.1613883972168, "global_step": 174156, "epoch": 1439} {"train_loss": -40.97920608520508, "global_step": 174157, "epoch": 1439} {"train_loss": -40.48221969604492, "global_step": 174158, "epoch": 1439} {"train_loss": -41.466827392578125, "global_step": 174159, "epoch": 1439} {"train_loss": -40.87716293334961, "global_step": 174160, "epoch": 1439} {"train_loss": -41.141326904296875, "global_step": 174161, "epoch": 1439} {"train_loss": -41.249114990234375, "global_step": 174162, "epoch": 1439} {"train_loss": -41.06789016723633, "global_step": 174163, "epoch": 1439} {"train_loss": -41.056941986083984, "global_step": 174164, "epoch": 1439} {"train_loss": -41.43843460083008, "global_step": 174165, "epoch": 1439} {"train_loss": -41.18793869018555, "global_step": 174166, "epoch": 1439} {"train_loss": -41.2303466796875, "global_step": 174167, "epoch": 1439} {"train_loss": -41.53319549560547, "global_step": 174168, "epoch": 1439} {"train_loss": -41.74220657348633, "global_step": 174169, "epoch": 1439} {"train_loss": -41.460697174072266, "global_step": 174170, "epoch": 1439} {"train_loss": -41.55244064331055, "global_step": 174171, "epoch": 1439} {"train_loss": -41.69588088989258, "global_step": 174172, "epoch": 1439} {"train_loss": -41.186092376708984, "global_step": 174173, "epoch": 1439} {"train_loss": -41.320533752441406, "global_step": 174174, "epoch": 1439} {"train_loss": -41.82300567626953, "global_step": 174175, "epoch": 1439} {"train_loss": -42.00944137573242, "global_step": 174176, "epoch": 1439} {"train_loss": -41.58656692504883, "global_step": 174177, "epoch": 1439} {"train_loss": -40.887325286865234, "global_step": 174178, "epoch": 1439} {"train_loss": -41.126991271972656, "global_step": 174179, "epoch": 1439} {"train_loss": -41.28847885131836, "global_step": 174180, "epoch": 1439} {"train_loss": -41.55115509033203, "global_step": 174181, "epoch": 1439} {"train_loss": -41.809783935546875, "global_step": 174182, "epoch": 1439} {"train_loss": -40.92984390258789, "global_step": 174183, "epoch": 1439} {"train_loss": -41.03023910522461, "global_step": 174184, "epoch": 1439} {"train_loss": -41.93904495239258, "global_step": 174185, "epoch": 1439} {"train_loss": -41.32443618774414, "global_step": 174186, "epoch": 1439} {"train_loss": -41.54113006591797, "global_step": 174187, "epoch": 1439} {"train_loss": -41.5782470703125, "global_step": 174188, "epoch": 1439} {"train_loss": -40.68308639526367, "global_step": 174189, "epoch": 1439} {"train_loss": -41.412139892578125, "global_step": 174190, "epoch": 1439} {"train_loss": -41.41046142578125, "global_step": 174191, "epoch": 1439} {"train_loss": -39.9791259765625, "global_step": 174192, "epoch": 1439} {"train_loss": -41.861148834228516, "global_step": 174193, "epoch": 1439} {"train_loss": -41.85002517700195, "global_step": 174194, "epoch": 1439} {"train_loss": -40.78189468383789, "global_step": 174195, "epoch": 1439} {"train_loss": -41.368995666503906, "global_step": 174196, "epoch": 1439} {"train_loss": -41.729122161865234, "global_step": 174197, "epoch": 1439} {"train_loss": -41.5185661315918, "global_step": 174198, "epoch": 1439} {"train_loss": -40.985347747802734, "global_step": 174199, "epoch": 1439} {"train_loss": -41.65496063232422, "global_step": 174200, "epoch": 1439} {"train_loss": -41.03200912475586, "global_step": 174201, "epoch": 1439} {"train_loss": -40.93581008911133, "global_step": 174202, "epoch": 1439} {"train_loss": -40.09859085083008, "global_step": 174203, "epoch": 1439} {"train_loss": -37.50614547729492, "global_step": 174204, "epoch": 1439} {"train_loss": -37.095191955566406, "global_step": 174205, "epoch": 1439} {"train_loss": -35.9143180847168, "global_step": 174206, "epoch": 1439} {"train_loss": -38.60358810424805, "global_step": 174207, "epoch": 1439} {"train_loss": -40.876522064208984, "global_step": 174208, "epoch": 1439} {"train_loss": -37.16924285888672, "global_step": 174209, "epoch": 1439} {"train_loss": -33.7789192199707, "global_step": 174210, "epoch": 1439} {"train_loss": -38.89533615112305, "global_step": 174211, "epoch": 1439} {"train_loss": -40.35805892944336, "global_step": 174212, "epoch": 1439} {"train_loss": -39.229400634765625, "global_step": 174213, "epoch": 1439} {"train_loss": -40.15088653564453, "global_step": 174214, "epoch": 1439} {"train_loss": -40.87118148803711, "global_step": 174215, "epoch": 1439} {"train_loss": -41.339534759521484, "global_step": 174216, "epoch": 1439} {"train_loss": -40.86518478393555, "global_step": 174217, "epoch": 1439} {"train_loss": -39.97850036621094, "global_step": 174218, "epoch": 1439} {"train_loss": -41.040897369384766, "global_step": 174219, "epoch": 1439} {"train_loss": -40.20790100097656, "global_step": 174220, "epoch": 1439} {"train_loss": -40.697959899902344, "global_step": 174221, "epoch": 1439} {"train_loss": -41.4138298034668, "global_step": 174222, "epoch": 1439} {"train_loss": -39.47700119018555, "global_step": 174223, "epoch": 1439} {"train_loss": -40.94601058959961, "global_step": 174224, "epoch": 1439} {"train_loss": -40.78535079956055, "global_step": 174225, "epoch": 1439} {"train_loss": -40.34510803222656, "global_step": 174226, "epoch": 1439} {"train_loss": -40.382080078125, "global_step": 174227, "epoch": 1439} {"train_loss": -39.964881896972656, "global_step": 174228, "epoch": 1439} {"train_loss": -41.02862548828125, "global_step": 174229, "epoch": 1439} {"train_loss": -40.4395637512207, "global_step": 174230, "epoch": 1439} {"train_loss": -40.37534713745117, "global_step": 174231, "epoch": 1439} {"train_loss": -41.164085388183594, "global_step": 174232, "epoch": 1439} {"train_loss": -40.415321350097656, "global_step": 174233, "epoch": 1439} {"train_loss": -39.94939041137695, "global_step": 174234, "epoch": 1439} {"train_loss": -41.056427001953125, "global_step": 174235, "epoch": 1439} {"train_loss": -39.9456787109375, "global_step": 174236, "epoch": 1439} {"train_loss": -40.12360382080078, "global_step": 174237, "epoch": 1439} {"train_loss": -41.18874740600586, "global_step": 174238, "epoch": 1439} {"train_loss": -40.0882042498628, "global_step": 174239, "epoch": 1439, "val_loss": 2634300.25} {"train_loss": -41.3834342956543, "global_step": 174240, "epoch": 1440} {"train_loss": -40.78779220581055, "global_step": 174241, "epoch": 1440} {"train_loss": -41.161319732666016, "global_step": 174242, "epoch": 1440} {"train_loss": -41.68086242675781, "global_step": 174243, "epoch": 1440} {"train_loss": -40.95969009399414, "global_step": 174244, "epoch": 1440} {"train_loss": -41.80521774291992, "global_step": 174245, "epoch": 1440} {"train_loss": -40.9318962097168, "global_step": 174246, "epoch": 1440} {"train_loss": -41.0218620300293, "global_step": 174247, "epoch": 1440} {"train_loss": -41.35354995727539, "global_step": 174248, "epoch": 1440} {"train_loss": -41.76673126220703, "global_step": 174249, "epoch": 1440} {"train_loss": -41.173614501953125, "global_step": 174250, "epoch": 1440} {"train_loss": -40.93413162231445, "global_step": 174251, "epoch": 1440} {"train_loss": -41.76249313354492, "global_step": 174252, "epoch": 1440} {"train_loss": -41.29884338378906, "global_step": 174253, "epoch": 1440} {"train_loss": -41.43901443481445, "global_step": 174254, "epoch": 1440} {"train_loss": -41.619232177734375, "global_step": 174255, "epoch": 1440} {"train_loss": -41.52058792114258, "global_step": 174256, "epoch": 1440} {"train_loss": -41.24751663208008, "global_step": 174257, "epoch": 1440} {"train_loss": -41.785804748535156, "global_step": 174258, "epoch": 1440} {"train_loss": -41.512245178222656, "global_step": 174259, "epoch": 1440} {"train_loss": -42.12960433959961, "global_step": 174260, "epoch": 1440} {"train_loss": -41.749778747558594, "global_step": 174261, "epoch": 1440} {"train_loss": -41.84804916381836, "global_step": 174262, "epoch": 1440} {"train_loss": -41.607337951660156, "global_step": 174263, "epoch": 1440} {"train_loss": -41.30575180053711, "global_step": 174264, "epoch": 1440} {"train_loss": -42.04991912841797, "global_step": 174265, "epoch": 1440} {"train_loss": -40.946937561035156, "global_step": 174266, "epoch": 1440} {"train_loss": -42.17970657348633, "global_step": 174267, "epoch": 1440} {"train_loss": -41.89693069458008, "global_step": 174268, "epoch": 1440} {"train_loss": -41.36629867553711, "global_step": 174269, "epoch": 1440} {"train_loss": -41.746131896972656, "global_step": 174270, "epoch": 1440} {"train_loss": -41.80427169799805, "global_step": 174271, "epoch": 1440} {"train_loss": -41.875526428222656, "global_step": 174272, "epoch": 1440} {"train_loss": -41.8018913269043, "global_step": 174273, "epoch": 1440} {"train_loss": -41.67744445800781, "global_step": 174274, "epoch": 1440} {"train_loss": -41.767269134521484, "global_step": 174275, "epoch": 1440} {"train_loss": -41.896026611328125, "global_step": 174276, "epoch": 1440} {"train_loss": -41.689422607421875, "global_step": 174277, "epoch": 1440} {"train_loss": -41.934043884277344, "global_step": 174278, "epoch": 1440} {"train_loss": -41.78972625732422, "global_step": 174279, "epoch": 1440} {"train_loss": -41.97933578491211, "global_step": 174280, "epoch": 1440} {"train_loss": -41.35369873046875, "global_step": 174281, "epoch": 1440} {"train_loss": -41.57169723510742, "global_step": 174282, "epoch": 1440} {"train_loss": -41.41252899169922, "global_step": 174283, "epoch": 1440} {"train_loss": -41.44675827026367, "global_step": 174284, "epoch": 1440} {"train_loss": -42.10913848876953, "global_step": 174285, "epoch": 1440} {"train_loss": -40.65120315551758, "global_step": 174286, "epoch": 1440} {"train_loss": -39.69282150268555, "global_step": 174287, "epoch": 1440} {"train_loss": -40.14678192138672, "global_step": 174288, "epoch": 1440} {"train_loss": -40.06068420410156, "global_step": 174289, "epoch": 1440} {"train_loss": -41.80674743652344, "global_step": 174290, "epoch": 1440} {"train_loss": -39.78358840942383, "global_step": 174291, "epoch": 1440} {"train_loss": -39.415428161621094, "global_step": 174292, "epoch": 1440} {"train_loss": -37.680049896240234, "global_step": 174293, "epoch": 1440} {"train_loss": -37.35566329956055, "global_step": 174294, "epoch": 1440} {"train_loss": -38.64594650268555, "global_step": 174295, "epoch": 1440} {"train_loss": -37.43376159667969, "global_step": 174296, "epoch": 1440} {"train_loss": -39.791500091552734, "global_step": 174297, "epoch": 1440} {"train_loss": -41.02094650268555, "global_step": 174298, "epoch": 1440} {"train_loss": -40.11322021484375, "global_step": 174299, "epoch": 1440} {"train_loss": -39.2025146484375, "global_step": 174300, "epoch": 1440} {"train_loss": -40.41215133666992, "global_step": 174301, "epoch": 1440} {"train_loss": -40.64934158325195, "global_step": 174302, "epoch": 1440} {"train_loss": -40.210269927978516, "global_step": 174303, "epoch": 1440} {"train_loss": -40.1177864074707, "global_step": 174304, "epoch": 1440} {"train_loss": -40.29206085205078, "global_step": 174305, "epoch": 1440} {"train_loss": -40.26275634765625, "global_step": 174306, "epoch": 1440} {"train_loss": -39.850791931152344, "global_step": 174307, "epoch": 1440} {"train_loss": -39.67377471923828, "global_step": 174308, "epoch": 1440} {"train_loss": -39.38188552856445, "global_step": 174309, "epoch": 1440} {"train_loss": -39.35709762573242, "global_step": 174310, "epoch": 1440} {"train_loss": -39.46620178222656, "global_step": 174311, "epoch": 1440} {"train_loss": -39.178035736083984, "global_step": 174312, "epoch": 1440} {"train_loss": -39.771881103515625, "global_step": 174313, "epoch": 1440} {"train_loss": -40.420860290527344, "global_step": 174314, "epoch": 1440} {"train_loss": -39.436885833740234, "global_step": 174315, "epoch": 1440} {"train_loss": -40.94804763793945, "global_step": 174316, "epoch": 1440} {"train_loss": -40.13530349731445, "global_step": 174317, "epoch": 1440} {"train_loss": -40.607791900634766, "global_step": 174318, "epoch": 1440} {"train_loss": -40.85159683227539, "global_step": 174319, "epoch": 1440} {"train_loss": -41.37135314941406, "global_step": 174320, "epoch": 1440} {"train_loss": -41.233680725097656, "global_step": 174321, "epoch": 1440} {"train_loss": -40.621517181396484, "global_step": 174322, "epoch": 1440} {"train_loss": -40.798553466796875, "global_step": 174323, "epoch": 1440} {"train_loss": -40.65424728393555, "global_step": 174324, "epoch": 1440} {"train_loss": -41.050018310546875, "global_step": 174325, "epoch": 1440} {"train_loss": -41.22600555419922, "global_step": 174326, "epoch": 1440} {"train_loss": -41.266845703125, "global_step": 174327, "epoch": 1440} {"train_loss": -41.357154846191406, "global_step": 174328, "epoch": 1440} {"train_loss": -41.16630172729492, "global_step": 174329, "epoch": 1440} {"train_loss": -41.48704147338867, "global_step": 174330, "epoch": 1440} {"train_loss": -41.402008056640625, "global_step": 174331, "epoch": 1440} {"train_loss": -41.930328369140625, "global_step": 174332, "epoch": 1440} {"train_loss": -41.30941390991211, "global_step": 174333, "epoch": 1440} {"train_loss": -41.13241958618164, "global_step": 174334, "epoch": 1440} {"train_loss": -41.68976974487305, "global_step": 174335, "epoch": 1440} {"train_loss": -40.7533073425293, "global_step": 174336, "epoch": 1440} {"train_loss": -41.86513900756836, "global_step": 174337, "epoch": 1440} {"train_loss": -41.34064483642578, "global_step": 174338, "epoch": 1440} {"train_loss": -41.375518798828125, "global_step": 174339, "epoch": 1440} {"train_loss": -41.2266845703125, "global_step": 174340, "epoch": 1440} {"train_loss": -41.3912353515625, "global_step": 174341, "epoch": 1440} {"train_loss": -41.086238861083984, "global_step": 174342, "epoch": 1440} {"train_loss": -41.68485641479492, "global_step": 174343, "epoch": 1440} {"train_loss": -41.301265716552734, "global_step": 174344, "epoch": 1440} {"train_loss": -41.21613693237305, "global_step": 174345, "epoch": 1440} {"train_loss": -41.90909957885742, "global_step": 174346, "epoch": 1440} {"train_loss": -41.41701126098633, "global_step": 174347, "epoch": 1440} {"train_loss": -42.01987838745117, "global_step": 174348, "epoch": 1440} {"train_loss": -41.964229583740234, "global_step": 174349, "epoch": 1440} {"train_loss": -42.283287048339844, "global_step": 174350, "epoch": 1440} {"train_loss": -41.626522064208984, "global_step": 174351, "epoch": 1440} {"train_loss": -42.05043411254883, "global_step": 174352, "epoch": 1440} {"train_loss": -41.920658111572266, "global_step": 174353, "epoch": 1440} {"train_loss": -41.9381217956543, "global_step": 174354, "epoch": 1440} {"train_loss": -41.77165603637695, "global_step": 174355, "epoch": 1440} {"train_loss": -41.8208122253418, "global_step": 174356, "epoch": 1440} {"train_loss": -41.80542755126953, "global_step": 174357, "epoch": 1440} {"train_loss": -42.12422561645508, "global_step": 174358, "epoch": 1440} {"train_loss": -41.94978713989258, "global_step": 174359, "epoch": 1440} {"train_loss": -41.05247377758184, "global_step": 174360, "epoch": 1440, "val_loss": 2612353.75} {"train_loss": -42.376914978027344, "global_step": 174361, "epoch": 1441} {"train_loss": -41.97382736206055, "global_step": 174362, "epoch": 1441} {"train_loss": -42.06113815307617, "global_step": 174363, "epoch": 1441} {"train_loss": -41.606719970703125, "global_step": 174364, "epoch": 1441} {"train_loss": -41.053504943847656, "global_step": 174365, "epoch": 1441} {"train_loss": -42.07047653198242, "global_step": 174366, "epoch": 1441} {"train_loss": -41.70985794067383, "global_step": 174367, "epoch": 1441} {"train_loss": -41.70208740234375, "global_step": 174368, "epoch": 1441} {"train_loss": -41.792728424072266, "global_step": 174369, "epoch": 1441} {"train_loss": -41.756587982177734, "global_step": 174370, "epoch": 1441} {"train_loss": -41.86378860473633, "global_step": 174371, "epoch": 1441} {"train_loss": -42.17441940307617, "global_step": 174372, "epoch": 1441} {"train_loss": -41.68886184692383, "global_step": 174373, "epoch": 1441} {"train_loss": -41.8987922668457, "global_step": 174374, "epoch": 1441} {"train_loss": -42.05791091918945, "global_step": 174375, "epoch": 1441} {"train_loss": -41.69989013671875, "global_step": 174376, "epoch": 1441} {"train_loss": -42.43467712402344, "global_step": 174377, "epoch": 1441} {"train_loss": -42.101524353027344, "global_step": 174378, "epoch": 1441} {"train_loss": -42.4068717956543, "global_step": 174379, "epoch": 1441} {"train_loss": -42.4202995300293, "global_step": 174380, "epoch": 1441} {"train_loss": -42.02434539794922, "global_step": 174381, "epoch": 1441} {"train_loss": -42.76402282714844, "global_step": 174382, "epoch": 1441} {"train_loss": -42.342838287353516, "global_step": 174383, "epoch": 1441} {"train_loss": -42.25118637084961, "global_step": 174384, "epoch": 1441} {"train_loss": -42.3184700012207, "global_step": 174385, "epoch": 1441} {"train_loss": -42.35110855102539, "global_step": 174386, "epoch": 1441} {"train_loss": -42.45302200317383, "global_step": 174387, "epoch": 1441} {"train_loss": -42.03761672973633, "global_step": 174388, "epoch": 1441} {"train_loss": -42.41004180908203, "global_step": 174389, "epoch": 1441} {"train_loss": -42.21110916137695, "global_step": 174390, "epoch": 1441} {"train_loss": -40.4730339050293, "global_step": 174391, "epoch": 1441} {"train_loss": -38.582881927490234, "global_step": 174392, "epoch": 1441} {"train_loss": -32.83195877075195, "global_step": 174393, "epoch": 1441} {"train_loss": -31.66814613342285, "global_step": 174394, "epoch": 1441} {"train_loss": -34.16385269165039, "global_step": 174395, "epoch": 1441} {"train_loss": -40.29880905151367, "global_step": 174396, "epoch": 1441} {"train_loss": -41.49124526977539, "global_step": 174397, "epoch": 1441} {"train_loss": -40.14133834838867, "global_step": 174398, "epoch": 1441} {"train_loss": -40.001651763916016, "global_step": 174399, "epoch": 1441} {"train_loss": -40.74293899536133, "global_step": 174400, "epoch": 1441} {"train_loss": -41.41644287109375, "global_step": 174401, "epoch": 1441} {"train_loss": -39.3471794128418, "global_step": 174402, "epoch": 1441} {"train_loss": -40.1213493347168, "global_step": 174403, "epoch": 1441} {"train_loss": -41.50808334350586, "global_step": 174404, "epoch": 1441} {"train_loss": -39.701698303222656, "global_step": 174405, "epoch": 1441} {"train_loss": -41.07123565673828, "global_step": 174406, "epoch": 1441} {"train_loss": -41.01713943481445, "global_step": 174407, "epoch": 1441} {"train_loss": -39.70823287963867, "global_step": 174408, "epoch": 1441} {"train_loss": -41.583919525146484, "global_step": 174409, "epoch": 1441} {"train_loss": -40.713191986083984, "global_step": 174410, "epoch": 1441} {"train_loss": -40.26823806762695, "global_step": 174411, "epoch": 1441} {"train_loss": -41.532379150390625, "global_step": 174412, "epoch": 1441} {"train_loss": -40.855506896972656, "global_step": 174413, "epoch": 1441} {"train_loss": -41.300636291503906, "global_step": 174414, "epoch": 1441} {"train_loss": -40.836666107177734, "global_step": 174415, "epoch": 1441} {"train_loss": -41.700740814208984, "global_step": 174416, "epoch": 1441} {"train_loss": -40.129676818847656, "global_step": 174417, "epoch": 1441} {"train_loss": -41.8635368347168, "global_step": 174418, "epoch": 1441} {"train_loss": -40.69369125366211, "global_step": 174419, "epoch": 1441} {"train_loss": -41.430477142333984, "global_step": 174420, "epoch": 1441} {"train_loss": -40.99563217163086, "global_step": 174421, "epoch": 1441} {"train_loss": -41.15754699707031, "global_step": 174422, "epoch": 1441} {"train_loss": -40.931373596191406, "global_step": 174423, "epoch": 1441} {"train_loss": -40.88004684448242, "global_step": 174424, "epoch": 1441} {"train_loss": -41.413116455078125, "global_step": 174425, "epoch": 1441} {"train_loss": -41.23685836791992, "global_step": 174426, "epoch": 1441} {"train_loss": -42.1106071472168, "global_step": 174427, "epoch": 1441} {"train_loss": -42.01332092285156, "global_step": 174428, "epoch": 1441} {"train_loss": -41.34082794189453, "global_step": 174429, "epoch": 1441} {"train_loss": -41.68449020385742, "global_step": 174430, "epoch": 1441} {"train_loss": -41.8944206237793, "global_step": 174431, "epoch": 1441} {"train_loss": -41.53125, "global_step": 174432, "epoch": 1441} {"train_loss": -42.18247604370117, "global_step": 174433, "epoch": 1441} {"train_loss": -41.694984436035156, "global_step": 174434, "epoch": 1441} {"train_loss": -41.872901916503906, "global_step": 174435, "epoch": 1441} {"train_loss": -42.15440368652344, "global_step": 174436, "epoch": 1441} {"train_loss": -42.160499572753906, "global_step": 174437, "epoch": 1441} {"train_loss": -41.39630889892578, "global_step": 174438, "epoch": 1441} {"train_loss": -41.91859817504883, "global_step": 174439, "epoch": 1441} {"train_loss": -41.18590545654297, "global_step": 174440, "epoch": 1441} {"train_loss": -41.776824951171875, "global_step": 174441, "epoch": 1441} {"train_loss": -42.3513298034668, "global_step": 174442, "epoch": 1441} {"train_loss": -41.220298767089844, "global_step": 174443, "epoch": 1441} {"train_loss": -40.54457473754883, "global_step": 174444, "epoch": 1441} {"train_loss": -41.048614501953125, "global_step": 174445, "epoch": 1441} {"train_loss": -42.44837188720703, "global_step": 174446, "epoch": 1441} {"train_loss": -41.557159423828125, "global_step": 174447, "epoch": 1441} {"train_loss": -41.142601013183594, "global_step": 174448, "epoch": 1441} {"train_loss": -41.553138732910156, "global_step": 174449, "epoch": 1441} {"train_loss": -41.51045608520508, "global_step": 174450, "epoch": 1441} {"train_loss": -41.61045455932617, "global_step": 174451, "epoch": 1441} {"train_loss": -41.468868255615234, "global_step": 174452, "epoch": 1441} {"train_loss": -42.103370666503906, "global_step": 174453, "epoch": 1441} {"train_loss": -41.10064697265625, "global_step": 174454, "epoch": 1441} {"train_loss": -41.47480392456055, "global_step": 174455, "epoch": 1441} {"train_loss": -41.8316764831543, "global_step": 174456, "epoch": 1441} {"train_loss": -40.022037506103516, "global_step": 174457, "epoch": 1441} {"train_loss": -40.91465759277344, "global_step": 174458, "epoch": 1441} {"train_loss": -41.221435546875, "global_step": 174459, "epoch": 1441} {"train_loss": -41.65688705444336, "global_step": 174460, "epoch": 1441} {"train_loss": -41.258541107177734, "global_step": 174461, "epoch": 1441} {"train_loss": -41.013851165771484, "global_step": 174462, "epoch": 1441} {"train_loss": -40.74441909790039, "global_step": 174463, "epoch": 1441} {"train_loss": -39.634613037109375, "global_step": 174464, "epoch": 1441} {"train_loss": -39.645538330078125, "global_step": 174465, "epoch": 1441} {"train_loss": -41.881954193115234, "global_step": 174466, "epoch": 1441} {"train_loss": -41.53290557861328, "global_step": 174467, "epoch": 1441} {"train_loss": -39.10200500488281, "global_step": 174468, "epoch": 1441} {"train_loss": -38.777889251708984, "global_step": 174469, "epoch": 1441} {"train_loss": -40.749752044677734, "global_step": 174470, "epoch": 1441} {"train_loss": -41.32182693481445, "global_step": 174471, "epoch": 1441} {"train_loss": -39.63501739501953, "global_step": 174472, "epoch": 1441} {"train_loss": -40.515316009521484, "global_step": 174473, "epoch": 1441} {"train_loss": -41.2111930847168, "global_step": 174474, "epoch": 1441} {"train_loss": -40.10148239135742, "global_step": 174475, "epoch": 1441} {"train_loss": -40.29627990722656, "global_step": 174476, "epoch": 1441} {"train_loss": -41.04769515991211, "global_step": 174477, "epoch": 1441} {"train_loss": -40.382564544677734, "global_step": 174478, "epoch": 1441} {"train_loss": -41.397090911865234, "global_step": 174479, "epoch": 1441} {"train_loss": -40.95286178588867, "global_step": 174480, "epoch": 1441} {"train_loss": -41.091029821348585, "global_step": 174481, "epoch": 1441, "val_loss": 2595580.0} {"train_loss": -41.304420471191406, "global_step": 174482, "epoch": 1442} {"train_loss": -41.37187957763672, "global_step": 174483, "epoch": 1442} {"train_loss": -41.51494598388672, "global_step": 174484, "epoch": 1442} {"train_loss": -41.835079193115234, "global_step": 174485, "epoch": 1442} {"train_loss": -41.373165130615234, "global_step": 174486, "epoch": 1442} {"train_loss": -42.20668029785156, "global_step": 174487, "epoch": 1442} {"train_loss": -41.520320892333984, "global_step": 174488, "epoch": 1442} {"train_loss": -41.01736068725586, "global_step": 174489, "epoch": 1442} {"train_loss": -41.78236770629883, "global_step": 174490, "epoch": 1442} {"train_loss": -41.71066665649414, "global_step": 174491, "epoch": 1442} {"train_loss": -41.92184066772461, "global_step": 174492, "epoch": 1442} {"train_loss": -41.978939056396484, "global_step": 174493, "epoch": 1442} {"train_loss": -41.675533294677734, "global_step": 174494, "epoch": 1442} {"train_loss": -41.389366149902344, "global_step": 174495, "epoch": 1442} {"train_loss": -42.28248977661133, "global_step": 174496, "epoch": 1442} {"train_loss": -41.899044036865234, "global_step": 174497, "epoch": 1442} {"train_loss": -41.51042175292969, "global_step": 174498, "epoch": 1442} {"train_loss": -41.73591613769531, "global_step": 174499, "epoch": 1442} {"train_loss": -41.9344596862793, "global_step": 174500, "epoch": 1442} {"train_loss": -41.77385330200195, "global_step": 174501, "epoch": 1442} {"train_loss": -41.167415618896484, "global_step": 174502, "epoch": 1442} {"train_loss": -40.28811264038086, "global_step": 174503, "epoch": 1442} {"train_loss": -40.13801193237305, "global_step": 174504, "epoch": 1442} {"train_loss": -41.134822845458984, "global_step": 174505, "epoch": 1442} {"train_loss": -40.53742599487305, "global_step": 174506, "epoch": 1442} {"train_loss": -41.423866271972656, "global_step": 174507, "epoch": 1442} {"train_loss": -40.50261306762695, "global_step": 174508, "epoch": 1442} {"train_loss": -41.08248519897461, "global_step": 174509, "epoch": 1442} {"train_loss": -40.59819412231445, "global_step": 174510, "epoch": 1442} {"train_loss": -41.00083541870117, "global_step": 174511, "epoch": 1442} {"train_loss": -40.01704406738281, "global_step": 174512, "epoch": 1442} {"train_loss": -39.812904357910156, "global_step": 174513, "epoch": 1442} {"train_loss": -40.93168258666992, "global_step": 174514, "epoch": 1442} {"train_loss": -37.680511474609375, "global_step": 174515, "epoch": 1442} {"train_loss": -41.592166900634766, "global_step": 174516, "epoch": 1442} {"train_loss": -40.53580856323242, "global_step": 174517, "epoch": 1442} {"train_loss": -40.901485443115234, "global_step": 174518, "epoch": 1442} {"train_loss": -39.295326232910156, "global_step": 174519, "epoch": 1442} {"train_loss": -41.01310729980469, "global_step": 174520, "epoch": 1442} {"train_loss": -41.57042694091797, "global_step": 174521, "epoch": 1442} {"train_loss": -38.18767166137695, "global_step": 174522, "epoch": 1442} {"train_loss": -39.42036819458008, "global_step": 174523, "epoch": 1442} {"train_loss": -40.973445892333984, "global_step": 174524, "epoch": 1442} {"train_loss": -41.01864242553711, "global_step": 174525, "epoch": 1442} {"train_loss": -37.275733947753906, "global_step": 174526, "epoch": 1442} {"train_loss": -40.767311096191406, "global_step": 174527, "epoch": 1442} {"train_loss": -40.25532531738281, "global_step": 174528, "epoch": 1442} {"train_loss": -38.22922897338867, "global_step": 174529, "epoch": 1442} {"train_loss": -41.20306396484375, "global_step": 174530, "epoch": 1442} {"train_loss": -40.017635345458984, "global_step": 174531, "epoch": 1442} {"train_loss": -40.89613342285156, "global_step": 174532, "epoch": 1442} {"train_loss": -41.06846237182617, "global_step": 174533, "epoch": 1442} {"train_loss": -40.51106262207031, "global_step": 174534, "epoch": 1442} {"train_loss": -41.49568557739258, "global_step": 174535, "epoch": 1442} {"train_loss": -41.15840530395508, "global_step": 174536, "epoch": 1442} {"train_loss": -40.162811279296875, "global_step": 174537, "epoch": 1442} {"train_loss": -41.37331771850586, "global_step": 174538, "epoch": 1442} {"train_loss": -41.31533432006836, "global_step": 174539, "epoch": 1442} {"train_loss": -41.25557327270508, "global_step": 174540, "epoch": 1442} {"train_loss": -41.4364128112793, "global_step": 174541, "epoch": 1442} {"train_loss": -41.75299835205078, "global_step": 174542, "epoch": 1442} {"train_loss": -41.45783996582031, "global_step": 174543, "epoch": 1442} {"train_loss": -41.60243606567383, "global_step": 174544, "epoch": 1442} {"train_loss": -41.265968322753906, "global_step": 174545, "epoch": 1442} {"train_loss": -41.50114440917969, "global_step": 174546, "epoch": 1442} {"train_loss": -42.048606872558594, "global_step": 174547, "epoch": 1442} {"train_loss": -41.521568298339844, "global_step": 174548, "epoch": 1442} {"train_loss": -41.43259811401367, "global_step": 174549, "epoch": 1442} {"train_loss": -41.017826080322266, "global_step": 174550, "epoch": 1442} {"train_loss": -41.15565872192383, "global_step": 174551, "epoch": 1442} {"train_loss": -41.0667839050293, "global_step": 174552, "epoch": 1442} {"train_loss": -41.36481857299805, "global_step": 174553, "epoch": 1442} {"train_loss": -41.161312103271484, "global_step": 174554, "epoch": 1442} {"train_loss": -41.0745849609375, "global_step": 174555, "epoch": 1442} {"train_loss": -41.858577728271484, "global_step": 174556, "epoch": 1442} {"train_loss": -40.37871551513672, "global_step": 174557, "epoch": 1442} {"train_loss": -40.40324401855469, "global_step": 174558, "epoch": 1442} {"train_loss": -41.567562103271484, "global_step": 174559, "epoch": 1442} {"train_loss": -42.36284255981445, "global_step": 174560, "epoch": 1442} {"train_loss": -41.8373908996582, "global_step": 174561, "epoch": 1442} {"train_loss": -41.18292999267578, "global_step": 174562, "epoch": 1442} {"train_loss": -41.16376876831055, "global_step": 174563, "epoch": 1442} {"train_loss": -41.55939865112305, "global_step": 174564, "epoch": 1442} {"train_loss": -42.489418029785156, "global_step": 174565, "epoch": 1442} {"train_loss": -41.93753433227539, "global_step": 174566, "epoch": 1442} {"train_loss": -41.28697967529297, "global_step": 174567, "epoch": 1442} {"train_loss": -40.973079681396484, "global_step": 174568, "epoch": 1442} {"train_loss": -41.466766357421875, "global_step": 174569, "epoch": 1442} {"train_loss": -41.47636032104492, "global_step": 174570, "epoch": 1442} {"train_loss": -42.059730529785156, "global_step": 174571, "epoch": 1442} {"train_loss": -41.55451202392578, "global_step": 174572, "epoch": 1442} {"train_loss": -40.71382522583008, "global_step": 174573, "epoch": 1442} {"train_loss": -40.586830139160156, "global_step": 174574, "epoch": 1442} {"train_loss": -41.6566276550293, "global_step": 174575, "epoch": 1442} {"train_loss": -40.758514404296875, "global_step": 174576, "epoch": 1442} {"train_loss": -40.88981246948242, "global_step": 174577, "epoch": 1442} {"train_loss": -41.655967712402344, "global_step": 174578, "epoch": 1442} {"train_loss": -40.85324478149414, "global_step": 174579, "epoch": 1442} {"train_loss": -41.56416702270508, "global_step": 174580, "epoch": 1442} {"train_loss": -41.090023040771484, "global_step": 174581, "epoch": 1442} {"train_loss": -40.593658447265625, "global_step": 174582, "epoch": 1442} {"train_loss": -41.91636276245117, "global_step": 174583, "epoch": 1442} {"train_loss": -40.284149169921875, "global_step": 174584, "epoch": 1442} {"train_loss": -39.98698806762695, "global_step": 174585, "epoch": 1442} {"train_loss": -41.222652435302734, "global_step": 174586, "epoch": 1442} {"train_loss": -40.27909469604492, "global_step": 174587, "epoch": 1442} {"train_loss": -41.38966751098633, "global_step": 174588, "epoch": 1442} {"train_loss": -41.891021728515625, "global_step": 174589, "epoch": 1442} {"train_loss": -42.14470291137695, "global_step": 174590, "epoch": 1442} {"train_loss": -41.369083404541016, "global_step": 174591, "epoch": 1442} {"train_loss": -41.128944396972656, "global_step": 174592, "epoch": 1442} {"train_loss": -41.0702018737793, "global_step": 174593, "epoch": 1442} {"train_loss": -40.57452392578125, "global_step": 174594, "epoch": 1442} {"train_loss": -41.99264144897461, "global_step": 174595, "epoch": 1442} {"train_loss": -41.507362365722656, "global_step": 174596, "epoch": 1442} {"train_loss": -41.43067932128906, "global_step": 174597, "epoch": 1442} {"train_loss": -41.11825180053711, "global_step": 174598, "epoch": 1442} {"train_loss": -40.9656867980957, "global_step": 174599, "epoch": 1442} {"train_loss": -41.13439178466797, "global_step": 174600, "epoch": 1442} {"train_loss": -42.136104583740234, "global_step": 174601, "epoch": 1442} {"train_loss": -41.09641319464061, "global_step": 174602, "epoch": 1442, "val_loss": 2669917.25} {"train_loss": -38.55088424682617, "global_step": 174603, "epoch": 1443} {"train_loss": -39.07719039916992, "global_step": 174604, "epoch": 1443} {"train_loss": -41.18598175048828, "global_step": 174605, "epoch": 1443} {"train_loss": -40.14900207519531, "global_step": 174606, "epoch": 1443} {"train_loss": -38.96312713623047, "global_step": 174607, "epoch": 1443} {"train_loss": -39.71176528930664, "global_step": 174608, "epoch": 1443} {"train_loss": -40.846893310546875, "global_step": 174609, "epoch": 1443} {"train_loss": -39.36832809448242, "global_step": 174610, "epoch": 1443} {"train_loss": -40.375404357910156, "global_step": 174611, "epoch": 1443} {"train_loss": -40.68162536621094, "global_step": 174612, "epoch": 1443} {"train_loss": -39.080055236816406, "global_step": 174613, "epoch": 1443} {"train_loss": -38.82881546020508, "global_step": 174614, "epoch": 1443} {"train_loss": -40.77743911743164, "global_step": 174615, "epoch": 1443} {"train_loss": -41.594173431396484, "global_step": 174616, "epoch": 1443} {"train_loss": -40.984920501708984, "global_step": 174617, "epoch": 1443} {"train_loss": -41.057945251464844, "global_step": 174618, "epoch": 1443} {"train_loss": -41.76225662231445, "global_step": 174619, "epoch": 1443} {"train_loss": -41.38507843017578, "global_step": 174620, "epoch": 1443} {"train_loss": -41.26543426513672, "global_step": 174621, "epoch": 1443} {"train_loss": -41.00185775756836, "global_step": 174622, "epoch": 1443} {"train_loss": -41.35831069946289, "global_step": 174623, "epoch": 1443} {"train_loss": -41.375770568847656, "global_step": 174624, "epoch": 1443} {"train_loss": -41.88343048095703, "global_step": 174625, "epoch": 1443} {"train_loss": -41.897945404052734, "global_step": 174626, "epoch": 1443} {"train_loss": -41.261898040771484, "global_step": 174627, "epoch": 1443} {"train_loss": -41.5169563293457, "global_step": 174628, "epoch": 1443} {"train_loss": -41.63582992553711, "global_step": 174629, "epoch": 1443} {"train_loss": -42.216278076171875, "global_step": 174630, "epoch": 1443} {"train_loss": -41.476627349853516, "global_step": 174631, "epoch": 1443} {"train_loss": -41.82808303833008, "global_step": 174632, "epoch": 1443} {"train_loss": -40.906707763671875, "global_step": 174633, "epoch": 1443} {"train_loss": -38.6392822265625, "global_step": 174634, "epoch": 1443} {"train_loss": -37.73137664794922, "global_step": 174635, "epoch": 1443} {"train_loss": -41.645198822021484, "global_step": 174636, "epoch": 1443} {"train_loss": -37.55708694458008, "global_step": 174637, "epoch": 1443} {"train_loss": -38.946407318115234, "global_step": 174638, "epoch": 1443} {"train_loss": -40.42416763305664, "global_step": 174639, "epoch": 1443} {"train_loss": -39.230621337890625, "global_step": 174640, "epoch": 1443} {"train_loss": -38.983238220214844, "global_step": 174641, "epoch": 1443} {"train_loss": -40.00361251831055, "global_step": 174642, "epoch": 1443} {"train_loss": -39.31010437011719, "global_step": 174643, "epoch": 1443} {"train_loss": -41.95745086669922, "global_step": 174644, "epoch": 1443} {"train_loss": -38.86167907714844, "global_step": 174645, "epoch": 1443} {"train_loss": -41.12110137939453, "global_step": 174646, "epoch": 1443} {"train_loss": -41.05442428588867, "global_step": 174647, "epoch": 1443} {"train_loss": -41.254032135009766, "global_step": 174648, "epoch": 1443} {"train_loss": -40.20742416381836, "global_step": 174649, "epoch": 1443} {"train_loss": -41.52384948730469, "global_step": 174650, "epoch": 1443} {"train_loss": -39.564971923828125, "global_step": 174651, "epoch": 1443} {"train_loss": -42.1296501159668, "global_step": 174652, "epoch": 1443} {"train_loss": -41.257232666015625, "global_step": 174653, "epoch": 1443} {"train_loss": -41.078514099121094, "global_step": 174654, "epoch": 1443} {"train_loss": -41.716529846191406, "global_step": 174655, "epoch": 1443} {"train_loss": -41.691165924072266, "global_step": 174656, "epoch": 1443} {"train_loss": -41.334259033203125, "global_step": 174657, "epoch": 1443} {"train_loss": -41.517555236816406, "global_step": 174658, "epoch": 1443} {"train_loss": -41.14037322998047, "global_step": 174659, "epoch": 1443} {"train_loss": -42.12461853027344, "global_step": 174660, "epoch": 1443} {"train_loss": -41.27880859375, "global_step": 174661, "epoch": 1443} {"train_loss": -42.2246208190918, "global_step": 174662, "epoch": 1443} {"train_loss": -41.4213752746582, "global_step": 174663, "epoch": 1443} {"train_loss": -40.94655990600586, "global_step": 174664, "epoch": 1443} {"train_loss": -41.66768264770508, "global_step": 174665, "epoch": 1443} {"train_loss": -39.272674560546875, "global_step": 174666, "epoch": 1443} {"train_loss": -41.65845489501953, "global_step": 174667, "epoch": 1443} {"train_loss": -41.215179443359375, "global_step": 174668, "epoch": 1443} {"train_loss": -41.09403610229492, "global_step": 174669, "epoch": 1443} {"train_loss": -41.4713134765625, "global_step": 174670, "epoch": 1443} {"train_loss": -41.49769592285156, "global_step": 174671, "epoch": 1443} {"train_loss": -41.2117805480957, "global_step": 174672, "epoch": 1443} {"train_loss": -41.201995849609375, "global_step": 174673, "epoch": 1443} {"train_loss": -41.734962463378906, "global_step": 174674, "epoch": 1443} {"train_loss": -39.5220832824707, "global_step": 174675, "epoch": 1443} {"train_loss": -41.10630798339844, "global_step": 174676, "epoch": 1443} {"train_loss": -40.87298583984375, "global_step": 174677, "epoch": 1443} {"train_loss": -39.96895217895508, "global_step": 174678, "epoch": 1443} {"train_loss": -41.55221176147461, "global_step": 174679, "epoch": 1443} {"train_loss": -40.935585021972656, "global_step": 174680, "epoch": 1443} {"train_loss": -40.69992446899414, "global_step": 174681, "epoch": 1443} {"train_loss": -42.3781623840332, "global_step": 174682, "epoch": 1443} {"train_loss": -41.75843048095703, "global_step": 174683, "epoch": 1443} {"train_loss": -41.7034912109375, "global_step": 174684, "epoch": 1443} {"train_loss": -42.3193359375, "global_step": 174685, "epoch": 1443} {"train_loss": -41.190670013427734, "global_step": 174686, "epoch": 1443} {"train_loss": -41.65924072265625, "global_step": 174687, "epoch": 1443} {"train_loss": -41.57886505126953, "global_step": 174688, "epoch": 1443} {"train_loss": -41.457763671875, "global_step": 174689, "epoch": 1443} {"train_loss": -42.24715805053711, "global_step": 174690, "epoch": 1443} {"train_loss": -40.37717819213867, "global_step": 174691, "epoch": 1443} {"train_loss": -40.60990905761719, "global_step": 174692, "epoch": 1443} {"train_loss": -41.705535888671875, "global_step": 174693, "epoch": 1443} {"train_loss": -38.45060348510742, "global_step": 174694, "epoch": 1443} {"train_loss": -41.911956787109375, "global_step": 174695, "epoch": 1443} {"train_loss": -40.84590530395508, "global_step": 174696, "epoch": 1443} {"train_loss": -39.659969329833984, "global_step": 174697, "epoch": 1443} {"train_loss": -41.868812561035156, "global_step": 174698, "epoch": 1443} {"train_loss": -40.4183235168457, "global_step": 174699, "epoch": 1443} {"train_loss": -41.16767501831055, "global_step": 174700, "epoch": 1443} {"train_loss": -40.71260070800781, "global_step": 174701, "epoch": 1443} {"train_loss": -41.90283966064453, "global_step": 174702, "epoch": 1443} {"train_loss": -41.88958740234375, "global_step": 174703, "epoch": 1443} {"train_loss": -41.3127326965332, "global_step": 174704, "epoch": 1443} {"train_loss": -41.739742279052734, "global_step": 174705, "epoch": 1443} {"train_loss": -41.066131591796875, "global_step": 174706, "epoch": 1443} {"train_loss": -41.80693435668945, "global_step": 174707, "epoch": 1443} {"train_loss": -42.195430755615234, "global_step": 174708, "epoch": 1443} {"train_loss": -41.54443359375, "global_step": 174709, "epoch": 1443} {"train_loss": -42.294769287109375, "global_step": 174710, "epoch": 1443} {"train_loss": -41.80576705932617, "global_step": 174711, "epoch": 1443} {"train_loss": -42.22441482543945, "global_step": 174712, "epoch": 1443} {"train_loss": -41.38749313354492, "global_step": 174713, "epoch": 1443} {"train_loss": -41.79247283935547, "global_step": 174714, "epoch": 1443} {"train_loss": -41.70186996459961, "global_step": 174715, "epoch": 1443} {"train_loss": -41.81551742553711, "global_step": 174716, "epoch": 1443} {"train_loss": -41.46281051635742, "global_step": 174717, "epoch": 1443} {"train_loss": -41.04944610595703, "global_step": 174718, "epoch": 1443} {"train_loss": -42.265892028808594, "global_step": 174719, "epoch": 1443} {"train_loss": -41.88593673706055, "global_step": 174720, "epoch": 1443} {"train_loss": -41.09519577026367, "global_step": 174721, "epoch": 1443} {"train_loss": -41.7918701171875, "global_step": 174722, "epoch": 1443} {"train_loss": -40.99079478870738, "global_step": 174723, "epoch": 1443, "val_loss": 2663658.75} {"train_loss": -41.67007064819336, "global_step": 174724, "epoch": 1444} {"train_loss": -41.73895263671875, "global_step": 174725, "epoch": 1444} {"train_loss": -41.16903305053711, "global_step": 174726, "epoch": 1444} {"train_loss": -41.690059661865234, "global_step": 174727, "epoch": 1444} {"train_loss": -41.87725830078125, "global_step": 174728, "epoch": 1444} {"train_loss": -41.344417572021484, "global_step": 174729, "epoch": 1444} {"train_loss": -41.32780838012695, "global_step": 174730, "epoch": 1444} {"train_loss": -42.16362380981445, "global_step": 174731, "epoch": 1444} {"train_loss": -41.55908203125, "global_step": 174732, "epoch": 1444} {"train_loss": -41.5019645690918, "global_step": 174733, "epoch": 1444} {"train_loss": -41.89299392700195, "global_step": 174734, "epoch": 1444} {"train_loss": -41.478145599365234, "global_step": 174735, "epoch": 1444} {"train_loss": -42.26706314086914, "global_step": 174736, "epoch": 1444} {"train_loss": -41.910579681396484, "global_step": 174737, "epoch": 1444} {"train_loss": -41.536678314208984, "global_step": 174738, "epoch": 1444} {"train_loss": -42.101470947265625, "global_step": 174739, "epoch": 1444} {"train_loss": -41.838191986083984, "global_step": 174740, "epoch": 1444} {"train_loss": -41.7178955078125, "global_step": 174741, "epoch": 1444} {"train_loss": -41.592529296875, "global_step": 174742, "epoch": 1444} {"train_loss": -41.683536529541016, "global_step": 174743, "epoch": 1444} {"train_loss": -41.846641540527344, "global_step": 174744, "epoch": 1444} {"train_loss": -42.06562042236328, "global_step": 174745, "epoch": 1444} {"train_loss": -41.55576705932617, "global_step": 174746, "epoch": 1444} {"train_loss": -41.630126953125, "global_step": 174747, "epoch": 1444} {"train_loss": -41.78408432006836, "global_step": 174748, "epoch": 1444} {"train_loss": -41.174800872802734, "global_step": 174749, "epoch": 1444} {"train_loss": -41.55658721923828, "global_step": 174750, "epoch": 1444} {"train_loss": -41.609798431396484, "global_step": 174751, "epoch": 1444} {"train_loss": -42.17617416381836, "global_step": 174752, "epoch": 1444} {"train_loss": -42.32795333862305, "global_step": 174753, "epoch": 1444} {"train_loss": -41.92814254760742, "global_step": 174754, "epoch": 1444} {"train_loss": -41.05552291870117, "global_step": 174755, "epoch": 1444} {"train_loss": -40.80653762817383, "global_step": 174756, "epoch": 1444} {"train_loss": -41.4393196105957, "global_step": 174757, "epoch": 1444} {"train_loss": -42.23273468017578, "global_step": 174758, "epoch": 1444} {"train_loss": -41.61182403564453, "global_step": 174759, "epoch": 1444} {"train_loss": -42.114654541015625, "global_step": 174760, "epoch": 1444} {"train_loss": -41.5283088684082, "global_step": 174761, "epoch": 1444} {"train_loss": -41.5577392578125, "global_step": 174762, "epoch": 1444} {"train_loss": -41.9776725769043, "global_step": 174763, "epoch": 1444} {"train_loss": -42.45775604248047, "global_step": 174764, "epoch": 1444} {"train_loss": -42.1068229675293, "global_step": 174765, "epoch": 1444} {"train_loss": -42.48786544799805, "global_step": 174766, "epoch": 1444} {"train_loss": -42.54426193237305, "global_step": 174767, "epoch": 1444} {"train_loss": -42.177734375, "global_step": 174768, "epoch": 1444} {"train_loss": -41.762149810791016, "global_step": 174769, "epoch": 1444} {"train_loss": -40.73247146606445, "global_step": 174770, "epoch": 1444} {"train_loss": -41.53789138793945, "global_step": 174771, "epoch": 1444} {"train_loss": -41.2609748840332, "global_step": 174772, "epoch": 1444} {"train_loss": -41.06439971923828, "global_step": 174773, "epoch": 1444} {"train_loss": -40.17436599731445, "global_step": 174774, "epoch": 1444} {"train_loss": -38.096282958984375, "global_step": 174775, "epoch": 1444} {"train_loss": -35.106666564941406, "global_step": 174776, "epoch": 1444} {"train_loss": -40.15841293334961, "global_step": 174777, "epoch": 1444} {"train_loss": -38.99188232421875, "global_step": 174778, "epoch": 1444} {"train_loss": -38.87681579589844, "global_step": 174779, "epoch": 1444} {"train_loss": -39.86360168457031, "global_step": 174780, "epoch": 1444} {"train_loss": -39.21418762207031, "global_step": 174781, "epoch": 1444} {"train_loss": -39.727294921875, "global_step": 174782, "epoch": 1444} {"train_loss": -38.90082931518555, "global_step": 174783, "epoch": 1444} {"train_loss": -40.146358489990234, "global_step": 174784, "epoch": 1444} {"train_loss": -40.400657653808594, "global_step": 174785, "epoch": 1444} {"train_loss": -40.37297058105469, "global_step": 174786, "epoch": 1444} {"train_loss": -40.44136428833008, "global_step": 174787, "epoch": 1444} {"train_loss": -39.11463165283203, "global_step": 174788, "epoch": 1444} {"train_loss": -40.88447189331055, "global_step": 174789, "epoch": 1444} {"train_loss": -40.158687591552734, "global_step": 174790, "epoch": 1444} {"train_loss": -39.8828125, "global_step": 174791, "epoch": 1444} {"train_loss": -40.2231330871582, "global_step": 174792, "epoch": 1444} {"train_loss": -40.17379379272461, "global_step": 174793, "epoch": 1444} {"train_loss": -40.71528244018555, "global_step": 174794, "epoch": 1444} {"train_loss": -40.239498138427734, "global_step": 174795, "epoch": 1444} {"train_loss": -40.65000915527344, "global_step": 174796, "epoch": 1444} {"train_loss": -40.789119720458984, "global_step": 174797, "epoch": 1444} {"train_loss": -40.52056121826172, "global_step": 174798, "epoch": 1444} {"train_loss": -41.02775192260742, "global_step": 174799, "epoch": 1444} {"train_loss": -40.45961380004883, "global_step": 174800, "epoch": 1444} {"train_loss": -40.02753829956055, "global_step": 174801, "epoch": 1444} {"train_loss": -41.48676681518555, "global_step": 174802, "epoch": 1444} {"train_loss": -40.21492385864258, "global_step": 174803, "epoch": 1444} {"train_loss": -41.170875549316406, "global_step": 174804, "epoch": 1444} {"train_loss": -40.58407974243164, "global_step": 174805, "epoch": 1444} {"train_loss": -41.11488723754883, "global_step": 174806, "epoch": 1444} {"train_loss": -40.380855560302734, "global_step": 174807, "epoch": 1444} {"train_loss": -40.40515899658203, "global_step": 174808, "epoch": 1444} {"train_loss": -41.04069519042969, "global_step": 174809, "epoch": 1444} {"train_loss": -39.99379348754883, "global_step": 174810, "epoch": 1444} {"train_loss": -41.8903694152832, "global_step": 174811, "epoch": 1444} {"train_loss": -40.95402145385742, "global_step": 174812, "epoch": 1444} {"train_loss": -41.47801208496094, "global_step": 174813, "epoch": 1444} {"train_loss": -41.66153335571289, "global_step": 174814, "epoch": 1444} {"train_loss": -41.28761672973633, "global_step": 174815, "epoch": 1444} {"train_loss": -41.286434173583984, "global_step": 174816, "epoch": 1444} {"train_loss": -41.30891036987305, "global_step": 174817, "epoch": 1444} {"train_loss": -42.101131439208984, "global_step": 174818, "epoch": 1444} {"train_loss": -41.810482025146484, "global_step": 174819, "epoch": 1444} {"train_loss": -40.8403434753418, "global_step": 174820, "epoch": 1444} {"train_loss": -41.820194244384766, "global_step": 174821, "epoch": 1444} {"train_loss": -41.355350494384766, "global_step": 174822, "epoch": 1444} {"train_loss": -41.511138916015625, "global_step": 174823, "epoch": 1444} {"train_loss": -41.95074462890625, "global_step": 174824, "epoch": 1444} {"train_loss": -41.564876556396484, "global_step": 174825, "epoch": 1444} {"train_loss": -41.29549026489258, "global_step": 174826, "epoch": 1444} {"train_loss": -41.695858001708984, "global_step": 174827, "epoch": 1444} {"train_loss": -42.44877243041992, "global_step": 174828, "epoch": 1444} {"train_loss": -41.49031448364258, "global_step": 174829, "epoch": 1444} {"train_loss": -42.1703987121582, "global_step": 174830, "epoch": 1444} {"train_loss": -41.093318939208984, "global_step": 174831, "epoch": 1444} {"train_loss": -40.857051849365234, "global_step": 174832, "epoch": 1444} {"train_loss": -41.60964584350586, "global_step": 174833, "epoch": 1444} {"train_loss": -41.03480911254883, "global_step": 174834, "epoch": 1444} {"train_loss": -40.85403060913086, "global_step": 174835, "epoch": 1444} {"train_loss": -41.389095306396484, "global_step": 174836, "epoch": 1444} {"train_loss": -41.81635284423828, "global_step": 174837, "epoch": 1444} {"train_loss": -41.21925354003906, "global_step": 174838, "epoch": 1444} {"train_loss": -40.64624786376953, "global_step": 174839, "epoch": 1444} {"train_loss": -42.182186126708984, "global_step": 174840, "epoch": 1444} {"train_loss": -41.868858337402344, "global_step": 174841, "epoch": 1444} {"train_loss": -41.501617431640625, "global_step": 174842, "epoch": 1444} {"train_loss": -41.54104232788086, "global_step": 174843, "epoch": 1444} {"train_loss": -41.15314076951713, "global_step": 174844, "epoch": 1444, "val_loss": 2585505.0} {"train_loss": -41.37595748901367, "global_step": 174845, "epoch": 1445} {"train_loss": -40.790401458740234, "global_step": 174846, "epoch": 1445} {"train_loss": -42.348514556884766, "global_step": 174847, "epoch": 1445} {"train_loss": -40.473228454589844, "global_step": 174848, "epoch": 1445} {"train_loss": -40.669307708740234, "global_step": 174849, "epoch": 1445} {"train_loss": -39.619327545166016, "global_step": 174850, "epoch": 1445} {"train_loss": -40.589290618896484, "global_step": 174851, "epoch": 1445} {"train_loss": -41.40096664428711, "global_step": 174852, "epoch": 1445} {"train_loss": -41.357967376708984, "global_step": 174853, "epoch": 1445} {"train_loss": -40.53890609741211, "global_step": 174854, "epoch": 1445} {"train_loss": -42.058834075927734, "global_step": 174855, "epoch": 1445} {"train_loss": -39.98274612426758, "global_step": 174856, "epoch": 1445} {"train_loss": -41.18758773803711, "global_step": 174857, "epoch": 1445} {"train_loss": -41.44400405883789, "global_step": 174858, "epoch": 1445} {"train_loss": -40.7107048034668, "global_step": 174859, "epoch": 1445} {"train_loss": -40.074100494384766, "global_step": 174860, "epoch": 1445} {"train_loss": -41.53143310546875, "global_step": 174861, "epoch": 1445} {"train_loss": -40.92724609375, "global_step": 174862, "epoch": 1445} {"train_loss": -41.80965805053711, "global_step": 174863, "epoch": 1445} {"train_loss": -41.67097854614258, "global_step": 174864, "epoch": 1445} {"train_loss": -41.237483978271484, "global_step": 174865, "epoch": 1445} {"train_loss": -42.13250732421875, "global_step": 174866, "epoch": 1445} {"train_loss": -41.52914810180664, "global_step": 174867, "epoch": 1445} {"train_loss": -41.61787033081055, "global_step": 174868, "epoch": 1445} {"train_loss": -41.66962814331055, "global_step": 174869, "epoch": 1445} {"train_loss": -42.10603332519531, "global_step": 174870, "epoch": 1445} {"train_loss": -41.67100143432617, "global_step": 174871, "epoch": 1445} {"train_loss": -41.61573028564453, "global_step": 174872, "epoch": 1445} {"train_loss": -42.077232360839844, "global_step": 174873, "epoch": 1445} {"train_loss": -41.837642669677734, "global_step": 174874, "epoch": 1445} {"train_loss": -41.916969299316406, "global_step": 174875, "epoch": 1445} {"train_loss": -41.788597106933594, "global_step": 174876, "epoch": 1445} {"train_loss": -41.83994674682617, "global_step": 174877, "epoch": 1445} {"train_loss": -42.0048828125, "global_step": 174878, "epoch": 1445} {"train_loss": -42.33127975463867, "global_step": 174879, "epoch": 1445} {"train_loss": -42.15692901611328, "global_step": 174880, "epoch": 1445} {"train_loss": -42.31014633178711, "global_step": 174881, "epoch": 1445} {"train_loss": -42.41074752807617, "global_step": 174882, "epoch": 1445} {"train_loss": -42.32804870605469, "global_step": 174883, "epoch": 1445} {"train_loss": -42.201358795166016, "global_step": 174884, "epoch": 1445} {"train_loss": -42.004085540771484, "global_step": 174885, "epoch": 1445} {"train_loss": -42.19845962524414, "global_step": 174886, "epoch": 1445} {"train_loss": -42.62540817260742, "global_step": 174887, "epoch": 1445} {"train_loss": -41.81828308105469, "global_step": 174888, "epoch": 1445} {"train_loss": -42.12125778198242, "global_step": 174889, "epoch": 1445} {"train_loss": -41.645782470703125, "global_step": 174890, "epoch": 1445} {"train_loss": -42.53672409057617, "global_step": 174891, "epoch": 1445} {"train_loss": -41.9039421081543, "global_step": 174892, "epoch": 1445} {"train_loss": -41.39868927001953, "global_step": 174893, "epoch": 1445} {"train_loss": -42.444881439208984, "global_step": 174894, "epoch": 1445} {"train_loss": -42.247718811035156, "global_step": 174895, "epoch": 1445} {"train_loss": -42.2131462097168, "global_step": 174896, "epoch": 1445} {"train_loss": -41.8660774230957, "global_step": 174897, "epoch": 1445} {"train_loss": -40.111717224121094, "global_step": 174898, "epoch": 1445} {"train_loss": -41.77861022949219, "global_step": 174899, "epoch": 1445} {"train_loss": -39.46743392944336, "global_step": 174900, "epoch": 1445} {"train_loss": -39.58646774291992, "global_step": 174901, "epoch": 1445} {"train_loss": -41.003746032714844, "global_step": 174902, "epoch": 1445} {"train_loss": -40.81067657470703, "global_step": 174903, "epoch": 1445} {"train_loss": -41.33637619018555, "global_step": 174904, "epoch": 1445} {"train_loss": -41.27678298950195, "global_step": 174905, "epoch": 1445} {"train_loss": -42.01450729370117, "global_step": 174906, "epoch": 1445} {"train_loss": -41.30914306640625, "global_step": 174907, "epoch": 1445} {"train_loss": -40.875484466552734, "global_step": 174908, "epoch": 1445} {"train_loss": -40.25999069213867, "global_step": 174909, "epoch": 1445} {"train_loss": -40.955604553222656, "global_step": 174910, "epoch": 1445} {"train_loss": -41.82107925415039, "global_step": 174911, "epoch": 1445} {"train_loss": -40.48275375366211, "global_step": 174912, "epoch": 1445} {"train_loss": -40.1796989440918, "global_step": 174913, "epoch": 1445} {"train_loss": -40.80384063720703, "global_step": 174914, "epoch": 1445} {"train_loss": -40.53791046142578, "global_step": 174915, "epoch": 1445} {"train_loss": -39.317874908447266, "global_step": 174916, "epoch": 1445} {"train_loss": -39.216636657714844, "global_step": 174917, "epoch": 1445} {"train_loss": -39.07769012451172, "global_step": 174918, "epoch": 1445} {"train_loss": -40.4293327331543, "global_step": 174919, "epoch": 1445} {"train_loss": -40.47493362426758, "global_step": 174920, "epoch": 1445} {"train_loss": -38.67252731323242, "global_step": 174921, "epoch": 1445} {"train_loss": -39.2781982421875, "global_step": 174922, "epoch": 1445} {"train_loss": -39.495216369628906, "global_step": 174923, "epoch": 1445} {"train_loss": -39.079185485839844, "global_step": 174924, "epoch": 1445} {"train_loss": -40.83958053588867, "global_step": 174925, "epoch": 1445} {"train_loss": -40.49920654296875, "global_step": 174926, "epoch": 1445} {"train_loss": -41.06458282470703, "global_step": 174927, "epoch": 1445} {"train_loss": -40.881858825683594, "global_step": 174928, "epoch": 1445} {"train_loss": -41.28155517578125, "global_step": 174929, "epoch": 1445} {"train_loss": -40.941715240478516, "global_step": 174930, "epoch": 1445} {"train_loss": -41.26991653442383, "global_step": 174931, "epoch": 1445} {"train_loss": -41.986454010009766, "global_step": 174932, "epoch": 1445} {"train_loss": -40.55831527709961, "global_step": 174933, "epoch": 1445} {"train_loss": -40.89519119262695, "global_step": 174934, "epoch": 1445} {"train_loss": -41.45182418823242, "global_step": 174935, "epoch": 1445} {"train_loss": -40.50319290161133, "global_step": 174936, "epoch": 1445} {"train_loss": -42.18105697631836, "global_step": 174937, "epoch": 1445} {"train_loss": -41.44386672973633, "global_step": 174938, "epoch": 1445} {"train_loss": -41.36881637573242, "global_step": 174939, "epoch": 1445} {"train_loss": -41.105796813964844, "global_step": 174940, "epoch": 1445} {"train_loss": -41.94928741455078, "global_step": 174941, "epoch": 1445} {"train_loss": -42.12202453613281, "global_step": 174942, "epoch": 1445} {"train_loss": -41.861629486083984, "global_step": 174943, "epoch": 1445} {"train_loss": -42.152225494384766, "global_step": 174944, "epoch": 1445} {"train_loss": -42.199851989746094, "global_step": 174945, "epoch": 1445} {"train_loss": -41.90788650512695, "global_step": 174946, "epoch": 1445} {"train_loss": -42.38656234741211, "global_step": 174947, "epoch": 1445} {"train_loss": -41.60700225830078, "global_step": 174948, "epoch": 1445} {"train_loss": -41.80441665649414, "global_step": 174949, "epoch": 1445} {"train_loss": -42.21982192993164, "global_step": 174950, "epoch": 1445} {"train_loss": -42.23861312866211, "global_step": 174951, "epoch": 1445} {"train_loss": -41.77829360961914, "global_step": 174952, "epoch": 1445} {"train_loss": -42.39323806762695, "global_step": 174953, "epoch": 1445} {"train_loss": -42.45337677001953, "global_step": 174954, "epoch": 1445} {"train_loss": -41.9770622253418, "global_step": 174955, "epoch": 1445} {"train_loss": -42.16876983642578, "global_step": 174956, "epoch": 1445} {"train_loss": -42.253334045410156, "global_step": 174957, "epoch": 1445} {"train_loss": -40.288455963134766, "global_step": 174958, "epoch": 1445} {"train_loss": -41.87879180908203, "global_step": 174959, "epoch": 1445} {"train_loss": -41.97263717651367, "global_step": 174960, "epoch": 1445} {"train_loss": -42.40998840332031, "global_step": 174961, "epoch": 1445} {"train_loss": -42.1261100769043, "global_step": 174962, "epoch": 1445} {"train_loss": -42.37794876098633, "global_step": 174963, "epoch": 1445} {"train_loss": -41.891414642333984, "global_step": 174964, "epoch": 1445} {"train_loss": -41.35532394913602, "global_step": 174965, "epoch": 1445, "val_loss": 2733989.5} {"train_loss": -41.71427536010742, "global_step": 174966, "epoch": 1446} {"train_loss": -41.62655258178711, "global_step": 174967, "epoch": 1446} {"train_loss": -41.07841110229492, "global_step": 174968, "epoch": 1446} {"train_loss": -40.43067169189453, "global_step": 174969, "epoch": 1446} {"train_loss": -41.639892578125, "global_step": 174970, "epoch": 1446} {"train_loss": -40.55305480957031, "global_step": 174971, "epoch": 1446} {"train_loss": -40.270328521728516, "global_step": 174972, "epoch": 1446} {"train_loss": -40.77434158325195, "global_step": 174973, "epoch": 1446} {"train_loss": -41.98493576049805, "global_step": 174974, "epoch": 1446} {"train_loss": -39.62652587890625, "global_step": 174975, "epoch": 1446} {"train_loss": -37.598365783691406, "global_step": 174976, "epoch": 1446} {"train_loss": -38.64948272705078, "global_step": 174977, "epoch": 1446} {"train_loss": -38.43465042114258, "global_step": 174978, "epoch": 1446} {"train_loss": -36.8084716796875, "global_step": 174979, "epoch": 1446} {"train_loss": -41.33403396606445, "global_step": 174980, "epoch": 1446} {"train_loss": -36.40753936767578, "global_step": 174981, "epoch": 1446} {"train_loss": -37.44956588745117, "global_step": 174982, "epoch": 1446} {"train_loss": -37.96276092529297, "global_step": 174983, "epoch": 1446} {"train_loss": -37.730323791503906, "global_step": 174984, "epoch": 1446} {"train_loss": -36.91585922241211, "global_step": 174985, "epoch": 1446} {"train_loss": -39.66152572631836, "global_step": 174986, "epoch": 1446} {"train_loss": -33.88856887817383, "global_step": 174987, "epoch": 1446} {"train_loss": -39.096534729003906, "global_step": 174988, "epoch": 1446} {"train_loss": -37.05836486816406, "global_step": 174989, "epoch": 1446} {"train_loss": -39.13491439819336, "global_step": 174990, "epoch": 1446} {"train_loss": -38.16789627075195, "global_step": 174991, "epoch": 1446} {"train_loss": -38.16858673095703, "global_step": 174992, "epoch": 1446} {"train_loss": -37.84865951538086, "global_step": 174993, "epoch": 1446} {"train_loss": -37.494144439697266, "global_step": 174994, "epoch": 1446} {"train_loss": -38.720008850097656, "global_step": 174995, "epoch": 1446} {"train_loss": -38.13520431518555, "global_step": 174996, "epoch": 1446} {"train_loss": -38.958778381347656, "global_step": 174997, "epoch": 1446} {"train_loss": -39.83896255493164, "global_step": 174998, "epoch": 1446} {"train_loss": -38.64421081542969, "global_step": 174999, "epoch": 1446} {"train_loss": -39.304710388183594, "global_step": 175000, "epoch": 1446} {"train_loss": -38.72719955444336, "global_step": 175001, "epoch": 1446} {"train_loss": -39.767635345458984, "global_step": 175002, "epoch": 1446} {"train_loss": -39.12484359741211, "global_step": 175003, "epoch": 1446} {"train_loss": -37.40833282470703, "global_step": 175004, "epoch": 1446} {"train_loss": -40.265625, "global_step": 175005, "epoch": 1446} {"train_loss": -38.798561096191406, "global_step": 175006, "epoch": 1446} {"train_loss": -38.203704833984375, "global_step": 175007, "epoch": 1446} {"train_loss": -39.858150482177734, "global_step": 175008, "epoch": 1446} {"train_loss": -38.188079833984375, "global_step": 175009, "epoch": 1446} {"train_loss": -40.3770637512207, "global_step": 175010, "epoch": 1446} {"train_loss": -39.88252639770508, "global_step": 175011, "epoch": 1446} {"train_loss": -40.3306884765625, "global_step": 175012, "epoch": 1446} {"train_loss": -38.218074798583984, "global_step": 175013, "epoch": 1446} {"train_loss": -40.59062194824219, "global_step": 175014, "epoch": 1446} {"train_loss": -40.714412689208984, "global_step": 175015, "epoch": 1446} {"train_loss": -40.283138275146484, "global_step": 175016, "epoch": 1446} {"train_loss": -40.96714401245117, "global_step": 175017, "epoch": 1446} {"train_loss": -40.05284881591797, "global_step": 175018, "epoch": 1446} {"train_loss": -39.23774337768555, "global_step": 175019, "epoch": 1446} {"train_loss": -40.165740966796875, "global_step": 175020, "epoch": 1446} {"train_loss": -40.92890548706055, "global_step": 175021, "epoch": 1446} {"train_loss": -40.84554672241211, "global_step": 175022, "epoch": 1446} {"train_loss": -40.71445083618164, "global_step": 175023, "epoch": 1446} {"train_loss": -40.44807815551758, "global_step": 175024, "epoch": 1446} {"train_loss": -40.975921630859375, "global_step": 175025, "epoch": 1446} {"train_loss": -39.65830612182617, "global_step": 175026, "epoch": 1446} {"train_loss": -40.59682083129883, "global_step": 175027, "epoch": 1446} {"train_loss": -40.72696304321289, "global_step": 175028, "epoch": 1446} {"train_loss": -40.05488967895508, "global_step": 175029, "epoch": 1446} {"train_loss": -41.17354965209961, "global_step": 175030, "epoch": 1446} {"train_loss": -40.76127243041992, "global_step": 175031, "epoch": 1446} {"train_loss": -41.04479217529297, "global_step": 175032, "epoch": 1446} {"train_loss": -40.640342712402344, "global_step": 175033, "epoch": 1446} {"train_loss": -41.00667953491211, "global_step": 175034, "epoch": 1446} {"train_loss": -41.10789108276367, "global_step": 175035, "epoch": 1446} {"train_loss": -41.15937423706055, "global_step": 175036, "epoch": 1446} {"train_loss": -41.18231201171875, "global_step": 175037, "epoch": 1446} {"train_loss": -41.227291107177734, "global_step": 175038, "epoch": 1446} {"train_loss": -41.52842330932617, "global_step": 175039, "epoch": 1446} {"train_loss": -40.686302185058594, "global_step": 175040, "epoch": 1446} {"train_loss": -40.8735237121582, "global_step": 175041, "epoch": 1446} {"train_loss": -41.83749008178711, "global_step": 175042, "epoch": 1446} {"train_loss": -41.79268264770508, "global_step": 175043, "epoch": 1446} {"train_loss": -41.12075424194336, "global_step": 175044, "epoch": 1446} {"train_loss": -41.59932327270508, "global_step": 175045, "epoch": 1446} {"train_loss": -41.42855453491211, "global_step": 175046, "epoch": 1446} {"train_loss": -41.176937103271484, "global_step": 175047, "epoch": 1446} {"train_loss": -41.2492561340332, "global_step": 175048, "epoch": 1446} {"train_loss": -41.76805114746094, "global_step": 175049, "epoch": 1446} {"train_loss": -41.85100173950195, "global_step": 175050, "epoch": 1446} {"train_loss": -41.11249923706055, "global_step": 175051, "epoch": 1446} {"train_loss": -41.52820587158203, "global_step": 175052, "epoch": 1446} {"train_loss": -41.79145431518555, "global_step": 175053, "epoch": 1446} {"train_loss": -41.72572708129883, "global_step": 175054, "epoch": 1446} {"train_loss": -41.39970016479492, "global_step": 175055, "epoch": 1446} {"train_loss": -41.50345993041992, "global_step": 175056, "epoch": 1446} {"train_loss": -41.56354904174805, "global_step": 175057, "epoch": 1446} {"train_loss": -41.57760238647461, "global_step": 175058, "epoch": 1446} {"train_loss": -41.787071228027344, "global_step": 175059, "epoch": 1446} {"train_loss": -41.42197799682617, "global_step": 175060, "epoch": 1446} {"train_loss": -41.994873046875, "global_step": 175061, "epoch": 1446} {"train_loss": -42.304229736328125, "global_step": 175062, "epoch": 1446} {"train_loss": -41.2000846862793, "global_step": 175063, "epoch": 1446} {"train_loss": -42.360443115234375, "global_step": 175064, "epoch": 1446} {"train_loss": -41.7152099609375, "global_step": 175065, "epoch": 1446} {"train_loss": -42.12367248535156, "global_step": 175066, "epoch": 1446} {"train_loss": -41.939632415771484, "global_step": 175067, "epoch": 1446} {"train_loss": -42.08940505981445, "global_step": 175068, "epoch": 1446} {"train_loss": -42.21928787231445, "global_step": 175069, "epoch": 1446} {"train_loss": -41.7824821472168, "global_step": 175070, "epoch": 1446} {"train_loss": -41.93707275390625, "global_step": 175071, "epoch": 1446} {"train_loss": -41.99197769165039, "global_step": 175072, "epoch": 1446} {"train_loss": -42.190460205078125, "global_step": 175073, "epoch": 1446} {"train_loss": -42.28646469116211, "global_step": 175074, "epoch": 1446} {"train_loss": -42.58693313598633, "global_step": 175075, "epoch": 1446} {"train_loss": -42.3531608581543, "global_step": 175076, "epoch": 1446} {"train_loss": -42.452980041503906, "global_step": 175077, "epoch": 1446} {"train_loss": -42.104251861572266, "global_step": 175078, "epoch": 1446} {"train_loss": -41.890926361083984, "global_step": 175079, "epoch": 1446} {"train_loss": -41.34429931640625, "global_step": 175080, "epoch": 1446} {"train_loss": -41.220314025878906, "global_step": 175081, "epoch": 1446} {"train_loss": -42.05088424682617, "global_step": 175082, "epoch": 1446} {"train_loss": -41.866119384765625, "global_step": 175083, "epoch": 1446} {"train_loss": -42.15105056762695, "global_step": 175084, "epoch": 1446} {"train_loss": -42.69669723510742, "global_step": 175085, "epoch": 1446} {"train_loss": -40.44498311192536, "global_step": 175086, "epoch": 1446, "val_loss": 2681826.75} {"train_loss": -41.37272262573242, "global_step": 175087, "epoch": 1447} {"train_loss": -40.98733139038086, "global_step": 175088, "epoch": 1447} {"train_loss": -42.00799560546875, "global_step": 175089, "epoch": 1447} {"train_loss": -41.45376205444336, "global_step": 175090, "epoch": 1447} {"train_loss": -40.51087188720703, "global_step": 175091, "epoch": 1447} {"train_loss": -42.386695861816406, "global_step": 175092, "epoch": 1447} {"train_loss": -41.035133361816406, "global_step": 175093, "epoch": 1447} {"train_loss": -40.130035400390625, "global_step": 175094, "epoch": 1447} {"train_loss": -42.19236755371094, "global_step": 175095, "epoch": 1447} {"train_loss": -40.81509017944336, "global_step": 175096, "epoch": 1447} {"train_loss": -38.734130859375, "global_step": 175097, "epoch": 1447} {"train_loss": -41.78390121459961, "global_step": 175098, "epoch": 1447} {"train_loss": -41.46889877319336, "global_step": 175099, "epoch": 1447} {"train_loss": -41.362850189208984, "global_step": 175100, "epoch": 1447} {"train_loss": -39.443641662597656, "global_step": 175101, "epoch": 1447} {"train_loss": -39.57502365112305, "global_step": 175102, "epoch": 1447} {"train_loss": -40.71977233886719, "global_step": 175103, "epoch": 1447} {"train_loss": -37.50477600097656, "global_step": 175104, "epoch": 1447} {"train_loss": -41.42550277709961, "global_step": 175105, "epoch": 1447} {"train_loss": -40.96527862548828, "global_step": 175106, "epoch": 1447} {"train_loss": -40.55570602416992, "global_step": 175107, "epoch": 1447} {"train_loss": -39.960113525390625, "global_step": 175108, "epoch": 1447} {"train_loss": -40.3487663269043, "global_step": 175109, "epoch": 1447} {"train_loss": -40.27836608886719, "global_step": 175110, "epoch": 1447} {"train_loss": -39.32428741455078, "global_step": 175111, "epoch": 1447} {"train_loss": -39.769874572753906, "global_step": 175112, "epoch": 1447} {"train_loss": -40.41868209838867, "global_step": 175113, "epoch": 1447} {"train_loss": -39.21489715576172, "global_step": 175114, "epoch": 1447} {"train_loss": -39.53912353515625, "global_step": 175115, "epoch": 1447} {"train_loss": -39.687068939208984, "global_step": 175116, "epoch": 1447} {"train_loss": -39.704803466796875, "global_step": 175117, "epoch": 1447} {"train_loss": -39.5245475769043, "global_step": 175118, "epoch": 1447} {"train_loss": -39.48490524291992, "global_step": 175119, "epoch": 1447} {"train_loss": -38.953311920166016, "global_step": 175120, "epoch": 1447} {"train_loss": -39.606773376464844, "global_step": 175121, "epoch": 1447} {"train_loss": -39.591190338134766, "global_step": 175122, "epoch": 1447} {"train_loss": -39.333984375, "global_step": 175123, "epoch": 1447} {"train_loss": -39.13105010986328, "global_step": 175124, "epoch": 1447} {"train_loss": -39.36979293823242, "global_step": 175125, "epoch": 1447} {"train_loss": -40.73806381225586, "global_step": 175126, "epoch": 1447} {"train_loss": -39.76267623901367, "global_step": 175127, "epoch": 1447} {"train_loss": -40.36049270629883, "global_step": 175128, "epoch": 1447} {"train_loss": -40.07920837402344, "global_step": 175129, "epoch": 1447} {"train_loss": -41.06415557861328, "global_step": 175130, "epoch": 1447} {"train_loss": -40.75199890136719, "global_step": 175131, "epoch": 1447} {"train_loss": -40.11967468261719, "global_step": 175132, "epoch": 1447} {"train_loss": -41.03040313720703, "global_step": 175133, "epoch": 1447} {"train_loss": -40.919979095458984, "global_step": 175134, "epoch": 1447} {"train_loss": -40.67407989501953, "global_step": 175135, "epoch": 1447} {"train_loss": -41.2598876953125, "global_step": 175136, "epoch": 1447} {"train_loss": -39.737884521484375, "global_step": 175137, "epoch": 1447} {"train_loss": -40.84572982788086, "global_step": 175138, "epoch": 1447} {"train_loss": -41.45028305053711, "global_step": 175139, "epoch": 1447} {"train_loss": -40.34455108642578, "global_step": 175140, "epoch": 1447} {"train_loss": -39.447261810302734, "global_step": 175141, "epoch": 1447} {"train_loss": -40.288143157958984, "global_step": 175142, "epoch": 1447} {"train_loss": -39.52947235107422, "global_step": 175143, "epoch": 1447} {"train_loss": -40.97520065307617, "global_step": 175144, "epoch": 1447} {"train_loss": -39.93573760986328, "global_step": 175145, "epoch": 1447} {"train_loss": -39.258697509765625, "global_step": 175146, "epoch": 1447} {"train_loss": -41.1848030090332, "global_step": 175147, "epoch": 1447} {"train_loss": -41.05772399902344, "global_step": 175148, "epoch": 1447} {"train_loss": -39.84328079223633, "global_step": 175149, "epoch": 1447} {"train_loss": -40.95170211791992, "global_step": 175150, "epoch": 1447} {"train_loss": -40.11702346801758, "global_step": 175151, "epoch": 1447} {"train_loss": -39.91059875488281, "global_step": 175152, "epoch": 1447} {"train_loss": -40.289669036865234, "global_step": 175153, "epoch": 1447} {"train_loss": -41.322715759277344, "global_step": 175154, "epoch": 1447} {"train_loss": -39.79547119140625, "global_step": 175155, "epoch": 1447} {"train_loss": -39.058712005615234, "global_step": 175156, "epoch": 1447} {"train_loss": -40.48141098022461, "global_step": 175157, "epoch": 1447} {"train_loss": -40.976985931396484, "global_step": 175158, "epoch": 1447} {"train_loss": -38.53335189819336, "global_step": 175159, "epoch": 1447} {"train_loss": -39.8526611328125, "global_step": 175160, "epoch": 1447} {"train_loss": -41.87178421020508, "global_step": 175161, "epoch": 1447} {"train_loss": -39.96489334106445, "global_step": 175162, "epoch": 1447} {"train_loss": -40.0195426940918, "global_step": 175163, "epoch": 1447} {"train_loss": -41.622859954833984, "global_step": 175164, "epoch": 1447} {"train_loss": -40.33309555053711, "global_step": 175165, "epoch": 1447} {"train_loss": -41.69512176513672, "global_step": 175166, "epoch": 1447} {"train_loss": -41.186336517333984, "global_step": 175167, "epoch": 1447} {"train_loss": -40.78074264526367, "global_step": 175168, "epoch": 1447} {"train_loss": -41.735416412353516, "global_step": 175169, "epoch": 1447} {"train_loss": -41.49588394165039, "global_step": 175170, "epoch": 1447} {"train_loss": -40.669681549072266, "global_step": 175171, "epoch": 1447} {"train_loss": -41.418853759765625, "global_step": 175172, "epoch": 1447} {"train_loss": -41.07069396972656, "global_step": 175173, "epoch": 1447} {"train_loss": -41.59092330932617, "global_step": 175174, "epoch": 1447} {"train_loss": -40.922584533691406, "global_step": 175175, "epoch": 1447} {"train_loss": -41.298702239990234, "global_step": 175176, "epoch": 1447} {"train_loss": -41.846614837646484, "global_step": 175177, "epoch": 1447} {"train_loss": -41.9286003112793, "global_step": 175178, "epoch": 1447} {"train_loss": -41.66075134277344, "global_step": 175179, "epoch": 1447} {"train_loss": -41.68953323364258, "global_step": 175180, "epoch": 1447} {"train_loss": -41.607810974121094, "global_step": 175181, "epoch": 1447} {"train_loss": -41.77694320678711, "global_step": 175182, "epoch": 1447} {"train_loss": -41.74609375, "global_step": 175183, "epoch": 1447} {"train_loss": -41.69731140136719, "global_step": 175184, "epoch": 1447} {"train_loss": -41.6899299621582, "global_step": 175185, "epoch": 1447} {"train_loss": -41.57297897338867, "global_step": 175186, "epoch": 1447} {"train_loss": -41.44443893432617, "global_step": 175187, "epoch": 1447} {"train_loss": -41.50335693359375, "global_step": 175188, "epoch": 1447} {"train_loss": -41.893829345703125, "global_step": 175189, "epoch": 1447} {"train_loss": -42.05717849731445, "global_step": 175190, "epoch": 1447} {"train_loss": -42.172054290771484, "global_step": 175191, "epoch": 1447} {"train_loss": -41.50450897216797, "global_step": 175192, "epoch": 1447} {"train_loss": -41.31404113769531, "global_step": 175193, "epoch": 1447} {"train_loss": -41.8996696472168, "global_step": 175194, "epoch": 1447} {"train_loss": -41.32464599609375, "global_step": 175195, "epoch": 1447} {"train_loss": -41.697750091552734, "global_step": 175196, "epoch": 1447} {"train_loss": -42.22284698486328, "global_step": 175197, "epoch": 1447} {"train_loss": -41.4305419921875, "global_step": 175198, "epoch": 1447} {"train_loss": -41.93901443481445, "global_step": 175199, "epoch": 1447} {"train_loss": -41.85148239135742, "global_step": 175200, "epoch": 1447} {"train_loss": -41.378700256347656, "global_step": 175201, "epoch": 1447} {"train_loss": -42.01921463012695, "global_step": 175202, "epoch": 1447} {"train_loss": -42.116790771484375, "global_step": 175203, "epoch": 1447} {"train_loss": -42.11846923828125, "global_step": 175204, "epoch": 1447} {"train_loss": -41.2767333984375, "global_step": 175205, "epoch": 1447} {"train_loss": -40.6754264831543, "global_step": 175206, "epoch": 1447} {"train_loss": -40.75539896310853, "global_step": 175207, "epoch": 1447, "val_loss": 2644318.75} {"train_loss": -42.128963470458984, "global_step": 175208, "epoch": 1448} {"train_loss": -40.70068359375, "global_step": 175209, "epoch": 1448} {"train_loss": -40.19814682006836, "global_step": 175210, "epoch": 1448} {"train_loss": -42.16965866088867, "global_step": 175211, "epoch": 1448} {"train_loss": -41.30636978149414, "global_step": 175212, "epoch": 1448} {"train_loss": -40.75815963745117, "global_step": 175213, "epoch": 1448} {"train_loss": -41.52833938598633, "global_step": 175214, "epoch": 1448} {"train_loss": -41.238887786865234, "global_step": 175215, "epoch": 1448} {"train_loss": -42.009735107421875, "global_step": 175216, "epoch": 1448} {"train_loss": -41.7541618347168, "global_step": 175217, "epoch": 1448} {"train_loss": -41.33821105957031, "global_step": 175218, "epoch": 1448} {"train_loss": -42.09138870239258, "global_step": 175219, "epoch": 1448} {"train_loss": -40.4279899597168, "global_step": 175220, "epoch": 1448} {"train_loss": -39.60072326660156, "global_step": 175221, "epoch": 1448} {"train_loss": -41.63627624511719, "global_step": 175222, "epoch": 1448} {"train_loss": -40.526512145996094, "global_step": 175223, "epoch": 1448} {"train_loss": -41.448116302490234, "global_step": 175224, "epoch": 1448} {"train_loss": -40.413997650146484, "global_step": 175225, "epoch": 1448} {"train_loss": -40.05791091918945, "global_step": 175226, "epoch": 1448} {"train_loss": -41.295040130615234, "global_step": 175227, "epoch": 1448} {"train_loss": -41.423744201660156, "global_step": 175228, "epoch": 1448} {"train_loss": -38.66347122192383, "global_step": 175229, "epoch": 1448} {"train_loss": -39.87622833251953, "global_step": 175230, "epoch": 1448} {"train_loss": -41.75999450683594, "global_step": 175231, "epoch": 1448} {"train_loss": -41.14156723022461, "global_step": 175232, "epoch": 1448} {"train_loss": -40.76852798461914, "global_step": 175233, "epoch": 1448} {"train_loss": -41.54990005493164, "global_step": 175234, "epoch": 1448} {"train_loss": -41.45967483520508, "global_step": 175235, "epoch": 1448} {"train_loss": -40.993133544921875, "global_step": 175236, "epoch": 1448} {"train_loss": -41.29788589477539, "global_step": 175237, "epoch": 1448} {"train_loss": -41.23688888549805, "global_step": 175238, "epoch": 1448} {"train_loss": -41.49705505371094, "global_step": 175239, "epoch": 1448} {"train_loss": -40.151039123535156, "global_step": 175240, "epoch": 1448} {"train_loss": -39.852272033691406, "global_step": 175241, "epoch": 1448} {"train_loss": -38.9412956237793, "global_step": 175242, "epoch": 1448} {"train_loss": -39.30276107788086, "global_step": 175243, "epoch": 1448} {"train_loss": -40.1680793762207, "global_step": 175244, "epoch": 1448} {"train_loss": -40.714759826660156, "global_step": 175245, "epoch": 1448} {"train_loss": -41.064247131347656, "global_step": 175246, "epoch": 1448} {"train_loss": -40.3288688659668, "global_step": 175247, "epoch": 1448} {"train_loss": -39.92327880859375, "global_step": 175248, "epoch": 1448} {"train_loss": -40.241512298583984, "global_step": 175249, "epoch": 1448} {"train_loss": -40.20286178588867, "global_step": 175250, "epoch": 1448} {"train_loss": -39.812252044677734, "global_step": 175251, "epoch": 1448} {"train_loss": -41.05878829956055, "global_step": 175252, "epoch": 1448} {"train_loss": -35.42734909057617, "global_step": 175253, "epoch": 1448} {"train_loss": -41.235591888427734, "global_step": 175254, "epoch": 1448} {"train_loss": -36.79886245727539, "global_step": 175255, "epoch": 1448} {"train_loss": -37.2826042175293, "global_step": 175256, "epoch": 1448} {"train_loss": -40.943336486816406, "global_step": 175257, "epoch": 1448} {"train_loss": -39.427223205566406, "global_step": 175258, "epoch": 1448} {"train_loss": -37.747501373291016, "global_step": 175259, "epoch": 1448} {"train_loss": -39.453773498535156, "global_step": 175260, "epoch": 1448} {"train_loss": -40.484718322753906, "global_step": 175261, "epoch": 1448} {"train_loss": -39.355350494384766, "global_step": 175262, "epoch": 1448} {"train_loss": -41.03809356689453, "global_step": 175263, "epoch": 1448} {"train_loss": -39.570430755615234, "global_step": 175264, "epoch": 1448} {"train_loss": -39.943702697753906, "global_step": 175265, "epoch": 1448} {"train_loss": -40.25200271606445, "global_step": 175266, "epoch": 1448} {"train_loss": -40.396053314208984, "global_step": 175267, "epoch": 1448} {"train_loss": -39.99577331542969, "global_step": 175268, "epoch": 1448} {"train_loss": -41.380409240722656, "global_step": 175269, "epoch": 1448} {"train_loss": -41.019142150878906, "global_step": 175270, "epoch": 1448} {"train_loss": -40.38396453857422, "global_step": 175271, "epoch": 1448} {"train_loss": -41.48326110839844, "global_step": 175272, "epoch": 1448} {"train_loss": -40.011905670166016, "global_step": 175273, "epoch": 1448} {"train_loss": -40.78122329711914, "global_step": 175274, "epoch": 1448} {"train_loss": -40.7490348815918, "global_step": 175275, "epoch": 1448} {"train_loss": -41.19619369506836, "global_step": 175276, "epoch": 1448} {"train_loss": -40.16497802734375, "global_step": 175277, "epoch": 1448} {"train_loss": -41.12921905517578, "global_step": 175278, "epoch": 1448} {"train_loss": -40.94460678100586, "global_step": 175279, "epoch": 1448} {"train_loss": -41.17599105834961, "global_step": 175280, "epoch": 1448} {"train_loss": -40.58545684814453, "global_step": 175281, "epoch": 1448} {"train_loss": -41.076316833496094, "global_step": 175282, "epoch": 1448} {"train_loss": -41.84710693359375, "global_step": 175283, "epoch": 1448} {"train_loss": -41.37933349609375, "global_step": 175284, "epoch": 1448} {"train_loss": -41.63460922241211, "global_step": 175285, "epoch": 1448} {"train_loss": -41.16392517089844, "global_step": 175286, "epoch": 1448} {"train_loss": -41.86576461791992, "global_step": 175287, "epoch": 1448} {"train_loss": -41.485755920410156, "global_step": 175288, "epoch": 1448} {"train_loss": -41.561893463134766, "global_step": 175289, "epoch": 1448} {"train_loss": -41.040565490722656, "global_step": 175290, "epoch": 1448} {"train_loss": -41.165523529052734, "global_step": 175291, "epoch": 1448} {"train_loss": -41.43476486206055, "global_step": 175292, "epoch": 1448} {"train_loss": -41.036190032958984, "global_step": 175293, "epoch": 1448} {"train_loss": -42.5267333984375, "global_step": 175294, "epoch": 1448} {"train_loss": -41.06281661987305, "global_step": 175295, "epoch": 1448} {"train_loss": -42.16062545776367, "global_step": 175296, "epoch": 1448} {"train_loss": -41.82136154174805, "global_step": 175297, "epoch": 1448} {"train_loss": -42.0933952331543, "global_step": 175298, "epoch": 1448} {"train_loss": -41.553314208984375, "global_step": 175299, "epoch": 1448} {"train_loss": -42.28523254394531, "global_step": 175300, "epoch": 1448} {"train_loss": -41.67348861694336, "global_step": 175301, "epoch": 1448} {"train_loss": -42.42301559448242, "global_step": 175302, "epoch": 1448} {"train_loss": -42.09029769897461, "global_step": 175303, "epoch": 1448} {"train_loss": -42.56488037109375, "global_step": 175304, "epoch": 1448} {"train_loss": -42.27806854248047, "global_step": 175305, "epoch": 1448} {"train_loss": -42.3786735534668, "global_step": 175306, "epoch": 1448} {"train_loss": -42.23005294799805, "global_step": 175307, "epoch": 1448} {"train_loss": -41.91419219970703, "global_step": 175308, "epoch": 1448} {"train_loss": -42.07961654663086, "global_step": 175309, "epoch": 1448} {"train_loss": -42.69450378417969, "global_step": 175310, "epoch": 1448} {"train_loss": -42.32501220703125, "global_step": 175311, "epoch": 1448} {"train_loss": -42.05012130737305, "global_step": 175312, "epoch": 1448} {"train_loss": -41.67561721801758, "global_step": 175313, "epoch": 1448} {"train_loss": -42.154354095458984, "global_step": 175314, "epoch": 1448} {"train_loss": -42.163814544677734, "global_step": 175315, "epoch": 1448} {"train_loss": -41.35661697387695, "global_step": 175316, "epoch": 1448} {"train_loss": -40.92960739135742, "global_step": 175317, "epoch": 1448} {"train_loss": -42.27669143676758, "global_step": 175318, "epoch": 1448} {"train_loss": -42.170936584472656, "global_step": 175319, "epoch": 1448} {"train_loss": -40.56208419799805, "global_step": 175320, "epoch": 1448} {"train_loss": -40.662109375, "global_step": 175321, "epoch": 1448} {"train_loss": -41.93457794189453, "global_step": 175322, "epoch": 1448} {"train_loss": -40.86920166015625, "global_step": 175323, "epoch": 1448} {"train_loss": -41.23249053955078, "global_step": 175324, "epoch": 1448} {"train_loss": -42.157623291015625, "global_step": 175325, "epoch": 1448} {"train_loss": -40.72209548950195, "global_step": 175326, "epoch": 1448} {"train_loss": -39.27256393432617, "global_step": 175327, "epoch": 1448} {"train_loss": -40.95008601038909, "global_step": 175328, "epoch": 1448, "val_loss": 2630557.5} {"train_loss": -41.262367248535156, "global_step": 175329, "epoch": 1449} {"train_loss": -40.01996994018555, "global_step": 175330, "epoch": 1449} {"train_loss": -40.655311584472656, "global_step": 175331, "epoch": 1449} {"train_loss": -41.56065368652344, "global_step": 175332, "epoch": 1449} {"train_loss": -41.185611724853516, "global_step": 175333, "epoch": 1449} {"train_loss": -41.03281784057617, "global_step": 175334, "epoch": 1449} {"train_loss": -39.8416862487793, "global_step": 175335, "epoch": 1449} {"train_loss": -42.157222747802734, "global_step": 175336, "epoch": 1449} {"train_loss": -42.095062255859375, "global_step": 175337, "epoch": 1449} {"train_loss": -41.11750411987305, "global_step": 175338, "epoch": 1449} {"train_loss": -39.96015167236328, "global_step": 175339, "epoch": 1449} {"train_loss": -41.42011260986328, "global_step": 175340, "epoch": 1449} {"train_loss": -41.22202682495117, "global_step": 175341, "epoch": 1449} {"train_loss": -42.137569427490234, "global_step": 175342, "epoch": 1449} {"train_loss": -41.44562911987305, "global_step": 175343, "epoch": 1449} {"train_loss": -41.73312759399414, "global_step": 175344, "epoch": 1449} {"train_loss": -41.82135009765625, "global_step": 175345, "epoch": 1449} {"train_loss": -41.88801193237305, "global_step": 175346, "epoch": 1449} {"train_loss": -41.43876266479492, "global_step": 175347, "epoch": 1449} {"train_loss": -40.90285873413086, "global_step": 175348, "epoch": 1449} {"train_loss": -41.703834533691406, "global_step": 175349, "epoch": 1449} {"train_loss": -40.75813674926758, "global_step": 175350, "epoch": 1449} {"train_loss": -39.94374465942383, "global_step": 175351, "epoch": 1449} {"train_loss": -40.32737350463867, "global_step": 175352, "epoch": 1449} {"train_loss": -42.026668548583984, "global_step": 175353, "epoch": 1449} {"train_loss": -41.37138748168945, "global_step": 175354, "epoch": 1449} {"train_loss": -41.755428314208984, "global_step": 175355, "epoch": 1449} {"train_loss": -41.74630355834961, "global_step": 175356, "epoch": 1449} {"train_loss": -42.07289505004883, "global_step": 175357, "epoch": 1449} {"train_loss": -42.383506774902344, "global_step": 175358, "epoch": 1449} {"train_loss": -41.514766693115234, "global_step": 175359, "epoch": 1449} {"train_loss": -40.925148010253906, "global_step": 175360, "epoch": 1449} {"train_loss": -40.446571350097656, "global_step": 175361, "epoch": 1449} {"train_loss": -40.50070571899414, "global_step": 175362, "epoch": 1449} {"train_loss": -41.435157775878906, "global_step": 175363, "epoch": 1449} {"train_loss": -41.72904586791992, "global_step": 175364, "epoch": 1449} {"train_loss": -40.92631912231445, "global_step": 175365, "epoch": 1449} {"train_loss": -41.36631393432617, "global_step": 175366, "epoch": 1449} {"train_loss": -39.72166061401367, "global_step": 175367, "epoch": 1449} {"train_loss": -41.52202606201172, "global_step": 175368, "epoch": 1449} {"train_loss": -42.509490966796875, "global_step": 175369, "epoch": 1449} {"train_loss": -40.57735061645508, "global_step": 175370, "epoch": 1449} {"train_loss": -40.55978012084961, "global_step": 175371, "epoch": 1449} {"train_loss": -41.628662109375, "global_step": 175372, "epoch": 1449} {"train_loss": -42.151039123535156, "global_step": 175373, "epoch": 1449} {"train_loss": -41.48612594604492, "global_step": 175374, "epoch": 1449} {"train_loss": -41.838626861572266, "global_step": 175375, "epoch": 1449} {"train_loss": -41.69259262084961, "global_step": 175376, "epoch": 1449} {"train_loss": -41.447757720947266, "global_step": 175377, "epoch": 1449} {"train_loss": -41.83087921142578, "global_step": 175378, "epoch": 1449} {"train_loss": -41.69118881225586, "global_step": 175379, "epoch": 1449} {"train_loss": -41.58064651489258, "global_step": 175380, "epoch": 1449} {"train_loss": -41.82163619995117, "global_step": 175381, "epoch": 1449} {"train_loss": -42.365535736083984, "global_step": 175382, "epoch": 1449} {"train_loss": -41.89057540893555, "global_step": 175383, "epoch": 1449} {"train_loss": -41.55269241333008, "global_step": 175384, "epoch": 1449} {"train_loss": -42.28844451904297, "global_step": 175385, "epoch": 1449} {"train_loss": -42.104774475097656, "global_step": 175386, "epoch": 1449} {"train_loss": -41.21147918701172, "global_step": 175387, "epoch": 1449} {"train_loss": -41.80611038208008, "global_step": 175388, "epoch": 1449} {"train_loss": -42.21504592895508, "global_step": 175389, "epoch": 1449} {"train_loss": -41.564491271972656, "global_step": 175390, "epoch": 1449} {"train_loss": -42.464717864990234, "global_step": 175391, "epoch": 1449} {"train_loss": -41.579345703125, "global_step": 175392, "epoch": 1449} {"train_loss": -42.197662353515625, "global_step": 175393, "epoch": 1449} {"train_loss": -42.6524772644043, "global_step": 175394, "epoch": 1449} {"train_loss": -41.7951545715332, "global_step": 175395, "epoch": 1449} {"train_loss": -41.71468734741211, "global_step": 175396, "epoch": 1449} {"train_loss": -42.05546188354492, "global_step": 175397, "epoch": 1449} {"train_loss": -41.45333480834961, "global_step": 175398, "epoch": 1449} {"train_loss": -41.03186798095703, "global_step": 175399, "epoch": 1449} {"train_loss": -42.723670959472656, "global_step": 175400, "epoch": 1449} {"train_loss": -41.75630569458008, "global_step": 175401, "epoch": 1449} {"train_loss": -40.98508834838867, "global_step": 175402, "epoch": 1449} {"train_loss": -41.748199462890625, "global_step": 175403, "epoch": 1449} {"train_loss": -41.877540588378906, "global_step": 175404, "epoch": 1449} {"train_loss": -40.98168182373047, "global_step": 175405, "epoch": 1449} {"train_loss": -42.12568283081055, "global_step": 175406, "epoch": 1449} {"train_loss": -41.83244323730469, "global_step": 175407, "epoch": 1449} {"train_loss": -40.79401779174805, "global_step": 175408, "epoch": 1449} {"train_loss": -41.27779769897461, "global_step": 175409, "epoch": 1449} {"train_loss": -41.997291564941406, "global_step": 175410, "epoch": 1449} {"train_loss": -40.48725509643555, "global_step": 175411, "epoch": 1449} {"train_loss": -41.99114990234375, "global_step": 175412, "epoch": 1449} {"train_loss": -40.122215270996094, "global_step": 175413, "epoch": 1449} {"train_loss": -38.543670654296875, "global_step": 175414, "epoch": 1449} {"train_loss": -40.71997833251953, "global_step": 175415, "epoch": 1449} {"train_loss": -38.54813766479492, "global_step": 175416, "epoch": 1449} {"train_loss": -38.9328727722168, "global_step": 175417, "epoch": 1449} {"train_loss": -40.405029296875, "global_step": 175418, "epoch": 1449} {"train_loss": -41.17774963378906, "global_step": 175419, "epoch": 1449} {"train_loss": -41.70779800415039, "global_step": 175420, "epoch": 1449} {"train_loss": -42.20537185668945, "global_step": 175421, "epoch": 1449} {"train_loss": -41.15137481689453, "global_step": 175422, "epoch": 1449} {"train_loss": -40.25261306762695, "global_step": 175423, "epoch": 1449} {"train_loss": -39.22426986694336, "global_step": 175424, "epoch": 1449} {"train_loss": -40.3163948059082, "global_step": 175425, "epoch": 1449} {"train_loss": -40.2492561340332, "global_step": 175426, "epoch": 1449} {"train_loss": -40.53129959106445, "global_step": 175427, "epoch": 1449} {"train_loss": -41.56466293334961, "global_step": 175428, "epoch": 1449} {"train_loss": -40.985809326171875, "global_step": 175429, "epoch": 1449} {"train_loss": -40.506431579589844, "global_step": 175430, "epoch": 1449} {"train_loss": -40.80718994140625, "global_step": 175431, "epoch": 1449} {"train_loss": -42.080963134765625, "global_step": 175432, "epoch": 1449} {"train_loss": -41.2095832824707, "global_step": 175433, "epoch": 1449} {"train_loss": -41.017494201660156, "global_step": 175434, "epoch": 1449} {"train_loss": -41.55953598022461, "global_step": 175435, "epoch": 1449} {"train_loss": -41.33762741088867, "global_step": 175436, "epoch": 1449} {"train_loss": -40.44195556640625, "global_step": 175437, "epoch": 1449} {"train_loss": -41.058807373046875, "global_step": 175438, "epoch": 1449} {"train_loss": -40.91071319580078, "global_step": 175439, "epoch": 1449} {"train_loss": -41.76578903198242, "global_step": 175440, "epoch": 1449} {"train_loss": -41.73093032836914, "global_step": 175441, "epoch": 1449} {"train_loss": -40.48989486694336, "global_step": 175442, "epoch": 1449} {"train_loss": -40.71263885498047, "global_step": 175443, "epoch": 1449} {"train_loss": -40.8388786315918, "global_step": 175444, "epoch": 1449} {"train_loss": -41.4339714050293, "global_step": 175445, "epoch": 1449} {"train_loss": -41.25214385986328, "global_step": 175446, "epoch": 1449} {"train_loss": -40.026649475097656, "global_step": 175447, "epoch": 1449} {"train_loss": -41.65439987182617, "global_step": 175448, "epoch": 1449} {"train_loss": -41.27075283586486, "global_step": 175449, "epoch": 1449, "val_loss": 2702672.25} {"train_loss": -40.31062698364258, "global_step": 175450, "epoch": 1450} {"train_loss": -39.7068977355957, "global_step": 175451, "epoch": 1450} {"train_loss": -42.03459548950195, "global_step": 175452, "epoch": 1450} {"train_loss": -39.92081832885742, "global_step": 175453, "epoch": 1450} {"train_loss": -38.83169174194336, "global_step": 175454, "epoch": 1450} {"train_loss": -41.66301345825195, "global_step": 175455, "epoch": 1450} {"train_loss": -40.49872970581055, "global_step": 175456, "epoch": 1450} {"train_loss": -40.928871154785156, "global_step": 175457, "epoch": 1450} {"train_loss": -41.12890625, "global_step": 175458, "epoch": 1450} {"train_loss": -41.53904342651367, "global_step": 175459, "epoch": 1450} {"train_loss": -40.869598388671875, "global_step": 175460, "epoch": 1450} {"train_loss": -41.07411575317383, "global_step": 175461, "epoch": 1450} {"train_loss": -41.26765441894531, "global_step": 175462, "epoch": 1450} {"train_loss": -41.92499542236328, "global_step": 175463, "epoch": 1450} {"train_loss": -41.673152923583984, "global_step": 175464, "epoch": 1450} {"train_loss": -41.81801223754883, "global_step": 175465, "epoch": 1450} {"train_loss": -41.55711364746094, "global_step": 175466, "epoch": 1450} {"train_loss": -42.07075881958008, "global_step": 175467, "epoch": 1450} {"train_loss": -41.74892044067383, "global_step": 175468, "epoch": 1450} {"train_loss": -42.3081169128418, "global_step": 175469, "epoch": 1450} {"train_loss": -41.01457977294922, "global_step": 175470, "epoch": 1450} {"train_loss": -40.581878662109375, "global_step": 175471, "epoch": 1450} {"train_loss": -41.40571975708008, "global_step": 175472, "epoch": 1450} {"train_loss": -41.040828704833984, "global_step": 175473, "epoch": 1450} {"train_loss": -41.93549728393555, "global_step": 175474, "epoch": 1450} {"train_loss": -42.2395133972168, "global_step": 175475, "epoch": 1450} {"train_loss": -41.8199577331543, "global_step": 175476, "epoch": 1450} {"train_loss": -41.59027862548828, "global_step": 175477, "epoch": 1450} {"train_loss": -42.17484664916992, "global_step": 175478, "epoch": 1450} {"train_loss": -42.3301887512207, "global_step": 175479, "epoch": 1450} {"train_loss": -41.595577239990234, "global_step": 175480, "epoch": 1450} {"train_loss": -42.31587219238281, "global_step": 175481, "epoch": 1450} {"train_loss": -40.88212203979492, "global_step": 175482, "epoch": 1450} {"train_loss": -42.30857467651367, "global_step": 175483, "epoch": 1450} {"train_loss": -42.532840728759766, "global_step": 175484, "epoch": 1450} {"train_loss": -42.79066467285156, "global_step": 175485, "epoch": 1450} {"train_loss": -42.71492004394531, "global_step": 175486, "epoch": 1450} {"train_loss": -42.335853576660156, "global_step": 175487, "epoch": 1450} {"train_loss": -42.38451385498047, "global_step": 175488, "epoch": 1450} {"train_loss": -41.321170806884766, "global_step": 175489, "epoch": 1450} {"train_loss": -42.76249313354492, "global_step": 175490, "epoch": 1450} {"train_loss": -42.10988998413086, "global_step": 175491, "epoch": 1450} {"train_loss": -42.364234924316406, "global_step": 175492, "epoch": 1450} {"train_loss": -41.879058837890625, "global_step": 175493, "epoch": 1450} {"train_loss": -41.96904373168945, "global_step": 175494, "epoch": 1450} {"train_loss": -41.59952926635742, "global_step": 175495, "epoch": 1450} {"train_loss": -41.84991455078125, "global_step": 175496, "epoch": 1450} {"train_loss": -41.714447021484375, "global_step": 175497, "epoch": 1450} {"train_loss": -40.44285202026367, "global_step": 175498, "epoch": 1450} {"train_loss": -39.65468215942383, "global_step": 175499, "epoch": 1450} {"train_loss": -41.590633392333984, "global_step": 175500, "epoch": 1450} {"train_loss": -39.78591537475586, "global_step": 175501, "epoch": 1450} {"train_loss": -36.902992248535156, "global_step": 175502, "epoch": 1450} {"train_loss": -39.96871566772461, "global_step": 175503, "epoch": 1450} {"train_loss": -38.90363693237305, "global_step": 175504, "epoch": 1450} {"train_loss": -36.73394775390625, "global_step": 175505, "epoch": 1450} {"train_loss": -38.199275970458984, "global_step": 175506, "epoch": 1450} {"train_loss": -39.698936462402344, "global_step": 175507, "epoch": 1450} {"train_loss": -37.238216400146484, "global_step": 175508, "epoch": 1450} {"train_loss": -40.66484451293945, "global_step": 175509, "epoch": 1450} {"train_loss": -37.99142837524414, "global_step": 175510, "epoch": 1450} {"train_loss": -37.46896743774414, "global_step": 175511, "epoch": 1450} {"train_loss": -39.27488327026367, "global_step": 175512, "epoch": 1450} {"train_loss": -35.02824401855469, "global_step": 175513, "epoch": 1450} {"train_loss": -39.6895751953125, "global_step": 175514, "epoch": 1450} {"train_loss": -39.06193161010742, "global_step": 175515, "epoch": 1450} {"train_loss": -40.10993576049805, "global_step": 175516, "epoch": 1450} {"train_loss": -39.36393356323242, "global_step": 175517, "epoch": 1450} {"train_loss": -40.40788650512695, "global_step": 175518, "epoch": 1450} {"train_loss": -40.707000732421875, "global_step": 175519, "epoch": 1450} {"train_loss": -40.60000228881836, "global_step": 175520, "epoch": 1450} {"train_loss": -40.3585319519043, "global_step": 175521, "epoch": 1450} {"train_loss": -40.298057556152344, "global_step": 175522, "epoch": 1450} {"train_loss": -39.73206329345703, "global_step": 175523, "epoch": 1450} {"train_loss": -40.982784271240234, "global_step": 175524, "epoch": 1450} {"train_loss": -40.34861755371094, "global_step": 175525, "epoch": 1450} {"train_loss": -39.832672119140625, "global_step": 175526, "epoch": 1450} {"train_loss": -41.45402145385742, "global_step": 175527, "epoch": 1450} {"train_loss": -40.27754592895508, "global_step": 175528, "epoch": 1450} {"train_loss": -41.19233322143555, "global_step": 175529, "epoch": 1450} {"train_loss": -40.565120697021484, "global_step": 175530, "epoch": 1450} {"train_loss": -41.04826736450195, "global_step": 175531, "epoch": 1450} {"train_loss": -40.66292190551758, "global_step": 175532, "epoch": 1450} {"train_loss": -39.99711608886719, "global_step": 175533, "epoch": 1450} {"train_loss": -40.880889892578125, "global_step": 175534, "epoch": 1450} {"train_loss": -41.928993225097656, "global_step": 175535, "epoch": 1450} {"train_loss": -40.77312088012695, "global_step": 175536, "epoch": 1450} {"train_loss": -42.25818634033203, "global_step": 175537, "epoch": 1450} {"train_loss": -40.93561553955078, "global_step": 175538, "epoch": 1450} {"train_loss": -41.651702880859375, "global_step": 175539, "epoch": 1450} {"train_loss": -41.10785675048828, "global_step": 175540, "epoch": 1450} {"train_loss": -41.3692512512207, "global_step": 175541, "epoch": 1450} {"train_loss": -41.42006301879883, "global_step": 175542, "epoch": 1450} {"train_loss": -41.659088134765625, "global_step": 175543, "epoch": 1450} {"train_loss": -41.31631088256836, "global_step": 175544, "epoch": 1450} {"train_loss": -41.45986557006836, "global_step": 175545, "epoch": 1450} {"train_loss": -41.89314651489258, "global_step": 175546, "epoch": 1450} {"train_loss": -41.770042419433594, "global_step": 175547, "epoch": 1450} {"train_loss": -41.943603515625, "global_step": 175548, "epoch": 1450} {"train_loss": -41.7680778503418, "global_step": 175549, "epoch": 1450} {"train_loss": -42.14276123046875, "global_step": 175550, "epoch": 1450} {"train_loss": -41.8583984375, "global_step": 175551, "epoch": 1450} {"train_loss": -41.70791244506836, "global_step": 175552, "epoch": 1450} {"train_loss": -41.8083381652832, "global_step": 175553, "epoch": 1450} {"train_loss": -41.99717330932617, "global_step": 175554, "epoch": 1450} {"train_loss": -41.579647064208984, "global_step": 175555, "epoch": 1450} {"train_loss": -42.16858673095703, "global_step": 175556, "epoch": 1450} {"train_loss": -42.016475677490234, "global_step": 175557, "epoch": 1450} {"train_loss": -41.79283142089844, "global_step": 175558, "epoch": 1450} {"train_loss": -41.85201644897461, "global_step": 175559, "epoch": 1450} {"train_loss": -42.448631286621094, "global_step": 175560, "epoch": 1450} {"train_loss": -42.16388702392578, "global_step": 175561, "epoch": 1450} {"train_loss": -41.9578971862793, "global_step": 175562, "epoch": 1450} {"train_loss": -42.69068908691406, "global_step": 175563, "epoch": 1450} {"train_loss": -42.40217971801758, "global_step": 175564, "epoch": 1450} {"train_loss": -42.337318420410156, "global_step": 175565, "epoch": 1450} {"train_loss": -42.697486877441406, "global_step": 175566, "epoch": 1450} {"train_loss": -41.96937942504883, "global_step": 175567, "epoch": 1450} {"train_loss": -42.82461166381836, "global_step": 175568, "epoch": 1450} {"train_loss": -42.53538513183594, "global_step": 175569, "epoch": 1450} {"train_loss": -41.09204322247466, "global_step": 175570, "epoch": 1450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 2675777.25} {"train_loss": -42.41162109375, "global_step": 175571, "epoch": 1451} {"train_loss": -42.169124603271484, "global_step": 175572, "epoch": 1451} {"train_loss": -42.0849723815918, "global_step": 175573, "epoch": 1451} {"train_loss": -42.57664108276367, "global_step": 175574, "epoch": 1451} {"train_loss": -42.9837532043457, "global_step": 175575, "epoch": 1451} {"train_loss": -42.64146041870117, "global_step": 175576, "epoch": 1451} {"train_loss": -42.377479553222656, "global_step": 175577, "epoch": 1451} {"train_loss": -42.12047576904297, "global_step": 175578, "epoch": 1451} {"train_loss": -38.418479919433594, "global_step": 175579, "epoch": 1451} {"train_loss": -40.910247802734375, "global_step": 175580, "epoch": 1451} {"train_loss": -40.4599609375, "global_step": 175581, "epoch": 1451} {"train_loss": -32.327247619628906, "global_step": 175582, "epoch": 1451} {"train_loss": -39.079097747802734, "global_step": 175583, "epoch": 1451} {"train_loss": -33.658748626708984, "global_step": 175584, "epoch": 1451} {"train_loss": -39.71910095214844, "global_step": 175585, "epoch": 1451} {"train_loss": -37.67256546020508, "global_step": 175586, "epoch": 1451} {"train_loss": -33.67119216918945, "global_step": 175587, "epoch": 1451} {"train_loss": -35.5726318359375, "global_step": 175588, "epoch": 1451} {"train_loss": -39.652706146240234, "global_step": 175589, "epoch": 1451} {"train_loss": -39.46278762817383, "global_step": 175590, "epoch": 1451} {"train_loss": -38.687984466552734, "global_step": 175591, "epoch": 1451} {"train_loss": -33.627655029296875, "global_step": 175592, "epoch": 1451} {"train_loss": -38.25632858276367, "global_step": 175593, "epoch": 1451} {"train_loss": -37.7584114074707, "global_step": 175594, "epoch": 1451} {"train_loss": -34.23916244506836, "global_step": 175595, "epoch": 1451} {"train_loss": -37.27101135253906, "global_step": 175596, "epoch": 1451} {"train_loss": -39.01327133178711, "global_step": 175597, "epoch": 1451} {"train_loss": -39.52328109741211, "global_step": 175598, "epoch": 1451} {"train_loss": -39.043575286865234, "global_step": 175599, "epoch": 1451} {"train_loss": -39.1447639465332, "global_step": 175600, "epoch": 1451} {"train_loss": -38.82839584350586, "global_step": 175601, "epoch": 1451} {"train_loss": -38.74462890625, "global_step": 175602, "epoch": 1451} {"train_loss": -38.480194091796875, "global_step": 175603, "epoch": 1451} {"train_loss": -39.900787353515625, "global_step": 175604, "epoch": 1451} {"train_loss": -38.55509948730469, "global_step": 175605, "epoch": 1451} {"train_loss": -40.127052307128906, "global_step": 175606, "epoch": 1451} {"train_loss": -39.58518981933594, "global_step": 175607, "epoch": 1451} {"train_loss": -39.79780960083008, "global_step": 175608, "epoch": 1451} {"train_loss": -40.0701789855957, "global_step": 175609, "epoch": 1451} {"train_loss": -39.986328125, "global_step": 175610, "epoch": 1451} {"train_loss": -40.49876022338867, "global_step": 175611, "epoch": 1451} {"train_loss": -40.805946350097656, "global_step": 175612, "epoch": 1451} {"train_loss": -40.95803451538086, "global_step": 175613, "epoch": 1451} {"train_loss": -39.730987548828125, "global_step": 175614, "epoch": 1451} {"train_loss": -39.935176849365234, "global_step": 175615, "epoch": 1451} {"train_loss": -40.6374626159668, "global_step": 175616, "epoch": 1451} {"train_loss": -40.429405212402344, "global_step": 175617, "epoch": 1451} {"train_loss": -41.007728576660156, "global_step": 175618, "epoch": 1451} {"train_loss": -40.25545120239258, "global_step": 175619, "epoch": 1451} {"train_loss": -41.71760177612305, "global_step": 175620, "epoch": 1451} {"train_loss": -40.949684143066406, "global_step": 175621, "epoch": 1451} {"train_loss": -40.459598541259766, "global_step": 175622, "epoch": 1451} {"train_loss": -41.47766876220703, "global_step": 175623, "epoch": 1451} {"train_loss": -41.47932052612305, "global_step": 175624, "epoch": 1451} {"train_loss": -41.87893295288086, "global_step": 175625, "epoch": 1451} {"train_loss": -40.44246292114258, "global_step": 175626, "epoch": 1451} {"train_loss": -41.457698822021484, "global_step": 175627, "epoch": 1451} {"train_loss": -41.220489501953125, "global_step": 175628, "epoch": 1451} {"train_loss": -41.18919372558594, "global_step": 175629, "epoch": 1451} {"train_loss": -41.85887908935547, "global_step": 175630, "epoch": 1451} {"train_loss": -41.416404724121094, "global_step": 175631, "epoch": 1451} {"train_loss": -41.52748489379883, "global_step": 175632, "epoch": 1451} {"train_loss": -41.4940071105957, "global_step": 175633, "epoch": 1451} {"train_loss": -40.73929214477539, "global_step": 175634, "epoch": 1451} {"train_loss": -41.49363708496094, "global_step": 175635, "epoch": 1451} {"train_loss": -41.88362503051758, "global_step": 175636, "epoch": 1451} {"train_loss": -41.0349235534668, "global_step": 175637, "epoch": 1451} {"train_loss": -42.17547607421875, "global_step": 175638, "epoch": 1451} {"train_loss": -42.395015716552734, "global_step": 175639, "epoch": 1451} {"train_loss": -40.9193229675293, "global_step": 175640, "epoch": 1451} {"train_loss": -41.684017181396484, "global_step": 175641, "epoch": 1451} {"train_loss": -42.22840881347656, "global_step": 175642, "epoch": 1451} {"train_loss": -41.80803680419922, "global_step": 175643, "epoch": 1451} {"train_loss": -41.64804458618164, "global_step": 175644, "epoch": 1451} {"train_loss": -42.17317581176758, "global_step": 175645, "epoch": 1451} {"train_loss": -42.35358810424805, "global_step": 175646, "epoch": 1451} {"train_loss": -42.09229278564453, "global_step": 175647, "epoch": 1451} {"train_loss": -42.35425567626953, "global_step": 175648, "epoch": 1451} {"train_loss": -41.998165130615234, "global_step": 175649, "epoch": 1451} {"train_loss": -41.55464553833008, "global_step": 175650, "epoch": 1451} {"train_loss": -42.0944938659668, "global_step": 175651, "epoch": 1451} {"train_loss": -42.28493881225586, "global_step": 175652, "epoch": 1451} {"train_loss": -42.378570556640625, "global_step": 175653, "epoch": 1451} {"train_loss": -42.390193939208984, "global_step": 175654, "epoch": 1451} {"train_loss": -42.40128707885742, "global_step": 175655, "epoch": 1451} {"train_loss": -42.17832946777344, "global_step": 175656, "epoch": 1451} {"train_loss": -41.571876525878906, "global_step": 175657, "epoch": 1451} {"train_loss": -42.15049743652344, "global_step": 175658, "epoch": 1451} {"train_loss": -42.51654815673828, "global_step": 175659, "epoch": 1451} {"train_loss": -41.99391555786133, "global_step": 175660, "epoch": 1451} {"train_loss": -41.05364227294922, "global_step": 175661, "epoch": 1451} {"train_loss": -40.31621551513672, "global_step": 175662, "epoch": 1451} {"train_loss": -41.96321105957031, "global_step": 175663, "epoch": 1451} {"train_loss": -42.53939437866211, "global_step": 175664, "epoch": 1451} {"train_loss": -42.5457763671875, "global_step": 175665, "epoch": 1451} {"train_loss": -41.38704299926758, "global_step": 175666, "epoch": 1451} {"train_loss": -39.34649658203125, "global_step": 175667, "epoch": 1451} {"train_loss": -36.13820266723633, "global_step": 175668, "epoch": 1451} {"train_loss": -42.18699264526367, "global_step": 175669, "epoch": 1451} {"train_loss": -40.8119010925293, "global_step": 175670, "epoch": 1451} {"train_loss": -36.254425048828125, "global_step": 175671, "epoch": 1451} {"train_loss": -37.61260986328125, "global_step": 175672, "epoch": 1451} {"train_loss": -42.000179290771484, "global_step": 175673, "epoch": 1451} {"train_loss": -38.968963623046875, "global_step": 175674, "epoch": 1451} {"train_loss": -35.9372444152832, "global_step": 175675, "epoch": 1451} {"train_loss": -40.56868362426758, "global_step": 175676, "epoch": 1451} {"train_loss": -40.300960540771484, "global_step": 175677, "epoch": 1451} {"train_loss": -39.033241271972656, "global_step": 175678, "epoch": 1451} {"train_loss": -41.164276123046875, "global_step": 175679, "epoch": 1451} {"train_loss": -41.20450210571289, "global_step": 175680, "epoch": 1451} {"train_loss": -40.414608001708984, "global_step": 175681, "epoch": 1451} {"train_loss": -41.20375061035156, "global_step": 175682, "epoch": 1451} {"train_loss": -41.121517181396484, "global_step": 175683, "epoch": 1451} {"train_loss": -40.36164474487305, "global_step": 175684, "epoch": 1451} {"train_loss": -40.44203186035156, "global_step": 175685, "epoch": 1451} {"train_loss": -40.873626708984375, "global_step": 175686, "epoch": 1451} {"train_loss": -39.91134262084961, "global_step": 175687, "epoch": 1451} {"train_loss": -40.77247619628906, "global_step": 175688, "epoch": 1451} {"train_loss": -39.88943099975586, "global_step": 175689, "epoch": 1451} {"train_loss": -36.5733757019043, "global_step": 175690, "epoch": 1451} {"train_loss": -40.26380148012776, "global_step": 175691, "epoch": 1451, "val_loss": 2604240.25} {"train_loss": -26.285505294799805, "global_step": 175692, "epoch": 1452} {"train_loss": -26.60188865661621, "global_step": 175693, "epoch": 1452} {"train_loss": -32.5389404296875, "global_step": 175694, "epoch": 1452} {"train_loss": -30.64058494567871, "global_step": 175695, "epoch": 1452} {"train_loss": -30.798358917236328, "global_step": 175696, "epoch": 1452} {"train_loss": -36.38621139526367, "global_step": 175697, "epoch": 1452} {"train_loss": -36.27078628540039, "global_step": 175698, "epoch": 1452} {"train_loss": -38.89638900756836, "global_step": 175699, "epoch": 1452} {"train_loss": -36.40790939331055, "global_step": 175700, "epoch": 1452} {"train_loss": -38.26223373413086, "global_step": 175701, "epoch": 1452} {"train_loss": -34.82102584838867, "global_step": 175702, "epoch": 1452} {"train_loss": -38.2333869934082, "global_step": 175703, "epoch": 1452} {"train_loss": -36.67744827270508, "global_step": 175704, "epoch": 1452} {"train_loss": -38.6682243347168, "global_step": 175705, "epoch": 1452} {"train_loss": -38.9050407409668, "global_step": 175706, "epoch": 1452} {"train_loss": -39.283912658691406, "global_step": 175707, "epoch": 1452} {"train_loss": -39.19316482543945, "global_step": 175708, "epoch": 1452} {"train_loss": -39.444793701171875, "global_step": 175709, "epoch": 1452} {"train_loss": -39.87478256225586, "global_step": 175710, "epoch": 1452} {"train_loss": -39.34202194213867, "global_step": 175711, "epoch": 1452} {"train_loss": -40.30149459838867, "global_step": 175712, "epoch": 1452} {"train_loss": -40.53009796142578, "global_step": 175713, "epoch": 1452} {"train_loss": -40.6917610168457, "global_step": 175714, "epoch": 1452} {"train_loss": -40.56955337524414, "global_step": 175715, "epoch": 1452} {"train_loss": -40.81400680541992, "global_step": 175716, "epoch": 1452} {"train_loss": -40.49856948852539, "global_step": 175717, "epoch": 1452} {"train_loss": -40.59029006958008, "global_step": 175718, "epoch": 1452} {"train_loss": -41.12363815307617, "global_step": 175719, "epoch": 1452} {"train_loss": -40.71883773803711, "global_step": 175720, "epoch": 1452} {"train_loss": -41.07313919067383, "global_step": 175721, "epoch": 1452} {"train_loss": -41.3415412902832, "global_step": 175722, "epoch": 1452} {"train_loss": -40.98303985595703, "global_step": 175723, "epoch": 1452} {"train_loss": -41.068450927734375, "global_step": 175724, "epoch": 1452} {"train_loss": -41.22664260864258, "global_step": 175725, "epoch": 1452} {"train_loss": -40.76860809326172, "global_step": 175726, "epoch": 1452} {"train_loss": -40.4798583984375, "global_step": 175727, "epoch": 1452} {"train_loss": -41.30369186401367, "global_step": 175728, "epoch": 1452} {"train_loss": -40.37560272216797, "global_step": 175729, "epoch": 1452} {"train_loss": -41.10356140136719, "global_step": 175730, "epoch": 1452} {"train_loss": -41.79001998901367, "global_step": 175731, "epoch": 1452} {"train_loss": -40.9425163269043, "global_step": 175732, "epoch": 1452} {"train_loss": -41.074947357177734, "global_step": 175733, "epoch": 1452} {"train_loss": -41.23883056640625, "global_step": 175734, "epoch": 1452} {"train_loss": -41.18522262573242, "global_step": 175735, "epoch": 1452} {"train_loss": -41.52467346191406, "global_step": 175736, "epoch": 1452} {"train_loss": -41.111881256103516, "global_step": 175737, "epoch": 1452} {"train_loss": -41.071163177490234, "global_step": 175738, "epoch": 1452} {"train_loss": -41.2040901184082, "global_step": 175739, "epoch": 1452} {"train_loss": -41.435455322265625, "global_step": 175740, "epoch": 1452} {"train_loss": -41.024898529052734, "global_step": 175741, "epoch": 1452} {"train_loss": -41.43526840209961, "global_step": 175742, "epoch": 1452} {"train_loss": -40.97888946533203, "global_step": 175743, "epoch": 1452} {"train_loss": -41.71625900268555, "global_step": 175744, "epoch": 1452} {"train_loss": -41.82033920288086, "global_step": 175745, "epoch": 1452} {"train_loss": -41.754085540771484, "global_step": 175746, "epoch": 1452} {"train_loss": -41.683074951171875, "global_step": 175747, "epoch": 1452} {"train_loss": -41.7340202331543, "global_step": 175748, "epoch": 1452} {"train_loss": -41.951812744140625, "global_step": 175749, "epoch": 1452} {"train_loss": -41.543094635009766, "global_step": 175750, "epoch": 1452} {"train_loss": -42.273521423339844, "global_step": 175751, "epoch": 1452} {"train_loss": -42.32756423950195, "global_step": 175752, "epoch": 1452} {"train_loss": -41.787174224853516, "global_step": 175753, "epoch": 1452} {"train_loss": -41.993656158447266, "global_step": 175754, "epoch": 1452} {"train_loss": -41.96209716796875, "global_step": 175755, "epoch": 1452} {"train_loss": -41.96561813354492, "global_step": 175756, "epoch": 1452} {"train_loss": -42.10002517700195, "global_step": 175757, "epoch": 1452} {"train_loss": -42.1772346496582, "global_step": 175758, "epoch": 1452} {"train_loss": -42.57616424560547, "global_step": 175759, "epoch": 1452} {"train_loss": -42.15363693237305, "global_step": 175760, "epoch": 1452} {"train_loss": -41.923500061035156, "global_step": 175761, "epoch": 1452} {"train_loss": -42.22596740722656, "global_step": 175762, "epoch": 1452} {"train_loss": -42.09055709838867, "global_step": 175763, "epoch": 1452} {"train_loss": -42.3297119140625, "global_step": 175764, "epoch": 1452} {"train_loss": -42.16181564331055, "global_step": 175765, "epoch": 1452} {"train_loss": -41.64693832397461, "global_step": 175766, "epoch": 1452} {"train_loss": -41.41603469848633, "global_step": 175767, "epoch": 1452} {"train_loss": -42.42765426635742, "global_step": 175768, "epoch": 1452} {"train_loss": -42.49689483642578, "global_step": 175769, "epoch": 1452} {"train_loss": -41.862667083740234, "global_step": 175770, "epoch": 1452} {"train_loss": -41.91282272338867, "global_step": 175771, "epoch": 1452} {"train_loss": -42.14213180541992, "global_step": 175772, "epoch": 1452} {"train_loss": -42.06272506713867, "global_step": 175773, "epoch": 1452} {"train_loss": -42.31243896484375, "global_step": 175774, "epoch": 1452} {"train_loss": -42.41083908081055, "global_step": 175775, "epoch": 1452} {"train_loss": -42.01020431518555, "global_step": 175776, "epoch": 1452} {"train_loss": -41.62027359008789, "global_step": 175777, "epoch": 1452} {"train_loss": -40.85980224609375, "global_step": 175778, "epoch": 1452} {"train_loss": -40.852718353271484, "global_step": 175779, "epoch": 1452} {"train_loss": -41.401729583740234, "global_step": 175780, "epoch": 1452} {"train_loss": -42.10842514038086, "global_step": 175781, "epoch": 1452} {"train_loss": -42.1566162109375, "global_step": 175782, "epoch": 1452} {"train_loss": -42.44683837890625, "global_step": 175783, "epoch": 1452} {"train_loss": -41.92731857299805, "global_step": 175784, "epoch": 1452} {"train_loss": -41.66023635864258, "global_step": 175785, "epoch": 1452} {"train_loss": -40.9268913269043, "global_step": 175786, "epoch": 1452} {"train_loss": -42.360111236572266, "global_step": 175787, "epoch": 1452} {"train_loss": -42.309139251708984, "global_step": 175788, "epoch": 1452} {"train_loss": -40.8287467956543, "global_step": 175789, "epoch": 1452} {"train_loss": -41.06734848022461, "global_step": 175790, "epoch": 1452} {"train_loss": -40.49568557739258, "global_step": 175791, "epoch": 1452} {"train_loss": -40.91898727416992, "global_step": 175792, "epoch": 1452} {"train_loss": -42.17158126831055, "global_step": 175793, "epoch": 1452} {"train_loss": -41.5324821472168, "global_step": 175794, "epoch": 1452} {"train_loss": -42.108882904052734, "global_step": 175795, "epoch": 1452} {"train_loss": -41.37990951538086, "global_step": 175796, "epoch": 1452} {"train_loss": -41.8635139465332, "global_step": 175797, "epoch": 1452} {"train_loss": -41.71757125854492, "global_step": 175798, "epoch": 1452} {"train_loss": -41.36783218383789, "global_step": 175799, "epoch": 1452} {"train_loss": -40.928367614746094, "global_step": 175800, "epoch": 1452} {"train_loss": -41.0791015625, "global_step": 175801, "epoch": 1452} {"train_loss": -41.70262908935547, "global_step": 175802, "epoch": 1452} {"train_loss": -41.56081771850586, "global_step": 175803, "epoch": 1452} {"train_loss": -41.254737854003906, "global_step": 175804, "epoch": 1452} {"train_loss": -41.29602813720703, "global_step": 175805, "epoch": 1452} {"train_loss": -40.35673904418945, "global_step": 175806, "epoch": 1452} {"train_loss": -40.4085807800293, "global_step": 175807, "epoch": 1452} {"train_loss": -41.5907096862793, "global_step": 175808, "epoch": 1452} {"train_loss": -40.90017318725586, "global_step": 175809, "epoch": 1452} {"train_loss": -41.59639358520508, "global_step": 175810, "epoch": 1452} {"train_loss": -41.1535758972168, "global_step": 175811, "epoch": 1452} {"train_loss": -40.557495006845016, "global_step": 175812, "epoch": 1452, "val_loss": 2734155.75} {"train_loss": -41.05042266845703, "global_step": 175813, "epoch": 1453} {"train_loss": -40.35760498046875, "global_step": 175814, "epoch": 1453} {"train_loss": -40.33427047729492, "global_step": 175815, "epoch": 1453} {"train_loss": -41.18498611450195, "global_step": 175816, "epoch": 1453} {"train_loss": -40.555538177490234, "global_step": 175817, "epoch": 1453} {"train_loss": -39.924407958984375, "global_step": 175818, "epoch": 1453} {"train_loss": -42.35755157470703, "global_step": 175819, "epoch": 1453} {"train_loss": -40.67878341674805, "global_step": 175820, "epoch": 1453} {"train_loss": -40.38697052001953, "global_step": 175821, "epoch": 1453} {"train_loss": -40.71509552001953, "global_step": 175822, "epoch": 1453} {"train_loss": -42.333152770996094, "global_step": 175823, "epoch": 1453} {"train_loss": -39.61601257324219, "global_step": 175824, "epoch": 1453} {"train_loss": -41.19259262084961, "global_step": 175825, "epoch": 1453} {"train_loss": -40.80769729614258, "global_step": 175826, "epoch": 1453} {"train_loss": -39.2926139831543, "global_step": 175827, "epoch": 1453} {"train_loss": -40.45151138305664, "global_step": 175828, "epoch": 1453} {"train_loss": -41.015987396240234, "global_step": 175829, "epoch": 1453} {"train_loss": -40.987728118896484, "global_step": 175830, "epoch": 1453} {"train_loss": -40.924835205078125, "global_step": 175831, "epoch": 1453} {"train_loss": -41.82729721069336, "global_step": 175832, "epoch": 1453} {"train_loss": -41.10664749145508, "global_step": 175833, "epoch": 1453} {"train_loss": -41.30025863647461, "global_step": 175834, "epoch": 1453} {"train_loss": -41.528377532958984, "global_step": 175835, "epoch": 1453} {"train_loss": -40.76888656616211, "global_step": 175836, "epoch": 1453} {"train_loss": -41.31071853637695, "global_step": 175837, "epoch": 1453} {"train_loss": -40.790924072265625, "global_step": 175838, "epoch": 1453} {"train_loss": -41.10133743286133, "global_step": 175839, "epoch": 1453} {"train_loss": -41.605560302734375, "global_step": 175840, "epoch": 1453} {"train_loss": -41.05839920043945, "global_step": 175841, "epoch": 1453} {"train_loss": -41.04779052734375, "global_step": 175842, "epoch": 1453} {"train_loss": -40.68650436401367, "global_step": 175843, "epoch": 1453} {"train_loss": -40.64960479736328, "global_step": 175844, "epoch": 1453} {"train_loss": -41.08794021606445, "global_step": 175845, "epoch": 1453} {"train_loss": -40.3840446472168, "global_step": 175846, "epoch": 1453} {"train_loss": -41.53472900390625, "global_step": 175847, "epoch": 1453} {"train_loss": -41.341468811035156, "global_step": 175848, "epoch": 1453} {"train_loss": -41.80438995361328, "global_step": 175849, "epoch": 1453} {"train_loss": -40.341949462890625, "global_step": 175850, "epoch": 1453} {"train_loss": -41.326045989990234, "global_step": 175851, "epoch": 1453} {"train_loss": -42.16006088256836, "global_step": 175852, "epoch": 1453} {"train_loss": -40.79403305053711, "global_step": 175853, "epoch": 1453} {"train_loss": -40.81476974487305, "global_step": 175854, "epoch": 1453} {"train_loss": -40.518436431884766, "global_step": 175855, "epoch": 1453} {"train_loss": -41.55769729614258, "global_step": 175856, "epoch": 1453} {"train_loss": -40.025997161865234, "global_step": 175857, "epoch": 1453} {"train_loss": -41.34333801269531, "global_step": 175858, "epoch": 1453} {"train_loss": -39.864845275878906, "global_step": 175859, "epoch": 1453} {"train_loss": -41.39321517944336, "global_step": 175860, "epoch": 1453} {"train_loss": -41.40269088745117, "global_step": 175861, "epoch": 1453} {"train_loss": -41.254180908203125, "global_step": 175862, "epoch": 1453} {"train_loss": -41.54075241088867, "global_step": 175863, "epoch": 1453} {"train_loss": -41.89068603515625, "global_step": 175864, "epoch": 1453} {"train_loss": -41.7462043762207, "global_step": 175865, "epoch": 1453} {"train_loss": -41.38526916503906, "global_step": 175866, "epoch": 1453} {"train_loss": -42.035926818847656, "global_step": 175867, "epoch": 1453} {"train_loss": -41.660797119140625, "global_step": 175868, "epoch": 1453} {"train_loss": -42.09263229370117, "global_step": 175869, "epoch": 1453} {"train_loss": -41.7306022644043, "global_step": 175870, "epoch": 1453} {"train_loss": -42.264801025390625, "global_step": 175871, "epoch": 1453} {"train_loss": -42.033504486083984, "global_step": 175872, "epoch": 1453} {"train_loss": -42.38397216796875, "global_step": 175873, "epoch": 1453} {"train_loss": -41.43430709838867, "global_step": 175874, "epoch": 1453} {"train_loss": -41.448822021484375, "global_step": 175875, "epoch": 1453} {"train_loss": -42.13628387451172, "global_step": 175876, "epoch": 1453} {"train_loss": -40.971126556396484, "global_step": 175877, "epoch": 1453} {"train_loss": -41.13066864013672, "global_step": 175878, "epoch": 1453} {"train_loss": -42.05302810668945, "global_step": 175879, "epoch": 1453} {"train_loss": -41.6783332824707, "global_step": 175880, "epoch": 1453} {"train_loss": -40.962379455566406, "global_step": 175881, "epoch": 1453} {"train_loss": -41.75092315673828, "global_step": 175882, "epoch": 1453} {"train_loss": -41.4687614440918, "global_step": 175883, "epoch": 1453} {"train_loss": -41.61849594116211, "global_step": 175884, "epoch": 1453} {"train_loss": -41.22857666015625, "global_step": 175885, "epoch": 1453} {"train_loss": -41.6802978515625, "global_step": 175886, "epoch": 1453} {"train_loss": -41.62285614013672, "global_step": 175887, "epoch": 1453} {"train_loss": -41.10029220581055, "global_step": 175888, "epoch": 1453} {"train_loss": -41.50286865234375, "global_step": 175889, "epoch": 1453} {"train_loss": -42.2086067199707, "global_step": 175890, "epoch": 1453} {"train_loss": -39.81826400756836, "global_step": 175891, "epoch": 1453} {"train_loss": -41.06205368041992, "global_step": 175892, "epoch": 1453} {"train_loss": -40.48612594604492, "global_step": 175893, "epoch": 1453} {"train_loss": -40.37322998046875, "global_step": 175894, "epoch": 1453} {"train_loss": -39.452239990234375, "global_step": 175895, "epoch": 1453} {"train_loss": -41.79572296142578, "global_step": 175896, "epoch": 1453} {"train_loss": -39.36870193481445, "global_step": 175897, "epoch": 1453} {"train_loss": -40.77008819580078, "global_step": 175898, "epoch": 1453} {"train_loss": -40.275447845458984, "global_step": 175899, "epoch": 1453} {"train_loss": -40.88155746459961, "global_step": 175900, "epoch": 1453} {"train_loss": -40.716121673583984, "global_step": 175901, "epoch": 1453} {"train_loss": -40.89606475830078, "global_step": 175902, "epoch": 1453} {"train_loss": -40.68019485473633, "global_step": 175903, "epoch": 1453} {"train_loss": -40.46064376831055, "global_step": 175904, "epoch": 1453} {"train_loss": -40.97911834716797, "global_step": 175905, "epoch": 1453} {"train_loss": -40.768795013427734, "global_step": 175906, "epoch": 1453} {"train_loss": -40.32168197631836, "global_step": 175907, "epoch": 1453} {"train_loss": -41.60614013671875, "global_step": 175908, "epoch": 1453} {"train_loss": -40.25673294067383, "global_step": 175909, "epoch": 1453} {"train_loss": -41.25899887084961, "global_step": 175910, "epoch": 1453} {"train_loss": -40.96366500854492, "global_step": 175911, "epoch": 1453} {"train_loss": -40.521690368652344, "global_step": 175912, "epoch": 1453} {"train_loss": -41.85195541381836, "global_step": 175913, "epoch": 1453} {"train_loss": -40.85508346557617, "global_step": 175914, "epoch": 1453} {"train_loss": -41.23517990112305, "global_step": 175915, "epoch": 1453} {"train_loss": -41.41248321533203, "global_step": 175916, "epoch": 1453} {"train_loss": -41.922664642333984, "global_step": 175917, "epoch": 1453} {"train_loss": -42.063446044921875, "global_step": 175918, "epoch": 1453} {"train_loss": -41.30674743652344, "global_step": 175919, "epoch": 1453} {"train_loss": -40.16731643676758, "global_step": 175920, "epoch": 1453} {"train_loss": -41.58351516723633, "global_step": 175921, "epoch": 1453} {"train_loss": -40.93471908569336, "global_step": 175922, "epoch": 1453} {"train_loss": -41.9718017578125, "global_step": 175923, "epoch": 1453} {"train_loss": -41.10847091674805, "global_step": 175924, "epoch": 1453} {"train_loss": -41.225833892822266, "global_step": 175925, "epoch": 1453} {"train_loss": -42.2325439453125, "global_step": 175926, "epoch": 1453} {"train_loss": -41.24430847167969, "global_step": 175927, "epoch": 1453} {"train_loss": -41.938636779785156, "global_step": 175928, "epoch": 1453} {"train_loss": -41.65275955200195, "global_step": 175929, "epoch": 1453} {"train_loss": -41.059444427490234, "global_step": 175930, "epoch": 1453} {"train_loss": -42.13664627075195, "global_step": 175931, "epoch": 1453} {"train_loss": -42.34971237182617, "global_step": 175932, "epoch": 1453} {"train_loss": -41.16398551247337, "global_step": 175933, "epoch": 1453, "val_loss": 2690091.75} {"train_loss": -41.92082977294922, "global_step": 175934, "epoch": 1454} {"train_loss": -42.1048698425293, "global_step": 175935, "epoch": 1454} {"train_loss": -42.1136474609375, "global_step": 175936, "epoch": 1454} {"train_loss": -42.2781982421875, "global_step": 175937, "epoch": 1454} {"train_loss": -42.41848373413086, "global_step": 175938, "epoch": 1454} {"train_loss": -42.17249298095703, "global_step": 175939, "epoch": 1454} {"train_loss": -42.338836669921875, "global_step": 175940, "epoch": 1454} {"train_loss": -41.90401840209961, "global_step": 175941, "epoch": 1454} {"train_loss": -41.934906005859375, "global_step": 175942, "epoch": 1454} {"train_loss": -42.00971984863281, "global_step": 175943, "epoch": 1454} {"train_loss": -42.38312911987305, "global_step": 175944, "epoch": 1454} {"train_loss": -42.706825256347656, "global_step": 175945, "epoch": 1454} {"train_loss": -42.2832145690918, "global_step": 175946, "epoch": 1454} {"train_loss": -42.668006896972656, "global_step": 175947, "epoch": 1454} {"train_loss": -42.03413772583008, "global_step": 175948, "epoch": 1454} {"train_loss": -42.22834777832031, "global_step": 175949, "epoch": 1454} {"train_loss": -42.31987380981445, "global_step": 175950, "epoch": 1454} {"train_loss": -42.6333122253418, "global_step": 175951, "epoch": 1454} {"train_loss": -42.47706985473633, "global_step": 175952, "epoch": 1454} {"train_loss": -42.72924041748047, "global_step": 175953, "epoch": 1454} {"train_loss": -41.554134368896484, "global_step": 175954, "epoch": 1454} {"train_loss": -40.49687957763672, "global_step": 175955, "epoch": 1454} {"train_loss": -40.561073303222656, "global_step": 175956, "epoch": 1454} {"train_loss": -41.128501892089844, "global_step": 175957, "epoch": 1454} {"train_loss": -39.84202194213867, "global_step": 175958, "epoch": 1454} {"train_loss": -38.928585052490234, "global_step": 175959, "epoch": 1454} {"train_loss": -41.249610900878906, "global_step": 175960, "epoch": 1454} {"train_loss": -42.4641227722168, "global_step": 175961, "epoch": 1454} {"train_loss": -42.00284957885742, "global_step": 175962, "epoch": 1454} {"train_loss": -40.68793869018555, "global_step": 175963, "epoch": 1454} {"train_loss": -39.63245391845703, "global_step": 175964, "epoch": 1454} {"train_loss": -41.252716064453125, "global_step": 175965, "epoch": 1454} {"train_loss": -42.31972122192383, "global_step": 175966, "epoch": 1454} {"train_loss": -42.444210052490234, "global_step": 175967, "epoch": 1454} {"train_loss": -41.636775970458984, "global_step": 175968, "epoch": 1454} {"train_loss": -42.23592758178711, "global_step": 175969, "epoch": 1454} {"train_loss": -42.057796478271484, "global_step": 175970, "epoch": 1454} {"train_loss": -42.33087158203125, "global_step": 175971, "epoch": 1454} {"train_loss": -42.34867477416992, "global_step": 175972, "epoch": 1454} {"train_loss": -42.628509521484375, "global_step": 175973, "epoch": 1454} {"train_loss": -42.30251693725586, "global_step": 175974, "epoch": 1454} {"train_loss": -42.25718307495117, "global_step": 175975, "epoch": 1454} {"train_loss": -42.65217208862305, "global_step": 175976, "epoch": 1454} {"train_loss": -42.00088119506836, "global_step": 175977, "epoch": 1454} {"train_loss": -42.01467514038086, "global_step": 175978, "epoch": 1454} {"train_loss": -42.14937210083008, "global_step": 175979, "epoch": 1454} {"train_loss": -41.845497131347656, "global_step": 175980, "epoch": 1454} {"train_loss": -41.72450637817383, "global_step": 175981, "epoch": 1454} {"train_loss": -41.60459518432617, "global_step": 175982, "epoch": 1454} {"train_loss": -42.024871826171875, "global_step": 175983, "epoch": 1454} {"train_loss": -42.0467643737793, "global_step": 175984, "epoch": 1454} {"train_loss": -40.56455993652344, "global_step": 175985, "epoch": 1454} {"train_loss": -38.706241607666016, "global_step": 175986, "epoch": 1454} {"train_loss": -41.82593536376953, "global_step": 175987, "epoch": 1454} {"train_loss": -41.228538513183594, "global_step": 175988, "epoch": 1454} {"train_loss": -39.90166473388672, "global_step": 175989, "epoch": 1454} {"train_loss": -38.74375534057617, "global_step": 175990, "epoch": 1454} {"train_loss": -35.25106430053711, "global_step": 175991, "epoch": 1454} {"train_loss": -41.84153366088867, "global_step": 175992, "epoch": 1454} {"train_loss": -33.04753875732422, "global_step": 175993, "epoch": 1454} {"train_loss": -33.00217819213867, "global_step": 175994, "epoch": 1454} {"train_loss": -35.334259033203125, "global_step": 175995, "epoch": 1454} {"train_loss": -37.8084831237793, "global_step": 175996, "epoch": 1454} {"train_loss": -37.60908126831055, "global_step": 175997, "epoch": 1454} {"train_loss": -35.157981872558594, "global_step": 175998, "epoch": 1454} {"train_loss": -35.07050704956055, "global_step": 175999, "epoch": 1454} {"train_loss": -35.27566146850586, "global_step": 176000, "epoch": 1454} {"train_loss": -35.5366325378418, "global_step": 176001, "epoch": 1454} {"train_loss": -35.850074768066406, "global_step": 176002, "epoch": 1454} {"train_loss": -36.910762786865234, "global_step": 176003, "epoch": 1454} {"train_loss": -36.13806915283203, "global_step": 176004, "epoch": 1454} {"train_loss": -36.88408279418945, "global_step": 176005, "epoch": 1454} {"train_loss": -36.232967376708984, "global_step": 176006, "epoch": 1454} {"train_loss": -36.61069107055664, "global_step": 176007, "epoch": 1454} {"train_loss": -37.5689697265625, "global_step": 176008, "epoch": 1454} {"train_loss": -38.457820892333984, "global_step": 176009, "epoch": 1454} {"train_loss": -38.454524993896484, "global_step": 176010, "epoch": 1454} {"train_loss": -38.781856536865234, "global_step": 176011, "epoch": 1454} {"train_loss": -39.234859466552734, "global_step": 176012, "epoch": 1454} {"train_loss": -40.57527542114258, "global_step": 176013, "epoch": 1454} {"train_loss": -40.754913330078125, "global_step": 176014, "epoch": 1454} {"train_loss": -40.88755416870117, "global_step": 176015, "epoch": 1454} {"train_loss": -41.04648971557617, "global_step": 176016, "epoch": 1454} {"train_loss": -41.116783142089844, "global_step": 176017, "epoch": 1454} {"train_loss": -40.66070556640625, "global_step": 176018, "epoch": 1454} {"train_loss": -41.21087646484375, "global_step": 176019, "epoch": 1454} {"train_loss": -40.968502044677734, "global_step": 176020, "epoch": 1454} {"train_loss": -40.81171417236328, "global_step": 176021, "epoch": 1454} {"train_loss": -40.9522705078125, "global_step": 176022, "epoch": 1454} {"train_loss": -41.46659469604492, "global_step": 176023, "epoch": 1454} {"train_loss": -40.484432220458984, "global_step": 176024, "epoch": 1454} {"train_loss": -41.47932052612305, "global_step": 176025, "epoch": 1454} {"train_loss": -41.91643142700195, "global_step": 176026, "epoch": 1454} {"train_loss": -42.003501892089844, "global_step": 176027, "epoch": 1454} {"train_loss": -41.075469970703125, "global_step": 176028, "epoch": 1454} {"train_loss": -40.9417724609375, "global_step": 176029, "epoch": 1454} {"train_loss": -41.845436096191406, "global_step": 176030, "epoch": 1454} {"train_loss": -41.373023986816406, "global_step": 176031, "epoch": 1454} {"train_loss": -40.54051208496094, "global_step": 176032, "epoch": 1454} {"train_loss": -41.37910079956055, "global_step": 176033, "epoch": 1454} {"train_loss": -41.958251953125, "global_step": 176034, "epoch": 1454} {"train_loss": -41.72272872924805, "global_step": 176035, "epoch": 1454} {"train_loss": -41.939029693603516, "global_step": 176036, "epoch": 1454} {"train_loss": -41.1546630859375, "global_step": 176037, "epoch": 1454} {"train_loss": -41.48848342895508, "global_step": 176038, "epoch": 1454} {"train_loss": -42.54933547973633, "global_step": 176039, "epoch": 1454} {"train_loss": -42.20208740234375, "global_step": 176040, "epoch": 1454} {"train_loss": -41.78300857543945, "global_step": 176041, "epoch": 1454} {"train_loss": -42.14005661010742, "global_step": 176042, "epoch": 1454} {"train_loss": -42.23238754272461, "global_step": 176043, "epoch": 1454} {"train_loss": -42.53031921386719, "global_step": 176044, "epoch": 1454} {"train_loss": -42.423301696777344, "global_step": 176045, "epoch": 1454} {"train_loss": -42.02290725708008, "global_step": 176046, "epoch": 1454} {"train_loss": -41.28241729736328, "global_step": 176047, "epoch": 1454} {"train_loss": -41.7369270324707, "global_step": 176048, "epoch": 1454} {"train_loss": -42.59017562866211, "global_step": 176049, "epoch": 1454} {"train_loss": -41.78350830078125, "global_step": 176050, "epoch": 1454} {"train_loss": -40.42803955078125, "global_step": 176051, "epoch": 1454} {"train_loss": -40.84950637817383, "global_step": 176052, "epoch": 1454} {"train_loss": -39.94264221191406, "global_step": 176053, "epoch": 1454} {"train_loss": -40.66413879394531, "global_step": 176054, "epoch": 1454, "val_loss": 2623035.25} {"train_loss": -36.8347282409668, "global_step": 176055, "epoch": 1455} {"train_loss": -41.063533782958984, "global_step": 176056, "epoch": 1455} {"train_loss": -33.284725189208984, "global_step": 176057, "epoch": 1455} {"train_loss": -30.337512969970703, "global_step": 176058, "epoch": 1455} {"train_loss": -33.84183883666992, "global_step": 176059, "epoch": 1455} {"train_loss": -32.183349609375, "global_step": 176060, "epoch": 1455} {"train_loss": -34.72480010986328, "global_step": 176061, "epoch": 1455} {"train_loss": -32.386348724365234, "global_step": 176062, "epoch": 1455} {"train_loss": -35.353065490722656, "global_step": 176063, "epoch": 1455} {"train_loss": -33.401145935058594, "global_step": 176064, "epoch": 1455} {"train_loss": -34.4863166809082, "global_step": 176065, "epoch": 1455} {"train_loss": -34.998043060302734, "global_step": 176066, "epoch": 1455} {"train_loss": -34.79842758178711, "global_step": 176067, "epoch": 1455} {"train_loss": -36.15442657470703, "global_step": 176068, "epoch": 1455} {"train_loss": -33.85028076171875, "global_step": 176069, "epoch": 1455} {"train_loss": -36.189971923828125, "global_step": 176070, "epoch": 1455} {"train_loss": -34.02846145629883, "global_step": 176071, "epoch": 1455} {"train_loss": -34.34222412109375, "global_step": 176072, "epoch": 1455} {"train_loss": -35.86063766479492, "global_step": 176073, "epoch": 1455} {"train_loss": -34.77021408081055, "global_step": 176074, "epoch": 1455} {"train_loss": -34.480648040771484, "global_step": 176075, "epoch": 1455} {"train_loss": -36.85772705078125, "global_step": 176076, "epoch": 1455} {"train_loss": -35.65647888183594, "global_step": 176077, "epoch": 1455} {"train_loss": -35.73812484741211, "global_step": 176078, "epoch": 1455} {"train_loss": -35.951480865478516, "global_step": 176079, "epoch": 1455} {"train_loss": -36.236759185791016, "global_step": 176080, "epoch": 1455} {"train_loss": -36.57163619995117, "global_step": 176081, "epoch": 1455} {"train_loss": -37.022769927978516, "global_step": 176082, "epoch": 1455} {"train_loss": -36.93572235107422, "global_step": 176083, "epoch": 1455} {"train_loss": -36.851444244384766, "global_step": 176084, "epoch": 1455} {"train_loss": -36.960693359375, "global_step": 176085, "epoch": 1455} {"train_loss": -37.41145324707031, "global_step": 176086, "epoch": 1455} {"train_loss": -37.18484115600586, "global_step": 176087, "epoch": 1455} {"train_loss": -37.37146759033203, "global_step": 176088, "epoch": 1455} {"train_loss": -37.063350677490234, "global_step": 176089, "epoch": 1455} {"train_loss": -37.19448471069336, "global_step": 176090, "epoch": 1455} {"train_loss": -37.677284240722656, "global_step": 176091, "epoch": 1455} {"train_loss": -37.800933837890625, "global_step": 176092, "epoch": 1455} {"train_loss": -38.24544143676758, "global_step": 176093, "epoch": 1455} {"train_loss": -37.395233154296875, "global_step": 176094, "epoch": 1455} {"train_loss": -38.16476821899414, "global_step": 176095, "epoch": 1455} {"train_loss": -38.726871490478516, "global_step": 176096, "epoch": 1455} {"train_loss": -38.7856330871582, "global_step": 176097, "epoch": 1455} {"train_loss": -38.16786575317383, "global_step": 176098, "epoch": 1455} {"train_loss": -38.448516845703125, "global_step": 176099, "epoch": 1455} {"train_loss": -38.12846374511719, "global_step": 176100, "epoch": 1455} {"train_loss": -38.57892990112305, "global_step": 176101, "epoch": 1455} {"train_loss": -38.313232421875, "global_step": 176102, "epoch": 1455} {"train_loss": -38.45648193359375, "global_step": 176103, "epoch": 1455} {"train_loss": -38.40785598754883, "global_step": 176104, "epoch": 1455} {"train_loss": -38.81142044067383, "global_step": 176105, "epoch": 1455} {"train_loss": -38.55820846557617, "global_step": 176106, "epoch": 1455} {"train_loss": -37.455726623535156, "global_step": 176107, "epoch": 1455} {"train_loss": -36.45394515991211, "global_step": 176108, "epoch": 1455} {"train_loss": -35.47997283935547, "global_step": 176109, "epoch": 1455} {"train_loss": -33.6214714050293, "global_step": 176110, "epoch": 1455} {"train_loss": -30.819448471069336, "global_step": 176111, "epoch": 1455} {"train_loss": -36.06307601928711, "global_step": 176112, "epoch": 1455} {"train_loss": -33.77460861206055, "global_step": 176113, "epoch": 1455} {"train_loss": -37.707275390625, "global_step": 176114, "epoch": 1455} {"train_loss": -34.86738204956055, "global_step": 176115, "epoch": 1455} {"train_loss": -38.07198715209961, "global_step": 176116, "epoch": 1455} {"train_loss": -35.83476257324219, "global_step": 176117, "epoch": 1455} {"train_loss": -36.9957389831543, "global_step": 176118, "epoch": 1455} {"train_loss": -38.53860092163086, "global_step": 176119, "epoch": 1455} {"train_loss": -36.74392318725586, "global_step": 176120, "epoch": 1455} {"train_loss": -38.431365966796875, "global_step": 176121, "epoch": 1455} {"train_loss": -36.6042594909668, "global_step": 176122, "epoch": 1455} {"train_loss": -36.86029815673828, "global_step": 176123, "epoch": 1455} {"train_loss": -38.654170989990234, "global_step": 176124, "epoch": 1455} {"train_loss": -38.71174240112305, "global_step": 176125, "epoch": 1455} {"train_loss": -37.90676498413086, "global_step": 176126, "epoch": 1455} {"train_loss": -38.63129425048828, "global_step": 176127, "epoch": 1455} {"train_loss": -38.59957504272461, "global_step": 176128, "epoch": 1455} {"train_loss": -38.70762252807617, "global_step": 176129, "epoch": 1455} {"train_loss": -38.9013671875, "global_step": 176130, "epoch": 1455} {"train_loss": -38.41570281982422, "global_step": 176131, "epoch": 1455} {"train_loss": -38.61869430541992, "global_step": 176132, "epoch": 1455} {"train_loss": -39.07312774658203, "global_step": 176133, "epoch": 1455} {"train_loss": -39.10564041137695, "global_step": 176134, "epoch": 1455} {"train_loss": -38.2867546081543, "global_step": 176135, "epoch": 1455} {"train_loss": -38.74467086791992, "global_step": 176136, "epoch": 1455} {"train_loss": -38.82442855834961, "global_step": 176137, "epoch": 1455} {"train_loss": -37.66474533081055, "global_step": 176138, "epoch": 1455} {"train_loss": -36.6649055480957, "global_step": 176139, "epoch": 1455} {"train_loss": -35.830055236816406, "global_step": 176140, "epoch": 1455} {"train_loss": -39.28603744506836, "global_step": 176141, "epoch": 1455} {"train_loss": -37.40208053588867, "global_step": 176142, "epoch": 1455} {"train_loss": -37.744140625, "global_step": 176143, "epoch": 1455} {"train_loss": -39.301570892333984, "global_step": 176144, "epoch": 1455} {"train_loss": -37.82033157348633, "global_step": 176145, "epoch": 1455} {"train_loss": -39.41579055786133, "global_step": 176146, "epoch": 1455} {"train_loss": -37.70002365112305, "global_step": 176147, "epoch": 1455} {"train_loss": -38.56977462768555, "global_step": 176148, "epoch": 1455} {"train_loss": -38.525386810302734, "global_step": 176149, "epoch": 1455} {"train_loss": -39.12699508666992, "global_step": 176150, "epoch": 1455} {"train_loss": -39.770484924316406, "global_step": 176151, "epoch": 1455} {"train_loss": -38.530548095703125, "global_step": 176152, "epoch": 1455} {"train_loss": -39.4460563659668, "global_step": 176153, "epoch": 1455} {"train_loss": -38.12382507324219, "global_step": 176154, "epoch": 1455} {"train_loss": -37.93681335449219, "global_step": 176155, "epoch": 1455} {"train_loss": -35.72309875488281, "global_step": 176156, "epoch": 1455} {"train_loss": -38.335296630859375, "global_step": 176157, "epoch": 1455} {"train_loss": -38.56191635131836, "global_step": 176158, "epoch": 1455} {"train_loss": -36.91420364379883, "global_step": 176159, "epoch": 1455} {"train_loss": -38.49003219604492, "global_step": 176160, "epoch": 1455} {"train_loss": -37.30548095703125, "global_step": 176161, "epoch": 1455} {"train_loss": -35.767147064208984, "global_step": 176162, "epoch": 1455} {"train_loss": -33.055904388427734, "global_step": 176163, "epoch": 1455} {"train_loss": -32.13682174682617, "global_step": 176164, "epoch": 1455} {"train_loss": -38.67213821411133, "global_step": 176165, "epoch": 1455} {"train_loss": -37.184486389160156, "global_step": 176166, "epoch": 1455} {"train_loss": -37.46834182739258, "global_step": 176167, "epoch": 1455} {"train_loss": -38.723609924316406, "global_step": 176168, "epoch": 1455} {"train_loss": -37.62955856323242, "global_step": 176169, "epoch": 1455} {"train_loss": -39.078529357910156, "global_step": 176170, "epoch": 1455} {"train_loss": -38.15031433105469, "global_step": 176171, "epoch": 1455} {"train_loss": -38.86841583251953, "global_step": 176172, "epoch": 1455} {"train_loss": -38.59161376953125, "global_step": 176173, "epoch": 1455} {"train_loss": -39.36714172363281, "global_step": 176174, "epoch": 1455} {"train_loss": -37.05960819149806, "global_step": 176175, "epoch": 1455, "val_loss": 2499632.75} {"train_loss": -39.06884002685547, "global_step": 176176, "epoch": 1456} {"train_loss": -39.028289794921875, "global_step": 176177, "epoch": 1456} {"train_loss": -39.7398681640625, "global_step": 176178, "epoch": 1456} {"train_loss": -39.16957473754883, "global_step": 176179, "epoch": 1456} {"train_loss": -39.45878982543945, "global_step": 176180, "epoch": 1456} {"train_loss": -39.64213180541992, "global_step": 176181, "epoch": 1456} {"train_loss": -38.967498779296875, "global_step": 176182, "epoch": 1456} {"train_loss": -40.1035270690918, "global_step": 176183, "epoch": 1456} {"train_loss": -39.30851745605469, "global_step": 176184, "epoch": 1456} {"train_loss": -39.93447494506836, "global_step": 176185, "epoch": 1456} {"train_loss": -37.84705352783203, "global_step": 176186, "epoch": 1456} {"train_loss": -40.02179718017578, "global_step": 176187, "epoch": 1456} {"train_loss": -39.18854904174805, "global_step": 176188, "epoch": 1456} {"train_loss": -39.4433479309082, "global_step": 176189, "epoch": 1456} {"train_loss": -38.55463409423828, "global_step": 176190, "epoch": 1456} {"train_loss": -38.593509674072266, "global_step": 176191, "epoch": 1456} {"train_loss": -39.12360763549805, "global_step": 176192, "epoch": 1456} {"train_loss": -39.596981048583984, "global_step": 176193, "epoch": 1456} {"train_loss": -39.10530090332031, "global_step": 176194, "epoch": 1456} {"train_loss": -38.89997482299805, "global_step": 176195, "epoch": 1456} {"train_loss": -39.816165924072266, "global_step": 176196, "epoch": 1456} {"train_loss": -40.30462646484375, "global_step": 176197, "epoch": 1456} {"train_loss": -38.251800537109375, "global_step": 176198, "epoch": 1456} {"train_loss": -39.38459396362305, "global_step": 176199, "epoch": 1456} {"train_loss": -39.717369079589844, "global_step": 176200, "epoch": 1456} {"train_loss": -40.23179244995117, "global_step": 176201, "epoch": 1456} {"train_loss": -40.08248519897461, "global_step": 176202, "epoch": 1456} {"train_loss": -40.285423278808594, "global_step": 176203, "epoch": 1456} {"train_loss": -40.632015228271484, "global_step": 176204, "epoch": 1456} {"train_loss": -40.347984313964844, "global_step": 176205, "epoch": 1456} {"train_loss": -40.48177719116211, "global_step": 176206, "epoch": 1456} {"train_loss": -40.624446868896484, "global_step": 176207, "epoch": 1456} {"train_loss": -40.823997497558594, "global_step": 176208, "epoch": 1456} {"train_loss": -40.42707443237305, "global_step": 176209, "epoch": 1456} {"train_loss": -40.615455627441406, "global_step": 176210, "epoch": 1456} {"train_loss": -40.23960494995117, "global_step": 176211, "epoch": 1456} {"train_loss": -39.60871124267578, "global_step": 176212, "epoch": 1456} {"train_loss": -39.917137145996094, "global_step": 176213, "epoch": 1456} {"train_loss": -40.52467346191406, "global_step": 176214, "epoch": 1456} {"train_loss": -40.50612258911133, "global_step": 176215, "epoch": 1456} {"train_loss": -40.451908111572266, "global_step": 176216, "epoch": 1456} {"train_loss": -40.22257995605469, "global_step": 176217, "epoch": 1456} {"train_loss": -37.50313949584961, "global_step": 176218, "epoch": 1456} {"train_loss": -36.87588119506836, "global_step": 176219, "epoch": 1456} {"train_loss": -39.747406005859375, "global_step": 176220, "epoch": 1456} {"train_loss": -39.20952224731445, "global_step": 176221, "epoch": 1456} {"train_loss": -37.628639221191406, "global_step": 176222, "epoch": 1456} {"train_loss": -40.219154357910156, "global_step": 176223, "epoch": 1456} {"train_loss": -36.9531135559082, "global_step": 176224, "epoch": 1456} {"train_loss": -39.79908752441406, "global_step": 176225, "epoch": 1456} {"train_loss": -39.09841537475586, "global_step": 176226, "epoch": 1456} {"train_loss": -38.97254180908203, "global_step": 176227, "epoch": 1456} {"train_loss": -39.76701736450195, "global_step": 176228, "epoch": 1456} {"train_loss": -40.0696907043457, "global_step": 176229, "epoch": 1456} {"train_loss": -39.80209732055664, "global_step": 176230, "epoch": 1456} {"train_loss": -39.80097579956055, "global_step": 176231, "epoch": 1456} {"train_loss": -40.324031829833984, "global_step": 176232, "epoch": 1456} {"train_loss": -40.532196044921875, "global_step": 176233, "epoch": 1456} {"train_loss": -40.32307052612305, "global_step": 176234, "epoch": 1456} {"train_loss": -41.01433563232422, "global_step": 176235, "epoch": 1456} {"train_loss": -40.0247688293457, "global_step": 176236, "epoch": 1456} {"train_loss": -39.492759704589844, "global_step": 176237, "epoch": 1456} {"train_loss": -39.70783615112305, "global_step": 176238, "epoch": 1456} {"train_loss": -40.634552001953125, "global_step": 176239, "epoch": 1456} {"train_loss": -40.46213150024414, "global_step": 176240, "epoch": 1456} {"train_loss": -40.64093017578125, "global_step": 176241, "epoch": 1456} {"train_loss": -40.711517333984375, "global_step": 176242, "epoch": 1456} {"train_loss": -40.23524856567383, "global_step": 176243, "epoch": 1456} {"train_loss": -39.359474182128906, "global_step": 176244, "epoch": 1456} {"train_loss": -40.65729522705078, "global_step": 176245, "epoch": 1456} {"train_loss": -40.38518524169922, "global_step": 176246, "epoch": 1456} {"train_loss": -38.044593811035156, "global_step": 176247, "epoch": 1456} {"train_loss": -40.322242736816406, "global_step": 176248, "epoch": 1456} {"train_loss": -40.50504684448242, "global_step": 176249, "epoch": 1456} {"train_loss": -39.79899978637695, "global_step": 176250, "epoch": 1456} {"train_loss": -38.72133255004883, "global_step": 176251, "epoch": 1456} {"train_loss": -38.4296760559082, "global_step": 176252, "epoch": 1456} {"train_loss": -38.44230270385742, "global_step": 176253, "epoch": 1456} {"train_loss": -40.5877571105957, "global_step": 176254, "epoch": 1456} {"train_loss": -40.23046112060547, "global_step": 176255, "epoch": 1456} {"train_loss": -39.16089630126953, "global_step": 176256, "epoch": 1456} {"train_loss": -40.32882308959961, "global_step": 176257, "epoch": 1456} {"train_loss": -40.8931999206543, "global_step": 176258, "epoch": 1456} {"train_loss": -38.08475875854492, "global_step": 176259, "epoch": 1456} {"train_loss": -39.91280746459961, "global_step": 176260, "epoch": 1456} {"train_loss": -41.17753219604492, "global_step": 176261, "epoch": 1456} {"train_loss": -39.04488754272461, "global_step": 176262, "epoch": 1456} {"train_loss": -39.561824798583984, "global_step": 176263, "epoch": 1456} {"train_loss": -40.53005599975586, "global_step": 176264, "epoch": 1456} {"train_loss": -40.24705505371094, "global_step": 176265, "epoch": 1456} {"train_loss": -40.50739669799805, "global_step": 176266, "epoch": 1456} {"train_loss": -39.06647872924805, "global_step": 176267, "epoch": 1456} {"train_loss": -39.30059814453125, "global_step": 176268, "epoch": 1456} {"train_loss": -40.1309928894043, "global_step": 176269, "epoch": 1456} {"train_loss": -40.53768539428711, "global_step": 176270, "epoch": 1456} {"train_loss": -38.56504440307617, "global_step": 176271, "epoch": 1456} {"train_loss": -39.45947265625, "global_step": 176272, "epoch": 1456} {"train_loss": -38.97855758666992, "global_step": 176273, "epoch": 1456} {"train_loss": -39.103187561035156, "global_step": 176274, "epoch": 1456} {"train_loss": -37.34775924682617, "global_step": 176275, "epoch": 1456} {"train_loss": -40.07036209106445, "global_step": 176276, "epoch": 1456} {"train_loss": -40.10834884643555, "global_step": 176277, "epoch": 1456} {"train_loss": -39.61381912231445, "global_step": 176278, "epoch": 1456} {"train_loss": -27.192020416259766, "global_step": 176279, "epoch": 1456} {"train_loss": -36.81285095214844, "global_step": 176280, "epoch": 1456} {"train_loss": -37.34735870361328, "global_step": 176281, "epoch": 1456} {"train_loss": -37.693416595458984, "global_step": 176282, "epoch": 1456} {"train_loss": -37.91455078125, "global_step": 176283, "epoch": 1456} {"train_loss": -25.33070945739746, "global_step": 176284, "epoch": 1456} {"train_loss": -32.70429229736328, "global_step": 176285, "epoch": 1456} {"train_loss": -32.591163635253906, "global_step": 176286, "epoch": 1456} {"train_loss": -36.43461227416992, "global_step": 176287, "epoch": 1456} {"train_loss": -21.989307403564453, "global_step": 176288, "epoch": 1456} {"train_loss": -32.213958740234375, "global_step": 176289, "epoch": 1456} {"train_loss": -31.681385040283203, "global_step": 176290, "epoch": 1456} {"train_loss": -18.306488037109375, "global_step": 176291, "epoch": 1456} {"train_loss": -30.233591079711914, "global_step": 176292, "epoch": 1456} {"train_loss": -22.856950759887695, "global_step": 176293, "epoch": 1456} {"train_loss": -29.87013053894043, "global_step": 176294, "epoch": 1456} {"train_loss": -27.2519588470459, "global_step": 176295, "epoch": 1456} {"train_loss": -38.30603623193158, "global_step": 176296, "epoch": 1456, "val_loss": 2816621.0} {"train_loss": -25.783432006835938, "global_step": 176297, "epoch": 1457} {"train_loss": -29.650537490844727, "global_step": 176298, "epoch": 1457} {"train_loss": -24.31034278869629, "global_step": 176299, "epoch": 1457} {"train_loss": -31.504323959350586, "global_step": 176300, "epoch": 1457} {"train_loss": -29.86231803894043, "global_step": 176301, "epoch": 1457} {"train_loss": -25.891050338745117, "global_step": 176302, "epoch": 1457} {"train_loss": -34.281341552734375, "global_step": 176303, "epoch": 1457} {"train_loss": -33.353004455566406, "global_step": 176304, "epoch": 1457} {"train_loss": -30.110370635986328, "global_step": 176305, "epoch": 1457} {"train_loss": -31.695148468017578, "global_step": 176306, "epoch": 1457} {"train_loss": -31.812427520751953, "global_step": 176307, "epoch": 1457} {"train_loss": -36.38041305541992, "global_step": 176308, "epoch": 1457} {"train_loss": -30.83271598815918, "global_step": 176309, "epoch": 1457} {"train_loss": -35.74271774291992, "global_step": 176310, "epoch": 1457} {"train_loss": -34.899261474609375, "global_step": 176311, "epoch": 1457} {"train_loss": -35.60205078125, "global_step": 176312, "epoch": 1457} {"train_loss": -34.461181640625, "global_step": 176313, "epoch": 1457} {"train_loss": -35.38599395751953, "global_step": 176314, "epoch": 1457} {"train_loss": -29.560306549072266, "global_step": 176315, "epoch": 1457} {"train_loss": -36.510047912597656, "global_step": 176316, "epoch": 1457} {"train_loss": -34.806243896484375, "global_step": 176317, "epoch": 1457} {"train_loss": -35.806827545166016, "global_step": 176318, "epoch": 1457} {"train_loss": -34.173988342285156, "global_step": 176319, "epoch": 1457} {"train_loss": -35.4729118347168, "global_step": 176320, "epoch": 1457} {"train_loss": -35.83277130126953, "global_step": 176321, "epoch": 1457} {"train_loss": -34.91038513183594, "global_step": 176322, "epoch": 1457} {"train_loss": -35.21857452392578, "global_step": 176323, "epoch": 1457} {"train_loss": -36.24689483642578, "global_step": 176324, "epoch": 1457} {"train_loss": -36.02394485473633, "global_step": 176325, "epoch": 1457} {"train_loss": -36.472835540771484, "global_step": 176326, "epoch": 1457} {"train_loss": -34.99342727661133, "global_step": 176327, "epoch": 1457} {"train_loss": -36.677154541015625, "global_step": 176328, "epoch": 1457} {"train_loss": -35.8018684387207, "global_step": 176329, "epoch": 1457} {"train_loss": -35.71382522583008, "global_step": 176330, "epoch": 1457} {"train_loss": -36.74753952026367, "global_step": 176331, "epoch": 1457} {"train_loss": -36.09475326538086, "global_step": 176332, "epoch": 1457} {"train_loss": -36.51205825805664, "global_step": 176333, "epoch": 1457} {"train_loss": -35.85133743286133, "global_step": 176334, "epoch": 1457} {"train_loss": -36.745323181152344, "global_step": 176335, "epoch": 1457} {"train_loss": -35.583065032958984, "global_step": 176336, "epoch": 1457} {"train_loss": -37.079898834228516, "global_step": 176337, "epoch": 1457} {"train_loss": -37.126983642578125, "global_step": 176338, "epoch": 1457} {"train_loss": -37.293434143066406, "global_step": 176339, "epoch": 1457} {"train_loss": -36.62229537963867, "global_step": 176340, "epoch": 1457} {"train_loss": -37.168392181396484, "global_step": 176341, "epoch": 1457} {"train_loss": -36.42791748046875, "global_step": 176342, "epoch": 1457} {"train_loss": -37.05497360229492, "global_step": 176343, "epoch": 1457} {"train_loss": -37.25321578979492, "global_step": 176344, "epoch": 1457} {"train_loss": -36.758399963378906, "global_step": 176345, "epoch": 1457} {"train_loss": -37.551021575927734, "global_step": 176346, "epoch": 1457} {"train_loss": -37.1944694519043, "global_step": 176347, "epoch": 1457} {"train_loss": -36.5504150390625, "global_step": 176348, "epoch": 1457} {"train_loss": -37.101715087890625, "global_step": 176349, "epoch": 1457} {"train_loss": -37.382972717285156, "global_step": 176350, "epoch": 1457} {"train_loss": -37.71240997314453, "global_step": 176351, "epoch": 1457} {"train_loss": -37.637657165527344, "global_step": 176352, "epoch": 1457} {"train_loss": -37.34675216674805, "global_step": 176353, "epoch": 1457} {"train_loss": -37.35449981689453, "global_step": 176354, "epoch": 1457} {"train_loss": -37.85587692260742, "global_step": 176355, "epoch": 1457} {"train_loss": -37.510738372802734, "global_step": 176356, "epoch": 1457} {"train_loss": -37.70856857299805, "global_step": 176357, "epoch": 1457} {"train_loss": -38.0744743347168, "global_step": 176358, "epoch": 1457} {"train_loss": -36.716590881347656, "global_step": 176359, "epoch": 1457} {"train_loss": -37.525291442871094, "global_step": 176360, "epoch": 1457} {"train_loss": -37.40333938598633, "global_step": 176361, "epoch": 1457} {"train_loss": -37.510536193847656, "global_step": 176362, "epoch": 1457} {"train_loss": -38.12512969970703, "global_step": 176363, "epoch": 1457} {"train_loss": -37.50384521484375, "global_step": 176364, "epoch": 1457} {"train_loss": -37.58963394165039, "global_step": 176365, "epoch": 1457} {"train_loss": -37.97129440307617, "global_step": 176366, "epoch": 1457} {"train_loss": -38.1163215637207, "global_step": 176367, "epoch": 1457} {"train_loss": -37.25843811035156, "global_step": 176368, "epoch": 1457} {"train_loss": -38.547977447509766, "global_step": 176369, "epoch": 1457} {"train_loss": -38.1528434753418, "global_step": 176370, "epoch": 1457} {"train_loss": -38.32294845581055, "global_step": 176371, "epoch": 1457} {"train_loss": -37.851314544677734, "global_step": 176372, "epoch": 1457} {"train_loss": -38.74272918701172, "global_step": 176373, "epoch": 1457} {"train_loss": -38.36599349975586, "global_step": 176374, "epoch": 1457} {"train_loss": -38.30477523803711, "global_step": 176375, "epoch": 1457} {"train_loss": -38.16018295288086, "global_step": 176376, "epoch": 1457} {"train_loss": -38.758174896240234, "global_step": 176377, "epoch": 1457} {"train_loss": -38.67893600463867, "global_step": 176378, "epoch": 1457} {"train_loss": -38.05690383911133, "global_step": 176379, "epoch": 1457} {"train_loss": -37.533992767333984, "global_step": 176380, "epoch": 1457} {"train_loss": -39.28093338012695, "global_step": 176381, "epoch": 1457} {"train_loss": -38.132301330566406, "global_step": 176382, "epoch": 1457} {"train_loss": -38.31502914428711, "global_step": 176383, "epoch": 1457} {"train_loss": -38.053810119628906, "global_step": 176384, "epoch": 1457} {"train_loss": -38.28900909423828, "global_step": 176385, "epoch": 1457} {"train_loss": -38.85465621948242, "global_step": 176386, "epoch": 1457} {"train_loss": -39.204532623291016, "global_step": 176387, "epoch": 1457} {"train_loss": -38.012142181396484, "global_step": 176388, "epoch": 1457} {"train_loss": -38.95193099975586, "global_step": 176389, "epoch": 1457} {"train_loss": -38.73651123046875, "global_step": 176390, "epoch": 1457} {"train_loss": -39.55303955078125, "global_step": 176391, "epoch": 1457} {"train_loss": -38.531497955322266, "global_step": 176392, "epoch": 1457} {"train_loss": -38.54136276245117, "global_step": 176393, "epoch": 1457} {"train_loss": -38.83130645751953, "global_step": 176394, "epoch": 1457} {"train_loss": -38.761070251464844, "global_step": 176395, "epoch": 1457} {"train_loss": -38.76983642578125, "global_step": 176396, "epoch": 1457} {"train_loss": -39.036067962646484, "global_step": 176397, "epoch": 1457} {"train_loss": -38.62439727783203, "global_step": 176398, "epoch": 1457} {"train_loss": -39.81631088256836, "global_step": 176399, "epoch": 1457} {"train_loss": -38.9039421081543, "global_step": 176400, "epoch": 1457} {"train_loss": -39.44491958618164, "global_step": 176401, "epoch": 1457} {"train_loss": -37.694725036621094, "global_step": 176402, "epoch": 1457} {"train_loss": -34.90180587768555, "global_step": 176403, "epoch": 1457} {"train_loss": -30.241424560546875, "global_step": 176404, "epoch": 1457} {"train_loss": -22.125974655151367, "global_step": 176405, "epoch": 1457} {"train_loss": -24.3239803314209, "global_step": 176406, "epoch": 1457} {"train_loss": -39.358577728271484, "global_step": 176407, "epoch": 1457} {"train_loss": -26.581003189086914, "global_step": 176408, "epoch": 1457} {"train_loss": -35.63465118408203, "global_step": 176409, "epoch": 1457} {"train_loss": -32.49521255493164, "global_step": 176410, "epoch": 1457} {"train_loss": -35.313209533691406, "global_step": 176411, "epoch": 1457} {"train_loss": -34.5540657043457, "global_step": 176412, "epoch": 1457} {"train_loss": -37.42686080932617, "global_step": 176413, "epoch": 1457} {"train_loss": -34.548439025878906, "global_step": 176414, "epoch": 1457} {"train_loss": -37.57783889770508, "global_step": 176415, "epoch": 1457} {"train_loss": -35.61475372314453, "global_step": 176416, "epoch": 1457} {"train_loss": -36.02505728035919, "global_step": 176417, "epoch": 1457, "val_loss": 2671627.5} {"train_loss": -38.12314987182617, "global_step": 176418, "epoch": 1458} {"train_loss": -37.593421936035156, "global_step": 176419, "epoch": 1458} {"train_loss": -38.18349075317383, "global_step": 176420, "epoch": 1458} {"train_loss": -37.165618896484375, "global_step": 176421, "epoch": 1458} {"train_loss": -38.2468147277832, "global_step": 176422, "epoch": 1458} {"train_loss": -38.31720733642578, "global_step": 176423, "epoch": 1458} {"train_loss": -38.12961196899414, "global_step": 176424, "epoch": 1458} {"train_loss": -38.70492935180664, "global_step": 176425, "epoch": 1458} {"train_loss": -38.364471435546875, "global_step": 176426, "epoch": 1458} {"train_loss": -38.59214401245117, "global_step": 176427, "epoch": 1458} {"train_loss": -38.40066146850586, "global_step": 176428, "epoch": 1458} {"train_loss": -38.75458526611328, "global_step": 176429, "epoch": 1458} {"train_loss": -38.51436233520508, "global_step": 176430, "epoch": 1458} {"train_loss": -38.31058883666992, "global_step": 176431, "epoch": 1458} {"train_loss": -38.42597579956055, "global_step": 176432, "epoch": 1458} {"train_loss": -38.63972854614258, "global_step": 176433, "epoch": 1458} {"train_loss": -38.755462646484375, "global_step": 176434, "epoch": 1458} {"train_loss": -39.02898025512695, "global_step": 176435, "epoch": 1458} {"train_loss": -38.67487716674805, "global_step": 176436, "epoch": 1458} {"train_loss": -38.94654083251953, "global_step": 176437, "epoch": 1458} {"train_loss": -38.78582000732422, "global_step": 176438, "epoch": 1458} {"train_loss": -38.90036392211914, "global_step": 176439, "epoch": 1458} {"train_loss": -39.1472053527832, "global_step": 176440, "epoch": 1458} {"train_loss": -39.1749153137207, "global_step": 176441, "epoch": 1458} {"train_loss": -39.30998611450195, "global_step": 176442, "epoch": 1458} {"train_loss": -39.42788314819336, "global_step": 176443, "epoch": 1458} {"train_loss": -39.0366325378418, "global_step": 176444, "epoch": 1458} {"train_loss": -38.840187072753906, "global_step": 176445, "epoch": 1458} {"train_loss": -39.15406036376953, "global_step": 176446, "epoch": 1458} {"train_loss": -39.31528854370117, "global_step": 176447, "epoch": 1458} {"train_loss": -39.0172233581543, "global_step": 176448, "epoch": 1458} {"train_loss": -39.106666564941406, "global_step": 176449, "epoch": 1458} {"train_loss": -39.13753890991211, "global_step": 176450, "epoch": 1458} {"train_loss": -39.09428405761719, "global_step": 176451, "epoch": 1458} {"train_loss": -39.44221496582031, "global_step": 176452, "epoch": 1458} {"train_loss": -39.0886116027832, "global_step": 176453, "epoch": 1458} {"train_loss": -39.20154571533203, "global_step": 176454, "epoch": 1458} {"train_loss": -39.0811767578125, "global_step": 176455, "epoch": 1458} {"train_loss": -39.435359954833984, "global_step": 176456, "epoch": 1458} {"train_loss": -40.0920295715332, "global_step": 176457, "epoch": 1458} {"train_loss": -39.25617599487305, "global_step": 176458, "epoch": 1458} {"train_loss": -39.54093551635742, "global_step": 176459, "epoch": 1458} {"train_loss": -40.167964935302734, "global_step": 176460, "epoch": 1458} {"train_loss": -39.7281608581543, "global_step": 176461, "epoch": 1458} {"train_loss": -40.460689544677734, "global_step": 176462, "epoch": 1458} {"train_loss": -39.89397048950195, "global_step": 176463, "epoch": 1458} {"train_loss": -39.49079513549805, "global_step": 176464, "epoch": 1458} {"train_loss": -39.88753890991211, "global_step": 176465, "epoch": 1458} {"train_loss": -39.40391159057617, "global_step": 176466, "epoch": 1458} {"train_loss": -39.373077392578125, "global_step": 176467, "epoch": 1458} {"train_loss": -40.4226188659668, "global_step": 176468, "epoch": 1458} {"train_loss": -39.89057540893555, "global_step": 176469, "epoch": 1458} {"train_loss": -40.040958404541016, "global_step": 176470, "epoch": 1458} {"train_loss": -39.46661376953125, "global_step": 176471, "epoch": 1458} {"train_loss": -39.65005874633789, "global_step": 176472, "epoch": 1458} {"train_loss": -39.66460037231445, "global_step": 176473, "epoch": 1458} {"train_loss": -39.246612548828125, "global_step": 176474, "epoch": 1458} {"train_loss": -39.71751022338867, "global_step": 176475, "epoch": 1458} {"train_loss": -39.0796012878418, "global_step": 176476, "epoch": 1458} {"train_loss": -39.24524688720703, "global_step": 176477, "epoch": 1458} {"train_loss": -39.278011322021484, "global_step": 176478, "epoch": 1458} {"train_loss": -38.915340423583984, "global_step": 176479, "epoch": 1458} {"train_loss": -38.83037567138672, "global_step": 176480, "epoch": 1458} {"train_loss": -39.69607162475586, "global_step": 176481, "epoch": 1458} {"train_loss": -40.20536422729492, "global_step": 176482, "epoch": 1458} {"train_loss": -39.78854751586914, "global_step": 176483, "epoch": 1458} {"train_loss": -38.60622787475586, "global_step": 176484, "epoch": 1458} {"train_loss": -38.62594223022461, "global_step": 176485, "epoch": 1458} {"train_loss": -39.16236114501953, "global_step": 176486, "epoch": 1458} {"train_loss": -38.64136505126953, "global_step": 176487, "epoch": 1458} {"train_loss": -39.6227912902832, "global_step": 176488, "epoch": 1458} {"train_loss": -39.877864837646484, "global_step": 176489, "epoch": 1458} {"train_loss": -40.85280227661133, "global_step": 176490, "epoch": 1458} {"train_loss": -39.16270065307617, "global_step": 176491, "epoch": 1458} {"train_loss": -38.21281051635742, "global_step": 176492, "epoch": 1458} {"train_loss": -39.91582107543945, "global_step": 176493, "epoch": 1458} {"train_loss": -39.28963851928711, "global_step": 176494, "epoch": 1458} {"train_loss": -38.329280853271484, "global_step": 176495, "epoch": 1458} {"train_loss": -37.401458740234375, "global_step": 176496, "epoch": 1458} {"train_loss": -40.09351348876953, "global_step": 176497, "epoch": 1458} {"train_loss": -38.69855880737305, "global_step": 176498, "epoch": 1458} {"train_loss": -37.26253128051758, "global_step": 176499, "epoch": 1458} {"train_loss": -38.49690628051758, "global_step": 176500, "epoch": 1458} {"train_loss": -38.610816955566406, "global_step": 176501, "epoch": 1458} {"train_loss": -37.51041793823242, "global_step": 176502, "epoch": 1458} {"train_loss": -39.01545333862305, "global_step": 176503, "epoch": 1458} {"train_loss": -39.364925384521484, "global_step": 176504, "epoch": 1458} {"train_loss": -38.822349548339844, "global_step": 176505, "epoch": 1458} {"train_loss": -39.70018768310547, "global_step": 176506, "epoch": 1458} {"train_loss": -38.84442901611328, "global_step": 176507, "epoch": 1458} {"train_loss": -39.69827651977539, "global_step": 176508, "epoch": 1458} {"train_loss": -37.96702194213867, "global_step": 176509, "epoch": 1458} {"train_loss": -38.96776580810547, "global_step": 176510, "epoch": 1458} {"train_loss": -39.10601806640625, "global_step": 176511, "epoch": 1458} {"train_loss": -39.709808349609375, "global_step": 176512, "epoch": 1458} {"train_loss": -39.368892669677734, "global_step": 176513, "epoch": 1458} {"train_loss": -39.01642990112305, "global_step": 176514, "epoch": 1458} {"train_loss": -39.72591781616211, "global_step": 176515, "epoch": 1458} {"train_loss": -39.00050354003906, "global_step": 176516, "epoch": 1458} {"train_loss": -39.978797912597656, "global_step": 176517, "epoch": 1458} {"train_loss": -39.155269622802734, "global_step": 176518, "epoch": 1458} {"train_loss": -40.37522506713867, "global_step": 176519, "epoch": 1458} {"train_loss": -38.61579513549805, "global_step": 176520, "epoch": 1458} {"train_loss": -38.59804153442383, "global_step": 176521, "epoch": 1458} {"train_loss": -38.50411605834961, "global_step": 176522, "epoch": 1458} {"train_loss": -38.87770462036133, "global_step": 176523, "epoch": 1458} {"train_loss": -39.5063591003418, "global_step": 176524, "epoch": 1458} {"train_loss": -39.31960678100586, "global_step": 176525, "epoch": 1458} {"train_loss": -38.98429870605469, "global_step": 176526, "epoch": 1458} {"train_loss": -40.239315032958984, "global_step": 176527, "epoch": 1458} {"train_loss": -40.07816696166992, "global_step": 176528, "epoch": 1458} {"train_loss": -38.93600082397461, "global_step": 176529, "epoch": 1458} {"train_loss": -40.227333068847656, "global_step": 176530, "epoch": 1458} {"train_loss": -40.563575744628906, "global_step": 176531, "epoch": 1458} {"train_loss": -40.437347412109375, "global_step": 176532, "epoch": 1458} {"train_loss": -40.5281867980957, "global_step": 176533, "epoch": 1458} {"train_loss": -40.25350570678711, "global_step": 176534, "epoch": 1458} {"train_loss": -40.24697494506836, "global_step": 176535, "epoch": 1458} {"train_loss": -40.418338775634766, "global_step": 176536, "epoch": 1458} {"train_loss": -40.638484954833984, "global_step": 176537, "epoch": 1458} {"train_loss": -39.19615507519935, "global_step": 176538, "epoch": 1458, "val_loss": 2539844.25} {"train_loss": -40.71714401245117, "global_step": 176539, "epoch": 1459} {"train_loss": -38.06639862060547, "global_step": 176540, "epoch": 1459} {"train_loss": -40.810768127441406, "global_step": 176541, "epoch": 1459} {"train_loss": -40.672786712646484, "global_step": 176542, "epoch": 1459} {"train_loss": -40.23112106323242, "global_step": 176543, "epoch": 1459} {"train_loss": -39.077571868896484, "global_step": 176544, "epoch": 1459} {"train_loss": -39.645931243896484, "global_step": 176545, "epoch": 1459} {"train_loss": -38.89450454711914, "global_step": 176546, "epoch": 1459} {"train_loss": -39.994781494140625, "global_step": 176547, "epoch": 1459} {"train_loss": -41.07823944091797, "global_step": 176548, "epoch": 1459} {"train_loss": -40.30424118041992, "global_step": 176549, "epoch": 1459} {"train_loss": -41.155250549316406, "global_step": 176550, "epoch": 1459} {"train_loss": -40.09423065185547, "global_step": 176551, "epoch": 1459} {"train_loss": -41.055118560791016, "global_step": 176552, "epoch": 1459} {"train_loss": -40.507110595703125, "global_step": 176553, "epoch": 1459} {"train_loss": -40.9108772277832, "global_step": 176554, "epoch": 1459} {"train_loss": -39.34628677368164, "global_step": 176555, "epoch": 1459} {"train_loss": -40.22190475463867, "global_step": 176556, "epoch": 1459} {"train_loss": -38.483943939208984, "global_step": 176557, "epoch": 1459} {"train_loss": -40.32001876831055, "global_step": 176558, "epoch": 1459} {"train_loss": -40.45357894897461, "global_step": 176559, "epoch": 1459} {"train_loss": -40.32485580444336, "global_step": 176560, "epoch": 1459} {"train_loss": -40.58040237426758, "global_step": 176561, "epoch": 1459} {"train_loss": -40.61399459838867, "global_step": 176562, "epoch": 1459} {"train_loss": -41.20820236206055, "global_step": 176563, "epoch": 1459} {"train_loss": -40.96505355834961, "global_step": 176564, "epoch": 1459} {"train_loss": -41.10950469970703, "global_step": 176565, "epoch": 1459} {"train_loss": -40.0670280456543, "global_step": 176566, "epoch": 1459} {"train_loss": -40.1683349609375, "global_step": 176567, "epoch": 1459} {"train_loss": -40.81075668334961, "global_step": 176568, "epoch": 1459} {"train_loss": -39.791744232177734, "global_step": 176569, "epoch": 1459} {"train_loss": -40.42155075073242, "global_step": 176570, "epoch": 1459} {"train_loss": -40.40353012084961, "global_step": 176571, "epoch": 1459} {"train_loss": -40.497745513916016, "global_step": 176572, "epoch": 1459} {"train_loss": -40.98798751831055, "global_step": 176573, "epoch": 1459} {"train_loss": -40.473995208740234, "global_step": 176574, "epoch": 1459} {"train_loss": -41.10918426513672, "global_step": 176575, "epoch": 1459} {"train_loss": -38.905921936035156, "global_step": 176576, "epoch": 1459} {"train_loss": -40.02510452270508, "global_step": 176577, "epoch": 1459} {"train_loss": -38.523590087890625, "global_step": 176578, "epoch": 1459} {"train_loss": -39.00910186767578, "global_step": 176579, "epoch": 1459} {"train_loss": -35.737667083740234, "global_step": 176580, "epoch": 1459} {"train_loss": -35.30068588256836, "global_step": 176581, "epoch": 1459} {"train_loss": -36.83286666870117, "global_step": 176582, "epoch": 1459} {"train_loss": -38.95855712890625, "global_step": 176583, "epoch": 1459} {"train_loss": -39.47529602050781, "global_step": 176584, "epoch": 1459} {"train_loss": -38.29314041137695, "global_step": 176585, "epoch": 1459} {"train_loss": -37.2265739440918, "global_step": 176586, "epoch": 1459} {"train_loss": -36.392242431640625, "global_step": 176587, "epoch": 1459} {"train_loss": -39.7694206237793, "global_step": 176588, "epoch": 1459} {"train_loss": -39.25228500366211, "global_step": 176589, "epoch": 1459} {"train_loss": -38.27048873901367, "global_step": 176590, "epoch": 1459} {"train_loss": -39.62472915649414, "global_step": 176591, "epoch": 1459} {"train_loss": -39.95780563354492, "global_step": 176592, "epoch": 1459} {"train_loss": -33.482479095458984, "global_step": 176593, "epoch": 1459} {"train_loss": -33.627044677734375, "global_step": 176594, "epoch": 1459} {"train_loss": -36.579345703125, "global_step": 176595, "epoch": 1459} {"train_loss": -37.92284393310547, "global_step": 176596, "epoch": 1459} {"train_loss": -37.79642868041992, "global_step": 176597, "epoch": 1459} {"train_loss": -37.41111755371094, "global_step": 176598, "epoch": 1459} {"train_loss": -38.22895431518555, "global_step": 176599, "epoch": 1459} {"train_loss": -37.31167984008789, "global_step": 176600, "epoch": 1459} {"train_loss": -37.2530403137207, "global_step": 176601, "epoch": 1459} {"train_loss": -39.06898880004883, "global_step": 176602, "epoch": 1459} {"train_loss": -38.58723449707031, "global_step": 176603, "epoch": 1459} {"train_loss": -38.7285041809082, "global_step": 176604, "epoch": 1459} {"train_loss": -38.7425537109375, "global_step": 176605, "epoch": 1459} {"train_loss": -39.07124328613281, "global_step": 176606, "epoch": 1459} {"train_loss": -39.137306213378906, "global_step": 176607, "epoch": 1459} {"train_loss": -38.512691497802734, "global_step": 176608, "epoch": 1459} {"train_loss": -38.90113830566406, "global_step": 176609, "epoch": 1459} {"train_loss": -38.12548065185547, "global_step": 176610, "epoch": 1459} {"train_loss": -37.836830139160156, "global_step": 176611, "epoch": 1459} {"train_loss": -38.153350830078125, "global_step": 176612, "epoch": 1459} {"train_loss": -39.06604766845703, "global_step": 176613, "epoch": 1459} {"train_loss": -38.709232330322266, "global_step": 176614, "epoch": 1459} {"train_loss": -39.20905685424805, "global_step": 176615, "epoch": 1459} {"train_loss": -39.549530029296875, "global_step": 176616, "epoch": 1459} {"train_loss": -37.9178352355957, "global_step": 176617, "epoch": 1459} {"train_loss": -40.31980895996094, "global_step": 176618, "epoch": 1459} {"train_loss": -37.90887451171875, "global_step": 176619, "epoch": 1459} {"train_loss": -38.76646041870117, "global_step": 176620, "epoch": 1459} {"train_loss": -38.59565353393555, "global_step": 176621, "epoch": 1459} {"train_loss": -38.47587585449219, "global_step": 176622, "epoch": 1459} {"train_loss": -39.959285736083984, "global_step": 176623, "epoch": 1459} {"train_loss": -39.035614013671875, "global_step": 176624, "epoch": 1459} {"train_loss": -38.73846435546875, "global_step": 176625, "epoch": 1459} {"train_loss": -39.53690719604492, "global_step": 176626, "epoch": 1459} {"train_loss": -39.94930648803711, "global_step": 176627, "epoch": 1459} {"train_loss": -39.0191535949707, "global_step": 176628, "epoch": 1459} {"train_loss": -39.41752243041992, "global_step": 176629, "epoch": 1459} {"train_loss": -39.488868713378906, "global_step": 176630, "epoch": 1459} {"train_loss": -38.968135833740234, "global_step": 176631, "epoch": 1459} {"train_loss": -40.07817840576172, "global_step": 176632, "epoch": 1459} {"train_loss": -39.450321197509766, "global_step": 176633, "epoch": 1459} {"train_loss": -39.471778869628906, "global_step": 176634, "epoch": 1459} {"train_loss": -39.578392028808594, "global_step": 176635, "epoch": 1459} {"train_loss": -40.2647590637207, "global_step": 176636, "epoch": 1459} {"train_loss": -40.229740142822266, "global_step": 176637, "epoch": 1459} {"train_loss": -38.9173698425293, "global_step": 176638, "epoch": 1459} {"train_loss": -40.104248046875, "global_step": 176639, "epoch": 1459} {"train_loss": -40.381591796875, "global_step": 176640, "epoch": 1459} {"train_loss": -40.03595733642578, "global_step": 176641, "epoch": 1459} {"train_loss": -40.123016357421875, "global_step": 176642, "epoch": 1459} {"train_loss": -39.656124114990234, "global_step": 176643, "epoch": 1459} {"train_loss": -39.43241500854492, "global_step": 176644, "epoch": 1459} {"train_loss": -39.7782096862793, "global_step": 176645, "epoch": 1459} {"train_loss": -40.90810012817383, "global_step": 176646, "epoch": 1459} {"train_loss": -39.784454345703125, "global_step": 176647, "epoch": 1459} {"train_loss": -37.65629577636719, "global_step": 176648, "epoch": 1459} {"train_loss": -37.21320343017578, "global_step": 176649, "epoch": 1459} {"train_loss": -40.74989700317383, "global_step": 176650, "epoch": 1459} {"train_loss": -40.176368713378906, "global_step": 176651, "epoch": 1459} {"train_loss": -40.86159896850586, "global_step": 176652, "epoch": 1459} {"train_loss": -40.89146423339844, "global_step": 176653, "epoch": 1459} {"train_loss": -40.69362258911133, "global_step": 176654, "epoch": 1459} {"train_loss": -40.103580474853516, "global_step": 176655, "epoch": 1459} {"train_loss": -40.780860900878906, "global_step": 176656, "epoch": 1459} {"train_loss": -40.016334533691406, "global_step": 176657, "epoch": 1459} {"train_loss": -39.896507263183594, "global_step": 176658, "epoch": 1459} {"train_loss": -39.32577461053517, "global_step": 176659, "epoch": 1459, "val_loss": 2649056.0} {"train_loss": -41.0046501159668, "global_step": 176660, "epoch": 1460} {"train_loss": -40.769039154052734, "global_step": 176661, "epoch": 1460} {"train_loss": -40.3489875793457, "global_step": 176662, "epoch": 1460} {"train_loss": -41.04364776611328, "global_step": 176663, "epoch": 1460} {"train_loss": -40.67121124267578, "global_step": 176664, "epoch": 1460} {"train_loss": -38.63348388671875, "global_step": 176665, "epoch": 1460} {"train_loss": -39.40766906738281, "global_step": 176666, "epoch": 1460} {"train_loss": -40.81966018676758, "global_step": 176667, "epoch": 1460} {"train_loss": -41.31940460205078, "global_step": 176668, "epoch": 1460} {"train_loss": -41.13297653198242, "global_step": 176669, "epoch": 1460} {"train_loss": -39.3809928894043, "global_step": 176670, "epoch": 1460} {"train_loss": -39.00729751586914, "global_step": 176671, "epoch": 1460} {"train_loss": -37.16512680053711, "global_step": 176672, "epoch": 1460} {"train_loss": -33.91048812866211, "global_step": 176673, "epoch": 1460} {"train_loss": -37.79523468017578, "global_step": 176674, "epoch": 1460} {"train_loss": -39.011077880859375, "global_step": 176675, "epoch": 1460} {"train_loss": -37.31731033325195, "global_step": 176676, "epoch": 1460} {"train_loss": -39.85140609741211, "global_step": 176677, "epoch": 1460} {"train_loss": -39.76142501831055, "global_step": 176678, "epoch": 1460} {"train_loss": -40.54832077026367, "global_step": 176679, "epoch": 1460} {"train_loss": -39.63209915161133, "global_step": 176680, "epoch": 1460} {"train_loss": -39.27920913696289, "global_step": 176681, "epoch": 1460} {"train_loss": -39.49508285522461, "global_step": 176682, "epoch": 1460} {"train_loss": -40.03860092163086, "global_step": 176683, "epoch": 1460} {"train_loss": -40.69044876098633, "global_step": 176684, "epoch": 1460} {"train_loss": -39.81425094604492, "global_step": 176685, "epoch": 1460} {"train_loss": -40.16303634643555, "global_step": 176686, "epoch": 1460} {"train_loss": -39.364356994628906, "global_step": 176687, "epoch": 1460} {"train_loss": -40.23873519897461, "global_step": 176688, "epoch": 1460} {"train_loss": -40.39506912231445, "global_step": 176689, "epoch": 1460} {"train_loss": -40.858577728271484, "global_step": 176690, "epoch": 1460} {"train_loss": -40.47974395751953, "global_step": 176691, "epoch": 1460} {"train_loss": -39.010108947753906, "global_step": 176692, "epoch": 1460} {"train_loss": -40.75018310546875, "global_step": 176693, "epoch": 1460} {"train_loss": -41.12453842163086, "global_step": 176694, "epoch": 1460} {"train_loss": -41.0085334777832, "global_step": 176695, "epoch": 1460} {"train_loss": -40.24485397338867, "global_step": 176696, "epoch": 1460} {"train_loss": -40.04695510864258, "global_step": 176697, "epoch": 1460} {"train_loss": -39.75114822387695, "global_step": 176698, "epoch": 1460} {"train_loss": -39.342201232910156, "global_step": 176699, "epoch": 1460} {"train_loss": -39.902706146240234, "global_step": 176700, "epoch": 1460} {"train_loss": -40.05430221557617, "global_step": 176701, "epoch": 1460} {"train_loss": -40.79310989379883, "global_step": 176702, "epoch": 1460} {"train_loss": -40.14700698852539, "global_step": 176703, "epoch": 1460} {"train_loss": -38.29298782348633, "global_step": 176704, "epoch": 1460} {"train_loss": -37.464263916015625, "global_step": 176705, "epoch": 1460} {"train_loss": -38.75236892700195, "global_step": 176706, "epoch": 1460} {"train_loss": -39.19002914428711, "global_step": 176707, "epoch": 1460} {"train_loss": -39.73703384399414, "global_step": 176708, "epoch": 1460} {"train_loss": -40.22544479370117, "global_step": 176709, "epoch": 1460} {"train_loss": -34.33515167236328, "global_step": 176710, "epoch": 1460} {"train_loss": -38.04541778564453, "global_step": 176711, "epoch": 1460} {"train_loss": -39.60799789428711, "global_step": 176712, "epoch": 1460} {"train_loss": -38.58278274536133, "global_step": 176713, "epoch": 1460} {"train_loss": -39.21894454956055, "global_step": 176714, "epoch": 1460} {"train_loss": -38.866764068603516, "global_step": 176715, "epoch": 1460} {"train_loss": -40.475059509277344, "global_step": 176716, "epoch": 1460} {"train_loss": -39.33833312988281, "global_step": 176717, "epoch": 1460} {"train_loss": -36.9797477722168, "global_step": 176718, "epoch": 1460} {"train_loss": -38.88134002685547, "global_step": 176719, "epoch": 1460} {"train_loss": -40.01641082763672, "global_step": 176720, "epoch": 1460} {"train_loss": -34.90943145751953, "global_step": 176721, "epoch": 1460} {"train_loss": -39.980533599853516, "global_step": 176722, "epoch": 1460} {"train_loss": -39.22810363769531, "global_step": 176723, "epoch": 1460} {"train_loss": -38.93153762817383, "global_step": 176724, "epoch": 1460} {"train_loss": -31.251392364501953, "global_step": 176725, "epoch": 1460} {"train_loss": -37.43598937988281, "global_step": 176726, "epoch": 1460} {"train_loss": -38.1678466796875, "global_step": 176727, "epoch": 1460} {"train_loss": -39.30339813232422, "global_step": 176728, "epoch": 1460} {"train_loss": -39.413429260253906, "global_step": 176729, "epoch": 1460} {"train_loss": -40.156158447265625, "global_step": 176730, "epoch": 1460} {"train_loss": -38.6547737121582, "global_step": 176731, "epoch": 1460} {"train_loss": -39.30877685546875, "global_step": 176732, "epoch": 1460} {"train_loss": -37.88810348510742, "global_step": 176733, "epoch": 1460} {"train_loss": -39.3512077331543, "global_step": 176734, "epoch": 1460} {"train_loss": -38.75983428955078, "global_step": 176735, "epoch": 1460} {"train_loss": -32.03084945678711, "global_step": 176736, "epoch": 1460} {"train_loss": -39.37590408325195, "global_step": 176737, "epoch": 1460} {"train_loss": -38.58998489379883, "global_step": 176738, "epoch": 1460} {"train_loss": -37.31003952026367, "global_step": 176739, "epoch": 1460} {"train_loss": -36.53191375732422, "global_step": 176740, "epoch": 1460} {"train_loss": -39.8306999206543, "global_step": 176741, "epoch": 1460} {"train_loss": -39.65083694458008, "global_step": 176742, "epoch": 1460} {"train_loss": -38.11075973510742, "global_step": 176743, "epoch": 1460} {"train_loss": -39.281192779541016, "global_step": 176744, "epoch": 1460} {"train_loss": -39.00568771362305, "global_step": 176745, "epoch": 1460} {"train_loss": -38.3444709777832, "global_step": 176746, "epoch": 1460} {"train_loss": -40.073116302490234, "global_step": 176747, "epoch": 1460} {"train_loss": -39.688232421875, "global_step": 176748, "epoch": 1460} {"train_loss": -36.78744125366211, "global_step": 176749, "epoch": 1460} {"train_loss": -39.7008056640625, "global_step": 176750, "epoch": 1460} {"train_loss": -39.127662658691406, "global_step": 176751, "epoch": 1460} {"train_loss": -38.779170989990234, "global_step": 176752, "epoch": 1460} {"train_loss": -40.27885055541992, "global_step": 176753, "epoch": 1460} {"train_loss": -39.66500473022461, "global_step": 176754, "epoch": 1460} {"train_loss": -38.98061752319336, "global_step": 176755, "epoch": 1460} {"train_loss": -40.19313049316406, "global_step": 176756, "epoch": 1460} {"train_loss": -34.28925704956055, "global_step": 176757, "epoch": 1460} {"train_loss": -39.29624557495117, "global_step": 176758, "epoch": 1460} {"train_loss": -39.910064697265625, "global_step": 176759, "epoch": 1460} {"train_loss": -38.32257080078125, "global_step": 176760, "epoch": 1460} {"train_loss": -40.011470794677734, "global_step": 176761, "epoch": 1460} {"train_loss": -39.79182815551758, "global_step": 176762, "epoch": 1460} {"train_loss": -39.835994720458984, "global_step": 176763, "epoch": 1460} {"train_loss": -31.452392578125, "global_step": 176764, "epoch": 1460} {"train_loss": -38.32204818725586, "global_step": 176765, "epoch": 1460} {"train_loss": -34.564849853515625, "global_step": 176766, "epoch": 1460} {"train_loss": -39.50186538696289, "global_step": 176767, "epoch": 1460} {"train_loss": -39.32312774658203, "global_step": 176768, "epoch": 1460} {"train_loss": -38.3442268371582, "global_step": 176769, "epoch": 1460} {"train_loss": -38.60044860839844, "global_step": 176770, "epoch": 1460} {"train_loss": -38.5649299621582, "global_step": 176771, "epoch": 1460} {"train_loss": -39.51359176635742, "global_step": 176772, "epoch": 1460} {"train_loss": -35.69282531738281, "global_step": 176773, "epoch": 1460} {"train_loss": -39.838680267333984, "global_step": 176774, "epoch": 1460} {"train_loss": -34.679588317871094, "global_step": 176775, "epoch": 1460} {"train_loss": -38.47452926635742, "global_step": 176776, "epoch": 1460} {"train_loss": -39.62470626831055, "global_step": 176777, "epoch": 1460} {"train_loss": -38.78321075439453, "global_step": 176778, "epoch": 1460} {"train_loss": -39.9587287902832, "global_step": 176779, "epoch": 1460} {"train_loss": -38.90246623015601, "global_step": 176780, "epoch": 1460, "val_loss": 2555772.0} {"train_loss": -40.08217239379883, "global_step": 176781, "epoch": 1461} {"train_loss": -40.04047775268555, "global_step": 176782, "epoch": 1461} {"train_loss": -37.57568359375, "global_step": 176783, "epoch": 1461} {"train_loss": -39.368831634521484, "global_step": 176784, "epoch": 1461} {"train_loss": -38.02924728393555, "global_step": 176785, "epoch": 1461} {"train_loss": -36.11454391479492, "global_step": 176786, "epoch": 1461} {"train_loss": -37.719844818115234, "global_step": 176787, "epoch": 1461} {"train_loss": -39.258827209472656, "global_step": 176788, "epoch": 1461} {"train_loss": -37.64663314819336, "global_step": 176789, "epoch": 1461} {"train_loss": -36.35871505737305, "global_step": 176790, "epoch": 1461} {"train_loss": -39.36983108520508, "global_step": 176791, "epoch": 1461} {"train_loss": -35.98906326293945, "global_step": 176792, "epoch": 1461} {"train_loss": -38.57477951049805, "global_step": 176793, "epoch": 1461} {"train_loss": -39.83943176269531, "global_step": 176794, "epoch": 1461} {"train_loss": -36.77189254760742, "global_step": 176795, "epoch": 1461} {"train_loss": -32.47483444213867, "global_step": 176796, "epoch": 1461} {"train_loss": -38.07366943359375, "global_step": 176797, "epoch": 1461} {"train_loss": -38.00309371948242, "global_step": 176798, "epoch": 1461} {"train_loss": -38.914939880371094, "global_step": 176799, "epoch": 1461} {"train_loss": -37.072696685791016, "global_step": 176800, "epoch": 1461} {"train_loss": -38.836387634277344, "global_step": 176801, "epoch": 1461} {"train_loss": -35.33028030395508, "global_step": 176802, "epoch": 1461} {"train_loss": -38.08979034423828, "global_step": 176803, "epoch": 1461} {"train_loss": -38.40346908569336, "global_step": 176804, "epoch": 1461} {"train_loss": -35.629817962646484, "global_step": 176805, "epoch": 1461} {"train_loss": -37.51337814331055, "global_step": 176806, "epoch": 1461} {"train_loss": -39.242374420166016, "global_step": 176807, "epoch": 1461} {"train_loss": -38.16077423095703, "global_step": 176808, "epoch": 1461} {"train_loss": -39.04803466796875, "global_step": 176809, "epoch": 1461} {"train_loss": -37.2886962890625, "global_step": 176810, "epoch": 1461} {"train_loss": -38.77779769897461, "global_step": 176811, "epoch": 1461} {"train_loss": -38.95115280151367, "global_step": 176812, "epoch": 1461} {"train_loss": -37.96320724487305, "global_step": 176813, "epoch": 1461} {"train_loss": -38.83135223388672, "global_step": 176814, "epoch": 1461} {"train_loss": -37.48610305786133, "global_step": 176815, "epoch": 1461} {"train_loss": -39.30836486816406, "global_step": 176816, "epoch": 1461} {"train_loss": -38.40220260620117, "global_step": 176817, "epoch": 1461} {"train_loss": -39.89103317260742, "global_step": 176818, "epoch": 1461} {"train_loss": -39.089542388916016, "global_step": 176819, "epoch": 1461} {"train_loss": -36.252437591552734, "global_step": 176820, "epoch": 1461} {"train_loss": -39.004817962646484, "global_step": 176821, "epoch": 1461} {"train_loss": -38.84772491455078, "global_step": 176822, "epoch": 1461} {"train_loss": -36.81079864501953, "global_step": 176823, "epoch": 1461} {"train_loss": -38.674652099609375, "global_step": 176824, "epoch": 1461} {"train_loss": -39.37186813354492, "global_step": 176825, "epoch": 1461} {"train_loss": -39.84010696411133, "global_step": 176826, "epoch": 1461} {"train_loss": -39.139991760253906, "global_step": 176827, "epoch": 1461} {"train_loss": -36.387943267822266, "global_step": 176828, "epoch": 1461} {"train_loss": -35.69240951538086, "global_step": 176829, "epoch": 1461} {"train_loss": -39.564483642578125, "global_step": 176830, "epoch": 1461} {"train_loss": -38.05465316772461, "global_step": 176831, "epoch": 1461} {"train_loss": -38.94862747192383, "global_step": 176832, "epoch": 1461} {"train_loss": -38.9232177734375, "global_step": 176833, "epoch": 1461} {"train_loss": -39.1771125793457, "global_step": 176834, "epoch": 1461} {"train_loss": -37.76909255981445, "global_step": 176835, "epoch": 1461} {"train_loss": -39.20283889770508, "global_step": 176836, "epoch": 1461} {"train_loss": -37.732139587402344, "global_step": 176837, "epoch": 1461} {"train_loss": -39.64899444580078, "global_step": 176838, "epoch": 1461} {"train_loss": -37.99868392944336, "global_step": 176839, "epoch": 1461} {"train_loss": -36.538997650146484, "global_step": 176840, "epoch": 1461} {"train_loss": -39.16358184814453, "global_step": 176841, "epoch": 1461} {"train_loss": -39.328758239746094, "global_step": 176842, "epoch": 1461} {"train_loss": -39.82155227661133, "global_step": 176843, "epoch": 1461} {"train_loss": -38.88351058959961, "global_step": 176844, "epoch": 1461} {"train_loss": -38.32404327392578, "global_step": 176845, "epoch": 1461} {"train_loss": -38.329776763916016, "global_step": 176846, "epoch": 1461} {"train_loss": -39.7484245300293, "global_step": 176847, "epoch": 1461} {"train_loss": -39.11042022705078, "global_step": 176848, "epoch": 1461} {"train_loss": -40.110939025878906, "global_step": 176849, "epoch": 1461} {"train_loss": -39.865604400634766, "global_step": 176850, "epoch": 1461} {"train_loss": -39.37852478027344, "global_step": 176851, "epoch": 1461} {"train_loss": -39.767311096191406, "global_step": 176852, "epoch": 1461} {"train_loss": -40.09632110595703, "global_step": 176853, "epoch": 1461} {"train_loss": -39.1422004699707, "global_step": 176854, "epoch": 1461} {"train_loss": -39.541473388671875, "global_step": 176855, "epoch": 1461} {"train_loss": -39.67546463012695, "global_step": 176856, "epoch": 1461} {"train_loss": -39.65024948120117, "global_step": 176857, "epoch": 1461} {"train_loss": -39.548072814941406, "global_step": 176858, "epoch": 1461} {"train_loss": -37.501953125, "global_step": 176859, "epoch": 1461} {"train_loss": -39.98452377319336, "global_step": 176860, "epoch": 1461} {"train_loss": -38.97353744506836, "global_step": 176861, "epoch": 1461} {"train_loss": -39.50654220581055, "global_step": 176862, "epoch": 1461} {"train_loss": -39.19838333129883, "global_step": 176863, "epoch": 1461} {"train_loss": -37.6640739440918, "global_step": 176864, "epoch": 1461} {"train_loss": -39.020301818847656, "global_step": 176865, "epoch": 1461} {"train_loss": -40.22589874267578, "global_step": 176866, "epoch": 1461} {"train_loss": -39.5348014831543, "global_step": 176867, "epoch": 1461} {"train_loss": -39.21631622314453, "global_step": 176868, "epoch": 1461} {"train_loss": -39.81201171875, "global_step": 176869, "epoch": 1461} {"train_loss": -40.11756896972656, "global_step": 176870, "epoch": 1461} {"train_loss": -39.36052703857422, "global_step": 176871, "epoch": 1461} {"train_loss": -39.6192626953125, "global_step": 176872, "epoch": 1461} {"train_loss": -40.031185150146484, "global_step": 176873, "epoch": 1461} {"train_loss": -39.726322174072266, "global_step": 176874, "epoch": 1461} {"train_loss": -38.47785568237305, "global_step": 176875, "epoch": 1461} {"train_loss": -39.15037536621094, "global_step": 176876, "epoch": 1461} {"train_loss": -38.71504211425781, "global_step": 176877, "epoch": 1461} {"train_loss": -39.014678955078125, "global_step": 176878, "epoch": 1461} {"train_loss": -38.64823913574219, "global_step": 176879, "epoch": 1461} {"train_loss": -39.852012634277344, "global_step": 176880, "epoch": 1461} {"train_loss": -39.66981887817383, "global_step": 176881, "epoch": 1461} {"train_loss": -39.129974365234375, "global_step": 176882, "epoch": 1461} {"train_loss": -38.9879264831543, "global_step": 176883, "epoch": 1461} {"train_loss": -40.20826721191406, "global_step": 176884, "epoch": 1461} {"train_loss": -40.19527053833008, "global_step": 176885, "epoch": 1461} {"train_loss": -39.76593017578125, "global_step": 176886, "epoch": 1461} {"train_loss": -40.383846282958984, "global_step": 176887, "epoch": 1461} {"train_loss": -40.56150436401367, "global_step": 176888, "epoch": 1461} {"train_loss": -39.2839241027832, "global_step": 176889, "epoch": 1461} {"train_loss": -39.16399002075195, "global_step": 176890, "epoch": 1461} {"train_loss": -40.230712890625, "global_step": 176891, "epoch": 1461} {"train_loss": -40.1646842956543, "global_step": 176892, "epoch": 1461} {"train_loss": -39.60560989379883, "global_step": 176893, "epoch": 1461} {"train_loss": -39.93513107299805, "global_step": 176894, "epoch": 1461} {"train_loss": -40.07318878173828, "global_step": 176895, "epoch": 1461} {"train_loss": -39.9814453125, "global_step": 176896, "epoch": 1461} {"train_loss": -40.37122344970703, "global_step": 176897, "epoch": 1461} {"train_loss": -40.253204345703125, "global_step": 176898, "epoch": 1461} {"train_loss": -40.63187026977539, "global_step": 176899, "epoch": 1461} {"train_loss": -39.46440505981445, "global_step": 176900, "epoch": 1461} {"train_loss": -38.82877239511033, "global_step": 176901, "epoch": 1461, "val_loss": 2599458.0} {"train_loss": -40.41252517700195, "global_step": 176902, "epoch": 1462} {"train_loss": -40.21213912963867, "global_step": 176903, "epoch": 1462} {"train_loss": -40.54012680053711, "global_step": 176904, "epoch": 1462} {"train_loss": -40.305389404296875, "global_step": 176905, "epoch": 1462} {"train_loss": -39.6988639831543, "global_step": 176906, "epoch": 1462} {"train_loss": -39.05611038208008, "global_step": 176907, "epoch": 1462} {"train_loss": -40.262001037597656, "global_step": 176908, "epoch": 1462} {"train_loss": -39.217193603515625, "global_step": 176909, "epoch": 1462} {"train_loss": -39.362369537353516, "global_step": 176910, "epoch": 1462} {"train_loss": -40.46931457519531, "global_step": 176911, "epoch": 1462} {"train_loss": -39.03116226196289, "global_step": 176912, "epoch": 1462} {"train_loss": -39.13277053833008, "global_step": 176913, "epoch": 1462} {"train_loss": -39.46257019042969, "global_step": 176914, "epoch": 1462} {"train_loss": -40.01647186279297, "global_step": 176915, "epoch": 1462} {"train_loss": -39.838233947753906, "global_step": 176916, "epoch": 1462} {"train_loss": -40.861507415771484, "global_step": 176917, "epoch": 1462} {"train_loss": -39.413055419921875, "global_step": 176918, "epoch": 1462} {"train_loss": -39.654327392578125, "global_step": 176919, "epoch": 1462} {"train_loss": -39.0590705871582, "global_step": 176920, "epoch": 1462} {"train_loss": -39.498287200927734, "global_step": 176921, "epoch": 1462} {"train_loss": -38.967525482177734, "global_step": 176922, "epoch": 1462} {"train_loss": -39.19405746459961, "global_step": 176923, "epoch": 1462} {"train_loss": -39.49205017089844, "global_step": 176924, "epoch": 1462} {"train_loss": -39.294029235839844, "global_step": 176925, "epoch": 1462} {"train_loss": -38.297542572021484, "global_step": 176926, "epoch": 1462} {"train_loss": -36.143959045410156, "global_step": 176927, "epoch": 1462} {"train_loss": -36.71467208862305, "global_step": 176928, "epoch": 1462} {"train_loss": -38.603111267089844, "global_step": 176929, "epoch": 1462} {"train_loss": -40.42396926879883, "global_step": 176930, "epoch": 1462} {"train_loss": -40.32550048828125, "global_step": 176931, "epoch": 1462} {"train_loss": -39.83230209350586, "global_step": 176932, "epoch": 1462} {"train_loss": -40.551509857177734, "global_step": 176933, "epoch": 1462} {"train_loss": -40.6580810546875, "global_step": 176934, "epoch": 1462} {"train_loss": -38.263206481933594, "global_step": 176935, "epoch": 1462} {"train_loss": -39.4941291809082, "global_step": 176936, "epoch": 1462} {"train_loss": -40.088748931884766, "global_step": 176937, "epoch": 1462} {"train_loss": -39.878395080566406, "global_step": 176938, "epoch": 1462} {"train_loss": -40.8519401550293, "global_step": 176939, "epoch": 1462} {"train_loss": -40.3398551940918, "global_step": 176940, "epoch": 1462} {"train_loss": -39.05743408203125, "global_step": 176941, "epoch": 1462} {"train_loss": -39.553863525390625, "global_step": 176942, "epoch": 1462} {"train_loss": -40.274871826171875, "global_step": 176943, "epoch": 1462} {"train_loss": -40.439064025878906, "global_step": 176944, "epoch": 1462} {"train_loss": -39.395294189453125, "global_step": 176945, "epoch": 1462} {"train_loss": -40.12230682373047, "global_step": 176946, "epoch": 1462} {"train_loss": -40.90341567993164, "global_step": 176947, "epoch": 1462} {"train_loss": -39.450462341308594, "global_step": 176948, "epoch": 1462} {"train_loss": -40.100440979003906, "global_step": 176949, "epoch": 1462} {"train_loss": -40.63481521606445, "global_step": 176950, "epoch": 1462} {"train_loss": -40.229225158691406, "global_step": 176951, "epoch": 1462} {"train_loss": -40.63296127319336, "global_step": 176952, "epoch": 1462} {"train_loss": -40.82340621948242, "global_step": 176953, "epoch": 1462} {"train_loss": -39.77131271362305, "global_step": 176954, "epoch": 1462} {"train_loss": -40.05446243286133, "global_step": 176955, "epoch": 1462} {"train_loss": -40.6156005859375, "global_step": 176956, "epoch": 1462} {"train_loss": -40.223201751708984, "global_step": 176957, "epoch": 1462} {"train_loss": -40.536312103271484, "global_step": 176958, "epoch": 1462} {"train_loss": -40.97591018676758, "global_step": 176959, "epoch": 1462} {"train_loss": -40.765838623046875, "global_step": 176960, "epoch": 1462} {"train_loss": -40.67749786376953, "global_step": 176961, "epoch": 1462} {"train_loss": -40.730316162109375, "global_step": 176962, "epoch": 1462} {"train_loss": -40.97455978393555, "global_step": 176963, "epoch": 1462} {"train_loss": -41.14565658569336, "global_step": 176964, "epoch": 1462} {"train_loss": -40.75788116455078, "global_step": 176965, "epoch": 1462} {"train_loss": -40.012481689453125, "global_step": 176966, "epoch": 1462} {"train_loss": -40.9958610534668, "global_step": 176967, "epoch": 1462} {"train_loss": -40.55621337890625, "global_step": 176968, "epoch": 1462} {"train_loss": -40.93624496459961, "global_step": 176969, "epoch": 1462} {"train_loss": -40.270050048828125, "global_step": 176970, "epoch": 1462} {"train_loss": -39.181453704833984, "global_step": 176971, "epoch": 1462} {"train_loss": -37.57231521606445, "global_step": 176972, "epoch": 1462} {"train_loss": -35.308143615722656, "global_step": 176973, "epoch": 1462} {"train_loss": -34.15792465209961, "global_step": 176974, "epoch": 1462} {"train_loss": -37.22801208496094, "global_step": 176975, "epoch": 1462} {"train_loss": -38.60786819458008, "global_step": 176976, "epoch": 1462} {"train_loss": -38.91005325317383, "global_step": 176977, "epoch": 1462} {"train_loss": -38.87382888793945, "global_step": 176978, "epoch": 1462} {"train_loss": -33.55270004272461, "global_step": 176979, "epoch": 1462} {"train_loss": -39.848388671875, "global_step": 176980, "epoch": 1462} {"train_loss": -35.58683395385742, "global_step": 176981, "epoch": 1462} {"train_loss": -39.24326705932617, "global_step": 176982, "epoch": 1462} {"train_loss": -37.097412109375, "global_step": 176983, "epoch": 1462} {"train_loss": -38.7883415222168, "global_step": 176984, "epoch": 1462} {"train_loss": -39.03369140625, "global_step": 176985, "epoch": 1462} {"train_loss": -36.916664123535156, "global_step": 176986, "epoch": 1462} {"train_loss": -39.639015197753906, "global_step": 176987, "epoch": 1462} {"train_loss": -37.88249969482422, "global_step": 176988, "epoch": 1462} {"train_loss": -37.902008056640625, "global_step": 176989, "epoch": 1462} {"train_loss": -39.73496627807617, "global_step": 176990, "epoch": 1462} {"train_loss": -39.32625961303711, "global_step": 176991, "epoch": 1462} {"train_loss": -38.40730667114258, "global_step": 176992, "epoch": 1462} {"train_loss": -39.78278732299805, "global_step": 176993, "epoch": 1462} {"train_loss": -39.724849700927734, "global_step": 176994, "epoch": 1462} {"train_loss": -38.920265197753906, "global_step": 176995, "epoch": 1462} {"train_loss": -38.863338470458984, "global_step": 176996, "epoch": 1462} {"train_loss": -40.67706298828125, "global_step": 176997, "epoch": 1462} {"train_loss": -39.625728607177734, "global_step": 176998, "epoch": 1462} {"train_loss": -40.13945007324219, "global_step": 176999, "epoch": 1462} {"train_loss": -40.56843566894531, "global_step": 177000, "epoch": 1462} {"train_loss": -40.750396728515625, "global_step": 177001, "epoch": 1462} {"train_loss": -40.39801025390625, "global_step": 177002, "epoch": 1462} {"train_loss": -40.44557571411133, "global_step": 177003, "epoch": 1462} {"train_loss": -40.37577819824219, "global_step": 177004, "epoch": 1462} {"train_loss": -40.4036865234375, "global_step": 177005, "epoch": 1462} {"train_loss": -40.39876937866211, "global_step": 177006, "epoch": 1462} {"train_loss": -40.31458282470703, "global_step": 177007, "epoch": 1462} {"train_loss": -40.911170959472656, "global_step": 177008, "epoch": 1462} {"train_loss": -40.719181060791016, "global_step": 177009, "epoch": 1462} {"train_loss": -41.127166748046875, "global_step": 177010, "epoch": 1462} {"train_loss": -40.950836181640625, "global_step": 177011, "epoch": 1462} {"train_loss": -40.95850372314453, "global_step": 177012, "epoch": 1462} {"train_loss": -39.937599182128906, "global_step": 177013, "epoch": 1462} {"train_loss": -40.96725082397461, "global_step": 177014, "epoch": 1462} {"train_loss": -40.851680755615234, "global_step": 177015, "epoch": 1462} {"train_loss": -40.923152923583984, "global_step": 177016, "epoch": 1462} {"train_loss": -40.68192672729492, "global_step": 177017, "epoch": 1462} {"train_loss": -37.83695983886719, "global_step": 177018, "epoch": 1462} {"train_loss": -41.2332763671875, "global_step": 177019, "epoch": 1462} {"train_loss": -40.471527099609375, "global_step": 177020, "epoch": 1462} {"train_loss": -40.777042388916016, "global_step": 177021, "epoch": 1462} {"train_loss": -39.64611570500145, "global_step": 177022, "epoch": 1462, "val_loss": 2484404.5} {"train_loss": -40.68587112426758, "global_step": 177023, "epoch": 1463} {"train_loss": -40.576072692871094, "global_step": 177024, "epoch": 1463} {"train_loss": -41.1935920715332, "global_step": 177025, "epoch": 1463} {"train_loss": -41.03791046142578, "global_step": 177026, "epoch": 1463} {"train_loss": -39.64980697631836, "global_step": 177027, "epoch": 1463} {"train_loss": -39.98747634887695, "global_step": 177028, "epoch": 1463} {"train_loss": -39.52781295776367, "global_step": 177029, "epoch": 1463} {"train_loss": -41.183746337890625, "global_step": 177030, "epoch": 1463} {"train_loss": -41.549110412597656, "global_step": 177031, "epoch": 1463} {"train_loss": -41.53895950317383, "global_step": 177032, "epoch": 1463} {"train_loss": -41.18655014038086, "global_step": 177033, "epoch": 1463} {"train_loss": -41.398006439208984, "global_step": 177034, "epoch": 1463} {"train_loss": -41.223567962646484, "global_step": 177035, "epoch": 1463} {"train_loss": -39.44801712036133, "global_step": 177036, "epoch": 1463} {"train_loss": -37.556488037109375, "global_step": 177037, "epoch": 1463} {"train_loss": -39.33005905151367, "global_step": 177038, "epoch": 1463} {"train_loss": -40.27497100830078, "global_step": 177039, "epoch": 1463} {"train_loss": -38.39503860473633, "global_step": 177040, "epoch": 1463} {"train_loss": -38.783199310302734, "global_step": 177041, "epoch": 1463} {"train_loss": -37.948116302490234, "global_step": 177042, "epoch": 1463} {"train_loss": -36.17440414428711, "global_step": 177043, "epoch": 1463} {"train_loss": -38.013790130615234, "global_step": 177044, "epoch": 1463} {"train_loss": -38.94587326049805, "global_step": 177045, "epoch": 1463} {"train_loss": -35.81760787963867, "global_step": 177046, "epoch": 1463} {"train_loss": -37.2301139831543, "global_step": 177047, "epoch": 1463} {"train_loss": -36.41045379638672, "global_step": 177048, "epoch": 1463} {"train_loss": -39.51996994018555, "global_step": 177049, "epoch": 1463} {"train_loss": -38.3797607421875, "global_step": 177050, "epoch": 1463} {"train_loss": -39.72385787963867, "global_step": 177051, "epoch": 1463} {"train_loss": -39.5052604675293, "global_step": 177052, "epoch": 1463} {"train_loss": -37.76606369018555, "global_step": 177053, "epoch": 1463} {"train_loss": -40.101234436035156, "global_step": 177054, "epoch": 1463} {"train_loss": -37.876461029052734, "global_step": 177055, "epoch": 1463} {"train_loss": -38.431331634521484, "global_step": 177056, "epoch": 1463} {"train_loss": -38.01088333129883, "global_step": 177057, "epoch": 1463} {"train_loss": -39.93657302856445, "global_step": 177058, "epoch": 1463} {"train_loss": -38.56014633178711, "global_step": 177059, "epoch": 1463} {"train_loss": -33.70380783081055, "global_step": 177060, "epoch": 1463} {"train_loss": -40.43611526489258, "global_step": 177061, "epoch": 1463} {"train_loss": -36.55099105834961, "global_step": 177062, "epoch": 1463} {"train_loss": -37.51930618286133, "global_step": 177063, "epoch": 1463} {"train_loss": -39.842464447021484, "global_step": 177064, "epoch": 1463} {"train_loss": -33.459075927734375, "global_step": 177065, "epoch": 1463} {"train_loss": -38.71632385253906, "global_step": 177066, "epoch": 1463} {"train_loss": -37.31052780151367, "global_step": 177067, "epoch": 1463} {"train_loss": -38.547019958496094, "global_step": 177068, "epoch": 1463} {"train_loss": -39.11200714111328, "global_step": 177069, "epoch": 1463} {"train_loss": -38.11640548706055, "global_step": 177070, "epoch": 1463} {"train_loss": -36.72412872314453, "global_step": 177071, "epoch": 1463} {"train_loss": -35.02656173706055, "global_step": 177072, "epoch": 1463} {"train_loss": -37.85342788696289, "global_step": 177073, "epoch": 1463} {"train_loss": -37.79061508178711, "global_step": 177074, "epoch": 1463} {"train_loss": -32.97792053222656, "global_step": 177075, "epoch": 1463} {"train_loss": -38.99723434448242, "global_step": 177076, "epoch": 1463} {"train_loss": -39.416015625, "global_step": 177077, "epoch": 1463} {"train_loss": -36.281436920166016, "global_step": 177078, "epoch": 1463} {"train_loss": -39.36567687988281, "global_step": 177079, "epoch": 1463} {"train_loss": -38.12411880493164, "global_step": 177080, "epoch": 1463} {"train_loss": -38.99577713012695, "global_step": 177081, "epoch": 1463} {"train_loss": -39.336273193359375, "global_step": 177082, "epoch": 1463} {"train_loss": -39.14942169189453, "global_step": 177083, "epoch": 1463} {"train_loss": -38.83480453491211, "global_step": 177084, "epoch": 1463} {"train_loss": -38.157470703125, "global_step": 177085, "epoch": 1463} {"train_loss": -37.73206329345703, "global_step": 177086, "epoch": 1463} {"train_loss": -40.11550521850586, "global_step": 177087, "epoch": 1463} {"train_loss": -39.48585510253906, "global_step": 177088, "epoch": 1463} {"train_loss": -38.0937614440918, "global_step": 177089, "epoch": 1463} {"train_loss": -39.57844161987305, "global_step": 177090, "epoch": 1463} {"train_loss": -39.132347106933594, "global_step": 177091, "epoch": 1463} {"train_loss": -38.69637680053711, "global_step": 177092, "epoch": 1463} {"train_loss": -37.43537139892578, "global_step": 177093, "epoch": 1463} {"train_loss": -39.29702377319336, "global_step": 177094, "epoch": 1463} {"train_loss": -38.268272399902344, "global_step": 177095, "epoch": 1463} {"train_loss": -39.361473083496094, "global_step": 177096, "epoch": 1463} {"train_loss": -39.30162811279297, "global_step": 177097, "epoch": 1463} {"train_loss": -39.038326263427734, "global_step": 177098, "epoch": 1463} {"train_loss": -39.96688461303711, "global_step": 177099, "epoch": 1463} {"train_loss": -39.37760543823242, "global_step": 177100, "epoch": 1463} {"train_loss": -39.7842903137207, "global_step": 177101, "epoch": 1463} {"train_loss": -40.54533767700195, "global_step": 177102, "epoch": 1463} {"train_loss": -39.4266471862793, "global_step": 177103, "epoch": 1463} {"train_loss": -39.043548583984375, "global_step": 177104, "epoch": 1463} {"train_loss": -40.45258712768555, "global_step": 177105, "epoch": 1463} {"train_loss": -40.18321228027344, "global_step": 177106, "epoch": 1463} {"train_loss": -39.19799041748047, "global_step": 177107, "epoch": 1463} {"train_loss": -39.454837799072266, "global_step": 177108, "epoch": 1463} {"train_loss": -39.92666244506836, "global_step": 177109, "epoch": 1463} {"train_loss": -40.65437316894531, "global_step": 177110, "epoch": 1463} {"train_loss": -40.38883972167969, "global_step": 177111, "epoch": 1463} {"train_loss": -40.488739013671875, "global_step": 177112, "epoch": 1463} {"train_loss": -38.867733001708984, "global_step": 177113, "epoch": 1463} {"train_loss": -40.625282287597656, "global_step": 177114, "epoch": 1463} {"train_loss": -40.576446533203125, "global_step": 177115, "epoch": 1463} {"train_loss": -40.48445510864258, "global_step": 177116, "epoch": 1463} {"train_loss": -40.57334518432617, "global_step": 177117, "epoch": 1463} {"train_loss": -40.31657028198242, "global_step": 177118, "epoch": 1463} {"train_loss": -40.29705810546875, "global_step": 177119, "epoch": 1463} {"train_loss": -39.853302001953125, "global_step": 177120, "epoch": 1463} {"train_loss": -40.666229248046875, "global_step": 177121, "epoch": 1463} {"train_loss": -40.49199295043945, "global_step": 177122, "epoch": 1463} {"train_loss": -40.4682731628418, "global_step": 177123, "epoch": 1463} {"train_loss": -40.035701751708984, "global_step": 177124, "epoch": 1463} {"train_loss": -40.168785095214844, "global_step": 177125, "epoch": 1463} {"train_loss": -40.90373992919922, "global_step": 177126, "epoch": 1463} {"train_loss": -40.52448654174805, "global_step": 177127, "epoch": 1463} {"train_loss": -40.24382781982422, "global_step": 177128, "epoch": 1463} {"train_loss": -40.26184844970703, "global_step": 177129, "epoch": 1463} {"train_loss": -40.27149963378906, "global_step": 177130, "epoch": 1463} {"train_loss": -40.710601806640625, "global_step": 177131, "epoch": 1463} {"train_loss": -39.98627471923828, "global_step": 177132, "epoch": 1463} {"train_loss": -40.91416549682617, "global_step": 177133, "epoch": 1463} {"train_loss": -41.374752044677734, "global_step": 177134, "epoch": 1463} {"train_loss": -41.447288513183594, "global_step": 177135, "epoch": 1463} {"train_loss": -40.85023880004883, "global_step": 177136, "epoch": 1463} {"train_loss": -40.69390106201172, "global_step": 177137, "epoch": 1463} {"train_loss": -40.14563751220703, "global_step": 177138, "epoch": 1463} {"train_loss": -40.392887115478516, "global_step": 177139, "epoch": 1463} {"train_loss": -40.231956481933594, "global_step": 177140, "epoch": 1463} {"train_loss": -40.53096389770508, "global_step": 177141, "epoch": 1463} {"train_loss": -40.760128021240234, "global_step": 177142, "epoch": 1463} {"train_loss": -39.27416774655177, "global_step": 177143, "epoch": 1463, "val_loss": 2612361.25} {"train_loss": -40.22426986694336, "global_step": 177144, "epoch": 1464} {"train_loss": -40.378631591796875, "global_step": 177145, "epoch": 1464} {"train_loss": -40.95549774169922, "global_step": 177146, "epoch": 1464} {"train_loss": -40.51943588256836, "global_step": 177147, "epoch": 1464} {"train_loss": -39.36630630493164, "global_step": 177148, "epoch": 1464} {"train_loss": -38.4800910949707, "global_step": 177149, "epoch": 1464} {"train_loss": -34.811710357666016, "global_step": 177150, "epoch": 1464} {"train_loss": -34.36226272583008, "global_step": 177151, "epoch": 1464} {"train_loss": -30.772022247314453, "global_step": 177152, "epoch": 1464} {"train_loss": -31.106550216674805, "global_step": 177153, "epoch": 1464} {"train_loss": -30.537353515625, "global_step": 177154, "epoch": 1464} {"train_loss": -35.12186050415039, "global_step": 177155, "epoch": 1464} {"train_loss": -39.57511520385742, "global_step": 177156, "epoch": 1464} {"train_loss": -36.22803497314453, "global_step": 177157, "epoch": 1464} {"train_loss": -37.337886810302734, "global_step": 177158, "epoch": 1464} {"train_loss": -39.38624954223633, "global_step": 177159, "epoch": 1464} {"train_loss": -36.080162048339844, "global_step": 177160, "epoch": 1464} {"train_loss": -40.035667419433594, "global_step": 177161, "epoch": 1464} {"train_loss": -37.683956146240234, "global_step": 177162, "epoch": 1464} {"train_loss": -37.71157455444336, "global_step": 177163, "epoch": 1464} {"train_loss": -37.58736801147461, "global_step": 177164, "epoch": 1464} {"train_loss": -39.53028106689453, "global_step": 177165, "epoch": 1464} {"train_loss": -37.72816848754883, "global_step": 177166, "epoch": 1464} {"train_loss": -38.9231071472168, "global_step": 177167, "epoch": 1464} {"train_loss": -37.82270050048828, "global_step": 177168, "epoch": 1464} {"train_loss": -39.86857604980469, "global_step": 177169, "epoch": 1464} {"train_loss": -38.45624923706055, "global_step": 177170, "epoch": 1464} {"train_loss": -38.466033935546875, "global_step": 177171, "epoch": 1464} {"train_loss": -38.92975997924805, "global_step": 177172, "epoch": 1464} {"train_loss": -39.3135986328125, "global_step": 177173, "epoch": 1464} {"train_loss": -39.919246673583984, "global_step": 177174, "epoch": 1464} {"train_loss": -39.13642120361328, "global_step": 177175, "epoch": 1464} {"train_loss": -39.989009857177734, "global_step": 177176, "epoch": 1464} {"train_loss": -40.4260139465332, "global_step": 177177, "epoch": 1464} {"train_loss": -39.560302734375, "global_step": 177178, "epoch": 1464} {"train_loss": -40.441131591796875, "global_step": 177179, "epoch": 1464} {"train_loss": -39.616390228271484, "global_step": 177180, "epoch": 1464} {"train_loss": -38.61669158935547, "global_step": 177181, "epoch": 1464} {"train_loss": -39.940364837646484, "global_step": 177182, "epoch": 1464} {"train_loss": -39.83491134643555, "global_step": 177183, "epoch": 1464} {"train_loss": -40.2563362121582, "global_step": 177184, "epoch": 1464} {"train_loss": -40.0650634765625, "global_step": 177185, "epoch": 1464} {"train_loss": -39.216068267822266, "global_step": 177186, "epoch": 1464} {"train_loss": -41.13521957397461, "global_step": 177187, "epoch": 1464} {"train_loss": -40.62567138671875, "global_step": 177188, "epoch": 1464} {"train_loss": -40.871089935302734, "global_step": 177189, "epoch": 1464} {"train_loss": -40.5564079284668, "global_step": 177190, "epoch": 1464} {"train_loss": -40.82037353515625, "global_step": 177191, "epoch": 1464} {"train_loss": -40.954036712646484, "global_step": 177192, "epoch": 1464} {"train_loss": -41.061195373535156, "global_step": 177193, "epoch": 1464} {"train_loss": -40.54846954345703, "global_step": 177194, "epoch": 1464} {"train_loss": -40.442623138427734, "global_step": 177195, "epoch": 1464} {"train_loss": -39.5994758605957, "global_step": 177196, "epoch": 1464} {"train_loss": -40.48771286010742, "global_step": 177197, "epoch": 1464} {"train_loss": -39.67851638793945, "global_step": 177198, "epoch": 1464} {"train_loss": -41.25932693481445, "global_step": 177199, "epoch": 1464} {"train_loss": -41.1070671081543, "global_step": 177200, "epoch": 1464} {"train_loss": -41.02972412109375, "global_step": 177201, "epoch": 1464} {"train_loss": -40.9096565246582, "global_step": 177202, "epoch": 1464} {"train_loss": -40.883766174316406, "global_step": 177203, "epoch": 1464} {"train_loss": -40.68571853637695, "global_step": 177204, "epoch": 1464} {"train_loss": -40.86735153198242, "global_step": 177205, "epoch": 1464} {"train_loss": -40.520565032958984, "global_step": 177206, "epoch": 1464} {"train_loss": -41.45814895629883, "global_step": 177207, "epoch": 1464} {"train_loss": -40.54111099243164, "global_step": 177208, "epoch": 1464} {"train_loss": -40.99077224731445, "global_step": 177209, "epoch": 1464} {"train_loss": -40.68491744995117, "global_step": 177210, "epoch": 1464} {"train_loss": -41.021480560302734, "global_step": 177211, "epoch": 1464} {"train_loss": -41.03398513793945, "global_step": 177212, "epoch": 1464} {"train_loss": -40.752620697021484, "global_step": 177213, "epoch": 1464} {"train_loss": -40.5425910949707, "global_step": 177214, "epoch": 1464} {"train_loss": -40.98360824584961, "global_step": 177215, "epoch": 1464} {"train_loss": -41.010440826416016, "global_step": 177216, "epoch": 1464} {"train_loss": -41.31583023071289, "global_step": 177217, "epoch": 1464} {"train_loss": -41.29529571533203, "global_step": 177218, "epoch": 1464} {"train_loss": -40.770137786865234, "global_step": 177219, "epoch": 1464} {"train_loss": -40.572357177734375, "global_step": 177220, "epoch": 1464} {"train_loss": -41.5892333984375, "global_step": 177221, "epoch": 1464} {"train_loss": -40.85296630859375, "global_step": 177222, "epoch": 1464} {"train_loss": -41.13216018676758, "global_step": 177223, "epoch": 1464} {"train_loss": -40.857688903808594, "global_step": 177224, "epoch": 1464} {"train_loss": -40.319854736328125, "global_step": 177225, "epoch": 1464} {"train_loss": -37.42657470703125, "global_step": 177226, "epoch": 1464} {"train_loss": -33.54345703125, "global_step": 177227, "epoch": 1464} {"train_loss": -32.013160705566406, "global_step": 177228, "epoch": 1464} {"train_loss": -37.09406280517578, "global_step": 177229, "epoch": 1464} {"train_loss": -40.68213653564453, "global_step": 177230, "epoch": 1464} {"train_loss": -38.16650390625, "global_step": 177231, "epoch": 1464} {"train_loss": -36.478065490722656, "global_step": 177232, "epoch": 1464} {"train_loss": -40.74333190917969, "global_step": 177233, "epoch": 1464} {"train_loss": -39.9499626159668, "global_step": 177234, "epoch": 1464} {"train_loss": -38.06122970581055, "global_step": 177235, "epoch": 1464} {"train_loss": -40.51298522949219, "global_step": 177236, "epoch": 1464} {"train_loss": -38.73575210571289, "global_step": 177237, "epoch": 1464} {"train_loss": -38.957725524902344, "global_step": 177238, "epoch": 1464} {"train_loss": -39.932960510253906, "global_step": 177239, "epoch": 1464} {"train_loss": -38.923927307128906, "global_step": 177240, "epoch": 1464} {"train_loss": -39.122291564941406, "global_step": 177241, "epoch": 1464} {"train_loss": -39.12904357910156, "global_step": 177242, "epoch": 1464} {"train_loss": -38.88423156738281, "global_step": 177243, "epoch": 1464} {"train_loss": -40.5521354675293, "global_step": 177244, "epoch": 1464} {"train_loss": -38.845821380615234, "global_step": 177245, "epoch": 1464} {"train_loss": -39.784847259521484, "global_step": 177246, "epoch": 1464} {"train_loss": -39.51740646362305, "global_step": 177247, "epoch": 1464} {"train_loss": -40.581275939941406, "global_step": 177248, "epoch": 1464} {"train_loss": -39.602725982666016, "global_step": 177249, "epoch": 1464} {"train_loss": -40.533966064453125, "global_step": 177250, "epoch": 1464} {"train_loss": -38.780364990234375, "global_step": 177251, "epoch": 1464} {"train_loss": -40.22608947753906, "global_step": 177252, "epoch": 1464} {"train_loss": -41.00526809692383, "global_step": 177253, "epoch": 1464} {"train_loss": -39.93770980834961, "global_step": 177254, "epoch": 1464} {"train_loss": -40.61944580078125, "global_step": 177255, "epoch": 1464} {"train_loss": -40.654823303222656, "global_step": 177256, "epoch": 1464} {"train_loss": -40.68137741088867, "global_step": 177257, "epoch": 1464} {"train_loss": -40.67363739013672, "global_step": 177258, "epoch": 1464} {"train_loss": -40.88371276855469, "global_step": 177259, "epoch": 1464} {"train_loss": -40.288177490234375, "global_step": 177260, "epoch": 1464} {"train_loss": -40.949676513671875, "global_step": 177261, "epoch": 1464} {"train_loss": -40.77211380004883, "global_step": 177262, "epoch": 1464} {"train_loss": -41.02328109741211, "global_step": 177263, "epoch": 1464} {"train_loss": -39.429269885228685, "global_step": 177264, "epoch": 1464, "val_loss": 2614988.75} {"train_loss": -40.9506950378418, "global_step": 177265, "epoch": 1465} {"train_loss": -40.448402404785156, "global_step": 177266, "epoch": 1465} {"train_loss": -38.35665512084961, "global_step": 177267, "epoch": 1465} {"train_loss": -38.994205474853516, "global_step": 177268, "epoch": 1465} {"train_loss": -40.72205352783203, "global_step": 177269, "epoch": 1465} {"train_loss": -40.71619415283203, "global_step": 177270, "epoch": 1465} {"train_loss": -40.69771957397461, "global_step": 177271, "epoch": 1465} {"train_loss": -41.34284210205078, "global_step": 177272, "epoch": 1465} {"train_loss": -40.90814208984375, "global_step": 177273, "epoch": 1465} {"train_loss": -40.42842102050781, "global_step": 177274, "epoch": 1465} {"train_loss": -40.9347038269043, "global_step": 177275, "epoch": 1465} {"train_loss": -40.77717208862305, "global_step": 177276, "epoch": 1465} {"train_loss": -38.43158721923828, "global_step": 177277, "epoch": 1465} {"train_loss": -41.02823257446289, "global_step": 177278, "epoch": 1465} {"train_loss": -41.21876525878906, "global_step": 177279, "epoch": 1465} {"train_loss": -41.26749038696289, "global_step": 177280, "epoch": 1465} {"train_loss": -40.13795471191406, "global_step": 177281, "epoch": 1465} {"train_loss": -41.51945877075195, "global_step": 177282, "epoch": 1465} {"train_loss": -41.07430648803711, "global_step": 177283, "epoch": 1465} {"train_loss": -40.494285583496094, "global_step": 177284, "epoch": 1465} {"train_loss": -41.2923469543457, "global_step": 177285, "epoch": 1465} {"train_loss": -39.98966598510742, "global_step": 177286, "epoch": 1465} {"train_loss": -40.821292877197266, "global_step": 177287, "epoch": 1465} {"train_loss": -39.20697784423828, "global_step": 177288, "epoch": 1465} {"train_loss": -41.56390380859375, "global_step": 177289, "epoch": 1465} {"train_loss": -41.159908294677734, "global_step": 177290, "epoch": 1465} {"train_loss": -41.25260543823242, "global_step": 177291, "epoch": 1465} {"train_loss": -38.59782791137695, "global_step": 177292, "epoch": 1465} {"train_loss": -40.2281379699707, "global_step": 177293, "epoch": 1465} {"train_loss": -39.676204681396484, "global_step": 177294, "epoch": 1465} {"train_loss": -38.64760971069336, "global_step": 177295, "epoch": 1465} {"train_loss": -36.85521697998047, "global_step": 177296, "epoch": 1465} {"train_loss": -37.86320114135742, "global_step": 177297, "epoch": 1465} {"train_loss": -36.97623062133789, "global_step": 177298, "epoch": 1465} {"train_loss": -35.71361541748047, "global_step": 177299, "epoch": 1465} {"train_loss": -36.93195343017578, "global_step": 177300, "epoch": 1465} {"train_loss": -39.797237396240234, "global_step": 177301, "epoch": 1465} {"train_loss": -36.483131408691406, "global_step": 177302, "epoch": 1465} {"train_loss": -37.35986328125, "global_step": 177303, "epoch": 1465} {"train_loss": -40.25399398803711, "global_step": 177304, "epoch": 1465} {"train_loss": -40.07685470581055, "global_step": 177305, "epoch": 1465} {"train_loss": -38.40194320678711, "global_step": 177306, "epoch": 1465} {"train_loss": -39.54507064819336, "global_step": 177307, "epoch": 1465} {"train_loss": -40.24103546142578, "global_step": 177308, "epoch": 1465} {"train_loss": -37.80320358276367, "global_step": 177309, "epoch": 1465} {"train_loss": -37.43846893310547, "global_step": 177310, "epoch": 1465} {"train_loss": -38.764862060546875, "global_step": 177311, "epoch": 1465} {"train_loss": -38.340572357177734, "global_step": 177312, "epoch": 1465} {"train_loss": -40.540157318115234, "global_step": 177313, "epoch": 1465} {"train_loss": -35.79920196533203, "global_step": 177314, "epoch": 1465} {"train_loss": -39.668975830078125, "global_step": 177315, "epoch": 1465} {"train_loss": -40.66033172607422, "global_step": 177316, "epoch": 1465} {"train_loss": -40.43608093261719, "global_step": 177317, "epoch": 1465} {"train_loss": -40.605712890625, "global_step": 177318, "epoch": 1465} {"train_loss": -38.80475997924805, "global_step": 177319, "epoch": 1465} {"train_loss": -39.61497497558594, "global_step": 177320, "epoch": 1465} {"train_loss": -40.085723876953125, "global_step": 177321, "epoch": 1465} {"train_loss": -40.601680755615234, "global_step": 177322, "epoch": 1465} {"train_loss": -38.59553146362305, "global_step": 177323, "epoch": 1465} {"train_loss": -36.7635498046875, "global_step": 177324, "epoch": 1465} {"train_loss": -38.03499221801758, "global_step": 177325, "epoch": 1465} {"train_loss": -39.895057678222656, "global_step": 177326, "epoch": 1465} {"train_loss": -39.7591438293457, "global_step": 177327, "epoch": 1465} {"train_loss": -36.93266296386719, "global_step": 177328, "epoch": 1465} {"train_loss": -40.114288330078125, "global_step": 177329, "epoch": 1465} {"train_loss": -38.61116409301758, "global_step": 177330, "epoch": 1465} {"train_loss": -39.6456298828125, "global_step": 177331, "epoch": 1465} {"train_loss": -39.27277755737305, "global_step": 177332, "epoch": 1465} {"train_loss": -39.589595794677734, "global_step": 177333, "epoch": 1465} {"train_loss": -35.11505126953125, "global_step": 177334, "epoch": 1465} {"train_loss": -40.3145866394043, "global_step": 177335, "epoch": 1465} {"train_loss": -40.265350341796875, "global_step": 177336, "epoch": 1465} {"train_loss": -39.47858428955078, "global_step": 177337, "epoch": 1465} {"train_loss": -40.236331939697266, "global_step": 177338, "epoch": 1465} {"train_loss": -36.81244659423828, "global_step": 177339, "epoch": 1465} {"train_loss": -39.4002685546875, "global_step": 177340, "epoch": 1465} {"train_loss": -39.4867057800293, "global_step": 177341, "epoch": 1465} {"train_loss": -38.31208038330078, "global_step": 177342, "epoch": 1465} {"train_loss": -38.97724533081055, "global_step": 177343, "epoch": 1465} {"train_loss": -40.12758255004883, "global_step": 177344, "epoch": 1465} {"train_loss": -39.712745666503906, "global_step": 177345, "epoch": 1465} {"train_loss": -40.85698699951172, "global_step": 177346, "epoch": 1465} {"train_loss": -39.947444915771484, "global_step": 177347, "epoch": 1465} {"train_loss": -39.038082122802734, "global_step": 177348, "epoch": 1465} {"train_loss": -39.25917053222656, "global_step": 177349, "epoch": 1465} {"train_loss": -40.23179244995117, "global_step": 177350, "epoch": 1465} {"train_loss": -40.725948333740234, "global_step": 177351, "epoch": 1465} {"train_loss": -39.73095703125, "global_step": 177352, "epoch": 1465} {"train_loss": -40.31466293334961, "global_step": 177353, "epoch": 1465} {"train_loss": -39.30654525756836, "global_step": 177354, "epoch": 1465} {"train_loss": -40.27778244018555, "global_step": 177355, "epoch": 1465} {"train_loss": -38.73789596557617, "global_step": 177356, "epoch": 1465} {"train_loss": -39.25620651245117, "global_step": 177357, "epoch": 1465} {"train_loss": -41.1290397644043, "global_step": 177358, "epoch": 1465} {"train_loss": -40.37889099121094, "global_step": 177359, "epoch": 1465} {"train_loss": -39.42293930053711, "global_step": 177360, "epoch": 1465} {"train_loss": -40.090904235839844, "global_step": 177361, "epoch": 1465} {"train_loss": -40.54122543334961, "global_step": 177362, "epoch": 1465} {"train_loss": -40.19443130493164, "global_step": 177363, "epoch": 1465} {"train_loss": -40.5224494934082, "global_step": 177364, "epoch": 1465} {"train_loss": -39.407623291015625, "global_step": 177365, "epoch": 1465} {"train_loss": -37.847564697265625, "global_step": 177366, "epoch": 1465} {"train_loss": -41.032833099365234, "global_step": 177367, "epoch": 1465} {"train_loss": -40.41176986694336, "global_step": 177368, "epoch": 1465} {"train_loss": -40.22750473022461, "global_step": 177369, "epoch": 1465} {"train_loss": -40.702239990234375, "global_step": 177370, "epoch": 1465} {"train_loss": -40.61560821533203, "global_step": 177371, "epoch": 1465} {"train_loss": -40.41606903076172, "global_step": 177372, "epoch": 1465} {"train_loss": -41.12117385864258, "global_step": 177373, "epoch": 1465} {"train_loss": -40.730812072753906, "global_step": 177374, "epoch": 1465} {"train_loss": -40.7710075378418, "global_step": 177375, "epoch": 1465} {"train_loss": -40.90983581542969, "global_step": 177376, "epoch": 1465} {"train_loss": -39.471099853515625, "global_step": 177377, "epoch": 1465} {"train_loss": -39.974884033203125, "global_step": 177378, "epoch": 1465} {"train_loss": -40.58823013305664, "global_step": 177379, "epoch": 1465} {"train_loss": -40.74525833129883, "global_step": 177380, "epoch": 1465} {"train_loss": -40.45864486694336, "global_step": 177381, "epoch": 1465} {"train_loss": -40.034027099609375, "global_step": 177382, "epoch": 1465} {"train_loss": -39.85691452026367, "global_step": 177383, "epoch": 1465} {"train_loss": -40.57129669189453, "global_step": 177384, "epoch": 1465} {"train_loss": -39.676880923184484, "global_step": 177385, "epoch": 1465, "val_loss": 2629259.75} {"train_loss": -40.8828125, "global_step": 177386, "epoch": 1466} {"train_loss": -40.572906494140625, "global_step": 177387, "epoch": 1466} {"train_loss": -40.60426712036133, "global_step": 177388, "epoch": 1466} {"train_loss": -41.07746505737305, "global_step": 177389, "epoch": 1466} {"train_loss": -40.24319839477539, "global_step": 177390, "epoch": 1466} {"train_loss": -40.82309341430664, "global_step": 177391, "epoch": 1466} {"train_loss": -40.34070587158203, "global_step": 177392, "epoch": 1466} {"train_loss": -40.204261779785156, "global_step": 177393, "epoch": 1466} {"train_loss": -40.60213088989258, "global_step": 177394, "epoch": 1466} {"train_loss": -41.094688415527344, "global_step": 177395, "epoch": 1466} {"train_loss": -38.131805419921875, "global_step": 177396, "epoch": 1466} {"train_loss": -41.1644172668457, "global_step": 177397, "epoch": 1466} {"train_loss": -40.050174713134766, "global_step": 177398, "epoch": 1466} {"train_loss": -40.999385833740234, "global_step": 177399, "epoch": 1466} {"train_loss": -39.5612678527832, "global_step": 177400, "epoch": 1466} {"train_loss": -40.82830810546875, "global_step": 177401, "epoch": 1466} {"train_loss": -40.21516799926758, "global_step": 177402, "epoch": 1466} {"train_loss": -40.5916633605957, "global_step": 177403, "epoch": 1466} {"train_loss": -39.108428955078125, "global_step": 177404, "epoch": 1466} {"train_loss": -41.219825744628906, "global_step": 177405, "epoch": 1466} {"train_loss": -39.982845306396484, "global_step": 177406, "epoch": 1466} {"train_loss": -40.70766830444336, "global_step": 177407, "epoch": 1466} {"train_loss": -40.981475830078125, "global_step": 177408, "epoch": 1466} {"train_loss": -40.8269157409668, "global_step": 177409, "epoch": 1466} {"train_loss": -40.573516845703125, "global_step": 177410, "epoch": 1466} {"train_loss": -40.168846130371094, "global_step": 177411, "epoch": 1466} {"train_loss": -39.78818893432617, "global_step": 177412, "epoch": 1466} {"train_loss": -40.5604133605957, "global_step": 177413, "epoch": 1466} {"train_loss": -40.88348388671875, "global_step": 177414, "epoch": 1466} {"train_loss": -40.60293197631836, "global_step": 177415, "epoch": 1466} {"train_loss": -40.766387939453125, "global_step": 177416, "epoch": 1466} {"train_loss": -39.9995231628418, "global_step": 177417, "epoch": 1466} {"train_loss": -38.20116424560547, "global_step": 177418, "epoch": 1466} {"train_loss": -39.745235443115234, "global_step": 177419, "epoch": 1466} {"train_loss": -40.10007858276367, "global_step": 177420, "epoch": 1466} {"train_loss": -39.454383850097656, "global_step": 177421, "epoch": 1466} {"train_loss": -40.796302795410156, "global_step": 177422, "epoch": 1466} {"train_loss": -37.73226547241211, "global_step": 177423, "epoch": 1466} {"train_loss": -39.41972732543945, "global_step": 177424, "epoch": 1466} {"train_loss": -38.74613571166992, "global_step": 177425, "epoch": 1466} {"train_loss": -39.178340911865234, "global_step": 177426, "epoch": 1466} {"train_loss": -40.15623092651367, "global_step": 177427, "epoch": 1466} {"train_loss": -40.97567367553711, "global_step": 177428, "epoch": 1466} {"train_loss": -38.35740280151367, "global_step": 177429, "epoch": 1466} {"train_loss": -39.828060150146484, "global_step": 177430, "epoch": 1466} {"train_loss": -40.075523376464844, "global_step": 177431, "epoch": 1466} {"train_loss": -40.754783630371094, "global_step": 177432, "epoch": 1466} {"train_loss": -40.91236114501953, "global_step": 177433, "epoch": 1466} {"train_loss": -39.94422149658203, "global_step": 177434, "epoch": 1466} {"train_loss": -40.81500244140625, "global_step": 177435, "epoch": 1466} {"train_loss": -40.276180267333984, "global_step": 177436, "epoch": 1466} {"train_loss": -39.15058898925781, "global_step": 177437, "epoch": 1466} {"train_loss": -40.67294692993164, "global_step": 177438, "epoch": 1466} {"train_loss": -41.15707015991211, "global_step": 177439, "epoch": 1466} {"train_loss": -41.08216094970703, "global_step": 177440, "epoch": 1466} {"train_loss": -40.83597946166992, "global_step": 177441, "epoch": 1466} {"train_loss": -40.662147521972656, "global_step": 177442, "epoch": 1466} {"train_loss": -39.629676818847656, "global_step": 177443, "epoch": 1466} {"train_loss": -40.66230010986328, "global_step": 177444, "epoch": 1466} {"train_loss": -40.72501754760742, "global_step": 177445, "epoch": 1466} {"train_loss": -40.42591857910156, "global_step": 177446, "epoch": 1466} {"train_loss": -40.5078010559082, "global_step": 177447, "epoch": 1466} {"train_loss": -40.63081741333008, "global_step": 177448, "epoch": 1466} {"train_loss": -41.098724365234375, "global_step": 177449, "epoch": 1466} {"train_loss": -40.63007736206055, "global_step": 177450, "epoch": 1466} {"train_loss": -41.0385627746582, "global_step": 177451, "epoch": 1466} {"train_loss": -40.87895965576172, "global_step": 177452, "epoch": 1466} {"train_loss": -40.94325256347656, "global_step": 177453, "epoch": 1466} {"train_loss": -41.692230224609375, "global_step": 177454, "epoch": 1466} {"train_loss": -40.98575973510742, "global_step": 177455, "epoch": 1466} {"train_loss": -41.07075119018555, "global_step": 177456, "epoch": 1466} {"train_loss": -40.82835006713867, "global_step": 177457, "epoch": 1466} {"train_loss": -41.08953094482422, "global_step": 177458, "epoch": 1466} {"train_loss": -41.181941986083984, "global_step": 177459, "epoch": 1466} {"train_loss": -40.28295135498047, "global_step": 177460, "epoch": 1466} {"train_loss": -39.54128646850586, "global_step": 177461, "epoch": 1466} {"train_loss": -40.70227813720703, "global_step": 177462, "epoch": 1466} {"train_loss": -41.53770065307617, "global_step": 177463, "epoch": 1466} {"train_loss": -40.0564079284668, "global_step": 177464, "epoch": 1466} {"train_loss": -37.03677749633789, "global_step": 177465, "epoch": 1466} {"train_loss": -36.19454574584961, "global_step": 177466, "epoch": 1466} {"train_loss": -39.839656829833984, "global_step": 177467, "epoch": 1466} {"train_loss": -41.05176544189453, "global_step": 177468, "epoch": 1466} {"train_loss": -40.307228088378906, "global_step": 177469, "epoch": 1466} {"train_loss": -40.308815002441406, "global_step": 177470, "epoch": 1466} {"train_loss": -41.0015983581543, "global_step": 177471, "epoch": 1466} {"train_loss": -40.26707458496094, "global_step": 177472, "epoch": 1466} {"train_loss": -41.16270065307617, "global_step": 177473, "epoch": 1466} {"train_loss": -41.006591796875, "global_step": 177474, "epoch": 1466} {"train_loss": -41.17473602294922, "global_step": 177475, "epoch": 1466} {"train_loss": -40.777862548828125, "global_step": 177476, "epoch": 1466} {"train_loss": -39.78075408935547, "global_step": 177477, "epoch": 1466} {"train_loss": -40.749237060546875, "global_step": 177478, "epoch": 1466} {"train_loss": -40.609127044677734, "global_step": 177479, "epoch": 1466} {"train_loss": -41.1379508972168, "global_step": 177480, "epoch": 1466} {"train_loss": -40.6619873046875, "global_step": 177481, "epoch": 1466} {"train_loss": -40.30230712890625, "global_step": 177482, "epoch": 1466} {"train_loss": -41.307395935058594, "global_step": 177483, "epoch": 1466} {"train_loss": -41.11619186401367, "global_step": 177484, "epoch": 1466} {"train_loss": -40.16954803466797, "global_step": 177485, "epoch": 1466} {"train_loss": -38.63894271850586, "global_step": 177486, "epoch": 1466} {"train_loss": -39.444637298583984, "global_step": 177487, "epoch": 1466} {"train_loss": -39.92836380004883, "global_step": 177488, "epoch": 1466} {"train_loss": -39.89352035522461, "global_step": 177489, "epoch": 1466} {"train_loss": -39.47340774536133, "global_step": 177490, "epoch": 1466} {"train_loss": -39.43294906616211, "global_step": 177491, "epoch": 1466} {"train_loss": -39.093719482421875, "global_step": 177492, "epoch": 1466} {"train_loss": -38.78452682495117, "global_step": 177493, "epoch": 1466} {"train_loss": -40.52033233642578, "global_step": 177494, "epoch": 1466} {"train_loss": -39.306209564208984, "global_step": 177495, "epoch": 1466} {"train_loss": -40.30027389526367, "global_step": 177496, "epoch": 1466} {"train_loss": -41.34524154663086, "global_step": 177497, "epoch": 1466} {"train_loss": -41.52962112426758, "global_step": 177498, "epoch": 1466} {"train_loss": -41.190364837646484, "global_step": 177499, "epoch": 1466} {"train_loss": -40.57011795043945, "global_step": 177500, "epoch": 1466} {"train_loss": -41.45318603515625, "global_step": 177501, "epoch": 1466} {"train_loss": -41.22211837768555, "global_step": 177502, "epoch": 1466} {"train_loss": -41.34507369995117, "global_step": 177503, "epoch": 1466} {"train_loss": -41.02836990356445, "global_step": 177504, "epoch": 1466} {"train_loss": -41.864986419677734, "global_step": 177505, "epoch": 1466} {"train_loss": -40.35904558039894, "global_step": 177506, "epoch": 1466, "val_loss": 2814582.0} {"train_loss": -41.725830078125, "global_step": 177507, "epoch": 1467} {"train_loss": -41.334407806396484, "global_step": 177508, "epoch": 1467} {"train_loss": -41.65410232543945, "global_step": 177509, "epoch": 1467} {"train_loss": -41.88572311401367, "global_step": 177510, "epoch": 1467} {"train_loss": -41.440467834472656, "global_step": 177511, "epoch": 1467} {"train_loss": -41.19036865234375, "global_step": 177512, "epoch": 1467} {"train_loss": -41.49977493286133, "global_step": 177513, "epoch": 1467} {"train_loss": -41.797157287597656, "global_step": 177514, "epoch": 1467} {"train_loss": -40.47259521484375, "global_step": 177515, "epoch": 1467} {"train_loss": -41.73794174194336, "global_step": 177516, "epoch": 1467} {"train_loss": -41.05559158325195, "global_step": 177517, "epoch": 1467} {"train_loss": -40.65116882324219, "global_step": 177518, "epoch": 1467} {"train_loss": -41.357276916503906, "global_step": 177519, "epoch": 1467} {"train_loss": -41.660377502441406, "global_step": 177520, "epoch": 1467} {"train_loss": -41.2835693359375, "global_step": 177521, "epoch": 1467} {"train_loss": -41.61527633666992, "global_step": 177522, "epoch": 1467} {"train_loss": -40.781715393066406, "global_step": 177523, "epoch": 1467} {"train_loss": -41.44762420654297, "global_step": 177524, "epoch": 1467} {"train_loss": -40.59553146362305, "global_step": 177525, "epoch": 1467} {"train_loss": -41.79188919067383, "global_step": 177526, "epoch": 1467} {"train_loss": -41.29475402832031, "global_step": 177527, "epoch": 1467} {"train_loss": -41.3001594543457, "global_step": 177528, "epoch": 1467} {"train_loss": -41.87237548828125, "global_step": 177529, "epoch": 1467} {"train_loss": -40.94293975830078, "global_step": 177530, "epoch": 1467} {"train_loss": -41.92899703979492, "global_step": 177531, "epoch": 1467} {"train_loss": -41.14597702026367, "global_step": 177532, "epoch": 1467} {"train_loss": -40.939632415771484, "global_step": 177533, "epoch": 1467} {"train_loss": -39.815547943115234, "global_step": 177534, "epoch": 1467} {"train_loss": -40.45144271850586, "global_step": 177535, "epoch": 1467} {"train_loss": -41.39866256713867, "global_step": 177536, "epoch": 1467} {"train_loss": -41.68951416015625, "global_step": 177537, "epoch": 1467} {"train_loss": -40.03676986694336, "global_step": 177538, "epoch": 1467} {"train_loss": -38.7622184753418, "global_step": 177539, "epoch": 1467} {"train_loss": -37.620628356933594, "global_step": 177540, "epoch": 1467} {"train_loss": -38.7704963684082, "global_step": 177541, "epoch": 1467} {"train_loss": -37.16615676879883, "global_step": 177542, "epoch": 1467} {"train_loss": -37.88075637817383, "global_step": 177543, "epoch": 1467} {"train_loss": -39.86890411376953, "global_step": 177544, "epoch": 1467} {"train_loss": -40.26590347290039, "global_step": 177545, "epoch": 1467} {"train_loss": -37.65583038330078, "global_step": 177546, "epoch": 1467} {"train_loss": -32.06012725830078, "global_step": 177547, "epoch": 1467} {"train_loss": -30.1148681640625, "global_step": 177548, "epoch": 1467} {"train_loss": -38.506126403808594, "global_step": 177549, "epoch": 1467} {"train_loss": -37.349979400634766, "global_step": 177550, "epoch": 1467} {"train_loss": -32.17794418334961, "global_step": 177551, "epoch": 1467} {"train_loss": -38.295326232910156, "global_step": 177552, "epoch": 1467} {"train_loss": -36.57210159301758, "global_step": 177553, "epoch": 1467} {"train_loss": -34.418270111083984, "global_step": 177554, "epoch": 1467} {"train_loss": -39.85859680175781, "global_step": 177555, "epoch": 1467} {"train_loss": -33.63676834106445, "global_step": 177556, "epoch": 1467} {"train_loss": -39.56988525390625, "global_step": 177557, "epoch": 1467} {"train_loss": -36.689537048339844, "global_step": 177558, "epoch": 1467} {"train_loss": -40.896705627441406, "global_step": 177559, "epoch": 1467} {"train_loss": -37.971351623535156, "global_step": 177560, "epoch": 1467} {"train_loss": -40.563716888427734, "global_step": 177561, "epoch": 1467} {"train_loss": -38.73619842529297, "global_step": 177562, "epoch": 1467} {"train_loss": -40.55430221557617, "global_step": 177563, "epoch": 1467} {"train_loss": -39.322853088378906, "global_step": 177564, "epoch": 1467} {"train_loss": -40.10554885864258, "global_step": 177565, "epoch": 1467} {"train_loss": -40.502662658691406, "global_step": 177566, "epoch": 1467} {"train_loss": -39.26861572265625, "global_step": 177567, "epoch": 1467} {"train_loss": -40.65574264526367, "global_step": 177568, "epoch": 1467} {"train_loss": -39.829891204833984, "global_step": 177569, "epoch": 1467} {"train_loss": -40.20453643798828, "global_step": 177570, "epoch": 1467} {"train_loss": -40.27692413330078, "global_step": 177571, "epoch": 1467} {"train_loss": -39.94865798950195, "global_step": 177572, "epoch": 1467} {"train_loss": -40.9537467956543, "global_step": 177573, "epoch": 1467} {"train_loss": -40.0943489074707, "global_step": 177574, "epoch": 1467} {"train_loss": -40.53217697143555, "global_step": 177575, "epoch": 1467} {"train_loss": -40.74430847167969, "global_step": 177576, "epoch": 1467} {"train_loss": -39.923255920410156, "global_step": 177577, "epoch": 1467} {"train_loss": -40.83349609375, "global_step": 177578, "epoch": 1467} {"train_loss": -40.80610275268555, "global_step": 177579, "epoch": 1467} {"train_loss": -40.82635498046875, "global_step": 177580, "epoch": 1467} {"train_loss": -41.119991302490234, "global_step": 177581, "epoch": 1467} {"train_loss": -40.99325180053711, "global_step": 177582, "epoch": 1467} {"train_loss": -41.127716064453125, "global_step": 177583, "epoch": 1467} {"train_loss": -40.910255432128906, "global_step": 177584, "epoch": 1467} {"train_loss": -40.79412841796875, "global_step": 177585, "epoch": 1467} {"train_loss": -41.34934997558594, "global_step": 177586, "epoch": 1467} {"train_loss": -40.939090728759766, "global_step": 177587, "epoch": 1467} {"train_loss": -41.34804916381836, "global_step": 177588, "epoch": 1467} {"train_loss": -41.117393493652344, "global_step": 177589, "epoch": 1467} {"train_loss": -41.43129348754883, "global_step": 177590, "epoch": 1467} {"train_loss": -40.96953201293945, "global_step": 177591, "epoch": 1467} {"train_loss": -40.843536376953125, "global_step": 177592, "epoch": 1467} {"train_loss": -40.7286491394043, "global_step": 177593, "epoch": 1467} {"train_loss": -41.50209045410156, "global_step": 177594, "epoch": 1467} {"train_loss": -40.668678283691406, "global_step": 177595, "epoch": 1467} {"train_loss": -40.98643112182617, "global_step": 177596, "epoch": 1467} {"train_loss": -41.43291091918945, "global_step": 177597, "epoch": 1467} {"train_loss": -40.83573532104492, "global_step": 177598, "epoch": 1467} {"train_loss": -40.50025177001953, "global_step": 177599, "epoch": 1467} {"train_loss": -39.22231674194336, "global_step": 177600, "epoch": 1467} {"train_loss": -40.5598258972168, "global_step": 177601, "epoch": 1467} {"train_loss": -39.868404388427734, "global_step": 177602, "epoch": 1467} {"train_loss": -41.544734954833984, "global_step": 177603, "epoch": 1467} {"train_loss": -40.927955627441406, "global_step": 177604, "epoch": 1467} {"train_loss": -38.130775451660156, "global_step": 177605, "epoch": 1467} {"train_loss": -40.22407150268555, "global_step": 177606, "epoch": 1467} {"train_loss": -40.265933990478516, "global_step": 177607, "epoch": 1467} {"train_loss": -40.5414924621582, "global_step": 177608, "epoch": 1467} {"train_loss": -38.622711181640625, "global_step": 177609, "epoch": 1467} {"train_loss": -36.51005172729492, "global_step": 177610, "epoch": 1467} {"train_loss": -34.146697998046875, "global_step": 177611, "epoch": 1467} {"train_loss": -38.163116455078125, "global_step": 177612, "epoch": 1467} {"train_loss": -27.60906410217285, "global_step": 177613, "epoch": 1467} {"train_loss": -32.143611907958984, "global_step": 177614, "epoch": 1467} {"train_loss": -21.47791862487793, "global_step": 177615, "epoch": 1467} {"train_loss": -31.46759605407715, "global_step": 177616, "epoch": 1467} {"train_loss": -27.583654403686523, "global_step": 177617, "epoch": 1467} {"train_loss": -29.681127548217773, "global_step": 177618, "epoch": 1467} {"train_loss": -30.278512954711914, "global_step": 177619, "epoch": 1467} {"train_loss": -31.564672470092773, "global_step": 177620, "epoch": 1467} {"train_loss": -28.51657485961914, "global_step": 177621, "epoch": 1467} {"train_loss": -24.61172866821289, "global_step": 177622, "epoch": 1467} {"train_loss": -26.336029052734375, "global_step": 177623, "epoch": 1467} {"train_loss": -29.56500816345215, "global_step": 177624, "epoch": 1467} {"train_loss": -27.281545639038086, "global_step": 177625, "epoch": 1467} {"train_loss": -33.6745719909668, "global_step": 177626, "epoch": 1467} {"train_loss": -38.504412107231204, "global_step": 177627, "epoch": 1467, "val_loss": 2801347.0} {"train_loss": -33.969268798828125, "global_step": 177628, "epoch": 1468} {"train_loss": -29.251073837280273, "global_step": 177629, "epoch": 1468} {"train_loss": -32.568050384521484, "global_step": 177630, "epoch": 1468} {"train_loss": -33.67218017578125, "global_step": 177631, "epoch": 1468} {"train_loss": -32.450618743896484, "global_step": 177632, "epoch": 1468} {"train_loss": -31.853424072265625, "global_step": 177633, "epoch": 1468} {"train_loss": -30.088239669799805, "global_step": 177634, "epoch": 1468} {"train_loss": -34.773807525634766, "global_step": 177635, "epoch": 1468} {"train_loss": -33.60642623901367, "global_step": 177636, "epoch": 1468} {"train_loss": -34.2812385559082, "global_step": 177637, "epoch": 1468} {"train_loss": -34.50737762451172, "global_step": 177638, "epoch": 1468} {"train_loss": -34.36442947387695, "global_step": 177639, "epoch": 1468} {"train_loss": -36.86518478393555, "global_step": 177640, "epoch": 1468} {"train_loss": -34.229339599609375, "global_step": 177641, "epoch": 1468} {"train_loss": -35.01611328125, "global_step": 177642, "epoch": 1468} {"train_loss": -35.0179443359375, "global_step": 177643, "epoch": 1468} {"train_loss": -35.843929290771484, "global_step": 177644, "epoch": 1468} {"train_loss": -35.767086029052734, "global_step": 177645, "epoch": 1468} {"train_loss": -35.92639923095703, "global_step": 177646, "epoch": 1468} {"train_loss": -35.724422454833984, "global_step": 177647, "epoch": 1468} {"train_loss": -37.143585205078125, "global_step": 177648, "epoch": 1468} {"train_loss": -36.30528259277344, "global_step": 177649, "epoch": 1468} {"train_loss": -37.37859344482422, "global_step": 177650, "epoch": 1468} {"train_loss": -37.144596099853516, "global_step": 177651, "epoch": 1468} {"train_loss": -36.22419357299805, "global_step": 177652, "epoch": 1468} {"train_loss": -37.20603561401367, "global_step": 177653, "epoch": 1468} {"train_loss": -37.74870300292969, "global_step": 177654, "epoch": 1468} {"train_loss": -37.42776870727539, "global_step": 177655, "epoch": 1468} {"train_loss": -35.84950256347656, "global_step": 177656, "epoch": 1468} {"train_loss": -36.65543746948242, "global_step": 177657, "epoch": 1468} {"train_loss": -36.57716369628906, "global_step": 177658, "epoch": 1468} {"train_loss": -37.11670684814453, "global_step": 177659, "epoch": 1468} {"train_loss": -37.12892532348633, "global_step": 177660, "epoch": 1468} {"train_loss": -37.57982635498047, "global_step": 177661, "epoch": 1468} {"train_loss": -37.57161331176758, "global_step": 177662, "epoch": 1468} {"train_loss": -37.49871826171875, "global_step": 177663, "epoch": 1468} {"train_loss": -37.79692077636719, "global_step": 177664, "epoch": 1468} {"train_loss": -38.09283447265625, "global_step": 177665, "epoch": 1468} {"train_loss": -36.89427947998047, "global_step": 177666, "epoch": 1468} {"train_loss": -38.13887405395508, "global_step": 177667, "epoch": 1468} {"train_loss": -38.02583694458008, "global_step": 177668, "epoch": 1468} {"train_loss": -37.86756134033203, "global_step": 177669, "epoch": 1468} {"train_loss": -36.4776725769043, "global_step": 177670, "epoch": 1468} {"train_loss": -37.89239501953125, "global_step": 177671, "epoch": 1468} {"train_loss": -38.56432342529297, "global_step": 177672, "epoch": 1468} {"train_loss": -38.31398391723633, "global_step": 177673, "epoch": 1468} {"train_loss": -38.68455505371094, "global_step": 177674, "epoch": 1468} {"train_loss": -38.72101974487305, "global_step": 177675, "epoch": 1468} {"train_loss": -36.96731185913086, "global_step": 177676, "epoch": 1468} {"train_loss": -38.47903060913086, "global_step": 177677, "epoch": 1468} {"train_loss": -38.47026443481445, "global_step": 177678, "epoch": 1468} {"train_loss": -38.5168571472168, "global_step": 177679, "epoch": 1468} {"train_loss": -38.32748031616211, "global_step": 177680, "epoch": 1468} {"train_loss": -38.95498275756836, "global_step": 177681, "epoch": 1468} {"train_loss": -38.512916564941406, "global_step": 177682, "epoch": 1468} {"train_loss": -38.5419807434082, "global_step": 177683, "epoch": 1468} {"train_loss": -38.90894317626953, "global_step": 177684, "epoch": 1468} {"train_loss": -38.50704574584961, "global_step": 177685, "epoch": 1468} {"train_loss": -38.48796844482422, "global_step": 177686, "epoch": 1468} {"train_loss": -38.5815544128418, "global_step": 177687, "epoch": 1468} {"train_loss": -38.950435638427734, "global_step": 177688, "epoch": 1468} {"train_loss": -39.21712875366211, "global_step": 177689, "epoch": 1468} {"train_loss": -38.793922424316406, "global_step": 177690, "epoch": 1468} {"train_loss": -39.34299850463867, "global_step": 177691, "epoch": 1468} {"train_loss": -38.76628494262695, "global_step": 177692, "epoch": 1468} {"train_loss": -38.99077224731445, "global_step": 177693, "epoch": 1468} {"train_loss": -39.37489700317383, "global_step": 177694, "epoch": 1468} {"train_loss": -38.29103088378906, "global_step": 177695, "epoch": 1468} {"train_loss": -39.060359954833984, "global_step": 177696, "epoch": 1468} {"train_loss": -39.214698791503906, "global_step": 177697, "epoch": 1468} {"train_loss": -39.706912994384766, "global_step": 177698, "epoch": 1468} {"train_loss": -38.13975143432617, "global_step": 177699, "epoch": 1468} {"train_loss": -39.766361236572266, "global_step": 177700, "epoch": 1468} {"train_loss": -39.080604553222656, "global_step": 177701, "epoch": 1468} {"train_loss": -38.83224105834961, "global_step": 177702, "epoch": 1468} {"train_loss": -39.306758880615234, "global_step": 177703, "epoch": 1468} {"train_loss": -39.25972366333008, "global_step": 177704, "epoch": 1468} {"train_loss": -39.24093246459961, "global_step": 177705, "epoch": 1468} {"train_loss": -38.821571350097656, "global_step": 177706, "epoch": 1468} {"train_loss": -39.698829650878906, "global_step": 177707, "epoch": 1468} {"train_loss": -39.591033935546875, "global_step": 177708, "epoch": 1468} {"train_loss": -39.49222183227539, "global_step": 177709, "epoch": 1468} {"train_loss": -39.9835319519043, "global_step": 177710, "epoch": 1468} {"train_loss": -39.67958450317383, "global_step": 177711, "epoch": 1468} {"train_loss": -39.11994171142578, "global_step": 177712, "epoch": 1468} {"train_loss": -39.430198669433594, "global_step": 177713, "epoch": 1468} {"train_loss": -39.46333694458008, "global_step": 177714, "epoch": 1468} {"train_loss": -39.71438217163086, "global_step": 177715, "epoch": 1468} {"train_loss": -39.89520263671875, "global_step": 177716, "epoch": 1468} {"train_loss": -38.97119903564453, "global_step": 177717, "epoch": 1468} {"train_loss": -39.56585693359375, "global_step": 177718, "epoch": 1468} {"train_loss": -40.08414840698242, "global_step": 177719, "epoch": 1468} {"train_loss": -40.24298858642578, "global_step": 177720, "epoch": 1468} {"train_loss": -39.959136962890625, "global_step": 177721, "epoch": 1468} {"train_loss": -40.1620979309082, "global_step": 177722, "epoch": 1468} {"train_loss": -39.8963508605957, "global_step": 177723, "epoch": 1468} {"train_loss": -40.43560791015625, "global_step": 177724, "epoch": 1468} {"train_loss": -39.73940658569336, "global_step": 177725, "epoch": 1468} {"train_loss": -39.82640838623047, "global_step": 177726, "epoch": 1468} {"train_loss": -40.27339553833008, "global_step": 177727, "epoch": 1468} {"train_loss": -40.104103088378906, "global_step": 177728, "epoch": 1468} {"train_loss": -40.24067306518555, "global_step": 177729, "epoch": 1468} {"train_loss": -40.38448715209961, "global_step": 177730, "epoch": 1468} {"train_loss": -40.384586334228516, "global_step": 177731, "epoch": 1468} {"train_loss": -40.74068832397461, "global_step": 177732, "epoch": 1468} {"train_loss": -40.05010986328125, "global_step": 177733, "epoch": 1468} {"train_loss": -40.43467330932617, "global_step": 177734, "epoch": 1468} {"train_loss": -39.971736907958984, "global_step": 177735, "epoch": 1468} {"train_loss": -39.736915588378906, "global_step": 177736, "epoch": 1468} {"train_loss": -39.7319450378418, "global_step": 177737, "epoch": 1468} {"train_loss": -40.42771911621094, "global_step": 177738, "epoch": 1468} {"train_loss": -40.46559524536133, "global_step": 177739, "epoch": 1468} {"train_loss": -40.12092208862305, "global_step": 177740, "epoch": 1468} {"train_loss": -39.91162109375, "global_step": 177741, "epoch": 1468} {"train_loss": -40.83382034301758, "global_step": 177742, "epoch": 1468} {"train_loss": -40.82936477661133, "global_step": 177743, "epoch": 1468} {"train_loss": -40.30675506591797, "global_step": 177744, "epoch": 1468} {"train_loss": -39.50712203979492, "global_step": 177745, "epoch": 1468} {"train_loss": -40.8548469543457, "global_step": 177746, "epoch": 1468} {"train_loss": -40.298744201660156, "global_step": 177747, "epoch": 1468} {"train_loss": -38.1189497325046, "global_step": 177748, "epoch": 1468, "val_loss": 2600842.0} {"train_loss": -39.942901611328125, "global_step": 177749, "epoch": 1469} {"train_loss": -38.52866744995117, "global_step": 177750, "epoch": 1469} {"train_loss": -39.234107971191406, "global_step": 177751, "epoch": 1469} {"train_loss": -39.549400329589844, "global_step": 177752, "epoch": 1469} {"train_loss": -40.22208786010742, "global_step": 177753, "epoch": 1469} {"train_loss": -40.300682067871094, "global_step": 177754, "epoch": 1469} {"train_loss": -40.471710205078125, "global_step": 177755, "epoch": 1469} {"train_loss": -40.47072982788086, "global_step": 177756, "epoch": 1469} {"train_loss": -39.96095657348633, "global_step": 177757, "epoch": 1469} {"train_loss": -40.32651901245117, "global_step": 177758, "epoch": 1469} {"train_loss": -39.812294006347656, "global_step": 177759, "epoch": 1469} {"train_loss": -40.46649169921875, "global_step": 177760, "epoch": 1469} {"train_loss": -40.3640251159668, "global_step": 177761, "epoch": 1469} {"train_loss": -39.421356201171875, "global_step": 177762, "epoch": 1469} {"train_loss": -40.00978469848633, "global_step": 177763, "epoch": 1469} {"train_loss": -39.3022575378418, "global_step": 177764, "epoch": 1469} {"train_loss": -38.23624801635742, "global_step": 177765, "epoch": 1469} {"train_loss": -39.7492561340332, "global_step": 177766, "epoch": 1469} {"train_loss": -38.94386672973633, "global_step": 177767, "epoch": 1469} {"train_loss": -37.445220947265625, "global_step": 177768, "epoch": 1469} {"train_loss": -37.50790023803711, "global_step": 177769, "epoch": 1469} {"train_loss": -37.856990814208984, "global_step": 177770, "epoch": 1469} {"train_loss": -38.6855354309082, "global_step": 177771, "epoch": 1469} {"train_loss": -40.3207893371582, "global_step": 177772, "epoch": 1469} {"train_loss": -38.419395446777344, "global_step": 177773, "epoch": 1469} {"train_loss": -37.43964767456055, "global_step": 177774, "epoch": 1469} {"train_loss": -38.506229400634766, "global_step": 177775, "epoch": 1469} {"train_loss": -40.05526351928711, "global_step": 177776, "epoch": 1469} {"train_loss": -36.850257873535156, "global_step": 177777, "epoch": 1469} {"train_loss": -38.472686767578125, "global_step": 177778, "epoch": 1469} {"train_loss": -40.334320068359375, "global_step": 177779, "epoch": 1469} {"train_loss": -35.90517044067383, "global_step": 177780, "epoch": 1469} {"train_loss": -36.76237869262695, "global_step": 177781, "epoch": 1469} {"train_loss": -39.01401901245117, "global_step": 177782, "epoch": 1469} {"train_loss": -36.9930305480957, "global_step": 177783, "epoch": 1469} {"train_loss": -38.25896072387695, "global_step": 177784, "epoch": 1469} {"train_loss": -38.82637405395508, "global_step": 177785, "epoch": 1469} {"train_loss": -39.20650863647461, "global_step": 177786, "epoch": 1469} {"train_loss": -39.06167221069336, "global_step": 177787, "epoch": 1469} {"train_loss": -39.1077995300293, "global_step": 177788, "epoch": 1469} {"train_loss": -39.85150146484375, "global_step": 177789, "epoch": 1469} {"train_loss": -39.034175872802734, "global_step": 177790, "epoch": 1469} {"train_loss": -40.021461486816406, "global_step": 177791, "epoch": 1469} {"train_loss": -37.38328170776367, "global_step": 177792, "epoch": 1469} {"train_loss": -39.930477142333984, "global_step": 177793, "epoch": 1469} {"train_loss": -40.47477722167969, "global_step": 177794, "epoch": 1469} {"train_loss": -39.9212646484375, "global_step": 177795, "epoch": 1469} {"train_loss": -40.213623046875, "global_step": 177796, "epoch": 1469} {"train_loss": -40.52314758300781, "global_step": 177797, "epoch": 1469} {"train_loss": -39.680606842041016, "global_step": 177798, "epoch": 1469} {"train_loss": -40.233367919921875, "global_step": 177799, "epoch": 1469} {"train_loss": -40.19961166381836, "global_step": 177800, "epoch": 1469} {"train_loss": -40.06758499145508, "global_step": 177801, "epoch": 1469} {"train_loss": -40.6389045715332, "global_step": 177802, "epoch": 1469} {"train_loss": -40.504207611083984, "global_step": 177803, "epoch": 1469} {"train_loss": -40.506996154785156, "global_step": 177804, "epoch": 1469} {"train_loss": -39.552310943603516, "global_step": 177805, "epoch": 1469} {"train_loss": -40.58222579956055, "global_step": 177806, "epoch": 1469} {"train_loss": -40.920989990234375, "global_step": 177807, "epoch": 1469} {"train_loss": -40.88071823120117, "global_step": 177808, "epoch": 1469} {"train_loss": -40.71753692626953, "global_step": 177809, "epoch": 1469} {"train_loss": -41.01081466674805, "global_step": 177810, "epoch": 1469} {"train_loss": -40.953365325927734, "global_step": 177811, "epoch": 1469} {"train_loss": -41.123260498046875, "global_step": 177812, "epoch": 1469} {"train_loss": -40.85425567626953, "global_step": 177813, "epoch": 1469} {"train_loss": -40.89085006713867, "global_step": 177814, "epoch": 1469} {"train_loss": -40.776485443115234, "global_step": 177815, "epoch": 1469} {"train_loss": -40.93231201171875, "global_step": 177816, "epoch": 1469} {"train_loss": -41.17147445678711, "global_step": 177817, "epoch": 1469} {"train_loss": -40.10227966308594, "global_step": 177818, "epoch": 1469} {"train_loss": -41.40669250488281, "global_step": 177819, "epoch": 1469} {"train_loss": -41.087554931640625, "global_step": 177820, "epoch": 1469} {"train_loss": -41.261878967285156, "global_step": 177821, "epoch": 1469} {"train_loss": -41.8936767578125, "global_step": 177822, "epoch": 1469} {"train_loss": -41.3785514831543, "global_step": 177823, "epoch": 1469} {"train_loss": -41.54173278808594, "global_step": 177824, "epoch": 1469} {"train_loss": -40.9149284362793, "global_step": 177825, "epoch": 1469} {"train_loss": -41.81124496459961, "global_step": 177826, "epoch": 1469} {"train_loss": -41.6029167175293, "global_step": 177827, "epoch": 1469} {"train_loss": -41.264305114746094, "global_step": 177828, "epoch": 1469} {"train_loss": -41.54612350463867, "global_step": 177829, "epoch": 1469} {"train_loss": -41.630245208740234, "global_step": 177830, "epoch": 1469} {"train_loss": -41.65110778808594, "global_step": 177831, "epoch": 1469} {"train_loss": -41.469329833984375, "global_step": 177832, "epoch": 1469} {"train_loss": -41.22722244262695, "global_step": 177833, "epoch": 1469} {"train_loss": -41.519283294677734, "global_step": 177834, "epoch": 1469} {"train_loss": -41.541927337646484, "global_step": 177835, "epoch": 1469} {"train_loss": -41.16093063354492, "global_step": 177836, "epoch": 1469} {"train_loss": -41.40118408203125, "global_step": 177837, "epoch": 1469} {"train_loss": -41.72144317626953, "global_step": 177838, "epoch": 1469} {"train_loss": -40.72774887084961, "global_step": 177839, "epoch": 1469} {"train_loss": -41.413997650146484, "global_step": 177840, "epoch": 1469} {"train_loss": -41.62346267700195, "global_step": 177841, "epoch": 1469} {"train_loss": -41.394561767578125, "global_step": 177842, "epoch": 1469} {"train_loss": -40.16289138793945, "global_step": 177843, "epoch": 1469} {"train_loss": -41.355995178222656, "global_step": 177844, "epoch": 1469} {"train_loss": -41.16535186767578, "global_step": 177845, "epoch": 1469} {"train_loss": -40.609954833984375, "global_step": 177846, "epoch": 1469} {"train_loss": -38.96220779418945, "global_step": 177847, "epoch": 1469} {"train_loss": -39.31496047973633, "global_step": 177848, "epoch": 1469} {"train_loss": -38.40825271606445, "global_step": 177849, "epoch": 1469} {"train_loss": -37.20327377319336, "global_step": 177850, "epoch": 1469} {"train_loss": -39.08614730834961, "global_step": 177851, "epoch": 1469} {"train_loss": -39.030609130859375, "global_step": 177852, "epoch": 1469} {"train_loss": -38.868560791015625, "global_step": 177853, "epoch": 1469} {"train_loss": -39.182472229003906, "global_step": 177854, "epoch": 1469} {"train_loss": -39.75111770629883, "global_step": 177855, "epoch": 1469} {"train_loss": -40.57383346557617, "global_step": 177856, "epoch": 1469} {"train_loss": -40.120849609375, "global_step": 177857, "epoch": 1469} {"train_loss": -38.472145080566406, "global_step": 177858, "epoch": 1469} {"train_loss": -40.209007263183594, "global_step": 177859, "epoch": 1469} {"train_loss": -40.797725677490234, "global_step": 177860, "epoch": 1469} {"train_loss": -38.894203186035156, "global_step": 177861, "epoch": 1469} {"train_loss": -40.18325424194336, "global_step": 177862, "epoch": 1469} {"train_loss": -38.549232482910156, "global_step": 177863, "epoch": 1469} {"train_loss": -40.12480545043945, "global_step": 177864, "epoch": 1469} {"train_loss": -40.0120849609375, "global_step": 177865, "epoch": 1469} {"train_loss": -39.058837890625, "global_step": 177866, "epoch": 1469} {"train_loss": -39.18256759643555, "global_step": 177867, "epoch": 1469} {"train_loss": -35.27674102783203, "global_step": 177868, "epoch": 1469} {"train_loss": -39.88253200940849, "global_step": 177869, "epoch": 1469, "val_loss": 2574494.75} {"train_loss": -37.836849212646484, "global_step": 177870, "epoch": 1470} {"train_loss": -40.513946533203125, "global_step": 177871, "epoch": 1470} {"train_loss": -38.75655746459961, "global_step": 177872, "epoch": 1470} {"train_loss": -39.120361328125, "global_step": 177873, "epoch": 1470} {"train_loss": -40.27865982055664, "global_step": 177874, "epoch": 1470} {"train_loss": -36.52285385131836, "global_step": 177875, "epoch": 1470} {"train_loss": -39.293704986572266, "global_step": 177876, "epoch": 1470} {"train_loss": -39.33033752441406, "global_step": 177877, "epoch": 1470} {"train_loss": -36.70000457763672, "global_step": 177878, "epoch": 1470} {"train_loss": -40.12041091918945, "global_step": 177879, "epoch": 1470} {"train_loss": -39.2216911315918, "global_step": 177880, "epoch": 1470} {"train_loss": -40.13990020751953, "global_step": 177881, "epoch": 1470} {"train_loss": -40.53166961669922, "global_step": 177882, "epoch": 1470} {"train_loss": -40.19929122924805, "global_step": 177883, "epoch": 1470} {"train_loss": -40.15675735473633, "global_step": 177884, "epoch": 1470} {"train_loss": -40.83534622192383, "global_step": 177885, "epoch": 1470} {"train_loss": -38.95146179199219, "global_step": 177886, "epoch": 1470} {"train_loss": -40.725460052490234, "global_step": 177887, "epoch": 1470} {"train_loss": -40.66501235961914, "global_step": 177888, "epoch": 1470} {"train_loss": -40.65499496459961, "global_step": 177889, "epoch": 1470} {"train_loss": -40.7940788269043, "global_step": 177890, "epoch": 1470} {"train_loss": -40.74746322631836, "global_step": 177891, "epoch": 1470} {"train_loss": -40.52816390991211, "global_step": 177892, "epoch": 1470} {"train_loss": -41.19023513793945, "global_step": 177893, "epoch": 1470} {"train_loss": -40.910804748535156, "global_step": 177894, "epoch": 1470} {"train_loss": -40.784786224365234, "global_step": 177895, "epoch": 1470} {"train_loss": -40.73386764526367, "global_step": 177896, "epoch": 1470} {"train_loss": -40.747955322265625, "global_step": 177897, "epoch": 1470} {"train_loss": -40.862422943115234, "global_step": 177898, "epoch": 1470} {"train_loss": -40.93956756591797, "global_step": 177899, "epoch": 1470} {"train_loss": -40.36106491088867, "global_step": 177900, "epoch": 1470} {"train_loss": -39.76654815673828, "global_step": 177901, "epoch": 1470} {"train_loss": -40.4616813659668, "global_step": 177902, "epoch": 1470} {"train_loss": -40.52448654174805, "global_step": 177903, "epoch": 1470} {"train_loss": -41.167694091796875, "global_step": 177904, "epoch": 1470} {"train_loss": -40.47550582885742, "global_step": 177905, "epoch": 1470} {"train_loss": -41.16108322143555, "global_step": 177906, "epoch": 1470} {"train_loss": -41.5073356628418, "global_step": 177907, "epoch": 1470} {"train_loss": -41.202911376953125, "global_step": 177908, "epoch": 1470} {"train_loss": -41.514625549316406, "global_step": 177909, "epoch": 1470} {"train_loss": -41.602420806884766, "global_step": 177910, "epoch": 1470} {"train_loss": -41.05214309692383, "global_step": 177911, "epoch": 1470} {"train_loss": -41.38513946533203, "global_step": 177912, "epoch": 1470} {"train_loss": -41.664920806884766, "global_step": 177913, "epoch": 1470} {"train_loss": -41.00250244140625, "global_step": 177914, "epoch": 1470} {"train_loss": -41.31940460205078, "global_step": 177915, "epoch": 1470} {"train_loss": -41.01176071166992, "global_step": 177916, "epoch": 1470} {"train_loss": -41.79168701171875, "global_step": 177917, "epoch": 1470} {"train_loss": -41.634063720703125, "global_step": 177918, "epoch": 1470} {"train_loss": -40.466331481933594, "global_step": 177919, "epoch": 1470} {"train_loss": -40.06687545776367, "global_step": 177920, "epoch": 1470} {"train_loss": -42.000152587890625, "global_step": 177921, "epoch": 1470} {"train_loss": -41.69156265258789, "global_step": 177922, "epoch": 1470} {"train_loss": -41.100650787353516, "global_step": 177923, "epoch": 1470} {"train_loss": -42.0390625, "global_step": 177924, "epoch": 1470} {"train_loss": -41.49029541015625, "global_step": 177925, "epoch": 1470} {"train_loss": -41.037574768066406, "global_step": 177926, "epoch": 1470} {"train_loss": -40.31217575073242, "global_step": 177927, "epoch": 1470} {"train_loss": -40.91825485229492, "global_step": 177928, "epoch": 1470} {"train_loss": -41.3557243347168, "global_step": 177929, "epoch": 1470} {"train_loss": -41.01555252075195, "global_step": 177930, "epoch": 1470} {"train_loss": -39.079017639160156, "global_step": 177931, "epoch": 1470} {"train_loss": -41.011016845703125, "global_step": 177932, "epoch": 1470} {"train_loss": -41.160091400146484, "global_step": 177933, "epoch": 1470} {"train_loss": -40.77949142456055, "global_step": 177934, "epoch": 1470} {"train_loss": -40.800506591796875, "global_step": 177935, "epoch": 1470} {"train_loss": -40.58242416381836, "global_step": 177936, "epoch": 1470} {"train_loss": -41.022125244140625, "global_step": 177937, "epoch": 1470} {"train_loss": -41.63932800292969, "global_step": 177938, "epoch": 1470} {"train_loss": -41.76259231567383, "global_step": 177939, "epoch": 1470} {"train_loss": -41.62527084350586, "global_step": 177940, "epoch": 1470} {"train_loss": -41.20536804199219, "global_step": 177941, "epoch": 1470} {"train_loss": -41.03899002075195, "global_step": 177942, "epoch": 1470} {"train_loss": -40.69369125366211, "global_step": 177943, "epoch": 1470} {"train_loss": -41.68342208862305, "global_step": 177944, "epoch": 1470} {"train_loss": -40.20357894897461, "global_step": 177945, "epoch": 1470} {"train_loss": -40.970821380615234, "global_step": 177946, "epoch": 1470} {"train_loss": -40.908599853515625, "global_step": 177947, "epoch": 1470} {"train_loss": -41.112953186035156, "global_step": 177948, "epoch": 1470} {"train_loss": -41.041011810302734, "global_step": 177949, "epoch": 1470} {"train_loss": -40.50014877319336, "global_step": 177950, "epoch": 1470} {"train_loss": -41.095062255859375, "global_step": 177951, "epoch": 1470} {"train_loss": -41.60578155517578, "global_step": 177952, "epoch": 1470} {"train_loss": -41.07658004760742, "global_step": 177953, "epoch": 1470} {"train_loss": -41.40105056762695, "global_step": 177954, "epoch": 1470} {"train_loss": -41.38172149658203, "global_step": 177955, "epoch": 1470} {"train_loss": -41.485713958740234, "global_step": 177956, "epoch": 1470} {"train_loss": -40.27480697631836, "global_step": 177957, "epoch": 1470} {"train_loss": -40.56162643432617, "global_step": 177958, "epoch": 1470} {"train_loss": -41.14278030395508, "global_step": 177959, "epoch": 1470} {"train_loss": -41.04743576049805, "global_step": 177960, "epoch": 1470} {"train_loss": -41.39188003540039, "global_step": 177961, "epoch": 1470} {"train_loss": -41.42258834838867, "global_step": 177962, "epoch": 1470} {"train_loss": -41.54949951171875, "global_step": 177963, "epoch": 1470} {"train_loss": -41.58021926879883, "global_step": 177964, "epoch": 1470} {"train_loss": -41.76178741455078, "global_step": 177965, "epoch": 1470} {"train_loss": -41.45354080200195, "global_step": 177966, "epoch": 1470} {"train_loss": -41.20811080932617, "global_step": 177967, "epoch": 1470} {"train_loss": -41.13216018676758, "global_step": 177968, "epoch": 1470} {"train_loss": -39.78446578979492, "global_step": 177969, "epoch": 1470} {"train_loss": -39.83887481689453, "global_step": 177970, "epoch": 1470} {"train_loss": -40.35979080200195, "global_step": 177971, "epoch": 1470} {"train_loss": -39.667110443115234, "global_step": 177972, "epoch": 1470} {"train_loss": -38.0767936706543, "global_step": 177973, "epoch": 1470} {"train_loss": -33.595802307128906, "global_step": 177974, "epoch": 1470} {"train_loss": -17.90057373046875, "global_step": 177975, "epoch": 1470} {"train_loss": -4.397977352142334, "global_step": 177976, "epoch": 1470} {"train_loss": -25.4490909576416, "global_step": 177977, "epoch": 1470} {"train_loss": -33.02058029174805, "global_step": 177978, "epoch": 1470} {"train_loss": -15.391717910766602, "global_step": 177979, "epoch": 1470} {"train_loss": -34.45699691772461, "global_step": 177980, "epoch": 1470} {"train_loss": -25.905261993408203, "global_step": 177981, "epoch": 1470} {"train_loss": -31.728574752807617, "global_step": 177982, "epoch": 1470} {"train_loss": -33.61362838745117, "global_step": 177983, "epoch": 1470} {"train_loss": -35.99628829956055, "global_step": 177984, "epoch": 1470} {"train_loss": -32.892425537109375, "global_step": 177985, "epoch": 1470} {"train_loss": -36.64828109741211, "global_step": 177986, "epoch": 1470} {"train_loss": -35.429298400878906, "global_step": 177987, "epoch": 1470} {"train_loss": -34.20819854736328, "global_step": 177988, "epoch": 1470} {"train_loss": -36.27716827392578, "global_step": 177989, "epoch": 1470} {"train_loss": -39.107606742007675, "global_step": 177990, "epoch": 1470, "val_loss": 2570893.75} {"train_loss": -34.41647720336914, "global_step": 177991, "epoch": 1471} {"train_loss": -37.72496795654297, "global_step": 177992, "epoch": 1471} {"train_loss": -36.022796630859375, "global_step": 177993, "epoch": 1471} {"train_loss": -36.02075958251953, "global_step": 177994, "epoch": 1471} {"train_loss": -38.505916595458984, "global_step": 177995, "epoch": 1471} {"train_loss": -36.143043518066406, "global_step": 177996, "epoch": 1471} {"train_loss": -35.93546676635742, "global_step": 177997, "epoch": 1471} {"train_loss": -37.70204544067383, "global_step": 177998, "epoch": 1471} {"train_loss": -37.45179748535156, "global_step": 177999, "epoch": 1471} {"train_loss": -38.345672607421875, "global_step": 178000, "epoch": 1471} {"train_loss": -37.534881591796875, "global_step": 178001, "epoch": 1471} {"train_loss": -38.61007308959961, "global_step": 178002, "epoch": 1471} {"train_loss": -39.12680435180664, "global_step": 178003, "epoch": 1471} {"train_loss": -38.020057678222656, "global_step": 178004, "epoch": 1471} {"train_loss": -38.6294059753418, "global_step": 178005, "epoch": 1471} {"train_loss": -38.99113082885742, "global_step": 178006, "epoch": 1471} {"train_loss": -39.05497360229492, "global_step": 178007, "epoch": 1471} {"train_loss": -38.743804931640625, "global_step": 178008, "epoch": 1471} {"train_loss": -38.9784049987793, "global_step": 178009, "epoch": 1471} {"train_loss": -39.23423385620117, "global_step": 178010, "epoch": 1471} {"train_loss": -39.30314254760742, "global_step": 178011, "epoch": 1471} {"train_loss": -39.16073226928711, "global_step": 178012, "epoch": 1471} {"train_loss": -39.13050079345703, "global_step": 178013, "epoch": 1471} {"train_loss": -39.77019119262695, "global_step": 178014, "epoch": 1471} {"train_loss": -39.77912521362305, "global_step": 178015, "epoch": 1471} {"train_loss": -39.2144660949707, "global_step": 178016, "epoch": 1471} {"train_loss": -39.27968978881836, "global_step": 178017, "epoch": 1471} {"train_loss": -40.05044937133789, "global_step": 178018, "epoch": 1471} {"train_loss": -39.46073913574219, "global_step": 178019, "epoch": 1471} {"train_loss": -39.72965621948242, "global_step": 178020, "epoch": 1471} {"train_loss": -39.817665100097656, "global_step": 178021, "epoch": 1471} {"train_loss": -40.207279205322266, "global_step": 178022, "epoch": 1471} {"train_loss": -40.20719528198242, "global_step": 178023, "epoch": 1471} {"train_loss": -40.12437057495117, "global_step": 178024, "epoch": 1471} {"train_loss": -40.38618087768555, "global_step": 178025, "epoch": 1471} {"train_loss": -40.03181076049805, "global_step": 178026, "epoch": 1471} {"train_loss": -39.019752502441406, "global_step": 178027, "epoch": 1471} {"train_loss": -40.60469055175781, "global_step": 178028, "epoch": 1471} {"train_loss": -39.94912338256836, "global_step": 178029, "epoch": 1471} {"train_loss": -40.53160858154297, "global_step": 178030, "epoch": 1471} {"train_loss": -40.63857650756836, "global_step": 178031, "epoch": 1471} {"train_loss": -40.165077209472656, "global_step": 178032, "epoch": 1471} {"train_loss": -40.43410110473633, "global_step": 178033, "epoch": 1471} {"train_loss": -40.30568313598633, "global_step": 178034, "epoch": 1471} {"train_loss": -40.80933380126953, "global_step": 178035, "epoch": 1471} {"train_loss": -40.37485122680664, "global_step": 178036, "epoch": 1471} {"train_loss": -40.3578987121582, "global_step": 178037, "epoch": 1471} {"train_loss": -40.758331298828125, "global_step": 178038, "epoch": 1471} {"train_loss": -41.14478302001953, "global_step": 178039, "epoch": 1471} {"train_loss": -40.472869873046875, "global_step": 178040, "epoch": 1471} {"train_loss": -40.937538146972656, "global_step": 178041, "epoch": 1471} {"train_loss": -41.00138854980469, "global_step": 178042, "epoch": 1471} {"train_loss": -40.98520278930664, "global_step": 178043, "epoch": 1471} {"train_loss": -40.89179611206055, "global_step": 178044, "epoch": 1471} {"train_loss": -41.176570892333984, "global_step": 178045, "epoch": 1471} {"train_loss": -41.014930725097656, "global_step": 178046, "epoch": 1471} {"train_loss": -41.15974807739258, "global_step": 178047, "epoch": 1471} {"train_loss": -40.774658203125, "global_step": 178048, "epoch": 1471} {"train_loss": -41.03242492675781, "global_step": 178049, "epoch": 1471} {"train_loss": -41.17970275878906, "global_step": 178050, "epoch": 1471} {"train_loss": -41.30532455444336, "global_step": 178051, "epoch": 1471} {"train_loss": -41.5704460144043, "global_step": 178052, "epoch": 1471} {"train_loss": -41.45054244995117, "global_step": 178053, "epoch": 1471} {"train_loss": -41.3852653503418, "global_step": 178054, "epoch": 1471} {"train_loss": -41.003700256347656, "global_step": 178055, "epoch": 1471} {"train_loss": -41.10636520385742, "global_step": 178056, "epoch": 1471} {"train_loss": -41.12746810913086, "global_step": 178057, "epoch": 1471} {"train_loss": -41.14238357543945, "global_step": 178058, "epoch": 1471} {"train_loss": -41.17533874511719, "global_step": 178059, "epoch": 1471} {"train_loss": -41.43156814575195, "global_step": 178060, "epoch": 1471} {"train_loss": -41.51631164550781, "global_step": 178061, "epoch": 1471} {"train_loss": -41.378448486328125, "global_step": 178062, "epoch": 1471} {"train_loss": -41.5633430480957, "global_step": 178063, "epoch": 1471} {"train_loss": -41.270687103271484, "global_step": 178064, "epoch": 1471} {"train_loss": -41.29726791381836, "global_step": 178065, "epoch": 1471} {"train_loss": -41.34782028198242, "global_step": 178066, "epoch": 1471} {"train_loss": -41.57161331176758, "global_step": 178067, "epoch": 1471} {"train_loss": -41.472599029541016, "global_step": 178068, "epoch": 1471} {"train_loss": -41.59660720825195, "global_step": 178069, "epoch": 1471} {"train_loss": -41.4849853515625, "global_step": 178070, "epoch": 1471} {"train_loss": -41.38145065307617, "global_step": 178071, "epoch": 1471} {"train_loss": -41.47367477416992, "global_step": 178072, "epoch": 1471} {"train_loss": -41.52610397338867, "global_step": 178073, "epoch": 1471} {"train_loss": -41.143165588378906, "global_step": 178074, "epoch": 1471} {"train_loss": -41.71749496459961, "global_step": 178075, "epoch": 1471} {"train_loss": -41.45817947387695, "global_step": 178076, "epoch": 1471} {"train_loss": -42.01824951171875, "global_step": 178077, "epoch": 1471} {"train_loss": -41.621944427490234, "global_step": 178078, "epoch": 1471} {"train_loss": -41.85014724731445, "global_step": 178079, "epoch": 1471} {"train_loss": -41.6895866394043, "global_step": 178080, "epoch": 1471} {"train_loss": -42.182899475097656, "global_step": 178081, "epoch": 1471} {"train_loss": -41.973873138427734, "global_step": 178082, "epoch": 1471} {"train_loss": -41.32008743286133, "global_step": 178083, "epoch": 1471} {"train_loss": -41.8039436340332, "global_step": 178084, "epoch": 1471} {"train_loss": -41.75669860839844, "global_step": 178085, "epoch": 1471} {"train_loss": -41.6633415222168, "global_step": 178086, "epoch": 1471} {"train_loss": -41.4802360534668, "global_step": 178087, "epoch": 1471} {"train_loss": -41.857967376708984, "global_step": 178088, "epoch": 1471} {"train_loss": -41.978912353515625, "global_step": 178089, "epoch": 1471} {"train_loss": -41.737709045410156, "global_step": 178090, "epoch": 1471} {"train_loss": -41.45146560668945, "global_step": 178091, "epoch": 1471} {"train_loss": -40.78615188598633, "global_step": 178092, "epoch": 1471} {"train_loss": -38.31976318359375, "global_step": 178093, "epoch": 1471} {"train_loss": -32.84382247924805, "global_step": 178094, "epoch": 1471} {"train_loss": -16.109718322753906, "global_step": 178095, "epoch": 1471} {"train_loss": 15.336321830749512, "global_step": 178096, "epoch": 1471} {"train_loss": 12.220253944396973, "global_step": 178097, "epoch": 1471} {"train_loss": -27.631122589111328, "global_step": 178098, "epoch": 1471} {"train_loss": 8.685419082641602, "global_step": 178099, "epoch": 1471} {"train_loss": -13.252571105957031, "global_step": 178100, "epoch": 1471} {"train_loss": -18.145954132080078, "global_step": 178101, "epoch": 1471} {"train_loss": -25.8308048248291, "global_step": 178102, "epoch": 1471} {"train_loss": -22.974567413330078, "global_step": 178103, "epoch": 1471} {"train_loss": -27.179792404174805, "global_step": 178104, "epoch": 1471} {"train_loss": -32.639095306396484, "global_step": 178105, "epoch": 1471} {"train_loss": -24.266752243041992, "global_step": 178106, "epoch": 1471} {"train_loss": -33.36434555053711, "global_step": 178107, "epoch": 1471} {"train_loss": -33.2762565612793, "global_step": 178108, "epoch": 1471} {"train_loss": -29.377017974853516, "global_step": 178109, "epoch": 1471} {"train_loss": -33.48934555053711, "global_step": 178110, "epoch": 1471} {"train_loss": -37.338306616160494, "global_step": 178111, "epoch": 1471, "val_loss": 2621806.0} {"train_loss": -32.9573974609375, "global_step": 178112, "epoch": 1472} {"train_loss": -34.56797409057617, "global_step": 178113, "epoch": 1472} {"train_loss": -35.61207962036133, "global_step": 178114, "epoch": 1472} {"train_loss": -36.21955108642578, "global_step": 178115, "epoch": 1472} {"train_loss": -35.671051025390625, "global_step": 178116, "epoch": 1472} {"train_loss": -36.23102951049805, "global_step": 178117, "epoch": 1472} {"train_loss": -36.0442008972168, "global_step": 178118, "epoch": 1472} {"train_loss": -37.519535064697266, "global_step": 178119, "epoch": 1472} {"train_loss": -37.462493896484375, "global_step": 178120, "epoch": 1472} {"train_loss": -37.454402923583984, "global_step": 178121, "epoch": 1472} {"train_loss": -36.76972579956055, "global_step": 178122, "epoch": 1472} {"train_loss": -37.0023078918457, "global_step": 178123, "epoch": 1472} {"train_loss": -37.66053771972656, "global_step": 178124, "epoch": 1472} {"train_loss": -38.017391204833984, "global_step": 178125, "epoch": 1472} {"train_loss": -37.74580764770508, "global_step": 178126, "epoch": 1472} {"train_loss": -37.6650505065918, "global_step": 178127, "epoch": 1472} {"train_loss": -37.57882308959961, "global_step": 178128, "epoch": 1472} {"train_loss": -38.20095443725586, "global_step": 178129, "epoch": 1472} {"train_loss": -38.05145263671875, "global_step": 178130, "epoch": 1472} {"train_loss": -38.40389633178711, "global_step": 178131, "epoch": 1472} {"train_loss": -37.89210891723633, "global_step": 178132, "epoch": 1472} {"train_loss": -38.07843780517578, "global_step": 178133, "epoch": 1472} {"train_loss": -38.27265548706055, "global_step": 178134, "epoch": 1472} {"train_loss": -38.64597702026367, "global_step": 178135, "epoch": 1472} {"train_loss": -38.7155876159668, "global_step": 178136, "epoch": 1472} {"train_loss": -38.299129486083984, "global_step": 178137, "epoch": 1472} {"train_loss": -38.39186477661133, "global_step": 178138, "epoch": 1472} {"train_loss": -38.765724182128906, "global_step": 178139, "epoch": 1472} {"train_loss": -38.71266555786133, "global_step": 178140, "epoch": 1472} {"train_loss": -38.77926254272461, "global_step": 178141, "epoch": 1472} {"train_loss": -38.5809440612793, "global_step": 178142, "epoch": 1472} {"train_loss": -38.674434661865234, "global_step": 178143, "epoch": 1472} {"train_loss": -38.83429718017578, "global_step": 178144, "epoch": 1472} {"train_loss": -38.72801208496094, "global_step": 178145, "epoch": 1472} {"train_loss": -39.04670333862305, "global_step": 178146, "epoch": 1472} {"train_loss": -39.022605895996094, "global_step": 178147, "epoch": 1472} {"train_loss": -38.91546630859375, "global_step": 178148, "epoch": 1472} {"train_loss": -38.97237014770508, "global_step": 178149, "epoch": 1472} {"train_loss": -39.2463264465332, "global_step": 178150, "epoch": 1472} {"train_loss": -39.3712272644043, "global_step": 178151, "epoch": 1472} {"train_loss": -39.15972900390625, "global_step": 178152, "epoch": 1472} {"train_loss": -39.22290802001953, "global_step": 178153, "epoch": 1472} {"train_loss": -39.263145446777344, "global_step": 178154, "epoch": 1472} {"train_loss": -39.359249114990234, "global_step": 178155, "epoch": 1472} {"train_loss": -39.62976837158203, "global_step": 178156, "epoch": 1472} {"train_loss": -39.66733932495117, "global_step": 178157, "epoch": 1472} {"train_loss": -39.54249954223633, "global_step": 178158, "epoch": 1472} {"train_loss": -39.523921966552734, "global_step": 178159, "epoch": 1472} {"train_loss": -39.56444549560547, "global_step": 178160, "epoch": 1472} {"train_loss": -39.757022857666016, "global_step": 178161, "epoch": 1472} {"train_loss": -39.76479721069336, "global_step": 178162, "epoch": 1472} {"train_loss": -39.596858978271484, "global_step": 178163, "epoch": 1472} {"train_loss": -39.78957748413086, "global_step": 178164, "epoch": 1472} {"train_loss": -40.285884857177734, "global_step": 178165, "epoch": 1472} {"train_loss": -39.86513900756836, "global_step": 178166, "epoch": 1472} {"train_loss": -39.81393051147461, "global_step": 178167, "epoch": 1472} {"train_loss": -40.2579345703125, "global_step": 178168, "epoch": 1472} {"train_loss": -40.13902282714844, "global_step": 178169, "epoch": 1472} {"train_loss": -40.00657272338867, "global_step": 178170, "epoch": 1472} {"train_loss": -39.77350997924805, "global_step": 178171, "epoch": 1472} {"train_loss": -40.2164421081543, "global_step": 178172, "epoch": 1472} {"train_loss": -40.0904426574707, "global_step": 178173, "epoch": 1472} {"train_loss": -40.059112548828125, "global_step": 178174, "epoch": 1472} {"train_loss": -40.14377212524414, "global_step": 178175, "epoch": 1472} {"train_loss": -40.3142204284668, "global_step": 178176, "epoch": 1472} {"train_loss": -40.24329376220703, "global_step": 178177, "epoch": 1472} {"train_loss": -40.45042419433594, "global_step": 178178, "epoch": 1472} {"train_loss": -40.19660186767578, "global_step": 178179, "epoch": 1472} {"train_loss": -40.23519515991211, "global_step": 178180, "epoch": 1472} {"train_loss": -40.5228157043457, "global_step": 178181, "epoch": 1472} {"train_loss": -40.19600296020508, "global_step": 178182, "epoch": 1472} {"train_loss": -40.28371810913086, "global_step": 178183, "epoch": 1472} {"train_loss": -40.62677764892578, "global_step": 178184, "epoch": 1472} {"train_loss": -40.87174987792969, "global_step": 178185, "epoch": 1472} {"train_loss": -40.819820404052734, "global_step": 178186, "epoch": 1472} {"train_loss": -40.50780487060547, "global_step": 178187, "epoch": 1472} {"train_loss": -40.75810623168945, "global_step": 178188, "epoch": 1472} {"train_loss": -40.93941116333008, "global_step": 178189, "epoch": 1472} {"train_loss": -40.688446044921875, "global_step": 178190, "epoch": 1472} {"train_loss": -40.7047233581543, "global_step": 178191, "epoch": 1472} {"train_loss": -40.474769592285156, "global_step": 178192, "epoch": 1472} {"train_loss": -40.95241928100586, "global_step": 178193, "epoch": 1472} {"train_loss": -41.06826400756836, "global_step": 178194, "epoch": 1472} {"train_loss": -40.59754180908203, "global_step": 178195, "epoch": 1472} {"train_loss": -41.00761795043945, "global_step": 178196, "epoch": 1472} {"train_loss": -40.672420501708984, "global_step": 178197, "epoch": 1472} {"train_loss": -41.23019027709961, "global_step": 178198, "epoch": 1472} {"train_loss": -41.3119010925293, "global_step": 178199, "epoch": 1472} {"train_loss": -40.89424514770508, "global_step": 178200, "epoch": 1472} {"train_loss": -40.83502197265625, "global_step": 178201, "epoch": 1472} {"train_loss": -41.15724563598633, "global_step": 178202, "epoch": 1472} {"train_loss": -41.35648727416992, "global_step": 178203, "epoch": 1472} {"train_loss": -41.00418472290039, "global_step": 178204, "epoch": 1472} {"train_loss": -40.70095443725586, "global_step": 178205, "epoch": 1472} {"train_loss": -41.33061218261719, "global_step": 178206, "epoch": 1472} {"train_loss": -40.96487045288086, "global_step": 178207, "epoch": 1472} {"train_loss": -40.98310470581055, "global_step": 178208, "epoch": 1472} {"train_loss": -41.16484451293945, "global_step": 178209, "epoch": 1472} {"train_loss": -41.327938079833984, "global_step": 178210, "epoch": 1472} {"train_loss": -41.24870681762695, "global_step": 178211, "epoch": 1472} {"train_loss": -41.31645584106445, "global_step": 178212, "epoch": 1472} {"train_loss": -41.492183685302734, "global_step": 178213, "epoch": 1472} {"train_loss": -41.498817443847656, "global_step": 178214, "epoch": 1472} {"train_loss": -40.96798324584961, "global_step": 178215, "epoch": 1472} {"train_loss": -41.22196578979492, "global_step": 178216, "epoch": 1472} {"train_loss": -41.17477035522461, "global_step": 178217, "epoch": 1472} {"train_loss": -41.29063415527344, "global_step": 178218, "epoch": 1472} {"train_loss": -41.68259811401367, "global_step": 178219, "epoch": 1472} {"train_loss": -41.00285720825195, "global_step": 178220, "epoch": 1472} {"train_loss": -40.95808792114258, "global_step": 178221, "epoch": 1472} {"train_loss": -41.66740798950195, "global_step": 178222, "epoch": 1472} {"train_loss": -41.490318298339844, "global_step": 178223, "epoch": 1472} {"train_loss": -40.99721908569336, "global_step": 178224, "epoch": 1472} {"train_loss": -41.00645065307617, "global_step": 178225, "epoch": 1472} {"train_loss": -40.87819290161133, "global_step": 178226, "epoch": 1472} {"train_loss": -40.9037971496582, "global_step": 178227, "epoch": 1472} {"train_loss": -41.3402214050293, "global_step": 178228, "epoch": 1472} {"train_loss": -40.7967643737793, "global_step": 178229, "epoch": 1472} {"train_loss": -40.7832145690918, "global_step": 178230, "epoch": 1472} {"train_loss": -40.291011810302734, "global_step": 178231, "epoch": 1472} {"train_loss": -39.64957415367946, "global_step": 178232, "epoch": 1472, "val_loss": 2590121.25} {"train_loss": -41.03329086303711, "global_step": 178233, "epoch": 1473} {"train_loss": -40.89486312866211, "global_step": 178234, "epoch": 1473} {"train_loss": -40.24067687988281, "global_step": 178235, "epoch": 1473} {"train_loss": -39.345436096191406, "global_step": 178236, "epoch": 1473} {"train_loss": -37.569217681884766, "global_step": 178237, "epoch": 1473} {"train_loss": -36.02043914794922, "global_step": 178238, "epoch": 1473} {"train_loss": -35.71181869506836, "global_step": 178239, "epoch": 1473} {"train_loss": -38.40537643432617, "global_step": 178240, "epoch": 1473} {"train_loss": -40.53022003173828, "global_step": 178241, "epoch": 1473} {"train_loss": -39.815887451171875, "global_step": 178242, "epoch": 1473} {"train_loss": -39.066871643066406, "global_step": 178243, "epoch": 1473} {"train_loss": -40.17851638793945, "global_step": 178244, "epoch": 1473} {"train_loss": -40.17625045776367, "global_step": 178245, "epoch": 1473} {"train_loss": -38.44267654418945, "global_step": 178246, "epoch": 1473} {"train_loss": -40.56869125366211, "global_step": 178247, "epoch": 1473} {"train_loss": -40.70336151123047, "global_step": 178248, "epoch": 1473} {"train_loss": -40.046512603759766, "global_step": 178249, "epoch": 1473} {"train_loss": -40.63497543334961, "global_step": 178250, "epoch": 1473} {"train_loss": -40.69279861450195, "global_step": 178251, "epoch": 1473} {"train_loss": -40.65088653564453, "global_step": 178252, "epoch": 1473} {"train_loss": -39.81527328491211, "global_step": 178253, "epoch": 1473} {"train_loss": -40.229583740234375, "global_step": 178254, "epoch": 1473} {"train_loss": -40.470699310302734, "global_step": 178255, "epoch": 1473} {"train_loss": -40.57434844970703, "global_step": 178256, "epoch": 1473} {"train_loss": -40.907264709472656, "global_step": 178257, "epoch": 1473} {"train_loss": -40.24565124511719, "global_step": 178258, "epoch": 1473} {"train_loss": -40.300811767578125, "global_step": 178259, "epoch": 1473} {"train_loss": -40.423519134521484, "global_step": 178260, "epoch": 1473} {"train_loss": -40.29897689819336, "global_step": 178261, "epoch": 1473} {"train_loss": -40.36240005493164, "global_step": 178262, "epoch": 1473} {"train_loss": -40.124717712402344, "global_step": 178263, "epoch": 1473} {"train_loss": -40.13717269897461, "global_step": 178264, "epoch": 1473} {"train_loss": -40.450401306152344, "global_step": 178265, "epoch": 1473} {"train_loss": -40.62693786621094, "global_step": 178266, "epoch": 1473} {"train_loss": -40.97685623168945, "global_step": 178267, "epoch": 1473} {"train_loss": -40.54481506347656, "global_step": 178268, "epoch": 1473} {"train_loss": -40.87443161010742, "global_step": 178269, "epoch": 1473} {"train_loss": -40.4494514465332, "global_step": 178270, "epoch": 1473} {"train_loss": -40.19940948486328, "global_step": 178271, "epoch": 1473} {"train_loss": -40.14358139038086, "global_step": 178272, "epoch": 1473} {"train_loss": -40.8404655456543, "global_step": 178273, "epoch": 1473} {"train_loss": -40.77337646484375, "global_step": 178274, "epoch": 1473} {"train_loss": -40.877933502197266, "global_step": 178275, "epoch": 1473} {"train_loss": -40.719940185546875, "global_step": 178276, "epoch": 1473} {"train_loss": -41.09657669067383, "global_step": 178277, "epoch": 1473} {"train_loss": -40.050323486328125, "global_step": 178278, "epoch": 1473} {"train_loss": -39.26825714111328, "global_step": 178279, "epoch": 1473} {"train_loss": -40.24076843261719, "global_step": 178280, "epoch": 1473} {"train_loss": -40.853118896484375, "global_step": 178281, "epoch": 1473} {"train_loss": -40.20646286010742, "global_step": 178282, "epoch": 1473} {"train_loss": -39.97794723510742, "global_step": 178283, "epoch": 1473} {"train_loss": -40.09833908081055, "global_step": 178284, "epoch": 1473} {"train_loss": -40.82394790649414, "global_step": 178285, "epoch": 1473} {"train_loss": -40.1865234375, "global_step": 178286, "epoch": 1473} {"train_loss": -40.10653305053711, "global_step": 178287, "epoch": 1473} {"train_loss": -41.11806106567383, "global_step": 178288, "epoch": 1473} {"train_loss": -40.91119384765625, "global_step": 178289, "epoch": 1473} {"train_loss": -40.4207878112793, "global_step": 178290, "epoch": 1473} {"train_loss": -41.394134521484375, "global_step": 178291, "epoch": 1473} {"train_loss": -40.42234420776367, "global_step": 178292, "epoch": 1473} {"train_loss": -40.673431396484375, "global_step": 178293, "epoch": 1473} {"train_loss": -39.5230712890625, "global_step": 178294, "epoch": 1473} {"train_loss": -40.854957580566406, "global_step": 178295, "epoch": 1473} {"train_loss": -40.85503005981445, "global_step": 178296, "epoch": 1473} {"train_loss": -39.37854766845703, "global_step": 178297, "epoch": 1473} {"train_loss": -40.960227966308594, "global_step": 178298, "epoch": 1473} {"train_loss": -39.72951889038086, "global_step": 178299, "epoch": 1473} {"train_loss": -39.494136810302734, "global_step": 178300, "epoch": 1473} {"train_loss": -40.50455856323242, "global_step": 178301, "epoch": 1473} {"train_loss": -40.62803268432617, "global_step": 178302, "epoch": 1473} {"train_loss": -39.51375961303711, "global_step": 178303, "epoch": 1473} {"train_loss": -40.52488327026367, "global_step": 178304, "epoch": 1473} {"train_loss": -40.73271560668945, "global_step": 178305, "epoch": 1473} {"train_loss": -38.81083297729492, "global_step": 178306, "epoch": 1473} {"train_loss": -39.791717529296875, "global_step": 178307, "epoch": 1473} {"train_loss": -37.756587982177734, "global_step": 178308, "epoch": 1473} {"train_loss": -33.52878189086914, "global_step": 178309, "epoch": 1473} {"train_loss": -40.080501556396484, "global_step": 178310, "epoch": 1473} {"train_loss": -34.956722259521484, "global_step": 178311, "epoch": 1473} {"train_loss": -38.28989028930664, "global_step": 178312, "epoch": 1473} {"train_loss": -39.81881332397461, "global_step": 178313, "epoch": 1473} {"train_loss": -37.8952751159668, "global_step": 178314, "epoch": 1473} {"train_loss": -40.22011947631836, "global_step": 178315, "epoch": 1473} {"train_loss": -39.23238754272461, "global_step": 178316, "epoch": 1473} {"train_loss": -39.39445114135742, "global_step": 178317, "epoch": 1473} {"train_loss": -39.43485641479492, "global_step": 178318, "epoch": 1473} {"train_loss": -40.54501724243164, "global_step": 178319, "epoch": 1473} {"train_loss": -39.09856033325195, "global_step": 178320, "epoch": 1473} {"train_loss": -39.864707946777344, "global_step": 178321, "epoch": 1473} {"train_loss": -40.24277877807617, "global_step": 178322, "epoch": 1473} {"train_loss": -40.2034912109375, "global_step": 178323, "epoch": 1473} {"train_loss": -39.784271240234375, "global_step": 178324, "epoch": 1473} {"train_loss": -40.78688049316406, "global_step": 178325, "epoch": 1473} {"train_loss": -40.518131256103516, "global_step": 178326, "epoch": 1473} {"train_loss": -39.99677276611328, "global_step": 178327, "epoch": 1473} {"train_loss": -40.55877685546875, "global_step": 178328, "epoch": 1473} {"train_loss": -40.155147552490234, "global_step": 178329, "epoch": 1473} {"train_loss": -40.56782150268555, "global_step": 178330, "epoch": 1473} {"train_loss": -38.7509880065918, "global_step": 178331, "epoch": 1473} {"train_loss": -40.24489212036133, "global_step": 178332, "epoch": 1473} {"train_loss": -40.891963958740234, "global_step": 178333, "epoch": 1473} {"train_loss": -40.17995071411133, "global_step": 178334, "epoch": 1473} {"train_loss": -40.84833526611328, "global_step": 178335, "epoch": 1473} {"train_loss": -40.32653045654297, "global_step": 178336, "epoch": 1473} {"train_loss": -40.96196746826172, "global_step": 178337, "epoch": 1473} {"train_loss": -40.44363021850586, "global_step": 178338, "epoch": 1473} {"train_loss": -40.90362548828125, "global_step": 178339, "epoch": 1473} {"train_loss": -40.631099700927734, "global_step": 178340, "epoch": 1473} {"train_loss": -40.85780715942383, "global_step": 178341, "epoch": 1473} {"train_loss": -41.05038070678711, "global_step": 178342, "epoch": 1473} {"train_loss": -40.96768569946289, "global_step": 178343, "epoch": 1473} {"train_loss": -41.008331298828125, "global_step": 178344, "epoch": 1473} {"train_loss": -40.742340087890625, "global_step": 178345, "epoch": 1473} {"train_loss": -41.17534255981445, "global_step": 178346, "epoch": 1473} {"train_loss": -41.1025505065918, "global_step": 178347, "epoch": 1473} {"train_loss": -41.31782150268555, "global_step": 178348, "epoch": 1473} {"train_loss": -40.94204330444336, "global_step": 178349, "epoch": 1473} {"train_loss": -40.747833251953125, "global_step": 178350, "epoch": 1473} {"train_loss": -41.581214904785156, "global_step": 178351, "epoch": 1473} {"train_loss": -39.205177307128906, "global_step": 178352, "epoch": 1473} {"train_loss": -40.08383657912577, "global_step": 178353, "epoch": 1473, "val_loss": 2587612.75} {"train_loss": -40.639404296875, "global_step": 178354, "epoch": 1474} {"train_loss": -40.924922943115234, "global_step": 178355, "epoch": 1474} {"train_loss": -40.68798828125, "global_step": 178356, "epoch": 1474} {"train_loss": -40.92940902709961, "global_step": 178357, "epoch": 1474} {"train_loss": -41.56703186035156, "global_step": 178358, "epoch": 1474} {"train_loss": -40.4073600769043, "global_step": 178359, "epoch": 1474} {"train_loss": -41.348812103271484, "global_step": 178360, "epoch": 1474} {"train_loss": -40.71662521362305, "global_step": 178361, "epoch": 1474} {"train_loss": -41.33736038208008, "global_step": 178362, "epoch": 1474} {"train_loss": -39.78940963745117, "global_step": 178363, "epoch": 1474} {"train_loss": -41.21611022949219, "global_step": 178364, "epoch": 1474} {"train_loss": -41.0299072265625, "global_step": 178365, "epoch": 1474} {"train_loss": -40.734493255615234, "global_step": 178366, "epoch": 1474} {"train_loss": -40.58597946166992, "global_step": 178367, "epoch": 1474} {"train_loss": -40.88054656982422, "global_step": 178368, "epoch": 1474} {"train_loss": -41.082637786865234, "global_step": 178369, "epoch": 1474} {"train_loss": -40.4644889831543, "global_step": 178370, "epoch": 1474} {"train_loss": -41.54521560668945, "global_step": 178371, "epoch": 1474} {"train_loss": -41.015296936035156, "global_step": 178372, "epoch": 1474} {"train_loss": -40.99422836303711, "global_step": 178373, "epoch": 1474} {"train_loss": -34.467437744140625, "global_step": 178374, "epoch": 1474} {"train_loss": -40.82200241088867, "global_step": 178375, "epoch": 1474} {"train_loss": -39.38505554199219, "global_step": 178376, "epoch": 1474} {"train_loss": -40.13179016113281, "global_step": 178377, "epoch": 1474} {"train_loss": -39.84549331665039, "global_step": 178378, "epoch": 1474} {"train_loss": -41.09757995605469, "global_step": 178379, "epoch": 1474} {"train_loss": -39.1554069519043, "global_step": 178380, "epoch": 1474} {"train_loss": -40.92362594604492, "global_step": 178381, "epoch": 1474} {"train_loss": -39.741634368896484, "global_step": 178382, "epoch": 1474} {"train_loss": -40.8942985534668, "global_step": 178383, "epoch": 1474} {"train_loss": -40.388328552246094, "global_step": 178384, "epoch": 1474} {"train_loss": -40.42428970336914, "global_step": 178385, "epoch": 1474} {"train_loss": -40.606563568115234, "global_step": 178386, "epoch": 1474} {"train_loss": -36.951107025146484, "global_step": 178387, "epoch": 1474} {"train_loss": -39.81062316894531, "global_step": 178388, "epoch": 1474} {"train_loss": -39.063350677490234, "global_step": 178389, "epoch": 1474} {"train_loss": -39.60848617553711, "global_step": 178390, "epoch": 1474} {"train_loss": -40.754432678222656, "global_step": 178391, "epoch": 1474} {"train_loss": -36.47956466674805, "global_step": 178392, "epoch": 1474} {"train_loss": -39.571041107177734, "global_step": 178393, "epoch": 1474} {"train_loss": -40.637184143066406, "global_step": 178394, "epoch": 1474} {"train_loss": -40.103511810302734, "global_step": 178395, "epoch": 1474} {"train_loss": -40.48115158081055, "global_step": 178396, "epoch": 1474} {"train_loss": -40.548370361328125, "global_step": 178397, "epoch": 1474} {"train_loss": -41.298458099365234, "global_step": 178398, "epoch": 1474} {"train_loss": -40.270660400390625, "global_step": 178399, "epoch": 1474} {"train_loss": -40.761837005615234, "global_step": 178400, "epoch": 1474} {"train_loss": -40.209144592285156, "global_step": 178401, "epoch": 1474} {"train_loss": -40.452999114990234, "global_step": 178402, "epoch": 1474} {"train_loss": -38.63798904418945, "global_step": 178403, "epoch": 1474} {"train_loss": -40.60554885864258, "global_step": 178404, "epoch": 1474} {"train_loss": -41.12113952636719, "global_step": 178405, "epoch": 1474} {"train_loss": -38.248878479003906, "global_step": 178406, "epoch": 1474} {"train_loss": -38.94679641723633, "global_step": 178407, "epoch": 1474} {"train_loss": -40.75457763671875, "global_step": 178408, "epoch": 1474} {"train_loss": -40.212677001953125, "global_step": 178409, "epoch": 1474} {"train_loss": -41.294490814208984, "global_step": 178410, "epoch": 1474} {"train_loss": -41.04044723510742, "global_step": 178411, "epoch": 1474} {"train_loss": -39.720943450927734, "global_step": 178412, "epoch": 1474} {"train_loss": -39.21918487548828, "global_step": 178413, "epoch": 1474} {"train_loss": -40.9052734375, "global_step": 178414, "epoch": 1474} {"train_loss": -40.15385055541992, "global_step": 178415, "epoch": 1474} {"train_loss": -40.3036003112793, "global_step": 178416, "epoch": 1474} {"train_loss": -40.28529739379883, "global_step": 178417, "epoch": 1474} {"train_loss": -41.441558837890625, "global_step": 178418, "epoch": 1474} {"train_loss": -41.05363082885742, "global_step": 178419, "epoch": 1474} {"train_loss": -41.52261734008789, "global_step": 178420, "epoch": 1474} {"train_loss": -40.48582077026367, "global_step": 178421, "epoch": 1474} {"train_loss": -41.28437805175781, "global_step": 178422, "epoch": 1474} {"train_loss": -36.5817985534668, "global_step": 178423, "epoch": 1474} {"train_loss": -40.94954299926758, "global_step": 178424, "epoch": 1474} {"train_loss": -40.084774017333984, "global_step": 178425, "epoch": 1474} {"train_loss": -40.84632110595703, "global_step": 178426, "epoch": 1474} {"train_loss": -39.80451583862305, "global_step": 178427, "epoch": 1474} {"train_loss": -41.2399787902832, "global_step": 178428, "epoch": 1474} {"train_loss": -41.869850158691406, "global_step": 178429, "epoch": 1474} {"train_loss": -41.290340423583984, "global_step": 178430, "epoch": 1474} {"train_loss": -41.41566467285156, "global_step": 178431, "epoch": 1474} {"train_loss": -41.25896072387695, "global_step": 178432, "epoch": 1474} {"train_loss": -41.6689567565918, "global_step": 178433, "epoch": 1474} {"train_loss": -41.026676177978516, "global_step": 178434, "epoch": 1474} {"train_loss": -41.31582260131836, "global_step": 178435, "epoch": 1474} {"train_loss": -41.518001556396484, "global_step": 178436, "epoch": 1474} {"train_loss": -41.647212982177734, "global_step": 178437, "epoch": 1474} {"train_loss": -41.55818557739258, "global_step": 178438, "epoch": 1474} {"train_loss": -41.432952880859375, "global_step": 178439, "epoch": 1474} {"train_loss": -40.43830490112305, "global_step": 178440, "epoch": 1474} {"train_loss": -41.59358596801758, "global_step": 178441, "epoch": 1474} {"train_loss": -40.80391311645508, "global_step": 178442, "epoch": 1474} {"train_loss": -41.66142654418945, "global_step": 178443, "epoch": 1474} {"train_loss": -41.74855041503906, "global_step": 178444, "epoch": 1474} {"train_loss": -41.60085678100586, "global_step": 178445, "epoch": 1474} {"train_loss": -41.45159912109375, "global_step": 178446, "epoch": 1474} {"train_loss": -41.827392578125, "global_step": 178447, "epoch": 1474} {"train_loss": -41.260921478271484, "global_step": 178448, "epoch": 1474} {"train_loss": -41.33771514892578, "global_step": 178449, "epoch": 1474} {"train_loss": -41.49384307861328, "global_step": 178450, "epoch": 1474} {"train_loss": -41.38211441040039, "global_step": 178451, "epoch": 1474} {"train_loss": -41.406307220458984, "global_step": 178452, "epoch": 1474} {"train_loss": -41.889827728271484, "global_step": 178453, "epoch": 1474} {"train_loss": -41.092220306396484, "global_step": 178454, "epoch": 1474} {"train_loss": -41.653865814208984, "global_step": 178455, "epoch": 1474} {"train_loss": -41.50038146972656, "global_step": 178456, "epoch": 1474} {"train_loss": -41.57578659057617, "global_step": 178457, "epoch": 1474} {"train_loss": -41.52082061767578, "global_step": 178458, "epoch": 1474} {"train_loss": -41.84192657470703, "global_step": 178459, "epoch": 1474} {"train_loss": -41.60541915893555, "global_step": 178460, "epoch": 1474} {"train_loss": -40.91561508178711, "global_step": 178461, "epoch": 1474} {"train_loss": -40.29728317260742, "global_step": 178462, "epoch": 1474} {"train_loss": -40.21754837036133, "global_step": 178463, "epoch": 1474} {"train_loss": -40.396663665771484, "global_step": 178464, "epoch": 1474} {"train_loss": -41.163543701171875, "global_step": 178465, "epoch": 1474} {"train_loss": -40.64800262451172, "global_step": 178466, "epoch": 1474} {"train_loss": -40.530879974365234, "global_step": 178467, "epoch": 1474} {"train_loss": -41.30374526977539, "global_step": 178468, "epoch": 1474} {"train_loss": -40.950923919677734, "global_step": 178469, "epoch": 1474} {"train_loss": -41.27887725830078, "global_step": 178470, "epoch": 1474} {"train_loss": -41.79982376098633, "global_step": 178471, "epoch": 1474} {"train_loss": -40.90635299682617, "global_step": 178472, "epoch": 1474} {"train_loss": -41.38702392578125, "global_step": 178473, "epoch": 1474} {"train_loss": -40.65518286208476, "global_step": 178474, "epoch": 1474, "val_loss": 2524044.0} {"train_loss": -41.33301544189453, "global_step": 178475, "epoch": 1475} {"train_loss": -41.567806243896484, "global_step": 178476, "epoch": 1475} {"train_loss": -41.68278121948242, "global_step": 178477, "epoch": 1475} {"train_loss": -40.73567581176758, "global_step": 178478, "epoch": 1475} {"train_loss": -40.934661865234375, "global_step": 178479, "epoch": 1475} {"train_loss": -40.81710433959961, "global_step": 178480, "epoch": 1475} {"train_loss": -41.01174545288086, "global_step": 178481, "epoch": 1475} {"train_loss": -42.00850296020508, "global_step": 178482, "epoch": 1475} {"train_loss": -41.986061096191406, "global_step": 178483, "epoch": 1475} {"train_loss": -42.17243576049805, "global_step": 178484, "epoch": 1475} {"train_loss": -41.93988800048828, "global_step": 178485, "epoch": 1475} {"train_loss": -41.05086898803711, "global_step": 178486, "epoch": 1475} {"train_loss": -41.17119216918945, "global_step": 178487, "epoch": 1475} {"train_loss": -41.277793884277344, "global_step": 178488, "epoch": 1475} {"train_loss": -40.9367790222168, "global_step": 178489, "epoch": 1475} {"train_loss": -40.762081146240234, "global_step": 178490, "epoch": 1475} {"train_loss": -41.50446319580078, "global_step": 178491, "epoch": 1475} {"train_loss": -39.84062576293945, "global_step": 178492, "epoch": 1475} {"train_loss": -40.522151947021484, "global_step": 178493, "epoch": 1475} {"train_loss": -41.634193420410156, "global_step": 178494, "epoch": 1475} {"train_loss": -41.59504318237305, "global_step": 178495, "epoch": 1475} {"train_loss": -41.00938034057617, "global_step": 178496, "epoch": 1475} {"train_loss": -41.465126037597656, "global_step": 178497, "epoch": 1475} {"train_loss": -41.71108627319336, "global_step": 178498, "epoch": 1475} {"train_loss": -40.13015365600586, "global_step": 178499, "epoch": 1475} {"train_loss": -40.765663146972656, "global_step": 178500, "epoch": 1475} {"train_loss": -40.11831283569336, "global_step": 178501, "epoch": 1475} {"train_loss": -42.04377365112305, "global_step": 178502, "epoch": 1475} {"train_loss": -40.627567291259766, "global_step": 178503, "epoch": 1475} {"train_loss": -39.065120697021484, "global_step": 178504, "epoch": 1475} {"train_loss": -41.51102828979492, "global_step": 178505, "epoch": 1475} {"train_loss": -40.739322662353516, "global_step": 178506, "epoch": 1475} {"train_loss": -41.72266387939453, "global_step": 178507, "epoch": 1475} {"train_loss": -40.706058502197266, "global_step": 178508, "epoch": 1475} {"train_loss": -41.04265213012695, "global_step": 178509, "epoch": 1475} {"train_loss": -40.56622314453125, "global_step": 178510, "epoch": 1475} {"train_loss": -40.82135009765625, "global_step": 178511, "epoch": 1475} {"train_loss": -41.212615966796875, "global_step": 178512, "epoch": 1475} {"train_loss": -41.41860580444336, "global_step": 178513, "epoch": 1475} {"train_loss": -41.91970443725586, "global_step": 178514, "epoch": 1475} {"train_loss": -41.34314727783203, "global_step": 178515, "epoch": 1475} {"train_loss": -41.76540756225586, "global_step": 178516, "epoch": 1475} {"train_loss": -40.803985595703125, "global_step": 178517, "epoch": 1475} {"train_loss": -28.787073135375977, "global_step": 178518, "epoch": 1475} {"train_loss": -40.66385269165039, "global_step": 178519, "epoch": 1475} {"train_loss": -40.914405822753906, "global_step": 178520, "epoch": 1475} {"train_loss": -40.9747428894043, "global_step": 178521, "epoch": 1475} {"train_loss": -42.086544036865234, "global_step": 178522, "epoch": 1475} {"train_loss": -41.04575729370117, "global_step": 178523, "epoch": 1475} {"train_loss": -41.363250732421875, "global_step": 178524, "epoch": 1475} {"train_loss": -41.2781982421875, "global_step": 178525, "epoch": 1475} {"train_loss": -40.680084228515625, "global_step": 178526, "epoch": 1475} {"train_loss": -40.55473709106445, "global_step": 178527, "epoch": 1475} {"train_loss": -40.004302978515625, "global_step": 178528, "epoch": 1475} {"train_loss": -40.729774475097656, "global_step": 178529, "epoch": 1475} {"train_loss": -41.37487030029297, "global_step": 178530, "epoch": 1475} {"train_loss": -39.849334716796875, "global_step": 178531, "epoch": 1475} {"train_loss": -40.43473434448242, "global_step": 178532, "epoch": 1475} {"train_loss": -40.92034912109375, "global_step": 178533, "epoch": 1475} {"train_loss": -38.9520378112793, "global_step": 178534, "epoch": 1475} {"train_loss": -39.33192443847656, "global_step": 178535, "epoch": 1475} {"train_loss": -37.465484619140625, "global_step": 178536, "epoch": 1475} {"train_loss": -39.69672775268555, "global_step": 178537, "epoch": 1475} {"train_loss": -39.38645553588867, "global_step": 178538, "epoch": 1475} {"train_loss": -40.421607971191406, "global_step": 178539, "epoch": 1475} {"train_loss": -38.483516693115234, "global_step": 178540, "epoch": 1475} {"train_loss": -40.24610900878906, "global_step": 178541, "epoch": 1475} {"train_loss": -40.75798416137695, "global_step": 178542, "epoch": 1475} {"train_loss": -38.95470428466797, "global_step": 178543, "epoch": 1475} {"train_loss": -39.99772262573242, "global_step": 178544, "epoch": 1475} {"train_loss": -36.9712028503418, "global_step": 178545, "epoch": 1475} {"train_loss": -39.6716194152832, "global_step": 178546, "epoch": 1475} {"train_loss": -40.78913497924805, "global_step": 178547, "epoch": 1475} {"train_loss": -40.29290008544922, "global_step": 178548, "epoch": 1475} {"train_loss": -39.53924560546875, "global_step": 178549, "epoch": 1475} {"train_loss": -36.75470733642578, "global_step": 178550, "epoch": 1475} {"train_loss": -39.24005889892578, "global_step": 178551, "epoch": 1475} {"train_loss": -38.824188232421875, "global_step": 178552, "epoch": 1475} {"train_loss": -38.43238067626953, "global_step": 178553, "epoch": 1475} {"train_loss": -40.37841033935547, "global_step": 178554, "epoch": 1475} {"train_loss": -39.35184097290039, "global_step": 178555, "epoch": 1475} {"train_loss": -30.164688110351562, "global_step": 178556, "epoch": 1475} {"train_loss": -40.13010787963867, "global_step": 178557, "epoch": 1475} {"train_loss": -40.348079681396484, "global_step": 178558, "epoch": 1475} {"train_loss": -38.987281799316406, "global_step": 178559, "epoch": 1475} {"train_loss": -37.77604293823242, "global_step": 178560, "epoch": 1475} {"train_loss": -33.44561767578125, "global_step": 178561, "epoch": 1475} {"train_loss": -37.179561614990234, "global_step": 178562, "epoch": 1475} {"train_loss": -37.8845329284668, "global_step": 178563, "epoch": 1475} {"train_loss": -38.53611755371094, "global_step": 178564, "epoch": 1475} {"train_loss": -38.22610092163086, "global_step": 178565, "epoch": 1475} {"train_loss": -39.40841293334961, "global_step": 178566, "epoch": 1475} {"train_loss": -37.27134323120117, "global_step": 178567, "epoch": 1475} {"train_loss": -38.682640075683594, "global_step": 178568, "epoch": 1475} {"train_loss": -37.60749435424805, "global_step": 178569, "epoch": 1475} {"train_loss": -38.1992301940918, "global_step": 178570, "epoch": 1475} {"train_loss": -37.956642150878906, "global_step": 178571, "epoch": 1475} {"train_loss": -39.69404220581055, "global_step": 178572, "epoch": 1475} {"train_loss": -39.9193000793457, "global_step": 178573, "epoch": 1475} {"train_loss": -39.38962173461914, "global_step": 178574, "epoch": 1475} {"train_loss": -36.74626541137695, "global_step": 178575, "epoch": 1475} {"train_loss": -39.29833221435547, "global_step": 178576, "epoch": 1475} {"train_loss": -39.39908981323242, "global_step": 178577, "epoch": 1475} {"train_loss": -39.493133544921875, "global_step": 178578, "epoch": 1475} {"train_loss": -39.996124267578125, "global_step": 178579, "epoch": 1475} {"train_loss": -38.70448303222656, "global_step": 178580, "epoch": 1475} {"train_loss": -38.83251953125, "global_step": 178581, "epoch": 1475} {"train_loss": -39.57313537597656, "global_step": 178582, "epoch": 1475} {"train_loss": -40.19114303588867, "global_step": 178583, "epoch": 1475} {"train_loss": -39.901824951171875, "global_step": 178584, "epoch": 1475} {"train_loss": -39.67873001098633, "global_step": 178585, "epoch": 1475} {"train_loss": -38.6014404296875, "global_step": 178586, "epoch": 1475} {"train_loss": -39.52042007446289, "global_step": 178587, "epoch": 1475} {"train_loss": -39.422420501708984, "global_step": 178588, "epoch": 1475} {"train_loss": -40.1344108581543, "global_step": 178589, "epoch": 1475} {"train_loss": -37.17466735839844, "global_step": 178590, "epoch": 1475} {"train_loss": -39.57359313964844, "global_step": 178591, "epoch": 1475} {"train_loss": -40.671512603759766, "global_step": 178592, "epoch": 1475} {"train_loss": -38.68788528442383, "global_step": 178593, "epoch": 1475} {"train_loss": -39.30540084838867, "global_step": 178594, "epoch": 1475} {"train_loss": -39.83508217236227, "global_step": 178595, "epoch": 1475, "val_loss": 2724614.25} {"train_loss": -38.534881591796875, "global_step": 178596, "epoch": 1476} {"train_loss": -38.39768600463867, "global_step": 178597, "epoch": 1476} {"train_loss": -38.8413200378418, "global_step": 178598, "epoch": 1476} {"train_loss": -37.85770797729492, "global_step": 178599, "epoch": 1476} {"train_loss": -39.86604690551758, "global_step": 178600, "epoch": 1476} {"train_loss": -38.281654357910156, "global_step": 178601, "epoch": 1476} {"train_loss": -39.46311569213867, "global_step": 178602, "epoch": 1476} {"train_loss": -40.428890228271484, "global_step": 178603, "epoch": 1476} {"train_loss": -38.8184814453125, "global_step": 178604, "epoch": 1476} {"train_loss": -39.19976043701172, "global_step": 178605, "epoch": 1476} {"train_loss": -40.05341339111328, "global_step": 178606, "epoch": 1476} {"train_loss": -41.00946044921875, "global_step": 178607, "epoch": 1476} {"train_loss": -37.310359954833984, "global_step": 178608, "epoch": 1476} {"train_loss": -39.94514846801758, "global_step": 178609, "epoch": 1476} {"train_loss": -38.79898452758789, "global_step": 178610, "epoch": 1476} {"train_loss": -39.27139663696289, "global_step": 178611, "epoch": 1476} {"train_loss": -39.97711181640625, "global_step": 178612, "epoch": 1476} {"train_loss": -40.0664176940918, "global_step": 178613, "epoch": 1476} {"train_loss": -40.17719268798828, "global_step": 178614, "epoch": 1476} {"train_loss": -39.842445373535156, "global_step": 178615, "epoch": 1476} {"train_loss": -40.42726516723633, "global_step": 178616, "epoch": 1476} {"train_loss": -37.91351318359375, "global_step": 178617, "epoch": 1476} {"train_loss": -39.802223205566406, "global_step": 178618, "epoch": 1476} {"train_loss": -40.90986251831055, "global_step": 178619, "epoch": 1476} {"train_loss": -39.75860595703125, "global_step": 178620, "epoch": 1476} {"train_loss": -40.10075759887695, "global_step": 178621, "epoch": 1476} {"train_loss": -40.90629196166992, "global_step": 178622, "epoch": 1476} {"train_loss": -38.470149993896484, "global_step": 178623, "epoch": 1476} {"train_loss": -40.58602523803711, "global_step": 178624, "epoch": 1476} {"train_loss": -39.16109085083008, "global_step": 178625, "epoch": 1476} {"train_loss": -39.91366195678711, "global_step": 178626, "epoch": 1476} {"train_loss": -40.65922927856445, "global_step": 178627, "epoch": 1476} {"train_loss": -39.675785064697266, "global_step": 178628, "epoch": 1476} {"train_loss": -40.188751220703125, "global_step": 178629, "epoch": 1476} {"train_loss": -40.27622604370117, "global_step": 178630, "epoch": 1476} {"train_loss": -40.74474334716797, "global_step": 178631, "epoch": 1476} {"train_loss": -39.45308303833008, "global_step": 178632, "epoch": 1476} {"train_loss": -40.1479606628418, "global_step": 178633, "epoch": 1476} {"train_loss": -39.7294807434082, "global_step": 178634, "epoch": 1476} {"train_loss": -40.798683166503906, "global_step": 178635, "epoch": 1476} {"train_loss": -40.394432067871094, "global_step": 178636, "epoch": 1476} {"train_loss": -38.654598236083984, "global_step": 178637, "epoch": 1476} {"train_loss": -41.01958084106445, "global_step": 178638, "epoch": 1476} {"train_loss": -40.98659896850586, "global_step": 178639, "epoch": 1476} {"train_loss": -40.52655792236328, "global_step": 178640, "epoch": 1476} {"train_loss": -40.510459899902344, "global_step": 178641, "epoch": 1476} {"train_loss": -40.097713470458984, "global_step": 178642, "epoch": 1476} {"train_loss": -40.45676040649414, "global_step": 178643, "epoch": 1476} {"train_loss": -40.4119758605957, "global_step": 178644, "epoch": 1476} {"train_loss": -41.08435821533203, "global_step": 178645, "epoch": 1476} {"train_loss": -40.387203216552734, "global_step": 178646, "epoch": 1476} {"train_loss": -40.754642486572266, "global_step": 178647, "epoch": 1476} {"train_loss": -40.30329513549805, "global_step": 178648, "epoch": 1476} {"train_loss": -40.60089111328125, "global_step": 178649, "epoch": 1476} {"train_loss": -40.87660598754883, "global_step": 178650, "epoch": 1476} {"train_loss": -40.87089157104492, "global_step": 178651, "epoch": 1476} {"train_loss": -41.03333282470703, "global_step": 178652, "epoch": 1476} {"train_loss": -39.86863327026367, "global_step": 178653, "epoch": 1476} {"train_loss": -41.22880935668945, "global_step": 178654, "epoch": 1476} {"train_loss": -41.441986083984375, "global_step": 178655, "epoch": 1476} {"train_loss": -41.07339096069336, "global_step": 178656, "epoch": 1476} {"train_loss": -41.359676361083984, "global_step": 178657, "epoch": 1476} {"train_loss": -41.23679733276367, "global_step": 178658, "epoch": 1476} {"train_loss": -40.951839447021484, "global_step": 178659, "epoch": 1476} {"train_loss": -41.345306396484375, "global_step": 178660, "epoch": 1476} {"train_loss": -41.13002014160156, "global_step": 178661, "epoch": 1476} {"train_loss": -41.10441207885742, "global_step": 178662, "epoch": 1476} {"train_loss": -41.76017379760742, "global_step": 178663, "epoch": 1476} {"train_loss": -41.270137786865234, "global_step": 178664, "epoch": 1476} {"train_loss": -41.2131233215332, "global_step": 178665, "epoch": 1476} {"train_loss": -41.715641021728516, "global_step": 178666, "epoch": 1476} {"train_loss": -40.90277099609375, "global_step": 178667, "epoch": 1476} {"train_loss": -41.57322311401367, "global_step": 178668, "epoch": 1476} {"train_loss": -41.52523422241211, "global_step": 178669, "epoch": 1476} {"train_loss": -40.52897262573242, "global_step": 178670, "epoch": 1476} {"train_loss": -41.24715042114258, "global_step": 178671, "epoch": 1476} {"train_loss": -41.53213882446289, "global_step": 178672, "epoch": 1476} {"train_loss": -41.394775390625, "global_step": 178673, "epoch": 1476} {"train_loss": -41.810848236083984, "global_step": 178674, "epoch": 1476} {"train_loss": -41.56150436401367, "global_step": 178675, "epoch": 1476} {"train_loss": -41.42604446411133, "global_step": 178676, "epoch": 1476} {"train_loss": -41.04081344604492, "global_step": 178677, "epoch": 1476} {"train_loss": -40.80535125732422, "global_step": 178678, "epoch": 1476} {"train_loss": -41.105751037597656, "global_step": 178679, "epoch": 1476} {"train_loss": -41.337013244628906, "global_step": 178680, "epoch": 1476} {"train_loss": -41.711666107177734, "global_step": 178681, "epoch": 1476} {"train_loss": -41.851417541503906, "global_step": 178682, "epoch": 1476} {"train_loss": -40.723690032958984, "global_step": 178683, "epoch": 1476} {"train_loss": -41.73099899291992, "global_step": 178684, "epoch": 1476} {"train_loss": -41.8124885559082, "global_step": 178685, "epoch": 1476} {"train_loss": -40.95636749267578, "global_step": 178686, "epoch": 1476} {"train_loss": -41.49634552001953, "global_step": 178687, "epoch": 1476} {"train_loss": -41.477394104003906, "global_step": 178688, "epoch": 1476} {"train_loss": -41.134765625, "global_step": 178689, "epoch": 1476} {"train_loss": -41.650054931640625, "global_step": 178690, "epoch": 1476} {"train_loss": -40.69218063354492, "global_step": 178691, "epoch": 1476} {"train_loss": -40.81670379638672, "global_step": 178692, "epoch": 1476} {"train_loss": -40.27702331542969, "global_step": 178693, "epoch": 1476} {"train_loss": -40.24325180053711, "global_step": 178694, "epoch": 1476} {"train_loss": -40.69024658203125, "global_step": 178695, "epoch": 1476} {"train_loss": -40.7109375, "global_step": 178696, "epoch": 1476} {"train_loss": -39.08298110961914, "global_step": 178697, "epoch": 1476} {"train_loss": -40.31511306762695, "global_step": 178698, "epoch": 1476} {"train_loss": -39.53861618041992, "global_step": 178699, "epoch": 1476} {"train_loss": -40.42766189575195, "global_step": 178700, "epoch": 1476} {"train_loss": -39.85334014892578, "global_step": 178701, "epoch": 1476} {"train_loss": -39.66114044189453, "global_step": 178702, "epoch": 1476} {"train_loss": -40.37063980102539, "global_step": 178703, "epoch": 1476} {"train_loss": -40.475341796875, "global_step": 178704, "epoch": 1476} {"train_loss": -40.59434127807617, "global_step": 178705, "epoch": 1476} {"train_loss": -40.611236572265625, "global_step": 178706, "epoch": 1476} {"train_loss": -39.70554733276367, "global_step": 178707, "epoch": 1476} {"train_loss": -40.32375717163086, "global_step": 178708, "epoch": 1476} {"train_loss": -37.195980072021484, "global_step": 178709, "epoch": 1476} {"train_loss": -34.82008743286133, "global_step": 178710, "epoch": 1476} {"train_loss": -37.55975341796875, "global_step": 178711, "epoch": 1476} {"train_loss": -32.61997604370117, "global_step": 178712, "epoch": 1476} {"train_loss": -36.99481964111328, "global_step": 178713, "epoch": 1476} {"train_loss": -38.31021499633789, "global_step": 178714, "epoch": 1476} {"train_loss": -38.48112487792969, "global_step": 178715, "epoch": 1476} {"train_loss": -40.171055376037096, "global_step": 178716, "epoch": 1476, "val_loss": 2595877.0} {"train_loss": -36.54072189331055, "global_step": 178717, "epoch": 1477} {"train_loss": -38.11753845214844, "global_step": 178718, "epoch": 1477} {"train_loss": -39.77352523803711, "global_step": 178719, "epoch": 1477} {"train_loss": -37.85725784301758, "global_step": 178720, "epoch": 1477} {"train_loss": -38.33180618286133, "global_step": 178721, "epoch": 1477} {"train_loss": -40.07761764526367, "global_step": 178722, "epoch": 1477} {"train_loss": -35.197425842285156, "global_step": 178723, "epoch": 1477} {"train_loss": -39.64432907104492, "global_step": 178724, "epoch": 1477} {"train_loss": -37.860572814941406, "global_step": 178725, "epoch": 1477} {"train_loss": -37.8544807434082, "global_step": 178726, "epoch": 1477} {"train_loss": -38.5537109375, "global_step": 178727, "epoch": 1477} {"train_loss": -39.50316619873047, "global_step": 178728, "epoch": 1477} {"train_loss": -39.51628494262695, "global_step": 178729, "epoch": 1477} {"train_loss": -39.4113655090332, "global_step": 178730, "epoch": 1477} {"train_loss": -39.453407287597656, "global_step": 178731, "epoch": 1477} {"train_loss": -40.26993942260742, "global_step": 178732, "epoch": 1477} {"train_loss": -39.05837631225586, "global_step": 178733, "epoch": 1477} {"train_loss": -40.430084228515625, "global_step": 178734, "epoch": 1477} {"train_loss": -40.097469329833984, "global_step": 178735, "epoch": 1477} {"train_loss": -40.734954833984375, "global_step": 178736, "epoch": 1477} {"train_loss": -40.78203201293945, "global_step": 178737, "epoch": 1477} {"train_loss": -40.2573356628418, "global_step": 178738, "epoch": 1477} {"train_loss": -40.31044387817383, "global_step": 178739, "epoch": 1477} {"train_loss": -39.647735595703125, "global_step": 178740, "epoch": 1477} {"train_loss": -40.209320068359375, "global_step": 178741, "epoch": 1477} {"train_loss": -39.983158111572266, "global_step": 178742, "epoch": 1477} {"train_loss": -40.710235595703125, "global_step": 178743, "epoch": 1477} {"train_loss": -37.14448928833008, "global_step": 178744, "epoch": 1477} {"train_loss": -40.55727767944336, "global_step": 178745, "epoch": 1477} {"train_loss": -39.65604019165039, "global_step": 178746, "epoch": 1477} {"train_loss": -40.34480667114258, "global_step": 178747, "epoch": 1477} {"train_loss": -40.533302307128906, "global_step": 178748, "epoch": 1477} {"train_loss": -37.979339599609375, "global_step": 178749, "epoch": 1477} {"train_loss": -40.36963653564453, "global_step": 178750, "epoch": 1477} {"train_loss": -40.31978225708008, "global_step": 178751, "epoch": 1477} {"train_loss": -39.834205627441406, "global_step": 178752, "epoch": 1477} {"train_loss": -40.86019515991211, "global_step": 178753, "epoch": 1477} {"train_loss": -40.304473876953125, "global_step": 178754, "epoch": 1477} {"train_loss": -40.465553283691406, "global_step": 178755, "epoch": 1477} {"train_loss": -37.29030990600586, "global_step": 178756, "epoch": 1477} {"train_loss": -39.860870361328125, "global_step": 178757, "epoch": 1477} {"train_loss": -40.35065460205078, "global_step": 178758, "epoch": 1477} {"train_loss": -40.31437301635742, "global_step": 178759, "epoch": 1477} {"train_loss": -38.93077850341797, "global_step": 178760, "epoch": 1477} {"train_loss": -40.252044677734375, "global_step": 178761, "epoch": 1477} {"train_loss": -40.08070373535156, "global_step": 178762, "epoch": 1477} {"train_loss": -34.64274978637695, "global_step": 178763, "epoch": 1477} {"train_loss": -37.14278793334961, "global_step": 178764, "epoch": 1477} {"train_loss": -38.65671920776367, "global_step": 178765, "epoch": 1477} {"train_loss": -37.53628921508789, "global_step": 178766, "epoch": 1477} {"train_loss": -39.72329330444336, "global_step": 178767, "epoch": 1477} {"train_loss": -38.990882873535156, "global_step": 178768, "epoch": 1477} {"train_loss": -40.13208770751953, "global_step": 178769, "epoch": 1477} {"train_loss": -39.70205307006836, "global_step": 178770, "epoch": 1477} {"train_loss": -39.22602081298828, "global_step": 178771, "epoch": 1477} {"train_loss": -40.21183395385742, "global_step": 178772, "epoch": 1477} {"train_loss": -38.52229690551758, "global_step": 178773, "epoch": 1477} {"train_loss": -39.59306716918945, "global_step": 178774, "epoch": 1477} {"train_loss": -39.358455657958984, "global_step": 178775, "epoch": 1477} {"train_loss": -39.86933517456055, "global_step": 178776, "epoch": 1477} {"train_loss": -39.15964889526367, "global_step": 178777, "epoch": 1477} {"train_loss": -40.65903854370117, "global_step": 178778, "epoch": 1477} {"train_loss": -39.38637161254883, "global_step": 178779, "epoch": 1477} {"train_loss": -39.93293380737305, "global_step": 178780, "epoch": 1477} {"train_loss": -40.35404968261719, "global_step": 178781, "epoch": 1477} {"train_loss": -39.93773651123047, "global_step": 178782, "epoch": 1477} {"train_loss": -39.9692497253418, "global_step": 178783, "epoch": 1477} {"train_loss": -39.85763931274414, "global_step": 178784, "epoch": 1477} {"train_loss": -41.02226638793945, "global_step": 178785, "epoch": 1477} {"train_loss": -39.139522552490234, "global_step": 178786, "epoch": 1477} {"train_loss": -40.87187576293945, "global_step": 178787, "epoch": 1477} {"train_loss": -41.1503791809082, "global_step": 178788, "epoch": 1477} {"train_loss": -40.86823654174805, "global_step": 178789, "epoch": 1477} {"train_loss": -36.75968551635742, "global_step": 178790, "epoch": 1477} {"train_loss": -40.883338928222656, "global_step": 178791, "epoch": 1477} {"train_loss": -40.0441780090332, "global_step": 178792, "epoch": 1477} {"train_loss": -40.50533676147461, "global_step": 178793, "epoch": 1477} {"train_loss": -40.963134765625, "global_step": 178794, "epoch": 1477} {"train_loss": -41.625850677490234, "global_step": 178795, "epoch": 1477} {"train_loss": -39.6749267578125, "global_step": 178796, "epoch": 1477} {"train_loss": -39.84900665283203, "global_step": 178797, "epoch": 1477} {"train_loss": -35.33543395996094, "global_step": 178798, "epoch": 1477} {"train_loss": -39.12415313720703, "global_step": 178799, "epoch": 1477} {"train_loss": -39.131011962890625, "global_step": 178800, "epoch": 1477} {"train_loss": -40.59299087524414, "global_step": 178801, "epoch": 1477} {"train_loss": -41.135494232177734, "global_step": 178802, "epoch": 1477} {"train_loss": -39.290138244628906, "global_step": 178803, "epoch": 1477} {"train_loss": -39.614349365234375, "global_step": 178804, "epoch": 1477} {"train_loss": -39.55491256713867, "global_step": 178805, "epoch": 1477} {"train_loss": -39.96013641357422, "global_step": 178806, "epoch": 1477} {"train_loss": -40.26897430419922, "global_step": 178807, "epoch": 1477} {"train_loss": -40.1951789855957, "global_step": 178808, "epoch": 1477} {"train_loss": -39.67926788330078, "global_step": 178809, "epoch": 1477} {"train_loss": -40.60581970214844, "global_step": 178810, "epoch": 1477} {"train_loss": -40.096187591552734, "global_step": 178811, "epoch": 1477} {"train_loss": -39.57212448120117, "global_step": 178812, "epoch": 1477} {"train_loss": -40.6822624206543, "global_step": 178813, "epoch": 1477} {"train_loss": -37.9254150390625, "global_step": 178814, "epoch": 1477} {"train_loss": -38.523983001708984, "global_step": 178815, "epoch": 1477} {"train_loss": -40.65583038330078, "global_step": 178816, "epoch": 1477} {"train_loss": -39.466609954833984, "global_step": 178817, "epoch": 1477} {"train_loss": -38.11239242553711, "global_step": 178818, "epoch": 1477} {"train_loss": -41.02132797241211, "global_step": 178819, "epoch": 1477} {"train_loss": -39.924407958984375, "global_step": 178820, "epoch": 1477} {"train_loss": -40.29350662231445, "global_step": 178821, "epoch": 1477} {"train_loss": -40.94609832763672, "global_step": 178822, "epoch": 1477} {"train_loss": -40.744293212890625, "global_step": 178823, "epoch": 1477} {"train_loss": -40.96919250488281, "global_step": 178824, "epoch": 1477} {"train_loss": -41.22566223144531, "global_step": 178825, "epoch": 1477} {"train_loss": -40.302093505859375, "global_step": 178826, "epoch": 1477} {"train_loss": -41.17289352416992, "global_step": 178827, "epoch": 1477} {"train_loss": -40.5438346862793, "global_step": 178828, "epoch": 1477} {"train_loss": -36.73566818237305, "global_step": 178829, "epoch": 1477} {"train_loss": -40.47794723510742, "global_step": 178830, "epoch": 1477} {"train_loss": -39.56510543823242, "global_step": 178831, "epoch": 1477} {"train_loss": -40.918758392333984, "global_step": 178832, "epoch": 1477} {"train_loss": -40.369606018066406, "global_step": 178833, "epoch": 1477} {"train_loss": -41.192596435546875, "global_step": 178834, "epoch": 1477} {"train_loss": -40.800174713134766, "global_step": 178835, "epoch": 1477} {"train_loss": -40.47956466674805, "global_step": 178836, "epoch": 1477} {"train_loss": -39.64121839034656, "global_step": 178837, "epoch": 1477, "val_loss": 2596018.5} {"train_loss": -40.8691291809082, "global_step": 178838, "epoch": 1478} {"train_loss": -39.772216796875, "global_step": 178839, "epoch": 1478} {"train_loss": -38.93272018432617, "global_step": 178840, "epoch": 1478} {"train_loss": -39.269508361816406, "global_step": 178841, "epoch": 1478} {"train_loss": -40.63747787475586, "global_step": 178842, "epoch": 1478} {"train_loss": -41.04289627075195, "global_step": 178843, "epoch": 1478} {"train_loss": -40.910804748535156, "global_step": 178844, "epoch": 1478} {"train_loss": -40.33707046508789, "global_step": 178845, "epoch": 1478} {"train_loss": -41.205108642578125, "global_step": 178846, "epoch": 1478} {"train_loss": -40.28505325317383, "global_step": 178847, "epoch": 1478} {"train_loss": -40.95307540893555, "global_step": 178848, "epoch": 1478} {"train_loss": -39.744964599609375, "global_step": 178849, "epoch": 1478} {"train_loss": -39.91057205200195, "global_step": 178850, "epoch": 1478} {"train_loss": -40.69218826293945, "global_step": 178851, "epoch": 1478} {"train_loss": -40.78293991088867, "global_step": 178852, "epoch": 1478} {"train_loss": -41.32857131958008, "global_step": 178853, "epoch": 1478} {"train_loss": -40.75338363647461, "global_step": 178854, "epoch": 1478} {"train_loss": -41.00777816772461, "global_step": 178855, "epoch": 1478} {"train_loss": -41.080535888671875, "global_step": 178856, "epoch": 1478} {"train_loss": -40.1484375, "global_step": 178857, "epoch": 1478} {"train_loss": -41.15552520751953, "global_step": 178858, "epoch": 1478} {"train_loss": -40.965538024902344, "global_step": 178859, "epoch": 1478} {"train_loss": -40.557167053222656, "global_step": 178860, "epoch": 1478} {"train_loss": -39.280399322509766, "global_step": 178861, "epoch": 1478} {"train_loss": -41.247352600097656, "global_step": 178862, "epoch": 1478} {"train_loss": -40.370826721191406, "global_step": 178863, "epoch": 1478} {"train_loss": -41.03035354614258, "global_step": 178864, "epoch": 1478} {"train_loss": -40.2450065612793, "global_step": 178865, "epoch": 1478} {"train_loss": -38.71546936035156, "global_step": 178866, "epoch": 1478} {"train_loss": -38.684627532958984, "global_step": 178867, "epoch": 1478} {"train_loss": -38.94000244140625, "global_step": 178868, "epoch": 1478} {"train_loss": -40.07229232788086, "global_step": 178869, "epoch": 1478} {"train_loss": -40.613258361816406, "global_step": 178870, "epoch": 1478} {"train_loss": -39.67548751831055, "global_step": 178871, "epoch": 1478} {"train_loss": -38.489654541015625, "global_step": 178872, "epoch": 1478} {"train_loss": -39.226680755615234, "global_step": 178873, "epoch": 1478} {"train_loss": -38.91138458251953, "global_step": 178874, "epoch": 1478} {"train_loss": -37.32023239135742, "global_step": 178875, "epoch": 1478} {"train_loss": -39.83753967285156, "global_step": 178876, "epoch": 1478} {"train_loss": -39.58771896362305, "global_step": 178877, "epoch": 1478} {"train_loss": -37.083065032958984, "global_step": 178878, "epoch": 1478} {"train_loss": -37.13731384277344, "global_step": 178879, "epoch": 1478} {"train_loss": -40.530296325683594, "global_step": 178880, "epoch": 1478} {"train_loss": -39.245418548583984, "global_step": 178881, "epoch": 1478} {"train_loss": -34.93194580078125, "global_step": 178882, "epoch": 1478} {"train_loss": -38.70294952392578, "global_step": 178883, "epoch": 1478} {"train_loss": -40.19755172729492, "global_step": 178884, "epoch": 1478} {"train_loss": -37.411712646484375, "global_step": 178885, "epoch": 1478} {"train_loss": -39.14724349975586, "global_step": 178886, "epoch": 1478} {"train_loss": -40.69108581542969, "global_step": 178887, "epoch": 1478} {"train_loss": -38.90789794921875, "global_step": 178888, "epoch": 1478} {"train_loss": -41.13862228393555, "global_step": 178889, "epoch": 1478} {"train_loss": -38.43589401245117, "global_step": 178890, "epoch": 1478} {"train_loss": -40.041053771972656, "global_step": 178891, "epoch": 1478} {"train_loss": -40.264408111572266, "global_step": 178892, "epoch": 1478} {"train_loss": -37.67928695678711, "global_step": 178893, "epoch": 1478} {"train_loss": -40.083534240722656, "global_step": 178894, "epoch": 1478} {"train_loss": -39.03346633911133, "global_step": 178895, "epoch": 1478} {"train_loss": -38.926570892333984, "global_step": 178896, "epoch": 1478} {"train_loss": -40.73118209838867, "global_step": 178897, "epoch": 1478} {"train_loss": -39.712032318115234, "global_step": 178898, "epoch": 1478} {"train_loss": -39.9586067199707, "global_step": 178899, "epoch": 1478} {"train_loss": -40.22442626953125, "global_step": 178900, "epoch": 1478} {"train_loss": -39.83756637573242, "global_step": 178901, "epoch": 1478} {"train_loss": -40.44498825073242, "global_step": 178902, "epoch": 1478} {"train_loss": -39.59190368652344, "global_step": 178903, "epoch": 1478} {"train_loss": -40.64556121826172, "global_step": 178904, "epoch": 1478} {"train_loss": -40.70025634765625, "global_step": 178905, "epoch": 1478} {"train_loss": -40.96296310424805, "global_step": 178906, "epoch": 1478} {"train_loss": -40.66325759887695, "global_step": 178907, "epoch": 1478} {"train_loss": -40.80904006958008, "global_step": 178908, "epoch": 1478} {"train_loss": -40.28730392456055, "global_step": 178909, "epoch": 1478} {"train_loss": -40.77080535888672, "global_step": 178910, "epoch": 1478} {"train_loss": -40.62742233276367, "global_step": 178911, "epoch": 1478} {"train_loss": -40.926429748535156, "global_step": 178912, "epoch": 1478} {"train_loss": -40.74541473388672, "global_step": 178913, "epoch": 1478} {"train_loss": -40.945045471191406, "global_step": 178914, "epoch": 1478} {"train_loss": -40.95280075073242, "global_step": 178915, "epoch": 1478} {"train_loss": -40.14266586303711, "global_step": 178916, "epoch": 1478} {"train_loss": -40.99605941772461, "global_step": 178917, "epoch": 1478} {"train_loss": -41.1983757019043, "global_step": 178918, "epoch": 1478} {"train_loss": -41.31022262573242, "global_step": 178919, "epoch": 1478} {"train_loss": -39.66559600830078, "global_step": 178920, "epoch": 1478} {"train_loss": -40.292537689208984, "global_step": 178921, "epoch": 1478} {"train_loss": -40.680904388427734, "global_step": 178922, "epoch": 1478} {"train_loss": -40.96358871459961, "global_step": 178923, "epoch": 1478} {"train_loss": -41.10439682006836, "global_step": 178924, "epoch": 1478} {"train_loss": -41.28114318847656, "global_step": 178925, "epoch": 1478} {"train_loss": -40.862281799316406, "global_step": 178926, "epoch": 1478} {"train_loss": -40.97249984741211, "global_step": 178927, "epoch": 1478} {"train_loss": -40.69466018676758, "global_step": 178928, "epoch": 1478} {"train_loss": -37.52867126464844, "global_step": 178929, "epoch": 1478} {"train_loss": -40.483394622802734, "global_step": 178930, "epoch": 1478} {"train_loss": -40.50948715209961, "global_step": 178931, "epoch": 1478} {"train_loss": -41.58425521850586, "global_step": 178932, "epoch": 1478} {"train_loss": -41.00311279296875, "global_step": 178933, "epoch": 1478} {"train_loss": -40.16251754760742, "global_step": 178934, "epoch": 1478} {"train_loss": -40.87104415893555, "global_step": 178935, "epoch": 1478} {"train_loss": -35.25822067260742, "global_step": 178936, "epoch": 1478} {"train_loss": -39.216888427734375, "global_step": 178937, "epoch": 1478} {"train_loss": -36.21383285522461, "global_step": 178938, "epoch": 1478} {"train_loss": -39.30018997192383, "global_step": 178939, "epoch": 1478} {"train_loss": -38.40601348876953, "global_step": 178940, "epoch": 1478} {"train_loss": -38.58712387084961, "global_step": 178941, "epoch": 1478} {"train_loss": -39.15409469604492, "global_step": 178942, "epoch": 1478} {"train_loss": -40.07377243041992, "global_step": 178943, "epoch": 1478} {"train_loss": -37.727691650390625, "global_step": 178944, "epoch": 1478} {"train_loss": -36.45785140991211, "global_step": 178945, "epoch": 1478} {"train_loss": -40.408138275146484, "global_step": 178946, "epoch": 1478} {"train_loss": -38.22529220581055, "global_step": 178947, "epoch": 1478} {"train_loss": -37.510719299316406, "global_step": 178948, "epoch": 1478} {"train_loss": -33.529964447021484, "global_step": 178949, "epoch": 1478} {"train_loss": -34.90786361694336, "global_step": 178950, "epoch": 1478} {"train_loss": -30.82086753845215, "global_step": 178951, "epoch": 1478} {"train_loss": -35.712989807128906, "global_step": 178952, "epoch": 1478} {"train_loss": -35.920379638671875, "global_step": 178953, "epoch": 1478} {"train_loss": -27.807172775268555, "global_step": 178954, "epoch": 1478} {"train_loss": -33.33759307861328, "global_step": 178955, "epoch": 1478} {"train_loss": -33.53120040893555, "global_step": 178956, "epoch": 1478} {"train_loss": -36.734893798828125, "global_step": 178957, "epoch": 1478} {"train_loss": -39.242842603320916, "global_step": 178958, "epoch": 1478, "val_loss": 2956592.0} {"train_loss": -37.860164642333984, "global_step": 178959, "epoch": 1479} {"train_loss": -35.87446212768555, "global_step": 178960, "epoch": 1479} {"train_loss": -38.22745895385742, "global_step": 178961, "epoch": 1479} {"train_loss": -36.1553840637207, "global_step": 178962, "epoch": 1479} {"train_loss": -31.691608428955078, "global_step": 178963, "epoch": 1479} {"train_loss": -35.103424072265625, "global_step": 178964, "epoch": 1479} {"train_loss": -33.867652893066406, "global_step": 178965, "epoch": 1479} {"train_loss": -28.592926025390625, "global_step": 178966, "epoch": 1479} {"train_loss": -34.99844741821289, "global_step": 178967, "epoch": 1479} {"train_loss": -34.266273498535156, "global_step": 178968, "epoch": 1479} {"train_loss": -37.19122314453125, "global_step": 178969, "epoch": 1479} {"train_loss": -36.111751556396484, "global_step": 178970, "epoch": 1479} {"train_loss": -36.60903549194336, "global_step": 178971, "epoch": 1479} {"train_loss": -37.869319915771484, "global_step": 178972, "epoch": 1479} {"train_loss": -36.387725830078125, "global_step": 178973, "epoch": 1479} {"train_loss": -37.363502502441406, "global_step": 178974, "epoch": 1479} {"train_loss": -34.80973434448242, "global_step": 178975, "epoch": 1479} {"train_loss": -34.809974670410156, "global_step": 178976, "epoch": 1479} {"train_loss": -37.631900787353516, "global_step": 178977, "epoch": 1479} {"train_loss": -37.96210479736328, "global_step": 178978, "epoch": 1479} {"train_loss": -36.57470703125, "global_step": 178979, "epoch": 1479} {"train_loss": -37.77903366088867, "global_step": 178980, "epoch": 1479} {"train_loss": -38.043758392333984, "global_step": 178981, "epoch": 1479} {"train_loss": -37.05124282836914, "global_step": 178982, "epoch": 1479} {"train_loss": -38.71555709838867, "global_step": 178983, "epoch": 1479} {"train_loss": -38.134185791015625, "global_step": 178984, "epoch": 1479} {"train_loss": -36.849578857421875, "global_step": 178985, "epoch": 1479} {"train_loss": -39.12093734741211, "global_step": 178986, "epoch": 1479} {"train_loss": -37.4115104675293, "global_step": 178987, "epoch": 1479} {"train_loss": -38.51216506958008, "global_step": 178988, "epoch": 1479} {"train_loss": -38.55454635620117, "global_step": 178989, "epoch": 1479} {"train_loss": -38.572566986083984, "global_step": 178990, "epoch": 1479} {"train_loss": -38.50254440307617, "global_step": 178991, "epoch": 1479} {"train_loss": -37.93106460571289, "global_step": 178992, "epoch": 1479} {"train_loss": -38.95724105834961, "global_step": 178993, "epoch": 1479} {"train_loss": -38.28672409057617, "global_step": 178994, "epoch": 1479} {"train_loss": -38.413970947265625, "global_step": 178995, "epoch": 1479} {"train_loss": -39.05814743041992, "global_step": 178996, "epoch": 1479} {"train_loss": -38.39168167114258, "global_step": 178997, "epoch": 1479} {"train_loss": -38.18412399291992, "global_step": 178998, "epoch": 1479} {"train_loss": -39.19538497924805, "global_step": 178999, "epoch": 1479} {"train_loss": -39.04248809814453, "global_step": 179000, "epoch": 1479} {"train_loss": -39.07026290893555, "global_step": 179001, "epoch": 1479} {"train_loss": -38.84382247924805, "global_step": 179002, "epoch": 1479} {"train_loss": -38.831111907958984, "global_step": 179003, "epoch": 1479} {"train_loss": -38.71439743041992, "global_step": 179004, "epoch": 1479} {"train_loss": -39.41781234741211, "global_step": 179005, "epoch": 1479} {"train_loss": -38.10915756225586, "global_step": 179006, "epoch": 1479} {"train_loss": -39.346187591552734, "global_step": 179007, "epoch": 1479} {"train_loss": -39.60079574584961, "global_step": 179008, "epoch": 1479} {"train_loss": -39.141448974609375, "global_step": 179009, "epoch": 1479} {"train_loss": -39.960506439208984, "global_step": 179010, "epoch": 1479} {"train_loss": -39.755558013916016, "global_step": 179011, "epoch": 1479} {"train_loss": -39.65363693237305, "global_step": 179012, "epoch": 1479} {"train_loss": -39.38544845581055, "global_step": 179013, "epoch": 1479} {"train_loss": -40.13692092895508, "global_step": 179014, "epoch": 1479} {"train_loss": -40.149871826171875, "global_step": 179015, "epoch": 1479} {"train_loss": -39.89608383178711, "global_step": 179016, "epoch": 1479} {"train_loss": -39.8902587890625, "global_step": 179017, "epoch": 1479} {"train_loss": -38.577301025390625, "global_step": 179018, "epoch": 1479} {"train_loss": -38.73148727416992, "global_step": 179019, "epoch": 1479} {"train_loss": -39.516475677490234, "global_step": 179020, "epoch": 1479} {"train_loss": -39.84735870361328, "global_step": 179021, "epoch": 1479} {"train_loss": -40.02387619018555, "global_step": 179022, "epoch": 1479} {"train_loss": -40.122947692871094, "global_step": 179023, "epoch": 1479} {"train_loss": -40.05122756958008, "global_step": 179024, "epoch": 1479} {"train_loss": -39.300819396972656, "global_step": 179025, "epoch": 1479} {"train_loss": -39.7823600769043, "global_step": 179026, "epoch": 1479} {"train_loss": -40.32792663574219, "global_step": 179027, "epoch": 1479} {"train_loss": -40.325313568115234, "global_step": 179028, "epoch": 1479} {"train_loss": -37.4381217956543, "global_step": 179029, "epoch": 1479} {"train_loss": -39.7384147644043, "global_step": 179030, "epoch": 1479} {"train_loss": -40.39607620239258, "global_step": 179031, "epoch": 1479} {"train_loss": -39.66065216064453, "global_step": 179032, "epoch": 1479} {"train_loss": -39.76874542236328, "global_step": 179033, "epoch": 1479} {"train_loss": -39.93341064453125, "global_step": 179034, "epoch": 1479} {"train_loss": -39.90481185913086, "global_step": 179035, "epoch": 1479} {"train_loss": -40.53575134277344, "global_step": 179036, "epoch": 1479} {"train_loss": -39.62179183959961, "global_step": 179037, "epoch": 1479} {"train_loss": -39.90700149536133, "global_step": 179038, "epoch": 1479} {"train_loss": -40.047550201416016, "global_step": 179039, "epoch": 1479} {"train_loss": -40.83104705810547, "global_step": 179040, "epoch": 1479} {"train_loss": -40.149166107177734, "global_step": 179041, "epoch": 1479} {"train_loss": -40.50429916381836, "global_step": 179042, "epoch": 1479} {"train_loss": -39.036842346191406, "global_step": 179043, "epoch": 1479} {"train_loss": -40.302146911621094, "global_step": 179044, "epoch": 1479} {"train_loss": -41.1233024597168, "global_step": 179045, "epoch": 1479} {"train_loss": -40.09386444091797, "global_step": 179046, "epoch": 1479} {"train_loss": -40.1291389465332, "global_step": 179047, "epoch": 1479} {"train_loss": -40.710723876953125, "global_step": 179048, "epoch": 1479} {"train_loss": -40.741966247558594, "global_step": 179049, "epoch": 1479} {"train_loss": -40.3150520324707, "global_step": 179050, "epoch": 1479} {"train_loss": -40.63277816772461, "global_step": 179051, "epoch": 1479} {"train_loss": -40.49259948730469, "global_step": 179052, "epoch": 1479} {"train_loss": -40.61627197265625, "global_step": 179053, "epoch": 1479} {"train_loss": -40.83313751220703, "global_step": 179054, "epoch": 1479} {"train_loss": -40.77088928222656, "global_step": 179055, "epoch": 1479} {"train_loss": -41.47727966308594, "global_step": 179056, "epoch": 1479} {"train_loss": -41.451107025146484, "global_step": 179057, "epoch": 1479} {"train_loss": -40.631351470947266, "global_step": 179058, "epoch": 1479} {"train_loss": -40.429412841796875, "global_step": 179059, "epoch": 1479} {"train_loss": -40.155860900878906, "global_step": 179060, "epoch": 1479} {"train_loss": -40.52092361450195, "global_step": 179061, "epoch": 1479} {"train_loss": -39.878108978271484, "global_step": 179062, "epoch": 1479} {"train_loss": -41.1925163269043, "global_step": 179063, "epoch": 1479} {"train_loss": -41.31692123413086, "global_step": 179064, "epoch": 1479} {"train_loss": -40.80374526977539, "global_step": 179065, "epoch": 1479} {"train_loss": -40.49516677856445, "global_step": 179066, "epoch": 1479} {"train_loss": -41.06879425048828, "global_step": 179067, "epoch": 1479} {"train_loss": -40.75489044189453, "global_step": 179068, "epoch": 1479} {"train_loss": -40.87137985229492, "global_step": 179069, "epoch": 1479} {"train_loss": -41.077980041503906, "global_step": 179070, "epoch": 1479} {"train_loss": -41.39689636230469, "global_step": 179071, "epoch": 1479} {"train_loss": -40.685054779052734, "global_step": 179072, "epoch": 1479} {"train_loss": -41.08182907104492, "global_step": 179073, "epoch": 1479} {"train_loss": -40.4061279296875, "global_step": 179074, "epoch": 1479} {"train_loss": -40.48185348510742, "global_step": 179075, "epoch": 1479} {"train_loss": -40.7489128112793, "global_step": 179076, "epoch": 1479} {"train_loss": -40.06770706176758, "global_step": 179077, "epoch": 1479} {"train_loss": -41.55463409423828, "global_step": 179078, "epoch": 1479} {"train_loss": -39.04522374050676, "global_step": 179079, "epoch": 1479, "val_loss": 2667686.0} {"train_loss": -40.66864013671875, "global_step": 179080, "epoch": 1480} {"train_loss": -41.07821273803711, "global_step": 179081, "epoch": 1480} {"train_loss": -41.10076141357422, "global_step": 179082, "epoch": 1480} {"train_loss": -40.826263427734375, "global_step": 179083, "epoch": 1480} {"train_loss": -40.604400634765625, "global_step": 179084, "epoch": 1480} {"train_loss": -40.81826400756836, "global_step": 179085, "epoch": 1480} {"train_loss": -40.71554183959961, "global_step": 179086, "epoch": 1480} {"train_loss": -40.942317962646484, "global_step": 179087, "epoch": 1480} {"train_loss": -40.9002799987793, "global_step": 179088, "epoch": 1480} {"train_loss": -41.1107177734375, "global_step": 179089, "epoch": 1480} {"train_loss": -41.07685470581055, "global_step": 179090, "epoch": 1480} {"train_loss": -41.042598724365234, "global_step": 179091, "epoch": 1480} {"train_loss": -41.93299102783203, "global_step": 179092, "epoch": 1480} {"train_loss": -40.584083557128906, "global_step": 179093, "epoch": 1480} {"train_loss": -40.55091094970703, "global_step": 179094, "epoch": 1480} {"train_loss": -41.19169235229492, "global_step": 179095, "epoch": 1480} {"train_loss": -41.06667709350586, "global_step": 179096, "epoch": 1480} {"train_loss": -41.16842269897461, "global_step": 179097, "epoch": 1480} {"train_loss": -40.59711837768555, "global_step": 179098, "epoch": 1480} {"train_loss": -41.195858001708984, "global_step": 179099, "epoch": 1480} {"train_loss": -40.411956787109375, "global_step": 179100, "epoch": 1480} {"train_loss": -41.52071762084961, "global_step": 179101, "epoch": 1480} {"train_loss": -40.43009567260742, "global_step": 179102, "epoch": 1480} {"train_loss": -40.76359939575195, "global_step": 179103, "epoch": 1480} {"train_loss": -40.63770294189453, "global_step": 179104, "epoch": 1480} {"train_loss": -40.73443603515625, "global_step": 179105, "epoch": 1480} {"train_loss": -41.140403747558594, "global_step": 179106, "epoch": 1480} {"train_loss": -40.029579162597656, "global_step": 179107, "epoch": 1480} {"train_loss": -37.86848068237305, "global_step": 179108, "epoch": 1480} {"train_loss": -39.98433303833008, "global_step": 179109, "epoch": 1480} {"train_loss": -39.82075119018555, "global_step": 179110, "epoch": 1480} {"train_loss": -40.916683197021484, "global_step": 179111, "epoch": 1480} {"train_loss": -40.486488342285156, "global_step": 179112, "epoch": 1480} {"train_loss": -40.198760986328125, "global_step": 179113, "epoch": 1480} {"train_loss": -39.16424560546875, "global_step": 179114, "epoch": 1480} {"train_loss": -38.427528381347656, "global_step": 179115, "epoch": 1480} {"train_loss": -40.384117126464844, "global_step": 179116, "epoch": 1480} {"train_loss": -40.40437698364258, "global_step": 179117, "epoch": 1480} {"train_loss": -40.0442008972168, "global_step": 179118, "epoch": 1480} {"train_loss": -39.339027404785156, "global_step": 179119, "epoch": 1480} {"train_loss": -38.026798248291016, "global_step": 179120, "epoch": 1480} {"train_loss": -34.60122299194336, "global_step": 179121, "epoch": 1480} {"train_loss": -36.50199508666992, "global_step": 179122, "epoch": 1480} {"train_loss": -39.67948532104492, "global_step": 179123, "epoch": 1480} {"train_loss": -39.41554260253906, "global_step": 179124, "epoch": 1480} {"train_loss": -38.2931022644043, "global_step": 179125, "epoch": 1480} {"train_loss": -37.431880950927734, "global_step": 179126, "epoch": 1480} {"train_loss": -37.70859909057617, "global_step": 179127, "epoch": 1480} {"train_loss": -40.9312629699707, "global_step": 179128, "epoch": 1480} {"train_loss": -39.50510787963867, "global_step": 179129, "epoch": 1480} {"train_loss": -39.125457763671875, "global_step": 179130, "epoch": 1480} {"train_loss": -39.97279357910156, "global_step": 179131, "epoch": 1480} {"train_loss": -39.390602111816406, "global_step": 179132, "epoch": 1480} {"train_loss": -38.47773361206055, "global_step": 179133, "epoch": 1480} {"train_loss": -40.35346221923828, "global_step": 179134, "epoch": 1480} {"train_loss": -40.100582122802734, "global_step": 179135, "epoch": 1480} {"train_loss": -39.861141204833984, "global_step": 179136, "epoch": 1480} {"train_loss": -40.26241683959961, "global_step": 179137, "epoch": 1480} {"train_loss": -40.48714065551758, "global_step": 179138, "epoch": 1480} {"train_loss": -39.895751953125, "global_step": 179139, "epoch": 1480} {"train_loss": -40.25263595581055, "global_step": 179140, "epoch": 1480} {"train_loss": -40.20813751220703, "global_step": 179141, "epoch": 1480} {"train_loss": -40.63237380981445, "global_step": 179142, "epoch": 1480} {"train_loss": -40.084590911865234, "global_step": 179143, "epoch": 1480} {"train_loss": -40.15769577026367, "global_step": 179144, "epoch": 1480} {"train_loss": -39.970703125, "global_step": 179145, "epoch": 1480} {"train_loss": -40.74134826660156, "global_step": 179146, "epoch": 1480} {"train_loss": -40.097747802734375, "global_step": 179147, "epoch": 1480} {"train_loss": -40.5860710144043, "global_step": 179148, "epoch": 1480} {"train_loss": -40.39632797241211, "global_step": 179149, "epoch": 1480} {"train_loss": -40.4820671081543, "global_step": 179150, "epoch": 1480} {"train_loss": -39.84713363647461, "global_step": 179151, "epoch": 1480} {"train_loss": -41.01552200317383, "global_step": 179152, "epoch": 1480} {"train_loss": -40.328060150146484, "global_step": 179153, "epoch": 1480} {"train_loss": -40.843055725097656, "global_step": 179154, "epoch": 1480} {"train_loss": -39.84919357299805, "global_step": 179155, "epoch": 1480} {"train_loss": -40.535400390625, "global_step": 179156, "epoch": 1480} {"train_loss": -40.23377990722656, "global_step": 179157, "epoch": 1480} {"train_loss": -40.327728271484375, "global_step": 179158, "epoch": 1480} {"train_loss": -41.345760345458984, "global_step": 179159, "epoch": 1480} {"train_loss": -41.24711227416992, "global_step": 179160, "epoch": 1480} {"train_loss": -40.96522903442383, "global_step": 179161, "epoch": 1480} {"train_loss": -41.36550521850586, "global_step": 179162, "epoch": 1480} {"train_loss": -40.96996307373047, "global_step": 179163, "epoch": 1480} {"train_loss": -40.44619369506836, "global_step": 179164, "epoch": 1480} {"train_loss": -41.67071533203125, "global_step": 179165, "epoch": 1480} {"train_loss": -40.21211624145508, "global_step": 179166, "epoch": 1480} {"train_loss": -39.206024169921875, "global_step": 179167, "epoch": 1480} {"train_loss": -40.70002365112305, "global_step": 179168, "epoch": 1480} {"train_loss": -41.088165283203125, "global_step": 179169, "epoch": 1480} {"train_loss": -40.513710021972656, "global_step": 179170, "epoch": 1480} {"train_loss": -39.8900260925293, "global_step": 179171, "epoch": 1480} {"train_loss": -40.79173278808594, "global_step": 179172, "epoch": 1480} {"train_loss": -40.72727966308594, "global_step": 179173, "epoch": 1480} {"train_loss": -41.17823028564453, "global_step": 179174, "epoch": 1480} {"train_loss": -39.62815475463867, "global_step": 179175, "epoch": 1480} {"train_loss": -39.55500411987305, "global_step": 179176, "epoch": 1480} {"train_loss": -40.3529052734375, "global_step": 179177, "epoch": 1480} {"train_loss": -40.95497512817383, "global_step": 179178, "epoch": 1480} {"train_loss": -41.58053207397461, "global_step": 179179, "epoch": 1480} {"train_loss": -40.22722244262695, "global_step": 179180, "epoch": 1480} {"train_loss": -40.0677490234375, "global_step": 179181, "epoch": 1480} {"train_loss": -39.51611328125, "global_step": 179182, "epoch": 1480} {"train_loss": -39.5704460144043, "global_step": 179183, "epoch": 1480} {"train_loss": -39.634273529052734, "global_step": 179184, "epoch": 1480} {"train_loss": -40.05086135864258, "global_step": 179185, "epoch": 1480} {"train_loss": -41.163551330566406, "global_step": 179186, "epoch": 1480} {"train_loss": -39.427215576171875, "global_step": 179187, "epoch": 1480} {"train_loss": -40.3215217590332, "global_step": 179188, "epoch": 1480} {"train_loss": -40.864749908447266, "global_step": 179189, "epoch": 1480} {"train_loss": -40.67023468017578, "global_step": 179190, "epoch": 1480} {"train_loss": -38.29258346557617, "global_step": 179191, "epoch": 1480} {"train_loss": -40.810543060302734, "global_step": 179192, "epoch": 1480} {"train_loss": -41.261043548583984, "global_step": 179193, "epoch": 1480} {"train_loss": -40.525081634521484, "global_step": 179194, "epoch": 1480} {"train_loss": -41.36350631713867, "global_step": 179195, "epoch": 1480} {"train_loss": -40.675716400146484, "global_step": 179196, "epoch": 1480} {"train_loss": -41.1769905090332, "global_step": 179197, "epoch": 1480} {"train_loss": -41.77775573730469, "global_step": 179198, "epoch": 1480} {"train_loss": -40.75624465942383, "global_step": 179199, "epoch": 1480} {"train_loss": -40.25800008222091, "global_step": 179200, "epoch": 1480, "val_loss": 2769796.75} {"train_loss": -41.62826156616211, "global_step": 179201, "epoch": 1481} {"train_loss": -41.270118713378906, "global_step": 179202, "epoch": 1481} {"train_loss": -39.52467346191406, "global_step": 179203, "epoch": 1481} {"train_loss": -41.64741516113281, "global_step": 179204, "epoch": 1481} {"train_loss": -40.6097297668457, "global_step": 179205, "epoch": 1481} {"train_loss": -41.05347442626953, "global_step": 179206, "epoch": 1481} {"train_loss": -39.90553665161133, "global_step": 179207, "epoch": 1481} {"train_loss": -40.0331916809082, "global_step": 179208, "epoch": 1481} {"train_loss": -41.321533203125, "global_step": 179209, "epoch": 1481} {"train_loss": -41.25361251831055, "global_step": 179210, "epoch": 1481} {"train_loss": -40.83711624145508, "global_step": 179211, "epoch": 1481} {"train_loss": -40.13968276977539, "global_step": 179212, "epoch": 1481} {"train_loss": -41.48188400268555, "global_step": 179213, "epoch": 1481} {"train_loss": -40.52928161621094, "global_step": 179214, "epoch": 1481} {"train_loss": -41.29539108276367, "global_step": 179215, "epoch": 1481} {"train_loss": -40.697811126708984, "global_step": 179216, "epoch": 1481} {"train_loss": -40.81416702270508, "global_step": 179217, "epoch": 1481} {"train_loss": -41.662994384765625, "global_step": 179218, "epoch": 1481} {"train_loss": -41.06980514526367, "global_step": 179219, "epoch": 1481} {"train_loss": -40.4284782409668, "global_step": 179220, "epoch": 1481} {"train_loss": -39.802730560302734, "global_step": 179221, "epoch": 1481} {"train_loss": -41.17428970336914, "global_step": 179222, "epoch": 1481} {"train_loss": -41.280147552490234, "global_step": 179223, "epoch": 1481} {"train_loss": -40.26557540893555, "global_step": 179224, "epoch": 1481} {"train_loss": -41.80419921875, "global_step": 179225, "epoch": 1481} {"train_loss": -40.030181884765625, "global_step": 179226, "epoch": 1481} {"train_loss": -41.50995635986328, "global_step": 179227, "epoch": 1481} {"train_loss": -40.73992156982422, "global_step": 179228, "epoch": 1481} {"train_loss": -39.84151840209961, "global_step": 179229, "epoch": 1481} {"train_loss": -40.878143310546875, "global_step": 179230, "epoch": 1481} {"train_loss": -39.786556243896484, "global_step": 179231, "epoch": 1481} {"train_loss": -37.72370147705078, "global_step": 179232, "epoch": 1481} {"train_loss": -38.89929962158203, "global_step": 179233, "epoch": 1481} {"train_loss": -38.31064987182617, "global_step": 179234, "epoch": 1481} {"train_loss": -40.00859451293945, "global_step": 179235, "epoch": 1481} {"train_loss": -39.48270797729492, "global_step": 179236, "epoch": 1481} {"train_loss": -40.02924728393555, "global_step": 179237, "epoch": 1481} {"train_loss": -40.6665153503418, "global_step": 179238, "epoch": 1481} {"train_loss": -35.0687370300293, "global_step": 179239, "epoch": 1481} {"train_loss": -39.508541107177734, "global_step": 179240, "epoch": 1481} {"train_loss": -39.35517501831055, "global_step": 179241, "epoch": 1481} {"train_loss": -39.793338775634766, "global_step": 179242, "epoch": 1481} {"train_loss": -34.81406784057617, "global_step": 179243, "epoch": 1481} {"train_loss": -34.60178756713867, "global_step": 179244, "epoch": 1481} {"train_loss": -38.1297607421875, "global_step": 179245, "epoch": 1481} {"train_loss": -40.489192962646484, "global_step": 179246, "epoch": 1481} {"train_loss": -39.02244567871094, "global_step": 179247, "epoch": 1481} {"train_loss": -39.20149612426758, "global_step": 179248, "epoch": 1481} {"train_loss": -32.74030685424805, "global_step": 179249, "epoch": 1481} {"train_loss": -37.2761116027832, "global_step": 179250, "epoch": 1481} {"train_loss": -38.90719223022461, "global_step": 179251, "epoch": 1481} {"train_loss": -39.87174606323242, "global_step": 179252, "epoch": 1481} {"train_loss": -39.517757415771484, "global_step": 179253, "epoch": 1481} {"train_loss": -40.546722412109375, "global_step": 179254, "epoch": 1481} {"train_loss": -38.36833572387695, "global_step": 179255, "epoch": 1481} {"train_loss": -40.822959899902344, "global_step": 179256, "epoch": 1481} {"train_loss": -38.96964645385742, "global_step": 179257, "epoch": 1481} {"train_loss": -39.80752944946289, "global_step": 179258, "epoch": 1481} {"train_loss": -39.7033805847168, "global_step": 179259, "epoch": 1481} {"train_loss": -38.69987106323242, "global_step": 179260, "epoch": 1481} {"train_loss": -40.12056350708008, "global_step": 179261, "epoch": 1481} {"train_loss": -39.120235443115234, "global_step": 179262, "epoch": 1481} {"train_loss": -39.65725326538086, "global_step": 179263, "epoch": 1481} {"train_loss": -35.27401351928711, "global_step": 179264, "epoch": 1481} {"train_loss": -38.40578842163086, "global_step": 179265, "epoch": 1481} {"train_loss": -39.74280548095703, "global_step": 179266, "epoch": 1481} {"train_loss": -37.153587341308594, "global_step": 179267, "epoch": 1481} {"train_loss": -40.39364242553711, "global_step": 179268, "epoch": 1481} {"train_loss": -39.16590118408203, "global_step": 179269, "epoch": 1481} {"train_loss": -37.28248977661133, "global_step": 179270, "epoch": 1481} {"train_loss": -40.106231689453125, "global_step": 179271, "epoch": 1481} {"train_loss": -38.39961624145508, "global_step": 179272, "epoch": 1481} {"train_loss": -37.97393035888672, "global_step": 179273, "epoch": 1481} {"train_loss": -39.100563049316406, "global_step": 179274, "epoch": 1481} {"train_loss": -39.63295364379883, "global_step": 179275, "epoch": 1481} {"train_loss": -39.62895202636719, "global_step": 179276, "epoch": 1481} {"train_loss": -39.518096923828125, "global_step": 179277, "epoch": 1481} {"train_loss": -40.74964141845703, "global_step": 179278, "epoch": 1481} {"train_loss": -38.223880767822266, "global_step": 179279, "epoch": 1481} {"train_loss": -39.088775634765625, "global_step": 179280, "epoch": 1481} {"train_loss": -38.90097427368164, "global_step": 179281, "epoch": 1481} {"train_loss": -40.78125, "global_step": 179282, "epoch": 1481} {"train_loss": -40.03345489501953, "global_step": 179283, "epoch": 1481} {"train_loss": -39.942012786865234, "global_step": 179284, "epoch": 1481} {"train_loss": -39.37384796142578, "global_step": 179285, "epoch": 1481} {"train_loss": -40.31596755981445, "global_step": 179286, "epoch": 1481} {"train_loss": -40.10418701171875, "global_step": 179287, "epoch": 1481} {"train_loss": -40.21254348754883, "global_step": 179288, "epoch": 1481} {"train_loss": -40.53387451171875, "global_step": 179289, "epoch": 1481} {"train_loss": -40.21120834350586, "global_step": 179290, "epoch": 1481} {"train_loss": -39.32146453857422, "global_step": 179291, "epoch": 1481} {"train_loss": -39.89934158325195, "global_step": 179292, "epoch": 1481} {"train_loss": -40.26291275024414, "global_step": 179293, "epoch": 1481} {"train_loss": -39.261226654052734, "global_step": 179294, "epoch": 1481} {"train_loss": -39.97848129272461, "global_step": 179295, "epoch": 1481} {"train_loss": -39.98100280761719, "global_step": 179296, "epoch": 1481} {"train_loss": -40.25044631958008, "global_step": 179297, "epoch": 1481} {"train_loss": -39.749820709228516, "global_step": 179298, "epoch": 1481} {"train_loss": -40.323158264160156, "global_step": 179299, "epoch": 1481} {"train_loss": -39.81116485595703, "global_step": 179300, "epoch": 1481} {"train_loss": -39.93278121948242, "global_step": 179301, "epoch": 1481} {"train_loss": -40.57666778564453, "global_step": 179302, "epoch": 1481} {"train_loss": -40.43349075317383, "global_step": 179303, "epoch": 1481} {"train_loss": -39.990787506103516, "global_step": 179304, "epoch": 1481} {"train_loss": -40.641963958740234, "global_step": 179305, "epoch": 1481} {"train_loss": -41.04054641723633, "global_step": 179306, "epoch": 1481} {"train_loss": -40.52848434448242, "global_step": 179307, "epoch": 1481} {"train_loss": -40.8388786315918, "global_step": 179308, "epoch": 1481} {"train_loss": -40.75513458251953, "global_step": 179309, "epoch": 1481} {"train_loss": -40.717193603515625, "global_step": 179310, "epoch": 1481} {"train_loss": -40.71626663208008, "global_step": 179311, "epoch": 1481} {"train_loss": -40.771114349365234, "global_step": 179312, "epoch": 1481} {"train_loss": -40.23686218261719, "global_step": 179313, "epoch": 1481} {"train_loss": -40.55268478393555, "global_step": 179314, "epoch": 1481} {"train_loss": -39.147220611572266, "global_step": 179315, "epoch": 1481} {"train_loss": -41.20478057861328, "global_step": 179316, "epoch": 1481} {"train_loss": -39.85007858276367, "global_step": 179317, "epoch": 1481} {"train_loss": -39.83713912963867, "global_step": 179318, "epoch": 1481} {"train_loss": -41.09525680541992, "global_step": 179319, "epoch": 1481} {"train_loss": -41.252281188964844, "global_step": 179320, "epoch": 1481} {"train_loss": -39.77723693847656, "global_step": 179321, "epoch": 1481, "val_loss": 3284796.75} {"train_loss": -39.687740325927734, "global_step": 179322, "epoch": 1482} {"train_loss": -40.806922912597656, "global_step": 179323, "epoch": 1482} {"train_loss": -41.0407829284668, "global_step": 179324, "epoch": 1482} {"train_loss": -40.62809371948242, "global_step": 179325, "epoch": 1482} {"train_loss": -40.6622428894043, "global_step": 179326, "epoch": 1482} {"train_loss": -40.72910690307617, "global_step": 179327, "epoch": 1482} {"train_loss": -38.99207305908203, "global_step": 179328, "epoch": 1482} {"train_loss": -41.44504928588867, "global_step": 179329, "epoch": 1482} {"train_loss": -39.55670928955078, "global_step": 179330, "epoch": 1482} {"train_loss": -40.915382385253906, "global_step": 179331, "epoch": 1482} {"train_loss": -39.180206298828125, "global_step": 179332, "epoch": 1482} {"train_loss": -40.69159698486328, "global_step": 179333, "epoch": 1482} {"train_loss": -41.8255615234375, "global_step": 179334, "epoch": 1482} {"train_loss": -40.25594711303711, "global_step": 179335, "epoch": 1482} {"train_loss": -40.224334716796875, "global_step": 179336, "epoch": 1482} {"train_loss": -41.468727111816406, "global_step": 179337, "epoch": 1482} {"train_loss": -40.90671920776367, "global_step": 179338, "epoch": 1482} {"train_loss": -41.08005905151367, "global_step": 179339, "epoch": 1482} {"train_loss": -39.99870681762695, "global_step": 179340, "epoch": 1482} {"train_loss": -40.8627815246582, "global_step": 179341, "epoch": 1482} {"train_loss": -41.44348907470703, "global_step": 179342, "epoch": 1482} {"train_loss": -41.1021842956543, "global_step": 179343, "epoch": 1482} {"train_loss": -40.96024703979492, "global_step": 179344, "epoch": 1482} {"train_loss": -39.45116424560547, "global_step": 179345, "epoch": 1482} {"train_loss": -36.84349060058594, "global_step": 179346, "epoch": 1482} {"train_loss": -40.272499084472656, "global_step": 179347, "epoch": 1482} {"train_loss": -40.247718811035156, "global_step": 179348, "epoch": 1482} {"train_loss": -40.94065475463867, "global_step": 179349, "epoch": 1482} {"train_loss": -40.8348388671875, "global_step": 179350, "epoch": 1482} {"train_loss": -40.58753204345703, "global_step": 179351, "epoch": 1482} {"train_loss": -39.85618209838867, "global_step": 179352, "epoch": 1482} {"train_loss": -39.75328826904297, "global_step": 179353, "epoch": 1482} {"train_loss": -41.39075469970703, "global_step": 179354, "epoch": 1482} {"train_loss": -40.41315460205078, "global_step": 179355, "epoch": 1482} {"train_loss": -40.4209098815918, "global_step": 179356, "epoch": 1482} {"train_loss": -40.9201774597168, "global_step": 179357, "epoch": 1482} {"train_loss": -39.792945861816406, "global_step": 179358, "epoch": 1482} {"train_loss": -40.786983489990234, "global_step": 179359, "epoch": 1482} {"train_loss": -40.04407501220703, "global_step": 179360, "epoch": 1482} {"train_loss": -40.85245895385742, "global_step": 179361, "epoch": 1482} {"train_loss": -40.58895492553711, "global_step": 179362, "epoch": 1482} {"train_loss": -41.30441665649414, "global_step": 179363, "epoch": 1482} {"train_loss": -41.050594329833984, "global_step": 179364, "epoch": 1482} {"train_loss": -39.11260986328125, "global_step": 179365, "epoch": 1482} {"train_loss": -39.29343795776367, "global_step": 179366, "epoch": 1482} {"train_loss": -39.41317367553711, "global_step": 179367, "epoch": 1482} {"train_loss": -39.766387939453125, "global_step": 179368, "epoch": 1482} {"train_loss": -40.478843688964844, "global_step": 179369, "epoch": 1482} {"train_loss": -40.472652435302734, "global_step": 179370, "epoch": 1482} {"train_loss": -40.58653259277344, "global_step": 179371, "epoch": 1482} {"train_loss": -39.286231994628906, "global_step": 179372, "epoch": 1482} {"train_loss": -40.72376251220703, "global_step": 179373, "epoch": 1482} {"train_loss": -40.225318908691406, "global_step": 179374, "epoch": 1482} {"train_loss": -40.0203857421875, "global_step": 179375, "epoch": 1482} {"train_loss": -37.98878860473633, "global_step": 179376, "epoch": 1482} {"train_loss": -37.10863494873047, "global_step": 179377, "epoch": 1482} {"train_loss": -38.29750442504883, "global_step": 179378, "epoch": 1482} {"train_loss": -38.87812423706055, "global_step": 179379, "epoch": 1482} {"train_loss": -37.529876708984375, "global_step": 179380, "epoch": 1482} {"train_loss": -36.62309646606445, "global_step": 179381, "epoch": 1482} {"train_loss": -38.843013763427734, "global_step": 179382, "epoch": 1482} {"train_loss": -37.9264030456543, "global_step": 179383, "epoch": 1482} {"train_loss": -39.1028938293457, "global_step": 179384, "epoch": 1482} {"train_loss": -39.3145637512207, "global_step": 179385, "epoch": 1482} {"train_loss": -38.89649963378906, "global_step": 179386, "epoch": 1482} {"train_loss": -38.63825607299805, "global_step": 179387, "epoch": 1482} {"train_loss": -40.21097946166992, "global_step": 179388, "epoch": 1482} {"train_loss": -38.3510627746582, "global_step": 179389, "epoch": 1482} {"train_loss": -37.94285202026367, "global_step": 179390, "epoch": 1482} {"train_loss": -38.92132568359375, "global_step": 179391, "epoch": 1482} {"train_loss": -38.94474792480469, "global_step": 179392, "epoch": 1482} {"train_loss": -40.54122543334961, "global_step": 179393, "epoch": 1482} {"train_loss": -36.6056022644043, "global_step": 179394, "epoch": 1482} {"train_loss": -40.67307662963867, "global_step": 179395, "epoch": 1482} {"train_loss": -40.60491180419922, "global_step": 179396, "epoch": 1482} {"train_loss": -40.28154373168945, "global_step": 179397, "epoch": 1482} {"train_loss": -35.75724411010742, "global_step": 179398, "epoch": 1482} {"train_loss": -40.52104568481445, "global_step": 179399, "epoch": 1482} {"train_loss": -37.90406036376953, "global_step": 179400, "epoch": 1482} {"train_loss": -39.298828125, "global_step": 179401, "epoch": 1482} {"train_loss": -40.17440414428711, "global_step": 179402, "epoch": 1482} {"train_loss": -38.5434684753418, "global_step": 179403, "epoch": 1482} {"train_loss": -40.59418487548828, "global_step": 179404, "epoch": 1482} {"train_loss": -40.12382888793945, "global_step": 179405, "epoch": 1482} {"train_loss": -38.782588958740234, "global_step": 179406, "epoch": 1482} {"train_loss": -40.37067794799805, "global_step": 179407, "epoch": 1482} {"train_loss": -39.86745834350586, "global_step": 179408, "epoch": 1482} {"train_loss": -39.854644775390625, "global_step": 179409, "epoch": 1482} {"train_loss": -39.945796966552734, "global_step": 179410, "epoch": 1482} {"train_loss": -40.32155990600586, "global_step": 179411, "epoch": 1482} {"train_loss": -39.9382438659668, "global_step": 179412, "epoch": 1482} {"train_loss": -39.867469787597656, "global_step": 179413, "epoch": 1482} {"train_loss": -40.54368209838867, "global_step": 179414, "epoch": 1482} {"train_loss": -40.70084762573242, "global_step": 179415, "epoch": 1482} {"train_loss": -39.95709991455078, "global_step": 179416, "epoch": 1482} {"train_loss": -40.64669418334961, "global_step": 179417, "epoch": 1482} {"train_loss": -40.972530364990234, "global_step": 179418, "epoch": 1482} {"train_loss": -40.306209564208984, "global_step": 179419, "epoch": 1482} {"train_loss": -40.49705505371094, "global_step": 179420, "epoch": 1482} {"train_loss": -41.14774703979492, "global_step": 179421, "epoch": 1482} {"train_loss": -40.713844299316406, "global_step": 179422, "epoch": 1482} {"train_loss": -40.74525833129883, "global_step": 179423, "epoch": 1482} {"train_loss": -41.265865325927734, "global_step": 179424, "epoch": 1482} {"train_loss": -40.73112106323242, "global_step": 179425, "epoch": 1482} {"train_loss": -41.10139846801758, "global_step": 179426, "epoch": 1482} {"train_loss": -40.69771957397461, "global_step": 179427, "epoch": 1482} {"train_loss": -40.06376266479492, "global_step": 179428, "epoch": 1482} {"train_loss": -32.446163177490234, "global_step": 179429, "epoch": 1482} {"train_loss": -40.2148551940918, "global_step": 179430, "epoch": 1482} {"train_loss": -39.48433303833008, "global_step": 179431, "epoch": 1482} {"train_loss": -40.20322036743164, "global_step": 179432, "epoch": 1482} {"train_loss": -40.57522201538086, "global_step": 179433, "epoch": 1482} {"train_loss": -39.68308639526367, "global_step": 179434, "epoch": 1482} {"train_loss": -36.03969192504883, "global_step": 179435, "epoch": 1482} {"train_loss": -36.728912353515625, "global_step": 179436, "epoch": 1482} {"train_loss": -40.489810943603516, "global_step": 179437, "epoch": 1482} {"train_loss": -38.06922149658203, "global_step": 179438, "epoch": 1482} {"train_loss": -40.09090042114258, "global_step": 179439, "epoch": 1482} {"train_loss": -39.405086517333984, "global_step": 179440, "epoch": 1482} {"train_loss": -39.34743118286133, "global_step": 179441, "epoch": 1482} {"train_loss": -39.80673246147219, "global_step": 179442, "epoch": 1482, "val_loss": 2790280.25} {"train_loss": -39.24457550048828, "global_step": 179443, "epoch": 1483} {"train_loss": -40.33865737915039, "global_step": 179444, "epoch": 1483} {"train_loss": -40.2616081237793, "global_step": 179445, "epoch": 1483} {"train_loss": -38.64239501953125, "global_step": 179446, "epoch": 1483} {"train_loss": -40.22522735595703, "global_step": 179447, "epoch": 1483} {"train_loss": -41.32696533203125, "global_step": 179448, "epoch": 1483} {"train_loss": -40.19353103637695, "global_step": 179449, "epoch": 1483} {"train_loss": -39.62647247314453, "global_step": 179450, "epoch": 1483} {"train_loss": -39.89183044433594, "global_step": 179451, "epoch": 1483} {"train_loss": -38.9883918762207, "global_step": 179452, "epoch": 1483} {"train_loss": -34.725093841552734, "global_step": 179453, "epoch": 1483} {"train_loss": -35.32894515991211, "global_step": 179454, "epoch": 1483} {"train_loss": -35.05890655517578, "global_step": 179455, "epoch": 1483} {"train_loss": -38.62866973876953, "global_step": 179456, "epoch": 1483} {"train_loss": -39.46061325073242, "global_step": 179457, "epoch": 1483} {"train_loss": -38.98602294921875, "global_step": 179458, "epoch": 1483} {"train_loss": -38.08042526245117, "global_step": 179459, "epoch": 1483} {"train_loss": -38.69664764404297, "global_step": 179460, "epoch": 1483} {"train_loss": -37.93218231201172, "global_step": 179461, "epoch": 1483} {"train_loss": -39.275394439697266, "global_step": 179462, "epoch": 1483} {"train_loss": -39.28167724609375, "global_step": 179463, "epoch": 1483} {"train_loss": -39.10087966918945, "global_step": 179464, "epoch": 1483} {"train_loss": -33.08596420288086, "global_step": 179465, "epoch": 1483} {"train_loss": -40.53397750854492, "global_step": 179466, "epoch": 1483} {"train_loss": -38.01870346069336, "global_step": 179467, "epoch": 1483} {"train_loss": -38.98128890991211, "global_step": 179468, "epoch": 1483} {"train_loss": -38.31892776489258, "global_step": 179469, "epoch": 1483} {"train_loss": -38.92451477050781, "global_step": 179470, "epoch": 1483} {"train_loss": -38.70042419433594, "global_step": 179471, "epoch": 1483} {"train_loss": -38.394771575927734, "global_step": 179472, "epoch": 1483} {"train_loss": -38.43974304199219, "global_step": 179473, "epoch": 1483} {"train_loss": -38.34866714477539, "global_step": 179474, "epoch": 1483} {"train_loss": -39.32870101928711, "global_step": 179475, "epoch": 1483} {"train_loss": -39.48108673095703, "global_step": 179476, "epoch": 1483} {"train_loss": -40.446895599365234, "global_step": 179477, "epoch": 1483} {"train_loss": -38.8866081237793, "global_step": 179478, "epoch": 1483} {"train_loss": -39.55786895751953, "global_step": 179479, "epoch": 1483} {"train_loss": -38.08216094970703, "global_step": 179480, "epoch": 1483} {"train_loss": -39.70269775390625, "global_step": 179481, "epoch": 1483} {"train_loss": -39.97408676147461, "global_step": 179482, "epoch": 1483} {"train_loss": -39.75116729736328, "global_step": 179483, "epoch": 1483} {"train_loss": -40.3900260925293, "global_step": 179484, "epoch": 1483} {"train_loss": -39.42277526855469, "global_step": 179485, "epoch": 1483} {"train_loss": -38.90988540649414, "global_step": 179486, "epoch": 1483} {"train_loss": -40.24528121948242, "global_step": 179487, "epoch": 1483} {"train_loss": -39.411922454833984, "global_step": 179488, "epoch": 1483} {"train_loss": -38.86414337158203, "global_step": 179489, "epoch": 1483} {"train_loss": -40.2576789855957, "global_step": 179490, "epoch": 1483} {"train_loss": -40.358917236328125, "global_step": 179491, "epoch": 1483} {"train_loss": -39.59470748901367, "global_step": 179492, "epoch": 1483} {"train_loss": -40.32126998901367, "global_step": 179493, "epoch": 1483} {"train_loss": -40.13292694091797, "global_step": 179494, "epoch": 1483} {"train_loss": -38.823482513427734, "global_step": 179495, "epoch": 1483} {"train_loss": -40.72590255737305, "global_step": 179496, "epoch": 1483} {"train_loss": -39.331722259521484, "global_step": 179497, "epoch": 1483} {"train_loss": -40.46596908569336, "global_step": 179498, "epoch": 1483} {"train_loss": -40.5066032409668, "global_step": 179499, "epoch": 1483} {"train_loss": -39.94709014892578, "global_step": 179500, "epoch": 1483} {"train_loss": -39.234230041503906, "global_step": 179501, "epoch": 1483} {"train_loss": -40.54658126831055, "global_step": 179502, "epoch": 1483} {"train_loss": -39.6103630065918, "global_step": 179503, "epoch": 1483} {"train_loss": -41.023536682128906, "global_step": 179504, "epoch": 1483} {"train_loss": -40.64011764526367, "global_step": 179505, "epoch": 1483} {"train_loss": -40.63829803466797, "global_step": 179506, "epoch": 1483} {"train_loss": -40.868648529052734, "global_step": 179507, "epoch": 1483} {"train_loss": -40.66975402832031, "global_step": 179508, "epoch": 1483} {"train_loss": -40.86450958251953, "global_step": 179509, "epoch": 1483} {"train_loss": -40.553524017333984, "global_step": 179510, "epoch": 1483} {"train_loss": -39.83882141113281, "global_step": 179511, "epoch": 1483} {"train_loss": -40.875282287597656, "global_step": 179512, "epoch": 1483} {"train_loss": -41.24485778808594, "global_step": 179513, "epoch": 1483} {"train_loss": -41.84366989135742, "global_step": 179514, "epoch": 1483} {"train_loss": -40.905235290527344, "global_step": 179515, "epoch": 1483} {"train_loss": -41.26168441772461, "global_step": 179516, "epoch": 1483} {"train_loss": -40.4123649597168, "global_step": 179517, "epoch": 1483} {"train_loss": -41.307708740234375, "global_step": 179518, "epoch": 1483} {"train_loss": -40.595760345458984, "global_step": 179519, "epoch": 1483} {"train_loss": -40.57562255859375, "global_step": 179520, "epoch": 1483} {"train_loss": -41.0175895690918, "global_step": 179521, "epoch": 1483} {"train_loss": -40.20063400268555, "global_step": 179522, "epoch": 1483} {"train_loss": -39.586830139160156, "global_step": 179523, "epoch": 1483} {"train_loss": -39.711639404296875, "global_step": 179524, "epoch": 1483} {"train_loss": -40.2786979675293, "global_step": 179525, "epoch": 1483} {"train_loss": -37.78375244140625, "global_step": 179526, "epoch": 1483} {"train_loss": -40.249244689941406, "global_step": 179527, "epoch": 1483} {"train_loss": -39.568965911865234, "global_step": 179528, "epoch": 1483} {"train_loss": -40.465003967285156, "global_step": 179529, "epoch": 1483} {"train_loss": -40.94913101196289, "global_step": 179530, "epoch": 1483} {"train_loss": -40.24640655517578, "global_step": 179531, "epoch": 1483} {"train_loss": -39.92877197265625, "global_step": 179532, "epoch": 1483} {"train_loss": -39.417030334472656, "global_step": 179533, "epoch": 1483} {"train_loss": -38.00361251831055, "global_step": 179534, "epoch": 1483} {"train_loss": -37.110286712646484, "global_step": 179535, "epoch": 1483} {"train_loss": -36.90082931518555, "global_step": 179536, "epoch": 1483} {"train_loss": -35.557552337646484, "global_step": 179537, "epoch": 1483} {"train_loss": -35.089324951171875, "global_step": 179538, "epoch": 1483} {"train_loss": -36.06428146362305, "global_step": 179539, "epoch": 1483} {"train_loss": -40.486942291259766, "global_step": 179540, "epoch": 1483} {"train_loss": -38.44137191772461, "global_step": 179541, "epoch": 1483} {"train_loss": -33.284423828125, "global_step": 179542, "epoch": 1483} {"train_loss": -37.25463104248047, "global_step": 179543, "epoch": 1483} {"train_loss": -40.34823226928711, "global_step": 179544, "epoch": 1483} {"train_loss": -36.52150344848633, "global_step": 179545, "epoch": 1483} {"train_loss": -36.883365631103516, "global_step": 179546, "epoch": 1483} {"train_loss": -39.06781005859375, "global_step": 179547, "epoch": 1483} {"train_loss": -39.08856201171875, "global_step": 179548, "epoch": 1483} {"train_loss": -36.96651077270508, "global_step": 179549, "epoch": 1483} {"train_loss": -39.35810470581055, "global_step": 179550, "epoch": 1483} {"train_loss": -27.817901611328125, "global_step": 179551, "epoch": 1483} {"train_loss": -31.48419189453125, "global_step": 179552, "epoch": 1483} {"train_loss": -38.46836853027344, "global_step": 179553, "epoch": 1483} {"train_loss": -38.19564437866211, "global_step": 179554, "epoch": 1483} {"train_loss": -38.9171257019043, "global_step": 179555, "epoch": 1483} {"train_loss": -38.216102600097656, "global_step": 179556, "epoch": 1483} {"train_loss": -39.10014724731445, "global_step": 179557, "epoch": 1483} {"train_loss": -37.92081832885742, "global_step": 179558, "epoch": 1483} {"train_loss": -39.2863883972168, "global_step": 179559, "epoch": 1483} {"train_loss": -37.77035140991211, "global_step": 179560, "epoch": 1483} {"train_loss": -38.932106018066406, "global_step": 179561, "epoch": 1483} {"train_loss": -38.72391891479492, "global_step": 179562, "epoch": 1483} {"train_loss": -39.02103591162311, "global_step": 179563, "epoch": 1483, "val_loss": 2737893.25} {"train_loss": -38.525630950927734, "global_step": 179564, "epoch": 1484} {"train_loss": -36.77167510986328, "global_step": 179565, "epoch": 1484} {"train_loss": -38.353981018066406, "global_step": 179566, "epoch": 1484} {"train_loss": -38.260128021240234, "global_step": 179567, "epoch": 1484} {"train_loss": -38.630672454833984, "global_step": 179568, "epoch": 1484} {"train_loss": -37.923583984375, "global_step": 179569, "epoch": 1484} {"train_loss": -39.28275680541992, "global_step": 179570, "epoch": 1484} {"train_loss": -38.649635314941406, "global_step": 179571, "epoch": 1484} {"train_loss": -39.29072952270508, "global_step": 179572, "epoch": 1484} {"train_loss": -39.711116790771484, "global_step": 179573, "epoch": 1484} {"train_loss": -38.544029235839844, "global_step": 179574, "epoch": 1484} {"train_loss": -39.65233612060547, "global_step": 179575, "epoch": 1484} {"train_loss": -38.73600387573242, "global_step": 179576, "epoch": 1484} {"train_loss": -39.31720733642578, "global_step": 179577, "epoch": 1484} {"train_loss": -39.05068588256836, "global_step": 179578, "epoch": 1484} {"train_loss": -39.424442291259766, "global_step": 179579, "epoch": 1484} {"train_loss": -39.395992279052734, "global_step": 179580, "epoch": 1484} {"train_loss": -39.50312805175781, "global_step": 179581, "epoch": 1484} {"train_loss": -39.20630645751953, "global_step": 179582, "epoch": 1484} {"train_loss": -38.419376373291016, "global_step": 179583, "epoch": 1484} {"train_loss": -39.40484619140625, "global_step": 179584, "epoch": 1484} {"train_loss": -39.71327209472656, "global_step": 179585, "epoch": 1484} {"train_loss": -40.13859176635742, "global_step": 179586, "epoch": 1484} {"train_loss": -40.129695892333984, "global_step": 179587, "epoch": 1484} {"train_loss": -40.074337005615234, "global_step": 179588, "epoch": 1484} {"train_loss": -40.36751937866211, "global_step": 179589, "epoch": 1484} {"train_loss": -40.23054122924805, "global_step": 179590, "epoch": 1484} {"train_loss": -39.96016311645508, "global_step": 179591, "epoch": 1484} {"train_loss": -40.05311965942383, "global_step": 179592, "epoch": 1484} {"train_loss": -37.346160888671875, "global_step": 179593, "epoch": 1484} {"train_loss": -39.54315948486328, "global_step": 179594, "epoch": 1484} {"train_loss": -39.78739547729492, "global_step": 179595, "epoch": 1484} {"train_loss": -38.61195373535156, "global_step": 179596, "epoch": 1484} {"train_loss": -40.402984619140625, "global_step": 179597, "epoch": 1484} {"train_loss": -40.13562774658203, "global_step": 179598, "epoch": 1484} {"train_loss": -39.95846176147461, "global_step": 179599, "epoch": 1484} {"train_loss": -41.02477264404297, "global_step": 179600, "epoch": 1484} {"train_loss": -40.10371398925781, "global_step": 179601, "epoch": 1484} {"train_loss": -41.04171371459961, "global_step": 179602, "epoch": 1484} {"train_loss": -39.56243896484375, "global_step": 179603, "epoch": 1484} {"train_loss": -40.783382415771484, "global_step": 179604, "epoch": 1484} {"train_loss": -40.56466293334961, "global_step": 179605, "epoch": 1484} {"train_loss": -40.5844841003418, "global_step": 179606, "epoch": 1484} {"train_loss": -40.32875061035156, "global_step": 179607, "epoch": 1484} {"train_loss": -41.06980514526367, "global_step": 179608, "epoch": 1484} {"train_loss": -40.32991027832031, "global_step": 179609, "epoch": 1484} {"train_loss": -41.294677734375, "global_step": 179610, "epoch": 1484} {"train_loss": -38.993865966796875, "global_step": 179611, "epoch": 1484} {"train_loss": -41.05388259887695, "global_step": 179612, "epoch": 1484} {"train_loss": -41.29098129272461, "global_step": 179613, "epoch": 1484} {"train_loss": -41.789730072021484, "global_step": 179614, "epoch": 1484} {"train_loss": -41.167381286621094, "global_step": 179615, "epoch": 1484} {"train_loss": -40.687313079833984, "global_step": 179616, "epoch": 1484} {"train_loss": -40.933265686035156, "global_step": 179617, "epoch": 1484} {"train_loss": -41.17230224609375, "global_step": 179618, "epoch": 1484} {"train_loss": -41.53144073486328, "global_step": 179619, "epoch": 1484} {"train_loss": -41.347923278808594, "global_step": 179620, "epoch": 1484} {"train_loss": -41.32490158081055, "global_step": 179621, "epoch": 1484} {"train_loss": -41.370216369628906, "global_step": 179622, "epoch": 1484} {"train_loss": -41.291316986083984, "global_step": 179623, "epoch": 1484} {"train_loss": -41.360843658447266, "global_step": 179624, "epoch": 1484} {"train_loss": -41.04347610473633, "global_step": 179625, "epoch": 1484} {"train_loss": -40.81361770629883, "global_step": 179626, "epoch": 1484} {"train_loss": -41.552791595458984, "global_step": 179627, "epoch": 1484} {"train_loss": -41.68754196166992, "global_step": 179628, "epoch": 1484} {"train_loss": -41.83419418334961, "global_step": 179629, "epoch": 1484} {"train_loss": -41.22004318237305, "global_step": 179630, "epoch": 1484} {"train_loss": -42.065059661865234, "global_step": 179631, "epoch": 1484} {"train_loss": -41.313262939453125, "global_step": 179632, "epoch": 1484} {"train_loss": -41.22583770751953, "global_step": 179633, "epoch": 1484} {"train_loss": -42.10544967651367, "global_step": 179634, "epoch": 1484} {"train_loss": -41.329776763916016, "global_step": 179635, "epoch": 1484} {"train_loss": -41.932029724121094, "global_step": 179636, "epoch": 1484} {"train_loss": -41.60770797729492, "global_step": 179637, "epoch": 1484} {"train_loss": -40.95195770263672, "global_step": 179638, "epoch": 1484} {"train_loss": -41.92844772338867, "global_step": 179639, "epoch": 1484} {"train_loss": -41.23347854614258, "global_step": 179640, "epoch": 1484} {"train_loss": -41.46503448486328, "global_step": 179641, "epoch": 1484} {"train_loss": -40.83218002319336, "global_step": 179642, "epoch": 1484} {"train_loss": -40.9455451965332, "global_step": 179643, "epoch": 1484} {"train_loss": -39.75710678100586, "global_step": 179644, "epoch": 1484} {"train_loss": -41.4370002746582, "global_step": 179645, "epoch": 1484} {"train_loss": -41.665870666503906, "global_step": 179646, "epoch": 1484} {"train_loss": -41.34011459350586, "global_step": 179647, "epoch": 1484} {"train_loss": -39.908294677734375, "global_step": 179648, "epoch": 1484} {"train_loss": -38.94724655151367, "global_step": 179649, "epoch": 1484} {"train_loss": -37.96051025390625, "global_step": 179650, "epoch": 1484} {"train_loss": -38.78184127807617, "global_step": 179651, "epoch": 1484} {"train_loss": -41.50688934326172, "global_step": 179652, "epoch": 1484} {"train_loss": -41.80188751220703, "global_step": 179653, "epoch": 1484} {"train_loss": -41.7422981262207, "global_step": 179654, "epoch": 1484} {"train_loss": -40.15541458129883, "global_step": 179655, "epoch": 1484} {"train_loss": -38.95881271362305, "global_step": 179656, "epoch": 1484} {"train_loss": -36.545692443847656, "global_step": 179657, "epoch": 1484} {"train_loss": -39.8996467590332, "global_step": 179658, "epoch": 1484} {"train_loss": -41.01433563232422, "global_step": 179659, "epoch": 1484} {"train_loss": -38.753231048583984, "global_step": 179660, "epoch": 1484} {"train_loss": -36.353485107421875, "global_step": 179661, "epoch": 1484} {"train_loss": -37.44956588745117, "global_step": 179662, "epoch": 1484} {"train_loss": -40.9033203125, "global_step": 179663, "epoch": 1484} {"train_loss": -38.22408676147461, "global_step": 179664, "epoch": 1484} {"train_loss": -38.69145584106445, "global_step": 179665, "epoch": 1484} {"train_loss": -41.221431732177734, "global_step": 179666, "epoch": 1484} {"train_loss": -39.0944938659668, "global_step": 179667, "epoch": 1484} {"train_loss": -40.49342727661133, "global_step": 179668, "epoch": 1484} {"train_loss": -39.53007125854492, "global_step": 179669, "epoch": 1484} {"train_loss": -38.277095794677734, "global_step": 179670, "epoch": 1484} {"train_loss": -40.34749221801758, "global_step": 179671, "epoch": 1484} {"train_loss": -38.90244674682617, "global_step": 179672, "epoch": 1484} {"train_loss": -40.50971984863281, "global_step": 179673, "epoch": 1484} {"train_loss": -38.9090576171875, "global_step": 179674, "epoch": 1484} {"train_loss": -39.55744552612305, "global_step": 179675, "epoch": 1484} {"train_loss": -40.5716667175293, "global_step": 179676, "epoch": 1484} {"train_loss": -37.70806884765625, "global_step": 179677, "epoch": 1484} {"train_loss": -38.44166946411133, "global_step": 179678, "epoch": 1484} {"train_loss": -39.39176559448242, "global_step": 179679, "epoch": 1484} {"train_loss": -38.78969192504883, "global_step": 179680, "epoch": 1484} {"train_loss": -36.265159606933594, "global_step": 179681, "epoch": 1484} {"train_loss": -40.2476921081543, "global_step": 179682, "epoch": 1484} {"train_loss": -39.3471794128418, "global_step": 179683, "epoch": 1484} {"train_loss": -39.99759919978371, "global_step": 179684, "epoch": 1484, "val_loss": 2607790.25} {"train_loss": -39.87865447998047, "global_step": 179685, "epoch": 1485} {"train_loss": -40.35890579223633, "global_step": 179686, "epoch": 1485} {"train_loss": -38.401283264160156, "global_step": 179687, "epoch": 1485} {"train_loss": -39.72541046142578, "global_step": 179688, "epoch": 1485} {"train_loss": -40.320980072021484, "global_step": 179689, "epoch": 1485} {"train_loss": -39.973548889160156, "global_step": 179690, "epoch": 1485} {"train_loss": -39.595821380615234, "global_step": 179691, "epoch": 1485} {"train_loss": -41.1142463684082, "global_step": 179692, "epoch": 1485} {"train_loss": -40.132843017578125, "global_step": 179693, "epoch": 1485} {"train_loss": -40.130287170410156, "global_step": 179694, "epoch": 1485} {"train_loss": -41.103057861328125, "global_step": 179695, "epoch": 1485} {"train_loss": -40.920318603515625, "global_step": 179696, "epoch": 1485} {"train_loss": -41.13827133178711, "global_step": 179697, "epoch": 1485} {"train_loss": -40.633949279785156, "global_step": 179698, "epoch": 1485} {"train_loss": -41.364051818847656, "global_step": 179699, "epoch": 1485} {"train_loss": -41.27278518676758, "global_step": 179700, "epoch": 1485} {"train_loss": -40.49619674682617, "global_step": 179701, "epoch": 1485} {"train_loss": -40.3880729675293, "global_step": 179702, "epoch": 1485} {"train_loss": -41.187416076660156, "global_step": 179703, "epoch": 1485} {"train_loss": -41.05881881713867, "global_step": 179704, "epoch": 1485} {"train_loss": -40.309181213378906, "global_step": 179705, "epoch": 1485} {"train_loss": -41.26300811767578, "global_step": 179706, "epoch": 1485} {"train_loss": -41.45528793334961, "global_step": 179707, "epoch": 1485} {"train_loss": -41.577919006347656, "global_step": 179708, "epoch": 1485} {"train_loss": -40.938232421875, "global_step": 179709, "epoch": 1485} {"train_loss": -41.004554748535156, "global_step": 179710, "epoch": 1485} {"train_loss": -41.60207748413086, "global_step": 179711, "epoch": 1485} {"train_loss": -41.56048583984375, "global_step": 179712, "epoch": 1485} {"train_loss": -40.896217346191406, "global_step": 179713, "epoch": 1485} {"train_loss": -41.803340911865234, "global_step": 179714, "epoch": 1485} {"train_loss": -41.65657043457031, "global_step": 179715, "epoch": 1485} {"train_loss": -41.90843200683594, "global_step": 179716, "epoch": 1485} {"train_loss": -41.598609924316406, "global_step": 179717, "epoch": 1485} {"train_loss": -41.45759582519531, "global_step": 179718, "epoch": 1485} {"train_loss": -41.89801788330078, "global_step": 179719, "epoch": 1485} {"train_loss": -41.595985412597656, "global_step": 179720, "epoch": 1485} {"train_loss": -42.097557067871094, "global_step": 179721, "epoch": 1485} {"train_loss": -41.45893478393555, "global_step": 179722, "epoch": 1485} {"train_loss": -41.961856842041016, "global_step": 179723, "epoch": 1485} {"train_loss": -41.5223274230957, "global_step": 179724, "epoch": 1485} {"train_loss": -41.44316101074219, "global_step": 179725, "epoch": 1485} {"train_loss": -41.65369415283203, "global_step": 179726, "epoch": 1485} {"train_loss": -41.389068603515625, "global_step": 179727, "epoch": 1485} {"train_loss": -41.62494659423828, "global_step": 179728, "epoch": 1485} {"train_loss": -41.920326232910156, "global_step": 179729, "epoch": 1485} {"train_loss": -41.87928009033203, "global_step": 179730, "epoch": 1485} {"train_loss": -42.00122833251953, "global_step": 179731, "epoch": 1485} {"train_loss": -42.03133010864258, "global_step": 179732, "epoch": 1485} {"train_loss": -41.997886657714844, "global_step": 179733, "epoch": 1485} {"train_loss": -41.06743240356445, "global_step": 179734, "epoch": 1485} {"train_loss": -41.63679885864258, "global_step": 179735, "epoch": 1485} {"train_loss": -40.145015716552734, "global_step": 179736, "epoch": 1485} {"train_loss": -38.78642272949219, "global_step": 179737, "epoch": 1485} {"train_loss": -34.4709358215332, "global_step": 179738, "epoch": 1485} {"train_loss": -33.43044662475586, "global_step": 179739, "epoch": 1485} {"train_loss": -37.91115951538086, "global_step": 179740, "epoch": 1485} {"train_loss": -40.60918045043945, "global_step": 179741, "epoch": 1485} {"train_loss": -37.52629089355469, "global_step": 179742, "epoch": 1485} {"train_loss": -39.027320861816406, "global_step": 179743, "epoch": 1485} {"train_loss": -40.35578536987305, "global_step": 179744, "epoch": 1485} {"train_loss": -39.37526321411133, "global_step": 179745, "epoch": 1485} {"train_loss": -39.35438919067383, "global_step": 179746, "epoch": 1485} {"train_loss": -38.20841598510742, "global_step": 179747, "epoch": 1485} {"train_loss": -40.58121109008789, "global_step": 179748, "epoch": 1485} {"train_loss": -39.43531799316406, "global_step": 179749, "epoch": 1485} {"train_loss": -39.16975021362305, "global_step": 179750, "epoch": 1485} {"train_loss": -39.69765853881836, "global_step": 179751, "epoch": 1485} {"train_loss": -39.49245071411133, "global_step": 179752, "epoch": 1485} {"train_loss": -39.873592376708984, "global_step": 179753, "epoch": 1485} {"train_loss": -40.07589340209961, "global_step": 179754, "epoch": 1485} {"train_loss": -39.06897735595703, "global_step": 179755, "epoch": 1485} {"train_loss": -40.367244720458984, "global_step": 179756, "epoch": 1485} {"train_loss": -39.64299392700195, "global_step": 179757, "epoch": 1485} {"train_loss": -41.04401779174805, "global_step": 179758, "epoch": 1485} {"train_loss": -39.0504035949707, "global_step": 179759, "epoch": 1485} {"train_loss": -39.581722259521484, "global_step": 179760, "epoch": 1485} {"train_loss": -40.5588264465332, "global_step": 179761, "epoch": 1485} {"train_loss": -39.96855545043945, "global_step": 179762, "epoch": 1485} {"train_loss": -39.08919906616211, "global_step": 179763, "epoch": 1485} {"train_loss": -40.20610427856445, "global_step": 179764, "epoch": 1485} {"train_loss": -40.48139572143555, "global_step": 179765, "epoch": 1485} {"train_loss": -39.256431579589844, "global_step": 179766, "epoch": 1485} {"train_loss": -39.45840072631836, "global_step": 179767, "epoch": 1485} {"train_loss": -40.19993209838867, "global_step": 179768, "epoch": 1485} {"train_loss": -40.272071838378906, "global_step": 179769, "epoch": 1485} {"train_loss": -39.091487884521484, "global_step": 179770, "epoch": 1485} {"train_loss": -40.9859504699707, "global_step": 179771, "epoch": 1485} {"train_loss": -40.12185287475586, "global_step": 179772, "epoch": 1485} {"train_loss": -39.86683654785156, "global_step": 179773, "epoch": 1485} {"train_loss": -39.20284652709961, "global_step": 179774, "epoch": 1485} {"train_loss": -40.70088577270508, "global_step": 179775, "epoch": 1485} {"train_loss": -39.629329681396484, "global_step": 179776, "epoch": 1485} {"train_loss": -38.41445541381836, "global_step": 179777, "epoch": 1485} {"train_loss": -40.96036911010742, "global_step": 179778, "epoch": 1485} {"train_loss": -40.31975173950195, "global_step": 179779, "epoch": 1485} {"train_loss": -39.83852767944336, "global_step": 179780, "epoch": 1485} {"train_loss": -40.365478515625, "global_step": 179781, "epoch": 1485} {"train_loss": -40.79250717163086, "global_step": 179782, "epoch": 1485} {"train_loss": -39.99578857421875, "global_step": 179783, "epoch": 1485} {"train_loss": -39.727237701416016, "global_step": 179784, "epoch": 1485} {"train_loss": -40.979408264160156, "global_step": 179785, "epoch": 1485} {"train_loss": -41.27843475341797, "global_step": 179786, "epoch": 1485} {"train_loss": -41.29973602294922, "global_step": 179787, "epoch": 1485} {"train_loss": -41.195404052734375, "global_step": 179788, "epoch": 1485} {"train_loss": -40.97038269042969, "global_step": 179789, "epoch": 1485} {"train_loss": -41.3948974609375, "global_step": 179790, "epoch": 1485} {"train_loss": -40.10200119018555, "global_step": 179791, "epoch": 1485} {"train_loss": -41.13686752319336, "global_step": 179792, "epoch": 1485} {"train_loss": -41.72322463989258, "global_step": 179793, "epoch": 1485} {"train_loss": -40.365543365478516, "global_step": 179794, "epoch": 1485} {"train_loss": -41.37091827392578, "global_step": 179795, "epoch": 1485} {"train_loss": -41.12223434448242, "global_step": 179796, "epoch": 1485} {"train_loss": -41.0174674987793, "global_step": 179797, "epoch": 1485} {"train_loss": -39.898555755615234, "global_step": 179798, "epoch": 1485} {"train_loss": -41.055477142333984, "global_step": 179799, "epoch": 1485} {"train_loss": -40.55244827270508, "global_step": 179800, "epoch": 1485} {"train_loss": -40.40291976928711, "global_step": 179801, "epoch": 1485} {"train_loss": -40.92216110229492, "global_step": 179802, "epoch": 1485} {"train_loss": -41.25136947631836, "global_step": 179803, "epoch": 1485} {"train_loss": -40.6178092956543, "global_step": 179804, "epoch": 1485} {"train_loss": -40.43482365884071, "global_step": 179805, "epoch": 1485, "val_loss": 2676083.75} {"train_loss": -41.01828384399414, "global_step": 179806, "epoch": 1486} {"train_loss": -40.97255325317383, "global_step": 179807, "epoch": 1486} {"train_loss": -40.63851547241211, "global_step": 179808, "epoch": 1486} {"train_loss": -41.923126220703125, "global_step": 179809, "epoch": 1486} {"train_loss": -41.12208557128906, "global_step": 179810, "epoch": 1486} {"train_loss": -41.209712982177734, "global_step": 179811, "epoch": 1486} {"train_loss": -42.1423225402832, "global_step": 179812, "epoch": 1486} {"train_loss": -41.28901290893555, "global_step": 179813, "epoch": 1486} {"train_loss": -41.526302337646484, "global_step": 179814, "epoch": 1486} {"train_loss": -41.4664192199707, "global_step": 179815, "epoch": 1486} {"train_loss": -41.41291046142578, "global_step": 179816, "epoch": 1486} {"train_loss": -40.64962387084961, "global_step": 179817, "epoch": 1486} {"train_loss": -41.72874069213867, "global_step": 179818, "epoch": 1486} {"train_loss": -41.69843673706055, "global_step": 179819, "epoch": 1486} {"train_loss": -41.88344192504883, "global_step": 179820, "epoch": 1486} {"train_loss": -41.48968505859375, "global_step": 179821, "epoch": 1486} {"train_loss": -42.18887710571289, "global_step": 179822, "epoch": 1486} {"train_loss": -40.828102111816406, "global_step": 179823, "epoch": 1486} {"train_loss": -40.988624572753906, "global_step": 179824, "epoch": 1486} {"train_loss": -41.407527923583984, "global_step": 179825, "epoch": 1486} {"train_loss": -41.5214958190918, "global_step": 179826, "epoch": 1486} {"train_loss": -41.59971618652344, "global_step": 179827, "epoch": 1486} {"train_loss": -42.282405853271484, "global_step": 179828, "epoch": 1486} {"train_loss": -41.816505432128906, "global_step": 179829, "epoch": 1486} {"train_loss": -41.67572021484375, "global_step": 179830, "epoch": 1486} {"train_loss": -40.5718994140625, "global_step": 179831, "epoch": 1486} {"train_loss": -40.51675033569336, "global_step": 179832, "epoch": 1486} {"train_loss": -41.856529235839844, "global_step": 179833, "epoch": 1486} {"train_loss": -41.8422966003418, "global_step": 179834, "epoch": 1486} {"train_loss": -40.97916793823242, "global_step": 179835, "epoch": 1486} {"train_loss": -39.46134567260742, "global_step": 179836, "epoch": 1486} {"train_loss": -40.79963302612305, "global_step": 179837, "epoch": 1486} {"train_loss": -41.80247116088867, "global_step": 179838, "epoch": 1486} {"train_loss": -40.41377639770508, "global_step": 179839, "epoch": 1486} {"train_loss": -39.37826156616211, "global_step": 179840, "epoch": 1486} {"train_loss": -40.6920051574707, "global_step": 179841, "epoch": 1486} {"train_loss": -41.19491195678711, "global_step": 179842, "epoch": 1486} {"train_loss": -40.60205078125, "global_step": 179843, "epoch": 1486} {"train_loss": -39.64777374267578, "global_step": 179844, "epoch": 1486} {"train_loss": -40.25307846069336, "global_step": 179845, "epoch": 1486} {"train_loss": -40.696590423583984, "global_step": 179846, "epoch": 1486} {"train_loss": -40.592376708984375, "global_step": 179847, "epoch": 1486} {"train_loss": -39.326385498046875, "global_step": 179848, "epoch": 1486} {"train_loss": -40.831111907958984, "global_step": 179849, "epoch": 1486} {"train_loss": -41.340938568115234, "global_step": 179850, "epoch": 1486} {"train_loss": -40.550254821777344, "global_step": 179851, "epoch": 1486} {"train_loss": -40.7198600769043, "global_step": 179852, "epoch": 1486} {"train_loss": -41.34245681762695, "global_step": 179853, "epoch": 1486} {"train_loss": -41.00954055786133, "global_step": 179854, "epoch": 1486} {"train_loss": -41.77177810668945, "global_step": 179855, "epoch": 1486} {"train_loss": -40.74086380004883, "global_step": 179856, "epoch": 1486} {"train_loss": -40.92373275756836, "global_step": 179857, "epoch": 1486} {"train_loss": -41.16172409057617, "global_step": 179858, "epoch": 1486} {"train_loss": -40.73249053955078, "global_step": 179859, "epoch": 1486} {"train_loss": -40.832542419433594, "global_step": 179860, "epoch": 1486} {"train_loss": -41.76129150390625, "global_step": 179861, "epoch": 1486} {"train_loss": -41.388248443603516, "global_step": 179862, "epoch": 1486} {"train_loss": -41.28097152709961, "global_step": 179863, "epoch": 1486} {"train_loss": -41.12290573120117, "global_step": 179864, "epoch": 1486} {"train_loss": -39.03230667114258, "global_step": 179865, "epoch": 1486} {"train_loss": -41.51839065551758, "global_step": 179866, "epoch": 1486} {"train_loss": -39.95004653930664, "global_step": 179867, "epoch": 1486} {"train_loss": -36.625545501708984, "global_step": 179868, "epoch": 1486} {"train_loss": -37.80015182495117, "global_step": 179869, "epoch": 1486} {"train_loss": -37.3213005065918, "global_step": 179870, "epoch": 1486} {"train_loss": -29.9008846282959, "global_step": 179871, "epoch": 1486} {"train_loss": -35.53920364379883, "global_step": 179872, "epoch": 1486} {"train_loss": -37.0115966796875, "global_step": 179873, "epoch": 1486} {"train_loss": -34.93355178833008, "global_step": 179874, "epoch": 1486} {"train_loss": -35.581886291503906, "global_step": 179875, "epoch": 1486} {"train_loss": -35.42189407348633, "global_step": 179876, "epoch": 1486} {"train_loss": -34.00178527832031, "global_step": 179877, "epoch": 1486} {"train_loss": -36.87566375732422, "global_step": 179878, "epoch": 1486} {"train_loss": -36.2201042175293, "global_step": 179879, "epoch": 1486} {"train_loss": -38.55233383178711, "global_step": 179880, "epoch": 1486} {"train_loss": -38.47114944458008, "global_step": 179881, "epoch": 1486} {"train_loss": -37.44460678100586, "global_step": 179882, "epoch": 1486} {"train_loss": -38.86460494995117, "global_step": 179883, "epoch": 1486} {"train_loss": -36.284088134765625, "global_step": 179884, "epoch": 1486} {"train_loss": -39.32491683959961, "global_step": 179885, "epoch": 1486} {"train_loss": -39.580623626708984, "global_step": 179886, "epoch": 1486} {"train_loss": -36.2371940612793, "global_step": 179887, "epoch": 1486} {"train_loss": -40.41387176513672, "global_step": 179888, "epoch": 1486} {"train_loss": -38.998287200927734, "global_step": 179889, "epoch": 1486} {"train_loss": -36.83359909057617, "global_step": 179890, "epoch": 1486} {"train_loss": -39.52708053588867, "global_step": 179891, "epoch": 1486} {"train_loss": -40.04203414916992, "global_step": 179892, "epoch": 1486} {"train_loss": -38.094322204589844, "global_step": 179893, "epoch": 1486} {"train_loss": -39.745967864990234, "global_step": 179894, "epoch": 1486} {"train_loss": -39.810218811035156, "global_step": 179895, "epoch": 1486} {"train_loss": -37.85749053955078, "global_step": 179896, "epoch": 1486} {"train_loss": -40.44765853881836, "global_step": 179897, "epoch": 1486} {"train_loss": -39.04774856567383, "global_step": 179898, "epoch": 1486} {"train_loss": -39.8115348815918, "global_step": 179899, "epoch": 1486} {"train_loss": -40.70258331298828, "global_step": 179900, "epoch": 1486} {"train_loss": -40.281429290771484, "global_step": 179901, "epoch": 1486} {"train_loss": -40.648738861083984, "global_step": 179902, "epoch": 1486} {"train_loss": -40.248600006103516, "global_step": 179903, "epoch": 1486} {"train_loss": -40.46787643432617, "global_step": 179904, "epoch": 1486} {"train_loss": -41.153564453125, "global_step": 179905, "epoch": 1486} {"train_loss": -40.418182373046875, "global_step": 179906, "epoch": 1486} {"train_loss": -40.8300666809082, "global_step": 179907, "epoch": 1486} {"train_loss": -40.72915267944336, "global_step": 179908, "epoch": 1486} {"train_loss": -40.5881233215332, "global_step": 179909, "epoch": 1486} {"train_loss": -40.45895004272461, "global_step": 179910, "epoch": 1486} {"train_loss": -41.185638427734375, "global_step": 179911, "epoch": 1486} {"train_loss": -40.739654541015625, "global_step": 179912, "epoch": 1486} {"train_loss": -40.766029357910156, "global_step": 179913, "epoch": 1486} {"train_loss": -41.58319091796875, "global_step": 179914, "epoch": 1486} {"train_loss": -41.199214935302734, "global_step": 179915, "epoch": 1486} {"train_loss": -41.32908248901367, "global_step": 179916, "epoch": 1486} {"train_loss": -40.45134735107422, "global_step": 179917, "epoch": 1486} {"train_loss": -41.654449462890625, "global_step": 179918, "epoch": 1486} {"train_loss": -41.10691452026367, "global_step": 179919, "epoch": 1486} {"train_loss": -41.41170120239258, "global_step": 179920, "epoch": 1486} {"train_loss": -41.31081008911133, "global_step": 179921, "epoch": 1486} {"train_loss": -41.701045989990234, "global_step": 179922, "epoch": 1486} {"train_loss": -41.17559051513672, "global_step": 179923, "epoch": 1486} {"train_loss": -41.87087631225586, "global_step": 179924, "epoch": 1486} {"train_loss": -41.79656982421875, "global_step": 179925, "epoch": 1486} {"train_loss": -40.1266111421191, "global_step": 179926, "epoch": 1486, "val_loss": 2628549.25} {"train_loss": -41.665645599365234, "global_step": 179927, "epoch": 1487} {"train_loss": -41.79273223876953, "global_step": 179928, "epoch": 1487} {"train_loss": -41.4366455078125, "global_step": 179929, "epoch": 1487} {"train_loss": -41.512237548828125, "global_step": 179930, "epoch": 1487} {"train_loss": -41.87329864501953, "global_step": 179931, "epoch": 1487} {"train_loss": -42.0019416809082, "global_step": 179932, "epoch": 1487} {"train_loss": -40.55866622924805, "global_step": 179933, "epoch": 1487} {"train_loss": -41.52663803100586, "global_step": 179934, "epoch": 1487} {"train_loss": -41.62164306640625, "global_step": 179935, "epoch": 1487} {"train_loss": -40.96860885620117, "global_step": 179936, "epoch": 1487} {"train_loss": -42.037513732910156, "global_step": 179937, "epoch": 1487} {"train_loss": -41.891685485839844, "global_step": 179938, "epoch": 1487} {"train_loss": -41.98305892944336, "global_step": 179939, "epoch": 1487} {"train_loss": -42.22623825073242, "global_step": 179940, "epoch": 1487} {"train_loss": -41.855690002441406, "global_step": 179941, "epoch": 1487} {"train_loss": -42.05290985107422, "global_step": 179942, "epoch": 1487} {"train_loss": -41.9905891418457, "global_step": 179943, "epoch": 1487} {"train_loss": -41.00537109375, "global_step": 179944, "epoch": 1487} {"train_loss": -42.116153717041016, "global_step": 179945, "epoch": 1487} {"train_loss": -42.22222137451172, "global_step": 179946, "epoch": 1487} {"train_loss": -41.44797897338867, "global_step": 179947, "epoch": 1487} {"train_loss": -42.08257293701172, "global_step": 179948, "epoch": 1487} {"train_loss": -41.906494140625, "global_step": 179949, "epoch": 1487} {"train_loss": -42.401092529296875, "global_step": 179950, "epoch": 1487} {"train_loss": -42.314048767089844, "global_step": 179951, "epoch": 1487} {"train_loss": -41.91012954711914, "global_step": 179952, "epoch": 1487} {"train_loss": -41.91634750366211, "global_step": 179953, "epoch": 1487} {"train_loss": -42.00165939331055, "global_step": 179954, "epoch": 1487} {"train_loss": -41.80460739135742, "global_step": 179955, "epoch": 1487} {"train_loss": -41.50849151611328, "global_step": 179956, "epoch": 1487} {"train_loss": -41.69095993041992, "global_step": 179957, "epoch": 1487} {"train_loss": -41.69535446166992, "global_step": 179958, "epoch": 1487} {"train_loss": -41.478904724121094, "global_step": 179959, "epoch": 1487} {"train_loss": -42.08927536010742, "global_step": 179960, "epoch": 1487} {"train_loss": -41.090126037597656, "global_step": 179961, "epoch": 1487} {"train_loss": -38.53232955932617, "global_step": 179962, "epoch": 1487} {"train_loss": -37.290584564208984, "global_step": 179963, "epoch": 1487} {"train_loss": -35.63417434692383, "global_step": 179964, "epoch": 1487} {"train_loss": -31.515121459960938, "global_step": 179965, "epoch": 1487} {"train_loss": -29.409936904907227, "global_step": 179966, "epoch": 1487} {"train_loss": -35.39057159423828, "global_step": 179967, "epoch": 1487} {"train_loss": -39.0534782409668, "global_step": 179968, "epoch": 1487} {"train_loss": -26.803293228149414, "global_step": 179969, "epoch": 1487} {"train_loss": -32.522762298583984, "global_step": 179970, "epoch": 1487} {"train_loss": -37.7038688659668, "global_step": 179971, "epoch": 1487} {"train_loss": -34.49081039428711, "global_step": 179972, "epoch": 1487} {"train_loss": -36.80972671508789, "global_step": 179973, "epoch": 1487} {"train_loss": -37.5236701965332, "global_step": 179974, "epoch": 1487} {"train_loss": -37.49787521362305, "global_step": 179975, "epoch": 1487} {"train_loss": -38.14717483520508, "global_step": 179976, "epoch": 1487} {"train_loss": -38.14301681518555, "global_step": 179977, "epoch": 1487} {"train_loss": -40.293212890625, "global_step": 179978, "epoch": 1487} {"train_loss": -38.12583541870117, "global_step": 179979, "epoch": 1487} {"train_loss": -39.315181732177734, "global_step": 179980, "epoch": 1487} {"train_loss": -39.359310150146484, "global_step": 179981, "epoch": 1487} {"train_loss": -39.99805450439453, "global_step": 179982, "epoch": 1487} {"train_loss": -39.38077926635742, "global_step": 179983, "epoch": 1487} {"train_loss": -40.134098052978516, "global_step": 179984, "epoch": 1487} {"train_loss": -40.67478561401367, "global_step": 179985, "epoch": 1487} {"train_loss": -40.51142120361328, "global_step": 179986, "epoch": 1487} {"train_loss": -40.3158073425293, "global_step": 179987, "epoch": 1487} {"train_loss": -40.50178909301758, "global_step": 179988, "epoch": 1487} {"train_loss": -41.02210998535156, "global_step": 179989, "epoch": 1487} {"train_loss": -40.57133102416992, "global_step": 179990, "epoch": 1487} {"train_loss": -41.3465576171875, "global_step": 179991, "epoch": 1487} {"train_loss": -41.014015197753906, "global_step": 179992, "epoch": 1487} {"train_loss": -40.9608154296875, "global_step": 179993, "epoch": 1487} {"train_loss": -41.0334587097168, "global_step": 179994, "epoch": 1487} {"train_loss": -41.082794189453125, "global_step": 179995, "epoch": 1487} {"train_loss": -40.949703216552734, "global_step": 179996, "epoch": 1487} {"train_loss": -41.52205276489258, "global_step": 179997, "epoch": 1487} {"train_loss": -40.86720657348633, "global_step": 179998, "epoch": 1487} {"train_loss": -41.660823822021484, "global_step": 179999, "epoch": 1487} {"train_loss": -40.89812088012695, "global_step": 180000, "epoch": 1487} {"train_loss": -41.52263641357422, "global_step": 180001, "epoch": 1487} {"train_loss": -41.54236602783203, "global_step": 180002, "epoch": 1487} {"train_loss": -41.48725509643555, "global_step": 180003, "epoch": 1487} {"train_loss": -41.41787338256836, "global_step": 180004, "epoch": 1487} {"train_loss": -41.980201721191406, "global_step": 180005, "epoch": 1487} {"train_loss": -41.70081329345703, "global_step": 180006, "epoch": 1487} {"train_loss": -41.49787902832031, "global_step": 180007, "epoch": 1487} {"train_loss": -41.77933120727539, "global_step": 180008, "epoch": 1487} {"train_loss": -41.80910873413086, "global_step": 180009, "epoch": 1487} {"train_loss": -41.77022171020508, "global_step": 180010, "epoch": 1487} {"train_loss": -42.12114715576172, "global_step": 180011, "epoch": 1487} {"train_loss": -42.01565170288086, "global_step": 180012, "epoch": 1487} {"train_loss": -41.98823165893555, "global_step": 180013, "epoch": 1487} {"train_loss": -42.071754455566406, "global_step": 180014, "epoch": 1487} {"train_loss": -42.16071319580078, "global_step": 180015, "epoch": 1487} {"train_loss": -42.27771759033203, "global_step": 180016, "epoch": 1487} {"train_loss": -41.653621673583984, "global_step": 180017, "epoch": 1487} {"train_loss": -42.23023223876953, "global_step": 180018, "epoch": 1487} {"train_loss": -42.369789123535156, "global_step": 180019, "epoch": 1487} {"train_loss": -42.16176223754883, "global_step": 180020, "epoch": 1487} {"train_loss": -41.9266242980957, "global_step": 180021, "epoch": 1487} {"train_loss": -42.1990966796875, "global_step": 180022, "epoch": 1487} {"train_loss": -42.05583572387695, "global_step": 180023, "epoch": 1487} {"train_loss": -42.00701904296875, "global_step": 180024, "epoch": 1487} {"train_loss": -42.343055725097656, "global_step": 180025, "epoch": 1487} {"train_loss": -42.125152587890625, "global_step": 180026, "epoch": 1487} {"train_loss": -42.44626998901367, "global_step": 180027, "epoch": 1487} {"train_loss": -42.117000579833984, "global_step": 180028, "epoch": 1487} {"train_loss": -42.39228439331055, "global_step": 180029, "epoch": 1487} {"train_loss": -42.3050651550293, "global_step": 180030, "epoch": 1487} {"train_loss": -42.52948760986328, "global_step": 180031, "epoch": 1487} {"train_loss": -42.15278244018555, "global_step": 180032, "epoch": 1487} {"train_loss": -41.986915588378906, "global_step": 180033, "epoch": 1487} {"train_loss": -42.65771484375, "global_step": 180034, "epoch": 1487} {"train_loss": -42.530029296875, "global_step": 180035, "epoch": 1487} {"train_loss": -42.61810302734375, "global_step": 180036, "epoch": 1487} {"train_loss": -42.537445068359375, "global_step": 180037, "epoch": 1487} {"train_loss": -42.27541732788086, "global_step": 180038, "epoch": 1487} {"train_loss": -42.702449798583984, "global_step": 180039, "epoch": 1487} {"train_loss": -42.71892166137695, "global_step": 180040, "epoch": 1487} {"train_loss": -42.00292205810547, "global_step": 180041, "epoch": 1487} {"train_loss": -41.73219680786133, "global_step": 180042, "epoch": 1487} {"train_loss": -40.483150482177734, "global_step": 180043, "epoch": 1487} {"train_loss": -42.538936614990234, "global_step": 180044, "epoch": 1487} {"train_loss": -41.77313232421875, "global_step": 180045, "epoch": 1487} {"train_loss": -40.61760330200195, "global_step": 180046, "epoch": 1487} {"train_loss": -40.77259145689405, "global_step": 180047, "epoch": 1487, "val_loss": 2709959.25} {"train_loss": -39.967262268066406, "global_step": 180048, "epoch": 1488} {"train_loss": -40.8983268737793, "global_step": 180049, "epoch": 1488} {"train_loss": -41.80105972290039, "global_step": 180050, "epoch": 1488} {"train_loss": -42.43827438354492, "global_step": 180051, "epoch": 1488} {"train_loss": -41.763153076171875, "global_step": 180052, "epoch": 1488} {"train_loss": -40.94160079956055, "global_step": 180053, "epoch": 1488} {"train_loss": -40.572479248046875, "global_step": 180054, "epoch": 1488} {"train_loss": -39.99573516845703, "global_step": 180055, "epoch": 1488} {"train_loss": -41.964107513427734, "global_step": 180056, "epoch": 1488} {"train_loss": -41.35914993286133, "global_step": 180057, "epoch": 1488} {"train_loss": -39.73610305786133, "global_step": 180058, "epoch": 1488} {"train_loss": -38.32271957397461, "global_step": 180059, "epoch": 1488} {"train_loss": -40.84535598754883, "global_step": 180060, "epoch": 1488} {"train_loss": -40.45914840698242, "global_step": 180061, "epoch": 1488} {"train_loss": -39.73340606689453, "global_step": 180062, "epoch": 1488} {"train_loss": -39.615779876708984, "global_step": 180063, "epoch": 1488} {"train_loss": -38.12772750854492, "global_step": 180064, "epoch": 1488} {"train_loss": -37.758419036865234, "global_step": 180065, "epoch": 1488} {"train_loss": -38.57644271850586, "global_step": 180066, "epoch": 1488} {"train_loss": -41.035919189453125, "global_step": 180067, "epoch": 1488} {"train_loss": -36.311248779296875, "global_step": 180068, "epoch": 1488} {"train_loss": -35.5613899230957, "global_step": 180069, "epoch": 1488} {"train_loss": -38.61283493041992, "global_step": 180070, "epoch": 1488} {"train_loss": -37.091102600097656, "global_step": 180071, "epoch": 1488} {"train_loss": -37.26166915893555, "global_step": 180072, "epoch": 1488} {"train_loss": -40.49566650390625, "global_step": 180073, "epoch": 1488} {"train_loss": -39.40227127075195, "global_step": 180074, "epoch": 1488} {"train_loss": -39.57855224609375, "global_step": 180075, "epoch": 1488} {"train_loss": -40.8802375793457, "global_step": 180076, "epoch": 1488} {"train_loss": -39.633644104003906, "global_step": 180077, "epoch": 1488} {"train_loss": -40.9273567199707, "global_step": 180078, "epoch": 1488} {"train_loss": -40.841495513916016, "global_step": 180079, "epoch": 1488} {"train_loss": -39.853187561035156, "global_step": 180080, "epoch": 1488} {"train_loss": -41.11371994018555, "global_step": 180081, "epoch": 1488} {"train_loss": -39.91386795043945, "global_step": 180082, "epoch": 1488} {"train_loss": -41.05027770996094, "global_step": 180083, "epoch": 1488} {"train_loss": -40.73111343383789, "global_step": 180084, "epoch": 1488} {"train_loss": -41.04338073730469, "global_step": 180085, "epoch": 1488} {"train_loss": -40.46059799194336, "global_step": 180086, "epoch": 1488} {"train_loss": -39.77936553955078, "global_step": 180087, "epoch": 1488} {"train_loss": -40.08184051513672, "global_step": 180088, "epoch": 1488} {"train_loss": -40.746246337890625, "global_step": 180089, "epoch": 1488} {"train_loss": -40.6818733215332, "global_step": 180090, "epoch": 1488} {"train_loss": -40.44246292114258, "global_step": 180091, "epoch": 1488} {"train_loss": -40.797607421875, "global_step": 180092, "epoch": 1488} {"train_loss": -40.88688278198242, "global_step": 180093, "epoch": 1488} {"train_loss": -40.385616302490234, "global_step": 180094, "epoch": 1488} {"train_loss": -41.85932159423828, "global_step": 180095, "epoch": 1488} {"train_loss": -41.11152267456055, "global_step": 180096, "epoch": 1488} {"train_loss": -41.42835998535156, "global_step": 180097, "epoch": 1488} {"train_loss": -41.1974983215332, "global_step": 180098, "epoch": 1488} {"train_loss": -41.789058685302734, "global_step": 180099, "epoch": 1488} {"train_loss": -41.82114791870117, "global_step": 180100, "epoch": 1488} {"train_loss": -41.30488967895508, "global_step": 180101, "epoch": 1488} {"train_loss": -41.86151123046875, "global_step": 180102, "epoch": 1488} {"train_loss": -41.756988525390625, "global_step": 180103, "epoch": 1488} {"train_loss": -41.47096633911133, "global_step": 180104, "epoch": 1488} {"train_loss": -41.579376220703125, "global_step": 180105, "epoch": 1488} {"train_loss": -41.572654724121094, "global_step": 180106, "epoch": 1488} {"train_loss": -41.958919525146484, "global_step": 180107, "epoch": 1488} {"train_loss": -41.46472930908203, "global_step": 180108, "epoch": 1488} {"train_loss": -41.43034744262695, "global_step": 180109, "epoch": 1488} {"train_loss": -41.94881820678711, "global_step": 180110, "epoch": 1488} {"train_loss": -41.375892639160156, "global_step": 180111, "epoch": 1488} {"train_loss": -41.40568923950195, "global_step": 180112, "epoch": 1488} {"train_loss": -41.640907287597656, "global_step": 180113, "epoch": 1488} {"train_loss": -41.62205123901367, "global_step": 180114, "epoch": 1488} {"train_loss": -42.16185760498047, "global_step": 180115, "epoch": 1488} {"train_loss": -41.79623031616211, "global_step": 180116, "epoch": 1488} {"train_loss": -41.761234283447266, "global_step": 180117, "epoch": 1488} {"train_loss": -41.982669830322266, "global_step": 180118, "epoch": 1488} {"train_loss": -41.85280227661133, "global_step": 180119, "epoch": 1488} {"train_loss": -42.044002532958984, "global_step": 180120, "epoch": 1488} {"train_loss": -42.09278869628906, "global_step": 180121, "epoch": 1488} {"train_loss": -42.117530822753906, "global_step": 180122, "epoch": 1488} {"train_loss": -42.14406204223633, "global_step": 180123, "epoch": 1488} {"train_loss": -41.20851516723633, "global_step": 180124, "epoch": 1488} {"train_loss": -42.38084030151367, "global_step": 180125, "epoch": 1488} {"train_loss": -42.30564880371094, "global_step": 180126, "epoch": 1488} {"train_loss": -42.000953674316406, "global_step": 180127, "epoch": 1488} {"train_loss": -42.0678596496582, "global_step": 180128, "epoch": 1488} {"train_loss": -42.207393646240234, "global_step": 180129, "epoch": 1488} {"train_loss": -41.88762283325195, "global_step": 180130, "epoch": 1488} {"train_loss": -41.90871810913086, "global_step": 180131, "epoch": 1488} {"train_loss": -42.007781982421875, "global_step": 180132, "epoch": 1488} {"train_loss": -42.09929275512695, "global_step": 180133, "epoch": 1488} {"train_loss": -41.683250427246094, "global_step": 180134, "epoch": 1488} {"train_loss": -40.77509307861328, "global_step": 180135, "epoch": 1488} {"train_loss": -40.7260627746582, "global_step": 180136, "epoch": 1488} {"train_loss": -40.5477409362793, "global_step": 180137, "epoch": 1488} {"train_loss": -41.521827697753906, "global_step": 180138, "epoch": 1488} {"train_loss": -42.58476638793945, "global_step": 180139, "epoch": 1488} {"train_loss": -41.24585723876953, "global_step": 180140, "epoch": 1488} {"train_loss": -40.6812858581543, "global_step": 180141, "epoch": 1488} {"train_loss": -41.07870101928711, "global_step": 180142, "epoch": 1488} {"train_loss": -41.65275192260742, "global_step": 180143, "epoch": 1488} {"train_loss": -41.56986618041992, "global_step": 180144, "epoch": 1488} {"train_loss": -41.6030158996582, "global_step": 180145, "epoch": 1488} {"train_loss": -41.43780517578125, "global_step": 180146, "epoch": 1488} {"train_loss": -41.92873001098633, "global_step": 180147, "epoch": 1488} {"train_loss": -41.969539642333984, "global_step": 180148, "epoch": 1488} {"train_loss": -41.88360595703125, "global_step": 180149, "epoch": 1488} {"train_loss": -41.94267654418945, "global_step": 180150, "epoch": 1488} {"train_loss": -42.04945373535156, "global_step": 180151, "epoch": 1488} {"train_loss": -42.4815559387207, "global_step": 180152, "epoch": 1488} {"train_loss": -41.48592758178711, "global_step": 180153, "epoch": 1488} {"train_loss": -40.40114974975586, "global_step": 180154, "epoch": 1488} {"train_loss": -40.49616241455078, "global_step": 180155, "epoch": 1488} {"train_loss": -41.480010986328125, "global_step": 180156, "epoch": 1488} {"train_loss": -42.165042877197266, "global_step": 180157, "epoch": 1488} {"train_loss": -40.244022369384766, "global_step": 180158, "epoch": 1488} {"train_loss": -37.71906280517578, "global_step": 180159, "epoch": 1488} {"train_loss": -39.8011589050293, "global_step": 180160, "epoch": 1488} {"train_loss": -41.79621124267578, "global_step": 180161, "epoch": 1488} {"train_loss": -40.83479690551758, "global_step": 180162, "epoch": 1488} {"train_loss": -40.526954650878906, "global_step": 180163, "epoch": 1488} {"train_loss": -42.05158615112305, "global_step": 180164, "epoch": 1488} {"train_loss": -40.324493408203125, "global_step": 180165, "epoch": 1488} {"train_loss": -40.27497100830078, "global_step": 180166, "epoch": 1488} {"train_loss": -41.76951217651367, "global_step": 180167, "epoch": 1488} {"train_loss": -40.92255965934312, "global_step": 180168, "epoch": 1488, "val_loss": 2705661.75} {"train_loss": -40.50592041015625, "global_step": 180169, "epoch": 1489} {"train_loss": -41.29207992553711, "global_step": 180170, "epoch": 1489} {"train_loss": -42.090087890625, "global_step": 180171, "epoch": 1489} {"train_loss": -42.01960754394531, "global_step": 180172, "epoch": 1489} {"train_loss": -42.107826232910156, "global_step": 180173, "epoch": 1489} {"train_loss": -41.397064208984375, "global_step": 180174, "epoch": 1489} {"train_loss": -42.101356506347656, "global_step": 180175, "epoch": 1489} {"train_loss": -42.074623107910156, "global_step": 180176, "epoch": 1489} {"train_loss": -42.059967041015625, "global_step": 180177, "epoch": 1489} {"train_loss": -42.2243766784668, "global_step": 180178, "epoch": 1489} {"train_loss": -42.012969970703125, "global_step": 180179, "epoch": 1489} {"train_loss": -41.92000961303711, "global_step": 180180, "epoch": 1489} {"train_loss": -42.03297805786133, "global_step": 180181, "epoch": 1489} {"train_loss": -41.38038635253906, "global_step": 180182, "epoch": 1489} {"train_loss": -41.91020584106445, "global_step": 180183, "epoch": 1489} {"train_loss": -41.338741302490234, "global_step": 180184, "epoch": 1489} {"train_loss": -41.91759490966797, "global_step": 180185, "epoch": 1489} {"train_loss": -41.75086975097656, "global_step": 180186, "epoch": 1489} {"train_loss": -40.846832275390625, "global_step": 180187, "epoch": 1489} {"train_loss": -41.435367584228516, "global_step": 180188, "epoch": 1489} {"train_loss": -41.65520477294922, "global_step": 180189, "epoch": 1489} {"train_loss": -41.254425048828125, "global_step": 180190, "epoch": 1489} {"train_loss": -41.45557403564453, "global_step": 180191, "epoch": 1489} {"train_loss": -41.67988586425781, "global_step": 180192, "epoch": 1489} {"train_loss": -41.1036376953125, "global_step": 180193, "epoch": 1489} {"train_loss": -41.77042770385742, "global_step": 180194, "epoch": 1489} {"train_loss": -41.318458557128906, "global_step": 180195, "epoch": 1489} {"train_loss": -41.85857009887695, "global_step": 180196, "epoch": 1489} {"train_loss": -41.7052116394043, "global_step": 180197, "epoch": 1489} {"train_loss": -41.59061813354492, "global_step": 180198, "epoch": 1489} {"train_loss": -40.80603790283203, "global_step": 180199, "epoch": 1489} {"train_loss": -41.457855224609375, "global_step": 180200, "epoch": 1489} {"train_loss": -42.092567443847656, "global_step": 180201, "epoch": 1489} {"train_loss": -41.20486068725586, "global_step": 180202, "epoch": 1489} {"train_loss": -41.300960540771484, "global_step": 180203, "epoch": 1489} {"train_loss": -40.500526428222656, "global_step": 180204, "epoch": 1489} {"train_loss": -41.0555305480957, "global_step": 180205, "epoch": 1489} {"train_loss": -41.08384323120117, "global_step": 180206, "epoch": 1489} {"train_loss": -41.8602180480957, "global_step": 180207, "epoch": 1489} {"train_loss": -41.9880256652832, "global_step": 180208, "epoch": 1489} {"train_loss": -40.43549728393555, "global_step": 180209, "epoch": 1489} {"train_loss": -39.809478759765625, "global_step": 180210, "epoch": 1489} {"train_loss": -39.690120697021484, "global_step": 180211, "epoch": 1489} {"train_loss": -40.70643997192383, "global_step": 180212, "epoch": 1489} {"train_loss": -42.00385665893555, "global_step": 180213, "epoch": 1489} {"train_loss": -41.466705322265625, "global_step": 180214, "epoch": 1489} {"train_loss": -38.93898391723633, "global_step": 180215, "epoch": 1489} {"train_loss": -39.739227294921875, "global_step": 180216, "epoch": 1489} {"train_loss": -40.89058303833008, "global_step": 180217, "epoch": 1489} {"train_loss": -41.925167083740234, "global_step": 180218, "epoch": 1489} {"train_loss": -40.6187744140625, "global_step": 180219, "epoch": 1489} {"train_loss": -39.250301361083984, "global_step": 180220, "epoch": 1489} {"train_loss": -37.965545654296875, "global_step": 180221, "epoch": 1489} {"train_loss": -40.588287353515625, "global_step": 180222, "epoch": 1489} {"train_loss": -37.61919021606445, "global_step": 180223, "epoch": 1489} {"train_loss": -40.8642692565918, "global_step": 180224, "epoch": 1489} {"train_loss": -37.27470016479492, "global_step": 180225, "epoch": 1489} {"train_loss": -40.14394760131836, "global_step": 180226, "epoch": 1489} {"train_loss": -38.07619857788086, "global_step": 180227, "epoch": 1489} {"train_loss": -39.016841888427734, "global_step": 180228, "epoch": 1489} {"train_loss": -39.8609733581543, "global_step": 180229, "epoch": 1489} {"train_loss": -36.017391204833984, "global_step": 180230, "epoch": 1489} {"train_loss": -36.4181022644043, "global_step": 180231, "epoch": 1489} {"train_loss": -33.8410530090332, "global_step": 180232, "epoch": 1489} {"train_loss": -39.89188766479492, "global_step": 180233, "epoch": 1489} {"train_loss": -34.04012680053711, "global_step": 180234, "epoch": 1489} {"train_loss": -39.09436798095703, "global_step": 180235, "epoch": 1489} {"train_loss": -36.762939453125, "global_step": 180236, "epoch": 1489} {"train_loss": -35.47081756591797, "global_step": 180237, "epoch": 1489} {"train_loss": -39.88663864135742, "global_step": 180238, "epoch": 1489} {"train_loss": -33.69348907470703, "global_step": 180239, "epoch": 1489} {"train_loss": -37.96796798706055, "global_step": 180240, "epoch": 1489} {"train_loss": -35.360965728759766, "global_step": 180241, "epoch": 1489} {"train_loss": -28.106306076049805, "global_step": 180242, "epoch": 1489} {"train_loss": -35.006019592285156, "global_step": 180243, "epoch": 1489} {"train_loss": -34.19545364379883, "global_step": 180244, "epoch": 1489} {"train_loss": -33.0534782409668, "global_step": 180245, "epoch": 1489} {"train_loss": -34.955440521240234, "global_step": 180246, "epoch": 1489} {"train_loss": -37.300960540771484, "global_step": 180247, "epoch": 1489} {"train_loss": -33.91093826293945, "global_step": 180248, "epoch": 1489} {"train_loss": -35.636898040771484, "global_step": 180249, "epoch": 1489} {"train_loss": -36.17617416381836, "global_step": 180250, "epoch": 1489} {"train_loss": -39.333251953125, "global_step": 180251, "epoch": 1489} {"train_loss": -34.62477493286133, "global_step": 180252, "epoch": 1489} {"train_loss": -37.86362838745117, "global_step": 180253, "epoch": 1489} {"train_loss": -36.836700439453125, "global_step": 180254, "epoch": 1489} {"train_loss": -38.697139739990234, "global_step": 180255, "epoch": 1489} {"train_loss": -38.348052978515625, "global_step": 180256, "epoch": 1489} {"train_loss": -38.96223068237305, "global_step": 180257, "epoch": 1489} {"train_loss": -37.84962844848633, "global_step": 180258, "epoch": 1489} {"train_loss": -39.40313720703125, "global_step": 180259, "epoch": 1489} {"train_loss": -39.24128723144531, "global_step": 180260, "epoch": 1489} {"train_loss": -38.3817253112793, "global_step": 180261, "epoch": 1489} {"train_loss": -38.98990249633789, "global_step": 180262, "epoch": 1489} {"train_loss": -38.59894561767578, "global_step": 180263, "epoch": 1489} {"train_loss": -40.017189025878906, "global_step": 180264, "epoch": 1489} {"train_loss": -38.64751052856445, "global_step": 180265, "epoch": 1489} {"train_loss": -39.39744186401367, "global_step": 180266, "epoch": 1489} {"train_loss": -39.47947311401367, "global_step": 180267, "epoch": 1489} {"train_loss": -39.76209259033203, "global_step": 180268, "epoch": 1489} {"train_loss": -39.87978744506836, "global_step": 180269, "epoch": 1489} {"train_loss": -40.73539733886719, "global_step": 180270, "epoch": 1489} {"train_loss": -39.8056755065918, "global_step": 180271, "epoch": 1489} {"train_loss": -40.796627044677734, "global_step": 180272, "epoch": 1489} {"train_loss": -40.517005920410156, "global_step": 180273, "epoch": 1489} {"train_loss": -40.43960189819336, "global_step": 180274, "epoch": 1489} {"train_loss": -40.94609451293945, "global_step": 180275, "epoch": 1489} {"train_loss": -40.8948974609375, "global_step": 180276, "epoch": 1489} {"train_loss": -40.78879928588867, "global_step": 180277, "epoch": 1489} {"train_loss": -40.964115142822266, "global_step": 180278, "epoch": 1489} {"train_loss": -41.04944610595703, "global_step": 180279, "epoch": 1489} {"train_loss": -40.727760314941406, "global_step": 180280, "epoch": 1489} {"train_loss": -41.41514205932617, "global_step": 180281, "epoch": 1489} {"train_loss": -41.098751068115234, "global_step": 180282, "epoch": 1489} {"train_loss": -41.04922103881836, "global_step": 180283, "epoch": 1489} {"train_loss": -41.37998580932617, "global_step": 180284, "epoch": 1489} {"train_loss": -41.36927032470703, "global_step": 180285, "epoch": 1489} {"train_loss": -41.30358123779297, "global_step": 180286, "epoch": 1489} {"train_loss": -41.13550567626953, "global_step": 180287, "epoch": 1489} {"train_loss": -41.23094940185547, "global_step": 180288, "epoch": 1489} {"train_loss": -39.667971729247036, "global_step": 180289, "epoch": 1489, "val_loss": 2686738.25} {"train_loss": -41.53019714355469, "global_step": 180290, "epoch": 1490} {"train_loss": -41.51543045043945, "global_step": 180291, "epoch": 1490} {"train_loss": -41.58077621459961, "global_step": 180292, "epoch": 1490} {"train_loss": -42.02238082885742, "global_step": 180293, "epoch": 1490} {"train_loss": -41.65199661254883, "global_step": 180294, "epoch": 1490} {"train_loss": -41.422237396240234, "global_step": 180295, "epoch": 1490} {"train_loss": -41.8117561340332, "global_step": 180296, "epoch": 1490} {"train_loss": -41.5398063659668, "global_step": 180297, "epoch": 1490} {"train_loss": -41.75471878051758, "global_step": 180298, "epoch": 1490} {"train_loss": -41.66672897338867, "global_step": 180299, "epoch": 1490} {"train_loss": -41.62105178833008, "global_step": 180300, "epoch": 1490} {"train_loss": -42.14226150512695, "global_step": 180301, "epoch": 1490} {"train_loss": -41.926937103271484, "global_step": 180302, "epoch": 1490} {"train_loss": -41.81170654296875, "global_step": 180303, "epoch": 1490} {"train_loss": -42.035282135009766, "global_step": 180304, "epoch": 1490} {"train_loss": -41.89825439453125, "global_step": 180305, "epoch": 1490} {"train_loss": -42.220699310302734, "global_step": 180306, "epoch": 1490} {"train_loss": -42.06692123413086, "global_step": 180307, "epoch": 1490} {"train_loss": -41.94234085083008, "global_step": 180308, "epoch": 1490} {"train_loss": -42.27203369140625, "global_step": 180309, "epoch": 1490} {"train_loss": -41.966278076171875, "global_step": 180310, "epoch": 1490} {"train_loss": -42.08342742919922, "global_step": 180311, "epoch": 1490} {"train_loss": -42.27067947387695, "global_step": 180312, "epoch": 1490} {"train_loss": -42.152130126953125, "global_step": 180313, "epoch": 1490} {"train_loss": -42.316932678222656, "global_step": 180314, "epoch": 1490} {"train_loss": -42.224822998046875, "global_step": 180315, "epoch": 1490} {"train_loss": -42.246700286865234, "global_step": 180316, "epoch": 1490} {"train_loss": -42.10527038574219, "global_step": 180317, "epoch": 1490} {"train_loss": -42.434017181396484, "global_step": 180318, "epoch": 1490} {"train_loss": -42.22016525268555, "global_step": 180319, "epoch": 1490} {"train_loss": -42.48252868652344, "global_step": 180320, "epoch": 1490} {"train_loss": -42.12062072753906, "global_step": 180321, "epoch": 1490} {"train_loss": -42.55292892456055, "global_step": 180322, "epoch": 1490} {"train_loss": -42.723445892333984, "global_step": 180323, "epoch": 1490} {"train_loss": -42.44538497924805, "global_step": 180324, "epoch": 1490} {"train_loss": -42.065128326416016, "global_step": 180325, "epoch": 1490} {"train_loss": -42.787845611572266, "global_step": 180326, "epoch": 1490} {"train_loss": -42.562957763671875, "global_step": 180327, "epoch": 1490} {"train_loss": -41.7816162109375, "global_step": 180328, "epoch": 1490} {"train_loss": -42.57110595703125, "global_step": 180329, "epoch": 1490} {"train_loss": -42.547576904296875, "global_step": 180330, "epoch": 1490} {"train_loss": -42.306392669677734, "global_step": 180331, "epoch": 1490} {"train_loss": -41.57831954956055, "global_step": 180332, "epoch": 1490} {"train_loss": -41.494163513183594, "global_step": 180333, "epoch": 1490} {"train_loss": -40.807796478271484, "global_step": 180334, "epoch": 1490} {"train_loss": -41.34220504760742, "global_step": 180335, "epoch": 1490} {"train_loss": -42.289913177490234, "global_step": 180336, "epoch": 1490} {"train_loss": -42.579280853271484, "global_step": 180337, "epoch": 1490} {"train_loss": -42.01074981689453, "global_step": 180338, "epoch": 1490} {"train_loss": -41.214210510253906, "global_step": 180339, "epoch": 1490} {"train_loss": -42.133811950683594, "global_step": 180340, "epoch": 1490} {"train_loss": -42.084808349609375, "global_step": 180341, "epoch": 1490} {"train_loss": -41.36227035522461, "global_step": 180342, "epoch": 1490} {"train_loss": -41.41892623901367, "global_step": 180343, "epoch": 1490} {"train_loss": -42.44883346557617, "global_step": 180344, "epoch": 1490} {"train_loss": -41.39814376831055, "global_step": 180345, "epoch": 1490} {"train_loss": -41.05630874633789, "global_step": 180346, "epoch": 1490} {"train_loss": -40.866851806640625, "global_step": 180347, "epoch": 1490} {"train_loss": -40.6251106262207, "global_step": 180348, "epoch": 1490} {"train_loss": -40.7265510559082, "global_step": 180349, "epoch": 1490} {"train_loss": -40.99302291870117, "global_step": 180350, "epoch": 1490} {"train_loss": -41.77039337158203, "global_step": 180351, "epoch": 1490} {"train_loss": -40.46300506591797, "global_step": 180352, "epoch": 1490} {"train_loss": -39.88458251953125, "global_step": 180353, "epoch": 1490} {"train_loss": -37.93906784057617, "global_step": 180354, "epoch": 1490} {"train_loss": -39.63749313354492, "global_step": 180355, "epoch": 1490} {"train_loss": -41.13456344604492, "global_step": 180356, "epoch": 1490} {"train_loss": -38.06850814819336, "global_step": 180357, "epoch": 1490} {"train_loss": -40.682743072509766, "global_step": 180358, "epoch": 1490} {"train_loss": -40.15560531616211, "global_step": 180359, "epoch": 1490} {"train_loss": -39.546504974365234, "global_step": 180360, "epoch": 1490} {"train_loss": -39.802547454833984, "global_step": 180361, "epoch": 1490} {"train_loss": -41.31184768676758, "global_step": 180362, "epoch": 1490} {"train_loss": -40.528900146484375, "global_step": 180363, "epoch": 1490} {"train_loss": -39.69737243652344, "global_step": 180364, "epoch": 1490} {"train_loss": -40.55458450317383, "global_step": 180365, "epoch": 1490} {"train_loss": -40.12220001220703, "global_step": 180366, "epoch": 1490} {"train_loss": -41.468326568603516, "global_step": 180367, "epoch": 1490} {"train_loss": -40.91689682006836, "global_step": 180368, "epoch": 1490} {"train_loss": -39.086544036865234, "global_step": 180369, "epoch": 1490} {"train_loss": -39.8739013671875, "global_step": 180370, "epoch": 1490} {"train_loss": -40.945919036865234, "global_step": 180371, "epoch": 1490} {"train_loss": -41.526283264160156, "global_step": 180372, "epoch": 1490} {"train_loss": -40.780296325683594, "global_step": 180373, "epoch": 1490} {"train_loss": -40.83064651489258, "global_step": 180374, "epoch": 1490} {"train_loss": -41.074764251708984, "global_step": 180375, "epoch": 1490} {"train_loss": -41.43557357788086, "global_step": 180376, "epoch": 1490} {"train_loss": -41.765045166015625, "global_step": 180377, "epoch": 1490} {"train_loss": -40.9510612487793, "global_step": 180378, "epoch": 1490} {"train_loss": -41.30410385131836, "global_step": 180379, "epoch": 1490} {"train_loss": -42.08233642578125, "global_step": 180380, "epoch": 1490} {"train_loss": -41.5352897644043, "global_step": 180381, "epoch": 1490} {"train_loss": -42.0555534362793, "global_step": 180382, "epoch": 1490} {"train_loss": -41.761417388916016, "global_step": 180383, "epoch": 1490} {"train_loss": -41.59621810913086, "global_step": 180384, "epoch": 1490} {"train_loss": -41.64146041870117, "global_step": 180385, "epoch": 1490} {"train_loss": -41.74689865112305, "global_step": 180386, "epoch": 1490} {"train_loss": -41.114898681640625, "global_step": 180387, "epoch": 1490} {"train_loss": -41.454463958740234, "global_step": 180388, "epoch": 1490} {"train_loss": -41.92136764526367, "global_step": 180389, "epoch": 1490} {"train_loss": -42.010921478271484, "global_step": 180390, "epoch": 1490} {"train_loss": -41.815181732177734, "global_step": 180391, "epoch": 1490} {"train_loss": -41.85459518432617, "global_step": 180392, "epoch": 1490} {"train_loss": -41.408477783203125, "global_step": 180393, "epoch": 1490} {"train_loss": -42.08132553100586, "global_step": 180394, "epoch": 1490} {"train_loss": -41.87738800048828, "global_step": 180395, "epoch": 1490} {"train_loss": -41.80754470825195, "global_step": 180396, "epoch": 1490} {"train_loss": -41.755489349365234, "global_step": 180397, "epoch": 1490} {"train_loss": -41.58843994140625, "global_step": 180398, "epoch": 1490} {"train_loss": -41.38676071166992, "global_step": 180399, "epoch": 1490} {"train_loss": -42.332523345947266, "global_step": 180400, "epoch": 1490} {"train_loss": -41.71120834350586, "global_step": 180401, "epoch": 1490} {"train_loss": -42.48683166503906, "global_step": 180402, "epoch": 1490} {"train_loss": -41.961936950683594, "global_step": 180403, "epoch": 1490} {"train_loss": -41.62366485595703, "global_step": 180404, "epoch": 1490} {"train_loss": -42.07943344116211, "global_step": 180405, "epoch": 1490} {"train_loss": -42.31218338012695, "global_step": 180406, "epoch": 1490} {"train_loss": -42.25678634643555, "global_step": 180407, "epoch": 1490} {"train_loss": -42.39644241333008, "global_step": 180408, "epoch": 1490} {"train_loss": -42.64201354980469, "global_step": 180409, "epoch": 1490} {"train_loss": -41.545547264666595, "global_step": 180410, "epoch": 1490, "val_loss": 2681511.25} {"train_loss": -42.05998611450195, "global_step": 180411, "epoch": 1491} {"train_loss": -41.5949592590332, "global_step": 180412, "epoch": 1491} {"train_loss": -42.58159255981445, "global_step": 180413, "epoch": 1491} {"train_loss": -41.834999084472656, "global_step": 180414, "epoch": 1491} {"train_loss": -41.80230712890625, "global_step": 180415, "epoch": 1491} {"train_loss": -40.952274322509766, "global_step": 180416, "epoch": 1491} {"train_loss": -41.395416259765625, "global_step": 180417, "epoch": 1491} {"train_loss": -41.60060501098633, "global_step": 180418, "epoch": 1491} {"train_loss": -41.06406784057617, "global_step": 180419, "epoch": 1491} {"train_loss": -39.1526985168457, "global_step": 180420, "epoch": 1491} {"train_loss": -40.77519989013672, "global_step": 180421, "epoch": 1491} {"train_loss": -41.562679290771484, "global_step": 180422, "epoch": 1491} {"train_loss": -40.686824798583984, "global_step": 180423, "epoch": 1491} {"train_loss": -40.25106430053711, "global_step": 180424, "epoch": 1491} {"train_loss": -39.81135177612305, "global_step": 180425, "epoch": 1491} {"train_loss": -39.48911666870117, "global_step": 180426, "epoch": 1491} {"train_loss": -38.78071975708008, "global_step": 180427, "epoch": 1491} {"train_loss": -40.54288864135742, "global_step": 180428, "epoch": 1491} {"train_loss": -41.11091995239258, "global_step": 180429, "epoch": 1491} {"train_loss": -40.34206008911133, "global_step": 180430, "epoch": 1491} {"train_loss": -40.51133346557617, "global_step": 180431, "epoch": 1491} {"train_loss": -40.339691162109375, "global_step": 180432, "epoch": 1491} {"train_loss": -39.81982421875, "global_step": 180433, "epoch": 1491} {"train_loss": -40.90263366699219, "global_step": 180434, "epoch": 1491} {"train_loss": -40.83924102783203, "global_step": 180435, "epoch": 1491} {"train_loss": -39.31995391845703, "global_step": 180436, "epoch": 1491} {"train_loss": -40.82651138305664, "global_step": 180437, "epoch": 1491} {"train_loss": -38.97074890136719, "global_step": 180438, "epoch": 1491} {"train_loss": -40.280311584472656, "global_step": 180439, "epoch": 1491} {"train_loss": -41.311763763427734, "global_step": 180440, "epoch": 1491} {"train_loss": -39.9608268737793, "global_step": 180441, "epoch": 1491} {"train_loss": -41.2502326965332, "global_step": 180442, "epoch": 1491} {"train_loss": -41.4173698425293, "global_step": 180443, "epoch": 1491} {"train_loss": -41.262847900390625, "global_step": 180444, "epoch": 1491} {"train_loss": -40.88053512573242, "global_step": 180445, "epoch": 1491} {"train_loss": -42.08869552612305, "global_step": 180446, "epoch": 1491} {"train_loss": -41.0825309753418, "global_step": 180447, "epoch": 1491} {"train_loss": -41.54328155517578, "global_step": 180448, "epoch": 1491} {"train_loss": -41.460960388183594, "global_step": 180449, "epoch": 1491} {"train_loss": -41.262691497802734, "global_step": 180450, "epoch": 1491} {"train_loss": -41.366455078125, "global_step": 180451, "epoch": 1491} {"train_loss": -42.126251220703125, "global_step": 180452, "epoch": 1491} {"train_loss": -40.9804801940918, "global_step": 180453, "epoch": 1491} {"train_loss": -42.16701126098633, "global_step": 180454, "epoch": 1491} {"train_loss": -41.3458251953125, "global_step": 180455, "epoch": 1491} {"train_loss": -41.083187103271484, "global_step": 180456, "epoch": 1491} {"train_loss": -41.58937072753906, "global_step": 180457, "epoch": 1491} {"train_loss": -41.85819625854492, "global_step": 180458, "epoch": 1491} {"train_loss": -41.60065460205078, "global_step": 180459, "epoch": 1491} {"train_loss": -41.742340087890625, "global_step": 180460, "epoch": 1491} {"train_loss": -41.86513137817383, "global_step": 180461, "epoch": 1491} {"train_loss": -42.10747146606445, "global_step": 180462, "epoch": 1491} {"train_loss": -41.71200180053711, "global_step": 180463, "epoch": 1491} {"train_loss": -42.13394546508789, "global_step": 180464, "epoch": 1491} {"train_loss": -41.59613800048828, "global_step": 180465, "epoch": 1491} {"train_loss": -41.316497802734375, "global_step": 180466, "epoch": 1491} {"train_loss": -41.29039001464844, "global_step": 180467, "epoch": 1491} {"train_loss": -41.6092643737793, "global_step": 180468, "epoch": 1491} {"train_loss": -40.42139434814453, "global_step": 180469, "epoch": 1491} {"train_loss": -41.28547668457031, "global_step": 180470, "epoch": 1491} {"train_loss": -41.392860412597656, "global_step": 180471, "epoch": 1491} {"train_loss": -40.86349105834961, "global_step": 180472, "epoch": 1491} {"train_loss": -40.5917854309082, "global_step": 180473, "epoch": 1491} {"train_loss": -41.30816650390625, "global_step": 180474, "epoch": 1491} {"train_loss": -41.14203643798828, "global_step": 180475, "epoch": 1491} {"train_loss": -40.99170684814453, "global_step": 180476, "epoch": 1491} {"train_loss": -41.664424896240234, "global_step": 180477, "epoch": 1491} {"train_loss": -40.09293746948242, "global_step": 180478, "epoch": 1491} {"train_loss": -40.452613830566406, "global_step": 180479, "epoch": 1491} {"train_loss": -39.116607666015625, "global_step": 180480, "epoch": 1491} {"train_loss": -40.07314682006836, "global_step": 180481, "epoch": 1491} {"train_loss": -40.08286666870117, "global_step": 180482, "epoch": 1491} {"train_loss": -41.19361114501953, "global_step": 180483, "epoch": 1491} {"train_loss": -40.10590744018555, "global_step": 180484, "epoch": 1491} {"train_loss": -40.06597900390625, "global_step": 180485, "epoch": 1491} {"train_loss": -39.72358322143555, "global_step": 180486, "epoch": 1491} {"train_loss": -41.22883224487305, "global_step": 180487, "epoch": 1491} {"train_loss": -39.89427185058594, "global_step": 180488, "epoch": 1491} {"train_loss": -38.205177307128906, "global_step": 180489, "epoch": 1491} {"train_loss": -41.59201431274414, "global_step": 180490, "epoch": 1491} {"train_loss": -38.53732681274414, "global_step": 180491, "epoch": 1491} {"train_loss": -38.7493782043457, "global_step": 180492, "epoch": 1491} {"train_loss": -40.060935974121094, "global_step": 180493, "epoch": 1491} {"train_loss": -40.9638786315918, "global_step": 180494, "epoch": 1491} {"train_loss": -39.20645523071289, "global_step": 180495, "epoch": 1491} {"train_loss": -40.760658264160156, "global_step": 180496, "epoch": 1491} {"train_loss": -39.71076202392578, "global_step": 180497, "epoch": 1491} {"train_loss": -39.709800720214844, "global_step": 180498, "epoch": 1491} {"train_loss": -41.833866119384766, "global_step": 180499, "epoch": 1491} {"train_loss": -40.50873947143555, "global_step": 180500, "epoch": 1491} {"train_loss": -41.37590408325195, "global_step": 180501, "epoch": 1491} {"train_loss": -41.96110153198242, "global_step": 180502, "epoch": 1491} {"train_loss": -41.815040588378906, "global_step": 180503, "epoch": 1491} {"train_loss": -42.28062057495117, "global_step": 180504, "epoch": 1491} {"train_loss": -41.40855407714844, "global_step": 180505, "epoch": 1491} {"train_loss": -41.866146087646484, "global_step": 180506, "epoch": 1491} {"train_loss": -41.996131896972656, "global_step": 180507, "epoch": 1491} {"train_loss": -41.1115608215332, "global_step": 180508, "epoch": 1491} {"train_loss": -40.51697540283203, "global_step": 180509, "epoch": 1491} {"train_loss": -41.47236251831055, "global_step": 180510, "epoch": 1491} {"train_loss": -41.19559860229492, "global_step": 180511, "epoch": 1491} {"train_loss": -41.264808654785156, "global_step": 180512, "epoch": 1491} {"train_loss": -39.904048919677734, "global_step": 180513, "epoch": 1491} {"train_loss": -38.555904388427734, "global_step": 180514, "epoch": 1491} {"train_loss": -39.336910247802734, "global_step": 180515, "epoch": 1491} {"train_loss": -41.230350494384766, "global_step": 180516, "epoch": 1491} {"train_loss": -41.30243682861328, "global_step": 180517, "epoch": 1491} {"train_loss": -39.22904968261719, "global_step": 180518, "epoch": 1491} {"train_loss": -39.365325927734375, "global_step": 180519, "epoch": 1491} {"train_loss": -41.143310546875, "global_step": 180520, "epoch": 1491} {"train_loss": -42.12937545776367, "global_step": 180521, "epoch": 1491} {"train_loss": -40.37949752807617, "global_step": 180522, "epoch": 1491} {"train_loss": -40.33869552612305, "global_step": 180523, "epoch": 1491} {"train_loss": -41.973419189453125, "global_step": 180524, "epoch": 1491} {"train_loss": -41.58169174194336, "global_step": 180525, "epoch": 1491} {"train_loss": -41.722389221191406, "global_step": 180526, "epoch": 1491} {"train_loss": -42.38345718383789, "global_step": 180527, "epoch": 1491} {"train_loss": -41.64375686645508, "global_step": 180528, "epoch": 1491} {"train_loss": -41.246742248535156, "global_step": 180529, "epoch": 1491} {"train_loss": -42.37893295288086, "global_step": 180530, "epoch": 1491} {"train_loss": -40.9069154597511, "global_step": 180531, "epoch": 1491, "val_loss": 2723402.75} {"train_loss": -41.58496856689453, "global_step": 180532, "epoch": 1492} {"train_loss": -42.638858795166016, "global_step": 180533, "epoch": 1492} {"train_loss": -41.482845306396484, "global_step": 180534, "epoch": 1492} {"train_loss": -41.84189987182617, "global_step": 180535, "epoch": 1492} {"train_loss": -42.461456298828125, "global_step": 180536, "epoch": 1492} {"train_loss": -41.1791877746582, "global_step": 180537, "epoch": 1492} {"train_loss": -42.201393127441406, "global_step": 180538, "epoch": 1492} {"train_loss": -41.65876388549805, "global_step": 180539, "epoch": 1492} {"train_loss": -41.42100143432617, "global_step": 180540, "epoch": 1492} {"train_loss": -41.91838455200195, "global_step": 180541, "epoch": 1492} {"train_loss": -41.172828674316406, "global_step": 180542, "epoch": 1492} {"train_loss": -40.59952163696289, "global_step": 180543, "epoch": 1492} {"train_loss": -40.73474884033203, "global_step": 180544, "epoch": 1492} {"train_loss": -41.11606979370117, "global_step": 180545, "epoch": 1492} {"train_loss": -41.13591384887695, "global_step": 180546, "epoch": 1492} {"train_loss": -42.41675567626953, "global_step": 180547, "epoch": 1492} {"train_loss": -42.03815841674805, "global_step": 180548, "epoch": 1492} {"train_loss": -39.3961067199707, "global_step": 180549, "epoch": 1492} {"train_loss": -41.773040771484375, "global_step": 180550, "epoch": 1492} {"train_loss": -40.603214263916016, "global_step": 180551, "epoch": 1492} {"train_loss": -40.557029724121094, "global_step": 180552, "epoch": 1492} {"train_loss": -40.70412826538086, "global_step": 180553, "epoch": 1492} {"train_loss": -41.049434661865234, "global_step": 180554, "epoch": 1492} {"train_loss": -42.25187301635742, "global_step": 180555, "epoch": 1492} {"train_loss": -40.327449798583984, "global_step": 180556, "epoch": 1492} {"train_loss": -39.53968048095703, "global_step": 180557, "epoch": 1492} {"train_loss": -41.46793746948242, "global_step": 180558, "epoch": 1492} {"train_loss": -40.65803146362305, "global_step": 180559, "epoch": 1492} {"train_loss": -41.24732208251953, "global_step": 180560, "epoch": 1492} {"train_loss": -41.891780853271484, "global_step": 180561, "epoch": 1492} {"train_loss": -41.671852111816406, "global_step": 180562, "epoch": 1492} {"train_loss": -37.43626022338867, "global_step": 180563, "epoch": 1492} {"train_loss": -39.483158111572266, "global_step": 180564, "epoch": 1492} {"train_loss": -42.16522216796875, "global_step": 180565, "epoch": 1492} {"train_loss": -42.4089469909668, "global_step": 180566, "epoch": 1492} {"train_loss": -42.06689453125, "global_step": 180567, "epoch": 1492} {"train_loss": -41.61248779296875, "global_step": 180568, "epoch": 1492} {"train_loss": -41.170284271240234, "global_step": 180569, "epoch": 1492} {"train_loss": -42.224422454833984, "global_step": 180570, "epoch": 1492} {"train_loss": -41.82618713378906, "global_step": 180571, "epoch": 1492} {"train_loss": -41.145904541015625, "global_step": 180572, "epoch": 1492} {"train_loss": -41.3223762512207, "global_step": 180573, "epoch": 1492} {"train_loss": -42.642757415771484, "global_step": 180574, "epoch": 1492} {"train_loss": -42.17002487182617, "global_step": 180575, "epoch": 1492} {"train_loss": -41.18887710571289, "global_step": 180576, "epoch": 1492} {"train_loss": -40.61831283569336, "global_step": 180577, "epoch": 1492} {"train_loss": -40.750709533691406, "global_step": 180578, "epoch": 1492} {"train_loss": -41.39430618286133, "global_step": 180579, "epoch": 1492} {"train_loss": -42.0860710144043, "global_step": 180580, "epoch": 1492} {"train_loss": -41.589725494384766, "global_step": 180581, "epoch": 1492} {"train_loss": -41.962440490722656, "global_step": 180582, "epoch": 1492} {"train_loss": -40.88401412963867, "global_step": 180583, "epoch": 1492} {"train_loss": -40.793304443359375, "global_step": 180584, "epoch": 1492} {"train_loss": -41.25927734375, "global_step": 180585, "epoch": 1492} {"train_loss": -42.0092887878418, "global_step": 180586, "epoch": 1492} {"train_loss": -41.87227249145508, "global_step": 180587, "epoch": 1492} {"train_loss": -41.63548278808594, "global_step": 180588, "epoch": 1492} {"train_loss": -41.25764846801758, "global_step": 180589, "epoch": 1492} {"train_loss": -42.331581115722656, "global_step": 180590, "epoch": 1492} {"train_loss": -41.8076286315918, "global_step": 180591, "epoch": 1492} {"train_loss": -41.28091812133789, "global_step": 180592, "epoch": 1492} {"train_loss": -42.626747131347656, "global_step": 180593, "epoch": 1492} {"train_loss": -42.362648010253906, "global_step": 180594, "epoch": 1492} {"train_loss": -41.58366012573242, "global_step": 180595, "epoch": 1492} {"train_loss": -41.86836624145508, "global_step": 180596, "epoch": 1492} {"train_loss": -42.443782806396484, "global_step": 180597, "epoch": 1492} {"train_loss": -41.851837158203125, "global_step": 180598, "epoch": 1492} {"train_loss": -41.61101150512695, "global_step": 180599, "epoch": 1492} {"train_loss": -42.35003662109375, "global_step": 180600, "epoch": 1492} {"train_loss": -42.00139236450195, "global_step": 180601, "epoch": 1492} {"train_loss": -42.4788932800293, "global_step": 180602, "epoch": 1492} {"train_loss": -42.055599212646484, "global_step": 180603, "epoch": 1492} {"train_loss": -41.3070068359375, "global_step": 180604, "epoch": 1492} {"train_loss": -42.2337646484375, "global_step": 180605, "epoch": 1492} {"train_loss": -41.792240142822266, "global_step": 180606, "epoch": 1492} {"train_loss": -40.24397659301758, "global_step": 180607, "epoch": 1492} {"train_loss": -42.49119567871094, "global_step": 180608, "epoch": 1492} {"train_loss": -41.24279022216797, "global_step": 180609, "epoch": 1492} {"train_loss": -40.597835540771484, "global_step": 180610, "epoch": 1492} {"train_loss": -41.72678756713867, "global_step": 180611, "epoch": 1492} {"train_loss": -41.1866569519043, "global_step": 180612, "epoch": 1492} {"train_loss": -41.58036422729492, "global_step": 180613, "epoch": 1492} {"train_loss": -41.2127799987793, "global_step": 180614, "epoch": 1492} {"train_loss": -40.81884002685547, "global_step": 180615, "epoch": 1492} {"train_loss": -42.2027587890625, "global_step": 180616, "epoch": 1492} {"train_loss": -41.36705017089844, "global_step": 180617, "epoch": 1492} {"train_loss": -41.11009979248047, "global_step": 180618, "epoch": 1492} {"train_loss": -41.21440505981445, "global_step": 180619, "epoch": 1492} {"train_loss": -42.23518371582031, "global_step": 180620, "epoch": 1492} {"train_loss": -42.039737701416016, "global_step": 180621, "epoch": 1492} {"train_loss": -41.023170471191406, "global_step": 180622, "epoch": 1492} {"train_loss": -41.12323760986328, "global_step": 180623, "epoch": 1492} {"train_loss": -42.147945404052734, "global_step": 180624, "epoch": 1492} {"train_loss": -42.34417724609375, "global_step": 180625, "epoch": 1492} {"train_loss": -41.127532958984375, "global_step": 180626, "epoch": 1492} {"train_loss": -40.691219329833984, "global_step": 180627, "epoch": 1492} {"train_loss": -40.74239730834961, "global_step": 180628, "epoch": 1492} {"train_loss": -41.96612548828125, "global_step": 180629, "epoch": 1492} {"train_loss": -42.02454376220703, "global_step": 180630, "epoch": 1492} {"train_loss": -41.613468170166016, "global_step": 180631, "epoch": 1492} {"train_loss": -41.66366195678711, "global_step": 180632, "epoch": 1492} {"train_loss": -41.87042999267578, "global_step": 180633, "epoch": 1492} {"train_loss": -41.16071701049805, "global_step": 180634, "epoch": 1492} {"train_loss": -40.803096771240234, "global_step": 180635, "epoch": 1492} {"train_loss": -41.87568283081055, "global_step": 180636, "epoch": 1492} {"train_loss": -42.09577178955078, "global_step": 180637, "epoch": 1492} {"train_loss": -41.36208724975586, "global_step": 180638, "epoch": 1492} {"train_loss": -41.999107360839844, "global_step": 180639, "epoch": 1492} {"train_loss": -41.82987594604492, "global_step": 180640, "epoch": 1492} {"train_loss": -41.42885208129883, "global_step": 180641, "epoch": 1492} {"train_loss": -39.31606674194336, "global_step": 180642, "epoch": 1492} {"train_loss": -40.026859283447266, "global_step": 180643, "epoch": 1492} {"train_loss": -41.34218978881836, "global_step": 180644, "epoch": 1492} {"train_loss": -41.395320892333984, "global_step": 180645, "epoch": 1492} {"train_loss": -39.927852630615234, "global_step": 180646, "epoch": 1492} {"train_loss": -40.501731872558594, "global_step": 180647, "epoch": 1492} {"train_loss": -37.93195724487305, "global_step": 180648, "epoch": 1492} {"train_loss": -41.846038818359375, "global_step": 180649, "epoch": 1492} {"train_loss": -35.913875579833984, "global_step": 180650, "epoch": 1492} {"train_loss": -36.42409133911133, "global_step": 180651, "epoch": 1492} {"train_loss": -41.226513728622564, "global_step": 180652, "epoch": 1492, "val_loss": 2707704.0} {"train_loss": -33.8336296081543, "global_step": 180653, "epoch": 1493} {"train_loss": -24.206281661987305, "global_step": 180654, "epoch": 1493} {"train_loss": 46.67314147949219, "global_step": 180655, "epoch": 1493} {"train_loss": 29.831357955932617, "global_step": 180656, "epoch": 1493} {"train_loss": 1.2299976348876953, "global_step": 180657, "epoch": 1493} {"train_loss": 8.654643058776855, "global_step": 180658, "epoch": 1493} {"train_loss": -3.2664456367492676, "global_step": 180659, "epoch": 1493} {"train_loss": -11.482086181640625, "global_step": 180660, "epoch": 1493} {"train_loss": -6.743592739105225, "global_step": 180661, "epoch": 1493} {"train_loss": -10.849539756774902, "global_step": 180662, "epoch": 1493} {"train_loss": -24.606685638427734, "global_step": 180663, "epoch": 1493} {"train_loss": -26.16861915588379, "global_step": 180664, "epoch": 1493} {"train_loss": -17.7817440032959, "global_step": 180665, "epoch": 1493} {"train_loss": -21.875654220581055, "global_step": 180666, "epoch": 1493} {"train_loss": -29.64423179626465, "global_step": 180667, "epoch": 1493} {"train_loss": -30.79949951171875, "global_step": 180668, "epoch": 1493} {"train_loss": -27.54180908203125, "global_step": 180669, "epoch": 1493} {"train_loss": -27.178747177124023, "global_step": 180670, "epoch": 1493} {"train_loss": -29.744922637939453, "global_step": 180671, "epoch": 1493} {"train_loss": -30.39999771118164, "global_step": 180672, "epoch": 1493} {"train_loss": -32.56645965576172, "global_step": 180673, "epoch": 1493} {"train_loss": -32.24836349487305, "global_step": 180674, "epoch": 1493} {"train_loss": -33.1898307800293, "global_step": 180675, "epoch": 1493} {"train_loss": -32.68085479736328, "global_step": 180676, "epoch": 1493} {"train_loss": -31.39446449279785, "global_step": 180677, "epoch": 1493} {"train_loss": -31.736724853515625, "global_step": 180678, "epoch": 1493} {"train_loss": -33.034481048583984, "global_step": 180679, "epoch": 1493} {"train_loss": -34.4079704284668, "global_step": 180680, "epoch": 1493} {"train_loss": -34.72427749633789, "global_step": 180681, "epoch": 1493} {"train_loss": -35.02985382080078, "global_step": 180682, "epoch": 1493} {"train_loss": -35.71187973022461, "global_step": 180683, "epoch": 1493} {"train_loss": -34.93264389038086, "global_step": 180684, "epoch": 1493} {"train_loss": -35.27273941040039, "global_step": 180685, "epoch": 1493} {"train_loss": -35.39899826049805, "global_step": 180686, "epoch": 1493} {"train_loss": -34.00804138183594, "global_step": 180687, "epoch": 1493} {"train_loss": -34.3739013671875, "global_step": 180688, "epoch": 1493} {"train_loss": -34.96833419799805, "global_step": 180689, "epoch": 1493} {"train_loss": -36.105613708496094, "global_step": 180690, "epoch": 1493} {"train_loss": -35.992244720458984, "global_step": 180691, "epoch": 1493} {"train_loss": -36.08578109741211, "global_step": 180692, "epoch": 1493} {"train_loss": -36.054988861083984, "global_step": 180693, "epoch": 1493} {"train_loss": -36.36416244506836, "global_step": 180694, "epoch": 1493} {"train_loss": -35.988582611083984, "global_step": 180695, "epoch": 1493} {"train_loss": -35.9676513671875, "global_step": 180696, "epoch": 1493} {"train_loss": -35.66864013671875, "global_step": 180697, "epoch": 1493} {"train_loss": -36.44025421142578, "global_step": 180698, "epoch": 1493} {"train_loss": -36.524024963378906, "global_step": 180699, "epoch": 1493} {"train_loss": -36.53006362915039, "global_step": 180700, "epoch": 1493} {"train_loss": -36.84836959838867, "global_step": 180701, "epoch": 1493} {"train_loss": -37.129730224609375, "global_step": 180702, "epoch": 1493} {"train_loss": -37.491363525390625, "global_step": 180703, "epoch": 1493} {"train_loss": -37.06474685668945, "global_step": 180704, "epoch": 1493} {"train_loss": -37.37555694580078, "global_step": 180705, "epoch": 1493} {"train_loss": -37.07990264892578, "global_step": 180706, "epoch": 1493} {"train_loss": -37.31376647949219, "global_step": 180707, "epoch": 1493} {"train_loss": -37.298492431640625, "global_step": 180708, "epoch": 1493} {"train_loss": -37.77099609375, "global_step": 180709, "epoch": 1493} {"train_loss": -37.135658264160156, "global_step": 180710, "epoch": 1493} {"train_loss": -38.094512939453125, "global_step": 180711, "epoch": 1493} {"train_loss": -38.188697814941406, "global_step": 180712, "epoch": 1493} {"train_loss": -37.97578811645508, "global_step": 180713, "epoch": 1493} {"train_loss": -37.81935119628906, "global_step": 180714, "epoch": 1493} {"train_loss": -38.69674301147461, "global_step": 180715, "epoch": 1493} {"train_loss": -38.4695930480957, "global_step": 180716, "epoch": 1493} {"train_loss": -38.45060729980469, "global_step": 180717, "epoch": 1493} {"train_loss": -37.8848991394043, "global_step": 180718, "epoch": 1493} {"train_loss": -38.324119567871094, "global_step": 180719, "epoch": 1493} {"train_loss": -37.79365158081055, "global_step": 180720, "epoch": 1493} {"train_loss": -38.47352981567383, "global_step": 180721, "epoch": 1493} {"train_loss": -39.04823684692383, "global_step": 180722, "epoch": 1493} {"train_loss": -38.33805465698242, "global_step": 180723, "epoch": 1493} {"train_loss": -38.5481071472168, "global_step": 180724, "epoch": 1493} {"train_loss": -38.92607116699219, "global_step": 180725, "epoch": 1493} {"train_loss": -39.043148040771484, "global_step": 180726, "epoch": 1493} {"train_loss": -38.6839714050293, "global_step": 180727, "epoch": 1493} {"train_loss": -38.80322265625, "global_step": 180728, "epoch": 1493} {"train_loss": -38.520790100097656, "global_step": 180729, "epoch": 1493} {"train_loss": -39.052730560302734, "global_step": 180730, "epoch": 1493} {"train_loss": -39.19942092895508, "global_step": 180731, "epoch": 1493} {"train_loss": -39.33875274658203, "global_step": 180732, "epoch": 1493} {"train_loss": -39.04926681518555, "global_step": 180733, "epoch": 1493} {"train_loss": -39.59885787963867, "global_step": 180734, "epoch": 1493} {"train_loss": -39.22612380981445, "global_step": 180735, "epoch": 1493} {"train_loss": -39.4357795715332, "global_step": 180736, "epoch": 1493} {"train_loss": -39.352569580078125, "global_step": 180737, "epoch": 1493} {"train_loss": -39.981231689453125, "global_step": 180738, "epoch": 1493} {"train_loss": -39.79888916015625, "global_step": 180739, "epoch": 1493} {"train_loss": -39.50936508178711, "global_step": 180740, "epoch": 1493} {"train_loss": -39.71613693237305, "global_step": 180741, "epoch": 1493} {"train_loss": -39.449398040771484, "global_step": 180742, "epoch": 1493} {"train_loss": -40.22136306762695, "global_step": 180743, "epoch": 1493} {"train_loss": -39.85380935668945, "global_step": 180744, "epoch": 1493} {"train_loss": -39.832942962646484, "global_step": 180745, "epoch": 1493} {"train_loss": -39.62485885620117, "global_step": 180746, "epoch": 1493} {"train_loss": -40.17823028564453, "global_step": 180747, "epoch": 1493} {"train_loss": -39.847633361816406, "global_step": 180748, "epoch": 1493} {"train_loss": -40.25069046020508, "global_step": 180749, "epoch": 1493} {"train_loss": -40.60321807861328, "global_step": 180750, "epoch": 1493} {"train_loss": -40.438167572021484, "global_step": 180751, "epoch": 1493} {"train_loss": -40.401912689208984, "global_step": 180752, "epoch": 1493} {"train_loss": -40.297115325927734, "global_step": 180753, "epoch": 1493} {"train_loss": -40.022850036621094, "global_step": 180754, "epoch": 1493} {"train_loss": -40.14789962768555, "global_step": 180755, "epoch": 1493} {"train_loss": -40.62836456298828, "global_step": 180756, "epoch": 1493} {"train_loss": -40.73720932006836, "global_step": 180757, "epoch": 1493} {"train_loss": -40.94678497314453, "global_step": 180758, "epoch": 1493} {"train_loss": -40.61088180541992, "global_step": 180759, "epoch": 1493} {"train_loss": -40.34060287475586, "global_step": 180760, "epoch": 1493} {"train_loss": -40.86753463745117, "global_step": 180761, "epoch": 1493} {"train_loss": -40.749114990234375, "global_step": 180762, "epoch": 1493} {"train_loss": -40.9495735168457, "global_step": 180763, "epoch": 1493} {"train_loss": -40.72181701660156, "global_step": 180764, "epoch": 1493} {"train_loss": -40.604183197021484, "global_step": 180765, "epoch": 1493} {"train_loss": -40.839534759521484, "global_step": 180766, "epoch": 1493} {"train_loss": -40.80842208862305, "global_step": 180767, "epoch": 1493} {"train_loss": -41.29081344604492, "global_step": 180768, "epoch": 1493} {"train_loss": -41.17546463012695, "global_step": 180769, "epoch": 1493} {"train_loss": -41.1087646484375, "global_step": 180770, "epoch": 1493} {"train_loss": -40.958675384521484, "global_step": 180771, "epoch": 1493} {"train_loss": -40.907249450683594, "global_step": 180772, "epoch": 1493} {"train_loss": -34.014239319099865, "global_step": 180773, "epoch": 1493, "val_loss": 2712458.75} {"train_loss": -41.11488342285156, "global_step": 180774, "epoch": 1494} {"train_loss": -41.2032585144043, "global_step": 180775, "epoch": 1494} {"train_loss": -41.2153434753418, "global_step": 180776, "epoch": 1494} {"train_loss": -41.36468505859375, "global_step": 180777, "epoch": 1494} {"train_loss": -41.482418060302734, "global_step": 180778, "epoch": 1494} {"train_loss": -41.2354850769043, "global_step": 180779, "epoch": 1494} {"train_loss": -41.24994659423828, "global_step": 180780, "epoch": 1494} {"train_loss": -41.76271438598633, "global_step": 180781, "epoch": 1494} {"train_loss": -41.501014709472656, "global_step": 180782, "epoch": 1494} {"train_loss": -41.6039924621582, "global_step": 180783, "epoch": 1494} {"train_loss": -41.40190505981445, "global_step": 180784, "epoch": 1494} {"train_loss": -41.667903900146484, "global_step": 180785, "epoch": 1494} {"train_loss": -41.69855880737305, "global_step": 180786, "epoch": 1494} {"train_loss": -41.976497650146484, "global_step": 180787, "epoch": 1494} {"train_loss": -41.65729522705078, "global_step": 180788, "epoch": 1494} {"train_loss": -41.904815673828125, "global_step": 180789, "epoch": 1494} {"train_loss": -41.882747650146484, "global_step": 180790, "epoch": 1494} {"train_loss": -41.96175003051758, "global_step": 180791, "epoch": 1494} {"train_loss": -41.714569091796875, "global_step": 180792, "epoch": 1494} {"train_loss": -41.85284423828125, "global_step": 180793, "epoch": 1494} {"train_loss": -41.9421501159668, "global_step": 180794, "epoch": 1494} {"train_loss": -41.70676803588867, "global_step": 180795, "epoch": 1494} {"train_loss": -41.94932174682617, "global_step": 180796, "epoch": 1494} {"train_loss": -41.6612663269043, "global_step": 180797, "epoch": 1494} {"train_loss": -41.91006088256836, "global_step": 180798, "epoch": 1494} {"train_loss": -42.20979690551758, "global_step": 180799, "epoch": 1494} {"train_loss": -42.20264434814453, "global_step": 180800, "epoch": 1494} {"train_loss": -42.09952926635742, "global_step": 180801, "epoch": 1494} {"train_loss": -41.7619743347168, "global_step": 180802, "epoch": 1494} {"train_loss": -41.993221282958984, "global_step": 180803, "epoch": 1494} {"train_loss": -42.12401580810547, "global_step": 180804, "epoch": 1494} {"train_loss": -41.03255844116211, "global_step": 180805, "epoch": 1494} {"train_loss": -42.13172912597656, "global_step": 180806, "epoch": 1494} {"train_loss": -41.785274505615234, "global_step": 180807, "epoch": 1494} {"train_loss": -41.72176742553711, "global_step": 180808, "epoch": 1494} {"train_loss": -42.2069206237793, "global_step": 180809, "epoch": 1494} {"train_loss": -42.14041519165039, "global_step": 180810, "epoch": 1494} {"train_loss": -42.361976623535156, "global_step": 180811, "epoch": 1494} {"train_loss": -42.388580322265625, "global_step": 180812, "epoch": 1494} {"train_loss": -41.88916015625, "global_step": 180813, "epoch": 1494} {"train_loss": -42.37226486206055, "global_step": 180814, "epoch": 1494} {"train_loss": -41.93547439575195, "global_step": 180815, "epoch": 1494} {"train_loss": -42.1204833984375, "global_step": 180816, "epoch": 1494} {"train_loss": -42.2502326965332, "global_step": 180817, "epoch": 1494} {"train_loss": -42.51585006713867, "global_step": 180818, "epoch": 1494} {"train_loss": -42.16719055175781, "global_step": 180819, "epoch": 1494} {"train_loss": -41.4304313659668, "global_step": 180820, "epoch": 1494} {"train_loss": -41.32136154174805, "global_step": 180821, "epoch": 1494} {"train_loss": -41.41439437866211, "global_step": 180822, "epoch": 1494} {"train_loss": -42.088890075683594, "global_step": 180823, "epoch": 1494} {"train_loss": -42.23939514160156, "global_step": 180824, "epoch": 1494} {"train_loss": -41.24671173095703, "global_step": 180825, "epoch": 1494} {"train_loss": -40.41693878173828, "global_step": 180826, "epoch": 1494} {"train_loss": -39.574867248535156, "global_step": 180827, "epoch": 1494} {"train_loss": -38.61522674560547, "global_step": 180828, "epoch": 1494} {"train_loss": -41.539363861083984, "global_step": 180829, "epoch": 1494} {"train_loss": -38.59293746948242, "global_step": 180830, "epoch": 1494} {"train_loss": -37.746124267578125, "global_step": 180831, "epoch": 1494} {"train_loss": -39.73085403442383, "global_step": 180832, "epoch": 1494} {"train_loss": -39.9072380065918, "global_step": 180833, "epoch": 1494} {"train_loss": -38.21699142456055, "global_step": 180834, "epoch": 1494} {"train_loss": -36.89619445800781, "global_step": 180835, "epoch": 1494} {"train_loss": -39.60258102416992, "global_step": 180836, "epoch": 1494} {"train_loss": -40.08786392211914, "global_step": 180837, "epoch": 1494} {"train_loss": -36.424476623535156, "global_step": 180838, "epoch": 1494} {"train_loss": -39.79821014404297, "global_step": 180839, "epoch": 1494} {"train_loss": -39.544368743896484, "global_step": 180840, "epoch": 1494} {"train_loss": -38.18084716796875, "global_step": 180841, "epoch": 1494} {"train_loss": -40.116912841796875, "global_step": 180842, "epoch": 1494} {"train_loss": -39.6051025390625, "global_step": 180843, "epoch": 1494} {"train_loss": -39.64396286010742, "global_step": 180844, "epoch": 1494} {"train_loss": -39.64856719970703, "global_step": 180845, "epoch": 1494} {"train_loss": -39.26337814331055, "global_step": 180846, "epoch": 1494} {"train_loss": -39.88833236694336, "global_step": 180847, "epoch": 1494} {"train_loss": -39.35951614379883, "global_step": 180848, "epoch": 1494} {"train_loss": -39.83515548706055, "global_step": 180849, "epoch": 1494} {"train_loss": -40.0933952331543, "global_step": 180850, "epoch": 1494} {"train_loss": -40.21830368041992, "global_step": 180851, "epoch": 1494} {"train_loss": -38.545021057128906, "global_step": 180852, "epoch": 1494} {"train_loss": -41.168209075927734, "global_step": 180853, "epoch": 1494} {"train_loss": -39.092552185058594, "global_step": 180854, "epoch": 1494} {"train_loss": -40.8623046875, "global_step": 180855, "epoch": 1494} {"train_loss": -39.57693862915039, "global_step": 180856, "epoch": 1494} {"train_loss": -40.9455680847168, "global_step": 180857, "epoch": 1494} {"train_loss": -40.4658203125, "global_step": 180858, "epoch": 1494} {"train_loss": -40.88393783569336, "global_step": 180859, "epoch": 1494} {"train_loss": -39.421775817871094, "global_step": 180860, "epoch": 1494} {"train_loss": -40.8770866394043, "global_step": 180861, "epoch": 1494} {"train_loss": -40.524410247802734, "global_step": 180862, "epoch": 1494} {"train_loss": -39.24250411987305, "global_step": 180863, "epoch": 1494} {"train_loss": -40.45014190673828, "global_step": 180864, "epoch": 1494} {"train_loss": -40.83650588989258, "global_step": 180865, "epoch": 1494} {"train_loss": -40.08876419067383, "global_step": 180866, "epoch": 1494} {"train_loss": -41.18299102783203, "global_step": 180867, "epoch": 1494} {"train_loss": -40.455238342285156, "global_step": 180868, "epoch": 1494} {"train_loss": -41.26457977294922, "global_step": 180869, "epoch": 1494} {"train_loss": -41.33042526245117, "global_step": 180870, "epoch": 1494} {"train_loss": -40.94123077392578, "global_step": 180871, "epoch": 1494} {"train_loss": -41.590938568115234, "global_step": 180872, "epoch": 1494} {"train_loss": -41.76932907104492, "global_step": 180873, "epoch": 1494} {"train_loss": -41.75507736206055, "global_step": 180874, "epoch": 1494} {"train_loss": -41.3210563659668, "global_step": 180875, "epoch": 1494} {"train_loss": -41.285945892333984, "global_step": 180876, "epoch": 1494} {"train_loss": -41.4279899597168, "global_step": 180877, "epoch": 1494} {"train_loss": -41.79369354248047, "global_step": 180878, "epoch": 1494} {"train_loss": -41.22076416015625, "global_step": 180879, "epoch": 1494} {"train_loss": -40.99660110473633, "global_step": 180880, "epoch": 1494} {"train_loss": -41.51186752319336, "global_step": 180881, "epoch": 1494} {"train_loss": -41.3499870300293, "global_step": 180882, "epoch": 1494} {"train_loss": -42.01520538330078, "global_step": 180883, "epoch": 1494} {"train_loss": -42.03911209106445, "global_step": 180884, "epoch": 1494} {"train_loss": -42.03215408325195, "global_step": 180885, "epoch": 1494} {"train_loss": -41.698822021484375, "global_step": 180886, "epoch": 1494} {"train_loss": -41.826107025146484, "global_step": 180887, "epoch": 1494} {"train_loss": -42.26919174194336, "global_step": 180888, "epoch": 1494} {"train_loss": -42.330745697021484, "global_step": 180889, "epoch": 1494} {"train_loss": -42.2169075012207, "global_step": 180890, "epoch": 1494} {"train_loss": -42.36764144897461, "global_step": 180891, "epoch": 1494} {"train_loss": -42.074214935302734, "global_step": 180892, "epoch": 1494} {"train_loss": -42.099082946777344, "global_step": 180893, "epoch": 1494} {"train_loss": -41.04062526482196, "global_step": 180894, "epoch": 1494, "val_loss": 2721948.75} {"train_loss": -42.74042892456055, "global_step": 180895, "epoch": 1495} {"train_loss": -41.7183837890625, "global_step": 180896, "epoch": 1495} {"train_loss": -42.13245391845703, "global_step": 180897, "epoch": 1495} {"train_loss": -41.94181823730469, "global_step": 180898, "epoch": 1495} {"train_loss": -42.042579650878906, "global_step": 180899, "epoch": 1495} {"train_loss": -41.98701858520508, "global_step": 180900, "epoch": 1495} {"train_loss": -42.18610382080078, "global_step": 180901, "epoch": 1495} {"train_loss": -41.762306213378906, "global_step": 180902, "epoch": 1495} {"train_loss": -41.26408004760742, "global_step": 180903, "epoch": 1495} {"train_loss": -42.553367614746094, "global_step": 180904, "epoch": 1495} {"train_loss": -40.916954040527344, "global_step": 180905, "epoch": 1495} {"train_loss": -41.148868560791016, "global_step": 180906, "epoch": 1495} {"train_loss": -41.98651123046875, "global_step": 180907, "epoch": 1495} {"train_loss": -40.82319641113281, "global_step": 180908, "epoch": 1495} {"train_loss": -41.534271240234375, "global_step": 180909, "epoch": 1495} {"train_loss": -40.222267150878906, "global_step": 180910, "epoch": 1495} {"train_loss": -42.071632385253906, "global_step": 180911, "epoch": 1495} {"train_loss": -41.53585433959961, "global_step": 180912, "epoch": 1495} {"train_loss": -41.23728561401367, "global_step": 180913, "epoch": 1495} {"train_loss": -41.24906539916992, "global_step": 180914, "epoch": 1495} {"train_loss": -39.48529815673828, "global_step": 180915, "epoch": 1495} {"train_loss": -38.71273422241211, "global_step": 180916, "epoch": 1495} {"train_loss": -39.74576950073242, "global_step": 180917, "epoch": 1495} {"train_loss": -39.485496520996094, "global_step": 180918, "epoch": 1495} {"train_loss": -40.523841857910156, "global_step": 180919, "epoch": 1495} {"train_loss": -40.746089935302734, "global_step": 180920, "epoch": 1495} {"train_loss": -39.6158561706543, "global_step": 180921, "epoch": 1495} {"train_loss": -41.02598571777344, "global_step": 180922, "epoch": 1495} {"train_loss": -41.37690353393555, "global_step": 180923, "epoch": 1495} {"train_loss": -41.164764404296875, "global_step": 180924, "epoch": 1495} {"train_loss": -41.18516540527344, "global_step": 180925, "epoch": 1495} {"train_loss": -40.77822494506836, "global_step": 180926, "epoch": 1495} {"train_loss": -41.82135772705078, "global_step": 180927, "epoch": 1495} {"train_loss": -40.456207275390625, "global_step": 180928, "epoch": 1495} {"train_loss": -41.72500228881836, "global_step": 180929, "epoch": 1495} {"train_loss": -41.64204025268555, "global_step": 180930, "epoch": 1495} {"train_loss": -41.2811279296875, "global_step": 180931, "epoch": 1495} {"train_loss": -41.94106674194336, "global_step": 180932, "epoch": 1495} {"train_loss": -40.9288444519043, "global_step": 180933, "epoch": 1495} {"train_loss": -41.675018310546875, "global_step": 180934, "epoch": 1495} {"train_loss": -41.594085693359375, "global_step": 180935, "epoch": 1495} {"train_loss": -41.8983039855957, "global_step": 180936, "epoch": 1495} {"train_loss": -41.95914840698242, "global_step": 180937, "epoch": 1495} {"train_loss": -41.99351119995117, "global_step": 180938, "epoch": 1495} {"train_loss": -41.79340744018555, "global_step": 180939, "epoch": 1495} {"train_loss": -41.9286003112793, "global_step": 180940, "epoch": 1495} {"train_loss": -41.73481369018555, "global_step": 180941, "epoch": 1495} {"train_loss": -41.21624755859375, "global_step": 180942, "epoch": 1495} {"train_loss": -41.55401611328125, "global_step": 180943, "epoch": 1495} {"train_loss": -41.90321350097656, "global_step": 180944, "epoch": 1495} {"train_loss": -41.66075897216797, "global_step": 180945, "epoch": 1495} {"train_loss": -41.54453659057617, "global_step": 180946, "epoch": 1495} {"train_loss": -42.088157653808594, "global_step": 180947, "epoch": 1495} {"train_loss": -41.682525634765625, "global_step": 180948, "epoch": 1495} {"train_loss": -41.658634185791016, "global_step": 180949, "epoch": 1495} {"train_loss": -41.291969299316406, "global_step": 180950, "epoch": 1495} {"train_loss": -40.52384567260742, "global_step": 180951, "epoch": 1495} {"train_loss": -39.189796447753906, "global_step": 180952, "epoch": 1495} {"train_loss": -38.17048645019531, "global_step": 180953, "epoch": 1495} {"train_loss": -40.49665451049805, "global_step": 180954, "epoch": 1495} {"train_loss": -42.529441833496094, "global_step": 180955, "epoch": 1495} {"train_loss": -41.4780387878418, "global_step": 180956, "epoch": 1495} {"train_loss": -39.50571060180664, "global_step": 180957, "epoch": 1495} {"train_loss": -40.28707504272461, "global_step": 180958, "epoch": 1495} {"train_loss": -42.247520446777344, "global_step": 180959, "epoch": 1495} {"train_loss": -39.219112396240234, "global_step": 180960, "epoch": 1495} {"train_loss": -35.0059814453125, "global_step": 180961, "epoch": 1495} {"train_loss": -41.15306091308594, "global_step": 180962, "epoch": 1495} {"train_loss": -41.136104583740234, "global_step": 180963, "epoch": 1495} {"train_loss": -36.845069885253906, "global_step": 180964, "epoch": 1495} {"train_loss": -35.52403259277344, "global_step": 180965, "epoch": 1495} {"train_loss": -40.654823303222656, "global_step": 180966, "epoch": 1495} {"train_loss": -37.855831146240234, "global_step": 180967, "epoch": 1495} {"train_loss": -33.65983963012695, "global_step": 180968, "epoch": 1495} {"train_loss": -41.39387893676758, "global_step": 180969, "epoch": 1495} {"train_loss": -38.77235794067383, "global_step": 180970, "epoch": 1495} {"train_loss": -40.51301574707031, "global_step": 180971, "epoch": 1495} {"train_loss": -37.8713493347168, "global_step": 180972, "epoch": 1495} {"train_loss": -38.181640625, "global_step": 180973, "epoch": 1495} {"train_loss": -39.92831039428711, "global_step": 180974, "epoch": 1495} {"train_loss": -36.0153694152832, "global_step": 180975, "epoch": 1495} {"train_loss": -41.26054000854492, "global_step": 180976, "epoch": 1495} {"train_loss": -37.974544525146484, "global_step": 180977, "epoch": 1495} {"train_loss": -41.21887969970703, "global_step": 180978, "epoch": 1495} {"train_loss": -38.11269760131836, "global_step": 180979, "epoch": 1495} {"train_loss": -41.45817184448242, "global_step": 180980, "epoch": 1495} {"train_loss": -39.63969421386719, "global_step": 180981, "epoch": 1495} {"train_loss": -41.697750091552734, "global_step": 180982, "epoch": 1495} {"train_loss": -40.10544204711914, "global_step": 180983, "epoch": 1495} {"train_loss": -41.71805191040039, "global_step": 180984, "epoch": 1495} {"train_loss": -40.6591796875, "global_step": 180985, "epoch": 1495} {"train_loss": -41.299617767333984, "global_step": 180986, "epoch": 1495} {"train_loss": -40.98708724975586, "global_step": 180987, "epoch": 1495} {"train_loss": -41.2499885559082, "global_step": 180988, "epoch": 1495} {"train_loss": -41.4827995300293, "global_step": 180989, "epoch": 1495} {"train_loss": -41.34022903442383, "global_step": 180990, "epoch": 1495} {"train_loss": -41.958740234375, "global_step": 180991, "epoch": 1495} {"train_loss": -41.58039474487305, "global_step": 180992, "epoch": 1495} {"train_loss": -41.73395919799805, "global_step": 180993, "epoch": 1495} {"train_loss": -41.351802825927734, "global_step": 180994, "epoch": 1495} {"train_loss": -41.7578010559082, "global_step": 180995, "epoch": 1495} {"train_loss": -41.64316940307617, "global_step": 180996, "epoch": 1495} {"train_loss": -41.08356857299805, "global_step": 180997, "epoch": 1495} {"train_loss": -41.48503875732422, "global_step": 180998, "epoch": 1495} {"train_loss": -41.81950378417969, "global_step": 180999, "epoch": 1495} {"train_loss": -41.62162399291992, "global_step": 181000, "epoch": 1495} {"train_loss": -41.71133041381836, "global_step": 181001, "epoch": 1495} {"train_loss": -42.2734489440918, "global_step": 181002, "epoch": 1495} {"train_loss": -41.89293670654297, "global_step": 181003, "epoch": 1495} {"train_loss": -42.02920913696289, "global_step": 181004, "epoch": 1495} {"train_loss": -41.89443588256836, "global_step": 181005, "epoch": 1495} {"train_loss": -42.34108352661133, "global_step": 181006, "epoch": 1495} {"train_loss": -41.94377517700195, "global_step": 181007, "epoch": 1495} {"train_loss": -42.22040939331055, "global_step": 181008, "epoch": 1495} {"train_loss": -42.116695404052734, "global_step": 181009, "epoch": 1495} {"train_loss": -42.41845703125, "global_step": 181010, "epoch": 1495} {"train_loss": -42.3541259765625, "global_step": 181011, "epoch": 1495} {"train_loss": -41.802616119384766, "global_step": 181012, "epoch": 1495} {"train_loss": -42.1571159362793, "global_step": 181013, "epoch": 1495} {"train_loss": -42.25738525390625, "global_step": 181014, "epoch": 1495} {"train_loss": -40.925406936771616, "global_step": 181015, "epoch": 1495, "val_loss": 2716464.5} {"train_loss": -42.23382568359375, "global_step": 181016, "epoch": 1496} {"train_loss": -42.67183303833008, "global_step": 181017, "epoch": 1496} {"train_loss": -42.242431640625, "global_step": 181018, "epoch": 1496} {"train_loss": -42.114376068115234, "global_step": 181019, "epoch": 1496} {"train_loss": -42.40456771850586, "global_step": 181020, "epoch": 1496} {"train_loss": -42.79051971435547, "global_step": 181021, "epoch": 1496} {"train_loss": -41.98924255371094, "global_step": 181022, "epoch": 1496} {"train_loss": -42.706390380859375, "global_step": 181023, "epoch": 1496} {"train_loss": -42.64631271362305, "global_step": 181024, "epoch": 1496} {"train_loss": -42.7158317565918, "global_step": 181025, "epoch": 1496} {"train_loss": -42.3636360168457, "global_step": 181026, "epoch": 1496} {"train_loss": -41.9950065612793, "global_step": 181027, "epoch": 1496} {"train_loss": -41.7781982421875, "global_step": 181028, "epoch": 1496} {"train_loss": -41.636653900146484, "global_step": 181029, "epoch": 1496} {"train_loss": -42.47064971923828, "global_step": 181030, "epoch": 1496} {"train_loss": -42.42783737182617, "global_step": 181031, "epoch": 1496} {"train_loss": -42.07377243041992, "global_step": 181032, "epoch": 1496} {"train_loss": -42.13637161254883, "global_step": 181033, "epoch": 1496} {"train_loss": -42.32745361328125, "global_step": 181034, "epoch": 1496} {"train_loss": -40.82877731323242, "global_step": 181035, "epoch": 1496} {"train_loss": -40.751808166503906, "global_step": 181036, "epoch": 1496} {"train_loss": -40.52540588378906, "global_step": 181037, "epoch": 1496} {"train_loss": -40.1224479675293, "global_step": 181038, "epoch": 1496} {"train_loss": -41.60689163208008, "global_step": 181039, "epoch": 1496} {"train_loss": -41.55490493774414, "global_step": 181040, "epoch": 1496} {"train_loss": -41.586666107177734, "global_step": 181041, "epoch": 1496} {"train_loss": -41.17665481567383, "global_step": 181042, "epoch": 1496} {"train_loss": -41.30292892456055, "global_step": 181043, "epoch": 1496} {"train_loss": -41.97727584838867, "global_step": 181044, "epoch": 1496} {"train_loss": -38.27363967895508, "global_step": 181045, "epoch": 1496} {"train_loss": -40.83743667602539, "global_step": 181046, "epoch": 1496} {"train_loss": -41.56248474121094, "global_step": 181047, "epoch": 1496} {"train_loss": -38.97561264038086, "global_step": 181048, "epoch": 1496} {"train_loss": -42.0074462890625, "global_step": 181049, "epoch": 1496} {"train_loss": -39.505035400390625, "global_step": 181050, "epoch": 1496} {"train_loss": -38.95651626586914, "global_step": 181051, "epoch": 1496} {"train_loss": -41.800472259521484, "global_step": 181052, "epoch": 1496} {"train_loss": -39.54774475097656, "global_step": 181053, "epoch": 1496} {"train_loss": -36.74987030029297, "global_step": 181054, "epoch": 1496} {"train_loss": -41.12052917480469, "global_step": 181055, "epoch": 1496} {"train_loss": -39.50033187866211, "global_step": 181056, "epoch": 1496} {"train_loss": -39.41938400268555, "global_step": 181057, "epoch": 1496} {"train_loss": -40.5886344909668, "global_step": 181058, "epoch": 1496} {"train_loss": -39.862457275390625, "global_step": 181059, "epoch": 1496} {"train_loss": -39.95425033569336, "global_step": 181060, "epoch": 1496} {"train_loss": -40.3186149597168, "global_step": 181061, "epoch": 1496} {"train_loss": -40.98948287963867, "global_step": 181062, "epoch": 1496} {"train_loss": -40.4527702331543, "global_step": 181063, "epoch": 1496} {"train_loss": -41.187129974365234, "global_step": 181064, "epoch": 1496} {"train_loss": -39.74018478393555, "global_step": 181065, "epoch": 1496} {"train_loss": -40.1366081237793, "global_step": 181066, "epoch": 1496} {"train_loss": -41.37415313720703, "global_step": 181067, "epoch": 1496} {"train_loss": -41.20499801635742, "global_step": 181068, "epoch": 1496} {"train_loss": -40.62518310546875, "global_step": 181069, "epoch": 1496} {"train_loss": -41.8910026550293, "global_step": 181070, "epoch": 1496} {"train_loss": -40.05598068237305, "global_step": 181071, "epoch": 1496} {"train_loss": -41.40966796875, "global_step": 181072, "epoch": 1496} {"train_loss": -41.566673278808594, "global_step": 181073, "epoch": 1496} {"train_loss": -41.85453414916992, "global_step": 181074, "epoch": 1496} {"train_loss": -41.15169906616211, "global_step": 181075, "epoch": 1496} {"train_loss": -41.40642166137695, "global_step": 181076, "epoch": 1496} {"train_loss": -41.62073516845703, "global_step": 181077, "epoch": 1496} {"train_loss": -41.42477035522461, "global_step": 181078, "epoch": 1496} {"train_loss": -42.35469055175781, "global_step": 181079, "epoch": 1496} {"train_loss": -41.61164093017578, "global_step": 181080, "epoch": 1496} {"train_loss": -41.65044021606445, "global_step": 181081, "epoch": 1496} {"train_loss": -42.0588264465332, "global_step": 181082, "epoch": 1496} {"train_loss": -41.38665771484375, "global_step": 181083, "epoch": 1496} {"train_loss": -40.96403121948242, "global_step": 181084, "epoch": 1496} {"train_loss": -42.0912971496582, "global_step": 181085, "epoch": 1496} {"train_loss": -41.515872955322266, "global_step": 181086, "epoch": 1496} {"train_loss": -41.25288772583008, "global_step": 181087, "epoch": 1496} {"train_loss": -40.544281005859375, "global_step": 181088, "epoch": 1496} {"train_loss": -41.98861312866211, "global_step": 181089, "epoch": 1496} {"train_loss": -41.34553146362305, "global_step": 181090, "epoch": 1496} {"train_loss": -41.94304275512695, "global_step": 181091, "epoch": 1496} {"train_loss": -42.4813232421875, "global_step": 181092, "epoch": 1496} {"train_loss": -42.15659713745117, "global_step": 181093, "epoch": 1496} {"train_loss": -42.41884994506836, "global_step": 181094, "epoch": 1496} {"train_loss": -41.91162872314453, "global_step": 181095, "epoch": 1496} {"train_loss": -41.67877960205078, "global_step": 181096, "epoch": 1496} {"train_loss": -41.70316696166992, "global_step": 181097, "epoch": 1496} {"train_loss": -41.81214904785156, "global_step": 181098, "epoch": 1496} {"train_loss": -42.04816818237305, "global_step": 181099, "epoch": 1496} {"train_loss": -41.939910888671875, "global_step": 181100, "epoch": 1496} {"train_loss": -42.499122619628906, "global_step": 181101, "epoch": 1496} {"train_loss": -42.37764358520508, "global_step": 181102, "epoch": 1496} {"train_loss": -41.397377014160156, "global_step": 181103, "epoch": 1496} {"train_loss": -42.25020980834961, "global_step": 181104, "epoch": 1496} {"train_loss": -41.89051055908203, "global_step": 181105, "epoch": 1496} {"train_loss": -42.49573516845703, "global_step": 181106, "epoch": 1496} {"train_loss": -42.14154052734375, "global_step": 181107, "epoch": 1496} {"train_loss": -42.36162185668945, "global_step": 181108, "epoch": 1496} {"train_loss": -42.3322868347168, "global_step": 181109, "epoch": 1496} {"train_loss": -42.13432693481445, "global_step": 181110, "epoch": 1496} {"train_loss": -42.10602951049805, "global_step": 181111, "epoch": 1496} {"train_loss": -41.91407012939453, "global_step": 181112, "epoch": 1496} {"train_loss": -41.980655670166016, "global_step": 181113, "epoch": 1496} {"train_loss": -40.9709358215332, "global_step": 181114, "epoch": 1496} {"train_loss": -41.59666442871094, "global_step": 181115, "epoch": 1496} {"train_loss": -41.87289047241211, "global_step": 181116, "epoch": 1496} {"train_loss": -41.13639450073242, "global_step": 181117, "epoch": 1496} {"train_loss": -42.17673873901367, "global_step": 181118, "epoch": 1496} {"train_loss": -42.1614990234375, "global_step": 181119, "epoch": 1496} {"train_loss": -41.36568832397461, "global_step": 181120, "epoch": 1496} {"train_loss": -42.37897491455078, "global_step": 181121, "epoch": 1496} {"train_loss": -42.21857833862305, "global_step": 181122, "epoch": 1496} {"train_loss": -41.00492858886719, "global_step": 181123, "epoch": 1496} {"train_loss": -40.055057525634766, "global_step": 181124, "epoch": 1496} {"train_loss": -41.87009048461914, "global_step": 181125, "epoch": 1496} {"train_loss": -39.31527328491211, "global_step": 181126, "epoch": 1496} {"train_loss": -41.300636291503906, "global_step": 181127, "epoch": 1496} {"train_loss": -41.8381462097168, "global_step": 181128, "epoch": 1496} {"train_loss": -40.3194580078125, "global_step": 181129, "epoch": 1496} {"train_loss": -41.556068420410156, "global_step": 181130, "epoch": 1496} {"train_loss": -42.22052001953125, "global_step": 181131, "epoch": 1496} {"train_loss": -41.63942337036133, "global_step": 181132, "epoch": 1496} {"train_loss": -42.19859313964844, "global_step": 181133, "epoch": 1496} {"train_loss": -41.45056915283203, "global_step": 181134, "epoch": 1496} {"train_loss": -41.609222412109375, "global_step": 181135, "epoch": 1496} {"train_loss": -41.419714431132164, "global_step": 181136, "epoch": 1496, "val_loss": 2744505.75} {"train_loss": -42.42713928222656, "global_step": 181137, "epoch": 1497} {"train_loss": -41.49064636230469, "global_step": 181138, "epoch": 1497} {"train_loss": -40.972957611083984, "global_step": 181139, "epoch": 1497} {"train_loss": -41.6705322265625, "global_step": 181140, "epoch": 1497} {"train_loss": -42.17637252807617, "global_step": 181141, "epoch": 1497} {"train_loss": -41.7407112121582, "global_step": 181142, "epoch": 1497} {"train_loss": -41.89165115356445, "global_step": 181143, "epoch": 1497} {"train_loss": -42.0944938659668, "global_step": 181144, "epoch": 1497} {"train_loss": -42.375892639160156, "global_step": 181145, "epoch": 1497} {"train_loss": -41.97665023803711, "global_step": 181146, "epoch": 1497} {"train_loss": -42.27705001831055, "global_step": 181147, "epoch": 1497} {"train_loss": -42.522010803222656, "global_step": 181148, "epoch": 1497} {"train_loss": -41.563507080078125, "global_step": 181149, "epoch": 1497} {"train_loss": -42.19565963745117, "global_step": 181150, "epoch": 1497} {"train_loss": -41.6379508972168, "global_step": 181151, "epoch": 1497} {"train_loss": -41.853878021240234, "global_step": 181152, "epoch": 1497} {"train_loss": -42.27154541015625, "global_step": 181153, "epoch": 1497} {"train_loss": -41.739410400390625, "global_step": 181154, "epoch": 1497} {"train_loss": -41.78419494628906, "global_step": 181155, "epoch": 1497} {"train_loss": -41.807899475097656, "global_step": 181156, "epoch": 1497} {"train_loss": -41.476844787597656, "global_step": 181157, "epoch": 1497} {"train_loss": -40.416378021240234, "global_step": 181158, "epoch": 1497} {"train_loss": -41.89882278442383, "global_step": 181159, "epoch": 1497} {"train_loss": -41.01776885986328, "global_step": 181160, "epoch": 1497} {"train_loss": -39.68473815917969, "global_step": 181161, "epoch": 1497} {"train_loss": -42.26544189453125, "global_step": 181162, "epoch": 1497} {"train_loss": -41.77190017700195, "global_step": 181163, "epoch": 1497} {"train_loss": -40.43394470214844, "global_step": 181164, "epoch": 1497} {"train_loss": -40.00790786743164, "global_step": 181165, "epoch": 1497} {"train_loss": -40.94856643676758, "global_step": 181166, "epoch": 1497} {"train_loss": -41.78594970703125, "global_step": 181167, "epoch": 1497} {"train_loss": -42.1309700012207, "global_step": 181168, "epoch": 1497} {"train_loss": -40.97951126098633, "global_step": 181169, "epoch": 1497} {"train_loss": -39.65375900268555, "global_step": 181170, "epoch": 1497} {"train_loss": -40.97991943359375, "global_step": 181171, "epoch": 1497} {"train_loss": -39.845455169677734, "global_step": 181172, "epoch": 1497} {"train_loss": -40.53913116455078, "global_step": 181173, "epoch": 1497} {"train_loss": -40.72233581542969, "global_step": 181174, "epoch": 1497} {"train_loss": -40.52998733520508, "global_step": 181175, "epoch": 1497} {"train_loss": -41.72267150878906, "global_step": 181176, "epoch": 1497} {"train_loss": -41.213985443115234, "global_step": 181177, "epoch": 1497} {"train_loss": -41.1679801940918, "global_step": 181178, "epoch": 1497} {"train_loss": -40.58012390136719, "global_step": 181179, "epoch": 1497} {"train_loss": -40.92578887939453, "global_step": 181180, "epoch": 1497} {"train_loss": -40.53024673461914, "global_step": 181181, "epoch": 1497} {"train_loss": -40.53553009033203, "global_step": 181182, "epoch": 1497} {"train_loss": -40.51162338256836, "global_step": 181183, "epoch": 1497} {"train_loss": -40.20622634887695, "global_step": 181184, "epoch": 1497} {"train_loss": -40.69105911254883, "global_step": 181185, "epoch": 1497} {"train_loss": -41.401092529296875, "global_step": 181186, "epoch": 1497} {"train_loss": -40.72542953491211, "global_step": 181187, "epoch": 1497} {"train_loss": -40.97389602661133, "global_step": 181188, "epoch": 1497} {"train_loss": -40.37910842895508, "global_step": 181189, "epoch": 1497} {"train_loss": -41.01638412475586, "global_step": 181190, "epoch": 1497} {"train_loss": -41.10516357421875, "global_step": 181191, "epoch": 1497} {"train_loss": -40.76866149902344, "global_step": 181192, "epoch": 1497} {"train_loss": -41.27716064453125, "global_step": 181193, "epoch": 1497} {"train_loss": -39.73624801635742, "global_step": 181194, "epoch": 1497} {"train_loss": -41.2817268371582, "global_step": 181195, "epoch": 1497} {"train_loss": -41.668128967285156, "global_step": 181196, "epoch": 1497} {"train_loss": -40.32011795043945, "global_step": 181197, "epoch": 1497} {"train_loss": -41.890907287597656, "global_step": 181198, "epoch": 1497} {"train_loss": -41.57760238647461, "global_step": 181199, "epoch": 1497} {"train_loss": -41.610347747802734, "global_step": 181200, "epoch": 1497} {"train_loss": -41.8654899597168, "global_step": 181201, "epoch": 1497} {"train_loss": -41.335296630859375, "global_step": 181202, "epoch": 1497} {"train_loss": -41.485321044921875, "global_step": 181203, "epoch": 1497} {"train_loss": -41.659664154052734, "global_step": 181204, "epoch": 1497} {"train_loss": -41.25075149536133, "global_step": 181205, "epoch": 1497} {"train_loss": -41.69239044189453, "global_step": 181206, "epoch": 1497} {"train_loss": -41.74388885498047, "global_step": 181207, "epoch": 1497} {"train_loss": -42.016510009765625, "global_step": 181208, "epoch": 1497} {"train_loss": -42.14280319213867, "global_step": 181209, "epoch": 1497} {"train_loss": -41.9835319519043, "global_step": 181210, "epoch": 1497} {"train_loss": -41.901695251464844, "global_step": 181211, "epoch": 1497} {"train_loss": -42.17255783081055, "global_step": 181212, "epoch": 1497} {"train_loss": -42.23310089111328, "global_step": 181213, "epoch": 1497} {"train_loss": -42.32101058959961, "global_step": 181214, "epoch": 1497} {"train_loss": -36.82387924194336, "global_step": 181215, "epoch": 1497} {"train_loss": -41.400543212890625, "global_step": 181216, "epoch": 1497} {"train_loss": -41.46790313720703, "global_step": 181217, "epoch": 1497} {"train_loss": -42.22709655761719, "global_step": 181218, "epoch": 1497} {"train_loss": -40.891357421875, "global_step": 181219, "epoch": 1497} {"train_loss": -41.12199020385742, "global_step": 181220, "epoch": 1497} {"train_loss": -40.82381057739258, "global_step": 181221, "epoch": 1497} {"train_loss": -41.534523010253906, "global_step": 181222, "epoch": 1497} {"train_loss": -39.67154312133789, "global_step": 181223, "epoch": 1497} {"train_loss": -40.81746292114258, "global_step": 181224, "epoch": 1497} {"train_loss": -40.4177360534668, "global_step": 181225, "epoch": 1497} {"train_loss": -41.23230743408203, "global_step": 181226, "epoch": 1497} {"train_loss": -40.84670639038086, "global_step": 181227, "epoch": 1497} {"train_loss": -39.630645751953125, "global_step": 181228, "epoch": 1497} {"train_loss": -41.274017333984375, "global_step": 181229, "epoch": 1497} {"train_loss": -38.061744689941406, "global_step": 181230, "epoch": 1497} {"train_loss": -38.03594207763672, "global_step": 181231, "epoch": 1497} {"train_loss": -39.567073822021484, "global_step": 181232, "epoch": 1497} {"train_loss": -30.689611434936523, "global_step": 181233, "epoch": 1497} {"train_loss": -39.443565368652344, "global_step": 181234, "epoch": 1497} {"train_loss": -40.4720458984375, "global_step": 181235, "epoch": 1497} {"train_loss": -39.728084564208984, "global_step": 181236, "epoch": 1497} {"train_loss": -40.49019241333008, "global_step": 181237, "epoch": 1497} {"train_loss": -40.971229553222656, "global_step": 181238, "epoch": 1497} {"train_loss": -39.19389724731445, "global_step": 181239, "epoch": 1497} {"train_loss": -40.28886795043945, "global_step": 181240, "epoch": 1497} {"train_loss": -40.458160400390625, "global_step": 181241, "epoch": 1497} {"train_loss": -40.31356430053711, "global_step": 181242, "epoch": 1497} {"train_loss": -40.788509368896484, "global_step": 181243, "epoch": 1497} {"train_loss": -39.24723434448242, "global_step": 181244, "epoch": 1497} {"train_loss": -40.71182632446289, "global_step": 181245, "epoch": 1497} {"train_loss": -40.37105941772461, "global_step": 181246, "epoch": 1497} {"train_loss": -39.94939422607422, "global_step": 181247, "epoch": 1497} {"train_loss": -38.97877502441406, "global_step": 181248, "epoch": 1497} {"train_loss": -41.37312698364258, "global_step": 181249, "epoch": 1497} {"train_loss": -40.3499641418457, "global_step": 181250, "epoch": 1497} {"train_loss": -41.04499053955078, "global_step": 181251, "epoch": 1497} {"train_loss": -40.49525833129883, "global_step": 181252, "epoch": 1497} {"train_loss": -35.54215621948242, "global_step": 181253, "epoch": 1497} {"train_loss": -41.31084060668945, "global_step": 181254, "epoch": 1497} {"train_loss": -41.49958038330078, "global_step": 181255, "epoch": 1497} {"train_loss": -39.71113967895508, "global_step": 181256, "epoch": 1497} {"train_loss": -40.86603919730699, "global_step": 181257, "epoch": 1497, "val_loss": 2782436.25} {"train_loss": -41.66025924682617, "global_step": 181258, "epoch": 1498} {"train_loss": -40.650997161865234, "global_step": 181259, "epoch": 1498} {"train_loss": -41.117794036865234, "global_step": 181260, "epoch": 1498} {"train_loss": -41.321441650390625, "global_step": 181261, "epoch": 1498} {"train_loss": -41.48018264770508, "global_step": 181262, "epoch": 1498} {"train_loss": -41.533714294433594, "global_step": 181263, "epoch": 1498} {"train_loss": -40.6478385925293, "global_step": 181264, "epoch": 1498} {"train_loss": -37.533485412597656, "global_step": 181265, "epoch": 1498} {"train_loss": -39.7965202331543, "global_step": 181266, "epoch": 1498} {"train_loss": -40.7878532409668, "global_step": 181267, "epoch": 1498} {"train_loss": -40.776214599609375, "global_step": 181268, "epoch": 1498} {"train_loss": -41.433467864990234, "global_step": 181269, "epoch": 1498} {"train_loss": -41.29704284667969, "global_step": 181270, "epoch": 1498} {"train_loss": -41.69818115234375, "global_step": 181271, "epoch": 1498} {"train_loss": -40.16987991333008, "global_step": 181272, "epoch": 1498} {"train_loss": -41.209861755371094, "global_step": 181273, "epoch": 1498} {"train_loss": -40.955543518066406, "global_step": 181274, "epoch": 1498} {"train_loss": -40.858856201171875, "global_step": 181275, "epoch": 1498} {"train_loss": -41.72704315185547, "global_step": 181276, "epoch": 1498} {"train_loss": -41.30286407470703, "global_step": 181277, "epoch": 1498} {"train_loss": -40.90217971801758, "global_step": 181278, "epoch": 1498} {"train_loss": -41.22850799560547, "global_step": 181279, "epoch": 1498} {"train_loss": -40.814632415771484, "global_step": 181280, "epoch": 1498} {"train_loss": -41.28718948364258, "global_step": 181281, "epoch": 1498} {"train_loss": -41.66561508178711, "global_step": 181282, "epoch": 1498} {"train_loss": -42.068756103515625, "global_step": 181283, "epoch": 1498} {"train_loss": -40.79446792602539, "global_step": 181284, "epoch": 1498} {"train_loss": -42.17789840698242, "global_step": 181285, "epoch": 1498} {"train_loss": -41.69544982910156, "global_step": 181286, "epoch": 1498} {"train_loss": -41.328426361083984, "global_step": 181287, "epoch": 1498} {"train_loss": -42.31406784057617, "global_step": 181288, "epoch": 1498} {"train_loss": -42.14896011352539, "global_step": 181289, "epoch": 1498} {"train_loss": -41.69000244140625, "global_step": 181290, "epoch": 1498} {"train_loss": -41.88412857055664, "global_step": 181291, "epoch": 1498} {"train_loss": -40.0395622253418, "global_step": 181292, "epoch": 1498} {"train_loss": -41.58002471923828, "global_step": 181293, "epoch": 1498} {"train_loss": -40.278743743896484, "global_step": 181294, "epoch": 1498} {"train_loss": -41.47201156616211, "global_step": 181295, "epoch": 1498} {"train_loss": -34.65805435180664, "global_step": 181296, "epoch": 1498} {"train_loss": -41.3553581237793, "global_step": 181297, "epoch": 1498} {"train_loss": -40.81681442260742, "global_step": 181298, "epoch": 1498} {"train_loss": -38.370880126953125, "global_step": 181299, "epoch": 1498} {"train_loss": -35.98025131225586, "global_step": 181300, "epoch": 1498} {"train_loss": -36.96639633178711, "global_step": 181301, "epoch": 1498} {"train_loss": -41.42866134643555, "global_step": 181302, "epoch": 1498} {"train_loss": -39.22074508666992, "global_step": 181303, "epoch": 1498} {"train_loss": -40.000484466552734, "global_step": 181304, "epoch": 1498} {"train_loss": -40.53127670288086, "global_step": 181305, "epoch": 1498} {"train_loss": -39.88225555419922, "global_step": 181306, "epoch": 1498} {"train_loss": -36.53181838989258, "global_step": 181307, "epoch": 1498} {"train_loss": -40.693756103515625, "global_step": 181308, "epoch": 1498} {"train_loss": -39.72290802001953, "global_step": 181309, "epoch": 1498} {"train_loss": -41.130149841308594, "global_step": 181310, "epoch": 1498} {"train_loss": -39.61152267456055, "global_step": 181311, "epoch": 1498} {"train_loss": -41.451454162597656, "global_step": 181312, "epoch": 1498} {"train_loss": -41.4509162902832, "global_step": 181313, "epoch": 1498} {"train_loss": -40.61261749267578, "global_step": 181314, "epoch": 1498} {"train_loss": -41.86166000366211, "global_step": 181315, "epoch": 1498} {"train_loss": -39.08094024658203, "global_step": 181316, "epoch": 1498} {"train_loss": -40.4676513671875, "global_step": 181317, "epoch": 1498} {"train_loss": -39.97003936767578, "global_step": 181318, "epoch": 1498} {"train_loss": -41.713802337646484, "global_step": 181319, "epoch": 1498} {"train_loss": -40.853946685791016, "global_step": 181320, "epoch": 1498} {"train_loss": -41.47368621826172, "global_step": 181321, "epoch": 1498} {"train_loss": -41.53498458862305, "global_step": 181322, "epoch": 1498} {"train_loss": -41.67501449584961, "global_step": 181323, "epoch": 1498} {"train_loss": -39.56666564941406, "global_step": 181324, "epoch": 1498} {"train_loss": -40.91300964355469, "global_step": 181325, "epoch": 1498} {"train_loss": -41.24916076660156, "global_step": 181326, "epoch": 1498} {"train_loss": -41.59810256958008, "global_step": 181327, "epoch": 1498} {"train_loss": -40.66499710083008, "global_step": 181328, "epoch": 1498} {"train_loss": -41.348297119140625, "global_step": 181329, "epoch": 1498} {"train_loss": -40.941707611083984, "global_step": 181330, "epoch": 1498} {"train_loss": -41.96401596069336, "global_step": 181331, "epoch": 1498} {"train_loss": -40.41828918457031, "global_step": 181332, "epoch": 1498} {"train_loss": -40.11777114868164, "global_step": 181333, "epoch": 1498} {"train_loss": -40.80123519897461, "global_step": 181334, "epoch": 1498} {"train_loss": -40.35103225708008, "global_step": 181335, "epoch": 1498} {"train_loss": -40.29705047607422, "global_step": 181336, "epoch": 1498} {"train_loss": -39.072444915771484, "global_step": 181337, "epoch": 1498} {"train_loss": -40.9924430847168, "global_step": 181338, "epoch": 1498} {"train_loss": -40.91426086425781, "global_step": 181339, "epoch": 1498} {"train_loss": -38.692359924316406, "global_step": 181340, "epoch": 1498} {"train_loss": -37.220924377441406, "global_step": 181341, "epoch": 1498} {"train_loss": -40.717498779296875, "global_step": 181342, "epoch": 1498} {"train_loss": -37.16024398803711, "global_step": 181343, "epoch": 1498} {"train_loss": -37.50221252441406, "global_step": 181344, "epoch": 1498} {"train_loss": -40.058040618896484, "global_step": 181345, "epoch": 1498} {"train_loss": -36.558998107910156, "global_step": 181346, "epoch": 1498} {"train_loss": -40.21809005737305, "global_step": 181347, "epoch": 1498} {"train_loss": -35.741119384765625, "global_step": 181348, "epoch": 1498} {"train_loss": -38.58722686767578, "global_step": 181349, "epoch": 1498} {"train_loss": -36.960235595703125, "global_step": 181350, "epoch": 1498} {"train_loss": -37.226287841796875, "global_step": 181351, "epoch": 1498} {"train_loss": -39.17798614501953, "global_step": 181352, "epoch": 1498} {"train_loss": -36.09037780761719, "global_step": 181353, "epoch": 1498} {"train_loss": -36.85578536987305, "global_step": 181354, "epoch": 1498} {"train_loss": -38.722412109375, "global_step": 181355, "epoch": 1498} {"train_loss": -36.978675842285156, "global_step": 181356, "epoch": 1498} {"train_loss": -39.03791427612305, "global_step": 181357, "epoch": 1498} {"train_loss": -37.4043083190918, "global_step": 181358, "epoch": 1498} {"train_loss": -38.55571746826172, "global_step": 181359, "epoch": 1498} {"train_loss": -36.960567474365234, "global_step": 181360, "epoch": 1498} {"train_loss": -37.46686935424805, "global_step": 181361, "epoch": 1498} {"train_loss": -38.03879928588867, "global_step": 181362, "epoch": 1498} {"train_loss": -36.495304107666016, "global_step": 181363, "epoch": 1498} {"train_loss": -36.84153366088867, "global_step": 181364, "epoch": 1498} {"train_loss": -37.743648529052734, "global_step": 181365, "epoch": 1498} {"train_loss": -36.3875732421875, "global_step": 181366, "epoch": 1498} {"train_loss": -38.04745101928711, "global_step": 181367, "epoch": 1498} {"train_loss": -37.55818557739258, "global_step": 181368, "epoch": 1498} {"train_loss": -37.581512451171875, "global_step": 181369, "epoch": 1498} {"train_loss": -40.10030746459961, "global_step": 181370, "epoch": 1498} {"train_loss": -37.3672981262207, "global_step": 181371, "epoch": 1498} {"train_loss": -40.65576934814453, "global_step": 181372, "epoch": 1498} {"train_loss": -38.39622497558594, "global_step": 181373, "epoch": 1498} {"train_loss": -39.06746292114258, "global_step": 181374, "epoch": 1498} {"train_loss": -39.88349533081055, "global_step": 181375, "epoch": 1498} {"train_loss": -39.3071403503418, "global_step": 181376, "epoch": 1498} {"train_loss": -38.99766159057617, "global_step": 181377, "epoch": 1498} {"train_loss": -39.83693578420592, "global_step": 181378, "epoch": 1498, "val_loss": 2594798.75} {"train_loss": -39.05933380126953, "global_step": 181379, "epoch": 1499} {"train_loss": -40.10968780517578, "global_step": 181380, "epoch": 1499} {"train_loss": -40.13387680053711, "global_step": 181381, "epoch": 1499} {"train_loss": -40.2104606628418, "global_step": 181382, "epoch": 1499} {"train_loss": -39.824188232421875, "global_step": 181383, "epoch": 1499} {"train_loss": -40.747005462646484, "global_step": 181384, "epoch": 1499} {"train_loss": -40.87323760986328, "global_step": 181385, "epoch": 1499} {"train_loss": -40.25600814819336, "global_step": 181386, "epoch": 1499} {"train_loss": -40.52494430541992, "global_step": 181387, "epoch": 1499} {"train_loss": -41.006744384765625, "global_step": 181388, "epoch": 1499} {"train_loss": -40.4359130859375, "global_step": 181389, "epoch": 1499} {"train_loss": -41.43391799926758, "global_step": 181390, "epoch": 1499} {"train_loss": -40.793548583984375, "global_step": 181391, "epoch": 1499} {"train_loss": -41.355838775634766, "global_step": 181392, "epoch": 1499} {"train_loss": -41.24312210083008, "global_step": 181393, "epoch": 1499} {"train_loss": -40.81666946411133, "global_step": 181394, "epoch": 1499} {"train_loss": -41.36225509643555, "global_step": 181395, "epoch": 1499} {"train_loss": -41.52619552612305, "global_step": 181396, "epoch": 1499} {"train_loss": -41.19533920288086, "global_step": 181397, "epoch": 1499} {"train_loss": -41.23244094848633, "global_step": 181398, "epoch": 1499} {"train_loss": -41.62302780151367, "global_step": 181399, "epoch": 1499} {"train_loss": -41.993751525878906, "global_step": 181400, "epoch": 1499} {"train_loss": -41.47012710571289, "global_step": 181401, "epoch": 1499} {"train_loss": -41.070369720458984, "global_step": 181402, "epoch": 1499} {"train_loss": -40.899776458740234, "global_step": 181403, "epoch": 1499} {"train_loss": -41.690425872802734, "global_step": 181404, "epoch": 1499} {"train_loss": -42.0570182800293, "global_step": 181405, "epoch": 1499} {"train_loss": -41.786739349365234, "global_step": 181406, "epoch": 1499} {"train_loss": -42.01607131958008, "global_step": 181407, "epoch": 1499} {"train_loss": -41.28165817260742, "global_step": 181408, "epoch": 1499} {"train_loss": -41.73030471801758, "global_step": 181409, "epoch": 1499} {"train_loss": -41.77529525756836, "global_step": 181410, "epoch": 1499} {"train_loss": -42.033817291259766, "global_step": 181411, "epoch": 1499} {"train_loss": -41.9123420715332, "global_step": 181412, "epoch": 1499} {"train_loss": -42.380393981933594, "global_step": 181413, "epoch": 1499} {"train_loss": -41.9871826171875, "global_step": 181414, "epoch": 1499} {"train_loss": -42.2296257019043, "global_step": 181415, "epoch": 1499} {"train_loss": -42.2442626953125, "global_step": 181416, "epoch": 1499} {"train_loss": -41.878028869628906, "global_step": 181417, "epoch": 1499} {"train_loss": -42.21086502075195, "global_step": 181418, "epoch": 1499} {"train_loss": -41.904144287109375, "global_step": 181419, "epoch": 1499} {"train_loss": -42.154537200927734, "global_step": 181420, "epoch": 1499} {"train_loss": -42.56083297729492, "global_step": 181421, "epoch": 1499} {"train_loss": -41.836978912353516, "global_step": 181422, "epoch": 1499} {"train_loss": -42.071651458740234, "global_step": 181423, "epoch": 1499} {"train_loss": -42.614322662353516, "global_step": 181424, "epoch": 1499} {"train_loss": -42.473968505859375, "global_step": 181425, "epoch": 1499} {"train_loss": -41.901153564453125, "global_step": 181426, "epoch": 1499} {"train_loss": -42.06912612915039, "global_step": 181427, "epoch": 1499} {"train_loss": -42.107662200927734, "global_step": 181428, "epoch": 1499} {"train_loss": -42.0234489440918, "global_step": 181429, "epoch": 1499} {"train_loss": -42.29501724243164, "global_step": 181430, "epoch": 1499} {"train_loss": -42.15159606933594, "global_step": 181431, "epoch": 1499} {"train_loss": -41.3339958190918, "global_step": 181432, "epoch": 1499} {"train_loss": -41.74148941040039, "global_step": 181433, "epoch": 1499} {"train_loss": -41.424560546875, "global_step": 181434, "epoch": 1499} {"train_loss": -40.707008361816406, "global_step": 181435, "epoch": 1499} {"train_loss": -41.764373779296875, "global_step": 181436, "epoch": 1499} {"train_loss": -41.028072357177734, "global_step": 181437, "epoch": 1499} {"train_loss": -40.53507995605469, "global_step": 181438, "epoch": 1499} {"train_loss": -38.57880401611328, "global_step": 181439, "epoch": 1499} {"train_loss": -41.90171432495117, "global_step": 181440, "epoch": 1499} {"train_loss": -41.758033752441406, "global_step": 181441, "epoch": 1499} {"train_loss": -40.405208587646484, "global_step": 181442, "epoch": 1499} {"train_loss": -41.89175796508789, "global_step": 181443, "epoch": 1499} {"train_loss": -41.23289108276367, "global_step": 181444, "epoch": 1499} {"train_loss": -41.73944091796875, "global_step": 181445, "epoch": 1499} {"train_loss": -41.688629150390625, "global_step": 181446, "epoch": 1499} {"train_loss": -38.950958251953125, "global_step": 181447, "epoch": 1499} {"train_loss": -40.14860916137695, "global_step": 181448, "epoch": 1499} {"train_loss": -40.95551300048828, "global_step": 181449, "epoch": 1499} {"train_loss": -40.96733856201172, "global_step": 181450, "epoch": 1499} {"train_loss": -40.910926818847656, "global_step": 181451, "epoch": 1499} {"train_loss": -40.40672302246094, "global_step": 181452, "epoch": 1499} {"train_loss": -39.66340255737305, "global_step": 181453, "epoch": 1499} {"train_loss": -39.08110809326172, "global_step": 181454, "epoch": 1499} {"train_loss": -39.984859466552734, "global_step": 181455, "epoch": 1499} {"train_loss": -41.34159469604492, "global_step": 181456, "epoch": 1499} {"train_loss": -40.803245544433594, "global_step": 181457, "epoch": 1499} {"train_loss": -41.06157302856445, "global_step": 181458, "epoch": 1499} {"train_loss": -38.479515075683594, "global_step": 181459, "epoch": 1499} {"train_loss": -38.902732849121094, "global_step": 181460, "epoch": 1499} {"train_loss": -40.926780700683594, "global_step": 181461, "epoch": 1499} {"train_loss": -37.17384719848633, "global_step": 181462, "epoch": 1499} {"train_loss": -38.09698486328125, "global_step": 181463, "epoch": 1499} {"train_loss": -39.13547134399414, "global_step": 181464, "epoch": 1499} {"train_loss": -40.29240798950195, "global_step": 181465, "epoch": 1499} {"train_loss": -38.0444221496582, "global_step": 181466, "epoch": 1499} {"train_loss": -37.441566467285156, "global_step": 181467, "epoch": 1499} {"train_loss": -38.229888916015625, "global_step": 181468, "epoch": 1499} {"train_loss": -39.54928207397461, "global_step": 181469, "epoch": 1499} {"train_loss": -36.71003341674805, "global_step": 181470, "epoch": 1499} {"train_loss": -38.483089447021484, "global_step": 181471, "epoch": 1499} {"train_loss": -39.2607536315918, "global_step": 181472, "epoch": 1499} {"train_loss": -38.08652877807617, "global_step": 181473, "epoch": 1499} {"train_loss": -38.48927688598633, "global_step": 181474, "epoch": 1499} {"train_loss": -39.74249267578125, "global_step": 181475, "epoch": 1499} {"train_loss": -40.55031967163086, "global_step": 181476, "epoch": 1499} {"train_loss": -39.44032287597656, "global_step": 181477, "epoch": 1499} {"train_loss": -41.1264533996582, "global_step": 181478, "epoch": 1499} {"train_loss": -41.35557556152344, "global_step": 181479, "epoch": 1499} {"train_loss": -40.63916015625, "global_step": 181480, "epoch": 1499} {"train_loss": -40.628265380859375, "global_step": 181481, "epoch": 1499} {"train_loss": -40.79384994506836, "global_step": 181482, "epoch": 1499} {"train_loss": -40.12082290649414, "global_step": 181483, "epoch": 1499} {"train_loss": -40.44015884399414, "global_step": 181484, "epoch": 1499} {"train_loss": -39.16023635864258, "global_step": 181485, "epoch": 1499} {"train_loss": -40.525169372558594, "global_step": 181486, "epoch": 1499} {"train_loss": -39.85271453857422, "global_step": 181487, "epoch": 1499} {"train_loss": -41.56246566772461, "global_step": 181488, "epoch": 1499} {"train_loss": -39.732608795166016, "global_step": 181489, "epoch": 1499} {"train_loss": -40.811195373535156, "global_step": 181490, "epoch": 1499} {"train_loss": -41.18596649169922, "global_step": 181491, "epoch": 1499} {"train_loss": -41.10017013549805, "global_step": 181492, "epoch": 1499} {"train_loss": -40.724876403808594, "global_step": 181493, "epoch": 1499} {"train_loss": -40.43897247314453, "global_step": 181494, "epoch": 1499} {"train_loss": -41.412330627441406, "global_step": 181495, "epoch": 1499} {"train_loss": -41.694801330566406, "global_step": 181496, "epoch": 1499} {"train_loss": -41.62449645996094, "global_step": 181497, "epoch": 1499} {"train_loss": -42.00286102294922, "global_step": 181498, "epoch": 1499} {"train_loss": -40.792808122871335, "global_step": 181499, "epoch": 1499, "val_loss": 2705349.25} {"train_loss": -40.58858871459961, "global_step": 181500, "epoch": 1500} {"train_loss": -40.30959701538086, "global_step": 181501, "epoch": 1500} {"train_loss": -41.57670211791992, "global_step": 181502, "epoch": 1500} {"train_loss": -41.424556732177734, "global_step": 181503, "epoch": 1500} {"train_loss": -41.426387786865234, "global_step": 181504, "epoch": 1500} {"train_loss": -39.91569137573242, "global_step": 181505, "epoch": 1500} {"train_loss": -41.85885238647461, "global_step": 181506, "epoch": 1500} {"train_loss": -41.5455436706543, "global_step": 181507, "epoch": 1500} {"train_loss": -41.09442138671875, "global_step": 181508, "epoch": 1500} {"train_loss": -42.11544418334961, "global_step": 181509, "epoch": 1500} {"train_loss": -42.382972717285156, "global_step": 181510, "epoch": 1500} {"train_loss": -41.52062225341797, "global_step": 181511, "epoch": 1500} {"train_loss": -41.692665100097656, "global_step": 181512, "epoch": 1500} {"train_loss": -41.847564697265625, "global_step": 181513, "epoch": 1500} {"train_loss": -42.013912200927734, "global_step": 181514, "epoch": 1500} {"train_loss": -40.85264205932617, "global_step": 181515, "epoch": 1500} {"train_loss": -41.35197830200195, "global_step": 181516, "epoch": 1500} {"train_loss": -42.393436431884766, "global_step": 181517, "epoch": 1500} {"train_loss": -40.987056732177734, "global_step": 181518, "epoch": 1500} {"train_loss": -42.31122970581055, "global_step": 181519, "epoch": 1500} {"train_loss": -42.1297492980957, "global_step": 181520, "epoch": 1500} {"train_loss": -41.69411087036133, "global_step": 181521, "epoch": 1500} {"train_loss": -41.77241134643555, "global_step": 181522, "epoch": 1500} {"train_loss": -42.09901809692383, "global_step": 181523, "epoch": 1500} {"train_loss": -41.79986572265625, "global_step": 181524, "epoch": 1500} {"train_loss": -42.0904655456543, "global_step": 181525, "epoch": 1500} {"train_loss": -42.083412170410156, "global_step": 181526, "epoch": 1500} {"train_loss": -42.5201530456543, "global_step": 181527, "epoch": 1500} {"train_loss": -41.89583206176758, "global_step": 181528, "epoch": 1500} {"train_loss": -42.167274475097656, "global_step": 181529, "epoch": 1500} {"train_loss": -42.184879302978516, "global_step": 181530, "epoch": 1500} {"train_loss": -42.492488861083984, "global_step": 181531, "epoch": 1500} {"train_loss": -42.215206146240234, "global_step": 181532, "epoch": 1500} {"train_loss": -41.581214904785156, "global_step": 181533, "epoch": 1500} {"train_loss": -40.507110595703125, "global_step": 181534, "epoch": 1500} {"train_loss": -39.78253173828125, "global_step": 181535, "epoch": 1500} {"train_loss": -42.653778076171875, "global_step": 181536, "epoch": 1500} {"train_loss": -40.22498321533203, "global_step": 181537, "epoch": 1500} {"train_loss": -40.236061096191406, "global_step": 181538, "epoch": 1500} {"train_loss": -42.157623291015625, "global_step": 181539, "epoch": 1500} {"train_loss": -41.55189514160156, "global_step": 181540, "epoch": 1500} {"train_loss": -40.14742660522461, "global_step": 181541, "epoch": 1500} {"train_loss": -42.10480880737305, "global_step": 181542, "epoch": 1500} {"train_loss": -37.635799407958984, "global_step": 181543, "epoch": 1500} {"train_loss": -41.796958923339844, "global_step": 181544, "epoch": 1500} {"train_loss": -39.87057876586914, "global_step": 181545, "epoch": 1500} {"train_loss": -39.651634216308594, "global_step": 181546, "epoch": 1500} {"train_loss": -40.46146774291992, "global_step": 181547, "epoch": 1500} {"train_loss": -34.85578536987305, "global_step": 181548, "epoch": 1500} {"train_loss": -39.93795394897461, "global_step": 181549, "epoch": 1500} {"train_loss": -38.79609298706055, "global_step": 181550, "epoch": 1500} {"train_loss": -39.02817916870117, "global_step": 181551, "epoch": 1500} {"train_loss": -40.9534912109375, "global_step": 181552, "epoch": 1500} {"train_loss": -38.814231872558594, "global_step": 181553, "epoch": 1500} {"train_loss": -41.076515197753906, "global_step": 181554, "epoch": 1500} {"train_loss": -39.99882888793945, "global_step": 181555, "epoch": 1500} {"train_loss": -41.04124069213867, "global_step": 181556, "epoch": 1500} {"train_loss": -40.61653518676758, "global_step": 181557, "epoch": 1500} {"train_loss": -41.24428176879883, "global_step": 181558, "epoch": 1500} {"train_loss": -40.813270568847656, "global_step": 181559, "epoch": 1500} {"train_loss": -41.87457275390625, "global_step": 181560, "epoch": 1500} {"train_loss": -41.24263381958008, "global_step": 181561, "epoch": 1500} {"train_loss": -41.43531799316406, "global_step": 181562, "epoch": 1500} {"train_loss": -40.602169036865234, "global_step": 181563, "epoch": 1500} {"train_loss": -41.95156478881836, "global_step": 181564, "epoch": 1500} {"train_loss": -40.53205490112305, "global_step": 181565, "epoch": 1500} {"train_loss": -41.706172943115234, "global_step": 181566, "epoch": 1500} {"train_loss": -40.60551071166992, "global_step": 181567, "epoch": 1500} {"train_loss": -41.52433395385742, "global_step": 181568, "epoch": 1500} {"train_loss": -40.829795837402344, "global_step": 181569, "epoch": 1500} {"train_loss": -41.32398223876953, "global_step": 181570, "epoch": 1500} {"train_loss": -40.58665084838867, "global_step": 181571, "epoch": 1500} {"train_loss": -41.554290771484375, "global_step": 181572, "epoch": 1500} {"train_loss": -41.3809700012207, "global_step": 181573, "epoch": 1500} {"train_loss": -41.169673919677734, "global_step": 181574, "epoch": 1500} {"train_loss": -41.887367248535156, "global_step": 181575, "epoch": 1500} {"train_loss": -40.849945068359375, "global_step": 181576, "epoch": 1500} {"train_loss": -41.529449462890625, "global_step": 181577, "epoch": 1500} {"train_loss": -40.97998046875, "global_step": 181578, "epoch": 1500} {"train_loss": -41.217628479003906, "global_step": 181579, "epoch": 1500} {"train_loss": -41.556495666503906, "global_step": 181580, "epoch": 1500} {"train_loss": -41.867794036865234, "global_step": 181581, "epoch": 1500} {"train_loss": -40.2607421875, "global_step": 181582, "epoch": 1500} {"train_loss": -40.07648849487305, "global_step": 181583, "epoch": 1500} {"train_loss": -42.16596603393555, "global_step": 181584, "epoch": 1500} {"train_loss": -39.77006912231445, "global_step": 181585, "epoch": 1500} {"train_loss": -40.93862533569336, "global_step": 181586, "epoch": 1500} {"train_loss": -41.390647888183594, "global_step": 181587, "epoch": 1500} {"train_loss": -41.15949630737305, "global_step": 181588, "epoch": 1500} {"train_loss": -40.65255355834961, "global_step": 181589, "epoch": 1500} {"train_loss": -41.34137725830078, "global_step": 181590, "epoch": 1500} {"train_loss": -41.81563949584961, "global_step": 181591, "epoch": 1500} {"train_loss": -41.34699630737305, "global_step": 181592, "epoch": 1500} {"train_loss": -41.2276496887207, "global_step": 181593, "epoch": 1500} {"train_loss": -41.96027374267578, "global_step": 181594, "epoch": 1500} {"train_loss": -41.57920455932617, "global_step": 181595, "epoch": 1500} {"train_loss": -40.91473388671875, "global_step": 181596, "epoch": 1500} {"train_loss": -41.46294021606445, "global_step": 181597, "epoch": 1500} {"train_loss": -41.967403411865234, "global_step": 181598, "epoch": 1500} {"train_loss": -42.422508239746094, "global_step": 181599, "epoch": 1500} {"train_loss": -41.1756477355957, "global_step": 181600, "epoch": 1500} {"train_loss": -41.80551528930664, "global_step": 181601, "epoch": 1500} {"train_loss": -41.85337448120117, "global_step": 181602, "epoch": 1500} {"train_loss": -41.38128662109375, "global_step": 181603, "epoch": 1500} {"train_loss": -41.50131607055664, "global_step": 181604, "epoch": 1500} {"train_loss": -41.238365173339844, "global_step": 181605, "epoch": 1500} {"train_loss": -42.08096694946289, "global_step": 181606, "epoch": 1500} {"train_loss": -41.455657958984375, "global_step": 181607, "epoch": 1500} {"train_loss": -41.19419479370117, "global_step": 181608, "epoch": 1500} {"train_loss": -41.253658294677734, "global_step": 181609, "epoch": 1500} {"train_loss": -41.62800216674805, "global_step": 181610, "epoch": 1500} {"train_loss": -42.41910934448242, "global_step": 181611, "epoch": 1500} {"train_loss": -41.774696350097656, "global_step": 181612, "epoch": 1500} {"train_loss": -41.5432014465332, "global_step": 181613, "epoch": 1500} {"train_loss": -40.82383728027344, "global_step": 181614, "epoch": 1500} {"train_loss": -42.2769889831543, "global_step": 181615, "epoch": 1500} {"train_loss": -42.43967819213867, "global_step": 181616, "epoch": 1500} {"train_loss": -41.74192428588867, "global_step": 181617, "epoch": 1500} {"train_loss": -42.1241569519043, "global_step": 181618, "epoch": 1500} {"train_loss": -42.20020294189453, "global_step": 181619, "epoch": 1500} {"train_loss": -41.24360726096413, "global_step": 181620, "epoch": 1500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2668589.25} {"train_loss": -42.85376739501953, "global_step": 181621, "epoch": 1501} {"train_loss": -42.34663009643555, "global_step": 181622, "epoch": 1501} {"train_loss": -42.50556182861328, "global_step": 181623, "epoch": 1501} {"train_loss": -42.66133117675781, "global_step": 181624, "epoch": 1501} {"train_loss": -42.31728744506836, "global_step": 181625, "epoch": 1501} {"train_loss": -42.6053466796875, "global_step": 181626, "epoch": 1501} {"train_loss": -42.063323974609375, "global_step": 181627, "epoch": 1501} {"train_loss": -42.66682052612305, "global_step": 181628, "epoch": 1501} {"train_loss": -42.220008850097656, "global_step": 181629, "epoch": 1501} {"train_loss": -41.036842346191406, "global_step": 181630, "epoch": 1501} {"train_loss": -41.04340362548828, "global_step": 181631, "epoch": 1501} {"train_loss": -42.542415618896484, "global_step": 181632, "epoch": 1501} {"train_loss": -39.80746078491211, "global_step": 181633, "epoch": 1501} {"train_loss": -42.069183349609375, "global_step": 181634, "epoch": 1501} {"train_loss": -39.62192916870117, "global_step": 181635, "epoch": 1501} {"train_loss": -41.7019157409668, "global_step": 181636, "epoch": 1501} {"train_loss": -41.305538177490234, "global_step": 181637, "epoch": 1501} {"train_loss": -41.33515930175781, "global_step": 181638, "epoch": 1501} {"train_loss": -41.866573333740234, "global_step": 181639, "epoch": 1501} {"train_loss": -41.770538330078125, "global_step": 181640, "epoch": 1501} {"train_loss": -41.65621566772461, "global_step": 181641, "epoch": 1501} {"train_loss": -42.141380310058594, "global_step": 181642, "epoch": 1501} {"train_loss": -41.080013275146484, "global_step": 181643, "epoch": 1501} {"train_loss": -41.40592575073242, "global_step": 181644, "epoch": 1501} {"train_loss": -42.338436126708984, "global_step": 181645, "epoch": 1501} {"train_loss": -41.07612609863281, "global_step": 181646, "epoch": 1501} {"train_loss": -41.98828125, "global_step": 181647, "epoch": 1501} {"train_loss": -41.92026901245117, "global_step": 181648, "epoch": 1501} {"train_loss": -41.53359603881836, "global_step": 181649, "epoch": 1501} {"train_loss": -42.5637321472168, "global_step": 181650, "epoch": 1501} {"train_loss": -39.48040771484375, "global_step": 181651, "epoch": 1501} {"train_loss": -41.99123764038086, "global_step": 181652, "epoch": 1501} {"train_loss": -41.47343063354492, "global_step": 181653, "epoch": 1501} {"train_loss": -41.579524993896484, "global_step": 181654, "epoch": 1501} {"train_loss": -41.18842315673828, "global_step": 181655, "epoch": 1501} {"train_loss": -40.73857498168945, "global_step": 181656, "epoch": 1501} {"train_loss": -41.211734771728516, "global_step": 181657, "epoch": 1501} {"train_loss": -42.23855209350586, "global_step": 181658, "epoch": 1501} {"train_loss": -41.89399337768555, "global_step": 181659, "epoch": 1501} {"train_loss": -42.27616500854492, "global_step": 181660, "epoch": 1501} {"train_loss": -42.350765228271484, "global_step": 181661, "epoch": 1501} {"train_loss": -41.26076889038086, "global_step": 181662, "epoch": 1501} {"train_loss": -40.87117385864258, "global_step": 181663, "epoch": 1501} {"train_loss": -40.7305793762207, "global_step": 181664, "epoch": 1501} {"train_loss": -41.97170639038086, "global_step": 181665, "epoch": 1501} {"train_loss": -41.00880813598633, "global_step": 181666, "epoch": 1501} {"train_loss": -40.45993423461914, "global_step": 181667, "epoch": 1501} {"train_loss": -40.032657623291016, "global_step": 181668, "epoch": 1501} {"train_loss": -41.16911697387695, "global_step": 181669, "epoch": 1501} {"train_loss": -40.635433197021484, "global_step": 181670, "epoch": 1501} {"train_loss": -39.25934982299805, "global_step": 181671, "epoch": 1501} {"train_loss": -42.031429290771484, "global_step": 181672, "epoch": 1501} {"train_loss": -41.258689880371094, "global_step": 181673, "epoch": 1501} {"train_loss": -40.09359359741211, "global_step": 181674, "epoch": 1501} {"train_loss": -37.37458419799805, "global_step": 181675, "epoch": 1501} {"train_loss": -40.61392593383789, "global_step": 181676, "epoch": 1501} {"train_loss": -35.286407470703125, "global_step": 181677, "epoch": 1501} {"train_loss": -35.327980041503906, "global_step": 181678, "epoch": 1501} {"train_loss": -36.46665573120117, "global_step": 181679, "epoch": 1501} {"train_loss": -35.65428161621094, "global_step": 181680, "epoch": 1501} {"train_loss": -36.6302375793457, "global_step": 181681, "epoch": 1501} {"train_loss": -36.41119384765625, "global_step": 181682, "epoch": 1501} {"train_loss": -35.86003494262695, "global_step": 181683, "epoch": 1501} {"train_loss": -36.83118438720703, "global_step": 181684, "epoch": 1501} {"train_loss": -36.34022903442383, "global_step": 181685, "epoch": 1501} {"train_loss": -36.35517883300781, "global_step": 181686, "epoch": 1501} {"train_loss": -36.691375732421875, "global_step": 181687, "epoch": 1501} {"train_loss": -36.95151901245117, "global_step": 181688, "epoch": 1501} {"train_loss": -36.93015670776367, "global_step": 181689, "epoch": 1501} {"train_loss": -36.51206588745117, "global_step": 181690, "epoch": 1501} {"train_loss": -37.23799514770508, "global_step": 181691, "epoch": 1501} {"train_loss": -36.93568420410156, "global_step": 181692, "epoch": 1501} {"train_loss": -34.47581100463867, "global_step": 181693, "epoch": 1501} {"train_loss": -37.98966598510742, "global_step": 181694, "epoch": 1501} {"train_loss": -36.97278594970703, "global_step": 181695, "epoch": 1501} {"train_loss": -34.0275993347168, "global_step": 181696, "epoch": 1501} {"train_loss": -35.133480072021484, "global_step": 181697, "epoch": 1501} {"train_loss": -37.74201583862305, "global_step": 181698, "epoch": 1501} {"train_loss": -33.67009735107422, "global_step": 181699, "epoch": 1501} {"train_loss": -36.27821731567383, "global_step": 181700, "epoch": 1501} {"train_loss": -36.899940490722656, "global_step": 181701, "epoch": 1501} {"train_loss": -34.237709045410156, "global_step": 181702, "epoch": 1501} {"train_loss": -37.86330032348633, "global_step": 181703, "epoch": 1501} {"train_loss": -36.22368240356445, "global_step": 181704, "epoch": 1501} {"train_loss": -36.37663269042969, "global_step": 181705, "epoch": 1501} {"train_loss": -34.13179397583008, "global_step": 181706, "epoch": 1501} {"train_loss": -31.40203857421875, "global_step": 181707, "epoch": 1501} {"train_loss": -34.84931182861328, "global_step": 181708, "epoch": 1501} {"train_loss": -35.373863220214844, "global_step": 181709, "epoch": 1501} {"train_loss": -34.737449645996094, "global_step": 181710, "epoch": 1501} {"train_loss": -31.84214210510254, "global_step": 181711, "epoch": 1501} {"train_loss": -34.262840270996094, "global_step": 181712, "epoch": 1501} {"train_loss": -36.713714599609375, "global_step": 181713, "epoch": 1501} {"train_loss": -34.183074951171875, "global_step": 181714, "epoch": 1501} {"train_loss": -30.5895938873291, "global_step": 181715, "epoch": 1501} {"train_loss": -33.88271713256836, "global_step": 181716, "epoch": 1501} {"train_loss": -29.9572811126709, "global_step": 181717, "epoch": 1501} {"train_loss": -36.553184509277344, "global_step": 181718, "epoch": 1501} {"train_loss": -33.167266845703125, "global_step": 181719, "epoch": 1501} {"train_loss": -36.42332077026367, "global_step": 181720, "epoch": 1501} {"train_loss": -35.10291290283203, "global_step": 181721, "epoch": 1501} {"train_loss": -34.3448486328125, "global_step": 181722, "epoch": 1501} {"train_loss": -33.76668167114258, "global_step": 181723, "epoch": 1501} {"train_loss": -35.71321487426758, "global_step": 181724, "epoch": 1501} {"train_loss": -35.969146728515625, "global_step": 181725, "epoch": 1501} {"train_loss": -34.55183792114258, "global_step": 181726, "epoch": 1501} {"train_loss": -35.15912628173828, "global_step": 181727, "epoch": 1501} {"train_loss": -34.9792366027832, "global_step": 181728, "epoch": 1501} {"train_loss": -32.786861419677734, "global_step": 181729, "epoch": 1501} {"train_loss": -36.47096252441406, "global_step": 181730, "epoch": 1501} {"train_loss": -35.5523681640625, "global_step": 181731, "epoch": 1501} {"train_loss": -36.881160736083984, "global_step": 181732, "epoch": 1501} {"train_loss": -35.45285415649414, "global_step": 181733, "epoch": 1501} {"train_loss": -35.93441390991211, "global_step": 181734, "epoch": 1501} {"train_loss": -34.20049285888672, "global_step": 181735, "epoch": 1501} {"train_loss": -36.62430953979492, "global_step": 181736, "epoch": 1501} {"train_loss": -37.297210693359375, "global_step": 181737, "epoch": 1501} {"train_loss": -36.627891540527344, "global_step": 181738, "epoch": 1501} {"train_loss": -35.49782943725586, "global_step": 181739, "epoch": 1501} {"train_loss": -36.417293548583984, "global_step": 181740, "epoch": 1501} {"train_loss": -38.20765233630976, "global_step": 181741, "epoch": 1501, "val_loss": 2757613.25} {"train_loss": -34.330074310302734, "global_step": 181742, "epoch": 1502} {"train_loss": -37.504215240478516, "global_step": 181743, "epoch": 1502} {"train_loss": -36.810699462890625, "global_step": 181744, "epoch": 1502} {"train_loss": -36.42885971069336, "global_step": 181745, "epoch": 1502} {"train_loss": -37.32382583618164, "global_step": 181746, "epoch": 1502} {"train_loss": -37.11376190185547, "global_step": 181747, "epoch": 1502} {"train_loss": -36.48482131958008, "global_step": 181748, "epoch": 1502} {"train_loss": -36.94511795043945, "global_step": 181749, "epoch": 1502} {"train_loss": -36.40808868408203, "global_step": 181750, "epoch": 1502} {"train_loss": -37.887306213378906, "global_step": 181751, "epoch": 1502} {"train_loss": -37.38766860961914, "global_step": 181752, "epoch": 1502} {"train_loss": -38.363739013671875, "global_step": 181753, "epoch": 1502} {"train_loss": -35.58138656616211, "global_step": 181754, "epoch": 1502} {"train_loss": -37.532283782958984, "global_step": 181755, "epoch": 1502} {"train_loss": -36.0691032409668, "global_step": 181756, "epoch": 1502} {"train_loss": -38.1009635925293, "global_step": 181757, "epoch": 1502} {"train_loss": -38.25741195678711, "global_step": 181758, "epoch": 1502} {"train_loss": -37.08906173706055, "global_step": 181759, "epoch": 1502} {"train_loss": -38.12324142456055, "global_step": 181760, "epoch": 1502} {"train_loss": -38.135528564453125, "global_step": 181761, "epoch": 1502} {"train_loss": -38.13100814819336, "global_step": 181762, "epoch": 1502} {"train_loss": -37.52297592163086, "global_step": 181763, "epoch": 1502} {"train_loss": -38.69642639160156, "global_step": 181764, "epoch": 1502} {"train_loss": -38.834571838378906, "global_step": 181765, "epoch": 1502} {"train_loss": -38.16556930541992, "global_step": 181766, "epoch": 1502} {"train_loss": -37.8067741394043, "global_step": 181767, "epoch": 1502} {"train_loss": -38.21809768676758, "global_step": 181768, "epoch": 1502} {"train_loss": -38.55416488647461, "global_step": 181769, "epoch": 1502} {"train_loss": -39.020233154296875, "global_step": 181770, "epoch": 1502} {"train_loss": -38.500953674316406, "global_step": 181771, "epoch": 1502} {"train_loss": -38.90415573120117, "global_step": 181772, "epoch": 1502} {"train_loss": -38.3115119934082, "global_step": 181773, "epoch": 1502} {"train_loss": -38.93740463256836, "global_step": 181774, "epoch": 1502} {"train_loss": -38.926177978515625, "global_step": 181775, "epoch": 1502} {"train_loss": -39.312744140625, "global_step": 181776, "epoch": 1502} {"train_loss": -39.21657943725586, "global_step": 181777, "epoch": 1502} {"train_loss": -39.228515625, "global_step": 181778, "epoch": 1502} {"train_loss": -38.530982971191406, "global_step": 181779, "epoch": 1502} {"train_loss": -38.91126251220703, "global_step": 181780, "epoch": 1502} {"train_loss": -38.7670783996582, "global_step": 181781, "epoch": 1502} {"train_loss": -39.436363220214844, "global_step": 181782, "epoch": 1502} {"train_loss": -39.61851119995117, "global_step": 181783, "epoch": 1502} {"train_loss": -37.6246223449707, "global_step": 181784, "epoch": 1502} {"train_loss": -39.128902435302734, "global_step": 181785, "epoch": 1502} {"train_loss": -39.572357177734375, "global_step": 181786, "epoch": 1502} {"train_loss": -37.93767166137695, "global_step": 181787, "epoch": 1502} {"train_loss": -34.02872085571289, "global_step": 181788, "epoch": 1502} {"train_loss": -28.61759376525879, "global_step": 181789, "epoch": 1502} {"train_loss": -32.12687301635742, "global_step": 181790, "epoch": 1502} {"train_loss": -39.94920349121094, "global_step": 181791, "epoch": 1502} {"train_loss": -34.91706085205078, "global_step": 181792, "epoch": 1502} {"train_loss": -38.05353927612305, "global_step": 181793, "epoch": 1502} {"train_loss": -37.151912689208984, "global_step": 181794, "epoch": 1502} {"train_loss": -38.99787521362305, "global_step": 181795, "epoch": 1502} {"train_loss": -37.42300033569336, "global_step": 181796, "epoch": 1502} {"train_loss": -39.249244689941406, "global_step": 181797, "epoch": 1502} {"train_loss": -37.66067123413086, "global_step": 181798, "epoch": 1502} {"train_loss": -39.76264953613281, "global_step": 181799, "epoch": 1502} {"train_loss": -38.27269744873047, "global_step": 181800, "epoch": 1502} {"train_loss": -38.976104736328125, "global_step": 181801, "epoch": 1502} {"train_loss": -38.82491683959961, "global_step": 181802, "epoch": 1502} {"train_loss": -39.453670501708984, "global_step": 181803, "epoch": 1502} {"train_loss": -39.278419494628906, "global_step": 181804, "epoch": 1502} {"train_loss": -39.35337829589844, "global_step": 181805, "epoch": 1502} {"train_loss": -39.5943717956543, "global_step": 181806, "epoch": 1502} {"train_loss": -39.23714828491211, "global_step": 181807, "epoch": 1502} {"train_loss": -38.59334945678711, "global_step": 181808, "epoch": 1502} {"train_loss": -39.06856155395508, "global_step": 181809, "epoch": 1502} {"train_loss": -39.884334564208984, "global_step": 181810, "epoch": 1502} {"train_loss": -39.54769515991211, "global_step": 181811, "epoch": 1502} {"train_loss": -39.37158203125, "global_step": 181812, "epoch": 1502} {"train_loss": -39.59844970703125, "global_step": 181813, "epoch": 1502} {"train_loss": -38.275611877441406, "global_step": 181814, "epoch": 1502} {"train_loss": -39.98683547973633, "global_step": 181815, "epoch": 1502} {"train_loss": -40.109859466552734, "global_step": 181816, "epoch": 1502} {"train_loss": -40.04806900024414, "global_step": 181817, "epoch": 1502} {"train_loss": -40.230224609375, "global_step": 181818, "epoch": 1502} {"train_loss": -39.768489837646484, "global_step": 181819, "epoch": 1502} {"train_loss": -39.62157440185547, "global_step": 181820, "epoch": 1502} {"train_loss": -36.4815559387207, "global_step": 181821, "epoch": 1502} {"train_loss": -32.62910079956055, "global_step": 181822, "epoch": 1502} {"train_loss": -37.84574508666992, "global_step": 181823, "epoch": 1502} {"train_loss": -36.50878143310547, "global_step": 181824, "epoch": 1502} {"train_loss": -37.83869552612305, "global_step": 181825, "epoch": 1502} {"train_loss": -39.05683517456055, "global_step": 181826, "epoch": 1502} {"train_loss": -38.46541213989258, "global_step": 181827, "epoch": 1502} {"train_loss": -39.75227355957031, "global_step": 181828, "epoch": 1502} {"train_loss": -38.19851303100586, "global_step": 181829, "epoch": 1502} {"train_loss": -39.485713958740234, "global_step": 181830, "epoch": 1502} {"train_loss": -39.18278884887695, "global_step": 181831, "epoch": 1502} {"train_loss": -39.20489501953125, "global_step": 181832, "epoch": 1502} {"train_loss": -39.026268005371094, "global_step": 181833, "epoch": 1502} {"train_loss": -39.468719482421875, "global_step": 181834, "epoch": 1502} {"train_loss": -39.100318908691406, "global_step": 181835, "epoch": 1502} {"train_loss": -39.53532791137695, "global_step": 181836, "epoch": 1502} {"train_loss": -39.56591796875, "global_step": 181837, "epoch": 1502} {"train_loss": -39.64352798461914, "global_step": 181838, "epoch": 1502} {"train_loss": -38.9615364074707, "global_step": 181839, "epoch": 1502} {"train_loss": -39.57992172241211, "global_step": 181840, "epoch": 1502} {"train_loss": -40.21479415893555, "global_step": 181841, "epoch": 1502} {"train_loss": -39.24761962890625, "global_step": 181842, "epoch": 1502} {"train_loss": -40.12898635864258, "global_step": 181843, "epoch": 1502} {"train_loss": -39.232906341552734, "global_step": 181844, "epoch": 1502} {"train_loss": -38.236358642578125, "global_step": 181845, "epoch": 1502} {"train_loss": -39.50407028198242, "global_step": 181846, "epoch": 1502} {"train_loss": -38.447261810302734, "global_step": 181847, "epoch": 1502} {"train_loss": -39.3554801940918, "global_step": 181848, "epoch": 1502} {"train_loss": -39.220489501953125, "global_step": 181849, "epoch": 1502} {"train_loss": -38.55147933959961, "global_step": 181850, "epoch": 1502} {"train_loss": -40.05109405517578, "global_step": 181851, "epoch": 1502} {"train_loss": -38.870033264160156, "global_step": 181852, "epoch": 1502} {"train_loss": -40.1356086730957, "global_step": 181853, "epoch": 1502} {"train_loss": -39.23314666748047, "global_step": 181854, "epoch": 1502} {"train_loss": -39.88956832885742, "global_step": 181855, "epoch": 1502} {"train_loss": -37.68023681640625, "global_step": 181856, "epoch": 1502} {"train_loss": -39.11440658569336, "global_step": 181857, "epoch": 1502} {"train_loss": -39.05472183227539, "global_step": 181858, "epoch": 1502} {"train_loss": -38.052513122558594, "global_step": 181859, "epoch": 1502} {"train_loss": -35.76978302001953, "global_step": 181860, "epoch": 1502} {"train_loss": -38.58209228515625, "global_step": 181861, "epoch": 1502} {"train_loss": -38.3534687609712, "global_step": 181862, "epoch": 1502, "val_loss": 2680050.5} {"train_loss": -37.00995635986328, "global_step": 181863, "epoch": 1503} {"train_loss": -36.38277053833008, "global_step": 181864, "epoch": 1503} {"train_loss": -35.682952880859375, "global_step": 181865, "epoch": 1503} {"train_loss": -37.24395751953125, "global_step": 181866, "epoch": 1503} {"train_loss": -38.65114974975586, "global_step": 181867, "epoch": 1503} {"train_loss": -37.891387939453125, "global_step": 181868, "epoch": 1503} {"train_loss": -35.21242904663086, "global_step": 181869, "epoch": 1503} {"train_loss": -34.959957122802734, "global_step": 181870, "epoch": 1503} {"train_loss": -39.06643295288086, "global_step": 181871, "epoch": 1503} {"train_loss": -38.509033203125, "global_step": 181872, "epoch": 1503} {"train_loss": -38.1773796081543, "global_step": 181873, "epoch": 1503} {"train_loss": -35.73047637939453, "global_step": 181874, "epoch": 1503} {"train_loss": -38.7401237487793, "global_step": 181875, "epoch": 1503} {"train_loss": -38.3598518371582, "global_step": 181876, "epoch": 1503} {"train_loss": -36.5445671081543, "global_step": 181877, "epoch": 1503} {"train_loss": -37.5258903503418, "global_step": 181878, "epoch": 1503} {"train_loss": -31.451520919799805, "global_step": 181879, "epoch": 1503} {"train_loss": -37.386199951171875, "global_step": 181880, "epoch": 1503} {"train_loss": -38.16150665283203, "global_step": 181881, "epoch": 1503} {"train_loss": -38.74087142944336, "global_step": 181882, "epoch": 1503} {"train_loss": -35.857757568359375, "global_step": 181883, "epoch": 1503} {"train_loss": -35.92219924926758, "global_step": 181884, "epoch": 1503} {"train_loss": -35.26968765258789, "global_step": 181885, "epoch": 1503} {"train_loss": -35.339874267578125, "global_step": 181886, "epoch": 1503} {"train_loss": -36.78043746948242, "global_step": 181887, "epoch": 1503} {"train_loss": -37.83073806762695, "global_step": 181888, "epoch": 1503} {"train_loss": -37.81843185424805, "global_step": 181889, "epoch": 1503} {"train_loss": -37.10807418823242, "global_step": 181890, "epoch": 1503} {"train_loss": -37.564300537109375, "global_step": 181891, "epoch": 1503} {"train_loss": -31.65872573852539, "global_step": 181892, "epoch": 1503} {"train_loss": -36.162025451660156, "global_step": 181893, "epoch": 1503} {"train_loss": -36.666988372802734, "global_step": 181894, "epoch": 1503} {"train_loss": -38.091278076171875, "global_step": 181895, "epoch": 1503} {"train_loss": -37.115848541259766, "global_step": 181896, "epoch": 1503} {"train_loss": -37.95436096191406, "global_step": 181897, "epoch": 1503} {"train_loss": -38.12580490112305, "global_step": 181898, "epoch": 1503} {"train_loss": -37.790889739990234, "global_step": 181899, "epoch": 1503} {"train_loss": -36.86759567260742, "global_step": 181900, "epoch": 1503} {"train_loss": -37.12224197387695, "global_step": 181901, "epoch": 1503} {"train_loss": -38.41180419921875, "global_step": 181902, "epoch": 1503} {"train_loss": -36.40082931518555, "global_step": 181903, "epoch": 1503} {"train_loss": -37.07441711425781, "global_step": 181904, "epoch": 1503} {"train_loss": -37.368064880371094, "global_step": 181905, "epoch": 1503} {"train_loss": -37.82951736450195, "global_step": 181906, "epoch": 1503} {"train_loss": -38.7659797668457, "global_step": 181907, "epoch": 1503} {"train_loss": -38.366302490234375, "global_step": 181908, "epoch": 1503} {"train_loss": -37.9296760559082, "global_step": 181909, "epoch": 1503} {"train_loss": -38.7706298828125, "global_step": 181910, "epoch": 1503} {"train_loss": -38.554481506347656, "global_step": 181911, "epoch": 1503} {"train_loss": -38.044063568115234, "global_step": 181912, "epoch": 1503} {"train_loss": -38.940555572509766, "global_step": 181913, "epoch": 1503} {"train_loss": -37.47105026245117, "global_step": 181914, "epoch": 1503} {"train_loss": -37.724273681640625, "global_step": 181915, "epoch": 1503} {"train_loss": -38.24946212768555, "global_step": 181916, "epoch": 1503} {"train_loss": -39.18032455444336, "global_step": 181917, "epoch": 1503} {"train_loss": -39.06493377685547, "global_step": 181918, "epoch": 1503} {"train_loss": -38.54891586303711, "global_step": 181919, "epoch": 1503} {"train_loss": -37.941810607910156, "global_step": 181920, "epoch": 1503} {"train_loss": -38.94672393798828, "global_step": 181921, "epoch": 1503} {"train_loss": -39.21709442138672, "global_step": 181922, "epoch": 1503} {"train_loss": -38.380104064941406, "global_step": 181923, "epoch": 1503} {"train_loss": -38.68620681762695, "global_step": 181924, "epoch": 1503} {"train_loss": -37.731380462646484, "global_step": 181925, "epoch": 1503} {"train_loss": -39.340126037597656, "global_step": 181926, "epoch": 1503} {"train_loss": -39.543338775634766, "global_step": 181927, "epoch": 1503} {"train_loss": -33.12486267089844, "global_step": 181928, "epoch": 1503} {"train_loss": -37.97282791137695, "global_step": 181929, "epoch": 1503} {"train_loss": -39.04557800292969, "global_step": 181930, "epoch": 1503} {"train_loss": -37.902591705322266, "global_step": 181931, "epoch": 1503} {"train_loss": -38.758365631103516, "global_step": 181932, "epoch": 1503} {"train_loss": -38.964080810546875, "global_step": 181933, "epoch": 1503} {"train_loss": -39.428829193115234, "global_step": 181934, "epoch": 1503} {"train_loss": -38.7940559387207, "global_step": 181935, "epoch": 1503} {"train_loss": -38.38638687133789, "global_step": 181936, "epoch": 1503} {"train_loss": -38.510440826416016, "global_step": 181937, "epoch": 1503} {"train_loss": -39.20590591430664, "global_step": 181938, "epoch": 1503} {"train_loss": -38.132694244384766, "global_step": 181939, "epoch": 1503} {"train_loss": -38.44871139526367, "global_step": 181940, "epoch": 1503} {"train_loss": -38.126556396484375, "global_step": 181941, "epoch": 1503} {"train_loss": -38.74324417114258, "global_step": 181942, "epoch": 1503} {"train_loss": -38.876800537109375, "global_step": 181943, "epoch": 1503} {"train_loss": -39.14370346069336, "global_step": 181944, "epoch": 1503} {"train_loss": -39.44015884399414, "global_step": 181945, "epoch": 1503} {"train_loss": -38.570980072021484, "global_step": 181946, "epoch": 1503} {"train_loss": -38.997413635253906, "global_step": 181947, "epoch": 1503} {"train_loss": -39.28498077392578, "global_step": 181948, "epoch": 1503} {"train_loss": -38.791316986083984, "global_step": 181949, "epoch": 1503} {"train_loss": -38.442413330078125, "global_step": 181950, "epoch": 1503} {"train_loss": -39.31319808959961, "global_step": 181951, "epoch": 1503} {"train_loss": -39.49319076538086, "global_step": 181952, "epoch": 1503} {"train_loss": -38.243038177490234, "global_step": 181953, "epoch": 1503} {"train_loss": -39.7575569152832, "global_step": 181954, "epoch": 1503} {"train_loss": -39.53965377807617, "global_step": 181955, "epoch": 1503} {"train_loss": -39.217315673828125, "global_step": 181956, "epoch": 1503} {"train_loss": -39.37373733520508, "global_step": 181957, "epoch": 1503} {"train_loss": -39.33022689819336, "global_step": 181958, "epoch": 1503} {"train_loss": -40.072044372558594, "global_step": 181959, "epoch": 1503} {"train_loss": -39.82595443725586, "global_step": 181960, "epoch": 1503} {"train_loss": -39.31608963012695, "global_step": 181961, "epoch": 1503} {"train_loss": -39.3297233581543, "global_step": 181962, "epoch": 1503} {"train_loss": -38.44257736206055, "global_step": 181963, "epoch": 1503} {"train_loss": -39.56425094604492, "global_step": 181964, "epoch": 1503} {"train_loss": -39.40547561645508, "global_step": 181965, "epoch": 1503} {"train_loss": -40.04873275756836, "global_step": 181966, "epoch": 1503} {"train_loss": -39.51603317260742, "global_step": 181967, "epoch": 1503} {"train_loss": -39.37655258178711, "global_step": 181968, "epoch": 1503} {"train_loss": -39.7678337097168, "global_step": 181969, "epoch": 1503} {"train_loss": -39.79887771606445, "global_step": 181970, "epoch": 1503} {"train_loss": -39.843441009521484, "global_step": 181971, "epoch": 1503} {"train_loss": -40.1668815612793, "global_step": 181972, "epoch": 1503} {"train_loss": -39.561180114746094, "global_step": 181973, "epoch": 1503} {"train_loss": -39.88147735595703, "global_step": 181974, "epoch": 1503} {"train_loss": -40.68603515625, "global_step": 181975, "epoch": 1503} {"train_loss": -40.20909881591797, "global_step": 181976, "epoch": 1503} {"train_loss": -39.63543701171875, "global_step": 181977, "epoch": 1503} {"train_loss": -40.296607971191406, "global_step": 181978, "epoch": 1503} {"train_loss": -39.72488021850586, "global_step": 181979, "epoch": 1503} {"train_loss": -40.42540740966797, "global_step": 181980, "epoch": 1503} {"train_loss": -39.57368850708008, "global_step": 181981, "epoch": 1503} {"train_loss": -39.774200439453125, "global_step": 181982, "epoch": 1503} {"train_loss": -38.252330827318936, "global_step": 181983, "epoch": 1503, "val_loss": 2678643.0} {"train_loss": -39.440425872802734, "global_step": 181984, "epoch": 1504} {"train_loss": -39.635902404785156, "global_step": 181985, "epoch": 1504} {"train_loss": -40.24859619140625, "global_step": 181986, "epoch": 1504} {"train_loss": -39.48228454589844, "global_step": 181987, "epoch": 1504} {"train_loss": -38.317604064941406, "global_step": 181988, "epoch": 1504} {"train_loss": -38.09235763549805, "global_step": 181989, "epoch": 1504} {"train_loss": -39.20695877075195, "global_step": 181990, "epoch": 1504} {"train_loss": -39.81315231323242, "global_step": 181991, "epoch": 1504} {"train_loss": -40.43410110473633, "global_step": 181992, "epoch": 1504} {"train_loss": -39.76332092285156, "global_step": 181993, "epoch": 1504} {"train_loss": -39.877593994140625, "global_step": 181994, "epoch": 1504} {"train_loss": -40.18988800048828, "global_step": 181995, "epoch": 1504} {"train_loss": -40.245784759521484, "global_step": 181996, "epoch": 1504} {"train_loss": -40.18628692626953, "global_step": 181997, "epoch": 1504} {"train_loss": -39.864105224609375, "global_step": 181998, "epoch": 1504} {"train_loss": -40.47364807128906, "global_step": 181999, "epoch": 1504} {"train_loss": -40.37885665893555, "global_step": 182000, "epoch": 1504} {"train_loss": -40.537864685058594, "global_step": 182001, "epoch": 1504} {"train_loss": -40.85908126831055, "global_step": 182002, "epoch": 1504} {"train_loss": -40.312782287597656, "global_step": 182003, "epoch": 1504} {"train_loss": -40.823585510253906, "global_step": 182004, "epoch": 1504} {"train_loss": -40.780433654785156, "global_step": 182005, "epoch": 1504} {"train_loss": -41.12494659423828, "global_step": 182006, "epoch": 1504} {"train_loss": -40.48928451538086, "global_step": 182007, "epoch": 1504} {"train_loss": -40.075252532958984, "global_step": 182008, "epoch": 1504} {"train_loss": -40.82756423950195, "global_step": 182009, "epoch": 1504} {"train_loss": -41.00638961791992, "global_step": 182010, "epoch": 1504} {"train_loss": -40.93037796020508, "global_step": 182011, "epoch": 1504} {"train_loss": -41.02993392944336, "global_step": 182012, "epoch": 1504} {"train_loss": -40.906349182128906, "global_step": 182013, "epoch": 1504} {"train_loss": -41.0272216796875, "global_step": 182014, "epoch": 1504} {"train_loss": -41.13797378540039, "global_step": 182015, "epoch": 1504} {"train_loss": -40.99052047729492, "global_step": 182016, "epoch": 1504} {"train_loss": -41.11541748046875, "global_step": 182017, "epoch": 1504} {"train_loss": -41.25452423095703, "global_step": 182018, "epoch": 1504} {"train_loss": -40.70683670043945, "global_step": 182019, "epoch": 1504} {"train_loss": -40.92854690551758, "global_step": 182020, "epoch": 1504} {"train_loss": -40.41590118408203, "global_step": 182021, "epoch": 1504} {"train_loss": -41.57377243041992, "global_step": 182022, "epoch": 1504} {"train_loss": -40.7241096496582, "global_step": 182023, "epoch": 1504} {"train_loss": -40.97352600097656, "global_step": 182024, "epoch": 1504} {"train_loss": -40.542091369628906, "global_step": 182025, "epoch": 1504} {"train_loss": -41.42903137207031, "global_step": 182026, "epoch": 1504} {"train_loss": -41.01699447631836, "global_step": 182027, "epoch": 1504} {"train_loss": -40.74002456665039, "global_step": 182028, "epoch": 1504} {"train_loss": -40.095489501953125, "global_step": 182029, "epoch": 1504} {"train_loss": -40.477012634277344, "global_step": 182030, "epoch": 1504} {"train_loss": -40.5482292175293, "global_step": 182031, "epoch": 1504} {"train_loss": -40.8442497253418, "global_step": 182032, "epoch": 1504} {"train_loss": -40.06611633300781, "global_step": 182033, "epoch": 1504} {"train_loss": -38.62868118286133, "global_step": 182034, "epoch": 1504} {"train_loss": -39.70071029663086, "global_step": 182035, "epoch": 1504} {"train_loss": -39.61629867553711, "global_step": 182036, "epoch": 1504} {"train_loss": -39.60213851928711, "global_step": 182037, "epoch": 1504} {"train_loss": -39.072059631347656, "global_step": 182038, "epoch": 1504} {"train_loss": -39.993534088134766, "global_step": 182039, "epoch": 1504} {"train_loss": -39.12281799316406, "global_step": 182040, "epoch": 1504} {"train_loss": -38.093868255615234, "global_step": 182041, "epoch": 1504} {"train_loss": -34.76510238647461, "global_step": 182042, "epoch": 1504} {"train_loss": -36.728912353515625, "global_step": 182043, "epoch": 1504} {"train_loss": -35.532535552978516, "global_step": 182044, "epoch": 1504} {"train_loss": -34.202640533447266, "global_step": 182045, "epoch": 1504} {"train_loss": -38.3951416015625, "global_step": 182046, "epoch": 1504} {"train_loss": -39.09072494506836, "global_step": 182047, "epoch": 1504} {"train_loss": -39.7962760925293, "global_step": 182048, "epoch": 1504} {"train_loss": -37.5028076171875, "global_step": 182049, "epoch": 1504} {"train_loss": -37.65971755981445, "global_step": 182050, "epoch": 1504} {"train_loss": -39.2391357421875, "global_step": 182051, "epoch": 1504} {"train_loss": -38.89522171020508, "global_step": 182052, "epoch": 1504} {"train_loss": -37.69057846069336, "global_step": 182053, "epoch": 1504} {"train_loss": -37.40700912475586, "global_step": 182054, "epoch": 1504} {"train_loss": -38.03805160522461, "global_step": 182055, "epoch": 1504} {"train_loss": -38.66361618041992, "global_step": 182056, "epoch": 1504} {"train_loss": -38.0926513671875, "global_step": 182057, "epoch": 1504} {"train_loss": -39.21269989013672, "global_step": 182058, "epoch": 1504} {"train_loss": -38.59519577026367, "global_step": 182059, "epoch": 1504} {"train_loss": -38.39429473876953, "global_step": 182060, "epoch": 1504} {"train_loss": -38.06584548950195, "global_step": 182061, "epoch": 1504} {"train_loss": -39.13399124145508, "global_step": 182062, "epoch": 1504} {"train_loss": -35.5325813293457, "global_step": 182063, "epoch": 1504} {"train_loss": -36.8823127746582, "global_step": 182064, "epoch": 1504} {"train_loss": -38.263763427734375, "global_step": 182065, "epoch": 1504} {"train_loss": -37.62904739379883, "global_step": 182066, "epoch": 1504} {"train_loss": -38.91749572753906, "global_step": 182067, "epoch": 1504} {"train_loss": -37.762020111083984, "global_step": 182068, "epoch": 1504} {"train_loss": -36.86863327026367, "global_step": 182069, "epoch": 1504} {"train_loss": -29.500091552734375, "global_step": 182070, "epoch": 1504} {"train_loss": -37.723915100097656, "global_step": 182071, "epoch": 1504} {"train_loss": -37.522560119628906, "global_step": 182072, "epoch": 1504} {"train_loss": -37.978031158447266, "global_step": 182073, "epoch": 1504} {"train_loss": -38.642555236816406, "global_step": 182074, "epoch": 1504} {"train_loss": -38.712032318115234, "global_step": 182075, "epoch": 1504} {"train_loss": -34.19356155395508, "global_step": 182076, "epoch": 1504} {"train_loss": -36.60287094116211, "global_step": 182077, "epoch": 1504} {"train_loss": -37.99813461303711, "global_step": 182078, "epoch": 1504} {"train_loss": -37.32340621948242, "global_step": 182079, "epoch": 1504} {"train_loss": -38.76143264770508, "global_step": 182080, "epoch": 1504} {"train_loss": -39.723026275634766, "global_step": 182081, "epoch": 1504} {"train_loss": -37.39325714111328, "global_step": 182082, "epoch": 1504} {"train_loss": -39.42348861694336, "global_step": 182083, "epoch": 1504} {"train_loss": -37.97782516479492, "global_step": 182084, "epoch": 1504} {"train_loss": -36.89066696166992, "global_step": 182085, "epoch": 1504} {"train_loss": -39.401100158691406, "global_step": 182086, "epoch": 1504} {"train_loss": -39.135040283203125, "global_step": 182087, "epoch": 1504} {"train_loss": -39.126190185546875, "global_step": 182088, "epoch": 1504} {"train_loss": -37.686336517333984, "global_step": 182089, "epoch": 1504} {"train_loss": -38.7952995300293, "global_step": 182090, "epoch": 1504} {"train_loss": -38.7578239440918, "global_step": 182091, "epoch": 1504} {"train_loss": -39.7009391784668, "global_step": 182092, "epoch": 1504} {"train_loss": -37.53385543823242, "global_step": 182093, "epoch": 1504} {"train_loss": -39.10110092163086, "global_step": 182094, "epoch": 1504} {"train_loss": -39.597412109375, "global_step": 182095, "epoch": 1504} {"train_loss": -39.6623420715332, "global_step": 182096, "epoch": 1504} {"train_loss": -38.76730728149414, "global_step": 182097, "epoch": 1504} {"train_loss": -39.38431167602539, "global_step": 182098, "epoch": 1504} {"train_loss": -39.481689453125, "global_step": 182099, "epoch": 1504} {"train_loss": -39.20927810668945, "global_step": 182100, "epoch": 1504} {"train_loss": -39.31366729736328, "global_step": 182101, "epoch": 1504} {"train_loss": -39.54609298706055, "global_step": 182102, "epoch": 1504} {"train_loss": -39.40949630737305, "global_step": 182103, "epoch": 1504} {"train_loss": -39.102191578258164, "global_step": 182104, "epoch": 1504, "val_loss": 2699643.25} {"train_loss": -39.99515914916992, "global_step": 182105, "epoch": 1505} {"train_loss": -39.89446258544922, "global_step": 182106, "epoch": 1505} {"train_loss": -40.007144927978516, "global_step": 182107, "epoch": 1505} {"train_loss": -39.5792350769043, "global_step": 182108, "epoch": 1505} {"train_loss": -39.48605728149414, "global_step": 182109, "epoch": 1505} {"train_loss": -39.1682014465332, "global_step": 182110, "epoch": 1505} {"train_loss": -39.98428726196289, "global_step": 182111, "epoch": 1505} {"train_loss": -39.59072494506836, "global_step": 182112, "epoch": 1505} {"train_loss": -39.09250259399414, "global_step": 182113, "epoch": 1505} {"train_loss": -39.2213020324707, "global_step": 182114, "epoch": 1505} {"train_loss": -40.035308837890625, "global_step": 182115, "epoch": 1505} {"train_loss": -39.45676803588867, "global_step": 182116, "epoch": 1505} {"train_loss": -39.421913146972656, "global_step": 182117, "epoch": 1505} {"train_loss": -40.00010299682617, "global_step": 182118, "epoch": 1505} {"train_loss": -39.50034713745117, "global_step": 182119, "epoch": 1505} {"train_loss": -40.30093002319336, "global_step": 182120, "epoch": 1505} {"train_loss": -39.60183334350586, "global_step": 182121, "epoch": 1505} {"train_loss": -40.343082427978516, "global_step": 182122, "epoch": 1505} {"train_loss": -39.530372619628906, "global_step": 182123, "epoch": 1505} {"train_loss": -39.88979721069336, "global_step": 182124, "epoch": 1505} {"train_loss": -39.31940841674805, "global_step": 182125, "epoch": 1505} {"train_loss": -40.43546676635742, "global_step": 182126, "epoch": 1505} {"train_loss": -39.9228401184082, "global_step": 182127, "epoch": 1505} {"train_loss": -40.02235794067383, "global_step": 182128, "epoch": 1505} {"train_loss": -39.2623405456543, "global_step": 182129, "epoch": 1505} {"train_loss": -39.91944885253906, "global_step": 182130, "epoch": 1505} {"train_loss": -40.12190246582031, "global_step": 182131, "epoch": 1505} {"train_loss": -40.29606246948242, "global_step": 182132, "epoch": 1505} {"train_loss": -40.42401123046875, "global_step": 182133, "epoch": 1505} {"train_loss": -39.57137680053711, "global_step": 182134, "epoch": 1505} {"train_loss": -39.364620208740234, "global_step": 182135, "epoch": 1505} {"train_loss": -40.38811111450195, "global_step": 182136, "epoch": 1505} {"train_loss": -40.54024887084961, "global_step": 182137, "epoch": 1505} {"train_loss": -40.98970413208008, "global_step": 182138, "epoch": 1505} {"train_loss": -40.26066589355469, "global_step": 182139, "epoch": 1505} {"train_loss": -40.46714782714844, "global_step": 182140, "epoch": 1505} {"train_loss": -40.66010284423828, "global_step": 182141, "epoch": 1505} {"train_loss": -40.18543243408203, "global_step": 182142, "epoch": 1505} {"train_loss": -40.388336181640625, "global_step": 182143, "epoch": 1505} {"train_loss": -40.44668197631836, "global_step": 182144, "epoch": 1505} {"train_loss": -40.33864212036133, "global_step": 182145, "epoch": 1505} {"train_loss": -40.67011642456055, "global_step": 182146, "epoch": 1505} {"train_loss": -40.19312286376953, "global_step": 182147, "epoch": 1505} {"train_loss": -40.73795700073242, "global_step": 182148, "epoch": 1505} {"train_loss": -40.1539192199707, "global_step": 182149, "epoch": 1505} {"train_loss": -39.84374237060547, "global_step": 182150, "epoch": 1505} {"train_loss": -40.82483673095703, "global_step": 182151, "epoch": 1505} {"train_loss": -40.789798736572266, "global_step": 182152, "epoch": 1505} {"train_loss": -40.997314453125, "global_step": 182153, "epoch": 1505} {"train_loss": -40.74155807495117, "global_step": 182154, "epoch": 1505} {"train_loss": -40.506072998046875, "global_step": 182155, "epoch": 1505} {"train_loss": -39.41787338256836, "global_step": 182156, "epoch": 1505} {"train_loss": -38.920223236083984, "global_step": 182157, "epoch": 1505} {"train_loss": -40.28097152709961, "global_step": 182158, "epoch": 1505} {"train_loss": -40.615909576416016, "global_step": 182159, "epoch": 1505} {"train_loss": -39.096046447753906, "global_step": 182160, "epoch": 1505} {"train_loss": -40.62716293334961, "global_step": 182161, "epoch": 1505} {"train_loss": -40.384315490722656, "global_step": 182162, "epoch": 1505} {"train_loss": -40.20882797241211, "global_step": 182163, "epoch": 1505} {"train_loss": -40.7775993347168, "global_step": 182164, "epoch": 1505} {"train_loss": -40.34040451049805, "global_step": 182165, "epoch": 1505} {"train_loss": -41.050086975097656, "global_step": 182166, "epoch": 1505} {"train_loss": -40.67961502075195, "global_step": 182167, "epoch": 1505} {"train_loss": -40.79880905151367, "global_step": 182168, "epoch": 1505} {"train_loss": -40.10427474975586, "global_step": 182169, "epoch": 1505} {"train_loss": -40.32832717895508, "global_step": 182170, "epoch": 1505} {"train_loss": -40.587989807128906, "global_step": 182171, "epoch": 1505} {"train_loss": -38.354896545410156, "global_step": 182172, "epoch": 1505} {"train_loss": -36.8005485534668, "global_step": 182173, "epoch": 1505} {"train_loss": -40.24358367919922, "global_step": 182174, "epoch": 1505} {"train_loss": -38.558013916015625, "global_step": 182175, "epoch": 1505} {"train_loss": -40.61020278930664, "global_step": 182176, "epoch": 1505} {"train_loss": -37.21604537963867, "global_step": 182177, "epoch": 1505} {"train_loss": -38.517295837402344, "global_step": 182178, "epoch": 1505} {"train_loss": -39.40139389038086, "global_step": 182179, "epoch": 1505} {"train_loss": -40.12639236450195, "global_step": 182180, "epoch": 1505} {"train_loss": -39.5001335144043, "global_step": 182181, "epoch": 1505} {"train_loss": -40.13848876953125, "global_step": 182182, "epoch": 1505} {"train_loss": -38.55999755859375, "global_step": 182183, "epoch": 1505} {"train_loss": -40.389217376708984, "global_step": 182184, "epoch": 1505} {"train_loss": -39.46556854248047, "global_step": 182185, "epoch": 1505} {"train_loss": -39.685569763183594, "global_step": 182186, "epoch": 1505} {"train_loss": -39.76467514038086, "global_step": 182187, "epoch": 1505} {"train_loss": -40.44034957885742, "global_step": 182188, "epoch": 1505} {"train_loss": -38.705257415771484, "global_step": 182189, "epoch": 1505} {"train_loss": -39.66097640991211, "global_step": 182190, "epoch": 1505} {"train_loss": -38.870479583740234, "global_step": 182191, "epoch": 1505} {"train_loss": -39.575923919677734, "global_step": 182192, "epoch": 1505} {"train_loss": -34.18406295776367, "global_step": 182193, "epoch": 1505} {"train_loss": -38.27552032470703, "global_step": 182194, "epoch": 1505} {"train_loss": -38.803436279296875, "global_step": 182195, "epoch": 1505} {"train_loss": -39.08388900756836, "global_step": 182196, "epoch": 1505} {"train_loss": -39.08195114135742, "global_step": 182197, "epoch": 1505} {"train_loss": -39.23191452026367, "global_step": 182198, "epoch": 1505} {"train_loss": -39.6213493347168, "global_step": 182199, "epoch": 1505} {"train_loss": -38.136051177978516, "global_step": 182200, "epoch": 1505} {"train_loss": -39.38723373413086, "global_step": 182201, "epoch": 1505} {"train_loss": -38.37385559082031, "global_step": 182202, "epoch": 1505} {"train_loss": -38.75975799560547, "global_step": 182203, "epoch": 1505} {"train_loss": -37.43706130981445, "global_step": 182204, "epoch": 1505} {"train_loss": -40.04581832885742, "global_step": 182205, "epoch": 1505} {"train_loss": -38.72097396850586, "global_step": 182206, "epoch": 1505} {"train_loss": -37.5984992980957, "global_step": 182207, "epoch": 1505} {"train_loss": -39.816383361816406, "global_step": 182208, "epoch": 1505} {"train_loss": -39.79792022705078, "global_step": 182209, "epoch": 1505} {"train_loss": -39.19571304321289, "global_step": 182210, "epoch": 1505} {"train_loss": -38.708892822265625, "global_step": 182211, "epoch": 1505} {"train_loss": -40.18400955200195, "global_step": 182212, "epoch": 1505} {"train_loss": -37.771759033203125, "global_step": 182213, "epoch": 1505} {"train_loss": -39.574256896972656, "global_step": 182214, "epoch": 1505} {"train_loss": -40.061519622802734, "global_step": 182215, "epoch": 1505} {"train_loss": -40.025550842285156, "global_step": 182216, "epoch": 1505} {"train_loss": -40.24749755859375, "global_step": 182217, "epoch": 1505} {"train_loss": -39.980648040771484, "global_step": 182218, "epoch": 1505} {"train_loss": -39.630733489990234, "global_step": 182219, "epoch": 1505} {"train_loss": -39.067970275878906, "global_step": 182220, "epoch": 1505} {"train_loss": -40.144775390625, "global_step": 182221, "epoch": 1505} {"train_loss": -39.08829879760742, "global_step": 182222, "epoch": 1505} {"train_loss": -39.615535736083984, "global_step": 182223, "epoch": 1505} {"train_loss": -40.190914154052734, "global_step": 182224, "epoch": 1505} {"train_loss": -39.68106425892223, "global_step": 182225, "epoch": 1505, "val_loss": 2655420.75} {"train_loss": -39.23131561279297, "global_step": 182226, "epoch": 1506} {"train_loss": -40.05259323120117, "global_step": 182227, "epoch": 1506} {"train_loss": -40.67341613769531, "global_step": 182228, "epoch": 1506} {"train_loss": -39.212642669677734, "global_step": 182229, "epoch": 1506} {"train_loss": -39.841636657714844, "global_step": 182230, "epoch": 1506} {"train_loss": -39.70859909057617, "global_step": 182231, "epoch": 1506} {"train_loss": -41.07807159423828, "global_step": 182232, "epoch": 1506} {"train_loss": -40.16051483154297, "global_step": 182233, "epoch": 1506} {"train_loss": -39.81217575073242, "global_step": 182234, "epoch": 1506} {"train_loss": -35.73037338256836, "global_step": 182235, "epoch": 1506} {"train_loss": -39.00166320800781, "global_step": 182236, "epoch": 1506} {"train_loss": -38.43719482421875, "global_step": 182237, "epoch": 1506} {"train_loss": -39.79021453857422, "global_step": 182238, "epoch": 1506} {"train_loss": -37.27657699584961, "global_step": 182239, "epoch": 1506} {"train_loss": -37.092193603515625, "global_step": 182240, "epoch": 1506} {"train_loss": -36.530052185058594, "global_step": 182241, "epoch": 1506} {"train_loss": -37.35426330566406, "global_step": 182242, "epoch": 1506} {"train_loss": -38.462093353271484, "global_step": 182243, "epoch": 1506} {"train_loss": -35.21898651123047, "global_step": 182244, "epoch": 1506} {"train_loss": -38.349891662597656, "global_step": 182245, "epoch": 1506} {"train_loss": -36.30493927001953, "global_step": 182246, "epoch": 1506} {"train_loss": -36.97245788574219, "global_step": 182247, "epoch": 1506} {"train_loss": -34.700008392333984, "global_step": 182248, "epoch": 1506} {"train_loss": -39.713417053222656, "global_step": 182249, "epoch": 1506} {"train_loss": -38.917259216308594, "global_step": 182250, "epoch": 1506} {"train_loss": -38.3506965637207, "global_step": 182251, "epoch": 1506} {"train_loss": -37.79728317260742, "global_step": 182252, "epoch": 1506} {"train_loss": -38.841495513916016, "global_step": 182253, "epoch": 1506} {"train_loss": -36.516109466552734, "global_step": 182254, "epoch": 1506} {"train_loss": -38.97468566894531, "global_step": 182255, "epoch": 1506} {"train_loss": -38.86332702636719, "global_step": 182256, "epoch": 1506} {"train_loss": -39.79448699951172, "global_step": 182257, "epoch": 1506} {"train_loss": -39.67409896850586, "global_step": 182258, "epoch": 1506} {"train_loss": -39.0802001953125, "global_step": 182259, "epoch": 1506} {"train_loss": -38.94343185424805, "global_step": 182260, "epoch": 1506} {"train_loss": -38.62786865234375, "global_step": 182261, "epoch": 1506} {"train_loss": -39.49467468261719, "global_step": 182262, "epoch": 1506} {"train_loss": -38.58891677856445, "global_step": 182263, "epoch": 1506} {"train_loss": -39.657169342041016, "global_step": 182264, "epoch": 1506} {"train_loss": -39.0813102722168, "global_step": 182265, "epoch": 1506} {"train_loss": -39.499298095703125, "global_step": 182266, "epoch": 1506} {"train_loss": -39.81669616699219, "global_step": 182267, "epoch": 1506} {"train_loss": -38.738372802734375, "global_step": 182268, "epoch": 1506} {"train_loss": -37.213314056396484, "global_step": 182269, "epoch": 1506} {"train_loss": -38.19596481323242, "global_step": 182270, "epoch": 1506} {"train_loss": -39.550113677978516, "global_step": 182271, "epoch": 1506} {"train_loss": -40.2647705078125, "global_step": 182272, "epoch": 1506} {"train_loss": -39.85628890991211, "global_step": 182273, "epoch": 1506} {"train_loss": -39.77156448364258, "global_step": 182274, "epoch": 1506} {"train_loss": -40.03607177734375, "global_step": 182275, "epoch": 1506} {"train_loss": -39.77760696411133, "global_step": 182276, "epoch": 1506} {"train_loss": -39.52241897583008, "global_step": 182277, "epoch": 1506} {"train_loss": -40.01957702636719, "global_step": 182278, "epoch": 1506} {"train_loss": -39.79036331176758, "global_step": 182279, "epoch": 1506} {"train_loss": -39.26327133178711, "global_step": 182280, "epoch": 1506} {"train_loss": -39.89937210083008, "global_step": 182281, "epoch": 1506} {"train_loss": -39.39965057373047, "global_step": 182282, "epoch": 1506} {"train_loss": -40.5509033203125, "global_step": 182283, "epoch": 1506} {"train_loss": -40.70338821411133, "global_step": 182284, "epoch": 1506} {"train_loss": -40.4657096862793, "global_step": 182285, "epoch": 1506} {"train_loss": -40.24857711791992, "global_step": 182286, "epoch": 1506} {"train_loss": -40.26777267456055, "global_step": 182287, "epoch": 1506} {"train_loss": -40.582191467285156, "global_step": 182288, "epoch": 1506} {"train_loss": -40.08308029174805, "global_step": 182289, "epoch": 1506} {"train_loss": -40.483154296875, "global_step": 182290, "epoch": 1506} {"train_loss": -38.80255889892578, "global_step": 182291, "epoch": 1506} {"train_loss": -39.644989013671875, "global_step": 182292, "epoch": 1506} {"train_loss": -40.2908935546875, "global_step": 182293, "epoch": 1506} {"train_loss": -40.17646408081055, "global_step": 182294, "epoch": 1506} {"train_loss": -39.68429946899414, "global_step": 182295, "epoch": 1506} {"train_loss": -39.86539840698242, "global_step": 182296, "epoch": 1506} {"train_loss": -40.3177490234375, "global_step": 182297, "epoch": 1506} {"train_loss": -40.441444396972656, "global_step": 182298, "epoch": 1506} {"train_loss": -40.50680160522461, "global_step": 182299, "epoch": 1506} {"train_loss": -39.58203887939453, "global_step": 182300, "epoch": 1506} {"train_loss": -39.55814743041992, "global_step": 182301, "epoch": 1506} {"train_loss": -39.74028396606445, "global_step": 182302, "epoch": 1506} {"train_loss": -40.163719177246094, "global_step": 182303, "epoch": 1506} {"train_loss": -38.95249938964844, "global_step": 182304, "epoch": 1506} {"train_loss": -40.88283157348633, "global_step": 182305, "epoch": 1506} {"train_loss": -40.63473129272461, "global_step": 182306, "epoch": 1506} {"train_loss": -40.50968551635742, "global_step": 182307, "epoch": 1506} {"train_loss": -39.80274963378906, "global_step": 182308, "epoch": 1506} {"train_loss": -40.36223602294922, "global_step": 182309, "epoch": 1506} {"train_loss": -39.87828063964844, "global_step": 182310, "epoch": 1506} {"train_loss": -40.52433395385742, "global_step": 182311, "epoch": 1506} {"train_loss": -39.9453010559082, "global_step": 182312, "epoch": 1506} {"train_loss": -39.98316192626953, "global_step": 182313, "epoch": 1506} {"train_loss": -39.96384811401367, "global_step": 182314, "epoch": 1506} {"train_loss": -40.06959533691406, "global_step": 182315, "epoch": 1506} {"train_loss": -39.646968841552734, "global_step": 182316, "epoch": 1506} {"train_loss": -40.30021667480469, "global_step": 182317, "epoch": 1506} {"train_loss": -40.196937561035156, "global_step": 182318, "epoch": 1506} {"train_loss": -39.69852828979492, "global_step": 182319, "epoch": 1506} {"train_loss": -40.75270080566406, "global_step": 182320, "epoch": 1506} {"train_loss": -40.64554977416992, "global_step": 182321, "epoch": 1506} {"train_loss": -38.7935791015625, "global_step": 182322, "epoch": 1506} {"train_loss": -40.11053466796875, "global_step": 182323, "epoch": 1506} {"train_loss": -39.89360427856445, "global_step": 182324, "epoch": 1506} {"train_loss": -40.14415740966797, "global_step": 182325, "epoch": 1506} {"train_loss": -40.80595016479492, "global_step": 182326, "epoch": 1506} {"train_loss": -39.74109649658203, "global_step": 182327, "epoch": 1506} {"train_loss": -40.29140090942383, "global_step": 182328, "epoch": 1506} {"train_loss": -39.963680267333984, "global_step": 182329, "epoch": 1506} {"train_loss": -40.700653076171875, "global_step": 182330, "epoch": 1506} {"train_loss": -39.25398635864258, "global_step": 182331, "epoch": 1506} {"train_loss": -39.59614944458008, "global_step": 182332, "epoch": 1506} {"train_loss": -40.15570831298828, "global_step": 182333, "epoch": 1506} {"train_loss": -39.46395492553711, "global_step": 182334, "epoch": 1506} {"train_loss": -39.742774963378906, "global_step": 182335, "epoch": 1506} {"train_loss": -40.87499237060547, "global_step": 182336, "epoch": 1506} {"train_loss": -39.99972152709961, "global_step": 182337, "epoch": 1506} {"train_loss": -40.33755874633789, "global_step": 182338, "epoch": 1506} {"train_loss": -40.05146026611328, "global_step": 182339, "epoch": 1506} {"train_loss": -39.69313049316406, "global_step": 182340, "epoch": 1506} {"train_loss": -40.78129959106445, "global_step": 182341, "epoch": 1506} {"train_loss": -39.91468048095703, "global_step": 182342, "epoch": 1506} {"train_loss": -41.4175910949707, "global_step": 182343, "epoch": 1506} {"train_loss": -39.797115325927734, "global_step": 182344, "epoch": 1506} {"train_loss": -40.50861740112305, "global_step": 182345, "epoch": 1506} {"train_loss": -39.50158521163562, "global_step": 182346, "epoch": 1506, "val_loss": 2583595.0} {"train_loss": -39.76789855957031, "global_step": 182347, "epoch": 1507} {"train_loss": -39.1113166809082, "global_step": 182348, "epoch": 1507} {"train_loss": -40.34444808959961, "global_step": 182349, "epoch": 1507} {"train_loss": -40.62483596801758, "global_step": 182350, "epoch": 1507} {"train_loss": -41.002891540527344, "global_step": 182351, "epoch": 1507} {"train_loss": -39.802425384521484, "global_step": 182352, "epoch": 1507} {"train_loss": -41.03989791870117, "global_step": 182353, "epoch": 1507} {"train_loss": -40.052284240722656, "global_step": 182354, "epoch": 1507} {"train_loss": -40.32400131225586, "global_step": 182355, "epoch": 1507} {"train_loss": -40.31064987182617, "global_step": 182356, "epoch": 1507} {"train_loss": -40.21566390991211, "global_step": 182357, "epoch": 1507} {"train_loss": -39.86769485473633, "global_step": 182358, "epoch": 1507} {"train_loss": -40.49020004272461, "global_step": 182359, "epoch": 1507} {"train_loss": -40.92900848388672, "global_step": 182360, "epoch": 1507} {"train_loss": -40.876495361328125, "global_step": 182361, "epoch": 1507} {"train_loss": -40.46320724487305, "global_step": 182362, "epoch": 1507} {"train_loss": -40.805843353271484, "global_step": 182363, "epoch": 1507} {"train_loss": -41.4637565612793, "global_step": 182364, "epoch": 1507} {"train_loss": -39.86069869995117, "global_step": 182365, "epoch": 1507} {"train_loss": -40.04867935180664, "global_step": 182366, "epoch": 1507} {"train_loss": -40.02549743652344, "global_step": 182367, "epoch": 1507} {"train_loss": -40.51240921020508, "global_step": 182368, "epoch": 1507} {"train_loss": -41.12112045288086, "global_step": 182369, "epoch": 1507} {"train_loss": -40.219139099121094, "global_step": 182370, "epoch": 1507} {"train_loss": -39.668556213378906, "global_step": 182371, "epoch": 1507} {"train_loss": -40.236183166503906, "global_step": 182372, "epoch": 1507} {"train_loss": -39.98627853393555, "global_step": 182373, "epoch": 1507} {"train_loss": -39.97395324707031, "global_step": 182374, "epoch": 1507} {"train_loss": -40.4948844909668, "global_step": 182375, "epoch": 1507} {"train_loss": -38.31879806518555, "global_step": 182376, "epoch": 1507} {"train_loss": -38.28322982788086, "global_step": 182377, "epoch": 1507} {"train_loss": -38.10334014892578, "global_step": 182378, "epoch": 1507} {"train_loss": -37.28239059448242, "global_step": 182379, "epoch": 1507} {"train_loss": -40.16131591796875, "global_step": 182380, "epoch": 1507} {"train_loss": -39.534358978271484, "global_step": 182381, "epoch": 1507} {"train_loss": -40.233665466308594, "global_step": 182382, "epoch": 1507} {"train_loss": -40.22468566894531, "global_step": 182383, "epoch": 1507} {"train_loss": -39.359310150146484, "global_step": 182384, "epoch": 1507} {"train_loss": -40.103485107421875, "global_step": 182385, "epoch": 1507} {"train_loss": -39.07394790649414, "global_step": 182386, "epoch": 1507} {"train_loss": -40.48347473144531, "global_step": 182387, "epoch": 1507} {"train_loss": -39.66854476928711, "global_step": 182388, "epoch": 1507} {"train_loss": -40.791500091552734, "global_step": 182389, "epoch": 1507} {"train_loss": -40.18381881713867, "global_step": 182390, "epoch": 1507} {"train_loss": -40.241737365722656, "global_step": 182391, "epoch": 1507} {"train_loss": -39.61226272583008, "global_step": 182392, "epoch": 1507} {"train_loss": -39.46874237060547, "global_step": 182393, "epoch": 1507} {"train_loss": -39.485042572021484, "global_step": 182394, "epoch": 1507} {"train_loss": -36.33837890625, "global_step": 182395, "epoch": 1507} {"train_loss": -39.70515060424805, "global_step": 182396, "epoch": 1507} {"train_loss": -38.423316955566406, "global_step": 182397, "epoch": 1507} {"train_loss": -40.02207565307617, "global_step": 182398, "epoch": 1507} {"train_loss": -40.161407470703125, "global_step": 182399, "epoch": 1507} {"train_loss": -39.966590881347656, "global_step": 182400, "epoch": 1507} {"train_loss": -38.8815803527832, "global_step": 182401, "epoch": 1507} {"train_loss": -40.580360412597656, "global_step": 182402, "epoch": 1507} {"train_loss": -38.838191986083984, "global_step": 182403, "epoch": 1507} {"train_loss": -40.564449310302734, "global_step": 182404, "epoch": 1507} {"train_loss": -40.17081832885742, "global_step": 182405, "epoch": 1507} {"train_loss": -39.94525146484375, "global_step": 182406, "epoch": 1507} {"train_loss": -39.82258224487305, "global_step": 182407, "epoch": 1507} {"train_loss": -38.02729415893555, "global_step": 182408, "epoch": 1507} {"train_loss": -39.93264389038086, "global_step": 182409, "epoch": 1507} {"train_loss": -38.63859176635742, "global_step": 182410, "epoch": 1507} {"train_loss": -40.38711166381836, "global_step": 182411, "epoch": 1507} {"train_loss": -39.16022872924805, "global_step": 182412, "epoch": 1507} {"train_loss": -40.74463653564453, "global_step": 182413, "epoch": 1507} {"train_loss": -38.622657775878906, "global_step": 182414, "epoch": 1507} {"train_loss": -39.61135482788086, "global_step": 182415, "epoch": 1507} {"train_loss": -39.07170486450195, "global_step": 182416, "epoch": 1507} {"train_loss": -39.81034851074219, "global_step": 182417, "epoch": 1507} {"train_loss": -39.57404327392578, "global_step": 182418, "epoch": 1507} {"train_loss": -39.44514846801758, "global_step": 182419, "epoch": 1507} {"train_loss": -40.3829231262207, "global_step": 182420, "epoch": 1507} {"train_loss": -39.501461029052734, "global_step": 182421, "epoch": 1507} {"train_loss": -40.03048324584961, "global_step": 182422, "epoch": 1507} {"train_loss": -39.32587814331055, "global_step": 182423, "epoch": 1507} {"train_loss": -40.80116653442383, "global_step": 182424, "epoch": 1507} {"train_loss": -40.261695861816406, "global_step": 182425, "epoch": 1507} {"train_loss": -39.98131561279297, "global_step": 182426, "epoch": 1507} {"train_loss": -40.303646087646484, "global_step": 182427, "epoch": 1507} {"train_loss": -40.69856262207031, "global_step": 182428, "epoch": 1507} {"train_loss": -40.499603271484375, "global_step": 182429, "epoch": 1507} {"train_loss": -39.489601135253906, "global_step": 182430, "epoch": 1507} {"train_loss": -41.601654052734375, "global_step": 182431, "epoch": 1507} {"train_loss": -40.66996383666992, "global_step": 182432, "epoch": 1507} {"train_loss": -40.609745025634766, "global_step": 182433, "epoch": 1507} {"train_loss": -40.35160827636719, "global_step": 182434, "epoch": 1507} {"train_loss": -41.24439239501953, "global_step": 182435, "epoch": 1507} {"train_loss": -41.200294494628906, "global_step": 182436, "epoch": 1507} {"train_loss": -40.95756149291992, "global_step": 182437, "epoch": 1507} {"train_loss": -40.75265884399414, "global_step": 182438, "epoch": 1507} {"train_loss": -41.15532302856445, "global_step": 182439, "epoch": 1507} {"train_loss": -41.094032287597656, "global_step": 182440, "epoch": 1507} {"train_loss": -39.708831787109375, "global_step": 182441, "epoch": 1507} {"train_loss": -41.27385330200195, "global_step": 182442, "epoch": 1507} {"train_loss": -40.731842041015625, "global_step": 182443, "epoch": 1507} {"train_loss": -40.400108337402344, "global_step": 182444, "epoch": 1507} {"train_loss": -41.28449249267578, "global_step": 182445, "epoch": 1507} {"train_loss": -41.0010871887207, "global_step": 182446, "epoch": 1507} {"train_loss": -41.65755081176758, "global_step": 182447, "epoch": 1507} {"train_loss": -39.458621978759766, "global_step": 182448, "epoch": 1507} {"train_loss": -40.45791244506836, "global_step": 182449, "epoch": 1507} {"train_loss": -40.72329330444336, "global_step": 182450, "epoch": 1507} {"train_loss": -40.7888298034668, "global_step": 182451, "epoch": 1507} {"train_loss": -41.539527893066406, "global_step": 182452, "epoch": 1507} {"train_loss": -40.83579635620117, "global_step": 182453, "epoch": 1507} {"train_loss": -38.237632751464844, "global_step": 182454, "epoch": 1507} {"train_loss": -41.158721923828125, "global_step": 182455, "epoch": 1507} {"train_loss": -40.89186096191406, "global_step": 182456, "epoch": 1507} {"train_loss": -40.61513900756836, "global_step": 182457, "epoch": 1507} {"train_loss": -40.794921875, "global_step": 182458, "epoch": 1507} {"train_loss": -41.48269271850586, "global_step": 182459, "epoch": 1507} {"train_loss": -40.946258544921875, "global_step": 182460, "epoch": 1507} {"train_loss": -41.12519073486328, "global_step": 182461, "epoch": 1507} {"train_loss": -40.743038177490234, "global_step": 182462, "epoch": 1507} {"train_loss": -40.60002517700195, "global_step": 182463, "epoch": 1507} {"train_loss": -41.32492446899414, "global_step": 182464, "epoch": 1507} {"train_loss": -41.26599884033203, "global_step": 182465, "epoch": 1507} {"train_loss": -40.8863525390625, "global_step": 182466, "epoch": 1507} {"train_loss": -40.14248244230412, "global_step": 182467, "epoch": 1507, "val_loss": 2833879.0} {"train_loss": -40.099464416503906, "global_step": 182468, "epoch": 1508} {"train_loss": -36.858367919921875, "global_step": 182469, "epoch": 1508} {"train_loss": -39.28609848022461, "global_step": 182470, "epoch": 1508} {"train_loss": -40.06367111206055, "global_step": 182471, "epoch": 1508} {"train_loss": -40.267555236816406, "global_step": 182472, "epoch": 1508} {"train_loss": -40.88445281982422, "global_step": 182473, "epoch": 1508} {"train_loss": -38.949188232421875, "global_step": 182474, "epoch": 1508} {"train_loss": -37.89437484741211, "global_step": 182475, "epoch": 1508} {"train_loss": -38.182308197021484, "global_step": 182476, "epoch": 1508} {"train_loss": -39.80354690551758, "global_step": 182477, "epoch": 1508} {"train_loss": -38.74061584472656, "global_step": 182478, "epoch": 1508} {"train_loss": -38.9570426940918, "global_step": 182479, "epoch": 1508} {"train_loss": -40.42081832885742, "global_step": 182480, "epoch": 1508} {"train_loss": -35.54618453979492, "global_step": 182481, "epoch": 1508} {"train_loss": -37.80207443237305, "global_step": 182482, "epoch": 1508} {"train_loss": -38.8975830078125, "global_step": 182483, "epoch": 1508} {"train_loss": -40.83737564086914, "global_step": 182484, "epoch": 1508} {"train_loss": -40.65974807739258, "global_step": 182485, "epoch": 1508} {"train_loss": -40.90072250366211, "global_step": 182486, "epoch": 1508} {"train_loss": -39.69985580444336, "global_step": 182487, "epoch": 1508} {"train_loss": -38.13616943359375, "global_step": 182488, "epoch": 1508} {"train_loss": -39.59981155395508, "global_step": 182489, "epoch": 1508} {"train_loss": -38.793731689453125, "global_step": 182490, "epoch": 1508} {"train_loss": -36.36756896972656, "global_step": 182491, "epoch": 1508} {"train_loss": -37.22893142700195, "global_step": 182492, "epoch": 1508} {"train_loss": -38.353939056396484, "global_step": 182493, "epoch": 1508} {"train_loss": -38.81202697753906, "global_step": 182494, "epoch": 1508} {"train_loss": -35.03450393676758, "global_step": 182495, "epoch": 1508} {"train_loss": -38.25371170043945, "global_step": 182496, "epoch": 1508} {"train_loss": -39.46323776245117, "global_step": 182497, "epoch": 1508} {"train_loss": -39.693172454833984, "global_step": 182498, "epoch": 1508} {"train_loss": -36.778011322021484, "global_step": 182499, "epoch": 1508} {"train_loss": -38.994361877441406, "global_step": 182500, "epoch": 1508} {"train_loss": -40.480438232421875, "global_step": 182501, "epoch": 1508} {"train_loss": -37.939945220947266, "global_step": 182502, "epoch": 1508} {"train_loss": -36.699764251708984, "global_step": 182503, "epoch": 1508} {"train_loss": -37.5145263671875, "global_step": 182504, "epoch": 1508} {"train_loss": -39.22388458251953, "global_step": 182505, "epoch": 1508} {"train_loss": -37.51304626464844, "global_step": 182506, "epoch": 1508} {"train_loss": -38.88399887084961, "global_step": 182507, "epoch": 1508} {"train_loss": -37.12852096557617, "global_step": 182508, "epoch": 1508} {"train_loss": -35.40968704223633, "global_step": 182509, "epoch": 1508} {"train_loss": -38.676605224609375, "global_step": 182510, "epoch": 1508} {"train_loss": -39.31698226928711, "global_step": 182511, "epoch": 1508} {"train_loss": -37.65436935424805, "global_step": 182512, "epoch": 1508} {"train_loss": -38.65614700317383, "global_step": 182513, "epoch": 1508} {"train_loss": -34.81734848022461, "global_step": 182514, "epoch": 1508} {"train_loss": -39.234859466552734, "global_step": 182515, "epoch": 1508} {"train_loss": -38.51301193237305, "global_step": 182516, "epoch": 1508} {"train_loss": -37.866703033447266, "global_step": 182517, "epoch": 1508} {"train_loss": -39.02842712402344, "global_step": 182518, "epoch": 1508} {"train_loss": -39.90324020385742, "global_step": 182519, "epoch": 1508} {"train_loss": -39.42011642456055, "global_step": 182520, "epoch": 1508} {"train_loss": -38.353599548339844, "global_step": 182521, "epoch": 1508} {"train_loss": -39.30459213256836, "global_step": 182522, "epoch": 1508} {"train_loss": -37.135860443115234, "global_step": 182523, "epoch": 1508} {"train_loss": -39.62012481689453, "global_step": 182524, "epoch": 1508} {"train_loss": -39.19694519042969, "global_step": 182525, "epoch": 1508} {"train_loss": -39.74334716796875, "global_step": 182526, "epoch": 1508} {"train_loss": -39.29113006591797, "global_step": 182527, "epoch": 1508} {"train_loss": -39.94057846069336, "global_step": 182528, "epoch": 1508} {"train_loss": -40.367652893066406, "global_step": 182529, "epoch": 1508} {"train_loss": -40.079620361328125, "global_step": 182530, "epoch": 1508} {"train_loss": -38.76961135864258, "global_step": 182531, "epoch": 1508} {"train_loss": -39.5395622253418, "global_step": 182532, "epoch": 1508} {"train_loss": -39.412139892578125, "global_step": 182533, "epoch": 1508} {"train_loss": -38.501583099365234, "global_step": 182534, "epoch": 1508} {"train_loss": -39.64622497558594, "global_step": 182535, "epoch": 1508} {"train_loss": -39.76322555541992, "global_step": 182536, "epoch": 1508} {"train_loss": -39.78619384765625, "global_step": 182537, "epoch": 1508} {"train_loss": -40.56169509887695, "global_step": 182538, "epoch": 1508} {"train_loss": -40.33633041381836, "global_step": 182539, "epoch": 1508} {"train_loss": -40.385475158691406, "global_step": 182540, "epoch": 1508} {"train_loss": -40.124671936035156, "global_step": 182541, "epoch": 1508} {"train_loss": -39.60000228881836, "global_step": 182542, "epoch": 1508} {"train_loss": -39.630714416503906, "global_step": 182543, "epoch": 1508} {"train_loss": -40.4898567199707, "global_step": 182544, "epoch": 1508} {"train_loss": -40.812198638916016, "global_step": 182545, "epoch": 1508} {"train_loss": -40.23213195800781, "global_step": 182546, "epoch": 1508} {"train_loss": -40.187744140625, "global_step": 182547, "epoch": 1508} {"train_loss": -41.061248779296875, "global_step": 182548, "epoch": 1508} {"train_loss": -40.67780303955078, "global_step": 182549, "epoch": 1508} {"train_loss": -40.59701156616211, "global_step": 182550, "epoch": 1508} {"train_loss": -39.60788345336914, "global_step": 182551, "epoch": 1508} {"train_loss": -41.31210708618164, "global_step": 182552, "epoch": 1508} {"train_loss": -40.807586669921875, "global_step": 182553, "epoch": 1508} {"train_loss": -39.279258728027344, "global_step": 182554, "epoch": 1508} {"train_loss": -39.68500900268555, "global_step": 182555, "epoch": 1508} {"train_loss": -40.3270149230957, "global_step": 182556, "epoch": 1508} {"train_loss": -41.15886688232422, "global_step": 182557, "epoch": 1508} {"train_loss": -40.83526611328125, "global_step": 182558, "epoch": 1508} {"train_loss": -39.612300872802734, "global_step": 182559, "epoch": 1508} {"train_loss": -40.6526985168457, "global_step": 182560, "epoch": 1508} {"train_loss": -40.715728759765625, "global_step": 182561, "epoch": 1508} {"train_loss": -40.427669525146484, "global_step": 182562, "epoch": 1508} {"train_loss": -40.47169876098633, "global_step": 182563, "epoch": 1508} {"train_loss": -40.48820114135742, "global_step": 182564, "epoch": 1508} {"train_loss": -39.84407424926758, "global_step": 182565, "epoch": 1508} {"train_loss": -40.48843002319336, "global_step": 182566, "epoch": 1508} {"train_loss": -41.08980941772461, "global_step": 182567, "epoch": 1508} {"train_loss": -41.23337936401367, "global_step": 182568, "epoch": 1508} {"train_loss": -40.06584548950195, "global_step": 182569, "epoch": 1508} {"train_loss": -40.73289108276367, "global_step": 182570, "epoch": 1508} {"train_loss": -41.23531723022461, "global_step": 182571, "epoch": 1508} {"train_loss": -40.36978530883789, "global_step": 182572, "epoch": 1508} {"train_loss": -39.850860595703125, "global_step": 182573, "epoch": 1508} {"train_loss": -40.86933517456055, "global_step": 182574, "epoch": 1508} {"train_loss": -39.8304443359375, "global_step": 182575, "epoch": 1508} {"train_loss": -39.70463943481445, "global_step": 182576, "epoch": 1508} {"train_loss": -38.44623947143555, "global_step": 182577, "epoch": 1508} {"train_loss": -40.70048141479492, "global_step": 182578, "epoch": 1508} {"train_loss": -40.365501403808594, "global_step": 182579, "epoch": 1508} {"train_loss": -38.99072265625, "global_step": 182580, "epoch": 1508} {"train_loss": -39.85654067993164, "global_step": 182581, "epoch": 1508} {"train_loss": -40.063655853271484, "global_step": 182582, "epoch": 1508} {"train_loss": -38.38711166381836, "global_step": 182583, "epoch": 1508} {"train_loss": -39.3551139831543, "global_step": 182584, "epoch": 1508} {"train_loss": -39.7269287109375, "global_step": 182585, "epoch": 1508} {"train_loss": -38.764713287353516, "global_step": 182586, "epoch": 1508} {"train_loss": -38.0042724609375, "global_step": 182587, "epoch": 1508} {"train_loss": -39.3086331580296, "global_step": 182588, "epoch": 1508, "val_loss": 2727684.25} {"train_loss": -38.26778793334961, "global_step": 182589, "epoch": 1509} {"train_loss": -39.799678802490234, "global_step": 182590, "epoch": 1509} {"train_loss": -35.552345275878906, "global_step": 182591, "epoch": 1509} {"train_loss": -31.538904190063477, "global_step": 182592, "epoch": 1509} {"train_loss": -32.034523010253906, "global_step": 182593, "epoch": 1509} {"train_loss": -39.62636947631836, "global_step": 182594, "epoch": 1509} {"train_loss": -38.36207962036133, "global_step": 182595, "epoch": 1509} {"train_loss": -37.46470642089844, "global_step": 182596, "epoch": 1509} {"train_loss": -40.49480438232422, "global_step": 182597, "epoch": 1509} {"train_loss": -39.383358001708984, "global_step": 182598, "epoch": 1509} {"train_loss": -40.193946838378906, "global_step": 182599, "epoch": 1509} {"train_loss": -39.408111572265625, "global_step": 182600, "epoch": 1509} {"train_loss": -38.866790771484375, "global_step": 182601, "epoch": 1509} {"train_loss": -39.90034484863281, "global_step": 182602, "epoch": 1509} {"train_loss": -39.03181838989258, "global_step": 182603, "epoch": 1509} {"train_loss": -40.514976501464844, "global_step": 182604, "epoch": 1509} {"train_loss": -39.97462844848633, "global_step": 182605, "epoch": 1509} {"train_loss": -39.44677734375, "global_step": 182606, "epoch": 1509} {"train_loss": -40.005435943603516, "global_step": 182607, "epoch": 1509} {"train_loss": -40.672203063964844, "global_step": 182608, "epoch": 1509} {"train_loss": -40.211280822753906, "global_step": 182609, "epoch": 1509} {"train_loss": -40.160213470458984, "global_step": 182610, "epoch": 1509} {"train_loss": -40.325767517089844, "global_step": 182611, "epoch": 1509} {"train_loss": -41.21232986450195, "global_step": 182612, "epoch": 1509} {"train_loss": -40.74058151245117, "global_step": 182613, "epoch": 1509} {"train_loss": -39.48183822631836, "global_step": 182614, "epoch": 1509} {"train_loss": -40.39219284057617, "global_step": 182615, "epoch": 1509} {"train_loss": -40.371009826660156, "global_step": 182616, "epoch": 1509} {"train_loss": -41.35679244995117, "global_step": 182617, "epoch": 1509} {"train_loss": -40.821590423583984, "global_step": 182618, "epoch": 1509} {"train_loss": -41.389244079589844, "global_step": 182619, "epoch": 1509} {"train_loss": -40.93876266479492, "global_step": 182620, "epoch": 1509} {"train_loss": -41.01676559448242, "global_step": 182621, "epoch": 1509} {"train_loss": -41.122127532958984, "global_step": 182622, "epoch": 1509} {"train_loss": -41.456783294677734, "global_step": 182623, "epoch": 1509} {"train_loss": -39.81965255737305, "global_step": 182624, "epoch": 1509} {"train_loss": -41.455814361572266, "global_step": 182625, "epoch": 1509} {"train_loss": -40.501853942871094, "global_step": 182626, "epoch": 1509} {"train_loss": -41.41746139526367, "global_step": 182627, "epoch": 1509} {"train_loss": -41.5025749206543, "global_step": 182628, "epoch": 1509} {"train_loss": -41.69247055053711, "global_step": 182629, "epoch": 1509} {"train_loss": -39.8320426940918, "global_step": 182630, "epoch": 1509} {"train_loss": -41.28239059448242, "global_step": 182631, "epoch": 1509} {"train_loss": -41.4628791809082, "global_step": 182632, "epoch": 1509} {"train_loss": -41.240745544433594, "global_step": 182633, "epoch": 1509} {"train_loss": -41.07709884643555, "global_step": 182634, "epoch": 1509} {"train_loss": -40.411197662353516, "global_step": 182635, "epoch": 1509} {"train_loss": -40.66501998901367, "global_step": 182636, "epoch": 1509} {"train_loss": -41.37036895751953, "global_step": 182637, "epoch": 1509} {"train_loss": -41.30180740356445, "global_step": 182638, "epoch": 1509} {"train_loss": -41.4473991394043, "global_step": 182639, "epoch": 1509} {"train_loss": -41.53561019897461, "global_step": 182640, "epoch": 1509} {"train_loss": -40.6501350402832, "global_step": 182641, "epoch": 1509} {"train_loss": -41.0756721496582, "global_step": 182642, "epoch": 1509} {"train_loss": -41.789817810058594, "global_step": 182643, "epoch": 1509} {"train_loss": -40.897647857666016, "global_step": 182644, "epoch": 1509} {"train_loss": -40.87112045288086, "global_step": 182645, "epoch": 1509} {"train_loss": -41.93777847290039, "global_step": 182646, "epoch": 1509} {"train_loss": -41.518184661865234, "global_step": 182647, "epoch": 1509} {"train_loss": -41.31508255004883, "global_step": 182648, "epoch": 1509} {"train_loss": -40.002437591552734, "global_step": 182649, "epoch": 1509} {"train_loss": -41.05170822143555, "global_step": 182650, "epoch": 1509} {"train_loss": -41.470943450927734, "global_step": 182651, "epoch": 1509} {"train_loss": -40.046287536621094, "global_step": 182652, "epoch": 1509} {"train_loss": -40.6850700378418, "global_step": 182653, "epoch": 1509} {"train_loss": -39.504432678222656, "global_step": 182654, "epoch": 1509} {"train_loss": -41.74402618408203, "global_step": 182655, "epoch": 1509} {"train_loss": -40.65760803222656, "global_step": 182656, "epoch": 1509} {"train_loss": -40.86372756958008, "global_step": 182657, "epoch": 1509} {"train_loss": -39.2238883972168, "global_step": 182658, "epoch": 1509} {"train_loss": -39.25069808959961, "global_step": 182659, "epoch": 1509} {"train_loss": -38.747840881347656, "global_step": 182660, "epoch": 1509} {"train_loss": -35.660194396972656, "global_step": 182661, "epoch": 1509} {"train_loss": -34.221065521240234, "global_step": 182662, "epoch": 1509} {"train_loss": -35.60238265991211, "global_step": 182663, "epoch": 1509} {"train_loss": -32.945133209228516, "global_step": 182664, "epoch": 1509} {"train_loss": -32.268489837646484, "global_step": 182665, "epoch": 1509} {"train_loss": -36.906612396240234, "global_step": 182666, "epoch": 1509} {"train_loss": -35.48710250854492, "global_step": 182667, "epoch": 1509} {"train_loss": -38.83245086669922, "global_step": 182668, "epoch": 1509} {"train_loss": -36.37937545776367, "global_step": 182669, "epoch": 1509} {"train_loss": -28.68985939025879, "global_step": 182670, "epoch": 1509} {"train_loss": -31.06855583190918, "global_step": 182671, "epoch": 1509} {"train_loss": -34.71798324584961, "global_step": 182672, "epoch": 1509} {"train_loss": -32.30817413330078, "global_step": 182673, "epoch": 1509} {"train_loss": -38.35239791870117, "global_step": 182674, "epoch": 1509} {"train_loss": -32.4646110534668, "global_step": 182675, "epoch": 1509} {"train_loss": -37.797698974609375, "global_step": 182676, "epoch": 1509} {"train_loss": -37.00568771362305, "global_step": 182677, "epoch": 1509} {"train_loss": -36.145530700683594, "global_step": 182678, "epoch": 1509} {"train_loss": -31.38722038269043, "global_step": 182679, "epoch": 1509} {"train_loss": -36.517269134521484, "global_step": 182680, "epoch": 1509} {"train_loss": -37.5731315612793, "global_step": 182681, "epoch": 1509} {"train_loss": -37.43343734741211, "global_step": 182682, "epoch": 1509} {"train_loss": -37.87961196899414, "global_step": 182683, "epoch": 1509} {"train_loss": -38.040306091308594, "global_step": 182684, "epoch": 1509} {"train_loss": -37.9021110534668, "global_step": 182685, "epoch": 1509} {"train_loss": -38.17258071899414, "global_step": 182686, "epoch": 1509} {"train_loss": -37.40218734741211, "global_step": 182687, "epoch": 1509} {"train_loss": -38.9348030090332, "global_step": 182688, "epoch": 1509} {"train_loss": -37.318328857421875, "global_step": 182689, "epoch": 1509} {"train_loss": -39.06982421875, "global_step": 182690, "epoch": 1509} {"train_loss": -36.92812728881836, "global_step": 182691, "epoch": 1509} {"train_loss": -39.0404167175293, "global_step": 182692, "epoch": 1509} {"train_loss": -38.91652297973633, "global_step": 182693, "epoch": 1509} {"train_loss": -39.2822380065918, "global_step": 182694, "epoch": 1509} {"train_loss": -37.54703903198242, "global_step": 182695, "epoch": 1509} {"train_loss": -39.15135192871094, "global_step": 182696, "epoch": 1509} {"train_loss": -39.492305755615234, "global_step": 182697, "epoch": 1509} {"train_loss": -36.08362579345703, "global_step": 182698, "epoch": 1509} {"train_loss": -38.13905334472656, "global_step": 182699, "epoch": 1509} {"train_loss": -39.36246871948242, "global_step": 182700, "epoch": 1509} {"train_loss": -39.06293487548828, "global_step": 182701, "epoch": 1509} {"train_loss": -39.33729934692383, "global_step": 182702, "epoch": 1509} {"train_loss": -39.581729888916016, "global_step": 182703, "epoch": 1509} {"train_loss": -39.55907440185547, "global_step": 182704, "epoch": 1509} {"train_loss": -39.06780242919922, "global_step": 182705, "epoch": 1509} {"train_loss": -38.037593841552734, "global_step": 182706, "epoch": 1509} {"train_loss": -39.40863037109375, "global_step": 182707, "epoch": 1509} {"train_loss": -39.28066635131836, "global_step": 182708, "epoch": 1509} {"train_loss": -38.873695688799394, "global_step": 182709, "epoch": 1509, "val_loss": 2601003.0} {"train_loss": -39.374942779541016, "global_step": 182710, "epoch": 1510} {"train_loss": -40.0308952331543, "global_step": 182711, "epoch": 1510} {"train_loss": -39.03251647949219, "global_step": 182712, "epoch": 1510} {"train_loss": -39.27501678466797, "global_step": 182713, "epoch": 1510} {"train_loss": -39.974918365478516, "global_step": 182714, "epoch": 1510} {"train_loss": -39.81950759887695, "global_step": 182715, "epoch": 1510} {"train_loss": -39.025630950927734, "global_step": 182716, "epoch": 1510} {"train_loss": -39.80855941772461, "global_step": 182717, "epoch": 1510} {"train_loss": -40.31599044799805, "global_step": 182718, "epoch": 1510} {"train_loss": -39.82304000854492, "global_step": 182719, "epoch": 1510} {"train_loss": -40.2298583984375, "global_step": 182720, "epoch": 1510} {"train_loss": -39.293251037597656, "global_step": 182721, "epoch": 1510} {"train_loss": -40.361305236816406, "global_step": 182722, "epoch": 1510} {"train_loss": -40.13424301147461, "global_step": 182723, "epoch": 1510} {"train_loss": -40.608760833740234, "global_step": 182724, "epoch": 1510} {"train_loss": -39.56842041015625, "global_step": 182725, "epoch": 1510} {"train_loss": -41.081844329833984, "global_step": 182726, "epoch": 1510} {"train_loss": -39.12175369262695, "global_step": 182727, "epoch": 1510} {"train_loss": -39.99359130859375, "global_step": 182728, "epoch": 1510} {"train_loss": -39.9759521484375, "global_step": 182729, "epoch": 1510} {"train_loss": -40.531959533691406, "global_step": 182730, "epoch": 1510} {"train_loss": -39.209224700927734, "global_step": 182731, "epoch": 1510} {"train_loss": -41.00483322143555, "global_step": 182732, "epoch": 1510} {"train_loss": -40.84479522705078, "global_step": 182733, "epoch": 1510} {"train_loss": -40.79091262817383, "global_step": 182734, "epoch": 1510} {"train_loss": -40.96614456176758, "global_step": 182735, "epoch": 1510} {"train_loss": -40.60989761352539, "global_step": 182736, "epoch": 1510} {"train_loss": -41.454559326171875, "global_step": 182737, "epoch": 1510} {"train_loss": -40.321983337402344, "global_step": 182738, "epoch": 1510} {"train_loss": -41.03620910644531, "global_step": 182739, "epoch": 1510} {"train_loss": -40.629730224609375, "global_step": 182740, "epoch": 1510} {"train_loss": -40.6660270690918, "global_step": 182741, "epoch": 1510} {"train_loss": -40.02985763549805, "global_step": 182742, "epoch": 1510} {"train_loss": -40.1289176940918, "global_step": 182743, "epoch": 1510} {"train_loss": -40.63407516479492, "global_step": 182744, "epoch": 1510} {"train_loss": -40.49219512939453, "global_step": 182745, "epoch": 1510} {"train_loss": -40.58256912231445, "global_step": 182746, "epoch": 1510} {"train_loss": -40.69865036010742, "global_step": 182747, "epoch": 1510} {"train_loss": -40.47846603393555, "global_step": 182748, "epoch": 1510} {"train_loss": -41.098976135253906, "global_step": 182749, "epoch": 1510} {"train_loss": -41.24811935424805, "global_step": 182750, "epoch": 1510} {"train_loss": -40.98854064941406, "global_step": 182751, "epoch": 1510} {"train_loss": -41.228118896484375, "global_step": 182752, "epoch": 1510} {"train_loss": -41.15317916870117, "global_step": 182753, "epoch": 1510} {"train_loss": -41.037506103515625, "global_step": 182754, "epoch": 1510} {"train_loss": -41.60307312011719, "global_step": 182755, "epoch": 1510} {"train_loss": -41.56898880004883, "global_step": 182756, "epoch": 1510} {"train_loss": -41.444576263427734, "global_step": 182757, "epoch": 1510} {"train_loss": -41.43891525268555, "global_step": 182758, "epoch": 1510} {"train_loss": -41.58910369873047, "global_step": 182759, "epoch": 1510} {"train_loss": -39.882564544677734, "global_step": 182760, "epoch": 1510} {"train_loss": -39.60790252685547, "global_step": 182761, "epoch": 1510} {"train_loss": -41.46446228027344, "global_step": 182762, "epoch": 1510} {"train_loss": -41.662601470947266, "global_step": 182763, "epoch": 1510} {"train_loss": -40.384002685546875, "global_step": 182764, "epoch": 1510} {"train_loss": -40.8573112487793, "global_step": 182765, "epoch": 1510} {"train_loss": -41.2547721862793, "global_step": 182766, "epoch": 1510} {"train_loss": -41.4150390625, "global_step": 182767, "epoch": 1510} {"train_loss": -40.94001007080078, "global_step": 182768, "epoch": 1510} {"train_loss": -40.569091796875, "global_step": 182769, "epoch": 1510} {"train_loss": -40.969730377197266, "global_step": 182770, "epoch": 1510} {"train_loss": -41.25151443481445, "global_step": 182771, "epoch": 1510} {"train_loss": -41.12582015991211, "global_step": 182772, "epoch": 1510} {"train_loss": -41.682403564453125, "global_step": 182773, "epoch": 1510} {"train_loss": -40.93019485473633, "global_step": 182774, "epoch": 1510} {"train_loss": -41.40009307861328, "global_step": 182775, "epoch": 1510} {"train_loss": -41.42477035522461, "global_step": 182776, "epoch": 1510} {"train_loss": -40.805885314941406, "global_step": 182777, "epoch": 1510} {"train_loss": -41.99843978881836, "global_step": 182778, "epoch": 1510} {"train_loss": -40.57429122924805, "global_step": 182779, "epoch": 1510} {"train_loss": -41.52177429199219, "global_step": 182780, "epoch": 1510} {"train_loss": -41.18140411376953, "global_step": 182781, "epoch": 1510} {"train_loss": -40.987789154052734, "global_step": 182782, "epoch": 1510} {"train_loss": -40.980865478515625, "global_step": 182783, "epoch": 1510} {"train_loss": -41.17491912841797, "global_step": 182784, "epoch": 1510} {"train_loss": -41.45180892944336, "global_step": 182785, "epoch": 1510} {"train_loss": -41.86082077026367, "global_step": 182786, "epoch": 1510} {"train_loss": -40.93709945678711, "global_step": 182787, "epoch": 1510} {"train_loss": -39.18622970581055, "global_step": 182788, "epoch": 1510} {"train_loss": -40.86564254760742, "global_step": 182789, "epoch": 1510} {"train_loss": -41.64443588256836, "global_step": 182790, "epoch": 1510} {"train_loss": -40.737510681152344, "global_step": 182791, "epoch": 1510} {"train_loss": -41.27183532714844, "global_step": 182792, "epoch": 1510} {"train_loss": -41.37890625, "global_step": 182793, "epoch": 1510} {"train_loss": -40.559078216552734, "global_step": 182794, "epoch": 1510} {"train_loss": -39.80096435546875, "global_step": 182795, "epoch": 1510} {"train_loss": -40.2241325378418, "global_step": 182796, "epoch": 1510} {"train_loss": -40.40132522583008, "global_step": 182797, "epoch": 1510} {"train_loss": -40.912628173828125, "global_step": 182798, "epoch": 1510} {"train_loss": -40.96651077270508, "global_step": 182799, "epoch": 1510} {"train_loss": -38.89266586303711, "global_step": 182800, "epoch": 1510} {"train_loss": -39.14031982421875, "global_step": 182801, "epoch": 1510} {"train_loss": -35.9479866027832, "global_step": 182802, "epoch": 1510} {"train_loss": -26.7973690032959, "global_step": 182803, "epoch": 1510} {"train_loss": -18.41170310974121, "global_step": 182804, "epoch": 1510} {"train_loss": -14.414410591125488, "global_step": 182805, "epoch": 1510} {"train_loss": -37.06585693359375, "global_step": 182806, "epoch": 1510} {"train_loss": -29.895261764526367, "global_step": 182807, "epoch": 1510} {"train_loss": -33.176246643066406, "global_step": 182808, "epoch": 1510} {"train_loss": -31.92498779296875, "global_step": 182809, "epoch": 1510} {"train_loss": -35.0986442565918, "global_step": 182810, "epoch": 1510} {"train_loss": -33.39399337768555, "global_step": 182811, "epoch": 1510} {"train_loss": -37.85385513305664, "global_step": 182812, "epoch": 1510} {"train_loss": -33.53071975708008, "global_step": 182813, "epoch": 1510} {"train_loss": -36.9847526550293, "global_step": 182814, "epoch": 1510} {"train_loss": -35.58757019042969, "global_step": 182815, "epoch": 1510} {"train_loss": -33.544166564941406, "global_step": 182816, "epoch": 1510} {"train_loss": -37.83476638793945, "global_step": 182817, "epoch": 1510} {"train_loss": -33.604305267333984, "global_step": 182818, "epoch": 1510} {"train_loss": -37.768245697021484, "global_step": 182819, "epoch": 1510} {"train_loss": -35.302703857421875, "global_step": 182820, "epoch": 1510} {"train_loss": -35.6679573059082, "global_step": 182821, "epoch": 1510} {"train_loss": -36.01611328125, "global_step": 182822, "epoch": 1510} {"train_loss": -38.911773681640625, "global_step": 182823, "epoch": 1510} {"train_loss": -36.753849029541016, "global_step": 182824, "epoch": 1510} {"train_loss": -36.69668960571289, "global_step": 182825, "epoch": 1510} {"train_loss": -38.360286712646484, "global_step": 182826, "epoch": 1510} {"train_loss": -37.27975082397461, "global_step": 182827, "epoch": 1510} {"train_loss": -37.85179901123047, "global_step": 182828, "epoch": 1510} {"train_loss": -39.3862190246582, "global_step": 182829, "epoch": 1510} {"train_loss": -39.106106931513004, "global_step": 182830, "epoch": 1510, "val_loss": 2583456.75} {"train_loss": -36.69752883911133, "global_step": 182831, "epoch": 1511} {"train_loss": -39.077945709228516, "global_step": 182832, "epoch": 1511} {"train_loss": -39.02942657470703, "global_step": 182833, "epoch": 1511} {"train_loss": -38.80378723144531, "global_step": 182834, "epoch": 1511} {"train_loss": -39.23681640625, "global_step": 182835, "epoch": 1511} {"train_loss": -39.120643615722656, "global_step": 182836, "epoch": 1511} {"train_loss": -38.58441925048828, "global_step": 182837, "epoch": 1511} {"train_loss": -38.87583541870117, "global_step": 182838, "epoch": 1511} {"train_loss": -38.76401138305664, "global_step": 182839, "epoch": 1511} {"train_loss": -38.81415557861328, "global_step": 182840, "epoch": 1511} {"train_loss": -38.89473342895508, "global_step": 182841, "epoch": 1511} {"train_loss": -39.55913162231445, "global_step": 182842, "epoch": 1511} {"train_loss": -39.84560012817383, "global_step": 182843, "epoch": 1511} {"train_loss": -38.81442642211914, "global_step": 182844, "epoch": 1511} {"train_loss": -39.948665618896484, "global_step": 182845, "epoch": 1511} {"train_loss": -39.10158920288086, "global_step": 182846, "epoch": 1511} {"train_loss": -39.9200439453125, "global_step": 182847, "epoch": 1511} {"train_loss": -39.980743408203125, "global_step": 182848, "epoch": 1511} {"train_loss": -38.98512268066406, "global_step": 182849, "epoch": 1511} {"train_loss": -37.382606506347656, "global_step": 182850, "epoch": 1511} {"train_loss": -40.012691497802734, "global_step": 182851, "epoch": 1511} {"train_loss": -39.711055755615234, "global_step": 182852, "epoch": 1511} {"train_loss": -39.26454544067383, "global_step": 182853, "epoch": 1511} {"train_loss": -39.71110153198242, "global_step": 182854, "epoch": 1511} {"train_loss": -38.96302032470703, "global_step": 182855, "epoch": 1511} {"train_loss": -40.08781433105469, "global_step": 182856, "epoch": 1511} {"train_loss": -38.76907730102539, "global_step": 182857, "epoch": 1511} {"train_loss": -39.94218063354492, "global_step": 182858, "epoch": 1511} {"train_loss": -40.07009506225586, "global_step": 182859, "epoch": 1511} {"train_loss": -38.85844039916992, "global_step": 182860, "epoch": 1511} {"train_loss": -39.65073776245117, "global_step": 182861, "epoch": 1511} {"train_loss": -40.796600341796875, "global_step": 182862, "epoch": 1511} {"train_loss": -39.30753707885742, "global_step": 182863, "epoch": 1511} {"train_loss": -40.29449462890625, "global_step": 182864, "epoch": 1511} {"train_loss": -40.337955474853516, "global_step": 182865, "epoch": 1511} {"train_loss": -38.85529327392578, "global_step": 182866, "epoch": 1511} {"train_loss": -40.10041046142578, "global_step": 182867, "epoch": 1511} {"train_loss": -38.32802963256836, "global_step": 182868, "epoch": 1511} {"train_loss": -40.42108154296875, "global_step": 182869, "epoch": 1511} {"train_loss": -40.34504318237305, "global_step": 182870, "epoch": 1511} {"train_loss": -39.745826721191406, "global_step": 182871, "epoch": 1511} {"train_loss": -40.80485916137695, "global_step": 182872, "epoch": 1511} {"train_loss": -39.893043518066406, "global_step": 182873, "epoch": 1511} {"train_loss": -34.52179718017578, "global_step": 182874, "epoch": 1511} {"train_loss": -40.166500091552734, "global_step": 182875, "epoch": 1511} {"train_loss": -38.141212463378906, "global_step": 182876, "epoch": 1511} {"train_loss": -36.974403381347656, "global_step": 182877, "epoch": 1511} {"train_loss": -34.60331726074219, "global_step": 182878, "epoch": 1511} {"train_loss": -26.83406639099121, "global_step": 182879, "epoch": 1511} {"train_loss": -38.568843841552734, "global_step": 182880, "epoch": 1511} {"train_loss": -25.75214195251465, "global_step": 182881, "epoch": 1511} {"train_loss": -37.29084396362305, "global_step": 182882, "epoch": 1511} {"train_loss": -31.977109909057617, "global_step": 182883, "epoch": 1511} {"train_loss": -34.30425262451172, "global_step": 182884, "epoch": 1511} {"train_loss": -36.2065315246582, "global_step": 182885, "epoch": 1511} {"train_loss": -38.2911491394043, "global_step": 182886, "epoch": 1511} {"train_loss": -33.87788772583008, "global_step": 182887, "epoch": 1511} {"train_loss": -35.12416076660156, "global_step": 182888, "epoch": 1511} {"train_loss": -36.653663635253906, "global_step": 182889, "epoch": 1511} {"train_loss": -37.29353713989258, "global_step": 182890, "epoch": 1511} {"train_loss": -38.7509651184082, "global_step": 182891, "epoch": 1511} {"train_loss": -33.48063278198242, "global_step": 182892, "epoch": 1511} {"train_loss": -37.55217361450195, "global_step": 182893, "epoch": 1511} {"train_loss": -36.771514892578125, "global_step": 182894, "epoch": 1511} {"train_loss": -35.972900390625, "global_step": 182895, "epoch": 1511} {"train_loss": -36.20139694213867, "global_step": 182896, "epoch": 1511} {"train_loss": -38.78017807006836, "global_step": 182897, "epoch": 1511} {"train_loss": -36.31266403198242, "global_step": 182898, "epoch": 1511} {"train_loss": -36.86674880981445, "global_step": 182899, "epoch": 1511} {"train_loss": -37.29655075073242, "global_step": 182900, "epoch": 1511} {"train_loss": -37.5605583190918, "global_step": 182901, "epoch": 1511} {"train_loss": -38.29557418823242, "global_step": 182902, "epoch": 1511} {"train_loss": -38.281368255615234, "global_step": 182903, "epoch": 1511} {"train_loss": -38.96904373168945, "global_step": 182904, "epoch": 1511} {"train_loss": -38.93478012084961, "global_step": 182905, "epoch": 1511} {"train_loss": -37.9720344543457, "global_step": 182906, "epoch": 1511} {"train_loss": -35.361141204833984, "global_step": 182907, "epoch": 1511} {"train_loss": -36.560604095458984, "global_step": 182908, "epoch": 1511} {"train_loss": -38.93659210205078, "global_step": 182909, "epoch": 1511} {"train_loss": -39.013458251953125, "global_step": 182910, "epoch": 1511} {"train_loss": -38.80695343017578, "global_step": 182911, "epoch": 1511} {"train_loss": -39.276947021484375, "global_step": 182912, "epoch": 1511} {"train_loss": -37.40174102783203, "global_step": 182913, "epoch": 1511} {"train_loss": -37.96072769165039, "global_step": 182914, "epoch": 1511} {"train_loss": -38.79530715942383, "global_step": 182915, "epoch": 1511} {"train_loss": -35.897315979003906, "global_step": 182916, "epoch": 1511} {"train_loss": -38.007667541503906, "global_step": 182917, "epoch": 1511} {"train_loss": -36.57914352416992, "global_step": 182918, "epoch": 1511} {"train_loss": -37.84033203125, "global_step": 182919, "epoch": 1511} {"train_loss": -39.003936767578125, "global_step": 182920, "epoch": 1511} {"train_loss": -38.45988082885742, "global_step": 182921, "epoch": 1511} {"train_loss": -38.41311264038086, "global_step": 182922, "epoch": 1511} {"train_loss": -39.142738342285156, "global_step": 182923, "epoch": 1511} {"train_loss": -39.00758361816406, "global_step": 182924, "epoch": 1511} {"train_loss": -37.834102630615234, "global_step": 182925, "epoch": 1511} {"train_loss": -39.46107864379883, "global_step": 182926, "epoch": 1511} {"train_loss": -39.4296875, "global_step": 182927, "epoch": 1511} {"train_loss": -38.829349517822266, "global_step": 182928, "epoch": 1511} {"train_loss": -39.44466781616211, "global_step": 182929, "epoch": 1511} {"train_loss": -39.543033599853516, "global_step": 182930, "epoch": 1511} {"train_loss": -39.54307174682617, "global_step": 182931, "epoch": 1511} {"train_loss": -39.53181076049805, "global_step": 182932, "epoch": 1511} {"train_loss": -39.863460540771484, "global_step": 182933, "epoch": 1511} {"train_loss": -39.256038665771484, "global_step": 182934, "epoch": 1511} {"train_loss": -39.8179931640625, "global_step": 182935, "epoch": 1511} {"train_loss": -39.40080261230469, "global_step": 182936, "epoch": 1511} {"train_loss": -39.697628021240234, "global_step": 182937, "epoch": 1511} {"train_loss": -39.36042404174805, "global_step": 182938, "epoch": 1511} {"train_loss": -39.88761520385742, "global_step": 182939, "epoch": 1511} {"train_loss": -39.672943115234375, "global_step": 182940, "epoch": 1511} {"train_loss": -39.905372619628906, "global_step": 182941, "epoch": 1511} {"train_loss": -39.89034652709961, "global_step": 182942, "epoch": 1511} {"train_loss": -40.00339889526367, "global_step": 182943, "epoch": 1511} {"train_loss": -39.532081604003906, "global_step": 182944, "epoch": 1511} {"train_loss": -40.21100997924805, "global_step": 182945, "epoch": 1511} {"train_loss": -39.8746452331543, "global_step": 182946, "epoch": 1511} {"train_loss": -39.0887451171875, "global_step": 182947, "epoch": 1511} {"train_loss": -39.52244186401367, "global_step": 182948, "epoch": 1511} {"train_loss": -40.30540084838867, "global_step": 182949, "epoch": 1511} {"train_loss": -40.07471466064453, "global_step": 182950, "epoch": 1511} {"train_loss": -38.36659254909547, "global_step": 182951, "epoch": 1511, "val_loss": 2699579.75} {"train_loss": -40.25380325317383, "global_step": 182952, "epoch": 1512} {"train_loss": -38.85697555541992, "global_step": 182953, "epoch": 1512} {"train_loss": -39.53848648071289, "global_step": 182954, "epoch": 1512} {"train_loss": -40.421180725097656, "global_step": 182955, "epoch": 1512} {"train_loss": -39.63954162597656, "global_step": 182956, "epoch": 1512} {"train_loss": -40.81440353393555, "global_step": 182957, "epoch": 1512} {"train_loss": -39.701393127441406, "global_step": 182958, "epoch": 1512} {"train_loss": -40.623809814453125, "global_step": 182959, "epoch": 1512} {"train_loss": -40.14419174194336, "global_step": 182960, "epoch": 1512} {"train_loss": -40.3873405456543, "global_step": 182961, "epoch": 1512} {"train_loss": -40.585350036621094, "global_step": 182962, "epoch": 1512} {"train_loss": -40.3865966796875, "global_step": 182963, "epoch": 1512} {"train_loss": -40.48527145385742, "global_step": 182964, "epoch": 1512} {"train_loss": -39.468318939208984, "global_step": 182965, "epoch": 1512} {"train_loss": -39.707672119140625, "global_step": 182966, "epoch": 1512} {"train_loss": -39.85660934448242, "global_step": 182967, "epoch": 1512} {"train_loss": -40.09162521362305, "global_step": 182968, "epoch": 1512} {"train_loss": -39.499176025390625, "global_step": 182969, "epoch": 1512} {"train_loss": -40.64435958862305, "global_step": 182970, "epoch": 1512} {"train_loss": -40.22200393676758, "global_step": 182971, "epoch": 1512} {"train_loss": -39.22999572753906, "global_step": 182972, "epoch": 1512} {"train_loss": -40.23139572143555, "global_step": 182973, "epoch": 1512} {"train_loss": -40.37382888793945, "global_step": 182974, "epoch": 1512} {"train_loss": -39.44672393798828, "global_step": 182975, "epoch": 1512} {"train_loss": -40.42528533935547, "global_step": 182976, "epoch": 1512} {"train_loss": -39.95998764038086, "global_step": 182977, "epoch": 1512} {"train_loss": -40.5671501159668, "global_step": 182978, "epoch": 1512} {"train_loss": -40.336055755615234, "global_step": 182979, "epoch": 1512} {"train_loss": -40.045284271240234, "global_step": 182980, "epoch": 1512} {"train_loss": -40.630760192871094, "global_step": 182981, "epoch": 1512} {"train_loss": -40.804439544677734, "global_step": 182982, "epoch": 1512} {"train_loss": -39.98352813720703, "global_step": 182983, "epoch": 1512} {"train_loss": -40.3292236328125, "global_step": 182984, "epoch": 1512} {"train_loss": -40.087257385253906, "global_step": 182985, "epoch": 1512} {"train_loss": -39.46073913574219, "global_step": 182986, "epoch": 1512} {"train_loss": -39.96442413330078, "global_step": 182987, "epoch": 1512} {"train_loss": -40.51702880859375, "global_step": 182988, "epoch": 1512} {"train_loss": -38.575408935546875, "global_step": 182989, "epoch": 1512} {"train_loss": -40.685604095458984, "global_step": 182990, "epoch": 1512} {"train_loss": -40.221004486083984, "global_step": 182991, "epoch": 1512} {"train_loss": -40.66679000854492, "global_step": 182992, "epoch": 1512} {"train_loss": -39.80725860595703, "global_step": 182993, "epoch": 1512} {"train_loss": -39.2092399597168, "global_step": 182994, "epoch": 1512} {"train_loss": -39.546730041503906, "global_step": 182995, "epoch": 1512} {"train_loss": -41.12034225463867, "global_step": 182996, "epoch": 1512} {"train_loss": -40.66666793823242, "global_step": 182997, "epoch": 1512} {"train_loss": -40.38610076904297, "global_step": 182998, "epoch": 1512} {"train_loss": -41.089561462402344, "global_step": 182999, "epoch": 1512} {"train_loss": -39.90406036376953, "global_step": 183000, "epoch": 1512} {"train_loss": -40.65793991088867, "global_step": 183001, "epoch": 1512} {"train_loss": -39.87376022338867, "global_step": 183002, "epoch": 1512} {"train_loss": -40.4172248840332, "global_step": 183003, "epoch": 1512} {"train_loss": -40.14650344848633, "global_step": 183004, "epoch": 1512} {"train_loss": -39.87031173706055, "global_step": 183005, "epoch": 1512} {"train_loss": -39.3853874206543, "global_step": 183006, "epoch": 1512} {"train_loss": -40.60894012451172, "global_step": 183007, "epoch": 1512} {"train_loss": -39.87203598022461, "global_step": 183008, "epoch": 1512} {"train_loss": -39.17646026611328, "global_step": 183009, "epoch": 1512} {"train_loss": -40.061580657958984, "global_step": 183010, "epoch": 1512} {"train_loss": -37.77117919921875, "global_step": 183011, "epoch": 1512} {"train_loss": -39.27317428588867, "global_step": 183012, "epoch": 1512} {"train_loss": -40.791744232177734, "global_step": 183013, "epoch": 1512} {"train_loss": -40.75510787963867, "global_step": 183014, "epoch": 1512} {"train_loss": -40.89812088012695, "global_step": 183015, "epoch": 1512} {"train_loss": -40.49985122680664, "global_step": 183016, "epoch": 1512} {"train_loss": -38.66176223754883, "global_step": 183017, "epoch": 1512} {"train_loss": -40.70606231689453, "global_step": 183018, "epoch": 1512} {"train_loss": -40.99923324584961, "global_step": 183019, "epoch": 1512} {"train_loss": -39.4788932800293, "global_step": 183020, "epoch": 1512} {"train_loss": -40.68027877807617, "global_step": 183021, "epoch": 1512} {"train_loss": -40.59876251220703, "global_step": 183022, "epoch": 1512} {"train_loss": -40.04952621459961, "global_step": 183023, "epoch": 1512} {"train_loss": -39.494571685791016, "global_step": 183024, "epoch": 1512} {"train_loss": -40.625946044921875, "global_step": 183025, "epoch": 1512} {"train_loss": -40.35889434814453, "global_step": 183026, "epoch": 1512} {"train_loss": -40.263885498046875, "global_step": 183027, "epoch": 1512} {"train_loss": -40.38047409057617, "global_step": 183028, "epoch": 1512} {"train_loss": -40.61473846435547, "global_step": 183029, "epoch": 1512} {"train_loss": -40.91053771972656, "global_step": 183030, "epoch": 1512} {"train_loss": -41.145503997802734, "global_step": 183031, "epoch": 1512} {"train_loss": -40.99946594238281, "global_step": 183032, "epoch": 1512} {"train_loss": -40.90667724609375, "global_step": 183033, "epoch": 1512} {"train_loss": -40.75916290283203, "global_step": 183034, "epoch": 1512} {"train_loss": -39.77010726928711, "global_step": 183035, "epoch": 1512} {"train_loss": -40.75401306152344, "global_step": 183036, "epoch": 1512} {"train_loss": -40.784847259521484, "global_step": 183037, "epoch": 1512} {"train_loss": -39.09177780151367, "global_step": 183038, "epoch": 1512} {"train_loss": -39.57284164428711, "global_step": 183039, "epoch": 1512} {"train_loss": -40.01662063598633, "global_step": 183040, "epoch": 1512} {"train_loss": -40.34144973754883, "global_step": 183041, "epoch": 1512} {"train_loss": -40.94061279296875, "global_step": 183042, "epoch": 1512} {"train_loss": -39.01731491088867, "global_step": 183043, "epoch": 1512} {"train_loss": -40.175209045410156, "global_step": 183044, "epoch": 1512} {"train_loss": -38.84650421142578, "global_step": 183045, "epoch": 1512} {"train_loss": -35.295654296875, "global_step": 183046, "epoch": 1512} {"train_loss": -31.281137466430664, "global_step": 183047, "epoch": 1512} {"train_loss": -36.42069625854492, "global_step": 183048, "epoch": 1512} {"train_loss": -40.62579345703125, "global_step": 183049, "epoch": 1512} {"train_loss": -34.72442626953125, "global_step": 183050, "epoch": 1512} {"train_loss": -32.7531623840332, "global_step": 183051, "epoch": 1512} {"train_loss": -39.43788146972656, "global_step": 183052, "epoch": 1512} {"train_loss": -36.54853439331055, "global_step": 183053, "epoch": 1512} {"train_loss": -36.27205276489258, "global_step": 183054, "epoch": 1512} {"train_loss": -39.16416549682617, "global_step": 183055, "epoch": 1512} {"train_loss": -37.40206527709961, "global_step": 183056, "epoch": 1512} {"train_loss": -39.1924934387207, "global_step": 183057, "epoch": 1512} {"train_loss": -39.38923645019531, "global_step": 183058, "epoch": 1512} {"train_loss": -38.94263458251953, "global_step": 183059, "epoch": 1512} {"train_loss": -40.371246337890625, "global_step": 183060, "epoch": 1512} {"train_loss": -39.43878173828125, "global_step": 183061, "epoch": 1512} {"train_loss": -40.27808380126953, "global_step": 183062, "epoch": 1512} {"train_loss": -39.84712600708008, "global_step": 183063, "epoch": 1512} {"train_loss": -40.215694427490234, "global_step": 183064, "epoch": 1512} {"train_loss": -40.04630661010742, "global_step": 183065, "epoch": 1512} {"train_loss": -39.959041595458984, "global_step": 183066, "epoch": 1512} {"train_loss": -40.103633880615234, "global_step": 183067, "epoch": 1512} {"train_loss": -40.36161422729492, "global_step": 183068, "epoch": 1512} {"train_loss": -38.8978271484375, "global_step": 183069, "epoch": 1512} {"train_loss": -40.650516510009766, "global_step": 183070, "epoch": 1512} {"train_loss": -39.82918167114258, "global_step": 183071, "epoch": 1512} {"train_loss": -39.748721114860096, "global_step": 183072, "epoch": 1512, "val_loss": 2633179.0} {"train_loss": -40.45288848876953, "global_step": 183073, "epoch": 1513} {"train_loss": -40.80335998535156, "global_step": 183074, "epoch": 1513} {"train_loss": -39.8956184387207, "global_step": 183075, "epoch": 1513} {"train_loss": -40.53463363647461, "global_step": 183076, "epoch": 1513} {"train_loss": -40.329872131347656, "global_step": 183077, "epoch": 1513} {"train_loss": -41.225563049316406, "global_step": 183078, "epoch": 1513} {"train_loss": -40.950469970703125, "global_step": 183079, "epoch": 1513} {"train_loss": -41.255462646484375, "global_step": 183080, "epoch": 1513} {"train_loss": -40.987274169921875, "global_step": 183081, "epoch": 1513} {"train_loss": -41.004661560058594, "global_step": 183082, "epoch": 1513} {"train_loss": -41.36343002319336, "global_step": 183083, "epoch": 1513} {"train_loss": -41.18270492553711, "global_step": 183084, "epoch": 1513} {"train_loss": -40.68593215942383, "global_step": 183085, "epoch": 1513} {"train_loss": -40.937217712402344, "global_step": 183086, "epoch": 1513} {"train_loss": -41.18879318237305, "global_step": 183087, "epoch": 1513} {"train_loss": -41.32585525512695, "global_step": 183088, "epoch": 1513} {"train_loss": -37.836212158203125, "global_step": 183089, "epoch": 1513} {"train_loss": -41.2705078125, "global_step": 183090, "epoch": 1513} {"train_loss": -41.228118896484375, "global_step": 183091, "epoch": 1513} {"train_loss": -40.75836181640625, "global_step": 183092, "epoch": 1513} {"train_loss": -40.6016960144043, "global_step": 183093, "epoch": 1513} {"train_loss": -41.32959747314453, "global_step": 183094, "epoch": 1513} {"train_loss": -39.62178039550781, "global_step": 183095, "epoch": 1513} {"train_loss": -41.40035629272461, "global_step": 183096, "epoch": 1513} {"train_loss": -41.292362213134766, "global_step": 183097, "epoch": 1513} {"train_loss": -41.35471725463867, "global_step": 183098, "epoch": 1513} {"train_loss": -40.893890380859375, "global_step": 183099, "epoch": 1513} {"train_loss": -40.49831771850586, "global_step": 183100, "epoch": 1513} {"train_loss": -40.80047607421875, "global_step": 183101, "epoch": 1513} {"train_loss": -40.35979080200195, "global_step": 183102, "epoch": 1513} {"train_loss": -40.670040130615234, "global_step": 183103, "epoch": 1513} {"train_loss": -39.90910339355469, "global_step": 183104, "epoch": 1513} {"train_loss": -40.54426574707031, "global_step": 183105, "epoch": 1513} {"train_loss": -41.15904998779297, "global_step": 183106, "epoch": 1513} {"train_loss": -41.148460388183594, "global_step": 183107, "epoch": 1513} {"train_loss": -40.78227996826172, "global_step": 183108, "epoch": 1513} {"train_loss": -40.90427780151367, "global_step": 183109, "epoch": 1513} {"train_loss": -41.17094802856445, "global_step": 183110, "epoch": 1513} {"train_loss": -41.07414627075195, "global_step": 183111, "epoch": 1513} {"train_loss": -41.08016586303711, "global_step": 183112, "epoch": 1513} {"train_loss": -41.0968132019043, "global_step": 183113, "epoch": 1513} {"train_loss": -41.08985137939453, "global_step": 183114, "epoch": 1513} {"train_loss": -41.45582962036133, "global_step": 183115, "epoch": 1513} {"train_loss": -40.8487434387207, "global_step": 183116, "epoch": 1513} {"train_loss": -40.13547134399414, "global_step": 183117, "epoch": 1513} {"train_loss": -41.125885009765625, "global_step": 183118, "epoch": 1513} {"train_loss": -41.33162307739258, "global_step": 183119, "epoch": 1513} {"train_loss": -40.737030029296875, "global_step": 183120, "epoch": 1513} {"train_loss": -41.01707077026367, "global_step": 183121, "epoch": 1513} {"train_loss": -40.431976318359375, "global_step": 183122, "epoch": 1513} {"train_loss": -36.69936752319336, "global_step": 183123, "epoch": 1513} {"train_loss": -37.35551452636719, "global_step": 183124, "epoch": 1513} {"train_loss": -37.00991439819336, "global_step": 183125, "epoch": 1513} {"train_loss": -37.59853744506836, "global_step": 183126, "epoch": 1513} {"train_loss": -36.287593841552734, "global_step": 183127, "epoch": 1513} {"train_loss": -39.82273483276367, "global_step": 183128, "epoch": 1513} {"train_loss": -39.94327926635742, "global_step": 183129, "epoch": 1513} {"train_loss": -37.98850631713867, "global_step": 183130, "epoch": 1513} {"train_loss": -34.42924118041992, "global_step": 183131, "epoch": 1513} {"train_loss": -34.10840606689453, "global_step": 183132, "epoch": 1513} {"train_loss": -35.37662887573242, "global_step": 183133, "epoch": 1513} {"train_loss": -40.441017150878906, "global_step": 183134, "epoch": 1513} {"train_loss": -36.23628234863281, "global_step": 183135, "epoch": 1513} {"train_loss": -34.6995964050293, "global_step": 183136, "epoch": 1513} {"train_loss": -40.4383544921875, "global_step": 183137, "epoch": 1513} {"train_loss": -35.590450286865234, "global_step": 183138, "epoch": 1513} {"train_loss": -33.36918258666992, "global_step": 183139, "epoch": 1513} {"train_loss": -38.67621994018555, "global_step": 183140, "epoch": 1513} {"train_loss": -37.923423767089844, "global_step": 183141, "epoch": 1513} {"train_loss": -39.646854400634766, "global_step": 183142, "epoch": 1513} {"train_loss": -38.1756591796875, "global_step": 183143, "epoch": 1513} {"train_loss": -36.55971145629883, "global_step": 183144, "epoch": 1513} {"train_loss": -39.2441291809082, "global_step": 183145, "epoch": 1513} {"train_loss": -36.24570846557617, "global_step": 183146, "epoch": 1513} {"train_loss": -39.3172607421875, "global_step": 183147, "epoch": 1513} {"train_loss": -38.545501708984375, "global_step": 183148, "epoch": 1513} {"train_loss": -39.9580192565918, "global_step": 183149, "epoch": 1513} {"train_loss": -39.64152908325195, "global_step": 183150, "epoch": 1513} {"train_loss": -39.09877395629883, "global_step": 183151, "epoch": 1513} {"train_loss": -39.72353744506836, "global_step": 183152, "epoch": 1513} {"train_loss": -37.11371612548828, "global_step": 183153, "epoch": 1513} {"train_loss": -39.473052978515625, "global_step": 183154, "epoch": 1513} {"train_loss": -38.938899993896484, "global_step": 183155, "epoch": 1513} {"train_loss": -38.920936584472656, "global_step": 183156, "epoch": 1513} {"train_loss": -37.692176818847656, "global_step": 183157, "epoch": 1513} {"train_loss": -39.397430419921875, "global_step": 183158, "epoch": 1513} {"train_loss": -38.402008056640625, "global_step": 183159, "epoch": 1513} {"train_loss": -39.54056930541992, "global_step": 183160, "epoch": 1513} {"train_loss": -31.769500732421875, "global_step": 183161, "epoch": 1513} {"train_loss": -39.41776657104492, "global_step": 183162, "epoch": 1513} {"train_loss": -39.35056686401367, "global_step": 183163, "epoch": 1513} {"train_loss": -40.394813537597656, "global_step": 183164, "epoch": 1513} {"train_loss": -39.30004119873047, "global_step": 183165, "epoch": 1513} {"train_loss": -35.69837951660156, "global_step": 183166, "epoch": 1513} {"train_loss": -39.51778030395508, "global_step": 183167, "epoch": 1513} {"train_loss": -38.83382034301758, "global_step": 183168, "epoch": 1513} {"train_loss": -39.167236328125, "global_step": 183169, "epoch": 1513} {"train_loss": -39.29838943481445, "global_step": 183170, "epoch": 1513} {"train_loss": -40.04427719116211, "global_step": 183171, "epoch": 1513} {"train_loss": -40.15846633911133, "global_step": 183172, "epoch": 1513} {"train_loss": -39.92854309082031, "global_step": 183173, "epoch": 1513} {"train_loss": -39.22563171386719, "global_step": 183174, "epoch": 1513} {"train_loss": -39.05093002319336, "global_step": 183175, "epoch": 1513} {"train_loss": -37.454891204833984, "global_step": 183176, "epoch": 1513} {"train_loss": -39.11957931518555, "global_step": 183177, "epoch": 1513} {"train_loss": -37.65591812133789, "global_step": 183178, "epoch": 1513} {"train_loss": -36.3040885925293, "global_step": 183179, "epoch": 1513} {"train_loss": -38.97239303588867, "global_step": 183180, "epoch": 1513} {"train_loss": -39.98984909057617, "global_step": 183181, "epoch": 1513} {"train_loss": -39.041927337646484, "global_step": 183182, "epoch": 1513} {"train_loss": -38.92985534667969, "global_step": 183183, "epoch": 1513} {"train_loss": -39.8024787902832, "global_step": 183184, "epoch": 1513} {"train_loss": -39.576515197753906, "global_step": 183185, "epoch": 1513} {"train_loss": -39.28947067260742, "global_step": 183186, "epoch": 1513} {"train_loss": -39.8919563293457, "global_step": 183187, "epoch": 1513} {"train_loss": -37.695735931396484, "global_step": 183188, "epoch": 1513} {"train_loss": -40.28485870361328, "global_step": 183189, "epoch": 1513} {"train_loss": -40.46253967285156, "global_step": 183190, "epoch": 1513} {"train_loss": -40.17583465576172, "global_step": 183191, "epoch": 1513} {"train_loss": -40.17871856689453, "global_step": 183192, "epoch": 1513} {"train_loss": -39.397403811620286, "global_step": 183193, "epoch": 1513, "val_loss": 2832687.25} {"train_loss": -40.58985137939453, "global_step": 183194, "epoch": 1514} {"train_loss": -40.40693283081055, "global_step": 183195, "epoch": 1514} {"train_loss": -40.75407028198242, "global_step": 183196, "epoch": 1514} {"train_loss": -40.110225677490234, "global_step": 183197, "epoch": 1514} {"train_loss": -40.745521545410156, "global_step": 183198, "epoch": 1514} {"train_loss": -40.1909294128418, "global_step": 183199, "epoch": 1514} {"train_loss": -40.07451629638672, "global_step": 183200, "epoch": 1514} {"train_loss": -40.912994384765625, "global_step": 183201, "epoch": 1514} {"train_loss": -40.49517059326172, "global_step": 183202, "epoch": 1514} {"train_loss": -40.563133239746094, "global_step": 183203, "epoch": 1514} {"train_loss": -41.04879379272461, "global_step": 183204, "epoch": 1514} {"train_loss": -40.892513275146484, "global_step": 183205, "epoch": 1514} {"train_loss": -41.16337203979492, "global_step": 183206, "epoch": 1514} {"train_loss": -40.70283889770508, "global_step": 183207, "epoch": 1514} {"train_loss": -40.99095916748047, "global_step": 183208, "epoch": 1514} {"train_loss": -40.483768463134766, "global_step": 183209, "epoch": 1514} {"train_loss": -40.86669921875, "global_step": 183210, "epoch": 1514} {"train_loss": -41.07290267944336, "global_step": 183211, "epoch": 1514} {"train_loss": -40.613983154296875, "global_step": 183212, "epoch": 1514} {"train_loss": -40.286190032958984, "global_step": 183213, "epoch": 1514} {"train_loss": -39.91920852661133, "global_step": 183214, "epoch": 1514} {"train_loss": -39.88138198852539, "global_step": 183215, "epoch": 1514} {"train_loss": -41.184627532958984, "global_step": 183216, "epoch": 1514} {"train_loss": -40.72587966918945, "global_step": 183217, "epoch": 1514} {"train_loss": -41.074798583984375, "global_step": 183218, "epoch": 1514} {"train_loss": -40.96979904174805, "global_step": 183219, "epoch": 1514} {"train_loss": -40.964202880859375, "global_step": 183220, "epoch": 1514} {"train_loss": -41.21488952636719, "global_step": 183221, "epoch": 1514} {"train_loss": -39.663692474365234, "global_step": 183222, "epoch": 1514} {"train_loss": -41.2198600769043, "global_step": 183223, "epoch": 1514} {"train_loss": -39.00777053833008, "global_step": 183224, "epoch": 1514} {"train_loss": -39.87216567993164, "global_step": 183225, "epoch": 1514} {"train_loss": -41.23472595214844, "global_step": 183226, "epoch": 1514} {"train_loss": -41.32700729370117, "global_step": 183227, "epoch": 1514} {"train_loss": -41.38322830200195, "global_step": 183228, "epoch": 1514} {"train_loss": -36.102291107177734, "global_step": 183229, "epoch": 1514} {"train_loss": -40.0886344909668, "global_step": 183230, "epoch": 1514} {"train_loss": -39.30721664428711, "global_step": 183231, "epoch": 1514} {"train_loss": -39.905853271484375, "global_step": 183232, "epoch": 1514} {"train_loss": -41.25453186035156, "global_step": 183233, "epoch": 1514} {"train_loss": -41.006282806396484, "global_step": 183234, "epoch": 1514} {"train_loss": -40.18524932861328, "global_step": 183235, "epoch": 1514} {"train_loss": -41.297088623046875, "global_step": 183236, "epoch": 1514} {"train_loss": -40.39633560180664, "global_step": 183237, "epoch": 1514} {"train_loss": -41.50948715209961, "global_step": 183238, "epoch": 1514} {"train_loss": -38.277530670166016, "global_step": 183239, "epoch": 1514} {"train_loss": -39.890655517578125, "global_step": 183240, "epoch": 1514} {"train_loss": -40.821876525878906, "global_step": 183241, "epoch": 1514} {"train_loss": -41.242069244384766, "global_step": 183242, "epoch": 1514} {"train_loss": -40.91222381591797, "global_step": 183243, "epoch": 1514} {"train_loss": -41.476863861083984, "global_step": 183244, "epoch": 1514} {"train_loss": -40.36064529418945, "global_step": 183245, "epoch": 1514} {"train_loss": -41.16816329956055, "global_step": 183246, "epoch": 1514} {"train_loss": -41.26142120361328, "global_step": 183247, "epoch": 1514} {"train_loss": -41.52803421020508, "global_step": 183248, "epoch": 1514} {"train_loss": -41.25431442260742, "global_step": 183249, "epoch": 1514} {"train_loss": -41.44115447998047, "global_step": 183250, "epoch": 1514} {"train_loss": -41.262176513671875, "global_step": 183251, "epoch": 1514} {"train_loss": -40.1024055480957, "global_step": 183252, "epoch": 1514} {"train_loss": -41.37631607055664, "global_step": 183253, "epoch": 1514} {"train_loss": -41.15297317504883, "global_step": 183254, "epoch": 1514} {"train_loss": -41.13730239868164, "global_step": 183255, "epoch": 1514} {"train_loss": -41.62153244018555, "global_step": 183256, "epoch": 1514} {"train_loss": -38.63241195678711, "global_step": 183257, "epoch": 1514} {"train_loss": -39.827144622802734, "global_step": 183258, "epoch": 1514} {"train_loss": -40.56882858276367, "global_step": 183259, "epoch": 1514} {"train_loss": -39.7895622253418, "global_step": 183260, "epoch": 1514} {"train_loss": -41.0830078125, "global_step": 183261, "epoch": 1514} {"train_loss": -41.796566009521484, "global_step": 183262, "epoch": 1514} {"train_loss": -40.034461975097656, "global_step": 183263, "epoch": 1514} {"train_loss": -40.578365325927734, "global_step": 183264, "epoch": 1514} {"train_loss": -41.3918342590332, "global_step": 183265, "epoch": 1514} {"train_loss": -41.14907455444336, "global_step": 183266, "epoch": 1514} {"train_loss": -40.66975021362305, "global_step": 183267, "epoch": 1514} {"train_loss": -40.28493118286133, "global_step": 183268, "epoch": 1514} {"train_loss": -40.698707580566406, "global_step": 183269, "epoch": 1514} {"train_loss": -39.45498275756836, "global_step": 183270, "epoch": 1514} {"train_loss": -40.60599899291992, "global_step": 183271, "epoch": 1514} {"train_loss": -40.933502197265625, "global_step": 183272, "epoch": 1514} {"train_loss": -39.926605224609375, "global_step": 183273, "epoch": 1514} {"train_loss": -38.24455642700195, "global_step": 183274, "epoch": 1514} {"train_loss": -41.527122497558594, "global_step": 183275, "epoch": 1514} {"train_loss": -41.097572326660156, "global_step": 183276, "epoch": 1514} {"train_loss": -40.198577880859375, "global_step": 183277, "epoch": 1514} {"train_loss": -39.47844696044922, "global_step": 183278, "epoch": 1514} {"train_loss": -40.794986724853516, "global_step": 183279, "epoch": 1514} {"train_loss": -39.60676956176758, "global_step": 183280, "epoch": 1514} {"train_loss": -40.54777145385742, "global_step": 183281, "epoch": 1514} {"train_loss": -39.94108200073242, "global_step": 183282, "epoch": 1514} {"train_loss": -38.3792724609375, "global_step": 183283, "epoch": 1514} {"train_loss": -38.306068420410156, "global_step": 183284, "epoch": 1514} {"train_loss": -41.67059326171875, "global_step": 183285, "epoch": 1514} {"train_loss": -40.29985809326172, "global_step": 183286, "epoch": 1514} {"train_loss": -40.20756530761719, "global_step": 183287, "epoch": 1514} {"train_loss": -38.56516647338867, "global_step": 183288, "epoch": 1514} {"train_loss": -39.59803009033203, "global_step": 183289, "epoch": 1514} {"train_loss": -40.1853141784668, "global_step": 183290, "epoch": 1514} {"train_loss": -40.7304573059082, "global_step": 183291, "epoch": 1514} {"train_loss": -39.839656829833984, "global_step": 183292, "epoch": 1514} {"train_loss": -37.951759338378906, "global_step": 183293, "epoch": 1514} {"train_loss": -39.792701721191406, "global_step": 183294, "epoch": 1514} {"train_loss": -40.267608642578125, "global_step": 183295, "epoch": 1514} {"train_loss": -39.17562484741211, "global_step": 183296, "epoch": 1514} {"train_loss": -41.34016036987305, "global_step": 183297, "epoch": 1514} {"train_loss": -39.44179153442383, "global_step": 183298, "epoch": 1514} {"train_loss": -34.14533615112305, "global_step": 183299, "epoch": 1514} {"train_loss": -40.35920333862305, "global_step": 183300, "epoch": 1514} {"train_loss": -39.737060546875, "global_step": 183301, "epoch": 1514} {"train_loss": -40.67184066772461, "global_step": 183302, "epoch": 1514} {"train_loss": -39.8036003112793, "global_step": 183303, "epoch": 1514} {"train_loss": -40.503536224365234, "global_step": 183304, "epoch": 1514} {"train_loss": -37.9592170715332, "global_step": 183305, "epoch": 1514} {"train_loss": -37.421112060546875, "global_step": 183306, "epoch": 1514} {"train_loss": -33.57782745361328, "global_step": 183307, "epoch": 1514} {"train_loss": -36.419227600097656, "global_step": 183308, "epoch": 1514} {"train_loss": -40.5875129699707, "global_step": 183309, "epoch": 1514} {"train_loss": -39.55338668823242, "global_step": 183310, "epoch": 1514} {"train_loss": -38.53820037841797, "global_step": 183311, "epoch": 1514} {"train_loss": -39.333580017089844, "global_step": 183312, "epoch": 1514} {"train_loss": -36.89326858520508, "global_step": 183313, "epoch": 1514} {"train_loss": -40.13981010500065, "global_step": 183314, "epoch": 1514, "val_loss": 3209919.0} {"train_loss": -37.55658721923828, "global_step": 183315, "epoch": 1515} {"train_loss": -32.086761474609375, "global_step": 183316, "epoch": 1515} {"train_loss": -39.05592727661133, "global_step": 183317, "epoch": 1515} {"train_loss": -39.709964752197266, "global_step": 183318, "epoch": 1515} {"train_loss": -35.5592155456543, "global_step": 183319, "epoch": 1515} {"train_loss": -38.23421096801758, "global_step": 183320, "epoch": 1515} {"train_loss": -37.43709182739258, "global_step": 183321, "epoch": 1515} {"train_loss": -39.325523376464844, "global_step": 183322, "epoch": 1515} {"train_loss": -37.144439697265625, "global_step": 183323, "epoch": 1515} {"train_loss": -28.311655044555664, "global_step": 183324, "epoch": 1515} {"train_loss": -35.44136428833008, "global_step": 183325, "epoch": 1515} {"train_loss": -37.47576904296875, "global_step": 183326, "epoch": 1515} {"train_loss": -38.541316986083984, "global_step": 183327, "epoch": 1515} {"train_loss": -38.80525588989258, "global_step": 183328, "epoch": 1515} {"train_loss": -36.47370529174805, "global_step": 183329, "epoch": 1515} {"train_loss": -34.21736526489258, "global_step": 183330, "epoch": 1515} {"train_loss": -36.60285568237305, "global_step": 183331, "epoch": 1515} {"train_loss": -36.04385757446289, "global_step": 183332, "epoch": 1515} {"train_loss": -37.0214958190918, "global_step": 183333, "epoch": 1515} {"train_loss": -36.824615478515625, "global_step": 183334, "epoch": 1515} {"train_loss": -36.53919219970703, "global_step": 183335, "epoch": 1515} {"train_loss": -36.882568359375, "global_step": 183336, "epoch": 1515} {"train_loss": -36.81935119628906, "global_step": 183337, "epoch": 1515} {"train_loss": -37.46722412109375, "global_step": 183338, "epoch": 1515} {"train_loss": -35.500999450683594, "global_step": 183339, "epoch": 1515} {"train_loss": -36.940940856933594, "global_step": 183340, "epoch": 1515} {"train_loss": -38.004608154296875, "global_step": 183341, "epoch": 1515} {"train_loss": -37.37107467651367, "global_step": 183342, "epoch": 1515} {"train_loss": -36.854915618896484, "global_step": 183343, "epoch": 1515} {"train_loss": -38.969093322753906, "global_step": 183344, "epoch": 1515} {"train_loss": -37.59328079223633, "global_step": 183345, "epoch": 1515} {"train_loss": -38.704402923583984, "global_step": 183346, "epoch": 1515} {"train_loss": -38.1955680847168, "global_step": 183347, "epoch": 1515} {"train_loss": -37.96711349487305, "global_step": 183348, "epoch": 1515} {"train_loss": -39.45639419555664, "global_step": 183349, "epoch": 1515} {"train_loss": -38.50593185424805, "global_step": 183350, "epoch": 1515} {"train_loss": -38.8756217956543, "global_step": 183351, "epoch": 1515} {"train_loss": -38.782936096191406, "global_step": 183352, "epoch": 1515} {"train_loss": -38.03483200073242, "global_step": 183353, "epoch": 1515} {"train_loss": -37.81306838989258, "global_step": 183354, "epoch": 1515} {"train_loss": -38.86767578125, "global_step": 183355, "epoch": 1515} {"train_loss": -39.23590087890625, "global_step": 183356, "epoch": 1515} {"train_loss": -39.22024154663086, "global_step": 183357, "epoch": 1515} {"train_loss": -39.5130500793457, "global_step": 183358, "epoch": 1515} {"train_loss": -39.67242431640625, "global_step": 183359, "epoch": 1515} {"train_loss": -39.792354583740234, "global_step": 183360, "epoch": 1515} {"train_loss": -39.268402099609375, "global_step": 183361, "epoch": 1515} {"train_loss": -39.94110107421875, "global_step": 183362, "epoch": 1515} {"train_loss": -39.158870697021484, "global_step": 183363, "epoch": 1515} {"train_loss": -40.171016693115234, "global_step": 183364, "epoch": 1515} {"train_loss": -39.171417236328125, "global_step": 183365, "epoch": 1515} {"train_loss": -39.946937561035156, "global_step": 183366, "epoch": 1515} {"train_loss": -39.59424591064453, "global_step": 183367, "epoch": 1515} {"train_loss": -39.95906066894531, "global_step": 183368, "epoch": 1515} {"train_loss": -39.62541198730469, "global_step": 183369, "epoch": 1515} {"train_loss": -40.482757568359375, "global_step": 183370, "epoch": 1515} {"train_loss": -40.051544189453125, "global_step": 183371, "epoch": 1515} {"train_loss": -40.09202194213867, "global_step": 183372, "epoch": 1515} {"train_loss": -39.7703857421875, "global_step": 183373, "epoch": 1515} {"train_loss": -39.91217041015625, "global_step": 183374, "epoch": 1515} {"train_loss": -39.78278732299805, "global_step": 183375, "epoch": 1515} {"train_loss": -40.728912353515625, "global_step": 183376, "epoch": 1515} {"train_loss": -40.20629119873047, "global_step": 183377, "epoch": 1515} {"train_loss": -40.239376068115234, "global_step": 183378, "epoch": 1515} {"train_loss": -39.72273635864258, "global_step": 183379, "epoch": 1515} {"train_loss": -39.92129135131836, "global_step": 183380, "epoch": 1515} {"train_loss": -40.80137634277344, "global_step": 183381, "epoch": 1515} {"train_loss": -41.04898452758789, "global_step": 183382, "epoch": 1515} {"train_loss": -40.62467575073242, "global_step": 183383, "epoch": 1515} {"train_loss": -40.39076614379883, "global_step": 183384, "epoch": 1515} {"train_loss": -40.139949798583984, "global_step": 183385, "epoch": 1515} {"train_loss": -40.81393051147461, "global_step": 183386, "epoch": 1515} {"train_loss": -40.63787841796875, "global_step": 183387, "epoch": 1515} {"train_loss": -40.94931411743164, "global_step": 183388, "epoch": 1515} {"train_loss": -40.08432388305664, "global_step": 183389, "epoch": 1515} {"train_loss": -40.52836227416992, "global_step": 183390, "epoch": 1515} {"train_loss": -41.037288665771484, "global_step": 183391, "epoch": 1515} {"train_loss": -41.21563720703125, "global_step": 183392, "epoch": 1515} {"train_loss": -41.10078048706055, "global_step": 183393, "epoch": 1515} {"train_loss": -40.938934326171875, "global_step": 183394, "epoch": 1515} {"train_loss": -41.11145782470703, "global_step": 183395, "epoch": 1515} {"train_loss": -41.06533432006836, "global_step": 183396, "epoch": 1515} {"train_loss": -40.423824310302734, "global_step": 183397, "epoch": 1515} {"train_loss": -41.27043914794922, "global_step": 183398, "epoch": 1515} {"train_loss": -41.215850830078125, "global_step": 183399, "epoch": 1515} {"train_loss": -40.89751434326172, "global_step": 183400, "epoch": 1515} {"train_loss": -41.26913070678711, "global_step": 183401, "epoch": 1515} {"train_loss": -40.79685974121094, "global_step": 183402, "epoch": 1515} {"train_loss": -41.05781555175781, "global_step": 183403, "epoch": 1515} {"train_loss": -40.645408630371094, "global_step": 183404, "epoch": 1515} {"train_loss": -41.5894660949707, "global_step": 183405, "epoch": 1515} {"train_loss": -41.5908088684082, "global_step": 183406, "epoch": 1515} {"train_loss": -41.172027587890625, "global_step": 183407, "epoch": 1515} {"train_loss": -40.614349365234375, "global_step": 183408, "epoch": 1515} {"train_loss": -40.8027229309082, "global_step": 183409, "epoch": 1515} {"train_loss": -39.30156707763672, "global_step": 183410, "epoch": 1515} {"train_loss": -40.88869857788086, "global_step": 183411, "epoch": 1515} {"train_loss": -40.581268310546875, "global_step": 183412, "epoch": 1515} {"train_loss": -41.244537353515625, "global_step": 183413, "epoch": 1515} {"train_loss": -41.319793701171875, "global_step": 183414, "epoch": 1515} {"train_loss": -41.791744232177734, "global_step": 183415, "epoch": 1515} {"train_loss": -40.134361267089844, "global_step": 183416, "epoch": 1515} {"train_loss": -40.28882598876953, "global_step": 183417, "epoch": 1515} {"train_loss": -41.40031814575195, "global_step": 183418, "epoch": 1515} {"train_loss": -41.21812057495117, "global_step": 183419, "epoch": 1515} {"train_loss": -41.72359085083008, "global_step": 183420, "epoch": 1515} {"train_loss": -40.59795379638672, "global_step": 183421, "epoch": 1515} {"train_loss": -41.78078842163086, "global_step": 183422, "epoch": 1515} {"train_loss": -41.220821380615234, "global_step": 183423, "epoch": 1515} {"train_loss": -41.62936019897461, "global_step": 183424, "epoch": 1515} {"train_loss": -41.13409423828125, "global_step": 183425, "epoch": 1515} {"train_loss": -40.86464309692383, "global_step": 183426, "epoch": 1515} {"train_loss": -40.7910041809082, "global_step": 183427, "epoch": 1515} {"train_loss": -41.364498138427734, "global_step": 183428, "epoch": 1515} {"train_loss": -41.715999603271484, "global_step": 183429, "epoch": 1515} {"train_loss": -42.01555252075195, "global_step": 183430, "epoch": 1515} {"train_loss": -41.94527053833008, "global_step": 183431, "epoch": 1515} {"train_loss": -41.177242279052734, "global_step": 183432, "epoch": 1515} {"train_loss": -40.65494918823242, "global_step": 183433, "epoch": 1515} {"train_loss": -40.9865608215332, "global_step": 183434, "epoch": 1515} {"train_loss": -39.470695290683715, "global_step": 183435, "epoch": 1515, "val_loss": 2843935.25} {"train_loss": -41.258392333984375, "global_step": 183436, "epoch": 1516} {"train_loss": -40.829715728759766, "global_step": 183437, "epoch": 1516} {"train_loss": -40.979736328125, "global_step": 183438, "epoch": 1516} {"train_loss": -40.806434631347656, "global_step": 183439, "epoch": 1516} {"train_loss": -36.39791488647461, "global_step": 183440, "epoch": 1516} {"train_loss": -34.3811149597168, "global_step": 183441, "epoch": 1516} {"train_loss": -32.43647003173828, "global_step": 183442, "epoch": 1516} {"train_loss": -35.744659423828125, "global_step": 183443, "epoch": 1516} {"train_loss": -39.59555435180664, "global_step": 183444, "epoch": 1516} {"train_loss": -37.84931945800781, "global_step": 183445, "epoch": 1516} {"train_loss": -39.785335540771484, "global_step": 183446, "epoch": 1516} {"train_loss": -40.362545013427734, "global_step": 183447, "epoch": 1516} {"train_loss": -39.993080139160156, "global_step": 183448, "epoch": 1516} {"train_loss": -39.17476272583008, "global_step": 183449, "epoch": 1516} {"train_loss": -39.764766693115234, "global_step": 183450, "epoch": 1516} {"train_loss": -40.63335037231445, "global_step": 183451, "epoch": 1516} {"train_loss": -41.1327018737793, "global_step": 183452, "epoch": 1516} {"train_loss": -41.16591262817383, "global_step": 183453, "epoch": 1516} {"train_loss": -40.320674896240234, "global_step": 183454, "epoch": 1516} {"train_loss": -40.31328201293945, "global_step": 183455, "epoch": 1516} {"train_loss": -40.87443161010742, "global_step": 183456, "epoch": 1516} {"train_loss": -39.754364013671875, "global_step": 183457, "epoch": 1516} {"train_loss": -40.4732780456543, "global_step": 183458, "epoch": 1516} {"train_loss": -40.31059646606445, "global_step": 183459, "epoch": 1516} {"train_loss": -40.227909088134766, "global_step": 183460, "epoch": 1516} {"train_loss": -40.963680267333984, "global_step": 183461, "epoch": 1516} {"train_loss": -40.580352783203125, "global_step": 183462, "epoch": 1516} {"train_loss": -40.4507942199707, "global_step": 183463, "epoch": 1516} {"train_loss": -40.24951934814453, "global_step": 183464, "epoch": 1516} {"train_loss": -40.684661865234375, "global_step": 183465, "epoch": 1516} {"train_loss": -40.718082427978516, "global_step": 183466, "epoch": 1516} {"train_loss": -41.4848747253418, "global_step": 183467, "epoch": 1516} {"train_loss": -40.81941604614258, "global_step": 183468, "epoch": 1516} {"train_loss": -40.465492248535156, "global_step": 183469, "epoch": 1516} {"train_loss": -41.382686614990234, "global_step": 183470, "epoch": 1516} {"train_loss": -41.429901123046875, "global_step": 183471, "epoch": 1516} {"train_loss": -41.22867965698242, "global_step": 183472, "epoch": 1516} {"train_loss": -40.98027420043945, "global_step": 183473, "epoch": 1516} {"train_loss": -41.66340255737305, "global_step": 183474, "epoch": 1516} {"train_loss": -41.32982635498047, "global_step": 183475, "epoch": 1516} {"train_loss": -41.555938720703125, "global_step": 183476, "epoch": 1516} {"train_loss": -41.16333770751953, "global_step": 183477, "epoch": 1516} {"train_loss": -41.2000846862793, "global_step": 183478, "epoch": 1516} {"train_loss": -41.70136260986328, "global_step": 183479, "epoch": 1516} {"train_loss": -41.48797607421875, "global_step": 183480, "epoch": 1516} {"train_loss": -40.65868377685547, "global_step": 183481, "epoch": 1516} {"train_loss": -40.62223434448242, "global_step": 183482, "epoch": 1516} {"train_loss": -40.80620193481445, "global_step": 183483, "epoch": 1516} {"train_loss": -41.44386672973633, "global_step": 183484, "epoch": 1516} {"train_loss": -41.30754470825195, "global_step": 183485, "epoch": 1516} {"train_loss": -41.133323669433594, "global_step": 183486, "epoch": 1516} {"train_loss": -40.72141647338867, "global_step": 183487, "epoch": 1516} {"train_loss": -41.75593185424805, "global_step": 183488, "epoch": 1516} {"train_loss": -41.31364059448242, "global_step": 183489, "epoch": 1516} {"train_loss": -40.62821578979492, "global_step": 183490, "epoch": 1516} {"train_loss": -41.125911712646484, "global_step": 183491, "epoch": 1516} {"train_loss": -41.55855941772461, "global_step": 183492, "epoch": 1516} {"train_loss": -41.20062255859375, "global_step": 183493, "epoch": 1516} {"train_loss": -40.43650817871094, "global_step": 183494, "epoch": 1516} {"train_loss": -40.63094711303711, "global_step": 183495, "epoch": 1516} {"train_loss": -41.86875534057617, "global_step": 183496, "epoch": 1516} {"train_loss": -40.4530029296875, "global_step": 183497, "epoch": 1516} {"train_loss": -41.34574508666992, "global_step": 183498, "epoch": 1516} {"train_loss": -41.92380905151367, "global_step": 183499, "epoch": 1516} {"train_loss": -41.12411117553711, "global_step": 183500, "epoch": 1516} {"train_loss": -41.15141677856445, "global_step": 183501, "epoch": 1516} {"train_loss": -40.99283981323242, "global_step": 183502, "epoch": 1516} {"train_loss": -40.07087326049805, "global_step": 183503, "epoch": 1516} {"train_loss": -41.40928649902344, "global_step": 183504, "epoch": 1516} {"train_loss": -40.046817779541016, "global_step": 183505, "epoch": 1516} {"train_loss": -40.82472229003906, "global_step": 183506, "epoch": 1516} {"train_loss": -41.54520797729492, "global_step": 183507, "epoch": 1516} {"train_loss": -41.487178802490234, "global_step": 183508, "epoch": 1516} {"train_loss": -41.63845443725586, "global_step": 183509, "epoch": 1516} {"train_loss": -41.444515228271484, "global_step": 183510, "epoch": 1516} {"train_loss": -40.817970275878906, "global_step": 183511, "epoch": 1516} {"train_loss": -40.50175857543945, "global_step": 183512, "epoch": 1516} {"train_loss": -39.65363311767578, "global_step": 183513, "epoch": 1516} {"train_loss": -39.27643966674805, "global_step": 183514, "epoch": 1516} {"train_loss": -38.781341552734375, "global_step": 183515, "epoch": 1516} {"train_loss": -38.19096755981445, "global_step": 183516, "epoch": 1516} {"train_loss": -40.018157958984375, "global_step": 183517, "epoch": 1516} {"train_loss": -41.28976058959961, "global_step": 183518, "epoch": 1516} {"train_loss": -40.90824508666992, "global_step": 183519, "epoch": 1516} {"train_loss": -39.781307220458984, "global_step": 183520, "epoch": 1516} {"train_loss": -39.494544982910156, "global_step": 183521, "epoch": 1516} {"train_loss": -41.1928825378418, "global_step": 183522, "epoch": 1516} {"train_loss": -40.2807502746582, "global_step": 183523, "epoch": 1516} {"train_loss": -39.67915344238281, "global_step": 183524, "epoch": 1516} {"train_loss": -40.64144515991211, "global_step": 183525, "epoch": 1516} {"train_loss": -40.18027114868164, "global_step": 183526, "epoch": 1516} {"train_loss": -39.94717025756836, "global_step": 183527, "epoch": 1516} {"train_loss": -40.963680267333984, "global_step": 183528, "epoch": 1516} {"train_loss": -41.343196868896484, "global_step": 183529, "epoch": 1516} {"train_loss": -39.45835494995117, "global_step": 183530, "epoch": 1516} {"train_loss": -39.47804641723633, "global_step": 183531, "epoch": 1516} {"train_loss": -40.57967758178711, "global_step": 183532, "epoch": 1516} {"train_loss": -39.5240478515625, "global_step": 183533, "epoch": 1516} {"train_loss": -39.09316635131836, "global_step": 183534, "epoch": 1516} {"train_loss": -39.296016693115234, "global_step": 183535, "epoch": 1516} {"train_loss": -39.944400787353516, "global_step": 183536, "epoch": 1516} {"train_loss": -40.077510833740234, "global_step": 183537, "epoch": 1516} {"train_loss": -40.24441146850586, "global_step": 183538, "epoch": 1516} {"train_loss": -40.25682830810547, "global_step": 183539, "epoch": 1516} {"train_loss": -40.78856658935547, "global_step": 183540, "epoch": 1516} {"train_loss": -38.12811279296875, "global_step": 183541, "epoch": 1516} {"train_loss": -40.82780075073242, "global_step": 183542, "epoch": 1516} {"train_loss": -41.42219924926758, "global_step": 183543, "epoch": 1516} {"train_loss": -40.98550033569336, "global_step": 183544, "epoch": 1516} {"train_loss": -39.936649322509766, "global_step": 183545, "epoch": 1516} {"train_loss": -40.439178466796875, "global_step": 183546, "epoch": 1516} {"train_loss": -40.36260986328125, "global_step": 183547, "epoch": 1516} {"train_loss": -41.01905059814453, "global_step": 183548, "epoch": 1516} {"train_loss": -41.319087982177734, "global_step": 183549, "epoch": 1516} {"train_loss": -40.83675003051758, "global_step": 183550, "epoch": 1516} {"train_loss": -40.574066162109375, "global_step": 183551, "epoch": 1516} {"train_loss": -41.33921432495117, "global_step": 183552, "epoch": 1516} {"train_loss": -40.83781814575195, "global_step": 183553, "epoch": 1516} {"train_loss": -41.828216552734375, "global_step": 183554, "epoch": 1516} {"train_loss": -40.796810150146484, "global_step": 183555, "epoch": 1516} {"train_loss": -40.43081497949017, "global_step": 183556, "epoch": 1516, "val_loss": 2764010.0} {"train_loss": -41.08561325073242, "global_step": 183557, "epoch": 1517} {"train_loss": -40.236846923828125, "global_step": 183558, "epoch": 1517} {"train_loss": -41.50660705566406, "global_step": 183559, "epoch": 1517} {"train_loss": -40.53889083862305, "global_step": 183560, "epoch": 1517} {"train_loss": -40.701507568359375, "global_step": 183561, "epoch": 1517} {"train_loss": -40.57501220703125, "global_step": 183562, "epoch": 1517} {"train_loss": -40.5601692199707, "global_step": 183563, "epoch": 1517} {"train_loss": -40.066463470458984, "global_step": 183564, "epoch": 1517} {"train_loss": -39.661468505859375, "global_step": 183565, "epoch": 1517} {"train_loss": -40.01646423339844, "global_step": 183566, "epoch": 1517} {"train_loss": -41.45766067504883, "global_step": 183567, "epoch": 1517} {"train_loss": -40.11604690551758, "global_step": 183568, "epoch": 1517} {"train_loss": -39.57783126831055, "global_step": 183569, "epoch": 1517} {"train_loss": -39.62348556518555, "global_step": 183570, "epoch": 1517} {"train_loss": -40.60165023803711, "global_step": 183571, "epoch": 1517} {"train_loss": -37.20344924926758, "global_step": 183572, "epoch": 1517} {"train_loss": -36.85797119140625, "global_step": 183573, "epoch": 1517} {"train_loss": -34.69729232788086, "global_step": 183574, "epoch": 1517} {"train_loss": -38.93862533569336, "global_step": 183575, "epoch": 1517} {"train_loss": -39.63711166381836, "global_step": 183576, "epoch": 1517} {"train_loss": -38.418758392333984, "global_step": 183577, "epoch": 1517} {"train_loss": -38.18712615966797, "global_step": 183578, "epoch": 1517} {"train_loss": -40.4617919921875, "global_step": 183579, "epoch": 1517} {"train_loss": -36.521602630615234, "global_step": 183580, "epoch": 1517} {"train_loss": -39.148643493652344, "global_step": 183581, "epoch": 1517} {"train_loss": -40.07451248168945, "global_step": 183582, "epoch": 1517} {"train_loss": -40.143009185791016, "global_step": 183583, "epoch": 1517} {"train_loss": -40.31038284301758, "global_step": 183584, "epoch": 1517} {"train_loss": -40.747352600097656, "global_step": 183585, "epoch": 1517} {"train_loss": -38.73488235473633, "global_step": 183586, "epoch": 1517} {"train_loss": -39.95930099487305, "global_step": 183587, "epoch": 1517} {"train_loss": -39.390289306640625, "global_step": 183588, "epoch": 1517} {"train_loss": -39.9871711730957, "global_step": 183589, "epoch": 1517} {"train_loss": -38.13184356689453, "global_step": 183590, "epoch": 1517} {"train_loss": -39.701507568359375, "global_step": 183591, "epoch": 1517} {"train_loss": -39.99171829223633, "global_step": 183592, "epoch": 1517} {"train_loss": -40.03220748901367, "global_step": 183593, "epoch": 1517} {"train_loss": -40.168556213378906, "global_step": 183594, "epoch": 1517} {"train_loss": -40.564369201660156, "global_step": 183595, "epoch": 1517} {"train_loss": -40.292720794677734, "global_step": 183596, "epoch": 1517} {"train_loss": -40.950740814208984, "global_step": 183597, "epoch": 1517} {"train_loss": -40.62128448486328, "global_step": 183598, "epoch": 1517} {"train_loss": -41.519073486328125, "global_step": 183599, "epoch": 1517} {"train_loss": -41.051998138427734, "global_step": 183600, "epoch": 1517} {"train_loss": -40.87113571166992, "global_step": 183601, "epoch": 1517} {"train_loss": -40.94816207885742, "global_step": 183602, "epoch": 1517} {"train_loss": -41.31256866455078, "global_step": 183603, "epoch": 1517} {"train_loss": -41.09260559082031, "global_step": 183604, "epoch": 1517} {"train_loss": -41.64226150512695, "global_step": 183605, "epoch": 1517} {"train_loss": -40.77666473388672, "global_step": 183606, "epoch": 1517} {"train_loss": -40.65887451171875, "global_step": 183607, "epoch": 1517} {"train_loss": -41.473575592041016, "global_step": 183608, "epoch": 1517} {"train_loss": -41.291839599609375, "global_step": 183609, "epoch": 1517} {"train_loss": -41.74542236328125, "global_step": 183610, "epoch": 1517} {"train_loss": -41.59846878051758, "global_step": 183611, "epoch": 1517} {"train_loss": -41.07868576049805, "global_step": 183612, "epoch": 1517} {"train_loss": -41.31745529174805, "global_step": 183613, "epoch": 1517} {"train_loss": -41.19729232788086, "global_step": 183614, "epoch": 1517} {"train_loss": -41.91543197631836, "global_step": 183615, "epoch": 1517} {"train_loss": -41.91838836669922, "global_step": 183616, "epoch": 1517} {"train_loss": -41.84465408325195, "global_step": 183617, "epoch": 1517} {"train_loss": -41.38834762573242, "global_step": 183618, "epoch": 1517} {"train_loss": -41.88581085205078, "global_step": 183619, "epoch": 1517} {"train_loss": -41.6285514831543, "global_step": 183620, "epoch": 1517} {"train_loss": -41.88810348510742, "global_step": 183621, "epoch": 1517} {"train_loss": -41.320770263671875, "global_step": 183622, "epoch": 1517} {"train_loss": -41.58312225341797, "global_step": 183623, "epoch": 1517} {"train_loss": -42.01215744018555, "global_step": 183624, "epoch": 1517} {"train_loss": -41.92761993408203, "global_step": 183625, "epoch": 1517} {"train_loss": -41.87507629394531, "global_step": 183626, "epoch": 1517} {"train_loss": -42.03657150268555, "global_step": 183627, "epoch": 1517} {"train_loss": -41.697505950927734, "global_step": 183628, "epoch": 1517} {"train_loss": -42.02273178100586, "global_step": 183629, "epoch": 1517} {"train_loss": -41.89470291137695, "global_step": 183630, "epoch": 1517} {"train_loss": -42.278255462646484, "global_step": 183631, "epoch": 1517} {"train_loss": -41.481727600097656, "global_step": 183632, "epoch": 1517} {"train_loss": -41.750396728515625, "global_step": 183633, "epoch": 1517} {"train_loss": -41.515777587890625, "global_step": 183634, "epoch": 1517} {"train_loss": -41.0842399597168, "global_step": 183635, "epoch": 1517} {"train_loss": -41.69829177856445, "global_step": 183636, "epoch": 1517} {"train_loss": -41.9864501953125, "global_step": 183637, "epoch": 1517} {"train_loss": -37.774261474609375, "global_step": 183638, "epoch": 1517} {"train_loss": -42.12630844116211, "global_step": 183639, "epoch": 1517} {"train_loss": -41.029052734375, "global_step": 183640, "epoch": 1517} {"train_loss": -41.62559127807617, "global_step": 183641, "epoch": 1517} {"train_loss": -41.65365219116211, "global_step": 183642, "epoch": 1517} {"train_loss": -42.09743118286133, "global_step": 183643, "epoch": 1517} {"train_loss": -41.46187210083008, "global_step": 183644, "epoch": 1517} {"train_loss": -41.808937072753906, "global_step": 183645, "epoch": 1517} {"train_loss": -42.540794372558594, "global_step": 183646, "epoch": 1517} {"train_loss": -41.099884033203125, "global_step": 183647, "epoch": 1517} {"train_loss": -41.27909469604492, "global_step": 183648, "epoch": 1517} {"train_loss": -38.287139892578125, "global_step": 183649, "epoch": 1517} {"train_loss": -41.050968170166016, "global_step": 183650, "epoch": 1517} {"train_loss": -38.9742431640625, "global_step": 183651, "epoch": 1517} {"train_loss": -38.109954833984375, "global_step": 183652, "epoch": 1517} {"train_loss": -40.135250091552734, "global_step": 183653, "epoch": 1517} {"train_loss": -39.384620666503906, "global_step": 183654, "epoch": 1517} {"train_loss": -40.12343215942383, "global_step": 183655, "epoch": 1517} {"train_loss": -39.110328674316406, "global_step": 183656, "epoch": 1517} {"train_loss": -36.8409309387207, "global_step": 183657, "epoch": 1517} {"train_loss": -32.79264450073242, "global_step": 183658, "epoch": 1517} {"train_loss": -35.74067306518555, "global_step": 183659, "epoch": 1517} {"train_loss": -32.284210205078125, "global_step": 183660, "epoch": 1517} {"train_loss": -29.759313583374023, "global_step": 183661, "epoch": 1517} {"train_loss": -37.315093994140625, "global_step": 183662, "epoch": 1517} {"train_loss": -39.22792053222656, "global_step": 183663, "epoch": 1517} {"train_loss": -37.05221176147461, "global_step": 183664, "epoch": 1517} {"train_loss": -36.740699768066406, "global_step": 183665, "epoch": 1517} {"train_loss": -40.039119720458984, "global_step": 183666, "epoch": 1517} {"train_loss": -36.039161682128906, "global_step": 183667, "epoch": 1517} {"train_loss": -39.36124801635742, "global_step": 183668, "epoch": 1517} {"train_loss": -36.65532684326172, "global_step": 183669, "epoch": 1517} {"train_loss": -37.972312927246094, "global_step": 183670, "epoch": 1517} {"train_loss": -38.87232208251953, "global_step": 183671, "epoch": 1517} {"train_loss": -38.10541534423828, "global_step": 183672, "epoch": 1517} {"train_loss": -39.049720764160156, "global_step": 183673, "epoch": 1517} {"train_loss": -38.81903839111328, "global_step": 183674, "epoch": 1517} {"train_loss": -39.63336181640625, "global_step": 183675, "epoch": 1517} {"train_loss": -38.56649398803711, "global_step": 183676, "epoch": 1517} {"train_loss": -39.972422938701534, "global_step": 183677, "epoch": 1517, "val_loss": 2681069.25} {"train_loss": -38.64919662475586, "global_step": 183678, "epoch": 1518} {"train_loss": -39.5773811340332, "global_step": 183679, "epoch": 1518} {"train_loss": -38.72939682006836, "global_step": 183680, "epoch": 1518} {"train_loss": -40.10213088989258, "global_step": 183681, "epoch": 1518} {"train_loss": -38.93459701538086, "global_step": 183682, "epoch": 1518} {"train_loss": -40.32844924926758, "global_step": 183683, "epoch": 1518} {"train_loss": -38.70486068725586, "global_step": 183684, "epoch": 1518} {"train_loss": -40.129058837890625, "global_step": 183685, "epoch": 1518} {"train_loss": -39.42690658569336, "global_step": 183686, "epoch": 1518} {"train_loss": -39.7967529296875, "global_step": 183687, "epoch": 1518} {"train_loss": -38.724700927734375, "global_step": 183688, "epoch": 1518} {"train_loss": -39.747657775878906, "global_step": 183689, "epoch": 1518} {"train_loss": -40.154476165771484, "global_step": 183690, "epoch": 1518} {"train_loss": -39.81964874267578, "global_step": 183691, "epoch": 1518} {"train_loss": -39.41632843017578, "global_step": 183692, "epoch": 1518} {"train_loss": -40.33103561401367, "global_step": 183693, "epoch": 1518} {"train_loss": -40.06700134277344, "global_step": 183694, "epoch": 1518} {"train_loss": -39.487545013427734, "global_step": 183695, "epoch": 1518} {"train_loss": -41.16638946533203, "global_step": 183696, "epoch": 1518} {"train_loss": -40.60903549194336, "global_step": 183697, "epoch": 1518} {"train_loss": -40.24650955200195, "global_step": 183698, "epoch": 1518} {"train_loss": -40.978118896484375, "global_step": 183699, "epoch": 1518} {"train_loss": -38.50556564331055, "global_step": 183700, "epoch": 1518} {"train_loss": -40.175559997558594, "global_step": 183701, "epoch": 1518} {"train_loss": -40.97617721557617, "global_step": 183702, "epoch": 1518} {"train_loss": -37.223690032958984, "global_step": 183703, "epoch": 1518} {"train_loss": -40.45939636230469, "global_step": 183704, "epoch": 1518} {"train_loss": -40.62372589111328, "global_step": 183705, "epoch": 1518} {"train_loss": -38.85006332397461, "global_step": 183706, "epoch": 1518} {"train_loss": -40.406185150146484, "global_step": 183707, "epoch": 1518} {"train_loss": -41.14045715332031, "global_step": 183708, "epoch": 1518} {"train_loss": -40.50661849975586, "global_step": 183709, "epoch": 1518} {"train_loss": -36.45732498168945, "global_step": 183710, "epoch": 1518} {"train_loss": -38.300106048583984, "global_step": 183711, "epoch": 1518} {"train_loss": -40.182029724121094, "global_step": 183712, "epoch": 1518} {"train_loss": -40.766761779785156, "global_step": 183713, "epoch": 1518} {"train_loss": -40.7476806640625, "global_step": 183714, "epoch": 1518} {"train_loss": -39.74034118652344, "global_step": 183715, "epoch": 1518} {"train_loss": -40.36202621459961, "global_step": 183716, "epoch": 1518} {"train_loss": -39.43137741088867, "global_step": 183717, "epoch": 1518} {"train_loss": -40.79677200317383, "global_step": 183718, "epoch": 1518} {"train_loss": -39.36753463745117, "global_step": 183719, "epoch": 1518} {"train_loss": -41.315120697021484, "global_step": 183720, "epoch": 1518} {"train_loss": -40.954444885253906, "global_step": 183721, "epoch": 1518} {"train_loss": -40.71381378173828, "global_step": 183722, "epoch": 1518} {"train_loss": -40.175086975097656, "global_step": 183723, "epoch": 1518} {"train_loss": -40.637821197509766, "global_step": 183724, "epoch": 1518} {"train_loss": -40.27659606933594, "global_step": 183725, "epoch": 1518} {"train_loss": -40.522518157958984, "global_step": 183726, "epoch": 1518} {"train_loss": -41.44259262084961, "global_step": 183727, "epoch": 1518} {"train_loss": -39.992828369140625, "global_step": 183728, "epoch": 1518} {"train_loss": -40.37254333496094, "global_step": 183729, "epoch": 1518} {"train_loss": -41.46015548706055, "global_step": 183730, "epoch": 1518} {"train_loss": -40.91666030883789, "global_step": 183731, "epoch": 1518} {"train_loss": -41.616310119628906, "global_step": 183732, "epoch": 1518} {"train_loss": -38.269283294677734, "global_step": 183733, "epoch": 1518} {"train_loss": -38.835350036621094, "global_step": 183734, "epoch": 1518} {"train_loss": -40.328826904296875, "global_step": 183735, "epoch": 1518} {"train_loss": -40.2376823425293, "global_step": 183736, "epoch": 1518} {"train_loss": -39.632789611816406, "global_step": 183737, "epoch": 1518} {"train_loss": -40.96228790283203, "global_step": 183738, "epoch": 1518} {"train_loss": -39.317138671875, "global_step": 183739, "epoch": 1518} {"train_loss": -40.02947998046875, "global_step": 183740, "epoch": 1518} {"train_loss": -39.9912223815918, "global_step": 183741, "epoch": 1518} {"train_loss": -41.35349655151367, "global_step": 183742, "epoch": 1518} {"train_loss": -40.78589630126953, "global_step": 183743, "epoch": 1518} {"train_loss": -40.81319046020508, "global_step": 183744, "epoch": 1518} {"train_loss": -41.249446868896484, "global_step": 183745, "epoch": 1518} {"train_loss": -41.06405258178711, "global_step": 183746, "epoch": 1518} {"train_loss": -39.54977035522461, "global_step": 183747, "epoch": 1518} {"train_loss": -40.80828857421875, "global_step": 183748, "epoch": 1518} {"train_loss": -41.51279830932617, "global_step": 183749, "epoch": 1518} {"train_loss": -40.23458480834961, "global_step": 183750, "epoch": 1518} {"train_loss": -40.790748596191406, "global_step": 183751, "epoch": 1518} {"train_loss": -41.472530364990234, "global_step": 183752, "epoch": 1518} {"train_loss": -40.84733200073242, "global_step": 183753, "epoch": 1518} {"train_loss": -40.80320358276367, "global_step": 183754, "epoch": 1518} {"train_loss": -41.77363204956055, "global_step": 183755, "epoch": 1518} {"train_loss": -41.69762420654297, "global_step": 183756, "epoch": 1518} {"train_loss": -41.286434173583984, "global_step": 183757, "epoch": 1518} {"train_loss": -40.42399978637695, "global_step": 183758, "epoch": 1518} {"train_loss": -40.60246658325195, "global_step": 183759, "epoch": 1518} {"train_loss": -41.18386459350586, "global_step": 183760, "epoch": 1518} {"train_loss": -41.22509765625, "global_step": 183761, "epoch": 1518} {"train_loss": -41.526588439941406, "global_step": 183762, "epoch": 1518} {"train_loss": -40.64268493652344, "global_step": 183763, "epoch": 1518} {"train_loss": -40.542724609375, "global_step": 183764, "epoch": 1518} {"train_loss": -40.72015380859375, "global_step": 183765, "epoch": 1518} {"train_loss": -41.672950744628906, "global_step": 183766, "epoch": 1518} {"train_loss": -39.316314697265625, "global_step": 183767, "epoch": 1518} {"train_loss": -40.80389404296875, "global_step": 183768, "epoch": 1518} {"train_loss": -40.940364837646484, "global_step": 183769, "epoch": 1518} {"train_loss": -40.01509094238281, "global_step": 183770, "epoch": 1518} {"train_loss": -41.04311752319336, "global_step": 183771, "epoch": 1518} {"train_loss": -40.6680908203125, "global_step": 183772, "epoch": 1518} {"train_loss": -39.14344787597656, "global_step": 183773, "epoch": 1518} {"train_loss": -40.92688751220703, "global_step": 183774, "epoch": 1518} {"train_loss": -41.3291130065918, "global_step": 183775, "epoch": 1518} {"train_loss": -41.35207748413086, "global_step": 183776, "epoch": 1518} {"train_loss": -40.67705154418945, "global_step": 183777, "epoch": 1518} {"train_loss": -40.964176177978516, "global_step": 183778, "epoch": 1518} {"train_loss": -41.59539794921875, "global_step": 183779, "epoch": 1518} {"train_loss": -39.98142623901367, "global_step": 183780, "epoch": 1518} {"train_loss": -41.54913330078125, "global_step": 183781, "epoch": 1518} {"train_loss": -41.61735534667969, "global_step": 183782, "epoch": 1518} {"train_loss": -41.50764083862305, "global_step": 183783, "epoch": 1518} {"train_loss": -40.59708786010742, "global_step": 183784, "epoch": 1518} {"train_loss": -40.909950256347656, "global_step": 183785, "epoch": 1518} {"train_loss": -41.97700119018555, "global_step": 183786, "epoch": 1518} {"train_loss": -40.75600051879883, "global_step": 183787, "epoch": 1518} {"train_loss": -39.941749572753906, "global_step": 183788, "epoch": 1518} {"train_loss": -37.37146759033203, "global_step": 183789, "epoch": 1518} {"train_loss": -39.58186721801758, "global_step": 183790, "epoch": 1518} {"train_loss": -40.985164642333984, "global_step": 183791, "epoch": 1518} {"train_loss": -38.78779983520508, "global_step": 183792, "epoch": 1518} {"train_loss": -41.5345573425293, "global_step": 183793, "epoch": 1518} {"train_loss": -38.647735595703125, "global_step": 183794, "epoch": 1518} {"train_loss": -40.75505447387695, "global_step": 183795, "epoch": 1518} {"train_loss": -40.28123092651367, "global_step": 183796, "epoch": 1518} {"train_loss": -39.339324951171875, "global_step": 183797, "epoch": 1518} {"train_loss": -40.31728993565583, "global_step": 183798, "epoch": 1518, "val_loss": 2713130.0} {"train_loss": -41.027400970458984, "global_step": 183799, "epoch": 1519} {"train_loss": -40.95160675048828, "global_step": 183800, "epoch": 1519} {"train_loss": -39.51438522338867, "global_step": 183801, "epoch": 1519} {"train_loss": -40.27882385253906, "global_step": 183802, "epoch": 1519} {"train_loss": -41.02108383178711, "global_step": 183803, "epoch": 1519} {"train_loss": -41.374603271484375, "global_step": 183804, "epoch": 1519} {"train_loss": -41.29621124267578, "global_step": 183805, "epoch": 1519} {"train_loss": -41.296653747558594, "global_step": 183806, "epoch": 1519} {"train_loss": -40.88045120239258, "global_step": 183807, "epoch": 1519} {"train_loss": -40.73269271850586, "global_step": 183808, "epoch": 1519} {"train_loss": -39.138118743896484, "global_step": 183809, "epoch": 1519} {"train_loss": -38.15205001831055, "global_step": 183810, "epoch": 1519} {"train_loss": -39.95451736450195, "global_step": 183811, "epoch": 1519} {"train_loss": -41.90386962890625, "global_step": 183812, "epoch": 1519} {"train_loss": -39.98551559448242, "global_step": 183813, "epoch": 1519} {"train_loss": -36.965938568115234, "global_step": 183814, "epoch": 1519} {"train_loss": -40.16602325439453, "global_step": 183815, "epoch": 1519} {"train_loss": -39.64347457885742, "global_step": 183816, "epoch": 1519} {"train_loss": -40.1081657409668, "global_step": 183817, "epoch": 1519} {"train_loss": -39.8725471496582, "global_step": 183818, "epoch": 1519} {"train_loss": -40.630226135253906, "global_step": 183819, "epoch": 1519} {"train_loss": -39.51976013183594, "global_step": 183820, "epoch": 1519} {"train_loss": -39.7623291015625, "global_step": 183821, "epoch": 1519} {"train_loss": -40.76003646850586, "global_step": 183822, "epoch": 1519} {"train_loss": -38.267173767089844, "global_step": 183823, "epoch": 1519} {"train_loss": -40.10871124267578, "global_step": 183824, "epoch": 1519} {"train_loss": -41.3911247253418, "global_step": 183825, "epoch": 1519} {"train_loss": -39.236854553222656, "global_step": 183826, "epoch": 1519} {"train_loss": -39.99517822265625, "global_step": 183827, "epoch": 1519} {"train_loss": -40.89494705200195, "global_step": 183828, "epoch": 1519} {"train_loss": -41.08562469482422, "global_step": 183829, "epoch": 1519} {"train_loss": -40.1901969909668, "global_step": 183830, "epoch": 1519} {"train_loss": -41.16707992553711, "global_step": 183831, "epoch": 1519} {"train_loss": -39.757843017578125, "global_step": 183832, "epoch": 1519} {"train_loss": -40.44446563720703, "global_step": 183833, "epoch": 1519} {"train_loss": -41.407958984375, "global_step": 183834, "epoch": 1519} {"train_loss": -41.45417785644531, "global_step": 183835, "epoch": 1519} {"train_loss": -41.33842086791992, "global_step": 183836, "epoch": 1519} {"train_loss": -40.0326042175293, "global_step": 183837, "epoch": 1519} {"train_loss": -40.593833923339844, "global_step": 183838, "epoch": 1519} {"train_loss": -40.4010124206543, "global_step": 183839, "epoch": 1519} {"train_loss": -39.575462341308594, "global_step": 183840, "epoch": 1519} {"train_loss": -38.58939743041992, "global_step": 183841, "epoch": 1519} {"train_loss": -40.6849479675293, "global_step": 183842, "epoch": 1519} {"train_loss": -39.80666732788086, "global_step": 183843, "epoch": 1519} {"train_loss": -39.269996643066406, "global_step": 183844, "epoch": 1519} {"train_loss": -39.88801956176758, "global_step": 183845, "epoch": 1519} {"train_loss": -38.29191589355469, "global_step": 183846, "epoch": 1519} {"train_loss": -40.677818298339844, "global_step": 183847, "epoch": 1519} {"train_loss": -40.002864837646484, "global_step": 183848, "epoch": 1519} {"train_loss": -39.68122100830078, "global_step": 183849, "epoch": 1519} {"train_loss": -39.7002067565918, "global_step": 183850, "epoch": 1519} {"train_loss": -41.277198791503906, "global_step": 183851, "epoch": 1519} {"train_loss": -38.306705474853516, "global_step": 183852, "epoch": 1519} {"train_loss": -38.040252685546875, "global_step": 183853, "epoch": 1519} {"train_loss": -40.58046340942383, "global_step": 183854, "epoch": 1519} {"train_loss": -41.2069206237793, "global_step": 183855, "epoch": 1519} {"train_loss": -37.224853515625, "global_step": 183856, "epoch": 1519} {"train_loss": -40.40544509887695, "global_step": 183857, "epoch": 1519} {"train_loss": -39.79314041137695, "global_step": 183858, "epoch": 1519} {"train_loss": -39.82949447631836, "global_step": 183859, "epoch": 1519} {"train_loss": -40.064117431640625, "global_step": 183860, "epoch": 1519} {"train_loss": -37.99580764770508, "global_step": 183861, "epoch": 1519} {"train_loss": -38.500221252441406, "global_step": 183862, "epoch": 1519} {"train_loss": -40.70781326293945, "global_step": 183863, "epoch": 1519} {"train_loss": -40.287010192871094, "global_step": 183864, "epoch": 1519} {"train_loss": -38.19081497192383, "global_step": 183865, "epoch": 1519} {"train_loss": -39.13909912109375, "global_step": 183866, "epoch": 1519} {"train_loss": -40.53969955444336, "global_step": 183867, "epoch": 1519} {"train_loss": -37.478755950927734, "global_step": 183868, "epoch": 1519} {"train_loss": -37.13623046875, "global_step": 183869, "epoch": 1519} {"train_loss": -39.903175354003906, "global_step": 183870, "epoch": 1519} {"train_loss": -37.4886589050293, "global_step": 183871, "epoch": 1519} {"train_loss": -37.66307067871094, "global_step": 183872, "epoch": 1519} {"train_loss": -40.026939392089844, "global_step": 183873, "epoch": 1519} {"train_loss": -39.3826789855957, "global_step": 183874, "epoch": 1519} {"train_loss": -35.86707305908203, "global_step": 183875, "epoch": 1519} {"train_loss": -38.403316497802734, "global_step": 183876, "epoch": 1519} {"train_loss": -38.12467575073242, "global_step": 183877, "epoch": 1519} {"train_loss": -38.49922561645508, "global_step": 183878, "epoch": 1519} {"train_loss": -39.50410461425781, "global_step": 183879, "epoch": 1519} {"train_loss": -38.00825119018555, "global_step": 183880, "epoch": 1519} {"train_loss": -38.21549606323242, "global_step": 183881, "epoch": 1519} {"train_loss": -39.554988861083984, "global_step": 183882, "epoch": 1519} {"train_loss": -34.670326232910156, "global_step": 183883, "epoch": 1519} {"train_loss": -38.224151611328125, "global_step": 183884, "epoch": 1519} {"train_loss": -36.33710861206055, "global_step": 183885, "epoch": 1519} {"train_loss": -38.36837387084961, "global_step": 183886, "epoch": 1519} {"train_loss": -37.68284606933594, "global_step": 183887, "epoch": 1519} {"train_loss": -37.41904830932617, "global_step": 183888, "epoch": 1519} {"train_loss": -36.64609146118164, "global_step": 183889, "epoch": 1519} {"train_loss": -38.54777908325195, "global_step": 183890, "epoch": 1519} {"train_loss": -38.67229461669922, "global_step": 183891, "epoch": 1519} {"train_loss": -37.83756637573242, "global_step": 183892, "epoch": 1519} {"train_loss": -39.09666061401367, "global_step": 183893, "epoch": 1519} {"train_loss": -38.39604949951172, "global_step": 183894, "epoch": 1519} {"train_loss": -38.80648422241211, "global_step": 183895, "epoch": 1519} {"train_loss": -34.00272750854492, "global_step": 183896, "epoch": 1519} {"train_loss": -38.72867965698242, "global_step": 183897, "epoch": 1519} {"train_loss": -38.330352783203125, "global_step": 183898, "epoch": 1519} {"train_loss": -39.5670280456543, "global_step": 183899, "epoch": 1519} {"train_loss": -33.44226837158203, "global_step": 183900, "epoch": 1519} {"train_loss": -35.72072982788086, "global_step": 183901, "epoch": 1519} {"train_loss": -36.5038948059082, "global_step": 183902, "epoch": 1519} {"train_loss": -38.14486312866211, "global_step": 183903, "epoch": 1519} {"train_loss": -33.555030822753906, "global_step": 183904, "epoch": 1519} {"train_loss": -37.69269943237305, "global_step": 183905, "epoch": 1519} {"train_loss": -36.580078125, "global_step": 183906, "epoch": 1519} {"train_loss": -37.62141036987305, "global_step": 183907, "epoch": 1519} {"train_loss": -37.679054260253906, "global_step": 183908, "epoch": 1519} {"train_loss": -37.17490768432617, "global_step": 183909, "epoch": 1519} {"train_loss": -38.472408294677734, "global_step": 183910, "epoch": 1519} {"train_loss": -37.908382415771484, "global_step": 183911, "epoch": 1519} {"train_loss": -35.19104766845703, "global_step": 183912, "epoch": 1519} {"train_loss": -37.199432373046875, "global_step": 183913, "epoch": 1519} {"train_loss": -38.556941986083984, "global_step": 183914, "epoch": 1519} {"train_loss": -34.520748138427734, "global_step": 183915, "epoch": 1519} {"train_loss": -37.92728805541992, "global_step": 183916, "epoch": 1519} {"train_loss": -36.921443939208984, "global_step": 183917, "epoch": 1519} {"train_loss": -36.94308090209961, "global_step": 183918, "epoch": 1519} {"train_loss": -38.943001140247695, "global_step": 183919, "epoch": 1519, "val_loss": 2656558.25} {"train_loss": -38.80216598510742, "global_step": 183920, "epoch": 1520} {"train_loss": -38.491973876953125, "global_step": 183921, "epoch": 1520} {"train_loss": -38.8887825012207, "global_step": 183922, "epoch": 1520} {"train_loss": -38.3848762512207, "global_step": 183923, "epoch": 1520} {"train_loss": -37.31562423706055, "global_step": 183924, "epoch": 1520} {"train_loss": -38.89857864379883, "global_step": 183925, "epoch": 1520} {"train_loss": -38.30068588256836, "global_step": 183926, "epoch": 1520} {"train_loss": -37.749019622802734, "global_step": 183927, "epoch": 1520} {"train_loss": -37.58975601196289, "global_step": 183928, "epoch": 1520} {"train_loss": -37.67047882080078, "global_step": 183929, "epoch": 1520} {"train_loss": -39.27827835083008, "global_step": 183930, "epoch": 1520} {"train_loss": -37.03392791748047, "global_step": 183931, "epoch": 1520} {"train_loss": -36.60444259643555, "global_step": 183932, "epoch": 1520} {"train_loss": -38.25145721435547, "global_step": 183933, "epoch": 1520} {"train_loss": -39.796112060546875, "global_step": 183934, "epoch": 1520} {"train_loss": -38.281368255615234, "global_step": 183935, "epoch": 1520} {"train_loss": -38.30592727661133, "global_step": 183936, "epoch": 1520} {"train_loss": -37.39136505126953, "global_step": 183937, "epoch": 1520} {"train_loss": -39.66151809692383, "global_step": 183938, "epoch": 1520} {"train_loss": -39.64686584472656, "global_step": 183939, "epoch": 1520} {"train_loss": -39.95140075683594, "global_step": 183940, "epoch": 1520} {"train_loss": -38.8388786315918, "global_step": 183941, "epoch": 1520} {"train_loss": -39.34158706665039, "global_step": 183942, "epoch": 1520} {"train_loss": -39.056640625, "global_step": 183943, "epoch": 1520} {"train_loss": -38.75728225708008, "global_step": 183944, "epoch": 1520} {"train_loss": -39.187530517578125, "global_step": 183945, "epoch": 1520} {"train_loss": -40.04280471801758, "global_step": 183946, "epoch": 1520} {"train_loss": -39.64763259887695, "global_step": 183947, "epoch": 1520} {"train_loss": -39.97359848022461, "global_step": 183948, "epoch": 1520} {"train_loss": -40.12594223022461, "global_step": 183949, "epoch": 1520} {"train_loss": -39.205379486083984, "global_step": 183950, "epoch": 1520} {"train_loss": -39.652198791503906, "global_step": 183951, "epoch": 1520} {"train_loss": -39.663875579833984, "global_step": 183952, "epoch": 1520} {"train_loss": -39.10482406616211, "global_step": 183953, "epoch": 1520} {"train_loss": -40.00858688354492, "global_step": 183954, "epoch": 1520} {"train_loss": -39.68012237548828, "global_step": 183955, "epoch": 1520} {"train_loss": -39.276329040527344, "global_step": 183956, "epoch": 1520} {"train_loss": -38.908382415771484, "global_step": 183957, "epoch": 1520} {"train_loss": -39.1041374206543, "global_step": 183958, "epoch": 1520} {"train_loss": -40.100852966308594, "global_step": 183959, "epoch": 1520} {"train_loss": -40.295936584472656, "global_step": 183960, "epoch": 1520} {"train_loss": -40.06061553955078, "global_step": 183961, "epoch": 1520} {"train_loss": -38.438507080078125, "global_step": 183962, "epoch": 1520} {"train_loss": -39.7906608581543, "global_step": 183963, "epoch": 1520} {"train_loss": -39.07698440551758, "global_step": 183964, "epoch": 1520} {"train_loss": -40.2309684753418, "global_step": 183965, "epoch": 1520} {"train_loss": -40.05351257324219, "global_step": 183966, "epoch": 1520} {"train_loss": -39.73955154418945, "global_step": 183967, "epoch": 1520} {"train_loss": -40.410369873046875, "global_step": 183968, "epoch": 1520} {"train_loss": -39.66840362548828, "global_step": 183969, "epoch": 1520} {"train_loss": -40.28812789916992, "global_step": 183970, "epoch": 1520} {"train_loss": -40.899505615234375, "global_step": 183971, "epoch": 1520} {"train_loss": -40.035430908203125, "global_step": 183972, "epoch": 1520} {"train_loss": -40.65427017211914, "global_step": 183973, "epoch": 1520} {"train_loss": -40.592830657958984, "global_step": 183974, "epoch": 1520} {"train_loss": -40.60166931152344, "global_step": 183975, "epoch": 1520} {"train_loss": -40.349578857421875, "global_step": 183976, "epoch": 1520} {"train_loss": -39.871395111083984, "global_step": 183977, "epoch": 1520} {"train_loss": -40.446197509765625, "global_step": 183978, "epoch": 1520} {"train_loss": -39.493621826171875, "global_step": 183979, "epoch": 1520} {"train_loss": -41.05046081542969, "global_step": 183980, "epoch": 1520} {"train_loss": -40.48025131225586, "global_step": 183981, "epoch": 1520} {"train_loss": -40.79010009765625, "global_step": 183982, "epoch": 1520} {"train_loss": -40.118228912353516, "global_step": 183983, "epoch": 1520} {"train_loss": -40.3594970703125, "global_step": 183984, "epoch": 1520} {"train_loss": -41.142704010009766, "global_step": 183985, "epoch": 1520} {"train_loss": -38.93101119995117, "global_step": 183986, "epoch": 1520} {"train_loss": -40.694374084472656, "global_step": 183987, "epoch": 1520} {"train_loss": -40.47174835205078, "global_step": 183988, "epoch": 1520} {"train_loss": -41.284027099609375, "global_step": 183989, "epoch": 1520} {"train_loss": -40.3858757019043, "global_step": 183990, "epoch": 1520} {"train_loss": -40.500518798828125, "global_step": 183991, "epoch": 1520} {"train_loss": -40.22084426879883, "global_step": 183992, "epoch": 1520} {"train_loss": -41.20585250854492, "global_step": 183993, "epoch": 1520} {"train_loss": -40.83045196533203, "global_step": 183994, "epoch": 1520} {"train_loss": -40.50926208496094, "global_step": 183995, "epoch": 1520} {"train_loss": -41.26422119140625, "global_step": 183996, "epoch": 1520} {"train_loss": -40.406795501708984, "global_step": 183997, "epoch": 1520} {"train_loss": -41.00815200805664, "global_step": 183998, "epoch": 1520} {"train_loss": -40.26185989379883, "global_step": 183999, "epoch": 1520} {"train_loss": -40.93328094482422, "global_step": 184000, "epoch": 1520} {"train_loss": -40.867340087890625, "global_step": 184001, "epoch": 1520} {"train_loss": -41.033138275146484, "global_step": 184002, "epoch": 1520} {"train_loss": -40.51032638549805, "global_step": 184003, "epoch": 1520} {"train_loss": -41.35650634765625, "global_step": 184004, "epoch": 1520} {"train_loss": -41.0701789855957, "global_step": 184005, "epoch": 1520} {"train_loss": -41.558616638183594, "global_step": 184006, "epoch": 1520} {"train_loss": -41.67403793334961, "global_step": 184007, "epoch": 1520} {"train_loss": -41.28121566772461, "global_step": 184008, "epoch": 1520} {"train_loss": -40.930110931396484, "global_step": 184009, "epoch": 1520} {"train_loss": -40.993324279785156, "global_step": 184010, "epoch": 1520} {"train_loss": -41.056854248046875, "global_step": 184011, "epoch": 1520} {"train_loss": -41.38587188720703, "global_step": 184012, "epoch": 1520} {"train_loss": -41.785037994384766, "global_step": 184013, "epoch": 1520} {"train_loss": -41.141998291015625, "global_step": 184014, "epoch": 1520} {"train_loss": -41.42129135131836, "global_step": 184015, "epoch": 1520} {"train_loss": -41.64250946044922, "global_step": 184016, "epoch": 1520} {"train_loss": -41.43208694458008, "global_step": 184017, "epoch": 1520} {"train_loss": -41.208370208740234, "global_step": 184018, "epoch": 1520} {"train_loss": -40.768245697021484, "global_step": 184019, "epoch": 1520} {"train_loss": -40.90143585205078, "global_step": 184020, "epoch": 1520} {"train_loss": -41.15078353881836, "global_step": 184021, "epoch": 1520} {"train_loss": -41.72543716430664, "global_step": 184022, "epoch": 1520} {"train_loss": -41.10854721069336, "global_step": 184023, "epoch": 1520} {"train_loss": -41.798709869384766, "global_step": 184024, "epoch": 1520} {"train_loss": -41.122589111328125, "global_step": 184025, "epoch": 1520} {"train_loss": -41.659976959228516, "global_step": 184026, "epoch": 1520} {"train_loss": -41.283416748046875, "global_step": 184027, "epoch": 1520} {"train_loss": -41.65371322631836, "global_step": 184028, "epoch": 1520} {"train_loss": -41.30647277832031, "global_step": 184029, "epoch": 1520} {"train_loss": -41.12567138671875, "global_step": 184030, "epoch": 1520} {"train_loss": -41.959510803222656, "global_step": 184031, "epoch": 1520} {"train_loss": -42.108375549316406, "global_step": 184032, "epoch": 1520} {"train_loss": -41.545467376708984, "global_step": 184033, "epoch": 1520} {"train_loss": -41.61265182495117, "global_step": 184034, "epoch": 1520} {"train_loss": -41.15808868408203, "global_step": 184035, "epoch": 1520} {"train_loss": -41.61885070800781, "global_step": 184036, "epoch": 1520} {"train_loss": -40.708961486816406, "global_step": 184037, "epoch": 1520} {"train_loss": -41.38389587402344, "global_step": 184038, "epoch": 1520} {"train_loss": -41.53251647949219, "global_step": 184039, "epoch": 1520} {"train_loss": -40.17530687190285, "global_step": 184040, "epoch": 1520, "val_loss": 2744342.5} {"train_loss": -39.79899215698242, "global_step": 184041, "epoch": 1521} {"train_loss": -38.37982940673828, "global_step": 184042, "epoch": 1521} {"train_loss": -34.77131271362305, "global_step": 184043, "epoch": 1521} {"train_loss": -31.11317253112793, "global_step": 184044, "epoch": 1521} {"train_loss": -20.016319274902344, "global_step": 184045, "epoch": 1521} {"train_loss": -13.404437065124512, "global_step": 184046, "epoch": 1521} {"train_loss": -29.586095809936523, "global_step": 184047, "epoch": 1521} {"train_loss": -33.41420364379883, "global_step": 184048, "epoch": 1521} {"train_loss": -35.05942153930664, "global_step": 184049, "epoch": 1521} {"train_loss": -37.86201858520508, "global_step": 184050, "epoch": 1521} {"train_loss": -34.58172607421875, "global_step": 184051, "epoch": 1521} {"train_loss": -35.4605598449707, "global_step": 184052, "epoch": 1521} {"train_loss": -36.40300750732422, "global_step": 184053, "epoch": 1521} {"train_loss": -35.25472640991211, "global_step": 184054, "epoch": 1521} {"train_loss": -36.2440185546875, "global_step": 184055, "epoch": 1521} {"train_loss": -35.7900505065918, "global_step": 184056, "epoch": 1521} {"train_loss": -36.270477294921875, "global_step": 184057, "epoch": 1521} {"train_loss": -37.22270202636719, "global_step": 184058, "epoch": 1521} {"train_loss": -36.97388458251953, "global_step": 184059, "epoch": 1521} {"train_loss": -37.02402877807617, "global_step": 184060, "epoch": 1521} {"train_loss": -38.932891845703125, "global_step": 184061, "epoch": 1521} {"train_loss": -38.708370208740234, "global_step": 184062, "epoch": 1521} {"train_loss": -38.06884765625, "global_step": 184063, "epoch": 1521} {"train_loss": -38.750038146972656, "global_step": 184064, "epoch": 1521} {"train_loss": -37.22272872924805, "global_step": 184065, "epoch": 1521} {"train_loss": -37.88751983642578, "global_step": 184066, "epoch": 1521} {"train_loss": -37.86163330078125, "global_step": 184067, "epoch": 1521} {"train_loss": -37.97467803955078, "global_step": 184068, "epoch": 1521} {"train_loss": -39.55281448364258, "global_step": 184069, "epoch": 1521} {"train_loss": -39.94110107421875, "global_step": 184070, "epoch": 1521} {"train_loss": -39.333187103271484, "global_step": 184071, "epoch": 1521} {"train_loss": -39.739070892333984, "global_step": 184072, "epoch": 1521} {"train_loss": -37.72220993041992, "global_step": 184073, "epoch": 1521} {"train_loss": -39.23886489868164, "global_step": 184074, "epoch": 1521} {"train_loss": -39.51823425292969, "global_step": 184075, "epoch": 1521} {"train_loss": -39.70547866821289, "global_step": 184076, "epoch": 1521} {"train_loss": -39.17803955078125, "global_step": 184077, "epoch": 1521} {"train_loss": -39.6047248840332, "global_step": 184078, "epoch": 1521} {"train_loss": -39.6044921875, "global_step": 184079, "epoch": 1521} {"train_loss": -39.56855010986328, "global_step": 184080, "epoch": 1521} {"train_loss": -38.52887725830078, "global_step": 184081, "epoch": 1521} {"train_loss": -39.103240966796875, "global_step": 184082, "epoch": 1521} {"train_loss": -39.011043548583984, "global_step": 184083, "epoch": 1521} {"train_loss": -39.13993453979492, "global_step": 184084, "epoch": 1521} {"train_loss": -40.00857162475586, "global_step": 184085, "epoch": 1521} {"train_loss": -40.274993896484375, "global_step": 184086, "epoch": 1521} {"train_loss": -39.05833053588867, "global_step": 184087, "epoch": 1521} {"train_loss": -39.748199462890625, "global_step": 184088, "epoch": 1521} {"train_loss": -40.15717315673828, "global_step": 184089, "epoch": 1521} {"train_loss": -39.527767181396484, "global_step": 184090, "epoch": 1521} {"train_loss": -39.26293182373047, "global_step": 184091, "epoch": 1521} {"train_loss": -39.17974090576172, "global_step": 184092, "epoch": 1521} {"train_loss": -39.719764709472656, "global_step": 184093, "epoch": 1521} {"train_loss": -40.12677001953125, "global_step": 184094, "epoch": 1521} {"train_loss": -39.60479736328125, "global_step": 184095, "epoch": 1521} {"train_loss": -38.676727294921875, "global_step": 184096, "epoch": 1521} {"train_loss": -40.13576126098633, "global_step": 184097, "epoch": 1521} {"train_loss": -39.91789245605469, "global_step": 184098, "epoch": 1521} {"train_loss": -39.700069427490234, "global_step": 184099, "epoch": 1521} {"train_loss": -40.21970748901367, "global_step": 184100, "epoch": 1521} {"train_loss": -40.21035385131836, "global_step": 184101, "epoch": 1521} {"train_loss": -40.30611038208008, "global_step": 184102, "epoch": 1521} {"train_loss": -35.601531982421875, "global_step": 184103, "epoch": 1521} {"train_loss": -39.13641357421875, "global_step": 184104, "epoch": 1521} {"train_loss": -39.45449447631836, "global_step": 184105, "epoch": 1521} {"train_loss": -40.254920959472656, "global_step": 184106, "epoch": 1521} {"train_loss": -35.36232376098633, "global_step": 184107, "epoch": 1521} {"train_loss": -40.701515197753906, "global_step": 184108, "epoch": 1521} {"train_loss": -40.333778381347656, "global_step": 184109, "epoch": 1521} {"train_loss": -40.442928314208984, "global_step": 184110, "epoch": 1521} {"train_loss": -39.3389892578125, "global_step": 184111, "epoch": 1521} {"train_loss": -40.302799224853516, "global_step": 184112, "epoch": 1521} {"train_loss": -38.84597396850586, "global_step": 184113, "epoch": 1521} {"train_loss": -40.169898986816406, "global_step": 184114, "epoch": 1521} {"train_loss": -39.365901947021484, "global_step": 184115, "epoch": 1521} {"train_loss": -39.9670524597168, "global_step": 184116, "epoch": 1521} {"train_loss": -39.2523078918457, "global_step": 184117, "epoch": 1521} {"train_loss": -39.39551544189453, "global_step": 184118, "epoch": 1521} {"train_loss": -40.617828369140625, "global_step": 184119, "epoch": 1521} {"train_loss": -40.23246765136719, "global_step": 184120, "epoch": 1521} {"train_loss": -40.563018798828125, "global_step": 184121, "epoch": 1521} {"train_loss": -39.86743927001953, "global_step": 184122, "epoch": 1521} {"train_loss": -40.6131477355957, "global_step": 184123, "epoch": 1521} {"train_loss": -40.102821350097656, "global_step": 184124, "epoch": 1521} {"train_loss": -40.64776611328125, "global_step": 184125, "epoch": 1521} {"train_loss": -38.71547317504883, "global_step": 184126, "epoch": 1521} {"train_loss": -38.80297088623047, "global_step": 184127, "epoch": 1521} {"train_loss": -39.92323303222656, "global_step": 184128, "epoch": 1521} {"train_loss": -40.499427795410156, "global_step": 184129, "epoch": 1521} {"train_loss": -40.17594528198242, "global_step": 184130, "epoch": 1521} {"train_loss": -39.951316833496094, "global_step": 184131, "epoch": 1521} {"train_loss": -39.90558624267578, "global_step": 184132, "epoch": 1521} {"train_loss": -40.325557708740234, "global_step": 184133, "epoch": 1521} {"train_loss": -40.2883415222168, "global_step": 184134, "epoch": 1521} {"train_loss": -40.872615814208984, "global_step": 184135, "epoch": 1521} {"train_loss": -40.117431640625, "global_step": 184136, "epoch": 1521} {"train_loss": -40.61947250366211, "global_step": 184137, "epoch": 1521} {"train_loss": -41.03022384643555, "global_step": 184138, "epoch": 1521} {"train_loss": -40.00006866455078, "global_step": 184139, "epoch": 1521} {"train_loss": -39.91669845581055, "global_step": 184140, "epoch": 1521} {"train_loss": -39.58274459838867, "global_step": 184141, "epoch": 1521} {"train_loss": -41.14102554321289, "global_step": 184142, "epoch": 1521} {"train_loss": -40.42384719848633, "global_step": 184143, "epoch": 1521} {"train_loss": -40.60563278198242, "global_step": 184144, "epoch": 1521} {"train_loss": -41.34344482421875, "global_step": 184145, "epoch": 1521} {"train_loss": -41.02669143676758, "global_step": 184146, "epoch": 1521} {"train_loss": -40.503204345703125, "global_step": 184147, "epoch": 1521} {"train_loss": -40.46994400024414, "global_step": 184148, "epoch": 1521} {"train_loss": -41.07263946533203, "global_step": 184149, "epoch": 1521} {"train_loss": -40.12008285522461, "global_step": 184150, "epoch": 1521} {"train_loss": -40.680145263671875, "global_step": 184151, "epoch": 1521} {"train_loss": -41.27117919921875, "global_step": 184152, "epoch": 1521} {"train_loss": -41.23855209350586, "global_step": 184153, "epoch": 1521} {"train_loss": -41.16876220703125, "global_step": 184154, "epoch": 1521} {"train_loss": -41.56629180908203, "global_step": 184155, "epoch": 1521} {"train_loss": -40.76786422729492, "global_step": 184156, "epoch": 1521} {"train_loss": -41.27685546875, "global_step": 184157, "epoch": 1521} {"train_loss": -40.05572509765625, "global_step": 184158, "epoch": 1521} {"train_loss": -41.002601623535156, "global_step": 184159, "epoch": 1521} {"train_loss": -40.89697265625, "global_step": 184160, "epoch": 1521} {"train_loss": -38.7786372712821, "global_step": 184161, "epoch": 1521, "val_loss": 2702942.25} {"train_loss": -41.067047119140625, "global_step": 184162, "epoch": 1522} {"train_loss": -41.14911651611328, "global_step": 184163, "epoch": 1522} {"train_loss": -41.480167388916016, "global_step": 184164, "epoch": 1522} {"train_loss": -40.67930603027344, "global_step": 184165, "epoch": 1522} {"train_loss": -40.99690628051758, "global_step": 184166, "epoch": 1522} {"train_loss": -41.560882568359375, "global_step": 184167, "epoch": 1522} {"train_loss": -41.22242736816406, "global_step": 184168, "epoch": 1522} {"train_loss": -40.8386116027832, "global_step": 184169, "epoch": 1522} {"train_loss": -40.4399299621582, "global_step": 184170, "epoch": 1522} {"train_loss": -37.667694091796875, "global_step": 184171, "epoch": 1522} {"train_loss": -40.5308837890625, "global_step": 184172, "epoch": 1522} {"train_loss": -41.47309112548828, "global_step": 184173, "epoch": 1522} {"train_loss": -41.65193557739258, "global_step": 184174, "epoch": 1522} {"train_loss": -40.581024169921875, "global_step": 184175, "epoch": 1522} {"train_loss": -37.94944381713867, "global_step": 184176, "epoch": 1522} {"train_loss": -41.24118423461914, "global_step": 184177, "epoch": 1522} {"train_loss": -41.33890914916992, "global_step": 184178, "epoch": 1522} {"train_loss": -41.56401443481445, "global_step": 184179, "epoch": 1522} {"train_loss": -41.72268295288086, "global_step": 184180, "epoch": 1522} {"train_loss": -41.85768127441406, "global_step": 184181, "epoch": 1522} {"train_loss": -41.260169982910156, "global_step": 184182, "epoch": 1522} {"train_loss": -41.44926071166992, "global_step": 184183, "epoch": 1522} {"train_loss": -41.86857986450195, "global_step": 184184, "epoch": 1522} {"train_loss": -41.363006591796875, "global_step": 184185, "epoch": 1522} {"train_loss": -41.1624870300293, "global_step": 184186, "epoch": 1522} {"train_loss": -41.67025375366211, "global_step": 184187, "epoch": 1522} {"train_loss": -41.584266662597656, "global_step": 184188, "epoch": 1522} {"train_loss": -41.748634338378906, "global_step": 184189, "epoch": 1522} {"train_loss": -41.7591667175293, "global_step": 184190, "epoch": 1522} {"train_loss": -41.565521240234375, "global_step": 184191, "epoch": 1522} {"train_loss": -41.420166015625, "global_step": 184192, "epoch": 1522} {"train_loss": -41.551597595214844, "global_step": 184193, "epoch": 1522} {"train_loss": -40.27689743041992, "global_step": 184194, "epoch": 1522} {"train_loss": -41.85303497314453, "global_step": 184195, "epoch": 1522} {"train_loss": -41.26581573486328, "global_step": 184196, "epoch": 1522} {"train_loss": -42.07436752319336, "global_step": 184197, "epoch": 1522} {"train_loss": -41.65853500366211, "global_step": 184198, "epoch": 1522} {"train_loss": -42.030921936035156, "global_step": 184199, "epoch": 1522} {"train_loss": -41.8546028137207, "global_step": 184200, "epoch": 1522} {"train_loss": -41.47397232055664, "global_step": 184201, "epoch": 1522} {"train_loss": -40.831298828125, "global_step": 184202, "epoch": 1522} {"train_loss": -39.228824615478516, "global_step": 184203, "epoch": 1522} {"train_loss": -36.93453598022461, "global_step": 184204, "epoch": 1522} {"train_loss": -34.4222412109375, "global_step": 184205, "epoch": 1522} {"train_loss": -31.47163200378418, "global_step": 184206, "epoch": 1522} {"train_loss": -33.75642776489258, "global_step": 184207, "epoch": 1522} {"train_loss": -40.01923751831055, "global_step": 184208, "epoch": 1522} {"train_loss": -38.65229415893555, "global_step": 184209, "epoch": 1522} {"train_loss": -36.073089599609375, "global_step": 184210, "epoch": 1522} {"train_loss": -37.044883728027344, "global_step": 184211, "epoch": 1522} {"train_loss": -40.69578552246094, "global_step": 184212, "epoch": 1522} {"train_loss": -38.498695373535156, "global_step": 184213, "epoch": 1522} {"train_loss": -37.6892204284668, "global_step": 184214, "epoch": 1522} {"train_loss": -39.70185089111328, "global_step": 184215, "epoch": 1522} {"train_loss": -38.31031036376953, "global_step": 184216, "epoch": 1522} {"train_loss": -40.033329010009766, "global_step": 184217, "epoch": 1522} {"train_loss": -38.50520706176758, "global_step": 184218, "epoch": 1522} {"train_loss": -38.917755126953125, "global_step": 184219, "epoch": 1522} {"train_loss": -40.46800994873047, "global_step": 184220, "epoch": 1522} {"train_loss": -38.600746154785156, "global_step": 184221, "epoch": 1522} {"train_loss": -40.00602722167969, "global_step": 184222, "epoch": 1522} {"train_loss": -39.63969039916992, "global_step": 184223, "epoch": 1522} {"train_loss": -40.51595687866211, "global_step": 184224, "epoch": 1522} {"train_loss": -38.59931945800781, "global_step": 184225, "epoch": 1522} {"train_loss": -39.97098922729492, "global_step": 184226, "epoch": 1522} {"train_loss": -39.17337417602539, "global_step": 184227, "epoch": 1522} {"train_loss": -40.28104019165039, "global_step": 184228, "epoch": 1522} {"train_loss": -38.779754638671875, "global_step": 184229, "epoch": 1522} {"train_loss": -39.38600158691406, "global_step": 184230, "epoch": 1522} {"train_loss": -37.45293045043945, "global_step": 184231, "epoch": 1522} {"train_loss": -37.62090301513672, "global_step": 184232, "epoch": 1522} {"train_loss": -38.22855758666992, "global_step": 184233, "epoch": 1522} {"train_loss": -38.17057418823242, "global_step": 184234, "epoch": 1522} {"train_loss": -37.646114349365234, "global_step": 184235, "epoch": 1522} {"train_loss": -38.78960037231445, "global_step": 184236, "epoch": 1522} {"train_loss": -38.15260314941406, "global_step": 184237, "epoch": 1522} {"train_loss": -38.51575469970703, "global_step": 184238, "epoch": 1522} {"train_loss": -37.85067367553711, "global_step": 184239, "epoch": 1522} {"train_loss": -39.48866653442383, "global_step": 184240, "epoch": 1522} {"train_loss": -39.709266662597656, "global_step": 184241, "epoch": 1522} {"train_loss": -39.7126579284668, "global_step": 184242, "epoch": 1522} {"train_loss": -40.835140228271484, "global_step": 184243, "epoch": 1522} {"train_loss": -39.34337615966797, "global_step": 184244, "epoch": 1522} {"train_loss": -40.58221435546875, "global_step": 184245, "epoch": 1522} {"train_loss": -39.649147033691406, "global_step": 184246, "epoch": 1522} {"train_loss": -39.768714904785156, "global_step": 184247, "epoch": 1522} {"train_loss": -40.61616134643555, "global_step": 184248, "epoch": 1522} {"train_loss": -39.66122055053711, "global_step": 184249, "epoch": 1522} {"train_loss": -39.189945220947266, "global_step": 184250, "epoch": 1522} {"train_loss": -40.8501091003418, "global_step": 184251, "epoch": 1522} {"train_loss": -40.46413803100586, "global_step": 184252, "epoch": 1522} {"train_loss": -39.41891098022461, "global_step": 184253, "epoch": 1522} {"train_loss": -39.81909942626953, "global_step": 184254, "epoch": 1522} {"train_loss": -40.34552764892578, "global_step": 184255, "epoch": 1522} {"train_loss": -40.470096588134766, "global_step": 184256, "epoch": 1522} {"train_loss": -40.583187103271484, "global_step": 184257, "epoch": 1522} {"train_loss": -41.10102081298828, "global_step": 184258, "epoch": 1522} {"train_loss": -41.22159957885742, "global_step": 184259, "epoch": 1522} {"train_loss": -40.92745590209961, "global_step": 184260, "epoch": 1522} {"train_loss": -40.78519821166992, "global_step": 184261, "epoch": 1522} {"train_loss": -41.3476448059082, "global_step": 184262, "epoch": 1522} {"train_loss": -41.027130126953125, "global_step": 184263, "epoch": 1522} {"train_loss": -41.06919860839844, "global_step": 184264, "epoch": 1522} {"train_loss": -41.20164108276367, "global_step": 184265, "epoch": 1522} {"train_loss": -39.98047637939453, "global_step": 184266, "epoch": 1522} {"train_loss": -41.59450912475586, "global_step": 184267, "epoch": 1522} {"train_loss": -41.29021072387695, "global_step": 184268, "epoch": 1522} {"train_loss": -40.98643112182617, "global_step": 184269, "epoch": 1522} {"train_loss": -40.992671966552734, "global_step": 184270, "epoch": 1522} {"train_loss": -41.37592697143555, "global_step": 184271, "epoch": 1522} {"train_loss": -40.00031280517578, "global_step": 184272, "epoch": 1522} {"train_loss": -39.42842102050781, "global_step": 184273, "epoch": 1522} {"train_loss": -41.54865264892578, "global_step": 184274, "epoch": 1522} {"train_loss": -41.419185638427734, "global_step": 184275, "epoch": 1522} {"train_loss": -41.46935272216797, "global_step": 184276, "epoch": 1522} {"train_loss": -41.86481857299805, "global_step": 184277, "epoch": 1522} {"train_loss": -41.169166564941406, "global_step": 184278, "epoch": 1522} {"train_loss": -41.19139862060547, "global_step": 184279, "epoch": 1522} {"train_loss": -41.17731857299805, "global_step": 184280, "epoch": 1522} {"train_loss": -39.95109176635742, "global_step": 184281, "epoch": 1522} {"train_loss": -40.102923133156516, "global_step": 184282, "epoch": 1522, "val_loss": 2698180.25} {"train_loss": -41.38999557495117, "global_step": 184283, "epoch": 1523} {"train_loss": -41.65961456298828, "global_step": 184284, "epoch": 1523} {"train_loss": -41.53474044799805, "global_step": 184285, "epoch": 1523} {"train_loss": -41.703243255615234, "global_step": 184286, "epoch": 1523} {"train_loss": -41.826087951660156, "global_step": 184287, "epoch": 1523} {"train_loss": -41.66776657104492, "global_step": 184288, "epoch": 1523} {"train_loss": -41.811458587646484, "global_step": 184289, "epoch": 1523} {"train_loss": -41.500587463378906, "global_step": 184290, "epoch": 1523} {"train_loss": -41.51597595214844, "global_step": 184291, "epoch": 1523} {"train_loss": -37.0421257019043, "global_step": 184292, "epoch": 1523} {"train_loss": -41.17951965332031, "global_step": 184293, "epoch": 1523} {"train_loss": -40.55083084106445, "global_step": 184294, "epoch": 1523} {"train_loss": -40.9169921875, "global_step": 184295, "epoch": 1523} {"train_loss": -41.4875373840332, "global_step": 184296, "epoch": 1523} {"train_loss": -41.42183303833008, "global_step": 184297, "epoch": 1523} {"train_loss": -38.36555480957031, "global_step": 184298, "epoch": 1523} {"train_loss": -39.257965087890625, "global_step": 184299, "epoch": 1523} {"train_loss": -38.346736907958984, "global_step": 184300, "epoch": 1523} {"train_loss": -40.21498489379883, "global_step": 184301, "epoch": 1523} {"train_loss": -39.54273223876953, "global_step": 184302, "epoch": 1523} {"train_loss": -36.591583251953125, "global_step": 184303, "epoch": 1523} {"train_loss": -35.4761962890625, "global_step": 184304, "epoch": 1523} {"train_loss": -36.76405334472656, "global_step": 184305, "epoch": 1523} {"train_loss": -39.55126953125, "global_step": 184306, "epoch": 1523} {"train_loss": -37.924617767333984, "global_step": 184307, "epoch": 1523} {"train_loss": -37.670162200927734, "global_step": 184308, "epoch": 1523} {"train_loss": -37.48956298828125, "global_step": 184309, "epoch": 1523} {"train_loss": -39.55980682373047, "global_step": 184310, "epoch": 1523} {"train_loss": -38.83879852294922, "global_step": 184311, "epoch": 1523} {"train_loss": -39.13801193237305, "global_step": 184312, "epoch": 1523} {"train_loss": -37.83435821533203, "global_step": 184313, "epoch": 1523} {"train_loss": -38.38513946533203, "global_step": 184314, "epoch": 1523} {"train_loss": -37.00239181518555, "global_step": 184315, "epoch": 1523} {"train_loss": -36.72462844848633, "global_step": 184316, "epoch": 1523} {"train_loss": -39.643428802490234, "global_step": 184317, "epoch": 1523} {"train_loss": -40.49594497680664, "global_step": 184318, "epoch": 1523} {"train_loss": -40.18762969970703, "global_step": 184319, "epoch": 1523} {"train_loss": -39.964202880859375, "global_step": 184320, "epoch": 1523} {"train_loss": -37.988460540771484, "global_step": 184321, "epoch": 1523} {"train_loss": -39.60490036010742, "global_step": 184322, "epoch": 1523} {"train_loss": -38.9188117980957, "global_step": 184323, "epoch": 1523} {"train_loss": -36.05168914794922, "global_step": 184324, "epoch": 1523} {"train_loss": -36.84029769897461, "global_step": 184325, "epoch": 1523} {"train_loss": -39.85685348510742, "global_step": 184326, "epoch": 1523} {"train_loss": -37.97261047363281, "global_step": 184327, "epoch": 1523} {"train_loss": -39.73275375366211, "global_step": 184328, "epoch": 1523} {"train_loss": -34.90542221069336, "global_step": 184329, "epoch": 1523} {"train_loss": -39.568424224853516, "global_step": 184330, "epoch": 1523} {"train_loss": -39.82157516479492, "global_step": 184331, "epoch": 1523} {"train_loss": -38.22935104370117, "global_step": 184332, "epoch": 1523} {"train_loss": -37.60920333862305, "global_step": 184333, "epoch": 1523} {"train_loss": -39.847877502441406, "global_step": 184334, "epoch": 1523} {"train_loss": -38.89527130126953, "global_step": 184335, "epoch": 1523} {"train_loss": -36.64768600463867, "global_step": 184336, "epoch": 1523} {"train_loss": -40.382049560546875, "global_step": 184337, "epoch": 1523} {"train_loss": -40.73444747924805, "global_step": 184338, "epoch": 1523} {"train_loss": -39.59624099731445, "global_step": 184339, "epoch": 1523} {"train_loss": -39.76443099975586, "global_step": 184340, "epoch": 1523} {"train_loss": -40.46458053588867, "global_step": 184341, "epoch": 1523} {"train_loss": -40.64971923828125, "global_step": 184342, "epoch": 1523} {"train_loss": -40.53532409667969, "global_step": 184343, "epoch": 1523} {"train_loss": -39.33698654174805, "global_step": 184344, "epoch": 1523} {"train_loss": -40.435020446777344, "global_step": 184345, "epoch": 1523} {"train_loss": -40.762996673583984, "global_step": 184346, "epoch": 1523} {"train_loss": -39.27726364135742, "global_step": 184347, "epoch": 1523} {"train_loss": -40.822994232177734, "global_step": 184348, "epoch": 1523} {"train_loss": -40.13007736206055, "global_step": 184349, "epoch": 1523} {"train_loss": -40.87653350830078, "global_step": 184350, "epoch": 1523} {"train_loss": -40.43962478637695, "global_step": 184351, "epoch": 1523} {"train_loss": -39.77364730834961, "global_step": 184352, "epoch": 1523} {"train_loss": -40.789424896240234, "global_step": 184353, "epoch": 1523} {"train_loss": -40.55009460449219, "global_step": 184354, "epoch": 1523} {"train_loss": -41.23552322387695, "global_step": 184355, "epoch": 1523} {"train_loss": -39.930267333984375, "global_step": 184356, "epoch": 1523} {"train_loss": -40.68378448486328, "global_step": 184357, "epoch": 1523} {"train_loss": -40.98149490356445, "global_step": 184358, "epoch": 1523} {"train_loss": -40.90703201293945, "global_step": 184359, "epoch": 1523} {"train_loss": -39.909400939941406, "global_step": 184360, "epoch": 1523} {"train_loss": -40.96405029296875, "global_step": 184361, "epoch": 1523} {"train_loss": -39.30144119262695, "global_step": 184362, "epoch": 1523} {"train_loss": -40.34163284301758, "global_step": 184363, "epoch": 1523} {"train_loss": -40.44817352294922, "global_step": 184364, "epoch": 1523} {"train_loss": -40.2284049987793, "global_step": 184365, "epoch": 1523} {"train_loss": -40.90462875366211, "global_step": 184366, "epoch": 1523} {"train_loss": -40.59498977661133, "global_step": 184367, "epoch": 1523} {"train_loss": -40.398807525634766, "global_step": 184368, "epoch": 1523} {"train_loss": -41.40610885620117, "global_step": 184369, "epoch": 1523} {"train_loss": -41.53082275390625, "global_step": 184370, "epoch": 1523} {"train_loss": -38.963348388671875, "global_step": 184371, "epoch": 1523} {"train_loss": -39.63240051269531, "global_step": 184372, "epoch": 1523} {"train_loss": -41.285701751708984, "global_step": 184373, "epoch": 1523} {"train_loss": -41.25429916381836, "global_step": 184374, "epoch": 1523} {"train_loss": -39.8275260925293, "global_step": 184375, "epoch": 1523} {"train_loss": -39.7672233581543, "global_step": 184376, "epoch": 1523} {"train_loss": -40.813899993896484, "global_step": 184377, "epoch": 1523} {"train_loss": -40.43328094482422, "global_step": 184378, "epoch": 1523} {"train_loss": -37.61245346069336, "global_step": 184379, "epoch": 1523} {"train_loss": -38.275779724121094, "global_step": 184380, "epoch": 1523} {"train_loss": -37.67399978637695, "global_step": 184381, "epoch": 1523} {"train_loss": -39.5083122253418, "global_step": 184382, "epoch": 1523} {"train_loss": -40.92116165161133, "global_step": 184383, "epoch": 1523} {"train_loss": -40.84060287475586, "global_step": 184384, "epoch": 1523} {"train_loss": -38.97981262207031, "global_step": 184385, "epoch": 1523} {"train_loss": -38.022247314453125, "global_step": 184386, "epoch": 1523} {"train_loss": -37.94368362426758, "global_step": 184387, "epoch": 1523} {"train_loss": -39.860111236572266, "global_step": 184388, "epoch": 1523} {"train_loss": -39.622230529785156, "global_step": 184389, "epoch": 1523} {"train_loss": -39.240150451660156, "global_step": 184390, "epoch": 1523} {"train_loss": -38.16665267944336, "global_step": 184391, "epoch": 1523} {"train_loss": -41.1662483215332, "global_step": 184392, "epoch": 1523} {"train_loss": -37.98207473754883, "global_step": 184393, "epoch": 1523} {"train_loss": -37.2491569519043, "global_step": 184394, "epoch": 1523} {"train_loss": -40.38881301879883, "global_step": 184395, "epoch": 1523} {"train_loss": -38.536224365234375, "global_step": 184396, "epoch": 1523} {"train_loss": -34.6999626159668, "global_step": 184397, "epoch": 1523} {"train_loss": -39.57893371582031, "global_step": 184398, "epoch": 1523} {"train_loss": -40.58663558959961, "global_step": 184399, "epoch": 1523} {"train_loss": -38.48480987548828, "global_step": 184400, "epoch": 1523} {"train_loss": -40.49109649658203, "global_step": 184401, "epoch": 1523} {"train_loss": -38.26115036010742, "global_step": 184402, "epoch": 1523} {"train_loss": -39.55483012554074, "global_step": 184403, "epoch": 1523, "val_loss": 2687353.75} {"train_loss": -39.818214416503906, "global_step": 184404, "epoch": 1524} {"train_loss": -40.65155792236328, "global_step": 184405, "epoch": 1524} {"train_loss": -39.01569747924805, "global_step": 184406, "epoch": 1524} {"train_loss": -39.83931350708008, "global_step": 184407, "epoch": 1524} {"train_loss": -40.36042022705078, "global_step": 184408, "epoch": 1524} {"train_loss": -38.90858840942383, "global_step": 184409, "epoch": 1524} {"train_loss": -37.28499221801758, "global_step": 184410, "epoch": 1524} {"train_loss": -39.52080154418945, "global_step": 184411, "epoch": 1524} {"train_loss": -40.7969856262207, "global_step": 184412, "epoch": 1524} {"train_loss": -39.89777374267578, "global_step": 184413, "epoch": 1524} {"train_loss": -41.271480560302734, "global_step": 184414, "epoch": 1524} {"train_loss": -40.0212287902832, "global_step": 184415, "epoch": 1524} {"train_loss": -40.0174446105957, "global_step": 184416, "epoch": 1524} {"train_loss": -40.07651901245117, "global_step": 184417, "epoch": 1524} {"train_loss": -41.24782943725586, "global_step": 184418, "epoch": 1524} {"train_loss": -39.96697998046875, "global_step": 184419, "epoch": 1524} {"train_loss": -40.659828186035156, "global_step": 184420, "epoch": 1524} {"train_loss": -40.04250717163086, "global_step": 184421, "epoch": 1524} {"train_loss": -41.0449104309082, "global_step": 184422, "epoch": 1524} {"train_loss": -40.825252532958984, "global_step": 184423, "epoch": 1524} {"train_loss": -41.39841842651367, "global_step": 184424, "epoch": 1524} {"train_loss": -41.1190071105957, "global_step": 184425, "epoch": 1524} {"train_loss": -40.20010757446289, "global_step": 184426, "epoch": 1524} {"train_loss": -41.26813507080078, "global_step": 184427, "epoch": 1524} {"train_loss": -40.68811798095703, "global_step": 184428, "epoch": 1524} {"train_loss": -41.43561935424805, "global_step": 184429, "epoch": 1524} {"train_loss": -41.153114318847656, "global_step": 184430, "epoch": 1524} {"train_loss": -41.16486740112305, "global_step": 184431, "epoch": 1524} {"train_loss": -41.32474899291992, "global_step": 184432, "epoch": 1524} {"train_loss": -41.373504638671875, "global_step": 184433, "epoch": 1524} {"train_loss": -41.25693893432617, "global_step": 184434, "epoch": 1524} {"train_loss": -41.816200256347656, "global_step": 184435, "epoch": 1524} {"train_loss": -41.272369384765625, "global_step": 184436, "epoch": 1524} {"train_loss": -41.336883544921875, "global_step": 184437, "epoch": 1524} {"train_loss": -41.16530227661133, "global_step": 184438, "epoch": 1524} {"train_loss": -41.199981689453125, "global_step": 184439, "epoch": 1524} {"train_loss": -41.35319519042969, "global_step": 184440, "epoch": 1524} {"train_loss": -41.41813278198242, "global_step": 184441, "epoch": 1524} {"train_loss": -40.84402084350586, "global_step": 184442, "epoch": 1524} {"train_loss": -41.61138153076172, "global_step": 184443, "epoch": 1524} {"train_loss": -41.53049087524414, "global_step": 184444, "epoch": 1524} {"train_loss": -41.23914337158203, "global_step": 184445, "epoch": 1524} {"train_loss": -41.139930725097656, "global_step": 184446, "epoch": 1524} {"train_loss": -41.3381233215332, "global_step": 184447, "epoch": 1524} {"train_loss": -41.25556182861328, "global_step": 184448, "epoch": 1524} {"train_loss": -41.522308349609375, "global_step": 184449, "epoch": 1524} {"train_loss": -41.759254455566406, "global_step": 184450, "epoch": 1524} {"train_loss": -42.069149017333984, "global_step": 184451, "epoch": 1524} {"train_loss": -41.94172668457031, "global_step": 184452, "epoch": 1524} {"train_loss": -42.06078338623047, "global_step": 184453, "epoch": 1524} {"train_loss": -41.317626953125, "global_step": 184454, "epoch": 1524} {"train_loss": -41.13044738769531, "global_step": 184455, "epoch": 1524} {"train_loss": -41.803138732910156, "global_step": 184456, "epoch": 1524} {"train_loss": -41.71652603149414, "global_step": 184457, "epoch": 1524} {"train_loss": -41.57367706298828, "global_step": 184458, "epoch": 1524} {"train_loss": -41.55244827270508, "global_step": 184459, "epoch": 1524} {"train_loss": -41.64777755737305, "global_step": 184460, "epoch": 1524} {"train_loss": -41.69841766357422, "global_step": 184461, "epoch": 1524} {"train_loss": -41.62372589111328, "global_step": 184462, "epoch": 1524} {"train_loss": -41.00598907470703, "global_step": 184463, "epoch": 1524} {"train_loss": -41.72419738769531, "global_step": 184464, "epoch": 1524} {"train_loss": -41.17799758911133, "global_step": 184465, "epoch": 1524} {"train_loss": -39.90607833862305, "global_step": 184466, "epoch": 1524} {"train_loss": -38.84328842163086, "global_step": 184467, "epoch": 1524} {"train_loss": -38.16215515136719, "global_step": 184468, "epoch": 1524} {"train_loss": -39.056007385253906, "global_step": 184469, "epoch": 1524} {"train_loss": -40.13020706176758, "global_step": 184470, "epoch": 1524} {"train_loss": -39.57089614868164, "global_step": 184471, "epoch": 1524} {"train_loss": -40.01358413696289, "global_step": 184472, "epoch": 1524} {"train_loss": -40.69767379760742, "global_step": 184473, "epoch": 1524} {"train_loss": -39.90237808227539, "global_step": 184474, "epoch": 1524} {"train_loss": -39.184783935546875, "global_step": 184475, "epoch": 1524} {"train_loss": -37.868743896484375, "global_step": 184476, "epoch": 1524} {"train_loss": -41.25764846801758, "global_step": 184477, "epoch": 1524} {"train_loss": -39.34811019897461, "global_step": 184478, "epoch": 1524} {"train_loss": -38.02596664428711, "global_step": 184479, "epoch": 1524} {"train_loss": -40.63371658325195, "global_step": 184480, "epoch": 1524} {"train_loss": -39.5104866027832, "global_step": 184481, "epoch": 1524} {"train_loss": -38.863365173339844, "global_step": 184482, "epoch": 1524} {"train_loss": -39.893043518066406, "global_step": 184483, "epoch": 1524} {"train_loss": -38.31204605102539, "global_step": 184484, "epoch": 1524} {"train_loss": -40.26345443725586, "global_step": 184485, "epoch": 1524} {"train_loss": -37.96455001831055, "global_step": 184486, "epoch": 1524} {"train_loss": -38.10356521606445, "global_step": 184487, "epoch": 1524} {"train_loss": -38.848663330078125, "global_step": 184488, "epoch": 1524} {"train_loss": -38.73942565917969, "global_step": 184489, "epoch": 1524} {"train_loss": -37.92433547973633, "global_step": 184490, "epoch": 1524} {"train_loss": -38.817989349365234, "global_step": 184491, "epoch": 1524} {"train_loss": -39.30801010131836, "global_step": 184492, "epoch": 1524} {"train_loss": -39.6822624206543, "global_step": 184493, "epoch": 1524} {"train_loss": -39.08024978637695, "global_step": 184494, "epoch": 1524} {"train_loss": -40.18656921386719, "global_step": 184495, "epoch": 1524} {"train_loss": -39.21584701538086, "global_step": 184496, "epoch": 1524} {"train_loss": -39.98683547973633, "global_step": 184497, "epoch": 1524} {"train_loss": -39.69738006591797, "global_step": 184498, "epoch": 1524} {"train_loss": -40.0786247253418, "global_step": 184499, "epoch": 1524} {"train_loss": -40.354854583740234, "global_step": 184500, "epoch": 1524} {"train_loss": -40.06521224975586, "global_step": 184501, "epoch": 1524} {"train_loss": -40.57965850830078, "global_step": 184502, "epoch": 1524} {"train_loss": -40.26194381713867, "global_step": 184503, "epoch": 1524} {"train_loss": -40.648216247558594, "global_step": 184504, "epoch": 1524} {"train_loss": -40.52111053466797, "global_step": 184505, "epoch": 1524} {"train_loss": -40.37789535522461, "global_step": 184506, "epoch": 1524} {"train_loss": -40.9007453918457, "global_step": 184507, "epoch": 1524} {"train_loss": -40.75819778442383, "global_step": 184508, "epoch": 1524} {"train_loss": -40.336769104003906, "global_step": 184509, "epoch": 1524} {"train_loss": -41.290775299072266, "global_step": 184510, "epoch": 1524} {"train_loss": -40.922367095947266, "global_step": 184511, "epoch": 1524} {"train_loss": -40.672279357910156, "global_step": 184512, "epoch": 1524} {"train_loss": -40.81534957885742, "global_step": 184513, "epoch": 1524} {"train_loss": -40.93294906616211, "global_step": 184514, "epoch": 1524} {"train_loss": -40.793399810791016, "global_step": 184515, "epoch": 1524} {"train_loss": -40.775390625, "global_step": 184516, "epoch": 1524} {"train_loss": -40.8155517578125, "global_step": 184517, "epoch": 1524} {"train_loss": -41.3012580871582, "global_step": 184518, "epoch": 1524} {"train_loss": -40.53589630126953, "global_step": 184519, "epoch": 1524} {"train_loss": -41.233882904052734, "global_step": 184520, "epoch": 1524} {"train_loss": -40.90875244140625, "global_step": 184521, "epoch": 1524} {"train_loss": -41.306068420410156, "global_step": 184522, "epoch": 1524} {"train_loss": -39.39093780517578, "global_step": 184523, "epoch": 1524} {"train_loss": -40.4464792929405, "global_step": 184524, "epoch": 1524, "val_loss": 2625490.75} {"train_loss": -41.16071701049805, "global_step": 184525, "epoch": 1525} {"train_loss": -41.29303741455078, "global_step": 184526, "epoch": 1525} {"train_loss": -40.49406814575195, "global_step": 184527, "epoch": 1525} {"train_loss": -41.16526412963867, "global_step": 184528, "epoch": 1525} {"train_loss": -41.449005126953125, "global_step": 184529, "epoch": 1525} {"train_loss": -41.570594787597656, "global_step": 184530, "epoch": 1525} {"train_loss": -37.6460075378418, "global_step": 184531, "epoch": 1525} {"train_loss": -41.17376708984375, "global_step": 184532, "epoch": 1525} {"train_loss": -41.23319625854492, "global_step": 184533, "epoch": 1525} {"train_loss": -41.04874801635742, "global_step": 184534, "epoch": 1525} {"train_loss": -41.32027816772461, "global_step": 184535, "epoch": 1525} {"train_loss": -40.85325241088867, "global_step": 184536, "epoch": 1525} {"train_loss": -41.67104721069336, "global_step": 184537, "epoch": 1525} {"train_loss": -38.0616455078125, "global_step": 184538, "epoch": 1525} {"train_loss": -39.66328811645508, "global_step": 184539, "epoch": 1525} {"train_loss": -41.3692626953125, "global_step": 184540, "epoch": 1525} {"train_loss": -41.3541259765625, "global_step": 184541, "epoch": 1525} {"train_loss": -40.972633361816406, "global_step": 184542, "epoch": 1525} {"train_loss": -41.302589416503906, "global_step": 184543, "epoch": 1525} {"train_loss": -41.36724853515625, "global_step": 184544, "epoch": 1525} {"train_loss": -40.87907028198242, "global_step": 184545, "epoch": 1525} {"train_loss": -41.14107894897461, "global_step": 184546, "epoch": 1525} {"train_loss": -41.51762008666992, "global_step": 184547, "epoch": 1525} {"train_loss": -41.48147201538086, "global_step": 184548, "epoch": 1525} {"train_loss": -41.47999954223633, "global_step": 184549, "epoch": 1525} {"train_loss": -41.576759338378906, "global_step": 184550, "epoch": 1525} {"train_loss": -41.753334045410156, "global_step": 184551, "epoch": 1525} {"train_loss": -41.5982780456543, "global_step": 184552, "epoch": 1525} {"train_loss": -40.1922721862793, "global_step": 184553, "epoch": 1525} {"train_loss": -41.74560546875, "global_step": 184554, "epoch": 1525} {"train_loss": -41.621559143066406, "global_step": 184555, "epoch": 1525} {"train_loss": -39.64787673950195, "global_step": 184556, "epoch": 1525} {"train_loss": -41.52158737182617, "global_step": 184557, "epoch": 1525} {"train_loss": -40.967506408691406, "global_step": 184558, "epoch": 1525} {"train_loss": -40.551368713378906, "global_step": 184559, "epoch": 1525} {"train_loss": -41.96455001831055, "global_step": 184560, "epoch": 1525} {"train_loss": -41.2790641784668, "global_step": 184561, "epoch": 1525} {"train_loss": -41.141265869140625, "global_step": 184562, "epoch": 1525} {"train_loss": -41.08555221557617, "global_step": 184563, "epoch": 1525} {"train_loss": -41.23982620239258, "global_step": 184564, "epoch": 1525} {"train_loss": -42.0579948425293, "global_step": 184565, "epoch": 1525} {"train_loss": -41.00128173828125, "global_step": 184566, "epoch": 1525} {"train_loss": -40.69412612915039, "global_step": 184567, "epoch": 1525} {"train_loss": -41.06293869018555, "global_step": 184568, "epoch": 1525} {"train_loss": -40.98096466064453, "global_step": 184569, "epoch": 1525} {"train_loss": -39.288299560546875, "global_step": 184570, "epoch": 1525} {"train_loss": -37.50236511230469, "global_step": 184571, "epoch": 1525} {"train_loss": -33.4239616394043, "global_step": 184572, "epoch": 1525} {"train_loss": -33.13391876220703, "global_step": 184573, "epoch": 1525} {"train_loss": -35.857696533203125, "global_step": 184574, "epoch": 1525} {"train_loss": -39.71546173095703, "global_step": 184575, "epoch": 1525} {"train_loss": -40.112037658691406, "global_step": 184576, "epoch": 1525} {"train_loss": -37.29264450073242, "global_step": 184577, "epoch": 1525} {"train_loss": -36.96537399291992, "global_step": 184578, "epoch": 1525} {"train_loss": -39.74756622314453, "global_step": 184579, "epoch": 1525} {"train_loss": -39.0831413269043, "global_step": 184580, "epoch": 1525} {"train_loss": -38.6666259765625, "global_step": 184581, "epoch": 1525} {"train_loss": -40.617652893066406, "global_step": 184582, "epoch": 1525} {"train_loss": -40.66111755371094, "global_step": 184583, "epoch": 1525} {"train_loss": -40.6160774230957, "global_step": 184584, "epoch": 1525} {"train_loss": -40.68428039550781, "global_step": 184585, "epoch": 1525} {"train_loss": -40.70387268066406, "global_step": 184586, "epoch": 1525} {"train_loss": -41.14238739013672, "global_step": 184587, "epoch": 1525} {"train_loss": -40.25130844116211, "global_step": 184588, "epoch": 1525} {"train_loss": -40.71331024169922, "global_step": 184589, "epoch": 1525} {"train_loss": -41.16259765625, "global_step": 184590, "epoch": 1525} {"train_loss": -40.91202926635742, "global_step": 184591, "epoch": 1525} {"train_loss": -41.5312614440918, "global_step": 184592, "epoch": 1525} {"train_loss": -41.11521530151367, "global_step": 184593, "epoch": 1525} {"train_loss": -40.50356674194336, "global_step": 184594, "epoch": 1525} {"train_loss": -41.24955368041992, "global_step": 184595, "epoch": 1525} {"train_loss": -40.93257522583008, "global_step": 184596, "epoch": 1525} {"train_loss": -41.419673919677734, "global_step": 184597, "epoch": 1525} {"train_loss": -40.794471740722656, "global_step": 184598, "epoch": 1525} {"train_loss": -40.740394592285156, "global_step": 184599, "epoch": 1525} {"train_loss": -41.25238800048828, "global_step": 184600, "epoch": 1525} {"train_loss": -41.30369186401367, "global_step": 184601, "epoch": 1525} {"train_loss": -40.452911376953125, "global_step": 184602, "epoch": 1525} {"train_loss": -41.73971176147461, "global_step": 184603, "epoch": 1525} {"train_loss": -41.30617141723633, "global_step": 184604, "epoch": 1525} {"train_loss": -40.75128173828125, "global_step": 184605, "epoch": 1525} {"train_loss": -41.09052658081055, "global_step": 184606, "epoch": 1525} {"train_loss": -41.10306930541992, "global_step": 184607, "epoch": 1525} {"train_loss": -41.42328643798828, "global_step": 184608, "epoch": 1525} {"train_loss": -41.54121398925781, "global_step": 184609, "epoch": 1525} {"train_loss": -41.05833053588867, "global_step": 184610, "epoch": 1525} {"train_loss": -41.37637710571289, "global_step": 184611, "epoch": 1525} {"train_loss": -41.191158294677734, "global_step": 184612, "epoch": 1525} {"train_loss": -41.0823974609375, "global_step": 184613, "epoch": 1525} {"train_loss": -41.465267181396484, "global_step": 184614, "epoch": 1525} {"train_loss": -39.93817901611328, "global_step": 184615, "epoch": 1525} {"train_loss": -40.937557220458984, "global_step": 184616, "epoch": 1525} {"train_loss": -40.775421142578125, "global_step": 184617, "epoch": 1525} {"train_loss": -41.521461486816406, "global_step": 184618, "epoch": 1525} {"train_loss": -40.9864501953125, "global_step": 184619, "epoch": 1525} {"train_loss": -41.217918395996094, "global_step": 184620, "epoch": 1525} {"train_loss": -40.348114013671875, "global_step": 184621, "epoch": 1525} {"train_loss": -41.034393310546875, "global_step": 184622, "epoch": 1525} {"train_loss": -41.115234375, "global_step": 184623, "epoch": 1525} {"train_loss": -41.30305862426758, "global_step": 184624, "epoch": 1525} {"train_loss": -40.65681076049805, "global_step": 184625, "epoch": 1525} {"train_loss": -40.357177734375, "global_step": 184626, "epoch": 1525} {"train_loss": -41.006187438964844, "global_step": 184627, "epoch": 1525} {"train_loss": -41.525238037109375, "global_step": 184628, "epoch": 1525} {"train_loss": -37.83999252319336, "global_step": 184629, "epoch": 1525} {"train_loss": -40.77242660522461, "global_step": 184630, "epoch": 1525} {"train_loss": -40.244258880615234, "global_step": 184631, "epoch": 1525} {"train_loss": -40.74570846557617, "global_step": 184632, "epoch": 1525} {"train_loss": -40.62467575073242, "global_step": 184633, "epoch": 1525} {"train_loss": -41.197845458984375, "global_step": 184634, "epoch": 1525} {"train_loss": -41.328338623046875, "global_step": 184635, "epoch": 1525} {"train_loss": -40.90175247192383, "global_step": 184636, "epoch": 1525} {"train_loss": -41.32954406738281, "global_step": 184637, "epoch": 1525} {"train_loss": -40.811805725097656, "global_step": 184638, "epoch": 1525} {"train_loss": -40.907318115234375, "global_step": 184639, "epoch": 1525} {"train_loss": -41.8411750793457, "global_step": 184640, "epoch": 1525} {"train_loss": -41.670379638671875, "global_step": 184641, "epoch": 1525} {"train_loss": -41.045684814453125, "global_step": 184642, "epoch": 1525} {"train_loss": -41.19464874267578, "global_step": 184643, "epoch": 1525} {"train_loss": -40.60872268676758, "global_step": 184644, "epoch": 1525} {"train_loss": -40.64731008356268, "global_step": 184645, "epoch": 1525, "val_loss": 2602582.0} {"train_loss": -40.698944091796875, "global_step": 184646, "epoch": 1526} {"train_loss": -40.66537094116211, "global_step": 184647, "epoch": 1526} {"train_loss": -40.06243896484375, "global_step": 184648, "epoch": 1526} {"train_loss": -41.2435302734375, "global_step": 184649, "epoch": 1526} {"train_loss": -39.5473747253418, "global_step": 184650, "epoch": 1526} {"train_loss": -40.08313751220703, "global_step": 184651, "epoch": 1526} {"train_loss": -40.05335235595703, "global_step": 184652, "epoch": 1526} {"train_loss": -41.26235580444336, "global_step": 184653, "epoch": 1526} {"train_loss": -41.27103805541992, "global_step": 184654, "epoch": 1526} {"train_loss": -40.929962158203125, "global_step": 184655, "epoch": 1526} {"train_loss": -40.5880241394043, "global_step": 184656, "epoch": 1526} {"train_loss": -41.2719841003418, "global_step": 184657, "epoch": 1526} {"train_loss": -41.643226623535156, "global_step": 184658, "epoch": 1526} {"train_loss": -40.94417190551758, "global_step": 184659, "epoch": 1526} {"train_loss": -41.4493522644043, "global_step": 184660, "epoch": 1526} {"train_loss": -39.2459602355957, "global_step": 184661, "epoch": 1526} {"train_loss": -41.16666793823242, "global_step": 184662, "epoch": 1526} {"train_loss": -40.816524505615234, "global_step": 184663, "epoch": 1526} {"train_loss": -39.86916732788086, "global_step": 184664, "epoch": 1526} {"train_loss": -39.552120208740234, "global_step": 184665, "epoch": 1526} {"train_loss": -40.5051155090332, "global_step": 184666, "epoch": 1526} {"train_loss": -40.691749572753906, "global_step": 184667, "epoch": 1526} {"train_loss": -40.59562301635742, "global_step": 184668, "epoch": 1526} {"train_loss": -36.09121322631836, "global_step": 184669, "epoch": 1526} {"train_loss": -37.04467010498047, "global_step": 184670, "epoch": 1526} {"train_loss": -39.514808654785156, "global_step": 184671, "epoch": 1526} {"train_loss": -39.1627197265625, "global_step": 184672, "epoch": 1526} {"train_loss": -38.3680305480957, "global_step": 184673, "epoch": 1526} {"train_loss": -40.18785095214844, "global_step": 184674, "epoch": 1526} {"train_loss": -39.752540588378906, "global_step": 184675, "epoch": 1526} {"train_loss": -39.03755187988281, "global_step": 184676, "epoch": 1526} {"train_loss": -40.167354583740234, "global_step": 184677, "epoch": 1526} {"train_loss": -37.40425491333008, "global_step": 184678, "epoch": 1526} {"train_loss": -38.14034652709961, "global_step": 184679, "epoch": 1526} {"train_loss": -40.92218017578125, "global_step": 184680, "epoch": 1526} {"train_loss": -38.29527282714844, "global_step": 184681, "epoch": 1526} {"train_loss": -39.88938522338867, "global_step": 184682, "epoch": 1526} {"train_loss": -40.76283645629883, "global_step": 184683, "epoch": 1526} {"train_loss": -38.49311447143555, "global_step": 184684, "epoch": 1526} {"train_loss": -40.8323860168457, "global_step": 184685, "epoch": 1526} {"train_loss": -38.631195068359375, "global_step": 184686, "epoch": 1526} {"train_loss": -40.89508819580078, "global_step": 184687, "epoch": 1526} {"train_loss": -39.551239013671875, "global_step": 184688, "epoch": 1526} {"train_loss": -40.952545166015625, "global_step": 184689, "epoch": 1526} {"train_loss": -39.633575439453125, "global_step": 184690, "epoch": 1526} {"train_loss": -41.75400161743164, "global_step": 184691, "epoch": 1526} {"train_loss": -39.63739776611328, "global_step": 184692, "epoch": 1526} {"train_loss": -41.4139518737793, "global_step": 184693, "epoch": 1526} {"train_loss": -40.96778106689453, "global_step": 184694, "epoch": 1526} {"train_loss": -40.17951202392578, "global_step": 184695, "epoch": 1526} {"train_loss": -41.29212188720703, "global_step": 184696, "epoch": 1526} {"train_loss": -41.37237548828125, "global_step": 184697, "epoch": 1526} {"train_loss": -41.1162223815918, "global_step": 184698, "epoch": 1526} {"train_loss": -41.42420196533203, "global_step": 184699, "epoch": 1526} {"train_loss": -41.18764877319336, "global_step": 184700, "epoch": 1526} {"train_loss": -41.25223922729492, "global_step": 184701, "epoch": 1526} {"train_loss": -41.652618408203125, "global_step": 184702, "epoch": 1526} {"train_loss": -41.00661849975586, "global_step": 184703, "epoch": 1526} {"train_loss": -41.47896957397461, "global_step": 184704, "epoch": 1526} {"train_loss": -41.671749114990234, "global_step": 184705, "epoch": 1526} {"train_loss": -41.76681137084961, "global_step": 184706, "epoch": 1526} {"train_loss": -41.56838607788086, "global_step": 184707, "epoch": 1526} {"train_loss": -41.63504409790039, "global_step": 184708, "epoch": 1526} {"train_loss": -41.730072021484375, "global_step": 184709, "epoch": 1526} {"train_loss": -41.82350540161133, "global_step": 184710, "epoch": 1526} {"train_loss": -41.77598571777344, "global_step": 184711, "epoch": 1526} {"train_loss": -41.99508285522461, "global_step": 184712, "epoch": 1526} {"train_loss": -41.72633743286133, "global_step": 184713, "epoch": 1526} {"train_loss": -41.58860397338867, "global_step": 184714, "epoch": 1526} {"train_loss": -42.26713943481445, "global_step": 184715, "epoch": 1526} {"train_loss": -41.95760726928711, "global_step": 184716, "epoch": 1526} {"train_loss": -42.206275939941406, "global_step": 184717, "epoch": 1526} {"train_loss": -41.63470458984375, "global_step": 184718, "epoch": 1526} {"train_loss": -42.23257064819336, "global_step": 184719, "epoch": 1526} {"train_loss": -41.93288803100586, "global_step": 184720, "epoch": 1526} {"train_loss": -42.539894104003906, "global_step": 184721, "epoch": 1526} {"train_loss": -42.021881103515625, "global_step": 184722, "epoch": 1526} {"train_loss": -41.5404167175293, "global_step": 184723, "epoch": 1526} {"train_loss": -41.70082473754883, "global_step": 184724, "epoch": 1526} {"train_loss": -42.17753219604492, "global_step": 184725, "epoch": 1526} {"train_loss": -41.63612365722656, "global_step": 184726, "epoch": 1526} {"train_loss": -40.678585052490234, "global_step": 184727, "epoch": 1526} {"train_loss": -39.94517135620117, "global_step": 184728, "epoch": 1526} {"train_loss": -42.21181106567383, "global_step": 184729, "epoch": 1526} {"train_loss": -41.60260009765625, "global_step": 184730, "epoch": 1526} {"train_loss": -39.17698669433594, "global_step": 184731, "epoch": 1526} {"train_loss": -37.591102600097656, "global_step": 184732, "epoch": 1526} {"train_loss": -38.2922248840332, "global_step": 184733, "epoch": 1526} {"train_loss": -39.54234313964844, "global_step": 184734, "epoch": 1526} {"train_loss": -42.02406692504883, "global_step": 184735, "epoch": 1526} {"train_loss": -39.92522430419922, "global_step": 184736, "epoch": 1526} {"train_loss": -37.91765213012695, "global_step": 184737, "epoch": 1526} {"train_loss": -40.69533920288086, "global_step": 184738, "epoch": 1526} {"train_loss": -40.79969787597656, "global_step": 184739, "epoch": 1526} {"train_loss": -40.76820755004883, "global_step": 184740, "epoch": 1526} {"train_loss": -41.28165817260742, "global_step": 184741, "epoch": 1526} {"train_loss": -39.736427307128906, "global_step": 184742, "epoch": 1526} {"train_loss": -39.92108917236328, "global_step": 184743, "epoch": 1526} {"train_loss": -41.09982681274414, "global_step": 184744, "epoch": 1526} {"train_loss": -41.29153060913086, "global_step": 184745, "epoch": 1526} {"train_loss": -41.13867950439453, "global_step": 184746, "epoch": 1526} {"train_loss": -41.18059539794922, "global_step": 184747, "epoch": 1526} {"train_loss": -41.74568557739258, "global_step": 184748, "epoch": 1526} {"train_loss": -41.55610275268555, "global_step": 184749, "epoch": 1526} {"train_loss": -41.76255416870117, "global_step": 184750, "epoch": 1526} {"train_loss": -41.71170425415039, "global_step": 184751, "epoch": 1526} {"train_loss": -40.311370849609375, "global_step": 184752, "epoch": 1526} {"train_loss": -41.763729095458984, "global_step": 184753, "epoch": 1526} {"train_loss": -41.20048141479492, "global_step": 184754, "epoch": 1526} {"train_loss": -39.51827621459961, "global_step": 184755, "epoch": 1526} {"train_loss": -40.38604736328125, "global_step": 184756, "epoch": 1526} {"train_loss": -41.65920639038086, "global_step": 184757, "epoch": 1526} {"train_loss": -39.567298889160156, "global_step": 184758, "epoch": 1526} {"train_loss": -37.074676513671875, "global_step": 184759, "epoch": 1526} {"train_loss": -39.7705078125, "global_step": 184760, "epoch": 1526} {"train_loss": -40.91133499145508, "global_step": 184761, "epoch": 1526} {"train_loss": -39.95087432861328, "global_step": 184762, "epoch": 1526} {"train_loss": -40.230018615722656, "global_step": 184763, "epoch": 1526} {"train_loss": -41.2555046081543, "global_step": 184764, "epoch": 1526} {"train_loss": -39.69113540649414, "global_step": 184765, "epoch": 1526} {"train_loss": -40.59669516697403, "global_step": 184766, "epoch": 1526, "val_loss": 2662211.75} {"train_loss": -38.28407669067383, "global_step": 184767, "epoch": 1527} {"train_loss": -40.40729522705078, "global_step": 184768, "epoch": 1527} {"train_loss": -39.22310256958008, "global_step": 184769, "epoch": 1527} {"train_loss": -38.0735969543457, "global_step": 184770, "epoch": 1527} {"train_loss": -39.72978973388672, "global_step": 184771, "epoch": 1527} {"train_loss": -38.91730499267578, "global_step": 184772, "epoch": 1527} {"train_loss": -39.761470794677734, "global_step": 184773, "epoch": 1527} {"train_loss": -40.293609619140625, "global_step": 184774, "epoch": 1527} {"train_loss": -40.24586868286133, "global_step": 184775, "epoch": 1527} {"train_loss": -40.97206115722656, "global_step": 184776, "epoch": 1527} {"train_loss": -39.29991149902344, "global_step": 184777, "epoch": 1527} {"train_loss": -41.092262268066406, "global_step": 184778, "epoch": 1527} {"train_loss": -39.978858947753906, "global_step": 184779, "epoch": 1527} {"train_loss": -40.784732818603516, "global_step": 184780, "epoch": 1527} {"train_loss": -40.70366668701172, "global_step": 184781, "epoch": 1527} {"train_loss": -39.181854248046875, "global_step": 184782, "epoch": 1527} {"train_loss": -41.4720458984375, "global_step": 184783, "epoch": 1527} {"train_loss": -40.05763626098633, "global_step": 184784, "epoch": 1527} {"train_loss": -41.47368621826172, "global_step": 184785, "epoch": 1527} {"train_loss": -40.53940963745117, "global_step": 184786, "epoch": 1527} {"train_loss": -41.2774772644043, "global_step": 184787, "epoch": 1527} {"train_loss": -41.59326171875, "global_step": 184788, "epoch": 1527} {"train_loss": -40.88175964355469, "global_step": 184789, "epoch": 1527} {"train_loss": -41.423316955566406, "global_step": 184790, "epoch": 1527} {"train_loss": -41.17702102661133, "global_step": 184791, "epoch": 1527} {"train_loss": -41.300209045410156, "global_step": 184792, "epoch": 1527} {"train_loss": -41.5403938293457, "global_step": 184793, "epoch": 1527} {"train_loss": -41.78748321533203, "global_step": 184794, "epoch": 1527} {"train_loss": -40.954383850097656, "global_step": 184795, "epoch": 1527} {"train_loss": -41.509796142578125, "global_step": 184796, "epoch": 1527} {"train_loss": -41.623783111572266, "global_step": 184797, "epoch": 1527} {"train_loss": -41.33385467529297, "global_step": 184798, "epoch": 1527} {"train_loss": -41.6947135925293, "global_step": 184799, "epoch": 1527} {"train_loss": -41.78878402709961, "global_step": 184800, "epoch": 1527} {"train_loss": -41.893795013427734, "global_step": 184801, "epoch": 1527} {"train_loss": -41.80567169189453, "global_step": 184802, "epoch": 1527} {"train_loss": -41.9984130859375, "global_step": 184803, "epoch": 1527} {"train_loss": -42.13119125366211, "global_step": 184804, "epoch": 1527} {"train_loss": -41.62687301635742, "global_step": 184805, "epoch": 1527} {"train_loss": -41.80485916137695, "global_step": 184806, "epoch": 1527} {"train_loss": -42.42527389526367, "global_step": 184807, "epoch": 1527} {"train_loss": -41.66733169555664, "global_step": 184808, "epoch": 1527} {"train_loss": -42.12022018432617, "global_step": 184809, "epoch": 1527} {"train_loss": -42.241756439208984, "global_step": 184810, "epoch": 1527} {"train_loss": -42.154541015625, "global_step": 184811, "epoch": 1527} {"train_loss": -42.45344161987305, "global_step": 184812, "epoch": 1527} {"train_loss": -41.84619903564453, "global_step": 184813, "epoch": 1527} {"train_loss": -41.81411361694336, "global_step": 184814, "epoch": 1527} {"train_loss": -42.41340637207031, "global_step": 184815, "epoch": 1527} {"train_loss": -42.30302810668945, "global_step": 184816, "epoch": 1527} {"train_loss": -42.18891143798828, "global_step": 184817, "epoch": 1527} {"train_loss": -42.54865646362305, "global_step": 184818, "epoch": 1527} {"train_loss": -41.78868865966797, "global_step": 184819, "epoch": 1527} {"train_loss": -42.435455322265625, "global_step": 184820, "epoch": 1527} {"train_loss": -41.062644958496094, "global_step": 184821, "epoch": 1527} {"train_loss": -42.20082473754883, "global_step": 184822, "epoch": 1527} {"train_loss": -40.82246398925781, "global_step": 184823, "epoch": 1527} {"train_loss": -42.21104431152344, "global_step": 184824, "epoch": 1527} {"train_loss": -42.05302047729492, "global_step": 184825, "epoch": 1527} {"train_loss": -42.32425308227539, "global_step": 184826, "epoch": 1527} {"train_loss": -41.96940231323242, "global_step": 184827, "epoch": 1527} {"train_loss": -40.71466827392578, "global_step": 184828, "epoch": 1527} {"train_loss": -42.07817840576172, "global_step": 184829, "epoch": 1527} {"train_loss": -42.61680603027344, "global_step": 184830, "epoch": 1527} {"train_loss": -41.43758773803711, "global_step": 184831, "epoch": 1527} {"train_loss": -41.239524841308594, "global_step": 184832, "epoch": 1527} {"train_loss": -41.830406188964844, "global_step": 184833, "epoch": 1527} {"train_loss": -40.91593551635742, "global_step": 184834, "epoch": 1527} {"train_loss": -41.2321891784668, "global_step": 184835, "epoch": 1527} {"train_loss": -41.2561149597168, "global_step": 184836, "epoch": 1527} {"train_loss": -41.36234664916992, "global_step": 184837, "epoch": 1527} {"train_loss": -39.308284759521484, "global_step": 184838, "epoch": 1527} {"train_loss": -40.75483322143555, "global_step": 184839, "epoch": 1527} {"train_loss": -37.87233352661133, "global_step": 184840, "epoch": 1527} {"train_loss": -38.56526565551758, "global_step": 184841, "epoch": 1527} {"train_loss": -39.41215133666992, "global_step": 184842, "epoch": 1527} {"train_loss": -37.578426361083984, "global_step": 184843, "epoch": 1527} {"train_loss": -38.593116760253906, "global_step": 184844, "epoch": 1527} {"train_loss": -40.87088394165039, "global_step": 184845, "epoch": 1527} {"train_loss": -39.73347091674805, "global_step": 184846, "epoch": 1527} {"train_loss": -39.594581604003906, "global_step": 184847, "epoch": 1527} {"train_loss": -40.36103820800781, "global_step": 184848, "epoch": 1527} {"train_loss": -39.79771423339844, "global_step": 184849, "epoch": 1527} {"train_loss": -41.18423080444336, "global_step": 184850, "epoch": 1527} {"train_loss": -39.85720443725586, "global_step": 184851, "epoch": 1527} {"train_loss": -38.737239837646484, "global_step": 184852, "epoch": 1527} {"train_loss": -40.11912536621094, "global_step": 184853, "epoch": 1527} {"train_loss": -41.2010612487793, "global_step": 184854, "epoch": 1527} {"train_loss": -41.16689682006836, "global_step": 184855, "epoch": 1527} {"train_loss": -41.377254486083984, "global_step": 184856, "epoch": 1527} {"train_loss": -38.193031311035156, "global_step": 184857, "epoch": 1527} {"train_loss": -40.5875244140625, "global_step": 184858, "epoch": 1527} {"train_loss": -41.8469352722168, "global_step": 184859, "epoch": 1527} {"train_loss": -40.81062316894531, "global_step": 184860, "epoch": 1527} {"train_loss": -41.50115966796875, "global_step": 184861, "epoch": 1527} {"train_loss": -41.622581481933594, "global_step": 184862, "epoch": 1527} {"train_loss": -41.422508239746094, "global_step": 184863, "epoch": 1527} {"train_loss": -41.305686950683594, "global_step": 184864, "epoch": 1527} {"train_loss": -40.0532341003418, "global_step": 184865, "epoch": 1527} {"train_loss": -39.48127365112305, "global_step": 184866, "epoch": 1527} {"train_loss": -39.83482360839844, "global_step": 184867, "epoch": 1527} {"train_loss": -35.8605842590332, "global_step": 184868, "epoch": 1527} {"train_loss": -40.42548751831055, "global_step": 184869, "epoch": 1527} {"train_loss": -41.1904411315918, "global_step": 184870, "epoch": 1527} {"train_loss": -39.47170639038086, "global_step": 184871, "epoch": 1527} {"train_loss": -40.30424118041992, "global_step": 184872, "epoch": 1527} {"train_loss": -38.17644119262695, "global_step": 184873, "epoch": 1527} {"train_loss": -41.03523635864258, "global_step": 184874, "epoch": 1527} {"train_loss": -41.01104736328125, "global_step": 184875, "epoch": 1527} {"train_loss": -34.18730545043945, "global_step": 184876, "epoch": 1527} {"train_loss": -37.77095413208008, "global_step": 184877, "epoch": 1527} {"train_loss": -37.90302276611328, "global_step": 184878, "epoch": 1527} {"train_loss": -40.83679962158203, "global_step": 184879, "epoch": 1527} {"train_loss": -40.43726348876953, "global_step": 184880, "epoch": 1527} {"train_loss": -41.23651123046875, "global_step": 184881, "epoch": 1527} {"train_loss": -38.460113525390625, "global_step": 184882, "epoch": 1527} {"train_loss": -39.531612396240234, "global_step": 184883, "epoch": 1527} {"train_loss": -36.37102127075195, "global_step": 184884, "epoch": 1527} {"train_loss": -38.84977340698242, "global_step": 184885, "epoch": 1527} {"train_loss": -39.40858840942383, "global_step": 184886, "epoch": 1527} {"train_loss": -40.534468627173055, "global_step": 184887, "epoch": 1527, "val_loss": 3611822.75} {"train_loss": -40.686126708984375, "global_step": 184888, "epoch": 1528} {"train_loss": -38.50928497314453, "global_step": 184889, "epoch": 1528} {"train_loss": -39.284053802490234, "global_step": 184890, "epoch": 1528} {"train_loss": -36.25629425048828, "global_step": 184891, "epoch": 1528} {"train_loss": -40.25774002075195, "global_step": 184892, "epoch": 1528} {"train_loss": -36.49052047729492, "global_step": 184893, "epoch": 1528} {"train_loss": -35.76019287109375, "global_step": 184894, "epoch": 1528} {"train_loss": -38.90053939819336, "global_step": 184895, "epoch": 1528} {"train_loss": -34.073211669921875, "global_step": 184896, "epoch": 1528} {"train_loss": -38.27857208251953, "global_step": 184897, "epoch": 1528} {"train_loss": -35.7262077331543, "global_step": 184898, "epoch": 1528} {"train_loss": -37.90675354003906, "global_step": 184899, "epoch": 1528} {"train_loss": -36.35432815551758, "global_step": 184900, "epoch": 1528} {"train_loss": -35.99306869506836, "global_step": 184901, "epoch": 1528} {"train_loss": -36.56778335571289, "global_step": 184902, "epoch": 1528} {"train_loss": -38.8008918762207, "global_step": 184903, "epoch": 1528} {"train_loss": -40.00569534301758, "global_step": 184904, "epoch": 1528} {"train_loss": -38.08582305908203, "global_step": 184905, "epoch": 1528} {"train_loss": -36.188716888427734, "global_step": 184906, "epoch": 1528} {"train_loss": -35.96661376953125, "global_step": 184907, "epoch": 1528} {"train_loss": -32.42251205444336, "global_step": 184908, "epoch": 1528} {"train_loss": -40.35071563720703, "global_step": 184909, "epoch": 1528} {"train_loss": -37.419158935546875, "global_step": 184910, "epoch": 1528} {"train_loss": -38.3825798034668, "global_step": 184911, "epoch": 1528} {"train_loss": -40.19960021972656, "global_step": 184912, "epoch": 1528} {"train_loss": -38.7824592590332, "global_step": 184913, "epoch": 1528} {"train_loss": -39.2813720703125, "global_step": 184914, "epoch": 1528} {"train_loss": -32.51401901245117, "global_step": 184915, "epoch": 1528} {"train_loss": -38.72980880737305, "global_step": 184916, "epoch": 1528} {"train_loss": -37.75898361206055, "global_step": 184917, "epoch": 1528} {"train_loss": -39.77749252319336, "global_step": 184918, "epoch": 1528} {"train_loss": -38.88576889038086, "global_step": 184919, "epoch": 1528} {"train_loss": -37.99561309814453, "global_step": 184920, "epoch": 1528} {"train_loss": -38.88676834106445, "global_step": 184921, "epoch": 1528} {"train_loss": -39.43841552734375, "global_step": 184922, "epoch": 1528} {"train_loss": -37.58503341674805, "global_step": 184923, "epoch": 1528} {"train_loss": -39.323219299316406, "global_step": 184924, "epoch": 1528} {"train_loss": -39.302467346191406, "global_step": 184925, "epoch": 1528} {"train_loss": -40.47184371948242, "global_step": 184926, "epoch": 1528} {"train_loss": -39.76729965209961, "global_step": 184927, "epoch": 1528} {"train_loss": -38.68662643432617, "global_step": 184928, "epoch": 1528} {"train_loss": -39.30952835083008, "global_step": 184929, "epoch": 1528} {"train_loss": -38.721248626708984, "global_step": 184930, "epoch": 1528} {"train_loss": -39.96805953979492, "global_step": 184931, "epoch": 1528} {"train_loss": -40.368953704833984, "global_step": 184932, "epoch": 1528} {"train_loss": -40.06720733642578, "global_step": 184933, "epoch": 1528} {"train_loss": -37.64437484741211, "global_step": 184934, "epoch": 1528} {"train_loss": -39.980995178222656, "global_step": 184935, "epoch": 1528} {"train_loss": -38.54543685913086, "global_step": 184936, "epoch": 1528} {"train_loss": -40.316314697265625, "global_step": 184937, "epoch": 1528} {"train_loss": -40.40363311767578, "global_step": 184938, "epoch": 1528} {"train_loss": -39.17630386352539, "global_step": 184939, "epoch": 1528} {"train_loss": -40.054168701171875, "global_step": 184940, "epoch": 1528} {"train_loss": -40.05958938598633, "global_step": 184941, "epoch": 1528} {"train_loss": -40.16750717163086, "global_step": 184942, "epoch": 1528} {"train_loss": -39.726417541503906, "global_step": 184943, "epoch": 1528} {"train_loss": -39.55117416381836, "global_step": 184944, "epoch": 1528} {"train_loss": -40.16057586669922, "global_step": 184945, "epoch": 1528} {"train_loss": -40.48265838623047, "global_step": 184946, "epoch": 1528} {"train_loss": -40.56233596801758, "global_step": 184947, "epoch": 1528} {"train_loss": -40.757503509521484, "global_step": 184948, "epoch": 1528} {"train_loss": -39.72026062011719, "global_step": 184949, "epoch": 1528} {"train_loss": -39.45368194580078, "global_step": 184950, "epoch": 1528} {"train_loss": -39.97660446166992, "global_step": 184951, "epoch": 1528} {"train_loss": -40.60315704345703, "global_step": 184952, "epoch": 1528} {"train_loss": -39.0999755859375, "global_step": 184953, "epoch": 1528} {"train_loss": -41.28831481933594, "global_step": 184954, "epoch": 1528} {"train_loss": -39.42167282104492, "global_step": 184955, "epoch": 1528} {"train_loss": -40.57020950317383, "global_step": 184956, "epoch": 1528} {"train_loss": -40.73960494995117, "global_step": 184957, "epoch": 1528} {"train_loss": -40.8790283203125, "global_step": 184958, "epoch": 1528} {"train_loss": -40.14423370361328, "global_step": 184959, "epoch": 1528} {"train_loss": -39.95277786254883, "global_step": 184960, "epoch": 1528} {"train_loss": -39.90332794189453, "global_step": 184961, "epoch": 1528} {"train_loss": -40.51399612426758, "global_step": 184962, "epoch": 1528} {"train_loss": -39.97379684448242, "global_step": 184963, "epoch": 1528} {"train_loss": -41.07141876220703, "global_step": 184964, "epoch": 1528} {"train_loss": -40.430641174316406, "global_step": 184965, "epoch": 1528} {"train_loss": -40.3486213684082, "global_step": 184966, "epoch": 1528} {"train_loss": -40.043556213378906, "global_step": 184967, "epoch": 1528} {"train_loss": -40.973236083984375, "global_step": 184968, "epoch": 1528} {"train_loss": -40.90073776245117, "global_step": 184969, "epoch": 1528} {"train_loss": -41.412330627441406, "global_step": 184970, "epoch": 1528} {"train_loss": -40.894569396972656, "global_step": 184971, "epoch": 1528} {"train_loss": -40.02094650268555, "global_step": 184972, "epoch": 1528} {"train_loss": -40.77406311035156, "global_step": 184973, "epoch": 1528} {"train_loss": -40.50642013549805, "global_step": 184974, "epoch": 1528} {"train_loss": -39.05475616455078, "global_step": 184975, "epoch": 1528} {"train_loss": -40.20769119262695, "global_step": 184976, "epoch": 1528} {"train_loss": -40.439998626708984, "global_step": 184977, "epoch": 1528} {"train_loss": -34.24248123168945, "global_step": 184978, "epoch": 1528} {"train_loss": -39.222286224365234, "global_step": 184979, "epoch": 1528} {"train_loss": -38.699790954589844, "global_step": 184980, "epoch": 1528} {"train_loss": -40.830684661865234, "global_step": 184981, "epoch": 1528} {"train_loss": -39.75716781616211, "global_step": 184982, "epoch": 1528} {"train_loss": -41.3138542175293, "global_step": 184983, "epoch": 1528} {"train_loss": -39.58871078491211, "global_step": 184984, "epoch": 1528} {"train_loss": -39.897281646728516, "global_step": 184985, "epoch": 1528} {"train_loss": -40.54661178588867, "global_step": 184986, "epoch": 1528} {"train_loss": -40.42832565307617, "global_step": 184987, "epoch": 1528} {"train_loss": -40.096343994140625, "global_step": 184988, "epoch": 1528} {"train_loss": -40.74287796020508, "global_step": 184989, "epoch": 1528} {"train_loss": -40.29911422729492, "global_step": 184990, "epoch": 1528} {"train_loss": -40.31096267700195, "global_step": 184991, "epoch": 1528} {"train_loss": -39.49597930908203, "global_step": 184992, "epoch": 1528} {"train_loss": -40.413551330566406, "global_step": 184993, "epoch": 1528} {"train_loss": -40.2772331237793, "global_step": 184994, "epoch": 1528} {"train_loss": -40.92019271850586, "global_step": 184995, "epoch": 1528} {"train_loss": -39.38376998901367, "global_step": 184996, "epoch": 1528} {"train_loss": -40.772987365722656, "global_step": 184997, "epoch": 1528} {"train_loss": -36.65614700317383, "global_step": 184998, "epoch": 1528} {"train_loss": -39.594886779785156, "global_step": 184999, "epoch": 1528} {"train_loss": -40.28849792480469, "global_step": 185000, "epoch": 1528} {"train_loss": -39.10028076171875, "global_step": 185001, "epoch": 1528} {"train_loss": -40.74098587036133, "global_step": 185002, "epoch": 1528} {"train_loss": -39.59392166137695, "global_step": 185003, "epoch": 1528} {"train_loss": -40.81276321411133, "global_step": 185004, "epoch": 1528} {"train_loss": -39.28175735473633, "global_step": 185005, "epoch": 1528} {"train_loss": -38.901275634765625, "global_step": 185006, "epoch": 1528} {"train_loss": -38.31095504760742, "global_step": 185007, "epoch": 1528} {"train_loss": -39.27335250476175, "global_step": 185008, "epoch": 1528, "val_loss": 2675790.75} {"train_loss": -41.410770416259766, "global_step": 185009, "epoch": 1529} {"train_loss": -40.210384368896484, "global_step": 185010, "epoch": 1529} {"train_loss": -41.383094787597656, "global_step": 185011, "epoch": 1529} {"train_loss": -41.118995666503906, "global_step": 185012, "epoch": 1529} {"train_loss": -41.01959228515625, "global_step": 185013, "epoch": 1529} {"train_loss": -41.2547607421875, "global_step": 185014, "epoch": 1529} {"train_loss": -40.06011962890625, "global_step": 185015, "epoch": 1529} {"train_loss": -38.821407318115234, "global_step": 185016, "epoch": 1529} {"train_loss": -40.654998779296875, "global_step": 185017, "epoch": 1529} {"train_loss": -40.098426818847656, "global_step": 185018, "epoch": 1529} {"train_loss": -40.58662033081055, "global_step": 185019, "epoch": 1529} {"train_loss": -40.23586654663086, "global_step": 185020, "epoch": 1529} {"train_loss": -36.039146423339844, "global_step": 185021, "epoch": 1529} {"train_loss": -40.100257873535156, "global_step": 185022, "epoch": 1529} {"train_loss": -39.750362396240234, "global_step": 185023, "epoch": 1529} {"train_loss": -37.16450119018555, "global_step": 185024, "epoch": 1529} {"train_loss": -38.61959457397461, "global_step": 185025, "epoch": 1529} {"train_loss": -37.52817916870117, "global_step": 185026, "epoch": 1529} {"train_loss": -39.78335189819336, "global_step": 185027, "epoch": 1529} {"train_loss": -40.36981201171875, "global_step": 185028, "epoch": 1529} {"train_loss": -34.55312728881836, "global_step": 185029, "epoch": 1529} {"train_loss": -36.14152145385742, "global_step": 185030, "epoch": 1529} {"train_loss": -39.063350677490234, "global_step": 185031, "epoch": 1529} {"train_loss": -35.44439697265625, "global_step": 185032, "epoch": 1529} {"train_loss": -40.0577278137207, "global_step": 185033, "epoch": 1529} {"train_loss": -39.77391052246094, "global_step": 185034, "epoch": 1529} {"train_loss": -39.273799896240234, "global_step": 185035, "epoch": 1529} {"train_loss": -39.972808837890625, "global_step": 185036, "epoch": 1529} {"train_loss": -39.38901901245117, "global_step": 185037, "epoch": 1529} {"train_loss": -37.624267578125, "global_step": 185038, "epoch": 1529} {"train_loss": -39.32997131347656, "global_step": 185039, "epoch": 1529} {"train_loss": -40.70061111450195, "global_step": 185040, "epoch": 1529} {"train_loss": -39.81264877319336, "global_step": 185041, "epoch": 1529} {"train_loss": -39.37778854370117, "global_step": 185042, "epoch": 1529} {"train_loss": -40.76616287231445, "global_step": 185043, "epoch": 1529} {"train_loss": -40.189144134521484, "global_step": 185044, "epoch": 1529} {"train_loss": -40.14788818359375, "global_step": 185045, "epoch": 1529} {"train_loss": -40.36988067626953, "global_step": 185046, "epoch": 1529} {"train_loss": -40.813232421875, "global_step": 185047, "epoch": 1529} {"train_loss": -40.32107925415039, "global_step": 185048, "epoch": 1529} {"train_loss": -40.22024154663086, "global_step": 185049, "epoch": 1529} {"train_loss": -40.15081787109375, "global_step": 185050, "epoch": 1529} {"train_loss": -39.46560287475586, "global_step": 185051, "epoch": 1529} {"train_loss": -40.19729232788086, "global_step": 185052, "epoch": 1529} {"train_loss": -40.24190139770508, "global_step": 185053, "epoch": 1529} {"train_loss": -39.8570671081543, "global_step": 185054, "epoch": 1529} {"train_loss": -38.746795654296875, "global_step": 185055, "epoch": 1529} {"train_loss": -39.700462341308594, "global_step": 185056, "epoch": 1529} {"train_loss": -40.53652572631836, "global_step": 185057, "epoch": 1529} {"train_loss": -41.27373504638672, "global_step": 185058, "epoch": 1529} {"train_loss": -39.559452056884766, "global_step": 185059, "epoch": 1529} {"train_loss": -39.65151596069336, "global_step": 185060, "epoch": 1529} {"train_loss": -38.82563400268555, "global_step": 185061, "epoch": 1529} {"train_loss": -38.10163497924805, "global_step": 185062, "epoch": 1529} {"train_loss": -40.977142333984375, "global_step": 185063, "epoch": 1529} {"train_loss": -40.855342864990234, "global_step": 185064, "epoch": 1529} {"train_loss": -41.016387939453125, "global_step": 185065, "epoch": 1529} {"train_loss": -41.099308013916016, "global_step": 185066, "epoch": 1529} {"train_loss": -40.763153076171875, "global_step": 185067, "epoch": 1529} {"train_loss": -40.60106658935547, "global_step": 185068, "epoch": 1529} {"train_loss": -40.902931213378906, "global_step": 185069, "epoch": 1529} {"train_loss": -41.36561965942383, "global_step": 185070, "epoch": 1529} {"train_loss": -40.85418701171875, "global_step": 185071, "epoch": 1529} {"train_loss": -40.87916946411133, "global_step": 185072, "epoch": 1529} {"train_loss": -41.361732482910156, "global_step": 185073, "epoch": 1529} {"train_loss": -41.3991813659668, "global_step": 185074, "epoch": 1529} {"train_loss": -41.0948600769043, "global_step": 185075, "epoch": 1529} {"train_loss": -40.71816635131836, "global_step": 185076, "epoch": 1529} {"train_loss": -41.330833435058594, "global_step": 185077, "epoch": 1529} {"train_loss": -41.24494552612305, "global_step": 185078, "epoch": 1529} {"train_loss": -40.724422454833984, "global_step": 185079, "epoch": 1529} {"train_loss": -41.64372634887695, "global_step": 185080, "epoch": 1529} {"train_loss": -40.79683303833008, "global_step": 185081, "epoch": 1529} {"train_loss": -41.32476806640625, "global_step": 185082, "epoch": 1529} {"train_loss": -40.84766387939453, "global_step": 185083, "epoch": 1529} {"train_loss": -41.00855255126953, "global_step": 185084, "epoch": 1529} {"train_loss": -40.640682220458984, "global_step": 185085, "epoch": 1529} {"train_loss": -39.551021575927734, "global_step": 185086, "epoch": 1529} {"train_loss": -37.71945571899414, "global_step": 185087, "epoch": 1529} {"train_loss": -31.883405685424805, "global_step": 185088, "epoch": 1529} {"train_loss": -21.495655059814453, "global_step": 185089, "epoch": 1529} {"train_loss": -17.419689178466797, "global_step": 185090, "epoch": 1529} {"train_loss": -35.17677307128906, "global_step": 185091, "epoch": 1529} {"train_loss": -36.7009391784668, "global_step": 185092, "epoch": 1529} {"train_loss": -29.128652572631836, "global_step": 185093, "epoch": 1529} {"train_loss": -39.28866195678711, "global_step": 185094, "epoch": 1529} {"train_loss": -34.766578674316406, "global_step": 185095, "epoch": 1529} {"train_loss": -38.41463851928711, "global_step": 185096, "epoch": 1529} {"train_loss": -34.053627014160156, "global_step": 185097, "epoch": 1529} {"train_loss": -36.72683334350586, "global_step": 185098, "epoch": 1529} {"train_loss": -38.470394134521484, "global_step": 185099, "epoch": 1529} {"train_loss": -37.10882568359375, "global_step": 185100, "epoch": 1529} {"train_loss": -37.43916320800781, "global_step": 185101, "epoch": 1529} {"train_loss": -37.76758575439453, "global_step": 185102, "epoch": 1529} {"train_loss": -37.788028717041016, "global_step": 185103, "epoch": 1529} {"train_loss": -38.121368408203125, "global_step": 185104, "epoch": 1529} {"train_loss": -38.656063079833984, "global_step": 185105, "epoch": 1529} {"train_loss": -39.21694564819336, "global_step": 185106, "epoch": 1529} {"train_loss": -38.7331657409668, "global_step": 185107, "epoch": 1529} {"train_loss": -39.5933837890625, "global_step": 185108, "epoch": 1529} {"train_loss": -38.061275482177734, "global_step": 185109, "epoch": 1529} {"train_loss": -39.470367431640625, "global_step": 185110, "epoch": 1529} {"train_loss": -38.99201583862305, "global_step": 185111, "epoch": 1529} {"train_loss": -39.003761291503906, "global_step": 185112, "epoch": 1529} {"train_loss": -39.7279052734375, "global_step": 185113, "epoch": 1529} {"train_loss": -39.50710678100586, "global_step": 185114, "epoch": 1529} {"train_loss": -39.77174377441406, "global_step": 185115, "epoch": 1529} {"train_loss": -39.57192611694336, "global_step": 185116, "epoch": 1529} {"train_loss": -39.35566711425781, "global_step": 185117, "epoch": 1529} {"train_loss": -40.53139114379883, "global_step": 185118, "epoch": 1529} {"train_loss": -40.11355209350586, "global_step": 185119, "epoch": 1529} {"train_loss": -40.13941192626953, "global_step": 185120, "epoch": 1529} {"train_loss": -40.03532028198242, "global_step": 185121, "epoch": 1529} {"train_loss": -40.106040954589844, "global_step": 185122, "epoch": 1529} {"train_loss": -40.27693557739258, "global_step": 185123, "epoch": 1529} {"train_loss": -40.46079635620117, "global_step": 185124, "epoch": 1529} {"train_loss": -40.03822708129883, "global_step": 185125, "epoch": 1529} {"train_loss": -40.343265533447266, "global_step": 185126, "epoch": 1529} {"train_loss": -40.66548538208008, "global_step": 185127, "epoch": 1529} {"train_loss": -39.73870086669922, "global_step": 185128, "epoch": 1529} {"train_loss": -39.09495910140109, "global_step": 185129, "epoch": 1529, "val_loss": 2636273.0} {"train_loss": -40.52828598022461, "global_step": 185130, "epoch": 1530} {"train_loss": -40.91864013671875, "global_step": 185131, "epoch": 1530} {"train_loss": -40.28678512573242, "global_step": 185132, "epoch": 1530} {"train_loss": -40.8854866027832, "global_step": 185133, "epoch": 1530} {"train_loss": -40.80392074584961, "global_step": 185134, "epoch": 1530} {"train_loss": -41.237178802490234, "global_step": 185135, "epoch": 1530} {"train_loss": -40.595069885253906, "global_step": 185136, "epoch": 1530} {"train_loss": -40.632049560546875, "global_step": 185137, "epoch": 1530} {"train_loss": -40.78329086303711, "global_step": 185138, "epoch": 1530} {"train_loss": -40.7508544921875, "global_step": 185139, "epoch": 1530} {"train_loss": -40.958404541015625, "global_step": 185140, "epoch": 1530} {"train_loss": -41.23368453979492, "global_step": 185141, "epoch": 1530} {"train_loss": -41.205657958984375, "global_step": 185142, "epoch": 1530} {"train_loss": -41.25681686401367, "global_step": 185143, "epoch": 1530} {"train_loss": -41.41892623901367, "global_step": 185144, "epoch": 1530} {"train_loss": -40.925296783447266, "global_step": 185145, "epoch": 1530} {"train_loss": -40.53697204589844, "global_step": 185146, "epoch": 1530} {"train_loss": -41.53630447387695, "global_step": 185147, "epoch": 1530} {"train_loss": -41.44777297973633, "global_step": 185148, "epoch": 1530} {"train_loss": -41.21071243286133, "global_step": 185149, "epoch": 1530} {"train_loss": -41.300960540771484, "global_step": 185150, "epoch": 1530} {"train_loss": -41.83514404296875, "global_step": 185151, "epoch": 1530} {"train_loss": -41.35456466674805, "global_step": 185152, "epoch": 1530} {"train_loss": -41.026283264160156, "global_step": 185153, "epoch": 1530} {"train_loss": -41.50979232788086, "global_step": 185154, "epoch": 1530} {"train_loss": -41.818389892578125, "global_step": 185155, "epoch": 1530} {"train_loss": -40.8614616394043, "global_step": 185156, "epoch": 1530} {"train_loss": -41.87474822998047, "global_step": 185157, "epoch": 1530} {"train_loss": -41.76628875732422, "global_step": 185158, "epoch": 1530} {"train_loss": -41.1435661315918, "global_step": 185159, "epoch": 1530} {"train_loss": -41.55858612060547, "global_step": 185160, "epoch": 1530} {"train_loss": -41.40582275390625, "global_step": 185161, "epoch": 1530} {"train_loss": -41.33241653442383, "global_step": 185162, "epoch": 1530} {"train_loss": -42.03977584838867, "global_step": 185163, "epoch": 1530} {"train_loss": -41.85331344604492, "global_step": 185164, "epoch": 1530} {"train_loss": -41.94168472290039, "global_step": 185165, "epoch": 1530} {"train_loss": -42.181453704833984, "global_step": 185166, "epoch": 1530} {"train_loss": -41.947227478027344, "global_step": 185167, "epoch": 1530} {"train_loss": -41.788551330566406, "global_step": 185168, "epoch": 1530} {"train_loss": -42.055335998535156, "global_step": 185169, "epoch": 1530} {"train_loss": -41.388607025146484, "global_step": 185170, "epoch": 1530} {"train_loss": -41.93204879760742, "global_step": 185171, "epoch": 1530} {"train_loss": -42.09444046020508, "global_step": 185172, "epoch": 1530} {"train_loss": -42.26681137084961, "global_step": 185173, "epoch": 1530} {"train_loss": -41.788063049316406, "global_step": 185174, "epoch": 1530} {"train_loss": -41.91994857788086, "global_step": 185175, "epoch": 1530} {"train_loss": -41.964210510253906, "global_step": 185176, "epoch": 1530} {"train_loss": -42.50729751586914, "global_step": 185177, "epoch": 1530} {"train_loss": -42.31624984741211, "global_step": 185178, "epoch": 1530} {"train_loss": -42.3390007019043, "global_step": 185179, "epoch": 1530} {"train_loss": -40.64892578125, "global_step": 185180, "epoch": 1530} {"train_loss": -42.38291549682617, "global_step": 185181, "epoch": 1530} {"train_loss": -42.04045486450195, "global_step": 185182, "epoch": 1530} {"train_loss": -42.38828659057617, "global_step": 185183, "epoch": 1530} {"train_loss": -42.35459518432617, "global_step": 185184, "epoch": 1530} {"train_loss": -40.14688491821289, "global_step": 185185, "epoch": 1530} {"train_loss": -39.867759704589844, "global_step": 185186, "epoch": 1530} {"train_loss": -40.99622344970703, "global_step": 185187, "epoch": 1530} {"train_loss": -41.24312973022461, "global_step": 185188, "epoch": 1530} {"train_loss": -41.612640380859375, "global_step": 185189, "epoch": 1530} {"train_loss": -41.33743667602539, "global_step": 185190, "epoch": 1530} {"train_loss": -42.09967803955078, "global_step": 185191, "epoch": 1530} {"train_loss": -42.440040588378906, "global_step": 185192, "epoch": 1530} {"train_loss": -42.06209182739258, "global_step": 185193, "epoch": 1530} {"train_loss": -41.65000915527344, "global_step": 185194, "epoch": 1530} {"train_loss": -39.49355697631836, "global_step": 185195, "epoch": 1530} {"train_loss": -38.449161529541016, "global_step": 185196, "epoch": 1530} {"train_loss": -38.918251037597656, "global_step": 185197, "epoch": 1530} {"train_loss": -39.39864730834961, "global_step": 185198, "epoch": 1530} {"train_loss": -38.589595794677734, "global_step": 185199, "epoch": 1530} {"train_loss": -33.36807632446289, "global_step": 185200, "epoch": 1530} {"train_loss": -30.255407333374023, "global_step": 185201, "epoch": 1530} {"train_loss": -34.62165832519531, "global_step": 185202, "epoch": 1530} {"train_loss": -37.03217697143555, "global_step": 185203, "epoch": 1530} {"train_loss": -38.08945846557617, "global_step": 185204, "epoch": 1530} {"train_loss": -39.365509033203125, "global_step": 185205, "epoch": 1530} {"train_loss": -37.33453369140625, "global_step": 185206, "epoch": 1530} {"train_loss": -37.42950439453125, "global_step": 185207, "epoch": 1530} {"train_loss": -41.01327896118164, "global_step": 185208, "epoch": 1530} {"train_loss": -37.43885040283203, "global_step": 185209, "epoch": 1530} {"train_loss": -39.391815185546875, "global_step": 185210, "epoch": 1530} {"train_loss": -40.29941940307617, "global_step": 185211, "epoch": 1530} {"train_loss": -39.101680755615234, "global_step": 185212, "epoch": 1530} {"train_loss": -40.408042907714844, "global_step": 185213, "epoch": 1530} {"train_loss": -39.3804817199707, "global_step": 185214, "epoch": 1530} {"train_loss": -39.290679931640625, "global_step": 185215, "epoch": 1530} {"train_loss": -38.16483688354492, "global_step": 185216, "epoch": 1530} {"train_loss": -38.45261764526367, "global_step": 185217, "epoch": 1530} {"train_loss": -39.35845947265625, "global_step": 185218, "epoch": 1530} {"train_loss": -36.924713134765625, "global_step": 185219, "epoch": 1530} {"train_loss": -40.118038177490234, "global_step": 185220, "epoch": 1530} {"train_loss": -38.712032318115234, "global_step": 185221, "epoch": 1530} {"train_loss": -40.98369598388672, "global_step": 185222, "epoch": 1530} {"train_loss": -38.54726791381836, "global_step": 185223, "epoch": 1530} {"train_loss": -40.17094039916992, "global_step": 185224, "epoch": 1530} {"train_loss": -39.714202880859375, "global_step": 185225, "epoch": 1530} {"train_loss": -39.307708740234375, "global_step": 185226, "epoch": 1530} {"train_loss": -40.261348724365234, "global_step": 185227, "epoch": 1530} {"train_loss": -39.09305953979492, "global_step": 185228, "epoch": 1530} {"train_loss": -39.97402572631836, "global_step": 185229, "epoch": 1530} {"train_loss": -40.19244384765625, "global_step": 185230, "epoch": 1530} {"train_loss": -40.1928825378418, "global_step": 185231, "epoch": 1530} {"train_loss": -40.24223709106445, "global_step": 185232, "epoch": 1530} {"train_loss": -41.208702087402344, "global_step": 185233, "epoch": 1530} {"train_loss": -40.4879264831543, "global_step": 185234, "epoch": 1530} {"train_loss": -40.93369674682617, "global_step": 185235, "epoch": 1530} {"train_loss": -40.67629623413086, "global_step": 185236, "epoch": 1530} {"train_loss": -41.2588996887207, "global_step": 185237, "epoch": 1530} {"train_loss": -40.8237419128418, "global_step": 185238, "epoch": 1530} {"train_loss": -41.339962005615234, "global_step": 185239, "epoch": 1530} {"train_loss": -41.09648895263672, "global_step": 185240, "epoch": 1530} {"train_loss": -41.0788688659668, "global_step": 185241, "epoch": 1530} {"train_loss": -40.39432907104492, "global_step": 185242, "epoch": 1530} {"train_loss": -41.46479415893555, "global_step": 185243, "epoch": 1530} {"train_loss": -41.07207107543945, "global_step": 185244, "epoch": 1530} {"train_loss": -41.418392181396484, "global_step": 185245, "epoch": 1530} {"train_loss": -41.42960739135742, "global_step": 185246, "epoch": 1530} {"train_loss": -41.356781005859375, "global_step": 185247, "epoch": 1530} {"train_loss": -41.7228889465332, "global_step": 185248, "epoch": 1530} {"train_loss": -41.200496673583984, "global_step": 185249, "epoch": 1530} {"train_loss": -40.53853120094489, "global_step": 185250, "epoch": 1530, "val_loss": 2664270.25} {"train_loss": -41.80108642578125, "global_step": 185251, "epoch": 1531} {"train_loss": -41.6290283203125, "global_step": 185252, "epoch": 1531} {"train_loss": -41.22761154174805, "global_step": 185253, "epoch": 1531} {"train_loss": -41.611236572265625, "global_step": 185254, "epoch": 1531} {"train_loss": -41.00509262084961, "global_step": 185255, "epoch": 1531} {"train_loss": -41.742225646972656, "global_step": 185256, "epoch": 1531} {"train_loss": -40.8264045715332, "global_step": 185257, "epoch": 1531} {"train_loss": -41.621002197265625, "global_step": 185258, "epoch": 1531} {"train_loss": -41.2638053894043, "global_step": 185259, "epoch": 1531} {"train_loss": -41.66227340698242, "global_step": 185260, "epoch": 1531} {"train_loss": -41.57071304321289, "global_step": 185261, "epoch": 1531} {"train_loss": -41.91014099121094, "global_step": 185262, "epoch": 1531} {"train_loss": -42.06728744506836, "global_step": 185263, "epoch": 1531} {"train_loss": -40.224666595458984, "global_step": 185264, "epoch": 1531} {"train_loss": -41.38056564331055, "global_step": 185265, "epoch": 1531} {"train_loss": -41.63532638549805, "global_step": 185266, "epoch": 1531} {"train_loss": -42.1203498840332, "global_step": 185267, "epoch": 1531} {"train_loss": -42.078704833984375, "global_step": 185268, "epoch": 1531} {"train_loss": -38.75411605834961, "global_step": 185269, "epoch": 1531} {"train_loss": -42.02763748168945, "global_step": 185270, "epoch": 1531} {"train_loss": -42.09733581542969, "global_step": 185271, "epoch": 1531} {"train_loss": -41.7885627746582, "global_step": 185272, "epoch": 1531} {"train_loss": -41.394832611083984, "global_step": 185273, "epoch": 1531} {"train_loss": -41.806190490722656, "global_step": 185274, "epoch": 1531} {"train_loss": -40.97579574584961, "global_step": 185275, "epoch": 1531} {"train_loss": -41.8949089050293, "global_step": 185276, "epoch": 1531} {"train_loss": -41.84535598754883, "global_step": 185277, "epoch": 1531} {"train_loss": -42.00087356567383, "global_step": 185278, "epoch": 1531} {"train_loss": -42.23252487182617, "global_step": 185279, "epoch": 1531} {"train_loss": -41.66242599487305, "global_step": 185280, "epoch": 1531} {"train_loss": -40.44618606567383, "global_step": 185281, "epoch": 1531} {"train_loss": -41.93049621582031, "global_step": 185282, "epoch": 1531} {"train_loss": -42.11927795410156, "global_step": 185283, "epoch": 1531} {"train_loss": -41.41485595703125, "global_step": 185284, "epoch": 1531} {"train_loss": -41.96372604370117, "global_step": 185285, "epoch": 1531} {"train_loss": -42.285194396972656, "global_step": 185286, "epoch": 1531} {"train_loss": -39.27898406982422, "global_step": 185287, "epoch": 1531} {"train_loss": -41.6239128112793, "global_step": 185288, "epoch": 1531} {"train_loss": -41.67477035522461, "global_step": 185289, "epoch": 1531} {"train_loss": -41.3682746887207, "global_step": 185290, "epoch": 1531} {"train_loss": -37.5721435546875, "global_step": 185291, "epoch": 1531} {"train_loss": -40.900150299072266, "global_step": 185292, "epoch": 1531} {"train_loss": -38.77730178833008, "global_step": 185293, "epoch": 1531} {"train_loss": -41.57011795043945, "global_step": 185294, "epoch": 1531} {"train_loss": -38.195709228515625, "global_step": 185295, "epoch": 1531} {"train_loss": -40.18217086791992, "global_step": 185296, "epoch": 1531} {"train_loss": -39.417640686035156, "global_step": 185297, "epoch": 1531} {"train_loss": -39.313575744628906, "global_step": 185298, "epoch": 1531} {"train_loss": -39.3274040222168, "global_step": 185299, "epoch": 1531} {"train_loss": -40.22676467895508, "global_step": 185300, "epoch": 1531} {"train_loss": -40.92459487915039, "global_step": 185301, "epoch": 1531} {"train_loss": -39.06600570678711, "global_step": 185302, "epoch": 1531} {"train_loss": -37.33393478393555, "global_step": 185303, "epoch": 1531} {"train_loss": -39.69646453857422, "global_step": 185304, "epoch": 1531} {"train_loss": -40.88510513305664, "global_step": 185305, "epoch": 1531} {"train_loss": -37.1601448059082, "global_step": 185306, "epoch": 1531} {"train_loss": -40.57585906982422, "global_step": 185307, "epoch": 1531} {"train_loss": -40.3918571472168, "global_step": 185308, "epoch": 1531} {"train_loss": -33.8471794128418, "global_step": 185309, "epoch": 1531} {"train_loss": -36.9995002746582, "global_step": 185310, "epoch": 1531} {"train_loss": -41.253360748291016, "global_step": 185311, "epoch": 1531} {"train_loss": -40.91659164428711, "global_step": 185312, "epoch": 1531} {"train_loss": -40.17201614379883, "global_step": 185313, "epoch": 1531} {"train_loss": -39.412086486816406, "global_step": 185314, "epoch": 1531} {"train_loss": -39.7552490234375, "global_step": 185315, "epoch": 1531} {"train_loss": -41.0916633605957, "global_step": 185316, "epoch": 1531} {"train_loss": -40.310455322265625, "global_step": 185317, "epoch": 1531} {"train_loss": -40.77737808227539, "global_step": 185318, "epoch": 1531} {"train_loss": -40.85026550292969, "global_step": 185319, "epoch": 1531} {"train_loss": -41.2922477722168, "global_step": 185320, "epoch": 1531} {"train_loss": -41.106781005859375, "global_step": 185321, "epoch": 1531} {"train_loss": -38.30954360961914, "global_step": 185322, "epoch": 1531} {"train_loss": -40.26429748535156, "global_step": 185323, "epoch": 1531} {"train_loss": -40.78657913208008, "global_step": 185324, "epoch": 1531} {"train_loss": -37.689430236816406, "global_step": 185325, "epoch": 1531} {"train_loss": -41.729827880859375, "global_step": 185326, "epoch": 1531} {"train_loss": -40.7698860168457, "global_step": 185327, "epoch": 1531} {"train_loss": -41.56829833984375, "global_step": 185328, "epoch": 1531} {"train_loss": -41.0265007019043, "global_step": 185329, "epoch": 1531} {"train_loss": -41.240386962890625, "global_step": 185330, "epoch": 1531} {"train_loss": -41.07707595825195, "global_step": 185331, "epoch": 1531} {"train_loss": -41.559181213378906, "global_step": 185332, "epoch": 1531} {"train_loss": -39.685489654541016, "global_step": 185333, "epoch": 1531} {"train_loss": -40.26200485229492, "global_step": 185334, "epoch": 1531} {"train_loss": -40.80024337768555, "global_step": 185335, "epoch": 1531} {"train_loss": -40.69068145751953, "global_step": 185336, "epoch": 1531} {"train_loss": -40.8036994934082, "global_step": 185337, "epoch": 1531} {"train_loss": -41.034515380859375, "global_step": 185338, "epoch": 1531} {"train_loss": -41.574642181396484, "global_step": 185339, "epoch": 1531} {"train_loss": -41.69266891479492, "global_step": 185340, "epoch": 1531} {"train_loss": -40.583099365234375, "global_step": 185341, "epoch": 1531} {"train_loss": -40.81467819213867, "global_step": 185342, "epoch": 1531} {"train_loss": -40.9264030456543, "global_step": 185343, "epoch": 1531} {"train_loss": -41.10791778564453, "global_step": 185344, "epoch": 1531} {"train_loss": -39.8040771484375, "global_step": 185345, "epoch": 1531} {"train_loss": -41.122859954833984, "global_step": 185346, "epoch": 1531} {"train_loss": -41.30949401855469, "global_step": 185347, "epoch": 1531} {"train_loss": -41.267818450927734, "global_step": 185348, "epoch": 1531} {"train_loss": -37.67348861694336, "global_step": 185349, "epoch": 1531} {"train_loss": -40.99520492553711, "global_step": 185350, "epoch": 1531} {"train_loss": -41.69931411743164, "global_step": 185351, "epoch": 1531} {"train_loss": -40.725948333740234, "global_step": 185352, "epoch": 1531} {"train_loss": -39.99002456665039, "global_step": 185353, "epoch": 1531} {"train_loss": -40.66586685180664, "global_step": 185354, "epoch": 1531} {"train_loss": -39.419776916503906, "global_step": 185355, "epoch": 1531} {"train_loss": -39.632293701171875, "global_step": 185356, "epoch": 1531} {"train_loss": -40.36810302734375, "global_step": 185357, "epoch": 1531} {"train_loss": -40.70784378051758, "global_step": 185358, "epoch": 1531} {"train_loss": -40.085758209228516, "global_step": 185359, "epoch": 1531} {"train_loss": -39.56031799316406, "global_step": 185360, "epoch": 1531} {"train_loss": -41.51740646362305, "global_step": 185361, "epoch": 1531} {"train_loss": -40.019893646240234, "global_step": 185362, "epoch": 1531} {"train_loss": -40.33415603637695, "global_step": 185363, "epoch": 1531} {"train_loss": -40.69063949584961, "global_step": 185364, "epoch": 1531} {"train_loss": -40.339263916015625, "global_step": 185365, "epoch": 1531} {"train_loss": -41.33550262451172, "global_step": 185366, "epoch": 1531} {"train_loss": -40.6385383605957, "global_step": 185367, "epoch": 1531} {"train_loss": -41.16808319091797, "global_step": 185368, "epoch": 1531} {"train_loss": -39.58420944213867, "global_step": 185369, "epoch": 1531} {"train_loss": -40.7408332824707, "global_step": 185370, "epoch": 1531} {"train_loss": -40.635610438575426, "global_step": 185371, "epoch": 1531, "val_loss": 2599222.25} {"train_loss": -39.901947021484375, "global_step": 185372, "epoch": 1532} {"train_loss": -40.04021453857422, "global_step": 185373, "epoch": 1532} {"train_loss": -40.526947021484375, "global_step": 185374, "epoch": 1532} {"train_loss": -39.8491096496582, "global_step": 185375, "epoch": 1532} {"train_loss": -37.0345344543457, "global_step": 185376, "epoch": 1532} {"train_loss": -38.6461181640625, "global_step": 185377, "epoch": 1532} {"train_loss": -40.399478912353516, "global_step": 185378, "epoch": 1532} {"train_loss": -39.920528411865234, "global_step": 185379, "epoch": 1532} {"train_loss": -40.83745193481445, "global_step": 185380, "epoch": 1532} {"train_loss": -39.18129348754883, "global_step": 185381, "epoch": 1532} {"train_loss": -41.54541015625, "global_step": 185382, "epoch": 1532} {"train_loss": -39.37113571166992, "global_step": 185383, "epoch": 1532} {"train_loss": -40.479469299316406, "global_step": 185384, "epoch": 1532} {"train_loss": -38.49878692626953, "global_step": 185385, "epoch": 1532} {"train_loss": -40.90351867675781, "global_step": 185386, "epoch": 1532} {"train_loss": -39.80449295043945, "global_step": 185387, "epoch": 1532} {"train_loss": -40.670265197753906, "global_step": 185388, "epoch": 1532} {"train_loss": -40.31306838989258, "global_step": 185389, "epoch": 1532} {"train_loss": -40.8013801574707, "global_step": 185390, "epoch": 1532} {"train_loss": -40.64323806762695, "global_step": 185391, "epoch": 1532} {"train_loss": -39.12314987182617, "global_step": 185392, "epoch": 1532} {"train_loss": -39.694793701171875, "global_step": 185393, "epoch": 1532} {"train_loss": -36.61696243286133, "global_step": 185394, "epoch": 1532} {"train_loss": -40.791343688964844, "global_step": 185395, "epoch": 1532} {"train_loss": -40.782588958740234, "global_step": 185396, "epoch": 1532} {"train_loss": -40.86625289916992, "global_step": 185397, "epoch": 1532} {"train_loss": -40.316463470458984, "global_step": 185398, "epoch": 1532} {"train_loss": -33.98081588745117, "global_step": 185399, "epoch": 1532} {"train_loss": -38.526607513427734, "global_step": 185400, "epoch": 1532} {"train_loss": -39.79470443725586, "global_step": 185401, "epoch": 1532} {"train_loss": -36.67823028564453, "global_step": 185402, "epoch": 1532} {"train_loss": -38.502960205078125, "global_step": 185403, "epoch": 1532} {"train_loss": -40.20612335205078, "global_step": 185404, "epoch": 1532} {"train_loss": -36.9777946472168, "global_step": 185405, "epoch": 1532} {"train_loss": -38.74226760864258, "global_step": 185406, "epoch": 1532} {"train_loss": -39.12611389160156, "global_step": 185407, "epoch": 1532} {"train_loss": -39.1241569519043, "global_step": 185408, "epoch": 1532} {"train_loss": -37.02120590209961, "global_step": 185409, "epoch": 1532} {"train_loss": -35.3665771484375, "global_step": 185410, "epoch": 1532} {"train_loss": -38.92708969116211, "global_step": 185411, "epoch": 1532} {"train_loss": -38.95868682861328, "global_step": 185412, "epoch": 1532} {"train_loss": -40.026546478271484, "global_step": 185413, "epoch": 1532} {"train_loss": -38.08845138549805, "global_step": 185414, "epoch": 1532} {"train_loss": -38.99428176879883, "global_step": 185415, "epoch": 1532} {"train_loss": -40.057289123535156, "global_step": 185416, "epoch": 1532} {"train_loss": -38.967994689941406, "global_step": 185417, "epoch": 1532} {"train_loss": -37.69022750854492, "global_step": 185418, "epoch": 1532} {"train_loss": -39.151145935058594, "global_step": 185419, "epoch": 1532} {"train_loss": -38.56816864013672, "global_step": 185420, "epoch": 1532} {"train_loss": -38.73969650268555, "global_step": 185421, "epoch": 1532} {"train_loss": -38.99119186401367, "global_step": 185422, "epoch": 1532} {"train_loss": -40.47335433959961, "global_step": 185423, "epoch": 1532} {"train_loss": -40.40894317626953, "global_step": 185424, "epoch": 1532} {"train_loss": -40.509090423583984, "global_step": 185425, "epoch": 1532} {"train_loss": -40.59916305541992, "global_step": 185426, "epoch": 1532} {"train_loss": -39.250335693359375, "global_step": 185427, "epoch": 1532} {"train_loss": -37.155941009521484, "global_step": 185428, "epoch": 1532} {"train_loss": -40.40864181518555, "global_step": 185429, "epoch": 1532} {"train_loss": -37.51217269897461, "global_step": 185430, "epoch": 1532} {"train_loss": -39.6318473815918, "global_step": 185431, "epoch": 1532} {"train_loss": -39.392066955566406, "global_step": 185432, "epoch": 1532} {"train_loss": -37.92576217651367, "global_step": 185433, "epoch": 1532} {"train_loss": -39.5590934753418, "global_step": 185434, "epoch": 1532} {"train_loss": -39.7901725769043, "global_step": 185435, "epoch": 1532} {"train_loss": -40.09897994995117, "global_step": 185436, "epoch": 1532} {"train_loss": -40.1665153503418, "global_step": 185437, "epoch": 1532} {"train_loss": -40.270992279052734, "global_step": 185438, "epoch": 1532} {"train_loss": -41.01658248901367, "global_step": 185439, "epoch": 1532} {"train_loss": -38.332637786865234, "global_step": 185440, "epoch": 1532} {"train_loss": -40.89915084838867, "global_step": 185441, "epoch": 1532} {"train_loss": -40.555023193359375, "global_step": 185442, "epoch": 1532} {"train_loss": -39.37879180908203, "global_step": 185443, "epoch": 1532} {"train_loss": -40.78763961791992, "global_step": 185444, "epoch": 1532} {"train_loss": -39.88938903808594, "global_step": 185445, "epoch": 1532} {"train_loss": -40.58539962768555, "global_step": 185446, "epoch": 1532} {"train_loss": -40.475276947021484, "global_step": 185447, "epoch": 1532} {"train_loss": -38.75333786010742, "global_step": 185448, "epoch": 1532} {"train_loss": -40.30604934692383, "global_step": 185449, "epoch": 1532} {"train_loss": -40.33864974975586, "global_step": 185450, "epoch": 1532} {"train_loss": -40.812294006347656, "global_step": 185451, "epoch": 1532} {"train_loss": -39.39176940917969, "global_step": 185452, "epoch": 1532} {"train_loss": -40.56610870361328, "global_step": 185453, "epoch": 1532} {"train_loss": -39.71416091918945, "global_step": 185454, "epoch": 1532} {"train_loss": -40.82293701171875, "global_step": 185455, "epoch": 1532} {"train_loss": -40.87434387207031, "global_step": 185456, "epoch": 1532} {"train_loss": -39.238529205322266, "global_step": 185457, "epoch": 1532} {"train_loss": -41.36897277832031, "global_step": 185458, "epoch": 1532} {"train_loss": -41.210243225097656, "global_step": 185459, "epoch": 1532} {"train_loss": -40.83409881591797, "global_step": 185460, "epoch": 1532} {"train_loss": -40.35184860229492, "global_step": 185461, "epoch": 1532} {"train_loss": -40.87614059448242, "global_step": 185462, "epoch": 1532} {"train_loss": -41.366519927978516, "global_step": 185463, "epoch": 1532} {"train_loss": -41.226375579833984, "global_step": 185464, "epoch": 1532} {"train_loss": -41.0460090637207, "global_step": 185465, "epoch": 1532} {"train_loss": -40.735504150390625, "global_step": 185466, "epoch": 1532} {"train_loss": -39.30219650268555, "global_step": 185467, "epoch": 1532} {"train_loss": -38.52717971801758, "global_step": 185468, "epoch": 1532} {"train_loss": -40.579769134521484, "global_step": 185469, "epoch": 1532} {"train_loss": -40.93756866455078, "global_step": 185470, "epoch": 1532} {"train_loss": -41.3719596862793, "global_step": 185471, "epoch": 1532} {"train_loss": -40.5648078918457, "global_step": 185472, "epoch": 1532} {"train_loss": -41.61726379394531, "global_step": 185473, "epoch": 1532} {"train_loss": -40.23304748535156, "global_step": 185474, "epoch": 1532} {"train_loss": -40.558258056640625, "global_step": 185475, "epoch": 1532} {"train_loss": -40.72206497192383, "global_step": 185476, "epoch": 1532} {"train_loss": -41.095680236816406, "global_step": 185477, "epoch": 1532} {"train_loss": -41.49401092529297, "global_step": 185478, "epoch": 1532} {"train_loss": -41.31772994995117, "global_step": 185479, "epoch": 1532} {"train_loss": -41.301692962646484, "global_step": 185480, "epoch": 1532} {"train_loss": -41.1801872253418, "global_step": 185481, "epoch": 1532} {"train_loss": -41.195350646972656, "global_step": 185482, "epoch": 1532} {"train_loss": -40.4438591003418, "global_step": 185483, "epoch": 1532} {"train_loss": -39.9527702331543, "global_step": 185484, "epoch": 1532} {"train_loss": -41.01218795776367, "global_step": 185485, "epoch": 1532} {"train_loss": -40.13652801513672, "global_step": 185486, "epoch": 1532} {"train_loss": -40.462459564208984, "global_step": 185487, "epoch": 1532} {"train_loss": -39.64518356323242, "global_step": 185488, "epoch": 1532} {"train_loss": -39.364105224609375, "global_step": 185489, "epoch": 1532} {"train_loss": -40.24091720581055, "global_step": 185490, "epoch": 1532} {"train_loss": -40.500267028808594, "global_step": 185491, "epoch": 1532} {"train_loss": -39.81788247478895, "global_step": 185492, "epoch": 1532, "val_loss": 2660781.25} {"train_loss": -40.170166015625, "global_step": 185493, "epoch": 1533} {"train_loss": -41.14683532714844, "global_step": 185494, "epoch": 1533} {"train_loss": -41.03696823120117, "global_step": 185495, "epoch": 1533} {"train_loss": -40.36759567260742, "global_step": 185496, "epoch": 1533} {"train_loss": -40.26408004760742, "global_step": 185497, "epoch": 1533} {"train_loss": -40.55022048950195, "global_step": 185498, "epoch": 1533} {"train_loss": -40.84957504272461, "global_step": 185499, "epoch": 1533} {"train_loss": -41.084041595458984, "global_step": 185500, "epoch": 1533} {"train_loss": -41.445045471191406, "global_step": 185501, "epoch": 1533} {"train_loss": -41.40296173095703, "global_step": 185502, "epoch": 1533} {"train_loss": -40.46179962158203, "global_step": 185503, "epoch": 1533} {"train_loss": -38.86265182495117, "global_step": 185504, "epoch": 1533} {"train_loss": -38.096981048583984, "global_step": 185505, "epoch": 1533} {"train_loss": -39.808258056640625, "global_step": 185506, "epoch": 1533} {"train_loss": -41.33860397338867, "global_step": 185507, "epoch": 1533} {"train_loss": -40.5149040222168, "global_step": 185508, "epoch": 1533} {"train_loss": -38.38022994995117, "global_step": 185509, "epoch": 1533} {"train_loss": -39.820613861083984, "global_step": 185510, "epoch": 1533} {"train_loss": -40.76509475708008, "global_step": 185511, "epoch": 1533} {"train_loss": -34.18592071533203, "global_step": 185512, "epoch": 1533} {"train_loss": -40.15652084350586, "global_step": 185513, "epoch": 1533} {"train_loss": -40.57523727416992, "global_step": 185514, "epoch": 1533} {"train_loss": -37.76357650756836, "global_step": 185515, "epoch": 1533} {"train_loss": -39.76394271850586, "global_step": 185516, "epoch": 1533} {"train_loss": -40.39019012451172, "global_step": 185517, "epoch": 1533} {"train_loss": -39.81988525390625, "global_step": 185518, "epoch": 1533} {"train_loss": -40.20603561401367, "global_step": 185519, "epoch": 1533} {"train_loss": -39.17998504638672, "global_step": 185520, "epoch": 1533} {"train_loss": -39.48210906982422, "global_step": 185521, "epoch": 1533} {"train_loss": -38.713069915771484, "global_step": 185522, "epoch": 1533} {"train_loss": -38.3010139465332, "global_step": 185523, "epoch": 1533} {"train_loss": -38.97119903564453, "global_step": 185524, "epoch": 1533} {"train_loss": -40.535850524902344, "global_step": 185525, "epoch": 1533} {"train_loss": -39.14229202270508, "global_step": 185526, "epoch": 1533} {"train_loss": -36.74756622314453, "global_step": 185527, "epoch": 1533} {"train_loss": -37.85501480102539, "global_step": 185528, "epoch": 1533} {"train_loss": -41.03410720825195, "global_step": 185529, "epoch": 1533} {"train_loss": -37.90810012817383, "global_step": 185530, "epoch": 1533} {"train_loss": -39.635738372802734, "global_step": 185531, "epoch": 1533} {"train_loss": -40.16624069213867, "global_step": 185532, "epoch": 1533} {"train_loss": -39.68079376220703, "global_step": 185533, "epoch": 1533} {"train_loss": -38.49934005737305, "global_step": 185534, "epoch": 1533} {"train_loss": -37.891395568847656, "global_step": 185535, "epoch": 1533} {"train_loss": -40.157958984375, "global_step": 185536, "epoch": 1533} {"train_loss": -38.16292953491211, "global_step": 185537, "epoch": 1533} {"train_loss": -39.36228561401367, "global_step": 185538, "epoch": 1533} {"train_loss": -39.358062744140625, "global_step": 185539, "epoch": 1533} {"train_loss": -40.2929573059082, "global_step": 185540, "epoch": 1533} {"train_loss": -39.75138473510742, "global_step": 185541, "epoch": 1533} {"train_loss": -40.307552337646484, "global_step": 185542, "epoch": 1533} {"train_loss": -40.013851165771484, "global_step": 185543, "epoch": 1533} {"train_loss": -40.339698791503906, "global_step": 185544, "epoch": 1533} {"train_loss": -40.085872650146484, "global_step": 185545, "epoch": 1533} {"train_loss": -40.11336898803711, "global_step": 185546, "epoch": 1533} {"train_loss": -40.07742691040039, "global_step": 185547, "epoch": 1533} {"train_loss": -40.11121368408203, "global_step": 185548, "epoch": 1533} {"train_loss": -39.54875564575195, "global_step": 185549, "epoch": 1533} {"train_loss": -40.69675827026367, "global_step": 185550, "epoch": 1533} {"train_loss": -41.156837463378906, "global_step": 185551, "epoch": 1533} {"train_loss": -40.14841079711914, "global_step": 185552, "epoch": 1533} {"train_loss": -40.72530746459961, "global_step": 185553, "epoch": 1533} {"train_loss": -40.5446662902832, "global_step": 185554, "epoch": 1533} {"train_loss": -40.67264938354492, "global_step": 185555, "epoch": 1533} {"train_loss": -40.82304000854492, "global_step": 185556, "epoch": 1533} {"train_loss": -40.96464157104492, "global_step": 185557, "epoch": 1533} {"train_loss": -40.35358810424805, "global_step": 185558, "epoch": 1533} {"train_loss": -41.444759368896484, "global_step": 185559, "epoch": 1533} {"train_loss": -40.4144401550293, "global_step": 185560, "epoch": 1533} {"train_loss": -41.09481430053711, "global_step": 185561, "epoch": 1533} {"train_loss": -41.01564025878906, "global_step": 185562, "epoch": 1533} {"train_loss": -41.19082260131836, "global_step": 185563, "epoch": 1533} {"train_loss": -38.13353729248047, "global_step": 185564, "epoch": 1533} {"train_loss": -41.26437759399414, "global_step": 185565, "epoch": 1533} {"train_loss": -41.47843551635742, "global_step": 185566, "epoch": 1533} {"train_loss": -41.4898796081543, "global_step": 185567, "epoch": 1533} {"train_loss": -41.037139892578125, "global_step": 185568, "epoch": 1533} {"train_loss": -41.29482650756836, "global_step": 185569, "epoch": 1533} {"train_loss": -40.94434356689453, "global_step": 185570, "epoch": 1533} {"train_loss": -41.39992141723633, "global_step": 185571, "epoch": 1533} {"train_loss": -41.17551803588867, "global_step": 185572, "epoch": 1533} {"train_loss": -41.83999252319336, "global_step": 185573, "epoch": 1533} {"train_loss": -41.065242767333984, "global_step": 185574, "epoch": 1533} {"train_loss": -40.301082611083984, "global_step": 185575, "epoch": 1533} {"train_loss": -40.42930221557617, "global_step": 185576, "epoch": 1533} {"train_loss": -40.88724899291992, "global_step": 185577, "epoch": 1533} {"train_loss": -41.451534271240234, "global_step": 185578, "epoch": 1533} {"train_loss": -40.808231353759766, "global_step": 185579, "epoch": 1533} {"train_loss": -38.94260787963867, "global_step": 185580, "epoch": 1533} {"train_loss": -40.10183334350586, "global_step": 185581, "epoch": 1533} {"train_loss": -41.252994537353516, "global_step": 185582, "epoch": 1533} {"train_loss": -39.52558898925781, "global_step": 185583, "epoch": 1533} {"train_loss": -39.08171463012695, "global_step": 185584, "epoch": 1533} {"train_loss": -40.12662124633789, "global_step": 185585, "epoch": 1533} {"train_loss": -40.19684982299805, "global_step": 185586, "epoch": 1533} {"train_loss": -41.2870979309082, "global_step": 185587, "epoch": 1533} {"train_loss": -41.5007209777832, "global_step": 185588, "epoch": 1533} {"train_loss": -41.60188674926758, "global_step": 185589, "epoch": 1533} {"train_loss": -41.52782440185547, "global_step": 185590, "epoch": 1533} {"train_loss": -41.98102951049805, "global_step": 185591, "epoch": 1533} {"train_loss": -41.548255920410156, "global_step": 185592, "epoch": 1533} {"train_loss": -40.502349853515625, "global_step": 185593, "epoch": 1533} {"train_loss": -41.7332763671875, "global_step": 185594, "epoch": 1533} {"train_loss": -41.89445877075195, "global_step": 185595, "epoch": 1533} {"train_loss": -40.95442199707031, "global_step": 185596, "epoch": 1533} {"train_loss": -41.94972229003906, "global_step": 185597, "epoch": 1533} {"train_loss": -41.961666107177734, "global_step": 185598, "epoch": 1533} {"train_loss": -41.309200286865234, "global_step": 185599, "epoch": 1533} {"train_loss": -41.79413604736328, "global_step": 185600, "epoch": 1533} {"train_loss": -41.94426727294922, "global_step": 185601, "epoch": 1533} {"train_loss": -41.889339447021484, "global_step": 185602, "epoch": 1533} {"train_loss": -42.06878662109375, "global_step": 185603, "epoch": 1533} {"train_loss": -42.05323028564453, "global_step": 185604, "epoch": 1533} {"train_loss": -41.600460052490234, "global_step": 185605, "epoch": 1533} {"train_loss": -41.5091667175293, "global_step": 185606, "epoch": 1533} {"train_loss": -41.45941925048828, "global_step": 185607, "epoch": 1533} {"train_loss": -41.96303176879883, "global_step": 185608, "epoch": 1533} {"train_loss": -42.023067474365234, "global_step": 185609, "epoch": 1533} {"train_loss": -41.2756462097168, "global_step": 185610, "epoch": 1533} {"train_loss": -41.6537971496582, "global_step": 185611, "epoch": 1533} {"train_loss": -41.76064682006836, "global_step": 185612, "epoch": 1533} {"train_loss": -40.4231783654079, "global_step": 185613, "epoch": 1533, "val_loss": 2631252.75} {"train_loss": -41.983097076416016, "global_step": 185614, "epoch": 1534} {"train_loss": -42.23551940917969, "global_step": 185615, "epoch": 1534} {"train_loss": -42.02164840698242, "global_step": 185616, "epoch": 1534} {"train_loss": -41.97966384887695, "global_step": 185617, "epoch": 1534} {"train_loss": -41.13847732543945, "global_step": 185618, "epoch": 1534} {"train_loss": -41.47694778442383, "global_step": 185619, "epoch": 1534} {"train_loss": -41.9925422668457, "global_step": 185620, "epoch": 1534} {"train_loss": -41.84869384765625, "global_step": 185621, "epoch": 1534} {"train_loss": -41.47954177856445, "global_step": 185622, "epoch": 1534} {"train_loss": -41.12380599975586, "global_step": 185623, "epoch": 1534} {"train_loss": -41.584720611572266, "global_step": 185624, "epoch": 1534} {"train_loss": -41.92287826538086, "global_step": 185625, "epoch": 1534} {"train_loss": -41.47567367553711, "global_step": 185626, "epoch": 1534} {"train_loss": -41.85888671875, "global_step": 185627, "epoch": 1534} {"train_loss": -41.982818603515625, "global_step": 185628, "epoch": 1534} {"train_loss": -41.65559387207031, "global_step": 185629, "epoch": 1534} {"train_loss": -42.183006286621094, "global_step": 185630, "epoch": 1534} {"train_loss": -41.88764572143555, "global_step": 185631, "epoch": 1534} {"train_loss": -42.25935745239258, "global_step": 185632, "epoch": 1534} {"train_loss": -41.6649284362793, "global_step": 185633, "epoch": 1534} {"train_loss": -41.695228576660156, "global_step": 185634, "epoch": 1534} {"train_loss": -41.84721374511719, "global_step": 185635, "epoch": 1534} {"train_loss": -41.28559112548828, "global_step": 185636, "epoch": 1534} {"train_loss": -39.538368225097656, "global_step": 185637, "epoch": 1534} {"train_loss": -34.502418518066406, "global_step": 185638, "epoch": 1534} {"train_loss": -30.542133331298828, "global_step": 185639, "epoch": 1534} {"train_loss": -36.76599884033203, "global_step": 185640, "epoch": 1534} {"train_loss": -40.13842010498047, "global_step": 185641, "epoch": 1534} {"train_loss": -38.494842529296875, "global_step": 185642, "epoch": 1534} {"train_loss": -33.80636978149414, "global_step": 185643, "epoch": 1534} {"train_loss": -34.51123809814453, "global_step": 185644, "epoch": 1534} {"train_loss": -36.380348205566406, "global_step": 185645, "epoch": 1534} {"train_loss": -36.004302978515625, "global_step": 185646, "epoch": 1534} {"train_loss": -36.637020111083984, "global_step": 185647, "epoch": 1534} {"train_loss": -39.682186126708984, "global_step": 185648, "epoch": 1534} {"train_loss": -34.08207702636719, "global_step": 185649, "epoch": 1534} {"train_loss": -38.9356803894043, "global_step": 185650, "epoch": 1534} {"train_loss": -35.862056732177734, "global_step": 185651, "epoch": 1534} {"train_loss": -37.251190185546875, "global_step": 185652, "epoch": 1534} {"train_loss": -35.89621353149414, "global_step": 185653, "epoch": 1534} {"train_loss": -39.490718841552734, "global_step": 185654, "epoch": 1534} {"train_loss": -36.27119827270508, "global_step": 185655, "epoch": 1534} {"train_loss": -40.546138763427734, "global_step": 185656, "epoch": 1534} {"train_loss": -36.11538314819336, "global_step": 185657, "epoch": 1534} {"train_loss": -37.7404670715332, "global_step": 185658, "epoch": 1534} {"train_loss": -38.35361862182617, "global_step": 185659, "epoch": 1534} {"train_loss": -36.30227279663086, "global_step": 185660, "epoch": 1534} {"train_loss": -38.73342514038086, "global_step": 185661, "epoch": 1534} {"train_loss": -37.10782241821289, "global_step": 185662, "epoch": 1534} {"train_loss": -37.42133331298828, "global_step": 185663, "epoch": 1534} {"train_loss": -39.88066482543945, "global_step": 185664, "epoch": 1534} {"train_loss": -38.20117950439453, "global_step": 185665, "epoch": 1534} {"train_loss": -40.4368896484375, "global_step": 185666, "epoch": 1534} {"train_loss": -38.31604766845703, "global_step": 185667, "epoch": 1534} {"train_loss": -40.07938766479492, "global_step": 185668, "epoch": 1534} {"train_loss": -39.20565414428711, "global_step": 185669, "epoch": 1534} {"train_loss": -39.212371826171875, "global_step": 185670, "epoch": 1534} {"train_loss": -39.00554275512695, "global_step": 185671, "epoch": 1534} {"train_loss": -39.53466033935547, "global_step": 185672, "epoch": 1534} {"train_loss": -39.74675750732422, "global_step": 185673, "epoch": 1534} {"train_loss": -40.418575286865234, "global_step": 185674, "epoch": 1534} {"train_loss": -39.99139404296875, "global_step": 185675, "epoch": 1534} {"train_loss": -40.354400634765625, "global_step": 185676, "epoch": 1534} {"train_loss": -39.75913619995117, "global_step": 185677, "epoch": 1534} {"train_loss": -40.494754791259766, "global_step": 185678, "epoch": 1534} {"train_loss": -39.275394439697266, "global_step": 185679, "epoch": 1534} {"train_loss": -40.636165618896484, "global_step": 185680, "epoch": 1534} {"train_loss": -39.95168685913086, "global_step": 185681, "epoch": 1534} {"train_loss": -40.7674560546875, "global_step": 185682, "epoch": 1534} {"train_loss": -40.45183181762695, "global_step": 185683, "epoch": 1534} {"train_loss": -40.87163162231445, "global_step": 185684, "epoch": 1534} {"train_loss": -40.05848693847656, "global_step": 185685, "epoch": 1534} {"train_loss": -40.80744934082031, "global_step": 185686, "epoch": 1534} {"train_loss": -40.1771354675293, "global_step": 185687, "epoch": 1534} {"train_loss": -41.40018844604492, "global_step": 185688, "epoch": 1534} {"train_loss": -40.36410140991211, "global_step": 185689, "epoch": 1534} {"train_loss": -40.88843536376953, "global_step": 185690, "epoch": 1534} {"train_loss": -40.56265640258789, "global_step": 185691, "epoch": 1534} {"train_loss": -41.41438674926758, "global_step": 185692, "epoch": 1534} {"train_loss": -40.75685119628906, "global_step": 185693, "epoch": 1534} {"train_loss": -41.24277877807617, "global_step": 185694, "epoch": 1534} {"train_loss": -40.72504425048828, "global_step": 185695, "epoch": 1534} {"train_loss": -41.2537841796875, "global_step": 185696, "epoch": 1534} {"train_loss": -41.20864486694336, "global_step": 185697, "epoch": 1534} {"train_loss": -41.02333450317383, "global_step": 185698, "epoch": 1534} {"train_loss": -41.349910736083984, "global_step": 185699, "epoch": 1534} {"train_loss": -40.80858612060547, "global_step": 185700, "epoch": 1534} {"train_loss": -41.4291877746582, "global_step": 185701, "epoch": 1534} {"train_loss": -41.32064437866211, "global_step": 185702, "epoch": 1534} {"train_loss": -41.48086929321289, "global_step": 185703, "epoch": 1534} {"train_loss": -41.71611785888672, "global_step": 185704, "epoch": 1534} {"train_loss": -41.17170715332031, "global_step": 185705, "epoch": 1534} {"train_loss": -41.36171340942383, "global_step": 185706, "epoch": 1534} {"train_loss": -41.174591064453125, "global_step": 185707, "epoch": 1534} {"train_loss": -41.18107223510742, "global_step": 185708, "epoch": 1534} {"train_loss": -41.42848205566406, "global_step": 185709, "epoch": 1534} {"train_loss": -41.62337112426758, "global_step": 185710, "epoch": 1534} {"train_loss": -41.763763427734375, "global_step": 185711, "epoch": 1534} {"train_loss": -41.96534729003906, "global_step": 185712, "epoch": 1534} {"train_loss": -41.58338165283203, "global_step": 185713, "epoch": 1534} {"train_loss": -41.37115478515625, "global_step": 185714, "epoch": 1534} {"train_loss": -41.594993591308594, "global_step": 185715, "epoch": 1534} {"train_loss": -41.7032470703125, "global_step": 185716, "epoch": 1534} {"train_loss": -42.076717376708984, "global_step": 185717, "epoch": 1534} {"train_loss": -41.668949127197266, "global_step": 185718, "epoch": 1534} {"train_loss": -42.072486877441406, "global_step": 185719, "epoch": 1534} {"train_loss": -41.91991424560547, "global_step": 185720, "epoch": 1534} {"train_loss": -41.36968994140625, "global_step": 185721, "epoch": 1534} {"train_loss": -41.79845428466797, "global_step": 185722, "epoch": 1534} {"train_loss": -42.333377838134766, "global_step": 185723, "epoch": 1534} {"train_loss": -41.71559143066406, "global_step": 185724, "epoch": 1534} {"train_loss": -42.061981201171875, "global_step": 185725, "epoch": 1534} {"train_loss": -41.985958099365234, "global_step": 185726, "epoch": 1534} {"train_loss": -41.92496871948242, "global_step": 185727, "epoch": 1534} {"train_loss": -42.30599594116211, "global_step": 185728, "epoch": 1534} {"train_loss": -42.4409065246582, "global_step": 185729, "epoch": 1534} {"train_loss": -42.11400604248047, "global_step": 185730, "epoch": 1534} {"train_loss": -42.26932144165039, "global_step": 185731, "epoch": 1534} {"train_loss": -41.176326751708984, "global_step": 185732, "epoch": 1534} {"train_loss": -41.842681884765625, "global_step": 185733, "epoch": 1534} {"train_loss": -40.22768061614234, "global_step": 185734, "epoch": 1534, "val_loss": 2679744.0} {"train_loss": -42.034461975097656, "global_step": 185735, "epoch": 1535} {"train_loss": -41.82415008544922, "global_step": 185736, "epoch": 1535} {"train_loss": -42.141048431396484, "global_step": 185737, "epoch": 1535} {"train_loss": -42.261260986328125, "global_step": 185738, "epoch": 1535} {"train_loss": -40.89717483520508, "global_step": 185739, "epoch": 1535} {"train_loss": -41.50901412963867, "global_step": 185740, "epoch": 1535} {"train_loss": -41.437225341796875, "global_step": 185741, "epoch": 1535} {"train_loss": -41.77388381958008, "global_step": 185742, "epoch": 1535} {"train_loss": -42.54949188232422, "global_step": 185743, "epoch": 1535} {"train_loss": -41.72120666503906, "global_step": 185744, "epoch": 1535} {"train_loss": -40.790008544921875, "global_step": 185745, "epoch": 1535} {"train_loss": -41.45376205444336, "global_step": 185746, "epoch": 1535} {"train_loss": -41.24580383300781, "global_step": 185747, "epoch": 1535} {"train_loss": -42.16797637939453, "global_step": 185748, "epoch": 1535} {"train_loss": -41.50177001953125, "global_step": 185749, "epoch": 1535} {"train_loss": -41.28272247314453, "global_step": 185750, "epoch": 1535} {"train_loss": -41.71985626220703, "global_step": 185751, "epoch": 1535} {"train_loss": -41.51425552368164, "global_step": 185752, "epoch": 1535} {"train_loss": -41.31695556640625, "global_step": 185753, "epoch": 1535} {"train_loss": -41.7829475402832, "global_step": 185754, "epoch": 1535} {"train_loss": -40.415321350097656, "global_step": 185755, "epoch": 1535} {"train_loss": -40.7346305847168, "global_step": 185756, "epoch": 1535} {"train_loss": -41.67006301879883, "global_step": 185757, "epoch": 1535} {"train_loss": -41.94478988647461, "global_step": 185758, "epoch": 1535} {"train_loss": -42.04193878173828, "global_step": 185759, "epoch": 1535} {"train_loss": -42.36955261230469, "global_step": 185760, "epoch": 1535} {"train_loss": -41.77229309082031, "global_step": 185761, "epoch": 1535} {"train_loss": -41.25958251953125, "global_step": 185762, "epoch": 1535} {"train_loss": -41.35372543334961, "global_step": 185763, "epoch": 1535} {"train_loss": -41.467384338378906, "global_step": 185764, "epoch": 1535} {"train_loss": -42.090511322021484, "global_step": 185765, "epoch": 1535} {"train_loss": -41.759761810302734, "global_step": 185766, "epoch": 1535} {"train_loss": -41.868160247802734, "global_step": 185767, "epoch": 1535} {"train_loss": -41.209659576416016, "global_step": 185768, "epoch": 1535} {"train_loss": -41.09882736206055, "global_step": 185769, "epoch": 1535} {"train_loss": -38.76274871826172, "global_step": 185770, "epoch": 1535} {"train_loss": -41.831607818603516, "global_step": 185771, "epoch": 1535} {"train_loss": -41.6925048828125, "global_step": 185772, "epoch": 1535} {"train_loss": -37.890865325927734, "global_step": 185773, "epoch": 1535} {"train_loss": -37.91842269897461, "global_step": 185774, "epoch": 1535} {"train_loss": -37.9107780456543, "global_step": 185775, "epoch": 1535} {"train_loss": -39.081260681152344, "global_step": 185776, "epoch": 1535} {"train_loss": -40.764469146728516, "global_step": 185777, "epoch": 1535} {"train_loss": -40.27714157104492, "global_step": 185778, "epoch": 1535} {"train_loss": -39.980072021484375, "global_step": 185779, "epoch": 1535} {"train_loss": -29.123550415039062, "global_step": 185780, "epoch": 1535} {"train_loss": -36.71982955932617, "global_step": 185781, "epoch": 1535} {"train_loss": -36.968597412109375, "global_step": 185782, "epoch": 1535} {"train_loss": -37.4761848449707, "global_step": 185783, "epoch": 1535} {"train_loss": -30.714008331298828, "global_step": 185784, "epoch": 1535} {"train_loss": -38.568687438964844, "global_step": 185785, "epoch": 1535} {"train_loss": -36.8647575378418, "global_step": 185786, "epoch": 1535} {"train_loss": -32.60667037963867, "global_step": 185787, "epoch": 1535} {"train_loss": -35.48586654663086, "global_step": 185788, "epoch": 1535} {"train_loss": -32.37785720825195, "global_step": 185789, "epoch": 1535} {"train_loss": -34.23191452026367, "global_step": 185790, "epoch": 1535} {"train_loss": -33.09237289428711, "global_step": 185791, "epoch": 1535} {"train_loss": -29.166372299194336, "global_step": 185792, "epoch": 1535} {"train_loss": -32.414859771728516, "global_step": 185793, "epoch": 1535} {"train_loss": -32.45841979980469, "global_step": 185794, "epoch": 1535} {"train_loss": -34.014278411865234, "global_step": 185795, "epoch": 1535} {"train_loss": -35.69620895385742, "global_step": 185796, "epoch": 1535} {"train_loss": -34.247291564941406, "global_step": 185797, "epoch": 1535} {"train_loss": -28.785741806030273, "global_step": 185798, "epoch": 1535} {"train_loss": -35.893409729003906, "global_step": 185799, "epoch": 1535} {"train_loss": -36.67379379272461, "global_step": 185800, "epoch": 1535} {"train_loss": -35.535804748535156, "global_step": 185801, "epoch": 1535} {"train_loss": -36.27149963378906, "global_step": 185802, "epoch": 1535} {"train_loss": -35.98897933959961, "global_step": 185803, "epoch": 1535} {"train_loss": -35.5196533203125, "global_step": 185804, "epoch": 1535} {"train_loss": -33.90269088745117, "global_step": 185805, "epoch": 1535} {"train_loss": -34.302371978759766, "global_step": 185806, "epoch": 1535} {"train_loss": -37.79296875, "global_step": 185807, "epoch": 1535} {"train_loss": -36.47162628173828, "global_step": 185808, "epoch": 1535} {"train_loss": -38.04827880859375, "global_step": 185809, "epoch": 1535} {"train_loss": -38.549400329589844, "global_step": 185810, "epoch": 1535} {"train_loss": -36.532867431640625, "global_step": 185811, "epoch": 1535} {"train_loss": -37.43220901489258, "global_step": 185812, "epoch": 1535} {"train_loss": -34.53603744506836, "global_step": 185813, "epoch": 1535} {"train_loss": -36.94009017944336, "global_step": 185814, "epoch": 1535} {"train_loss": -37.67499542236328, "global_step": 185815, "epoch": 1535} {"train_loss": -36.233978271484375, "global_step": 185816, "epoch": 1535} {"train_loss": -38.5086669921875, "global_step": 185817, "epoch": 1535} {"train_loss": -37.92685317993164, "global_step": 185818, "epoch": 1535} {"train_loss": -38.497310638427734, "global_step": 185819, "epoch": 1535} {"train_loss": -35.07890701293945, "global_step": 185820, "epoch": 1535} {"train_loss": -38.404449462890625, "global_step": 185821, "epoch": 1535} {"train_loss": -37.51816940307617, "global_step": 185822, "epoch": 1535} {"train_loss": -38.2538948059082, "global_step": 185823, "epoch": 1535} {"train_loss": -38.10612487792969, "global_step": 185824, "epoch": 1535} {"train_loss": -37.27286148071289, "global_step": 185825, "epoch": 1535} {"train_loss": -38.348960876464844, "global_step": 185826, "epoch": 1535} {"train_loss": -38.924800872802734, "global_step": 185827, "epoch": 1535} {"train_loss": -38.543636322021484, "global_step": 185828, "epoch": 1535} {"train_loss": -38.716957092285156, "global_step": 185829, "epoch": 1535} {"train_loss": -39.09382629394531, "global_step": 185830, "epoch": 1535} {"train_loss": -37.824703216552734, "global_step": 185831, "epoch": 1535} {"train_loss": -39.11318588256836, "global_step": 185832, "epoch": 1535} {"train_loss": -39.08951950073242, "global_step": 185833, "epoch": 1535} {"train_loss": -38.16219711303711, "global_step": 185834, "epoch": 1535} {"train_loss": -38.42678451538086, "global_step": 185835, "epoch": 1535} {"train_loss": -38.660804748535156, "global_step": 185836, "epoch": 1535} {"train_loss": -39.22121810913086, "global_step": 185837, "epoch": 1535} {"train_loss": -38.6950798034668, "global_step": 185838, "epoch": 1535} {"train_loss": -39.47772979736328, "global_step": 185839, "epoch": 1535} {"train_loss": -39.29677200317383, "global_step": 185840, "epoch": 1535} {"train_loss": -39.28386306762695, "global_step": 185841, "epoch": 1535} {"train_loss": -39.21631622314453, "global_step": 185842, "epoch": 1535} {"train_loss": -39.331668853759766, "global_step": 185843, "epoch": 1535} {"train_loss": -39.528236389160156, "global_step": 185844, "epoch": 1535} {"train_loss": -39.25372314453125, "global_step": 185845, "epoch": 1535} {"train_loss": -39.83120346069336, "global_step": 185846, "epoch": 1535} {"train_loss": -39.70082473754883, "global_step": 185847, "epoch": 1535} {"train_loss": -39.81740188598633, "global_step": 185848, "epoch": 1535} {"train_loss": -39.93813705444336, "global_step": 185849, "epoch": 1535} {"train_loss": -40.46549606323242, "global_step": 185850, "epoch": 1535} {"train_loss": -40.337581634521484, "global_step": 185851, "epoch": 1535} {"train_loss": -39.088287353515625, "global_step": 185852, "epoch": 1535} {"train_loss": -40.46631622314453, "global_step": 185853, "epoch": 1535} {"train_loss": -40.51287841796875, "global_step": 185854, "epoch": 1535} {"train_loss": -38.55322070161173, "global_step": 185855, "epoch": 1535, "val_loss": 2602133.25} {"train_loss": -39.86214065551758, "global_step": 185856, "epoch": 1536} {"train_loss": -40.251258850097656, "global_step": 185857, "epoch": 1536} {"train_loss": -40.38911056518555, "global_step": 185858, "epoch": 1536} {"train_loss": -40.47779083251953, "global_step": 185859, "epoch": 1536} {"train_loss": -40.47258377075195, "global_step": 185860, "epoch": 1536} {"train_loss": -40.62830352783203, "global_step": 185861, "epoch": 1536} {"train_loss": -40.10844802856445, "global_step": 185862, "epoch": 1536} {"train_loss": -40.13432693481445, "global_step": 185863, "epoch": 1536} {"train_loss": -40.76408004760742, "global_step": 185864, "epoch": 1536} {"train_loss": -40.489356994628906, "global_step": 185865, "epoch": 1536} {"train_loss": -40.76102828979492, "global_step": 185866, "epoch": 1536} {"train_loss": -39.76276397705078, "global_step": 185867, "epoch": 1536} {"train_loss": -40.60563278198242, "global_step": 185868, "epoch": 1536} {"train_loss": -40.84685134887695, "global_step": 185869, "epoch": 1536} {"train_loss": -40.467254638671875, "global_step": 185870, "epoch": 1536} {"train_loss": -40.45489501953125, "global_step": 185871, "epoch": 1536} {"train_loss": -41.59321212768555, "global_step": 185872, "epoch": 1536} {"train_loss": -40.46601486206055, "global_step": 185873, "epoch": 1536} {"train_loss": -40.85974884033203, "global_step": 185874, "epoch": 1536} {"train_loss": -40.92936325073242, "global_step": 185875, "epoch": 1536} {"train_loss": -41.042728424072266, "global_step": 185876, "epoch": 1536} {"train_loss": -40.93475341796875, "global_step": 185877, "epoch": 1536} {"train_loss": -41.033321380615234, "global_step": 185878, "epoch": 1536} {"train_loss": -40.494873046875, "global_step": 185879, "epoch": 1536} {"train_loss": -40.47905349731445, "global_step": 185880, "epoch": 1536} {"train_loss": -40.71120071411133, "global_step": 185881, "epoch": 1536} {"train_loss": -41.0689697265625, "global_step": 185882, "epoch": 1536} {"train_loss": -40.859676361083984, "global_step": 185883, "epoch": 1536} {"train_loss": -40.87190628051758, "global_step": 185884, "epoch": 1536} {"train_loss": -40.72095489501953, "global_step": 185885, "epoch": 1536} {"train_loss": -41.22251510620117, "global_step": 185886, "epoch": 1536} {"train_loss": -41.16923904418945, "global_step": 185887, "epoch": 1536} {"train_loss": -40.7921028137207, "global_step": 185888, "epoch": 1536} {"train_loss": -41.3069953918457, "global_step": 185889, "epoch": 1536} {"train_loss": -41.06695556640625, "global_step": 185890, "epoch": 1536} {"train_loss": -41.08803176879883, "global_step": 185891, "epoch": 1536} {"train_loss": -41.26679229736328, "global_step": 185892, "epoch": 1536} {"train_loss": -41.31953048706055, "global_step": 185893, "epoch": 1536} {"train_loss": -40.99599838256836, "global_step": 185894, "epoch": 1536} {"train_loss": -41.25331497192383, "global_step": 185895, "epoch": 1536} {"train_loss": -41.3880729675293, "global_step": 185896, "epoch": 1536} {"train_loss": -41.14130783081055, "global_step": 185897, "epoch": 1536} {"train_loss": -41.472557067871094, "global_step": 185898, "epoch": 1536} {"train_loss": -41.08488082885742, "global_step": 185899, "epoch": 1536} {"train_loss": -41.410133361816406, "global_step": 185900, "epoch": 1536} {"train_loss": -41.61811447143555, "global_step": 185901, "epoch": 1536} {"train_loss": -41.598602294921875, "global_step": 185902, "epoch": 1536} {"train_loss": -41.41780471801758, "global_step": 185903, "epoch": 1536} {"train_loss": -41.494930267333984, "global_step": 185904, "epoch": 1536} {"train_loss": -41.62031936645508, "global_step": 185905, "epoch": 1536} {"train_loss": -41.294979095458984, "global_step": 185906, "epoch": 1536} {"train_loss": -41.36071014404297, "global_step": 185907, "epoch": 1536} {"train_loss": -41.311439514160156, "global_step": 185908, "epoch": 1536} {"train_loss": -41.291015625, "global_step": 185909, "epoch": 1536} {"train_loss": -39.69549560546875, "global_step": 185910, "epoch": 1536} {"train_loss": -41.06870651245117, "global_step": 185911, "epoch": 1536} {"train_loss": -40.39980697631836, "global_step": 185912, "epoch": 1536} {"train_loss": -40.14578628540039, "global_step": 185913, "epoch": 1536} {"train_loss": -40.14710235595703, "global_step": 185914, "epoch": 1536} {"train_loss": -39.96163558959961, "global_step": 185915, "epoch": 1536} {"train_loss": -39.04427719116211, "global_step": 185916, "epoch": 1536} {"train_loss": -40.79392623901367, "global_step": 185917, "epoch": 1536} {"train_loss": -38.41551208496094, "global_step": 185918, "epoch": 1536} {"train_loss": -38.72612762451172, "global_step": 185919, "epoch": 1536} {"train_loss": -40.826900482177734, "global_step": 185920, "epoch": 1536} {"train_loss": -39.84668731689453, "global_step": 185921, "epoch": 1536} {"train_loss": -40.9014778137207, "global_step": 185922, "epoch": 1536} {"train_loss": -39.79220199584961, "global_step": 185923, "epoch": 1536} {"train_loss": -39.8428840637207, "global_step": 185924, "epoch": 1536} {"train_loss": -41.34798812866211, "global_step": 185925, "epoch": 1536} {"train_loss": -41.12504196166992, "global_step": 185926, "epoch": 1536} {"train_loss": -41.40666580200195, "global_step": 185927, "epoch": 1536} {"train_loss": -40.71968460083008, "global_step": 185928, "epoch": 1536} {"train_loss": -38.954219818115234, "global_step": 185929, "epoch": 1536} {"train_loss": -36.3892707824707, "global_step": 185930, "epoch": 1536} {"train_loss": -38.4940185546875, "global_step": 185931, "epoch": 1536} {"train_loss": -40.04194259643555, "global_step": 185932, "epoch": 1536} {"train_loss": -37.619483947753906, "global_step": 185933, "epoch": 1536} {"train_loss": -35.196956634521484, "global_step": 185934, "epoch": 1536} {"train_loss": -38.25175094604492, "global_step": 185935, "epoch": 1536} {"train_loss": -39.922306060791016, "global_step": 185936, "epoch": 1536} {"train_loss": -39.826995849609375, "global_step": 185937, "epoch": 1536} {"train_loss": -38.5593376159668, "global_step": 185938, "epoch": 1536} {"train_loss": -40.17387771606445, "global_step": 185939, "epoch": 1536} {"train_loss": -40.5389404296875, "global_step": 185940, "epoch": 1536} {"train_loss": -37.287960052490234, "global_step": 185941, "epoch": 1536} {"train_loss": -38.18751525878906, "global_step": 185942, "epoch": 1536} {"train_loss": -40.594024658203125, "global_step": 185943, "epoch": 1536} {"train_loss": -39.0601921081543, "global_step": 185944, "epoch": 1536} {"train_loss": -38.29305648803711, "global_step": 185945, "epoch": 1536} {"train_loss": -41.21440505981445, "global_step": 185946, "epoch": 1536} {"train_loss": -38.597755432128906, "global_step": 185947, "epoch": 1536} {"train_loss": -39.227500915527344, "global_step": 185948, "epoch": 1536} {"train_loss": -40.49274826049805, "global_step": 185949, "epoch": 1536} {"train_loss": -37.766998291015625, "global_step": 185950, "epoch": 1536} {"train_loss": -40.72254180908203, "global_step": 185951, "epoch": 1536} {"train_loss": -39.35530471801758, "global_step": 185952, "epoch": 1536} {"train_loss": -38.60026168823242, "global_step": 185953, "epoch": 1536} {"train_loss": -39.81028366088867, "global_step": 185954, "epoch": 1536} {"train_loss": -39.264404296875, "global_step": 185955, "epoch": 1536} {"train_loss": -39.32648849487305, "global_step": 185956, "epoch": 1536} {"train_loss": -39.28731918334961, "global_step": 185957, "epoch": 1536} {"train_loss": -36.928157806396484, "global_step": 185958, "epoch": 1536} {"train_loss": -39.878929138183594, "global_step": 185959, "epoch": 1536} {"train_loss": -35.093563079833984, "global_step": 185960, "epoch": 1536} {"train_loss": -37.08558654785156, "global_step": 185961, "epoch": 1536} {"train_loss": -37.14286422729492, "global_step": 185962, "epoch": 1536} {"train_loss": -38.90989303588867, "global_step": 185963, "epoch": 1536} {"train_loss": -38.77911376953125, "global_step": 185964, "epoch": 1536} {"train_loss": -38.88942337036133, "global_step": 185965, "epoch": 1536} {"train_loss": -39.82465744018555, "global_step": 185966, "epoch": 1536} {"train_loss": -39.25811004638672, "global_step": 185967, "epoch": 1536} {"train_loss": -39.20499801635742, "global_step": 185968, "epoch": 1536} {"train_loss": -38.477508544921875, "global_step": 185969, "epoch": 1536} {"train_loss": -40.04850387573242, "global_step": 185970, "epoch": 1536} {"train_loss": -40.127742767333984, "global_step": 185971, "epoch": 1536} {"train_loss": -39.3277702331543, "global_step": 185972, "epoch": 1536} {"train_loss": -39.192710876464844, "global_step": 185973, "epoch": 1536} {"train_loss": -40.18442916870117, "global_step": 185974, "epoch": 1536} {"train_loss": -39.707027435302734, "global_step": 185975, "epoch": 1536} {"train_loss": -40.02648569532662, "global_step": 185976, "epoch": 1536, "val_loss": 2614996.5} {"train_loss": -40.51829147338867, "global_step": 185977, "epoch": 1537} {"train_loss": -40.747467041015625, "global_step": 185978, "epoch": 1537} {"train_loss": -36.641387939453125, "global_step": 185979, "epoch": 1537} {"train_loss": -39.9107780456543, "global_step": 185980, "epoch": 1537} {"train_loss": -40.53972244262695, "global_step": 185981, "epoch": 1537} {"train_loss": -40.67406463623047, "global_step": 185982, "epoch": 1537} {"train_loss": -40.36135482788086, "global_step": 185983, "epoch": 1537} {"train_loss": -40.75375747680664, "global_step": 185984, "epoch": 1537} {"train_loss": -40.941871643066406, "global_step": 185985, "epoch": 1537} {"train_loss": -40.88654327392578, "global_step": 185986, "epoch": 1537} {"train_loss": -41.32012939453125, "global_step": 185987, "epoch": 1537} {"train_loss": -41.12104034423828, "global_step": 185988, "epoch": 1537} {"train_loss": -38.13295364379883, "global_step": 185989, "epoch": 1537} {"train_loss": -40.85365676879883, "global_step": 185990, "epoch": 1537} {"train_loss": -40.89691925048828, "global_step": 185991, "epoch": 1537} {"train_loss": -40.786346435546875, "global_step": 185992, "epoch": 1537} {"train_loss": -41.26032638549805, "global_step": 185993, "epoch": 1537} {"train_loss": -40.62168502807617, "global_step": 185994, "epoch": 1537} {"train_loss": -41.5697021484375, "global_step": 185995, "epoch": 1537} {"train_loss": -41.06472396850586, "global_step": 185996, "epoch": 1537} {"train_loss": -41.20981979370117, "global_step": 185997, "epoch": 1537} {"train_loss": -41.05257797241211, "global_step": 185998, "epoch": 1537} {"train_loss": -41.19266891479492, "global_step": 185999, "epoch": 1537} {"train_loss": -41.228973388671875, "global_step": 186000, "epoch": 1537} {"train_loss": -39.42422103881836, "global_step": 186001, "epoch": 1537} {"train_loss": -41.073211669921875, "global_step": 186002, "epoch": 1537} {"train_loss": -41.69375228881836, "global_step": 186003, "epoch": 1537} {"train_loss": -41.49834060668945, "global_step": 186004, "epoch": 1537} {"train_loss": -40.581478118896484, "global_step": 186005, "epoch": 1537} {"train_loss": -41.38471221923828, "global_step": 186006, "epoch": 1537} {"train_loss": -40.803768157958984, "global_step": 186007, "epoch": 1537} {"train_loss": -41.58687973022461, "global_step": 186008, "epoch": 1537} {"train_loss": -41.13465118408203, "global_step": 186009, "epoch": 1537} {"train_loss": -41.05538558959961, "global_step": 186010, "epoch": 1537} {"train_loss": -41.47233963012695, "global_step": 186011, "epoch": 1537} {"train_loss": -41.103389739990234, "global_step": 186012, "epoch": 1537} {"train_loss": -41.27760314941406, "global_step": 186013, "epoch": 1537} {"train_loss": -41.27752685546875, "global_step": 186014, "epoch": 1537} {"train_loss": -40.58956527709961, "global_step": 186015, "epoch": 1537} {"train_loss": -41.48627853393555, "global_step": 186016, "epoch": 1537} {"train_loss": -40.97343444824219, "global_step": 186017, "epoch": 1537} {"train_loss": -41.62399673461914, "global_step": 186018, "epoch": 1537} {"train_loss": -41.5276985168457, "global_step": 186019, "epoch": 1537} {"train_loss": -40.67775344848633, "global_step": 186020, "epoch": 1537} {"train_loss": -40.8668327331543, "global_step": 186021, "epoch": 1537} {"train_loss": -41.79063034057617, "global_step": 186022, "epoch": 1537} {"train_loss": -40.40968704223633, "global_step": 186023, "epoch": 1537} {"train_loss": -41.469635009765625, "global_step": 186024, "epoch": 1537} {"train_loss": -41.281558990478516, "global_step": 186025, "epoch": 1537} {"train_loss": -40.996639251708984, "global_step": 186026, "epoch": 1537} {"train_loss": -41.60642623901367, "global_step": 186027, "epoch": 1537} {"train_loss": -41.63950729370117, "global_step": 186028, "epoch": 1537} {"train_loss": -40.459266662597656, "global_step": 186029, "epoch": 1537} {"train_loss": -41.1640510559082, "global_step": 186030, "epoch": 1537} {"train_loss": -41.32236862182617, "global_step": 186031, "epoch": 1537} {"train_loss": -41.0980110168457, "global_step": 186032, "epoch": 1537} {"train_loss": -41.801692962646484, "global_step": 186033, "epoch": 1537} {"train_loss": -41.558162689208984, "global_step": 186034, "epoch": 1537} {"train_loss": -41.58345413208008, "global_step": 186035, "epoch": 1537} {"train_loss": -41.38899230957031, "global_step": 186036, "epoch": 1537} {"train_loss": -42.09729766845703, "global_step": 186037, "epoch": 1537} {"train_loss": -42.080352783203125, "global_step": 186038, "epoch": 1537} {"train_loss": -41.5661735534668, "global_step": 186039, "epoch": 1537} {"train_loss": -41.06219482421875, "global_step": 186040, "epoch": 1537} {"train_loss": -42.1136589050293, "global_step": 186041, "epoch": 1537} {"train_loss": -41.44374465942383, "global_step": 186042, "epoch": 1537} {"train_loss": -42.07027816772461, "global_step": 186043, "epoch": 1537} {"train_loss": -41.7455940246582, "global_step": 186044, "epoch": 1537} {"train_loss": -42.047096252441406, "global_step": 186045, "epoch": 1537} {"train_loss": -41.11103057861328, "global_step": 186046, "epoch": 1537} {"train_loss": -42.0593376159668, "global_step": 186047, "epoch": 1537} {"train_loss": -41.92170333862305, "global_step": 186048, "epoch": 1537} {"train_loss": -42.1629638671875, "global_step": 186049, "epoch": 1537} {"train_loss": -41.367733001708984, "global_step": 186050, "epoch": 1537} {"train_loss": -41.52153396606445, "global_step": 186051, "epoch": 1537} {"train_loss": -41.347686767578125, "global_step": 186052, "epoch": 1537} {"train_loss": -40.668006896972656, "global_step": 186053, "epoch": 1537} {"train_loss": -41.24829864501953, "global_step": 186054, "epoch": 1537} {"train_loss": -41.6237907409668, "global_step": 186055, "epoch": 1537} {"train_loss": -40.94966506958008, "global_step": 186056, "epoch": 1537} {"train_loss": -40.4645881652832, "global_step": 186057, "epoch": 1537} {"train_loss": -41.45151901245117, "global_step": 186058, "epoch": 1537} {"train_loss": -41.02659225463867, "global_step": 186059, "epoch": 1537} {"train_loss": -40.87126541137695, "global_step": 186060, "epoch": 1537} {"train_loss": -41.92991638183594, "global_step": 186061, "epoch": 1537} {"train_loss": -42.00216293334961, "global_step": 186062, "epoch": 1537} {"train_loss": -39.79950714111328, "global_step": 186063, "epoch": 1537} {"train_loss": -39.46674346923828, "global_step": 186064, "epoch": 1537} {"train_loss": -39.715335845947266, "global_step": 186065, "epoch": 1537} {"train_loss": -37.18959045410156, "global_step": 186066, "epoch": 1537} {"train_loss": -33.62929153442383, "global_step": 186067, "epoch": 1537} {"train_loss": -32.353416442871094, "global_step": 186068, "epoch": 1537} {"train_loss": -31.894041061401367, "global_step": 186069, "epoch": 1537} {"train_loss": -38.00571823120117, "global_step": 186070, "epoch": 1537} {"train_loss": -41.55170822143555, "global_step": 186071, "epoch": 1537} {"train_loss": -39.839473724365234, "global_step": 186072, "epoch": 1537} {"train_loss": -38.356258392333984, "global_step": 186073, "epoch": 1537} {"train_loss": -39.35979080200195, "global_step": 186074, "epoch": 1537} {"train_loss": -41.12508773803711, "global_step": 186075, "epoch": 1537} {"train_loss": -39.83831787109375, "global_step": 186076, "epoch": 1537} {"train_loss": -40.0477409362793, "global_step": 186077, "epoch": 1537} {"train_loss": -40.72993087768555, "global_step": 186078, "epoch": 1537} {"train_loss": -40.44167709350586, "global_step": 186079, "epoch": 1537} {"train_loss": -39.24066162109375, "global_step": 186080, "epoch": 1537} {"train_loss": -40.69243240356445, "global_step": 186081, "epoch": 1537} {"train_loss": -39.37152099609375, "global_step": 186082, "epoch": 1537} {"train_loss": -40.32804489135742, "global_step": 186083, "epoch": 1537} {"train_loss": -41.05698776245117, "global_step": 186084, "epoch": 1537} {"train_loss": -40.76477813720703, "global_step": 186085, "epoch": 1537} {"train_loss": -41.03943634033203, "global_step": 186086, "epoch": 1537} {"train_loss": -40.77712631225586, "global_step": 186087, "epoch": 1537} {"train_loss": -39.0717658996582, "global_step": 186088, "epoch": 1537} {"train_loss": -41.50952911376953, "global_step": 186089, "epoch": 1537} {"train_loss": -40.26848220825195, "global_step": 186090, "epoch": 1537} {"train_loss": -40.74079513549805, "global_step": 186091, "epoch": 1537} {"train_loss": -40.76933670043945, "global_step": 186092, "epoch": 1537} {"train_loss": -40.05231475830078, "global_step": 186093, "epoch": 1537} {"train_loss": -39.18387985229492, "global_step": 186094, "epoch": 1537} {"train_loss": -40.377906799316406, "global_step": 186095, "epoch": 1537} {"train_loss": -40.82590866088867, "global_step": 186096, "epoch": 1537} {"train_loss": -40.63885253717091, "global_step": 186097, "epoch": 1537, "val_loss": 2601282.75} {"train_loss": -40.81167221069336, "global_step": 186098, "epoch": 1538} {"train_loss": -41.4089241027832, "global_step": 186099, "epoch": 1538} {"train_loss": -41.26370620727539, "global_step": 186100, "epoch": 1538} {"train_loss": -41.09706497192383, "global_step": 186101, "epoch": 1538} {"train_loss": -41.3561897277832, "global_step": 186102, "epoch": 1538} {"train_loss": -41.20890426635742, "global_step": 186103, "epoch": 1538} {"train_loss": -42.097164154052734, "global_step": 186104, "epoch": 1538} {"train_loss": -40.9200553894043, "global_step": 186105, "epoch": 1538} {"train_loss": -41.634490966796875, "global_step": 186106, "epoch": 1538} {"train_loss": -41.679534912109375, "global_step": 186107, "epoch": 1538} {"train_loss": -40.973934173583984, "global_step": 186108, "epoch": 1538} {"train_loss": -41.85517120361328, "global_step": 186109, "epoch": 1538} {"train_loss": -41.598785400390625, "global_step": 186110, "epoch": 1538} {"train_loss": -41.97514724731445, "global_step": 186111, "epoch": 1538} {"train_loss": -41.5048713684082, "global_step": 186112, "epoch": 1538} {"train_loss": -41.61796569824219, "global_step": 186113, "epoch": 1538} {"train_loss": -41.971805572509766, "global_step": 186114, "epoch": 1538} {"train_loss": -41.25575637817383, "global_step": 186115, "epoch": 1538} {"train_loss": -42.30475997924805, "global_step": 186116, "epoch": 1538} {"train_loss": -41.895477294921875, "global_step": 186117, "epoch": 1538} {"train_loss": -41.58663558959961, "global_step": 186118, "epoch": 1538} {"train_loss": -42.186580657958984, "global_step": 186119, "epoch": 1538} {"train_loss": -42.317626953125, "global_step": 186120, "epoch": 1538} {"train_loss": -42.07140350341797, "global_step": 186121, "epoch": 1538} {"train_loss": -41.93305206298828, "global_step": 186122, "epoch": 1538} {"train_loss": -42.531105041503906, "global_step": 186123, "epoch": 1538} {"train_loss": -42.191627502441406, "global_step": 186124, "epoch": 1538} {"train_loss": -42.02839279174805, "global_step": 186125, "epoch": 1538} {"train_loss": -42.12476348876953, "global_step": 186126, "epoch": 1538} {"train_loss": -42.24702072143555, "global_step": 186127, "epoch": 1538} {"train_loss": -42.275390625, "global_step": 186128, "epoch": 1538} {"train_loss": -42.39272689819336, "global_step": 186129, "epoch": 1538} {"train_loss": -42.588558197021484, "global_step": 186130, "epoch": 1538} {"train_loss": -41.73044204711914, "global_step": 186131, "epoch": 1538} {"train_loss": -42.58003616333008, "global_step": 186132, "epoch": 1538} {"train_loss": -42.087520599365234, "global_step": 186133, "epoch": 1538} {"train_loss": -39.65353012084961, "global_step": 186134, "epoch": 1538} {"train_loss": -42.15538024902344, "global_step": 186135, "epoch": 1538} {"train_loss": -40.2813835144043, "global_step": 186136, "epoch": 1538} {"train_loss": -41.9734992980957, "global_step": 186137, "epoch": 1538} {"train_loss": -42.01987838745117, "global_step": 186138, "epoch": 1538} {"train_loss": -41.8008918762207, "global_step": 186139, "epoch": 1538} {"train_loss": -42.16646194458008, "global_step": 186140, "epoch": 1538} {"train_loss": -41.747352600097656, "global_step": 186141, "epoch": 1538} {"train_loss": -42.271636962890625, "global_step": 186142, "epoch": 1538} {"train_loss": -41.945247650146484, "global_step": 186143, "epoch": 1538} {"train_loss": -40.60824203491211, "global_step": 186144, "epoch": 1538} {"train_loss": -40.48507308959961, "global_step": 186145, "epoch": 1538} {"train_loss": -41.87459945678711, "global_step": 186146, "epoch": 1538} {"train_loss": -41.99851608276367, "global_step": 186147, "epoch": 1538} {"train_loss": -41.53071975708008, "global_step": 186148, "epoch": 1538} {"train_loss": -40.994136810302734, "global_step": 186149, "epoch": 1538} {"train_loss": -41.41249465942383, "global_step": 186150, "epoch": 1538} {"train_loss": -41.19031524658203, "global_step": 186151, "epoch": 1538} {"train_loss": -40.76970672607422, "global_step": 186152, "epoch": 1538} {"train_loss": -40.848995208740234, "global_step": 186153, "epoch": 1538} {"train_loss": -36.0352783203125, "global_step": 186154, "epoch": 1538} {"train_loss": -37.6002311706543, "global_step": 186155, "epoch": 1538} {"train_loss": -41.417694091796875, "global_step": 186156, "epoch": 1538} {"train_loss": -38.96730422973633, "global_step": 186157, "epoch": 1538} {"train_loss": -38.03253936767578, "global_step": 186158, "epoch": 1538} {"train_loss": -40.46770477294922, "global_step": 186159, "epoch": 1538} {"train_loss": -40.71781539916992, "global_step": 186160, "epoch": 1538} {"train_loss": -41.02460479736328, "global_step": 186161, "epoch": 1538} {"train_loss": -36.40517807006836, "global_step": 186162, "epoch": 1538} {"train_loss": -38.182106018066406, "global_step": 186163, "epoch": 1538} {"train_loss": -40.6701545715332, "global_step": 186164, "epoch": 1538} {"train_loss": -40.15161895751953, "global_step": 186165, "epoch": 1538} {"train_loss": -39.22725296020508, "global_step": 186166, "epoch": 1538} {"train_loss": -39.626468658447266, "global_step": 186167, "epoch": 1538} {"train_loss": -39.157161712646484, "global_step": 186168, "epoch": 1538} {"train_loss": -39.4167594909668, "global_step": 186169, "epoch": 1538} {"train_loss": -39.67485427856445, "global_step": 186170, "epoch": 1538} {"train_loss": -40.608131408691406, "global_step": 186171, "epoch": 1538} {"train_loss": -40.609928131103516, "global_step": 186172, "epoch": 1538} {"train_loss": -39.46814727783203, "global_step": 186173, "epoch": 1538} {"train_loss": -38.92922592163086, "global_step": 186174, "epoch": 1538} {"train_loss": -37.35472106933594, "global_step": 186175, "epoch": 1538} {"train_loss": -40.85503387451172, "global_step": 186176, "epoch": 1538} {"train_loss": -39.97524642944336, "global_step": 186177, "epoch": 1538} {"train_loss": -38.581275939941406, "global_step": 186178, "epoch": 1538} {"train_loss": -40.25410461425781, "global_step": 186179, "epoch": 1538} {"train_loss": -40.17667770385742, "global_step": 186180, "epoch": 1538} {"train_loss": -37.62461471557617, "global_step": 186181, "epoch": 1538} {"train_loss": -40.26580047607422, "global_step": 186182, "epoch": 1538} {"train_loss": -39.08058547973633, "global_step": 186183, "epoch": 1538} {"train_loss": -37.95835494995117, "global_step": 186184, "epoch": 1538} {"train_loss": -37.64473342895508, "global_step": 186185, "epoch": 1538} {"train_loss": -39.68143844604492, "global_step": 186186, "epoch": 1538} {"train_loss": -37.4032096862793, "global_step": 186187, "epoch": 1538} {"train_loss": -39.92873001098633, "global_step": 186188, "epoch": 1538} {"train_loss": -39.99605941772461, "global_step": 186189, "epoch": 1538} {"train_loss": -40.07207107543945, "global_step": 186190, "epoch": 1538} {"train_loss": -39.997901916503906, "global_step": 186191, "epoch": 1538} {"train_loss": -40.88900375366211, "global_step": 186192, "epoch": 1538} {"train_loss": -39.158172607421875, "global_step": 186193, "epoch": 1538} {"train_loss": -40.68269729614258, "global_step": 186194, "epoch": 1538} {"train_loss": -40.73067855834961, "global_step": 186195, "epoch": 1538} {"train_loss": -38.18807601928711, "global_step": 186196, "epoch": 1538} {"train_loss": -40.041927337646484, "global_step": 186197, "epoch": 1538} {"train_loss": -39.96183395385742, "global_step": 186198, "epoch": 1538} {"train_loss": -39.30837631225586, "global_step": 186199, "epoch": 1538} {"train_loss": -40.2528076171875, "global_step": 186200, "epoch": 1538} {"train_loss": -40.1489372253418, "global_step": 186201, "epoch": 1538} {"train_loss": -41.013973236083984, "global_step": 186202, "epoch": 1538} {"train_loss": -40.652801513671875, "global_step": 186203, "epoch": 1538} {"train_loss": -39.417537689208984, "global_step": 186204, "epoch": 1538} {"train_loss": -36.65976333618164, "global_step": 186205, "epoch": 1538} {"train_loss": -39.63154220581055, "global_step": 186206, "epoch": 1538} {"train_loss": -39.951473236083984, "global_step": 186207, "epoch": 1538} {"train_loss": -40.371212005615234, "global_step": 186208, "epoch": 1538} {"train_loss": -39.942501068115234, "global_step": 186209, "epoch": 1538} {"train_loss": -40.04624557495117, "global_step": 186210, "epoch": 1538} {"train_loss": -41.44434356689453, "global_step": 186211, "epoch": 1538} {"train_loss": -39.226131439208984, "global_step": 186212, "epoch": 1538} {"train_loss": -41.27104187011719, "global_step": 186213, "epoch": 1538} {"train_loss": -41.04435729980469, "global_step": 186214, "epoch": 1538} {"train_loss": -41.553871154785156, "global_step": 186215, "epoch": 1538} {"train_loss": -38.768463134765625, "global_step": 186216, "epoch": 1538} {"train_loss": -40.32381057739258, "global_step": 186217, "epoch": 1538} {"train_loss": -40.56259426400681, "global_step": 186218, "epoch": 1538, "val_loss": 2685995.75} {"train_loss": -39.4755973815918, "global_step": 186219, "epoch": 1539} {"train_loss": -39.63398742675781, "global_step": 186220, "epoch": 1539} {"train_loss": -40.75741958618164, "global_step": 186221, "epoch": 1539} {"train_loss": -40.82137680053711, "global_step": 186222, "epoch": 1539} {"train_loss": -40.778045654296875, "global_step": 186223, "epoch": 1539} {"train_loss": -39.3477668762207, "global_step": 186224, "epoch": 1539} {"train_loss": -40.00333023071289, "global_step": 186225, "epoch": 1539} {"train_loss": -41.36193084716797, "global_step": 186226, "epoch": 1539} {"train_loss": -41.116085052490234, "global_step": 186227, "epoch": 1539} {"train_loss": -41.4747314453125, "global_step": 186228, "epoch": 1539} {"train_loss": -39.10428237915039, "global_step": 186229, "epoch": 1539} {"train_loss": -40.80070877075195, "global_step": 186230, "epoch": 1539} {"train_loss": -36.644893646240234, "global_step": 186231, "epoch": 1539} {"train_loss": -40.80845260620117, "global_step": 186232, "epoch": 1539} {"train_loss": -40.28898620605469, "global_step": 186233, "epoch": 1539} {"train_loss": -40.4359016418457, "global_step": 186234, "epoch": 1539} {"train_loss": -41.419708251953125, "global_step": 186235, "epoch": 1539} {"train_loss": -39.526466369628906, "global_step": 186236, "epoch": 1539} {"train_loss": -40.90535354614258, "global_step": 186237, "epoch": 1539} {"train_loss": -39.80168151855469, "global_step": 186238, "epoch": 1539} {"train_loss": -41.69720458984375, "global_step": 186239, "epoch": 1539} {"train_loss": -40.97471237182617, "global_step": 186240, "epoch": 1539} {"train_loss": -40.93574142456055, "global_step": 186241, "epoch": 1539} {"train_loss": -40.62129592895508, "global_step": 186242, "epoch": 1539} {"train_loss": -40.325416564941406, "global_step": 186243, "epoch": 1539} {"train_loss": -42.22493362426758, "global_step": 186244, "epoch": 1539} {"train_loss": -41.352783203125, "global_step": 186245, "epoch": 1539} {"train_loss": -38.5535888671875, "global_step": 186246, "epoch": 1539} {"train_loss": -41.17378234863281, "global_step": 186247, "epoch": 1539} {"train_loss": -40.7187385559082, "global_step": 186248, "epoch": 1539} {"train_loss": -41.68010330200195, "global_step": 186249, "epoch": 1539} {"train_loss": -41.86836624145508, "global_step": 186250, "epoch": 1539} {"train_loss": -41.41830062866211, "global_step": 186251, "epoch": 1539} {"train_loss": -41.958045959472656, "global_step": 186252, "epoch": 1539} {"train_loss": -40.2554817199707, "global_step": 186253, "epoch": 1539} {"train_loss": -41.81546401977539, "global_step": 186254, "epoch": 1539} {"train_loss": -41.727779388427734, "global_step": 186255, "epoch": 1539} {"train_loss": -41.516719818115234, "global_step": 186256, "epoch": 1539} {"train_loss": -41.71596908569336, "global_step": 186257, "epoch": 1539} {"train_loss": -41.89348220825195, "global_step": 186258, "epoch": 1539} {"train_loss": -41.80910110473633, "global_step": 186259, "epoch": 1539} {"train_loss": -41.66992950439453, "global_step": 186260, "epoch": 1539} {"train_loss": -41.917083740234375, "global_step": 186261, "epoch": 1539} {"train_loss": -41.89077377319336, "global_step": 186262, "epoch": 1539} {"train_loss": -40.3082275390625, "global_step": 186263, "epoch": 1539} {"train_loss": -40.761287689208984, "global_step": 186264, "epoch": 1539} {"train_loss": -41.84095001220703, "global_step": 186265, "epoch": 1539} {"train_loss": -41.34381103515625, "global_step": 186266, "epoch": 1539} {"train_loss": -41.21728515625, "global_step": 186267, "epoch": 1539} {"train_loss": -42.09374237060547, "global_step": 186268, "epoch": 1539} {"train_loss": -41.0324821472168, "global_step": 186269, "epoch": 1539} {"train_loss": -41.14033889770508, "global_step": 186270, "epoch": 1539} {"train_loss": -41.420711517333984, "global_step": 186271, "epoch": 1539} {"train_loss": -42.22991943359375, "global_step": 186272, "epoch": 1539} {"train_loss": -39.9832649230957, "global_step": 186273, "epoch": 1539} {"train_loss": -40.749629974365234, "global_step": 186274, "epoch": 1539} {"train_loss": -41.60612106323242, "global_step": 186275, "epoch": 1539} {"train_loss": -41.85932540893555, "global_step": 186276, "epoch": 1539} {"train_loss": -40.80078125, "global_step": 186277, "epoch": 1539} {"train_loss": -38.87358093261719, "global_step": 186278, "epoch": 1539} {"train_loss": -39.04336929321289, "global_step": 186279, "epoch": 1539} {"train_loss": -39.168338775634766, "global_step": 186280, "epoch": 1539} {"train_loss": -38.97257614135742, "global_step": 186281, "epoch": 1539} {"train_loss": -41.67252731323242, "global_step": 186282, "epoch": 1539} {"train_loss": -39.69682312011719, "global_step": 186283, "epoch": 1539} {"train_loss": -39.26424789428711, "global_step": 186284, "epoch": 1539} {"train_loss": -40.9136962890625, "global_step": 186285, "epoch": 1539} {"train_loss": -41.46894073486328, "global_step": 186286, "epoch": 1539} {"train_loss": -41.278900146484375, "global_step": 186287, "epoch": 1539} {"train_loss": -39.43016815185547, "global_step": 186288, "epoch": 1539} {"train_loss": -37.3640251159668, "global_step": 186289, "epoch": 1539} {"train_loss": -41.55630111694336, "global_step": 186290, "epoch": 1539} {"train_loss": -41.03208541870117, "global_step": 186291, "epoch": 1539} {"train_loss": -40.59968948364258, "global_step": 186292, "epoch": 1539} {"train_loss": -40.819007873535156, "global_step": 186293, "epoch": 1539} {"train_loss": -41.197914123535156, "global_step": 186294, "epoch": 1539} {"train_loss": -39.970314025878906, "global_step": 186295, "epoch": 1539} {"train_loss": -39.548824310302734, "global_step": 186296, "epoch": 1539} {"train_loss": -40.9702262878418, "global_step": 186297, "epoch": 1539} {"train_loss": -39.8917121887207, "global_step": 186298, "epoch": 1539} {"train_loss": -40.20001220703125, "global_step": 186299, "epoch": 1539} {"train_loss": -40.93349838256836, "global_step": 186300, "epoch": 1539} {"train_loss": -37.75788497924805, "global_step": 186301, "epoch": 1539} {"train_loss": -39.271175384521484, "global_step": 186302, "epoch": 1539} {"train_loss": -40.3209114074707, "global_step": 186303, "epoch": 1539} {"train_loss": -40.64638900756836, "global_step": 186304, "epoch": 1539} {"train_loss": -36.20137023925781, "global_step": 186305, "epoch": 1539} {"train_loss": -38.212608337402344, "global_step": 186306, "epoch": 1539} {"train_loss": -39.6722297668457, "global_step": 186307, "epoch": 1539} {"train_loss": -38.58430480957031, "global_step": 186308, "epoch": 1539} {"train_loss": -39.1473274230957, "global_step": 186309, "epoch": 1539} {"train_loss": -39.44172286987305, "global_step": 186310, "epoch": 1539} {"train_loss": -39.4013671875, "global_step": 186311, "epoch": 1539} {"train_loss": -38.38051986694336, "global_step": 186312, "epoch": 1539} {"train_loss": -39.33107376098633, "global_step": 186313, "epoch": 1539} {"train_loss": -37.395545959472656, "global_step": 186314, "epoch": 1539} {"train_loss": -40.27212905883789, "global_step": 186315, "epoch": 1539} {"train_loss": -40.259239196777344, "global_step": 186316, "epoch": 1539} {"train_loss": -40.05668258666992, "global_step": 186317, "epoch": 1539} {"train_loss": -40.51633071899414, "global_step": 186318, "epoch": 1539} {"train_loss": -40.245582580566406, "global_step": 186319, "epoch": 1539} {"train_loss": -40.19857406616211, "global_step": 186320, "epoch": 1539} {"train_loss": -39.934688568115234, "global_step": 186321, "epoch": 1539} {"train_loss": -39.47150421142578, "global_step": 186322, "epoch": 1539} {"train_loss": -39.581050872802734, "global_step": 186323, "epoch": 1539} {"train_loss": -40.64923095703125, "global_step": 186324, "epoch": 1539} {"train_loss": -39.77206039428711, "global_step": 186325, "epoch": 1539} {"train_loss": -39.12295150756836, "global_step": 186326, "epoch": 1539} {"train_loss": -40.15177917480469, "global_step": 186327, "epoch": 1539} {"train_loss": -40.21906280517578, "global_step": 186328, "epoch": 1539} {"train_loss": -39.33039474487305, "global_step": 186329, "epoch": 1539} {"train_loss": -40.33968734741211, "global_step": 186330, "epoch": 1539} {"train_loss": -40.780799865722656, "global_step": 186331, "epoch": 1539} {"train_loss": -40.557647705078125, "global_step": 186332, "epoch": 1539} {"train_loss": -41.260372161865234, "global_step": 186333, "epoch": 1539} {"train_loss": -41.03353500366211, "global_step": 186334, "epoch": 1539} {"train_loss": -41.07505416870117, "global_step": 186335, "epoch": 1539} {"train_loss": -40.60670852661133, "global_step": 186336, "epoch": 1539} {"train_loss": -40.67774963378906, "global_step": 186337, "epoch": 1539} {"train_loss": -41.10095977783203, "global_step": 186338, "epoch": 1539} {"train_loss": -40.421676288951524, "global_step": 186339, "epoch": 1539, "val_loss": 2608827.75} {"train_loss": -40.20181655883789, "global_step": 186340, "epoch": 1540} {"train_loss": -41.28325653076172, "global_step": 186341, "epoch": 1540} {"train_loss": -40.48000717163086, "global_step": 186342, "epoch": 1540} {"train_loss": -41.234066009521484, "global_step": 186343, "epoch": 1540} {"train_loss": -40.79753494262695, "global_step": 186344, "epoch": 1540} {"train_loss": -40.571624755859375, "global_step": 186345, "epoch": 1540} {"train_loss": -40.89813995361328, "global_step": 186346, "epoch": 1540} {"train_loss": -39.88778305053711, "global_step": 186347, "epoch": 1540} {"train_loss": -41.993446350097656, "global_step": 186348, "epoch": 1540} {"train_loss": -41.237892150878906, "global_step": 186349, "epoch": 1540} {"train_loss": -41.61970138549805, "global_step": 186350, "epoch": 1540} {"train_loss": -41.498531341552734, "global_step": 186351, "epoch": 1540} {"train_loss": -40.19765853881836, "global_step": 186352, "epoch": 1540} {"train_loss": -40.19339370727539, "global_step": 186353, "epoch": 1540} {"train_loss": -41.15612030029297, "global_step": 186354, "epoch": 1540} {"train_loss": -38.96274948120117, "global_step": 186355, "epoch": 1540} {"train_loss": -41.00297164916992, "global_step": 186356, "epoch": 1540} {"train_loss": -41.434608459472656, "global_step": 186357, "epoch": 1540} {"train_loss": -38.13010787963867, "global_step": 186358, "epoch": 1540} {"train_loss": -41.185829162597656, "global_step": 186359, "epoch": 1540} {"train_loss": -40.367984771728516, "global_step": 186360, "epoch": 1540} {"train_loss": -40.29852294921875, "global_step": 186361, "epoch": 1540} {"train_loss": -40.8188362121582, "global_step": 186362, "epoch": 1540} {"train_loss": -40.642417907714844, "global_step": 186363, "epoch": 1540} {"train_loss": -40.7150764465332, "global_step": 186364, "epoch": 1540} {"train_loss": -39.89658737182617, "global_step": 186365, "epoch": 1540} {"train_loss": -40.240047454833984, "global_step": 186366, "epoch": 1540} {"train_loss": -40.812843322753906, "global_step": 186367, "epoch": 1540} {"train_loss": -41.281497955322266, "global_step": 186368, "epoch": 1540} {"train_loss": -38.8621826171875, "global_step": 186369, "epoch": 1540} {"train_loss": -41.46337890625, "global_step": 186370, "epoch": 1540} {"train_loss": -40.84991455078125, "global_step": 186371, "epoch": 1540} {"train_loss": -41.67879867553711, "global_step": 186372, "epoch": 1540} {"train_loss": -41.08028793334961, "global_step": 186373, "epoch": 1540} {"train_loss": -39.4890022277832, "global_step": 186374, "epoch": 1540} {"train_loss": -36.12548065185547, "global_step": 186375, "epoch": 1540} {"train_loss": -39.35672378540039, "global_step": 186376, "epoch": 1540} {"train_loss": -41.42556381225586, "global_step": 186377, "epoch": 1540} {"train_loss": -40.118160247802734, "global_step": 186378, "epoch": 1540} {"train_loss": -40.77756881713867, "global_step": 186379, "epoch": 1540} {"train_loss": -38.576351165771484, "global_step": 186380, "epoch": 1540} {"train_loss": -41.16023254394531, "global_step": 186381, "epoch": 1540} {"train_loss": -37.45976257324219, "global_step": 186382, "epoch": 1540} {"train_loss": -41.2142448425293, "global_step": 186383, "epoch": 1540} {"train_loss": -41.78536605834961, "global_step": 186384, "epoch": 1540} {"train_loss": -40.3943977355957, "global_step": 186385, "epoch": 1540} {"train_loss": -41.05287551879883, "global_step": 186386, "epoch": 1540} {"train_loss": -41.445743560791016, "global_step": 186387, "epoch": 1540} {"train_loss": -34.28048324584961, "global_step": 186388, "epoch": 1540} {"train_loss": -41.088314056396484, "global_step": 186389, "epoch": 1540} {"train_loss": -41.285274505615234, "global_step": 186390, "epoch": 1540} {"train_loss": -40.689117431640625, "global_step": 186391, "epoch": 1540} {"train_loss": -40.805702209472656, "global_step": 186392, "epoch": 1540} {"train_loss": -40.240142822265625, "global_step": 186393, "epoch": 1540} {"train_loss": -41.75495147705078, "global_step": 186394, "epoch": 1540} {"train_loss": -41.260433197021484, "global_step": 186395, "epoch": 1540} {"train_loss": -39.15941619873047, "global_step": 186396, "epoch": 1540} {"train_loss": -40.61271286010742, "global_step": 186397, "epoch": 1540} {"train_loss": -38.96639633178711, "global_step": 186398, "epoch": 1540} {"train_loss": -39.99598693847656, "global_step": 186399, "epoch": 1540} {"train_loss": -40.315608978271484, "global_step": 186400, "epoch": 1540} {"train_loss": -40.49085235595703, "global_step": 186401, "epoch": 1540} {"train_loss": -40.60061264038086, "global_step": 186402, "epoch": 1540} {"train_loss": -37.99128341674805, "global_step": 186403, "epoch": 1540} {"train_loss": -41.301429748535156, "global_step": 186404, "epoch": 1540} {"train_loss": -40.931053161621094, "global_step": 186405, "epoch": 1540} {"train_loss": -40.523494720458984, "global_step": 186406, "epoch": 1540} {"train_loss": -41.089962005615234, "global_step": 186407, "epoch": 1540} {"train_loss": -41.496456146240234, "global_step": 186408, "epoch": 1540} {"train_loss": -41.32563400268555, "global_step": 186409, "epoch": 1540} {"train_loss": -40.1157341003418, "global_step": 186410, "epoch": 1540} {"train_loss": -41.316131591796875, "global_step": 186411, "epoch": 1540} {"train_loss": -41.40964889526367, "global_step": 186412, "epoch": 1540} {"train_loss": -40.3330192565918, "global_step": 186413, "epoch": 1540} {"train_loss": -40.71541213989258, "global_step": 186414, "epoch": 1540} {"train_loss": -39.346717834472656, "global_step": 186415, "epoch": 1540} {"train_loss": -38.61658477783203, "global_step": 186416, "epoch": 1540} {"train_loss": -40.46234130859375, "global_step": 186417, "epoch": 1540} {"train_loss": -39.05735397338867, "global_step": 186418, "epoch": 1540} {"train_loss": -40.27376937866211, "global_step": 186419, "epoch": 1540} {"train_loss": -39.8978157043457, "global_step": 186420, "epoch": 1540} {"train_loss": -39.882904052734375, "global_step": 186421, "epoch": 1540} {"train_loss": -40.94636917114258, "global_step": 186422, "epoch": 1540} {"train_loss": -40.56303787231445, "global_step": 186423, "epoch": 1540} {"train_loss": -39.091426849365234, "global_step": 186424, "epoch": 1540} {"train_loss": -40.778377532958984, "global_step": 186425, "epoch": 1540} {"train_loss": -40.7216682434082, "global_step": 186426, "epoch": 1540} {"train_loss": -40.544918060302734, "global_step": 186427, "epoch": 1540} {"train_loss": -39.871456146240234, "global_step": 186428, "epoch": 1540} {"train_loss": -37.7247428894043, "global_step": 186429, "epoch": 1540} {"train_loss": -38.63459777832031, "global_step": 186430, "epoch": 1540} {"train_loss": -40.15692138671875, "global_step": 186431, "epoch": 1540} {"train_loss": -38.15816116333008, "global_step": 186432, "epoch": 1540} {"train_loss": -34.719764709472656, "global_step": 186433, "epoch": 1540} {"train_loss": -40.58744812011719, "global_step": 186434, "epoch": 1540} {"train_loss": -39.22556686401367, "global_step": 186435, "epoch": 1540} {"train_loss": -38.09889221191406, "global_step": 186436, "epoch": 1540} {"train_loss": -39.15436935424805, "global_step": 186437, "epoch": 1540} {"train_loss": -41.319393157958984, "global_step": 186438, "epoch": 1540} {"train_loss": -39.583614349365234, "global_step": 186439, "epoch": 1540} {"train_loss": -39.59284210205078, "global_step": 186440, "epoch": 1540} {"train_loss": -39.31106185913086, "global_step": 186441, "epoch": 1540} {"train_loss": -38.44337844848633, "global_step": 186442, "epoch": 1540} {"train_loss": -39.944244384765625, "global_step": 186443, "epoch": 1540} {"train_loss": -40.52478790283203, "global_step": 186444, "epoch": 1540} {"train_loss": -40.785430908203125, "global_step": 186445, "epoch": 1540} {"train_loss": -40.944435119628906, "global_step": 186446, "epoch": 1540} {"train_loss": -40.46397018432617, "global_step": 186447, "epoch": 1540} {"train_loss": -40.78937530517578, "global_step": 186448, "epoch": 1540} {"train_loss": -40.069942474365234, "global_step": 186449, "epoch": 1540} {"train_loss": -40.713314056396484, "global_step": 186450, "epoch": 1540} {"train_loss": -33.16102981567383, "global_step": 186451, "epoch": 1540} {"train_loss": -40.31412887573242, "global_step": 186452, "epoch": 1540} {"train_loss": -40.103729248046875, "global_step": 186453, "epoch": 1540} {"train_loss": -40.10710525512695, "global_step": 186454, "epoch": 1540} {"train_loss": -40.78489303588867, "global_step": 186455, "epoch": 1540} {"train_loss": -41.35287094116211, "global_step": 186456, "epoch": 1540} {"train_loss": -39.699581146240234, "global_step": 186457, "epoch": 1540} {"train_loss": -40.25661849975586, "global_step": 186458, "epoch": 1540} {"train_loss": -40.56789016723633, "global_step": 186459, "epoch": 1540} {"train_loss": -40.15691760354791, "global_step": 186460, "epoch": 1540, "val_loss": 2601353.25} {"train_loss": -40.258113861083984, "global_step": 186461, "epoch": 1541} {"train_loss": -41.31108093261719, "global_step": 186462, "epoch": 1541} {"train_loss": -40.970027923583984, "global_step": 186463, "epoch": 1541} {"train_loss": -41.24879455566406, "global_step": 186464, "epoch": 1541} {"train_loss": -40.630821228027344, "global_step": 186465, "epoch": 1541} {"train_loss": -39.847808837890625, "global_step": 186466, "epoch": 1541} {"train_loss": -40.86579132080078, "global_step": 186467, "epoch": 1541} {"train_loss": -41.64008331298828, "global_step": 186468, "epoch": 1541} {"train_loss": -41.270545959472656, "global_step": 186469, "epoch": 1541} {"train_loss": -40.652687072753906, "global_step": 186470, "epoch": 1541} {"train_loss": -41.67888259887695, "global_step": 186471, "epoch": 1541} {"train_loss": -41.28080368041992, "global_step": 186472, "epoch": 1541} {"train_loss": -41.5484619140625, "global_step": 186473, "epoch": 1541} {"train_loss": -40.897335052490234, "global_step": 186474, "epoch": 1541} {"train_loss": -41.02499008178711, "global_step": 186475, "epoch": 1541} {"train_loss": -40.85894775390625, "global_step": 186476, "epoch": 1541} {"train_loss": -41.73220443725586, "global_step": 186477, "epoch": 1541} {"train_loss": -41.33916473388672, "global_step": 186478, "epoch": 1541} {"train_loss": -41.80202102661133, "global_step": 186479, "epoch": 1541} {"train_loss": -41.2681884765625, "global_step": 186480, "epoch": 1541} {"train_loss": -40.69522476196289, "global_step": 186481, "epoch": 1541} {"train_loss": -41.61056137084961, "global_step": 186482, "epoch": 1541} {"train_loss": -41.354061126708984, "global_step": 186483, "epoch": 1541} {"train_loss": -40.536983489990234, "global_step": 186484, "epoch": 1541} {"train_loss": -41.43781280517578, "global_step": 186485, "epoch": 1541} {"train_loss": -41.63580322265625, "global_step": 186486, "epoch": 1541} {"train_loss": -41.046546936035156, "global_step": 186487, "epoch": 1541} {"train_loss": -41.63968276977539, "global_step": 186488, "epoch": 1541} {"train_loss": -41.96160125732422, "global_step": 186489, "epoch": 1541} {"train_loss": -41.9061393737793, "global_step": 186490, "epoch": 1541} {"train_loss": -41.50494384765625, "global_step": 186491, "epoch": 1541} {"train_loss": -41.746681213378906, "global_step": 186492, "epoch": 1541} {"train_loss": -40.63901138305664, "global_step": 186493, "epoch": 1541} {"train_loss": -41.57194137573242, "global_step": 186494, "epoch": 1541} {"train_loss": -41.20862579345703, "global_step": 186495, "epoch": 1541} {"train_loss": -40.66361618041992, "global_step": 186496, "epoch": 1541} {"train_loss": -41.23736572265625, "global_step": 186497, "epoch": 1541} {"train_loss": -41.61517333984375, "global_step": 186498, "epoch": 1541} {"train_loss": -41.626564025878906, "global_step": 186499, "epoch": 1541} {"train_loss": -42.09159851074219, "global_step": 186500, "epoch": 1541} {"train_loss": -41.39201736450195, "global_step": 186501, "epoch": 1541} {"train_loss": -41.04016876220703, "global_step": 186502, "epoch": 1541} {"train_loss": -40.392852783203125, "global_step": 186503, "epoch": 1541} {"train_loss": -41.15975570678711, "global_step": 186504, "epoch": 1541} {"train_loss": -41.26618194580078, "global_step": 186505, "epoch": 1541} {"train_loss": -41.83893966674805, "global_step": 186506, "epoch": 1541} {"train_loss": -41.58259582519531, "global_step": 186507, "epoch": 1541} {"train_loss": -40.54946517944336, "global_step": 186508, "epoch": 1541} {"train_loss": -40.40650177001953, "global_step": 186509, "epoch": 1541} {"train_loss": -42.01190185546875, "global_step": 186510, "epoch": 1541} {"train_loss": -40.21332550048828, "global_step": 186511, "epoch": 1541} {"train_loss": -38.336177825927734, "global_step": 186512, "epoch": 1541} {"train_loss": -37.05397415161133, "global_step": 186513, "epoch": 1541} {"train_loss": -35.04627990722656, "global_step": 186514, "epoch": 1541} {"train_loss": -40.085174560546875, "global_step": 186515, "epoch": 1541} {"train_loss": -41.683677673339844, "global_step": 186516, "epoch": 1541} {"train_loss": -39.80168914794922, "global_step": 186517, "epoch": 1541} {"train_loss": -34.854469299316406, "global_step": 186518, "epoch": 1541} {"train_loss": -31.508289337158203, "global_step": 186519, "epoch": 1541} {"train_loss": -34.04290771484375, "global_step": 186520, "epoch": 1541} {"train_loss": -39.190162658691406, "global_step": 186521, "epoch": 1541} {"train_loss": -37.18872833251953, "global_step": 186522, "epoch": 1541} {"train_loss": -36.49778366088867, "global_step": 186523, "epoch": 1541} {"train_loss": -36.75595474243164, "global_step": 186524, "epoch": 1541} {"train_loss": -38.809085845947266, "global_step": 186525, "epoch": 1541} {"train_loss": -38.6531867980957, "global_step": 186526, "epoch": 1541} {"train_loss": -38.28762435913086, "global_step": 186527, "epoch": 1541} {"train_loss": -40.1151123046875, "global_step": 186528, "epoch": 1541} {"train_loss": -38.5167236328125, "global_step": 186529, "epoch": 1541} {"train_loss": -37.475921630859375, "global_step": 186530, "epoch": 1541} {"train_loss": -39.768959045410156, "global_step": 186531, "epoch": 1541} {"train_loss": -37.6810302734375, "global_step": 186532, "epoch": 1541} {"train_loss": -40.632606506347656, "global_step": 186533, "epoch": 1541} {"train_loss": -39.0306510925293, "global_step": 186534, "epoch": 1541} {"train_loss": -40.092315673828125, "global_step": 186535, "epoch": 1541} {"train_loss": -39.65859603881836, "global_step": 186536, "epoch": 1541} {"train_loss": -40.600250244140625, "global_step": 186537, "epoch": 1541} {"train_loss": -39.48772048950195, "global_step": 186538, "epoch": 1541} {"train_loss": -40.649566650390625, "global_step": 186539, "epoch": 1541} {"train_loss": -40.385902404785156, "global_step": 186540, "epoch": 1541} {"train_loss": -40.844932556152344, "global_step": 186541, "epoch": 1541} {"train_loss": -40.20184326171875, "global_step": 186542, "epoch": 1541} {"train_loss": -40.9915771484375, "global_step": 186543, "epoch": 1541} {"train_loss": -39.91120529174805, "global_step": 186544, "epoch": 1541} {"train_loss": -41.127254486083984, "global_step": 186545, "epoch": 1541} {"train_loss": -40.8314208984375, "global_step": 186546, "epoch": 1541} {"train_loss": -40.925270080566406, "global_step": 186547, "epoch": 1541} {"train_loss": -40.83474349975586, "global_step": 186548, "epoch": 1541} {"train_loss": -40.59037399291992, "global_step": 186549, "epoch": 1541} {"train_loss": -40.562782287597656, "global_step": 186550, "epoch": 1541} {"train_loss": -41.29988479614258, "global_step": 186551, "epoch": 1541} {"train_loss": -40.317813873291016, "global_step": 186552, "epoch": 1541} {"train_loss": -40.426021575927734, "global_step": 186553, "epoch": 1541} {"train_loss": -41.29225540161133, "global_step": 186554, "epoch": 1541} {"train_loss": -40.850830078125, "global_step": 186555, "epoch": 1541} {"train_loss": -41.570194244384766, "global_step": 186556, "epoch": 1541} {"train_loss": -41.2130126953125, "global_step": 186557, "epoch": 1541} {"train_loss": -41.704647064208984, "global_step": 186558, "epoch": 1541} {"train_loss": -41.60529327392578, "global_step": 186559, "epoch": 1541} {"train_loss": -41.396915435791016, "global_step": 186560, "epoch": 1541} {"train_loss": -41.12788009643555, "global_step": 186561, "epoch": 1541} {"train_loss": -41.700225830078125, "global_step": 186562, "epoch": 1541} {"train_loss": -41.47610092163086, "global_step": 186563, "epoch": 1541} {"train_loss": -41.40464401245117, "global_step": 186564, "epoch": 1541} {"train_loss": -41.31960678100586, "global_step": 186565, "epoch": 1541} {"train_loss": -42.05144119262695, "global_step": 186566, "epoch": 1541} {"train_loss": -41.47122573852539, "global_step": 186567, "epoch": 1541} {"train_loss": -41.6186637878418, "global_step": 186568, "epoch": 1541} {"train_loss": -41.973812103271484, "global_step": 186569, "epoch": 1541} {"train_loss": -41.67293930053711, "global_step": 186570, "epoch": 1541} {"train_loss": -41.93076705932617, "global_step": 186571, "epoch": 1541} {"train_loss": -42.0706672668457, "global_step": 186572, "epoch": 1541} {"train_loss": -41.85480499267578, "global_step": 186573, "epoch": 1541} {"train_loss": -42.458431243896484, "global_step": 186574, "epoch": 1541} {"train_loss": -42.121543884277344, "global_step": 186575, "epoch": 1541} {"train_loss": -41.970924377441406, "global_step": 186576, "epoch": 1541} {"train_loss": -41.89019775390625, "global_step": 186577, "epoch": 1541} {"train_loss": -41.812232971191406, "global_step": 186578, "epoch": 1541} {"train_loss": -42.10453414916992, "global_step": 186579, "epoch": 1541} {"train_loss": -42.35209274291992, "global_step": 186580, "epoch": 1541} {"train_loss": -40.58090187892441, "global_step": 186581, "epoch": 1541, "val_loss": 2684375.25} {"train_loss": -42.44810104370117, "global_step": 186582, "epoch": 1542} {"train_loss": -42.0404167175293, "global_step": 186583, "epoch": 1542} {"train_loss": -41.617061614990234, "global_step": 186584, "epoch": 1542} {"train_loss": -41.75271224975586, "global_step": 186585, "epoch": 1542} {"train_loss": -41.57313919067383, "global_step": 186586, "epoch": 1542} {"train_loss": -41.3018798828125, "global_step": 186587, "epoch": 1542} {"train_loss": -40.82386779785156, "global_step": 186588, "epoch": 1542} {"train_loss": -42.37949752807617, "global_step": 186589, "epoch": 1542} {"train_loss": -42.11745834350586, "global_step": 186590, "epoch": 1542} {"train_loss": -41.201663970947266, "global_step": 186591, "epoch": 1542} {"train_loss": -39.909183502197266, "global_step": 186592, "epoch": 1542} {"train_loss": -40.5782470703125, "global_step": 186593, "epoch": 1542} {"train_loss": -42.24102020263672, "global_step": 186594, "epoch": 1542} {"train_loss": -41.58106231689453, "global_step": 186595, "epoch": 1542} {"train_loss": -39.06563186645508, "global_step": 186596, "epoch": 1542} {"train_loss": -34.847930908203125, "global_step": 186597, "epoch": 1542} {"train_loss": -37.65776062011719, "global_step": 186598, "epoch": 1542} {"train_loss": -41.09744644165039, "global_step": 186599, "epoch": 1542} {"train_loss": -40.969757080078125, "global_step": 186600, "epoch": 1542} {"train_loss": -38.575416564941406, "global_step": 186601, "epoch": 1542} {"train_loss": -37.99071502685547, "global_step": 186602, "epoch": 1542} {"train_loss": -39.34391403198242, "global_step": 186603, "epoch": 1542} {"train_loss": -40.07441329956055, "global_step": 186604, "epoch": 1542} {"train_loss": -40.073299407958984, "global_step": 186605, "epoch": 1542} {"train_loss": -40.64411926269531, "global_step": 186606, "epoch": 1542} {"train_loss": -40.956600189208984, "global_step": 186607, "epoch": 1542} {"train_loss": -40.68397903442383, "global_step": 186608, "epoch": 1542} {"train_loss": -40.5511589050293, "global_step": 186609, "epoch": 1542} {"train_loss": -40.76188278198242, "global_step": 186610, "epoch": 1542} {"train_loss": -41.41178894042969, "global_step": 186611, "epoch": 1542} {"train_loss": -40.16199493408203, "global_step": 186612, "epoch": 1542} {"train_loss": -40.48727035522461, "global_step": 186613, "epoch": 1542} {"train_loss": -40.71922302246094, "global_step": 186614, "epoch": 1542} {"train_loss": -40.76505661010742, "global_step": 186615, "epoch": 1542} {"train_loss": -41.80736541748047, "global_step": 186616, "epoch": 1542} {"train_loss": -41.20061111450195, "global_step": 186617, "epoch": 1542} {"train_loss": -40.59170150756836, "global_step": 186618, "epoch": 1542} {"train_loss": -38.98590850830078, "global_step": 186619, "epoch": 1542} {"train_loss": -40.35053253173828, "global_step": 186620, "epoch": 1542} {"train_loss": -39.42096710205078, "global_step": 186621, "epoch": 1542} {"train_loss": -41.32077407836914, "global_step": 186622, "epoch": 1542} {"train_loss": -40.83466720581055, "global_step": 186623, "epoch": 1542} {"train_loss": -41.02940368652344, "global_step": 186624, "epoch": 1542} {"train_loss": -42.121822357177734, "global_step": 186625, "epoch": 1542} {"train_loss": -40.333534240722656, "global_step": 186626, "epoch": 1542} {"train_loss": -40.804603576660156, "global_step": 186627, "epoch": 1542} {"train_loss": -41.40574645996094, "global_step": 186628, "epoch": 1542} {"train_loss": -38.54307174682617, "global_step": 186629, "epoch": 1542} {"train_loss": -39.556129455566406, "global_step": 186630, "epoch": 1542} {"train_loss": -41.32694625854492, "global_step": 186631, "epoch": 1542} {"train_loss": -38.4363899230957, "global_step": 186632, "epoch": 1542} {"train_loss": -39.866676330566406, "global_step": 186633, "epoch": 1542} {"train_loss": -40.22408676147461, "global_step": 186634, "epoch": 1542} {"train_loss": -39.80870819091797, "global_step": 186635, "epoch": 1542} {"train_loss": -38.03772735595703, "global_step": 186636, "epoch": 1542} {"train_loss": -34.81438064575195, "global_step": 186637, "epoch": 1542} {"train_loss": -40.609222412109375, "global_step": 186638, "epoch": 1542} {"train_loss": -39.16121292114258, "global_step": 186639, "epoch": 1542} {"train_loss": -38.585323333740234, "global_step": 186640, "epoch": 1542} {"train_loss": -39.38644790649414, "global_step": 186641, "epoch": 1542} {"train_loss": -37.26139450073242, "global_step": 186642, "epoch": 1542} {"train_loss": -39.8331184387207, "global_step": 186643, "epoch": 1542} {"train_loss": -38.636627197265625, "global_step": 186644, "epoch": 1542} {"train_loss": -39.408302307128906, "global_step": 186645, "epoch": 1542} {"train_loss": -37.2897834777832, "global_step": 186646, "epoch": 1542} {"train_loss": -38.24274444580078, "global_step": 186647, "epoch": 1542} {"train_loss": -39.4726448059082, "global_step": 186648, "epoch": 1542} {"train_loss": -34.38241195678711, "global_step": 186649, "epoch": 1542} {"train_loss": -40.206336975097656, "global_step": 186650, "epoch": 1542} {"train_loss": -40.3782958984375, "global_step": 186651, "epoch": 1542} {"train_loss": -34.046478271484375, "global_step": 186652, "epoch": 1542} {"train_loss": -38.37469482421875, "global_step": 186653, "epoch": 1542} {"train_loss": -40.29880905151367, "global_step": 186654, "epoch": 1542} {"train_loss": -38.70101547241211, "global_step": 186655, "epoch": 1542} {"train_loss": -37.73075485229492, "global_step": 186656, "epoch": 1542} {"train_loss": -39.79925537109375, "global_step": 186657, "epoch": 1542} {"train_loss": -39.72615051269531, "global_step": 186658, "epoch": 1542} {"train_loss": -40.366859436035156, "global_step": 186659, "epoch": 1542} {"train_loss": -39.12733840942383, "global_step": 186660, "epoch": 1542} {"train_loss": -39.77338409423828, "global_step": 186661, "epoch": 1542} {"train_loss": -32.918365478515625, "global_step": 186662, "epoch": 1542} {"train_loss": -40.09619140625, "global_step": 186663, "epoch": 1542} {"train_loss": -39.5181770324707, "global_step": 186664, "epoch": 1542} {"train_loss": -40.57503890991211, "global_step": 186665, "epoch": 1542} {"train_loss": -37.602577209472656, "global_step": 186666, "epoch": 1542} {"train_loss": -40.86849594116211, "global_step": 186667, "epoch": 1542} {"train_loss": -39.22733688354492, "global_step": 186668, "epoch": 1542} {"train_loss": -39.695594787597656, "global_step": 186669, "epoch": 1542} {"train_loss": -40.0279655456543, "global_step": 186670, "epoch": 1542} {"train_loss": -35.5787353515625, "global_step": 186671, "epoch": 1542} {"train_loss": -39.92820358276367, "global_step": 186672, "epoch": 1542} {"train_loss": -39.20054244995117, "global_step": 186673, "epoch": 1542} {"train_loss": -39.97261428833008, "global_step": 186674, "epoch": 1542} {"train_loss": -39.805023193359375, "global_step": 186675, "epoch": 1542} {"train_loss": -37.85776138305664, "global_step": 186676, "epoch": 1542} {"train_loss": -38.491371154785156, "global_step": 186677, "epoch": 1542} {"train_loss": -40.538848876953125, "global_step": 186678, "epoch": 1542} {"train_loss": -40.55329132080078, "global_step": 186679, "epoch": 1542} {"train_loss": -40.27349853515625, "global_step": 186680, "epoch": 1542} {"train_loss": -40.97774887084961, "global_step": 186681, "epoch": 1542} {"train_loss": -38.91313552856445, "global_step": 186682, "epoch": 1542} {"train_loss": -40.06642532348633, "global_step": 186683, "epoch": 1542} {"train_loss": -40.83608627319336, "global_step": 186684, "epoch": 1542} {"train_loss": -40.02138137817383, "global_step": 186685, "epoch": 1542} {"train_loss": -39.483154296875, "global_step": 186686, "epoch": 1542} {"train_loss": -38.859649658203125, "global_step": 186687, "epoch": 1542} {"train_loss": -39.510772705078125, "global_step": 186688, "epoch": 1542} {"train_loss": -40.02786636352539, "global_step": 186689, "epoch": 1542} {"train_loss": -39.56743240356445, "global_step": 186690, "epoch": 1542} {"train_loss": -40.12395095825195, "global_step": 186691, "epoch": 1542} {"train_loss": -40.96770477294922, "global_step": 186692, "epoch": 1542} {"train_loss": -40.37667465209961, "global_step": 186693, "epoch": 1542} {"train_loss": -41.000946044921875, "global_step": 186694, "epoch": 1542} {"train_loss": -41.38401412963867, "global_step": 186695, "epoch": 1542} {"train_loss": -40.62766647338867, "global_step": 186696, "epoch": 1542} {"train_loss": -40.99229049682617, "global_step": 186697, "epoch": 1542} {"train_loss": -41.559017181396484, "global_step": 186698, "epoch": 1542} {"train_loss": -41.06116485595703, "global_step": 186699, "epoch": 1542} {"train_loss": -41.2136344909668, "global_step": 186700, "epoch": 1542} {"train_loss": -41.20504379272461, "global_step": 186701, "epoch": 1542} {"train_loss": -39.85317996316705, "global_step": 186702, "epoch": 1542, "val_loss": 2745756.5} {"train_loss": -41.18739700317383, "global_step": 186703, "epoch": 1543} {"train_loss": -41.28034591674805, "global_step": 186704, "epoch": 1543} {"train_loss": -40.43879318237305, "global_step": 186705, "epoch": 1543} {"train_loss": -41.19243621826172, "global_step": 186706, "epoch": 1543} {"train_loss": -41.2286491394043, "global_step": 186707, "epoch": 1543} {"train_loss": -40.6713981628418, "global_step": 186708, "epoch": 1543} {"train_loss": -41.17055130004883, "global_step": 186709, "epoch": 1543} {"train_loss": -41.84200668334961, "global_step": 186710, "epoch": 1543} {"train_loss": -41.3510856628418, "global_step": 186711, "epoch": 1543} {"train_loss": -41.59482955932617, "global_step": 186712, "epoch": 1543} {"train_loss": -41.75922393798828, "global_step": 186713, "epoch": 1543} {"train_loss": -40.45490646362305, "global_step": 186714, "epoch": 1543} {"train_loss": -41.17202377319336, "global_step": 186715, "epoch": 1543} {"train_loss": -41.42306137084961, "global_step": 186716, "epoch": 1543} {"train_loss": -42.16497039794922, "global_step": 186717, "epoch": 1543} {"train_loss": -41.358821868896484, "global_step": 186718, "epoch": 1543} {"train_loss": -42.094696044921875, "global_step": 186719, "epoch": 1543} {"train_loss": -42.011207580566406, "global_step": 186720, "epoch": 1543} {"train_loss": -41.122779846191406, "global_step": 186721, "epoch": 1543} {"train_loss": -42.265159606933594, "global_step": 186722, "epoch": 1543} {"train_loss": -41.7611198425293, "global_step": 186723, "epoch": 1543} {"train_loss": -41.61774826049805, "global_step": 186724, "epoch": 1543} {"train_loss": -41.76237869262695, "global_step": 186725, "epoch": 1543} {"train_loss": -41.46744155883789, "global_step": 186726, "epoch": 1543} {"train_loss": -41.528194427490234, "global_step": 186727, "epoch": 1543} {"train_loss": -40.52439498901367, "global_step": 186728, "epoch": 1543} {"train_loss": -40.82463455200195, "global_step": 186729, "epoch": 1543} {"train_loss": -41.91298294067383, "global_step": 186730, "epoch": 1543} {"train_loss": -41.43709945678711, "global_step": 186731, "epoch": 1543} {"train_loss": -40.98411178588867, "global_step": 186732, "epoch": 1543} {"train_loss": -40.97056198120117, "global_step": 186733, "epoch": 1543} {"train_loss": -40.94639205932617, "global_step": 186734, "epoch": 1543} {"train_loss": -41.39126205444336, "global_step": 186735, "epoch": 1543} {"train_loss": -41.445247650146484, "global_step": 186736, "epoch": 1543} {"train_loss": -40.77106857299805, "global_step": 186737, "epoch": 1543} {"train_loss": -40.393157958984375, "global_step": 186738, "epoch": 1543} {"train_loss": -40.59944152832031, "global_step": 186739, "epoch": 1543} {"train_loss": -40.702266693115234, "global_step": 186740, "epoch": 1543} {"train_loss": -40.33560562133789, "global_step": 186741, "epoch": 1543} {"train_loss": -41.72118377685547, "global_step": 186742, "epoch": 1543} {"train_loss": -41.68971633911133, "global_step": 186743, "epoch": 1543} {"train_loss": -40.9909782409668, "global_step": 186744, "epoch": 1543} {"train_loss": -41.279052734375, "global_step": 186745, "epoch": 1543} {"train_loss": -41.296016693115234, "global_step": 186746, "epoch": 1543} {"train_loss": -41.03971481323242, "global_step": 186747, "epoch": 1543} {"train_loss": -41.7902717590332, "global_step": 186748, "epoch": 1543} {"train_loss": -41.15468978881836, "global_step": 186749, "epoch": 1543} {"train_loss": -41.15912628173828, "global_step": 186750, "epoch": 1543} {"train_loss": -41.51264572143555, "global_step": 186751, "epoch": 1543} {"train_loss": -41.742523193359375, "global_step": 186752, "epoch": 1543} {"train_loss": -40.56333541870117, "global_step": 186753, "epoch": 1543} {"train_loss": -40.90278625488281, "global_step": 186754, "epoch": 1543} {"train_loss": -39.73726272583008, "global_step": 186755, "epoch": 1543} {"train_loss": -38.24999237060547, "global_step": 186756, "epoch": 1543} {"train_loss": -39.40343475341797, "global_step": 186757, "epoch": 1543} {"train_loss": -40.657711029052734, "global_step": 186758, "epoch": 1543} {"train_loss": -40.847503662109375, "global_step": 186759, "epoch": 1543} {"train_loss": -39.57888412475586, "global_step": 186760, "epoch": 1543} {"train_loss": -39.453369140625, "global_step": 186761, "epoch": 1543} {"train_loss": -40.31534957885742, "global_step": 186762, "epoch": 1543} {"train_loss": -40.98529815673828, "global_step": 186763, "epoch": 1543} {"train_loss": -39.058349609375, "global_step": 186764, "epoch": 1543} {"train_loss": -38.41459274291992, "global_step": 186765, "epoch": 1543} {"train_loss": -40.335662841796875, "global_step": 186766, "epoch": 1543} {"train_loss": -39.98203659057617, "global_step": 186767, "epoch": 1543} {"train_loss": -38.23246383666992, "global_step": 186768, "epoch": 1543} {"train_loss": -40.10824203491211, "global_step": 186769, "epoch": 1543} {"train_loss": -39.51109313964844, "global_step": 186770, "epoch": 1543} {"train_loss": -39.32725143432617, "global_step": 186771, "epoch": 1543} {"train_loss": -39.30623245239258, "global_step": 186772, "epoch": 1543} {"train_loss": -40.994258880615234, "global_step": 186773, "epoch": 1543} {"train_loss": -39.42865753173828, "global_step": 186774, "epoch": 1543} {"train_loss": -39.24463653564453, "global_step": 186775, "epoch": 1543} {"train_loss": -39.774044036865234, "global_step": 186776, "epoch": 1543} {"train_loss": -39.75848388671875, "global_step": 186777, "epoch": 1543} {"train_loss": -40.256229400634766, "global_step": 186778, "epoch": 1543} {"train_loss": -40.75087356567383, "global_step": 186779, "epoch": 1543} {"train_loss": -40.755897521972656, "global_step": 186780, "epoch": 1543} {"train_loss": -41.25321578979492, "global_step": 186781, "epoch": 1543} {"train_loss": -41.21549606323242, "global_step": 186782, "epoch": 1543} {"train_loss": -41.500831604003906, "global_step": 186783, "epoch": 1543} {"train_loss": -41.639984130859375, "global_step": 186784, "epoch": 1543} {"train_loss": -41.47914505004883, "global_step": 186785, "epoch": 1543} {"train_loss": -41.9246711730957, "global_step": 186786, "epoch": 1543} {"train_loss": -41.43527603149414, "global_step": 186787, "epoch": 1543} {"train_loss": -41.27834701538086, "global_step": 186788, "epoch": 1543} {"train_loss": -41.78499984741211, "global_step": 186789, "epoch": 1543} {"train_loss": -41.51778030395508, "global_step": 186790, "epoch": 1543} {"train_loss": -41.0528678894043, "global_step": 186791, "epoch": 1543} {"train_loss": -41.76613998413086, "global_step": 186792, "epoch": 1543} {"train_loss": -40.8513069152832, "global_step": 186793, "epoch": 1543} {"train_loss": -41.60717010498047, "global_step": 186794, "epoch": 1543} {"train_loss": -41.7360954284668, "global_step": 186795, "epoch": 1543} {"train_loss": -41.72983932495117, "global_step": 186796, "epoch": 1543} {"train_loss": -40.85675811767578, "global_step": 186797, "epoch": 1543} {"train_loss": -41.831207275390625, "global_step": 186798, "epoch": 1543} {"train_loss": -37.47365951538086, "global_step": 186799, "epoch": 1543} {"train_loss": -41.155452728271484, "global_step": 186800, "epoch": 1543} {"train_loss": -41.35871505737305, "global_step": 186801, "epoch": 1543} {"train_loss": -41.66676330566406, "global_step": 186802, "epoch": 1543} {"train_loss": -40.747886657714844, "global_step": 186803, "epoch": 1543} {"train_loss": -41.351558685302734, "global_step": 186804, "epoch": 1543} {"train_loss": -39.55562973022461, "global_step": 186805, "epoch": 1543} {"train_loss": -41.50907516479492, "global_step": 186806, "epoch": 1543} {"train_loss": -41.15530014038086, "global_step": 186807, "epoch": 1543} {"train_loss": -40.706268310546875, "global_step": 186808, "epoch": 1543} {"train_loss": -39.783870697021484, "global_step": 186809, "epoch": 1543} {"train_loss": -40.018577575683594, "global_step": 186810, "epoch": 1543} {"train_loss": -41.05129623413086, "global_step": 186811, "epoch": 1543} {"train_loss": -40.78516387939453, "global_step": 186812, "epoch": 1543} {"train_loss": -40.82020950317383, "global_step": 186813, "epoch": 1543} {"train_loss": -39.512149810791016, "global_step": 186814, "epoch": 1543} {"train_loss": -39.58433532714844, "global_step": 186815, "epoch": 1543} {"train_loss": -40.94172286987305, "global_step": 186816, "epoch": 1543} {"train_loss": -39.61603927612305, "global_step": 186817, "epoch": 1543} {"train_loss": -38.87899398803711, "global_step": 186818, "epoch": 1543} {"train_loss": -40.6345329284668, "global_step": 186819, "epoch": 1543} {"train_loss": -41.077640533447266, "global_step": 186820, "epoch": 1543} {"train_loss": -38.73408889770508, "global_step": 186821, "epoch": 1543} {"train_loss": -39.6049690246582, "global_step": 186822, "epoch": 1543} {"train_loss": -40.78849546574364, "global_step": 186823, "epoch": 1543, "val_loss": 2673999.75} {"train_loss": -37.103477478027344, "global_step": 186824, "epoch": 1544} {"train_loss": -40.6750602722168, "global_step": 186825, "epoch": 1544} {"train_loss": -39.676483154296875, "global_step": 186826, "epoch": 1544} {"train_loss": -36.79989242553711, "global_step": 186827, "epoch": 1544} {"train_loss": -40.23600387573242, "global_step": 186828, "epoch": 1544} {"train_loss": -39.243560791015625, "global_step": 186829, "epoch": 1544} {"train_loss": -37.507381439208984, "global_step": 186830, "epoch": 1544} {"train_loss": -40.26803207397461, "global_step": 186831, "epoch": 1544} {"train_loss": -39.24738693237305, "global_step": 186832, "epoch": 1544} {"train_loss": -39.58359909057617, "global_step": 186833, "epoch": 1544} {"train_loss": -40.05947494506836, "global_step": 186834, "epoch": 1544} {"train_loss": -38.3619384765625, "global_step": 186835, "epoch": 1544} {"train_loss": -39.84638214111328, "global_step": 186836, "epoch": 1544} {"train_loss": -40.2275390625, "global_step": 186837, "epoch": 1544} {"train_loss": -39.32307052612305, "global_step": 186838, "epoch": 1544} {"train_loss": -40.18262481689453, "global_step": 186839, "epoch": 1544} {"train_loss": -41.129817962646484, "global_step": 186840, "epoch": 1544} {"train_loss": -39.667110443115234, "global_step": 186841, "epoch": 1544} {"train_loss": -40.699790954589844, "global_step": 186842, "epoch": 1544} {"train_loss": -39.43599319458008, "global_step": 186843, "epoch": 1544} {"train_loss": -36.7894287109375, "global_step": 186844, "epoch": 1544} {"train_loss": -40.719844818115234, "global_step": 186845, "epoch": 1544} {"train_loss": -39.166072845458984, "global_step": 186846, "epoch": 1544} {"train_loss": -38.37579345703125, "global_step": 186847, "epoch": 1544} {"train_loss": -40.33314895629883, "global_step": 186848, "epoch": 1544} {"train_loss": -39.517616271972656, "global_step": 186849, "epoch": 1544} {"train_loss": -39.56333541870117, "global_step": 186850, "epoch": 1544} {"train_loss": -40.73097610473633, "global_step": 186851, "epoch": 1544} {"train_loss": -39.62237548828125, "global_step": 186852, "epoch": 1544} {"train_loss": -40.62435531616211, "global_step": 186853, "epoch": 1544} {"train_loss": -39.145851135253906, "global_step": 186854, "epoch": 1544} {"train_loss": -40.618377685546875, "global_step": 186855, "epoch": 1544} {"train_loss": -39.59662628173828, "global_step": 186856, "epoch": 1544} {"train_loss": -39.264923095703125, "global_step": 186857, "epoch": 1544} {"train_loss": -40.67223358154297, "global_step": 186858, "epoch": 1544} {"train_loss": -38.716835021972656, "global_step": 186859, "epoch": 1544} {"train_loss": -40.5587272644043, "global_step": 186860, "epoch": 1544} {"train_loss": -40.43292999267578, "global_step": 186861, "epoch": 1544} {"train_loss": -40.98698043823242, "global_step": 186862, "epoch": 1544} {"train_loss": -40.86660385131836, "global_step": 186863, "epoch": 1544} {"train_loss": -40.920867919921875, "global_step": 186864, "epoch": 1544} {"train_loss": -41.04785919189453, "global_step": 186865, "epoch": 1544} {"train_loss": -41.02071762084961, "global_step": 186866, "epoch": 1544} {"train_loss": -41.06290817260742, "global_step": 186867, "epoch": 1544} {"train_loss": -41.16284942626953, "global_step": 186868, "epoch": 1544} {"train_loss": -40.957557678222656, "global_step": 186869, "epoch": 1544} {"train_loss": -41.63214874267578, "global_step": 186870, "epoch": 1544} {"train_loss": -41.395023345947266, "global_step": 186871, "epoch": 1544} {"train_loss": -41.420047760009766, "global_step": 186872, "epoch": 1544} {"train_loss": -41.204647064208984, "global_step": 186873, "epoch": 1544} {"train_loss": -41.73768997192383, "global_step": 186874, "epoch": 1544} {"train_loss": -41.8536491394043, "global_step": 186875, "epoch": 1544} {"train_loss": -41.313289642333984, "global_step": 186876, "epoch": 1544} {"train_loss": -41.54542541503906, "global_step": 186877, "epoch": 1544} {"train_loss": -41.500457763671875, "global_step": 186878, "epoch": 1544} {"train_loss": -42.00520706176758, "global_step": 186879, "epoch": 1544} {"train_loss": -41.619178771972656, "global_step": 186880, "epoch": 1544} {"train_loss": -41.77251434326172, "global_step": 186881, "epoch": 1544} {"train_loss": -41.804168701171875, "global_step": 186882, "epoch": 1544} {"train_loss": -41.67995834350586, "global_step": 186883, "epoch": 1544} {"train_loss": -41.64854431152344, "global_step": 186884, "epoch": 1544} {"train_loss": -41.59939193725586, "global_step": 186885, "epoch": 1544} {"train_loss": -41.89834976196289, "global_step": 186886, "epoch": 1544} {"train_loss": -42.243221282958984, "global_step": 186887, "epoch": 1544} {"train_loss": -42.018714904785156, "global_step": 186888, "epoch": 1544} {"train_loss": -41.98540115356445, "global_step": 186889, "epoch": 1544} {"train_loss": -42.09364700317383, "global_step": 186890, "epoch": 1544} {"train_loss": -42.209835052490234, "global_step": 186891, "epoch": 1544} {"train_loss": -41.472171783447266, "global_step": 186892, "epoch": 1544} {"train_loss": -41.774436950683594, "global_step": 186893, "epoch": 1544} {"train_loss": -41.970123291015625, "global_step": 186894, "epoch": 1544} {"train_loss": -41.7223014831543, "global_step": 186895, "epoch": 1544} {"train_loss": -42.476837158203125, "global_step": 186896, "epoch": 1544} {"train_loss": -41.7067985534668, "global_step": 186897, "epoch": 1544} {"train_loss": -42.15707015991211, "global_step": 186898, "epoch": 1544} {"train_loss": -42.31338119506836, "global_step": 186899, "epoch": 1544} {"train_loss": -42.38351058959961, "global_step": 186900, "epoch": 1544} {"train_loss": -42.34281539916992, "global_step": 186901, "epoch": 1544} {"train_loss": -42.39012908935547, "global_step": 186902, "epoch": 1544} {"train_loss": -42.47334671020508, "global_step": 186903, "epoch": 1544} {"train_loss": -42.043434143066406, "global_step": 186904, "epoch": 1544} {"train_loss": -41.66384506225586, "global_step": 186905, "epoch": 1544} {"train_loss": -42.31169509887695, "global_step": 186906, "epoch": 1544} {"train_loss": -42.186031341552734, "global_step": 186907, "epoch": 1544} {"train_loss": -41.920074462890625, "global_step": 186908, "epoch": 1544} {"train_loss": -42.1750602722168, "global_step": 186909, "epoch": 1544} {"train_loss": -41.15703201293945, "global_step": 186910, "epoch": 1544} {"train_loss": -41.08153533935547, "global_step": 186911, "epoch": 1544} {"train_loss": -42.2205810546875, "global_step": 186912, "epoch": 1544} {"train_loss": -42.75220489501953, "global_step": 186913, "epoch": 1544} {"train_loss": -42.55376434326172, "global_step": 186914, "epoch": 1544} {"train_loss": -41.87228012084961, "global_step": 186915, "epoch": 1544} {"train_loss": -38.29526901245117, "global_step": 186916, "epoch": 1544} {"train_loss": -41.982967376708984, "global_step": 186917, "epoch": 1544} {"train_loss": -41.83185958862305, "global_step": 186918, "epoch": 1544} {"train_loss": -42.304443359375, "global_step": 186919, "epoch": 1544} {"train_loss": -41.727569580078125, "global_step": 186920, "epoch": 1544} {"train_loss": -40.61362838745117, "global_step": 186921, "epoch": 1544} {"train_loss": -41.70561599731445, "global_step": 186922, "epoch": 1544} {"train_loss": -41.7713508605957, "global_step": 186923, "epoch": 1544} {"train_loss": -40.858760833740234, "global_step": 186924, "epoch": 1544} {"train_loss": -40.85894012451172, "global_step": 186925, "epoch": 1544} {"train_loss": -40.291465759277344, "global_step": 186926, "epoch": 1544} {"train_loss": -39.931392669677734, "global_step": 186927, "epoch": 1544} {"train_loss": -39.74934768676758, "global_step": 186928, "epoch": 1544} {"train_loss": -40.21870040893555, "global_step": 186929, "epoch": 1544} {"train_loss": -40.60834884643555, "global_step": 186930, "epoch": 1544} {"train_loss": -38.964351654052734, "global_step": 186931, "epoch": 1544} {"train_loss": -38.183712005615234, "global_step": 186932, "epoch": 1544} {"train_loss": -41.720680236816406, "global_step": 186933, "epoch": 1544} {"train_loss": -41.54179000854492, "global_step": 186934, "epoch": 1544} {"train_loss": -37.51596450805664, "global_step": 186935, "epoch": 1544} {"train_loss": -40.39860534667969, "global_step": 186936, "epoch": 1544} {"train_loss": -39.954166412353516, "global_step": 186937, "epoch": 1544} {"train_loss": -39.883480072021484, "global_step": 186938, "epoch": 1544} {"train_loss": -41.228790283203125, "global_step": 186939, "epoch": 1544} {"train_loss": -41.30867385864258, "global_step": 186940, "epoch": 1544} {"train_loss": -39.32720184326172, "global_step": 186941, "epoch": 1544} {"train_loss": -39.36262893676758, "global_step": 186942, "epoch": 1544} {"train_loss": -39.15230941772461, "global_step": 186943, "epoch": 1544} {"train_loss": -40.74628202580223, "global_step": 186944, "epoch": 1544, "val_loss": 2650745.75} {"train_loss": -40.38597869873047, "global_step": 186945, "epoch": 1545} {"train_loss": -40.27949142456055, "global_step": 186946, "epoch": 1545} {"train_loss": -39.504920959472656, "global_step": 186947, "epoch": 1545} {"train_loss": -39.005714416503906, "global_step": 186948, "epoch": 1545} {"train_loss": -40.49459457397461, "global_step": 186949, "epoch": 1545} {"train_loss": -39.84942626953125, "global_step": 186950, "epoch": 1545} {"train_loss": -39.536983489990234, "global_step": 186951, "epoch": 1545} {"train_loss": -39.69854736328125, "global_step": 186952, "epoch": 1545} {"train_loss": -40.826072692871094, "global_step": 186953, "epoch": 1545} {"train_loss": -39.869388580322266, "global_step": 186954, "epoch": 1545} {"train_loss": -39.01428985595703, "global_step": 186955, "epoch": 1545} {"train_loss": -39.813819885253906, "global_step": 186956, "epoch": 1545} {"train_loss": -41.257564544677734, "global_step": 186957, "epoch": 1545} {"train_loss": -41.42678451538086, "global_step": 186958, "epoch": 1545} {"train_loss": -40.744606018066406, "global_step": 186959, "epoch": 1545} {"train_loss": -40.378883361816406, "global_step": 186960, "epoch": 1545} {"train_loss": -40.8395881652832, "global_step": 186961, "epoch": 1545} {"train_loss": -39.98628616333008, "global_step": 186962, "epoch": 1545} {"train_loss": -40.0242805480957, "global_step": 186963, "epoch": 1545} {"train_loss": -41.223140716552734, "global_step": 186964, "epoch": 1545} {"train_loss": -40.48723220825195, "global_step": 186965, "epoch": 1545} {"train_loss": -41.194183349609375, "global_step": 186966, "epoch": 1545} {"train_loss": -40.52138900756836, "global_step": 186967, "epoch": 1545} {"train_loss": -40.4705696105957, "global_step": 186968, "epoch": 1545} {"train_loss": -40.4592399597168, "global_step": 186969, "epoch": 1545} {"train_loss": -41.59572982788086, "global_step": 186970, "epoch": 1545} {"train_loss": -40.35363006591797, "global_step": 186971, "epoch": 1545} {"train_loss": -41.05255126953125, "global_step": 186972, "epoch": 1545} {"train_loss": -40.270809173583984, "global_step": 186973, "epoch": 1545} {"train_loss": -39.89044189453125, "global_step": 186974, "epoch": 1545} {"train_loss": -39.00643539428711, "global_step": 186975, "epoch": 1545} {"train_loss": -39.56861114501953, "global_step": 186976, "epoch": 1545} {"train_loss": -36.55786895751953, "global_step": 186977, "epoch": 1545} {"train_loss": -40.93998336791992, "global_step": 186978, "epoch": 1545} {"train_loss": -38.6947021484375, "global_step": 186979, "epoch": 1545} {"train_loss": -40.79535675048828, "global_step": 186980, "epoch": 1545} {"train_loss": -39.60471725463867, "global_step": 186981, "epoch": 1545} {"train_loss": -39.47930908203125, "global_step": 186982, "epoch": 1545} {"train_loss": -40.24497604370117, "global_step": 186983, "epoch": 1545} {"train_loss": -40.86263656616211, "global_step": 186984, "epoch": 1545} {"train_loss": -41.21759796142578, "global_step": 186985, "epoch": 1545} {"train_loss": -40.09334945678711, "global_step": 186986, "epoch": 1545} {"train_loss": -41.473567962646484, "global_step": 186987, "epoch": 1545} {"train_loss": -40.22256088256836, "global_step": 186988, "epoch": 1545} {"train_loss": -41.40974426269531, "global_step": 186989, "epoch": 1545} {"train_loss": -39.64877700805664, "global_step": 186990, "epoch": 1545} {"train_loss": -40.40290451049805, "global_step": 186991, "epoch": 1545} {"train_loss": -41.20444107055664, "global_step": 186992, "epoch": 1545} {"train_loss": -34.301025390625, "global_step": 186993, "epoch": 1545} {"train_loss": -35.83391189575195, "global_step": 186994, "epoch": 1545} {"train_loss": -40.7916259765625, "global_step": 186995, "epoch": 1545} {"train_loss": -40.50983810424805, "global_step": 186996, "epoch": 1545} {"train_loss": -39.95026779174805, "global_step": 186997, "epoch": 1545} {"train_loss": -41.35427474975586, "global_step": 186998, "epoch": 1545} {"train_loss": -40.97309112548828, "global_step": 186999, "epoch": 1545} {"train_loss": -41.08590316772461, "global_step": 187000, "epoch": 1545} {"train_loss": -41.0041389465332, "global_step": 187001, "epoch": 1545} {"train_loss": -41.047462463378906, "global_step": 187002, "epoch": 1545} {"train_loss": -41.74330520629883, "global_step": 187003, "epoch": 1545} {"train_loss": -37.83909606933594, "global_step": 187004, "epoch": 1545} {"train_loss": -38.91832733154297, "global_step": 187005, "epoch": 1545} {"train_loss": -40.93525314331055, "global_step": 187006, "epoch": 1545} {"train_loss": -41.10895538330078, "global_step": 187007, "epoch": 1545} {"train_loss": -41.319454193115234, "global_step": 187008, "epoch": 1545} {"train_loss": -41.075714111328125, "global_step": 187009, "epoch": 1545} {"train_loss": -41.06747817993164, "global_step": 187010, "epoch": 1545} {"train_loss": -41.807472229003906, "global_step": 187011, "epoch": 1545} {"train_loss": -41.39479064941406, "global_step": 187012, "epoch": 1545} {"train_loss": -41.829689025878906, "global_step": 187013, "epoch": 1545} {"train_loss": -41.57616424560547, "global_step": 187014, "epoch": 1545} {"train_loss": -41.88396072387695, "global_step": 187015, "epoch": 1545} {"train_loss": -41.51556396484375, "global_step": 187016, "epoch": 1545} {"train_loss": -42.24488067626953, "global_step": 187017, "epoch": 1545} {"train_loss": -41.5798225402832, "global_step": 187018, "epoch": 1545} {"train_loss": -40.90633773803711, "global_step": 187019, "epoch": 1545} {"train_loss": -41.67955017089844, "global_step": 187020, "epoch": 1545} {"train_loss": -41.88069152832031, "global_step": 187021, "epoch": 1545} {"train_loss": -41.72597122192383, "global_step": 187022, "epoch": 1545} {"train_loss": -42.08242416381836, "global_step": 187023, "epoch": 1545} {"train_loss": -41.46778106689453, "global_step": 187024, "epoch": 1545} {"train_loss": -41.029510498046875, "global_step": 187025, "epoch": 1545} {"train_loss": -40.60166931152344, "global_step": 187026, "epoch": 1545} {"train_loss": -42.23262405395508, "global_step": 187027, "epoch": 1545} {"train_loss": -40.85301208496094, "global_step": 187028, "epoch": 1545} {"train_loss": -41.01223373413086, "global_step": 187029, "epoch": 1545} {"train_loss": -41.28228759765625, "global_step": 187030, "epoch": 1545} {"train_loss": -40.800167083740234, "global_step": 187031, "epoch": 1545} {"train_loss": -38.66744613647461, "global_step": 187032, "epoch": 1545} {"train_loss": -39.19198226928711, "global_step": 187033, "epoch": 1545} {"train_loss": -41.82332992553711, "global_step": 187034, "epoch": 1545} {"train_loss": -38.2437744140625, "global_step": 187035, "epoch": 1545} {"train_loss": -38.687538146972656, "global_step": 187036, "epoch": 1545} {"train_loss": -38.215187072753906, "global_step": 187037, "epoch": 1545} {"train_loss": -41.07009506225586, "global_step": 187038, "epoch": 1545} {"train_loss": -40.36344528198242, "global_step": 187039, "epoch": 1545} {"train_loss": -39.8298454284668, "global_step": 187040, "epoch": 1545} {"train_loss": -39.89352035522461, "global_step": 187041, "epoch": 1545} {"train_loss": -39.98093032836914, "global_step": 187042, "epoch": 1545} {"train_loss": -40.95429229736328, "global_step": 187043, "epoch": 1545} {"train_loss": -37.57669448852539, "global_step": 187044, "epoch": 1545} {"train_loss": -41.39155960083008, "global_step": 187045, "epoch": 1545} {"train_loss": -40.71312713623047, "global_step": 187046, "epoch": 1545} {"train_loss": -38.16312789916992, "global_step": 187047, "epoch": 1545} {"train_loss": -40.14449691772461, "global_step": 187048, "epoch": 1545} {"train_loss": -37.10065460205078, "global_step": 187049, "epoch": 1545} {"train_loss": -40.47140884399414, "global_step": 187050, "epoch": 1545} {"train_loss": -38.71107864379883, "global_step": 187051, "epoch": 1545} {"train_loss": -39.43534469604492, "global_step": 187052, "epoch": 1545} {"train_loss": -38.65874481201172, "global_step": 187053, "epoch": 1545} {"train_loss": -36.5536003112793, "global_step": 187054, "epoch": 1545} {"train_loss": -36.82827377319336, "global_step": 187055, "epoch": 1545} {"train_loss": -40.582244873046875, "global_step": 187056, "epoch": 1545} {"train_loss": -37.414306640625, "global_step": 187057, "epoch": 1545} {"train_loss": -39.63543701171875, "global_step": 187058, "epoch": 1545} {"train_loss": -39.82575607299805, "global_step": 187059, "epoch": 1545} {"train_loss": -40.67194366455078, "global_step": 187060, "epoch": 1545} {"train_loss": -37.27471923828125, "global_step": 187061, "epoch": 1545} {"train_loss": -39.54853057861328, "global_step": 187062, "epoch": 1545} {"train_loss": -36.48201370239258, "global_step": 187063, "epoch": 1545} {"train_loss": -36.39259719848633, "global_step": 187064, "epoch": 1545} {"train_loss": -40.10691590742631, "global_step": 187065, "epoch": 1545, "val_loss": 3556063.0} {"train_loss": -39.544090270996094, "global_step": 187066, "epoch": 1546} {"train_loss": -40.3250846862793, "global_step": 187067, "epoch": 1546} {"train_loss": -39.100990295410156, "global_step": 187068, "epoch": 1546} {"train_loss": -40.406288146972656, "global_step": 187069, "epoch": 1546} {"train_loss": -38.17192459106445, "global_step": 187070, "epoch": 1546} {"train_loss": -31.42597007751465, "global_step": 187071, "epoch": 1546} {"train_loss": -37.723079681396484, "global_step": 187072, "epoch": 1546} {"train_loss": -36.979774475097656, "global_step": 187073, "epoch": 1546} {"train_loss": -37.33893966674805, "global_step": 187074, "epoch": 1546} {"train_loss": -27.753942489624023, "global_step": 187075, "epoch": 1546} {"train_loss": -33.79661178588867, "global_step": 187076, "epoch": 1546} {"train_loss": -34.837677001953125, "global_step": 187077, "epoch": 1546} {"train_loss": -36.506351470947266, "global_step": 187078, "epoch": 1546} {"train_loss": -27.675750732421875, "global_step": 187079, "epoch": 1546} {"train_loss": -33.95752716064453, "global_step": 187080, "epoch": 1546} {"train_loss": -37.1200065612793, "global_step": 187081, "epoch": 1546} {"train_loss": -38.33675765991211, "global_step": 187082, "epoch": 1546} {"train_loss": -38.22793197631836, "global_step": 187083, "epoch": 1546} {"train_loss": -37.807613372802734, "global_step": 187084, "epoch": 1546} {"train_loss": -38.73744583129883, "global_step": 187085, "epoch": 1546} {"train_loss": -35.3375358581543, "global_step": 187086, "epoch": 1546} {"train_loss": -32.87852096557617, "global_step": 187087, "epoch": 1546} {"train_loss": -36.83810043334961, "global_step": 187088, "epoch": 1546} {"train_loss": -38.46099090576172, "global_step": 187089, "epoch": 1546} {"train_loss": -35.64573287963867, "global_step": 187090, "epoch": 1546} {"train_loss": -38.09542465209961, "global_step": 187091, "epoch": 1546} {"train_loss": -38.5642204284668, "global_step": 187092, "epoch": 1546} {"train_loss": -37.93374252319336, "global_step": 187093, "epoch": 1546} {"train_loss": -36.323699951171875, "global_step": 187094, "epoch": 1546} {"train_loss": -38.0727653503418, "global_step": 187095, "epoch": 1546} {"train_loss": -35.19935989379883, "global_step": 187096, "epoch": 1546} {"train_loss": -35.40220260620117, "global_step": 187097, "epoch": 1546} {"train_loss": -36.938541412353516, "global_step": 187098, "epoch": 1546} {"train_loss": -38.77797317504883, "global_step": 187099, "epoch": 1546} {"train_loss": -39.11442184448242, "global_step": 187100, "epoch": 1546} {"train_loss": -38.59084701538086, "global_step": 187101, "epoch": 1546} {"train_loss": -35.37141799926758, "global_step": 187102, "epoch": 1546} {"train_loss": -36.69786834716797, "global_step": 187103, "epoch": 1546} {"train_loss": -38.83622360229492, "global_step": 187104, "epoch": 1546} {"train_loss": -38.80458450317383, "global_step": 187105, "epoch": 1546} {"train_loss": -38.4199333190918, "global_step": 187106, "epoch": 1546} {"train_loss": -38.96334457397461, "global_step": 187107, "epoch": 1546} {"train_loss": -39.63163375854492, "global_step": 187108, "epoch": 1546} {"train_loss": -37.502723693847656, "global_step": 187109, "epoch": 1546} {"train_loss": -38.815364837646484, "global_step": 187110, "epoch": 1546} {"train_loss": -39.570098876953125, "global_step": 187111, "epoch": 1546} {"train_loss": -39.4810676574707, "global_step": 187112, "epoch": 1546} {"train_loss": -39.34721755981445, "global_step": 187113, "epoch": 1546} {"train_loss": -39.191505432128906, "global_step": 187114, "epoch": 1546} {"train_loss": -38.844520568847656, "global_step": 187115, "epoch": 1546} {"train_loss": -39.5413932800293, "global_step": 187116, "epoch": 1546} {"train_loss": -39.17246627807617, "global_step": 187117, "epoch": 1546} {"train_loss": -39.29946517944336, "global_step": 187118, "epoch": 1546} {"train_loss": -39.63371658325195, "global_step": 187119, "epoch": 1546} {"train_loss": -39.73995590209961, "global_step": 187120, "epoch": 1546} {"train_loss": -40.11613082885742, "global_step": 187121, "epoch": 1546} {"train_loss": -39.83219528198242, "global_step": 187122, "epoch": 1546} {"train_loss": -40.25875473022461, "global_step": 187123, "epoch": 1546} {"train_loss": -39.53937911987305, "global_step": 187124, "epoch": 1546} {"train_loss": -40.28004837036133, "global_step": 187125, "epoch": 1546} {"train_loss": -39.67710494995117, "global_step": 187126, "epoch": 1546} {"train_loss": -40.101009368896484, "global_step": 187127, "epoch": 1546} {"train_loss": -39.58150100708008, "global_step": 187128, "epoch": 1546} {"train_loss": -40.111358642578125, "global_step": 187129, "epoch": 1546} {"train_loss": -39.761329650878906, "global_step": 187130, "epoch": 1546} {"train_loss": -39.45656204223633, "global_step": 187131, "epoch": 1546} {"train_loss": -40.46717071533203, "global_step": 187132, "epoch": 1546} {"train_loss": -40.15543746948242, "global_step": 187133, "epoch": 1546} {"train_loss": -40.65505599975586, "global_step": 187134, "epoch": 1546} {"train_loss": -40.328853607177734, "global_step": 187135, "epoch": 1546} {"train_loss": -40.58717727661133, "global_step": 187136, "epoch": 1546} {"train_loss": -40.15545654296875, "global_step": 187137, "epoch": 1546} {"train_loss": -40.79091262817383, "global_step": 187138, "epoch": 1546} {"train_loss": -39.50686264038086, "global_step": 187139, "epoch": 1546} {"train_loss": -40.45768737792969, "global_step": 187140, "epoch": 1546} {"train_loss": -40.69338607788086, "global_step": 187141, "epoch": 1546} {"train_loss": -40.788368225097656, "global_step": 187142, "epoch": 1546} {"train_loss": -40.38984298706055, "global_step": 187143, "epoch": 1546} {"train_loss": -40.71531295776367, "global_step": 187144, "epoch": 1546} {"train_loss": -40.63749313354492, "global_step": 187145, "epoch": 1546} {"train_loss": -40.52363204956055, "global_step": 187146, "epoch": 1546} {"train_loss": -41.21559143066406, "global_step": 187147, "epoch": 1546} {"train_loss": -40.22401809692383, "global_step": 187148, "epoch": 1546} {"train_loss": -40.89655303955078, "global_step": 187149, "epoch": 1546} {"train_loss": -41.1493034362793, "global_step": 187150, "epoch": 1546} {"train_loss": -41.02642059326172, "global_step": 187151, "epoch": 1546} {"train_loss": -41.00920104980469, "global_step": 187152, "epoch": 1546} {"train_loss": -41.44917678833008, "global_step": 187153, "epoch": 1546} {"train_loss": -41.02602767944336, "global_step": 187154, "epoch": 1546} {"train_loss": -41.187896728515625, "global_step": 187155, "epoch": 1546} {"train_loss": -40.820701599121094, "global_step": 187156, "epoch": 1546} {"train_loss": -41.108829498291016, "global_step": 187157, "epoch": 1546} {"train_loss": -41.257972717285156, "global_step": 187158, "epoch": 1546} {"train_loss": -41.075191497802734, "global_step": 187159, "epoch": 1546} {"train_loss": -41.45301055908203, "global_step": 187160, "epoch": 1546} {"train_loss": -41.177040100097656, "global_step": 187161, "epoch": 1546} {"train_loss": -41.18406677246094, "global_step": 187162, "epoch": 1546} {"train_loss": -41.44057846069336, "global_step": 187163, "epoch": 1546} {"train_loss": -40.806819915771484, "global_step": 187164, "epoch": 1546} {"train_loss": -41.451271057128906, "global_step": 187165, "epoch": 1546} {"train_loss": -41.252891540527344, "global_step": 187166, "epoch": 1546} {"train_loss": -41.37940216064453, "global_step": 187167, "epoch": 1546} {"train_loss": -41.72980880737305, "global_step": 187168, "epoch": 1546} {"train_loss": -41.02614212036133, "global_step": 187169, "epoch": 1546} {"train_loss": -41.14128494262695, "global_step": 187170, "epoch": 1546} {"train_loss": -41.32075119018555, "global_step": 187171, "epoch": 1546} {"train_loss": -41.772518157958984, "global_step": 187172, "epoch": 1546} {"train_loss": -41.439205169677734, "global_step": 187173, "epoch": 1546} {"train_loss": -41.12100601196289, "global_step": 187174, "epoch": 1546} {"train_loss": -40.2680778503418, "global_step": 187175, "epoch": 1546} {"train_loss": -41.16944122314453, "global_step": 187176, "epoch": 1546} {"train_loss": -41.56174850463867, "global_step": 187177, "epoch": 1546} {"train_loss": -41.09286117553711, "global_step": 187178, "epoch": 1546} {"train_loss": -41.35150909423828, "global_step": 187179, "epoch": 1546} {"train_loss": -41.16459274291992, "global_step": 187180, "epoch": 1546} {"train_loss": -40.8712272644043, "global_step": 187181, "epoch": 1546} {"train_loss": -39.19309997558594, "global_step": 187182, "epoch": 1546} {"train_loss": -35.414058685302734, "global_step": 187183, "epoch": 1546} {"train_loss": -33.89835739135742, "global_step": 187184, "epoch": 1546} {"train_loss": -35.5906982421875, "global_step": 187185, "epoch": 1546} {"train_loss": -39.02324370707362, "global_step": 187186, "epoch": 1546, "val_loss": 2541650.25} {"train_loss": -37.10326385498047, "global_step": 187187, "epoch": 1547} {"train_loss": -31.63153076171875, "global_step": 187188, "epoch": 1547} {"train_loss": -36.41157150268555, "global_step": 187189, "epoch": 1547} {"train_loss": -36.65434646606445, "global_step": 187190, "epoch": 1547} {"train_loss": -36.68718338012695, "global_step": 187191, "epoch": 1547} {"train_loss": -32.79439926147461, "global_step": 187192, "epoch": 1547} {"train_loss": -38.32527542114258, "global_step": 187193, "epoch": 1547} {"train_loss": -35.903106689453125, "global_step": 187194, "epoch": 1547} {"train_loss": -38.82453918457031, "global_step": 187195, "epoch": 1547} {"train_loss": -36.263763427734375, "global_step": 187196, "epoch": 1547} {"train_loss": -38.217628479003906, "global_step": 187197, "epoch": 1547} {"train_loss": -39.23090744018555, "global_step": 187198, "epoch": 1547} {"train_loss": -38.64468002319336, "global_step": 187199, "epoch": 1547} {"train_loss": -37.68034744262695, "global_step": 187200, "epoch": 1547} {"train_loss": -40.45135498046875, "global_step": 187201, "epoch": 1547} {"train_loss": -37.17726516723633, "global_step": 187202, "epoch": 1547} {"train_loss": -39.6937141418457, "global_step": 187203, "epoch": 1547} {"train_loss": -40.01705551147461, "global_step": 187204, "epoch": 1547} {"train_loss": -38.075531005859375, "global_step": 187205, "epoch": 1547} {"train_loss": -39.134098052978516, "global_step": 187206, "epoch": 1547} {"train_loss": -40.600868225097656, "global_step": 187207, "epoch": 1547} {"train_loss": -38.6656494140625, "global_step": 187208, "epoch": 1547} {"train_loss": -38.777626037597656, "global_step": 187209, "epoch": 1547} {"train_loss": -40.133331298828125, "global_step": 187210, "epoch": 1547} {"train_loss": -38.37201690673828, "global_step": 187211, "epoch": 1547} {"train_loss": -40.58112716674805, "global_step": 187212, "epoch": 1547} {"train_loss": -38.90742111206055, "global_step": 187213, "epoch": 1547} {"train_loss": -39.88412094116211, "global_step": 187214, "epoch": 1547} {"train_loss": -40.5125732421875, "global_step": 187215, "epoch": 1547} {"train_loss": -39.64113998413086, "global_step": 187216, "epoch": 1547} {"train_loss": -40.238155364990234, "global_step": 187217, "epoch": 1547} {"train_loss": -40.36776351928711, "global_step": 187218, "epoch": 1547} {"train_loss": -40.50613021850586, "global_step": 187219, "epoch": 1547} {"train_loss": -39.991973876953125, "global_step": 187220, "epoch": 1547} {"train_loss": -40.34886169433594, "global_step": 187221, "epoch": 1547} {"train_loss": -40.37761306762695, "global_step": 187222, "epoch": 1547} {"train_loss": -40.56510925292969, "global_step": 187223, "epoch": 1547} {"train_loss": -41.07912063598633, "global_step": 187224, "epoch": 1547} {"train_loss": -40.68216323852539, "global_step": 187225, "epoch": 1547} {"train_loss": -40.89182662963867, "global_step": 187226, "epoch": 1547} {"train_loss": -41.00732421875, "global_step": 187227, "epoch": 1547} {"train_loss": -40.76259231567383, "global_step": 187228, "epoch": 1547} {"train_loss": -41.063087463378906, "global_step": 187229, "epoch": 1547} {"train_loss": -41.24831008911133, "global_step": 187230, "epoch": 1547} {"train_loss": -41.04368209838867, "global_step": 187231, "epoch": 1547} {"train_loss": -41.26255416870117, "global_step": 187232, "epoch": 1547} {"train_loss": -41.43534469604492, "global_step": 187233, "epoch": 1547} {"train_loss": -41.0738410949707, "global_step": 187234, "epoch": 1547} {"train_loss": -41.32172775268555, "global_step": 187235, "epoch": 1547} {"train_loss": -40.93018341064453, "global_step": 187236, "epoch": 1547} {"train_loss": -41.04339599609375, "global_step": 187237, "epoch": 1547} {"train_loss": -41.10842514038086, "global_step": 187238, "epoch": 1547} {"train_loss": -40.986942291259766, "global_step": 187239, "epoch": 1547} {"train_loss": -41.35833740234375, "global_step": 187240, "epoch": 1547} {"train_loss": -41.463836669921875, "global_step": 187241, "epoch": 1547} {"train_loss": -41.27265548706055, "global_step": 187242, "epoch": 1547} {"train_loss": -41.04823303222656, "global_step": 187243, "epoch": 1547} {"train_loss": -41.70935821533203, "global_step": 187244, "epoch": 1547} {"train_loss": -41.612056732177734, "global_step": 187245, "epoch": 1547} {"train_loss": -41.123355865478516, "global_step": 187246, "epoch": 1547} {"train_loss": -41.64244842529297, "global_step": 187247, "epoch": 1547} {"train_loss": -41.65545654296875, "global_step": 187248, "epoch": 1547} {"train_loss": -41.697261810302734, "global_step": 187249, "epoch": 1547} {"train_loss": -41.66184997558594, "global_step": 187250, "epoch": 1547} {"train_loss": -41.494266510009766, "global_step": 187251, "epoch": 1547} {"train_loss": -41.4701042175293, "global_step": 187252, "epoch": 1547} {"train_loss": -41.499053955078125, "global_step": 187253, "epoch": 1547} {"train_loss": -41.73627853393555, "global_step": 187254, "epoch": 1547} {"train_loss": -41.6433219909668, "global_step": 187255, "epoch": 1547} {"train_loss": -42.19086837768555, "global_step": 187256, "epoch": 1547} {"train_loss": -41.329689025878906, "global_step": 187257, "epoch": 1547} {"train_loss": -42.04639434814453, "global_step": 187258, "epoch": 1547} {"train_loss": -41.57289505004883, "global_step": 187259, "epoch": 1547} {"train_loss": -40.125694274902344, "global_step": 187260, "epoch": 1547} {"train_loss": -41.24181365966797, "global_step": 187261, "epoch": 1547} {"train_loss": -41.814083099365234, "global_step": 187262, "epoch": 1547} {"train_loss": -41.8514518737793, "global_step": 187263, "epoch": 1547} {"train_loss": -40.84318161010742, "global_step": 187264, "epoch": 1547} {"train_loss": -39.55620193481445, "global_step": 187265, "epoch": 1547} {"train_loss": -41.45833969116211, "global_step": 187266, "epoch": 1547} {"train_loss": -42.02728271484375, "global_step": 187267, "epoch": 1547} {"train_loss": -41.17786407470703, "global_step": 187268, "epoch": 1547} {"train_loss": -40.78580856323242, "global_step": 187269, "epoch": 1547} {"train_loss": -41.67229080200195, "global_step": 187270, "epoch": 1547} {"train_loss": -41.92414474487305, "global_step": 187271, "epoch": 1547} {"train_loss": -41.330177307128906, "global_step": 187272, "epoch": 1547} {"train_loss": -38.721527099609375, "global_step": 187273, "epoch": 1547} {"train_loss": -38.16438674926758, "global_step": 187274, "epoch": 1547} {"train_loss": -41.469539642333984, "global_step": 187275, "epoch": 1547} {"train_loss": -39.368080139160156, "global_step": 187276, "epoch": 1547} {"train_loss": -39.974178314208984, "global_step": 187277, "epoch": 1547} {"train_loss": -41.70545196533203, "global_step": 187278, "epoch": 1547} {"train_loss": -40.86166000366211, "global_step": 187279, "epoch": 1547} {"train_loss": -39.70508575439453, "global_step": 187280, "epoch": 1547} {"train_loss": -40.38679885864258, "global_step": 187281, "epoch": 1547} {"train_loss": -40.975704193115234, "global_step": 187282, "epoch": 1547} {"train_loss": -40.70408248901367, "global_step": 187283, "epoch": 1547} {"train_loss": -40.27077865600586, "global_step": 187284, "epoch": 1547} {"train_loss": -41.833621978759766, "global_step": 187285, "epoch": 1547} {"train_loss": -41.08065414428711, "global_step": 187286, "epoch": 1547} {"train_loss": -41.171173095703125, "global_step": 187287, "epoch": 1547} {"train_loss": -41.7989501953125, "global_step": 187288, "epoch": 1547} {"train_loss": -38.5485954284668, "global_step": 187289, "epoch": 1547} {"train_loss": -39.076271057128906, "global_step": 187290, "epoch": 1547} {"train_loss": -41.83445358276367, "global_step": 187291, "epoch": 1547} {"train_loss": -39.94586944580078, "global_step": 187292, "epoch": 1547} {"train_loss": -40.5831413269043, "global_step": 187293, "epoch": 1547} {"train_loss": -41.42264938354492, "global_step": 187294, "epoch": 1547} {"train_loss": -40.862152099609375, "global_step": 187295, "epoch": 1547} {"train_loss": -39.96223068237305, "global_step": 187296, "epoch": 1547} {"train_loss": -40.510372161865234, "global_step": 187297, "epoch": 1547} {"train_loss": -41.7441291809082, "global_step": 187298, "epoch": 1547} {"train_loss": -41.218109130859375, "global_step": 187299, "epoch": 1547} {"train_loss": -41.01947784423828, "global_step": 187300, "epoch": 1547} {"train_loss": -41.89353561401367, "global_step": 187301, "epoch": 1547} {"train_loss": -40.908050537109375, "global_step": 187302, "epoch": 1547} {"train_loss": -40.58254623413086, "global_step": 187303, "epoch": 1547} {"train_loss": -41.5569953918457, "global_step": 187304, "epoch": 1547} {"train_loss": -41.44313430786133, "global_step": 187305, "epoch": 1547} {"train_loss": -39.464962005615234, "global_step": 187306, "epoch": 1547} {"train_loss": -40.26444168721349, "global_step": 187307, "epoch": 1547, "val_loss": 2547528.0} {"train_loss": -40.80452346801758, "global_step": 187308, "epoch": 1548} {"train_loss": -40.4910774230957, "global_step": 187309, "epoch": 1548} {"train_loss": -40.857330322265625, "global_step": 187310, "epoch": 1548} {"train_loss": -41.074562072753906, "global_step": 187311, "epoch": 1548} {"train_loss": -39.15839767456055, "global_step": 187312, "epoch": 1548} {"train_loss": -39.019927978515625, "global_step": 187313, "epoch": 1548} {"train_loss": -37.65814208984375, "global_step": 187314, "epoch": 1548} {"train_loss": -39.25630569458008, "global_step": 187315, "epoch": 1548} {"train_loss": -40.405208587646484, "global_step": 187316, "epoch": 1548} {"train_loss": -40.58560562133789, "global_step": 187317, "epoch": 1548} {"train_loss": -40.511043548583984, "global_step": 187318, "epoch": 1548} {"train_loss": -40.68292236328125, "global_step": 187319, "epoch": 1548} {"train_loss": -39.88295364379883, "global_step": 187320, "epoch": 1548} {"train_loss": -41.08134460449219, "global_step": 187321, "epoch": 1548} {"train_loss": -41.212581634521484, "global_step": 187322, "epoch": 1548} {"train_loss": -41.01273727416992, "global_step": 187323, "epoch": 1548} {"train_loss": -41.416595458984375, "global_step": 187324, "epoch": 1548} {"train_loss": -40.88050842285156, "global_step": 187325, "epoch": 1548} {"train_loss": -40.65665054321289, "global_step": 187326, "epoch": 1548} {"train_loss": -41.09650802612305, "global_step": 187327, "epoch": 1548} {"train_loss": -41.550289154052734, "global_step": 187328, "epoch": 1548} {"train_loss": -40.52037048339844, "global_step": 187329, "epoch": 1548} {"train_loss": -40.03989028930664, "global_step": 187330, "epoch": 1548} {"train_loss": -41.312591552734375, "global_step": 187331, "epoch": 1548} {"train_loss": -41.251155853271484, "global_step": 187332, "epoch": 1548} {"train_loss": -40.88766860961914, "global_step": 187333, "epoch": 1548} {"train_loss": -40.35154342651367, "global_step": 187334, "epoch": 1548} {"train_loss": -40.85770034790039, "global_step": 187335, "epoch": 1548} {"train_loss": -41.49018096923828, "global_step": 187336, "epoch": 1548} {"train_loss": -41.719757080078125, "global_step": 187337, "epoch": 1548} {"train_loss": -41.16390609741211, "global_step": 187338, "epoch": 1548} {"train_loss": -41.4904670715332, "global_step": 187339, "epoch": 1548} {"train_loss": -40.81074905395508, "global_step": 187340, "epoch": 1548} {"train_loss": -40.58236312866211, "global_step": 187341, "epoch": 1548} {"train_loss": -41.49021530151367, "global_step": 187342, "epoch": 1548} {"train_loss": -41.06855392456055, "global_step": 187343, "epoch": 1548} {"train_loss": -39.45082473754883, "global_step": 187344, "epoch": 1548} {"train_loss": -40.47093200683594, "global_step": 187345, "epoch": 1548} {"train_loss": -39.5833854675293, "global_step": 187346, "epoch": 1548} {"train_loss": -39.96340560913086, "global_step": 187347, "epoch": 1548} {"train_loss": -41.59475326538086, "global_step": 187348, "epoch": 1548} {"train_loss": -40.320953369140625, "global_step": 187349, "epoch": 1548} {"train_loss": -40.216468811035156, "global_step": 187350, "epoch": 1548} {"train_loss": -41.02373123168945, "global_step": 187351, "epoch": 1548} {"train_loss": -41.14821243286133, "global_step": 187352, "epoch": 1548} {"train_loss": -41.072200775146484, "global_step": 187353, "epoch": 1548} {"train_loss": -41.3568000793457, "global_step": 187354, "epoch": 1548} {"train_loss": -41.50222396850586, "global_step": 187355, "epoch": 1548} {"train_loss": -41.45981979370117, "global_step": 187356, "epoch": 1548} {"train_loss": -42.07305145263672, "global_step": 187357, "epoch": 1548} {"train_loss": -41.4185905456543, "global_step": 187358, "epoch": 1548} {"train_loss": -41.06088638305664, "global_step": 187359, "epoch": 1548} {"train_loss": -40.583526611328125, "global_step": 187360, "epoch": 1548} {"train_loss": -41.598297119140625, "global_step": 187361, "epoch": 1548} {"train_loss": -41.50814437866211, "global_step": 187362, "epoch": 1548} {"train_loss": -41.6779899597168, "global_step": 187363, "epoch": 1548} {"train_loss": -41.708614349365234, "global_step": 187364, "epoch": 1548} {"train_loss": -40.472530364990234, "global_step": 187365, "epoch": 1548} {"train_loss": -39.94993209838867, "global_step": 187366, "epoch": 1548} {"train_loss": -41.80955123901367, "global_step": 187367, "epoch": 1548} {"train_loss": -41.12724685668945, "global_step": 187368, "epoch": 1548} {"train_loss": -41.77998352050781, "global_step": 187369, "epoch": 1548} {"train_loss": -41.76930618286133, "global_step": 187370, "epoch": 1548} {"train_loss": -40.370731353759766, "global_step": 187371, "epoch": 1548} {"train_loss": -41.991310119628906, "global_step": 187372, "epoch": 1548} {"train_loss": -41.027095794677734, "global_step": 187373, "epoch": 1548} {"train_loss": -41.6864128112793, "global_step": 187374, "epoch": 1548} {"train_loss": -41.5755500793457, "global_step": 187375, "epoch": 1548} {"train_loss": -40.93830490112305, "global_step": 187376, "epoch": 1548} {"train_loss": -41.140037536621094, "global_step": 187377, "epoch": 1548} {"train_loss": -42.170928955078125, "global_step": 187378, "epoch": 1548} {"train_loss": -40.42536544799805, "global_step": 187379, "epoch": 1548} {"train_loss": -41.13747024536133, "global_step": 187380, "epoch": 1548} {"train_loss": -41.61484909057617, "global_step": 187381, "epoch": 1548} {"train_loss": -41.63290023803711, "global_step": 187382, "epoch": 1548} {"train_loss": -40.91423416137695, "global_step": 187383, "epoch": 1548} {"train_loss": -41.394535064697266, "global_step": 187384, "epoch": 1548} {"train_loss": -41.215484619140625, "global_step": 187385, "epoch": 1548} {"train_loss": -40.770668029785156, "global_step": 187386, "epoch": 1548} {"train_loss": -41.123321533203125, "global_step": 187387, "epoch": 1548} {"train_loss": -40.154205322265625, "global_step": 187388, "epoch": 1548} {"train_loss": -41.518280029296875, "global_step": 187389, "epoch": 1548} {"train_loss": -39.71820831298828, "global_step": 187390, "epoch": 1548} {"train_loss": -41.439456939697266, "global_step": 187391, "epoch": 1548} {"train_loss": -40.61960983276367, "global_step": 187392, "epoch": 1548} {"train_loss": -40.92863082885742, "global_step": 187393, "epoch": 1548} {"train_loss": -41.10028839111328, "global_step": 187394, "epoch": 1548} {"train_loss": -39.98759078979492, "global_step": 187395, "epoch": 1548} {"train_loss": -38.76231384277344, "global_step": 187396, "epoch": 1548} {"train_loss": -40.78757858276367, "global_step": 187397, "epoch": 1548} {"train_loss": -41.01777648925781, "global_step": 187398, "epoch": 1548} {"train_loss": -40.18278121948242, "global_step": 187399, "epoch": 1548} {"train_loss": -40.73095703125, "global_step": 187400, "epoch": 1548} {"train_loss": -40.63726806640625, "global_step": 187401, "epoch": 1548} {"train_loss": -39.736175537109375, "global_step": 187402, "epoch": 1548} {"train_loss": -41.082618713378906, "global_step": 187403, "epoch": 1548} {"train_loss": -40.51788330078125, "global_step": 187404, "epoch": 1548} {"train_loss": -40.473724365234375, "global_step": 187405, "epoch": 1548} {"train_loss": -40.30779266357422, "global_step": 187406, "epoch": 1548} {"train_loss": -39.83407211303711, "global_step": 187407, "epoch": 1548} {"train_loss": -39.374019622802734, "global_step": 187408, "epoch": 1548} {"train_loss": -40.17022705078125, "global_step": 187409, "epoch": 1548} {"train_loss": -37.90925216674805, "global_step": 187410, "epoch": 1548} {"train_loss": -40.61357498168945, "global_step": 187411, "epoch": 1548} {"train_loss": -39.047462463378906, "global_step": 187412, "epoch": 1548} {"train_loss": -40.741851806640625, "global_step": 187413, "epoch": 1548} {"train_loss": -39.500038146972656, "global_step": 187414, "epoch": 1548} {"train_loss": -39.669647216796875, "global_step": 187415, "epoch": 1548} {"train_loss": -39.58980178833008, "global_step": 187416, "epoch": 1548} {"train_loss": -40.179805755615234, "global_step": 187417, "epoch": 1548} {"train_loss": -40.3006591796875, "global_step": 187418, "epoch": 1548} {"train_loss": -40.75275421142578, "global_step": 187419, "epoch": 1548} {"train_loss": -41.11674499511719, "global_step": 187420, "epoch": 1548} {"train_loss": -40.51984405517578, "global_step": 187421, "epoch": 1548} {"train_loss": -40.36708450317383, "global_step": 187422, "epoch": 1548} {"train_loss": -39.83598709106445, "global_step": 187423, "epoch": 1548} {"train_loss": -41.71394729614258, "global_step": 187424, "epoch": 1548} {"train_loss": -40.686805725097656, "global_step": 187425, "epoch": 1548} {"train_loss": -41.713661193847656, "global_step": 187426, "epoch": 1548} {"train_loss": -41.45612716674805, "global_step": 187427, "epoch": 1548} {"train_loss": -40.74001482498547, "global_step": 187428, "epoch": 1548, "val_loss": 2597889.25} {"train_loss": -41.36370086669922, "global_step": 187429, "epoch": 1549} {"train_loss": -41.2600212097168, "global_step": 187430, "epoch": 1549} {"train_loss": -41.58229446411133, "global_step": 187431, "epoch": 1549} {"train_loss": -41.56599807739258, "global_step": 187432, "epoch": 1549} {"train_loss": -41.6993522644043, "global_step": 187433, "epoch": 1549} {"train_loss": -41.49067306518555, "global_step": 187434, "epoch": 1549} {"train_loss": -41.79542541503906, "global_step": 187435, "epoch": 1549} {"train_loss": -40.75117111206055, "global_step": 187436, "epoch": 1549} {"train_loss": -41.02192306518555, "global_step": 187437, "epoch": 1549} {"train_loss": -41.022457122802734, "global_step": 187438, "epoch": 1549} {"train_loss": -39.189544677734375, "global_step": 187439, "epoch": 1549} {"train_loss": -38.0671272277832, "global_step": 187440, "epoch": 1549} {"train_loss": -40.933284759521484, "global_step": 187441, "epoch": 1549} {"train_loss": -40.10517501831055, "global_step": 187442, "epoch": 1549} {"train_loss": -38.45832061767578, "global_step": 187443, "epoch": 1549} {"train_loss": -39.317935943603516, "global_step": 187444, "epoch": 1549} {"train_loss": -38.927734375, "global_step": 187445, "epoch": 1549} {"train_loss": -39.718345642089844, "global_step": 187446, "epoch": 1549} {"train_loss": -40.56339645385742, "global_step": 187447, "epoch": 1549} {"train_loss": -40.08131790161133, "global_step": 187448, "epoch": 1549} {"train_loss": -39.768856048583984, "global_step": 187449, "epoch": 1549} {"train_loss": -40.3683967590332, "global_step": 187450, "epoch": 1549} {"train_loss": -40.915802001953125, "global_step": 187451, "epoch": 1549} {"train_loss": -40.571468353271484, "global_step": 187452, "epoch": 1549} {"train_loss": -41.53310012817383, "global_step": 187453, "epoch": 1549} {"train_loss": -40.52970504760742, "global_step": 187454, "epoch": 1549} {"train_loss": -39.13581466674805, "global_step": 187455, "epoch": 1549} {"train_loss": -40.70795822143555, "global_step": 187456, "epoch": 1549} {"train_loss": -41.06989288330078, "global_step": 187457, "epoch": 1549} {"train_loss": -41.244327545166016, "global_step": 187458, "epoch": 1549} {"train_loss": -41.46693420410156, "global_step": 187459, "epoch": 1549} {"train_loss": -40.15930938720703, "global_step": 187460, "epoch": 1549} {"train_loss": -39.58154296875, "global_step": 187461, "epoch": 1549} {"train_loss": -39.75689697265625, "global_step": 187462, "epoch": 1549} {"train_loss": -41.3499641418457, "global_step": 187463, "epoch": 1549} {"train_loss": -39.064510345458984, "global_step": 187464, "epoch": 1549} {"train_loss": -37.80662155151367, "global_step": 187465, "epoch": 1549} {"train_loss": -41.08561325073242, "global_step": 187466, "epoch": 1549} {"train_loss": -38.80793380737305, "global_step": 187467, "epoch": 1549} {"train_loss": -38.708126068115234, "global_step": 187468, "epoch": 1549} {"train_loss": -40.93427658081055, "global_step": 187469, "epoch": 1549} {"train_loss": -39.171875, "global_step": 187470, "epoch": 1549} {"train_loss": -37.45012664794922, "global_step": 187471, "epoch": 1549} {"train_loss": -39.93210983276367, "global_step": 187472, "epoch": 1549} {"train_loss": -39.51504135131836, "global_step": 187473, "epoch": 1549} {"train_loss": -40.382965087890625, "global_step": 187474, "epoch": 1549} {"train_loss": -40.52334213256836, "global_step": 187475, "epoch": 1549} {"train_loss": -39.95459747314453, "global_step": 187476, "epoch": 1549} {"train_loss": -41.21293258666992, "global_step": 187477, "epoch": 1549} {"train_loss": -40.53071975708008, "global_step": 187478, "epoch": 1549} {"train_loss": -40.52558135986328, "global_step": 187479, "epoch": 1549} {"train_loss": -41.163631439208984, "global_step": 187480, "epoch": 1549} {"train_loss": -40.473060607910156, "global_step": 187481, "epoch": 1549} {"train_loss": -40.80216598510742, "global_step": 187482, "epoch": 1549} {"train_loss": -40.25270462036133, "global_step": 187483, "epoch": 1549} {"train_loss": -40.957393646240234, "global_step": 187484, "epoch": 1549} {"train_loss": -41.306739807128906, "global_step": 187485, "epoch": 1549} {"train_loss": -41.67403793334961, "global_step": 187486, "epoch": 1549} {"train_loss": -40.93746566772461, "global_step": 187487, "epoch": 1549} {"train_loss": -39.6416130065918, "global_step": 187488, "epoch": 1549} {"train_loss": -41.55827713012695, "global_step": 187489, "epoch": 1549} {"train_loss": -41.321754455566406, "global_step": 187490, "epoch": 1549} {"train_loss": -41.3890380859375, "global_step": 187491, "epoch": 1549} {"train_loss": -40.02706527709961, "global_step": 187492, "epoch": 1549} {"train_loss": -41.63679885864258, "global_step": 187493, "epoch": 1549} {"train_loss": -40.64997482299805, "global_step": 187494, "epoch": 1549} {"train_loss": -41.1659049987793, "global_step": 187495, "epoch": 1549} {"train_loss": -42.11906814575195, "global_step": 187496, "epoch": 1549} {"train_loss": -41.50844192504883, "global_step": 187497, "epoch": 1549} {"train_loss": -41.238521575927734, "global_step": 187498, "epoch": 1549} {"train_loss": -41.5914421081543, "global_step": 187499, "epoch": 1549} {"train_loss": -41.77851104736328, "global_step": 187500, "epoch": 1549} {"train_loss": -41.76319122314453, "global_step": 187501, "epoch": 1549} {"train_loss": -40.70864486694336, "global_step": 187502, "epoch": 1549} {"train_loss": -40.66549301147461, "global_step": 187503, "epoch": 1549} {"train_loss": -41.702903747558594, "global_step": 187504, "epoch": 1549} {"train_loss": -41.64890670776367, "global_step": 187505, "epoch": 1549} {"train_loss": -41.95622253417969, "global_step": 187506, "epoch": 1549} {"train_loss": -41.77888107299805, "global_step": 187507, "epoch": 1549} {"train_loss": -41.64252853393555, "global_step": 187508, "epoch": 1549} {"train_loss": -41.281715393066406, "global_step": 187509, "epoch": 1549} {"train_loss": -41.034114837646484, "global_step": 187510, "epoch": 1549} {"train_loss": -41.449615478515625, "global_step": 187511, "epoch": 1549} {"train_loss": -41.295257568359375, "global_step": 187512, "epoch": 1549} {"train_loss": -41.33803939819336, "global_step": 187513, "epoch": 1549} {"train_loss": -41.60833740234375, "global_step": 187514, "epoch": 1549} {"train_loss": -41.19956588745117, "global_step": 187515, "epoch": 1549} {"train_loss": -41.745697021484375, "global_step": 187516, "epoch": 1549} {"train_loss": -41.24700927734375, "global_step": 187517, "epoch": 1549} {"train_loss": -40.8740119934082, "global_step": 187518, "epoch": 1549} {"train_loss": -40.90925979614258, "global_step": 187519, "epoch": 1549} {"train_loss": -41.26217269897461, "global_step": 187520, "epoch": 1549} {"train_loss": -41.483882904052734, "global_step": 187521, "epoch": 1549} {"train_loss": -41.85915756225586, "global_step": 187522, "epoch": 1549} {"train_loss": -41.227169036865234, "global_step": 187523, "epoch": 1549} {"train_loss": -42.03240203857422, "global_step": 187524, "epoch": 1549} {"train_loss": -42.26997756958008, "global_step": 187525, "epoch": 1549} {"train_loss": -42.0384521484375, "global_step": 187526, "epoch": 1549} {"train_loss": -41.9640998840332, "global_step": 187527, "epoch": 1549} {"train_loss": -41.54618453979492, "global_step": 187528, "epoch": 1549} {"train_loss": -41.43449401855469, "global_step": 187529, "epoch": 1549} {"train_loss": -41.15102767944336, "global_step": 187530, "epoch": 1549} {"train_loss": -42.19672775268555, "global_step": 187531, "epoch": 1549} {"train_loss": -42.41100311279297, "global_step": 187532, "epoch": 1549} {"train_loss": -41.08156967163086, "global_step": 187533, "epoch": 1549} {"train_loss": -41.56821823120117, "global_step": 187534, "epoch": 1549} {"train_loss": -41.69553756713867, "global_step": 187535, "epoch": 1549} {"train_loss": -40.933467864990234, "global_step": 187536, "epoch": 1549} {"train_loss": -41.502037048339844, "global_step": 187537, "epoch": 1549} {"train_loss": -41.78825759887695, "global_step": 187538, "epoch": 1549} {"train_loss": -41.74215316772461, "global_step": 187539, "epoch": 1549} {"train_loss": -40.7537956237793, "global_step": 187540, "epoch": 1549} {"train_loss": -41.56635284423828, "global_step": 187541, "epoch": 1549} {"train_loss": -42.01515579223633, "global_step": 187542, "epoch": 1549} {"train_loss": -41.66731643676758, "global_step": 187543, "epoch": 1549} {"train_loss": -40.31185531616211, "global_step": 187544, "epoch": 1549} {"train_loss": -40.78688430786133, "global_step": 187545, "epoch": 1549} {"train_loss": -41.48897171020508, "global_step": 187546, "epoch": 1549} {"train_loss": -42.23469161987305, "global_step": 187547, "epoch": 1549} {"train_loss": -41.70597457885742, "global_step": 187548, "epoch": 1549} {"train_loss": -40.90226739300184, "global_step": 187549, "epoch": 1549, "val_loss": 2591385.5} {"train_loss": -40.795448303222656, "global_step": 187550, "epoch": 1550} {"train_loss": -41.015926361083984, "global_step": 187551, "epoch": 1550} {"train_loss": -40.647193908691406, "global_step": 187552, "epoch": 1550} {"train_loss": -40.63344955444336, "global_step": 187553, "epoch": 1550} {"train_loss": -40.43388366699219, "global_step": 187554, "epoch": 1550} {"train_loss": -41.621551513671875, "global_step": 187555, "epoch": 1550} {"train_loss": -40.602272033691406, "global_step": 187556, "epoch": 1550} {"train_loss": -39.72461700439453, "global_step": 187557, "epoch": 1550} {"train_loss": -40.9759635925293, "global_step": 187558, "epoch": 1550} {"train_loss": -40.64230728149414, "global_step": 187559, "epoch": 1550} {"train_loss": -41.31987380981445, "global_step": 187560, "epoch": 1550} {"train_loss": -41.182254791259766, "global_step": 187561, "epoch": 1550} {"train_loss": -40.378929138183594, "global_step": 187562, "epoch": 1550} {"train_loss": -40.81089782714844, "global_step": 187563, "epoch": 1550} {"train_loss": -40.62376022338867, "global_step": 187564, "epoch": 1550} {"train_loss": -41.1607780456543, "global_step": 187565, "epoch": 1550} {"train_loss": -39.12032699584961, "global_step": 187566, "epoch": 1550} {"train_loss": -40.214027404785156, "global_step": 187567, "epoch": 1550} {"train_loss": -41.40044021606445, "global_step": 187568, "epoch": 1550} {"train_loss": -40.88208770751953, "global_step": 187569, "epoch": 1550} {"train_loss": -40.957923889160156, "global_step": 187570, "epoch": 1550} {"train_loss": -41.47079086303711, "global_step": 187571, "epoch": 1550} {"train_loss": -41.5894889831543, "global_step": 187572, "epoch": 1550} {"train_loss": -41.81502914428711, "global_step": 187573, "epoch": 1550} {"train_loss": -42.067378997802734, "global_step": 187574, "epoch": 1550} {"train_loss": -40.710853576660156, "global_step": 187575, "epoch": 1550} {"train_loss": -41.689510345458984, "global_step": 187576, "epoch": 1550} {"train_loss": -42.10750961303711, "global_step": 187577, "epoch": 1550} {"train_loss": -41.46842575073242, "global_step": 187578, "epoch": 1550} {"train_loss": -41.871456146240234, "global_step": 187579, "epoch": 1550} {"train_loss": -41.382057189941406, "global_step": 187580, "epoch": 1550} {"train_loss": -42.20201110839844, "global_step": 187581, "epoch": 1550} {"train_loss": -42.11556625366211, "global_step": 187582, "epoch": 1550} {"train_loss": -42.50795364379883, "global_step": 187583, "epoch": 1550} {"train_loss": -41.89967346191406, "global_step": 187584, "epoch": 1550} {"train_loss": -41.49387741088867, "global_step": 187585, "epoch": 1550} {"train_loss": -41.955177307128906, "global_step": 187586, "epoch": 1550} {"train_loss": -42.19584274291992, "global_step": 187587, "epoch": 1550} {"train_loss": -42.105506896972656, "global_step": 187588, "epoch": 1550} {"train_loss": -41.13202667236328, "global_step": 187589, "epoch": 1550} {"train_loss": -41.70661163330078, "global_step": 187590, "epoch": 1550} {"train_loss": -42.1203727722168, "global_step": 187591, "epoch": 1550} {"train_loss": -42.34047317504883, "global_step": 187592, "epoch": 1550} {"train_loss": -42.224456787109375, "global_step": 187593, "epoch": 1550} {"train_loss": -42.16661834716797, "global_step": 187594, "epoch": 1550} {"train_loss": -42.00071716308594, "global_step": 187595, "epoch": 1550} {"train_loss": -41.41801071166992, "global_step": 187596, "epoch": 1550} {"train_loss": -41.61370849609375, "global_step": 187597, "epoch": 1550} {"train_loss": -41.56711959838867, "global_step": 187598, "epoch": 1550} {"train_loss": -42.3731689453125, "global_step": 187599, "epoch": 1550} {"train_loss": -42.394325256347656, "global_step": 187600, "epoch": 1550} {"train_loss": -41.2044563293457, "global_step": 187601, "epoch": 1550} {"train_loss": -39.75869369506836, "global_step": 187602, "epoch": 1550} {"train_loss": -38.57548522949219, "global_step": 187603, "epoch": 1550} {"train_loss": -41.13783645629883, "global_step": 187604, "epoch": 1550} {"train_loss": -33.76190185546875, "global_step": 187605, "epoch": 1550} {"train_loss": -22.31422233581543, "global_step": 187606, "epoch": 1550} {"train_loss": -30.488529205322266, "global_step": 187607, "epoch": 1550} {"train_loss": -36.45026397705078, "global_step": 187608, "epoch": 1550} {"train_loss": -35.44741439819336, "global_step": 187609, "epoch": 1550} {"train_loss": -32.01850128173828, "global_step": 187610, "epoch": 1550} {"train_loss": -35.43848419189453, "global_step": 187611, "epoch": 1550} {"train_loss": -38.984310150146484, "global_step": 187612, "epoch": 1550} {"train_loss": -35.44981002807617, "global_step": 187613, "epoch": 1550} {"train_loss": -39.65397262573242, "global_step": 187614, "epoch": 1550} {"train_loss": -36.14066696166992, "global_step": 187615, "epoch": 1550} {"train_loss": -34.41754150390625, "global_step": 187616, "epoch": 1550} {"train_loss": -40.649261474609375, "global_step": 187617, "epoch": 1550} {"train_loss": -37.220985412597656, "global_step": 187618, "epoch": 1550} {"train_loss": -39.40134048461914, "global_step": 187619, "epoch": 1550} {"train_loss": -37.81040573120117, "global_step": 187620, "epoch": 1550} {"train_loss": -39.77126693725586, "global_step": 187621, "epoch": 1550} {"train_loss": -39.042236328125, "global_step": 187622, "epoch": 1550} {"train_loss": -40.97367858886719, "global_step": 187623, "epoch": 1550} {"train_loss": -38.718929290771484, "global_step": 187624, "epoch": 1550} {"train_loss": -40.26900863647461, "global_step": 187625, "epoch": 1550} {"train_loss": -39.248634338378906, "global_step": 187626, "epoch": 1550} {"train_loss": -40.4712028503418, "global_step": 187627, "epoch": 1550} {"train_loss": -40.1900749206543, "global_step": 187628, "epoch": 1550} {"train_loss": -40.13387680053711, "global_step": 187629, "epoch": 1550} {"train_loss": -40.6396484375, "global_step": 187630, "epoch": 1550} {"train_loss": -40.45947265625, "global_step": 187631, "epoch": 1550} {"train_loss": -40.581642150878906, "global_step": 187632, "epoch": 1550} {"train_loss": -40.177345275878906, "global_step": 187633, "epoch": 1550} {"train_loss": -41.11564254760742, "global_step": 187634, "epoch": 1550} {"train_loss": -39.8190803527832, "global_step": 187635, "epoch": 1550} {"train_loss": -41.00978088378906, "global_step": 187636, "epoch": 1550} {"train_loss": -40.621822357177734, "global_step": 187637, "epoch": 1550} {"train_loss": -40.88295364379883, "global_step": 187638, "epoch": 1550} {"train_loss": -41.111968994140625, "global_step": 187639, "epoch": 1550} {"train_loss": -41.13759231567383, "global_step": 187640, "epoch": 1550} {"train_loss": -40.73443603515625, "global_step": 187641, "epoch": 1550} {"train_loss": -41.254215240478516, "global_step": 187642, "epoch": 1550} {"train_loss": -41.253604888916016, "global_step": 187643, "epoch": 1550} {"train_loss": -40.03019332885742, "global_step": 187644, "epoch": 1550} {"train_loss": -41.561241149902344, "global_step": 187645, "epoch": 1550} {"train_loss": -41.530609130859375, "global_step": 187646, "epoch": 1550} {"train_loss": -41.258670806884766, "global_step": 187647, "epoch": 1550} {"train_loss": -41.596290588378906, "global_step": 187648, "epoch": 1550} {"train_loss": -41.529090881347656, "global_step": 187649, "epoch": 1550} {"train_loss": -41.59837341308594, "global_step": 187650, "epoch": 1550} {"train_loss": -41.581600189208984, "global_step": 187651, "epoch": 1550} {"train_loss": -41.50947189331055, "global_step": 187652, "epoch": 1550} {"train_loss": -41.12750244140625, "global_step": 187653, "epoch": 1550} {"train_loss": -41.55115509033203, "global_step": 187654, "epoch": 1550} {"train_loss": -41.87158966064453, "global_step": 187655, "epoch": 1550} {"train_loss": -41.6755256652832, "global_step": 187656, "epoch": 1550} {"train_loss": -41.453956604003906, "global_step": 187657, "epoch": 1550} {"train_loss": -41.97294998168945, "global_step": 187658, "epoch": 1550} {"train_loss": -41.13741683959961, "global_step": 187659, "epoch": 1550} {"train_loss": -41.68429183959961, "global_step": 187660, "epoch": 1550} {"train_loss": -42.07497787475586, "global_step": 187661, "epoch": 1550} {"train_loss": -41.89842224121094, "global_step": 187662, "epoch": 1550} {"train_loss": -40.79801559448242, "global_step": 187663, "epoch": 1550} {"train_loss": -41.90279769897461, "global_step": 187664, "epoch": 1550} {"train_loss": -42.16081237792969, "global_step": 187665, "epoch": 1550} {"train_loss": -42.31313705444336, "global_step": 187666, "epoch": 1550} {"train_loss": -41.884521484375, "global_step": 187667, "epoch": 1550} {"train_loss": -41.5880241394043, "global_step": 187668, "epoch": 1550} {"train_loss": -41.52002716064453, "global_step": 187669, "epoch": 1550} {"train_loss": -40.40889618613503, "global_step": 187670, "epoch": 1550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2634916.75} {"train_loss": -42.561275482177734, "global_step": 187671, "epoch": 1551} {"train_loss": -41.9135627746582, "global_step": 187672, "epoch": 1551} {"train_loss": -41.28187942504883, "global_step": 187673, "epoch": 1551} {"train_loss": -40.85440444946289, "global_step": 187674, "epoch": 1551} {"train_loss": -41.0087890625, "global_step": 187675, "epoch": 1551} {"train_loss": -41.24634552001953, "global_step": 187676, "epoch": 1551} {"train_loss": -42.30107879638672, "global_step": 187677, "epoch": 1551} {"train_loss": -41.530696868896484, "global_step": 187678, "epoch": 1551} {"train_loss": -41.4167594909668, "global_step": 187679, "epoch": 1551} {"train_loss": -41.27192687988281, "global_step": 187680, "epoch": 1551} {"train_loss": -41.696258544921875, "global_step": 187681, "epoch": 1551} {"train_loss": -41.427947998046875, "global_step": 187682, "epoch": 1551} {"train_loss": -41.81441879272461, "global_step": 187683, "epoch": 1551} {"train_loss": -42.04018020629883, "global_step": 187684, "epoch": 1551} {"train_loss": -41.54263687133789, "global_step": 187685, "epoch": 1551} {"train_loss": -41.92336654663086, "global_step": 187686, "epoch": 1551} {"train_loss": -41.72634506225586, "global_step": 187687, "epoch": 1551} {"train_loss": -41.86797332763672, "global_step": 187688, "epoch": 1551} {"train_loss": -42.51738357543945, "global_step": 187689, "epoch": 1551} {"train_loss": -39.75501251220703, "global_step": 187690, "epoch": 1551} {"train_loss": -40.9782600402832, "global_step": 187691, "epoch": 1551} {"train_loss": -40.88959884643555, "global_step": 187692, "epoch": 1551} {"train_loss": -41.2657585144043, "global_step": 187693, "epoch": 1551} {"train_loss": -42.11564254760742, "global_step": 187694, "epoch": 1551} {"train_loss": -41.6279296875, "global_step": 187695, "epoch": 1551} {"train_loss": -41.03379440307617, "global_step": 187696, "epoch": 1551} {"train_loss": -41.964508056640625, "global_step": 187697, "epoch": 1551} {"train_loss": -41.82714080810547, "global_step": 187698, "epoch": 1551} {"train_loss": -41.2474250793457, "global_step": 187699, "epoch": 1551} {"train_loss": -40.798133850097656, "global_step": 187700, "epoch": 1551} {"train_loss": -41.75439453125, "global_step": 187701, "epoch": 1551} {"train_loss": -40.99552536010742, "global_step": 187702, "epoch": 1551} {"train_loss": -39.5998649597168, "global_step": 187703, "epoch": 1551} {"train_loss": -36.269771575927734, "global_step": 187704, "epoch": 1551} {"train_loss": -40.6572380065918, "global_step": 187705, "epoch": 1551} {"train_loss": -38.29591751098633, "global_step": 187706, "epoch": 1551} {"train_loss": -38.48261260986328, "global_step": 187707, "epoch": 1551} {"train_loss": -39.35816192626953, "global_step": 187708, "epoch": 1551} {"train_loss": -39.19105911254883, "global_step": 187709, "epoch": 1551} {"train_loss": -40.99789047241211, "global_step": 187710, "epoch": 1551} {"train_loss": -37.052791595458984, "global_step": 187711, "epoch": 1551} {"train_loss": -40.0961799621582, "global_step": 187712, "epoch": 1551} {"train_loss": -40.36133575439453, "global_step": 187713, "epoch": 1551} {"train_loss": -38.35813522338867, "global_step": 187714, "epoch": 1551} {"train_loss": -40.03680419921875, "global_step": 187715, "epoch": 1551} {"train_loss": -40.267173767089844, "global_step": 187716, "epoch": 1551} {"train_loss": -40.46304702758789, "global_step": 187717, "epoch": 1551} {"train_loss": -40.367637634277344, "global_step": 187718, "epoch": 1551} {"train_loss": -39.3992919921875, "global_step": 187719, "epoch": 1551} {"train_loss": -38.787723541259766, "global_step": 187720, "epoch": 1551} {"train_loss": -40.0548210144043, "global_step": 187721, "epoch": 1551} {"train_loss": -40.728580474853516, "global_step": 187722, "epoch": 1551} {"train_loss": -41.134090423583984, "global_step": 187723, "epoch": 1551} {"train_loss": -40.90293502807617, "global_step": 187724, "epoch": 1551} {"train_loss": -39.9614143371582, "global_step": 187725, "epoch": 1551} {"train_loss": -41.32406234741211, "global_step": 187726, "epoch": 1551} {"train_loss": -41.246986389160156, "global_step": 187727, "epoch": 1551} {"train_loss": -41.01994323730469, "global_step": 187728, "epoch": 1551} {"train_loss": -41.206356048583984, "global_step": 187729, "epoch": 1551} {"train_loss": -40.589263916015625, "global_step": 187730, "epoch": 1551} {"train_loss": -39.84072494506836, "global_step": 187731, "epoch": 1551} {"train_loss": -41.36888885498047, "global_step": 187732, "epoch": 1551} {"train_loss": -41.330909729003906, "global_step": 187733, "epoch": 1551} {"train_loss": -40.50336837768555, "global_step": 187734, "epoch": 1551} {"train_loss": -40.92432403564453, "global_step": 187735, "epoch": 1551} {"train_loss": -40.601497650146484, "global_step": 187736, "epoch": 1551} {"train_loss": -41.07808303833008, "global_step": 187737, "epoch": 1551} {"train_loss": -40.2984619140625, "global_step": 187738, "epoch": 1551} {"train_loss": -39.6651725769043, "global_step": 187739, "epoch": 1551} {"train_loss": -40.568965911865234, "global_step": 187740, "epoch": 1551} {"train_loss": -41.509342193603516, "global_step": 187741, "epoch": 1551} {"train_loss": -40.99602127075195, "global_step": 187742, "epoch": 1551} {"train_loss": -40.9549560546875, "global_step": 187743, "epoch": 1551} {"train_loss": -39.992706298828125, "global_step": 187744, "epoch": 1551} {"train_loss": -40.07182693481445, "global_step": 187745, "epoch": 1551} {"train_loss": -41.203426361083984, "global_step": 187746, "epoch": 1551} {"train_loss": -41.212398529052734, "global_step": 187747, "epoch": 1551} {"train_loss": -40.869171142578125, "global_step": 187748, "epoch": 1551} {"train_loss": -41.70736312866211, "global_step": 187749, "epoch": 1551} {"train_loss": -40.40478515625, "global_step": 187750, "epoch": 1551} {"train_loss": -41.01062774658203, "global_step": 187751, "epoch": 1551} {"train_loss": -41.292903900146484, "global_step": 187752, "epoch": 1551} {"train_loss": -41.30353546142578, "global_step": 187753, "epoch": 1551} {"train_loss": -41.202457427978516, "global_step": 187754, "epoch": 1551} {"train_loss": -39.44460678100586, "global_step": 187755, "epoch": 1551} {"train_loss": -40.73175811767578, "global_step": 187756, "epoch": 1551} {"train_loss": -39.890316009521484, "global_step": 187757, "epoch": 1551} {"train_loss": -41.23118209838867, "global_step": 187758, "epoch": 1551} {"train_loss": -40.93382263183594, "global_step": 187759, "epoch": 1551} {"train_loss": -39.70948028564453, "global_step": 187760, "epoch": 1551} {"train_loss": -40.06535339355469, "global_step": 187761, "epoch": 1551} {"train_loss": -39.21806716918945, "global_step": 187762, "epoch": 1551} {"train_loss": -41.01337432861328, "global_step": 187763, "epoch": 1551} {"train_loss": -41.250160217285156, "global_step": 187764, "epoch": 1551} {"train_loss": -40.485897064208984, "global_step": 187765, "epoch": 1551} {"train_loss": -39.48518371582031, "global_step": 187766, "epoch": 1551} {"train_loss": -40.79082107543945, "global_step": 187767, "epoch": 1551} {"train_loss": -40.025169372558594, "global_step": 187768, "epoch": 1551} {"train_loss": -36.57756423950195, "global_step": 187769, "epoch": 1551} {"train_loss": -39.912044525146484, "global_step": 187770, "epoch": 1551} {"train_loss": -36.92678451538086, "global_step": 187771, "epoch": 1551} {"train_loss": -41.251888275146484, "global_step": 187772, "epoch": 1551} {"train_loss": -39.61520004272461, "global_step": 187773, "epoch": 1551} {"train_loss": -40.32050704956055, "global_step": 187774, "epoch": 1551} {"train_loss": -39.16695022583008, "global_step": 187775, "epoch": 1551} {"train_loss": -40.25221633911133, "global_step": 187776, "epoch": 1551} {"train_loss": -38.36758041381836, "global_step": 187777, "epoch": 1551} {"train_loss": -39.06385040283203, "global_step": 187778, "epoch": 1551} {"train_loss": -40.3092041015625, "global_step": 187779, "epoch": 1551} {"train_loss": -37.46466827392578, "global_step": 187780, "epoch": 1551} {"train_loss": -41.02851104736328, "global_step": 187781, "epoch": 1551} {"train_loss": -40.30400848388672, "global_step": 187782, "epoch": 1551} {"train_loss": -39.695762634277344, "global_step": 187783, "epoch": 1551} {"train_loss": -40.74994659423828, "global_step": 187784, "epoch": 1551} {"train_loss": -38.87716293334961, "global_step": 187785, "epoch": 1551} {"train_loss": -40.81045150756836, "global_step": 187786, "epoch": 1551} {"train_loss": -40.878963470458984, "global_step": 187787, "epoch": 1551} {"train_loss": -40.03587341308594, "global_step": 187788, "epoch": 1551} {"train_loss": -37.516693115234375, "global_step": 187789, "epoch": 1551} {"train_loss": -40.274532318115234, "global_step": 187790, "epoch": 1551} {"train_loss": -40.47469131217515, "global_step": 187791, "epoch": 1551, "val_loss": 2637920.25} {"train_loss": -40.75812911987305, "global_step": 187792, "epoch": 1552} {"train_loss": -39.893310546875, "global_step": 187793, "epoch": 1552} {"train_loss": -40.38102340698242, "global_step": 187794, "epoch": 1552} {"train_loss": -40.24349594116211, "global_step": 187795, "epoch": 1552} {"train_loss": -36.38005447387695, "global_step": 187796, "epoch": 1552} {"train_loss": -40.641456604003906, "global_step": 187797, "epoch": 1552} {"train_loss": -41.10663986206055, "global_step": 187798, "epoch": 1552} {"train_loss": -40.440582275390625, "global_step": 187799, "epoch": 1552} {"train_loss": -40.097808837890625, "global_step": 187800, "epoch": 1552} {"train_loss": -40.34968185424805, "global_step": 187801, "epoch": 1552} {"train_loss": -40.07052230834961, "global_step": 187802, "epoch": 1552} {"train_loss": -38.83814239501953, "global_step": 187803, "epoch": 1552} {"train_loss": -40.98637008666992, "global_step": 187804, "epoch": 1552} {"train_loss": -40.872066497802734, "global_step": 187805, "epoch": 1552} {"train_loss": -40.48492431640625, "global_step": 187806, "epoch": 1552} {"train_loss": -40.86370086669922, "global_step": 187807, "epoch": 1552} {"train_loss": -38.754554748535156, "global_step": 187808, "epoch": 1552} {"train_loss": -40.128448486328125, "global_step": 187809, "epoch": 1552} {"train_loss": -38.58755874633789, "global_step": 187810, "epoch": 1552} {"train_loss": -40.70343780517578, "global_step": 187811, "epoch": 1552} {"train_loss": -38.367713928222656, "global_step": 187812, "epoch": 1552} {"train_loss": -39.76581954956055, "global_step": 187813, "epoch": 1552} {"train_loss": -40.884254455566406, "global_step": 187814, "epoch": 1552} {"train_loss": -41.01680374145508, "global_step": 187815, "epoch": 1552} {"train_loss": -41.237945556640625, "global_step": 187816, "epoch": 1552} {"train_loss": -39.39231491088867, "global_step": 187817, "epoch": 1552} {"train_loss": -40.340789794921875, "global_step": 187818, "epoch": 1552} {"train_loss": -39.4382209777832, "global_step": 187819, "epoch": 1552} {"train_loss": -40.09965896606445, "global_step": 187820, "epoch": 1552} {"train_loss": -40.86909866333008, "global_step": 187821, "epoch": 1552} {"train_loss": -41.24777603149414, "global_step": 187822, "epoch": 1552} {"train_loss": -40.953956604003906, "global_step": 187823, "epoch": 1552} {"train_loss": -39.95833969116211, "global_step": 187824, "epoch": 1552} {"train_loss": -40.190948486328125, "global_step": 187825, "epoch": 1552} {"train_loss": -40.1766242980957, "global_step": 187826, "epoch": 1552} {"train_loss": -40.661495208740234, "global_step": 187827, "epoch": 1552} {"train_loss": -40.149879455566406, "global_step": 187828, "epoch": 1552} {"train_loss": -40.341243743896484, "global_step": 187829, "epoch": 1552} {"train_loss": -40.09785461425781, "global_step": 187830, "epoch": 1552} {"train_loss": -39.47697067260742, "global_step": 187831, "epoch": 1552} {"train_loss": -40.35003662109375, "global_step": 187832, "epoch": 1552} {"train_loss": -40.07307052612305, "global_step": 187833, "epoch": 1552} {"train_loss": -40.574703216552734, "global_step": 187834, "epoch": 1552} {"train_loss": -40.79213333129883, "global_step": 187835, "epoch": 1552} {"train_loss": -41.237701416015625, "global_step": 187836, "epoch": 1552} {"train_loss": -40.605369567871094, "global_step": 187837, "epoch": 1552} {"train_loss": -39.830753326416016, "global_step": 187838, "epoch": 1552} {"train_loss": -40.259986877441406, "global_step": 187839, "epoch": 1552} {"train_loss": -40.94173812866211, "global_step": 187840, "epoch": 1552} {"train_loss": -40.19724655151367, "global_step": 187841, "epoch": 1552} {"train_loss": -41.75693893432617, "global_step": 187842, "epoch": 1552} {"train_loss": -41.2400016784668, "global_step": 187843, "epoch": 1552} {"train_loss": -41.020469665527344, "global_step": 187844, "epoch": 1552} {"train_loss": -40.349971771240234, "global_step": 187845, "epoch": 1552} {"train_loss": -40.80792236328125, "global_step": 187846, "epoch": 1552} {"train_loss": -40.97383499145508, "global_step": 187847, "epoch": 1552} {"train_loss": -40.78567886352539, "global_step": 187848, "epoch": 1552} {"train_loss": -38.739479064941406, "global_step": 187849, "epoch": 1552} {"train_loss": -39.2826042175293, "global_step": 187850, "epoch": 1552} {"train_loss": -40.75145721435547, "global_step": 187851, "epoch": 1552} {"train_loss": -40.306724548339844, "global_step": 187852, "epoch": 1552} {"train_loss": -39.74591064453125, "global_step": 187853, "epoch": 1552} {"train_loss": -40.62485122680664, "global_step": 187854, "epoch": 1552} {"train_loss": -40.6912956237793, "global_step": 187855, "epoch": 1552} {"train_loss": -39.91862869262695, "global_step": 187856, "epoch": 1552} {"train_loss": -41.52583694458008, "global_step": 187857, "epoch": 1552} {"train_loss": -41.214839935302734, "global_step": 187858, "epoch": 1552} {"train_loss": -40.76340866088867, "global_step": 187859, "epoch": 1552} {"train_loss": -41.005367279052734, "global_step": 187860, "epoch": 1552} {"train_loss": -41.064903259277344, "global_step": 187861, "epoch": 1552} {"train_loss": -40.44220733642578, "global_step": 187862, "epoch": 1552} {"train_loss": -39.332923889160156, "global_step": 187863, "epoch": 1552} {"train_loss": -40.70637130737305, "global_step": 187864, "epoch": 1552} {"train_loss": -40.63408279418945, "global_step": 187865, "epoch": 1552} {"train_loss": -40.38317108154297, "global_step": 187866, "epoch": 1552} {"train_loss": -40.979217529296875, "global_step": 187867, "epoch": 1552} {"train_loss": -41.16920852661133, "global_step": 187868, "epoch": 1552} {"train_loss": -40.92876052856445, "global_step": 187869, "epoch": 1552} {"train_loss": -41.23681640625, "global_step": 187870, "epoch": 1552} {"train_loss": -39.605403900146484, "global_step": 187871, "epoch": 1552} {"train_loss": -40.630531311035156, "global_step": 187872, "epoch": 1552} {"train_loss": -40.86037826538086, "global_step": 187873, "epoch": 1552} {"train_loss": -40.91339874267578, "global_step": 187874, "epoch": 1552} {"train_loss": -40.93596267700195, "global_step": 187875, "epoch": 1552} {"train_loss": -40.66047286987305, "global_step": 187876, "epoch": 1552} {"train_loss": -38.734310150146484, "global_step": 187877, "epoch": 1552} {"train_loss": -40.934722900390625, "global_step": 187878, "epoch": 1552} {"train_loss": -40.92567825317383, "global_step": 187879, "epoch": 1552} {"train_loss": -39.47684097290039, "global_step": 187880, "epoch": 1552} {"train_loss": -40.1887092590332, "global_step": 187881, "epoch": 1552} {"train_loss": -39.95137405395508, "global_step": 187882, "epoch": 1552} {"train_loss": -39.18498611450195, "global_step": 187883, "epoch": 1552} {"train_loss": -40.065364837646484, "global_step": 187884, "epoch": 1552} {"train_loss": -39.13945770263672, "global_step": 187885, "epoch": 1552} {"train_loss": -39.58136749267578, "global_step": 187886, "epoch": 1552} {"train_loss": -40.95542526245117, "global_step": 187887, "epoch": 1552} {"train_loss": -40.12770462036133, "global_step": 187888, "epoch": 1552} {"train_loss": -40.354732513427734, "global_step": 187889, "epoch": 1552} {"train_loss": -37.778175354003906, "global_step": 187890, "epoch": 1552} {"train_loss": -41.08454513549805, "global_step": 187891, "epoch": 1552} {"train_loss": -40.28841781616211, "global_step": 187892, "epoch": 1552} {"train_loss": -39.69198226928711, "global_step": 187893, "epoch": 1552} {"train_loss": -36.999305725097656, "global_step": 187894, "epoch": 1552} {"train_loss": -40.03766632080078, "global_step": 187895, "epoch": 1552} {"train_loss": -40.37418746948242, "global_step": 187896, "epoch": 1552} {"train_loss": -39.902198791503906, "global_step": 187897, "epoch": 1552} {"train_loss": -40.2563591003418, "global_step": 187898, "epoch": 1552} {"train_loss": -40.1993293762207, "global_step": 187899, "epoch": 1552} {"train_loss": -40.4751091003418, "global_step": 187900, "epoch": 1552} {"train_loss": -39.85111618041992, "global_step": 187901, "epoch": 1552} {"train_loss": -40.06657409667969, "global_step": 187902, "epoch": 1552} {"train_loss": -38.852962493896484, "global_step": 187903, "epoch": 1552} {"train_loss": -39.106380462646484, "global_step": 187904, "epoch": 1552} {"train_loss": -40.75522994995117, "global_step": 187905, "epoch": 1552} {"train_loss": -39.64168167114258, "global_step": 187906, "epoch": 1552} {"train_loss": -36.97541046142578, "global_step": 187907, "epoch": 1552} {"train_loss": -39.8372917175293, "global_step": 187908, "epoch": 1552} {"train_loss": -36.32685470581055, "global_step": 187909, "epoch": 1552} {"train_loss": -24.422719955444336, "global_step": 187910, "epoch": 1552} {"train_loss": -38.63922119140625, "global_step": 187911, "epoch": 1552} {"train_loss": -39.99824244916932, "global_step": 187912, "epoch": 1552, "val_loss": 2573167.0} {"train_loss": -30.979602813720703, "global_step": 187913, "epoch": 1553} {"train_loss": -34.32062530517578, "global_step": 187914, "epoch": 1553} {"train_loss": -34.832576751708984, "global_step": 187915, "epoch": 1553} {"train_loss": -35.73517990112305, "global_step": 187916, "epoch": 1553} {"train_loss": -35.223663330078125, "global_step": 187917, "epoch": 1553} {"train_loss": -34.3166618347168, "global_step": 187918, "epoch": 1553} {"train_loss": -36.781612396240234, "global_step": 187919, "epoch": 1553} {"train_loss": -34.86220932006836, "global_step": 187920, "epoch": 1553} {"train_loss": -30.031177520751953, "global_step": 187921, "epoch": 1553} {"train_loss": -35.6551399230957, "global_step": 187922, "epoch": 1553} {"train_loss": -37.0167236328125, "global_step": 187923, "epoch": 1553} {"train_loss": -38.9085807800293, "global_step": 187924, "epoch": 1553} {"train_loss": -37.99888229370117, "global_step": 187925, "epoch": 1553} {"train_loss": -35.68325424194336, "global_step": 187926, "epoch": 1553} {"train_loss": -37.38711166381836, "global_step": 187927, "epoch": 1553} {"train_loss": -36.68230056762695, "global_step": 187928, "epoch": 1553} {"train_loss": -37.72282791137695, "global_step": 187929, "epoch": 1553} {"train_loss": -35.74091720581055, "global_step": 187930, "epoch": 1553} {"train_loss": -37.55556869506836, "global_step": 187931, "epoch": 1553} {"train_loss": -38.40584182739258, "global_step": 187932, "epoch": 1553} {"train_loss": -38.32863998413086, "global_step": 187933, "epoch": 1553} {"train_loss": -36.49689865112305, "global_step": 187934, "epoch": 1553} {"train_loss": -37.76377487182617, "global_step": 187935, "epoch": 1553} {"train_loss": -38.82465362548828, "global_step": 187936, "epoch": 1553} {"train_loss": -37.23290252685547, "global_step": 187937, "epoch": 1553} {"train_loss": -36.27225112915039, "global_step": 187938, "epoch": 1553} {"train_loss": -38.28368377685547, "global_step": 187939, "epoch": 1553} {"train_loss": -37.98469161987305, "global_step": 187940, "epoch": 1553} {"train_loss": -39.23583984375, "global_step": 187941, "epoch": 1553} {"train_loss": -38.75447463989258, "global_step": 187942, "epoch": 1553} {"train_loss": -39.95185089111328, "global_step": 187943, "epoch": 1553} {"train_loss": -37.82573699951172, "global_step": 187944, "epoch": 1553} {"train_loss": -37.861392974853516, "global_step": 187945, "epoch": 1553} {"train_loss": -39.43989181518555, "global_step": 187946, "epoch": 1553} {"train_loss": -38.92301940917969, "global_step": 187947, "epoch": 1553} {"train_loss": -38.967498779296875, "global_step": 187948, "epoch": 1553} {"train_loss": -39.22652053833008, "global_step": 187949, "epoch": 1553} {"train_loss": -38.446651458740234, "global_step": 187950, "epoch": 1553} {"train_loss": -39.538421630859375, "global_step": 187951, "epoch": 1553} {"train_loss": -39.7387809753418, "global_step": 187952, "epoch": 1553} {"train_loss": -39.900325775146484, "global_step": 187953, "epoch": 1553} {"train_loss": -40.10712432861328, "global_step": 187954, "epoch": 1553} {"train_loss": -39.23365783691406, "global_step": 187955, "epoch": 1553} {"train_loss": -38.05489730834961, "global_step": 187956, "epoch": 1553} {"train_loss": -39.35133361816406, "global_step": 187957, "epoch": 1553} {"train_loss": -40.05426025390625, "global_step": 187958, "epoch": 1553} {"train_loss": -40.28067398071289, "global_step": 187959, "epoch": 1553} {"train_loss": -39.320499420166016, "global_step": 187960, "epoch": 1553} {"train_loss": -40.445411682128906, "global_step": 187961, "epoch": 1553} {"train_loss": -40.178592681884766, "global_step": 187962, "epoch": 1553} {"train_loss": -40.2982177734375, "global_step": 187963, "epoch": 1553} {"train_loss": -40.01190185546875, "global_step": 187964, "epoch": 1553} {"train_loss": -40.699432373046875, "global_step": 187965, "epoch": 1553} {"train_loss": -40.38523483276367, "global_step": 187966, "epoch": 1553} {"train_loss": -40.03845977783203, "global_step": 187967, "epoch": 1553} {"train_loss": -39.9821891784668, "global_step": 187968, "epoch": 1553} {"train_loss": -40.20309066772461, "global_step": 187969, "epoch": 1553} {"train_loss": -40.45453643798828, "global_step": 187970, "epoch": 1553} {"train_loss": -40.22869110107422, "global_step": 187971, "epoch": 1553} {"train_loss": -40.68048858642578, "global_step": 187972, "epoch": 1553} {"train_loss": -40.6381950378418, "global_step": 187973, "epoch": 1553} {"train_loss": -40.34294128417969, "global_step": 187974, "epoch": 1553} {"train_loss": -40.32536697387695, "global_step": 187975, "epoch": 1553} {"train_loss": -40.67578125, "global_step": 187976, "epoch": 1553} {"train_loss": -40.14899826049805, "global_step": 187977, "epoch": 1553} {"train_loss": -40.42673873901367, "global_step": 187978, "epoch": 1553} {"train_loss": -40.24245834350586, "global_step": 187979, "epoch": 1553} {"train_loss": -39.61981201171875, "global_step": 187980, "epoch": 1553} {"train_loss": -40.53409194946289, "global_step": 187981, "epoch": 1553} {"train_loss": -40.271236419677734, "global_step": 187982, "epoch": 1553} {"train_loss": -40.46904754638672, "global_step": 187983, "epoch": 1553} {"train_loss": -40.70036315917969, "global_step": 187984, "epoch": 1553} {"train_loss": -40.15508270263672, "global_step": 187985, "epoch": 1553} {"train_loss": -39.55119323730469, "global_step": 187986, "epoch": 1553} {"train_loss": -40.78540802001953, "global_step": 187987, "epoch": 1553} {"train_loss": -40.71017074584961, "global_step": 187988, "epoch": 1553} {"train_loss": -40.456851959228516, "global_step": 187989, "epoch": 1553} {"train_loss": -40.49501419067383, "global_step": 187990, "epoch": 1553} {"train_loss": -40.87272262573242, "global_step": 187991, "epoch": 1553} {"train_loss": -40.698787689208984, "global_step": 187992, "epoch": 1553} {"train_loss": -40.95924377441406, "global_step": 187993, "epoch": 1553} {"train_loss": -40.71595001220703, "global_step": 187994, "epoch": 1553} {"train_loss": -40.96906661987305, "global_step": 187995, "epoch": 1553} {"train_loss": -41.580562591552734, "global_step": 187996, "epoch": 1553} {"train_loss": -40.21002960205078, "global_step": 187997, "epoch": 1553} {"train_loss": -41.47373580932617, "global_step": 187998, "epoch": 1553} {"train_loss": -41.4027214050293, "global_step": 187999, "epoch": 1553} {"train_loss": -40.37907028198242, "global_step": 188000, "epoch": 1553} {"train_loss": -38.10953903198242, "global_step": 188001, "epoch": 1553} {"train_loss": -40.859344482421875, "global_step": 188002, "epoch": 1553} {"train_loss": -41.36288070678711, "global_step": 188003, "epoch": 1553} {"train_loss": -40.82527542114258, "global_step": 188004, "epoch": 1553} {"train_loss": -40.785072326660156, "global_step": 188005, "epoch": 1553} {"train_loss": -40.94684600830078, "global_step": 188006, "epoch": 1553} {"train_loss": -41.61025619506836, "global_step": 188007, "epoch": 1553} {"train_loss": -41.63859176635742, "global_step": 188008, "epoch": 1553} {"train_loss": -41.60755157470703, "global_step": 188009, "epoch": 1553} {"train_loss": -40.74959182739258, "global_step": 188010, "epoch": 1553} {"train_loss": -41.40789794921875, "global_step": 188011, "epoch": 1553} {"train_loss": -41.5678825378418, "global_step": 188012, "epoch": 1553} {"train_loss": -41.340301513671875, "global_step": 188013, "epoch": 1553} {"train_loss": -39.7944450378418, "global_step": 188014, "epoch": 1553} {"train_loss": -41.43071365356445, "global_step": 188015, "epoch": 1553} {"train_loss": -41.710426330566406, "global_step": 188016, "epoch": 1553} {"train_loss": -41.180816650390625, "global_step": 188017, "epoch": 1553} {"train_loss": -39.87397384643555, "global_step": 188018, "epoch": 1553} {"train_loss": -40.84657669067383, "global_step": 188019, "epoch": 1553} {"train_loss": -40.84865188598633, "global_step": 188020, "epoch": 1553} {"train_loss": -41.2603874206543, "global_step": 188021, "epoch": 1553} {"train_loss": -41.2795295715332, "global_step": 188022, "epoch": 1553} {"train_loss": -41.32552719116211, "global_step": 188023, "epoch": 1553} {"train_loss": -40.669288635253906, "global_step": 188024, "epoch": 1553} {"train_loss": -38.627071380615234, "global_step": 188025, "epoch": 1553} {"train_loss": -40.986289978027344, "global_step": 188026, "epoch": 1553} {"train_loss": -41.67295455932617, "global_step": 188027, "epoch": 1553} {"train_loss": -40.90778350830078, "global_step": 188028, "epoch": 1553} {"train_loss": -41.193660736083984, "global_step": 188029, "epoch": 1553} {"train_loss": -39.97396469116211, "global_step": 188030, "epoch": 1553} {"train_loss": -40.13425827026367, "global_step": 188031, "epoch": 1553} {"train_loss": -38.992706298828125, "global_step": 188032, "epoch": 1553} {"train_loss": -39.393945173783735, "global_step": 188033, "epoch": 1553, "val_loss": 2780505.25} {"train_loss": -39.916561126708984, "global_step": 188034, "epoch": 1554} {"train_loss": -38.67817306518555, "global_step": 188035, "epoch": 1554} {"train_loss": -37.01728439331055, "global_step": 188036, "epoch": 1554} {"train_loss": -40.050472259521484, "global_step": 188037, "epoch": 1554} {"train_loss": -38.38761901855469, "global_step": 188038, "epoch": 1554} {"train_loss": -40.613643646240234, "global_step": 188039, "epoch": 1554} {"train_loss": -37.49003219604492, "global_step": 188040, "epoch": 1554} {"train_loss": -39.75840377807617, "global_step": 188041, "epoch": 1554} {"train_loss": -37.143001556396484, "global_step": 188042, "epoch": 1554} {"train_loss": -39.04704666137695, "global_step": 188043, "epoch": 1554} {"train_loss": -39.9981803894043, "global_step": 188044, "epoch": 1554} {"train_loss": -39.48910140991211, "global_step": 188045, "epoch": 1554} {"train_loss": -39.9064826965332, "global_step": 188046, "epoch": 1554} {"train_loss": -40.562538146972656, "global_step": 188047, "epoch": 1554} {"train_loss": -38.17085266113281, "global_step": 188048, "epoch": 1554} {"train_loss": -38.09938430786133, "global_step": 188049, "epoch": 1554} {"train_loss": -40.17019271850586, "global_step": 188050, "epoch": 1554} {"train_loss": -38.921714782714844, "global_step": 188051, "epoch": 1554} {"train_loss": -39.5434684753418, "global_step": 188052, "epoch": 1554} {"train_loss": -35.473121643066406, "global_step": 188053, "epoch": 1554} {"train_loss": -36.86643981933594, "global_step": 188054, "epoch": 1554} {"train_loss": -40.954315185546875, "global_step": 188055, "epoch": 1554} {"train_loss": -39.153602600097656, "global_step": 188056, "epoch": 1554} {"train_loss": -38.18250274658203, "global_step": 188057, "epoch": 1554} {"train_loss": -39.492469787597656, "global_step": 188058, "epoch": 1554} {"train_loss": -40.34484100341797, "global_step": 188059, "epoch": 1554} {"train_loss": -39.11977005004883, "global_step": 188060, "epoch": 1554} {"train_loss": -39.035037994384766, "global_step": 188061, "epoch": 1554} {"train_loss": -40.83761215209961, "global_step": 188062, "epoch": 1554} {"train_loss": -39.09939956665039, "global_step": 188063, "epoch": 1554} {"train_loss": -39.557613372802734, "global_step": 188064, "epoch": 1554} {"train_loss": -40.0372314453125, "global_step": 188065, "epoch": 1554} {"train_loss": -40.35101318359375, "global_step": 188066, "epoch": 1554} {"train_loss": -40.66085433959961, "global_step": 188067, "epoch": 1554} {"train_loss": -40.864688873291016, "global_step": 188068, "epoch": 1554} {"train_loss": -38.968482971191406, "global_step": 188069, "epoch": 1554} {"train_loss": -40.61064910888672, "global_step": 188070, "epoch": 1554} {"train_loss": -40.595882415771484, "global_step": 188071, "epoch": 1554} {"train_loss": -41.32194900512695, "global_step": 188072, "epoch": 1554} {"train_loss": -40.461910247802734, "global_step": 188073, "epoch": 1554} {"train_loss": -41.20559310913086, "global_step": 188074, "epoch": 1554} {"train_loss": -40.39921569824219, "global_step": 188075, "epoch": 1554} {"train_loss": -40.9777946472168, "global_step": 188076, "epoch": 1554} {"train_loss": -40.747528076171875, "global_step": 188077, "epoch": 1554} {"train_loss": -41.06094741821289, "global_step": 188078, "epoch": 1554} {"train_loss": -40.687767028808594, "global_step": 188079, "epoch": 1554} {"train_loss": -40.8243293762207, "global_step": 188080, "epoch": 1554} {"train_loss": -40.90822982788086, "global_step": 188081, "epoch": 1554} {"train_loss": -41.01314163208008, "global_step": 188082, "epoch": 1554} {"train_loss": -41.16305160522461, "global_step": 188083, "epoch": 1554} {"train_loss": -40.992919921875, "global_step": 188084, "epoch": 1554} {"train_loss": -41.00688934326172, "global_step": 188085, "epoch": 1554} {"train_loss": -41.073997497558594, "global_step": 188086, "epoch": 1554} {"train_loss": -41.441619873046875, "global_step": 188087, "epoch": 1554} {"train_loss": -41.208343505859375, "global_step": 188088, "epoch": 1554} {"train_loss": -41.297611236572266, "global_step": 188089, "epoch": 1554} {"train_loss": -41.83222579956055, "global_step": 188090, "epoch": 1554} {"train_loss": -41.1417236328125, "global_step": 188091, "epoch": 1554} {"train_loss": -41.90382385253906, "global_step": 188092, "epoch": 1554} {"train_loss": -41.43099594116211, "global_step": 188093, "epoch": 1554} {"train_loss": -41.69318389892578, "global_step": 188094, "epoch": 1554} {"train_loss": -41.75550842285156, "global_step": 188095, "epoch": 1554} {"train_loss": -41.3392448425293, "global_step": 188096, "epoch": 1554} {"train_loss": -41.74971389770508, "global_step": 188097, "epoch": 1554} {"train_loss": -41.71039962768555, "global_step": 188098, "epoch": 1554} {"train_loss": -41.71999740600586, "global_step": 188099, "epoch": 1554} {"train_loss": -41.316871643066406, "global_step": 188100, "epoch": 1554} {"train_loss": -40.71845245361328, "global_step": 188101, "epoch": 1554} {"train_loss": -41.67683029174805, "global_step": 188102, "epoch": 1554} {"train_loss": -42.24531936645508, "global_step": 188103, "epoch": 1554} {"train_loss": -41.54358673095703, "global_step": 188104, "epoch": 1554} {"train_loss": -41.38443374633789, "global_step": 188105, "epoch": 1554} {"train_loss": -41.87947463989258, "global_step": 188106, "epoch": 1554} {"train_loss": -41.85052490234375, "global_step": 188107, "epoch": 1554} {"train_loss": -41.51363754272461, "global_step": 188108, "epoch": 1554} {"train_loss": -41.31178283691406, "global_step": 188109, "epoch": 1554} {"train_loss": -41.06467056274414, "global_step": 188110, "epoch": 1554} {"train_loss": -41.795101165771484, "global_step": 188111, "epoch": 1554} {"train_loss": -41.06871032714844, "global_step": 188112, "epoch": 1554} {"train_loss": -41.93117904663086, "global_step": 188113, "epoch": 1554} {"train_loss": -42.367366790771484, "global_step": 188114, "epoch": 1554} {"train_loss": -42.130374908447266, "global_step": 188115, "epoch": 1554} {"train_loss": -41.27647018432617, "global_step": 188116, "epoch": 1554} {"train_loss": -41.109222412109375, "global_step": 188117, "epoch": 1554} {"train_loss": -41.214778900146484, "global_step": 188118, "epoch": 1554} {"train_loss": -39.97036361694336, "global_step": 188119, "epoch": 1554} {"train_loss": -37.61812973022461, "global_step": 188120, "epoch": 1554} {"train_loss": -40.416358947753906, "global_step": 188121, "epoch": 1554} {"train_loss": -40.58420944213867, "global_step": 188122, "epoch": 1554} {"train_loss": -37.99127960205078, "global_step": 188123, "epoch": 1554} {"train_loss": -33.80413818359375, "global_step": 188124, "epoch": 1554} {"train_loss": -31.563013076782227, "global_step": 188125, "epoch": 1554} {"train_loss": -32.285850524902344, "global_step": 188126, "epoch": 1554} {"train_loss": -39.19890213012695, "global_step": 188127, "epoch": 1554} {"train_loss": -38.135528564453125, "global_step": 188128, "epoch": 1554} {"train_loss": -33.02344512939453, "global_step": 188129, "epoch": 1554} {"train_loss": -36.083492279052734, "global_step": 188130, "epoch": 1554} {"train_loss": -40.68109130859375, "global_step": 188131, "epoch": 1554} {"train_loss": -34.97224807739258, "global_step": 188132, "epoch": 1554} {"train_loss": -39.815486907958984, "global_step": 188133, "epoch": 1554} {"train_loss": -38.04969024658203, "global_step": 188134, "epoch": 1554} {"train_loss": -39.53626251220703, "global_step": 188135, "epoch": 1554} {"train_loss": -39.079551696777344, "global_step": 188136, "epoch": 1554} {"train_loss": -39.78646469116211, "global_step": 188137, "epoch": 1554} {"train_loss": -39.17874526977539, "global_step": 188138, "epoch": 1554} {"train_loss": -40.54866409301758, "global_step": 188139, "epoch": 1554} {"train_loss": -39.79469680786133, "global_step": 188140, "epoch": 1554} {"train_loss": -40.18339538574219, "global_step": 188141, "epoch": 1554} {"train_loss": -39.1405029296875, "global_step": 188142, "epoch": 1554} {"train_loss": -39.09762954711914, "global_step": 188143, "epoch": 1554} {"train_loss": -39.84436798095703, "global_step": 188144, "epoch": 1554} {"train_loss": -39.581539154052734, "global_step": 188145, "epoch": 1554} {"train_loss": -37.104095458984375, "global_step": 188146, "epoch": 1554} {"train_loss": -36.42753601074219, "global_step": 188147, "epoch": 1554} {"train_loss": -38.37241744995117, "global_step": 188148, "epoch": 1554} {"train_loss": -39.405921936035156, "global_step": 188149, "epoch": 1554} {"train_loss": -38.281803131103516, "global_step": 188150, "epoch": 1554} {"train_loss": -38.9397087097168, "global_step": 188151, "epoch": 1554} {"train_loss": -39.45566940307617, "global_step": 188152, "epoch": 1554} {"train_loss": -37.48101806640625, "global_step": 188153, "epoch": 1554} {"train_loss": -39.766047564419836, "global_step": 188154, "epoch": 1554, "val_loss": 2605687.75} {"train_loss": -38.8132438659668, "global_step": 188155, "epoch": 1555} {"train_loss": -39.713706970214844, "global_step": 188156, "epoch": 1555} {"train_loss": -39.30898666381836, "global_step": 188157, "epoch": 1555} {"train_loss": -38.917396545410156, "global_step": 188158, "epoch": 1555} {"train_loss": -39.931304931640625, "global_step": 188159, "epoch": 1555} {"train_loss": -40.35032272338867, "global_step": 188160, "epoch": 1555} {"train_loss": -38.74503707885742, "global_step": 188161, "epoch": 1555} {"train_loss": -40.706199645996094, "global_step": 188162, "epoch": 1555} {"train_loss": -39.69203567504883, "global_step": 188163, "epoch": 1555} {"train_loss": -39.83609390258789, "global_step": 188164, "epoch": 1555} {"train_loss": -40.970619201660156, "global_step": 188165, "epoch": 1555} {"train_loss": -39.81342697143555, "global_step": 188166, "epoch": 1555} {"train_loss": -40.550838470458984, "global_step": 188167, "epoch": 1555} {"train_loss": -40.34849166870117, "global_step": 188168, "epoch": 1555} {"train_loss": -40.754798889160156, "global_step": 188169, "epoch": 1555} {"train_loss": -40.32862854003906, "global_step": 188170, "epoch": 1555} {"train_loss": -41.02495193481445, "global_step": 188171, "epoch": 1555} {"train_loss": -40.92593765258789, "global_step": 188172, "epoch": 1555} {"train_loss": -40.54746627807617, "global_step": 188173, "epoch": 1555} {"train_loss": -41.297847747802734, "global_step": 188174, "epoch": 1555} {"train_loss": -40.88716125488281, "global_step": 188175, "epoch": 1555} {"train_loss": -41.26727294921875, "global_step": 188176, "epoch": 1555} {"train_loss": -40.93585205078125, "global_step": 188177, "epoch": 1555} {"train_loss": -41.071922302246094, "global_step": 188178, "epoch": 1555} {"train_loss": -40.95818328857422, "global_step": 188179, "epoch": 1555} {"train_loss": -41.2029914855957, "global_step": 188180, "epoch": 1555} {"train_loss": -41.4310188293457, "global_step": 188181, "epoch": 1555} {"train_loss": -41.3377799987793, "global_step": 188182, "epoch": 1555} {"train_loss": -41.203529357910156, "global_step": 188183, "epoch": 1555} {"train_loss": -41.88356399536133, "global_step": 188184, "epoch": 1555} {"train_loss": -41.736610412597656, "global_step": 188185, "epoch": 1555} {"train_loss": -41.67011642456055, "global_step": 188186, "epoch": 1555} {"train_loss": -41.94378662109375, "global_step": 188187, "epoch": 1555} {"train_loss": -41.432918548583984, "global_step": 188188, "epoch": 1555} {"train_loss": -41.9728889465332, "global_step": 188189, "epoch": 1555} {"train_loss": -41.86090850830078, "global_step": 188190, "epoch": 1555} {"train_loss": -41.76093673706055, "global_step": 188191, "epoch": 1555} {"train_loss": -42.13582992553711, "global_step": 188192, "epoch": 1555} {"train_loss": -41.617801666259766, "global_step": 188193, "epoch": 1555} {"train_loss": -42.1369514465332, "global_step": 188194, "epoch": 1555} {"train_loss": -41.886566162109375, "global_step": 188195, "epoch": 1555} {"train_loss": -41.930355072021484, "global_step": 188196, "epoch": 1555} {"train_loss": -42.22753143310547, "global_step": 188197, "epoch": 1555} {"train_loss": -42.22222137451172, "global_step": 188198, "epoch": 1555} {"train_loss": -42.27744674682617, "global_step": 188199, "epoch": 1555} {"train_loss": -42.32582092285156, "global_step": 188200, "epoch": 1555} {"train_loss": -42.80720138549805, "global_step": 188201, "epoch": 1555} {"train_loss": -42.28369903564453, "global_step": 188202, "epoch": 1555} {"train_loss": -42.567726135253906, "global_step": 188203, "epoch": 1555} {"train_loss": -42.37470245361328, "global_step": 188204, "epoch": 1555} {"train_loss": -42.257564544677734, "global_step": 188205, "epoch": 1555} {"train_loss": -42.13874053955078, "global_step": 188206, "epoch": 1555} {"train_loss": -41.866947174072266, "global_step": 188207, "epoch": 1555} {"train_loss": -42.08002471923828, "global_step": 188208, "epoch": 1555} {"train_loss": -42.740962982177734, "global_step": 188209, "epoch": 1555} {"train_loss": -42.2553596496582, "global_step": 188210, "epoch": 1555} {"train_loss": -42.194515228271484, "global_step": 188211, "epoch": 1555} {"train_loss": -41.81288146972656, "global_step": 188212, "epoch": 1555} {"train_loss": -41.10539627075195, "global_step": 188213, "epoch": 1555} {"train_loss": -41.2098503112793, "global_step": 188214, "epoch": 1555} {"train_loss": -42.40530014038086, "global_step": 188215, "epoch": 1555} {"train_loss": -41.980037689208984, "global_step": 188216, "epoch": 1555} {"train_loss": -41.359901428222656, "global_step": 188217, "epoch": 1555} {"train_loss": -41.83183670043945, "global_step": 188218, "epoch": 1555} {"train_loss": -42.05373001098633, "global_step": 188219, "epoch": 1555} {"train_loss": -41.094276428222656, "global_step": 188220, "epoch": 1555} {"train_loss": -40.25840377807617, "global_step": 188221, "epoch": 1555} {"train_loss": -40.093265533447266, "global_step": 188222, "epoch": 1555} {"train_loss": -39.434391021728516, "global_step": 188223, "epoch": 1555} {"train_loss": -37.353572845458984, "global_step": 188224, "epoch": 1555} {"train_loss": -28.272790908813477, "global_step": 188225, "epoch": 1555} {"train_loss": -13.366559028625488, "global_step": 188226, "epoch": 1555} {"train_loss": -19.96516227722168, "global_step": 188227, "epoch": 1555} {"train_loss": -34.17707061767578, "global_step": 188228, "epoch": 1555} {"train_loss": -33.58240509033203, "global_step": 188229, "epoch": 1555} {"train_loss": -31.036853790283203, "global_step": 188230, "epoch": 1555} {"train_loss": -34.919864654541016, "global_step": 188231, "epoch": 1555} {"train_loss": -34.48988723754883, "global_step": 188232, "epoch": 1555} {"train_loss": -38.743316650390625, "global_step": 188233, "epoch": 1555} {"train_loss": -33.38594436645508, "global_step": 188234, "epoch": 1555} {"train_loss": -39.58238220214844, "global_step": 188235, "epoch": 1555} {"train_loss": -35.998897552490234, "global_step": 188236, "epoch": 1555} {"train_loss": -39.1733512878418, "global_step": 188237, "epoch": 1555} {"train_loss": -37.74135208129883, "global_step": 188238, "epoch": 1555} {"train_loss": -39.19892501831055, "global_step": 188239, "epoch": 1555} {"train_loss": -38.4627799987793, "global_step": 188240, "epoch": 1555} {"train_loss": -39.217464447021484, "global_step": 188241, "epoch": 1555} {"train_loss": -38.15313720703125, "global_step": 188242, "epoch": 1555} {"train_loss": -39.72465515136719, "global_step": 188243, "epoch": 1555} {"train_loss": -38.92998504638672, "global_step": 188244, "epoch": 1555} {"train_loss": -40.02153396606445, "global_step": 188245, "epoch": 1555} {"train_loss": -39.41030502319336, "global_step": 188246, "epoch": 1555} {"train_loss": -40.1747932434082, "global_step": 188247, "epoch": 1555} {"train_loss": -40.37031936645508, "global_step": 188248, "epoch": 1555} {"train_loss": -40.34061813354492, "global_step": 188249, "epoch": 1555} {"train_loss": -40.5645866394043, "global_step": 188250, "epoch": 1555} {"train_loss": -40.60858917236328, "global_step": 188251, "epoch": 1555} {"train_loss": -40.713558197021484, "global_step": 188252, "epoch": 1555} {"train_loss": -40.74341583251953, "global_step": 188253, "epoch": 1555} {"train_loss": -40.52040481567383, "global_step": 188254, "epoch": 1555} {"train_loss": -40.45417404174805, "global_step": 188255, "epoch": 1555} {"train_loss": -40.5070915222168, "global_step": 188256, "epoch": 1555} {"train_loss": -41.05674362182617, "global_step": 188257, "epoch": 1555} {"train_loss": -41.00511932373047, "global_step": 188258, "epoch": 1555} {"train_loss": -41.07149124145508, "global_step": 188259, "epoch": 1555} {"train_loss": -41.163875579833984, "global_step": 188260, "epoch": 1555} {"train_loss": -41.25190353393555, "global_step": 188261, "epoch": 1555} {"train_loss": -40.8788948059082, "global_step": 188262, "epoch": 1555} {"train_loss": -41.15505599975586, "global_step": 188263, "epoch": 1555} {"train_loss": -41.18186569213867, "global_step": 188264, "epoch": 1555} {"train_loss": -41.26029586791992, "global_step": 188265, "epoch": 1555} {"train_loss": -41.29502487182617, "global_step": 188266, "epoch": 1555} {"train_loss": -41.70001220703125, "global_step": 188267, "epoch": 1555} {"train_loss": -41.34294509887695, "global_step": 188268, "epoch": 1555} {"train_loss": -41.717830657958984, "global_step": 188269, "epoch": 1555} {"train_loss": -41.449459075927734, "global_step": 188270, "epoch": 1555} {"train_loss": -41.63495635986328, "global_step": 188271, "epoch": 1555} {"train_loss": -41.663021087646484, "global_step": 188272, "epoch": 1555} {"train_loss": -41.58339309692383, "global_step": 188273, "epoch": 1555} {"train_loss": -41.571189880371094, "global_step": 188274, "epoch": 1555} {"train_loss": -40.014710930753346, "global_step": 188275, "epoch": 1555, "val_loss": 2547394.25} {"train_loss": -41.69883346557617, "global_step": 188276, "epoch": 1556} {"train_loss": -41.94186019897461, "global_step": 188277, "epoch": 1556} {"train_loss": -41.67769241333008, "global_step": 188278, "epoch": 1556} {"train_loss": -41.72335433959961, "global_step": 188279, "epoch": 1556} {"train_loss": -41.695579528808594, "global_step": 188280, "epoch": 1556} {"train_loss": -41.93524932861328, "global_step": 188281, "epoch": 1556} {"train_loss": -42.10908508300781, "global_step": 188282, "epoch": 1556} {"train_loss": -42.088932037353516, "global_step": 188283, "epoch": 1556} {"train_loss": -41.6939582824707, "global_step": 188284, "epoch": 1556} {"train_loss": -41.572322845458984, "global_step": 188285, "epoch": 1556} {"train_loss": -42.28695297241211, "global_step": 188286, "epoch": 1556} {"train_loss": -42.04575729370117, "global_step": 188287, "epoch": 1556} {"train_loss": -41.24744415283203, "global_step": 188288, "epoch": 1556} {"train_loss": -42.067771911621094, "global_step": 188289, "epoch": 1556} {"train_loss": -42.154937744140625, "global_step": 188290, "epoch": 1556} {"train_loss": -42.265743255615234, "global_step": 188291, "epoch": 1556} {"train_loss": -41.95038986206055, "global_step": 188292, "epoch": 1556} {"train_loss": -42.088157653808594, "global_step": 188293, "epoch": 1556} {"train_loss": -41.92294692993164, "global_step": 188294, "epoch": 1556} {"train_loss": -41.85105895996094, "global_step": 188295, "epoch": 1556} {"train_loss": -41.9581298828125, "global_step": 188296, "epoch": 1556} {"train_loss": -41.600948333740234, "global_step": 188297, "epoch": 1556} {"train_loss": -41.90113067626953, "global_step": 188298, "epoch": 1556} {"train_loss": -42.205711364746094, "global_step": 188299, "epoch": 1556} {"train_loss": -42.26387405395508, "global_step": 188300, "epoch": 1556} {"train_loss": -42.046138763427734, "global_step": 188301, "epoch": 1556} {"train_loss": -42.2942008972168, "global_step": 188302, "epoch": 1556} {"train_loss": -41.862281799316406, "global_step": 188303, "epoch": 1556} {"train_loss": -41.676841735839844, "global_step": 188304, "epoch": 1556} {"train_loss": -42.249813079833984, "global_step": 188305, "epoch": 1556} {"train_loss": -41.92113494873047, "global_step": 188306, "epoch": 1556} {"train_loss": -42.404354095458984, "global_step": 188307, "epoch": 1556} {"train_loss": -42.26306915283203, "global_step": 188308, "epoch": 1556} {"train_loss": -42.02983856201172, "global_step": 188309, "epoch": 1556} {"train_loss": -42.374691009521484, "global_step": 188310, "epoch": 1556} {"train_loss": -42.83610153198242, "global_step": 188311, "epoch": 1556} {"train_loss": -42.17152404785156, "global_step": 188312, "epoch": 1556} {"train_loss": -42.52834701538086, "global_step": 188313, "epoch": 1556} {"train_loss": -42.391273498535156, "global_step": 188314, "epoch": 1556} {"train_loss": -42.5943717956543, "global_step": 188315, "epoch": 1556} {"train_loss": -42.1524658203125, "global_step": 188316, "epoch": 1556} {"train_loss": -42.84774398803711, "global_step": 188317, "epoch": 1556} {"train_loss": -42.474971771240234, "global_step": 188318, "epoch": 1556} {"train_loss": -41.8021125793457, "global_step": 188319, "epoch": 1556} {"train_loss": -42.430328369140625, "global_step": 188320, "epoch": 1556} {"train_loss": -42.32509994506836, "global_step": 188321, "epoch": 1556} {"train_loss": -41.930694580078125, "global_step": 188322, "epoch": 1556} {"train_loss": -42.44636154174805, "global_step": 188323, "epoch": 1556} {"train_loss": -42.4549446105957, "global_step": 188324, "epoch": 1556} {"train_loss": -42.39033889770508, "global_step": 188325, "epoch": 1556} {"train_loss": -41.548763275146484, "global_step": 188326, "epoch": 1556} {"train_loss": -41.8570671081543, "global_step": 188327, "epoch": 1556} {"train_loss": -42.399322509765625, "global_step": 188328, "epoch": 1556} {"train_loss": -41.83843994140625, "global_step": 188329, "epoch": 1556} {"train_loss": -41.56039047241211, "global_step": 188330, "epoch": 1556} {"train_loss": -41.419532775878906, "global_step": 188331, "epoch": 1556} {"train_loss": -40.81455612182617, "global_step": 188332, "epoch": 1556} {"train_loss": -41.51490020751953, "global_step": 188333, "epoch": 1556} {"train_loss": -41.74220657348633, "global_step": 188334, "epoch": 1556} {"train_loss": -40.93233871459961, "global_step": 188335, "epoch": 1556} {"train_loss": -39.8359260559082, "global_step": 188336, "epoch": 1556} {"train_loss": -40.58913040161133, "global_step": 188337, "epoch": 1556} {"train_loss": -38.9314079284668, "global_step": 188338, "epoch": 1556} {"train_loss": -40.68778610229492, "global_step": 188339, "epoch": 1556} {"train_loss": -39.944602966308594, "global_step": 188340, "epoch": 1556} {"train_loss": -36.184810638427734, "global_step": 188341, "epoch": 1556} {"train_loss": -37.148067474365234, "global_step": 188342, "epoch": 1556} {"train_loss": -39.38824462890625, "global_step": 188343, "epoch": 1556} {"train_loss": -36.082122802734375, "global_step": 188344, "epoch": 1556} {"train_loss": -35.17050552368164, "global_step": 188345, "epoch": 1556} {"train_loss": -39.696895599365234, "global_step": 188346, "epoch": 1556} {"train_loss": -36.985713958740234, "global_step": 188347, "epoch": 1556} {"train_loss": -39.708251953125, "global_step": 188348, "epoch": 1556} {"train_loss": -40.50411605834961, "global_step": 188349, "epoch": 1556} {"train_loss": -39.19929122924805, "global_step": 188350, "epoch": 1556} {"train_loss": -40.69496154785156, "global_step": 188351, "epoch": 1556} {"train_loss": -40.157508850097656, "global_step": 188352, "epoch": 1556} {"train_loss": -39.49006271362305, "global_step": 188353, "epoch": 1556} {"train_loss": -40.65641403198242, "global_step": 188354, "epoch": 1556} {"train_loss": -41.14811325073242, "global_step": 188355, "epoch": 1556} {"train_loss": -39.488224029541016, "global_step": 188356, "epoch": 1556} {"train_loss": -41.20786666870117, "global_step": 188357, "epoch": 1556} {"train_loss": -40.55634307861328, "global_step": 188358, "epoch": 1556} {"train_loss": -39.840824127197266, "global_step": 188359, "epoch": 1556} {"train_loss": -40.0766716003418, "global_step": 188360, "epoch": 1556} {"train_loss": -40.52279281616211, "global_step": 188361, "epoch": 1556} {"train_loss": -39.44416427612305, "global_step": 188362, "epoch": 1556} {"train_loss": -39.956058502197266, "global_step": 188363, "epoch": 1556} {"train_loss": -40.997406005859375, "global_step": 188364, "epoch": 1556} {"train_loss": -39.428077697753906, "global_step": 188365, "epoch": 1556} {"train_loss": -40.78520584106445, "global_step": 188366, "epoch": 1556} {"train_loss": -40.58325958251953, "global_step": 188367, "epoch": 1556} {"train_loss": -40.39102554321289, "global_step": 188368, "epoch": 1556} {"train_loss": -41.318416595458984, "global_step": 188369, "epoch": 1556} {"train_loss": -41.469573974609375, "global_step": 188370, "epoch": 1556} {"train_loss": -40.090614318847656, "global_step": 188371, "epoch": 1556} {"train_loss": -41.098751068115234, "global_step": 188372, "epoch": 1556} {"train_loss": -41.78070068359375, "global_step": 188373, "epoch": 1556} {"train_loss": -40.945255279541016, "global_step": 188374, "epoch": 1556} {"train_loss": -41.56840133666992, "global_step": 188375, "epoch": 1556} {"train_loss": -41.70742416381836, "global_step": 188376, "epoch": 1556} {"train_loss": -41.389495849609375, "global_step": 188377, "epoch": 1556} {"train_loss": -41.46388626098633, "global_step": 188378, "epoch": 1556} {"train_loss": -40.67737579345703, "global_step": 188379, "epoch": 1556} {"train_loss": -41.713722229003906, "global_step": 188380, "epoch": 1556} {"train_loss": -41.877899169921875, "global_step": 188381, "epoch": 1556} {"train_loss": -41.504425048828125, "global_step": 188382, "epoch": 1556} {"train_loss": -41.6660041809082, "global_step": 188383, "epoch": 1556} {"train_loss": -42.164310455322266, "global_step": 188384, "epoch": 1556} {"train_loss": -40.985755920410156, "global_step": 188385, "epoch": 1556} {"train_loss": -41.238555908203125, "global_step": 188386, "epoch": 1556} {"train_loss": -42.29721450805664, "global_step": 188387, "epoch": 1556} {"train_loss": -41.64567184448242, "global_step": 188388, "epoch": 1556} {"train_loss": -41.54642868041992, "global_step": 188389, "epoch": 1556} {"train_loss": -42.03606033325195, "global_step": 188390, "epoch": 1556} {"train_loss": -41.82307815551758, "global_step": 188391, "epoch": 1556} {"train_loss": -41.98182678222656, "global_step": 188392, "epoch": 1556} {"train_loss": -42.020137786865234, "global_step": 188393, "epoch": 1556} {"train_loss": -41.96883010864258, "global_step": 188394, "epoch": 1556} {"train_loss": -41.7963981628418, "global_step": 188395, "epoch": 1556} {"train_loss": -41.23682264848189, "global_step": 188396, "epoch": 1556, "val_loss": 2629486.0} {"train_loss": -42.50387954711914, "global_step": 188397, "epoch": 1557} {"train_loss": -42.43232727050781, "global_step": 188398, "epoch": 1557} {"train_loss": -42.45806884765625, "global_step": 188399, "epoch": 1557} {"train_loss": -42.6767692565918, "global_step": 188400, "epoch": 1557} {"train_loss": -42.40297317504883, "global_step": 188401, "epoch": 1557} {"train_loss": -42.52894973754883, "global_step": 188402, "epoch": 1557} {"train_loss": -42.49966049194336, "global_step": 188403, "epoch": 1557} {"train_loss": -42.19785690307617, "global_step": 188404, "epoch": 1557} {"train_loss": -42.39751434326172, "global_step": 188405, "epoch": 1557} {"train_loss": -42.43745040893555, "global_step": 188406, "epoch": 1557} {"train_loss": -42.69196701049805, "global_step": 188407, "epoch": 1557} {"train_loss": -41.62813949584961, "global_step": 188408, "epoch": 1557} {"train_loss": -42.17885971069336, "global_step": 188409, "epoch": 1557} {"train_loss": -42.587005615234375, "global_step": 188410, "epoch": 1557} {"train_loss": -42.15656661987305, "global_step": 188411, "epoch": 1557} {"train_loss": -41.51212692260742, "global_step": 188412, "epoch": 1557} {"train_loss": -41.76764678955078, "global_step": 188413, "epoch": 1557} {"train_loss": -42.338809967041016, "global_step": 188414, "epoch": 1557} {"train_loss": -42.38186264038086, "global_step": 188415, "epoch": 1557} {"train_loss": -42.7286376953125, "global_step": 188416, "epoch": 1557} {"train_loss": -42.47393798828125, "global_step": 188417, "epoch": 1557} {"train_loss": -42.62510299682617, "global_step": 188418, "epoch": 1557} {"train_loss": -42.55495071411133, "global_step": 188419, "epoch": 1557} {"train_loss": -42.92696762084961, "global_step": 188420, "epoch": 1557} {"train_loss": -42.66263961791992, "global_step": 188421, "epoch": 1557} {"train_loss": -42.41869354248047, "global_step": 188422, "epoch": 1557} {"train_loss": -41.92524337768555, "global_step": 188423, "epoch": 1557} {"train_loss": -42.172218322753906, "global_step": 188424, "epoch": 1557} {"train_loss": -41.97650146484375, "global_step": 188425, "epoch": 1557} {"train_loss": -41.50556182861328, "global_step": 188426, "epoch": 1557} {"train_loss": -41.660118103027344, "global_step": 188427, "epoch": 1557} {"train_loss": -42.3446159362793, "global_step": 188428, "epoch": 1557} {"train_loss": -41.802913665771484, "global_step": 188429, "epoch": 1557} {"train_loss": -40.4417610168457, "global_step": 188430, "epoch": 1557} {"train_loss": -40.069454193115234, "global_step": 188431, "epoch": 1557} {"train_loss": -38.91889953613281, "global_step": 188432, "epoch": 1557} {"train_loss": -35.41690444946289, "global_step": 188433, "epoch": 1557} {"train_loss": -31.930103302001953, "global_step": 188434, "epoch": 1557} {"train_loss": -36.38237380981445, "global_step": 188435, "epoch": 1557} {"train_loss": -41.29515838623047, "global_step": 188436, "epoch": 1557} {"train_loss": -39.124114990234375, "global_step": 188437, "epoch": 1557} {"train_loss": -33.844329833984375, "global_step": 188438, "epoch": 1557} {"train_loss": -36.92621994018555, "global_step": 188439, "epoch": 1557} {"train_loss": -40.53998565673828, "global_step": 188440, "epoch": 1557} {"train_loss": -36.812538146972656, "global_step": 188441, "epoch": 1557} {"train_loss": -39.88507080078125, "global_step": 188442, "epoch": 1557} {"train_loss": -38.71276092529297, "global_step": 188443, "epoch": 1557} {"train_loss": -39.97639083862305, "global_step": 188444, "epoch": 1557} {"train_loss": -40.71883773803711, "global_step": 188445, "epoch": 1557} {"train_loss": -41.53300476074219, "global_step": 188446, "epoch": 1557} {"train_loss": -40.587371826171875, "global_step": 188447, "epoch": 1557} {"train_loss": -40.96358871459961, "global_step": 188448, "epoch": 1557} {"train_loss": -39.865020751953125, "global_step": 188449, "epoch": 1557} {"train_loss": -41.45466995239258, "global_step": 188450, "epoch": 1557} {"train_loss": -41.39645004272461, "global_step": 188451, "epoch": 1557} {"train_loss": -42.07237243652344, "global_step": 188452, "epoch": 1557} {"train_loss": -40.87253952026367, "global_step": 188453, "epoch": 1557} {"train_loss": -41.070125579833984, "global_step": 188454, "epoch": 1557} {"train_loss": -41.45691680908203, "global_step": 188455, "epoch": 1557} {"train_loss": -41.91411209106445, "global_step": 188456, "epoch": 1557} {"train_loss": -41.869407653808594, "global_step": 188457, "epoch": 1557} {"train_loss": -42.126426696777344, "global_step": 188458, "epoch": 1557} {"train_loss": -41.59971237182617, "global_step": 188459, "epoch": 1557} {"train_loss": -41.897254943847656, "global_step": 188460, "epoch": 1557} {"train_loss": -41.59114456176758, "global_step": 188461, "epoch": 1557} {"train_loss": -41.96708297729492, "global_step": 188462, "epoch": 1557} {"train_loss": -41.716522216796875, "global_step": 188463, "epoch": 1557} {"train_loss": -41.794795989990234, "global_step": 188464, "epoch": 1557} {"train_loss": -41.93999481201172, "global_step": 188465, "epoch": 1557} {"train_loss": -42.17746353149414, "global_step": 188466, "epoch": 1557} {"train_loss": -41.85192108154297, "global_step": 188467, "epoch": 1557} {"train_loss": -41.944026947021484, "global_step": 188468, "epoch": 1557} {"train_loss": -42.31996536254883, "global_step": 188469, "epoch": 1557} {"train_loss": -42.52523422241211, "global_step": 188470, "epoch": 1557} {"train_loss": -42.06000900268555, "global_step": 188471, "epoch": 1557} {"train_loss": -42.050682067871094, "global_step": 188472, "epoch": 1557} {"train_loss": -42.61903762817383, "global_step": 188473, "epoch": 1557} {"train_loss": -42.21743392944336, "global_step": 188474, "epoch": 1557} {"train_loss": -42.37405014038086, "global_step": 188475, "epoch": 1557} {"train_loss": -42.55683898925781, "global_step": 188476, "epoch": 1557} {"train_loss": -42.17665100097656, "global_step": 188477, "epoch": 1557} {"train_loss": -41.968841552734375, "global_step": 188478, "epoch": 1557} {"train_loss": -42.282470703125, "global_step": 188479, "epoch": 1557} {"train_loss": -41.63740539550781, "global_step": 188480, "epoch": 1557} {"train_loss": -41.66339111328125, "global_step": 188481, "epoch": 1557} {"train_loss": -42.080810546875, "global_step": 188482, "epoch": 1557} {"train_loss": -41.897010803222656, "global_step": 188483, "epoch": 1557} {"train_loss": -42.47587203979492, "global_step": 188484, "epoch": 1557} {"train_loss": -42.5020637512207, "global_step": 188485, "epoch": 1557} {"train_loss": -42.047794342041016, "global_step": 188486, "epoch": 1557} {"train_loss": -42.80643844604492, "global_step": 188487, "epoch": 1557} {"train_loss": -42.01615524291992, "global_step": 188488, "epoch": 1557} {"train_loss": -41.713565826416016, "global_step": 188489, "epoch": 1557} {"train_loss": -42.621883392333984, "global_step": 188490, "epoch": 1557} {"train_loss": -42.51777267456055, "global_step": 188491, "epoch": 1557} {"train_loss": -42.10499954223633, "global_step": 188492, "epoch": 1557} {"train_loss": -41.4405517578125, "global_step": 188493, "epoch": 1557} {"train_loss": -41.55973434448242, "global_step": 188494, "epoch": 1557} {"train_loss": -42.155059814453125, "global_step": 188495, "epoch": 1557} {"train_loss": -40.93922424316406, "global_step": 188496, "epoch": 1557} {"train_loss": -40.98113250732422, "global_step": 188497, "epoch": 1557} {"train_loss": -42.118019104003906, "global_step": 188498, "epoch": 1557} {"train_loss": -42.35121536254883, "global_step": 188499, "epoch": 1557} {"train_loss": -41.41699981689453, "global_step": 188500, "epoch": 1557} {"train_loss": -41.95527267456055, "global_step": 188501, "epoch": 1557} {"train_loss": -42.12145233154297, "global_step": 188502, "epoch": 1557} {"train_loss": -42.40083694458008, "global_step": 188503, "epoch": 1557} {"train_loss": -42.0367546081543, "global_step": 188504, "epoch": 1557} {"train_loss": -41.96883010864258, "global_step": 188505, "epoch": 1557} {"train_loss": -41.195899963378906, "global_step": 188506, "epoch": 1557} {"train_loss": -39.85808181762695, "global_step": 188507, "epoch": 1557} {"train_loss": -39.410396575927734, "global_step": 188508, "epoch": 1557} {"train_loss": -40.316158294677734, "global_step": 188509, "epoch": 1557} {"train_loss": -40.95738983154297, "global_step": 188510, "epoch": 1557} {"train_loss": -41.619720458984375, "global_step": 188511, "epoch": 1557} {"train_loss": -41.78043746948242, "global_step": 188512, "epoch": 1557} {"train_loss": -39.83030319213867, "global_step": 188513, "epoch": 1557} {"train_loss": -38.734676361083984, "global_step": 188514, "epoch": 1557} {"train_loss": -38.845760345458984, "global_step": 188515, "epoch": 1557} {"train_loss": -40.58565902709961, "global_step": 188516, "epoch": 1557} {"train_loss": -41.35325184341305, "global_step": 188517, "epoch": 1557, "val_loss": 2610904.0} {"train_loss": -41.39496612548828, "global_step": 188518, "epoch": 1558} {"train_loss": -41.31498718261719, "global_step": 188519, "epoch": 1558} {"train_loss": -41.6199836730957, "global_step": 188520, "epoch": 1558} {"train_loss": -42.21833038330078, "global_step": 188521, "epoch": 1558} {"train_loss": -41.72274398803711, "global_step": 188522, "epoch": 1558} {"train_loss": -41.397369384765625, "global_step": 188523, "epoch": 1558} {"train_loss": -41.75527572631836, "global_step": 188524, "epoch": 1558} {"train_loss": -41.8598747253418, "global_step": 188525, "epoch": 1558} {"train_loss": -41.19557571411133, "global_step": 188526, "epoch": 1558} {"train_loss": -40.62819290161133, "global_step": 188527, "epoch": 1558} {"train_loss": -40.630157470703125, "global_step": 188528, "epoch": 1558} {"train_loss": -42.079620361328125, "global_step": 188529, "epoch": 1558} {"train_loss": -42.0555534362793, "global_step": 188530, "epoch": 1558} {"train_loss": -41.25199508666992, "global_step": 188531, "epoch": 1558} {"train_loss": -39.74843215942383, "global_step": 188532, "epoch": 1558} {"train_loss": -41.320404052734375, "global_step": 188533, "epoch": 1558} {"train_loss": -42.07392883300781, "global_step": 188534, "epoch": 1558} {"train_loss": -41.405574798583984, "global_step": 188535, "epoch": 1558} {"train_loss": -40.228721618652344, "global_step": 188536, "epoch": 1558} {"train_loss": -40.690879821777344, "global_step": 188537, "epoch": 1558} {"train_loss": -41.008113861083984, "global_step": 188538, "epoch": 1558} {"train_loss": -41.66361618041992, "global_step": 188539, "epoch": 1558} {"train_loss": -41.67908477783203, "global_step": 188540, "epoch": 1558} {"train_loss": -41.32430648803711, "global_step": 188541, "epoch": 1558} {"train_loss": -41.98232650756836, "global_step": 188542, "epoch": 1558} {"train_loss": -42.11416244506836, "global_step": 188543, "epoch": 1558} {"train_loss": -40.67921829223633, "global_step": 188544, "epoch": 1558} {"train_loss": -41.33195495605469, "global_step": 188545, "epoch": 1558} {"train_loss": -42.214271545410156, "global_step": 188546, "epoch": 1558} {"train_loss": -41.886783599853516, "global_step": 188547, "epoch": 1558} {"train_loss": -41.97152328491211, "global_step": 188548, "epoch": 1558} {"train_loss": -41.82763671875, "global_step": 188549, "epoch": 1558} {"train_loss": -42.40778350830078, "global_step": 188550, "epoch": 1558} {"train_loss": -42.335575103759766, "global_step": 188551, "epoch": 1558} {"train_loss": -41.868934631347656, "global_step": 188552, "epoch": 1558} {"train_loss": -42.794097900390625, "global_step": 188553, "epoch": 1558} {"train_loss": -42.71076583862305, "global_step": 188554, "epoch": 1558} {"train_loss": -42.76202392578125, "global_step": 188555, "epoch": 1558} {"train_loss": -42.786373138427734, "global_step": 188556, "epoch": 1558} {"train_loss": -42.63067626953125, "global_step": 188557, "epoch": 1558} {"train_loss": -42.493797302246094, "global_step": 188558, "epoch": 1558} {"train_loss": -42.62520217895508, "global_step": 188559, "epoch": 1558} {"train_loss": -41.616756439208984, "global_step": 188560, "epoch": 1558} {"train_loss": -42.67493438720703, "global_step": 188561, "epoch": 1558} {"train_loss": -42.22946548461914, "global_step": 188562, "epoch": 1558} {"train_loss": -42.0877685546875, "global_step": 188563, "epoch": 1558} {"train_loss": -42.32674789428711, "global_step": 188564, "epoch": 1558} {"train_loss": -42.79426956176758, "global_step": 188565, "epoch": 1558} {"train_loss": -42.35914611816406, "global_step": 188566, "epoch": 1558} {"train_loss": -42.20717239379883, "global_step": 188567, "epoch": 1558} {"train_loss": -42.23324203491211, "global_step": 188568, "epoch": 1558} {"train_loss": -42.79693603515625, "global_step": 188569, "epoch": 1558} {"train_loss": -42.3306770324707, "global_step": 188570, "epoch": 1558} {"train_loss": -41.782440185546875, "global_step": 188571, "epoch": 1558} {"train_loss": -41.76799392700195, "global_step": 188572, "epoch": 1558} {"train_loss": -42.36178207397461, "global_step": 188573, "epoch": 1558} {"train_loss": -41.34969711303711, "global_step": 188574, "epoch": 1558} {"train_loss": -41.67157745361328, "global_step": 188575, "epoch": 1558} {"train_loss": -42.16826629638672, "global_step": 188576, "epoch": 1558} {"train_loss": -41.49793243408203, "global_step": 188577, "epoch": 1558} {"train_loss": -40.76766586303711, "global_step": 188578, "epoch": 1558} {"train_loss": -42.26089096069336, "global_step": 188579, "epoch": 1558} {"train_loss": -42.16958236694336, "global_step": 188580, "epoch": 1558} {"train_loss": -42.441043853759766, "global_step": 188581, "epoch": 1558} {"train_loss": -41.05756759643555, "global_step": 188582, "epoch": 1558} {"train_loss": -41.71524429321289, "global_step": 188583, "epoch": 1558} {"train_loss": -42.216644287109375, "global_step": 188584, "epoch": 1558} {"train_loss": -42.3173942565918, "global_step": 188585, "epoch": 1558} {"train_loss": -41.64631271362305, "global_step": 188586, "epoch": 1558} {"train_loss": -41.76298904418945, "global_step": 188587, "epoch": 1558} {"train_loss": -41.2644157409668, "global_step": 188588, "epoch": 1558} {"train_loss": -41.89201354980469, "global_step": 188589, "epoch": 1558} {"train_loss": -41.82126235961914, "global_step": 188590, "epoch": 1558} {"train_loss": -41.423500061035156, "global_step": 188591, "epoch": 1558} {"train_loss": -38.68923568725586, "global_step": 188592, "epoch": 1558} {"train_loss": -40.528629302978516, "global_step": 188593, "epoch": 1558} {"train_loss": -41.70166015625, "global_step": 188594, "epoch": 1558} {"train_loss": -39.45737838745117, "global_step": 188595, "epoch": 1558} {"train_loss": -40.40185546875, "global_step": 188596, "epoch": 1558} {"train_loss": -40.79499435424805, "global_step": 188597, "epoch": 1558} {"train_loss": -39.13789749145508, "global_step": 188598, "epoch": 1558} {"train_loss": -39.444557189941406, "global_step": 188599, "epoch": 1558} {"train_loss": -41.19087219238281, "global_step": 188600, "epoch": 1558} {"train_loss": -41.4122314453125, "global_step": 188601, "epoch": 1558} {"train_loss": -40.59324645996094, "global_step": 188602, "epoch": 1558} {"train_loss": -39.4974250793457, "global_step": 188603, "epoch": 1558} {"train_loss": -40.8754997253418, "global_step": 188604, "epoch": 1558} {"train_loss": -41.11784362792969, "global_step": 188605, "epoch": 1558} {"train_loss": -39.74422836303711, "global_step": 188606, "epoch": 1558} {"train_loss": -41.18948745727539, "global_step": 188607, "epoch": 1558} {"train_loss": -39.734859466552734, "global_step": 188608, "epoch": 1558} {"train_loss": -38.94200134277344, "global_step": 188609, "epoch": 1558} {"train_loss": -41.06576156616211, "global_step": 188610, "epoch": 1558} {"train_loss": -40.61014938354492, "global_step": 188611, "epoch": 1558} {"train_loss": -39.437259674072266, "global_step": 188612, "epoch": 1558} {"train_loss": -36.27631378173828, "global_step": 188613, "epoch": 1558} {"train_loss": -39.18634796142578, "global_step": 188614, "epoch": 1558} {"train_loss": -40.12773513793945, "global_step": 188615, "epoch": 1558} {"train_loss": -38.30270004272461, "global_step": 188616, "epoch": 1558} {"train_loss": -39.05795669555664, "global_step": 188617, "epoch": 1558} {"train_loss": -41.32221221923828, "global_step": 188618, "epoch": 1558} {"train_loss": -39.703704833984375, "global_step": 188619, "epoch": 1558} {"train_loss": -40.215084075927734, "global_step": 188620, "epoch": 1558} {"train_loss": -40.311527252197266, "global_step": 188621, "epoch": 1558} {"train_loss": -40.193355560302734, "global_step": 188622, "epoch": 1558} {"train_loss": -39.59256362915039, "global_step": 188623, "epoch": 1558} {"train_loss": -41.414974212646484, "global_step": 188624, "epoch": 1558} {"train_loss": -41.06203842163086, "global_step": 188625, "epoch": 1558} {"train_loss": -40.30076217651367, "global_step": 188626, "epoch": 1558} {"train_loss": -40.522193908691406, "global_step": 188627, "epoch": 1558} {"train_loss": -41.39322280883789, "global_step": 188628, "epoch": 1558} {"train_loss": -41.312217712402344, "global_step": 188629, "epoch": 1558} {"train_loss": -41.17368698120117, "global_step": 188630, "epoch": 1558} {"train_loss": -40.829647064208984, "global_step": 188631, "epoch": 1558} {"train_loss": -41.46350860595703, "global_step": 188632, "epoch": 1558} {"train_loss": -39.93745040893555, "global_step": 188633, "epoch": 1558} {"train_loss": -41.29514694213867, "global_step": 188634, "epoch": 1558} {"train_loss": -41.215065002441406, "global_step": 188635, "epoch": 1558} {"train_loss": -41.5064582824707, "global_step": 188636, "epoch": 1558} {"train_loss": -41.608943939208984, "global_step": 188637, "epoch": 1558} {"train_loss": -41.24672755722172, "global_step": 188638, "epoch": 1558, "val_loss": 2549219.75} {"train_loss": -41.37038803100586, "global_step": 188639, "epoch": 1559} {"train_loss": -41.999324798583984, "global_step": 188640, "epoch": 1559} {"train_loss": -41.22471618652344, "global_step": 188641, "epoch": 1559} {"train_loss": -41.5563850402832, "global_step": 188642, "epoch": 1559} {"train_loss": -41.16636276245117, "global_step": 188643, "epoch": 1559} {"train_loss": -41.50077438354492, "global_step": 188644, "epoch": 1559} {"train_loss": -41.00606918334961, "global_step": 188645, "epoch": 1559} {"train_loss": -41.29093551635742, "global_step": 188646, "epoch": 1559} {"train_loss": -41.405845642089844, "global_step": 188647, "epoch": 1559} {"train_loss": -40.86907196044922, "global_step": 188648, "epoch": 1559} {"train_loss": -41.616493225097656, "global_step": 188649, "epoch": 1559} {"train_loss": -41.479915618896484, "global_step": 188650, "epoch": 1559} {"train_loss": -41.01199722290039, "global_step": 188651, "epoch": 1559} {"train_loss": -40.02059555053711, "global_step": 188652, "epoch": 1559} {"train_loss": -41.465145111083984, "global_step": 188653, "epoch": 1559} {"train_loss": -41.3380012512207, "global_step": 188654, "epoch": 1559} {"train_loss": -41.44417190551758, "global_step": 188655, "epoch": 1559} {"train_loss": -41.7067985534668, "global_step": 188656, "epoch": 1559} {"train_loss": -40.8844108581543, "global_step": 188657, "epoch": 1559} {"train_loss": -42.22327423095703, "global_step": 188658, "epoch": 1559} {"train_loss": -41.949981689453125, "global_step": 188659, "epoch": 1559} {"train_loss": -41.93153762817383, "global_step": 188660, "epoch": 1559} {"train_loss": -41.82658004760742, "global_step": 188661, "epoch": 1559} {"train_loss": -42.13507843017578, "global_step": 188662, "epoch": 1559} {"train_loss": -41.826171875, "global_step": 188663, "epoch": 1559} {"train_loss": -42.19715118408203, "global_step": 188664, "epoch": 1559} {"train_loss": -41.69309616088867, "global_step": 188665, "epoch": 1559} {"train_loss": -41.5973014831543, "global_step": 188666, "epoch": 1559} {"train_loss": -40.664306640625, "global_step": 188667, "epoch": 1559} {"train_loss": -41.86316680908203, "global_step": 188668, "epoch": 1559} {"train_loss": -40.20527267456055, "global_step": 188669, "epoch": 1559} {"train_loss": -42.15476608276367, "global_step": 188670, "epoch": 1559} {"train_loss": -40.68385696411133, "global_step": 188671, "epoch": 1559} {"train_loss": -38.7668342590332, "global_step": 188672, "epoch": 1559} {"train_loss": -37.355743408203125, "global_step": 188673, "epoch": 1559} {"train_loss": -39.7832145690918, "global_step": 188674, "epoch": 1559} {"train_loss": -40.3022346496582, "global_step": 188675, "epoch": 1559} {"train_loss": -36.10857009887695, "global_step": 188676, "epoch": 1559} {"train_loss": -39.79039764404297, "global_step": 188677, "epoch": 1559} {"train_loss": -38.905540466308594, "global_step": 188678, "epoch": 1559} {"train_loss": -36.138633728027344, "global_step": 188679, "epoch": 1559} {"train_loss": -39.15351867675781, "global_step": 188680, "epoch": 1559} {"train_loss": -37.07239532470703, "global_step": 188681, "epoch": 1559} {"train_loss": -36.11562728881836, "global_step": 188682, "epoch": 1559} {"train_loss": -39.20768356323242, "global_step": 188683, "epoch": 1559} {"train_loss": -38.054874420166016, "global_step": 188684, "epoch": 1559} {"train_loss": -39.75547409057617, "global_step": 188685, "epoch": 1559} {"train_loss": -39.5019645690918, "global_step": 188686, "epoch": 1559} {"train_loss": -39.9998664855957, "global_step": 188687, "epoch": 1559} {"train_loss": -38.196876525878906, "global_step": 188688, "epoch": 1559} {"train_loss": -36.82369613647461, "global_step": 188689, "epoch": 1559} {"train_loss": -36.86289596557617, "global_step": 188690, "epoch": 1559} {"train_loss": -39.07487106323242, "global_step": 188691, "epoch": 1559} {"train_loss": -35.467464447021484, "global_step": 188692, "epoch": 1559} {"train_loss": -41.010040283203125, "global_step": 188693, "epoch": 1559} {"train_loss": -37.1002082824707, "global_step": 188694, "epoch": 1559} {"train_loss": -40.12065124511719, "global_step": 188695, "epoch": 1559} {"train_loss": -38.80241012573242, "global_step": 188696, "epoch": 1559} {"train_loss": -41.098567962646484, "global_step": 188697, "epoch": 1559} {"train_loss": -39.072021484375, "global_step": 188698, "epoch": 1559} {"train_loss": -41.50544738769531, "global_step": 188699, "epoch": 1559} {"train_loss": -38.21126937866211, "global_step": 188700, "epoch": 1559} {"train_loss": -41.194732666015625, "global_step": 188701, "epoch": 1559} {"train_loss": -38.8802375793457, "global_step": 188702, "epoch": 1559} {"train_loss": -41.08137130737305, "global_step": 188703, "epoch": 1559} {"train_loss": -40.08309555053711, "global_step": 188704, "epoch": 1559} {"train_loss": -40.64104080200195, "global_step": 188705, "epoch": 1559} {"train_loss": -40.695526123046875, "global_step": 188706, "epoch": 1559} {"train_loss": -40.96268081665039, "global_step": 188707, "epoch": 1559} {"train_loss": -41.38779830932617, "global_step": 188708, "epoch": 1559} {"train_loss": -40.797698974609375, "global_step": 188709, "epoch": 1559} {"train_loss": -40.98603057861328, "global_step": 188710, "epoch": 1559} {"train_loss": -41.20914077758789, "global_step": 188711, "epoch": 1559} {"train_loss": -41.058467864990234, "global_step": 188712, "epoch": 1559} {"train_loss": -40.87331771850586, "global_step": 188713, "epoch": 1559} {"train_loss": -40.86775588989258, "global_step": 188714, "epoch": 1559} {"train_loss": -41.248008728027344, "global_step": 188715, "epoch": 1559} {"train_loss": -39.75278854370117, "global_step": 188716, "epoch": 1559} {"train_loss": -41.444244384765625, "global_step": 188717, "epoch": 1559} {"train_loss": -40.793209075927734, "global_step": 188718, "epoch": 1559} {"train_loss": -41.03614807128906, "global_step": 188719, "epoch": 1559} {"train_loss": -41.9950065612793, "global_step": 188720, "epoch": 1559} {"train_loss": -41.845088958740234, "global_step": 188721, "epoch": 1559} {"train_loss": -41.684059143066406, "global_step": 188722, "epoch": 1559} {"train_loss": -41.613914489746094, "global_step": 188723, "epoch": 1559} {"train_loss": -42.01728439331055, "global_step": 188724, "epoch": 1559} {"train_loss": -41.92845153808594, "global_step": 188725, "epoch": 1559} {"train_loss": -41.414737701416016, "global_step": 188726, "epoch": 1559} {"train_loss": -41.73672103881836, "global_step": 188727, "epoch": 1559} {"train_loss": -41.7854118347168, "global_step": 188728, "epoch": 1559} {"train_loss": -42.134002685546875, "global_step": 188729, "epoch": 1559} {"train_loss": -41.73054885864258, "global_step": 188730, "epoch": 1559} {"train_loss": -41.87284469604492, "global_step": 188731, "epoch": 1559} {"train_loss": -42.26723098754883, "global_step": 188732, "epoch": 1559} {"train_loss": -42.236305236816406, "global_step": 188733, "epoch": 1559} {"train_loss": -41.8740348815918, "global_step": 188734, "epoch": 1559} {"train_loss": -42.04634094238281, "global_step": 188735, "epoch": 1559} {"train_loss": -42.0873908996582, "global_step": 188736, "epoch": 1559} {"train_loss": -41.76869201660156, "global_step": 188737, "epoch": 1559} {"train_loss": -41.47867202758789, "global_step": 188738, "epoch": 1559} {"train_loss": -42.28021240234375, "global_step": 188739, "epoch": 1559} {"train_loss": -41.988685607910156, "global_step": 188740, "epoch": 1559} {"train_loss": -42.074501037597656, "global_step": 188741, "epoch": 1559} {"train_loss": -42.2851676940918, "global_step": 188742, "epoch": 1559} {"train_loss": -41.56137466430664, "global_step": 188743, "epoch": 1559} {"train_loss": -42.76426315307617, "global_step": 188744, "epoch": 1559} {"train_loss": -42.2314567565918, "global_step": 188745, "epoch": 1559} {"train_loss": -42.248802185058594, "global_step": 188746, "epoch": 1559} {"train_loss": -41.866024017333984, "global_step": 188747, "epoch": 1559} {"train_loss": -41.1197509765625, "global_step": 188748, "epoch": 1559} {"train_loss": -41.93368148803711, "global_step": 188749, "epoch": 1559} {"train_loss": -41.91876220703125, "global_step": 188750, "epoch": 1559} {"train_loss": -41.854339599609375, "global_step": 188751, "epoch": 1559} {"train_loss": -42.4187126159668, "global_step": 188752, "epoch": 1559} {"train_loss": -41.69831466674805, "global_step": 188753, "epoch": 1559} {"train_loss": -41.13239669799805, "global_step": 188754, "epoch": 1559} {"train_loss": -40.96625518798828, "global_step": 188755, "epoch": 1559} {"train_loss": -40.22449493408203, "global_step": 188756, "epoch": 1559} {"train_loss": -39.89680099487305, "global_step": 188757, "epoch": 1559} {"train_loss": -40.75508117675781, "global_step": 188758, "epoch": 1559} {"train_loss": -40.761221798983485, "global_step": 188759, "epoch": 1559, "val_loss": 2443700.25} {"train_loss": -41.96733093261719, "global_step": 188760, "epoch": 1560} {"train_loss": -41.90995788574219, "global_step": 188761, "epoch": 1560} {"train_loss": -42.224727630615234, "global_step": 188762, "epoch": 1560} {"train_loss": -42.39646530151367, "global_step": 188763, "epoch": 1560} {"train_loss": -42.467864990234375, "global_step": 188764, "epoch": 1560} {"train_loss": -41.416324615478516, "global_step": 188765, "epoch": 1560} {"train_loss": -39.80143737792969, "global_step": 188766, "epoch": 1560} {"train_loss": -41.53322982788086, "global_step": 188767, "epoch": 1560} {"train_loss": -41.52596664428711, "global_step": 188768, "epoch": 1560} {"train_loss": -41.43666458129883, "global_step": 188769, "epoch": 1560} {"train_loss": -41.791664123535156, "global_step": 188770, "epoch": 1560} {"train_loss": -41.2125358581543, "global_step": 188771, "epoch": 1560} {"train_loss": -39.890743255615234, "global_step": 188772, "epoch": 1560} {"train_loss": -40.844337463378906, "global_step": 188773, "epoch": 1560} {"train_loss": -41.62317657470703, "global_step": 188774, "epoch": 1560} {"train_loss": -40.76447677612305, "global_step": 188775, "epoch": 1560} {"train_loss": -41.42438507080078, "global_step": 188776, "epoch": 1560} {"train_loss": -42.24998474121094, "global_step": 188777, "epoch": 1560} {"train_loss": -41.97176742553711, "global_step": 188778, "epoch": 1560} {"train_loss": -40.588714599609375, "global_step": 188779, "epoch": 1560} {"train_loss": -40.81159591674805, "global_step": 188780, "epoch": 1560} {"train_loss": -41.7674446105957, "global_step": 188781, "epoch": 1560} {"train_loss": -41.26845169067383, "global_step": 188782, "epoch": 1560} {"train_loss": -40.511837005615234, "global_step": 188783, "epoch": 1560} {"train_loss": -40.78734588623047, "global_step": 188784, "epoch": 1560} {"train_loss": -41.37494659423828, "global_step": 188785, "epoch": 1560} {"train_loss": -41.25558090209961, "global_step": 188786, "epoch": 1560} {"train_loss": -39.563011169433594, "global_step": 188787, "epoch": 1560} {"train_loss": -39.79719924926758, "global_step": 188788, "epoch": 1560} {"train_loss": -41.204254150390625, "global_step": 188789, "epoch": 1560} {"train_loss": -41.03023910522461, "global_step": 188790, "epoch": 1560} {"train_loss": -41.18819808959961, "global_step": 188791, "epoch": 1560} {"train_loss": -41.74870681762695, "global_step": 188792, "epoch": 1560} {"train_loss": -40.477657318115234, "global_step": 188793, "epoch": 1560} {"train_loss": -40.76921081542969, "global_step": 188794, "epoch": 1560} {"train_loss": -41.46456527709961, "global_step": 188795, "epoch": 1560} {"train_loss": -41.335670471191406, "global_step": 188796, "epoch": 1560} {"train_loss": -41.11117172241211, "global_step": 188797, "epoch": 1560} {"train_loss": -41.74997329711914, "global_step": 188798, "epoch": 1560} {"train_loss": -40.8851203918457, "global_step": 188799, "epoch": 1560} {"train_loss": -41.30597686767578, "global_step": 188800, "epoch": 1560} {"train_loss": -40.98491287231445, "global_step": 188801, "epoch": 1560} {"train_loss": -41.17498016357422, "global_step": 188802, "epoch": 1560} {"train_loss": -40.6319465637207, "global_step": 188803, "epoch": 1560} {"train_loss": -41.816246032714844, "global_step": 188804, "epoch": 1560} {"train_loss": -41.4561653137207, "global_step": 188805, "epoch": 1560} {"train_loss": -40.76981735229492, "global_step": 188806, "epoch": 1560} {"train_loss": -41.69020462036133, "global_step": 188807, "epoch": 1560} {"train_loss": -40.418556213378906, "global_step": 188808, "epoch": 1560} {"train_loss": -40.98322677612305, "global_step": 188809, "epoch": 1560} {"train_loss": -40.87183380126953, "global_step": 188810, "epoch": 1560} {"train_loss": -40.643394470214844, "global_step": 188811, "epoch": 1560} {"train_loss": -41.06341552734375, "global_step": 188812, "epoch": 1560} {"train_loss": -40.36749267578125, "global_step": 188813, "epoch": 1560} {"train_loss": -40.40309524536133, "global_step": 188814, "epoch": 1560} {"train_loss": -41.50754928588867, "global_step": 188815, "epoch": 1560} {"train_loss": -39.0709342956543, "global_step": 188816, "epoch": 1560} {"train_loss": -41.20219039916992, "global_step": 188817, "epoch": 1560} {"train_loss": -40.25921630859375, "global_step": 188818, "epoch": 1560} {"train_loss": -40.7981071472168, "global_step": 188819, "epoch": 1560} {"train_loss": -39.34727478027344, "global_step": 188820, "epoch": 1560} {"train_loss": -40.54591751098633, "global_step": 188821, "epoch": 1560} {"train_loss": -39.85354232788086, "global_step": 188822, "epoch": 1560} {"train_loss": -40.770782470703125, "global_step": 188823, "epoch": 1560} {"train_loss": -40.628570556640625, "global_step": 188824, "epoch": 1560} {"train_loss": -40.388328552246094, "global_step": 188825, "epoch": 1560} {"train_loss": -41.69546890258789, "global_step": 188826, "epoch": 1560} {"train_loss": -40.4888801574707, "global_step": 188827, "epoch": 1560} {"train_loss": -41.629276275634766, "global_step": 188828, "epoch": 1560} {"train_loss": -40.91022872924805, "global_step": 188829, "epoch": 1560} {"train_loss": -40.83340072631836, "global_step": 188830, "epoch": 1560} {"train_loss": -39.78195571899414, "global_step": 188831, "epoch": 1560} {"train_loss": -41.139766693115234, "global_step": 188832, "epoch": 1560} {"train_loss": -38.7879524230957, "global_step": 188833, "epoch": 1560} {"train_loss": -40.049739837646484, "global_step": 188834, "epoch": 1560} {"train_loss": -41.35922622680664, "global_step": 188835, "epoch": 1560} {"train_loss": -40.761329650878906, "global_step": 188836, "epoch": 1560} {"train_loss": -40.787410736083984, "global_step": 188837, "epoch": 1560} {"train_loss": -40.984615325927734, "global_step": 188838, "epoch": 1560} {"train_loss": -41.795799255371094, "global_step": 188839, "epoch": 1560} {"train_loss": -39.824249267578125, "global_step": 188840, "epoch": 1560} {"train_loss": -39.88367462158203, "global_step": 188841, "epoch": 1560} {"train_loss": -39.17303466796875, "global_step": 188842, "epoch": 1560} {"train_loss": -38.64277648925781, "global_step": 188843, "epoch": 1560} {"train_loss": -38.16978073120117, "global_step": 188844, "epoch": 1560} {"train_loss": -37.796630859375, "global_step": 188845, "epoch": 1560} {"train_loss": -39.79035949707031, "global_step": 188846, "epoch": 1560} {"train_loss": -39.58315658569336, "global_step": 188847, "epoch": 1560} {"train_loss": -39.80843734741211, "global_step": 188848, "epoch": 1560} {"train_loss": -38.65910339355469, "global_step": 188849, "epoch": 1560} {"train_loss": -41.796112060546875, "global_step": 188850, "epoch": 1560} {"train_loss": -40.574256896972656, "global_step": 188851, "epoch": 1560} {"train_loss": -41.459842681884766, "global_step": 188852, "epoch": 1560} {"train_loss": -37.837890625, "global_step": 188853, "epoch": 1560} {"train_loss": -31.81336784362793, "global_step": 188854, "epoch": 1560} {"train_loss": -40.40350341796875, "global_step": 188855, "epoch": 1560} {"train_loss": -40.684322357177734, "global_step": 188856, "epoch": 1560} {"train_loss": -37.288265228271484, "global_step": 188857, "epoch": 1560} {"train_loss": -38.7204704284668, "global_step": 188858, "epoch": 1560} {"train_loss": -39.56255340576172, "global_step": 188859, "epoch": 1560} {"train_loss": -38.33572769165039, "global_step": 188860, "epoch": 1560} {"train_loss": -36.365962982177734, "global_step": 188861, "epoch": 1560} {"train_loss": -30.346410751342773, "global_step": 188862, "epoch": 1560} {"train_loss": -37.76633834838867, "global_step": 188863, "epoch": 1560} {"train_loss": -33.34804916381836, "global_step": 188864, "epoch": 1560} {"train_loss": -36.805511474609375, "global_step": 188865, "epoch": 1560} {"train_loss": -40.27119064331055, "global_step": 188866, "epoch": 1560} {"train_loss": -37.23639678955078, "global_step": 188867, "epoch": 1560} {"train_loss": -35.805702209472656, "global_step": 188868, "epoch": 1560} {"train_loss": -38.39161682128906, "global_step": 188869, "epoch": 1560} {"train_loss": -34.08208465576172, "global_step": 188870, "epoch": 1560} {"train_loss": -38.65932083129883, "global_step": 188871, "epoch": 1560} {"train_loss": -39.02679443359375, "global_step": 188872, "epoch": 1560} {"train_loss": -38.90822982788086, "global_step": 188873, "epoch": 1560} {"train_loss": -38.99612808227539, "global_step": 188874, "epoch": 1560} {"train_loss": -37.29014205932617, "global_step": 188875, "epoch": 1560} {"train_loss": -37.636775970458984, "global_step": 188876, "epoch": 1560} {"train_loss": -36.0085334777832, "global_step": 188877, "epoch": 1560} {"train_loss": -38.800777435302734, "global_step": 188878, "epoch": 1560} {"train_loss": -37.92721176147461, "global_step": 188879, "epoch": 1560} {"train_loss": -39.99552725169284, "global_step": 188880, "epoch": 1560, "val_loss": 3025173.75} {"train_loss": -36.776424407958984, "global_step": 188881, "epoch": 1561} {"train_loss": -32.78053283691406, "global_step": 188882, "epoch": 1561} {"train_loss": -36.1027946472168, "global_step": 188883, "epoch": 1561} {"train_loss": -36.427650451660156, "global_step": 188884, "epoch": 1561} {"train_loss": -38.79580307006836, "global_step": 188885, "epoch": 1561} {"train_loss": -37.53815460205078, "global_step": 188886, "epoch": 1561} {"train_loss": -39.734161376953125, "global_step": 188887, "epoch": 1561} {"train_loss": -39.142147064208984, "global_step": 188888, "epoch": 1561} {"train_loss": -38.868263244628906, "global_step": 188889, "epoch": 1561} {"train_loss": -38.93084716796875, "global_step": 188890, "epoch": 1561} {"train_loss": -38.958805084228516, "global_step": 188891, "epoch": 1561} {"train_loss": -39.3733024597168, "global_step": 188892, "epoch": 1561} {"train_loss": -36.623329162597656, "global_step": 188893, "epoch": 1561} {"train_loss": -36.876407623291016, "global_step": 188894, "epoch": 1561} {"train_loss": -39.41992950439453, "global_step": 188895, "epoch": 1561} {"train_loss": -38.7554931640625, "global_step": 188896, "epoch": 1561} {"train_loss": -40.41417694091797, "global_step": 188897, "epoch": 1561} {"train_loss": -39.52821731567383, "global_step": 188898, "epoch": 1561} {"train_loss": -39.8760986328125, "global_step": 188899, "epoch": 1561} {"train_loss": -40.6571044921875, "global_step": 188900, "epoch": 1561} {"train_loss": -39.41136932373047, "global_step": 188901, "epoch": 1561} {"train_loss": -37.7531623840332, "global_step": 188902, "epoch": 1561} {"train_loss": -39.73484802246094, "global_step": 188903, "epoch": 1561} {"train_loss": -39.837791442871094, "global_step": 188904, "epoch": 1561} {"train_loss": -39.86918640136719, "global_step": 188905, "epoch": 1561} {"train_loss": -39.03279495239258, "global_step": 188906, "epoch": 1561} {"train_loss": -39.59855270385742, "global_step": 188907, "epoch": 1561} {"train_loss": -38.78978729248047, "global_step": 188908, "epoch": 1561} {"train_loss": -39.61936950683594, "global_step": 188909, "epoch": 1561} {"train_loss": -39.690391540527344, "global_step": 188910, "epoch": 1561} {"train_loss": -39.83878707885742, "global_step": 188911, "epoch": 1561} {"train_loss": -39.50429153442383, "global_step": 188912, "epoch": 1561} {"train_loss": -38.700172424316406, "global_step": 188913, "epoch": 1561} {"train_loss": -40.09125900268555, "global_step": 188914, "epoch": 1561} {"train_loss": -39.3004264831543, "global_step": 188915, "epoch": 1561} {"train_loss": -40.51894760131836, "global_step": 188916, "epoch": 1561} {"train_loss": -39.38081741333008, "global_step": 188917, "epoch": 1561} {"train_loss": -40.72450637817383, "global_step": 188918, "epoch": 1561} {"train_loss": -39.47032165527344, "global_step": 188919, "epoch": 1561} {"train_loss": -40.68815612792969, "global_step": 188920, "epoch": 1561} {"train_loss": -40.64824295043945, "global_step": 188921, "epoch": 1561} {"train_loss": -40.34174346923828, "global_step": 188922, "epoch": 1561} {"train_loss": -40.88397979736328, "global_step": 188923, "epoch": 1561} {"train_loss": -40.85743713378906, "global_step": 188924, "epoch": 1561} {"train_loss": -39.960819244384766, "global_step": 188925, "epoch": 1561} {"train_loss": -40.65166091918945, "global_step": 188926, "epoch": 1561} {"train_loss": -38.62234878540039, "global_step": 188927, "epoch": 1561} {"train_loss": -40.337135314941406, "global_step": 188928, "epoch": 1561} {"train_loss": -40.29232406616211, "global_step": 188929, "epoch": 1561} {"train_loss": -40.425506591796875, "global_step": 188930, "epoch": 1561} {"train_loss": -40.89191818237305, "global_step": 188931, "epoch": 1561} {"train_loss": -40.94938278198242, "global_step": 188932, "epoch": 1561} {"train_loss": -41.04317092895508, "global_step": 188933, "epoch": 1561} {"train_loss": -40.53345489501953, "global_step": 188934, "epoch": 1561} {"train_loss": -41.03583908081055, "global_step": 188935, "epoch": 1561} {"train_loss": -41.07744598388672, "global_step": 188936, "epoch": 1561} {"train_loss": -40.839012145996094, "global_step": 188937, "epoch": 1561} {"train_loss": -40.50950241088867, "global_step": 188938, "epoch": 1561} {"train_loss": -41.385498046875, "global_step": 188939, "epoch": 1561} {"train_loss": -41.455650329589844, "global_step": 188940, "epoch": 1561} {"train_loss": -41.3322868347168, "global_step": 188941, "epoch": 1561} {"train_loss": -41.38566207885742, "global_step": 188942, "epoch": 1561} {"train_loss": -41.222835540771484, "global_step": 188943, "epoch": 1561} {"train_loss": -40.498653411865234, "global_step": 188944, "epoch": 1561} {"train_loss": -41.187652587890625, "global_step": 188945, "epoch": 1561} {"train_loss": -41.49851608276367, "global_step": 188946, "epoch": 1561} {"train_loss": -41.00362014770508, "global_step": 188947, "epoch": 1561} {"train_loss": -41.205345153808594, "global_step": 188948, "epoch": 1561} {"train_loss": -41.72041702270508, "global_step": 188949, "epoch": 1561} {"train_loss": -40.28937911987305, "global_step": 188950, "epoch": 1561} {"train_loss": -41.064266204833984, "global_step": 188951, "epoch": 1561} {"train_loss": -41.10835647583008, "global_step": 188952, "epoch": 1561} {"train_loss": -39.92422103881836, "global_step": 188953, "epoch": 1561} {"train_loss": -41.19544219970703, "global_step": 188954, "epoch": 1561} {"train_loss": -41.582847595214844, "global_step": 188955, "epoch": 1561} {"train_loss": -40.97137451171875, "global_step": 188956, "epoch": 1561} {"train_loss": -41.081172943115234, "global_step": 188957, "epoch": 1561} {"train_loss": -41.154296875, "global_step": 188958, "epoch": 1561} {"train_loss": -41.683448791503906, "global_step": 188959, "epoch": 1561} {"train_loss": -34.9392204284668, "global_step": 188960, "epoch": 1561} {"train_loss": -40.28923416137695, "global_step": 188961, "epoch": 1561} {"train_loss": -41.49911117553711, "global_step": 188962, "epoch": 1561} {"train_loss": -40.901241302490234, "global_step": 188963, "epoch": 1561} {"train_loss": -40.92128372192383, "global_step": 188964, "epoch": 1561} {"train_loss": -40.594017028808594, "global_step": 188965, "epoch": 1561} {"train_loss": -23.252363204956055, "global_step": 188966, "epoch": 1561} {"train_loss": -39.87275314331055, "global_step": 188967, "epoch": 1561} {"train_loss": -40.25074005126953, "global_step": 188968, "epoch": 1561} {"train_loss": -10.836493492126465, "global_step": 188969, "epoch": 1561} {"train_loss": -36.497108459472656, "global_step": 188970, "epoch": 1561} {"train_loss": -18.57114028930664, "global_step": 188971, "epoch": 1561} {"train_loss": -32.838600158691406, "global_step": 188972, "epoch": 1561} {"train_loss": -33.90420150756836, "global_step": 188973, "epoch": 1561} {"train_loss": -38.175594329833984, "global_step": 188974, "epoch": 1561} {"train_loss": -28.89487648010254, "global_step": 188975, "epoch": 1561} {"train_loss": -21.608003616333008, "global_step": 188976, "epoch": 1561} {"train_loss": -23.919546127319336, "global_step": 188977, "epoch": 1561} {"train_loss": -35.41379165649414, "global_step": 188978, "epoch": 1561} {"train_loss": -35.52751541137695, "global_step": 188979, "epoch": 1561} {"train_loss": -35.335384368896484, "global_step": 188980, "epoch": 1561} {"train_loss": -30.0064640045166, "global_step": 188981, "epoch": 1561} {"train_loss": -34.4512939453125, "global_step": 188982, "epoch": 1561} {"train_loss": -31.679370880126953, "global_step": 188983, "epoch": 1561} {"train_loss": -32.12000274658203, "global_step": 188984, "epoch": 1561} {"train_loss": -34.51383972167969, "global_step": 188985, "epoch": 1561} {"train_loss": -35.00385284423828, "global_step": 188986, "epoch": 1561} {"train_loss": -34.34455108642578, "global_step": 188987, "epoch": 1561} {"train_loss": -37.631195068359375, "global_step": 188988, "epoch": 1561} {"train_loss": -36.60895919799805, "global_step": 188989, "epoch": 1561} {"train_loss": -34.57080841064453, "global_step": 188990, "epoch": 1561} {"train_loss": -36.549095153808594, "global_step": 188991, "epoch": 1561} {"train_loss": -32.322242736816406, "global_step": 188992, "epoch": 1561} {"train_loss": -35.68825149536133, "global_step": 188993, "epoch": 1561} {"train_loss": -38.234554290771484, "global_step": 188994, "epoch": 1561} {"train_loss": -37.006526947021484, "global_step": 188995, "epoch": 1561} {"train_loss": -37.31498336791992, "global_step": 188996, "epoch": 1561} {"train_loss": -36.11188888549805, "global_step": 188997, "epoch": 1561} {"train_loss": -34.815704345703125, "global_step": 188998, "epoch": 1561} {"train_loss": -35.91537094116211, "global_step": 188999, "epoch": 1561} {"train_loss": -35.624263763427734, "global_step": 189000, "epoch": 1561} {"train_loss": -37.86053757628134, "global_step": 189001, "epoch": 1561, "val_loss": 2645111.75} {"train_loss": -37.383522033691406, "global_step": 189002, "epoch": 1562} {"train_loss": -37.94027328491211, "global_step": 189003, "epoch": 1562} {"train_loss": -37.879066467285156, "global_step": 189004, "epoch": 1562} {"train_loss": -38.66838455200195, "global_step": 189005, "epoch": 1562} {"train_loss": -37.44565200805664, "global_step": 189006, "epoch": 1562} {"train_loss": -37.69580841064453, "global_step": 189007, "epoch": 1562} {"train_loss": -38.341163635253906, "global_step": 189008, "epoch": 1562} {"train_loss": -36.96894836425781, "global_step": 189009, "epoch": 1562} {"train_loss": -38.38496017456055, "global_step": 189010, "epoch": 1562} {"train_loss": -37.30202102661133, "global_step": 189011, "epoch": 1562} {"train_loss": -37.472694396972656, "global_step": 189012, "epoch": 1562} {"train_loss": -36.50196075439453, "global_step": 189013, "epoch": 1562} {"train_loss": -37.13361358642578, "global_step": 189014, "epoch": 1562} {"train_loss": -37.51667022705078, "global_step": 189015, "epoch": 1562} {"train_loss": -38.02527618408203, "global_step": 189016, "epoch": 1562} {"train_loss": -39.44721221923828, "global_step": 189017, "epoch": 1562} {"train_loss": -34.60958480834961, "global_step": 189018, "epoch": 1562} {"train_loss": -38.3567008972168, "global_step": 189019, "epoch": 1562} {"train_loss": -38.53313064575195, "global_step": 189020, "epoch": 1562} {"train_loss": -36.9455451965332, "global_step": 189021, "epoch": 1562} {"train_loss": -38.43177032470703, "global_step": 189022, "epoch": 1562} {"train_loss": -39.03881072998047, "global_step": 189023, "epoch": 1562} {"train_loss": -37.15070343017578, "global_step": 189024, "epoch": 1562} {"train_loss": -38.295005798339844, "global_step": 189025, "epoch": 1562} {"train_loss": -38.95619583129883, "global_step": 189026, "epoch": 1562} {"train_loss": -39.1293830871582, "global_step": 189027, "epoch": 1562} {"train_loss": -38.559814453125, "global_step": 189028, "epoch": 1562} {"train_loss": -39.817108154296875, "global_step": 189029, "epoch": 1562} {"train_loss": -38.8913688659668, "global_step": 189030, "epoch": 1562} {"train_loss": -38.95782470703125, "global_step": 189031, "epoch": 1562} {"train_loss": -39.40864944458008, "global_step": 189032, "epoch": 1562} {"train_loss": -38.73616409301758, "global_step": 189033, "epoch": 1562} {"train_loss": -39.1330680847168, "global_step": 189034, "epoch": 1562} {"train_loss": -39.08582305908203, "global_step": 189035, "epoch": 1562} {"train_loss": -39.20130920410156, "global_step": 189036, "epoch": 1562} {"train_loss": -39.3956413269043, "global_step": 189037, "epoch": 1562} {"train_loss": -39.56372833251953, "global_step": 189038, "epoch": 1562} {"train_loss": -39.232032775878906, "global_step": 189039, "epoch": 1562} {"train_loss": -39.249908447265625, "global_step": 189040, "epoch": 1562} {"train_loss": -39.604854583740234, "global_step": 189041, "epoch": 1562} {"train_loss": -39.161373138427734, "global_step": 189042, "epoch": 1562} {"train_loss": -39.519527435302734, "global_step": 189043, "epoch": 1562} {"train_loss": -39.46149826049805, "global_step": 189044, "epoch": 1562} {"train_loss": -39.195011138916016, "global_step": 189045, "epoch": 1562} {"train_loss": -40.0212516784668, "global_step": 189046, "epoch": 1562} {"train_loss": -39.283912658691406, "global_step": 189047, "epoch": 1562} {"train_loss": -40.09141159057617, "global_step": 189048, "epoch": 1562} {"train_loss": -39.85300827026367, "global_step": 189049, "epoch": 1562} {"train_loss": -39.54359817504883, "global_step": 189050, "epoch": 1562} {"train_loss": -39.29015350341797, "global_step": 189051, "epoch": 1562} {"train_loss": -40.08279037475586, "global_step": 189052, "epoch": 1562} {"train_loss": -40.0152702331543, "global_step": 189053, "epoch": 1562} {"train_loss": -39.2149772644043, "global_step": 189054, "epoch": 1562} {"train_loss": -39.96138381958008, "global_step": 189055, "epoch": 1562} {"train_loss": -38.584815979003906, "global_step": 189056, "epoch": 1562} {"train_loss": -39.79859924316406, "global_step": 189057, "epoch": 1562} {"train_loss": -39.4392204284668, "global_step": 189058, "epoch": 1562} {"train_loss": -40.412837982177734, "global_step": 189059, "epoch": 1562} {"train_loss": -40.10622787475586, "global_step": 189060, "epoch": 1562} {"train_loss": -40.13322448730469, "global_step": 189061, "epoch": 1562} {"train_loss": -39.59364700317383, "global_step": 189062, "epoch": 1562} {"train_loss": -40.24711227416992, "global_step": 189063, "epoch": 1562} {"train_loss": -40.476131439208984, "global_step": 189064, "epoch": 1562} {"train_loss": -39.98615264892578, "global_step": 189065, "epoch": 1562} {"train_loss": -40.35660934448242, "global_step": 189066, "epoch": 1562} {"train_loss": -39.94768142700195, "global_step": 189067, "epoch": 1562} {"train_loss": -40.1279296875, "global_step": 189068, "epoch": 1562} {"train_loss": -40.840797424316406, "global_step": 189069, "epoch": 1562} {"train_loss": -40.53696060180664, "global_step": 189070, "epoch": 1562} {"train_loss": -40.596351623535156, "global_step": 189071, "epoch": 1562} {"train_loss": -40.80147933959961, "global_step": 189072, "epoch": 1562} {"train_loss": -40.6444206237793, "global_step": 189073, "epoch": 1562} {"train_loss": -40.789310455322266, "global_step": 189074, "epoch": 1562} {"train_loss": -40.1633186340332, "global_step": 189075, "epoch": 1562} {"train_loss": -40.39686584472656, "global_step": 189076, "epoch": 1562} {"train_loss": -40.776611328125, "global_step": 189077, "epoch": 1562} {"train_loss": -40.29601287841797, "global_step": 189078, "epoch": 1562} {"train_loss": -40.3511962890625, "global_step": 189079, "epoch": 1562} {"train_loss": -40.96659469604492, "global_step": 189080, "epoch": 1562} {"train_loss": -41.37744140625, "global_step": 189081, "epoch": 1562} {"train_loss": -40.81637191772461, "global_step": 189082, "epoch": 1562} {"train_loss": -40.68471145629883, "global_step": 189083, "epoch": 1562} {"train_loss": -40.88904571533203, "global_step": 189084, "epoch": 1562} {"train_loss": -41.184715270996094, "global_step": 189085, "epoch": 1562} {"train_loss": -41.015926361083984, "global_step": 189086, "epoch": 1562} {"train_loss": -40.96371078491211, "global_step": 189087, "epoch": 1562} {"train_loss": -41.19976806640625, "global_step": 189088, "epoch": 1562} {"train_loss": -40.9478874206543, "global_step": 189089, "epoch": 1562} {"train_loss": -41.32001876831055, "global_step": 189090, "epoch": 1562} {"train_loss": -41.047462463378906, "global_step": 189091, "epoch": 1562} {"train_loss": -41.00382614135742, "global_step": 189092, "epoch": 1562} {"train_loss": -40.963863372802734, "global_step": 189093, "epoch": 1562} {"train_loss": -41.195594787597656, "global_step": 189094, "epoch": 1562} {"train_loss": -40.95409393310547, "global_step": 189095, "epoch": 1562} {"train_loss": -41.35868453979492, "global_step": 189096, "epoch": 1562} {"train_loss": -41.19514846801758, "global_step": 189097, "epoch": 1562} {"train_loss": -41.265296936035156, "global_step": 189098, "epoch": 1562} {"train_loss": -40.567474365234375, "global_step": 189099, "epoch": 1562} {"train_loss": -41.01029586791992, "global_step": 189100, "epoch": 1562} {"train_loss": -40.720672607421875, "global_step": 189101, "epoch": 1562} {"train_loss": -41.14480209350586, "global_step": 189102, "epoch": 1562} {"train_loss": -41.676429748535156, "global_step": 189103, "epoch": 1562} {"train_loss": -41.519657135009766, "global_step": 189104, "epoch": 1562} {"train_loss": -41.63008117675781, "global_step": 189105, "epoch": 1562} {"train_loss": -40.48861312866211, "global_step": 189106, "epoch": 1562} {"train_loss": -40.6432991027832, "global_step": 189107, "epoch": 1562} {"train_loss": -41.47298812866211, "global_step": 189108, "epoch": 1562} {"train_loss": -41.28097152709961, "global_step": 189109, "epoch": 1562} {"train_loss": -41.34862518310547, "global_step": 189110, "epoch": 1562} {"train_loss": -41.61317825317383, "global_step": 189111, "epoch": 1562} {"train_loss": -41.79388427734375, "global_step": 189112, "epoch": 1562} {"train_loss": -42.08726119995117, "global_step": 189113, "epoch": 1562} {"train_loss": -41.5928840637207, "global_step": 189114, "epoch": 1562} {"train_loss": -41.653900146484375, "global_step": 189115, "epoch": 1562} {"train_loss": -41.51874542236328, "global_step": 189116, "epoch": 1562} {"train_loss": -41.914608001708984, "global_step": 189117, "epoch": 1562} {"train_loss": -41.169647216796875, "global_step": 189118, "epoch": 1562} {"train_loss": -41.5377311706543, "global_step": 189119, "epoch": 1562} {"train_loss": -41.47194290161133, "global_step": 189120, "epoch": 1562} {"train_loss": -41.563331604003906, "global_step": 189121, "epoch": 1562} {"train_loss": -39.88456795432351, "global_step": 189122, "epoch": 1562, "val_loss": 2480571.0} {"train_loss": -41.82415771484375, "global_step": 189123, "epoch": 1563} {"train_loss": -41.83749008178711, "global_step": 189124, "epoch": 1563} {"train_loss": -41.67876052856445, "global_step": 189125, "epoch": 1563} {"train_loss": -40.9892463684082, "global_step": 189126, "epoch": 1563} {"train_loss": -40.24287033081055, "global_step": 189127, "epoch": 1563} {"train_loss": -38.86271667480469, "global_step": 189128, "epoch": 1563} {"train_loss": -36.343292236328125, "global_step": 189129, "epoch": 1563} {"train_loss": -35.72152328491211, "global_step": 189130, "epoch": 1563} {"train_loss": -36.261390686035156, "global_step": 189131, "epoch": 1563} {"train_loss": -40.34383773803711, "global_step": 189132, "epoch": 1563} {"train_loss": -41.24652099609375, "global_step": 189133, "epoch": 1563} {"train_loss": -38.55110549926758, "global_step": 189134, "epoch": 1563} {"train_loss": -38.873046875, "global_step": 189135, "epoch": 1563} {"train_loss": -39.67851638793945, "global_step": 189136, "epoch": 1563} {"train_loss": -41.033241271972656, "global_step": 189137, "epoch": 1563} {"train_loss": -38.9791374206543, "global_step": 189138, "epoch": 1563} {"train_loss": -39.46319580078125, "global_step": 189139, "epoch": 1563} {"train_loss": -39.76748275756836, "global_step": 189140, "epoch": 1563} {"train_loss": -40.43706130981445, "global_step": 189141, "epoch": 1563} {"train_loss": -40.89066696166992, "global_step": 189142, "epoch": 1563} {"train_loss": -39.667510986328125, "global_step": 189143, "epoch": 1563} {"train_loss": -40.89323043823242, "global_step": 189144, "epoch": 1563} {"train_loss": -39.595394134521484, "global_step": 189145, "epoch": 1563} {"train_loss": -41.13227081298828, "global_step": 189146, "epoch": 1563} {"train_loss": -39.87563705444336, "global_step": 189147, "epoch": 1563} {"train_loss": -41.36981964111328, "global_step": 189148, "epoch": 1563} {"train_loss": -40.14606857299805, "global_step": 189149, "epoch": 1563} {"train_loss": -41.06721115112305, "global_step": 189150, "epoch": 1563} {"train_loss": -40.27656936645508, "global_step": 189151, "epoch": 1563} {"train_loss": -41.3107795715332, "global_step": 189152, "epoch": 1563} {"train_loss": -40.78274154663086, "global_step": 189153, "epoch": 1563} {"train_loss": -41.10939407348633, "global_step": 189154, "epoch": 1563} {"train_loss": -40.85612106323242, "global_step": 189155, "epoch": 1563} {"train_loss": -41.132362365722656, "global_step": 189156, "epoch": 1563} {"train_loss": -41.09041213989258, "global_step": 189157, "epoch": 1563} {"train_loss": -40.093727111816406, "global_step": 189158, "epoch": 1563} {"train_loss": -41.322959899902344, "global_step": 189159, "epoch": 1563} {"train_loss": -40.75716018676758, "global_step": 189160, "epoch": 1563} {"train_loss": -41.367061614990234, "global_step": 189161, "epoch": 1563} {"train_loss": -41.20248031616211, "global_step": 189162, "epoch": 1563} {"train_loss": -40.99912643432617, "global_step": 189163, "epoch": 1563} {"train_loss": -41.24736022949219, "global_step": 189164, "epoch": 1563} {"train_loss": -41.03029251098633, "global_step": 189165, "epoch": 1563} {"train_loss": -40.69007110595703, "global_step": 189166, "epoch": 1563} {"train_loss": -40.328243255615234, "global_step": 189167, "epoch": 1563} {"train_loss": -40.07558822631836, "global_step": 189168, "epoch": 1563} {"train_loss": -39.69816207885742, "global_step": 189169, "epoch": 1563} {"train_loss": -39.77520751953125, "global_step": 189170, "epoch": 1563} {"train_loss": -39.91228485107422, "global_step": 189171, "epoch": 1563} {"train_loss": -40.66617965698242, "global_step": 189172, "epoch": 1563} {"train_loss": -41.58283615112305, "global_step": 189173, "epoch": 1563} {"train_loss": -40.81640625, "global_step": 189174, "epoch": 1563} {"train_loss": -40.570369720458984, "global_step": 189175, "epoch": 1563} {"train_loss": -40.009883880615234, "global_step": 189176, "epoch": 1563} {"train_loss": -39.08077621459961, "global_step": 189177, "epoch": 1563} {"train_loss": -39.507808685302734, "global_step": 189178, "epoch": 1563} {"train_loss": -39.737770080566406, "global_step": 189179, "epoch": 1563} {"train_loss": -40.38532257080078, "global_step": 189180, "epoch": 1563} {"train_loss": -41.287906646728516, "global_step": 189181, "epoch": 1563} {"train_loss": -41.071388244628906, "global_step": 189182, "epoch": 1563} {"train_loss": -41.59344482421875, "global_step": 189183, "epoch": 1563} {"train_loss": -41.28523635864258, "global_step": 189184, "epoch": 1563} {"train_loss": -41.63444900512695, "global_step": 189185, "epoch": 1563} {"train_loss": -41.2838134765625, "global_step": 189186, "epoch": 1563} {"train_loss": -40.624183654785156, "global_step": 189187, "epoch": 1563} {"train_loss": -40.713069915771484, "global_step": 189188, "epoch": 1563} {"train_loss": -41.60136795043945, "global_step": 189189, "epoch": 1563} {"train_loss": -40.95100784301758, "global_step": 189190, "epoch": 1563} {"train_loss": -41.83753967285156, "global_step": 189191, "epoch": 1563} {"train_loss": -40.66937255859375, "global_step": 189192, "epoch": 1563} {"train_loss": -40.376564025878906, "global_step": 189193, "epoch": 1563} {"train_loss": -41.227291107177734, "global_step": 189194, "epoch": 1563} {"train_loss": -41.28255844116211, "global_step": 189195, "epoch": 1563} {"train_loss": -38.44976806640625, "global_step": 189196, "epoch": 1563} {"train_loss": -38.31734848022461, "global_step": 189197, "epoch": 1563} {"train_loss": -41.35477828979492, "global_step": 189198, "epoch": 1563} {"train_loss": -40.89641571044922, "global_step": 189199, "epoch": 1563} {"train_loss": -40.65301513671875, "global_step": 189200, "epoch": 1563} {"train_loss": -41.10540008544922, "global_step": 189201, "epoch": 1563} {"train_loss": -41.72390365600586, "global_step": 189202, "epoch": 1563} {"train_loss": -41.612911224365234, "global_step": 189203, "epoch": 1563} {"train_loss": -41.42959213256836, "global_step": 189204, "epoch": 1563} {"train_loss": -42.03196716308594, "global_step": 189205, "epoch": 1563} {"train_loss": -41.105472564697266, "global_step": 189206, "epoch": 1563} {"train_loss": -41.28474044799805, "global_step": 189207, "epoch": 1563} {"train_loss": -41.243377685546875, "global_step": 189208, "epoch": 1563} {"train_loss": -41.63751220703125, "global_step": 189209, "epoch": 1563} {"train_loss": -41.7450065612793, "global_step": 189210, "epoch": 1563} {"train_loss": -41.5534553527832, "global_step": 189211, "epoch": 1563} {"train_loss": -41.73637771606445, "global_step": 189212, "epoch": 1563} {"train_loss": -41.50423049926758, "global_step": 189213, "epoch": 1563} {"train_loss": -41.91849899291992, "global_step": 189214, "epoch": 1563} {"train_loss": -41.4234504699707, "global_step": 189215, "epoch": 1563} {"train_loss": -41.137142181396484, "global_step": 189216, "epoch": 1563} {"train_loss": -41.789608001708984, "global_step": 189217, "epoch": 1563} {"train_loss": -40.93695068359375, "global_step": 189218, "epoch": 1563} {"train_loss": -41.50677490234375, "global_step": 189219, "epoch": 1563} {"train_loss": -41.98665237426758, "global_step": 189220, "epoch": 1563} {"train_loss": -41.304561614990234, "global_step": 189221, "epoch": 1563} {"train_loss": -41.693382263183594, "global_step": 189222, "epoch": 1563} {"train_loss": -41.45136260986328, "global_step": 189223, "epoch": 1563} {"train_loss": -40.43230056762695, "global_step": 189224, "epoch": 1563} {"train_loss": -41.84943389892578, "global_step": 189225, "epoch": 1563} {"train_loss": -42.13755416870117, "global_step": 189226, "epoch": 1563} {"train_loss": -41.79487609863281, "global_step": 189227, "epoch": 1563} {"train_loss": -40.040435791015625, "global_step": 189228, "epoch": 1563} {"train_loss": -41.46810531616211, "global_step": 189229, "epoch": 1563} {"train_loss": -41.49256134033203, "global_step": 189230, "epoch": 1563} {"train_loss": -41.73920822143555, "global_step": 189231, "epoch": 1563} {"train_loss": -40.991729736328125, "global_step": 189232, "epoch": 1563} {"train_loss": -41.981441497802734, "global_step": 189233, "epoch": 1563} {"train_loss": -42.13174057006836, "global_step": 189234, "epoch": 1563} {"train_loss": -41.52094650268555, "global_step": 189235, "epoch": 1563} {"train_loss": -41.755977630615234, "global_step": 189236, "epoch": 1563} {"train_loss": -39.07351303100586, "global_step": 189237, "epoch": 1563} {"train_loss": -41.51144790649414, "global_step": 189238, "epoch": 1563} {"train_loss": -31.932653427124023, "global_step": 189239, "epoch": 1563} {"train_loss": -41.11104965209961, "global_step": 189240, "epoch": 1563} {"train_loss": -40.52922439575195, "global_step": 189241, "epoch": 1563} {"train_loss": -41.05366134643555, "global_step": 189242, "epoch": 1563} {"train_loss": -40.662705744593595, "global_step": 189243, "epoch": 1563, "val_loss": 2578321.75} {"train_loss": -36.2904167175293, "global_step": 189244, "epoch": 1564} {"train_loss": -40.336299896240234, "global_step": 189245, "epoch": 1564} {"train_loss": -38.8213005065918, "global_step": 189246, "epoch": 1564} {"train_loss": -35.1862678527832, "global_step": 189247, "epoch": 1564} {"train_loss": -40.78601837158203, "global_step": 189248, "epoch": 1564} {"train_loss": -39.320045471191406, "global_step": 189249, "epoch": 1564} {"train_loss": -38.340728759765625, "global_step": 189250, "epoch": 1564} {"train_loss": -39.173091888427734, "global_step": 189251, "epoch": 1564} {"train_loss": -40.888099670410156, "global_step": 189252, "epoch": 1564} {"train_loss": -40.33525466918945, "global_step": 189253, "epoch": 1564} {"train_loss": -39.7420768737793, "global_step": 189254, "epoch": 1564} {"train_loss": -40.6596565246582, "global_step": 189255, "epoch": 1564} {"train_loss": -40.39793014526367, "global_step": 189256, "epoch": 1564} {"train_loss": -40.60215377807617, "global_step": 189257, "epoch": 1564} {"train_loss": -39.58307647705078, "global_step": 189258, "epoch": 1564} {"train_loss": -38.7703971862793, "global_step": 189259, "epoch": 1564} {"train_loss": -38.72126388549805, "global_step": 189260, "epoch": 1564} {"train_loss": -40.53178405761719, "global_step": 189261, "epoch": 1564} {"train_loss": -40.77741622924805, "global_step": 189262, "epoch": 1564} {"train_loss": -39.799922943115234, "global_step": 189263, "epoch": 1564} {"train_loss": -39.34432601928711, "global_step": 189264, "epoch": 1564} {"train_loss": -41.1928596496582, "global_step": 189265, "epoch": 1564} {"train_loss": -41.16154098510742, "global_step": 189266, "epoch": 1564} {"train_loss": -41.02012252807617, "global_step": 189267, "epoch": 1564} {"train_loss": -41.6460075378418, "global_step": 189268, "epoch": 1564} {"train_loss": -40.0211296081543, "global_step": 189269, "epoch": 1564} {"train_loss": -40.345916748046875, "global_step": 189270, "epoch": 1564} {"train_loss": -40.1089973449707, "global_step": 189271, "epoch": 1564} {"train_loss": -37.92721176147461, "global_step": 189272, "epoch": 1564} {"train_loss": -40.68520736694336, "global_step": 189273, "epoch": 1564} {"train_loss": -40.81056594848633, "global_step": 189274, "epoch": 1564} {"train_loss": -40.9271240234375, "global_step": 189275, "epoch": 1564} {"train_loss": -40.660152435302734, "global_step": 189276, "epoch": 1564} {"train_loss": -41.60956573486328, "global_step": 189277, "epoch": 1564} {"train_loss": -41.265193939208984, "global_step": 189278, "epoch": 1564} {"train_loss": -41.45680618286133, "global_step": 189279, "epoch": 1564} {"train_loss": -40.681514739990234, "global_step": 189280, "epoch": 1564} {"train_loss": -41.79537582397461, "global_step": 189281, "epoch": 1564} {"train_loss": -41.128170013427734, "global_step": 189282, "epoch": 1564} {"train_loss": -41.4473991394043, "global_step": 189283, "epoch": 1564} {"train_loss": -41.27439498901367, "global_step": 189284, "epoch": 1564} {"train_loss": -41.58513259887695, "global_step": 189285, "epoch": 1564} {"train_loss": -41.6765022277832, "global_step": 189286, "epoch": 1564} {"train_loss": -41.3985595703125, "global_step": 189287, "epoch": 1564} {"train_loss": -41.45064926147461, "global_step": 189288, "epoch": 1564} {"train_loss": -41.17192840576172, "global_step": 189289, "epoch": 1564} {"train_loss": -40.68714904785156, "global_step": 189290, "epoch": 1564} {"train_loss": -40.74699783325195, "global_step": 189291, "epoch": 1564} {"train_loss": -40.96687316894531, "global_step": 189292, "epoch": 1564} {"train_loss": -40.97755813598633, "global_step": 189293, "epoch": 1564} {"train_loss": -40.795406341552734, "global_step": 189294, "epoch": 1564} {"train_loss": -41.16015625, "global_step": 189295, "epoch": 1564} {"train_loss": -41.499019622802734, "global_step": 189296, "epoch": 1564} {"train_loss": -40.27522277832031, "global_step": 189297, "epoch": 1564} {"train_loss": -39.921539306640625, "global_step": 189298, "epoch": 1564} {"train_loss": -40.927791595458984, "global_step": 189299, "epoch": 1564} {"train_loss": -40.634273529052734, "global_step": 189300, "epoch": 1564} {"train_loss": -41.53683090209961, "global_step": 189301, "epoch": 1564} {"train_loss": -41.44594955444336, "global_step": 189302, "epoch": 1564} {"train_loss": -40.497711181640625, "global_step": 189303, "epoch": 1564} {"train_loss": -40.78974533081055, "global_step": 189304, "epoch": 1564} {"train_loss": -41.524940490722656, "global_step": 189305, "epoch": 1564} {"train_loss": -40.98936080932617, "global_step": 189306, "epoch": 1564} {"train_loss": -39.73979568481445, "global_step": 189307, "epoch": 1564} {"train_loss": -41.57100296020508, "global_step": 189308, "epoch": 1564} {"train_loss": -41.62933349609375, "global_step": 189309, "epoch": 1564} {"train_loss": -41.116058349609375, "global_step": 189310, "epoch": 1564} {"train_loss": -41.36164093017578, "global_step": 189311, "epoch": 1564} {"train_loss": -41.4265251159668, "global_step": 189312, "epoch": 1564} {"train_loss": -41.671932220458984, "global_step": 189313, "epoch": 1564} {"train_loss": -41.847755432128906, "global_step": 189314, "epoch": 1564} {"train_loss": -41.69739532470703, "global_step": 189315, "epoch": 1564} {"train_loss": -41.663814544677734, "global_step": 189316, "epoch": 1564} {"train_loss": -41.74650192260742, "global_step": 189317, "epoch": 1564} {"train_loss": -41.28828811645508, "global_step": 189318, "epoch": 1564} {"train_loss": -41.58978271484375, "global_step": 189319, "epoch": 1564} {"train_loss": -42.25419998168945, "global_step": 189320, "epoch": 1564} {"train_loss": -41.813350677490234, "global_step": 189321, "epoch": 1564} {"train_loss": -40.40055465698242, "global_step": 189322, "epoch": 1564} {"train_loss": -40.97495651245117, "global_step": 189323, "epoch": 1564} {"train_loss": -41.71419906616211, "global_step": 189324, "epoch": 1564} {"train_loss": -41.2099723815918, "global_step": 189325, "epoch": 1564} {"train_loss": -41.13508224487305, "global_step": 189326, "epoch": 1564} {"train_loss": -41.93378829956055, "global_step": 189327, "epoch": 1564} {"train_loss": -41.480079650878906, "global_step": 189328, "epoch": 1564} {"train_loss": -41.74872970581055, "global_step": 189329, "epoch": 1564} {"train_loss": -41.89799118041992, "global_step": 189330, "epoch": 1564} {"train_loss": -41.73206329345703, "global_step": 189331, "epoch": 1564} {"train_loss": -42.21112060546875, "global_step": 189332, "epoch": 1564} {"train_loss": -42.29127502441406, "global_step": 189333, "epoch": 1564} {"train_loss": -41.94822692871094, "global_step": 189334, "epoch": 1564} {"train_loss": -41.5291748046875, "global_step": 189335, "epoch": 1564} {"train_loss": -41.59926986694336, "global_step": 189336, "epoch": 1564} {"train_loss": -40.97519302368164, "global_step": 189337, "epoch": 1564} {"train_loss": -41.90000534057617, "global_step": 189338, "epoch": 1564} {"train_loss": -41.84811782836914, "global_step": 189339, "epoch": 1564} {"train_loss": -41.389732360839844, "global_step": 189340, "epoch": 1564} {"train_loss": -42.611480712890625, "global_step": 189341, "epoch": 1564} {"train_loss": -42.13077926635742, "global_step": 189342, "epoch": 1564} {"train_loss": -42.15139389038086, "global_step": 189343, "epoch": 1564} {"train_loss": -42.17659378051758, "global_step": 189344, "epoch": 1564} {"train_loss": -41.986839294433594, "global_step": 189345, "epoch": 1564} {"train_loss": -42.175201416015625, "global_step": 189346, "epoch": 1564} {"train_loss": -42.15480041503906, "global_step": 189347, "epoch": 1564} {"train_loss": -42.32078170776367, "global_step": 189348, "epoch": 1564} {"train_loss": -42.500518798828125, "global_step": 189349, "epoch": 1564} {"train_loss": -41.412715911865234, "global_step": 189350, "epoch": 1564} {"train_loss": -41.91756820678711, "global_step": 189351, "epoch": 1564} {"train_loss": -41.25637435913086, "global_step": 189352, "epoch": 1564} {"train_loss": -40.87667465209961, "global_step": 189353, "epoch": 1564} {"train_loss": -38.057838439941406, "global_step": 189354, "epoch": 1564} {"train_loss": -34.23696517944336, "global_step": 189355, "epoch": 1564} {"train_loss": -31.771692276000977, "global_step": 189356, "epoch": 1564} {"train_loss": -26.79962730407715, "global_step": 189357, "epoch": 1564} {"train_loss": -24.349393844604492, "global_step": 189358, "epoch": 1564} {"train_loss": -23.78511619567871, "global_step": 189359, "epoch": 1564} {"train_loss": -34.438472747802734, "global_step": 189360, "epoch": 1564} {"train_loss": -37.12331771850586, "global_step": 189361, "epoch": 1564} {"train_loss": -31.975202560424805, "global_step": 189362, "epoch": 1564} {"train_loss": -37.60365676879883, "global_step": 189363, "epoch": 1564} {"train_loss": -40.161022864097404, "global_step": 189364, "epoch": 1564, "val_loss": 2446131.25} {"train_loss": -35.68195343017578, "global_step": 189365, "epoch": 1565} {"train_loss": -35.83143997192383, "global_step": 189366, "epoch": 1565} {"train_loss": -36.670467376708984, "global_step": 189367, "epoch": 1565} {"train_loss": -37.11631393432617, "global_step": 189368, "epoch": 1565} {"train_loss": -37.460636138916016, "global_step": 189369, "epoch": 1565} {"train_loss": -37.025550842285156, "global_step": 189370, "epoch": 1565} {"train_loss": -35.587284088134766, "global_step": 189371, "epoch": 1565} {"train_loss": -39.29820251464844, "global_step": 189372, "epoch": 1565} {"train_loss": -37.92695236206055, "global_step": 189373, "epoch": 1565} {"train_loss": -39.200016021728516, "global_step": 189374, "epoch": 1565} {"train_loss": -38.49616622924805, "global_step": 189375, "epoch": 1565} {"train_loss": -39.73142623901367, "global_step": 189376, "epoch": 1565} {"train_loss": -39.83449172973633, "global_step": 189377, "epoch": 1565} {"train_loss": -39.926815032958984, "global_step": 189378, "epoch": 1565} {"train_loss": -40.22599411010742, "global_step": 189379, "epoch": 1565} {"train_loss": -40.519065856933594, "global_step": 189380, "epoch": 1565} {"train_loss": -40.623687744140625, "global_step": 189381, "epoch": 1565} {"train_loss": -40.947628021240234, "global_step": 189382, "epoch": 1565} {"train_loss": -40.61296463012695, "global_step": 189383, "epoch": 1565} {"train_loss": -40.93355941772461, "global_step": 189384, "epoch": 1565} {"train_loss": -40.31631088256836, "global_step": 189385, "epoch": 1565} {"train_loss": -40.3951301574707, "global_step": 189386, "epoch": 1565} {"train_loss": -41.13240432739258, "global_step": 189387, "epoch": 1565} {"train_loss": -40.90129852294922, "global_step": 189388, "epoch": 1565} {"train_loss": -41.24727249145508, "global_step": 189389, "epoch": 1565} {"train_loss": -41.10490417480469, "global_step": 189390, "epoch": 1565} {"train_loss": -40.548423767089844, "global_step": 189391, "epoch": 1565} {"train_loss": -41.06341552734375, "global_step": 189392, "epoch": 1565} {"train_loss": -40.91199493408203, "global_step": 189393, "epoch": 1565} {"train_loss": -40.972347259521484, "global_step": 189394, "epoch": 1565} {"train_loss": -41.467315673828125, "global_step": 189395, "epoch": 1565} {"train_loss": -41.001922607421875, "global_step": 189396, "epoch": 1565} {"train_loss": -41.50572204589844, "global_step": 189397, "epoch": 1565} {"train_loss": -41.08161544799805, "global_step": 189398, "epoch": 1565} {"train_loss": -41.123348236083984, "global_step": 189399, "epoch": 1565} {"train_loss": -41.204952239990234, "global_step": 189400, "epoch": 1565} {"train_loss": -41.126033782958984, "global_step": 189401, "epoch": 1565} {"train_loss": -41.25482177734375, "global_step": 189402, "epoch": 1565} {"train_loss": -41.37010955810547, "global_step": 189403, "epoch": 1565} {"train_loss": -40.953914642333984, "global_step": 189404, "epoch": 1565} {"train_loss": -41.62892150878906, "global_step": 189405, "epoch": 1565} {"train_loss": -41.16817092895508, "global_step": 189406, "epoch": 1565} {"train_loss": -41.69907760620117, "global_step": 189407, "epoch": 1565} {"train_loss": -41.14247512817383, "global_step": 189408, "epoch": 1565} {"train_loss": -41.59626007080078, "global_step": 189409, "epoch": 1565} {"train_loss": -42.02817916870117, "global_step": 189410, "epoch": 1565} {"train_loss": -41.65335464477539, "global_step": 189411, "epoch": 1565} {"train_loss": -41.739166259765625, "global_step": 189412, "epoch": 1565} {"train_loss": -41.775264739990234, "global_step": 189413, "epoch": 1565} {"train_loss": -41.88752365112305, "global_step": 189414, "epoch": 1565} {"train_loss": -42.3048210144043, "global_step": 189415, "epoch": 1565} {"train_loss": -42.018707275390625, "global_step": 189416, "epoch": 1565} {"train_loss": -41.99343490600586, "global_step": 189417, "epoch": 1565} {"train_loss": -42.02000045776367, "global_step": 189418, "epoch": 1565} {"train_loss": -41.932613372802734, "global_step": 189419, "epoch": 1565} {"train_loss": -42.345027923583984, "global_step": 189420, "epoch": 1565} {"train_loss": -41.78867721557617, "global_step": 189421, "epoch": 1565} {"train_loss": -41.869232177734375, "global_step": 189422, "epoch": 1565} {"train_loss": -42.44414520263672, "global_step": 189423, "epoch": 1565} {"train_loss": -42.174190521240234, "global_step": 189424, "epoch": 1565} {"train_loss": -42.26527786254883, "global_step": 189425, "epoch": 1565} {"train_loss": -41.925025939941406, "global_step": 189426, "epoch": 1565} {"train_loss": -41.98939895629883, "global_step": 189427, "epoch": 1565} {"train_loss": -41.94470977783203, "global_step": 189428, "epoch": 1565} {"train_loss": -42.11625289916992, "global_step": 189429, "epoch": 1565} {"train_loss": -42.58362579345703, "global_step": 189430, "epoch": 1565} {"train_loss": -42.31111526489258, "global_step": 189431, "epoch": 1565} {"train_loss": -42.14214324951172, "global_step": 189432, "epoch": 1565} {"train_loss": -42.14493942260742, "global_step": 189433, "epoch": 1565} {"train_loss": -42.13957214355469, "global_step": 189434, "epoch": 1565} {"train_loss": -42.439208984375, "global_step": 189435, "epoch": 1565} {"train_loss": -42.63130569458008, "global_step": 189436, "epoch": 1565} {"train_loss": -42.36766052246094, "global_step": 189437, "epoch": 1565} {"train_loss": -42.04562759399414, "global_step": 189438, "epoch": 1565} {"train_loss": -42.55712890625, "global_step": 189439, "epoch": 1565} {"train_loss": -42.21287155151367, "global_step": 189440, "epoch": 1565} {"train_loss": -42.25994873046875, "global_step": 189441, "epoch": 1565} {"train_loss": -42.2704963684082, "global_step": 189442, "epoch": 1565} {"train_loss": -42.612483978271484, "global_step": 189443, "epoch": 1565} {"train_loss": -42.33736038208008, "global_step": 189444, "epoch": 1565} {"train_loss": -42.72005844116211, "global_step": 189445, "epoch": 1565} {"train_loss": -42.52478790283203, "global_step": 189446, "epoch": 1565} {"train_loss": -42.94792938232422, "global_step": 189447, "epoch": 1565} {"train_loss": -42.7509880065918, "global_step": 189448, "epoch": 1565} {"train_loss": -42.95482635498047, "global_step": 189449, "epoch": 1565} {"train_loss": -42.737030029296875, "global_step": 189450, "epoch": 1565} {"train_loss": -42.77340316772461, "global_step": 189451, "epoch": 1565} {"train_loss": -42.76264572143555, "global_step": 189452, "epoch": 1565} {"train_loss": -42.664058685302734, "global_step": 189453, "epoch": 1565} {"train_loss": -42.404598236083984, "global_step": 189454, "epoch": 1565} {"train_loss": -42.342281341552734, "global_step": 189455, "epoch": 1565} {"train_loss": -42.2784309387207, "global_step": 189456, "epoch": 1565} {"train_loss": -41.819339752197266, "global_step": 189457, "epoch": 1565} {"train_loss": -41.993892669677734, "global_step": 189458, "epoch": 1565} {"train_loss": -42.28358840942383, "global_step": 189459, "epoch": 1565} {"train_loss": -41.461883544921875, "global_step": 189460, "epoch": 1565} {"train_loss": -41.85880661010742, "global_step": 189461, "epoch": 1565} {"train_loss": -42.54642868041992, "global_step": 189462, "epoch": 1565} {"train_loss": -42.82516098022461, "global_step": 189463, "epoch": 1565} {"train_loss": -42.721248626708984, "global_step": 189464, "epoch": 1565} {"train_loss": -42.4873161315918, "global_step": 189465, "epoch": 1565} {"train_loss": -41.96151351928711, "global_step": 189466, "epoch": 1565} {"train_loss": -41.179996490478516, "global_step": 189467, "epoch": 1565} {"train_loss": -42.040138244628906, "global_step": 189468, "epoch": 1565} {"train_loss": -42.91305160522461, "global_step": 189469, "epoch": 1565} {"train_loss": -42.08011245727539, "global_step": 189470, "epoch": 1565} {"train_loss": -42.36285400390625, "global_step": 189471, "epoch": 1565} {"train_loss": -42.317626953125, "global_step": 189472, "epoch": 1565} {"train_loss": -43.0160026550293, "global_step": 189473, "epoch": 1565} {"train_loss": -42.719268798828125, "global_step": 189474, "epoch": 1565} {"train_loss": -42.444427490234375, "global_step": 189475, "epoch": 1565} {"train_loss": -42.39874267578125, "global_step": 189476, "epoch": 1565} {"train_loss": -42.833370208740234, "global_step": 189477, "epoch": 1565} {"train_loss": -42.303802490234375, "global_step": 189478, "epoch": 1565} {"train_loss": -40.669918060302734, "global_step": 189479, "epoch": 1565} {"train_loss": -40.003292083740234, "global_step": 189480, "epoch": 1565} {"train_loss": -40.15633773803711, "global_step": 189481, "epoch": 1565} {"train_loss": -41.539302825927734, "global_step": 189482, "epoch": 1565} {"train_loss": -41.89248275756836, "global_step": 189483, "epoch": 1565} {"train_loss": -39.13042449951172, "global_step": 189484, "epoch": 1565} {"train_loss": -41.34639036950986, "global_step": 189485, "epoch": 1565, "val_loss": 2417802.5} {"train_loss": -39.953006744384766, "global_step": 189486, "epoch": 1566} {"train_loss": -39.89162826538086, "global_step": 189487, "epoch": 1566} {"train_loss": -41.27097702026367, "global_step": 189488, "epoch": 1566} {"train_loss": -41.19223403930664, "global_step": 189489, "epoch": 1566} {"train_loss": -40.42759704589844, "global_step": 189490, "epoch": 1566} {"train_loss": -41.573516845703125, "global_step": 189491, "epoch": 1566} {"train_loss": -41.26565933227539, "global_step": 189492, "epoch": 1566} {"train_loss": -40.522457122802734, "global_step": 189493, "epoch": 1566} {"train_loss": -40.33850860595703, "global_step": 189494, "epoch": 1566} {"train_loss": -41.330772399902344, "global_step": 189495, "epoch": 1566} {"train_loss": -40.4766960144043, "global_step": 189496, "epoch": 1566} {"train_loss": -40.070167541503906, "global_step": 189497, "epoch": 1566} {"train_loss": -41.030357360839844, "global_step": 189498, "epoch": 1566} {"train_loss": -39.12009048461914, "global_step": 189499, "epoch": 1566} {"train_loss": -41.741573333740234, "global_step": 189500, "epoch": 1566} {"train_loss": -41.4538688659668, "global_step": 189501, "epoch": 1566} {"train_loss": -40.71613693237305, "global_step": 189502, "epoch": 1566} {"train_loss": -40.599037170410156, "global_step": 189503, "epoch": 1566} {"train_loss": -40.48308181762695, "global_step": 189504, "epoch": 1566} {"train_loss": -41.64082336425781, "global_step": 189505, "epoch": 1566} {"train_loss": -40.155635833740234, "global_step": 189506, "epoch": 1566} {"train_loss": -41.915077209472656, "global_step": 189507, "epoch": 1566} {"train_loss": -41.19792556762695, "global_step": 189508, "epoch": 1566} {"train_loss": -41.68659210205078, "global_step": 189509, "epoch": 1566} {"train_loss": -40.77043533325195, "global_step": 189510, "epoch": 1566} {"train_loss": -40.40121078491211, "global_step": 189511, "epoch": 1566} {"train_loss": -40.104774475097656, "global_step": 189512, "epoch": 1566} {"train_loss": -40.66877365112305, "global_step": 189513, "epoch": 1566} {"train_loss": -41.40450668334961, "global_step": 189514, "epoch": 1566} {"train_loss": -40.408416748046875, "global_step": 189515, "epoch": 1566} {"train_loss": -41.43531036376953, "global_step": 189516, "epoch": 1566} {"train_loss": -40.41728210449219, "global_step": 189517, "epoch": 1566} {"train_loss": -40.842124938964844, "global_step": 189518, "epoch": 1566} {"train_loss": -39.71944046020508, "global_step": 189519, "epoch": 1566} {"train_loss": -41.40095138549805, "global_step": 189520, "epoch": 1566} {"train_loss": -40.90884017944336, "global_step": 189521, "epoch": 1566} {"train_loss": -40.805419921875, "global_step": 189522, "epoch": 1566} {"train_loss": -41.11293411254883, "global_step": 189523, "epoch": 1566} {"train_loss": -41.619384765625, "global_step": 189524, "epoch": 1566} {"train_loss": -41.32356643676758, "global_step": 189525, "epoch": 1566} {"train_loss": -41.39724349975586, "global_step": 189526, "epoch": 1566} {"train_loss": -41.283023834228516, "global_step": 189527, "epoch": 1566} {"train_loss": -41.87518310546875, "global_step": 189528, "epoch": 1566} {"train_loss": -40.9693489074707, "global_step": 189529, "epoch": 1566} {"train_loss": -41.651405334472656, "global_step": 189530, "epoch": 1566} {"train_loss": -40.8176155090332, "global_step": 189531, "epoch": 1566} {"train_loss": -41.002159118652344, "global_step": 189532, "epoch": 1566} {"train_loss": -40.7226448059082, "global_step": 189533, "epoch": 1566} {"train_loss": -40.19436264038086, "global_step": 189534, "epoch": 1566} {"train_loss": -40.79292678833008, "global_step": 189535, "epoch": 1566} {"train_loss": -40.406063079833984, "global_step": 189536, "epoch": 1566} {"train_loss": -41.68378829956055, "global_step": 189537, "epoch": 1566} {"train_loss": -42.07646942138672, "global_step": 189538, "epoch": 1566} {"train_loss": -40.84177780151367, "global_step": 189539, "epoch": 1566} {"train_loss": -41.032928466796875, "global_step": 189540, "epoch": 1566} {"train_loss": -41.23427963256836, "global_step": 189541, "epoch": 1566} {"train_loss": -41.150630950927734, "global_step": 189542, "epoch": 1566} {"train_loss": -41.407039642333984, "global_step": 189543, "epoch": 1566} {"train_loss": -40.98765563964844, "global_step": 189544, "epoch": 1566} {"train_loss": -40.218379974365234, "global_step": 189545, "epoch": 1566} {"train_loss": -40.9426383972168, "global_step": 189546, "epoch": 1566} {"train_loss": -42.238773345947266, "global_step": 189547, "epoch": 1566} {"train_loss": -41.986610412597656, "global_step": 189548, "epoch": 1566} {"train_loss": -41.87450408935547, "global_step": 189549, "epoch": 1566} {"train_loss": -42.12498092651367, "global_step": 189550, "epoch": 1566} {"train_loss": -42.46564865112305, "global_step": 189551, "epoch": 1566} {"train_loss": -40.74823760986328, "global_step": 189552, "epoch": 1566} {"train_loss": -41.34889602661133, "global_step": 189553, "epoch": 1566} {"train_loss": -41.68777084350586, "global_step": 189554, "epoch": 1566} {"train_loss": -41.796852111816406, "global_step": 189555, "epoch": 1566} {"train_loss": -41.36373519897461, "global_step": 189556, "epoch": 1566} {"train_loss": -40.989418029785156, "global_step": 189557, "epoch": 1566} {"train_loss": -42.72001266479492, "global_step": 189558, "epoch": 1566} {"train_loss": -41.19904708862305, "global_step": 189559, "epoch": 1566} {"train_loss": -42.06026840209961, "global_step": 189560, "epoch": 1566} {"train_loss": -41.74470138549805, "global_step": 189561, "epoch": 1566} {"train_loss": -41.0286750793457, "global_step": 189562, "epoch": 1566} {"train_loss": -40.764766693115234, "global_step": 189563, "epoch": 1566} {"train_loss": -39.17002487182617, "global_step": 189564, "epoch": 1566} {"train_loss": -39.59589767456055, "global_step": 189565, "epoch": 1566} {"train_loss": -40.283897399902344, "global_step": 189566, "epoch": 1566} {"train_loss": -40.678321838378906, "global_step": 189567, "epoch": 1566} {"train_loss": -40.28043746948242, "global_step": 189568, "epoch": 1566} {"train_loss": -41.2130012512207, "global_step": 189569, "epoch": 1566} {"train_loss": -40.2095832824707, "global_step": 189570, "epoch": 1566} {"train_loss": -41.46314239501953, "global_step": 189571, "epoch": 1566} {"train_loss": -41.259029388427734, "global_step": 189572, "epoch": 1566} {"train_loss": -41.72062683105469, "global_step": 189573, "epoch": 1566} {"train_loss": -40.84384536743164, "global_step": 189574, "epoch": 1566} {"train_loss": -40.44974899291992, "global_step": 189575, "epoch": 1566} {"train_loss": -41.29270553588867, "global_step": 189576, "epoch": 1566} {"train_loss": -39.62409973144531, "global_step": 189577, "epoch": 1566} {"train_loss": -37.20304489135742, "global_step": 189578, "epoch": 1566} {"train_loss": -40.682777404785156, "global_step": 189579, "epoch": 1566} {"train_loss": -37.20766830444336, "global_step": 189580, "epoch": 1566} {"train_loss": -36.54351806640625, "global_step": 189581, "epoch": 1566} {"train_loss": -41.70550537109375, "global_step": 189582, "epoch": 1566} {"train_loss": -38.52436828613281, "global_step": 189583, "epoch": 1566} {"train_loss": -36.3375358581543, "global_step": 189584, "epoch": 1566} {"train_loss": -42.055965423583984, "global_step": 189585, "epoch": 1566} {"train_loss": -35.74686050415039, "global_step": 189586, "epoch": 1566} {"train_loss": -38.74996566772461, "global_step": 189587, "epoch": 1566} {"train_loss": -39.72992706298828, "global_step": 189588, "epoch": 1566} {"train_loss": -36.39529037475586, "global_step": 189589, "epoch": 1566} {"train_loss": -41.6092643737793, "global_step": 189590, "epoch": 1566} {"train_loss": -36.88210678100586, "global_step": 189591, "epoch": 1566} {"train_loss": -41.49433517456055, "global_step": 189592, "epoch": 1566} {"train_loss": -38.5941276550293, "global_step": 189593, "epoch": 1566} {"train_loss": -40.6998291015625, "global_step": 189594, "epoch": 1566} {"train_loss": -38.829830169677734, "global_step": 189595, "epoch": 1566} {"train_loss": -40.25974655151367, "global_step": 189596, "epoch": 1566} {"train_loss": -40.96133041381836, "global_step": 189597, "epoch": 1566} {"train_loss": -41.00918960571289, "global_step": 189598, "epoch": 1566} {"train_loss": -40.78798294067383, "global_step": 189599, "epoch": 1566} {"train_loss": -41.53669357299805, "global_step": 189600, "epoch": 1566} {"train_loss": -40.73862838745117, "global_step": 189601, "epoch": 1566} {"train_loss": -40.84491729736328, "global_step": 189602, "epoch": 1566} {"train_loss": -41.194091796875, "global_step": 189603, "epoch": 1566} {"train_loss": -42.015228271484375, "global_step": 189604, "epoch": 1566} {"train_loss": -40.64425277709961, "global_step": 189605, "epoch": 1566} {"train_loss": -40.684614607125276, "global_step": 189606, "epoch": 1566, "val_loss": 2483968.75} {"train_loss": -41.84321594238281, "global_step": 189607, "epoch": 1567} {"train_loss": -41.400997161865234, "global_step": 189608, "epoch": 1567} {"train_loss": -41.86147689819336, "global_step": 189609, "epoch": 1567} {"train_loss": -41.3170280456543, "global_step": 189610, "epoch": 1567} {"train_loss": -41.45357894897461, "global_step": 189611, "epoch": 1567} {"train_loss": -41.001014709472656, "global_step": 189612, "epoch": 1567} {"train_loss": -41.747947692871094, "global_step": 189613, "epoch": 1567} {"train_loss": -41.744991302490234, "global_step": 189614, "epoch": 1567} {"train_loss": -41.72858810424805, "global_step": 189615, "epoch": 1567} {"train_loss": -41.94245529174805, "global_step": 189616, "epoch": 1567} {"train_loss": -41.4600944519043, "global_step": 189617, "epoch": 1567} {"train_loss": -41.6080322265625, "global_step": 189618, "epoch": 1567} {"train_loss": -42.36770248413086, "global_step": 189619, "epoch": 1567} {"train_loss": -41.672054290771484, "global_step": 189620, "epoch": 1567} {"train_loss": -41.61812973022461, "global_step": 189621, "epoch": 1567} {"train_loss": -41.88765335083008, "global_step": 189622, "epoch": 1567} {"train_loss": -41.966304779052734, "global_step": 189623, "epoch": 1567} {"train_loss": -41.98073196411133, "global_step": 189624, "epoch": 1567} {"train_loss": -42.298282623291016, "global_step": 189625, "epoch": 1567} {"train_loss": -41.943939208984375, "global_step": 189626, "epoch": 1567} {"train_loss": -42.32206344604492, "global_step": 189627, "epoch": 1567} {"train_loss": -41.7187614440918, "global_step": 189628, "epoch": 1567} {"train_loss": -42.20473861694336, "global_step": 189629, "epoch": 1567} {"train_loss": -42.5737190246582, "global_step": 189630, "epoch": 1567} {"train_loss": -41.69013214111328, "global_step": 189631, "epoch": 1567} {"train_loss": -41.79866027832031, "global_step": 189632, "epoch": 1567} {"train_loss": -41.35869598388672, "global_step": 189633, "epoch": 1567} {"train_loss": -41.976776123046875, "global_step": 189634, "epoch": 1567} {"train_loss": -41.39232635498047, "global_step": 189635, "epoch": 1567} {"train_loss": -40.71041488647461, "global_step": 189636, "epoch": 1567} {"train_loss": -41.683555603027344, "global_step": 189637, "epoch": 1567} {"train_loss": -41.021461486816406, "global_step": 189638, "epoch": 1567} {"train_loss": -41.47077178955078, "global_step": 189639, "epoch": 1567} {"train_loss": -41.029457092285156, "global_step": 189640, "epoch": 1567} {"train_loss": -41.796993255615234, "global_step": 189641, "epoch": 1567} {"train_loss": -41.58087158203125, "global_step": 189642, "epoch": 1567} {"train_loss": -41.142364501953125, "global_step": 189643, "epoch": 1567} {"train_loss": -42.01033401489258, "global_step": 189644, "epoch": 1567} {"train_loss": -41.58999252319336, "global_step": 189645, "epoch": 1567} {"train_loss": -41.40736770629883, "global_step": 189646, "epoch": 1567} {"train_loss": -41.89795684814453, "global_step": 189647, "epoch": 1567} {"train_loss": -41.873619079589844, "global_step": 189648, "epoch": 1567} {"train_loss": -40.371646881103516, "global_step": 189649, "epoch": 1567} {"train_loss": -41.283138275146484, "global_step": 189650, "epoch": 1567} {"train_loss": -41.727718353271484, "global_step": 189651, "epoch": 1567} {"train_loss": -39.69219970703125, "global_step": 189652, "epoch": 1567} {"train_loss": -41.5647087097168, "global_step": 189653, "epoch": 1567} {"train_loss": -41.76975631713867, "global_step": 189654, "epoch": 1567} {"train_loss": -40.7567138671875, "global_step": 189655, "epoch": 1567} {"train_loss": -41.18507385253906, "global_step": 189656, "epoch": 1567} {"train_loss": -41.465667724609375, "global_step": 189657, "epoch": 1567} {"train_loss": -40.070533752441406, "global_step": 189658, "epoch": 1567} {"train_loss": -41.79720687866211, "global_step": 189659, "epoch": 1567} {"train_loss": -39.13869857788086, "global_step": 189660, "epoch": 1567} {"train_loss": -40.47435760498047, "global_step": 189661, "epoch": 1567} {"train_loss": -40.1876220703125, "global_step": 189662, "epoch": 1567} {"train_loss": -37.859100341796875, "global_step": 189663, "epoch": 1567} {"train_loss": -40.74951171875, "global_step": 189664, "epoch": 1567} {"train_loss": -39.44590377807617, "global_step": 189665, "epoch": 1567} {"train_loss": -38.8571662902832, "global_step": 189666, "epoch": 1567} {"train_loss": -41.689491271972656, "global_step": 189667, "epoch": 1567} {"train_loss": -39.6781005859375, "global_step": 189668, "epoch": 1567} {"train_loss": -41.35319137573242, "global_step": 189669, "epoch": 1567} {"train_loss": -39.69742965698242, "global_step": 189670, "epoch": 1567} {"train_loss": -39.77928924560547, "global_step": 189671, "epoch": 1567} {"train_loss": -40.704803466796875, "global_step": 189672, "epoch": 1567} {"train_loss": -40.82253646850586, "global_step": 189673, "epoch": 1567} {"train_loss": -41.31532669067383, "global_step": 189674, "epoch": 1567} {"train_loss": -40.84817123413086, "global_step": 189675, "epoch": 1567} {"train_loss": -40.50642013549805, "global_step": 189676, "epoch": 1567} {"train_loss": -40.88237762451172, "global_step": 189677, "epoch": 1567} {"train_loss": -40.60426712036133, "global_step": 189678, "epoch": 1567} {"train_loss": -40.409332275390625, "global_step": 189679, "epoch": 1567} {"train_loss": -40.94486618041992, "global_step": 189680, "epoch": 1567} {"train_loss": -40.5483512878418, "global_step": 189681, "epoch": 1567} {"train_loss": -41.58071517944336, "global_step": 189682, "epoch": 1567} {"train_loss": -39.2132568359375, "global_step": 189683, "epoch": 1567} {"train_loss": -36.909095764160156, "global_step": 189684, "epoch": 1567} {"train_loss": -34.53374481201172, "global_step": 189685, "epoch": 1567} {"train_loss": -37.49110794067383, "global_step": 189686, "epoch": 1567} {"train_loss": -41.418067932128906, "global_step": 189687, "epoch": 1567} {"train_loss": -36.227210998535156, "global_step": 189688, "epoch": 1567} {"train_loss": -35.950897216796875, "global_step": 189689, "epoch": 1567} {"train_loss": -39.456871032714844, "global_step": 189690, "epoch": 1567} {"train_loss": -40.68154525756836, "global_step": 189691, "epoch": 1567} {"train_loss": -38.51371383666992, "global_step": 189692, "epoch": 1567} {"train_loss": -41.219058990478516, "global_step": 189693, "epoch": 1567} {"train_loss": -40.61408615112305, "global_step": 189694, "epoch": 1567} {"train_loss": -40.623470306396484, "global_step": 189695, "epoch": 1567} {"train_loss": -40.922218322753906, "global_step": 189696, "epoch": 1567} {"train_loss": -40.01006317138672, "global_step": 189697, "epoch": 1567} {"train_loss": -37.89977264404297, "global_step": 189698, "epoch": 1567} {"train_loss": -39.33597946166992, "global_step": 189699, "epoch": 1567} {"train_loss": -40.91679763793945, "global_step": 189700, "epoch": 1567} {"train_loss": -40.12150955200195, "global_step": 189701, "epoch": 1567} {"train_loss": -41.68876266479492, "global_step": 189702, "epoch": 1567} {"train_loss": -41.29423904418945, "global_step": 189703, "epoch": 1567} {"train_loss": -41.78062057495117, "global_step": 189704, "epoch": 1567} {"train_loss": -41.306392669677734, "global_step": 189705, "epoch": 1567} {"train_loss": -41.60956954956055, "global_step": 189706, "epoch": 1567} {"train_loss": -41.12007141113281, "global_step": 189707, "epoch": 1567} {"train_loss": -41.75851821899414, "global_step": 189708, "epoch": 1567} {"train_loss": -40.53853988647461, "global_step": 189709, "epoch": 1567} {"train_loss": -41.81338119506836, "global_step": 189710, "epoch": 1567} {"train_loss": -41.491668701171875, "global_step": 189711, "epoch": 1567} {"train_loss": -41.70475387573242, "global_step": 189712, "epoch": 1567} {"train_loss": -41.99637985229492, "global_step": 189713, "epoch": 1567} {"train_loss": -40.68515396118164, "global_step": 189714, "epoch": 1567} {"train_loss": -42.14252471923828, "global_step": 189715, "epoch": 1567} {"train_loss": -41.52732849121094, "global_step": 189716, "epoch": 1567} {"train_loss": -41.97574996948242, "global_step": 189717, "epoch": 1567} {"train_loss": -42.13881301879883, "global_step": 189718, "epoch": 1567} {"train_loss": -42.19610595703125, "global_step": 189719, "epoch": 1567} {"train_loss": -42.445125579833984, "global_step": 189720, "epoch": 1567} {"train_loss": -41.96580505371094, "global_step": 189721, "epoch": 1567} {"train_loss": -42.05665969848633, "global_step": 189722, "epoch": 1567} {"train_loss": -42.39142990112305, "global_step": 189723, "epoch": 1567} {"train_loss": -42.50938034057617, "global_step": 189724, "epoch": 1567} {"train_loss": -42.34212112426758, "global_step": 189725, "epoch": 1567} {"train_loss": -42.3038215637207, "global_step": 189726, "epoch": 1567} {"train_loss": -40.979269926213036, "global_step": 189727, "epoch": 1567, "val_loss": 2386724.0} {"train_loss": -42.79660415649414, "global_step": 189728, "epoch": 1568} {"train_loss": -42.58708190917969, "global_step": 189729, "epoch": 1568} {"train_loss": -42.586456298828125, "global_step": 189730, "epoch": 1568} {"train_loss": -42.6020393371582, "global_step": 189731, "epoch": 1568} {"train_loss": -42.5819091796875, "global_step": 189732, "epoch": 1568} {"train_loss": -41.88080596923828, "global_step": 189733, "epoch": 1568} {"train_loss": -42.23577880859375, "global_step": 189734, "epoch": 1568} {"train_loss": -42.09516525268555, "global_step": 189735, "epoch": 1568} {"train_loss": -42.709007263183594, "global_step": 189736, "epoch": 1568} {"train_loss": -42.5949821472168, "global_step": 189737, "epoch": 1568} {"train_loss": -42.766319274902344, "global_step": 189738, "epoch": 1568} {"train_loss": -42.02628707885742, "global_step": 189739, "epoch": 1568} {"train_loss": -42.27766036987305, "global_step": 189740, "epoch": 1568} {"train_loss": -41.35954284667969, "global_step": 189741, "epoch": 1568} {"train_loss": -42.7849235534668, "global_step": 189742, "epoch": 1568} {"train_loss": -42.32976150512695, "global_step": 189743, "epoch": 1568} {"train_loss": -42.27797317504883, "global_step": 189744, "epoch": 1568} {"train_loss": -40.19249725341797, "global_step": 189745, "epoch": 1568} {"train_loss": -41.51042938232422, "global_step": 189746, "epoch": 1568} {"train_loss": -41.906490325927734, "global_step": 189747, "epoch": 1568} {"train_loss": -42.00254440307617, "global_step": 189748, "epoch": 1568} {"train_loss": -40.847652435302734, "global_step": 189749, "epoch": 1568} {"train_loss": -40.314998626708984, "global_step": 189750, "epoch": 1568} {"train_loss": -40.7409782409668, "global_step": 189751, "epoch": 1568} {"train_loss": -40.18134689331055, "global_step": 189752, "epoch": 1568} {"train_loss": -40.99613952636719, "global_step": 189753, "epoch": 1568} {"train_loss": -41.67945098876953, "global_step": 189754, "epoch": 1568} {"train_loss": -41.18461990356445, "global_step": 189755, "epoch": 1568} {"train_loss": -40.669673919677734, "global_step": 189756, "epoch": 1568} {"train_loss": -40.61799240112305, "global_step": 189757, "epoch": 1568} {"train_loss": -40.85295486450195, "global_step": 189758, "epoch": 1568} {"train_loss": -40.988624572753906, "global_step": 189759, "epoch": 1568} {"train_loss": -40.96815872192383, "global_step": 189760, "epoch": 1568} {"train_loss": -41.19756317138672, "global_step": 189761, "epoch": 1568} {"train_loss": -40.564632415771484, "global_step": 189762, "epoch": 1568} {"train_loss": -41.51055908203125, "global_step": 189763, "epoch": 1568} {"train_loss": -41.45711898803711, "global_step": 189764, "epoch": 1568} {"train_loss": -41.78169631958008, "global_step": 189765, "epoch": 1568} {"train_loss": -41.84819793701172, "global_step": 189766, "epoch": 1568} {"train_loss": -42.257347106933594, "global_step": 189767, "epoch": 1568} {"train_loss": -42.25252914428711, "global_step": 189768, "epoch": 1568} {"train_loss": -41.873050689697266, "global_step": 189769, "epoch": 1568} {"train_loss": -42.479007720947266, "global_step": 189770, "epoch": 1568} {"train_loss": -42.21724319458008, "global_step": 189771, "epoch": 1568} {"train_loss": -41.953460693359375, "global_step": 189772, "epoch": 1568} {"train_loss": -42.163475036621094, "global_step": 189773, "epoch": 1568} {"train_loss": -42.57467269897461, "global_step": 189774, "epoch": 1568} {"train_loss": -42.16989517211914, "global_step": 189775, "epoch": 1568} {"train_loss": -41.52940368652344, "global_step": 189776, "epoch": 1568} {"train_loss": -41.99237060546875, "global_step": 189777, "epoch": 1568} {"train_loss": -42.57441329956055, "global_step": 189778, "epoch": 1568} {"train_loss": -41.57969284057617, "global_step": 189779, "epoch": 1568} {"train_loss": -41.05817794799805, "global_step": 189780, "epoch": 1568} {"train_loss": -42.19065856933594, "global_step": 189781, "epoch": 1568} {"train_loss": -41.0471305847168, "global_step": 189782, "epoch": 1568} {"train_loss": -41.38157653808594, "global_step": 189783, "epoch": 1568} {"train_loss": -42.257904052734375, "global_step": 189784, "epoch": 1568} {"train_loss": -41.81953048706055, "global_step": 189785, "epoch": 1568} {"train_loss": -41.38753128051758, "global_step": 189786, "epoch": 1568} {"train_loss": -42.52961349487305, "global_step": 189787, "epoch": 1568} {"train_loss": -41.792327880859375, "global_step": 189788, "epoch": 1568} {"train_loss": -38.168243408203125, "global_step": 189789, "epoch": 1568} {"train_loss": -40.32596969604492, "global_step": 189790, "epoch": 1568} {"train_loss": -39.112422943115234, "global_step": 189791, "epoch": 1568} {"train_loss": -41.680259704589844, "global_step": 189792, "epoch": 1568} {"train_loss": -38.272056579589844, "global_step": 189793, "epoch": 1568} {"train_loss": -39.2449836730957, "global_step": 189794, "epoch": 1568} {"train_loss": -35.657161712646484, "global_step": 189795, "epoch": 1568} {"train_loss": -37.95371627807617, "global_step": 189796, "epoch": 1568} {"train_loss": -40.8297004699707, "global_step": 189797, "epoch": 1568} {"train_loss": -39.90248489379883, "global_step": 189798, "epoch": 1568} {"train_loss": -34.598995208740234, "global_step": 189799, "epoch": 1568} {"train_loss": -31.55487632751465, "global_step": 189800, "epoch": 1568} {"train_loss": -39.74705123901367, "global_step": 189801, "epoch": 1568} {"train_loss": -39.18574905395508, "global_step": 189802, "epoch": 1568} {"train_loss": -39.69269561767578, "global_step": 189803, "epoch": 1568} {"train_loss": -37.791839599609375, "global_step": 189804, "epoch": 1568} {"train_loss": -37.14994430541992, "global_step": 189805, "epoch": 1568} {"train_loss": -38.5570182800293, "global_step": 189806, "epoch": 1568} {"train_loss": -40.56744384765625, "global_step": 189807, "epoch": 1568} {"train_loss": -38.71505355834961, "global_step": 189808, "epoch": 1568} {"train_loss": -39.82452392578125, "global_step": 189809, "epoch": 1568} {"train_loss": -40.968658447265625, "global_step": 189810, "epoch": 1568} {"train_loss": -37.098873138427734, "global_step": 189811, "epoch": 1568} {"train_loss": -38.10010528564453, "global_step": 189812, "epoch": 1568} {"train_loss": -39.301048278808594, "global_step": 189813, "epoch": 1568} {"train_loss": -39.15129089355469, "global_step": 189814, "epoch": 1568} {"train_loss": -40.37690353393555, "global_step": 189815, "epoch": 1568} {"train_loss": -38.06435775756836, "global_step": 189816, "epoch": 1568} {"train_loss": -39.660701751708984, "global_step": 189817, "epoch": 1568} {"train_loss": -38.67525863647461, "global_step": 189818, "epoch": 1568} {"train_loss": -36.886043548583984, "global_step": 189819, "epoch": 1568} {"train_loss": -41.054595947265625, "global_step": 189820, "epoch": 1568} {"train_loss": -39.6099739074707, "global_step": 189821, "epoch": 1568} {"train_loss": -37.590362548828125, "global_step": 189822, "epoch": 1568} {"train_loss": -39.87599563598633, "global_step": 189823, "epoch": 1568} {"train_loss": -38.850852966308594, "global_step": 189824, "epoch": 1568} {"train_loss": -38.83134078979492, "global_step": 189825, "epoch": 1568} {"train_loss": -40.194427490234375, "global_step": 189826, "epoch": 1568} {"train_loss": -38.470245361328125, "global_step": 189827, "epoch": 1568} {"train_loss": -38.37693405151367, "global_step": 189828, "epoch": 1568} {"train_loss": -40.147518157958984, "global_step": 189829, "epoch": 1568} {"train_loss": -40.04648208618164, "global_step": 189830, "epoch": 1568} {"train_loss": -39.52262496948242, "global_step": 189831, "epoch": 1568} {"train_loss": -39.90693664550781, "global_step": 189832, "epoch": 1568} {"train_loss": -37.97645950317383, "global_step": 189833, "epoch": 1568} {"train_loss": -39.39488220214844, "global_step": 189834, "epoch": 1568} {"train_loss": -39.89934158325195, "global_step": 189835, "epoch": 1568} {"train_loss": -40.14019775390625, "global_step": 189836, "epoch": 1568} {"train_loss": -40.285560607910156, "global_step": 189837, "epoch": 1568} {"train_loss": -39.430049896240234, "global_step": 189838, "epoch": 1568} {"train_loss": -40.81391525268555, "global_step": 189839, "epoch": 1568} {"train_loss": -41.254608154296875, "global_step": 189840, "epoch": 1568} {"train_loss": -40.77535629272461, "global_step": 189841, "epoch": 1568} {"train_loss": -40.123313903808594, "global_step": 189842, "epoch": 1568} {"train_loss": -41.530757904052734, "global_step": 189843, "epoch": 1568} {"train_loss": -40.82123565673828, "global_step": 189844, "epoch": 1568} {"train_loss": -40.895015716552734, "global_step": 189845, "epoch": 1568} {"train_loss": -41.46895980834961, "global_step": 189846, "epoch": 1568} {"train_loss": -40.98869705200195, "global_step": 189847, "epoch": 1568} {"train_loss": -40.5280687158758, "global_step": 189848, "epoch": 1568, "val_loss": 2473349.0} {"train_loss": -40.74299240112305, "global_step": 189849, "epoch": 1569} {"train_loss": -40.730506896972656, "global_step": 189850, "epoch": 1569} {"train_loss": -41.72895431518555, "global_step": 189851, "epoch": 1569} {"train_loss": -40.712013244628906, "global_step": 189852, "epoch": 1569} {"train_loss": -42.026100158691406, "global_step": 189853, "epoch": 1569} {"train_loss": -41.517879486083984, "global_step": 189854, "epoch": 1569} {"train_loss": -41.31033706665039, "global_step": 189855, "epoch": 1569} {"train_loss": -41.400997161865234, "global_step": 189856, "epoch": 1569} {"train_loss": -41.99940872192383, "global_step": 189857, "epoch": 1569} {"train_loss": -41.99217224121094, "global_step": 189858, "epoch": 1569} {"train_loss": -41.8939208984375, "global_step": 189859, "epoch": 1569} {"train_loss": -42.1172981262207, "global_step": 189860, "epoch": 1569} {"train_loss": -41.865413665771484, "global_step": 189861, "epoch": 1569} {"train_loss": -41.8204345703125, "global_step": 189862, "epoch": 1569} {"train_loss": -41.983463287353516, "global_step": 189863, "epoch": 1569} {"train_loss": -41.8264045715332, "global_step": 189864, "epoch": 1569} {"train_loss": -41.943965911865234, "global_step": 189865, "epoch": 1569} {"train_loss": -42.0289421081543, "global_step": 189866, "epoch": 1569} {"train_loss": -41.748779296875, "global_step": 189867, "epoch": 1569} {"train_loss": -42.477073669433594, "global_step": 189868, "epoch": 1569} {"train_loss": -41.74808883666992, "global_step": 189869, "epoch": 1569} {"train_loss": -41.72389602661133, "global_step": 189870, "epoch": 1569} {"train_loss": -42.21580123901367, "global_step": 189871, "epoch": 1569} {"train_loss": -41.97929763793945, "global_step": 189872, "epoch": 1569} {"train_loss": -42.23902130126953, "global_step": 189873, "epoch": 1569} {"train_loss": -42.385498046875, "global_step": 189874, "epoch": 1569} {"train_loss": -42.39678192138672, "global_step": 189875, "epoch": 1569} {"train_loss": -42.328887939453125, "global_step": 189876, "epoch": 1569} {"train_loss": -41.55481719970703, "global_step": 189877, "epoch": 1569} {"train_loss": -42.50236129760742, "global_step": 189878, "epoch": 1569} {"train_loss": -42.48458480834961, "global_step": 189879, "epoch": 1569} {"train_loss": -42.46987533569336, "global_step": 189880, "epoch": 1569} {"train_loss": -42.41786575317383, "global_step": 189881, "epoch": 1569} {"train_loss": -42.11800765991211, "global_step": 189882, "epoch": 1569} {"train_loss": -42.34696578979492, "global_step": 189883, "epoch": 1569} {"train_loss": -42.285919189453125, "global_step": 189884, "epoch": 1569} {"train_loss": -42.515342712402344, "global_step": 189885, "epoch": 1569} {"train_loss": -41.92096710205078, "global_step": 189886, "epoch": 1569} {"train_loss": -42.466793060302734, "global_step": 189887, "epoch": 1569} {"train_loss": -42.45233154296875, "global_step": 189888, "epoch": 1569} {"train_loss": -42.83761215209961, "global_step": 189889, "epoch": 1569} {"train_loss": -42.5717887878418, "global_step": 189890, "epoch": 1569} {"train_loss": -42.321197509765625, "global_step": 189891, "epoch": 1569} {"train_loss": -42.2419548034668, "global_step": 189892, "epoch": 1569} {"train_loss": -42.150814056396484, "global_step": 189893, "epoch": 1569} {"train_loss": -42.33475875854492, "global_step": 189894, "epoch": 1569} {"train_loss": -41.50689697265625, "global_step": 189895, "epoch": 1569} {"train_loss": -40.133384704589844, "global_step": 189896, "epoch": 1569} {"train_loss": -42.17417526245117, "global_step": 189897, "epoch": 1569} {"train_loss": -40.937232971191406, "global_step": 189898, "epoch": 1569} {"train_loss": -41.74298858642578, "global_step": 189899, "epoch": 1569} {"train_loss": -41.0989875793457, "global_step": 189900, "epoch": 1569} {"train_loss": -40.932098388671875, "global_step": 189901, "epoch": 1569} {"train_loss": -40.92151641845703, "global_step": 189902, "epoch": 1569} {"train_loss": -40.052284240722656, "global_step": 189903, "epoch": 1569} {"train_loss": -41.60020065307617, "global_step": 189904, "epoch": 1569} {"train_loss": -39.71645736694336, "global_step": 189905, "epoch": 1569} {"train_loss": -37.92940139770508, "global_step": 189906, "epoch": 1569} {"train_loss": -39.257625579833984, "global_step": 189907, "epoch": 1569} {"train_loss": -39.377830505371094, "global_step": 189908, "epoch": 1569} {"train_loss": -41.054298400878906, "global_step": 189909, "epoch": 1569} {"train_loss": -40.337928771972656, "global_step": 189910, "epoch": 1569} {"train_loss": -41.087799072265625, "global_step": 189911, "epoch": 1569} {"train_loss": -39.80607223510742, "global_step": 189912, "epoch": 1569} {"train_loss": -40.24381637573242, "global_step": 189913, "epoch": 1569} {"train_loss": -40.73661422729492, "global_step": 189914, "epoch": 1569} {"train_loss": -40.82411575317383, "global_step": 189915, "epoch": 1569} {"train_loss": -41.28745651245117, "global_step": 189916, "epoch": 1569} {"train_loss": -41.44111251831055, "global_step": 189917, "epoch": 1569} {"train_loss": -40.71942901611328, "global_step": 189918, "epoch": 1569} {"train_loss": -40.08698654174805, "global_step": 189919, "epoch": 1569} {"train_loss": -41.081459045410156, "global_step": 189920, "epoch": 1569} {"train_loss": -40.57707595825195, "global_step": 189921, "epoch": 1569} {"train_loss": -41.87000274658203, "global_step": 189922, "epoch": 1569} {"train_loss": -41.375709533691406, "global_step": 189923, "epoch": 1569} {"train_loss": -40.68577194213867, "global_step": 189924, "epoch": 1569} {"train_loss": -40.9300537109375, "global_step": 189925, "epoch": 1569} {"train_loss": -41.76375961303711, "global_step": 189926, "epoch": 1569} {"train_loss": -41.834957122802734, "global_step": 189927, "epoch": 1569} {"train_loss": -40.77192306518555, "global_step": 189928, "epoch": 1569} {"train_loss": -41.770015716552734, "global_step": 189929, "epoch": 1569} {"train_loss": -41.6284294128418, "global_step": 189930, "epoch": 1569} {"train_loss": -40.92879867553711, "global_step": 189931, "epoch": 1569} {"train_loss": -41.11613082885742, "global_step": 189932, "epoch": 1569} {"train_loss": -41.636810302734375, "global_step": 189933, "epoch": 1569} {"train_loss": -41.841888427734375, "global_step": 189934, "epoch": 1569} {"train_loss": -41.70009994506836, "global_step": 189935, "epoch": 1569} {"train_loss": -42.35042190551758, "global_step": 189936, "epoch": 1569} {"train_loss": -41.76648712158203, "global_step": 189937, "epoch": 1569} {"train_loss": -42.16110610961914, "global_step": 189938, "epoch": 1569} {"train_loss": -42.61808395385742, "global_step": 189939, "epoch": 1569} {"train_loss": -41.862667083740234, "global_step": 189940, "epoch": 1569} {"train_loss": -41.531654357910156, "global_step": 189941, "epoch": 1569} {"train_loss": -42.26687240600586, "global_step": 189942, "epoch": 1569} {"train_loss": -42.12632369995117, "global_step": 189943, "epoch": 1569} {"train_loss": -41.8450927734375, "global_step": 189944, "epoch": 1569} {"train_loss": -41.8276481628418, "global_step": 189945, "epoch": 1569} {"train_loss": -41.41264343261719, "global_step": 189946, "epoch": 1569} {"train_loss": -41.644779205322266, "global_step": 189947, "epoch": 1569} {"train_loss": -41.78486251831055, "global_step": 189948, "epoch": 1569} {"train_loss": -42.09157180786133, "global_step": 189949, "epoch": 1569} {"train_loss": -42.36511993408203, "global_step": 189950, "epoch": 1569} {"train_loss": -41.50946807861328, "global_step": 189951, "epoch": 1569} {"train_loss": -40.79293441772461, "global_step": 189952, "epoch": 1569} {"train_loss": -40.53423309326172, "global_step": 189953, "epoch": 1569} {"train_loss": -41.35725021362305, "global_step": 189954, "epoch": 1569} {"train_loss": -41.09072494506836, "global_step": 189955, "epoch": 1569} {"train_loss": -39.783363342285156, "global_step": 189956, "epoch": 1569} {"train_loss": -39.559104919433594, "global_step": 189957, "epoch": 1569} {"train_loss": -41.202327728271484, "global_step": 189958, "epoch": 1569} {"train_loss": -41.25849533081055, "global_step": 189959, "epoch": 1569} {"train_loss": -41.409278869628906, "global_step": 189960, "epoch": 1569} {"train_loss": -42.05759811401367, "global_step": 189961, "epoch": 1569} {"train_loss": -41.430538177490234, "global_step": 189962, "epoch": 1569} {"train_loss": -40.82918167114258, "global_step": 189963, "epoch": 1569} {"train_loss": -40.96611785888672, "global_step": 189964, "epoch": 1569} {"train_loss": -41.16938018798828, "global_step": 189965, "epoch": 1569} {"train_loss": -41.627132415771484, "global_step": 189966, "epoch": 1569} {"train_loss": -40.95170593261719, "global_step": 189967, "epoch": 1569} {"train_loss": -41.33498764038086, "global_step": 189968, "epoch": 1569} {"train_loss": -41.48165672869722, "global_step": 189969, "epoch": 1569, "val_loss": 2418895.75} {"train_loss": -40.84324264526367, "global_step": 189970, "epoch": 1570} {"train_loss": -39.91522979736328, "global_step": 189971, "epoch": 1570} {"train_loss": -41.648658752441406, "global_step": 189972, "epoch": 1570} {"train_loss": -40.86174392700195, "global_step": 189973, "epoch": 1570} {"train_loss": -40.347469329833984, "global_step": 189974, "epoch": 1570} {"train_loss": -41.9106559753418, "global_step": 189975, "epoch": 1570} {"train_loss": -41.418006896972656, "global_step": 189976, "epoch": 1570} {"train_loss": -40.535335540771484, "global_step": 189977, "epoch": 1570} {"train_loss": -41.33209228515625, "global_step": 189978, "epoch": 1570} {"train_loss": -41.64936447143555, "global_step": 189979, "epoch": 1570} {"train_loss": -41.3469352722168, "global_step": 189980, "epoch": 1570} {"train_loss": -39.56414794921875, "global_step": 189981, "epoch": 1570} {"train_loss": -41.48988723754883, "global_step": 189982, "epoch": 1570} {"train_loss": -39.37656784057617, "global_step": 189983, "epoch": 1570} {"train_loss": -40.29817199707031, "global_step": 189984, "epoch": 1570} {"train_loss": -41.439937591552734, "global_step": 189985, "epoch": 1570} {"train_loss": -40.627864837646484, "global_step": 189986, "epoch": 1570} {"train_loss": -41.36013412475586, "global_step": 189987, "epoch": 1570} {"train_loss": -40.74774932861328, "global_step": 189988, "epoch": 1570} {"train_loss": -41.58613204956055, "global_step": 189989, "epoch": 1570} {"train_loss": -42.120609283447266, "global_step": 189990, "epoch": 1570} {"train_loss": -41.06511306762695, "global_step": 189991, "epoch": 1570} {"train_loss": -41.194698333740234, "global_step": 189992, "epoch": 1570} {"train_loss": -41.575599670410156, "global_step": 189993, "epoch": 1570} {"train_loss": -40.35396194458008, "global_step": 189994, "epoch": 1570} {"train_loss": -42.079933166503906, "global_step": 189995, "epoch": 1570} {"train_loss": -41.41831588745117, "global_step": 189996, "epoch": 1570} {"train_loss": -41.73371505737305, "global_step": 189997, "epoch": 1570} {"train_loss": -41.7271842956543, "global_step": 189998, "epoch": 1570} {"train_loss": -41.00315856933594, "global_step": 189999, "epoch": 1570} {"train_loss": -41.99225997924805, "global_step": 190000, "epoch": 1570} {"train_loss": -42.064754486083984, "global_step": 190001, "epoch": 1570} {"train_loss": -41.61190414428711, "global_step": 190002, "epoch": 1570} {"train_loss": -41.20570373535156, "global_step": 190003, "epoch": 1570} {"train_loss": -42.04695129394531, "global_step": 190004, "epoch": 1570} {"train_loss": -41.0697135925293, "global_step": 190005, "epoch": 1570} {"train_loss": -40.426544189453125, "global_step": 190006, "epoch": 1570} {"train_loss": -42.593017578125, "global_step": 190007, "epoch": 1570} {"train_loss": -40.92753982543945, "global_step": 190008, "epoch": 1570} {"train_loss": -41.54294967651367, "global_step": 190009, "epoch": 1570} {"train_loss": -41.6120491027832, "global_step": 190010, "epoch": 1570} {"train_loss": -41.785152435302734, "global_step": 190011, "epoch": 1570} {"train_loss": -41.9242057800293, "global_step": 190012, "epoch": 1570} {"train_loss": -42.52968978881836, "global_step": 190013, "epoch": 1570} {"train_loss": -41.52266311645508, "global_step": 190014, "epoch": 1570} {"train_loss": -41.948299407958984, "global_step": 190015, "epoch": 1570} {"train_loss": -41.87872314453125, "global_step": 190016, "epoch": 1570} {"train_loss": -42.31770706176758, "global_step": 190017, "epoch": 1570} {"train_loss": -41.48591995239258, "global_step": 190018, "epoch": 1570} {"train_loss": -42.146644592285156, "global_step": 190019, "epoch": 1570} {"train_loss": -42.04890060424805, "global_step": 190020, "epoch": 1570} {"train_loss": -41.19700241088867, "global_step": 190021, "epoch": 1570} {"train_loss": -42.28532028198242, "global_step": 190022, "epoch": 1570} {"train_loss": -41.974151611328125, "global_step": 190023, "epoch": 1570} {"train_loss": -41.3818244934082, "global_step": 190024, "epoch": 1570} {"train_loss": -42.044273376464844, "global_step": 190025, "epoch": 1570} {"train_loss": -41.599735260009766, "global_step": 190026, "epoch": 1570} {"train_loss": -39.808284759521484, "global_step": 190027, "epoch": 1570} {"train_loss": -41.16548538208008, "global_step": 190028, "epoch": 1570} {"train_loss": -41.92595291137695, "global_step": 190029, "epoch": 1570} {"train_loss": -41.55826950073242, "global_step": 190030, "epoch": 1570} {"train_loss": -41.54281997680664, "global_step": 190031, "epoch": 1570} {"train_loss": -41.65536117553711, "global_step": 190032, "epoch": 1570} {"train_loss": -41.756736755371094, "global_step": 190033, "epoch": 1570} {"train_loss": -41.87916564941406, "global_step": 190034, "epoch": 1570} {"train_loss": -42.3828125, "global_step": 190035, "epoch": 1570} {"train_loss": -40.620723724365234, "global_step": 190036, "epoch": 1570} {"train_loss": -40.84455108642578, "global_step": 190037, "epoch": 1570} {"train_loss": -40.022945404052734, "global_step": 190038, "epoch": 1570} {"train_loss": -41.02201461791992, "global_step": 190039, "epoch": 1570} {"train_loss": -42.094051361083984, "global_step": 190040, "epoch": 1570} {"train_loss": -41.71194076538086, "global_step": 190041, "epoch": 1570} {"train_loss": -39.62118148803711, "global_step": 190042, "epoch": 1570} {"train_loss": -41.77985382080078, "global_step": 190043, "epoch": 1570} {"train_loss": -41.384857177734375, "global_step": 190044, "epoch": 1570} {"train_loss": -39.938446044921875, "global_step": 190045, "epoch": 1570} {"train_loss": -40.814876556396484, "global_step": 190046, "epoch": 1570} {"train_loss": -41.729915618896484, "global_step": 190047, "epoch": 1570} {"train_loss": -41.875972747802734, "global_step": 190048, "epoch": 1570} {"train_loss": -41.0573844909668, "global_step": 190049, "epoch": 1570} {"train_loss": -40.05831527709961, "global_step": 190050, "epoch": 1570} {"train_loss": -41.33565902709961, "global_step": 190051, "epoch": 1570} {"train_loss": -41.853729248046875, "global_step": 190052, "epoch": 1570} {"train_loss": -40.890445709228516, "global_step": 190053, "epoch": 1570} {"train_loss": -40.20661544799805, "global_step": 190054, "epoch": 1570} {"train_loss": -42.37286376953125, "global_step": 190055, "epoch": 1570} {"train_loss": -41.558807373046875, "global_step": 190056, "epoch": 1570} {"train_loss": -41.6995964050293, "global_step": 190057, "epoch": 1570} {"train_loss": -42.531185150146484, "global_step": 190058, "epoch": 1570} {"train_loss": -41.79743576049805, "global_step": 190059, "epoch": 1570} {"train_loss": -41.62721633911133, "global_step": 190060, "epoch": 1570} {"train_loss": -41.857666015625, "global_step": 190061, "epoch": 1570} {"train_loss": -41.83805465698242, "global_step": 190062, "epoch": 1570} {"train_loss": -42.41624069213867, "global_step": 190063, "epoch": 1570} {"train_loss": -42.29905319213867, "global_step": 190064, "epoch": 1570} {"train_loss": -42.33114242553711, "global_step": 190065, "epoch": 1570} {"train_loss": -42.40812301635742, "global_step": 190066, "epoch": 1570} {"train_loss": -42.24112319946289, "global_step": 190067, "epoch": 1570} {"train_loss": -42.42891311645508, "global_step": 190068, "epoch": 1570} {"train_loss": -42.675994873046875, "global_step": 190069, "epoch": 1570} {"train_loss": -42.04677200317383, "global_step": 190070, "epoch": 1570} {"train_loss": -41.926944732666016, "global_step": 190071, "epoch": 1570} {"train_loss": -42.460418701171875, "global_step": 190072, "epoch": 1570} {"train_loss": -42.1642951965332, "global_step": 190073, "epoch": 1570} {"train_loss": -42.853084564208984, "global_step": 190074, "epoch": 1570} {"train_loss": -41.788021087646484, "global_step": 190075, "epoch": 1570} {"train_loss": -42.27740478515625, "global_step": 190076, "epoch": 1570} {"train_loss": -42.532386779785156, "global_step": 190077, "epoch": 1570} {"train_loss": -42.06214141845703, "global_step": 190078, "epoch": 1570} {"train_loss": -42.55088424682617, "global_step": 190079, "epoch": 1570} {"train_loss": -42.73160934448242, "global_step": 190080, "epoch": 1570} {"train_loss": -42.28807830810547, "global_step": 190081, "epoch": 1570} {"train_loss": -42.4245719909668, "global_step": 190082, "epoch": 1570} {"train_loss": -42.693233489990234, "global_step": 190083, "epoch": 1570} {"train_loss": -42.440399169921875, "global_step": 190084, "epoch": 1570} {"train_loss": -42.278175354003906, "global_step": 190085, "epoch": 1570} {"train_loss": -42.31905746459961, "global_step": 190086, "epoch": 1570} {"train_loss": -42.459815979003906, "global_step": 190087, "epoch": 1570} {"train_loss": -41.61690139770508, "global_step": 190088, "epoch": 1570} {"train_loss": -40.956748962402344, "global_step": 190089, "epoch": 1570} {"train_loss": -41.58069065188573, "global_step": 190090, "epoch": 1570, "val_loss": 2475018.75} {"train_loss": -42.57670211791992, "global_step": 190091, "epoch": 1571} {"train_loss": -42.06124496459961, "global_step": 190092, "epoch": 1571} {"train_loss": -42.932491302490234, "global_step": 190093, "epoch": 1571} {"train_loss": -41.88991928100586, "global_step": 190094, "epoch": 1571} {"train_loss": -41.8572998046875, "global_step": 190095, "epoch": 1571} {"train_loss": -41.267391204833984, "global_step": 190096, "epoch": 1571} {"train_loss": -42.01624298095703, "global_step": 190097, "epoch": 1571} {"train_loss": -40.33816146850586, "global_step": 190098, "epoch": 1571} {"train_loss": -37.809791564941406, "global_step": 190099, "epoch": 1571} {"train_loss": -38.6297492980957, "global_step": 190100, "epoch": 1571} {"train_loss": -41.9262580871582, "global_step": 190101, "epoch": 1571} {"train_loss": -41.32329177856445, "global_step": 190102, "epoch": 1571} {"train_loss": -40.448421478271484, "global_step": 190103, "epoch": 1571} {"train_loss": -41.7388916015625, "global_step": 190104, "epoch": 1571} {"train_loss": -39.545711517333984, "global_step": 190105, "epoch": 1571} {"train_loss": -38.19905471801758, "global_step": 190106, "epoch": 1571} {"train_loss": -40.28635787963867, "global_step": 190107, "epoch": 1571} {"train_loss": -39.57841873168945, "global_step": 190108, "epoch": 1571} {"train_loss": -39.19818878173828, "global_step": 190109, "epoch": 1571} {"train_loss": -40.86518859863281, "global_step": 190110, "epoch": 1571} {"train_loss": -40.54787826538086, "global_step": 190111, "epoch": 1571} {"train_loss": -38.243709564208984, "global_step": 190112, "epoch": 1571} {"train_loss": -40.74555206298828, "global_step": 190113, "epoch": 1571} {"train_loss": -41.91969299316406, "global_step": 190114, "epoch": 1571} {"train_loss": -39.14748764038086, "global_step": 190115, "epoch": 1571} {"train_loss": -41.55624008178711, "global_step": 190116, "epoch": 1571} {"train_loss": -41.1947021484375, "global_step": 190117, "epoch": 1571} {"train_loss": -41.15995407104492, "global_step": 190118, "epoch": 1571} {"train_loss": -40.89161682128906, "global_step": 190119, "epoch": 1571} {"train_loss": -40.45327377319336, "global_step": 190120, "epoch": 1571} {"train_loss": -41.14223861694336, "global_step": 190121, "epoch": 1571} {"train_loss": -41.0778923034668, "global_step": 190122, "epoch": 1571} {"train_loss": -41.928131103515625, "global_step": 190123, "epoch": 1571} {"train_loss": -40.19606018066406, "global_step": 190124, "epoch": 1571} {"train_loss": -39.863765716552734, "global_step": 190125, "epoch": 1571} {"train_loss": -41.0912971496582, "global_step": 190126, "epoch": 1571} {"train_loss": -42.056541442871094, "global_step": 190127, "epoch": 1571} {"train_loss": -40.28042221069336, "global_step": 190128, "epoch": 1571} {"train_loss": -40.3638801574707, "global_step": 190129, "epoch": 1571} {"train_loss": -41.62650680541992, "global_step": 190130, "epoch": 1571} {"train_loss": -42.23991012573242, "global_step": 190131, "epoch": 1571} {"train_loss": -40.43729782104492, "global_step": 190132, "epoch": 1571} {"train_loss": -39.606483459472656, "global_step": 190133, "epoch": 1571} {"train_loss": -41.586708068847656, "global_step": 190134, "epoch": 1571} {"train_loss": -41.43684387207031, "global_step": 190135, "epoch": 1571} {"train_loss": -40.6204719543457, "global_step": 190136, "epoch": 1571} {"train_loss": -40.330562591552734, "global_step": 190137, "epoch": 1571} {"train_loss": -41.9796142578125, "global_step": 190138, "epoch": 1571} {"train_loss": -40.06541061401367, "global_step": 190139, "epoch": 1571} {"train_loss": -40.688114166259766, "global_step": 190140, "epoch": 1571} {"train_loss": -42.19344711303711, "global_step": 190141, "epoch": 1571} {"train_loss": -39.30086135864258, "global_step": 190142, "epoch": 1571} {"train_loss": -41.37308883666992, "global_step": 190143, "epoch": 1571} {"train_loss": -40.45100784301758, "global_step": 190144, "epoch": 1571} {"train_loss": -40.84296417236328, "global_step": 190145, "epoch": 1571} {"train_loss": -38.70652389526367, "global_step": 190146, "epoch": 1571} {"train_loss": -40.86887741088867, "global_step": 190147, "epoch": 1571} {"train_loss": -38.84739685058594, "global_step": 190148, "epoch": 1571} {"train_loss": -31.8077335357666, "global_step": 190149, "epoch": 1571} {"train_loss": -41.769622802734375, "global_step": 190150, "epoch": 1571} {"train_loss": -38.348731994628906, "global_step": 190151, "epoch": 1571} {"train_loss": -31.099363327026367, "global_step": 190152, "epoch": 1571} {"train_loss": -38.0340690612793, "global_step": 190153, "epoch": 1571} {"train_loss": -39.12142562866211, "global_step": 190154, "epoch": 1571} {"train_loss": -36.34572982788086, "global_step": 190155, "epoch": 1571} {"train_loss": -35.108787536621094, "global_step": 190156, "epoch": 1571} {"train_loss": -36.12850570678711, "global_step": 190157, "epoch": 1571} {"train_loss": -33.36863708496094, "global_step": 190158, "epoch": 1571} {"train_loss": -37.447933197021484, "global_step": 190159, "epoch": 1571} {"train_loss": -32.64290237426758, "global_step": 190160, "epoch": 1571} {"train_loss": -29.746994018554688, "global_step": 190161, "epoch": 1571} {"train_loss": -35.08855056762695, "global_step": 190162, "epoch": 1571} {"train_loss": -36.12476348876953, "global_step": 190163, "epoch": 1571} {"train_loss": -38.69717025756836, "global_step": 190164, "epoch": 1571} {"train_loss": -33.05348205566406, "global_step": 190165, "epoch": 1571} {"train_loss": -33.15398025512695, "global_step": 190166, "epoch": 1571} {"train_loss": -37.67179489135742, "global_step": 190167, "epoch": 1571} {"train_loss": -37.27924728393555, "global_step": 190168, "epoch": 1571} {"train_loss": -35.73531723022461, "global_step": 190169, "epoch": 1571} {"train_loss": -36.729061126708984, "global_step": 190170, "epoch": 1571} {"train_loss": -36.671077728271484, "global_step": 190171, "epoch": 1571} {"train_loss": -38.98556137084961, "global_step": 190172, "epoch": 1571} {"train_loss": -38.97248077392578, "global_step": 190173, "epoch": 1571} {"train_loss": -34.0294303894043, "global_step": 190174, "epoch": 1571} {"train_loss": -38.642086029052734, "global_step": 190175, "epoch": 1571} {"train_loss": -37.92696762084961, "global_step": 190176, "epoch": 1571} {"train_loss": -39.316139221191406, "global_step": 190177, "epoch": 1571} {"train_loss": -39.20012664794922, "global_step": 190178, "epoch": 1571} {"train_loss": -38.34370803833008, "global_step": 190179, "epoch": 1571} {"train_loss": -38.61745834350586, "global_step": 190180, "epoch": 1571} {"train_loss": -38.775848388671875, "global_step": 190181, "epoch": 1571} {"train_loss": -38.69890594482422, "global_step": 190182, "epoch": 1571} {"train_loss": -38.83067321777344, "global_step": 190183, "epoch": 1571} {"train_loss": -39.253448486328125, "global_step": 190184, "epoch": 1571} {"train_loss": -39.80891036987305, "global_step": 190185, "epoch": 1571} {"train_loss": -39.695465087890625, "global_step": 190186, "epoch": 1571} {"train_loss": -39.95293045043945, "global_step": 190187, "epoch": 1571} {"train_loss": -40.24994659423828, "global_step": 190188, "epoch": 1571} {"train_loss": -40.51583480834961, "global_step": 190189, "epoch": 1571} {"train_loss": -40.09737014770508, "global_step": 190190, "epoch": 1571} {"train_loss": -40.17031478881836, "global_step": 190191, "epoch": 1571} {"train_loss": -39.566619873046875, "global_step": 190192, "epoch": 1571} {"train_loss": -39.52305603027344, "global_step": 190193, "epoch": 1571} {"train_loss": -40.59751510620117, "global_step": 190194, "epoch": 1571} {"train_loss": -39.962608337402344, "global_step": 190195, "epoch": 1571} {"train_loss": -40.377586364746094, "global_step": 190196, "epoch": 1571} {"train_loss": -39.96748733520508, "global_step": 190197, "epoch": 1571} {"train_loss": -40.748382568359375, "global_step": 190198, "epoch": 1571} {"train_loss": -40.290218353271484, "global_step": 190199, "epoch": 1571} {"train_loss": -39.86331558227539, "global_step": 190200, "epoch": 1571} {"train_loss": -41.088356018066406, "global_step": 190201, "epoch": 1571} {"train_loss": -41.02750778198242, "global_step": 190202, "epoch": 1571} {"train_loss": -40.42679977416992, "global_step": 190203, "epoch": 1571} {"train_loss": -40.82794952392578, "global_step": 190204, "epoch": 1571} {"train_loss": -40.80338668823242, "global_step": 190205, "epoch": 1571} {"train_loss": -40.76668167114258, "global_step": 190206, "epoch": 1571} {"train_loss": -40.848751068115234, "global_step": 190207, "epoch": 1571} {"train_loss": -40.67519760131836, "global_step": 190208, "epoch": 1571} {"train_loss": -40.7952766418457, "global_step": 190209, "epoch": 1571} {"train_loss": -41.33148193359375, "global_step": 190210, "epoch": 1571} {"train_loss": -39.44403287398914, "global_step": 190211, "epoch": 1571, "val_loss": 2484583.25} {"train_loss": -41.26699447631836, "global_step": 190212, "epoch": 1572} {"train_loss": -40.94364547729492, "global_step": 190213, "epoch": 1572} {"train_loss": -41.0619010925293, "global_step": 190214, "epoch": 1572} {"train_loss": -41.011226654052734, "global_step": 190215, "epoch": 1572} {"train_loss": -41.5572395324707, "global_step": 190216, "epoch": 1572} {"train_loss": -41.799285888671875, "global_step": 190217, "epoch": 1572} {"train_loss": -40.94639205932617, "global_step": 190218, "epoch": 1572} {"train_loss": -41.59928512573242, "global_step": 190219, "epoch": 1572} {"train_loss": -41.24821472167969, "global_step": 190220, "epoch": 1572} {"train_loss": -41.32716369628906, "global_step": 190221, "epoch": 1572} {"train_loss": -41.612064361572266, "global_step": 190222, "epoch": 1572} {"train_loss": -41.21446228027344, "global_step": 190223, "epoch": 1572} {"train_loss": -41.763526916503906, "global_step": 190224, "epoch": 1572} {"train_loss": -41.667640686035156, "global_step": 190225, "epoch": 1572} {"train_loss": -41.957820892333984, "global_step": 190226, "epoch": 1572} {"train_loss": -41.6839714050293, "global_step": 190227, "epoch": 1572} {"train_loss": -42.08739471435547, "global_step": 190228, "epoch": 1572} {"train_loss": -41.58686828613281, "global_step": 190229, "epoch": 1572} {"train_loss": -41.8023567199707, "global_step": 190230, "epoch": 1572} {"train_loss": -41.3571662902832, "global_step": 190231, "epoch": 1572} {"train_loss": -41.82763671875, "global_step": 190232, "epoch": 1572} {"train_loss": -41.81352233886719, "global_step": 190233, "epoch": 1572} {"train_loss": -41.967315673828125, "global_step": 190234, "epoch": 1572} {"train_loss": -42.227210998535156, "global_step": 190235, "epoch": 1572} {"train_loss": -41.75265121459961, "global_step": 190236, "epoch": 1572} {"train_loss": -42.15373611450195, "global_step": 190237, "epoch": 1572} {"train_loss": -41.97447967529297, "global_step": 190238, "epoch": 1572} {"train_loss": -41.88228225708008, "global_step": 190239, "epoch": 1572} {"train_loss": -42.001441955566406, "global_step": 190240, "epoch": 1572} {"train_loss": -41.37784957885742, "global_step": 190241, "epoch": 1572} {"train_loss": -42.22261047363281, "global_step": 190242, "epoch": 1572} {"train_loss": -42.211219787597656, "global_step": 190243, "epoch": 1572} {"train_loss": -41.9290885925293, "global_step": 190244, "epoch": 1572} {"train_loss": -41.75270462036133, "global_step": 190245, "epoch": 1572} {"train_loss": -42.123817443847656, "global_step": 190246, "epoch": 1572} {"train_loss": -42.263404846191406, "global_step": 190247, "epoch": 1572} {"train_loss": -42.45990753173828, "global_step": 190248, "epoch": 1572} {"train_loss": -42.00034713745117, "global_step": 190249, "epoch": 1572} {"train_loss": -42.47111129760742, "global_step": 190250, "epoch": 1572} {"train_loss": -41.974422454833984, "global_step": 190251, "epoch": 1572} {"train_loss": -42.4894905090332, "global_step": 190252, "epoch": 1572} {"train_loss": -42.23643493652344, "global_step": 190253, "epoch": 1572} {"train_loss": -41.79743194580078, "global_step": 190254, "epoch": 1572} {"train_loss": -42.466705322265625, "global_step": 190255, "epoch": 1572} {"train_loss": -42.30870056152344, "global_step": 190256, "epoch": 1572} {"train_loss": -42.63737106323242, "global_step": 190257, "epoch": 1572} {"train_loss": -42.19144821166992, "global_step": 190258, "epoch": 1572} {"train_loss": -42.84905242919922, "global_step": 190259, "epoch": 1572} {"train_loss": -41.27788162231445, "global_step": 190260, "epoch": 1572} {"train_loss": -41.07355880737305, "global_step": 190261, "epoch": 1572} {"train_loss": -42.2747802734375, "global_step": 190262, "epoch": 1572} {"train_loss": -41.53280258178711, "global_step": 190263, "epoch": 1572} {"train_loss": -40.785640716552734, "global_step": 190264, "epoch": 1572} {"train_loss": -41.34211349487305, "global_step": 190265, "epoch": 1572} {"train_loss": -41.52151107788086, "global_step": 190266, "epoch": 1572} {"train_loss": -41.56060791015625, "global_step": 190267, "epoch": 1572} {"train_loss": -41.79514694213867, "global_step": 190268, "epoch": 1572} {"train_loss": -41.09821701049805, "global_step": 190269, "epoch": 1572} {"train_loss": -41.65353012084961, "global_step": 190270, "epoch": 1572} {"train_loss": -41.32793045043945, "global_step": 190271, "epoch": 1572} {"train_loss": -40.465633392333984, "global_step": 190272, "epoch": 1572} {"train_loss": -40.86647415161133, "global_step": 190273, "epoch": 1572} {"train_loss": -41.325923919677734, "global_step": 190274, "epoch": 1572} {"train_loss": -41.73994445800781, "global_step": 190275, "epoch": 1572} {"train_loss": -41.580013275146484, "global_step": 190276, "epoch": 1572} {"train_loss": -40.335533142089844, "global_step": 190277, "epoch": 1572} {"train_loss": -38.690467834472656, "global_step": 190278, "epoch": 1572} {"train_loss": -36.3104362487793, "global_step": 190279, "epoch": 1572} {"train_loss": -39.10543441772461, "global_step": 190280, "epoch": 1572} {"train_loss": -41.21082305908203, "global_step": 190281, "epoch": 1572} {"train_loss": -39.31819534301758, "global_step": 190282, "epoch": 1572} {"train_loss": -36.0069465637207, "global_step": 190283, "epoch": 1572} {"train_loss": -33.286434173583984, "global_step": 190284, "epoch": 1572} {"train_loss": -38.962711334228516, "global_step": 190285, "epoch": 1572} {"train_loss": -33.87446594238281, "global_step": 190286, "epoch": 1572} {"train_loss": -32.18927001953125, "global_step": 190287, "epoch": 1572} {"train_loss": -34.853797912597656, "global_step": 190288, "epoch": 1572} {"train_loss": -37.43316650390625, "global_step": 190289, "epoch": 1572} {"train_loss": -36.062740325927734, "global_step": 190290, "epoch": 1572} {"train_loss": -39.05512619018555, "global_step": 190291, "epoch": 1572} {"train_loss": -38.23183822631836, "global_step": 190292, "epoch": 1572} {"train_loss": -38.209163665771484, "global_step": 190293, "epoch": 1572} {"train_loss": -40.091827392578125, "global_step": 190294, "epoch": 1572} {"train_loss": -39.89251708984375, "global_step": 190295, "epoch": 1572} {"train_loss": -38.86797332763672, "global_step": 190296, "epoch": 1572} {"train_loss": -38.17448043823242, "global_step": 190297, "epoch": 1572} {"train_loss": -39.72794723510742, "global_step": 190298, "epoch": 1572} {"train_loss": -37.357112884521484, "global_step": 190299, "epoch": 1572} {"train_loss": -39.91094970703125, "global_step": 190300, "epoch": 1572} {"train_loss": -39.401283264160156, "global_step": 190301, "epoch": 1572} {"train_loss": -39.22430419921875, "global_step": 190302, "epoch": 1572} {"train_loss": -39.29352951049805, "global_step": 190303, "epoch": 1572} {"train_loss": -39.891815185546875, "global_step": 190304, "epoch": 1572} {"train_loss": -39.71179962158203, "global_step": 190305, "epoch": 1572} {"train_loss": -40.5891227722168, "global_step": 190306, "epoch": 1572} {"train_loss": -40.53382110595703, "global_step": 190307, "epoch": 1572} {"train_loss": -40.65464782714844, "global_step": 190308, "epoch": 1572} {"train_loss": -41.01920700073242, "global_step": 190309, "epoch": 1572} {"train_loss": -39.9074592590332, "global_step": 190310, "epoch": 1572} {"train_loss": -40.69174575805664, "global_step": 190311, "epoch": 1572} {"train_loss": -40.67066192626953, "global_step": 190312, "epoch": 1572} {"train_loss": -41.395263671875, "global_step": 190313, "epoch": 1572} {"train_loss": -41.13197708129883, "global_step": 190314, "epoch": 1572} {"train_loss": -40.96730041503906, "global_step": 190315, "epoch": 1572} {"train_loss": -41.79811477661133, "global_step": 190316, "epoch": 1572} {"train_loss": -41.42083740234375, "global_step": 190317, "epoch": 1572} {"train_loss": -41.55984115600586, "global_step": 190318, "epoch": 1572} {"train_loss": -41.491920471191406, "global_step": 190319, "epoch": 1572} {"train_loss": -41.4793586730957, "global_step": 190320, "epoch": 1572} {"train_loss": -41.31074142456055, "global_step": 190321, "epoch": 1572} {"train_loss": -41.1342887878418, "global_step": 190322, "epoch": 1572} {"train_loss": -41.65829086303711, "global_step": 190323, "epoch": 1572} {"train_loss": -41.615577697753906, "global_step": 190324, "epoch": 1572} {"train_loss": -41.539520263671875, "global_step": 190325, "epoch": 1572} {"train_loss": -41.69865417480469, "global_step": 190326, "epoch": 1572} {"train_loss": -42.05056381225586, "global_step": 190327, "epoch": 1572} {"train_loss": -41.4989013671875, "global_step": 190328, "epoch": 1572} {"train_loss": -41.89870834350586, "global_step": 190329, "epoch": 1572} {"train_loss": -41.9495735168457, "global_step": 190330, "epoch": 1572} {"train_loss": -41.61725997924805, "global_step": 190331, "epoch": 1572} {"train_loss": -40.75833968485682, "global_step": 190332, "epoch": 1572, "val_loss": 2446039.25} {"train_loss": -41.93597412109375, "global_step": 190333, "epoch": 1573} {"train_loss": -41.76430130004883, "global_step": 190334, "epoch": 1573} {"train_loss": -41.84653854370117, "global_step": 190335, "epoch": 1573} {"train_loss": -42.154659271240234, "global_step": 190336, "epoch": 1573} {"train_loss": -41.60439682006836, "global_step": 190337, "epoch": 1573} {"train_loss": -41.38126754760742, "global_step": 190338, "epoch": 1573} {"train_loss": -41.53071594238281, "global_step": 190339, "epoch": 1573} {"train_loss": -42.19472122192383, "global_step": 190340, "epoch": 1573} {"train_loss": -42.26556396484375, "global_step": 190341, "epoch": 1573} {"train_loss": -42.20258331298828, "global_step": 190342, "epoch": 1573} {"train_loss": -41.95093536376953, "global_step": 190343, "epoch": 1573} {"train_loss": -42.295127868652344, "global_step": 190344, "epoch": 1573} {"train_loss": -42.28152084350586, "global_step": 190345, "epoch": 1573} {"train_loss": -42.05576705932617, "global_step": 190346, "epoch": 1573} {"train_loss": -42.27360153198242, "global_step": 190347, "epoch": 1573} {"train_loss": -41.796504974365234, "global_step": 190348, "epoch": 1573} {"train_loss": -42.47749710083008, "global_step": 190349, "epoch": 1573} {"train_loss": -42.22208786010742, "global_step": 190350, "epoch": 1573} {"train_loss": -42.40058135986328, "global_step": 190351, "epoch": 1573} {"train_loss": -42.04135513305664, "global_step": 190352, "epoch": 1573} {"train_loss": -42.13159942626953, "global_step": 190353, "epoch": 1573} {"train_loss": -42.38839340209961, "global_step": 190354, "epoch": 1573} {"train_loss": -42.05743408203125, "global_step": 190355, "epoch": 1573} {"train_loss": -42.33842468261719, "global_step": 190356, "epoch": 1573} {"train_loss": -42.30767822265625, "global_step": 190357, "epoch": 1573} {"train_loss": -42.4345817565918, "global_step": 190358, "epoch": 1573} {"train_loss": -41.95487594604492, "global_step": 190359, "epoch": 1573} {"train_loss": -42.210872650146484, "global_step": 190360, "epoch": 1573} {"train_loss": -41.79780960083008, "global_step": 190361, "epoch": 1573} {"train_loss": -42.42497634887695, "global_step": 190362, "epoch": 1573} {"train_loss": -42.12268829345703, "global_step": 190363, "epoch": 1573} {"train_loss": -42.34001541137695, "global_step": 190364, "epoch": 1573} {"train_loss": -42.27976608276367, "global_step": 190365, "epoch": 1573} {"train_loss": -42.14798355102539, "global_step": 190366, "epoch": 1573} {"train_loss": -42.1142692565918, "global_step": 190367, "epoch": 1573} {"train_loss": -42.138404846191406, "global_step": 190368, "epoch": 1573} {"train_loss": -42.067134857177734, "global_step": 190369, "epoch": 1573} {"train_loss": -42.434356689453125, "global_step": 190370, "epoch": 1573} {"train_loss": -42.51436996459961, "global_step": 190371, "epoch": 1573} {"train_loss": -42.01021194458008, "global_step": 190372, "epoch": 1573} {"train_loss": -41.90482711791992, "global_step": 190373, "epoch": 1573} {"train_loss": -41.9171028137207, "global_step": 190374, "epoch": 1573} {"train_loss": -41.858943939208984, "global_step": 190375, "epoch": 1573} {"train_loss": -41.47684097290039, "global_step": 190376, "epoch": 1573} {"train_loss": -41.74691390991211, "global_step": 190377, "epoch": 1573} {"train_loss": -41.878868103027344, "global_step": 190378, "epoch": 1573} {"train_loss": -40.879150390625, "global_step": 190379, "epoch": 1573} {"train_loss": -41.389678955078125, "global_step": 190380, "epoch": 1573} {"train_loss": -40.779083251953125, "global_step": 190381, "epoch": 1573} {"train_loss": -39.64204025268555, "global_step": 190382, "epoch": 1573} {"train_loss": -42.35171127319336, "global_step": 190383, "epoch": 1573} {"train_loss": -39.921566009521484, "global_step": 190384, "epoch": 1573} {"train_loss": -37.298240661621094, "global_step": 190385, "epoch": 1573} {"train_loss": -39.55260467529297, "global_step": 190386, "epoch": 1573} {"train_loss": -39.931488037109375, "global_step": 190387, "epoch": 1573} {"train_loss": -40.730403900146484, "global_step": 190388, "epoch": 1573} {"train_loss": -40.63900375366211, "global_step": 190389, "epoch": 1573} {"train_loss": -41.40837478637695, "global_step": 190390, "epoch": 1573} {"train_loss": -40.513816833496094, "global_step": 190391, "epoch": 1573} {"train_loss": -40.51721954345703, "global_step": 190392, "epoch": 1573} {"train_loss": -40.451778411865234, "global_step": 190393, "epoch": 1573} {"train_loss": -39.343055725097656, "global_step": 190394, "epoch": 1573} {"train_loss": -38.94941329956055, "global_step": 190395, "epoch": 1573} {"train_loss": -39.71718978881836, "global_step": 190396, "epoch": 1573} {"train_loss": -40.62820053100586, "global_step": 190397, "epoch": 1573} {"train_loss": -41.05033493041992, "global_step": 190398, "epoch": 1573} {"train_loss": -40.357357025146484, "global_step": 190399, "epoch": 1573} {"train_loss": -41.71247482299805, "global_step": 190400, "epoch": 1573} {"train_loss": -41.40158462524414, "global_step": 190401, "epoch": 1573} {"train_loss": -40.970760345458984, "global_step": 190402, "epoch": 1573} {"train_loss": -41.5488395690918, "global_step": 190403, "epoch": 1573} {"train_loss": -41.976898193359375, "global_step": 190404, "epoch": 1573} {"train_loss": -41.61102294921875, "global_step": 190405, "epoch": 1573} {"train_loss": -41.55830001831055, "global_step": 190406, "epoch": 1573} {"train_loss": -41.431819915771484, "global_step": 190407, "epoch": 1573} {"train_loss": -41.145015716552734, "global_step": 190408, "epoch": 1573} {"train_loss": -40.64028549194336, "global_step": 190409, "epoch": 1573} {"train_loss": -39.84078598022461, "global_step": 190410, "epoch": 1573} {"train_loss": -40.744293212890625, "global_step": 190411, "epoch": 1573} {"train_loss": -41.63745880126953, "global_step": 190412, "epoch": 1573} {"train_loss": -41.20808792114258, "global_step": 190413, "epoch": 1573} {"train_loss": -38.8966178894043, "global_step": 190414, "epoch": 1573} {"train_loss": -40.33994674682617, "global_step": 190415, "epoch": 1573} {"train_loss": -41.74518585205078, "global_step": 190416, "epoch": 1573} {"train_loss": -40.06548309326172, "global_step": 190417, "epoch": 1573} {"train_loss": -37.399349212646484, "global_step": 190418, "epoch": 1573} {"train_loss": -40.023860931396484, "global_step": 190419, "epoch": 1573} {"train_loss": -42.000213623046875, "global_step": 190420, "epoch": 1573} {"train_loss": -39.91008377075195, "global_step": 190421, "epoch": 1573} {"train_loss": -40.28483963012695, "global_step": 190422, "epoch": 1573} {"train_loss": -41.794715881347656, "global_step": 190423, "epoch": 1573} {"train_loss": -40.656490325927734, "global_step": 190424, "epoch": 1573} {"train_loss": -40.296722412109375, "global_step": 190425, "epoch": 1573} {"train_loss": -42.02775573730469, "global_step": 190426, "epoch": 1573} {"train_loss": -40.71897506713867, "global_step": 190427, "epoch": 1573} {"train_loss": -40.553192138671875, "global_step": 190428, "epoch": 1573} {"train_loss": -42.12685775756836, "global_step": 190429, "epoch": 1573} {"train_loss": -40.73108673095703, "global_step": 190430, "epoch": 1573} {"train_loss": -41.5527229309082, "global_step": 190431, "epoch": 1573} {"train_loss": -42.10029220581055, "global_step": 190432, "epoch": 1573} {"train_loss": -41.47221755981445, "global_step": 190433, "epoch": 1573} {"train_loss": -41.33683776855469, "global_step": 190434, "epoch": 1573} {"train_loss": -42.14065170288086, "global_step": 190435, "epoch": 1573} {"train_loss": -41.7574577331543, "global_step": 190436, "epoch": 1573} {"train_loss": -41.167057037353516, "global_step": 190437, "epoch": 1573} {"train_loss": -41.858375549316406, "global_step": 190438, "epoch": 1573} {"train_loss": -41.41554260253906, "global_step": 190439, "epoch": 1573} {"train_loss": -41.346771240234375, "global_step": 190440, "epoch": 1573} {"train_loss": -41.378292083740234, "global_step": 190441, "epoch": 1573} {"train_loss": -41.710365295410156, "global_step": 190442, "epoch": 1573} {"train_loss": -41.96540451049805, "global_step": 190443, "epoch": 1573} {"train_loss": -42.01203155517578, "global_step": 190444, "epoch": 1573} {"train_loss": -40.80371856689453, "global_step": 190445, "epoch": 1573} {"train_loss": -41.351688385009766, "global_step": 190446, "epoch": 1573} {"train_loss": -41.956905364990234, "global_step": 190447, "epoch": 1573} {"train_loss": -42.12038803100586, "global_step": 190448, "epoch": 1573} {"train_loss": -41.865169525146484, "global_step": 190449, "epoch": 1573} {"train_loss": -41.6175651550293, "global_step": 190450, "epoch": 1573} {"train_loss": -42.505313873291016, "global_step": 190451, "epoch": 1573} {"train_loss": -41.666934967041016, "global_step": 190452, "epoch": 1573} {"train_loss": -41.388822476725935, "global_step": 190453, "epoch": 1573, "val_loss": 2436799.75} {"train_loss": -42.53729248046875, "global_step": 190454, "epoch": 1574} {"train_loss": -41.847042083740234, "global_step": 190455, "epoch": 1574} {"train_loss": -42.504302978515625, "global_step": 190456, "epoch": 1574} {"train_loss": -42.33727264404297, "global_step": 190457, "epoch": 1574} {"train_loss": -42.654998779296875, "global_step": 190458, "epoch": 1574} {"train_loss": -42.196250915527344, "global_step": 190459, "epoch": 1574} {"train_loss": -42.385005950927734, "global_step": 190460, "epoch": 1574} {"train_loss": -42.132686614990234, "global_step": 190461, "epoch": 1574} {"train_loss": -42.51327133178711, "global_step": 190462, "epoch": 1574} {"train_loss": -42.18562316894531, "global_step": 190463, "epoch": 1574} {"train_loss": -42.876155853271484, "global_step": 190464, "epoch": 1574} {"train_loss": -41.80428695678711, "global_step": 190465, "epoch": 1574} {"train_loss": -42.462955474853516, "global_step": 190466, "epoch": 1574} {"train_loss": -42.19900131225586, "global_step": 190467, "epoch": 1574} {"train_loss": -41.95720291137695, "global_step": 190468, "epoch": 1574} {"train_loss": -42.97218704223633, "global_step": 190469, "epoch": 1574} {"train_loss": -42.34269714355469, "global_step": 190470, "epoch": 1574} {"train_loss": -42.17942428588867, "global_step": 190471, "epoch": 1574} {"train_loss": -42.63215255737305, "global_step": 190472, "epoch": 1574} {"train_loss": -42.330020904541016, "global_step": 190473, "epoch": 1574} {"train_loss": -42.37763214111328, "global_step": 190474, "epoch": 1574} {"train_loss": -42.41732406616211, "global_step": 190475, "epoch": 1574} {"train_loss": -42.24722671508789, "global_step": 190476, "epoch": 1574} {"train_loss": -42.608131408691406, "global_step": 190477, "epoch": 1574} {"train_loss": -42.292724609375, "global_step": 190478, "epoch": 1574} {"train_loss": -41.808746337890625, "global_step": 190479, "epoch": 1574} {"train_loss": -42.660030364990234, "global_step": 190480, "epoch": 1574} {"train_loss": -41.344032287597656, "global_step": 190481, "epoch": 1574} {"train_loss": -41.92203903198242, "global_step": 190482, "epoch": 1574} {"train_loss": -42.639862060546875, "global_step": 190483, "epoch": 1574} {"train_loss": -41.71198272705078, "global_step": 190484, "epoch": 1574} {"train_loss": -41.91437530517578, "global_step": 190485, "epoch": 1574} {"train_loss": -42.35915756225586, "global_step": 190486, "epoch": 1574} {"train_loss": -41.75263595581055, "global_step": 190487, "epoch": 1574} {"train_loss": -41.685699462890625, "global_step": 190488, "epoch": 1574} {"train_loss": -41.89402770996094, "global_step": 190489, "epoch": 1574} {"train_loss": -41.690940856933594, "global_step": 190490, "epoch": 1574} {"train_loss": -42.343692779541016, "global_step": 190491, "epoch": 1574} {"train_loss": -41.01005172729492, "global_step": 190492, "epoch": 1574} {"train_loss": -40.578407287597656, "global_step": 190493, "epoch": 1574} {"train_loss": -41.48802185058594, "global_step": 190494, "epoch": 1574} {"train_loss": -41.263309478759766, "global_step": 190495, "epoch": 1574} {"train_loss": -40.32268524169922, "global_step": 190496, "epoch": 1574} {"train_loss": -41.40434646606445, "global_step": 190497, "epoch": 1574} {"train_loss": -40.76557159423828, "global_step": 190498, "epoch": 1574} {"train_loss": -41.0694465637207, "global_step": 190499, "epoch": 1574} {"train_loss": -42.051151275634766, "global_step": 190500, "epoch": 1574} {"train_loss": -41.594478607177734, "global_step": 190501, "epoch": 1574} {"train_loss": -39.61581039428711, "global_step": 190502, "epoch": 1574} {"train_loss": -39.42033767700195, "global_step": 190503, "epoch": 1574} {"train_loss": -39.950984954833984, "global_step": 190504, "epoch": 1574} {"train_loss": -39.70353317260742, "global_step": 190505, "epoch": 1574} {"train_loss": -39.13569259643555, "global_step": 190506, "epoch": 1574} {"train_loss": -40.8691520690918, "global_step": 190507, "epoch": 1574} {"train_loss": -39.74135971069336, "global_step": 190508, "epoch": 1574} {"train_loss": -37.66233444213867, "global_step": 190509, "epoch": 1574} {"train_loss": -40.89645767211914, "global_step": 190510, "epoch": 1574} {"train_loss": -40.15766143798828, "global_step": 190511, "epoch": 1574} {"train_loss": -40.68134307861328, "global_step": 190512, "epoch": 1574} {"train_loss": -40.18579864501953, "global_step": 190513, "epoch": 1574} {"train_loss": -41.79378128051758, "global_step": 190514, "epoch": 1574} {"train_loss": -39.25633239746094, "global_step": 190515, "epoch": 1574} {"train_loss": -41.18046569824219, "global_step": 190516, "epoch": 1574} {"train_loss": -41.06630325317383, "global_step": 190517, "epoch": 1574} {"train_loss": -37.71992111206055, "global_step": 190518, "epoch": 1574} {"train_loss": -42.023868560791016, "global_step": 190519, "epoch": 1574} {"train_loss": -39.15736770629883, "global_step": 190520, "epoch": 1574} {"train_loss": -38.4621467590332, "global_step": 190521, "epoch": 1574} {"train_loss": -39.58079147338867, "global_step": 190522, "epoch": 1574} {"train_loss": -41.21529769897461, "global_step": 190523, "epoch": 1574} {"train_loss": -40.40732955932617, "global_step": 190524, "epoch": 1574} {"train_loss": -40.99318313598633, "global_step": 190525, "epoch": 1574} {"train_loss": -39.25395965576172, "global_step": 190526, "epoch": 1574} {"train_loss": -40.61235427856445, "global_step": 190527, "epoch": 1574} {"train_loss": -40.00581741333008, "global_step": 190528, "epoch": 1574} {"train_loss": -39.50069046020508, "global_step": 190529, "epoch": 1574} {"train_loss": -40.88580322265625, "global_step": 190530, "epoch": 1574} {"train_loss": -40.295108795166016, "global_step": 190531, "epoch": 1574} {"train_loss": -40.97988510131836, "global_step": 190532, "epoch": 1574} {"train_loss": -39.95405960083008, "global_step": 190533, "epoch": 1574} {"train_loss": -41.75033187866211, "global_step": 190534, "epoch": 1574} {"train_loss": -40.18206024169922, "global_step": 190535, "epoch": 1574} {"train_loss": -40.987056732177734, "global_step": 190536, "epoch": 1574} {"train_loss": -41.83711624145508, "global_step": 190537, "epoch": 1574} {"train_loss": -40.62211990356445, "global_step": 190538, "epoch": 1574} {"train_loss": -41.295955657958984, "global_step": 190539, "epoch": 1574} {"train_loss": -41.01762771606445, "global_step": 190540, "epoch": 1574} {"train_loss": -41.51505661010742, "global_step": 190541, "epoch": 1574} {"train_loss": -41.931156158447266, "global_step": 190542, "epoch": 1574} {"train_loss": -41.74699783325195, "global_step": 190543, "epoch": 1574} {"train_loss": -42.137630462646484, "global_step": 190544, "epoch": 1574} {"train_loss": -41.94810485839844, "global_step": 190545, "epoch": 1574} {"train_loss": -42.19795227050781, "global_step": 190546, "epoch": 1574} {"train_loss": -41.78827667236328, "global_step": 190547, "epoch": 1574} {"train_loss": -42.124427795410156, "global_step": 190548, "epoch": 1574} {"train_loss": -42.27882766723633, "global_step": 190549, "epoch": 1574} {"train_loss": -42.048152923583984, "global_step": 190550, "epoch": 1574} {"train_loss": -42.26455307006836, "global_step": 190551, "epoch": 1574} {"train_loss": -42.455867767333984, "global_step": 190552, "epoch": 1574} {"train_loss": -42.47282791137695, "global_step": 190553, "epoch": 1574} {"train_loss": -42.3661994934082, "global_step": 190554, "epoch": 1574} {"train_loss": -42.52718734741211, "global_step": 190555, "epoch": 1574} {"train_loss": -41.81023025512695, "global_step": 190556, "epoch": 1574} {"train_loss": -42.41933059692383, "global_step": 190557, "epoch": 1574} {"train_loss": -42.28697204589844, "global_step": 190558, "epoch": 1574} {"train_loss": -42.04352951049805, "global_step": 190559, "epoch": 1574} {"train_loss": -42.17974853515625, "global_step": 190560, "epoch": 1574} {"train_loss": -42.9508171081543, "global_step": 190561, "epoch": 1574} {"train_loss": -42.555904388427734, "global_step": 190562, "epoch": 1574} {"train_loss": -42.85315704345703, "global_step": 190563, "epoch": 1574} {"train_loss": -42.41605758666992, "global_step": 190564, "epoch": 1574} {"train_loss": -42.235836029052734, "global_step": 190565, "epoch": 1574} {"train_loss": -42.921504974365234, "global_step": 190566, "epoch": 1574} {"train_loss": -42.83395004272461, "global_step": 190567, "epoch": 1574} {"train_loss": -42.438819885253906, "global_step": 190568, "epoch": 1574} {"train_loss": -42.70096969604492, "global_step": 190569, "epoch": 1574} {"train_loss": -42.62500762939453, "global_step": 190570, "epoch": 1574} {"train_loss": -42.722896575927734, "global_step": 190571, "epoch": 1574} {"train_loss": -42.4255256652832, "global_step": 190572, "epoch": 1574} {"train_loss": -42.3340950012207, "global_step": 190573, "epoch": 1574} {"train_loss": -41.535599700675526, "global_step": 190574, "epoch": 1574, "val_loss": 2450072.75} {"train_loss": -42.744686126708984, "global_step": 190575, "epoch": 1575} {"train_loss": -42.76213836669922, "global_step": 190576, "epoch": 1575} {"train_loss": -42.909263610839844, "global_step": 190577, "epoch": 1575} {"train_loss": -42.496402740478516, "global_step": 190578, "epoch": 1575} {"train_loss": -42.93378448486328, "global_step": 190579, "epoch": 1575} {"train_loss": -42.73807907104492, "global_step": 190580, "epoch": 1575} {"train_loss": -42.56562042236328, "global_step": 190581, "epoch": 1575} {"train_loss": -43.00178146362305, "global_step": 190582, "epoch": 1575} {"train_loss": -42.354270935058594, "global_step": 190583, "epoch": 1575} {"train_loss": -43.12900924682617, "global_step": 190584, "epoch": 1575} {"train_loss": -42.46991729736328, "global_step": 190585, "epoch": 1575} {"train_loss": -41.98806381225586, "global_step": 190586, "epoch": 1575} {"train_loss": -41.86376953125, "global_step": 190587, "epoch": 1575} {"train_loss": -41.577781677246094, "global_step": 190588, "epoch": 1575} {"train_loss": -42.05121612548828, "global_step": 190589, "epoch": 1575} {"train_loss": -41.984771728515625, "global_step": 190590, "epoch": 1575} {"train_loss": -40.632240295410156, "global_step": 190591, "epoch": 1575} {"train_loss": -41.69658279418945, "global_step": 190592, "epoch": 1575} {"train_loss": -41.193641662597656, "global_step": 190593, "epoch": 1575} {"train_loss": -42.20613098144531, "global_step": 190594, "epoch": 1575} {"train_loss": -41.93943405151367, "global_step": 190595, "epoch": 1575} {"train_loss": -41.34313201904297, "global_step": 190596, "epoch": 1575} {"train_loss": -40.6390380859375, "global_step": 190597, "epoch": 1575} {"train_loss": -39.9485969543457, "global_step": 190598, "epoch": 1575} {"train_loss": -40.24942398071289, "global_step": 190599, "epoch": 1575} {"train_loss": -41.18214797973633, "global_step": 190600, "epoch": 1575} {"train_loss": -41.625553131103516, "global_step": 190601, "epoch": 1575} {"train_loss": -38.629581451416016, "global_step": 190602, "epoch": 1575} {"train_loss": -38.59431838989258, "global_step": 190603, "epoch": 1575} {"train_loss": -40.51901626586914, "global_step": 190604, "epoch": 1575} {"train_loss": -39.598609924316406, "global_step": 190605, "epoch": 1575} {"train_loss": -41.17108917236328, "global_step": 190606, "epoch": 1575} {"train_loss": -41.07748031616211, "global_step": 190607, "epoch": 1575} {"train_loss": -40.62893295288086, "global_step": 190608, "epoch": 1575} {"train_loss": -41.880699157714844, "global_step": 190609, "epoch": 1575} {"train_loss": -40.793121337890625, "global_step": 190610, "epoch": 1575} {"train_loss": -41.022308349609375, "global_step": 190611, "epoch": 1575} {"train_loss": -39.727569580078125, "global_step": 190612, "epoch": 1575} {"train_loss": -38.215206146240234, "global_step": 190613, "epoch": 1575} {"train_loss": -41.29800033569336, "global_step": 190614, "epoch": 1575} {"train_loss": -40.608978271484375, "global_step": 190615, "epoch": 1575} {"train_loss": -40.61568069458008, "global_step": 190616, "epoch": 1575} {"train_loss": -41.095516204833984, "global_step": 190617, "epoch": 1575} {"train_loss": -39.754756927490234, "global_step": 190618, "epoch": 1575} {"train_loss": -40.979522705078125, "global_step": 190619, "epoch": 1575} {"train_loss": -40.89686965942383, "global_step": 190620, "epoch": 1575} {"train_loss": -40.03064727783203, "global_step": 190621, "epoch": 1575} {"train_loss": -40.982627868652344, "global_step": 190622, "epoch": 1575} {"train_loss": -41.20588684082031, "global_step": 190623, "epoch": 1575} {"train_loss": -40.840152740478516, "global_step": 190624, "epoch": 1575} {"train_loss": -40.056453704833984, "global_step": 190625, "epoch": 1575} {"train_loss": -39.65802764892578, "global_step": 190626, "epoch": 1575} {"train_loss": -41.957679748535156, "global_step": 190627, "epoch": 1575} {"train_loss": -40.201107025146484, "global_step": 190628, "epoch": 1575} {"train_loss": -40.48769760131836, "global_step": 190629, "epoch": 1575} {"train_loss": -40.7883415222168, "global_step": 190630, "epoch": 1575} {"train_loss": -41.55576705932617, "global_step": 190631, "epoch": 1575} {"train_loss": -39.77411651611328, "global_step": 190632, "epoch": 1575} {"train_loss": -41.477325439453125, "global_step": 190633, "epoch": 1575} {"train_loss": -41.097625732421875, "global_step": 190634, "epoch": 1575} {"train_loss": -41.88459396362305, "global_step": 190635, "epoch": 1575} {"train_loss": -41.55021286010742, "global_step": 190636, "epoch": 1575} {"train_loss": -41.11562728881836, "global_step": 190637, "epoch": 1575} {"train_loss": -42.312408447265625, "global_step": 190638, "epoch": 1575} {"train_loss": -41.24467849731445, "global_step": 190639, "epoch": 1575} {"train_loss": -41.1186408996582, "global_step": 190640, "epoch": 1575} {"train_loss": -40.63911437988281, "global_step": 190641, "epoch": 1575} {"train_loss": -41.75249481201172, "global_step": 190642, "epoch": 1575} {"train_loss": -42.077449798583984, "global_step": 190643, "epoch": 1575} {"train_loss": -41.707366943359375, "global_step": 190644, "epoch": 1575} {"train_loss": -40.13053512573242, "global_step": 190645, "epoch": 1575} {"train_loss": -41.30033493041992, "global_step": 190646, "epoch": 1575} {"train_loss": -42.32572555541992, "global_step": 190647, "epoch": 1575} {"train_loss": -40.34318161010742, "global_step": 190648, "epoch": 1575} {"train_loss": -38.37401580810547, "global_step": 190649, "epoch": 1575} {"train_loss": -41.8159065246582, "global_step": 190650, "epoch": 1575} {"train_loss": -39.79453659057617, "global_step": 190651, "epoch": 1575} {"train_loss": -36.809295654296875, "global_step": 190652, "epoch": 1575} {"train_loss": -34.46323776245117, "global_step": 190653, "epoch": 1575} {"train_loss": -37.023414611816406, "global_step": 190654, "epoch": 1575} {"train_loss": -36.94763946533203, "global_step": 190655, "epoch": 1575} {"train_loss": -32.7594108581543, "global_step": 190656, "epoch": 1575} {"train_loss": -40.038272857666016, "global_step": 190657, "epoch": 1575} {"train_loss": -36.85389709472656, "global_step": 190658, "epoch": 1575} {"train_loss": -37.55221176147461, "global_step": 190659, "epoch": 1575} {"train_loss": -39.407379150390625, "global_step": 190660, "epoch": 1575} {"train_loss": -37.958839416503906, "global_step": 190661, "epoch": 1575} {"train_loss": -41.01573181152344, "global_step": 190662, "epoch": 1575} {"train_loss": -39.24589157104492, "global_step": 190663, "epoch": 1575} {"train_loss": -40.95882797241211, "global_step": 190664, "epoch": 1575} {"train_loss": -37.51169204711914, "global_step": 190665, "epoch": 1575} {"train_loss": -41.113826751708984, "global_step": 190666, "epoch": 1575} {"train_loss": -38.79819869995117, "global_step": 190667, "epoch": 1575} {"train_loss": -40.69526290893555, "global_step": 190668, "epoch": 1575} {"train_loss": -39.414180755615234, "global_step": 190669, "epoch": 1575} {"train_loss": -41.0755729675293, "global_step": 190670, "epoch": 1575} {"train_loss": -39.440608978271484, "global_step": 190671, "epoch": 1575} {"train_loss": -40.96820068359375, "global_step": 190672, "epoch": 1575} {"train_loss": -39.98868942260742, "global_step": 190673, "epoch": 1575} {"train_loss": -41.11491775512695, "global_step": 190674, "epoch": 1575} {"train_loss": -40.489967346191406, "global_step": 190675, "epoch": 1575} {"train_loss": -41.40731430053711, "global_step": 190676, "epoch": 1575} {"train_loss": -41.48518371582031, "global_step": 190677, "epoch": 1575} {"train_loss": -41.4355583190918, "global_step": 190678, "epoch": 1575} {"train_loss": -41.10297393798828, "global_step": 190679, "epoch": 1575} {"train_loss": -41.1961555480957, "global_step": 190680, "epoch": 1575} {"train_loss": -41.41969680786133, "global_step": 190681, "epoch": 1575} {"train_loss": -41.97750473022461, "global_step": 190682, "epoch": 1575} {"train_loss": -41.1745719909668, "global_step": 190683, "epoch": 1575} {"train_loss": -41.520870208740234, "global_step": 190684, "epoch": 1575} {"train_loss": -42.259456634521484, "global_step": 190685, "epoch": 1575} {"train_loss": -42.0655403137207, "global_step": 190686, "epoch": 1575} {"train_loss": -42.090938568115234, "global_step": 190687, "epoch": 1575} {"train_loss": -41.84500503540039, "global_step": 190688, "epoch": 1575} {"train_loss": -42.24172592163086, "global_step": 190689, "epoch": 1575} {"train_loss": -42.04172897338867, "global_step": 190690, "epoch": 1575} {"train_loss": -42.243553161621094, "global_step": 190691, "epoch": 1575} {"train_loss": -42.14767074584961, "global_step": 190692, "epoch": 1575} {"train_loss": -41.6754264831543, "global_step": 190693, "epoch": 1575} {"train_loss": -42.18967819213867, "global_step": 190694, "epoch": 1575} {"train_loss": -40.79627643931996, "global_step": 190695, "epoch": 1575, "val_loss": 2518654.5} {"train_loss": -42.35227584838867, "global_step": 190696, "epoch": 1576} {"train_loss": -42.29308319091797, "global_step": 190697, "epoch": 1576} {"train_loss": -42.07748031616211, "global_step": 190698, "epoch": 1576} {"train_loss": -42.35799789428711, "global_step": 190699, "epoch": 1576} {"train_loss": -42.149696350097656, "global_step": 190700, "epoch": 1576} {"train_loss": -42.65925216674805, "global_step": 190701, "epoch": 1576} {"train_loss": -42.420616149902344, "global_step": 190702, "epoch": 1576} {"train_loss": -42.990440368652344, "global_step": 190703, "epoch": 1576} {"train_loss": -42.70988082885742, "global_step": 190704, "epoch": 1576} {"train_loss": -42.35995101928711, "global_step": 190705, "epoch": 1576} {"train_loss": -42.782474517822266, "global_step": 190706, "epoch": 1576} {"train_loss": -42.2637825012207, "global_step": 190707, "epoch": 1576} {"train_loss": -42.41965866088867, "global_step": 190708, "epoch": 1576} {"train_loss": -42.34360885620117, "global_step": 190709, "epoch": 1576} {"train_loss": -42.8870849609375, "global_step": 190710, "epoch": 1576} {"train_loss": -42.37115478515625, "global_step": 190711, "epoch": 1576} {"train_loss": -42.24467086791992, "global_step": 190712, "epoch": 1576} {"train_loss": -42.874237060546875, "global_step": 190713, "epoch": 1576} {"train_loss": -42.928192138671875, "global_step": 190714, "epoch": 1576} {"train_loss": -42.82722091674805, "global_step": 190715, "epoch": 1576} {"train_loss": -42.77432632446289, "global_step": 190716, "epoch": 1576} {"train_loss": -43.10567855834961, "global_step": 190717, "epoch": 1576} {"train_loss": -42.75307083129883, "global_step": 190718, "epoch": 1576} {"train_loss": -42.88629150390625, "global_step": 190719, "epoch": 1576} {"train_loss": -43.100669860839844, "global_step": 190720, "epoch": 1576} {"train_loss": -42.99394989013672, "global_step": 190721, "epoch": 1576} {"train_loss": -42.68036651611328, "global_step": 190722, "epoch": 1576} {"train_loss": -42.598602294921875, "global_step": 190723, "epoch": 1576} {"train_loss": -42.121849060058594, "global_step": 190724, "epoch": 1576} {"train_loss": -42.34662628173828, "global_step": 190725, "epoch": 1576} {"train_loss": -42.677734375, "global_step": 190726, "epoch": 1576} {"train_loss": -42.87050247192383, "global_step": 190727, "epoch": 1576} {"train_loss": -42.68209457397461, "global_step": 190728, "epoch": 1576} {"train_loss": -42.57587814331055, "global_step": 190729, "epoch": 1576} {"train_loss": -43.02267074584961, "global_step": 190730, "epoch": 1576} {"train_loss": -42.3541259765625, "global_step": 190731, "epoch": 1576} {"train_loss": -43.0305290222168, "global_step": 190732, "epoch": 1576} {"train_loss": -42.87168884277344, "global_step": 190733, "epoch": 1576} {"train_loss": -42.4669075012207, "global_step": 190734, "epoch": 1576} {"train_loss": -40.801753997802734, "global_step": 190735, "epoch": 1576} {"train_loss": -37.87183380126953, "global_step": 190736, "epoch": 1576} {"train_loss": -36.210845947265625, "global_step": 190737, "epoch": 1576} {"train_loss": -41.29566192626953, "global_step": 190738, "epoch": 1576} {"train_loss": -41.46209716796875, "global_step": 190739, "epoch": 1576} {"train_loss": -37.704986572265625, "global_step": 190740, "epoch": 1576} {"train_loss": -36.51070785522461, "global_step": 190741, "epoch": 1576} {"train_loss": -38.920894622802734, "global_step": 190742, "epoch": 1576} {"train_loss": -39.81222152709961, "global_step": 190743, "epoch": 1576} {"train_loss": -39.90214920043945, "global_step": 190744, "epoch": 1576} {"train_loss": -41.545902252197266, "global_step": 190745, "epoch": 1576} {"train_loss": -41.26865768432617, "global_step": 190746, "epoch": 1576} {"train_loss": -40.66096496582031, "global_step": 190747, "epoch": 1576} {"train_loss": -40.430580139160156, "global_step": 190748, "epoch": 1576} {"train_loss": -40.41912841796875, "global_step": 190749, "epoch": 1576} {"train_loss": -38.73714828491211, "global_step": 190750, "epoch": 1576} {"train_loss": -40.0439567565918, "global_step": 190751, "epoch": 1576} {"train_loss": -37.9779167175293, "global_step": 190752, "epoch": 1576} {"train_loss": -37.39650344848633, "global_step": 190753, "epoch": 1576} {"train_loss": -38.57462692260742, "global_step": 190754, "epoch": 1576} {"train_loss": -41.017452239990234, "global_step": 190755, "epoch": 1576} {"train_loss": -37.649269104003906, "global_step": 190756, "epoch": 1576} {"train_loss": -40.73325729370117, "global_step": 190757, "epoch": 1576} {"train_loss": -39.63119125366211, "global_step": 190758, "epoch": 1576} {"train_loss": -41.12128829956055, "global_step": 190759, "epoch": 1576} {"train_loss": -40.78759002685547, "global_step": 190760, "epoch": 1576} {"train_loss": -41.81855392456055, "global_step": 190761, "epoch": 1576} {"train_loss": -40.480377197265625, "global_step": 190762, "epoch": 1576} {"train_loss": -41.86342239379883, "global_step": 190763, "epoch": 1576} {"train_loss": -41.59537124633789, "global_step": 190764, "epoch": 1576} {"train_loss": -41.47025680541992, "global_step": 190765, "epoch": 1576} {"train_loss": -41.378662109375, "global_step": 190766, "epoch": 1576} {"train_loss": -41.59513473510742, "global_step": 190767, "epoch": 1576} {"train_loss": -41.8398551940918, "global_step": 190768, "epoch": 1576} {"train_loss": -41.5228385925293, "global_step": 190769, "epoch": 1576} {"train_loss": -41.952362060546875, "global_step": 190770, "epoch": 1576} {"train_loss": -41.74497985839844, "global_step": 190771, "epoch": 1576} {"train_loss": -41.95925521850586, "global_step": 190772, "epoch": 1576} {"train_loss": -41.39323043823242, "global_step": 190773, "epoch": 1576} {"train_loss": -41.549407958984375, "global_step": 190774, "epoch": 1576} {"train_loss": -42.0897331237793, "global_step": 190775, "epoch": 1576} {"train_loss": -41.825443267822266, "global_step": 190776, "epoch": 1576} {"train_loss": -41.86371994018555, "global_step": 190777, "epoch": 1576} {"train_loss": -42.196468353271484, "global_step": 190778, "epoch": 1576} {"train_loss": -42.02863311767578, "global_step": 190779, "epoch": 1576} {"train_loss": -42.254817962646484, "global_step": 190780, "epoch": 1576} {"train_loss": -41.943695068359375, "global_step": 190781, "epoch": 1576} {"train_loss": -41.72987365722656, "global_step": 190782, "epoch": 1576} {"train_loss": -42.00605010986328, "global_step": 190783, "epoch": 1576} {"train_loss": -42.494422912597656, "global_step": 190784, "epoch": 1576} {"train_loss": -41.846500396728516, "global_step": 190785, "epoch": 1576} {"train_loss": -42.597389221191406, "global_step": 190786, "epoch": 1576} {"train_loss": -41.521827697753906, "global_step": 190787, "epoch": 1576} {"train_loss": -41.16697311401367, "global_step": 190788, "epoch": 1576} {"train_loss": -42.286014556884766, "global_step": 190789, "epoch": 1576} {"train_loss": -41.398868560791016, "global_step": 190790, "epoch": 1576} {"train_loss": -41.70140838623047, "global_step": 190791, "epoch": 1576} {"train_loss": -42.041046142578125, "global_step": 190792, "epoch": 1576} {"train_loss": -42.58002853393555, "global_step": 190793, "epoch": 1576} {"train_loss": -41.7339973449707, "global_step": 190794, "epoch": 1576} {"train_loss": -42.383846282958984, "global_step": 190795, "epoch": 1576} {"train_loss": -41.85334014892578, "global_step": 190796, "epoch": 1576} {"train_loss": -41.93604278564453, "global_step": 190797, "epoch": 1576} {"train_loss": -42.890193939208984, "global_step": 190798, "epoch": 1576} {"train_loss": -42.36888885498047, "global_step": 190799, "epoch": 1576} {"train_loss": -42.26897430419922, "global_step": 190800, "epoch": 1576} {"train_loss": -42.59859848022461, "global_step": 190801, "epoch": 1576} {"train_loss": -42.709861755371094, "global_step": 190802, "epoch": 1576} {"train_loss": -42.669918060302734, "global_step": 190803, "epoch": 1576} {"train_loss": -42.209716796875, "global_step": 190804, "epoch": 1576} {"train_loss": -42.11288070678711, "global_step": 190805, "epoch": 1576} {"train_loss": -43.06428146362305, "global_step": 190806, "epoch": 1576} {"train_loss": -42.49775314331055, "global_step": 190807, "epoch": 1576} {"train_loss": -42.56301498413086, "global_step": 190808, "epoch": 1576} {"train_loss": -42.654048919677734, "global_step": 190809, "epoch": 1576} {"train_loss": -42.79853439331055, "global_step": 190810, "epoch": 1576} {"train_loss": -42.992156982421875, "global_step": 190811, "epoch": 1576} {"train_loss": -42.59256362915039, "global_step": 190812, "epoch": 1576} {"train_loss": -42.740745544433594, "global_step": 190813, "epoch": 1576} {"train_loss": -42.320655822753906, "global_step": 190814, "epoch": 1576} {"train_loss": -43.02345657348633, "global_step": 190815, "epoch": 1576} {"train_loss": -41.7191675990081, "global_step": 190816, "epoch": 1576, "val_loss": 2485180.75} {"train_loss": -42.8988151550293, "global_step": 190817, "epoch": 1577} {"train_loss": -42.69679641723633, "global_step": 190818, "epoch": 1577} {"train_loss": -42.175479888916016, "global_step": 190819, "epoch": 1577} {"train_loss": -42.7448844909668, "global_step": 190820, "epoch": 1577} {"train_loss": -42.317970275878906, "global_step": 190821, "epoch": 1577} {"train_loss": -42.08968734741211, "global_step": 190822, "epoch": 1577} {"train_loss": -42.64467239379883, "global_step": 190823, "epoch": 1577} {"train_loss": -42.51896286010742, "global_step": 190824, "epoch": 1577} {"train_loss": -42.658050537109375, "global_step": 190825, "epoch": 1577} {"train_loss": -42.12795639038086, "global_step": 190826, "epoch": 1577} {"train_loss": -42.60063552856445, "global_step": 190827, "epoch": 1577} {"train_loss": -42.78187561035156, "global_step": 190828, "epoch": 1577} {"train_loss": -41.1849365234375, "global_step": 190829, "epoch": 1577} {"train_loss": -41.786163330078125, "global_step": 190830, "epoch": 1577} {"train_loss": -42.75071334838867, "global_step": 190831, "epoch": 1577} {"train_loss": -41.540706634521484, "global_step": 190832, "epoch": 1577} {"train_loss": -41.264373779296875, "global_step": 190833, "epoch": 1577} {"train_loss": -41.76883316040039, "global_step": 190834, "epoch": 1577} {"train_loss": -40.14509963989258, "global_step": 190835, "epoch": 1577} {"train_loss": -38.8156623840332, "global_step": 190836, "epoch": 1577} {"train_loss": -38.764644622802734, "global_step": 190837, "epoch": 1577} {"train_loss": -39.277923583984375, "global_step": 190838, "epoch": 1577} {"train_loss": -38.5258674621582, "global_step": 190839, "epoch": 1577} {"train_loss": -40.13063049316406, "global_step": 190840, "epoch": 1577} {"train_loss": -41.51518630981445, "global_step": 190841, "epoch": 1577} {"train_loss": -38.86768341064453, "global_step": 190842, "epoch": 1577} {"train_loss": -38.051631927490234, "global_step": 190843, "epoch": 1577} {"train_loss": -38.36199188232422, "global_step": 190844, "epoch": 1577} {"train_loss": -40.69197463989258, "global_step": 190845, "epoch": 1577} {"train_loss": -40.04392623901367, "global_step": 190846, "epoch": 1577} {"train_loss": -35.67450714111328, "global_step": 190847, "epoch": 1577} {"train_loss": -38.99738693237305, "global_step": 190848, "epoch": 1577} {"train_loss": -37.4936408996582, "global_step": 190849, "epoch": 1577} {"train_loss": -39.34748458862305, "global_step": 190850, "epoch": 1577} {"train_loss": -39.98783493041992, "global_step": 190851, "epoch": 1577} {"train_loss": -38.650447845458984, "global_step": 190852, "epoch": 1577} {"train_loss": -38.31415939331055, "global_step": 190853, "epoch": 1577} {"train_loss": -41.531585693359375, "global_step": 190854, "epoch": 1577} {"train_loss": -39.33237838745117, "global_step": 190855, "epoch": 1577} {"train_loss": -40.462310791015625, "global_step": 190856, "epoch": 1577} {"train_loss": -41.080257415771484, "global_step": 190857, "epoch": 1577} {"train_loss": -39.98311996459961, "global_step": 190858, "epoch": 1577} {"train_loss": -40.27394485473633, "global_step": 190859, "epoch": 1577} {"train_loss": -41.419334411621094, "global_step": 190860, "epoch": 1577} {"train_loss": -38.483924865722656, "global_step": 190861, "epoch": 1577} {"train_loss": -39.935848236083984, "global_step": 190862, "epoch": 1577} {"train_loss": -40.42643356323242, "global_step": 190863, "epoch": 1577} {"train_loss": -39.52168655395508, "global_step": 190864, "epoch": 1577} {"train_loss": -41.18539047241211, "global_step": 190865, "epoch": 1577} {"train_loss": -39.7490348815918, "global_step": 190866, "epoch": 1577} {"train_loss": -40.95339584350586, "global_step": 190867, "epoch": 1577} {"train_loss": -40.55949020385742, "global_step": 190868, "epoch": 1577} {"train_loss": -39.963008880615234, "global_step": 190869, "epoch": 1577} {"train_loss": -41.564632415771484, "global_step": 190870, "epoch": 1577} {"train_loss": -39.37889862060547, "global_step": 190871, "epoch": 1577} {"train_loss": -41.562652587890625, "global_step": 190872, "epoch": 1577} {"train_loss": -39.993141174316406, "global_step": 190873, "epoch": 1577} {"train_loss": -40.01998519897461, "global_step": 190874, "epoch": 1577} {"train_loss": -41.4281120300293, "global_step": 190875, "epoch": 1577} {"train_loss": -40.57844161987305, "global_step": 190876, "epoch": 1577} {"train_loss": -40.5776252746582, "global_step": 190877, "epoch": 1577} {"train_loss": -41.15513229370117, "global_step": 190878, "epoch": 1577} {"train_loss": -41.05178451538086, "global_step": 190879, "epoch": 1577} {"train_loss": -41.45594787597656, "global_step": 190880, "epoch": 1577} {"train_loss": -41.544395446777344, "global_step": 190881, "epoch": 1577} {"train_loss": -41.324398040771484, "global_step": 190882, "epoch": 1577} {"train_loss": -41.04234313964844, "global_step": 190883, "epoch": 1577} {"train_loss": -41.445159912109375, "global_step": 190884, "epoch": 1577} {"train_loss": -41.840091705322266, "global_step": 190885, "epoch": 1577} {"train_loss": -41.78916549682617, "global_step": 190886, "epoch": 1577} {"train_loss": -41.86599349975586, "global_step": 190887, "epoch": 1577} {"train_loss": -41.77018356323242, "global_step": 190888, "epoch": 1577} {"train_loss": -41.809906005859375, "global_step": 190889, "epoch": 1577} {"train_loss": -42.13874053955078, "global_step": 190890, "epoch": 1577} {"train_loss": -41.745418548583984, "global_step": 190891, "epoch": 1577} {"train_loss": -41.84600830078125, "global_step": 190892, "epoch": 1577} {"train_loss": -41.80495071411133, "global_step": 190893, "epoch": 1577} {"train_loss": -42.37476348876953, "global_step": 190894, "epoch": 1577} {"train_loss": -42.12775802612305, "global_step": 190895, "epoch": 1577} {"train_loss": -42.316505432128906, "global_step": 190896, "epoch": 1577} {"train_loss": -42.181331634521484, "global_step": 190897, "epoch": 1577} {"train_loss": -42.1218147277832, "global_step": 190898, "epoch": 1577} {"train_loss": -41.446407318115234, "global_step": 190899, "epoch": 1577} {"train_loss": -42.54159927368164, "global_step": 190900, "epoch": 1577} {"train_loss": -41.977840423583984, "global_step": 190901, "epoch": 1577} {"train_loss": -42.42501449584961, "global_step": 190902, "epoch": 1577} {"train_loss": -42.875179290771484, "global_step": 190903, "epoch": 1577} {"train_loss": -41.92595672607422, "global_step": 190904, "epoch": 1577} {"train_loss": -42.459781646728516, "global_step": 190905, "epoch": 1577} {"train_loss": -42.66505813598633, "global_step": 190906, "epoch": 1577} {"train_loss": -42.44010543823242, "global_step": 190907, "epoch": 1577} {"train_loss": -42.58643341064453, "global_step": 190908, "epoch": 1577} {"train_loss": -42.330604553222656, "global_step": 190909, "epoch": 1577} {"train_loss": -42.68104934692383, "global_step": 190910, "epoch": 1577} {"train_loss": -42.478816986083984, "global_step": 190911, "epoch": 1577} {"train_loss": -42.42513656616211, "global_step": 190912, "epoch": 1577} {"train_loss": -42.79755783081055, "global_step": 190913, "epoch": 1577} {"train_loss": -42.14777374267578, "global_step": 190914, "epoch": 1577} {"train_loss": -42.88065719604492, "global_step": 190915, "epoch": 1577} {"train_loss": -42.011077880859375, "global_step": 190916, "epoch": 1577} {"train_loss": -42.78081130981445, "global_step": 190917, "epoch": 1577} {"train_loss": -42.24566650390625, "global_step": 190918, "epoch": 1577} {"train_loss": -42.71413040161133, "global_step": 190919, "epoch": 1577} {"train_loss": -42.82076644897461, "global_step": 190920, "epoch": 1577} {"train_loss": -42.78407287597656, "global_step": 190921, "epoch": 1577} {"train_loss": -42.761837005615234, "global_step": 190922, "epoch": 1577} {"train_loss": -42.679588317871094, "global_step": 190923, "epoch": 1577} {"train_loss": -43.076637268066406, "global_step": 190924, "epoch": 1577} {"train_loss": -42.81973648071289, "global_step": 190925, "epoch": 1577} {"train_loss": -42.99198913574219, "global_step": 190926, "epoch": 1577} {"train_loss": -43.071380615234375, "global_step": 190927, "epoch": 1577} {"train_loss": -42.681861877441406, "global_step": 190928, "epoch": 1577} {"train_loss": -43.43088150024414, "global_step": 190929, "epoch": 1577} {"train_loss": -43.0436897277832, "global_step": 190930, "epoch": 1577} {"train_loss": -42.74856185913086, "global_step": 190931, "epoch": 1577} {"train_loss": -42.86558151245117, "global_step": 190932, "epoch": 1577} {"train_loss": -42.14558792114258, "global_step": 190933, "epoch": 1577} {"train_loss": -42.46683883666992, "global_step": 190934, "epoch": 1577} {"train_loss": -43.05924987792969, "global_step": 190935, "epoch": 1577} {"train_loss": -43.066741943359375, "global_step": 190936, "epoch": 1577} {"train_loss": -41.41019029853758, "global_step": 190937, "epoch": 1577, "val_loss": 2525183.0} {"train_loss": -42.993377685546875, "global_step": 190938, "epoch": 1578} {"train_loss": -42.70388412475586, "global_step": 190939, "epoch": 1578} {"train_loss": -42.662635803222656, "global_step": 190940, "epoch": 1578} {"train_loss": -42.96664047241211, "global_step": 190941, "epoch": 1578} {"train_loss": -42.491661071777344, "global_step": 190942, "epoch": 1578} {"train_loss": -42.813175201416016, "global_step": 190943, "epoch": 1578} {"train_loss": -42.4715576171875, "global_step": 190944, "epoch": 1578} {"train_loss": -43.21785354614258, "global_step": 190945, "epoch": 1578} {"train_loss": -42.95817565917969, "global_step": 190946, "epoch": 1578} {"train_loss": -42.985137939453125, "global_step": 190947, "epoch": 1578} {"train_loss": -42.558223724365234, "global_step": 190948, "epoch": 1578} {"train_loss": -42.91399383544922, "global_step": 190949, "epoch": 1578} {"train_loss": -42.92708969116211, "global_step": 190950, "epoch": 1578} {"train_loss": -42.314449310302734, "global_step": 190951, "epoch": 1578} {"train_loss": -43.11174392700195, "global_step": 190952, "epoch": 1578} {"train_loss": -43.415130615234375, "global_step": 190953, "epoch": 1578} {"train_loss": -43.04014205932617, "global_step": 190954, "epoch": 1578} {"train_loss": -42.74702072143555, "global_step": 190955, "epoch": 1578} {"train_loss": -43.327640533447266, "global_step": 190956, "epoch": 1578} {"train_loss": -42.26389694213867, "global_step": 190957, "epoch": 1578} {"train_loss": -40.4229736328125, "global_step": 190958, "epoch": 1578} {"train_loss": -41.44330978393555, "global_step": 190959, "epoch": 1578} {"train_loss": -41.924861907958984, "global_step": 190960, "epoch": 1578} {"train_loss": -41.429229736328125, "global_step": 190961, "epoch": 1578} {"train_loss": -40.86665725708008, "global_step": 190962, "epoch": 1578} {"train_loss": -42.16337203979492, "global_step": 190963, "epoch": 1578} {"train_loss": -40.34403991699219, "global_step": 190964, "epoch": 1578} {"train_loss": -39.96043014526367, "global_step": 190965, "epoch": 1578} {"train_loss": -42.09645080566406, "global_step": 190966, "epoch": 1578} {"train_loss": -41.659603118896484, "global_step": 190967, "epoch": 1578} {"train_loss": -39.29976272583008, "global_step": 190968, "epoch": 1578} {"train_loss": -39.75442886352539, "global_step": 190969, "epoch": 1578} {"train_loss": -40.72228240966797, "global_step": 190970, "epoch": 1578} {"train_loss": -36.19742965698242, "global_step": 190971, "epoch": 1578} {"train_loss": -40.67313766479492, "global_step": 190972, "epoch": 1578} {"train_loss": -40.79048538208008, "global_step": 190973, "epoch": 1578} {"train_loss": -40.75864028930664, "global_step": 190974, "epoch": 1578} {"train_loss": -39.278297424316406, "global_step": 190975, "epoch": 1578} {"train_loss": -40.24604415893555, "global_step": 190976, "epoch": 1578} {"train_loss": -41.50046157836914, "global_step": 190977, "epoch": 1578} {"train_loss": -41.997840881347656, "global_step": 190978, "epoch": 1578} {"train_loss": -40.477291107177734, "global_step": 190979, "epoch": 1578} {"train_loss": -40.700958251953125, "global_step": 190980, "epoch": 1578} {"train_loss": -40.04286575317383, "global_step": 190981, "epoch": 1578} {"train_loss": -39.749176025390625, "global_step": 190982, "epoch": 1578} {"train_loss": -41.03730392456055, "global_step": 190983, "epoch": 1578} {"train_loss": -41.19719696044922, "global_step": 190984, "epoch": 1578} {"train_loss": -40.669677734375, "global_step": 190985, "epoch": 1578} {"train_loss": -40.645076751708984, "global_step": 190986, "epoch": 1578} {"train_loss": -41.963077545166016, "global_step": 190987, "epoch": 1578} {"train_loss": -41.524627685546875, "global_step": 190988, "epoch": 1578} {"train_loss": -41.3203239440918, "global_step": 190989, "epoch": 1578} {"train_loss": -42.32807540893555, "global_step": 190990, "epoch": 1578} {"train_loss": -41.82016372680664, "global_step": 190991, "epoch": 1578} {"train_loss": -41.77002716064453, "global_step": 190992, "epoch": 1578} {"train_loss": -41.79845428466797, "global_step": 190993, "epoch": 1578} {"train_loss": -41.692813873291016, "global_step": 190994, "epoch": 1578} {"train_loss": -41.6628303527832, "global_step": 190995, "epoch": 1578} {"train_loss": -41.8692512512207, "global_step": 190996, "epoch": 1578} {"train_loss": -41.896236419677734, "global_step": 190997, "epoch": 1578} {"train_loss": -42.466819763183594, "global_step": 190998, "epoch": 1578} {"train_loss": -42.039222717285156, "global_step": 190999, "epoch": 1578} {"train_loss": -42.3764533996582, "global_step": 191000, "epoch": 1578} {"train_loss": -42.36875534057617, "global_step": 191001, "epoch": 1578} {"train_loss": -42.03449249267578, "global_step": 191002, "epoch": 1578} {"train_loss": -42.79988098144531, "global_step": 191003, "epoch": 1578} {"train_loss": -42.876251220703125, "global_step": 191004, "epoch": 1578} {"train_loss": -42.091365814208984, "global_step": 191005, "epoch": 1578} {"train_loss": -42.04887008666992, "global_step": 191006, "epoch": 1578} {"train_loss": -42.915096282958984, "global_step": 191007, "epoch": 1578} {"train_loss": -42.85443115234375, "global_step": 191008, "epoch": 1578} {"train_loss": -42.84543991088867, "global_step": 191009, "epoch": 1578} {"train_loss": -42.40670394897461, "global_step": 191010, "epoch": 1578} {"train_loss": -42.510929107666016, "global_step": 191011, "epoch": 1578} {"train_loss": -42.220420837402344, "global_step": 191012, "epoch": 1578} {"train_loss": -42.3470458984375, "global_step": 191013, "epoch": 1578} {"train_loss": -42.80801010131836, "global_step": 191014, "epoch": 1578} {"train_loss": -41.816864013671875, "global_step": 191015, "epoch": 1578} {"train_loss": -41.75672912597656, "global_step": 191016, "epoch": 1578} {"train_loss": -42.48788070678711, "global_step": 191017, "epoch": 1578} {"train_loss": -43.144771575927734, "global_step": 191018, "epoch": 1578} {"train_loss": -42.694557189941406, "global_step": 191019, "epoch": 1578} {"train_loss": -42.90059280395508, "global_step": 191020, "epoch": 1578} {"train_loss": -42.74310302734375, "global_step": 191021, "epoch": 1578} {"train_loss": -42.73765182495117, "global_step": 191022, "epoch": 1578} {"train_loss": -42.30291748046875, "global_step": 191023, "epoch": 1578} {"train_loss": -42.4970817565918, "global_step": 191024, "epoch": 1578} {"train_loss": -42.915191650390625, "global_step": 191025, "epoch": 1578} {"train_loss": -42.136287689208984, "global_step": 191026, "epoch": 1578} {"train_loss": -42.33816146850586, "global_step": 191027, "epoch": 1578} {"train_loss": -42.89129638671875, "global_step": 191028, "epoch": 1578} {"train_loss": -42.6095085144043, "global_step": 191029, "epoch": 1578} {"train_loss": -42.927276611328125, "global_step": 191030, "epoch": 1578} {"train_loss": -43.516326904296875, "global_step": 191031, "epoch": 1578} {"train_loss": -42.881195068359375, "global_step": 191032, "epoch": 1578} {"train_loss": -43.03591537475586, "global_step": 191033, "epoch": 1578} {"train_loss": -42.88321304321289, "global_step": 191034, "epoch": 1578} {"train_loss": -43.35105514526367, "global_step": 191035, "epoch": 1578} {"train_loss": -43.2882194519043, "global_step": 191036, "epoch": 1578} {"train_loss": -43.563716888427734, "global_step": 191037, "epoch": 1578} {"train_loss": -43.426795959472656, "global_step": 191038, "epoch": 1578} {"train_loss": -43.420894622802734, "global_step": 191039, "epoch": 1578} {"train_loss": -43.17719650268555, "global_step": 191040, "epoch": 1578} {"train_loss": -42.667903900146484, "global_step": 191041, "epoch": 1578} {"train_loss": -41.26151657104492, "global_step": 191042, "epoch": 1578} {"train_loss": -39.7512321472168, "global_step": 191043, "epoch": 1578} {"train_loss": -41.70016098022461, "global_step": 191044, "epoch": 1578} {"train_loss": -42.4024658203125, "global_step": 191045, "epoch": 1578} {"train_loss": -41.4512825012207, "global_step": 191046, "epoch": 1578} {"train_loss": -41.863380432128906, "global_step": 191047, "epoch": 1578} {"train_loss": -42.65889358520508, "global_step": 191048, "epoch": 1578} {"train_loss": -41.861053466796875, "global_step": 191049, "epoch": 1578} {"train_loss": -40.89685821533203, "global_step": 191050, "epoch": 1578} {"train_loss": -39.900638580322266, "global_step": 191051, "epoch": 1578} {"train_loss": -41.66085433959961, "global_step": 191052, "epoch": 1578} {"train_loss": -40.605587005615234, "global_step": 191053, "epoch": 1578} {"train_loss": -38.63371658325195, "global_step": 191054, "epoch": 1578} {"train_loss": -41.73788070678711, "global_step": 191055, "epoch": 1578} {"train_loss": -40.44405746459961, "global_step": 191056, "epoch": 1578} {"train_loss": -36.46724319458008, "global_step": 191057, "epoch": 1578} {"train_loss": -41.88099481251614, "global_step": 191058, "epoch": 1578, "val_loss": 2519637.0} {"train_loss": -41.02052688598633, "global_step": 191059, "epoch": 1579} {"train_loss": -40.15869903564453, "global_step": 191060, "epoch": 1579} {"train_loss": -40.738128662109375, "global_step": 191061, "epoch": 1579} {"train_loss": -41.125732421875, "global_step": 191062, "epoch": 1579} {"train_loss": -41.15297317504883, "global_step": 191063, "epoch": 1579} {"train_loss": -42.36098861694336, "global_step": 191064, "epoch": 1579} {"train_loss": -40.96815872192383, "global_step": 191065, "epoch": 1579} {"train_loss": -39.302589416503906, "global_step": 191066, "epoch": 1579} {"train_loss": -41.08366775512695, "global_step": 191067, "epoch": 1579} {"train_loss": -39.864166259765625, "global_step": 191068, "epoch": 1579} {"train_loss": -41.30403137207031, "global_step": 191069, "epoch": 1579} {"train_loss": -40.8377799987793, "global_step": 191070, "epoch": 1579} {"train_loss": -40.50017166137695, "global_step": 191071, "epoch": 1579} {"train_loss": -39.19214630126953, "global_step": 191072, "epoch": 1579} {"train_loss": -41.6228141784668, "global_step": 191073, "epoch": 1579} {"train_loss": -40.77650833129883, "global_step": 191074, "epoch": 1579} {"train_loss": -39.41694259643555, "global_step": 191075, "epoch": 1579} {"train_loss": -40.44810104370117, "global_step": 191076, "epoch": 1579} {"train_loss": -40.51031494140625, "global_step": 191077, "epoch": 1579} {"train_loss": -40.80137252807617, "global_step": 191078, "epoch": 1579} {"train_loss": -40.201881408691406, "global_step": 191079, "epoch": 1579} {"train_loss": -41.537593841552734, "global_step": 191080, "epoch": 1579} {"train_loss": -40.539730072021484, "global_step": 191081, "epoch": 1579} {"train_loss": -40.409297943115234, "global_step": 191082, "epoch": 1579} {"train_loss": -42.5311393737793, "global_step": 191083, "epoch": 1579} {"train_loss": -40.87423324584961, "global_step": 191084, "epoch": 1579} {"train_loss": -41.34563064575195, "global_step": 191085, "epoch": 1579} {"train_loss": -42.23681640625, "global_step": 191086, "epoch": 1579} {"train_loss": -41.31361770629883, "global_step": 191087, "epoch": 1579} {"train_loss": -41.8664665222168, "global_step": 191088, "epoch": 1579} {"train_loss": -41.962623596191406, "global_step": 191089, "epoch": 1579} {"train_loss": -41.17375564575195, "global_step": 191090, "epoch": 1579} {"train_loss": -42.34422302246094, "global_step": 191091, "epoch": 1579} {"train_loss": -41.38969802856445, "global_step": 191092, "epoch": 1579} {"train_loss": -41.816253662109375, "global_step": 191093, "epoch": 1579} {"train_loss": -42.34730911254883, "global_step": 191094, "epoch": 1579} {"train_loss": -41.35523223876953, "global_step": 191095, "epoch": 1579} {"train_loss": -42.3439826965332, "global_step": 191096, "epoch": 1579} {"train_loss": -41.6899299621582, "global_step": 191097, "epoch": 1579} {"train_loss": -42.079627990722656, "global_step": 191098, "epoch": 1579} {"train_loss": -41.96453857421875, "global_step": 191099, "epoch": 1579} {"train_loss": -42.264705657958984, "global_step": 191100, "epoch": 1579} {"train_loss": -42.265289306640625, "global_step": 191101, "epoch": 1579} {"train_loss": -41.58241653442383, "global_step": 191102, "epoch": 1579} {"train_loss": -42.213844299316406, "global_step": 191103, "epoch": 1579} {"train_loss": -41.81339645385742, "global_step": 191104, "epoch": 1579} {"train_loss": -42.16997528076172, "global_step": 191105, "epoch": 1579} {"train_loss": -41.572418212890625, "global_step": 191106, "epoch": 1579} {"train_loss": -42.57268524169922, "global_step": 191107, "epoch": 1579} {"train_loss": -41.635860443115234, "global_step": 191108, "epoch": 1579} {"train_loss": -42.386329650878906, "global_step": 191109, "epoch": 1579} {"train_loss": -41.60728073120117, "global_step": 191110, "epoch": 1579} {"train_loss": -41.56878662109375, "global_step": 191111, "epoch": 1579} {"train_loss": -42.5936393737793, "global_step": 191112, "epoch": 1579} {"train_loss": -41.45147705078125, "global_step": 191113, "epoch": 1579} {"train_loss": -41.633636474609375, "global_step": 191114, "epoch": 1579} {"train_loss": -42.087337493896484, "global_step": 191115, "epoch": 1579} {"train_loss": -41.880184173583984, "global_step": 191116, "epoch": 1579} {"train_loss": -41.52120590209961, "global_step": 191117, "epoch": 1579} {"train_loss": -42.48051071166992, "global_step": 191118, "epoch": 1579} {"train_loss": -42.52825927734375, "global_step": 191119, "epoch": 1579} {"train_loss": -42.79549789428711, "global_step": 191120, "epoch": 1579} {"train_loss": -41.73210525512695, "global_step": 191121, "epoch": 1579} {"train_loss": -41.83247756958008, "global_step": 191122, "epoch": 1579} {"train_loss": -42.46536636352539, "global_step": 191123, "epoch": 1579} {"train_loss": -42.836181640625, "global_step": 191124, "epoch": 1579} {"train_loss": -42.3829345703125, "global_step": 191125, "epoch": 1579} {"train_loss": -42.03499984741211, "global_step": 191126, "epoch": 1579} {"train_loss": -42.970794677734375, "global_step": 191127, "epoch": 1579} {"train_loss": -42.174903869628906, "global_step": 191128, "epoch": 1579} {"train_loss": -41.60331344604492, "global_step": 191129, "epoch": 1579} {"train_loss": -42.39188766479492, "global_step": 191130, "epoch": 1579} {"train_loss": -42.69588088989258, "global_step": 191131, "epoch": 1579} {"train_loss": -42.693233489990234, "global_step": 191132, "epoch": 1579} {"train_loss": -42.30414581298828, "global_step": 191133, "epoch": 1579} {"train_loss": -42.48960494995117, "global_step": 191134, "epoch": 1579} {"train_loss": -42.9373664855957, "global_step": 191135, "epoch": 1579} {"train_loss": -42.22857666015625, "global_step": 191136, "epoch": 1579} {"train_loss": -42.74656677246094, "global_step": 191137, "epoch": 1579} {"train_loss": -42.64455795288086, "global_step": 191138, "epoch": 1579} {"train_loss": -42.67658233642578, "global_step": 191139, "epoch": 1579} {"train_loss": -43.09389877319336, "global_step": 191140, "epoch": 1579} {"train_loss": -42.600067138671875, "global_step": 191141, "epoch": 1579} {"train_loss": -42.11123275756836, "global_step": 191142, "epoch": 1579} {"train_loss": -42.808780670166016, "global_step": 191143, "epoch": 1579} {"train_loss": -42.62734603881836, "global_step": 191144, "epoch": 1579} {"train_loss": -41.701839447021484, "global_step": 191145, "epoch": 1579} {"train_loss": -42.17435836791992, "global_step": 191146, "epoch": 1579} {"train_loss": -42.86503219604492, "global_step": 191147, "epoch": 1579} {"train_loss": -42.20377731323242, "global_step": 191148, "epoch": 1579} {"train_loss": -42.85907745361328, "global_step": 191149, "epoch": 1579} {"train_loss": -42.199222564697266, "global_step": 191150, "epoch": 1579} {"train_loss": -41.53153610229492, "global_step": 191151, "epoch": 1579} {"train_loss": -42.46150588989258, "global_step": 191152, "epoch": 1579} {"train_loss": -41.6813850402832, "global_step": 191153, "epoch": 1579} {"train_loss": -39.95778274536133, "global_step": 191154, "epoch": 1579} {"train_loss": -40.85443115234375, "global_step": 191155, "epoch": 1579} {"train_loss": -42.12127685546875, "global_step": 191156, "epoch": 1579} {"train_loss": -40.633453369140625, "global_step": 191157, "epoch": 1579} {"train_loss": -39.622283935546875, "global_step": 191158, "epoch": 1579} {"train_loss": -41.525733947753906, "global_step": 191159, "epoch": 1579} {"train_loss": -42.27623748779297, "global_step": 191160, "epoch": 1579} {"train_loss": -41.861541748046875, "global_step": 191161, "epoch": 1579} {"train_loss": -42.54597091674805, "global_step": 191162, "epoch": 1579} {"train_loss": -42.19388961791992, "global_step": 191163, "epoch": 1579} {"train_loss": -41.278594970703125, "global_step": 191164, "epoch": 1579} {"train_loss": -40.99375534057617, "global_step": 191165, "epoch": 1579} {"train_loss": -40.32600021362305, "global_step": 191166, "epoch": 1579} {"train_loss": -40.22392272949219, "global_step": 191167, "epoch": 1579} {"train_loss": -39.79341506958008, "global_step": 191168, "epoch": 1579} {"train_loss": -40.84617614746094, "global_step": 191169, "epoch": 1579} {"train_loss": -42.35129928588867, "global_step": 191170, "epoch": 1579} {"train_loss": -42.33347702026367, "global_step": 191171, "epoch": 1579} {"train_loss": -42.26621627807617, "global_step": 191172, "epoch": 1579} {"train_loss": -41.679039001464844, "global_step": 191173, "epoch": 1579} {"train_loss": -41.51340866088867, "global_step": 191174, "epoch": 1579} {"train_loss": -41.20353317260742, "global_step": 191175, "epoch": 1579} {"train_loss": -41.6689567565918, "global_step": 191176, "epoch": 1579} {"train_loss": -41.476985931396484, "global_step": 191177, "epoch": 1579} {"train_loss": -42.41852951049805, "global_step": 191178, "epoch": 1579} {"train_loss": -41.68154844173715, "global_step": 191179, "epoch": 1579, "val_loss": 2509366.75} {"train_loss": -41.44562530517578, "global_step": 191180, "epoch": 1580} {"train_loss": -41.839412689208984, "global_step": 191181, "epoch": 1580} {"train_loss": -42.100257873535156, "global_step": 191182, "epoch": 1580} {"train_loss": -41.655941009521484, "global_step": 191183, "epoch": 1580} {"train_loss": -41.437164306640625, "global_step": 191184, "epoch": 1580} {"train_loss": -42.474910736083984, "global_step": 191185, "epoch": 1580} {"train_loss": -39.796539306640625, "global_step": 191186, "epoch": 1580} {"train_loss": -37.90889358520508, "global_step": 191187, "epoch": 1580} {"train_loss": -37.75368118286133, "global_step": 191188, "epoch": 1580} {"train_loss": -39.285072326660156, "global_step": 191189, "epoch": 1580} {"train_loss": -38.394981384277344, "global_step": 191190, "epoch": 1580} {"train_loss": -40.59614944458008, "global_step": 191191, "epoch": 1580} {"train_loss": -39.46112060546875, "global_step": 191192, "epoch": 1580} {"train_loss": -39.61845016479492, "global_step": 191193, "epoch": 1580} {"train_loss": -40.89595031738281, "global_step": 191194, "epoch": 1580} {"train_loss": -40.209651947021484, "global_step": 191195, "epoch": 1580} {"train_loss": -39.84846115112305, "global_step": 191196, "epoch": 1580} {"train_loss": -37.9211311340332, "global_step": 191197, "epoch": 1580} {"train_loss": -40.181819915771484, "global_step": 191198, "epoch": 1580} {"train_loss": -40.159515380859375, "global_step": 191199, "epoch": 1580} {"train_loss": -39.89889907836914, "global_step": 191200, "epoch": 1580} {"train_loss": -40.2174072265625, "global_step": 191201, "epoch": 1580} {"train_loss": -40.262630462646484, "global_step": 191202, "epoch": 1580} {"train_loss": -39.65511703491211, "global_step": 191203, "epoch": 1580} {"train_loss": -39.15967559814453, "global_step": 191204, "epoch": 1580} {"train_loss": -40.84332275390625, "global_step": 191205, "epoch": 1580} {"train_loss": -41.276466369628906, "global_step": 191206, "epoch": 1580} {"train_loss": -36.908790588378906, "global_step": 191207, "epoch": 1580} {"train_loss": -41.2368278503418, "global_step": 191208, "epoch": 1580} {"train_loss": -39.38908386230469, "global_step": 191209, "epoch": 1580} {"train_loss": -38.18388748168945, "global_step": 191210, "epoch": 1580} {"train_loss": -41.39543533325195, "global_step": 191211, "epoch": 1580} {"train_loss": -39.61577606201172, "global_step": 191212, "epoch": 1580} {"train_loss": -41.51889419555664, "global_step": 191213, "epoch": 1580} {"train_loss": -40.463417053222656, "global_step": 191214, "epoch": 1580} {"train_loss": -40.17134475708008, "global_step": 191215, "epoch": 1580} {"train_loss": -41.49530029296875, "global_step": 191216, "epoch": 1580} {"train_loss": -40.68886947631836, "global_step": 191217, "epoch": 1580} {"train_loss": -41.6478385925293, "global_step": 191218, "epoch": 1580} {"train_loss": -41.78859329223633, "global_step": 191219, "epoch": 1580} {"train_loss": -41.476497650146484, "global_step": 191220, "epoch": 1580} {"train_loss": -41.67893600463867, "global_step": 191221, "epoch": 1580} {"train_loss": -41.66201400756836, "global_step": 191222, "epoch": 1580} {"train_loss": -42.15560531616211, "global_step": 191223, "epoch": 1580} {"train_loss": -41.02770233154297, "global_step": 191224, "epoch": 1580} {"train_loss": -42.055240631103516, "global_step": 191225, "epoch": 1580} {"train_loss": -41.876930236816406, "global_step": 191226, "epoch": 1580} {"train_loss": -42.1946907043457, "global_step": 191227, "epoch": 1580} {"train_loss": -42.215457916259766, "global_step": 191228, "epoch": 1580} {"train_loss": -42.41164779663086, "global_step": 191229, "epoch": 1580} {"train_loss": -42.551692962646484, "global_step": 191230, "epoch": 1580} {"train_loss": -42.82942581176758, "global_step": 191231, "epoch": 1580} {"train_loss": -42.65092468261719, "global_step": 191232, "epoch": 1580} {"train_loss": -42.53378677368164, "global_step": 191233, "epoch": 1580} {"train_loss": -42.87797164916992, "global_step": 191234, "epoch": 1580} {"train_loss": -42.72905349731445, "global_step": 191235, "epoch": 1580} {"train_loss": -43.04637145996094, "global_step": 191236, "epoch": 1580} {"train_loss": -43.08658981323242, "global_step": 191237, "epoch": 1580} {"train_loss": -42.850826263427734, "global_step": 191238, "epoch": 1580} {"train_loss": -42.86295700073242, "global_step": 191239, "epoch": 1580} {"train_loss": -42.89628219604492, "global_step": 191240, "epoch": 1580} {"train_loss": -43.322479248046875, "global_step": 191241, "epoch": 1580} {"train_loss": -43.31959915161133, "global_step": 191242, "epoch": 1580} {"train_loss": -43.00577926635742, "global_step": 191243, "epoch": 1580} {"train_loss": -43.21479034423828, "global_step": 191244, "epoch": 1580} {"train_loss": -43.20088577270508, "global_step": 191245, "epoch": 1580} {"train_loss": -43.36145782470703, "global_step": 191246, "epoch": 1580} {"train_loss": -43.41292953491211, "global_step": 191247, "epoch": 1580} {"train_loss": -42.956295013427734, "global_step": 191248, "epoch": 1580} {"train_loss": -43.29472732543945, "global_step": 191249, "epoch": 1580} {"train_loss": -43.128440856933594, "global_step": 191250, "epoch": 1580} {"train_loss": -43.1779670715332, "global_step": 191251, "epoch": 1580} {"train_loss": -43.2477912902832, "global_step": 191252, "epoch": 1580} {"train_loss": -43.19439697265625, "global_step": 191253, "epoch": 1580} {"train_loss": -43.33742904663086, "global_step": 191254, "epoch": 1580} {"train_loss": -42.97317123413086, "global_step": 191255, "epoch": 1580} {"train_loss": -43.201881408691406, "global_step": 191256, "epoch": 1580} {"train_loss": -43.58074951171875, "global_step": 191257, "epoch": 1580} {"train_loss": -43.1389045715332, "global_step": 191258, "epoch": 1580} {"train_loss": -42.91280746459961, "global_step": 191259, "epoch": 1580} {"train_loss": -43.05794143676758, "global_step": 191260, "epoch": 1580} {"train_loss": -42.76760482788086, "global_step": 191261, "epoch": 1580} {"train_loss": -43.22105026245117, "global_step": 191262, "epoch": 1580} {"train_loss": -43.138671875, "global_step": 191263, "epoch": 1580} {"train_loss": -43.18195343017578, "global_step": 191264, "epoch": 1580} {"train_loss": -42.949851989746094, "global_step": 191265, "epoch": 1580} {"train_loss": -42.287899017333984, "global_step": 191266, "epoch": 1580} {"train_loss": -40.10548782348633, "global_step": 191267, "epoch": 1580} {"train_loss": -39.03651809692383, "global_step": 191268, "epoch": 1580} {"train_loss": -41.48640441894531, "global_step": 191269, "epoch": 1580} {"train_loss": -43.06158447265625, "global_step": 191270, "epoch": 1580} {"train_loss": -42.287052154541016, "global_step": 191271, "epoch": 1580} {"train_loss": -42.074275970458984, "global_step": 191272, "epoch": 1580} {"train_loss": -42.138343811035156, "global_step": 191273, "epoch": 1580} {"train_loss": -42.9843864440918, "global_step": 191274, "epoch": 1580} {"train_loss": -43.16559600830078, "global_step": 191275, "epoch": 1580} {"train_loss": -42.343868255615234, "global_step": 191276, "epoch": 1580} {"train_loss": -41.1148681640625, "global_step": 191277, "epoch": 1580} {"train_loss": -39.55173873901367, "global_step": 191278, "epoch": 1580} {"train_loss": -41.613739013671875, "global_step": 191279, "epoch": 1580} {"train_loss": -42.14358901977539, "global_step": 191280, "epoch": 1580} {"train_loss": -41.666099548339844, "global_step": 191281, "epoch": 1580} {"train_loss": -42.2421989440918, "global_step": 191282, "epoch": 1580} {"train_loss": -42.11385726928711, "global_step": 191283, "epoch": 1580} {"train_loss": -41.94294357299805, "global_step": 191284, "epoch": 1580} {"train_loss": -42.619815826416016, "global_step": 191285, "epoch": 1580} {"train_loss": -42.819122314453125, "global_step": 191286, "epoch": 1580} {"train_loss": -41.565731048583984, "global_step": 191287, "epoch": 1580} {"train_loss": -40.97785568237305, "global_step": 191288, "epoch": 1580} {"train_loss": -39.685279846191406, "global_step": 191289, "epoch": 1580} {"train_loss": -40.23714065551758, "global_step": 191290, "epoch": 1580} {"train_loss": -38.940452575683594, "global_step": 191291, "epoch": 1580} {"train_loss": -40.9140625, "global_step": 191292, "epoch": 1580} {"train_loss": -41.33456802368164, "global_step": 191293, "epoch": 1580} {"train_loss": -40.67119598388672, "global_step": 191294, "epoch": 1580} {"train_loss": -40.30787658691406, "global_step": 191295, "epoch": 1580} {"train_loss": -39.27206802368164, "global_step": 191296, "epoch": 1580} {"train_loss": -39.54287338256836, "global_step": 191297, "epoch": 1580} {"train_loss": -38.629337310791016, "global_step": 191298, "epoch": 1580} {"train_loss": -40.59035873413086, "global_step": 191299, "epoch": 1580} {"train_loss": -41.496581369195106, "global_step": 191300, "epoch": 1580, "val_loss": 2541348.25} {"train_loss": -39.76025390625, "global_step": 191301, "epoch": 1581} {"train_loss": -38.529239654541016, "global_step": 191302, "epoch": 1581} {"train_loss": -36.9881477355957, "global_step": 191303, "epoch": 1581} {"train_loss": -39.48148727416992, "global_step": 191304, "epoch": 1581} {"train_loss": -38.83323669433594, "global_step": 191305, "epoch": 1581} {"train_loss": -39.14088439941406, "global_step": 191306, "epoch": 1581} {"train_loss": -40.870361328125, "global_step": 191307, "epoch": 1581} {"train_loss": -40.62569808959961, "global_step": 191308, "epoch": 1581} {"train_loss": -40.24809646606445, "global_step": 191309, "epoch": 1581} {"train_loss": -40.79429244995117, "global_step": 191310, "epoch": 1581} {"train_loss": -40.946441650390625, "global_step": 191311, "epoch": 1581} {"train_loss": -39.88031005859375, "global_step": 191312, "epoch": 1581} {"train_loss": -41.21631622314453, "global_step": 191313, "epoch": 1581} {"train_loss": -41.4131965637207, "global_step": 191314, "epoch": 1581} {"train_loss": -41.60264205932617, "global_step": 191315, "epoch": 1581} {"train_loss": -41.4329719543457, "global_step": 191316, "epoch": 1581} {"train_loss": -41.4464225769043, "global_step": 191317, "epoch": 1581} {"train_loss": -41.59523010253906, "global_step": 191318, "epoch": 1581} {"train_loss": -42.0523796081543, "global_step": 191319, "epoch": 1581} {"train_loss": -40.73934555053711, "global_step": 191320, "epoch": 1581} {"train_loss": -42.015132904052734, "global_step": 191321, "epoch": 1581} {"train_loss": -42.31402587890625, "global_step": 191322, "epoch": 1581} {"train_loss": -42.08402633666992, "global_step": 191323, "epoch": 1581} {"train_loss": -41.8172607421875, "global_step": 191324, "epoch": 1581} {"train_loss": -41.87184524536133, "global_step": 191325, "epoch": 1581} {"train_loss": -42.27113723754883, "global_step": 191326, "epoch": 1581} {"train_loss": -42.46914291381836, "global_step": 191327, "epoch": 1581} {"train_loss": -42.5021858215332, "global_step": 191328, "epoch": 1581} {"train_loss": -42.67146682739258, "global_step": 191329, "epoch": 1581} {"train_loss": -42.444461822509766, "global_step": 191330, "epoch": 1581} {"train_loss": -42.7271842956543, "global_step": 191331, "epoch": 1581} {"train_loss": -42.47206497192383, "global_step": 191332, "epoch": 1581} {"train_loss": -41.91301727294922, "global_step": 191333, "epoch": 1581} {"train_loss": -42.581336975097656, "global_step": 191334, "epoch": 1581} {"train_loss": -42.35256576538086, "global_step": 191335, "epoch": 1581} {"train_loss": -42.7124137878418, "global_step": 191336, "epoch": 1581} {"train_loss": -41.7829704284668, "global_step": 191337, "epoch": 1581} {"train_loss": -42.806243896484375, "global_step": 191338, "epoch": 1581} {"train_loss": -42.56425476074219, "global_step": 191339, "epoch": 1581} {"train_loss": -42.13833236694336, "global_step": 191340, "epoch": 1581} {"train_loss": -42.21083068847656, "global_step": 191341, "epoch": 1581} {"train_loss": -43.280540466308594, "global_step": 191342, "epoch": 1581} {"train_loss": -42.627723693847656, "global_step": 191343, "epoch": 1581} {"train_loss": -42.600643157958984, "global_step": 191344, "epoch": 1581} {"train_loss": -43.00449752807617, "global_step": 191345, "epoch": 1581} {"train_loss": -42.828025817871094, "global_step": 191346, "epoch": 1581} {"train_loss": -42.5727653503418, "global_step": 191347, "epoch": 1581} {"train_loss": -42.6821403503418, "global_step": 191348, "epoch": 1581} {"train_loss": -42.72706604003906, "global_step": 191349, "epoch": 1581} {"train_loss": -43.25039291381836, "global_step": 191350, "epoch": 1581} {"train_loss": -42.98653793334961, "global_step": 191351, "epoch": 1581} {"train_loss": -42.6791877746582, "global_step": 191352, "epoch": 1581} {"train_loss": -43.1075439453125, "global_step": 191353, "epoch": 1581} {"train_loss": -43.37539291381836, "global_step": 191354, "epoch": 1581} {"train_loss": -43.25237274169922, "global_step": 191355, "epoch": 1581} {"train_loss": -42.60110092163086, "global_step": 191356, "epoch": 1581} {"train_loss": -43.30326461791992, "global_step": 191357, "epoch": 1581} {"train_loss": -42.79532241821289, "global_step": 191358, "epoch": 1581} {"train_loss": -43.16080856323242, "global_step": 191359, "epoch": 1581} {"train_loss": -42.89106369018555, "global_step": 191360, "epoch": 1581} {"train_loss": -43.11140823364258, "global_step": 191361, "epoch": 1581} {"train_loss": -43.22250747680664, "global_step": 191362, "epoch": 1581} {"train_loss": -43.32027053833008, "global_step": 191363, "epoch": 1581} {"train_loss": -42.57087326049805, "global_step": 191364, "epoch": 1581} {"train_loss": -42.85451126098633, "global_step": 191365, "epoch": 1581} {"train_loss": -42.87539291381836, "global_step": 191366, "epoch": 1581} {"train_loss": -43.264923095703125, "global_step": 191367, "epoch": 1581} {"train_loss": -42.503536224365234, "global_step": 191368, "epoch": 1581} {"train_loss": -42.797325134277344, "global_step": 191369, "epoch": 1581} {"train_loss": -43.07766342163086, "global_step": 191370, "epoch": 1581} {"train_loss": -43.21860122680664, "global_step": 191371, "epoch": 1581} {"train_loss": -42.69449234008789, "global_step": 191372, "epoch": 1581} {"train_loss": -43.13113021850586, "global_step": 191373, "epoch": 1581} {"train_loss": -43.009376525878906, "global_step": 191374, "epoch": 1581} {"train_loss": -41.35927963256836, "global_step": 191375, "epoch": 1581} {"train_loss": -42.208892822265625, "global_step": 191376, "epoch": 1581} {"train_loss": -41.988765716552734, "global_step": 191377, "epoch": 1581} {"train_loss": -41.5352897644043, "global_step": 191378, "epoch": 1581} {"train_loss": -42.97138214111328, "global_step": 191379, "epoch": 1581} {"train_loss": -43.142860412597656, "global_step": 191380, "epoch": 1581} {"train_loss": -42.5029182434082, "global_step": 191381, "epoch": 1581} {"train_loss": -42.5775260925293, "global_step": 191382, "epoch": 1581} {"train_loss": -41.19158935546875, "global_step": 191383, "epoch": 1581} {"train_loss": -40.04780960083008, "global_step": 191384, "epoch": 1581} {"train_loss": -40.787261962890625, "global_step": 191385, "epoch": 1581} {"train_loss": -41.18416213989258, "global_step": 191386, "epoch": 1581} {"train_loss": -40.46426010131836, "global_step": 191387, "epoch": 1581} {"train_loss": -41.7517204284668, "global_step": 191388, "epoch": 1581} {"train_loss": -42.714622497558594, "global_step": 191389, "epoch": 1581} {"train_loss": -41.969966888427734, "global_step": 191390, "epoch": 1581} {"train_loss": -41.49056625366211, "global_step": 191391, "epoch": 1581} {"train_loss": -41.73309326171875, "global_step": 191392, "epoch": 1581} {"train_loss": -41.80717086791992, "global_step": 191393, "epoch": 1581} {"train_loss": -42.75564193725586, "global_step": 191394, "epoch": 1581} {"train_loss": -42.43874740600586, "global_step": 191395, "epoch": 1581} {"train_loss": -42.517391204833984, "global_step": 191396, "epoch": 1581} {"train_loss": -43.00324249267578, "global_step": 191397, "epoch": 1581} {"train_loss": -42.138633728027344, "global_step": 191398, "epoch": 1581} {"train_loss": -42.47983932495117, "global_step": 191399, "epoch": 1581} {"train_loss": -42.58433151245117, "global_step": 191400, "epoch": 1581} {"train_loss": -42.80959701538086, "global_step": 191401, "epoch": 1581} {"train_loss": -42.69802474975586, "global_step": 191402, "epoch": 1581} {"train_loss": -42.8130989074707, "global_step": 191403, "epoch": 1581} {"train_loss": -42.62923049926758, "global_step": 191404, "epoch": 1581} {"train_loss": -43.106300354003906, "global_step": 191405, "epoch": 1581} {"train_loss": -41.8781852722168, "global_step": 191406, "epoch": 1581} {"train_loss": -41.82594680786133, "global_step": 191407, "epoch": 1581} {"train_loss": -40.317134857177734, "global_step": 191408, "epoch": 1581} {"train_loss": -41.617183685302734, "global_step": 191409, "epoch": 1581} {"train_loss": -41.47919464111328, "global_step": 191410, "epoch": 1581} {"train_loss": -40.42063522338867, "global_step": 191411, "epoch": 1581} {"train_loss": -39.87015914916992, "global_step": 191412, "epoch": 1581} {"train_loss": -41.755184173583984, "global_step": 191413, "epoch": 1581} {"train_loss": -40.90522384643555, "global_step": 191414, "epoch": 1581} {"train_loss": -41.21187973022461, "global_step": 191415, "epoch": 1581} {"train_loss": -41.39421463012695, "global_step": 191416, "epoch": 1581} {"train_loss": -41.63261032104492, "global_step": 191417, "epoch": 1581} {"train_loss": -40.44758224487305, "global_step": 191418, "epoch": 1581} {"train_loss": -39.76444625854492, "global_step": 191419, "epoch": 1581} {"train_loss": -40.08061218261719, "global_step": 191420, "epoch": 1581} {"train_loss": -41.93293982891997, "global_step": 191421, "epoch": 1581, "val_loss": 2454254.25} {"train_loss": -42.76961898803711, "global_step": 191422, "epoch": 1582} {"train_loss": -40.43744659423828, "global_step": 191423, "epoch": 1582} {"train_loss": -41.641326904296875, "global_step": 191424, "epoch": 1582} {"train_loss": -41.49349594116211, "global_step": 191425, "epoch": 1582} {"train_loss": -40.4459342956543, "global_step": 191426, "epoch": 1582} {"train_loss": -39.681617736816406, "global_step": 191427, "epoch": 1582} {"train_loss": -40.46015548706055, "global_step": 191428, "epoch": 1582} {"train_loss": -41.233551025390625, "global_step": 191429, "epoch": 1582} {"train_loss": -41.54296112060547, "global_step": 191430, "epoch": 1582} {"train_loss": -42.00716781616211, "global_step": 191431, "epoch": 1582} {"train_loss": -41.786415100097656, "global_step": 191432, "epoch": 1582} {"train_loss": -42.111934661865234, "global_step": 191433, "epoch": 1582} {"train_loss": -42.026058197021484, "global_step": 191434, "epoch": 1582} {"train_loss": -42.454341888427734, "global_step": 191435, "epoch": 1582} {"train_loss": -41.82064437866211, "global_step": 191436, "epoch": 1582} {"train_loss": -41.63735580444336, "global_step": 191437, "epoch": 1582} {"train_loss": -41.8946418762207, "global_step": 191438, "epoch": 1582} {"train_loss": -42.47321319580078, "global_step": 191439, "epoch": 1582} {"train_loss": -41.810791015625, "global_step": 191440, "epoch": 1582} {"train_loss": -42.35120391845703, "global_step": 191441, "epoch": 1582} {"train_loss": -42.51082229614258, "global_step": 191442, "epoch": 1582} {"train_loss": -41.94829177856445, "global_step": 191443, "epoch": 1582} {"train_loss": -41.596336364746094, "global_step": 191444, "epoch": 1582} {"train_loss": -42.0335693359375, "global_step": 191445, "epoch": 1582} {"train_loss": -41.79022979736328, "global_step": 191446, "epoch": 1582} {"train_loss": -42.46442794799805, "global_step": 191447, "epoch": 1582} {"train_loss": -41.68397903442383, "global_step": 191448, "epoch": 1582} {"train_loss": -41.74312973022461, "global_step": 191449, "epoch": 1582} {"train_loss": -41.505218505859375, "global_step": 191450, "epoch": 1582} {"train_loss": -40.62793731689453, "global_step": 191451, "epoch": 1582} {"train_loss": -41.77732467651367, "global_step": 191452, "epoch": 1582} {"train_loss": -42.316497802734375, "global_step": 191453, "epoch": 1582} {"train_loss": -42.360748291015625, "global_step": 191454, "epoch": 1582} {"train_loss": -42.6176872253418, "global_step": 191455, "epoch": 1582} {"train_loss": -42.02790451049805, "global_step": 191456, "epoch": 1582} {"train_loss": -41.98727035522461, "global_step": 191457, "epoch": 1582} {"train_loss": -42.100154876708984, "global_step": 191458, "epoch": 1582} {"train_loss": -42.06476974487305, "global_step": 191459, "epoch": 1582} {"train_loss": -42.50374984741211, "global_step": 191460, "epoch": 1582} {"train_loss": -42.454891204833984, "global_step": 191461, "epoch": 1582} {"train_loss": -41.617584228515625, "global_step": 191462, "epoch": 1582} {"train_loss": -42.9072380065918, "global_step": 191463, "epoch": 1582} {"train_loss": -41.50080108642578, "global_step": 191464, "epoch": 1582} {"train_loss": -40.30782699584961, "global_step": 191465, "epoch": 1582} {"train_loss": -41.07954025268555, "global_step": 191466, "epoch": 1582} {"train_loss": -41.99348068237305, "global_step": 191467, "epoch": 1582} {"train_loss": -39.90541458129883, "global_step": 191468, "epoch": 1582} {"train_loss": -42.1934814453125, "global_step": 191469, "epoch": 1582} {"train_loss": -41.7374382019043, "global_step": 191470, "epoch": 1582} {"train_loss": -39.62956237792969, "global_step": 191471, "epoch": 1582} {"train_loss": -42.347267150878906, "global_step": 191472, "epoch": 1582} {"train_loss": -39.56452560424805, "global_step": 191473, "epoch": 1582} {"train_loss": -41.71980667114258, "global_step": 191474, "epoch": 1582} {"train_loss": -41.45302963256836, "global_step": 191475, "epoch": 1582} {"train_loss": -41.108028411865234, "global_step": 191476, "epoch": 1582} {"train_loss": -42.49696731567383, "global_step": 191477, "epoch": 1582} {"train_loss": -41.459999084472656, "global_step": 191478, "epoch": 1582} {"train_loss": -42.27301025390625, "global_step": 191479, "epoch": 1582} {"train_loss": -41.5782585144043, "global_step": 191480, "epoch": 1582} {"train_loss": -42.1659049987793, "global_step": 191481, "epoch": 1582} {"train_loss": -42.76823043823242, "global_step": 191482, "epoch": 1582} {"train_loss": -42.346065521240234, "global_step": 191483, "epoch": 1582} {"train_loss": -42.782745361328125, "global_step": 191484, "epoch": 1582} {"train_loss": -42.619441986083984, "global_step": 191485, "epoch": 1582} {"train_loss": -42.30531692504883, "global_step": 191486, "epoch": 1582} {"train_loss": -42.131954193115234, "global_step": 191487, "epoch": 1582} {"train_loss": -42.41944885253906, "global_step": 191488, "epoch": 1582} {"train_loss": -42.17491149902344, "global_step": 191489, "epoch": 1582} {"train_loss": -42.431549072265625, "global_step": 191490, "epoch": 1582} {"train_loss": -42.97410583496094, "global_step": 191491, "epoch": 1582} {"train_loss": -43.18691635131836, "global_step": 191492, "epoch": 1582} {"train_loss": -42.21382522583008, "global_step": 191493, "epoch": 1582} {"train_loss": -42.075538635253906, "global_step": 191494, "epoch": 1582} {"train_loss": -42.209259033203125, "global_step": 191495, "epoch": 1582} {"train_loss": -42.42643356323242, "global_step": 191496, "epoch": 1582} {"train_loss": -42.959869384765625, "global_step": 191497, "epoch": 1582} {"train_loss": -42.867427825927734, "global_step": 191498, "epoch": 1582} {"train_loss": -42.48984909057617, "global_step": 191499, "epoch": 1582} {"train_loss": -42.66828536987305, "global_step": 191500, "epoch": 1582} {"train_loss": -42.46195983886719, "global_step": 191501, "epoch": 1582} {"train_loss": -42.70211410522461, "global_step": 191502, "epoch": 1582} {"train_loss": -42.41670227050781, "global_step": 191503, "epoch": 1582} {"train_loss": -41.34870147705078, "global_step": 191504, "epoch": 1582} {"train_loss": -41.284793853759766, "global_step": 191505, "epoch": 1582} {"train_loss": -39.84733963012695, "global_step": 191506, "epoch": 1582} {"train_loss": -37.3913459777832, "global_step": 191507, "epoch": 1582} {"train_loss": -37.50885772705078, "global_step": 191508, "epoch": 1582} {"train_loss": -42.24654769897461, "global_step": 191509, "epoch": 1582} {"train_loss": -41.70432662963867, "global_step": 191510, "epoch": 1582} {"train_loss": -39.971439361572266, "global_step": 191511, "epoch": 1582} {"train_loss": -37.049739837646484, "global_step": 191512, "epoch": 1582} {"train_loss": -36.79561233520508, "global_step": 191513, "epoch": 1582} {"train_loss": -39.57549285888672, "global_step": 191514, "epoch": 1582} {"train_loss": -41.6336555480957, "global_step": 191515, "epoch": 1582} {"train_loss": -40.51174545288086, "global_step": 191516, "epoch": 1582} {"train_loss": -40.238643646240234, "global_step": 191517, "epoch": 1582} {"train_loss": -40.35811233520508, "global_step": 191518, "epoch": 1582} {"train_loss": -39.78184127807617, "global_step": 191519, "epoch": 1582} {"train_loss": -41.33712387084961, "global_step": 191520, "epoch": 1582} {"train_loss": -39.84893798828125, "global_step": 191521, "epoch": 1582} {"train_loss": -40.657955169677734, "global_step": 191522, "epoch": 1582} {"train_loss": -41.8831901550293, "global_step": 191523, "epoch": 1582} {"train_loss": -40.45573806762695, "global_step": 191524, "epoch": 1582} {"train_loss": -41.28229904174805, "global_step": 191525, "epoch": 1582} {"train_loss": -41.96639633178711, "global_step": 191526, "epoch": 1582} {"train_loss": -40.44289779663086, "global_step": 191527, "epoch": 1582} {"train_loss": -41.27545166015625, "global_step": 191528, "epoch": 1582} {"train_loss": -40.97915267944336, "global_step": 191529, "epoch": 1582} {"train_loss": -41.71232986450195, "global_step": 191530, "epoch": 1582} {"train_loss": -42.16292953491211, "global_step": 191531, "epoch": 1582} {"train_loss": -42.3609619140625, "global_step": 191532, "epoch": 1582} {"train_loss": -42.84023666381836, "global_step": 191533, "epoch": 1582} {"train_loss": -42.433380126953125, "global_step": 191534, "epoch": 1582} {"train_loss": -42.91954040527344, "global_step": 191535, "epoch": 1582} {"train_loss": -42.71552658081055, "global_step": 191536, "epoch": 1582} {"train_loss": -42.51044464111328, "global_step": 191537, "epoch": 1582} {"train_loss": -42.98810958862305, "global_step": 191538, "epoch": 1582} {"train_loss": -42.83584976196289, "global_step": 191539, "epoch": 1582} {"train_loss": -42.9638786315918, "global_step": 191540, "epoch": 1582} {"train_loss": -42.975120544433594, "global_step": 191541, "epoch": 1582} {"train_loss": -41.639693362653745, "global_step": 191542, "epoch": 1582, "val_loss": 2498759.75} {"train_loss": -42.5298957824707, "global_step": 191543, "epoch": 1583} {"train_loss": -42.943660736083984, "global_step": 191544, "epoch": 1583} {"train_loss": -43.1555290222168, "global_step": 191545, "epoch": 1583} {"train_loss": -42.78594207763672, "global_step": 191546, "epoch": 1583} {"train_loss": -42.82951736450195, "global_step": 191547, "epoch": 1583} {"train_loss": -43.38918685913086, "global_step": 191548, "epoch": 1583} {"train_loss": -42.65312576293945, "global_step": 191549, "epoch": 1583} {"train_loss": -42.78235626220703, "global_step": 191550, "epoch": 1583} {"train_loss": -42.72825241088867, "global_step": 191551, "epoch": 1583} {"train_loss": -42.0294189453125, "global_step": 191552, "epoch": 1583} {"train_loss": -42.24983596801758, "global_step": 191553, "epoch": 1583} {"train_loss": -39.78980255126953, "global_step": 191554, "epoch": 1583} {"train_loss": -39.877288818359375, "global_step": 191555, "epoch": 1583} {"train_loss": -42.12803268432617, "global_step": 191556, "epoch": 1583} {"train_loss": -42.247650146484375, "global_step": 191557, "epoch": 1583} {"train_loss": -40.54522705078125, "global_step": 191558, "epoch": 1583} {"train_loss": -39.14921188354492, "global_step": 191559, "epoch": 1583} {"train_loss": -41.70968246459961, "global_step": 191560, "epoch": 1583} {"train_loss": -41.840576171875, "global_step": 191561, "epoch": 1583} {"train_loss": -41.50111389160156, "global_step": 191562, "epoch": 1583} {"train_loss": -41.747772216796875, "global_step": 191563, "epoch": 1583} {"train_loss": -42.37507247924805, "global_step": 191564, "epoch": 1583} {"train_loss": -41.881065368652344, "global_step": 191565, "epoch": 1583} {"train_loss": -42.27407455444336, "global_step": 191566, "epoch": 1583} {"train_loss": -41.897396087646484, "global_step": 191567, "epoch": 1583} {"train_loss": -41.02543258666992, "global_step": 191568, "epoch": 1583} {"train_loss": -41.72520065307617, "global_step": 191569, "epoch": 1583} {"train_loss": -41.58192825317383, "global_step": 191570, "epoch": 1583} {"train_loss": -42.37347412109375, "global_step": 191571, "epoch": 1583} {"train_loss": -41.81279373168945, "global_step": 191572, "epoch": 1583} {"train_loss": -41.526588439941406, "global_step": 191573, "epoch": 1583} {"train_loss": -41.772029876708984, "global_step": 191574, "epoch": 1583} {"train_loss": -41.33060836791992, "global_step": 191575, "epoch": 1583} {"train_loss": -41.208614349365234, "global_step": 191576, "epoch": 1583} {"train_loss": -41.710670471191406, "global_step": 191577, "epoch": 1583} {"train_loss": -40.4378662109375, "global_step": 191578, "epoch": 1583} {"train_loss": -42.2980842590332, "global_step": 191579, "epoch": 1583} {"train_loss": -41.72186279296875, "global_step": 191580, "epoch": 1583} {"train_loss": -41.70759963989258, "global_step": 191581, "epoch": 1583} {"train_loss": -42.42499542236328, "global_step": 191582, "epoch": 1583} {"train_loss": -41.17558670043945, "global_step": 191583, "epoch": 1583} {"train_loss": -42.27287673950195, "global_step": 191584, "epoch": 1583} {"train_loss": -41.66438674926758, "global_step": 191585, "epoch": 1583} {"train_loss": -42.079952239990234, "global_step": 191586, "epoch": 1583} {"train_loss": -41.97512435913086, "global_step": 191587, "epoch": 1583} {"train_loss": -42.193695068359375, "global_step": 191588, "epoch": 1583} {"train_loss": -42.80977249145508, "global_step": 191589, "epoch": 1583} {"train_loss": -41.84379196166992, "global_step": 191590, "epoch": 1583} {"train_loss": -42.51115036010742, "global_step": 191591, "epoch": 1583} {"train_loss": -42.34914016723633, "global_step": 191592, "epoch": 1583} {"train_loss": -42.53236770629883, "global_step": 191593, "epoch": 1583} {"train_loss": -41.89089584350586, "global_step": 191594, "epoch": 1583} {"train_loss": -41.94596862792969, "global_step": 191595, "epoch": 1583} {"train_loss": -42.360713958740234, "global_step": 191596, "epoch": 1583} {"train_loss": -42.77722930908203, "global_step": 191597, "epoch": 1583} {"train_loss": -42.2203483581543, "global_step": 191598, "epoch": 1583} {"train_loss": -42.256805419921875, "global_step": 191599, "epoch": 1583} {"train_loss": -42.986751556396484, "global_step": 191600, "epoch": 1583} {"train_loss": -42.85468292236328, "global_step": 191601, "epoch": 1583} {"train_loss": -42.73307418823242, "global_step": 191602, "epoch": 1583} {"train_loss": -43.22109603881836, "global_step": 191603, "epoch": 1583} {"train_loss": -43.26185989379883, "global_step": 191604, "epoch": 1583} {"train_loss": -42.11580276489258, "global_step": 191605, "epoch": 1583} {"train_loss": -42.48058319091797, "global_step": 191606, "epoch": 1583} {"train_loss": -42.7623291015625, "global_step": 191607, "epoch": 1583} {"train_loss": -42.282493591308594, "global_step": 191608, "epoch": 1583} {"train_loss": -42.102725982666016, "global_step": 191609, "epoch": 1583} {"train_loss": -42.5007209777832, "global_step": 191610, "epoch": 1583} {"train_loss": -42.68242263793945, "global_step": 191611, "epoch": 1583} {"train_loss": -41.96438980102539, "global_step": 191612, "epoch": 1583} {"train_loss": -42.09834671020508, "global_step": 191613, "epoch": 1583} {"train_loss": -42.925167083740234, "global_step": 191614, "epoch": 1583} {"train_loss": -42.55316925048828, "global_step": 191615, "epoch": 1583} {"train_loss": -42.33952713012695, "global_step": 191616, "epoch": 1583} {"train_loss": -42.72147750854492, "global_step": 191617, "epoch": 1583} {"train_loss": -42.64884567260742, "global_step": 191618, "epoch": 1583} {"train_loss": -42.539825439453125, "global_step": 191619, "epoch": 1583} {"train_loss": -41.8347053527832, "global_step": 191620, "epoch": 1583} {"train_loss": -42.303768157958984, "global_step": 191621, "epoch": 1583} {"train_loss": -43.14095687866211, "global_step": 191622, "epoch": 1583} {"train_loss": -42.40264892578125, "global_step": 191623, "epoch": 1583} {"train_loss": -43.04719543457031, "global_step": 191624, "epoch": 1583} {"train_loss": -42.58903884887695, "global_step": 191625, "epoch": 1583} {"train_loss": -43.02138137817383, "global_step": 191626, "epoch": 1583} {"train_loss": -42.72346115112305, "global_step": 191627, "epoch": 1583} {"train_loss": -42.6459846496582, "global_step": 191628, "epoch": 1583} {"train_loss": -42.197628021240234, "global_step": 191629, "epoch": 1583} {"train_loss": -42.85188674926758, "global_step": 191630, "epoch": 1583} {"train_loss": -42.86458969116211, "global_step": 191631, "epoch": 1583} {"train_loss": -41.83468246459961, "global_step": 191632, "epoch": 1583} {"train_loss": -41.67512512207031, "global_step": 191633, "epoch": 1583} {"train_loss": -42.57700729370117, "global_step": 191634, "epoch": 1583} {"train_loss": -42.165164947509766, "global_step": 191635, "epoch": 1583} {"train_loss": -41.90564727783203, "global_step": 191636, "epoch": 1583} {"train_loss": -42.54688262939453, "global_step": 191637, "epoch": 1583} {"train_loss": -42.70709228515625, "global_step": 191638, "epoch": 1583} {"train_loss": -41.54811477661133, "global_step": 191639, "epoch": 1583} {"train_loss": -42.89326858520508, "global_step": 191640, "epoch": 1583} {"train_loss": -42.21638107299805, "global_step": 191641, "epoch": 1583} {"train_loss": -42.026302337646484, "global_step": 191642, "epoch": 1583} {"train_loss": -42.53989791870117, "global_step": 191643, "epoch": 1583} {"train_loss": -41.926551818847656, "global_step": 191644, "epoch": 1583} {"train_loss": -43.08858871459961, "global_step": 191645, "epoch": 1583} {"train_loss": -41.69626998901367, "global_step": 191646, "epoch": 1583} {"train_loss": -41.09482955932617, "global_step": 191647, "epoch": 1583} {"train_loss": -41.80607223510742, "global_step": 191648, "epoch": 1583} {"train_loss": -41.71917724609375, "global_step": 191649, "epoch": 1583} {"train_loss": -41.613006591796875, "global_step": 191650, "epoch": 1583} {"train_loss": -42.228694915771484, "global_step": 191651, "epoch": 1583} {"train_loss": -42.09186935424805, "global_step": 191652, "epoch": 1583} {"train_loss": -41.464717864990234, "global_step": 191653, "epoch": 1583} {"train_loss": -41.3695068359375, "global_step": 191654, "epoch": 1583} {"train_loss": -41.79413604736328, "global_step": 191655, "epoch": 1583} {"train_loss": -42.328060150146484, "global_step": 191656, "epoch": 1583} {"train_loss": -38.6390495300293, "global_step": 191657, "epoch": 1583} {"train_loss": -40.31186294555664, "global_step": 191658, "epoch": 1583} {"train_loss": -42.495208740234375, "global_step": 191659, "epoch": 1583} {"train_loss": -40.18633270263672, "global_step": 191660, "epoch": 1583} {"train_loss": -41.67011260986328, "global_step": 191661, "epoch": 1583} {"train_loss": -40.292049407958984, "global_step": 191662, "epoch": 1583} {"train_loss": -42.068726846994444, "global_step": 191663, "epoch": 1583, "val_loss": 2485156.25} {"train_loss": -40.94917678833008, "global_step": 191664, "epoch": 1584} {"train_loss": -40.51716232299805, "global_step": 191665, "epoch": 1584} {"train_loss": -40.1417236328125, "global_step": 191666, "epoch": 1584} {"train_loss": -41.36931228637695, "global_step": 191667, "epoch": 1584} {"train_loss": -41.5711669921875, "global_step": 191668, "epoch": 1584} {"train_loss": -41.37321853637695, "global_step": 191669, "epoch": 1584} {"train_loss": -42.74184036254883, "global_step": 191670, "epoch": 1584} {"train_loss": -42.18375778198242, "global_step": 191671, "epoch": 1584} {"train_loss": -41.87697982788086, "global_step": 191672, "epoch": 1584} {"train_loss": -42.24369430541992, "global_step": 191673, "epoch": 1584} {"train_loss": -41.46262741088867, "global_step": 191674, "epoch": 1584} {"train_loss": -42.23000717163086, "global_step": 191675, "epoch": 1584} {"train_loss": -42.137325286865234, "global_step": 191676, "epoch": 1584} {"train_loss": -41.943702697753906, "global_step": 191677, "epoch": 1584} {"train_loss": -41.80497741699219, "global_step": 191678, "epoch": 1584} {"train_loss": -41.474361419677734, "global_step": 191679, "epoch": 1584} {"train_loss": -42.0113525390625, "global_step": 191680, "epoch": 1584} {"train_loss": -41.94411849975586, "global_step": 191681, "epoch": 1584} {"train_loss": -42.417640686035156, "global_step": 191682, "epoch": 1584} {"train_loss": -42.2446174621582, "global_step": 191683, "epoch": 1584} {"train_loss": -42.08774948120117, "global_step": 191684, "epoch": 1584} {"train_loss": -42.434112548828125, "global_step": 191685, "epoch": 1584} {"train_loss": -42.5394172668457, "global_step": 191686, "epoch": 1584} {"train_loss": -42.68593215942383, "global_step": 191687, "epoch": 1584} {"train_loss": -43.05038070678711, "global_step": 191688, "epoch": 1584} {"train_loss": -42.70720291137695, "global_step": 191689, "epoch": 1584} {"train_loss": -42.854331970214844, "global_step": 191690, "epoch": 1584} {"train_loss": -43.36488342285156, "global_step": 191691, "epoch": 1584} {"train_loss": -42.84206771850586, "global_step": 191692, "epoch": 1584} {"train_loss": -42.635799407958984, "global_step": 191693, "epoch": 1584} {"train_loss": -43.34626770019531, "global_step": 191694, "epoch": 1584} {"train_loss": -42.93435287475586, "global_step": 191695, "epoch": 1584} {"train_loss": -43.008121490478516, "global_step": 191696, "epoch": 1584} {"train_loss": -43.138648986816406, "global_step": 191697, "epoch": 1584} {"train_loss": -42.47490310668945, "global_step": 191698, "epoch": 1584} {"train_loss": -42.73752975463867, "global_step": 191699, "epoch": 1584} {"train_loss": -42.955562591552734, "global_step": 191700, "epoch": 1584} {"train_loss": -43.07643508911133, "global_step": 191701, "epoch": 1584} {"train_loss": -42.816585540771484, "global_step": 191702, "epoch": 1584} {"train_loss": -42.967647552490234, "global_step": 191703, "epoch": 1584} {"train_loss": -42.496273040771484, "global_step": 191704, "epoch": 1584} {"train_loss": -42.43037796020508, "global_step": 191705, "epoch": 1584} {"train_loss": -42.87177276611328, "global_step": 191706, "epoch": 1584} {"train_loss": -43.0201301574707, "global_step": 191707, "epoch": 1584} {"train_loss": -42.939517974853516, "global_step": 191708, "epoch": 1584} {"train_loss": -42.89483642578125, "global_step": 191709, "epoch": 1584} {"train_loss": -42.433345794677734, "global_step": 191710, "epoch": 1584} {"train_loss": -41.1805419921875, "global_step": 191711, "epoch": 1584} {"train_loss": -39.39188766479492, "global_step": 191712, "epoch": 1584} {"train_loss": -41.87421798706055, "global_step": 191713, "epoch": 1584} {"train_loss": -41.818965911865234, "global_step": 191714, "epoch": 1584} {"train_loss": -41.09571075439453, "global_step": 191715, "epoch": 1584} {"train_loss": -38.52345657348633, "global_step": 191716, "epoch": 1584} {"train_loss": -36.258785247802734, "global_step": 191717, "epoch": 1584} {"train_loss": -34.537723541259766, "global_step": 191718, "epoch": 1584} {"train_loss": -37.45786666870117, "global_step": 191719, "epoch": 1584} {"train_loss": -40.89361572265625, "global_step": 191720, "epoch": 1584} {"train_loss": -34.45296859741211, "global_step": 191721, "epoch": 1584} {"train_loss": -35.6493034362793, "global_step": 191722, "epoch": 1584} {"train_loss": -41.19108963012695, "global_step": 191723, "epoch": 1584} {"train_loss": -35.42307662963867, "global_step": 191724, "epoch": 1584} {"train_loss": -37.289058685302734, "global_step": 191725, "epoch": 1584} {"train_loss": -39.16434860229492, "global_step": 191726, "epoch": 1584} {"train_loss": -36.654998779296875, "global_step": 191727, "epoch": 1584} {"train_loss": -40.169761657714844, "global_step": 191728, "epoch": 1584} {"train_loss": -38.242347717285156, "global_step": 191729, "epoch": 1584} {"train_loss": -39.64314651489258, "global_step": 191730, "epoch": 1584} {"train_loss": -40.35001754760742, "global_step": 191731, "epoch": 1584} {"train_loss": -39.361446380615234, "global_step": 191732, "epoch": 1584} {"train_loss": -39.7827262878418, "global_step": 191733, "epoch": 1584} {"train_loss": -41.277381896972656, "global_step": 191734, "epoch": 1584} {"train_loss": -40.516754150390625, "global_step": 191735, "epoch": 1584} {"train_loss": -41.66524887084961, "global_step": 191736, "epoch": 1584} {"train_loss": -41.02463912963867, "global_step": 191737, "epoch": 1584} {"train_loss": -41.463714599609375, "global_step": 191738, "epoch": 1584} {"train_loss": -41.33846664428711, "global_step": 191739, "epoch": 1584} {"train_loss": -41.834808349609375, "global_step": 191740, "epoch": 1584} {"train_loss": -41.299415588378906, "global_step": 191741, "epoch": 1584} {"train_loss": -40.77473831176758, "global_step": 191742, "epoch": 1584} {"train_loss": -41.721614837646484, "global_step": 191743, "epoch": 1584} {"train_loss": -41.57985305786133, "global_step": 191744, "epoch": 1584} {"train_loss": -40.93693161010742, "global_step": 191745, "epoch": 1584} {"train_loss": -41.3658447265625, "global_step": 191746, "epoch": 1584} {"train_loss": -41.86343002319336, "global_step": 191747, "epoch": 1584} {"train_loss": -41.033363342285156, "global_step": 191748, "epoch": 1584} {"train_loss": -42.30691909790039, "global_step": 191749, "epoch": 1584} {"train_loss": -42.369895935058594, "global_step": 191750, "epoch": 1584} {"train_loss": -41.90182113647461, "global_step": 191751, "epoch": 1584} {"train_loss": -42.62749099731445, "global_step": 191752, "epoch": 1584} {"train_loss": -41.42196273803711, "global_step": 191753, "epoch": 1584} {"train_loss": -42.061180114746094, "global_step": 191754, "epoch": 1584} {"train_loss": -42.10786056518555, "global_step": 191755, "epoch": 1584} {"train_loss": -41.94905471801758, "global_step": 191756, "epoch": 1584} {"train_loss": -41.48623275756836, "global_step": 191757, "epoch": 1584} {"train_loss": -42.24724578857422, "global_step": 191758, "epoch": 1584} {"train_loss": -42.57428741455078, "global_step": 191759, "epoch": 1584} {"train_loss": -42.4591064453125, "global_step": 191760, "epoch": 1584} {"train_loss": -42.652523040771484, "global_step": 191761, "epoch": 1584} {"train_loss": -42.00297164916992, "global_step": 191762, "epoch": 1584} {"train_loss": -42.614601135253906, "global_step": 191763, "epoch": 1584} {"train_loss": -42.71778106689453, "global_step": 191764, "epoch": 1584} {"train_loss": -42.597198486328125, "global_step": 191765, "epoch": 1584} {"train_loss": -42.550743103027344, "global_step": 191766, "epoch": 1584} {"train_loss": -42.21001052856445, "global_step": 191767, "epoch": 1584} {"train_loss": -42.700199127197266, "global_step": 191768, "epoch": 1584} {"train_loss": -42.789058685302734, "global_step": 191769, "epoch": 1584} {"train_loss": -42.919097900390625, "global_step": 191770, "epoch": 1584} {"train_loss": -42.726539611816406, "global_step": 191771, "epoch": 1584} {"train_loss": -42.92335891723633, "global_step": 191772, "epoch": 1584} {"train_loss": -43.00975036621094, "global_step": 191773, "epoch": 1584} {"train_loss": -42.96775436401367, "global_step": 191774, "epoch": 1584} {"train_loss": -43.220462799072266, "global_step": 191775, "epoch": 1584} {"train_loss": -43.19367599487305, "global_step": 191776, "epoch": 1584} {"train_loss": -43.14608383178711, "global_step": 191777, "epoch": 1584} {"train_loss": -43.30731201171875, "global_step": 191778, "epoch": 1584} {"train_loss": -42.87339782714844, "global_step": 191779, "epoch": 1584} {"train_loss": -43.19779968261719, "global_step": 191780, "epoch": 1584} {"train_loss": -43.44401168823242, "global_step": 191781, "epoch": 1584} {"train_loss": -43.19807815551758, "global_step": 191782, "epoch": 1584} {"train_loss": -43.11092758178711, "global_step": 191783, "epoch": 1584} {"train_loss": -41.61459164580038, "global_step": 191784, "epoch": 1584, "val_loss": 2532417.75} {"train_loss": -42.713226318359375, "global_step": 191785, "epoch": 1585} {"train_loss": -42.93479537963867, "global_step": 191786, "epoch": 1585} {"train_loss": -42.71260452270508, "global_step": 191787, "epoch": 1585} {"train_loss": -42.73712158203125, "global_step": 191788, "epoch": 1585} {"train_loss": -43.07228469848633, "global_step": 191789, "epoch": 1585} {"train_loss": -43.08127212524414, "global_step": 191790, "epoch": 1585} {"train_loss": -43.356170654296875, "global_step": 191791, "epoch": 1585} {"train_loss": -42.73079299926758, "global_step": 191792, "epoch": 1585} {"train_loss": -43.455318450927734, "global_step": 191793, "epoch": 1585} {"train_loss": -43.05636978149414, "global_step": 191794, "epoch": 1585} {"train_loss": -42.07217025756836, "global_step": 191795, "epoch": 1585} {"train_loss": -43.00946044921875, "global_step": 191796, "epoch": 1585} {"train_loss": -42.93143081665039, "global_step": 191797, "epoch": 1585} {"train_loss": -42.67193603515625, "global_step": 191798, "epoch": 1585} {"train_loss": -43.08882522583008, "global_step": 191799, "epoch": 1585} {"train_loss": -42.60740280151367, "global_step": 191800, "epoch": 1585} {"train_loss": -42.122188568115234, "global_step": 191801, "epoch": 1585} {"train_loss": -43.161224365234375, "global_step": 191802, "epoch": 1585} {"train_loss": -43.56117248535156, "global_step": 191803, "epoch": 1585} {"train_loss": -42.34782028198242, "global_step": 191804, "epoch": 1585} {"train_loss": -42.32219314575195, "global_step": 191805, "epoch": 1585} {"train_loss": -42.202083587646484, "global_step": 191806, "epoch": 1585} {"train_loss": -41.373226165771484, "global_step": 191807, "epoch": 1585} {"train_loss": -40.435340881347656, "global_step": 191808, "epoch": 1585} {"train_loss": -41.768917083740234, "global_step": 191809, "epoch": 1585} {"train_loss": -42.511749267578125, "global_step": 191810, "epoch": 1585} {"train_loss": -42.7248649597168, "global_step": 191811, "epoch": 1585} {"train_loss": -42.4123420715332, "global_step": 191812, "epoch": 1585} {"train_loss": -42.096012115478516, "global_step": 191813, "epoch": 1585} {"train_loss": -41.839229583740234, "global_step": 191814, "epoch": 1585} {"train_loss": -42.360076904296875, "global_step": 191815, "epoch": 1585} {"train_loss": -42.9818229675293, "global_step": 191816, "epoch": 1585} {"train_loss": -42.98442459106445, "global_step": 191817, "epoch": 1585} {"train_loss": -42.593868255615234, "global_step": 191818, "epoch": 1585} {"train_loss": -42.08922576904297, "global_step": 191819, "epoch": 1585} {"train_loss": -43.05752182006836, "global_step": 191820, "epoch": 1585} {"train_loss": -42.541534423828125, "global_step": 191821, "epoch": 1585} {"train_loss": -43.28664016723633, "global_step": 191822, "epoch": 1585} {"train_loss": -42.54553985595703, "global_step": 191823, "epoch": 1585} {"train_loss": -42.78254699707031, "global_step": 191824, "epoch": 1585} {"train_loss": -42.681922912597656, "global_step": 191825, "epoch": 1585} {"train_loss": -42.337398529052734, "global_step": 191826, "epoch": 1585} {"train_loss": -41.9160270690918, "global_step": 191827, "epoch": 1585} {"train_loss": -41.28591537475586, "global_step": 191828, "epoch": 1585} {"train_loss": -41.38591766357422, "global_step": 191829, "epoch": 1585} {"train_loss": -42.133846282958984, "global_step": 191830, "epoch": 1585} {"train_loss": -42.22007369995117, "global_step": 191831, "epoch": 1585} {"train_loss": -40.148460388183594, "global_step": 191832, "epoch": 1585} {"train_loss": -38.60492706298828, "global_step": 191833, "epoch": 1585} {"train_loss": -42.17416000366211, "global_step": 191834, "epoch": 1585} {"train_loss": -40.30601501464844, "global_step": 191835, "epoch": 1585} {"train_loss": -35.958614349365234, "global_step": 191836, "epoch": 1585} {"train_loss": -40.58555221557617, "global_step": 191837, "epoch": 1585} {"train_loss": -39.83795928955078, "global_step": 191838, "epoch": 1585} {"train_loss": -39.24094009399414, "global_step": 191839, "epoch": 1585} {"train_loss": -39.712581634521484, "global_step": 191840, "epoch": 1585} {"train_loss": -39.9514274597168, "global_step": 191841, "epoch": 1585} {"train_loss": -41.19480514526367, "global_step": 191842, "epoch": 1585} {"train_loss": -40.9160041809082, "global_step": 191843, "epoch": 1585} {"train_loss": -38.19245910644531, "global_step": 191844, "epoch": 1585} {"train_loss": -41.75278854370117, "global_step": 191845, "epoch": 1585} {"train_loss": -39.836158752441406, "global_step": 191846, "epoch": 1585} {"train_loss": -39.65690231323242, "global_step": 191847, "epoch": 1585} {"train_loss": -38.84359359741211, "global_step": 191848, "epoch": 1585} {"train_loss": -39.4090690612793, "global_step": 191849, "epoch": 1585} {"train_loss": -39.53232955932617, "global_step": 191850, "epoch": 1585} {"train_loss": -40.37040328979492, "global_step": 191851, "epoch": 1585} {"train_loss": -38.96728515625, "global_step": 191852, "epoch": 1585} {"train_loss": -39.419921875, "global_step": 191853, "epoch": 1585} {"train_loss": -38.01142501831055, "global_step": 191854, "epoch": 1585} {"train_loss": -39.73249435424805, "global_step": 191855, "epoch": 1585} {"train_loss": -39.48228454589844, "global_step": 191856, "epoch": 1585} {"train_loss": -39.269222259521484, "global_step": 191857, "epoch": 1585} {"train_loss": -39.06339645385742, "global_step": 191858, "epoch": 1585} {"train_loss": -39.42840576171875, "global_step": 191859, "epoch": 1585} {"train_loss": -39.74610900878906, "global_step": 191860, "epoch": 1585} {"train_loss": -40.115352630615234, "global_step": 191861, "epoch": 1585} {"train_loss": -39.31623077392578, "global_step": 191862, "epoch": 1585} {"train_loss": -41.48481750488281, "global_step": 191863, "epoch": 1585} {"train_loss": -40.3842887878418, "global_step": 191864, "epoch": 1585} {"train_loss": -41.502803802490234, "global_step": 191865, "epoch": 1585} {"train_loss": -40.12017822265625, "global_step": 191866, "epoch": 1585} {"train_loss": -42.028892517089844, "global_step": 191867, "epoch": 1585} {"train_loss": -40.55434799194336, "global_step": 191868, "epoch": 1585} {"train_loss": -41.34471893310547, "global_step": 191869, "epoch": 1585} {"train_loss": -41.39855194091797, "global_step": 191870, "epoch": 1585} {"train_loss": -41.380645751953125, "global_step": 191871, "epoch": 1585} {"train_loss": -41.33203125, "global_step": 191872, "epoch": 1585} {"train_loss": -41.28165817260742, "global_step": 191873, "epoch": 1585} {"train_loss": -41.82656478881836, "global_step": 191874, "epoch": 1585} {"train_loss": -41.804298400878906, "global_step": 191875, "epoch": 1585} {"train_loss": -42.23145294189453, "global_step": 191876, "epoch": 1585} {"train_loss": -41.552757263183594, "global_step": 191877, "epoch": 1585} {"train_loss": -41.768951416015625, "global_step": 191878, "epoch": 1585} {"train_loss": -41.90595245361328, "global_step": 191879, "epoch": 1585} {"train_loss": -42.275238037109375, "global_step": 191880, "epoch": 1585} {"train_loss": -41.98200607299805, "global_step": 191881, "epoch": 1585} {"train_loss": -42.43528366088867, "global_step": 191882, "epoch": 1585} {"train_loss": -42.18874740600586, "global_step": 191883, "epoch": 1585} {"train_loss": -42.386043548583984, "global_step": 191884, "epoch": 1585} {"train_loss": -42.269588470458984, "global_step": 191885, "epoch": 1585} {"train_loss": -42.707244873046875, "global_step": 191886, "epoch": 1585} {"train_loss": -42.72591781616211, "global_step": 191887, "epoch": 1585} {"train_loss": -42.13611602783203, "global_step": 191888, "epoch": 1585} {"train_loss": -42.52951431274414, "global_step": 191889, "epoch": 1585} {"train_loss": -42.52519226074219, "global_step": 191890, "epoch": 1585} {"train_loss": -42.100250244140625, "global_step": 191891, "epoch": 1585} {"train_loss": -42.498382568359375, "global_step": 191892, "epoch": 1585} {"train_loss": -42.700965881347656, "global_step": 191893, "epoch": 1585} {"train_loss": -42.864139556884766, "global_step": 191894, "epoch": 1585} {"train_loss": -42.94830322265625, "global_step": 191895, "epoch": 1585} {"train_loss": -42.8388557434082, "global_step": 191896, "epoch": 1585} {"train_loss": -42.82435989379883, "global_step": 191897, "epoch": 1585} {"train_loss": -42.7592887878418, "global_step": 191898, "epoch": 1585} {"train_loss": -43.302852630615234, "global_step": 191899, "epoch": 1585} {"train_loss": -42.627281188964844, "global_step": 191900, "epoch": 1585} {"train_loss": -43.03188705444336, "global_step": 191901, "epoch": 1585} {"train_loss": -42.9149055480957, "global_step": 191902, "epoch": 1585} {"train_loss": -42.626216888427734, "global_step": 191903, "epoch": 1585} {"train_loss": -43.166954040527344, "global_step": 191904, "epoch": 1585} {"train_loss": -41.64179258110109, "global_step": 191905, "epoch": 1585, "val_loss": 2516087.5} {"train_loss": -43.06464767456055, "global_step": 191906, "epoch": 1586} {"train_loss": -43.144046783447266, "global_step": 191907, "epoch": 1586} {"train_loss": -43.130775451660156, "global_step": 191908, "epoch": 1586} {"train_loss": -43.1837043762207, "global_step": 191909, "epoch": 1586} {"train_loss": -43.31604766845703, "global_step": 191910, "epoch": 1586} {"train_loss": -43.19027328491211, "global_step": 191911, "epoch": 1586} {"train_loss": -43.166015625, "global_step": 191912, "epoch": 1586} {"train_loss": -42.83623123168945, "global_step": 191913, "epoch": 1586} {"train_loss": -43.09377670288086, "global_step": 191914, "epoch": 1586} {"train_loss": -42.73639678955078, "global_step": 191915, "epoch": 1586} {"train_loss": -43.18779373168945, "global_step": 191916, "epoch": 1586} {"train_loss": -42.91270065307617, "global_step": 191917, "epoch": 1586} {"train_loss": -42.427101135253906, "global_step": 191918, "epoch": 1586} {"train_loss": -42.94649124145508, "global_step": 191919, "epoch": 1586} {"train_loss": -42.74641036987305, "global_step": 191920, "epoch": 1586} {"train_loss": -42.288211822509766, "global_step": 191921, "epoch": 1586} {"train_loss": -41.783905029296875, "global_step": 191922, "epoch": 1586} {"train_loss": -40.19472885131836, "global_step": 191923, "epoch": 1586} {"train_loss": -40.94805145263672, "global_step": 191924, "epoch": 1586} {"train_loss": -40.05022048950195, "global_step": 191925, "epoch": 1586} {"train_loss": -39.806400299072266, "global_step": 191926, "epoch": 1586} {"train_loss": -42.03461837768555, "global_step": 191927, "epoch": 1586} {"train_loss": -41.99040603637695, "global_step": 191928, "epoch": 1586} {"train_loss": -40.4972038269043, "global_step": 191929, "epoch": 1586} {"train_loss": -41.766109466552734, "global_step": 191930, "epoch": 1586} {"train_loss": -40.5346794128418, "global_step": 191931, "epoch": 1586} {"train_loss": -40.824058532714844, "global_step": 191932, "epoch": 1586} {"train_loss": -43.03093338012695, "global_step": 191933, "epoch": 1586} {"train_loss": -41.624202728271484, "global_step": 191934, "epoch": 1586} {"train_loss": -41.12862777709961, "global_step": 191935, "epoch": 1586} {"train_loss": -42.77162551879883, "global_step": 191936, "epoch": 1586} {"train_loss": -40.78152084350586, "global_step": 191937, "epoch": 1586} {"train_loss": -41.75992965698242, "global_step": 191938, "epoch": 1586} {"train_loss": -41.764747619628906, "global_step": 191939, "epoch": 1586} {"train_loss": -40.0619010925293, "global_step": 191940, "epoch": 1586} {"train_loss": -42.90812301635742, "global_step": 191941, "epoch": 1586} {"train_loss": -41.370052337646484, "global_step": 191942, "epoch": 1586} {"train_loss": -41.946163177490234, "global_step": 191943, "epoch": 1586} {"train_loss": -42.25423812866211, "global_step": 191944, "epoch": 1586} {"train_loss": -42.20475769042969, "global_step": 191945, "epoch": 1586} {"train_loss": -41.986122131347656, "global_step": 191946, "epoch": 1586} {"train_loss": -42.3847541809082, "global_step": 191947, "epoch": 1586} {"train_loss": -42.21924591064453, "global_step": 191948, "epoch": 1586} {"train_loss": -42.47696304321289, "global_step": 191949, "epoch": 1586} {"train_loss": -41.656166076660156, "global_step": 191950, "epoch": 1586} {"train_loss": -42.74713897705078, "global_step": 191951, "epoch": 1586} {"train_loss": -41.82392120361328, "global_step": 191952, "epoch": 1586} {"train_loss": -42.612545013427734, "global_step": 191953, "epoch": 1586} {"train_loss": -41.76111602783203, "global_step": 191954, "epoch": 1586} {"train_loss": -42.67647171020508, "global_step": 191955, "epoch": 1586} {"train_loss": -41.8816032409668, "global_step": 191956, "epoch": 1586} {"train_loss": -42.26168441772461, "global_step": 191957, "epoch": 1586} {"train_loss": -42.126766204833984, "global_step": 191958, "epoch": 1586} {"train_loss": -42.536376953125, "global_step": 191959, "epoch": 1586} {"train_loss": -42.66315841674805, "global_step": 191960, "epoch": 1586} {"train_loss": -42.63045120239258, "global_step": 191961, "epoch": 1586} {"train_loss": -42.73089599609375, "global_step": 191962, "epoch": 1586} {"train_loss": -43.1328239440918, "global_step": 191963, "epoch": 1586} {"train_loss": -42.96635055541992, "global_step": 191964, "epoch": 1586} {"train_loss": -42.724952697753906, "global_step": 191965, "epoch": 1586} {"train_loss": -42.98908233642578, "global_step": 191966, "epoch": 1586} {"train_loss": -43.05229949951172, "global_step": 191967, "epoch": 1586} {"train_loss": -43.21596908569336, "global_step": 191968, "epoch": 1586} {"train_loss": -43.44758224487305, "global_step": 191969, "epoch": 1586} {"train_loss": -43.18479919433594, "global_step": 191970, "epoch": 1586} {"train_loss": -43.41264343261719, "global_step": 191971, "epoch": 1586} {"train_loss": -42.9044189453125, "global_step": 191972, "epoch": 1586} {"train_loss": -42.2685546875, "global_step": 191973, "epoch": 1586} {"train_loss": -41.82984161376953, "global_step": 191974, "epoch": 1586} {"train_loss": -40.869171142578125, "global_step": 191975, "epoch": 1586} {"train_loss": -39.258174896240234, "global_step": 191976, "epoch": 1586} {"train_loss": -38.77753829956055, "global_step": 191977, "epoch": 1586} {"train_loss": -41.54372787475586, "global_step": 191978, "epoch": 1586} {"train_loss": -42.438907623291016, "global_step": 191979, "epoch": 1586} {"train_loss": -40.30093002319336, "global_step": 191980, "epoch": 1586} {"train_loss": -38.62453842163086, "global_step": 191981, "epoch": 1586} {"train_loss": -40.86033248901367, "global_step": 191982, "epoch": 1586} {"train_loss": -42.4686279296875, "global_step": 191983, "epoch": 1586} {"train_loss": -40.09432601928711, "global_step": 191984, "epoch": 1586} {"train_loss": -39.6763801574707, "global_step": 191985, "epoch": 1586} {"train_loss": -39.77226257324219, "global_step": 191986, "epoch": 1586} {"train_loss": -41.9637565612793, "global_step": 191987, "epoch": 1586} {"train_loss": -41.01460266113281, "global_step": 191988, "epoch": 1586} {"train_loss": -41.7479362487793, "global_step": 191989, "epoch": 1586} {"train_loss": -41.85445022583008, "global_step": 191990, "epoch": 1586} {"train_loss": -41.75335693359375, "global_step": 191991, "epoch": 1586} {"train_loss": -41.749332427978516, "global_step": 191992, "epoch": 1586} {"train_loss": -40.769588470458984, "global_step": 191993, "epoch": 1586} {"train_loss": -42.569271087646484, "global_step": 191994, "epoch": 1586} {"train_loss": -41.61994552612305, "global_step": 191995, "epoch": 1586} {"train_loss": -42.5634765625, "global_step": 191996, "epoch": 1586} {"train_loss": -41.44137191772461, "global_step": 191997, "epoch": 1586} {"train_loss": -41.52265548706055, "global_step": 191998, "epoch": 1586} {"train_loss": -42.01432418823242, "global_step": 191999, "epoch": 1586} {"train_loss": -41.52848434448242, "global_step": 192000, "epoch": 1586} {"train_loss": -42.2874870300293, "global_step": 192001, "epoch": 1586} {"train_loss": -41.405948638916016, "global_step": 192002, "epoch": 1586} {"train_loss": -42.07463073730469, "global_step": 192003, "epoch": 1586} {"train_loss": -41.96126174926758, "global_step": 192004, "epoch": 1586} {"train_loss": -42.472259521484375, "global_step": 192005, "epoch": 1586} {"train_loss": -41.77014923095703, "global_step": 192006, "epoch": 1586} {"train_loss": -41.97285842895508, "global_step": 192007, "epoch": 1586} {"train_loss": -42.634437561035156, "global_step": 192008, "epoch": 1586} {"train_loss": -42.13429260253906, "global_step": 192009, "epoch": 1586} {"train_loss": -42.5982551574707, "global_step": 192010, "epoch": 1586} {"train_loss": -43.004146575927734, "global_step": 192011, "epoch": 1586} {"train_loss": -42.489742279052734, "global_step": 192012, "epoch": 1586} {"train_loss": -42.961334228515625, "global_step": 192013, "epoch": 1586} {"train_loss": -41.75985336303711, "global_step": 192014, "epoch": 1586} {"train_loss": -42.738319396972656, "global_step": 192015, "epoch": 1586} {"train_loss": -43.11031723022461, "global_step": 192016, "epoch": 1586} {"train_loss": -41.89388656616211, "global_step": 192017, "epoch": 1586} {"train_loss": -41.855255126953125, "global_step": 192018, "epoch": 1586} {"train_loss": -42.56903839111328, "global_step": 192019, "epoch": 1586} {"train_loss": -41.98069763183594, "global_step": 192020, "epoch": 1586} {"train_loss": -41.41602325439453, "global_step": 192021, "epoch": 1586} {"train_loss": -41.04468536376953, "global_step": 192022, "epoch": 1586} {"train_loss": -42.6183967590332, "global_step": 192023, "epoch": 1586} {"train_loss": -42.59811019897461, "global_step": 192024, "epoch": 1586} {"train_loss": -41.98191833496094, "global_step": 192025, "epoch": 1586} {"train_loss": -41.99628114306237, "global_step": 192026, "epoch": 1586, "val_loss": 2609987.75} {"train_loss": -42.819427490234375, "global_step": 192027, "epoch": 1587} {"train_loss": -41.359649658203125, "global_step": 192028, "epoch": 1587} {"train_loss": -40.36719512939453, "global_step": 192029, "epoch": 1587} {"train_loss": -41.86187744140625, "global_step": 192030, "epoch": 1587} {"train_loss": -42.32416915893555, "global_step": 192031, "epoch": 1587} {"train_loss": -39.01631546020508, "global_step": 192032, "epoch": 1587} {"train_loss": -41.27104568481445, "global_step": 192033, "epoch": 1587} {"train_loss": -39.83150863647461, "global_step": 192034, "epoch": 1587} {"train_loss": -38.71096420288086, "global_step": 192035, "epoch": 1587} {"train_loss": -40.3018913269043, "global_step": 192036, "epoch": 1587} {"train_loss": -42.01759719848633, "global_step": 192037, "epoch": 1587} {"train_loss": -39.57015609741211, "global_step": 192038, "epoch": 1587} {"train_loss": -41.4559440612793, "global_step": 192039, "epoch": 1587} {"train_loss": -40.954044342041016, "global_step": 192040, "epoch": 1587} {"train_loss": -41.74453353881836, "global_step": 192041, "epoch": 1587} {"train_loss": -42.18988800048828, "global_step": 192042, "epoch": 1587} {"train_loss": -41.12165451049805, "global_step": 192043, "epoch": 1587} {"train_loss": -42.51464080810547, "global_step": 192044, "epoch": 1587} {"train_loss": -40.05282211303711, "global_step": 192045, "epoch": 1587} {"train_loss": -41.5582160949707, "global_step": 192046, "epoch": 1587} {"train_loss": -42.480224609375, "global_step": 192047, "epoch": 1587} {"train_loss": -40.872283935546875, "global_step": 192048, "epoch": 1587} {"train_loss": -41.625816345214844, "global_step": 192049, "epoch": 1587} {"train_loss": -41.691524505615234, "global_step": 192050, "epoch": 1587} {"train_loss": -42.0728759765625, "global_step": 192051, "epoch": 1587} {"train_loss": -41.48823165893555, "global_step": 192052, "epoch": 1587} {"train_loss": -41.63022994995117, "global_step": 192053, "epoch": 1587} {"train_loss": -41.29950714111328, "global_step": 192054, "epoch": 1587} {"train_loss": -40.48596954345703, "global_step": 192055, "epoch": 1587} {"train_loss": -38.906131744384766, "global_step": 192056, "epoch": 1587} {"train_loss": -41.89202880859375, "global_step": 192057, "epoch": 1587} {"train_loss": -42.52495193481445, "global_step": 192058, "epoch": 1587} {"train_loss": -39.66243362426758, "global_step": 192059, "epoch": 1587} {"train_loss": -35.9542121887207, "global_step": 192060, "epoch": 1587} {"train_loss": -37.42871856689453, "global_step": 192061, "epoch": 1587} {"train_loss": -39.7342643737793, "global_step": 192062, "epoch": 1587} {"train_loss": -39.98482131958008, "global_step": 192063, "epoch": 1587} {"train_loss": -36.24885940551758, "global_step": 192064, "epoch": 1587} {"train_loss": -39.975440979003906, "global_step": 192065, "epoch": 1587} {"train_loss": -28.325408935546875, "global_step": 192066, "epoch": 1587} {"train_loss": -39.339141845703125, "global_step": 192067, "epoch": 1587} {"train_loss": -38.72301483154297, "global_step": 192068, "epoch": 1587} {"train_loss": -29.678787231445312, "global_step": 192069, "epoch": 1587} {"train_loss": -36.33167266845703, "global_step": 192070, "epoch": 1587} {"train_loss": -39.498775482177734, "global_step": 192071, "epoch": 1587} {"train_loss": -30.54886245727539, "global_step": 192072, "epoch": 1587} {"train_loss": -28.74185562133789, "global_step": 192073, "epoch": 1587} {"train_loss": -28.860342025756836, "global_step": 192074, "epoch": 1587} {"train_loss": -28.505767822265625, "global_step": 192075, "epoch": 1587} {"train_loss": -21.118053436279297, "global_step": 192076, "epoch": 1587} {"train_loss": -8.250761032104492, "global_step": 192077, "epoch": 1587} {"train_loss": -20.342721939086914, "global_step": 192078, "epoch": 1587} {"train_loss": -26.767118453979492, "global_step": 192079, "epoch": 1587} {"train_loss": -22.627456665039062, "global_step": 192080, "epoch": 1587} {"train_loss": -23.162220001220703, "global_step": 192081, "epoch": 1587} {"train_loss": -30.119970321655273, "global_step": 192082, "epoch": 1587} {"train_loss": -25.4145450592041, "global_step": 192083, "epoch": 1587} {"train_loss": -29.373640060424805, "global_step": 192084, "epoch": 1587} {"train_loss": -28.36638832092285, "global_step": 192085, "epoch": 1587} {"train_loss": -32.64007568359375, "global_step": 192086, "epoch": 1587} {"train_loss": -33.04954147338867, "global_step": 192087, "epoch": 1587} {"train_loss": -31.3353328704834, "global_step": 192088, "epoch": 1587} {"train_loss": -35.52775192260742, "global_step": 192089, "epoch": 1587} {"train_loss": -35.03936767578125, "global_step": 192090, "epoch": 1587} {"train_loss": -35.438758850097656, "global_step": 192091, "epoch": 1587} {"train_loss": -34.184547424316406, "global_step": 192092, "epoch": 1587} {"train_loss": -34.09334945678711, "global_step": 192093, "epoch": 1587} {"train_loss": -36.06450271606445, "global_step": 192094, "epoch": 1587} {"train_loss": -36.695533752441406, "global_step": 192095, "epoch": 1587} {"train_loss": -36.82855987548828, "global_step": 192096, "epoch": 1587} {"train_loss": -37.04865646362305, "global_step": 192097, "epoch": 1587} {"train_loss": -37.113643646240234, "global_step": 192098, "epoch": 1587} {"train_loss": -36.550437927246094, "global_step": 192099, "epoch": 1587} {"train_loss": -37.00270080566406, "global_step": 192100, "epoch": 1587} {"train_loss": -38.37968063354492, "global_step": 192101, "epoch": 1587} {"train_loss": -37.74333572387695, "global_step": 192102, "epoch": 1587} {"train_loss": -37.20309066772461, "global_step": 192103, "epoch": 1587} {"train_loss": -36.2903938293457, "global_step": 192104, "epoch": 1587} {"train_loss": -38.06783676147461, "global_step": 192105, "epoch": 1587} {"train_loss": -37.13546371459961, "global_step": 192106, "epoch": 1587} {"train_loss": -37.96233367919922, "global_step": 192107, "epoch": 1587} {"train_loss": -37.95246124267578, "global_step": 192108, "epoch": 1587} {"train_loss": -38.02126693725586, "global_step": 192109, "epoch": 1587} {"train_loss": -38.66022872924805, "global_step": 192110, "epoch": 1587} {"train_loss": -38.5152587890625, "global_step": 192111, "epoch": 1587} {"train_loss": -39.06218338012695, "global_step": 192112, "epoch": 1587} {"train_loss": -38.59321975708008, "global_step": 192113, "epoch": 1587} {"train_loss": -38.5136604309082, "global_step": 192114, "epoch": 1587} {"train_loss": -38.236629486083984, "global_step": 192115, "epoch": 1587} {"train_loss": -38.21302795410156, "global_step": 192116, "epoch": 1587} {"train_loss": -39.72896957397461, "global_step": 192117, "epoch": 1587} {"train_loss": -38.61807632446289, "global_step": 192118, "epoch": 1587} {"train_loss": -39.50800704956055, "global_step": 192119, "epoch": 1587} {"train_loss": -38.50037384033203, "global_step": 192120, "epoch": 1587} {"train_loss": -39.49669647216797, "global_step": 192121, "epoch": 1587} {"train_loss": -39.45939254760742, "global_step": 192122, "epoch": 1587} {"train_loss": -38.46494674682617, "global_step": 192123, "epoch": 1587} {"train_loss": -39.4902458190918, "global_step": 192124, "epoch": 1587} {"train_loss": -39.90761947631836, "global_step": 192125, "epoch": 1587} {"train_loss": -38.866878509521484, "global_step": 192126, "epoch": 1587} {"train_loss": -38.99161911010742, "global_step": 192127, "epoch": 1587} {"train_loss": -39.74202346801758, "global_step": 192128, "epoch": 1587} {"train_loss": -39.52241516113281, "global_step": 192129, "epoch": 1587} {"train_loss": -39.89594268798828, "global_step": 192130, "epoch": 1587} {"train_loss": -39.73397445678711, "global_step": 192131, "epoch": 1587} {"train_loss": -39.82001876831055, "global_step": 192132, "epoch": 1587} {"train_loss": -39.72617721557617, "global_step": 192133, "epoch": 1587} {"train_loss": -39.98367691040039, "global_step": 192134, "epoch": 1587} {"train_loss": -39.7893180847168, "global_step": 192135, "epoch": 1587} {"train_loss": -40.35188293457031, "global_step": 192136, "epoch": 1587} {"train_loss": -39.519752502441406, "global_step": 192137, "epoch": 1587} {"train_loss": -39.26227951049805, "global_step": 192138, "epoch": 1587} {"train_loss": -40.01227569580078, "global_step": 192139, "epoch": 1587} {"train_loss": -38.81588363647461, "global_step": 192140, "epoch": 1587} {"train_loss": -40.321998596191406, "global_step": 192141, "epoch": 1587} {"train_loss": -40.54130172729492, "global_step": 192142, "epoch": 1587} {"train_loss": -40.51224899291992, "global_step": 192143, "epoch": 1587} {"train_loss": -40.013301849365234, "global_step": 192144, "epoch": 1587} {"train_loss": -39.69880294799805, "global_step": 192145, "epoch": 1587} {"train_loss": -39.86800003051758, "global_step": 192146, "epoch": 1587} {"train_loss": -37.32490200641727, "global_step": 192147, "epoch": 1587, "val_loss": 2472026.75} {"train_loss": -40.84198760986328, "global_step": 192148, "epoch": 1588} {"train_loss": -40.357540130615234, "global_step": 192149, "epoch": 1588} {"train_loss": -41.25429916381836, "global_step": 192150, "epoch": 1588} {"train_loss": -41.090667724609375, "global_step": 192151, "epoch": 1588} {"train_loss": -40.64370346069336, "global_step": 192152, "epoch": 1588} {"train_loss": -40.4853401184082, "global_step": 192153, "epoch": 1588} {"train_loss": -40.492088317871094, "global_step": 192154, "epoch": 1588} {"train_loss": -40.555335998535156, "global_step": 192155, "epoch": 1588} {"train_loss": -41.25154495239258, "global_step": 192156, "epoch": 1588} {"train_loss": -40.409236907958984, "global_step": 192157, "epoch": 1588} {"train_loss": -40.703460693359375, "global_step": 192158, "epoch": 1588} {"train_loss": -41.061988830566406, "global_step": 192159, "epoch": 1588} {"train_loss": -41.72956466674805, "global_step": 192160, "epoch": 1588} {"train_loss": -40.824737548828125, "global_step": 192161, "epoch": 1588} {"train_loss": -41.03995895385742, "global_step": 192162, "epoch": 1588} {"train_loss": -40.882389068603516, "global_step": 192163, "epoch": 1588} {"train_loss": -41.07235336303711, "global_step": 192164, "epoch": 1588} {"train_loss": -41.23176193237305, "global_step": 192165, "epoch": 1588} {"train_loss": -40.99354553222656, "global_step": 192166, "epoch": 1588} {"train_loss": -41.1363525390625, "global_step": 192167, "epoch": 1588} {"train_loss": -41.772762298583984, "global_step": 192168, "epoch": 1588} {"train_loss": -41.71095275878906, "global_step": 192169, "epoch": 1588} {"train_loss": -41.470821380615234, "global_step": 192170, "epoch": 1588} {"train_loss": -39.90473556518555, "global_step": 192171, "epoch": 1588} {"train_loss": -41.18063735961914, "global_step": 192172, "epoch": 1588} {"train_loss": -41.282684326171875, "global_step": 192173, "epoch": 1588} {"train_loss": -41.19553756713867, "global_step": 192174, "epoch": 1588} {"train_loss": -41.215938568115234, "global_step": 192175, "epoch": 1588} {"train_loss": -41.1297721862793, "global_step": 192176, "epoch": 1588} {"train_loss": -41.45490264892578, "global_step": 192177, "epoch": 1588} {"train_loss": -41.23317337036133, "global_step": 192178, "epoch": 1588} {"train_loss": -41.4674186706543, "global_step": 192179, "epoch": 1588} {"train_loss": -41.04370880126953, "global_step": 192180, "epoch": 1588} {"train_loss": -41.63181686401367, "global_step": 192181, "epoch": 1588} {"train_loss": -42.06993865966797, "global_step": 192182, "epoch": 1588} {"train_loss": -41.27567672729492, "global_step": 192183, "epoch": 1588} {"train_loss": -41.57453918457031, "global_step": 192184, "epoch": 1588} {"train_loss": -41.68624496459961, "global_step": 192185, "epoch": 1588} {"train_loss": -41.43616485595703, "global_step": 192186, "epoch": 1588} {"train_loss": -41.4901237487793, "global_step": 192187, "epoch": 1588} {"train_loss": -41.84964370727539, "global_step": 192188, "epoch": 1588} {"train_loss": -42.056556701660156, "global_step": 192189, "epoch": 1588} {"train_loss": -41.170074462890625, "global_step": 192190, "epoch": 1588} {"train_loss": -41.76784133911133, "global_step": 192191, "epoch": 1588} {"train_loss": -42.63240432739258, "global_step": 192192, "epoch": 1588} {"train_loss": -41.072139739990234, "global_step": 192193, "epoch": 1588} {"train_loss": -42.16559982299805, "global_step": 192194, "epoch": 1588} {"train_loss": -41.4329948425293, "global_step": 192195, "epoch": 1588} {"train_loss": -41.78179931640625, "global_step": 192196, "epoch": 1588} {"train_loss": -41.85813903808594, "global_step": 192197, "epoch": 1588} {"train_loss": -41.671566009521484, "global_step": 192198, "epoch": 1588} {"train_loss": -41.94432830810547, "global_step": 192199, "epoch": 1588} {"train_loss": -42.327999114990234, "global_step": 192200, "epoch": 1588} {"train_loss": -41.82749557495117, "global_step": 192201, "epoch": 1588} {"train_loss": -41.14583969116211, "global_step": 192202, "epoch": 1588} {"train_loss": -42.662532806396484, "global_step": 192203, "epoch": 1588} {"train_loss": -42.02183151245117, "global_step": 192204, "epoch": 1588} {"train_loss": -41.894439697265625, "global_step": 192205, "epoch": 1588} {"train_loss": -40.966156005859375, "global_step": 192206, "epoch": 1588} {"train_loss": -41.619720458984375, "global_step": 192207, "epoch": 1588} {"train_loss": -41.12044906616211, "global_step": 192208, "epoch": 1588} {"train_loss": -40.959381103515625, "global_step": 192209, "epoch": 1588} {"train_loss": -41.5828857421875, "global_step": 192210, "epoch": 1588} {"train_loss": -41.00931167602539, "global_step": 192211, "epoch": 1588} {"train_loss": -41.75588607788086, "global_step": 192212, "epoch": 1588} {"train_loss": -41.53438186645508, "global_step": 192213, "epoch": 1588} {"train_loss": -40.355628967285156, "global_step": 192214, "epoch": 1588} {"train_loss": -42.00436019897461, "global_step": 192215, "epoch": 1588} {"train_loss": -41.493221282958984, "global_step": 192216, "epoch": 1588} {"train_loss": -41.61585235595703, "global_step": 192217, "epoch": 1588} {"train_loss": -40.476558685302734, "global_step": 192218, "epoch": 1588} {"train_loss": -41.49541473388672, "global_step": 192219, "epoch": 1588} {"train_loss": -41.17335891723633, "global_step": 192220, "epoch": 1588} {"train_loss": -41.373775482177734, "global_step": 192221, "epoch": 1588} {"train_loss": -40.63459396362305, "global_step": 192222, "epoch": 1588} {"train_loss": -40.491512298583984, "global_step": 192223, "epoch": 1588} {"train_loss": -41.09293746948242, "global_step": 192224, "epoch": 1588} {"train_loss": -40.31653594970703, "global_step": 192225, "epoch": 1588} {"train_loss": -39.8455924987793, "global_step": 192226, "epoch": 1588} {"train_loss": -39.763092041015625, "global_step": 192227, "epoch": 1588} {"train_loss": -39.94804000854492, "global_step": 192228, "epoch": 1588} {"train_loss": -36.42690658569336, "global_step": 192229, "epoch": 1588} {"train_loss": -39.29983139038086, "global_step": 192230, "epoch": 1588} {"train_loss": -39.15955352783203, "global_step": 192231, "epoch": 1588} {"train_loss": -38.91054153442383, "global_step": 192232, "epoch": 1588} {"train_loss": -40.3023567199707, "global_step": 192233, "epoch": 1588} {"train_loss": -39.93626022338867, "global_step": 192234, "epoch": 1588} {"train_loss": -39.18738555908203, "global_step": 192235, "epoch": 1588} {"train_loss": -38.76968002319336, "global_step": 192236, "epoch": 1588} {"train_loss": -41.08158874511719, "global_step": 192237, "epoch": 1588} {"train_loss": -39.922096252441406, "global_step": 192238, "epoch": 1588} {"train_loss": -39.33675003051758, "global_step": 192239, "epoch": 1588} {"train_loss": -39.86483383178711, "global_step": 192240, "epoch": 1588} {"train_loss": -39.756874084472656, "global_step": 192241, "epoch": 1588} {"train_loss": -39.66407012939453, "global_step": 192242, "epoch": 1588} {"train_loss": -37.879451751708984, "global_step": 192243, "epoch": 1588} {"train_loss": -35.75519943237305, "global_step": 192244, "epoch": 1588} {"train_loss": -39.47151565551758, "global_step": 192245, "epoch": 1588} {"train_loss": -33.726295471191406, "global_step": 192246, "epoch": 1588} {"train_loss": -34.47391891479492, "global_step": 192247, "epoch": 1588} {"train_loss": -20.35810661315918, "global_step": 192248, "epoch": 1588} {"train_loss": -27.717161178588867, "global_step": 192249, "epoch": 1588} {"train_loss": -32.37503433227539, "global_step": 192250, "epoch": 1588} {"train_loss": -30.821317672729492, "global_step": 192251, "epoch": 1588} {"train_loss": -34.31199645996094, "global_step": 192252, "epoch": 1588} {"train_loss": -34.790279388427734, "global_step": 192253, "epoch": 1588} {"train_loss": -32.690513610839844, "global_step": 192254, "epoch": 1588} {"train_loss": -36.7564697265625, "global_step": 192255, "epoch": 1588} {"train_loss": -35.2657585144043, "global_step": 192256, "epoch": 1588} {"train_loss": -36.459896087646484, "global_step": 192257, "epoch": 1588} {"train_loss": -35.508487701416016, "global_step": 192258, "epoch": 1588} {"train_loss": -36.4808235168457, "global_step": 192259, "epoch": 1588} {"train_loss": -35.85269546508789, "global_step": 192260, "epoch": 1588} {"train_loss": -38.3875846862793, "global_step": 192261, "epoch": 1588} {"train_loss": -35.6917610168457, "global_step": 192262, "epoch": 1588} {"train_loss": -38.73883056640625, "global_step": 192263, "epoch": 1588} {"train_loss": -37.1098518371582, "global_step": 192264, "epoch": 1588} {"train_loss": -36.91170883178711, "global_step": 192265, "epoch": 1588} {"train_loss": -37.43259811401367, "global_step": 192266, "epoch": 1588} {"train_loss": -37.58587646484375, "global_step": 192267, "epoch": 1588} {"train_loss": -39.70163160907335, "global_step": 192268, "epoch": 1588, "val_loss": 2441598.75} {"train_loss": -36.90747833251953, "global_step": 192269, "epoch": 1589} {"train_loss": -39.025367736816406, "global_step": 192270, "epoch": 1589} {"train_loss": -38.42898178100586, "global_step": 192271, "epoch": 1589} {"train_loss": -39.25716781616211, "global_step": 192272, "epoch": 1589} {"train_loss": -39.454559326171875, "global_step": 192273, "epoch": 1589} {"train_loss": -38.19675827026367, "global_step": 192274, "epoch": 1589} {"train_loss": -39.675758361816406, "global_step": 192275, "epoch": 1589} {"train_loss": -39.208412170410156, "global_step": 192276, "epoch": 1589} {"train_loss": -39.4412727355957, "global_step": 192277, "epoch": 1589} {"train_loss": -39.557373046875, "global_step": 192278, "epoch": 1589} {"train_loss": -39.125484466552734, "global_step": 192279, "epoch": 1589} {"train_loss": -39.213619232177734, "global_step": 192280, "epoch": 1589} {"train_loss": -39.51020431518555, "global_step": 192281, "epoch": 1589} {"train_loss": -39.81345748901367, "global_step": 192282, "epoch": 1589} {"train_loss": -39.329345703125, "global_step": 192283, "epoch": 1589} {"train_loss": -40.4055290222168, "global_step": 192284, "epoch": 1589} {"train_loss": -39.7808952331543, "global_step": 192285, "epoch": 1589} {"train_loss": -40.2421989440918, "global_step": 192286, "epoch": 1589} {"train_loss": -39.74839782714844, "global_step": 192287, "epoch": 1589} {"train_loss": -40.00051498413086, "global_step": 192288, "epoch": 1589} {"train_loss": -40.04812240600586, "global_step": 192289, "epoch": 1589} {"train_loss": -40.52250671386719, "global_step": 192290, "epoch": 1589} {"train_loss": -40.130882263183594, "global_step": 192291, "epoch": 1589} {"train_loss": -41.000606536865234, "global_step": 192292, "epoch": 1589} {"train_loss": -40.34589767456055, "global_step": 192293, "epoch": 1589} {"train_loss": -40.62158966064453, "global_step": 192294, "epoch": 1589} {"train_loss": -40.7882194519043, "global_step": 192295, "epoch": 1589} {"train_loss": -40.741268157958984, "global_step": 192296, "epoch": 1589} {"train_loss": -40.6165771484375, "global_step": 192297, "epoch": 1589} {"train_loss": -40.49189376831055, "global_step": 192298, "epoch": 1589} {"train_loss": -40.75425338745117, "global_step": 192299, "epoch": 1589} {"train_loss": -41.118221282958984, "global_step": 192300, "epoch": 1589} {"train_loss": -40.784725189208984, "global_step": 192301, "epoch": 1589} {"train_loss": -41.097206115722656, "global_step": 192302, "epoch": 1589} {"train_loss": -40.85222244262695, "global_step": 192303, "epoch": 1589} {"train_loss": -41.01898193359375, "global_step": 192304, "epoch": 1589} {"train_loss": -41.12461471557617, "global_step": 192305, "epoch": 1589} {"train_loss": -41.01020050048828, "global_step": 192306, "epoch": 1589} {"train_loss": -41.123390197753906, "global_step": 192307, "epoch": 1589} {"train_loss": -41.0307731628418, "global_step": 192308, "epoch": 1589} {"train_loss": -41.6746940612793, "global_step": 192309, "epoch": 1589} {"train_loss": -40.911163330078125, "global_step": 192310, "epoch": 1589} {"train_loss": -40.82893753051758, "global_step": 192311, "epoch": 1589} {"train_loss": -41.40815353393555, "global_step": 192312, "epoch": 1589} {"train_loss": -41.23722839355469, "global_step": 192313, "epoch": 1589} {"train_loss": -41.33771514892578, "global_step": 192314, "epoch": 1589} {"train_loss": -41.7627067565918, "global_step": 192315, "epoch": 1589} {"train_loss": -41.61007308959961, "global_step": 192316, "epoch": 1589} {"train_loss": -41.614227294921875, "global_step": 192317, "epoch": 1589} {"train_loss": -41.413143157958984, "global_step": 192318, "epoch": 1589} {"train_loss": -40.85676956176758, "global_step": 192319, "epoch": 1589} {"train_loss": -41.50078201293945, "global_step": 192320, "epoch": 1589} {"train_loss": -41.49038314819336, "global_step": 192321, "epoch": 1589} {"train_loss": -41.069820404052734, "global_step": 192322, "epoch": 1589} {"train_loss": -41.13933563232422, "global_step": 192323, "epoch": 1589} {"train_loss": -41.77958297729492, "global_step": 192324, "epoch": 1589} {"train_loss": -40.377445220947266, "global_step": 192325, "epoch": 1589} {"train_loss": -40.689247131347656, "global_step": 192326, "epoch": 1589} {"train_loss": -41.304847717285156, "global_step": 192327, "epoch": 1589} {"train_loss": -41.022621154785156, "global_step": 192328, "epoch": 1589} {"train_loss": -40.765560150146484, "global_step": 192329, "epoch": 1589} {"train_loss": -41.10542678833008, "global_step": 192330, "epoch": 1589} {"train_loss": -41.62826156616211, "global_step": 192331, "epoch": 1589} {"train_loss": -41.312217712402344, "global_step": 192332, "epoch": 1589} {"train_loss": -41.70620346069336, "global_step": 192333, "epoch": 1589} {"train_loss": -41.24253463745117, "global_step": 192334, "epoch": 1589} {"train_loss": -41.637481689453125, "global_step": 192335, "epoch": 1589} {"train_loss": -41.81858444213867, "global_step": 192336, "epoch": 1589} {"train_loss": -40.902305603027344, "global_step": 192337, "epoch": 1589} {"train_loss": -40.431148529052734, "global_step": 192338, "epoch": 1589} {"train_loss": -40.86170196533203, "global_step": 192339, "epoch": 1589} {"train_loss": -41.98672103881836, "global_step": 192340, "epoch": 1589} {"train_loss": -41.14518356323242, "global_step": 192341, "epoch": 1589} {"train_loss": -39.954036712646484, "global_step": 192342, "epoch": 1589} {"train_loss": -40.41733932495117, "global_step": 192343, "epoch": 1589} {"train_loss": -41.691688537597656, "global_step": 192344, "epoch": 1589} {"train_loss": -41.59894943237305, "global_step": 192345, "epoch": 1589} {"train_loss": -41.313018798828125, "global_step": 192346, "epoch": 1589} {"train_loss": -41.49269485473633, "global_step": 192347, "epoch": 1589} {"train_loss": -42.25580978393555, "global_step": 192348, "epoch": 1589} {"train_loss": -41.480037689208984, "global_step": 192349, "epoch": 1589} {"train_loss": -41.85509490966797, "global_step": 192350, "epoch": 1589} {"train_loss": -42.029579162597656, "global_step": 192351, "epoch": 1589} {"train_loss": -42.239906311035156, "global_step": 192352, "epoch": 1589} {"train_loss": -41.96723556518555, "global_step": 192353, "epoch": 1589} {"train_loss": -41.88962936401367, "global_step": 192354, "epoch": 1589} {"train_loss": -41.3992805480957, "global_step": 192355, "epoch": 1589} {"train_loss": -41.97426986694336, "global_step": 192356, "epoch": 1589} {"train_loss": -41.76456832885742, "global_step": 192357, "epoch": 1589} {"train_loss": -41.30280685424805, "global_step": 192358, "epoch": 1589} {"train_loss": -41.813072204589844, "global_step": 192359, "epoch": 1589} {"train_loss": -41.80450439453125, "global_step": 192360, "epoch": 1589} {"train_loss": -41.68513107299805, "global_step": 192361, "epoch": 1589} {"train_loss": -42.32691192626953, "global_step": 192362, "epoch": 1589} {"train_loss": -41.920562744140625, "global_step": 192363, "epoch": 1589} {"train_loss": -41.95029830932617, "global_step": 192364, "epoch": 1589} {"train_loss": -42.50428009033203, "global_step": 192365, "epoch": 1589} {"train_loss": -41.264381408691406, "global_step": 192366, "epoch": 1589} {"train_loss": -41.65218734741211, "global_step": 192367, "epoch": 1589} {"train_loss": -42.00031661987305, "global_step": 192368, "epoch": 1589} {"train_loss": -41.49581527709961, "global_step": 192369, "epoch": 1589} {"train_loss": -41.524715423583984, "global_step": 192370, "epoch": 1589} {"train_loss": -41.66547775268555, "global_step": 192371, "epoch": 1589} {"train_loss": -42.367835998535156, "global_step": 192372, "epoch": 1589} {"train_loss": -42.260799407958984, "global_step": 192373, "epoch": 1589} {"train_loss": -41.749019622802734, "global_step": 192374, "epoch": 1589} {"train_loss": -42.4674186706543, "global_step": 192375, "epoch": 1589} {"train_loss": -42.25532531738281, "global_step": 192376, "epoch": 1589} {"train_loss": -42.66129684448242, "global_step": 192377, "epoch": 1589} {"train_loss": -42.3440055847168, "global_step": 192378, "epoch": 1589} {"train_loss": -42.5459098815918, "global_step": 192379, "epoch": 1589} {"train_loss": -42.330440521240234, "global_step": 192380, "epoch": 1589} {"train_loss": -42.119117736816406, "global_step": 192381, "epoch": 1589} {"train_loss": -41.89874267578125, "global_step": 192382, "epoch": 1589} {"train_loss": -42.56298828125, "global_step": 192383, "epoch": 1589} {"train_loss": -41.91475296020508, "global_step": 192384, "epoch": 1589} {"train_loss": -41.865352630615234, "global_step": 192385, "epoch": 1589} {"train_loss": -42.509559631347656, "global_step": 192386, "epoch": 1589} {"train_loss": -42.342376708984375, "global_step": 192387, "epoch": 1589} {"train_loss": -41.63786697387695, "global_step": 192388, "epoch": 1589} {"train_loss": -41.09238537875089, "global_step": 192389, "epoch": 1589, "val_loss": 2526904.5} {"train_loss": -40.74581527709961, "global_step": 192390, "epoch": 1590} {"train_loss": -42.13786697387695, "global_step": 192391, "epoch": 1590} {"train_loss": -42.13129806518555, "global_step": 192392, "epoch": 1590} {"train_loss": -41.876487731933594, "global_step": 192393, "epoch": 1590} {"train_loss": -42.0036735534668, "global_step": 192394, "epoch": 1590} {"train_loss": -41.39876937866211, "global_step": 192395, "epoch": 1590} {"train_loss": -42.220333099365234, "global_step": 192396, "epoch": 1590} {"train_loss": -41.535675048828125, "global_step": 192397, "epoch": 1590} {"train_loss": -41.01803207397461, "global_step": 192398, "epoch": 1590} {"train_loss": -41.319576263427734, "global_step": 192399, "epoch": 1590} {"train_loss": -41.864715576171875, "global_step": 192400, "epoch": 1590} {"train_loss": -42.1572265625, "global_step": 192401, "epoch": 1590} {"train_loss": -40.985504150390625, "global_step": 192402, "epoch": 1590} {"train_loss": -40.7706298828125, "global_step": 192403, "epoch": 1590} {"train_loss": -41.542205810546875, "global_step": 192404, "epoch": 1590} {"train_loss": -42.186279296875, "global_step": 192405, "epoch": 1590} {"train_loss": -41.038204193115234, "global_step": 192406, "epoch": 1590} {"train_loss": -39.825592041015625, "global_step": 192407, "epoch": 1590} {"train_loss": -40.86707305908203, "global_step": 192408, "epoch": 1590} {"train_loss": -40.9347038269043, "global_step": 192409, "epoch": 1590} {"train_loss": -41.086727142333984, "global_step": 192410, "epoch": 1590} {"train_loss": -42.29642868041992, "global_step": 192411, "epoch": 1590} {"train_loss": -41.226348876953125, "global_step": 192412, "epoch": 1590} {"train_loss": -38.76770782470703, "global_step": 192413, "epoch": 1590} {"train_loss": -40.74332809448242, "global_step": 192414, "epoch": 1590} {"train_loss": -41.318267822265625, "global_step": 192415, "epoch": 1590} {"train_loss": -39.02750015258789, "global_step": 192416, "epoch": 1590} {"train_loss": -38.991477966308594, "global_step": 192417, "epoch": 1590} {"train_loss": -40.400794982910156, "global_step": 192418, "epoch": 1590} {"train_loss": -39.000144958496094, "global_step": 192419, "epoch": 1590} {"train_loss": -39.67939376831055, "global_step": 192420, "epoch": 1590} {"train_loss": -39.7836799621582, "global_step": 192421, "epoch": 1590} {"train_loss": -38.39483642578125, "global_step": 192422, "epoch": 1590} {"train_loss": -40.33515930175781, "global_step": 192423, "epoch": 1590} {"train_loss": -39.667022705078125, "global_step": 192424, "epoch": 1590} {"train_loss": -41.362213134765625, "global_step": 192425, "epoch": 1590} {"train_loss": -40.0217399597168, "global_step": 192426, "epoch": 1590} {"train_loss": -40.49380111694336, "global_step": 192427, "epoch": 1590} {"train_loss": -41.743160247802734, "global_step": 192428, "epoch": 1590} {"train_loss": -41.20835494995117, "global_step": 192429, "epoch": 1590} {"train_loss": -40.952301025390625, "global_step": 192430, "epoch": 1590} {"train_loss": -41.72468948364258, "global_step": 192431, "epoch": 1590} {"train_loss": -41.835689544677734, "global_step": 192432, "epoch": 1590} {"train_loss": -41.48297882080078, "global_step": 192433, "epoch": 1590} {"train_loss": -41.80017852783203, "global_step": 192434, "epoch": 1590} {"train_loss": -41.905906677246094, "global_step": 192435, "epoch": 1590} {"train_loss": -41.8104362487793, "global_step": 192436, "epoch": 1590} {"train_loss": -41.56977462768555, "global_step": 192437, "epoch": 1590} {"train_loss": -41.872135162353516, "global_step": 192438, "epoch": 1590} {"train_loss": -41.95705795288086, "global_step": 192439, "epoch": 1590} {"train_loss": -41.487579345703125, "global_step": 192440, "epoch": 1590} {"train_loss": -41.58993148803711, "global_step": 192441, "epoch": 1590} {"train_loss": -42.14271926879883, "global_step": 192442, "epoch": 1590} {"train_loss": -42.18532943725586, "global_step": 192443, "epoch": 1590} {"train_loss": -41.039649963378906, "global_step": 192444, "epoch": 1590} {"train_loss": -41.817562103271484, "global_step": 192445, "epoch": 1590} {"train_loss": -41.56997299194336, "global_step": 192446, "epoch": 1590} {"train_loss": -41.48224639892578, "global_step": 192447, "epoch": 1590} {"train_loss": -41.128639221191406, "global_step": 192448, "epoch": 1590} {"train_loss": -41.37939453125, "global_step": 192449, "epoch": 1590} {"train_loss": -41.405452728271484, "global_step": 192450, "epoch": 1590} {"train_loss": -41.682830810546875, "global_step": 192451, "epoch": 1590} {"train_loss": -40.79472732543945, "global_step": 192452, "epoch": 1590} {"train_loss": -42.45656967163086, "global_step": 192453, "epoch": 1590} {"train_loss": -40.802215576171875, "global_step": 192454, "epoch": 1590} {"train_loss": -41.28240966796875, "global_step": 192455, "epoch": 1590} {"train_loss": -41.1102409362793, "global_step": 192456, "epoch": 1590} {"train_loss": -41.779815673828125, "global_step": 192457, "epoch": 1590} {"train_loss": -42.02949142456055, "global_step": 192458, "epoch": 1590} {"train_loss": -41.09718704223633, "global_step": 192459, "epoch": 1590} {"train_loss": -41.792945861816406, "global_step": 192460, "epoch": 1590} {"train_loss": -41.18148422241211, "global_step": 192461, "epoch": 1590} {"train_loss": -41.249359130859375, "global_step": 192462, "epoch": 1590} {"train_loss": -42.182254791259766, "global_step": 192463, "epoch": 1590} {"train_loss": -41.23704147338867, "global_step": 192464, "epoch": 1590} {"train_loss": -42.08859634399414, "global_step": 192465, "epoch": 1590} {"train_loss": -41.06863021850586, "global_step": 192466, "epoch": 1590} {"train_loss": -41.90438461303711, "global_step": 192467, "epoch": 1590} {"train_loss": -41.12614059448242, "global_step": 192468, "epoch": 1590} {"train_loss": -40.60908126831055, "global_step": 192469, "epoch": 1590} {"train_loss": -41.80730056762695, "global_step": 192470, "epoch": 1590} {"train_loss": -41.84443283081055, "global_step": 192471, "epoch": 1590} {"train_loss": -41.888038635253906, "global_step": 192472, "epoch": 1590} {"train_loss": -41.94918441772461, "global_step": 192473, "epoch": 1590} {"train_loss": -41.775386810302734, "global_step": 192474, "epoch": 1590} {"train_loss": -42.024635314941406, "global_step": 192475, "epoch": 1590} {"train_loss": -41.638938903808594, "global_step": 192476, "epoch": 1590} {"train_loss": -41.42563247680664, "global_step": 192477, "epoch": 1590} {"train_loss": -41.809444427490234, "global_step": 192478, "epoch": 1590} {"train_loss": -41.538387298583984, "global_step": 192479, "epoch": 1590} {"train_loss": -41.194820404052734, "global_step": 192480, "epoch": 1590} {"train_loss": -41.7243766784668, "global_step": 192481, "epoch": 1590} {"train_loss": -41.8713493347168, "global_step": 192482, "epoch": 1590} {"train_loss": -40.902008056640625, "global_step": 192483, "epoch": 1590} {"train_loss": -41.67635726928711, "global_step": 192484, "epoch": 1590} {"train_loss": -42.20228958129883, "global_step": 192485, "epoch": 1590} {"train_loss": -41.98734664916992, "global_step": 192486, "epoch": 1590} {"train_loss": -41.94152069091797, "global_step": 192487, "epoch": 1590} {"train_loss": -42.62864685058594, "global_step": 192488, "epoch": 1590} {"train_loss": -41.0163688659668, "global_step": 192489, "epoch": 1590} {"train_loss": -41.28278732299805, "global_step": 192490, "epoch": 1590} {"train_loss": -40.52690505981445, "global_step": 192491, "epoch": 1590} {"train_loss": -41.93319320678711, "global_step": 192492, "epoch": 1590} {"train_loss": -42.06171798706055, "global_step": 192493, "epoch": 1590} {"train_loss": -42.676082611083984, "global_step": 192494, "epoch": 1590} {"train_loss": -41.56367111206055, "global_step": 192495, "epoch": 1590} {"train_loss": -40.74453353881836, "global_step": 192496, "epoch": 1590} {"train_loss": -39.775325775146484, "global_step": 192497, "epoch": 1590} {"train_loss": -42.172908782958984, "global_step": 192498, "epoch": 1590} {"train_loss": -40.6382942199707, "global_step": 192499, "epoch": 1590} {"train_loss": -37.480098724365234, "global_step": 192500, "epoch": 1590} {"train_loss": -38.69287872314453, "global_step": 192501, "epoch": 1590} {"train_loss": -42.157894134521484, "global_step": 192502, "epoch": 1590} {"train_loss": -39.98747634887695, "global_step": 192503, "epoch": 1590} {"train_loss": -38.66421127319336, "global_step": 192504, "epoch": 1590} {"train_loss": -40.362770080566406, "global_step": 192505, "epoch": 1590} {"train_loss": -41.523624420166016, "global_step": 192506, "epoch": 1590} {"train_loss": -39.74534606933594, "global_step": 192507, "epoch": 1590} {"train_loss": -41.649452209472656, "global_step": 192508, "epoch": 1590} {"train_loss": -40.52681350708008, "global_step": 192509, "epoch": 1590} {"train_loss": -41.18323072323129, "global_step": 192510, "epoch": 1590, "val_loss": 2526510.0} {"train_loss": -41.22043228149414, "global_step": 192511, "epoch": 1591} {"train_loss": -41.11955642700195, "global_step": 192512, "epoch": 1591} {"train_loss": -40.93307113647461, "global_step": 192513, "epoch": 1591} {"train_loss": -40.20505905151367, "global_step": 192514, "epoch": 1591} {"train_loss": -40.49869155883789, "global_step": 192515, "epoch": 1591} {"train_loss": -41.66549301147461, "global_step": 192516, "epoch": 1591} {"train_loss": -39.35258483886719, "global_step": 192517, "epoch": 1591} {"train_loss": -41.28131866455078, "global_step": 192518, "epoch": 1591} {"train_loss": -40.563621520996094, "global_step": 192519, "epoch": 1591} {"train_loss": -40.39199447631836, "global_step": 192520, "epoch": 1591} {"train_loss": -39.95223617553711, "global_step": 192521, "epoch": 1591} {"train_loss": -40.970428466796875, "global_step": 192522, "epoch": 1591} {"train_loss": -42.07440948486328, "global_step": 192523, "epoch": 1591} {"train_loss": -40.41606140136719, "global_step": 192524, "epoch": 1591} {"train_loss": -41.07804489135742, "global_step": 192525, "epoch": 1591} {"train_loss": -41.18752670288086, "global_step": 192526, "epoch": 1591} {"train_loss": -40.4216423034668, "global_step": 192527, "epoch": 1591} {"train_loss": -40.39559555053711, "global_step": 192528, "epoch": 1591} {"train_loss": -41.746437072753906, "global_step": 192529, "epoch": 1591} {"train_loss": -40.75564193725586, "global_step": 192530, "epoch": 1591} {"train_loss": -40.344459533691406, "global_step": 192531, "epoch": 1591} {"train_loss": -40.825809478759766, "global_step": 192532, "epoch": 1591} {"train_loss": -41.88951873779297, "global_step": 192533, "epoch": 1591} {"train_loss": -40.18465805053711, "global_step": 192534, "epoch": 1591} {"train_loss": -40.53776550292969, "global_step": 192535, "epoch": 1591} {"train_loss": -41.6125602722168, "global_step": 192536, "epoch": 1591} {"train_loss": -40.51247024536133, "global_step": 192537, "epoch": 1591} {"train_loss": -41.368629455566406, "global_step": 192538, "epoch": 1591} {"train_loss": -41.66563034057617, "global_step": 192539, "epoch": 1591} {"train_loss": -40.679935455322266, "global_step": 192540, "epoch": 1591} {"train_loss": -41.069976806640625, "global_step": 192541, "epoch": 1591} {"train_loss": -41.53144454956055, "global_step": 192542, "epoch": 1591} {"train_loss": -41.10577392578125, "global_step": 192543, "epoch": 1591} {"train_loss": -41.549354553222656, "global_step": 192544, "epoch": 1591} {"train_loss": -41.78425979614258, "global_step": 192545, "epoch": 1591} {"train_loss": -41.87214660644531, "global_step": 192546, "epoch": 1591} {"train_loss": -41.4245491027832, "global_step": 192547, "epoch": 1591} {"train_loss": -41.586212158203125, "global_step": 192548, "epoch": 1591} {"train_loss": -41.52236557006836, "global_step": 192549, "epoch": 1591} {"train_loss": -41.6064567565918, "global_step": 192550, "epoch": 1591} {"train_loss": -42.083736419677734, "global_step": 192551, "epoch": 1591} {"train_loss": -41.55891036987305, "global_step": 192552, "epoch": 1591} {"train_loss": -41.60712814331055, "global_step": 192553, "epoch": 1591} {"train_loss": -41.608131408691406, "global_step": 192554, "epoch": 1591} {"train_loss": -42.27952194213867, "global_step": 192555, "epoch": 1591} {"train_loss": -41.61469650268555, "global_step": 192556, "epoch": 1591} {"train_loss": -41.939144134521484, "global_step": 192557, "epoch": 1591} {"train_loss": -40.868019104003906, "global_step": 192558, "epoch": 1591} {"train_loss": -42.12685775756836, "global_step": 192559, "epoch": 1591} {"train_loss": -41.56672286987305, "global_step": 192560, "epoch": 1591} {"train_loss": -41.72443771362305, "global_step": 192561, "epoch": 1591} {"train_loss": -42.36396026611328, "global_step": 192562, "epoch": 1591} {"train_loss": -41.36149597167969, "global_step": 192563, "epoch": 1591} {"train_loss": -42.27094268798828, "global_step": 192564, "epoch": 1591} {"train_loss": -42.2220573425293, "global_step": 192565, "epoch": 1591} {"train_loss": -42.18877029418945, "global_step": 192566, "epoch": 1591} {"train_loss": -42.32927703857422, "global_step": 192567, "epoch": 1591} {"train_loss": -42.331031799316406, "global_step": 192568, "epoch": 1591} {"train_loss": -42.62666320800781, "global_step": 192569, "epoch": 1591} {"train_loss": -42.50777053833008, "global_step": 192570, "epoch": 1591} {"train_loss": -42.46210479736328, "global_step": 192571, "epoch": 1591} {"train_loss": -42.043174743652344, "global_step": 192572, "epoch": 1591} {"train_loss": -42.781185150146484, "global_step": 192573, "epoch": 1591} {"train_loss": -42.8751220703125, "global_step": 192574, "epoch": 1591} {"train_loss": -41.665931701660156, "global_step": 192575, "epoch": 1591} {"train_loss": -42.060298919677734, "global_step": 192576, "epoch": 1591} {"train_loss": -42.47145080566406, "global_step": 192577, "epoch": 1591} {"train_loss": -42.495723724365234, "global_step": 192578, "epoch": 1591} {"train_loss": -42.6651496887207, "global_step": 192579, "epoch": 1591} {"train_loss": -42.42249298095703, "global_step": 192580, "epoch": 1591} {"train_loss": -42.50651168823242, "global_step": 192581, "epoch": 1591} {"train_loss": -42.49444580078125, "global_step": 192582, "epoch": 1591} {"train_loss": -42.09207534790039, "global_step": 192583, "epoch": 1591} {"train_loss": -42.79896926879883, "global_step": 192584, "epoch": 1591} {"train_loss": -42.32805633544922, "global_step": 192585, "epoch": 1591} {"train_loss": -42.224117279052734, "global_step": 192586, "epoch": 1591} {"train_loss": -42.6978759765625, "global_step": 192587, "epoch": 1591} {"train_loss": -42.636226654052734, "global_step": 192588, "epoch": 1591} {"train_loss": -42.613121032714844, "global_step": 192589, "epoch": 1591} {"train_loss": -41.970947265625, "global_step": 192590, "epoch": 1591} {"train_loss": -42.75598907470703, "global_step": 192591, "epoch": 1591} {"train_loss": -42.69695281982422, "global_step": 192592, "epoch": 1591} {"train_loss": -42.71392822265625, "global_step": 192593, "epoch": 1591} {"train_loss": -42.68282699584961, "global_step": 192594, "epoch": 1591} {"train_loss": -42.34900665283203, "global_step": 192595, "epoch": 1591} {"train_loss": -41.69245147705078, "global_step": 192596, "epoch": 1591} {"train_loss": -39.05998611450195, "global_step": 192597, "epoch": 1591} {"train_loss": -35.49331283569336, "global_step": 192598, "epoch": 1591} {"train_loss": -41.43846893310547, "global_step": 192599, "epoch": 1591} {"train_loss": -36.69679641723633, "global_step": 192600, "epoch": 1591} {"train_loss": -36.4340934753418, "global_step": 192601, "epoch": 1591} {"train_loss": -41.7847785949707, "global_step": 192602, "epoch": 1591} {"train_loss": -36.661251068115234, "global_step": 192603, "epoch": 1591} {"train_loss": -41.17031478881836, "global_step": 192604, "epoch": 1591} {"train_loss": -38.90118408203125, "global_step": 192605, "epoch": 1591} {"train_loss": -39.01740264892578, "global_step": 192606, "epoch": 1591} {"train_loss": -40.64503860473633, "global_step": 192607, "epoch": 1591} {"train_loss": -38.804813385009766, "global_step": 192608, "epoch": 1591} {"train_loss": -40.63699722290039, "global_step": 192609, "epoch": 1591} {"train_loss": -40.27641296386719, "global_step": 192610, "epoch": 1591} {"train_loss": -40.915870666503906, "global_step": 192611, "epoch": 1591} {"train_loss": -40.38825607299805, "global_step": 192612, "epoch": 1591} {"train_loss": -40.6562614440918, "global_step": 192613, "epoch": 1591} {"train_loss": -41.15618896484375, "global_step": 192614, "epoch": 1591} {"train_loss": -41.11079788208008, "global_step": 192615, "epoch": 1591} {"train_loss": -40.48484420776367, "global_step": 192616, "epoch": 1591} {"train_loss": -40.86635208129883, "global_step": 192617, "epoch": 1591} {"train_loss": -40.64850616455078, "global_step": 192618, "epoch": 1591} {"train_loss": -40.24018096923828, "global_step": 192619, "epoch": 1591} {"train_loss": -41.33260726928711, "global_step": 192620, "epoch": 1591} {"train_loss": -39.79720687866211, "global_step": 192621, "epoch": 1591} {"train_loss": -41.570655822753906, "global_step": 192622, "epoch": 1591} {"train_loss": -41.02066421508789, "global_step": 192623, "epoch": 1591} {"train_loss": -40.75062942504883, "global_step": 192624, "epoch": 1591} {"train_loss": -41.56809616088867, "global_step": 192625, "epoch": 1591} {"train_loss": -40.87499237060547, "global_step": 192626, "epoch": 1591} {"train_loss": -41.84031295776367, "global_step": 192627, "epoch": 1591} {"train_loss": -40.81098556518555, "global_step": 192628, "epoch": 1591} {"train_loss": -41.10801315307617, "global_step": 192629, "epoch": 1591} {"train_loss": -41.48572540283203, "global_step": 192630, "epoch": 1591} {"train_loss": -41.24374928750282, "global_step": 192631, "epoch": 1591, "val_loss": 2518168.75} {"train_loss": -41.65452194213867, "global_step": 192632, "epoch": 1592} {"train_loss": -41.210750579833984, "global_step": 192633, "epoch": 1592} {"train_loss": -40.82075500488281, "global_step": 192634, "epoch": 1592} {"train_loss": -41.522335052490234, "global_step": 192635, "epoch": 1592} {"train_loss": -40.32546615600586, "global_step": 192636, "epoch": 1592} {"train_loss": -41.2491569519043, "global_step": 192637, "epoch": 1592} {"train_loss": -41.821834564208984, "global_step": 192638, "epoch": 1592} {"train_loss": -40.84626388549805, "global_step": 192639, "epoch": 1592} {"train_loss": -40.907283782958984, "global_step": 192640, "epoch": 1592} {"train_loss": -41.835689544677734, "global_step": 192641, "epoch": 1592} {"train_loss": -42.02363204956055, "global_step": 192642, "epoch": 1592} {"train_loss": -42.54269027709961, "global_step": 192643, "epoch": 1592} {"train_loss": -41.66592025756836, "global_step": 192644, "epoch": 1592} {"train_loss": -42.3191032409668, "global_step": 192645, "epoch": 1592} {"train_loss": -41.73551559448242, "global_step": 192646, "epoch": 1592} {"train_loss": -41.909053802490234, "global_step": 192647, "epoch": 1592} {"train_loss": -41.56622314453125, "global_step": 192648, "epoch": 1592} {"train_loss": -42.39448165893555, "global_step": 192649, "epoch": 1592} {"train_loss": -42.3901252746582, "global_step": 192650, "epoch": 1592} {"train_loss": -42.230072021484375, "global_step": 192651, "epoch": 1592} {"train_loss": -42.48622512817383, "global_step": 192652, "epoch": 1592} {"train_loss": -41.89376449584961, "global_step": 192653, "epoch": 1592} {"train_loss": -42.45833969116211, "global_step": 192654, "epoch": 1592} {"train_loss": -42.35090637207031, "global_step": 192655, "epoch": 1592} {"train_loss": -42.09757614135742, "global_step": 192656, "epoch": 1592} {"train_loss": -41.22623825073242, "global_step": 192657, "epoch": 1592} {"train_loss": -42.21307373046875, "global_step": 192658, "epoch": 1592} {"train_loss": -42.7761344909668, "global_step": 192659, "epoch": 1592} {"train_loss": -42.409908294677734, "global_step": 192660, "epoch": 1592} {"train_loss": -41.54037857055664, "global_step": 192661, "epoch": 1592} {"train_loss": -40.50922775268555, "global_step": 192662, "epoch": 1592} {"train_loss": -40.108577728271484, "global_step": 192663, "epoch": 1592} {"train_loss": -38.28729248046875, "global_step": 192664, "epoch": 1592} {"train_loss": -38.73395538330078, "global_step": 192665, "epoch": 1592} {"train_loss": -41.23199462890625, "global_step": 192666, "epoch": 1592} {"train_loss": -41.531837463378906, "global_step": 192667, "epoch": 1592} {"train_loss": -41.17356491088867, "global_step": 192668, "epoch": 1592} {"train_loss": -39.05695724487305, "global_step": 192669, "epoch": 1592} {"train_loss": -41.085636138916016, "global_step": 192670, "epoch": 1592} {"train_loss": -42.216949462890625, "global_step": 192671, "epoch": 1592} {"train_loss": -38.76970291137695, "global_step": 192672, "epoch": 1592} {"train_loss": -37.26091384887695, "global_step": 192673, "epoch": 1592} {"train_loss": -41.93117904663086, "global_step": 192674, "epoch": 1592} {"train_loss": -35.49921417236328, "global_step": 192675, "epoch": 1592} {"train_loss": -38.706111907958984, "global_step": 192676, "epoch": 1592} {"train_loss": -33.3855094909668, "global_step": 192677, "epoch": 1592} {"train_loss": -32.32845687866211, "global_step": 192678, "epoch": 1592} {"train_loss": -38.47504806518555, "global_step": 192679, "epoch": 1592} {"train_loss": -27.932861328125, "global_step": 192680, "epoch": 1592} {"train_loss": -38.37699890136719, "global_step": 192681, "epoch": 1592} {"train_loss": -32.96488952636719, "global_step": 192682, "epoch": 1592} {"train_loss": -36.355472564697266, "global_step": 192683, "epoch": 1592} {"train_loss": -39.2125129699707, "global_step": 192684, "epoch": 1592} {"train_loss": -37.640625, "global_step": 192685, "epoch": 1592} {"train_loss": -39.23736572265625, "global_step": 192686, "epoch": 1592} {"train_loss": -37.41590881347656, "global_step": 192687, "epoch": 1592} {"train_loss": -39.01522445678711, "global_step": 192688, "epoch": 1592} {"train_loss": -38.94477844238281, "global_step": 192689, "epoch": 1592} {"train_loss": -38.688655853271484, "global_step": 192690, "epoch": 1592} {"train_loss": -38.5462760925293, "global_step": 192691, "epoch": 1592} {"train_loss": -36.359554290771484, "global_step": 192692, "epoch": 1592} {"train_loss": -39.18217849731445, "global_step": 192693, "epoch": 1592} {"train_loss": -38.76459884643555, "global_step": 192694, "epoch": 1592} {"train_loss": -38.478450775146484, "global_step": 192695, "epoch": 1592} {"train_loss": -39.754878997802734, "global_step": 192696, "epoch": 1592} {"train_loss": -38.15869140625, "global_step": 192697, "epoch": 1592} {"train_loss": -40.09640121459961, "global_step": 192698, "epoch": 1592} {"train_loss": -39.37533187866211, "global_step": 192699, "epoch": 1592} {"train_loss": -40.40568542480469, "global_step": 192700, "epoch": 1592} {"train_loss": -39.52271270751953, "global_step": 192701, "epoch": 1592} {"train_loss": -41.09385299682617, "global_step": 192702, "epoch": 1592} {"train_loss": -40.707725524902344, "global_step": 192703, "epoch": 1592} {"train_loss": -41.275386810302734, "global_step": 192704, "epoch": 1592} {"train_loss": -40.35370635986328, "global_step": 192705, "epoch": 1592} {"train_loss": -41.38365173339844, "global_step": 192706, "epoch": 1592} {"train_loss": -40.857643127441406, "global_step": 192707, "epoch": 1592} {"train_loss": -41.441219329833984, "global_step": 192708, "epoch": 1592} {"train_loss": -41.16716384887695, "global_step": 192709, "epoch": 1592} {"train_loss": -41.1667594909668, "global_step": 192710, "epoch": 1592} {"train_loss": -41.32699203491211, "global_step": 192711, "epoch": 1592} {"train_loss": -41.33028793334961, "global_step": 192712, "epoch": 1592} {"train_loss": -41.16939163208008, "global_step": 192713, "epoch": 1592} {"train_loss": -41.539215087890625, "global_step": 192714, "epoch": 1592} {"train_loss": -41.150943756103516, "global_step": 192715, "epoch": 1592} {"train_loss": -41.6193962097168, "global_step": 192716, "epoch": 1592} {"train_loss": -41.56010055541992, "global_step": 192717, "epoch": 1592} {"train_loss": -42.01180648803711, "global_step": 192718, "epoch": 1592} {"train_loss": -41.766571044921875, "global_step": 192719, "epoch": 1592} {"train_loss": -42.17498779296875, "global_step": 192720, "epoch": 1592} {"train_loss": -42.008575439453125, "global_step": 192721, "epoch": 1592} {"train_loss": -42.1724853515625, "global_step": 192722, "epoch": 1592} {"train_loss": -42.060420989990234, "global_step": 192723, "epoch": 1592} {"train_loss": -41.92529296875, "global_step": 192724, "epoch": 1592} {"train_loss": -41.78964614868164, "global_step": 192725, "epoch": 1592} {"train_loss": -42.1583366394043, "global_step": 192726, "epoch": 1592} {"train_loss": -42.00143051147461, "global_step": 192727, "epoch": 1592} {"train_loss": -42.187110900878906, "global_step": 192728, "epoch": 1592} {"train_loss": -42.3537712097168, "global_step": 192729, "epoch": 1592} {"train_loss": -42.345611572265625, "global_step": 192730, "epoch": 1592} {"train_loss": -42.29615020751953, "global_step": 192731, "epoch": 1592} {"train_loss": -42.648555755615234, "global_step": 192732, "epoch": 1592} {"train_loss": -42.25806427001953, "global_step": 192733, "epoch": 1592} {"train_loss": -42.082210540771484, "global_step": 192734, "epoch": 1592} {"train_loss": -42.614070892333984, "global_step": 192735, "epoch": 1592} {"train_loss": -42.23984909057617, "global_step": 192736, "epoch": 1592} {"train_loss": -42.4579963684082, "global_step": 192737, "epoch": 1592} {"train_loss": -42.06133270263672, "global_step": 192738, "epoch": 1592} {"train_loss": -42.53887176513672, "global_step": 192739, "epoch": 1592} {"train_loss": -42.65497589111328, "global_step": 192740, "epoch": 1592} {"train_loss": -42.532501220703125, "global_step": 192741, "epoch": 1592} {"train_loss": -42.616939544677734, "global_step": 192742, "epoch": 1592} {"train_loss": -42.458473205566406, "global_step": 192743, "epoch": 1592} {"train_loss": -42.71725082397461, "global_step": 192744, "epoch": 1592} {"train_loss": -42.42025375366211, "global_step": 192745, "epoch": 1592} {"train_loss": -42.684234619140625, "global_step": 192746, "epoch": 1592} {"train_loss": -42.27155685424805, "global_step": 192747, "epoch": 1592} {"train_loss": -42.22660446166992, "global_step": 192748, "epoch": 1592} {"train_loss": -42.55376052856445, "global_step": 192749, "epoch": 1592} {"train_loss": -42.4816780090332, "global_step": 192750, "epoch": 1592} {"train_loss": -42.86265182495117, "global_step": 192751, "epoch": 1592} {"train_loss": -40.73613972309207, "global_step": 192752, "epoch": 1592, "val_loss": 2417839.25} {"train_loss": -42.71487045288086, "global_step": 192753, "epoch": 1593} {"train_loss": -42.78626251220703, "global_step": 192754, "epoch": 1593} {"train_loss": -43.15353775024414, "global_step": 192755, "epoch": 1593} {"train_loss": -42.402687072753906, "global_step": 192756, "epoch": 1593} {"train_loss": -42.69944381713867, "global_step": 192757, "epoch": 1593} {"train_loss": -42.940223693847656, "global_step": 192758, "epoch": 1593} {"train_loss": -42.72991943359375, "global_step": 192759, "epoch": 1593} {"train_loss": -42.91107177734375, "global_step": 192760, "epoch": 1593} {"train_loss": -42.89101791381836, "global_step": 192761, "epoch": 1593} {"train_loss": -42.44532012939453, "global_step": 192762, "epoch": 1593} {"train_loss": -42.76603698730469, "global_step": 192763, "epoch": 1593} {"train_loss": -42.95064926147461, "global_step": 192764, "epoch": 1593} {"train_loss": -42.352996826171875, "global_step": 192765, "epoch": 1593} {"train_loss": -42.0106201171875, "global_step": 192766, "epoch": 1593} {"train_loss": -42.033809661865234, "global_step": 192767, "epoch": 1593} {"train_loss": -42.50020217895508, "global_step": 192768, "epoch": 1593} {"train_loss": -42.03826904296875, "global_step": 192769, "epoch": 1593} {"train_loss": -41.47764587402344, "global_step": 192770, "epoch": 1593} {"train_loss": -41.30601501464844, "global_step": 192771, "epoch": 1593} {"train_loss": -42.948875427246094, "global_step": 192772, "epoch": 1593} {"train_loss": -41.91279220581055, "global_step": 192773, "epoch": 1593} {"train_loss": -41.17463302612305, "global_step": 192774, "epoch": 1593} {"train_loss": -40.64073181152344, "global_step": 192775, "epoch": 1593} {"train_loss": -41.805259704589844, "global_step": 192776, "epoch": 1593} {"train_loss": -41.59562301635742, "global_step": 192777, "epoch": 1593} {"train_loss": -42.98225402832031, "global_step": 192778, "epoch": 1593} {"train_loss": -42.46895980834961, "global_step": 192779, "epoch": 1593} {"train_loss": -42.57529830932617, "global_step": 192780, "epoch": 1593} {"train_loss": -42.614498138427734, "global_step": 192781, "epoch": 1593} {"train_loss": -42.71147537231445, "global_step": 192782, "epoch": 1593} {"train_loss": -42.27204513549805, "global_step": 192783, "epoch": 1593} {"train_loss": -42.52687072753906, "global_step": 192784, "epoch": 1593} {"train_loss": -42.38127517700195, "global_step": 192785, "epoch": 1593} {"train_loss": -41.61669921875, "global_step": 192786, "epoch": 1593} {"train_loss": -42.67911148071289, "global_step": 192787, "epoch": 1593} {"train_loss": -42.8573112487793, "global_step": 192788, "epoch": 1593} {"train_loss": -41.851985931396484, "global_step": 192789, "epoch": 1593} {"train_loss": -42.71918869018555, "global_step": 192790, "epoch": 1593} {"train_loss": -42.28206253051758, "global_step": 192791, "epoch": 1593} {"train_loss": -40.805763244628906, "global_step": 192792, "epoch": 1593} {"train_loss": -41.670684814453125, "global_step": 192793, "epoch": 1593} {"train_loss": -42.32190704345703, "global_step": 192794, "epoch": 1593} {"train_loss": -42.17413330078125, "global_step": 192795, "epoch": 1593} {"train_loss": -42.028282165527344, "global_step": 192796, "epoch": 1593} {"train_loss": -42.459686279296875, "global_step": 192797, "epoch": 1593} {"train_loss": -42.48065948486328, "global_step": 192798, "epoch": 1593} {"train_loss": -42.80095672607422, "global_step": 192799, "epoch": 1593} {"train_loss": -42.17682647705078, "global_step": 192800, "epoch": 1593} {"train_loss": -42.452056884765625, "global_step": 192801, "epoch": 1593} {"train_loss": -42.100311279296875, "global_step": 192802, "epoch": 1593} {"train_loss": -42.414215087890625, "global_step": 192803, "epoch": 1593} {"train_loss": -42.279747009277344, "global_step": 192804, "epoch": 1593} {"train_loss": -41.81461715698242, "global_step": 192805, "epoch": 1593} {"train_loss": -42.60938262939453, "global_step": 192806, "epoch": 1593} {"train_loss": -42.1515007019043, "global_step": 192807, "epoch": 1593} {"train_loss": -41.34375, "global_step": 192808, "epoch": 1593} {"train_loss": -40.25901794433594, "global_step": 192809, "epoch": 1593} {"train_loss": -41.91465377807617, "global_step": 192810, "epoch": 1593} {"train_loss": -40.95229721069336, "global_step": 192811, "epoch": 1593} {"train_loss": -39.004310607910156, "global_step": 192812, "epoch": 1593} {"train_loss": -40.49526596069336, "global_step": 192813, "epoch": 1593} {"train_loss": -40.7205696105957, "global_step": 192814, "epoch": 1593} {"train_loss": -39.3480110168457, "global_step": 192815, "epoch": 1593} {"train_loss": -38.345985412597656, "global_step": 192816, "epoch": 1593} {"train_loss": -41.168052673339844, "global_step": 192817, "epoch": 1593} {"train_loss": -39.9259033203125, "global_step": 192818, "epoch": 1593} {"train_loss": -41.23167419433594, "global_step": 192819, "epoch": 1593} {"train_loss": -41.12605667114258, "global_step": 192820, "epoch": 1593} {"train_loss": -40.72954559326172, "global_step": 192821, "epoch": 1593} {"train_loss": -40.610595703125, "global_step": 192822, "epoch": 1593} {"train_loss": -41.31973648071289, "global_step": 192823, "epoch": 1593} {"train_loss": -41.186859130859375, "global_step": 192824, "epoch": 1593} {"train_loss": -40.959075927734375, "global_step": 192825, "epoch": 1593} {"train_loss": -40.93557357788086, "global_step": 192826, "epoch": 1593} {"train_loss": -42.270263671875, "global_step": 192827, "epoch": 1593} {"train_loss": -41.367767333984375, "global_step": 192828, "epoch": 1593} {"train_loss": -41.385589599609375, "global_step": 192829, "epoch": 1593} {"train_loss": -41.35642623901367, "global_step": 192830, "epoch": 1593} {"train_loss": -42.3463020324707, "global_step": 192831, "epoch": 1593} {"train_loss": -41.481937408447266, "global_step": 192832, "epoch": 1593} {"train_loss": -42.18435287475586, "global_step": 192833, "epoch": 1593} {"train_loss": -41.97394943237305, "global_step": 192834, "epoch": 1593} {"train_loss": -42.31887435913086, "global_step": 192835, "epoch": 1593} {"train_loss": -42.465126037597656, "global_step": 192836, "epoch": 1593} {"train_loss": -41.76284408569336, "global_step": 192837, "epoch": 1593} {"train_loss": -42.11812973022461, "global_step": 192838, "epoch": 1593} {"train_loss": -42.523841857910156, "global_step": 192839, "epoch": 1593} {"train_loss": -42.08180618286133, "global_step": 192840, "epoch": 1593} {"train_loss": -42.048805236816406, "global_step": 192841, "epoch": 1593} {"train_loss": -42.36450958251953, "global_step": 192842, "epoch": 1593} {"train_loss": -42.65776443481445, "global_step": 192843, "epoch": 1593} {"train_loss": -42.31827926635742, "global_step": 192844, "epoch": 1593} {"train_loss": -42.63450241088867, "global_step": 192845, "epoch": 1593} {"train_loss": -42.816471099853516, "global_step": 192846, "epoch": 1593} {"train_loss": -43.046260833740234, "global_step": 192847, "epoch": 1593} {"train_loss": -42.36469650268555, "global_step": 192848, "epoch": 1593} {"train_loss": -42.37664794921875, "global_step": 192849, "epoch": 1593} {"train_loss": -42.09382247924805, "global_step": 192850, "epoch": 1593} {"train_loss": -42.58503341674805, "global_step": 192851, "epoch": 1593} {"train_loss": -41.916358947753906, "global_step": 192852, "epoch": 1593} {"train_loss": -43.02717971801758, "global_step": 192853, "epoch": 1593} {"train_loss": -42.38731384277344, "global_step": 192854, "epoch": 1593} {"train_loss": -41.58233642578125, "global_step": 192855, "epoch": 1593} {"train_loss": -42.640865325927734, "global_step": 192856, "epoch": 1593} {"train_loss": -41.7648811340332, "global_step": 192857, "epoch": 1593} {"train_loss": -41.58747482299805, "global_step": 192858, "epoch": 1593} {"train_loss": -41.66992950439453, "global_step": 192859, "epoch": 1593} {"train_loss": -41.94573974609375, "global_step": 192860, "epoch": 1593} {"train_loss": -42.525638580322266, "global_step": 192861, "epoch": 1593} {"train_loss": -41.16841125488281, "global_step": 192862, "epoch": 1593} {"train_loss": -39.5999755859375, "global_step": 192863, "epoch": 1593} {"train_loss": -38.5562744140625, "global_step": 192864, "epoch": 1593} {"train_loss": -39.47090530395508, "global_step": 192865, "epoch": 1593} {"train_loss": -41.64081954956055, "global_step": 192866, "epoch": 1593} {"train_loss": -41.26924514770508, "global_step": 192867, "epoch": 1593} {"train_loss": -40.641029357910156, "global_step": 192868, "epoch": 1593} {"train_loss": -41.59445571899414, "global_step": 192869, "epoch": 1593} {"train_loss": -41.27634048461914, "global_step": 192870, "epoch": 1593} {"train_loss": -41.408424377441406, "global_step": 192871, "epoch": 1593} {"train_loss": -41.6077995300293, "global_step": 192872, "epoch": 1593} {"train_loss": -41.83293378845719, "global_step": 192873, "epoch": 1593, "val_loss": 2450701.25} {"train_loss": -39.25252914428711, "global_step": 192874, "epoch": 1594} {"train_loss": -39.911415100097656, "global_step": 192875, "epoch": 1594} {"train_loss": -41.90682601928711, "global_step": 192876, "epoch": 1594} {"train_loss": -41.773948669433594, "global_step": 192877, "epoch": 1594} {"train_loss": -41.29575729370117, "global_step": 192878, "epoch": 1594} {"train_loss": -41.136898040771484, "global_step": 192879, "epoch": 1594} {"train_loss": -42.201515197753906, "global_step": 192880, "epoch": 1594} {"train_loss": -41.41764831542969, "global_step": 192881, "epoch": 1594} {"train_loss": -42.339229583740234, "global_step": 192882, "epoch": 1594} {"train_loss": -41.15087890625, "global_step": 192883, "epoch": 1594} {"train_loss": -41.38846969604492, "global_step": 192884, "epoch": 1594} {"train_loss": -42.28717803955078, "global_step": 192885, "epoch": 1594} {"train_loss": -41.60298538208008, "global_step": 192886, "epoch": 1594} {"train_loss": -42.044063568115234, "global_step": 192887, "epoch": 1594} {"train_loss": -41.92709732055664, "global_step": 192888, "epoch": 1594} {"train_loss": -42.17716598510742, "global_step": 192889, "epoch": 1594} {"train_loss": -41.50728225708008, "global_step": 192890, "epoch": 1594} {"train_loss": -42.491485595703125, "global_step": 192891, "epoch": 1594} {"train_loss": -41.340179443359375, "global_step": 192892, "epoch": 1594} {"train_loss": -41.91706848144531, "global_step": 192893, "epoch": 1594} {"train_loss": -41.08782958984375, "global_step": 192894, "epoch": 1594} {"train_loss": -40.76359176635742, "global_step": 192895, "epoch": 1594} {"train_loss": -41.69500732421875, "global_step": 192896, "epoch": 1594} {"train_loss": -40.64567565917969, "global_step": 192897, "epoch": 1594} {"train_loss": -42.10799789428711, "global_step": 192898, "epoch": 1594} {"train_loss": -40.66946029663086, "global_step": 192899, "epoch": 1594} {"train_loss": -41.946712493896484, "global_step": 192900, "epoch": 1594} {"train_loss": -42.30216598510742, "global_step": 192901, "epoch": 1594} {"train_loss": -41.33244705200195, "global_step": 192902, "epoch": 1594} {"train_loss": -41.56804275512695, "global_step": 192903, "epoch": 1594} {"train_loss": -41.62714385986328, "global_step": 192904, "epoch": 1594} {"train_loss": -42.67332077026367, "global_step": 192905, "epoch": 1594} {"train_loss": -42.47200393676758, "global_step": 192906, "epoch": 1594} {"train_loss": -42.40498352050781, "global_step": 192907, "epoch": 1594} {"train_loss": -42.68865203857422, "global_step": 192908, "epoch": 1594} {"train_loss": -42.29311752319336, "global_step": 192909, "epoch": 1594} {"train_loss": -42.011714935302734, "global_step": 192910, "epoch": 1594} {"train_loss": -42.078277587890625, "global_step": 192911, "epoch": 1594} {"train_loss": -42.46492385864258, "global_step": 192912, "epoch": 1594} {"train_loss": -42.01113510131836, "global_step": 192913, "epoch": 1594} {"train_loss": -42.41789627075195, "global_step": 192914, "epoch": 1594} {"train_loss": -42.444515228271484, "global_step": 192915, "epoch": 1594} {"train_loss": -42.719173431396484, "global_step": 192916, "epoch": 1594} {"train_loss": -42.37944412231445, "global_step": 192917, "epoch": 1594} {"train_loss": -42.31678009033203, "global_step": 192918, "epoch": 1594} {"train_loss": -42.45972442626953, "global_step": 192919, "epoch": 1594} {"train_loss": -42.52456283569336, "global_step": 192920, "epoch": 1594} {"train_loss": -42.573307037353516, "global_step": 192921, "epoch": 1594} {"train_loss": -43.083763122558594, "global_step": 192922, "epoch": 1594} {"train_loss": -42.81389617919922, "global_step": 192923, "epoch": 1594} {"train_loss": -42.98104476928711, "global_step": 192924, "epoch": 1594} {"train_loss": -42.715614318847656, "global_step": 192925, "epoch": 1594} {"train_loss": -42.964813232421875, "global_step": 192926, "epoch": 1594} {"train_loss": -43.13665008544922, "global_step": 192927, "epoch": 1594} {"train_loss": -43.01105880737305, "global_step": 192928, "epoch": 1594} {"train_loss": -43.19095993041992, "global_step": 192929, "epoch": 1594} {"train_loss": -43.015594482421875, "global_step": 192930, "epoch": 1594} {"train_loss": -43.085567474365234, "global_step": 192931, "epoch": 1594} {"train_loss": -43.018611907958984, "global_step": 192932, "epoch": 1594} {"train_loss": -42.4641227722168, "global_step": 192933, "epoch": 1594} {"train_loss": -43.5213623046875, "global_step": 192934, "epoch": 1594} {"train_loss": -43.0061149597168, "global_step": 192935, "epoch": 1594} {"train_loss": -42.6109733581543, "global_step": 192936, "epoch": 1594} {"train_loss": -42.66828155517578, "global_step": 192937, "epoch": 1594} {"train_loss": -43.42921829223633, "global_step": 192938, "epoch": 1594} {"train_loss": -42.87173080444336, "global_step": 192939, "epoch": 1594} {"train_loss": -42.81298828125, "global_step": 192940, "epoch": 1594} {"train_loss": -43.31839370727539, "global_step": 192941, "epoch": 1594} {"train_loss": -42.61419677734375, "global_step": 192942, "epoch": 1594} {"train_loss": -43.049171447753906, "global_step": 192943, "epoch": 1594} {"train_loss": -43.0147819519043, "global_step": 192944, "epoch": 1594} {"train_loss": -42.59377670288086, "global_step": 192945, "epoch": 1594} {"train_loss": -42.960880279541016, "global_step": 192946, "epoch": 1594} {"train_loss": -42.804931640625, "global_step": 192947, "epoch": 1594} {"train_loss": -43.124977111816406, "global_step": 192948, "epoch": 1594} {"train_loss": -43.20772171020508, "global_step": 192949, "epoch": 1594} {"train_loss": -43.0670280456543, "global_step": 192950, "epoch": 1594} {"train_loss": -42.75584030151367, "global_step": 192951, "epoch": 1594} {"train_loss": -43.26812744140625, "global_step": 192952, "epoch": 1594} {"train_loss": -42.88887405395508, "global_step": 192953, "epoch": 1594} {"train_loss": -42.35322952270508, "global_step": 192954, "epoch": 1594} {"train_loss": -43.157955169677734, "global_step": 192955, "epoch": 1594} {"train_loss": -41.380733489990234, "global_step": 192956, "epoch": 1594} {"train_loss": -39.1173210144043, "global_step": 192957, "epoch": 1594} {"train_loss": -40.80116653442383, "global_step": 192958, "epoch": 1594} {"train_loss": -40.51673126220703, "global_step": 192959, "epoch": 1594} {"train_loss": -40.76859664916992, "global_step": 192960, "epoch": 1594} {"train_loss": -41.840065002441406, "global_step": 192961, "epoch": 1594} {"train_loss": -41.96891403198242, "global_step": 192962, "epoch": 1594} {"train_loss": -39.683372497558594, "global_step": 192963, "epoch": 1594} {"train_loss": -38.77656555175781, "global_step": 192964, "epoch": 1594} {"train_loss": -40.440433502197266, "global_step": 192965, "epoch": 1594} {"train_loss": -37.824134826660156, "global_step": 192966, "epoch": 1594} {"train_loss": -37.365264892578125, "global_step": 192967, "epoch": 1594} {"train_loss": -40.1046257019043, "global_step": 192968, "epoch": 1594} {"train_loss": -40.004207611083984, "global_step": 192969, "epoch": 1594} {"train_loss": -40.865142822265625, "global_step": 192970, "epoch": 1594} {"train_loss": -41.35248565673828, "global_step": 192971, "epoch": 1594} {"train_loss": -41.37850570678711, "global_step": 192972, "epoch": 1594} {"train_loss": -40.851985931396484, "global_step": 192973, "epoch": 1594} {"train_loss": -39.932167053222656, "global_step": 192974, "epoch": 1594} {"train_loss": -40.75825119018555, "global_step": 192975, "epoch": 1594} {"train_loss": -41.63817596435547, "global_step": 192976, "epoch": 1594} {"train_loss": -40.459136962890625, "global_step": 192977, "epoch": 1594} {"train_loss": -41.22283935546875, "global_step": 192978, "epoch": 1594} {"train_loss": -40.97309494018555, "global_step": 192979, "epoch": 1594} {"train_loss": -40.41782760620117, "global_step": 192980, "epoch": 1594} {"train_loss": -41.88064956665039, "global_step": 192981, "epoch": 1594} {"train_loss": -41.54303741455078, "global_step": 192982, "epoch": 1594} {"train_loss": -40.08122634887695, "global_step": 192983, "epoch": 1594} {"train_loss": -42.007484436035156, "global_step": 192984, "epoch": 1594} {"train_loss": -41.07809829711914, "global_step": 192985, "epoch": 1594} {"train_loss": -41.205692291259766, "global_step": 192986, "epoch": 1594} {"train_loss": -40.9571418762207, "global_step": 192987, "epoch": 1594} {"train_loss": -41.91564178466797, "global_step": 192988, "epoch": 1594} {"train_loss": -40.97209548950195, "global_step": 192989, "epoch": 1594} {"train_loss": -41.585205078125, "global_step": 192990, "epoch": 1594} {"train_loss": -41.78889083862305, "global_step": 192991, "epoch": 1594} {"train_loss": -41.886837005615234, "global_step": 192992, "epoch": 1594} {"train_loss": -42.173439025878906, "global_step": 192993, "epoch": 1594} {"train_loss": -41.816120872812824, "global_step": 192994, "epoch": 1594, "val_loss": 2462781.25} {"train_loss": -41.987457275390625, "global_step": 192995, "epoch": 1595} {"train_loss": -41.37526321411133, "global_step": 192996, "epoch": 1595} {"train_loss": -42.349830627441406, "global_step": 192997, "epoch": 1595} {"train_loss": -41.6131706237793, "global_step": 192998, "epoch": 1595} {"train_loss": -42.57441329956055, "global_step": 192999, "epoch": 1595} {"train_loss": -41.606319427490234, "global_step": 193000, "epoch": 1595} {"train_loss": -41.78534698486328, "global_step": 193001, "epoch": 1595} {"train_loss": -42.641605377197266, "global_step": 193002, "epoch": 1595} {"train_loss": -42.36024856567383, "global_step": 193003, "epoch": 1595} {"train_loss": -42.389320373535156, "global_step": 193004, "epoch": 1595} {"train_loss": -41.73208236694336, "global_step": 193005, "epoch": 1595} {"train_loss": -42.25114059448242, "global_step": 193006, "epoch": 1595} {"train_loss": -41.16522216796875, "global_step": 193007, "epoch": 1595} {"train_loss": -42.72001266479492, "global_step": 193008, "epoch": 1595} {"train_loss": -41.23353958129883, "global_step": 193009, "epoch": 1595} {"train_loss": -42.53691101074219, "global_step": 193010, "epoch": 1595} {"train_loss": -41.62030029296875, "global_step": 193011, "epoch": 1595} {"train_loss": -41.79130935668945, "global_step": 193012, "epoch": 1595} {"train_loss": -42.46119689941406, "global_step": 193013, "epoch": 1595} {"train_loss": -41.356536865234375, "global_step": 193014, "epoch": 1595} {"train_loss": -42.506256103515625, "global_step": 193015, "epoch": 1595} {"train_loss": -42.57750701904297, "global_step": 193016, "epoch": 1595} {"train_loss": -42.490447998046875, "global_step": 193017, "epoch": 1595} {"train_loss": -42.09699249267578, "global_step": 193018, "epoch": 1595} {"train_loss": -41.72591018676758, "global_step": 193019, "epoch": 1595} {"train_loss": -42.443172454833984, "global_step": 193020, "epoch": 1595} {"train_loss": -42.16404342651367, "global_step": 193021, "epoch": 1595} {"train_loss": -42.74860763549805, "global_step": 193022, "epoch": 1595} {"train_loss": -42.872032165527344, "global_step": 193023, "epoch": 1595} {"train_loss": -42.29376983642578, "global_step": 193024, "epoch": 1595} {"train_loss": -42.94123458862305, "global_step": 193025, "epoch": 1595} {"train_loss": -42.69858932495117, "global_step": 193026, "epoch": 1595} {"train_loss": -42.13135528564453, "global_step": 193027, "epoch": 1595} {"train_loss": -42.5022087097168, "global_step": 193028, "epoch": 1595} {"train_loss": -42.43259811401367, "global_step": 193029, "epoch": 1595} {"train_loss": -42.30487060546875, "global_step": 193030, "epoch": 1595} {"train_loss": -42.07529830932617, "global_step": 193031, "epoch": 1595} {"train_loss": -41.26974105834961, "global_step": 193032, "epoch": 1595} {"train_loss": -43.03251647949219, "global_step": 193033, "epoch": 1595} {"train_loss": -41.367061614990234, "global_step": 193034, "epoch": 1595} {"train_loss": -41.86175537109375, "global_step": 193035, "epoch": 1595} {"train_loss": -42.89645004272461, "global_step": 193036, "epoch": 1595} {"train_loss": -42.4203987121582, "global_step": 193037, "epoch": 1595} {"train_loss": -42.92757034301758, "global_step": 193038, "epoch": 1595} {"train_loss": -42.63407516479492, "global_step": 193039, "epoch": 1595} {"train_loss": -42.637447357177734, "global_step": 193040, "epoch": 1595} {"train_loss": -42.29879379272461, "global_step": 193041, "epoch": 1595} {"train_loss": -41.8416748046875, "global_step": 193042, "epoch": 1595} {"train_loss": -41.494544982910156, "global_step": 193043, "epoch": 1595} {"train_loss": -41.123023986816406, "global_step": 193044, "epoch": 1595} {"train_loss": -42.346473693847656, "global_step": 193045, "epoch": 1595} {"train_loss": -42.65102767944336, "global_step": 193046, "epoch": 1595} {"train_loss": -39.757110595703125, "global_step": 193047, "epoch": 1595} {"train_loss": -37.70065689086914, "global_step": 193048, "epoch": 1595} {"train_loss": -40.88203811645508, "global_step": 193049, "epoch": 1595} {"train_loss": -41.51093673706055, "global_step": 193050, "epoch": 1595} {"train_loss": -39.36567306518555, "global_step": 193051, "epoch": 1595} {"train_loss": -39.74372482299805, "global_step": 193052, "epoch": 1595} {"train_loss": -41.01580047607422, "global_step": 193053, "epoch": 1595} {"train_loss": -41.4047737121582, "global_step": 193054, "epoch": 1595} {"train_loss": -38.61699295043945, "global_step": 193055, "epoch": 1595} {"train_loss": -36.523067474365234, "global_step": 193056, "epoch": 1595} {"train_loss": -40.96025848388672, "global_step": 193057, "epoch": 1595} {"train_loss": -40.19065475463867, "global_step": 193058, "epoch": 1595} {"train_loss": -39.3194694519043, "global_step": 193059, "epoch": 1595} {"train_loss": -40.06884765625, "global_step": 193060, "epoch": 1595} {"train_loss": -40.92441940307617, "global_step": 193061, "epoch": 1595} {"train_loss": -40.85884475708008, "global_step": 193062, "epoch": 1595} {"train_loss": -38.59220504760742, "global_step": 193063, "epoch": 1595} {"train_loss": -39.4816780090332, "global_step": 193064, "epoch": 1595} {"train_loss": -40.886844635009766, "global_step": 193065, "epoch": 1595} {"train_loss": -39.66214370727539, "global_step": 193066, "epoch": 1595} {"train_loss": -40.211971282958984, "global_step": 193067, "epoch": 1595} {"train_loss": -39.93500900268555, "global_step": 193068, "epoch": 1595} {"train_loss": -41.564823150634766, "global_step": 193069, "epoch": 1595} {"train_loss": -41.09992599487305, "global_step": 193070, "epoch": 1595} {"train_loss": -40.062721252441406, "global_step": 193071, "epoch": 1595} {"train_loss": -41.847206115722656, "global_step": 193072, "epoch": 1595} {"train_loss": -41.23793411254883, "global_step": 193073, "epoch": 1595} {"train_loss": -42.00934600830078, "global_step": 193074, "epoch": 1595} {"train_loss": -40.07625961303711, "global_step": 193075, "epoch": 1595} {"train_loss": -41.523372650146484, "global_step": 193076, "epoch": 1595} {"train_loss": -41.09405517578125, "global_step": 193077, "epoch": 1595} {"train_loss": -40.98491287231445, "global_step": 193078, "epoch": 1595} {"train_loss": -41.43028259277344, "global_step": 193079, "epoch": 1595} {"train_loss": -41.180912017822266, "global_step": 193080, "epoch": 1595} {"train_loss": -41.80152130126953, "global_step": 193081, "epoch": 1595} {"train_loss": -41.60332107543945, "global_step": 193082, "epoch": 1595} {"train_loss": -42.001766204833984, "global_step": 193083, "epoch": 1595} {"train_loss": -41.462135314941406, "global_step": 193084, "epoch": 1595} {"train_loss": -41.96084976196289, "global_step": 193085, "epoch": 1595} {"train_loss": -41.16496658325195, "global_step": 193086, "epoch": 1595} {"train_loss": -41.68109130859375, "global_step": 193087, "epoch": 1595} {"train_loss": -41.81120681762695, "global_step": 193088, "epoch": 1595} {"train_loss": -42.31647872924805, "global_step": 193089, "epoch": 1595} {"train_loss": -42.54572296142578, "global_step": 193090, "epoch": 1595} {"train_loss": -41.82954025268555, "global_step": 193091, "epoch": 1595} {"train_loss": -42.563819885253906, "global_step": 193092, "epoch": 1595} {"train_loss": -42.340972900390625, "global_step": 193093, "epoch": 1595} {"train_loss": -42.57168197631836, "global_step": 193094, "epoch": 1595} {"train_loss": -42.52295684814453, "global_step": 193095, "epoch": 1595} {"train_loss": -42.70414733886719, "global_step": 193096, "epoch": 1595} {"train_loss": -42.443416595458984, "global_step": 193097, "epoch": 1595} {"train_loss": -42.520835876464844, "global_step": 193098, "epoch": 1595} {"train_loss": -42.884273529052734, "global_step": 193099, "epoch": 1595} {"train_loss": -42.54325485229492, "global_step": 193100, "epoch": 1595} {"train_loss": -42.46748733520508, "global_step": 193101, "epoch": 1595} {"train_loss": -42.77922439575195, "global_step": 193102, "epoch": 1595} {"train_loss": -42.95624542236328, "global_step": 193103, "epoch": 1595} {"train_loss": -42.83207702636719, "global_step": 193104, "epoch": 1595} {"train_loss": -42.65714645385742, "global_step": 193105, "epoch": 1595} {"train_loss": -42.7113037109375, "global_step": 193106, "epoch": 1595} {"train_loss": -42.883338928222656, "global_step": 193107, "epoch": 1595} {"train_loss": -42.22330856323242, "global_step": 193108, "epoch": 1595} {"train_loss": -42.898921966552734, "global_step": 193109, "epoch": 1595} {"train_loss": -42.938899993896484, "global_step": 193110, "epoch": 1595} {"train_loss": -42.82991409301758, "global_step": 193111, "epoch": 1595} {"train_loss": -42.81416320800781, "global_step": 193112, "epoch": 1595} {"train_loss": -43.168792724609375, "global_step": 193113, "epoch": 1595} {"train_loss": -42.67620849609375, "global_step": 193114, "epoch": 1595} {"train_loss": -41.73534995465239, "global_step": 193115, "epoch": 1595, "val_loss": 2581315.0} {"train_loss": -43.091617584228516, "global_step": 193116, "epoch": 1596} {"train_loss": -42.849952697753906, "global_step": 193117, "epoch": 1596} {"train_loss": -43.066627502441406, "global_step": 193118, "epoch": 1596} {"train_loss": -42.56271743774414, "global_step": 193119, "epoch": 1596} {"train_loss": -34.3382453918457, "global_step": 193120, "epoch": 1596} {"train_loss": -43.061805725097656, "global_step": 193121, "epoch": 1596} {"train_loss": -42.65617752075195, "global_step": 193122, "epoch": 1596} {"train_loss": -42.92403030395508, "global_step": 193123, "epoch": 1596} {"train_loss": -35.51438522338867, "global_step": 193124, "epoch": 1596} {"train_loss": -42.27325439453125, "global_step": 193125, "epoch": 1596} {"train_loss": -42.303924560546875, "global_step": 193126, "epoch": 1596} {"train_loss": -42.342411041259766, "global_step": 193127, "epoch": 1596} {"train_loss": -42.87285614013672, "global_step": 193128, "epoch": 1596} {"train_loss": -42.58087158203125, "global_step": 193129, "epoch": 1596} {"train_loss": -41.60841751098633, "global_step": 193130, "epoch": 1596} {"train_loss": -42.29865264892578, "global_step": 193131, "epoch": 1596} {"train_loss": -42.92034149169922, "global_step": 193132, "epoch": 1596} {"train_loss": -42.547882080078125, "global_step": 193133, "epoch": 1596} {"train_loss": -42.96091842651367, "global_step": 193134, "epoch": 1596} {"train_loss": -42.989009857177734, "global_step": 193135, "epoch": 1596} {"train_loss": -42.7338752746582, "global_step": 193136, "epoch": 1596} {"train_loss": -42.283321380615234, "global_step": 193137, "epoch": 1596} {"train_loss": -42.92578887939453, "global_step": 193138, "epoch": 1596} {"train_loss": -41.5289192199707, "global_step": 193139, "epoch": 1596} {"train_loss": -41.71807861328125, "global_step": 193140, "epoch": 1596} {"train_loss": -42.474021911621094, "global_step": 193141, "epoch": 1596} {"train_loss": -42.859893798828125, "global_step": 193142, "epoch": 1596} {"train_loss": -41.87616729736328, "global_step": 193143, "epoch": 1596} {"train_loss": -39.496707916259766, "global_step": 193144, "epoch": 1596} {"train_loss": -40.961524963378906, "global_step": 193145, "epoch": 1596} {"train_loss": -40.134735107421875, "global_step": 193146, "epoch": 1596} {"train_loss": -40.84489822387695, "global_step": 193147, "epoch": 1596} {"train_loss": -38.3707389831543, "global_step": 193148, "epoch": 1596} {"train_loss": -39.192867279052734, "global_step": 193149, "epoch": 1596} {"train_loss": -40.4373779296875, "global_step": 193150, "epoch": 1596} {"train_loss": -40.54397201538086, "global_step": 193151, "epoch": 1596} {"train_loss": -41.9578971862793, "global_step": 193152, "epoch": 1596} {"train_loss": -40.052738189697266, "global_step": 193153, "epoch": 1596} {"train_loss": -40.84672164916992, "global_step": 193154, "epoch": 1596} {"train_loss": -40.2684211730957, "global_step": 193155, "epoch": 1596} {"train_loss": -40.72085952758789, "global_step": 193156, "epoch": 1596} {"train_loss": -40.40993881225586, "global_step": 193157, "epoch": 1596} {"train_loss": -41.53657150268555, "global_step": 193158, "epoch": 1596} {"train_loss": -40.909332275390625, "global_step": 193159, "epoch": 1596} {"train_loss": -41.886016845703125, "global_step": 193160, "epoch": 1596} {"train_loss": -40.57860565185547, "global_step": 193161, "epoch": 1596} {"train_loss": -39.102394104003906, "global_step": 193162, "epoch": 1596} {"train_loss": -42.063724517822266, "global_step": 193163, "epoch": 1596} {"train_loss": -40.89802169799805, "global_step": 193164, "epoch": 1596} {"train_loss": -41.56214904785156, "global_step": 193165, "epoch": 1596} {"train_loss": -42.02398681640625, "global_step": 193166, "epoch": 1596} {"train_loss": -41.842254638671875, "global_step": 193167, "epoch": 1596} {"train_loss": -40.98765182495117, "global_step": 193168, "epoch": 1596} {"train_loss": -41.59746170043945, "global_step": 193169, "epoch": 1596} {"train_loss": -42.29368209838867, "global_step": 193170, "epoch": 1596} {"train_loss": -40.508941650390625, "global_step": 193171, "epoch": 1596} {"train_loss": -41.0622444152832, "global_step": 193172, "epoch": 1596} {"train_loss": -41.48579025268555, "global_step": 193173, "epoch": 1596} {"train_loss": -41.998714447021484, "global_step": 193174, "epoch": 1596} {"train_loss": -42.25039291381836, "global_step": 193175, "epoch": 1596} {"train_loss": -41.0561637878418, "global_step": 193176, "epoch": 1596} {"train_loss": -41.74860763549805, "global_step": 193177, "epoch": 1596} {"train_loss": -42.329078674316406, "global_step": 193178, "epoch": 1596} {"train_loss": -41.88694763183594, "global_step": 193179, "epoch": 1596} {"train_loss": -41.44989013671875, "global_step": 193180, "epoch": 1596} {"train_loss": -42.099788665771484, "global_step": 193181, "epoch": 1596} {"train_loss": -41.933860778808594, "global_step": 193182, "epoch": 1596} {"train_loss": -42.14704132080078, "global_step": 193183, "epoch": 1596} {"train_loss": -42.55482864379883, "global_step": 193184, "epoch": 1596} {"train_loss": -42.041419982910156, "global_step": 193185, "epoch": 1596} {"train_loss": -41.03740310668945, "global_step": 193186, "epoch": 1596} {"train_loss": -42.516788482666016, "global_step": 193187, "epoch": 1596} {"train_loss": -41.585540771484375, "global_step": 193188, "epoch": 1596} {"train_loss": -41.23408126831055, "global_step": 193189, "epoch": 1596} {"train_loss": -42.34684753417969, "global_step": 193190, "epoch": 1596} {"train_loss": -42.69279479980469, "global_step": 193191, "epoch": 1596} {"train_loss": -42.48789596557617, "global_step": 193192, "epoch": 1596} {"train_loss": -41.25483322143555, "global_step": 193193, "epoch": 1596} {"train_loss": -43.08112716674805, "global_step": 193194, "epoch": 1596} {"train_loss": -41.04865646362305, "global_step": 193195, "epoch": 1596} {"train_loss": -42.20689010620117, "global_step": 193196, "epoch": 1596} {"train_loss": -42.254207611083984, "global_step": 193197, "epoch": 1596} {"train_loss": -41.098209381103516, "global_step": 193198, "epoch": 1596} {"train_loss": -42.453243255615234, "global_step": 193199, "epoch": 1596} {"train_loss": -41.77138900756836, "global_step": 193200, "epoch": 1596} {"train_loss": -41.38314437866211, "global_step": 193201, "epoch": 1596} {"train_loss": -42.30365753173828, "global_step": 193202, "epoch": 1596} {"train_loss": -41.78646469116211, "global_step": 193203, "epoch": 1596} {"train_loss": -41.64801025390625, "global_step": 193204, "epoch": 1596} {"train_loss": -42.61176681518555, "global_step": 193205, "epoch": 1596} {"train_loss": -42.00318145751953, "global_step": 193206, "epoch": 1596} {"train_loss": -42.04243850708008, "global_step": 193207, "epoch": 1596} {"train_loss": -41.05317306518555, "global_step": 193208, "epoch": 1596} {"train_loss": -42.26322937011719, "global_step": 193209, "epoch": 1596} {"train_loss": -41.1563835144043, "global_step": 193210, "epoch": 1596} {"train_loss": -41.94398498535156, "global_step": 193211, "epoch": 1596} {"train_loss": -41.51058578491211, "global_step": 193212, "epoch": 1596} {"train_loss": -41.94182205200195, "global_step": 193213, "epoch": 1596} {"train_loss": -41.43747329711914, "global_step": 193214, "epoch": 1596} {"train_loss": -41.50425338745117, "global_step": 193215, "epoch": 1596} {"train_loss": -41.00954818725586, "global_step": 193216, "epoch": 1596} {"train_loss": -39.91659164428711, "global_step": 193217, "epoch": 1596} {"train_loss": -41.04810333251953, "global_step": 193218, "epoch": 1596} {"train_loss": -40.34774398803711, "global_step": 193219, "epoch": 1596} {"train_loss": -41.86198043823242, "global_step": 193220, "epoch": 1596} {"train_loss": -41.23711013793945, "global_step": 193221, "epoch": 1596} {"train_loss": -41.154632568359375, "global_step": 193222, "epoch": 1596} {"train_loss": -40.99526596069336, "global_step": 193223, "epoch": 1596} {"train_loss": -40.8528938293457, "global_step": 193224, "epoch": 1596} {"train_loss": -41.0742073059082, "global_step": 193225, "epoch": 1596} {"train_loss": -41.735530853271484, "global_step": 193226, "epoch": 1596} {"train_loss": -41.876129150390625, "global_step": 193227, "epoch": 1596} {"train_loss": -40.8852653503418, "global_step": 193228, "epoch": 1596} {"train_loss": -39.936431884765625, "global_step": 193229, "epoch": 1596} {"train_loss": -39.58098220825195, "global_step": 193230, "epoch": 1596} {"train_loss": -41.52647018432617, "global_step": 193231, "epoch": 1596} {"train_loss": -41.16468048095703, "global_step": 193232, "epoch": 1596} {"train_loss": -38.33966064453125, "global_step": 193233, "epoch": 1596} {"train_loss": -41.2805061340332, "global_step": 193234, "epoch": 1596} {"train_loss": -40.79803466796875, "global_step": 193235, "epoch": 1596} {"train_loss": -41.45927000439857, "global_step": 193236, "epoch": 1596, "val_loss": 2549204.75} {"train_loss": -39.53372573852539, "global_step": 193237, "epoch": 1597} {"train_loss": -41.837440490722656, "global_step": 193238, "epoch": 1597} {"train_loss": -41.06689453125, "global_step": 193239, "epoch": 1597} {"train_loss": -39.06724166870117, "global_step": 193240, "epoch": 1597} {"train_loss": -41.43482208251953, "global_step": 193241, "epoch": 1597} {"train_loss": -41.499298095703125, "global_step": 193242, "epoch": 1597} {"train_loss": -40.855751037597656, "global_step": 193243, "epoch": 1597} {"train_loss": -41.47773742675781, "global_step": 193244, "epoch": 1597} {"train_loss": -41.32715606689453, "global_step": 193245, "epoch": 1597} {"train_loss": -41.5623893737793, "global_step": 193246, "epoch": 1597} {"train_loss": -41.36167526245117, "global_step": 193247, "epoch": 1597} {"train_loss": -40.96356964111328, "global_step": 193248, "epoch": 1597} {"train_loss": -40.5675163269043, "global_step": 193249, "epoch": 1597} {"train_loss": -42.09339141845703, "global_step": 193250, "epoch": 1597} {"train_loss": -41.77151107788086, "global_step": 193251, "epoch": 1597} {"train_loss": -42.24146270751953, "global_step": 193252, "epoch": 1597} {"train_loss": -42.22251892089844, "global_step": 193253, "epoch": 1597} {"train_loss": -41.798187255859375, "global_step": 193254, "epoch": 1597} {"train_loss": -41.81913375854492, "global_step": 193255, "epoch": 1597} {"train_loss": -41.5463981628418, "global_step": 193256, "epoch": 1597} {"train_loss": -40.354610443115234, "global_step": 193257, "epoch": 1597} {"train_loss": -42.32693099975586, "global_step": 193258, "epoch": 1597} {"train_loss": -42.424964904785156, "global_step": 193259, "epoch": 1597} {"train_loss": -42.26557159423828, "global_step": 193260, "epoch": 1597} {"train_loss": -41.117916107177734, "global_step": 193261, "epoch": 1597} {"train_loss": -41.69366455078125, "global_step": 193262, "epoch": 1597} {"train_loss": -42.19239807128906, "global_step": 193263, "epoch": 1597} {"train_loss": -42.070125579833984, "global_step": 193264, "epoch": 1597} {"train_loss": -41.294124603271484, "global_step": 193265, "epoch": 1597} {"train_loss": -42.2957763671875, "global_step": 193266, "epoch": 1597} {"train_loss": -41.30254364013672, "global_step": 193267, "epoch": 1597} {"train_loss": -42.67075729370117, "global_step": 193268, "epoch": 1597} {"train_loss": -41.71323776245117, "global_step": 193269, "epoch": 1597} {"train_loss": -41.251731872558594, "global_step": 193270, "epoch": 1597} {"train_loss": -42.636322021484375, "global_step": 193271, "epoch": 1597} {"train_loss": -41.24432373046875, "global_step": 193272, "epoch": 1597} {"train_loss": -39.37373733520508, "global_step": 193273, "epoch": 1597} {"train_loss": -39.78690719604492, "global_step": 193274, "epoch": 1597} {"train_loss": -41.963287353515625, "global_step": 193275, "epoch": 1597} {"train_loss": -40.421592712402344, "global_step": 193276, "epoch": 1597} {"train_loss": -41.28876876831055, "global_step": 193277, "epoch": 1597} {"train_loss": -42.15062713623047, "global_step": 193278, "epoch": 1597} {"train_loss": -39.623409271240234, "global_step": 193279, "epoch": 1597} {"train_loss": -41.207515716552734, "global_step": 193280, "epoch": 1597} {"train_loss": -42.131656646728516, "global_step": 193281, "epoch": 1597} {"train_loss": -40.226341247558594, "global_step": 193282, "epoch": 1597} {"train_loss": -41.286888122558594, "global_step": 193283, "epoch": 1597} {"train_loss": -42.067626953125, "global_step": 193284, "epoch": 1597} {"train_loss": -40.0008659362793, "global_step": 193285, "epoch": 1597} {"train_loss": -41.37350082397461, "global_step": 193286, "epoch": 1597} {"train_loss": -39.44142150878906, "global_step": 193287, "epoch": 1597} {"train_loss": -41.76497268676758, "global_step": 193288, "epoch": 1597} {"train_loss": -41.14287185668945, "global_step": 193289, "epoch": 1597} {"train_loss": -40.61669158935547, "global_step": 193290, "epoch": 1597} {"train_loss": -41.474037170410156, "global_step": 193291, "epoch": 1597} {"train_loss": -41.19466781616211, "global_step": 193292, "epoch": 1597} {"train_loss": -40.814613342285156, "global_step": 193293, "epoch": 1597} {"train_loss": -41.39521026611328, "global_step": 193294, "epoch": 1597} {"train_loss": -42.19448471069336, "global_step": 193295, "epoch": 1597} {"train_loss": -41.6695556640625, "global_step": 193296, "epoch": 1597} {"train_loss": -42.20265579223633, "global_step": 193297, "epoch": 1597} {"train_loss": -41.62473678588867, "global_step": 193298, "epoch": 1597} {"train_loss": -41.4201774597168, "global_step": 193299, "epoch": 1597} {"train_loss": -41.578460693359375, "global_step": 193300, "epoch": 1597} {"train_loss": -42.21116256713867, "global_step": 193301, "epoch": 1597} {"train_loss": -41.918975830078125, "global_step": 193302, "epoch": 1597} {"train_loss": -42.07035827636719, "global_step": 193303, "epoch": 1597} {"train_loss": -41.528987884521484, "global_step": 193304, "epoch": 1597} {"train_loss": -42.08180618286133, "global_step": 193305, "epoch": 1597} {"train_loss": -41.64938735961914, "global_step": 193306, "epoch": 1597} {"train_loss": -41.82096481323242, "global_step": 193307, "epoch": 1597} {"train_loss": -42.45540237426758, "global_step": 193308, "epoch": 1597} {"train_loss": -41.74564743041992, "global_step": 193309, "epoch": 1597} {"train_loss": -41.181697845458984, "global_step": 193310, "epoch": 1597} {"train_loss": -40.85380172729492, "global_step": 193311, "epoch": 1597} {"train_loss": -40.69732666015625, "global_step": 193312, "epoch": 1597} {"train_loss": -42.61187744140625, "global_step": 193313, "epoch": 1597} {"train_loss": -41.20466995239258, "global_step": 193314, "epoch": 1597} {"train_loss": -42.15999221801758, "global_step": 193315, "epoch": 1597} {"train_loss": -41.767398834228516, "global_step": 193316, "epoch": 1597} {"train_loss": -42.691650390625, "global_step": 193317, "epoch": 1597} {"train_loss": -41.180110931396484, "global_step": 193318, "epoch": 1597} {"train_loss": -43.08240509033203, "global_step": 193319, "epoch": 1597} {"train_loss": -40.80989456176758, "global_step": 193320, "epoch": 1597} {"train_loss": -42.39242172241211, "global_step": 193321, "epoch": 1597} {"train_loss": -40.74690628051758, "global_step": 193322, "epoch": 1597} {"train_loss": -42.45695114135742, "global_step": 193323, "epoch": 1597} {"train_loss": -41.0960807800293, "global_step": 193324, "epoch": 1597} {"train_loss": -42.14031982421875, "global_step": 193325, "epoch": 1597} {"train_loss": -42.07246780395508, "global_step": 193326, "epoch": 1597} {"train_loss": -42.6894645690918, "global_step": 193327, "epoch": 1597} {"train_loss": -41.21504211425781, "global_step": 193328, "epoch": 1597} {"train_loss": -42.86172103881836, "global_step": 193329, "epoch": 1597} {"train_loss": -41.42197799682617, "global_step": 193330, "epoch": 1597} {"train_loss": -42.587520599365234, "global_step": 193331, "epoch": 1597} {"train_loss": -42.360069274902344, "global_step": 193332, "epoch": 1597} {"train_loss": -41.655391693115234, "global_step": 193333, "epoch": 1597} {"train_loss": -42.74574661254883, "global_step": 193334, "epoch": 1597} {"train_loss": -40.45036315917969, "global_step": 193335, "epoch": 1597} {"train_loss": -42.37046432495117, "global_step": 193336, "epoch": 1597} {"train_loss": -33.8641242980957, "global_step": 193337, "epoch": 1597} {"train_loss": -42.507320404052734, "global_step": 193338, "epoch": 1597} {"train_loss": -41.862823486328125, "global_step": 193339, "epoch": 1597} {"train_loss": -42.351722717285156, "global_step": 193340, "epoch": 1597} {"train_loss": -40.91938018798828, "global_step": 193341, "epoch": 1597} {"train_loss": -41.8875617980957, "global_step": 193342, "epoch": 1597} {"train_loss": -41.77093505859375, "global_step": 193343, "epoch": 1597} {"train_loss": -40.649993896484375, "global_step": 193344, "epoch": 1597} {"train_loss": -37.75448989868164, "global_step": 193345, "epoch": 1597} {"train_loss": -34.19877243041992, "global_step": 193346, "epoch": 1597} {"train_loss": -41.787681579589844, "global_step": 193347, "epoch": 1597} {"train_loss": -37.3868293762207, "global_step": 193348, "epoch": 1597} {"train_loss": -36.392189025878906, "global_step": 193349, "epoch": 1597} {"train_loss": -39.800113677978516, "global_step": 193350, "epoch": 1597} {"train_loss": -31.711624145507812, "global_step": 193351, "epoch": 1597} {"train_loss": -32.93976593017578, "global_step": 193352, "epoch": 1597} {"train_loss": -33.11446762084961, "global_step": 193353, "epoch": 1597} {"train_loss": -38.80768966674805, "global_step": 193354, "epoch": 1597} {"train_loss": -34.821380615234375, "global_step": 193355, "epoch": 1597} {"train_loss": -36.698001861572266, "global_step": 193356, "epoch": 1597} {"train_loss": -40.91533887878922, "global_step": 193357, "epoch": 1597, "val_loss": 2464181.75} {"train_loss": -38.941410064697266, "global_step": 193358, "epoch": 1598} {"train_loss": -34.4013786315918, "global_step": 193359, "epoch": 1598} {"train_loss": -40.6767692565918, "global_step": 193360, "epoch": 1598} {"train_loss": -39.558284759521484, "global_step": 193361, "epoch": 1598} {"train_loss": -39.27347946166992, "global_step": 193362, "epoch": 1598} {"train_loss": -40.36094284057617, "global_step": 193363, "epoch": 1598} {"train_loss": -39.992774963378906, "global_step": 193364, "epoch": 1598} {"train_loss": -40.200469970703125, "global_step": 193365, "epoch": 1598} {"train_loss": -39.613128662109375, "global_step": 193366, "epoch": 1598} {"train_loss": -38.690547943115234, "global_step": 193367, "epoch": 1598} {"train_loss": -40.92902374267578, "global_step": 193368, "epoch": 1598} {"train_loss": -40.37441635131836, "global_step": 193369, "epoch": 1598} {"train_loss": -40.543148040771484, "global_step": 193370, "epoch": 1598} {"train_loss": -41.22683334350586, "global_step": 193371, "epoch": 1598} {"train_loss": -41.51819610595703, "global_step": 193372, "epoch": 1598} {"train_loss": -40.79872512817383, "global_step": 193373, "epoch": 1598} {"train_loss": -40.611724853515625, "global_step": 193374, "epoch": 1598} {"train_loss": -41.670570373535156, "global_step": 193375, "epoch": 1598} {"train_loss": -41.47914505004883, "global_step": 193376, "epoch": 1598} {"train_loss": -41.5472297668457, "global_step": 193377, "epoch": 1598} {"train_loss": -41.5652961730957, "global_step": 193378, "epoch": 1598} {"train_loss": -42.399967193603516, "global_step": 193379, "epoch": 1598} {"train_loss": -41.330909729003906, "global_step": 193380, "epoch": 1598} {"train_loss": -39.709774017333984, "global_step": 193381, "epoch": 1598} {"train_loss": -41.31380081176758, "global_step": 193382, "epoch": 1598} {"train_loss": -41.29362106323242, "global_step": 193383, "epoch": 1598} {"train_loss": -42.31417465209961, "global_step": 193384, "epoch": 1598} {"train_loss": -41.87785339355469, "global_step": 193385, "epoch": 1598} {"train_loss": -41.22314453125, "global_step": 193386, "epoch": 1598} {"train_loss": -42.08625030517578, "global_step": 193387, "epoch": 1598} {"train_loss": -41.49296188354492, "global_step": 193388, "epoch": 1598} {"train_loss": -40.14809036254883, "global_step": 193389, "epoch": 1598} {"train_loss": -42.018001556396484, "global_step": 193390, "epoch": 1598} {"train_loss": -41.716304779052734, "global_step": 193391, "epoch": 1598} {"train_loss": -41.30843734741211, "global_step": 193392, "epoch": 1598} {"train_loss": -42.425384521484375, "global_step": 193393, "epoch": 1598} {"train_loss": -41.72259521484375, "global_step": 193394, "epoch": 1598} {"train_loss": -42.08460235595703, "global_step": 193395, "epoch": 1598} {"train_loss": -42.056026458740234, "global_step": 193396, "epoch": 1598} {"train_loss": -41.795928955078125, "global_step": 193397, "epoch": 1598} {"train_loss": -42.170772552490234, "global_step": 193398, "epoch": 1598} {"train_loss": -42.79288864135742, "global_step": 193399, "epoch": 1598} {"train_loss": -41.807003021240234, "global_step": 193400, "epoch": 1598} {"train_loss": -42.10215377807617, "global_step": 193401, "epoch": 1598} {"train_loss": -42.02996826171875, "global_step": 193402, "epoch": 1598} {"train_loss": -42.45490646362305, "global_step": 193403, "epoch": 1598} {"train_loss": -41.050025939941406, "global_step": 193404, "epoch": 1598} {"train_loss": -42.53493881225586, "global_step": 193405, "epoch": 1598} {"train_loss": -42.22467803955078, "global_step": 193406, "epoch": 1598} {"train_loss": -42.18966293334961, "global_step": 193407, "epoch": 1598} {"train_loss": -42.04081726074219, "global_step": 193408, "epoch": 1598} {"train_loss": -42.33325958251953, "global_step": 193409, "epoch": 1598} {"train_loss": -42.26192092895508, "global_step": 193410, "epoch": 1598} {"train_loss": -42.47212219238281, "global_step": 193411, "epoch": 1598} {"train_loss": -42.3597526550293, "global_step": 193412, "epoch": 1598} {"train_loss": -42.43332290649414, "global_step": 193413, "epoch": 1598} {"train_loss": -42.2645263671875, "global_step": 193414, "epoch": 1598} {"train_loss": -42.89301300048828, "global_step": 193415, "epoch": 1598} {"train_loss": -42.55624771118164, "global_step": 193416, "epoch": 1598} {"train_loss": -41.93430709838867, "global_step": 193417, "epoch": 1598} {"train_loss": -42.68939208984375, "global_step": 193418, "epoch": 1598} {"train_loss": -41.8298454284668, "global_step": 193419, "epoch": 1598} {"train_loss": -42.745052337646484, "global_step": 193420, "epoch": 1598} {"train_loss": -42.809261322021484, "global_step": 193421, "epoch": 1598} {"train_loss": -42.52288818359375, "global_step": 193422, "epoch": 1598} {"train_loss": -42.71031188964844, "global_step": 193423, "epoch": 1598} {"train_loss": -42.84333038330078, "global_step": 193424, "epoch": 1598} {"train_loss": -42.6060905456543, "global_step": 193425, "epoch": 1598} {"train_loss": -43.170467376708984, "global_step": 193426, "epoch": 1598} {"train_loss": -42.43464279174805, "global_step": 193427, "epoch": 1598} {"train_loss": -42.53422164916992, "global_step": 193428, "epoch": 1598} {"train_loss": -42.461360931396484, "global_step": 193429, "epoch": 1598} {"train_loss": -42.4354133605957, "global_step": 193430, "epoch": 1598} {"train_loss": -42.29472351074219, "global_step": 193431, "epoch": 1598} {"train_loss": -42.61497116088867, "global_step": 193432, "epoch": 1598} {"train_loss": -42.65261459350586, "global_step": 193433, "epoch": 1598} {"train_loss": -41.741371154785156, "global_step": 193434, "epoch": 1598} {"train_loss": -41.0889778137207, "global_step": 193435, "epoch": 1598} {"train_loss": -38.699256896972656, "global_step": 193436, "epoch": 1598} {"train_loss": -37.21733856201172, "global_step": 193437, "epoch": 1598} {"train_loss": -38.68388366699219, "global_step": 193438, "epoch": 1598} {"train_loss": -41.758567810058594, "global_step": 193439, "epoch": 1598} {"train_loss": -38.452632904052734, "global_step": 193440, "epoch": 1598} {"train_loss": -35.51335525512695, "global_step": 193441, "epoch": 1598} {"train_loss": -36.194435119628906, "global_step": 193442, "epoch": 1598} {"train_loss": -37.297019958496094, "global_step": 193443, "epoch": 1598} {"train_loss": -34.95442581176758, "global_step": 193444, "epoch": 1598} {"train_loss": -35.011962890625, "global_step": 193445, "epoch": 1598} {"train_loss": -35.559364318847656, "global_step": 193446, "epoch": 1598} {"train_loss": -35.66292953491211, "global_step": 193447, "epoch": 1598} {"train_loss": -36.10005569458008, "global_step": 193448, "epoch": 1598} {"train_loss": -35.5888671875, "global_step": 193449, "epoch": 1598} {"train_loss": -37.07412338256836, "global_step": 193450, "epoch": 1598} {"train_loss": -37.27790069580078, "global_step": 193451, "epoch": 1598} {"train_loss": -36.84309005737305, "global_step": 193452, "epoch": 1598} {"train_loss": -36.751129150390625, "global_step": 193453, "epoch": 1598} {"train_loss": -38.18965148925781, "global_step": 193454, "epoch": 1598} {"train_loss": -39.928260803222656, "global_step": 193455, "epoch": 1598} {"train_loss": -40.49400329589844, "global_step": 193456, "epoch": 1598} {"train_loss": -39.11186218261719, "global_step": 193457, "epoch": 1598} {"train_loss": -39.32442092895508, "global_step": 193458, "epoch": 1598} {"train_loss": -39.652198791503906, "global_step": 193459, "epoch": 1598} {"train_loss": -39.34408950805664, "global_step": 193460, "epoch": 1598} {"train_loss": -40.78957748413086, "global_step": 193461, "epoch": 1598} {"train_loss": -38.3068962097168, "global_step": 193462, "epoch": 1598} {"train_loss": -39.9813232421875, "global_step": 193463, "epoch": 1598} {"train_loss": -39.29433822631836, "global_step": 193464, "epoch": 1598} {"train_loss": -36.70185470581055, "global_step": 193465, "epoch": 1598} {"train_loss": -40.10432052612305, "global_step": 193466, "epoch": 1598} {"train_loss": -35.11434555053711, "global_step": 193467, "epoch": 1598} {"train_loss": -35.976417541503906, "global_step": 193468, "epoch": 1598} {"train_loss": -39.310611724853516, "global_step": 193469, "epoch": 1598} {"train_loss": -35.8835563659668, "global_step": 193470, "epoch": 1598} {"train_loss": -40.34902572631836, "global_step": 193471, "epoch": 1598} {"train_loss": -37.12434005737305, "global_step": 193472, "epoch": 1598} {"train_loss": -39.4837646484375, "global_step": 193473, "epoch": 1598} {"train_loss": -38.6821403503418, "global_step": 193474, "epoch": 1598} {"train_loss": -41.30355453491211, "global_step": 193475, "epoch": 1598} {"train_loss": -38.97100830078125, "global_step": 193476, "epoch": 1598} {"train_loss": -41.082584381103516, "global_step": 193477, "epoch": 1598} {"train_loss": -40.34813204678622, "global_step": 193478, "epoch": 1598, "val_loss": 2455193.0} {"train_loss": -40.2441291809082, "global_step": 193479, "epoch": 1599} {"train_loss": -39.618282318115234, "global_step": 193480, "epoch": 1599} {"train_loss": -39.17680740356445, "global_step": 193481, "epoch": 1599} {"train_loss": -41.383766174316406, "global_step": 193482, "epoch": 1599} {"train_loss": -38.88719940185547, "global_step": 193483, "epoch": 1599} {"train_loss": -41.41086959838867, "global_step": 193484, "epoch": 1599} {"train_loss": -39.95524978637695, "global_step": 193485, "epoch": 1599} {"train_loss": -40.977394104003906, "global_step": 193486, "epoch": 1599} {"train_loss": -41.01774978637695, "global_step": 193487, "epoch": 1599} {"train_loss": -40.057334899902344, "global_step": 193488, "epoch": 1599} {"train_loss": -41.58588790893555, "global_step": 193489, "epoch": 1599} {"train_loss": -40.63507843017578, "global_step": 193490, "epoch": 1599} {"train_loss": -41.92322540283203, "global_step": 193491, "epoch": 1599} {"train_loss": -41.01182556152344, "global_step": 193492, "epoch": 1599} {"train_loss": -41.42108917236328, "global_step": 193493, "epoch": 1599} {"train_loss": -40.81920623779297, "global_step": 193494, "epoch": 1599} {"train_loss": -41.29914474487305, "global_step": 193495, "epoch": 1599} {"train_loss": -41.17668914794922, "global_step": 193496, "epoch": 1599} {"train_loss": -40.964698791503906, "global_step": 193497, "epoch": 1599} {"train_loss": -41.163936614990234, "global_step": 193498, "epoch": 1599} {"train_loss": -41.14799880981445, "global_step": 193499, "epoch": 1599} {"train_loss": -41.2470588684082, "global_step": 193500, "epoch": 1599} {"train_loss": -41.00509262084961, "global_step": 193501, "epoch": 1599} {"train_loss": -40.0848503112793, "global_step": 193502, "epoch": 1599} {"train_loss": -41.57960510253906, "global_step": 193503, "epoch": 1599} {"train_loss": -40.66400909423828, "global_step": 193504, "epoch": 1599} {"train_loss": -41.640045166015625, "global_step": 193505, "epoch": 1599} {"train_loss": -40.577327728271484, "global_step": 193506, "epoch": 1599} {"train_loss": -41.69178009033203, "global_step": 193507, "epoch": 1599} {"train_loss": -41.331214904785156, "global_step": 193508, "epoch": 1599} {"train_loss": -41.96236801147461, "global_step": 193509, "epoch": 1599} {"train_loss": -41.032047271728516, "global_step": 193510, "epoch": 1599} {"train_loss": -41.70210647583008, "global_step": 193511, "epoch": 1599} {"train_loss": -41.607730865478516, "global_step": 193512, "epoch": 1599} {"train_loss": -41.52760314941406, "global_step": 193513, "epoch": 1599} {"train_loss": -41.57880783081055, "global_step": 193514, "epoch": 1599} {"train_loss": -41.88838577270508, "global_step": 193515, "epoch": 1599} {"train_loss": -42.33822250366211, "global_step": 193516, "epoch": 1599} {"train_loss": -41.735084533691406, "global_step": 193517, "epoch": 1599} {"train_loss": -41.98176193237305, "global_step": 193518, "epoch": 1599} {"train_loss": -41.8800163269043, "global_step": 193519, "epoch": 1599} {"train_loss": -41.923919677734375, "global_step": 193520, "epoch": 1599} {"train_loss": -41.114253997802734, "global_step": 193521, "epoch": 1599} {"train_loss": -41.35802459716797, "global_step": 193522, "epoch": 1599} {"train_loss": -41.39628982543945, "global_step": 193523, "epoch": 1599} {"train_loss": -40.00507736206055, "global_step": 193524, "epoch": 1599} {"train_loss": -40.74794387817383, "global_step": 193525, "epoch": 1599} {"train_loss": -41.70368576049805, "global_step": 193526, "epoch": 1599} {"train_loss": -42.408363342285156, "global_step": 193527, "epoch": 1599} {"train_loss": -42.611934661865234, "global_step": 193528, "epoch": 1599} {"train_loss": -42.43333435058594, "global_step": 193529, "epoch": 1599} {"train_loss": -42.14249801635742, "global_step": 193530, "epoch": 1599} {"train_loss": -42.846073150634766, "global_step": 193531, "epoch": 1599} {"train_loss": -42.10039520263672, "global_step": 193532, "epoch": 1599} {"train_loss": -41.84255599975586, "global_step": 193533, "epoch": 1599} {"train_loss": -41.413658142089844, "global_step": 193534, "epoch": 1599} {"train_loss": -39.55195236206055, "global_step": 193535, "epoch": 1599} {"train_loss": -41.93076705932617, "global_step": 193536, "epoch": 1599} {"train_loss": -42.35400390625, "global_step": 193537, "epoch": 1599} {"train_loss": -42.09040451049805, "global_step": 193538, "epoch": 1599} {"train_loss": -41.0924186706543, "global_step": 193539, "epoch": 1599} {"train_loss": -40.730159759521484, "global_step": 193540, "epoch": 1599} {"train_loss": -41.29775619506836, "global_step": 193541, "epoch": 1599} {"train_loss": -42.107643127441406, "global_step": 193542, "epoch": 1599} {"train_loss": -42.55958938598633, "global_step": 193543, "epoch": 1599} {"train_loss": -42.153717041015625, "global_step": 193544, "epoch": 1599} {"train_loss": -42.27511215209961, "global_step": 193545, "epoch": 1599} {"train_loss": -42.51691436767578, "global_step": 193546, "epoch": 1599} {"train_loss": -41.64999771118164, "global_step": 193547, "epoch": 1599} {"train_loss": -42.25425338745117, "global_step": 193548, "epoch": 1599} {"train_loss": -42.55145263671875, "global_step": 193549, "epoch": 1599} {"train_loss": -42.22152328491211, "global_step": 193550, "epoch": 1599} {"train_loss": -41.9577522277832, "global_step": 193551, "epoch": 1599} {"train_loss": -41.693336486816406, "global_step": 193552, "epoch": 1599} {"train_loss": -42.402137756347656, "global_step": 193553, "epoch": 1599} {"train_loss": -42.771148681640625, "global_step": 193554, "epoch": 1599} {"train_loss": -42.22119140625, "global_step": 193555, "epoch": 1599} {"train_loss": -42.8352165222168, "global_step": 193556, "epoch": 1599} {"train_loss": -42.13691329956055, "global_step": 193557, "epoch": 1599} {"train_loss": -42.617916107177734, "global_step": 193558, "epoch": 1599} {"train_loss": -42.31051254272461, "global_step": 193559, "epoch": 1599} {"train_loss": -40.47591781616211, "global_step": 193560, "epoch": 1599} {"train_loss": -42.377967834472656, "global_step": 193561, "epoch": 1599} {"train_loss": -41.53559112548828, "global_step": 193562, "epoch": 1599} {"train_loss": -42.005855560302734, "global_step": 193563, "epoch": 1599} {"train_loss": -42.764549255371094, "global_step": 193564, "epoch": 1599} {"train_loss": -42.82272720336914, "global_step": 193565, "epoch": 1599} {"train_loss": -42.148765563964844, "global_step": 193566, "epoch": 1599} {"train_loss": -40.35026168823242, "global_step": 193567, "epoch": 1599} {"train_loss": -40.436424255371094, "global_step": 193568, "epoch": 1599} {"train_loss": -41.73427963256836, "global_step": 193569, "epoch": 1599} {"train_loss": -42.20623779296875, "global_step": 193570, "epoch": 1599} {"train_loss": -40.45383834838867, "global_step": 193571, "epoch": 1599} {"train_loss": -41.4031867980957, "global_step": 193572, "epoch": 1599} {"train_loss": -42.425079345703125, "global_step": 193573, "epoch": 1599} {"train_loss": -40.69050979614258, "global_step": 193574, "epoch": 1599} {"train_loss": -40.028175354003906, "global_step": 193575, "epoch": 1599} {"train_loss": -42.62580490112305, "global_step": 193576, "epoch": 1599} {"train_loss": -41.99561309814453, "global_step": 193577, "epoch": 1599} {"train_loss": -41.63119125366211, "global_step": 193578, "epoch": 1599} {"train_loss": -41.59841537475586, "global_step": 193579, "epoch": 1599} {"train_loss": -41.775691986083984, "global_step": 193580, "epoch": 1599} {"train_loss": -41.942054748535156, "global_step": 193581, "epoch": 1599} {"train_loss": -42.88903045654297, "global_step": 193582, "epoch": 1599} {"train_loss": -41.95134353637695, "global_step": 193583, "epoch": 1599} {"train_loss": -42.657447814941406, "global_step": 193584, "epoch": 1599} {"train_loss": -42.576133728027344, "global_step": 193585, "epoch": 1599} {"train_loss": -42.168209075927734, "global_step": 193586, "epoch": 1599} {"train_loss": -42.122093200683594, "global_step": 193587, "epoch": 1599} {"train_loss": -42.13723373413086, "global_step": 193588, "epoch": 1599} {"train_loss": -42.2785758972168, "global_step": 193589, "epoch": 1599} {"train_loss": -42.30805587768555, "global_step": 193590, "epoch": 1599} {"train_loss": -43.02012252807617, "global_step": 193591, "epoch": 1599} {"train_loss": -42.48884201049805, "global_step": 193592, "epoch": 1599} {"train_loss": -42.50929260253906, "global_step": 193593, "epoch": 1599} {"train_loss": -42.12218475341797, "global_step": 193594, "epoch": 1599} {"train_loss": -42.970611572265625, "global_step": 193595, "epoch": 1599} {"train_loss": -42.65627670288086, "global_step": 193596, "epoch": 1599} {"train_loss": -41.57844924926758, "global_step": 193597, "epoch": 1599} {"train_loss": -42.61379623413086, "global_step": 193598, "epoch": 1599} {"train_loss": -41.65340965838472, "global_step": 193599, "epoch": 1599, "val_loss": 2429831.25} {"train_loss": -42.81458282470703, "global_step": 193600, "epoch": 1600} {"train_loss": -43.38365173339844, "global_step": 193601, "epoch": 1600} {"train_loss": -42.414608001708984, "global_step": 193602, "epoch": 1600} {"train_loss": -42.879512786865234, "global_step": 193603, "epoch": 1600} {"train_loss": -41.59186553955078, "global_step": 193604, "epoch": 1600} {"train_loss": -41.56441116333008, "global_step": 193605, "epoch": 1600} {"train_loss": -41.90745162963867, "global_step": 193606, "epoch": 1600} {"train_loss": -41.60713195800781, "global_step": 193607, "epoch": 1600} {"train_loss": -41.66530227661133, "global_step": 193608, "epoch": 1600} {"train_loss": -43.091548919677734, "global_step": 193609, "epoch": 1600} {"train_loss": -42.82786178588867, "global_step": 193610, "epoch": 1600} {"train_loss": -42.57952117919922, "global_step": 193611, "epoch": 1600} {"train_loss": -41.39765548706055, "global_step": 193612, "epoch": 1600} {"train_loss": -42.69029998779297, "global_step": 193613, "epoch": 1600} {"train_loss": -42.57841873168945, "global_step": 193614, "epoch": 1600} {"train_loss": -42.78373336791992, "global_step": 193615, "epoch": 1600} {"train_loss": -42.3714599609375, "global_step": 193616, "epoch": 1600} {"train_loss": -41.991127014160156, "global_step": 193617, "epoch": 1600} {"train_loss": -42.796852111816406, "global_step": 193618, "epoch": 1600} {"train_loss": -42.65397262573242, "global_step": 193619, "epoch": 1600} {"train_loss": -41.07918930053711, "global_step": 193620, "epoch": 1600} {"train_loss": -40.443519592285156, "global_step": 193621, "epoch": 1600} {"train_loss": -39.332881927490234, "global_step": 193622, "epoch": 1600} {"train_loss": -41.35834503173828, "global_step": 193623, "epoch": 1600} {"train_loss": -41.927371978759766, "global_step": 193624, "epoch": 1600} {"train_loss": -41.94926452636719, "global_step": 193625, "epoch": 1600} {"train_loss": -41.309051513671875, "global_step": 193626, "epoch": 1600} {"train_loss": -41.60380172729492, "global_step": 193627, "epoch": 1600} {"train_loss": -42.240936279296875, "global_step": 193628, "epoch": 1600} {"train_loss": -41.59884262084961, "global_step": 193629, "epoch": 1600} {"train_loss": -42.21769714355469, "global_step": 193630, "epoch": 1600} {"train_loss": -42.87276840209961, "global_step": 193631, "epoch": 1600} {"train_loss": -42.16771697998047, "global_step": 193632, "epoch": 1600} {"train_loss": -42.671688079833984, "global_step": 193633, "epoch": 1600} {"train_loss": -42.61613082885742, "global_step": 193634, "epoch": 1600} {"train_loss": -42.88393020629883, "global_step": 193635, "epoch": 1600} {"train_loss": -42.0367317199707, "global_step": 193636, "epoch": 1600} {"train_loss": -42.079383850097656, "global_step": 193637, "epoch": 1600} {"train_loss": -41.58381652832031, "global_step": 193638, "epoch": 1600} {"train_loss": -41.79207229614258, "global_step": 193639, "epoch": 1600} {"train_loss": -41.92629623413086, "global_step": 193640, "epoch": 1600} {"train_loss": -42.306575775146484, "global_step": 193641, "epoch": 1600} {"train_loss": -42.47319412231445, "global_step": 193642, "epoch": 1600} {"train_loss": -42.4321174621582, "global_step": 193643, "epoch": 1600} {"train_loss": -41.63969039916992, "global_step": 193644, "epoch": 1600} {"train_loss": -42.2116813659668, "global_step": 193645, "epoch": 1600} {"train_loss": -42.436405181884766, "global_step": 193646, "epoch": 1600} {"train_loss": -41.913082122802734, "global_step": 193647, "epoch": 1600} {"train_loss": -40.994903564453125, "global_step": 193648, "epoch": 1600} {"train_loss": -42.76311111450195, "global_step": 193649, "epoch": 1600} {"train_loss": -42.6241569519043, "global_step": 193650, "epoch": 1600} {"train_loss": -42.50324630737305, "global_step": 193651, "epoch": 1600} {"train_loss": -41.620845794677734, "global_step": 193652, "epoch": 1600} {"train_loss": -40.82816696166992, "global_step": 193653, "epoch": 1600} {"train_loss": -40.431884765625, "global_step": 193654, "epoch": 1600} {"train_loss": -40.635536193847656, "global_step": 193655, "epoch": 1600} {"train_loss": -41.996437072753906, "global_step": 193656, "epoch": 1600} {"train_loss": -40.217689514160156, "global_step": 193657, "epoch": 1600} {"train_loss": -38.496273040771484, "global_step": 193658, "epoch": 1600} {"train_loss": -42.744300842285156, "global_step": 193659, "epoch": 1600} {"train_loss": -39.94697952270508, "global_step": 193660, "epoch": 1600} {"train_loss": -40.884403228759766, "global_step": 193661, "epoch": 1600} {"train_loss": -41.4801139831543, "global_step": 193662, "epoch": 1600} {"train_loss": -39.17798614501953, "global_step": 193663, "epoch": 1600} {"train_loss": -40.5761833190918, "global_step": 193664, "epoch": 1600} {"train_loss": -42.19369888305664, "global_step": 193665, "epoch": 1600} {"train_loss": -40.429283142089844, "global_step": 193666, "epoch": 1600} {"train_loss": -40.28574752807617, "global_step": 193667, "epoch": 1600} {"train_loss": -42.54421615600586, "global_step": 193668, "epoch": 1600} {"train_loss": -40.238948822021484, "global_step": 193669, "epoch": 1600} {"train_loss": -40.167606353759766, "global_step": 193670, "epoch": 1600} {"train_loss": -40.89579391479492, "global_step": 193671, "epoch": 1600} {"train_loss": -40.65447998046875, "global_step": 193672, "epoch": 1600} {"train_loss": -42.49605941772461, "global_step": 193673, "epoch": 1600} {"train_loss": -40.670570373535156, "global_step": 193674, "epoch": 1600} {"train_loss": -40.00896072387695, "global_step": 193675, "epoch": 1600} {"train_loss": -41.413673400878906, "global_step": 193676, "epoch": 1600} {"train_loss": -41.04887390136719, "global_step": 193677, "epoch": 1600} {"train_loss": -41.51378631591797, "global_step": 193678, "epoch": 1600} {"train_loss": -40.63993453979492, "global_step": 193679, "epoch": 1600} {"train_loss": -40.957862854003906, "global_step": 193680, "epoch": 1600} {"train_loss": -40.53605651855469, "global_step": 193681, "epoch": 1600} {"train_loss": -42.179439544677734, "global_step": 193682, "epoch": 1600} {"train_loss": -40.83159255981445, "global_step": 193683, "epoch": 1600} {"train_loss": -40.456809997558594, "global_step": 193684, "epoch": 1600} {"train_loss": -41.87344741821289, "global_step": 193685, "epoch": 1600} {"train_loss": -40.67694854736328, "global_step": 193686, "epoch": 1600} {"train_loss": -41.70821762084961, "global_step": 193687, "epoch": 1600} {"train_loss": -41.43833923339844, "global_step": 193688, "epoch": 1600} {"train_loss": -41.966976165771484, "global_step": 193689, "epoch": 1600} {"train_loss": -41.41510772705078, "global_step": 193690, "epoch": 1600} {"train_loss": -41.62763595581055, "global_step": 193691, "epoch": 1600} {"train_loss": -41.81589889526367, "global_step": 193692, "epoch": 1600} {"train_loss": -42.00177764892578, "global_step": 193693, "epoch": 1600} {"train_loss": -41.83800506591797, "global_step": 193694, "epoch": 1600} {"train_loss": -42.553382873535156, "global_step": 193695, "epoch": 1600} {"train_loss": -41.82494354248047, "global_step": 193696, "epoch": 1600} {"train_loss": -41.40498733520508, "global_step": 193697, "epoch": 1600} {"train_loss": -41.3662223815918, "global_step": 193698, "epoch": 1600} {"train_loss": -42.39849853515625, "global_step": 193699, "epoch": 1600} {"train_loss": -42.270938873291016, "global_step": 193700, "epoch": 1600} {"train_loss": -42.01945495605469, "global_step": 193701, "epoch": 1600} {"train_loss": -42.34812545776367, "global_step": 193702, "epoch": 1600} {"train_loss": -42.7580680847168, "global_step": 193703, "epoch": 1600} {"train_loss": -42.58726119995117, "global_step": 193704, "epoch": 1600} {"train_loss": -42.50674819946289, "global_step": 193705, "epoch": 1600} {"train_loss": -42.86492919921875, "global_step": 193706, "epoch": 1600} {"train_loss": -42.44504928588867, "global_step": 193707, "epoch": 1600} {"train_loss": -42.33577346801758, "global_step": 193708, "epoch": 1600} {"train_loss": -42.54777145385742, "global_step": 193709, "epoch": 1600} {"train_loss": -42.61484909057617, "global_step": 193710, "epoch": 1600} {"train_loss": -42.796024322509766, "global_step": 193711, "epoch": 1600} {"train_loss": -42.99708938598633, "global_step": 193712, "epoch": 1600} {"train_loss": -43.08121109008789, "global_step": 193713, "epoch": 1600} {"train_loss": -42.436702728271484, "global_step": 193714, "epoch": 1600} {"train_loss": -42.85287094116211, "global_step": 193715, "epoch": 1600} {"train_loss": -41.731651306152344, "global_step": 193716, "epoch": 1600} {"train_loss": -42.886104583740234, "global_step": 193717, "epoch": 1600} {"train_loss": -42.92383575439453, "global_step": 193718, "epoch": 1600} {"train_loss": -42.58054733276367, "global_step": 193719, "epoch": 1600} {"train_loss": -41.811168386916485, "global_step": 193720, "epoch": 1600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2480189.75} {"train_loss": -43.179874420166016, "global_step": 193721, "epoch": 1601} {"train_loss": -43.17657470703125, "global_step": 193722, "epoch": 1601} {"train_loss": -43.00474166870117, "global_step": 193723, "epoch": 1601} {"train_loss": -42.927268981933594, "global_step": 193724, "epoch": 1601} {"train_loss": -42.86923599243164, "global_step": 193725, "epoch": 1601} {"train_loss": -43.05971908569336, "global_step": 193726, "epoch": 1601} {"train_loss": -42.98334503173828, "global_step": 193727, "epoch": 1601} {"train_loss": -42.51380920410156, "global_step": 193728, "epoch": 1601} {"train_loss": -42.71889114379883, "global_step": 193729, "epoch": 1601} {"train_loss": -42.5769157409668, "global_step": 193730, "epoch": 1601} {"train_loss": -41.0919303894043, "global_step": 193731, "epoch": 1601} {"train_loss": -37.656307220458984, "global_step": 193732, "epoch": 1601} {"train_loss": -42.942562103271484, "global_step": 193733, "epoch": 1601} {"train_loss": -39.33447265625, "global_step": 193734, "epoch": 1601} {"train_loss": -37.50825881958008, "global_step": 193735, "epoch": 1601} {"train_loss": -41.29340744018555, "global_step": 193736, "epoch": 1601} {"train_loss": -40.955299377441406, "global_step": 193737, "epoch": 1601} {"train_loss": -39.38630676269531, "global_step": 193738, "epoch": 1601} {"train_loss": -41.044124603271484, "global_step": 193739, "epoch": 1601} {"train_loss": -41.61126708984375, "global_step": 193740, "epoch": 1601} {"train_loss": -41.31248092651367, "global_step": 193741, "epoch": 1601} {"train_loss": -41.22304916381836, "global_step": 193742, "epoch": 1601} {"train_loss": -41.70819091796875, "global_step": 193743, "epoch": 1601} {"train_loss": -38.983280181884766, "global_step": 193744, "epoch": 1601} {"train_loss": -41.27620315551758, "global_step": 193745, "epoch": 1601} {"train_loss": -41.624752044677734, "global_step": 193746, "epoch": 1601} {"train_loss": -38.79423141479492, "global_step": 193747, "epoch": 1601} {"train_loss": -40.58940505981445, "global_step": 193748, "epoch": 1601} {"train_loss": -40.70530700683594, "global_step": 193749, "epoch": 1601} {"train_loss": -40.50009536743164, "global_step": 193750, "epoch": 1601} {"train_loss": -41.844364166259766, "global_step": 193751, "epoch": 1601} {"train_loss": -40.51162338256836, "global_step": 193752, "epoch": 1601} {"train_loss": -40.31073760986328, "global_step": 193753, "epoch": 1601} {"train_loss": -41.5666618347168, "global_step": 193754, "epoch": 1601} {"train_loss": -40.62582015991211, "global_step": 193755, "epoch": 1601} {"train_loss": -41.22846984863281, "global_step": 193756, "epoch": 1601} {"train_loss": -41.344783782958984, "global_step": 193757, "epoch": 1601} {"train_loss": -40.85189437866211, "global_step": 193758, "epoch": 1601} {"train_loss": -42.28827667236328, "global_step": 193759, "epoch": 1601} {"train_loss": -41.31791305541992, "global_step": 193760, "epoch": 1601} {"train_loss": -40.882991790771484, "global_step": 193761, "epoch": 1601} {"train_loss": -41.98725509643555, "global_step": 193762, "epoch": 1601} {"train_loss": -41.86997985839844, "global_step": 193763, "epoch": 1601} {"train_loss": -40.79165267944336, "global_step": 193764, "epoch": 1601} {"train_loss": -41.2967529296875, "global_step": 193765, "epoch": 1601} {"train_loss": -42.76713943481445, "global_step": 193766, "epoch": 1601} {"train_loss": -42.38179397583008, "global_step": 193767, "epoch": 1601} {"train_loss": -40.953712463378906, "global_step": 193768, "epoch": 1601} {"train_loss": -42.441017150878906, "global_step": 193769, "epoch": 1601} {"train_loss": -41.971309661865234, "global_step": 193770, "epoch": 1601} {"train_loss": -39.78485107421875, "global_step": 193771, "epoch": 1601} {"train_loss": -42.52402877807617, "global_step": 193772, "epoch": 1601} {"train_loss": -41.99654769897461, "global_step": 193773, "epoch": 1601} {"train_loss": -39.8736457824707, "global_step": 193774, "epoch": 1601} {"train_loss": -41.29613494873047, "global_step": 193775, "epoch": 1601} {"train_loss": -42.515098571777344, "global_step": 193776, "epoch": 1601} {"train_loss": -41.6021614074707, "global_step": 193777, "epoch": 1601} {"train_loss": -42.093910217285156, "global_step": 193778, "epoch": 1601} {"train_loss": -42.13222885131836, "global_step": 193779, "epoch": 1601} {"train_loss": -42.50033187866211, "global_step": 193780, "epoch": 1601} {"train_loss": -40.69355773925781, "global_step": 193781, "epoch": 1601} {"train_loss": -41.27006149291992, "global_step": 193782, "epoch": 1601} {"train_loss": -42.58079528808594, "global_step": 193783, "epoch": 1601} {"train_loss": -41.13985061645508, "global_step": 193784, "epoch": 1601} {"train_loss": -40.99977111816406, "global_step": 193785, "epoch": 1601} {"train_loss": -42.015926361083984, "global_step": 193786, "epoch": 1601} {"train_loss": -41.07650375366211, "global_step": 193787, "epoch": 1601} {"train_loss": -42.24868392944336, "global_step": 193788, "epoch": 1601} {"train_loss": -41.388423919677734, "global_step": 193789, "epoch": 1601} {"train_loss": -41.62166976928711, "global_step": 193790, "epoch": 1601} {"train_loss": -42.164520263671875, "global_step": 193791, "epoch": 1601} {"train_loss": -42.562042236328125, "global_step": 193792, "epoch": 1601} {"train_loss": -42.10363006591797, "global_step": 193793, "epoch": 1601} {"train_loss": -42.29618453979492, "global_step": 193794, "epoch": 1601} {"train_loss": -41.3026123046875, "global_step": 193795, "epoch": 1601} {"train_loss": -41.71195602416992, "global_step": 193796, "epoch": 1601} {"train_loss": -42.38893508911133, "global_step": 193797, "epoch": 1601} {"train_loss": -41.40450668334961, "global_step": 193798, "epoch": 1601} {"train_loss": -41.010498046875, "global_step": 193799, "epoch": 1601} {"train_loss": -42.70427322387695, "global_step": 193800, "epoch": 1601} {"train_loss": -41.537437438964844, "global_step": 193801, "epoch": 1601} {"train_loss": -42.511714935302734, "global_step": 193802, "epoch": 1601} {"train_loss": -42.27968215942383, "global_step": 193803, "epoch": 1601} {"train_loss": -42.276546478271484, "global_step": 193804, "epoch": 1601} {"train_loss": -41.741981506347656, "global_step": 193805, "epoch": 1601} {"train_loss": -41.74766540527344, "global_step": 193806, "epoch": 1601} {"train_loss": -42.798580169677734, "global_step": 193807, "epoch": 1601} {"train_loss": -41.053497314453125, "global_step": 193808, "epoch": 1601} {"train_loss": -42.13916015625, "global_step": 193809, "epoch": 1601} {"train_loss": -41.97939682006836, "global_step": 193810, "epoch": 1601} {"train_loss": -40.67232131958008, "global_step": 193811, "epoch": 1601} {"train_loss": -42.114952087402344, "global_step": 193812, "epoch": 1601} {"train_loss": -42.23209762573242, "global_step": 193813, "epoch": 1601} {"train_loss": -42.59226989746094, "global_step": 193814, "epoch": 1601} {"train_loss": -42.16520309448242, "global_step": 193815, "epoch": 1601} {"train_loss": -42.50093078613281, "global_step": 193816, "epoch": 1601} {"train_loss": -42.78886032104492, "global_step": 193817, "epoch": 1601} {"train_loss": -41.58071517944336, "global_step": 193818, "epoch": 1601} {"train_loss": -42.43015670776367, "global_step": 193819, "epoch": 1601} {"train_loss": -42.19584274291992, "global_step": 193820, "epoch": 1601} {"train_loss": -41.85224151611328, "global_step": 193821, "epoch": 1601} {"train_loss": -42.604915618896484, "global_step": 193822, "epoch": 1601} {"train_loss": -41.501808166503906, "global_step": 193823, "epoch": 1601} {"train_loss": -41.977779388427734, "global_step": 193824, "epoch": 1601} {"train_loss": -41.554744720458984, "global_step": 193825, "epoch": 1601} {"train_loss": -42.201595306396484, "global_step": 193826, "epoch": 1601} {"train_loss": -42.09588623046875, "global_step": 193827, "epoch": 1601} {"train_loss": -42.071956634521484, "global_step": 193828, "epoch": 1601} {"train_loss": -42.9723014831543, "global_step": 193829, "epoch": 1601} {"train_loss": -42.026222229003906, "global_step": 193830, "epoch": 1601} {"train_loss": -42.49797439575195, "global_step": 193831, "epoch": 1601} {"train_loss": -42.84096145629883, "global_step": 193832, "epoch": 1601} {"train_loss": -42.13446807861328, "global_step": 193833, "epoch": 1601} {"train_loss": -41.870140075683594, "global_step": 193834, "epoch": 1601} {"train_loss": -42.20209884643555, "global_step": 193835, "epoch": 1601} {"train_loss": -42.68891525268555, "global_step": 193836, "epoch": 1601} {"train_loss": -42.62958526611328, "global_step": 193837, "epoch": 1601} {"train_loss": -42.649776458740234, "global_step": 193838, "epoch": 1601} {"train_loss": -42.750457763671875, "global_step": 193839, "epoch": 1601} {"train_loss": -41.24653244018555, "global_step": 193840, "epoch": 1601} {"train_loss": -41.71187128114306, "global_step": 193841, "epoch": 1601, "val_loss": 2773197.75} {"train_loss": -42.0570182800293, "global_step": 193842, "epoch": 1602} {"train_loss": -42.136268615722656, "global_step": 193843, "epoch": 1602} {"train_loss": -41.110084533691406, "global_step": 193844, "epoch": 1602} {"train_loss": -42.33100509643555, "global_step": 193845, "epoch": 1602} {"train_loss": -42.543373107910156, "global_step": 193846, "epoch": 1602} {"train_loss": -42.2803840637207, "global_step": 193847, "epoch": 1602} {"train_loss": -41.41998291015625, "global_step": 193848, "epoch": 1602} {"train_loss": -42.353172302246094, "global_step": 193849, "epoch": 1602} {"train_loss": -41.357845306396484, "global_step": 193850, "epoch": 1602} {"train_loss": -40.06441116333008, "global_step": 193851, "epoch": 1602} {"train_loss": -39.89664840698242, "global_step": 193852, "epoch": 1602} {"train_loss": -40.67057418823242, "global_step": 193853, "epoch": 1602} {"train_loss": -40.703163146972656, "global_step": 193854, "epoch": 1602} {"train_loss": -42.46818923950195, "global_step": 193855, "epoch": 1602} {"train_loss": -42.124366760253906, "global_step": 193856, "epoch": 1602} {"train_loss": -42.49119186401367, "global_step": 193857, "epoch": 1602} {"train_loss": -41.2364501953125, "global_step": 193858, "epoch": 1602} {"train_loss": -41.90605545043945, "global_step": 193859, "epoch": 1602} {"train_loss": -41.35186767578125, "global_step": 193860, "epoch": 1602} {"train_loss": -40.295814514160156, "global_step": 193861, "epoch": 1602} {"train_loss": -41.04951858520508, "global_step": 193862, "epoch": 1602} {"train_loss": -42.092830657958984, "global_step": 193863, "epoch": 1602} {"train_loss": -40.517086029052734, "global_step": 193864, "epoch": 1602} {"train_loss": -41.36454391479492, "global_step": 193865, "epoch": 1602} {"train_loss": -39.65232467651367, "global_step": 193866, "epoch": 1602} {"train_loss": -40.229164123535156, "global_step": 193867, "epoch": 1602} {"train_loss": -41.32869338989258, "global_step": 193868, "epoch": 1602} {"train_loss": -40.42516326904297, "global_step": 193869, "epoch": 1602} {"train_loss": -38.56631088256836, "global_step": 193870, "epoch": 1602} {"train_loss": -39.63198471069336, "global_step": 193871, "epoch": 1602} {"train_loss": -40.56673812866211, "global_step": 193872, "epoch": 1602} {"train_loss": -39.35266876220703, "global_step": 193873, "epoch": 1602} {"train_loss": -37.20527267456055, "global_step": 193874, "epoch": 1602} {"train_loss": -40.87787628173828, "global_step": 193875, "epoch": 1602} {"train_loss": -40.61298751831055, "global_step": 193876, "epoch": 1602} {"train_loss": -38.42121505737305, "global_step": 193877, "epoch": 1602} {"train_loss": -40.54338073730469, "global_step": 193878, "epoch": 1602} {"train_loss": -41.27230453491211, "global_step": 193879, "epoch": 1602} {"train_loss": -38.895999908447266, "global_step": 193880, "epoch": 1602} {"train_loss": -36.610565185546875, "global_step": 193881, "epoch": 1602} {"train_loss": -41.10346221923828, "global_step": 193882, "epoch": 1602} {"train_loss": -39.25397872924805, "global_step": 193883, "epoch": 1602} {"train_loss": -40.260066986083984, "global_step": 193884, "epoch": 1602} {"train_loss": -41.38307571411133, "global_step": 193885, "epoch": 1602} {"train_loss": -39.99844741821289, "global_step": 193886, "epoch": 1602} {"train_loss": -40.968929290771484, "global_step": 193887, "epoch": 1602} {"train_loss": -40.5140380859375, "global_step": 193888, "epoch": 1602} {"train_loss": -39.44370651245117, "global_step": 193889, "epoch": 1602} {"train_loss": -41.057125091552734, "global_step": 193890, "epoch": 1602} {"train_loss": -38.945255279541016, "global_step": 193891, "epoch": 1602} {"train_loss": -38.822811126708984, "global_step": 193892, "epoch": 1602} {"train_loss": -40.679927825927734, "global_step": 193893, "epoch": 1602} {"train_loss": -39.0339469909668, "global_step": 193894, "epoch": 1602} {"train_loss": -40.47026824951172, "global_step": 193895, "epoch": 1602} {"train_loss": -38.90106201171875, "global_step": 193896, "epoch": 1602} {"train_loss": -38.660400390625, "global_step": 193897, "epoch": 1602} {"train_loss": -40.81086730957031, "global_step": 193898, "epoch": 1602} {"train_loss": -40.49974822998047, "global_step": 193899, "epoch": 1602} {"train_loss": -41.162933349609375, "global_step": 193900, "epoch": 1602} {"train_loss": -40.136329650878906, "global_step": 193901, "epoch": 1602} {"train_loss": -40.066566467285156, "global_step": 193902, "epoch": 1602} {"train_loss": -39.53885269165039, "global_step": 193903, "epoch": 1602} {"train_loss": -40.469112396240234, "global_step": 193904, "epoch": 1602} {"train_loss": -40.1823616027832, "global_step": 193905, "epoch": 1602} {"train_loss": -40.796722412109375, "global_step": 193906, "epoch": 1602} {"train_loss": -40.261199951171875, "global_step": 193907, "epoch": 1602} {"train_loss": -41.12308883666992, "global_step": 193908, "epoch": 1602} {"train_loss": -42.03131866455078, "global_step": 193909, "epoch": 1602} {"train_loss": -40.498138427734375, "global_step": 193910, "epoch": 1602} {"train_loss": -40.81519317626953, "global_step": 193911, "epoch": 1602} {"train_loss": -40.97578048706055, "global_step": 193912, "epoch": 1602} {"train_loss": -38.7709846496582, "global_step": 193913, "epoch": 1602} {"train_loss": -41.5677490234375, "global_step": 193914, "epoch": 1602} {"train_loss": -41.01510238647461, "global_step": 193915, "epoch": 1602} {"train_loss": -41.737545013427734, "global_step": 193916, "epoch": 1602} {"train_loss": -41.48735427856445, "global_step": 193917, "epoch": 1602} {"train_loss": -41.01008224487305, "global_step": 193918, "epoch": 1602} {"train_loss": -42.316864013671875, "global_step": 193919, "epoch": 1602} {"train_loss": -41.38361740112305, "global_step": 193920, "epoch": 1602} {"train_loss": -41.209800720214844, "global_step": 193921, "epoch": 1602} {"train_loss": -41.20785140991211, "global_step": 193922, "epoch": 1602} {"train_loss": -40.7401237487793, "global_step": 193923, "epoch": 1602} {"train_loss": -40.61088180541992, "global_step": 193924, "epoch": 1602} {"train_loss": -41.60159683227539, "global_step": 193925, "epoch": 1602} {"train_loss": -41.25167465209961, "global_step": 193926, "epoch": 1602} {"train_loss": -40.9257698059082, "global_step": 193927, "epoch": 1602} {"train_loss": -41.27362823486328, "global_step": 193928, "epoch": 1602} {"train_loss": -41.686676025390625, "global_step": 193929, "epoch": 1602} {"train_loss": -42.27278518676758, "global_step": 193930, "epoch": 1602} {"train_loss": -40.88515853881836, "global_step": 193931, "epoch": 1602} {"train_loss": -41.05216979980469, "global_step": 193932, "epoch": 1602} {"train_loss": -41.54951095581055, "global_step": 193933, "epoch": 1602} {"train_loss": -42.160682678222656, "global_step": 193934, "epoch": 1602} {"train_loss": -41.48344421386719, "global_step": 193935, "epoch": 1602} {"train_loss": -38.8992805480957, "global_step": 193936, "epoch": 1602} {"train_loss": -41.90235137939453, "global_step": 193937, "epoch": 1602} {"train_loss": -40.87041091918945, "global_step": 193938, "epoch": 1602} {"train_loss": -41.70179748535156, "global_step": 193939, "epoch": 1602} {"train_loss": -41.30031967163086, "global_step": 193940, "epoch": 1602} {"train_loss": -41.348793029785156, "global_step": 193941, "epoch": 1602} {"train_loss": -41.77611541748047, "global_step": 193942, "epoch": 1602} {"train_loss": -39.86994171142578, "global_step": 193943, "epoch": 1602} {"train_loss": -41.88589096069336, "global_step": 193944, "epoch": 1602} {"train_loss": -41.47794723510742, "global_step": 193945, "epoch": 1602} {"train_loss": -41.648841857910156, "global_step": 193946, "epoch": 1602} {"train_loss": -40.06785202026367, "global_step": 193947, "epoch": 1602} {"train_loss": -39.85697555541992, "global_step": 193948, "epoch": 1602} {"train_loss": -41.3527946472168, "global_step": 193949, "epoch": 1602} {"train_loss": -41.07765579223633, "global_step": 193950, "epoch": 1602} {"train_loss": -38.361331939697266, "global_step": 193951, "epoch": 1602} {"train_loss": -41.73926544189453, "global_step": 193952, "epoch": 1602} {"train_loss": -37.724056243896484, "global_step": 193953, "epoch": 1602} {"train_loss": -41.497467041015625, "global_step": 193954, "epoch": 1602} {"train_loss": -40.00013732910156, "global_step": 193955, "epoch": 1602} {"train_loss": -41.86164474487305, "global_step": 193956, "epoch": 1602} {"train_loss": -42.082115173339844, "global_step": 193957, "epoch": 1602} {"train_loss": -40.7061653137207, "global_step": 193958, "epoch": 1602} {"train_loss": -42.03792953491211, "global_step": 193959, "epoch": 1602} {"train_loss": -40.91230392456055, "global_step": 193960, "epoch": 1602} {"train_loss": -41.43748092651367, "global_step": 193961, "epoch": 1602} {"train_loss": -40.77648137620658, "global_step": 193962, "epoch": 1602, "val_loss": 2588031.25} {"train_loss": -41.54547882080078, "global_step": 193963, "epoch": 1603} {"train_loss": -41.566551208496094, "global_step": 193964, "epoch": 1603} {"train_loss": -42.015254974365234, "global_step": 193965, "epoch": 1603} {"train_loss": -41.68754959106445, "global_step": 193966, "epoch": 1603} {"train_loss": -42.24930953979492, "global_step": 193967, "epoch": 1603} {"train_loss": -41.46609115600586, "global_step": 193968, "epoch": 1603} {"train_loss": -42.0426025390625, "global_step": 193969, "epoch": 1603} {"train_loss": -42.20829772949219, "global_step": 193970, "epoch": 1603} {"train_loss": -41.76498031616211, "global_step": 193971, "epoch": 1603} {"train_loss": -41.21372985839844, "global_step": 193972, "epoch": 1603} {"train_loss": -41.597625732421875, "global_step": 193973, "epoch": 1603} {"train_loss": -42.52738571166992, "global_step": 193974, "epoch": 1603} {"train_loss": -42.366485595703125, "global_step": 193975, "epoch": 1603} {"train_loss": -41.43503952026367, "global_step": 193976, "epoch": 1603} {"train_loss": -42.54595184326172, "global_step": 193977, "epoch": 1603} {"train_loss": -42.513824462890625, "global_step": 193978, "epoch": 1603} {"train_loss": -42.02567672729492, "global_step": 193979, "epoch": 1603} {"train_loss": -41.38444900512695, "global_step": 193980, "epoch": 1603} {"train_loss": -42.72504425048828, "global_step": 193981, "epoch": 1603} {"train_loss": -42.57139205932617, "global_step": 193982, "epoch": 1603} {"train_loss": -42.24112319946289, "global_step": 193983, "epoch": 1603} {"train_loss": -42.137508392333984, "global_step": 193984, "epoch": 1603} {"train_loss": -42.769344329833984, "global_step": 193985, "epoch": 1603} {"train_loss": -41.8268928527832, "global_step": 193986, "epoch": 1603} {"train_loss": -42.25825881958008, "global_step": 193987, "epoch": 1603} {"train_loss": -42.566650390625, "global_step": 193988, "epoch": 1603} {"train_loss": -41.627803802490234, "global_step": 193989, "epoch": 1603} {"train_loss": -42.652217864990234, "global_step": 193990, "epoch": 1603} {"train_loss": -41.89064025878906, "global_step": 193991, "epoch": 1603} {"train_loss": -41.12786865234375, "global_step": 193992, "epoch": 1603} {"train_loss": -41.64572525024414, "global_step": 193993, "epoch": 1603} {"train_loss": -42.78957748413086, "global_step": 193994, "epoch": 1603} {"train_loss": -42.667354583740234, "global_step": 193995, "epoch": 1603} {"train_loss": -42.66884994506836, "global_step": 193996, "epoch": 1603} {"train_loss": -42.02482986450195, "global_step": 193997, "epoch": 1603} {"train_loss": -42.267757415771484, "global_step": 193998, "epoch": 1603} {"train_loss": -43.05671310424805, "global_step": 193999, "epoch": 1603} {"train_loss": -41.19725799560547, "global_step": 194000, "epoch": 1603} {"train_loss": -42.52249526977539, "global_step": 194001, "epoch": 1603} {"train_loss": -42.53548049926758, "global_step": 194002, "epoch": 1603} {"train_loss": -42.62787628173828, "global_step": 194003, "epoch": 1603} {"train_loss": -42.50922393798828, "global_step": 194004, "epoch": 1603} {"train_loss": -43.19289016723633, "global_step": 194005, "epoch": 1603} {"train_loss": -42.1240234375, "global_step": 194006, "epoch": 1603} {"train_loss": -42.612789154052734, "global_step": 194007, "epoch": 1603} {"train_loss": -41.29497146606445, "global_step": 194008, "epoch": 1603} {"train_loss": -40.22783279418945, "global_step": 194009, "epoch": 1603} {"train_loss": -40.5737190246582, "global_step": 194010, "epoch": 1603} {"train_loss": -42.58901596069336, "global_step": 194011, "epoch": 1603} {"train_loss": -41.999916076660156, "global_step": 194012, "epoch": 1603} {"train_loss": -41.93134689331055, "global_step": 194013, "epoch": 1603} {"train_loss": -41.845890045166016, "global_step": 194014, "epoch": 1603} {"train_loss": -41.86855697631836, "global_step": 194015, "epoch": 1603} {"train_loss": -41.51961898803711, "global_step": 194016, "epoch": 1603} {"train_loss": -41.11183547973633, "global_step": 194017, "epoch": 1603} {"train_loss": -41.5268669128418, "global_step": 194018, "epoch": 1603} {"train_loss": -42.112239837646484, "global_step": 194019, "epoch": 1603} {"train_loss": -41.68433380126953, "global_step": 194020, "epoch": 1603} {"train_loss": -41.01613998413086, "global_step": 194021, "epoch": 1603} {"train_loss": -39.59593200683594, "global_step": 194022, "epoch": 1603} {"train_loss": -40.30671310424805, "global_step": 194023, "epoch": 1603} {"train_loss": -41.007164001464844, "global_step": 194024, "epoch": 1603} {"train_loss": -41.66781234741211, "global_step": 194025, "epoch": 1603} {"train_loss": -40.7082405090332, "global_step": 194026, "epoch": 1603} {"train_loss": -39.374088287353516, "global_step": 194027, "epoch": 1603} {"train_loss": -39.10952377319336, "global_step": 194028, "epoch": 1603} {"train_loss": -39.198604583740234, "global_step": 194029, "epoch": 1603} {"train_loss": -38.14860153198242, "global_step": 194030, "epoch": 1603} {"train_loss": -41.32332229614258, "global_step": 194031, "epoch": 1603} {"train_loss": -39.12446212768555, "global_step": 194032, "epoch": 1603} {"train_loss": -41.43740463256836, "global_step": 194033, "epoch": 1603} {"train_loss": -40.33698272705078, "global_step": 194034, "epoch": 1603} {"train_loss": -40.46134567260742, "global_step": 194035, "epoch": 1603} {"train_loss": -41.25509262084961, "global_step": 194036, "epoch": 1603} {"train_loss": -39.411556243896484, "global_step": 194037, "epoch": 1603} {"train_loss": -41.16177749633789, "global_step": 194038, "epoch": 1603} {"train_loss": -40.02387619018555, "global_step": 194039, "epoch": 1603} {"train_loss": -41.416500091552734, "global_step": 194040, "epoch": 1603} {"train_loss": -41.17148971557617, "global_step": 194041, "epoch": 1603} {"train_loss": -40.29273986816406, "global_step": 194042, "epoch": 1603} {"train_loss": -41.57556915283203, "global_step": 194043, "epoch": 1603} {"train_loss": -39.084999084472656, "global_step": 194044, "epoch": 1603} {"train_loss": -41.181243896484375, "global_step": 194045, "epoch": 1603} {"train_loss": -39.762115478515625, "global_step": 194046, "epoch": 1603} {"train_loss": -39.20399856567383, "global_step": 194047, "epoch": 1603} {"train_loss": -40.002437591552734, "global_step": 194048, "epoch": 1603} {"train_loss": -41.41341018676758, "global_step": 194049, "epoch": 1603} {"train_loss": -40.40825271606445, "global_step": 194050, "epoch": 1603} {"train_loss": -41.39396286010742, "global_step": 194051, "epoch": 1603} {"train_loss": -40.30532455444336, "global_step": 194052, "epoch": 1603} {"train_loss": -41.316463470458984, "global_step": 194053, "epoch": 1603} {"train_loss": -40.472320556640625, "global_step": 194054, "epoch": 1603} {"train_loss": -41.204158782958984, "global_step": 194055, "epoch": 1603} {"train_loss": -41.583614349365234, "global_step": 194056, "epoch": 1603} {"train_loss": -41.9715461730957, "global_step": 194057, "epoch": 1603} {"train_loss": -41.34108352661133, "global_step": 194058, "epoch": 1603} {"train_loss": -40.54851150512695, "global_step": 194059, "epoch": 1603} {"train_loss": -41.0211296081543, "global_step": 194060, "epoch": 1603} {"train_loss": -41.23820114135742, "global_step": 194061, "epoch": 1603} {"train_loss": -41.65874099731445, "global_step": 194062, "epoch": 1603} {"train_loss": -41.52676773071289, "global_step": 194063, "epoch": 1603} {"train_loss": -41.76273727416992, "global_step": 194064, "epoch": 1603} {"train_loss": -42.152305603027344, "global_step": 194065, "epoch": 1603} {"train_loss": -42.119136810302734, "global_step": 194066, "epoch": 1603} {"train_loss": -42.09619140625, "global_step": 194067, "epoch": 1603} {"train_loss": -41.39461898803711, "global_step": 194068, "epoch": 1603} {"train_loss": -42.1967658996582, "global_step": 194069, "epoch": 1603} {"train_loss": -42.261627197265625, "global_step": 194070, "epoch": 1603} {"train_loss": -40.7957763671875, "global_step": 194071, "epoch": 1603} {"train_loss": -41.87929916381836, "global_step": 194072, "epoch": 1603} {"train_loss": -42.097164154052734, "global_step": 194073, "epoch": 1603} {"train_loss": -40.22468185424805, "global_step": 194074, "epoch": 1603} {"train_loss": -41.71103286743164, "global_step": 194075, "epoch": 1603} {"train_loss": -42.519142150878906, "global_step": 194076, "epoch": 1603} {"train_loss": -41.890323638916016, "global_step": 194077, "epoch": 1603} {"train_loss": -40.7549934387207, "global_step": 194078, "epoch": 1603} {"train_loss": -38.791988372802734, "global_step": 194079, "epoch": 1603} {"train_loss": -42.532344818115234, "global_step": 194080, "epoch": 1603} {"train_loss": -38.67561721801758, "global_step": 194081, "epoch": 1603} {"train_loss": -40.644771575927734, "global_step": 194082, "epoch": 1603} {"train_loss": -41.415429044360955, "global_step": 194083, "epoch": 1603, "val_loss": 2723292.5} {"train_loss": -40.2808723449707, "global_step": 194084, "epoch": 1604} {"train_loss": -37.94376754760742, "global_step": 194085, "epoch": 1604} {"train_loss": -40.490264892578125, "global_step": 194086, "epoch": 1604} {"train_loss": -40.31814193725586, "global_step": 194087, "epoch": 1604} {"train_loss": -40.7038688659668, "global_step": 194088, "epoch": 1604} {"train_loss": -41.41948318481445, "global_step": 194089, "epoch": 1604} {"train_loss": -40.74482727050781, "global_step": 194090, "epoch": 1604} {"train_loss": -41.280372619628906, "global_step": 194091, "epoch": 1604} {"train_loss": -41.720882415771484, "global_step": 194092, "epoch": 1604} {"train_loss": -36.27067184448242, "global_step": 194093, "epoch": 1604} {"train_loss": -40.92390823364258, "global_step": 194094, "epoch": 1604} {"train_loss": -41.38261795043945, "global_step": 194095, "epoch": 1604} {"train_loss": -40.657100677490234, "global_step": 194096, "epoch": 1604} {"train_loss": -41.70766830444336, "global_step": 194097, "epoch": 1604} {"train_loss": -38.05615997314453, "global_step": 194098, "epoch": 1604} {"train_loss": -37.794918060302734, "global_step": 194099, "epoch": 1604} {"train_loss": -41.62785339355469, "global_step": 194100, "epoch": 1604} {"train_loss": -41.14588165283203, "global_step": 194101, "epoch": 1604} {"train_loss": -41.310302734375, "global_step": 194102, "epoch": 1604} {"train_loss": -41.09160232543945, "global_step": 194103, "epoch": 1604} {"train_loss": -40.99592971801758, "global_step": 194104, "epoch": 1604} {"train_loss": -39.64738082885742, "global_step": 194105, "epoch": 1604} {"train_loss": -41.58758544921875, "global_step": 194106, "epoch": 1604} {"train_loss": -41.47258377075195, "global_step": 194107, "epoch": 1604} {"train_loss": -41.967708587646484, "global_step": 194108, "epoch": 1604} {"train_loss": -41.73062515258789, "global_step": 194109, "epoch": 1604} {"train_loss": -42.089168548583984, "global_step": 194110, "epoch": 1604} {"train_loss": -41.879310607910156, "global_step": 194111, "epoch": 1604} {"train_loss": -42.476806640625, "global_step": 194112, "epoch": 1604} {"train_loss": -40.0748405456543, "global_step": 194113, "epoch": 1604} {"train_loss": -42.2380485534668, "global_step": 194114, "epoch": 1604} {"train_loss": -41.80957794189453, "global_step": 194115, "epoch": 1604} {"train_loss": -41.4875602722168, "global_step": 194116, "epoch": 1604} {"train_loss": -40.946529388427734, "global_step": 194117, "epoch": 1604} {"train_loss": -42.605224609375, "global_step": 194118, "epoch": 1604} {"train_loss": -41.50213623046875, "global_step": 194119, "epoch": 1604} {"train_loss": -39.61855697631836, "global_step": 194120, "epoch": 1604} {"train_loss": -41.65230941772461, "global_step": 194121, "epoch": 1604} {"train_loss": -41.688472747802734, "global_step": 194122, "epoch": 1604} {"train_loss": -40.022315979003906, "global_step": 194123, "epoch": 1604} {"train_loss": -40.94240951538086, "global_step": 194124, "epoch": 1604} {"train_loss": -42.31702423095703, "global_step": 194125, "epoch": 1604} {"train_loss": -41.17367172241211, "global_step": 194126, "epoch": 1604} {"train_loss": -39.865577697753906, "global_step": 194127, "epoch": 1604} {"train_loss": -40.569210052490234, "global_step": 194128, "epoch": 1604} {"train_loss": -41.167945861816406, "global_step": 194129, "epoch": 1604} {"train_loss": -41.2622184753418, "global_step": 194130, "epoch": 1604} {"train_loss": -40.47354507446289, "global_step": 194131, "epoch": 1604} {"train_loss": -40.96967315673828, "global_step": 194132, "epoch": 1604} {"train_loss": -42.63990783691406, "global_step": 194133, "epoch": 1604} {"train_loss": -40.3454704284668, "global_step": 194134, "epoch": 1604} {"train_loss": -41.48478317260742, "global_step": 194135, "epoch": 1604} {"train_loss": -41.70515060424805, "global_step": 194136, "epoch": 1604} {"train_loss": -40.99452590942383, "global_step": 194137, "epoch": 1604} {"train_loss": -42.3983154296875, "global_step": 194138, "epoch": 1604} {"train_loss": -41.804969787597656, "global_step": 194139, "epoch": 1604} {"train_loss": -42.51748275756836, "global_step": 194140, "epoch": 1604} {"train_loss": -42.07282638549805, "global_step": 194141, "epoch": 1604} {"train_loss": -42.05085754394531, "global_step": 194142, "epoch": 1604} {"train_loss": -41.98706817626953, "global_step": 194143, "epoch": 1604} {"train_loss": -41.91545486450195, "global_step": 194144, "epoch": 1604} {"train_loss": -42.92856979370117, "global_step": 194145, "epoch": 1604} {"train_loss": -41.7477912902832, "global_step": 194146, "epoch": 1604} {"train_loss": -42.17928695678711, "global_step": 194147, "epoch": 1604} {"train_loss": -42.51947784423828, "global_step": 194148, "epoch": 1604} {"train_loss": -42.16456985473633, "global_step": 194149, "epoch": 1604} {"train_loss": -42.17806625366211, "global_step": 194150, "epoch": 1604} {"train_loss": -42.3581428527832, "global_step": 194151, "epoch": 1604} {"train_loss": -42.74301528930664, "global_step": 194152, "epoch": 1604} {"train_loss": -42.5630989074707, "global_step": 194153, "epoch": 1604} {"train_loss": -42.895328521728516, "global_step": 194154, "epoch": 1604} {"train_loss": -42.641395568847656, "global_step": 194155, "epoch": 1604} {"train_loss": -42.60155487060547, "global_step": 194156, "epoch": 1604} {"train_loss": -42.39120101928711, "global_step": 194157, "epoch": 1604} {"train_loss": -43.27555465698242, "global_step": 194158, "epoch": 1604} {"train_loss": -42.09980392456055, "global_step": 194159, "epoch": 1604} {"train_loss": -43.147090911865234, "global_step": 194160, "epoch": 1604} {"train_loss": -43.12125778198242, "global_step": 194161, "epoch": 1604} {"train_loss": -42.7596321105957, "global_step": 194162, "epoch": 1604} {"train_loss": -42.77513122558594, "global_step": 194163, "epoch": 1604} {"train_loss": -42.69253158569336, "global_step": 194164, "epoch": 1604} {"train_loss": -41.88979721069336, "global_step": 194165, "epoch": 1604} {"train_loss": -42.27804183959961, "global_step": 194166, "epoch": 1604} {"train_loss": -43.2913703918457, "global_step": 194167, "epoch": 1604} {"train_loss": -42.09920120239258, "global_step": 194168, "epoch": 1604} {"train_loss": -42.354248046875, "global_step": 194169, "epoch": 1604} {"train_loss": -41.14817428588867, "global_step": 194170, "epoch": 1604} {"train_loss": -41.65999221801758, "global_step": 194171, "epoch": 1604} {"train_loss": -42.4289665222168, "global_step": 194172, "epoch": 1604} {"train_loss": -43.1141357421875, "global_step": 194173, "epoch": 1604} {"train_loss": -41.97197341918945, "global_step": 194174, "epoch": 1604} {"train_loss": -42.2392578125, "global_step": 194175, "epoch": 1604} {"train_loss": -42.31939697265625, "global_step": 194176, "epoch": 1604} {"train_loss": -42.31838607788086, "global_step": 194177, "epoch": 1604} {"train_loss": -42.9613151550293, "global_step": 194178, "epoch": 1604} {"train_loss": -42.41176223754883, "global_step": 194179, "epoch": 1604} {"train_loss": -43.02527618408203, "global_step": 194180, "epoch": 1604} {"train_loss": -42.46247482299805, "global_step": 194181, "epoch": 1604} {"train_loss": -42.77878952026367, "global_step": 194182, "epoch": 1604} {"train_loss": -41.423213958740234, "global_step": 194183, "epoch": 1604} {"train_loss": -42.77042770385742, "global_step": 194184, "epoch": 1604} {"train_loss": -41.786922454833984, "global_step": 194185, "epoch": 1604} {"train_loss": -42.083473205566406, "global_step": 194186, "epoch": 1604} {"train_loss": -42.748043060302734, "global_step": 194187, "epoch": 1604} {"train_loss": -42.41852569580078, "global_step": 194188, "epoch": 1604} {"train_loss": -40.86330032348633, "global_step": 194189, "epoch": 1604} {"train_loss": -40.685569763183594, "global_step": 194190, "epoch": 1604} {"train_loss": -39.583274841308594, "global_step": 194191, "epoch": 1604} {"train_loss": -37.487056732177734, "global_step": 194192, "epoch": 1604} {"train_loss": -39.46479415893555, "global_step": 194193, "epoch": 1604} {"train_loss": -36.64204025268555, "global_step": 194194, "epoch": 1604} {"train_loss": -36.69047164916992, "global_step": 194195, "epoch": 1604} {"train_loss": -33.691219329833984, "global_step": 194196, "epoch": 1604} {"train_loss": -34.79376220703125, "global_step": 194197, "epoch": 1604} {"train_loss": -39.25761795043945, "global_step": 194198, "epoch": 1604} {"train_loss": -35.88141632080078, "global_step": 194199, "epoch": 1604} {"train_loss": -31.991657257080078, "global_step": 194200, "epoch": 1604} {"train_loss": -35.5838737487793, "global_step": 194201, "epoch": 1604} {"train_loss": -35.24367904663086, "global_step": 194202, "epoch": 1604} {"train_loss": -35.68048095703125, "global_step": 194203, "epoch": 1604} {"train_loss": -40.95074965737083, "global_step": 194204, "epoch": 1604, "val_loss": 2477568.75} {"train_loss": -33.66892623901367, "global_step": 194205, "epoch": 1605} {"train_loss": -36.669612884521484, "global_step": 194206, "epoch": 1605} {"train_loss": -33.90666580200195, "global_step": 194207, "epoch": 1605} {"train_loss": -37.504207611083984, "global_step": 194208, "epoch": 1605} {"train_loss": -36.86786651611328, "global_step": 194209, "epoch": 1605} {"train_loss": -35.086830139160156, "global_step": 194210, "epoch": 1605} {"train_loss": -37.076045989990234, "global_step": 194211, "epoch": 1605} {"train_loss": -36.40922164916992, "global_step": 194212, "epoch": 1605} {"train_loss": -38.478294372558594, "global_step": 194213, "epoch": 1605} {"train_loss": -37.50945281982422, "global_step": 194214, "epoch": 1605} {"train_loss": -37.203453063964844, "global_step": 194215, "epoch": 1605} {"train_loss": -37.90847396850586, "global_step": 194216, "epoch": 1605} {"train_loss": -37.13566970825195, "global_step": 194217, "epoch": 1605} {"train_loss": -39.4325065612793, "global_step": 194218, "epoch": 1605} {"train_loss": -37.43091583251953, "global_step": 194219, "epoch": 1605} {"train_loss": -39.868934631347656, "global_step": 194220, "epoch": 1605} {"train_loss": -39.989341735839844, "global_step": 194221, "epoch": 1605} {"train_loss": -37.75020980834961, "global_step": 194222, "epoch": 1605} {"train_loss": -39.63363265991211, "global_step": 194223, "epoch": 1605} {"train_loss": -39.97561264038086, "global_step": 194224, "epoch": 1605} {"train_loss": -39.21684265136719, "global_step": 194225, "epoch": 1605} {"train_loss": -40.527183532714844, "global_step": 194226, "epoch": 1605} {"train_loss": -40.42091369628906, "global_step": 194227, "epoch": 1605} {"train_loss": -39.892303466796875, "global_step": 194228, "epoch": 1605} {"train_loss": -40.483131408691406, "global_step": 194229, "epoch": 1605} {"train_loss": -40.723060607910156, "global_step": 194230, "epoch": 1605} {"train_loss": -40.23329162597656, "global_step": 194231, "epoch": 1605} {"train_loss": -41.14718246459961, "global_step": 194232, "epoch": 1605} {"train_loss": -40.827022552490234, "global_step": 194233, "epoch": 1605} {"train_loss": -41.27070236206055, "global_step": 194234, "epoch": 1605} {"train_loss": -40.91537094116211, "global_step": 194235, "epoch": 1605} {"train_loss": -41.130218505859375, "global_step": 194236, "epoch": 1605} {"train_loss": -41.08357620239258, "global_step": 194237, "epoch": 1605} {"train_loss": -40.857627868652344, "global_step": 194238, "epoch": 1605} {"train_loss": -41.10721206665039, "global_step": 194239, "epoch": 1605} {"train_loss": -41.06144332885742, "global_step": 194240, "epoch": 1605} {"train_loss": -41.37697982788086, "global_step": 194241, "epoch": 1605} {"train_loss": -41.47905349731445, "global_step": 194242, "epoch": 1605} {"train_loss": -41.45356369018555, "global_step": 194243, "epoch": 1605} {"train_loss": -41.7190055847168, "global_step": 194244, "epoch": 1605} {"train_loss": -41.65576171875, "global_step": 194245, "epoch": 1605} {"train_loss": -41.76261901855469, "global_step": 194246, "epoch": 1605} {"train_loss": -41.584407806396484, "global_step": 194247, "epoch": 1605} {"train_loss": -41.65179443359375, "global_step": 194248, "epoch": 1605} {"train_loss": -41.87662887573242, "global_step": 194249, "epoch": 1605} {"train_loss": -41.99225997924805, "global_step": 194250, "epoch": 1605} {"train_loss": -41.95705795288086, "global_step": 194251, "epoch": 1605} {"train_loss": -41.858055114746094, "global_step": 194252, "epoch": 1605} {"train_loss": -41.799625396728516, "global_step": 194253, "epoch": 1605} {"train_loss": -41.648590087890625, "global_step": 194254, "epoch": 1605} {"train_loss": -42.10284423828125, "global_step": 194255, "epoch": 1605} {"train_loss": -41.972007751464844, "global_step": 194256, "epoch": 1605} {"train_loss": -41.889339447021484, "global_step": 194257, "epoch": 1605} {"train_loss": -42.306209564208984, "global_step": 194258, "epoch": 1605} {"train_loss": -42.1664924621582, "global_step": 194259, "epoch": 1605} {"train_loss": -42.349212646484375, "global_step": 194260, "epoch": 1605} {"train_loss": -42.44768142700195, "global_step": 194261, "epoch": 1605} {"train_loss": -42.238101959228516, "global_step": 194262, "epoch": 1605} {"train_loss": -42.252052307128906, "global_step": 194263, "epoch": 1605} {"train_loss": -42.37455368041992, "global_step": 194264, "epoch": 1605} {"train_loss": -42.23110580444336, "global_step": 194265, "epoch": 1605} {"train_loss": -42.69381332397461, "global_step": 194266, "epoch": 1605} {"train_loss": -42.63854217529297, "global_step": 194267, "epoch": 1605} {"train_loss": -42.868221282958984, "global_step": 194268, "epoch": 1605} {"train_loss": -42.32926559448242, "global_step": 194269, "epoch": 1605} {"train_loss": -42.471153259277344, "global_step": 194270, "epoch": 1605} {"train_loss": -42.452537536621094, "global_step": 194271, "epoch": 1605} {"train_loss": -42.5006217956543, "global_step": 194272, "epoch": 1605} {"train_loss": -42.844173431396484, "global_step": 194273, "epoch": 1605} {"train_loss": -42.57528305053711, "global_step": 194274, "epoch": 1605} {"train_loss": -42.673988342285156, "global_step": 194275, "epoch": 1605} {"train_loss": -42.795772552490234, "global_step": 194276, "epoch": 1605} {"train_loss": -42.155879974365234, "global_step": 194277, "epoch": 1605} {"train_loss": -42.484397888183594, "global_step": 194278, "epoch": 1605} {"train_loss": -41.80146026611328, "global_step": 194279, "epoch": 1605} {"train_loss": -41.94123458862305, "global_step": 194280, "epoch": 1605} {"train_loss": -42.492523193359375, "global_step": 194281, "epoch": 1605} {"train_loss": -42.44985580444336, "global_step": 194282, "epoch": 1605} {"train_loss": -42.6307373046875, "global_step": 194283, "epoch": 1605} {"train_loss": -42.52972412109375, "global_step": 194284, "epoch": 1605} {"train_loss": -41.077056884765625, "global_step": 194285, "epoch": 1605} {"train_loss": -37.732154846191406, "global_step": 194286, "epoch": 1605} {"train_loss": -35.78528594970703, "global_step": 194287, "epoch": 1605} {"train_loss": -37.21963882446289, "global_step": 194288, "epoch": 1605} {"train_loss": -40.76436996459961, "global_step": 194289, "epoch": 1605} {"train_loss": -42.284149169921875, "global_step": 194290, "epoch": 1605} {"train_loss": -41.26826477050781, "global_step": 194291, "epoch": 1605} {"train_loss": -40.69975662231445, "global_step": 194292, "epoch": 1605} {"train_loss": -42.20881271362305, "global_step": 194293, "epoch": 1605} {"train_loss": -42.71525192260742, "global_step": 194294, "epoch": 1605} {"train_loss": -41.92119598388672, "global_step": 194295, "epoch": 1605} {"train_loss": -40.621463775634766, "global_step": 194296, "epoch": 1605} {"train_loss": -41.6312141418457, "global_step": 194297, "epoch": 1605} {"train_loss": -42.816986083984375, "global_step": 194298, "epoch": 1605} {"train_loss": -41.41938781738281, "global_step": 194299, "epoch": 1605} {"train_loss": -41.552337646484375, "global_step": 194300, "epoch": 1605} {"train_loss": -42.00679397583008, "global_step": 194301, "epoch": 1605} {"train_loss": -40.94761657714844, "global_step": 194302, "epoch": 1605} {"train_loss": -40.46804428100586, "global_step": 194303, "epoch": 1605} {"train_loss": -42.502601623535156, "global_step": 194304, "epoch": 1605} {"train_loss": -42.19514846801758, "global_step": 194305, "epoch": 1605} {"train_loss": -41.364017486572266, "global_step": 194306, "epoch": 1605} {"train_loss": -42.08692932128906, "global_step": 194307, "epoch": 1605} {"train_loss": -40.9190788269043, "global_step": 194308, "epoch": 1605} {"train_loss": -42.198299407958984, "global_step": 194309, "epoch": 1605} {"train_loss": -41.8406982421875, "global_step": 194310, "epoch": 1605} {"train_loss": -41.1108512878418, "global_step": 194311, "epoch": 1605} {"train_loss": -41.28908920288086, "global_step": 194312, "epoch": 1605} {"train_loss": -41.46695327758789, "global_step": 194313, "epoch": 1605} {"train_loss": -42.67378234863281, "global_step": 194314, "epoch": 1605} {"train_loss": -42.15421676635742, "global_step": 194315, "epoch": 1605} {"train_loss": -41.25122833251953, "global_step": 194316, "epoch": 1605} {"train_loss": -41.732666015625, "global_step": 194317, "epoch": 1605} {"train_loss": -41.992095947265625, "global_step": 194318, "epoch": 1605} {"train_loss": -41.5073356628418, "global_step": 194319, "epoch": 1605} {"train_loss": -41.46377182006836, "global_step": 194320, "epoch": 1605} {"train_loss": -42.320838928222656, "global_step": 194321, "epoch": 1605} {"train_loss": -41.696041107177734, "global_step": 194322, "epoch": 1605} {"train_loss": -41.15650177001953, "global_step": 194323, "epoch": 1605} {"train_loss": -41.84515380859375, "global_step": 194324, "epoch": 1605} {"train_loss": -40.90619091948202, "global_step": 194325, "epoch": 1605, "val_loss": 2473239.75} {"train_loss": -42.269779205322266, "global_step": 194326, "epoch": 1606} {"train_loss": -41.70445251464844, "global_step": 194327, "epoch": 1606} {"train_loss": -41.98773193359375, "global_step": 194328, "epoch": 1606} {"train_loss": -41.627540588378906, "global_step": 194329, "epoch": 1606} {"train_loss": -41.957916259765625, "global_step": 194330, "epoch": 1606} {"train_loss": -41.933040618896484, "global_step": 194331, "epoch": 1606} {"train_loss": -42.538448333740234, "global_step": 194332, "epoch": 1606} {"train_loss": -41.47235870361328, "global_step": 194333, "epoch": 1606} {"train_loss": -42.504058837890625, "global_step": 194334, "epoch": 1606} {"train_loss": -41.950408935546875, "global_step": 194335, "epoch": 1606} {"train_loss": -42.1220817565918, "global_step": 194336, "epoch": 1606} {"train_loss": -42.5738639831543, "global_step": 194337, "epoch": 1606} {"train_loss": -41.47850036621094, "global_step": 194338, "epoch": 1606} {"train_loss": -41.8575325012207, "global_step": 194339, "epoch": 1606} {"train_loss": -42.09157180786133, "global_step": 194340, "epoch": 1606} {"train_loss": -42.090553283691406, "global_step": 194341, "epoch": 1606} {"train_loss": -42.44727325439453, "global_step": 194342, "epoch": 1606} {"train_loss": -42.20667266845703, "global_step": 194343, "epoch": 1606} {"train_loss": -41.5124626159668, "global_step": 194344, "epoch": 1606} {"train_loss": -41.6392936706543, "global_step": 194345, "epoch": 1606} {"train_loss": -42.116729736328125, "global_step": 194346, "epoch": 1606} {"train_loss": -42.25368881225586, "global_step": 194347, "epoch": 1606} {"train_loss": -42.69313049316406, "global_step": 194348, "epoch": 1606} {"train_loss": -42.05290603637695, "global_step": 194349, "epoch": 1606} {"train_loss": -41.697261810302734, "global_step": 194350, "epoch": 1606} {"train_loss": -42.101951599121094, "global_step": 194351, "epoch": 1606} {"train_loss": -42.581233978271484, "global_step": 194352, "epoch": 1606} {"train_loss": -41.976593017578125, "global_step": 194353, "epoch": 1606} {"train_loss": -42.052734375, "global_step": 194354, "epoch": 1606} {"train_loss": -42.486488342285156, "global_step": 194355, "epoch": 1606} {"train_loss": -41.829471588134766, "global_step": 194356, "epoch": 1606} {"train_loss": -41.80124282836914, "global_step": 194357, "epoch": 1606} {"train_loss": -41.476104736328125, "global_step": 194358, "epoch": 1606} {"train_loss": -42.38904571533203, "global_step": 194359, "epoch": 1606} {"train_loss": -41.42877960205078, "global_step": 194360, "epoch": 1606} {"train_loss": -37.4630241394043, "global_step": 194361, "epoch": 1606} {"train_loss": -40.9063835144043, "global_step": 194362, "epoch": 1606} {"train_loss": -39.805023193359375, "global_step": 194363, "epoch": 1606} {"train_loss": -39.359046936035156, "global_step": 194364, "epoch": 1606} {"train_loss": -39.716773986816406, "global_step": 194365, "epoch": 1606} {"train_loss": -37.80330276489258, "global_step": 194366, "epoch": 1606} {"train_loss": -41.81471633911133, "global_step": 194367, "epoch": 1606} {"train_loss": -41.17707824707031, "global_step": 194368, "epoch": 1606} {"train_loss": -39.87236785888672, "global_step": 194369, "epoch": 1606} {"train_loss": -41.6174430847168, "global_step": 194370, "epoch": 1606} {"train_loss": -41.97726058959961, "global_step": 194371, "epoch": 1606} {"train_loss": -40.54698944091797, "global_step": 194372, "epoch": 1606} {"train_loss": -41.035316467285156, "global_step": 194373, "epoch": 1606} {"train_loss": -42.3055305480957, "global_step": 194374, "epoch": 1606} {"train_loss": -40.677364349365234, "global_step": 194375, "epoch": 1606} {"train_loss": -42.3950080871582, "global_step": 194376, "epoch": 1606} {"train_loss": -41.494415283203125, "global_step": 194377, "epoch": 1606} {"train_loss": -41.28609085083008, "global_step": 194378, "epoch": 1606} {"train_loss": -41.51976776123047, "global_step": 194379, "epoch": 1606} {"train_loss": -41.94761276245117, "global_step": 194380, "epoch": 1606} {"train_loss": -41.40193176269531, "global_step": 194381, "epoch": 1606} {"train_loss": -42.051795959472656, "global_step": 194382, "epoch": 1606} {"train_loss": -40.98714828491211, "global_step": 194383, "epoch": 1606} {"train_loss": -42.580562591552734, "global_step": 194384, "epoch": 1606} {"train_loss": -41.51099395751953, "global_step": 194385, "epoch": 1606} {"train_loss": -42.33796310424805, "global_step": 194386, "epoch": 1606} {"train_loss": -41.48429489135742, "global_step": 194387, "epoch": 1606} {"train_loss": -41.953548431396484, "global_step": 194388, "epoch": 1606} {"train_loss": -42.06531524658203, "global_step": 194389, "epoch": 1606} {"train_loss": -41.49467849731445, "global_step": 194390, "epoch": 1606} {"train_loss": -42.14655303955078, "global_step": 194391, "epoch": 1606} {"train_loss": -42.15609359741211, "global_step": 194392, "epoch": 1606} {"train_loss": -42.426734924316406, "global_step": 194393, "epoch": 1606} {"train_loss": -41.69686508178711, "global_step": 194394, "epoch": 1606} {"train_loss": -42.465904235839844, "global_step": 194395, "epoch": 1606} {"train_loss": -42.38767623901367, "global_step": 194396, "epoch": 1606} {"train_loss": -42.4188346862793, "global_step": 194397, "epoch": 1606} {"train_loss": -42.701751708984375, "global_step": 194398, "epoch": 1606} {"train_loss": -42.6718635559082, "global_step": 194399, "epoch": 1606} {"train_loss": -42.8685417175293, "global_step": 194400, "epoch": 1606} {"train_loss": -41.990821838378906, "global_step": 194401, "epoch": 1606} {"train_loss": -40.89005661010742, "global_step": 194402, "epoch": 1606} {"train_loss": -42.592315673828125, "global_step": 194403, "epoch": 1606} {"train_loss": -39.631935119628906, "global_step": 194404, "epoch": 1606} {"train_loss": -41.439083099365234, "global_step": 194405, "epoch": 1606} {"train_loss": -40.58591842651367, "global_step": 194406, "epoch": 1606} {"train_loss": -38.33195877075195, "global_step": 194407, "epoch": 1606} {"train_loss": -41.844295501708984, "global_step": 194408, "epoch": 1606} {"train_loss": -40.29191207885742, "global_step": 194409, "epoch": 1606} {"train_loss": -42.002986907958984, "global_step": 194410, "epoch": 1606} {"train_loss": -40.511592864990234, "global_step": 194411, "epoch": 1606} {"train_loss": -42.848812103271484, "global_step": 194412, "epoch": 1606} {"train_loss": -40.763275146484375, "global_step": 194413, "epoch": 1606} {"train_loss": -42.08576202392578, "global_step": 194414, "epoch": 1606} {"train_loss": -41.61863708496094, "global_step": 194415, "epoch": 1606} {"train_loss": -42.484798431396484, "global_step": 194416, "epoch": 1606} {"train_loss": -42.2347526550293, "global_step": 194417, "epoch": 1606} {"train_loss": -42.235347747802734, "global_step": 194418, "epoch": 1606} {"train_loss": -41.78125762939453, "global_step": 194419, "epoch": 1606} {"train_loss": -42.852787017822266, "global_step": 194420, "epoch": 1606} {"train_loss": -41.72258758544922, "global_step": 194421, "epoch": 1606} {"train_loss": -41.61143112182617, "global_step": 194422, "epoch": 1606} {"train_loss": -41.98907470703125, "global_step": 194423, "epoch": 1606} {"train_loss": -41.40005111694336, "global_step": 194424, "epoch": 1606} {"train_loss": -41.289825439453125, "global_step": 194425, "epoch": 1606} {"train_loss": -42.116695404052734, "global_step": 194426, "epoch": 1606} {"train_loss": -42.54275894165039, "global_step": 194427, "epoch": 1606} {"train_loss": -41.39727783203125, "global_step": 194428, "epoch": 1606} {"train_loss": -42.622676849365234, "global_step": 194429, "epoch": 1606} {"train_loss": -42.06675338745117, "global_step": 194430, "epoch": 1606} {"train_loss": -42.2974739074707, "global_step": 194431, "epoch": 1606} {"train_loss": -42.119903564453125, "global_step": 194432, "epoch": 1606} {"train_loss": -43.175594329833984, "global_step": 194433, "epoch": 1606} {"train_loss": -42.033382415771484, "global_step": 194434, "epoch": 1606} {"train_loss": -42.88731002807617, "global_step": 194435, "epoch": 1606} {"train_loss": -42.48922348022461, "global_step": 194436, "epoch": 1606} {"train_loss": -42.784481048583984, "global_step": 194437, "epoch": 1606} {"train_loss": -42.7697639465332, "global_step": 194438, "epoch": 1606} {"train_loss": -43.1536865234375, "global_step": 194439, "epoch": 1606} {"train_loss": -43.26070785522461, "global_step": 194440, "epoch": 1606} {"train_loss": -43.0580940246582, "global_step": 194441, "epoch": 1606} {"train_loss": -42.87897872924805, "global_step": 194442, "epoch": 1606} {"train_loss": -42.79801940917969, "global_step": 194443, "epoch": 1606} {"train_loss": -43.482784271240234, "global_step": 194444, "epoch": 1606} {"train_loss": -43.33881378173828, "global_step": 194445, "epoch": 1606} {"train_loss": -41.82628905871683, "global_step": 194446, "epoch": 1606, "val_loss": 2531946.75} {"train_loss": -42.73780059814453, "global_step": 194447, "epoch": 1607} {"train_loss": -42.5037956237793, "global_step": 194448, "epoch": 1607} {"train_loss": -42.56145477294922, "global_step": 194449, "epoch": 1607} {"train_loss": -41.77125930786133, "global_step": 194450, "epoch": 1607} {"train_loss": -43.066131591796875, "global_step": 194451, "epoch": 1607} {"train_loss": -42.76862335205078, "global_step": 194452, "epoch": 1607} {"train_loss": -40.84852981567383, "global_step": 194453, "epoch": 1607} {"train_loss": -39.575069427490234, "global_step": 194454, "epoch": 1607} {"train_loss": -36.8916015625, "global_step": 194455, "epoch": 1607} {"train_loss": -40.9068489074707, "global_step": 194456, "epoch": 1607} {"train_loss": -39.9926872253418, "global_step": 194457, "epoch": 1607} {"train_loss": -36.018524169921875, "global_step": 194458, "epoch": 1607} {"train_loss": -39.87363052368164, "global_step": 194459, "epoch": 1607} {"train_loss": -35.769283294677734, "global_step": 194460, "epoch": 1607} {"train_loss": -35.69219207763672, "global_step": 194461, "epoch": 1607} {"train_loss": -36.79191207885742, "global_step": 194462, "epoch": 1607} {"train_loss": -38.02621078491211, "global_step": 194463, "epoch": 1607} {"train_loss": -39.720558166503906, "global_step": 194464, "epoch": 1607} {"train_loss": -37.07509994506836, "global_step": 194465, "epoch": 1607} {"train_loss": -36.3465576171875, "global_step": 194466, "epoch": 1607} {"train_loss": -38.04716873168945, "global_step": 194467, "epoch": 1607} {"train_loss": -35.13426208496094, "global_step": 194468, "epoch": 1607} {"train_loss": -36.46266174316406, "global_step": 194469, "epoch": 1607} {"train_loss": -38.39333724975586, "global_step": 194470, "epoch": 1607} {"train_loss": -37.64763641357422, "global_step": 194471, "epoch": 1607} {"train_loss": -38.36330795288086, "global_step": 194472, "epoch": 1607} {"train_loss": -38.95321273803711, "global_step": 194473, "epoch": 1607} {"train_loss": -40.21657943725586, "global_step": 194474, "epoch": 1607} {"train_loss": -40.496681213378906, "global_step": 194475, "epoch": 1607} {"train_loss": -40.083003997802734, "global_step": 194476, "epoch": 1607} {"train_loss": -39.88161849975586, "global_step": 194477, "epoch": 1607} {"train_loss": -40.59429931640625, "global_step": 194478, "epoch": 1607} {"train_loss": -40.40107345581055, "global_step": 194479, "epoch": 1607} {"train_loss": -40.80074691772461, "global_step": 194480, "epoch": 1607} {"train_loss": -40.889808654785156, "global_step": 194481, "epoch": 1607} {"train_loss": -40.90810775756836, "global_step": 194482, "epoch": 1607} {"train_loss": -40.72162628173828, "global_step": 194483, "epoch": 1607} {"train_loss": -40.133270263671875, "global_step": 194484, "epoch": 1607} {"train_loss": -41.38838577270508, "global_step": 194485, "epoch": 1607} {"train_loss": -40.742855072021484, "global_step": 194486, "epoch": 1607} {"train_loss": -40.856834411621094, "global_step": 194487, "epoch": 1607} {"train_loss": -41.159767150878906, "global_step": 194488, "epoch": 1607} {"train_loss": -41.94098663330078, "global_step": 194489, "epoch": 1607} {"train_loss": -41.459693908691406, "global_step": 194490, "epoch": 1607} {"train_loss": -41.99272537231445, "global_step": 194491, "epoch": 1607} {"train_loss": -41.53891372680664, "global_step": 194492, "epoch": 1607} {"train_loss": -41.6392822265625, "global_step": 194493, "epoch": 1607} {"train_loss": -42.23752212524414, "global_step": 194494, "epoch": 1607} {"train_loss": -41.783321380615234, "global_step": 194495, "epoch": 1607} {"train_loss": -41.84138107299805, "global_step": 194496, "epoch": 1607} {"train_loss": -41.30738830566406, "global_step": 194497, "epoch": 1607} {"train_loss": -41.761962890625, "global_step": 194498, "epoch": 1607} {"train_loss": -41.446449279785156, "global_step": 194499, "epoch": 1607} {"train_loss": -42.23432159423828, "global_step": 194500, "epoch": 1607} {"train_loss": -41.53745651245117, "global_step": 194501, "epoch": 1607} {"train_loss": -41.504886627197266, "global_step": 194502, "epoch": 1607} {"train_loss": -42.056190490722656, "global_step": 194503, "epoch": 1607} {"train_loss": -41.970699310302734, "global_step": 194504, "epoch": 1607} {"train_loss": -41.93342208862305, "global_step": 194505, "epoch": 1607} {"train_loss": -41.932647705078125, "global_step": 194506, "epoch": 1607} {"train_loss": -41.491676330566406, "global_step": 194507, "epoch": 1607} {"train_loss": -42.1561164855957, "global_step": 194508, "epoch": 1607} {"train_loss": -41.793487548828125, "global_step": 194509, "epoch": 1607} {"train_loss": -41.57242965698242, "global_step": 194510, "epoch": 1607} {"train_loss": -41.39356231689453, "global_step": 194511, "epoch": 1607} {"train_loss": -42.07710647583008, "global_step": 194512, "epoch": 1607} {"train_loss": -42.21677780151367, "global_step": 194513, "epoch": 1607} {"train_loss": -42.442623138427734, "global_step": 194514, "epoch": 1607} {"train_loss": -42.41597366333008, "global_step": 194515, "epoch": 1607} {"train_loss": -42.32890701293945, "global_step": 194516, "epoch": 1607} {"train_loss": -42.10427474975586, "global_step": 194517, "epoch": 1607} {"train_loss": -42.456478118896484, "global_step": 194518, "epoch": 1607} {"train_loss": -42.8541374206543, "global_step": 194519, "epoch": 1607} {"train_loss": -42.508235931396484, "global_step": 194520, "epoch": 1607} {"train_loss": -42.258201599121094, "global_step": 194521, "epoch": 1607} {"train_loss": -42.37754440307617, "global_step": 194522, "epoch": 1607} {"train_loss": -42.651893615722656, "global_step": 194523, "epoch": 1607} {"train_loss": -42.079837799072266, "global_step": 194524, "epoch": 1607} {"train_loss": -42.78988265991211, "global_step": 194525, "epoch": 1607} {"train_loss": -42.0466194152832, "global_step": 194526, "epoch": 1607} {"train_loss": -42.30476760864258, "global_step": 194527, "epoch": 1607} {"train_loss": -41.88962936401367, "global_step": 194528, "epoch": 1607} {"train_loss": -40.91334915161133, "global_step": 194529, "epoch": 1607} {"train_loss": -41.245059967041016, "global_step": 194530, "epoch": 1607} {"train_loss": -42.0792350769043, "global_step": 194531, "epoch": 1607} {"train_loss": -41.992584228515625, "global_step": 194532, "epoch": 1607} {"train_loss": -41.93080520629883, "global_step": 194533, "epoch": 1607} {"train_loss": -41.99094772338867, "global_step": 194534, "epoch": 1607} {"train_loss": -42.626258850097656, "global_step": 194535, "epoch": 1607} {"train_loss": -42.32966995239258, "global_step": 194536, "epoch": 1607} {"train_loss": -42.067378997802734, "global_step": 194537, "epoch": 1607} {"train_loss": -43.11769485473633, "global_step": 194538, "epoch": 1607} {"train_loss": -42.302982330322266, "global_step": 194539, "epoch": 1607} {"train_loss": -41.82390594482422, "global_step": 194540, "epoch": 1607} {"train_loss": -42.65460968017578, "global_step": 194541, "epoch": 1607} {"train_loss": -42.85421371459961, "global_step": 194542, "epoch": 1607} {"train_loss": -42.223052978515625, "global_step": 194543, "epoch": 1607} {"train_loss": -42.452205657958984, "global_step": 194544, "epoch": 1607} {"train_loss": -42.39609146118164, "global_step": 194545, "epoch": 1607} {"train_loss": -42.43148422241211, "global_step": 194546, "epoch": 1607} {"train_loss": -43.06441116333008, "global_step": 194547, "epoch": 1607} {"train_loss": -42.69480514526367, "global_step": 194548, "epoch": 1607} {"train_loss": -42.53513717651367, "global_step": 194549, "epoch": 1607} {"train_loss": -42.6531982421875, "global_step": 194550, "epoch": 1607} {"train_loss": -43.381614685058594, "global_step": 194551, "epoch": 1607} {"train_loss": -42.83582305908203, "global_step": 194552, "epoch": 1607} {"train_loss": -42.3481559753418, "global_step": 194553, "epoch": 1607} {"train_loss": -42.10734176635742, "global_step": 194554, "epoch": 1607} {"train_loss": -41.861427307128906, "global_step": 194555, "epoch": 1607} {"train_loss": -41.46925735473633, "global_step": 194556, "epoch": 1607} {"train_loss": -41.0681037902832, "global_step": 194557, "epoch": 1607} {"train_loss": -41.26268768310547, "global_step": 194558, "epoch": 1607} {"train_loss": -40.905792236328125, "global_step": 194559, "epoch": 1607} {"train_loss": -40.83119583129883, "global_step": 194560, "epoch": 1607} {"train_loss": -40.15235137939453, "global_step": 194561, "epoch": 1607} {"train_loss": -40.07529830932617, "global_step": 194562, "epoch": 1607} {"train_loss": -42.44401931762695, "global_step": 194563, "epoch": 1607} {"train_loss": -41.68095016479492, "global_step": 194564, "epoch": 1607} {"train_loss": -40.082820892333984, "global_step": 194565, "epoch": 1607} {"train_loss": -42.10525131225586, "global_step": 194566, "epoch": 1607} {"train_loss": -41.14123437424337, "global_step": 194567, "epoch": 1607, "val_loss": 2564703.0} {"train_loss": -39.4953727722168, "global_step": 194568, "epoch": 1608} {"train_loss": -39.978328704833984, "global_step": 194569, "epoch": 1608} {"train_loss": -42.556068420410156, "global_step": 194570, "epoch": 1608} {"train_loss": -40.05178451538086, "global_step": 194571, "epoch": 1608} {"train_loss": -38.4030876159668, "global_step": 194572, "epoch": 1608} {"train_loss": -42.41941452026367, "global_step": 194573, "epoch": 1608} {"train_loss": -37.55644607543945, "global_step": 194574, "epoch": 1608} {"train_loss": -42.25635528564453, "global_step": 194575, "epoch": 1608} {"train_loss": -39.916378021240234, "global_step": 194576, "epoch": 1608} {"train_loss": -39.05315399169922, "global_step": 194577, "epoch": 1608} {"train_loss": -42.29290008544922, "global_step": 194578, "epoch": 1608} {"train_loss": -39.17429733276367, "global_step": 194579, "epoch": 1608} {"train_loss": -42.158138275146484, "global_step": 194580, "epoch": 1608} {"train_loss": -39.099857330322266, "global_step": 194581, "epoch": 1608} {"train_loss": -41.95671463012695, "global_step": 194582, "epoch": 1608} {"train_loss": -40.43428421020508, "global_step": 194583, "epoch": 1608} {"train_loss": -41.890804290771484, "global_step": 194584, "epoch": 1608} {"train_loss": -41.80412673950195, "global_step": 194585, "epoch": 1608} {"train_loss": -42.13316345214844, "global_step": 194586, "epoch": 1608} {"train_loss": -41.76651382446289, "global_step": 194587, "epoch": 1608} {"train_loss": -41.8365364074707, "global_step": 194588, "epoch": 1608} {"train_loss": -41.75822830200195, "global_step": 194589, "epoch": 1608} {"train_loss": -42.1285514831543, "global_step": 194590, "epoch": 1608} {"train_loss": -42.434329986572266, "global_step": 194591, "epoch": 1608} {"train_loss": -42.555816650390625, "global_step": 194592, "epoch": 1608} {"train_loss": -42.65925598144531, "global_step": 194593, "epoch": 1608} {"train_loss": -42.27634811401367, "global_step": 194594, "epoch": 1608} {"train_loss": -42.163909912109375, "global_step": 194595, "epoch": 1608} {"train_loss": -42.16265869140625, "global_step": 194596, "epoch": 1608} {"train_loss": -42.42228698730469, "global_step": 194597, "epoch": 1608} {"train_loss": -42.55531692504883, "global_step": 194598, "epoch": 1608} {"train_loss": -42.72263717651367, "global_step": 194599, "epoch": 1608} {"train_loss": -42.59013748168945, "global_step": 194600, "epoch": 1608} {"train_loss": -42.97019577026367, "global_step": 194601, "epoch": 1608} {"train_loss": -42.55010986328125, "global_step": 194602, "epoch": 1608} {"train_loss": -42.531463623046875, "global_step": 194603, "epoch": 1608} {"train_loss": -43.121253967285156, "global_step": 194604, "epoch": 1608} {"train_loss": -42.65139389038086, "global_step": 194605, "epoch": 1608} {"train_loss": -42.56147384643555, "global_step": 194606, "epoch": 1608} {"train_loss": -41.83529281616211, "global_step": 194607, "epoch": 1608} {"train_loss": -43.025753021240234, "global_step": 194608, "epoch": 1608} {"train_loss": -42.77602767944336, "global_step": 194609, "epoch": 1608} {"train_loss": -42.804901123046875, "global_step": 194610, "epoch": 1608} {"train_loss": -42.82454299926758, "global_step": 194611, "epoch": 1608} {"train_loss": -43.127010345458984, "global_step": 194612, "epoch": 1608} {"train_loss": -42.86906814575195, "global_step": 194613, "epoch": 1608} {"train_loss": -42.20002746582031, "global_step": 194614, "epoch": 1608} {"train_loss": -42.80695343017578, "global_step": 194615, "epoch": 1608} {"train_loss": -42.5801887512207, "global_step": 194616, "epoch": 1608} {"train_loss": -42.92704391479492, "global_step": 194617, "epoch": 1608} {"train_loss": -42.64779281616211, "global_step": 194618, "epoch": 1608} {"train_loss": -42.83015060424805, "global_step": 194619, "epoch": 1608} {"train_loss": -42.57855224609375, "global_step": 194620, "epoch": 1608} {"train_loss": -42.44288635253906, "global_step": 194621, "epoch": 1608} {"train_loss": -43.17078399658203, "global_step": 194622, "epoch": 1608} {"train_loss": -42.733036041259766, "global_step": 194623, "epoch": 1608} {"train_loss": -41.992008209228516, "global_step": 194624, "epoch": 1608} {"train_loss": -42.60099411010742, "global_step": 194625, "epoch": 1608} {"train_loss": -42.8215446472168, "global_step": 194626, "epoch": 1608} {"train_loss": -43.23472213745117, "global_step": 194627, "epoch": 1608} {"train_loss": -42.550167083740234, "global_step": 194628, "epoch": 1608} {"train_loss": -42.12644958496094, "global_step": 194629, "epoch": 1608} {"train_loss": -42.979305267333984, "global_step": 194630, "epoch": 1608} {"train_loss": -42.48967361450195, "global_step": 194631, "epoch": 1608} {"train_loss": -41.09658432006836, "global_step": 194632, "epoch": 1608} {"train_loss": -42.86845397949219, "global_step": 194633, "epoch": 1608} {"train_loss": -42.022823333740234, "global_step": 194634, "epoch": 1608} {"train_loss": -41.705257415771484, "global_step": 194635, "epoch": 1608} {"train_loss": -40.197486877441406, "global_step": 194636, "epoch": 1608} {"train_loss": -42.097137451171875, "global_step": 194637, "epoch": 1608} {"train_loss": -41.83114242553711, "global_step": 194638, "epoch": 1608} {"train_loss": -40.585792541503906, "global_step": 194639, "epoch": 1608} {"train_loss": -41.77669906616211, "global_step": 194640, "epoch": 1608} {"train_loss": -42.75057601928711, "global_step": 194641, "epoch": 1608} {"train_loss": -42.081512451171875, "global_step": 194642, "epoch": 1608} {"train_loss": -42.197750091552734, "global_step": 194643, "epoch": 1608} {"train_loss": -43.028419494628906, "global_step": 194644, "epoch": 1608} {"train_loss": -42.60555648803711, "global_step": 194645, "epoch": 1608} {"train_loss": -42.28354263305664, "global_step": 194646, "epoch": 1608} {"train_loss": -42.86506652832031, "global_step": 194647, "epoch": 1608} {"train_loss": -42.20633316040039, "global_step": 194648, "epoch": 1608} {"train_loss": -43.2064208984375, "global_step": 194649, "epoch": 1608} {"train_loss": -42.97918701171875, "global_step": 194650, "epoch": 1608} {"train_loss": -42.6080436706543, "global_step": 194651, "epoch": 1608} {"train_loss": -42.69321823120117, "global_step": 194652, "epoch": 1608} {"train_loss": -42.939491271972656, "global_step": 194653, "epoch": 1608} {"train_loss": -42.911285400390625, "global_step": 194654, "epoch": 1608} {"train_loss": -43.4718017578125, "global_step": 194655, "epoch": 1608} {"train_loss": -43.14590835571289, "global_step": 194656, "epoch": 1608} {"train_loss": -42.9968376159668, "global_step": 194657, "epoch": 1608} {"train_loss": -43.10957336425781, "global_step": 194658, "epoch": 1608} {"train_loss": -43.25361251831055, "global_step": 194659, "epoch": 1608} {"train_loss": -42.46286392211914, "global_step": 194660, "epoch": 1608} {"train_loss": -42.89323043823242, "global_step": 194661, "epoch": 1608} {"train_loss": -42.744293212890625, "global_step": 194662, "epoch": 1608} {"train_loss": -41.84975814819336, "global_step": 194663, "epoch": 1608} {"train_loss": -42.26666259765625, "global_step": 194664, "epoch": 1608} {"train_loss": -41.541072845458984, "global_step": 194665, "epoch": 1608} {"train_loss": -40.51365280151367, "global_step": 194666, "epoch": 1608} {"train_loss": -40.55391311645508, "global_step": 194667, "epoch": 1608} {"train_loss": -41.82157516479492, "global_step": 194668, "epoch": 1608} {"train_loss": -42.626155853271484, "global_step": 194669, "epoch": 1608} {"train_loss": -42.91657638549805, "global_step": 194670, "epoch": 1608} {"train_loss": -42.86945343017578, "global_step": 194671, "epoch": 1608} {"train_loss": -42.74900436401367, "global_step": 194672, "epoch": 1608} {"train_loss": -42.7098388671875, "global_step": 194673, "epoch": 1608} {"train_loss": -42.79352951049805, "global_step": 194674, "epoch": 1608} {"train_loss": -42.91960525512695, "global_step": 194675, "epoch": 1608} {"train_loss": -43.08771896362305, "global_step": 194676, "epoch": 1608} {"train_loss": -43.14263916015625, "global_step": 194677, "epoch": 1608} {"train_loss": -42.40074920654297, "global_step": 194678, "epoch": 1608} {"train_loss": -42.3268928527832, "global_step": 194679, "epoch": 1608} {"train_loss": -41.440181732177734, "global_step": 194680, "epoch": 1608} {"train_loss": -41.240631103515625, "global_step": 194681, "epoch": 1608} {"train_loss": -42.68046188354492, "global_step": 194682, "epoch": 1608} {"train_loss": -42.55107879638672, "global_step": 194683, "epoch": 1608} {"train_loss": -41.845619201660156, "global_step": 194684, "epoch": 1608} {"train_loss": -41.381813049316406, "global_step": 194685, "epoch": 1608} {"train_loss": -40.32215881347656, "global_step": 194686, "epoch": 1608} {"train_loss": -40.84529495239258, "global_step": 194687, "epoch": 1608} {"train_loss": -42.11468036115662, "global_step": 194688, "epoch": 1608, "val_loss": 2468325.25} {"train_loss": -40.678672790527344, "global_step": 194689, "epoch": 1609} {"train_loss": -39.58490753173828, "global_step": 194690, "epoch": 1609} {"train_loss": -40.20927810668945, "global_step": 194691, "epoch": 1609} {"train_loss": -40.797542572021484, "global_step": 194692, "epoch": 1609} {"train_loss": -36.89695739746094, "global_step": 194693, "epoch": 1609} {"train_loss": -39.512306213378906, "global_step": 194694, "epoch": 1609} {"train_loss": -39.96727752685547, "global_step": 194695, "epoch": 1609} {"train_loss": -32.762935638427734, "global_step": 194696, "epoch": 1609} {"train_loss": -32.73920822143555, "global_step": 194697, "epoch": 1609} {"train_loss": -33.3924446105957, "global_step": 194698, "epoch": 1609} {"train_loss": -29.694116592407227, "global_step": 194699, "epoch": 1609} {"train_loss": -37.19135665893555, "global_step": 194700, "epoch": 1609} {"train_loss": -35.891143798828125, "global_step": 194701, "epoch": 1609} {"train_loss": -34.54820251464844, "global_step": 194702, "epoch": 1609} {"train_loss": -36.245357513427734, "global_step": 194703, "epoch": 1609} {"train_loss": -34.95002365112305, "global_step": 194704, "epoch": 1609} {"train_loss": -35.130455017089844, "global_step": 194705, "epoch": 1609} {"train_loss": -37.85882568359375, "global_step": 194706, "epoch": 1609} {"train_loss": -34.774295806884766, "global_step": 194707, "epoch": 1609} {"train_loss": -37.708797454833984, "global_step": 194708, "epoch": 1609} {"train_loss": -35.35325622558594, "global_step": 194709, "epoch": 1609} {"train_loss": -37.84737777709961, "global_step": 194710, "epoch": 1609} {"train_loss": -36.772884368896484, "global_step": 194711, "epoch": 1609} {"train_loss": -38.72639083862305, "global_step": 194712, "epoch": 1609} {"train_loss": -38.11857986450195, "global_step": 194713, "epoch": 1609} {"train_loss": -37.74325942993164, "global_step": 194714, "epoch": 1609} {"train_loss": -39.78235626220703, "global_step": 194715, "epoch": 1609} {"train_loss": -37.60124588012695, "global_step": 194716, "epoch": 1609} {"train_loss": -39.66053009033203, "global_step": 194717, "epoch": 1609} {"train_loss": -34.96412658691406, "global_step": 194718, "epoch": 1609} {"train_loss": -39.06759262084961, "global_step": 194719, "epoch": 1609} {"train_loss": -35.776302337646484, "global_step": 194720, "epoch": 1609} {"train_loss": -38.88847732543945, "global_step": 194721, "epoch": 1609} {"train_loss": -40.0233268737793, "global_step": 194722, "epoch": 1609} {"train_loss": -39.562252044677734, "global_step": 194723, "epoch": 1609} {"train_loss": -38.57273864746094, "global_step": 194724, "epoch": 1609} {"train_loss": -39.82183837890625, "global_step": 194725, "epoch": 1609} {"train_loss": -38.9739990234375, "global_step": 194726, "epoch": 1609} {"train_loss": -39.67938232421875, "global_step": 194727, "epoch": 1609} {"train_loss": -39.52946853637695, "global_step": 194728, "epoch": 1609} {"train_loss": -38.39296340942383, "global_step": 194729, "epoch": 1609} {"train_loss": -40.19758605957031, "global_step": 194730, "epoch": 1609} {"train_loss": -39.86552810668945, "global_step": 194731, "epoch": 1609} {"train_loss": -40.00404739379883, "global_step": 194732, "epoch": 1609} {"train_loss": -39.44181442260742, "global_step": 194733, "epoch": 1609} {"train_loss": -39.74561309814453, "global_step": 194734, "epoch": 1609} {"train_loss": -39.85911560058594, "global_step": 194735, "epoch": 1609} {"train_loss": -40.166683197021484, "global_step": 194736, "epoch": 1609} {"train_loss": -40.754844665527344, "global_step": 194737, "epoch": 1609} {"train_loss": -40.3946533203125, "global_step": 194738, "epoch": 1609} {"train_loss": -40.650543212890625, "global_step": 194739, "epoch": 1609} {"train_loss": -39.74073791503906, "global_step": 194740, "epoch": 1609} {"train_loss": -40.55542755126953, "global_step": 194741, "epoch": 1609} {"train_loss": -40.62862777709961, "global_step": 194742, "epoch": 1609} {"train_loss": -40.77751922607422, "global_step": 194743, "epoch": 1609} {"train_loss": -41.01832580566406, "global_step": 194744, "epoch": 1609} {"train_loss": -40.78867721557617, "global_step": 194745, "epoch": 1609} {"train_loss": -40.982383728027344, "global_step": 194746, "epoch": 1609} {"train_loss": -41.24502182006836, "global_step": 194747, "epoch": 1609} {"train_loss": -40.49582290649414, "global_step": 194748, "epoch": 1609} {"train_loss": -41.06504440307617, "global_step": 194749, "epoch": 1609} {"train_loss": -40.384456634521484, "global_step": 194750, "epoch": 1609} {"train_loss": -41.071353912353516, "global_step": 194751, "epoch": 1609} {"train_loss": -41.13633346557617, "global_step": 194752, "epoch": 1609} {"train_loss": -41.63477325439453, "global_step": 194753, "epoch": 1609} {"train_loss": -40.958919525146484, "global_step": 194754, "epoch": 1609} {"train_loss": -40.454341888427734, "global_step": 194755, "epoch": 1609} {"train_loss": -40.930397033691406, "global_step": 194756, "epoch": 1609} {"train_loss": -41.374263763427734, "global_step": 194757, "epoch": 1609} {"train_loss": -41.041439056396484, "global_step": 194758, "epoch": 1609} {"train_loss": -41.64491653442383, "global_step": 194759, "epoch": 1609} {"train_loss": -41.91727828979492, "global_step": 194760, "epoch": 1609} {"train_loss": -41.79427719116211, "global_step": 194761, "epoch": 1609} {"train_loss": -41.781044006347656, "global_step": 194762, "epoch": 1609} {"train_loss": -41.249935150146484, "global_step": 194763, "epoch": 1609} {"train_loss": -41.9753303527832, "global_step": 194764, "epoch": 1609} {"train_loss": -42.245967864990234, "global_step": 194765, "epoch": 1609} {"train_loss": -42.202449798583984, "global_step": 194766, "epoch": 1609} {"train_loss": -41.87811279296875, "global_step": 194767, "epoch": 1609} {"train_loss": -42.0977783203125, "global_step": 194768, "epoch": 1609} {"train_loss": -41.68636703491211, "global_step": 194769, "epoch": 1609} {"train_loss": -41.4001350402832, "global_step": 194770, "epoch": 1609} {"train_loss": -42.43008041381836, "global_step": 194771, "epoch": 1609} {"train_loss": -42.141807556152344, "global_step": 194772, "epoch": 1609} {"train_loss": -42.43197250366211, "global_step": 194773, "epoch": 1609} {"train_loss": -42.28247833251953, "global_step": 194774, "epoch": 1609} {"train_loss": -42.34025955200195, "global_step": 194775, "epoch": 1609} {"train_loss": -42.58134841918945, "global_step": 194776, "epoch": 1609} {"train_loss": -42.170814514160156, "global_step": 194777, "epoch": 1609} {"train_loss": -41.990638732910156, "global_step": 194778, "epoch": 1609} {"train_loss": -42.53094482421875, "global_step": 194779, "epoch": 1609} {"train_loss": -42.37382888793945, "global_step": 194780, "epoch": 1609} {"train_loss": -41.64881896972656, "global_step": 194781, "epoch": 1609} {"train_loss": -43.0826416015625, "global_step": 194782, "epoch": 1609} {"train_loss": -42.223751068115234, "global_step": 194783, "epoch": 1609} {"train_loss": -42.336151123046875, "global_step": 194784, "epoch": 1609} {"train_loss": -42.75629425048828, "global_step": 194785, "epoch": 1609} {"train_loss": -42.88434600830078, "global_step": 194786, "epoch": 1609} {"train_loss": -43.02976608276367, "global_step": 194787, "epoch": 1609} {"train_loss": -42.80202865600586, "global_step": 194788, "epoch": 1609} {"train_loss": -42.39344787597656, "global_step": 194789, "epoch": 1609} {"train_loss": -42.58849334716797, "global_step": 194790, "epoch": 1609} {"train_loss": -42.69941329956055, "global_step": 194791, "epoch": 1609} {"train_loss": -42.394893646240234, "global_step": 194792, "epoch": 1609} {"train_loss": -42.95164489746094, "global_step": 194793, "epoch": 1609} {"train_loss": -42.66087341308594, "global_step": 194794, "epoch": 1609} {"train_loss": -42.69367599487305, "global_step": 194795, "epoch": 1609} {"train_loss": -42.90187072753906, "global_step": 194796, "epoch": 1609} {"train_loss": -42.813323974609375, "global_step": 194797, "epoch": 1609} {"train_loss": -43.1613883972168, "global_step": 194798, "epoch": 1609} {"train_loss": -42.496063232421875, "global_step": 194799, "epoch": 1609} {"train_loss": -43.362152099609375, "global_step": 194800, "epoch": 1609} {"train_loss": -43.24421310424805, "global_step": 194801, "epoch": 1609} {"train_loss": -43.34878158569336, "global_step": 194802, "epoch": 1609} {"train_loss": -43.05317306518555, "global_step": 194803, "epoch": 1609} {"train_loss": -43.124515533447266, "global_step": 194804, "epoch": 1609} {"train_loss": -42.75466537475586, "global_step": 194805, "epoch": 1609} {"train_loss": -43.131771087646484, "global_step": 194806, "epoch": 1609} {"train_loss": -43.42564392089844, "global_step": 194807, "epoch": 1609} {"train_loss": -43.30244064331055, "global_step": 194808, "epoch": 1609} {"train_loss": -40.32648447525403, "global_step": 194809, "epoch": 1609, "val_loss": 2559173.75} {"train_loss": -42.57465362548828, "global_step": 194810, "epoch": 1610} {"train_loss": -42.17599105834961, "global_step": 194811, "epoch": 1610} {"train_loss": -42.087135314941406, "global_step": 194812, "epoch": 1610} {"train_loss": -43.11558151245117, "global_step": 194813, "epoch": 1610} {"train_loss": -43.33492660522461, "global_step": 194814, "epoch": 1610} {"train_loss": -42.26224899291992, "global_step": 194815, "epoch": 1610} {"train_loss": -40.85418701171875, "global_step": 194816, "epoch": 1610} {"train_loss": -40.34532928466797, "global_step": 194817, "epoch": 1610} {"train_loss": -38.32045364379883, "global_step": 194818, "epoch": 1610} {"train_loss": -38.85304641723633, "global_step": 194819, "epoch": 1610} {"train_loss": -37.21084213256836, "global_step": 194820, "epoch": 1610} {"train_loss": -41.57827377319336, "global_step": 194821, "epoch": 1610} {"train_loss": -39.856605529785156, "global_step": 194822, "epoch": 1610} {"train_loss": -37.4215087890625, "global_step": 194823, "epoch": 1610} {"train_loss": -41.096248626708984, "global_step": 194824, "epoch": 1610} {"train_loss": -39.52971267700195, "global_step": 194825, "epoch": 1610} {"train_loss": -36.33284378051758, "global_step": 194826, "epoch": 1610} {"train_loss": -41.0433235168457, "global_step": 194827, "epoch": 1610} {"train_loss": -39.31889343261719, "global_step": 194828, "epoch": 1610} {"train_loss": -40.19717025756836, "global_step": 194829, "epoch": 1610} {"train_loss": -38.157081604003906, "global_step": 194830, "epoch": 1610} {"train_loss": -41.61639404296875, "global_step": 194831, "epoch": 1610} {"train_loss": -39.61745071411133, "global_step": 194832, "epoch": 1610} {"train_loss": -37.296051025390625, "global_step": 194833, "epoch": 1610} {"train_loss": -41.35205078125, "global_step": 194834, "epoch": 1610} {"train_loss": -37.23598098754883, "global_step": 194835, "epoch": 1610} {"train_loss": -41.628787994384766, "global_step": 194836, "epoch": 1610} {"train_loss": -38.99761199951172, "global_step": 194837, "epoch": 1610} {"train_loss": -41.034141540527344, "global_step": 194838, "epoch": 1610} {"train_loss": -40.65249252319336, "global_step": 194839, "epoch": 1610} {"train_loss": -39.89786911010742, "global_step": 194840, "epoch": 1610} {"train_loss": -41.73332595825195, "global_step": 194841, "epoch": 1610} {"train_loss": -38.400169372558594, "global_step": 194842, "epoch": 1610} {"train_loss": -40.3018684387207, "global_step": 194843, "epoch": 1610} {"train_loss": -39.725765228271484, "global_step": 194844, "epoch": 1610} {"train_loss": -41.32332992553711, "global_step": 194845, "epoch": 1610} {"train_loss": -41.43253707885742, "global_step": 194846, "epoch": 1610} {"train_loss": -41.45784378051758, "global_step": 194847, "epoch": 1610} {"train_loss": -40.818241119384766, "global_step": 194848, "epoch": 1610} {"train_loss": -40.446834564208984, "global_step": 194849, "epoch": 1610} {"train_loss": -40.938106536865234, "global_step": 194850, "epoch": 1610} {"train_loss": -41.07642364501953, "global_step": 194851, "epoch": 1610} {"train_loss": -41.543914794921875, "global_step": 194852, "epoch": 1610} {"train_loss": -40.826351165771484, "global_step": 194853, "epoch": 1610} {"train_loss": -41.689144134521484, "global_step": 194854, "epoch": 1610} {"train_loss": -40.98335266113281, "global_step": 194855, "epoch": 1610} {"train_loss": -41.7907600402832, "global_step": 194856, "epoch": 1610} {"train_loss": -40.39076232910156, "global_step": 194857, "epoch": 1610} {"train_loss": -41.65841293334961, "global_step": 194858, "epoch": 1610} {"train_loss": -40.19538497924805, "global_step": 194859, "epoch": 1610} {"train_loss": -41.44599151611328, "global_step": 194860, "epoch": 1610} {"train_loss": -41.1626091003418, "global_step": 194861, "epoch": 1610} {"train_loss": -42.1381950378418, "global_step": 194862, "epoch": 1610} {"train_loss": -41.07271957397461, "global_step": 194863, "epoch": 1610} {"train_loss": -41.51945877075195, "global_step": 194864, "epoch": 1610} {"train_loss": -42.09566116333008, "global_step": 194865, "epoch": 1610} {"train_loss": -40.81658935546875, "global_step": 194866, "epoch": 1610} {"train_loss": -42.04343795776367, "global_step": 194867, "epoch": 1610} {"train_loss": -41.330936431884766, "global_step": 194868, "epoch": 1610} {"train_loss": -41.96084976196289, "global_step": 194869, "epoch": 1610} {"train_loss": -41.8054313659668, "global_step": 194870, "epoch": 1610} {"train_loss": -41.35942459106445, "global_step": 194871, "epoch": 1610} {"train_loss": -42.293251037597656, "global_step": 194872, "epoch": 1610} {"train_loss": -41.36094284057617, "global_step": 194873, "epoch": 1610} {"train_loss": -42.618377685546875, "global_step": 194874, "epoch": 1610} {"train_loss": -41.425201416015625, "global_step": 194875, "epoch": 1610} {"train_loss": -42.40220260620117, "global_step": 194876, "epoch": 1610} {"train_loss": -42.06520462036133, "global_step": 194877, "epoch": 1610} {"train_loss": -42.72105026245117, "global_step": 194878, "epoch": 1610} {"train_loss": -42.5064697265625, "global_step": 194879, "epoch": 1610} {"train_loss": -41.74307632446289, "global_step": 194880, "epoch": 1610} {"train_loss": -42.66831588745117, "global_step": 194881, "epoch": 1610} {"train_loss": -41.946475982666016, "global_step": 194882, "epoch": 1610} {"train_loss": -42.63457107543945, "global_step": 194883, "epoch": 1610} {"train_loss": -42.722442626953125, "global_step": 194884, "epoch": 1610} {"train_loss": -42.776851654052734, "global_step": 194885, "epoch": 1610} {"train_loss": -42.0523796081543, "global_step": 194886, "epoch": 1610} {"train_loss": -43.111568450927734, "global_step": 194887, "epoch": 1610} {"train_loss": -42.54761505126953, "global_step": 194888, "epoch": 1610} {"train_loss": -42.74493408203125, "global_step": 194889, "epoch": 1610} {"train_loss": -42.861663818359375, "global_step": 194890, "epoch": 1610} {"train_loss": -42.894344329833984, "global_step": 194891, "epoch": 1610} {"train_loss": -42.9179801940918, "global_step": 194892, "epoch": 1610} {"train_loss": -42.18010330200195, "global_step": 194893, "epoch": 1610} {"train_loss": -43.03385543823242, "global_step": 194894, "epoch": 1610} {"train_loss": -42.944332122802734, "global_step": 194895, "epoch": 1610} {"train_loss": -42.580684661865234, "global_step": 194896, "epoch": 1610} {"train_loss": -41.86696243286133, "global_step": 194897, "epoch": 1610} {"train_loss": -41.783748626708984, "global_step": 194898, "epoch": 1610} {"train_loss": -40.2274169921875, "global_step": 194899, "epoch": 1610} {"train_loss": -38.81454086303711, "global_step": 194900, "epoch": 1610} {"train_loss": -41.077606201171875, "global_step": 194901, "epoch": 1610} {"train_loss": -43.10459518432617, "global_step": 194902, "epoch": 1610} {"train_loss": -41.73267364501953, "global_step": 194903, "epoch": 1610} {"train_loss": -42.26835632324219, "global_step": 194904, "epoch": 1610} {"train_loss": -42.350154876708984, "global_step": 194905, "epoch": 1610} {"train_loss": -42.55904769897461, "global_step": 194906, "epoch": 1610} {"train_loss": -42.28407287597656, "global_step": 194907, "epoch": 1610} {"train_loss": -43.096309661865234, "global_step": 194908, "epoch": 1610} {"train_loss": -42.48886489868164, "global_step": 194909, "epoch": 1610} {"train_loss": -41.795814514160156, "global_step": 194910, "epoch": 1610} {"train_loss": -42.31440353393555, "global_step": 194911, "epoch": 1610} {"train_loss": -42.95137405395508, "global_step": 194912, "epoch": 1610} {"train_loss": -42.39983367919922, "global_step": 194913, "epoch": 1610} {"train_loss": -42.24878692626953, "global_step": 194914, "epoch": 1610} {"train_loss": -43.08606719970703, "global_step": 194915, "epoch": 1610} {"train_loss": -41.886863708496094, "global_step": 194916, "epoch": 1610} {"train_loss": -41.037269592285156, "global_step": 194917, "epoch": 1610} {"train_loss": -41.806983947753906, "global_step": 194918, "epoch": 1610} {"train_loss": -41.369388580322266, "global_step": 194919, "epoch": 1610} {"train_loss": -38.795528411865234, "global_step": 194920, "epoch": 1610} {"train_loss": -41.85439682006836, "global_step": 194921, "epoch": 1610} {"train_loss": -42.78121566772461, "global_step": 194922, "epoch": 1610} {"train_loss": -42.222042083740234, "global_step": 194923, "epoch": 1610} {"train_loss": -41.86968994140625, "global_step": 194924, "epoch": 1610} {"train_loss": -41.585689544677734, "global_step": 194925, "epoch": 1610} {"train_loss": -41.728511810302734, "global_step": 194926, "epoch": 1610} {"train_loss": -41.78720474243164, "global_step": 194927, "epoch": 1610} {"train_loss": -42.28506088256836, "global_step": 194928, "epoch": 1610} {"train_loss": -41.59901809692383, "global_step": 194929, "epoch": 1610} {"train_loss": -41.36925002169018, "global_step": 194930, "epoch": 1610, "val_loss": 2533746.75} {"train_loss": -42.55841064453125, "global_step": 194931, "epoch": 1611} {"train_loss": -42.58049392700195, "global_step": 194932, "epoch": 1611} {"train_loss": -41.9713134765625, "global_step": 194933, "epoch": 1611} {"train_loss": -42.34163284301758, "global_step": 194934, "epoch": 1611} {"train_loss": -42.150489807128906, "global_step": 194935, "epoch": 1611} {"train_loss": -42.393924713134766, "global_step": 194936, "epoch": 1611} {"train_loss": -43.11981201171875, "global_step": 194937, "epoch": 1611} {"train_loss": -42.08543395996094, "global_step": 194938, "epoch": 1611} {"train_loss": -42.18450927734375, "global_step": 194939, "epoch": 1611} {"train_loss": -42.60593795776367, "global_step": 194940, "epoch": 1611} {"train_loss": -41.76945877075195, "global_step": 194941, "epoch": 1611} {"train_loss": -42.28307342529297, "global_step": 194942, "epoch": 1611} {"train_loss": -42.29472732543945, "global_step": 194943, "epoch": 1611} {"train_loss": -42.77800369262695, "global_step": 194944, "epoch": 1611} {"train_loss": -42.31608963012695, "global_step": 194945, "epoch": 1611} {"train_loss": -41.57188034057617, "global_step": 194946, "epoch": 1611} {"train_loss": -42.605445861816406, "global_step": 194947, "epoch": 1611} {"train_loss": -42.977359771728516, "global_step": 194948, "epoch": 1611} {"train_loss": -41.321632385253906, "global_step": 194949, "epoch": 1611} {"train_loss": -41.7469596862793, "global_step": 194950, "epoch": 1611} {"train_loss": -42.90834426879883, "global_step": 194951, "epoch": 1611} {"train_loss": -42.30706787109375, "global_step": 194952, "epoch": 1611} {"train_loss": -42.11708450317383, "global_step": 194953, "epoch": 1611} {"train_loss": -42.114559173583984, "global_step": 194954, "epoch": 1611} {"train_loss": -42.87422561645508, "global_step": 194955, "epoch": 1611} {"train_loss": -41.354156494140625, "global_step": 194956, "epoch": 1611} {"train_loss": -38.22639083862305, "global_step": 194957, "epoch": 1611} {"train_loss": -39.6056022644043, "global_step": 194958, "epoch": 1611} {"train_loss": -40.11341857910156, "global_step": 194959, "epoch": 1611} {"train_loss": -42.25944137573242, "global_step": 194960, "epoch": 1611} {"train_loss": -41.03090286254883, "global_step": 194961, "epoch": 1611} {"train_loss": -37.9517822265625, "global_step": 194962, "epoch": 1611} {"train_loss": -39.75564193725586, "global_step": 194963, "epoch": 1611} {"train_loss": -42.856239318847656, "global_step": 194964, "epoch": 1611} {"train_loss": -41.1466178894043, "global_step": 194965, "epoch": 1611} {"train_loss": -41.54183578491211, "global_step": 194966, "epoch": 1611} {"train_loss": -42.94047927856445, "global_step": 194967, "epoch": 1611} {"train_loss": -42.2952995300293, "global_step": 194968, "epoch": 1611} {"train_loss": -41.327152252197266, "global_step": 194969, "epoch": 1611} {"train_loss": -42.30849075317383, "global_step": 194970, "epoch": 1611} {"train_loss": -42.18192672729492, "global_step": 194971, "epoch": 1611} {"train_loss": -42.17319869995117, "global_step": 194972, "epoch": 1611} {"train_loss": -42.56532669067383, "global_step": 194973, "epoch": 1611} {"train_loss": -41.67947769165039, "global_step": 194974, "epoch": 1611} {"train_loss": -40.78824234008789, "global_step": 194975, "epoch": 1611} {"train_loss": -40.85676956176758, "global_step": 194976, "epoch": 1611} {"train_loss": -42.376338958740234, "global_step": 194977, "epoch": 1611} {"train_loss": -40.806304931640625, "global_step": 194978, "epoch": 1611} {"train_loss": -41.27152633666992, "global_step": 194979, "epoch": 1611} {"train_loss": -42.0562858581543, "global_step": 194980, "epoch": 1611} {"train_loss": -41.025177001953125, "global_step": 194981, "epoch": 1611} {"train_loss": -41.712860107421875, "global_step": 194982, "epoch": 1611} {"train_loss": -40.4222526550293, "global_step": 194983, "epoch": 1611} {"train_loss": -42.44552230834961, "global_step": 194984, "epoch": 1611} {"train_loss": -41.13981246948242, "global_step": 194985, "epoch": 1611} {"train_loss": -40.17405319213867, "global_step": 194986, "epoch": 1611} {"train_loss": -42.96611404418945, "global_step": 194987, "epoch": 1611} {"train_loss": -40.72441482543945, "global_step": 194988, "epoch": 1611} {"train_loss": -41.1201286315918, "global_step": 194989, "epoch": 1611} {"train_loss": -42.00920486450195, "global_step": 194990, "epoch": 1611} {"train_loss": -39.37540817260742, "global_step": 194991, "epoch": 1611} {"train_loss": -41.190765380859375, "global_step": 194992, "epoch": 1611} {"train_loss": -42.26765060424805, "global_step": 194993, "epoch": 1611} {"train_loss": -40.84933090209961, "global_step": 194994, "epoch": 1611} {"train_loss": -42.60161209106445, "global_step": 194995, "epoch": 1611} {"train_loss": -42.49041748046875, "global_step": 194996, "epoch": 1611} {"train_loss": -42.24658966064453, "global_step": 194997, "epoch": 1611} {"train_loss": -42.75358200073242, "global_step": 194998, "epoch": 1611} {"train_loss": -42.25971221923828, "global_step": 194999, "epoch": 1611} {"train_loss": -42.39932632446289, "global_step": 195000, "epoch": 1611} {"train_loss": -42.52338790893555, "global_step": 195001, "epoch": 1611} {"train_loss": -42.301143646240234, "global_step": 195002, "epoch": 1611} {"train_loss": -42.30790328979492, "global_step": 195003, "epoch": 1611} {"train_loss": -42.00440216064453, "global_step": 195004, "epoch": 1611} {"train_loss": -42.608253479003906, "global_step": 195005, "epoch": 1611} {"train_loss": -42.18935775756836, "global_step": 195006, "epoch": 1611} {"train_loss": -42.64138412475586, "global_step": 195007, "epoch": 1611} {"train_loss": -43.141483306884766, "global_step": 195008, "epoch": 1611} {"train_loss": -42.52094650268555, "global_step": 195009, "epoch": 1611} {"train_loss": -43.14590072631836, "global_step": 195010, "epoch": 1611} {"train_loss": -41.67641067504883, "global_step": 195011, "epoch": 1611} {"train_loss": -42.535099029541016, "global_step": 195012, "epoch": 1611} {"train_loss": -42.51002502441406, "global_step": 195013, "epoch": 1611} {"train_loss": -42.296302795410156, "global_step": 195014, "epoch": 1611} {"train_loss": -42.47512435913086, "global_step": 195015, "epoch": 1611} {"train_loss": -42.52474594116211, "global_step": 195016, "epoch": 1611} {"train_loss": -42.2802619934082, "global_step": 195017, "epoch": 1611} {"train_loss": -42.674072265625, "global_step": 195018, "epoch": 1611} {"train_loss": -42.910606384277344, "global_step": 195019, "epoch": 1611} {"train_loss": -42.996253967285156, "global_step": 195020, "epoch": 1611} {"train_loss": -43.07941818237305, "global_step": 195021, "epoch": 1611} {"train_loss": -42.8680534362793, "global_step": 195022, "epoch": 1611} {"train_loss": -43.04579162597656, "global_step": 195023, "epoch": 1611} {"train_loss": -42.864681243896484, "global_step": 195024, "epoch": 1611} {"train_loss": -43.22273635864258, "global_step": 195025, "epoch": 1611} {"train_loss": -43.29865646362305, "global_step": 195026, "epoch": 1611} {"train_loss": -43.15647506713867, "global_step": 195027, "epoch": 1611} {"train_loss": -43.311458587646484, "global_step": 195028, "epoch": 1611} {"train_loss": -43.18345260620117, "global_step": 195029, "epoch": 1611} {"train_loss": -42.4106559753418, "global_step": 195030, "epoch": 1611} {"train_loss": -43.11307907104492, "global_step": 195031, "epoch": 1611} {"train_loss": -43.0982780456543, "global_step": 195032, "epoch": 1611} {"train_loss": -42.386924743652344, "global_step": 195033, "epoch": 1611} {"train_loss": -43.18679428100586, "global_step": 195034, "epoch": 1611} {"train_loss": -43.21193313598633, "global_step": 195035, "epoch": 1611} {"train_loss": -41.7970085144043, "global_step": 195036, "epoch": 1611} {"train_loss": -42.170387268066406, "global_step": 195037, "epoch": 1611} {"train_loss": -43.096832275390625, "global_step": 195038, "epoch": 1611} {"train_loss": -41.460479736328125, "global_step": 195039, "epoch": 1611} {"train_loss": -42.230594635009766, "global_step": 195040, "epoch": 1611} {"train_loss": -42.61171340942383, "global_step": 195041, "epoch": 1611} {"train_loss": -42.041114807128906, "global_step": 195042, "epoch": 1611} {"train_loss": -42.07857894897461, "global_step": 195043, "epoch": 1611} {"train_loss": -41.756107330322266, "global_step": 195044, "epoch": 1611} {"train_loss": -41.7901725769043, "global_step": 195045, "epoch": 1611} {"train_loss": -42.2165412902832, "global_step": 195046, "epoch": 1611} {"train_loss": -42.521697998046875, "global_step": 195047, "epoch": 1611} {"train_loss": -41.349517822265625, "global_step": 195048, "epoch": 1611} {"train_loss": -41.57826232910156, "global_step": 195049, "epoch": 1611} {"train_loss": -41.93622970581055, "global_step": 195050, "epoch": 1611} {"train_loss": -42.06261822408881, "global_step": 195051, "epoch": 1611, "val_loss": 2499961.75} {"train_loss": -41.65168380737305, "global_step": 195052, "epoch": 1612} {"train_loss": -42.04817581176758, "global_step": 195053, "epoch": 1612} {"train_loss": -42.49967956542969, "global_step": 195054, "epoch": 1612} {"train_loss": -41.28292465209961, "global_step": 195055, "epoch": 1612} {"train_loss": -41.3729362487793, "global_step": 195056, "epoch": 1612} {"train_loss": -42.28742218017578, "global_step": 195057, "epoch": 1612} {"train_loss": -42.39777374267578, "global_step": 195058, "epoch": 1612} {"train_loss": -42.041744232177734, "global_step": 195059, "epoch": 1612} {"train_loss": -42.14042282104492, "global_step": 195060, "epoch": 1612} {"train_loss": -42.619346618652344, "global_step": 195061, "epoch": 1612} {"train_loss": -42.11306381225586, "global_step": 195062, "epoch": 1612} {"train_loss": -41.3931884765625, "global_step": 195063, "epoch": 1612} {"train_loss": -41.641273498535156, "global_step": 195064, "epoch": 1612} {"train_loss": -41.473854064941406, "global_step": 195065, "epoch": 1612} {"train_loss": -42.8797721862793, "global_step": 195066, "epoch": 1612} {"train_loss": -41.83950424194336, "global_step": 195067, "epoch": 1612} {"train_loss": -41.61594772338867, "global_step": 195068, "epoch": 1612} {"train_loss": -42.141971588134766, "global_step": 195069, "epoch": 1612} {"train_loss": -42.5642204284668, "global_step": 195070, "epoch": 1612} {"train_loss": -42.03554153442383, "global_step": 195071, "epoch": 1612} {"train_loss": -42.28815460205078, "global_step": 195072, "epoch": 1612} {"train_loss": -41.13218307495117, "global_step": 195073, "epoch": 1612} {"train_loss": -41.95888900756836, "global_step": 195074, "epoch": 1612} {"train_loss": -42.59072494506836, "global_step": 195075, "epoch": 1612} {"train_loss": -42.84017562866211, "global_step": 195076, "epoch": 1612} {"train_loss": -42.127098083496094, "global_step": 195077, "epoch": 1612} {"train_loss": -41.965267181396484, "global_step": 195078, "epoch": 1612} {"train_loss": -42.831085205078125, "global_step": 195079, "epoch": 1612} {"train_loss": -42.3216667175293, "global_step": 195080, "epoch": 1612} {"train_loss": -42.54403305053711, "global_step": 195081, "epoch": 1612} {"train_loss": -41.31725311279297, "global_step": 195082, "epoch": 1612} {"train_loss": -41.85657501220703, "global_step": 195083, "epoch": 1612} {"train_loss": -42.4528923034668, "global_step": 195084, "epoch": 1612} {"train_loss": -42.1839599609375, "global_step": 195085, "epoch": 1612} {"train_loss": -39.44459915161133, "global_step": 195086, "epoch": 1612} {"train_loss": -41.580379486083984, "global_step": 195087, "epoch": 1612} {"train_loss": -42.31163024902344, "global_step": 195088, "epoch": 1612} {"train_loss": -41.393497467041016, "global_step": 195089, "epoch": 1612} {"train_loss": -40.73093032836914, "global_step": 195090, "epoch": 1612} {"train_loss": -40.39179611206055, "global_step": 195091, "epoch": 1612} {"train_loss": -41.91678237915039, "global_step": 195092, "epoch": 1612} {"train_loss": -41.72249221801758, "global_step": 195093, "epoch": 1612} {"train_loss": -41.31220245361328, "global_step": 195094, "epoch": 1612} {"train_loss": -40.6663932800293, "global_step": 195095, "epoch": 1612} {"train_loss": -41.25358200073242, "global_step": 195096, "epoch": 1612} {"train_loss": -42.140411376953125, "global_step": 195097, "epoch": 1612} {"train_loss": -42.4117431640625, "global_step": 195098, "epoch": 1612} {"train_loss": -41.56490707397461, "global_step": 195099, "epoch": 1612} {"train_loss": -41.8055534362793, "global_step": 195100, "epoch": 1612} {"train_loss": -41.95912170410156, "global_step": 195101, "epoch": 1612} {"train_loss": -40.54899597167969, "global_step": 195102, "epoch": 1612} {"train_loss": -40.91464614868164, "global_step": 195103, "epoch": 1612} {"train_loss": -42.2766227722168, "global_step": 195104, "epoch": 1612} {"train_loss": -40.2159423828125, "global_step": 195105, "epoch": 1612} {"train_loss": -42.21859359741211, "global_step": 195106, "epoch": 1612} {"train_loss": -41.23299026489258, "global_step": 195107, "epoch": 1612} {"train_loss": -40.84731674194336, "global_step": 195108, "epoch": 1612} {"train_loss": -41.55683135986328, "global_step": 195109, "epoch": 1612} {"train_loss": -40.9311408996582, "global_step": 195110, "epoch": 1612} {"train_loss": -41.144752502441406, "global_step": 195111, "epoch": 1612} {"train_loss": -33.54918670654297, "global_step": 195112, "epoch": 1612} {"train_loss": -40.067989349365234, "global_step": 195113, "epoch": 1612} {"train_loss": -38.8597297668457, "global_step": 195114, "epoch": 1612} {"train_loss": -40.30501174926758, "global_step": 195115, "epoch": 1612} {"train_loss": -39.58086013793945, "global_step": 195116, "epoch": 1612} {"train_loss": -38.637691497802734, "global_step": 195117, "epoch": 1612} {"train_loss": -40.67658615112305, "global_step": 195118, "epoch": 1612} {"train_loss": -41.56016159057617, "global_step": 195119, "epoch": 1612} {"train_loss": -38.62982940673828, "global_step": 195120, "epoch": 1612} {"train_loss": -39.94490051269531, "global_step": 195121, "epoch": 1612} {"train_loss": -37.92020797729492, "global_step": 195122, "epoch": 1612} {"train_loss": -40.822898864746094, "global_step": 195123, "epoch": 1612} {"train_loss": -39.35600662231445, "global_step": 195124, "epoch": 1612} {"train_loss": -40.38222122192383, "global_step": 195125, "epoch": 1612} {"train_loss": -39.96979904174805, "global_step": 195126, "epoch": 1612} {"train_loss": -40.16512680053711, "global_step": 195127, "epoch": 1612} {"train_loss": -40.55537033081055, "global_step": 195128, "epoch": 1612} {"train_loss": -40.468868255615234, "global_step": 195129, "epoch": 1612} {"train_loss": -39.824951171875, "global_step": 195130, "epoch": 1612} {"train_loss": -36.283233642578125, "global_step": 195131, "epoch": 1612} {"train_loss": -40.613346099853516, "global_step": 195132, "epoch": 1612} {"train_loss": -40.80586624145508, "global_step": 195133, "epoch": 1612} {"train_loss": -32.503204345703125, "global_step": 195134, "epoch": 1612} {"train_loss": -39.39698028564453, "global_step": 195135, "epoch": 1612} {"train_loss": -38.56181716918945, "global_step": 195136, "epoch": 1612} {"train_loss": -41.17856979370117, "global_step": 195137, "epoch": 1612} {"train_loss": -39.586021423339844, "global_step": 195138, "epoch": 1612} {"train_loss": -40.30073165893555, "global_step": 195139, "epoch": 1612} {"train_loss": -39.72909927368164, "global_step": 195140, "epoch": 1612} {"train_loss": -40.72278594970703, "global_step": 195141, "epoch": 1612} {"train_loss": -39.952247619628906, "global_step": 195142, "epoch": 1612} {"train_loss": -41.11086654663086, "global_step": 195143, "epoch": 1612} {"train_loss": -40.18990707397461, "global_step": 195144, "epoch": 1612} {"train_loss": -40.25373077392578, "global_step": 195145, "epoch": 1612} {"train_loss": -37.613929748535156, "global_step": 195146, "epoch": 1612} {"train_loss": -40.597225189208984, "global_step": 195147, "epoch": 1612} {"train_loss": -40.479427337646484, "global_step": 195148, "epoch": 1612} {"train_loss": -40.613807678222656, "global_step": 195149, "epoch": 1612} {"train_loss": -41.304908752441406, "global_step": 195150, "epoch": 1612} {"train_loss": -41.59957504272461, "global_step": 195151, "epoch": 1612} {"train_loss": -40.828826904296875, "global_step": 195152, "epoch": 1612} {"train_loss": -41.839359283447266, "global_step": 195153, "epoch": 1612} {"train_loss": -41.81093978881836, "global_step": 195154, "epoch": 1612} {"train_loss": -41.33400344848633, "global_step": 195155, "epoch": 1612} {"train_loss": -41.43659591674805, "global_step": 195156, "epoch": 1612} {"train_loss": -41.64643478393555, "global_step": 195157, "epoch": 1612} {"train_loss": -41.90828323364258, "global_step": 195158, "epoch": 1612} {"train_loss": -42.086334228515625, "global_step": 195159, "epoch": 1612} {"train_loss": -41.76548385620117, "global_step": 195160, "epoch": 1612} {"train_loss": -40.90808868408203, "global_step": 195161, "epoch": 1612} {"train_loss": -41.9818229675293, "global_step": 195162, "epoch": 1612} {"train_loss": -42.23487854003906, "global_step": 195163, "epoch": 1612} {"train_loss": -42.25899124145508, "global_step": 195164, "epoch": 1612} {"train_loss": -42.00556564331055, "global_step": 195165, "epoch": 1612} {"train_loss": -41.21864318847656, "global_step": 195166, "epoch": 1612} {"train_loss": -42.11894607543945, "global_step": 195167, "epoch": 1612} {"train_loss": -42.51827621459961, "global_step": 195168, "epoch": 1612} {"train_loss": -42.54483413696289, "global_step": 195169, "epoch": 1612} {"train_loss": -42.45515060424805, "global_step": 195170, "epoch": 1612} {"train_loss": -42.280006408691406, "global_step": 195171, "epoch": 1612} {"train_loss": -41.06607657818755, "global_step": 195172, "epoch": 1612, "val_loss": 2475298.75} {"train_loss": -42.596763610839844, "global_step": 195173, "epoch": 1613} {"train_loss": -42.62484359741211, "global_step": 195174, "epoch": 1613} {"train_loss": -42.83076858520508, "global_step": 195175, "epoch": 1613} {"train_loss": -42.366127014160156, "global_step": 195176, "epoch": 1613} {"train_loss": -42.84785461425781, "global_step": 195177, "epoch": 1613} {"train_loss": -42.369232177734375, "global_step": 195178, "epoch": 1613} {"train_loss": -42.08830642700195, "global_step": 195179, "epoch": 1613} {"train_loss": -41.919593811035156, "global_step": 195180, "epoch": 1613} {"train_loss": -42.804443359375, "global_step": 195181, "epoch": 1613} {"train_loss": -42.70972442626953, "global_step": 195182, "epoch": 1613} {"train_loss": -42.76813888549805, "global_step": 195183, "epoch": 1613} {"train_loss": -42.113460540771484, "global_step": 195184, "epoch": 1613} {"train_loss": -43.01658248901367, "global_step": 195185, "epoch": 1613} {"train_loss": -42.881465911865234, "global_step": 195186, "epoch": 1613} {"train_loss": -42.98382568359375, "global_step": 195187, "epoch": 1613} {"train_loss": -42.94355392456055, "global_step": 195188, "epoch": 1613} {"train_loss": -42.6092529296875, "global_step": 195189, "epoch": 1613} {"train_loss": -42.93900680541992, "global_step": 195190, "epoch": 1613} {"train_loss": -42.68478012084961, "global_step": 195191, "epoch": 1613} {"train_loss": -43.02476119995117, "global_step": 195192, "epoch": 1613} {"train_loss": -42.82534408569336, "global_step": 195193, "epoch": 1613} {"train_loss": -43.047340393066406, "global_step": 195194, "epoch": 1613} {"train_loss": -42.86652755737305, "global_step": 195195, "epoch": 1613} {"train_loss": -43.28004837036133, "global_step": 195196, "epoch": 1613} {"train_loss": -42.198768615722656, "global_step": 195197, "epoch": 1613} {"train_loss": -42.57279586791992, "global_step": 195198, "epoch": 1613} {"train_loss": -42.207637786865234, "global_step": 195199, "epoch": 1613} {"train_loss": -40.42513656616211, "global_step": 195200, "epoch": 1613} {"train_loss": -37.34961700439453, "global_step": 195201, "epoch": 1613} {"train_loss": -42.47444534301758, "global_step": 195202, "epoch": 1613} {"train_loss": -41.399532318115234, "global_step": 195203, "epoch": 1613} {"train_loss": -39.377098083496094, "global_step": 195204, "epoch": 1613} {"train_loss": -41.344993591308594, "global_step": 195205, "epoch": 1613} {"train_loss": -41.0427131652832, "global_step": 195206, "epoch": 1613} {"train_loss": -40.296810150146484, "global_step": 195207, "epoch": 1613} {"train_loss": -41.364688873291016, "global_step": 195208, "epoch": 1613} {"train_loss": -37.84119415283203, "global_step": 195209, "epoch": 1613} {"train_loss": -42.49420928955078, "global_step": 195210, "epoch": 1613} {"train_loss": -40.39282989501953, "global_step": 195211, "epoch": 1613} {"train_loss": -39.77274703979492, "global_step": 195212, "epoch": 1613} {"train_loss": -41.981292724609375, "global_step": 195213, "epoch": 1613} {"train_loss": -38.22114944458008, "global_step": 195214, "epoch": 1613} {"train_loss": -42.368019104003906, "global_step": 195215, "epoch": 1613} {"train_loss": -38.41130447387695, "global_step": 195216, "epoch": 1613} {"train_loss": -41.52244186401367, "global_step": 195217, "epoch": 1613} {"train_loss": -39.6027946472168, "global_step": 195218, "epoch": 1613} {"train_loss": -40.33961868286133, "global_step": 195219, "epoch": 1613} {"train_loss": -41.70228958129883, "global_step": 195220, "epoch": 1613} {"train_loss": -39.385372161865234, "global_step": 195221, "epoch": 1613} {"train_loss": -42.04932403564453, "global_step": 195222, "epoch": 1613} {"train_loss": -39.89597702026367, "global_step": 195223, "epoch": 1613} {"train_loss": -41.75150680541992, "global_step": 195224, "epoch": 1613} {"train_loss": -41.4986686706543, "global_step": 195225, "epoch": 1613} {"train_loss": -42.23176193237305, "global_step": 195226, "epoch": 1613} {"train_loss": -42.686195373535156, "global_step": 195227, "epoch": 1613} {"train_loss": -41.44230651855469, "global_step": 195228, "epoch": 1613} {"train_loss": -42.530513763427734, "global_step": 195229, "epoch": 1613} {"train_loss": -42.261512756347656, "global_step": 195230, "epoch": 1613} {"train_loss": -42.32615280151367, "global_step": 195231, "epoch": 1613} {"train_loss": -42.48020553588867, "global_step": 195232, "epoch": 1613} {"train_loss": -42.74831771850586, "global_step": 195233, "epoch": 1613} {"train_loss": -41.841949462890625, "global_step": 195234, "epoch": 1613} {"train_loss": -41.700347900390625, "global_step": 195235, "epoch": 1613} {"train_loss": -42.2803840637207, "global_step": 195236, "epoch": 1613} {"train_loss": -42.32077407836914, "global_step": 195237, "epoch": 1613} {"train_loss": -42.223052978515625, "global_step": 195238, "epoch": 1613} {"train_loss": -42.66291427612305, "global_step": 195239, "epoch": 1613} {"train_loss": -42.47629928588867, "global_step": 195240, "epoch": 1613} {"train_loss": -42.55707550048828, "global_step": 195241, "epoch": 1613} {"train_loss": -42.3167839050293, "global_step": 195242, "epoch": 1613} {"train_loss": -42.15810775756836, "global_step": 195243, "epoch": 1613} {"train_loss": -42.52846908569336, "global_step": 195244, "epoch": 1613} {"train_loss": -42.83280563354492, "global_step": 195245, "epoch": 1613} {"train_loss": -41.91265869140625, "global_step": 195246, "epoch": 1613} {"train_loss": -40.225196838378906, "global_step": 195247, "epoch": 1613} {"train_loss": -42.0084342956543, "global_step": 195248, "epoch": 1613} {"train_loss": -42.256771087646484, "global_step": 195249, "epoch": 1613} {"train_loss": -39.41422653198242, "global_step": 195250, "epoch": 1613} {"train_loss": -41.074825286865234, "global_step": 195251, "epoch": 1613} {"train_loss": -42.19328689575195, "global_step": 195252, "epoch": 1613} {"train_loss": -39.11886978149414, "global_step": 195253, "epoch": 1613} {"train_loss": -41.957210540771484, "global_step": 195254, "epoch": 1613} {"train_loss": -41.03874969482422, "global_step": 195255, "epoch": 1613} {"train_loss": -39.282691955566406, "global_step": 195256, "epoch": 1613} {"train_loss": -41.81281280517578, "global_step": 195257, "epoch": 1613} {"train_loss": -37.04609298706055, "global_step": 195258, "epoch": 1613} {"train_loss": -42.047149658203125, "global_step": 195259, "epoch": 1613} {"train_loss": -38.26860427856445, "global_step": 195260, "epoch": 1613} {"train_loss": -36.54484939575195, "global_step": 195261, "epoch": 1613} {"train_loss": -37.165863037109375, "global_step": 195262, "epoch": 1613} {"train_loss": -39.924156188964844, "global_step": 195263, "epoch": 1613} {"train_loss": -41.2161979675293, "global_step": 195264, "epoch": 1613} {"train_loss": -39.13898468017578, "global_step": 195265, "epoch": 1613} {"train_loss": -41.12897872924805, "global_step": 195266, "epoch": 1613} {"train_loss": -40.05942916870117, "global_step": 195267, "epoch": 1613} {"train_loss": -40.94532012939453, "global_step": 195268, "epoch": 1613} {"train_loss": -41.300994873046875, "global_step": 195269, "epoch": 1613} {"train_loss": -39.58589553833008, "global_step": 195270, "epoch": 1613} {"train_loss": -41.023189544677734, "global_step": 195271, "epoch": 1613} {"train_loss": -39.14711380004883, "global_step": 195272, "epoch": 1613} {"train_loss": -39.82974624633789, "global_step": 195273, "epoch": 1613} {"train_loss": -39.78328323364258, "global_step": 195274, "epoch": 1613} {"train_loss": -42.243377685546875, "global_step": 195275, "epoch": 1613} {"train_loss": -39.60516357421875, "global_step": 195276, "epoch": 1613} {"train_loss": -41.49233627319336, "global_step": 195277, "epoch": 1613} {"train_loss": -40.10631561279297, "global_step": 195278, "epoch": 1613} {"train_loss": -40.25211715698242, "global_step": 195279, "epoch": 1613} {"train_loss": -41.599395751953125, "global_step": 195280, "epoch": 1613} {"train_loss": -40.85476303100586, "global_step": 195281, "epoch": 1613} {"train_loss": -41.682735443115234, "global_step": 195282, "epoch": 1613} {"train_loss": -41.637577056884766, "global_step": 195283, "epoch": 1613} {"train_loss": -41.733665466308594, "global_step": 195284, "epoch": 1613} {"train_loss": -41.2153434753418, "global_step": 195285, "epoch": 1613} {"train_loss": -41.57158279418945, "global_step": 195286, "epoch": 1613} {"train_loss": -41.66105270385742, "global_step": 195287, "epoch": 1613} {"train_loss": -42.14834213256836, "global_step": 195288, "epoch": 1613} {"train_loss": -40.42716598510742, "global_step": 195289, "epoch": 1613} {"train_loss": -39.551361083984375, "global_step": 195290, "epoch": 1613} {"train_loss": -41.948665618896484, "global_step": 195291, "epoch": 1613} {"train_loss": -41.028358459472656, "global_step": 195292, "epoch": 1613} {"train_loss": -41.33705120244302, "global_step": 195293, "epoch": 1613, "val_loss": 2574570.25} {"train_loss": -41.34531784057617, "global_step": 195294, "epoch": 1614} {"train_loss": -42.110496520996094, "global_step": 195295, "epoch": 1614} {"train_loss": -41.9336051940918, "global_step": 195296, "epoch": 1614} {"train_loss": -41.915462493896484, "global_step": 195297, "epoch": 1614} {"train_loss": -42.1684684753418, "global_step": 195298, "epoch": 1614} {"train_loss": -42.26072311401367, "global_step": 195299, "epoch": 1614} {"train_loss": -41.50754928588867, "global_step": 195300, "epoch": 1614} {"train_loss": -42.5217399597168, "global_step": 195301, "epoch": 1614} {"train_loss": -41.32853317260742, "global_step": 195302, "epoch": 1614} {"train_loss": -42.247955322265625, "global_step": 195303, "epoch": 1614} {"train_loss": -41.76454544067383, "global_step": 195304, "epoch": 1614} {"train_loss": -42.25569534301758, "global_step": 195305, "epoch": 1614} {"train_loss": -41.379573822021484, "global_step": 195306, "epoch": 1614} {"train_loss": -42.20429229736328, "global_step": 195307, "epoch": 1614} {"train_loss": -41.762813568115234, "global_step": 195308, "epoch": 1614} {"train_loss": -42.227394104003906, "global_step": 195309, "epoch": 1614} {"train_loss": -41.8984489440918, "global_step": 195310, "epoch": 1614} {"train_loss": -42.346466064453125, "global_step": 195311, "epoch": 1614} {"train_loss": -42.098548889160156, "global_step": 195312, "epoch": 1614} {"train_loss": -42.51692581176758, "global_step": 195313, "epoch": 1614} {"train_loss": -42.754146575927734, "global_step": 195314, "epoch": 1614} {"train_loss": -42.6287727355957, "global_step": 195315, "epoch": 1614} {"train_loss": -43.071590423583984, "global_step": 195316, "epoch": 1614} {"train_loss": -42.35531234741211, "global_step": 195317, "epoch": 1614} {"train_loss": -42.738887786865234, "global_step": 195318, "epoch": 1614} {"train_loss": -41.853919982910156, "global_step": 195319, "epoch": 1614} {"train_loss": -42.686004638671875, "global_step": 195320, "epoch": 1614} {"train_loss": -42.2018928527832, "global_step": 195321, "epoch": 1614} {"train_loss": -41.245750427246094, "global_step": 195322, "epoch": 1614} {"train_loss": -42.58340072631836, "global_step": 195323, "epoch": 1614} {"train_loss": -42.719398498535156, "global_step": 195324, "epoch": 1614} {"train_loss": -42.98722457885742, "global_step": 195325, "epoch": 1614} {"train_loss": -42.292030334472656, "global_step": 195326, "epoch": 1614} {"train_loss": -43.13056564331055, "global_step": 195327, "epoch": 1614} {"train_loss": -42.99469757080078, "global_step": 195328, "epoch": 1614} {"train_loss": -41.76777267456055, "global_step": 195329, "epoch": 1614} {"train_loss": -40.415645599365234, "global_step": 195330, "epoch": 1614} {"train_loss": -41.011566162109375, "global_step": 195331, "epoch": 1614} {"train_loss": -42.11311340332031, "global_step": 195332, "epoch": 1614} {"train_loss": -41.70845413208008, "global_step": 195333, "epoch": 1614} {"train_loss": -38.84436798095703, "global_step": 195334, "epoch": 1614} {"train_loss": -40.54800033569336, "global_step": 195335, "epoch": 1614} {"train_loss": -42.09396743774414, "global_step": 195336, "epoch": 1614} {"train_loss": -40.188594818115234, "global_step": 195337, "epoch": 1614} {"train_loss": -40.642208099365234, "global_step": 195338, "epoch": 1614} {"train_loss": -41.0855827331543, "global_step": 195339, "epoch": 1614} {"train_loss": -41.619850158691406, "global_step": 195340, "epoch": 1614} {"train_loss": -41.24139404296875, "global_step": 195341, "epoch": 1614} {"train_loss": -39.627872467041016, "global_step": 195342, "epoch": 1614} {"train_loss": -42.248382568359375, "global_step": 195343, "epoch": 1614} {"train_loss": -41.36574172973633, "global_step": 195344, "epoch": 1614} {"train_loss": -42.357879638671875, "global_step": 195345, "epoch": 1614} {"train_loss": -41.99928665161133, "global_step": 195346, "epoch": 1614} {"train_loss": -41.81634521484375, "global_step": 195347, "epoch": 1614} {"train_loss": -42.235206604003906, "global_step": 195348, "epoch": 1614} {"train_loss": -41.600990295410156, "global_step": 195349, "epoch": 1614} {"train_loss": -42.3667106628418, "global_step": 195350, "epoch": 1614} {"train_loss": -41.93870162963867, "global_step": 195351, "epoch": 1614} {"train_loss": -42.468544006347656, "global_step": 195352, "epoch": 1614} {"train_loss": -42.36795425415039, "global_step": 195353, "epoch": 1614} {"train_loss": -42.427330017089844, "global_step": 195354, "epoch": 1614} {"train_loss": -41.99874496459961, "global_step": 195355, "epoch": 1614} {"train_loss": -42.394039154052734, "global_step": 195356, "epoch": 1614} {"train_loss": -42.17551040649414, "global_step": 195357, "epoch": 1614} {"train_loss": -42.32090377807617, "global_step": 195358, "epoch": 1614} {"train_loss": -42.7939453125, "global_step": 195359, "epoch": 1614} {"train_loss": -42.01450729370117, "global_step": 195360, "epoch": 1614} {"train_loss": -41.72902297973633, "global_step": 195361, "epoch": 1614} {"train_loss": -42.40291976928711, "global_step": 195362, "epoch": 1614} {"train_loss": -42.476402282714844, "global_step": 195363, "epoch": 1614} {"train_loss": -42.30928421020508, "global_step": 195364, "epoch": 1614} {"train_loss": -41.815982818603516, "global_step": 195365, "epoch": 1614} {"train_loss": -42.054813385009766, "global_step": 195366, "epoch": 1614} {"train_loss": -42.23111343383789, "global_step": 195367, "epoch": 1614} {"train_loss": -42.02973175048828, "global_step": 195368, "epoch": 1614} {"train_loss": -42.28065872192383, "global_step": 195369, "epoch": 1614} {"train_loss": -42.612247467041016, "global_step": 195370, "epoch": 1614} {"train_loss": -41.785011291503906, "global_step": 195371, "epoch": 1614} {"train_loss": -41.94841003417969, "global_step": 195372, "epoch": 1614} {"train_loss": -42.787986755371094, "global_step": 195373, "epoch": 1614} {"train_loss": -42.23545455932617, "global_step": 195374, "epoch": 1614} {"train_loss": -42.74457931518555, "global_step": 195375, "epoch": 1614} {"train_loss": -42.26804733276367, "global_step": 195376, "epoch": 1614} {"train_loss": -42.01801681518555, "global_step": 195377, "epoch": 1614} {"train_loss": -42.59931182861328, "global_step": 195378, "epoch": 1614} {"train_loss": -43.06714630126953, "global_step": 195379, "epoch": 1614} {"train_loss": -43.16925811767578, "global_step": 195380, "epoch": 1614} {"train_loss": -42.8079833984375, "global_step": 195381, "epoch": 1614} {"train_loss": -43.070552825927734, "global_step": 195382, "epoch": 1614} {"train_loss": -42.96934127807617, "global_step": 195383, "epoch": 1614} {"train_loss": -41.794132232666016, "global_step": 195384, "epoch": 1614} {"train_loss": -42.79200744628906, "global_step": 195385, "epoch": 1614} {"train_loss": -43.35929489135742, "global_step": 195386, "epoch": 1614} {"train_loss": -42.54133987426758, "global_step": 195387, "epoch": 1614} {"train_loss": -42.37142562866211, "global_step": 195388, "epoch": 1614} {"train_loss": -42.73986053466797, "global_step": 195389, "epoch": 1614} {"train_loss": -41.876708984375, "global_step": 195390, "epoch": 1614} {"train_loss": -41.493377685546875, "global_step": 195391, "epoch": 1614} {"train_loss": -40.69683837890625, "global_step": 195392, "epoch": 1614} {"train_loss": -39.312931060791016, "global_step": 195393, "epoch": 1614} {"train_loss": -41.52034378051758, "global_step": 195394, "epoch": 1614} {"train_loss": -42.86330032348633, "global_step": 195395, "epoch": 1614} {"train_loss": -42.20340347290039, "global_step": 195396, "epoch": 1614} {"train_loss": -42.36306381225586, "global_step": 195397, "epoch": 1614} {"train_loss": -42.46541976928711, "global_step": 195398, "epoch": 1614} {"train_loss": -42.121891021728516, "global_step": 195399, "epoch": 1614} {"train_loss": -41.01752471923828, "global_step": 195400, "epoch": 1614} {"train_loss": -41.89326477050781, "global_step": 195401, "epoch": 1614} {"train_loss": -42.50063705444336, "global_step": 195402, "epoch": 1614} {"train_loss": -41.56903839111328, "global_step": 195403, "epoch": 1614} {"train_loss": -41.32442092895508, "global_step": 195404, "epoch": 1614} {"train_loss": -41.527042388916016, "global_step": 195405, "epoch": 1614} {"train_loss": -42.69413375854492, "global_step": 195406, "epoch": 1614} {"train_loss": -42.49931716918945, "global_step": 195407, "epoch": 1614} {"train_loss": -41.473392486572266, "global_step": 195408, "epoch": 1614} {"train_loss": -42.412872314453125, "global_step": 195409, "epoch": 1614} {"train_loss": -41.608638763427734, "global_step": 195410, "epoch": 1614} {"train_loss": -42.732421875, "global_step": 195411, "epoch": 1614} {"train_loss": -42.21462631225586, "global_step": 195412, "epoch": 1614} {"train_loss": -42.857295989990234, "global_step": 195413, "epoch": 1614} {"train_loss": -42.058627357167644, "global_step": 195414, "epoch": 1614, "val_loss": 2638153.0} {"train_loss": -42.60655975341797, "global_step": 195415, "epoch": 1615} {"train_loss": -42.6588134765625, "global_step": 195416, "epoch": 1615} {"train_loss": -42.01024627685547, "global_step": 195417, "epoch": 1615} {"train_loss": -43.26198959350586, "global_step": 195418, "epoch": 1615} {"train_loss": -42.21369934082031, "global_step": 195419, "epoch": 1615} {"train_loss": -42.431365966796875, "global_step": 195420, "epoch": 1615} {"train_loss": -42.09845733642578, "global_step": 195421, "epoch": 1615} {"train_loss": -41.61855697631836, "global_step": 195422, "epoch": 1615} {"train_loss": -42.899410247802734, "global_step": 195423, "epoch": 1615} {"train_loss": -41.282752990722656, "global_step": 195424, "epoch": 1615} {"train_loss": -42.70301818847656, "global_step": 195425, "epoch": 1615} {"train_loss": -41.5953254699707, "global_step": 195426, "epoch": 1615} {"train_loss": -42.0715217590332, "global_step": 195427, "epoch": 1615} {"train_loss": -42.25339889526367, "global_step": 195428, "epoch": 1615} {"train_loss": -42.40376663208008, "global_step": 195429, "epoch": 1615} {"train_loss": -42.20902633666992, "global_step": 195430, "epoch": 1615} {"train_loss": -43.08694076538086, "global_step": 195431, "epoch": 1615} {"train_loss": -42.201717376708984, "global_step": 195432, "epoch": 1615} {"train_loss": -40.34160614013672, "global_step": 195433, "epoch": 1615} {"train_loss": -40.05270004272461, "global_step": 195434, "epoch": 1615} {"train_loss": -42.08991622924805, "global_step": 195435, "epoch": 1615} {"train_loss": -41.725765228271484, "global_step": 195436, "epoch": 1615} {"train_loss": -40.65503692626953, "global_step": 195437, "epoch": 1615} {"train_loss": -38.35860061645508, "global_step": 195438, "epoch": 1615} {"train_loss": -42.32505416870117, "global_step": 195439, "epoch": 1615} {"train_loss": -36.7597770690918, "global_step": 195440, "epoch": 1615} {"train_loss": -42.21805191040039, "global_step": 195441, "epoch": 1615} {"train_loss": -38.2719612121582, "global_step": 195442, "epoch": 1615} {"train_loss": -37.706085205078125, "global_step": 195443, "epoch": 1615} {"train_loss": -40.519954681396484, "global_step": 195444, "epoch": 1615} {"train_loss": -34.88351058959961, "global_step": 195445, "epoch": 1615} {"train_loss": -40.2989501953125, "global_step": 195446, "epoch": 1615} {"train_loss": -37.589195251464844, "global_step": 195447, "epoch": 1615} {"train_loss": -39.70670700073242, "global_step": 195448, "epoch": 1615} {"train_loss": -40.54658126831055, "global_step": 195449, "epoch": 1615} {"train_loss": -40.1331672668457, "global_step": 195450, "epoch": 1615} {"train_loss": -39.341270446777344, "global_step": 195451, "epoch": 1615} {"train_loss": -40.504695892333984, "global_step": 195452, "epoch": 1615} {"train_loss": -41.8607292175293, "global_step": 195453, "epoch": 1615} {"train_loss": -39.20146179199219, "global_step": 195454, "epoch": 1615} {"train_loss": -38.11442184448242, "global_step": 195455, "epoch": 1615} {"train_loss": -39.52260971069336, "global_step": 195456, "epoch": 1615} {"train_loss": -38.58633041381836, "global_step": 195457, "epoch": 1615} {"train_loss": -38.945919036865234, "global_step": 195458, "epoch": 1615} {"train_loss": -41.29082107543945, "global_step": 195459, "epoch": 1615} {"train_loss": -40.74129867553711, "global_step": 195460, "epoch": 1615} {"train_loss": -40.338096618652344, "global_step": 195461, "epoch": 1615} {"train_loss": -41.676753997802734, "global_step": 195462, "epoch": 1615} {"train_loss": -41.498958587646484, "global_step": 195463, "epoch": 1615} {"train_loss": -41.580894470214844, "global_step": 195464, "epoch": 1615} {"train_loss": -39.70684814453125, "global_step": 195465, "epoch": 1615} {"train_loss": -40.8729133605957, "global_step": 195466, "epoch": 1615} {"train_loss": -41.863136291503906, "global_step": 195467, "epoch": 1615} {"train_loss": -41.014617919921875, "global_step": 195468, "epoch": 1615} {"train_loss": -41.995235443115234, "global_step": 195469, "epoch": 1615} {"train_loss": -41.660308837890625, "global_step": 195470, "epoch": 1615} {"train_loss": -41.08487319946289, "global_step": 195471, "epoch": 1615} {"train_loss": -41.75532913208008, "global_step": 195472, "epoch": 1615} {"train_loss": -41.97724533081055, "global_step": 195473, "epoch": 1615} {"train_loss": -41.567970275878906, "global_step": 195474, "epoch": 1615} {"train_loss": -42.21963882446289, "global_step": 195475, "epoch": 1615} {"train_loss": -41.81410598754883, "global_step": 195476, "epoch": 1615} {"train_loss": -42.20652389526367, "global_step": 195477, "epoch": 1615} {"train_loss": -41.84617233276367, "global_step": 195478, "epoch": 1615} {"train_loss": -42.16163635253906, "global_step": 195479, "epoch": 1615} {"train_loss": -41.99650192260742, "global_step": 195480, "epoch": 1615} {"train_loss": -42.83903121948242, "global_step": 195481, "epoch": 1615} {"train_loss": -42.230865478515625, "global_step": 195482, "epoch": 1615} {"train_loss": -42.45178985595703, "global_step": 195483, "epoch": 1615} {"train_loss": -41.63337326049805, "global_step": 195484, "epoch": 1615} {"train_loss": -42.613563537597656, "global_step": 195485, "epoch": 1615} {"train_loss": -41.9605712890625, "global_step": 195486, "epoch": 1615} {"train_loss": -42.51826095581055, "global_step": 195487, "epoch": 1615} {"train_loss": -42.74924850463867, "global_step": 195488, "epoch": 1615} {"train_loss": -42.2288703918457, "global_step": 195489, "epoch": 1615} {"train_loss": -43.01393508911133, "global_step": 195490, "epoch": 1615} {"train_loss": -42.783935546875, "global_step": 195491, "epoch": 1615} {"train_loss": -42.669010162353516, "global_step": 195492, "epoch": 1615} {"train_loss": -42.90350341796875, "global_step": 195493, "epoch": 1615} {"train_loss": -42.794918060302734, "global_step": 195494, "epoch": 1615} {"train_loss": -43.018577575683594, "global_step": 195495, "epoch": 1615} {"train_loss": -42.78836441040039, "global_step": 195496, "epoch": 1615} {"train_loss": -42.772029876708984, "global_step": 195497, "epoch": 1615} {"train_loss": -41.45155715942383, "global_step": 195498, "epoch": 1615} {"train_loss": -42.78407669067383, "global_step": 195499, "epoch": 1615} {"train_loss": -42.89652633666992, "global_step": 195500, "epoch": 1615} {"train_loss": -39.68018341064453, "global_step": 195501, "epoch": 1615} {"train_loss": -40.00265121459961, "global_step": 195502, "epoch": 1615} {"train_loss": -40.884334564208984, "global_step": 195503, "epoch": 1615} {"train_loss": -41.49668884277344, "global_step": 195504, "epoch": 1615} {"train_loss": -42.284156799316406, "global_step": 195505, "epoch": 1615} {"train_loss": -42.490291595458984, "global_step": 195506, "epoch": 1615} {"train_loss": -39.26766586303711, "global_step": 195507, "epoch": 1615} {"train_loss": -40.50522994995117, "global_step": 195508, "epoch": 1615} {"train_loss": -37.72079849243164, "global_step": 195509, "epoch": 1615} {"train_loss": -36.30583190917969, "global_step": 195510, "epoch": 1615} {"train_loss": -31.64349365234375, "global_step": 195511, "epoch": 1615} {"train_loss": -38.9853630065918, "global_step": 195512, "epoch": 1615} {"train_loss": -38.141456604003906, "global_step": 195513, "epoch": 1615} {"train_loss": -34.978790283203125, "global_step": 195514, "epoch": 1615} {"train_loss": -39.128021240234375, "global_step": 195515, "epoch": 1615} {"train_loss": -36.111488342285156, "global_step": 195516, "epoch": 1615} {"train_loss": -37.833919525146484, "global_step": 195517, "epoch": 1615} {"train_loss": -33.97907257080078, "global_step": 195518, "epoch": 1615} {"train_loss": -19.141286849975586, "global_step": 195519, "epoch": 1615} {"train_loss": -38.18410873413086, "global_step": 195520, "epoch": 1615} {"train_loss": -36.0153694152832, "global_step": 195521, "epoch": 1615} {"train_loss": -32.982200622558594, "global_step": 195522, "epoch": 1615} {"train_loss": -34.21760940551758, "global_step": 195523, "epoch": 1615} {"train_loss": -36.121490478515625, "global_step": 195524, "epoch": 1615} {"train_loss": -37.618011474609375, "global_step": 195525, "epoch": 1615} {"train_loss": -38.42988204956055, "global_step": 195526, "epoch": 1615} {"train_loss": -38.83075714111328, "global_step": 195527, "epoch": 1615} {"train_loss": -38.27708435058594, "global_step": 195528, "epoch": 1615} {"train_loss": -38.80501174926758, "global_step": 195529, "epoch": 1615} {"train_loss": -38.99386215209961, "global_step": 195530, "epoch": 1615} {"train_loss": -37.18035888671875, "global_step": 195531, "epoch": 1615} {"train_loss": -38.065914154052734, "global_step": 195532, "epoch": 1615} {"train_loss": -37.7042236328125, "global_step": 195533, "epoch": 1615} {"train_loss": -39.8321533203125, "global_step": 195534, "epoch": 1615} {"train_loss": -40.220510482788086, "global_step": 195535, "epoch": 1615, "val_loss": 2542246.0} {"train_loss": -40.03815460205078, "global_step": 195536, "epoch": 1616} {"train_loss": -40.09298324584961, "global_step": 195537, "epoch": 1616} {"train_loss": -39.364013671875, "global_step": 195538, "epoch": 1616} {"train_loss": -39.264617919921875, "global_step": 195539, "epoch": 1616} {"train_loss": -37.244476318359375, "global_step": 195540, "epoch": 1616} {"train_loss": -40.711029052734375, "global_step": 195541, "epoch": 1616} {"train_loss": -39.84774398803711, "global_step": 195542, "epoch": 1616} {"train_loss": -41.040809631347656, "global_step": 195543, "epoch": 1616} {"train_loss": -38.9932975769043, "global_step": 195544, "epoch": 1616} {"train_loss": -40.601566314697266, "global_step": 195545, "epoch": 1616} {"train_loss": -39.283790588378906, "global_step": 195546, "epoch": 1616} {"train_loss": -40.273616790771484, "global_step": 195547, "epoch": 1616} {"train_loss": -40.48539352416992, "global_step": 195548, "epoch": 1616} {"train_loss": -39.58063888549805, "global_step": 195549, "epoch": 1616} {"train_loss": -40.21570587158203, "global_step": 195550, "epoch": 1616} {"train_loss": -39.49854278564453, "global_step": 195551, "epoch": 1616} {"train_loss": -40.415950775146484, "global_step": 195552, "epoch": 1616} {"train_loss": -39.79331588745117, "global_step": 195553, "epoch": 1616} {"train_loss": -40.06243896484375, "global_step": 195554, "epoch": 1616} {"train_loss": -41.150264739990234, "global_step": 195555, "epoch": 1616} {"train_loss": -40.418983459472656, "global_step": 195556, "epoch": 1616} {"train_loss": -40.32927322387695, "global_step": 195557, "epoch": 1616} {"train_loss": -40.8828010559082, "global_step": 195558, "epoch": 1616} {"train_loss": -41.374454498291016, "global_step": 195559, "epoch": 1616} {"train_loss": -40.476314544677734, "global_step": 195560, "epoch": 1616} {"train_loss": -41.77298355102539, "global_step": 195561, "epoch": 1616} {"train_loss": -40.970088958740234, "global_step": 195562, "epoch": 1616} {"train_loss": -41.183223724365234, "global_step": 195563, "epoch": 1616} {"train_loss": -41.08376693725586, "global_step": 195564, "epoch": 1616} {"train_loss": -41.638179779052734, "global_step": 195565, "epoch": 1616} {"train_loss": -41.44356155395508, "global_step": 195566, "epoch": 1616} {"train_loss": -41.0611572265625, "global_step": 195567, "epoch": 1616} {"train_loss": -42.16080856323242, "global_step": 195568, "epoch": 1616} {"train_loss": -41.524169921875, "global_step": 195569, "epoch": 1616} {"train_loss": -41.04033279418945, "global_step": 195570, "epoch": 1616} {"train_loss": -41.67362594604492, "global_step": 195571, "epoch": 1616} {"train_loss": -42.14541244506836, "global_step": 195572, "epoch": 1616} {"train_loss": -41.9632453918457, "global_step": 195573, "epoch": 1616} {"train_loss": -42.082515716552734, "global_step": 195574, "epoch": 1616} {"train_loss": -41.708709716796875, "global_step": 195575, "epoch": 1616} {"train_loss": -41.66357421875, "global_step": 195576, "epoch": 1616} {"train_loss": -42.11183166503906, "global_step": 195577, "epoch": 1616} {"train_loss": -42.154144287109375, "global_step": 195578, "epoch": 1616} {"train_loss": -41.75345993041992, "global_step": 195579, "epoch": 1616} {"train_loss": -42.04146957397461, "global_step": 195580, "epoch": 1616} {"train_loss": -41.68722152709961, "global_step": 195581, "epoch": 1616} {"train_loss": -42.63568115234375, "global_step": 195582, "epoch": 1616} {"train_loss": -41.86056137084961, "global_step": 195583, "epoch": 1616} {"train_loss": -40.836734771728516, "global_step": 195584, "epoch": 1616} {"train_loss": -42.61526107788086, "global_step": 195585, "epoch": 1616} {"train_loss": -42.71503829956055, "global_step": 195586, "epoch": 1616} {"train_loss": -41.635257720947266, "global_step": 195587, "epoch": 1616} {"train_loss": -42.605464935302734, "global_step": 195588, "epoch": 1616} {"train_loss": -42.124629974365234, "global_step": 195589, "epoch": 1616} {"train_loss": -42.25330352783203, "global_step": 195590, "epoch": 1616} {"train_loss": -41.86088943481445, "global_step": 195591, "epoch": 1616} {"train_loss": -42.66160202026367, "global_step": 195592, "epoch": 1616} {"train_loss": -42.683021545410156, "global_step": 195593, "epoch": 1616} {"train_loss": -41.1789436340332, "global_step": 195594, "epoch": 1616} {"train_loss": -41.792301177978516, "global_step": 195595, "epoch": 1616} {"train_loss": -42.89320755004883, "global_step": 195596, "epoch": 1616} {"train_loss": -42.17119598388672, "global_step": 195597, "epoch": 1616} {"train_loss": -42.21533203125, "global_step": 195598, "epoch": 1616} {"train_loss": -42.6669807434082, "global_step": 195599, "epoch": 1616} {"train_loss": -42.31863021850586, "global_step": 195600, "epoch": 1616} {"train_loss": -42.58264923095703, "global_step": 195601, "epoch": 1616} {"train_loss": -41.66971969604492, "global_step": 195602, "epoch": 1616} {"train_loss": -43.2287712097168, "global_step": 195603, "epoch": 1616} {"train_loss": -42.43966293334961, "global_step": 195604, "epoch": 1616} {"train_loss": -42.72705078125, "global_step": 195605, "epoch": 1616} {"train_loss": -41.8659553527832, "global_step": 195606, "epoch": 1616} {"train_loss": -42.82196044921875, "global_step": 195607, "epoch": 1616} {"train_loss": -41.79359817504883, "global_step": 195608, "epoch": 1616} {"train_loss": -41.59247970581055, "global_step": 195609, "epoch": 1616} {"train_loss": -42.06104278564453, "global_step": 195610, "epoch": 1616} {"train_loss": -41.86235809326172, "global_step": 195611, "epoch": 1616} {"train_loss": -42.5606803894043, "global_step": 195612, "epoch": 1616} {"train_loss": -42.363765716552734, "global_step": 195613, "epoch": 1616} {"train_loss": -42.6559944152832, "global_step": 195614, "epoch": 1616} {"train_loss": -42.625099182128906, "global_step": 195615, "epoch": 1616} {"train_loss": -41.80562210083008, "global_step": 195616, "epoch": 1616} {"train_loss": -40.66291046142578, "global_step": 195617, "epoch": 1616} {"train_loss": -39.68351364135742, "global_step": 195618, "epoch": 1616} {"train_loss": -38.595619201660156, "global_step": 195619, "epoch": 1616} {"train_loss": -36.08498764038086, "global_step": 195620, "epoch": 1616} {"train_loss": -40.623287200927734, "global_step": 195621, "epoch": 1616} {"train_loss": -33.20717239379883, "global_step": 195622, "epoch": 1616} {"train_loss": -28.27284812927246, "global_step": 195623, "epoch": 1616} {"train_loss": -26.5141544342041, "global_step": 195624, "epoch": 1616} {"train_loss": -28.8566837310791, "global_step": 195625, "epoch": 1616} {"train_loss": -28.0136775970459, "global_step": 195626, "epoch": 1616} {"train_loss": -29.68283462524414, "global_step": 195627, "epoch": 1616} {"train_loss": -28.866790771484375, "global_step": 195628, "epoch": 1616} {"train_loss": -31.71209144592285, "global_step": 195629, "epoch": 1616} {"train_loss": -31.5723819732666, "global_step": 195630, "epoch": 1616} {"train_loss": -30.26008415222168, "global_step": 195631, "epoch": 1616} {"train_loss": -32.270748138427734, "global_step": 195632, "epoch": 1616} {"train_loss": -32.6484260559082, "global_step": 195633, "epoch": 1616} {"train_loss": -33.200252532958984, "global_step": 195634, "epoch": 1616} {"train_loss": -32.24221420288086, "global_step": 195635, "epoch": 1616} {"train_loss": -33.6048698425293, "global_step": 195636, "epoch": 1616} {"train_loss": -33.262298583984375, "global_step": 195637, "epoch": 1616} {"train_loss": -32.428157806396484, "global_step": 195638, "epoch": 1616} {"train_loss": -33.84556579589844, "global_step": 195639, "epoch": 1616} {"train_loss": -35.12986755371094, "global_step": 195640, "epoch": 1616} {"train_loss": -34.55402755737305, "global_step": 195641, "epoch": 1616} {"train_loss": -34.04551315307617, "global_step": 195642, "epoch": 1616} {"train_loss": -34.76213455200195, "global_step": 195643, "epoch": 1616} {"train_loss": -35.0351448059082, "global_step": 195644, "epoch": 1616} {"train_loss": -35.32147979736328, "global_step": 195645, "epoch": 1616} {"train_loss": -35.17705535888672, "global_step": 195646, "epoch": 1616} {"train_loss": -35.45392990112305, "global_step": 195647, "epoch": 1616} {"train_loss": -35.434608459472656, "global_step": 195648, "epoch": 1616} {"train_loss": -35.307674407958984, "global_step": 195649, "epoch": 1616} {"train_loss": -35.6312255859375, "global_step": 195650, "epoch": 1616} {"train_loss": -35.56929397583008, "global_step": 195651, "epoch": 1616} {"train_loss": -35.43354415893555, "global_step": 195652, "epoch": 1616} {"train_loss": -35.57724380493164, "global_step": 195653, "epoch": 1616} {"train_loss": -35.03102493286133, "global_step": 195654, "epoch": 1616} {"train_loss": -35.95423126220703, "global_step": 195655, "epoch": 1616} {"train_loss": -38.92596878493128, "global_step": 195656, "epoch": 1616, "val_loss": 2633547.25} {"train_loss": -35.642333984375, "global_step": 195657, "epoch": 1617} {"train_loss": -35.672061920166016, "global_step": 195658, "epoch": 1617} {"train_loss": -35.666770935058594, "global_step": 195659, "epoch": 1617} {"train_loss": -36.478145599365234, "global_step": 195660, "epoch": 1617} {"train_loss": -36.16532516479492, "global_step": 195661, "epoch": 1617} {"train_loss": -36.37324142456055, "global_step": 195662, "epoch": 1617} {"train_loss": -36.41780090332031, "global_step": 195663, "epoch": 1617} {"train_loss": -36.73756790161133, "global_step": 195664, "epoch": 1617} {"train_loss": -36.84836196899414, "global_step": 195665, "epoch": 1617} {"train_loss": -36.98151397705078, "global_step": 195666, "epoch": 1617} {"train_loss": -36.888427734375, "global_step": 195667, "epoch": 1617} {"train_loss": -37.5501823425293, "global_step": 195668, "epoch": 1617} {"train_loss": -37.46474075317383, "global_step": 195669, "epoch": 1617} {"train_loss": -37.22066879272461, "global_step": 195670, "epoch": 1617} {"train_loss": -37.791542053222656, "global_step": 195671, "epoch": 1617} {"train_loss": -37.499298095703125, "global_step": 195672, "epoch": 1617} {"train_loss": -37.558692932128906, "global_step": 195673, "epoch": 1617} {"train_loss": -37.721797943115234, "global_step": 195674, "epoch": 1617} {"train_loss": -37.26755905151367, "global_step": 195675, "epoch": 1617} {"train_loss": -36.8496208190918, "global_step": 195676, "epoch": 1617} {"train_loss": -33.848751068115234, "global_step": 195677, "epoch": 1617} {"train_loss": -33.79692077636719, "global_step": 195678, "epoch": 1617} {"train_loss": -38.14045715332031, "global_step": 195679, "epoch": 1617} {"train_loss": -34.52185821533203, "global_step": 195680, "epoch": 1617} {"train_loss": -37.92292404174805, "global_step": 195681, "epoch": 1617} {"train_loss": -36.17803955078125, "global_step": 195682, "epoch": 1617} {"train_loss": -37.705875396728516, "global_step": 195683, "epoch": 1617} {"train_loss": -35.5914421081543, "global_step": 195684, "epoch": 1617} {"train_loss": -38.0396728515625, "global_step": 195685, "epoch": 1617} {"train_loss": -35.69993209838867, "global_step": 195686, "epoch": 1617} {"train_loss": -38.17412185668945, "global_step": 195687, "epoch": 1617} {"train_loss": -37.134857177734375, "global_step": 195688, "epoch": 1617} {"train_loss": -37.739051818847656, "global_step": 195689, "epoch": 1617} {"train_loss": -38.788856506347656, "global_step": 195690, "epoch": 1617} {"train_loss": -37.020076751708984, "global_step": 195691, "epoch": 1617} {"train_loss": -38.09626770019531, "global_step": 195692, "epoch": 1617} {"train_loss": -36.14913558959961, "global_step": 195693, "epoch": 1617} {"train_loss": -35.229610443115234, "global_step": 195694, "epoch": 1617} {"train_loss": -36.39775466918945, "global_step": 195695, "epoch": 1617} {"train_loss": -37.83210754394531, "global_step": 195696, "epoch": 1617} {"train_loss": -36.04869079589844, "global_step": 195697, "epoch": 1617} {"train_loss": -38.377357482910156, "global_step": 195698, "epoch": 1617} {"train_loss": -37.60334396362305, "global_step": 195699, "epoch": 1617} {"train_loss": -37.996620178222656, "global_step": 195700, "epoch": 1617} {"train_loss": -38.19174575805664, "global_step": 195701, "epoch": 1617} {"train_loss": -37.96403121948242, "global_step": 195702, "epoch": 1617} {"train_loss": -38.53635787963867, "global_step": 195703, "epoch": 1617} {"train_loss": -38.49866485595703, "global_step": 195704, "epoch": 1617} {"train_loss": -37.59927749633789, "global_step": 195705, "epoch": 1617} {"train_loss": -37.86642074584961, "global_step": 195706, "epoch": 1617} {"train_loss": -38.337074279785156, "global_step": 195707, "epoch": 1617} {"train_loss": -38.993534088134766, "global_step": 195708, "epoch": 1617} {"train_loss": -38.822139739990234, "global_step": 195709, "epoch": 1617} {"train_loss": -38.62622833251953, "global_step": 195710, "epoch": 1617} {"train_loss": -38.775264739990234, "global_step": 195711, "epoch": 1617} {"train_loss": -39.33978271484375, "global_step": 195712, "epoch": 1617} {"train_loss": -38.35756301879883, "global_step": 195713, "epoch": 1617} {"train_loss": -38.403133392333984, "global_step": 195714, "epoch": 1617} {"train_loss": -39.158355712890625, "global_step": 195715, "epoch": 1617} {"train_loss": -38.56417465209961, "global_step": 195716, "epoch": 1617} {"train_loss": -39.09564208984375, "global_step": 195717, "epoch": 1617} {"train_loss": -39.25153350830078, "global_step": 195718, "epoch": 1617} {"train_loss": -39.15911102294922, "global_step": 195719, "epoch": 1617} {"train_loss": -38.89767837524414, "global_step": 195720, "epoch": 1617} {"train_loss": -39.775543212890625, "global_step": 195721, "epoch": 1617} {"train_loss": -39.40350341796875, "global_step": 195722, "epoch": 1617} {"train_loss": -39.299373626708984, "global_step": 195723, "epoch": 1617} {"train_loss": -39.418704986572266, "global_step": 195724, "epoch": 1617} {"train_loss": -39.39395523071289, "global_step": 195725, "epoch": 1617} {"train_loss": -39.10919189453125, "global_step": 195726, "epoch": 1617} {"train_loss": -39.66050338745117, "global_step": 195727, "epoch": 1617} {"train_loss": -38.87189865112305, "global_step": 195728, "epoch": 1617} {"train_loss": -38.92417526245117, "global_step": 195729, "epoch": 1617} {"train_loss": -39.1182861328125, "global_step": 195730, "epoch": 1617} {"train_loss": -39.02956771850586, "global_step": 195731, "epoch": 1617} {"train_loss": -38.56824493408203, "global_step": 195732, "epoch": 1617} {"train_loss": -37.922996520996094, "global_step": 195733, "epoch": 1617} {"train_loss": -39.13204574584961, "global_step": 195734, "epoch": 1617} {"train_loss": -40.05781555175781, "global_step": 195735, "epoch": 1617} {"train_loss": -39.37787628173828, "global_step": 195736, "epoch": 1617} {"train_loss": -38.1967887878418, "global_step": 195737, "epoch": 1617} {"train_loss": -38.652076721191406, "global_step": 195738, "epoch": 1617} {"train_loss": -39.98964309692383, "global_step": 195739, "epoch": 1617} {"train_loss": -37.447242736816406, "global_step": 195740, "epoch": 1617} {"train_loss": -39.644447326660156, "global_step": 195741, "epoch": 1617} {"train_loss": -39.93001937866211, "global_step": 195742, "epoch": 1617} {"train_loss": -39.64790725708008, "global_step": 195743, "epoch": 1617} {"train_loss": -38.08622360229492, "global_step": 195744, "epoch": 1617} {"train_loss": -40.08842849731445, "global_step": 195745, "epoch": 1617} {"train_loss": -39.33285140991211, "global_step": 195746, "epoch": 1617} {"train_loss": -39.455039978027344, "global_step": 195747, "epoch": 1617} {"train_loss": -39.009857177734375, "global_step": 195748, "epoch": 1617} {"train_loss": -39.071834564208984, "global_step": 195749, "epoch": 1617} {"train_loss": -39.83352279663086, "global_step": 195750, "epoch": 1617} {"train_loss": -37.687965393066406, "global_step": 195751, "epoch": 1617} {"train_loss": -38.96002197265625, "global_step": 195752, "epoch": 1617} {"train_loss": -38.9648323059082, "global_step": 195753, "epoch": 1617} {"train_loss": -38.904747009277344, "global_step": 195754, "epoch": 1617} {"train_loss": -34.940208435058594, "global_step": 195755, "epoch": 1617} {"train_loss": -36.888851165771484, "global_step": 195756, "epoch": 1617} {"train_loss": -38.70150375366211, "global_step": 195757, "epoch": 1617} {"train_loss": -39.303192138671875, "global_step": 195758, "epoch": 1617} {"train_loss": -37.77030563354492, "global_step": 195759, "epoch": 1617} {"train_loss": -38.931800842285156, "global_step": 195760, "epoch": 1617} {"train_loss": -32.52851486206055, "global_step": 195761, "epoch": 1617} {"train_loss": -38.66341781616211, "global_step": 195762, "epoch": 1617} {"train_loss": -36.559356689453125, "global_step": 195763, "epoch": 1617} {"train_loss": -34.39582443237305, "global_step": 195764, "epoch": 1617} {"train_loss": -38.05662155151367, "global_step": 195765, "epoch": 1617} {"train_loss": -38.91538619995117, "global_step": 195766, "epoch": 1617} {"train_loss": -36.04706954956055, "global_step": 195767, "epoch": 1617} {"train_loss": -31.411975860595703, "global_step": 195768, "epoch": 1617} {"train_loss": -35.3884162902832, "global_step": 195769, "epoch": 1617} {"train_loss": -35.472328186035156, "global_step": 195770, "epoch": 1617} {"train_loss": -35.60807418823242, "global_step": 195771, "epoch": 1617} {"train_loss": -38.40769577026367, "global_step": 195772, "epoch": 1617} {"train_loss": -36.912837982177734, "global_step": 195773, "epoch": 1617} {"train_loss": -36.862770080566406, "global_step": 195774, "epoch": 1617} {"train_loss": -38.495948791503906, "global_step": 195775, "epoch": 1617} {"train_loss": -38.445831298828125, "global_step": 195776, "epoch": 1617} {"train_loss": -37.753802275854696, "global_step": 195777, "epoch": 1617, "val_loss": 3115987.25} {"train_loss": -37.904052734375, "global_step": 195778, "epoch": 1618} {"train_loss": -36.6382942199707, "global_step": 195779, "epoch": 1618} {"train_loss": -37.63812255859375, "global_step": 195780, "epoch": 1618} {"train_loss": -35.906612396240234, "global_step": 195781, "epoch": 1618} {"train_loss": -36.912994384765625, "global_step": 195782, "epoch": 1618} {"train_loss": -36.85735321044922, "global_step": 195783, "epoch": 1618} {"train_loss": -38.072322845458984, "global_step": 195784, "epoch": 1618} {"train_loss": -38.47747802734375, "global_step": 195785, "epoch": 1618} {"train_loss": -36.935062408447266, "global_step": 195786, "epoch": 1618} {"train_loss": -38.490631103515625, "global_step": 195787, "epoch": 1618} {"train_loss": -37.51549530029297, "global_step": 195788, "epoch": 1618} {"train_loss": -37.5815315246582, "global_step": 195789, "epoch": 1618} {"train_loss": -34.746089935302734, "global_step": 195790, "epoch": 1618} {"train_loss": -38.93228530883789, "global_step": 195791, "epoch": 1618} {"train_loss": -36.36073303222656, "global_step": 195792, "epoch": 1618} {"train_loss": -37.87232208251953, "global_step": 195793, "epoch": 1618} {"train_loss": -29.757678985595703, "global_step": 195794, "epoch": 1618} {"train_loss": -37.89580535888672, "global_step": 195795, "epoch": 1618} {"train_loss": -38.76445388793945, "global_step": 195796, "epoch": 1618} {"train_loss": -36.28036117553711, "global_step": 195797, "epoch": 1618} {"train_loss": -36.343910217285156, "global_step": 195798, "epoch": 1618} {"train_loss": -36.41067886352539, "global_step": 195799, "epoch": 1618} {"train_loss": -36.32259750366211, "global_step": 195800, "epoch": 1618} {"train_loss": -34.60942840576172, "global_step": 195801, "epoch": 1618} {"train_loss": -37.25834655761719, "global_step": 195802, "epoch": 1618} {"train_loss": -38.29283142089844, "global_step": 195803, "epoch": 1618} {"train_loss": -37.367671966552734, "global_step": 195804, "epoch": 1618} {"train_loss": -38.29420852661133, "global_step": 195805, "epoch": 1618} {"train_loss": -36.82009506225586, "global_step": 195806, "epoch": 1618} {"train_loss": -38.12561798095703, "global_step": 195807, "epoch": 1618} {"train_loss": -37.40346145629883, "global_step": 195808, "epoch": 1618} {"train_loss": -35.7253532409668, "global_step": 195809, "epoch": 1618} {"train_loss": -38.720489501953125, "global_step": 195810, "epoch": 1618} {"train_loss": -37.459110260009766, "global_step": 195811, "epoch": 1618} {"train_loss": -37.331905364990234, "global_step": 195812, "epoch": 1618} {"train_loss": -36.844051361083984, "global_step": 195813, "epoch": 1618} {"train_loss": -36.77567672729492, "global_step": 195814, "epoch": 1618} {"train_loss": -37.89142990112305, "global_step": 195815, "epoch": 1618} {"train_loss": -38.07716369628906, "global_step": 195816, "epoch": 1618} {"train_loss": -36.90119552612305, "global_step": 195817, "epoch": 1618} {"train_loss": -37.656982421875, "global_step": 195818, "epoch": 1618} {"train_loss": -38.116390228271484, "global_step": 195819, "epoch": 1618} {"train_loss": -39.073341369628906, "global_step": 195820, "epoch": 1618} {"train_loss": -36.86310577392578, "global_step": 195821, "epoch": 1618} {"train_loss": -38.13437271118164, "global_step": 195822, "epoch": 1618} {"train_loss": -38.742984771728516, "global_step": 195823, "epoch": 1618} {"train_loss": -38.68276596069336, "global_step": 195824, "epoch": 1618} {"train_loss": -38.594173431396484, "global_step": 195825, "epoch": 1618} {"train_loss": -38.41546630859375, "global_step": 195826, "epoch": 1618} {"train_loss": -37.825233459472656, "global_step": 195827, "epoch": 1618} {"train_loss": -37.87953567504883, "global_step": 195828, "epoch": 1618} {"train_loss": -39.00103759765625, "global_step": 195829, "epoch": 1618} {"train_loss": -38.68168258666992, "global_step": 195830, "epoch": 1618} {"train_loss": -38.57246017456055, "global_step": 195831, "epoch": 1618} {"train_loss": -39.0613899230957, "global_step": 195832, "epoch": 1618} {"train_loss": -38.635860443115234, "global_step": 195833, "epoch": 1618} {"train_loss": -39.12108612060547, "global_step": 195834, "epoch": 1618} {"train_loss": -39.50179672241211, "global_step": 195835, "epoch": 1618} {"train_loss": -37.6138916015625, "global_step": 195836, "epoch": 1618} {"train_loss": -39.17428970336914, "global_step": 195837, "epoch": 1618} {"train_loss": -37.552791595458984, "global_step": 195838, "epoch": 1618} {"train_loss": -37.86194610595703, "global_step": 195839, "epoch": 1618} {"train_loss": -39.73042678833008, "global_step": 195840, "epoch": 1618} {"train_loss": -39.44907760620117, "global_step": 195841, "epoch": 1618} {"train_loss": -39.20266342163086, "global_step": 195842, "epoch": 1618} {"train_loss": -39.521453857421875, "global_step": 195843, "epoch": 1618} {"train_loss": -39.039154052734375, "global_step": 195844, "epoch": 1618} {"train_loss": -39.1442756652832, "global_step": 195845, "epoch": 1618} {"train_loss": -38.94017791748047, "global_step": 195846, "epoch": 1618} {"train_loss": -38.962066650390625, "global_step": 195847, "epoch": 1618} {"train_loss": -37.40272903442383, "global_step": 195848, "epoch": 1618} {"train_loss": -38.8691520690918, "global_step": 195849, "epoch": 1618} {"train_loss": -39.070594787597656, "global_step": 195850, "epoch": 1618} {"train_loss": -38.52788162231445, "global_step": 195851, "epoch": 1618} {"train_loss": -39.37227249145508, "global_step": 195852, "epoch": 1618} {"train_loss": -39.9143180847168, "global_step": 195853, "epoch": 1618} {"train_loss": -39.75407791137695, "global_step": 195854, "epoch": 1618} {"train_loss": -39.8119010925293, "global_step": 195855, "epoch": 1618} {"train_loss": -40.05896759033203, "global_step": 195856, "epoch": 1618} {"train_loss": -39.779029846191406, "global_step": 195857, "epoch": 1618} {"train_loss": -39.39278030395508, "global_step": 195858, "epoch": 1618} {"train_loss": -38.10227584838867, "global_step": 195859, "epoch": 1618} {"train_loss": -36.722564697265625, "global_step": 195860, "epoch": 1618} {"train_loss": -38.95670700073242, "global_step": 195861, "epoch": 1618} {"train_loss": -38.753963470458984, "global_step": 195862, "epoch": 1618} {"train_loss": -37.75042724609375, "global_step": 195863, "epoch": 1618} {"train_loss": -39.0606803894043, "global_step": 195864, "epoch": 1618} {"train_loss": -39.9265251159668, "global_step": 195865, "epoch": 1618} {"train_loss": -37.67555236816406, "global_step": 195866, "epoch": 1618} {"train_loss": -39.54851150512695, "global_step": 195867, "epoch": 1618} {"train_loss": -38.25726318359375, "global_step": 195868, "epoch": 1618} {"train_loss": -39.10085678100586, "global_step": 195869, "epoch": 1618} {"train_loss": -38.50287628173828, "global_step": 195870, "epoch": 1618} {"train_loss": -38.967315673828125, "global_step": 195871, "epoch": 1618} {"train_loss": -39.8969612121582, "global_step": 195872, "epoch": 1618} {"train_loss": -39.12135314941406, "global_step": 195873, "epoch": 1618} {"train_loss": -39.97217559814453, "global_step": 195874, "epoch": 1618} {"train_loss": -39.17163848876953, "global_step": 195875, "epoch": 1618} {"train_loss": -40.33773422241211, "global_step": 195876, "epoch": 1618} {"train_loss": -39.484310150146484, "global_step": 195877, "epoch": 1618} {"train_loss": -39.713619232177734, "global_step": 195878, "epoch": 1618} {"train_loss": -39.569480895996094, "global_step": 195879, "epoch": 1618} {"train_loss": -39.73023223876953, "global_step": 195880, "epoch": 1618} {"train_loss": -39.267494201660156, "global_step": 195881, "epoch": 1618} {"train_loss": -39.517311096191406, "global_step": 195882, "epoch": 1618} {"train_loss": -39.674407958984375, "global_step": 195883, "epoch": 1618} {"train_loss": -39.451560974121094, "global_step": 195884, "epoch": 1618} {"train_loss": -39.553104400634766, "global_step": 195885, "epoch": 1618} {"train_loss": -39.416683197021484, "global_step": 195886, "epoch": 1618} {"train_loss": -38.95376968383789, "global_step": 195887, "epoch": 1618} {"train_loss": -39.96958541870117, "global_step": 195888, "epoch": 1618} {"train_loss": -39.58294677734375, "global_step": 195889, "epoch": 1618} {"train_loss": -39.62758255004883, "global_step": 195890, "epoch": 1618} {"train_loss": -38.665645599365234, "global_step": 195891, "epoch": 1618} {"train_loss": -39.88568878173828, "global_step": 195892, "epoch": 1618} {"train_loss": -38.45838165283203, "global_step": 195893, "epoch": 1618} {"train_loss": -38.92594909667969, "global_step": 195894, "epoch": 1618} {"train_loss": -37.42457580566406, "global_step": 195895, "epoch": 1618} {"train_loss": -37.94101333618164, "global_step": 195896, "epoch": 1618} {"train_loss": -40.037353515625, "global_step": 195897, "epoch": 1618} {"train_loss": -38.323359055952594, "global_step": 195898, "epoch": 1618, "val_loss": 2574375.75} {"train_loss": -39.07651901245117, "global_step": 195899, "epoch": 1619} {"train_loss": -39.358673095703125, "global_step": 195900, "epoch": 1619} {"train_loss": -39.532135009765625, "global_step": 195901, "epoch": 1619} {"train_loss": -40.2188720703125, "global_step": 195902, "epoch": 1619} {"train_loss": -39.2242317199707, "global_step": 195903, "epoch": 1619} {"train_loss": -39.9989013671875, "global_step": 195904, "epoch": 1619} {"train_loss": -39.744056701660156, "global_step": 195905, "epoch": 1619} {"train_loss": -40.29826736450195, "global_step": 195906, "epoch": 1619} {"train_loss": -39.50352096557617, "global_step": 195907, "epoch": 1619} {"train_loss": -40.3580436706543, "global_step": 195908, "epoch": 1619} {"train_loss": -39.4273567199707, "global_step": 195909, "epoch": 1619} {"train_loss": -39.28095626831055, "global_step": 195910, "epoch": 1619} {"train_loss": -40.27399826049805, "global_step": 195911, "epoch": 1619} {"train_loss": -40.04478073120117, "global_step": 195912, "epoch": 1619} {"train_loss": -40.828086853027344, "global_step": 195913, "epoch": 1619} {"train_loss": -39.792457580566406, "global_step": 195914, "epoch": 1619} {"train_loss": -39.65529251098633, "global_step": 195915, "epoch": 1619} {"train_loss": -40.613033294677734, "global_step": 195916, "epoch": 1619} {"train_loss": -40.70427703857422, "global_step": 195917, "epoch": 1619} {"train_loss": -39.97337341308594, "global_step": 195918, "epoch": 1619} {"train_loss": -38.846961975097656, "global_step": 195919, "epoch": 1619} {"train_loss": -38.24877166748047, "global_step": 195920, "epoch": 1619} {"train_loss": -40.921634674072266, "global_step": 195921, "epoch": 1619} {"train_loss": -39.75212478637695, "global_step": 195922, "epoch": 1619} {"train_loss": -38.797821044921875, "global_step": 195923, "epoch": 1619} {"train_loss": -40.14683151245117, "global_step": 195924, "epoch": 1619} {"train_loss": -40.92169952392578, "global_step": 195925, "epoch": 1619} {"train_loss": -39.84824752807617, "global_step": 195926, "epoch": 1619} {"train_loss": -40.01985549926758, "global_step": 195927, "epoch": 1619} {"train_loss": -40.50297927856445, "global_step": 195928, "epoch": 1619} {"train_loss": -40.41444778442383, "global_step": 195929, "epoch": 1619} {"train_loss": -40.18301773071289, "global_step": 195930, "epoch": 1619} {"train_loss": -40.595481872558594, "global_step": 195931, "epoch": 1619} {"train_loss": -40.46224594116211, "global_step": 195932, "epoch": 1619} {"train_loss": -40.486629486083984, "global_step": 195933, "epoch": 1619} {"train_loss": -40.21125411987305, "global_step": 195934, "epoch": 1619} {"train_loss": -39.787662506103516, "global_step": 195935, "epoch": 1619} {"train_loss": -40.332984924316406, "global_step": 195936, "epoch": 1619} {"train_loss": -40.764339447021484, "global_step": 195937, "epoch": 1619} {"train_loss": -40.05446243286133, "global_step": 195938, "epoch": 1619} {"train_loss": -37.99587631225586, "global_step": 195939, "epoch": 1619} {"train_loss": -41.08599090576172, "global_step": 195940, "epoch": 1619} {"train_loss": -39.86057662963867, "global_step": 195941, "epoch": 1619} {"train_loss": -39.68634033203125, "global_step": 195942, "epoch": 1619} {"train_loss": -40.86091232299805, "global_step": 195943, "epoch": 1619} {"train_loss": -39.79805374145508, "global_step": 195944, "epoch": 1619} {"train_loss": -40.67356491088867, "global_step": 195945, "epoch": 1619} {"train_loss": -41.001953125, "global_step": 195946, "epoch": 1619} {"train_loss": -40.3751335144043, "global_step": 195947, "epoch": 1619} {"train_loss": -41.06464767456055, "global_step": 195948, "epoch": 1619} {"train_loss": -40.536346435546875, "global_step": 195949, "epoch": 1619} {"train_loss": -40.48784255981445, "global_step": 195950, "epoch": 1619} {"train_loss": -40.52337646484375, "global_step": 195951, "epoch": 1619} {"train_loss": -39.83768844604492, "global_step": 195952, "epoch": 1619} {"train_loss": -40.2607307434082, "global_step": 195953, "epoch": 1619} {"train_loss": -40.38691711425781, "global_step": 195954, "epoch": 1619} {"train_loss": -39.66145706176758, "global_step": 195955, "epoch": 1619} {"train_loss": -41.37947082519531, "global_step": 195956, "epoch": 1619} {"train_loss": -40.18672561645508, "global_step": 195957, "epoch": 1619} {"train_loss": -40.48915481567383, "global_step": 195958, "epoch": 1619} {"train_loss": -40.694244384765625, "global_step": 195959, "epoch": 1619} {"train_loss": -40.704524993896484, "global_step": 195960, "epoch": 1619} {"train_loss": -41.45519256591797, "global_step": 195961, "epoch": 1619} {"train_loss": -40.824825286865234, "global_step": 195962, "epoch": 1619} {"train_loss": -40.22089385986328, "global_step": 195963, "epoch": 1619} {"train_loss": -40.759315490722656, "global_step": 195964, "epoch": 1619} {"train_loss": -40.82151412963867, "global_step": 195965, "epoch": 1619} {"train_loss": -40.27822494506836, "global_step": 195966, "epoch": 1619} {"train_loss": -40.53310775756836, "global_step": 195967, "epoch": 1619} {"train_loss": -40.86173629760742, "global_step": 195968, "epoch": 1619} {"train_loss": -39.70164108276367, "global_step": 195969, "epoch": 1619} {"train_loss": -40.88243103027344, "global_step": 195970, "epoch": 1619} {"train_loss": -40.881813049316406, "global_step": 195971, "epoch": 1619} {"train_loss": -40.707881927490234, "global_step": 195972, "epoch": 1619} {"train_loss": -41.4237060546875, "global_step": 195973, "epoch": 1619} {"train_loss": -41.03262710571289, "global_step": 195974, "epoch": 1619} {"train_loss": -41.16078186035156, "global_step": 195975, "epoch": 1619} {"train_loss": -40.48154830932617, "global_step": 195976, "epoch": 1619} {"train_loss": -41.1521110534668, "global_step": 195977, "epoch": 1619} {"train_loss": -41.4595832824707, "global_step": 195978, "epoch": 1619} {"train_loss": -41.04267501831055, "global_step": 195979, "epoch": 1619} {"train_loss": -41.08229064941406, "global_step": 195980, "epoch": 1619} {"train_loss": -41.06441879272461, "global_step": 195981, "epoch": 1619} {"train_loss": -41.24412155151367, "global_step": 195982, "epoch": 1619} {"train_loss": -40.990169525146484, "global_step": 195983, "epoch": 1619} {"train_loss": -40.83760452270508, "global_step": 195984, "epoch": 1619} {"train_loss": -40.18809509277344, "global_step": 195985, "epoch": 1619} {"train_loss": -39.13918685913086, "global_step": 195986, "epoch": 1619} {"train_loss": -39.4201774597168, "global_step": 195987, "epoch": 1619} {"train_loss": -39.92326736450195, "global_step": 195988, "epoch": 1619} {"train_loss": -40.8660774230957, "global_step": 195989, "epoch": 1619} {"train_loss": -41.77183151245117, "global_step": 195990, "epoch": 1619} {"train_loss": -41.09486770629883, "global_step": 195991, "epoch": 1619} {"train_loss": -40.49379348754883, "global_step": 195992, "epoch": 1619} {"train_loss": -41.036861419677734, "global_step": 195993, "epoch": 1619} {"train_loss": -37.59305953979492, "global_step": 195994, "epoch": 1619} {"train_loss": -39.40092849731445, "global_step": 195995, "epoch": 1619} {"train_loss": -37.99222946166992, "global_step": 195996, "epoch": 1619} {"train_loss": -36.362789154052734, "global_step": 195997, "epoch": 1619} {"train_loss": -21.337779998779297, "global_step": 195998, "epoch": 1619} {"train_loss": -37.91434860229492, "global_step": 195999, "epoch": 1619} {"train_loss": -34.234619140625, "global_step": 196000, "epoch": 1619} {"train_loss": -36.048423767089844, "global_step": 196001, "epoch": 1619} {"train_loss": 5.95083475112915, "global_step": 196002, "epoch": 1619} {"train_loss": -30.254520416259766, "global_step": 196003, "epoch": 1619} {"train_loss": -24.71929168701172, "global_step": 196004, "epoch": 1619} {"train_loss": 13.874295234680176, "global_step": 196005, "epoch": 1619} {"train_loss": -22.50293731689453, "global_step": 196006, "epoch": 1619} {"train_loss": -9.834792137145996, "global_step": 196007, "epoch": 1619} {"train_loss": -4.358799934387207, "global_step": 196008, "epoch": 1619} {"train_loss": -28.48414421081543, "global_step": 196009, "epoch": 1619} {"train_loss": -5.252425670623779, "global_step": 196010, "epoch": 1619} {"train_loss": -13.941004753112793, "global_step": 196011, "epoch": 1619} {"train_loss": -24.08629608154297, "global_step": 196012, "epoch": 1619} {"train_loss": -32.11155700683594, "global_step": 196013, "epoch": 1619} {"train_loss": -25.74087905883789, "global_step": 196014, "epoch": 1619} {"train_loss": -28.11126136779785, "global_step": 196015, "epoch": 1619} {"train_loss": -27.466510772705078, "global_step": 196016, "epoch": 1619} {"train_loss": -32.65134811401367, "global_step": 196017, "epoch": 1619} {"train_loss": -33.098358154296875, "global_step": 196018, "epoch": 1619} {"train_loss": -36.93265589406668, "global_step": 196019, "epoch": 1619, "val_loss": 3441070.0} {"train_loss": -32.51435470581055, "global_step": 196020, "epoch": 1620} {"train_loss": -30.793745040893555, "global_step": 196021, "epoch": 1620} {"train_loss": -33.02516555786133, "global_step": 196022, "epoch": 1620} {"train_loss": -31.500843048095703, "global_step": 196023, "epoch": 1620} {"train_loss": -32.24970626831055, "global_step": 196024, "epoch": 1620} {"train_loss": -31.5539493560791, "global_step": 196025, "epoch": 1620} {"train_loss": -33.70564270019531, "global_step": 196026, "epoch": 1620} {"train_loss": -34.28654098510742, "global_step": 196027, "epoch": 1620} {"train_loss": -31.762313842773438, "global_step": 196028, "epoch": 1620} {"train_loss": -32.66019821166992, "global_step": 196029, "epoch": 1620} {"train_loss": -33.89060592651367, "global_step": 196030, "epoch": 1620} {"train_loss": -33.947383880615234, "global_step": 196031, "epoch": 1620} {"train_loss": -31.82187843322754, "global_step": 196032, "epoch": 1620} {"train_loss": -33.500083923339844, "global_step": 196033, "epoch": 1620} {"train_loss": -34.26512145996094, "global_step": 196034, "epoch": 1620} {"train_loss": -34.74559020996094, "global_step": 196035, "epoch": 1620} {"train_loss": -33.65597152709961, "global_step": 196036, "epoch": 1620} {"train_loss": -33.0455207824707, "global_step": 196037, "epoch": 1620} {"train_loss": -35.011714935302734, "global_step": 196038, "epoch": 1620} {"train_loss": -34.800716400146484, "global_step": 196039, "epoch": 1620} {"train_loss": -34.25495529174805, "global_step": 196040, "epoch": 1620} {"train_loss": -33.94961166381836, "global_step": 196041, "epoch": 1620} {"train_loss": -35.05427169799805, "global_step": 196042, "epoch": 1620} {"train_loss": -34.81647872924805, "global_step": 196043, "epoch": 1620} {"train_loss": -33.80506134033203, "global_step": 196044, "epoch": 1620} {"train_loss": -34.5893669128418, "global_step": 196045, "epoch": 1620} {"train_loss": -36.02693557739258, "global_step": 196046, "epoch": 1620} {"train_loss": -34.261146545410156, "global_step": 196047, "epoch": 1620} {"train_loss": -35.48234176635742, "global_step": 196048, "epoch": 1620} {"train_loss": -34.87437057495117, "global_step": 196049, "epoch": 1620} {"train_loss": -35.15595245361328, "global_step": 196050, "epoch": 1620} {"train_loss": -34.46769714355469, "global_step": 196051, "epoch": 1620} {"train_loss": -34.892330169677734, "global_step": 196052, "epoch": 1620} {"train_loss": -35.7021598815918, "global_step": 196053, "epoch": 1620} {"train_loss": -34.25892639160156, "global_step": 196054, "epoch": 1620} {"train_loss": -35.86550521850586, "global_step": 196055, "epoch": 1620} {"train_loss": -36.000267028808594, "global_step": 196056, "epoch": 1620} {"train_loss": -35.540130615234375, "global_step": 196057, "epoch": 1620} {"train_loss": -34.96647644042969, "global_step": 196058, "epoch": 1620} {"train_loss": -36.26296615600586, "global_step": 196059, "epoch": 1620} {"train_loss": -36.33312225341797, "global_step": 196060, "epoch": 1620} {"train_loss": -35.614173889160156, "global_step": 196061, "epoch": 1620} {"train_loss": -36.68623733520508, "global_step": 196062, "epoch": 1620} {"train_loss": -35.29594039916992, "global_step": 196063, "epoch": 1620} {"train_loss": -35.530948638916016, "global_step": 196064, "epoch": 1620} {"train_loss": -36.710723876953125, "global_step": 196065, "epoch": 1620} {"train_loss": -36.06973648071289, "global_step": 196066, "epoch": 1620} {"train_loss": -36.17546081542969, "global_step": 196067, "epoch": 1620} {"train_loss": -36.49761962890625, "global_step": 196068, "epoch": 1620} {"train_loss": -35.51593780517578, "global_step": 196069, "epoch": 1620} {"train_loss": -36.83232116699219, "global_step": 196070, "epoch": 1620} {"train_loss": -36.25736999511719, "global_step": 196071, "epoch": 1620} {"train_loss": -37.04781723022461, "global_step": 196072, "epoch": 1620} {"train_loss": -36.901485443115234, "global_step": 196073, "epoch": 1620} {"train_loss": -35.49592208862305, "global_step": 196074, "epoch": 1620} {"train_loss": -37.81398391723633, "global_step": 196075, "epoch": 1620} {"train_loss": -35.810523986816406, "global_step": 196076, "epoch": 1620} {"train_loss": -36.61981201171875, "global_step": 196077, "epoch": 1620} {"train_loss": -36.581329345703125, "global_step": 196078, "epoch": 1620} {"train_loss": -36.54951858520508, "global_step": 196079, "epoch": 1620} {"train_loss": -36.98476791381836, "global_step": 196080, "epoch": 1620} {"train_loss": -36.68292236328125, "global_step": 196081, "epoch": 1620} {"train_loss": -37.830440521240234, "global_step": 196082, "epoch": 1620} {"train_loss": -37.29345703125, "global_step": 196083, "epoch": 1620} {"train_loss": -37.56462097167969, "global_step": 196084, "epoch": 1620} {"train_loss": -37.38727951049805, "global_step": 196085, "epoch": 1620} {"train_loss": -37.88691329956055, "global_step": 196086, "epoch": 1620} {"train_loss": -35.946258544921875, "global_step": 196087, "epoch": 1620} {"train_loss": -37.18670654296875, "global_step": 196088, "epoch": 1620} {"train_loss": -37.53972625732422, "global_step": 196089, "epoch": 1620} {"train_loss": -37.43252182006836, "global_step": 196090, "epoch": 1620} {"train_loss": -36.67660903930664, "global_step": 196091, "epoch": 1620} {"train_loss": -37.93426513671875, "global_step": 196092, "epoch": 1620} {"train_loss": -35.93280792236328, "global_step": 196093, "epoch": 1620} {"train_loss": -37.541351318359375, "global_step": 196094, "epoch": 1620} {"train_loss": -37.72431564331055, "global_step": 196095, "epoch": 1620} {"train_loss": -37.77485275268555, "global_step": 196096, "epoch": 1620} {"train_loss": -37.42654800415039, "global_step": 196097, "epoch": 1620} {"train_loss": -37.76340103149414, "global_step": 196098, "epoch": 1620} {"train_loss": -37.5606803894043, "global_step": 196099, "epoch": 1620} {"train_loss": -38.53782272338867, "global_step": 196100, "epoch": 1620} {"train_loss": -37.08732604980469, "global_step": 196101, "epoch": 1620} {"train_loss": -37.19502258300781, "global_step": 196102, "epoch": 1620} {"train_loss": -36.8748893737793, "global_step": 196103, "epoch": 1620} {"train_loss": -37.623809814453125, "global_step": 196104, "epoch": 1620} {"train_loss": -36.471900939941406, "global_step": 196105, "epoch": 1620} {"train_loss": -38.48359298706055, "global_step": 196106, "epoch": 1620} {"train_loss": -37.26581573486328, "global_step": 196107, "epoch": 1620} {"train_loss": -37.367034912109375, "global_step": 196108, "epoch": 1620} {"train_loss": -37.591617584228516, "global_step": 196109, "epoch": 1620} {"train_loss": -38.17894744873047, "global_step": 196110, "epoch": 1620} {"train_loss": -37.89033889770508, "global_step": 196111, "epoch": 1620} {"train_loss": -38.424964904785156, "global_step": 196112, "epoch": 1620} {"train_loss": -37.93764877319336, "global_step": 196113, "epoch": 1620} {"train_loss": -38.42356491088867, "global_step": 196114, "epoch": 1620} {"train_loss": -38.816768646240234, "global_step": 196115, "epoch": 1620} {"train_loss": -37.73817825317383, "global_step": 196116, "epoch": 1620} {"train_loss": -38.60454177856445, "global_step": 196117, "epoch": 1620} {"train_loss": -38.33367919921875, "global_step": 196118, "epoch": 1620} {"train_loss": -38.276390075683594, "global_step": 196119, "epoch": 1620} {"train_loss": -39.14584732055664, "global_step": 196120, "epoch": 1620} {"train_loss": -38.848331451416016, "global_step": 196121, "epoch": 1620} {"train_loss": -38.27401351928711, "global_step": 196122, "epoch": 1620} {"train_loss": -38.37650680541992, "global_step": 196123, "epoch": 1620} {"train_loss": -38.90073776245117, "global_step": 196124, "epoch": 1620} {"train_loss": -38.9560546875, "global_step": 196125, "epoch": 1620} {"train_loss": -38.260860443115234, "global_step": 196126, "epoch": 1620} {"train_loss": -38.60087966918945, "global_step": 196127, "epoch": 1620} {"train_loss": -38.43037796020508, "global_step": 196128, "epoch": 1620} {"train_loss": -38.80110168457031, "global_step": 196129, "epoch": 1620} {"train_loss": -38.60099411010742, "global_step": 196130, "epoch": 1620} {"train_loss": -38.081966400146484, "global_step": 196131, "epoch": 1620} {"train_loss": -38.63509750366211, "global_step": 196132, "epoch": 1620} {"train_loss": -38.00944137573242, "global_step": 196133, "epoch": 1620} {"train_loss": -38.513824462890625, "global_step": 196134, "epoch": 1620} {"train_loss": -37.83789825439453, "global_step": 196135, "epoch": 1620} {"train_loss": -39.27309036254883, "global_step": 196136, "epoch": 1620} {"train_loss": -38.20287322998047, "global_step": 196137, "epoch": 1620} {"train_loss": -38.1955680847168, "global_step": 196138, "epoch": 1620} {"train_loss": -39.89374923706055, "global_step": 196139, "epoch": 1620} {"train_loss": -36.389514245277596, "global_step": 196140, "epoch": 1620, "val_loss": 2527236.0} {"train_loss": -39.05160140991211, "global_step": 196141, "epoch": 1621} {"train_loss": -38.30736541748047, "global_step": 196142, "epoch": 1621} {"train_loss": -34.547332763671875, "global_step": 196143, "epoch": 1621} {"train_loss": -28.093305587768555, "global_step": 196144, "epoch": 1621} {"train_loss": -35.623836517333984, "global_step": 196145, "epoch": 1621} {"train_loss": -38.59479522705078, "global_step": 196146, "epoch": 1621} {"train_loss": -37.208065032958984, "global_step": 196147, "epoch": 1621} {"train_loss": -37.8077278137207, "global_step": 196148, "epoch": 1621} {"train_loss": -38.038368225097656, "global_step": 196149, "epoch": 1621} {"train_loss": -37.493282318115234, "global_step": 196150, "epoch": 1621} {"train_loss": -39.6212158203125, "global_step": 196151, "epoch": 1621} {"train_loss": -38.90268325805664, "global_step": 196152, "epoch": 1621} {"train_loss": -39.125938415527344, "global_step": 196153, "epoch": 1621} {"train_loss": -39.04429244995117, "global_step": 196154, "epoch": 1621} {"train_loss": -38.906768798828125, "global_step": 196155, "epoch": 1621} {"train_loss": -40.12286376953125, "global_step": 196156, "epoch": 1621} {"train_loss": -38.95512771606445, "global_step": 196157, "epoch": 1621} {"train_loss": -38.95591354370117, "global_step": 196158, "epoch": 1621} {"train_loss": -38.55955123901367, "global_step": 196159, "epoch": 1621} {"train_loss": -39.08030319213867, "global_step": 196160, "epoch": 1621} {"train_loss": -40.1316032409668, "global_step": 196161, "epoch": 1621} {"train_loss": -38.27546691894531, "global_step": 196162, "epoch": 1621} {"train_loss": -38.425777435302734, "global_step": 196163, "epoch": 1621} {"train_loss": -39.13499069213867, "global_step": 196164, "epoch": 1621} {"train_loss": -38.33195114135742, "global_step": 196165, "epoch": 1621} {"train_loss": -38.981807708740234, "global_step": 196166, "epoch": 1621} {"train_loss": -39.1219367980957, "global_step": 196167, "epoch": 1621} {"train_loss": -39.186641693115234, "global_step": 196168, "epoch": 1621} {"train_loss": -39.09541320800781, "global_step": 196169, "epoch": 1621} {"train_loss": -38.71152877807617, "global_step": 196170, "epoch": 1621} {"train_loss": -39.67194366455078, "global_step": 196171, "epoch": 1621} {"train_loss": -39.097084045410156, "global_step": 196172, "epoch": 1621} {"train_loss": -38.9073600769043, "global_step": 196173, "epoch": 1621} {"train_loss": -38.7431755065918, "global_step": 196174, "epoch": 1621} {"train_loss": -39.29401779174805, "global_step": 196175, "epoch": 1621} {"train_loss": -38.48101043701172, "global_step": 196176, "epoch": 1621} {"train_loss": -39.10665512084961, "global_step": 196177, "epoch": 1621} {"train_loss": -38.456111907958984, "global_step": 196178, "epoch": 1621} {"train_loss": -38.23835754394531, "global_step": 196179, "epoch": 1621} {"train_loss": -39.07645797729492, "global_step": 196180, "epoch": 1621} {"train_loss": -39.29791259765625, "global_step": 196181, "epoch": 1621} {"train_loss": -39.31965255737305, "global_step": 196182, "epoch": 1621} {"train_loss": -39.571693420410156, "global_step": 196183, "epoch": 1621} {"train_loss": -39.23816680908203, "global_step": 196184, "epoch": 1621} {"train_loss": -40.0761604309082, "global_step": 196185, "epoch": 1621} {"train_loss": -39.639434814453125, "global_step": 196186, "epoch": 1621} {"train_loss": -38.1275749206543, "global_step": 196187, "epoch": 1621} {"train_loss": -39.6765251159668, "global_step": 196188, "epoch": 1621} {"train_loss": -38.68868637084961, "global_step": 196189, "epoch": 1621} {"train_loss": -40.34783172607422, "global_step": 196190, "epoch": 1621} {"train_loss": -39.25696563720703, "global_step": 196191, "epoch": 1621} {"train_loss": -40.374263763427734, "global_step": 196192, "epoch": 1621} {"train_loss": -39.49397659301758, "global_step": 196193, "epoch": 1621} {"train_loss": -38.602169036865234, "global_step": 196194, "epoch": 1621} {"train_loss": -38.03498458862305, "global_step": 196195, "epoch": 1621} {"train_loss": -38.73112487792969, "global_step": 196196, "epoch": 1621} {"train_loss": -39.75569534301758, "global_step": 196197, "epoch": 1621} {"train_loss": -39.46427536010742, "global_step": 196198, "epoch": 1621} {"train_loss": -39.347408294677734, "global_step": 196199, "epoch": 1621} {"train_loss": -39.57038116455078, "global_step": 196200, "epoch": 1621} {"train_loss": -37.801246643066406, "global_step": 196201, "epoch": 1621} {"train_loss": -38.18368148803711, "global_step": 196202, "epoch": 1621} {"train_loss": -36.87980651855469, "global_step": 196203, "epoch": 1621} {"train_loss": -39.17671585083008, "global_step": 196204, "epoch": 1621} {"train_loss": -37.29154586791992, "global_step": 196205, "epoch": 1621} {"train_loss": -38.239044189453125, "global_step": 196206, "epoch": 1621} {"train_loss": -37.140830993652344, "global_step": 196207, "epoch": 1621} {"train_loss": -38.98462677001953, "global_step": 196208, "epoch": 1621} {"train_loss": -38.39556884765625, "global_step": 196209, "epoch": 1621} {"train_loss": -40.085121154785156, "global_step": 196210, "epoch": 1621} {"train_loss": -39.05762481689453, "global_step": 196211, "epoch": 1621} {"train_loss": -39.77363586425781, "global_step": 196212, "epoch": 1621} {"train_loss": -38.5637092590332, "global_step": 196213, "epoch": 1621} {"train_loss": -39.32658386230469, "global_step": 196214, "epoch": 1621} {"train_loss": -40.14585494995117, "global_step": 196215, "epoch": 1621} {"train_loss": -38.9983024597168, "global_step": 196216, "epoch": 1621} {"train_loss": -39.34032440185547, "global_step": 196217, "epoch": 1621} {"train_loss": -38.768123626708984, "global_step": 196218, "epoch": 1621} {"train_loss": -39.59981918334961, "global_step": 196219, "epoch": 1621} {"train_loss": -39.44721603393555, "global_step": 196220, "epoch": 1621} {"train_loss": -39.81924057006836, "global_step": 196221, "epoch": 1621} {"train_loss": -39.31672286987305, "global_step": 196222, "epoch": 1621} {"train_loss": -39.50455856323242, "global_step": 196223, "epoch": 1621} {"train_loss": -39.89052200317383, "global_step": 196224, "epoch": 1621} {"train_loss": -39.35117721557617, "global_step": 196225, "epoch": 1621} {"train_loss": -40.27505874633789, "global_step": 196226, "epoch": 1621} {"train_loss": -39.91986846923828, "global_step": 196227, "epoch": 1621} {"train_loss": -38.19123077392578, "global_step": 196228, "epoch": 1621} {"train_loss": -38.9739990234375, "global_step": 196229, "epoch": 1621} {"train_loss": -39.39255905151367, "global_step": 196230, "epoch": 1621} {"train_loss": -39.27097702026367, "global_step": 196231, "epoch": 1621} {"train_loss": -40.42472457885742, "global_step": 196232, "epoch": 1621} {"train_loss": -40.11289596557617, "global_step": 196233, "epoch": 1621} {"train_loss": -39.763954162597656, "global_step": 196234, "epoch": 1621} {"train_loss": -38.405303955078125, "global_step": 196235, "epoch": 1621} {"train_loss": -40.479576110839844, "global_step": 196236, "epoch": 1621} {"train_loss": -39.69778060913086, "global_step": 196237, "epoch": 1621} {"train_loss": -39.227020263671875, "global_step": 196238, "epoch": 1621} {"train_loss": -39.95669937133789, "global_step": 196239, "epoch": 1621} {"train_loss": -40.12726974487305, "global_step": 196240, "epoch": 1621} {"train_loss": -40.068511962890625, "global_step": 196241, "epoch": 1621} {"train_loss": -39.7911262512207, "global_step": 196242, "epoch": 1621} {"train_loss": -39.46653366088867, "global_step": 196243, "epoch": 1621} {"train_loss": -38.02775955200195, "global_step": 196244, "epoch": 1621} {"train_loss": -38.05680465698242, "global_step": 196245, "epoch": 1621} {"train_loss": -39.46731948852539, "global_step": 196246, "epoch": 1621} {"train_loss": -39.08613204956055, "global_step": 196247, "epoch": 1621} {"train_loss": -38.49165725708008, "global_step": 196248, "epoch": 1621} {"train_loss": -39.02785873413086, "global_step": 196249, "epoch": 1621} {"train_loss": -38.944183349609375, "global_step": 196250, "epoch": 1621} {"train_loss": -37.693603515625, "global_step": 196251, "epoch": 1621} {"train_loss": -38.00608444213867, "global_step": 196252, "epoch": 1621} {"train_loss": -37.86117172241211, "global_step": 196253, "epoch": 1621} {"train_loss": -40.5207405090332, "global_step": 196254, "epoch": 1621} {"train_loss": -38.44977569580078, "global_step": 196255, "epoch": 1621} {"train_loss": -37.642189025878906, "global_step": 196256, "epoch": 1621} {"train_loss": -40.00465774536133, "global_step": 196257, "epoch": 1621} {"train_loss": -38.19131088256836, "global_step": 196258, "epoch": 1621} {"train_loss": -35.93455123901367, "global_step": 196259, "epoch": 1621} {"train_loss": -39.132198333740234, "global_step": 196260, "epoch": 1621} {"train_loss": -38.85408466118427, "global_step": 196261, "epoch": 1621, "val_loss": 2575504.0} {"train_loss": -36.467769622802734, "global_step": 196262, "epoch": 1622} {"train_loss": -38.94393539428711, "global_step": 196263, "epoch": 1622} {"train_loss": -40.178260803222656, "global_step": 196264, "epoch": 1622} {"train_loss": -38.28120040893555, "global_step": 196265, "epoch": 1622} {"train_loss": -39.215362548828125, "global_step": 196266, "epoch": 1622} {"train_loss": -39.726112365722656, "global_step": 196267, "epoch": 1622} {"train_loss": -37.74530029296875, "global_step": 196268, "epoch": 1622} {"train_loss": -38.9886360168457, "global_step": 196269, "epoch": 1622} {"train_loss": -39.07904815673828, "global_step": 196270, "epoch": 1622} {"train_loss": -37.61343002319336, "global_step": 196271, "epoch": 1622} {"train_loss": -38.78501892089844, "global_step": 196272, "epoch": 1622} {"train_loss": -38.780757904052734, "global_step": 196273, "epoch": 1622} {"train_loss": -37.48610305786133, "global_step": 196274, "epoch": 1622} {"train_loss": -37.99715805053711, "global_step": 196275, "epoch": 1622} {"train_loss": -37.850006103515625, "global_step": 196276, "epoch": 1622} {"train_loss": -38.49859619140625, "global_step": 196277, "epoch": 1622} {"train_loss": -38.93192672729492, "global_step": 196278, "epoch": 1622} {"train_loss": -39.022953033447266, "global_step": 196279, "epoch": 1622} {"train_loss": -37.75120162963867, "global_step": 196280, "epoch": 1622} {"train_loss": -40.0306510925293, "global_step": 196281, "epoch": 1622} {"train_loss": -39.7718391418457, "global_step": 196282, "epoch": 1622} {"train_loss": -39.29902267456055, "global_step": 196283, "epoch": 1622} {"train_loss": -39.06734085083008, "global_step": 196284, "epoch": 1622} {"train_loss": -39.187557220458984, "global_step": 196285, "epoch": 1622} {"train_loss": -40.374637603759766, "global_step": 196286, "epoch": 1622} {"train_loss": -39.80399703979492, "global_step": 196287, "epoch": 1622} {"train_loss": -39.405364990234375, "global_step": 196288, "epoch": 1622} {"train_loss": -39.5191535949707, "global_step": 196289, "epoch": 1622} {"train_loss": -40.03467559814453, "global_step": 196290, "epoch": 1622} {"train_loss": -40.1387939453125, "global_step": 196291, "epoch": 1622} {"train_loss": -40.42513656616211, "global_step": 196292, "epoch": 1622} {"train_loss": -40.49673843383789, "global_step": 196293, "epoch": 1622} {"train_loss": -40.0718994140625, "global_step": 196294, "epoch": 1622} {"train_loss": -40.04349899291992, "global_step": 196295, "epoch": 1622} {"train_loss": -40.77001953125, "global_step": 196296, "epoch": 1622} {"train_loss": -40.769989013671875, "global_step": 196297, "epoch": 1622} {"train_loss": -40.79209518432617, "global_step": 196298, "epoch": 1622} {"train_loss": -39.11082077026367, "global_step": 196299, "epoch": 1622} {"train_loss": -39.35194778442383, "global_step": 196300, "epoch": 1622} {"train_loss": -40.201385498046875, "global_step": 196301, "epoch": 1622} {"train_loss": -40.786041259765625, "global_step": 196302, "epoch": 1622} {"train_loss": -39.957000732421875, "global_step": 196303, "epoch": 1622} {"train_loss": -41.14010238647461, "global_step": 196304, "epoch": 1622} {"train_loss": -40.3437614440918, "global_step": 196305, "epoch": 1622} {"train_loss": -40.42629623413086, "global_step": 196306, "epoch": 1622} {"train_loss": -41.033966064453125, "global_step": 196307, "epoch": 1622} {"train_loss": -40.984832763671875, "global_step": 196308, "epoch": 1622} {"train_loss": -40.708744049072266, "global_step": 196309, "epoch": 1622} {"train_loss": -40.06087875366211, "global_step": 196310, "epoch": 1622} {"train_loss": -41.14882278442383, "global_step": 196311, "epoch": 1622} {"train_loss": -40.17945861816406, "global_step": 196312, "epoch": 1622} {"train_loss": -40.50985336303711, "global_step": 196313, "epoch": 1622} {"train_loss": -40.43099594116211, "global_step": 196314, "epoch": 1622} {"train_loss": -40.98398971557617, "global_step": 196315, "epoch": 1622} {"train_loss": -40.68254852294922, "global_step": 196316, "epoch": 1622} {"train_loss": -40.701080322265625, "global_step": 196317, "epoch": 1622} {"train_loss": -40.337371826171875, "global_step": 196318, "epoch": 1622} {"train_loss": -41.265560150146484, "global_step": 196319, "epoch": 1622} {"train_loss": -41.354583740234375, "global_step": 196320, "epoch": 1622} {"train_loss": -40.651790618896484, "global_step": 196321, "epoch": 1622} {"train_loss": -40.931739807128906, "global_step": 196322, "epoch": 1622} {"train_loss": -41.09280014038086, "global_step": 196323, "epoch": 1622} {"train_loss": -41.20539855957031, "global_step": 196324, "epoch": 1622} {"train_loss": -40.6179084777832, "global_step": 196325, "epoch": 1622} {"train_loss": -41.039024353027344, "global_step": 196326, "epoch": 1622} {"train_loss": -41.336708068847656, "global_step": 196327, "epoch": 1622} {"train_loss": -40.883052825927734, "global_step": 196328, "epoch": 1622} {"train_loss": -39.51558303833008, "global_step": 196329, "epoch": 1622} {"train_loss": -41.18144226074219, "global_step": 196330, "epoch": 1622} {"train_loss": -41.70419692993164, "global_step": 196331, "epoch": 1622} {"train_loss": -41.36285400390625, "global_step": 196332, "epoch": 1622} {"train_loss": -40.567195892333984, "global_step": 196333, "epoch": 1622} {"train_loss": -38.34845733642578, "global_step": 196334, "epoch": 1622} {"train_loss": -39.990230560302734, "global_step": 196335, "epoch": 1622} {"train_loss": -41.3099479675293, "global_step": 196336, "epoch": 1622} {"train_loss": -40.95789337158203, "global_step": 196337, "epoch": 1622} {"train_loss": -39.09115982055664, "global_step": 196338, "epoch": 1622} {"train_loss": -39.364906311035156, "global_step": 196339, "epoch": 1622} {"train_loss": -40.119441986083984, "global_step": 196340, "epoch": 1622} {"train_loss": -39.78152084350586, "global_step": 196341, "epoch": 1622} {"train_loss": -39.05476760864258, "global_step": 196342, "epoch": 1622} {"train_loss": -39.96088409423828, "global_step": 196343, "epoch": 1622} {"train_loss": -35.023311614990234, "global_step": 196344, "epoch": 1622} {"train_loss": -38.741065979003906, "global_step": 196345, "epoch": 1622} {"train_loss": -40.89390563964844, "global_step": 196346, "epoch": 1622} {"train_loss": -37.008636474609375, "global_step": 196347, "epoch": 1622} {"train_loss": -39.20122146606445, "global_step": 196348, "epoch": 1622} {"train_loss": -34.73509979248047, "global_step": 196349, "epoch": 1622} {"train_loss": -39.97593307495117, "global_step": 196350, "epoch": 1622} {"train_loss": -38.152957916259766, "global_step": 196351, "epoch": 1622} {"train_loss": -39.25703811645508, "global_step": 196352, "epoch": 1622} {"train_loss": -35.069332122802734, "global_step": 196353, "epoch": 1622} {"train_loss": -37.59310531616211, "global_step": 196354, "epoch": 1622} {"train_loss": -35.73324966430664, "global_step": 196355, "epoch": 1622} {"train_loss": -22.254716873168945, "global_step": 196356, "epoch": 1622} {"train_loss": -30.822967529296875, "global_step": 196357, "epoch": 1622} {"train_loss": -34.0368766784668, "global_step": 196358, "epoch": 1622} {"train_loss": -16.137744903564453, "global_step": 196359, "epoch": 1622} {"train_loss": -33.63926315307617, "global_step": 196360, "epoch": 1622} {"train_loss": -28.238439559936523, "global_step": 196361, "epoch": 1622} {"train_loss": -26.257898330688477, "global_step": 196362, "epoch": 1622} {"train_loss": -34.882625579833984, "global_step": 196363, "epoch": 1622} {"train_loss": -27.250940322875977, "global_step": 196364, "epoch": 1622} {"train_loss": -32.95669174194336, "global_step": 196365, "epoch": 1622} {"train_loss": -31.273792266845703, "global_step": 196366, "epoch": 1622} {"train_loss": -28.651416778564453, "global_step": 196367, "epoch": 1622} {"train_loss": -24.35706901550293, "global_step": 196368, "epoch": 1622} {"train_loss": -31.812702178955078, "global_step": 196369, "epoch": 1622} {"train_loss": -26.232044219970703, "global_step": 196370, "epoch": 1622} {"train_loss": -22.538856506347656, "global_step": 196371, "epoch": 1622} {"train_loss": -21.784391403198242, "global_step": 196372, "epoch": 1622} {"train_loss": -29.460920333862305, "global_step": 196373, "epoch": 1622} {"train_loss": -22.019580841064453, "global_step": 196374, "epoch": 1622} {"train_loss": -32.96328353881836, "global_step": 196375, "epoch": 1622} {"train_loss": -29.849817276000977, "global_step": 196376, "epoch": 1622} {"train_loss": -31.3077449798584, "global_step": 196377, "epoch": 1622} {"train_loss": -28.8489990234375, "global_step": 196378, "epoch": 1622} {"train_loss": -31.31009864807129, "global_step": 196379, "epoch": 1622} {"train_loss": -30.666601181030273, "global_step": 196380, "epoch": 1622} {"train_loss": -32.495033264160156, "global_step": 196381, "epoch": 1622} {"train_loss": -37.18102316422896, "global_step": 196382, "epoch": 1622, "val_loss": 2639059.75} {"train_loss": -34.45396041870117, "global_step": 196383, "epoch": 1623} {"train_loss": -33.35798263549805, "global_step": 196384, "epoch": 1623} {"train_loss": -32.76837921142578, "global_step": 196385, "epoch": 1623} {"train_loss": -34.644813537597656, "global_step": 196386, "epoch": 1623} {"train_loss": -33.74215316772461, "global_step": 196387, "epoch": 1623} {"train_loss": -33.57786560058594, "global_step": 196388, "epoch": 1623} {"train_loss": -34.91764450073242, "global_step": 196389, "epoch": 1623} {"train_loss": -35.40690612792969, "global_step": 196390, "epoch": 1623} {"train_loss": -32.857173919677734, "global_step": 196391, "epoch": 1623} {"train_loss": -35.12176513671875, "global_step": 196392, "epoch": 1623} {"train_loss": -36.00885772705078, "global_step": 196393, "epoch": 1623} {"train_loss": -34.105587005615234, "global_step": 196394, "epoch": 1623} {"train_loss": -34.806304931640625, "global_step": 196395, "epoch": 1623} {"train_loss": -33.70986557006836, "global_step": 196396, "epoch": 1623} {"train_loss": -34.5876579284668, "global_step": 196397, "epoch": 1623} {"train_loss": -35.87508010864258, "global_step": 196398, "epoch": 1623} {"train_loss": -35.49591064453125, "global_step": 196399, "epoch": 1623} {"train_loss": -34.951473236083984, "global_step": 196400, "epoch": 1623} {"train_loss": -35.209007263183594, "global_step": 196401, "epoch": 1623} {"train_loss": -36.4901237487793, "global_step": 196402, "epoch": 1623} {"train_loss": -35.48701095581055, "global_step": 196403, "epoch": 1623} {"train_loss": -36.647579193115234, "global_step": 196404, "epoch": 1623} {"train_loss": -35.96086502075195, "global_step": 196405, "epoch": 1623} {"train_loss": -35.8261604309082, "global_step": 196406, "epoch": 1623} {"train_loss": -37.114959716796875, "global_step": 196407, "epoch": 1623} {"train_loss": -37.03852462768555, "global_step": 196408, "epoch": 1623} {"train_loss": -37.26818084716797, "global_step": 196409, "epoch": 1623} {"train_loss": -37.02859115600586, "global_step": 196410, "epoch": 1623} {"train_loss": -37.22379684448242, "global_step": 196411, "epoch": 1623} {"train_loss": -36.286766052246094, "global_step": 196412, "epoch": 1623} {"train_loss": -36.42048263549805, "global_step": 196413, "epoch": 1623} {"train_loss": -37.18120574951172, "global_step": 196414, "epoch": 1623} {"train_loss": -37.5633430480957, "global_step": 196415, "epoch": 1623} {"train_loss": -37.25175094604492, "global_step": 196416, "epoch": 1623} {"train_loss": -36.81870651245117, "global_step": 196417, "epoch": 1623} {"train_loss": -36.7389030456543, "global_step": 196418, "epoch": 1623} {"train_loss": -36.103145599365234, "global_step": 196419, "epoch": 1623} {"train_loss": -37.27865219116211, "global_step": 196420, "epoch": 1623} {"train_loss": -37.6418342590332, "global_step": 196421, "epoch": 1623} {"train_loss": -37.784908294677734, "global_step": 196422, "epoch": 1623} {"train_loss": -36.62089157104492, "global_step": 196423, "epoch": 1623} {"train_loss": -37.913509368896484, "global_step": 196424, "epoch": 1623} {"train_loss": -38.04926300048828, "global_step": 196425, "epoch": 1623} {"train_loss": -37.164466857910156, "global_step": 196426, "epoch": 1623} {"train_loss": -37.97524642944336, "global_step": 196427, "epoch": 1623} {"train_loss": -37.04800033569336, "global_step": 196428, "epoch": 1623} {"train_loss": -37.91769027709961, "global_step": 196429, "epoch": 1623} {"train_loss": -37.97605514526367, "global_step": 196430, "epoch": 1623} {"train_loss": -37.86154556274414, "global_step": 196431, "epoch": 1623} {"train_loss": -38.28048324584961, "global_step": 196432, "epoch": 1623} {"train_loss": -37.8609733581543, "global_step": 196433, "epoch": 1623} {"train_loss": -38.38182830810547, "global_step": 196434, "epoch": 1623} {"train_loss": -38.582183837890625, "global_step": 196435, "epoch": 1623} {"train_loss": -37.848114013671875, "global_step": 196436, "epoch": 1623} {"train_loss": -38.05820846557617, "global_step": 196437, "epoch": 1623} {"train_loss": -38.37413024902344, "global_step": 196438, "epoch": 1623} {"train_loss": -38.36988067626953, "global_step": 196439, "epoch": 1623} {"train_loss": -37.64304733276367, "global_step": 196440, "epoch": 1623} {"train_loss": -38.53239059448242, "global_step": 196441, "epoch": 1623} {"train_loss": -38.69434356689453, "global_step": 196442, "epoch": 1623} {"train_loss": -37.64122772216797, "global_step": 196443, "epoch": 1623} {"train_loss": -38.293312072753906, "global_step": 196444, "epoch": 1623} {"train_loss": -38.5710563659668, "global_step": 196445, "epoch": 1623} {"train_loss": -37.465675354003906, "global_step": 196446, "epoch": 1623} {"train_loss": -38.80987548828125, "global_step": 196447, "epoch": 1623} {"train_loss": -37.97133255004883, "global_step": 196448, "epoch": 1623} {"train_loss": -38.56373596191406, "global_step": 196449, "epoch": 1623} {"train_loss": -38.71981430053711, "global_step": 196450, "epoch": 1623} {"train_loss": -38.931427001953125, "global_step": 196451, "epoch": 1623} {"train_loss": -39.12936019897461, "global_step": 196452, "epoch": 1623} {"train_loss": -38.59858322143555, "global_step": 196453, "epoch": 1623} {"train_loss": -38.32820510864258, "global_step": 196454, "epoch": 1623} {"train_loss": -39.09324264526367, "global_step": 196455, "epoch": 1623} {"train_loss": -38.60634994506836, "global_step": 196456, "epoch": 1623} {"train_loss": -38.5177116394043, "global_step": 196457, "epoch": 1623} {"train_loss": -39.435997009277344, "global_step": 196458, "epoch": 1623} {"train_loss": -39.1617546081543, "global_step": 196459, "epoch": 1623} {"train_loss": -38.77374267578125, "global_step": 196460, "epoch": 1623} {"train_loss": -38.52486801147461, "global_step": 196461, "epoch": 1623} {"train_loss": -38.97453308105469, "global_step": 196462, "epoch": 1623} {"train_loss": -38.60453414916992, "global_step": 196463, "epoch": 1623} {"train_loss": -38.60824203491211, "global_step": 196464, "epoch": 1623} {"train_loss": -39.0953369140625, "global_step": 196465, "epoch": 1623} {"train_loss": -38.9169807434082, "global_step": 196466, "epoch": 1623} {"train_loss": -39.10850143432617, "global_step": 196467, "epoch": 1623} {"train_loss": -39.03173828125, "global_step": 196468, "epoch": 1623} {"train_loss": -39.689666748046875, "global_step": 196469, "epoch": 1623} {"train_loss": -39.569671630859375, "global_step": 196470, "epoch": 1623} {"train_loss": -39.45942306518555, "global_step": 196471, "epoch": 1623} {"train_loss": -39.65608596801758, "global_step": 196472, "epoch": 1623} {"train_loss": -38.94892501831055, "global_step": 196473, "epoch": 1623} {"train_loss": -39.31122970581055, "global_step": 196474, "epoch": 1623} {"train_loss": -39.08803939819336, "global_step": 196475, "epoch": 1623} {"train_loss": -38.359310150146484, "global_step": 196476, "epoch": 1623} {"train_loss": -39.47000503540039, "global_step": 196477, "epoch": 1623} {"train_loss": -39.11464309692383, "global_step": 196478, "epoch": 1623} {"train_loss": -39.87188720703125, "global_step": 196479, "epoch": 1623} {"train_loss": -38.233272552490234, "global_step": 196480, "epoch": 1623} {"train_loss": -39.97684860229492, "global_step": 196481, "epoch": 1623} {"train_loss": -39.59843444824219, "global_step": 196482, "epoch": 1623} {"train_loss": -39.63423538208008, "global_step": 196483, "epoch": 1623} {"train_loss": -39.02639389038086, "global_step": 196484, "epoch": 1623} {"train_loss": -39.79030990600586, "global_step": 196485, "epoch": 1623} {"train_loss": -40.126094818115234, "global_step": 196486, "epoch": 1623} {"train_loss": -38.59418487548828, "global_step": 196487, "epoch": 1623} {"train_loss": -39.80365753173828, "global_step": 196488, "epoch": 1623} {"train_loss": -39.96613311767578, "global_step": 196489, "epoch": 1623} {"train_loss": -39.868896484375, "global_step": 196490, "epoch": 1623} {"train_loss": -40.26339340209961, "global_step": 196491, "epoch": 1623} {"train_loss": -39.99631881713867, "global_step": 196492, "epoch": 1623} {"train_loss": -39.97782516479492, "global_step": 196493, "epoch": 1623} {"train_loss": -39.92213821411133, "global_step": 196494, "epoch": 1623} {"train_loss": -39.7720832824707, "global_step": 196495, "epoch": 1623} {"train_loss": -39.16011428833008, "global_step": 196496, "epoch": 1623} {"train_loss": -40.436588287353516, "global_step": 196497, "epoch": 1623} {"train_loss": -40.2047233581543, "global_step": 196498, "epoch": 1623} {"train_loss": -39.61637496948242, "global_step": 196499, "epoch": 1623} {"train_loss": -40.147151947021484, "global_step": 196500, "epoch": 1623} {"train_loss": -39.7547607421875, "global_step": 196501, "epoch": 1623} {"train_loss": -39.67871856689453, "global_step": 196502, "epoch": 1623} {"train_loss": -37.84142388588141, "global_step": 196503, "epoch": 1623, "val_loss": 2557130.0} {"train_loss": -40.0053825378418, "global_step": 196504, "epoch": 1624} {"train_loss": -39.628292083740234, "global_step": 196505, "epoch": 1624} {"train_loss": -39.98200607299805, "global_step": 196506, "epoch": 1624} {"train_loss": -39.65460968017578, "global_step": 196507, "epoch": 1624} {"train_loss": -40.203460693359375, "global_step": 196508, "epoch": 1624} {"train_loss": -40.377445220947266, "global_step": 196509, "epoch": 1624} {"train_loss": -40.64111328125, "global_step": 196510, "epoch": 1624} {"train_loss": -40.7005729675293, "global_step": 196511, "epoch": 1624} {"train_loss": -40.18904495239258, "global_step": 196512, "epoch": 1624} {"train_loss": -40.821205139160156, "global_step": 196513, "epoch": 1624} {"train_loss": -40.35398483276367, "global_step": 196514, "epoch": 1624} {"train_loss": -40.41703796386719, "global_step": 196515, "epoch": 1624} {"train_loss": -40.7455940246582, "global_step": 196516, "epoch": 1624} {"train_loss": -40.42121124267578, "global_step": 196517, "epoch": 1624} {"train_loss": -40.53867721557617, "global_step": 196518, "epoch": 1624} {"train_loss": -40.44045639038086, "global_step": 196519, "epoch": 1624} {"train_loss": -40.36526107788086, "global_step": 196520, "epoch": 1624} {"train_loss": -40.9141960144043, "global_step": 196521, "epoch": 1624} {"train_loss": -40.12949752807617, "global_step": 196522, "epoch": 1624} {"train_loss": -40.16243362426758, "global_step": 196523, "epoch": 1624} {"train_loss": -40.6347541809082, "global_step": 196524, "epoch": 1624} {"train_loss": -40.62824630737305, "global_step": 196525, "epoch": 1624} {"train_loss": -40.548789978027344, "global_step": 196526, "epoch": 1624} {"train_loss": -40.4298095703125, "global_step": 196527, "epoch": 1624} {"train_loss": -40.55204391479492, "global_step": 196528, "epoch": 1624} {"train_loss": -39.86955642700195, "global_step": 196529, "epoch": 1624} {"train_loss": -38.79201889038086, "global_step": 196530, "epoch": 1624} {"train_loss": -38.29791259765625, "global_step": 196531, "epoch": 1624} {"train_loss": -36.666744232177734, "global_step": 196532, "epoch": 1624} {"train_loss": -33.54091262817383, "global_step": 196533, "epoch": 1624} {"train_loss": -31.399372100830078, "global_step": 196534, "epoch": 1624} {"train_loss": -37.43113708496094, "global_step": 196535, "epoch": 1624} {"train_loss": -39.99665451049805, "global_step": 196536, "epoch": 1624} {"train_loss": -36.32711410522461, "global_step": 196537, "epoch": 1624} {"train_loss": -38.72683334350586, "global_step": 196538, "epoch": 1624} {"train_loss": -39.61522674560547, "global_step": 196539, "epoch": 1624} {"train_loss": -38.07973098754883, "global_step": 196540, "epoch": 1624} {"train_loss": -39.666770935058594, "global_step": 196541, "epoch": 1624} {"train_loss": -39.470985412597656, "global_step": 196542, "epoch": 1624} {"train_loss": -38.648006439208984, "global_step": 196543, "epoch": 1624} {"train_loss": -39.307899475097656, "global_step": 196544, "epoch": 1624} {"train_loss": -40.51125717163086, "global_step": 196545, "epoch": 1624} {"train_loss": -39.938228607177734, "global_step": 196546, "epoch": 1624} {"train_loss": -39.70820236206055, "global_step": 196547, "epoch": 1624} {"train_loss": -40.046112060546875, "global_step": 196548, "epoch": 1624} {"train_loss": -39.66080093383789, "global_step": 196549, "epoch": 1624} {"train_loss": -39.83672332763672, "global_step": 196550, "epoch": 1624} {"train_loss": -39.927425384521484, "global_step": 196551, "epoch": 1624} {"train_loss": -40.4193000793457, "global_step": 196552, "epoch": 1624} {"train_loss": -40.12571334838867, "global_step": 196553, "epoch": 1624} {"train_loss": -40.50837326049805, "global_step": 196554, "epoch": 1624} {"train_loss": -40.157501220703125, "global_step": 196555, "epoch": 1624} {"train_loss": -39.84183883666992, "global_step": 196556, "epoch": 1624} {"train_loss": -40.205299377441406, "global_step": 196557, "epoch": 1624} {"train_loss": -39.60276412963867, "global_step": 196558, "epoch": 1624} {"train_loss": -40.13580322265625, "global_step": 196559, "epoch": 1624} {"train_loss": -40.10356521606445, "global_step": 196560, "epoch": 1624} {"train_loss": -39.75877380371094, "global_step": 196561, "epoch": 1624} {"train_loss": -40.54788589477539, "global_step": 196562, "epoch": 1624} {"train_loss": -38.834381103515625, "global_step": 196563, "epoch": 1624} {"train_loss": -39.337703704833984, "global_step": 196564, "epoch": 1624} {"train_loss": -39.23420333862305, "global_step": 196565, "epoch": 1624} {"train_loss": -38.77614974975586, "global_step": 196566, "epoch": 1624} {"train_loss": -40.49613571166992, "global_step": 196567, "epoch": 1624} {"train_loss": -39.21118927001953, "global_step": 196568, "epoch": 1624} {"train_loss": -40.33846664428711, "global_step": 196569, "epoch": 1624} {"train_loss": -40.76023483276367, "global_step": 196570, "epoch": 1624} {"train_loss": -40.473140716552734, "global_step": 196571, "epoch": 1624} {"train_loss": -40.36030960083008, "global_step": 196572, "epoch": 1624} {"train_loss": -40.17198944091797, "global_step": 196573, "epoch": 1624} {"train_loss": -40.07420349121094, "global_step": 196574, "epoch": 1624} {"train_loss": -39.06107711791992, "global_step": 196575, "epoch": 1624} {"train_loss": -40.2891960144043, "global_step": 196576, "epoch": 1624} {"train_loss": -39.65751266479492, "global_step": 196577, "epoch": 1624} {"train_loss": -38.997894287109375, "global_step": 196578, "epoch": 1624} {"train_loss": -38.67658615112305, "global_step": 196579, "epoch": 1624} {"train_loss": -38.99541091918945, "global_step": 196580, "epoch": 1624} {"train_loss": -39.98432159423828, "global_step": 196581, "epoch": 1624} {"train_loss": -39.28980255126953, "global_step": 196582, "epoch": 1624} {"train_loss": -41.05842590332031, "global_step": 196583, "epoch": 1624} {"train_loss": -38.54659652709961, "global_step": 196584, "epoch": 1624} {"train_loss": -40.262786865234375, "global_step": 196585, "epoch": 1624} {"train_loss": -40.88566207885742, "global_step": 196586, "epoch": 1624} {"train_loss": -40.70412063598633, "global_step": 196587, "epoch": 1624} {"train_loss": -40.03791046142578, "global_step": 196588, "epoch": 1624} {"train_loss": -39.84324264526367, "global_step": 196589, "epoch": 1624} {"train_loss": -40.72462463378906, "global_step": 196590, "epoch": 1624} {"train_loss": -40.44561004638672, "global_step": 196591, "epoch": 1624} {"train_loss": -40.32356643676758, "global_step": 196592, "epoch": 1624} {"train_loss": -40.583412170410156, "global_step": 196593, "epoch": 1624} {"train_loss": -40.892120361328125, "global_step": 196594, "epoch": 1624} {"train_loss": -41.080650329589844, "global_step": 196595, "epoch": 1624} {"train_loss": -40.6861686706543, "global_step": 196596, "epoch": 1624} {"train_loss": -40.881385803222656, "global_step": 196597, "epoch": 1624} {"train_loss": -39.59151840209961, "global_step": 196598, "epoch": 1624} {"train_loss": -40.81925582885742, "global_step": 196599, "epoch": 1624} {"train_loss": -40.493099212646484, "global_step": 196600, "epoch": 1624} {"train_loss": -40.17352294921875, "global_step": 196601, "epoch": 1624} {"train_loss": -40.871978759765625, "global_step": 196602, "epoch": 1624} {"train_loss": -40.61610794067383, "global_step": 196603, "epoch": 1624} {"train_loss": -41.147029876708984, "global_step": 196604, "epoch": 1624} {"train_loss": -39.75464630126953, "global_step": 196605, "epoch": 1624} {"train_loss": -40.42011642456055, "global_step": 196606, "epoch": 1624} {"train_loss": -39.56924057006836, "global_step": 196607, "epoch": 1624} {"train_loss": -40.959774017333984, "global_step": 196608, "epoch": 1624} {"train_loss": -40.57061004638672, "global_step": 196609, "epoch": 1624} {"train_loss": -40.470916748046875, "global_step": 196610, "epoch": 1624} {"train_loss": -39.8034782409668, "global_step": 196611, "epoch": 1624} {"train_loss": -40.8927001953125, "global_step": 196612, "epoch": 1624} {"train_loss": -41.07917022705078, "global_step": 196613, "epoch": 1624} {"train_loss": -41.020870208740234, "global_step": 196614, "epoch": 1624} {"train_loss": -40.36994552612305, "global_step": 196615, "epoch": 1624} {"train_loss": -39.88844680786133, "global_step": 196616, "epoch": 1624} {"train_loss": -41.11077117919922, "global_step": 196617, "epoch": 1624} {"train_loss": -40.91940689086914, "global_step": 196618, "epoch": 1624} {"train_loss": -40.36039352416992, "global_step": 196619, "epoch": 1624} {"train_loss": -39.918643951416016, "global_step": 196620, "epoch": 1624} {"train_loss": -40.081947326660156, "global_step": 196621, "epoch": 1624} {"train_loss": -39.73893356323242, "global_step": 196622, "epoch": 1624} {"train_loss": -40.69204330444336, "global_step": 196623, "epoch": 1624} {"train_loss": -39.8985541162412, "global_step": 196624, "epoch": 1624, "val_loss": 2623628.0} {"train_loss": -40.689823150634766, "global_step": 196625, "epoch": 1625} {"train_loss": -40.83869552612305, "global_step": 196626, "epoch": 1625} {"train_loss": -40.41754913330078, "global_step": 196627, "epoch": 1625} {"train_loss": -39.677886962890625, "global_step": 196628, "epoch": 1625} {"train_loss": -39.52824783325195, "global_step": 196629, "epoch": 1625} {"train_loss": -40.79755401611328, "global_step": 196630, "epoch": 1625} {"train_loss": -41.546958923339844, "global_step": 196631, "epoch": 1625} {"train_loss": -39.584205627441406, "global_step": 196632, "epoch": 1625} {"train_loss": -40.80427932739258, "global_step": 196633, "epoch": 1625} {"train_loss": -41.08597946166992, "global_step": 196634, "epoch": 1625} {"train_loss": -40.46781539916992, "global_step": 196635, "epoch": 1625} {"train_loss": -41.042354583740234, "global_step": 196636, "epoch": 1625} {"train_loss": -41.22208786010742, "global_step": 196637, "epoch": 1625} {"train_loss": -40.27126693725586, "global_step": 196638, "epoch": 1625} {"train_loss": -40.84796142578125, "global_step": 196639, "epoch": 1625} {"train_loss": -41.38284683227539, "global_step": 196640, "epoch": 1625} {"train_loss": -40.25539016723633, "global_step": 196641, "epoch": 1625} {"train_loss": -41.37000274658203, "global_step": 196642, "epoch": 1625} {"train_loss": -41.099422454833984, "global_step": 196643, "epoch": 1625} {"train_loss": -41.38041305541992, "global_step": 196644, "epoch": 1625} {"train_loss": -41.30378341674805, "global_step": 196645, "epoch": 1625} {"train_loss": -41.364715576171875, "global_step": 196646, "epoch": 1625} {"train_loss": -41.290191650390625, "global_step": 196647, "epoch": 1625} {"train_loss": -40.99549865722656, "global_step": 196648, "epoch": 1625} {"train_loss": -41.09719467163086, "global_step": 196649, "epoch": 1625} {"train_loss": -41.04293441772461, "global_step": 196650, "epoch": 1625} {"train_loss": -40.4842529296875, "global_step": 196651, "epoch": 1625} {"train_loss": -40.92704391479492, "global_step": 196652, "epoch": 1625} {"train_loss": -41.084197998046875, "global_step": 196653, "epoch": 1625} {"train_loss": -40.397090911865234, "global_step": 196654, "epoch": 1625} {"train_loss": -40.44074630737305, "global_step": 196655, "epoch": 1625} {"train_loss": -40.72981643676758, "global_step": 196656, "epoch": 1625} {"train_loss": -40.94741439819336, "global_step": 196657, "epoch": 1625} {"train_loss": -41.78861618041992, "global_step": 196658, "epoch": 1625} {"train_loss": -41.2061653137207, "global_step": 196659, "epoch": 1625} {"train_loss": -41.084197998046875, "global_step": 196660, "epoch": 1625} {"train_loss": -40.515708923339844, "global_step": 196661, "epoch": 1625} {"train_loss": -41.28171920776367, "global_step": 196662, "epoch": 1625} {"train_loss": -40.97169876098633, "global_step": 196663, "epoch": 1625} {"train_loss": -41.72846603393555, "global_step": 196664, "epoch": 1625} {"train_loss": -40.386104583740234, "global_step": 196665, "epoch": 1625} {"train_loss": -41.18976593017578, "global_step": 196666, "epoch": 1625} {"train_loss": -40.774749755859375, "global_step": 196667, "epoch": 1625} {"train_loss": -40.4095458984375, "global_step": 196668, "epoch": 1625} {"train_loss": -40.25991439819336, "global_step": 196669, "epoch": 1625} {"train_loss": -40.38631820678711, "global_step": 196670, "epoch": 1625} {"train_loss": -39.775421142578125, "global_step": 196671, "epoch": 1625} {"train_loss": -41.444610595703125, "global_step": 196672, "epoch": 1625} {"train_loss": -39.7990837097168, "global_step": 196673, "epoch": 1625} {"train_loss": -41.15775680541992, "global_step": 196674, "epoch": 1625} {"train_loss": -39.690155029296875, "global_step": 196675, "epoch": 1625} {"train_loss": -40.950191497802734, "global_step": 196676, "epoch": 1625} {"train_loss": -39.820247650146484, "global_step": 196677, "epoch": 1625} {"train_loss": -40.03034591674805, "global_step": 196678, "epoch": 1625} {"train_loss": -41.24531936645508, "global_step": 196679, "epoch": 1625} {"train_loss": -39.96866989135742, "global_step": 196680, "epoch": 1625} {"train_loss": -40.68624496459961, "global_step": 196681, "epoch": 1625} {"train_loss": -40.306304931640625, "global_step": 196682, "epoch": 1625} {"train_loss": -37.105403900146484, "global_step": 196683, "epoch": 1625} {"train_loss": -38.633331298828125, "global_step": 196684, "epoch": 1625} {"train_loss": -40.307247161865234, "global_step": 196685, "epoch": 1625} {"train_loss": -40.19304656982422, "global_step": 196686, "epoch": 1625} {"train_loss": -40.383731842041016, "global_step": 196687, "epoch": 1625} {"train_loss": -39.74896240234375, "global_step": 196688, "epoch": 1625} {"train_loss": -39.88548278808594, "global_step": 196689, "epoch": 1625} {"train_loss": -41.133750915527344, "global_step": 196690, "epoch": 1625} {"train_loss": -39.68872833251953, "global_step": 196691, "epoch": 1625} {"train_loss": -35.38991165161133, "global_step": 196692, "epoch": 1625} {"train_loss": -36.96843338012695, "global_step": 196693, "epoch": 1625} {"train_loss": -38.515716552734375, "global_step": 196694, "epoch": 1625} {"train_loss": -39.22319793701172, "global_step": 196695, "epoch": 1625} {"train_loss": -36.95576477050781, "global_step": 196696, "epoch": 1625} {"train_loss": -38.035884857177734, "global_step": 196697, "epoch": 1625} {"train_loss": -40.45717239379883, "global_step": 196698, "epoch": 1625} {"train_loss": -37.319637298583984, "global_step": 196699, "epoch": 1625} {"train_loss": -37.76508331298828, "global_step": 196700, "epoch": 1625} {"train_loss": -40.5299186706543, "global_step": 196701, "epoch": 1625} {"train_loss": -39.69049835205078, "global_step": 196702, "epoch": 1625} {"train_loss": -40.91817855834961, "global_step": 196703, "epoch": 1625} {"train_loss": -40.43878173828125, "global_step": 196704, "epoch": 1625} {"train_loss": -40.21223831176758, "global_step": 196705, "epoch": 1625} {"train_loss": -41.2972526550293, "global_step": 196706, "epoch": 1625} {"train_loss": -40.46712875366211, "global_step": 196707, "epoch": 1625} {"train_loss": -40.70924758911133, "global_step": 196708, "epoch": 1625} {"train_loss": -40.49277877807617, "global_step": 196709, "epoch": 1625} {"train_loss": -40.8780632019043, "global_step": 196710, "epoch": 1625} {"train_loss": -41.32923126220703, "global_step": 196711, "epoch": 1625} {"train_loss": -40.48834228515625, "global_step": 196712, "epoch": 1625} {"train_loss": -40.73861312866211, "global_step": 196713, "epoch": 1625} {"train_loss": -41.184444427490234, "global_step": 196714, "epoch": 1625} {"train_loss": -40.41383743286133, "global_step": 196715, "epoch": 1625} {"train_loss": -40.43158721923828, "global_step": 196716, "epoch": 1625} {"train_loss": -40.97178649902344, "global_step": 196717, "epoch": 1625} {"train_loss": -40.71893310546875, "global_step": 196718, "epoch": 1625} {"train_loss": -41.2389030456543, "global_step": 196719, "epoch": 1625} {"train_loss": -41.44536590576172, "global_step": 196720, "epoch": 1625} {"train_loss": -41.5595817565918, "global_step": 196721, "epoch": 1625} {"train_loss": -40.70893478393555, "global_step": 196722, "epoch": 1625} {"train_loss": -41.69918441772461, "global_step": 196723, "epoch": 1625} {"train_loss": -41.49110412597656, "global_step": 196724, "epoch": 1625} {"train_loss": -41.67311477661133, "global_step": 196725, "epoch": 1625} {"train_loss": -41.580135345458984, "global_step": 196726, "epoch": 1625} {"train_loss": -41.28009796142578, "global_step": 196727, "epoch": 1625} {"train_loss": -41.15034103393555, "global_step": 196728, "epoch": 1625} {"train_loss": -41.330867767333984, "global_step": 196729, "epoch": 1625} {"train_loss": -40.73017501831055, "global_step": 196730, "epoch": 1625} {"train_loss": -40.92014694213867, "global_step": 196731, "epoch": 1625} {"train_loss": -41.5565185546875, "global_step": 196732, "epoch": 1625} {"train_loss": -40.627197265625, "global_step": 196733, "epoch": 1625} {"train_loss": -41.199581146240234, "global_step": 196734, "epoch": 1625} {"train_loss": -40.961273193359375, "global_step": 196735, "epoch": 1625} {"train_loss": -41.56188201904297, "global_step": 196736, "epoch": 1625} {"train_loss": -41.04631423950195, "global_step": 196737, "epoch": 1625} {"train_loss": -40.85966110229492, "global_step": 196738, "epoch": 1625} {"train_loss": -41.42749786376953, "global_step": 196739, "epoch": 1625} {"train_loss": -41.69752883911133, "global_step": 196740, "epoch": 1625} {"train_loss": -41.572975158691406, "global_step": 196741, "epoch": 1625} {"train_loss": -40.49878692626953, "global_step": 196742, "epoch": 1625} {"train_loss": -39.889801025390625, "global_step": 196743, "epoch": 1625} {"train_loss": -40.31964111328125, "global_step": 196744, "epoch": 1625} {"train_loss": -40.50404184514826, "global_step": 196745, "epoch": 1625, "val_loss": 2584392.75} {"train_loss": -41.322479248046875, "global_step": 196746, "epoch": 1626} {"train_loss": -41.18013000488281, "global_step": 196747, "epoch": 1626} {"train_loss": -37.893226623535156, "global_step": 196748, "epoch": 1626} {"train_loss": -38.569000244140625, "global_step": 196749, "epoch": 1626} {"train_loss": -40.85712814331055, "global_step": 196750, "epoch": 1626} {"train_loss": -40.178627014160156, "global_step": 196751, "epoch": 1626} {"train_loss": -34.656494140625, "global_step": 196752, "epoch": 1626} {"train_loss": -37.76983642578125, "global_step": 196753, "epoch": 1626} {"train_loss": -39.779876708984375, "global_step": 196754, "epoch": 1626} {"train_loss": -37.66464614868164, "global_step": 196755, "epoch": 1626} {"train_loss": -39.34596252441406, "global_step": 196756, "epoch": 1626} {"train_loss": -38.14305877685547, "global_step": 196757, "epoch": 1626} {"train_loss": -37.931724548339844, "global_step": 196758, "epoch": 1626} {"train_loss": -37.11899948120117, "global_step": 196759, "epoch": 1626} {"train_loss": -36.32174301147461, "global_step": 196760, "epoch": 1626} {"train_loss": -40.002532958984375, "global_step": 196761, "epoch": 1626} {"train_loss": -36.940608978271484, "global_step": 196762, "epoch": 1626} {"train_loss": -39.28217697143555, "global_step": 196763, "epoch": 1626} {"train_loss": -38.57490158081055, "global_step": 196764, "epoch": 1626} {"train_loss": -37.53712844848633, "global_step": 196765, "epoch": 1626} {"train_loss": -38.495365142822266, "global_step": 196766, "epoch": 1626} {"train_loss": -38.42233657836914, "global_step": 196767, "epoch": 1626} {"train_loss": -39.27968215942383, "global_step": 196768, "epoch": 1626} {"train_loss": -39.917171478271484, "global_step": 196769, "epoch": 1626} {"train_loss": -39.59514617919922, "global_step": 196770, "epoch": 1626} {"train_loss": -39.81509017944336, "global_step": 196771, "epoch": 1626} {"train_loss": -40.436946868896484, "global_step": 196772, "epoch": 1626} {"train_loss": -40.22285842895508, "global_step": 196773, "epoch": 1626} {"train_loss": -41.05775833129883, "global_step": 196774, "epoch": 1626} {"train_loss": -39.00350570678711, "global_step": 196775, "epoch": 1626} {"train_loss": -41.09061050415039, "global_step": 196776, "epoch": 1626} {"train_loss": -40.01506805419922, "global_step": 196777, "epoch": 1626} {"train_loss": -40.45042037963867, "global_step": 196778, "epoch": 1626} {"train_loss": -41.04407501220703, "global_step": 196779, "epoch": 1626} {"train_loss": -40.22185516357422, "global_step": 196780, "epoch": 1626} {"train_loss": -40.070865631103516, "global_step": 196781, "epoch": 1626} {"train_loss": -41.074737548828125, "global_step": 196782, "epoch": 1626} {"train_loss": -40.54823684692383, "global_step": 196783, "epoch": 1626} {"train_loss": -40.72016525268555, "global_step": 196784, "epoch": 1626} {"train_loss": -39.88360595703125, "global_step": 196785, "epoch": 1626} {"train_loss": -41.01552963256836, "global_step": 196786, "epoch": 1626} {"train_loss": -40.28767013549805, "global_step": 196787, "epoch": 1626} {"train_loss": -41.24558639526367, "global_step": 196788, "epoch": 1626} {"train_loss": -40.34130859375, "global_step": 196789, "epoch": 1626} {"train_loss": -41.25197219848633, "global_step": 196790, "epoch": 1626} {"train_loss": -39.83483123779297, "global_step": 196791, "epoch": 1626} {"train_loss": -40.98848342895508, "global_step": 196792, "epoch": 1626} {"train_loss": -40.363643646240234, "global_step": 196793, "epoch": 1626} {"train_loss": -39.94875717163086, "global_step": 196794, "epoch": 1626} {"train_loss": -40.863155364990234, "global_step": 196795, "epoch": 1626} {"train_loss": -39.439117431640625, "global_step": 196796, "epoch": 1626} {"train_loss": -41.41741943359375, "global_step": 196797, "epoch": 1626} {"train_loss": -41.52154541015625, "global_step": 196798, "epoch": 1626} {"train_loss": -40.1555290222168, "global_step": 196799, "epoch": 1626} {"train_loss": -41.16579055786133, "global_step": 196800, "epoch": 1626} {"train_loss": -39.772308349609375, "global_step": 196801, "epoch": 1626} {"train_loss": -41.504730224609375, "global_step": 196802, "epoch": 1626} {"train_loss": -40.97304916381836, "global_step": 196803, "epoch": 1626} {"train_loss": -41.381343841552734, "global_step": 196804, "epoch": 1626} {"train_loss": -41.55363082885742, "global_step": 196805, "epoch": 1626} {"train_loss": -40.8713493347168, "global_step": 196806, "epoch": 1626} {"train_loss": -40.37514877319336, "global_step": 196807, "epoch": 1626} {"train_loss": -41.62466049194336, "global_step": 196808, "epoch": 1626} {"train_loss": -41.63294219970703, "global_step": 196809, "epoch": 1626} {"train_loss": -41.47243881225586, "global_step": 196810, "epoch": 1626} {"train_loss": -40.8201789855957, "global_step": 196811, "epoch": 1626} {"train_loss": -41.00086212158203, "global_step": 196812, "epoch": 1626} {"train_loss": -41.25971221923828, "global_step": 196813, "epoch": 1626} {"train_loss": -41.59249496459961, "global_step": 196814, "epoch": 1626} {"train_loss": -41.17219924926758, "global_step": 196815, "epoch": 1626} {"train_loss": -40.91091537475586, "global_step": 196816, "epoch": 1626} {"train_loss": -41.66749954223633, "global_step": 196817, "epoch": 1626} {"train_loss": -41.42986297607422, "global_step": 196818, "epoch": 1626} {"train_loss": -41.418880462646484, "global_step": 196819, "epoch": 1626} {"train_loss": -41.02654266357422, "global_step": 196820, "epoch": 1626} {"train_loss": -41.19488525390625, "global_step": 196821, "epoch": 1626} {"train_loss": -40.589839935302734, "global_step": 196822, "epoch": 1626} {"train_loss": -40.76082992553711, "global_step": 196823, "epoch": 1626} {"train_loss": -39.602169036865234, "global_step": 196824, "epoch": 1626} {"train_loss": -41.08015823364258, "global_step": 196825, "epoch": 1626} {"train_loss": -40.6212158203125, "global_step": 196826, "epoch": 1626} {"train_loss": -40.96541976928711, "global_step": 196827, "epoch": 1626} {"train_loss": -41.0496940612793, "global_step": 196828, "epoch": 1626} {"train_loss": -41.544715881347656, "global_step": 196829, "epoch": 1626} {"train_loss": -41.272682189941406, "global_step": 196830, "epoch": 1626} {"train_loss": -41.29232406616211, "global_step": 196831, "epoch": 1626} {"train_loss": -40.26372146606445, "global_step": 196832, "epoch": 1626} {"train_loss": -41.053401947021484, "global_step": 196833, "epoch": 1626} {"train_loss": -40.13103103637695, "global_step": 196834, "epoch": 1626} {"train_loss": -38.107418060302734, "global_step": 196835, "epoch": 1626} {"train_loss": -36.22882843017578, "global_step": 196836, "epoch": 1626} {"train_loss": -36.34466552734375, "global_step": 196837, "epoch": 1626} {"train_loss": -38.50537872314453, "global_step": 196838, "epoch": 1626} {"train_loss": -39.71223831176758, "global_step": 196839, "epoch": 1626} {"train_loss": -36.63859558105469, "global_step": 196840, "epoch": 1626} {"train_loss": -37.82204055786133, "global_step": 196841, "epoch": 1626} {"train_loss": -39.25305938720703, "global_step": 196842, "epoch": 1626} {"train_loss": -35.159828186035156, "global_step": 196843, "epoch": 1626} {"train_loss": -39.18185806274414, "global_step": 196844, "epoch": 1626} {"train_loss": -39.20424270629883, "global_step": 196845, "epoch": 1626} {"train_loss": -35.850093841552734, "global_step": 196846, "epoch": 1626} {"train_loss": -39.847412109375, "global_step": 196847, "epoch": 1626} {"train_loss": -36.4015007019043, "global_step": 196848, "epoch": 1626} {"train_loss": -38.62023162841797, "global_step": 196849, "epoch": 1626} {"train_loss": -40.70973587036133, "global_step": 196850, "epoch": 1626} {"train_loss": -39.04098129272461, "global_step": 196851, "epoch": 1626} {"train_loss": -40.400936126708984, "global_step": 196852, "epoch": 1626} {"train_loss": -40.09480285644531, "global_step": 196853, "epoch": 1626} {"train_loss": -41.39898681640625, "global_step": 196854, "epoch": 1626} {"train_loss": -39.7829475402832, "global_step": 196855, "epoch": 1626} {"train_loss": -40.411163330078125, "global_step": 196856, "epoch": 1626} {"train_loss": -40.240360260009766, "global_step": 196857, "epoch": 1626} {"train_loss": -40.397098541259766, "global_step": 196858, "epoch": 1626} {"train_loss": -40.32634353637695, "global_step": 196859, "epoch": 1626} {"train_loss": -40.16917419433594, "global_step": 196860, "epoch": 1626} {"train_loss": -39.94373321533203, "global_step": 196861, "epoch": 1626} {"train_loss": -40.061283111572266, "global_step": 196862, "epoch": 1626} {"train_loss": -40.97212219238281, "global_step": 196863, "epoch": 1626} {"train_loss": -40.7554931640625, "global_step": 196864, "epoch": 1626} {"train_loss": -40.811161041259766, "global_step": 196865, "epoch": 1626} {"train_loss": -39.92728651062516, "global_step": 196866, "epoch": 1626, "val_loss": 2520639.25} {"train_loss": -40.83720016479492, "global_step": 196867, "epoch": 1627} {"train_loss": -40.80159378051758, "global_step": 196868, "epoch": 1627} {"train_loss": -41.40055465698242, "global_step": 196869, "epoch": 1627} {"train_loss": -41.03196334838867, "global_step": 196870, "epoch": 1627} {"train_loss": -40.496788024902344, "global_step": 196871, "epoch": 1627} {"train_loss": -41.022212982177734, "global_step": 196872, "epoch": 1627} {"train_loss": -41.50980758666992, "global_step": 196873, "epoch": 1627} {"train_loss": -41.67403793334961, "global_step": 196874, "epoch": 1627} {"train_loss": -41.57619857788086, "global_step": 196875, "epoch": 1627} {"train_loss": -41.50246810913086, "global_step": 196876, "epoch": 1627} {"train_loss": -41.436126708984375, "global_step": 196877, "epoch": 1627} {"train_loss": -41.55280303955078, "global_step": 196878, "epoch": 1627} {"train_loss": -40.867610931396484, "global_step": 196879, "epoch": 1627} {"train_loss": -41.52834701538086, "global_step": 196880, "epoch": 1627} {"train_loss": -41.46533203125, "global_step": 196881, "epoch": 1627} {"train_loss": -41.396461486816406, "global_step": 196882, "epoch": 1627} {"train_loss": -41.738040924072266, "global_step": 196883, "epoch": 1627} {"train_loss": -40.692779541015625, "global_step": 196884, "epoch": 1627} {"train_loss": -41.4443359375, "global_step": 196885, "epoch": 1627} {"train_loss": -41.01667404174805, "global_step": 196886, "epoch": 1627} {"train_loss": -41.48903274536133, "global_step": 196887, "epoch": 1627} {"train_loss": -41.59260177612305, "global_step": 196888, "epoch": 1627} {"train_loss": -41.70565414428711, "global_step": 196889, "epoch": 1627} {"train_loss": -41.0423583984375, "global_step": 196890, "epoch": 1627} {"train_loss": -42.00468826293945, "global_step": 196891, "epoch": 1627} {"train_loss": -41.513694763183594, "global_step": 196892, "epoch": 1627} {"train_loss": -41.66515350341797, "global_step": 196893, "epoch": 1627} {"train_loss": -41.81074142456055, "global_step": 196894, "epoch": 1627} {"train_loss": -41.67634201049805, "global_step": 196895, "epoch": 1627} {"train_loss": -41.1766471862793, "global_step": 196896, "epoch": 1627} {"train_loss": -40.89360427856445, "global_step": 196897, "epoch": 1627} {"train_loss": -41.65142822265625, "global_step": 196898, "epoch": 1627} {"train_loss": -42.079524993896484, "global_step": 196899, "epoch": 1627} {"train_loss": -41.5487174987793, "global_step": 196900, "epoch": 1627} {"train_loss": -41.83346176147461, "global_step": 196901, "epoch": 1627} {"train_loss": -42.124961853027344, "global_step": 196902, "epoch": 1627} {"train_loss": -41.59710693359375, "global_step": 196903, "epoch": 1627} {"train_loss": -42.25230407714844, "global_step": 196904, "epoch": 1627} {"train_loss": -42.0055046081543, "global_step": 196905, "epoch": 1627} {"train_loss": -41.9299201965332, "global_step": 196906, "epoch": 1627} {"train_loss": -41.82200241088867, "global_step": 196907, "epoch": 1627} {"train_loss": -40.59425354003906, "global_step": 196908, "epoch": 1627} {"train_loss": -40.63454055786133, "global_step": 196909, "epoch": 1627} {"train_loss": -37.797035217285156, "global_step": 196910, "epoch": 1627} {"train_loss": -39.30593490600586, "global_step": 196911, "epoch": 1627} {"train_loss": -40.58779525756836, "global_step": 196912, "epoch": 1627} {"train_loss": -40.47328186035156, "global_step": 196913, "epoch": 1627} {"train_loss": -41.00106430053711, "global_step": 196914, "epoch": 1627} {"train_loss": -40.960601806640625, "global_step": 196915, "epoch": 1627} {"train_loss": -39.39912033081055, "global_step": 196916, "epoch": 1627} {"train_loss": -35.51850509643555, "global_step": 196917, "epoch": 1627} {"train_loss": -36.16128921508789, "global_step": 196918, "epoch": 1627} {"train_loss": -40.42376708984375, "global_step": 196919, "epoch": 1627} {"train_loss": -40.862422943115234, "global_step": 196920, "epoch": 1627} {"train_loss": -39.34357452392578, "global_step": 196921, "epoch": 1627} {"train_loss": -39.77181625366211, "global_step": 196922, "epoch": 1627} {"train_loss": -41.842872619628906, "global_step": 196923, "epoch": 1627} {"train_loss": -40.300079345703125, "global_step": 196924, "epoch": 1627} {"train_loss": -40.36373519897461, "global_step": 196925, "epoch": 1627} {"train_loss": -41.276466369628906, "global_step": 196926, "epoch": 1627} {"train_loss": -40.67744064331055, "global_step": 196927, "epoch": 1627} {"train_loss": -41.346309661865234, "global_step": 196928, "epoch": 1627} {"train_loss": -40.91482162475586, "global_step": 196929, "epoch": 1627} {"train_loss": -41.61872100830078, "global_step": 196930, "epoch": 1627} {"train_loss": -41.408016204833984, "global_step": 196931, "epoch": 1627} {"train_loss": -42.1485595703125, "global_step": 196932, "epoch": 1627} {"train_loss": -40.664886474609375, "global_step": 196933, "epoch": 1627} {"train_loss": -40.43983459472656, "global_step": 196934, "epoch": 1627} {"train_loss": -40.5029182434082, "global_step": 196935, "epoch": 1627} {"train_loss": -39.872798919677734, "global_step": 196936, "epoch": 1627} {"train_loss": -41.02895736694336, "global_step": 196937, "epoch": 1627} {"train_loss": -41.355018615722656, "global_step": 196938, "epoch": 1627} {"train_loss": -40.66305160522461, "global_step": 196939, "epoch": 1627} {"train_loss": -41.920631408691406, "global_step": 196940, "epoch": 1627} {"train_loss": -40.609764099121094, "global_step": 196941, "epoch": 1627} {"train_loss": -40.12984848022461, "global_step": 196942, "epoch": 1627} {"train_loss": -40.47736740112305, "global_step": 196943, "epoch": 1627} {"train_loss": -40.63869094848633, "global_step": 196944, "epoch": 1627} {"train_loss": -41.16294479370117, "global_step": 196945, "epoch": 1627} {"train_loss": -40.77311325073242, "global_step": 196946, "epoch": 1627} {"train_loss": -41.35378646850586, "global_step": 196947, "epoch": 1627} {"train_loss": -40.552608489990234, "global_step": 196948, "epoch": 1627} {"train_loss": -40.9730339050293, "global_step": 196949, "epoch": 1627} {"train_loss": -39.436153411865234, "global_step": 196950, "epoch": 1627} {"train_loss": -41.00796127319336, "global_step": 196951, "epoch": 1627} {"train_loss": -41.34865951538086, "global_step": 196952, "epoch": 1627} {"train_loss": -41.16901779174805, "global_step": 196953, "epoch": 1627} {"train_loss": -41.303558349609375, "global_step": 196954, "epoch": 1627} {"train_loss": -41.33259582519531, "global_step": 196955, "epoch": 1627} {"train_loss": -40.99250411987305, "global_step": 196956, "epoch": 1627} {"train_loss": -41.72206497192383, "global_step": 196957, "epoch": 1627} {"train_loss": -42.177852630615234, "global_step": 196958, "epoch": 1627} {"train_loss": -41.13087844848633, "global_step": 196959, "epoch": 1627} {"train_loss": -41.0465202331543, "global_step": 196960, "epoch": 1627} {"train_loss": -41.61781692504883, "global_step": 196961, "epoch": 1627} {"train_loss": -39.11936569213867, "global_step": 196962, "epoch": 1627} {"train_loss": -41.20725631713867, "global_step": 196963, "epoch": 1627} {"train_loss": -40.81781768798828, "global_step": 196964, "epoch": 1627} {"train_loss": -41.571685791015625, "global_step": 196965, "epoch": 1627} {"train_loss": -40.82696533203125, "global_step": 196966, "epoch": 1627} {"train_loss": -39.9737548828125, "global_step": 196967, "epoch": 1627} {"train_loss": -40.090362548828125, "global_step": 196968, "epoch": 1627} {"train_loss": -39.361061096191406, "global_step": 196969, "epoch": 1627} {"train_loss": -41.110816955566406, "global_step": 196970, "epoch": 1627} {"train_loss": -41.45905685424805, "global_step": 196971, "epoch": 1627} {"train_loss": -39.118526458740234, "global_step": 196972, "epoch": 1627} {"train_loss": -39.29115676879883, "global_step": 196973, "epoch": 1627} {"train_loss": -32.86238479614258, "global_step": 196974, "epoch": 1627} {"train_loss": -38.87815856933594, "global_step": 196975, "epoch": 1627} {"train_loss": -36.39561080932617, "global_step": 196976, "epoch": 1627} {"train_loss": -39.946231842041016, "global_step": 196977, "epoch": 1627} {"train_loss": -37.39496994018555, "global_step": 196978, "epoch": 1627} {"train_loss": -40.014034271240234, "global_step": 196979, "epoch": 1627} {"train_loss": -40.49540328979492, "global_step": 196980, "epoch": 1627} {"train_loss": -39.93225860595703, "global_step": 196981, "epoch": 1627} {"train_loss": -38.62398910522461, "global_step": 196982, "epoch": 1627} {"train_loss": -40.109493255615234, "global_step": 196983, "epoch": 1627} {"train_loss": -40.26559066772461, "global_step": 196984, "epoch": 1627} {"train_loss": -40.13128662109375, "global_step": 196985, "epoch": 1627} {"train_loss": -40.2862663269043, "global_step": 196986, "epoch": 1627} {"train_loss": -40.67744133689187, "global_step": 196987, "epoch": 1627, "val_loss": 2556711.75} {"train_loss": -40.55929183959961, "global_step": 196988, "epoch": 1628} {"train_loss": -40.939552307128906, "global_step": 196989, "epoch": 1628} {"train_loss": -41.0628776550293, "global_step": 196990, "epoch": 1628} {"train_loss": -40.79997634887695, "global_step": 196991, "epoch": 1628} {"train_loss": -40.8037223815918, "global_step": 196992, "epoch": 1628} {"train_loss": -38.762020111083984, "global_step": 196993, "epoch": 1628} {"train_loss": -39.89039993286133, "global_step": 196994, "epoch": 1628} {"train_loss": -40.71194076538086, "global_step": 196995, "epoch": 1628} {"train_loss": -40.07951736450195, "global_step": 196996, "epoch": 1628} {"train_loss": -36.9770622253418, "global_step": 196997, "epoch": 1628} {"train_loss": -39.77680587768555, "global_step": 196998, "epoch": 1628} {"train_loss": -40.41236114501953, "global_step": 196999, "epoch": 1628} {"train_loss": -40.21827697753906, "global_step": 197000, "epoch": 1628} {"train_loss": -39.305145263671875, "global_step": 197001, "epoch": 1628} {"train_loss": -40.32637405395508, "global_step": 197002, "epoch": 1628} {"train_loss": -40.75522994995117, "global_step": 197003, "epoch": 1628} {"train_loss": -41.86668014526367, "global_step": 197004, "epoch": 1628} {"train_loss": -40.53765869140625, "global_step": 197005, "epoch": 1628} {"train_loss": -40.94558334350586, "global_step": 197006, "epoch": 1628} {"train_loss": -41.147857666015625, "global_step": 197007, "epoch": 1628} {"train_loss": -41.17036056518555, "global_step": 197008, "epoch": 1628} {"train_loss": -41.80116653442383, "global_step": 197009, "epoch": 1628} {"train_loss": -40.51548385620117, "global_step": 197010, "epoch": 1628} {"train_loss": -41.346046447753906, "global_step": 197011, "epoch": 1628} {"train_loss": -40.2274284362793, "global_step": 197012, "epoch": 1628} {"train_loss": -41.90098190307617, "global_step": 197013, "epoch": 1628} {"train_loss": -41.17749786376953, "global_step": 197014, "epoch": 1628} {"train_loss": -41.79724884033203, "global_step": 197015, "epoch": 1628} {"train_loss": -41.77096939086914, "global_step": 197016, "epoch": 1628} {"train_loss": -41.617820739746094, "global_step": 197017, "epoch": 1628} {"train_loss": -40.8963623046875, "global_step": 197018, "epoch": 1628} {"train_loss": -40.64054489135742, "global_step": 197019, "epoch": 1628} {"train_loss": -39.68040466308594, "global_step": 197020, "epoch": 1628} {"train_loss": -40.83989334106445, "global_step": 197021, "epoch": 1628} {"train_loss": -40.976104736328125, "global_step": 197022, "epoch": 1628} {"train_loss": -40.826473236083984, "global_step": 197023, "epoch": 1628} {"train_loss": -40.75187301635742, "global_step": 197024, "epoch": 1628} {"train_loss": -39.644569396972656, "global_step": 197025, "epoch": 1628} {"train_loss": -40.90735626220703, "global_step": 197026, "epoch": 1628} {"train_loss": -42.026309967041016, "global_step": 197027, "epoch": 1628} {"train_loss": -40.98062515258789, "global_step": 197028, "epoch": 1628} {"train_loss": -41.178470611572266, "global_step": 197029, "epoch": 1628} {"train_loss": -39.80955123901367, "global_step": 197030, "epoch": 1628} {"train_loss": -41.661285400390625, "global_step": 197031, "epoch": 1628} {"train_loss": -39.0695915222168, "global_step": 197032, "epoch": 1628} {"train_loss": -40.612876892089844, "global_step": 197033, "epoch": 1628} {"train_loss": -41.25197219848633, "global_step": 197034, "epoch": 1628} {"train_loss": -40.50884246826172, "global_step": 197035, "epoch": 1628} {"train_loss": -36.298736572265625, "global_step": 197036, "epoch": 1628} {"train_loss": -40.28351974487305, "global_step": 197037, "epoch": 1628} {"train_loss": -40.487300872802734, "global_step": 197038, "epoch": 1628} {"train_loss": -41.1125602722168, "global_step": 197039, "epoch": 1628} {"train_loss": -39.47996139526367, "global_step": 197040, "epoch": 1628} {"train_loss": -40.42933654785156, "global_step": 197041, "epoch": 1628} {"train_loss": -40.57015609741211, "global_step": 197042, "epoch": 1628} {"train_loss": -39.43247604370117, "global_step": 197043, "epoch": 1628} {"train_loss": -40.72304153442383, "global_step": 197044, "epoch": 1628} {"train_loss": -40.74753189086914, "global_step": 197045, "epoch": 1628} {"train_loss": -39.95869064331055, "global_step": 197046, "epoch": 1628} {"train_loss": -41.12105178833008, "global_step": 197047, "epoch": 1628} {"train_loss": -41.04514694213867, "global_step": 197048, "epoch": 1628} {"train_loss": -38.883827209472656, "global_step": 197049, "epoch": 1628} {"train_loss": -41.324214935302734, "global_step": 197050, "epoch": 1628} {"train_loss": -40.618125915527344, "global_step": 197051, "epoch": 1628} {"train_loss": -40.44462203979492, "global_step": 197052, "epoch": 1628} {"train_loss": -41.14996337890625, "global_step": 197053, "epoch": 1628} {"train_loss": -41.74141311645508, "global_step": 197054, "epoch": 1628} {"train_loss": -41.3298454284668, "global_step": 197055, "epoch": 1628} {"train_loss": -39.15926742553711, "global_step": 197056, "epoch": 1628} {"train_loss": -40.21225357055664, "global_step": 197057, "epoch": 1628} {"train_loss": -39.002140045166016, "global_step": 197058, "epoch": 1628} {"train_loss": -40.71417236328125, "global_step": 197059, "epoch": 1628} {"train_loss": -40.413795471191406, "global_step": 197060, "epoch": 1628} {"train_loss": -41.30930709838867, "global_step": 197061, "epoch": 1628} {"train_loss": -40.833885192871094, "global_step": 197062, "epoch": 1628} {"train_loss": -40.169471740722656, "global_step": 197063, "epoch": 1628} {"train_loss": -39.198646545410156, "global_step": 197064, "epoch": 1628} {"train_loss": -40.468780517578125, "global_step": 197065, "epoch": 1628} {"train_loss": -40.043251037597656, "global_step": 197066, "epoch": 1628} {"train_loss": -39.46023178100586, "global_step": 197067, "epoch": 1628} {"train_loss": -39.4908447265625, "global_step": 197068, "epoch": 1628} {"train_loss": -39.80743408203125, "global_step": 197069, "epoch": 1628} {"train_loss": -41.13800048828125, "global_step": 197070, "epoch": 1628} {"train_loss": -40.4985466003418, "global_step": 197071, "epoch": 1628} {"train_loss": -39.41096115112305, "global_step": 197072, "epoch": 1628} {"train_loss": -39.41022872924805, "global_step": 197073, "epoch": 1628} {"train_loss": -41.17399215698242, "global_step": 197074, "epoch": 1628} {"train_loss": -39.523494720458984, "global_step": 197075, "epoch": 1628} {"train_loss": -38.31122589111328, "global_step": 197076, "epoch": 1628} {"train_loss": -38.905479431152344, "global_step": 197077, "epoch": 1628} {"train_loss": -40.50716018676758, "global_step": 197078, "epoch": 1628} {"train_loss": -38.45832824707031, "global_step": 197079, "epoch": 1628} {"train_loss": -40.90049362182617, "global_step": 197080, "epoch": 1628} {"train_loss": -40.438720703125, "global_step": 197081, "epoch": 1628} {"train_loss": -40.1497802734375, "global_step": 197082, "epoch": 1628} {"train_loss": -40.797183990478516, "global_step": 197083, "epoch": 1628} {"train_loss": -39.28116989135742, "global_step": 197084, "epoch": 1628} {"train_loss": -40.750125885009766, "global_step": 197085, "epoch": 1628} {"train_loss": -40.86688995361328, "global_step": 197086, "epoch": 1628} {"train_loss": -38.85923385620117, "global_step": 197087, "epoch": 1628} {"train_loss": -38.18904495239258, "global_step": 197088, "epoch": 1628} {"train_loss": -40.863258361816406, "global_step": 197089, "epoch": 1628} {"train_loss": -39.34682083129883, "global_step": 197090, "epoch": 1628} {"train_loss": -40.17139434814453, "global_step": 197091, "epoch": 1628} {"train_loss": -40.88920593261719, "global_step": 197092, "epoch": 1628} {"train_loss": -40.46976089477539, "global_step": 197093, "epoch": 1628} {"train_loss": -40.83989334106445, "global_step": 197094, "epoch": 1628} {"train_loss": -41.08990478515625, "global_step": 197095, "epoch": 1628} {"train_loss": -40.639278411865234, "global_step": 197096, "epoch": 1628} {"train_loss": -40.74832534790039, "global_step": 197097, "epoch": 1628} {"train_loss": -40.4503059387207, "global_step": 197098, "epoch": 1628} {"train_loss": -40.83900833129883, "global_step": 197099, "epoch": 1628} {"train_loss": -41.2588005065918, "global_step": 197100, "epoch": 1628} {"train_loss": -40.708709716796875, "global_step": 197101, "epoch": 1628} {"train_loss": -41.10377502441406, "global_step": 197102, "epoch": 1628} {"train_loss": -41.202022552490234, "global_step": 197103, "epoch": 1628} {"train_loss": -41.43976593017578, "global_step": 197104, "epoch": 1628} {"train_loss": -41.077510833740234, "global_step": 197105, "epoch": 1628} {"train_loss": -41.414424896240234, "global_step": 197106, "epoch": 1628} {"train_loss": -40.54176330566406, "global_step": 197107, "epoch": 1628} {"train_loss": -40.43894517126162, "global_step": 197108, "epoch": 1628, "val_loss": 2572639.0} {"train_loss": -39.272830963134766, "global_step": 197109, "epoch": 1629} {"train_loss": -40.200408935546875, "global_step": 197110, "epoch": 1629} {"train_loss": -41.44266891479492, "global_step": 197111, "epoch": 1629} {"train_loss": -41.9519157409668, "global_step": 197112, "epoch": 1629} {"train_loss": -41.312538146972656, "global_step": 197113, "epoch": 1629} {"train_loss": -41.21119689941406, "global_step": 197114, "epoch": 1629} {"train_loss": -41.69607162475586, "global_step": 197115, "epoch": 1629} {"train_loss": -41.161956787109375, "global_step": 197116, "epoch": 1629} {"train_loss": -40.99369430541992, "global_step": 197117, "epoch": 1629} {"train_loss": -41.943824768066406, "global_step": 197118, "epoch": 1629} {"train_loss": -41.578861236572266, "global_step": 197119, "epoch": 1629} {"train_loss": -41.14957809448242, "global_step": 197120, "epoch": 1629} {"train_loss": -41.63564682006836, "global_step": 197121, "epoch": 1629} {"train_loss": -41.210182189941406, "global_step": 197122, "epoch": 1629} {"train_loss": -41.992347717285156, "global_step": 197123, "epoch": 1629} {"train_loss": -41.22734832763672, "global_step": 197124, "epoch": 1629} {"train_loss": -41.88576889038086, "global_step": 197125, "epoch": 1629} {"train_loss": -42.09737014770508, "global_step": 197126, "epoch": 1629} {"train_loss": -40.980918884277344, "global_step": 197127, "epoch": 1629} {"train_loss": -41.837005615234375, "global_step": 197128, "epoch": 1629} {"train_loss": -41.999820709228516, "global_step": 197129, "epoch": 1629} {"train_loss": -41.809173583984375, "global_step": 197130, "epoch": 1629} {"train_loss": -41.75020217895508, "global_step": 197131, "epoch": 1629} {"train_loss": -41.80339813232422, "global_step": 197132, "epoch": 1629} {"train_loss": -41.68473434448242, "global_step": 197133, "epoch": 1629} {"train_loss": -41.84486770629883, "global_step": 197134, "epoch": 1629} {"train_loss": -41.89955520629883, "global_step": 197135, "epoch": 1629} {"train_loss": -41.8077507019043, "global_step": 197136, "epoch": 1629} {"train_loss": -42.00033950805664, "global_step": 197137, "epoch": 1629} {"train_loss": -40.58484649658203, "global_step": 197138, "epoch": 1629} {"train_loss": -40.578773498535156, "global_step": 197139, "epoch": 1629} {"train_loss": -39.01457595825195, "global_step": 197140, "epoch": 1629} {"train_loss": -38.47669219970703, "global_step": 197141, "epoch": 1629} {"train_loss": -41.00584411621094, "global_step": 197142, "epoch": 1629} {"train_loss": -42.260223388671875, "global_step": 197143, "epoch": 1629} {"train_loss": -39.803855895996094, "global_step": 197144, "epoch": 1629} {"train_loss": -39.58853530883789, "global_step": 197145, "epoch": 1629} {"train_loss": -41.02925491333008, "global_step": 197146, "epoch": 1629} {"train_loss": -41.7869987487793, "global_step": 197147, "epoch": 1629} {"train_loss": -39.66416549682617, "global_step": 197148, "epoch": 1629} {"train_loss": -41.118873596191406, "global_step": 197149, "epoch": 1629} {"train_loss": -42.18967819213867, "global_step": 197150, "epoch": 1629} {"train_loss": -41.86497497558594, "global_step": 197151, "epoch": 1629} {"train_loss": -41.75337219238281, "global_step": 197152, "epoch": 1629} {"train_loss": -41.12014389038086, "global_step": 197153, "epoch": 1629} {"train_loss": -40.93014144897461, "global_step": 197154, "epoch": 1629} {"train_loss": -41.352901458740234, "global_step": 197155, "epoch": 1629} {"train_loss": -41.39601516723633, "global_step": 197156, "epoch": 1629} {"train_loss": -41.57804870605469, "global_step": 197157, "epoch": 1629} {"train_loss": -41.64409637451172, "global_step": 197158, "epoch": 1629} {"train_loss": -41.2822265625, "global_step": 197159, "epoch": 1629} {"train_loss": -41.79207229614258, "global_step": 197160, "epoch": 1629} {"train_loss": -41.757320404052734, "global_step": 197161, "epoch": 1629} {"train_loss": -42.114253997802734, "global_step": 197162, "epoch": 1629} {"train_loss": -41.317962646484375, "global_step": 197163, "epoch": 1629} {"train_loss": -42.09072494506836, "global_step": 197164, "epoch": 1629} {"train_loss": -42.4489860534668, "global_step": 197165, "epoch": 1629} {"train_loss": -41.58726119995117, "global_step": 197166, "epoch": 1629} {"train_loss": -41.71308135986328, "global_step": 197167, "epoch": 1629} {"train_loss": -41.73862838745117, "global_step": 197168, "epoch": 1629} {"train_loss": -41.458560943603516, "global_step": 197169, "epoch": 1629} {"train_loss": -41.841949462890625, "global_step": 197170, "epoch": 1629} {"train_loss": -41.939117431640625, "global_step": 197171, "epoch": 1629} {"train_loss": -40.831607818603516, "global_step": 197172, "epoch": 1629} {"train_loss": -41.238765716552734, "global_step": 197173, "epoch": 1629} {"train_loss": -41.3889274597168, "global_step": 197174, "epoch": 1629} {"train_loss": -41.51810836791992, "global_step": 197175, "epoch": 1629} {"train_loss": -40.8799934387207, "global_step": 197176, "epoch": 1629} {"train_loss": -40.87472152709961, "global_step": 197177, "epoch": 1629} {"train_loss": -39.80646896362305, "global_step": 197178, "epoch": 1629} {"train_loss": -39.12946319580078, "global_step": 197179, "epoch": 1629} {"train_loss": -35.84206771850586, "global_step": 197180, "epoch": 1629} {"train_loss": -37.8240966796875, "global_step": 197181, "epoch": 1629} {"train_loss": -40.11769104003906, "global_step": 197182, "epoch": 1629} {"train_loss": -40.284847259521484, "global_step": 197183, "epoch": 1629} {"train_loss": -38.51019287109375, "global_step": 197184, "epoch": 1629} {"train_loss": -35.552669525146484, "global_step": 197185, "epoch": 1629} {"train_loss": -38.64714813232422, "global_step": 197186, "epoch": 1629} {"train_loss": -41.171112060546875, "global_step": 197187, "epoch": 1629} {"train_loss": -39.37403106689453, "global_step": 197188, "epoch": 1629} {"train_loss": -39.47554397583008, "global_step": 197189, "epoch": 1629} {"train_loss": -40.28743362426758, "global_step": 197190, "epoch": 1629} {"train_loss": -40.04404067993164, "global_step": 197191, "epoch": 1629} {"train_loss": -40.94293212890625, "global_step": 197192, "epoch": 1629} {"train_loss": -39.9804801940918, "global_step": 197193, "epoch": 1629} {"train_loss": -40.82373809814453, "global_step": 197194, "epoch": 1629} {"train_loss": -40.7733039855957, "global_step": 197195, "epoch": 1629} {"train_loss": -39.91472244262695, "global_step": 197196, "epoch": 1629} {"train_loss": -41.11444091796875, "global_step": 197197, "epoch": 1629} {"train_loss": -40.245635986328125, "global_step": 197198, "epoch": 1629} {"train_loss": -41.24474334716797, "global_step": 197199, "epoch": 1629} {"train_loss": -40.914119720458984, "global_step": 197200, "epoch": 1629} {"train_loss": -40.190250396728516, "global_step": 197201, "epoch": 1629} {"train_loss": -41.14289474487305, "global_step": 197202, "epoch": 1629} {"train_loss": -41.18770980834961, "global_step": 197203, "epoch": 1629} {"train_loss": -40.53064727783203, "global_step": 197204, "epoch": 1629} {"train_loss": -41.187225341796875, "global_step": 197205, "epoch": 1629} {"train_loss": -40.43000411987305, "global_step": 197206, "epoch": 1629} {"train_loss": -41.22520065307617, "global_step": 197207, "epoch": 1629} {"train_loss": -39.9754753112793, "global_step": 197208, "epoch": 1629} {"train_loss": -40.91654586791992, "global_step": 197209, "epoch": 1629} {"train_loss": -40.63987350463867, "global_step": 197210, "epoch": 1629} {"train_loss": -40.07760238647461, "global_step": 197211, "epoch": 1629} {"train_loss": -40.968753814697266, "global_step": 197212, "epoch": 1629} {"train_loss": -39.813392639160156, "global_step": 197213, "epoch": 1629} {"train_loss": -41.059425354003906, "global_step": 197214, "epoch": 1629} {"train_loss": -41.32105255126953, "global_step": 197215, "epoch": 1629} {"train_loss": -40.14228057861328, "global_step": 197216, "epoch": 1629} {"train_loss": -40.97774887084961, "global_step": 197217, "epoch": 1629} {"train_loss": -41.51542282104492, "global_step": 197218, "epoch": 1629} {"train_loss": -41.41218185424805, "global_step": 197219, "epoch": 1629} {"train_loss": -40.830440521240234, "global_step": 197220, "epoch": 1629} {"train_loss": -41.976715087890625, "global_step": 197221, "epoch": 1629} {"train_loss": -41.31608963012695, "global_step": 197222, "epoch": 1629} {"train_loss": -42.24137496948242, "global_step": 197223, "epoch": 1629} {"train_loss": -41.851600646972656, "global_step": 197224, "epoch": 1629} {"train_loss": -41.50148010253906, "global_step": 197225, "epoch": 1629} {"train_loss": -41.621150970458984, "global_step": 197226, "epoch": 1629} {"train_loss": -41.832977294921875, "global_step": 197227, "epoch": 1629} {"train_loss": -41.833858489990234, "global_step": 197228, "epoch": 1629} {"train_loss": -40.952459823986715, "global_step": 197229, "epoch": 1629, "val_loss": 2551716.25} {"train_loss": -41.63907241821289, "global_step": 197230, "epoch": 1630} {"train_loss": -41.177677154541016, "global_step": 197231, "epoch": 1630} {"train_loss": -41.692195892333984, "global_step": 197232, "epoch": 1630} {"train_loss": -41.514373779296875, "global_step": 197233, "epoch": 1630} {"train_loss": -40.93117141723633, "global_step": 197234, "epoch": 1630} {"train_loss": -41.2904167175293, "global_step": 197235, "epoch": 1630} {"train_loss": -41.1611442565918, "global_step": 197236, "epoch": 1630} {"train_loss": -41.15596389770508, "global_step": 197237, "epoch": 1630} {"train_loss": -41.71601867675781, "global_step": 197238, "epoch": 1630} {"train_loss": -41.22105026245117, "global_step": 197239, "epoch": 1630} {"train_loss": -40.156593322753906, "global_step": 197240, "epoch": 1630} {"train_loss": -41.64077377319336, "global_step": 197241, "epoch": 1630} {"train_loss": -40.51615905761719, "global_step": 197242, "epoch": 1630} {"train_loss": -41.35561752319336, "global_step": 197243, "epoch": 1630} {"train_loss": -41.01136779785156, "global_step": 197244, "epoch": 1630} {"train_loss": -40.90644454956055, "global_step": 197245, "epoch": 1630} {"train_loss": -39.8717155456543, "global_step": 197246, "epoch": 1630} {"train_loss": -40.25263595581055, "global_step": 197247, "epoch": 1630} {"train_loss": -40.81767654418945, "global_step": 197248, "epoch": 1630} {"train_loss": -38.1185188293457, "global_step": 197249, "epoch": 1630} {"train_loss": -40.01424026489258, "global_step": 197250, "epoch": 1630} {"train_loss": -39.767330169677734, "global_step": 197251, "epoch": 1630} {"train_loss": -38.6108512878418, "global_step": 197252, "epoch": 1630} {"train_loss": -39.7558708190918, "global_step": 197253, "epoch": 1630} {"train_loss": -40.41587448120117, "global_step": 197254, "epoch": 1630} {"train_loss": -37.28908920288086, "global_step": 197255, "epoch": 1630} {"train_loss": -39.087127685546875, "global_step": 197256, "epoch": 1630} {"train_loss": -39.60575485229492, "global_step": 197257, "epoch": 1630} {"train_loss": -40.12144088745117, "global_step": 197258, "epoch": 1630} {"train_loss": -40.2279167175293, "global_step": 197259, "epoch": 1630} {"train_loss": -39.15950393676758, "global_step": 197260, "epoch": 1630} {"train_loss": -40.27147674560547, "global_step": 197261, "epoch": 1630} {"train_loss": -38.6909294128418, "global_step": 197262, "epoch": 1630} {"train_loss": -40.166015625, "global_step": 197263, "epoch": 1630} {"train_loss": -39.602134704589844, "global_step": 197264, "epoch": 1630} {"train_loss": -41.21238327026367, "global_step": 197265, "epoch": 1630} {"train_loss": -39.1777229309082, "global_step": 197266, "epoch": 1630} {"train_loss": -39.28121566772461, "global_step": 197267, "epoch": 1630} {"train_loss": -39.92525863647461, "global_step": 197268, "epoch": 1630} {"train_loss": -40.23427200317383, "global_step": 197269, "epoch": 1630} {"train_loss": -40.11655807495117, "global_step": 197270, "epoch": 1630} {"train_loss": -40.873382568359375, "global_step": 197271, "epoch": 1630} {"train_loss": -40.91650390625, "global_step": 197272, "epoch": 1630} {"train_loss": -39.881038665771484, "global_step": 197273, "epoch": 1630} {"train_loss": -39.19240951538086, "global_step": 197274, "epoch": 1630} {"train_loss": -40.40817642211914, "global_step": 197275, "epoch": 1630} {"train_loss": -39.22172164916992, "global_step": 197276, "epoch": 1630} {"train_loss": -41.06306076049805, "global_step": 197277, "epoch": 1630} {"train_loss": -41.063507080078125, "global_step": 197278, "epoch": 1630} {"train_loss": -41.353004455566406, "global_step": 197279, "epoch": 1630} {"train_loss": -41.520626068115234, "global_step": 197280, "epoch": 1630} {"train_loss": -40.30098342895508, "global_step": 197281, "epoch": 1630} {"train_loss": -40.44732666015625, "global_step": 197282, "epoch": 1630} {"train_loss": -41.6875114440918, "global_step": 197283, "epoch": 1630} {"train_loss": -41.56549835205078, "global_step": 197284, "epoch": 1630} {"train_loss": -40.466888427734375, "global_step": 197285, "epoch": 1630} {"train_loss": -39.25302505493164, "global_step": 197286, "epoch": 1630} {"train_loss": -35.92399215698242, "global_step": 197287, "epoch": 1630} {"train_loss": -40.74286651611328, "global_step": 197288, "epoch": 1630} {"train_loss": -40.379241943359375, "global_step": 197289, "epoch": 1630} {"train_loss": -40.67911911010742, "global_step": 197290, "epoch": 1630} {"train_loss": -34.50863265991211, "global_step": 197291, "epoch": 1630} {"train_loss": -40.741111755371094, "global_step": 197292, "epoch": 1630} {"train_loss": -39.01845169067383, "global_step": 197293, "epoch": 1630} {"train_loss": -36.92965316772461, "global_step": 197294, "epoch": 1630} {"train_loss": -37.927589416503906, "global_step": 197295, "epoch": 1630} {"train_loss": -41.715965270996094, "global_step": 197296, "epoch": 1630} {"train_loss": -39.953243255615234, "global_step": 197297, "epoch": 1630} {"train_loss": -39.37667465209961, "global_step": 197298, "epoch": 1630} {"train_loss": -41.27346420288086, "global_step": 197299, "epoch": 1630} {"train_loss": -35.754329681396484, "global_step": 197300, "epoch": 1630} {"train_loss": -37.13556671142578, "global_step": 197301, "epoch": 1630} {"train_loss": -37.36507797241211, "global_step": 197302, "epoch": 1630} {"train_loss": -35.43940353393555, "global_step": 197303, "epoch": 1630} {"train_loss": -38.1307487487793, "global_step": 197304, "epoch": 1630} {"train_loss": -36.0754508972168, "global_step": 197305, "epoch": 1630} {"train_loss": -38.4775505065918, "global_step": 197306, "epoch": 1630} {"train_loss": -40.151424407958984, "global_step": 197307, "epoch": 1630} {"train_loss": -36.60116958618164, "global_step": 197308, "epoch": 1630} {"train_loss": -38.44460678100586, "global_step": 197309, "epoch": 1630} {"train_loss": -36.02397537231445, "global_step": 197310, "epoch": 1630} {"train_loss": -36.44810104370117, "global_step": 197311, "epoch": 1630} {"train_loss": -38.00932312011719, "global_step": 197312, "epoch": 1630} {"train_loss": -40.12778091430664, "global_step": 197313, "epoch": 1630} {"train_loss": -34.18663787841797, "global_step": 197314, "epoch": 1630} {"train_loss": -40.22005844116211, "global_step": 197315, "epoch": 1630} {"train_loss": -37.44845199584961, "global_step": 197316, "epoch": 1630} {"train_loss": -38.11766052246094, "global_step": 197317, "epoch": 1630} {"train_loss": -38.31523132324219, "global_step": 197318, "epoch": 1630} {"train_loss": -41.21293258666992, "global_step": 197319, "epoch": 1630} {"train_loss": -40.08100509643555, "global_step": 197320, "epoch": 1630} {"train_loss": -35.04107666015625, "global_step": 197321, "epoch": 1630} {"train_loss": -36.61199951171875, "global_step": 197322, "epoch": 1630} {"train_loss": -37.506019592285156, "global_step": 197323, "epoch": 1630} {"train_loss": -39.2813606262207, "global_step": 197324, "epoch": 1630} {"train_loss": -39.69464874267578, "global_step": 197325, "epoch": 1630} {"train_loss": -38.40720748901367, "global_step": 197326, "epoch": 1630} {"train_loss": -37.75034713745117, "global_step": 197327, "epoch": 1630} {"train_loss": -38.09265899658203, "global_step": 197328, "epoch": 1630} {"train_loss": -37.712181091308594, "global_step": 197329, "epoch": 1630} {"train_loss": -38.82929229736328, "global_step": 197330, "epoch": 1630} {"train_loss": -38.329830169677734, "global_step": 197331, "epoch": 1630} {"train_loss": -36.171112060546875, "global_step": 197332, "epoch": 1630} {"train_loss": -29.91953468322754, "global_step": 197333, "epoch": 1630} {"train_loss": -39.551109313964844, "global_step": 197334, "epoch": 1630} {"train_loss": -39.140472412109375, "global_step": 197335, "epoch": 1630} {"train_loss": -37.79558181762695, "global_step": 197336, "epoch": 1630} {"train_loss": -38.75835418701172, "global_step": 197337, "epoch": 1630} {"train_loss": -37.540794372558594, "global_step": 197338, "epoch": 1630} {"train_loss": -39.37177658081055, "global_step": 197339, "epoch": 1630} {"train_loss": -39.68416213989258, "global_step": 197340, "epoch": 1630} {"train_loss": -40.42946243286133, "global_step": 197341, "epoch": 1630} {"train_loss": -36.75534439086914, "global_step": 197342, "epoch": 1630} {"train_loss": -37.32193374633789, "global_step": 197343, "epoch": 1630} {"train_loss": -38.79488754272461, "global_step": 197344, "epoch": 1630} {"train_loss": -37.2476921081543, "global_step": 197345, "epoch": 1630} {"train_loss": -39.440731048583984, "global_step": 197346, "epoch": 1630} {"train_loss": -40.33205795288086, "global_step": 197347, "epoch": 1630} {"train_loss": -39.384498596191406, "global_step": 197348, "epoch": 1630} {"train_loss": -40.5968132019043, "global_step": 197349, "epoch": 1630} {"train_loss": -39.23532862702677, "global_step": 197350, "epoch": 1630, "val_loss": 2639336.25} {"train_loss": -39.3741340637207, "global_step": 197351, "epoch": 1631} {"train_loss": -40.08052444458008, "global_step": 197352, "epoch": 1631} {"train_loss": -39.147212982177734, "global_step": 197353, "epoch": 1631} {"train_loss": -40.74689483642578, "global_step": 197354, "epoch": 1631} {"train_loss": -39.278663635253906, "global_step": 197355, "epoch": 1631} {"train_loss": -39.02967834472656, "global_step": 197356, "epoch": 1631} {"train_loss": -40.39778518676758, "global_step": 197357, "epoch": 1631} {"train_loss": -40.48752975463867, "global_step": 197358, "epoch": 1631} {"train_loss": -40.62725830078125, "global_step": 197359, "epoch": 1631} {"train_loss": -40.147735595703125, "global_step": 197360, "epoch": 1631} {"train_loss": -40.35737609863281, "global_step": 197361, "epoch": 1631} {"train_loss": -39.8798713684082, "global_step": 197362, "epoch": 1631} {"train_loss": -40.40371322631836, "global_step": 197363, "epoch": 1631} {"train_loss": -40.724586486816406, "global_step": 197364, "epoch": 1631} {"train_loss": -40.21527862548828, "global_step": 197365, "epoch": 1631} {"train_loss": -40.6177864074707, "global_step": 197366, "epoch": 1631} {"train_loss": -41.195892333984375, "global_step": 197367, "epoch": 1631} {"train_loss": -40.18482208251953, "global_step": 197368, "epoch": 1631} {"train_loss": -39.90189743041992, "global_step": 197369, "epoch": 1631} {"train_loss": -38.60222625732422, "global_step": 197370, "epoch": 1631} {"train_loss": -40.997337341308594, "global_step": 197371, "epoch": 1631} {"train_loss": -37.570640563964844, "global_step": 197372, "epoch": 1631} {"train_loss": -40.25333786010742, "global_step": 197373, "epoch": 1631} {"train_loss": -41.02732467651367, "global_step": 197374, "epoch": 1631} {"train_loss": -39.586570739746094, "global_step": 197375, "epoch": 1631} {"train_loss": -40.83639907836914, "global_step": 197376, "epoch": 1631} {"train_loss": -41.165096282958984, "global_step": 197377, "epoch": 1631} {"train_loss": -40.40195846557617, "global_step": 197378, "epoch": 1631} {"train_loss": -40.98334884643555, "global_step": 197379, "epoch": 1631} {"train_loss": -36.00272750854492, "global_step": 197380, "epoch": 1631} {"train_loss": -40.376033782958984, "global_step": 197381, "epoch": 1631} {"train_loss": -40.409603118896484, "global_step": 197382, "epoch": 1631} {"train_loss": -38.761192321777344, "global_step": 197383, "epoch": 1631} {"train_loss": -39.864646911621094, "global_step": 197384, "epoch": 1631} {"train_loss": -40.36076736450195, "global_step": 197385, "epoch": 1631} {"train_loss": -40.17739486694336, "global_step": 197386, "epoch": 1631} {"train_loss": -40.4594612121582, "global_step": 197387, "epoch": 1631} {"train_loss": -38.81342315673828, "global_step": 197388, "epoch": 1631} {"train_loss": -39.79508972167969, "global_step": 197389, "epoch": 1631} {"train_loss": -39.86190414428711, "global_step": 197390, "epoch": 1631} {"train_loss": -39.142822265625, "global_step": 197391, "epoch": 1631} {"train_loss": -40.76787185668945, "global_step": 197392, "epoch": 1631} {"train_loss": -39.18309783935547, "global_step": 197393, "epoch": 1631} {"train_loss": -41.07206344604492, "global_step": 197394, "epoch": 1631} {"train_loss": -39.8817138671875, "global_step": 197395, "epoch": 1631} {"train_loss": -40.341617584228516, "global_step": 197396, "epoch": 1631} {"train_loss": -39.59939193725586, "global_step": 197397, "epoch": 1631} {"train_loss": -40.22792434692383, "global_step": 197398, "epoch": 1631} {"train_loss": -39.71363067626953, "global_step": 197399, "epoch": 1631} {"train_loss": -39.89057540893555, "global_step": 197400, "epoch": 1631} {"train_loss": -38.83045196533203, "global_step": 197401, "epoch": 1631} {"train_loss": -41.31330871582031, "global_step": 197402, "epoch": 1631} {"train_loss": -40.181549072265625, "global_step": 197403, "epoch": 1631} {"train_loss": -40.2755012512207, "global_step": 197404, "epoch": 1631} {"train_loss": -39.61753463745117, "global_step": 197405, "epoch": 1631} {"train_loss": -40.49402618408203, "global_step": 197406, "epoch": 1631} {"train_loss": -39.676578521728516, "global_step": 197407, "epoch": 1631} {"train_loss": -41.29304885864258, "global_step": 197408, "epoch": 1631} {"train_loss": -40.70911407470703, "global_step": 197409, "epoch": 1631} {"train_loss": -40.46962356567383, "global_step": 197410, "epoch": 1631} {"train_loss": -41.28131866455078, "global_step": 197411, "epoch": 1631} {"train_loss": -40.94386672973633, "global_step": 197412, "epoch": 1631} {"train_loss": -41.67019271850586, "global_step": 197413, "epoch": 1631} {"train_loss": -41.12662887573242, "global_step": 197414, "epoch": 1631} {"train_loss": -40.5357551574707, "global_step": 197415, "epoch": 1631} {"train_loss": -40.924346923828125, "global_step": 197416, "epoch": 1631} {"train_loss": -41.55016326904297, "global_step": 197417, "epoch": 1631} {"train_loss": -40.661678314208984, "global_step": 197418, "epoch": 1631} {"train_loss": -40.79912185668945, "global_step": 197419, "epoch": 1631} {"train_loss": -41.350711822509766, "global_step": 197420, "epoch": 1631} {"train_loss": -40.84821701049805, "global_step": 197421, "epoch": 1631} {"train_loss": -40.75601577758789, "global_step": 197422, "epoch": 1631} {"train_loss": -39.50516891479492, "global_step": 197423, "epoch": 1631} {"train_loss": -41.07573318481445, "global_step": 197424, "epoch": 1631} {"train_loss": -41.20268249511719, "global_step": 197425, "epoch": 1631} {"train_loss": -41.14461898803711, "global_step": 197426, "epoch": 1631} {"train_loss": -40.640628814697266, "global_step": 197427, "epoch": 1631} {"train_loss": -39.679222106933594, "global_step": 197428, "epoch": 1631} {"train_loss": -38.05941390991211, "global_step": 197429, "epoch": 1631} {"train_loss": -39.53837203979492, "global_step": 197430, "epoch": 1631} {"train_loss": -39.328468322753906, "global_step": 197431, "epoch": 1631} {"train_loss": -39.80268096923828, "global_step": 197432, "epoch": 1631} {"train_loss": -40.301570892333984, "global_step": 197433, "epoch": 1631} {"train_loss": -39.046756744384766, "global_step": 197434, "epoch": 1631} {"train_loss": -40.84328079223633, "global_step": 197435, "epoch": 1631} {"train_loss": -40.694190979003906, "global_step": 197436, "epoch": 1631} {"train_loss": -40.87840270996094, "global_step": 197437, "epoch": 1631} {"train_loss": -40.6745719909668, "global_step": 197438, "epoch": 1631} {"train_loss": -41.48040771484375, "global_step": 197439, "epoch": 1631} {"train_loss": -41.35396957397461, "global_step": 197440, "epoch": 1631} {"train_loss": -41.0687141418457, "global_step": 197441, "epoch": 1631} {"train_loss": -40.45212936401367, "global_step": 197442, "epoch": 1631} {"train_loss": -41.43667221069336, "global_step": 197443, "epoch": 1631} {"train_loss": -40.890663146972656, "global_step": 197444, "epoch": 1631} {"train_loss": -40.40809631347656, "global_step": 197445, "epoch": 1631} {"train_loss": -40.42357635498047, "global_step": 197446, "epoch": 1631} {"train_loss": -41.13603591918945, "global_step": 197447, "epoch": 1631} {"train_loss": -40.2076416015625, "global_step": 197448, "epoch": 1631} {"train_loss": -38.7720832824707, "global_step": 197449, "epoch": 1631} {"train_loss": -40.90253448486328, "global_step": 197450, "epoch": 1631} {"train_loss": -40.13785934448242, "global_step": 197451, "epoch": 1631} {"train_loss": -36.21561813354492, "global_step": 197452, "epoch": 1631} {"train_loss": -38.33413314819336, "global_step": 197453, "epoch": 1631} {"train_loss": -40.940677642822266, "global_step": 197454, "epoch": 1631} {"train_loss": -40.5295524597168, "global_step": 197455, "epoch": 1631} {"train_loss": -39.2766227722168, "global_step": 197456, "epoch": 1631} {"train_loss": -40.874732971191406, "global_step": 197457, "epoch": 1631} {"train_loss": -40.49592590332031, "global_step": 197458, "epoch": 1631} {"train_loss": -39.8408203125, "global_step": 197459, "epoch": 1631} {"train_loss": -38.80825424194336, "global_step": 197460, "epoch": 1631} {"train_loss": -37.799442291259766, "global_step": 197461, "epoch": 1631} {"train_loss": -39.612060546875, "global_step": 197462, "epoch": 1631} {"train_loss": -40.99834060668945, "global_step": 197463, "epoch": 1631} {"train_loss": -39.759727478027344, "global_step": 197464, "epoch": 1631} {"train_loss": -40.609134674072266, "global_step": 197465, "epoch": 1631} {"train_loss": -39.71946716308594, "global_step": 197466, "epoch": 1631} {"train_loss": -40.71439743041992, "global_step": 197467, "epoch": 1631} {"train_loss": -40.296688079833984, "global_step": 197468, "epoch": 1631} {"train_loss": -40.152854919433594, "global_step": 197469, "epoch": 1631} {"train_loss": -39.868934631347656, "global_step": 197470, "epoch": 1631} {"train_loss": -40.16552028183109, "global_step": 197471, "epoch": 1631, "val_loss": 2439756.75} {"train_loss": -40.398677825927734, "global_step": 197472, "epoch": 1632} {"train_loss": -41.10264205932617, "global_step": 197473, "epoch": 1632} {"train_loss": -40.79726791381836, "global_step": 197474, "epoch": 1632} {"train_loss": -40.017295837402344, "global_step": 197475, "epoch": 1632} {"train_loss": -40.58021926879883, "global_step": 197476, "epoch": 1632} {"train_loss": -41.22066116333008, "global_step": 197477, "epoch": 1632} {"train_loss": -39.81220245361328, "global_step": 197478, "epoch": 1632} {"train_loss": -40.606101989746094, "global_step": 197479, "epoch": 1632} {"train_loss": -41.41594314575195, "global_step": 197480, "epoch": 1632} {"train_loss": -40.89555740356445, "global_step": 197481, "epoch": 1632} {"train_loss": -40.781593322753906, "global_step": 197482, "epoch": 1632} {"train_loss": -40.479122161865234, "global_step": 197483, "epoch": 1632} {"train_loss": -41.35398483276367, "global_step": 197484, "epoch": 1632} {"train_loss": -39.34015655517578, "global_step": 197485, "epoch": 1632} {"train_loss": -40.627437591552734, "global_step": 197486, "epoch": 1632} {"train_loss": -41.556312561035156, "global_step": 197487, "epoch": 1632} {"train_loss": -40.59162521362305, "global_step": 197488, "epoch": 1632} {"train_loss": -41.01101303100586, "global_step": 197489, "epoch": 1632} {"train_loss": -40.96649169921875, "global_step": 197490, "epoch": 1632} {"train_loss": -41.120697021484375, "global_step": 197491, "epoch": 1632} {"train_loss": -41.73887634277344, "global_step": 197492, "epoch": 1632} {"train_loss": -41.39016342163086, "global_step": 197493, "epoch": 1632} {"train_loss": -41.548744201660156, "global_step": 197494, "epoch": 1632} {"train_loss": -41.78189468383789, "global_step": 197495, "epoch": 1632} {"train_loss": -40.823486328125, "global_step": 197496, "epoch": 1632} {"train_loss": -41.5665397644043, "global_step": 197497, "epoch": 1632} {"train_loss": -42.1837158203125, "global_step": 197498, "epoch": 1632} {"train_loss": -41.10778045654297, "global_step": 197499, "epoch": 1632} {"train_loss": -41.427459716796875, "global_step": 197500, "epoch": 1632} {"train_loss": -41.65085983276367, "global_step": 197501, "epoch": 1632} {"train_loss": -41.677978515625, "global_step": 197502, "epoch": 1632} {"train_loss": -40.793060302734375, "global_step": 197503, "epoch": 1632} {"train_loss": -41.36037063598633, "global_step": 197504, "epoch": 1632} {"train_loss": -38.01941680908203, "global_step": 197505, "epoch": 1632} {"train_loss": -38.21579360961914, "global_step": 197506, "epoch": 1632} {"train_loss": -39.380523681640625, "global_step": 197507, "epoch": 1632} {"train_loss": -39.854530334472656, "global_step": 197508, "epoch": 1632} {"train_loss": -41.14916229248047, "global_step": 197509, "epoch": 1632} {"train_loss": -36.402618408203125, "global_step": 197510, "epoch": 1632} {"train_loss": -32.3073844909668, "global_step": 197511, "epoch": 1632} {"train_loss": -38.77915573120117, "global_step": 197512, "epoch": 1632} {"train_loss": -40.345523834228516, "global_step": 197513, "epoch": 1632} {"train_loss": -36.731048583984375, "global_step": 197514, "epoch": 1632} {"train_loss": -40.76524353027344, "global_step": 197515, "epoch": 1632} {"train_loss": -37.70298385620117, "global_step": 197516, "epoch": 1632} {"train_loss": -37.89825439453125, "global_step": 197517, "epoch": 1632} {"train_loss": -41.038238525390625, "global_step": 197518, "epoch": 1632} {"train_loss": -37.804229736328125, "global_step": 197519, "epoch": 1632} {"train_loss": -40.04115676879883, "global_step": 197520, "epoch": 1632} {"train_loss": -39.751792907714844, "global_step": 197521, "epoch": 1632} {"train_loss": -39.84782791137695, "global_step": 197522, "epoch": 1632} {"train_loss": -41.68067169189453, "global_step": 197523, "epoch": 1632} {"train_loss": -38.268157958984375, "global_step": 197524, "epoch": 1632} {"train_loss": -40.55314254760742, "global_step": 197525, "epoch": 1632} {"train_loss": -39.928951263427734, "global_step": 197526, "epoch": 1632} {"train_loss": -40.84774398803711, "global_step": 197527, "epoch": 1632} {"train_loss": -39.85075759887695, "global_step": 197528, "epoch": 1632} {"train_loss": -40.519447326660156, "global_step": 197529, "epoch": 1632} {"train_loss": -40.63250732421875, "global_step": 197530, "epoch": 1632} {"train_loss": -40.69712448120117, "global_step": 197531, "epoch": 1632} {"train_loss": -40.34861373901367, "global_step": 197532, "epoch": 1632} {"train_loss": -41.46824264526367, "global_step": 197533, "epoch": 1632} {"train_loss": -40.27323532104492, "global_step": 197534, "epoch": 1632} {"train_loss": -41.09292221069336, "global_step": 197535, "epoch": 1632} {"train_loss": -40.468017578125, "global_step": 197536, "epoch": 1632} {"train_loss": -40.88114547729492, "global_step": 197537, "epoch": 1632} {"train_loss": -41.024654388427734, "global_step": 197538, "epoch": 1632} {"train_loss": -40.621437072753906, "global_step": 197539, "epoch": 1632} {"train_loss": -40.95323944091797, "global_step": 197540, "epoch": 1632} {"train_loss": -39.77289581298828, "global_step": 197541, "epoch": 1632} {"train_loss": -40.8287467956543, "global_step": 197542, "epoch": 1632} {"train_loss": -41.21750259399414, "global_step": 197543, "epoch": 1632} {"train_loss": -41.85198974609375, "global_step": 197544, "epoch": 1632} {"train_loss": -38.72333908081055, "global_step": 197545, "epoch": 1632} {"train_loss": -41.33529281616211, "global_step": 197546, "epoch": 1632} {"train_loss": -41.02594757080078, "global_step": 197547, "epoch": 1632} {"train_loss": -39.3237190246582, "global_step": 197548, "epoch": 1632} {"train_loss": -41.01345443725586, "global_step": 197549, "epoch": 1632} {"train_loss": -40.0343017578125, "global_step": 197550, "epoch": 1632} {"train_loss": -39.64527130126953, "global_step": 197551, "epoch": 1632} {"train_loss": -40.8626823425293, "global_step": 197552, "epoch": 1632} {"train_loss": -41.23044967651367, "global_step": 197553, "epoch": 1632} {"train_loss": -41.0641975402832, "global_step": 197554, "epoch": 1632} {"train_loss": -41.249664306640625, "global_step": 197555, "epoch": 1632} {"train_loss": -41.39873123168945, "global_step": 197556, "epoch": 1632} {"train_loss": -40.49846267700195, "global_step": 197557, "epoch": 1632} {"train_loss": -41.48920440673828, "global_step": 197558, "epoch": 1632} {"train_loss": -41.99641036987305, "global_step": 197559, "epoch": 1632} {"train_loss": -41.10726547241211, "global_step": 197560, "epoch": 1632} {"train_loss": -41.079627990722656, "global_step": 197561, "epoch": 1632} {"train_loss": -41.57647705078125, "global_step": 197562, "epoch": 1632} {"train_loss": -40.92890167236328, "global_step": 197563, "epoch": 1632} {"train_loss": -40.3942756652832, "global_step": 197564, "epoch": 1632} {"train_loss": -41.38273239135742, "global_step": 197565, "epoch": 1632} {"train_loss": -39.732845306396484, "global_step": 197566, "epoch": 1632} {"train_loss": -40.75503921508789, "global_step": 197567, "epoch": 1632} {"train_loss": -41.77910614013672, "global_step": 197568, "epoch": 1632} {"train_loss": -41.634307861328125, "global_step": 197569, "epoch": 1632} {"train_loss": -42.143211364746094, "global_step": 197570, "epoch": 1632} {"train_loss": -41.41070556640625, "global_step": 197571, "epoch": 1632} {"train_loss": -41.94928741455078, "global_step": 197572, "epoch": 1632} {"train_loss": -41.39533233642578, "global_step": 197573, "epoch": 1632} {"train_loss": -41.97323226928711, "global_step": 197574, "epoch": 1632} {"train_loss": -40.85078430175781, "global_step": 197575, "epoch": 1632} {"train_loss": -41.92415237426758, "global_step": 197576, "epoch": 1632} {"train_loss": -41.668331146240234, "global_step": 197577, "epoch": 1632} {"train_loss": -41.80525588989258, "global_step": 197578, "epoch": 1632} {"train_loss": -41.77756881713867, "global_step": 197579, "epoch": 1632} {"train_loss": -41.852535247802734, "global_step": 197580, "epoch": 1632} {"train_loss": -41.548927307128906, "global_step": 197581, "epoch": 1632} {"train_loss": -41.54591369628906, "global_step": 197582, "epoch": 1632} {"train_loss": -42.00063705444336, "global_step": 197583, "epoch": 1632} {"train_loss": -41.67720413208008, "global_step": 197584, "epoch": 1632} {"train_loss": -41.7170295715332, "global_step": 197585, "epoch": 1632} {"train_loss": -41.57573318481445, "global_step": 197586, "epoch": 1632} {"train_loss": -42.1495246887207, "global_step": 197587, "epoch": 1632} {"train_loss": -41.57345199584961, "global_step": 197588, "epoch": 1632} {"train_loss": -41.863128662109375, "global_step": 197589, "epoch": 1632} {"train_loss": -40.89240646362305, "global_step": 197590, "epoch": 1632} {"train_loss": -41.2156982421875, "global_step": 197591, "epoch": 1632} {"train_loss": -40.68095710060813, "global_step": 197592, "epoch": 1632, "val_loss": 2555451.0} {"train_loss": -41.080108642578125, "global_step": 197593, "epoch": 1633} {"train_loss": -41.84608840942383, "global_step": 197594, "epoch": 1633} {"train_loss": -42.13903045654297, "global_step": 197595, "epoch": 1633} {"train_loss": -42.48211669921875, "global_step": 197596, "epoch": 1633} {"train_loss": -41.9442024230957, "global_step": 197597, "epoch": 1633} {"train_loss": -42.82619094848633, "global_step": 197598, "epoch": 1633} {"train_loss": -41.0406608581543, "global_step": 197599, "epoch": 1633} {"train_loss": -40.56362533569336, "global_step": 197600, "epoch": 1633} {"train_loss": -35.6071891784668, "global_step": 197601, "epoch": 1633} {"train_loss": -31.042509078979492, "global_step": 197602, "epoch": 1633} {"train_loss": -29.0988712310791, "global_step": 197603, "epoch": 1633} {"train_loss": -38.03597640991211, "global_step": 197604, "epoch": 1633} {"train_loss": -40.40865707397461, "global_step": 197605, "epoch": 1633} {"train_loss": -36.647743225097656, "global_step": 197606, "epoch": 1633} {"train_loss": -39.24203109741211, "global_step": 197607, "epoch": 1633} {"train_loss": -39.20280075073242, "global_step": 197608, "epoch": 1633} {"train_loss": -36.92334747314453, "global_step": 197609, "epoch": 1633} {"train_loss": -40.14345932006836, "global_step": 197610, "epoch": 1633} {"train_loss": -39.67268753051758, "global_step": 197611, "epoch": 1633} {"train_loss": -38.39959716796875, "global_step": 197612, "epoch": 1633} {"train_loss": -41.2778434753418, "global_step": 197613, "epoch": 1633} {"train_loss": -38.71725082397461, "global_step": 197614, "epoch": 1633} {"train_loss": -41.370479583740234, "global_step": 197615, "epoch": 1633} {"train_loss": -38.55693435668945, "global_step": 197616, "epoch": 1633} {"train_loss": -41.34109115600586, "global_step": 197617, "epoch": 1633} {"train_loss": -39.31747055053711, "global_step": 197618, "epoch": 1633} {"train_loss": -41.12057113647461, "global_step": 197619, "epoch": 1633} {"train_loss": -39.38728713989258, "global_step": 197620, "epoch": 1633} {"train_loss": -40.8421630859375, "global_step": 197621, "epoch": 1633} {"train_loss": -40.49312210083008, "global_step": 197622, "epoch": 1633} {"train_loss": -40.28987503051758, "global_step": 197623, "epoch": 1633} {"train_loss": -40.73966598510742, "global_step": 197624, "epoch": 1633} {"train_loss": -40.621829986572266, "global_step": 197625, "epoch": 1633} {"train_loss": -40.62873077392578, "global_step": 197626, "epoch": 1633} {"train_loss": -40.192317962646484, "global_step": 197627, "epoch": 1633} {"train_loss": -40.8663444519043, "global_step": 197628, "epoch": 1633} {"train_loss": -40.95526123046875, "global_step": 197629, "epoch": 1633} {"train_loss": -41.076045989990234, "global_step": 197630, "epoch": 1633} {"train_loss": -41.012451171875, "global_step": 197631, "epoch": 1633} {"train_loss": -41.441280364990234, "global_step": 197632, "epoch": 1633} {"train_loss": -40.71555709838867, "global_step": 197633, "epoch": 1633} {"train_loss": -41.0348014831543, "global_step": 197634, "epoch": 1633} {"train_loss": -41.36027908325195, "global_step": 197635, "epoch": 1633} {"train_loss": -41.6292724609375, "global_step": 197636, "epoch": 1633} {"train_loss": -41.6637077331543, "global_step": 197637, "epoch": 1633} {"train_loss": -41.49306106567383, "global_step": 197638, "epoch": 1633} {"train_loss": -41.5483283996582, "global_step": 197639, "epoch": 1633} {"train_loss": -41.679439544677734, "global_step": 197640, "epoch": 1633} {"train_loss": -41.88676071166992, "global_step": 197641, "epoch": 1633} {"train_loss": -41.2979850769043, "global_step": 197642, "epoch": 1633} {"train_loss": -42.15102767944336, "global_step": 197643, "epoch": 1633} {"train_loss": -41.5352897644043, "global_step": 197644, "epoch": 1633} {"train_loss": -41.80097579956055, "global_step": 197645, "epoch": 1633} {"train_loss": -40.98331069946289, "global_step": 197646, "epoch": 1633} {"train_loss": -42.082305908203125, "global_step": 197647, "epoch": 1633} {"train_loss": -41.85486602783203, "global_step": 197648, "epoch": 1633} {"train_loss": -42.29779052734375, "global_step": 197649, "epoch": 1633} {"train_loss": -42.133941650390625, "global_step": 197650, "epoch": 1633} {"train_loss": -42.050785064697266, "global_step": 197651, "epoch": 1633} {"train_loss": -41.87580490112305, "global_step": 197652, "epoch": 1633} {"train_loss": -41.75861740112305, "global_step": 197653, "epoch": 1633} {"train_loss": -42.062965393066406, "global_step": 197654, "epoch": 1633} {"train_loss": -42.034400939941406, "global_step": 197655, "epoch": 1633} {"train_loss": -41.16147232055664, "global_step": 197656, "epoch": 1633} {"train_loss": -42.27811813354492, "global_step": 197657, "epoch": 1633} {"train_loss": -42.11620330810547, "global_step": 197658, "epoch": 1633} {"train_loss": -41.57997512817383, "global_step": 197659, "epoch": 1633} {"train_loss": -41.69758987426758, "global_step": 197660, "epoch": 1633} {"train_loss": -41.92076873779297, "global_step": 197661, "epoch": 1633} {"train_loss": -41.78937911987305, "global_step": 197662, "epoch": 1633} {"train_loss": -41.67757797241211, "global_step": 197663, "epoch": 1633} {"train_loss": -41.9285888671875, "global_step": 197664, "epoch": 1633} {"train_loss": -41.728858947753906, "global_step": 197665, "epoch": 1633} {"train_loss": -40.973018646240234, "global_step": 197666, "epoch": 1633} {"train_loss": -40.72545623779297, "global_step": 197667, "epoch": 1633} {"train_loss": -41.46321105957031, "global_step": 197668, "epoch": 1633} {"train_loss": -41.687679290771484, "global_step": 197669, "epoch": 1633} {"train_loss": -41.62525177001953, "global_step": 197670, "epoch": 1633} {"train_loss": -41.55730438232422, "global_step": 197671, "epoch": 1633} {"train_loss": -41.35044479370117, "global_step": 197672, "epoch": 1633} {"train_loss": -40.73688888549805, "global_step": 197673, "epoch": 1633} {"train_loss": -41.04238510131836, "global_step": 197674, "epoch": 1633} {"train_loss": -42.3466911315918, "global_step": 197675, "epoch": 1633} {"train_loss": -40.505821228027344, "global_step": 197676, "epoch": 1633} {"train_loss": -41.2663688659668, "global_step": 197677, "epoch": 1633} {"train_loss": -40.91477584838867, "global_step": 197678, "epoch": 1633} {"train_loss": -41.420387268066406, "global_step": 197679, "epoch": 1633} {"train_loss": -42.33600997924805, "global_step": 197680, "epoch": 1633} {"train_loss": -40.738853454589844, "global_step": 197681, "epoch": 1633} {"train_loss": -40.72809982299805, "global_step": 197682, "epoch": 1633} {"train_loss": -42.09420394897461, "global_step": 197683, "epoch": 1633} {"train_loss": -39.29030227661133, "global_step": 197684, "epoch": 1633} {"train_loss": -38.82975387573242, "global_step": 197685, "epoch": 1633} {"train_loss": -40.78139114379883, "global_step": 197686, "epoch": 1633} {"train_loss": -41.15427017211914, "global_step": 197687, "epoch": 1633} {"train_loss": -40.24786376953125, "global_step": 197688, "epoch": 1633} {"train_loss": -39.93764877319336, "global_step": 197689, "epoch": 1633} {"train_loss": -41.54637145996094, "global_step": 197690, "epoch": 1633} {"train_loss": -39.456817626953125, "global_step": 197691, "epoch": 1633} {"train_loss": -40.86505889892578, "global_step": 197692, "epoch": 1633} {"train_loss": -40.9980583190918, "global_step": 197693, "epoch": 1633} {"train_loss": -39.65869140625, "global_step": 197694, "epoch": 1633} {"train_loss": -40.18217849731445, "global_step": 197695, "epoch": 1633} {"train_loss": -39.94505310058594, "global_step": 197696, "epoch": 1633} {"train_loss": -39.57306671142578, "global_step": 197697, "epoch": 1633} {"train_loss": -40.87522506713867, "global_step": 197698, "epoch": 1633} {"train_loss": -38.8831787109375, "global_step": 197699, "epoch": 1633} {"train_loss": -39.25022506713867, "global_step": 197700, "epoch": 1633} {"train_loss": -40.5795783996582, "global_step": 197701, "epoch": 1633} {"train_loss": -39.79569625854492, "global_step": 197702, "epoch": 1633} {"train_loss": -40.82789611816406, "global_step": 197703, "epoch": 1633} {"train_loss": -39.40679931640625, "global_step": 197704, "epoch": 1633} {"train_loss": -41.19828414916992, "global_step": 197705, "epoch": 1633} {"train_loss": -40.58320999145508, "global_step": 197706, "epoch": 1633} {"train_loss": -41.230289459228516, "global_step": 197707, "epoch": 1633} {"train_loss": -39.71749496459961, "global_step": 197708, "epoch": 1633} {"train_loss": -40.466957092285156, "global_step": 197709, "epoch": 1633} {"train_loss": -41.257293701171875, "global_step": 197710, "epoch": 1633} {"train_loss": -41.35544967651367, "global_step": 197711, "epoch": 1633} {"train_loss": -41.39374542236328, "global_step": 197712, "epoch": 1633} {"train_loss": -40.644006713362764, "global_step": 197713, "epoch": 1633, "val_loss": 2522066.0} {"train_loss": -40.35396957397461, "global_step": 197714, "epoch": 1634} {"train_loss": -41.83271408081055, "global_step": 197715, "epoch": 1634} {"train_loss": -41.115291595458984, "global_step": 197716, "epoch": 1634} {"train_loss": -39.4033088684082, "global_step": 197717, "epoch": 1634} {"train_loss": -41.277587890625, "global_step": 197718, "epoch": 1634} {"train_loss": -40.93571090698242, "global_step": 197719, "epoch": 1634} {"train_loss": -41.43861770629883, "global_step": 197720, "epoch": 1634} {"train_loss": -40.571895599365234, "global_step": 197721, "epoch": 1634} {"train_loss": -41.82358932495117, "global_step": 197722, "epoch": 1634} {"train_loss": -40.6379508972168, "global_step": 197723, "epoch": 1634} {"train_loss": -41.44169235229492, "global_step": 197724, "epoch": 1634} {"train_loss": -41.34907913208008, "global_step": 197725, "epoch": 1634} {"train_loss": -41.786434173583984, "global_step": 197726, "epoch": 1634} {"train_loss": -41.32753372192383, "global_step": 197727, "epoch": 1634} {"train_loss": -40.63068771362305, "global_step": 197728, "epoch": 1634} {"train_loss": -41.22186279296875, "global_step": 197729, "epoch": 1634} {"train_loss": -41.032440185546875, "global_step": 197730, "epoch": 1634} {"train_loss": -40.663368225097656, "global_step": 197731, "epoch": 1634} {"train_loss": -41.36428451538086, "global_step": 197732, "epoch": 1634} {"train_loss": -41.855743408203125, "global_step": 197733, "epoch": 1634} {"train_loss": -40.607460021972656, "global_step": 197734, "epoch": 1634} {"train_loss": -41.307003021240234, "global_step": 197735, "epoch": 1634} {"train_loss": -39.625038146972656, "global_step": 197736, "epoch": 1634} {"train_loss": -36.80800247192383, "global_step": 197737, "epoch": 1634} {"train_loss": -40.453582763671875, "global_step": 197738, "epoch": 1634} {"train_loss": -41.964447021484375, "global_step": 197739, "epoch": 1634} {"train_loss": -40.1617546081543, "global_step": 197740, "epoch": 1634} {"train_loss": -41.66646194458008, "global_step": 197741, "epoch": 1634} {"train_loss": -35.56584548950195, "global_step": 197742, "epoch": 1634} {"train_loss": -40.15212631225586, "global_step": 197743, "epoch": 1634} {"train_loss": -41.091461181640625, "global_step": 197744, "epoch": 1634} {"train_loss": -40.7156867980957, "global_step": 197745, "epoch": 1634} {"train_loss": -41.144081115722656, "global_step": 197746, "epoch": 1634} {"train_loss": -40.90189743041992, "global_step": 197747, "epoch": 1634} {"train_loss": -39.81498336791992, "global_step": 197748, "epoch": 1634} {"train_loss": -41.35688018798828, "global_step": 197749, "epoch": 1634} {"train_loss": -40.41807174682617, "global_step": 197750, "epoch": 1634} {"train_loss": -41.36021423339844, "global_step": 197751, "epoch": 1634} {"train_loss": -41.95512008666992, "global_step": 197752, "epoch": 1634} {"train_loss": -41.04861068725586, "global_step": 197753, "epoch": 1634} {"train_loss": -41.41798782348633, "global_step": 197754, "epoch": 1634} {"train_loss": -41.8413200378418, "global_step": 197755, "epoch": 1634} {"train_loss": -41.397029876708984, "global_step": 197756, "epoch": 1634} {"train_loss": -40.97848129272461, "global_step": 197757, "epoch": 1634} {"train_loss": -37.478363037109375, "global_step": 197758, "epoch": 1634} {"train_loss": -40.912994384765625, "global_step": 197759, "epoch": 1634} {"train_loss": -34.86850357055664, "global_step": 197760, "epoch": 1634} {"train_loss": -41.7850456237793, "global_step": 197761, "epoch": 1634} {"train_loss": -39.23756790161133, "global_step": 197762, "epoch": 1634} {"train_loss": -39.613746643066406, "global_step": 197763, "epoch": 1634} {"train_loss": -41.63676452636719, "global_step": 197764, "epoch": 1634} {"train_loss": -41.27355194091797, "global_step": 197765, "epoch": 1634} {"train_loss": -40.93239974975586, "global_step": 197766, "epoch": 1634} {"train_loss": -39.953102111816406, "global_step": 197767, "epoch": 1634} {"train_loss": -41.773311614990234, "global_step": 197768, "epoch": 1634} {"train_loss": -41.13920974731445, "global_step": 197769, "epoch": 1634} {"train_loss": -41.400665283203125, "global_step": 197770, "epoch": 1634} {"train_loss": -41.567256927490234, "global_step": 197771, "epoch": 1634} {"train_loss": -40.78993606567383, "global_step": 197772, "epoch": 1634} {"train_loss": -40.85188293457031, "global_step": 197773, "epoch": 1634} {"train_loss": -41.733089447021484, "global_step": 197774, "epoch": 1634} {"train_loss": -38.663169860839844, "global_step": 197775, "epoch": 1634} {"train_loss": -40.914894104003906, "global_step": 197776, "epoch": 1634} {"train_loss": -42.22706985473633, "global_step": 197777, "epoch": 1634} {"train_loss": -40.23914337158203, "global_step": 197778, "epoch": 1634} {"train_loss": -41.043975830078125, "global_step": 197779, "epoch": 1634} {"train_loss": -39.55988693237305, "global_step": 197780, "epoch": 1634} {"train_loss": -41.40803527832031, "global_step": 197781, "epoch": 1634} {"train_loss": -39.93622970581055, "global_step": 197782, "epoch": 1634} {"train_loss": -39.720577239990234, "global_step": 197783, "epoch": 1634} {"train_loss": -39.4200439453125, "global_step": 197784, "epoch": 1634} {"train_loss": -41.54349899291992, "global_step": 197785, "epoch": 1634} {"train_loss": -41.123687744140625, "global_step": 197786, "epoch": 1634} {"train_loss": -34.69873809814453, "global_step": 197787, "epoch": 1634} {"train_loss": -38.403255462646484, "global_step": 197788, "epoch": 1634} {"train_loss": -40.32783126831055, "global_step": 197789, "epoch": 1634} {"train_loss": -41.00337600708008, "global_step": 197790, "epoch": 1634} {"train_loss": -37.65447235107422, "global_step": 197791, "epoch": 1634} {"train_loss": -41.52541732788086, "global_step": 197792, "epoch": 1634} {"train_loss": -41.27500915527344, "global_step": 197793, "epoch": 1634} {"train_loss": -41.64067459106445, "global_step": 197794, "epoch": 1634} {"train_loss": -41.25131607055664, "global_step": 197795, "epoch": 1634} {"train_loss": -41.222537994384766, "global_step": 197796, "epoch": 1634} {"train_loss": -41.440650939941406, "global_step": 197797, "epoch": 1634} {"train_loss": -38.14119338989258, "global_step": 197798, "epoch": 1634} {"train_loss": -39.4954948425293, "global_step": 197799, "epoch": 1634} {"train_loss": -37.06489181518555, "global_step": 197800, "epoch": 1634} {"train_loss": -40.7763671875, "global_step": 197801, "epoch": 1634} {"train_loss": -42.06787872314453, "global_step": 197802, "epoch": 1634} {"train_loss": -39.79591369628906, "global_step": 197803, "epoch": 1634} {"train_loss": -40.480220794677734, "global_step": 197804, "epoch": 1634} {"train_loss": -41.0954475402832, "global_step": 197805, "epoch": 1634} {"train_loss": -40.701820373535156, "global_step": 197806, "epoch": 1634} {"train_loss": -40.26801300048828, "global_step": 197807, "epoch": 1634} {"train_loss": -41.373382568359375, "global_step": 197808, "epoch": 1634} {"train_loss": -40.27889633178711, "global_step": 197809, "epoch": 1634} {"train_loss": -41.06988525390625, "global_step": 197810, "epoch": 1634} {"train_loss": -41.03666305541992, "global_step": 197811, "epoch": 1634} {"train_loss": -40.58797073364258, "global_step": 197812, "epoch": 1634} {"train_loss": -40.613155364990234, "global_step": 197813, "epoch": 1634} {"train_loss": -40.62919235229492, "global_step": 197814, "epoch": 1634} {"train_loss": -40.37482452392578, "global_step": 197815, "epoch": 1634} {"train_loss": -40.082271575927734, "global_step": 197816, "epoch": 1634} {"train_loss": -40.922576904296875, "global_step": 197817, "epoch": 1634} {"train_loss": -39.81968307495117, "global_step": 197818, "epoch": 1634} {"train_loss": -40.626583099365234, "global_step": 197819, "epoch": 1634} {"train_loss": -40.731807708740234, "global_step": 197820, "epoch": 1634} {"train_loss": -40.32294845581055, "global_step": 197821, "epoch": 1634} {"train_loss": -41.15279006958008, "global_step": 197822, "epoch": 1634} {"train_loss": -40.44540023803711, "global_step": 197823, "epoch": 1634} {"train_loss": -40.12313461303711, "global_step": 197824, "epoch": 1634} {"train_loss": -40.50909423828125, "global_step": 197825, "epoch": 1634} {"train_loss": -41.68518829345703, "global_step": 197826, "epoch": 1634} {"train_loss": -39.99420166015625, "global_step": 197827, "epoch": 1634} {"train_loss": -40.79584884643555, "global_step": 197828, "epoch": 1634} {"train_loss": -41.479793548583984, "global_step": 197829, "epoch": 1634} {"train_loss": -40.965789794921875, "global_step": 197830, "epoch": 1634} {"train_loss": -40.92669677734375, "global_step": 197831, "epoch": 1634} {"train_loss": -41.8046875, "global_step": 197832, "epoch": 1634} {"train_loss": -40.86477279663086, "global_step": 197833, "epoch": 1634} {"train_loss": -40.57504048623329, "global_step": 197834, "epoch": 1634, "val_loss": 2516400.75} {"train_loss": -38.348388671875, "global_step": 197835, "epoch": 1635} {"train_loss": -41.06928634643555, "global_step": 197836, "epoch": 1635} {"train_loss": -41.057411193847656, "global_step": 197837, "epoch": 1635} {"train_loss": -41.233489990234375, "global_step": 197838, "epoch": 1635} {"train_loss": -39.82551193237305, "global_step": 197839, "epoch": 1635} {"train_loss": -41.874019622802734, "global_step": 197840, "epoch": 1635} {"train_loss": -38.896785736083984, "global_step": 197841, "epoch": 1635} {"train_loss": -39.596195220947266, "global_step": 197842, "epoch": 1635} {"train_loss": -40.641334533691406, "global_step": 197843, "epoch": 1635} {"train_loss": -40.16571044921875, "global_step": 197844, "epoch": 1635} {"train_loss": -41.15155792236328, "global_step": 197845, "epoch": 1635} {"train_loss": -40.38764572143555, "global_step": 197846, "epoch": 1635} {"train_loss": -40.32115173339844, "global_step": 197847, "epoch": 1635} {"train_loss": -41.389095306396484, "global_step": 197848, "epoch": 1635} {"train_loss": -40.089332580566406, "global_step": 197849, "epoch": 1635} {"train_loss": -40.73106002807617, "global_step": 197850, "epoch": 1635} {"train_loss": -39.303321838378906, "global_step": 197851, "epoch": 1635} {"train_loss": -40.849395751953125, "global_step": 197852, "epoch": 1635} {"train_loss": -39.65230941772461, "global_step": 197853, "epoch": 1635} {"train_loss": -39.62097930908203, "global_step": 197854, "epoch": 1635} {"train_loss": -39.70875930786133, "global_step": 197855, "epoch": 1635} {"train_loss": -38.28132247924805, "global_step": 197856, "epoch": 1635} {"train_loss": -41.293701171875, "global_step": 197857, "epoch": 1635} {"train_loss": -41.388790130615234, "global_step": 197858, "epoch": 1635} {"train_loss": -40.75259780883789, "global_step": 197859, "epoch": 1635} {"train_loss": -39.13067626953125, "global_step": 197860, "epoch": 1635} {"train_loss": -39.42702102661133, "global_step": 197861, "epoch": 1635} {"train_loss": -40.5396614074707, "global_step": 197862, "epoch": 1635} {"train_loss": -40.6961784362793, "global_step": 197863, "epoch": 1635} {"train_loss": -41.987510681152344, "global_step": 197864, "epoch": 1635} {"train_loss": -41.031471252441406, "global_step": 197865, "epoch": 1635} {"train_loss": -41.88886260986328, "global_step": 197866, "epoch": 1635} {"train_loss": -40.7696533203125, "global_step": 197867, "epoch": 1635} {"train_loss": -41.75302505493164, "global_step": 197868, "epoch": 1635} {"train_loss": -40.83152770996094, "global_step": 197869, "epoch": 1635} {"train_loss": -41.733280181884766, "global_step": 197870, "epoch": 1635} {"train_loss": -41.416175842285156, "global_step": 197871, "epoch": 1635} {"train_loss": -40.861839294433594, "global_step": 197872, "epoch": 1635} {"train_loss": -41.37064743041992, "global_step": 197873, "epoch": 1635} {"train_loss": -41.80257034301758, "global_step": 197874, "epoch": 1635} {"train_loss": -41.335201263427734, "global_step": 197875, "epoch": 1635} {"train_loss": -41.27975082397461, "global_step": 197876, "epoch": 1635} {"train_loss": -41.54549789428711, "global_step": 197877, "epoch": 1635} {"train_loss": -41.0361442565918, "global_step": 197878, "epoch": 1635} {"train_loss": -37.755836486816406, "global_step": 197879, "epoch": 1635} {"train_loss": -41.27177047729492, "global_step": 197880, "epoch": 1635} {"train_loss": -40.16270065307617, "global_step": 197881, "epoch": 1635} {"train_loss": -41.354942321777344, "global_step": 197882, "epoch": 1635} {"train_loss": -40.70020294189453, "global_step": 197883, "epoch": 1635} {"train_loss": -39.56391525268555, "global_step": 197884, "epoch": 1635} {"train_loss": -41.41106033325195, "global_step": 197885, "epoch": 1635} {"train_loss": -40.47694396972656, "global_step": 197886, "epoch": 1635} {"train_loss": -41.23297882080078, "global_step": 197887, "epoch": 1635} {"train_loss": -40.2387809753418, "global_step": 197888, "epoch": 1635} {"train_loss": -41.00851058959961, "global_step": 197889, "epoch": 1635} {"train_loss": -40.353511810302734, "global_step": 197890, "epoch": 1635} {"train_loss": -41.685359954833984, "global_step": 197891, "epoch": 1635} {"train_loss": -40.66964340209961, "global_step": 197892, "epoch": 1635} {"train_loss": -39.2564697265625, "global_step": 197893, "epoch": 1635} {"train_loss": -40.547176361083984, "global_step": 197894, "epoch": 1635} {"train_loss": -41.31396484375, "global_step": 197895, "epoch": 1635} {"train_loss": -39.484901428222656, "global_step": 197896, "epoch": 1635} {"train_loss": -41.843299865722656, "global_step": 197897, "epoch": 1635} {"train_loss": -40.94438171386719, "global_step": 197898, "epoch": 1635} {"train_loss": -40.581825256347656, "global_step": 197899, "epoch": 1635} {"train_loss": -38.328731536865234, "global_step": 197900, "epoch": 1635} {"train_loss": -41.11488723754883, "global_step": 197901, "epoch": 1635} {"train_loss": -38.96030807495117, "global_step": 197902, "epoch": 1635} {"train_loss": -40.02939987182617, "global_step": 197903, "epoch": 1635} {"train_loss": -40.054595947265625, "global_step": 197904, "epoch": 1635} {"train_loss": -40.986572265625, "global_step": 197905, "epoch": 1635} {"train_loss": -37.77788543701172, "global_step": 197906, "epoch": 1635} {"train_loss": -40.8692741394043, "global_step": 197907, "epoch": 1635} {"train_loss": -41.400291442871094, "global_step": 197908, "epoch": 1635} {"train_loss": -41.88277816772461, "global_step": 197909, "epoch": 1635} {"train_loss": -39.95368576049805, "global_step": 197910, "epoch": 1635} {"train_loss": -40.907318115234375, "global_step": 197911, "epoch": 1635} {"train_loss": -40.214866638183594, "global_step": 197912, "epoch": 1635} {"train_loss": -42.18931198120117, "global_step": 197913, "epoch": 1635} {"train_loss": -39.07318115234375, "global_step": 197914, "epoch": 1635} {"train_loss": -34.9520378112793, "global_step": 197915, "epoch": 1635} {"train_loss": -37.669490814208984, "global_step": 197916, "epoch": 1635} {"train_loss": -38.22126388549805, "global_step": 197917, "epoch": 1635} {"train_loss": -38.85622024536133, "global_step": 197918, "epoch": 1635} {"train_loss": -39.544830322265625, "global_step": 197919, "epoch": 1635} {"train_loss": -40.456336975097656, "global_step": 197920, "epoch": 1635} {"train_loss": -39.667293548583984, "global_step": 197921, "epoch": 1635} {"train_loss": -39.79859161376953, "global_step": 197922, "epoch": 1635} {"train_loss": -40.20555114746094, "global_step": 197923, "epoch": 1635} {"train_loss": -37.94424057006836, "global_step": 197924, "epoch": 1635} {"train_loss": -39.697479248046875, "global_step": 197925, "epoch": 1635} {"train_loss": -38.529815673828125, "global_step": 197926, "epoch": 1635} {"train_loss": -41.35541915893555, "global_step": 197927, "epoch": 1635} {"train_loss": -40.3283576965332, "global_step": 197928, "epoch": 1635} {"train_loss": -39.40729904174805, "global_step": 197929, "epoch": 1635} {"train_loss": -38.430686950683594, "global_step": 197930, "epoch": 1635} {"train_loss": -39.7789306640625, "global_step": 197931, "epoch": 1635} {"train_loss": -40.07500457763672, "global_step": 197932, "epoch": 1635} {"train_loss": -41.359230041503906, "global_step": 197933, "epoch": 1635} {"train_loss": -37.9527587890625, "global_step": 197934, "epoch": 1635} {"train_loss": -40.38252639770508, "global_step": 197935, "epoch": 1635} {"train_loss": -39.42420196533203, "global_step": 197936, "epoch": 1635} {"train_loss": -41.036495208740234, "global_step": 197937, "epoch": 1635} {"train_loss": -39.21154022216797, "global_step": 197938, "epoch": 1635} {"train_loss": -39.5302619934082, "global_step": 197939, "epoch": 1635} {"train_loss": -40.27972412109375, "global_step": 197940, "epoch": 1635} {"train_loss": -38.98369216918945, "global_step": 197941, "epoch": 1635} {"train_loss": -41.132911682128906, "global_step": 197942, "epoch": 1635} {"train_loss": -40.090484619140625, "global_step": 197943, "epoch": 1635} {"train_loss": -39.828163146972656, "global_step": 197944, "epoch": 1635} {"train_loss": -39.157569885253906, "global_step": 197945, "epoch": 1635} {"train_loss": -39.88355255126953, "global_step": 197946, "epoch": 1635} {"train_loss": -41.06142044067383, "global_step": 197947, "epoch": 1635} {"train_loss": -38.17891311645508, "global_step": 197948, "epoch": 1635} {"train_loss": -40.78428649902344, "global_step": 197949, "epoch": 1635} {"train_loss": -38.94070053100586, "global_step": 197950, "epoch": 1635} {"train_loss": -39.76247787475586, "global_step": 197951, "epoch": 1635} {"train_loss": -40.02370071411133, "global_step": 197952, "epoch": 1635} {"train_loss": -40.36648178100586, "global_step": 197953, "epoch": 1635} {"train_loss": -37.14318084716797, "global_step": 197954, "epoch": 1635} {"train_loss": -40.16217378348358, "global_step": 197955, "epoch": 1635, "val_loss": 2538246.0} {"train_loss": -39.800872802734375, "global_step": 197956, "epoch": 1636} {"train_loss": -39.462646484375, "global_step": 197957, "epoch": 1636} {"train_loss": -41.08140182495117, "global_step": 197958, "epoch": 1636} {"train_loss": -40.06911087036133, "global_step": 197959, "epoch": 1636} {"train_loss": -40.47640609741211, "global_step": 197960, "epoch": 1636} {"train_loss": -40.65725326538086, "global_step": 197961, "epoch": 1636} {"train_loss": -38.649330139160156, "global_step": 197962, "epoch": 1636} {"train_loss": -38.635772705078125, "global_step": 197963, "epoch": 1636} {"train_loss": -39.323333740234375, "global_step": 197964, "epoch": 1636} {"train_loss": -40.451778411865234, "global_step": 197965, "epoch": 1636} {"train_loss": -36.840396881103516, "global_step": 197966, "epoch": 1636} {"train_loss": -37.55720138549805, "global_step": 197967, "epoch": 1636} {"train_loss": -40.355499267578125, "global_step": 197968, "epoch": 1636} {"train_loss": -40.84635925292969, "global_step": 197969, "epoch": 1636} {"train_loss": -38.34423065185547, "global_step": 197970, "epoch": 1636} {"train_loss": -39.052215576171875, "global_step": 197971, "epoch": 1636} {"train_loss": -40.97288131713867, "global_step": 197972, "epoch": 1636} {"train_loss": -38.23984909057617, "global_step": 197973, "epoch": 1636} {"train_loss": -40.00590896606445, "global_step": 197974, "epoch": 1636} {"train_loss": -40.469661712646484, "global_step": 197975, "epoch": 1636} {"train_loss": -39.85324478149414, "global_step": 197976, "epoch": 1636} {"train_loss": -40.26556396484375, "global_step": 197977, "epoch": 1636} {"train_loss": -38.69901657104492, "global_step": 197978, "epoch": 1636} {"train_loss": -40.66401290893555, "global_step": 197979, "epoch": 1636} {"train_loss": -40.85541915893555, "global_step": 197980, "epoch": 1636} {"train_loss": -36.01911544799805, "global_step": 197981, "epoch": 1636} {"train_loss": -35.67580795288086, "global_step": 197982, "epoch": 1636} {"train_loss": -39.58390426635742, "global_step": 197983, "epoch": 1636} {"train_loss": -41.038665771484375, "global_step": 197984, "epoch": 1636} {"train_loss": -40.932735443115234, "global_step": 197985, "epoch": 1636} {"train_loss": -39.51346206665039, "global_step": 197986, "epoch": 1636} {"train_loss": -39.01133728027344, "global_step": 197987, "epoch": 1636} {"train_loss": -38.48249053955078, "global_step": 197988, "epoch": 1636} {"train_loss": -40.54670333862305, "global_step": 197989, "epoch": 1636} {"train_loss": -40.1434326171875, "global_step": 197990, "epoch": 1636} {"train_loss": -39.543701171875, "global_step": 197991, "epoch": 1636} {"train_loss": -39.152896881103516, "global_step": 197992, "epoch": 1636} {"train_loss": -40.25203323364258, "global_step": 197993, "epoch": 1636} {"train_loss": -38.61238098144531, "global_step": 197994, "epoch": 1636} {"train_loss": -39.53216552734375, "global_step": 197995, "epoch": 1636} {"train_loss": -40.754268646240234, "global_step": 197996, "epoch": 1636} {"train_loss": -41.208011627197266, "global_step": 197997, "epoch": 1636} {"train_loss": -41.16059494018555, "global_step": 197998, "epoch": 1636} {"train_loss": -40.767112731933594, "global_step": 197999, "epoch": 1636} {"train_loss": -40.616573333740234, "global_step": 198000, "epoch": 1636} {"train_loss": -39.470516204833984, "global_step": 198001, "epoch": 1636} {"train_loss": -40.47147750854492, "global_step": 198002, "epoch": 1636} {"train_loss": -40.67042541503906, "global_step": 198003, "epoch": 1636} {"train_loss": -40.55569076538086, "global_step": 198004, "epoch": 1636} {"train_loss": -39.977264404296875, "global_step": 198005, "epoch": 1636} {"train_loss": -40.92137908935547, "global_step": 198006, "epoch": 1636} {"train_loss": -40.76115036010742, "global_step": 198007, "epoch": 1636} {"train_loss": -38.41474533081055, "global_step": 198008, "epoch": 1636} {"train_loss": -41.39078903198242, "global_step": 198009, "epoch": 1636} {"train_loss": -39.7951545715332, "global_step": 198010, "epoch": 1636} {"train_loss": -39.88627243041992, "global_step": 198011, "epoch": 1636} {"train_loss": -41.208534240722656, "global_step": 198012, "epoch": 1636} {"train_loss": -39.45913314819336, "global_step": 198013, "epoch": 1636} {"train_loss": -41.29774475097656, "global_step": 198014, "epoch": 1636} {"train_loss": -41.13151168823242, "global_step": 198015, "epoch": 1636} {"train_loss": -41.08902359008789, "global_step": 198016, "epoch": 1636} {"train_loss": -40.90143585205078, "global_step": 198017, "epoch": 1636} {"train_loss": -40.367977142333984, "global_step": 198018, "epoch": 1636} {"train_loss": -39.82994842529297, "global_step": 198019, "epoch": 1636} {"train_loss": -40.407501220703125, "global_step": 198020, "epoch": 1636} {"train_loss": -39.617122650146484, "global_step": 198021, "epoch": 1636} {"train_loss": -40.264617919921875, "global_step": 198022, "epoch": 1636} {"train_loss": -41.3233757019043, "global_step": 198023, "epoch": 1636} {"train_loss": -41.07708740234375, "global_step": 198024, "epoch": 1636} {"train_loss": -41.24689865112305, "global_step": 198025, "epoch": 1636} {"train_loss": -39.0488166809082, "global_step": 198026, "epoch": 1636} {"train_loss": -40.80427169799805, "global_step": 198027, "epoch": 1636} {"train_loss": -40.81385040283203, "global_step": 198028, "epoch": 1636} {"train_loss": -40.18077850341797, "global_step": 198029, "epoch": 1636} {"train_loss": -41.419132232666016, "global_step": 198030, "epoch": 1636} {"train_loss": -39.96100616455078, "global_step": 198031, "epoch": 1636} {"train_loss": -40.54414749145508, "global_step": 198032, "epoch": 1636} {"train_loss": -41.04977035522461, "global_step": 198033, "epoch": 1636} {"train_loss": -40.84562301635742, "global_step": 198034, "epoch": 1636} {"train_loss": -41.4614143371582, "global_step": 198035, "epoch": 1636} {"train_loss": -40.379695892333984, "global_step": 198036, "epoch": 1636} {"train_loss": -39.98678207397461, "global_step": 198037, "epoch": 1636} {"train_loss": -39.71197509765625, "global_step": 198038, "epoch": 1636} {"train_loss": -39.458274841308594, "global_step": 198039, "epoch": 1636} {"train_loss": -38.79334259033203, "global_step": 198040, "epoch": 1636} {"train_loss": -40.51007843017578, "global_step": 198041, "epoch": 1636} {"train_loss": -40.0042610168457, "global_step": 198042, "epoch": 1636} {"train_loss": -40.28036117553711, "global_step": 198043, "epoch": 1636} {"train_loss": -38.94771957397461, "global_step": 198044, "epoch": 1636} {"train_loss": -40.17030334472656, "global_step": 198045, "epoch": 1636} {"train_loss": -39.25708770751953, "global_step": 198046, "epoch": 1636} {"train_loss": -40.6160888671875, "global_step": 198047, "epoch": 1636} {"train_loss": -38.87858200073242, "global_step": 198048, "epoch": 1636} {"train_loss": -39.32899475097656, "global_step": 198049, "epoch": 1636} {"train_loss": -39.08042526245117, "global_step": 198050, "epoch": 1636} {"train_loss": -40.41069030761719, "global_step": 198051, "epoch": 1636} {"train_loss": -40.55268096923828, "global_step": 198052, "epoch": 1636} {"train_loss": -39.75803756713867, "global_step": 198053, "epoch": 1636} {"train_loss": -39.431671142578125, "global_step": 198054, "epoch": 1636} {"train_loss": -39.566688537597656, "global_step": 198055, "epoch": 1636} {"train_loss": -39.369022369384766, "global_step": 198056, "epoch": 1636} {"train_loss": -40.6279182434082, "global_step": 198057, "epoch": 1636} {"train_loss": -40.9332389831543, "global_step": 198058, "epoch": 1636} {"train_loss": -41.1050910949707, "global_step": 198059, "epoch": 1636} {"train_loss": -40.5164794921875, "global_step": 198060, "epoch": 1636} {"train_loss": -41.10622787475586, "global_step": 198061, "epoch": 1636} {"train_loss": -41.000545501708984, "global_step": 198062, "epoch": 1636} {"train_loss": -40.902931213378906, "global_step": 198063, "epoch": 1636} {"train_loss": -40.674747467041016, "global_step": 198064, "epoch": 1636} {"train_loss": -41.45643997192383, "global_step": 198065, "epoch": 1636} {"train_loss": -40.864376068115234, "global_step": 198066, "epoch": 1636} {"train_loss": -40.59282302856445, "global_step": 198067, "epoch": 1636} {"train_loss": -41.2799072265625, "global_step": 198068, "epoch": 1636} {"train_loss": -40.92552947998047, "global_step": 198069, "epoch": 1636} {"train_loss": -41.33391189575195, "global_step": 198070, "epoch": 1636} {"train_loss": -41.48641586303711, "global_step": 198071, "epoch": 1636} {"train_loss": -41.35465621948242, "global_step": 198072, "epoch": 1636} {"train_loss": -41.21458435058594, "global_step": 198073, "epoch": 1636} {"train_loss": -40.82966995239258, "global_step": 198074, "epoch": 1636} {"train_loss": -41.35283279418945, "global_step": 198075, "epoch": 1636} {"train_loss": -40.118871420868174, "global_step": 198076, "epoch": 1636, "val_loss": 2545753.75} {"train_loss": -41.3944206237793, "global_step": 198077, "epoch": 1637} {"train_loss": -41.33819580078125, "global_step": 198078, "epoch": 1637} {"train_loss": -41.11833953857422, "global_step": 198079, "epoch": 1637} {"train_loss": -41.258567810058594, "global_step": 198080, "epoch": 1637} {"train_loss": -41.02113342285156, "global_step": 198081, "epoch": 1637} {"train_loss": -41.211181640625, "global_step": 198082, "epoch": 1637} {"train_loss": -39.1877555847168, "global_step": 198083, "epoch": 1637} {"train_loss": -41.6447639465332, "global_step": 198084, "epoch": 1637} {"train_loss": -40.9610595703125, "global_step": 198085, "epoch": 1637} {"train_loss": -40.47568893432617, "global_step": 198086, "epoch": 1637} {"train_loss": -39.806392669677734, "global_step": 198087, "epoch": 1637} {"train_loss": -41.154457092285156, "global_step": 198088, "epoch": 1637} {"train_loss": -41.0300407409668, "global_step": 198089, "epoch": 1637} {"train_loss": -41.6424674987793, "global_step": 198090, "epoch": 1637} {"train_loss": -41.60218811035156, "global_step": 198091, "epoch": 1637} {"train_loss": -40.391815185546875, "global_step": 198092, "epoch": 1637} {"train_loss": -41.48107147216797, "global_step": 198093, "epoch": 1637} {"train_loss": -41.2218017578125, "global_step": 198094, "epoch": 1637} {"train_loss": -41.46794509887695, "global_step": 198095, "epoch": 1637} {"train_loss": -40.494537353515625, "global_step": 198096, "epoch": 1637} {"train_loss": -41.36238098144531, "global_step": 198097, "epoch": 1637} {"train_loss": -41.86845016479492, "global_step": 198098, "epoch": 1637} {"train_loss": -41.891075134277344, "global_step": 198099, "epoch": 1637} {"train_loss": -40.64030838012695, "global_step": 198100, "epoch": 1637} {"train_loss": -41.5899543762207, "global_step": 198101, "epoch": 1637} {"train_loss": -42.01747131347656, "global_step": 198102, "epoch": 1637} {"train_loss": -40.904598236083984, "global_step": 198103, "epoch": 1637} {"train_loss": -42.1306037902832, "global_step": 198104, "epoch": 1637} {"train_loss": -41.22689437866211, "global_step": 198105, "epoch": 1637} {"train_loss": -40.01637649536133, "global_step": 198106, "epoch": 1637} {"train_loss": -38.93928527832031, "global_step": 198107, "epoch": 1637} {"train_loss": -38.96135330200195, "global_step": 198108, "epoch": 1637} {"train_loss": -37.64741897583008, "global_step": 198109, "epoch": 1637} {"train_loss": -38.0763053894043, "global_step": 198110, "epoch": 1637} {"train_loss": -40.2580451965332, "global_step": 198111, "epoch": 1637} {"train_loss": -40.10888671875, "global_step": 198112, "epoch": 1637} {"train_loss": -39.494197845458984, "global_step": 198113, "epoch": 1637} {"train_loss": -37.933921813964844, "global_step": 198114, "epoch": 1637} {"train_loss": -39.232154846191406, "global_step": 198115, "epoch": 1637} {"train_loss": -39.992855072021484, "global_step": 198116, "epoch": 1637} {"train_loss": -40.15141677856445, "global_step": 198117, "epoch": 1637} {"train_loss": -38.938411712646484, "global_step": 198118, "epoch": 1637} {"train_loss": -39.453243255615234, "global_step": 198119, "epoch": 1637} {"train_loss": -40.730926513671875, "global_step": 198120, "epoch": 1637} {"train_loss": -39.779022216796875, "global_step": 198121, "epoch": 1637} {"train_loss": -41.003509521484375, "global_step": 198122, "epoch": 1637} {"train_loss": -40.2232780456543, "global_step": 198123, "epoch": 1637} {"train_loss": -39.15532302856445, "global_step": 198124, "epoch": 1637} {"train_loss": -39.42112350463867, "global_step": 198125, "epoch": 1637} {"train_loss": -40.28544998168945, "global_step": 198126, "epoch": 1637} {"train_loss": -39.78965377807617, "global_step": 198127, "epoch": 1637} {"train_loss": -40.599708557128906, "global_step": 198128, "epoch": 1637} {"train_loss": -39.31013870239258, "global_step": 198129, "epoch": 1637} {"train_loss": -40.36935043334961, "global_step": 198130, "epoch": 1637} {"train_loss": -40.61787796020508, "global_step": 198131, "epoch": 1637} {"train_loss": -38.78851318359375, "global_step": 198132, "epoch": 1637} {"train_loss": -39.8701057434082, "global_step": 198133, "epoch": 1637} {"train_loss": -40.076900482177734, "global_step": 198134, "epoch": 1637} {"train_loss": -40.388092041015625, "global_step": 198135, "epoch": 1637} {"train_loss": -39.7319450378418, "global_step": 198136, "epoch": 1637} {"train_loss": -39.430824279785156, "global_step": 198137, "epoch": 1637} {"train_loss": -39.58639144897461, "global_step": 198138, "epoch": 1637} {"train_loss": -38.443206787109375, "global_step": 198139, "epoch": 1637} {"train_loss": -38.718074798583984, "global_step": 198140, "epoch": 1637} {"train_loss": -40.5746955871582, "global_step": 198141, "epoch": 1637} {"train_loss": -40.804786682128906, "global_step": 198142, "epoch": 1637} {"train_loss": -39.94928741455078, "global_step": 198143, "epoch": 1637} {"train_loss": -39.92485809326172, "global_step": 198144, "epoch": 1637} {"train_loss": -40.47513961791992, "global_step": 198145, "epoch": 1637} {"train_loss": -41.24047088623047, "global_step": 198146, "epoch": 1637} {"train_loss": -41.17631530761719, "global_step": 198147, "epoch": 1637} {"train_loss": -40.6530647277832, "global_step": 198148, "epoch": 1637} {"train_loss": -41.20581817626953, "global_step": 198149, "epoch": 1637} {"train_loss": -41.306270599365234, "global_step": 198150, "epoch": 1637} {"train_loss": -41.078975677490234, "global_step": 198151, "epoch": 1637} {"train_loss": -41.31545639038086, "global_step": 198152, "epoch": 1637} {"train_loss": -40.73455047607422, "global_step": 198153, "epoch": 1637} {"train_loss": -40.52004623413086, "global_step": 198154, "epoch": 1637} {"train_loss": -41.255306243896484, "global_step": 198155, "epoch": 1637} {"train_loss": -41.780677795410156, "global_step": 198156, "epoch": 1637} {"train_loss": -41.03806686401367, "global_step": 198157, "epoch": 1637} {"train_loss": -41.47688674926758, "global_step": 198158, "epoch": 1637} {"train_loss": -40.344520568847656, "global_step": 198159, "epoch": 1637} {"train_loss": -41.2617301940918, "global_step": 198160, "epoch": 1637} {"train_loss": -41.28693771362305, "global_step": 198161, "epoch": 1637} {"train_loss": -41.08930587768555, "global_step": 198162, "epoch": 1637} {"train_loss": -41.116851806640625, "global_step": 198163, "epoch": 1637} {"train_loss": -41.01960372924805, "global_step": 198164, "epoch": 1637} {"train_loss": -41.77964782714844, "global_step": 198165, "epoch": 1637} {"train_loss": -40.73617172241211, "global_step": 198166, "epoch": 1637} {"train_loss": -41.18054962158203, "global_step": 198167, "epoch": 1637} {"train_loss": -41.00815200805664, "global_step": 198168, "epoch": 1637} {"train_loss": -41.47028350830078, "global_step": 198169, "epoch": 1637} {"train_loss": -41.311256408691406, "global_step": 198170, "epoch": 1637} {"train_loss": -41.743221282958984, "global_step": 198171, "epoch": 1637} {"train_loss": -41.23651885986328, "global_step": 198172, "epoch": 1637} {"train_loss": -42.049983978271484, "global_step": 198173, "epoch": 1637} {"train_loss": -40.39630889892578, "global_step": 198174, "epoch": 1637} {"train_loss": -41.56767272949219, "global_step": 198175, "epoch": 1637} {"train_loss": -41.47797393798828, "global_step": 198176, "epoch": 1637} {"train_loss": -40.09242248535156, "global_step": 198177, "epoch": 1637} {"train_loss": -40.99151611328125, "global_step": 198178, "epoch": 1637} {"train_loss": -41.10579299926758, "global_step": 198179, "epoch": 1637} {"train_loss": -41.38163375854492, "global_step": 198180, "epoch": 1637} {"train_loss": -41.282230377197266, "global_step": 198181, "epoch": 1637} {"train_loss": -41.29243850708008, "global_step": 198182, "epoch": 1637} {"train_loss": -41.554046630859375, "global_step": 198183, "epoch": 1637} {"train_loss": -41.14540481567383, "global_step": 198184, "epoch": 1637} {"train_loss": -41.63938522338867, "global_step": 198185, "epoch": 1637} {"train_loss": -40.69486999511719, "global_step": 198186, "epoch": 1637} {"train_loss": -41.37466812133789, "global_step": 198187, "epoch": 1637} {"train_loss": -41.42283248901367, "global_step": 198188, "epoch": 1637} {"train_loss": -39.42238998413086, "global_step": 198189, "epoch": 1637} {"train_loss": -36.342750549316406, "global_step": 198190, "epoch": 1637} {"train_loss": -37.39387130737305, "global_step": 198191, "epoch": 1637} {"train_loss": -39.98460006713867, "global_step": 198192, "epoch": 1637} {"train_loss": -40.779842376708984, "global_step": 198193, "epoch": 1637} {"train_loss": -41.62276077270508, "global_step": 198194, "epoch": 1637} {"train_loss": -40.40156173706055, "global_step": 198195, "epoch": 1637} {"train_loss": -41.24854278564453, "global_step": 198196, "epoch": 1637} {"train_loss": -40.57731306848447, "global_step": 198197, "epoch": 1637, "val_loss": 2567082.0} {"train_loss": -41.393043518066406, "global_step": 198198, "epoch": 1638} {"train_loss": -41.48707962036133, "global_step": 198199, "epoch": 1638} {"train_loss": -41.71068572998047, "global_step": 198200, "epoch": 1638} {"train_loss": -39.758113861083984, "global_step": 198201, "epoch": 1638} {"train_loss": -41.0272216796875, "global_step": 198202, "epoch": 1638} {"train_loss": -41.35550308227539, "global_step": 198203, "epoch": 1638} {"train_loss": -40.80044174194336, "global_step": 198204, "epoch": 1638} {"train_loss": -40.16621398925781, "global_step": 198205, "epoch": 1638} {"train_loss": -40.83217239379883, "global_step": 198206, "epoch": 1638} {"train_loss": -38.94907760620117, "global_step": 198207, "epoch": 1638} {"train_loss": -40.43708419799805, "global_step": 198208, "epoch": 1638} {"train_loss": -41.97959899902344, "global_step": 198209, "epoch": 1638} {"train_loss": -40.324623107910156, "global_step": 198210, "epoch": 1638} {"train_loss": -40.471160888671875, "global_step": 198211, "epoch": 1638} {"train_loss": -41.34430694580078, "global_step": 198212, "epoch": 1638} {"train_loss": -40.413604736328125, "global_step": 198213, "epoch": 1638} {"train_loss": -41.15447235107422, "global_step": 198214, "epoch": 1638} {"train_loss": -39.97980880737305, "global_step": 198215, "epoch": 1638} {"train_loss": -41.332881927490234, "global_step": 198216, "epoch": 1638} {"train_loss": -40.25751495361328, "global_step": 198217, "epoch": 1638} {"train_loss": -39.13733673095703, "global_step": 198218, "epoch": 1638} {"train_loss": -39.63380432128906, "global_step": 198219, "epoch": 1638} {"train_loss": -41.3502197265625, "global_step": 198220, "epoch": 1638} {"train_loss": -38.40631103515625, "global_step": 198221, "epoch": 1638} {"train_loss": -35.2702751159668, "global_step": 198222, "epoch": 1638} {"train_loss": -38.54315948486328, "global_step": 198223, "epoch": 1638} {"train_loss": -40.2720947265625, "global_step": 198224, "epoch": 1638} {"train_loss": -37.048797607421875, "global_step": 198225, "epoch": 1638} {"train_loss": -40.9329833984375, "global_step": 198226, "epoch": 1638} {"train_loss": -38.866943359375, "global_step": 198227, "epoch": 1638} {"train_loss": -38.97944259643555, "global_step": 198228, "epoch": 1638} {"train_loss": -40.53847885131836, "global_step": 198229, "epoch": 1638} {"train_loss": -39.08762741088867, "global_step": 198230, "epoch": 1638} {"train_loss": -40.740882873535156, "global_step": 198231, "epoch": 1638} {"train_loss": -39.65545654296875, "global_step": 198232, "epoch": 1638} {"train_loss": -39.53651809692383, "global_step": 198233, "epoch": 1638} {"train_loss": -40.76205062866211, "global_step": 198234, "epoch": 1638} {"train_loss": -38.30807113647461, "global_step": 198235, "epoch": 1638} {"train_loss": -41.04450607299805, "global_step": 198236, "epoch": 1638} {"train_loss": -39.10210037231445, "global_step": 198237, "epoch": 1638} {"train_loss": -39.869590759277344, "global_step": 198238, "epoch": 1638} {"train_loss": -39.94247817993164, "global_step": 198239, "epoch": 1638} {"train_loss": -41.243404388427734, "global_step": 198240, "epoch": 1638} {"train_loss": -39.77812576293945, "global_step": 198241, "epoch": 1638} {"train_loss": -41.39755630493164, "global_step": 198242, "epoch": 1638} {"train_loss": -40.0471076965332, "global_step": 198243, "epoch": 1638} {"train_loss": -40.84890365600586, "global_step": 198244, "epoch": 1638} {"train_loss": -39.909664154052734, "global_step": 198245, "epoch": 1638} {"train_loss": -40.22993087768555, "global_step": 198246, "epoch": 1638} {"train_loss": -40.78310012817383, "global_step": 198247, "epoch": 1638} {"train_loss": -41.34547424316406, "global_step": 198248, "epoch": 1638} {"train_loss": -41.25764083862305, "global_step": 198249, "epoch": 1638} {"train_loss": -41.665645599365234, "global_step": 198250, "epoch": 1638} {"train_loss": -40.96163558959961, "global_step": 198251, "epoch": 1638} {"train_loss": -41.447784423828125, "global_step": 198252, "epoch": 1638} {"train_loss": -41.31123733520508, "global_step": 198253, "epoch": 1638} {"train_loss": -41.73505783081055, "global_step": 198254, "epoch": 1638} {"train_loss": -40.1547966003418, "global_step": 198255, "epoch": 1638} {"train_loss": -41.74221420288086, "global_step": 198256, "epoch": 1638} {"train_loss": -41.489437103271484, "global_step": 198257, "epoch": 1638} {"train_loss": -41.78369903564453, "global_step": 198258, "epoch": 1638} {"train_loss": -41.40772247314453, "global_step": 198259, "epoch": 1638} {"train_loss": -41.9681396484375, "global_step": 198260, "epoch": 1638} {"train_loss": -41.766632080078125, "global_step": 198261, "epoch": 1638} {"train_loss": -40.995601654052734, "global_step": 198262, "epoch": 1638} {"train_loss": -41.91575241088867, "global_step": 198263, "epoch": 1638} {"train_loss": -41.76407241821289, "global_step": 198264, "epoch": 1638} {"train_loss": -41.35544967651367, "global_step": 198265, "epoch": 1638} {"train_loss": -41.758358001708984, "global_step": 198266, "epoch": 1638} {"train_loss": -42.055908203125, "global_step": 198267, "epoch": 1638} {"train_loss": -41.77081298828125, "global_step": 198268, "epoch": 1638} {"train_loss": -41.85758590698242, "global_step": 198269, "epoch": 1638} {"train_loss": -40.59339141845703, "global_step": 198270, "epoch": 1638} {"train_loss": -42.25938034057617, "global_step": 198271, "epoch": 1638} {"train_loss": -41.16604232788086, "global_step": 198272, "epoch": 1638} {"train_loss": -41.63297653198242, "global_step": 198273, "epoch": 1638} {"train_loss": -42.1833381652832, "global_step": 198274, "epoch": 1638} {"train_loss": -42.058067321777344, "global_step": 198275, "epoch": 1638} {"train_loss": -42.00623321533203, "global_step": 198276, "epoch": 1638} {"train_loss": -41.73234939575195, "global_step": 198277, "epoch": 1638} {"train_loss": -42.063777923583984, "global_step": 198278, "epoch": 1638} {"train_loss": -42.01443099975586, "global_step": 198279, "epoch": 1638} {"train_loss": -42.00887680053711, "global_step": 198280, "epoch": 1638} {"train_loss": -41.92940139770508, "global_step": 198281, "epoch": 1638} {"train_loss": -42.17210388183594, "global_step": 198282, "epoch": 1638} {"train_loss": -40.747955322265625, "global_step": 198283, "epoch": 1638} {"train_loss": -42.27581787109375, "global_step": 198284, "epoch": 1638} {"train_loss": -41.681182861328125, "global_step": 198285, "epoch": 1638} {"train_loss": -40.8026237487793, "global_step": 198286, "epoch": 1638} {"train_loss": -39.601531982421875, "global_step": 198287, "epoch": 1638} {"train_loss": -41.72040939331055, "global_step": 198288, "epoch": 1638} {"train_loss": -39.631832122802734, "global_step": 198289, "epoch": 1638} {"train_loss": -37.24272918701172, "global_step": 198290, "epoch": 1638} {"train_loss": -41.69817352294922, "global_step": 198291, "epoch": 1638} {"train_loss": -41.87813949584961, "global_step": 198292, "epoch": 1638} {"train_loss": -40.83037185668945, "global_step": 198293, "epoch": 1638} {"train_loss": -39.4704704284668, "global_step": 198294, "epoch": 1638} {"train_loss": -39.054927825927734, "global_step": 198295, "epoch": 1638} {"train_loss": -41.62930679321289, "global_step": 198296, "epoch": 1638} {"train_loss": -36.76664733886719, "global_step": 198297, "epoch": 1638} {"train_loss": -40.889705657958984, "global_step": 198298, "epoch": 1638} {"train_loss": -41.18056869506836, "global_step": 198299, "epoch": 1638} {"train_loss": -39.53573226928711, "global_step": 198300, "epoch": 1638} {"train_loss": -35.75056457519531, "global_step": 198301, "epoch": 1638} {"train_loss": -33.77986145019531, "global_step": 198302, "epoch": 1638} {"train_loss": -36.517303466796875, "global_step": 198303, "epoch": 1638} {"train_loss": -35.3049201965332, "global_step": 198304, "epoch": 1638} {"train_loss": -37.84143829345703, "global_step": 198305, "epoch": 1638} {"train_loss": -35.18846893310547, "global_step": 198306, "epoch": 1638} {"train_loss": -36.67588424682617, "global_step": 198307, "epoch": 1638} {"train_loss": -38.71683883666992, "global_step": 198308, "epoch": 1638} {"train_loss": -37.797603607177734, "global_step": 198309, "epoch": 1638} {"train_loss": -31.487451553344727, "global_step": 198310, "epoch": 1638} {"train_loss": -30.5145206451416, "global_step": 198311, "epoch": 1638} {"train_loss": -34.552425384521484, "global_step": 198312, "epoch": 1638} {"train_loss": -34.53622055053711, "global_step": 198313, "epoch": 1638} {"train_loss": -38.25564956665039, "global_step": 198314, "epoch": 1638} {"train_loss": -35.12727737426758, "global_step": 198315, "epoch": 1638} {"train_loss": -33.75197219848633, "global_step": 198316, "epoch": 1638} {"train_loss": -32.1109733581543, "global_step": 198317, "epoch": 1638} {"train_loss": -39.8737445547561, "global_step": 198318, "epoch": 1638, "val_loss": 2735193.75} {"train_loss": -36.74805450439453, "global_step": 198319, "epoch": 1639} {"train_loss": -35.535133361816406, "global_step": 198320, "epoch": 1639} {"train_loss": -34.47492218017578, "global_step": 198321, "epoch": 1639} {"train_loss": -32.029449462890625, "global_step": 198322, "epoch": 1639} {"train_loss": -34.35340881347656, "global_step": 198323, "epoch": 1639} {"train_loss": -37.071773529052734, "global_step": 198324, "epoch": 1639} {"train_loss": -36.32452392578125, "global_step": 198325, "epoch": 1639} {"train_loss": -34.706844329833984, "global_step": 198326, "epoch": 1639} {"train_loss": -33.53217697143555, "global_step": 198327, "epoch": 1639} {"train_loss": -36.315956115722656, "global_step": 198328, "epoch": 1639} {"train_loss": -36.53767395019531, "global_step": 198329, "epoch": 1639} {"train_loss": -36.904293060302734, "global_step": 198330, "epoch": 1639} {"train_loss": -35.032493591308594, "global_step": 198331, "epoch": 1639} {"train_loss": -35.861061096191406, "global_step": 198332, "epoch": 1639} {"train_loss": -37.75967025756836, "global_step": 198333, "epoch": 1639} {"train_loss": -37.342159271240234, "global_step": 198334, "epoch": 1639} {"train_loss": -37.75522994995117, "global_step": 198335, "epoch": 1639} {"train_loss": -36.24958038330078, "global_step": 198336, "epoch": 1639} {"train_loss": -37.535064697265625, "global_step": 198337, "epoch": 1639} {"train_loss": -37.91765213012695, "global_step": 198338, "epoch": 1639} {"train_loss": -37.78036117553711, "global_step": 198339, "epoch": 1639} {"train_loss": -39.684730529785156, "global_step": 198340, "epoch": 1639} {"train_loss": -38.10184860229492, "global_step": 198341, "epoch": 1639} {"train_loss": -37.66453170776367, "global_step": 198342, "epoch": 1639} {"train_loss": -36.95924758911133, "global_step": 198343, "epoch": 1639} {"train_loss": -38.679500579833984, "global_step": 198344, "epoch": 1639} {"train_loss": -38.032894134521484, "global_step": 198345, "epoch": 1639} {"train_loss": -36.96674728393555, "global_step": 198346, "epoch": 1639} {"train_loss": -39.16903305053711, "global_step": 198347, "epoch": 1639} {"train_loss": -38.87687683105469, "global_step": 198348, "epoch": 1639} {"train_loss": -38.572811126708984, "global_step": 198349, "epoch": 1639} {"train_loss": -39.344688415527344, "global_step": 198350, "epoch": 1639} {"train_loss": -39.1939811706543, "global_step": 198351, "epoch": 1639} {"train_loss": -38.77448272705078, "global_step": 198352, "epoch": 1639} {"train_loss": -39.58007049560547, "global_step": 198353, "epoch": 1639} {"train_loss": -38.77259063720703, "global_step": 198354, "epoch": 1639} {"train_loss": -39.22343444824219, "global_step": 198355, "epoch": 1639} {"train_loss": -39.52616882324219, "global_step": 198356, "epoch": 1639} {"train_loss": -39.97050857543945, "global_step": 198357, "epoch": 1639} {"train_loss": -39.21599578857422, "global_step": 198358, "epoch": 1639} {"train_loss": -38.451332092285156, "global_step": 198359, "epoch": 1639} {"train_loss": -38.83041000366211, "global_step": 198360, "epoch": 1639} {"train_loss": -39.6795768737793, "global_step": 198361, "epoch": 1639} {"train_loss": -39.82871627807617, "global_step": 198362, "epoch": 1639} {"train_loss": -39.35129928588867, "global_step": 198363, "epoch": 1639} {"train_loss": -39.68916702270508, "global_step": 198364, "epoch": 1639} {"train_loss": -39.83383560180664, "global_step": 198365, "epoch": 1639} {"train_loss": -39.28184509277344, "global_step": 198366, "epoch": 1639} {"train_loss": -39.19074630737305, "global_step": 198367, "epoch": 1639} {"train_loss": -40.523563385009766, "global_step": 198368, "epoch": 1639} {"train_loss": -39.76937484741211, "global_step": 198369, "epoch": 1639} {"train_loss": -39.216346740722656, "global_step": 198370, "epoch": 1639} {"train_loss": -39.706321716308594, "global_step": 198371, "epoch": 1639} {"train_loss": -40.07033920288086, "global_step": 198372, "epoch": 1639} {"train_loss": -40.5902214050293, "global_step": 198373, "epoch": 1639} {"train_loss": -39.13705062866211, "global_step": 198374, "epoch": 1639} {"train_loss": -40.7010498046875, "global_step": 198375, "epoch": 1639} {"train_loss": -40.137081146240234, "global_step": 198376, "epoch": 1639} {"train_loss": -40.122520446777344, "global_step": 198377, "epoch": 1639} {"train_loss": -40.33122253417969, "global_step": 198378, "epoch": 1639} {"train_loss": -41.2883186340332, "global_step": 198379, "epoch": 1639} {"train_loss": -40.04293441772461, "global_step": 198380, "epoch": 1639} {"train_loss": -40.36005401611328, "global_step": 198381, "epoch": 1639} {"train_loss": -40.07532501220703, "global_step": 198382, "epoch": 1639} {"train_loss": -40.51554489135742, "global_step": 198383, "epoch": 1639} {"train_loss": -40.2179069519043, "global_step": 198384, "epoch": 1639} {"train_loss": -40.25638961791992, "global_step": 198385, "epoch": 1639} {"train_loss": -40.404693603515625, "global_step": 198386, "epoch": 1639} {"train_loss": -40.40876007080078, "global_step": 198387, "epoch": 1639} {"train_loss": -40.743038177490234, "global_step": 198388, "epoch": 1639} {"train_loss": -41.0463981628418, "global_step": 198389, "epoch": 1639} {"train_loss": -41.002742767333984, "global_step": 198390, "epoch": 1639} {"train_loss": -40.966949462890625, "global_step": 198391, "epoch": 1639} {"train_loss": -41.174049377441406, "global_step": 198392, "epoch": 1639} {"train_loss": -39.46949005126953, "global_step": 198393, "epoch": 1639} {"train_loss": -40.128414154052734, "global_step": 198394, "epoch": 1639} {"train_loss": -41.307899475097656, "global_step": 198395, "epoch": 1639} {"train_loss": -40.62061309814453, "global_step": 198396, "epoch": 1639} {"train_loss": -40.926090240478516, "global_step": 198397, "epoch": 1639} {"train_loss": -41.354183197021484, "global_step": 198398, "epoch": 1639} {"train_loss": -40.729217529296875, "global_step": 198399, "epoch": 1639} {"train_loss": -41.55735397338867, "global_step": 198400, "epoch": 1639} {"train_loss": -41.0465087890625, "global_step": 198401, "epoch": 1639} {"train_loss": -40.4654655456543, "global_step": 198402, "epoch": 1639} {"train_loss": -41.669795989990234, "global_step": 198403, "epoch": 1639} {"train_loss": -40.47736740112305, "global_step": 198404, "epoch": 1639} {"train_loss": -40.9854621887207, "global_step": 198405, "epoch": 1639} {"train_loss": -41.297607421875, "global_step": 198406, "epoch": 1639} {"train_loss": -41.744327545166016, "global_step": 198407, "epoch": 1639} {"train_loss": -41.19506072998047, "global_step": 198408, "epoch": 1639} {"train_loss": -41.09370803833008, "global_step": 198409, "epoch": 1639} {"train_loss": -40.40623092651367, "global_step": 198410, "epoch": 1639} {"train_loss": -41.15871047973633, "global_step": 198411, "epoch": 1639} {"train_loss": -40.842140197753906, "global_step": 198412, "epoch": 1639} {"train_loss": -41.11874008178711, "global_step": 198413, "epoch": 1639} {"train_loss": -40.70627975463867, "global_step": 198414, "epoch": 1639} {"train_loss": -40.77939987182617, "global_step": 198415, "epoch": 1639} {"train_loss": -41.2806282043457, "global_step": 198416, "epoch": 1639} {"train_loss": -41.2775764465332, "global_step": 198417, "epoch": 1639} {"train_loss": -41.239463806152344, "global_step": 198418, "epoch": 1639} {"train_loss": -41.5084228515625, "global_step": 198419, "epoch": 1639} {"train_loss": -41.6123046875, "global_step": 198420, "epoch": 1639} {"train_loss": -41.758602142333984, "global_step": 198421, "epoch": 1639} {"train_loss": -41.47359848022461, "global_step": 198422, "epoch": 1639} {"train_loss": -41.695133209228516, "global_step": 198423, "epoch": 1639} {"train_loss": -39.73041534423828, "global_step": 198424, "epoch": 1639} {"train_loss": -41.371891021728516, "global_step": 198425, "epoch": 1639} {"train_loss": -40.86414337158203, "global_step": 198426, "epoch": 1639} {"train_loss": -41.47503662109375, "global_step": 198427, "epoch": 1639} {"train_loss": -41.439544677734375, "global_step": 198428, "epoch": 1639} {"train_loss": -41.96515655517578, "global_step": 198429, "epoch": 1639} {"train_loss": -41.86259078979492, "global_step": 198430, "epoch": 1639} {"train_loss": -41.388397216796875, "global_step": 198431, "epoch": 1639} {"train_loss": -41.358436584472656, "global_step": 198432, "epoch": 1639} {"train_loss": -41.46090316772461, "global_step": 198433, "epoch": 1639} {"train_loss": -41.07737731933594, "global_step": 198434, "epoch": 1639} {"train_loss": -41.92434310913086, "global_step": 198435, "epoch": 1639} {"train_loss": -41.30814743041992, "global_step": 198436, "epoch": 1639} {"train_loss": -37.58576583862305, "global_step": 198437, "epoch": 1639} {"train_loss": -38.12354278564453, "global_step": 198438, "epoch": 1639} {"train_loss": -39.52669329682657, "global_step": 198439, "epoch": 1639, "val_loss": 2602039.0} {"train_loss": -38.71932601928711, "global_step": 198440, "epoch": 1640} {"train_loss": -41.39045333862305, "global_step": 198441, "epoch": 1640} {"train_loss": -39.63679504394531, "global_step": 198442, "epoch": 1640} {"train_loss": -40.47996139526367, "global_step": 198443, "epoch": 1640} {"train_loss": -39.96619415283203, "global_step": 198444, "epoch": 1640} {"train_loss": -40.18918991088867, "global_step": 198445, "epoch": 1640} {"train_loss": -40.258323669433594, "global_step": 198446, "epoch": 1640} {"train_loss": -40.9658317565918, "global_step": 198447, "epoch": 1640} {"train_loss": -39.77772521972656, "global_step": 198448, "epoch": 1640} {"train_loss": -38.58372116088867, "global_step": 198449, "epoch": 1640} {"train_loss": -38.96168518066406, "global_step": 198450, "epoch": 1640} {"train_loss": -40.21734619140625, "global_step": 198451, "epoch": 1640} {"train_loss": -39.771583557128906, "global_step": 198452, "epoch": 1640} {"train_loss": -40.09663391113281, "global_step": 198453, "epoch": 1640} {"train_loss": -39.273597717285156, "global_step": 198454, "epoch": 1640} {"train_loss": -40.32417678833008, "global_step": 198455, "epoch": 1640} {"train_loss": -40.00537872314453, "global_step": 198456, "epoch": 1640} {"train_loss": -39.1593132019043, "global_step": 198457, "epoch": 1640} {"train_loss": -40.94830322265625, "global_step": 198458, "epoch": 1640} {"train_loss": -40.03504180908203, "global_step": 198459, "epoch": 1640} {"train_loss": -40.6584587097168, "global_step": 198460, "epoch": 1640} {"train_loss": -40.990177154541016, "global_step": 198461, "epoch": 1640} {"train_loss": -40.141910552978516, "global_step": 198462, "epoch": 1640} {"train_loss": -40.61351013183594, "global_step": 198463, "epoch": 1640} {"train_loss": -41.05095291137695, "global_step": 198464, "epoch": 1640} {"train_loss": -41.115875244140625, "global_step": 198465, "epoch": 1640} {"train_loss": -41.28614044189453, "global_step": 198466, "epoch": 1640} {"train_loss": -40.883419036865234, "global_step": 198467, "epoch": 1640} {"train_loss": -40.697383880615234, "global_step": 198468, "epoch": 1640} {"train_loss": -40.8693733215332, "global_step": 198469, "epoch": 1640} {"train_loss": -41.58411407470703, "global_step": 198470, "epoch": 1640} {"train_loss": -40.9570426940918, "global_step": 198471, "epoch": 1640} {"train_loss": -41.229896545410156, "global_step": 198472, "epoch": 1640} {"train_loss": -41.1879997253418, "global_step": 198473, "epoch": 1640} {"train_loss": -41.40523910522461, "global_step": 198474, "epoch": 1640} {"train_loss": -41.39786148071289, "global_step": 198475, "epoch": 1640} {"train_loss": -41.12131881713867, "global_step": 198476, "epoch": 1640} {"train_loss": -41.60420227050781, "global_step": 198477, "epoch": 1640} {"train_loss": -41.28501510620117, "global_step": 198478, "epoch": 1640} {"train_loss": -40.902931213378906, "global_step": 198479, "epoch": 1640} {"train_loss": -41.189056396484375, "global_step": 198480, "epoch": 1640} {"train_loss": -41.62639617919922, "global_step": 198481, "epoch": 1640} {"train_loss": -42.021240234375, "global_step": 198482, "epoch": 1640} {"train_loss": -40.83730697631836, "global_step": 198483, "epoch": 1640} {"train_loss": -42.10645294189453, "global_step": 198484, "epoch": 1640} {"train_loss": -40.83367919921875, "global_step": 198485, "epoch": 1640} {"train_loss": -41.89639663696289, "global_step": 198486, "epoch": 1640} {"train_loss": -41.856868743896484, "global_step": 198487, "epoch": 1640} {"train_loss": -41.7531852722168, "global_step": 198488, "epoch": 1640} {"train_loss": -41.542232513427734, "global_step": 198489, "epoch": 1640} {"train_loss": -41.676025390625, "global_step": 198490, "epoch": 1640} {"train_loss": -41.44917678833008, "global_step": 198491, "epoch": 1640} {"train_loss": -41.332611083984375, "global_step": 198492, "epoch": 1640} {"train_loss": -41.40578842163086, "global_step": 198493, "epoch": 1640} {"train_loss": -40.319419860839844, "global_step": 198494, "epoch": 1640} {"train_loss": -40.67577362060547, "global_step": 198495, "epoch": 1640} {"train_loss": -41.1987190246582, "global_step": 198496, "epoch": 1640} {"train_loss": -41.22221755981445, "global_step": 198497, "epoch": 1640} {"train_loss": -42.335304260253906, "global_step": 198498, "epoch": 1640} {"train_loss": -41.64301300048828, "global_step": 198499, "epoch": 1640} {"train_loss": -40.29185485839844, "global_step": 198500, "epoch": 1640} {"train_loss": -41.244483947753906, "global_step": 198501, "epoch": 1640} {"train_loss": -41.617034912109375, "global_step": 198502, "epoch": 1640} {"train_loss": -41.5137939453125, "global_step": 198503, "epoch": 1640} {"train_loss": -41.793331146240234, "global_step": 198504, "epoch": 1640} {"train_loss": -39.98193359375, "global_step": 198505, "epoch": 1640} {"train_loss": -40.9661865234375, "global_step": 198506, "epoch": 1640} {"train_loss": -40.77412033081055, "global_step": 198507, "epoch": 1640} {"train_loss": -40.49671936035156, "global_step": 198508, "epoch": 1640} {"train_loss": -41.641292572021484, "global_step": 198509, "epoch": 1640} {"train_loss": -40.10548400878906, "global_step": 198510, "epoch": 1640} {"train_loss": -40.933204650878906, "global_step": 198511, "epoch": 1640} {"train_loss": -40.35009765625, "global_step": 198512, "epoch": 1640} {"train_loss": -40.635169982910156, "global_step": 198513, "epoch": 1640} {"train_loss": -39.73476791381836, "global_step": 198514, "epoch": 1640} {"train_loss": -40.70866012573242, "global_step": 198515, "epoch": 1640} {"train_loss": -41.087493896484375, "global_step": 198516, "epoch": 1640} {"train_loss": -40.79822540283203, "global_step": 198517, "epoch": 1640} {"train_loss": -39.41374588012695, "global_step": 198518, "epoch": 1640} {"train_loss": -40.43251419067383, "global_step": 198519, "epoch": 1640} {"train_loss": -39.76960372924805, "global_step": 198520, "epoch": 1640} {"train_loss": -39.09846878051758, "global_step": 198521, "epoch": 1640} {"train_loss": -40.5178337097168, "global_step": 198522, "epoch": 1640} {"train_loss": -40.604434967041016, "global_step": 198523, "epoch": 1640} {"train_loss": -39.19537353515625, "global_step": 198524, "epoch": 1640} {"train_loss": -40.092567443847656, "global_step": 198525, "epoch": 1640} {"train_loss": -40.734893798828125, "global_step": 198526, "epoch": 1640} {"train_loss": -40.61763381958008, "global_step": 198527, "epoch": 1640} {"train_loss": -41.158966064453125, "global_step": 198528, "epoch": 1640} {"train_loss": -41.23523712158203, "global_step": 198529, "epoch": 1640} {"train_loss": -39.619529724121094, "global_step": 198530, "epoch": 1640} {"train_loss": -40.3324089050293, "global_step": 198531, "epoch": 1640} {"train_loss": -34.88040542602539, "global_step": 198532, "epoch": 1640} {"train_loss": -38.076045989990234, "global_step": 198533, "epoch": 1640} {"train_loss": -31.860462188720703, "global_step": 198534, "epoch": 1640} {"train_loss": -36.0264892578125, "global_step": 198535, "epoch": 1640} {"train_loss": -39.292762756347656, "global_step": 198536, "epoch": 1640} {"train_loss": -39.46403884887695, "global_step": 198537, "epoch": 1640} {"train_loss": -35.1967658996582, "global_step": 198538, "epoch": 1640} {"train_loss": -38.24985885620117, "global_step": 198539, "epoch": 1640} {"train_loss": -39.309173583984375, "global_step": 198540, "epoch": 1640} {"train_loss": -37.872737884521484, "global_step": 198541, "epoch": 1640} {"train_loss": -39.92329025268555, "global_step": 198542, "epoch": 1640} {"train_loss": -38.686004638671875, "global_step": 198543, "epoch": 1640} {"train_loss": -40.281917572021484, "global_step": 198544, "epoch": 1640} {"train_loss": -38.65408706665039, "global_step": 198545, "epoch": 1640} {"train_loss": -39.873287200927734, "global_step": 198546, "epoch": 1640} {"train_loss": -39.508724212646484, "global_step": 198547, "epoch": 1640} {"train_loss": -40.088844299316406, "global_step": 198548, "epoch": 1640} {"train_loss": -39.9283561706543, "global_step": 198549, "epoch": 1640} {"train_loss": -38.8268928527832, "global_step": 198550, "epoch": 1640} {"train_loss": -39.40641403198242, "global_step": 198551, "epoch": 1640} {"train_loss": -38.70765686035156, "global_step": 198552, "epoch": 1640} {"train_loss": -40.146854400634766, "global_step": 198553, "epoch": 1640} {"train_loss": -40.44031524658203, "global_step": 198554, "epoch": 1640} {"train_loss": -39.24512481689453, "global_step": 198555, "epoch": 1640} {"train_loss": -41.0359992980957, "global_step": 198556, "epoch": 1640} {"train_loss": -40.66360092163086, "global_step": 198557, "epoch": 1640} {"train_loss": -40.46348190307617, "global_step": 198558, "epoch": 1640} {"train_loss": -41.047542572021484, "global_step": 198559, "epoch": 1640} {"train_loss": -40.2797526840336, "global_step": 198560, "epoch": 1640, "val_loss": 2620577.25} {"train_loss": -41.00596237182617, "global_step": 198561, "epoch": 1641} {"train_loss": -40.8820686340332, "global_step": 198562, "epoch": 1641} {"train_loss": -40.880775451660156, "global_step": 198563, "epoch": 1641} {"train_loss": -41.08692932128906, "global_step": 198564, "epoch": 1641} {"train_loss": -41.10712814331055, "global_step": 198565, "epoch": 1641} {"train_loss": -41.226959228515625, "global_step": 198566, "epoch": 1641} {"train_loss": -40.02728271484375, "global_step": 198567, "epoch": 1641} {"train_loss": -41.31473922729492, "global_step": 198568, "epoch": 1641} {"train_loss": -40.217708587646484, "global_step": 198569, "epoch": 1641} {"train_loss": -41.3274040222168, "global_step": 198570, "epoch": 1641} {"train_loss": -40.730899810791016, "global_step": 198571, "epoch": 1641} {"train_loss": -40.794795989990234, "global_step": 198572, "epoch": 1641} {"train_loss": -41.1692008972168, "global_step": 198573, "epoch": 1641} {"train_loss": -41.680641174316406, "global_step": 198574, "epoch": 1641} {"train_loss": -41.300209045410156, "global_step": 198575, "epoch": 1641} {"train_loss": -36.93833541870117, "global_step": 198576, "epoch": 1641} {"train_loss": -41.32288360595703, "global_step": 198577, "epoch": 1641} {"train_loss": -41.774776458740234, "global_step": 198578, "epoch": 1641} {"train_loss": -41.2777099609375, "global_step": 198579, "epoch": 1641} {"train_loss": -41.44631576538086, "global_step": 198580, "epoch": 1641} {"train_loss": -41.76082992553711, "global_step": 198581, "epoch": 1641} {"train_loss": -36.11677932739258, "global_step": 198582, "epoch": 1641} {"train_loss": -41.47245407104492, "global_step": 198583, "epoch": 1641} {"train_loss": -40.2991943359375, "global_step": 198584, "epoch": 1641} {"train_loss": -40.93513107299805, "global_step": 198585, "epoch": 1641} {"train_loss": -40.714420318603516, "global_step": 198586, "epoch": 1641} {"train_loss": -40.76569366455078, "global_step": 198587, "epoch": 1641} {"train_loss": -41.01323318481445, "global_step": 198588, "epoch": 1641} {"train_loss": -40.79204177856445, "global_step": 198589, "epoch": 1641} {"train_loss": -41.56965255737305, "global_step": 198590, "epoch": 1641} {"train_loss": -41.07560348510742, "global_step": 198591, "epoch": 1641} {"train_loss": -41.3742790222168, "global_step": 198592, "epoch": 1641} {"train_loss": -39.90034103393555, "global_step": 198593, "epoch": 1641} {"train_loss": -41.8841552734375, "global_step": 198594, "epoch": 1641} {"train_loss": -40.65122604370117, "global_step": 198595, "epoch": 1641} {"train_loss": -41.42678451538086, "global_step": 198596, "epoch": 1641} {"train_loss": -41.6652946472168, "global_step": 198597, "epoch": 1641} {"train_loss": -41.14665603637695, "global_step": 198598, "epoch": 1641} {"train_loss": -41.405147552490234, "global_step": 198599, "epoch": 1641} {"train_loss": -41.06290817260742, "global_step": 198600, "epoch": 1641} {"train_loss": -41.4764404296875, "global_step": 198601, "epoch": 1641} {"train_loss": -41.33712387084961, "global_step": 198602, "epoch": 1641} {"train_loss": -41.970088958740234, "global_step": 198603, "epoch": 1641} {"train_loss": -41.755889892578125, "global_step": 198604, "epoch": 1641} {"train_loss": -41.53788757324219, "global_step": 198605, "epoch": 1641} {"train_loss": -41.61043930053711, "global_step": 198606, "epoch": 1641} {"train_loss": -40.81367492675781, "global_step": 198607, "epoch": 1641} {"train_loss": -41.20806884765625, "global_step": 198608, "epoch": 1641} {"train_loss": -41.01069259643555, "global_step": 198609, "epoch": 1641} {"train_loss": -40.30436325073242, "global_step": 198610, "epoch": 1641} {"train_loss": -41.0001335144043, "global_step": 198611, "epoch": 1641} {"train_loss": -41.45071792602539, "global_step": 198612, "epoch": 1641} {"train_loss": -41.416934967041016, "global_step": 198613, "epoch": 1641} {"train_loss": -41.803585052490234, "global_step": 198614, "epoch": 1641} {"train_loss": -41.829708099365234, "global_step": 198615, "epoch": 1641} {"train_loss": -41.38908767700195, "global_step": 198616, "epoch": 1641} {"train_loss": -38.63652420043945, "global_step": 198617, "epoch": 1641} {"train_loss": -40.9541130065918, "global_step": 198618, "epoch": 1641} {"train_loss": -39.9891242980957, "global_step": 198619, "epoch": 1641} {"train_loss": -39.238365173339844, "global_step": 198620, "epoch": 1641} {"train_loss": -40.64712142944336, "global_step": 198621, "epoch": 1641} {"train_loss": -40.40444564819336, "global_step": 198622, "epoch": 1641} {"train_loss": -32.11812973022461, "global_step": 198623, "epoch": 1641} {"train_loss": -38.02891159057617, "global_step": 198624, "epoch": 1641} {"train_loss": -40.46490478515625, "global_step": 198625, "epoch": 1641} {"train_loss": -36.669612884521484, "global_step": 198626, "epoch": 1641} {"train_loss": -30.205747604370117, "global_step": 198627, "epoch": 1641} {"train_loss": -36.90662384033203, "global_step": 198628, "epoch": 1641} {"train_loss": -40.15232467651367, "global_step": 198629, "epoch": 1641} {"train_loss": -39.162227630615234, "global_step": 198630, "epoch": 1641} {"train_loss": -38.91994094848633, "global_step": 198631, "epoch": 1641} {"train_loss": -40.10300827026367, "global_step": 198632, "epoch": 1641} {"train_loss": -39.682716369628906, "global_step": 198633, "epoch": 1641} {"train_loss": -39.63203048706055, "global_step": 198634, "epoch": 1641} {"train_loss": -40.43723678588867, "global_step": 198635, "epoch": 1641} {"train_loss": -37.694000244140625, "global_step": 198636, "epoch": 1641} {"train_loss": -39.50007247924805, "global_step": 198637, "epoch": 1641} {"train_loss": -40.012786865234375, "global_step": 198638, "epoch": 1641} {"train_loss": -39.567237854003906, "global_step": 198639, "epoch": 1641} {"train_loss": -39.735538482666016, "global_step": 198640, "epoch": 1641} {"train_loss": -40.64986801147461, "global_step": 198641, "epoch": 1641} {"train_loss": -40.81448745727539, "global_step": 198642, "epoch": 1641} {"train_loss": -39.99857711791992, "global_step": 198643, "epoch": 1641} {"train_loss": -40.63357162475586, "global_step": 198644, "epoch": 1641} {"train_loss": -40.289588928222656, "global_step": 198645, "epoch": 1641} {"train_loss": -40.716644287109375, "global_step": 198646, "epoch": 1641} {"train_loss": -40.7982063293457, "global_step": 198647, "epoch": 1641} {"train_loss": -40.714378356933594, "global_step": 198648, "epoch": 1641} {"train_loss": -38.86430740356445, "global_step": 198649, "epoch": 1641} {"train_loss": -39.18467330932617, "global_step": 198650, "epoch": 1641} {"train_loss": -41.057044982910156, "global_step": 198651, "epoch": 1641} {"train_loss": -40.44180679321289, "global_step": 198652, "epoch": 1641} {"train_loss": -38.48308181762695, "global_step": 198653, "epoch": 1641} {"train_loss": -40.37994384765625, "global_step": 198654, "epoch": 1641} {"train_loss": -40.62229537963867, "global_step": 198655, "epoch": 1641} {"train_loss": -39.84719467163086, "global_step": 198656, "epoch": 1641} {"train_loss": -37.7465705871582, "global_step": 198657, "epoch": 1641} {"train_loss": -40.0924072265625, "global_step": 198658, "epoch": 1641} {"train_loss": -41.08382034301758, "global_step": 198659, "epoch": 1641} {"train_loss": -39.942657470703125, "global_step": 198660, "epoch": 1641} {"train_loss": -39.297828674316406, "global_step": 198661, "epoch": 1641} {"train_loss": -39.91717529296875, "global_step": 198662, "epoch": 1641} {"train_loss": -40.30830001831055, "global_step": 198663, "epoch": 1641} {"train_loss": -40.334415435791016, "global_step": 198664, "epoch": 1641} {"train_loss": -36.9191780090332, "global_step": 198665, "epoch": 1641} {"train_loss": -38.129066467285156, "global_step": 198666, "epoch": 1641} {"train_loss": -41.082393646240234, "global_step": 198667, "epoch": 1641} {"train_loss": -41.70060348510742, "global_step": 198668, "epoch": 1641} {"train_loss": -40.20769119262695, "global_step": 198669, "epoch": 1641} {"train_loss": -41.098060607910156, "global_step": 198670, "epoch": 1641} {"train_loss": -40.90468215942383, "global_step": 198671, "epoch": 1641} {"train_loss": -40.371429443359375, "global_step": 198672, "epoch": 1641} {"train_loss": -37.97622299194336, "global_step": 198673, "epoch": 1641} {"train_loss": -40.830440521240234, "global_step": 198674, "epoch": 1641} {"train_loss": -40.55474853515625, "global_step": 198675, "epoch": 1641} {"train_loss": -39.4846305847168, "global_step": 198676, "epoch": 1641} {"train_loss": -40.600765228271484, "global_step": 198677, "epoch": 1641} {"train_loss": -39.4974365234375, "global_step": 198678, "epoch": 1641} {"train_loss": -39.8575439453125, "global_step": 198679, "epoch": 1641} {"train_loss": -39.997772216796875, "global_step": 198680, "epoch": 1641} {"train_loss": -40.20331947074449, "global_step": 198681, "epoch": 1641, "val_loss": 2873020.75} {"train_loss": -38.19914245605469, "global_step": 198682, "epoch": 1642} {"train_loss": -40.168758392333984, "global_step": 198683, "epoch": 1642} {"train_loss": -40.417640686035156, "global_step": 198684, "epoch": 1642} {"train_loss": -38.626625061035156, "global_step": 198685, "epoch": 1642} {"train_loss": -39.15163040161133, "global_step": 198686, "epoch": 1642} {"train_loss": -40.46869659423828, "global_step": 198687, "epoch": 1642} {"train_loss": -36.515987396240234, "global_step": 198688, "epoch": 1642} {"train_loss": -38.99394989013672, "global_step": 198689, "epoch": 1642} {"train_loss": -40.55937957763672, "global_step": 198690, "epoch": 1642} {"train_loss": -38.29182815551758, "global_step": 198691, "epoch": 1642} {"train_loss": -39.5507926940918, "global_step": 198692, "epoch": 1642} {"train_loss": -40.77836990356445, "global_step": 198693, "epoch": 1642} {"train_loss": -39.5821418762207, "global_step": 198694, "epoch": 1642} {"train_loss": -41.186885833740234, "global_step": 198695, "epoch": 1642} {"train_loss": -39.91073989868164, "global_step": 198696, "epoch": 1642} {"train_loss": -39.739173889160156, "global_step": 198697, "epoch": 1642} {"train_loss": -39.866127014160156, "global_step": 198698, "epoch": 1642} {"train_loss": -40.2069206237793, "global_step": 198699, "epoch": 1642} {"train_loss": -40.26790237426758, "global_step": 198700, "epoch": 1642} {"train_loss": -40.895999908447266, "global_step": 198701, "epoch": 1642} {"train_loss": -39.787349700927734, "global_step": 198702, "epoch": 1642} {"train_loss": -40.93320846557617, "global_step": 198703, "epoch": 1642} {"train_loss": -41.316837310791016, "global_step": 198704, "epoch": 1642} {"train_loss": -40.919525146484375, "global_step": 198705, "epoch": 1642} {"train_loss": -40.770782470703125, "global_step": 198706, "epoch": 1642} {"train_loss": -40.728755950927734, "global_step": 198707, "epoch": 1642} {"train_loss": -41.371604919433594, "global_step": 198708, "epoch": 1642} {"train_loss": -41.752777099609375, "global_step": 198709, "epoch": 1642} {"train_loss": -40.17387008666992, "global_step": 198710, "epoch": 1642} {"train_loss": -40.872066497802734, "global_step": 198711, "epoch": 1642} {"train_loss": -41.28586959838867, "global_step": 198712, "epoch": 1642} {"train_loss": -41.221435546875, "global_step": 198713, "epoch": 1642} {"train_loss": -41.612911224365234, "global_step": 198714, "epoch": 1642} {"train_loss": -41.796226501464844, "global_step": 198715, "epoch": 1642} {"train_loss": -40.85652542114258, "global_step": 198716, "epoch": 1642} {"train_loss": -41.39870834350586, "global_step": 198717, "epoch": 1642} {"train_loss": -41.122894287109375, "global_step": 198718, "epoch": 1642} {"train_loss": -41.01484298706055, "global_step": 198719, "epoch": 1642} {"train_loss": -41.7983283996582, "global_step": 198720, "epoch": 1642} {"train_loss": -41.338565826416016, "global_step": 198721, "epoch": 1642} {"train_loss": -41.17287826538086, "global_step": 198722, "epoch": 1642} {"train_loss": -41.84778594970703, "global_step": 198723, "epoch": 1642} {"train_loss": -41.10356521606445, "global_step": 198724, "epoch": 1642} {"train_loss": -41.485042572021484, "global_step": 198725, "epoch": 1642} {"train_loss": -40.28956985473633, "global_step": 198726, "epoch": 1642} {"train_loss": -41.753387451171875, "global_step": 198727, "epoch": 1642} {"train_loss": -40.7509880065918, "global_step": 198728, "epoch": 1642} {"train_loss": -40.94587326049805, "global_step": 198729, "epoch": 1642} {"train_loss": -41.35443115234375, "global_step": 198730, "epoch": 1642} {"train_loss": -41.18950653076172, "global_step": 198731, "epoch": 1642} {"train_loss": -41.40200424194336, "global_step": 198732, "epoch": 1642} {"train_loss": -41.39659881591797, "global_step": 198733, "epoch": 1642} {"train_loss": -39.37516784667969, "global_step": 198734, "epoch": 1642} {"train_loss": -41.135128021240234, "global_step": 198735, "epoch": 1642} {"train_loss": -41.7501335144043, "global_step": 198736, "epoch": 1642} {"train_loss": -41.425350189208984, "global_step": 198737, "epoch": 1642} {"train_loss": -40.98862838745117, "global_step": 198738, "epoch": 1642} {"train_loss": -40.613887786865234, "global_step": 198739, "epoch": 1642} {"train_loss": -42.0354118347168, "global_step": 198740, "epoch": 1642} {"train_loss": -41.10951232910156, "global_step": 198741, "epoch": 1642} {"train_loss": -39.998451232910156, "global_step": 198742, "epoch": 1642} {"train_loss": -40.884883880615234, "global_step": 198743, "epoch": 1642} {"train_loss": -41.313167572021484, "global_step": 198744, "epoch": 1642} {"train_loss": -41.0150146484375, "global_step": 198745, "epoch": 1642} {"train_loss": -41.09050750732422, "global_step": 198746, "epoch": 1642} {"train_loss": -40.955928802490234, "global_step": 198747, "epoch": 1642} {"train_loss": -41.18575668334961, "global_step": 198748, "epoch": 1642} {"train_loss": -41.70358657836914, "global_step": 198749, "epoch": 1642} {"train_loss": -41.06293869018555, "global_step": 198750, "epoch": 1642} {"train_loss": -40.767452239990234, "global_step": 198751, "epoch": 1642} {"train_loss": -41.9398078918457, "global_step": 198752, "epoch": 1642} {"train_loss": -41.21596908569336, "global_step": 198753, "epoch": 1642} {"train_loss": -38.684242248535156, "global_step": 198754, "epoch": 1642} {"train_loss": -41.34796142578125, "global_step": 198755, "epoch": 1642} {"train_loss": -40.49781036376953, "global_step": 198756, "epoch": 1642} {"train_loss": -41.5678596496582, "global_step": 198757, "epoch": 1642} {"train_loss": -40.70100784301758, "global_step": 198758, "epoch": 1642} {"train_loss": -40.647579193115234, "global_step": 198759, "epoch": 1642} {"train_loss": -41.15180969238281, "global_step": 198760, "epoch": 1642} {"train_loss": -39.6281852722168, "global_step": 198761, "epoch": 1642} {"train_loss": -38.20015335083008, "global_step": 198762, "epoch": 1642} {"train_loss": -38.13178634643555, "global_step": 198763, "epoch": 1642} {"train_loss": -40.7358512878418, "global_step": 198764, "epoch": 1642} {"train_loss": -35.433921813964844, "global_step": 198765, "epoch": 1642} {"train_loss": -41.6977653503418, "global_step": 198766, "epoch": 1642} {"train_loss": -41.7088737487793, "global_step": 198767, "epoch": 1642} {"train_loss": -41.34723663330078, "global_step": 198768, "epoch": 1642} {"train_loss": -41.57135009765625, "global_step": 198769, "epoch": 1642} {"train_loss": -39.559814453125, "global_step": 198770, "epoch": 1642} {"train_loss": -41.46982192993164, "global_step": 198771, "epoch": 1642} {"train_loss": -41.55453109741211, "global_step": 198772, "epoch": 1642} {"train_loss": -40.65076446533203, "global_step": 198773, "epoch": 1642} {"train_loss": -42.04151916503906, "global_step": 198774, "epoch": 1642} {"train_loss": -41.6543083190918, "global_step": 198775, "epoch": 1642} {"train_loss": -41.77813720703125, "global_step": 198776, "epoch": 1642} {"train_loss": -42.066036224365234, "global_step": 198777, "epoch": 1642} {"train_loss": -39.035919189453125, "global_step": 198778, "epoch": 1642} {"train_loss": -41.15157699584961, "global_step": 198779, "epoch": 1642} {"train_loss": -41.70347213745117, "global_step": 198780, "epoch": 1642} {"train_loss": -41.40510940551758, "global_step": 198781, "epoch": 1642} {"train_loss": -41.33414840698242, "global_step": 198782, "epoch": 1642} {"train_loss": -41.05683135986328, "global_step": 198783, "epoch": 1642} {"train_loss": -41.23020553588867, "global_step": 198784, "epoch": 1642} {"train_loss": -42.439476013183594, "global_step": 198785, "epoch": 1642} {"train_loss": -41.02106475830078, "global_step": 198786, "epoch": 1642} {"train_loss": -41.65290069580078, "global_step": 198787, "epoch": 1642} {"train_loss": -41.02117919921875, "global_step": 198788, "epoch": 1642} {"train_loss": -41.53184127807617, "global_step": 198789, "epoch": 1642} {"train_loss": -41.86479568481445, "global_step": 198790, "epoch": 1642} {"train_loss": -42.00159454345703, "global_step": 198791, "epoch": 1642} {"train_loss": -39.24842071533203, "global_step": 198792, "epoch": 1642} {"train_loss": -39.978702545166016, "global_step": 198793, "epoch": 1642} {"train_loss": -39.67212677001953, "global_step": 198794, "epoch": 1642} {"train_loss": -41.34577178955078, "global_step": 198795, "epoch": 1642} {"train_loss": -40.59148025512695, "global_step": 198796, "epoch": 1642} {"train_loss": -41.426029205322266, "global_step": 198797, "epoch": 1642} {"train_loss": -40.777870178222656, "global_step": 198798, "epoch": 1642} {"train_loss": -39.83448028564453, "global_step": 198799, "epoch": 1642} {"train_loss": -40.114498138427734, "global_step": 198800, "epoch": 1642} {"train_loss": -35.787200927734375, "global_step": 198801, "epoch": 1642} {"train_loss": -40.67265631935813, "global_step": 198802, "epoch": 1642, "val_loss": 2733213.25} {"train_loss": -40.9266471862793, "global_step": 198803, "epoch": 1643} {"train_loss": -40.749149322509766, "global_step": 198804, "epoch": 1643} {"train_loss": -39.490474700927734, "global_step": 198805, "epoch": 1643} {"train_loss": -41.51099395751953, "global_step": 198806, "epoch": 1643} {"train_loss": -40.918365478515625, "global_step": 198807, "epoch": 1643} {"train_loss": -40.267578125, "global_step": 198808, "epoch": 1643} {"train_loss": -38.78950119018555, "global_step": 198809, "epoch": 1643} {"train_loss": -37.79289627075195, "global_step": 198810, "epoch": 1643} {"train_loss": -39.49641036987305, "global_step": 198811, "epoch": 1643} {"train_loss": -40.08380889892578, "global_step": 198812, "epoch": 1643} {"train_loss": -39.95423889160156, "global_step": 198813, "epoch": 1643} {"train_loss": -40.794769287109375, "global_step": 198814, "epoch": 1643} {"train_loss": -39.87774658203125, "global_step": 198815, "epoch": 1643} {"train_loss": -40.46529006958008, "global_step": 198816, "epoch": 1643} {"train_loss": -39.87331008911133, "global_step": 198817, "epoch": 1643} {"train_loss": -40.084232330322266, "global_step": 198818, "epoch": 1643} {"train_loss": -41.4708251953125, "global_step": 198819, "epoch": 1643} {"train_loss": -40.31140899658203, "global_step": 198820, "epoch": 1643} {"train_loss": -41.25962448120117, "global_step": 198821, "epoch": 1643} {"train_loss": -41.69483184814453, "global_step": 198822, "epoch": 1643} {"train_loss": -40.83757781982422, "global_step": 198823, "epoch": 1643} {"train_loss": -41.549373626708984, "global_step": 198824, "epoch": 1643} {"train_loss": -40.914127349853516, "global_step": 198825, "epoch": 1643} {"train_loss": -41.98728561401367, "global_step": 198826, "epoch": 1643} {"train_loss": -40.23676681518555, "global_step": 198827, "epoch": 1643} {"train_loss": -41.12715530395508, "global_step": 198828, "epoch": 1643} {"train_loss": -41.200923919677734, "global_step": 198829, "epoch": 1643} {"train_loss": -41.953121185302734, "global_step": 198830, "epoch": 1643} {"train_loss": -41.73281478881836, "global_step": 198831, "epoch": 1643} {"train_loss": -40.93329620361328, "global_step": 198832, "epoch": 1643} {"train_loss": -41.63983917236328, "global_step": 198833, "epoch": 1643} {"train_loss": -41.72097396850586, "global_step": 198834, "epoch": 1643} {"train_loss": -41.85921859741211, "global_step": 198835, "epoch": 1643} {"train_loss": -41.61175537109375, "global_step": 198836, "epoch": 1643} {"train_loss": -42.28929901123047, "global_step": 198837, "epoch": 1643} {"train_loss": -40.67304611206055, "global_step": 198838, "epoch": 1643} {"train_loss": -41.19612503051758, "global_step": 198839, "epoch": 1643} {"train_loss": -40.2457275390625, "global_step": 198840, "epoch": 1643} {"train_loss": -41.05670166015625, "global_step": 198841, "epoch": 1643} {"train_loss": -39.48662185668945, "global_step": 198842, "epoch": 1643} {"train_loss": -41.12616729736328, "global_step": 198843, "epoch": 1643} {"train_loss": -40.99047088623047, "global_step": 198844, "epoch": 1643} {"train_loss": -41.87415313720703, "global_step": 198845, "epoch": 1643} {"train_loss": -40.80979537963867, "global_step": 198846, "epoch": 1643} {"train_loss": -41.695640563964844, "global_step": 198847, "epoch": 1643} {"train_loss": -40.51514434814453, "global_step": 198848, "epoch": 1643} {"train_loss": -41.31851577758789, "global_step": 198849, "epoch": 1643} {"train_loss": -39.08427810668945, "global_step": 198850, "epoch": 1643} {"train_loss": -37.98284149169922, "global_step": 198851, "epoch": 1643} {"train_loss": -38.65827941894531, "global_step": 198852, "epoch": 1643} {"train_loss": -36.93143844604492, "global_step": 198853, "epoch": 1643} {"train_loss": -33.7896728515625, "global_step": 198854, "epoch": 1643} {"train_loss": -35.98941421508789, "global_step": 198855, "epoch": 1643} {"train_loss": -40.042720794677734, "global_step": 198856, "epoch": 1643} {"train_loss": -35.04136276245117, "global_step": 198857, "epoch": 1643} {"train_loss": -38.5833854675293, "global_step": 198858, "epoch": 1643} {"train_loss": -39.99847412109375, "global_step": 198859, "epoch": 1643} {"train_loss": -37.44319152832031, "global_step": 198860, "epoch": 1643} {"train_loss": -40.89466094970703, "global_step": 198861, "epoch": 1643} {"train_loss": -39.90183639526367, "global_step": 198862, "epoch": 1643} {"train_loss": -39.479618072509766, "global_step": 198863, "epoch": 1643} {"train_loss": -40.439170837402344, "global_step": 198864, "epoch": 1643} {"train_loss": -40.11179733276367, "global_step": 198865, "epoch": 1643} {"train_loss": -39.67320251464844, "global_step": 198866, "epoch": 1643} {"train_loss": -38.89863204956055, "global_step": 198867, "epoch": 1643} {"train_loss": -39.45112228393555, "global_step": 198868, "epoch": 1643} {"train_loss": -38.045291900634766, "global_step": 198869, "epoch": 1643} {"train_loss": -38.7908935546875, "global_step": 198870, "epoch": 1643} {"train_loss": -40.3953971862793, "global_step": 198871, "epoch": 1643} {"train_loss": -40.52777099609375, "global_step": 198872, "epoch": 1643} {"train_loss": -39.449798583984375, "global_step": 198873, "epoch": 1643} {"train_loss": -39.026695251464844, "global_step": 198874, "epoch": 1643} {"train_loss": -25.89348793029785, "global_step": 198875, "epoch": 1643} {"train_loss": -34.5623893737793, "global_step": 198876, "epoch": 1643} {"train_loss": -36.489925384521484, "global_step": 198877, "epoch": 1643} {"train_loss": -37.38240432739258, "global_step": 198878, "epoch": 1643} {"train_loss": -39.17179870605469, "global_step": 198879, "epoch": 1643} {"train_loss": -39.18418502807617, "global_step": 198880, "epoch": 1643} {"train_loss": -39.315826416015625, "global_step": 198881, "epoch": 1643} {"train_loss": -35.25876235961914, "global_step": 198882, "epoch": 1643} {"train_loss": -38.71223068237305, "global_step": 198883, "epoch": 1643} {"train_loss": -38.37096405029297, "global_step": 198884, "epoch": 1643} {"train_loss": -30.46640968322754, "global_step": 198885, "epoch": 1643} {"train_loss": -38.183467864990234, "global_step": 198886, "epoch": 1643} {"train_loss": -36.06062698364258, "global_step": 198887, "epoch": 1643} {"train_loss": -35.16676712036133, "global_step": 198888, "epoch": 1643} {"train_loss": -39.4538459777832, "global_step": 198889, "epoch": 1643} {"train_loss": -37.27893829345703, "global_step": 198890, "epoch": 1643} {"train_loss": -38.79990768432617, "global_step": 198891, "epoch": 1643} {"train_loss": -37.44900131225586, "global_step": 198892, "epoch": 1643} {"train_loss": -38.05666732788086, "global_step": 198893, "epoch": 1643} {"train_loss": -35.70222854614258, "global_step": 198894, "epoch": 1643} {"train_loss": -39.35285949707031, "global_step": 198895, "epoch": 1643} {"train_loss": -39.01333236694336, "global_step": 198896, "epoch": 1643} {"train_loss": -40.309932708740234, "global_step": 198897, "epoch": 1643} {"train_loss": -38.738033294677734, "global_step": 198898, "epoch": 1643} {"train_loss": -38.51111602783203, "global_step": 198899, "epoch": 1643} {"train_loss": -38.19667434692383, "global_step": 198900, "epoch": 1643} {"train_loss": -39.966732025146484, "global_step": 198901, "epoch": 1643} {"train_loss": -38.001930236816406, "global_step": 198902, "epoch": 1643} {"train_loss": -38.189937591552734, "global_step": 198903, "epoch": 1643} {"train_loss": -39.03274154663086, "global_step": 198904, "epoch": 1643} {"train_loss": -40.11581039428711, "global_step": 198905, "epoch": 1643} {"train_loss": -39.929176330566406, "global_step": 198906, "epoch": 1643} {"train_loss": -40.21733474731445, "global_step": 198907, "epoch": 1643} {"train_loss": -39.195125579833984, "global_step": 198908, "epoch": 1643} {"train_loss": -39.47721862792969, "global_step": 198909, "epoch": 1643} {"train_loss": -39.776329040527344, "global_step": 198910, "epoch": 1643} {"train_loss": -40.060787200927734, "global_step": 198911, "epoch": 1643} {"train_loss": -39.87066650390625, "global_step": 198912, "epoch": 1643} {"train_loss": -37.77547836303711, "global_step": 198913, "epoch": 1643} {"train_loss": -40.493953704833984, "global_step": 198914, "epoch": 1643} {"train_loss": -40.10208511352539, "global_step": 198915, "epoch": 1643} {"train_loss": -40.000083923339844, "global_step": 198916, "epoch": 1643} {"train_loss": -40.05032730102539, "global_step": 198917, "epoch": 1643} {"train_loss": -40.43512725830078, "global_step": 198918, "epoch": 1643} {"train_loss": -39.78281784057617, "global_step": 198919, "epoch": 1643} {"train_loss": -41.08611297607422, "global_step": 198920, "epoch": 1643} {"train_loss": -40.76791000366211, "global_step": 198921, "epoch": 1643} {"train_loss": -38.49230194091797, "global_step": 198922, "epoch": 1643} {"train_loss": -39.37859413840554, "global_step": 198923, "epoch": 1643, "val_loss": 2585476.0} {"train_loss": -41.05449295043945, "global_step": 198924, "epoch": 1644} {"train_loss": -39.937496185302734, "global_step": 198925, "epoch": 1644} {"train_loss": -40.687801361083984, "global_step": 198926, "epoch": 1644} {"train_loss": -40.69026184082031, "global_step": 198927, "epoch": 1644} {"train_loss": -40.353546142578125, "global_step": 198928, "epoch": 1644} {"train_loss": -40.618568420410156, "global_step": 198929, "epoch": 1644} {"train_loss": -40.606075286865234, "global_step": 198930, "epoch": 1644} {"train_loss": -40.559303283691406, "global_step": 198931, "epoch": 1644} {"train_loss": -40.70451736450195, "global_step": 198932, "epoch": 1644} {"train_loss": -40.988590240478516, "global_step": 198933, "epoch": 1644} {"train_loss": -40.85310745239258, "global_step": 198934, "epoch": 1644} {"train_loss": -41.14284896850586, "global_step": 198935, "epoch": 1644} {"train_loss": -41.26899337768555, "global_step": 198936, "epoch": 1644} {"train_loss": -40.80382537841797, "global_step": 198937, "epoch": 1644} {"train_loss": -41.1822509765625, "global_step": 198938, "epoch": 1644} {"train_loss": -41.321041107177734, "global_step": 198939, "epoch": 1644} {"train_loss": -41.48416519165039, "global_step": 198940, "epoch": 1644} {"train_loss": -41.21810531616211, "global_step": 198941, "epoch": 1644} {"train_loss": -40.59257888793945, "global_step": 198942, "epoch": 1644} {"train_loss": -41.513607025146484, "global_step": 198943, "epoch": 1644} {"train_loss": -41.293270111083984, "global_step": 198944, "epoch": 1644} {"train_loss": -41.648006439208984, "global_step": 198945, "epoch": 1644} {"train_loss": -40.30240249633789, "global_step": 198946, "epoch": 1644} {"train_loss": -40.19170379638672, "global_step": 198947, "epoch": 1644} {"train_loss": -40.99189758300781, "global_step": 198948, "epoch": 1644} {"train_loss": -41.40070724487305, "global_step": 198949, "epoch": 1644} {"train_loss": -41.508724212646484, "global_step": 198950, "epoch": 1644} {"train_loss": -39.99821090698242, "global_step": 198951, "epoch": 1644} {"train_loss": -41.60532760620117, "global_step": 198952, "epoch": 1644} {"train_loss": -41.00873947143555, "global_step": 198953, "epoch": 1644} {"train_loss": -41.13978958129883, "global_step": 198954, "epoch": 1644} {"train_loss": -41.960235595703125, "global_step": 198955, "epoch": 1644} {"train_loss": -41.36652374267578, "global_step": 198956, "epoch": 1644} {"train_loss": -41.18647384643555, "global_step": 198957, "epoch": 1644} {"train_loss": -41.79884719848633, "global_step": 198958, "epoch": 1644} {"train_loss": -42.00056076049805, "global_step": 198959, "epoch": 1644} {"train_loss": -41.893550872802734, "global_step": 198960, "epoch": 1644} {"train_loss": -41.611122131347656, "global_step": 198961, "epoch": 1644} {"train_loss": -39.547672271728516, "global_step": 198962, "epoch": 1644} {"train_loss": -41.061492919921875, "global_step": 198963, "epoch": 1644} {"train_loss": -42.081851959228516, "global_step": 198964, "epoch": 1644} {"train_loss": -41.54909896850586, "global_step": 198965, "epoch": 1644} {"train_loss": -41.75511932373047, "global_step": 198966, "epoch": 1644} {"train_loss": -41.332759857177734, "global_step": 198967, "epoch": 1644} {"train_loss": -41.4697151184082, "global_step": 198968, "epoch": 1644} {"train_loss": -41.86719512939453, "global_step": 198969, "epoch": 1644} {"train_loss": -41.582881927490234, "global_step": 198970, "epoch": 1644} {"train_loss": -39.818824768066406, "global_step": 198971, "epoch": 1644} {"train_loss": -41.05680847167969, "global_step": 198972, "epoch": 1644} {"train_loss": -40.968772888183594, "global_step": 198973, "epoch": 1644} {"train_loss": -41.20524215698242, "global_step": 198974, "epoch": 1644} {"train_loss": -38.9223518371582, "global_step": 198975, "epoch": 1644} {"train_loss": -41.3979606628418, "global_step": 198976, "epoch": 1644} {"train_loss": -40.95520782470703, "global_step": 198977, "epoch": 1644} {"train_loss": -41.829078674316406, "global_step": 198978, "epoch": 1644} {"train_loss": -41.6713752746582, "global_step": 198979, "epoch": 1644} {"train_loss": -41.912994384765625, "global_step": 198980, "epoch": 1644} {"train_loss": -41.54432678222656, "global_step": 198981, "epoch": 1644} {"train_loss": -40.4854850769043, "global_step": 198982, "epoch": 1644} {"train_loss": -41.71718978881836, "global_step": 198983, "epoch": 1644} {"train_loss": -40.965518951416016, "global_step": 198984, "epoch": 1644} {"train_loss": -40.82466506958008, "global_step": 198985, "epoch": 1644} {"train_loss": -41.0875358581543, "global_step": 198986, "epoch": 1644} {"train_loss": -40.325984954833984, "global_step": 198987, "epoch": 1644} {"train_loss": -39.52227783203125, "global_step": 198988, "epoch": 1644} {"train_loss": -37.75532531738281, "global_step": 198989, "epoch": 1644} {"train_loss": -36.580867767333984, "global_step": 198990, "epoch": 1644} {"train_loss": -35.989501953125, "global_step": 198991, "epoch": 1644} {"train_loss": -40.187564849853516, "global_step": 198992, "epoch": 1644} {"train_loss": -39.80849838256836, "global_step": 198993, "epoch": 1644} {"train_loss": -33.875732421875, "global_step": 198994, "epoch": 1644} {"train_loss": -32.68537521362305, "global_step": 198995, "epoch": 1644} {"train_loss": -33.65108108520508, "global_step": 198996, "epoch": 1644} {"train_loss": -39.68628692626953, "global_step": 198997, "epoch": 1644} {"train_loss": -37.69759750366211, "global_step": 198998, "epoch": 1644} {"train_loss": -39.48081588745117, "global_step": 198999, "epoch": 1644} {"train_loss": -39.16802978515625, "global_step": 199000, "epoch": 1644} {"train_loss": -40.0487174987793, "global_step": 199001, "epoch": 1644} {"train_loss": -36.35282516479492, "global_step": 199002, "epoch": 1644} {"train_loss": -39.8311882019043, "global_step": 199003, "epoch": 1644} {"train_loss": -39.458839416503906, "global_step": 199004, "epoch": 1644} {"train_loss": -39.41123962402344, "global_step": 199005, "epoch": 1644} {"train_loss": -40.52741241455078, "global_step": 199006, "epoch": 1644} {"train_loss": -38.804412841796875, "global_step": 199007, "epoch": 1644} {"train_loss": -39.95663833618164, "global_step": 199008, "epoch": 1644} {"train_loss": -39.71920394897461, "global_step": 199009, "epoch": 1644} {"train_loss": -39.77126693725586, "global_step": 199010, "epoch": 1644} {"train_loss": -39.99620819091797, "global_step": 199011, "epoch": 1644} {"train_loss": -39.7552604675293, "global_step": 199012, "epoch": 1644} {"train_loss": -40.25248336791992, "global_step": 199013, "epoch": 1644} {"train_loss": -39.98402404785156, "global_step": 199014, "epoch": 1644} {"train_loss": -40.0411376953125, "global_step": 199015, "epoch": 1644} {"train_loss": -40.09450149536133, "global_step": 199016, "epoch": 1644} {"train_loss": -40.44593048095703, "global_step": 199017, "epoch": 1644} {"train_loss": -38.49540328979492, "global_step": 199018, "epoch": 1644} {"train_loss": -39.9386100769043, "global_step": 199019, "epoch": 1644} {"train_loss": -40.62627029418945, "global_step": 199020, "epoch": 1644} {"train_loss": -39.96228790283203, "global_step": 199021, "epoch": 1644} {"train_loss": -40.57778549194336, "global_step": 199022, "epoch": 1644} {"train_loss": -40.65513229370117, "global_step": 199023, "epoch": 1644} {"train_loss": -40.84119415283203, "global_step": 199024, "epoch": 1644} {"train_loss": -39.89140701293945, "global_step": 199025, "epoch": 1644} {"train_loss": -40.90047073364258, "global_step": 199026, "epoch": 1644} {"train_loss": -40.38872528076172, "global_step": 199027, "epoch": 1644} {"train_loss": -40.58869552612305, "global_step": 199028, "epoch": 1644} {"train_loss": -40.3177604675293, "global_step": 199029, "epoch": 1644} {"train_loss": -40.471588134765625, "global_step": 199030, "epoch": 1644} {"train_loss": -40.19256591796875, "global_step": 199031, "epoch": 1644} {"train_loss": -40.778987884521484, "global_step": 199032, "epoch": 1644} {"train_loss": -40.076297760009766, "global_step": 199033, "epoch": 1644} {"train_loss": -40.93105697631836, "global_step": 199034, "epoch": 1644} {"train_loss": -40.22975540161133, "global_step": 199035, "epoch": 1644} {"train_loss": -40.89905548095703, "global_step": 199036, "epoch": 1644} {"train_loss": -41.00429916381836, "global_step": 199037, "epoch": 1644} {"train_loss": -41.11151123046875, "global_step": 199038, "epoch": 1644} {"train_loss": -41.18070602416992, "global_step": 199039, "epoch": 1644} {"train_loss": -41.36797332763672, "global_step": 199040, "epoch": 1644} {"train_loss": -41.41162872314453, "global_step": 199041, "epoch": 1644} {"train_loss": -41.4893684387207, "global_step": 199042, "epoch": 1644} {"train_loss": -40.723690032958984, "global_step": 199043, "epoch": 1644} {"train_loss": -40.38042062176161, "global_step": 199044, "epoch": 1644, "val_loss": 2585608.75} {"train_loss": -41.34576416015625, "global_step": 199045, "epoch": 1645} {"train_loss": -41.41393280029297, "global_step": 199046, "epoch": 1645} {"train_loss": -41.23356246948242, "global_step": 199047, "epoch": 1645} {"train_loss": -41.072303771972656, "global_step": 199048, "epoch": 1645} {"train_loss": -41.769351959228516, "global_step": 199049, "epoch": 1645} {"train_loss": -41.33441162109375, "global_step": 199050, "epoch": 1645} {"train_loss": -41.40696334838867, "global_step": 199051, "epoch": 1645} {"train_loss": -41.14483642578125, "global_step": 199052, "epoch": 1645} {"train_loss": -41.72655487060547, "global_step": 199053, "epoch": 1645} {"train_loss": -41.346229553222656, "global_step": 199054, "epoch": 1645} {"train_loss": -41.42612838745117, "global_step": 199055, "epoch": 1645} {"train_loss": -41.07639694213867, "global_step": 199056, "epoch": 1645} {"train_loss": -41.64616775512695, "global_step": 199057, "epoch": 1645} {"train_loss": -41.282562255859375, "global_step": 199058, "epoch": 1645} {"train_loss": -40.942012786865234, "global_step": 199059, "epoch": 1645} {"train_loss": -41.44491195678711, "global_step": 199060, "epoch": 1645} {"train_loss": -41.24809646606445, "global_step": 199061, "epoch": 1645} {"train_loss": -41.61442947387695, "global_step": 199062, "epoch": 1645} {"train_loss": -41.7261848449707, "global_step": 199063, "epoch": 1645} {"train_loss": -41.406795501708984, "global_step": 199064, "epoch": 1645} {"train_loss": -41.56850814819336, "global_step": 199065, "epoch": 1645} {"train_loss": -41.55577850341797, "global_step": 199066, "epoch": 1645} {"train_loss": -40.749385833740234, "global_step": 199067, "epoch": 1645} {"train_loss": -40.927669525146484, "global_step": 199068, "epoch": 1645} {"train_loss": -41.42782211303711, "global_step": 199069, "epoch": 1645} {"train_loss": -41.45289993286133, "global_step": 199070, "epoch": 1645} {"train_loss": -41.880943298339844, "global_step": 199071, "epoch": 1645} {"train_loss": -41.37108612060547, "global_step": 199072, "epoch": 1645} {"train_loss": -41.703277587890625, "global_step": 199073, "epoch": 1645} {"train_loss": -41.421993255615234, "global_step": 199074, "epoch": 1645} {"train_loss": -40.703041076660156, "global_step": 199075, "epoch": 1645} {"train_loss": -39.30747604370117, "global_step": 199076, "epoch": 1645} {"train_loss": -38.83146667480469, "global_step": 199077, "epoch": 1645} {"train_loss": -39.83605194091797, "global_step": 199078, "epoch": 1645} {"train_loss": -41.33963394165039, "global_step": 199079, "epoch": 1645} {"train_loss": -41.73846435546875, "global_step": 199080, "epoch": 1645} {"train_loss": -42.45664596557617, "global_step": 199081, "epoch": 1645} {"train_loss": -41.18918991088867, "global_step": 199082, "epoch": 1645} {"train_loss": -40.828983306884766, "global_step": 199083, "epoch": 1645} {"train_loss": -40.089088439941406, "global_step": 199084, "epoch": 1645} {"train_loss": -38.85774612426758, "global_step": 199085, "epoch": 1645} {"train_loss": -40.75181198120117, "global_step": 199086, "epoch": 1645} {"train_loss": -41.56020736694336, "global_step": 199087, "epoch": 1645} {"train_loss": -39.900691986083984, "global_step": 199088, "epoch": 1645} {"train_loss": -39.21275329589844, "global_step": 199089, "epoch": 1645} {"train_loss": -38.89301681518555, "global_step": 199090, "epoch": 1645} {"train_loss": -39.605926513671875, "global_step": 199091, "epoch": 1645} {"train_loss": -41.227535247802734, "global_step": 199092, "epoch": 1645} {"train_loss": -40.31083679199219, "global_step": 199093, "epoch": 1645} {"train_loss": -41.00497055053711, "global_step": 199094, "epoch": 1645} {"train_loss": -40.64939498901367, "global_step": 199095, "epoch": 1645} {"train_loss": -40.953651428222656, "global_step": 199096, "epoch": 1645} {"train_loss": -40.7622184753418, "global_step": 199097, "epoch": 1645} {"train_loss": -40.45280838012695, "global_step": 199098, "epoch": 1645} {"train_loss": -41.443660736083984, "global_step": 199099, "epoch": 1645} {"train_loss": -40.71467971801758, "global_step": 199100, "epoch": 1645} {"train_loss": -41.410587310791016, "global_step": 199101, "epoch": 1645} {"train_loss": -41.288063049316406, "global_step": 199102, "epoch": 1645} {"train_loss": -41.22119140625, "global_step": 199103, "epoch": 1645} {"train_loss": -41.47817611694336, "global_step": 199104, "epoch": 1645} {"train_loss": -41.48684310913086, "global_step": 199105, "epoch": 1645} {"train_loss": -40.92508316040039, "global_step": 199106, "epoch": 1645} {"train_loss": -41.61920928955078, "global_step": 199107, "epoch": 1645} {"train_loss": -41.98160171508789, "global_step": 199108, "epoch": 1645} {"train_loss": -41.32859420776367, "global_step": 199109, "epoch": 1645} {"train_loss": -41.73810958862305, "global_step": 199110, "epoch": 1645} {"train_loss": -41.782981872558594, "global_step": 199111, "epoch": 1645} {"train_loss": -41.47341537475586, "global_step": 199112, "epoch": 1645} {"train_loss": -41.4508171081543, "global_step": 199113, "epoch": 1645} {"train_loss": -41.529151916503906, "global_step": 199114, "epoch": 1645} {"train_loss": -41.8558349609375, "global_step": 199115, "epoch": 1645} {"train_loss": -41.62582015991211, "global_step": 199116, "epoch": 1645} {"train_loss": -41.57867431640625, "global_step": 199117, "epoch": 1645} {"train_loss": -41.897377014160156, "global_step": 199118, "epoch": 1645} {"train_loss": -41.23875427246094, "global_step": 199119, "epoch": 1645} {"train_loss": -41.366268157958984, "global_step": 199120, "epoch": 1645} {"train_loss": -41.50803756713867, "global_step": 199121, "epoch": 1645} {"train_loss": -41.39124298095703, "global_step": 199122, "epoch": 1645} {"train_loss": -41.897918701171875, "global_step": 199123, "epoch": 1645} {"train_loss": -42.287349700927734, "global_step": 199124, "epoch": 1645} {"train_loss": -42.23481369018555, "global_step": 199125, "epoch": 1645} {"train_loss": -42.311927795410156, "global_step": 199126, "epoch": 1645} {"train_loss": -41.787654876708984, "global_step": 199127, "epoch": 1645} {"train_loss": -41.46786880493164, "global_step": 199128, "epoch": 1645} {"train_loss": -41.62849044799805, "global_step": 199129, "epoch": 1645} {"train_loss": -41.138370513916016, "global_step": 199130, "epoch": 1645} {"train_loss": -38.96038055419922, "global_step": 199131, "epoch": 1645} {"train_loss": -40.960205078125, "global_step": 199132, "epoch": 1645} {"train_loss": -39.94391632080078, "global_step": 199133, "epoch": 1645} {"train_loss": -40.21611404418945, "global_step": 199134, "epoch": 1645} {"train_loss": -38.42987823486328, "global_step": 199135, "epoch": 1645} {"train_loss": -39.201778411865234, "global_step": 199136, "epoch": 1645} {"train_loss": -40.199363708496094, "global_step": 199137, "epoch": 1645} {"train_loss": -39.151466369628906, "global_step": 199138, "epoch": 1645} {"train_loss": -39.29458236694336, "global_step": 199139, "epoch": 1645} {"train_loss": -40.65517044067383, "global_step": 199140, "epoch": 1645} {"train_loss": -39.0682258605957, "global_step": 199141, "epoch": 1645} {"train_loss": -40.02420425415039, "global_step": 199142, "epoch": 1645} {"train_loss": -41.35234451293945, "global_step": 199143, "epoch": 1645} {"train_loss": -41.25217819213867, "global_step": 199144, "epoch": 1645} {"train_loss": -40.74138259887695, "global_step": 199145, "epoch": 1645} {"train_loss": -39.59836959838867, "global_step": 199146, "epoch": 1645} {"train_loss": -41.0655517578125, "global_step": 199147, "epoch": 1645} {"train_loss": -41.18331527709961, "global_step": 199148, "epoch": 1645} {"train_loss": -40.952247619628906, "global_step": 199149, "epoch": 1645} {"train_loss": -40.9033317565918, "global_step": 199150, "epoch": 1645} {"train_loss": -41.84465408325195, "global_step": 199151, "epoch": 1645} {"train_loss": -41.408565521240234, "global_step": 199152, "epoch": 1645} {"train_loss": -41.42574691772461, "global_step": 199153, "epoch": 1645} {"train_loss": -41.96037673950195, "global_step": 199154, "epoch": 1645} {"train_loss": -41.89289093017578, "global_step": 199155, "epoch": 1645} {"train_loss": -41.84534454345703, "global_step": 199156, "epoch": 1645} {"train_loss": -40.808353424072266, "global_step": 199157, "epoch": 1645} {"train_loss": -42.33341598510742, "global_step": 199158, "epoch": 1645} {"train_loss": -41.58045196533203, "global_step": 199159, "epoch": 1645} {"train_loss": -41.70361328125, "global_step": 199160, "epoch": 1645} {"train_loss": -41.150146484375, "global_step": 199161, "epoch": 1645} {"train_loss": -41.54038619995117, "global_step": 199162, "epoch": 1645} {"train_loss": -41.16997146606445, "global_step": 199163, "epoch": 1645} {"train_loss": -41.64168930053711, "global_step": 199164, "epoch": 1645} {"train_loss": -41.07098281482035, "global_step": 199165, "epoch": 1645, "val_loss": 2666483.75} {"train_loss": -41.56280517578125, "global_step": 199166, "epoch": 1646} {"train_loss": -41.566402435302734, "global_step": 199167, "epoch": 1646} {"train_loss": -41.55122756958008, "global_step": 199168, "epoch": 1646} {"train_loss": -42.4155387878418, "global_step": 199169, "epoch": 1646} {"train_loss": -41.32908248901367, "global_step": 199170, "epoch": 1646} {"train_loss": -41.08506774902344, "global_step": 199171, "epoch": 1646} {"train_loss": -41.73573684692383, "global_step": 199172, "epoch": 1646} {"train_loss": -42.67708969116211, "global_step": 199173, "epoch": 1646} {"train_loss": -42.35469055175781, "global_step": 199174, "epoch": 1646} {"train_loss": -42.422462463378906, "global_step": 199175, "epoch": 1646} {"train_loss": -42.15195846557617, "global_step": 199176, "epoch": 1646} {"train_loss": -41.68396759033203, "global_step": 199177, "epoch": 1646} {"train_loss": -41.559417724609375, "global_step": 199178, "epoch": 1646} {"train_loss": -42.03047561645508, "global_step": 199179, "epoch": 1646} {"train_loss": -42.565486907958984, "global_step": 199180, "epoch": 1646} {"train_loss": -41.92722702026367, "global_step": 199181, "epoch": 1646} {"train_loss": -41.11579513549805, "global_step": 199182, "epoch": 1646} {"train_loss": -41.08566665649414, "global_step": 199183, "epoch": 1646} {"train_loss": -41.76478958129883, "global_step": 199184, "epoch": 1646} {"train_loss": -42.634193420410156, "global_step": 199185, "epoch": 1646} {"train_loss": -41.89121627807617, "global_step": 199186, "epoch": 1646} {"train_loss": -42.084320068359375, "global_step": 199187, "epoch": 1646} {"train_loss": -42.04148864746094, "global_step": 199188, "epoch": 1646} {"train_loss": -42.28010559082031, "global_step": 199189, "epoch": 1646} {"train_loss": -42.04800033569336, "global_step": 199190, "epoch": 1646} {"train_loss": -41.984561920166016, "global_step": 199191, "epoch": 1646} {"train_loss": -41.99951171875, "global_step": 199192, "epoch": 1646} {"train_loss": -42.08547592163086, "global_step": 199193, "epoch": 1646} {"train_loss": -41.59352493286133, "global_step": 199194, "epoch": 1646} {"train_loss": -41.835487365722656, "global_step": 199195, "epoch": 1646} {"train_loss": -40.9650993347168, "global_step": 199196, "epoch": 1646} {"train_loss": -40.8009033203125, "global_step": 199197, "epoch": 1646} {"train_loss": -41.916194915771484, "global_step": 199198, "epoch": 1646} {"train_loss": -40.48188781738281, "global_step": 199199, "epoch": 1646} {"train_loss": -37.340431213378906, "global_step": 199200, "epoch": 1646} {"train_loss": -38.05635070800781, "global_step": 199201, "epoch": 1646} {"train_loss": -39.263790130615234, "global_step": 199202, "epoch": 1646} {"train_loss": -39.217926025390625, "global_step": 199203, "epoch": 1646} {"train_loss": -39.83237838745117, "global_step": 199204, "epoch": 1646} {"train_loss": -38.31365966796875, "global_step": 199205, "epoch": 1646} {"train_loss": -38.492652893066406, "global_step": 199206, "epoch": 1646} {"train_loss": -38.360198974609375, "global_step": 199207, "epoch": 1646} {"train_loss": -40.052059173583984, "global_step": 199208, "epoch": 1646} {"train_loss": -40.15127182006836, "global_step": 199209, "epoch": 1646} {"train_loss": -40.409271240234375, "global_step": 199210, "epoch": 1646} {"train_loss": -40.373111724853516, "global_step": 199211, "epoch": 1646} {"train_loss": -41.11532211303711, "global_step": 199212, "epoch": 1646} {"train_loss": -41.37310791015625, "global_step": 199213, "epoch": 1646} {"train_loss": -40.6622200012207, "global_step": 199214, "epoch": 1646} {"train_loss": -40.38173294067383, "global_step": 199215, "epoch": 1646} {"train_loss": -40.42547607421875, "global_step": 199216, "epoch": 1646} {"train_loss": -40.41562271118164, "global_step": 199217, "epoch": 1646} {"train_loss": -37.67686462402344, "global_step": 199218, "epoch": 1646} {"train_loss": -41.56727981567383, "global_step": 199219, "epoch": 1646} {"train_loss": -40.81241989135742, "global_step": 199220, "epoch": 1646} {"train_loss": -41.04593276977539, "global_step": 199221, "epoch": 1646} {"train_loss": -37.46529006958008, "global_step": 199222, "epoch": 1646} {"train_loss": -41.011287689208984, "global_step": 199223, "epoch": 1646} {"train_loss": -41.0593147277832, "global_step": 199224, "epoch": 1646} {"train_loss": -40.910945892333984, "global_step": 199225, "epoch": 1646} {"train_loss": -41.33858871459961, "global_step": 199226, "epoch": 1646} {"train_loss": -38.48871994018555, "global_step": 199227, "epoch": 1646} {"train_loss": -40.73334884643555, "global_step": 199228, "epoch": 1646} {"train_loss": -39.081451416015625, "global_step": 199229, "epoch": 1646} {"train_loss": -40.65780258178711, "global_step": 199230, "epoch": 1646} {"train_loss": -39.43146514892578, "global_step": 199231, "epoch": 1646} {"train_loss": -40.29061508178711, "global_step": 199232, "epoch": 1646} {"train_loss": -40.679405212402344, "global_step": 199233, "epoch": 1646} {"train_loss": -40.58697509765625, "global_step": 199234, "epoch": 1646} {"train_loss": -40.788509368896484, "global_step": 199235, "epoch": 1646} {"train_loss": -41.10929489135742, "global_step": 199236, "epoch": 1646} {"train_loss": -40.74772262573242, "global_step": 199237, "epoch": 1646} {"train_loss": -40.37469482421875, "global_step": 199238, "epoch": 1646} {"train_loss": -39.65155029296875, "global_step": 199239, "epoch": 1646} {"train_loss": -40.257198333740234, "global_step": 199240, "epoch": 1646} {"train_loss": -39.802677154541016, "global_step": 199241, "epoch": 1646} {"train_loss": -37.008975982666016, "global_step": 199242, "epoch": 1646} {"train_loss": -39.7138557434082, "global_step": 199243, "epoch": 1646} {"train_loss": -40.54694747924805, "global_step": 199244, "epoch": 1646} {"train_loss": -39.091835021972656, "global_step": 199245, "epoch": 1646} {"train_loss": -39.99363327026367, "global_step": 199246, "epoch": 1646} {"train_loss": -41.45185470581055, "global_step": 199247, "epoch": 1646} {"train_loss": -40.23905944824219, "global_step": 199248, "epoch": 1646} {"train_loss": -40.85978317260742, "global_step": 199249, "epoch": 1646} {"train_loss": -40.98927688598633, "global_step": 199250, "epoch": 1646} {"train_loss": -40.56990051269531, "global_step": 199251, "epoch": 1646} {"train_loss": -40.401790618896484, "global_step": 199252, "epoch": 1646} {"train_loss": -39.15012741088867, "global_step": 199253, "epoch": 1646} {"train_loss": -37.45663070678711, "global_step": 199254, "epoch": 1646} {"train_loss": -40.316184997558594, "global_step": 199255, "epoch": 1646} {"train_loss": -41.15407180786133, "global_step": 199256, "epoch": 1646} {"train_loss": -41.390968322753906, "global_step": 199257, "epoch": 1646} {"train_loss": -41.17253875732422, "global_step": 199258, "epoch": 1646} {"train_loss": -40.003082275390625, "global_step": 199259, "epoch": 1646} {"train_loss": -39.702877044677734, "global_step": 199260, "epoch": 1646} {"train_loss": -37.404232025146484, "global_step": 199261, "epoch": 1646} {"train_loss": -40.78742218017578, "global_step": 199262, "epoch": 1646} {"train_loss": -39.56024169921875, "global_step": 199263, "epoch": 1646} {"train_loss": -40.379730224609375, "global_step": 199264, "epoch": 1646} {"train_loss": -41.24550247192383, "global_step": 199265, "epoch": 1646} {"train_loss": -33.83632278442383, "global_step": 199266, "epoch": 1646} {"train_loss": -37.33735275268555, "global_step": 199267, "epoch": 1646} {"train_loss": -41.15346908569336, "global_step": 199268, "epoch": 1646} {"train_loss": -36.98958206176758, "global_step": 199269, "epoch": 1646} {"train_loss": -39.77222442626953, "global_step": 199270, "epoch": 1646} {"train_loss": -37.86323165893555, "global_step": 199271, "epoch": 1646} {"train_loss": -40.45983123779297, "global_step": 199272, "epoch": 1646} {"train_loss": -39.23883819580078, "global_step": 199273, "epoch": 1646} {"train_loss": -41.10508346557617, "global_step": 199274, "epoch": 1646} {"train_loss": -39.692115783691406, "global_step": 199275, "epoch": 1646} {"train_loss": -41.08858108520508, "global_step": 199276, "epoch": 1646} {"train_loss": -38.23573684692383, "global_step": 199277, "epoch": 1646} {"train_loss": -38.90608596801758, "global_step": 199278, "epoch": 1646} {"train_loss": -41.148193359375, "global_step": 199279, "epoch": 1646} {"train_loss": -39.92080307006836, "global_step": 199280, "epoch": 1646} {"train_loss": -39.85169982910156, "global_step": 199281, "epoch": 1646} {"train_loss": -41.12844467163086, "global_step": 199282, "epoch": 1646} {"train_loss": -40.65914535522461, "global_step": 199283, "epoch": 1646} {"train_loss": -41.23952865600586, "global_step": 199284, "epoch": 1646} {"train_loss": -41.73653793334961, "global_step": 199285, "epoch": 1646} {"train_loss": -40.45405884419591, "global_step": 199286, "epoch": 1646, "val_loss": 2747693.0} {"train_loss": -41.60603332519531, "global_step": 199287, "epoch": 1647} {"train_loss": -40.02885055541992, "global_step": 199288, "epoch": 1647} {"train_loss": -40.3476676940918, "global_step": 199289, "epoch": 1647} {"train_loss": -39.86686706542969, "global_step": 199290, "epoch": 1647} {"train_loss": -36.24836730957031, "global_step": 199291, "epoch": 1647} {"train_loss": -41.60515213012695, "global_step": 199292, "epoch": 1647} {"train_loss": -42.07186508178711, "global_step": 199293, "epoch": 1647} {"train_loss": -38.84515380859375, "global_step": 199294, "epoch": 1647} {"train_loss": -37.252620697021484, "global_step": 199295, "epoch": 1647} {"train_loss": -38.7469482421875, "global_step": 199296, "epoch": 1647} {"train_loss": -40.18514633178711, "global_step": 199297, "epoch": 1647} {"train_loss": -40.84449768066406, "global_step": 199298, "epoch": 1647} {"train_loss": -40.99606704711914, "global_step": 199299, "epoch": 1647} {"train_loss": -40.672760009765625, "global_step": 199300, "epoch": 1647} {"train_loss": -40.2573356628418, "global_step": 199301, "epoch": 1647} {"train_loss": -40.764347076416016, "global_step": 199302, "epoch": 1647} {"train_loss": -39.767704010009766, "global_step": 199303, "epoch": 1647} {"train_loss": -40.7453498840332, "global_step": 199304, "epoch": 1647} {"train_loss": -39.795162200927734, "global_step": 199305, "epoch": 1647} {"train_loss": -41.068153381347656, "global_step": 199306, "epoch": 1647} {"train_loss": -39.494232177734375, "global_step": 199307, "epoch": 1647} {"train_loss": -40.10953903198242, "global_step": 199308, "epoch": 1647} {"train_loss": -40.8927116394043, "global_step": 199309, "epoch": 1647} {"train_loss": -41.321590423583984, "global_step": 199310, "epoch": 1647} {"train_loss": -41.53617477416992, "global_step": 199311, "epoch": 1647} {"train_loss": -41.56527328491211, "global_step": 199312, "epoch": 1647} {"train_loss": -41.23367691040039, "global_step": 199313, "epoch": 1647} {"train_loss": -41.27425765991211, "global_step": 199314, "epoch": 1647} {"train_loss": -41.4448356628418, "global_step": 199315, "epoch": 1647} {"train_loss": -40.91704177856445, "global_step": 199316, "epoch": 1647} {"train_loss": -41.404052734375, "global_step": 199317, "epoch": 1647} {"train_loss": -42.00495529174805, "global_step": 199318, "epoch": 1647} {"train_loss": -41.695167541503906, "global_step": 199319, "epoch": 1647} {"train_loss": -41.108924865722656, "global_step": 199320, "epoch": 1647} {"train_loss": -41.5965576171875, "global_step": 199321, "epoch": 1647} {"train_loss": -41.21027755737305, "global_step": 199322, "epoch": 1647} {"train_loss": -42.190120697021484, "global_step": 199323, "epoch": 1647} {"train_loss": -41.03932189941406, "global_step": 199324, "epoch": 1647} {"train_loss": -41.604496002197266, "global_step": 199325, "epoch": 1647} {"train_loss": -41.581642150878906, "global_step": 199326, "epoch": 1647} {"train_loss": -41.11116027832031, "global_step": 199327, "epoch": 1647} {"train_loss": -41.3043212890625, "global_step": 199328, "epoch": 1647} {"train_loss": -40.72148895263672, "global_step": 199329, "epoch": 1647} {"train_loss": -40.60670852661133, "global_step": 199330, "epoch": 1647} {"train_loss": -41.277313232421875, "global_step": 199331, "epoch": 1647} {"train_loss": -40.66538619995117, "global_step": 199332, "epoch": 1647} {"train_loss": -40.72858810424805, "global_step": 199333, "epoch": 1647} {"train_loss": -41.17605209350586, "global_step": 199334, "epoch": 1647} {"train_loss": -39.56248092651367, "global_step": 199335, "epoch": 1647} {"train_loss": -40.3795051574707, "global_step": 199336, "epoch": 1647} {"train_loss": -39.05771255493164, "global_step": 199337, "epoch": 1647} {"train_loss": -39.57965850830078, "global_step": 199338, "epoch": 1647} {"train_loss": -38.93085479736328, "global_step": 199339, "epoch": 1647} {"train_loss": -38.491668701171875, "global_step": 199340, "epoch": 1647} {"train_loss": -38.844078063964844, "global_step": 199341, "epoch": 1647} {"train_loss": -34.03270721435547, "global_step": 199342, "epoch": 1647} {"train_loss": -36.83060836791992, "global_step": 199343, "epoch": 1647} {"train_loss": -37.266082763671875, "global_step": 199344, "epoch": 1647} {"train_loss": -39.40317916870117, "global_step": 199345, "epoch": 1647} {"train_loss": -40.66886520385742, "global_step": 199346, "epoch": 1647} {"train_loss": -38.974609375, "global_step": 199347, "epoch": 1647} {"train_loss": -38.25627517700195, "global_step": 199348, "epoch": 1647} {"train_loss": -40.85853958129883, "global_step": 199349, "epoch": 1647} {"train_loss": -39.09449005126953, "global_step": 199350, "epoch": 1647} {"train_loss": -39.72671890258789, "global_step": 199351, "epoch": 1647} {"train_loss": -40.933956146240234, "global_step": 199352, "epoch": 1647} {"train_loss": -39.956695556640625, "global_step": 199353, "epoch": 1647} {"train_loss": -39.999427795410156, "global_step": 199354, "epoch": 1647} {"train_loss": -40.91309356689453, "global_step": 199355, "epoch": 1647} {"train_loss": -40.43789291381836, "global_step": 199356, "epoch": 1647} {"train_loss": -40.45425033569336, "global_step": 199357, "epoch": 1647} {"train_loss": -41.03561782836914, "global_step": 199358, "epoch": 1647} {"train_loss": -41.619293212890625, "global_step": 199359, "epoch": 1647} {"train_loss": -40.04025650024414, "global_step": 199360, "epoch": 1647} {"train_loss": -40.66642761230469, "global_step": 199361, "epoch": 1647} {"train_loss": -37.44041442871094, "global_step": 199362, "epoch": 1647} {"train_loss": -41.211669921875, "global_step": 199363, "epoch": 1647} {"train_loss": -38.98284912109375, "global_step": 199364, "epoch": 1647} {"train_loss": -41.08332443237305, "global_step": 199365, "epoch": 1647} {"train_loss": -41.68223190307617, "global_step": 199366, "epoch": 1647} {"train_loss": -41.3553581237793, "global_step": 199367, "epoch": 1647} {"train_loss": -39.28517150878906, "global_step": 199368, "epoch": 1647} {"train_loss": -40.59723663330078, "global_step": 199369, "epoch": 1647} {"train_loss": -41.4052848815918, "global_step": 199370, "epoch": 1647} {"train_loss": -41.70737838745117, "global_step": 199371, "epoch": 1647} {"train_loss": -41.04368209838867, "global_step": 199372, "epoch": 1647} {"train_loss": -40.97248077392578, "global_step": 199373, "epoch": 1647} {"train_loss": -41.158931732177734, "global_step": 199374, "epoch": 1647} {"train_loss": -41.6455192565918, "global_step": 199375, "epoch": 1647} {"train_loss": -41.537471771240234, "global_step": 199376, "epoch": 1647} {"train_loss": -40.18736267089844, "global_step": 199377, "epoch": 1647} {"train_loss": -41.59180450439453, "global_step": 199378, "epoch": 1647} {"train_loss": -40.77740478515625, "global_step": 199379, "epoch": 1647} {"train_loss": -41.02867126464844, "global_step": 199380, "epoch": 1647} {"train_loss": -41.654518127441406, "global_step": 199381, "epoch": 1647} {"train_loss": -41.2364616394043, "global_step": 199382, "epoch": 1647} {"train_loss": -41.708740234375, "global_step": 199383, "epoch": 1647} {"train_loss": -41.8133659362793, "global_step": 199384, "epoch": 1647} {"train_loss": -42.412837982177734, "global_step": 199385, "epoch": 1647} {"train_loss": -42.0207405090332, "global_step": 199386, "epoch": 1647} {"train_loss": -40.898712158203125, "global_step": 199387, "epoch": 1647} {"train_loss": -41.702735900878906, "global_step": 199388, "epoch": 1647} {"train_loss": -41.41913986206055, "global_step": 199389, "epoch": 1647} {"train_loss": -42.115386962890625, "global_step": 199390, "epoch": 1647} {"train_loss": -41.46159362792969, "global_step": 199391, "epoch": 1647} {"train_loss": -40.20050048828125, "global_step": 199392, "epoch": 1647} {"train_loss": -41.30601119995117, "global_step": 199393, "epoch": 1647} {"train_loss": -41.095436096191406, "global_step": 199394, "epoch": 1647} {"train_loss": -41.337825775146484, "global_step": 199395, "epoch": 1647} {"train_loss": -41.90518569946289, "global_step": 199396, "epoch": 1647} {"train_loss": -41.619930267333984, "global_step": 199397, "epoch": 1647} {"train_loss": -41.48373031616211, "global_step": 199398, "epoch": 1647} {"train_loss": -41.00844955444336, "global_step": 199399, "epoch": 1647} {"train_loss": -41.080596923828125, "global_step": 199400, "epoch": 1647} {"train_loss": -39.9099006652832, "global_step": 199401, "epoch": 1647} {"train_loss": -40.59621047973633, "global_step": 199402, "epoch": 1647} {"train_loss": -41.799564361572266, "global_step": 199403, "epoch": 1647} {"train_loss": -41.282012939453125, "global_step": 199404, "epoch": 1647} {"train_loss": -37.502010345458984, "global_step": 199405, "epoch": 1647} {"train_loss": -40.918251037597656, "global_step": 199406, "epoch": 1647} {"train_loss": -40.51771677821136, "global_step": 199407, "epoch": 1647, "val_loss": 2676731.0} {"train_loss": -41.194881439208984, "global_step": 199408, "epoch": 1648} {"train_loss": -39.65342330932617, "global_step": 199409, "epoch": 1648} {"train_loss": -40.63322067260742, "global_step": 199410, "epoch": 1648} {"train_loss": -41.0645866394043, "global_step": 199411, "epoch": 1648} {"train_loss": -41.52693557739258, "global_step": 199412, "epoch": 1648} {"train_loss": -40.99493408203125, "global_step": 199413, "epoch": 1648} {"train_loss": -39.76826858520508, "global_step": 199414, "epoch": 1648} {"train_loss": -41.05763244628906, "global_step": 199415, "epoch": 1648} {"train_loss": -41.64331817626953, "global_step": 199416, "epoch": 1648} {"train_loss": -37.77217483520508, "global_step": 199417, "epoch": 1648} {"train_loss": -40.57008743286133, "global_step": 199418, "epoch": 1648} {"train_loss": -40.23714828491211, "global_step": 199419, "epoch": 1648} {"train_loss": -36.96047592163086, "global_step": 199420, "epoch": 1648} {"train_loss": -36.594539642333984, "global_step": 199421, "epoch": 1648} {"train_loss": -39.24709701538086, "global_step": 199422, "epoch": 1648} {"train_loss": -37.19971466064453, "global_step": 199423, "epoch": 1648} {"train_loss": -39.93130874633789, "global_step": 199424, "epoch": 1648} {"train_loss": -40.00895309448242, "global_step": 199425, "epoch": 1648} {"train_loss": -40.81315231323242, "global_step": 199426, "epoch": 1648} {"train_loss": -39.87369155883789, "global_step": 199427, "epoch": 1648} {"train_loss": -39.02651596069336, "global_step": 199428, "epoch": 1648} {"train_loss": -40.22206115722656, "global_step": 199429, "epoch": 1648} {"train_loss": -37.24031066894531, "global_step": 199430, "epoch": 1648} {"train_loss": -39.0141716003418, "global_step": 199431, "epoch": 1648} {"train_loss": -39.40155029296875, "global_step": 199432, "epoch": 1648} {"train_loss": -38.70622253417969, "global_step": 199433, "epoch": 1648} {"train_loss": -37.86112594604492, "global_step": 199434, "epoch": 1648} {"train_loss": -38.517574310302734, "global_step": 199435, "epoch": 1648} {"train_loss": -39.95277404785156, "global_step": 199436, "epoch": 1648} {"train_loss": -37.3539924621582, "global_step": 199437, "epoch": 1648} {"train_loss": -40.5543327331543, "global_step": 199438, "epoch": 1648} {"train_loss": -39.50840759277344, "global_step": 199439, "epoch": 1648} {"train_loss": -39.55253601074219, "global_step": 199440, "epoch": 1648} {"train_loss": -39.09049987792969, "global_step": 199441, "epoch": 1648} {"train_loss": -37.9156494140625, "global_step": 199442, "epoch": 1648} {"train_loss": -40.20758056640625, "global_step": 199443, "epoch": 1648} {"train_loss": -38.02924346923828, "global_step": 199444, "epoch": 1648} {"train_loss": -37.921783447265625, "global_step": 199445, "epoch": 1648} {"train_loss": -35.950069427490234, "global_step": 199446, "epoch": 1648} {"train_loss": -39.721351623535156, "global_step": 199447, "epoch": 1648} {"train_loss": -38.623287200927734, "global_step": 199448, "epoch": 1648} {"train_loss": -38.34011459350586, "global_step": 199449, "epoch": 1648} {"train_loss": -40.34934616088867, "global_step": 199450, "epoch": 1648} {"train_loss": -39.25978469848633, "global_step": 199451, "epoch": 1648} {"train_loss": -39.912086486816406, "global_step": 199452, "epoch": 1648} {"train_loss": -39.41132736206055, "global_step": 199453, "epoch": 1648} {"train_loss": -40.539955139160156, "global_step": 199454, "epoch": 1648} {"train_loss": -40.72457504272461, "global_step": 199455, "epoch": 1648} {"train_loss": -39.97199630737305, "global_step": 199456, "epoch": 1648} {"train_loss": -41.21523666381836, "global_step": 199457, "epoch": 1648} {"train_loss": -38.21467590332031, "global_step": 199458, "epoch": 1648} {"train_loss": -39.59257888793945, "global_step": 199459, "epoch": 1648} {"train_loss": -40.709869384765625, "global_step": 199460, "epoch": 1648} {"train_loss": -40.857398986816406, "global_step": 199461, "epoch": 1648} {"train_loss": -40.29602813720703, "global_step": 199462, "epoch": 1648} {"train_loss": -40.56357955932617, "global_step": 199463, "epoch": 1648} {"train_loss": -39.5673828125, "global_step": 199464, "epoch": 1648} {"train_loss": -38.95305252075195, "global_step": 199465, "epoch": 1648} {"train_loss": -40.616329193115234, "global_step": 199466, "epoch": 1648} {"train_loss": -39.16207504272461, "global_step": 199467, "epoch": 1648} {"train_loss": -38.197566986083984, "global_step": 199468, "epoch": 1648} {"train_loss": -40.366119384765625, "global_step": 199469, "epoch": 1648} {"train_loss": -40.385005950927734, "global_step": 199470, "epoch": 1648} {"train_loss": -39.674072265625, "global_step": 199471, "epoch": 1648} {"train_loss": -40.5974235534668, "global_step": 199472, "epoch": 1648} {"train_loss": -39.90877914428711, "global_step": 199473, "epoch": 1648} {"train_loss": -41.22150421142578, "global_step": 199474, "epoch": 1648} {"train_loss": -40.076446533203125, "global_step": 199475, "epoch": 1648} {"train_loss": -41.17323684692383, "global_step": 199476, "epoch": 1648} {"train_loss": -40.74468994140625, "global_step": 199477, "epoch": 1648} {"train_loss": -40.47734832763672, "global_step": 199478, "epoch": 1648} {"train_loss": -40.997188568115234, "global_step": 199479, "epoch": 1648} {"train_loss": -40.838497161865234, "global_step": 199480, "epoch": 1648} {"train_loss": -40.72698974609375, "global_step": 199481, "epoch": 1648} {"train_loss": -40.50703048706055, "global_step": 199482, "epoch": 1648} {"train_loss": -40.737525939941406, "global_step": 199483, "epoch": 1648} {"train_loss": -40.70962142944336, "global_step": 199484, "epoch": 1648} {"train_loss": -40.1849479675293, "global_step": 199485, "epoch": 1648} {"train_loss": -41.47027587890625, "global_step": 199486, "epoch": 1648} {"train_loss": -41.304298400878906, "global_step": 199487, "epoch": 1648} {"train_loss": -41.30595779418945, "global_step": 199488, "epoch": 1648} {"train_loss": -41.155941009521484, "global_step": 199489, "epoch": 1648} {"train_loss": -40.35569381713867, "global_step": 199490, "epoch": 1648} {"train_loss": -39.9769287109375, "global_step": 199491, "epoch": 1648} {"train_loss": -40.82435989379883, "global_step": 199492, "epoch": 1648} {"train_loss": -41.11247634887695, "global_step": 199493, "epoch": 1648} {"train_loss": -41.44276809692383, "global_step": 199494, "epoch": 1648} {"train_loss": -41.13086700439453, "global_step": 199495, "epoch": 1648} {"train_loss": -41.0319709777832, "global_step": 199496, "epoch": 1648} {"train_loss": -42.0609245300293, "global_step": 199497, "epoch": 1648} {"train_loss": -40.381385803222656, "global_step": 199498, "epoch": 1648} {"train_loss": -41.36293029785156, "global_step": 199499, "epoch": 1648} {"train_loss": -41.39250183105469, "global_step": 199500, "epoch": 1648} {"train_loss": -40.920257568359375, "global_step": 199501, "epoch": 1648} {"train_loss": -40.083187103271484, "global_step": 199502, "epoch": 1648} {"train_loss": -40.454463958740234, "global_step": 199503, "epoch": 1648} {"train_loss": -41.09092330932617, "global_step": 199504, "epoch": 1648} {"train_loss": -40.88385009765625, "global_step": 199505, "epoch": 1648} {"train_loss": -41.31876754760742, "global_step": 199506, "epoch": 1648} {"train_loss": -39.842281341552734, "global_step": 199507, "epoch": 1648} {"train_loss": -41.68540954589844, "global_step": 199508, "epoch": 1648} {"train_loss": -41.46726989746094, "global_step": 199509, "epoch": 1648} {"train_loss": -41.01912307739258, "global_step": 199510, "epoch": 1648} {"train_loss": -41.40900802612305, "global_step": 199511, "epoch": 1648} {"train_loss": -41.759765625, "global_step": 199512, "epoch": 1648} {"train_loss": -41.762142181396484, "global_step": 199513, "epoch": 1648} {"train_loss": -41.57902145385742, "global_step": 199514, "epoch": 1648} {"train_loss": -41.91627502441406, "global_step": 199515, "epoch": 1648} {"train_loss": -41.079864501953125, "global_step": 199516, "epoch": 1648} {"train_loss": -39.23275375366211, "global_step": 199517, "epoch": 1648} {"train_loss": -40.72772979736328, "global_step": 199518, "epoch": 1648} {"train_loss": -39.75252151489258, "global_step": 199519, "epoch": 1648} {"train_loss": -41.013221740722656, "global_step": 199520, "epoch": 1648} {"train_loss": -40.6529541015625, "global_step": 199521, "epoch": 1648} {"train_loss": -41.14155197143555, "global_step": 199522, "epoch": 1648} {"train_loss": -41.38905715942383, "global_step": 199523, "epoch": 1648} {"train_loss": -40.447662353515625, "global_step": 199524, "epoch": 1648} {"train_loss": -39.73884201049805, "global_step": 199525, "epoch": 1648} {"train_loss": -40.463619232177734, "global_step": 199526, "epoch": 1648} {"train_loss": -40.861083984375, "global_step": 199527, "epoch": 1648} {"train_loss": -40.15187693824453, "global_step": 199528, "epoch": 1648, "val_loss": 2726490.25} {"train_loss": -41.539878845214844, "global_step": 199529, "epoch": 1649} {"train_loss": -40.209197998046875, "global_step": 199530, "epoch": 1649} {"train_loss": -35.48027420043945, "global_step": 199531, "epoch": 1649} {"train_loss": -40.94983673095703, "global_step": 199532, "epoch": 1649} {"train_loss": -41.901546478271484, "global_step": 199533, "epoch": 1649} {"train_loss": -40.70198059082031, "global_step": 199534, "epoch": 1649} {"train_loss": -38.535823822021484, "global_step": 199535, "epoch": 1649} {"train_loss": -39.06964874267578, "global_step": 199536, "epoch": 1649} {"train_loss": -40.62773513793945, "global_step": 199537, "epoch": 1649} {"train_loss": -41.543052673339844, "global_step": 199538, "epoch": 1649} {"train_loss": -39.011531829833984, "global_step": 199539, "epoch": 1649} {"train_loss": -41.278499603271484, "global_step": 199540, "epoch": 1649} {"train_loss": -41.13234329223633, "global_step": 199541, "epoch": 1649} {"train_loss": -39.98914337158203, "global_step": 199542, "epoch": 1649} {"train_loss": -40.54278564453125, "global_step": 199543, "epoch": 1649} {"train_loss": -39.24396896362305, "global_step": 199544, "epoch": 1649} {"train_loss": -40.77021026611328, "global_step": 199545, "epoch": 1649} {"train_loss": -41.0446662902832, "global_step": 199546, "epoch": 1649} {"train_loss": -41.074886322021484, "global_step": 199547, "epoch": 1649} {"train_loss": -39.445404052734375, "global_step": 199548, "epoch": 1649} {"train_loss": -38.568843841552734, "global_step": 199549, "epoch": 1649} {"train_loss": -39.00601577758789, "global_step": 199550, "epoch": 1649} {"train_loss": -38.04243087768555, "global_step": 199551, "epoch": 1649} {"train_loss": -38.82966232299805, "global_step": 199552, "epoch": 1649} {"train_loss": -37.11309051513672, "global_step": 199553, "epoch": 1649} {"train_loss": -34.891170501708984, "global_step": 199554, "epoch": 1649} {"train_loss": -37.22886276245117, "global_step": 199555, "epoch": 1649} {"train_loss": -37.615943908691406, "global_step": 199556, "epoch": 1649} {"train_loss": -38.34939956665039, "global_step": 199557, "epoch": 1649} {"train_loss": -38.57951736450195, "global_step": 199558, "epoch": 1649} {"train_loss": -36.19594955444336, "global_step": 199559, "epoch": 1649} {"train_loss": -38.88972854614258, "global_step": 199560, "epoch": 1649} {"train_loss": -39.017723083496094, "global_step": 199561, "epoch": 1649} {"train_loss": -38.29871368408203, "global_step": 199562, "epoch": 1649} {"train_loss": -34.952388763427734, "global_step": 199563, "epoch": 1649} {"train_loss": -40.07166290283203, "global_step": 199564, "epoch": 1649} {"train_loss": -37.897979736328125, "global_step": 199565, "epoch": 1649} {"train_loss": -38.10350799560547, "global_step": 199566, "epoch": 1649} {"train_loss": -39.09305953979492, "global_step": 199567, "epoch": 1649} {"train_loss": -37.6449089050293, "global_step": 199568, "epoch": 1649} {"train_loss": -39.82552719116211, "global_step": 199569, "epoch": 1649} {"train_loss": -36.46566390991211, "global_step": 199570, "epoch": 1649} {"train_loss": -38.2719841003418, "global_step": 199571, "epoch": 1649} {"train_loss": -40.07208251953125, "global_step": 199572, "epoch": 1649} {"train_loss": -36.81374740600586, "global_step": 199573, "epoch": 1649} {"train_loss": -40.09574508666992, "global_step": 199574, "epoch": 1649} {"train_loss": -38.60163116455078, "global_step": 199575, "epoch": 1649} {"train_loss": -38.957942962646484, "global_step": 199576, "epoch": 1649} {"train_loss": -38.648311614990234, "global_step": 199577, "epoch": 1649} {"train_loss": -38.68357849121094, "global_step": 199578, "epoch": 1649} {"train_loss": -39.734378814697266, "global_step": 199579, "epoch": 1649} {"train_loss": -38.30630111694336, "global_step": 199580, "epoch": 1649} {"train_loss": -40.70049285888672, "global_step": 199581, "epoch": 1649} {"train_loss": -39.19082260131836, "global_step": 199582, "epoch": 1649} {"train_loss": -40.720947265625, "global_step": 199583, "epoch": 1649} {"train_loss": -39.21940612792969, "global_step": 199584, "epoch": 1649} {"train_loss": -39.17118453979492, "global_step": 199585, "epoch": 1649} {"train_loss": -39.38995361328125, "global_step": 199586, "epoch": 1649} {"train_loss": -39.28636932373047, "global_step": 199587, "epoch": 1649} {"train_loss": -40.47251510620117, "global_step": 199588, "epoch": 1649} {"train_loss": -38.72544860839844, "global_step": 199589, "epoch": 1649} {"train_loss": -39.79576110839844, "global_step": 199590, "epoch": 1649} {"train_loss": -40.05515670776367, "global_step": 199591, "epoch": 1649} {"train_loss": -40.109962463378906, "global_step": 199592, "epoch": 1649} {"train_loss": -40.59901809692383, "global_step": 199593, "epoch": 1649} {"train_loss": -40.45576858520508, "global_step": 199594, "epoch": 1649} {"train_loss": -40.43722152709961, "global_step": 199595, "epoch": 1649} {"train_loss": -40.91480255126953, "global_step": 199596, "epoch": 1649} {"train_loss": -40.842342376708984, "global_step": 199597, "epoch": 1649} {"train_loss": -40.60603713989258, "global_step": 199598, "epoch": 1649} {"train_loss": -40.577247619628906, "global_step": 199599, "epoch": 1649} {"train_loss": -40.26395797729492, "global_step": 199600, "epoch": 1649} {"train_loss": -40.10360336303711, "global_step": 199601, "epoch": 1649} {"train_loss": -40.82178497314453, "global_step": 199602, "epoch": 1649} {"train_loss": -41.45149230957031, "global_step": 199603, "epoch": 1649} {"train_loss": -40.9060173034668, "global_step": 199604, "epoch": 1649} {"train_loss": -41.510406494140625, "global_step": 199605, "epoch": 1649} {"train_loss": -40.59212112426758, "global_step": 199606, "epoch": 1649} {"train_loss": -40.69106674194336, "global_step": 199607, "epoch": 1649} {"train_loss": -41.42311477661133, "global_step": 199608, "epoch": 1649} {"train_loss": -40.53514099121094, "global_step": 199609, "epoch": 1649} {"train_loss": -41.15216827392578, "global_step": 199610, "epoch": 1649} {"train_loss": -41.42529296875, "global_step": 199611, "epoch": 1649} {"train_loss": -40.36927032470703, "global_step": 199612, "epoch": 1649} {"train_loss": -41.0035514831543, "global_step": 199613, "epoch": 1649} {"train_loss": -40.61669158935547, "global_step": 199614, "epoch": 1649} {"train_loss": -41.540916442871094, "global_step": 199615, "epoch": 1649} {"train_loss": -41.57062530517578, "global_step": 199616, "epoch": 1649} {"train_loss": -40.88638687133789, "global_step": 199617, "epoch": 1649} {"train_loss": -41.71003341674805, "global_step": 199618, "epoch": 1649} {"train_loss": -40.94888687133789, "global_step": 199619, "epoch": 1649} {"train_loss": -40.779693603515625, "global_step": 199620, "epoch": 1649} {"train_loss": -42.07630920410156, "global_step": 199621, "epoch": 1649} {"train_loss": -41.29143142700195, "global_step": 199622, "epoch": 1649} {"train_loss": -41.615203857421875, "global_step": 199623, "epoch": 1649} {"train_loss": -41.43451690673828, "global_step": 199624, "epoch": 1649} {"train_loss": -41.46796798706055, "global_step": 199625, "epoch": 1649} {"train_loss": -41.26292037963867, "global_step": 199626, "epoch": 1649} {"train_loss": -41.714168548583984, "global_step": 199627, "epoch": 1649} {"train_loss": -41.22916030883789, "global_step": 199628, "epoch": 1649} {"train_loss": -40.80640411376953, "global_step": 199629, "epoch": 1649} {"train_loss": -40.57671356201172, "global_step": 199630, "epoch": 1649} {"train_loss": -41.74943542480469, "global_step": 199631, "epoch": 1649} {"train_loss": -41.712982177734375, "global_step": 199632, "epoch": 1649} {"train_loss": -42.18000411987305, "global_step": 199633, "epoch": 1649} {"train_loss": -41.08046340942383, "global_step": 199634, "epoch": 1649} {"train_loss": -39.05257797241211, "global_step": 199635, "epoch": 1649} {"train_loss": -40.86917495727539, "global_step": 199636, "epoch": 1649} {"train_loss": -42.106834411621094, "global_step": 199637, "epoch": 1649} {"train_loss": -40.155189514160156, "global_step": 199638, "epoch": 1649} {"train_loss": -41.618133544921875, "global_step": 199639, "epoch": 1649} {"train_loss": -42.24134063720703, "global_step": 199640, "epoch": 1649} {"train_loss": -41.68160629272461, "global_step": 199641, "epoch": 1649} {"train_loss": -41.21044158935547, "global_step": 199642, "epoch": 1649} {"train_loss": -42.21389389038086, "global_step": 199643, "epoch": 1649} {"train_loss": -41.52313232421875, "global_step": 199644, "epoch": 1649} {"train_loss": -41.082435607910156, "global_step": 199645, "epoch": 1649} {"train_loss": -41.69853973388672, "global_step": 199646, "epoch": 1649} {"train_loss": -41.69828414916992, "global_step": 199647, "epoch": 1649} {"train_loss": -41.67891311645508, "global_step": 199648, "epoch": 1649} {"train_loss": -40.07902974530685, "global_step": 199649, "epoch": 1649, "val_loss": 2597224.25} {"train_loss": -41.74158477783203, "global_step": 199650, "epoch": 1650} {"train_loss": -39.6309928894043, "global_step": 199651, "epoch": 1650} {"train_loss": -39.604183197021484, "global_step": 199652, "epoch": 1650} {"train_loss": -41.060646057128906, "global_step": 199653, "epoch": 1650} {"train_loss": -41.60111618041992, "global_step": 199654, "epoch": 1650} {"train_loss": -41.333770751953125, "global_step": 199655, "epoch": 1650} {"train_loss": -42.264461517333984, "global_step": 199656, "epoch": 1650} {"train_loss": -40.820308685302734, "global_step": 199657, "epoch": 1650} {"train_loss": -42.1592903137207, "global_step": 199658, "epoch": 1650} {"train_loss": -41.97665023803711, "global_step": 199659, "epoch": 1650} {"train_loss": -41.88512420654297, "global_step": 199660, "epoch": 1650} {"train_loss": -41.5998420715332, "global_step": 199661, "epoch": 1650} {"train_loss": -39.84635925292969, "global_step": 199662, "epoch": 1650} {"train_loss": -39.96217727661133, "global_step": 199663, "epoch": 1650} {"train_loss": -41.428829193115234, "global_step": 199664, "epoch": 1650} {"train_loss": -41.45933151245117, "global_step": 199665, "epoch": 1650} {"train_loss": -41.816932678222656, "global_step": 199666, "epoch": 1650} {"train_loss": -41.2241325378418, "global_step": 199667, "epoch": 1650} {"train_loss": -41.85318374633789, "global_step": 199668, "epoch": 1650} {"train_loss": -41.11172103881836, "global_step": 199669, "epoch": 1650} {"train_loss": -41.463478088378906, "global_step": 199670, "epoch": 1650} {"train_loss": -41.04138946533203, "global_step": 199671, "epoch": 1650} {"train_loss": -41.23681640625, "global_step": 199672, "epoch": 1650} {"train_loss": -39.83848190307617, "global_step": 199673, "epoch": 1650} {"train_loss": -40.0677604675293, "global_step": 199674, "epoch": 1650} {"train_loss": -41.52467727661133, "global_step": 199675, "epoch": 1650} {"train_loss": -41.445072174072266, "global_step": 199676, "epoch": 1650} {"train_loss": -38.51101303100586, "global_step": 199677, "epoch": 1650} {"train_loss": -41.73285675048828, "global_step": 199678, "epoch": 1650} {"train_loss": -41.23863983154297, "global_step": 199679, "epoch": 1650} {"train_loss": -42.2476806640625, "global_step": 199680, "epoch": 1650} {"train_loss": -41.83649826049805, "global_step": 199681, "epoch": 1650} {"train_loss": -39.13566207885742, "global_step": 199682, "epoch": 1650} {"train_loss": -41.4177360534668, "global_step": 199683, "epoch": 1650} {"train_loss": -40.50938034057617, "global_step": 199684, "epoch": 1650} {"train_loss": -40.08735275268555, "global_step": 199685, "epoch": 1650} {"train_loss": -41.3799934387207, "global_step": 199686, "epoch": 1650} {"train_loss": -41.10146713256836, "global_step": 199687, "epoch": 1650} {"train_loss": -40.462242126464844, "global_step": 199688, "epoch": 1650} {"train_loss": -40.28980255126953, "global_step": 199689, "epoch": 1650} {"train_loss": -39.4116325378418, "global_step": 199690, "epoch": 1650} {"train_loss": -38.41580581665039, "global_step": 199691, "epoch": 1650} {"train_loss": -40.722900390625, "global_step": 199692, "epoch": 1650} {"train_loss": -41.010799407958984, "global_step": 199693, "epoch": 1650} {"train_loss": -41.34522247314453, "global_step": 199694, "epoch": 1650} {"train_loss": -40.65581130981445, "global_step": 199695, "epoch": 1650} {"train_loss": -41.29054260253906, "global_step": 199696, "epoch": 1650} {"train_loss": -41.40627670288086, "global_step": 199697, "epoch": 1650} {"train_loss": -40.27546310424805, "global_step": 199698, "epoch": 1650} {"train_loss": -40.846351623535156, "global_step": 199699, "epoch": 1650} {"train_loss": -39.50494384765625, "global_step": 199700, "epoch": 1650} {"train_loss": -41.26163864135742, "global_step": 199701, "epoch": 1650} {"train_loss": -38.82571029663086, "global_step": 199702, "epoch": 1650} {"train_loss": -41.231040954589844, "global_step": 199703, "epoch": 1650} {"train_loss": -40.42771530151367, "global_step": 199704, "epoch": 1650} {"train_loss": -40.5880241394043, "global_step": 199705, "epoch": 1650} {"train_loss": -40.69225311279297, "global_step": 199706, "epoch": 1650} {"train_loss": -41.25396728515625, "global_step": 199707, "epoch": 1650} {"train_loss": -40.12174606323242, "global_step": 199708, "epoch": 1650} {"train_loss": -40.961647033691406, "global_step": 199709, "epoch": 1650} {"train_loss": -36.250911712646484, "global_step": 199710, "epoch": 1650} {"train_loss": -40.79484558105469, "global_step": 199711, "epoch": 1650} {"train_loss": -40.5483512878418, "global_step": 199712, "epoch": 1650} {"train_loss": -40.716529846191406, "global_step": 199713, "epoch": 1650} {"train_loss": -41.53959655761719, "global_step": 199714, "epoch": 1650} {"train_loss": -41.11469650268555, "global_step": 199715, "epoch": 1650} {"train_loss": -40.23798751831055, "global_step": 199716, "epoch": 1650} {"train_loss": -40.1622200012207, "global_step": 199717, "epoch": 1650} {"train_loss": -41.57621765136719, "global_step": 199718, "epoch": 1650} {"train_loss": -37.247703552246094, "global_step": 199719, "epoch": 1650} {"train_loss": -40.98688888549805, "global_step": 199720, "epoch": 1650} {"train_loss": -40.68417739868164, "global_step": 199721, "epoch": 1650} {"train_loss": -39.22811508178711, "global_step": 199722, "epoch": 1650} {"train_loss": -39.431884765625, "global_step": 199723, "epoch": 1650} {"train_loss": -40.1870231628418, "global_step": 199724, "epoch": 1650} {"train_loss": -40.959510803222656, "global_step": 199725, "epoch": 1650} {"train_loss": -36.04378890991211, "global_step": 199726, "epoch": 1650} {"train_loss": -40.673828125, "global_step": 199727, "epoch": 1650} {"train_loss": -40.317413330078125, "global_step": 199728, "epoch": 1650} {"train_loss": -39.52262496948242, "global_step": 199729, "epoch": 1650} {"train_loss": -41.438819885253906, "global_step": 199730, "epoch": 1650} {"train_loss": -39.7845344543457, "global_step": 199731, "epoch": 1650} {"train_loss": -40.20478057861328, "global_step": 199732, "epoch": 1650} {"train_loss": -39.652591705322266, "global_step": 199733, "epoch": 1650} {"train_loss": -40.02668380737305, "global_step": 199734, "epoch": 1650} {"train_loss": -39.96498489379883, "global_step": 199735, "epoch": 1650} {"train_loss": -40.61717224121094, "global_step": 199736, "epoch": 1650} {"train_loss": -39.76509094238281, "global_step": 199737, "epoch": 1650} {"train_loss": -40.03876495361328, "global_step": 199738, "epoch": 1650} {"train_loss": -39.7765998840332, "global_step": 199739, "epoch": 1650} {"train_loss": -40.53701400756836, "global_step": 199740, "epoch": 1650} {"train_loss": -40.6168212890625, "global_step": 199741, "epoch": 1650} {"train_loss": -40.686214447021484, "global_step": 199742, "epoch": 1650} {"train_loss": -40.86556625366211, "global_step": 199743, "epoch": 1650} {"train_loss": -39.10006332397461, "global_step": 199744, "epoch": 1650} {"train_loss": -41.00117111206055, "global_step": 199745, "epoch": 1650} {"train_loss": -41.246917724609375, "global_step": 199746, "epoch": 1650} {"train_loss": -40.34885787963867, "global_step": 199747, "epoch": 1650} {"train_loss": -41.12200927734375, "global_step": 199748, "epoch": 1650} {"train_loss": -41.33229446411133, "global_step": 199749, "epoch": 1650} {"train_loss": -41.22930145263672, "global_step": 199750, "epoch": 1650} {"train_loss": -41.55393600463867, "global_step": 199751, "epoch": 1650} {"train_loss": -39.522403717041016, "global_step": 199752, "epoch": 1650} {"train_loss": -41.187374114990234, "global_step": 199753, "epoch": 1650} {"train_loss": -41.14082717895508, "global_step": 199754, "epoch": 1650} {"train_loss": -40.76129913330078, "global_step": 199755, "epoch": 1650} {"train_loss": -41.54158020019531, "global_step": 199756, "epoch": 1650} {"train_loss": -40.31410217285156, "global_step": 199757, "epoch": 1650} {"train_loss": -40.58360290527344, "global_step": 199758, "epoch": 1650} {"train_loss": -39.63226318359375, "global_step": 199759, "epoch": 1650} {"train_loss": -42.02125930786133, "global_step": 199760, "epoch": 1650} {"train_loss": -41.354373931884766, "global_step": 199761, "epoch": 1650} {"train_loss": -40.47332000732422, "global_step": 199762, "epoch": 1650} {"train_loss": -42.00544357299805, "global_step": 199763, "epoch": 1650} {"train_loss": -41.456787109375, "global_step": 199764, "epoch": 1650} {"train_loss": -41.217891693115234, "global_step": 199765, "epoch": 1650} {"train_loss": -42.10772705078125, "global_step": 199766, "epoch": 1650} {"train_loss": -40.83103942871094, "global_step": 199767, "epoch": 1650} {"train_loss": -40.60761642456055, "global_step": 199768, "epoch": 1650} {"train_loss": -41.59370040893555, "global_step": 199769, "epoch": 1650} {"train_loss": -40.65966509984545, "global_step": 199770, "epoch": 1650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 0.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9090909090909091, "val_loss": 2625393.75} {"train_loss": -41.361114501953125, "global_step": 199771, "epoch": 1651} {"train_loss": -40.97948455810547, "global_step": 199772, "epoch": 1651} {"train_loss": -40.95697021484375, "global_step": 199773, "epoch": 1651} {"train_loss": -40.059364318847656, "global_step": 199774, "epoch": 1651} {"train_loss": -41.1630744934082, "global_step": 199775, "epoch": 1651} {"train_loss": -39.14287185668945, "global_step": 199776, "epoch": 1651} {"train_loss": -40.434932708740234, "global_step": 199777, "epoch": 1651} {"train_loss": -41.23198318481445, "global_step": 199778, "epoch": 1651} {"train_loss": -39.69811248779297, "global_step": 199779, "epoch": 1651} {"train_loss": -40.8953971862793, "global_step": 199780, "epoch": 1651} {"train_loss": -42.17142868041992, "global_step": 199781, "epoch": 1651} {"train_loss": -40.10581588745117, "global_step": 199782, "epoch": 1651} {"train_loss": -40.51780700683594, "global_step": 199783, "epoch": 1651} {"train_loss": -38.974117279052734, "global_step": 199784, "epoch": 1651} {"train_loss": -40.743892669677734, "global_step": 199785, "epoch": 1651} {"train_loss": -41.42694091796875, "global_step": 199786, "epoch": 1651} {"train_loss": -39.85797119140625, "global_step": 199787, "epoch": 1651} {"train_loss": -40.104679107666016, "global_step": 199788, "epoch": 1651} {"train_loss": -37.0679931640625, "global_step": 199789, "epoch": 1651} {"train_loss": -30.02579116821289, "global_step": 199790, "epoch": 1651} {"train_loss": -37.26470184326172, "global_step": 199791, "epoch": 1651} {"train_loss": -39.86306381225586, "global_step": 199792, "epoch": 1651} {"train_loss": -39.96590805053711, "global_step": 199793, "epoch": 1651} {"train_loss": -39.054901123046875, "global_step": 199794, "epoch": 1651} {"train_loss": -40.01637649536133, "global_step": 199795, "epoch": 1651} {"train_loss": -40.337310791015625, "global_step": 199796, "epoch": 1651} {"train_loss": -40.90068435668945, "global_step": 199797, "epoch": 1651} {"train_loss": -39.700408935546875, "global_step": 199798, "epoch": 1651} {"train_loss": -40.20675277709961, "global_step": 199799, "epoch": 1651} {"train_loss": -40.397193908691406, "global_step": 199800, "epoch": 1651} {"train_loss": -39.475372314453125, "global_step": 199801, "epoch": 1651} {"train_loss": -35.62220001220703, "global_step": 199802, "epoch": 1651} {"train_loss": -40.79662322998047, "global_step": 199803, "epoch": 1651} {"train_loss": -40.25318145751953, "global_step": 199804, "epoch": 1651} {"train_loss": -40.53046798706055, "global_step": 199805, "epoch": 1651} {"train_loss": -40.46833419799805, "global_step": 199806, "epoch": 1651} {"train_loss": -40.48629379272461, "global_step": 199807, "epoch": 1651} {"train_loss": -41.02651596069336, "global_step": 199808, "epoch": 1651} {"train_loss": -40.94562530517578, "global_step": 199809, "epoch": 1651} {"train_loss": -40.480567932128906, "global_step": 199810, "epoch": 1651} {"train_loss": -39.11684799194336, "global_step": 199811, "epoch": 1651} {"train_loss": -40.6646614074707, "global_step": 199812, "epoch": 1651} {"train_loss": -41.132904052734375, "global_step": 199813, "epoch": 1651} {"train_loss": -39.40534210205078, "global_step": 199814, "epoch": 1651} {"train_loss": -40.936370849609375, "global_step": 199815, "epoch": 1651} {"train_loss": -41.1143798828125, "global_step": 199816, "epoch": 1651} {"train_loss": -41.280738830566406, "global_step": 199817, "epoch": 1651} {"train_loss": -40.846595764160156, "global_step": 199818, "epoch": 1651} {"train_loss": -41.33437728881836, "global_step": 199819, "epoch": 1651} {"train_loss": -41.48802947998047, "global_step": 199820, "epoch": 1651} {"train_loss": -40.958683013916016, "global_step": 199821, "epoch": 1651} {"train_loss": -40.950374603271484, "global_step": 199822, "epoch": 1651} {"train_loss": -40.813232421875, "global_step": 199823, "epoch": 1651} {"train_loss": -40.909889221191406, "global_step": 199824, "epoch": 1651} {"train_loss": -38.01107406616211, "global_step": 199825, "epoch": 1651} {"train_loss": -41.22702407836914, "global_step": 199826, "epoch": 1651} {"train_loss": -36.58687210083008, "global_step": 199827, "epoch": 1651} {"train_loss": -41.954383850097656, "global_step": 199828, "epoch": 1651} {"train_loss": -42.209739685058594, "global_step": 199829, "epoch": 1651} {"train_loss": -40.60768508911133, "global_step": 199830, "epoch": 1651} {"train_loss": -41.95267868041992, "global_step": 199831, "epoch": 1651} {"train_loss": -38.948360443115234, "global_step": 199832, "epoch": 1651} {"train_loss": -40.85068130493164, "global_step": 199833, "epoch": 1651} {"train_loss": -41.279293060302734, "global_step": 199834, "epoch": 1651} {"train_loss": -40.94472122192383, "global_step": 199835, "epoch": 1651} {"train_loss": -40.68235778808594, "global_step": 199836, "epoch": 1651} {"train_loss": -41.19527053833008, "global_step": 199837, "epoch": 1651} {"train_loss": -42.19297409057617, "global_step": 199838, "epoch": 1651} {"train_loss": -41.62118911743164, "global_step": 199839, "epoch": 1651} {"train_loss": -41.39056396484375, "global_step": 199840, "epoch": 1651} {"train_loss": -40.723724365234375, "global_step": 199841, "epoch": 1651} {"train_loss": -41.22248840332031, "global_step": 199842, "epoch": 1651} {"train_loss": -41.854671478271484, "global_step": 199843, "epoch": 1651} {"train_loss": -42.123619079589844, "global_step": 199844, "epoch": 1651} {"train_loss": -42.051856994628906, "global_step": 199845, "epoch": 1651} {"train_loss": -41.58155822753906, "global_step": 199846, "epoch": 1651} {"train_loss": -41.8201904296875, "global_step": 199847, "epoch": 1651} {"train_loss": -42.17495346069336, "global_step": 199848, "epoch": 1651} {"train_loss": -42.05225372314453, "global_step": 199849, "epoch": 1651} {"train_loss": -42.21052551269531, "global_step": 199850, "epoch": 1651} {"train_loss": -42.5847282409668, "global_step": 199851, "epoch": 1651} {"train_loss": -41.660682678222656, "global_step": 199852, "epoch": 1651} {"train_loss": -42.15547561645508, "global_step": 199853, "epoch": 1651} {"train_loss": -41.62370300292969, "global_step": 199854, "epoch": 1651} {"train_loss": -41.7310791015625, "global_step": 199855, "epoch": 1651} {"train_loss": -41.28499221801758, "global_step": 199856, "epoch": 1651} {"train_loss": -42.039833068847656, "global_step": 199857, "epoch": 1651} {"train_loss": -40.411521911621094, "global_step": 199858, "epoch": 1651} {"train_loss": -41.458656311035156, "global_step": 199859, "epoch": 1651} {"train_loss": -40.27022171020508, "global_step": 199860, "epoch": 1651} {"train_loss": -41.958892822265625, "global_step": 199861, "epoch": 1651} {"train_loss": -40.208683013916016, "global_step": 199862, "epoch": 1651} {"train_loss": -40.89466094970703, "global_step": 199863, "epoch": 1651} {"train_loss": -41.3321647644043, "global_step": 199864, "epoch": 1651} {"train_loss": -41.467010498046875, "global_step": 199865, "epoch": 1651} {"train_loss": -41.685813903808594, "global_step": 199866, "epoch": 1651} {"train_loss": -41.331153869628906, "global_step": 199867, "epoch": 1651} {"train_loss": -41.77256393432617, "global_step": 199868, "epoch": 1651} {"train_loss": -41.6979866027832, "global_step": 199869, "epoch": 1651} {"train_loss": -41.88706588745117, "global_step": 199870, "epoch": 1651} {"train_loss": -41.24662399291992, "global_step": 199871, "epoch": 1651} {"train_loss": -41.70913314819336, "global_step": 199872, "epoch": 1651} {"train_loss": -41.01648712158203, "global_step": 199873, "epoch": 1651} {"train_loss": -41.81062316894531, "global_step": 199874, "epoch": 1651} {"train_loss": -39.622352600097656, "global_step": 199875, "epoch": 1651} {"train_loss": -41.37681198120117, "global_step": 199876, "epoch": 1651} {"train_loss": -36.749610900878906, "global_step": 199877, "epoch": 1651} {"train_loss": -40.867706298828125, "global_step": 199878, "epoch": 1651} {"train_loss": -40.55287551879883, "global_step": 199879, "epoch": 1651} {"train_loss": -41.62166976928711, "global_step": 199880, "epoch": 1651} {"train_loss": -39.023929595947266, "global_step": 199881, "epoch": 1651} {"train_loss": -40.134971618652344, "global_step": 199882, "epoch": 1651} {"train_loss": -40.52523422241211, "global_step": 199883, "epoch": 1651} {"train_loss": -40.33370590209961, "global_step": 199884, "epoch": 1651} {"train_loss": -40.15645217895508, "global_step": 199885, "epoch": 1651} {"train_loss": -41.49978256225586, "global_step": 199886, "epoch": 1651} {"train_loss": -40.9607048034668, "global_step": 199887, "epoch": 1651} {"train_loss": -41.00461959838867, "global_step": 199888, "epoch": 1651} {"train_loss": -41.81632614135742, "global_step": 199889, "epoch": 1651} {"train_loss": -41.17371368408203, "global_step": 199890, "epoch": 1651} {"train_loss": -40.65266175703569, "global_step": 199891, "epoch": 1651, "val_loss": 2646794.75} {"train_loss": -41.15102005004883, "global_step": 199892, "epoch": 1652} {"train_loss": -41.29975509643555, "global_step": 199893, "epoch": 1652} {"train_loss": -41.311580657958984, "global_step": 199894, "epoch": 1652} {"train_loss": -40.545310974121094, "global_step": 199895, "epoch": 1652} {"train_loss": -41.226470947265625, "global_step": 199896, "epoch": 1652} {"train_loss": -41.11222839355469, "global_step": 199897, "epoch": 1652} {"train_loss": -40.92392349243164, "global_step": 199898, "epoch": 1652} {"train_loss": -41.7736930847168, "global_step": 199899, "epoch": 1652} {"train_loss": -41.15283203125, "global_step": 199900, "epoch": 1652} {"train_loss": -41.10811996459961, "global_step": 199901, "epoch": 1652} {"train_loss": -41.83595657348633, "global_step": 199902, "epoch": 1652} {"train_loss": -41.62779998779297, "global_step": 199903, "epoch": 1652} {"train_loss": -42.01424789428711, "global_step": 199904, "epoch": 1652} {"train_loss": -41.73462677001953, "global_step": 199905, "epoch": 1652} {"train_loss": -40.96018600463867, "global_step": 199906, "epoch": 1652} {"train_loss": -41.944149017333984, "global_step": 199907, "epoch": 1652} {"train_loss": -41.48868942260742, "global_step": 199908, "epoch": 1652} {"train_loss": -41.62012481689453, "global_step": 199909, "epoch": 1652} {"train_loss": -41.20363235473633, "global_step": 199910, "epoch": 1652} {"train_loss": -41.514122009277344, "global_step": 199911, "epoch": 1652} {"train_loss": -41.94633483886719, "global_step": 199912, "epoch": 1652} {"train_loss": -41.72299575805664, "global_step": 199913, "epoch": 1652} {"train_loss": -40.81722640991211, "global_step": 199914, "epoch": 1652} {"train_loss": -41.04233932495117, "global_step": 199915, "epoch": 1652} {"train_loss": -40.61939239501953, "global_step": 199916, "epoch": 1652} {"train_loss": -41.25020980834961, "global_step": 199917, "epoch": 1652} {"train_loss": -40.49906921386719, "global_step": 199918, "epoch": 1652} {"train_loss": -40.13802719116211, "global_step": 199919, "epoch": 1652} {"train_loss": -40.81428527832031, "global_step": 199920, "epoch": 1652} {"train_loss": -41.5654411315918, "global_step": 199921, "epoch": 1652} {"train_loss": -40.53965377807617, "global_step": 199922, "epoch": 1652} {"train_loss": -37.1423454284668, "global_step": 199923, "epoch": 1652} {"train_loss": -34.386653900146484, "global_step": 199924, "epoch": 1652} {"train_loss": -37.07228469848633, "global_step": 199925, "epoch": 1652} {"train_loss": -41.6122932434082, "global_step": 199926, "epoch": 1652} {"train_loss": -39.558589935302734, "global_step": 199927, "epoch": 1652} {"train_loss": -39.682899475097656, "global_step": 199928, "epoch": 1652} {"train_loss": -39.75999069213867, "global_step": 199929, "epoch": 1652} {"train_loss": -40.634979248046875, "global_step": 199930, "epoch": 1652} {"train_loss": -39.56683349609375, "global_step": 199931, "epoch": 1652} {"train_loss": -40.07082748413086, "global_step": 199932, "epoch": 1652} {"train_loss": -40.487728118896484, "global_step": 199933, "epoch": 1652} {"train_loss": -39.87321090698242, "global_step": 199934, "epoch": 1652} {"train_loss": -40.27956771850586, "global_step": 199935, "epoch": 1652} {"train_loss": -40.72135543823242, "global_step": 199936, "epoch": 1652} {"train_loss": -42.0506706237793, "global_step": 199937, "epoch": 1652} {"train_loss": -40.42851257324219, "global_step": 199938, "epoch": 1652} {"train_loss": -40.50202178955078, "global_step": 199939, "epoch": 1652} {"train_loss": -40.65739822387695, "global_step": 199940, "epoch": 1652} {"train_loss": -40.66306686401367, "global_step": 199941, "epoch": 1652} {"train_loss": -41.46160888671875, "global_step": 199942, "epoch": 1652} {"train_loss": -40.420440673828125, "global_step": 199943, "epoch": 1652} {"train_loss": -41.454978942871094, "global_step": 199944, "epoch": 1652} {"train_loss": -40.89817810058594, "global_step": 199945, "epoch": 1652} {"train_loss": -40.01578903198242, "global_step": 199946, "epoch": 1652} {"train_loss": -41.0189094543457, "global_step": 199947, "epoch": 1652} {"train_loss": -41.215362548828125, "global_step": 199948, "epoch": 1652} {"train_loss": -41.263912200927734, "global_step": 199949, "epoch": 1652} {"train_loss": -40.89080810546875, "global_step": 199950, "epoch": 1652} {"train_loss": -40.75311279296875, "global_step": 199951, "epoch": 1652} {"train_loss": -41.51011276245117, "global_step": 199952, "epoch": 1652} {"train_loss": -41.5208625793457, "global_step": 199953, "epoch": 1652} {"train_loss": -40.992218017578125, "global_step": 199954, "epoch": 1652} {"train_loss": -41.25086212158203, "global_step": 199955, "epoch": 1652} {"train_loss": -39.2869873046875, "global_step": 199956, "epoch": 1652} {"train_loss": -39.77653121948242, "global_step": 199957, "epoch": 1652} {"train_loss": -40.0017204284668, "global_step": 199958, "epoch": 1652} {"train_loss": -41.59157180786133, "global_step": 199959, "epoch": 1652} {"train_loss": -40.92045211791992, "global_step": 199960, "epoch": 1652} {"train_loss": -37.99007797241211, "global_step": 199961, "epoch": 1652} {"train_loss": -41.384822845458984, "global_step": 199962, "epoch": 1652} {"train_loss": -40.44907760620117, "global_step": 199963, "epoch": 1652} {"train_loss": -38.457523345947266, "global_step": 199964, "epoch": 1652} {"train_loss": -36.61769485473633, "global_step": 199965, "epoch": 1652} {"train_loss": -39.953407287597656, "global_step": 199966, "epoch": 1652} {"train_loss": -40.191497802734375, "global_step": 199967, "epoch": 1652} {"train_loss": -39.15843963623047, "global_step": 199968, "epoch": 1652} {"train_loss": -40.815059661865234, "global_step": 199969, "epoch": 1652} {"train_loss": -40.305206298828125, "global_step": 199970, "epoch": 1652} {"train_loss": -38.05070495605469, "global_step": 199971, "epoch": 1652} {"train_loss": -40.70151901245117, "global_step": 199972, "epoch": 1652} {"train_loss": -40.452423095703125, "global_step": 199973, "epoch": 1652} {"train_loss": -41.452423095703125, "global_step": 199974, "epoch": 1652} {"train_loss": -41.42005920410156, "global_step": 199975, "epoch": 1652} {"train_loss": -40.3582763671875, "global_step": 199976, "epoch": 1652} {"train_loss": -40.50836944580078, "global_step": 199977, "epoch": 1652} {"train_loss": -41.02620315551758, "global_step": 199978, "epoch": 1652} {"train_loss": -41.222408294677734, "global_step": 199979, "epoch": 1652} {"train_loss": -40.78654098510742, "global_step": 199980, "epoch": 1652} {"train_loss": -41.66022872924805, "global_step": 199981, "epoch": 1652} {"train_loss": -41.20349884033203, "global_step": 199982, "epoch": 1652} {"train_loss": -41.958160400390625, "global_step": 199983, "epoch": 1652} {"train_loss": -41.03741455078125, "global_step": 199984, "epoch": 1652} {"train_loss": -41.85224914550781, "global_step": 199985, "epoch": 1652} {"train_loss": -40.657806396484375, "global_step": 199986, "epoch": 1652} {"train_loss": -41.867733001708984, "global_step": 199987, "epoch": 1652} {"train_loss": -41.93170166015625, "global_step": 199988, "epoch": 1652} {"train_loss": -41.969669342041016, "global_step": 199989, "epoch": 1652} {"train_loss": -41.91196823120117, "global_step": 199990, "epoch": 1652} {"train_loss": -41.96326446533203, "global_step": 199991, "epoch": 1652} {"train_loss": -40.934322357177734, "global_step": 199992, "epoch": 1652} {"train_loss": -42.43304443359375, "global_step": 199993, "epoch": 1652} {"train_loss": -41.92563247680664, "global_step": 199994, "epoch": 1652} {"train_loss": -42.0629997253418, "global_step": 199995, "epoch": 1652} {"train_loss": -42.02556228637695, "global_step": 199996, "epoch": 1652} {"train_loss": -42.04403305053711, "global_step": 199997, "epoch": 1652} {"train_loss": -42.02294921875, "global_step": 199998, "epoch": 1652} {"train_loss": -41.57441711425781, "global_step": 199999, "epoch": 1652} {"train_loss": -41.21125411987305, "global_step": 200000, "epoch": 1652} {"train_loss": -42.02598190307617, "global_step": 200001, "epoch": 1652} {"train_loss": -41.0384521484375, "global_step": 200002, "epoch": 1652} {"train_loss": -41.89133071899414, "global_step": 200003, "epoch": 1652} {"train_loss": -42.94620895385742, "global_step": 200004, "epoch": 1652} {"train_loss": -40.56919479370117, "global_step": 200005, "epoch": 1652} {"train_loss": -42.34086227416992, "global_step": 200006, "epoch": 1652} {"train_loss": -40.671913146972656, "global_step": 200007, "epoch": 1652} {"train_loss": -40.91874313354492, "global_step": 200008, "epoch": 1652} {"train_loss": -41.73537063598633, "global_step": 200009, "epoch": 1652} {"train_loss": -42.24345779418945, "global_step": 200010, "epoch": 1652} {"train_loss": -41.58980941772461, "global_step": 200011, "epoch": 1652} {"train_loss": -40.8356784473766, "global_step": 200012, "epoch": 1652, "val_loss": 2584964.0} {"train_loss": -42.124324798583984, "global_step": 200013, "epoch": 1653} {"train_loss": -41.327186584472656, "global_step": 200014, "epoch": 1653} {"train_loss": -41.00300979614258, "global_step": 200015, "epoch": 1653} {"train_loss": -40.42456817626953, "global_step": 200016, "epoch": 1653} {"train_loss": -38.79446029663086, "global_step": 200017, "epoch": 1653} {"train_loss": -38.71549606323242, "global_step": 200018, "epoch": 1653} {"train_loss": -39.47190475463867, "global_step": 200019, "epoch": 1653} {"train_loss": -38.33536911010742, "global_step": 200020, "epoch": 1653} {"train_loss": -41.002742767333984, "global_step": 200021, "epoch": 1653} {"train_loss": -40.0240364074707, "global_step": 200022, "epoch": 1653} {"train_loss": -40.33250427246094, "global_step": 200023, "epoch": 1653} {"train_loss": -38.78985595703125, "global_step": 200024, "epoch": 1653} {"train_loss": -41.34421920776367, "global_step": 200025, "epoch": 1653} {"train_loss": -36.84482955932617, "global_step": 200026, "epoch": 1653} {"train_loss": -39.483760833740234, "global_step": 200027, "epoch": 1653} {"train_loss": -41.22518539428711, "global_step": 200028, "epoch": 1653} {"train_loss": -40.866294860839844, "global_step": 200029, "epoch": 1653} {"train_loss": -39.746952056884766, "global_step": 200030, "epoch": 1653} {"train_loss": -39.4547233581543, "global_step": 200031, "epoch": 1653} {"train_loss": -41.56553268432617, "global_step": 200032, "epoch": 1653} {"train_loss": -38.82306671142578, "global_step": 200033, "epoch": 1653} {"train_loss": -39.8275032043457, "global_step": 200034, "epoch": 1653} {"train_loss": -40.35540771484375, "global_step": 200035, "epoch": 1653} {"train_loss": -39.85579299926758, "global_step": 200036, "epoch": 1653} {"train_loss": -41.497901916503906, "global_step": 200037, "epoch": 1653} {"train_loss": -39.889190673828125, "global_step": 200038, "epoch": 1653} {"train_loss": -41.177955627441406, "global_step": 200039, "epoch": 1653} {"train_loss": -41.11007308959961, "global_step": 200040, "epoch": 1653} {"train_loss": -40.443878173828125, "global_step": 200041, "epoch": 1653} {"train_loss": -40.43784713745117, "global_step": 200042, "epoch": 1653} {"train_loss": -41.97974395751953, "global_step": 200043, "epoch": 1653} {"train_loss": -40.79917526245117, "global_step": 200044, "epoch": 1653} {"train_loss": -40.876930236816406, "global_step": 200045, "epoch": 1653} {"train_loss": -41.31877517700195, "global_step": 200046, "epoch": 1653} {"train_loss": -41.380165100097656, "global_step": 200047, "epoch": 1653} {"train_loss": -41.39927291870117, "global_step": 200048, "epoch": 1653} {"train_loss": -40.39677047729492, "global_step": 200049, "epoch": 1653} {"train_loss": -41.1088752746582, "global_step": 200050, "epoch": 1653} {"train_loss": -38.17975616455078, "global_step": 200051, "epoch": 1653} {"train_loss": -41.58584213256836, "global_step": 200052, "epoch": 1653} {"train_loss": -41.409908294677734, "global_step": 200053, "epoch": 1653} {"train_loss": -39.83808135986328, "global_step": 200054, "epoch": 1653} {"train_loss": -39.17477035522461, "global_step": 200055, "epoch": 1653} {"train_loss": -40.906063079833984, "global_step": 200056, "epoch": 1653} {"train_loss": -32.484371185302734, "global_step": 200057, "epoch": 1653} {"train_loss": -40.4065055847168, "global_step": 200058, "epoch": 1653} {"train_loss": -40.323516845703125, "global_step": 200059, "epoch": 1653} {"train_loss": -38.696632385253906, "global_step": 200060, "epoch": 1653} {"train_loss": -37.324127197265625, "global_step": 200061, "epoch": 1653} {"train_loss": -37.172828674316406, "global_step": 200062, "epoch": 1653} {"train_loss": -39.787818908691406, "global_step": 200063, "epoch": 1653} {"train_loss": -40.84394073486328, "global_step": 200064, "epoch": 1653} {"train_loss": -39.96210861206055, "global_step": 200065, "epoch": 1653} {"train_loss": -40.24241256713867, "global_step": 200066, "epoch": 1653} {"train_loss": -40.08253860473633, "global_step": 200067, "epoch": 1653} {"train_loss": -40.26503372192383, "global_step": 200068, "epoch": 1653} {"train_loss": -38.73676681518555, "global_step": 200069, "epoch": 1653} {"train_loss": -40.5804443359375, "global_step": 200070, "epoch": 1653} {"train_loss": -38.83024978637695, "global_step": 200071, "epoch": 1653} {"train_loss": -38.35293197631836, "global_step": 200072, "epoch": 1653} {"train_loss": -37.649566650390625, "global_step": 200073, "epoch": 1653} {"train_loss": -40.14407730102539, "global_step": 200074, "epoch": 1653} {"train_loss": -40.6136474609375, "global_step": 200075, "epoch": 1653} {"train_loss": -39.26496887207031, "global_step": 200076, "epoch": 1653} {"train_loss": -41.17877197265625, "global_step": 200077, "epoch": 1653} {"train_loss": -39.476600646972656, "global_step": 200078, "epoch": 1653} {"train_loss": -38.80489730834961, "global_step": 200079, "epoch": 1653} {"train_loss": -40.39702606201172, "global_step": 200080, "epoch": 1653} {"train_loss": -40.919124603271484, "global_step": 200081, "epoch": 1653} {"train_loss": -40.82904815673828, "global_step": 200082, "epoch": 1653} {"train_loss": -37.888553619384766, "global_step": 200083, "epoch": 1653} {"train_loss": -38.21711349487305, "global_step": 200084, "epoch": 1653} {"train_loss": -39.72715377807617, "global_step": 200085, "epoch": 1653} {"train_loss": -40.174415588378906, "global_step": 200086, "epoch": 1653} {"train_loss": -40.50771713256836, "global_step": 200087, "epoch": 1653} {"train_loss": -39.8692741394043, "global_step": 200088, "epoch": 1653} {"train_loss": -40.965328216552734, "global_step": 200089, "epoch": 1653} {"train_loss": -40.7285041809082, "global_step": 200090, "epoch": 1653} {"train_loss": -38.45368576049805, "global_step": 200091, "epoch": 1653} {"train_loss": -37.672672271728516, "global_step": 200092, "epoch": 1653} {"train_loss": -41.167625427246094, "global_step": 200093, "epoch": 1653} {"train_loss": -39.71625900268555, "global_step": 200094, "epoch": 1653} {"train_loss": -38.91660690307617, "global_step": 200095, "epoch": 1653} {"train_loss": -39.629947662353516, "global_step": 200096, "epoch": 1653} {"train_loss": -39.7635612487793, "global_step": 200097, "epoch": 1653} {"train_loss": -40.050113677978516, "global_step": 200098, "epoch": 1653} {"train_loss": -39.794158935546875, "global_step": 200099, "epoch": 1653} {"train_loss": -37.87666702270508, "global_step": 200100, "epoch": 1653} {"train_loss": -39.70636749267578, "global_step": 200101, "epoch": 1653} {"train_loss": -37.77375411987305, "global_step": 200102, "epoch": 1653} {"train_loss": -40.8618278503418, "global_step": 200103, "epoch": 1653} {"train_loss": -40.29621505737305, "global_step": 200104, "epoch": 1653} {"train_loss": -40.6143798828125, "global_step": 200105, "epoch": 1653} {"train_loss": -41.19790267944336, "global_step": 200106, "epoch": 1653} {"train_loss": -40.90119171142578, "global_step": 200107, "epoch": 1653} {"train_loss": -40.6195182800293, "global_step": 200108, "epoch": 1653} {"train_loss": -41.272071838378906, "global_step": 200109, "epoch": 1653} {"train_loss": -41.15264892578125, "global_step": 200110, "epoch": 1653} {"train_loss": -41.30643844604492, "global_step": 200111, "epoch": 1653} {"train_loss": -40.31452560424805, "global_step": 200112, "epoch": 1653} {"train_loss": -41.3474006652832, "global_step": 200113, "epoch": 1653} {"train_loss": -40.48189926147461, "global_step": 200114, "epoch": 1653} {"train_loss": -40.66215896606445, "global_step": 200115, "epoch": 1653} {"train_loss": -41.03339767456055, "global_step": 200116, "epoch": 1653} {"train_loss": -41.421241760253906, "global_step": 200117, "epoch": 1653} {"train_loss": -40.31803512573242, "global_step": 200118, "epoch": 1653} {"train_loss": -41.04975509643555, "global_step": 200119, "epoch": 1653} {"train_loss": -41.533931732177734, "global_step": 200120, "epoch": 1653} {"train_loss": -40.32659912109375, "global_step": 200121, "epoch": 1653} {"train_loss": -40.5464973449707, "global_step": 200122, "epoch": 1653} {"train_loss": -41.60087966918945, "global_step": 200123, "epoch": 1653} {"train_loss": -41.06633377075195, "global_step": 200124, "epoch": 1653} {"train_loss": -41.542236328125, "global_step": 200125, "epoch": 1653} {"train_loss": -41.32633590698242, "global_step": 200126, "epoch": 1653} {"train_loss": -39.88562774658203, "global_step": 200127, "epoch": 1653} {"train_loss": -40.136756896972656, "global_step": 200128, "epoch": 1653} {"train_loss": -40.849395751953125, "global_step": 200129, "epoch": 1653} {"train_loss": -40.61022186279297, "global_step": 200130, "epoch": 1653} {"train_loss": -41.43767547607422, "global_step": 200131, "epoch": 1653} {"train_loss": -40.700618743896484, "global_step": 200132, "epoch": 1653} {"train_loss": -40.11389768616227, "global_step": 200133, "epoch": 1653, "val_loss": 2642521.75} {"train_loss": -40.924407958984375, "global_step": 200134, "epoch": 1654} {"train_loss": -40.51283645629883, "global_step": 200135, "epoch": 1654} {"train_loss": -40.561336517333984, "global_step": 200136, "epoch": 1654} {"train_loss": -41.44710922241211, "global_step": 200137, "epoch": 1654} {"train_loss": -41.04561233520508, "global_step": 200138, "epoch": 1654} {"train_loss": -41.628517150878906, "global_step": 200139, "epoch": 1654} {"train_loss": -40.49244689941406, "global_step": 200140, "epoch": 1654} {"train_loss": -41.608882904052734, "global_step": 200141, "epoch": 1654} {"train_loss": -41.67822265625, "global_step": 200142, "epoch": 1654} {"train_loss": -41.66206359863281, "global_step": 200143, "epoch": 1654} {"train_loss": -41.17585372924805, "global_step": 200144, "epoch": 1654} {"train_loss": -41.25086212158203, "global_step": 200145, "epoch": 1654} {"train_loss": -41.583560943603516, "global_step": 200146, "epoch": 1654} {"train_loss": -41.67344284057617, "global_step": 200147, "epoch": 1654} {"train_loss": -40.837886810302734, "global_step": 200148, "epoch": 1654} {"train_loss": -40.665771484375, "global_step": 200149, "epoch": 1654} {"train_loss": -40.31841278076172, "global_step": 200150, "epoch": 1654} {"train_loss": -40.832759857177734, "global_step": 200151, "epoch": 1654} {"train_loss": -39.85254669189453, "global_step": 200152, "epoch": 1654} {"train_loss": -41.18061447143555, "global_step": 200153, "epoch": 1654} {"train_loss": -39.81330108642578, "global_step": 200154, "epoch": 1654} {"train_loss": -37.73967742919922, "global_step": 200155, "epoch": 1654} {"train_loss": -38.58417892456055, "global_step": 200156, "epoch": 1654} {"train_loss": -37.94758224487305, "global_step": 200157, "epoch": 1654} {"train_loss": -39.74224853515625, "global_step": 200158, "epoch": 1654} {"train_loss": -37.57426834106445, "global_step": 200159, "epoch": 1654} {"train_loss": -41.6290283203125, "global_step": 200160, "epoch": 1654} {"train_loss": -37.823787689208984, "global_step": 200161, "epoch": 1654} {"train_loss": -40.63384246826172, "global_step": 200162, "epoch": 1654} {"train_loss": -36.84815216064453, "global_step": 200163, "epoch": 1654} {"train_loss": -40.22710037231445, "global_step": 200164, "epoch": 1654} {"train_loss": -39.9736328125, "global_step": 200165, "epoch": 1654} {"train_loss": -41.03144454956055, "global_step": 200166, "epoch": 1654} {"train_loss": -40.9228401184082, "global_step": 200167, "epoch": 1654} {"train_loss": -41.41649627685547, "global_step": 200168, "epoch": 1654} {"train_loss": -40.64359664916992, "global_step": 200169, "epoch": 1654} {"train_loss": -40.03120803833008, "global_step": 200170, "epoch": 1654} {"train_loss": -40.32865905761719, "global_step": 200171, "epoch": 1654} {"train_loss": -41.01124954223633, "global_step": 200172, "epoch": 1654} {"train_loss": -40.9460563659668, "global_step": 200173, "epoch": 1654} {"train_loss": -40.95075607299805, "global_step": 200174, "epoch": 1654} {"train_loss": -41.00968551635742, "global_step": 200175, "epoch": 1654} {"train_loss": -40.5672607421875, "global_step": 200176, "epoch": 1654} {"train_loss": -40.880531311035156, "global_step": 200177, "epoch": 1654} {"train_loss": -41.151763916015625, "global_step": 200178, "epoch": 1654} {"train_loss": -40.77116012573242, "global_step": 200179, "epoch": 1654} {"train_loss": -40.50457763671875, "global_step": 200180, "epoch": 1654} {"train_loss": -40.84540557861328, "global_step": 200181, "epoch": 1654} {"train_loss": -39.09989929199219, "global_step": 200182, "epoch": 1654} {"train_loss": -40.6151237487793, "global_step": 200183, "epoch": 1654} {"train_loss": -39.98283386230469, "global_step": 200184, "epoch": 1654} {"train_loss": -41.43931579589844, "global_step": 200185, "epoch": 1654} {"train_loss": -39.440185546875, "global_step": 200186, "epoch": 1654} {"train_loss": -38.99823760986328, "global_step": 200187, "epoch": 1654} {"train_loss": -41.489864349365234, "global_step": 200188, "epoch": 1654} {"train_loss": -41.00844192504883, "global_step": 200189, "epoch": 1654} {"train_loss": -40.36853790283203, "global_step": 200190, "epoch": 1654} {"train_loss": -40.6063117980957, "global_step": 200191, "epoch": 1654} {"train_loss": -41.70356369018555, "global_step": 200192, "epoch": 1654} {"train_loss": -40.08721160888672, "global_step": 200193, "epoch": 1654} {"train_loss": -39.81940841674805, "global_step": 200194, "epoch": 1654} {"train_loss": -41.68319320678711, "global_step": 200195, "epoch": 1654} {"train_loss": -41.57125473022461, "global_step": 200196, "epoch": 1654} {"train_loss": -41.08723068237305, "global_step": 200197, "epoch": 1654} {"train_loss": -40.87876510620117, "global_step": 200198, "epoch": 1654} {"train_loss": -40.8798713684082, "global_step": 200199, "epoch": 1654} {"train_loss": -41.43803024291992, "global_step": 200200, "epoch": 1654} {"train_loss": -41.12571716308594, "global_step": 200201, "epoch": 1654} {"train_loss": -41.32638168334961, "global_step": 200202, "epoch": 1654} {"train_loss": -40.93811798095703, "global_step": 200203, "epoch": 1654} {"train_loss": -39.766578674316406, "global_step": 200204, "epoch": 1654} {"train_loss": -41.06441879272461, "global_step": 200205, "epoch": 1654} {"train_loss": -40.56496047973633, "global_step": 200206, "epoch": 1654} {"train_loss": -40.04789352416992, "global_step": 200207, "epoch": 1654} {"train_loss": -40.22148132324219, "global_step": 200208, "epoch": 1654} {"train_loss": -41.91167068481445, "global_step": 200209, "epoch": 1654} {"train_loss": -40.00184631347656, "global_step": 200210, "epoch": 1654} {"train_loss": -40.591064453125, "global_step": 200211, "epoch": 1654} {"train_loss": -40.67927169799805, "global_step": 200212, "epoch": 1654} {"train_loss": -41.24005126953125, "global_step": 200213, "epoch": 1654} {"train_loss": -39.538875579833984, "global_step": 200214, "epoch": 1654} {"train_loss": -40.473480224609375, "global_step": 200215, "epoch": 1654} {"train_loss": -40.76197052001953, "global_step": 200216, "epoch": 1654} {"train_loss": -41.321319580078125, "global_step": 200217, "epoch": 1654} {"train_loss": -40.194820404052734, "global_step": 200218, "epoch": 1654} {"train_loss": -41.12323760986328, "global_step": 200219, "epoch": 1654} {"train_loss": -40.60870361328125, "global_step": 200220, "epoch": 1654} {"train_loss": -40.9061393737793, "global_step": 200221, "epoch": 1654} {"train_loss": -41.4530029296875, "global_step": 200222, "epoch": 1654} {"train_loss": -40.0467643737793, "global_step": 200223, "epoch": 1654} {"train_loss": -41.7588996887207, "global_step": 200224, "epoch": 1654} {"train_loss": -41.185184478759766, "global_step": 200225, "epoch": 1654} {"train_loss": -41.05049514770508, "global_step": 200226, "epoch": 1654} {"train_loss": -41.011104583740234, "global_step": 200227, "epoch": 1654} {"train_loss": -41.404815673828125, "global_step": 200228, "epoch": 1654} {"train_loss": -39.987911224365234, "global_step": 200229, "epoch": 1654} {"train_loss": -39.87488555908203, "global_step": 200230, "epoch": 1654} {"train_loss": -39.82471466064453, "global_step": 200231, "epoch": 1654} {"train_loss": -40.58763122558594, "global_step": 200232, "epoch": 1654} {"train_loss": -41.77456283569336, "global_step": 200233, "epoch": 1654} {"train_loss": -41.62042236328125, "global_step": 200234, "epoch": 1654} {"train_loss": -41.7497673034668, "global_step": 200235, "epoch": 1654} {"train_loss": -41.43441390991211, "global_step": 200236, "epoch": 1654} {"train_loss": -40.89552688598633, "global_step": 200237, "epoch": 1654} {"train_loss": -41.270050048828125, "global_step": 200238, "epoch": 1654} {"train_loss": -41.71791076660156, "global_step": 200239, "epoch": 1654} {"train_loss": -41.2274284362793, "global_step": 200240, "epoch": 1654} {"train_loss": -41.586761474609375, "global_step": 200241, "epoch": 1654} {"train_loss": -42.18637466430664, "global_step": 200242, "epoch": 1654} {"train_loss": -41.589107513427734, "global_step": 200243, "epoch": 1654} {"train_loss": -40.3942756652832, "global_step": 200244, "epoch": 1654} {"train_loss": -41.03293991088867, "global_step": 200245, "epoch": 1654} {"train_loss": -41.22108840942383, "global_step": 200246, "epoch": 1654} {"train_loss": -40.83269119262695, "global_step": 200247, "epoch": 1654} {"train_loss": -42.35197067260742, "global_step": 200248, "epoch": 1654} {"train_loss": -41.753414154052734, "global_step": 200249, "epoch": 1654} {"train_loss": -40.141845703125, "global_step": 200250, "epoch": 1654} {"train_loss": -40.64448928833008, "global_step": 200251, "epoch": 1654} {"train_loss": -40.46538162231445, "global_step": 200252, "epoch": 1654} {"train_loss": -39.66884994506836, "global_step": 200253, "epoch": 1654} {"train_loss": -40.69213498328343, "global_step": 200254, "epoch": 1654, "val_loss": 2674294.0} {"train_loss": -41.40460205078125, "global_step": 200255, "epoch": 1655} {"train_loss": -41.61507797241211, "global_step": 200256, "epoch": 1655} {"train_loss": -41.150726318359375, "global_step": 200257, "epoch": 1655} {"train_loss": -37.7013053894043, "global_step": 200258, "epoch": 1655} {"train_loss": -40.938045501708984, "global_step": 200259, "epoch": 1655} {"train_loss": -40.22096252441406, "global_step": 200260, "epoch": 1655} {"train_loss": -38.27607345581055, "global_step": 200261, "epoch": 1655} {"train_loss": -39.38056564331055, "global_step": 200262, "epoch": 1655} {"train_loss": -37.98948287963867, "global_step": 200263, "epoch": 1655} {"train_loss": -37.59028244018555, "global_step": 200264, "epoch": 1655} {"train_loss": -38.931819915771484, "global_step": 200265, "epoch": 1655} {"train_loss": -40.52401351928711, "global_step": 200266, "epoch": 1655} {"train_loss": -38.760982513427734, "global_step": 200267, "epoch": 1655} {"train_loss": -40.50872802734375, "global_step": 200268, "epoch": 1655} {"train_loss": -35.14977264404297, "global_step": 200269, "epoch": 1655} {"train_loss": -40.58163070678711, "global_step": 200270, "epoch": 1655} {"train_loss": -40.591285705566406, "global_step": 200271, "epoch": 1655} {"train_loss": -38.40388107299805, "global_step": 200272, "epoch": 1655} {"train_loss": -39.3416862487793, "global_step": 200273, "epoch": 1655} {"train_loss": -39.60741424560547, "global_step": 200274, "epoch": 1655} {"train_loss": -39.66641616821289, "global_step": 200275, "epoch": 1655} {"train_loss": -34.50971603393555, "global_step": 200276, "epoch": 1655} {"train_loss": -36.42647933959961, "global_step": 200277, "epoch": 1655} {"train_loss": -38.94865036010742, "global_step": 200278, "epoch": 1655} {"train_loss": -35.67048263549805, "global_step": 200279, "epoch": 1655} {"train_loss": -37.41324996948242, "global_step": 200280, "epoch": 1655} {"train_loss": -33.575801849365234, "global_step": 200281, "epoch": 1655} {"train_loss": -33.67307662963867, "global_step": 200282, "epoch": 1655} {"train_loss": -34.1043701171875, "global_step": 200283, "epoch": 1655} {"train_loss": -36.84697723388672, "global_step": 200284, "epoch": 1655} {"train_loss": -36.18650817871094, "global_step": 200285, "epoch": 1655} {"train_loss": -37.4194221496582, "global_step": 200286, "epoch": 1655} {"train_loss": -36.983489990234375, "global_step": 200287, "epoch": 1655} {"train_loss": -35.81681442260742, "global_step": 200288, "epoch": 1655} {"train_loss": -34.154052734375, "global_step": 200289, "epoch": 1655} {"train_loss": -35.73632049560547, "global_step": 200290, "epoch": 1655} {"train_loss": -39.00810623168945, "global_step": 200291, "epoch": 1655} {"train_loss": -34.743255615234375, "global_step": 200292, "epoch": 1655} {"train_loss": -38.182682037353516, "global_step": 200293, "epoch": 1655} {"train_loss": -36.370540618896484, "global_step": 200294, "epoch": 1655} {"train_loss": -35.81716537475586, "global_step": 200295, "epoch": 1655} {"train_loss": -34.57076644897461, "global_step": 200296, "epoch": 1655} {"train_loss": -36.139808654785156, "global_step": 200297, "epoch": 1655} {"train_loss": -36.464168548583984, "global_step": 200298, "epoch": 1655} {"train_loss": -38.587154388427734, "global_step": 200299, "epoch": 1655} {"train_loss": -37.37076950073242, "global_step": 200300, "epoch": 1655} {"train_loss": -39.10847091674805, "global_step": 200301, "epoch": 1655} {"train_loss": -38.61758041381836, "global_step": 200302, "epoch": 1655} {"train_loss": -35.91976547241211, "global_step": 200303, "epoch": 1655} {"train_loss": -36.948055267333984, "global_step": 200304, "epoch": 1655} {"train_loss": -38.95125961303711, "global_step": 200305, "epoch": 1655} {"train_loss": -38.99451446533203, "global_step": 200306, "epoch": 1655} {"train_loss": -38.399009704589844, "global_step": 200307, "epoch": 1655} {"train_loss": -38.40171432495117, "global_step": 200308, "epoch": 1655} {"train_loss": -39.40693283081055, "global_step": 200309, "epoch": 1655} {"train_loss": -39.188392639160156, "global_step": 200310, "epoch": 1655} {"train_loss": -39.58930206298828, "global_step": 200311, "epoch": 1655} {"train_loss": -38.800865173339844, "global_step": 200312, "epoch": 1655} {"train_loss": -38.64251708984375, "global_step": 200313, "epoch": 1655} {"train_loss": -39.85137939453125, "global_step": 200314, "epoch": 1655} {"train_loss": -39.10121154785156, "global_step": 200315, "epoch": 1655} {"train_loss": -39.45104217529297, "global_step": 200316, "epoch": 1655} {"train_loss": -39.448646545410156, "global_step": 200317, "epoch": 1655} {"train_loss": -39.20252227783203, "global_step": 200318, "epoch": 1655} {"train_loss": -39.3662223815918, "global_step": 200319, "epoch": 1655} {"train_loss": -39.83120346069336, "global_step": 200320, "epoch": 1655} {"train_loss": -39.45981979370117, "global_step": 200321, "epoch": 1655} {"train_loss": -38.783111572265625, "global_step": 200322, "epoch": 1655} {"train_loss": -40.0092887878418, "global_step": 200323, "epoch": 1655} {"train_loss": -39.94470977783203, "global_step": 200324, "epoch": 1655} {"train_loss": -39.892887115478516, "global_step": 200325, "epoch": 1655} {"train_loss": -40.222389221191406, "global_step": 200326, "epoch": 1655} {"train_loss": -39.30562973022461, "global_step": 200327, "epoch": 1655} {"train_loss": -39.53700637817383, "global_step": 200328, "epoch": 1655} {"train_loss": -40.27531051635742, "global_step": 200329, "epoch": 1655} {"train_loss": -40.62046432495117, "global_step": 200330, "epoch": 1655} {"train_loss": -40.05588912963867, "global_step": 200331, "epoch": 1655} {"train_loss": -40.7173957824707, "global_step": 200332, "epoch": 1655} {"train_loss": -41.04562759399414, "global_step": 200333, "epoch": 1655} {"train_loss": -40.56999588012695, "global_step": 200334, "epoch": 1655} {"train_loss": -40.309600830078125, "global_step": 200335, "epoch": 1655} {"train_loss": -40.25676345825195, "global_step": 200336, "epoch": 1655} {"train_loss": -39.8873405456543, "global_step": 200337, "epoch": 1655} {"train_loss": -39.1420783996582, "global_step": 200338, "epoch": 1655} {"train_loss": -41.10655212402344, "global_step": 200339, "epoch": 1655} {"train_loss": -40.15447998046875, "global_step": 200340, "epoch": 1655} {"train_loss": -39.89925003051758, "global_step": 200341, "epoch": 1655} {"train_loss": -40.941741943359375, "global_step": 200342, "epoch": 1655} {"train_loss": -40.36142349243164, "global_step": 200343, "epoch": 1655} {"train_loss": -40.560855865478516, "global_step": 200344, "epoch": 1655} {"train_loss": -40.751522064208984, "global_step": 200345, "epoch": 1655} {"train_loss": -39.842308044433594, "global_step": 200346, "epoch": 1655} {"train_loss": -41.0350227355957, "global_step": 200347, "epoch": 1655} {"train_loss": -40.92538833618164, "global_step": 200348, "epoch": 1655} {"train_loss": -41.02668380737305, "global_step": 200349, "epoch": 1655} {"train_loss": -40.9307746887207, "global_step": 200350, "epoch": 1655} {"train_loss": -40.927120208740234, "global_step": 200351, "epoch": 1655} {"train_loss": -40.33274459838867, "global_step": 200352, "epoch": 1655} {"train_loss": -40.94727325439453, "global_step": 200353, "epoch": 1655} {"train_loss": -40.614498138427734, "global_step": 200354, "epoch": 1655} {"train_loss": -41.28998565673828, "global_step": 200355, "epoch": 1655} {"train_loss": -40.474430084228516, "global_step": 200356, "epoch": 1655} {"train_loss": -40.075050354003906, "global_step": 200357, "epoch": 1655} {"train_loss": -40.43488693237305, "global_step": 200358, "epoch": 1655} {"train_loss": -40.496856689453125, "global_step": 200359, "epoch": 1655} {"train_loss": -40.7232780456543, "global_step": 200360, "epoch": 1655} {"train_loss": -41.520259857177734, "global_step": 200361, "epoch": 1655} {"train_loss": -40.77748107910156, "global_step": 200362, "epoch": 1655} {"train_loss": -40.62461853027344, "global_step": 200363, "epoch": 1655} {"train_loss": -40.76074981689453, "global_step": 200364, "epoch": 1655} {"train_loss": -41.321956634521484, "global_step": 200365, "epoch": 1655} {"train_loss": -40.906673431396484, "global_step": 200366, "epoch": 1655} {"train_loss": -41.04781723022461, "global_step": 200367, "epoch": 1655} {"train_loss": -41.56214141845703, "global_step": 200368, "epoch": 1655} {"train_loss": -40.95842361450195, "global_step": 200369, "epoch": 1655} {"train_loss": -41.62131881713867, "global_step": 200370, "epoch": 1655} {"train_loss": -41.15081787109375, "global_step": 200371, "epoch": 1655} {"train_loss": -41.689151763916016, "global_step": 200372, "epoch": 1655} {"train_loss": -41.0760612487793, "global_step": 200373, "epoch": 1655} {"train_loss": -41.69048309326172, "global_step": 200374, "epoch": 1655} {"train_loss": -39.192946284270484, "global_step": 200375, "epoch": 1655, "val_loss": 2608960.0} {"train_loss": -41.481143951416016, "global_step": 200376, "epoch": 1656} {"train_loss": -41.64655303955078, "global_step": 200377, "epoch": 1656} {"train_loss": -41.67687225341797, "global_step": 200378, "epoch": 1656} {"train_loss": -41.80031204223633, "global_step": 200379, "epoch": 1656} {"train_loss": -41.31638717651367, "global_step": 200380, "epoch": 1656} {"train_loss": -41.325191497802734, "global_step": 200381, "epoch": 1656} {"train_loss": -41.98462677001953, "global_step": 200382, "epoch": 1656} {"train_loss": -42.06190490722656, "global_step": 200383, "epoch": 1656} {"train_loss": -40.765132904052734, "global_step": 200384, "epoch": 1656} {"train_loss": -41.7564811706543, "global_step": 200385, "epoch": 1656} {"train_loss": -42.24420166015625, "global_step": 200386, "epoch": 1656} {"train_loss": -41.60868453979492, "global_step": 200387, "epoch": 1656} {"train_loss": -41.35422897338867, "global_step": 200388, "epoch": 1656} {"train_loss": -42.17232894897461, "global_step": 200389, "epoch": 1656} {"train_loss": -41.739479064941406, "global_step": 200390, "epoch": 1656} {"train_loss": -40.934505462646484, "global_step": 200391, "epoch": 1656} {"train_loss": -40.728248596191406, "global_step": 200392, "epoch": 1656} {"train_loss": -42.316497802734375, "global_step": 200393, "epoch": 1656} {"train_loss": -40.73853302001953, "global_step": 200394, "epoch": 1656} {"train_loss": -40.8273811340332, "global_step": 200395, "epoch": 1656} {"train_loss": -41.98915100097656, "global_step": 200396, "epoch": 1656} {"train_loss": -41.920860290527344, "global_step": 200397, "epoch": 1656} {"train_loss": -41.78047561645508, "global_step": 200398, "epoch": 1656} {"train_loss": -41.68952941894531, "global_step": 200399, "epoch": 1656} {"train_loss": -40.97309112548828, "global_step": 200400, "epoch": 1656} {"train_loss": -42.081512451171875, "global_step": 200401, "epoch": 1656} {"train_loss": -40.90385055541992, "global_step": 200402, "epoch": 1656} {"train_loss": -37.95579528808594, "global_step": 200403, "epoch": 1656} {"train_loss": -38.87577438354492, "global_step": 200404, "epoch": 1656} {"train_loss": -41.42181396484375, "global_step": 200405, "epoch": 1656} {"train_loss": -41.074378967285156, "global_step": 200406, "epoch": 1656} {"train_loss": -38.97240447998047, "global_step": 200407, "epoch": 1656} {"train_loss": -37.4456901550293, "global_step": 200408, "epoch": 1656} {"train_loss": -35.90764236450195, "global_step": 200409, "epoch": 1656} {"train_loss": -38.18061828613281, "global_step": 200410, "epoch": 1656} {"train_loss": -40.858154296875, "global_step": 200411, "epoch": 1656} {"train_loss": -41.523963928222656, "global_step": 200412, "epoch": 1656} {"train_loss": -39.76218795776367, "global_step": 200413, "epoch": 1656} {"train_loss": -40.29901885986328, "global_step": 200414, "epoch": 1656} {"train_loss": -41.6696891784668, "global_step": 200415, "epoch": 1656} {"train_loss": -41.33818817138672, "global_step": 200416, "epoch": 1656} {"train_loss": -41.03103256225586, "global_step": 200417, "epoch": 1656} {"train_loss": -41.29566955566406, "global_step": 200418, "epoch": 1656} {"train_loss": -41.709537506103516, "global_step": 200419, "epoch": 1656} {"train_loss": -41.55637741088867, "global_step": 200420, "epoch": 1656} {"train_loss": -41.81110763549805, "global_step": 200421, "epoch": 1656} {"train_loss": -41.08462142944336, "global_step": 200422, "epoch": 1656} {"train_loss": -41.35676193237305, "global_step": 200423, "epoch": 1656} {"train_loss": -41.410457611083984, "global_step": 200424, "epoch": 1656} {"train_loss": -42.034847259521484, "global_step": 200425, "epoch": 1656} {"train_loss": -40.90133285522461, "global_step": 200426, "epoch": 1656} {"train_loss": -40.985652923583984, "global_step": 200427, "epoch": 1656} {"train_loss": -41.76162338256836, "global_step": 200428, "epoch": 1656} {"train_loss": -42.14433670043945, "global_step": 200429, "epoch": 1656} {"train_loss": -41.653926849365234, "global_step": 200430, "epoch": 1656} {"train_loss": -41.7232666015625, "global_step": 200431, "epoch": 1656} {"train_loss": -40.816829681396484, "global_step": 200432, "epoch": 1656} {"train_loss": -42.16626739501953, "global_step": 200433, "epoch": 1656} {"train_loss": -41.858211517333984, "global_step": 200434, "epoch": 1656} {"train_loss": -41.350582122802734, "global_step": 200435, "epoch": 1656} {"train_loss": -41.413455963134766, "global_step": 200436, "epoch": 1656} {"train_loss": -42.394775390625, "global_step": 200437, "epoch": 1656} {"train_loss": -41.93114471435547, "global_step": 200438, "epoch": 1656} {"train_loss": -41.17401885986328, "global_step": 200439, "epoch": 1656} {"train_loss": -41.6559944152832, "global_step": 200440, "epoch": 1656} {"train_loss": -40.82883834838867, "global_step": 200441, "epoch": 1656} {"train_loss": -41.114288330078125, "global_step": 200442, "epoch": 1656} {"train_loss": -41.673336029052734, "global_step": 200443, "epoch": 1656} {"train_loss": -41.7205696105957, "global_step": 200444, "epoch": 1656} {"train_loss": -40.96128463745117, "global_step": 200445, "epoch": 1656} {"train_loss": -41.216148376464844, "global_step": 200446, "epoch": 1656} {"train_loss": -41.66162109375, "global_step": 200447, "epoch": 1656} {"train_loss": -41.63137435913086, "global_step": 200448, "epoch": 1656} {"train_loss": -41.2256965637207, "global_step": 200449, "epoch": 1656} {"train_loss": -41.28201675415039, "global_step": 200450, "epoch": 1656} {"train_loss": -41.40155029296875, "global_step": 200451, "epoch": 1656} {"train_loss": -41.71426010131836, "global_step": 200452, "epoch": 1656} {"train_loss": -41.94598388671875, "global_step": 200453, "epoch": 1656} {"train_loss": -42.012237548828125, "global_step": 200454, "epoch": 1656} {"train_loss": -41.14402770996094, "global_step": 200455, "epoch": 1656} {"train_loss": -39.2244758605957, "global_step": 200456, "epoch": 1656} {"train_loss": -40.56013870239258, "global_step": 200457, "epoch": 1656} {"train_loss": -41.05036163330078, "global_step": 200458, "epoch": 1656} {"train_loss": -41.62696075439453, "global_step": 200459, "epoch": 1656} {"train_loss": -41.19077682495117, "global_step": 200460, "epoch": 1656} {"train_loss": -42.190914154052734, "global_step": 200461, "epoch": 1656} {"train_loss": -41.05326461791992, "global_step": 200462, "epoch": 1656} {"train_loss": -40.81856918334961, "global_step": 200463, "epoch": 1656} {"train_loss": -41.8763427734375, "global_step": 200464, "epoch": 1656} {"train_loss": -42.07951736450195, "global_step": 200465, "epoch": 1656} {"train_loss": -41.795265197753906, "global_step": 200466, "epoch": 1656} {"train_loss": -41.590003967285156, "global_step": 200467, "epoch": 1656} {"train_loss": -42.064815521240234, "global_step": 200468, "epoch": 1656} {"train_loss": -40.90042495727539, "global_step": 200469, "epoch": 1656} {"train_loss": -40.53567123413086, "global_step": 200470, "epoch": 1656} {"train_loss": -41.73566818237305, "global_step": 200471, "epoch": 1656} {"train_loss": -40.90201950073242, "global_step": 200472, "epoch": 1656} {"train_loss": -39.76054763793945, "global_step": 200473, "epoch": 1656} {"train_loss": -40.667518615722656, "global_step": 200474, "epoch": 1656} {"train_loss": -41.33028793334961, "global_step": 200475, "epoch": 1656} {"train_loss": -41.17084503173828, "global_step": 200476, "epoch": 1656} {"train_loss": -41.43302536010742, "global_step": 200477, "epoch": 1656} {"train_loss": -40.7565803527832, "global_step": 200478, "epoch": 1656} {"train_loss": -41.68659591674805, "global_step": 200479, "epoch": 1656} {"train_loss": -41.69110870361328, "global_step": 200480, "epoch": 1656} {"train_loss": -40.4665641784668, "global_step": 200481, "epoch": 1656} {"train_loss": -39.637081146240234, "global_step": 200482, "epoch": 1656} {"train_loss": -41.338623046875, "global_step": 200483, "epoch": 1656} {"train_loss": -40.26472854614258, "global_step": 200484, "epoch": 1656} {"train_loss": -38.883209228515625, "global_step": 200485, "epoch": 1656} {"train_loss": -40.799102783203125, "global_step": 200486, "epoch": 1656} {"train_loss": -40.35302734375, "global_step": 200487, "epoch": 1656} {"train_loss": -37.23128128051758, "global_step": 200488, "epoch": 1656} {"train_loss": -38.59220504760742, "global_step": 200489, "epoch": 1656} {"train_loss": -39.9521369934082, "global_step": 200490, "epoch": 1656} {"train_loss": -40.22359848022461, "global_step": 200491, "epoch": 1656} {"train_loss": -39.772560119628906, "global_step": 200492, "epoch": 1656} {"train_loss": -38.77334213256836, "global_step": 200493, "epoch": 1656} {"train_loss": -41.2230339050293, "global_step": 200494, "epoch": 1656} {"train_loss": -39.690399169921875, "global_step": 200495, "epoch": 1656} {"train_loss": -41.01188498883208, "global_step": 200496, "epoch": 1656, "val_loss": 2598350.0} {"train_loss": -40.546993255615234, "global_step": 200497, "epoch": 1657} {"train_loss": -40.597713470458984, "global_step": 200498, "epoch": 1657} {"train_loss": -39.64469528198242, "global_step": 200499, "epoch": 1657} {"train_loss": -41.00110626220703, "global_step": 200500, "epoch": 1657} {"train_loss": -40.044734954833984, "global_step": 200501, "epoch": 1657} {"train_loss": -40.61924743652344, "global_step": 200502, "epoch": 1657} {"train_loss": -41.325347900390625, "global_step": 200503, "epoch": 1657} {"train_loss": -41.11371994018555, "global_step": 200504, "epoch": 1657} {"train_loss": -40.84623336791992, "global_step": 200505, "epoch": 1657} {"train_loss": -41.384822845458984, "global_step": 200506, "epoch": 1657} {"train_loss": -41.155128479003906, "global_step": 200507, "epoch": 1657} {"train_loss": -41.35869598388672, "global_step": 200508, "epoch": 1657} {"train_loss": -40.3109016418457, "global_step": 200509, "epoch": 1657} {"train_loss": -41.074615478515625, "global_step": 200510, "epoch": 1657} {"train_loss": -40.402191162109375, "global_step": 200511, "epoch": 1657} {"train_loss": -40.41456985473633, "global_step": 200512, "epoch": 1657} {"train_loss": -40.52326202392578, "global_step": 200513, "epoch": 1657} {"train_loss": -40.806880950927734, "global_step": 200514, "epoch": 1657} {"train_loss": -42.062644958496094, "global_step": 200515, "epoch": 1657} {"train_loss": -40.43351364135742, "global_step": 200516, "epoch": 1657} {"train_loss": -40.462066650390625, "global_step": 200517, "epoch": 1657} {"train_loss": -40.412837982177734, "global_step": 200518, "epoch": 1657} {"train_loss": -40.443538665771484, "global_step": 200519, "epoch": 1657} {"train_loss": -41.14937973022461, "global_step": 200520, "epoch": 1657} {"train_loss": -40.086727142333984, "global_step": 200521, "epoch": 1657} {"train_loss": -41.40298843383789, "global_step": 200522, "epoch": 1657} {"train_loss": -39.80729293823242, "global_step": 200523, "epoch": 1657} {"train_loss": -41.29180908203125, "global_step": 200524, "epoch": 1657} {"train_loss": -41.65614700317383, "global_step": 200525, "epoch": 1657} {"train_loss": -40.20084762573242, "global_step": 200526, "epoch": 1657} {"train_loss": -41.41900634765625, "global_step": 200527, "epoch": 1657} {"train_loss": -40.88313674926758, "global_step": 200528, "epoch": 1657} {"train_loss": -40.553466796875, "global_step": 200529, "epoch": 1657} {"train_loss": -40.812679290771484, "global_step": 200530, "epoch": 1657} {"train_loss": -41.259090423583984, "global_step": 200531, "epoch": 1657} {"train_loss": -40.67525863647461, "global_step": 200532, "epoch": 1657} {"train_loss": -41.203731536865234, "global_step": 200533, "epoch": 1657} {"train_loss": -40.75577926635742, "global_step": 200534, "epoch": 1657} {"train_loss": -40.26715850830078, "global_step": 200535, "epoch": 1657} {"train_loss": -40.23065948486328, "global_step": 200536, "epoch": 1657} {"train_loss": -41.12350845336914, "global_step": 200537, "epoch": 1657} {"train_loss": -41.636260986328125, "global_step": 200538, "epoch": 1657} {"train_loss": -41.52958679199219, "global_step": 200539, "epoch": 1657} {"train_loss": -40.052947998046875, "global_step": 200540, "epoch": 1657} {"train_loss": -40.507354736328125, "global_step": 200541, "epoch": 1657} {"train_loss": -40.15865707397461, "global_step": 200542, "epoch": 1657} {"train_loss": -40.72417449951172, "global_step": 200543, "epoch": 1657} {"train_loss": -39.82544708251953, "global_step": 200544, "epoch": 1657} {"train_loss": -40.58272171020508, "global_step": 200545, "epoch": 1657} {"train_loss": -41.37205505371094, "global_step": 200546, "epoch": 1657} {"train_loss": -41.269020080566406, "global_step": 200547, "epoch": 1657} {"train_loss": -40.664459228515625, "global_step": 200548, "epoch": 1657} {"train_loss": -40.91701889038086, "global_step": 200549, "epoch": 1657} {"train_loss": -40.67147445678711, "global_step": 200550, "epoch": 1657} {"train_loss": -39.60768508911133, "global_step": 200551, "epoch": 1657} {"train_loss": -41.739070892333984, "global_step": 200552, "epoch": 1657} {"train_loss": -40.999813079833984, "global_step": 200553, "epoch": 1657} {"train_loss": -41.32237243652344, "global_step": 200554, "epoch": 1657} {"train_loss": -41.57079315185547, "global_step": 200555, "epoch": 1657} {"train_loss": -41.558712005615234, "global_step": 200556, "epoch": 1657} {"train_loss": -41.363338470458984, "global_step": 200557, "epoch": 1657} {"train_loss": -41.70452880859375, "global_step": 200558, "epoch": 1657} {"train_loss": -41.866310119628906, "global_step": 200559, "epoch": 1657} {"train_loss": -41.10264587402344, "global_step": 200560, "epoch": 1657} {"train_loss": -40.9980583190918, "global_step": 200561, "epoch": 1657} {"train_loss": -40.87458038330078, "global_step": 200562, "epoch": 1657} {"train_loss": -38.354915618896484, "global_step": 200563, "epoch": 1657} {"train_loss": -40.58998489379883, "global_step": 200564, "epoch": 1657} {"train_loss": -40.550045013427734, "global_step": 200565, "epoch": 1657} {"train_loss": -39.98675537109375, "global_step": 200566, "epoch": 1657} {"train_loss": -39.47145462036133, "global_step": 200567, "epoch": 1657} {"train_loss": -34.19499969482422, "global_step": 200568, "epoch": 1657} {"train_loss": -37.26847457885742, "global_step": 200569, "epoch": 1657} {"train_loss": -37.923095703125, "global_step": 200570, "epoch": 1657} {"train_loss": -39.031917572021484, "global_step": 200571, "epoch": 1657} {"train_loss": -40.62578201293945, "global_step": 200572, "epoch": 1657} {"train_loss": -39.61235046386719, "global_step": 200573, "epoch": 1657} {"train_loss": -39.065792083740234, "global_step": 200574, "epoch": 1657} {"train_loss": -34.47030258178711, "global_step": 200575, "epoch": 1657} {"train_loss": -40.04899978637695, "global_step": 200576, "epoch": 1657} {"train_loss": -40.008338928222656, "global_step": 200577, "epoch": 1657} {"train_loss": -38.76961898803711, "global_step": 200578, "epoch": 1657} {"train_loss": -38.0148811340332, "global_step": 200579, "epoch": 1657} {"train_loss": -40.69973373413086, "global_step": 200580, "epoch": 1657} {"train_loss": -39.78928756713867, "global_step": 200581, "epoch": 1657} {"train_loss": -40.351192474365234, "global_step": 200582, "epoch": 1657} {"train_loss": -39.74776840209961, "global_step": 200583, "epoch": 1657} {"train_loss": -39.23927688598633, "global_step": 200584, "epoch": 1657} {"train_loss": -39.988277435302734, "global_step": 200585, "epoch": 1657} {"train_loss": -37.752105712890625, "global_step": 200586, "epoch": 1657} {"train_loss": -37.670406341552734, "global_step": 200587, "epoch": 1657} {"train_loss": -40.46674728393555, "global_step": 200588, "epoch": 1657} {"train_loss": -39.677345275878906, "global_step": 200589, "epoch": 1657} {"train_loss": -35.43474197387695, "global_step": 200590, "epoch": 1657} {"train_loss": -40.672664642333984, "global_step": 200591, "epoch": 1657} {"train_loss": -39.274444580078125, "global_step": 200592, "epoch": 1657} {"train_loss": -36.50863265991211, "global_step": 200593, "epoch": 1657} {"train_loss": -37.68684768676758, "global_step": 200594, "epoch": 1657} {"train_loss": -39.58909225463867, "global_step": 200595, "epoch": 1657} {"train_loss": -40.884918212890625, "global_step": 200596, "epoch": 1657} {"train_loss": -38.77143478393555, "global_step": 200597, "epoch": 1657} {"train_loss": -38.86316680908203, "global_step": 200598, "epoch": 1657} {"train_loss": -40.60894775390625, "global_step": 200599, "epoch": 1657} {"train_loss": -39.07603073120117, "global_step": 200600, "epoch": 1657} {"train_loss": -38.40745162963867, "global_step": 200601, "epoch": 1657} {"train_loss": -40.37522888183594, "global_step": 200602, "epoch": 1657} {"train_loss": -40.734859466552734, "global_step": 200603, "epoch": 1657} {"train_loss": -37.625335693359375, "global_step": 200604, "epoch": 1657} {"train_loss": -39.7285270690918, "global_step": 200605, "epoch": 1657} {"train_loss": -38.98927688598633, "global_step": 200606, "epoch": 1657} {"train_loss": -40.089412689208984, "global_step": 200607, "epoch": 1657} {"train_loss": -41.00659942626953, "global_step": 200608, "epoch": 1657} {"train_loss": -39.85847091674805, "global_step": 200609, "epoch": 1657} {"train_loss": -37.677181243896484, "global_step": 200610, "epoch": 1657} {"train_loss": -40.29480743408203, "global_step": 200611, "epoch": 1657} {"train_loss": -38.92073059082031, "global_step": 200612, "epoch": 1657} {"train_loss": -41.04311752319336, "global_step": 200613, "epoch": 1657} {"train_loss": -37.93669509887695, "global_step": 200614, "epoch": 1657} {"train_loss": -40.28407669067383, "global_step": 200615, "epoch": 1657} {"train_loss": -40.767181396484375, "global_step": 200616, "epoch": 1657} {"train_loss": -40.09561428353806, "global_step": 200617, "epoch": 1657, "val_loss": 2655012.5} {"train_loss": -40.0842399597168, "global_step": 200618, "epoch": 1658} {"train_loss": -40.254119873046875, "global_step": 200619, "epoch": 1658} {"train_loss": -40.5639762878418, "global_step": 200620, "epoch": 1658} {"train_loss": -40.671138763427734, "global_step": 200621, "epoch": 1658} {"train_loss": -40.0625114440918, "global_step": 200622, "epoch": 1658} {"train_loss": -39.96921920776367, "global_step": 200623, "epoch": 1658} {"train_loss": -41.51105499267578, "global_step": 200624, "epoch": 1658} {"train_loss": -41.02801513671875, "global_step": 200625, "epoch": 1658} {"train_loss": -40.62595748901367, "global_step": 200626, "epoch": 1658} {"train_loss": -40.703678131103516, "global_step": 200627, "epoch": 1658} {"train_loss": -40.93974685668945, "global_step": 200628, "epoch": 1658} {"train_loss": -41.360416412353516, "global_step": 200629, "epoch": 1658} {"train_loss": -41.0147590637207, "global_step": 200630, "epoch": 1658} {"train_loss": -40.4389762878418, "global_step": 200631, "epoch": 1658} {"train_loss": -38.544803619384766, "global_step": 200632, "epoch": 1658} {"train_loss": -41.10597610473633, "global_step": 200633, "epoch": 1658} {"train_loss": -40.36027526855469, "global_step": 200634, "epoch": 1658} {"train_loss": -41.320068359375, "global_step": 200635, "epoch": 1658} {"train_loss": -40.86578369140625, "global_step": 200636, "epoch": 1658} {"train_loss": -41.179203033447266, "global_step": 200637, "epoch": 1658} {"train_loss": -40.4245719909668, "global_step": 200638, "epoch": 1658} {"train_loss": -40.74343490600586, "global_step": 200639, "epoch": 1658} {"train_loss": -38.737701416015625, "global_step": 200640, "epoch": 1658} {"train_loss": -40.897605895996094, "global_step": 200641, "epoch": 1658} {"train_loss": -39.778594970703125, "global_step": 200642, "epoch": 1658} {"train_loss": -40.02461624145508, "global_step": 200643, "epoch": 1658} {"train_loss": -40.16004180908203, "global_step": 200644, "epoch": 1658} {"train_loss": -39.44680404663086, "global_step": 200645, "epoch": 1658} {"train_loss": -39.99543380737305, "global_step": 200646, "epoch": 1658} {"train_loss": -40.317413330078125, "global_step": 200647, "epoch": 1658} {"train_loss": -41.51888656616211, "global_step": 200648, "epoch": 1658} {"train_loss": -38.72002029418945, "global_step": 200649, "epoch": 1658} {"train_loss": -40.54817581176758, "global_step": 200650, "epoch": 1658} {"train_loss": -39.552303314208984, "global_step": 200651, "epoch": 1658} {"train_loss": -41.19060134887695, "global_step": 200652, "epoch": 1658} {"train_loss": -40.3337516784668, "global_step": 200653, "epoch": 1658} {"train_loss": -40.570648193359375, "global_step": 200654, "epoch": 1658} {"train_loss": -41.10443115234375, "global_step": 200655, "epoch": 1658} {"train_loss": -40.17313766479492, "global_step": 200656, "epoch": 1658} {"train_loss": -41.429019927978516, "global_step": 200657, "epoch": 1658} {"train_loss": -41.35273361206055, "global_step": 200658, "epoch": 1658} {"train_loss": -40.83247756958008, "global_step": 200659, "epoch": 1658} {"train_loss": -41.28339385986328, "global_step": 200660, "epoch": 1658} {"train_loss": -40.454559326171875, "global_step": 200661, "epoch": 1658} {"train_loss": -41.27017593383789, "global_step": 200662, "epoch": 1658} {"train_loss": -40.63874053955078, "global_step": 200663, "epoch": 1658} {"train_loss": -39.766082763671875, "global_step": 200664, "epoch": 1658} {"train_loss": -39.1435432434082, "global_step": 200665, "epoch": 1658} {"train_loss": -38.830379486083984, "global_step": 200666, "epoch": 1658} {"train_loss": -40.10107421875, "global_step": 200667, "epoch": 1658} {"train_loss": -40.599700927734375, "global_step": 200668, "epoch": 1658} {"train_loss": -41.91116714477539, "global_step": 200669, "epoch": 1658} {"train_loss": -41.45400619506836, "global_step": 200670, "epoch": 1658} {"train_loss": -40.589202880859375, "global_step": 200671, "epoch": 1658} {"train_loss": -38.86286544799805, "global_step": 200672, "epoch": 1658} {"train_loss": -40.7379035949707, "global_step": 200673, "epoch": 1658} {"train_loss": -38.250038146972656, "global_step": 200674, "epoch": 1658} {"train_loss": -40.168521881103516, "global_step": 200675, "epoch": 1658} {"train_loss": -39.6163444519043, "global_step": 200676, "epoch": 1658} {"train_loss": -39.5355110168457, "global_step": 200677, "epoch": 1658} {"train_loss": -40.963470458984375, "global_step": 200678, "epoch": 1658} {"train_loss": -41.441078186035156, "global_step": 200679, "epoch": 1658} {"train_loss": -40.3511848449707, "global_step": 200680, "epoch": 1658} {"train_loss": -41.37124252319336, "global_step": 200681, "epoch": 1658} {"train_loss": -40.5216064453125, "global_step": 200682, "epoch": 1658} {"train_loss": -40.978694915771484, "global_step": 200683, "epoch": 1658} {"train_loss": -35.772254943847656, "global_step": 200684, "epoch": 1658} {"train_loss": -40.047298431396484, "global_step": 200685, "epoch": 1658} {"train_loss": -40.368934631347656, "global_step": 200686, "epoch": 1658} {"train_loss": -40.8642692565918, "global_step": 200687, "epoch": 1658} {"train_loss": -41.44901657104492, "global_step": 200688, "epoch": 1658} {"train_loss": -39.541168212890625, "global_step": 200689, "epoch": 1658} {"train_loss": -41.234413146972656, "global_step": 200690, "epoch": 1658} {"train_loss": -40.26361846923828, "global_step": 200691, "epoch": 1658} {"train_loss": -39.342464447021484, "global_step": 200692, "epoch": 1658} {"train_loss": -40.350685119628906, "global_step": 200693, "epoch": 1658} {"train_loss": -40.54255676269531, "global_step": 200694, "epoch": 1658} {"train_loss": -37.89799118041992, "global_step": 200695, "epoch": 1658} {"train_loss": -39.407752990722656, "global_step": 200696, "epoch": 1658} {"train_loss": -41.432838439941406, "global_step": 200697, "epoch": 1658} {"train_loss": -40.670196533203125, "global_step": 200698, "epoch": 1658} {"train_loss": -39.82845687866211, "global_step": 200699, "epoch": 1658} {"train_loss": -40.74382781982422, "global_step": 200700, "epoch": 1658} {"train_loss": -41.48204803466797, "global_step": 200701, "epoch": 1658} {"train_loss": -40.476802825927734, "global_step": 200702, "epoch": 1658} {"train_loss": -41.5168571472168, "global_step": 200703, "epoch": 1658} {"train_loss": -40.963592529296875, "global_step": 200704, "epoch": 1658} {"train_loss": -40.761837005615234, "global_step": 200705, "epoch": 1658} {"train_loss": -40.26249694824219, "global_step": 200706, "epoch": 1658} {"train_loss": -40.842063903808594, "global_step": 200707, "epoch": 1658} {"train_loss": -40.05712890625, "global_step": 200708, "epoch": 1658} {"train_loss": -40.17486572265625, "global_step": 200709, "epoch": 1658} {"train_loss": -40.69707107543945, "global_step": 200710, "epoch": 1658} {"train_loss": -39.8271484375, "global_step": 200711, "epoch": 1658} {"train_loss": -41.8674430847168, "global_step": 200712, "epoch": 1658} {"train_loss": -40.92276382446289, "global_step": 200713, "epoch": 1658} {"train_loss": -41.04142379760742, "global_step": 200714, "epoch": 1658} {"train_loss": -40.41290283203125, "global_step": 200715, "epoch": 1658} {"train_loss": -41.354248046875, "global_step": 200716, "epoch": 1658} {"train_loss": -40.96294021606445, "global_step": 200717, "epoch": 1658} {"train_loss": -40.668922424316406, "global_step": 200718, "epoch": 1658} {"train_loss": -40.84334945678711, "global_step": 200719, "epoch": 1658} {"train_loss": -41.34928894042969, "global_step": 200720, "epoch": 1658} {"train_loss": -41.01068878173828, "global_step": 200721, "epoch": 1658} {"train_loss": -41.023162841796875, "global_step": 200722, "epoch": 1658} {"train_loss": -41.6573600769043, "global_step": 200723, "epoch": 1658} {"train_loss": -41.4009895324707, "global_step": 200724, "epoch": 1658} {"train_loss": -40.406089782714844, "global_step": 200725, "epoch": 1658} {"train_loss": -40.58608627319336, "global_step": 200726, "epoch": 1658} {"train_loss": -41.10493087768555, "global_step": 200727, "epoch": 1658} {"train_loss": -41.37849807739258, "global_step": 200728, "epoch": 1658} {"train_loss": -40.70900344848633, "global_step": 200729, "epoch": 1658} {"train_loss": -40.489776611328125, "global_step": 200730, "epoch": 1658} {"train_loss": -40.60613250732422, "global_step": 200731, "epoch": 1658} {"train_loss": -39.355621337890625, "global_step": 200732, "epoch": 1658} {"train_loss": -40.038795471191406, "global_step": 200733, "epoch": 1658} {"train_loss": -41.30449295043945, "global_step": 200734, "epoch": 1658} {"train_loss": -40.46744918823242, "global_step": 200735, "epoch": 1658} {"train_loss": -39.98543930053711, "global_step": 200736, "epoch": 1658} {"train_loss": -38.859466552734375, "global_step": 200737, "epoch": 1658} {"train_loss": -40.439316804743996, "global_step": 200738, "epoch": 1658, "val_loss": 2563154.5} {"train_loss": -39.92866897583008, "global_step": 200739, "epoch": 1659} {"train_loss": -41.9215087890625, "global_step": 200740, "epoch": 1659} {"train_loss": -40.281227111816406, "global_step": 200741, "epoch": 1659} {"train_loss": -40.69823455810547, "global_step": 200742, "epoch": 1659} {"train_loss": -40.46969985961914, "global_step": 200743, "epoch": 1659} {"train_loss": -39.4453239440918, "global_step": 200744, "epoch": 1659} {"train_loss": -41.56563949584961, "global_step": 200745, "epoch": 1659} {"train_loss": -40.970947265625, "global_step": 200746, "epoch": 1659} {"train_loss": -40.433074951171875, "global_step": 200747, "epoch": 1659} {"train_loss": -40.506526947021484, "global_step": 200748, "epoch": 1659} {"train_loss": -40.523555755615234, "global_step": 200749, "epoch": 1659} {"train_loss": -40.94062805175781, "global_step": 200750, "epoch": 1659} {"train_loss": -41.12209701538086, "global_step": 200751, "epoch": 1659} {"train_loss": -39.67505645751953, "global_step": 200752, "epoch": 1659} {"train_loss": -40.85285186767578, "global_step": 200753, "epoch": 1659} {"train_loss": -39.377296447753906, "global_step": 200754, "epoch": 1659} {"train_loss": -41.01446533203125, "global_step": 200755, "epoch": 1659} {"train_loss": -39.25728988647461, "global_step": 200756, "epoch": 1659} {"train_loss": -41.4073600769043, "global_step": 200757, "epoch": 1659} {"train_loss": -40.35818099975586, "global_step": 200758, "epoch": 1659} {"train_loss": -40.63054275512695, "global_step": 200759, "epoch": 1659} {"train_loss": -40.7087516784668, "global_step": 200760, "epoch": 1659} {"train_loss": -39.017391204833984, "global_step": 200761, "epoch": 1659} {"train_loss": -39.59699630737305, "global_step": 200762, "epoch": 1659} {"train_loss": -39.37221908569336, "global_step": 200763, "epoch": 1659} {"train_loss": -40.69790267944336, "global_step": 200764, "epoch": 1659} {"train_loss": -38.68825149536133, "global_step": 200765, "epoch": 1659} {"train_loss": -40.798736572265625, "global_step": 200766, "epoch": 1659} {"train_loss": -40.66598129272461, "global_step": 200767, "epoch": 1659} {"train_loss": -41.623409271240234, "global_step": 200768, "epoch": 1659} {"train_loss": -39.831424713134766, "global_step": 200769, "epoch": 1659} {"train_loss": -39.41120147705078, "global_step": 200770, "epoch": 1659} {"train_loss": -39.746246337890625, "global_step": 200771, "epoch": 1659} {"train_loss": -41.043758392333984, "global_step": 200772, "epoch": 1659} {"train_loss": -40.66990661621094, "global_step": 200773, "epoch": 1659} {"train_loss": -38.859764099121094, "global_step": 200774, "epoch": 1659} {"train_loss": -40.22765350341797, "global_step": 200775, "epoch": 1659} {"train_loss": -41.63557434082031, "global_step": 200776, "epoch": 1659} {"train_loss": -41.4005126953125, "global_step": 200777, "epoch": 1659} {"train_loss": -39.66926574707031, "global_step": 200778, "epoch": 1659} {"train_loss": -40.57797622680664, "global_step": 200779, "epoch": 1659} {"train_loss": -41.3463020324707, "global_step": 200780, "epoch": 1659} {"train_loss": -39.711456298828125, "global_step": 200781, "epoch": 1659} {"train_loss": -40.6368293762207, "global_step": 200782, "epoch": 1659} {"train_loss": -40.94886016845703, "global_step": 200783, "epoch": 1659} {"train_loss": -40.343196868896484, "global_step": 200784, "epoch": 1659} {"train_loss": -41.616275787353516, "global_step": 200785, "epoch": 1659} {"train_loss": -40.990028381347656, "global_step": 200786, "epoch": 1659} {"train_loss": -40.520896911621094, "global_step": 200787, "epoch": 1659} {"train_loss": -41.37008285522461, "global_step": 200788, "epoch": 1659} {"train_loss": -40.3031120300293, "global_step": 200789, "epoch": 1659} {"train_loss": -40.86930465698242, "global_step": 200790, "epoch": 1659} {"train_loss": -40.742774963378906, "global_step": 200791, "epoch": 1659} {"train_loss": -40.31623077392578, "global_step": 200792, "epoch": 1659} {"train_loss": -40.9476203918457, "global_step": 200793, "epoch": 1659} {"train_loss": -41.510162353515625, "global_step": 200794, "epoch": 1659} {"train_loss": -40.99646759033203, "global_step": 200795, "epoch": 1659} {"train_loss": -40.53291702270508, "global_step": 200796, "epoch": 1659} {"train_loss": -39.71564865112305, "global_step": 200797, "epoch": 1659} {"train_loss": -41.866695404052734, "global_step": 200798, "epoch": 1659} {"train_loss": -40.80633544921875, "global_step": 200799, "epoch": 1659} {"train_loss": -41.91178512573242, "global_step": 200800, "epoch": 1659} {"train_loss": -40.755584716796875, "global_step": 200801, "epoch": 1659} {"train_loss": -41.69428634643555, "global_step": 200802, "epoch": 1659} {"train_loss": -41.797943115234375, "global_step": 200803, "epoch": 1659} {"train_loss": -42.0592041015625, "global_step": 200804, "epoch": 1659} {"train_loss": -41.79177474975586, "global_step": 200805, "epoch": 1659} {"train_loss": -37.777523040771484, "global_step": 200806, "epoch": 1659} {"train_loss": -41.956092834472656, "global_step": 200807, "epoch": 1659} {"train_loss": -42.047149658203125, "global_step": 200808, "epoch": 1659} {"train_loss": -41.9837532043457, "global_step": 200809, "epoch": 1659} {"train_loss": -41.82786178588867, "global_step": 200810, "epoch": 1659} {"train_loss": -41.58879089355469, "global_step": 200811, "epoch": 1659} {"train_loss": -40.561824798583984, "global_step": 200812, "epoch": 1659} {"train_loss": -37.48540115356445, "global_step": 200813, "epoch": 1659} {"train_loss": -40.53253173828125, "global_step": 200814, "epoch": 1659} {"train_loss": -40.293861389160156, "global_step": 200815, "epoch": 1659} {"train_loss": -40.073272705078125, "global_step": 200816, "epoch": 1659} {"train_loss": -40.24970245361328, "global_step": 200817, "epoch": 1659} {"train_loss": -37.9642219543457, "global_step": 200818, "epoch": 1659} {"train_loss": -41.699886322021484, "global_step": 200819, "epoch": 1659} {"train_loss": -40.773983001708984, "global_step": 200820, "epoch": 1659} {"train_loss": -34.1029052734375, "global_step": 200821, "epoch": 1659} {"train_loss": -41.02812576293945, "global_step": 200822, "epoch": 1659} {"train_loss": -41.545318603515625, "global_step": 200823, "epoch": 1659} {"train_loss": -39.38753890991211, "global_step": 200824, "epoch": 1659} {"train_loss": -41.38969039916992, "global_step": 200825, "epoch": 1659} {"train_loss": -40.39622116088867, "global_step": 200826, "epoch": 1659} {"train_loss": -40.2347526550293, "global_step": 200827, "epoch": 1659} {"train_loss": -41.057647705078125, "global_step": 200828, "epoch": 1659} {"train_loss": -40.37067794799805, "global_step": 200829, "epoch": 1659} {"train_loss": -41.0390510559082, "global_step": 200830, "epoch": 1659} {"train_loss": -35.66271209716797, "global_step": 200831, "epoch": 1659} {"train_loss": -38.05991744995117, "global_step": 200832, "epoch": 1659} {"train_loss": -35.60921096801758, "global_step": 200833, "epoch": 1659} {"train_loss": -39.837562561035156, "global_step": 200834, "epoch": 1659} {"train_loss": -39.56559371948242, "global_step": 200835, "epoch": 1659} {"train_loss": -39.412899017333984, "global_step": 200836, "epoch": 1659} {"train_loss": -41.40619659423828, "global_step": 200837, "epoch": 1659} {"train_loss": -40.9007453918457, "global_step": 200838, "epoch": 1659} {"train_loss": -39.797054290771484, "global_step": 200839, "epoch": 1659} {"train_loss": -40.81629180908203, "global_step": 200840, "epoch": 1659} {"train_loss": -38.74288558959961, "global_step": 200841, "epoch": 1659} {"train_loss": -41.398681640625, "global_step": 200842, "epoch": 1659} {"train_loss": -40.85618209838867, "global_step": 200843, "epoch": 1659} {"train_loss": -40.27927780151367, "global_step": 200844, "epoch": 1659} {"train_loss": -40.576812744140625, "global_step": 200845, "epoch": 1659} {"train_loss": -39.03084945678711, "global_step": 200846, "epoch": 1659} {"train_loss": -39.49124526977539, "global_step": 200847, "epoch": 1659} {"train_loss": -41.04411697387695, "global_step": 200848, "epoch": 1659} {"train_loss": -41.04972839355469, "global_step": 200849, "epoch": 1659} {"train_loss": -40.968074798583984, "global_step": 200850, "epoch": 1659} {"train_loss": -39.38540267944336, "global_step": 200851, "epoch": 1659} {"train_loss": -40.79927444458008, "global_step": 200852, "epoch": 1659} {"train_loss": -41.48711013793945, "global_step": 200853, "epoch": 1659} {"train_loss": -41.10325622558594, "global_step": 200854, "epoch": 1659} {"train_loss": -40.286251068115234, "global_step": 200855, "epoch": 1659} {"train_loss": -39.462867736816406, "global_step": 200856, "epoch": 1659} {"train_loss": -41.64686965942383, "global_step": 200857, "epoch": 1659} {"train_loss": -39.661041259765625, "global_step": 200858, "epoch": 1659} {"train_loss": -40.341310611441116, "global_step": 200859, "epoch": 1659, "val_loss": 2732429.75} {"train_loss": -38.65935134887695, "global_step": 200860, "epoch": 1660} {"train_loss": -40.358551025390625, "global_step": 200861, "epoch": 1660} {"train_loss": -38.93819808959961, "global_step": 200862, "epoch": 1660} {"train_loss": -39.352970123291016, "global_step": 200863, "epoch": 1660} {"train_loss": -40.089576721191406, "global_step": 200864, "epoch": 1660} {"train_loss": -40.413299560546875, "global_step": 200865, "epoch": 1660} {"train_loss": -37.78443145751953, "global_step": 200866, "epoch": 1660} {"train_loss": -40.50889587402344, "global_step": 200867, "epoch": 1660} {"train_loss": -41.020240783691406, "global_step": 200868, "epoch": 1660} {"train_loss": -40.64857482910156, "global_step": 200869, "epoch": 1660} {"train_loss": -40.915626525878906, "global_step": 200870, "epoch": 1660} {"train_loss": -40.839786529541016, "global_step": 200871, "epoch": 1660} {"train_loss": -41.26495361328125, "global_step": 200872, "epoch": 1660} {"train_loss": -40.12862777709961, "global_step": 200873, "epoch": 1660} {"train_loss": -39.948455810546875, "global_step": 200874, "epoch": 1660} {"train_loss": -40.87566375732422, "global_step": 200875, "epoch": 1660} {"train_loss": -41.6885871887207, "global_step": 200876, "epoch": 1660} {"train_loss": -41.08892059326172, "global_step": 200877, "epoch": 1660} {"train_loss": -41.412689208984375, "global_step": 200878, "epoch": 1660} {"train_loss": -41.12118148803711, "global_step": 200879, "epoch": 1660} {"train_loss": -40.76513671875, "global_step": 200880, "epoch": 1660} {"train_loss": -41.28371810913086, "global_step": 200881, "epoch": 1660} {"train_loss": -41.21484375, "global_step": 200882, "epoch": 1660} {"train_loss": -40.66535568237305, "global_step": 200883, "epoch": 1660} {"train_loss": -41.64844512939453, "global_step": 200884, "epoch": 1660} {"train_loss": -40.84010696411133, "global_step": 200885, "epoch": 1660} {"train_loss": -40.927284240722656, "global_step": 200886, "epoch": 1660} {"train_loss": -41.12969207763672, "global_step": 200887, "epoch": 1660} {"train_loss": -41.082393646240234, "global_step": 200888, "epoch": 1660} {"train_loss": -40.869564056396484, "global_step": 200889, "epoch": 1660} {"train_loss": -41.131744384765625, "global_step": 200890, "epoch": 1660} {"train_loss": -41.16261672973633, "global_step": 200891, "epoch": 1660} {"train_loss": -38.79848098754883, "global_step": 200892, "epoch": 1660} {"train_loss": -40.105953216552734, "global_step": 200893, "epoch": 1660} {"train_loss": -39.16524124145508, "global_step": 200894, "epoch": 1660} {"train_loss": -41.2066650390625, "global_step": 200895, "epoch": 1660} {"train_loss": -40.65499496459961, "global_step": 200896, "epoch": 1660} {"train_loss": -41.31519317626953, "global_step": 200897, "epoch": 1660} {"train_loss": -40.055885314941406, "global_step": 200898, "epoch": 1660} {"train_loss": -40.94146728515625, "global_step": 200899, "epoch": 1660} {"train_loss": -41.10779571533203, "global_step": 200900, "epoch": 1660} {"train_loss": -36.9024772644043, "global_step": 200901, "epoch": 1660} {"train_loss": -39.55315399169922, "global_step": 200902, "epoch": 1660} {"train_loss": -41.2728385925293, "global_step": 200903, "epoch": 1660} {"train_loss": -39.914913177490234, "global_step": 200904, "epoch": 1660} {"train_loss": -39.74119186401367, "global_step": 200905, "epoch": 1660} {"train_loss": -41.28620529174805, "global_step": 200906, "epoch": 1660} {"train_loss": -39.22695541381836, "global_step": 200907, "epoch": 1660} {"train_loss": -39.75474166870117, "global_step": 200908, "epoch": 1660} {"train_loss": -40.91006088256836, "global_step": 200909, "epoch": 1660} {"train_loss": -40.288082122802734, "global_step": 200910, "epoch": 1660} {"train_loss": -39.456233978271484, "global_step": 200911, "epoch": 1660} {"train_loss": -40.246864318847656, "global_step": 200912, "epoch": 1660} {"train_loss": -40.220130920410156, "global_step": 200913, "epoch": 1660} {"train_loss": -39.19258499145508, "global_step": 200914, "epoch": 1660} {"train_loss": -38.98676300048828, "global_step": 200915, "epoch": 1660} {"train_loss": -38.604732513427734, "global_step": 200916, "epoch": 1660} {"train_loss": -40.126705169677734, "global_step": 200917, "epoch": 1660} {"train_loss": -39.02360153198242, "global_step": 200918, "epoch": 1660} {"train_loss": -39.79841613769531, "global_step": 200919, "epoch": 1660} {"train_loss": -38.961551666259766, "global_step": 200920, "epoch": 1660} {"train_loss": -40.2424430847168, "global_step": 200921, "epoch": 1660} {"train_loss": -39.83225631713867, "global_step": 200922, "epoch": 1660} {"train_loss": -39.73788833618164, "global_step": 200923, "epoch": 1660} {"train_loss": -38.3398323059082, "global_step": 200924, "epoch": 1660} {"train_loss": -41.143898010253906, "global_step": 200925, "epoch": 1660} {"train_loss": -41.130611419677734, "global_step": 200926, "epoch": 1660} {"train_loss": -41.04905319213867, "global_step": 200927, "epoch": 1660} {"train_loss": -40.12699508666992, "global_step": 200928, "epoch": 1660} {"train_loss": -41.191158294677734, "global_step": 200929, "epoch": 1660} {"train_loss": -37.4501953125, "global_step": 200930, "epoch": 1660} {"train_loss": -41.026546478271484, "global_step": 200931, "epoch": 1660} {"train_loss": -39.34116744995117, "global_step": 200932, "epoch": 1660} {"train_loss": -40.223243713378906, "global_step": 200933, "epoch": 1660} {"train_loss": -40.68807601928711, "global_step": 200934, "epoch": 1660} {"train_loss": -38.88240051269531, "global_step": 200935, "epoch": 1660} {"train_loss": -40.56034469604492, "global_step": 200936, "epoch": 1660} {"train_loss": -39.52875518798828, "global_step": 200937, "epoch": 1660} {"train_loss": -40.42757797241211, "global_step": 200938, "epoch": 1660} {"train_loss": -39.46241760253906, "global_step": 200939, "epoch": 1660} {"train_loss": -40.0965576171875, "global_step": 200940, "epoch": 1660} {"train_loss": -40.84553527832031, "global_step": 200941, "epoch": 1660} {"train_loss": -41.3521842956543, "global_step": 200942, "epoch": 1660} {"train_loss": -41.48308181762695, "global_step": 200943, "epoch": 1660} {"train_loss": -41.51249694824219, "global_step": 200944, "epoch": 1660} {"train_loss": -40.46700668334961, "global_step": 200945, "epoch": 1660} {"train_loss": -41.3791618347168, "global_step": 200946, "epoch": 1660} {"train_loss": -41.67692947387695, "global_step": 200947, "epoch": 1660} {"train_loss": -40.61149978637695, "global_step": 200948, "epoch": 1660} {"train_loss": -41.35025405883789, "global_step": 200949, "epoch": 1660} {"train_loss": -40.89804458618164, "global_step": 200950, "epoch": 1660} {"train_loss": -40.47902297973633, "global_step": 200951, "epoch": 1660} {"train_loss": -40.10002517700195, "global_step": 200952, "epoch": 1660} {"train_loss": -38.72805404663086, "global_step": 200953, "epoch": 1660} {"train_loss": -40.37092971801758, "global_step": 200954, "epoch": 1660} {"train_loss": -41.18433380126953, "global_step": 200955, "epoch": 1660} {"train_loss": -40.50691604614258, "global_step": 200956, "epoch": 1660} {"train_loss": -41.15687561035156, "global_step": 200957, "epoch": 1660} {"train_loss": -40.60170364379883, "global_step": 200958, "epoch": 1660} {"train_loss": -40.83186721801758, "global_step": 200959, "epoch": 1660} {"train_loss": -41.05656814575195, "global_step": 200960, "epoch": 1660} {"train_loss": -40.30091857910156, "global_step": 200961, "epoch": 1660} {"train_loss": -41.15447998046875, "global_step": 200962, "epoch": 1660} {"train_loss": -41.32520294189453, "global_step": 200963, "epoch": 1660} {"train_loss": -40.340003967285156, "global_step": 200964, "epoch": 1660} {"train_loss": -41.39205551147461, "global_step": 200965, "epoch": 1660} {"train_loss": -41.01847457885742, "global_step": 200966, "epoch": 1660} {"train_loss": -40.86963653564453, "global_step": 200967, "epoch": 1660} {"train_loss": -39.63297653198242, "global_step": 200968, "epoch": 1660} {"train_loss": -40.787025451660156, "global_step": 200969, "epoch": 1660} {"train_loss": -39.46064758300781, "global_step": 200970, "epoch": 1660} {"train_loss": -40.18073654174805, "global_step": 200971, "epoch": 1660} {"train_loss": -39.093143463134766, "global_step": 200972, "epoch": 1660} {"train_loss": -39.21902084350586, "global_step": 200973, "epoch": 1660} {"train_loss": -38.391456604003906, "global_step": 200974, "epoch": 1660} {"train_loss": -39.13710403442383, "global_step": 200975, "epoch": 1660} {"train_loss": -40.04663848876953, "global_step": 200976, "epoch": 1660} {"train_loss": -39.598724365234375, "global_step": 200977, "epoch": 1660} {"train_loss": -39.93225860595703, "global_step": 200978, "epoch": 1660} {"train_loss": -41.11165237426758, "global_step": 200979, "epoch": 1660} {"train_loss": -40.30007748564413, "global_step": 200980, "epoch": 1660, "val_loss": 2611107.0} {"train_loss": -40.041481018066406, "global_step": 200981, "epoch": 1661} {"train_loss": -39.88825607299805, "global_step": 200982, "epoch": 1661} {"train_loss": -39.1082763671875, "global_step": 200983, "epoch": 1661} {"train_loss": -40.136905670166016, "global_step": 200984, "epoch": 1661} {"train_loss": -41.2296257019043, "global_step": 200985, "epoch": 1661} {"train_loss": -40.20718765258789, "global_step": 200986, "epoch": 1661} {"train_loss": -40.663143157958984, "global_step": 200987, "epoch": 1661} {"train_loss": -40.44682693481445, "global_step": 200988, "epoch": 1661} {"train_loss": -40.83827590942383, "global_step": 200989, "epoch": 1661} {"train_loss": -40.26980209350586, "global_step": 200990, "epoch": 1661} {"train_loss": -41.00132369995117, "global_step": 200991, "epoch": 1661} {"train_loss": -41.826045989990234, "global_step": 200992, "epoch": 1661} {"train_loss": -40.3097038269043, "global_step": 200993, "epoch": 1661} {"train_loss": -41.039703369140625, "global_step": 200994, "epoch": 1661} {"train_loss": -40.91303634643555, "global_step": 200995, "epoch": 1661} {"train_loss": -41.3879508972168, "global_step": 200996, "epoch": 1661} {"train_loss": -40.72842025756836, "global_step": 200997, "epoch": 1661} {"train_loss": -41.08124542236328, "global_step": 200998, "epoch": 1661} {"train_loss": -42.041358947753906, "global_step": 200999, "epoch": 1661} {"train_loss": -42.0408821105957, "global_step": 201000, "epoch": 1661} {"train_loss": -40.95771026611328, "global_step": 201001, "epoch": 1661} {"train_loss": -41.3598747253418, "global_step": 201002, "epoch": 1661} {"train_loss": -41.62717056274414, "global_step": 201003, "epoch": 1661} {"train_loss": -40.72420120239258, "global_step": 201004, "epoch": 1661} {"train_loss": -42.01161575317383, "global_step": 201005, "epoch": 1661} {"train_loss": -41.88360595703125, "global_step": 201006, "epoch": 1661} {"train_loss": -41.82731246948242, "global_step": 201007, "epoch": 1661} {"train_loss": -42.429908752441406, "global_step": 201008, "epoch": 1661} {"train_loss": -42.11848831176758, "global_step": 201009, "epoch": 1661} {"train_loss": -40.544105529785156, "global_step": 201010, "epoch": 1661} {"train_loss": -41.9704475402832, "global_step": 201011, "epoch": 1661} {"train_loss": -42.294124603271484, "global_step": 201012, "epoch": 1661} {"train_loss": -42.18572235107422, "global_step": 201013, "epoch": 1661} {"train_loss": -42.1432991027832, "global_step": 201014, "epoch": 1661} {"train_loss": -42.51153564453125, "global_step": 201015, "epoch": 1661} {"train_loss": -42.6087646484375, "global_step": 201016, "epoch": 1661} {"train_loss": -41.22270584106445, "global_step": 201017, "epoch": 1661} {"train_loss": -41.4697151184082, "global_step": 201018, "epoch": 1661} {"train_loss": -42.5828971862793, "global_step": 201019, "epoch": 1661} {"train_loss": -42.44415283203125, "global_step": 201020, "epoch": 1661} {"train_loss": -42.316349029541016, "global_step": 201021, "epoch": 1661} {"train_loss": -42.210418701171875, "global_step": 201022, "epoch": 1661} {"train_loss": -41.78605270385742, "global_step": 201023, "epoch": 1661} {"train_loss": -42.32658004760742, "global_step": 201024, "epoch": 1661} {"train_loss": -41.552703857421875, "global_step": 201025, "epoch": 1661} {"train_loss": -41.81058883666992, "global_step": 201026, "epoch": 1661} {"train_loss": -41.72468948364258, "global_step": 201027, "epoch": 1661} {"train_loss": -42.007965087890625, "global_step": 201028, "epoch": 1661} {"train_loss": -42.280426025390625, "global_step": 201029, "epoch": 1661} {"train_loss": -42.29259490966797, "global_step": 201030, "epoch": 1661} {"train_loss": -42.64494323730469, "global_step": 201031, "epoch": 1661} {"train_loss": -42.58871078491211, "global_step": 201032, "epoch": 1661} {"train_loss": -42.24610137939453, "global_step": 201033, "epoch": 1661} {"train_loss": -42.15286636352539, "global_step": 201034, "epoch": 1661} {"train_loss": -42.019371032714844, "global_step": 201035, "epoch": 1661} {"train_loss": -41.256622314453125, "global_step": 201036, "epoch": 1661} {"train_loss": -39.964927673339844, "global_step": 201037, "epoch": 1661} {"train_loss": -39.033912658691406, "global_step": 201038, "epoch": 1661} {"train_loss": -35.29713439941406, "global_step": 201039, "epoch": 1661} {"train_loss": -28.290430068969727, "global_step": 201040, "epoch": 1661} {"train_loss": -35.738197326660156, "global_step": 201041, "epoch": 1661} {"train_loss": -37.5337028503418, "global_step": 201042, "epoch": 1661} {"train_loss": -40.4521598815918, "global_step": 201043, "epoch": 1661} {"train_loss": -39.54336166381836, "global_step": 201044, "epoch": 1661} {"train_loss": -36.99028396606445, "global_step": 201045, "epoch": 1661} {"train_loss": -37.29058074951172, "global_step": 201046, "epoch": 1661} {"train_loss": -40.06521224975586, "global_step": 201047, "epoch": 1661} {"train_loss": -38.832088470458984, "global_step": 201048, "epoch": 1661} {"train_loss": -40.56340408325195, "global_step": 201049, "epoch": 1661} {"train_loss": -39.48881149291992, "global_step": 201050, "epoch": 1661} {"train_loss": -40.030677795410156, "global_step": 201051, "epoch": 1661} {"train_loss": -37.278411865234375, "global_step": 201052, "epoch": 1661} {"train_loss": -39.26803207397461, "global_step": 201053, "epoch": 1661} {"train_loss": -39.44561767578125, "global_step": 201054, "epoch": 1661} {"train_loss": -39.90910720825195, "global_step": 201055, "epoch": 1661} {"train_loss": -40.3695068359375, "global_step": 201056, "epoch": 1661} {"train_loss": -35.606815338134766, "global_step": 201057, "epoch": 1661} {"train_loss": -38.932861328125, "global_step": 201058, "epoch": 1661} {"train_loss": -39.86866760253906, "global_step": 201059, "epoch": 1661} {"train_loss": -41.27128982543945, "global_step": 201060, "epoch": 1661} {"train_loss": -29.813037872314453, "global_step": 201061, "epoch": 1661} {"train_loss": -38.582576751708984, "global_step": 201062, "epoch": 1661} {"train_loss": -34.15983200073242, "global_step": 201063, "epoch": 1661} {"train_loss": -40.13044738769531, "global_step": 201064, "epoch": 1661} {"train_loss": -38.27216720581055, "global_step": 201065, "epoch": 1661} {"train_loss": -40.40130615234375, "global_step": 201066, "epoch": 1661} {"train_loss": -39.62614059448242, "global_step": 201067, "epoch": 1661} {"train_loss": -39.65684127807617, "global_step": 201068, "epoch": 1661} {"train_loss": -39.416290283203125, "global_step": 201069, "epoch": 1661} {"train_loss": -33.9735221862793, "global_step": 201070, "epoch": 1661} {"train_loss": -35.27756118774414, "global_step": 201071, "epoch": 1661} {"train_loss": -36.36798095703125, "global_step": 201072, "epoch": 1661} {"train_loss": -38.636749267578125, "global_step": 201073, "epoch": 1661} {"train_loss": -40.72571563720703, "global_step": 201074, "epoch": 1661} {"train_loss": -30.96184730529785, "global_step": 201075, "epoch": 1661} {"train_loss": -33.441131591796875, "global_step": 201076, "epoch": 1661} {"train_loss": -35.66788864135742, "global_step": 201077, "epoch": 1661} {"train_loss": -28.04129981994629, "global_step": 201078, "epoch": 1661} {"train_loss": -32.663307189941406, "global_step": 201079, "epoch": 1661} {"train_loss": -29.948535919189453, "global_step": 201080, "epoch": 1661} {"train_loss": -32.742774963378906, "global_step": 201081, "epoch": 1661} {"train_loss": -38.114479064941406, "global_step": 201082, "epoch": 1661} {"train_loss": -33.91610336303711, "global_step": 201083, "epoch": 1661} {"train_loss": -36.65749740600586, "global_step": 201084, "epoch": 1661} {"train_loss": -35.93549728393555, "global_step": 201085, "epoch": 1661} {"train_loss": -34.374603271484375, "global_step": 201086, "epoch": 1661} {"train_loss": -37.40596008300781, "global_step": 201087, "epoch": 1661} {"train_loss": -38.18980026245117, "global_step": 201088, "epoch": 1661} {"train_loss": -28.81778907775879, "global_step": 201089, "epoch": 1661} {"train_loss": -35.31748580932617, "global_step": 201090, "epoch": 1661} {"train_loss": -37.395843505859375, "global_step": 201091, "epoch": 1661} {"train_loss": -35.9445915222168, "global_step": 201092, "epoch": 1661} {"train_loss": -36.45600128173828, "global_step": 201093, "epoch": 1661} {"train_loss": -38.07002639770508, "global_step": 201094, "epoch": 1661} {"train_loss": -36.436405181884766, "global_step": 201095, "epoch": 1661} {"train_loss": -34.82262420654297, "global_step": 201096, "epoch": 1661} {"train_loss": -36.42611312866211, "global_step": 201097, "epoch": 1661} {"train_loss": -36.04536437988281, "global_step": 201098, "epoch": 1661} {"train_loss": -38.037628173828125, "global_step": 201099, "epoch": 1661} {"train_loss": -37.65500259399414, "global_step": 201100, "epoch": 1661} {"train_loss": -38.99311021536835, "global_step": 201101, "epoch": 1661, "val_loss": 2585848.0} {"train_loss": -38.25938034057617, "global_step": 201102, "epoch": 1662} {"train_loss": -37.859771728515625, "global_step": 201103, "epoch": 1662} {"train_loss": -38.14706039428711, "global_step": 201104, "epoch": 1662} {"train_loss": -38.3973274230957, "global_step": 201105, "epoch": 1662} {"train_loss": -36.96796417236328, "global_step": 201106, "epoch": 1662} {"train_loss": -38.56877899169922, "global_step": 201107, "epoch": 1662} {"train_loss": -39.349464416503906, "global_step": 201108, "epoch": 1662} {"train_loss": -39.2451171875, "global_step": 201109, "epoch": 1662} {"train_loss": -38.34901428222656, "global_step": 201110, "epoch": 1662} {"train_loss": -39.61601638793945, "global_step": 201111, "epoch": 1662} {"train_loss": -38.6049690246582, "global_step": 201112, "epoch": 1662} {"train_loss": -38.643062591552734, "global_step": 201113, "epoch": 1662} {"train_loss": -38.9067497253418, "global_step": 201114, "epoch": 1662} {"train_loss": -39.2041130065918, "global_step": 201115, "epoch": 1662} {"train_loss": -38.985679626464844, "global_step": 201116, "epoch": 1662} {"train_loss": -38.9409294128418, "global_step": 201117, "epoch": 1662} {"train_loss": -39.385982513427734, "global_step": 201118, "epoch": 1662} {"train_loss": -39.363216400146484, "global_step": 201119, "epoch": 1662} {"train_loss": -38.71673583984375, "global_step": 201120, "epoch": 1662} {"train_loss": -39.33176803588867, "global_step": 201121, "epoch": 1662} {"train_loss": -39.095703125, "global_step": 201122, "epoch": 1662} {"train_loss": -39.972774505615234, "global_step": 201123, "epoch": 1662} {"train_loss": -39.34362030029297, "global_step": 201124, "epoch": 1662} {"train_loss": -38.90525436401367, "global_step": 201125, "epoch": 1662} {"train_loss": -39.244632720947266, "global_step": 201126, "epoch": 1662} {"train_loss": -39.316951751708984, "global_step": 201127, "epoch": 1662} {"train_loss": -39.976234436035156, "global_step": 201128, "epoch": 1662} {"train_loss": -40.02650833129883, "global_step": 201129, "epoch": 1662} {"train_loss": -40.22126007080078, "global_step": 201130, "epoch": 1662} {"train_loss": -40.39973449707031, "global_step": 201131, "epoch": 1662} {"train_loss": -40.2288932800293, "global_step": 201132, "epoch": 1662} {"train_loss": -40.176429748535156, "global_step": 201133, "epoch": 1662} {"train_loss": -40.5607795715332, "global_step": 201134, "epoch": 1662} {"train_loss": -40.02411651611328, "global_step": 201135, "epoch": 1662} {"train_loss": -39.90925216674805, "global_step": 201136, "epoch": 1662} {"train_loss": -40.031089782714844, "global_step": 201137, "epoch": 1662} {"train_loss": -40.20305633544922, "global_step": 201138, "epoch": 1662} {"train_loss": -40.926204681396484, "global_step": 201139, "epoch": 1662} {"train_loss": -40.32573699951172, "global_step": 201140, "epoch": 1662} {"train_loss": -39.630088806152344, "global_step": 201141, "epoch": 1662} {"train_loss": -40.80577087402344, "global_step": 201142, "epoch": 1662} {"train_loss": -40.0127067565918, "global_step": 201143, "epoch": 1662} {"train_loss": -40.415103912353516, "global_step": 201144, "epoch": 1662} {"train_loss": -40.52143096923828, "global_step": 201145, "epoch": 1662} {"train_loss": -41.05288314819336, "global_step": 201146, "epoch": 1662} {"train_loss": -41.04659652709961, "global_step": 201147, "epoch": 1662} {"train_loss": -40.356082916259766, "global_step": 201148, "epoch": 1662} {"train_loss": -40.897117614746094, "global_step": 201149, "epoch": 1662} {"train_loss": -40.60995101928711, "global_step": 201150, "epoch": 1662} {"train_loss": -40.757320404052734, "global_step": 201151, "epoch": 1662} {"train_loss": -41.02785873413086, "global_step": 201152, "epoch": 1662} {"train_loss": -39.41019821166992, "global_step": 201153, "epoch": 1662} {"train_loss": -41.02223205566406, "global_step": 201154, "epoch": 1662} {"train_loss": -40.751502990722656, "global_step": 201155, "epoch": 1662} {"train_loss": -41.30720138549805, "global_step": 201156, "epoch": 1662} {"train_loss": -40.892494201660156, "global_step": 201157, "epoch": 1662} {"train_loss": -40.970863342285156, "global_step": 201158, "epoch": 1662} {"train_loss": -40.64036178588867, "global_step": 201159, "epoch": 1662} {"train_loss": -41.62488555908203, "global_step": 201160, "epoch": 1662} {"train_loss": -41.23455810546875, "global_step": 201161, "epoch": 1662} {"train_loss": -40.294734954833984, "global_step": 201162, "epoch": 1662} {"train_loss": -40.98873519897461, "global_step": 201163, "epoch": 1662} {"train_loss": -41.358131408691406, "global_step": 201164, "epoch": 1662} {"train_loss": -41.39021682739258, "global_step": 201165, "epoch": 1662} {"train_loss": -41.0920524597168, "global_step": 201166, "epoch": 1662} {"train_loss": -40.22730255126953, "global_step": 201167, "epoch": 1662} {"train_loss": -41.1691780090332, "global_step": 201168, "epoch": 1662} {"train_loss": -41.179107666015625, "global_step": 201169, "epoch": 1662} {"train_loss": -41.562557220458984, "global_step": 201170, "epoch": 1662} {"train_loss": -41.41324996948242, "global_step": 201171, "epoch": 1662} {"train_loss": -41.45255661010742, "global_step": 201172, "epoch": 1662} {"train_loss": -41.55772018432617, "global_step": 201173, "epoch": 1662} {"train_loss": -41.2524528503418, "global_step": 201174, "epoch": 1662} {"train_loss": -41.6899299621582, "global_step": 201175, "epoch": 1662} {"train_loss": -41.04338073730469, "global_step": 201176, "epoch": 1662} {"train_loss": -41.29873275756836, "global_step": 201177, "epoch": 1662} {"train_loss": -41.46965789794922, "global_step": 201178, "epoch": 1662} {"train_loss": -41.05483627319336, "global_step": 201179, "epoch": 1662} {"train_loss": -41.16815948486328, "global_step": 201180, "epoch": 1662} {"train_loss": -41.383358001708984, "global_step": 201181, "epoch": 1662} {"train_loss": -40.905059814453125, "global_step": 201182, "epoch": 1662} {"train_loss": -40.83830642700195, "global_step": 201183, "epoch": 1662} {"train_loss": -40.95689010620117, "global_step": 201184, "epoch": 1662} {"train_loss": -41.882442474365234, "global_step": 201185, "epoch": 1662} {"train_loss": -41.635616302490234, "global_step": 201186, "epoch": 1662} {"train_loss": -40.59055709838867, "global_step": 201187, "epoch": 1662} {"train_loss": -41.156192779541016, "global_step": 201188, "epoch": 1662} {"train_loss": -39.977108001708984, "global_step": 201189, "epoch": 1662} {"train_loss": -40.77757263183594, "global_step": 201190, "epoch": 1662} {"train_loss": -41.31300735473633, "global_step": 201191, "epoch": 1662} {"train_loss": -41.23562240600586, "global_step": 201192, "epoch": 1662} {"train_loss": -41.51810073852539, "global_step": 201193, "epoch": 1662} {"train_loss": -40.845306396484375, "global_step": 201194, "epoch": 1662} {"train_loss": -40.999446868896484, "global_step": 201195, "epoch": 1662} {"train_loss": -41.69121170043945, "global_step": 201196, "epoch": 1662} {"train_loss": -39.01993942260742, "global_step": 201197, "epoch": 1662} {"train_loss": -39.145931243896484, "global_step": 201198, "epoch": 1662} {"train_loss": -39.12493896484375, "global_step": 201199, "epoch": 1662} {"train_loss": -39.71917724609375, "global_step": 201200, "epoch": 1662} {"train_loss": -41.62204360961914, "global_step": 201201, "epoch": 1662} {"train_loss": -39.8631591796875, "global_step": 201202, "epoch": 1662} {"train_loss": -39.16618728637695, "global_step": 201203, "epoch": 1662} {"train_loss": -40.30811309814453, "global_step": 201204, "epoch": 1662} {"train_loss": -41.63570785522461, "global_step": 201205, "epoch": 1662} {"train_loss": -40.42118453979492, "global_step": 201206, "epoch": 1662} {"train_loss": -40.46620559692383, "global_step": 201207, "epoch": 1662} {"train_loss": -40.820228576660156, "global_step": 201208, "epoch": 1662} {"train_loss": -40.176551818847656, "global_step": 201209, "epoch": 1662} {"train_loss": -40.57554244995117, "global_step": 201210, "epoch": 1662} {"train_loss": -40.5345344543457, "global_step": 201211, "epoch": 1662} {"train_loss": -40.78678512573242, "global_step": 201212, "epoch": 1662} {"train_loss": -40.329952239990234, "global_step": 201213, "epoch": 1662} {"train_loss": -41.65085220336914, "global_step": 201214, "epoch": 1662} {"train_loss": -40.173683166503906, "global_step": 201215, "epoch": 1662} {"train_loss": -41.00428771972656, "global_step": 201216, "epoch": 1662} {"train_loss": -41.18022918701172, "global_step": 201217, "epoch": 1662} {"train_loss": -40.91842269897461, "global_step": 201218, "epoch": 1662} {"train_loss": -41.43684005737305, "global_step": 201219, "epoch": 1662} {"train_loss": -40.9708251953125, "global_step": 201220, "epoch": 1662} {"train_loss": -41.47392654418945, "global_step": 201221, "epoch": 1662} {"train_loss": -40.34869416292049, "global_step": 201222, "epoch": 1662, "val_loss": 2646389.25} {"train_loss": -40.92873001098633, "global_step": 201223, "epoch": 1663} {"train_loss": -40.74039840698242, "global_step": 201224, "epoch": 1663} {"train_loss": -41.740535736083984, "global_step": 201225, "epoch": 1663} {"train_loss": -41.5107421875, "global_step": 201226, "epoch": 1663} {"train_loss": -41.417964935302734, "global_step": 201227, "epoch": 1663} {"train_loss": -40.216339111328125, "global_step": 201228, "epoch": 1663} {"train_loss": -41.129058837890625, "global_step": 201229, "epoch": 1663} {"train_loss": -40.28464126586914, "global_step": 201230, "epoch": 1663} {"train_loss": -40.7617073059082, "global_step": 201231, "epoch": 1663} {"train_loss": -40.662818908691406, "global_step": 201232, "epoch": 1663} {"train_loss": -41.91239547729492, "global_step": 201233, "epoch": 1663} {"train_loss": -41.097660064697266, "global_step": 201234, "epoch": 1663} {"train_loss": -39.572147369384766, "global_step": 201235, "epoch": 1663} {"train_loss": -40.6097412109375, "global_step": 201236, "epoch": 1663} {"train_loss": -40.073036193847656, "global_step": 201237, "epoch": 1663} {"train_loss": -40.63323974609375, "global_step": 201238, "epoch": 1663} {"train_loss": -39.83461380004883, "global_step": 201239, "epoch": 1663} {"train_loss": -35.066444396972656, "global_step": 201240, "epoch": 1663} {"train_loss": -32.11935806274414, "global_step": 201241, "epoch": 1663} {"train_loss": -37.545326232910156, "global_step": 201242, "epoch": 1663} {"train_loss": -39.79422378540039, "global_step": 201243, "epoch": 1663} {"train_loss": -35.35601806640625, "global_step": 201244, "epoch": 1663} {"train_loss": -36.16279602050781, "global_step": 201245, "epoch": 1663} {"train_loss": -40.48969650268555, "global_step": 201246, "epoch": 1663} {"train_loss": -37.969947814941406, "global_step": 201247, "epoch": 1663} {"train_loss": -40.38832473754883, "global_step": 201248, "epoch": 1663} {"train_loss": -39.292171478271484, "global_step": 201249, "epoch": 1663} {"train_loss": -40.67473602294922, "global_step": 201250, "epoch": 1663} {"train_loss": -40.856170654296875, "global_step": 201251, "epoch": 1663} {"train_loss": -40.716426849365234, "global_step": 201252, "epoch": 1663} {"train_loss": -40.46223068237305, "global_step": 201253, "epoch": 1663} {"train_loss": -40.88303756713867, "global_step": 201254, "epoch": 1663} {"train_loss": -40.39936447143555, "global_step": 201255, "epoch": 1663} {"train_loss": -40.88976287841797, "global_step": 201256, "epoch": 1663} {"train_loss": -41.128448486328125, "global_step": 201257, "epoch": 1663} {"train_loss": -41.14363479614258, "global_step": 201258, "epoch": 1663} {"train_loss": -39.559810638427734, "global_step": 201259, "epoch": 1663} {"train_loss": -40.95143508911133, "global_step": 201260, "epoch": 1663} {"train_loss": -40.477359771728516, "global_step": 201261, "epoch": 1663} {"train_loss": -41.99115753173828, "global_step": 201262, "epoch": 1663} {"train_loss": -41.229286193847656, "global_step": 201263, "epoch": 1663} {"train_loss": -40.59823989868164, "global_step": 201264, "epoch": 1663} {"train_loss": -40.82215118408203, "global_step": 201265, "epoch": 1663} {"train_loss": -41.79664993286133, "global_step": 201266, "epoch": 1663} {"train_loss": -41.01604461669922, "global_step": 201267, "epoch": 1663} {"train_loss": -41.520503997802734, "global_step": 201268, "epoch": 1663} {"train_loss": -41.36065673828125, "global_step": 201269, "epoch": 1663} {"train_loss": -41.20512771606445, "global_step": 201270, "epoch": 1663} {"train_loss": -41.40483856201172, "global_step": 201271, "epoch": 1663} {"train_loss": -41.71641159057617, "global_step": 201272, "epoch": 1663} {"train_loss": -41.15574264526367, "global_step": 201273, "epoch": 1663} {"train_loss": -41.57353591918945, "global_step": 201274, "epoch": 1663} {"train_loss": -41.512821197509766, "global_step": 201275, "epoch": 1663} {"train_loss": -41.62533187866211, "global_step": 201276, "epoch": 1663} {"train_loss": -40.783477783203125, "global_step": 201277, "epoch": 1663} {"train_loss": -41.71881103515625, "global_step": 201278, "epoch": 1663} {"train_loss": -41.871131896972656, "global_step": 201279, "epoch": 1663} {"train_loss": -41.61942672729492, "global_step": 201280, "epoch": 1663} {"train_loss": -40.29951858520508, "global_step": 201281, "epoch": 1663} {"train_loss": -42.20743942260742, "global_step": 201282, "epoch": 1663} {"train_loss": -41.57427978515625, "global_step": 201283, "epoch": 1663} {"train_loss": -41.846343994140625, "global_step": 201284, "epoch": 1663} {"train_loss": -41.9069709777832, "global_step": 201285, "epoch": 1663} {"train_loss": -42.24372100830078, "global_step": 201286, "epoch": 1663} {"train_loss": -41.90858840942383, "global_step": 201287, "epoch": 1663} {"train_loss": -40.951934814453125, "global_step": 201288, "epoch": 1663} {"train_loss": -40.80221176147461, "global_step": 201289, "epoch": 1663} {"train_loss": -41.30933380126953, "global_step": 201290, "epoch": 1663} {"train_loss": -41.937381744384766, "global_step": 201291, "epoch": 1663} {"train_loss": -41.555877685546875, "global_step": 201292, "epoch": 1663} {"train_loss": -41.89512252807617, "global_step": 201293, "epoch": 1663} {"train_loss": -41.331485748291016, "global_step": 201294, "epoch": 1663} {"train_loss": -41.66301727294922, "global_step": 201295, "epoch": 1663} {"train_loss": -41.91545104980469, "global_step": 201296, "epoch": 1663} {"train_loss": -41.585670471191406, "global_step": 201297, "epoch": 1663} {"train_loss": -42.1427001953125, "global_step": 201298, "epoch": 1663} {"train_loss": -38.88228988647461, "global_step": 201299, "epoch": 1663} {"train_loss": -40.69938278198242, "global_step": 201300, "epoch": 1663} {"train_loss": -41.89203643798828, "global_step": 201301, "epoch": 1663} {"train_loss": -41.57331466674805, "global_step": 201302, "epoch": 1663} {"train_loss": -41.572998046875, "global_step": 201303, "epoch": 1663} {"train_loss": -40.91618728637695, "global_step": 201304, "epoch": 1663} {"train_loss": -42.361637115478516, "global_step": 201305, "epoch": 1663} {"train_loss": -41.122047424316406, "global_step": 201306, "epoch": 1663} {"train_loss": -40.454586029052734, "global_step": 201307, "epoch": 1663} {"train_loss": -41.28926086425781, "global_step": 201308, "epoch": 1663} {"train_loss": -40.56986999511719, "global_step": 201309, "epoch": 1663} {"train_loss": -41.04276657104492, "global_step": 201310, "epoch": 1663} {"train_loss": -41.75645446777344, "global_step": 201311, "epoch": 1663} {"train_loss": -40.93876266479492, "global_step": 201312, "epoch": 1663} {"train_loss": -38.14124298095703, "global_step": 201313, "epoch": 1663} {"train_loss": -34.207454681396484, "global_step": 201314, "epoch": 1663} {"train_loss": -24.513708114624023, "global_step": 201315, "epoch": 1663} {"train_loss": -24.896085739135742, "global_step": 201316, "epoch": 1663} {"train_loss": -33.069915771484375, "global_step": 201317, "epoch": 1663} {"train_loss": -29.685556411743164, "global_step": 201318, "epoch": 1663} {"train_loss": -28.99732780456543, "global_step": 201319, "epoch": 1663} {"train_loss": -37.27865219116211, "global_step": 201320, "epoch": 1663} {"train_loss": -34.165374755859375, "global_step": 201321, "epoch": 1663} {"train_loss": -31.89828872680664, "global_step": 201322, "epoch": 1663} {"train_loss": -37.53764343261719, "global_step": 201323, "epoch": 1663} {"train_loss": -28.215696334838867, "global_step": 201324, "epoch": 1663} {"train_loss": -34.32372283935547, "global_step": 201325, "epoch": 1663} {"train_loss": -35.06309509277344, "global_step": 201326, "epoch": 1663} {"train_loss": -36.236968994140625, "global_step": 201327, "epoch": 1663} {"train_loss": -36.61971664428711, "global_step": 201328, "epoch": 1663} {"train_loss": -35.44184494018555, "global_step": 201329, "epoch": 1663} {"train_loss": -38.60435104370117, "global_step": 201330, "epoch": 1663} {"train_loss": -35.51784896850586, "global_step": 201331, "epoch": 1663} {"train_loss": -39.26272201538086, "global_step": 201332, "epoch": 1663} {"train_loss": -37.26616287231445, "global_step": 201333, "epoch": 1663} {"train_loss": -39.83578109741211, "global_step": 201334, "epoch": 1663} {"train_loss": -38.44171905517578, "global_step": 201335, "epoch": 1663} {"train_loss": -39.17197799682617, "global_step": 201336, "epoch": 1663} {"train_loss": -38.81551742553711, "global_step": 201337, "epoch": 1663} {"train_loss": -39.72248077392578, "global_step": 201338, "epoch": 1663} {"train_loss": -40.047706604003906, "global_step": 201339, "epoch": 1663} {"train_loss": -39.878395080566406, "global_step": 201340, "epoch": 1663} {"train_loss": -39.71455001831055, "global_step": 201341, "epoch": 1663} {"train_loss": -39.39036178588867, "global_step": 201342, "epoch": 1663} {"train_loss": -39.43227656025532, "global_step": 201343, "epoch": 1663, "val_loss": 2669998.25} {"train_loss": -40.491092681884766, "global_step": 201344, "epoch": 1664} {"train_loss": -39.415096282958984, "global_step": 201345, "epoch": 1664} {"train_loss": -40.40796661376953, "global_step": 201346, "epoch": 1664} {"train_loss": -40.31493377685547, "global_step": 201347, "epoch": 1664} {"train_loss": -39.87474060058594, "global_step": 201348, "epoch": 1664} {"train_loss": -40.54811477661133, "global_step": 201349, "epoch": 1664} {"train_loss": -40.30412673950195, "global_step": 201350, "epoch": 1664} {"train_loss": -40.23163604736328, "global_step": 201351, "epoch": 1664} {"train_loss": -40.918148040771484, "global_step": 201352, "epoch": 1664} {"train_loss": -40.2578125, "global_step": 201353, "epoch": 1664} {"train_loss": -40.45121383666992, "global_step": 201354, "epoch": 1664} {"train_loss": -40.66917037963867, "global_step": 201355, "epoch": 1664} {"train_loss": -40.48419952392578, "global_step": 201356, "epoch": 1664} {"train_loss": -41.204872131347656, "global_step": 201357, "epoch": 1664} {"train_loss": -40.54954147338867, "global_step": 201358, "epoch": 1664} {"train_loss": -40.66622543334961, "global_step": 201359, "epoch": 1664} {"train_loss": -41.14303207397461, "global_step": 201360, "epoch": 1664} {"train_loss": -40.57844161987305, "global_step": 201361, "epoch": 1664} {"train_loss": -41.00687789916992, "global_step": 201362, "epoch": 1664} {"train_loss": -41.39702224731445, "global_step": 201363, "epoch": 1664} {"train_loss": -41.32594680786133, "global_step": 201364, "epoch": 1664} {"train_loss": -40.3857307434082, "global_step": 201365, "epoch": 1664} {"train_loss": -40.57976531982422, "global_step": 201366, "epoch": 1664} {"train_loss": -41.21818923950195, "global_step": 201367, "epoch": 1664} {"train_loss": -41.36530303955078, "global_step": 201368, "epoch": 1664} {"train_loss": -41.219390869140625, "global_step": 201369, "epoch": 1664} {"train_loss": -41.21387481689453, "global_step": 201370, "epoch": 1664} {"train_loss": -41.10535430908203, "global_step": 201371, "epoch": 1664} {"train_loss": -41.1648063659668, "global_step": 201372, "epoch": 1664} {"train_loss": -41.5772819519043, "global_step": 201373, "epoch": 1664} {"train_loss": -41.29236602783203, "global_step": 201374, "epoch": 1664} {"train_loss": -41.71926498413086, "global_step": 201375, "epoch": 1664} {"train_loss": -41.36143112182617, "global_step": 201376, "epoch": 1664} {"train_loss": -41.316158294677734, "global_step": 201377, "epoch": 1664} {"train_loss": -41.864234924316406, "global_step": 201378, "epoch": 1664} {"train_loss": -41.87896728515625, "global_step": 201379, "epoch": 1664} {"train_loss": -42.02031707763672, "global_step": 201380, "epoch": 1664} {"train_loss": -41.77381134033203, "global_step": 201381, "epoch": 1664} {"train_loss": -41.14007568359375, "global_step": 201382, "epoch": 1664} {"train_loss": -41.98502731323242, "global_step": 201383, "epoch": 1664} {"train_loss": -41.85388946533203, "global_step": 201384, "epoch": 1664} {"train_loss": -41.77503204345703, "global_step": 201385, "epoch": 1664} {"train_loss": -41.34652328491211, "global_step": 201386, "epoch": 1664} {"train_loss": -42.1854133605957, "global_step": 201387, "epoch": 1664} {"train_loss": -41.935115814208984, "global_step": 201388, "epoch": 1664} {"train_loss": -42.2191162109375, "global_step": 201389, "epoch": 1664} {"train_loss": -41.6699104309082, "global_step": 201390, "epoch": 1664} {"train_loss": -42.27326583862305, "global_step": 201391, "epoch": 1664} {"train_loss": -41.904605865478516, "global_step": 201392, "epoch": 1664} {"train_loss": -41.64919662475586, "global_step": 201393, "epoch": 1664} {"train_loss": -42.06936264038086, "global_step": 201394, "epoch": 1664} {"train_loss": -41.93254470825195, "global_step": 201395, "epoch": 1664} {"train_loss": -41.761260986328125, "global_step": 201396, "epoch": 1664} {"train_loss": -42.24287414550781, "global_step": 201397, "epoch": 1664} {"train_loss": -41.9321403503418, "global_step": 201398, "epoch": 1664} {"train_loss": -42.46586227416992, "global_step": 201399, "epoch": 1664} {"train_loss": -42.55129623413086, "global_step": 201400, "epoch": 1664} {"train_loss": -42.36296463012695, "global_step": 201401, "epoch": 1664} {"train_loss": -42.33059310913086, "global_step": 201402, "epoch": 1664} {"train_loss": -41.95795822143555, "global_step": 201403, "epoch": 1664} {"train_loss": -42.39409255981445, "global_step": 201404, "epoch": 1664} {"train_loss": -40.961456298828125, "global_step": 201405, "epoch": 1664} {"train_loss": -42.24709701538086, "global_step": 201406, "epoch": 1664} {"train_loss": -42.49251174926758, "global_step": 201407, "epoch": 1664} {"train_loss": -42.37938690185547, "global_step": 201408, "epoch": 1664} {"train_loss": -42.816444396972656, "global_step": 201409, "epoch": 1664} {"train_loss": -42.5605583190918, "global_step": 201410, "epoch": 1664} {"train_loss": -41.541500091552734, "global_step": 201411, "epoch": 1664} {"train_loss": -41.972686767578125, "global_step": 201412, "epoch": 1664} {"train_loss": -41.6922721862793, "global_step": 201413, "epoch": 1664} {"train_loss": -42.27958297729492, "global_step": 201414, "epoch": 1664} {"train_loss": -42.28131866455078, "global_step": 201415, "epoch": 1664} {"train_loss": -41.93339538574219, "global_step": 201416, "epoch": 1664} {"train_loss": -42.31290817260742, "global_step": 201417, "epoch": 1664} {"train_loss": -42.20657730102539, "global_step": 201418, "epoch": 1664} {"train_loss": -42.278499603271484, "global_step": 201419, "epoch": 1664} {"train_loss": -42.1133918762207, "global_step": 201420, "epoch": 1664} {"train_loss": -41.97943115234375, "global_step": 201421, "epoch": 1664} {"train_loss": -42.4400749206543, "global_step": 201422, "epoch": 1664} {"train_loss": -42.40423583984375, "global_step": 201423, "epoch": 1664} {"train_loss": -42.40822982788086, "global_step": 201424, "epoch": 1664} {"train_loss": -41.23694610595703, "global_step": 201425, "epoch": 1664} {"train_loss": -41.44521713256836, "global_step": 201426, "epoch": 1664} {"train_loss": -42.0064582824707, "global_step": 201427, "epoch": 1664} {"train_loss": -42.121639251708984, "global_step": 201428, "epoch": 1664} {"train_loss": -41.514137268066406, "global_step": 201429, "epoch": 1664} {"train_loss": -41.784420013427734, "global_step": 201430, "epoch": 1664} {"train_loss": -42.31895065307617, "global_step": 201431, "epoch": 1664} {"train_loss": -42.231876373291016, "global_step": 201432, "epoch": 1664} {"train_loss": -41.53419876098633, "global_step": 201433, "epoch": 1664} {"train_loss": -41.520076751708984, "global_step": 201434, "epoch": 1664} {"train_loss": -42.413333892822266, "global_step": 201435, "epoch": 1664} {"train_loss": -40.84542465209961, "global_step": 201436, "epoch": 1664} {"train_loss": -42.266273498535156, "global_step": 201437, "epoch": 1664} {"train_loss": -41.498939514160156, "global_step": 201438, "epoch": 1664} {"train_loss": -39.92346954345703, "global_step": 201439, "epoch": 1664} {"train_loss": -39.79757308959961, "global_step": 201440, "epoch": 1664} {"train_loss": -40.43233108520508, "global_step": 201441, "epoch": 1664} {"train_loss": -42.01237106323242, "global_step": 201442, "epoch": 1664} {"train_loss": -40.83757400512695, "global_step": 201443, "epoch": 1664} {"train_loss": -38.54863357543945, "global_step": 201444, "epoch": 1664} {"train_loss": -33.45211410522461, "global_step": 201445, "epoch": 1664} {"train_loss": -34.4494514465332, "global_step": 201446, "epoch": 1664} {"train_loss": -39.68436813354492, "global_step": 201447, "epoch": 1664} {"train_loss": -38.95945358276367, "global_step": 201448, "epoch": 1664} {"train_loss": -36.563941955566406, "global_step": 201449, "epoch": 1664} {"train_loss": -37.0175895690918, "global_step": 201450, "epoch": 1664} {"train_loss": -38.68046569824219, "global_step": 201451, "epoch": 1664} {"train_loss": -37.24155807495117, "global_step": 201452, "epoch": 1664} {"train_loss": -38.63898849487305, "global_step": 201453, "epoch": 1664} {"train_loss": -39.00843048095703, "global_step": 201454, "epoch": 1664} {"train_loss": -36.73476028442383, "global_step": 201455, "epoch": 1664} {"train_loss": -39.19600296020508, "global_step": 201456, "epoch": 1664} {"train_loss": -39.46439743041992, "global_step": 201457, "epoch": 1664} {"train_loss": -37.476417541503906, "global_step": 201458, "epoch": 1664} {"train_loss": -40.32596206665039, "global_step": 201459, "epoch": 1664} {"train_loss": -39.51826477050781, "global_step": 201460, "epoch": 1664} {"train_loss": -39.808101654052734, "global_step": 201461, "epoch": 1664} {"train_loss": -38.90079879760742, "global_step": 201462, "epoch": 1664} {"train_loss": -39.1804313659668, "global_step": 201463, "epoch": 1664} {"train_loss": -40.93938565845332, "global_step": 201464, "epoch": 1664, "val_loss": 2649506.75} {"train_loss": -39.72147750854492, "global_step": 201465, "epoch": 1665} {"train_loss": -38.39487838745117, "global_step": 201466, "epoch": 1665} {"train_loss": -40.175575256347656, "global_step": 201467, "epoch": 1665} {"train_loss": -38.5988655090332, "global_step": 201468, "epoch": 1665} {"train_loss": -37.890342712402344, "global_step": 201469, "epoch": 1665} {"train_loss": -38.87474060058594, "global_step": 201470, "epoch": 1665} {"train_loss": -40.810237884521484, "global_step": 201471, "epoch": 1665} {"train_loss": -39.519874572753906, "global_step": 201472, "epoch": 1665} {"train_loss": -40.1248893737793, "global_step": 201473, "epoch": 1665} {"train_loss": -40.8914909362793, "global_step": 201474, "epoch": 1665} {"train_loss": -39.89470291137695, "global_step": 201475, "epoch": 1665} {"train_loss": -40.74937438964844, "global_step": 201476, "epoch": 1665} {"train_loss": -40.50594711303711, "global_step": 201477, "epoch": 1665} {"train_loss": -40.7423210144043, "global_step": 201478, "epoch": 1665} {"train_loss": -39.1341667175293, "global_step": 201479, "epoch": 1665} {"train_loss": -40.994720458984375, "global_step": 201480, "epoch": 1665} {"train_loss": -41.047332763671875, "global_step": 201481, "epoch": 1665} {"train_loss": -40.964080810546875, "global_step": 201482, "epoch": 1665} {"train_loss": -41.34156036376953, "global_step": 201483, "epoch": 1665} {"train_loss": -40.9172477722168, "global_step": 201484, "epoch": 1665} {"train_loss": -41.47614288330078, "global_step": 201485, "epoch": 1665} {"train_loss": -41.1668586730957, "global_step": 201486, "epoch": 1665} {"train_loss": -41.5456657409668, "global_step": 201487, "epoch": 1665} {"train_loss": -41.1676139831543, "global_step": 201488, "epoch": 1665} {"train_loss": -41.73977279663086, "global_step": 201489, "epoch": 1665} {"train_loss": -41.757408142089844, "global_step": 201490, "epoch": 1665} {"train_loss": -41.690673828125, "global_step": 201491, "epoch": 1665} {"train_loss": -41.49138259887695, "global_step": 201492, "epoch": 1665} {"train_loss": -41.83063507080078, "global_step": 201493, "epoch": 1665} {"train_loss": -41.722469329833984, "global_step": 201494, "epoch": 1665} {"train_loss": -42.01639938354492, "global_step": 201495, "epoch": 1665} {"train_loss": -42.06464767456055, "global_step": 201496, "epoch": 1665} {"train_loss": -39.83875274658203, "global_step": 201497, "epoch": 1665} {"train_loss": -41.794105529785156, "global_step": 201498, "epoch": 1665} {"train_loss": -41.939308166503906, "global_step": 201499, "epoch": 1665} {"train_loss": -42.16016387939453, "global_step": 201500, "epoch": 1665} {"train_loss": -42.02363967895508, "global_step": 201501, "epoch": 1665} {"train_loss": -37.76782989501953, "global_step": 201502, "epoch": 1665} {"train_loss": -42.28883743286133, "global_step": 201503, "epoch": 1665} {"train_loss": -41.67177200317383, "global_step": 201504, "epoch": 1665} {"train_loss": -42.145263671875, "global_step": 201505, "epoch": 1665} {"train_loss": -40.381900787353516, "global_step": 201506, "epoch": 1665} {"train_loss": -42.31045150756836, "global_step": 201507, "epoch": 1665} {"train_loss": -40.913490295410156, "global_step": 201508, "epoch": 1665} {"train_loss": -42.187652587890625, "global_step": 201509, "epoch": 1665} {"train_loss": -41.70505905151367, "global_step": 201510, "epoch": 1665} {"train_loss": -40.794612884521484, "global_step": 201511, "epoch": 1665} {"train_loss": -41.916812896728516, "global_step": 201512, "epoch": 1665} {"train_loss": -36.37066650390625, "global_step": 201513, "epoch": 1665} {"train_loss": -40.81502914428711, "global_step": 201514, "epoch": 1665} {"train_loss": -37.08182907104492, "global_step": 201515, "epoch": 1665} {"train_loss": -40.55107879638672, "global_step": 201516, "epoch": 1665} {"train_loss": -40.98419952392578, "global_step": 201517, "epoch": 1665} {"train_loss": -41.85028839111328, "global_step": 201518, "epoch": 1665} {"train_loss": -41.952938079833984, "global_step": 201519, "epoch": 1665} {"train_loss": -40.77883529663086, "global_step": 201520, "epoch": 1665} {"train_loss": -40.6415901184082, "global_step": 201521, "epoch": 1665} {"train_loss": -40.017852783203125, "global_step": 201522, "epoch": 1665} {"train_loss": -40.981475830078125, "global_step": 201523, "epoch": 1665} {"train_loss": -40.93752670288086, "global_step": 201524, "epoch": 1665} {"train_loss": -40.79044723510742, "global_step": 201525, "epoch": 1665} {"train_loss": -41.66268539428711, "global_step": 201526, "epoch": 1665} {"train_loss": -42.093387603759766, "global_step": 201527, "epoch": 1665} {"train_loss": -41.74043273925781, "global_step": 201528, "epoch": 1665} {"train_loss": -40.917781829833984, "global_step": 201529, "epoch": 1665} {"train_loss": -40.527381896972656, "global_step": 201530, "epoch": 1665} {"train_loss": -41.44981002807617, "global_step": 201531, "epoch": 1665} {"train_loss": -40.46855545043945, "global_step": 201532, "epoch": 1665} {"train_loss": -42.53044891357422, "global_step": 201533, "epoch": 1665} {"train_loss": -40.862831115722656, "global_step": 201534, "epoch": 1665} {"train_loss": -41.71879959106445, "global_step": 201535, "epoch": 1665} {"train_loss": -41.54911804199219, "global_step": 201536, "epoch": 1665} {"train_loss": -42.501216888427734, "global_step": 201537, "epoch": 1665} {"train_loss": -41.238460540771484, "global_step": 201538, "epoch": 1665} {"train_loss": -40.20577621459961, "global_step": 201539, "epoch": 1665} {"train_loss": -41.071224212646484, "global_step": 201540, "epoch": 1665} {"train_loss": -41.01887893676758, "global_step": 201541, "epoch": 1665} {"train_loss": -40.80755615234375, "global_step": 201542, "epoch": 1665} {"train_loss": -41.57137680053711, "global_step": 201543, "epoch": 1665} {"train_loss": -41.9522590637207, "global_step": 201544, "epoch": 1665} {"train_loss": -41.5744514465332, "global_step": 201545, "epoch": 1665} {"train_loss": -41.71366500854492, "global_step": 201546, "epoch": 1665} {"train_loss": -41.75794219970703, "global_step": 201547, "epoch": 1665} {"train_loss": -41.62822341918945, "global_step": 201548, "epoch": 1665} {"train_loss": -41.2349967956543, "global_step": 201549, "epoch": 1665} {"train_loss": -41.76156234741211, "global_step": 201550, "epoch": 1665} {"train_loss": -41.82189178466797, "global_step": 201551, "epoch": 1665} {"train_loss": -41.74127197265625, "global_step": 201552, "epoch": 1665} {"train_loss": -41.61274337768555, "global_step": 201553, "epoch": 1665} {"train_loss": -40.39662170410156, "global_step": 201554, "epoch": 1665} {"train_loss": -41.70548629760742, "global_step": 201555, "epoch": 1665} {"train_loss": -41.51035690307617, "global_step": 201556, "epoch": 1665} {"train_loss": -41.41654586791992, "global_step": 201557, "epoch": 1665} {"train_loss": -41.25213623046875, "global_step": 201558, "epoch": 1665} {"train_loss": -41.343536376953125, "global_step": 201559, "epoch": 1665} {"train_loss": -39.64822006225586, "global_step": 201560, "epoch": 1665} {"train_loss": -41.384334564208984, "global_step": 201561, "epoch": 1665} {"train_loss": -41.80622100830078, "global_step": 201562, "epoch": 1665} {"train_loss": -42.0195426940918, "global_step": 201563, "epoch": 1665} {"train_loss": -41.082977294921875, "global_step": 201564, "epoch": 1665} {"train_loss": -41.316192626953125, "global_step": 201565, "epoch": 1665} {"train_loss": -41.504764556884766, "global_step": 201566, "epoch": 1665} {"train_loss": -41.103736877441406, "global_step": 201567, "epoch": 1665} {"train_loss": -41.05290985107422, "global_step": 201568, "epoch": 1665} {"train_loss": -41.6617431640625, "global_step": 201569, "epoch": 1665} {"train_loss": -41.80477523803711, "global_step": 201570, "epoch": 1665} {"train_loss": -42.10341262817383, "global_step": 201571, "epoch": 1665} {"train_loss": -41.11966323852539, "global_step": 201572, "epoch": 1665} {"train_loss": -41.89768981933594, "global_step": 201573, "epoch": 1665} {"train_loss": -41.678611755371094, "global_step": 201574, "epoch": 1665} {"train_loss": -41.666080474853516, "global_step": 201575, "epoch": 1665} {"train_loss": -41.932186126708984, "global_step": 201576, "epoch": 1665} {"train_loss": -41.948726654052734, "global_step": 201577, "epoch": 1665} {"train_loss": -41.13381576538086, "global_step": 201578, "epoch": 1665} {"train_loss": -40.94321823120117, "global_step": 201579, "epoch": 1665} {"train_loss": -41.77075958251953, "global_step": 201580, "epoch": 1665} {"train_loss": -41.8839225769043, "global_step": 201581, "epoch": 1665} {"train_loss": -41.55625534057617, "global_step": 201582, "epoch": 1665} {"train_loss": -42.08976364135742, "global_step": 201583, "epoch": 1665} {"train_loss": -41.64095687866211, "global_step": 201584, "epoch": 1665} {"train_loss": -41.10898653140738, "global_step": 201585, "epoch": 1665, "val_loss": 2603024.0} {"train_loss": -41.935943603515625, "global_step": 201586, "epoch": 1666} {"train_loss": -42.17529296875, "global_step": 201587, "epoch": 1666} {"train_loss": -42.6553840637207, "global_step": 201588, "epoch": 1666} {"train_loss": -41.4603157043457, "global_step": 201589, "epoch": 1666} {"train_loss": -41.28546142578125, "global_step": 201590, "epoch": 1666} {"train_loss": -40.81287384033203, "global_step": 201591, "epoch": 1666} {"train_loss": -40.49966049194336, "global_step": 201592, "epoch": 1666} {"train_loss": -38.4135627746582, "global_step": 201593, "epoch": 1666} {"train_loss": -40.43857955932617, "global_step": 201594, "epoch": 1666} {"train_loss": -38.844669342041016, "global_step": 201595, "epoch": 1666} {"train_loss": -40.11692428588867, "global_step": 201596, "epoch": 1666} {"train_loss": -38.3477668762207, "global_step": 201597, "epoch": 1666} {"train_loss": -37.34505081176758, "global_step": 201598, "epoch": 1666} {"train_loss": -34.6641960144043, "global_step": 201599, "epoch": 1666} {"train_loss": -40.8383903503418, "global_step": 201600, "epoch": 1666} {"train_loss": -39.0470085144043, "global_step": 201601, "epoch": 1666} {"train_loss": -40.45003890991211, "global_step": 201602, "epoch": 1666} {"train_loss": -40.73478317260742, "global_step": 201603, "epoch": 1666} {"train_loss": -40.540191650390625, "global_step": 201604, "epoch": 1666} {"train_loss": -40.5948600769043, "global_step": 201605, "epoch": 1666} {"train_loss": -39.8791618347168, "global_step": 201606, "epoch": 1666} {"train_loss": -40.96061706542969, "global_step": 201607, "epoch": 1666} {"train_loss": -40.85368728637695, "global_step": 201608, "epoch": 1666} {"train_loss": -41.09725570678711, "global_step": 201609, "epoch": 1666} {"train_loss": -40.87824249267578, "global_step": 201610, "epoch": 1666} {"train_loss": -39.99679183959961, "global_step": 201611, "epoch": 1666} {"train_loss": -40.27703857421875, "global_step": 201612, "epoch": 1666} {"train_loss": -39.263729095458984, "global_step": 201613, "epoch": 1666} {"train_loss": -40.68452835083008, "global_step": 201614, "epoch": 1666} {"train_loss": -40.77314376831055, "global_step": 201615, "epoch": 1666} {"train_loss": -40.83002853393555, "global_step": 201616, "epoch": 1666} {"train_loss": -41.537391662597656, "global_step": 201617, "epoch": 1666} {"train_loss": -40.52915573120117, "global_step": 201618, "epoch": 1666} {"train_loss": -41.5784797668457, "global_step": 201619, "epoch": 1666} {"train_loss": -41.305416107177734, "global_step": 201620, "epoch": 1666} {"train_loss": -41.2076530456543, "global_step": 201621, "epoch": 1666} {"train_loss": -40.53813171386719, "global_step": 201622, "epoch": 1666} {"train_loss": -39.88190841674805, "global_step": 201623, "epoch": 1666} {"train_loss": -40.7646484375, "global_step": 201624, "epoch": 1666} {"train_loss": -40.85364532470703, "global_step": 201625, "epoch": 1666} {"train_loss": -41.472198486328125, "global_step": 201626, "epoch": 1666} {"train_loss": -41.728206634521484, "global_step": 201627, "epoch": 1666} {"train_loss": -40.86812973022461, "global_step": 201628, "epoch": 1666} {"train_loss": -40.455535888671875, "global_step": 201629, "epoch": 1666} {"train_loss": -41.546875, "global_step": 201630, "epoch": 1666} {"train_loss": -41.51169967651367, "global_step": 201631, "epoch": 1666} {"train_loss": -41.74161911010742, "global_step": 201632, "epoch": 1666} {"train_loss": -41.841556549072266, "global_step": 201633, "epoch": 1666} {"train_loss": -41.7955207824707, "global_step": 201634, "epoch": 1666} {"train_loss": -42.16416549682617, "global_step": 201635, "epoch": 1666} {"train_loss": -40.89331817626953, "global_step": 201636, "epoch": 1666} {"train_loss": -41.3994255065918, "global_step": 201637, "epoch": 1666} {"train_loss": -42.075904846191406, "global_step": 201638, "epoch": 1666} {"train_loss": -38.63850021362305, "global_step": 201639, "epoch": 1666} {"train_loss": -41.57996368408203, "global_step": 201640, "epoch": 1666} {"train_loss": -40.244564056396484, "global_step": 201641, "epoch": 1666} {"train_loss": -41.86502456665039, "global_step": 201642, "epoch": 1666} {"train_loss": -41.20307540893555, "global_step": 201643, "epoch": 1666} {"train_loss": -40.47126007080078, "global_step": 201644, "epoch": 1666} {"train_loss": -40.25592041015625, "global_step": 201645, "epoch": 1666} {"train_loss": -40.83015823364258, "global_step": 201646, "epoch": 1666} {"train_loss": -39.624610900878906, "global_step": 201647, "epoch": 1666} {"train_loss": -37.41324996948242, "global_step": 201648, "epoch": 1666} {"train_loss": -39.6912727355957, "global_step": 201649, "epoch": 1666} {"train_loss": -41.4367790222168, "global_step": 201650, "epoch": 1666} {"train_loss": -41.53095626831055, "global_step": 201651, "epoch": 1666} {"train_loss": -41.54017639160156, "global_step": 201652, "epoch": 1666} {"train_loss": -41.10438919067383, "global_step": 201653, "epoch": 1666} {"train_loss": -41.663516998291016, "global_step": 201654, "epoch": 1666} {"train_loss": -40.343135833740234, "global_step": 201655, "epoch": 1666} {"train_loss": -41.395263671875, "global_step": 201656, "epoch": 1666} {"train_loss": -40.71318817138672, "global_step": 201657, "epoch": 1666} {"train_loss": -41.613216400146484, "global_step": 201658, "epoch": 1666} {"train_loss": -41.521766662597656, "global_step": 201659, "epoch": 1666} {"train_loss": -41.85768508911133, "global_step": 201660, "epoch": 1666} {"train_loss": -41.786067962646484, "global_step": 201661, "epoch": 1666} {"train_loss": -41.283443450927734, "global_step": 201662, "epoch": 1666} {"train_loss": -41.331077575683594, "global_step": 201663, "epoch": 1666} {"train_loss": -41.76333236694336, "global_step": 201664, "epoch": 1666} {"train_loss": -34.72982406616211, "global_step": 201665, "epoch": 1666} {"train_loss": -41.59838104248047, "global_step": 201666, "epoch": 1666} {"train_loss": -41.36676025390625, "global_step": 201667, "epoch": 1666} {"train_loss": -41.59907913208008, "global_step": 201668, "epoch": 1666} {"train_loss": -42.0092887878418, "global_step": 201669, "epoch": 1666} {"train_loss": -37.28495407104492, "global_step": 201670, "epoch": 1666} {"train_loss": -41.80207443237305, "global_step": 201671, "epoch": 1666} {"train_loss": -41.291873931884766, "global_step": 201672, "epoch": 1666} {"train_loss": -41.181915283203125, "global_step": 201673, "epoch": 1666} {"train_loss": -41.01859664916992, "global_step": 201674, "epoch": 1666} {"train_loss": -41.07896423339844, "global_step": 201675, "epoch": 1666} {"train_loss": -41.859310150146484, "global_step": 201676, "epoch": 1666} {"train_loss": -41.8208122253418, "global_step": 201677, "epoch": 1666} {"train_loss": -41.58310317993164, "global_step": 201678, "epoch": 1666} {"train_loss": -42.02706527709961, "global_step": 201679, "epoch": 1666} {"train_loss": -41.47395706176758, "global_step": 201680, "epoch": 1666} {"train_loss": -41.387630462646484, "global_step": 201681, "epoch": 1666} {"train_loss": -42.020545959472656, "global_step": 201682, "epoch": 1666} {"train_loss": -42.249332427978516, "global_step": 201683, "epoch": 1666} {"train_loss": -42.17802047729492, "global_step": 201684, "epoch": 1666} {"train_loss": -41.476131439208984, "global_step": 201685, "epoch": 1666} {"train_loss": -41.883724212646484, "global_step": 201686, "epoch": 1666} {"train_loss": -37.46388626098633, "global_step": 201687, "epoch": 1666} {"train_loss": -41.9363899230957, "global_step": 201688, "epoch": 1666} {"train_loss": -41.56629180908203, "global_step": 201689, "epoch": 1666} {"train_loss": -41.904701232910156, "global_step": 201690, "epoch": 1666} {"train_loss": -41.65322494506836, "global_step": 201691, "epoch": 1666} {"train_loss": -41.30302047729492, "global_step": 201692, "epoch": 1666} {"train_loss": -41.8013801574707, "global_step": 201693, "epoch": 1666} {"train_loss": -41.777286529541016, "global_step": 201694, "epoch": 1666} {"train_loss": -40.30833053588867, "global_step": 201695, "epoch": 1666} {"train_loss": -40.97843551635742, "global_step": 201696, "epoch": 1666} {"train_loss": -41.470882415771484, "global_step": 201697, "epoch": 1666} {"train_loss": -41.26559829711914, "global_step": 201698, "epoch": 1666} {"train_loss": -42.091026306152344, "global_step": 201699, "epoch": 1666} {"train_loss": -42.0993537902832, "global_step": 201700, "epoch": 1666} {"train_loss": -40.18128967285156, "global_step": 201701, "epoch": 1666} {"train_loss": -39.85492706298828, "global_step": 201702, "epoch": 1666} {"train_loss": -40.4159049987793, "global_step": 201703, "epoch": 1666} {"train_loss": -40.68703842163086, "global_step": 201704, "epoch": 1666} {"train_loss": -40.65869140625, "global_step": 201705, "epoch": 1666} {"train_loss": -40.799383841270256, "global_step": 201706, "epoch": 1666, "val_loss": 2565111.75} {"train_loss": -39.11336135864258, "global_step": 201707, "epoch": 1667} {"train_loss": -40.11021041870117, "global_step": 201708, "epoch": 1667} {"train_loss": -39.21372604370117, "global_step": 201709, "epoch": 1667} {"train_loss": -36.07412338256836, "global_step": 201710, "epoch": 1667} {"train_loss": -29.8203067779541, "global_step": 201711, "epoch": 1667} {"train_loss": -36.7900505065918, "global_step": 201712, "epoch": 1667} {"train_loss": -39.10981369018555, "global_step": 201713, "epoch": 1667} {"train_loss": -34.516544342041016, "global_step": 201714, "epoch": 1667} {"train_loss": -29.898548126220703, "global_step": 201715, "epoch": 1667} {"train_loss": -33.055599212646484, "global_step": 201716, "epoch": 1667} {"train_loss": -36.1868896484375, "global_step": 201717, "epoch": 1667} {"train_loss": -31.613733291625977, "global_step": 201718, "epoch": 1667} {"train_loss": -25.05569839477539, "global_step": 201719, "epoch": 1667} {"train_loss": -34.03279495239258, "global_step": 201720, "epoch": 1667} {"train_loss": -33.69690704345703, "global_step": 201721, "epoch": 1667} {"train_loss": -32.19393539428711, "global_step": 201722, "epoch": 1667} {"train_loss": -34.78736114501953, "global_step": 201723, "epoch": 1667} {"train_loss": -28.115747451782227, "global_step": 201724, "epoch": 1667} {"train_loss": -32.30988311767578, "global_step": 201725, "epoch": 1667} {"train_loss": -33.34962844848633, "global_step": 201726, "epoch": 1667} {"train_loss": -36.38067626953125, "global_step": 201727, "epoch": 1667} {"train_loss": -35.379085540771484, "global_step": 201728, "epoch": 1667} {"train_loss": -37.420654296875, "global_step": 201729, "epoch": 1667} {"train_loss": -35.30308151245117, "global_step": 201730, "epoch": 1667} {"train_loss": -36.427547454833984, "global_step": 201731, "epoch": 1667} {"train_loss": -38.173030853271484, "global_step": 201732, "epoch": 1667} {"train_loss": -34.82628631591797, "global_step": 201733, "epoch": 1667} {"train_loss": -35.43281173706055, "global_step": 201734, "epoch": 1667} {"train_loss": -37.6202507019043, "global_step": 201735, "epoch": 1667} {"train_loss": -37.84404754638672, "global_step": 201736, "epoch": 1667} {"train_loss": -38.510372161865234, "global_step": 201737, "epoch": 1667} {"train_loss": -37.95493698120117, "global_step": 201738, "epoch": 1667} {"train_loss": -38.374568939208984, "global_step": 201739, "epoch": 1667} {"train_loss": -39.252098083496094, "global_step": 201740, "epoch": 1667} {"train_loss": -38.43411636352539, "global_step": 201741, "epoch": 1667} {"train_loss": -39.57181930541992, "global_step": 201742, "epoch": 1667} {"train_loss": -39.10322189331055, "global_step": 201743, "epoch": 1667} {"train_loss": -38.962974548339844, "global_step": 201744, "epoch": 1667} {"train_loss": -38.258033752441406, "global_step": 201745, "epoch": 1667} {"train_loss": -38.9998779296875, "global_step": 201746, "epoch": 1667} {"train_loss": -39.40694808959961, "global_step": 201747, "epoch": 1667} {"train_loss": -40.0099983215332, "global_step": 201748, "epoch": 1667} {"train_loss": -38.859535217285156, "global_step": 201749, "epoch": 1667} {"train_loss": -37.55587387084961, "global_step": 201750, "epoch": 1667} {"train_loss": -38.763545989990234, "global_step": 201751, "epoch": 1667} {"train_loss": -36.82802200317383, "global_step": 201752, "epoch": 1667} {"train_loss": -39.17121505737305, "global_step": 201753, "epoch": 1667} {"train_loss": -39.506343841552734, "global_step": 201754, "epoch": 1667} {"train_loss": -38.51089096069336, "global_step": 201755, "epoch": 1667} {"train_loss": -39.593658447265625, "global_step": 201756, "epoch": 1667} {"train_loss": -39.608577728271484, "global_step": 201757, "epoch": 1667} {"train_loss": -39.91239547729492, "global_step": 201758, "epoch": 1667} {"train_loss": -39.74991226196289, "global_step": 201759, "epoch": 1667} {"train_loss": -39.677059173583984, "global_step": 201760, "epoch": 1667} {"train_loss": -39.97168731689453, "global_step": 201761, "epoch": 1667} {"train_loss": -40.02008056640625, "global_step": 201762, "epoch": 1667} {"train_loss": -40.11625289916992, "global_step": 201763, "epoch": 1667} {"train_loss": -40.562049865722656, "global_step": 201764, "epoch": 1667} {"train_loss": -40.48036193847656, "global_step": 201765, "epoch": 1667} {"train_loss": -40.43994140625, "global_step": 201766, "epoch": 1667} {"train_loss": -40.183837890625, "global_step": 201767, "epoch": 1667} {"train_loss": -40.53264236450195, "global_step": 201768, "epoch": 1667} {"train_loss": -40.643863677978516, "global_step": 201769, "epoch": 1667} {"train_loss": -40.285064697265625, "global_step": 201770, "epoch": 1667} {"train_loss": -40.330413818359375, "global_step": 201771, "epoch": 1667} {"train_loss": -40.470577239990234, "global_step": 201772, "epoch": 1667} {"train_loss": -40.450740814208984, "global_step": 201773, "epoch": 1667} {"train_loss": -40.11290740966797, "global_step": 201774, "epoch": 1667} {"train_loss": -40.769771575927734, "global_step": 201775, "epoch": 1667} {"train_loss": -40.41410446166992, "global_step": 201776, "epoch": 1667} {"train_loss": -40.81148147583008, "global_step": 201777, "epoch": 1667} {"train_loss": -40.49727249145508, "global_step": 201778, "epoch": 1667} {"train_loss": -40.57794189453125, "global_step": 201779, "epoch": 1667} {"train_loss": -39.54309844970703, "global_step": 201780, "epoch": 1667} {"train_loss": -40.840972900390625, "global_step": 201781, "epoch": 1667} {"train_loss": -39.77486801147461, "global_step": 201782, "epoch": 1667} {"train_loss": -40.274898529052734, "global_step": 201783, "epoch": 1667} {"train_loss": -40.64331817626953, "global_step": 201784, "epoch": 1667} {"train_loss": -40.77861404418945, "global_step": 201785, "epoch": 1667} {"train_loss": -40.84391403198242, "global_step": 201786, "epoch": 1667} {"train_loss": -40.66545486450195, "global_step": 201787, "epoch": 1667} {"train_loss": -40.8177604675293, "global_step": 201788, "epoch": 1667} {"train_loss": -41.415218353271484, "global_step": 201789, "epoch": 1667} {"train_loss": -41.46013259887695, "global_step": 201790, "epoch": 1667} {"train_loss": -40.20417022705078, "global_step": 201791, "epoch": 1667} {"train_loss": -40.976375579833984, "global_step": 201792, "epoch": 1667} {"train_loss": -41.16791534423828, "global_step": 201793, "epoch": 1667} {"train_loss": -41.063995361328125, "global_step": 201794, "epoch": 1667} {"train_loss": -40.60537338256836, "global_step": 201795, "epoch": 1667} {"train_loss": -41.647457122802734, "global_step": 201796, "epoch": 1667} {"train_loss": -41.64619064331055, "global_step": 201797, "epoch": 1667} {"train_loss": -40.830989837646484, "global_step": 201798, "epoch": 1667} {"train_loss": -41.655677795410156, "global_step": 201799, "epoch": 1667} {"train_loss": -41.021480560302734, "global_step": 201800, "epoch": 1667} {"train_loss": -41.5904426574707, "global_step": 201801, "epoch": 1667} {"train_loss": -40.86466598510742, "global_step": 201802, "epoch": 1667} {"train_loss": -41.15415573120117, "global_step": 201803, "epoch": 1667} {"train_loss": -41.324607849121094, "global_step": 201804, "epoch": 1667} {"train_loss": -41.655879974365234, "global_step": 201805, "epoch": 1667} {"train_loss": -41.3226203918457, "global_step": 201806, "epoch": 1667} {"train_loss": -40.89834213256836, "global_step": 201807, "epoch": 1667} {"train_loss": -41.66775131225586, "global_step": 201808, "epoch": 1667} {"train_loss": -41.685821533203125, "global_step": 201809, "epoch": 1667} {"train_loss": -41.67975997924805, "global_step": 201810, "epoch": 1667} {"train_loss": -41.85946273803711, "global_step": 201811, "epoch": 1667} {"train_loss": -41.679195404052734, "global_step": 201812, "epoch": 1667} {"train_loss": -40.942779541015625, "global_step": 201813, "epoch": 1667} {"train_loss": -41.76821517944336, "global_step": 201814, "epoch": 1667} {"train_loss": -41.486839294433594, "global_step": 201815, "epoch": 1667} {"train_loss": -41.5251579284668, "global_step": 201816, "epoch": 1667} {"train_loss": -41.27571487426758, "global_step": 201817, "epoch": 1667} {"train_loss": -42.21147537231445, "global_step": 201818, "epoch": 1667} {"train_loss": -41.677303314208984, "global_step": 201819, "epoch": 1667} {"train_loss": -41.09320068359375, "global_step": 201820, "epoch": 1667} {"train_loss": -41.80613327026367, "global_step": 201821, "epoch": 1667} {"train_loss": -42.195640563964844, "global_step": 201822, "epoch": 1667} {"train_loss": -42.221771240234375, "global_step": 201823, "epoch": 1667} {"train_loss": -42.03337478637695, "global_step": 201824, "epoch": 1667} {"train_loss": -42.03369903564453, "global_step": 201825, "epoch": 1667} {"train_loss": -42.14278030395508, "global_step": 201826, "epoch": 1667} {"train_loss": -39.06812540164664, "global_step": 201827, "epoch": 1667, "val_loss": 2581513.25} {"train_loss": -42.18743896484375, "global_step": 201828, "epoch": 1668} {"train_loss": -42.35226058959961, "global_step": 201829, "epoch": 1668} {"train_loss": -41.47519302368164, "global_step": 201830, "epoch": 1668} {"train_loss": -41.6815071105957, "global_step": 201831, "epoch": 1668} {"train_loss": -42.06452178955078, "global_step": 201832, "epoch": 1668} {"train_loss": -42.34934616088867, "global_step": 201833, "epoch": 1668} {"train_loss": -42.379878997802734, "global_step": 201834, "epoch": 1668} {"train_loss": -42.19959259033203, "global_step": 201835, "epoch": 1668} {"train_loss": -42.29884719848633, "global_step": 201836, "epoch": 1668} {"train_loss": -41.94682693481445, "global_step": 201837, "epoch": 1668} {"train_loss": -42.54178237915039, "global_step": 201838, "epoch": 1668} {"train_loss": -42.36387634277344, "global_step": 201839, "epoch": 1668} {"train_loss": -42.438228607177734, "global_step": 201840, "epoch": 1668} {"train_loss": -42.2907829284668, "global_step": 201841, "epoch": 1668} {"train_loss": -42.5998649597168, "global_step": 201842, "epoch": 1668} {"train_loss": -42.61237716674805, "global_step": 201843, "epoch": 1668} {"train_loss": -42.878841400146484, "global_step": 201844, "epoch": 1668} {"train_loss": -42.1363525390625, "global_step": 201845, "epoch": 1668} {"train_loss": -41.78374099731445, "global_step": 201846, "epoch": 1668} {"train_loss": -42.658721923828125, "global_step": 201847, "epoch": 1668} {"train_loss": -42.72050476074219, "global_step": 201848, "epoch": 1668} {"train_loss": -41.985755920410156, "global_step": 201849, "epoch": 1668} {"train_loss": -42.80073165893555, "global_step": 201850, "epoch": 1668} {"train_loss": -42.77009582519531, "global_step": 201851, "epoch": 1668} {"train_loss": -42.707061767578125, "global_step": 201852, "epoch": 1668} {"train_loss": -42.73274230957031, "global_step": 201853, "epoch": 1668} {"train_loss": -42.87435531616211, "global_step": 201854, "epoch": 1668} {"train_loss": -42.778324127197266, "global_step": 201855, "epoch": 1668} {"train_loss": -42.18346405029297, "global_step": 201856, "epoch": 1668} {"train_loss": -43.03141784667969, "global_step": 201857, "epoch": 1668} {"train_loss": -42.469051361083984, "global_step": 201858, "epoch": 1668} {"train_loss": -42.73130416870117, "global_step": 201859, "epoch": 1668} {"train_loss": -42.72183609008789, "global_step": 201860, "epoch": 1668} {"train_loss": -42.263362884521484, "global_step": 201861, "epoch": 1668} {"train_loss": -42.443904876708984, "global_step": 201862, "epoch": 1668} {"train_loss": -43.07297897338867, "global_step": 201863, "epoch": 1668} {"train_loss": -42.474639892578125, "global_step": 201864, "epoch": 1668} {"train_loss": -42.804012298583984, "global_step": 201865, "epoch": 1668} {"train_loss": -42.23836898803711, "global_step": 201866, "epoch": 1668} {"train_loss": -42.57122802734375, "global_step": 201867, "epoch": 1668} {"train_loss": -42.42133712768555, "global_step": 201868, "epoch": 1668} {"train_loss": -41.9378776550293, "global_step": 201869, "epoch": 1668} {"train_loss": -41.1711311340332, "global_step": 201870, "epoch": 1668} {"train_loss": -41.5460090637207, "global_step": 201871, "epoch": 1668} {"train_loss": -41.61100387573242, "global_step": 201872, "epoch": 1668} {"train_loss": -42.05022048950195, "global_step": 201873, "epoch": 1668} {"train_loss": -41.93901443481445, "global_step": 201874, "epoch": 1668} {"train_loss": -42.225013732910156, "global_step": 201875, "epoch": 1668} {"train_loss": -42.62076950073242, "global_step": 201876, "epoch": 1668} {"train_loss": -41.77206039428711, "global_step": 201877, "epoch": 1668} {"train_loss": -42.27853012084961, "global_step": 201878, "epoch": 1668} {"train_loss": -41.310546875, "global_step": 201879, "epoch": 1668} {"train_loss": -40.0351676940918, "global_step": 201880, "epoch": 1668} {"train_loss": -39.78139877319336, "global_step": 201881, "epoch": 1668} {"train_loss": -40.51459503173828, "global_step": 201882, "epoch": 1668} {"train_loss": -40.26930618286133, "global_step": 201883, "epoch": 1668} {"train_loss": -41.29489517211914, "global_step": 201884, "epoch": 1668} {"train_loss": -41.22529220581055, "global_step": 201885, "epoch": 1668} {"train_loss": -40.50681686401367, "global_step": 201886, "epoch": 1668} {"train_loss": -36.39043045043945, "global_step": 201887, "epoch": 1668} {"train_loss": -32.76185989379883, "global_step": 201888, "epoch": 1668} {"train_loss": -38.016170501708984, "global_step": 201889, "epoch": 1668} {"train_loss": -40.282772064208984, "global_step": 201890, "epoch": 1668} {"train_loss": -35.582576751708984, "global_step": 201891, "epoch": 1668} {"train_loss": -34.876197814941406, "global_step": 201892, "epoch": 1668} {"train_loss": -39.42206573486328, "global_step": 201893, "epoch": 1668} {"train_loss": -36.197509765625, "global_step": 201894, "epoch": 1668} {"train_loss": -36.579193115234375, "global_step": 201895, "epoch": 1668} {"train_loss": -39.60002517700195, "global_step": 201896, "epoch": 1668} {"train_loss": -38.271453857421875, "global_step": 201897, "epoch": 1668} {"train_loss": -38.79474639892578, "global_step": 201898, "epoch": 1668} {"train_loss": -39.68414306640625, "global_step": 201899, "epoch": 1668} {"train_loss": -39.02691650390625, "global_step": 201900, "epoch": 1668} {"train_loss": -39.95559310913086, "global_step": 201901, "epoch": 1668} {"train_loss": -40.273902893066406, "global_step": 201902, "epoch": 1668} {"train_loss": -39.36075973510742, "global_step": 201903, "epoch": 1668} {"train_loss": -40.048973083496094, "global_step": 201904, "epoch": 1668} {"train_loss": -39.53377151489258, "global_step": 201905, "epoch": 1668} {"train_loss": -40.20581817626953, "global_step": 201906, "epoch": 1668} {"train_loss": -39.430824279785156, "global_step": 201907, "epoch": 1668} {"train_loss": -39.21651840209961, "global_step": 201908, "epoch": 1668} {"train_loss": -40.46839141845703, "global_step": 201909, "epoch": 1668} {"train_loss": -40.1909294128418, "global_step": 201910, "epoch": 1668} {"train_loss": -39.93374252319336, "global_step": 201911, "epoch": 1668} {"train_loss": -40.26670837402344, "global_step": 201912, "epoch": 1668} {"train_loss": -40.9797477722168, "global_step": 201913, "epoch": 1668} {"train_loss": -40.66734313964844, "global_step": 201914, "epoch": 1668} {"train_loss": -39.419227600097656, "global_step": 201915, "epoch": 1668} {"train_loss": -41.320674896240234, "global_step": 201916, "epoch": 1668} {"train_loss": -40.475677490234375, "global_step": 201917, "epoch": 1668} {"train_loss": -40.9165153503418, "global_step": 201918, "epoch": 1668} {"train_loss": -40.09669876098633, "global_step": 201919, "epoch": 1668} {"train_loss": -40.65978240966797, "global_step": 201920, "epoch": 1668} {"train_loss": -40.521358489990234, "global_step": 201921, "epoch": 1668} {"train_loss": -41.00196838378906, "global_step": 201922, "epoch": 1668} {"train_loss": -40.359806060791016, "global_step": 201923, "epoch": 1668} {"train_loss": -41.471981048583984, "global_step": 201924, "epoch": 1668} {"train_loss": -41.151893615722656, "global_step": 201925, "epoch": 1668} {"train_loss": -41.32176971435547, "global_step": 201926, "epoch": 1668} {"train_loss": -41.47880172729492, "global_step": 201927, "epoch": 1668} {"train_loss": -41.3114013671875, "global_step": 201928, "epoch": 1668} {"train_loss": -42.06720733642578, "global_step": 201929, "epoch": 1668} {"train_loss": -41.140682220458984, "global_step": 201930, "epoch": 1668} {"train_loss": -42.097412109375, "global_step": 201931, "epoch": 1668} {"train_loss": -41.20219039916992, "global_step": 201932, "epoch": 1668} {"train_loss": -41.78171157836914, "global_step": 201933, "epoch": 1668} {"train_loss": -41.4736442565918, "global_step": 201934, "epoch": 1668} {"train_loss": -41.638893127441406, "global_step": 201935, "epoch": 1668} {"train_loss": -41.80514144897461, "global_step": 201936, "epoch": 1668} {"train_loss": -41.179176330566406, "global_step": 201937, "epoch": 1668} {"train_loss": -41.82090377807617, "global_step": 201938, "epoch": 1668} {"train_loss": -41.12260818481445, "global_step": 201939, "epoch": 1668} {"train_loss": -41.78938674926758, "global_step": 201940, "epoch": 1668} {"train_loss": -41.62014389038086, "global_step": 201941, "epoch": 1668} {"train_loss": -42.316314697265625, "global_step": 201942, "epoch": 1668} {"train_loss": -41.13511657714844, "global_step": 201943, "epoch": 1668} {"train_loss": -41.637054443359375, "global_step": 201944, "epoch": 1668} {"train_loss": -41.4178581237793, "global_step": 201945, "epoch": 1668} {"train_loss": -41.74049758911133, "global_step": 201946, "epoch": 1668} {"train_loss": -42.19283676147461, "global_step": 201947, "epoch": 1668} {"train_loss": -41.11550600666645, "global_step": 201948, "epoch": 1668, "val_loss": 2585786.75} {"train_loss": -41.83024215698242, "global_step": 201949, "epoch": 1669} {"train_loss": -41.75456237792969, "global_step": 201950, "epoch": 1669} {"train_loss": -42.37374496459961, "global_step": 201951, "epoch": 1669} {"train_loss": -42.2285270690918, "global_step": 201952, "epoch": 1669} {"train_loss": -42.398529052734375, "global_step": 201953, "epoch": 1669} {"train_loss": -41.902278900146484, "global_step": 201954, "epoch": 1669} {"train_loss": -41.81534194946289, "global_step": 201955, "epoch": 1669} {"train_loss": -42.42029571533203, "global_step": 201956, "epoch": 1669} {"train_loss": -42.44951248168945, "global_step": 201957, "epoch": 1669} {"train_loss": -42.169429779052734, "global_step": 201958, "epoch": 1669} {"train_loss": -42.34760284423828, "global_step": 201959, "epoch": 1669} {"train_loss": -42.39571762084961, "global_step": 201960, "epoch": 1669} {"train_loss": -42.61616897583008, "global_step": 201961, "epoch": 1669} {"train_loss": -42.349952697753906, "global_step": 201962, "epoch": 1669} {"train_loss": -42.129459381103516, "global_step": 201963, "epoch": 1669} {"train_loss": -42.19488525390625, "global_step": 201964, "epoch": 1669} {"train_loss": -41.45038986206055, "global_step": 201965, "epoch": 1669} {"train_loss": -42.0138053894043, "global_step": 201966, "epoch": 1669} {"train_loss": -42.08126449584961, "global_step": 201967, "epoch": 1669} {"train_loss": -42.172542572021484, "global_step": 201968, "epoch": 1669} {"train_loss": -41.98667526245117, "global_step": 201969, "epoch": 1669} {"train_loss": -41.76070785522461, "global_step": 201970, "epoch": 1669} {"train_loss": -42.395076751708984, "global_step": 201971, "epoch": 1669} {"train_loss": -42.6453742980957, "global_step": 201972, "epoch": 1669} {"train_loss": -42.54781723022461, "global_step": 201973, "epoch": 1669} {"train_loss": -41.73057556152344, "global_step": 201974, "epoch": 1669} {"train_loss": -41.712074279785156, "global_step": 201975, "epoch": 1669} {"train_loss": -42.028812408447266, "global_step": 201976, "epoch": 1669} {"train_loss": -41.895408630371094, "global_step": 201977, "epoch": 1669} {"train_loss": -42.361541748046875, "global_step": 201978, "epoch": 1669} {"train_loss": -41.906105041503906, "global_step": 201979, "epoch": 1669} {"train_loss": -40.228633880615234, "global_step": 201980, "epoch": 1669} {"train_loss": -38.071624755859375, "global_step": 201981, "epoch": 1669} {"train_loss": -37.04909896850586, "global_step": 201982, "epoch": 1669} {"train_loss": -38.31240463256836, "global_step": 201983, "epoch": 1669} {"train_loss": -40.9451789855957, "global_step": 201984, "epoch": 1669} {"train_loss": -42.436317443847656, "global_step": 201985, "epoch": 1669} {"train_loss": -39.61687088012695, "global_step": 201986, "epoch": 1669} {"train_loss": -37.95109939575195, "global_step": 201987, "epoch": 1669} {"train_loss": -39.4754638671875, "global_step": 201988, "epoch": 1669} {"train_loss": -41.52075958251953, "global_step": 201989, "epoch": 1669} {"train_loss": -38.343505859375, "global_step": 201990, "epoch": 1669} {"train_loss": -38.00086975097656, "global_step": 201991, "epoch": 1669} {"train_loss": -41.730831146240234, "global_step": 201992, "epoch": 1669} {"train_loss": -39.72310256958008, "global_step": 201993, "epoch": 1669} {"train_loss": -40.76653289794922, "global_step": 201994, "epoch": 1669} {"train_loss": -40.79996109008789, "global_step": 201995, "epoch": 1669} {"train_loss": -40.12459182739258, "global_step": 201996, "epoch": 1669} {"train_loss": -41.723724365234375, "global_step": 201997, "epoch": 1669} {"train_loss": -40.14341735839844, "global_step": 201998, "epoch": 1669} {"train_loss": -41.31000518798828, "global_step": 201999, "epoch": 1669} {"train_loss": -41.324745178222656, "global_step": 202000, "epoch": 1669} {"train_loss": -41.482147216796875, "global_step": 202001, "epoch": 1669} {"train_loss": -41.522762298583984, "global_step": 202002, "epoch": 1669} {"train_loss": -41.54413986206055, "global_step": 202003, "epoch": 1669} {"train_loss": -40.64368438720703, "global_step": 202004, "epoch": 1669} {"train_loss": -41.31831741333008, "global_step": 202005, "epoch": 1669} {"train_loss": -41.4807243347168, "global_step": 202006, "epoch": 1669} {"train_loss": -41.40168762207031, "global_step": 202007, "epoch": 1669} {"train_loss": -41.34519577026367, "global_step": 202008, "epoch": 1669} {"train_loss": -42.04740524291992, "global_step": 202009, "epoch": 1669} {"train_loss": -42.05593490600586, "global_step": 202010, "epoch": 1669} {"train_loss": -42.1593132019043, "global_step": 202011, "epoch": 1669} {"train_loss": -41.34141159057617, "global_step": 202012, "epoch": 1669} {"train_loss": -41.27418518066406, "global_step": 202013, "epoch": 1669} {"train_loss": -41.980953216552734, "global_step": 202014, "epoch": 1669} {"train_loss": -42.128780364990234, "global_step": 202015, "epoch": 1669} {"train_loss": -41.269771575927734, "global_step": 202016, "epoch": 1669} {"train_loss": -40.805999755859375, "global_step": 202017, "epoch": 1669} {"train_loss": -41.29587936401367, "global_step": 202018, "epoch": 1669} {"train_loss": -41.76944351196289, "global_step": 202019, "epoch": 1669} {"train_loss": -40.97249984741211, "global_step": 202020, "epoch": 1669} {"train_loss": -41.43817901611328, "global_step": 202021, "epoch": 1669} {"train_loss": -42.149513244628906, "global_step": 202022, "epoch": 1669} {"train_loss": -41.85310745239258, "global_step": 202023, "epoch": 1669} {"train_loss": -41.80463790893555, "global_step": 202024, "epoch": 1669} {"train_loss": -42.282264709472656, "global_step": 202025, "epoch": 1669} {"train_loss": -41.27155685424805, "global_step": 202026, "epoch": 1669} {"train_loss": -42.004417419433594, "global_step": 202027, "epoch": 1669} {"train_loss": -41.46943283081055, "global_step": 202028, "epoch": 1669} {"train_loss": -41.43588638305664, "global_step": 202029, "epoch": 1669} {"train_loss": -42.0782356262207, "global_step": 202030, "epoch": 1669} {"train_loss": -42.11367416381836, "global_step": 202031, "epoch": 1669} {"train_loss": -41.8299446105957, "global_step": 202032, "epoch": 1669} {"train_loss": -41.85073471069336, "global_step": 202033, "epoch": 1669} {"train_loss": -41.402801513671875, "global_step": 202034, "epoch": 1669} {"train_loss": -41.70962142944336, "global_step": 202035, "epoch": 1669} {"train_loss": -41.9932861328125, "global_step": 202036, "epoch": 1669} {"train_loss": -42.26348876953125, "global_step": 202037, "epoch": 1669} {"train_loss": -41.364803314208984, "global_step": 202038, "epoch": 1669} {"train_loss": -40.15452194213867, "global_step": 202039, "epoch": 1669} {"train_loss": -38.86323165893555, "global_step": 202040, "epoch": 1669} {"train_loss": -37.098140716552734, "global_step": 202041, "epoch": 1669} {"train_loss": -37.32207107543945, "global_step": 202042, "epoch": 1669} {"train_loss": -38.03976058959961, "global_step": 202043, "epoch": 1669} {"train_loss": -40.9266242980957, "global_step": 202044, "epoch": 1669} {"train_loss": -41.68059158325195, "global_step": 202045, "epoch": 1669} {"train_loss": -40.29457473754883, "global_step": 202046, "epoch": 1669} {"train_loss": -40.86868667602539, "global_step": 202047, "epoch": 1669} {"train_loss": -41.03463363647461, "global_step": 202048, "epoch": 1669} {"train_loss": -41.243953704833984, "global_step": 202049, "epoch": 1669} {"train_loss": -41.20623779296875, "global_step": 202050, "epoch": 1669} {"train_loss": -41.06348419189453, "global_step": 202051, "epoch": 1669} {"train_loss": -41.46873092651367, "global_step": 202052, "epoch": 1669} {"train_loss": -40.8258171081543, "global_step": 202053, "epoch": 1669} {"train_loss": -41.53742599487305, "global_step": 202054, "epoch": 1669} {"train_loss": -40.73155212402344, "global_step": 202055, "epoch": 1669} {"train_loss": -41.967529296875, "global_step": 202056, "epoch": 1669} {"train_loss": -41.250831604003906, "global_step": 202057, "epoch": 1669} {"train_loss": -41.5221061706543, "global_step": 202058, "epoch": 1669} {"train_loss": -41.54267120361328, "global_step": 202059, "epoch": 1669} {"train_loss": -40.93977355957031, "global_step": 202060, "epoch": 1669} {"train_loss": -41.81855392456055, "global_step": 202061, "epoch": 1669} {"train_loss": -40.86597442626953, "global_step": 202062, "epoch": 1669} {"train_loss": -41.47492218017578, "global_step": 202063, "epoch": 1669} {"train_loss": -41.78527069091797, "global_step": 202064, "epoch": 1669} {"train_loss": -40.96236038208008, "global_step": 202065, "epoch": 1669} {"train_loss": -41.54450607299805, "global_step": 202066, "epoch": 1669} {"train_loss": -41.786434173583984, "global_step": 202067, "epoch": 1669} {"train_loss": -41.17891311645508, "global_step": 202068, "epoch": 1669} {"train_loss": -41.26020570234819, "global_step": 202069, "epoch": 1669, "val_loss": 2563620.25} {"train_loss": -40.95713424682617, "global_step": 202070, "epoch": 1670} {"train_loss": -40.9078369140625, "global_step": 202071, "epoch": 1670} {"train_loss": -42.139644622802734, "global_step": 202072, "epoch": 1670} {"train_loss": -41.52364730834961, "global_step": 202073, "epoch": 1670} {"train_loss": -40.7575798034668, "global_step": 202074, "epoch": 1670} {"train_loss": -41.72960662841797, "global_step": 202075, "epoch": 1670} {"train_loss": -40.97968292236328, "global_step": 202076, "epoch": 1670} {"train_loss": -41.06475830078125, "global_step": 202077, "epoch": 1670} {"train_loss": -40.68288803100586, "global_step": 202078, "epoch": 1670} {"train_loss": -42.0370979309082, "global_step": 202079, "epoch": 1670} {"train_loss": -41.225807189941406, "global_step": 202080, "epoch": 1670} {"train_loss": -42.042869567871094, "global_step": 202081, "epoch": 1670} {"train_loss": -41.40320587158203, "global_step": 202082, "epoch": 1670} {"train_loss": -41.92213821411133, "global_step": 202083, "epoch": 1670} {"train_loss": -41.6573371887207, "global_step": 202084, "epoch": 1670} {"train_loss": -41.82413864135742, "global_step": 202085, "epoch": 1670} {"train_loss": -42.44485092163086, "global_step": 202086, "epoch": 1670} {"train_loss": -40.87763977050781, "global_step": 202087, "epoch": 1670} {"train_loss": -39.207035064697266, "global_step": 202088, "epoch": 1670} {"train_loss": -41.327327728271484, "global_step": 202089, "epoch": 1670} {"train_loss": -39.92510986328125, "global_step": 202090, "epoch": 1670} {"train_loss": -39.93790054321289, "global_step": 202091, "epoch": 1670} {"train_loss": -41.548580169677734, "global_step": 202092, "epoch": 1670} {"train_loss": -40.61133575439453, "global_step": 202093, "epoch": 1670} {"train_loss": -39.52816390991211, "global_step": 202094, "epoch": 1670} {"train_loss": -39.33306884765625, "global_step": 202095, "epoch": 1670} {"train_loss": -41.52302932739258, "global_step": 202096, "epoch": 1670} {"train_loss": -40.18281936645508, "global_step": 202097, "epoch": 1670} {"train_loss": -38.57707977294922, "global_step": 202098, "epoch": 1670} {"train_loss": -38.259796142578125, "global_step": 202099, "epoch": 1670} {"train_loss": -41.65980529785156, "global_step": 202100, "epoch": 1670} {"train_loss": -37.789302825927734, "global_step": 202101, "epoch": 1670} {"train_loss": -37.30317306518555, "global_step": 202102, "epoch": 1670} {"train_loss": -41.915279388427734, "global_step": 202103, "epoch": 1670} {"train_loss": -36.9593391418457, "global_step": 202104, "epoch": 1670} {"train_loss": -40.75944900512695, "global_step": 202105, "epoch": 1670} {"train_loss": -40.01411437988281, "global_step": 202106, "epoch": 1670} {"train_loss": -39.50026321411133, "global_step": 202107, "epoch": 1670} {"train_loss": -41.26609420776367, "global_step": 202108, "epoch": 1670} {"train_loss": -38.63810348510742, "global_step": 202109, "epoch": 1670} {"train_loss": -41.051204681396484, "global_step": 202110, "epoch": 1670} {"train_loss": -40.4983024597168, "global_step": 202111, "epoch": 1670} {"train_loss": -40.98042678833008, "global_step": 202112, "epoch": 1670} {"train_loss": -41.18109893798828, "global_step": 202113, "epoch": 1670} {"train_loss": -39.47218704223633, "global_step": 202114, "epoch": 1670} {"train_loss": -40.95040512084961, "global_step": 202115, "epoch": 1670} {"train_loss": -40.597862243652344, "global_step": 202116, "epoch": 1670} {"train_loss": -40.70133590698242, "global_step": 202117, "epoch": 1670} {"train_loss": -41.44257736206055, "global_step": 202118, "epoch": 1670} {"train_loss": -41.16142654418945, "global_step": 202119, "epoch": 1670} {"train_loss": -41.59811019897461, "global_step": 202120, "epoch": 1670} {"train_loss": -40.90250015258789, "global_step": 202121, "epoch": 1670} {"train_loss": -41.0676155090332, "global_step": 202122, "epoch": 1670} {"train_loss": -41.37904357910156, "global_step": 202123, "epoch": 1670} {"train_loss": -40.61385726928711, "global_step": 202124, "epoch": 1670} {"train_loss": -41.79896926879883, "global_step": 202125, "epoch": 1670} {"train_loss": -40.56048583984375, "global_step": 202126, "epoch": 1670} {"train_loss": -41.82709884643555, "global_step": 202127, "epoch": 1670} {"train_loss": -41.44275665283203, "global_step": 202128, "epoch": 1670} {"train_loss": -41.98261642456055, "global_step": 202129, "epoch": 1670} {"train_loss": -40.9990348815918, "global_step": 202130, "epoch": 1670} {"train_loss": -41.80198669433594, "global_step": 202131, "epoch": 1670} {"train_loss": -41.320167541503906, "global_step": 202132, "epoch": 1670} {"train_loss": -41.65070343017578, "global_step": 202133, "epoch": 1670} {"train_loss": -42.159271240234375, "global_step": 202134, "epoch": 1670} {"train_loss": -41.7767333984375, "global_step": 202135, "epoch": 1670} {"train_loss": -41.67994689941406, "global_step": 202136, "epoch": 1670} {"train_loss": -41.17117691040039, "global_step": 202137, "epoch": 1670} {"train_loss": -42.09255599975586, "global_step": 202138, "epoch": 1670} {"train_loss": -41.18385696411133, "global_step": 202139, "epoch": 1670} {"train_loss": -41.85268020629883, "global_step": 202140, "epoch": 1670} {"train_loss": -41.6351432800293, "global_step": 202141, "epoch": 1670} {"train_loss": -41.99943161010742, "global_step": 202142, "epoch": 1670} {"train_loss": -41.94370651245117, "global_step": 202143, "epoch": 1670} {"train_loss": -41.468780517578125, "global_step": 202144, "epoch": 1670} {"train_loss": -42.06648635864258, "global_step": 202145, "epoch": 1670} {"train_loss": -41.639862060546875, "global_step": 202146, "epoch": 1670} {"train_loss": -42.170406341552734, "global_step": 202147, "epoch": 1670} {"train_loss": -41.332706451416016, "global_step": 202148, "epoch": 1670} {"train_loss": -42.1810417175293, "global_step": 202149, "epoch": 1670} {"train_loss": -41.980140686035156, "global_step": 202150, "epoch": 1670} {"train_loss": -42.19629669189453, "global_step": 202151, "epoch": 1670} {"train_loss": -41.59897994995117, "global_step": 202152, "epoch": 1670} {"train_loss": -41.9483528137207, "global_step": 202153, "epoch": 1670} {"train_loss": -41.3345832824707, "global_step": 202154, "epoch": 1670} {"train_loss": -42.676815032958984, "global_step": 202155, "epoch": 1670} {"train_loss": -42.38390350341797, "global_step": 202156, "epoch": 1670} {"train_loss": -42.1876220703125, "global_step": 202157, "epoch": 1670} {"train_loss": -42.496524810791016, "global_step": 202158, "epoch": 1670} {"train_loss": -42.79490661621094, "global_step": 202159, "epoch": 1670} {"train_loss": -42.518760681152344, "global_step": 202160, "epoch": 1670} {"train_loss": -42.527130126953125, "global_step": 202161, "epoch": 1670} {"train_loss": -42.87948989868164, "global_step": 202162, "epoch": 1670} {"train_loss": -42.500732421875, "global_step": 202163, "epoch": 1670} {"train_loss": -42.526241302490234, "global_step": 202164, "epoch": 1670} {"train_loss": -42.89377212524414, "global_step": 202165, "epoch": 1670} {"train_loss": -42.68204879760742, "global_step": 202166, "epoch": 1670} {"train_loss": -42.688331604003906, "global_step": 202167, "epoch": 1670} {"train_loss": -42.812191009521484, "global_step": 202168, "epoch": 1670} {"train_loss": -42.62050247192383, "global_step": 202169, "epoch": 1670} {"train_loss": -42.830501556396484, "global_step": 202170, "epoch": 1670} {"train_loss": -42.67331314086914, "global_step": 202171, "epoch": 1670} {"train_loss": -42.58244323730469, "global_step": 202172, "epoch": 1670} {"train_loss": -42.37611389160156, "global_step": 202173, "epoch": 1670} {"train_loss": -43.1005973815918, "global_step": 202174, "epoch": 1670} {"train_loss": -42.68496322631836, "global_step": 202175, "epoch": 1670} {"train_loss": -43.45590591430664, "global_step": 202176, "epoch": 1670} {"train_loss": -42.7782096862793, "global_step": 202177, "epoch": 1670} {"train_loss": -42.546043395996094, "global_step": 202178, "epoch": 1670} {"train_loss": -42.54898452758789, "global_step": 202179, "epoch": 1670} {"train_loss": -42.585182189941406, "global_step": 202180, "epoch": 1670} {"train_loss": -42.43165969848633, "global_step": 202181, "epoch": 1670} {"train_loss": -41.72318649291992, "global_step": 202182, "epoch": 1670} {"train_loss": -42.929195404052734, "global_step": 202183, "epoch": 1670} {"train_loss": -42.94440841674805, "global_step": 202184, "epoch": 1670} {"train_loss": -42.62003707885742, "global_step": 202185, "epoch": 1670} {"train_loss": -42.77346420288086, "global_step": 202186, "epoch": 1670} {"train_loss": -42.323516845703125, "global_step": 202187, "epoch": 1670} {"train_loss": -40.85520553588867, "global_step": 202188, "epoch": 1670} {"train_loss": -39.230743408203125, "global_step": 202189, "epoch": 1670} {"train_loss": -41.399504827073784, "global_step": 202190, "epoch": 1670, "val_loss": 2525547.0} {"train_loss": -29.84527587890625, "global_step": 202191, "epoch": 1671} {"train_loss": -29.45798110961914, "global_step": 202192, "epoch": 1671} {"train_loss": -38.279335021972656, "global_step": 202193, "epoch": 1671} {"train_loss": -36.59503936767578, "global_step": 202194, "epoch": 1671} {"train_loss": -32.537776947021484, "global_step": 202195, "epoch": 1671} {"train_loss": -33.20964431762695, "global_step": 202196, "epoch": 1671} {"train_loss": -36.499176025390625, "global_step": 202197, "epoch": 1671} {"train_loss": -35.15752029418945, "global_step": 202198, "epoch": 1671} {"train_loss": -37.925575256347656, "global_step": 202199, "epoch": 1671} {"train_loss": -37.91637420654297, "global_step": 202200, "epoch": 1671} {"train_loss": -36.1756706237793, "global_step": 202201, "epoch": 1671} {"train_loss": -40.35563278198242, "global_step": 202202, "epoch": 1671} {"train_loss": -38.781105041503906, "global_step": 202203, "epoch": 1671} {"train_loss": -38.99884796142578, "global_step": 202204, "epoch": 1671} {"train_loss": -39.757381439208984, "global_step": 202205, "epoch": 1671} {"train_loss": -38.44782638549805, "global_step": 202206, "epoch": 1671} {"train_loss": -40.65986251831055, "global_step": 202207, "epoch": 1671} {"train_loss": -39.35750961303711, "global_step": 202208, "epoch": 1671} {"train_loss": -40.71763229370117, "global_step": 202209, "epoch": 1671} {"train_loss": -39.91731643676758, "global_step": 202210, "epoch": 1671} {"train_loss": -39.74215316772461, "global_step": 202211, "epoch": 1671} {"train_loss": -40.36418151855469, "global_step": 202212, "epoch": 1671} {"train_loss": -41.0063591003418, "global_step": 202213, "epoch": 1671} {"train_loss": -40.4943962097168, "global_step": 202214, "epoch": 1671} {"train_loss": -40.61748123168945, "global_step": 202215, "epoch": 1671} {"train_loss": -40.00309371948242, "global_step": 202216, "epoch": 1671} {"train_loss": -41.10761260986328, "global_step": 202217, "epoch": 1671} {"train_loss": -41.169837951660156, "global_step": 202218, "epoch": 1671} {"train_loss": -41.01374435424805, "global_step": 202219, "epoch": 1671} {"train_loss": -40.85491943359375, "global_step": 202220, "epoch": 1671} {"train_loss": -40.421607971191406, "global_step": 202221, "epoch": 1671} {"train_loss": -41.060150146484375, "global_step": 202222, "epoch": 1671} {"train_loss": -41.59182357788086, "global_step": 202223, "epoch": 1671} {"train_loss": -41.61457443237305, "global_step": 202224, "epoch": 1671} {"train_loss": -41.53892135620117, "global_step": 202225, "epoch": 1671} {"train_loss": -41.53228759765625, "global_step": 202226, "epoch": 1671} {"train_loss": -41.421756744384766, "global_step": 202227, "epoch": 1671} {"train_loss": -41.545772552490234, "global_step": 202228, "epoch": 1671} {"train_loss": -41.275733947753906, "global_step": 202229, "epoch": 1671} {"train_loss": -41.2813835144043, "global_step": 202230, "epoch": 1671} {"train_loss": -41.671688079833984, "global_step": 202231, "epoch": 1671} {"train_loss": -41.54676055908203, "global_step": 202232, "epoch": 1671} {"train_loss": -41.971614837646484, "global_step": 202233, "epoch": 1671} {"train_loss": -42.16817092895508, "global_step": 202234, "epoch": 1671} {"train_loss": -42.31354522705078, "global_step": 202235, "epoch": 1671} {"train_loss": -42.01011276245117, "global_step": 202236, "epoch": 1671} {"train_loss": -42.09983444213867, "global_step": 202237, "epoch": 1671} {"train_loss": -42.15198516845703, "global_step": 202238, "epoch": 1671} {"train_loss": -42.02486038208008, "global_step": 202239, "epoch": 1671} {"train_loss": -42.19797897338867, "global_step": 202240, "epoch": 1671} {"train_loss": -41.93132400512695, "global_step": 202241, "epoch": 1671} {"train_loss": -41.792049407958984, "global_step": 202242, "epoch": 1671} {"train_loss": -42.11124801635742, "global_step": 202243, "epoch": 1671} {"train_loss": -42.36896514892578, "global_step": 202244, "epoch": 1671} {"train_loss": -42.281898498535156, "global_step": 202245, "epoch": 1671} {"train_loss": -42.33681869506836, "global_step": 202246, "epoch": 1671} {"train_loss": -42.20158386230469, "global_step": 202247, "epoch": 1671} {"train_loss": -42.55918884277344, "global_step": 202248, "epoch": 1671} {"train_loss": -42.550941467285156, "global_step": 202249, "epoch": 1671} {"train_loss": -42.28207015991211, "global_step": 202250, "epoch": 1671} {"train_loss": -42.4003791809082, "global_step": 202251, "epoch": 1671} {"train_loss": -42.39396286010742, "global_step": 202252, "epoch": 1671} {"train_loss": -42.62541961669922, "global_step": 202253, "epoch": 1671} {"train_loss": -43.11720657348633, "global_step": 202254, "epoch": 1671} {"train_loss": -42.3006591796875, "global_step": 202255, "epoch": 1671} {"train_loss": -42.282283782958984, "global_step": 202256, "epoch": 1671} {"train_loss": -42.767059326171875, "global_step": 202257, "epoch": 1671} {"train_loss": -42.38654708862305, "global_step": 202258, "epoch": 1671} {"train_loss": -42.8829345703125, "global_step": 202259, "epoch": 1671} {"train_loss": -42.728355407714844, "global_step": 202260, "epoch": 1671} {"train_loss": -42.52864456176758, "global_step": 202261, "epoch": 1671} {"train_loss": -42.732460021972656, "global_step": 202262, "epoch": 1671} {"train_loss": -42.4498176574707, "global_step": 202263, "epoch": 1671} {"train_loss": -43.0418815612793, "global_step": 202264, "epoch": 1671} {"train_loss": -42.84475326538086, "global_step": 202265, "epoch": 1671} {"train_loss": -43.093299865722656, "global_step": 202266, "epoch": 1671} {"train_loss": -42.792510986328125, "global_step": 202267, "epoch": 1671} {"train_loss": -42.58883285522461, "global_step": 202268, "epoch": 1671} {"train_loss": -41.98876953125, "global_step": 202269, "epoch": 1671} {"train_loss": -41.81766891479492, "global_step": 202270, "epoch": 1671} {"train_loss": -41.57322311401367, "global_step": 202271, "epoch": 1671} {"train_loss": -41.21895217895508, "global_step": 202272, "epoch": 1671} {"train_loss": -40.36594772338867, "global_step": 202273, "epoch": 1671} {"train_loss": -39.96268844604492, "global_step": 202274, "epoch": 1671} {"train_loss": -40.413394927978516, "global_step": 202275, "epoch": 1671} {"train_loss": -41.02759552001953, "global_step": 202276, "epoch": 1671} {"train_loss": -43.00419235229492, "global_step": 202277, "epoch": 1671} {"train_loss": -41.679290771484375, "global_step": 202278, "epoch": 1671} {"train_loss": -39.85535430908203, "global_step": 202279, "epoch": 1671} {"train_loss": -39.9890251159668, "global_step": 202280, "epoch": 1671} {"train_loss": -41.92755889892578, "global_step": 202281, "epoch": 1671} {"train_loss": -41.868526458740234, "global_step": 202282, "epoch": 1671} {"train_loss": -39.63968276977539, "global_step": 202283, "epoch": 1671} {"train_loss": -39.149898529052734, "global_step": 202284, "epoch": 1671} {"train_loss": -38.45161056518555, "global_step": 202285, "epoch": 1671} {"train_loss": -39.311100006103516, "global_step": 202286, "epoch": 1671} {"train_loss": -40.66356658935547, "global_step": 202287, "epoch": 1671} {"train_loss": -39.26581573486328, "global_step": 202288, "epoch": 1671} {"train_loss": -38.557735443115234, "global_step": 202289, "epoch": 1671} {"train_loss": -38.75846481323242, "global_step": 202290, "epoch": 1671} {"train_loss": -40.468502044677734, "global_step": 202291, "epoch": 1671} {"train_loss": -36.697853088378906, "global_step": 202292, "epoch": 1671} {"train_loss": -38.471343994140625, "global_step": 202293, "epoch": 1671} {"train_loss": -39.97785186767578, "global_step": 202294, "epoch": 1671} {"train_loss": -40.359130859375, "global_step": 202295, "epoch": 1671} {"train_loss": -39.23766326904297, "global_step": 202296, "epoch": 1671} {"train_loss": -41.31447219848633, "global_step": 202297, "epoch": 1671} {"train_loss": -40.41603088378906, "global_step": 202298, "epoch": 1671} {"train_loss": -39.28145217895508, "global_step": 202299, "epoch": 1671} {"train_loss": -42.023231506347656, "global_step": 202300, "epoch": 1671} {"train_loss": -39.82339859008789, "global_step": 202301, "epoch": 1671} {"train_loss": -40.556556701660156, "global_step": 202302, "epoch": 1671} {"train_loss": -41.223018646240234, "global_step": 202303, "epoch": 1671} {"train_loss": -41.23822784423828, "global_step": 202304, "epoch": 1671} {"train_loss": -41.231746673583984, "global_step": 202305, "epoch": 1671} {"train_loss": -40.925689697265625, "global_step": 202306, "epoch": 1671} {"train_loss": -41.43595504760742, "global_step": 202307, "epoch": 1671} {"train_loss": -41.49692916870117, "global_step": 202308, "epoch": 1671} {"train_loss": -41.808712005615234, "global_step": 202309, "epoch": 1671} {"train_loss": -41.32563018798828, "global_step": 202310, "epoch": 1671} {"train_loss": -40.60147734712963, "global_step": 202311, "epoch": 1671, "val_loss": 2553852.75} {"train_loss": -41.01902389526367, "global_step": 202312, "epoch": 1672} {"train_loss": -42.10065460205078, "global_step": 202313, "epoch": 1672} {"train_loss": -42.17119216918945, "global_step": 202314, "epoch": 1672} {"train_loss": -42.324378967285156, "global_step": 202315, "epoch": 1672} {"train_loss": -42.178157806396484, "global_step": 202316, "epoch": 1672} {"train_loss": -42.165443420410156, "global_step": 202317, "epoch": 1672} {"train_loss": -42.51504135131836, "global_step": 202318, "epoch": 1672} {"train_loss": -42.41256332397461, "global_step": 202319, "epoch": 1672} {"train_loss": -42.499916076660156, "global_step": 202320, "epoch": 1672} {"train_loss": -41.8295783996582, "global_step": 202321, "epoch": 1672} {"train_loss": -42.365474700927734, "global_step": 202322, "epoch": 1672} {"train_loss": -42.631404876708984, "global_step": 202323, "epoch": 1672} {"train_loss": -42.242427825927734, "global_step": 202324, "epoch": 1672} {"train_loss": -42.183448791503906, "global_step": 202325, "epoch": 1672} {"train_loss": -42.63155746459961, "global_step": 202326, "epoch": 1672} {"train_loss": -42.78456115722656, "global_step": 202327, "epoch": 1672} {"train_loss": -42.646278381347656, "global_step": 202328, "epoch": 1672} {"train_loss": -42.66694259643555, "global_step": 202329, "epoch": 1672} {"train_loss": -42.93156051635742, "global_step": 202330, "epoch": 1672} {"train_loss": -42.439910888671875, "global_step": 202331, "epoch": 1672} {"train_loss": -42.75031280517578, "global_step": 202332, "epoch": 1672} {"train_loss": -42.52671432495117, "global_step": 202333, "epoch": 1672} {"train_loss": -42.61198806762695, "global_step": 202334, "epoch": 1672} {"train_loss": -42.42090606689453, "global_step": 202335, "epoch": 1672} {"train_loss": -42.61442184448242, "global_step": 202336, "epoch": 1672} {"train_loss": -41.609596252441406, "global_step": 202337, "epoch": 1672} {"train_loss": -42.731014251708984, "global_step": 202338, "epoch": 1672} {"train_loss": -42.31831359863281, "global_step": 202339, "epoch": 1672} {"train_loss": -43.01360321044922, "global_step": 202340, "epoch": 1672} {"train_loss": -42.851715087890625, "global_step": 202341, "epoch": 1672} {"train_loss": -42.53866195678711, "global_step": 202342, "epoch": 1672} {"train_loss": -41.70172882080078, "global_step": 202343, "epoch": 1672} {"train_loss": -41.68993377685547, "global_step": 202344, "epoch": 1672} {"train_loss": -41.33475875854492, "global_step": 202345, "epoch": 1672} {"train_loss": -41.92295455932617, "global_step": 202346, "epoch": 1672} {"train_loss": -41.87672424316406, "global_step": 202347, "epoch": 1672} {"train_loss": -41.192962646484375, "global_step": 202348, "epoch": 1672} {"train_loss": -42.418121337890625, "global_step": 202349, "epoch": 1672} {"train_loss": -42.1268424987793, "global_step": 202350, "epoch": 1672} {"train_loss": -40.9774169921875, "global_step": 202351, "epoch": 1672} {"train_loss": -41.607086181640625, "global_step": 202352, "epoch": 1672} {"train_loss": -37.5332145690918, "global_step": 202353, "epoch": 1672} {"train_loss": -39.088233947753906, "global_step": 202354, "epoch": 1672} {"train_loss": -41.04192352294922, "global_step": 202355, "epoch": 1672} {"train_loss": -41.2234001159668, "global_step": 202356, "epoch": 1672} {"train_loss": -42.326358795166016, "global_step": 202357, "epoch": 1672} {"train_loss": -41.78540802001953, "global_step": 202358, "epoch": 1672} {"train_loss": -40.6581916809082, "global_step": 202359, "epoch": 1672} {"train_loss": -39.32407760620117, "global_step": 202360, "epoch": 1672} {"train_loss": -39.78925704956055, "global_step": 202361, "epoch": 1672} {"train_loss": -42.15420913696289, "global_step": 202362, "epoch": 1672} {"train_loss": -41.29777908325195, "global_step": 202363, "epoch": 1672} {"train_loss": -40.08220672607422, "global_step": 202364, "epoch": 1672} {"train_loss": -41.930599212646484, "global_step": 202365, "epoch": 1672} {"train_loss": -40.84717559814453, "global_step": 202366, "epoch": 1672} {"train_loss": -39.62556076049805, "global_step": 202367, "epoch": 1672} {"train_loss": -39.1318359375, "global_step": 202368, "epoch": 1672} {"train_loss": -41.191505432128906, "global_step": 202369, "epoch": 1672} {"train_loss": -41.677467346191406, "global_step": 202370, "epoch": 1672} {"train_loss": -40.58384323120117, "global_step": 202371, "epoch": 1672} {"train_loss": -40.94392395019531, "global_step": 202372, "epoch": 1672} {"train_loss": -40.44054412841797, "global_step": 202373, "epoch": 1672} {"train_loss": -41.37118148803711, "global_step": 202374, "epoch": 1672} {"train_loss": -40.62209701538086, "global_step": 202375, "epoch": 1672} {"train_loss": -41.39460372924805, "global_step": 202376, "epoch": 1672} {"train_loss": -41.6971321105957, "global_step": 202377, "epoch": 1672} {"train_loss": -41.39859390258789, "global_step": 202378, "epoch": 1672} {"train_loss": -41.63519287109375, "global_step": 202379, "epoch": 1672} {"train_loss": -41.13037872314453, "global_step": 202380, "epoch": 1672} {"train_loss": -40.97890090942383, "global_step": 202381, "epoch": 1672} {"train_loss": -42.150543212890625, "global_step": 202382, "epoch": 1672} {"train_loss": -41.76903533935547, "global_step": 202383, "epoch": 1672} {"train_loss": -42.31695556640625, "global_step": 202384, "epoch": 1672} {"train_loss": -42.05610275268555, "global_step": 202385, "epoch": 1672} {"train_loss": -42.23115158081055, "global_step": 202386, "epoch": 1672} {"train_loss": -42.24299240112305, "global_step": 202387, "epoch": 1672} {"train_loss": -41.40220260620117, "global_step": 202388, "epoch": 1672} {"train_loss": -41.95856857299805, "global_step": 202389, "epoch": 1672} {"train_loss": -41.817298889160156, "global_step": 202390, "epoch": 1672} {"train_loss": -42.202327728271484, "global_step": 202391, "epoch": 1672} {"train_loss": -41.98198318481445, "global_step": 202392, "epoch": 1672} {"train_loss": -41.60042953491211, "global_step": 202393, "epoch": 1672} {"train_loss": -42.73220443725586, "global_step": 202394, "epoch": 1672} {"train_loss": -42.711936950683594, "global_step": 202395, "epoch": 1672} {"train_loss": -42.58000564575195, "global_step": 202396, "epoch": 1672} {"train_loss": -42.47154998779297, "global_step": 202397, "epoch": 1672} {"train_loss": -42.003902435302734, "global_step": 202398, "epoch": 1672} {"train_loss": -42.51765441894531, "global_step": 202399, "epoch": 1672} {"train_loss": -42.95612335205078, "global_step": 202400, "epoch": 1672} {"train_loss": -42.6901741027832, "global_step": 202401, "epoch": 1672} {"train_loss": -42.48394775390625, "global_step": 202402, "epoch": 1672} {"train_loss": -42.464656829833984, "global_step": 202403, "epoch": 1672} {"train_loss": -42.82427978515625, "global_step": 202404, "epoch": 1672} {"train_loss": -42.960174560546875, "global_step": 202405, "epoch": 1672} {"train_loss": -39.64658737182617, "global_step": 202406, "epoch": 1672} {"train_loss": -42.40034866333008, "global_step": 202407, "epoch": 1672} {"train_loss": -40.79624557495117, "global_step": 202408, "epoch": 1672} {"train_loss": -42.31769943237305, "global_step": 202409, "epoch": 1672} {"train_loss": -42.65631866455078, "global_step": 202410, "epoch": 1672} {"train_loss": -42.164161682128906, "global_step": 202411, "epoch": 1672} {"train_loss": -41.10049819946289, "global_step": 202412, "epoch": 1672} {"train_loss": -42.67656707763672, "global_step": 202413, "epoch": 1672} {"train_loss": -42.780555725097656, "global_step": 202414, "epoch": 1672} {"train_loss": -42.095760345458984, "global_step": 202415, "epoch": 1672} {"train_loss": -42.44183349609375, "global_step": 202416, "epoch": 1672} {"train_loss": -42.242088317871094, "global_step": 202417, "epoch": 1672} {"train_loss": -42.387874603271484, "global_step": 202418, "epoch": 1672} {"train_loss": -41.58761215209961, "global_step": 202419, "epoch": 1672} {"train_loss": -42.06034469604492, "global_step": 202420, "epoch": 1672} {"train_loss": -42.5805549621582, "global_step": 202421, "epoch": 1672} {"train_loss": -41.727874755859375, "global_step": 202422, "epoch": 1672} {"train_loss": -41.86918258666992, "global_step": 202423, "epoch": 1672} {"train_loss": -42.41459274291992, "global_step": 202424, "epoch": 1672} {"train_loss": -41.462181091308594, "global_step": 202425, "epoch": 1672} {"train_loss": -42.80500411987305, "global_step": 202426, "epoch": 1672} {"train_loss": -42.25416946411133, "global_step": 202427, "epoch": 1672} {"train_loss": -42.65139389038086, "global_step": 202428, "epoch": 1672} {"train_loss": -42.59965896606445, "global_step": 202429, "epoch": 1672} {"train_loss": -41.839839935302734, "global_step": 202430, "epoch": 1672} {"train_loss": -40.85415267944336, "global_step": 202431, "epoch": 1672} {"train_loss": -41.84234348013381, "global_step": 202432, "epoch": 1672, "val_loss": 2488588.75} {"train_loss": -41.2432975769043, "global_step": 202433, "epoch": 1673} {"train_loss": -41.10383605957031, "global_step": 202434, "epoch": 1673} {"train_loss": -42.396602630615234, "global_step": 202435, "epoch": 1673} {"train_loss": -41.62806701660156, "global_step": 202436, "epoch": 1673} {"train_loss": -39.98189163208008, "global_step": 202437, "epoch": 1673} {"train_loss": -39.91794204711914, "global_step": 202438, "epoch": 1673} {"train_loss": -40.19426345825195, "global_step": 202439, "epoch": 1673} {"train_loss": -41.5858154296875, "global_step": 202440, "epoch": 1673} {"train_loss": -40.64878463745117, "global_step": 202441, "epoch": 1673} {"train_loss": -38.001705169677734, "global_step": 202442, "epoch": 1673} {"train_loss": -40.00602340698242, "global_step": 202443, "epoch": 1673} {"train_loss": -40.09324264526367, "global_step": 202444, "epoch": 1673} {"train_loss": -41.58091354370117, "global_step": 202445, "epoch": 1673} {"train_loss": -38.948585510253906, "global_step": 202446, "epoch": 1673} {"train_loss": -38.559593200683594, "global_step": 202447, "epoch": 1673} {"train_loss": -40.89573287963867, "global_step": 202448, "epoch": 1673} {"train_loss": -40.09394073486328, "global_step": 202449, "epoch": 1673} {"train_loss": -39.51813507080078, "global_step": 202450, "epoch": 1673} {"train_loss": -41.14344024658203, "global_step": 202451, "epoch": 1673} {"train_loss": -41.57501220703125, "global_step": 202452, "epoch": 1673} {"train_loss": -38.1979866027832, "global_step": 202453, "epoch": 1673} {"train_loss": -40.359130859375, "global_step": 202454, "epoch": 1673} {"train_loss": -37.80292892456055, "global_step": 202455, "epoch": 1673} {"train_loss": -40.79117965698242, "global_step": 202456, "epoch": 1673} {"train_loss": -41.3964729309082, "global_step": 202457, "epoch": 1673} {"train_loss": -41.88753890991211, "global_step": 202458, "epoch": 1673} {"train_loss": -39.882198333740234, "global_step": 202459, "epoch": 1673} {"train_loss": -41.91407775878906, "global_step": 202460, "epoch": 1673} {"train_loss": -40.478572845458984, "global_step": 202461, "epoch": 1673} {"train_loss": -41.24285888671875, "global_step": 202462, "epoch": 1673} {"train_loss": -40.700538635253906, "global_step": 202463, "epoch": 1673} {"train_loss": -40.34651565551758, "global_step": 202464, "epoch": 1673} {"train_loss": -39.82827377319336, "global_step": 202465, "epoch": 1673} {"train_loss": -40.13404083251953, "global_step": 202466, "epoch": 1673} {"train_loss": -41.29413986206055, "global_step": 202467, "epoch": 1673} {"train_loss": -41.66903305053711, "global_step": 202468, "epoch": 1673} {"train_loss": -41.01078414916992, "global_step": 202469, "epoch": 1673} {"train_loss": -40.7206916809082, "global_step": 202470, "epoch": 1673} {"train_loss": -39.833702087402344, "global_step": 202471, "epoch": 1673} {"train_loss": -40.612449645996094, "global_step": 202472, "epoch": 1673} {"train_loss": -41.4018669128418, "global_step": 202473, "epoch": 1673} {"train_loss": -40.28746795654297, "global_step": 202474, "epoch": 1673} {"train_loss": -40.78076171875, "global_step": 202475, "epoch": 1673} {"train_loss": -40.73683166503906, "global_step": 202476, "epoch": 1673} {"train_loss": -40.77254867553711, "global_step": 202477, "epoch": 1673} {"train_loss": -42.24518585205078, "global_step": 202478, "epoch": 1673} {"train_loss": -41.52579879760742, "global_step": 202479, "epoch": 1673} {"train_loss": -42.49698257446289, "global_step": 202480, "epoch": 1673} {"train_loss": -40.998695373535156, "global_step": 202481, "epoch": 1673} {"train_loss": -41.71076583862305, "global_step": 202482, "epoch": 1673} {"train_loss": -41.9744873046875, "global_step": 202483, "epoch": 1673} {"train_loss": -42.01538848876953, "global_step": 202484, "epoch": 1673} {"train_loss": -41.65681076049805, "global_step": 202485, "epoch": 1673} {"train_loss": -42.12201690673828, "global_step": 202486, "epoch": 1673} {"train_loss": -42.28007125854492, "global_step": 202487, "epoch": 1673} {"train_loss": -41.0313720703125, "global_step": 202488, "epoch": 1673} {"train_loss": -42.92164993286133, "global_step": 202489, "epoch": 1673} {"train_loss": -42.55112838745117, "global_step": 202490, "epoch": 1673} {"train_loss": -42.33589553833008, "global_step": 202491, "epoch": 1673} {"train_loss": -42.790252685546875, "global_step": 202492, "epoch": 1673} {"train_loss": -41.175048828125, "global_step": 202493, "epoch": 1673} {"train_loss": -42.22075271606445, "global_step": 202494, "epoch": 1673} {"train_loss": -42.504852294921875, "global_step": 202495, "epoch": 1673} {"train_loss": -42.26844024658203, "global_step": 202496, "epoch": 1673} {"train_loss": -42.350379943847656, "global_step": 202497, "epoch": 1673} {"train_loss": -42.55916213989258, "global_step": 202498, "epoch": 1673} {"train_loss": -41.927608489990234, "global_step": 202499, "epoch": 1673} {"train_loss": -41.43124771118164, "global_step": 202500, "epoch": 1673} {"train_loss": -42.299190521240234, "global_step": 202501, "epoch": 1673} {"train_loss": -42.133113861083984, "global_step": 202502, "epoch": 1673} {"train_loss": -40.9752311706543, "global_step": 202503, "epoch": 1673} {"train_loss": -42.13825225830078, "global_step": 202504, "epoch": 1673} {"train_loss": -42.35993957519531, "global_step": 202505, "epoch": 1673} {"train_loss": -41.99479293823242, "global_step": 202506, "epoch": 1673} {"train_loss": -41.10591506958008, "global_step": 202507, "epoch": 1673} {"train_loss": -41.36158752441406, "global_step": 202508, "epoch": 1673} {"train_loss": -40.873043060302734, "global_step": 202509, "epoch": 1673} {"train_loss": -40.83823013305664, "global_step": 202510, "epoch": 1673} {"train_loss": -39.267982482910156, "global_step": 202511, "epoch": 1673} {"train_loss": -41.20380783081055, "global_step": 202512, "epoch": 1673} {"train_loss": -42.033321380615234, "global_step": 202513, "epoch": 1673} {"train_loss": -42.711700439453125, "global_step": 202514, "epoch": 1673} {"train_loss": -42.28738021850586, "global_step": 202515, "epoch": 1673} {"train_loss": -41.455909729003906, "global_step": 202516, "epoch": 1673} {"train_loss": -41.45746994018555, "global_step": 202517, "epoch": 1673} {"train_loss": -42.06106948852539, "global_step": 202518, "epoch": 1673} {"train_loss": -41.832489013671875, "global_step": 202519, "epoch": 1673} {"train_loss": -40.21390914916992, "global_step": 202520, "epoch": 1673} {"train_loss": -42.0393180847168, "global_step": 202521, "epoch": 1673} {"train_loss": -40.548038482666016, "global_step": 202522, "epoch": 1673} {"train_loss": -42.893455505371094, "global_step": 202523, "epoch": 1673} {"train_loss": -41.155635833740234, "global_step": 202524, "epoch": 1673} {"train_loss": -42.193572998046875, "global_step": 202525, "epoch": 1673} {"train_loss": -42.14551544189453, "global_step": 202526, "epoch": 1673} {"train_loss": -41.69395065307617, "global_step": 202527, "epoch": 1673} {"train_loss": -42.3391227722168, "global_step": 202528, "epoch": 1673} {"train_loss": -42.49263000488281, "global_step": 202529, "epoch": 1673} {"train_loss": -41.77962112426758, "global_step": 202530, "epoch": 1673} {"train_loss": -41.60430908203125, "global_step": 202531, "epoch": 1673} {"train_loss": -42.326900482177734, "global_step": 202532, "epoch": 1673} {"train_loss": -42.303157806396484, "global_step": 202533, "epoch": 1673} {"train_loss": -42.415260314941406, "global_step": 202534, "epoch": 1673} {"train_loss": -42.21574020385742, "global_step": 202535, "epoch": 1673} {"train_loss": -42.396480560302734, "global_step": 202536, "epoch": 1673} {"train_loss": -42.444549560546875, "global_step": 202537, "epoch": 1673} {"train_loss": -41.873023986816406, "global_step": 202538, "epoch": 1673} {"train_loss": -42.15641403198242, "global_step": 202539, "epoch": 1673} {"train_loss": -42.37394332885742, "global_step": 202540, "epoch": 1673} {"train_loss": -41.9531135559082, "global_step": 202541, "epoch": 1673} {"train_loss": -41.61881637573242, "global_step": 202542, "epoch": 1673} {"train_loss": -40.73379135131836, "global_step": 202543, "epoch": 1673} {"train_loss": -40.049224853515625, "global_step": 202544, "epoch": 1673} {"train_loss": -39.29057693481445, "global_step": 202545, "epoch": 1673} {"train_loss": -40.583919525146484, "global_step": 202546, "epoch": 1673} {"train_loss": -41.71051788330078, "global_step": 202547, "epoch": 1673} {"train_loss": -41.884971618652344, "global_step": 202548, "epoch": 1673} {"train_loss": -41.748592376708984, "global_step": 202549, "epoch": 1673} {"train_loss": -41.83816909790039, "global_step": 202550, "epoch": 1673} {"train_loss": -41.12836456298828, "global_step": 202551, "epoch": 1673} {"train_loss": -41.50592803955078, "global_step": 202552, "epoch": 1673} {"train_loss": -41.311184370813294, "global_step": 202553, "epoch": 1673, "val_loss": 2591941.25} {"train_loss": -40.74860763549805, "global_step": 202554, "epoch": 1674} {"train_loss": -38.591949462890625, "global_step": 202555, "epoch": 1674} {"train_loss": -37.61713790893555, "global_step": 202556, "epoch": 1674} {"train_loss": -39.2089729309082, "global_step": 202557, "epoch": 1674} {"train_loss": -40.821041107177734, "global_step": 202558, "epoch": 1674} {"train_loss": -38.796749114990234, "global_step": 202559, "epoch": 1674} {"train_loss": -39.32482147216797, "global_step": 202560, "epoch": 1674} {"train_loss": -40.19530487060547, "global_step": 202561, "epoch": 1674} {"train_loss": -38.85146713256836, "global_step": 202562, "epoch": 1674} {"train_loss": -37.73309326171875, "global_step": 202563, "epoch": 1674} {"train_loss": -38.1312141418457, "global_step": 202564, "epoch": 1674} {"train_loss": -39.4353141784668, "global_step": 202565, "epoch": 1674} {"train_loss": -39.527793884277344, "global_step": 202566, "epoch": 1674} {"train_loss": -39.94822692871094, "global_step": 202567, "epoch": 1674} {"train_loss": -39.5940055847168, "global_step": 202568, "epoch": 1674} {"train_loss": -39.819618225097656, "global_step": 202569, "epoch": 1674} {"train_loss": -40.22308349609375, "global_step": 202570, "epoch": 1674} {"train_loss": -41.38145065307617, "global_step": 202571, "epoch": 1674} {"train_loss": -41.11377716064453, "global_step": 202572, "epoch": 1674} {"train_loss": -41.02899169921875, "global_step": 202573, "epoch": 1674} {"train_loss": -40.710872650146484, "global_step": 202574, "epoch": 1674} {"train_loss": -41.95880126953125, "global_step": 202575, "epoch": 1674} {"train_loss": -40.30618667602539, "global_step": 202576, "epoch": 1674} {"train_loss": -41.649742126464844, "global_step": 202577, "epoch": 1674} {"train_loss": -41.6005973815918, "global_step": 202578, "epoch": 1674} {"train_loss": -41.35124588012695, "global_step": 202579, "epoch": 1674} {"train_loss": -40.917755126953125, "global_step": 202580, "epoch": 1674} {"train_loss": -41.21773910522461, "global_step": 202581, "epoch": 1674} {"train_loss": -41.81044006347656, "global_step": 202582, "epoch": 1674} {"train_loss": -41.62338638305664, "global_step": 202583, "epoch": 1674} {"train_loss": -41.948707580566406, "global_step": 202584, "epoch": 1674} {"train_loss": -42.0395622253418, "global_step": 202585, "epoch": 1674} {"train_loss": -41.98434066772461, "global_step": 202586, "epoch": 1674} {"train_loss": -41.94257354736328, "global_step": 202587, "epoch": 1674} {"train_loss": -42.25185775756836, "global_step": 202588, "epoch": 1674} {"train_loss": -42.38210678100586, "global_step": 202589, "epoch": 1674} {"train_loss": -42.13778305053711, "global_step": 202590, "epoch": 1674} {"train_loss": -42.24077224731445, "global_step": 202591, "epoch": 1674} {"train_loss": -42.371456146240234, "global_step": 202592, "epoch": 1674} {"train_loss": -42.26721954345703, "global_step": 202593, "epoch": 1674} {"train_loss": -42.462623596191406, "global_step": 202594, "epoch": 1674} {"train_loss": -42.6624641418457, "global_step": 202595, "epoch": 1674} {"train_loss": -42.45626449584961, "global_step": 202596, "epoch": 1674} {"train_loss": -42.60014724731445, "global_step": 202597, "epoch": 1674} {"train_loss": -42.26636505126953, "global_step": 202598, "epoch": 1674} {"train_loss": -42.52034378051758, "global_step": 202599, "epoch": 1674} {"train_loss": -42.8028678894043, "global_step": 202600, "epoch": 1674} {"train_loss": -42.285560607910156, "global_step": 202601, "epoch": 1674} {"train_loss": -42.68425369262695, "global_step": 202602, "epoch": 1674} {"train_loss": -42.56999969482422, "global_step": 202603, "epoch": 1674} {"train_loss": -42.84601593017578, "global_step": 202604, "epoch": 1674} {"train_loss": -42.43111038208008, "global_step": 202605, "epoch": 1674} {"train_loss": -42.45684814453125, "global_step": 202606, "epoch": 1674} {"train_loss": -42.62423324584961, "global_step": 202607, "epoch": 1674} {"train_loss": -42.746826171875, "global_step": 202608, "epoch": 1674} {"train_loss": -43.039058685302734, "global_step": 202609, "epoch": 1674} {"train_loss": -42.56577682495117, "global_step": 202610, "epoch": 1674} {"train_loss": -43.074642181396484, "global_step": 202611, "epoch": 1674} {"train_loss": -42.929264068603516, "global_step": 202612, "epoch": 1674} {"train_loss": -42.657588958740234, "global_step": 202613, "epoch": 1674} {"train_loss": -42.97196578979492, "global_step": 202614, "epoch": 1674} {"train_loss": -42.84772872924805, "global_step": 202615, "epoch": 1674} {"train_loss": -43.336788177490234, "global_step": 202616, "epoch": 1674} {"train_loss": -42.43500518798828, "global_step": 202617, "epoch": 1674} {"train_loss": -42.73330307006836, "global_step": 202618, "epoch": 1674} {"train_loss": -43.55381774902344, "global_step": 202619, "epoch": 1674} {"train_loss": -42.672035217285156, "global_step": 202620, "epoch": 1674} {"train_loss": -42.92390060424805, "global_step": 202621, "epoch": 1674} {"train_loss": -43.19158172607422, "global_step": 202622, "epoch": 1674} {"train_loss": -42.8482780456543, "global_step": 202623, "epoch": 1674} {"train_loss": -43.192665100097656, "global_step": 202624, "epoch": 1674} {"train_loss": -42.30609130859375, "global_step": 202625, "epoch": 1674} {"train_loss": -42.25386428833008, "global_step": 202626, "epoch": 1674} {"train_loss": -43.32910919189453, "global_step": 202627, "epoch": 1674} {"train_loss": -42.66721725463867, "global_step": 202628, "epoch": 1674} {"train_loss": -42.53679275512695, "global_step": 202629, "epoch": 1674} {"train_loss": -42.26160430908203, "global_step": 202630, "epoch": 1674} {"train_loss": -42.54096603393555, "global_step": 202631, "epoch": 1674} {"train_loss": -42.972381591796875, "global_step": 202632, "epoch": 1674} {"train_loss": -41.61066818237305, "global_step": 202633, "epoch": 1674} {"train_loss": -39.61196517944336, "global_step": 202634, "epoch": 1674} {"train_loss": -40.119754791259766, "global_step": 202635, "epoch": 1674} {"train_loss": -41.32777786254883, "global_step": 202636, "epoch": 1674} {"train_loss": -40.885311126708984, "global_step": 202637, "epoch": 1674} {"train_loss": -39.1483268737793, "global_step": 202638, "epoch": 1674} {"train_loss": -41.9846305847168, "global_step": 202639, "epoch": 1674} {"train_loss": -42.76713943481445, "global_step": 202640, "epoch": 1674} {"train_loss": -40.28388595581055, "global_step": 202641, "epoch": 1674} {"train_loss": -39.81977081298828, "global_step": 202642, "epoch": 1674} {"train_loss": -41.94682693481445, "global_step": 202643, "epoch": 1674} {"train_loss": -42.2418327331543, "global_step": 202644, "epoch": 1674} {"train_loss": -40.190948486328125, "global_step": 202645, "epoch": 1674} {"train_loss": -42.1066780090332, "global_step": 202646, "epoch": 1674} {"train_loss": -41.55867385864258, "global_step": 202647, "epoch": 1674} {"train_loss": -41.0035514831543, "global_step": 202648, "epoch": 1674} {"train_loss": -40.77291488647461, "global_step": 202649, "epoch": 1674} {"train_loss": -39.99585723876953, "global_step": 202650, "epoch": 1674} {"train_loss": -40.27821350097656, "global_step": 202651, "epoch": 1674} {"train_loss": -40.65971755981445, "global_step": 202652, "epoch": 1674} {"train_loss": -41.39119338989258, "global_step": 202653, "epoch": 1674} {"train_loss": -40.99441146850586, "global_step": 202654, "epoch": 1674} {"train_loss": -40.77690505981445, "global_step": 202655, "epoch": 1674} {"train_loss": -40.46407699584961, "global_step": 202656, "epoch": 1674} {"train_loss": -39.38544845581055, "global_step": 202657, "epoch": 1674} {"train_loss": -40.994895935058594, "global_step": 202658, "epoch": 1674} {"train_loss": -41.81119918823242, "global_step": 202659, "epoch": 1674} {"train_loss": -40.356414794921875, "global_step": 202660, "epoch": 1674} {"train_loss": -40.41254425048828, "global_step": 202661, "epoch": 1674} {"train_loss": -40.52982711791992, "global_step": 202662, "epoch": 1674} {"train_loss": -40.137298583984375, "global_step": 202663, "epoch": 1674} {"train_loss": -38.38831329345703, "global_step": 202664, "epoch": 1674} {"train_loss": -37.52083969116211, "global_step": 202665, "epoch": 1674} {"train_loss": -38.99968719482422, "global_step": 202666, "epoch": 1674} {"train_loss": -41.232601165771484, "global_step": 202667, "epoch": 1674} {"train_loss": -41.26421356201172, "global_step": 202668, "epoch": 1674} {"train_loss": -40.61076736450195, "global_step": 202669, "epoch": 1674} {"train_loss": -41.7010498046875, "global_step": 202670, "epoch": 1674} {"train_loss": -42.253841400146484, "global_step": 202671, "epoch": 1674} {"train_loss": -41.6938591003418, "global_step": 202672, "epoch": 1674} {"train_loss": -41.8991584777832, "global_step": 202673, "epoch": 1674} {"train_loss": -41.37397315285423, "global_step": 202674, "epoch": 1674, "val_loss": 2573769.5} {"train_loss": -41.85395812988281, "global_step": 202675, "epoch": 1675} {"train_loss": -41.85598373413086, "global_step": 202676, "epoch": 1675} {"train_loss": -41.80025100708008, "global_step": 202677, "epoch": 1675} {"train_loss": -42.05292892456055, "global_step": 202678, "epoch": 1675} {"train_loss": -42.09657669067383, "global_step": 202679, "epoch": 1675} {"train_loss": -41.4901008605957, "global_step": 202680, "epoch": 1675} {"train_loss": -41.511356353759766, "global_step": 202681, "epoch": 1675} {"train_loss": -42.361915588378906, "global_step": 202682, "epoch": 1675} {"train_loss": -41.752254486083984, "global_step": 202683, "epoch": 1675} {"train_loss": -42.55394744873047, "global_step": 202684, "epoch": 1675} {"train_loss": -42.79491424560547, "global_step": 202685, "epoch": 1675} {"train_loss": -41.81385803222656, "global_step": 202686, "epoch": 1675} {"train_loss": -42.303199768066406, "global_step": 202687, "epoch": 1675} {"train_loss": -42.340576171875, "global_step": 202688, "epoch": 1675} {"train_loss": -41.74755859375, "global_step": 202689, "epoch": 1675} {"train_loss": -41.943626403808594, "global_step": 202690, "epoch": 1675} {"train_loss": -42.910675048828125, "global_step": 202691, "epoch": 1675} {"train_loss": -41.992637634277344, "global_step": 202692, "epoch": 1675} {"train_loss": -42.4957389831543, "global_step": 202693, "epoch": 1675} {"train_loss": -42.327816009521484, "global_step": 202694, "epoch": 1675} {"train_loss": -42.68745803833008, "global_step": 202695, "epoch": 1675} {"train_loss": -42.2260627746582, "global_step": 202696, "epoch": 1675} {"train_loss": -42.392974853515625, "global_step": 202697, "epoch": 1675} {"train_loss": -42.65313720703125, "global_step": 202698, "epoch": 1675} {"train_loss": -42.268917083740234, "global_step": 202699, "epoch": 1675} {"train_loss": -42.32180404663086, "global_step": 202700, "epoch": 1675} {"train_loss": -42.71559524536133, "global_step": 202701, "epoch": 1675} {"train_loss": -42.74216842651367, "global_step": 202702, "epoch": 1675} {"train_loss": -42.52004623413086, "global_step": 202703, "epoch": 1675} {"train_loss": -43.56441116333008, "global_step": 202704, "epoch": 1675} {"train_loss": -42.4942626953125, "global_step": 202705, "epoch": 1675} {"train_loss": -42.33956527709961, "global_step": 202706, "epoch": 1675} {"train_loss": -42.77524948120117, "global_step": 202707, "epoch": 1675} {"train_loss": -42.81402587890625, "global_step": 202708, "epoch": 1675} {"train_loss": -42.99494171142578, "global_step": 202709, "epoch": 1675} {"train_loss": -42.134525299072266, "global_step": 202710, "epoch": 1675} {"train_loss": -41.5748176574707, "global_step": 202711, "epoch": 1675} {"train_loss": -42.66786193847656, "global_step": 202712, "epoch": 1675} {"train_loss": -42.847896575927734, "global_step": 202713, "epoch": 1675} {"train_loss": -42.34314727783203, "global_step": 202714, "epoch": 1675} {"train_loss": -42.5810546875, "global_step": 202715, "epoch": 1675} {"train_loss": -42.628456115722656, "global_step": 202716, "epoch": 1675} {"train_loss": -42.97365188598633, "global_step": 202717, "epoch": 1675} {"train_loss": -42.57459259033203, "global_step": 202718, "epoch": 1675} {"train_loss": -41.9005126953125, "global_step": 202719, "epoch": 1675} {"train_loss": -40.556209564208984, "global_step": 202720, "epoch": 1675} {"train_loss": -39.24848556518555, "global_step": 202721, "epoch": 1675} {"train_loss": -41.04536056518555, "global_step": 202722, "epoch": 1675} {"train_loss": -42.41791915893555, "global_step": 202723, "epoch": 1675} {"train_loss": -41.962867736816406, "global_step": 202724, "epoch": 1675} {"train_loss": -41.158382415771484, "global_step": 202725, "epoch": 1675} {"train_loss": -42.083290100097656, "global_step": 202726, "epoch": 1675} {"train_loss": -42.5496826171875, "global_step": 202727, "epoch": 1675} {"train_loss": -41.575069427490234, "global_step": 202728, "epoch": 1675} {"train_loss": -40.05721664428711, "global_step": 202729, "epoch": 1675} {"train_loss": -41.681148529052734, "global_step": 202730, "epoch": 1675} {"train_loss": -41.9205436706543, "global_step": 202731, "epoch": 1675} {"train_loss": -41.35309982299805, "global_step": 202732, "epoch": 1675} {"train_loss": -41.33540344238281, "global_step": 202733, "epoch": 1675} {"train_loss": -42.29926300048828, "global_step": 202734, "epoch": 1675} {"train_loss": -42.41717529296875, "global_step": 202735, "epoch": 1675} {"train_loss": -41.52190399169922, "global_step": 202736, "epoch": 1675} {"train_loss": -42.91761016845703, "global_step": 202737, "epoch": 1675} {"train_loss": -42.90978240966797, "global_step": 202738, "epoch": 1675} {"train_loss": -42.058937072753906, "global_step": 202739, "epoch": 1675} {"train_loss": -43.0433464050293, "global_step": 202740, "epoch": 1675} {"train_loss": -42.416168212890625, "global_step": 202741, "epoch": 1675} {"train_loss": -42.038116455078125, "global_step": 202742, "epoch": 1675} {"train_loss": -42.47473907470703, "global_step": 202743, "epoch": 1675} {"train_loss": -42.797264099121094, "global_step": 202744, "epoch": 1675} {"train_loss": -41.73261642456055, "global_step": 202745, "epoch": 1675} {"train_loss": -40.44117736816406, "global_step": 202746, "epoch": 1675} {"train_loss": -39.779083251953125, "global_step": 202747, "epoch": 1675} {"train_loss": -42.019981384277344, "global_step": 202748, "epoch": 1675} {"train_loss": -41.316707611083984, "global_step": 202749, "epoch": 1675} {"train_loss": -40.3510856628418, "global_step": 202750, "epoch": 1675} {"train_loss": -41.03573226928711, "global_step": 202751, "epoch": 1675} {"train_loss": -40.642250061035156, "global_step": 202752, "epoch": 1675} {"train_loss": -41.796443939208984, "global_step": 202753, "epoch": 1675} {"train_loss": -42.532081604003906, "global_step": 202754, "epoch": 1675} {"train_loss": -42.180816650390625, "global_step": 202755, "epoch": 1675} {"train_loss": -41.63663864135742, "global_step": 202756, "epoch": 1675} {"train_loss": -42.32081985473633, "global_step": 202757, "epoch": 1675} {"train_loss": -42.344032287597656, "global_step": 202758, "epoch": 1675} {"train_loss": -41.983619689941406, "global_step": 202759, "epoch": 1675} {"train_loss": -42.638607025146484, "global_step": 202760, "epoch": 1675} {"train_loss": -42.61146545410156, "global_step": 202761, "epoch": 1675} {"train_loss": -42.26676559448242, "global_step": 202762, "epoch": 1675} {"train_loss": -42.683284759521484, "global_step": 202763, "epoch": 1675} {"train_loss": -42.390846252441406, "global_step": 202764, "epoch": 1675} {"train_loss": -42.89410400390625, "global_step": 202765, "epoch": 1675} {"train_loss": -42.670623779296875, "global_step": 202766, "epoch": 1675} {"train_loss": -42.84389114379883, "global_step": 202767, "epoch": 1675} {"train_loss": -43.24577713012695, "global_step": 202768, "epoch": 1675} {"train_loss": -42.663002014160156, "global_step": 202769, "epoch": 1675} {"train_loss": -42.335018157958984, "global_step": 202770, "epoch": 1675} {"train_loss": -42.43997573852539, "global_step": 202771, "epoch": 1675} {"train_loss": -42.99909210205078, "global_step": 202772, "epoch": 1675} {"train_loss": -42.6576042175293, "global_step": 202773, "epoch": 1675} {"train_loss": -41.5454216003418, "global_step": 202774, "epoch": 1675} {"train_loss": -40.99830627441406, "global_step": 202775, "epoch": 1675} {"train_loss": -41.79426193237305, "global_step": 202776, "epoch": 1675} {"train_loss": -43.077247619628906, "global_step": 202777, "epoch": 1675} {"train_loss": -43.042476654052734, "global_step": 202778, "epoch": 1675} {"train_loss": -42.509986877441406, "global_step": 202779, "epoch": 1675} {"train_loss": -42.05373001098633, "global_step": 202780, "epoch": 1675} {"train_loss": -43.0307731628418, "global_step": 202781, "epoch": 1675} {"train_loss": -42.994140625, "global_step": 202782, "epoch": 1675} {"train_loss": -43.137611389160156, "global_step": 202783, "epoch": 1675} {"train_loss": -42.905574798583984, "global_step": 202784, "epoch": 1675} {"train_loss": -42.46730041503906, "global_step": 202785, "epoch": 1675} {"train_loss": -42.96613311767578, "global_step": 202786, "epoch": 1675} {"train_loss": -42.678627014160156, "global_step": 202787, "epoch": 1675} {"train_loss": -42.88734817504883, "global_step": 202788, "epoch": 1675} {"train_loss": -43.36664962768555, "global_step": 202789, "epoch": 1675} {"train_loss": -42.922969818115234, "global_step": 202790, "epoch": 1675} {"train_loss": -41.724117279052734, "global_step": 202791, "epoch": 1675} {"train_loss": -37.395103454589844, "global_step": 202792, "epoch": 1675} {"train_loss": -40.809261322021484, "global_step": 202793, "epoch": 1675} {"train_loss": -42.17226028442383, "global_step": 202794, "epoch": 1675} {"train_loss": -42.13882717416306, "global_step": 202795, "epoch": 1675, "val_loss": 2545373.0} {"train_loss": -41.28420639038086, "global_step": 202796, "epoch": 1676} {"train_loss": -42.60505294799805, "global_step": 202797, "epoch": 1676} {"train_loss": -42.410858154296875, "global_step": 202798, "epoch": 1676} {"train_loss": -41.07374954223633, "global_step": 202799, "epoch": 1676} {"train_loss": -39.23514938354492, "global_step": 202800, "epoch": 1676} {"train_loss": -39.74387741088867, "global_step": 202801, "epoch": 1676} {"train_loss": -41.56803894042969, "global_step": 202802, "epoch": 1676} {"train_loss": -39.96844482421875, "global_step": 202803, "epoch": 1676} {"train_loss": -39.726375579833984, "global_step": 202804, "epoch": 1676} {"train_loss": -41.70346450805664, "global_step": 202805, "epoch": 1676} {"train_loss": -40.54422378540039, "global_step": 202806, "epoch": 1676} {"train_loss": -41.20673751831055, "global_step": 202807, "epoch": 1676} {"train_loss": -40.22073745727539, "global_step": 202808, "epoch": 1676} {"train_loss": -40.00330352783203, "global_step": 202809, "epoch": 1676} {"train_loss": -41.74955368041992, "global_step": 202810, "epoch": 1676} {"train_loss": -36.94582748413086, "global_step": 202811, "epoch": 1676} {"train_loss": -41.24500274658203, "global_step": 202812, "epoch": 1676} {"train_loss": -39.99763870239258, "global_step": 202813, "epoch": 1676} {"train_loss": -38.564208984375, "global_step": 202814, "epoch": 1676} {"train_loss": -40.03848648071289, "global_step": 202815, "epoch": 1676} {"train_loss": -39.30153274536133, "global_step": 202816, "epoch": 1676} {"train_loss": -39.146976470947266, "global_step": 202817, "epoch": 1676} {"train_loss": -37.2269287109375, "global_step": 202818, "epoch": 1676} {"train_loss": -41.85883712768555, "global_step": 202819, "epoch": 1676} {"train_loss": -39.03822708129883, "global_step": 202820, "epoch": 1676} {"train_loss": -38.79659652709961, "global_step": 202821, "epoch": 1676} {"train_loss": -38.40353012084961, "global_step": 202822, "epoch": 1676} {"train_loss": -40.5964469909668, "global_step": 202823, "epoch": 1676} {"train_loss": -39.720184326171875, "global_step": 202824, "epoch": 1676} {"train_loss": -40.69672775268555, "global_step": 202825, "epoch": 1676} {"train_loss": -38.778785705566406, "global_step": 202826, "epoch": 1676} {"train_loss": -41.830596923828125, "global_step": 202827, "epoch": 1676} {"train_loss": -39.68241500854492, "global_step": 202828, "epoch": 1676} {"train_loss": -41.88235092163086, "global_step": 202829, "epoch": 1676} {"train_loss": -40.4809684753418, "global_step": 202830, "epoch": 1676} {"train_loss": -41.98740005493164, "global_step": 202831, "epoch": 1676} {"train_loss": -41.1164665222168, "global_step": 202832, "epoch": 1676} {"train_loss": -41.57242202758789, "global_step": 202833, "epoch": 1676} {"train_loss": -41.52726364135742, "global_step": 202834, "epoch": 1676} {"train_loss": -41.853057861328125, "global_step": 202835, "epoch": 1676} {"train_loss": -41.81885528564453, "global_step": 202836, "epoch": 1676} {"train_loss": -41.43300247192383, "global_step": 202837, "epoch": 1676} {"train_loss": -42.00797653198242, "global_step": 202838, "epoch": 1676} {"train_loss": -41.404354095458984, "global_step": 202839, "epoch": 1676} {"train_loss": -41.894065856933594, "global_step": 202840, "epoch": 1676} {"train_loss": -41.873897552490234, "global_step": 202841, "epoch": 1676} {"train_loss": -41.780120849609375, "global_step": 202842, "epoch": 1676} {"train_loss": -41.76141357421875, "global_step": 202843, "epoch": 1676} {"train_loss": -41.83492660522461, "global_step": 202844, "epoch": 1676} {"train_loss": -42.361568450927734, "global_step": 202845, "epoch": 1676} {"train_loss": -41.63051986694336, "global_step": 202846, "epoch": 1676} {"train_loss": -42.17380905151367, "global_step": 202847, "epoch": 1676} {"train_loss": -41.86564254760742, "global_step": 202848, "epoch": 1676} {"train_loss": -42.30546188354492, "global_step": 202849, "epoch": 1676} {"train_loss": -42.59605407714844, "global_step": 202850, "epoch": 1676} {"train_loss": -42.10506820678711, "global_step": 202851, "epoch": 1676} {"train_loss": -42.41494369506836, "global_step": 202852, "epoch": 1676} {"train_loss": -42.19107437133789, "global_step": 202853, "epoch": 1676} {"train_loss": -40.870967864990234, "global_step": 202854, "epoch": 1676} {"train_loss": -41.47779083251953, "global_step": 202855, "epoch": 1676} {"train_loss": -42.1793327331543, "global_step": 202856, "epoch": 1676} {"train_loss": -42.19947052001953, "global_step": 202857, "epoch": 1676} {"train_loss": -42.53205490112305, "global_step": 202858, "epoch": 1676} {"train_loss": -42.09473419189453, "global_step": 202859, "epoch": 1676} {"train_loss": -42.360748291015625, "global_step": 202860, "epoch": 1676} {"train_loss": -42.33766555786133, "global_step": 202861, "epoch": 1676} {"train_loss": -42.71297073364258, "global_step": 202862, "epoch": 1676} {"train_loss": -42.74294662475586, "global_step": 202863, "epoch": 1676} {"train_loss": -42.19684600830078, "global_step": 202864, "epoch": 1676} {"train_loss": -42.350521087646484, "global_step": 202865, "epoch": 1676} {"train_loss": -43.02069854736328, "global_step": 202866, "epoch": 1676} {"train_loss": -42.38266372680664, "global_step": 202867, "epoch": 1676} {"train_loss": -41.46718215942383, "global_step": 202868, "epoch": 1676} {"train_loss": -42.83298873901367, "global_step": 202869, "epoch": 1676} {"train_loss": -42.618099212646484, "global_step": 202870, "epoch": 1676} {"train_loss": -41.767574310302734, "global_step": 202871, "epoch": 1676} {"train_loss": -41.95783233642578, "global_step": 202872, "epoch": 1676} {"train_loss": -41.85402297973633, "global_step": 202873, "epoch": 1676} {"train_loss": -40.394954681396484, "global_step": 202874, "epoch": 1676} {"train_loss": -39.32599639892578, "global_step": 202875, "epoch": 1676} {"train_loss": -38.6812858581543, "global_step": 202876, "epoch": 1676} {"train_loss": -37.622554779052734, "global_step": 202877, "epoch": 1676} {"train_loss": -42.165626525878906, "global_step": 202878, "epoch": 1676} {"train_loss": -39.61284255981445, "global_step": 202879, "epoch": 1676} {"train_loss": -34.46120071411133, "global_step": 202880, "epoch": 1676} {"train_loss": -33.6598014831543, "global_step": 202881, "epoch": 1676} {"train_loss": -41.599056243896484, "global_step": 202882, "epoch": 1676} {"train_loss": -29.819726943969727, "global_step": 202883, "epoch": 1676} {"train_loss": -25.45186424255371, "global_step": 202884, "epoch": 1676} {"train_loss": -39.48246383666992, "global_step": 202885, "epoch": 1676} {"train_loss": -38.13994598388672, "global_step": 202886, "epoch": 1676} {"train_loss": -37.62263870239258, "global_step": 202887, "epoch": 1676} {"train_loss": -39.18168640136719, "global_step": 202888, "epoch": 1676} {"train_loss": -39.57894515991211, "global_step": 202889, "epoch": 1676} {"train_loss": -34.53659439086914, "global_step": 202890, "epoch": 1676} {"train_loss": -39.34731674194336, "global_step": 202891, "epoch": 1676} {"train_loss": -39.17036056518555, "global_step": 202892, "epoch": 1676} {"train_loss": -40.33164978027344, "global_step": 202893, "epoch": 1676} {"train_loss": -38.55647659301758, "global_step": 202894, "epoch": 1676} {"train_loss": -40.041622161865234, "global_step": 202895, "epoch": 1676} {"train_loss": -40.832420349121094, "global_step": 202896, "epoch": 1676} {"train_loss": -40.36581039428711, "global_step": 202897, "epoch": 1676} {"train_loss": -39.09763717651367, "global_step": 202898, "epoch": 1676} {"train_loss": -39.50626754760742, "global_step": 202899, "epoch": 1676} {"train_loss": -36.43684768676758, "global_step": 202900, "epoch": 1676} {"train_loss": -40.62578582763672, "global_step": 202901, "epoch": 1676} {"train_loss": -40.971832275390625, "global_step": 202902, "epoch": 1676} {"train_loss": -39.74077606201172, "global_step": 202903, "epoch": 1676} {"train_loss": -40.81948471069336, "global_step": 202904, "epoch": 1676} {"train_loss": -38.727455139160156, "global_step": 202905, "epoch": 1676} {"train_loss": -41.16820526123047, "global_step": 202906, "epoch": 1676} {"train_loss": -39.00782012939453, "global_step": 202907, "epoch": 1676} {"train_loss": -39.829437255859375, "global_step": 202908, "epoch": 1676} {"train_loss": -38.932647705078125, "global_step": 202909, "epoch": 1676} {"train_loss": -39.671485900878906, "global_step": 202910, "epoch": 1676} {"train_loss": -40.73690414428711, "global_step": 202911, "epoch": 1676} {"train_loss": -40.75831985473633, "global_step": 202912, "epoch": 1676} {"train_loss": -39.052040100097656, "global_step": 202913, "epoch": 1676} {"train_loss": -40.70207214355469, "global_step": 202914, "epoch": 1676} {"train_loss": -40.8184814453125, "global_step": 202915, "epoch": 1676} {"train_loss": -40.309304481695506, "global_step": 202916, "epoch": 1676, "val_loss": 2656466.75} {"train_loss": -40.907344818115234, "global_step": 202917, "epoch": 1677} {"train_loss": -37.71455001831055, "global_step": 202918, "epoch": 1677} {"train_loss": -33.1567268371582, "global_step": 202919, "epoch": 1677} {"train_loss": -40.48617935180664, "global_step": 202920, "epoch": 1677} {"train_loss": -36.6449089050293, "global_step": 202921, "epoch": 1677} {"train_loss": -37.62971496582031, "global_step": 202922, "epoch": 1677} {"train_loss": -40.843021392822266, "global_step": 202923, "epoch": 1677} {"train_loss": -40.52359390258789, "global_step": 202924, "epoch": 1677} {"train_loss": -37.07632064819336, "global_step": 202925, "epoch": 1677} {"train_loss": -38.03084945678711, "global_step": 202926, "epoch": 1677} {"train_loss": -25.699926376342773, "global_step": 202927, "epoch": 1677} {"train_loss": -39.18937301635742, "global_step": 202928, "epoch": 1677} {"train_loss": -38.940120697021484, "global_step": 202929, "epoch": 1677} {"train_loss": -33.342010498046875, "global_step": 202930, "epoch": 1677} {"train_loss": -29.349393844604492, "global_step": 202931, "epoch": 1677} {"train_loss": -37.13758850097656, "global_step": 202932, "epoch": 1677} {"train_loss": -38.28028106689453, "global_step": 202933, "epoch": 1677} {"train_loss": -32.877010345458984, "global_step": 202934, "epoch": 1677} {"train_loss": -37.79592514038086, "global_step": 202935, "epoch": 1677} {"train_loss": -34.20454025268555, "global_step": 202936, "epoch": 1677} {"train_loss": -31.4708194732666, "global_step": 202937, "epoch": 1677} {"train_loss": -32.949642181396484, "global_step": 202938, "epoch": 1677} {"train_loss": -37.41550827026367, "global_step": 202939, "epoch": 1677} {"train_loss": -36.59164047241211, "global_step": 202940, "epoch": 1677} {"train_loss": -38.04138946533203, "global_step": 202941, "epoch": 1677} {"train_loss": -40.011287689208984, "global_step": 202942, "epoch": 1677} {"train_loss": -35.14402770996094, "global_step": 202943, "epoch": 1677} {"train_loss": -34.63700485229492, "global_step": 202944, "epoch": 1677} {"train_loss": -39.36128616333008, "global_step": 202945, "epoch": 1677} {"train_loss": -38.607452392578125, "global_step": 202946, "epoch": 1677} {"train_loss": -39.788246154785156, "global_step": 202947, "epoch": 1677} {"train_loss": -37.67646026611328, "global_step": 202948, "epoch": 1677} {"train_loss": -39.557315826416016, "global_step": 202949, "epoch": 1677} {"train_loss": -38.01642608642578, "global_step": 202950, "epoch": 1677} {"train_loss": -38.6286735534668, "global_step": 202951, "epoch": 1677} {"train_loss": -38.606361389160156, "global_step": 202952, "epoch": 1677} {"train_loss": -38.22760009765625, "global_step": 202953, "epoch": 1677} {"train_loss": -37.598602294921875, "global_step": 202954, "epoch": 1677} {"train_loss": -40.08955001831055, "global_step": 202955, "epoch": 1677} {"train_loss": -39.24448776245117, "global_step": 202956, "epoch": 1677} {"train_loss": -38.796504974365234, "global_step": 202957, "epoch": 1677} {"train_loss": -38.70588302612305, "global_step": 202958, "epoch": 1677} {"train_loss": -39.21477508544922, "global_step": 202959, "epoch": 1677} {"train_loss": -38.767086029052734, "global_step": 202960, "epoch": 1677} {"train_loss": -38.586212158203125, "global_step": 202961, "epoch": 1677} {"train_loss": -37.784908294677734, "global_step": 202962, "epoch": 1677} {"train_loss": -39.89801788330078, "global_step": 202963, "epoch": 1677} {"train_loss": -40.29811096191406, "global_step": 202964, "epoch": 1677} {"train_loss": -39.4968376159668, "global_step": 202965, "epoch": 1677} {"train_loss": -38.75067138671875, "global_step": 202966, "epoch": 1677} {"train_loss": -39.54841232299805, "global_step": 202967, "epoch": 1677} {"train_loss": -39.33266830444336, "global_step": 202968, "epoch": 1677} {"train_loss": -39.85496139526367, "global_step": 202969, "epoch": 1677} {"train_loss": -39.18622970581055, "global_step": 202970, "epoch": 1677} {"train_loss": -39.59087371826172, "global_step": 202971, "epoch": 1677} {"train_loss": -40.28190231323242, "global_step": 202972, "epoch": 1677} {"train_loss": -40.60560607910156, "global_step": 202973, "epoch": 1677} {"train_loss": -40.83926010131836, "global_step": 202974, "epoch": 1677} {"train_loss": -40.53473663330078, "global_step": 202975, "epoch": 1677} {"train_loss": -39.5720100402832, "global_step": 202976, "epoch": 1677} {"train_loss": -40.0997200012207, "global_step": 202977, "epoch": 1677} {"train_loss": -39.00996780395508, "global_step": 202978, "epoch": 1677} {"train_loss": -40.45161056518555, "global_step": 202979, "epoch": 1677} {"train_loss": -40.24880599975586, "global_step": 202980, "epoch": 1677} {"train_loss": -40.40047073364258, "global_step": 202981, "epoch": 1677} {"train_loss": -40.360267639160156, "global_step": 202982, "epoch": 1677} {"train_loss": -40.37553024291992, "global_step": 202983, "epoch": 1677} {"train_loss": -40.818599700927734, "global_step": 202984, "epoch": 1677} {"train_loss": -40.31135940551758, "global_step": 202985, "epoch": 1677} {"train_loss": -40.72393798828125, "global_step": 202986, "epoch": 1677} {"train_loss": -40.79627227783203, "global_step": 202987, "epoch": 1677} {"train_loss": -40.894588470458984, "global_step": 202988, "epoch": 1677} {"train_loss": -40.047237396240234, "global_step": 202989, "epoch": 1677} {"train_loss": -39.48897171020508, "global_step": 202990, "epoch": 1677} {"train_loss": -40.08829879760742, "global_step": 202991, "epoch": 1677} {"train_loss": -40.80955123901367, "global_step": 202992, "epoch": 1677} {"train_loss": -40.404842376708984, "global_step": 202993, "epoch": 1677} {"train_loss": -40.62807846069336, "global_step": 202994, "epoch": 1677} {"train_loss": -41.16017532348633, "global_step": 202995, "epoch": 1677} {"train_loss": -41.12620162963867, "global_step": 202996, "epoch": 1677} {"train_loss": -41.09977340698242, "global_step": 202997, "epoch": 1677} {"train_loss": -41.185699462890625, "global_step": 202998, "epoch": 1677} {"train_loss": -40.63788604736328, "global_step": 202999, "epoch": 1677} {"train_loss": -40.27368927001953, "global_step": 203000, "epoch": 1677} {"train_loss": -41.76390075683594, "global_step": 203001, "epoch": 1677} {"train_loss": -41.420379638671875, "global_step": 203002, "epoch": 1677} {"train_loss": -41.613277435302734, "global_step": 203003, "epoch": 1677} {"train_loss": -41.18128204345703, "global_step": 203004, "epoch": 1677} {"train_loss": -41.281005859375, "global_step": 203005, "epoch": 1677} {"train_loss": -41.58515548706055, "global_step": 203006, "epoch": 1677} {"train_loss": -41.31324768066406, "global_step": 203007, "epoch": 1677} {"train_loss": -41.37844467163086, "global_step": 203008, "epoch": 1677} {"train_loss": -41.87240219116211, "global_step": 203009, "epoch": 1677} {"train_loss": -40.57400131225586, "global_step": 203010, "epoch": 1677} {"train_loss": -41.862579345703125, "global_step": 203011, "epoch": 1677} {"train_loss": -41.49298858642578, "global_step": 203012, "epoch": 1677} {"train_loss": -41.66748809814453, "global_step": 203013, "epoch": 1677} {"train_loss": -41.24123001098633, "global_step": 203014, "epoch": 1677} {"train_loss": -41.32326126098633, "global_step": 203015, "epoch": 1677} {"train_loss": -41.32603073120117, "global_step": 203016, "epoch": 1677} {"train_loss": -41.75094223022461, "global_step": 203017, "epoch": 1677} {"train_loss": -41.8179817199707, "global_step": 203018, "epoch": 1677} {"train_loss": -40.84825897216797, "global_step": 203019, "epoch": 1677} {"train_loss": -41.41197204589844, "global_step": 203020, "epoch": 1677} {"train_loss": -42.543251037597656, "global_step": 203021, "epoch": 1677} {"train_loss": -41.443641662597656, "global_step": 203022, "epoch": 1677} {"train_loss": -41.373023986816406, "global_step": 203023, "epoch": 1677} {"train_loss": -42.0195426940918, "global_step": 203024, "epoch": 1677} {"train_loss": -41.81093215942383, "global_step": 203025, "epoch": 1677} {"train_loss": -41.43267822265625, "global_step": 203026, "epoch": 1677} {"train_loss": -41.69103240966797, "global_step": 203027, "epoch": 1677} {"train_loss": -42.21148681640625, "global_step": 203028, "epoch": 1677} {"train_loss": -41.77427291870117, "global_step": 203029, "epoch": 1677} {"train_loss": -42.237613677978516, "global_step": 203030, "epoch": 1677} {"train_loss": -42.2618408203125, "global_step": 203031, "epoch": 1677} {"train_loss": -41.329833984375, "global_step": 203032, "epoch": 1677} {"train_loss": -42.43071746826172, "global_step": 203033, "epoch": 1677} {"train_loss": -41.744876861572266, "global_step": 203034, "epoch": 1677} {"train_loss": -42.017452239990234, "global_step": 203035, "epoch": 1677} {"train_loss": -41.960811614990234, "global_step": 203036, "epoch": 1677} {"train_loss": -39.5303246837017, "global_step": 203037, "epoch": 1677, "val_loss": 2576932.75} {"train_loss": -42.10432052612305, "global_step": 203038, "epoch": 1678} {"train_loss": -42.48493576049805, "global_step": 203039, "epoch": 1678} {"train_loss": -41.99024200439453, "global_step": 203040, "epoch": 1678} {"train_loss": -42.29941940307617, "global_step": 203041, "epoch": 1678} {"train_loss": -41.022254943847656, "global_step": 203042, "epoch": 1678} {"train_loss": -41.15887451171875, "global_step": 203043, "epoch": 1678} {"train_loss": -41.36082077026367, "global_step": 203044, "epoch": 1678} {"train_loss": -42.44919967651367, "global_step": 203045, "epoch": 1678} {"train_loss": -33.800777435302734, "global_step": 203046, "epoch": 1678} {"train_loss": -39.18731689453125, "global_step": 203047, "epoch": 1678} {"train_loss": -41.32822799682617, "global_step": 203048, "epoch": 1678} {"train_loss": -40.948551177978516, "global_step": 203049, "epoch": 1678} {"train_loss": -40.97819137573242, "global_step": 203050, "epoch": 1678} {"train_loss": -40.69791793823242, "global_step": 203051, "epoch": 1678} {"train_loss": -39.556854248046875, "global_step": 203052, "epoch": 1678} {"train_loss": -39.32451248168945, "global_step": 203053, "epoch": 1678} {"train_loss": -38.65252685546875, "global_step": 203054, "epoch": 1678} {"train_loss": -39.140655517578125, "global_step": 203055, "epoch": 1678} {"train_loss": -40.623653411865234, "global_step": 203056, "epoch": 1678} {"train_loss": -38.85337448120117, "global_step": 203057, "epoch": 1678} {"train_loss": -34.91331100463867, "global_step": 203058, "epoch": 1678} {"train_loss": -37.83373260498047, "global_step": 203059, "epoch": 1678} {"train_loss": -40.74276351928711, "global_step": 203060, "epoch": 1678} {"train_loss": -38.306495666503906, "global_step": 203061, "epoch": 1678} {"train_loss": -37.360233306884766, "global_step": 203062, "epoch": 1678} {"train_loss": -39.971046447753906, "global_step": 203063, "epoch": 1678} {"train_loss": -39.93662643432617, "global_step": 203064, "epoch": 1678} {"train_loss": -37.53534698486328, "global_step": 203065, "epoch": 1678} {"train_loss": -39.25312042236328, "global_step": 203066, "epoch": 1678} {"train_loss": -39.2088737487793, "global_step": 203067, "epoch": 1678} {"train_loss": -38.688446044921875, "global_step": 203068, "epoch": 1678} {"train_loss": -39.51797103881836, "global_step": 203069, "epoch": 1678} {"train_loss": -39.442626953125, "global_step": 203070, "epoch": 1678} {"train_loss": -38.53119659423828, "global_step": 203071, "epoch": 1678} {"train_loss": -40.6814079284668, "global_step": 203072, "epoch": 1678} {"train_loss": -40.075496673583984, "global_step": 203073, "epoch": 1678} {"train_loss": -40.464820861816406, "global_step": 203074, "epoch": 1678} {"train_loss": -40.48505783081055, "global_step": 203075, "epoch": 1678} {"train_loss": -41.178802490234375, "global_step": 203076, "epoch": 1678} {"train_loss": -41.0893669128418, "global_step": 203077, "epoch": 1678} {"train_loss": -40.16624069213867, "global_step": 203078, "epoch": 1678} {"train_loss": -41.0291862487793, "global_step": 203079, "epoch": 1678} {"train_loss": -41.471004486083984, "global_step": 203080, "epoch": 1678} {"train_loss": -40.76168441772461, "global_step": 203081, "epoch": 1678} {"train_loss": -40.83487319946289, "global_step": 203082, "epoch": 1678} {"train_loss": -41.447757720947266, "global_step": 203083, "epoch": 1678} {"train_loss": -40.40688705444336, "global_step": 203084, "epoch": 1678} {"train_loss": -41.8343391418457, "global_step": 203085, "epoch": 1678} {"train_loss": -40.815589904785156, "global_step": 203086, "epoch": 1678} {"train_loss": -40.4754753112793, "global_step": 203087, "epoch": 1678} {"train_loss": -41.930938720703125, "global_step": 203088, "epoch": 1678} {"train_loss": -40.8244743347168, "global_step": 203089, "epoch": 1678} {"train_loss": -40.814876556396484, "global_step": 203090, "epoch": 1678} {"train_loss": -41.60255813598633, "global_step": 203091, "epoch": 1678} {"train_loss": -41.24223327636719, "global_step": 203092, "epoch": 1678} {"train_loss": -40.75636672973633, "global_step": 203093, "epoch": 1678} {"train_loss": -41.12478256225586, "global_step": 203094, "epoch": 1678} {"train_loss": -41.532352447509766, "global_step": 203095, "epoch": 1678} {"train_loss": -42.207923889160156, "global_step": 203096, "epoch": 1678} {"train_loss": -41.901546478271484, "global_step": 203097, "epoch": 1678} {"train_loss": -41.07203674316406, "global_step": 203098, "epoch": 1678} {"train_loss": -41.750404357910156, "global_step": 203099, "epoch": 1678} {"train_loss": -41.66584014892578, "global_step": 203100, "epoch": 1678} {"train_loss": -41.40276336669922, "global_step": 203101, "epoch": 1678} {"train_loss": -41.83486557006836, "global_step": 203102, "epoch": 1678} {"train_loss": -41.28372573852539, "global_step": 203103, "epoch": 1678} {"train_loss": -42.0258903503418, "global_step": 203104, "epoch": 1678} {"train_loss": -42.0713996887207, "global_step": 203105, "epoch": 1678} {"train_loss": -41.83816146850586, "global_step": 203106, "epoch": 1678} {"train_loss": -42.50912857055664, "global_step": 203107, "epoch": 1678} {"train_loss": -41.688053131103516, "global_step": 203108, "epoch": 1678} {"train_loss": -42.226470947265625, "global_step": 203109, "epoch": 1678} {"train_loss": -41.962799072265625, "global_step": 203110, "epoch": 1678} {"train_loss": -42.079139709472656, "global_step": 203111, "epoch": 1678} {"train_loss": -41.05937957763672, "global_step": 203112, "epoch": 1678} {"train_loss": -42.053321838378906, "global_step": 203113, "epoch": 1678} {"train_loss": -42.320960998535156, "global_step": 203114, "epoch": 1678} {"train_loss": -41.9645881652832, "global_step": 203115, "epoch": 1678} {"train_loss": -42.043636322021484, "global_step": 203116, "epoch": 1678} {"train_loss": -42.50528335571289, "global_step": 203117, "epoch": 1678} {"train_loss": -42.4200439453125, "global_step": 203118, "epoch": 1678} {"train_loss": -41.82686996459961, "global_step": 203119, "epoch": 1678} {"train_loss": -42.122474670410156, "global_step": 203120, "epoch": 1678} {"train_loss": -41.82935333251953, "global_step": 203121, "epoch": 1678} {"train_loss": -42.466304779052734, "global_step": 203122, "epoch": 1678} {"train_loss": -42.08076095581055, "global_step": 203123, "epoch": 1678} {"train_loss": -41.68088912963867, "global_step": 203124, "epoch": 1678} {"train_loss": -41.17423629760742, "global_step": 203125, "epoch": 1678} {"train_loss": -41.1754035949707, "global_step": 203126, "epoch": 1678} {"train_loss": -42.42548370361328, "global_step": 203127, "epoch": 1678} {"train_loss": -41.7900390625, "global_step": 203128, "epoch": 1678} {"train_loss": -41.96230697631836, "global_step": 203129, "epoch": 1678} {"train_loss": -42.2446174621582, "global_step": 203130, "epoch": 1678} {"train_loss": -41.31394958496094, "global_step": 203131, "epoch": 1678} {"train_loss": -42.099403381347656, "global_step": 203132, "epoch": 1678} {"train_loss": -42.61396026611328, "global_step": 203133, "epoch": 1678} {"train_loss": -42.01510238647461, "global_step": 203134, "epoch": 1678} {"train_loss": -42.63135528564453, "global_step": 203135, "epoch": 1678} {"train_loss": -41.184085845947266, "global_step": 203136, "epoch": 1678} {"train_loss": -41.429073333740234, "global_step": 203137, "epoch": 1678} {"train_loss": -42.14290237426758, "global_step": 203138, "epoch": 1678} {"train_loss": -42.027984619140625, "global_step": 203139, "epoch": 1678} {"train_loss": -42.62494659423828, "global_step": 203140, "epoch": 1678} {"train_loss": -41.37312316894531, "global_step": 203141, "epoch": 1678} {"train_loss": -41.69938659667969, "global_step": 203142, "epoch": 1678} {"train_loss": -42.122310638427734, "global_step": 203143, "epoch": 1678} {"train_loss": -41.985137939453125, "global_step": 203144, "epoch": 1678} {"train_loss": -42.579524993896484, "global_step": 203145, "epoch": 1678} {"train_loss": -42.283233642578125, "global_step": 203146, "epoch": 1678} {"train_loss": -42.69306182861328, "global_step": 203147, "epoch": 1678} {"train_loss": -42.277587890625, "global_step": 203148, "epoch": 1678} {"train_loss": -42.86167526245117, "global_step": 203149, "epoch": 1678} {"train_loss": -41.24726867675781, "global_step": 203150, "epoch": 1678} {"train_loss": -42.10435104370117, "global_step": 203151, "epoch": 1678} {"train_loss": -42.444637298583984, "global_step": 203152, "epoch": 1678} {"train_loss": -42.703975677490234, "global_step": 203153, "epoch": 1678} {"train_loss": -42.889930725097656, "global_step": 203154, "epoch": 1678} {"train_loss": -41.820552825927734, "global_step": 203155, "epoch": 1678} {"train_loss": -42.616085052490234, "global_step": 203156, "epoch": 1678} {"train_loss": -42.1136360168457, "global_step": 203157, "epoch": 1678} {"train_loss": -41.14781267780903, "global_step": 203158, "epoch": 1678, "val_loss": 2632332.75} {"train_loss": -41.779598236083984, "global_step": 203159, "epoch": 1679} {"train_loss": -41.979156494140625, "global_step": 203160, "epoch": 1679} {"train_loss": -42.68549346923828, "global_step": 203161, "epoch": 1679} {"train_loss": -41.16801834106445, "global_step": 203162, "epoch": 1679} {"train_loss": -41.56525421142578, "global_step": 203163, "epoch": 1679} {"train_loss": -41.74922180175781, "global_step": 203164, "epoch": 1679} {"train_loss": -42.20652770996094, "global_step": 203165, "epoch": 1679} {"train_loss": -41.313133239746094, "global_step": 203166, "epoch": 1679} {"train_loss": -40.33514404296875, "global_step": 203167, "epoch": 1679} {"train_loss": -41.6484489440918, "global_step": 203168, "epoch": 1679} {"train_loss": -40.81192398071289, "global_step": 203169, "epoch": 1679} {"train_loss": -40.63242721557617, "global_step": 203170, "epoch": 1679} {"train_loss": -41.48580551147461, "global_step": 203171, "epoch": 1679} {"train_loss": -40.57124710083008, "global_step": 203172, "epoch": 1679} {"train_loss": -38.05532455444336, "global_step": 203173, "epoch": 1679} {"train_loss": -36.69329071044922, "global_step": 203174, "epoch": 1679} {"train_loss": -36.96876907348633, "global_step": 203175, "epoch": 1679} {"train_loss": -39.35087585449219, "global_step": 203176, "epoch": 1679} {"train_loss": -41.70579528808594, "global_step": 203177, "epoch": 1679} {"train_loss": -41.004859924316406, "global_step": 203178, "epoch": 1679} {"train_loss": -41.1993522644043, "global_step": 203179, "epoch": 1679} {"train_loss": -41.298526763916016, "global_step": 203180, "epoch": 1679} {"train_loss": -40.89680862426758, "global_step": 203181, "epoch": 1679} {"train_loss": -40.51495361328125, "global_step": 203182, "epoch": 1679} {"train_loss": -41.89674758911133, "global_step": 203183, "epoch": 1679} {"train_loss": -40.67658615112305, "global_step": 203184, "epoch": 1679} {"train_loss": -40.6344108581543, "global_step": 203185, "epoch": 1679} {"train_loss": -41.74029541015625, "global_step": 203186, "epoch": 1679} {"train_loss": -40.85148239135742, "global_step": 203187, "epoch": 1679} {"train_loss": -41.6907958984375, "global_step": 203188, "epoch": 1679} {"train_loss": -40.692047119140625, "global_step": 203189, "epoch": 1679} {"train_loss": -41.7346076965332, "global_step": 203190, "epoch": 1679} {"train_loss": -41.17520523071289, "global_step": 203191, "epoch": 1679} {"train_loss": -41.21137237548828, "global_step": 203192, "epoch": 1679} {"train_loss": -41.02165222167969, "global_step": 203193, "epoch": 1679} {"train_loss": -40.96900177001953, "global_step": 203194, "epoch": 1679} {"train_loss": -41.80501174926758, "global_step": 203195, "epoch": 1679} {"train_loss": -40.914852142333984, "global_step": 203196, "epoch": 1679} {"train_loss": -41.81013488769531, "global_step": 203197, "epoch": 1679} {"train_loss": -41.156192779541016, "global_step": 203198, "epoch": 1679} {"train_loss": -41.954498291015625, "global_step": 203199, "epoch": 1679} {"train_loss": -41.501834869384766, "global_step": 203200, "epoch": 1679} {"train_loss": -42.06288528442383, "global_step": 203201, "epoch": 1679} {"train_loss": -42.139869689941406, "global_step": 203202, "epoch": 1679} {"train_loss": -41.877620697021484, "global_step": 203203, "epoch": 1679} {"train_loss": -42.028160095214844, "global_step": 203204, "epoch": 1679} {"train_loss": -41.87197494506836, "global_step": 203205, "epoch": 1679} {"train_loss": -41.80562973022461, "global_step": 203206, "epoch": 1679} {"train_loss": -42.28644943237305, "global_step": 203207, "epoch": 1679} {"train_loss": -42.42481994628906, "global_step": 203208, "epoch": 1679} {"train_loss": -40.38843536376953, "global_step": 203209, "epoch": 1679} {"train_loss": -42.38485336303711, "global_step": 203210, "epoch": 1679} {"train_loss": -40.581275939941406, "global_step": 203211, "epoch": 1679} {"train_loss": -42.36491394042969, "global_step": 203212, "epoch": 1679} {"train_loss": -42.0726432800293, "global_step": 203213, "epoch": 1679} {"train_loss": -41.86233901977539, "global_step": 203214, "epoch": 1679} {"train_loss": -41.84625244140625, "global_step": 203215, "epoch": 1679} {"train_loss": -41.76057815551758, "global_step": 203216, "epoch": 1679} {"train_loss": -38.99799728393555, "global_step": 203217, "epoch": 1679} {"train_loss": -39.54671859741211, "global_step": 203218, "epoch": 1679} {"train_loss": -41.329986572265625, "global_step": 203219, "epoch": 1679} {"train_loss": -39.054439544677734, "global_step": 203220, "epoch": 1679} {"train_loss": -40.88819122314453, "global_step": 203221, "epoch": 1679} {"train_loss": -40.59010696411133, "global_step": 203222, "epoch": 1679} {"train_loss": -39.606929779052734, "global_step": 203223, "epoch": 1679} {"train_loss": -39.49738311767578, "global_step": 203224, "epoch": 1679} {"train_loss": -39.79473876953125, "global_step": 203225, "epoch": 1679} {"train_loss": -40.278621673583984, "global_step": 203226, "epoch": 1679} {"train_loss": -40.77111053466797, "global_step": 203227, "epoch": 1679} {"train_loss": -40.7474365234375, "global_step": 203228, "epoch": 1679} {"train_loss": -41.326683044433594, "global_step": 203229, "epoch": 1679} {"train_loss": -41.008121490478516, "global_step": 203230, "epoch": 1679} {"train_loss": -41.281471252441406, "global_step": 203231, "epoch": 1679} {"train_loss": -41.484222412109375, "global_step": 203232, "epoch": 1679} {"train_loss": -41.96232604980469, "global_step": 203233, "epoch": 1679} {"train_loss": -41.025081634521484, "global_step": 203234, "epoch": 1679} {"train_loss": -42.278926849365234, "global_step": 203235, "epoch": 1679} {"train_loss": -40.97249221801758, "global_step": 203236, "epoch": 1679} {"train_loss": -42.25950241088867, "global_step": 203237, "epoch": 1679} {"train_loss": -40.551795959472656, "global_step": 203238, "epoch": 1679} {"train_loss": -41.95441818237305, "global_step": 203239, "epoch": 1679} {"train_loss": -40.89524459838867, "global_step": 203240, "epoch": 1679} {"train_loss": -40.7619743347168, "global_step": 203241, "epoch": 1679} {"train_loss": -41.681671142578125, "global_step": 203242, "epoch": 1679} {"train_loss": -42.22618103027344, "global_step": 203243, "epoch": 1679} {"train_loss": -40.96077346801758, "global_step": 203244, "epoch": 1679} {"train_loss": -40.416419982910156, "global_step": 203245, "epoch": 1679} {"train_loss": -40.610713958740234, "global_step": 203246, "epoch": 1679} {"train_loss": -42.2896728515625, "global_step": 203247, "epoch": 1679} {"train_loss": -41.702327728271484, "global_step": 203248, "epoch": 1679} {"train_loss": -41.72141647338867, "global_step": 203249, "epoch": 1679} {"train_loss": -40.47565841674805, "global_step": 203250, "epoch": 1679} {"train_loss": -42.16585922241211, "global_step": 203251, "epoch": 1679} {"train_loss": -41.9011116027832, "global_step": 203252, "epoch": 1679} {"train_loss": -41.8192138671875, "global_step": 203253, "epoch": 1679} {"train_loss": -41.76884078979492, "global_step": 203254, "epoch": 1679} {"train_loss": -41.74402618408203, "global_step": 203255, "epoch": 1679} {"train_loss": -42.24541473388672, "global_step": 203256, "epoch": 1679} {"train_loss": -41.61747360229492, "global_step": 203257, "epoch": 1679} {"train_loss": -41.67862319946289, "global_step": 203258, "epoch": 1679} {"train_loss": -41.86527633666992, "global_step": 203259, "epoch": 1679} {"train_loss": -42.02683639526367, "global_step": 203260, "epoch": 1679} {"train_loss": -41.65481948852539, "global_step": 203261, "epoch": 1679} {"train_loss": -41.78925704956055, "global_step": 203262, "epoch": 1679} {"train_loss": -42.01395797729492, "global_step": 203263, "epoch": 1679} {"train_loss": -40.74121856689453, "global_step": 203264, "epoch": 1679} {"train_loss": -41.01408004760742, "global_step": 203265, "epoch": 1679} {"train_loss": -42.0971565246582, "global_step": 203266, "epoch": 1679} {"train_loss": -42.261314392089844, "global_step": 203267, "epoch": 1679} {"train_loss": -42.44009017944336, "global_step": 203268, "epoch": 1679} {"train_loss": -41.93619918823242, "global_step": 203269, "epoch": 1679} {"train_loss": -40.69190216064453, "global_step": 203270, "epoch": 1679} {"train_loss": -42.57947540283203, "global_step": 203271, "epoch": 1679} {"train_loss": -41.53825759887695, "global_step": 203272, "epoch": 1679} {"train_loss": -42.7217903137207, "global_step": 203273, "epoch": 1679} {"train_loss": -42.18359375, "global_step": 203274, "epoch": 1679} {"train_loss": -40.43086624145508, "global_step": 203275, "epoch": 1679} {"train_loss": -41.56574249267578, "global_step": 203276, "epoch": 1679} {"train_loss": -41.647212982177734, "global_step": 203277, "epoch": 1679} {"train_loss": -41.25360870361328, "global_step": 203278, "epoch": 1679} {"train_loss": -41.242858161611004, "global_step": 203279, "epoch": 1679, "val_loss": 2551818.0} {"train_loss": -42.285945892333984, "global_step": 203280, "epoch": 1680} {"train_loss": -42.261817932128906, "global_step": 203281, "epoch": 1680} {"train_loss": -42.14636993408203, "global_step": 203282, "epoch": 1680} {"train_loss": -41.954776763916016, "global_step": 203283, "epoch": 1680} {"train_loss": -40.964752197265625, "global_step": 203284, "epoch": 1680} {"train_loss": -42.055110931396484, "global_step": 203285, "epoch": 1680} {"train_loss": -42.34262466430664, "global_step": 203286, "epoch": 1680} {"train_loss": -41.658931732177734, "global_step": 203287, "epoch": 1680} {"train_loss": -40.28180694580078, "global_step": 203288, "epoch": 1680} {"train_loss": -42.032814025878906, "global_step": 203289, "epoch": 1680} {"train_loss": -41.283695220947266, "global_step": 203290, "epoch": 1680} {"train_loss": -41.04269027709961, "global_step": 203291, "epoch": 1680} {"train_loss": -42.522789001464844, "global_step": 203292, "epoch": 1680} {"train_loss": -41.318233489990234, "global_step": 203293, "epoch": 1680} {"train_loss": -39.251953125, "global_step": 203294, "epoch": 1680} {"train_loss": -38.629547119140625, "global_step": 203295, "epoch": 1680} {"train_loss": -42.39187240600586, "global_step": 203296, "epoch": 1680} {"train_loss": -41.07003402709961, "global_step": 203297, "epoch": 1680} {"train_loss": -37.17546081542969, "global_step": 203298, "epoch": 1680} {"train_loss": -40.03773880004883, "global_step": 203299, "epoch": 1680} {"train_loss": -40.59678268432617, "global_step": 203300, "epoch": 1680} {"train_loss": -37.870460510253906, "global_step": 203301, "epoch": 1680} {"train_loss": -35.028316497802734, "global_step": 203302, "epoch": 1680} {"train_loss": -40.16962814331055, "global_step": 203303, "epoch": 1680} {"train_loss": -39.95880126953125, "global_step": 203304, "epoch": 1680} {"train_loss": -30.777875900268555, "global_step": 203305, "epoch": 1680} {"train_loss": -31.607458114624023, "global_step": 203306, "epoch": 1680} {"train_loss": -32.38328170776367, "global_step": 203307, "epoch": 1680} {"train_loss": -37.75041580200195, "global_step": 203308, "epoch": 1680} {"train_loss": -36.09590530395508, "global_step": 203309, "epoch": 1680} {"train_loss": -26.830472946166992, "global_step": 203310, "epoch": 1680} {"train_loss": -32.451202392578125, "global_step": 203311, "epoch": 1680} {"train_loss": -34.022701263427734, "global_step": 203312, "epoch": 1680} {"train_loss": -19.159893035888672, "global_step": 203313, "epoch": 1680} {"train_loss": -32.72115707397461, "global_step": 203314, "epoch": 1680} {"train_loss": -36.40705490112305, "global_step": 203315, "epoch": 1680} {"train_loss": -23.863061904907227, "global_step": 203316, "epoch": 1680} {"train_loss": -33.662845611572266, "global_step": 203317, "epoch": 1680} {"train_loss": -31.659591674804688, "global_step": 203318, "epoch": 1680} {"train_loss": -31.418012619018555, "global_step": 203319, "epoch": 1680} {"train_loss": -31.241132736206055, "global_step": 203320, "epoch": 1680} {"train_loss": -18.70063591003418, "global_step": 203321, "epoch": 1680} {"train_loss": -31.193531036376953, "global_step": 203322, "epoch": 1680} {"train_loss": -30.509052276611328, "global_step": 203323, "epoch": 1680} {"train_loss": -31.851171493530273, "global_step": 203324, "epoch": 1680} {"train_loss": -35.247642517089844, "global_step": 203325, "epoch": 1680} {"train_loss": -32.59355545043945, "global_step": 203326, "epoch": 1680} {"train_loss": -26.98862648010254, "global_step": 203327, "epoch": 1680} {"train_loss": -31.24500846862793, "global_step": 203328, "epoch": 1680} {"train_loss": -32.99451446533203, "global_step": 203329, "epoch": 1680} {"train_loss": -35.719173431396484, "global_step": 203330, "epoch": 1680} {"train_loss": -34.69887161254883, "global_step": 203331, "epoch": 1680} {"train_loss": -35.49477005004883, "global_step": 203332, "epoch": 1680} {"train_loss": -34.92489242553711, "global_step": 203333, "epoch": 1680} {"train_loss": -34.625701904296875, "global_step": 203334, "epoch": 1680} {"train_loss": -35.184120178222656, "global_step": 203335, "epoch": 1680} {"train_loss": -36.02140426635742, "global_step": 203336, "epoch": 1680} {"train_loss": -35.013221740722656, "global_step": 203337, "epoch": 1680} {"train_loss": -36.175296783447266, "global_step": 203338, "epoch": 1680} {"train_loss": -35.3719596862793, "global_step": 203339, "epoch": 1680} {"train_loss": -37.043148040771484, "global_step": 203340, "epoch": 1680} {"train_loss": -36.33393478393555, "global_step": 203341, "epoch": 1680} {"train_loss": -36.81785202026367, "global_step": 203342, "epoch": 1680} {"train_loss": -37.40594482421875, "global_step": 203343, "epoch": 1680} {"train_loss": -37.86019515991211, "global_step": 203344, "epoch": 1680} {"train_loss": -36.76198959350586, "global_step": 203345, "epoch": 1680} {"train_loss": -37.98255157470703, "global_step": 203346, "epoch": 1680} {"train_loss": -36.59322738647461, "global_step": 203347, "epoch": 1680} {"train_loss": -37.6986083984375, "global_step": 203348, "epoch": 1680} {"train_loss": -37.7773551940918, "global_step": 203349, "epoch": 1680} {"train_loss": -36.43657302856445, "global_step": 203350, "epoch": 1680} {"train_loss": -37.91938400268555, "global_step": 203351, "epoch": 1680} {"train_loss": -37.5504264831543, "global_step": 203352, "epoch": 1680} {"train_loss": -36.69794845581055, "global_step": 203353, "epoch": 1680} {"train_loss": -37.457881927490234, "global_step": 203354, "epoch": 1680} {"train_loss": -38.97294235229492, "global_step": 203355, "epoch": 1680} {"train_loss": -37.39200210571289, "global_step": 203356, "epoch": 1680} {"train_loss": -38.550601959228516, "global_step": 203357, "epoch": 1680} {"train_loss": -37.95436477661133, "global_step": 203358, "epoch": 1680} {"train_loss": -38.29148483276367, "global_step": 203359, "epoch": 1680} {"train_loss": -38.68536376953125, "global_step": 203360, "epoch": 1680} {"train_loss": -38.8196907043457, "global_step": 203361, "epoch": 1680} {"train_loss": -38.111454010009766, "global_step": 203362, "epoch": 1680} {"train_loss": -38.032344818115234, "global_step": 203363, "epoch": 1680} {"train_loss": -38.74452590942383, "global_step": 203364, "epoch": 1680} {"train_loss": -38.17603302001953, "global_step": 203365, "epoch": 1680} {"train_loss": -38.66793441772461, "global_step": 203366, "epoch": 1680} {"train_loss": -39.15861129760742, "global_step": 203367, "epoch": 1680} {"train_loss": -38.40501022338867, "global_step": 203368, "epoch": 1680} {"train_loss": -38.32371139526367, "global_step": 203369, "epoch": 1680} {"train_loss": -39.42715835571289, "global_step": 203370, "epoch": 1680} {"train_loss": -38.69326400756836, "global_step": 203371, "epoch": 1680} {"train_loss": -39.32245635986328, "global_step": 203372, "epoch": 1680} {"train_loss": -38.25418472290039, "global_step": 203373, "epoch": 1680} {"train_loss": -39.197322845458984, "global_step": 203374, "epoch": 1680} {"train_loss": -39.93301773071289, "global_step": 203375, "epoch": 1680} {"train_loss": -39.58952713012695, "global_step": 203376, "epoch": 1680} {"train_loss": -40.117916107177734, "global_step": 203377, "epoch": 1680} {"train_loss": -39.00846481323242, "global_step": 203378, "epoch": 1680} {"train_loss": -39.201202392578125, "global_step": 203379, "epoch": 1680} {"train_loss": -38.98594284057617, "global_step": 203380, "epoch": 1680} {"train_loss": -39.724693298339844, "global_step": 203381, "epoch": 1680} {"train_loss": -38.82926559448242, "global_step": 203382, "epoch": 1680} {"train_loss": -40.04220962524414, "global_step": 203383, "epoch": 1680} {"train_loss": -39.770179748535156, "global_step": 203384, "epoch": 1680} {"train_loss": -40.130916595458984, "global_step": 203385, "epoch": 1680} {"train_loss": -39.83146286010742, "global_step": 203386, "epoch": 1680} {"train_loss": -39.997982025146484, "global_step": 203387, "epoch": 1680} {"train_loss": -40.02761459350586, "global_step": 203388, "epoch": 1680} {"train_loss": -39.31336975097656, "global_step": 203389, "epoch": 1680} {"train_loss": -38.792781829833984, "global_step": 203390, "epoch": 1680} {"train_loss": -40.48744583129883, "global_step": 203391, "epoch": 1680} {"train_loss": -39.985252380371094, "global_step": 203392, "epoch": 1680} {"train_loss": -40.5552864074707, "global_step": 203393, "epoch": 1680} {"train_loss": -39.31011962890625, "global_step": 203394, "epoch": 1680} {"train_loss": -39.78988265991211, "global_step": 203395, "epoch": 1680} {"train_loss": -39.742496490478516, "global_step": 203396, "epoch": 1680} {"train_loss": -38.81939697265625, "global_step": 203397, "epoch": 1680} {"train_loss": -39.06170654296875, "global_step": 203398, "epoch": 1680} {"train_loss": -40.566070556640625, "global_step": 203399, "epoch": 1680} {"train_loss": -37.22900800468508, "global_step": 203400, "epoch": 1680, "val_loss": 2630955.75} {"train_loss": -40.1544189453125, "global_step": 203401, "epoch": 1681} {"train_loss": -40.30732345581055, "global_step": 203402, "epoch": 1681} {"train_loss": -40.31797409057617, "global_step": 203403, "epoch": 1681} {"train_loss": -40.62749099731445, "global_step": 203404, "epoch": 1681} {"train_loss": -39.987342834472656, "global_step": 203405, "epoch": 1681} {"train_loss": -40.456417083740234, "global_step": 203406, "epoch": 1681} {"train_loss": -40.453529357910156, "global_step": 203407, "epoch": 1681} {"train_loss": -40.83917999267578, "global_step": 203408, "epoch": 1681} {"train_loss": -40.61528396606445, "global_step": 203409, "epoch": 1681} {"train_loss": -40.25520324707031, "global_step": 203410, "epoch": 1681} {"train_loss": -39.49715805053711, "global_step": 203411, "epoch": 1681} {"train_loss": -40.7458610534668, "global_step": 203412, "epoch": 1681} {"train_loss": -40.412906646728516, "global_step": 203413, "epoch": 1681} {"train_loss": -40.34426498413086, "global_step": 203414, "epoch": 1681} {"train_loss": -40.95565414428711, "global_step": 203415, "epoch": 1681} {"train_loss": -40.830013275146484, "global_step": 203416, "epoch": 1681} {"train_loss": -40.42715072631836, "global_step": 203417, "epoch": 1681} {"train_loss": -39.86307144165039, "global_step": 203418, "epoch": 1681} {"train_loss": -40.63935852050781, "global_step": 203419, "epoch": 1681} {"train_loss": -41.04701614379883, "global_step": 203420, "epoch": 1681} {"train_loss": -40.74371337890625, "global_step": 203421, "epoch": 1681} {"train_loss": -41.022804260253906, "global_step": 203422, "epoch": 1681} {"train_loss": -40.89826583862305, "global_step": 203423, "epoch": 1681} {"train_loss": -39.99797439575195, "global_step": 203424, "epoch": 1681} {"train_loss": -41.36538314819336, "global_step": 203425, "epoch": 1681} {"train_loss": -40.59920883178711, "global_step": 203426, "epoch": 1681} {"train_loss": -41.10490036010742, "global_step": 203427, "epoch": 1681} {"train_loss": -40.89921188354492, "global_step": 203428, "epoch": 1681} {"train_loss": -40.669254302978516, "global_step": 203429, "epoch": 1681} {"train_loss": -41.092403411865234, "global_step": 203430, "epoch": 1681} {"train_loss": -40.84952926635742, "global_step": 203431, "epoch": 1681} {"train_loss": -41.87514114379883, "global_step": 203432, "epoch": 1681} {"train_loss": -40.7823371887207, "global_step": 203433, "epoch": 1681} {"train_loss": -40.48305892944336, "global_step": 203434, "epoch": 1681} {"train_loss": -41.82854080200195, "global_step": 203435, "epoch": 1681} {"train_loss": -40.95331954956055, "global_step": 203436, "epoch": 1681} {"train_loss": -40.93021774291992, "global_step": 203437, "epoch": 1681} {"train_loss": -40.924171447753906, "global_step": 203438, "epoch": 1681} {"train_loss": -40.725379943847656, "global_step": 203439, "epoch": 1681} {"train_loss": -41.316219329833984, "global_step": 203440, "epoch": 1681} {"train_loss": -41.004390716552734, "global_step": 203441, "epoch": 1681} {"train_loss": -41.49557876586914, "global_step": 203442, "epoch": 1681} {"train_loss": -41.43555450439453, "global_step": 203443, "epoch": 1681} {"train_loss": -40.201881408691406, "global_step": 203444, "epoch": 1681} {"train_loss": -40.162261962890625, "global_step": 203445, "epoch": 1681} {"train_loss": -40.75706100463867, "global_step": 203446, "epoch": 1681} {"train_loss": -41.63059616088867, "global_step": 203447, "epoch": 1681} {"train_loss": -40.67543411254883, "global_step": 203448, "epoch": 1681} {"train_loss": -41.33654022216797, "global_step": 203449, "epoch": 1681} {"train_loss": -42.030067443847656, "global_step": 203450, "epoch": 1681} {"train_loss": -41.95955276489258, "global_step": 203451, "epoch": 1681} {"train_loss": -41.52571105957031, "global_step": 203452, "epoch": 1681} {"train_loss": -41.482032775878906, "global_step": 203453, "epoch": 1681} {"train_loss": -41.19794464111328, "global_step": 203454, "epoch": 1681} {"train_loss": -41.30826950073242, "global_step": 203455, "epoch": 1681} {"train_loss": -41.762454986572266, "global_step": 203456, "epoch": 1681} {"train_loss": -41.748504638671875, "global_step": 203457, "epoch": 1681} {"train_loss": -41.249629974365234, "global_step": 203458, "epoch": 1681} {"train_loss": -41.129676818847656, "global_step": 203459, "epoch": 1681} {"train_loss": -41.50373458862305, "global_step": 203460, "epoch": 1681} {"train_loss": -41.55907440185547, "global_step": 203461, "epoch": 1681} {"train_loss": -40.8604736328125, "global_step": 203462, "epoch": 1681} {"train_loss": -40.60677719116211, "global_step": 203463, "epoch": 1681} {"train_loss": -41.36396408081055, "global_step": 203464, "epoch": 1681} {"train_loss": -42.51704788208008, "global_step": 203465, "epoch": 1681} {"train_loss": -40.5675163269043, "global_step": 203466, "epoch": 1681} {"train_loss": -41.708492279052734, "global_step": 203467, "epoch": 1681} {"train_loss": -40.37334060668945, "global_step": 203468, "epoch": 1681} {"train_loss": -41.04818344116211, "global_step": 203469, "epoch": 1681} {"train_loss": -40.52182388305664, "global_step": 203470, "epoch": 1681} {"train_loss": -41.47151565551758, "global_step": 203471, "epoch": 1681} {"train_loss": -42.11466598510742, "global_step": 203472, "epoch": 1681} {"train_loss": -40.89548873901367, "global_step": 203473, "epoch": 1681} {"train_loss": -41.0860481262207, "global_step": 203474, "epoch": 1681} {"train_loss": -41.14628219604492, "global_step": 203475, "epoch": 1681} {"train_loss": -41.44330596923828, "global_step": 203476, "epoch": 1681} {"train_loss": -41.62299346923828, "global_step": 203477, "epoch": 1681} {"train_loss": -41.52450180053711, "global_step": 203478, "epoch": 1681} {"train_loss": -41.698646545410156, "global_step": 203479, "epoch": 1681} {"train_loss": -41.2226676940918, "global_step": 203480, "epoch": 1681} {"train_loss": -41.56159591674805, "global_step": 203481, "epoch": 1681} {"train_loss": -42.001495361328125, "global_step": 203482, "epoch": 1681} {"train_loss": -41.11671447753906, "global_step": 203483, "epoch": 1681} {"train_loss": -41.4543571472168, "global_step": 203484, "epoch": 1681} {"train_loss": -40.8504638671875, "global_step": 203485, "epoch": 1681} {"train_loss": -41.4487190246582, "global_step": 203486, "epoch": 1681} {"train_loss": -41.67224884033203, "global_step": 203487, "epoch": 1681} {"train_loss": -41.27924728393555, "global_step": 203488, "epoch": 1681} {"train_loss": -39.58126449584961, "global_step": 203489, "epoch": 1681} {"train_loss": -38.68603515625, "global_step": 203490, "epoch": 1681} {"train_loss": -35.54084396362305, "global_step": 203491, "epoch": 1681} {"train_loss": -30.453418731689453, "global_step": 203492, "epoch": 1681} {"train_loss": -24.62617301940918, "global_step": 203493, "epoch": 1681} {"train_loss": -25.137920379638672, "global_step": 203494, "epoch": 1681} {"train_loss": -39.15941619873047, "global_step": 203495, "epoch": 1681} {"train_loss": -34.49258041381836, "global_step": 203496, "epoch": 1681} {"train_loss": -35.32393264770508, "global_step": 203497, "epoch": 1681} {"train_loss": -39.39133071899414, "global_step": 203498, "epoch": 1681} {"train_loss": -36.2306022644043, "global_step": 203499, "epoch": 1681} {"train_loss": -36.83111572265625, "global_step": 203500, "epoch": 1681} {"train_loss": -34.27256393432617, "global_step": 203501, "epoch": 1681} {"train_loss": -37.526397705078125, "global_step": 203502, "epoch": 1681} {"train_loss": -35.122127532958984, "global_step": 203503, "epoch": 1681} {"train_loss": -34.74845504760742, "global_step": 203504, "epoch": 1681} {"train_loss": -35.810882568359375, "global_step": 203505, "epoch": 1681} {"train_loss": -35.23493576049805, "global_step": 203506, "epoch": 1681} {"train_loss": -33.275787353515625, "global_step": 203507, "epoch": 1681} {"train_loss": -36.53293991088867, "global_step": 203508, "epoch": 1681} {"train_loss": -32.07838439941406, "global_step": 203509, "epoch": 1681} {"train_loss": -31.50101089477539, "global_step": 203510, "epoch": 1681} {"train_loss": -25.9730167388916, "global_step": 203511, "epoch": 1681} {"train_loss": -35.04887771606445, "global_step": 203512, "epoch": 1681} {"train_loss": -38.59563064575195, "global_step": 203513, "epoch": 1681} {"train_loss": -21.40339469909668, "global_step": 203514, "epoch": 1681} {"train_loss": -7.4919753074646, "global_step": 203515, "epoch": 1681} {"train_loss": -24.4710693359375, "global_step": 203516, "epoch": 1681} {"train_loss": -32.35311508178711, "global_step": 203517, "epoch": 1681} {"train_loss": -32.08124542236328, "global_step": 203518, "epoch": 1681} {"train_loss": -25.83087158203125, "global_step": 203519, "epoch": 1681} {"train_loss": -32.24402618408203, "global_step": 203520, "epoch": 1681} {"train_loss": -38.69113833451074, "global_step": 203521, "epoch": 1681, "val_loss": 2702978.25} {"train_loss": -33.72300720214844, "global_step": 203522, "epoch": 1682} {"train_loss": -30.709516525268555, "global_step": 203523, "epoch": 1682} {"train_loss": -27.747812271118164, "global_step": 203524, "epoch": 1682} {"train_loss": -32.16340255737305, "global_step": 203525, "epoch": 1682} {"train_loss": -32.086891174316406, "global_step": 203526, "epoch": 1682} {"train_loss": -36.39581298828125, "global_step": 203527, "epoch": 1682} {"train_loss": -34.05674743652344, "global_step": 203528, "epoch": 1682} {"train_loss": -34.95180892944336, "global_step": 203529, "epoch": 1682} {"train_loss": -37.5207405090332, "global_step": 203530, "epoch": 1682} {"train_loss": -34.595821380615234, "global_step": 203531, "epoch": 1682} {"train_loss": -35.57875442504883, "global_step": 203532, "epoch": 1682} {"train_loss": -36.8823127746582, "global_step": 203533, "epoch": 1682} {"train_loss": -35.53261184692383, "global_step": 203534, "epoch": 1682} {"train_loss": -36.930572509765625, "global_step": 203535, "epoch": 1682} {"train_loss": -36.08998489379883, "global_step": 203536, "epoch": 1682} {"train_loss": -36.73673629760742, "global_step": 203537, "epoch": 1682} {"train_loss": -35.528926849365234, "global_step": 203538, "epoch": 1682} {"train_loss": -37.97361373901367, "global_step": 203539, "epoch": 1682} {"train_loss": -37.615333557128906, "global_step": 203540, "epoch": 1682} {"train_loss": -36.04142761230469, "global_step": 203541, "epoch": 1682} {"train_loss": -37.09414291381836, "global_step": 203542, "epoch": 1682} {"train_loss": -37.59598922729492, "global_step": 203543, "epoch": 1682} {"train_loss": -37.364051818847656, "global_step": 203544, "epoch": 1682} {"train_loss": -37.351715087890625, "global_step": 203545, "epoch": 1682} {"train_loss": -37.027381896972656, "global_step": 203546, "epoch": 1682} {"train_loss": -37.6104736328125, "global_step": 203547, "epoch": 1682} {"train_loss": -37.587860107421875, "global_step": 203548, "epoch": 1682} {"train_loss": -36.027801513671875, "global_step": 203549, "epoch": 1682} {"train_loss": -38.33632278442383, "global_step": 203550, "epoch": 1682} {"train_loss": -37.755287170410156, "global_step": 203551, "epoch": 1682} {"train_loss": -38.20333480834961, "global_step": 203552, "epoch": 1682} {"train_loss": -37.839088439941406, "global_step": 203553, "epoch": 1682} {"train_loss": -37.93349075317383, "global_step": 203554, "epoch": 1682} {"train_loss": -38.357704162597656, "global_step": 203555, "epoch": 1682} {"train_loss": -38.8083610534668, "global_step": 203556, "epoch": 1682} {"train_loss": -37.9473991394043, "global_step": 203557, "epoch": 1682} {"train_loss": -37.87238311767578, "global_step": 203558, "epoch": 1682} {"train_loss": -38.79610824584961, "global_step": 203559, "epoch": 1682} {"train_loss": -38.0462760925293, "global_step": 203560, "epoch": 1682} {"train_loss": -38.18021774291992, "global_step": 203561, "epoch": 1682} {"train_loss": -37.76567840576172, "global_step": 203562, "epoch": 1682} {"train_loss": -38.74738311767578, "global_step": 203563, "epoch": 1682} {"train_loss": -39.437252044677734, "global_step": 203564, "epoch": 1682} {"train_loss": -38.942626953125, "global_step": 203565, "epoch": 1682} {"train_loss": -39.106300354003906, "global_step": 203566, "epoch": 1682} {"train_loss": -38.8228874206543, "global_step": 203567, "epoch": 1682} {"train_loss": -38.61092758178711, "global_step": 203568, "epoch": 1682} {"train_loss": -38.739784240722656, "global_step": 203569, "epoch": 1682} {"train_loss": -38.391414642333984, "global_step": 203570, "epoch": 1682} {"train_loss": -39.48613357543945, "global_step": 203571, "epoch": 1682} {"train_loss": -38.677120208740234, "global_step": 203572, "epoch": 1682} {"train_loss": -38.731075286865234, "global_step": 203573, "epoch": 1682} {"train_loss": -38.70439529418945, "global_step": 203574, "epoch": 1682} {"train_loss": -38.44047164916992, "global_step": 203575, "epoch": 1682} {"train_loss": -38.6053466796875, "global_step": 203576, "epoch": 1682} {"train_loss": -38.352149963378906, "global_step": 203577, "epoch": 1682} {"train_loss": -37.90437316894531, "global_step": 203578, "epoch": 1682} {"train_loss": -39.230064392089844, "global_step": 203579, "epoch": 1682} {"train_loss": -38.625, "global_step": 203580, "epoch": 1682} {"train_loss": -39.18376541137695, "global_step": 203581, "epoch": 1682} {"train_loss": -39.31950378417969, "global_step": 203582, "epoch": 1682} {"train_loss": -39.60100555419922, "global_step": 203583, "epoch": 1682} {"train_loss": -39.241981506347656, "global_step": 203584, "epoch": 1682} {"train_loss": -39.336647033691406, "global_step": 203585, "epoch": 1682} {"train_loss": -39.956398010253906, "global_step": 203586, "epoch": 1682} {"train_loss": -39.753021240234375, "global_step": 203587, "epoch": 1682} {"train_loss": -39.35284423828125, "global_step": 203588, "epoch": 1682} {"train_loss": -39.94137954711914, "global_step": 203589, "epoch": 1682} {"train_loss": -39.4499397277832, "global_step": 203590, "epoch": 1682} {"train_loss": -39.86434555053711, "global_step": 203591, "epoch": 1682} {"train_loss": -39.547115325927734, "global_step": 203592, "epoch": 1682} {"train_loss": -39.67829513549805, "global_step": 203593, "epoch": 1682} {"train_loss": -39.90346145629883, "global_step": 203594, "epoch": 1682} {"train_loss": -39.5330696105957, "global_step": 203595, "epoch": 1682} {"train_loss": -39.72652816772461, "global_step": 203596, "epoch": 1682} {"train_loss": -40.14195251464844, "global_step": 203597, "epoch": 1682} {"train_loss": -40.00959396362305, "global_step": 203598, "epoch": 1682} {"train_loss": -39.878623962402344, "global_step": 203599, "epoch": 1682} {"train_loss": -39.823612213134766, "global_step": 203600, "epoch": 1682} {"train_loss": -39.862056732177734, "global_step": 203601, "epoch": 1682} {"train_loss": -40.20127487182617, "global_step": 203602, "epoch": 1682} {"train_loss": -39.57337188720703, "global_step": 203603, "epoch": 1682} {"train_loss": -40.12379837036133, "global_step": 203604, "epoch": 1682} {"train_loss": -40.389034271240234, "global_step": 203605, "epoch": 1682} {"train_loss": -40.18416213989258, "global_step": 203606, "epoch": 1682} {"train_loss": -40.2401237487793, "global_step": 203607, "epoch": 1682} {"train_loss": -39.77749252319336, "global_step": 203608, "epoch": 1682} {"train_loss": -38.96257781982422, "global_step": 203609, "epoch": 1682} {"train_loss": -40.52863311767578, "global_step": 203610, "epoch": 1682} {"train_loss": -39.43408966064453, "global_step": 203611, "epoch": 1682} {"train_loss": -40.4704704284668, "global_step": 203612, "epoch": 1682} {"train_loss": -40.78463363647461, "global_step": 203613, "epoch": 1682} {"train_loss": -39.680908203125, "global_step": 203614, "epoch": 1682} {"train_loss": -40.868587493896484, "global_step": 203615, "epoch": 1682} {"train_loss": -40.47923278808594, "global_step": 203616, "epoch": 1682} {"train_loss": -40.53963088989258, "global_step": 203617, "epoch": 1682} {"train_loss": -40.59904098510742, "global_step": 203618, "epoch": 1682} {"train_loss": -40.786643981933594, "global_step": 203619, "epoch": 1682} {"train_loss": -39.22347640991211, "global_step": 203620, "epoch": 1682} {"train_loss": -40.98453903198242, "global_step": 203621, "epoch": 1682} {"train_loss": -40.74309158325195, "global_step": 203622, "epoch": 1682} {"train_loss": -41.09420394897461, "global_step": 203623, "epoch": 1682} {"train_loss": -39.784942626953125, "global_step": 203624, "epoch": 1682} {"train_loss": -40.87954330444336, "global_step": 203625, "epoch": 1682} {"train_loss": -40.06135559082031, "global_step": 203626, "epoch": 1682} {"train_loss": -39.42930221557617, "global_step": 203627, "epoch": 1682} {"train_loss": -41.39070510864258, "global_step": 203628, "epoch": 1682} {"train_loss": -40.573856353759766, "global_step": 203629, "epoch": 1682} {"train_loss": -41.14750289916992, "global_step": 203630, "epoch": 1682} {"train_loss": -40.72249221801758, "global_step": 203631, "epoch": 1682} {"train_loss": -40.24518585205078, "global_step": 203632, "epoch": 1682} {"train_loss": -40.92365264892578, "global_step": 203633, "epoch": 1682} {"train_loss": -40.78713607788086, "global_step": 203634, "epoch": 1682} {"train_loss": -41.391456604003906, "global_step": 203635, "epoch": 1682} {"train_loss": -40.9202880859375, "global_step": 203636, "epoch": 1682} {"train_loss": -41.419334411621094, "global_step": 203637, "epoch": 1682} {"train_loss": -41.380348205566406, "global_step": 203638, "epoch": 1682} {"train_loss": -40.2666015625, "global_step": 203639, "epoch": 1682} {"train_loss": -40.76430892944336, "global_step": 203640, "epoch": 1682} {"train_loss": -41.074066162109375, "global_step": 203641, "epoch": 1682} {"train_loss": -38.70945099759693, "global_step": 203642, "epoch": 1682, "val_loss": 2702013.75} {"train_loss": -41.26839065551758, "global_step": 203643, "epoch": 1683} {"train_loss": -40.8984489440918, "global_step": 203644, "epoch": 1683} {"train_loss": -40.625587463378906, "global_step": 203645, "epoch": 1683} {"train_loss": -41.433448791503906, "global_step": 203646, "epoch": 1683} {"train_loss": -41.68661117553711, "global_step": 203647, "epoch": 1683} {"train_loss": -40.979427337646484, "global_step": 203648, "epoch": 1683} {"train_loss": -41.35453414916992, "global_step": 203649, "epoch": 1683} {"train_loss": -41.21110153198242, "global_step": 203650, "epoch": 1683} {"train_loss": -41.54713821411133, "global_step": 203651, "epoch": 1683} {"train_loss": -41.523128509521484, "global_step": 203652, "epoch": 1683} {"train_loss": -40.08010482788086, "global_step": 203653, "epoch": 1683} {"train_loss": -39.7713737487793, "global_step": 203654, "epoch": 1683} {"train_loss": -36.8948860168457, "global_step": 203655, "epoch": 1683} {"train_loss": -39.14594650268555, "global_step": 203656, "epoch": 1683} {"train_loss": -41.200679779052734, "global_step": 203657, "epoch": 1683} {"train_loss": -39.07956314086914, "global_step": 203658, "epoch": 1683} {"train_loss": -35.07463455200195, "global_step": 203659, "epoch": 1683} {"train_loss": -40.51708984375, "global_step": 203660, "epoch": 1683} {"train_loss": -40.7583122253418, "global_step": 203661, "epoch": 1683} {"train_loss": -37.59798049926758, "global_step": 203662, "epoch": 1683} {"train_loss": -36.624000549316406, "global_step": 203663, "epoch": 1683} {"train_loss": -38.39467239379883, "global_step": 203664, "epoch": 1683} {"train_loss": -41.4116325378418, "global_step": 203665, "epoch": 1683} {"train_loss": -37.09548568725586, "global_step": 203666, "epoch": 1683} {"train_loss": -38.01304626464844, "global_step": 203667, "epoch": 1683} {"train_loss": -39.56472396850586, "global_step": 203668, "epoch": 1683} {"train_loss": -40.392208099365234, "global_step": 203669, "epoch": 1683} {"train_loss": -37.83430480957031, "global_step": 203670, "epoch": 1683} {"train_loss": -38.78475570678711, "global_step": 203671, "epoch": 1683} {"train_loss": -40.3601188659668, "global_step": 203672, "epoch": 1683} {"train_loss": -39.33928680419922, "global_step": 203673, "epoch": 1683} {"train_loss": -38.69161605834961, "global_step": 203674, "epoch": 1683} {"train_loss": -40.48383331298828, "global_step": 203675, "epoch": 1683} {"train_loss": -40.68146514892578, "global_step": 203676, "epoch": 1683} {"train_loss": -37.90816116333008, "global_step": 203677, "epoch": 1683} {"train_loss": -40.35702133178711, "global_step": 203678, "epoch": 1683} {"train_loss": -40.58414077758789, "global_step": 203679, "epoch": 1683} {"train_loss": -40.16032791137695, "global_step": 203680, "epoch": 1683} {"train_loss": -41.11953353881836, "global_step": 203681, "epoch": 1683} {"train_loss": -41.150875091552734, "global_step": 203682, "epoch": 1683} {"train_loss": -40.456787109375, "global_step": 203683, "epoch": 1683} {"train_loss": -40.946346282958984, "global_step": 203684, "epoch": 1683} {"train_loss": -41.26123046875, "global_step": 203685, "epoch": 1683} {"train_loss": -40.61335372924805, "global_step": 203686, "epoch": 1683} {"train_loss": -40.713897705078125, "global_step": 203687, "epoch": 1683} {"train_loss": -41.707637786865234, "global_step": 203688, "epoch": 1683} {"train_loss": -40.77617263793945, "global_step": 203689, "epoch": 1683} {"train_loss": -41.141387939453125, "global_step": 203690, "epoch": 1683} {"train_loss": -40.712425231933594, "global_step": 203691, "epoch": 1683} {"train_loss": -40.79360580444336, "global_step": 203692, "epoch": 1683} {"train_loss": -40.33980941772461, "global_step": 203693, "epoch": 1683} {"train_loss": -40.79829025268555, "global_step": 203694, "epoch": 1683} {"train_loss": -40.43754196166992, "global_step": 203695, "epoch": 1683} {"train_loss": -40.83320999145508, "global_step": 203696, "epoch": 1683} {"train_loss": -40.866153717041016, "global_step": 203697, "epoch": 1683} {"train_loss": -41.437843322753906, "global_step": 203698, "epoch": 1683} {"train_loss": -41.56211471557617, "global_step": 203699, "epoch": 1683} {"train_loss": -40.59060287475586, "global_step": 203700, "epoch": 1683} {"train_loss": -40.93935775756836, "global_step": 203701, "epoch": 1683} {"train_loss": -41.68616485595703, "global_step": 203702, "epoch": 1683} {"train_loss": -40.70066833496094, "global_step": 203703, "epoch": 1683} {"train_loss": -39.58089065551758, "global_step": 203704, "epoch": 1683} {"train_loss": -40.575294494628906, "global_step": 203705, "epoch": 1683} {"train_loss": -41.258548736572266, "global_step": 203706, "epoch": 1683} {"train_loss": -41.21084213256836, "global_step": 203707, "epoch": 1683} {"train_loss": -40.18147659301758, "global_step": 203708, "epoch": 1683} {"train_loss": -39.43949508666992, "global_step": 203709, "epoch": 1683} {"train_loss": -39.64640426635742, "global_step": 203710, "epoch": 1683} {"train_loss": -41.179195404052734, "global_step": 203711, "epoch": 1683} {"train_loss": -40.9841423034668, "global_step": 203712, "epoch": 1683} {"train_loss": -37.54874038696289, "global_step": 203713, "epoch": 1683} {"train_loss": -38.9051399230957, "global_step": 203714, "epoch": 1683} {"train_loss": -41.371063232421875, "global_step": 203715, "epoch": 1683} {"train_loss": -37.5904541015625, "global_step": 203716, "epoch": 1683} {"train_loss": -39.08079147338867, "global_step": 203717, "epoch": 1683} {"train_loss": -40.55485916137695, "global_step": 203718, "epoch": 1683} {"train_loss": -39.4288330078125, "global_step": 203719, "epoch": 1683} {"train_loss": -39.29624557495117, "global_step": 203720, "epoch": 1683} {"train_loss": -41.1642951965332, "global_step": 203721, "epoch": 1683} {"train_loss": -40.405094146728516, "global_step": 203722, "epoch": 1683} {"train_loss": -39.41818618774414, "global_step": 203723, "epoch": 1683} {"train_loss": -41.0725212097168, "global_step": 203724, "epoch": 1683} {"train_loss": -37.952308654785156, "global_step": 203725, "epoch": 1683} {"train_loss": -38.79494857788086, "global_step": 203726, "epoch": 1683} {"train_loss": -40.9711799621582, "global_step": 203727, "epoch": 1683} {"train_loss": -38.5417594909668, "global_step": 203728, "epoch": 1683} {"train_loss": -41.11891555786133, "global_step": 203729, "epoch": 1683} {"train_loss": -40.61808395385742, "global_step": 203730, "epoch": 1683} {"train_loss": -38.530025482177734, "global_step": 203731, "epoch": 1683} {"train_loss": -40.55739212036133, "global_step": 203732, "epoch": 1683} {"train_loss": -39.823604583740234, "global_step": 203733, "epoch": 1683} {"train_loss": -41.3943977355957, "global_step": 203734, "epoch": 1683} {"train_loss": -40.943782806396484, "global_step": 203735, "epoch": 1683} {"train_loss": -39.802730560302734, "global_step": 203736, "epoch": 1683} {"train_loss": -41.893856048583984, "global_step": 203737, "epoch": 1683} {"train_loss": -39.317012786865234, "global_step": 203738, "epoch": 1683} {"train_loss": -38.35675048828125, "global_step": 203739, "epoch": 1683} {"train_loss": -41.010982513427734, "global_step": 203740, "epoch": 1683} {"train_loss": -39.56280517578125, "global_step": 203741, "epoch": 1683} {"train_loss": -38.32807540893555, "global_step": 203742, "epoch": 1683} {"train_loss": -41.1328010559082, "global_step": 203743, "epoch": 1683} {"train_loss": -38.0515251159668, "global_step": 203744, "epoch": 1683} {"train_loss": -40.134002685546875, "global_step": 203745, "epoch": 1683} {"train_loss": -39.81550216674805, "global_step": 203746, "epoch": 1683} {"train_loss": -39.92290115356445, "global_step": 203747, "epoch": 1683} {"train_loss": -40.46678924560547, "global_step": 203748, "epoch": 1683} {"train_loss": -39.44588851928711, "global_step": 203749, "epoch": 1683} {"train_loss": -39.466957092285156, "global_step": 203750, "epoch": 1683} {"train_loss": -40.172515869140625, "global_step": 203751, "epoch": 1683} {"train_loss": -40.24563217163086, "global_step": 203752, "epoch": 1683} {"train_loss": -39.58300018310547, "global_step": 203753, "epoch": 1683} {"train_loss": -40.34498977661133, "global_step": 203754, "epoch": 1683} {"train_loss": -40.28209686279297, "global_step": 203755, "epoch": 1683} {"train_loss": -39.83366394042969, "global_step": 203756, "epoch": 1683} {"train_loss": -40.497249603271484, "global_step": 203757, "epoch": 1683} {"train_loss": -39.56834030151367, "global_step": 203758, "epoch": 1683} {"train_loss": -40.51682662963867, "global_step": 203759, "epoch": 1683} {"train_loss": -40.87726974487305, "global_step": 203760, "epoch": 1683} {"train_loss": -40.65067672729492, "global_step": 203761, "epoch": 1683} {"train_loss": -40.82242965698242, "global_step": 203762, "epoch": 1683} {"train_loss": -40.09528678704884, "global_step": 203763, "epoch": 1683, "val_loss": 2625443.25} {"train_loss": -40.54313278198242, "global_step": 203764, "epoch": 1684} {"train_loss": -40.16396713256836, "global_step": 203765, "epoch": 1684} {"train_loss": -40.9803581237793, "global_step": 203766, "epoch": 1684} {"train_loss": -40.34970474243164, "global_step": 203767, "epoch": 1684} {"train_loss": -41.00075912475586, "global_step": 203768, "epoch": 1684} {"train_loss": -40.438514709472656, "global_step": 203769, "epoch": 1684} {"train_loss": -41.52065658569336, "global_step": 203770, "epoch": 1684} {"train_loss": -41.05632400512695, "global_step": 203771, "epoch": 1684} {"train_loss": -41.56559371948242, "global_step": 203772, "epoch": 1684} {"train_loss": -41.519779205322266, "global_step": 203773, "epoch": 1684} {"train_loss": -41.290775299072266, "global_step": 203774, "epoch": 1684} {"train_loss": -41.67487716674805, "global_step": 203775, "epoch": 1684} {"train_loss": -41.029884338378906, "global_step": 203776, "epoch": 1684} {"train_loss": -40.42556381225586, "global_step": 203777, "epoch": 1684} {"train_loss": -41.28779983520508, "global_step": 203778, "epoch": 1684} {"train_loss": -42.02875518798828, "global_step": 203779, "epoch": 1684} {"train_loss": -41.52219772338867, "global_step": 203780, "epoch": 1684} {"train_loss": -41.70769119262695, "global_step": 203781, "epoch": 1684} {"train_loss": -42.1162223815918, "global_step": 203782, "epoch": 1684} {"train_loss": -41.40787887573242, "global_step": 203783, "epoch": 1684} {"train_loss": -42.05136489868164, "global_step": 203784, "epoch": 1684} {"train_loss": -41.829524993896484, "global_step": 203785, "epoch": 1684} {"train_loss": -40.886566162109375, "global_step": 203786, "epoch": 1684} {"train_loss": -41.55398178100586, "global_step": 203787, "epoch": 1684} {"train_loss": -41.82815170288086, "global_step": 203788, "epoch": 1684} {"train_loss": -42.03005599975586, "global_step": 203789, "epoch": 1684} {"train_loss": -42.0631103515625, "global_step": 203790, "epoch": 1684} {"train_loss": -41.14588165283203, "global_step": 203791, "epoch": 1684} {"train_loss": -42.119140625, "global_step": 203792, "epoch": 1684} {"train_loss": -41.97459030151367, "global_step": 203793, "epoch": 1684} {"train_loss": -41.56640625, "global_step": 203794, "epoch": 1684} {"train_loss": -41.41962814331055, "global_step": 203795, "epoch": 1684} {"train_loss": -41.766845703125, "global_step": 203796, "epoch": 1684} {"train_loss": -41.614070892333984, "global_step": 203797, "epoch": 1684} {"train_loss": -41.45707321166992, "global_step": 203798, "epoch": 1684} {"train_loss": -41.81841278076172, "global_step": 203799, "epoch": 1684} {"train_loss": -41.28972244262695, "global_step": 203800, "epoch": 1684} {"train_loss": -41.41251754760742, "global_step": 203801, "epoch": 1684} {"train_loss": -41.74692916870117, "global_step": 203802, "epoch": 1684} {"train_loss": -41.560302734375, "global_step": 203803, "epoch": 1684} {"train_loss": -41.763885498046875, "global_step": 203804, "epoch": 1684} {"train_loss": -41.93490219116211, "global_step": 203805, "epoch": 1684} {"train_loss": -41.62886428833008, "global_step": 203806, "epoch": 1684} {"train_loss": -41.584224700927734, "global_step": 203807, "epoch": 1684} {"train_loss": -41.8910026550293, "global_step": 203808, "epoch": 1684} {"train_loss": -41.213191986083984, "global_step": 203809, "epoch": 1684} {"train_loss": -40.325531005859375, "global_step": 203810, "epoch": 1684} {"train_loss": -41.70863342285156, "global_step": 203811, "epoch": 1684} {"train_loss": -42.40556716918945, "global_step": 203812, "epoch": 1684} {"train_loss": -41.99353790283203, "global_step": 203813, "epoch": 1684} {"train_loss": -41.60779571533203, "global_step": 203814, "epoch": 1684} {"train_loss": -41.445823669433594, "global_step": 203815, "epoch": 1684} {"train_loss": -41.643741607666016, "global_step": 203816, "epoch": 1684} {"train_loss": -41.210426330566406, "global_step": 203817, "epoch": 1684} {"train_loss": -42.55585861206055, "global_step": 203818, "epoch": 1684} {"train_loss": -41.082855224609375, "global_step": 203819, "epoch": 1684} {"train_loss": -40.05781173706055, "global_step": 203820, "epoch": 1684} {"train_loss": -40.528541564941406, "global_step": 203821, "epoch": 1684} {"train_loss": -41.42719268798828, "global_step": 203822, "epoch": 1684} {"train_loss": -40.97841262817383, "global_step": 203823, "epoch": 1684} {"train_loss": -41.12791442871094, "global_step": 203824, "epoch": 1684} {"train_loss": -39.25181579589844, "global_step": 203825, "epoch": 1684} {"train_loss": -39.703590393066406, "global_step": 203826, "epoch": 1684} {"train_loss": -40.22144317626953, "global_step": 203827, "epoch": 1684} {"train_loss": -41.625, "global_step": 203828, "epoch": 1684} {"train_loss": -41.894927978515625, "global_step": 203829, "epoch": 1684} {"train_loss": -40.225685119628906, "global_step": 203830, "epoch": 1684} {"train_loss": -40.44132995605469, "global_step": 203831, "epoch": 1684} {"train_loss": -42.37311935424805, "global_step": 203832, "epoch": 1684} {"train_loss": -41.982975006103516, "global_step": 203833, "epoch": 1684} {"train_loss": -41.66140365600586, "global_step": 203834, "epoch": 1684} {"train_loss": -41.0450439453125, "global_step": 203835, "epoch": 1684} {"train_loss": -41.00297164916992, "global_step": 203836, "epoch": 1684} {"train_loss": -41.463409423828125, "global_step": 203837, "epoch": 1684} {"train_loss": -41.97613525390625, "global_step": 203838, "epoch": 1684} {"train_loss": -41.98942947387695, "global_step": 203839, "epoch": 1684} {"train_loss": -41.45951461791992, "global_step": 203840, "epoch": 1684} {"train_loss": -41.65578079223633, "global_step": 203841, "epoch": 1684} {"train_loss": -42.200538635253906, "global_step": 203842, "epoch": 1684} {"train_loss": -41.418495178222656, "global_step": 203843, "epoch": 1684} {"train_loss": -41.35049057006836, "global_step": 203844, "epoch": 1684} {"train_loss": -41.6256103515625, "global_step": 203845, "epoch": 1684} {"train_loss": -41.68646240234375, "global_step": 203846, "epoch": 1684} {"train_loss": -40.64247131347656, "global_step": 203847, "epoch": 1684} {"train_loss": -41.693580627441406, "global_step": 203848, "epoch": 1684} {"train_loss": -41.8211784362793, "global_step": 203849, "epoch": 1684} {"train_loss": -41.00371170043945, "global_step": 203850, "epoch": 1684} {"train_loss": -40.25673294067383, "global_step": 203851, "epoch": 1684} {"train_loss": -41.443565368652344, "global_step": 203852, "epoch": 1684} {"train_loss": -40.5423583984375, "global_step": 203853, "epoch": 1684} {"train_loss": -39.37437057495117, "global_step": 203854, "epoch": 1684} {"train_loss": -40.072120666503906, "global_step": 203855, "epoch": 1684} {"train_loss": -39.81365966796875, "global_step": 203856, "epoch": 1684} {"train_loss": -41.341590881347656, "global_step": 203857, "epoch": 1684} {"train_loss": -39.825504302978516, "global_step": 203858, "epoch": 1684} {"train_loss": -41.372596740722656, "global_step": 203859, "epoch": 1684} {"train_loss": -39.242584228515625, "global_step": 203860, "epoch": 1684} {"train_loss": -39.70351028442383, "global_step": 203861, "epoch": 1684} {"train_loss": -39.869075775146484, "global_step": 203862, "epoch": 1684} {"train_loss": -41.40076446533203, "global_step": 203863, "epoch": 1684} {"train_loss": -40.69671630859375, "global_step": 203864, "epoch": 1684} {"train_loss": -41.77320861816406, "global_step": 203865, "epoch": 1684} {"train_loss": -41.77248764038086, "global_step": 203866, "epoch": 1684} {"train_loss": -41.55534362792969, "global_step": 203867, "epoch": 1684} {"train_loss": -40.87405014038086, "global_step": 203868, "epoch": 1684} {"train_loss": -41.17839431762695, "global_step": 203869, "epoch": 1684} {"train_loss": -41.40426254272461, "global_step": 203870, "epoch": 1684} {"train_loss": -41.344783782958984, "global_step": 203871, "epoch": 1684} {"train_loss": -40.831024169921875, "global_step": 203872, "epoch": 1684} {"train_loss": -39.539764404296875, "global_step": 203873, "epoch": 1684} {"train_loss": -38.55485153198242, "global_step": 203874, "epoch": 1684} {"train_loss": -40.19519805908203, "global_step": 203875, "epoch": 1684} {"train_loss": -41.00714111328125, "global_step": 203876, "epoch": 1684} {"train_loss": -38.94683074951172, "global_step": 203877, "epoch": 1684} {"train_loss": -40.228759765625, "global_step": 203878, "epoch": 1684} {"train_loss": -40.8364372253418, "global_step": 203879, "epoch": 1684} {"train_loss": -36.92131042480469, "global_step": 203880, "epoch": 1684} {"train_loss": -40.7999382019043, "global_step": 203881, "epoch": 1684} {"train_loss": -36.07514953613281, "global_step": 203882, "epoch": 1684} {"train_loss": -40.082618713378906, "global_step": 203883, "epoch": 1684} {"train_loss": -41.00771394839957, "global_step": 203884, "epoch": 1684, "val_loss": 2663897.5} {"train_loss": -31.1344051361084, "global_step": 203885, "epoch": 1685} {"train_loss": -28.858301162719727, "global_step": 203886, "epoch": 1685} {"train_loss": -28.275959014892578, "global_step": 203887, "epoch": 1685} {"train_loss": -31.14723014831543, "global_step": 203888, "epoch": 1685} {"train_loss": -27.067249298095703, "global_step": 203889, "epoch": 1685} {"train_loss": -33.626277923583984, "global_step": 203890, "epoch": 1685} {"train_loss": -32.12008285522461, "global_step": 203891, "epoch": 1685} {"train_loss": -31.538101196289062, "global_step": 203892, "epoch": 1685} {"train_loss": -33.57551956176758, "global_step": 203893, "epoch": 1685} {"train_loss": -32.37247085571289, "global_step": 203894, "epoch": 1685} {"train_loss": -33.42995834350586, "global_step": 203895, "epoch": 1685} {"train_loss": -35.14619445800781, "global_step": 203896, "epoch": 1685} {"train_loss": -35.18222427368164, "global_step": 203897, "epoch": 1685} {"train_loss": -37.38151168823242, "global_step": 203898, "epoch": 1685} {"train_loss": -38.25107955932617, "global_step": 203899, "epoch": 1685} {"train_loss": -37.303382873535156, "global_step": 203900, "epoch": 1685} {"train_loss": -37.62326431274414, "global_step": 203901, "epoch": 1685} {"train_loss": -37.8951530456543, "global_step": 203902, "epoch": 1685} {"train_loss": -38.24468994140625, "global_step": 203903, "epoch": 1685} {"train_loss": -39.1893310546875, "global_step": 203904, "epoch": 1685} {"train_loss": -38.66225051879883, "global_step": 203905, "epoch": 1685} {"train_loss": -39.751251220703125, "global_step": 203906, "epoch": 1685} {"train_loss": -39.05389404296875, "global_step": 203907, "epoch": 1685} {"train_loss": -39.743988037109375, "global_step": 203908, "epoch": 1685} {"train_loss": -39.67224884033203, "global_step": 203909, "epoch": 1685} {"train_loss": -39.26951217651367, "global_step": 203910, "epoch": 1685} {"train_loss": -39.27763366699219, "global_step": 203911, "epoch": 1685} {"train_loss": -40.492984771728516, "global_step": 203912, "epoch": 1685} {"train_loss": -39.61286163330078, "global_step": 203913, "epoch": 1685} {"train_loss": -39.813880920410156, "global_step": 203914, "epoch": 1685} {"train_loss": -39.987220764160156, "global_step": 203915, "epoch": 1685} {"train_loss": -40.17684555053711, "global_step": 203916, "epoch": 1685} {"train_loss": -40.12250518798828, "global_step": 203917, "epoch": 1685} {"train_loss": -40.830265045166016, "global_step": 203918, "epoch": 1685} {"train_loss": -41.260467529296875, "global_step": 203919, "epoch": 1685} {"train_loss": -40.540164947509766, "global_step": 203920, "epoch": 1685} {"train_loss": -40.75849533081055, "global_step": 203921, "epoch": 1685} {"train_loss": -40.90858840942383, "global_step": 203922, "epoch": 1685} {"train_loss": -40.81730270385742, "global_step": 203923, "epoch": 1685} {"train_loss": -41.37498092651367, "global_step": 203924, "epoch": 1685} {"train_loss": -41.185821533203125, "global_step": 203925, "epoch": 1685} {"train_loss": -41.552608489990234, "global_step": 203926, "epoch": 1685} {"train_loss": -41.49745559692383, "global_step": 203927, "epoch": 1685} {"train_loss": -40.98596954345703, "global_step": 203928, "epoch": 1685} {"train_loss": -41.5601692199707, "global_step": 203929, "epoch": 1685} {"train_loss": -41.6275520324707, "global_step": 203930, "epoch": 1685} {"train_loss": -41.68317794799805, "global_step": 203931, "epoch": 1685} {"train_loss": -41.331947326660156, "global_step": 203932, "epoch": 1685} {"train_loss": -41.85207748413086, "global_step": 203933, "epoch": 1685} {"train_loss": -41.86439895629883, "global_step": 203934, "epoch": 1685} {"train_loss": -41.753334045410156, "global_step": 203935, "epoch": 1685} {"train_loss": -41.2735710144043, "global_step": 203936, "epoch": 1685} {"train_loss": -41.69440460205078, "global_step": 203937, "epoch": 1685} {"train_loss": -41.51384353637695, "global_step": 203938, "epoch": 1685} {"train_loss": -41.88082504272461, "global_step": 203939, "epoch": 1685} {"train_loss": -41.88196563720703, "global_step": 203940, "epoch": 1685} {"train_loss": -41.87166976928711, "global_step": 203941, "epoch": 1685} {"train_loss": -42.21250915527344, "global_step": 203942, "epoch": 1685} {"train_loss": -41.725799560546875, "global_step": 203943, "epoch": 1685} {"train_loss": -42.049476623535156, "global_step": 203944, "epoch": 1685} {"train_loss": -41.761817932128906, "global_step": 203945, "epoch": 1685} {"train_loss": -41.04022216796875, "global_step": 203946, "epoch": 1685} {"train_loss": -41.90804672241211, "global_step": 203947, "epoch": 1685} {"train_loss": -42.457271575927734, "global_step": 203948, "epoch": 1685} {"train_loss": -42.45209503173828, "global_step": 203949, "epoch": 1685} {"train_loss": -41.75160217285156, "global_step": 203950, "epoch": 1685} {"train_loss": -42.12578582763672, "global_step": 203951, "epoch": 1685} {"train_loss": -42.106719970703125, "global_step": 203952, "epoch": 1685} {"train_loss": -41.98629379272461, "global_step": 203953, "epoch": 1685} {"train_loss": -41.90057373046875, "global_step": 203954, "epoch": 1685} {"train_loss": -42.17607498168945, "global_step": 203955, "epoch": 1685} {"train_loss": -42.130435943603516, "global_step": 203956, "epoch": 1685} {"train_loss": -42.37453842163086, "global_step": 203957, "epoch": 1685} {"train_loss": -42.11932373046875, "global_step": 203958, "epoch": 1685} {"train_loss": -42.691322326660156, "global_step": 203959, "epoch": 1685} {"train_loss": -42.563838958740234, "global_step": 203960, "epoch": 1685} {"train_loss": -42.4517936706543, "global_step": 203961, "epoch": 1685} {"train_loss": -42.75724411010742, "global_step": 203962, "epoch": 1685} {"train_loss": -42.13432693481445, "global_step": 203963, "epoch": 1685} {"train_loss": -42.35698318481445, "global_step": 203964, "epoch": 1685} {"train_loss": -42.4282341003418, "global_step": 203965, "epoch": 1685} {"train_loss": -42.382747650146484, "global_step": 203966, "epoch": 1685} {"train_loss": -42.7724609375, "global_step": 203967, "epoch": 1685} {"train_loss": -42.32563018798828, "global_step": 203968, "epoch": 1685} {"train_loss": -42.843387603759766, "global_step": 203969, "epoch": 1685} {"train_loss": -42.429134368896484, "global_step": 203970, "epoch": 1685} {"train_loss": -41.93733215332031, "global_step": 203971, "epoch": 1685} {"train_loss": -42.52510070800781, "global_step": 203972, "epoch": 1685} {"train_loss": -42.47377014160156, "global_step": 203973, "epoch": 1685} {"train_loss": -41.6737174987793, "global_step": 203974, "epoch": 1685} {"train_loss": -42.7619514465332, "global_step": 203975, "epoch": 1685} {"train_loss": -41.90473556518555, "global_step": 203976, "epoch": 1685} {"train_loss": -42.738555908203125, "global_step": 203977, "epoch": 1685} {"train_loss": -42.129798889160156, "global_step": 203978, "epoch": 1685} {"train_loss": -42.07966995239258, "global_step": 203979, "epoch": 1685} {"train_loss": -39.790374755859375, "global_step": 203980, "epoch": 1685} {"train_loss": -34.11090087890625, "global_step": 203981, "epoch": 1685} {"train_loss": -41.47772216796875, "global_step": 203982, "epoch": 1685} {"train_loss": -41.6085319519043, "global_step": 203983, "epoch": 1685} {"train_loss": -35.40224838256836, "global_step": 203984, "epoch": 1685} {"train_loss": -35.41344451904297, "global_step": 203985, "epoch": 1685} {"train_loss": -39.338558197021484, "global_step": 203986, "epoch": 1685} {"train_loss": -34.75821304321289, "global_step": 203987, "epoch": 1685} {"train_loss": -34.31809997558594, "global_step": 203988, "epoch": 1685} {"train_loss": -36.71830368041992, "global_step": 203989, "epoch": 1685} {"train_loss": -36.40094757080078, "global_step": 203990, "epoch": 1685} {"train_loss": -35.968135833740234, "global_step": 203991, "epoch": 1685} {"train_loss": -37.07851791381836, "global_step": 203992, "epoch": 1685} {"train_loss": -37.155879974365234, "global_step": 203993, "epoch": 1685} {"train_loss": -38.49822998046875, "global_step": 203994, "epoch": 1685} {"train_loss": -39.822731018066406, "global_step": 203995, "epoch": 1685} {"train_loss": -36.988826751708984, "global_step": 203996, "epoch": 1685} {"train_loss": -39.48883056640625, "global_step": 203997, "epoch": 1685} {"train_loss": -36.80449676513672, "global_step": 203998, "epoch": 1685} {"train_loss": -39.11928939819336, "global_step": 203999, "epoch": 1685} {"train_loss": -37.111968994140625, "global_step": 204000, "epoch": 1685} {"train_loss": -37.97721481323242, "global_step": 204001, "epoch": 1685} {"train_loss": -36.92771530151367, "global_step": 204002, "epoch": 1685} {"train_loss": -37.753719329833984, "global_step": 204003, "epoch": 1685} {"train_loss": -38.12214279174805, "global_step": 204004, "epoch": 1685} {"train_loss": -39.418285921585465, "global_step": 204005, "epoch": 1685, "val_loss": 2606937.0} {"train_loss": -39.740318298339844, "global_step": 204006, "epoch": 1686} {"train_loss": -38.77521514892578, "global_step": 204007, "epoch": 1686} {"train_loss": -39.98440170288086, "global_step": 204008, "epoch": 1686} {"train_loss": -40.57593536376953, "global_step": 204009, "epoch": 1686} {"train_loss": -40.23755645751953, "global_step": 204010, "epoch": 1686} {"train_loss": -40.085506439208984, "global_step": 204011, "epoch": 1686} {"train_loss": -41.27233123779297, "global_step": 204012, "epoch": 1686} {"train_loss": -40.82352828979492, "global_step": 204013, "epoch": 1686} {"train_loss": -41.47860336303711, "global_step": 204014, "epoch": 1686} {"train_loss": -40.72810363769531, "global_step": 204015, "epoch": 1686} {"train_loss": -40.70937728881836, "global_step": 204016, "epoch": 1686} {"train_loss": -41.14759063720703, "global_step": 204017, "epoch": 1686} {"train_loss": -41.23890686035156, "global_step": 204018, "epoch": 1686} {"train_loss": -41.201351165771484, "global_step": 204019, "epoch": 1686} {"train_loss": -41.860347747802734, "global_step": 204020, "epoch": 1686} {"train_loss": -40.095664978027344, "global_step": 204021, "epoch": 1686} {"train_loss": -41.09869384765625, "global_step": 204022, "epoch": 1686} {"train_loss": -41.83195114135742, "global_step": 204023, "epoch": 1686} {"train_loss": -41.36410140991211, "global_step": 204024, "epoch": 1686} {"train_loss": -41.67348098754883, "global_step": 204025, "epoch": 1686} {"train_loss": -41.85711669921875, "global_step": 204026, "epoch": 1686} {"train_loss": -41.38572311401367, "global_step": 204027, "epoch": 1686} {"train_loss": -41.504066467285156, "global_step": 204028, "epoch": 1686} {"train_loss": -41.599998474121094, "global_step": 204029, "epoch": 1686} {"train_loss": -41.90206527709961, "global_step": 204030, "epoch": 1686} {"train_loss": -41.7477912902832, "global_step": 204031, "epoch": 1686} {"train_loss": -41.70597457885742, "global_step": 204032, "epoch": 1686} {"train_loss": -41.06161880493164, "global_step": 204033, "epoch": 1686} {"train_loss": -41.7227668762207, "global_step": 204034, "epoch": 1686} {"train_loss": -42.13859558105469, "global_step": 204035, "epoch": 1686} {"train_loss": -41.32021713256836, "global_step": 204036, "epoch": 1686} {"train_loss": -41.844417572021484, "global_step": 204037, "epoch": 1686} {"train_loss": -41.57118225097656, "global_step": 204038, "epoch": 1686} {"train_loss": -41.84220504760742, "global_step": 204039, "epoch": 1686} {"train_loss": -42.140655517578125, "global_step": 204040, "epoch": 1686} {"train_loss": -42.056678771972656, "global_step": 204041, "epoch": 1686} {"train_loss": -41.36368942260742, "global_step": 204042, "epoch": 1686} {"train_loss": -41.22279357910156, "global_step": 204043, "epoch": 1686} {"train_loss": -41.76544952392578, "global_step": 204044, "epoch": 1686} {"train_loss": -41.49546813964844, "global_step": 204045, "epoch": 1686} {"train_loss": -41.73872756958008, "global_step": 204046, "epoch": 1686} {"train_loss": -41.30810546875, "global_step": 204047, "epoch": 1686} {"train_loss": -42.249629974365234, "global_step": 204048, "epoch": 1686} {"train_loss": -41.73689651489258, "global_step": 204049, "epoch": 1686} {"train_loss": -41.900665283203125, "global_step": 204050, "epoch": 1686} {"train_loss": -41.59824752807617, "global_step": 204051, "epoch": 1686} {"train_loss": -41.02429962158203, "global_step": 204052, "epoch": 1686} {"train_loss": -42.20142364501953, "global_step": 204053, "epoch": 1686} {"train_loss": -41.75123596191406, "global_step": 204054, "epoch": 1686} {"train_loss": -40.27980041503906, "global_step": 204055, "epoch": 1686} {"train_loss": -39.97612380981445, "global_step": 204056, "epoch": 1686} {"train_loss": -40.96982955932617, "global_step": 204057, "epoch": 1686} {"train_loss": -40.514984130859375, "global_step": 204058, "epoch": 1686} {"train_loss": -42.50999069213867, "global_step": 204059, "epoch": 1686} {"train_loss": -41.7474250793457, "global_step": 204060, "epoch": 1686} {"train_loss": -41.00604248046875, "global_step": 204061, "epoch": 1686} {"train_loss": -39.98032760620117, "global_step": 204062, "epoch": 1686} {"train_loss": -40.793495178222656, "global_step": 204063, "epoch": 1686} {"train_loss": -39.619659423828125, "global_step": 204064, "epoch": 1686} {"train_loss": -40.85213851928711, "global_step": 204065, "epoch": 1686} {"train_loss": -41.156307220458984, "global_step": 204066, "epoch": 1686} {"train_loss": -41.50626754760742, "global_step": 204067, "epoch": 1686} {"train_loss": -40.6463737487793, "global_step": 204068, "epoch": 1686} {"train_loss": -41.0583381652832, "global_step": 204069, "epoch": 1686} {"train_loss": -41.326568603515625, "global_step": 204070, "epoch": 1686} {"train_loss": -40.97060775756836, "global_step": 204071, "epoch": 1686} {"train_loss": -39.55057907104492, "global_step": 204072, "epoch": 1686} {"train_loss": -38.946136474609375, "global_step": 204073, "epoch": 1686} {"train_loss": -41.13045883178711, "global_step": 204074, "epoch": 1686} {"train_loss": -41.57218551635742, "global_step": 204075, "epoch": 1686} {"train_loss": -39.472938537597656, "global_step": 204076, "epoch": 1686} {"train_loss": -40.49186706542969, "global_step": 204077, "epoch": 1686} {"train_loss": -41.72880172729492, "global_step": 204078, "epoch": 1686} {"train_loss": -42.25895309448242, "global_step": 204079, "epoch": 1686} {"train_loss": -41.04387283325195, "global_step": 204080, "epoch": 1686} {"train_loss": -41.490352630615234, "global_step": 204081, "epoch": 1686} {"train_loss": -42.17757797241211, "global_step": 204082, "epoch": 1686} {"train_loss": -42.18185043334961, "global_step": 204083, "epoch": 1686} {"train_loss": -41.1044807434082, "global_step": 204084, "epoch": 1686} {"train_loss": -41.94723892211914, "global_step": 204085, "epoch": 1686} {"train_loss": -41.3713493347168, "global_step": 204086, "epoch": 1686} {"train_loss": -41.0817756652832, "global_step": 204087, "epoch": 1686} {"train_loss": -41.84824752807617, "global_step": 204088, "epoch": 1686} {"train_loss": -41.927581787109375, "global_step": 204089, "epoch": 1686} {"train_loss": -40.8304557800293, "global_step": 204090, "epoch": 1686} {"train_loss": -41.619102478027344, "global_step": 204091, "epoch": 1686} {"train_loss": -41.65728759765625, "global_step": 204092, "epoch": 1686} {"train_loss": -41.92157745361328, "global_step": 204093, "epoch": 1686} {"train_loss": -41.876869201660156, "global_step": 204094, "epoch": 1686} {"train_loss": -42.13176345825195, "global_step": 204095, "epoch": 1686} {"train_loss": -42.48798751831055, "global_step": 204096, "epoch": 1686} {"train_loss": -42.19183349609375, "global_step": 204097, "epoch": 1686} {"train_loss": -41.95402908325195, "global_step": 204098, "epoch": 1686} {"train_loss": -41.77834701538086, "global_step": 204099, "epoch": 1686} {"train_loss": -42.6470947265625, "global_step": 204100, "epoch": 1686} {"train_loss": -41.867584228515625, "global_step": 204101, "epoch": 1686} {"train_loss": -41.89272689819336, "global_step": 204102, "epoch": 1686} {"train_loss": -41.185909271240234, "global_step": 204103, "epoch": 1686} {"train_loss": -42.044063568115234, "global_step": 204104, "epoch": 1686} {"train_loss": -41.18024444580078, "global_step": 204105, "epoch": 1686} {"train_loss": -42.08686447143555, "global_step": 204106, "epoch": 1686} {"train_loss": -42.281463623046875, "global_step": 204107, "epoch": 1686} {"train_loss": -41.33221435546875, "global_step": 204108, "epoch": 1686} {"train_loss": -40.75440216064453, "global_step": 204109, "epoch": 1686} {"train_loss": -41.733070373535156, "global_step": 204110, "epoch": 1686} {"train_loss": -41.055355072021484, "global_step": 204111, "epoch": 1686} {"train_loss": -41.777950286865234, "global_step": 204112, "epoch": 1686} {"train_loss": -41.20566940307617, "global_step": 204113, "epoch": 1686} {"train_loss": -41.951019287109375, "global_step": 204114, "epoch": 1686} {"train_loss": -42.1319580078125, "global_step": 204115, "epoch": 1686} {"train_loss": -42.14665985107422, "global_step": 204116, "epoch": 1686} {"train_loss": -41.608821868896484, "global_step": 204117, "epoch": 1686} {"train_loss": -41.24538040161133, "global_step": 204118, "epoch": 1686} {"train_loss": -41.5090446472168, "global_step": 204119, "epoch": 1686} {"train_loss": -41.290313720703125, "global_step": 204120, "epoch": 1686} {"train_loss": -40.43879318237305, "global_step": 204121, "epoch": 1686} {"train_loss": -38.4842414855957, "global_step": 204122, "epoch": 1686} {"train_loss": -39.548492431640625, "global_step": 204123, "epoch": 1686} {"train_loss": -40.615116119384766, "global_step": 204124, "epoch": 1686} {"train_loss": -41.27182388305664, "global_step": 204125, "epoch": 1686} {"train_loss": -41.28149117714118, "global_step": 204126, "epoch": 1686, "val_loss": 2648529.75} {"train_loss": -40.69050979614258, "global_step": 204127, "epoch": 1687} {"train_loss": -41.626365661621094, "global_step": 204128, "epoch": 1687} {"train_loss": -41.22038650512695, "global_step": 204129, "epoch": 1687} {"train_loss": -40.077659606933594, "global_step": 204130, "epoch": 1687} {"train_loss": -40.81425094604492, "global_step": 204131, "epoch": 1687} {"train_loss": -40.76505661010742, "global_step": 204132, "epoch": 1687} {"train_loss": -41.51301574707031, "global_step": 204133, "epoch": 1687} {"train_loss": -40.60346603393555, "global_step": 204134, "epoch": 1687} {"train_loss": -41.23293685913086, "global_step": 204135, "epoch": 1687} {"train_loss": -40.25880432128906, "global_step": 204136, "epoch": 1687} {"train_loss": -40.3944206237793, "global_step": 204137, "epoch": 1687} {"train_loss": -42.0179443359375, "global_step": 204138, "epoch": 1687} {"train_loss": -40.63125991821289, "global_step": 204139, "epoch": 1687} {"train_loss": -40.155513763427734, "global_step": 204140, "epoch": 1687} {"train_loss": -41.6336784362793, "global_step": 204141, "epoch": 1687} {"train_loss": -41.222198486328125, "global_step": 204142, "epoch": 1687} {"train_loss": -42.21602249145508, "global_step": 204143, "epoch": 1687} {"train_loss": -41.998451232910156, "global_step": 204144, "epoch": 1687} {"train_loss": -42.02396011352539, "global_step": 204145, "epoch": 1687} {"train_loss": -41.496761322021484, "global_step": 204146, "epoch": 1687} {"train_loss": -41.930259704589844, "global_step": 204147, "epoch": 1687} {"train_loss": -42.09934616088867, "global_step": 204148, "epoch": 1687} {"train_loss": -40.58309555053711, "global_step": 204149, "epoch": 1687} {"train_loss": -41.81903839111328, "global_step": 204150, "epoch": 1687} {"train_loss": -41.663963317871094, "global_step": 204151, "epoch": 1687} {"train_loss": -42.02480697631836, "global_step": 204152, "epoch": 1687} {"train_loss": -41.09711837768555, "global_step": 204153, "epoch": 1687} {"train_loss": -42.098731994628906, "global_step": 204154, "epoch": 1687} {"train_loss": -41.93232345581055, "global_step": 204155, "epoch": 1687} {"train_loss": -42.238826751708984, "global_step": 204156, "epoch": 1687} {"train_loss": -42.78944396972656, "global_step": 204157, "epoch": 1687} {"train_loss": -41.6767692565918, "global_step": 204158, "epoch": 1687} {"train_loss": -42.064144134521484, "global_step": 204159, "epoch": 1687} {"train_loss": -42.45942687988281, "global_step": 204160, "epoch": 1687} {"train_loss": -42.82897186279297, "global_step": 204161, "epoch": 1687} {"train_loss": -41.817806243896484, "global_step": 204162, "epoch": 1687} {"train_loss": -42.81777572631836, "global_step": 204163, "epoch": 1687} {"train_loss": -42.119850158691406, "global_step": 204164, "epoch": 1687} {"train_loss": -41.61900329589844, "global_step": 204165, "epoch": 1687} {"train_loss": -42.30019760131836, "global_step": 204166, "epoch": 1687} {"train_loss": -41.58049774169922, "global_step": 204167, "epoch": 1687} {"train_loss": -42.48141098022461, "global_step": 204168, "epoch": 1687} {"train_loss": -42.3727912902832, "global_step": 204169, "epoch": 1687} {"train_loss": -42.240234375, "global_step": 204170, "epoch": 1687} {"train_loss": -42.55305099487305, "global_step": 204171, "epoch": 1687} {"train_loss": -42.50350570678711, "global_step": 204172, "epoch": 1687} {"train_loss": -42.1633415222168, "global_step": 204173, "epoch": 1687} {"train_loss": -42.13119125366211, "global_step": 204174, "epoch": 1687} {"train_loss": -42.256412506103516, "global_step": 204175, "epoch": 1687} {"train_loss": -42.848751068115234, "global_step": 204176, "epoch": 1687} {"train_loss": -42.23666000366211, "global_step": 204177, "epoch": 1687} {"train_loss": -42.951934814453125, "global_step": 204178, "epoch": 1687} {"train_loss": -42.6862907409668, "global_step": 204179, "epoch": 1687} {"train_loss": -42.23700714111328, "global_step": 204180, "epoch": 1687} {"train_loss": -41.840511322021484, "global_step": 204181, "epoch": 1687} {"train_loss": -42.841609954833984, "global_step": 204182, "epoch": 1687} {"train_loss": -42.15425109863281, "global_step": 204183, "epoch": 1687} {"train_loss": -40.509185791015625, "global_step": 204184, "epoch": 1687} {"train_loss": -40.34479522705078, "global_step": 204185, "epoch": 1687} {"train_loss": -41.53981399536133, "global_step": 204186, "epoch": 1687} {"train_loss": -41.46284103393555, "global_step": 204187, "epoch": 1687} {"train_loss": -41.75254440307617, "global_step": 204188, "epoch": 1687} {"train_loss": -41.1008186340332, "global_step": 204189, "epoch": 1687} {"train_loss": -41.74867630004883, "global_step": 204190, "epoch": 1687} {"train_loss": -41.5852165222168, "global_step": 204191, "epoch": 1687} {"train_loss": -40.07577896118164, "global_step": 204192, "epoch": 1687} {"train_loss": -40.704471588134766, "global_step": 204193, "epoch": 1687} {"train_loss": -41.6334114074707, "global_step": 204194, "epoch": 1687} {"train_loss": -41.070281982421875, "global_step": 204195, "epoch": 1687} {"train_loss": -40.83759689331055, "global_step": 204196, "epoch": 1687} {"train_loss": -41.7109260559082, "global_step": 204197, "epoch": 1687} {"train_loss": -40.52634811401367, "global_step": 204198, "epoch": 1687} {"train_loss": -39.73832321166992, "global_step": 204199, "epoch": 1687} {"train_loss": -40.51581954956055, "global_step": 204200, "epoch": 1687} {"train_loss": -39.638607025146484, "global_step": 204201, "epoch": 1687} {"train_loss": -39.942970275878906, "global_step": 204202, "epoch": 1687} {"train_loss": -40.90123748779297, "global_step": 204203, "epoch": 1687} {"train_loss": -38.82442092895508, "global_step": 204204, "epoch": 1687} {"train_loss": -41.4320182800293, "global_step": 204205, "epoch": 1687} {"train_loss": -39.509803771972656, "global_step": 204206, "epoch": 1687} {"train_loss": -41.33209991455078, "global_step": 204207, "epoch": 1687} {"train_loss": -40.48786544799805, "global_step": 204208, "epoch": 1687} {"train_loss": -39.130577087402344, "global_step": 204209, "epoch": 1687} {"train_loss": -39.32988739013672, "global_step": 204210, "epoch": 1687} {"train_loss": -41.14236068725586, "global_step": 204211, "epoch": 1687} {"train_loss": -39.70556640625, "global_step": 204212, "epoch": 1687} {"train_loss": -41.45134353637695, "global_step": 204213, "epoch": 1687} {"train_loss": -39.193328857421875, "global_step": 204214, "epoch": 1687} {"train_loss": -40.37013626098633, "global_step": 204215, "epoch": 1687} {"train_loss": -38.96775436401367, "global_step": 204216, "epoch": 1687} {"train_loss": -40.09637451171875, "global_step": 204217, "epoch": 1687} {"train_loss": -40.96659469604492, "global_step": 204218, "epoch": 1687} {"train_loss": -40.18851852416992, "global_step": 204219, "epoch": 1687} {"train_loss": -40.264442443847656, "global_step": 204220, "epoch": 1687} {"train_loss": -40.628902435302734, "global_step": 204221, "epoch": 1687} {"train_loss": -40.21907043457031, "global_step": 204222, "epoch": 1687} {"train_loss": -41.813480377197266, "global_step": 204223, "epoch": 1687} {"train_loss": -39.44239044189453, "global_step": 204224, "epoch": 1687} {"train_loss": -41.7603645324707, "global_step": 204225, "epoch": 1687} {"train_loss": -40.98488235473633, "global_step": 204226, "epoch": 1687} {"train_loss": -39.76625442504883, "global_step": 204227, "epoch": 1687} {"train_loss": -41.63885498046875, "global_step": 204228, "epoch": 1687} {"train_loss": -41.33419418334961, "global_step": 204229, "epoch": 1687} {"train_loss": -40.85840606689453, "global_step": 204230, "epoch": 1687} {"train_loss": -42.07636642456055, "global_step": 204231, "epoch": 1687} {"train_loss": -40.214141845703125, "global_step": 204232, "epoch": 1687} {"train_loss": -41.18500518798828, "global_step": 204233, "epoch": 1687} {"train_loss": -41.89522171020508, "global_step": 204234, "epoch": 1687} {"train_loss": -41.635616302490234, "global_step": 204235, "epoch": 1687} {"train_loss": -41.09737014770508, "global_step": 204236, "epoch": 1687} {"train_loss": -41.34994125366211, "global_step": 204237, "epoch": 1687} {"train_loss": -42.56162643432617, "global_step": 204238, "epoch": 1687} {"train_loss": -41.12135696411133, "global_step": 204239, "epoch": 1687} {"train_loss": -42.308712005615234, "global_step": 204240, "epoch": 1687} {"train_loss": -41.8153190612793, "global_step": 204241, "epoch": 1687} {"train_loss": -42.35595703125, "global_step": 204242, "epoch": 1687} {"train_loss": -41.495582580566406, "global_step": 204243, "epoch": 1687} {"train_loss": -42.22370910644531, "global_step": 204244, "epoch": 1687} {"train_loss": -42.459293365478516, "global_step": 204245, "epoch": 1687} {"train_loss": -41.79074478149414, "global_step": 204246, "epoch": 1687} {"train_loss": -41.3264471637316, "global_step": 204247, "epoch": 1687, "val_loss": 2592495.75} {"train_loss": -42.614967346191406, "global_step": 204248, "epoch": 1688} {"train_loss": -42.363765716552734, "global_step": 204249, "epoch": 1688} {"train_loss": -42.44805908203125, "global_step": 204250, "epoch": 1688} {"train_loss": -42.33225631713867, "global_step": 204251, "epoch": 1688} {"train_loss": -42.16432571411133, "global_step": 204252, "epoch": 1688} {"train_loss": -42.94857406616211, "global_step": 204253, "epoch": 1688} {"train_loss": -42.362518310546875, "global_step": 204254, "epoch": 1688} {"train_loss": -42.2222900390625, "global_step": 204255, "epoch": 1688} {"train_loss": -42.623138427734375, "global_step": 204256, "epoch": 1688} {"train_loss": -42.87944412231445, "global_step": 204257, "epoch": 1688} {"train_loss": -42.60702133178711, "global_step": 204258, "epoch": 1688} {"train_loss": -42.596317291259766, "global_step": 204259, "epoch": 1688} {"train_loss": -42.364959716796875, "global_step": 204260, "epoch": 1688} {"train_loss": -42.649208068847656, "global_step": 204261, "epoch": 1688} {"train_loss": -42.216163635253906, "global_step": 204262, "epoch": 1688} {"train_loss": -43.09403610229492, "global_step": 204263, "epoch": 1688} {"train_loss": -42.3548583984375, "global_step": 204264, "epoch": 1688} {"train_loss": -41.758201599121094, "global_step": 204265, "epoch": 1688} {"train_loss": -42.67629623413086, "global_step": 204266, "epoch": 1688} {"train_loss": -42.59450912475586, "global_step": 204267, "epoch": 1688} {"train_loss": -42.534324645996094, "global_step": 204268, "epoch": 1688} {"train_loss": -42.91587829589844, "global_step": 204269, "epoch": 1688} {"train_loss": -43.23225021362305, "global_step": 204270, "epoch": 1688} {"train_loss": -42.321590423583984, "global_step": 204271, "epoch": 1688} {"train_loss": -42.614715576171875, "global_step": 204272, "epoch": 1688} {"train_loss": -42.6041145324707, "global_step": 204273, "epoch": 1688} {"train_loss": -43.4810905456543, "global_step": 204274, "epoch": 1688} {"train_loss": -42.52256393432617, "global_step": 204275, "epoch": 1688} {"train_loss": -42.76539993286133, "global_step": 204276, "epoch": 1688} {"train_loss": -42.010040283203125, "global_step": 204277, "epoch": 1688} {"train_loss": -43.12128448486328, "global_step": 204278, "epoch": 1688} {"train_loss": -43.02231216430664, "global_step": 204279, "epoch": 1688} {"train_loss": -42.416255950927734, "global_step": 204280, "epoch": 1688} {"train_loss": -42.44727325439453, "global_step": 204281, "epoch": 1688} {"train_loss": -43.029964447021484, "global_step": 204282, "epoch": 1688} {"train_loss": -42.1337890625, "global_step": 204283, "epoch": 1688} {"train_loss": -39.371368408203125, "global_step": 204284, "epoch": 1688} {"train_loss": -37.765499114990234, "global_step": 204285, "epoch": 1688} {"train_loss": -41.714900970458984, "global_step": 204286, "epoch": 1688} {"train_loss": -41.8153076171875, "global_step": 204287, "epoch": 1688} {"train_loss": -40.88350296020508, "global_step": 204288, "epoch": 1688} {"train_loss": -42.39912033081055, "global_step": 204289, "epoch": 1688} {"train_loss": -38.30390167236328, "global_step": 204290, "epoch": 1688} {"train_loss": -37.756954193115234, "global_step": 204291, "epoch": 1688} {"train_loss": -41.44126510620117, "global_step": 204292, "epoch": 1688} {"train_loss": -38.32598876953125, "global_step": 204293, "epoch": 1688} {"train_loss": -40.642791748046875, "global_step": 204294, "epoch": 1688} {"train_loss": -40.32985305786133, "global_step": 204295, "epoch": 1688} {"train_loss": -39.83879470825195, "global_step": 204296, "epoch": 1688} {"train_loss": -41.89043426513672, "global_step": 204297, "epoch": 1688} {"train_loss": -40.63350296020508, "global_step": 204298, "epoch": 1688} {"train_loss": -39.31957244873047, "global_step": 204299, "epoch": 1688} {"train_loss": -42.800636291503906, "global_step": 204300, "epoch": 1688} {"train_loss": -39.16439437866211, "global_step": 204301, "epoch": 1688} {"train_loss": -41.21370315551758, "global_step": 204302, "epoch": 1688} {"train_loss": -41.294151306152344, "global_step": 204303, "epoch": 1688} {"train_loss": -40.9430046081543, "global_step": 204304, "epoch": 1688} {"train_loss": -41.53827667236328, "global_step": 204305, "epoch": 1688} {"train_loss": -40.5153923034668, "global_step": 204306, "epoch": 1688} {"train_loss": -41.01996994018555, "global_step": 204307, "epoch": 1688} {"train_loss": -42.24403381347656, "global_step": 204308, "epoch": 1688} {"train_loss": -41.02780532836914, "global_step": 204309, "epoch": 1688} {"train_loss": -41.43581008911133, "global_step": 204310, "epoch": 1688} {"train_loss": -41.45570755004883, "global_step": 204311, "epoch": 1688} {"train_loss": -41.916988372802734, "global_step": 204312, "epoch": 1688} {"train_loss": -41.23405838012695, "global_step": 204313, "epoch": 1688} {"train_loss": -41.85740280151367, "global_step": 204314, "epoch": 1688} {"train_loss": -42.110294342041016, "global_step": 204315, "epoch": 1688} {"train_loss": -41.5078010559082, "global_step": 204316, "epoch": 1688} {"train_loss": -41.98688507080078, "global_step": 204317, "epoch": 1688} {"train_loss": -41.62691879272461, "global_step": 204318, "epoch": 1688} {"train_loss": -42.19796371459961, "global_step": 204319, "epoch": 1688} {"train_loss": -42.371498107910156, "global_step": 204320, "epoch": 1688} {"train_loss": -42.075740814208984, "global_step": 204321, "epoch": 1688} {"train_loss": -41.943092346191406, "global_step": 204322, "epoch": 1688} {"train_loss": -42.094337463378906, "global_step": 204323, "epoch": 1688} {"train_loss": -42.227169036865234, "global_step": 204324, "epoch": 1688} {"train_loss": -42.61940383911133, "global_step": 204325, "epoch": 1688} {"train_loss": -41.34363555908203, "global_step": 204326, "epoch": 1688} {"train_loss": -41.624427795410156, "global_step": 204327, "epoch": 1688} {"train_loss": -41.539485931396484, "global_step": 204328, "epoch": 1688} {"train_loss": -42.23059844970703, "global_step": 204329, "epoch": 1688} {"train_loss": -40.65220642089844, "global_step": 204330, "epoch": 1688} {"train_loss": -40.930458068847656, "global_step": 204331, "epoch": 1688} {"train_loss": -41.57032012939453, "global_step": 204332, "epoch": 1688} {"train_loss": -40.668251037597656, "global_step": 204333, "epoch": 1688} {"train_loss": -40.123653411865234, "global_step": 204334, "epoch": 1688} {"train_loss": -41.299259185791016, "global_step": 204335, "epoch": 1688} {"train_loss": -40.60730743408203, "global_step": 204336, "epoch": 1688} {"train_loss": -39.986202239990234, "global_step": 204337, "epoch": 1688} {"train_loss": -41.72665023803711, "global_step": 204338, "epoch": 1688} {"train_loss": -40.83303451538086, "global_step": 204339, "epoch": 1688} {"train_loss": -40.613990783691406, "global_step": 204340, "epoch": 1688} {"train_loss": -42.3143424987793, "global_step": 204341, "epoch": 1688} {"train_loss": -41.17341613769531, "global_step": 204342, "epoch": 1688} {"train_loss": -40.71531295776367, "global_step": 204343, "epoch": 1688} {"train_loss": -40.63966751098633, "global_step": 204344, "epoch": 1688} {"train_loss": -41.35603332519531, "global_step": 204345, "epoch": 1688} {"train_loss": -40.74473190307617, "global_step": 204346, "epoch": 1688} {"train_loss": -40.92267990112305, "global_step": 204347, "epoch": 1688} {"train_loss": -41.218292236328125, "global_step": 204348, "epoch": 1688} {"train_loss": -38.23582077026367, "global_step": 204349, "epoch": 1688} {"train_loss": -39.33421325683594, "global_step": 204350, "epoch": 1688} {"train_loss": -40.93092727661133, "global_step": 204351, "epoch": 1688} {"train_loss": -41.5664176940918, "global_step": 204352, "epoch": 1688} {"train_loss": -39.08713912963867, "global_step": 204353, "epoch": 1688} {"train_loss": -41.35475540161133, "global_step": 204354, "epoch": 1688} {"train_loss": -40.77236557006836, "global_step": 204355, "epoch": 1688} {"train_loss": -40.7623405456543, "global_step": 204356, "epoch": 1688} {"train_loss": -41.419349670410156, "global_step": 204357, "epoch": 1688} {"train_loss": -40.68946075439453, "global_step": 204358, "epoch": 1688} {"train_loss": -41.12705612182617, "global_step": 204359, "epoch": 1688} {"train_loss": -42.10821533203125, "global_step": 204360, "epoch": 1688} {"train_loss": -42.19260787963867, "global_step": 204361, "epoch": 1688} {"train_loss": -42.25257110595703, "global_step": 204362, "epoch": 1688} {"train_loss": -42.41100311279297, "global_step": 204363, "epoch": 1688} {"train_loss": -42.28898239135742, "global_step": 204364, "epoch": 1688} {"train_loss": -42.19782638549805, "global_step": 204365, "epoch": 1688} {"train_loss": -41.947303771972656, "global_step": 204366, "epoch": 1688} {"train_loss": -42.20936965942383, "global_step": 204367, "epoch": 1688} {"train_loss": -41.549350297155456, "global_step": 204368, "epoch": 1688, "val_loss": 2582934.75} {"train_loss": -42.761451721191406, "global_step": 204369, "epoch": 1689} {"train_loss": -42.04303741455078, "global_step": 204370, "epoch": 1689} {"train_loss": -42.200782775878906, "global_step": 204371, "epoch": 1689} {"train_loss": -42.48200607299805, "global_step": 204372, "epoch": 1689} {"train_loss": -42.60230255126953, "global_step": 204373, "epoch": 1689} {"train_loss": -42.696266174316406, "global_step": 204374, "epoch": 1689} {"train_loss": -42.53803253173828, "global_step": 204375, "epoch": 1689} {"train_loss": -42.719215393066406, "global_step": 204376, "epoch": 1689} {"train_loss": -42.52077865600586, "global_step": 204377, "epoch": 1689} {"train_loss": -42.63944625854492, "global_step": 204378, "epoch": 1689} {"train_loss": -42.17464065551758, "global_step": 204379, "epoch": 1689} {"train_loss": -42.66153335571289, "global_step": 204380, "epoch": 1689} {"train_loss": -42.17754364013672, "global_step": 204381, "epoch": 1689} {"train_loss": -41.88279342651367, "global_step": 204382, "epoch": 1689} {"train_loss": -43.13658905029297, "global_step": 204383, "epoch": 1689} {"train_loss": -42.057281494140625, "global_step": 204384, "epoch": 1689} {"train_loss": -41.17470169067383, "global_step": 204385, "epoch": 1689} {"train_loss": -40.99958038330078, "global_step": 204386, "epoch": 1689} {"train_loss": -41.29521179199219, "global_step": 204387, "epoch": 1689} {"train_loss": -42.645687103271484, "global_step": 204388, "epoch": 1689} {"train_loss": -40.58469772338867, "global_step": 204389, "epoch": 1689} {"train_loss": -40.92392349243164, "global_step": 204390, "epoch": 1689} {"train_loss": -41.66314697265625, "global_step": 204391, "epoch": 1689} {"train_loss": -42.08039855957031, "global_step": 204392, "epoch": 1689} {"train_loss": -40.63461685180664, "global_step": 204393, "epoch": 1689} {"train_loss": -39.35430908203125, "global_step": 204394, "epoch": 1689} {"train_loss": -41.306453704833984, "global_step": 204395, "epoch": 1689} {"train_loss": -42.107093811035156, "global_step": 204396, "epoch": 1689} {"train_loss": -42.15654373168945, "global_step": 204397, "epoch": 1689} {"train_loss": -41.07173538208008, "global_step": 204398, "epoch": 1689} {"train_loss": -40.89734649658203, "global_step": 204399, "epoch": 1689} {"train_loss": -41.81221389770508, "global_step": 204400, "epoch": 1689} {"train_loss": -42.449493408203125, "global_step": 204401, "epoch": 1689} {"train_loss": -41.64167404174805, "global_step": 204402, "epoch": 1689} {"train_loss": -41.69435501098633, "global_step": 204403, "epoch": 1689} {"train_loss": -40.747798919677734, "global_step": 204404, "epoch": 1689} {"train_loss": -41.96306610107422, "global_step": 204405, "epoch": 1689} {"train_loss": -41.58935546875, "global_step": 204406, "epoch": 1689} {"train_loss": -40.84222412109375, "global_step": 204407, "epoch": 1689} {"train_loss": -42.09735107421875, "global_step": 204408, "epoch": 1689} {"train_loss": -41.57949447631836, "global_step": 204409, "epoch": 1689} {"train_loss": -41.0198974609375, "global_step": 204410, "epoch": 1689} {"train_loss": -42.034908294677734, "global_step": 204411, "epoch": 1689} {"train_loss": -41.774837493896484, "global_step": 204412, "epoch": 1689} {"train_loss": -40.91215896606445, "global_step": 204413, "epoch": 1689} {"train_loss": -41.5986442565918, "global_step": 204414, "epoch": 1689} {"train_loss": -42.36083984375, "global_step": 204415, "epoch": 1689} {"train_loss": -42.21482849121094, "global_step": 204416, "epoch": 1689} {"train_loss": -41.5616455078125, "global_step": 204417, "epoch": 1689} {"train_loss": -41.74078369140625, "global_step": 204418, "epoch": 1689} {"train_loss": -42.07892990112305, "global_step": 204419, "epoch": 1689} {"train_loss": -41.701942443847656, "global_step": 204420, "epoch": 1689} {"train_loss": -42.49699020385742, "global_step": 204421, "epoch": 1689} {"train_loss": -41.06843185424805, "global_step": 204422, "epoch": 1689} {"train_loss": -42.23819351196289, "global_step": 204423, "epoch": 1689} {"train_loss": -41.970577239990234, "global_step": 204424, "epoch": 1689} {"train_loss": -41.407928466796875, "global_step": 204425, "epoch": 1689} {"train_loss": -41.62578582763672, "global_step": 204426, "epoch": 1689} {"train_loss": -42.243892669677734, "global_step": 204427, "epoch": 1689} {"train_loss": -41.80485534667969, "global_step": 204428, "epoch": 1689} {"train_loss": -42.142818450927734, "global_step": 204429, "epoch": 1689} {"train_loss": -42.21558380126953, "global_step": 204430, "epoch": 1689} {"train_loss": -40.8812370300293, "global_step": 204431, "epoch": 1689} {"train_loss": -41.9642333984375, "global_step": 204432, "epoch": 1689} {"train_loss": -41.045772552490234, "global_step": 204433, "epoch": 1689} {"train_loss": -42.349220275878906, "global_step": 204434, "epoch": 1689} {"train_loss": -41.26569747924805, "global_step": 204435, "epoch": 1689} {"train_loss": -40.61273956298828, "global_step": 204436, "epoch": 1689} {"train_loss": -40.3943977355957, "global_step": 204437, "epoch": 1689} {"train_loss": -41.21753692626953, "global_step": 204438, "epoch": 1689} {"train_loss": -42.662696838378906, "global_step": 204439, "epoch": 1689} {"train_loss": -41.3093376159668, "global_step": 204440, "epoch": 1689} {"train_loss": -41.114280700683594, "global_step": 204441, "epoch": 1689} {"train_loss": -42.37132263183594, "global_step": 204442, "epoch": 1689} {"train_loss": -41.57818603515625, "global_step": 204443, "epoch": 1689} {"train_loss": -40.56782150268555, "global_step": 204444, "epoch": 1689} {"train_loss": -42.30780029296875, "global_step": 204445, "epoch": 1689} {"train_loss": -42.019508361816406, "global_step": 204446, "epoch": 1689} {"train_loss": -41.385498046875, "global_step": 204447, "epoch": 1689} {"train_loss": -42.03886795043945, "global_step": 204448, "epoch": 1689} {"train_loss": -42.238067626953125, "global_step": 204449, "epoch": 1689} {"train_loss": -42.3869514465332, "global_step": 204450, "epoch": 1689} {"train_loss": -41.81753921508789, "global_step": 204451, "epoch": 1689} {"train_loss": -42.5686149597168, "global_step": 204452, "epoch": 1689} {"train_loss": -40.353370666503906, "global_step": 204453, "epoch": 1689} {"train_loss": -41.27900314331055, "global_step": 204454, "epoch": 1689} {"train_loss": -42.134239196777344, "global_step": 204455, "epoch": 1689} {"train_loss": -41.28410720825195, "global_step": 204456, "epoch": 1689} {"train_loss": -41.75761032104492, "global_step": 204457, "epoch": 1689} {"train_loss": -41.71272659301758, "global_step": 204458, "epoch": 1689} {"train_loss": -42.23591613769531, "global_step": 204459, "epoch": 1689} {"train_loss": -41.6673469543457, "global_step": 204460, "epoch": 1689} {"train_loss": -41.9393424987793, "global_step": 204461, "epoch": 1689} {"train_loss": -41.6798210144043, "global_step": 204462, "epoch": 1689} {"train_loss": -41.80141830444336, "global_step": 204463, "epoch": 1689} {"train_loss": -40.44473648071289, "global_step": 204464, "epoch": 1689} {"train_loss": -42.778133392333984, "global_step": 204465, "epoch": 1689} {"train_loss": -41.19283676147461, "global_step": 204466, "epoch": 1689} {"train_loss": -41.12762451171875, "global_step": 204467, "epoch": 1689} {"train_loss": -43.21366500854492, "global_step": 204468, "epoch": 1689} {"train_loss": -41.81058883666992, "global_step": 204469, "epoch": 1689} {"train_loss": -42.59772491455078, "global_step": 204470, "epoch": 1689} {"train_loss": -42.70621871948242, "global_step": 204471, "epoch": 1689} {"train_loss": -42.01624298095703, "global_step": 204472, "epoch": 1689} {"train_loss": -42.78432846069336, "global_step": 204473, "epoch": 1689} {"train_loss": -42.641883850097656, "global_step": 204474, "epoch": 1689} {"train_loss": -42.66725158691406, "global_step": 204475, "epoch": 1689} {"train_loss": -42.92133712768555, "global_step": 204476, "epoch": 1689} {"train_loss": -42.48490524291992, "global_step": 204477, "epoch": 1689} {"train_loss": -42.649471282958984, "global_step": 204478, "epoch": 1689} {"train_loss": -42.39000701904297, "global_step": 204479, "epoch": 1689} {"train_loss": -42.89773178100586, "global_step": 204480, "epoch": 1689} {"train_loss": -43.10274124145508, "global_step": 204481, "epoch": 1689} {"train_loss": -41.779510498046875, "global_step": 204482, "epoch": 1689} {"train_loss": -41.7389030456543, "global_step": 204483, "epoch": 1689} {"train_loss": -42.91151809692383, "global_step": 204484, "epoch": 1689} {"train_loss": -41.262550354003906, "global_step": 204485, "epoch": 1689} {"train_loss": -40.78481674194336, "global_step": 204486, "epoch": 1689} {"train_loss": -42.3675651550293, "global_step": 204487, "epoch": 1689} {"train_loss": -42.89668273925781, "global_step": 204488, "epoch": 1689} {"train_loss": -41.859846383086904, "global_step": 204489, "epoch": 1689, "val_loss": 2606111.75} {"train_loss": -41.09572982788086, "global_step": 204490, "epoch": 1690} {"train_loss": -42.202606201171875, "global_step": 204491, "epoch": 1690} {"train_loss": -42.66909408569336, "global_step": 204492, "epoch": 1690} {"train_loss": -42.5986213684082, "global_step": 204493, "epoch": 1690} {"train_loss": -41.4336051940918, "global_step": 204494, "epoch": 1690} {"train_loss": -41.312774658203125, "global_step": 204495, "epoch": 1690} {"train_loss": -41.794227600097656, "global_step": 204496, "epoch": 1690} {"train_loss": -42.64666748046875, "global_step": 204497, "epoch": 1690} {"train_loss": -42.435665130615234, "global_step": 204498, "epoch": 1690} {"train_loss": -42.42357635498047, "global_step": 204499, "epoch": 1690} {"train_loss": -42.36479187011719, "global_step": 204500, "epoch": 1690} {"train_loss": -43.19060134887695, "global_step": 204501, "epoch": 1690} {"train_loss": -42.67206954956055, "global_step": 204502, "epoch": 1690} {"train_loss": -42.486724853515625, "global_step": 204503, "epoch": 1690} {"train_loss": -42.4648323059082, "global_step": 204504, "epoch": 1690} {"train_loss": -42.491878509521484, "global_step": 204505, "epoch": 1690} {"train_loss": -42.85905075073242, "global_step": 204506, "epoch": 1690} {"train_loss": -42.6568603515625, "global_step": 204507, "epoch": 1690} {"train_loss": -42.58760070800781, "global_step": 204508, "epoch": 1690} {"train_loss": -41.929744720458984, "global_step": 204509, "epoch": 1690} {"train_loss": -42.61361312866211, "global_step": 204510, "epoch": 1690} {"train_loss": -42.68544006347656, "global_step": 204511, "epoch": 1690} {"train_loss": -43.00471115112305, "global_step": 204512, "epoch": 1690} {"train_loss": -42.45320510864258, "global_step": 204513, "epoch": 1690} {"train_loss": -41.91602325439453, "global_step": 204514, "epoch": 1690} {"train_loss": -42.654537200927734, "global_step": 204515, "epoch": 1690} {"train_loss": -41.97488784790039, "global_step": 204516, "epoch": 1690} {"train_loss": -41.62347412109375, "global_step": 204517, "epoch": 1690} {"train_loss": -42.31918716430664, "global_step": 204518, "epoch": 1690} {"train_loss": -42.72248458862305, "global_step": 204519, "epoch": 1690} {"train_loss": -41.1825065612793, "global_step": 204520, "epoch": 1690} {"train_loss": -40.65478515625, "global_step": 204521, "epoch": 1690} {"train_loss": -42.60029220581055, "global_step": 204522, "epoch": 1690} {"train_loss": -42.041175842285156, "global_step": 204523, "epoch": 1690} {"train_loss": -41.88127517700195, "global_step": 204524, "epoch": 1690} {"train_loss": -40.54795455932617, "global_step": 204525, "epoch": 1690} {"train_loss": -41.53566360473633, "global_step": 204526, "epoch": 1690} {"train_loss": -42.64870834350586, "global_step": 204527, "epoch": 1690} {"train_loss": -41.181541442871094, "global_step": 204528, "epoch": 1690} {"train_loss": -41.00565719604492, "global_step": 204529, "epoch": 1690} {"train_loss": -41.46332931518555, "global_step": 204530, "epoch": 1690} {"train_loss": -41.255615234375, "global_step": 204531, "epoch": 1690} {"train_loss": -41.3917350769043, "global_step": 204532, "epoch": 1690} {"train_loss": -40.79130554199219, "global_step": 204533, "epoch": 1690} {"train_loss": -41.51361846923828, "global_step": 204534, "epoch": 1690} {"train_loss": -40.84760665893555, "global_step": 204535, "epoch": 1690} {"train_loss": -42.03300857543945, "global_step": 204536, "epoch": 1690} {"train_loss": -41.545711517333984, "global_step": 204537, "epoch": 1690} {"train_loss": -41.24415969848633, "global_step": 204538, "epoch": 1690} {"train_loss": -40.55141067504883, "global_step": 204539, "epoch": 1690} {"train_loss": -40.47664260864258, "global_step": 204540, "epoch": 1690} {"train_loss": -42.59421920776367, "global_step": 204541, "epoch": 1690} {"train_loss": -41.26396179199219, "global_step": 204542, "epoch": 1690} {"train_loss": -41.506561279296875, "global_step": 204543, "epoch": 1690} {"train_loss": -41.663997650146484, "global_step": 204544, "epoch": 1690} {"train_loss": -41.828975677490234, "global_step": 204545, "epoch": 1690} {"train_loss": -41.4481315612793, "global_step": 204546, "epoch": 1690} {"train_loss": -41.70037841796875, "global_step": 204547, "epoch": 1690} {"train_loss": -40.925804138183594, "global_step": 204548, "epoch": 1690} {"train_loss": -41.28396224975586, "global_step": 204549, "epoch": 1690} {"train_loss": -41.319602966308594, "global_step": 204550, "epoch": 1690} {"train_loss": -40.3646240234375, "global_step": 204551, "epoch": 1690} {"train_loss": -41.38381576538086, "global_step": 204552, "epoch": 1690} {"train_loss": -41.91438674926758, "global_step": 204553, "epoch": 1690} {"train_loss": -41.172786712646484, "global_step": 204554, "epoch": 1690} {"train_loss": -40.24971389770508, "global_step": 204555, "epoch": 1690} {"train_loss": -40.2413444519043, "global_step": 204556, "epoch": 1690} {"train_loss": -42.14281463623047, "global_step": 204557, "epoch": 1690} {"train_loss": -41.13878631591797, "global_step": 204558, "epoch": 1690} {"train_loss": -39.77669143676758, "global_step": 204559, "epoch": 1690} {"train_loss": -42.39789581298828, "global_step": 204560, "epoch": 1690} {"train_loss": -40.680641174316406, "global_step": 204561, "epoch": 1690} {"train_loss": -41.89719009399414, "global_step": 204562, "epoch": 1690} {"train_loss": -41.499141693115234, "global_step": 204563, "epoch": 1690} {"train_loss": -41.44413375854492, "global_step": 204564, "epoch": 1690} {"train_loss": -42.31527328491211, "global_step": 204565, "epoch": 1690} {"train_loss": -41.892555236816406, "global_step": 204566, "epoch": 1690} {"train_loss": -41.232215881347656, "global_step": 204567, "epoch": 1690} {"train_loss": -42.47291946411133, "global_step": 204568, "epoch": 1690} {"train_loss": -42.28860092163086, "global_step": 204569, "epoch": 1690} {"train_loss": -40.54072189331055, "global_step": 204570, "epoch": 1690} {"train_loss": -41.1861457824707, "global_step": 204571, "epoch": 1690} {"train_loss": -41.839111328125, "global_step": 204572, "epoch": 1690} {"train_loss": -41.84424591064453, "global_step": 204573, "epoch": 1690} {"train_loss": -40.98345947265625, "global_step": 204574, "epoch": 1690} {"train_loss": -40.77309799194336, "global_step": 204575, "epoch": 1690} {"train_loss": -41.67891311645508, "global_step": 204576, "epoch": 1690} {"train_loss": -41.63252639770508, "global_step": 204577, "epoch": 1690} {"train_loss": -39.44309997558594, "global_step": 204578, "epoch": 1690} {"train_loss": -39.379940032958984, "global_step": 204579, "epoch": 1690} {"train_loss": -41.969234466552734, "global_step": 204580, "epoch": 1690} {"train_loss": -42.410133361816406, "global_step": 204581, "epoch": 1690} {"train_loss": -40.331024169921875, "global_step": 204582, "epoch": 1690} {"train_loss": -39.43593215942383, "global_step": 204583, "epoch": 1690} {"train_loss": -42.522762298583984, "global_step": 204584, "epoch": 1690} {"train_loss": -39.792213439941406, "global_step": 204585, "epoch": 1690} {"train_loss": -39.545772552490234, "global_step": 204586, "epoch": 1690} {"train_loss": -41.165771484375, "global_step": 204587, "epoch": 1690} {"train_loss": -39.077789306640625, "global_step": 204588, "epoch": 1690} {"train_loss": -38.92567825317383, "global_step": 204589, "epoch": 1690} {"train_loss": -42.146846771240234, "global_step": 204590, "epoch": 1690} {"train_loss": -38.00258255004883, "global_step": 204591, "epoch": 1690} {"train_loss": -41.79927444458008, "global_step": 204592, "epoch": 1690} {"train_loss": -37.65519332885742, "global_step": 204593, "epoch": 1690} {"train_loss": -41.9136848449707, "global_step": 204594, "epoch": 1690} {"train_loss": -39.25056838989258, "global_step": 204595, "epoch": 1690} {"train_loss": -40.49713134765625, "global_step": 204596, "epoch": 1690} {"train_loss": -41.34888458251953, "global_step": 204597, "epoch": 1690} {"train_loss": -39.29655075073242, "global_step": 204598, "epoch": 1690} {"train_loss": -41.561824798583984, "global_step": 204599, "epoch": 1690} {"train_loss": -39.916316986083984, "global_step": 204600, "epoch": 1690} {"train_loss": -41.18568801879883, "global_step": 204601, "epoch": 1690} {"train_loss": -39.39292526245117, "global_step": 204602, "epoch": 1690} {"train_loss": -40.29643249511719, "global_step": 204603, "epoch": 1690} {"train_loss": -42.32758712768555, "global_step": 204604, "epoch": 1690} {"train_loss": -40.180206298828125, "global_step": 204605, "epoch": 1690} {"train_loss": -41.614376068115234, "global_step": 204606, "epoch": 1690} {"train_loss": -40.642391204833984, "global_step": 204607, "epoch": 1690} {"train_loss": -40.0536003112793, "global_step": 204608, "epoch": 1690} {"train_loss": -41.54299545288086, "global_step": 204609, "epoch": 1690} {"train_loss": -41.377316120242284, "global_step": 204610, "epoch": 1690, "val_loss": 2645616.0} {"train_loss": -40.85788345336914, "global_step": 204611, "epoch": 1691} {"train_loss": -40.826107025146484, "global_step": 204612, "epoch": 1691} {"train_loss": -42.212554931640625, "global_step": 204613, "epoch": 1691} {"train_loss": -41.37091064453125, "global_step": 204614, "epoch": 1691} {"train_loss": -41.25944137573242, "global_step": 204615, "epoch": 1691} {"train_loss": -41.38848114013672, "global_step": 204616, "epoch": 1691} {"train_loss": -41.243324279785156, "global_step": 204617, "epoch": 1691} {"train_loss": -41.998714447021484, "global_step": 204618, "epoch": 1691} {"train_loss": -41.78351593017578, "global_step": 204619, "epoch": 1691} {"train_loss": -41.88604736328125, "global_step": 204620, "epoch": 1691} {"train_loss": -42.5948486328125, "global_step": 204621, "epoch": 1691} {"train_loss": -42.25703430175781, "global_step": 204622, "epoch": 1691} {"train_loss": -42.110877990722656, "global_step": 204623, "epoch": 1691} {"train_loss": -42.38418197631836, "global_step": 204624, "epoch": 1691} {"train_loss": -42.1439094543457, "global_step": 204625, "epoch": 1691} {"train_loss": -42.33658981323242, "global_step": 204626, "epoch": 1691} {"train_loss": -42.929931640625, "global_step": 204627, "epoch": 1691} {"train_loss": -42.42238235473633, "global_step": 204628, "epoch": 1691} {"train_loss": -42.83480453491211, "global_step": 204629, "epoch": 1691} {"train_loss": -42.774566650390625, "global_step": 204630, "epoch": 1691} {"train_loss": -42.793025970458984, "global_step": 204631, "epoch": 1691} {"train_loss": -42.979793548583984, "global_step": 204632, "epoch": 1691} {"train_loss": -43.022552490234375, "global_step": 204633, "epoch": 1691} {"train_loss": -42.622745513916016, "global_step": 204634, "epoch": 1691} {"train_loss": -43.089229583740234, "global_step": 204635, "epoch": 1691} {"train_loss": -42.79313278198242, "global_step": 204636, "epoch": 1691} {"train_loss": -42.21500015258789, "global_step": 204637, "epoch": 1691} {"train_loss": -42.595157623291016, "global_step": 204638, "epoch": 1691} {"train_loss": -43.01646041870117, "global_step": 204639, "epoch": 1691} {"train_loss": -42.7986946105957, "global_step": 204640, "epoch": 1691} {"train_loss": -42.48329544067383, "global_step": 204641, "epoch": 1691} {"train_loss": -42.99001693725586, "global_step": 204642, "epoch": 1691} {"train_loss": -41.52167510986328, "global_step": 204643, "epoch": 1691} {"train_loss": -42.044551849365234, "global_step": 204644, "epoch": 1691} {"train_loss": -42.577308654785156, "global_step": 204645, "epoch": 1691} {"train_loss": -42.3499641418457, "global_step": 204646, "epoch": 1691} {"train_loss": -42.260955810546875, "global_step": 204647, "epoch": 1691} {"train_loss": -42.985347747802734, "global_step": 204648, "epoch": 1691} {"train_loss": -41.56592559814453, "global_step": 204649, "epoch": 1691} {"train_loss": -42.59878158569336, "global_step": 204650, "epoch": 1691} {"train_loss": -41.89933776855469, "global_step": 204651, "epoch": 1691} {"train_loss": -43.131561279296875, "global_step": 204652, "epoch": 1691} {"train_loss": -41.82627868652344, "global_step": 204653, "epoch": 1691} {"train_loss": -42.92778778076172, "global_step": 204654, "epoch": 1691} {"train_loss": -42.81782150268555, "global_step": 204655, "epoch": 1691} {"train_loss": -42.03436279296875, "global_step": 204656, "epoch": 1691} {"train_loss": -42.9610710144043, "global_step": 204657, "epoch": 1691} {"train_loss": -42.895660400390625, "global_step": 204658, "epoch": 1691} {"train_loss": -42.88042068481445, "global_step": 204659, "epoch": 1691} {"train_loss": -42.40743637084961, "global_step": 204660, "epoch": 1691} {"train_loss": -42.510860443115234, "global_step": 204661, "epoch": 1691} {"train_loss": -43.102230072021484, "global_step": 204662, "epoch": 1691} {"train_loss": -42.88339614868164, "global_step": 204663, "epoch": 1691} {"train_loss": -42.84025192260742, "global_step": 204664, "epoch": 1691} {"train_loss": -42.59784698486328, "global_step": 204665, "epoch": 1691} {"train_loss": -43.04008483886719, "global_step": 204666, "epoch": 1691} {"train_loss": -43.226375579833984, "global_step": 204667, "epoch": 1691} {"train_loss": -43.12334060668945, "global_step": 204668, "epoch": 1691} {"train_loss": -43.04151153564453, "global_step": 204669, "epoch": 1691} {"train_loss": -42.97900390625, "global_step": 204670, "epoch": 1691} {"train_loss": -43.18499755859375, "global_step": 204671, "epoch": 1691} {"train_loss": -43.0305061340332, "global_step": 204672, "epoch": 1691} {"train_loss": -42.93161392211914, "global_step": 204673, "epoch": 1691} {"train_loss": -43.091461181640625, "global_step": 204674, "epoch": 1691} {"train_loss": -42.852882385253906, "global_step": 204675, "epoch": 1691} {"train_loss": -43.4541130065918, "global_step": 204676, "epoch": 1691} {"train_loss": -42.42749786376953, "global_step": 204677, "epoch": 1691} {"train_loss": -43.33332061767578, "global_step": 204678, "epoch": 1691} {"train_loss": -43.22410202026367, "global_step": 204679, "epoch": 1691} {"train_loss": -43.141639709472656, "global_step": 204680, "epoch": 1691} {"train_loss": -43.59291076660156, "global_step": 204681, "epoch": 1691} {"train_loss": -42.09993362426758, "global_step": 204682, "epoch": 1691} {"train_loss": -42.23286819458008, "global_step": 204683, "epoch": 1691} {"train_loss": -42.649044036865234, "global_step": 204684, "epoch": 1691} {"train_loss": -43.03110885620117, "global_step": 204685, "epoch": 1691} {"train_loss": -42.960018157958984, "global_step": 204686, "epoch": 1691} {"train_loss": -42.474037170410156, "global_step": 204687, "epoch": 1691} {"train_loss": -42.113746643066406, "global_step": 204688, "epoch": 1691} {"train_loss": -41.82381820678711, "global_step": 204689, "epoch": 1691} {"train_loss": -41.9854621887207, "global_step": 204690, "epoch": 1691} {"train_loss": -42.623146057128906, "global_step": 204691, "epoch": 1691} {"train_loss": -43.02583694458008, "global_step": 204692, "epoch": 1691} {"train_loss": -42.512908935546875, "global_step": 204693, "epoch": 1691} {"train_loss": -41.285621643066406, "global_step": 204694, "epoch": 1691} {"train_loss": -40.87437057495117, "global_step": 204695, "epoch": 1691} {"train_loss": -41.99271774291992, "global_step": 204696, "epoch": 1691} {"train_loss": -41.31561279296875, "global_step": 204697, "epoch": 1691} {"train_loss": -41.03809356689453, "global_step": 204698, "epoch": 1691} {"train_loss": -41.12807083129883, "global_step": 204699, "epoch": 1691} {"train_loss": -41.277095794677734, "global_step": 204700, "epoch": 1691} {"train_loss": -42.43513870239258, "global_step": 204701, "epoch": 1691} {"train_loss": -42.258811950683594, "global_step": 204702, "epoch": 1691} {"train_loss": -42.50217819213867, "global_step": 204703, "epoch": 1691} {"train_loss": -40.13389587402344, "global_step": 204704, "epoch": 1691} {"train_loss": -40.6002082824707, "global_step": 204705, "epoch": 1691} {"train_loss": -42.56797409057617, "global_step": 204706, "epoch": 1691} {"train_loss": -41.876251220703125, "global_step": 204707, "epoch": 1691} {"train_loss": -40.70487594604492, "global_step": 204708, "epoch": 1691} {"train_loss": -42.51581573486328, "global_step": 204709, "epoch": 1691} {"train_loss": -41.96794509887695, "global_step": 204710, "epoch": 1691} {"train_loss": -39.1154670715332, "global_step": 204711, "epoch": 1691} {"train_loss": -40.71433639526367, "global_step": 204712, "epoch": 1691} {"train_loss": -42.35230255126953, "global_step": 204713, "epoch": 1691} {"train_loss": -39.995086669921875, "global_step": 204714, "epoch": 1691} {"train_loss": -37.469181060791016, "global_step": 204715, "epoch": 1691} {"train_loss": -41.73800277709961, "global_step": 204716, "epoch": 1691} {"train_loss": -34.0962028503418, "global_step": 204717, "epoch": 1691} {"train_loss": -37.288578033447266, "global_step": 204718, "epoch": 1691} {"train_loss": -38.20001220703125, "global_step": 204719, "epoch": 1691} {"train_loss": -38.274940490722656, "global_step": 204720, "epoch": 1691} {"train_loss": -38.83442306518555, "global_step": 204721, "epoch": 1691} {"train_loss": -40.41781234741211, "global_step": 204722, "epoch": 1691} {"train_loss": -38.255558013916016, "global_step": 204723, "epoch": 1691} {"train_loss": -39.15438461303711, "global_step": 204724, "epoch": 1691} {"train_loss": -37.737205505371094, "global_step": 204725, "epoch": 1691} {"train_loss": -37.14347457885742, "global_step": 204726, "epoch": 1691} {"train_loss": -41.607460021972656, "global_step": 204727, "epoch": 1691} {"train_loss": -37.85725021362305, "global_step": 204728, "epoch": 1691} {"train_loss": -40.670902252197266, "global_step": 204729, "epoch": 1691} {"train_loss": -38.545257568359375, "global_step": 204730, "epoch": 1691} {"train_loss": -41.79336024512929, "global_step": 204731, "epoch": 1691, "val_loss": 2628276.25} {"train_loss": -38.961036682128906, "global_step": 204732, "epoch": 1692} {"train_loss": -41.41439437866211, "global_step": 204733, "epoch": 1692} {"train_loss": -39.18644332885742, "global_step": 204734, "epoch": 1692} {"train_loss": -41.09092330932617, "global_step": 204735, "epoch": 1692} {"train_loss": -40.337520599365234, "global_step": 204736, "epoch": 1692} {"train_loss": -40.89105987548828, "global_step": 204737, "epoch": 1692} {"train_loss": -40.06614303588867, "global_step": 204738, "epoch": 1692} {"train_loss": -40.67835235595703, "global_step": 204739, "epoch": 1692} {"train_loss": -41.12925720214844, "global_step": 204740, "epoch": 1692} {"train_loss": -40.72924041748047, "global_step": 204741, "epoch": 1692} {"train_loss": -41.407073974609375, "global_step": 204742, "epoch": 1692} {"train_loss": -41.07673263549805, "global_step": 204743, "epoch": 1692} {"train_loss": -41.86083221435547, "global_step": 204744, "epoch": 1692} {"train_loss": -41.836490631103516, "global_step": 204745, "epoch": 1692} {"train_loss": -42.235225677490234, "global_step": 204746, "epoch": 1692} {"train_loss": -41.70099639892578, "global_step": 204747, "epoch": 1692} {"train_loss": -41.685394287109375, "global_step": 204748, "epoch": 1692} {"train_loss": -41.53886032104492, "global_step": 204749, "epoch": 1692} {"train_loss": -41.66986846923828, "global_step": 204750, "epoch": 1692} {"train_loss": -42.546531677246094, "global_step": 204751, "epoch": 1692} {"train_loss": -41.469215393066406, "global_step": 204752, "epoch": 1692} {"train_loss": -41.92363357543945, "global_step": 204753, "epoch": 1692} {"train_loss": -41.93162155151367, "global_step": 204754, "epoch": 1692} {"train_loss": -42.00997543334961, "global_step": 204755, "epoch": 1692} {"train_loss": -42.064483642578125, "global_step": 204756, "epoch": 1692} {"train_loss": -42.50593185424805, "global_step": 204757, "epoch": 1692} {"train_loss": -41.496253967285156, "global_step": 204758, "epoch": 1692} {"train_loss": -42.64341354370117, "global_step": 204759, "epoch": 1692} {"train_loss": -42.03583526611328, "global_step": 204760, "epoch": 1692} {"train_loss": -42.2524528503418, "global_step": 204761, "epoch": 1692} {"train_loss": -42.0682373046875, "global_step": 204762, "epoch": 1692} {"train_loss": -42.27865219116211, "global_step": 204763, "epoch": 1692} {"train_loss": -42.358436584472656, "global_step": 204764, "epoch": 1692} {"train_loss": -42.54379653930664, "global_step": 204765, "epoch": 1692} {"train_loss": -42.39991760253906, "global_step": 204766, "epoch": 1692} {"train_loss": -41.399169921875, "global_step": 204767, "epoch": 1692} {"train_loss": -42.53711700439453, "global_step": 204768, "epoch": 1692} {"train_loss": -42.68458938598633, "global_step": 204769, "epoch": 1692} {"train_loss": -41.42435836791992, "global_step": 204770, "epoch": 1692} {"train_loss": -42.071319580078125, "global_step": 204771, "epoch": 1692} {"train_loss": -42.32792282104492, "global_step": 204772, "epoch": 1692} {"train_loss": -42.203426361083984, "global_step": 204773, "epoch": 1692} {"train_loss": -42.32851791381836, "global_step": 204774, "epoch": 1692} {"train_loss": -42.365516662597656, "global_step": 204775, "epoch": 1692} {"train_loss": -41.75880813598633, "global_step": 204776, "epoch": 1692} {"train_loss": -42.94988250732422, "global_step": 204777, "epoch": 1692} {"train_loss": -42.046722412109375, "global_step": 204778, "epoch": 1692} {"train_loss": -42.44102478027344, "global_step": 204779, "epoch": 1692} {"train_loss": -42.30918502807617, "global_step": 204780, "epoch": 1692} {"train_loss": -42.25830078125, "global_step": 204781, "epoch": 1692} {"train_loss": -41.92942810058594, "global_step": 204782, "epoch": 1692} {"train_loss": -42.282344818115234, "global_step": 204783, "epoch": 1692} {"train_loss": -42.95244216918945, "global_step": 204784, "epoch": 1692} {"train_loss": -42.392913818359375, "global_step": 204785, "epoch": 1692} {"train_loss": -42.4345703125, "global_step": 204786, "epoch": 1692} {"train_loss": -41.940059661865234, "global_step": 204787, "epoch": 1692} {"train_loss": -42.11272430419922, "global_step": 204788, "epoch": 1692} {"train_loss": -42.48150634765625, "global_step": 204789, "epoch": 1692} {"train_loss": -42.29081344604492, "global_step": 204790, "epoch": 1692} {"train_loss": -42.06240463256836, "global_step": 204791, "epoch": 1692} {"train_loss": -41.908546447753906, "global_step": 204792, "epoch": 1692} {"train_loss": -42.3795051574707, "global_step": 204793, "epoch": 1692} {"train_loss": -41.9332160949707, "global_step": 204794, "epoch": 1692} {"train_loss": -39.8647346496582, "global_step": 204795, "epoch": 1692} {"train_loss": -41.10148239135742, "global_step": 204796, "epoch": 1692} {"train_loss": -41.905460357666016, "global_step": 204797, "epoch": 1692} {"train_loss": -42.786781311035156, "global_step": 204798, "epoch": 1692} {"train_loss": -41.39760971069336, "global_step": 204799, "epoch": 1692} {"train_loss": -39.437477111816406, "global_step": 204800, "epoch": 1692} {"train_loss": -38.4503173828125, "global_step": 204801, "epoch": 1692} {"train_loss": -41.62667465209961, "global_step": 204802, "epoch": 1692} {"train_loss": -38.31508255004883, "global_step": 204803, "epoch": 1692} {"train_loss": -37.013301849365234, "global_step": 204804, "epoch": 1692} {"train_loss": -42.41951370239258, "global_step": 204805, "epoch": 1692} {"train_loss": -37.511146545410156, "global_step": 204806, "epoch": 1692} {"train_loss": -40.9123649597168, "global_step": 204807, "epoch": 1692} {"train_loss": -41.3561897277832, "global_step": 204808, "epoch": 1692} {"train_loss": -40.90916442871094, "global_step": 204809, "epoch": 1692} {"train_loss": -39.64043045043945, "global_step": 204810, "epoch": 1692} {"train_loss": -40.42768096923828, "global_step": 204811, "epoch": 1692} {"train_loss": -41.89045333862305, "global_step": 204812, "epoch": 1692} {"train_loss": -41.353939056396484, "global_step": 204813, "epoch": 1692} {"train_loss": -41.16917419433594, "global_step": 204814, "epoch": 1692} {"train_loss": -41.93547439575195, "global_step": 204815, "epoch": 1692} {"train_loss": -40.62006759643555, "global_step": 204816, "epoch": 1692} {"train_loss": -42.23731231689453, "global_step": 204817, "epoch": 1692} {"train_loss": -40.46149826049805, "global_step": 204818, "epoch": 1692} {"train_loss": -40.33787536621094, "global_step": 204819, "epoch": 1692} {"train_loss": -41.05723190307617, "global_step": 204820, "epoch": 1692} {"train_loss": -40.65327072143555, "global_step": 204821, "epoch": 1692} {"train_loss": -41.40348815917969, "global_step": 204822, "epoch": 1692} {"train_loss": -40.690521240234375, "global_step": 204823, "epoch": 1692} {"train_loss": -41.34922790527344, "global_step": 204824, "epoch": 1692} {"train_loss": -41.5700798034668, "global_step": 204825, "epoch": 1692} {"train_loss": -41.56838607788086, "global_step": 204826, "epoch": 1692} {"train_loss": -41.67499542236328, "global_step": 204827, "epoch": 1692} {"train_loss": -41.45795440673828, "global_step": 204828, "epoch": 1692} {"train_loss": -42.6025276184082, "global_step": 204829, "epoch": 1692} {"train_loss": -42.11567306518555, "global_step": 204830, "epoch": 1692} {"train_loss": -41.81370544433594, "global_step": 204831, "epoch": 1692} {"train_loss": -42.388790130615234, "global_step": 204832, "epoch": 1692} {"train_loss": -42.37297439575195, "global_step": 204833, "epoch": 1692} {"train_loss": -42.72141647338867, "global_step": 204834, "epoch": 1692} {"train_loss": -42.51169967651367, "global_step": 204835, "epoch": 1692} {"train_loss": -41.96430206298828, "global_step": 204836, "epoch": 1692} {"train_loss": -42.527565002441406, "global_step": 204837, "epoch": 1692} {"train_loss": -42.660091400146484, "global_step": 204838, "epoch": 1692} {"train_loss": -41.84754180908203, "global_step": 204839, "epoch": 1692} {"train_loss": -42.335079193115234, "global_step": 204840, "epoch": 1692} {"train_loss": -42.596736907958984, "global_step": 204841, "epoch": 1692} {"train_loss": -41.96684265136719, "global_step": 204842, "epoch": 1692} {"train_loss": -42.400634765625, "global_step": 204843, "epoch": 1692} {"train_loss": -42.32058334350586, "global_step": 204844, "epoch": 1692} {"train_loss": -42.2868766784668, "global_step": 204845, "epoch": 1692} {"train_loss": -42.00165939331055, "global_step": 204846, "epoch": 1692} {"train_loss": -42.34032440185547, "global_step": 204847, "epoch": 1692} {"train_loss": -43.1806755065918, "global_step": 204848, "epoch": 1692} {"train_loss": -42.54859924316406, "global_step": 204849, "epoch": 1692} {"train_loss": -42.80659866333008, "global_step": 204850, "epoch": 1692} {"train_loss": -43.1122932434082, "global_step": 204851, "epoch": 1692} {"train_loss": -41.662174224853516, "global_step": 204852, "epoch": 1692, "val_loss": 2598957.25} {"train_loss": -42.90487289428711, "global_step": 204853, "epoch": 1693} {"train_loss": -42.786659240722656, "global_step": 204854, "epoch": 1693} {"train_loss": -42.62305450439453, "global_step": 204855, "epoch": 1693} {"train_loss": -43.068538665771484, "global_step": 204856, "epoch": 1693} {"train_loss": -43.132667541503906, "global_step": 204857, "epoch": 1693} {"train_loss": -43.17488479614258, "global_step": 204858, "epoch": 1693} {"train_loss": -43.420806884765625, "global_step": 204859, "epoch": 1693} {"train_loss": -42.716514587402344, "global_step": 204860, "epoch": 1693} {"train_loss": -42.6973991394043, "global_step": 204861, "epoch": 1693} {"train_loss": -42.76588821411133, "global_step": 204862, "epoch": 1693} {"train_loss": -42.43064880371094, "global_step": 204863, "epoch": 1693} {"train_loss": -42.63338851928711, "global_step": 204864, "epoch": 1693} {"train_loss": -42.94932556152344, "global_step": 204865, "epoch": 1693} {"train_loss": -43.238128662109375, "global_step": 204866, "epoch": 1693} {"train_loss": -43.082645416259766, "global_step": 204867, "epoch": 1693} {"train_loss": -43.426795959472656, "global_step": 204868, "epoch": 1693} {"train_loss": -43.501190185546875, "global_step": 204869, "epoch": 1693} {"train_loss": -43.262474060058594, "global_step": 204870, "epoch": 1693} {"train_loss": -43.9030647277832, "global_step": 204871, "epoch": 1693} {"train_loss": -42.9013557434082, "global_step": 204872, "epoch": 1693} {"train_loss": -42.773250579833984, "global_step": 204873, "epoch": 1693} {"train_loss": -43.38741683959961, "global_step": 204874, "epoch": 1693} {"train_loss": -42.82377243041992, "global_step": 204875, "epoch": 1693} {"train_loss": -43.13753890991211, "global_step": 204876, "epoch": 1693} {"train_loss": -42.33418273925781, "global_step": 204877, "epoch": 1693} {"train_loss": -42.3968505859375, "global_step": 204878, "epoch": 1693} {"train_loss": -41.41874313354492, "global_step": 204879, "epoch": 1693} {"train_loss": -42.785221099853516, "global_step": 204880, "epoch": 1693} {"train_loss": -43.2872200012207, "global_step": 204881, "epoch": 1693} {"train_loss": -41.45283889770508, "global_step": 204882, "epoch": 1693} {"train_loss": -38.915897369384766, "global_step": 204883, "epoch": 1693} {"train_loss": -42.701412200927734, "global_step": 204884, "epoch": 1693} {"train_loss": -42.37798309326172, "global_step": 204885, "epoch": 1693} {"train_loss": -39.98406982421875, "global_step": 204886, "epoch": 1693} {"train_loss": -42.56755447387695, "global_step": 204887, "epoch": 1693} {"train_loss": -40.346160888671875, "global_step": 204888, "epoch": 1693} {"train_loss": -38.56909942626953, "global_step": 204889, "epoch": 1693} {"train_loss": -42.42618179321289, "global_step": 204890, "epoch": 1693} {"train_loss": -37.64704513549805, "global_step": 204891, "epoch": 1693} {"train_loss": -41.34463119506836, "global_step": 204892, "epoch": 1693} {"train_loss": -40.85693359375, "global_step": 204893, "epoch": 1693} {"train_loss": -38.09515380859375, "global_step": 204894, "epoch": 1693} {"train_loss": -40.0540885925293, "global_step": 204895, "epoch": 1693} {"train_loss": -36.97581481933594, "global_step": 204896, "epoch": 1693} {"train_loss": -41.7215576171875, "global_step": 204897, "epoch": 1693} {"train_loss": -38.19673538208008, "global_step": 204898, "epoch": 1693} {"train_loss": -40.48555374145508, "global_step": 204899, "epoch": 1693} {"train_loss": -40.70650100708008, "global_step": 204900, "epoch": 1693} {"train_loss": -40.95945739746094, "global_step": 204901, "epoch": 1693} {"train_loss": -42.15031051635742, "global_step": 204902, "epoch": 1693} {"train_loss": -40.451698303222656, "global_step": 204903, "epoch": 1693} {"train_loss": -41.06742858886719, "global_step": 204904, "epoch": 1693} {"train_loss": -40.56068801879883, "global_step": 204905, "epoch": 1693} {"train_loss": -40.06440353393555, "global_step": 204906, "epoch": 1693} {"train_loss": -38.56761932373047, "global_step": 204907, "epoch": 1693} {"train_loss": -41.5247688293457, "global_step": 204908, "epoch": 1693} {"train_loss": -39.83663558959961, "global_step": 204909, "epoch": 1693} {"train_loss": -40.85988998413086, "global_step": 204910, "epoch": 1693} {"train_loss": -39.27909469604492, "global_step": 204911, "epoch": 1693} {"train_loss": -41.336063385009766, "global_step": 204912, "epoch": 1693} {"train_loss": -39.96602249145508, "global_step": 204913, "epoch": 1693} {"train_loss": -41.84328079223633, "global_step": 204914, "epoch": 1693} {"train_loss": -39.61716842651367, "global_step": 204915, "epoch": 1693} {"train_loss": -40.462623596191406, "global_step": 204916, "epoch": 1693} {"train_loss": -41.9422492980957, "global_step": 204917, "epoch": 1693} {"train_loss": -41.47998809814453, "global_step": 204918, "epoch": 1693} {"train_loss": -39.60784912109375, "global_step": 204919, "epoch": 1693} {"train_loss": -40.94442367553711, "global_step": 204920, "epoch": 1693} {"train_loss": -39.81650924682617, "global_step": 204921, "epoch": 1693} {"train_loss": -39.87638473510742, "global_step": 204922, "epoch": 1693} {"train_loss": -41.75185775756836, "global_step": 204923, "epoch": 1693} {"train_loss": -40.12800216674805, "global_step": 204924, "epoch": 1693} {"train_loss": -39.96880340576172, "global_step": 204925, "epoch": 1693} {"train_loss": -41.201446533203125, "global_step": 204926, "epoch": 1693} {"train_loss": -41.6058464050293, "global_step": 204927, "epoch": 1693} {"train_loss": -40.62491989135742, "global_step": 204928, "epoch": 1693} {"train_loss": -40.699867248535156, "global_step": 204929, "epoch": 1693} {"train_loss": -41.1186408996582, "global_step": 204930, "epoch": 1693} {"train_loss": -41.80939865112305, "global_step": 204931, "epoch": 1693} {"train_loss": -41.561336517333984, "global_step": 204932, "epoch": 1693} {"train_loss": -42.10332107543945, "global_step": 204933, "epoch": 1693} {"train_loss": -41.564430236816406, "global_step": 204934, "epoch": 1693} {"train_loss": -41.3951416015625, "global_step": 204935, "epoch": 1693} {"train_loss": -41.98916244506836, "global_step": 204936, "epoch": 1693} {"train_loss": -42.59177780151367, "global_step": 204937, "epoch": 1693} {"train_loss": -41.862483978271484, "global_step": 204938, "epoch": 1693} {"train_loss": -41.8422966003418, "global_step": 204939, "epoch": 1693} {"train_loss": -42.10140609741211, "global_step": 204940, "epoch": 1693} {"train_loss": -42.41047286987305, "global_step": 204941, "epoch": 1693} {"train_loss": -41.719573974609375, "global_step": 204942, "epoch": 1693} {"train_loss": -41.985591888427734, "global_step": 204943, "epoch": 1693} {"train_loss": -42.526031494140625, "global_step": 204944, "epoch": 1693} {"train_loss": -42.27967071533203, "global_step": 204945, "epoch": 1693} {"train_loss": -42.141151428222656, "global_step": 204946, "epoch": 1693} {"train_loss": -42.27385330200195, "global_step": 204947, "epoch": 1693} {"train_loss": -42.123294830322266, "global_step": 204948, "epoch": 1693} {"train_loss": -42.199317932128906, "global_step": 204949, "epoch": 1693} {"train_loss": -42.80849075317383, "global_step": 204950, "epoch": 1693} {"train_loss": -42.373573303222656, "global_step": 204951, "epoch": 1693} {"train_loss": -42.7253532409668, "global_step": 204952, "epoch": 1693} {"train_loss": -42.42828369140625, "global_step": 204953, "epoch": 1693} {"train_loss": -43.103973388671875, "global_step": 204954, "epoch": 1693} {"train_loss": -42.96918487548828, "global_step": 204955, "epoch": 1693} {"train_loss": -42.48153305053711, "global_step": 204956, "epoch": 1693} {"train_loss": -42.833648681640625, "global_step": 204957, "epoch": 1693} {"train_loss": -43.15224838256836, "global_step": 204958, "epoch": 1693} {"train_loss": -43.007080078125, "global_step": 204959, "epoch": 1693} {"train_loss": -43.12306213378906, "global_step": 204960, "epoch": 1693} {"train_loss": -43.2805061340332, "global_step": 204961, "epoch": 1693} {"train_loss": -43.14567565917969, "global_step": 204962, "epoch": 1693} {"train_loss": -42.7277946472168, "global_step": 204963, "epoch": 1693} {"train_loss": -43.08906173706055, "global_step": 204964, "epoch": 1693} {"train_loss": -43.21684265136719, "global_step": 204965, "epoch": 1693} {"train_loss": -42.836151123046875, "global_step": 204966, "epoch": 1693} {"train_loss": -43.19651794433594, "global_step": 204967, "epoch": 1693} {"train_loss": -42.48481369018555, "global_step": 204968, "epoch": 1693} {"train_loss": -42.86590576171875, "global_step": 204969, "epoch": 1693} {"train_loss": -43.343013763427734, "global_step": 204970, "epoch": 1693} {"train_loss": -43.36780548095703, "global_step": 204971, "epoch": 1693} {"train_loss": -42.0831184387207, "global_step": 204972, "epoch": 1693} {"train_loss": -41.801205374977805, "global_step": 204973, "epoch": 1693, "val_loss": 2628163.25} {"train_loss": -43.04566192626953, "global_step": 204974, "epoch": 1694} {"train_loss": -42.58924102783203, "global_step": 204975, "epoch": 1694} {"train_loss": -42.77162551879883, "global_step": 204976, "epoch": 1694} {"train_loss": -43.49900817871094, "global_step": 204977, "epoch": 1694} {"train_loss": -42.757293701171875, "global_step": 204978, "epoch": 1694} {"train_loss": -42.50761413574219, "global_step": 204979, "epoch": 1694} {"train_loss": -42.71968460083008, "global_step": 204980, "epoch": 1694} {"train_loss": -42.75638961791992, "global_step": 204981, "epoch": 1694} {"train_loss": -43.19159698486328, "global_step": 204982, "epoch": 1694} {"train_loss": -42.83930206298828, "global_step": 204983, "epoch": 1694} {"train_loss": -42.892311096191406, "global_step": 204984, "epoch": 1694} {"train_loss": -43.216346740722656, "global_step": 204985, "epoch": 1694} {"train_loss": -42.51506423950195, "global_step": 204986, "epoch": 1694} {"train_loss": -42.76582717895508, "global_step": 204987, "epoch": 1694} {"train_loss": -42.81625747680664, "global_step": 204988, "epoch": 1694} {"train_loss": -43.208621978759766, "global_step": 204989, "epoch": 1694} {"train_loss": -43.17840576171875, "global_step": 204990, "epoch": 1694} {"train_loss": -43.061317443847656, "global_step": 204991, "epoch": 1694} {"train_loss": -42.76157760620117, "global_step": 204992, "epoch": 1694} {"train_loss": -43.32646560668945, "global_step": 204993, "epoch": 1694} {"train_loss": -42.692955017089844, "global_step": 204994, "epoch": 1694} {"train_loss": -43.09721374511719, "global_step": 204995, "epoch": 1694} {"train_loss": -42.6900520324707, "global_step": 204996, "epoch": 1694} {"train_loss": -42.715797424316406, "global_step": 204997, "epoch": 1694} {"train_loss": -42.762718200683594, "global_step": 204998, "epoch": 1694} {"train_loss": -43.04652786254883, "global_step": 204999, "epoch": 1694} {"train_loss": -42.20583724975586, "global_step": 205000, "epoch": 1694} {"train_loss": -42.373294830322266, "global_step": 205001, "epoch": 1694} {"train_loss": -40.6794548034668, "global_step": 205002, "epoch": 1694} {"train_loss": -37.66672897338867, "global_step": 205003, "epoch": 1694} {"train_loss": -42.1458740234375, "global_step": 205004, "epoch": 1694} {"train_loss": -42.49113082885742, "global_step": 205005, "epoch": 1694} {"train_loss": -41.42595291137695, "global_step": 205006, "epoch": 1694} {"train_loss": -38.61373519897461, "global_step": 205007, "epoch": 1694} {"train_loss": -35.517601013183594, "global_step": 205008, "epoch": 1694} {"train_loss": -37.59505081176758, "global_step": 205009, "epoch": 1694} {"train_loss": -25.098024368286133, "global_step": 205010, "epoch": 1694} {"train_loss": -29.880292892456055, "global_step": 205011, "epoch": 1694} {"train_loss": -27.704181671142578, "global_step": 205012, "epoch": 1694} {"train_loss": -34.38398361206055, "global_step": 205013, "epoch": 1694} {"train_loss": -27.255903244018555, "global_step": 205014, "epoch": 1694} {"train_loss": -32.901607513427734, "global_step": 205015, "epoch": 1694} {"train_loss": -32.76826095581055, "global_step": 205016, "epoch": 1694} {"train_loss": -29.117294311523438, "global_step": 205017, "epoch": 1694} {"train_loss": -34.0975227355957, "global_step": 205018, "epoch": 1694} {"train_loss": -31.992502212524414, "global_step": 205019, "epoch": 1694} {"train_loss": -31.821197509765625, "global_step": 205020, "epoch": 1694} {"train_loss": -32.32038497924805, "global_step": 205021, "epoch": 1694} {"train_loss": -35.33051681518555, "global_step": 205022, "epoch": 1694} {"train_loss": -33.21195983886719, "global_step": 205023, "epoch": 1694} {"train_loss": -35.03171920776367, "global_step": 205024, "epoch": 1694} {"train_loss": -34.039119720458984, "global_step": 205025, "epoch": 1694} {"train_loss": -35.18547821044922, "global_step": 205026, "epoch": 1694} {"train_loss": -34.60403060913086, "global_step": 205027, "epoch": 1694} {"train_loss": -33.91887283325195, "global_step": 205028, "epoch": 1694} {"train_loss": -35.797157287597656, "global_step": 205029, "epoch": 1694} {"train_loss": -35.86183166503906, "global_step": 205030, "epoch": 1694} {"train_loss": -35.97882843017578, "global_step": 205031, "epoch": 1694} {"train_loss": -34.698673248291016, "global_step": 205032, "epoch": 1694} {"train_loss": -35.806556701660156, "global_step": 205033, "epoch": 1694} {"train_loss": -36.323368072509766, "global_step": 205034, "epoch": 1694} {"train_loss": -36.48513412475586, "global_step": 205035, "epoch": 1694} {"train_loss": -35.95603561401367, "global_step": 205036, "epoch": 1694} {"train_loss": -35.90768051147461, "global_step": 205037, "epoch": 1694} {"train_loss": -36.45203399658203, "global_step": 205038, "epoch": 1694} {"train_loss": -36.9821662902832, "global_step": 205039, "epoch": 1694} {"train_loss": -36.45747756958008, "global_step": 205040, "epoch": 1694} {"train_loss": -37.274391174316406, "global_step": 205041, "epoch": 1694} {"train_loss": -37.724124908447266, "global_step": 205042, "epoch": 1694} {"train_loss": -37.316551208496094, "global_step": 205043, "epoch": 1694} {"train_loss": -37.03965377807617, "global_step": 205044, "epoch": 1694} {"train_loss": -36.920326232910156, "global_step": 205045, "epoch": 1694} {"train_loss": -37.47365951538086, "global_step": 205046, "epoch": 1694} {"train_loss": -36.02959060668945, "global_step": 205047, "epoch": 1694} {"train_loss": -33.2184944152832, "global_step": 205048, "epoch": 1694} {"train_loss": -37.94043731689453, "global_step": 205049, "epoch": 1694} {"train_loss": -34.94904708862305, "global_step": 205050, "epoch": 1694} {"train_loss": -36.60642623901367, "global_step": 205051, "epoch": 1694} {"train_loss": -36.82748031616211, "global_step": 205052, "epoch": 1694} {"train_loss": -37.40721130371094, "global_step": 205053, "epoch": 1694} {"train_loss": -36.50551986694336, "global_step": 205054, "epoch": 1694} {"train_loss": -37.30147933959961, "global_step": 205055, "epoch": 1694} {"train_loss": -36.69063949584961, "global_step": 205056, "epoch": 1694} {"train_loss": -36.88710021972656, "global_step": 205057, "epoch": 1694} {"train_loss": -38.15788650512695, "global_step": 205058, "epoch": 1694} {"train_loss": -37.10872268676758, "global_step": 205059, "epoch": 1694} {"train_loss": -37.9159049987793, "global_step": 205060, "epoch": 1694} {"train_loss": -37.22111129760742, "global_step": 205061, "epoch": 1694} {"train_loss": -38.32095718383789, "global_step": 205062, "epoch": 1694} {"train_loss": -37.606788635253906, "global_step": 205063, "epoch": 1694} {"train_loss": -37.915462493896484, "global_step": 205064, "epoch": 1694} {"train_loss": -38.48732376098633, "global_step": 205065, "epoch": 1694} {"train_loss": -38.63621139526367, "global_step": 205066, "epoch": 1694} {"train_loss": -37.994972229003906, "global_step": 205067, "epoch": 1694} {"train_loss": -38.551727294921875, "global_step": 205068, "epoch": 1694} {"train_loss": -38.15321731567383, "global_step": 205069, "epoch": 1694} {"train_loss": -38.964324951171875, "global_step": 205070, "epoch": 1694} {"train_loss": -37.6058235168457, "global_step": 205071, "epoch": 1694} {"train_loss": -38.863956451416016, "global_step": 205072, "epoch": 1694} {"train_loss": -39.03609848022461, "global_step": 205073, "epoch": 1694} {"train_loss": -38.924190521240234, "global_step": 205074, "epoch": 1694} {"train_loss": -38.54436111450195, "global_step": 205075, "epoch": 1694} {"train_loss": -38.22271728515625, "global_step": 205076, "epoch": 1694} {"train_loss": -38.835487365722656, "global_step": 205077, "epoch": 1694} {"train_loss": -39.03560256958008, "global_step": 205078, "epoch": 1694} {"train_loss": -39.465999603271484, "global_step": 205079, "epoch": 1694} {"train_loss": -39.104305267333984, "global_step": 205080, "epoch": 1694} {"train_loss": -39.64357376098633, "global_step": 205081, "epoch": 1694} {"train_loss": -39.700408935546875, "global_step": 205082, "epoch": 1694} {"train_loss": -39.57746124267578, "global_step": 205083, "epoch": 1694} {"train_loss": -39.67311096191406, "global_step": 205084, "epoch": 1694} {"train_loss": -39.875179290771484, "global_step": 205085, "epoch": 1694} {"train_loss": -38.49381637573242, "global_step": 205086, "epoch": 1694} {"train_loss": -38.22119903564453, "global_step": 205087, "epoch": 1694} {"train_loss": -36.869041442871094, "global_step": 205088, "epoch": 1694} {"train_loss": -37.335670471191406, "global_step": 205089, "epoch": 1694} {"train_loss": -39.675960540771484, "global_step": 205090, "epoch": 1694} {"train_loss": -36.22018051147461, "global_step": 205091, "epoch": 1694} {"train_loss": -37.85944366455078, "global_step": 205092, "epoch": 1694} {"train_loss": -39.494327545166016, "global_step": 205093, "epoch": 1694} {"train_loss": -38.07721294056285, "global_step": 205094, "epoch": 1694, "val_loss": 2602976.0} {"train_loss": -39.129573822021484, "global_step": 205095, "epoch": 1695} {"train_loss": -39.47473907470703, "global_step": 205096, "epoch": 1695} {"train_loss": -37.78318405151367, "global_step": 205097, "epoch": 1695} {"train_loss": -39.89980697631836, "global_step": 205098, "epoch": 1695} {"train_loss": -37.20408248901367, "global_step": 205099, "epoch": 1695} {"train_loss": -38.862056732177734, "global_step": 205100, "epoch": 1695} {"train_loss": -39.8766975402832, "global_step": 205101, "epoch": 1695} {"train_loss": -39.8736457824707, "global_step": 205102, "epoch": 1695} {"train_loss": -39.54258728027344, "global_step": 205103, "epoch": 1695} {"train_loss": -39.109798431396484, "global_step": 205104, "epoch": 1695} {"train_loss": -37.63694381713867, "global_step": 205105, "epoch": 1695} {"train_loss": -38.305213928222656, "global_step": 205106, "epoch": 1695} {"train_loss": -38.03036117553711, "global_step": 205107, "epoch": 1695} {"train_loss": -39.13423156738281, "global_step": 205108, "epoch": 1695} {"train_loss": -39.89344024658203, "global_step": 205109, "epoch": 1695} {"train_loss": -37.15673065185547, "global_step": 205110, "epoch": 1695} {"train_loss": -37.7029914855957, "global_step": 205111, "epoch": 1695} {"train_loss": -38.43548583984375, "global_step": 205112, "epoch": 1695} {"train_loss": -38.99020767211914, "global_step": 205113, "epoch": 1695} {"train_loss": -39.755889892578125, "global_step": 205114, "epoch": 1695} {"train_loss": -39.532958984375, "global_step": 205115, "epoch": 1695} {"train_loss": -38.19442367553711, "global_step": 205116, "epoch": 1695} {"train_loss": -38.201698303222656, "global_step": 205117, "epoch": 1695} {"train_loss": -39.3942985534668, "global_step": 205118, "epoch": 1695} {"train_loss": -39.753753662109375, "global_step": 205119, "epoch": 1695} {"train_loss": -38.964176177978516, "global_step": 205120, "epoch": 1695} {"train_loss": -39.44350814819336, "global_step": 205121, "epoch": 1695} {"train_loss": -38.89334487915039, "global_step": 205122, "epoch": 1695} {"train_loss": -39.707984924316406, "global_step": 205123, "epoch": 1695} {"train_loss": -35.991275787353516, "global_step": 205124, "epoch": 1695} {"train_loss": -38.13941192626953, "global_step": 205125, "epoch": 1695} {"train_loss": -40.2247314453125, "global_step": 205126, "epoch": 1695} {"train_loss": -38.79933166503906, "global_step": 205127, "epoch": 1695} {"train_loss": -39.3016471862793, "global_step": 205128, "epoch": 1695} {"train_loss": -39.96648406982422, "global_step": 205129, "epoch": 1695} {"train_loss": -39.729278564453125, "global_step": 205130, "epoch": 1695} {"train_loss": -39.876949310302734, "global_step": 205131, "epoch": 1695} {"train_loss": -39.09572982788086, "global_step": 205132, "epoch": 1695} {"train_loss": -40.60825729370117, "global_step": 205133, "epoch": 1695} {"train_loss": -40.060909271240234, "global_step": 205134, "epoch": 1695} {"train_loss": -39.328147888183594, "global_step": 205135, "epoch": 1695} {"train_loss": -40.3918342590332, "global_step": 205136, "epoch": 1695} {"train_loss": -40.041873931884766, "global_step": 205137, "epoch": 1695} {"train_loss": -40.3287353515625, "global_step": 205138, "epoch": 1695} {"train_loss": -38.65766525268555, "global_step": 205139, "epoch": 1695} {"train_loss": -39.74552917480469, "global_step": 205140, "epoch": 1695} {"train_loss": -40.53214645385742, "global_step": 205141, "epoch": 1695} {"train_loss": -40.543331146240234, "global_step": 205142, "epoch": 1695} {"train_loss": -40.61381530761719, "global_step": 205143, "epoch": 1695} {"train_loss": -40.480628967285156, "global_step": 205144, "epoch": 1695} {"train_loss": -39.97370147705078, "global_step": 205145, "epoch": 1695} {"train_loss": -40.97860336303711, "global_step": 205146, "epoch": 1695} {"train_loss": -40.161964416503906, "global_step": 205147, "epoch": 1695} {"train_loss": -41.0962028503418, "global_step": 205148, "epoch": 1695} {"train_loss": -40.78477096557617, "global_step": 205149, "epoch": 1695} {"train_loss": -40.909332275390625, "global_step": 205150, "epoch": 1695} {"train_loss": -40.55841064453125, "global_step": 205151, "epoch": 1695} {"train_loss": -41.210445404052734, "global_step": 205152, "epoch": 1695} {"train_loss": -40.64651107788086, "global_step": 205153, "epoch": 1695} {"train_loss": -40.624935150146484, "global_step": 205154, "epoch": 1695} {"train_loss": -40.87251663208008, "global_step": 205155, "epoch": 1695} {"train_loss": -41.095726013183594, "global_step": 205156, "epoch": 1695} {"train_loss": -40.87277603149414, "global_step": 205157, "epoch": 1695} {"train_loss": -40.62623977661133, "global_step": 205158, "epoch": 1695} {"train_loss": -41.221107482910156, "global_step": 205159, "epoch": 1695} {"train_loss": -41.57334518432617, "global_step": 205160, "epoch": 1695} {"train_loss": -41.115020751953125, "global_step": 205161, "epoch": 1695} {"train_loss": -41.78953170776367, "global_step": 205162, "epoch": 1695} {"train_loss": -41.79523468017578, "global_step": 205163, "epoch": 1695} {"train_loss": -41.8233757019043, "global_step": 205164, "epoch": 1695} {"train_loss": -41.3984260559082, "global_step": 205165, "epoch": 1695} {"train_loss": -41.755863189697266, "global_step": 205166, "epoch": 1695} {"train_loss": -41.28746032714844, "global_step": 205167, "epoch": 1695} {"train_loss": -41.51931381225586, "global_step": 205168, "epoch": 1695} {"train_loss": -40.97211837768555, "global_step": 205169, "epoch": 1695} {"train_loss": -39.89848709106445, "global_step": 205170, "epoch": 1695} {"train_loss": -39.5112190246582, "global_step": 205171, "epoch": 1695} {"train_loss": -39.177364349365234, "global_step": 205172, "epoch": 1695} {"train_loss": -39.636512756347656, "global_step": 205173, "epoch": 1695} {"train_loss": -39.88481521606445, "global_step": 205174, "epoch": 1695} {"train_loss": -39.753761291503906, "global_step": 205175, "epoch": 1695} {"train_loss": -41.0915641784668, "global_step": 205176, "epoch": 1695} {"train_loss": -39.706417083740234, "global_step": 205177, "epoch": 1695} {"train_loss": -40.20106887817383, "global_step": 205178, "epoch": 1695} {"train_loss": -41.13723373413086, "global_step": 205179, "epoch": 1695} {"train_loss": -41.0296745300293, "global_step": 205180, "epoch": 1695} {"train_loss": -41.339813232421875, "global_step": 205181, "epoch": 1695} {"train_loss": -40.26561737060547, "global_step": 205182, "epoch": 1695} {"train_loss": -40.367881774902344, "global_step": 205183, "epoch": 1695} {"train_loss": -40.3792839050293, "global_step": 205184, "epoch": 1695} {"train_loss": -39.84499740600586, "global_step": 205185, "epoch": 1695} {"train_loss": -40.76206970214844, "global_step": 205186, "epoch": 1695} {"train_loss": -39.83747482299805, "global_step": 205187, "epoch": 1695} {"train_loss": -41.2490119934082, "global_step": 205188, "epoch": 1695} {"train_loss": -40.339778900146484, "global_step": 205189, "epoch": 1695} {"train_loss": -39.968048095703125, "global_step": 205190, "epoch": 1695} {"train_loss": -40.2025146484375, "global_step": 205191, "epoch": 1695} {"train_loss": -38.71051025390625, "global_step": 205192, "epoch": 1695} {"train_loss": -40.99907302856445, "global_step": 205193, "epoch": 1695} {"train_loss": -40.13788986206055, "global_step": 205194, "epoch": 1695} {"train_loss": -41.94478225708008, "global_step": 205195, "epoch": 1695} {"train_loss": -41.0019416809082, "global_step": 205196, "epoch": 1695} {"train_loss": -41.07855224609375, "global_step": 205197, "epoch": 1695} {"train_loss": -41.46158218383789, "global_step": 205198, "epoch": 1695} {"train_loss": -40.610904693603516, "global_step": 205199, "epoch": 1695} {"train_loss": -41.308692932128906, "global_step": 205200, "epoch": 1695} {"train_loss": -40.64561080932617, "global_step": 205201, "epoch": 1695} {"train_loss": -40.874080657958984, "global_step": 205202, "epoch": 1695} {"train_loss": -40.92342758178711, "global_step": 205203, "epoch": 1695} {"train_loss": -38.33050537109375, "global_step": 205204, "epoch": 1695} {"train_loss": -40.68031692504883, "global_step": 205205, "epoch": 1695} {"train_loss": -40.62249755859375, "global_step": 205206, "epoch": 1695} {"train_loss": -39.938838958740234, "global_step": 205207, "epoch": 1695} {"train_loss": -40.29018783569336, "global_step": 205208, "epoch": 1695} {"train_loss": -40.62751770019531, "global_step": 205209, "epoch": 1695} {"train_loss": -39.662715911865234, "global_step": 205210, "epoch": 1695} {"train_loss": -37.517513275146484, "global_step": 205211, "epoch": 1695} {"train_loss": -37.78892517089844, "global_step": 205212, "epoch": 1695} {"train_loss": -38.302120208740234, "global_step": 205213, "epoch": 1695} {"train_loss": -38.763423919677734, "global_step": 205214, "epoch": 1695} {"train_loss": -39.920603161015784, "global_step": 205215, "epoch": 1695, "val_loss": 2585783.75} {"train_loss": -38.073509216308594, "global_step": 205216, "epoch": 1696} {"train_loss": -37.562068939208984, "global_step": 205217, "epoch": 1696} {"train_loss": -36.82424545288086, "global_step": 205218, "epoch": 1696} {"train_loss": -29.89496421813965, "global_step": 205219, "epoch": 1696} {"train_loss": -38.1005973815918, "global_step": 205220, "epoch": 1696} {"train_loss": -30.144556045532227, "global_step": 205221, "epoch": 1696} {"train_loss": -36.0211067199707, "global_step": 205222, "epoch": 1696} {"train_loss": -26.545984268188477, "global_step": 205223, "epoch": 1696} {"train_loss": -38.80652618408203, "global_step": 205224, "epoch": 1696} {"train_loss": -30.95318031311035, "global_step": 205225, "epoch": 1696} {"train_loss": -33.731971740722656, "global_step": 205226, "epoch": 1696} {"train_loss": -33.08342361450195, "global_step": 205227, "epoch": 1696} {"train_loss": -32.6130256652832, "global_step": 205228, "epoch": 1696} {"train_loss": -36.55910873413086, "global_step": 205229, "epoch": 1696} {"train_loss": -32.868995666503906, "global_step": 205230, "epoch": 1696} {"train_loss": -36.860469818115234, "global_step": 205231, "epoch": 1696} {"train_loss": -38.819759368896484, "global_step": 205232, "epoch": 1696} {"train_loss": -34.4644889831543, "global_step": 205233, "epoch": 1696} {"train_loss": -36.50123977661133, "global_step": 205234, "epoch": 1696} {"train_loss": -38.818355560302734, "global_step": 205235, "epoch": 1696} {"train_loss": -37.49325942993164, "global_step": 205236, "epoch": 1696} {"train_loss": -36.6876106262207, "global_step": 205237, "epoch": 1696} {"train_loss": -39.685218811035156, "global_step": 205238, "epoch": 1696} {"train_loss": -35.017372131347656, "global_step": 205239, "epoch": 1696} {"train_loss": -35.9685173034668, "global_step": 205240, "epoch": 1696} {"train_loss": -36.4089469909668, "global_step": 205241, "epoch": 1696} {"train_loss": -39.50922775268555, "global_step": 205242, "epoch": 1696} {"train_loss": -39.370357513427734, "global_step": 205243, "epoch": 1696} {"train_loss": -38.59198760986328, "global_step": 205244, "epoch": 1696} {"train_loss": -39.4814338684082, "global_step": 205245, "epoch": 1696} {"train_loss": -39.19803237915039, "global_step": 205246, "epoch": 1696} {"train_loss": -36.32654571533203, "global_step": 205247, "epoch": 1696} {"train_loss": -39.407222747802734, "global_step": 205248, "epoch": 1696} {"train_loss": -37.755069732666016, "global_step": 205249, "epoch": 1696} {"train_loss": -39.25974655151367, "global_step": 205250, "epoch": 1696} {"train_loss": -39.346370697021484, "global_step": 205251, "epoch": 1696} {"train_loss": -37.39733123779297, "global_step": 205252, "epoch": 1696} {"train_loss": -38.513221740722656, "global_step": 205253, "epoch": 1696} {"train_loss": -35.57194137573242, "global_step": 205254, "epoch": 1696} {"train_loss": -37.8454704284668, "global_step": 205255, "epoch": 1696} {"train_loss": -39.665592193603516, "global_step": 205256, "epoch": 1696} {"train_loss": -38.68894577026367, "global_step": 205257, "epoch": 1696} {"train_loss": -37.99020004272461, "global_step": 205258, "epoch": 1696} {"train_loss": -38.938087463378906, "global_step": 205259, "epoch": 1696} {"train_loss": -38.54315185546875, "global_step": 205260, "epoch": 1696} {"train_loss": -38.80828094482422, "global_step": 205261, "epoch": 1696} {"train_loss": -39.322113037109375, "global_step": 205262, "epoch": 1696} {"train_loss": -38.45806884765625, "global_step": 205263, "epoch": 1696} {"train_loss": -38.31379318237305, "global_step": 205264, "epoch": 1696} {"train_loss": -38.6351203918457, "global_step": 205265, "epoch": 1696} {"train_loss": -37.18642044067383, "global_step": 205266, "epoch": 1696} {"train_loss": -37.69462203979492, "global_step": 205267, "epoch": 1696} {"train_loss": -38.578548431396484, "global_step": 205268, "epoch": 1696} {"train_loss": -34.60261154174805, "global_step": 205269, "epoch": 1696} {"train_loss": -38.209327697753906, "global_step": 205270, "epoch": 1696} {"train_loss": -37.961544036865234, "global_step": 205271, "epoch": 1696} {"train_loss": -37.353389739990234, "global_step": 205272, "epoch": 1696} {"train_loss": -39.0935173034668, "global_step": 205273, "epoch": 1696} {"train_loss": -39.87584686279297, "global_step": 205274, "epoch": 1696} {"train_loss": -38.99422073364258, "global_step": 205275, "epoch": 1696} {"train_loss": -38.9941291809082, "global_step": 205276, "epoch": 1696} {"train_loss": -36.09251022338867, "global_step": 205277, "epoch": 1696} {"train_loss": -38.62458038330078, "global_step": 205278, "epoch": 1696} {"train_loss": -38.217708587646484, "global_step": 205279, "epoch": 1696} {"train_loss": -36.64292526245117, "global_step": 205280, "epoch": 1696} {"train_loss": -38.85139083862305, "global_step": 205281, "epoch": 1696} {"train_loss": -38.05837631225586, "global_step": 205282, "epoch": 1696} {"train_loss": -39.0904541015625, "global_step": 205283, "epoch": 1696} {"train_loss": -38.80274963378906, "global_step": 205284, "epoch": 1696} {"train_loss": -37.76750564575195, "global_step": 205285, "epoch": 1696} {"train_loss": -38.8134880065918, "global_step": 205286, "epoch": 1696} {"train_loss": -37.46780014038086, "global_step": 205287, "epoch": 1696} {"train_loss": -38.87044906616211, "global_step": 205288, "epoch": 1696} {"train_loss": -39.04706954956055, "global_step": 205289, "epoch": 1696} {"train_loss": -37.3487548828125, "global_step": 205290, "epoch": 1696} {"train_loss": -37.62709426879883, "global_step": 205291, "epoch": 1696} {"train_loss": -37.261837005615234, "global_step": 205292, "epoch": 1696} {"train_loss": -38.381927490234375, "global_step": 205293, "epoch": 1696} {"train_loss": -38.91309356689453, "global_step": 205294, "epoch": 1696} {"train_loss": -37.22160720825195, "global_step": 205295, "epoch": 1696} {"train_loss": -38.78620529174805, "global_step": 205296, "epoch": 1696} {"train_loss": -37.9787712097168, "global_step": 205297, "epoch": 1696} {"train_loss": -36.32575988769531, "global_step": 205298, "epoch": 1696} {"train_loss": -39.735958099365234, "global_step": 205299, "epoch": 1696} {"train_loss": -36.29871368408203, "global_step": 205300, "epoch": 1696} {"train_loss": -36.050384521484375, "global_step": 205301, "epoch": 1696} {"train_loss": -38.78449249267578, "global_step": 205302, "epoch": 1696} {"train_loss": -38.01220703125, "global_step": 205303, "epoch": 1696} {"train_loss": -39.25831985473633, "global_step": 205304, "epoch": 1696} {"train_loss": -38.49888229370117, "global_step": 205305, "epoch": 1696} {"train_loss": -37.97412872314453, "global_step": 205306, "epoch": 1696} {"train_loss": -37.275794982910156, "global_step": 205307, "epoch": 1696} {"train_loss": -39.12554931640625, "global_step": 205308, "epoch": 1696} {"train_loss": -39.75584411621094, "global_step": 205309, "epoch": 1696} {"train_loss": -38.97992706298828, "global_step": 205310, "epoch": 1696} {"train_loss": -36.88908004760742, "global_step": 205311, "epoch": 1696} {"train_loss": -39.57835388183594, "global_step": 205312, "epoch": 1696} {"train_loss": -38.821292877197266, "global_step": 205313, "epoch": 1696} {"train_loss": -38.451053619384766, "global_step": 205314, "epoch": 1696} {"train_loss": -38.9672966003418, "global_step": 205315, "epoch": 1696} {"train_loss": -39.77410888671875, "global_step": 205316, "epoch": 1696} {"train_loss": -40.0111198425293, "global_step": 205317, "epoch": 1696} {"train_loss": -38.718299865722656, "global_step": 205318, "epoch": 1696} {"train_loss": -39.34066390991211, "global_step": 205319, "epoch": 1696} {"train_loss": -39.57918167114258, "global_step": 205320, "epoch": 1696} {"train_loss": -40.234500885009766, "global_step": 205321, "epoch": 1696} {"train_loss": -38.71852493286133, "global_step": 205322, "epoch": 1696} {"train_loss": -39.03987121582031, "global_step": 205323, "epoch": 1696} {"train_loss": -39.82706832885742, "global_step": 205324, "epoch": 1696} {"train_loss": -39.56187057495117, "global_step": 205325, "epoch": 1696} {"train_loss": -40.20136642456055, "global_step": 205326, "epoch": 1696} {"train_loss": -39.81550598144531, "global_step": 205327, "epoch": 1696} {"train_loss": -38.81913757324219, "global_step": 205328, "epoch": 1696} {"train_loss": -38.24087142944336, "global_step": 205329, "epoch": 1696} {"train_loss": -39.48652267456055, "global_step": 205330, "epoch": 1696} {"train_loss": -40.37120056152344, "global_step": 205331, "epoch": 1696} {"train_loss": -38.82552719116211, "global_step": 205332, "epoch": 1696} {"train_loss": -39.52893829345703, "global_step": 205333, "epoch": 1696} {"train_loss": -39.17348861694336, "global_step": 205334, "epoch": 1696} {"train_loss": -37.60456466674805, "global_step": 205335, "epoch": 1696} {"train_loss": -37.82739472192181, "global_step": 205336, "epoch": 1696, "val_loss": 2443766.0} {"train_loss": -38.67670440673828, "global_step": 205337, "epoch": 1697} {"train_loss": -36.54856491088867, "global_step": 205338, "epoch": 1697} {"train_loss": -40.2905387878418, "global_step": 205339, "epoch": 1697} {"train_loss": -39.682228088378906, "global_step": 205340, "epoch": 1697} {"train_loss": -38.87495040893555, "global_step": 205341, "epoch": 1697} {"train_loss": -38.42667770385742, "global_step": 205342, "epoch": 1697} {"train_loss": -39.496150970458984, "global_step": 205343, "epoch": 1697} {"train_loss": -39.92313766479492, "global_step": 205344, "epoch": 1697} {"train_loss": -39.99528121948242, "global_step": 205345, "epoch": 1697} {"train_loss": -39.3430290222168, "global_step": 205346, "epoch": 1697} {"train_loss": -38.90699005126953, "global_step": 205347, "epoch": 1697} {"train_loss": -39.974365234375, "global_step": 205348, "epoch": 1697} {"train_loss": -40.28907012939453, "global_step": 205349, "epoch": 1697} {"train_loss": -40.372520446777344, "global_step": 205350, "epoch": 1697} {"train_loss": -39.66694641113281, "global_step": 205351, "epoch": 1697} {"train_loss": -39.76131820678711, "global_step": 205352, "epoch": 1697} {"train_loss": -40.874454498291016, "global_step": 205353, "epoch": 1697} {"train_loss": -40.296932220458984, "global_step": 205354, "epoch": 1697} {"train_loss": -39.78653335571289, "global_step": 205355, "epoch": 1697} {"train_loss": -40.4308967590332, "global_step": 205356, "epoch": 1697} {"train_loss": -40.87374496459961, "global_step": 205357, "epoch": 1697} {"train_loss": -39.308631896972656, "global_step": 205358, "epoch": 1697} {"train_loss": -40.06901168823242, "global_step": 205359, "epoch": 1697} {"train_loss": -40.51700973510742, "global_step": 205360, "epoch": 1697} {"train_loss": -40.50368881225586, "global_step": 205361, "epoch": 1697} {"train_loss": -40.561798095703125, "global_step": 205362, "epoch": 1697} {"train_loss": -40.57307815551758, "global_step": 205363, "epoch": 1697} {"train_loss": -39.78596496582031, "global_step": 205364, "epoch": 1697} {"train_loss": -40.72608184814453, "global_step": 205365, "epoch": 1697} {"train_loss": -40.92975616455078, "global_step": 205366, "epoch": 1697} {"train_loss": -40.370601654052734, "global_step": 205367, "epoch": 1697} {"train_loss": -40.22532272338867, "global_step": 205368, "epoch": 1697} {"train_loss": -38.86792755126953, "global_step": 205369, "epoch": 1697} {"train_loss": -39.68234634399414, "global_step": 205370, "epoch": 1697} {"train_loss": -40.23927688598633, "global_step": 205371, "epoch": 1697} {"train_loss": -40.017494201660156, "global_step": 205372, "epoch": 1697} {"train_loss": -39.84004592895508, "global_step": 205373, "epoch": 1697} {"train_loss": -40.67342758178711, "global_step": 205374, "epoch": 1697} {"train_loss": -38.1215705871582, "global_step": 205375, "epoch": 1697} {"train_loss": -38.91524887084961, "global_step": 205376, "epoch": 1697} {"train_loss": -38.63170623779297, "global_step": 205377, "epoch": 1697} {"train_loss": -40.686763763427734, "global_step": 205378, "epoch": 1697} {"train_loss": -37.69895553588867, "global_step": 205379, "epoch": 1697} {"train_loss": -40.47349548339844, "global_step": 205380, "epoch": 1697} {"train_loss": -37.35321807861328, "global_step": 205381, "epoch": 1697} {"train_loss": -39.70301055908203, "global_step": 205382, "epoch": 1697} {"train_loss": -39.9223747253418, "global_step": 205383, "epoch": 1697} {"train_loss": -37.24691390991211, "global_step": 205384, "epoch": 1697} {"train_loss": -37.01351547241211, "global_step": 205385, "epoch": 1697} {"train_loss": -35.446815490722656, "global_step": 205386, "epoch": 1697} {"train_loss": -40.0062141418457, "global_step": 205387, "epoch": 1697} {"train_loss": -39.51754379272461, "global_step": 205388, "epoch": 1697} {"train_loss": -37.52126693725586, "global_step": 205389, "epoch": 1697} {"train_loss": -39.301971435546875, "global_step": 205390, "epoch": 1697} {"train_loss": -39.088035583496094, "global_step": 205391, "epoch": 1697} {"train_loss": -38.06509780883789, "global_step": 205392, "epoch": 1697} {"train_loss": -38.5053825378418, "global_step": 205393, "epoch": 1697} {"train_loss": -40.220550537109375, "global_step": 205394, "epoch": 1697} {"train_loss": -39.1213493347168, "global_step": 205395, "epoch": 1697} {"train_loss": -39.3603630065918, "global_step": 205396, "epoch": 1697} {"train_loss": -38.911346435546875, "global_step": 205397, "epoch": 1697} {"train_loss": -40.53784942626953, "global_step": 205398, "epoch": 1697} {"train_loss": -38.63062286376953, "global_step": 205399, "epoch": 1697} {"train_loss": -35.29520797729492, "global_step": 205400, "epoch": 1697} {"train_loss": -37.92220687866211, "global_step": 205401, "epoch": 1697} {"train_loss": -38.02349853515625, "global_step": 205402, "epoch": 1697} {"train_loss": -38.80616760253906, "global_step": 205403, "epoch": 1697} {"train_loss": -38.340126037597656, "global_step": 205404, "epoch": 1697} {"train_loss": -34.37353515625, "global_step": 205405, "epoch": 1697} {"train_loss": -37.805091857910156, "global_step": 205406, "epoch": 1697} {"train_loss": -37.60435104370117, "global_step": 205407, "epoch": 1697} {"train_loss": -39.33137130737305, "global_step": 205408, "epoch": 1697} {"train_loss": -38.82950973510742, "global_step": 205409, "epoch": 1697} {"train_loss": -38.88766860961914, "global_step": 205410, "epoch": 1697} {"train_loss": -39.51914596557617, "global_step": 205411, "epoch": 1697} {"train_loss": -39.51760482788086, "global_step": 205412, "epoch": 1697} {"train_loss": -37.820499420166016, "global_step": 205413, "epoch": 1697} {"train_loss": -34.39866256713867, "global_step": 205414, "epoch": 1697} {"train_loss": -38.875301361083984, "global_step": 205415, "epoch": 1697} {"train_loss": -38.348567962646484, "global_step": 205416, "epoch": 1697} {"train_loss": -36.444950103759766, "global_step": 205417, "epoch": 1697} {"train_loss": -37.638057708740234, "global_step": 205418, "epoch": 1697} {"train_loss": -33.97496032714844, "global_step": 205419, "epoch": 1697} {"train_loss": -38.11033248901367, "global_step": 205420, "epoch": 1697} {"train_loss": -37.8775634765625, "global_step": 205421, "epoch": 1697} {"train_loss": -36.36106491088867, "global_step": 205422, "epoch": 1697} {"train_loss": -34.809844970703125, "global_step": 205423, "epoch": 1697} {"train_loss": -37.58777618408203, "global_step": 205424, "epoch": 1697} {"train_loss": -38.19068145751953, "global_step": 205425, "epoch": 1697} {"train_loss": -38.36209487915039, "global_step": 205426, "epoch": 1697} {"train_loss": -38.19523239135742, "global_step": 205427, "epoch": 1697} {"train_loss": -38.05463790893555, "global_step": 205428, "epoch": 1697} {"train_loss": -36.91732406616211, "global_step": 205429, "epoch": 1697} {"train_loss": -37.70661163330078, "global_step": 205430, "epoch": 1697} {"train_loss": -38.65201950073242, "global_step": 205431, "epoch": 1697} {"train_loss": -39.174110412597656, "global_step": 205432, "epoch": 1697} {"train_loss": -38.91514205932617, "global_step": 205433, "epoch": 1697} {"train_loss": -38.09302520751953, "global_step": 205434, "epoch": 1697} {"train_loss": -36.48255157470703, "global_step": 205435, "epoch": 1697} {"train_loss": -37.60553741455078, "global_step": 205436, "epoch": 1697} {"train_loss": -38.931129455566406, "global_step": 205437, "epoch": 1697} {"train_loss": -37.877933502197266, "global_step": 205438, "epoch": 1697} {"train_loss": -39.492977142333984, "global_step": 205439, "epoch": 1697} {"train_loss": -39.5972900390625, "global_step": 205440, "epoch": 1697} {"train_loss": -38.74436950683594, "global_step": 205441, "epoch": 1697} {"train_loss": -38.9068603515625, "global_step": 205442, "epoch": 1697} {"train_loss": -39.57349395751953, "global_step": 205443, "epoch": 1697} {"train_loss": -38.18266296386719, "global_step": 205444, "epoch": 1697} {"train_loss": -38.0017204284668, "global_step": 205445, "epoch": 1697} {"train_loss": -38.696800231933594, "global_step": 205446, "epoch": 1697} {"train_loss": -39.61219024658203, "global_step": 205447, "epoch": 1697} {"train_loss": -38.37979507446289, "global_step": 205448, "epoch": 1697} {"train_loss": -38.947471618652344, "global_step": 205449, "epoch": 1697} {"train_loss": -39.126033782958984, "global_step": 205450, "epoch": 1697} {"train_loss": -39.83457565307617, "global_step": 205451, "epoch": 1697} {"train_loss": -39.031795501708984, "global_step": 205452, "epoch": 1697} {"train_loss": -39.175296783447266, "global_step": 205453, "epoch": 1697} {"train_loss": -38.04970932006836, "global_step": 205454, "epoch": 1697} {"train_loss": -37.66245651245117, "global_step": 205455, "epoch": 1697} {"train_loss": -39.85966491699219, "global_step": 205456, "epoch": 1697} {"train_loss": -38.80222487646686, "global_step": 205457, "epoch": 1697, "val_loss": 2894900.25} {"train_loss": -38.377410888671875, "global_step": 205458, "epoch": 1698} {"train_loss": -38.683937072753906, "global_step": 205459, "epoch": 1698} {"train_loss": -39.19032669067383, "global_step": 205460, "epoch": 1698} {"train_loss": -38.2115592956543, "global_step": 205461, "epoch": 1698} {"train_loss": -38.55146026611328, "global_step": 205462, "epoch": 1698} {"train_loss": -39.41389083862305, "global_step": 205463, "epoch": 1698} {"train_loss": -38.78993606567383, "global_step": 205464, "epoch": 1698} {"train_loss": -39.203277587890625, "global_step": 205465, "epoch": 1698} {"train_loss": -38.18798828125, "global_step": 205466, "epoch": 1698} {"train_loss": -39.82542037963867, "global_step": 205467, "epoch": 1698} {"train_loss": -39.82429885864258, "global_step": 205468, "epoch": 1698} {"train_loss": -39.100807189941406, "global_step": 205469, "epoch": 1698} {"train_loss": -40.18693161010742, "global_step": 205470, "epoch": 1698} {"train_loss": -40.37394714355469, "global_step": 205471, "epoch": 1698} {"train_loss": -39.63972854614258, "global_step": 205472, "epoch": 1698} {"train_loss": -39.60414123535156, "global_step": 205473, "epoch": 1698} {"train_loss": -39.29875564575195, "global_step": 205474, "epoch": 1698} {"train_loss": -39.0231819152832, "global_step": 205475, "epoch": 1698} {"train_loss": -40.158172607421875, "global_step": 205476, "epoch": 1698} {"train_loss": -40.553375244140625, "global_step": 205477, "epoch": 1698} {"train_loss": -39.15234375, "global_step": 205478, "epoch": 1698} {"train_loss": -36.80992889404297, "global_step": 205479, "epoch": 1698} {"train_loss": -38.481361389160156, "global_step": 205480, "epoch": 1698} {"train_loss": -39.55788803100586, "global_step": 205481, "epoch": 1698} {"train_loss": -39.95860290527344, "global_step": 205482, "epoch": 1698} {"train_loss": -39.39777755737305, "global_step": 205483, "epoch": 1698} {"train_loss": -38.79435348510742, "global_step": 205484, "epoch": 1698} {"train_loss": -40.18309020996094, "global_step": 205485, "epoch": 1698} {"train_loss": -39.14567947387695, "global_step": 205486, "epoch": 1698} {"train_loss": -39.83119583129883, "global_step": 205487, "epoch": 1698} {"train_loss": -39.751705169677734, "global_step": 205488, "epoch": 1698} {"train_loss": -40.60860824584961, "global_step": 205489, "epoch": 1698} {"train_loss": -39.1183967590332, "global_step": 205490, "epoch": 1698} {"train_loss": -40.1932373046875, "global_step": 205491, "epoch": 1698} {"train_loss": -39.72480392456055, "global_step": 205492, "epoch": 1698} {"train_loss": -39.151329040527344, "global_step": 205493, "epoch": 1698} {"train_loss": -40.0655517578125, "global_step": 205494, "epoch": 1698} {"train_loss": -40.514068603515625, "global_step": 205495, "epoch": 1698} {"train_loss": -40.96986770629883, "global_step": 205496, "epoch": 1698} {"train_loss": -40.24837875366211, "global_step": 205497, "epoch": 1698} {"train_loss": -40.5966682434082, "global_step": 205498, "epoch": 1698} {"train_loss": -40.61741256713867, "global_step": 205499, "epoch": 1698} {"train_loss": -40.54985046386719, "global_step": 205500, "epoch": 1698} {"train_loss": -40.60138702392578, "global_step": 205501, "epoch": 1698} {"train_loss": -41.02730941772461, "global_step": 205502, "epoch": 1698} {"train_loss": -39.929080963134766, "global_step": 205503, "epoch": 1698} {"train_loss": -40.48563766479492, "global_step": 205504, "epoch": 1698} {"train_loss": -40.52982711791992, "global_step": 205505, "epoch": 1698} {"train_loss": -38.63423538208008, "global_step": 205506, "epoch": 1698} {"train_loss": -35.10028076171875, "global_step": 205507, "epoch": 1698} {"train_loss": -36.497737884521484, "global_step": 205508, "epoch": 1698} {"train_loss": -38.49729919433594, "global_step": 205509, "epoch": 1698} {"train_loss": -40.73507308959961, "global_step": 205510, "epoch": 1698} {"train_loss": -37.462432861328125, "global_step": 205511, "epoch": 1698} {"train_loss": -37.44095993041992, "global_step": 205512, "epoch": 1698} {"train_loss": -38.802249908447266, "global_step": 205513, "epoch": 1698} {"train_loss": -40.5842399597168, "global_step": 205514, "epoch": 1698} {"train_loss": -38.711647033691406, "global_step": 205515, "epoch": 1698} {"train_loss": -40.37972640991211, "global_step": 205516, "epoch": 1698} {"train_loss": -40.48268127441406, "global_step": 205517, "epoch": 1698} {"train_loss": -39.36885452270508, "global_step": 205518, "epoch": 1698} {"train_loss": -40.59040069580078, "global_step": 205519, "epoch": 1698} {"train_loss": -38.429813385009766, "global_step": 205520, "epoch": 1698} {"train_loss": -38.87577438354492, "global_step": 205521, "epoch": 1698} {"train_loss": -39.98841094970703, "global_step": 205522, "epoch": 1698} {"train_loss": -38.938575744628906, "global_step": 205523, "epoch": 1698} {"train_loss": -39.656978607177734, "global_step": 205524, "epoch": 1698} {"train_loss": -38.46284866333008, "global_step": 205525, "epoch": 1698} {"train_loss": -41.15840530395508, "global_step": 205526, "epoch": 1698} {"train_loss": -38.59978103637695, "global_step": 205527, "epoch": 1698} {"train_loss": -40.102779388427734, "global_step": 205528, "epoch": 1698} {"train_loss": -38.53436279296875, "global_step": 205529, "epoch": 1698} {"train_loss": -40.02787399291992, "global_step": 205530, "epoch": 1698} {"train_loss": -36.6668701171875, "global_step": 205531, "epoch": 1698} {"train_loss": -39.47153091430664, "global_step": 205532, "epoch": 1698} {"train_loss": -39.6951789855957, "global_step": 205533, "epoch": 1698} {"train_loss": -40.02954864501953, "global_step": 205534, "epoch": 1698} {"train_loss": -38.48895263671875, "global_step": 205535, "epoch": 1698} {"train_loss": -39.70045852661133, "global_step": 205536, "epoch": 1698} {"train_loss": -39.6208610534668, "global_step": 205537, "epoch": 1698} {"train_loss": -39.20606994628906, "global_step": 205538, "epoch": 1698} {"train_loss": -40.46497344970703, "global_step": 205539, "epoch": 1698} {"train_loss": -39.012935638427734, "global_step": 205540, "epoch": 1698} {"train_loss": -38.40183639526367, "global_step": 205541, "epoch": 1698} {"train_loss": -36.05129623413086, "global_step": 205542, "epoch": 1698} {"train_loss": -39.581451416015625, "global_step": 205543, "epoch": 1698} {"train_loss": -37.7801628112793, "global_step": 205544, "epoch": 1698} {"train_loss": -39.32503890991211, "global_step": 205545, "epoch": 1698} {"train_loss": -39.3992919921875, "global_step": 205546, "epoch": 1698} {"train_loss": -38.492042541503906, "global_step": 205547, "epoch": 1698} {"train_loss": -40.513729095458984, "global_step": 205548, "epoch": 1698} {"train_loss": -40.30894470214844, "global_step": 205549, "epoch": 1698} {"train_loss": -39.08170700073242, "global_step": 205550, "epoch": 1698} {"train_loss": -39.949153900146484, "global_step": 205551, "epoch": 1698} {"train_loss": -40.42779541015625, "global_step": 205552, "epoch": 1698} {"train_loss": -40.0091552734375, "global_step": 205553, "epoch": 1698} {"train_loss": -40.472984313964844, "global_step": 205554, "epoch": 1698} {"train_loss": -40.60920715332031, "global_step": 205555, "epoch": 1698} {"train_loss": -40.3673210144043, "global_step": 205556, "epoch": 1698} {"train_loss": -40.23308181762695, "global_step": 205557, "epoch": 1698} {"train_loss": -38.912574768066406, "global_step": 205558, "epoch": 1698} {"train_loss": -40.72854995727539, "global_step": 205559, "epoch": 1698} {"train_loss": -40.956092834472656, "global_step": 205560, "epoch": 1698} {"train_loss": -40.33857727050781, "global_step": 205561, "epoch": 1698} {"train_loss": -40.618682861328125, "global_step": 205562, "epoch": 1698} {"train_loss": -41.18457794189453, "global_step": 205563, "epoch": 1698} {"train_loss": -39.96522521972656, "global_step": 205564, "epoch": 1698} {"train_loss": -37.81638717651367, "global_step": 205565, "epoch": 1698} {"train_loss": -38.26369857788086, "global_step": 205566, "epoch": 1698} {"train_loss": -39.44612503051758, "global_step": 205567, "epoch": 1698} {"train_loss": -41.0273551940918, "global_step": 205568, "epoch": 1698} {"train_loss": -40.10090255737305, "global_step": 205569, "epoch": 1698} {"train_loss": -39.73649215698242, "global_step": 205570, "epoch": 1698} {"train_loss": -40.076873779296875, "global_step": 205571, "epoch": 1698} {"train_loss": -38.542816162109375, "global_step": 205572, "epoch": 1698} {"train_loss": -39.66618347167969, "global_step": 205573, "epoch": 1698} {"train_loss": -40.3270149230957, "global_step": 205574, "epoch": 1698} {"train_loss": -36.293914794921875, "global_step": 205575, "epoch": 1698} {"train_loss": -39.078033447265625, "global_step": 205576, "epoch": 1698} {"train_loss": -40.879608154296875, "global_step": 205577, "epoch": 1698} {"train_loss": -39.47003810661884, "global_step": 205578, "epoch": 1698, "val_loss": 2646659.25} {"train_loss": -40.685752868652344, "global_step": 205579, "epoch": 1699} {"train_loss": -40.40130615234375, "global_step": 205580, "epoch": 1699} {"train_loss": -39.60551071166992, "global_step": 205581, "epoch": 1699} {"train_loss": -38.74580001831055, "global_step": 205582, "epoch": 1699} {"train_loss": -40.83768844604492, "global_step": 205583, "epoch": 1699} {"train_loss": -41.460018157958984, "global_step": 205584, "epoch": 1699} {"train_loss": -36.85988998413086, "global_step": 205585, "epoch": 1699} {"train_loss": -39.98820114135742, "global_step": 205586, "epoch": 1699} {"train_loss": -37.910213470458984, "global_step": 205587, "epoch": 1699} {"train_loss": -39.785152435302734, "global_step": 205588, "epoch": 1699} {"train_loss": -39.453617095947266, "global_step": 205589, "epoch": 1699} {"train_loss": -41.181121826171875, "global_step": 205590, "epoch": 1699} {"train_loss": -40.09906005859375, "global_step": 205591, "epoch": 1699} {"train_loss": -39.67724609375, "global_step": 205592, "epoch": 1699} {"train_loss": -40.785430908203125, "global_step": 205593, "epoch": 1699} {"train_loss": -40.653934478759766, "global_step": 205594, "epoch": 1699} {"train_loss": -40.716983795166016, "global_step": 205595, "epoch": 1699} {"train_loss": -40.50950241088867, "global_step": 205596, "epoch": 1699} {"train_loss": -40.357479095458984, "global_step": 205597, "epoch": 1699} {"train_loss": -40.43144607543945, "global_step": 205598, "epoch": 1699} {"train_loss": -38.8616943359375, "global_step": 205599, "epoch": 1699} {"train_loss": -40.419857025146484, "global_step": 205600, "epoch": 1699} {"train_loss": -39.69675827026367, "global_step": 205601, "epoch": 1699} {"train_loss": -39.91646957397461, "global_step": 205602, "epoch": 1699} {"train_loss": -39.1135368347168, "global_step": 205603, "epoch": 1699} {"train_loss": -40.93407440185547, "global_step": 205604, "epoch": 1699} {"train_loss": -41.38936233520508, "global_step": 205605, "epoch": 1699} {"train_loss": -40.51234817504883, "global_step": 205606, "epoch": 1699} {"train_loss": -39.65444564819336, "global_step": 205607, "epoch": 1699} {"train_loss": -40.02991485595703, "global_step": 205608, "epoch": 1699} {"train_loss": -39.87860870361328, "global_step": 205609, "epoch": 1699} {"train_loss": -33.86517333984375, "global_step": 205610, "epoch": 1699} {"train_loss": -40.32807159423828, "global_step": 205611, "epoch": 1699} {"train_loss": -40.559295654296875, "global_step": 205612, "epoch": 1699} {"train_loss": -40.14361572265625, "global_step": 205613, "epoch": 1699} {"train_loss": -40.3405876159668, "global_step": 205614, "epoch": 1699} {"train_loss": -39.584224700927734, "global_step": 205615, "epoch": 1699} {"train_loss": -40.51860046386719, "global_step": 205616, "epoch": 1699} {"train_loss": -40.818077087402344, "global_step": 205617, "epoch": 1699} {"train_loss": -33.3427848815918, "global_step": 205618, "epoch": 1699} {"train_loss": -39.987789154052734, "global_step": 205619, "epoch": 1699} {"train_loss": -38.96562957763672, "global_step": 205620, "epoch": 1699} {"train_loss": -40.9361686706543, "global_step": 205621, "epoch": 1699} {"train_loss": -41.425018310546875, "global_step": 205622, "epoch": 1699} {"train_loss": -39.841617584228516, "global_step": 205623, "epoch": 1699} {"train_loss": -39.52962112426758, "global_step": 205624, "epoch": 1699} {"train_loss": -39.83137893676758, "global_step": 205625, "epoch": 1699} {"train_loss": -40.40885543823242, "global_step": 205626, "epoch": 1699} {"train_loss": -33.333274841308594, "global_step": 205627, "epoch": 1699} {"train_loss": -39.23237991333008, "global_step": 205628, "epoch": 1699} {"train_loss": -40.028289794921875, "global_step": 205629, "epoch": 1699} {"train_loss": -40.55819320678711, "global_step": 205630, "epoch": 1699} {"train_loss": -40.118587493896484, "global_step": 205631, "epoch": 1699} {"train_loss": -39.28098678588867, "global_step": 205632, "epoch": 1699} {"train_loss": -36.23649215698242, "global_step": 205633, "epoch": 1699} {"train_loss": -39.996646881103516, "global_step": 205634, "epoch": 1699} {"train_loss": -38.062171936035156, "global_step": 205635, "epoch": 1699} {"train_loss": -37.634918212890625, "global_step": 205636, "epoch": 1699} {"train_loss": -40.51548385620117, "global_step": 205637, "epoch": 1699} {"train_loss": -39.9178352355957, "global_step": 205638, "epoch": 1699} {"train_loss": -40.243072509765625, "global_step": 205639, "epoch": 1699} {"train_loss": -37.26380920410156, "global_step": 205640, "epoch": 1699} {"train_loss": -38.24610137939453, "global_step": 205641, "epoch": 1699} {"train_loss": -40.650203704833984, "global_step": 205642, "epoch": 1699} {"train_loss": -37.235904693603516, "global_step": 205643, "epoch": 1699} {"train_loss": -31.308990478515625, "global_step": 205644, "epoch": 1699} {"train_loss": -34.29899978637695, "global_step": 205645, "epoch": 1699} {"train_loss": -37.899879455566406, "global_step": 205646, "epoch": 1699} {"train_loss": -38.797760009765625, "global_step": 205647, "epoch": 1699} {"train_loss": -37.89208984375, "global_step": 205648, "epoch": 1699} {"train_loss": -36.7022590637207, "global_step": 205649, "epoch": 1699} {"train_loss": -34.699501037597656, "global_step": 205650, "epoch": 1699} {"train_loss": -39.120750427246094, "global_step": 205651, "epoch": 1699} {"train_loss": -37.21397399902344, "global_step": 205652, "epoch": 1699} {"train_loss": -40.654415130615234, "global_step": 205653, "epoch": 1699} {"train_loss": -38.40445327758789, "global_step": 205654, "epoch": 1699} {"train_loss": -38.96152877807617, "global_step": 205655, "epoch": 1699} {"train_loss": -38.6153564453125, "global_step": 205656, "epoch": 1699} {"train_loss": -35.93473434448242, "global_step": 205657, "epoch": 1699} {"train_loss": -38.7686767578125, "global_step": 205658, "epoch": 1699} {"train_loss": -38.86449432373047, "global_step": 205659, "epoch": 1699} {"train_loss": -39.599853515625, "global_step": 205660, "epoch": 1699} {"train_loss": -39.772064208984375, "global_step": 205661, "epoch": 1699} {"train_loss": -39.298988342285156, "global_step": 205662, "epoch": 1699} {"train_loss": -39.58075714111328, "global_step": 205663, "epoch": 1699} {"train_loss": -37.674129486083984, "global_step": 205664, "epoch": 1699} {"train_loss": -39.965553283691406, "global_step": 205665, "epoch": 1699} {"train_loss": -39.790287017822266, "global_step": 205666, "epoch": 1699} {"train_loss": -38.38379669189453, "global_step": 205667, "epoch": 1699} {"train_loss": -36.08159255981445, "global_step": 205668, "epoch": 1699} {"train_loss": -39.804962158203125, "global_step": 205669, "epoch": 1699} {"train_loss": -36.92136764526367, "global_step": 205670, "epoch": 1699} {"train_loss": -38.71811294555664, "global_step": 205671, "epoch": 1699} {"train_loss": -39.112281799316406, "global_step": 205672, "epoch": 1699} {"train_loss": -39.53188705444336, "global_step": 205673, "epoch": 1699} {"train_loss": -38.90563201904297, "global_step": 205674, "epoch": 1699} {"train_loss": -37.75352096557617, "global_step": 205675, "epoch": 1699} {"train_loss": -39.0439453125, "global_step": 205676, "epoch": 1699} {"train_loss": -39.70560073852539, "global_step": 205677, "epoch": 1699} {"train_loss": -39.612205505371094, "global_step": 205678, "epoch": 1699} {"train_loss": -39.469417572021484, "global_step": 205679, "epoch": 1699} {"train_loss": -37.63033676147461, "global_step": 205680, "epoch": 1699} {"train_loss": -40.163265228271484, "global_step": 205681, "epoch": 1699} {"train_loss": -38.975093841552734, "global_step": 205682, "epoch": 1699} {"train_loss": -40.24799728393555, "global_step": 205683, "epoch": 1699} {"train_loss": -39.774532318115234, "global_step": 205684, "epoch": 1699} {"train_loss": -39.76323318481445, "global_step": 205685, "epoch": 1699} {"train_loss": -39.89740753173828, "global_step": 205686, "epoch": 1699} {"train_loss": -39.43109130859375, "global_step": 205687, "epoch": 1699} {"train_loss": -36.52952194213867, "global_step": 205688, "epoch": 1699} {"train_loss": -39.8453254699707, "global_step": 205689, "epoch": 1699} {"train_loss": -39.17341232299805, "global_step": 205690, "epoch": 1699} {"train_loss": -40.612606048583984, "global_step": 205691, "epoch": 1699} {"train_loss": -39.16320037841797, "global_step": 205692, "epoch": 1699} {"train_loss": -38.05228805541992, "global_step": 205693, "epoch": 1699} {"train_loss": -40.964599609375, "global_step": 205694, "epoch": 1699} {"train_loss": -38.104331970214844, "global_step": 205695, "epoch": 1699} {"train_loss": -40.125152587890625, "global_step": 205696, "epoch": 1699} {"train_loss": -39.97369384765625, "global_step": 205697, "epoch": 1699} {"train_loss": -39.86441421508789, "global_step": 205698, "epoch": 1699} {"train_loss": -39.127096475648486, "global_step": 205699, "epoch": 1699, "val_loss": 2578595.25} {"train_loss": -39.774532318115234, "global_step": 205700, "epoch": 1700} {"train_loss": -40.19107437133789, "global_step": 205701, "epoch": 1700} {"train_loss": -40.345245361328125, "global_step": 205702, "epoch": 1700} {"train_loss": -40.36919021606445, "global_step": 205703, "epoch": 1700} {"train_loss": -40.23884582519531, "global_step": 205704, "epoch": 1700} {"train_loss": -39.500667572021484, "global_step": 205705, "epoch": 1700} {"train_loss": -40.84476852416992, "global_step": 205706, "epoch": 1700} {"train_loss": -40.09489059448242, "global_step": 205707, "epoch": 1700} {"train_loss": -39.533447265625, "global_step": 205708, "epoch": 1700} {"train_loss": -40.2873649597168, "global_step": 205709, "epoch": 1700} {"train_loss": -40.59833908081055, "global_step": 205710, "epoch": 1700} {"train_loss": -40.69062423706055, "global_step": 205711, "epoch": 1700} {"train_loss": -37.597869873046875, "global_step": 205712, "epoch": 1700} {"train_loss": -39.70994567871094, "global_step": 205713, "epoch": 1700} {"train_loss": -40.512603759765625, "global_step": 205714, "epoch": 1700} {"train_loss": -39.75824737548828, "global_step": 205715, "epoch": 1700} {"train_loss": -39.39590072631836, "global_step": 205716, "epoch": 1700} {"train_loss": -40.82979965209961, "global_step": 205717, "epoch": 1700} {"train_loss": -40.76845932006836, "global_step": 205718, "epoch": 1700} {"train_loss": -40.439735412597656, "global_step": 205719, "epoch": 1700} {"train_loss": -39.870208740234375, "global_step": 205720, "epoch": 1700} {"train_loss": -38.30707931518555, "global_step": 205721, "epoch": 1700} {"train_loss": -39.566505432128906, "global_step": 205722, "epoch": 1700} {"train_loss": -40.58565139770508, "global_step": 205723, "epoch": 1700} {"train_loss": -40.31754684448242, "global_step": 205724, "epoch": 1700} {"train_loss": -39.498043060302734, "global_step": 205725, "epoch": 1700} {"train_loss": -39.86785125732422, "global_step": 205726, "epoch": 1700} {"train_loss": -40.980709075927734, "global_step": 205727, "epoch": 1700} {"train_loss": -39.79819107055664, "global_step": 205728, "epoch": 1700} {"train_loss": -40.3841667175293, "global_step": 205729, "epoch": 1700} {"train_loss": -41.216243743896484, "global_step": 205730, "epoch": 1700} {"train_loss": -41.11550521850586, "global_step": 205731, "epoch": 1700} {"train_loss": -40.31374740600586, "global_step": 205732, "epoch": 1700} {"train_loss": -40.3154411315918, "global_step": 205733, "epoch": 1700} {"train_loss": -40.564571380615234, "global_step": 205734, "epoch": 1700} {"train_loss": -40.871795654296875, "global_step": 205735, "epoch": 1700} {"train_loss": -39.50120162963867, "global_step": 205736, "epoch": 1700} {"train_loss": -41.19745635986328, "global_step": 205737, "epoch": 1700} {"train_loss": -41.21751022338867, "global_step": 205738, "epoch": 1700} {"train_loss": -40.390480041503906, "global_step": 205739, "epoch": 1700} {"train_loss": -40.097103118896484, "global_step": 205740, "epoch": 1700} {"train_loss": -40.0689582824707, "global_step": 205741, "epoch": 1700} {"train_loss": -40.412105560302734, "global_step": 205742, "epoch": 1700} {"train_loss": -41.292659759521484, "global_step": 205743, "epoch": 1700} {"train_loss": -41.02687454223633, "global_step": 205744, "epoch": 1700} {"train_loss": -40.41779327392578, "global_step": 205745, "epoch": 1700} {"train_loss": -40.81005859375, "global_step": 205746, "epoch": 1700} {"train_loss": -39.0352783203125, "global_step": 205747, "epoch": 1700} {"train_loss": -41.516746520996094, "global_step": 205748, "epoch": 1700} {"train_loss": -41.18764877319336, "global_step": 205749, "epoch": 1700} {"train_loss": -41.55470275878906, "global_step": 205750, "epoch": 1700} {"train_loss": -40.353668212890625, "global_step": 205751, "epoch": 1700} {"train_loss": -40.23322677612305, "global_step": 205752, "epoch": 1700} {"train_loss": -39.8951301574707, "global_step": 205753, "epoch": 1700} {"train_loss": -39.47565460205078, "global_step": 205754, "epoch": 1700} {"train_loss": -39.847503662109375, "global_step": 205755, "epoch": 1700} {"train_loss": -37.34208297729492, "global_step": 205756, "epoch": 1700} {"train_loss": -30.824140548706055, "global_step": 205757, "epoch": 1700} {"train_loss": -24.100244522094727, "global_step": 205758, "epoch": 1700} {"train_loss": -24.147062301635742, "global_step": 205759, "epoch": 1700} {"train_loss": -33.58156204223633, "global_step": 205760, "epoch": 1700} {"train_loss": -38.6583137512207, "global_step": 205761, "epoch": 1700} {"train_loss": -33.0681266784668, "global_step": 205762, "epoch": 1700} {"train_loss": -39.49993133544922, "global_step": 205763, "epoch": 1700} {"train_loss": -34.545257568359375, "global_step": 205764, "epoch": 1700} {"train_loss": -38.68192672729492, "global_step": 205765, "epoch": 1700} {"train_loss": -37.52350997924805, "global_step": 205766, "epoch": 1700} {"train_loss": -38.82558822631836, "global_step": 205767, "epoch": 1700} {"train_loss": -38.427547454833984, "global_step": 205768, "epoch": 1700} {"train_loss": -38.83323287963867, "global_step": 205769, "epoch": 1700} {"train_loss": -38.19255828857422, "global_step": 205770, "epoch": 1700} {"train_loss": -39.99721145629883, "global_step": 205771, "epoch": 1700} {"train_loss": -39.02557373046875, "global_step": 205772, "epoch": 1700} {"train_loss": -40.67239761352539, "global_step": 205773, "epoch": 1700} {"train_loss": -38.773582458496094, "global_step": 205774, "epoch": 1700} {"train_loss": -40.7410774230957, "global_step": 205775, "epoch": 1700} {"train_loss": -40.2108039855957, "global_step": 205776, "epoch": 1700} {"train_loss": -39.73304748535156, "global_step": 205777, "epoch": 1700} {"train_loss": -39.53790283203125, "global_step": 205778, "epoch": 1700} {"train_loss": -39.79207992553711, "global_step": 205779, "epoch": 1700} {"train_loss": -40.2041130065918, "global_step": 205780, "epoch": 1700} {"train_loss": -40.241668701171875, "global_step": 205781, "epoch": 1700} {"train_loss": -39.805545806884766, "global_step": 205782, "epoch": 1700} {"train_loss": -40.86460876464844, "global_step": 205783, "epoch": 1700} {"train_loss": -40.36043930053711, "global_step": 205784, "epoch": 1700} {"train_loss": -39.92120361328125, "global_step": 205785, "epoch": 1700} {"train_loss": -40.3222541809082, "global_step": 205786, "epoch": 1700} {"train_loss": -40.723873138427734, "global_step": 205787, "epoch": 1700} {"train_loss": -40.9607048034668, "global_step": 205788, "epoch": 1700} {"train_loss": -40.17661666870117, "global_step": 205789, "epoch": 1700} {"train_loss": -40.79787826538086, "global_step": 205790, "epoch": 1700} {"train_loss": -41.246192932128906, "global_step": 205791, "epoch": 1700} {"train_loss": -40.40815353393555, "global_step": 205792, "epoch": 1700} {"train_loss": -41.0433349609375, "global_step": 205793, "epoch": 1700} {"train_loss": -40.8189811706543, "global_step": 205794, "epoch": 1700} {"train_loss": -40.491127014160156, "global_step": 205795, "epoch": 1700} {"train_loss": -41.90483856201172, "global_step": 205796, "epoch": 1700} {"train_loss": -40.66646194458008, "global_step": 205797, "epoch": 1700} {"train_loss": -41.03507614135742, "global_step": 205798, "epoch": 1700} {"train_loss": -41.057586669921875, "global_step": 205799, "epoch": 1700} {"train_loss": -41.544166564941406, "global_step": 205800, "epoch": 1700} {"train_loss": -40.70560836791992, "global_step": 205801, "epoch": 1700} {"train_loss": -40.82192611694336, "global_step": 205802, "epoch": 1700} {"train_loss": -41.025882720947266, "global_step": 205803, "epoch": 1700} {"train_loss": -41.387813568115234, "global_step": 205804, "epoch": 1700} {"train_loss": -41.34177780151367, "global_step": 205805, "epoch": 1700} {"train_loss": -41.4685173034668, "global_step": 205806, "epoch": 1700} {"train_loss": -41.561500549316406, "global_step": 205807, "epoch": 1700} {"train_loss": -41.230159759521484, "global_step": 205808, "epoch": 1700} {"train_loss": -40.79644775390625, "global_step": 205809, "epoch": 1700} {"train_loss": -41.487972259521484, "global_step": 205810, "epoch": 1700} {"train_loss": -40.78956985473633, "global_step": 205811, "epoch": 1700} {"train_loss": -41.274559020996094, "global_step": 205812, "epoch": 1700} {"train_loss": -41.18288803100586, "global_step": 205813, "epoch": 1700} {"train_loss": -40.48398971557617, "global_step": 205814, "epoch": 1700} {"train_loss": -41.68934631347656, "global_step": 205815, "epoch": 1700} {"train_loss": -41.65024948120117, "global_step": 205816, "epoch": 1700} {"train_loss": -41.542747497558594, "global_step": 205817, "epoch": 1700} {"train_loss": -41.605224609375, "global_step": 205818, "epoch": 1700} {"train_loss": -41.65333938598633, "global_step": 205819, "epoch": 1700} {"train_loss": -39.828748072474454, "global_step": 205820, "epoch": 1700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 2501527.75} {"train_loss": -41.34846115112305, "global_step": 205821, "epoch": 1701} {"train_loss": -41.45668411254883, "global_step": 205822, "epoch": 1701} {"train_loss": -42.04851150512695, "global_step": 205823, "epoch": 1701} {"train_loss": -41.025386810302734, "global_step": 205824, "epoch": 1701} {"train_loss": -41.126953125, "global_step": 205825, "epoch": 1701} {"train_loss": -41.18422317504883, "global_step": 205826, "epoch": 1701} {"train_loss": -40.41292953491211, "global_step": 205827, "epoch": 1701} {"train_loss": -40.45234298706055, "global_step": 205828, "epoch": 1701} {"train_loss": -39.69412612915039, "global_step": 205829, "epoch": 1701} {"train_loss": -40.85773468017578, "global_step": 205830, "epoch": 1701} {"train_loss": -41.34609603881836, "global_step": 205831, "epoch": 1701} {"train_loss": -41.176631927490234, "global_step": 205832, "epoch": 1701} {"train_loss": -39.75899124145508, "global_step": 205833, "epoch": 1701} {"train_loss": -37.02042007446289, "global_step": 205834, "epoch": 1701} {"train_loss": -37.142250061035156, "global_step": 205835, "epoch": 1701} {"train_loss": -41.46133041381836, "global_step": 205836, "epoch": 1701} {"train_loss": -41.13633346557617, "global_step": 205837, "epoch": 1701} {"train_loss": -38.464412689208984, "global_step": 205838, "epoch": 1701} {"train_loss": -39.03129196166992, "global_step": 205839, "epoch": 1701} {"train_loss": -40.89706039428711, "global_step": 205840, "epoch": 1701} {"train_loss": -39.97108840942383, "global_step": 205841, "epoch": 1701} {"train_loss": -39.569435119628906, "global_step": 205842, "epoch": 1701} {"train_loss": -41.795745849609375, "global_step": 205843, "epoch": 1701} {"train_loss": -40.02873992919922, "global_step": 205844, "epoch": 1701} {"train_loss": -40.69953155517578, "global_step": 205845, "epoch": 1701} {"train_loss": -41.5540771484375, "global_step": 205846, "epoch": 1701} {"train_loss": -40.29872512817383, "global_step": 205847, "epoch": 1701} {"train_loss": -41.255096435546875, "global_step": 205848, "epoch": 1701} {"train_loss": -41.0065803527832, "global_step": 205849, "epoch": 1701} {"train_loss": -39.738155364990234, "global_step": 205850, "epoch": 1701} {"train_loss": -40.758296966552734, "global_step": 205851, "epoch": 1701} {"train_loss": -40.641231536865234, "global_step": 205852, "epoch": 1701} {"train_loss": -40.291500091552734, "global_step": 205853, "epoch": 1701} {"train_loss": -40.85462951660156, "global_step": 205854, "epoch": 1701} {"train_loss": -40.67058181762695, "global_step": 205855, "epoch": 1701} {"train_loss": -39.891632080078125, "global_step": 205856, "epoch": 1701} {"train_loss": -39.33073425292969, "global_step": 205857, "epoch": 1701} {"train_loss": -40.9143180847168, "global_step": 205858, "epoch": 1701} {"train_loss": -40.474361419677734, "global_step": 205859, "epoch": 1701} {"train_loss": -39.99943923950195, "global_step": 205860, "epoch": 1701} {"train_loss": -40.03916549682617, "global_step": 205861, "epoch": 1701} {"train_loss": -41.55622863769531, "global_step": 205862, "epoch": 1701} {"train_loss": -39.464378356933594, "global_step": 205863, "epoch": 1701} {"train_loss": -41.66838836669922, "global_step": 205864, "epoch": 1701} {"train_loss": -41.08575439453125, "global_step": 205865, "epoch": 1701} {"train_loss": -42.10215377807617, "global_step": 205866, "epoch": 1701} {"train_loss": -41.19454574584961, "global_step": 205867, "epoch": 1701} {"train_loss": -41.2116584777832, "global_step": 205868, "epoch": 1701} {"train_loss": -40.965065002441406, "global_step": 205869, "epoch": 1701} {"train_loss": -41.5537223815918, "global_step": 205870, "epoch": 1701} {"train_loss": -41.23130416870117, "global_step": 205871, "epoch": 1701} {"train_loss": -41.3425178527832, "global_step": 205872, "epoch": 1701} {"train_loss": -40.22761154174805, "global_step": 205873, "epoch": 1701} {"train_loss": -40.87899398803711, "global_step": 205874, "epoch": 1701} {"train_loss": -40.426082611083984, "global_step": 205875, "epoch": 1701} {"train_loss": -40.32133102416992, "global_step": 205876, "epoch": 1701} {"train_loss": -40.95711898803711, "global_step": 205877, "epoch": 1701} {"train_loss": -40.62955093383789, "global_step": 205878, "epoch": 1701} {"train_loss": -41.38977813720703, "global_step": 205879, "epoch": 1701} {"train_loss": -41.284889221191406, "global_step": 205880, "epoch": 1701} {"train_loss": -40.5319938659668, "global_step": 205881, "epoch": 1701} {"train_loss": -41.07877731323242, "global_step": 205882, "epoch": 1701} {"train_loss": -39.442481994628906, "global_step": 205883, "epoch": 1701} {"train_loss": -41.66420364379883, "global_step": 205884, "epoch": 1701} {"train_loss": -40.85826110839844, "global_step": 205885, "epoch": 1701} {"train_loss": -40.54523849487305, "global_step": 205886, "epoch": 1701} {"train_loss": -40.012630462646484, "global_step": 205887, "epoch": 1701} {"train_loss": -40.61432647705078, "global_step": 205888, "epoch": 1701} {"train_loss": -41.1968879699707, "global_step": 205889, "epoch": 1701} {"train_loss": -40.9489631652832, "global_step": 205890, "epoch": 1701} {"train_loss": -41.37343978881836, "global_step": 205891, "epoch": 1701} {"train_loss": -40.03749465942383, "global_step": 205892, "epoch": 1701} {"train_loss": -39.23944854736328, "global_step": 205893, "epoch": 1701} {"train_loss": -40.79042434692383, "global_step": 205894, "epoch": 1701} {"train_loss": -41.4444580078125, "global_step": 205895, "epoch": 1701} {"train_loss": -39.68259811401367, "global_step": 205896, "epoch": 1701} {"train_loss": -40.46298599243164, "global_step": 205897, "epoch": 1701} {"train_loss": -41.4501953125, "global_step": 205898, "epoch": 1701} {"train_loss": -41.12378692626953, "global_step": 205899, "epoch": 1701} {"train_loss": -41.0280876159668, "global_step": 205900, "epoch": 1701} {"train_loss": -41.24518966674805, "global_step": 205901, "epoch": 1701} {"train_loss": -40.608497619628906, "global_step": 205902, "epoch": 1701} {"train_loss": -41.18996810913086, "global_step": 205903, "epoch": 1701} {"train_loss": -41.127899169921875, "global_step": 205904, "epoch": 1701} {"train_loss": -41.41706085205078, "global_step": 205905, "epoch": 1701} {"train_loss": -41.18331527709961, "global_step": 205906, "epoch": 1701} {"train_loss": -41.55093002319336, "global_step": 205907, "epoch": 1701} {"train_loss": -40.43600845336914, "global_step": 205908, "epoch": 1701} {"train_loss": -41.24351501464844, "global_step": 205909, "epoch": 1701} {"train_loss": -41.63697052001953, "global_step": 205910, "epoch": 1701} {"train_loss": -40.75108337402344, "global_step": 205911, "epoch": 1701} {"train_loss": -41.24980545043945, "global_step": 205912, "epoch": 1701} {"train_loss": -42.05279541015625, "global_step": 205913, "epoch": 1701} {"train_loss": -41.48075485229492, "global_step": 205914, "epoch": 1701} {"train_loss": -41.50017166137695, "global_step": 205915, "epoch": 1701} {"train_loss": -41.41780471801758, "global_step": 205916, "epoch": 1701} {"train_loss": -41.5693359375, "global_step": 205917, "epoch": 1701} {"train_loss": -40.69915771484375, "global_step": 205918, "epoch": 1701} {"train_loss": -40.60026168823242, "global_step": 205919, "epoch": 1701} {"train_loss": -41.20783233642578, "global_step": 205920, "epoch": 1701} {"train_loss": -41.52675247192383, "global_step": 205921, "epoch": 1701} {"train_loss": -41.84894943237305, "global_step": 205922, "epoch": 1701} {"train_loss": -41.311424255371094, "global_step": 205923, "epoch": 1701} {"train_loss": -40.8448371887207, "global_step": 205924, "epoch": 1701} {"train_loss": -41.622432708740234, "global_step": 205925, "epoch": 1701} {"train_loss": -41.349544525146484, "global_step": 205926, "epoch": 1701} {"train_loss": -41.703060150146484, "global_step": 205927, "epoch": 1701} {"train_loss": -41.76776885986328, "global_step": 205928, "epoch": 1701} {"train_loss": -42.06532669067383, "global_step": 205929, "epoch": 1701} {"train_loss": -41.518829345703125, "global_step": 205930, "epoch": 1701} {"train_loss": -41.546871185302734, "global_step": 205931, "epoch": 1701} {"train_loss": -41.84480667114258, "global_step": 205932, "epoch": 1701} {"train_loss": -41.642478942871094, "global_step": 205933, "epoch": 1701} {"train_loss": -41.349037170410156, "global_step": 205934, "epoch": 1701} {"train_loss": -41.19377517700195, "global_step": 205935, "epoch": 1701} {"train_loss": -42.083282470703125, "global_step": 205936, "epoch": 1701} {"train_loss": -42.34756088256836, "global_step": 205937, "epoch": 1701} {"train_loss": -39.12301254272461, "global_step": 205938, "epoch": 1701} {"train_loss": -41.62971115112305, "global_step": 205939, "epoch": 1701} {"train_loss": -41.8108024597168, "global_step": 205940, "epoch": 1701} {"train_loss": -40.87175700290144, "global_step": 205941, "epoch": 1701, "val_loss": 2494281.25} {"train_loss": -41.1840934753418, "global_step": 205942, "epoch": 1702} {"train_loss": -40.54591751098633, "global_step": 205943, "epoch": 1702} {"train_loss": -39.018707275390625, "global_step": 205944, "epoch": 1702} {"train_loss": -42.3604621887207, "global_step": 205945, "epoch": 1702} {"train_loss": -42.04972839355469, "global_step": 205946, "epoch": 1702} {"train_loss": -41.10540771484375, "global_step": 205947, "epoch": 1702} {"train_loss": -32.80167007446289, "global_step": 205948, "epoch": 1702} {"train_loss": -41.604400634765625, "global_step": 205949, "epoch": 1702} {"train_loss": -40.76007843017578, "global_step": 205950, "epoch": 1702} {"train_loss": -39.507835388183594, "global_step": 205951, "epoch": 1702} {"train_loss": -39.66652297973633, "global_step": 205952, "epoch": 1702} {"train_loss": -35.9693717956543, "global_step": 205953, "epoch": 1702} {"train_loss": -38.44144821166992, "global_step": 205954, "epoch": 1702} {"train_loss": -39.17121505737305, "global_step": 205955, "epoch": 1702} {"train_loss": -37.9232063293457, "global_step": 205956, "epoch": 1702} {"train_loss": -39.42121124267578, "global_step": 205957, "epoch": 1702} {"train_loss": -34.5189094543457, "global_step": 205958, "epoch": 1702} {"train_loss": -37.11345291137695, "global_step": 205959, "epoch": 1702} {"train_loss": -36.850982666015625, "global_step": 205960, "epoch": 1702} {"train_loss": -35.88761520385742, "global_step": 205961, "epoch": 1702} {"train_loss": -34.71906661987305, "global_step": 205962, "epoch": 1702} {"train_loss": -39.43880081176758, "global_step": 205963, "epoch": 1702} {"train_loss": -38.792476654052734, "global_step": 205964, "epoch": 1702} {"train_loss": -38.23784255981445, "global_step": 205965, "epoch": 1702} {"train_loss": -37.333343505859375, "global_step": 205966, "epoch": 1702} {"train_loss": -38.533851623535156, "global_step": 205967, "epoch": 1702} {"train_loss": -38.23413848876953, "global_step": 205968, "epoch": 1702} {"train_loss": -37.477779388427734, "global_step": 205969, "epoch": 1702} {"train_loss": -40.000396728515625, "global_step": 205970, "epoch": 1702} {"train_loss": -34.908233642578125, "global_step": 205971, "epoch": 1702} {"train_loss": -39.221771240234375, "global_step": 205972, "epoch": 1702} {"train_loss": -39.09537124633789, "global_step": 205973, "epoch": 1702} {"train_loss": -38.02260971069336, "global_step": 205974, "epoch": 1702} {"train_loss": -38.63750076293945, "global_step": 205975, "epoch": 1702} {"train_loss": -39.4920654296875, "global_step": 205976, "epoch": 1702} {"train_loss": -39.325897216796875, "global_step": 205977, "epoch": 1702} {"train_loss": -39.39933395385742, "global_step": 205978, "epoch": 1702} {"train_loss": -40.0282096862793, "global_step": 205979, "epoch": 1702} {"train_loss": -39.184532165527344, "global_step": 205980, "epoch": 1702} {"train_loss": -38.0687141418457, "global_step": 205981, "epoch": 1702} {"train_loss": -37.80537796020508, "global_step": 205982, "epoch": 1702} {"train_loss": -38.30021286010742, "global_step": 205983, "epoch": 1702} {"train_loss": -38.1744384765625, "global_step": 205984, "epoch": 1702} {"train_loss": -38.831298828125, "global_step": 205985, "epoch": 1702} {"train_loss": -39.395751953125, "global_step": 205986, "epoch": 1702} {"train_loss": -39.99332809448242, "global_step": 205987, "epoch": 1702} {"train_loss": -36.871437072753906, "global_step": 205988, "epoch": 1702} {"train_loss": -39.096622467041016, "global_step": 205989, "epoch": 1702} {"train_loss": -39.626888275146484, "global_step": 205990, "epoch": 1702} {"train_loss": -38.78289794921875, "global_step": 205991, "epoch": 1702} {"train_loss": -38.24737548828125, "global_step": 205992, "epoch": 1702} {"train_loss": -38.53300857543945, "global_step": 205993, "epoch": 1702} {"train_loss": -39.190284729003906, "global_step": 205994, "epoch": 1702} {"train_loss": -39.49893569946289, "global_step": 205995, "epoch": 1702} {"train_loss": -39.921241760253906, "global_step": 205996, "epoch": 1702} {"train_loss": -38.798065185546875, "global_step": 205997, "epoch": 1702} {"train_loss": -38.37950134277344, "global_step": 205998, "epoch": 1702} {"train_loss": -38.74542999267578, "global_step": 205999, "epoch": 1702} {"train_loss": -39.52842330932617, "global_step": 206000, "epoch": 1702} {"train_loss": -37.20073318481445, "global_step": 206001, "epoch": 1702} {"train_loss": -40.43302536010742, "global_step": 206002, "epoch": 1702} {"train_loss": -39.39543151855469, "global_step": 206003, "epoch": 1702} {"train_loss": -40.34882354736328, "global_step": 206004, "epoch": 1702} {"train_loss": -40.218292236328125, "global_step": 206005, "epoch": 1702} {"train_loss": -39.7043342590332, "global_step": 206006, "epoch": 1702} {"train_loss": -39.39289093017578, "global_step": 206007, "epoch": 1702} {"train_loss": -40.75155258178711, "global_step": 206008, "epoch": 1702} {"train_loss": -39.25434494018555, "global_step": 206009, "epoch": 1702} {"train_loss": -38.45548629760742, "global_step": 206010, "epoch": 1702} {"train_loss": -40.6479606628418, "global_step": 206011, "epoch": 1702} {"train_loss": -40.1468505859375, "global_step": 206012, "epoch": 1702} {"train_loss": -40.51148223876953, "global_step": 206013, "epoch": 1702} {"train_loss": -40.705596923828125, "global_step": 206014, "epoch": 1702} {"train_loss": -40.87059020996094, "global_step": 206015, "epoch": 1702} {"train_loss": -40.64087677001953, "global_step": 206016, "epoch": 1702} {"train_loss": -40.68579864501953, "global_step": 206017, "epoch": 1702} {"train_loss": -39.76351547241211, "global_step": 206018, "epoch": 1702} {"train_loss": -40.97768783569336, "global_step": 206019, "epoch": 1702} {"train_loss": -41.21445846557617, "global_step": 206020, "epoch": 1702} {"train_loss": -40.25848388671875, "global_step": 206021, "epoch": 1702} {"train_loss": -37.74982452392578, "global_step": 206022, "epoch": 1702} {"train_loss": -38.78892135620117, "global_step": 206023, "epoch": 1702} {"train_loss": -40.86619186401367, "global_step": 206024, "epoch": 1702} {"train_loss": -40.134979248046875, "global_step": 206025, "epoch": 1702} {"train_loss": -41.02590560913086, "global_step": 206026, "epoch": 1702} {"train_loss": -40.67965316772461, "global_step": 206027, "epoch": 1702} {"train_loss": -40.83636474609375, "global_step": 206028, "epoch": 1702} {"train_loss": -40.00216293334961, "global_step": 206029, "epoch": 1702} {"train_loss": -41.27274703979492, "global_step": 206030, "epoch": 1702} {"train_loss": -41.489524841308594, "global_step": 206031, "epoch": 1702} {"train_loss": -40.69015121459961, "global_step": 206032, "epoch": 1702} {"train_loss": -41.690277099609375, "global_step": 206033, "epoch": 1702} {"train_loss": -39.24116897583008, "global_step": 206034, "epoch": 1702} {"train_loss": -40.332035064697266, "global_step": 206035, "epoch": 1702} {"train_loss": -40.94450759887695, "global_step": 206036, "epoch": 1702} {"train_loss": -40.85280990600586, "global_step": 206037, "epoch": 1702} {"train_loss": -41.04281997680664, "global_step": 206038, "epoch": 1702} {"train_loss": -41.313209533691406, "global_step": 206039, "epoch": 1702} {"train_loss": -41.20779037475586, "global_step": 206040, "epoch": 1702} {"train_loss": -41.072444915771484, "global_step": 206041, "epoch": 1702} {"train_loss": -41.35792922973633, "global_step": 206042, "epoch": 1702} {"train_loss": -41.189430236816406, "global_step": 206043, "epoch": 1702} {"train_loss": -40.97128677368164, "global_step": 206044, "epoch": 1702} {"train_loss": -41.14609909057617, "global_step": 206045, "epoch": 1702} {"train_loss": -40.886165618896484, "global_step": 206046, "epoch": 1702} {"train_loss": -41.23550033569336, "global_step": 206047, "epoch": 1702} {"train_loss": -40.86436462402344, "global_step": 206048, "epoch": 1702} {"train_loss": -41.26190185546875, "global_step": 206049, "epoch": 1702} {"train_loss": -41.30643844604492, "global_step": 206050, "epoch": 1702} {"train_loss": -41.323211669921875, "global_step": 206051, "epoch": 1702} {"train_loss": -39.927520751953125, "global_step": 206052, "epoch": 1702} {"train_loss": -40.42048263549805, "global_step": 206053, "epoch": 1702} {"train_loss": -39.96497344970703, "global_step": 206054, "epoch": 1702} {"train_loss": -40.93585968017578, "global_step": 206055, "epoch": 1702} {"train_loss": -40.94784164428711, "global_step": 206056, "epoch": 1702} {"train_loss": -41.16859817504883, "global_step": 206057, "epoch": 1702} {"train_loss": -40.67079544067383, "global_step": 206058, "epoch": 1702} {"train_loss": -40.66242218017578, "global_step": 206059, "epoch": 1702} {"train_loss": -40.908966064453125, "global_step": 206060, "epoch": 1702} {"train_loss": -41.385738372802734, "global_step": 206061, "epoch": 1702} {"train_loss": -39.62200290900616, "global_step": 206062, "epoch": 1702, "val_loss": 2552196.25} {"train_loss": -40.6490592956543, "global_step": 206063, "epoch": 1703} {"train_loss": -40.692054748535156, "global_step": 206064, "epoch": 1703} {"train_loss": -39.090328216552734, "global_step": 206065, "epoch": 1703} {"train_loss": -39.394989013671875, "global_step": 206066, "epoch": 1703} {"train_loss": -39.28533935546875, "global_step": 206067, "epoch": 1703} {"train_loss": -39.38920974731445, "global_step": 206068, "epoch": 1703} {"train_loss": -38.355831146240234, "global_step": 206069, "epoch": 1703} {"train_loss": -40.62972640991211, "global_step": 206070, "epoch": 1703} {"train_loss": -41.67285919189453, "global_step": 206071, "epoch": 1703} {"train_loss": -39.97626876831055, "global_step": 206072, "epoch": 1703} {"train_loss": -40.29635238647461, "global_step": 206073, "epoch": 1703} {"train_loss": -40.758174896240234, "global_step": 206074, "epoch": 1703} {"train_loss": -38.76081848144531, "global_step": 206075, "epoch": 1703} {"train_loss": -39.45256423950195, "global_step": 206076, "epoch": 1703} {"train_loss": -40.91593933105469, "global_step": 206077, "epoch": 1703} {"train_loss": -39.8332633972168, "global_step": 206078, "epoch": 1703} {"train_loss": -39.78982162475586, "global_step": 206079, "epoch": 1703} {"train_loss": -39.89276885986328, "global_step": 206080, "epoch": 1703} {"train_loss": -40.932369232177734, "global_step": 206081, "epoch": 1703} {"train_loss": -40.14606475830078, "global_step": 206082, "epoch": 1703} {"train_loss": -41.80367660522461, "global_step": 206083, "epoch": 1703} {"train_loss": -41.53056716918945, "global_step": 206084, "epoch": 1703} {"train_loss": -39.969478607177734, "global_step": 206085, "epoch": 1703} {"train_loss": -41.10880661010742, "global_step": 206086, "epoch": 1703} {"train_loss": -41.025123596191406, "global_step": 206087, "epoch": 1703} {"train_loss": -40.24864196777344, "global_step": 206088, "epoch": 1703} {"train_loss": -41.33088684082031, "global_step": 206089, "epoch": 1703} {"train_loss": -40.25189208984375, "global_step": 206090, "epoch": 1703} {"train_loss": -41.36861801147461, "global_step": 206091, "epoch": 1703} {"train_loss": -40.94455337524414, "global_step": 206092, "epoch": 1703} {"train_loss": -41.28023147583008, "global_step": 206093, "epoch": 1703} {"train_loss": -41.468170166015625, "global_step": 206094, "epoch": 1703} {"train_loss": -41.07406234741211, "global_step": 206095, "epoch": 1703} {"train_loss": -41.26362609863281, "global_step": 206096, "epoch": 1703} {"train_loss": -41.52223587036133, "global_step": 206097, "epoch": 1703} {"train_loss": -41.48136520385742, "global_step": 206098, "epoch": 1703} {"train_loss": -41.20824432373047, "global_step": 206099, "epoch": 1703} {"train_loss": -41.80558395385742, "global_step": 206100, "epoch": 1703} {"train_loss": -40.12986373901367, "global_step": 206101, "epoch": 1703} {"train_loss": -41.91141891479492, "global_step": 206102, "epoch": 1703} {"train_loss": -41.188323974609375, "global_step": 206103, "epoch": 1703} {"train_loss": -40.2335319519043, "global_step": 206104, "epoch": 1703} {"train_loss": -41.222652435302734, "global_step": 206105, "epoch": 1703} {"train_loss": -41.43861770629883, "global_step": 206106, "epoch": 1703} {"train_loss": -41.585445404052734, "global_step": 206107, "epoch": 1703} {"train_loss": -41.744232177734375, "global_step": 206108, "epoch": 1703} {"train_loss": -41.598182678222656, "global_step": 206109, "epoch": 1703} {"train_loss": -41.77568817138672, "global_step": 206110, "epoch": 1703} {"train_loss": -41.83377456665039, "global_step": 206111, "epoch": 1703} {"train_loss": -42.07965087890625, "global_step": 206112, "epoch": 1703} {"train_loss": -41.6571159362793, "global_step": 206113, "epoch": 1703} {"train_loss": -41.807430267333984, "global_step": 206114, "epoch": 1703} {"train_loss": -41.750579833984375, "global_step": 206115, "epoch": 1703} {"train_loss": -41.968318939208984, "global_step": 206116, "epoch": 1703} {"train_loss": -40.666664123535156, "global_step": 206117, "epoch": 1703} {"train_loss": -41.83974838256836, "global_step": 206118, "epoch": 1703} {"train_loss": -41.04543685913086, "global_step": 206119, "epoch": 1703} {"train_loss": -41.83991241455078, "global_step": 206120, "epoch": 1703} {"train_loss": -40.596981048583984, "global_step": 206121, "epoch": 1703} {"train_loss": -41.2274284362793, "global_step": 206122, "epoch": 1703} {"train_loss": -41.46326446533203, "global_step": 206123, "epoch": 1703} {"train_loss": -41.417449951171875, "global_step": 206124, "epoch": 1703} {"train_loss": -40.926918029785156, "global_step": 206125, "epoch": 1703} {"train_loss": -41.1113166809082, "global_step": 206126, "epoch": 1703} {"train_loss": -41.5103645324707, "global_step": 206127, "epoch": 1703} {"train_loss": -41.484039306640625, "global_step": 206128, "epoch": 1703} {"train_loss": -40.47853469848633, "global_step": 206129, "epoch": 1703} {"train_loss": -39.752132415771484, "global_step": 206130, "epoch": 1703} {"train_loss": -40.94333267211914, "global_step": 206131, "epoch": 1703} {"train_loss": -41.084808349609375, "global_step": 206132, "epoch": 1703} {"train_loss": -38.741851806640625, "global_step": 206133, "epoch": 1703} {"train_loss": -39.544795989990234, "global_step": 206134, "epoch": 1703} {"train_loss": -40.09627151489258, "global_step": 206135, "epoch": 1703} {"train_loss": -40.626319885253906, "global_step": 206136, "epoch": 1703} {"train_loss": -38.3995475769043, "global_step": 206137, "epoch": 1703} {"train_loss": -38.93732452392578, "global_step": 206138, "epoch": 1703} {"train_loss": -40.55157470703125, "global_step": 206139, "epoch": 1703} {"train_loss": -40.27315902709961, "global_step": 206140, "epoch": 1703} {"train_loss": -40.161617279052734, "global_step": 206141, "epoch": 1703} {"train_loss": -41.377540588378906, "global_step": 206142, "epoch": 1703} {"train_loss": -38.76052474975586, "global_step": 206143, "epoch": 1703} {"train_loss": -40.87136459350586, "global_step": 206144, "epoch": 1703} {"train_loss": -41.129417419433594, "global_step": 206145, "epoch": 1703} {"train_loss": -39.778377532958984, "global_step": 206146, "epoch": 1703} {"train_loss": -40.322303771972656, "global_step": 206147, "epoch": 1703} {"train_loss": -40.25349044799805, "global_step": 206148, "epoch": 1703} {"train_loss": -40.11338424682617, "global_step": 206149, "epoch": 1703} {"train_loss": -41.774139404296875, "global_step": 206150, "epoch": 1703} {"train_loss": -41.42061233520508, "global_step": 206151, "epoch": 1703} {"train_loss": -41.67151641845703, "global_step": 206152, "epoch": 1703} {"train_loss": -40.83891677856445, "global_step": 206153, "epoch": 1703} {"train_loss": -41.822696685791016, "global_step": 206154, "epoch": 1703} {"train_loss": -41.31150436401367, "global_step": 206155, "epoch": 1703} {"train_loss": -40.7603645324707, "global_step": 206156, "epoch": 1703} {"train_loss": -41.00419998168945, "global_step": 206157, "epoch": 1703} {"train_loss": -40.72549057006836, "global_step": 206158, "epoch": 1703} {"train_loss": -41.48287582397461, "global_step": 206159, "epoch": 1703} {"train_loss": -39.46364212036133, "global_step": 206160, "epoch": 1703} {"train_loss": -40.65017318725586, "global_step": 206161, "epoch": 1703} {"train_loss": -41.180721282958984, "global_step": 206162, "epoch": 1703} {"train_loss": -41.77631759643555, "global_step": 206163, "epoch": 1703} {"train_loss": -40.757225036621094, "global_step": 206164, "epoch": 1703} {"train_loss": -41.34438705444336, "global_step": 206165, "epoch": 1703} {"train_loss": -40.7050666809082, "global_step": 206166, "epoch": 1703} {"train_loss": -41.89785385131836, "global_step": 206167, "epoch": 1703} {"train_loss": -41.26797103881836, "global_step": 206168, "epoch": 1703} {"train_loss": -37.816802978515625, "global_step": 206169, "epoch": 1703} {"train_loss": -36.148284912109375, "global_step": 206170, "epoch": 1703} {"train_loss": -39.577003479003906, "global_step": 206171, "epoch": 1703} {"train_loss": -41.9146842956543, "global_step": 206172, "epoch": 1703} {"train_loss": -40.690120697021484, "global_step": 206173, "epoch": 1703} {"train_loss": -39.924964904785156, "global_step": 206174, "epoch": 1703} {"train_loss": -40.04037094116211, "global_step": 206175, "epoch": 1703} {"train_loss": -40.77693557739258, "global_step": 206176, "epoch": 1703} {"train_loss": -41.17562484741211, "global_step": 206177, "epoch": 1703} {"train_loss": -40.92973709106445, "global_step": 206178, "epoch": 1703} {"train_loss": -39.10869216918945, "global_step": 206179, "epoch": 1703} {"train_loss": -39.10166549682617, "global_step": 206180, "epoch": 1703} {"train_loss": -40.57891845703125, "global_step": 206181, "epoch": 1703} {"train_loss": -41.17341613769531, "global_step": 206182, "epoch": 1703} {"train_loss": -40.6823586708258, "global_step": 206183, "epoch": 1703, "val_loss": 2606038.0} {"train_loss": -40.70741653442383, "global_step": 206184, "epoch": 1704} {"train_loss": -40.023868560791016, "global_step": 206185, "epoch": 1704} {"train_loss": -40.200050354003906, "global_step": 206186, "epoch": 1704} {"train_loss": -37.559425354003906, "global_step": 206187, "epoch": 1704} {"train_loss": -40.230751037597656, "global_step": 206188, "epoch": 1704} {"train_loss": -38.73191452026367, "global_step": 206189, "epoch": 1704} {"train_loss": -39.35038375854492, "global_step": 206190, "epoch": 1704} {"train_loss": -36.000667572021484, "global_step": 206191, "epoch": 1704} {"train_loss": -40.67612838745117, "global_step": 206192, "epoch": 1704} {"train_loss": -40.30806350708008, "global_step": 206193, "epoch": 1704} {"train_loss": -40.447689056396484, "global_step": 206194, "epoch": 1704} {"train_loss": -37.81402587890625, "global_step": 206195, "epoch": 1704} {"train_loss": -39.137123107910156, "global_step": 206196, "epoch": 1704} {"train_loss": -33.90544509887695, "global_step": 206197, "epoch": 1704} {"train_loss": -34.810150146484375, "global_step": 206198, "epoch": 1704} {"train_loss": -35.90625762939453, "global_step": 206199, "epoch": 1704} {"train_loss": -37.82256317138672, "global_step": 206200, "epoch": 1704} {"train_loss": -39.61503982543945, "global_step": 206201, "epoch": 1704} {"train_loss": -39.31147384643555, "global_step": 206202, "epoch": 1704} {"train_loss": -38.5167236328125, "global_step": 206203, "epoch": 1704} {"train_loss": -37.96326446533203, "global_step": 206204, "epoch": 1704} {"train_loss": -39.1499137878418, "global_step": 206205, "epoch": 1704} {"train_loss": -39.7845344543457, "global_step": 206206, "epoch": 1704} {"train_loss": -40.36088180541992, "global_step": 206207, "epoch": 1704} {"train_loss": -35.246925354003906, "global_step": 206208, "epoch": 1704} {"train_loss": -39.30263900756836, "global_step": 206209, "epoch": 1704} {"train_loss": -37.05379867553711, "global_step": 206210, "epoch": 1704} {"train_loss": -36.02745819091797, "global_step": 206211, "epoch": 1704} {"train_loss": -27.703632354736328, "global_step": 206212, "epoch": 1704} {"train_loss": -35.01593017578125, "global_step": 206213, "epoch": 1704} {"train_loss": -36.629417419433594, "global_step": 206214, "epoch": 1704} {"train_loss": -29.252685546875, "global_step": 206215, "epoch": 1704} {"train_loss": -37.491268157958984, "global_step": 206216, "epoch": 1704} {"train_loss": -35.14170455932617, "global_step": 206217, "epoch": 1704} {"train_loss": -39.00311279296875, "global_step": 206218, "epoch": 1704} {"train_loss": -33.981693267822266, "global_step": 206219, "epoch": 1704} {"train_loss": -35.55073928833008, "global_step": 206220, "epoch": 1704} {"train_loss": -30.989547729492188, "global_step": 206221, "epoch": 1704} {"train_loss": -35.00151062011719, "global_step": 206222, "epoch": 1704} {"train_loss": -31.631366729736328, "global_step": 206223, "epoch": 1704} {"train_loss": -33.84700012207031, "global_step": 206224, "epoch": 1704} {"train_loss": -37.295223236083984, "global_step": 206225, "epoch": 1704} {"train_loss": -33.09346008300781, "global_step": 206226, "epoch": 1704} {"train_loss": -29.250635147094727, "global_step": 206227, "epoch": 1704} {"train_loss": -33.34687042236328, "global_step": 206228, "epoch": 1704} {"train_loss": -36.641014099121094, "global_step": 206229, "epoch": 1704} {"train_loss": -37.65131378173828, "global_step": 206230, "epoch": 1704} {"train_loss": -36.707496643066406, "global_step": 206231, "epoch": 1704} {"train_loss": -33.52522659301758, "global_step": 206232, "epoch": 1704} {"train_loss": -35.746456146240234, "global_step": 206233, "epoch": 1704} {"train_loss": -36.71401596069336, "global_step": 206234, "epoch": 1704} {"train_loss": -35.78030776977539, "global_step": 206235, "epoch": 1704} {"train_loss": -35.467987060546875, "global_step": 206236, "epoch": 1704} {"train_loss": -36.700557708740234, "global_step": 206237, "epoch": 1704} {"train_loss": -36.93594741821289, "global_step": 206238, "epoch": 1704} {"train_loss": -33.999481201171875, "global_step": 206239, "epoch": 1704} {"train_loss": -37.0623893737793, "global_step": 206240, "epoch": 1704} {"train_loss": -38.52852249145508, "global_step": 206241, "epoch": 1704} {"train_loss": -36.10367202758789, "global_step": 206242, "epoch": 1704} {"train_loss": -37.73982620239258, "global_step": 206243, "epoch": 1704} {"train_loss": -38.74727249145508, "global_step": 206244, "epoch": 1704} {"train_loss": -38.66819763183594, "global_step": 206245, "epoch": 1704} {"train_loss": -36.165279388427734, "global_step": 206246, "epoch": 1704} {"train_loss": -37.615360260009766, "global_step": 206247, "epoch": 1704} {"train_loss": -38.43227767944336, "global_step": 206248, "epoch": 1704} {"train_loss": -38.68610763549805, "global_step": 206249, "epoch": 1704} {"train_loss": -38.48445510864258, "global_step": 206250, "epoch": 1704} {"train_loss": -38.73514938354492, "global_step": 206251, "epoch": 1704} {"train_loss": -37.602359771728516, "global_step": 206252, "epoch": 1704} {"train_loss": -38.9028434753418, "global_step": 206253, "epoch": 1704} {"train_loss": -37.66669464111328, "global_step": 206254, "epoch": 1704} {"train_loss": -37.629512786865234, "global_step": 206255, "epoch": 1704} {"train_loss": -38.84821319580078, "global_step": 206256, "epoch": 1704} {"train_loss": -38.698219299316406, "global_step": 206257, "epoch": 1704} {"train_loss": -39.22401428222656, "global_step": 206258, "epoch": 1704} {"train_loss": -38.84046173095703, "global_step": 206259, "epoch": 1704} {"train_loss": -39.243560791015625, "global_step": 206260, "epoch": 1704} {"train_loss": -39.05770492553711, "global_step": 206261, "epoch": 1704} {"train_loss": -38.83768844604492, "global_step": 206262, "epoch": 1704} {"train_loss": -38.923866271972656, "global_step": 206263, "epoch": 1704} {"train_loss": -38.950653076171875, "global_step": 206264, "epoch": 1704} {"train_loss": -38.48409652709961, "global_step": 206265, "epoch": 1704} {"train_loss": -38.550315856933594, "global_step": 206266, "epoch": 1704} {"train_loss": -39.82571029663086, "global_step": 206267, "epoch": 1704} {"train_loss": -39.63474655151367, "global_step": 206268, "epoch": 1704} {"train_loss": -39.259944915771484, "global_step": 206269, "epoch": 1704} {"train_loss": -38.592098236083984, "global_step": 206270, "epoch": 1704} {"train_loss": -38.545204162597656, "global_step": 206271, "epoch": 1704} {"train_loss": -38.78898239135742, "global_step": 206272, "epoch": 1704} {"train_loss": -39.88962936401367, "global_step": 206273, "epoch": 1704} {"train_loss": -38.04594039916992, "global_step": 206274, "epoch": 1704} {"train_loss": -39.28982162475586, "global_step": 206275, "epoch": 1704} {"train_loss": -39.954444885253906, "global_step": 206276, "epoch": 1704} {"train_loss": -39.92715072631836, "global_step": 206277, "epoch": 1704} {"train_loss": -39.67121505737305, "global_step": 206278, "epoch": 1704} {"train_loss": -39.926204681396484, "global_step": 206279, "epoch": 1704} {"train_loss": -39.702510833740234, "global_step": 206280, "epoch": 1704} {"train_loss": -39.628074645996094, "global_step": 206281, "epoch": 1704} {"train_loss": -40.157222747802734, "global_step": 206282, "epoch": 1704} {"train_loss": -39.05171585083008, "global_step": 206283, "epoch": 1704} {"train_loss": -39.33466720581055, "global_step": 206284, "epoch": 1704} {"train_loss": -39.793819427490234, "global_step": 206285, "epoch": 1704} {"train_loss": -39.839839935302734, "global_step": 206286, "epoch": 1704} {"train_loss": -39.4747428894043, "global_step": 206287, "epoch": 1704} {"train_loss": -40.04520797729492, "global_step": 206288, "epoch": 1704} {"train_loss": -39.2893180847168, "global_step": 206289, "epoch": 1704} {"train_loss": -39.851261138916016, "global_step": 206290, "epoch": 1704} {"train_loss": -40.245643615722656, "global_step": 206291, "epoch": 1704} {"train_loss": -39.69343185424805, "global_step": 206292, "epoch": 1704} {"train_loss": -40.1027946472168, "global_step": 206293, "epoch": 1704} {"train_loss": -40.21329879760742, "global_step": 206294, "epoch": 1704} {"train_loss": -40.2258415222168, "global_step": 206295, "epoch": 1704} {"train_loss": -40.23385238647461, "global_step": 206296, "epoch": 1704} {"train_loss": -40.539371490478516, "global_step": 206297, "epoch": 1704} {"train_loss": -40.43182373046875, "global_step": 206298, "epoch": 1704} {"train_loss": -39.613887786865234, "global_step": 206299, "epoch": 1704} {"train_loss": -40.056949615478516, "global_step": 206300, "epoch": 1704} {"train_loss": -40.79159927368164, "global_step": 206301, "epoch": 1704} {"train_loss": -40.329647064208984, "global_step": 206302, "epoch": 1704} {"train_loss": -40.11267852783203, "global_step": 206303, "epoch": 1704} {"train_loss": -37.94465764889047, "global_step": 206304, "epoch": 1704, "val_loss": 2531083.5} {"train_loss": -40.142982482910156, "global_step": 206305, "epoch": 1705} {"train_loss": -40.825645446777344, "global_step": 206306, "epoch": 1705} {"train_loss": -40.037349700927734, "global_step": 206307, "epoch": 1705} {"train_loss": -40.591732025146484, "global_step": 206308, "epoch": 1705} {"train_loss": -40.445152282714844, "global_step": 206309, "epoch": 1705} {"train_loss": -40.43519973754883, "global_step": 206310, "epoch": 1705} {"train_loss": -40.978431701660156, "global_step": 206311, "epoch": 1705} {"train_loss": -41.066890716552734, "global_step": 206312, "epoch": 1705} {"train_loss": -41.12441635131836, "global_step": 206313, "epoch": 1705} {"train_loss": -40.8824462890625, "global_step": 206314, "epoch": 1705} {"train_loss": -41.31666946411133, "global_step": 206315, "epoch": 1705} {"train_loss": -40.371864318847656, "global_step": 206316, "epoch": 1705} {"train_loss": -40.96151351928711, "global_step": 206317, "epoch": 1705} {"train_loss": -40.514644622802734, "global_step": 206318, "epoch": 1705} {"train_loss": -40.02204513549805, "global_step": 206319, "epoch": 1705} {"train_loss": -41.14371871948242, "global_step": 206320, "epoch": 1705} {"train_loss": -40.8387336730957, "global_step": 206321, "epoch": 1705} {"train_loss": -41.23189163208008, "global_step": 206322, "epoch": 1705} {"train_loss": -40.59254837036133, "global_step": 206323, "epoch": 1705} {"train_loss": -41.3657112121582, "global_step": 206324, "epoch": 1705} {"train_loss": -40.50917434692383, "global_step": 206325, "epoch": 1705} {"train_loss": -41.33036422729492, "global_step": 206326, "epoch": 1705} {"train_loss": -41.503631591796875, "global_step": 206327, "epoch": 1705} {"train_loss": -41.10490417480469, "global_step": 206328, "epoch": 1705} {"train_loss": -40.9879150390625, "global_step": 206329, "epoch": 1705} {"train_loss": -40.51189422607422, "global_step": 206330, "epoch": 1705} {"train_loss": -40.6905403137207, "global_step": 206331, "epoch": 1705} {"train_loss": -41.293331146240234, "global_step": 206332, "epoch": 1705} {"train_loss": -41.12144470214844, "global_step": 206333, "epoch": 1705} {"train_loss": -40.075313568115234, "global_step": 206334, "epoch": 1705} {"train_loss": -38.87746810913086, "global_step": 206335, "epoch": 1705} {"train_loss": -40.99089813232422, "global_step": 206336, "epoch": 1705} {"train_loss": -40.6928825378418, "global_step": 206337, "epoch": 1705} {"train_loss": -40.80792236328125, "global_step": 206338, "epoch": 1705} {"train_loss": -40.32670211791992, "global_step": 206339, "epoch": 1705} {"train_loss": -41.07075881958008, "global_step": 206340, "epoch": 1705} {"train_loss": -41.17939376831055, "global_step": 206341, "epoch": 1705} {"train_loss": -40.084266662597656, "global_step": 206342, "epoch": 1705} {"train_loss": -39.882442474365234, "global_step": 206343, "epoch": 1705} {"train_loss": -40.52436447143555, "global_step": 206344, "epoch": 1705} {"train_loss": -40.26519775390625, "global_step": 206345, "epoch": 1705} {"train_loss": -40.65824890136719, "global_step": 206346, "epoch": 1705} {"train_loss": -39.92922592163086, "global_step": 206347, "epoch": 1705} {"train_loss": -41.307247161865234, "global_step": 206348, "epoch": 1705} {"train_loss": -40.93552780151367, "global_step": 206349, "epoch": 1705} {"train_loss": -40.58181381225586, "global_step": 206350, "epoch": 1705} {"train_loss": -40.99586868286133, "global_step": 206351, "epoch": 1705} {"train_loss": -41.1488037109375, "global_step": 206352, "epoch": 1705} {"train_loss": -41.04948806762695, "global_step": 206353, "epoch": 1705} {"train_loss": -40.85696029663086, "global_step": 206354, "epoch": 1705} {"train_loss": -41.0190544128418, "global_step": 206355, "epoch": 1705} {"train_loss": -41.23520278930664, "global_step": 206356, "epoch": 1705} {"train_loss": -40.265316009521484, "global_step": 206357, "epoch": 1705} {"train_loss": -37.84709930419922, "global_step": 206358, "epoch": 1705} {"train_loss": -34.686553955078125, "global_step": 206359, "epoch": 1705} {"train_loss": -32.51765441894531, "global_step": 206360, "epoch": 1705} {"train_loss": -36.43070602416992, "global_step": 206361, "epoch": 1705} {"train_loss": -40.19955062866211, "global_step": 206362, "epoch": 1705} {"train_loss": -38.877593994140625, "global_step": 206363, "epoch": 1705} {"train_loss": -34.197994232177734, "global_step": 206364, "epoch": 1705} {"train_loss": -32.64945602416992, "global_step": 206365, "epoch": 1705} {"train_loss": -38.596290588378906, "global_step": 206366, "epoch": 1705} {"train_loss": -39.772315979003906, "global_step": 206367, "epoch": 1705} {"train_loss": -35.340065002441406, "global_step": 206368, "epoch": 1705} {"train_loss": -40.38411331176758, "global_step": 206369, "epoch": 1705} {"train_loss": -34.735958099365234, "global_step": 206370, "epoch": 1705} {"train_loss": -33.756099700927734, "global_step": 206371, "epoch": 1705} {"train_loss": -40.20138168334961, "global_step": 206372, "epoch": 1705} {"train_loss": -36.524932861328125, "global_step": 206373, "epoch": 1705} {"train_loss": -39.97898864746094, "global_step": 206374, "epoch": 1705} {"train_loss": -36.343048095703125, "global_step": 206375, "epoch": 1705} {"train_loss": -40.177879333496094, "global_step": 206376, "epoch": 1705} {"train_loss": -37.52495193481445, "global_step": 206377, "epoch": 1705} {"train_loss": -39.747528076171875, "global_step": 206378, "epoch": 1705} {"train_loss": -39.36971664428711, "global_step": 206379, "epoch": 1705} {"train_loss": -39.4078483581543, "global_step": 206380, "epoch": 1705} {"train_loss": -39.50996017456055, "global_step": 206381, "epoch": 1705} {"train_loss": -40.373260498046875, "global_step": 206382, "epoch": 1705} {"train_loss": -39.75905990600586, "global_step": 206383, "epoch": 1705} {"train_loss": -39.927894592285156, "global_step": 206384, "epoch": 1705} {"train_loss": -40.51783752441406, "global_step": 206385, "epoch": 1705} {"train_loss": -39.763614654541016, "global_step": 206386, "epoch": 1705} {"train_loss": -40.0410270690918, "global_step": 206387, "epoch": 1705} {"train_loss": -40.496742248535156, "global_step": 206388, "epoch": 1705} {"train_loss": -40.32499313354492, "global_step": 206389, "epoch": 1705} {"train_loss": -40.344024658203125, "global_step": 206390, "epoch": 1705} {"train_loss": -39.97972106933594, "global_step": 206391, "epoch": 1705} {"train_loss": -40.307437896728516, "global_step": 206392, "epoch": 1705} {"train_loss": -40.53962326049805, "global_step": 206393, "epoch": 1705} {"train_loss": -39.82947540283203, "global_step": 206394, "epoch": 1705} {"train_loss": -40.47235870361328, "global_step": 206395, "epoch": 1705} {"train_loss": -40.62236022949219, "global_step": 206396, "epoch": 1705} {"train_loss": -40.470279693603516, "global_step": 206397, "epoch": 1705} {"train_loss": -40.775169372558594, "global_step": 206398, "epoch": 1705} {"train_loss": -40.57186508178711, "global_step": 206399, "epoch": 1705} {"train_loss": -40.18651580810547, "global_step": 206400, "epoch": 1705} {"train_loss": -40.71411895751953, "global_step": 206401, "epoch": 1705} {"train_loss": -40.13812255859375, "global_step": 206402, "epoch": 1705} {"train_loss": -41.541473388671875, "global_step": 206403, "epoch": 1705} {"train_loss": -40.16032028198242, "global_step": 206404, "epoch": 1705} {"train_loss": -40.25313949584961, "global_step": 206405, "epoch": 1705} {"train_loss": -41.01359939575195, "global_step": 206406, "epoch": 1705} {"train_loss": -40.36368179321289, "global_step": 206407, "epoch": 1705} {"train_loss": -41.39296340942383, "global_step": 206408, "epoch": 1705} {"train_loss": -41.45062255859375, "global_step": 206409, "epoch": 1705} {"train_loss": -40.82489776611328, "global_step": 206410, "epoch": 1705} {"train_loss": -41.363765716552734, "global_step": 206411, "epoch": 1705} {"train_loss": -40.6994743347168, "global_step": 206412, "epoch": 1705} {"train_loss": -40.660823822021484, "global_step": 206413, "epoch": 1705} {"train_loss": -41.40217590332031, "global_step": 206414, "epoch": 1705} {"train_loss": -41.34280014038086, "global_step": 206415, "epoch": 1705} {"train_loss": -41.374305725097656, "global_step": 206416, "epoch": 1705} {"train_loss": -41.67814254760742, "global_step": 206417, "epoch": 1705} {"train_loss": -41.31193161010742, "global_step": 206418, "epoch": 1705} {"train_loss": -41.08054733276367, "global_step": 206419, "epoch": 1705} {"train_loss": -41.8778190612793, "global_step": 206420, "epoch": 1705} {"train_loss": -41.505374908447266, "global_step": 206421, "epoch": 1705} {"train_loss": -41.0064811706543, "global_step": 206422, "epoch": 1705} {"train_loss": -41.66358184814453, "global_step": 206423, "epoch": 1705} {"train_loss": -41.32643508911133, "global_step": 206424, "epoch": 1705} {"train_loss": -40.085912940915954, "global_step": 206425, "epoch": 1705, "val_loss": 2498292.25} {"train_loss": -41.04363250732422, "global_step": 206426, "epoch": 1706} {"train_loss": -41.18689727783203, "global_step": 206427, "epoch": 1706} {"train_loss": -41.13801574707031, "global_step": 206428, "epoch": 1706} {"train_loss": -41.2493896484375, "global_step": 206429, "epoch": 1706} {"train_loss": -40.982608795166016, "global_step": 206430, "epoch": 1706} {"train_loss": -40.75596237182617, "global_step": 206431, "epoch": 1706} {"train_loss": -41.74694061279297, "global_step": 206432, "epoch": 1706} {"train_loss": -41.012203216552734, "global_step": 206433, "epoch": 1706} {"train_loss": -41.16339874267578, "global_step": 206434, "epoch": 1706} {"train_loss": -41.73532485961914, "global_step": 206435, "epoch": 1706} {"train_loss": -40.5411376953125, "global_step": 206436, "epoch": 1706} {"train_loss": -41.840301513671875, "global_step": 206437, "epoch": 1706} {"train_loss": -41.7330322265625, "global_step": 206438, "epoch": 1706} {"train_loss": -41.67271423339844, "global_step": 206439, "epoch": 1706} {"train_loss": -41.79220199584961, "global_step": 206440, "epoch": 1706} {"train_loss": -42.08787155151367, "global_step": 206441, "epoch": 1706} {"train_loss": -41.063819885253906, "global_step": 206442, "epoch": 1706} {"train_loss": -41.86887741088867, "global_step": 206443, "epoch": 1706} {"train_loss": -41.236175537109375, "global_step": 206444, "epoch": 1706} {"train_loss": -41.123104095458984, "global_step": 206445, "epoch": 1706} {"train_loss": -41.49274826049805, "global_step": 206446, "epoch": 1706} {"train_loss": -41.72941207885742, "global_step": 206447, "epoch": 1706} {"train_loss": -42.06876754760742, "global_step": 206448, "epoch": 1706} {"train_loss": -42.21943283081055, "global_step": 206449, "epoch": 1706} {"train_loss": -41.8607063293457, "global_step": 206450, "epoch": 1706} {"train_loss": -41.95783615112305, "global_step": 206451, "epoch": 1706} {"train_loss": -41.95815658569336, "global_step": 206452, "epoch": 1706} {"train_loss": -42.21311569213867, "global_step": 206453, "epoch": 1706} {"train_loss": -41.77528762817383, "global_step": 206454, "epoch": 1706} {"train_loss": -42.115020751953125, "global_step": 206455, "epoch": 1706} {"train_loss": -41.95969772338867, "global_step": 206456, "epoch": 1706} {"train_loss": -42.134334564208984, "global_step": 206457, "epoch": 1706} {"train_loss": -41.9316291809082, "global_step": 206458, "epoch": 1706} {"train_loss": -41.67273712158203, "global_step": 206459, "epoch": 1706} {"train_loss": -41.491554260253906, "global_step": 206460, "epoch": 1706} {"train_loss": -41.7542724609375, "global_step": 206461, "epoch": 1706} {"train_loss": -41.71805953979492, "global_step": 206462, "epoch": 1706} {"train_loss": -41.48972702026367, "global_step": 206463, "epoch": 1706} {"train_loss": -40.661766052246094, "global_step": 206464, "epoch": 1706} {"train_loss": -40.694183349609375, "global_step": 206465, "epoch": 1706} {"train_loss": -41.68324661254883, "global_step": 206466, "epoch": 1706} {"train_loss": -41.613338470458984, "global_step": 206467, "epoch": 1706} {"train_loss": -41.09255599975586, "global_step": 206468, "epoch": 1706} {"train_loss": -37.71140670776367, "global_step": 206469, "epoch": 1706} {"train_loss": -38.34466552734375, "global_step": 206470, "epoch": 1706} {"train_loss": -40.44205856323242, "global_step": 206471, "epoch": 1706} {"train_loss": -39.527339935302734, "global_step": 206472, "epoch": 1706} {"train_loss": -38.52759552001953, "global_step": 206473, "epoch": 1706} {"train_loss": -40.84423065185547, "global_step": 206474, "epoch": 1706} {"train_loss": -41.7022819519043, "global_step": 206475, "epoch": 1706} {"train_loss": -40.06973648071289, "global_step": 206476, "epoch": 1706} {"train_loss": -38.27876281738281, "global_step": 206477, "epoch": 1706} {"train_loss": -39.87101364135742, "global_step": 206478, "epoch": 1706} {"train_loss": -41.60524368286133, "global_step": 206479, "epoch": 1706} {"train_loss": -38.70378494262695, "global_step": 206480, "epoch": 1706} {"train_loss": -39.625423431396484, "global_step": 206481, "epoch": 1706} {"train_loss": -41.11385726928711, "global_step": 206482, "epoch": 1706} {"train_loss": -41.16976547241211, "global_step": 206483, "epoch": 1706} {"train_loss": -40.641807556152344, "global_step": 206484, "epoch": 1706} {"train_loss": -41.68515396118164, "global_step": 206485, "epoch": 1706} {"train_loss": -40.62057876586914, "global_step": 206486, "epoch": 1706} {"train_loss": -40.25588607788086, "global_step": 206487, "epoch": 1706} {"train_loss": -41.58541488647461, "global_step": 206488, "epoch": 1706} {"train_loss": -40.941890716552734, "global_step": 206489, "epoch": 1706} {"train_loss": -40.333614349365234, "global_step": 206490, "epoch": 1706} {"train_loss": -40.71180725097656, "global_step": 206491, "epoch": 1706} {"train_loss": -40.831825256347656, "global_step": 206492, "epoch": 1706} {"train_loss": -40.25751876831055, "global_step": 206493, "epoch": 1706} {"train_loss": -40.61616897583008, "global_step": 206494, "epoch": 1706} {"train_loss": -40.69091796875, "global_step": 206495, "epoch": 1706} {"train_loss": -41.78675079345703, "global_step": 206496, "epoch": 1706} {"train_loss": -40.554134368896484, "global_step": 206497, "epoch": 1706} {"train_loss": -40.7315673828125, "global_step": 206498, "epoch": 1706} {"train_loss": -41.13380813598633, "global_step": 206499, "epoch": 1706} {"train_loss": -40.9319953918457, "global_step": 206500, "epoch": 1706} {"train_loss": -41.38941955566406, "global_step": 206501, "epoch": 1706} {"train_loss": -40.716346740722656, "global_step": 206502, "epoch": 1706} {"train_loss": -41.46006774902344, "global_step": 206503, "epoch": 1706} {"train_loss": -40.93104934692383, "global_step": 206504, "epoch": 1706} {"train_loss": -40.674415588378906, "global_step": 206505, "epoch": 1706} {"train_loss": -40.85675048828125, "global_step": 206506, "epoch": 1706} {"train_loss": -41.43280792236328, "global_step": 206507, "epoch": 1706} {"train_loss": -41.08785629272461, "global_step": 206508, "epoch": 1706} {"train_loss": -41.15572738647461, "global_step": 206509, "epoch": 1706} {"train_loss": -41.72052764892578, "global_step": 206510, "epoch": 1706} {"train_loss": -40.604278564453125, "global_step": 206511, "epoch": 1706} {"train_loss": -40.38959503173828, "global_step": 206512, "epoch": 1706} {"train_loss": -38.91325759887695, "global_step": 206513, "epoch": 1706} {"train_loss": -41.86940383911133, "global_step": 206514, "epoch": 1706} {"train_loss": -39.96731185913086, "global_step": 206515, "epoch": 1706} {"train_loss": -41.47624588012695, "global_step": 206516, "epoch": 1706} {"train_loss": -41.522010803222656, "global_step": 206517, "epoch": 1706} {"train_loss": -41.67890548706055, "global_step": 206518, "epoch": 1706} {"train_loss": -41.306373596191406, "global_step": 206519, "epoch": 1706} {"train_loss": -40.92264938354492, "global_step": 206520, "epoch": 1706} {"train_loss": -41.2728271484375, "global_step": 206521, "epoch": 1706} {"train_loss": -40.3528938293457, "global_step": 206522, "epoch": 1706} {"train_loss": -40.13618850708008, "global_step": 206523, "epoch": 1706} {"train_loss": -41.530311584472656, "global_step": 206524, "epoch": 1706} {"train_loss": -41.95449447631836, "global_step": 206525, "epoch": 1706} {"train_loss": -41.4449577331543, "global_step": 206526, "epoch": 1706} {"train_loss": -41.51612854003906, "global_step": 206527, "epoch": 1706} {"train_loss": -41.14829635620117, "global_step": 206528, "epoch": 1706} {"train_loss": -42.1334228515625, "global_step": 206529, "epoch": 1706} {"train_loss": -41.24658966064453, "global_step": 206530, "epoch": 1706} {"train_loss": -41.99117660522461, "global_step": 206531, "epoch": 1706} {"train_loss": -39.68797302246094, "global_step": 206532, "epoch": 1706} {"train_loss": -41.395320892333984, "global_step": 206533, "epoch": 1706} {"train_loss": -40.503082275390625, "global_step": 206534, "epoch": 1706} {"train_loss": -41.98960494995117, "global_step": 206535, "epoch": 1706} {"train_loss": -41.11812973022461, "global_step": 206536, "epoch": 1706} {"train_loss": -40.37512969970703, "global_step": 206537, "epoch": 1706} {"train_loss": -37.8134765625, "global_step": 206538, "epoch": 1706} {"train_loss": -41.03886795043945, "global_step": 206539, "epoch": 1706} {"train_loss": -41.270668029785156, "global_step": 206540, "epoch": 1706} {"train_loss": -40.2671012878418, "global_step": 206541, "epoch": 1706} {"train_loss": -40.380950927734375, "global_step": 206542, "epoch": 1706} {"train_loss": -40.37760925292969, "global_step": 206543, "epoch": 1706} {"train_loss": -40.370887756347656, "global_step": 206544, "epoch": 1706} {"train_loss": -39.26083755493164, "global_step": 206545, "epoch": 1706} {"train_loss": -40.980679819406554, "global_step": 206546, "epoch": 1706, "val_loss": 2491612.0} {"train_loss": -39.98313522338867, "global_step": 206547, "epoch": 1707} {"train_loss": -39.81431198120117, "global_step": 206548, "epoch": 1707} {"train_loss": -38.759273529052734, "global_step": 206549, "epoch": 1707} {"train_loss": -37.6444206237793, "global_step": 206550, "epoch": 1707} {"train_loss": -40.17871856689453, "global_step": 206551, "epoch": 1707} {"train_loss": -38.030941009521484, "global_step": 206552, "epoch": 1707} {"train_loss": -38.96651840209961, "global_step": 206553, "epoch": 1707} {"train_loss": -33.89883041381836, "global_step": 206554, "epoch": 1707} {"train_loss": -39.4760856628418, "global_step": 206555, "epoch": 1707} {"train_loss": -38.86869430541992, "global_step": 206556, "epoch": 1707} {"train_loss": -40.325435638427734, "global_step": 206557, "epoch": 1707} {"train_loss": -36.39413070678711, "global_step": 206558, "epoch": 1707} {"train_loss": -39.85932159423828, "global_step": 206559, "epoch": 1707} {"train_loss": -35.97835159301758, "global_step": 206560, "epoch": 1707} {"train_loss": -35.44499206542969, "global_step": 206561, "epoch": 1707} {"train_loss": -38.60919952392578, "global_step": 206562, "epoch": 1707} {"train_loss": -37.53876876831055, "global_step": 206563, "epoch": 1707} {"train_loss": -37.74382019042969, "global_step": 206564, "epoch": 1707} {"train_loss": -34.12885665893555, "global_step": 206565, "epoch": 1707} {"train_loss": -22.982290267944336, "global_step": 206566, "epoch": 1707} {"train_loss": -36.57566452026367, "global_step": 206567, "epoch": 1707} {"train_loss": -27.562210083007812, "global_step": 206568, "epoch": 1707} {"train_loss": -38.60245895385742, "global_step": 206569, "epoch": 1707} {"train_loss": -33.4570426940918, "global_step": 206570, "epoch": 1707} {"train_loss": -32.99824523925781, "global_step": 206571, "epoch": 1707} {"train_loss": -32.529605865478516, "global_step": 206572, "epoch": 1707} {"train_loss": -35.402732849121094, "global_step": 206573, "epoch": 1707} {"train_loss": -37.79224395751953, "global_step": 206574, "epoch": 1707} {"train_loss": -36.93524932861328, "global_step": 206575, "epoch": 1707} {"train_loss": -34.83285140991211, "global_step": 206576, "epoch": 1707} {"train_loss": -36.525291442871094, "global_step": 206577, "epoch": 1707} {"train_loss": -36.825836181640625, "global_step": 206578, "epoch": 1707} {"train_loss": -38.47153854370117, "global_step": 206579, "epoch": 1707} {"train_loss": -39.1718864440918, "global_step": 206580, "epoch": 1707} {"train_loss": -38.01055145263672, "global_step": 206581, "epoch": 1707} {"train_loss": -38.617488861083984, "global_step": 206582, "epoch": 1707} {"train_loss": -36.7216911315918, "global_step": 206583, "epoch": 1707} {"train_loss": -36.285484313964844, "global_step": 206584, "epoch": 1707} {"train_loss": -36.69804000854492, "global_step": 206585, "epoch": 1707} {"train_loss": -37.2480583190918, "global_step": 206586, "epoch": 1707} {"train_loss": -38.769866943359375, "global_step": 206587, "epoch": 1707} {"train_loss": -38.383155822753906, "global_step": 206588, "epoch": 1707} {"train_loss": -39.481468200683594, "global_step": 206589, "epoch": 1707} {"train_loss": -37.36430740356445, "global_step": 206590, "epoch": 1707} {"train_loss": -38.91633987426758, "global_step": 206591, "epoch": 1707} {"train_loss": -37.28092575073242, "global_step": 206592, "epoch": 1707} {"train_loss": -37.594661712646484, "global_step": 206593, "epoch": 1707} {"train_loss": -39.34539794921875, "global_step": 206594, "epoch": 1707} {"train_loss": -39.69291305541992, "global_step": 206595, "epoch": 1707} {"train_loss": -39.08558654785156, "global_step": 206596, "epoch": 1707} {"train_loss": -39.60613250732422, "global_step": 206597, "epoch": 1707} {"train_loss": -39.94874954223633, "global_step": 206598, "epoch": 1707} {"train_loss": -39.90754318237305, "global_step": 206599, "epoch": 1707} {"train_loss": -39.12615203857422, "global_step": 206600, "epoch": 1707} {"train_loss": -38.6753044128418, "global_step": 206601, "epoch": 1707} {"train_loss": -39.15864944458008, "global_step": 206602, "epoch": 1707} {"train_loss": -39.157649993896484, "global_step": 206603, "epoch": 1707} {"train_loss": -38.89154052734375, "global_step": 206604, "epoch": 1707} {"train_loss": -39.3326301574707, "global_step": 206605, "epoch": 1707} {"train_loss": -39.46049118041992, "global_step": 206606, "epoch": 1707} {"train_loss": -39.09526443481445, "global_step": 206607, "epoch": 1707} {"train_loss": -39.44782257080078, "global_step": 206608, "epoch": 1707} {"train_loss": -39.972591400146484, "global_step": 206609, "epoch": 1707} {"train_loss": -39.44929885864258, "global_step": 206610, "epoch": 1707} {"train_loss": -40.00911331176758, "global_step": 206611, "epoch": 1707} {"train_loss": -40.06268310546875, "global_step": 206612, "epoch": 1707} {"train_loss": -39.013084411621094, "global_step": 206613, "epoch": 1707} {"train_loss": -40.0197639465332, "global_step": 206614, "epoch": 1707} {"train_loss": -39.97134780883789, "global_step": 206615, "epoch": 1707} {"train_loss": -40.39905548095703, "global_step": 206616, "epoch": 1707} {"train_loss": -40.20505142211914, "global_step": 206617, "epoch": 1707} {"train_loss": -40.47819900512695, "global_step": 206618, "epoch": 1707} {"train_loss": -40.575767517089844, "global_step": 206619, "epoch": 1707} {"train_loss": -40.1457633972168, "global_step": 206620, "epoch": 1707} {"train_loss": -40.89052200317383, "global_step": 206621, "epoch": 1707} {"train_loss": -40.1453857421875, "global_step": 206622, "epoch": 1707} {"train_loss": -40.467628479003906, "global_step": 206623, "epoch": 1707} {"train_loss": -40.31317901611328, "global_step": 206624, "epoch": 1707} {"train_loss": -40.145328521728516, "global_step": 206625, "epoch": 1707} {"train_loss": -40.83550262451172, "global_step": 206626, "epoch": 1707} {"train_loss": -40.9366340637207, "global_step": 206627, "epoch": 1707} {"train_loss": -40.303836822509766, "global_step": 206628, "epoch": 1707} {"train_loss": -41.026100158691406, "global_step": 206629, "epoch": 1707} {"train_loss": -40.6527214050293, "global_step": 206630, "epoch": 1707} {"train_loss": -40.84930419921875, "global_step": 206631, "epoch": 1707} {"train_loss": -40.131778717041016, "global_step": 206632, "epoch": 1707} {"train_loss": -40.651611328125, "global_step": 206633, "epoch": 1707} {"train_loss": -40.3399543762207, "global_step": 206634, "epoch": 1707} {"train_loss": -41.19597244262695, "global_step": 206635, "epoch": 1707} {"train_loss": -39.052284240722656, "global_step": 206636, "epoch": 1707} {"train_loss": -40.95659255981445, "global_step": 206637, "epoch": 1707} {"train_loss": -40.77267074584961, "global_step": 206638, "epoch": 1707} {"train_loss": -41.03862380981445, "global_step": 206639, "epoch": 1707} {"train_loss": -41.38564682006836, "global_step": 206640, "epoch": 1707} {"train_loss": -41.602840423583984, "global_step": 206641, "epoch": 1707} {"train_loss": -41.030242919921875, "global_step": 206642, "epoch": 1707} {"train_loss": -41.26900100708008, "global_step": 206643, "epoch": 1707} {"train_loss": -41.21247100830078, "global_step": 206644, "epoch": 1707} {"train_loss": -41.19004440307617, "global_step": 206645, "epoch": 1707} {"train_loss": -41.05727767944336, "global_step": 206646, "epoch": 1707} {"train_loss": -39.13240432739258, "global_step": 206647, "epoch": 1707} {"train_loss": -40.89733123779297, "global_step": 206648, "epoch": 1707} {"train_loss": -40.37805938720703, "global_step": 206649, "epoch": 1707} {"train_loss": -41.46461868286133, "global_step": 206650, "epoch": 1707} {"train_loss": -40.76359176635742, "global_step": 206651, "epoch": 1707} {"train_loss": -40.360572814941406, "global_step": 206652, "epoch": 1707} {"train_loss": -40.214599609375, "global_step": 206653, "epoch": 1707} {"train_loss": -41.518733978271484, "global_step": 206654, "epoch": 1707} {"train_loss": -41.05404281616211, "global_step": 206655, "epoch": 1707} {"train_loss": -40.400634765625, "global_step": 206656, "epoch": 1707} {"train_loss": -38.11727523803711, "global_step": 206657, "epoch": 1707} {"train_loss": -38.785560607910156, "global_step": 206658, "epoch": 1707} {"train_loss": -39.07564926147461, "global_step": 206659, "epoch": 1707} {"train_loss": -40.45825958251953, "global_step": 206660, "epoch": 1707} {"train_loss": -41.64098358154297, "global_step": 206661, "epoch": 1707} {"train_loss": -39.55735397338867, "global_step": 206662, "epoch": 1707} {"train_loss": -38.91178512573242, "global_step": 206663, "epoch": 1707} {"train_loss": -40.230106353759766, "global_step": 206664, "epoch": 1707} {"train_loss": -41.455718994140625, "global_step": 206665, "epoch": 1707} {"train_loss": -40.750572204589844, "global_step": 206666, "epoch": 1707} {"train_loss": -38.90631347845409, "global_step": 206667, "epoch": 1707, "val_loss": 2579585.75} {"train_loss": -40.53804397583008, "global_step": 206668, "epoch": 1708} {"train_loss": -41.57420349121094, "global_step": 206669, "epoch": 1708} {"train_loss": -41.17555618286133, "global_step": 206670, "epoch": 1708} {"train_loss": -40.25584030151367, "global_step": 206671, "epoch": 1708} {"train_loss": -41.30731201171875, "global_step": 206672, "epoch": 1708} {"train_loss": -40.50123977661133, "global_step": 206673, "epoch": 1708} {"train_loss": -39.722896575927734, "global_step": 206674, "epoch": 1708} {"train_loss": -41.01042175292969, "global_step": 206675, "epoch": 1708} {"train_loss": -41.316253662109375, "global_step": 206676, "epoch": 1708} {"train_loss": -40.6895866394043, "global_step": 206677, "epoch": 1708} {"train_loss": -40.93275833129883, "global_step": 206678, "epoch": 1708} {"train_loss": -41.28874588012695, "global_step": 206679, "epoch": 1708} {"train_loss": -41.327186584472656, "global_step": 206680, "epoch": 1708} {"train_loss": -41.1270637512207, "global_step": 206681, "epoch": 1708} {"train_loss": -41.29031753540039, "global_step": 206682, "epoch": 1708} {"train_loss": -41.10696029663086, "global_step": 206683, "epoch": 1708} {"train_loss": -41.02288055419922, "global_step": 206684, "epoch": 1708} {"train_loss": -41.51616668701172, "global_step": 206685, "epoch": 1708} {"train_loss": -41.441139221191406, "global_step": 206686, "epoch": 1708} {"train_loss": -41.372039794921875, "global_step": 206687, "epoch": 1708} {"train_loss": -41.10415267944336, "global_step": 206688, "epoch": 1708} {"train_loss": -41.66640090942383, "global_step": 206689, "epoch": 1708} {"train_loss": -41.62327575683594, "global_step": 206690, "epoch": 1708} {"train_loss": -41.79096221923828, "global_step": 206691, "epoch": 1708} {"train_loss": -42.0479621887207, "global_step": 206692, "epoch": 1708} {"train_loss": -41.7193489074707, "global_step": 206693, "epoch": 1708} {"train_loss": -41.70884323120117, "global_step": 206694, "epoch": 1708} {"train_loss": -41.66097640991211, "global_step": 206695, "epoch": 1708} {"train_loss": -40.96466827392578, "global_step": 206696, "epoch": 1708} {"train_loss": -42.070343017578125, "global_step": 206697, "epoch": 1708} {"train_loss": -41.86852264404297, "global_step": 206698, "epoch": 1708} {"train_loss": -41.77059555053711, "global_step": 206699, "epoch": 1708} {"train_loss": -41.812679290771484, "global_step": 206700, "epoch": 1708} {"train_loss": -41.3995475769043, "global_step": 206701, "epoch": 1708} {"train_loss": -41.06330108642578, "global_step": 206702, "epoch": 1708} {"train_loss": -41.55733108520508, "global_step": 206703, "epoch": 1708} {"train_loss": -41.68274688720703, "global_step": 206704, "epoch": 1708} {"train_loss": -41.12688446044922, "global_step": 206705, "epoch": 1708} {"train_loss": -40.73832702636719, "global_step": 206706, "epoch": 1708} {"train_loss": -40.015621185302734, "global_step": 206707, "epoch": 1708} {"train_loss": -39.22465515136719, "global_step": 206708, "epoch": 1708} {"train_loss": -37.39201736450195, "global_step": 206709, "epoch": 1708} {"train_loss": -36.700679779052734, "global_step": 206710, "epoch": 1708} {"train_loss": -35.286582946777344, "global_step": 206711, "epoch": 1708} {"train_loss": -35.11552810668945, "global_step": 206712, "epoch": 1708} {"train_loss": -36.9786376953125, "global_step": 206713, "epoch": 1708} {"train_loss": -41.12018966674805, "global_step": 206714, "epoch": 1708} {"train_loss": -39.92432403564453, "global_step": 206715, "epoch": 1708} {"train_loss": -38.26433181762695, "global_step": 206716, "epoch": 1708} {"train_loss": -39.209346771240234, "global_step": 206717, "epoch": 1708} {"train_loss": -40.5523796081543, "global_step": 206718, "epoch": 1708} {"train_loss": -41.16488265991211, "global_step": 206719, "epoch": 1708} {"train_loss": -39.68567657470703, "global_step": 206720, "epoch": 1708} {"train_loss": -41.175689697265625, "global_step": 206721, "epoch": 1708} {"train_loss": -41.31264114379883, "global_step": 206722, "epoch": 1708} {"train_loss": -40.013214111328125, "global_step": 206723, "epoch": 1708} {"train_loss": -41.69086837768555, "global_step": 206724, "epoch": 1708} {"train_loss": -40.760536193847656, "global_step": 206725, "epoch": 1708} {"train_loss": -41.3908805847168, "global_step": 206726, "epoch": 1708} {"train_loss": -41.573848724365234, "global_step": 206727, "epoch": 1708} {"train_loss": -41.71308135986328, "global_step": 206728, "epoch": 1708} {"train_loss": -41.2866325378418, "global_step": 206729, "epoch": 1708} {"train_loss": -41.5426025390625, "global_step": 206730, "epoch": 1708} {"train_loss": -41.65731430053711, "global_step": 206731, "epoch": 1708} {"train_loss": -41.70817184448242, "global_step": 206732, "epoch": 1708} {"train_loss": -41.9051513671875, "global_step": 206733, "epoch": 1708} {"train_loss": -41.22959518432617, "global_step": 206734, "epoch": 1708} {"train_loss": -41.64597702026367, "global_step": 206735, "epoch": 1708} {"train_loss": -41.66691207885742, "global_step": 206736, "epoch": 1708} {"train_loss": -41.2481803894043, "global_step": 206737, "epoch": 1708} {"train_loss": -41.46156692504883, "global_step": 206738, "epoch": 1708} {"train_loss": -41.955196380615234, "global_step": 206739, "epoch": 1708} {"train_loss": -42.229736328125, "global_step": 206740, "epoch": 1708} {"train_loss": -41.303123474121094, "global_step": 206741, "epoch": 1708} {"train_loss": -41.46345901489258, "global_step": 206742, "epoch": 1708} {"train_loss": -41.288856506347656, "global_step": 206743, "epoch": 1708} {"train_loss": -41.13719177246094, "global_step": 206744, "epoch": 1708} {"train_loss": -42.01093673706055, "global_step": 206745, "epoch": 1708} {"train_loss": -41.90625, "global_step": 206746, "epoch": 1708} {"train_loss": -41.67087936401367, "global_step": 206747, "epoch": 1708} {"train_loss": -42.02461624145508, "global_step": 206748, "epoch": 1708} {"train_loss": -42.04790115356445, "global_step": 206749, "epoch": 1708} {"train_loss": -41.61322784423828, "global_step": 206750, "epoch": 1708} {"train_loss": -42.04396438598633, "global_step": 206751, "epoch": 1708} {"train_loss": -42.18962860107422, "global_step": 206752, "epoch": 1708} {"train_loss": -42.324459075927734, "global_step": 206753, "epoch": 1708} {"train_loss": -41.516475677490234, "global_step": 206754, "epoch": 1708} {"train_loss": -41.92585754394531, "global_step": 206755, "epoch": 1708} {"train_loss": -42.198341369628906, "global_step": 206756, "epoch": 1708} {"train_loss": -42.00779342651367, "global_step": 206757, "epoch": 1708} {"train_loss": -42.36592102050781, "global_step": 206758, "epoch": 1708} {"train_loss": -41.71792984008789, "global_step": 206759, "epoch": 1708} {"train_loss": -42.18904113769531, "global_step": 206760, "epoch": 1708} {"train_loss": -41.999725341796875, "global_step": 206761, "epoch": 1708} {"train_loss": -41.58719253540039, "global_step": 206762, "epoch": 1708} {"train_loss": -41.214019775390625, "global_step": 206763, "epoch": 1708} {"train_loss": -39.57817077636719, "global_step": 206764, "epoch": 1708} {"train_loss": -41.56782150268555, "global_step": 206765, "epoch": 1708} {"train_loss": -41.6375617980957, "global_step": 206766, "epoch": 1708} {"train_loss": -42.03263854980469, "global_step": 206767, "epoch": 1708} {"train_loss": -41.382911682128906, "global_step": 206768, "epoch": 1708} {"train_loss": -37.40353775024414, "global_step": 206769, "epoch": 1708} {"train_loss": -40.67574691772461, "global_step": 206770, "epoch": 1708} {"train_loss": -35.1413688659668, "global_step": 206771, "epoch": 1708} {"train_loss": -40.15668869018555, "global_step": 206772, "epoch": 1708} {"train_loss": -40.68178176879883, "global_step": 206773, "epoch": 1708} {"train_loss": -37.75515365600586, "global_step": 206774, "epoch": 1708} {"train_loss": -36.77436065673828, "global_step": 206775, "epoch": 1708} {"train_loss": -37.27506637573242, "global_step": 206776, "epoch": 1708} {"train_loss": -40.39000701904297, "global_step": 206777, "epoch": 1708} {"train_loss": -35.979732513427734, "global_step": 206778, "epoch": 1708} {"train_loss": -38.9215202331543, "global_step": 206779, "epoch": 1708} {"train_loss": -39.42306137084961, "global_step": 206780, "epoch": 1708} {"train_loss": -40.19062042236328, "global_step": 206781, "epoch": 1708} {"train_loss": -37.63960266113281, "global_step": 206782, "epoch": 1708} {"train_loss": -36.90425491333008, "global_step": 206783, "epoch": 1708} {"train_loss": -39.78748321533203, "global_step": 206784, "epoch": 1708} {"train_loss": -38.096778869628906, "global_step": 206785, "epoch": 1708} {"train_loss": -39.691673278808594, "global_step": 206786, "epoch": 1708} {"train_loss": -28.410202026367188, "global_step": 206787, "epoch": 1708} {"train_loss": -40.53474246568916, "global_step": 206788, "epoch": 1708, "val_loss": 2482295.75} {"train_loss": -32.93019485473633, "global_step": 206789, "epoch": 1709} {"train_loss": -31.299814224243164, "global_step": 206790, "epoch": 1709} {"train_loss": -38.176395416259766, "global_step": 206791, "epoch": 1709} {"train_loss": -32.4803466796875, "global_step": 206792, "epoch": 1709} {"train_loss": -37.8792724609375, "global_step": 206793, "epoch": 1709} {"train_loss": -36.47334289550781, "global_step": 206794, "epoch": 1709} {"train_loss": -37.13155746459961, "global_step": 206795, "epoch": 1709} {"train_loss": -34.29610061645508, "global_step": 206796, "epoch": 1709} {"train_loss": -35.4360466003418, "global_step": 206797, "epoch": 1709} {"train_loss": -36.85759353637695, "global_step": 206798, "epoch": 1709} {"train_loss": -35.9826774597168, "global_step": 206799, "epoch": 1709} {"train_loss": -35.97521209716797, "global_step": 206800, "epoch": 1709} {"train_loss": -36.75981521606445, "global_step": 206801, "epoch": 1709} {"train_loss": -34.95134353637695, "global_step": 206802, "epoch": 1709} {"train_loss": -38.72035598754883, "global_step": 206803, "epoch": 1709} {"train_loss": -37.6512451171875, "global_step": 206804, "epoch": 1709} {"train_loss": -39.46399688720703, "global_step": 206805, "epoch": 1709} {"train_loss": -36.273193359375, "global_step": 206806, "epoch": 1709} {"train_loss": -37.75210952758789, "global_step": 206807, "epoch": 1709} {"train_loss": -38.44081497192383, "global_step": 206808, "epoch": 1709} {"train_loss": -32.90422439575195, "global_step": 206809, "epoch": 1709} {"train_loss": -38.25383377075195, "global_step": 206810, "epoch": 1709} {"train_loss": -38.40919876098633, "global_step": 206811, "epoch": 1709} {"train_loss": -37.52937698364258, "global_step": 206812, "epoch": 1709} {"train_loss": -36.9634895324707, "global_step": 206813, "epoch": 1709} {"train_loss": -38.34978103637695, "global_step": 206814, "epoch": 1709} {"train_loss": -37.79560089111328, "global_step": 206815, "epoch": 1709} {"train_loss": -39.044002532958984, "global_step": 206816, "epoch": 1709} {"train_loss": -38.29450607299805, "global_step": 206817, "epoch": 1709} {"train_loss": -39.2714729309082, "global_step": 206818, "epoch": 1709} {"train_loss": -38.124664306640625, "global_step": 206819, "epoch": 1709} {"train_loss": -39.372867584228516, "global_step": 206820, "epoch": 1709} {"train_loss": -38.663578033447266, "global_step": 206821, "epoch": 1709} {"train_loss": -39.06593322753906, "global_step": 206822, "epoch": 1709} {"train_loss": -39.812896728515625, "global_step": 206823, "epoch": 1709} {"train_loss": -38.594017028808594, "global_step": 206824, "epoch": 1709} {"train_loss": -38.957496643066406, "global_step": 206825, "epoch": 1709} {"train_loss": -39.55683517456055, "global_step": 206826, "epoch": 1709} {"train_loss": -39.90185546875, "global_step": 206827, "epoch": 1709} {"train_loss": -39.50392150878906, "global_step": 206828, "epoch": 1709} {"train_loss": -39.43101119995117, "global_step": 206829, "epoch": 1709} {"train_loss": -38.80615997314453, "global_step": 206830, "epoch": 1709} {"train_loss": -39.86320877075195, "global_step": 206831, "epoch": 1709} {"train_loss": -39.007080078125, "global_step": 206832, "epoch": 1709} {"train_loss": -39.864681243896484, "global_step": 206833, "epoch": 1709} {"train_loss": -39.92076873779297, "global_step": 206834, "epoch": 1709} {"train_loss": -40.04259490966797, "global_step": 206835, "epoch": 1709} {"train_loss": -39.37849044799805, "global_step": 206836, "epoch": 1709} {"train_loss": -39.81093978881836, "global_step": 206837, "epoch": 1709} {"train_loss": -39.99447250366211, "global_step": 206838, "epoch": 1709} {"train_loss": -39.862056732177734, "global_step": 206839, "epoch": 1709} {"train_loss": -39.73393630981445, "global_step": 206840, "epoch": 1709} {"train_loss": -40.1804084777832, "global_step": 206841, "epoch": 1709} {"train_loss": -39.11866760253906, "global_step": 206842, "epoch": 1709} {"train_loss": -40.15080261230469, "global_step": 206843, "epoch": 1709} {"train_loss": -39.98064422607422, "global_step": 206844, "epoch": 1709} {"train_loss": -39.949005126953125, "global_step": 206845, "epoch": 1709} {"train_loss": -39.88425827026367, "global_step": 206846, "epoch": 1709} {"train_loss": -40.259552001953125, "global_step": 206847, "epoch": 1709} {"train_loss": -40.201324462890625, "global_step": 206848, "epoch": 1709} {"train_loss": -39.125823974609375, "global_step": 206849, "epoch": 1709} {"train_loss": -39.89794921875, "global_step": 206850, "epoch": 1709} {"train_loss": -40.770973205566406, "global_step": 206851, "epoch": 1709} {"train_loss": -40.518917083740234, "global_step": 206852, "epoch": 1709} {"train_loss": -41.20351028442383, "global_step": 206853, "epoch": 1709} {"train_loss": -39.32452392578125, "global_step": 206854, "epoch": 1709} {"train_loss": -40.50935363769531, "global_step": 206855, "epoch": 1709} {"train_loss": -40.299652099609375, "global_step": 206856, "epoch": 1709} {"train_loss": -40.58747482299805, "global_step": 206857, "epoch": 1709} {"train_loss": -40.46700668334961, "global_step": 206858, "epoch": 1709} {"train_loss": -40.843055725097656, "global_step": 206859, "epoch": 1709} {"train_loss": -41.09647750854492, "global_step": 206860, "epoch": 1709} {"train_loss": -40.85142517089844, "global_step": 206861, "epoch": 1709} {"train_loss": -40.973419189453125, "global_step": 206862, "epoch": 1709} {"train_loss": -41.10544967651367, "global_step": 206863, "epoch": 1709} {"train_loss": -41.03577423095703, "global_step": 206864, "epoch": 1709} {"train_loss": -41.4254264831543, "global_step": 206865, "epoch": 1709} {"train_loss": -40.67241668701172, "global_step": 206866, "epoch": 1709} {"train_loss": -41.451011657714844, "global_step": 206867, "epoch": 1709} {"train_loss": -40.65557861328125, "global_step": 206868, "epoch": 1709} {"train_loss": -40.874629974365234, "global_step": 206869, "epoch": 1709} {"train_loss": -41.323795318603516, "global_step": 206870, "epoch": 1709} {"train_loss": -41.17238235473633, "global_step": 206871, "epoch": 1709} {"train_loss": -40.23273468017578, "global_step": 206872, "epoch": 1709} {"train_loss": -40.770118713378906, "global_step": 206873, "epoch": 1709} {"train_loss": -40.43456268310547, "global_step": 206874, "epoch": 1709} {"train_loss": -41.17960739135742, "global_step": 206875, "epoch": 1709} {"train_loss": -40.659820556640625, "global_step": 206876, "epoch": 1709} {"train_loss": -41.468910217285156, "global_step": 206877, "epoch": 1709} {"train_loss": -41.091949462890625, "global_step": 206878, "epoch": 1709} {"train_loss": -41.5109748840332, "global_step": 206879, "epoch": 1709} {"train_loss": -41.386993408203125, "global_step": 206880, "epoch": 1709} {"train_loss": -40.26240921020508, "global_step": 206881, "epoch": 1709} {"train_loss": -41.46566390991211, "global_step": 206882, "epoch": 1709} {"train_loss": -40.844181060791016, "global_step": 206883, "epoch": 1709} {"train_loss": -41.42330551147461, "global_step": 206884, "epoch": 1709} {"train_loss": -41.59700393676758, "global_step": 206885, "epoch": 1709} {"train_loss": -41.53010940551758, "global_step": 206886, "epoch": 1709} {"train_loss": -41.024288177490234, "global_step": 206887, "epoch": 1709} {"train_loss": -40.8864860534668, "global_step": 206888, "epoch": 1709} {"train_loss": -40.92841339111328, "global_step": 206889, "epoch": 1709} {"train_loss": -41.49374008178711, "global_step": 206890, "epoch": 1709} {"train_loss": -41.400882720947266, "global_step": 206891, "epoch": 1709} {"train_loss": -41.951351165771484, "global_step": 206892, "epoch": 1709} {"train_loss": -41.08827590942383, "global_step": 206893, "epoch": 1709} {"train_loss": -41.44522476196289, "global_step": 206894, "epoch": 1709} {"train_loss": -41.47576904296875, "global_step": 206895, "epoch": 1709} {"train_loss": -41.5043830871582, "global_step": 206896, "epoch": 1709} {"train_loss": -41.45865249633789, "global_step": 206897, "epoch": 1709} {"train_loss": -41.821746826171875, "global_step": 206898, "epoch": 1709} {"train_loss": -41.378509521484375, "global_step": 206899, "epoch": 1709} {"train_loss": -41.344913482666016, "global_step": 206900, "epoch": 1709} {"train_loss": -41.527252197265625, "global_step": 206901, "epoch": 1709} {"train_loss": -41.792171478271484, "global_step": 206902, "epoch": 1709} {"train_loss": -41.42042922973633, "global_step": 206903, "epoch": 1709} {"train_loss": -41.14276123046875, "global_step": 206904, "epoch": 1709} {"train_loss": -40.57182693481445, "global_step": 206905, "epoch": 1709} {"train_loss": -41.71735382080078, "global_step": 206906, "epoch": 1709} {"train_loss": -41.32109451293945, "global_step": 206907, "epoch": 1709} {"train_loss": -39.78540802001953, "global_step": 206908, "epoch": 1709} {"train_loss": -39.56376867057863, "global_step": 206909, "epoch": 1709, "val_loss": 2406113.0} {"train_loss": -37.808937072753906, "global_step": 206910, "epoch": 1710} {"train_loss": -40.97599411010742, "global_step": 206911, "epoch": 1710} {"train_loss": -40.73516845703125, "global_step": 206912, "epoch": 1710} {"train_loss": -39.18636703491211, "global_step": 206913, "epoch": 1710} {"train_loss": -35.111385345458984, "global_step": 206914, "epoch": 1710} {"train_loss": -32.46909713745117, "global_step": 206915, "epoch": 1710} {"train_loss": -21.771711349487305, "global_step": 206916, "epoch": 1710} {"train_loss": -1.2406855821609497, "global_step": 206917, "epoch": 1710} {"train_loss": -18.785566329956055, "global_step": 206918, "epoch": 1710} {"train_loss": -35.92181396484375, "global_step": 206919, "epoch": 1710} {"train_loss": -21.188215255737305, "global_step": 206920, "epoch": 1710} {"train_loss": -34.4778938293457, "global_step": 206921, "epoch": 1710} {"train_loss": -29.392988204956055, "global_step": 206922, "epoch": 1710} {"train_loss": -34.21353530883789, "global_step": 206923, "epoch": 1710} {"train_loss": -31.080673217773438, "global_step": 206924, "epoch": 1710} {"train_loss": -34.82468795776367, "global_step": 206925, "epoch": 1710} {"train_loss": -31.739973068237305, "global_step": 206926, "epoch": 1710} {"train_loss": -37.26364517211914, "global_step": 206927, "epoch": 1710} {"train_loss": -35.918941497802734, "global_step": 206928, "epoch": 1710} {"train_loss": -35.5894660949707, "global_step": 206929, "epoch": 1710} {"train_loss": -38.3248405456543, "global_step": 206930, "epoch": 1710} {"train_loss": -36.9512939453125, "global_step": 206931, "epoch": 1710} {"train_loss": -35.86845779418945, "global_step": 206932, "epoch": 1710} {"train_loss": -38.655540466308594, "global_step": 206933, "epoch": 1710} {"train_loss": -35.183475494384766, "global_step": 206934, "epoch": 1710} {"train_loss": -37.866363525390625, "global_step": 206935, "epoch": 1710} {"train_loss": -39.17470169067383, "global_step": 206936, "epoch": 1710} {"train_loss": -37.37256622314453, "global_step": 206937, "epoch": 1710} {"train_loss": -37.77891159057617, "global_step": 206938, "epoch": 1710} {"train_loss": -38.941097259521484, "global_step": 206939, "epoch": 1710} {"train_loss": -38.51362228393555, "global_step": 206940, "epoch": 1710} {"train_loss": -38.39649200439453, "global_step": 206941, "epoch": 1710} {"train_loss": -39.333675384521484, "global_step": 206942, "epoch": 1710} {"train_loss": -38.9299201965332, "global_step": 206943, "epoch": 1710} {"train_loss": -39.950191497802734, "global_step": 206944, "epoch": 1710} {"train_loss": -39.00828170776367, "global_step": 206945, "epoch": 1710} {"train_loss": -38.722408294677734, "global_step": 206946, "epoch": 1710} {"train_loss": -39.354793548583984, "global_step": 206947, "epoch": 1710} {"train_loss": -39.163509368896484, "global_step": 206948, "epoch": 1710} {"train_loss": -40.00064468383789, "global_step": 206949, "epoch": 1710} {"train_loss": -39.45709228515625, "global_step": 206950, "epoch": 1710} {"train_loss": -39.988460540771484, "global_step": 206951, "epoch": 1710} {"train_loss": -40.073509216308594, "global_step": 206952, "epoch": 1710} {"train_loss": -40.043739318847656, "global_step": 206953, "epoch": 1710} {"train_loss": -40.42069625854492, "global_step": 206954, "epoch": 1710} {"train_loss": -39.89807891845703, "global_step": 206955, "epoch": 1710} {"train_loss": -39.9010009765625, "global_step": 206956, "epoch": 1710} {"train_loss": -40.63228988647461, "global_step": 206957, "epoch": 1710} {"train_loss": -40.0345458984375, "global_step": 206958, "epoch": 1710} {"train_loss": -39.62361145019531, "global_step": 206959, "epoch": 1710} {"train_loss": -40.045738220214844, "global_step": 206960, "epoch": 1710} {"train_loss": -40.13021469116211, "global_step": 206961, "epoch": 1710} {"train_loss": -40.483009338378906, "global_step": 206962, "epoch": 1710} {"train_loss": -40.168922424316406, "global_step": 206963, "epoch": 1710} {"train_loss": -40.59526443481445, "global_step": 206964, "epoch": 1710} {"train_loss": -40.17827224731445, "global_step": 206965, "epoch": 1710} {"train_loss": -40.965633392333984, "global_step": 206966, "epoch": 1710} {"train_loss": -40.69523239135742, "global_step": 206967, "epoch": 1710} {"train_loss": -40.53053283691406, "global_step": 206968, "epoch": 1710} {"train_loss": -40.670745849609375, "global_step": 206969, "epoch": 1710} {"train_loss": -40.93221664428711, "global_step": 206970, "epoch": 1710} {"train_loss": -40.847537994384766, "global_step": 206971, "epoch": 1710} {"train_loss": -40.723079681396484, "global_step": 206972, "epoch": 1710} {"train_loss": -41.02769088745117, "global_step": 206973, "epoch": 1710} {"train_loss": -40.68708801269531, "global_step": 206974, "epoch": 1710} {"train_loss": -40.88271713256836, "global_step": 206975, "epoch": 1710} {"train_loss": -41.12694549560547, "global_step": 206976, "epoch": 1710} {"train_loss": -40.86424255371094, "global_step": 206977, "epoch": 1710} {"train_loss": -41.18099594116211, "global_step": 206978, "epoch": 1710} {"train_loss": -41.508872985839844, "global_step": 206979, "epoch": 1710} {"train_loss": -41.00049591064453, "global_step": 206980, "epoch": 1710} {"train_loss": -41.227142333984375, "global_step": 206981, "epoch": 1710} {"train_loss": -41.02840805053711, "global_step": 206982, "epoch": 1710} {"train_loss": -41.62266159057617, "global_step": 206983, "epoch": 1710} {"train_loss": -41.18274688720703, "global_step": 206984, "epoch": 1710} {"train_loss": -41.64452362060547, "global_step": 206985, "epoch": 1710} {"train_loss": -41.83041000366211, "global_step": 206986, "epoch": 1710} {"train_loss": -41.58264923095703, "global_step": 206987, "epoch": 1710} {"train_loss": -41.308685302734375, "global_step": 206988, "epoch": 1710} {"train_loss": -41.783203125, "global_step": 206989, "epoch": 1710} {"train_loss": -41.84507369995117, "global_step": 206990, "epoch": 1710} {"train_loss": -41.15694808959961, "global_step": 206991, "epoch": 1710} {"train_loss": -41.238807678222656, "global_step": 206992, "epoch": 1710} {"train_loss": -41.816184997558594, "global_step": 206993, "epoch": 1710} {"train_loss": -41.923797607421875, "global_step": 206994, "epoch": 1710} {"train_loss": -41.31291580200195, "global_step": 206995, "epoch": 1710} {"train_loss": -41.76644515991211, "global_step": 206996, "epoch": 1710} {"train_loss": -41.71387481689453, "global_step": 206997, "epoch": 1710} {"train_loss": -41.146827697753906, "global_step": 206998, "epoch": 1710} {"train_loss": -41.84593963623047, "global_step": 206999, "epoch": 1710} {"train_loss": -41.586666107177734, "global_step": 207000, "epoch": 1710} {"train_loss": -41.56596374511719, "global_step": 207001, "epoch": 1710} {"train_loss": -41.553321838378906, "global_step": 207002, "epoch": 1710} {"train_loss": -41.854835510253906, "global_step": 207003, "epoch": 1710} {"train_loss": -42.238033294677734, "global_step": 207004, "epoch": 1710} {"train_loss": -41.777984619140625, "global_step": 207005, "epoch": 1710} {"train_loss": -41.814849853515625, "global_step": 207006, "epoch": 1710} {"train_loss": -42.046138763427734, "global_step": 207007, "epoch": 1710} {"train_loss": -42.166343688964844, "global_step": 207008, "epoch": 1710} {"train_loss": -41.83502960205078, "global_step": 207009, "epoch": 1710} {"train_loss": -41.607730865478516, "global_step": 207010, "epoch": 1710} {"train_loss": -42.43248748779297, "global_step": 207011, "epoch": 1710} {"train_loss": -41.9447135925293, "global_step": 207012, "epoch": 1710} {"train_loss": -42.0507926940918, "global_step": 207013, "epoch": 1710} {"train_loss": -41.770042419433594, "global_step": 207014, "epoch": 1710} {"train_loss": -42.31233596801758, "global_step": 207015, "epoch": 1710} {"train_loss": -42.35579299926758, "global_step": 207016, "epoch": 1710} {"train_loss": -41.87767791748047, "global_step": 207017, "epoch": 1710} {"train_loss": -42.0831298828125, "global_step": 207018, "epoch": 1710} {"train_loss": -41.92083740234375, "global_step": 207019, "epoch": 1710} {"train_loss": -41.58943557739258, "global_step": 207020, "epoch": 1710} {"train_loss": -41.79763412475586, "global_step": 207021, "epoch": 1710} {"train_loss": -41.800453186035156, "global_step": 207022, "epoch": 1710} {"train_loss": -42.439735412597656, "global_step": 207023, "epoch": 1710} {"train_loss": -42.52442169189453, "global_step": 207024, "epoch": 1710} {"train_loss": -41.82515335083008, "global_step": 207025, "epoch": 1710} {"train_loss": -42.17127227783203, "global_step": 207026, "epoch": 1710} {"train_loss": -41.70159912109375, "global_step": 207027, "epoch": 1710} {"train_loss": -41.601165771484375, "global_step": 207028, "epoch": 1710} {"train_loss": -41.19211196899414, "global_step": 207029, "epoch": 1710} {"train_loss": -39.16499491861044, "global_step": 207030, "epoch": 1710, "val_loss": 2501542.25} {"train_loss": -38.60565185546875, "global_step": 207031, "epoch": 1711} {"train_loss": -37.50541687011719, "global_step": 207032, "epoch": 1711} {"train_loss": -37.3121452331543, "global_step": 207033, "epoch": 1711} {"train_loss": -34.93720626831055, "global_step": 207034, "epoch": 1711} {"train_loss": -31.671279907226562, "global_step": 207035, "epoch": 1711} {"train_loss": -34.954017639160156, "global_step": 207036, "epoch": 1711} {"train_loss": -37.52445602416992, "global_step": 207037, "epoch": 1711} {"train_loss": -38.6041374206543, "global_step": 207038, "epoch": 1711} {"train_loss": -39.902591705322266, "global_step": 207039, "epoch": 1711} {"train_loss": -38.54302215576172, "global_step": 207040, "epoch": 1711} {"train_loss": -38.74127197265625, "global_step": 207041, "epoch": 1711} {"train_loss": -40.03910446166992, "global_step": 207042, "epoch": 1711} {"train_loss": -40.325408935546875, "global_step": 207043, "epoch": 1711} {"train_loss": -40.77547836303711, "global_step": 207044, "epoch": 1711} {"train_loss": -40.1218147277832, "global_step": 207045, "epoch": 1711} {"train_loss": -39.67660140991211, "global_step": 207046, "epoch": 1711} {"train_loss": -40.5285758972168, "global_step": 207047, "epoch": 1711} {"train_loss": -40.1702880859375, "global_step": 207048, "epoch": 1711} {"train_loss": -40.7170524597168, "global_step": 207049, "epoch": 1711} {"train_loss": -40.739959716796875, "global_step": 207050, "epoch": 1711} {"train_loss": -40.78419494628906, "global_step": 207051, "epoch": 1711} {"train_loss": -41.200313568115234, "global_step": 207052, "epoch": 1711} {"train_loss": -40.561981201171875, "global_step": 207053, "epoch": 1711} {"train_loss": -41.148738861083984, "global_step": 207054, "epoch": 1711} {"train_loss": -41.15264129638672, "global_step": 207055, "epoch": 1711} {"train_loss": -40.187530517578125, "global_step": 207056, "epoch": 1711} {"train_loss": -41.044185638427734, "global_step": 207057, "epoch": 1711} {"train_loss": -40.856807708740234, "global_step": 207058, "epoch": 1711} {"train_loss": -41.658504486083984, "global_step": 207059, "epoch": 1711} {"train_loss": -40.96067428588867, "global_step": 207060, "epoch": 1711} {"train_loss": -41.55012130737305, "global_step": 207061, "epoch": 1711} {"train_loss": -41.569637298583984, "global_step": 207062, "epoch": 1711} {"train_loss": -41.381771087646484, "global_step": 207063, "epoch": 1711} {"train_loss": -41.67717361450195, "global_step": 207064, "epoch": 1711} {"train_loss": -41.6181526184082, "global_step": 207065, "epoch": 1711} {"train_loss": -41.88303756713867, "global_step": 207066, "epoch": 1711} {"train_loss": -41.60392761230469, "global_step": 207067, "epoch": 1711} {"train_loss": -41.57289123535156, "global_step": 207068, "epoch": 1711} {"train_loss": -42.05739974975586, "global_step": 207069, "epoch": 1711} {"train_loss": -41.56018829345703, "global_step": 207070, "epoch": 1711} {"train_loss": -42.09401321411133, "global_step": 207071, "epoch": 1711} {"train_loss": -41.79834747314453, "global_step": 207072, "epoch": 1711} {"train_loss": -41.892250061035156, "global_step": 207073, "epoch": 1711} {"train_loss": -41.752418518066406, "global_step": 207074, "epoch": 1711} {"train_loss": -41.57016372680664, "global_step": 207075, "epoch": 1711} {"train_loss": -41.53409957885742, "global_step": 207076, "epoch": 1711} {"train_loss": -42.00277328491211, "global_step": 207077, "epoch": 1711} {"train_loss": -42.18720245361328, "global_step": 207078, "epoch": 1711} {"train_loss": -42.51063919067383, "global_step": 207079, "epoch": 1711} {"train_loss": -42.15619659423828, "global_step": 207080, "epoch": 1711} {"train_loss": -42.2342414855957, "global_step": 207081, "epoch": 1711} {"train_loss": -41.86417770385742, "global_step": 207082, "epoch": 1711} {"train_loss": -42.376094818115234, "global_step": 207083, "epoch": 1711} {"train_loss": -42.25298309326172, "global_step": 207084, "epoch": 1711} {"train_loss": -41.911949157714844, "global_step": 207085, "epoch": 1711} {"train_loss": -42.30735397338867, "global_step": 207086, "epoch": 1711} {"train_loss": -42.39717483520508, "global_step": 207087, "epoch": 1711} {"train_loss": -41.86869430541992, "global_step": 207088, "epoch": 1711} {"train_loss": -42.2697868347168, "global_step": 207089, "epoch": 1711} {"train_loss": -42.21915817260742, "global_step": 207090, "epoch": 1711} {"train_loss": -42.24155807495117, "global_step": 207091, "epoch": 1711} {"train_loss": -42.356590270996094, "global_step": 207092, "epoch": 1711} {"train_loss": -42.039390563964844, "global_step": 207093, "epoch": 1711} {"train_loss": -41.69234848022461, "global_step": 207094, "epoch": 1711} {"train_loss": -41.740474700927734, "global_step": 207095, "epoch": 1711} {"train_loss": -41.660194396972656, "global_step": 207096, "epoch": 1711} {"train_loss": -42.40119552612305, "global_step": 207097, "epoch": 1711} {"train_loss": -42.0413703918457, "global_step": 207098, "epoch": 1711} {"train_loss": -42.52775955200195, "global_step": 207099, "epoch": 1711} {"train_loss": -42.088165283203125, "global_step": 207100, "epoch": 1711} {"train_loss": -42.28361129760742, "global_step": 207101, "epoch": 1711} {"train_loss": -41.7808837890625, "global_step": 207102, "epoch": 1711} {"train_loss": -41.94948959350586, "global_step": 207103, "epoch": 1711} {"train_loss": -42.125152587890625, "global_step": 207104, "epoch": 1711} {"train_loss": -41.91456985473633, "global_step": 207105, "epoch": 1711} {"train_loss": -41.85870361328125, "global_step": 207106, "epoch": 1711} {"train_loss": -41.9438591003418, "global_step": 207107, "epoch": 1711} {"train_loss": -42.02680587768555, "global_step": 207108, "epoch": 1711} {"train_loss": -41.99434280395508, "global_step": 207109, "epoch": 1711} {"train_loss": -41.107906341552734, "global_step": 207110, "epoch": 1711} {"train_loss": -42.618247985839844, "global_step": 207111, "epoch": 1711} {"train_loss": -42.4000244140625, "global_step": 207112, "epoch": 1711} {"train_loss": -42.284671783447266, "global_step": 207113, "epoch": 1711} {"train_loss": -42.40251159667969, "global_step": 207114, "epoch": 1711} {"train_loss": -42.19480514526367, "global_step": 207115, "epoch": 1711} {"train_loss": -41.694740295410156, "global_step": 207116, "epoch": 1711} {"train_loss": -42.228145599365234, "global_step": 207117, "epoch": 1711} {"train_loss": -42.13711166381836, "global_step": 207118, "epoch": 1711} {"train_loss": -40.80410385131836, "global_step": 207119, "epoch": 1711} {"train_loss": -37.30294418334961, "global_step": 207120, "epoch": 1711} {"train_loss": -32.48006057739258, "global_step": 207121, "epoch": 1711} {"train_loss": -31.67262077331543, "global_step": 207122, "epoch": 1711} {"train_loss": -31.881208419799805, "global_step": 207123, "epoch": 1711} {"train_loss": -35.846126556396484, "global_step": 207124, "epoch": 1711} {"train_loss": -37.650875091552734, "global_step": 207125, "epoch": 1711} {"train_loss": -38.91584396362305, "global_step": 207126, "epoch": 1711} {"train_loss": -34.39851760864258, "global_step": 207127, "epoch": 1711} {"train_loss": -39.788307189941406, "global_step": 207128, "epoch": 1711} {"train_loss": -38.82381820678711, "global_step": 207129, "epoch": 1711} {"train_loss": -38.297054290771484, "global_step": 207130, "epoch": 1711} {"train_loss": -40.173484802246094, "global_step": 207131, "epoch": 1711} {"train_loss": -38.61579513549805, "global_step": 207132, "epoch": 1711} {"train_loss": -40.229698181152344, "global_step": 207133, "epoch": 1711} {"train_loss": -40.197715759277344, "global_step": 207134, "epoch": 1711} {"train_loss": -39.84538650512695, "global_step": 207135, "epoch": 1711} {"train_loss": -38.54943084716797, "global_step": 207136, "epoch": 1711} {"train_loss": -41.39076614379883, "global_step": 207137, "epoch": 1711} {"train_loss": -40.53983688354492, "global_step": 207138, "epoch": 1711} {"train_loss": -41.01496124267578, "global_step": 207139, "epoch": 1711} {"train_loss": -41.00569534301758, "global_step": 207140, "epoch": 1711} {"train_loss": -40.92977523803711, "global_step": 207141, "epoch": 1711} {"train_loss": -41.03118896484375, "global_step": 207142, "epoch": 1711} {"train_loss": -40.88624954223633, "global_step": 207143, "epoch": 1711} {"train_loss": -40.70412826538086, "global_step": 207144, "epoch": 1711} {"train_loss": -40.76555252075195, "global_step": 207145, "epoch": 1711} {"train_loss": -41.35942459106445, "global_step": 207146, "epoch": 1711} {"train_loss": -40.48400115966797, "global_step": 207147, "epoch": 1711} {"train_loss": -40.7219123840332, "global_step": 207148, "epoch": 1711} {"train_loss": -41.15894317626953, "global_step": 207149, "epoch": 1711} {"train_loss": -41.360626220703125, "global_step": 207150, "epoch": 1711} {"train_loss": -40.55147079593879, "global_step": 207151, "epoch": 1711, "val_loss": 2526347.25} {"train_loss": -41.5948486328125, "global_step": 207152, "epoch": 1712} {"train_loss": -41.14137649536133, "global_step": 207153, "epoch": 1712} {"train_loss": -41.63356399536133, "global_step": 207154, "epoch": 1712} {"train_loss": -41.24890899658203, "global_step": 207155, "epoch": 1712} {"train_loss": -41.37325668334961, "global_step": 207156, "epoch": 1712} {"train_loss": -41.8969841003418, "global_step": 207157, "epoch": 1712} {"train_loss": -41.41933059692383, "global_step": 207158, "epoch": 1712} {"train_loss": -41.67682647705078, "global_step": 207159, "epoch": 1712} {"train_loss": -41.75519561767578, "global_step": 207160, "epoch": 1712} {"train_loss": -41.191829681396484, "global_step": 207161, "epoch": 1712} {"train_loss": -42.02659225463867, "global_step": 207162, "epoch": 1712} {"train_loss": -41.564300537109375, "global_step": 207163, "epoch": 1712} {"train_loss": -41.22431945800781, "global_step": 207164, "epoch": 1712} {"train_loss": -42.01980209350586, "global_step": 207165, "epoch": 1712} {"train_loss": -41.44506072998047, "global_step": 207166, "epoch": 1712} {"train_loss": -41.751434326171875, "global_step": 207167, "epoch": 1712} {"train_loss": -41.72658920288086, "global_step": 207168, "epoch": 1712} {"train_loss": -40.09682083129883, "global_step": 207169, "epoch": 1712} {"train_loss": -41.558101654052734, "global_step": 207170, "epoch": 1712} {"train_loss": -41.63423538208008, "global_step": 207171, "epoch": 1712} {"train_loss": -41.544700622558594, "global_step": 207172, "epoch": 1712} {"train_loss": -41.9735107421875, "global_step": 207173, "epoch": 1712} {"train_loss": -42.05852127075195, "global_step": 207174, "epoch": 1712} {"train_loss": -42.440670013427734, "global_step": 207175, "epoch": 1712} {"train_loss": -42.06105422973633, "global_step": 207176, "epoch": 1712} {"train_loss": -41.68422317504883, "global_step": 207177, "epoch": 1712} {"train_loss": -42.68592071533203, "global_step": 207178, "epoch": 1712} {"train_loss": -41.93464279174805, "global_step": 207179, "epoch": 1712} {"train_loss": -41.815486907958984, "global_step": 207180, "epoch": 1712} {"train_loss": -42.4595832824707, "global_step": 207181, "epoch": 1712} {"train_loss": -41.9075813293457, "global_step": 207182, "epoch": 1712} {"train_loss": -41.90504455566406, "global_step": 207183, "epoch": 1712} {"train_loss": -42.179908752441406, "global_step": 207184, "epoch": 1712} {"train_loss": -41.66361618041992, "global_step": 207185, "epoch": 1712} {"train_loss": -41.39818572998047, "global_step": 207186, "epoch": 1712} {"train_loss": -41.65813064575195, "global_step": 207187, "epoch": 1712} {"train_loss": -41.84487533569336, "global_step": 207188, "epoch": 1712} {"train_loss": -42.025691986083984, "global_step": 207189, "epoch": 1712} {"train_loss": -42.20417785644531, "global_step": 207190, "epoch": 1712} {"train_loss": -41.76353073120117, "global_step": 207191, "epoch": 1712} {"train_loss": -41.6356086730957, "global_step": 207192, "epoch": 1712} {"train_loss": -41.41506576538086, "global_step": 207193, "epoch": 1712} {"train_loss": -42.02035140991211, "global_step": 207194, "epoch": 1712} {"train_loss": -41.9781379699707, "global_step": 207195, "epoch": 1712} {"train_loss": -40.4567985534668, "global_step": 207196, "epoch": 1712} {"train_loss": -39.9311408996582, "global_step": 207197, "epoch": 1712} {"train_loss": -39.60490036010742, "global_step": 207198, "epoch": 1712} {"train_loss": -39.949310302734375, "global_step": 207199, "epoch": 1712} {"train_loss": -41.000728607177734, "global_step": 207200, "epoch": 1712} {"train_loss": -38.912139892578125, "global_step": 207201, "epoch": 1712} {"train_loss": -40.9003791809082, "global_step": 207202, "epoch": 1712} {"train_loss": -41.497474670410156, "global_step": 207203, "epoch": 1712} {"train_loss": -38.295692443847656, "global_step": 207204, "epoch": 1712} {"train_loss": -38.16622543334961, "global_step": 207205, "epoch": 1712} {"train_loss": -41.29537582397461, "global_step": 207206, "epoch": 1712} {"train_loss": -40.79303741455078, "global_step": 207207, "epoch": 1712} {"train_loss": -40.57767868041992, "global_step": 207208, "epoch": 1712} {"train_loss": -40.49818801879883, "global_step": 207209, "epoch": 1712} {"train_loss": -40.672882080078125, "global_step": 207210, "epoch": 1712} {"train_loss": -39.442665100097656, "global_step": 207211, "epoch": 1712} {"train_loss": -39.7220344543457, "global_step": 207212, "epoch": 1712} {"train_loss": -40.74270248413086, "global_step": 207213, "epoch": 1712} {"train_loss": -41.48735427856445, "global_step": 207214, "epoch": 1712} {"train_loss": -39.879512786865234, "global_step": 207215, "epoch": 1712} {"train_loss": -40.80418395996094, "global_step": 207216, "epoch": 1712} {"train_loss": -41.01807403564453, "global_step": 207217, "epoch": 1712} {"train_loss": -40.724937438964844, "global_step": 207218, "epoch": 1712} {"train_loss": -41.17864990234375, "global_step": 207219, "epoch": 1712} {"train_loss": -40.360450744628906, "global_step": 207220, "epoch": 1712} {"train_loss": -41.62052536010742, "global_step": 207221, "epoch": 1712} {"train_loss": -41.55819320678711, "global_step": 207222, "epoch": 1712} {"train_loss": -40.28226089477539, "global_step": 207223, "epoch": 1712} {"train_loss": -40.188682556152344, "global_step": 207224, "epoch": 1712} {"train_loss": -41.39069366455078, "global_step": 207225, "epoch": 1712} {"train_loss": -41.24140930175781, "global_step": 207226, "epoch": 1712} {"train_loss": -40.60246658325195, "global_step": 207227, "epoch": 1712} {"train_loss": -39.907691955566406, "global_step": 207228, "epoch": 1712} {"train_loss": -41.24436569213867, "global_step": 207229, "epoch": 1712} {"train_loss": -40.66259002685547, "global_step": 207230, "epoch": 1712} {"train_loss": -41.01182556152344, "global_step": 207231, "epoch": 1712} {"train_loss": -41.28983688354492, "global_step": 207232, "epoch": 1712} {"train_loss": -40.868896484375, "global_step": 207233, "epoch": 1712} {"train_loss": -40.1649284362793, "global_step": 207234, "epoch": 1712} {"train_loss": -42.2770881652832, "global_step": 207235, "epoch": 1712} {"train_loss": -40.01518630981445, "global_step": 207236, "epoch": 1712} {"train_loss": -40.21643829345703, "global_step": 207237, "epoch": 1712} {"train_loss": -41.2506103515625, "global_step": 207238, "epoch": 1712} {"train_loss": -40.15083694458008, "global_step": 207239, "epoch": 1712} {"train_loss": -41.35770797729492, "global_step": 207240, "epoch": 1712} {"train_loss": -39.603477478027344, "global_step": 207241, "epoch": 1712} {"train_loss": -40.4559211730957, "global_step": 207242, "epoch": 1712} {"train_loss": -40.192684173583984, "global_step": 207243, "epoch": 1712} {"train_loss": -39.37064743041992, "global_step": 207244, "epoch": 1712} {"train_loss": -38.11083221435547, "global_step": 207245, "epoch": 1712} {"train_loss": -40.96546936035156, "global_step": 207246, "epoch": 1712} {"train_loss": -41.2378044128418, "global_step": 207247, "epoch": 1712} {"train_loss": -40.545654296875, "global_step": 207248, "epoch": 1712} {"train_loss": -39.21261215209961, "global_step": 207249, "epoch": 1712} {"train_loss": -37.61630630493164, "global_step": 207250, "epoch": 1712} {"train_loss": -40.32305908203125, "global_step": 207251, "epoch": 1712} {"train_loss": -39.804744720458984, "global_step": 207252, "epoch": 1712} {"train_loss": -35.433013916015625, "global_step": 207253, "epoch": 1712} {"train_loss": -39.901344299316406, "global_step": 207254, "epoch": 1712} {"train_loss": -36.5417594909668, "global_step": 207255, "epoch": 1712} {"train_loss": -39.66770553588867, "global_step": 207256, "epoch": 1712} {"train_loss": -40.036964416503906, "global_step": 207257, "epoch": 1712} {"train_loss": -39.40341567993164, "global_step": 207258, "epoch": 1712} {"train_loss": -40.53056335449219, "global_step": 207259, "epoch": 1712} {"train_loss": -39.53792190551758, "global_step": 207260, "epoch": 1712} {"train_loss": -37.506404876708984, "global_step": 207261, "epoch": 1712} {"train_loss": -40.32434844970703, "global_step": 207262, "epoch": 1712} {"train_loss": -39.909584045410156, "global_step": 207263, "epoch": 1712} {"train_loss": -38.32269287109375, "global_step": 207264, "epoch": 1712} {"train_loss": -36.43906784057617, "global_step": 207265, "epoch": 1712} {"train_loss": -40.137611389160156, "global_step": 207266, "epoch": 1712} {"train_loss": -32.19455337524414, "global_step": 207267, "epoch": 1712} {"train_loss": -39.504085540771484, "global_step": 207268, "epoch": 1712} {"train_loss": -39.4852180480957, "global_step": 207269, "epoch": 1712} {"train_loss": -37.9267692565918, "global_step": 207270, "epoch": 1712} {"train_loss": -32.221168518066406, "global_step": 207271, "epoch": 1712} {"train_loss": -40.42810246175971, "global_step": 207272, "epoch": 1712, "val_loss": 2608995.5} {"train_loss": -33.36436080932617, "global_step": 207273, "epoch": 1713} {"train_loss": -36.263912200927734, "global_step": 207274, "epoch": 1713} {"train_loss": -33.81251907348633, "global_step": 207275, "epoch": 1713} {"train_loss": -36.321346282958984, "global_step": 207276, "epoch": 1713} {"train_loss": -36.38774490356445, "global_step": 207277, "epoch": 1713} {"train_loss": -38.37566375732422, "global_step": 207278, "epoch": 1713} {"train_loss": -35.954795837402344, "global_step": 207279, "epoch": 1713} {"train_loss": -36.48467254638672, "global_step": 207280, "epoch": 1713} {"train_loss": -38.92570114135742, "global_step": 207281, "epoch": 1713} {"train_loss": -37.10538101196289, "global_step": 207282, "epoch": 1713} {"train_loss": -31.650833129882812, "global_step": 207283, "epoch": 1713} {"train_loss": -36.358604431152344, "global_step": 207284, "epoch": 1713} {"train_loss": -38.42094802856445, "global_step": 207285, "epoch": 1713} {"train_loss": -37.38705062866211, "global_step": 207286, "epoch": 1713} {"train_loss": -37.32558059692383, "global_step": 207287, "epoch": 1713} {"train_loss": -38.7429313659668, "global_step": 207288, "epoch": 1713} {"train_loss": -39.1401481628418, "global_step": 207289, "epoch": 1713} {"train_loss": -38.5062141418457, "global_step": 207290, "epoch": 1713} {"train_loss": -39.3358268737793, "global_step": 207291, "epoch": 1713} {"train_loss": -36.368831634521484, "global_step": 207292, "epoch": 1713} {"train_loss": -38.35175323486328, "global_step": 207293, "epoch": 1713} {"train_loss": -37.79802703857422, "global_step": 207294, "epoch": 1713} {"train_loss": -38.64958572387695, "global_step": 207295, "epoch": 1713} {"train_loss": -39.692195892333984, "global_step": 207296, "epoch": 1713} {"train_loss": -38.656654357910156, "global_step": 207297, "epoch": 1713} {"train_loss": -39.54354476928711, "global_step": 207298, "epoch": 1713} {"train_loss": -39.64857864379883, "global_step": 207299, "epoch": 1713} {"train_loss": -38.571895599365234, "global_step": 207300, "epoch": 1713} {"train_loss": -39.843177795410156, "global_step": 207301, "epoch": 1713} {"train_loss": -39.26143264770508, "global_step": 207302, "epoch": 1713} {"train_loss": -39.487117767333984, "global_step": 207303, "epoch": 1713} {"train_loss": -39.94738006591797, "global_step": 207304, "epoch": 1713} {"train_loss": -39.80331039428711, "global_step": 207305, "epoch": 1713} {"train_loss": -39.64388656616211, "global_step": 207306, "epoch": 1713} {"train_loss": -39.91547775268555, "global_step": 207307, "epoch": 1713} {"train_loss": -38.9560546875, "global_step": 207308, "epoch": 1713} {"train_loss": -40.27959442138672, "global_step": 207309, "epoch": 1713} {"train_loss": -39.89054489135742, "global_step": 207310, "epoch": 1713} {"train_loss": -38.90534591674805, "global_step": 207311, "epoch": 1713} {"train_loss": -39.90003204345703, "global_step": 207312, "epoch": 1713} {"train_loss": -40.13280487060547, "global_step": 207313, "epoch": 1713} {"train_loss": -39.740177154541016, "global_step": 207314, "epoch": 1713} {"train_loss": -40.149330139160156, "global_step": 207315, "epoch": 1713} {"train_loss": -40.119510650634766, "global_step": 207316, "epoch": 1713} {"train_loss": -39.36427688598633, "global_step": 207317, "epoch": 1713} {"train_loss": -40.43859100341797, "global_step": 207318, "epoch": 1713} {"train_loss": -40.0096549987793, "global_step": 207319, "epoch": 1713} {"train_loss": -40.019344329833984, "global_step": 207320, "epoch": 1713} {"train_loss": -40.665489196777344, "global_step": 207321, "epoch": 1713} {"train_loss": -40.490699768066406, "global_step": 207322, "epoch": 1713} {"train_loss": -40.00276565551758, "global_step": 207323, "epoch": 1713} {"train_loss": -39.6547737121582, "global_step": 207324, "epoch": 1713} {"train_loss": -40.694427490234375, "global_step": 207325, "epoch": 1713} {"train_loss": -39.65045928955078, "global_step": 207326, "epoch": 1713} {"train_loss": -40.19682693481445, "global_step": 207327, "epoch": 1713} {"train_loss": -37.2639274597168, "global_step": 207328, "epoch": 1713} {"train_loss": -40.815452575683594, "global_step": 207329, "epoch": 1713} {"train_loss": -40.50752258300781, "global_step": 207330, "epoch": 1713} {"train_loss": -40.65874099731445, "global_step": 207331, "epoch": 1713} {"train_loss": -39.245662689208984, "global_step": 207332, "epoch": 1713} {"train_loss": -40.522823333740234, "global_step": 207333, "epoch": 1713} {"train_loss": -37.97785186767578, "global_step": 207334, "epoch": 1713} {"train_loss": -40.45924758911133, "global_step": 207335, "epoch": 1713} {"train_loss": -40.5940055847168, "global_step": 207336, "epoch": 1713} {"train_loss": -40.31429672241211, "global_step": 207337, "epoch": 1713} {"train_loss": -39.24530792236328, "global_step": 207338, "epoch": 1713} {"train_loss": -40.50361251831055, "global_step": 207339, "epoch": 1713} {"train_loss": -39.26044845581055, "global_step": 207340, "epoch": 1713} {"train_loss": -40.44649887084961, "global_step": 207341, "epoch": 1713} {"train_loss": -39.77250289916992, "global_step": 207342, "epoch": 1713} {"train_loss": -40.70526123046875, "global_step": 207343, "epoch": 1713} {"train_loss": -40.558223724365234, "global_step": 207344, "epoch": 1713} {"train_loss": -40.294044494628906, "global_step": 207345, "epoch": 1713} {"train_loss": -41.11403274536133, "global_step": 207346, "epoch": 1713} {"train_loss": -40.593421936035156, "global_step": 207347, "epoch": 1713} {"train_loss": -40.67014694213867, "global_step": 207348, "epoch": 1713} {"train_loss": -40.90730667114258, "global_step": 207349, "epoch": 1713} {"train_loss": -40.5195198059082, "global_step": 207350, "epoch": 1713} {"train_loss": -39.33198165893555, "global_step": 207351, "epoch": 1713} {"train_loss": -41.254791259765625, "global_step": 207352, "epoch": 1713} {"train_loss": -40.401058197021484, "global_step": 207353, "epoch": 1713} {"train_loss": -41.23897933959961, "global_step": 207354, "epoch": 1713} {"train_loss": -40.97562789916992, "global_step": 207355, "epoch": 1713} {"train_loss": -41.66704559326172, "global_step": 207356, "epoch": 1713} {"train_loss": -40.606712341308594, "global_step": 207357, "epoch": 1713} {"train_loss": -40.7122688293457, "global_step": 207358, "epoch": 1713} {"train_loss": -39.688297271728516, "global_step": 207359, "epoch": 1713} {"train_loss": -40.32038879394531, "global_step": 207360, "epoch": 1713} {"train_loss": -40.68062210083008, "global_step": 207361, "epoch": 1713} {"train_loss": -41.553707122802734, "global_step": 207362, "epoch": 1713} {"train_loss": -41.27260208129883, "global_step": 207363, "epoch": 1713} {"train_loss": -41.69989776611328, "global_step": 207364, "epoch": 1713} {"train_loss": -41.45912551879883, "global_step": 207365, "epoch": 1713} {"train_loss": -41.65242004394531, "global_step": 207366, "epoch": 1713} {"train_loss": -41.36546325683594, "global_step": 207367, "epoch": 1713} {"train_loss": -41.072975158691406, "global_step": 207368, "epoch": 1713} {"train_loss": -42.088897705078125, "global_step": 207369, "epoch": 1713} {"train_loss": -41.37815475463867, "global_step": 207370, "epoch": 1713} {"train_loss": -40.90223693847656, "global_step": 207371, "epoch": 1713} {"train_loss": -40.37540054321289, "global_step": 207372, "epoch": 1713} {"train_loss": -41.76812744140625, "global_step": 207373, "epoch": 1713} {"train_loss": -40.99665069580078, "global_step": 207374, "epoch": 1713} {"train_loss": -39.72336196899414, "global_step": 207375, "epoch": 1713} {"train_loss": -40.85900115966797, "global_step": 207376, "epoch": 1713} {"train_loss": -40.61376953125, "global_step": 207377, "epoch": 1713} {"train_loss": -41.27594757080078, "global_step": 207378, "epoch": 1713} {"train_loss": -41.024139404296875, "global_step": 207379, "epoch": 1713} {"train_loss": -41.7037467956543, "global_step": 207380, "epoch": 1713} {"train_loss": -41.64176559448242, "global_step": 207381, "epoch": 1713} {"train_loss": -41.03517532348633, "global_step": 207382, "epoch": 1713} {"train_loss": -41.064334869384766, "global_step": 207383, "epoch": 1713} {"train_loss": -40.267818450927734, "global_step": 207384, "epoch": 1713} {"train_loss": -39.11330032348633, "global_step": 207385, "epoch": 1713} {"train_loss": -41.53520202636719, "global_step": 207386, "epoch": 1713} {"train_loss": -41.65435791015625, "global_step": 207387, "epoch": 1713} {"train_loss": -40.65860366821289, "global_step": 207388, "epoch": 1713} {"train_loss": -41.46232604980469, "global_step": 207389, "epoch": 1713} {"train_loss": -40.65885543823242, "global_step": 207390, "epoch": 1713} {"train_loss": -39.994773864746094, "global_step": 207391, "epoch": 1713} {"train_loss": -41.32204818725586, "global_step": 207392, "epoch": 1713} {"train_loss": -39.737195669126905, "global_step": 207393, "epoch": 1713, "val_loss": 2825769.75} {"train_loss": -40.8420524597168, "global_step": 207394, "epoch": 1714} {"train_loss": -40.900997161865234, "global_step": 207395, "epoch": 1714} {"train_loss": -40.00645065307617, "global_step": 207396, "epoch": 1714} {"train_loss": -40.226863861083984, "global_step": 207397, "epoch": 1714} {"train_loss": -41.038665771484375, "global_step": 207398, "epoch": 1714} {"train_loss": -41.337398529052734, "global_step": 207399, "epoch": 1714} {"train_loss": -41.13918685913086, "global_step": 207400, "epoch": 1714} {"train_loss": -38.98984909057617, "global_step": 207401, "epoch": 1714} {"train_loss": -37.9849967956543, "global_step": 207402, "epoch": 1714} {"train_loss": -40.6386833190918, "global_step": 207403, "epoch": 1714} {"train_loss": -39.2840461730957, "global_step": 207404, "epoch": 1714} {"train_loss": -39.490474700927734, "global_step": 207405, "epoch": 1714} {"train_loss": -39.17142868041992, "global_step": 207406, "epoch": 1714} {"train_loss": -38.606597900390625, "global_step": 207407, "epoch": 1714} {"train_loss": -36.727386474609375, "global_step": 207408, "epoch": 1714} {"train_loss": -37.61528015136719, "global_step": 207409, "epoch": 1714} {"train_loss": -39.0965690612793, "global_step": 207410, "epoch": 1714} {"train_loss": -39.6993293762207, "global_step": 207411, "epoch": 1714} {"train_loss": -36.01981735229492, "global_step": 207412, "epoch": 1714} {"train_loss": -34.610347747802734, "global_step": 207413, "epoch": 1714} {"train_loss": -35.90663528442383, "global_step": 207414, "epoch": 1714} {"train_loss": -39.42681884765625, "global_step": 207415, "epoch": 1714} {"train_loss": -39.65165328979492, "global_step": 207416, "epoch": 1714} {"train_loss": -34.76108932495117, "global_step": 207417, "epoch": 1714} {"train_loss": -40.21113204956055, "global_step": 207418, "epoch": 1714} {"train_loss": -37.6246223449707, "global_step": 207419, "epoch": 1714} {"train_loss": -38.169700622558594, "global_step": 207420, "epoch": 1714} {"train_loss": -38.37861251831055, "global_step": 207421, "epoch": 1714} {"train_loss": -36.58625411987305, "global_step": 207422, "epoch": 1714} {"train_loss": -38.752681732177734, "global_step": 207423, "epoch": 1714} {"train_loss": -38.899436950683594, "global_step": 207424, "epoch": 1714} {"train_loss": -36.30535888671875, "global_step": 207425, "epoch": 1714} {"train_loss": -40.12018966674805, "global_step": 207426, "epoch": 1714} {"train_loss": -39.999977111816406, "global_step": 207427, "epoch": 1714} {"train_loss": -39.5230712890625, "global_step": 207428, "epoch": 1714} {"train_loss": -40.09392547607422, "global_step": 207429, "epoch": 1714} {"train_loss": -40.57804489135742, "global_step": 207430, "epoch": 1714} {"train_loss": -39.80666732788086, "global_step": 207431, "epoch": 1714} {"train_loss": -41.083431243896484, "global_step": 207432, "epoch": 1714} {"train_loss": -39.583106994628906, "global_step": 207433, "epoch": 1714} {"train_loss": -40.9341926574707, "global_step": 207434, "epoch": 1714} {"train_loss": -40.36979293823242, "global_step": 207435, "epoch": 1714} {"train_loss": -40.72827911376953, "global_step": 207436, "epoch": 1714} {"train_loss": -40.6046257019043, "global_step": 207437, "epoch": 1714} {"train_loss": -40.999366760253906, "global_step": 207438, "epoch": 1714} {"train_loss": -41.08261489868164, "global_step": 207439, "epoch": 1714} {"train_loss": -39.95626449584961, "global_step": 207440, "epoch": 1714} {"train_loss": -40.69704055786133, "global_step": 207441, "epoch": 1714} {"train_loss": -40.54117965698242, "global_step": 207442, "epoch": 1714} {"train_loss": -40.219879150390625, "global_step": 207443, "epoch": 1714} {"train_loss": -41.2893180847168, "global_step": 207444, "epoch": 1714} {"train_loss": -40.61857223510742, "global_step": 207445, "epoch": 1714} {"train_loss": -41.02218246459961, "global_step": 207446, "epoch": 1714} {"train_loss": -41.0281982421875, "global_step": 207447, "epoch": 1714} {"train_loss": -41.18083190917969, "global_step": 207448, "epoch": 1714} {"train_loss": -41.15729904174805, "global_step": 207449, "epoch": 1714} {"train_loss": -40.81739044189453, "global_step": 207450, "epoch": 1714} {"train_loss": -41.468116760253906, "global_step": 207451, "epoch": 1714} {"train_loss": -39.15413284301758, "global_step": 207452, "epoch": 1714} {"train_loss": -40.531551361083984, "global_step": 207453, "epoch": 1714} {"train_loss": -41.40018844604492, "global_step": 207454, "epoch": 1714} {"train_loss": -39.999691009521484, "global_step": 207455, "epoch": 1714} {"train_loss": -41.25709915161133, "global_step": 207456, "epoch": 1714} {"train_loss": -41.5770149230957, "global_step": 207457, "epoch": 1714} {"train_loss": -41.527767181396484, "global_step": 207458, "epoch": 1714} {"train_loss": -40.80183029174805, "global_step": 207459, "epoch": 1714} {"train_loss": -40.76776885986328, "global_step": 207460, "epoch": 1714} {"train_loss": -41.351715087890625, "global_step": 207461, "epoch": 1714} {"train_loss": -41.99534225463867, "global_step": 207462, "epoch": 1714} {"train_loss": -41.43836975097656, "global_step": 207463, "epoch": 1714} {"train_loss": -41.1736946105957, "global_step": 207464, "epoch": 1714} {"train_loss": -41.47219467163086, "global_step": 207465, "epoch": 1714} {"train_loss": -41.19913864135742, "global_step": 207466, "epoch": 1714} {"train_loss": -41.387779235839844, "global_step": 207467, "epoch": 1714} {"train_loss": -41.745277404785156, "global_step": 207468, "epoch": 1714} {"train_loss": -41.24374008178711, "global_step": 207469, "epoch": 1714} {"train_loss": -41.08792495727539, "global_step": 207470, "epoch": 1714} {"train_loss": -41.09054946899414, "global_step": 207471, "epoch": 1714} {"train_loss": -41.25916290283203, "global_step": 207472, "epoch": 1714} {"train_loss": -40.8342170715332, "global_step": 207473, "epoch": 1714} {"train_loss": -41.2856559753418, "global_step": 207474, "epoch": 1714} {"train_loss": -41.12384796142578, "global_step": 207475, "epoch": 1714} {"train_loss": -40.8789176940918, "global_step": 207476, "epoch": 1714} {"train_loss": -41.52467727661133, "global_step": 207477, "epoch": 1714} {"train_loss": -41.108272552490234, "global_step": 207478, "epoch": 1714} {"train_loss": -39.98953628540039, "global_step": 207479, "epoch": 1714} {"train_loss": -41.5621452331543, "global_step": 207480, "epoch": 1714} {"train_loss": -40.06598663330078, "global_step": 207481, "epoch": 1714} {"train_loss": -41.5871696472168, "global_step": 207482, "epoch": 1714} {"train_loss": -41.02144241333008, "global_step": 207483, "epoch": 1714} {"train_loss": -41.21988296508789, "global_step": 207484, "epoch": 1714} {"train_loss": -40.479591369628906, "global_step": 207485, "epoch": 1714} {"train_loss": -40.43365478515625, "global_step": 207486, "epoch": 1714} {"train_loss": -41.37322998046875, "global_step": 207487, "epoch": 1714} {"train_loss": -41.492584228515625, "global_step": 207488, "epoch": 1714} {"train_loss": -40.39188766479492, "global_step": 207489, "epoch": 1714} {"train_loss": -41.07315444946289, "global_step": 207490, "epoch": 1714} {"train_loss": -41.02745819091797, "global_step": 207491, "epoch": 1714} {"train_loss": -40.991676330566406, "global_step": 207492, "epoch": 1714} {"train_loss": -41.049129486083984, "global_step": 207493, "epoch": 1714} {"train_loss": -40.32155990600586, "global_step": 207494, "epoch": 1714} {"train_loss": -41.806060791015625, "global_step": 207495, "epoch": 1714} {"train_loss": -39.211910247802734, "global_step": 207496, "epoch": 1714} {"train_loss": -41.63016128540039, "global_step": 207497, "epoch": 1714} {"train_loss": -40.42280197143555, "global_step": 207498, "epoch": 1714} {"train_loss": -40.066070556640625, "global_step": 207499, "epoch": 1714} {"train_loss": -41.49016571044922, "global_step": 207500, "epoch": 1714} {"train_loss": -39.2002067565918, "global_step": 207501, "epoch": 1714} {"train_loss": -39.672237396240234, "global_step": 207502, "epoch": 1714} {"train_loss": -40.48571014404297, "global_step": 207503, "epoch": 1714} {"train_loss": -38.99586868286133, "global_step": 207504, "epoch": 1714} {"train_loss": -40.213890075683594, "global_step": 207505, "epoch": 1714} {"train_loss": -37.884681701660156, "global_step": 207506, "epoch": 1714} {"train_loss": -40.463993072509766, "global_step": 207507, "epoch": 1714} {"train_loss": -40.796688079833984, "global_step": 207508, "epoch": 1714} {"train_loss": -40.868141174316406, "global_step": 207509, "epoch": 1714} {"train_loss": -40.46586227416992, "global_step": 207510, "epoch": 1714} {"train_loss": -41.346092224121094, "global_step": 207511, "epoch": 1714} {"train_loss": -40.66312789916992, "global_step": 207512, "epoch": 1714} {"train_loss": -40.30310821533203, "global_step": 207513, "epoch": 1714} {"train_loss": -40.2141513982095, "global_step": 207514, "epoch": 1714, "val_loss": 2616920.25} {"train_loss": -40.74045944213867, "global_step": 207515, "epoch": 1715} {"train_loss": -39.96812057495117, "global_step": 207516, "epoch": 1715} {"train_loss": -40.84931564331055, "global_step": 207517, "epoch": 1715} {"train_loss": -41.759700775146484, "global_step": 207518, "epoch": 1715} {"train_loss": -39.178741455078125, "global_step": 207519, "epoch": 1715} {"train_loss": -39.065711975097656, "global_step": 207520, "epoch": 1715} {"train_loss": -41.6733512878418, "global_step": 207521, "epoch": 1715} {"train_loss": -39.9978141784668, "global_step": 207522, "epoch": 1715} {"train_loss": -39.67437744140625, "global_step": 207523, "epoch": 1715} {"train_loss": -41.80104446411133, "global_step": 207524, "epoch": 1715} {"train_loss": -40.612911224365234, "global_step": 207525, "epoch": 1715} {"train_loss": -39.66721725463867, "global_step": 207526, "epoch": 1715} {"train_loss": -39.95699691772461, "global_step": 207527, "epoch": 1715} {"train_loss": -41.435630798339844, "global_step": 207528, "epoch": 1715} {"train_loss": -41.09489059448242, "global_step": 207529, "epoch": 1715} {"train_loss": -41.21744918823242, "global_step": 207530, "epoch": 1715} {"train_loss": -40.513763427734375, "global_step": 207531, "epoch": 1715} {"train_loss": -40.76234436035156, "global_step": 207532, "epoch": 1715} {"train_loss": -40.58462905883789, "global_step": 207533, "epoch": 1715} {"train_loss": -41.11810302734375, "global_step": 207534, "epoch": 1715} {"train_loss": -41.67463684082031, "global_step": 207535, "epoch": 1715} {"train_loss": -41.5060920715332, "global_step": 207536, "epoch": 1715} {"train_loss": -41.5205192565918, "global_step": 207537, "epoch": 1715} {"train_loss": -41.22022247314453, "global_step": 207538, "epoch": 1715} {"train_loss": -41.42777633666992, "global_step": 207539, "epoch": 1715} {"train_loss": -41.57073974609375, "global_step": 207540, "epoch": 1715} {"train_loss": -40.741355895996094, "global_step": 207541, "epoch": 1715} {"train_loss": -42.47763442993164, "global_step": 207542, "epoch": 1715} {"train_loss": -41.401031494140625, "global_step": 207543, "epoch": 1715} {"train_loss": -41.563995361328125, "global_step": 207544, "epoch": 1715} {"train_loss": -40.52049255371094, "global_step": 207545, "epoch": 1715} {"train_loss": -41.77619552612305, "global_step": 207546, "epoch": 1715} {"train_loss": -41.847450256347656, "global_step": 207547, "epoch": 1715} {"train_loss": -42.08169937133789, "global_step": 207548, "epoch": 1715} {"train_loss": -41.88539505004883, "global_step": 207549, "epoch": 1715} {"train_loss": -41.93586730957031, "global_step": 207550, "epoch": 1715} {"train_loss": -37.73783874511719, "global_step": 207551, "epoch": 1715} {"train_loss": -42.1263427734375, "global_step": 207552, "epoch": 1715} {"train_loss": -41.167457580566406, "global_step": 207553, "epoch": 1715} {"train_loss": -40.5269775390625, "global_step": 207554, "epoch": 1715} {"train_loss": -42.254722595214844, "global_step": 207555, "epoch": 1715} {"train_loss": -41.644081115722656, "global_step": 207556, "epoch": 1715} {"train_loss": -41.64472579956055, "global_step": 207557, "epoch": 1715} {"train_loss": -41.41231155395508, "global_step": 207558, "epoch": 1715} {"train_loss": -40.73690414428711, "global_step": 207559, "epoch": 1715} {"train_loss": -42.11091232299805, "global_step": 207560, "epoch": 1715} {"train_loss": -41.9114990234375, "global_step": 207561, "epoch": 1715} {"train_loss": -42.112457275390625, "global_step": 207562, "epoch": 1715} {"train_loss": -41.381622314453125, "global_step": 207563, "epoch": 1715} {"train_loss": -41.10272979736328, "global_step": 207564, "epoch": 1715} {"train_loss": -42.76936721801758, "global_step": 207565, "epoch": 1715} {"train_loss": -42.19868469238281, "global_step": 207566, "epoch": 1715} {"train_loss": -42.205684661865234, "global_step": 207567, "epoch": 1715} {"train_loss": -42.05179977416992, "global_step": 207568, "epoch": 1715} {"train_loss": -42.35770797729492, "global_step": 207569, "epoch": 1715} {"train_loss": -42.61281967163086, "global_step": 207570, "epoch": 1715} {"train_loss": -42.1791877746582, "global_step": 207571, "epoch": 1715} {"train_loss": -41.890071868896484, "global_step": 207572, "epoch": 1715} {"train_loss": -41.9903678894043, "global_step": 207573, "epoch": 1715} {"train_loss": -42.14039611816406, "global_step": 207574, "epoch": 1715} {"train_loss": -42.210487365722656, "global_step": 207575, "epoch": 1715} {"train_loss": -42.447723388671875, "global_step": 207576, "epoch": 1715} {"train_loss": -41.207122802734375, "global_step": 207577, "epoch": 1715} {"train_loss": -42.833343505859375, "global_step": 207578, "epoch": 1715} {"train_loss": -42.13773727416992, "global_step": 207579, "epoch": 1715} {"train_loss": -42.42637634277344, "global_step": 207580, "epoch": 1715} {"train_loss": -41.32830810546875, "global_step": 207581, "epoch": 1715} {"train_loss": -41.23927688598633, "global_step": 207582, "epoch": 1715} {"train_loss": -42.543067932128906, "global_step": 207583, "epoch": 1715} {"train_loss": -42.105709075927734, "global_step": 207584, "epoch": 1715} {"train_loss": -42.6677360534668, "global_step": 207585, "epoch": 1715} {"train_loss": -42.699886322021484, "global_step": 207586, "epoch": 1715} {"train_loss": -42.71369552612305, "global_step": 207587, "epoch": 1715} {"train_loss": -42.54121780395508, "global_step": 207588, "epoch": 1715} {"train_loss": -42.2502555847168, "global_step": 207589, "epoch": 1715} {"train_loss": -40.866886138916016, "global_step": 207590, "epoch": 1715} {"train_loss": -41.79777526855469, "global_step": 207591, "epoch": 1715} {"train_loss": -42.068172454833984, "global_step": 207592, "epoch": 1715} {"train_loss": -42.33893966674805, "global_step": 207593, "epoch": 1715} {"train_loss": -42.28068161010742, "global_step": 207594, "epoch": 1715} {"train_loss": -41.56161880493164, "global_step": 207595, "epoch": 1715} {"train_loss": -42.24924087524414, "global_step": 207596, "epoch": 1715} {"train_loss": -41.52838134765625, "global_step": 207597, "epoch": 1715} {"train_loss": -41.91165542602539, "global_step": 207598, "epoch": 1715} {"train_loss": -41.58687973022461, "global_step": 207599, "epoch": 1715} {"train_loss": -41.27692794799805, "global_step": 207600, "epoch": 1715} {"train_loss": -41.6035270690918, "global_step": 207601, "epoch": 1715} {"train_loss": -41.9378662109375, "global_step": 207602, "epoch": 1715} {"train_loss": -41.70132064819336, "global_step": 207603, "epoch": 1715} {"train_loss": -41.5609130859375, "global_step": 207604, "epoch": 1715} {"train_loss": -39.59392166137695, "global_step": 207605, "epoch": 1715} {"train_loss": -39.475276947021484, "global_step": 207606, "epoch": 1715} {"train_loss": -39.74275588989258, "global_step": 207607, "epoch": 1715} {"train_loss": -40.07574462890625, "global_step": 207608, "epoch": 1715} {"train_loss": -38.79229736328125, "global_step": 207609, "epoch": 1715} {"train_loss": -37.68748474121094, "global_step": 207610, "epoch": 1715} {"train_loss": -35.64775466918945, "global_step": 207611, "epoch": 1715} {"train_loss": -40.20374298095703, "global_step": 207612, "epoch": 1715} {"train_loss": -37.57696533203125, "global_step": 207613, "epoch": 1715} {"train_loss": -40.362545013427734, "global_step": 207614, "epoch": 1715} {"train_loss": -40.18294906616211, "global_step": 207615, "epoch": 1715} {"train_loss": -38.73026657104492, "global_step": 207616, "epoch": 1715} {"train_loss": -39.650390625, "global_step": 207617, "epoch": 1715} {"train_loss": -38.760250091552734, "global_step": 207618, "epoch": 1715} {"train_loss": -41.18532943725586, "global_step": 207619, "epoch": 1715} {"train_loss": -39.64276123046875, "global_step": 207620, "epoch": 1715} {"train_loss": -39.308204650878906, "global_step": 207621, "epoch": 1715} {"train_loss": -40.24666976928711, "global_step": 207622, "epoch": 1715} {"train_loss": -40.86817169189453, "global_step": 207623, "epoch": 1715} {"train_loss": -40.357444763183594, "global_step": 207624, "epoch": 1715} {"train_loss": -40.757164001464844, "global_step": 207625, "epoch": 1715} {"train_loss": -40.840003967285156, "global_step": 207626, "epoch": 1715} {"train_loss": -39.72661209106445, "global_step": 207627, "epoch": 1715} {"train_loss": -40.743995666503906, "global_step": 207628, "epoch": 1715} {"train_loss": -40.9273796081543, "global_step": 207629, "epoch": 1715} {"train_loss": -40.92609786987305, "global_step": 207630, "epoch": 1715} {"train_loss": -40.2801628112793, "global_step": 207631, "epoch": 1715} {"train_loss": -41.52913284301758, "global_step": 207632, "epoch": 1715} {"train_loss": -41.25973129272461, "global_step": 207633, "epoch": 1715} {"train_loss": -41.462032318115234, "global_step": 207634, "epoch": 1715} {"train_loss": -41.11084249196959, "global_step": 207635, "epoch": 1715, "val_loss": 2638928.0} {"train_loss": -41.2846794128418, "global_step": 207636, "epoch": 1716} {"train_loss": -40.98318099975586, "global_step": 207637, "epoch": 1716} {"train_loss": -41.35856628417969, "global_step": 207638, "epoch": 1716} {"train_loss": -41.20500946044922, "global_step": 207639, "epoch": 1716} {"train_loss": -41.057891845703125, "global_step": 207640, "epoch": 1716} {"train_loss": -41.5187873840332, "global_step": 207641, "epoch": 1716} {"train_loss": -41.80128479003906, "global_step": 207642, "epoch": 1716} {"train_loss": -41.096553802490234, "global_step": 207643, "epoch": 1716} {"train_loss": -40.7288703918457, "global_step": 207644, "epoch": 1716} {"train_loss": -41.96369552612305, "global_step": 207645, "epoch": 1716} {"train_loss": -41.46192169189453, "global_step": 207646, "epoch": 1716} {"train_loss": -41.353206634521484, "global_step": 207647, "epoch": 1716} {"train_loss": -41.732662200927734, "global_step": 207648, "epoch": 1716} {"train_loss": -41.520992279052734, "global_step": 207649, "epoch": 1716} {"train_loss": -40.92418670654297, "global_step": 207650, "epoch": 1716} {"train_loss": -40.6928825378418, "global_step": 207651, "epoch": 1716} {"train_loss": -40.21028518676758, "global_step": 207652, "epoch": 1716} {"train_loss": -41.42011260986328, "global_step": 207653, "epoch": 1716} {"train_loss": -41.649925231933594, "global_step": 207654, "epoch": 1716} {"train_loss": -41.8268928527832, "global_step": 207655, "epoch": 1716} {"train_loss": -42.200355529785156, "global_step": 207656, "epoch": 1716} {"train_loss": -41.68928527832031, "global_step": 207657, "epoch": 1716} {"train_loss": -41.86619567871094, "global_step": 207658, "epoch": 1716} {"train_loss": -41.72334671020508, "global_step": 207659, "epoch": 1716} {"train_loss": -41.92658996582031, "global_step": 207660, "epoch": 1716} {"train_loss": -42.227394104003906, "global_step": 207661, "epoch": 1716} {"train_loss": -41.96123123168945, "global_step": 207662, "epoch": 1716} {"train_loss": -39.937129974365234, "global_step": 207663, "epoch": 1716} {"train_loss": -40.578365325927734, "global_step": 207664, "epoch": 1716} {"train_loss": -39.008331298828125, "global_step": 207665, "epoch": 1716} {"train_loss": -41.56890106201172, "global_step": 207666, "epoch": 1716} {"train_loss": -38.85723876953125, "global_step": 207667, "epoch": 1716} {"train_loss": -41.72052001953125, "global_step": 207668, "epoch": 1716} {"train_loss": -39.646339416503906, "global_step": 207669, "epoch": 1716} {"train_loss": -41.71230697631836, "global_step": 207670, "epoch": 1716} {"train_loss": -40.37205123901367, "global_step": 207671, "epoch": 1716} {"train_loss": -42.00115203857422, "global_step": 207672, "epoch": 1716} {"train_loss": -42.0416259765625, "global_step": 207673, "epoch": 1716} {"train_loss": -40.637386322021484, "global_step": 207674, "epoch": 1716} {"train_loss": -41.67708969116211, "global_step": 207675, "epoch": 1716} {"train_loss": -40.806331634521484, "global_step": 207676, "epoch": 1716} {"train_loss": -41.93781280517578, "global_step": 207677, "epoch": 1716} {"train_loss": -42.11238479614258, "global_step": 207678, "epoch": 1716} {"train_loss": -41.0655632019043, "global_step": 207679, "epoch": 1716} {"train_loss": -42.477230072021484, "global_step": 207680, "epoch": 1716} {"train_loss": -41.7088623046875, "global_step": 207681, "epoch": 1716} {"train_loss": -41.80172348022461, "global_step": 207682, "epoch": 1716} {"train_loss": -40.920650482177734, "global_step": 207683, "epoch": 1716} {"train_loss": -42.332645416259766, "global_step": 207684, "epoch": 1716} {"train_loss": -41.332298278808594, "global_step": 207685, "epoch": 1716} {"train_loss": -41.981353759765625, "global_step": 207686, "epoch": 1716} {"train_loss": -42.10828399658203, "global_step": 207687, "epoch": 1716} {"train_loss": -42.39936065673828, "global_step": 207688, "epoch": 1716} {"train_loss": -40.96216583251953, "global_step": 207689, "epoch": 1716} {"train_loss": -41.51637649536133, "global_step": 207690, "epoch": 1716} {"train_loss": -40.920494079589844, "global_step": 207691, "epoch": 1716} {"train_loss": -42.09876251220703, "global_step": 207692, "epoch": 1716} {"train_loss": -42.10622024536133, "global_step": 207693, "epoch": 1716} {"train_loss": -43.0916748046875, "global_step": 207694, "epoch": 1716} {"train_loss": -41.97756576538086, "global_step": 207695, "epoch": 1716} {"train_loss": -42.3516845703125, "global_step": 207696, "epoch": 1716} {"train_loss": -42.001705169677734, "global_step": 207697, "epoch": 1716} {"train_loss": -42.778045654296875, "global_step": 207698, "epoch": 1716} {"train_loss": -42.56135177612305, "global_step": 207699, "epoch": 1716} {"train_loss": -41.9706916809082, "global_step": 207700, "epoch": 1716} {"train_loss": -42.0135498046875, "global_step": 207701, "epoch": 1716} {"train_loss": -41.65546798706055, "global_step": 207702, "epoch": 1716} {"train_loss": -37.5241813659668, "global_step": 207703, "epoch": 1716} {"train_loss": -42.27067184448242, "global_step": 207704, "epoch": 1716} {"train_loss": -42.5657958984375, "global_step": 207705, "epoch": 1716} {"train_loss": -41.508140563964844, "global_step": 207706, "epoch": 1716} {"train_loss": -39.406681060791016, "global_step": 207707, "epoch": 1716} {"train_loss": -40.48830795288086, "global_step": 207708, "epoch": 1716} {"train_loss": -40.85285568237305, "global_step": 207709, "epoch": 1716} {"train_loss": -41.58822250366211, "global_step": 207710, "epoch": 1716} {"train_loss": -42.61906433105469, "global_step": 207711, "epoch": 1716} {"train_loss": -40.941280364990234, "global_step": 207712, "epoch": 1716} {"train_loss": -40.578697204589844, "global_step": 207713, "epoch": 1716} {"train_loss": -37.99717330932617, "global_step": 207714, "epoch": 1716} {"train_loss": -41.16814422607422, "global_step": 207715, "epoch": 1716} {"train_loss": -41.54207992553711, "global_step": 207716, "epoch": 1716} {"train_loss": -41.108394622802734, "global_step": 207717, "epoch": 1716} {"train_loss": -40.60499572753906, "global_step": 207718, "epoch": 1716} {"train_loss": -40.20756149291992, "global_step": 207719, "epoch": 1716} {"train_loss": -39.66347885131836, "global_step": 207720, "epoch": 1716} {"train_loss": -40.11821365356445, "global_step": 207721, "epoch": 1716} {"train_loss": -39.393550872802734, "global_step": 207722, "epoch": 1716} {"train_loss": -40.055397033691406, "global_step": 207723, "epoch": 1716} {"train_loss": -39.721351623535156, "global_step": 207724, "epoch": 1716} {"train_loss": -38.104248046875, "global_step": 207725, "epoch": 1716} {"train_loss": -37.719417572021484, "global_step": 207726, "epoch": 1716} {"train_loss": -33.98662567138672, "global_step": 207727, "epoch": 1716} {"train_loss": -33.84724807739258, "global_step": 207728, "epoch": 1716} {"train_loss": -37.82444381713867, "global_step": 207729, "epoch": 1716} {"train_loss": -40.53652572631836, "global_step": 207730, "epoch": 1716} {"train_loss": -37.771663665771484, "global_step": 207731, "epoch": 1716} {"train_loss": -38.66775131225586, "global_step": 207732, "epoch": 1716} {"train_loss": -39.942787170410156, "global_step": 207733, "epoch": 1716} {"train_loss": -39.33594512939453, "global_step": 207734, "epoch": 1716} {"train_loss": -40.768310546875, "global_step": 207735, "epoch": 1716} {"train_loss": -38.26493453979492, "global_step": 207736, "epoch": 1716} {"train_loss": -39.325523376464844, "global_step": 207737, "epoch": 1716} {"train_loss": -40.595489501953125, "global_step": 207738, "epoch": 1716} {"train_loss": -41.153594970703125, "global_step": 207739, "epoch": 1716} {"train_loss": -40.731319427490234, "global_step": 207740, "epoch": 1716} {"train_loss": -41.658260345458984, "global_step": 207741, "epoch": 1716} {"train_loss": -40.798824310302734, "global_step": 207742, "epoch": 1716} {"train_loss": -39.59820556640625, "global_step": 207743, "epoch": 1716} {"train_loss": -40.55860900878906, "global_step": 207744, "epoch": 1716} {"train_loss": -40.901485443115234, "global_step": 207745, "epoch": 1716} {"train_loss": -39.90796661376953, "global_step": 207746, "epoch": 1716} {"train_loss": -40.1171760559082, "global_step": 207747, "epoch": 1716} {"train_loss": -41.12366485595703, "global_step": 207748, "epoch": 1716} {"train_loss": -41.31246566772461, "global_step": 207749, "epoch": 1716} {"train_loss": -41.60010528564453, "global_step": 207750, "epoch": 1716} {"train_loss": -40.696083068847656, "global_step": 207751, "epoch": 1716} {"train_loss": -41.51947021484375, "global_step": 207752, "epoch": 1716} {"train_loss": -41.207698822021484, "global_step": 207753, "epoch": 1716} {"train_loss": -42.27415084838867, "global_step": 207754, "epoch": 1716} {"train_loss": -37.78945541381836, "global_step": 207755, "epoch": 1716} {"train_loss": -40.852879011926575, "global_step": 207756, "epoch": 1716, "val_loss": 2498143.75} {"train_loss": -41.895660400390625, "global_step": 207757, "epoch": 1717} {"train_loss": -41.622779846191406, "global_step": 207758, "epoch": 1717} {"train_loss": -39.92597198486328, "global_step": 207759, "epoch": 1717} {"train_loss": -41.940895080566406, "global_step": 207760, "epoch": 1717} {"train_loss": -41.69080352783203, "global_step": 207761, "epoch": 1717} {"train_loss": -41.15285110473633, "global_step": 207762, "epoch": 1717} {"train_loss": -41.693946838378906, "global_step": 207763, "epoch": 1717} {"train_loss": -41.1472053527832, "global_step": 207764, "epoch": 1717} {"train_loss": -40.39039993286133, "global_step": 207765, "epoch": 1717} {"train_loss": -41.76567077636719, "global_step": 207766, "epoch": 1717} {"train_loss": -38.82368087768555, "global_step": 207767, "epoch": 1717} {"train_loss": -39.304298400878906, "global_step": 207768, "epoch": 1717} {"train_loss": -41.06159591674805, "global_step": 207769, "epoch": 1717} {"train_loss": -40.81908416748047, "global_step": 207770, "epoch": 1717} {"train_loss": -40.6953239440918, "global_step": 207771, "epoch": 1717} {"train_loss": -38.74605941772461, "global_step": 207772, "epoch": 1717} {"train_loss": -39.336700439453125, "global_step": 207773, "epoch": 1717} {"train_loss": -40.88873291015625, "global_step": 207774, "epoch": 1717} {"train_loss": -32.373714447021484, "global_step": 207775, "epoch": 1717} {"train_loss": -39.87673568725586, "global_step": 207776, "epoch": 1717} {"train_loss": -40.109642028808594, "global_step": 207777, "epoch": 1717} {"train_loss": -40.3254508972168, "global_step": 207778, "epoch": 1717} {"train_loss": -37.84176254272461, "global_step": 207779, "epoch": 1717} {"train_loss": -31.95404624938965, "global_step": 207780, "epoch": 1717} {"train_loss": -36.42682647705078, "global_step": 207781, "epoch": 1717} {"train_loss": -37.434791564941406, "global_step": 207782, "epoch": 1717} {"train_loss": -38.15803146362305, "global_step": 207783, "epoch": 1717} {"train_loss": -40.19056701660156, "global_step": 207784, "epoch": 1717} {"train_loss": -39.0535774230957, "global_step": 207785, "epoch": 1717} {"train_loss": -40.65977096557617, "global_step": 207786, "epoch": 1717} {"train_loss": -39.12771224975586, "global_step": 207787, "epoch": 1717} {"train_loss": -39.7834358215332, "global_step": 207788, "epoch": 1717} {"train_loss": -37.57731246948242, "global_step": 207789, "epoch": 1717} {"train_loss": -38.383888244628906, "global_step": 207790, "epoch": 1717} {"train_loss": -38.28514862060547, "global_step": 207791, "epoch": 1717} {"train_loss": -38.960479736328125, "global_step": 207792, "epoch": 1717} {"train_loss": -39.17900466918945, "global_step": 207793, "epoch": 1717} {"train_loss": -39.585960388183594, "global_step": 207794, "epoch": 1717} {"train_loss": -40.526363372802734, "global_step": 207795, "epoch": 1717} {"train_loss": -38.645416259765625, "global_step": 207796, "epoch": 1717} {"train_loss": -38.629940032958984, "global_step": 207797, "epoch": 1717} {"train_loss": -39.90983963012695, "global_step": 207798, "epoch": 1717} {"train_loss": -38.67778396606445, "global_step": 207799, "epoch": 1717} {"train_loss": -39.887081146240234, "global_step": 207800, "epoch": 1717} {"train_loss": -40.43084716796875, "global_step": 207801, "epoch": 1717} {"train_loss": -39.72058868408203, "global_step": 207802, "epoch": 1717} {"train_loss": -39.723670959472656, "global_step": 207803, "epoch": 1717} {"train_loss": -39.8565559387207, "global_step": 207804, "epoch": 1717} {"train_loss": -40.30239486694336, "global_step": 207805, "epoch": 1717} {"train_loss": -40.53115463256836, "global_step": 207806, "epoch": 1717} {"train_loss": -40.01336669921875, "global_step": 207807, "epoch": 1717} {"train_loss": -39.807533264160156, "global_step": 207808, "epoch": 1717} {"train_loss": -40.775020599365234, "global_step": 207809, "epoch": 1717} {"train_loss": -41.07089614868164, "global_step": 207810, "epoch": 1717} {"train_loss": -38.557289123535156, "global_step": 207811, "epoch": 1717} {"train_loss": -40.654335021972656, "global_step": 207812, "epoch": 1717} {"train_loss": -41.47993087768555, "global_step": 207813, "epoch": 1717} {"train_loss": -41.270389556884766, "global_step": 207814, "epoch": 1717} {"train_loss": -39.18801498413086, "global_step": 207815, "epoch": 1717} {"train_loss": -39.864532470703125, "global_step": 207816, "epoch": 1717} {"train_loss": -41.51261901855469, "global_step": 207817, "epoch": 1717} {"train_loss": -41.38399887084961, "global_step": 207818, "epoch": 1717} {"train_loss": -40.93259811401367, "global_step": 207819, "epoch": 1717} {"train_loss": -41.188114166259766, "global_step": 207820, "epoch": 1717} {"train_loss": -41.236602783203125, "global_step": 207821, "epoch": 1717} {"train_loss": -41.55267333984375, "global_step": 207822, "epoch": 1717} {"train_loss": -41.063961029052734, "global_step": 207823, "epoch": 1717} {"train_loss": -40.844295501708984, "global_step": 207824, "epoch": 1717} {"train_loss": -41.594783782958984, "global_step": 207825, "epoch": 1717} {"train_loss": -41.42143630981445, "global_step": 207826, "epoch": 1717} {"train_loss": -41.581783294677734, "global_step": 207827, "epoch": 1717} {"train_loss": -41.677425384521484, "global_step": 207828, "epoch": 1717} {"train_loss": -41.54228210449219, "global_step": 207829, "epoch": 1717} {"train_loss": -42.06553268432617, "global_step": 207830, "epoch": 1717} {"train_loss": -41.87937545776367, "global_step": 207831, "epoch": 1717} {"train_loss": -40.709381103515625, "global_step": 207832, "epoch": 1717} {"train_loss": -40.680110931396484, "global_step": 207833, "epoch": 1717} {"train_loss": -42.237159729003906, "global_step": 207834, "epoch": 1717} {"train_loss": -41.5638542175293, "global_step": 207835, "epoch": 1717} {"train_loss": -40.505096435546875, "global_step": 207836, "epoch": 1717} {"train_loss": -41.95502853393555, "global_step": 207837, "epoch": 1717} {"train_loss": -41.67539596557617, "global_step": 207838, "epoch": 1717} {"train_loss": -42.22959518432617, "global_step": 207839, "epoch": 1717} {"train_loss": -42.23237991333008, "global_step": 207840, "epoch": 1717} {"train_loss": -42.12276840209961, "global_step": 207841, "epoch": 1717} {"train_loss": -42.32014846801758, "global_step": 207842, "epoch": 1717} {"train_loss": -41.85224533081055, "global_step": 207843, "epoch": 1717} {"train_loss": -42.44769287109375, "global_step": 207844, "epoch": 1717} {"train_loss": -41.564544677734375, "global_step": 207845, "epoch": 1717} {"train_loss": -42.0415153503418, "global_step": 207846, "epoch": 1717} {"train_loss": -42.23085403442383, "global_step": 207847, "epoch": 1717} {"train_loss": -41.30419158935547, "global_step": 207848, "epoch": 1717} {"train_loss": -39.88310623168945, "global_step": 207849, "epoch": 1717} {"train_loss": -41.98511505126953, "global_step": 207850, "epoch": 1717} {"train_loss": -42.0909423828125, "global_step": 207851, "epoch": 1717} {"train_loss": -42.602718353271484, "global_step": 207852, "epoch": 1717} {"train_loss": -41.55315399169922, "global_step": 207853, "epoch": 1717} {"train_loss": -42.03638458251953, "global_step": 207854, "epoch": 1717} {"train_loss": -41.04854965209961, "global_step": 207855, "epoch": 1717} {"train_loss": -42.44853973388672, "global_step": 207856, "epoch": 1717} {"train_loss": -41.981502532958984, "global_step": 207857, "epoch": 1717} {"train_loss": -41.7567253112793, "global_step": 207858, "epoch": 1717} {"train_loss": -40.324886322021484, "global_step": 207859, "epoch": 1717} {"train_loss": -41.462371826171875, "global_step": 207860, "epoch": 1717} {"train_loss": -41.94655990600586, "global_step": 207861, "epoch": 1717} {"train_loss": -42.51235580444336, "global_step": 207862, "epoch": 1717} {"train_loss": -41.08710861206055, "global_step": 207863, "epoch": 1717} {"train_loss": -41.6915397644043, "global_step": 207864, "epoch": 1717} {"train_loss": -41.568363189697266, "global_step": 207865, "epoch": 1717} {"train_loss": -41.66740036010742, "global_step": 207866, "epoch": 1717} {"train_loss": -41.24699783325195, "global_step": 207867, "epoch": 1717} {"train_loss": -39.89076614379883, "global_step": 207868, "epoch": 1717} {"train_loss": -39.13230514526367, "global_step": 207869, "epoch": 1717} {"train_loss": -37.69143295288086, "global_step": 207870, "epoch": 1717} {"train_loss": -38.365211486816406, "global_step": 207871, "epoch": 1717} {"train_loss": -38.69987106323242, "global_step": 207872, "epoch": 1717} {"train_loss": -41.017608642578125, "global_step": 207873, "epoch": 1717} {"train_loss": -41.66686248779297, "global_step": 207874, "epoch": 1717} {"train_loss": -40.03068161010742, "global_step": 207875, "epoch": 1717} {"train_loss": -40.69706344604492, "global_step": 207876, "epoch": 1717} {"train_loss": -40.483375785764586, "global_step": 207877, "epoch": 1717, "val_loss": 2558436.0} {"train_loss": -41.42991256713867, "global_step": 207878, "epoch": 1718} {"train_loss": -41.72101593017578, "global_step": 207879, "epoch": 1718} {"train_loss": -41.32680892944336, "global_step": 207880, "epoch": 1718} {"train_loss": -40.92345428466797, "global_step": 207881, "epoch": 1718} {"train_loss": -41.99748229980469, "global_step": 207882, "epoch": 1718} {"train_loss": -42.00138473510742, "global_step": 207883, "epoch": 1718} {"train_loss": -41.456336975097656, "global_step": 207884, "epoch": 1718} {"train_loss": -41.88040542602539, "global_step": 207885, "epoch": 1718} {"train_loss": -41.73459243774414, "global_step": 207886, "epoch": 1718} {"train_loss": -40.89821243286133, "global_step": 207887, "epoch": 1718} {"train_loss": -41.54774856567383, "global_step": 207888, "epoch": 1718} {"train_loss": -41.191043853759766, "global_step": 207889, "epoch": 1718} {"train_loss": -41.65887451171875, "global_step": 207890, "epoch": 1718} {"train_loss": -41.617042541503906, "global_step": 207891, "epoch": 1718} {"train_loss": -40.45020294189453, "global_step": 207892, "epoch": 1718} {"train_loss": -40.94069290161133, "global_step": 207893, "epoch": 1718} {"train_loss": -41.5745849609375, "global_step": 207894, "epoch": 1718} {"train_loss": -42.0733642578125, "global_step": 207895, "epoch": 1718} {"train_loss": -40.29668045043945, "global_step": 207896, "epoch": 1718} {"train_loss": -40.8766975402832, "global_step": 207897, "epoch": 1718} {"train_loss": -41.72426986694336, "global_step": 207898, "epoch": 1718} {"train_loss": -39.5446891784668, "global_step": 207899, "epoch": 1718} {"train_loss": -39.46040344238281, "global_step": 207900, "epoch": 1718} {"train_loss": -41.952110290527344, "global_step": 207901, "epoch": 1718} {"train_loss": -40.63906478881836, "global_step": 207902, "epoch": 1718} {"train_loss": -37.188507080078125, "global_step": 207903, "epoch": 1718} {"train_loss": -39.56961441040039, "global_step": 207904, "epoch": 1718} {"train_loss": -40.974910736083984, "global_step": 207905, "epoch": 1718} {"train_loss": -41.16656494140625, "global_step": 207906, "epoch": 1718} {"train_loss": -40.048885345458984, "global_step": 207907, "epoch": 1718} {"train_loss": -39.99644470214844, "global_step": 207908, "epoch": 1718} {"train_loss": -37.79085159301758, "global_step": 207909, "epoch": 1718} {"train_loss": -37.192928314208984, "global_step": 207910, "epoch": 1718} {"train_loss": -41.28762435913086, "global_step": 207911, "epoch": 1718} {"train_loss": -39.31280517578125, "global_step": 207912, "epoch": 1718} {"train_loss": -38.891326904296875, "global_step": 207913, "epoch": 1718} {"train_loss": -38.78138732910156, "global_step": 207914, "epoch": 1718} {"train_loss": -39.34579086303711, "global_step": 207915, "epoch": 1718} {"train_loss": -36.583091735839844, "global_step": 207916, "epoch": 1718} {"train_loss": -38.04824447631836, "global_step": 207917, "epoch": 1718} {"train_loss": -39.96445846557617, "global_step": 207918, "epoch": 1718} {"train_loss": -40.57902908325195, "global_step": 207919, "epoch": 1718} {"train_loss": -37.46474075317383, "global_step": 207920, "epoch": 1718} {"train_loss": -40.15228271484375, "global_step": 207921, "epoch": 1718} {"train_loss": -30.521484375, "global_step": 207922, "epoch": 1718} {"train_loss": -40.05474853515625, "global_step": 207923, "epoch": 1718} {"train_loss": -38.574520111083984, "global_step": 207924, "epoch": 1718} {"train_loss": -35.71763229370117, "global_step": 207925, "epoch": 1718} {"train_loss": -41.113182067871094, "global_step": 207926, "epoch": 1718} {"train_loss": -39.71316909790039, "global_step": 207927, "epoch": 1718} {"train_loss": -40.2779541015625, "global_step": 207928, "epoch": 1718} {"train_loss": -36.717342376708984, "global_step": 207929, "epoch": 1718} {"train_loss": -36.076534271240234, "global_step": 207930, "epoch": 1718} {"train_loss": -36.151939392089844, "global_step": 207931, "epoch": 1718} {"train_loss": -38.522972106933594, "global_step": 207932, "epoch": 1718} {"train_loss": -31.726181030273438, "global_step": 207933, "epoch": 1718} {"train_loss": -40.18471145629883, "global_step": 207934, "epoch": 1718} {"train_loss": -35.42841339111328, "global_step": 207935, "epoch": 1718} {"train_loss": -38.91062545776367, "global_step": 207936, "epoch": 1718} {"train_loss": -40.299617767333984, "global_step": 207937, "epoch": 1718} {"train_loss": -39.35610580444336, "global_step": 207938, "epoch": 1718} {"train_loss": -38.47749710083008, "global_step": 207939, "epoch": 1718} {"train_loss": -39.49677658081055, "global_step": 207940, "epoch": 1718} {"train_loss": -36.667354583740234, "global_step": 207941, "epoch": 1718} {"train_loss": -38.14545440673828, "global_step": 207942, "epoch": 1718} {"train_loss": -39.3177490234375, "global_step": 207943, "epoch": 1718} {"train_loss": -38.353904724121094, "global_step": 207944, "epoch": 1718} {"train_loss": -38.99271011352539, "global_step": 207945, "epoch": 1718} {"train_loss": -33.047767639160156, "global_step": 207946, "epoch": 1718} {"train_loss": -39.18001937866211, "global_step": 207947, "epoch": 1718} {"train_loss": -38.040794372558594, "global_step": 207948, "epoch": 1718} {"train_loss": -39.0872917175293, "global_step": 207949, "epoch": 1718} {"train_loss": -39.78278732299805, "global_step": 207950, "epoch": 1718} {"train_loss": -39.83170700073242, "global_step": 207951, "epoch": 1718} {"train_loss": -39.50115203857422, "global_step": 207952, "epoch": 1718} {"train_loss": -39.87089920043945, "global_step": 207953, "epoch": 1718} {"train_loss": -40.0402717590332, "global_step": 207954, "epoch": 1718} {"train_loss": -39.558956146240234, "global_step": 207955, "epoch": 1718} {"train_loss": -39.04279327392578, "global_step": 207956, "epoch": 1718} {"train_loss": -38.67999267578125, "global_step": 207957, "epoch": 1718} {"train_loss": -40.985694885253906, "global_step": 207958, "epoch": 1718} {"train_loss": -39.141910552978516, "global_step": 207959, "epoch": 1718} {"train_loss": -38.427711486816406, "global_step": 207960, "epoch": 1718} {"train_loss": -39.43989944458008, "global_step": 207961, "epoch": 1718} {"train_loss": -39.01784896850586, "global_step": 207962, "epoch": 1718} {"train_loss": -37.624969482421875, "global_step": 207963, "epoch": 1718} {"train_loss": -38.3598518371582, "global_step": 207964, "epoch": 1718} {"train_loss": -37.911895751953125, "global_step": 207965, "epoch": 1718} {"train_loss": -40.87091064453125, "global_step": 207966, "epoch": 1718} {"train_loss": -37.629066467285156, "global_step": 207967, "epoch": 1718} {"train_loss": -39.485565185546875, "global_step": 207968, "epoch": 1718} {"train_loss": -40.379512786865234, "global_step": 207969, "epoch": 1718} {"train_loss": -40.64999771118164, "global_step": 207970, "epoch": 1718} {"train_loss": -40.46722412109375, "global_step": 207971, "epoch": 1718} {"train_loss": -40.14126205444336, "global_step": 207972, "epoch": 1718} {"train_loss": -40.93794631958008, "global_step": 207973, "epoch": 1718} {"train_loss": -39.14908981323242, "global_step": 207974, "epoch": 1718} {"train_loss": -39.87519836425781, "global_step": 207975, "epoch": 1718} {"train_loss": -40.3865852355957, "global_step": 207976, "epoch": 1718} {"train_loss": -39.580623626708984, "global_step": 207977, "epoch": 1718} {"train_loss": -39.25883102416992, "global_step": 207978, "epoch": 1718} {"train_loss": -40.293025970458984, "global_step": 207979, "epoch": 1718} {"train_loss": -39.6921272277832, "global_step": 207980, "epoch": 1718} {"train_loss": -39.838314056396484, "global_step": 207981, "epoch": 1718} {"train_loss": -39.12936019897461, "global_step": 207982, "epoch": 1718} {"train_loss": -40.35405731201172, "global_step": 207983, "epoch": 1718} {"train_loss": -40.00502395629883, "global_step": 207984, "epoch": 1718} {"train_loss": -39.978267669677734, "global_step": 207985, "epoch": 1718} {"train_loss": -40.76282501220703, "global_step": 207986, "epoch": 1718} {"train_loss": -40.31534194946289, "global_step": 207987, "epoch": 1718} {"train_loss": -39.909828186035156, "global_step": 207988, "epoch": 1718} {"train_loss": -37.45548629760742, "global_step": 207989, "epoch": 1718} {"train_loss": -40.576045989990234, "global_step": 207990, "epoch": 1718} {"train_loss": -40.37717819213867, "global_step": 207991, "epoch": 1718} {"train_loss": -39.44794845581055, "global_step": 207992, "epoch": 1718} {"train_loss": -40.38397216796875, "global_step": 207993, "epoch": 1718} {"train_loss": -36.18273162841797, "global_step": 207994, "epoch": 1718} {"train_loss": -41.13908767700195, "global_step": 207995, "epoch": 1718} {"train_loss": -40.594451904296875, "global_step": 207996, "epoch": 1718} {"train_loss": -41.07796096801758, "global_step": 207997, "epoch": 1718} {"train_loss": -39.46394259870545, "global_step": 207998, "epoch": 1718, "val_loss": 3786470.0} {"train_loss": -41.4713134765625, "global_step": 207999, "epoch": 1719} {"train_loss": -40.59861373901367, "global_step": 208000, "epoch": 1719} {"train_loss": -40.63328170776367, "global_step": 208001, "epoch": 1719} {"train_loss": -38.315528869628906, "global_step": 208002, "epoch": 1719} {"train_loss": -38.04740524291992, "global_step": 208003, "epoch": 1719} {"train_loss": -40.36067581176758, "global_step": 208004, "epoch": 1719} {"train_loss": -39.95924758911133, "global_step": 208005, "epoch": 1719} {"train_loss": -40.98090362548828, "global_step": 208006, "epoch": 1719} {"train_loss": -41.06631088256836, "global_step": 208007, "epoch": 1719} {"train_loss": -40.87778854370117, "global_step": 208008, "epoch": 1719} {"train_loss": -41.18425369262695, "global_step": 208009, "epoch": 1719} {"train_loss": -41.0351676940918, "global_step": 208010, "epoch": 1719} {"train_loss": -40.00570297241211, "global_step": 208011, "epoch": 1719} {"train_loss": -37.762386322021484, "global_step": 208012, "epoch": 1719} {"train_loss": -41.21759033203125, "global_step": 208013, "epoch": 1719} {"train_loss": -41.245033264160156, "global_step": 208014, "epoch": 1719} {"train_loss": -40.44694900512695, "global_step": 208015, "epoch": 1719} {"train_loss": -38.78232955932617, "global_step": 208016, "epoch": 1719} {"train_loss": -41.517860412597656, "global_step": 208017, "epoch": 1719} {"train_loss": -41.30963134765625, "global_step": 208018, "epoch": 1719} {"train_loss": -40.283077239990234, "global_step": 208019, "epoch": 1719} {"train_loss": -40.749420166015625, "global_step": 208020, "epoch": 1719} {"train_loss": -41.408016204833984, "global_step": 208021, "epoch": 1719} {"train_loss": -40.60108184814453, "global_step": 208022, "epoch": 1719} {"train_loss": -41.40892791748047, "global_step": 208023, "epoch": 1719} {"train_loss": -40.57509994506836, "global_step": 208024, "epoch": 1719} {"train_loss": -40.2764892578125, "global_step": 208025, "epoch": 1719} {"train_loss": -40.598445892333984, "global_step": 208026, "epoch": 1719} {"train_loss": -41.25873947143555, "global_step": 208027, "epoch": 1719} {"train_loss": -40.8860969543457, "global_step": 208028, "epoch": 1719} {"train_loss": -41.722381591796875, "global_step": 208029, "epoch": 1719} {"train_loss": -39.455108642578125, "global_step": 208030, "epoch": 1719} {"train_loss": -40.18581008911133, "global_step": 208031, "epoch": 1719} {"train_loss": -41.035221099853516, "global_step": 208032, "epoch": 1719} {"train_loss": -41.78429412841797, "global_step": 208033, "epoch": 1719} {"train_loss": -41.3027229309082, "global_step": 208034, "epoch": 1719} {"train_loss": -41.353851318359375, "global_step": 208035, "epoch": 1719} {"train_loss": -41.89171600341797, "global_step": 208036, "epoch": 1719} {"train_loss": -41.5158576965332, "global_step": 208037, "epoch": 1719} {"train_loss": -40.50836944580078, "global_step": 208038, "epoch": 1719} {"train_loss": -41.68549346923828, "global_step": 208039, "epoch": 1719} {"train_loss": -41.54279708862305, "global_step": 208040, "epoch": 1719} {"train_loss": -40.596492767333984, "global_step": 208041, "epoch": 1719} {"train_loss": -41.19811248779297, "global_step": 208042, "epoch": 1719} {"train_loss": -41.51313400268555, "global_step": 208043, "epoch": 1719} {"train_loss": -40.63435745239258, "global_step": 208044, "epoch": 1719} {"train_loss": -41.58330154418945, "global_step": 208045, "epoch": 1719} {"train_loss": -41.61229705810547, "global_step": 208046, "epoch": 1719} {"train_loss": -41.6713752746582, "global_step": 208047, "epoch": 1719} {"train_loss": -41.245994567871094, "global_step": 208048, "epoch": 1719} {"train_loss": -41.908416748046875, "global_step": 208049, "epoch": 1719} {"train_loss": -41.23256301879883, "global_step": 208050, "epoch": 1719} {"train_loss": -40.941505432128906, "global_step": 208051, "epoch": 1719} {"train_loss": -41.56905746459961, "global_step": 208052, "epoch": 1719} {"train_loss": -40.575172424316406, "global_step": 208053, "epoch": 1719} {"train_loss": -41.67472457885742, "global_step": 208054, "epoch": 1719} {"train_loss": -40.78907012939453, "global_step": 208055, "epoch": 1719} {"train_loss": -40.17997360229492, "global_step": 208056, "epoch": 1719} {"train_loss": -41.240535736083984, "global_step": 208057, "epoch": 1719} {"train_loss": -41.78131866455078, "global_step": 208058, "epoch": 1719} {"train_loss": -41.101905822753906, "global_step": 208059, "epoch": 1719} {"train_loss": -41.41462326049805, "global_step": 208060, "epoch": 1719} {"train_loss": -41.91966247558594, "global_step": 208061, "epoch": 1719} {"train_loss": -41.44293212890625, "global_step": 208062, "epoch": 1719} {"train_loss": -41.440284729003906, "global_step": 208063, "epoch": 1719} {"train_loss": -42.1766242980957, "global_step": 208064, "epoch": 1719} {"train_loss": -41.7833251953125, "global_step": 208065, "epoch": 1719} {"train_loss": -41.28766632080078, "global_step": 208066, "epoch": 1719} {"train_loss": -40.864017486572266, "global_step": 208067, "epoch": 1719} {"train_loss": -40.54453659057617, "global_step": 208068, "epoch": 1719} {"train_loss": -41.321712493896484, "global_step": 208069, "epoch": 1719} {"train_loss": -42.00127029418945, "global_step": 208070, "epoch": 1719} {"train_loss": -41.6313591003418, "global_step": 208071, "epoch": 1719} {"train_loss": -41.07649612426758, "global_step": 208072, "epoch": 1719} {"train_loss": -39.95876693725586, "global_step": 208073, "epoch": 1719} {"train_loss": -40.17744064331055, "global_step": 208074, "epoch": 1719} {"train_loss": -41.68182373046875, "global_step": 208075, "epoch": 1719} {"train_loss": -41.72504806518555, "global_step": 208076, "epoch": 1719} {"train_loss": -42.040889739990234, "global_step": 208077, "epoch": 1719} {"train_loss": -41.786407470703125, "global_step": 208078, "epoch": 1719} {"train_loss": -41.68727111816406, "global_step": 208079, "epoch": 1719} {"train_loss": -41.85129928588867, "global_step": 208080, "epoch": 1719} {"train_loss": -41.710628509521484, "global_step": 208081, "epoch": 1719} {"train_loss": -41.59890365600586, "global_step": 208082, "epoch": 1719} {"train_loss": -42.19147872924805, "global_step": 208083, "epoch": 1719} {"train_loss": -41.58374786376953, "global_step": 208084, "epoch": 1719} {"train_loss": -41.315792083740234, "global_step": 208085, "epoch": 1719} {"train_loss": -39.714019775390625, "global_step": 208086, "epoch": 1719} {"train_loss": -41.83926010131836, "global_step": 208087, "epoch": 1719} {"train_loss": -40.71749496459961, "global_step": 208088, "epoch": 1719} {"train_loss": -38.67169189453125, "global_step": 208089, "epoch": 1719} {"train_loss": -41.698604583740234, "global_step": 208090, "epoch": 1719} {"train_loss": -37.167388916015625, "global_step": 208091, "epoch": 1719} {"train_loss": -41.0028076171875, "global_step": 208092, "epoch": 1719} {"train_loss": -40.506591796875, "global_step": 208093, "epoch": 1719} {"train_loss": -40.97323989868164, "global_step": 208094, "epoch": 1719} {"train_loss": -39.4658088684082, "global_step": 208095, "epoch": 1719} {"train_loss": -38.305416107177734, "global_step": 208096, "epoch": 1719} {"train_loss": -40.23538589477539, "global_step": 208097, "epoch": 1719} {"train_loss": -36.5992431640625, "global_step": 208098, "epoch": 1719} {"train_loss": -40.09504318237305, "global_step": 208099, "epoch": 1719} {"train_loss": -37.54490280151367, "global_step": 208100, "epoch": 1719} {"train_loss": -39.685401916503906, "global_step": 208101, "epoch": 1719} {"train_loss": -37.94277572631836, "global_step": 208102, "epoch": 1719} {"train_loss": -39.418785095214844, "global_step": 208103, "epoch": 1719} {"train_loss": -39.7408332824707, "global_step": 208104, "epoch": 1719} {"train_loss": -39.65956497192383, "global_step": 208105, "epoch": 1719} {"train_loss": -40.14091873168945, "global_step": 208106, "epoch": 1719} {"train_loss": -39.7774772644043, "global_step": 208107, "epoch": 1719} {"train_loss": -40.42203140258789, "global_step": 208108, "epoch": 1719} {"train_loss": -40.569393157958984, "global_step": 208109, "epoch": 1719} {"train_loss": -39.022857666015625, "global_step": 208110, "epoch": 1719} {"train_loss": -39.54935836791992, "global_step": 208111, "epoch": 1719} {"train_loss": -39.554622650146484, "global_step": 208112, "epoch": 1719} {"train_loss": -39.945068359375, "global_step": 208113, "epoch": 1719} {"train_loss": -40.124366760253906, "global_step": 208114, "epoch": 1719} {"train_loss": -40.2011833190918, "global_step": 208115, "epoch": 1719} {"train_loss": -40.06605911254883, "global_step": 208116, "epoch": 1719} {"train_loss": -40.195858001708984, "global_step": 208117, "epoch": 1719} {"train_loss": -40.11676788330078, "global_step": 208118, "epoch": 1719} {"train_loss": -40.671283974135214, "global_step": 208119, "epoch": 1719, "val_loss": 2515633.75} {"train_loss": -40.40956115722656, "global_step": 208120, "epoch": 1720} {"train_loss": -40.530181884765625, "global_step": 208121, "epoch": 1720} {"train_loss": -40.72384262084961, "global_step": 208122, "epoch": 1720} {"train_loss": -40.13290786743164, "global_step": 208123, "epoch": 1720} {"train_loss": -41.16469955444336, "global_step": 208124, "epoch": 1720} {"train_loss": -41.62017059326172, "global_step": 208125, "epoch": 1720} {"train_loss": -40.6762809753418, "global_step": 208126, "epoch": 1720} {"train_loss": -41.56829833984375, "global_step": 208127, "epoch": 1720} {"train_loss": -41.445404052734375, "global_step": 208128, "epoch": 1720} {"train_loss": -40.82672119140625, "global_step": 208129, "epoch": 1720} {"train_loss": -42.177001953125, "global_step": 208130, "epoch": 1720} {"train_loss": -40.66809844970703, "global_step": 208131, "epoch": 1720} {"train_loss": -41.03727340698242, "global_step": 208132, "epoch": 1720} {"train_loss": -41.01742935180664, "global_step": 208133, "epoch": 1720} {"train_loss": -40.9602165222168, "global_step": 208134, "epoch": 1720} {"train_loss": -41.84245681762695, "global_step": 208135, "epoch": 1720} {"train_loss": -41.55693435668945, "global_step": 208136, "epoch": 1720} {"train_loss": -41.611366271972656, "global_step": 208137, "epoch": 1720} {"train_loss": -41.344173431396484, "global_step": 208138, "epoch": 1720} {"train_loss": -41.6301383972168, "global_step": 208139, "epoch": 1720} {"train_loss": -41.4705924987793, "global_step": 208140, "epoch": 1720} {"train_loss": -40.53548049926758, "global_step": 208141, "epoch": 1720} {"train_loss": -41.28204345703125, "global_step": 208142, "epoch": 1720} {"train_loss": -41.54476547241211, "global_step": 208143, "epoch": 1720} {"train_loss": -41.14776611328125, "global_step": 208144, "epoch": 1720} {"train_loss": -41.403106689453125, "global_step": 208145, "epoch": 1720} {"train_loss": -41.679012298583984, "global_step": 208146, "epoch": 1720} {"train_loss": -41.3086051940918, "global_step": 208147, "epoch": 1720} {"train_loss": -42.04201126098633, "global_step": 208148, "epoch": 1720} {"train_loss": -41.948055267333984, "global_step": 208149, "epoch": 1720} {"train_loss": -41.39840316772461, "global_step": 208150, "epoch": 1720} {"train_loss": -41.19423294067383, "global_step": 208151, "epoch": 1720} {"train_loss": -41.5066032409668, "global_step": 208152, "epoch": 1720} {"train_loss": -40.55704879760742, "global_step": 208153, "epoch": 1720} {"train_loss": -40.61101531982422, "global_step": 208154, "epoch": 1720} {"train_loss": -42.00798416137695, "global_step": 208155, "epoch": 1720} {"train_loss": -40.326637268066406, "global_step": 208156, "epoch": 1720} {"train_loss": -38.86665725708008, "global_step": 208157, "epoch": 1720} {"train_loss": -40.62612533569336, "global_step": 208158, "epoch": 1720} {"train_loss": -38.85531234741211, "global_step": 208159, "epoch": 1720} {"train_loss": -37.6150016784668, "global_step": 208160, "epoch": 1720} {"train_loss": -36.482643127441406, "global_step": 208161, "epoch": 1720} {"train_loss": -40.289676666259766, "global_step": 208162, "epoch": 1720} {"train_loss": -37.560516357421875, "global_step": 208163, "epoch": 1720} {"train_loss": -41.24601364135742, "global_step": 208164, "epoch": 1720} {"train_loss": -40.88702392578125, "global_step": 208165, "epoch": 1720} {"train_loss": -39.828590393066406, "global_step": 208166, "epoch": 1720} {"train_loss": -38.88568878173828, "global_step": 208167, "epoch": 1720} {"train_loss": -39.8511962890625, "global_step": 208168, "epoch": 1720} {"train_loss": -38.816768646240234, "global_step": 208169, "epoch": 1720} {"train_loss": -37.574859619140625, "global_step": 208170, "epoch": 1720} {"train_loss": -36.180538177490234, "global_step": 208171, "epoch": 1720} {"train_loss": -36.65102005004883, "global_step": 208172, "epoch": 1720} {"train_loss": -41.08164596557617, "global_step": 208173, "epoch": 1720} {"train_loss": -39.03145980834961, "global_step": 208174, "epoch": 1720} {"train_loss": -37.91689682006836, "global_step": 208175, "epoch": 1720} {"train_loss": -41.0897331237793, "global_step": 208176, "epoch": 1720} {"train_loss": -37.690406799316406, "global_step": 208177, "epoch": 1720} {"train_loss": -38.03054428100586, "global_step": 208178, "epoch": 1720} {"train_loss": -41.15407180786133, "global_step": 208179, "epoch": 1720} {"train_loss": -38.08126449584961, "global_step": 208180, "epoch": 1720} {"train_loss": -39.65898513793945, "global_step": 208181, "epoch": 1720} {"train_loss": -39.71433639526367, "global_step": 208182, "epoch": 1720} {"train_loss": -38.52254867553711, "global_step": 208183, "epoch": 1720} {"train_loss": -39.99300003051758, "global_step": 208184, "epoch": 1720} {"train_loss": -39.19167709350586, "global_step": 208185, "epoch": 1720} {"train_loss": -39.75751876831055, "global_step": 208186, "epoch": 1720} {"train_loss": -39.16905975341797, "global_step": 208187, "epoch": 1720} {"train_loss": -39.61052322387695, "global_step": 208188, "epoch": 1720} {"train_loss": -40.268558502197266, "global_step": 208189, "epoch": 1720} {"train_loss": -37.7213249206543, "global_step": 208190, "epoch": 1720} {"train_loss": -40.4320068359375, "global_step": 208191, "epoch": 1720} {"train_loss": -41.46921920776367, "global_step": 208192, "epoch": 1720} {"train_loss": -40.46731185913086, "global_step": 208193, "epoch": 1720} {"train_loss": -41.22477340698242, "global_step": 208194, "epoch": 1720} {"train_loss": -39.47682189941406, "global_step": 208195, "epoch": 1720} {"train_loss": -40.149410247802734, "global_step": 208196, "epoch": 1720} {"train_loss": -40.571022033691406, "global_step": 208197, "epoch": 1720} {"train_loss": -40.283870697021484, "global_step": 208198, "epoch": 1720} {"train_loss": -40.79435729980469, "global_step": 208199, "epoch": 1720} {"train_loss": -41.54460144042969, "global_step": 208200, "epoch": 1720} {"train_loss": -41.3748779296875, "global_step": 208201, "epoch": 1720} {"train_loss": -41.18729782104492, "global_step": 208202, "epoch": 1720} {"train_loss": -41.206661224365234, "global_step": 208203, "epoch": 1720} {"train_loss": -41.912776947021484, "global_step": 208204, "epoch": 1720} {"train_loss": -41.550228118896484, "global_step": 208205, "epoch": 1720} {"train_loss": -41.88904571533203, "global_step": 208206, "epoch": 1720} {"train_loss": -41.781917572021484, "global_step": 208207, "epoch": 1720} {"train_loss": -41.84320831298828, "global_step": 208208, "epoch": 1720} {"train_loss": -41.508506774902344, "global_step": 208209, "epoch": 1720} {"train_loss": -40.62110137939453, "global_step": 208210, "epoch": 1720} {"train_loss": -40.95786666870117, "global_step": 208211, "epoch": 1720} {"train_loss": -40.135780334472656, "global_step": 208212, "epoch": 1720} {"train_loss": -41.564979553222656, "global_step": 208213, "epoch": 1720} {"train_loss": -41.80985641479492, "global_step": 208214, "epoch": 1720} {"train_loss": -41.566097259521484, "global_step": 208215, "epoch": 1720} {"train_loss": -41.97748947143555, "global_step": 208216, "epoch": 1720} {"train_loss": -41.61249542236328, "global_step": 208217, "epoch": 1720} {"train_loss": -42.142921447753906, "global_step": 208218, "epoch": 1720} {"train_loss": -42.05834197998047, "global_step": 208219, "epoch": 1720} {"train_loss": -41.74589157104492, "global_step": 208220, "epoch": 1720} {"train_loss": -41.22115707397461, "global_step": 208221, "epoch": 1720} {"train_loss": -39.955753326416016, "global_step": 208222, "epoch": 1720} {"train_loss": -42.14088821411133, "global_step": 208223, "epoch": 1720} {"train_loss": -42.02099609375, "global_step": 208224, "epoch": 1720} {"train_loss": -42.180747985839844, "global_step": 208225, "epoch": 1720} {"train_loss": -41.812225341796875, "global_step": 208226, "epoch": 1720} {"train_loss": -41.62409591674805, "global_step": 208227, "epoch": 1720} {"train_loss": -42.26721954345703, "global_step": 208228, "epoch": 1720} {"train_loss": -41.93928146362305, "global_step": 208229, "epoch": 1720} {"train_loss": -42.49523162841797, "global_step": 208230, "epoch": 1720} {"train_loss": -41.889251708984375, "global_step": 208231, "epoch": 1720} {"train_loss": -42.506343841552734, "global_step": 208232, "epoch": 1720} {"train_loss": -42.246803283691406, "global_step": 208233, "epoch": 1720} {"train_loss": -42.697933197021484, "global_step": 208234, "epoch": 1720} {"train_loss": -42.526485443115234, "global_step": 208235, "epoch": 1720} {"train_loss": -42.71509552001953, "global_step": 208236, "epoch": 1720} {"train_loss": -42.42647171020508, "global_step": 208237, "epoch": 1720} {"train_loss": -42.64197540283203, "global_step": 208238, "epoch": 1720} {"train_loss": -41.60316848754883, "global_step": 208239, "epoch": 1720} {"train_loss": -40.75500872903619, "global_step": 208240, "epoch": 1720, "val_loss": 2474169.75} {"train_loss": -42.3955078125, "global_step": 208241, "epoch": 1721} {"train_loss": -42.23639678955078, "global_step": 208242, "epoch": 1721} {"train_loss": -42.4363899230957, "global_step": 208243, "epoch": 1721} {"train_loss": -42.15534591674805, "global_step": 208244, "epoch": 1721} {"train_loss": -42.67670822143555, "global_step": 208245, "epoch": 1721} {"train_loss": -41.83573913574219, "global_step": 208246, "epoch": 1721} {"train_loss": -42.481285095214844, "global_step": 208247, "epoch": 1721} {"train_loss": -42.60200119018555, "global_step": 208248, "epoch": 1721} {"train_loss": -42.248878479003906, "global_step": 208249, "epoch": 1721} {"train_loss": -42.049190521240234, "global_step": 208250, "epoch": 1721} {"train_loss": -43.05921173095703, "global_step": 208251, "epoch": 1721} {"train_loss": -42.700435638427734, "global_step": 208252, "epoch": 1721} {"train_loss": -42.09763717651367, "global_step": 208253, "epoch": 1721} {"train_loss": -42.24782943725586, "global_step": 208254, "epoch": 1721} {"train_loss": -42.692359924316406, "global_step": 208255, "epoch": 1721} {"train_loss": -42.69172668457031, "global_step": 208256, "epoch": 1721} {"train_loss": -43.44437789916992, "global_step": 208257, "epoch": 1721} {"train_loss": -42.57255172729492, "global_step": 208258, "epoch": 1721} {"train_loss": -41.742000579833984, "global_step": 208259, "epoch": 1721} {"train_loss": -40.919403076171875, "global_step": 208260, "epoch": 1721} {"train_loss": -39.87101364135742, "global_step": 208261, "epoch": 1721} {"train_loss": -42.63515090942383, "global_step": 208262, "epoch": 1721} {"train_loss": -42.09974670410156, "global_step": 208263, "epoch": 1721} {"train_loss": -41.81981658935547, "global_step": 208264, "epoch": 1721} {"train_loss": -41.121578216552734, "global_step": 208265, "epoch": 1721} {"train_loss": -40.58879470825195, "global_step": 208266, "epoch": 1721} {"train_loss": -40.53493881225586, "global_step": 208267, "epoch": 1721} {"train_loss": -37.952842712402344, "global_step": 208268, "epoch": 1721} {"train_loss": -31.919010162353516, "global_step": 208269, "epoch": 1721} {"train_loss": -24.1831111907959, "global_step": 208270, "epoch": 1721} {"train_loss": -32.81800079345703, "global_step": 208271, "epoch": 1721} {"train_loss": -38.23065185546875, "global_step": 208272, "epoch": 1721} {"train_loss": -33.19552230834961, "global_step": 208273, "epoch": 1721} {"train_loss": -30.018402099609375, "global_step": 208274, "epoch": 1721} {"train_loss": -39.92153549194336, "global_step": 208275, "epoch": 1721} {"train_loss": -35.47579574584961, "global_step": 208276, "epoch": 1721} {"train_loss": -33.143795013427734, "global_step": 208277, "epoch": 1721} {"train_loss": -40.0040283203125, "global_step": 208278, "epoch": 1721} {"train_loss": -37.144500732421875, "global_step": 208279, "epoch": 1721} {"train_loss": -39.55528259277344, "global_step": 208280, "epoch": 1721} {"train_loss": -37.79692459106445, "global_step": 208281, "epoch": 1721} {"train_loss": -39.943359375, "global_step": 208282, "epoch": 1721} {"train_loss": -37.0252685546875, "global_step": 208283, "epoch": 1721} {"train_loss": -39.33578109741211, "global_step": 208284, "epoch": 1721} {"train_loss": -39.50202941894531, "global_step": 208285, "epoch": 1721} {"train_loss": -39.66421890258789, "global_step": 208286, "epoch": 1721} {"train_loss": -40.04963684082031, "global_step": 208287, "epoch": 1721} {"train_loss": -39.63252639770508, "global_step": 208288, "epoch": 1721} {"train_loss": -39.83857345581055, "global_step": 208289, "epoch": 1721} {"train_loss": -39.628997802734375, "global_step": 208290, "epoch": 1721} {"train_loss": -40.21726608276367, "global_step": 208291, "epoch": 1721} {"train_loss": -40.61141586303711, "global_step": 208292, "epoch": 1721} {"train_loss": -39.93954086303711, "global_step": 208293, "epoch": 1721} {"train_loss": -40.614315032958984, "global_step": 208294, "epoch": 1721} {"train_loss": -40.75190353393555, "global_step": 208295, "epoch": 1721} {"train_loss": -40.802547454833984, "global_step": 208296, "epoch": 1721} {"train_loss": -41.168514251708984, "global_step": 208297, "epoch": 1721} {"train_loss": -41.15629196166992, "global_step": 208298, "epoch": 1721} {"train_loss": -41.706050872802734, "global_step": 208299, "epoch": 1721} {"train_loss": -41.46852493286133, "global_step": 208300, "epoch": 1721} {"train_loss": -41.32076644897461, "global_step": 208301, "epoch": 1721} {"train_loss": -41.40291213989258, "global_step": 208302, "epoch": 1721} {"train_loss": -41.51872253417969, "global_step": 208303, "epoch": 1721} {"train_loss": -41.5927734375, "global_step": 208304, "epoch": 1721} {"train_loss": -41.27842712402344, "global_step": 208305, "epoch": 1721} {"train_loss": -41.90632247924805, "global_step": 208306, "epoch": 1721} {"train_loss": -41.54337692260742, "global_step": 208307, "epoch": 1721} {"train_loss": -41.953365325927734, "global_step": 208308, "epoch": 1721} {"train_loss": -41.821800231933594, "global_step": 208309, "epoch": 1721} {"train_loss": -41.6271858215332, "global_step": 208310, "epoch": 1721} {"train_loss": -40.927955627441406, "global_step": 208311, "epoch": 1721} {"train_loss": -41.90871047973633, "global_step": 208312, "epoch": 1721} {"train_loss": -41.814510345458984, "global_step": 208313, "epoch": 1721} {"train_loss": -41.58193588256836, "global_step": 208314, "epoch": 1721} {"train_loss": -42.27779769897461, "global_step": 208315, "epoch": 1721} {"train_loss": -41.70058059692383, "global_step": 208316, "epoch": 1721} {"train_loss": -42.23186111450195, "global_step": 208317, "epoch": 1721} {"train_loss": -42.07097244262695, "global_step": 208318, "epoch": 1721} {"train_loss": -42.168212890625, "global_step": 208319, "epoch": 1721} {"train_loss": -41.86717987060547, "global_step": 208320, "epoch": 1721} {"train_loss": -42.19558334350586, "global_step": 208321, "epoch": 1721} {"train_loss": -42.305694580078125, "global_step": 208322, "epoch": 1721} {"train_loss": -41.73140335083008, "global_step": 208323, "epoch": 1721} {"train_loss": -42.40134048461914, "global_step": 208324, "epoch": 1721} {"train_loss": -42.49623107910156, "global_step": 208325, "epoch": 1721} {"train_loss": -42.60500717163086, "global_step": 208326, "epoch": 1721} {"train_loss": -42.18775177001953, "global_step": 208327, "epoch": 1721} {"train_loss": -42.4536247253418, "global_step": 208328, "epoch": 1721} {"train_loss": -42.09187698364258, "global_step": 208329, "epoch": 1721} {"train_loss": -42.32857894897461, "global_step": 208330, "epoch": 1721} {"train_loss": -41.65105056762695, "global_step": 208331, "epoch": 1721} {"train_loss": -42.70022964477539, "global_step": 208332, "epoch": 1721} {"train_loss": -41.6657829284668, "global_step": 208333, "epoch": 1721} {"train_loss": -42.61823654174805, "global_step": 208334, "epoch": 1721} {"train_loss": -42.015724182128906, "global_step": 208335, "epoch": 1721} {"train_loss": -41.88657760620117, "global_step": 208336, "epoch": 1721} {"train_loss": -42.52665710449219, "global_step": 208337, "epoch": 1721} {"train_loss": -42.49335479736328, "global_step": 208338, "epoch": 1721} {"train_loss": -42.308895111083984, "global_step": 208339, "epoch": 1721} {"train_loss": -42.03002166748047, "global_step": 208340, "epoch": 1721} {"train_loss": -42.990848541259766, "global_step": 208341, "epoch": 1721} {"train_loss": -42.858699798583984, "global_step": 208342, "epoch": 1721} {"train_loss": -42.54153060913086, "global_step": 208343, "epoch": 1721} {"train_loss": -42.5845947265625, "global_step": 208344, "epoch": 1721} {"train_loss": -42.74489974975586, "global_step": 208345, "epoch": 1721} {"train_loss": -42.05538558959961, "global_step": 208346, "epoch": 1721} {"train_loss": -42.650936126708984, "global_step": 208347, "epoch": 1721} {"train_loss": -42.6085205078125, "global_step": 208348, "epoch": 1721} {"train_loss": -42.41630935668945, "global_step": 208349, "epoch": 1721} {"train_loss": -43.01629638671875, "global_step": 208350, "epoch": 1721} {"train_loss": -42.31736373901367, "global_step": 208351, "epoch": 1721} {"train_loss": -42.657413482666016, "global_step": 208352, "epoch": 1721} {"train_loss": -42.59971237182617, "global_step": 208353, "epoch": 1721} {"train_loss": -42.958030700683594, "global_step": 208354, "epoch": 1721} {"train_loss": -42.144020080566406, "global_step": 208355, "epoch": 1721} {"train_loss": -41.98869705200195, "global_step": 208356, "epoch": 1721} {"train_loss": -40.68842697143555, "global_step": 208357, "epoch": 1721} {"train_loss": -38.1643180847168, "global_step": 208358, "epoch": 1721} {"train_loss": -39.093379974365234, "global_step": 208359, "epoch": 1721} {"train_loss": -41.27952194213867, "global_step": 208360, "epoch": 1721} {"train_loss": -40.902164506518154, "global_step": 208361, "epoch": 1721, "val_loss": 2495386.0} {"train_loss": -37.6048583984375, "global_step": 208362, "epoch": 1722} {"train_loss": -41.013301849365234, "global_step": 208363, "epoch": 1722} {"train_loss": -41.98481369018555, "global_step": 208364, "epoch": 1722} {"train_loss": -40.38924789428711, "global_step": 208365, "epoch": 1722} {"train_loss": -39.8167610168457, "global_step": 208366, "epoch": 1722} {"train_loss": -39.04315948486328, "global_step": 208367, "epoch": 1722} {"train_loss": -39.04127883911133, "global_step": 208368, "epoch": 1722} {"train_loss": -41.01911926269531, "global_step": 208369, "epoch": 1722} {"train_loss": -41.30656433105469, "global_step": 208370, "epoch": 1722} {"train_loss": -41.23090362548828, "global_step": 208371, "epoch": 1722} {"train_loss": -41.64740753173828, "global_step": 208372, "epoch": 1722} {"train_loss": -41.27986526489258, "global_step": 208373, "epoch": 1722} {"train_loss": -41.28876495361328, "global_step": 208374, "epoch": 1722} {"train_loss": -41.33303451538086, "global_step": 208375, "epoch": 1722} {"train_loss": -40.90035629272461, "global_step": 208376, "epoch": 1722} {"train_loss": -42.026893615722656, "global_step": 208377, "epoch": 1722} {"train_loss": -41.41310501098633, "global_step": 208378, "epoch": 1722} {"train_loss": -41.73545455932617, "global_step": 208379, "epoch": 1722} {"train_loss": -42.10894012451172, "global_step": 208380, "epoch": 1722} {"train_loss": -41.249263763427734, "global_step": 208381, "epoch": 1722} {"train_loss": -42.18312454223633, "global_step": 208382, "epoch": 1722} {"train_loss": -41.53553009033203, "global_step": 208383, "epoch": 1722} {"train_loss": -41.84829330444336, "global_step": 208384, "epoch": 1722} {"train_loss": -42.33782958984375, "global_step": 208385, "epoch": 1722} {"train_loss": -41.81655502319336, "global_step": 208386, "epoch": 1722} {"train_loss": -42.32195281982422, "global_step": 208387, "epoch": 1722} {"train_loss": -41.920631408691406, "global_step": 208388, "epoch": 1722} {"train_loss": -42.3385009765625, "global_step": 208389, "epoch": 1722} {"train_loss": -42.0244140625, "global_step": 208390, "epoch": 1722} {"train_loss": -42.22232437133789, "global_step": 208391, "epoch": 1722} {"train_loss": -41.92864990234375, "global_step": 208392, "epoch": 1722} {"train_loss": -41.53203201293945, "global_step": 208393, "epoch": 1722} {"train_loss": -42.23065185546875, "global_step": 208394, "epoch": 1722} {"train_loss": -41.51378631591797, "global_step": 208395, "epoch": 1722} {"train_loss": -41.447174072265625, "global_step": 208396, "epoch": 1722} {"train_loss": -41.5645866394043, "global_step": 208397, "epoch": 1722} {"train_loss": -41.554779052734375, "global_step": 208398, "epoch": 1722} {"train_loss": -41.24363327026367, "global_step": 208399, "epoch": 1722} {"train_loss": -41.81655502319336, "global_step": 208400, "epoch": 1722} {"train_loss": -42.14106369018555, "global_step": 208401, "epoch": 1722} {"train_loss": -42.09725570678711, "global_step": 208402, "epoch": 1722} {"train_loss": -42.07276153564453, "global_step": 208403, "epoch": 1722} {"train_loss": -42.09711837768555, "global_step": 208404, "epoch": 1722} {"train_loss": -41.07490921020508, "global_step": 208405, "epoch": 1722} {"train_loss": -42.1163330078125, "global_step": 208406, "epoch": 1722} {"train_loss": -41.76715087890625, "global_step": 208407, "epoch": 1722} {"train_loss": -42.30718231201172, "global_step": 208408, "epoch": 1722} {"train_loss": -41.6287841796875, "global_step": 208409, "epoch": 1722} {"train_loss": -40.735618591308594, "global_step": 208410, "epoch": 1722} {"train_loss": -41.445919036865234, "global_step": 208411, "epoch": 1722} {"train_loss": -42.367801666259766, "global_step": 208412, "epoch": 1722} {"train_loss": -42.67580032348633, "global_step": 208413, "epoch": 1722} {"train_loss": -42.535438537597656, "global_step": 208414, "epoch": 1722} {"train_loss": -42.204341888427734, "global_step": 208415, "epoch": 1722} {"train_loss": -42.204551696777344, "global_step": 208416, "epoch": 1722} {"train_loss": -42.583621978759766, "global_step": 208417, "epoch": 1722} {"train_loss": -42.511817932128906, "global_step": 208418, "epoch": 1722} {"train_loss": -42.45195770263672, "global_step": 208419, "epoch": 1722} {"train_loss": -41.92879867553711, "global_step": 208420, "epoch": 1722} {"train_loss": -41.2965202331543, "global_step": 208421, "epoch": 1722} {"train_loss": -41.59477233886719, "global_step": 208422, "epoch": 1722} {"train_loss": -42.250396728515625, "global_step": 208423, "epoch": 1722} {"train_loss": -42.010440826416016, "global_step": 208424, "epoch": 1722} {"train_loss": -41.28695297241211, "global_step": 208425, "epoch": 1722} {"train_loss": -41.3495979309082, "global_step": 208426, "epoch": 1722} {"train_loss": -40.9969482421875, "global_step": 208427, "epoch": 1722} {"train_loss": -42.4036979675293, "global_step": 208428, "epoch": 1722} {"train_loss": -41.49886703491211, "global_step": 208429, "epoch": 1722} {"train_loss": -41.6031608581543, "global_step": 208430, "epoch": 1722} {"train_loss": -41.23784255981445, "global_step": 208431, "epoch": 1722} {"train_loss": -40.994361877441406, "global_step": 208432, "epoch": 1722} {"train_loss": -42.67771911621094, "global_step": 208433, "epoch": 1722} {"train_loss": -41.2727165222168, "global_step": 208434, "epoch": 1722} {"train_loss": -40.3952751159668, "global_step": 208435, "epoch": 1722} {"train_loss": -38.83847427368164, "global_step": 208436, "epoch": 1722} {"train_loss": -39.605831146240234, "global_step": 208437, "epoch": 1722} {"train_loss": -41.38466262817383, "global_step": 208438, "epoch": 1722} {"train_loss": -41.88288116455078, "global_step": 208439, "epoch": 1722} {"train_loss": -40.80118942260742, "global_step": 208440, "epoch": 1722} {"train_loss": -40.893028259277344, "global_step": 208441, "epoch": 1722} {"train_loss": -39.58377456665039, "global_step": 208442, "epoch": 1722} {"train_loss": -39.043678283691406, "global_step": 208443, "epoch": 1722} {"train_loss": -39.03058624267578, "global_step": 208444, "epoch": 1722} {"train_loss": -40.53130340576172, "global_step": 208445, "epoch": 1722} {"train_loss": -41.529632568359375, "global_step": 208446, "epoch": 1722} {"train_loss": -41.5261116027832, "global_step": 208447, "epoch": 1722} {"train_loss": -39.287208557128906, "global_step": 208448, "epoch": 1722} {"train_loss": -38.87738037109375, "global_step": 208449, "epoch": 1722} {"train_loss": -41.59836959838867, "global_step": 208450, "epoch": 1722} {"train_loss": -41.075416564941406, "global_step": 208451, "epoch": 1722} {"train_loss": -40.43730545043945, "global_step": 208452, "epoch": 1722} {"train_loss": -40.81889724731445, "global_step": 208453, "epoch": 1722} {"train_loss": -40.83054733276367, "global_step": 208454, "epoch": 1722} {"train_loss": -41.33510208129883, "global_step": 208455, "epoch": 1722} {"train_loss": -40.38398361206055, "global_step": 208456, "epoch": 1722} {"train_loss": -40.73647689819336, "global_step": 208457, "epoch": 1722} {"train_loss": -41.1919059753418, "global_step": 208458, "epoch": 1722} {"train_loss": -40.40395736694336, "global_step": 208459, "epoch": 1722} {"train_loss": -41.59626388549805, "global_step": 208460, "epoch": 1722} {"train_loss": -41.51491165161133, "global_step": 208461, "epoch": 1722} {"train_loss": -40.99861145019531, "global_step": 208462, "epoch": 1722} {"train_loss": -41.7054328918457, "global_step": 208463, "epoch": 1722} {"train_loss": -42.416259765625, "global_step": 208464, "epoch": 1722} {"train_loss": -41.488346099853516, "global_step": 208465, "epoch": 1722} {"train_loss": -41.98298263549805, "global_step": 208466, "epoch": 1722} {"train_loss": -41.585113525390625, "global_step": 208467, "epoch": 1722} {"train_loss": -42.061798095703125, "global_step": 208468, "epoch": 1722} {"train_loss": -41.72662353515625, "global_step": 208469, "epoch": 1722} {"train_loss": -41.55941390991211, "global_step": 208470, "epoch": 1722} {"train_loss": -42.22718048095703, "global_step": 208471, "epoch": 1722} {"train_loss": -41.62296676635742, "global_step": 208472, "epoch": 1722} {"train_loss": -41.69626998901367, "global_step": 208473, "epoch": 1722} {"train_loss": -42.36516189575195, "global_step": 208474, "epoch": 1722} {"train_loss": -41.97560119628906, "global_step": 208475, "epoch": 1722} {"train_loss": -41.94932556152344, "global_step": 208476, "epoch": 1722} {"train_loss": -42.01620864868164, "global_step": 208477, "epoch": 1722} {"train_loss": -42.115177154541016, "global_step": 208478, "epoch": 1722} {"train_loss": -41.37364196777344, "global_step": 208479, "epoch": 1722} {"train_loss": -41.70998001098633, "global_step": 208480, "epoch": 1722} {"train_loss": -42.210567474365234, "global_step": 208481, "epoch": 1722} {"train_loss": -41.40456437670495, "global_step": 208482, "epoch": 1722, "val_loss": 2435431.25} {"train_loss": -42.142860412597656, "global_step": 208483, "epoch": 1723} {"train_loss": -41.72515869140625, "global_step": 208484, "epoch": 1723} {"train_loss": -41.94480895996094, "global_step": 208485, "epoch": 1723} {"train_loss": -41.07025146484375, "global_step": 208486, "epoch": 1723} {"train_loss": -42.15798568725586, "global_step": 208487, "epoch": 1723} {"train_loss": -42.20916748046875, "global_step": 208488, "epoch": 1723} {"train_loss": -40.7619743347168, "global_step": 208489, "epoch": 1723} {"train_loss": -42.703590393066406, "global_step": 208490, "epoch": 1723} {"train_loss": -42.31002426147461, "global_step": 208491, "epoch": 1723} {"train_loss": -41.519168853759766, "global_step": 208492, "epoch": 1723} {"train_loss": -42.62700271606445, "global_step": 208493, "epoch": 1723} {"train_loss": -42.51939010620117, "global_step": 208494, "epoch": 1723} {"train_loss": -41.40174865722656, "global_step": 208495, "epoch": 1723} {"train_loss": -41.418128967285156, "global_step": 208496, "epoch": 1723} {"train_loss": -41.25480651855469, "global_step": 208497, "epoch": 1723} {"train_loss": -37.67706298828125, "global_step": 208498, "epoch": 1723} {"train_loss": -41.726985931396484, "global_step": 208499, "epoch": 1723} {"train_loss": -40.65113830566406, "global_step": 208500, "epoch": 1723} {"train_loss": -41.848812103271484, "global_step": 208501, "epoch": 1723} {"train_loss": -39.40840530395508, "global_step": 208502, "epoch": 1723} {"train_loss": -41.1954460144043, "global_step": 208503, "epoch": 1723} {"train_loss": -40.14980697631836, "global_step": 208504, "epoch": 1723} {"train_loss": -40.07917022705078, "global_step": 208505, "epoch": 1723} {"train_loss": -37.8840446472168, "global_step": 208506, "epoch": 1723} {"train_loss": -41.88662338256836, "global_step": 208507, "epoch": 1723} {"train_loss": -39.695499420166016, "global_step": 208508, "epoch": 1723} {"train_loss": -39.626609802246094, "global_step": 208509, "epoch": 1723} {"train_loss": -41.440269470214844, "global_step": 208510, "epoch": 1723} {"train_loss": -41.48580551147461, "global_step": 208511, "epoch": 1723} {"train_loss": -40.76471710205078, "global_step": 208512, "epoch": 1723} {"train_loss": -41.28170394897461, "global_step": 208513, "epoch": 1723} {"train_loss": -40.17227554321289, "global_step": 208514, "epoch": 1723} {"train_loss": -41.45473861694336, "global_step": 208515, "epoch": 1723} {"train_loss": -33.94371795654297, "global_step": 208516, "epoch": 1723} {"train_loss": -37.70978546142578, "global_step": 208517, "epoch": 1723} {"train_loss": -34.5265007019043, "global_step": 208518, "epoch": 1723} {"train_loss": -35.171730041503906, "global_step": 208519, "epoch": 1723} {"train_loss": -31.382831573486328, "global_step": 208520, "epoch": 1723} {"train_loss": -31.017675399780273, "global_step": 208521, "epoch": 1723} {"train_loss": -39.28120803833008, "global_step": 208522, "epoch": 1723} {"train_loss": -39.465850830078125, "global_step": 208523, "epoch": 1723} {"train_loss": -30.623138427734375, "global_step": 208524, "epoch": 1723} {"train_loss": -34.753135681152344, "global_step": 208525, "epoch": 1723} {"train_loss": -36.735103607177734, "global_step": 208526, "epoch": 1723} {"train_loss": -33.9649543762207, "global_step": 208527, "epoch": 1723} {"train_loss": -35.5318489074707, "global_step": 208528, "epoch": 1723} {"train_loss": -36.7302131652832, "global_step": 208529, "epoch": 1723} {"train_loss": -37.70491027832031, "global_step": 208530, "epoch": 1723} {"train_loss": -40.79144287109375, "global_step": 208531, "epoch": 1723} {"train_loss": -34.765071868896484, "global_step": 208532, "epoch": 1723} {"train_loss": -38.02912139892578, "global_step": 208533, "epoch": 1723} {"train_loss": -30.807886123657227, "global_step": 208534, "epoch": 1723} {"train_loss": -38.517391204833984, "global_step": 208535, "epoch": 1723} {"train_loss": -36.33784866333008, "global_step": 208536, "epoch": 1723} {"train_loss": -36.365264892578125, "global_step": 208537, "epoch": 1723} {"train_loss": -35.198486328125, "global_step": 208538, "epoch": 1723} {"train_loss": -39.3443489074707, "global_step": 208539, "epoch": 1723} {"train_loss": -37.06224060058594, "global_step": 208540, "epoch": 1723} {"train_loss": -38.9047737121582, "global_step": 208541, "epoch": 1723} {"train_loss": -34.142330169677734, "global_step": 208542, "epoch": 1723} {"train_loss": -37.30964279174805, "global_step": 208543, "epoch": 1723} {"train_loss": -38.29854965209961, "global_step": 208544, "epoch": 1723} {"train_loss": -39.84578323364258, "global_step": 208545, "epoch": 1723} {"train_loss": -38.804134368896484, "global_step": 208546, "epoch": 1723} {"train_loss": -38.810237884521484, "global_step": 208547, "epoch": 1723} {"train_loss": -37.97046661376953, "global_step": 208548, "epoch": 1723} {"train_loss": -39.19407272338867, "global_step": 208549, "epoch": 1723} {"train_loss": -38.07712936401367, "global_step": 208550, "epoch": 1723} {"train_loss": -38.82699203491211, "global_step": 208551, "epoch": 1723} {"train_loss": -39.32221603393555, "global_step": 208552, "epoch": 1723} {"train_loss": -39.66846466064453, "global_step": 208553, "epoch": 1723} {"train_loss": -40.03171157836914, "global_step": 208554, "epoch": 1723} {"train_loss": -39.71536636352539, "global_step": 208555, "epoch": 1723} {"train_loss": -40.04221725463867, "global_step": 208556, "epoch": 1723} {"train_loss": -36.764503479003906, "global_step": 208557, "epoch": 1723} {"train_loss": -39.564697265625, "global_step": 208558, "epoch": 1723} {"train_loss": -40.25102233886719, "global_step": 208559, "epoch": 1723} {"train_loss": -38.39379119873047, "global_step": 208560, "epoch": 1723} {"train_loss": -40.04352569580078, "global_step": 208561, "epoch": 1723} {"train_loss": -40.468055725097656, "global_step": 208562, "epoch": 1723} {"train_loss": -40.97256851196289, "global_step": 208563, "epoch": 1723} {"train_loss": -38.585391998291016, "global_step": 208564, "epoch": 1723} {"train_loss": -40.28639602661133, "global_step": 208565, "epoch": 1723} {"train_loss": -40.00095748901367, "global_step": 208566, "epoch": 1723} {"train_loss": -39.633384704589844, "global_step": 208567, "epoch": 1723} {"train_loss": -40.965946197509766, "global_step": 208568, "epoch": 1723} {"train_loss": -40.24583053588867, "global_step": 208569, "epoch": 1723} {"train_loss": -39.674583435058594, "global_step": 208570, "epoch": 1723} {"train_loss": -39.511165618896484, "global_step": 208571, "epoch": 1723} {"train_loss": -41.137569427490234, "global_step": 208572, "epoch": 1723} {"train_loss": -41.03040313720703, "global_step": 208573, "epoch": 1723} {"train_loss": -40.90379333496094, "global_step": 208574, "epoch": 1723} {"train_loss": -40.370906829833984, "global_step": 208575, "epoch": 1723} {"train_loss": -40.49688720703125, "global_step": 208576, "epoch": 1723} {"train_loss": -40.69065475463867, "global_step": 208577, "epoch": 1723} {"train_loss": -40.79826736450195, "global_step": 208578, "epoch": 1723} {"train_loss": -39.9564323425293, "global_step": 208579, "epoch": 1723} {"train_loss": -40.72356033325195, "global_step": 208580, "epoch": 1723} {"train_loss": -40.645809173583984, "global_step": 208581, "epoch": 1723} {"train_loss": -40.70632553100586, "global_step": 208582, "epoch": 1723} {"train_loss": -40.05739212036133, "global_step": 208583, "epoch": 1723} {"train_loss": -39.60655212402344, "global_step": 208584, "epoch": 1723} {"train_loss": -41.17437744140625, "global_step": 208585, "epoch": 1723} {"train_loss": -41.03548812866211, "global_step": 208586, "epoch": 1723} {"train_loss": -40.51195526123047, "global_step": 208587, "epoch": 1723} {"train_loss": -40.8761100769043, "global_step": 208588, "epoch": 1723} {"train_loss": -40.590919494628906, "global_step": 208589, "epoch": 1723} {"train_loss": -41.033565521240234, "global_step": 208590, "epoch": 1723} {"train_loss": -41.13956832885742, "global_step": 208591, "epoch": 1723} {"train_loss": -42.026771545410156, "global_step": 208592, "epoch": 1723} {"train_loss": -41.588130950927734, "global_step": 208593, "epoch": 1723} {"train_loss": -41.11246109008789, "global_step": 208594, "epoch": 1723} {"train_loss": -41.886268615722656, "global_step": 208595, "epoch": 1723} {"train_loss": -41.38172149658203, "global_step": 208596, "epoch": 1723} {"train_loss": -40.87057876586914, "global_step": 208597, "epoch": 1723} {"train_loss": -41.014835357666016, "global_step": 208598, "epoch": 1723} {"train_loss": -41.65519714355469, "global_step": 208599, "epoch": 1723} {"train_loss": -41.58338165283203, "global_step": 208600, "epoch": 1723} {"train_loss": -41.170265197753906, "global_step": 208601, "epoch": 1723} {"train_loss": -41.66536331176758, "global_step": 208602, "epoch": 1723} {"train_loss": -39.47259212525423, "global_step": 208603, "epoch": 1723, "val_loss": 2624087.5} {"train_loss": -41.81513595581055, "global_step": 208604, "epoch": 1724} {"train_loss": -41.59791946411133, "global_step": 208605, "epoch": 1724} {"train_loss": -41.42183303833008, "global_step": 208606, "epoch": 1724} {"train_loss": -42.0623893737793, "global_step": 208607, "epoch": 1724} {"train_loss": -41.752418518066406, "global_step": 208608, "epoch": 1724} {"train_loss": -41.5954704284668, "global_step": 208609, "epoch": 1724} {"train_loss": -41.63422775268555, "global_step": 208610, "epoch": 1724} {"train_loss": -41.80752182006836, "global_step": 208611, "epoch": 1724} {"train_loss": -41.949127197265625, "global_step": 208612, "epoch": 1724} {"train_loss": -42.011817932128906, "global_step": 208613, "epoch": 1724} {"train_loss": -42.272071838378906, "global_step": 208614, "epoch": 1724} {"train_loss": -41.287837982177734, "global_step": 208615, "epoch": 1724} {"train_loss": -42.4401969909668, "global_step": 208616, "epoch": 1724} {"train_loss": -42.094478607177734, "global_step": 208617, "epoch": 1724} {"train_loss": -42.09077453613281, "global_step": 208618, "epoch": 1724} {"train_loss": -42.411827087402344, "global_step": 208619, "epoch": 1724} {"train_loss": -42.66598129272461, "global_step": 208620, "epoch": 1724} {"train_loss": -42.1518669128418, "global_step": 208621, "epoch": 1724} {"train_loss": -42.051963806152344, "global_step": 208622, "epoch": 1724} {"train_loss": -42.26631546020508, "global_step": 208623, "epoch": 1724} {"train_loss": -42.25010299682617, "global_step": 208624, "epoch": 1724} {"train_loss": -41.6919059753418, "global_step": 208625, "epoch": 1724} {"train_loss": -42.55864334106445, "global_step": 208626, "epoch": 1724} {"train_loss": -42.54806137084961, "global_step": 208627, "epoch": 1724} {"train_loss": -42.4359130859375, "global_step": 208628, "epoch": 1724} {"train_loss": -42.33220291137695, "global_step": 208629, "epoch": 1724} {"train_loss": -42.72948455810547, "global_step": 208630, "epoch": 1724} {"train_loss": -42.06569290161133, "global_step": 208631, "epoch": 1724} {"train_loss": -42.48663330078125, "global_step": 208632, "epoch": 1724} {"train_loss": -42.53725051879883, "global_step": 208633, "epoch": 1724} {"train_loss": -42.39680480957031, "global_step": 208634, "epoch": 1724} {"train_loss": -41.3946647644043, "global_step": 208635, "epoch": 1724} {"train_loss": -41.89265060424805, "global_step": 208636, "epoch": 1724} {"train_loss": -42.1567268371582, "global_step": 208637, "epoch": 1724} {"train_loss": -41.0210075378418, "global_step": 208638, "epoch": 1724} {"train_loss": -41.195125579833984, "global_step": 208639, "epoch": 1724} {"train_loss": -41.86796951293945, "global_step": 208640, "epoch": 1724} {"train_loss": -42.11376953125, "global_step": 208641, "epoch": 1724} {"train_loss": -39.5972900390625, "global_step": 208642, "epoch": 1724} {"train_loss": -36.61221694946289, "global_step": 208643, "epoch": 1724} {"train_loss": -34.12540817260742, "global_step": 208644, "epoch": 1724} {"train_loss": -28.063940048217773, "global_step": 208645, "epoch": 1724} {"train_loss": -24.106521606445312, "global_step": 208646, "epoch": 1724} {"train_loss": -27.290449142456055, "global_step": 208647, "epoch": 1724} {"train_loss": -36.91561508178711, "global_step": 208648, "epoch": 1724} {"train_loss": -35.06032943725586, "global_step": 208649, "epoch": 1724} {"train_loss": -26.8143253326416, "global_step": 208650, "epoch": 1724} {"train_loss": -31.77015495300293, "global_step": 208651, "epoch": 1724} {"train_loss": -37.93050765991211, "global_step": 208652, "epoch": 1724} {"train_loss": -33.7357177734375, "global_step": 208653, "epoch": 1724} {"train_loss": -35.431175231933594, "global_step": 208654, "epoch": 1724} {"train_loss": -34.83293533325195, "global_step": 208655, "epoch": 1724} {"train_loss": -39.0561637878418, "global_step": 208656, "epoch": 1724} {"train_loss": -37.652442932128906, "global_step": 208657, "epoch": 1724} {"train_loss": -39.26632308959961, "global_step": 208658, "epoch": 1724} {"train_loss": -38.01276779174805, "global_step": 208659, "epoch": 1724} {"train_loss": -39.02329635620117, "global_step": 208660, "epoch": 1724} {"train_loss": -39.76923751831055, "global_step": 208661, "epoch": 1724} {"train_loss": -39.47377395629883, "global_step": 208662, "epoch": 1724} {"train_loss": -40.694549560546875, "global_step": 208663, "epoch": 1724} {"train_loss": -39.84505844116211, "global_step": 208664, "epoch": 1724} {"train_loss": -40.02663803100586, "global_step": 208665, "epoch": 1724} {"train_loss": -39.58073043823242, "global_step": 208666, "epoch": 1724} {"train_loss": -39.27385330200195, "global_step": 208667, "epoch": 1724} {"train_loss": -39.56547164916992, "global_step": 208668, "epoch": 1724} {"train_loss": -40.424312591552734, "global_step": 208669, "epoch": 1724} {"train_loss": -39.336334228515625, "global_step": 208670, "epoch": 1724} {"train_loss": -40.7577018737793, "global_step": 208671, "epoch": 1724} {"train_loss": -39.478092193603516, "global_step": 208672, "epoch": 1724} {"train_loss": -40.55219268798828, "global_step": 208673, "epoch": 1724} {"train_loss": -41.10273361206055, "global_step": 208674, "epoch": 1724} {"train_loss": -40.31535720825195, "global_step": 208675, "epoch": 1724} {"train_loss": -40.56180953979492, "global_step": 208676, "epoch": 1724} {"train_loss": -40.90729904174805, "global_step": 208677, "epoch": 1724} {"train_loss": -40.77253723144531, "global_step": 208678, "epoch": 1724} {"train_loss": -40.8154411315918, "global_step": 208679, "epoch": 1724} {"train_loss": -41.037811279296875, "global_step": 208680, "epoch": 1724} {"train_loss": -40.60951614379883, "global_step": 208681, "epoch": 1724} {"train_loss": -41.06511306762695, "global_step": 208682, "epoch": 1724} {"train_loss": -41.69792175292969, "global_step": 208683, "epoch": 1724} {"train_loss": -41.804134368896484, "global_step": 208684, "epoch": 1724} {"train_loss": -41.442623138427734, "global_step": 208685, "epoch": 1724} {"train_loss": -41.183258056640625, "global_step": 208686, "epoch": 1724} {"train_loss": -40.8885383605957, "global_step": 208687, "epoch": 1724} {"train_loss": -41.33763885498047, "global_step": 208688, "epoch": 1724} {"train_loss": -41.440704345703125, "global_step": 208689, "epoch": 1724} {"train_loss": -41.68764114379883, "global_step": 208690, "epoch": 1724} {"train_loss": -41.426063537597656, "global_step": 208691, "epoch": 1724} {"train_loss": -41.42425537109375, "global_step": 208692, "epoch": 1724} {"train_loss": -41.503787994384766, "global_step": 208693, "epoch": 1724} {"train_loss": -41.737667083740234, "global_step": 208694, "epoch": 1724} {"train_loss": -41.534488677978516, "global_step": 208695, "epoch": 1724} {"train_loss": -41.60939025878906, "global_step": 208696, "epoch": 1724} {"train_loss": -41.17359161376953, "global_step": 208697, "epoch": 1724} {"train_loss": -42.020084381103516, "global_step": 208698, "epoch": 1724} {"train_loss": -41.42824172973633, "global_step": 208699, "epoch": 1724} {"train_loss": -41.717926025390625, "global_step": 208700, "epoch": 1724} {"train_loss": -41.37641525268555, "global_step": 208701, "epoch": 1724} {"train_loss": -41.528987884521484, "global_step": 208702, "epoch": 1724} {"train_loss": -41.670101165771484, "global_step": 208703, "epoch": 1724} {"train_loss": -42.136512756347656, "global_step": 208704, "epoch": 1724} {"train_loss": -41.699501037597656, "global_step": 208705, "epoch": 1724} {"train_loss": -41.7479362487793, "global_step": 208706, "epoch": 1724} {"train_loss": -42.06188201904297, "global_step": 208707, "epoch": 1724} {"train_loss": -41.7951545715332, "global_step": 208708, "epoch": 1724} {"train_loss": -42.041297912597656, "global_step": 208709, "epoch": 1724} {"train_loss": -41.974029541015625, "global_step": 208710, "epoch": 1724} {"train_loss": -42.0012321472168, "global_step": 208711, "epoch": 1724} {"train_loss": -42.26487350463867, "global_step": 208712, "epoch": 1724} {"train_loss": -42.37453842163086, "global_step": 208713, "epoch": 1724} {"train_loss": -42.12783432006836, "global_step": 208714, "epoch": 1724} {"train_loss": -42.28913497924805, "global_step": 208715, "epoch": 1724} {"train_loss": -42.30538558959961, "global_step": 208716, "epoch": 1724} {"train_loss": -42.77851104736328, "global_step": 208717, "epoch": 1724} {"train_loss": -41.95994186401367, "global_step": 208718, "epoch": 1724} {"train_loss": -42.015987396240234, "global_step": 208719, "epoch": 1724} {"train_loss": -42.520912170410156, "global_step": 208720, "epoch": 1724} {"train_loss": -42.01082992553711, "global_step": 208721, "epoch": 1724} {"train_loss": -42.525054931640625, "global_step": 208722, "epoch": 1724} {"train_loss": -42.62447738647461, "global_step": 208723, "epoch": 1724} {"train_loss": -40.45935692274866, "global_step": 208724, "epoch": 1724, "val_loss": 2625847.25} {"train_loss": -42.69929122924805, "global_step": 208725, "epoch": 1725} {"train_loss": -42.603179931640625, "global_step": 208726, "epoch": 1725} {"train_loss": -42.59662628173828, "global_step": 208727, "epoch": 1725} {"train_loss": -42.94328689575195, "global_step": 208728, "epoch": 1725} {"train_loss": -42.63228225708008, "global_step": 208729, "epoch": 1725} {"train_loss": -42.178749084472656, "global_step": 208730, "epoch": 1725} {"train_loss": -42.21151351928711, "global_step": 208731, "epoch": 1725} {"train_loss": -41.01642990112305, "global_step": 208732, "epoch": 1725} {"train_loss": -42.47599411010742, "global_step": 208733, "epoch": 1725} {"train_loss": -42.663429260253906, "global_step": 208734, "epoch": 1725} {"train_loss": -42.68164825439453, "global_step": 208735, "epoch": 1725} {"train_loss": -42.54950714111328, "global_step": 208736, "epoch": 1725} {"train_loss": -42.93425369262695, "global_step": 208737, "epoch": 1725} {"train_loss": -42.94252395629883, "global_step": 208738, "epoch": 1725} {"train_loss": -42.8087272644043, "global_step": 208739, "epoch": 1725} {"train_loss": -43.0164909362793, "global_step": 208740, "epoch": 1725} {"train_loss": -42.717159271240234, "global_step": 208741, "epoch": 1725} {"train_loss": -42.632080078125, "global_step": 208742, "epoch": 1725} {"train_loss": -42.74137496948242, "global_step": 208743, "epoch": 1725} {"train_loss": -43.06809616088867, "global_step": 208744, "epoch": 1725} {"train_loss": -42.804073333740234, "global_step": 208745, "epoch": 1725} {"train_loss": -43.09043502807617, "global_step": 208746, "epoch": 1725} {"train_loss": -43.02363967895508, "global_step": 208747, "epoch": 1725} {"train_loss": -42.81978988647461, "global_step": 208748, "epoch": 1725} {"train_loss": -43.21612548828125, "global_step": 208749, "epoch": 1725} {"train_loss": -43.37697982788086, "global_step": 208750, "epoch": 1725} {"train_loss": -43.230934143066406, "global_step": 208751, "epoch": 1725} {"train_loss": -43.191463470458984, "global_step": 208752, "epoch": 1725} {"train_loss": -43.18333053588867, "global_step": 208753, "epoch": 1725} {"train_loss": -42.54594802856445, "global_step": 208754, "epoch": 1725} {"train_loss": -42.73188018798828, "global_step": 208755, "epoch": 1725} {"train_loss": -43.446739196777344, "global_step": 208756, "epoch": 1725} {"train_loss": -42.919776916503906, "global_step": 208757, "epoch": 1725} {"train_loss": -42.69026565551758, "global_step": 208758, "epoch": 1725} {"train_loss": -42.78771209716797, "global_step": 208759, "epoch": 1725} {"train_loss": -42.3863639831543, "global_step": 208760, "epoch": 1725} {"train_loss": -42.75409698486328, "global_step": 208761, "epoch": 1725} {"train_loss": -43.24495315551758, "global_step": 208762, "epoch": 1725} {"train_loss": -42.76750564575195, "global_step": 208763, "epoch": 1725} {"train_loss": -42.791709899902344, "global_step": 208764, "epoch": 1725} {"train_loss": -42.790096282958984, "global_step": 208765, "epoch": 1725} {"train_loss": -42.73789596557617, "global_step": 208766, "epoch": 1725} {"train_loss": -42.4075927734375, "global_step": 208767, "epoch": 1725} {"train_loss": -42.857418060302734, "global_step": 208768, "epoch": 1725} {"train_loss": -41.20162582397461, "global_step": 208769, "epoch": 1725} {"train_loss": -39.9492073059082, "global_step": 208770, "epoch": 1725} {"train_loss": -39.22051239013672, "global_step": 208771, "epoch": 1725} {"train_loss": -38.89777374267578, "global_step": 208772, "epoch": 1725} {"train_loss": -41.37348937988281, "global_step": 208773, "epoch": 1725} {"train_loss": -42.83137893676758, "global_step": 208774, "epoch": 1725} {"train_loss": -38.205230712890625, "global_step": 208775, "epoch": 1725} {"train_loss": -28.13331413269043, "global_step": 208776, "epoch": 1725} {"train_loss": -24.819623947143555, "global_step": 208777, "epoch": 1725} {"train_loss": -34.16250228881836, "global_step": 208778, "epoch": 1725} {"train_loss": -37.4640007019043, "global_step": 208779, "epoch": 1725} {"train_loss": -34.55054473876953, "global_step": 208780, "epoch": 1725} {"train_loss": -35.28264617919922, "global_step": 208781, "epoch": 1725} {"train_loss": -34.701812744140625, "global_step": 208782, "epoch": 1725} {"train_loss": -32.43253707885742, "global_step": 208783, "epoch": 1725} {"train_loss": -38.58382034301758, "global_step": 208784, "epoch": 1725} {"train_loss": -35.51625442504883, "global_step": 208785, "epoch": 1725} {"train_loss": -37.71368408203125, "global_step": 208786, "epoch": 1725} {"train_loss": -37.284549713134766, "global_step": 208787, "epoch": 1725} {"train_loss": -39.56089401245117, "global_step": 208788, "epoch": 1725} {"train_loss": -38.67806625366211, "global_step": 208789, "epoch": 1725} {"train_loss": -39.640438079833984, "global_step": 208790, "epoch": 1725} {"train_loss": -39.0823974609375, "global_step": 208791, "epoch": 1725} {"train_loss": -38.06308364868164, "global_step": 208792, "epoch": 1725} {"train_loss": -40.59019088745117, "global_step": 208793, "epoch": 1725} {"train_loss": -39.14061737060547, "global_step": 208794, "epoch": 1725} {"train_loss": -38.30021286010742, "global_step": 208795, "epoch": 1725} {"train_loss": -38.27311325073242, "global_step": 208796, "epoch": 1725} {"train_loss": -39.20661544799805, "global_step": 208797, "epoch": 1725} {"train_loss": -40.193946838378906, "global_step": 208798, "epoch": 1725} {"train_loss": -40.6922607421875, "global_step": 208799, "epoch": 1725} {"train_loss": -39.764156341552734, "global_step": 208800, "epoch": 1725} {"train_loss": -40.22352600097656, "global_step": 208801, "epoch": 1725} {"train_loss": -40.40716552734375, "global_step": 208802, "epoch": 1725} {"train_loss": -39.7872314453125, "global_step": 208803, "epoch": 1725} {"train_loss": -34.884883880615234, "global_step": 208804, "epoch": 1725} {"train_loss": -37.55491256713867, "global_step": 208805, "epoch": 1725} {"train_loss": -39.52203369140625, "global_step": 208806, "epoch": 1725} {"train_loss": -37.828399658203125, "global_step": 208807, "epoch": 1725} {"train_loss": -37.63767623901367, "global_step": 208808, "epoch": 1725} {"train_loss": -38.37575912475586, "global_step": 208809, "epoch": 1725} {"train_loss": -36.55698776245117, "global_step": 208810, "epoch": 1725} {"train_loss": -36.818294525146484, "global_step": 208811, "epoch": 1725} {"train_loss": -34.00776290893555, "global_step": 208812, "epoch": 1725} {"train_loss": -26.823144912719727, "global_step": 208813, "epoch": 1725} {"train_loss": -38.616310119628906, "global_step": 208814, "epoch": 1725} {"train_loss": -38.51365280151367, "global_step": 208815, "epoch": 1725} {"train_loss": -34.6304931640625, "global_step": 208816, "epoch": 1725} {"train_loss": -40.16641616821289, "global_step": 208817, "epoch": 1725} {"train_loss": -40.16231918334961, "global_step": 208818, "epoch": 1725} {"train_loss": -38.37754440307617, "global_step": 208819, "epoch": 1725} {"train_loss": -36.58488845825195, "global_step": 208820, "epoch": 1725} {"train_loss": -37.71043014526367, "global_step": 208821, "epoch": 1725} {"train_loss": -38.88843536376953, "global_step": 208822, "epoch": 1725} {"train_loss": -39.73037338256836, "global_step": 208823, "epoch": 1725} {"train_loss": -36.768470764160156, "global_step": 208824, "epoch": 1725} {"train_loss": -38.66727066040039, "global_step": 208825, "epoch": 1725} {"train_loss": -40.33138656616211, "global_step": 208826, "epoch": 1725} {"train_loss": -36.899559020996094, "global_step": 208827, "epoch": 1725} {"train_loss": -39.781837463378906, "global_step": 208828, "epoch": 1725} {"train_loss": -39.80885696411133, "global_step": 208829, "epoch": 1725} {"train_loss": -39.55265808105469, "global_step": 208830, "epoch": 1725} {"train_loss": -38.672935485839844, "global_step": 208831, "epoch": 1725} {"train_loss": -39.760169982910156, "global_step": 208832, "epoch": 1725} {"train_loss": -36.91200637817383, "global_step": 208833, "epoch": 1725} {"train_loss": -40.05196762084961, "global_step": 208834, "epoch": 1725} {"train_loss": -39.703895568847656, "global_step": 208835, "epoch": 1725} {"train_loss": -40.22669219970703, "global_step": 208836, "epoch": 1725} {"train_loss": -34.13216781616211, "global_step": 208837, "epoch": 1725} {"train_loss": -37.33417510986328, "global_step": 208838, "epoch": 1725} {"train_loss": -39.76460647583008, "global_step": 208839, "epoch": 1725} {"train_loss": -39.054603576660156, "global_step": 208840, "epoch": 1725} {"train_loss": -39.49113464355469, "global_step": 208841, "epoch": 1725} {"train_loss": -39.73398971557617, "global_step": 208842, "epoch": 1725} {"train_loss": -39.830360412597656, "global_step": 208843, "epoch": 1725} {"train_loss": -40.01484298706055, "global_step": 208844, "epoch": 1725} {"train_loss": -39.723234554952825, "global_step": 208845, "epoch": 1725, "val_loss": 3087577.75} {"train_loss": -40.97005844116211, "global_step": 208846, "epoch": 1726} {"train_loss": -40.57693099975586, "global_step": 208847, "epoch": 1726} {"train_loss": -40.394203186035156, "global_step": 208848, "epoch": 1726} {"train_loss": -40.925537109375, "global_step": 208849, "epoch": 1726} {"train_loss": -40.08794021606445, "global_step": 208850, "epoch": 1726} {"train_loss": -38.24299621582031, "global_step": 208851, "epoch": 1726} {"train_loss": -39.595638275146484, "global_step": 208852, "epoch": 1726} {"train_loss": -39.15876388549805, "global_step": 208853, "epoch": 1726} {"train_loss": -40.03403854370117, "global_step": 208854, "epoch": 1726} {"train_loss": -40.66884994506836, "global_step": 208855, "epoch": 1726} {"train_loss": -40.1038703918457, "global_step": 208856, "epoch": 1726} {"train_loss": -40.92335510253906, "global_step": 208857, "epoch": 1726} {"train_loss": -40.28040313720703, "global_step": 208858, "epoch": 1726} {"train_loss": -41.31317138671875, "global_step": 208859, "epoch": 1726} {"train_loss": -41.23591995239258, "global_step": 208860, "epoch": 1726} {"train_loss": -40.75531005859375, "global_step": 208861, "epoch": 1726} {"train_loss": -40.886817932128906, "global_step": 208862, "epoch": 1726} {"train_loss": -40.9244499206543, "global_step": 208863, "epoch": 1726} {"train_loss": -40.384151458740234, "global_step": 208864, "epoch": 1726} {"train_loss": -40.623260498046875, "global_step": 208865, "epoch": 1726} {"train_loss": -40.22270965576172, "global_step": 208866, "epoch": 1726} {"train_loss": -40.85700607299805, "global_step": 208867, "epoch": 1726} {"train_loss": -40.56398391723633, "global_step": 208868, "epoch": 1726} {"train_loss": -41.195587158203125, "global_step": 208869, "epoch": 1726} {"train_loss": -40.925235748291016, "global_step": 208870, "epoch": 1726} {"train_loss": -40.670833587646484, "global_step": 208871, "epoch": 1726} {"train_loss": -41.33024215698242, "global_step": 208872, "epoch": 1726} {"train_loss": -40.49925231933594, "global_step": 208873, "epoch": 1726} {"train_loss": -40.733882904052734, "global_step": 208874, "epoch": 1726} {"train_loss": -41.700565338134766, "global_step": 208875, "epoch": 1726} {"train_loss": -41.295135498046875, "global_step": 208876, "epoch": 1726} {"train_loss": -41.06148147583008, "global_step": 208877, "epoch": 1726} {"train_loss": -41.159423828125, "global_step": 208878, "epoch": 1726} {"train_loss": -40.8057975769043, "global_step": 208879, "epoch": 1726} {"train_loss": -41.707454681396484, "global_step": 208880, "epoch": 1726} {"train_loss": -41.896419525146484, "global_step": 208881, "epoch": 1726} {"train_loss": -40.75557327270508, "global_step": 208882, "epoch": 1726} {"train_loss": -41.5665397644043, "global_step": 208883, "epoch": 1726} {"train_loss": -41.89708709716797, "global_step": 208884, "epoch": 1726} {"train_loss": -40.73755645751953, "global_step": 208885, "epoch": 1726} {"train_loss": -42.18446731567383, "global_step": 208886, "epoch": 1726} {"train_loss": -41.77718734741211, "global_step": 208887, "epoch": 1726} {"train_loss": -40.90639114379883, "global_step": 208888, "epoch": 1726} {"train_loss": -40.92859649658203, "global_step": 208889, "epoch": 1726} {"train_loss": -41.11345291137695, "global_step": 208890, "epoch": 1726} {"train_loss": -41.41737747192383, "global_step": 208891, "epoch": 1726} {"train_loss": -41.47501754760742, "global_step": 208892, "epoch": 1726} {"train_loss": -41.73002243041992, "global_step": 208893, "epoch": 1726} {"train_loss": -41.89467239379883, "global_step": 208894, "epoch": 1726} {"train_loss": -41.94465255737305, "global_step": 208895, "epoch": 1726} {"train_loss": -41.20148849487305, "global_step": 208896, "epoch": 1726} {"train_loss": -41.77241134643555, "global_step": 208897, "epoch": 1726} {"train_loss": -42.45497512817383, "global_step": 208898, "epoch": 1726} {"train_loss": -42.22669219970703, "global_step": 208899, "epoch": 1726} {"train_loss": -42.447566986083984, "global_step": 208900, "epoch": 1726} {"train_loss": -41.731868743896484, "global_step": 208901, "epoch": 1726} {"train_loss": -41.75809860229492, "global_step": 208902, "epoch": 1726} {"train_loss": -42.12308883666992, "global_step": 208903, "epoch": 1726} {"train_loss": -41.907772064208984, "global_step": 208904, "epoch": 1726} {"train_loss": -41.082069396972656, "global_step": 208905, "epoch": 1726} {"train_loss": -41.5368766784668, "global_step": 208906, "epoch": 1726} {"train_loss": -41.76154327392578, "global_step": 208907, "epoch": 1726} {"train_loss": -42.332984924316406, "global_step": 208908, "epoch": 1726} {"train_loss": -41.87630081176758, "global_step": 208909, "epoch": 1726} {"train_loss": -41.487422943115234, "global_step": 208910, "epoch": 1726} {"train_loss": -41.38086700439453, "global_step": 208911, "epoch": 1726} {"train_loss": -41.96931076049805, "global_step": 208912, "epoch": 1726} {"train_loss": -41.776527404785156, "global_step": 208913, "epoch": 1726} {"train_loss": -41.97956466674805, "global_step": 208914, "epoch": 1726} {"train_loss": -41.604793548583984, "global_step": 208915, "epoch": 1726} {"train_loss": -42.14746856689453, "global_step": 208916, "epoch": 1726} {"train_loss": -40.61507034301758, "global_step": 208917, "epoch": 1726} {"train_loss": -41.47332763671875, "global_step": 208918, "epoch": 1726} {"train_loss": -41.61231231689453, "global_step": 208919, "epoch": 1726} {"train_loss": -42.1879997253418, "global_step": 208920, "epoch": 1726} {"train_loss": -42.185489654541016, "global_step": 208921, "epoch": 1726} {"train_loss": -42.08502197265625, "global_step": 208922, "epoch": 1726} {"train_loss": -42.1494255065918, "global_step": 208923, "epoch": 1726} {"train_loss": -41.7411994934082, "global_step": 208924, "epoch": 1726} {"train_loss": -41.05159378051758, "global_step": 208925, "epoch": 1726} {"train_loss": -41.01173782348633, "global_step": 208926, "epoch": 1726} {"train_loss": -40.897674560546875, "global_step": 208927, "epoch": 1726} {"train_loss": -41.632537841796875, "global_step": 208928, "epoch": 1726} {"train_loss": -41.77944564819336, "global_step": 208929, "epoch": 1726} {"train_loss": -42.00802993774414, "global_step": 208930, "epoch": 1726} {"train_loss": -41.753448486328125, "global_step": 208931, "epoch": 1726} {"train_loss": -42.75019836425781, "global_step": 208932, "epoch": 1726} {"train_loss": -41.00063705444336, "global_step": 208933, "epoch": 1726} {"train_loss": -42.578857421875, "global_step": 208934, "epoch": 1726} {"train_loss": -41.63862228393555, "global_step": 208935, "epoch": 1726} {"train_loss": -41.56846237182617, "global_step": 208936, "epoch": 1726} {"train_loss": -40.48198699951172, "global_step": 208937, "epoch": 1726} {"train_loss": -41.580657958984375, "global_step": 208938, "epoch": 1726} {"train_loss": -41.9072151184082, "global_step": 208939, "epoch": 1726} {"train_loss": -40.894996643066406, "global_step": 208940, "epoch": 1726} {"train_loss": -41.496944427490234, "global_step": 208941, "epoch": 1726} {"train_loss": -42.07014083862305, "global_step": 208942, "epoch": 1726} {"train_loss": -41.44320297241211, "global_step": 208943, "epoch": 1726} {"train_loss": -40.870479583740234, "global_step": 208944, "epoch": 1726} {"train_loss": -41.68486404418945, "global_step": 208945, "epoch": 1726} {"train_loss": -41.648250579833984, "global_step": 208946, "epoch": 1726} {"train_loss": -41.35042953491211, "global_step": 208947, "epoch": 1726} {"train_loss": -41.67936706542969, "global_step": 208948, "epoch": 1726} {"train_loss": -42.021888732910156, "global_step": 208949, "epoch": 1726} {"train_loss": -41.52858352661133, "global_step": 208950, "epoch": 1726} {"train_loss": -41.84927749633789, "global_step": 208951, "epoch": 1726} {"train_loss": -42.16066360473633, "global_step": 208952, "epoch": 1726} {"train_loss": -41.870052337646484, "global_step": 208953, "epoch": 1726} {"train_loss": -42.328365325927734, "global_step": 208954, "epoch": 1726} {"train_loss": -41.93313217163086, "global_step": 208955, "epoch": 1726} {"train_loss": -42.14796829223633, "global_step": 208956, "epoch": 1726} {"train_loss": -42.01810836791992, "global_step": 208957, "epoch": 1726} {"train_loss": -42.0829963684082, "global_step": 208958, "epoch": 1726} {"train_loss": -41.127376556396484, "global_step": 208959, "epoch": 1726} {"train_loss": -41.99542999267578, "global_step": 208960, "epoch": 1726} {"train_loss": -40.64421081542969, "global_step": 208961, "epoch": 1726} {"train_loss": -40.35435104370117, "global_step": 208962, "epoch": 1726} {"train_loss": -40.541542053222656, "global_step": 208963, "epoch": 1726} {"train_loss": -41.33452224731445, "global_step": 208964, "epoch": 1726} {"train_loss": -39.08586883544922, "global_step": 208965, "epoch": 1726} {"train_loss": -41.32083773021856, "global_step": 208966, "epoch": 1726, "val_loss": 2664175.75} {"train_loss": -34.480831146240234, "global_step": 208967, "epoch": 1727} {"train_loss": -20.26716423034668, "global_step": 208968, "epoch": 1727} {"train_loss": -39.40205764770508, "global_step": 208969, "epoch": 1727} {"train_loss": -30.761632919311523, "global_step": 208970, "epoch": 1727} {"train_loss": -39.37495040893555, "global_step": 208971, "epoch": 1727} {"train_loss": -34.16829299926758, "global_step": 208972, "epoch": 1727} {"train_loss": -40.05818557739258, "global_step": 208973, "epoch": 1727} {"train_loss": -35.01184844970703, "global_step": 208974, "epoch": 1727} {"train_loss": -40.55547332763672, "global_step": 208975, "epoch": 1727} {"train_loss": -38.64484786987305, "global_step": 208976, "epoch": 1727} {"train_loss": -37.685665130615234, "global_step": 208977, "epoch": 1727} {"train_loss": -40.189971923828125, "global_step": 208978, "epoch": 1727} {"train_loss": -38.01581954956055, "global_step": 208979, "epoch": 1727} {"train_loss": -40.291866302490234, "global_step": 208980, "epoch": 1727} {"train_loss": -37.27564239501953, "global_step": 208981, "epoch": 1727} {"train_loss": -39.975555419921875, "global_step": 208982, "epoch": 1727} {"train_loss": -36.82442855834961, "global_step": 208983, "epoch": 1727} {"train_loss": -37.18391418457031, "global_step": 208984, "epoch": 1727} {"train_loss": -41.06825637817383, "global_step": 208985, "epoch": 1727} {"train_loss": -39.36056137084961, "global_step": 208986, "epoch": 1727} {"train_loss": -39.573829650878906, "global_step": 208987, "epoch": 1727} {"train_loss": -39.92729568481445, "global_step": 208988, "epoch": 1727} {"train_loss": -35.252159118652344, "global_step": 208989, "epoch": 1727} {"train_loss": -37.8056755065918, "global_step": 208990, "epoch": 1727} {"train_loss": -39.895809173583984, "global_step": 208991, "epoch": 1727} {"train_loss": -37.9202880859375, "global_step": 208992, "epoch": 1727} {"train_loss": -37.14286804199219, "global_step": 208993, "epoch": 1727} {"train_loss": -39.61009979248047, "global_step": 208994, "epoch": 1727} {"train_loss": -30.854248046875, "global_step": 208995, "epoch": 1727} {"train_loss": -38.323768615722656, "global_step": 208996, "epoch": 1727} {"train_loss": -38.837257385253906, "global_step": 208997, "epoch": 1727} {"train_loss": -38.07981872558594, "global_step": 208998, "epoch": 1727} {"train_loss": -38.79962158203125, "global_step": 208999, "epoch": 1727} {"train_loss": -38.43532180786133, "global_step": 209000, "epoch": 1727} {"train_loss": -40.370853424072266, "global_step": 209001, "epoch": 1727} {"train_loss": -38.340492248535156, "global_step": 209002, "epoch": 1727} {"train_loss": -37.575103759765625, "global_step": 209003, "epoch": 1727} {"train_loss": -37.403079986572266, "global_step": 209004, "epoch": 1727} {"train_loss": -38.94718551635742, "global_step": 209005, "epoch": 1727} {"train_loss": -38.8670768737793, "global_step": 209006, "epoch": 1727} {"train_loss": -38.994503021240234, "global_step": 209007, "epoch": 1727} {"train_loss": -38.96857452392578, "global_step": 209008, "epoch": 1727} {"train_loss": -40.10003662109375, "global_step": 209009, "epoch": 1727} {"train_loss": -38.40252685546875, "global_step": 209010, "epoch": 1727} {"train_loss": -40.509891510009766, "global_step": 209011, "epoch": 1727} {"train_loss": -38.54610824584961, "global_step": 209012, "epoch": 1727} {"train_loss": -40.02378463745117, "global_step": 209013, "epoch": 1727} {"train_loss": -39.62282180786133, "global_step": 209014, "epoch": 1727} {"train_loss": -38.46004104614258, "global_step": 209015, "epoch": 1727} {"train_loss": -36.80036163330078, "global_step": 209016, "epoch": 1727} {"train_loss": -38.402809143066406, "global_step": 209017, "epoch": 1727} {"train_loss": -38.739479064941406, "global_step": 209018, "epoch": 1727} {"train_loss": -40.038448333740234, "global_step": 209019, "epoch": 1727} {"train_loss": -32.180442810058594, "global_step": 209020, "epoch": 1727} {"train_loss": -37.8315544128418, "global_step": 209021, "epoch": 1727} {"train_loss": -37.44655227661133, "global_step": 209022, "epoch": 1727} {"train_loss": -38.85514831542969, "global_step": 209023, "epoch": 1727} {"train_loss": -40.49349594116211, "global_step": 209024, "epoch": 1727} {"train_loss": -39.261226654052734, "global_step": 209025, "epoch": 1727} {"train_loss": -40.33300018310547, "global_step": 209026, "epoch": 1727} {"train_loss": -38.88734817504883, "global_step": 209027, "epoch": 1727} {"train_loss": -38.74900436401367, "global_step": 209028, "epoch": 1727} {"train_loss": -36.72596740722656, "global_step": 209029, "epoch": 1727} {"train_loss": -38.536495208740234, "global_step": 209030, "epoch": 1727} {"train_loss": -38.19491958618164, "global_step": 209031, "epoch": 1727} {"train_loss": -39.323299407958984, "global_step": 209032, "epoch": 1727} {"train_loss": -39.87889099121094, "global_step": 209033, "epoch": 1727} {"train_loss": -39.826026916503906, "global_step": 209034, "epoch": 1727} {"train_loss": -39.194129943847656, "global_step": 209035, "epoch": 1727} {"train_loss": -39.831214904785156, "global_step": 209036, "epoch": 1727} {"train_loss": -39.74536895751953, "global_step": 209037, "epoch": 1727} {"train_loss": -39.2870979309082, "global_step": 209038, "epoch": 1727} {"train_loss": -37.94390869140625, "global_step": 209039, "epoch": 1727} {"train_loss": -40.053104400634766, "global_step": 209040, "epoch": 1727} {"train_loss": -37.83970260620117, "global_step": 209041, "epoch": 1727} {"train_loss": -40.681976318359375, "global_step": 209042, "epoch": 1727} {"train_loss": -40.10941696166992, "global_step": 209043, "epoch": 1727} {"train_loss": -39.57117462158203, "global_step": 209044, "epoch": 1727} {"train_loss": -39.66545867919922, "global_step": 209045, "epoch": 1727} {"train_loss": -39.921810150146484, "global_step": 209046, "epoch": 1727} {"train_loss": -40.14408493041992, "global_step": 209047, "epoch": 1727} {"train_loss": -39.8599739074707, "global_step": 209048, "epoch": 1727} {"train_loss": -39.426448822021484, "global_step": 209049, "epoch": 1727} {"train_loss": -39.561397552490234, "global_step": 209050, "epoch": 1727} {"train_loss": -39.939308166503906, "global_step": 209051, "epoch": 1727} {"train_loss": -40.63003921508789, "global_step": 209052, "epoch": 1727} {"train_loss": -40.911643981933594, "global_step": 209053, "epoch": 1727} {"train_loss": -40.83559036254883, "global_step": 209054, "epoch": 1727} {"train_loss": -40.52375030517578, "global_step": 209055, "epoch": 1727} {"train_loss": -40.143775939941406, "global_step": 209056, "epoch": 1727} {"train_loss": -40.98969268798828, "global_step": 209057, "epoch": 1727} {"train_loss": -38.61518478393555, "global_step": 209058, "epoch": 1727} {"train_loss": -40.067691802978516, "global_step": 209059, "epoch": 1727} {"train_loss": -39.76118850708008, "global_step": 209060, "epoch": 1727} {"train_loss": -41.12815856933594, "global_step": 209061, "epoch": 1727} {"train_loss": -40.8072509765625, "global_step": 209062, "epoch": 1727} {"train_loss": -40.40034866333008, "global_step": 209063, "epoch": 1727} {"train_loss": -40.26502227783203, "global_step": 209064, "epoch": 1727} {"train_loss": -39.68134307861328, "global_step": 209065, "epoch": 1727} {"train_loss": -40.4528694152832, "global_step": 209066, "epoch": 1727} {"train_loss": -40.14049530029297, "global_step": 209067, "epoch": 1727} {"train_loss": -41.52289581298828, "global_step": 209068, "epoch": 1727} {"train_loss": -40.20259475708008, "global_step": 209069, "epoch": 1727} {"train_loss": -41.13826370239258, "global_step": 209070, "epoch": 1727} {"train_loss": -41.35580062866211, "global_step": 209071, "epoch": 1727} {"train_loss": -39.729034423828125, "global_step": 209072, "epoch": 1727} {"train_loss": -40.684478759765625, "global_step": 209073, "epoch": 1727} {"train_loss": -41.05963134765625, "global_step": 209074, "epoch": 1727} {"train_loss": -41.671512603759766, "global_step": 209075, "epoch": 1727} {"train_loss": -41.48290252685547, "global_step": 209076, "epoch": 1727} {"train_loss": -41.33711624145508, "global_step": 209077, "epoch": 1727} {"train_loss": -41.8541259765625, "global_step": 209078, "epoch": 1727} {"train_loss": -41.191524505615234, "global_step": 209079, "epoch": 1727} {"train_loss": -41.0943603515625, "global_step": 209080, "epoch": 1727} {"train_loss": -39.981285095214844, "global_step": 209081, "epoch": 1727} {"train_loss": -41.54081344604492, "global_step": 209082, "epoch": 1727} {"train_loss": -41.23104476928711, "global_step": 209083, "epoch": 1727} {"train_loss": -41.403602600097656, "global_step": 209084, "epoch": 1727} {"train_loss": -42.2780647277832, "global_step": 209085, "epoch": 1727} {"train_loss": -41.51270294189453, "global_step": 209086, "epoch": 1727} {"train_loss": -39.07286065472059, "global_step": 209087, "epoch": 1727, "val_loss": 2692747.0} {"train_loss": -41.293277740478516, "global_step": 209088, "epoch": 1728} {"train_loss": -42.1400260925293, "global_step": 209089, "epoch": 1728} {"train_loss": -41.150909423828125, "global_step": 209090, "epoch": 1728} {"train_loss": -41.657344818115234, "global_step": 209091, "epoch": 1728} {"train_loss": -41.74684524536133, "global_step": 209092, "epoch": 1728} {"train_loss": -41.762939453125, "global_step": 209093, "epoch": 1728} {"train_loss": -41.46565628051758, "global_step": 209094, "epoch": 1728} {"train_loss": -42.078025817871094, "global_step": 209095, "epoch": 1728} {"train_loss": -41.226219177246094, "global_step": 209096, "epoch": 1728} {"train_loss": -41.145591735839844, "global_step": 209097, "epoch": 1728} {"train_loss": -41.808143615722656, "global_step": 209098, "epoch": 1728} {"train_loss": -42.142330169677734, "global_step": 209099, "epoch": 1728} {"train_loss": -42.24215316772461, "global_step": 209100, "epoch": 1728} {"train_loss": -41.264732360839844, "global_step": 209101, "epoch": 1728} {"train_loss": -41.151241302490234, "global_step": 209102, "epoch": 1728} {"train_loss": -41.91746520996094, "global_step": 209103, "epoch": 1728} {"train_loss": -41.863338470458984, "global_step": 209104, "epoch": 1728} {"train_loss": -42.34511184692383, "global_step": 209105, "epoch": 1728} {"train_loss": -41.870086669921875, "global_step": 209106, "epoch": 1728} {"train_loss": -41.150978088378906, "global_step": 209107, "epoch": 1728} {"train_loss": -41.668914794921875, "global_step": 209108, "epoch": 1728} {"train_loss": -42.563819885253906, "global_step": 209109, "epoch": 1728} {"train_loss": -41.842159271240234, "global_step": 209110, "epoch": 1728} {"train_loss": -39.493099212646484, "global_step": 209111, "epoch": 1728} {"train_loss": -37.30214309692383, "global_step": 209112, "epoch": 1728} {"train_loss": -39.33027648925781, "global_step": 209113, "epoch": 1728} {"train_loss": -42.01837921142578, "global_step": 209114, "epoch": 1728} {"train_loss": -41.052921295166016, "global_step": 209115, "epoch": 1728} {"train_loss": -38.41372299194336, "global_step": 209116, "epoch": 1728} {"train_loss": -38.06878662109375, "global_step": 209117, "epoch": 1728} {"train_loss": -39.59176254272461, "global_step": 209118, "epoch": 1728} {"train_loss": -41.0140380859375, "global_step": 209119, "epoch": 1728} {"train_loss": -38.06937026977539, "global_step": 209120, "epoch": 1728} {"train_loss": -35.545013427734375, "global_step": 209121, "epoch": 1728} {"train_loss": -39.75492858886719, "global_step": 209122, "epoch": 1728} {"train_loss": -39.000267028808594, "global_step": 209123, "epoch": 1728} {"train_loss": -39.40827560424805, "global_step": 209124, "epoch": 1728} {"train_loss": -40.91538619995117, "global_step": 209125, "epoch": 1728} {"train_loss": -40.161434173583984, "global_step": 209126, "epoch": 1728} {"train_loss": -41.01675033569336, "global_step": 209127, "epoch": 1728} {"train_loss": -37.40397262573242, "global_step": 209128, "epoch": 1728} {"train_loss": -38.193302154541016, "global_step": 209129, "epoch": 1728} {"train_loss": -41.40482711791992, "global_step": 209130, "epoch": 1728} {"train_loss": -40.53513717651367, "global_step": 209131, "epoch": 1728} {"train_loss": -41.25010299682617, "global_step": 209132, "epoch": 1728} {"train_loss": -41.30489730834961, "global_step": 209133, "epoch": 1728} {"train_loss": -41.167083740234375, "global_step": 209134, "epoch": 1728} {"train_loss": -41.180763244628906, "global_step": 209135, "epoch": 1728} {"train_loss": -41.03369140625, "global_step": 209136, "epoch": 1728} {"train_loss": -41.62610626220703, "global_step": 209137, "epoch": 1728} {"train_loss": -40.711055755615234, "global_step": 209138, "epoch": 1728} {"train_loss": -41.893550872802734, "global_step": 209139, "epoch": 1728} {"train_loss": -37.729183197021484, "global_step": 209140, "epoch": 1728} {"train_loss": -41.28974151611328, "global_step": 209141, "epoch": 1728} {"train_loss": -41.33406066894531, "global_step": 209142, "epoch": 1728} {"train_loss": -41.0035285949707, "global_step": 209143, "epoch": 1728} {"train_loss": -40.9503288269043, "global_step": 209144, "epoch": 1728} {"train_loss": -41.523006439208984, "global_step": 209145, "epoch": 1728} {"train_loss": -41.779685974121094, "global_step": 209146, "epoch": 1728} {"train_loss": -41.85206604003906, "global_step": 209147, "epoch": 1728} {"train_loss": -41.901763916015625, "global_step": 209148, "epoch": 1728} {"train_loss": -41.458194732666016, "global_step": 209149, "epoch": 1728} {"train_loss": -41.88094711303711, "global_step": 209150, "epoch": 1728} {"train_loss": -41.73627853393555, "global_step": 209151, "epoch": 1728} {"train_loss": -41.72178268432617, "global_step": 209152, "epoch": 1728} {"train_loss": -41.35401153564453, "global_step": 209153, "epoch": 1728} {"train_loss": -41.717567443847656, "global_step": 209154, "epoch": 1728} {"train_loss": -41.868709564208984, "global_step": 209155, "epoch": 1728} {"train_loss": -42.519500732421875, "global_step": 209156, "epoch": 1728} {"train_loss": -40.959651947021484, "global_step": 209157, "epoch": 1728} {"train_loss": -41.60219955444336, "global_step": 209158, "epoch": 1728} {"train_loss": -42.47001266479492, "global_step": 209159, "epoch": 1728} {"train_loss": -41.95370864868164, "global_step": 209160, "epoch": 1728} {"train_loss": -42.15644454956055, "global_step": 209161, "epoch": 1728} {"train_loss": -41.843074798583984, "global_step": 209162, "epoch": 1728} {"train_loss": -42.05000686645508, "global_step": 209163, "epoch": 1728} {"train_loss": -42.23493576049805, "global_step": 209164, "epoch": 1728} {"train_loss": -42.3198127746582, "global_step": 209165, "epoch": 1728} {"train_loss": -41.751197814941406, "global_step": 209166, "epoch": 1728} {"train_loss": -42.48651123046875, "global_step": 209167, "epoch": 1728} {"train_loss": -41.631553649902344, "global_step": 209168, "epoch": 1728} {"train_loss": -41.51605987548828, "global_step": 209169, "epoch": 1728} {"train_loss": -42.15353012084961, "global_step": 209170, "epoch": 1728} {"train_loss": -41.205379486083984, "global_step": 209171, "epoch": 1728} {"train_loss": -42.16259002685547, "global_step": 209172, "epoch": 1728} {"train_loss": -40.940956115722656, "global_step": 209173, "epoch": 1728} {"train_loss": -42.29025650024414, "global_step": 209174, "epoch": 1728} {"train_loss": -41.596248626708984, "global_step": 209175, "epoch": 1728} {"train_loss": -41.168785095214844, "global_step": 209176, "epoch": 1728} {"train_loss": -42.02532958984375, "global_step": 209177, "epoch": 1728} {"train_loss": -40.95683288574219, "global_step": 209178, "epoch": 1728} {"train_loss": -41.567848205566406, "global_step": 209179, "epoch": 1728} {"train_loss": -41.95395278930664, "global_step": 209180, "epoch": 1728} {"train_loss": -41.71857452392578, "global_step": 209181, "epoch": 1728} {"train_loss": -41.77316665649414, "global_step": 209182, "epoch": 1728} {"train_loss": -42.198585510253906, "global_step": 209183, "epoch": 1728} {"train_loss": -42.363338470458984, "global_step": 209184, "epoch": 1728} {"train_loss": -40.020198822021484, "global_step": 209185, "epoch": 1728} {"train_loss": -41.456268310546875, "global_step": 209186, "epoch": 1728} {"train_loss": -42.370365142822266, "global_step": 209187, "epoch": 1728} {"train_loss": -41.201744079589844, "global_step": 209188, "epoch": 1728} {"train_loss": -42.227760314941406, "global_step": 209189, "epoch": 1728} {"train_loss": -41.75851058959961, "global_step": 209190, "epoch": 1728} {"train_loss": -39.084049224853516, "global_step": 209191, "epoch": 1728} {"train_loss": -42.04948806762695, "global_step": 209192, "epoch": 1728} {"train_loss": -42.33008575439453, "global_step": 209193, "epoch": 1728} {"train_loss": -40.92998123168945, "global_step": 209194, "epoch": 1728} {"train_loss": -41.90289306640625, "global_step": 209195, "epoch": 1728} {"train_loss": -39.874908447265625, "global_step": 209196, "epoch": 1728} {"train_loss": -40.04088592529297, "global_step": 209197, "epoch": 1728} {"train_loss": -41.54758834838867, "global_step": 209198, "epoch": 1728} {"train_loss": -41.32186508178711, "global_step": 209199, "epoch": 1728} {"train_loss": -41.895931243896484, "global_step": 209200, "epoch": 1728} {"train_loss": -40.95106887817383, "global_step": 209201, "epoch": 1728} {"train_loss": -39.70113754272461, "global_step": 209202, "epoch": 1728} {"train_loss": -40.955074310302734, "global_step": 209203, "epoch": 1728} {"train_loss": -41.3632926940918, "global_step": 209204, "epoch": 1728} {"train_loss": -40.25814437866211, "global_step": 209205, "epoch": 1728} {"train_loss": -41.24519729614258, "global_step": 209206, "epoch": 1728} {"train_loss": -40.717647552490234, "global_step": 209207, "epoch": 1728} {"train_loss": -41.132349755153186, "global_step": 209208, "epoch": 1728, "val_loss": 2519430.25} {"train_loss": -41.2891731262207, "global_step": 209209, "epoch": 1729} {"train_loss": -40.23719024658203, "global_step": 209210, "epoch": 1729} {"train_loss": -40.992340087890625, "global_step": 209211, "epoch": 1729} {"train_loss": -37.6533317565918, "global_step": 209212, "epoch": 1729} {"train_loss": -36.69470977783203, "global_step": 209213, "epoch": 1729} {"train_loss": -39.81168746948242, "global_step": 209214, "epoch": 1729} {"train_loss": -38.350624084472656, "global_step": 209215, "epoch": 1729} {"train_loss": -40.305049896240234, "global_step": 209216, "epoch": 1729} {"train_loss": -37.13383102416992, "global_step": 209217, "epoch": 1729} {"train_loss": -38.70969772338867, "global_step": 209218, "epoch": 1729} {"train_loss": -39.31336212158203, "global_step": 209219, "epoch": 1729} {"train_loss": -30.601343154907227, "global_step": 209220, "epoch": 1729} {"train_loss": -36.99164962768555, "global_step": 209221, "epoch": 1729} {"train_loss": -40.0349235534668, "global_step": 209222, "epoch": 1729} {"train_loss": -41.20619583129883, "global_step": 209223, "epoch": 1729} {"train_loss": -38.74903869628906, "global_step": 209224, "epoch": 1729} {"train_loss": -38.46836471557617, "global_step": 209225, "epoch": 1729} {"train_loss": -40.3552360534668, "global_step": 209226, "epoch": 1729} {"train_loss": -36.690185546875, "global_step": 209227, "epoch": 1729} {"train_loss": -40.34080123901367, "global_step": 209228, "epoch": 1729} {"train_loss": -40.02888107299805, "global_step": 209229, "epoch": 1729} {"train_loss": -40.14534378051758, "global_step": 209230, "epoch": 1729} {"train_loss": -39.87130355834961, "global_step": 209231, "epoch": 1729} {"train_loss": -41.313865661621094, "global_step": 209232, "epoch": 1729} {"train_loss": -39.06248092651367, "global_step": 209233, "epoch": 1729} {"train_loss": -40.29008865356445, "global_step": 209234, "epoch": 1729} {"train_loss": -38.702308654785156, "global_step": 209235, "epoch": 1729} {"train_loss": -37.39632797241211, "global_step": 209236, "epoch": 1729} {"train_loss": -38.60942840576172, "global_step": 209237, "epoch": 1729} {"train_loss": -40.28513717651367, "global_step": 209238, "epoch": 1729} {"train_loss": -39.278602600097656, "global_step": 209239, "epoch": 1729} {"train_loss": -40.963619232177734, "global_step": 209240, "epoch": 1729} {"train_loss": -37.45363235473633, "global_step": 209241, "epoch": 1729} {"train_loss": -40.262142181396484, "global_step": 209242, "epoch": 1729} {"train_loss": -40.91285705566406, "global_step": 209243, "epoch": 1729} {"train_loss": -40.509578704833984, "global_step": 209244, "epoch": 1729} {"train_loss": -40.89775085449219, "global_step": 209245, "epoch": 1729} {"train_loss": -41.291412353515625, "global_step": 209246, "epoch": 1729} {"train_loss": -40.8653678894043, "global_step": 209247, "epoch": 1729} {"train_loss": -40.99509811401367, "global_step": 209248, "epoch": 1729} {"train_loss": -39.92494583129883, "global_step": 209249, "epoch": 1729} {"train_loss": -40.54262161254883, "global_step": 209250, "epoch": 1729} {"train_loss": -40.339820861816406, "global_step": 209251, "epoch": 1729} {"train_loss": -41.02109146118164, "global_step": 209252, "epoch": 1729} {"train_loss": -41.48148727416992, "global_step": 209253, "epoch": 1729} {"train_loss": -39.84064483642578, "global_step": 209254, "epoch": 1729} {"train_loss": -41.64512252807617, "global_step": 209255, "epoch": 1729} {"train_loss": -41.36532211303711, "global_step": 209256, "epoch": 1729} {"train_loss": -41.29641342163086, "global_step": 209257, "epoch": 1729} {"train_loss": -40.689632415771484, "global_step": 209258, "epoch": 1729} {"train_loss": -41.43207931518555, "global_step": 209259, "epoch": 1729} {"train_loss": -41.17977523803711, "global_step": 209260, "epoch": 1729} {"train_loss": -39.7147331237793, "global_step": 209261, "epoch": 1729} {"train_loss": -41.584869384765625, "global_step": 209262, "epoch": 1729} {"train_loss": -39.473506927490234, "global_step": 209263, "epoch": 1729} {"train_loss": -41.61007308959961, "global_step": 209264, "epoch": 1729} {"train_loss": -40.3254280090332, "global_step": 209265, "epoch": 1729} {"train_loss": -41.76572799682617, "global_step": 209266, "epoch": 1729} {"train_loss": -41.2309684753418, "global_step": 209267, "epoch": 1729} {"train_loss": -41.72419357299805, "global_step": 209268, "epoch": 1729} {"train_loss": -40.77983093261719, "global_step": 209269, "epoch": 1729} {"train_loss": -41.5635986328125, "global_step": 209270, "epoch": 1729} {"train_loss": -41.11408996582031, "global_step": 209271, "epoch": 1729} {"train_loss": -41.93034744262695, "global_step": 209272, "epoch": 1729} {"train_loss": -41.92947006225586, "global_step": 209273, "epoch": 1729} {"train_loss": -41.59935760498047, "global_step": 209274, "epoch": 1729} {"train_loss": -41.914241790771484, "global_step": 209275, "epoch": 1729} {"train_loss": -41.84778594970703, "global_step": 209276, "epoch": 1729} {"train_loss": -40.31488800048828, "global_step": 209277, "epoch": 1729} {"train_loss": -42.26887512207031, "global_step": 209278, "epoch": 1729} {"train_loss": -40.69991683959961, "global_step": 209279, "epoch": 1729} {"train_loss": -41.96297836303711, "global_step": 209280, "epoch": 1729} {"train_loss": -41.748023986816406, "global_step": 209281, "epoch": 1729} {"train_loss": -41.93526840209961, "global_step": 209282, "epoch": 1729} {"train_loss": -40.686767578125, "global_step": 209283, "epoch": 1729} {"train_loss": -41.64659881591797, "global_step": 209284, "epoch": 1729} {"train_loss": -39.51102828979492, "global_step": 209285, "epoch": 1729} {"train_loss": -40.94367218017578, "global_step": 209286, "epoch": 1729} {"train_loss": -38.506038665771484, "global_step": 209287, "epoch": 1729} {"train_loss": -40.37518310546875, "global_step": 209288, "epoch": 1729} {"train_loss": -41.03996276855469, "global_step": 209289, "epoch": 1729} {"train_loss": -40.09281921386719, "global_step": 209290, "epoch": 1729} {"train_loss": -36.980464935302734, "global_step": 209291, "epoch": 1729} {"train_loss": -40.552589416503906, "global_step": 209292, "epoch": 1729} {"train_loss": -39.73884201049805, "global_step": 209293, "epoch": 1729} {"train_loss": -39.88600158691406, "global_step": 209294, "epoch": 1729} {"train_loss": -39.425315856933594, "global_step": 209295, "epoch": 1729} {"train_loss": -40.08063888549805, "global_step": 209296, "epoch": 1729} {"train_loss": -37.66704177856445, "global_step": 209297, "epoch": 1729} {"train_loss": -39.13899612426758, "global_step": 209298, "epoch": 1729} {"train_loss": -38.497249603271484, "global_step": 209299, "epoch": 1729} {"train_loss": -36.21934127807617, "global_step": 209300, "epoch": 1729} {"train_loss": -41.424407958984375, "global_step": 209301, "epoch": 1729} {"train_loss": -41.143978118896484, "global_step": 209302, "epoch": 1729} {"train_loss": -41.2782096862793, "global_step": 209303, "epoch": 1729} {"train_loss": -40.56669235229492, "global_step": 209304, "epoch": 1729} {"train_loss": -39.0529670715332, "global_step": 209305, "epoch": 1729} {"train_loss": -40.58607864379883, "global_step": 209306, "epoch": 1729} {"train_loss": -40.24668502807617, "global_step": 209307, "epoch": 1729} {"train_loss": -41.23090744018555, "global_step": 209308, "epoch": 1729} {"train_loss": -38.43702697753906, "global_step": 209309, "epoch": 1729} {"train_loss": -41.153221130371094, "global_step": 209310, "epoch": 1729} {"train_loss": -40.96408462524414, "global_step": 209311, "epoch": 1729} {"train_loss": -39.4459114074707, "global_step": 209312, "epoch": 1729} {"train_loss": -40.73396682739258, "global_step": 209313, "epoch": 1729} {"train_loss": -39.859310150146484, "global_step": 209314, "epoch": 1729} {"train_loss": -39.668453216552734, "global_step": 209315, "epoch": 1729} {"train_loss": -40.5160026550293, "global_step": 209316, "epoch": 1729} {"train_loss": -39.877586364746094, "global_step": 209317, "epoch": 1729} {"train_loss": -39.08942413330078, "global_step": 209318, "epoch": 1729} {"train_loss": -40.32951736450195, "global_step": 209319, "epoch": 1729} {"train_loss": -38.56608200073242, "global_step": 209320, "epoch": 1729} {"train_loss": -38.131431579589844, "global_step": 209321, "epoch": 1729} {"train_loss": -41.15163040161133, "global_step": 209322, "epoch": 1729} {"train_loss": -40.340065002441406, "global_step": 209323, "epoch": 1729} {"train_loss": -38.47449493408203, "global_step": 209324, "epoch": 1729} {"train_loss": -39.41284942626953, "global_step": 209325, "epoch": 1729} {"train_loss": -40.59738540649414, "global_step": 209326, "epoch": 1729} {"train_loss": -39.89846420288086, "global_step": 209327, "epoch": 1729} {"train_loss": -39.96406936645508, "global_step": 209328, "epoch": 1729} {"train_loss": -40.04264171064393, "global_step": 209329, "epoch": 1729, "val_loss": 2585133.25} {"train_loss": -40.07870101928711, "global_step": 209330, "epoch": 1730} {"train_loss": -35.29251480102539, "global_step": 209331, "epoch": 1730} {"train_loss": -40.44263458251953, "global_step": 209332, "epoch": 1730} {"train_loss": -38.826229095458984, "global_step": 209333, "epoch": 1730} {"train_loss": -38.08945846557617, "global_step": 209334, "epoch": 1730} {"train_loss": -38.28652572631836, "global_step": 209335, "epoch": 1730} {"train_loss": -35.37812423706055, "global_step": 209336, "epoch": 1730} {"train_loss": -37.86764144897461, "global_step": 209337, "epoch": 1730} {"train_loss": -37.86540222167969, "global_step": 209338, "epoch": 1730} {"train_loss": -38.93234634399414, "global_step": 209339, "epoch": 1730} {"train_loss": -37.99138259887695, "global_step": 209340, "epoch": 1730} {"train_loss": -38.834835052490234, "global_step": 209341, "epoch": 1730} {"train_loss": -37.68156051635742, "global_step": 209342, "epoch": 1730} {"train_loss": -40.39996337890625, "global_step": 209343, "epoch": 1730} {"train_loss": -30.599933624267578, "global_step": 209344, "epoch": 1730} {"train_loss": -37.6268196105957, "global_step": 209345, "epoch": 1730} {"train_loss": -37.41423416137695, "global_step": 209346, "epoch": 1730} {"train_loss": -38.92772674560547, "global_step": 209347, "epoch": 1730} {"train_loss": -37.326934814453125, "global_step": 209348, "epoch": 1730} {"train_loss": -40.020790100097656, "global_step": 209349, "epoch": 1730} {"train_loss": -38.26225662231445, "global_step": 209350, "epoch": 1730} {"train_loss": -39.01093673706055, "global_step": 209351, "epoch": 1730} {"train_loss": -36.9555549621582, "global_step": 209352, "epoch": 1730} {"train_loss": -39.28211212158203, "global_step": 209353, "epoch": 1730} {"train_loss": -37.13888168334961, "global_step": 209354, "epoch": 1730} {"train_loss": -39.28407669067383, "global_step": 209355, "epoch": 1730} {"train_loss": -38.42315673828125, "global_step": 209356, "epoch": 1730} {"train_loss": -39.29643249511719, "global_step": 209357, "epoch": 1730} {"train_loss": -38.94540786743164, "global_step": 209358, "epoch": 1730} {"train_loss": -40.81168746948242, "global_step": 209359, "epoch": 1730} {"train_loss": -38.79927444458008, "global_step": 209360, "epoch": 1730} {"train_loss": -39.00297164916992, "global_step": 209361, "epoch": 1730} {"train_loss": -37.90060806274414, "global_step": 209362, "epoch": 1730} {"train_loss": -38.529476165771484, "global_step": 209363, "epoch": 1730} {"train_loss": -39.1307373046875, "global_step": 209364, "epoch": 1730} {"train_loss": -40.27431869506836, "global_step": 209365, "epoch": 1730} {"train_loss": -39.400203704833984, "global_step": 209366, "epoch": 1730} {"train_loss": -40.474483489990234, "global_step": 209367, "epoch": 1730} {"train_loss": -40.578102111816406, "global_step": 209368, "epoch": 1730} {"train_loss": -39.69044494628906, "global_step": 209369, "epoch": 1730} {"train_loss": -39.128395080566406, "global_step": 209370, "epoch": 1730} {"train_loss": -40.14179611206055, "global_step": 209371, "epoch": 1730} {"train_loss": -40.23894119262695, "global_step": 209372, "epoch": 1730} {"train_loss": -40.485774993896484, "global_step": 209373, "epoch": 1730} {"train_loss": -41.03975296020508, "global_step": 209374, "epoch": 1730} {"train_loss": -40.22124099731445, "global_step": 209375, "epoch": 1730} {"train_loss": -39.749935150146484, "global_step": 209376, "epoch": 1730} {"train_loss": -40.89272689819336, "global_step": 209377, "epoch": 1730} {"train_loss": -39.71186065673828, "global_step": 209378, "epoch": 1730} {"train_loss": -40.13888168334961, "global_step": 209379, "epoch": 1730} {"train_loss": -40.94969940185547, "global_step": 209380, "epoch": 1730} {"train_loss": -39.561798095703125, "global_step": 209381, "epoch": 1730} {"train_loss": -40.710540771484375, "global_step": 209382, "epoch": 1730} {"train_loss": -40.893680572509766, "global_step": 209383, "epoch": 1730} {"train_loss": -40.28403854370117, "global_step": 209384, "epoch": 1730} {"train_loss": -40.0750846862793, "global_step": 209385, "epoch": 1730} {"train_loss": -40.455535888671875, "global_step": 209386, "epoch": 1730} {"train_loss": -40.9921989440918, "global_step": 209387, "epoch": 1730} {"train_loss": -40.327293395996094, "global_step": 209388, "epoch": 1730} {"train_loss": -40.61970138549805, "global_step": 209389, "epoch": 1730} {"train_loss": -40.595947265625, "global_step": 209390, "epoch": 1730} {"train_loss": -40.94320297241211, "global_step": 209391, "epoch": 1730} {"train_loss": -41.00436019897461, "global_step": 209392, "epoch": 1730} {"train_loss": -41.28327178955078, "global_step": 209393, "epoch": 1730} {"train_loss": -41.019325256347656, "global_step": 209394, "epoch": 1730} {"train_loss": -41.00635528564453, "global_step": 209395, "epoch": 1730} {"train_loss": -41.609493255615234, "global_step": 209396, "epoch": 1730} {"train_loss": -40.928836822509766, "global_step": 209397, "epoch": 1730} {"train_loss": -41.757080078125, "global_step": 209398, "epoch": 1730} {"train_loss": -41.313133239746094, "global_step": 209399, "epoch": 1730} {"train_loss": -41.52531051635742, "global_step": 209400, "epoch": 1730} {"train_loss": -41.469947814941406, "global_step": 209401, "epoch": 1730} {"train_loss": -41.422359466552734, "global_step": 209402, "epoch": 1730} {"train_loss": -40.83393478393555, "global_step": 209403, "epoch": 1730} {"train_loss": -41.03923416137695, "global_step": 209404, "epoch": 1730} {"train_loss": -41.30542755126953, "global_step": 209405, "epoch": 1730} {"train_loss": -41.002838134765625, "global_step": 209406, "epoch": 1730} {"train_loss": -41.549957275390625, "global_step": 209407, "epoch": 1730} {"train_loss": -40.69265365600586, "global_step": 209408, "epoch": 1730} {"train_loss": -41.35099411010742, "global_step": 209409, "epoch": 1730} {"train_loss": -41.675209045410156, "global_step": 209410, "epoch": 1730} {"train_loss": -40.726436614990234, "global_step": 209411, "epoch": 1730} {"train_loss": -41.4085807800293, "global_step": 209412, "epoch": 1730} {"train_loss": -41.9696044921875, "global_step": 209413, "epoch": 1730} {"train_loss": -42.04047393798828, "global_step": 209414, "epoch": 1730} {"train_loss": -40.85064697265625, "global_step": 209415, "epoch": 1730} {"train_loss": -41.75562286376953, "global_step": 209416, "epoch": 1730} {"train_loss": -41.547245025634766, "global_step": 209417, "epoch": 1730} {"train_loss": -41.50962829589844, "global_step": 209418, "epoch": 1730} {"train_loss": -41.613094329833984, "global_step": 209419, "epoch": 1730} {"train_loss": -42.31923294067383, "global_step": 209420, "epoch": 1730} {"train_loss": -41.58967208862305, "global_step": 209421, "epoch": 1730} {"train_loss": -41.580909729003906, "global_step": 209422, "epoch": 1730} {"train_loss": -41.686668395996094, "global_step": 209423, "epoch": 1730} {"train_loss": -41.85715866088867, "global_step": 209424, "epoch": 1730} {"train_loss": -41.400115966796875, "global_step": 209425, "epoch": 1730} {"train_loss": -40.97991943359375, "global_step": 209426, "epoch": 1730} {"train_loss": -41.671974182128906, "global_step": 209427, "epoch": 1730} {"train_loss": -41.973731994628906, "global_step": 209428, "epoch": 1730} {"train_loss": -41.861080169677734, "global_step": 209429, "epoch": 1730} {"train_loss": -41.90336990356445, "global_step": 209430, "epoch": 1730} {"train_loss": -42.22161865234375, "global_step": 209431, "epoch": 1730} {"train_loss": -41.6925163269043, "global_step": 209432, "epoch": 1730} {"train_loss": -42.230743408203125, "global_step": 209433, "epoch": 1730} {"train_loss": -42.615047454833984, "global_step": 209434, "epoch": 1730} {"train_loss": -41.957969665527344, "global_step": 209435, "epoch": 1730} {"train_loss": -41.99626541137695, "global_step": 209436, "epoch": 1730} {"train_loss": -42.22077560424805, "global_step": 209437, "epoch": 1730} {"train_loss": -42.39199447631836, "global_step": 209438, "epoch": 1730} {"train_loss": -41.935977935791016, "global_step": 209439, "epoch": 1730} {"train_loss": -41.51850891113281, "global_step": 209440, "epoch": 1730} {"train_loss": -41.48310089111328, "global_step": 209441, "epoch": 1730} {"train_loss": -39.9326057434082, "global_step": 209442, "epoch": 1730} {"train_loss": -33.484718322753906, "global_step": 209443, "epoch": 1730} {"train_loss": -7.345901012420654, "global_step": 209444, "epoch": 1730} {"train_loss": 25.640506744384766, "global_step": 209445, "epoch": 1730} {"train_loss": -1.984742522239685, "global_step": 209446, "epoch": 1730} {"train_loss": -36.69736862182617, "global_step": 209447, "epoch": 1730} {"train_loss": -2.1158440113067627, "global_step": 209448, "epoch": 1730} {"train_loss": -36.24836349487305, "global_step": 209449, "epoch": 1730} {"train_loss": -38.42660245126929, "global_step": 209450, "epoch": 1730, "val_loss": 2602668.25} {"train_loss": -37.01688766479492, "global_step": 209451, "epoch": 1731} {"train_loss": -16.57293128967285, "global_step": 209452, "epoch": 1731} {"train_loss": -37.33243942260742, "global_step": 209453, "epoch": 1731} {"train_loss": -28.374372482299805, "global_step": 209454, "epoch": 1731} {"train_loss": -30.51673698425293, "global_step": 209455, "epoch": 1731} {"train_loss": -35.50046920776367, "global_step": 209456, "epoch": 1731} {"train_loss": -32.3502311706543, "global_step": 209457, "epoch": 1731} {"train_loss": -32.11780548095703, "global_step": 209458, "epoch": 1731} {"train_loss": -37.22188186645508, "global_step": 209459, "epoch": 1731} {"train_loss": -33.44943618774414, "global_step": 209460, "epoch": 1731} {"train_loss": -35.03505325317383, "global_step": 209461, "epoch": 1731} {"train_loss": -37.45417022705078, "global_step": 209462, "epoch": 1731} {"train_loss": -37.10676193237305, "global_step": 209463, "epoch": 1731} {"train_loss": -34.91089630126953, "global_step": 209464, "epoch": 1731} {"train_loss": -37.32075119018555, "global_step": 209465, "epoch": 1731} {"train_loss": -38.873985290527344, "global_step": 209466, "epoch": 1731} {"train_loss": -36.86186218261719, "global_step": 209467, "epoch": 1731} {"train_loss": -37.24738693237305, "global_step": 209468, "epoch": 1731} {"train_loss": -38.61237335205078, "global_step": 209469, "epoch": 1731} {"train_loss": -39.1864128112793, "global_step": 209470, "epoch": 1731} {"train_loss": -38.54642105102539, "global_step": 209471, "epoch": 1731} {"train_loss": -38.347164154052734, "global_step": 209472, "epoch": 1731} {"train_loss": -38.53505325317383, "global_step": 209473, "epoch": 1731} {"train_loss": -39.10935592651367, "global_step": 209474, "epoch": 1731} {"train_loss": -38.69240951538086, "global_step": 209475, "epoch": 1731} {"train_loss": -39.53689193725586, "global_step": 209476, "epoch": 1731} {"train_loss": -39.52163314819336, "global_step": 209477, "epoch": 1731} {"train_loss": -39.597782135009766, "global_step": 209478, "epoch": 1731} {"train_loss": -38.848934173583984, "global_step": 209479, "epoch": 1731} {"train_loss": -39.43695831298828, "global_step": 209480, "epoch": 1731} {"train_loss": -39.521663665771484, "global_step": 209481, "epoch": 1731} {"train_loss": -39.836509704589844, "global_step": 209482, "epoch": 1731} {"train_loss": -39.64760208129883, "global_step": 209483, "epoch": 1731} {"train_loss": -39.82159423828125, "global_step": 209484, "epoch": 1731} {"train_loss": -39.66650390625, "global_step": 209485, "epoch": 1731} {"train_loss": -39.816261291503906, "global_step": 209486, "epoch": 1731} {"train_loss": -39.810546875, "global_step": 209487, "epoch": 1731} {"train_loss": -39.631988525390625, "global_step": 209488, "epoch": 1731} {"train_loss": -39.66752243041992, "global_step": 209489, "epoch": 1731} {"train_loss": -39.96627426147461, "global_step": 209490, "epoch": 1731} {"train_loss": -40.106502532958984, "global_step": 209491, "epoch": 1731} {"train_loss": -39.57281494140625, "global_step": 209492, "epoch": 1731} {"train_loss": -40.09696578979492, "global_step": 209493, "epoch": 1731} {"train_loss": -40.435157775878906, "global_step": 209494, "epoch": 1731} {"train_loss": -40.162689208984375, "global_step": 209495, "epoch": 1731} {"train_loss": -40.076812744140625, "global_step": 209496, "epoch": 1731} {"train_loss": -40.346920013427734, "global_step": 209497, "epoch": 1731} {"train_loss": -40.0837516784668, "global_step": 209498, "epoch": 1731} {"train_loss": -40.20857620239258, "global_step": 209499, "epoch": 1731} {"train_loss": -40.36693572998047, "global_step": 209500, "epoch": 1731} {"train_loss": -40.454078674316406, "global_step": 209501, "epoch": 1731} {"train_loss": -40.62569808959961, "global_step": 209502, "epoch": 1731} {"train_loss": -40.25747299194336, "global_step": 209503, "epoch": 1731} {"train_loss": -40.59796905517578, "global_step": 209504, "epoch": 1731} {"train_loss": -40.73181915283203, "global_step": 209505, "epoch": 1731} {"train_loss": -40.58938217163086, "global_step": 209506, "epoch": 1731} {"train_loss": -40.68746566772461, "global_step": 209507, "epoch": 1731} {"train_loss": -40.86664581298828, "global_step": 209508, "epoch": 1731} {"train_loss": -40.94965744018555, "global_step": 209509, "epoch": 1731} {"train_loss": -40.97314453125, "global_step": 209510, "epoch": 1731} {"train_loss": -41.04850387573242, "global_step": 209511, "epoch": 1731} {"train_loss": -41.19514846801758, "global_step": 209512, "epoch": 1731} {"train_loss": -40.62346267700195, "global_step": 209513, "epoch": 1731} {"train_loss": -40.87958908081055, "global_step": 209514, "epoch": 1731} {"train_loss": -40.93064880371094, "global_step": 209515, "epoch": 1731} {"train_loss": -41.121192932128906, "global_step": 209516, "epoch": 1731} {"train_loss": -41.00421905517578, "global_step": 209517, "epoch": 1731} {"train_loss": -41.245361328125, "global_step": 209518, "epoch": 1731} {"train_loss": -41.22983932495117, "global_step": 209519, "epoch": 1731} {"train_loss": -40.952125549316406, "global_step": 209520, "epoch": 1731} {"train_loss": -41.19990921020508, "global_step": 209521, "epoch": 1731} {"train_loss": -41.38117599487305, "global_step": 209522, "epoch": 1731} {"train_loss": -41.6339111328125, "global_step": 209523, "epoch": 1731} {"train_loss": -41.45730209350586, "global_step": 209524, "epoch": 1731} {"train_loss": -41.63133239746094, "global_step": 209525, "epoch": 1731} {"train_loss": -41.6585693359375, "global_step": 209526, "epoch": 1731} {"train_loss": -41.3385124206543, "global_step": 209527, "epoch": 1731} {"train_loss": -41.93059158325195, "global_step": 209528, "epoch": 1731} {"train_loss": -41.40104293823242, "global_step": 209529, "epoch": 1731} {"train_loss": -41.23688888549805, "global_step": 209530, "epoch": 1731} {"train_loss": -41.677093505859375, "global_step": 209531, "epoch": 1731} {"train_loss": -41.572689056396484, "global_step": 209532, "epoch": 1731} {"train_loss": -41.453636169433594, "global_step": 209533, "epoch": 1731} {"train_loss": -41.13408279418945, "global_step": 209534, "epoch": 1731} {"train_loss": -41.69662857055664, "global_step": 209535, "epoch": 1731} {"train_loss": -41.70194625854492, "global_step": 209536, "epoch": 1731} {"train_loss": -41.81083679199219, "global_step": 209537, "epoch": 1731} {"train_loss": -41.4759407043457, "global_step": 209538, "epoch": 1731} {"train_loss": -41.676788330078125, "global_step": 209539, "epoch": 1731} {"train_loss": -41.65903854370117, "global_step": 209540, "epoch": 1731} {"train_loss": -41.79939270019531, "global_step": 209541, "epoch": 1731} {"train_loss": -41.70132064819336, "global_step": 209542, "epoch": 1731} {"train_loss": -42.03080368041992, "global_step": 209543, "epoch": 1731} {"train_loss": -42.0389518737793, "global_step": 209544, "epoch": 1731} {"train_loss": -42.10434341430664, "global_step": 209545, "epoch": 1731} {"train_loss": -41.840240478515625, "global_step": 209546, "epoch": 1731} {"train_loss": -42.10720443725586, "global_step": 209547, "epoch": 1731} {"train_loss": -41.6275634765625, "global_step": 209548, "epoch": 1731} {"train_loss": -41.58498764038086, "global_step": 209549, "epoch": 1731} {"train_loss": -41.78972244262695, "global_step": 209550, "epoch": 1731} {"train_loss": -42.06686019897461, "global_step": 209551, "epoch": 1731} {"train_loss": -42.331119537353516, "global_step": 209552, "epoch": 1731} {"train_loss": -42.032833099365234, "global_step": 209553, "epoch": 1731} {"train_loss": -42.263999938964844, "global_step": 209554, "epoch": 1731} {"train_loss": -42.07268142700195, "global_step": 209555, "epoch": 1731} {"train_loss": -41.57178497314453, "global_step": 209556, "epoch": 1731} {"train_loss": -42.3155403137207, "global_step": 209557, "epoch": 1731} {"train_loss": -42.124000549316406, "global_step": 209558, "epoch": 1731} {"train_loss": -42.46481704711914, "global_step": 209559, "epoch": 1731} {"train_loss": -42.41078186035156, "global_step": 209560, "epoch": 1731} {"train_loss": -42.487525939941406, "global_step": 209561, "epoch": 1731} {"train_loss": -42.29861068725586, "global_step": 209562, "epoch": 1731} {"train_loss": -41.62255096435547, "global_step": 209563, "epoch": 1731} {"train_loss": -42.449100494384766, "global_step": 209564, "epoch": 1731} {"train_loss": -42.149314880371094, "global_step": 209565, "epoch": 1731} {"train_loss": -42.73673629760742, "global_step": 209566, "epoch": 1731} {"train_loss": -42.124141693115234, "global_step": 209567, "epoch": 1731} {"train_loss": -42.080963134765625, "global_step": 209568, "epoch": 1731} {"train_loss": -42.64851379394531, "global_step": 209569, "epoch": 1731} {"train_loss": -42.342529296875, "global_step": 209570, "epoch": 1731} {"train_loss": -39.95956302674349, "global_step": 209571, "epoch": 1731, "val_loss": 2628195.0} {"train_loss": -42.68931198120117, "global_step": 209572, "epoch": 1732} {"train_loss": -42.11356735229492, "global_step": 209573, "epoch": 1732} {"train_loss": -42.003719329833984, "global_step": 209574, "epoch": 1732} {"train_loss": -42.624176025390625, "global_step": 209575, "epoch": 1732} {"train_loss": -42.79867172241211, "global_step": 209576, "epoch": 1732} {"train_loss": -42.62482452392578, "global_step": 209577, "epoch": 1732} {"train_loss": -42.456417083740234, "global_step": 209578, "epoch": 1732} {"train_loss": -42.16585159301758, "global_step": 209579, "epoch": 1732} {"train_loss": -42.21834182739258, "global_step": 209580, "epoch": 1732} {"train_loss": -42.0385856628418, "global_step": 209581, "epoch": 1732} {"train_loss": -41.76123046875, "global_step": 209582, "epoch": 1732} {"train_loss": -42.5921630859375, "global_step": 209583, "epoch": 1732} {"train_loss": -42.305294036865234, "global_step": 209584, "epoch": 1732} {"train_loss": -42.01424026489258, "global_step": 209585, "epoch": 1732} {"train_loss": -40.534420013427734, "global_step": 209586, "epoch": 1732} {"train_loss": -39.017303466796875, "global_step": 209587, "epoch": 1732} {"train_loss": -37.579322814941406, "global_step": 209588, "epoch": 1732} {"train_loss": -40.8897590637207, "global_step": 209589, "epoch": 1732} {"train_loss": -42.113922119140625, "global_step": 209590, "epoch": 1732} {"train_loss": -41.796775817871094, "global_step": 209591, "epoch": 1732} {"train_loss": -41.26533126831055, "global_step": 209592, "epoch": 1732} {"train_loss": -41.747615814208984, "global_step": 209593, "epoch": 1732} {"train_loss": -42.445556640625, "global_step": 209594, "epoch": 1732} {"train_loss": -41.22640609741211, "global_step": 209595, "epoch": 1732} {"train_loss": -41.01716995239258, "global_step": 209596, "epoch": 1732} {"train_loss": -41.710140228271484, "global_step": 209597, "epoch": 1732} {"train_loss": -41.8739013671875, "global_step": 209598, "epoch": 1732} {"train_loss": -41.85780334472656, "global_step": 209599, "epoch": 1732} {"train_loss": -42.47626876831055, "global_step": 209600, "epoch": 1732} {"train_loss": -42.79270553588867, "global_step": 209601, "epoch": 1732} {"train_loss": -42.41909408569336, "global_step": 209602, "epoch": 1732} {"train_loss": -42.32169723510742, "global_step": 209603, "epoch": 1732} {"train_loss": -41.665069580078125, "global_step": 209604, "epoch": 1732} {"train_loss": -42.2653923034668, "global_step": 209605, "epoch": 1732} {"train_loss": -41.89435577392578, "global_step": 209606, "epoch": 1732} {"train_loss": -42.45270919799805, "global_step": 209607, "epoch": 1732} {"train_loss": -42.06692123413086, "global_step": 209608, "epoch": 1732} {"train_loss": -42.65930938720703, "global_step": 209609, "epoch": 1732} {"train_loss": -41.66938400268555, "global_step": 209610, "epoch": 1732} {"train_loss": -41.74811553955078, "global_step": 209611, "epoch": 1732} {"train_loss": -42.04429626464844, "global_step": 209612, "epoch": 1732} {"train_loss": -42.02958297729492, "global_step": 209613, "epoch": 1732} {"train_loss": -42.04973220825195, "global_step": 209614, "epoch": 1732} {"train_loss": -42.13126754760742, "global_step": 209615, "epoch": 1732} {"train_loss": -41.955787658691406, "global_step": 209616, "epoch": 1732} {"train_loss": -41.384674072265625, "global_step": 209617, "epoch": 1732} {"train_loss": -41.69184112548828, "global_step": 209618, "epoch": 1732} {"train_loss": -42.243350982666016, "global_step": 209619, "epoch": 1732} {"train_loss": -41.36542892456055, "global_step": 209620, "epoch": 1732} {"train_loss": -40.888954162597656, "global_step": 209621, "epoch": 1732} {"train_loss": -41.80064010620117, "global_step": 209622, "epoch": 1732} {"train_loss": -42.02810287475586, "global_step": 209623, "epoch": 1732} {"train_loss": -40.50890350341797, "global_step": 209624, "epoch": 1732} {"train_loss": -41.93757247924805, "global_step": 209625, "epoch": 1732} {"train_loss": -40.56745147705078, "global_step": 209626, "epoch": 1732} {"train_loss": -39.89925765991211, "global_step": 209627, "epoch": 1732} {"train_loss": -40.874629974365234, "global_step": 209628, "epoch": 1732} {"train_loss": -41.540802001953125, "global_step": 209629, "epoch": 1732} {"train_loss": -39.49985122680664, "global_step": 209630, "epoch": 1732} {"train_loss": -38.96128463745117, "global_step": 209631, "epoch": 1732} {"train_loss": -39.81745529174805, "global_step": 209632, "epoch": 1732} {"train_loss": -41.23578643798828, "global_step": 209633, "epoch": 1732} {"train_loss": -41.7567024230957, "global_step": 209634, "epoch": 1732} {"train_loss": -40.62837219238281, "global_step": 209635, "epoch": 1732} {"train_loss": -40.337310791015625, "global_step": 209636, "epoch": 1732} {"train_loss": -40.73115921020508, "global_step": 209637, "epoch": 1732} {"train_loss": -38.19337844848633, "global_step": 209638, "epoch": 1732} {"train_loss": -36.652828216552734, "global_step": 209639, "epoch": 1732} {"train_loss": -38.80000305175781, "global_step": 209640, "epoch": 1732} {"train_loss": -39.2497673034668, "global_step": 209641, "epoch": 1732} {"train_loss": -40.43620681762695, "global_step": 209642, "epoch": 1732} {"train_loss": -40.742225646972656, "global_step": 209643, "epoch": 1732} {"train_loss": -40.98994827270508, "global_step": 209644, "epoch": 1732} {"train_loss": -40.671974182128906, "global_step": 209645, "epoch": 1732} {"train_loss": -39.47639083862305, "global_step": 209646, "epoch": 1732} {"train_loss": -40.58827590942383, "global_step": 209647, "epoch": 1732} {"train_loss": -41.0490837097168, "global_step": 209648, "epoch": 1732} {"train_loss": -40.21906280517578, "global_step": 209649, "epoch": 1732} {"train_loss": -41.262451171875, "global_step": 209650, "epoch": 1732} {"train_loss": -40.98427963256836, "global_step": 209651, "epoch": 1732} {"train_loss": -41.28204345703125, "global_step": 209652, "epoch": 1732} {"train_loss": -41.04750442504883, "global_step": 209653, "epoch": 1732} {"train_loss": -41.03986740112305, "global_step": 209654, "epoch": 1732} {"train_loss": -41.70728302001953, "global_step": 209655, "epoch": 1732} {"train_loss": -41.38996505737305, "global_step": 209656, "epoch": 1732} {"train_loss": -41.528133392333984, "global_step": 209657, "epoch": 1732} {"train_loss": -41.511165618896484, "global_step": 209658, "epoch": 1732} {"train_loss": -41.45089340209961, "global_step": 209659, "epoch": 1732} {"train_loss": -41.51806640625, "global_step": 209660, "epoch": 1732} {"train_loss": -41.565467834472656, "global_step": 209661, "epoch": 1732} {"train_loss": -41.79254913330078, "global_step": 209662, "epoch": 1732} {"train_loss": -41.93452072143555, "global_step": 209663, "epoch": 1732} {"train_loss": -42.208492279052734, "global_step": 209664, "epoch": 1732} {"train_loss": -41.7553596496582, "global_step": 209665, "epoch": 1732} {"train_loss": -41.73141098022461, "global_step": 209666, "epoch": 1732} {"train_loss": -42.010101318359375, "global_step": 209667, "epoch": 1732} {"train_loss": -41.86707305908203, "global_step": 209668, "epoch": 1732} {"train_loss": -41.58254623413086, "global_step": 209669, "epoch": 1732} {"train_loss": -41.52328109741211, "global_step": 209670, "epoch": 1732} {"train_loss": -41.81657791137695, "global_step": 209671, "epoch": 1732} {"train_loss": -41.49433135986328, "global_step": 209672, "epoch": 1732} {"train_loss": -41.29607391357422, "global_step": 209673, "epoch": 1732} {"train_loss": -42.08124923706055, "global_step": 209674, "epoch": 1732} {"train_loss": -41.673866271972656, "global_step": 209675, "epoch": 1732} {"train_loss": -41.63788604736328, "global_step": 209676, "epoch": 1732} {"train_loss": -41.654396057128906, "global_step": 209677, "epoch": 1732} {"train_loss": -42.09435272216797, "global_step": 209678, "epoch": 1732} {"train_loss": -41.75677490234375, "global_step": 209679, "epoch": 1732} {"train_loss": -41.98591232299805, "global_step": 209680, "epoch": 1732} {"train_loss": -41.92892837524414, "global_step": 209681, "epoch": 1732} {"train_loss": -41.53944396972656, "global_step": 209682, "epoch": 1732} {"train_loss": -42.272335052490234, "global_step": 209683, "epoch": 1732} {"train_loss": -42.31907272338867, "global_step": 209684, "epoch": 1732} {"train_loss": -41.77848815917969, "global_step": 209685, "epoch": 1732} {"train_loss": -41.86806106567383, "global_step": 209686, "epoch": 1732} {"train_loss": -42.710693359375, "global_step": 209687, "epoch": 1732} {"train_loss": -42.16147994995117, "global_step": 209688, "epoch": 1732} {"train_loss": -42.13792037963867, "global_step": 209689, "epoch": 1732} {"train_loss": -42.18678665161133, "global_step": 209690, "epoch": 1732} {"train_loss": -42.10752487182617, "global_step": 209691, "epoch": 1732} {"train_loss": -41.4571043282501, "global_step": 209692, "epoch": 1732, "val_loss": 2543106.75} {"train_loss": -42.6890754699707, "global_step": 209693, "epoch": 1733} {"train_loss": -41.38999938964844, "global_step": 209694, "epoch": 1733} {"train_loss": -41.535335540771484, "global_step": 209695, "epoch": 1733} {"train_loss": -42.561424255371094, "global_step": 209696, "epoch": 1733} {"train_loss": -41.00321960449219, "global_step": 209697, "epoch": 1733} {"train_loss": -40.358543395996094, "global_step": 209698, "epoch": 1733} {"train_loss": -40.3948860168457, "global_step": 209699, "epoch": 1733} {"train_loss": -41.64358139038086, "global_step": 209700, "epoch": 1733} {"train_loss": -40.28589630126953, "global_step": 209701, "epoch": 1733} {"train_loss": -39.878047943115234, "global_step": 209702, "epoch": 1733} {"train_loss": -41.84737014770508, "global_step": 209703, "epoch": 1733} {"train_loss": -41.209877014160156, "global_step": 209704, "epoch": 1733} {"train_loss": -41.54856491088867, "global_step": 209705, "epoch": 1733} {"train_loss": -41.931488037109375, "global_step": 209706, "epoch": 1733} {"train_loss": -42.157955169677734, "global_step": 209707, "epoch": 1733} {"train_loss": -41.953590393066406, "global_step": 209708, "epoch": 1733} {"train_loss": -42.23066329956055, "global_step": 209709, "epoch": 1733} {"train_loss": -42.09352493286133, "global_step": 209710, "epoch": 1733} {"train_loss": -42.06269073486328, "global_step": 209711, "epoch": 1733} {"train_loss": -41.85494613647461, "global_step": 209712, "epoch": 1733} {"train_loss": -42.06277084350586, "global_step": 209713, "epoch": 1733} {"train_loss": -41.95893478393555, "global_step": 209714, "epoch": 1733} {"train_loss": -42.337852478027344, "global_step": 209715, "epoch": 1733} {"train_loss": -41.77189254760742, "global_step": 209716, "epoch": 1733} {"train_loss": -39.880653381347656, "global_step": 209717, "epoch": 1733} {"train_loss": -41.237213134765625, "global_step": 209718, "epoch": 1733} {"train_loss": -42.232269287109375, "global_step": 209719, "epoch": 1733} {"train_loss": -41.06403732299805, "global_step": 209720, "epoch": 1733} {"train_loss": -40.55162811279297, "global_step": 209721, "epoch": 1733} {"train_loss": -41.60575485229492, "global_step": 209722, "epoch": 1733} {"train_loss": -40.926490783691406, "global_step": 209723, "epoch": 1733} {"train_loss": -37.467403411865234, "global_step": 209724, "epoch": 1733} {"train_loss": -38.7136116027832, "global_step": 209725, "epoch": 1733} {"train_loss": -40.939666748046875, "global_step": 209726, "epoch": 1733} {"train_loss": -38.84440994262695, "global_step": 209727, "epoch": 1733} {"train_loss": -38.168006896972656, "global_step": 209728, "epoch": 1733} {"train_loss": -41.185359954833984, "global_step": 209729, "epoch": 1733} {"train_loss": -41.02579879760742, "global_step": 209730, "epoch": 1733} {"train_loss": -39.152217864990234, "global_step": 209731, "epoch": 1733} {"train_loss": -40.35429763793945, "global_step": 209732, "epoch": 1733} {"train_loss": -40.324981689453125, "global_step": 209733, "epoch": 1733} {"train_loss": -39.61737060546875, "global_step": 209734, "epoch": 1733} {"train_loss": -41.72017288208008, "global_step": 209735, "epoch": 1733} {"train_loss": -39.53715133666992, "global_step": 209736, "epoch": 1733} {"train_loss": -41.46135330200195, "global_step": 209737, "epoch": 1733} {"train_loss": -40.10552978515625, "global_step": 209738, "epoch": 1733} {"train_loss": -40.0909309387207, "global_step": 209739, "epoch": 1733} {"train_loss": -41.32969284057617, "global_step": 209740, "epoch": 1733} {"train_loss": -40.53815841674805, "global_step": 209741, "epoch": 1733} {"train_loss": -40.65555191040039, "global_step": 209742, "epoch": 1733} {"train_loss": -38.88941955566406, "global_step": 209743, "epoch": 1733} {"train_loss": -40.29896926879883, "global_step": 209744, "epoch": 1733} {"train_loss": -41.81501007080078, "global_step": 209745, "epoch": 1733} {"train_loss": -39.90387725830078, "global_step": 209746, "epoch": 1733} {"train_loss": -41.21798324584961, "global_step": 209747, "epoch": 1733} {"train_loss": -41.11174392700195, "global_step": 209748, "epoch": 1733} {"train_loss": -41.52751159667969, "global_step": 209749, "epoch": 1733} {"train_loss": -41.126033782958984, "global_step": 209750, "epoch": 1733} {"train_loss": -41.593013763427734, "global_step": 209751, "epoch": 1733} {"train_loss": -38.96572494506836, "global_step": 209752, "epoch": 1733} {"train_loss": -41.96449279785156, "global_step": 209753, "epoch": 1733} {"train_loss": -40.49639892578125, "global_step": 209754, "epoch": 1733} {"train_loss": -40.44376754760742, "global_step": 209755, "epoch": 1733} {"train_loss": -41.68526840209961, "global_step": 209756, "epoch": 1733} {"train_loss": -40.093746185302734, "global_step": 209757, "epoch": 1733} {"train_loss": -41.69263458251953, "global_step": 209758, "epoch": 1733} {"train_loss": -41.315467834472656, "global_step": 209759, "epoch": 1733} {"train_loss": -40.27079772949219, "global_step": 209760, "epoch": 1733} {"train_loss": -42.42865753173828, "global_step": 209761, "epoch": 1733} {"train_loss": -41.757328033447266, "global_step": 209762, "epoch": 1733} {"train_loss": -41.57770919799805, "global_step": 209763, "epoch": 1733} {"train_loss": -41.4105339050293, "global_step": 209764, "epoch": 1733} {"train_loss": -40.899288177490234, "global_step": 209765, "epoch": 1733} {"train_loss": -40.9339485168457, "global_step": 209766, "epoch": 1733} {"train_loss": -41.64789581298828, "global_step": 209767, "epoch": 1733} {"train_loss": -42.142757415771484, "global_step": 209768, "epoch": 1733} {"train_loss": -41.19557189941406, "global_step": 209769, "epoch": 1733} {"train_loss": -42.06541061401367, "global_step": 209770, "epoch": 1733} {"train_loss": -42.260536193847656, "global_step": 209771, "epoch": 1733} {"train_loss": -42.015541076660156, "global_step": 209772, "epoch": 1733} {"train_loss": -42.085426330566406, "global_step": 209773, "epoch": 1733} {"train_loss": -41.9012336730957, "global_step": 209774, "epoch": 1733} {"train_loss": -41.685302734375, "global_step": 209775, "epoch": 1733} {"train_loss": -42.56256866455078, "global_step": 209776, "epoch": 1733} {"train_loss": -42.66899871826172, "global_step": 209777, "epoch": 1733} {"train_loss": -42.53573226928711, "global_step": 209778, "epoch": 1733} {"train_loss": -42.34930419921875, "global_step": 209779, "epoch": 1733} {"train_loss": -42.44352340698242, "global_step": 209780, "epoch": 1733} {"train_loss": -42.5917854309082, "global_step": 209781, "epoch": 1733} {"train_loss": -42.42544174194336, "global_step": 209782, "epoch": 1733} {"train_loss": -41.688018798828125, "global_step": 209783, "epoch": 1733} {"train_loss": -42.850337982177734, "global_step": 209784, "epoch": 1733} {"train_loss": -42.407405853271484, "global_step": 209785, "epoch": 1733} {"train_loss": -43.25580596923828, "global_step": 209786, "epoch": 1733} {"train_loss": -42.38283920288086, "global_step": 209787, "epoch": 1733} {"train_loss": -42.73344039916992, "global_step": 209788, "epoch": 1733} {"train_loss": -41.78064727783203, "global_step": 209789, "epoch": 1733} {"train_loss": -42.629188537597656, "global_step": 209790, "epoch": 1733} {"train_loss": -42.57575607299805, "global_step": 209791, "epoch": 1733} {"train_loss": -41.785823822021484, "global_step": 209792, "epoch": 1733} {"train_loss": -42.58494186401367, "global_step": 209793, "epoch": 1733} {"train_loss": -42.888458251953125, "global_step": 209794, "epoch": 1733} {"train_loss": -43.20277786254883, "global_step": 209795, "epoch": 1733} {"train_loss": -42.410377502441406, "global_step": 209796, "epoch": 1733} {"train_loss": -42.674434661865234, "global_step": 209797, "epoch": 1733} {"train_loss": -42.7925910949707, "global_step": 209798, "epoch": 1733} {"train_loss": -43.00006866455078, "global_step": 209799, "epoch": 1733} {"train_loss": -43.02362823486328, "global_step": 209800, "epoch": 1733} {"train_loss": -42.398067474365234, "global_step": 209801, "epoch": 1733} {"train_loss": -42.33394241333008, "global_step": 209802, "epoch": 1733} {"train_loss": -42.21208953857422, "global_step": 209803, "epoch": 1733} {"train_loss": -41.40761184692383, "global_step": 209804, "epoch": 1733} {"train_loss": -41.94486999511719, "global_step": 209805, "epoch": 1733} {"train_loss": -41.871578216552734, "global_step": 209806, "epoch": 1733} {"train_loss": -42.3311653137207, "global_step": 209807, "epoch": 1733} {"train_loss": -42.43603515625, "global_step": 209808, "epoch": 1733} {"train_loss": -43.00651168823242, "global_step": 209809, "epoch": 1733} {"train_loss": -42.425777435302734, "global_step": 209810, "epoch": 1733} {"train_loss": -42.71182632446289, "global_step": 209811, "epoch": 1733} {"train_loss": -41.90175247192383, "global_step": 209812, "epoch": 1733} {"train_loss": -41.49696463592782, "global_step": 209813, "epoch": 1733, "val_loss": 2462433.75} {"train_loss": -42.215370178222656, "global_step": 209814, "epoch": 1734} {"train_loss": -41.94456481933594, "global_step": 209815, "epoch": 1734} {"train_loss": -42.8990478515625, "global_step": 209816, "epoch": 1734} {"train_loss": -40.701271057128906, "global_step": 209817, "epoch": 1734} {"train_loss": -39.942901611328125, "global_step": 209818, "epoch": 1734} {"train_loss": -38.766170501708984, "global_step": 209819, "epoch": 1734} {"train_loss": -40.32144546508789, "global_step": 209820, "epoch": 1734} {"train_loss": -41.441104888916016, "global_step": 209821, "epoch": 1734} {"train_loss": -40.851070404052734, "global_step": 209822, "epoch": 1734} {"train_loss": -40.72834396362305, "global_step": 209823, "epoch": 1734} {"train_loss": -42.357513427734375, "global_step": 209824, "epoch": 1734} {"train_loss": -41.9734001159668, "global_step": 209825, "epoch": 1734} {"train_loss": -40.65040588378906, "global_step": 209826, "epoch": 1734} {"train_loss": -41.527931213378906, "global_step": 209827, "epoch": 1734} {"train_loss": -41.6192741394043, "global_step": 209828, "epoch": 1734} {"train_loss": -40.892948150634766, "global_step": 209829, "epoch": 1734} {"train_loss": -42.19388961791992, "global_step": 209830, "epoch": 1734} {"train_loss": -40.650691986083984, "global_step": 209831, "epoch": 1734} {"train_loss": -41.41775131225586, "global_step": 209832, "epoch": 1734} {"train_loss": -42.3123893737793, "global_step": 209833, "epoch": 1734} {"train_loss": -41.39216232299805, "global_step": 209834, "epoch": 1734} {"train_loss": -41.8892936706543, "global_step": 209835, "epoch": 1734} {"train_loss": -41.33456039428711, "global_step": 209836, "epoch": 1734} {"train_loss": -41.672889709472656, "global_step": 209837, "epoch": 1734} {"train_loss": -41.47231674194336, "global_step": 209838, "epoch": 1734} {"train_loss": -42.32097625732422, "global_step": 209839, "epoch": 1734} {"train_loss": -39.79566192626953, "global_step": 209840, "epoch": 1734} {"train_loss": -41.512977600097656, "global_step": 209841, "epoch": 1734} {"train_loss": -41.85051345825195, "global_step": 209842, "epoch": 1734} {"train_loss": -41.64967727661133, "global_step": 209843, "epoch": 1734} {"train_loss": -41.2214241027832, "global_step": 209844, "epoch": 1734} {"train_loss": -41.505767822265625, "global_step": 209845, "epoch": 1734} {"train_loss": -41.16987991333008, "global_step": 209846, "epoch": 1734} {"train_loss": -40.787044525146484, "global_step": 209847, "epoch": 1734} {"train_loss": -41.57567596435547, "global_step": 209848, "epoch": 1734} {"train_loss": -39.884521484375, "global_step": 209849, "epoch": 1734} {"train_loss": -41.57607650756836, "global_step": 209850, "epoch": 1734} {"train_loss": -42.21695327758789, "global_step": 209851, "epoch": 1734} {"train_loss": -39.99045181274414, "global_step": 209852, "epoch": 1734} {"train_loss": -41.885841369628906, "global_step": 209853, "epoch": 1734} {"train_loss": -41.46728515625, "global_step": 209854, "epoch": 1734} {"train_loss": -42.0122184753418, "global_step": 209855, "epoch": 1734} {"train_loss": -41.59004592895508, "global_step": 209856, "epoch": 1734} {"train_loss": -40.74611282348633, "global_step": 209857, "epoch": 1734} {"train_loss": -41.4509391784668, "global_step": 209858, "epoch": 1734} {"train_loss": -39.94629669189453, "global_step": 209859, "epoch": 1734} {"train_loss": -41.118072509765625, "global_step": 209860, "epoch": 1734} {"train_loss": -42.098941802978516, "global_step": 209861, "epoch": 1734} {"train_loss": -41.7049446105957, "global_step": 209862, "epoch": 1734} {"train_loss": -41.896183013916016, "global_step": 209863, "epoch": 1734} {"train_loss": -41.58449172973633, "global_step": 209864, "epoch": 1734} {"train_loss": -42.23241424560547, "global_step": 209865, "epoch": 1734} {"train_loss": -42.089839935302734, "global_step": 209866, "epoch": 1734} {"train_loss": -42.13605880737305, "global_step": 209867, "epoch": 1734} {"train_loss": -41.966617584228516, "global_step": 209868, "epoch": 1734} {"train_loss": -41.74787521362305, "global_step": 209869, "epoch": 1734} {"train_loss": -40.94977569580078, "global_step": 209870, "epoch": 1734} {"train_loss": -42.71394729614258, "global_step": 209871, "epoch": 1734} {"train_loss": -41.47597885131836, "global_step": 209872, "epoch": 1734} {"train_loss": -40.786903381347656, "global_step": 209873, "epoch": 1734} {"train_loss": -40.771453857421875, "global_step": 209874, "epoch": 1734} {"train_loss": -41.199153900146484, "global_step": 209875, "epoch": 1734} {"train_loss": -42.327850341796875, "global_step": 209876, "epoch": 1734} {"train_loss": -41.56703186035156, "global_step": 209877, "epoch": 1734} {"train_loss": -41.851226806640625, "global_step": 209878, "epoch": 1734} {"train_loss": -41.020721435546875, "global_step": 209879, "epoch": 1734} {"train_loss": -42.05621337890625, "global_step": 209880, "epoch": 1734} {"train_loss": -41.652748107910156, "global_step": 209881, "epoch": 1734} {"train_loss": -41.27607345581055, "global_step": 209882, "epoch": 1734} {"train_loss": -41.83406448364258, "global_step": 209883, "epoch": 1734} {"train_loss": -40.99809646606445, "global_step": 209884, "epoch": 1734} {"train_loss": -41.999664306640625, "global_step": 209885, "epoch": 1734} {"train_loss": -41.583656311035156, "global_step": 209886, "epoch": 1734} {"train_loss": -42.2119255065918, "global_step": 209887, "epoch": 1734} {"train_loss": -41.97944259643555, "global_step": 209888, "epoch": 1734} {"train_loss": -41.9366455078125, "global_step": 209889, "epoch": 1734} {"train_loss": -41.54627227783203, "global_step": 209890, "epoch": 1734} {"train_loss": -42.89793395996094, "global_step": 209891, "epoch": 1734} {"train_loss": -42.64908981323242, "global_step": 209892, "epoch": 1734} {"train_loss": -41.91912078857422, "global_step": 209893, "epoch": 1734} {"train_loss": -42.755943298339844, "global_step": 209894, "epoch": 1734} {"train_loss": -42.7345085144043, "global_step": 209895, "epoch": 1734} {"train_loss": -41.88932418823242, "global_step": 209896, "epoch": 1734} {"train_loss": -42.69111251831055, "global_step": 209897, "epoch": 1734} {"train_loss": -42.4478874206543, "global_step": 209898, "epoch": 1734} {"train_loss": -41.88230514526367, "global_step": 209899, "epoch": 1734} {"train_loss": -42.25468826293945, "global_step": 209900, "epoch": 1734} {"train_loss": -41.55401611328125, "global_step": 209901, "epoch": 1734} {"train_loss": -42.33934020996094, "global_step": 209902, "epoch": 1734} {"train_loss": -42.31281280517578, "global_step": 209903, "epoch": 1734} {"train_loss": -41.99591827392578, "global_step": 209904, "epoch": 1734} {"train_loss": -40.00761795043945, "global_step": 209905, "epoch": 1734} {"train_loss": -39.49715042114258, "global_step": 209906, "epoch": 1734} {"train_loss": -40.426326751708984, "global_step": 209907, "epoch": 1734} {"train_loss": -41.795570373535156, "global_step": 209908, "epoch": 1734} {"train_loss": -41.755706787109375, "global_step": 209909, "epoch": 1734} {"train_loss": -41.82545471191406, "global_step": 209910, "epoch": 1734} {"train_loss": -42.35810089111328, "global_step": 209911, "epoch": 1734} {"train_loss": -42.35969161987305, "global_step": 209912, "epoch": 1734} {"train_loss": -41.945552825927734, "global_step": 209913, "epoch": 1734} {"train_loss": -41.07006072998047, "global_step": 209914, "epoch": 1734} {"train_loss": -42.6320686340332, "global_step": 209915, "epoch": 1734} {"train_loss": -41.89920425415039, "global_step": 209916, "epoch": 1734} {"train_loss": -41.708778381347656, "global_step": 209917, "epoch": 1734} {"train_loss": -41.99827194213867, "global_step": 209918, "epoch": 1734} {"train_loss": -41.699588775634766, "global_step": 209919, "epoch": 1734} {"train_loss": -39.97509765625, "global_step": 209920, "epoch": 1734} {"train_loss": -39.434112548828125, "global_step": 209921, "epoch": 1734} {"train_loss": -40.388648986816406, "global_step": 209922, "epoch": 1734} {"train_loss": -39.258609771728516, "global_step": 209923, "epoch": 1734} {"train_loss": -39.58189010620117, "global_step": 209924, "epoch": 1734} {"train_loss": -41.0921630859375, "global_step": 209925, "epoch": 1734} {"train_loss": -38.76108169555664, "global_step": 209926, "epoch": 1734} {"train_loss": -41.79023361206055, "global_step": 209927, "epoch": 1734} {"train_loss": -40.0319938659668, "global_step": 209928, "epoch": 1734} {"train_loss": -39.89811325073242, "global_step": 209929, "epoch": 1734} {"train_loss": -41.436214447021484, "global_step": 209930, "epoch": 1734} {"train_loss": -38.64308547973633, "global_step": 209931, "epoch": 1734} {"train_loss": -39.30548095703125, "global_step": 209932, "epoch": 1734} {"train_loss": -41.50065612792969, "global_step": 209933, "epoch": 1734} {"train_loss": -41.354217340138334, "global_step": 209934, "epoch": 1734, "val_loss": 2475815.0} {"train_loss": -40.281463623046875, "global_step": 209935, "epoch": 1735} {"train_loss": -38.89263916015625, "global_step": 209936, "epoch": 1735} {"train_loss": -40.06953048706055, "global_step": 209937, "epoch": 1735} {"train_loss": -39.635955810546875, "global_step": 209938, "epoch": 1735} {"train_loss": -40.64780807495117, "global_step": 209939, "epoch": 1735} {"train_loss": -40.16400146484375, "global_step": 209940, "epoch": 1735} {"train_loss": -39.87533187866211, "global_step": 209941, "epoch": 1735} {"train_loss": -40.74335479736328, "global_step": 209942, "epoch": 1735} {"train_loss": -39.88570785522461, "global_step": 209943, "epoch": 1735} {"train_loss": -40.45662307739258, "global_step": 209944, "epoch": 1735} {"train_loss": -39.2927131652832, "global_step": 209945, "epoch": 1735} {"train_loss": -40.642730712890625, "global_step": 209946, "epoch": 1735} {"train_loss": -39.4751091003418, "global_step": 209947, "epoch": 1735} {"train_loss": -41.977413177490234, "global_step": 209948, "epoch": 1735} {"train_loss": -38.2496223449707, "global_step": 209949, "epoch": 1735} {"train_loss": -40.178829193115234, "global_step": 209950, "epoch": 1735} {"train_loss": -39.63649368286133, "global_step": 209951, "epoch": 1735} {"train_loss": -40.27350997924805, "global_step": 209952, "epoch": 1735} {"train_loss": -39.108882904052734, "global_step": 209953, "epoch": 1735} {"train_loss": -40.38395309448242, "global_step": 209954, "epoch": 1735} {"train_loss": -40.15286636352539, "global_step": 209955, "epoch": 1735} {"train_loss": -38.15035629272461, "global_step": 209956, "epoch": 1735} {"train_loss": -34.20933532714844, "global_step": 209957, "epoch": 1735} {"train_loss": -37.640480041503906, "global_step": 209958, "epoch": 1735} {"train_loss": -39.7335090637207, "global_step": 209959, "epoch": 1735} {"train_loss": -37.606319427490234, "global_step": 209960, "epoch": 1735} {"train_loss": -40.96574783325195, "global_step": 209961, "epoch": 1735} {"train_loss": -40.36878204345703, "global_step": 209962, "epoch": 1735} {"train_loss": -40.75627517700195, "global_step": 209963, "epoch": 1735} {"train_loss": -39.57080078125, "global_step": 209964, "epoch": 1735} {"train_loss": -40.430335998535156, "global_step": 209965, "epoch": 1735} {"train_loss": -40.356327056884766, "global_step": 209966, "epoch": 1735} {"train_loss": -39.725242614746094, "global_step": 209967, "epoch": 1735} {"train_loss": -40.83070755004883, "global_step": 209968, "epoch": 1735} {"train_loss": -40.39390182495117, "global_step": 209969, "epoch": 1735} {"train_loss": -41.22216796875, "global_step": 209970, "epoch": 1735} {"train_loss": -40.65195846557617, "global_step": 209971, "epoch": 1735} {"train_loss": -40.47285079956055, "global_step": 209972, "epoch": 1735} {"train_loss": -40.799861907958984, "global_step": 209973, "epoch": 1735} {"train_loss": -36.34968185424805, "global_step": 209974, "epoch": 1735} {"train_loss": -41.890052795410156, "global_step": 209975, "epoch": 1735} {"train_loss": -41.823177337646484, "global_step": 209976, "epoch": 1735} {"train_loss": -41.46345138549805, "global_step": 209977, "epoch": 1735} {"train_loss": -41.467220306396484, "global_step": 209978, "epoch": 1735} {"train_loss": -40.59185791015625, "global_step": 209979, "epoch": 1735} {"train_loss": -42.2374153137207, "global_step": 209980, "epoch": 1735} {"train_loss": -40.58175277709961, "global_step": 209981, "epoch": 1735} {"train_loss": -41.098934173583984, "global_step": 209982, "epoch": 1735} {"train_loss": -41.562103271484375, "global_step": 209983, "epoch": 1735} {"train_loss": -41.713253021240234, "global_step": 209984, "epoch": 1735} {"train_loss": -39.2346305847168, "global_step": 209985, "epoch": 1735} {"train_loss": -41.338966369628906, "global_step": 209986, "epoch": 1735} {"train_loss": -41.36500549316406, "global_step": 209987, "epoch": 1735} {"train_loss": -40.657737731933594, "global_step": 209988, "epoch": 1735} {"train_loss": -42.3773307800293, "global_step": 209989, "epoch": 1735} {"train_loss": -41.9025764465332, "global_step": 209990, "epoch": 1735} {"train_loss": -42.057735443115234, "global_step": 209991, "epoch": 1735} {"train_loss": -41.53998947143555, "global_step": 209992, "epoch": 1735} {"train_loss": -41.658653259277344, "global_step": 209993, "epoch": 1735} {"train_loss": -42.19065475463867, "global_step": 209994, "epoch": 1735} {"train_loss": -41.86960983276367, "global_step": 209995, "epoch": 1735} {"train_loss": -40.961021423339844, "global_step": 209996, "epoch": 1735} {"train_loss": -41.960601806640625, "global_step": 209997, "epoch": 1735} {"train_loss": -42.125579833984375, "global_step": 209998, "epoch": 1735} {"train_loss": -41.44721221923828, "global_step": 209999, "epoch": 1735} {"train_loss": -42.392608642578125, "global_step": 210000, "epoch": 1735} {"train_loss": -40.67837142944336, "global_step": 210001, "epoch": 1735} {"train_loss": -41.16981506347656, "global_step": 210002, "epoch": 1735} {"train_loss": -41.74018478393555, "global_step": 210003, "epoch": 1735} {"train_loss": -42.49683380126953, "global_step": 210004, "epoch": 1735} {"train_loss": -41.685943603515625, "global_step": 210005, "epoch": 1735} {"train_loss": -41.43992614746094, "global_step": 210006, "epoch": 1735} {"train_loss": -40.03076934814453, "global_step": 210007, "epoch": 1735} {"train_loss": -42.13036346435547, "global_step": 210008, "epoch": 1735} {"train_loss": -41.673954010009766, "global_step": 210009, "epoch": 1735} {"train_loss": -41.785850524902344, "global_step": 210010, "epoch": 1735} {"train_loss": -42.02312088012695, "global_step": 210011, "epoch": 1735} {"train_loss": -42.144439697265625, "global_step": 210012, "epoch": 1735} {"train_loss": -42.588836669921875, "global_step": 210013, "epoch": 1735} {"train_loss": -42.49434280395508, "global_step": 210014, "epoch": 1735} {"train_loss": -42.44419860839844, "global_step": 210015, "epoch": 1735} {"train_loss": -42.0235710144043, "global_step": 210016, "epoch": 1735} {"train_loss": -42.28948974609375, "global_step": 210017, "epoch": 1735} {"train_loss": -42.02877426147461, "global_step": 210018, "epoch": 1735} {"train_loss": -42.2899284362793, "global_step": 210019, "epoch": 1735} {"train_loss": -42.28638458251953, "global_step": 210020, "epoch": 1735} {"train_loss": -41.86727523803711, "global_step": 210021, "epoch": 1735} {"train_loss": -42.243385314941406, "global_step": 210022, "epoch": 1735} {"train_loss": -42.03434753417969, "global_step": 210023, "epoch": 1735} {"train_loss": -42.16300582885742, "global_step": 210024, "epoch": 1735} {"train_loss": -42.32206344604492, "global_step": 210025, "epoch": 1735} {"train_loss": -41.01126480102539, "global_step": 210026, "epoch": 1735} {"train_loss": -42.80085372924805, "global_step": 210027, "epoch": 1735} {"train_loss": -42.488548278808594, "global_step": 210028, "epoch": 1735} {"train_loss": -42.563533782958984, "global_step": 210029, "epoch": 1735} {"train_loss": -42.438140869140625, "global_step": 210030, "epoch": 1735} {"train_loss": -42.59550857543945, "global_step": 210031, "epoch": 1735} {"train_loss": -42.31725311279297, "global_step": 210032, "epoch": 1735} {"train_loss": -42.32126998901367, "global_step": 210033, "epoch": 1735} {"train_loss": -41.91549301147461, "global_step": 210034, "epoch": 1735} {"train_loss": -41.93087387084961, "global_step": 210035, "epoch": 1735} {"train_loss": -42.0506706237793, "global_step": 210036, "epoch": 1735} {"train_loss": -42.05723190307617, "global_step": 210037, "epoch": 1735} {"train_loss": -41.44898223876953, "global_step": 210038, "epoch": 1735} {"train_loss": -42.16029739379883, "global_step": 210039, "epoch": 1735} {"train_loss": -41.763790130615234, "global_step": 210040, "epoch": 1735} {"train_loss": -41.280029296875, "global_step": 210041, "epoch": 1735} {"train_loss": -41.036930084228516, "global_step": 210042, "epoch": 1735} {"train_loss": -40.178836822509766, "global_step": 210043, "epoch": 1735} {"train_loss": -39.75276184082031, "global_step": 210044, "epoch": 1735} {"train_loss": -40.910072326660156, "global_step": 210045, "epoch": 1735} {"train_loss": -41.0764045715332, "global_step": 210046, "epoch": 1735} {"train_loss": -39.61438751220703, "global_step": 210047, "epoch": 1735} {"train_loss": -38.323970794677734, "global_step": 210048, "epoch": 1735} {"train_loss": -39.070980072021484, "global_step": 210049, "epoch": 1735} {"train_loss": -40.317230224609375, "global_step": 210050, "epoch": 1735} {"train_loss": -41.48994445800781, "global_step": 210051, "epoch": 1735} {"train_loss": -39.7336311340332, "global_step": 210052, "epoch": 1735} {"train_loss": -40.89265060424805, "global_step": 210053, "epoch": 1735} {"train_loss": -37.67783737182617, "global_step": 210054, "epoch": 1735} {"train_loss": -40.91808823514576, "global_step": 210055, "epoch": 1735, "val_loss": 2547407.25} {"train_loss": -34.5050048828125, "global_step": 210056, "epoch": 1736} {"train_loss": -39.79606246948242, "global_step": 210057, "epoch": 1736} {"train_loss": -36.23057174682617, "global_step": 210058, "epoch": 1736} {"train_loss": -33.89926528930664, "global_step": 210059, "epoch": 1736} {"train_loss": -40.03594207763672, "global_step": 210060, "epoch": 1736} {"train_loss": -37.70499801635742, "global_step": 210061, "epoch": 1736} {"train_loss": -39.77452087402344, "global_step": 210062, "epoch": 1736} {"train_loss": -40.103519439697266, "global_step": 210063, "epoch": 1736} {"train_loss": -37.56623840332031, "global_step": 210064, "epoch": 1736} {"train_loss": -41.1490364074707, "global_step": 210065, "epoch": 1736} {"train_loss": -39.678680419921875, "global_step": 210066, "epoch": 1736} {"train_loss": -39.05769729614258, "global_step": 210067, "epoch": 1736} {"train_loss": -40.1797981262207, "global_step": 210068, "epoch": 1736} {"train_loss": -36.58676528930664, "global_step": 210069, "epoch": 1736} {"train_loss": -40.913787841796875, "global_step": 210070, "epoch": 1736} {"train_loss": -40.83292770385742, "global_step": 210071, "epoch": 1736} {"train_loss": -41.786338806152344, "global_step": 210072, "epoch": 1736} {"train_loss": -40.66947555541992, "global_step": 210073, "epoch": 1736} {"train_loss": -41.83848190307617, "global_step": 210074, "epoch": 1736} {"train_loss": -40.80745315551758, "global_step": 210075, "epoch": 1736} {"train_loss": -41.17231750488281, "global_step": 210076, "epoch": 1736} {"train_loss": -40.66048049926758, "global_step": 210077, "epoch": 1736} {"train_loss": -40.54147720336914, "global_step": 210078, "epoch": 1736} {"train_loss": -40.596988677978516, "global_step": 210079, "epoch": 1736} {"train_loss": -40.352149963378906, "global_step": 210080, "epoch": 1736} {"train_loss": -40.687599182128906, "global_step": 210081, "epoch": 1736} {"train_loss": -41.15443801879883, "global_step": 210082, "epoch": 1736} {"train_loss": -41.31462860107422, "global_step": 210083, "epoch": 1736} {"train_loss": -41.275390625, "global_step": 210084, "epoch": 1736} {"train_loss": -41.22669219970703, "global_step": 210085, "epoch": 1736} {"train_loss": -41.335723876953125, "global_step": 210086, "epoch": 1736} {"train_loss": -37.357330322265625, "global_step": 210087, "epoch": 1736} {"train_loss": -36.79897689819336, "global_step": 210088, "epoch": 1736} {"train_loss": -40.4367790222168, "global_step": 210089, "epoch": 1736} {"train_loss": -40.79902648925781, "global_step": 210090, "epoch": 1736} {"train_loss": -41.18607711791992, "global_step": 210091, "epoch": 1736} {"train_loss": -40.7415771484375, "global_step": 210092, "epoch": 1736} {"train_loss": -40.605018615722656, "global_step": 210093, "epoch": 1736} {"train_loss": -40.486358642578125, "global_step": 210094, "epoch": 1736} {"train_loss": -40.8494873046875, "global_step": 210095, "epoch": 1736} {"train_loss": -41.23808288574219, "global_step": 210096, "epoch": 1736} {"train_loss": -38.70806884765625, "global_step": 210097, "epoch": 1736} {"train_loss": -40.7545051574707, "global_step": 210098, "epoch": 1736} {"train_loss": -41.2076530456543, "global_step": 210099, "epoch": 1736} {"train_loss": -40.75883102416992, "global_step": 210100, "epoch": 1736} {"train_loss": -38.85896682739258, "global_step": 210101, "epoch": 1736} {"train_loss": -39.81454086303711, "global_step": 210102, "epoch": 1736} {"train_loss": -40.62135314941406, "global_step": 210103, "epoch": 1736} {"train_loss": -41.03945541381836, "global_step": 210104, "epoch": 1736} {"train_loss": -41.015785217285156, "global_step": 210105, "epoch": 1736} {"train_loss": -38.996917724609375, "global_step": 210106, "epoch": 1736} {"train_loss": -40.94325637817383, "global_step": 210107, "epoch": 1736} {"train_loss": -40.72391891479492, "global_step": 210108, "epoch": 1736} {"train_loss": -40.288692474365234, "global_step": 210109, "epoch": 1736} {"train_loss": -41.165279388427734, "global_step": 210110, "epoch": 1736} {"train_loss": -38.6683349609375, "global_step": 210111, "epoch": 1736} {"train_loss": -40.1557731628418, "global_step": 210112, "epoch": 1736} {"train_loss": -39.21968460083008, "global_step": 210113, "epoch": 1736} {"train_loss": -41.549072265625, "global_step": 210114, "epoch": 1736} {"train_loss": -41.3492431640625, "global_step": 210115, "epoch": 1736} {"train_loss": -40.841392517089844, "global_step": 210116, "epoch": 1736} {"train_loss": -41.49708938598633, "global_step": 210117, "epoch": 1736} {"train_loss": -40.739540100097656, "global_step": 210118, "epoch": 1736} {"train_loss": -41.026573181152344, "global_step": 210119, "epoch": 1736} {"train_loss": -40.637088775634766, "global_step": 210120, "epoch": 1736} {"train_loss": -41.66425704956055, "global_step": 210121, "epoch": 1736} {"train_loss": -40.45119857788086, "global_step": 210122, "epoch": 1736} {"train_loss": -41.6563835144043, "global_step": 210123, "epoch": 1736} {"train_loss": -41.91020965576172, "global_step": 210124, "epoch": 1736} {"train_loss": -40.57495880126953, "global_step": 210125, "epoch": 1736} {"train_loss": -41.88212203979492, "global_step": 210126, "epoch": 1736} {"train_loss": -41.08746337890625, "global_step": 210127, "epoch": 1736} {"train_loss": -41.89373779296875, "global_step": 210128, "epoch": 1736} {"train_loss": -41.88734817504883, "global_step": 210129, "epoch": 1736} {"train_loss": -41.06477737426758, "global_step": 210130, "epoch": 1736} {"train_loss": -42.36849594116211, "global_step": 210131, "epoch": 1736} {"train_loss": -41.23380661010742, "global_step": 210132, "epoch": 1736} {"train_loss": -41.92607498168945, "global_step": 210133, "epoch": 1736} {"train_loss": -41.06528854370117, "global_step": 210134, "epoch": 1736} {"train_loss": -39.615264892578125, "global_step": 210135, "epoch": 1736} {"train_loss": -41.378929138183594, "global_step": 210136, "epoch": 1736} {"train_loss": -40.45093536376953, "global_step": 210137, "epoch": 1736} {"train_loss": -41.85043716430664, "global_step": 210138, "epoch": 1736} {"train_loss": -41.544532775878906, "global_step": 210139, "epoch": 1736} {"train_loss": -42.06191635131836, "global_step": 210140, "epoch": 1736} {"train_loss": -43.0667724609375, "global_step": 210141, "epoch": 1736} {"train_loss": -40.6530647277832, "global_step": 210142, "epoch": 1736} {"train_loss": -42.09120559692383, "global_step": 210143, "epoch": 1736} {"train_loss": -42.65576934814453, "global_step": 210144, "epoch": 1736} {"train_loss": -42.19914245605469, "global_step": 210145, "epoch": 1736} {"train_loss": -42.499755859375, "global_step": 210146, "epoch": 1736} {"train_loss": -41.35466384887695, "global_step": 210147, "epoch": 1736} {"train_loss": -41.89502716064453, "global_step": 210148, "epoch": 1736} {"train_loss": -42.24970626831055, "global_step": 210149, "epoch": 1736} {"train_loss": -42.30902099609375, "global_step": 210150, "epoch": 1736} {"train_loss": -41.570858001708984, "global_step": 210151, "epoch": 1736} {"train_loss": -40.79334259033203, "global_step": 210152, "epoch": 1736} {"train_loss": -41.18392562866211, "global_step": 210153, "epoch": 1736} {"train_loss": -41.80092239379883, "global_step": 210154, "epoch": 1736} {"train_loss": -42.07514572143555, "global_step": 210155, "epoch": 1736} {"train_loss": -41.54473114013672, "global_step": 210156, "epoch": 1736} {"train_loss": -40.67161178588867, "global_step": 210157, "epoch": 1736} {"train_loss": -41.3400993347168, "global_step": 210158, "epoch": 1736} {"train_loss": -39.05208969116211, "global_step": 210159, "epoch": 1736} {"train_loss": -40.5629997253418, "global_step": 210160, "epoch": 1736} {"train_loss": -39.9544563293457, "global_step": 210161, "epoch": 1736} {"train_loss": -39.74580764770508, "global_step": 210162, "epoch": 1736} {"train_loss": -41.5009880065918, "global_step": 210163, "epoch": 1736} {"train_loss": -41.17121505737305, "global_step": 210164, "epoch": 1736} {"train_loss": -42.60622024536133, "global_step": 210165, "epoch": 1736} {"train_loss": -41.11372375488281, "global_step": 210166, "epoch": 1736} {"train_loss": -41.77537155151367, "global_step": 210167, "epoch": 1736} {"train_loss": -41.200843811035156, "global_step": 210168, "epoch": 1736} {"train_loss": -41.31422805786133, "global_step": 210169, "epoch": 1736} {"train_loss": -42.42741012573242, "global_step": 210170, "epoch": 1736} {"train_loss": -39.3023567199707, "global_step": 210171, "epoch": 1736} {"train_loss": -41.524383544921875, "global_step": 210172, "epoch": 1736} {"train_loss": -38.416622161865234, "global_step": 210173, "epoch": 1736} {"train_loss": -41.95716094970703, "global_step": 210174, "epoch": 1736} {"train_loss": -42.03792953491211, "global_step": 210175, "epoch": 1736} {"train_loss": -40.664483030965506, "global_step": 210176, "epoch": 1736, "val_loss": 2611404.25} {"train_loss": -40.215572357177734, "global_step": 210177, "epoch": 1737} {"train_loss": -39.78695297241211, "global_step": 210178, "epoch": 1737} {"train_loss": -41.679927825927734, "global_step": 210179, "epoch": 1737} {"train_loss": -39.85153579711914, "global_step": 210180, "epoch": 1737} {"train_loss": -39.23720932006836, "global_step": 210181, "epoch": 1737} {"train_loss": -39.87907028198242, "global_step": 210182, "epoch": 1737} {"train_loss": -40.4635124206543, "global_step": 210183, "epoch": 1737} {"train_loss": -37.867034912109375, "global_step": 210184, "epoch": 1737} {"train_loss": -40.752601623535156, "global_step": 210185, "epoch": 1737} {"train_loss": -41.08699417114258, "global_step": 210186, "epoch": 1737} {"train_loss": -39.6955451965332, "global_step": 210187, "epoch": 1737} {"train_loss": -40.976318359375, "global_step": 210188, "epoch": 1737} {"train_loss": -40.46089553833008, "global_step": 210189, "epoch": 1737} {"train_loss": -40.951820373535156, "global_step": 210190, "epoch": 1737} {"train_loss": -39.7365837097168, "global_step": 210191, "epoch": 1737} {"train_loss": -39.90042495727539, "global_step": 210192, "epoch": 1737} {"train_loss": -41.59804916381836, "global_step": 210193, "epoch": 1737} {"train_loss": -39.8936767578125, "global_step": 210194, "epoch": 1737} {"train_loss": -39.04103469848633, "global_step": 210195, "epoch": 1737} {"train_loss": -41.03096008300781, "global_step": 210196, "epoch": 1737} {"train_loss": -41.60530471801758, "global_step": 210197, "epoch": 1737} {"train_loss": -32.132232666015625, "global_step": 210198, "epoch": 1737} {"train_loss": -41.330997467041016, "global_step": 210199, "epoch": 1737} {"train_loss": -40.725921630859375, "global_step": 210200, "epoch": 1737} {"train_loss": -40.59110641479492, "global_step": 210201, "epoch": 1737} {"train_loss": -40.981319427490234, "global_step": 210202, "epoch": 1737} {"train_loss": -40.64980697631836, "global_step": 210203, "epoch": 1737} {"train_loss": -41.23426055908203, "global_step": 210204, "epoch": 1737} {"train_loss": -42.32853317260742, "global_step": 210205, "epoch": 1737} {"train_loss": -39.892822265625, "global_step": 210206, "epoch": 1737} {"train_loss": -40.07044219970703, "global_step": 210207, "epoch": 1737} {"train_loss": -37.297847747802734, "global_step": 210208, "epoch": 1737} {"train_loss": -38.309051513671875, "global_step": 210209, "epoch": 1737} {"train_loss": -40.920345306396484, "global_step": 210210, "epoch": 1737} {"train_loss": -40.652992248535156, "global_step": 210211, "epoch": 1737} {"train_loss": -40.5391845703125, "global_step": 210212, "epoch": 1737} {"train_loss": -42.262935638427734, "global_step": 210213, "epoch": 1737} {"train_loss": -39.53102493286133, "global_step": 210214, "epoch": 1737} {"train_loss": -40.9947624206543, "global_step": 210215, "epoch": 1737} {"train_loss": -38.90224838256836, "global_step": 210216, "epoch": 1737} {"train_loss": -39.95058822631836, "global_step": 210217, "epoch": 1737} {"train_loss": -39.33848190307617, "global_step": 210218, "epoch": 1737} {"train_loss": -39.095855712890625, "global_step": 210219, "epoch": 1737} {"train_loss": -40.1407356262207, "global_step": 210220, "epoch": 1737} {"train_loss": -41.57755661010742, "global_step": 210221, "epoch": 1737} {"train_loss": -40.85816192626953, "global_step": 210222, "epoch": 1737} {"train_loss": -41.64502716064453, "global_step": 210223, "epoch": 1737} {"train_loss": -41.2074089050293, "global_step": 210224, "epoch": 1737} {"train_loss": -33.52723693847656, "global_step": 210225, "epoch": 1737} {"train_loss": -38.40126419067383, "global_step": 210226, "epoch": 1737} {"train_loss": -39.615264892578125, "global_step": 210227, "epoch": 1737} {"train_loss": -41.26749801635742, "global_step": 210228, "epoch": 1737} {"train_loss": -40.72679901123047, "global_step": 210229, "epoch": 1737} {"train_loss": -40.52695846557617, "global_step": 210230, "epoch": 1737} {"train_loss": -40.26810836791992, "global_step": 210231, "epoch": 1737} {"train_loss": -39.950355529785156, "global_step": 210232, "epoch": 1737} {"train_loss": -39.279884338378906, "global_step": 210233, "epoch": 1737} {"train_loss": -36.42843246459961, "global_step": 210234, "epoch": 1737} {"train_loss": -39.57511901855469, "global_step": 210235, "epoch": 1737} {"train_loss": -34.658843994140625, "global_step": 210236, "epoch": 1737} {"train_loss": -39.95646286010742, "global_step": 210237, "epoch": 1737} {"train_loss": -41.132965087890625, "global_step": 210238, "epoch": 1737} {"train_loss": -37.36733627319336, "global_step": 210239, "epoch": 1737} {"train_loss": -31.753278732299805, "global_step": 210240, "epoch": 1737} {"train_loss": -39.827308654785156, "global_step": 210241, "epoch": 1737} {"train_loss": -39.34957504272461, "global_step": 210242, "epoch": 1737} {"train_loss": -39.718360900878906, "global_step": 210243, "epoch": 1737} {"train_loss": -37.99732208251953, "global_step": 210244, "epoch": 1737} {"train_loss": -38.25641632080078, "global_step": 210245, "epoch": 1737} {"train_loss": -37.768714904785156, "global_step": 210246, "epoch": 1737} {"train_loss": -40.46267318725586, "global_step": 210247, "epoch": 1737} {"train_loss": -34.57312774658203, "global_step": 210248, "epoch": 1737} {"train_loss": -37.386714935302734, "global_step": 210249, "epoch": 1737} {"train_loss": -40.25749969482422, "global_step": 210250, "epoch": 1737} {"train_loss": -35.01950454711914, "global_step": 210251, "epoch": 1737} {"train_loss": -40.28308868408203, "global_step": 210252, "epoch": 1737} {"train_loss": -36.919708251953125, "global_step": 210253, "epoch": 1737} {"train_loss": -40.62217712402344, "global_step": 210254, "epoch": 1737} {"train_loss": -40.199886322021484, "global_step": 210255, "epoch": 1737} {"train_loss": -39.978092193603516, "global_step": 210256, "epoch": 1737} {"train_loss": -38.476898193359375, "global_step": 210257, "epoch": 1737} {"train_loss": -40.309932708740234, "global_step": 210258, "epoch": 1737} {"train_loss": -40.2171630859375, "global_step": 210259, "epoch": 1737} {"train_loss": -39.143192291259766, "global_step": 210260, "epoch": 1737} {"train_loss": -38.14583206176758, "global_step": 210261, "epoch": 1737} {"train_loss": -39.79113006591797, "global_step": 210262, "epoch": 1737} {"train_loss": -39.65570068359375, "global_step": 210263, "epoch": 1737} {"train_loss": -39.22885513305664, "global_step": 210264, "epoch": 1737} {"train_loss": -40.66057586669922, "global_step": 210265, "epoch": 1737} {"train_loss": -39.075599670410156, "global_step": 210266, "epoch": 1737} {"train_loss": -40.094078063964844, "global_step": 210267, "epoch": 1737} {"train_loss": -39.92102813720703, "global_step": 210268, "epoch": 1737} {"train_loss": -39.71477508544922, "global_step": 210269, "epoch": 1737} {"train_loss": -40.036415100097656, "global_step": 210270, "epoch": 1737} {"train_loss": -40.36138916015625, "global_step": 210271, "epoch": 1737} {"train_loss": -40.51026153564453, "global_step": 210272, "epoch": 1737} {"train_loss": -39.30560302734375, "global_step": 210273, "epoch": 1737} {"train_loss": -39.33271408081055, "global_step": 210274, "epoch": 1737} {"train_loss": -39.569576263427734, "global_step": 210275, "epoch": 1737} {"train_loss": -40.41676712036133, "global_step": 210276, "epoch": 1737} {"train_loss": -40.24026107788086, "global_step": 210277, "epoch": 1737} {"train_loss": -40.638179779052734, "global_step": 210278, "epoch": 1737} {"train_loss": -40.16579055786133, "global_step": 210279, "epoch": 1737} {"train_loss": -40.697025299072266, "global_step": 210280, "epoch": 1737} {"train_loss": -39.37929916381836, "global_step": 210281, "epoch": 1737} {"train_loss": -37.090206146240234, "global_step": 210282, "epoch": 1737} {"train_loss": -41.1956901550293, "global_step": 210283, "epoch": 1737} {"train_loss": -40.35327911376953, "global_step": 210284, "epoch": 1737} {"train_loss": -40.693477630615234, "global_step": 210285, "epoch": 1737} {"train_loss": -40.881805419921875, "global_step": 210286, "epoch": 1737} {"train_loss": -37.970001220703125, "global_step": 210287, "epoch": 1737} {"train_loss": -41.08781814575195, "global_step": 210288, "epoch": 1737} {"train_loss": -40.260066986083984, "global_step": 210289, "epoch": 1737} {"train_loss": -40.85841369628906, "global_step": 210290, "epoch": 1737} {"train_loss": -40.57704162597656, "global_step": 210291, "epoch": 1737} {"train_loss": -41.2031364440918, "global_step": 210292, "epoch": 1737} {"train_loss": -40.52598571777344, "global_step": 210293, "epoch": 1737} {"train_loss": -41.34260940551758, "global_step": 210294, "epoch": 1737} {"train_loss": -41.36231994628906, "global_step": 210295, "epoch": 1737} {"train_loss": -41.484310150146484, "global_step": 210296, "epoch": 1737} {"train_loss": -39.7011057167999, "global_step": 210297, "epoch": 1737, "val_loss": 2532939.75} {"train_loss": -40.7063102722168, "global_step": 210298, "epoch": 1738} {"train_loss": -41.441627502441406, "global_step": 210299, "epoch": 1738} {"train_loss": -41.03272247314453, "global_step": 210300, "epoch": 1738} {"train_loss": -40.79298400878906, "global_step": 210301, "epoch": 1738} {"train_loss": -41.0966911315918, "global_step": 210302, "epoch": 1738} {"train_loss": -41.32542419433594, "global_step": 210303, "epoch": 1738} {"train_loss": -41.95503234863281, "global_step": 210304, "epoch": 1738} {"train_loss": -40.672698974609375, "global_step": 210305, "epoch": 1738} {"train_loss": -38.212284088134766, "global_step": 210306, "epoch": 1738} {"train_loss": -41.27959060668945, "global_step": 210307, "epoch": 1738} {"train_loss": -40.69866943359375, "global_step": 210308, "epoch": 1738} {"train_loss": -41.0374755859375, "global_step": 210309, "epoch": 1738} {"train_loss": -41.76900863647461, "global_step": 210310, "epoch": 1738} {"train_loss": -39.999427795410156, "global_step": 210311, "epoch": 1738} {"train_loss": -41.00627136230469, "global_step": 210312, "epoch": 1738} {"train_loss": -41.38072967529297, "global_step": 210313, "epoch": 1738} {"train_loss": -40.0756950378418, "global_step": 210314, "epoch": 1738} {"train_loss": -41.266273498535156, "global_step": 210315, "epoch": 1738} {"train_loss": -41.70711135864258, "global_step": 210316, "epoch": 1738} {"train_loss": -41.75788879394531, "global_step": 210317, "epoch": 1738} {"train_loss": -41.10319137573242, "global_step": 210318, "epoch": 1738} {"train_loss": -40.255863189697266, "global_step": 210319, "epoch": 1738} {"train_loss": -41.528358459472656, "global_step": 210320, "epoch": 1738} {"train_loss": -41.0911979675293, "global_step": 210321, "epoch": 1738} {"train_loss": -40.89297103881836, "global_step": 210322, "epoch": 1738} {"train_loss": -41.46636962890625, "global_step": 210323, "epoch": 1738} {"train_loss": -41.45753479003906, "global_step": 210324, "epoch": 1738} {"train_loss": -41.580177307128906, "global_step": 210325, "epoch": 1738} {"train_loss": -40.58234786987305, "global_step": 210326, "epoch": 1738} {"train_loss": -40.62566375732422, "global_step": 210327, "epoch": 1738} {"train_loss": -41.637786865234375, "global_step": 210328, "epoch": 1738} {"train_loss": -38.15188217163086, "global_step": 210329, "epoch": 1738} {"train_loss": -41.33364486694336, "global_step": 210330, "epoch": 1738} {"train_loss": -41.041473388671875, "global_step": 210331, "epoch": 1738} {"train_loss": -41.047584533691406, "global_step": 210332, "epoch": 1738} {"train_loss": -41.30841827392578, "global_step": 210333, "epoch": 1738} {"train_loss": -41.92026901245117, "global_step": 210334, "epoch": 1738} {"train_loss": -41.49713134765625, "global_step": 210335, "epoch": 1738} {"train_loss": -42.303932189941406, "global_step": 210336, "epoch": 1738} {"train_loss": -42.10499954223633, "global_step": 210337, "epoch": 1738} {"train_loss": -41.80025863647461, "global_step": 210338, "epoch": 1738} {"train_loss": -41.739437103271484, "global_step": 210339, "epoch": 1738} {"train_loss": -42.161312103271484, "global_step": 210340, "epoch": 1738} {"train_loss": -40.195369720458984, "global_step": 210341, "epoch": 1738} {"train_loss": -42.08106231689453, "global_step": 210342, "epoch": 1738} {"train_loss": -41.18576431274414, "global_step": 210343, "epoch": 1738} {"train_loss": -41.35580825805664, "global_step": 210344, "epoch": 1738} {"train_loss": -41.2927360534668, "global_step": 210345, "epoch": 1738} {"train_loss": -41.802120208740234, "global_step": 210346, "epoch": 1738} {"train_loss": -41.87933349609375, "global_step": 210347, "epoch": 1738} {"train_loss": -41.832008361816406, "global_step": 210348, "epoch": 1738} {"train_loss": -40.14973449707031, "global_step": 210349, "epoch": 1738} {"train_loss": -39.713558197021484, "global_step": 210350, "epoch": 1738} {"train_loss": -41.636505126953125, "global_step": 210351, "epoch": 1738} {"train_loss": -41.67293930053711, "global_step": 210352, "epoch": 1738} {"train_loss": -40.917537689208984, "global_step": 210353, "epoch": 1738} {"train_loss": -40.51438903808594, "global_step": 210354, "epoch": 1738} {"train_loss": -40.5815315246582, "global_step": 210355, "epoch": 1738} {"train_loss": -39.55732345581055, "global_step": 210356, "epoch": 1738} {"train_loss": -39.224830627441406, "global_step": 210357, "epoch": 1738} {"train_loss": -41.4334831237793, "global_step": 210358, "epoch": 1738} {"train_loss": -38.42121124267578, "global_step": 210359, "epoch": 1738} {"train_loss": -37.65788650512695, "global_step": 210360, "epoch": 1738} {"train_loss": -35.83033752441406, "global_step": 210361, "epoch": 1738} {"train_loss": -37.25679397583008, "global_step": 210362, "epoch": 1738} {"train_loss": -40.587894439697266, "global_step": 210363, "epoch": 1738} {"train_loss": -40.86164093017578, "global_step": 210364, "epoch": 1738} {"train_loss": -38.36675262451172, "global_step": 210365, "epoch": 1738} {"train_loss": -39.65172576904297, "global_step": 210366, "epoch": 1738} {"train_loss": -41.39252853393555, "global_step": 210367, "epoch": 1738} {"train_loss": -38.57011795043945, "global_step": 210368, "epoch": 1738} {"train_loss": -40.55651092529297, "global_step": 210369, "epoch": 1738} {"train_loss": -40.79761505126953, "global_step": 210370, "epoch": 1738} {"train_loss": -38.011146545410156, "global_step": 210371, "epoch": 1738} {"train_loss": -40.352088928222656, "global_step": 210372, "epoch": 1738} {"train_loss": -41.432064056396484, "global_step": 210373, "epoch": 1738} {"train_loss": -38.491004943847656, "global_step": 210374, "epoch": 1738} {"train_loss": -40.67568588256836, "global_step": 210375, "epoch": 1738} {"train_loss": -40.51700973510742, "global_step": 210376, "epoch": 1738} {"train_loss": -41.325660705566406, "global_step": 210377, "epoch": 1738} {"train_loss": -40.88666534423828, "global_step": 210378, "epoch": 1738} {"train_loss": -40.34357833862305, "global_step": 210379, "epoch": 1738} {"train_loss": -41.99274826049805, "global_step": 210380, "epoch": 1738} {"train_loss": -41.41822814941406, "global_step": 210381, "epoch": 1738} {"train_loss": -40.77225875854492, "global_step": 210382, "epoch": 1738} {"train_loss": -40.98496627807617, "global_step": 210383, "epoch": 1738} {"train_loss": -40.815155029296875, "global_step": 210384, "epoch": 1738} {"train_loss": -40.674678802490234, "global_step": 210385, "epoch": 1738} {"train_loss": -41.376129150390625, "global_step": 210386, "epoch": 1738} {"train_loss": -41.416725158691406, "global_step": 210387, "epoch": 1738} {"train_loss": -41.03945541381836, "global_step": 210388, "epoch": 1738} {"train_loss": -41.2030143737793, "global_step": 210389, "epoch": 1738} {"train_loss": -40.46445083618164, "global_step": 210390, "epoch": 1738} {"train_loss": -41.25033950805664, "global_step": 210391, "epoch": 1738} {"train_loss": -40.037506103515625, "global_step": 210392, "epoch": 1738} {"train_loss": -40.852821350097656, "global_step": 210393, "epoch": 1738} {"train_loss": -41.209754943847656, "global_step": 210394, "epoch": 1738} {"train_loss": -40.494537353515625, "global_step": 210395, "epoch": 1738} {"train_loss": -41.8156852722168, "global_step": 210396, "epoch": 1738} {"train_loss": -40.73142623901367, "global_step": 210397, "epoch": 1738} {"train_loss": -41.83268356323242, "global_step": 210398, "epoch": 1738} {"train_loss": -41.2224235534668, "global_step": 210399, "epoch": 1738} {"train_loss": -41.250545501708984, "global_step": 210400, "epoch": 1738} {"train_loss": -39.725547790527344, "global_step": 210401, "epoch": 1738} {"train_loss": -41.64208221435547, "global_step": 210402, "epoch": 1738} {"train_loss": -41.554649353027344, "global_step": 210403, "epoch": 1738} {"train_loss": -42.141353607177734, "global_step": 210404, "epoch": 1738} {"train_loss": -41.51386260986328, "global_step": 210405, "epoch": 1738} {"train_loss": -39.833927154541016, "global_step": 210406, "epoch": 1738} {"train_loss": -39.8794059753418, "global_step": 210407, "epoch": 1738} {"train_loss": -40.966060638427734, "global_step": 210408, "epoch": 1738} {"train_loss": -38.908748626708984, "global_step": 210409, "epoch": 1738} {"train_loss": -41.74375534057617, "global_step": 210410, "epoch": 1738} {"train_loss": -40.20038986206055, "global_step": 210411, "epoch": 1738} {"train_loss": -40.42721939086914, "global_step": 210412, "epoch": 1738} {"train_loss": -41.3217887878418, "global_step": 210413, "epoch": 1738} {"train_loss": -41.43083572387695, "global_step": 210414, "epoch": 1738} {"train_loss": -38.952720642089844, "global_step": 210415, "epoch": 1738} {"train_loss": -40.0123291015625, "global_step": 210416, "epoch": 1738} {"train_loss": -41.90007400512695, "global_step": 210417, "epoch": 1738} {"train_loss": -40.751609802246094, "global_step": 210418, "epoch": 1738, "val_loss": 2468942.25} {"train_loss": -41.02103805541992, "global_step": 210419, "epoch": 1739} {"train_loss": -42.16138458251953, "global_step": 210420, "epoch": 1739} {"train_loss": -40.70633316040039, "global_step": 210421, "epoch": 1739} {"train_loss": -41.86351776123047, "global_step": 210422, "epoch": 1739} {"train_loss": -40.7331657409668, "global_step": 210423, "epoch": 1739} {"train_loss": -42.08811569213867, "global_step": 210424, "epoch": 1739} {"train_loss": -41.610206604003906, "global_step": 210425, "epoch": 1739} {"train_loss": -41.54618453979492, "global_step": 210426, "epoch": 1739} {"train_loss": -42.135616302490234, "global_step": 210427, "epoch": 1739} {"train_loss": -40.66035842895508, "global_step": 210428, "epoch": 1739} {"train_loss": -42.14276885986328, "global_step": 210429, "epoch": 1739} {"train_loss": -41.28622055053711, "global_step": 210430, "epoch": 1739} {"train_loss": -42.28770065307617, "global_step": 210431, "epoch": 1739} {"train_loss": -41.550716400146484, "global_step": 210432, "epoch": 1739} {"train_loss": -42.22145462036133, "global_step": 210433, "epoch": 1739} {"train_loss": -40.560787200927734, "global_step": 210434, "epoch": 1739} {"train_loss": -41.606895446777344, "global_step": 210435, "epoch": 1739} {"train_loss": -41.690460205078125, "global_step": 210436, "epoch": 1739} {"train_loss": -41.875118255615234, "global_step": 210437, "epoch": 1739} {"train_loss": -41.1381950378418, "global_step": 210438, "epoch": 1739} {"train_loss": -41.48739242553711, "global_step": 210439, "epoch": 1739} {"train_loss": -42.24732208251953, "global_step": 210440, "epoch": 1739} {"train_loss": -42.1256217956543, "global_step": 210441, "epoch": 1739} {"train_loss": -41.64013671875, "global_step": 210442, "epoch": 1739} {"train_loss": -40.11020278930664, "global_step": 210443, "epoch": 1739} {"train_loss": -40.98106002807617, "global_step": 210444, "epoch": 1739} {"train_loss": -40.448814392089844, "global_step": 210445, "epoch": 1739} {"train_loss": -42.115089416503906, "global_step": 210446, "epoch": 1739} {"train_loss": -40.734127044677734, "global_step": 210447, "epoch": 1739} {"train_loss": -41.89716720581055, "global_step": 210448, "epoch": 1739} {"train_loss": -41.61122512817383, "global_step": 210449, "epoch": 1739} {"train_loss": -42.33152770996094, "global_step": 210450, "epoch": 1739} {"train_loss": -42.0909423828125, "global_step": 210451, "epoch": 1739} {"train_loss": -41.53878402709961, "global_step": 210452, "epoch": 1739} {"train_loss": -41.5811653137207, "global_step": 210453, "epoch": 1739} {"train_loss": -41.15906524658203, "global_step": 210454, "epoch": 1739} {"train_loss": -41.32966232299805, "global_step": 210455, "epoch": 1739} {"train_loss": -40.47459030151367, "global_step": 210456, "epoch": 1739} {"train_loss": -41.792537689208984, "global_step": 210457, "epoch": 1739} {"train_loss": -37.344276428222656, "global_step": 210458, "epoch": 1739} {"train_loss": -40.6238899230957, "global_step": 210459, "epoch": 1739} {"train_loss": -41.98113250732422, "global_step": 210460, "epoch": 1739} {"train_loss": -39.15201950073242, "global_step": 210461, "epoch": 1739} {"train_loss": -40.16654586791992, "global_step": 210462, "epoch": 1739} {"train_loss": -39.26665115356445, "global_step": 210463, "epoch": 1739} {"train_loss": -39.126129150390625, "global_step": 210464, "epoch": 1739} {"train_loss": -39.734500885009766, "global_step": 210465, "epoch": 1739} {"train_loss": -41.876068115234375, "global_step": 210466, "epoch": 1739} {"train_loss": -39.23779296875, "global_step": 210467, "epoch": 1739} {"train_loss": -39.833892822265625, "global_step": 210468, "epoch": 1739} {"train_loss": -41.3097038269043, "global_step": 210469, "epoch": 1739} {"train_loss": -41.58765411376953, "global_step": 210470, "epoch": 1739} {"train_loss": -40.30183792114258, "global_step": 210471, "epoch": 1739} {"train_loss": -41.172847747802734, "global_step": 210472, "epoch": 1739} {"train_loss": -36.82688522338867, "global_step": 210473, "epoch": 1739} {"train_loss": -40.859031677246094, "global_step": 210474, "epoch": 1739} {"train_loss": -41.56476974487305, "global_step": 210475, "epoch": 1739} {"train_loss": -41.64860153198242, "global_step": 210476, "epoch": 1739} {"train_loss": -41.56175231933594, "global_step": 210477, "epoch": 1739} {"train_loss": -41.811458587646484, "global_step": 210478, "epoch": 1739} {"train_loss": -41.61423873901367, "global_step": 210479, "epoch": 1739} {"train_loss": -41.505149841308594, "global_step": 210480, "epoch": 1739} {"train_loss": -41.7292594909668, "global_step": 210481, "epoch": 1739} {"train_loss": -41.664302825927734, "global_step": 210482, "epoch": 1739} {"train_loss": -40.93960952758789, "global_step": 210483, "epoch": 1739} {"train_loss": -42.58353805541992, "global_step": 210484, "epoch": 1739} {"train_loss": -40.50004196166992, "global_step": 210485, "epoch": 1739} {"train_loss": -41.32719039916992, "global_step": 210486, "epoch": 1739} {"train_loss": -41.03772735595703, "global_step": 210487, "epoch": 1739} {"train_loss": -40.647743225097656, "global_step": 210488, "epoch": 1739} {"train_loss": -41.7115592956543, "global_step": 210489, "epoch": 1739} {"train_loss": -39.98222732543945, "global_step": 210490, "epoch": 1739} {"train_loss": -41.487342834472656, "global_step": 210491, "epoch": 1739} {"train_loss": -42.03412628173828, "global_step": 210492, "epoch": 1739} {"train_loss": -41.66065979003906, "global_step": 210493, "epoch": 1739} {"train_loss": -40.30205154418945, "global_step": 210494, "epoch": 1739} {"train_loss": -40.27970504760742, "global_step": 210495, "epoch": 1739} {"train_loss": -41.2281494140625, "global_step": 210496, "epoch": 1739} {"train_loss": -40.98507308959961, "global_step": 210497, "epoch": 1739} {"train_loss": -41.359981536865234, "global_step": 210498, "epoch": 1739} {"train_loss": -41.11964797973633, "global_step": 210499, "epoch": 1739} {"train_loss": -41.41400146484375, "global_step": 210500, "epoch": 1739} {"train_loss": -42.18457794189453, "global_step": 210501, "epoch": 1739} {"train_loss": -41.875640869140625, "global_step": 210502, "epoch": 1739} {"train_loss": -41.302337646484375, "global_step": 210503, "epoch": 1739} {"train_loss": -42.396087646484375, "global_step": 210504, "epoch": 1739} {"train_loss": -38.09998321533203, "global_step": 210505, "epoch": 1739} {"train_loss": -41.4508056640625, "global_step": 210506, "epoch": 1739} {"train_loss": -40.472103118896484, "global_step": 210507, "epoch": 1739} {"train_loss": -40.34098815917969, "global_step": 210508, "epoch": 1739} {"train_loss": -41.39115524291992, "global_step": 210509, "epoch": 1739} {"train_loss": -41.36963653564453, "global_step": 210510, "epoch": 1739} {"train_loss": -42.33130645751953, "global_step": 210511, "epoch": 1739} {"train_loss": -41.38709259033203, "global_step": 210512, "epoch": 1739} {"train_loss": -41.56560134887695, "global_step": 210513, "epoch": 1739} {"train_loss": -42.445823669433594, "global_step": 210514, "epoch": 1739} {"train_loss": -41.36525344848633, "global_step": 210515, "epoch": 1739} {"train_loss": -41.3890266418457, "global_step": 210516, "epoch": 1739} {"train_loss": -41.8724479675293, "global_step": 210517, "epoch": 1739} {"train_loss": -41.670623779296875, "global_step": 210518, "epoch": 1739} {"train_loss": -41.63833236694336, "global_step": 210519, "epoch": 1739} {"train_loss": -40.93006896972656, "global_step": 210520, "epoch": 1739} {"train_loss": -41.03471755981445, "global_step": 210521, "epoch": 1739} {"train_loss": -42.154747009277344, "global_step": 210522, "epoch": 1739} {"train_loss": -42.1749267578125, "global_step": 210523, "epoch": 1739} {"train_loss": -42.2464714050293, "global_step": 210524, "epoch": 1739} {"train_loss": -42.051143646240234, "global_step": 210525, "epoch": 1739} {"train_loss": -42.06273651123047, "global_step": 210526, "epoch": 1739} {"train_loss": -42.2735481262207, "global_step": 210527, "epoch": 1739} {"train_loss": -40.88666915893555, "global_step": 210528, "epoch": 1739} {"train_loss": -41.88679122924805, "global_step": 210529, "epoch": 1739} {"train_loss": -41.194183349609375, "global_step": 210530, "epoch": 1739} {"train_loss": -41.54130554199219, "global_step": 210531, "epoch": 1739} {"train_loss": -41.48948669433594, "global_step": 210532, "epoch": 1739} {"train_loss": -40.72243881225586, "global_step": 210533, "epoch": 1739} {"train_loss": -42.040061950683594, "global_step": 210534, "epoch": 1739} {"train_loss": -42.3457145690918, "global_step": 210535, "epoch": 1739} {"train_loss": -41.915184020996094, "global_step": 210536, "epoch": 1739} {"train_loss": -41.64498519897461, "global_step": 210537, "epoch": 1739} {"train_loss": -41.16386032104492, "global_step": 210538, "epoch": 1739} {"train_loss": -41.26315878245456, "global_step": 210539, "epoch": 1739, "val_loss": 2443480.25} {"train_loss": -41.734832763671875, "global_step": 210540, "epoch": 1740} {"train_loss": -42.82954788208008, "global_step": 210541, "epoch": 1740} {"train_loss": -41.4223747253418, "global_step": 210542, "epoch": 1740} {"train_loss": -42.21262741088867, "global_step": 210543, "epoch": 1740} {"train_loss": -41.50978469848633, "global_step": 210544, "epoch": 1740} {"train_loss": -41.780364990234375, "global_step": 210545, "epoch": 1740} {"train_loss": -41.22764587402344, "global_step": 210546, "epoch": 1740} {"train_loss": -41.72296905517578, "global_step": 210547, "epoch": 1740} {"train_loss": -42.211326599121094, "global_step": 210548, "epoch": 1740} {"train_loss": -41.39306640625, "global_step": 210549, "epoch": 1740} {"train_loss": -42.15096664428711, "global_step": 210550, "epoch": 1740} {"train_loss": -41.699371337890625, "global_step": 210551, "epoch": 1740} {"train_loss": -42.01697540283203, "global_step": 210552, "epoch": 1740} {"train_loss": -40.71146774291992, "global_step": 210553, "epoch": 1740} {"train_loss": -42.92579650878906, "global_step": 210554, "epoch": 1740} {"train_loss": -42.707008361816406, "global_step": 210555, "epoch": 1740} {"train_loss": -41.9451904296875, "global_step": 210556, "epoch": 1740} {"train_loss": -41.36914825439453, "global_step": 210557, "epoch": 1740} {"train_loss": -41.6197624206543, "global_step": 210558, "epoch": 1740} {"train_loss": -41.833526611328125, "global_step": 210559, "epoch": 1740} {"train_loss": -39.44294738769531, "global_step": 210560, "epoch": 1740} {"train_loss": -39.20663070678711, "global_step": 210561, "epoch": 1740} {"train_loss": -41.26081466674805, "global_step": 210562, "epoch": 1740} {"train_loss": -41.815555572509766, "global_step": 210563, "epoch": 1740} {"train_loss": -41.62421798706055, "global_step": 210564, "epoch": 1740} {"train_loss": -41.02169418334961, "global_step": 210565, "epoch": 1740} {"train_loss": -40.991180419921875, "global_step": 210566, "epoch": 1740} {"train_loss": -41.20050048828125, "global_step": 210567, "epoch": 1740} {"train_loss": -40.48891830444336, "global_step": 210568, "epoch": 1740} {"train_loss": -40.45831298828125, "global_step": 210569, "epoch": 1740} {"train_loss": -40.932281494140625, "global_step": 210570, "epoch": 1740} {"train_loss": -40.50810623168945, "global_step": 210571, "epoch": 1740} {"train_loss": -41.04032897949219, "global_step": 210572, "epoch": 1740} {"train_loss": -40.66862869262695, "global_step": 210573, "epoch": 1740} {"train_loss": -41.51517868041992, "global_step": 210574, "epoch": 1740} {"train_loss": -40.80392074584961, "global_step": 210575, "epoch": 1740} {"train_loss": -41.024200439453125, "global_step": 210576, "epoch": 1740} {"train_loss": -41.26375961303711, "global_step": 210577, "epoch": 1740} {"train_loss": -41.28178405761719, "global_step": 210578, "epoch": 1740} {"train_loss": -40.75701904296875, "global_step": 210579, "epoch": 1740} {"train_loss": -41.74209976196289, "global_step": 210580, "epoch": 1740} {"train_loss": -41.11916732788086, "global_step": 210581, "epoch": 1740} {"train_loss": -39.74856185913086, "global_step": 210582, "epoch": 1740} {"train_loss": -41.24563217163086, "global_step": 210583, "epoch": 1740} {"train_loss": -42.02825164794922, "global_step": 210584, "epoch": 1740} {"train_loss": -40.73462677001953, "global_step": 210585, "epoch": 1740} {"train_loss": -41.21406173706055, "global_step": 210586, "epoch": 1740} {"train_loss": -41.12762451171875, "global_step": 210587, "epoch": 1740} {"train_loss": -41.15645217895508, "global_step": 210588, "epoch": 1740} {"train_loss": -41.16343307495117, "global_step": 210589, "epoch": 1740} {"train_loss": -40.9330940246582, "global_step": 210590, "epoch": 1740} {"train_loss": -40.65055465698242, "global_step": 210591, "epoch": 1740} {"train_loss": -41.408294677734375, "global_step": 210592, "epoch": 1740} {"train_loss": -41.69458770751953, "global_step": 210593, "epoch": 1740} {"train_loss": -41.16701889038086, "global_step": 210594, "epoch": 1740} {"train_loss": -41.0971794128418, "global_step": 210595, "epoch": 1740} {"train_loss": -42.094696044921875, "global_step": 210596, "epoch": 1740} {"train_loss": -41.016658782958984, "global_step": 210597, "epoch": 1740} {"train_loss": -41.771820068359375, "global_step": 210598, "epoch": 1740} {"train_loss": -40.05350875854492, "global_step": 210599, "epoch": 1740} {"train_loss": -42.19524002075195, "global_step": 210600, "epoch": 1740} {"train_loss": -40.242069244384766, "global_step": 210601, "epoch": 1740} {"train_loss": -40.80086135864258, "global_step": 210602, "epoch": 1740} {"train_loss": -41.70053482055664, "global_step": 210603, "epoch": 1740} {"train_loss": -41.20414352416992, "global_step": 210604, "epoch": 1740} {"train_loss": -42.52076721191406, "global_step": 210605, "epoch": 1740} {"train_loss": -42.07132339477539, "global_step": 210606, "epoch": 1740} {"train_loss": -42.0889778137207, "global_step": 210607, "epoch": 1740} {"train_loss": -42.4380989074707, "global_step": 210608, "epoch": 1740} {"train_loss": -41.399375915527344, "global_step": 210609, "epoch": 1740} {"train_loss": -41.11256790161133, "global_step": 210610, "epoch": 1740} {"train_loss": -42.48323440551758, "global_step": 210611, "epoch": 1740} {"train_loss": -41.77434539794922, "global_step": 210612, "epoch": 1740} {"train_loss": -40.87694549560547, "global_step": 210613, "epoch": 1740} {"train_loss": -42.630714416503906, "global_step": 210614, "epoch": 1740} {"train_loss": -41.758056640625, "global_step": 210615, "epoch": 1740} {"train_loss": -41.91654586791992, "global_step": 210616, "epoch": 1740} {"train_loss": -40.67362594604492, "global_step": 210617, "epoch": 1740} {"train_loss": -41.859283447265625, "global_step": 210618, "epoch": 1740} {"train_loss": -42.76605224609375, "global_step": 210619, "epoch": 1740} {"train_loss": -40.86553955078125, "global_step": 210620, "epoch": 1740} {"train_loss": -42.4642448425293, "global_step": 210621, "epoch": 1740} {"train_loss": -42.55617141723633, "global_step": 210622, "epoch": 1740} {"train_loss": -42.26320266723633, "global_step": 210623, "epoch": 1740} {"train_loss": -41.47664260864258, "global_step": 210624, "epoch": 1740} {"train_loss": -40.2011833190918, "global_step": 210625, "epoch": 1740} {"train_loss": -42.11252212524414, "global_step": 210626, "epoch": 1740} {"train_loss": -41.8282470703125, "global_step": 210627, "epoch": 1740} {"train_loss": -41.69102478027344, "global_step": 210628, "epoch": 1740} {"train_loss": -42.097652435302734, "global_step": 210629, "epoch": 1740} {"train_loss": -41.83990478515625, "global_step": 210630, "epoch": 1740} {"train_loss": -41.93244552612305, "global_step": 210631, "epoch": 1740} {"train_loss": -41.88566207885742, "global_step": 210632, "epoch": 1740} {"train_loss": -39.43079376220703, "global_step": 210633, "epoch": 1740} {"train_loss": -41.118350982666016, "global_step": 210634, "epoch": 1740} {"train_loss": -42.57383346557617, "global_step": 210635, "epoch": 1740} {"train_loss": -40.7695426940918, "global_step": 210636, "epoch": 1740} {"train_loss": -41.00113296508789, "global_step": 210637, "epoch": 1740} {"train_loss": -39.9850959777832, "global_step": 210638, "epoch": 1740} {"train_loss": -39.2395133972168, "global_step": 210639, "epoch": 1740} {"train_loss": -39.77656173706055, "global_step": 210640, "epoch": 1740} {"train_loss": -39.60470962524414, "global_step": 210641, "epoch": 1740} {"train_loss": -38.19758224487305, "global_step": 210642, "epoch": 1740} {"train_loss": -40.18340301513672, "global_step": 210643, "epoch": 1740} {"train_loss": -40.84719467163086, "global_step": 210644, "epoch": 1740} {"train_loss": -38.62856674194336, "global_step": 210645, "epoch": 1740} {"train_loss": -36.912506103515625, "global_step": 210646, "epoch": 1740} {"train_loss": -39.81584167480469, "global_step": 210647, "epoch": 1740} {"train_loss": -39.528114318847656, "global_step": 210648, "epoch": 1740} {"train_loss": -41.345088958740234, "global_step": 210649, "epoch": 1740} {"train_loss": -37.6097412109375, "global_step": 210650, "epoch": 1740} {"train_loss": -39.51900100708008, "global_step": 210651, "epoch": 1740} {"train_loss": -35.385711669921875, "global_step": 210652, "epoch": 1740} {"train_loss": -36.25086212158203, "global_step": 210653, "epoch": 1740} {"train_loss": -39.41445541381836, "global_step": 210654, "epoch": 1740} {"train_loss": -34.58633041381836, "global_step": 210655, "epoch": 1740} {"train_loss": -39.7343864440918, "global_step": 210656, "epoch": 1740} {"train_loss": -37.547542572021484, "global_step": 210657, "epoch": 1740} {"train_loss": -36.83918380737305, "global_step": 210658, "epoch": 1740} {"train_loss": -37.65715408325195, "global_step": 210659, "epoch": 1740} {"train_loss": -40.895021769626084, "global_step": 210660, "epoch": 1740, "val_loss": 2962930.25} {"train_loss": -37.12651062011719, "global_step": 210661, "epoch": 1741} {"train_loss": -40.72595977783203, "global_step": 210662, "epoch": 1741} {"train_loss": -39.25252914428711, "global_step": 210663, "epoch": 1741} {"train_loss": -39.808815002441406, "global_step": 210664, "epoch": 1741} {"train_loss": -38.271209716796875, "global_step": 210665, "epoch": 1741} {"train_loss": -38.470123291015625, "global_step": 210666, "epoch": 1741} {"train_loss": -38.591793060302734, "global_step": 210667, "epoch": 1741} {"train_loss": -39.00362014770508, "global_step": 210668, "epoch": 1741} {"train_loss": -37.80376052856445, "global_step": 210669, "epoch": 1741} {"train_loss": -40.27482986450195, "global_step": 210670, "epoch": 1741} {"train_loss": -39.7326774597168, "global_step": 210671, "epoch": 1741} {"train_loss": -41.07747268676758, "global_step": 210672, "epoch": 1741} {"train_loss": -40.994808197021484, "global_step": 210673, "epoch": 1741} {"train_loss": -38.565731048583984, "global_step": 210674, "epoch": 1741} {"train_loss": -13.923480033874512, "global_step": 210675, "epoch": 1741} {"train_loss": -34.1131706237793, "global_step": 210676, "epoch": 1741} {"train_loss": -34.491756439208984, "global_step": 210677, "epoch": 1741} {"train_loss": -36.4840202331543, "global_step": 210678, "epoch": 1741} {"train_loss": -39.680416107177734, "global_step": 210679, "epoch": 1741} {"train_loss": -36.233245849609375, "global_step": 210680, "epoch": 1741} {"train_loss": -37.8307991027832, "global_step": 210681, "epoch": 1741} {"train_loss": -30.5756893157959, "global_step": 210682, "epoch": 1741} {"train_loss": -34.40747833251953, "global_step": 210683, "epoch": 1741} {"train_loss": -40.017242431640625, "global_step": 210684, "epoch": 1741} {"train_loss": -38.02482986450195, "global_step": 210685, "epoch": 1741} {"train_loss": -39.08095932006836, "global_step": 210686, "epoch": 1741} {"train_loss": -35.96908187866211, "global_step": 210687, "epoch": 1741} {"train_loss": -31.768918991088867, "global_step": 210688, "epoch": 1741} {"train_loss": -39.55427169799805, "global_step": 210689, "epoch": 1741} {"train_loss": -39.43212890625, "global_step": 210690, "epoch": 1741} {"train_loss": -32.448875427246094, "global_step": 210691, "epoch": 1741} {"train_loss": -38.64099884033203, "global_step": 210692, "epoch": 1741} {"train_loss": -40.74760818481445, "global_step": 210693, "epoch": 1741} {"train_loss": -38.119564056396484, "global_step": 210694, "epoch": 1741} {"train_loss": -34.11772537231445, "global_step": 210695, "epoch": 1741} {"train_loss": -39.0091438293457, "global_step": 210696, "epoch": 1741} {"train_loss": -39.2862663269043, "global_step": 210697, "epoch": 1741} {"train_loss": -39.755340576171875, "global_step": 210698, "epoch": 1741} {"train_loss": -37.37367630004883, "global_step": 210699, "epoch": 1741} {"train_loss": -39.685638427734375, "global_step": 210700, "epoch": 1741} {"train_loss": -39.75676345825195, "global_step": 210701, "epoch": 1741} {"train_loss": -39.96015548706055, "global_step": 210702, "epoch": 1741} {"train_loss": -39.283809661865234, "global_step": 210703, "epoch": 1741} {"train_loss": -40.179752349853516, "global_step": 210704, "epoch": 1741} {"train_loss": -40.30361557006836, "global_step": 210705, "epoch": 1741} {"train_loss": -38.786800384521484, "global_step": 210706, "epoch": 1741} {"train_loss": -40.53779983520508, "global_step": 210707, "epoch": 1741} {"train_loss": -39.86762237548828, "global_step": 210708, "epoch": 1741} {"train_loss": -40.030052185058594, "global_step": 210709, "epoch": 1741} {"train_loss": -38.98575210571289, "global_step": 210710, "epoch": 1741} {"train_loss": -40.850276947021484, "global_step": 210711, "epoch": 1741} {"train_loss": -36.2495002746582, "global_step": 210712, "epoch": 1741} {"train_loss": -40.968589782714844, "global_step": 210713, "epoch": 1741} {"train_loss": -39.11941146850586, "global_step": 210714, "epoch": 1741} {"train_loss": -40.56242752075195, "global_step": 210715, "epoch": 1741} {"train_loss": -40.792964935302734, "global_step": 210716, "epoch": 1741} {"train_loss": -40.411781311035156, "global_step": 210717, "epoch": 1741} {"train_loss": -39.519142150878906, "global_step": 210718, "epoch": 1741} {"train_loss": -39.67719268798828, "global_step": 210719, "epoch": 1741} {"train_loss": -39.90000534057617, "global_step": 210720, "epoch": 1741} {"train_loss": -40.13337707519531, "global_step": 210721, "epoch": 1741} {"train_loss": -40.71560287475586, "global_step": 210722, "epoch": 1741} {"train_loss": -40.4340934753418, "global_step": 210723, "epoch": 1741} {"train_loss": -39.76619338989258, "global_step": 210724, "epoch": 1741} {"train_loss": -40.533992767333984, "global_step": 210725, "epoch": 1741} {"train_loss": -41.001102447509766, "global_step": 210726, "epoch": 1741} {"train_loss": -41.24918746948242, "global_step": 210727, "epoch": 1741} {"train_loss": -40.86198043823242, "global_step": 210728, "epoch": 1741} {"train_loss": -41.13236618041992, "global_step": 210729, "epoch": 1741} {"train_loss": -40.61248779296875, "global_step": 210730, "epoch": 1741} {"train_loss": -40.99729537963867, "global_step": 210731, "epoch": 1741} {"train_loss": -41.0744514465332, "global_step": 210732, "epoch": 1741} {"train_loss": -40.29395294189453, "global_step": 210733, "epoch": 1741} {"train_loss": -40.739688873291016, "global_step": 210734, "epoch": 1741} {"train_loss": -40.98270797729492, "global_step": 210735, "epoch": 1741} {"train_loss": -41.451133728027344, "global_step": 210736, "epoch": 1741} {"train_loss": -41.57920455932617, "global_step": 210737, "epoch": 1741} {"train_loss": -41.469478607177734, "global_step": 210738, "epoch": 1741} {"train_loss": -41.41648864746094, "global_step": 210739, "epoch": 1741} {"train_loss": -41.821414947509766, "global_step": 210740, "epoch": 1741} {"train_loss": -41.0606575012207, "global_step": 210741, "epoch": 1741} {"train_loss": -41.41826629638672, "global_step": 210742, "epoch": 1741} {"train_loss": -41.96979904174805, "global_step": 210743, "epoch": 1741} {"train_loss": -41.44343948364258, "global_step": 210744, "epoch": 1741} {"train_loss": -41.82647705078125, "global_step": 210745, "epoch": 1741} {"train_loss": -41.16000747680664, "global_step": 210746, "epoch": 1741} {"train_loss": -41.64036178588867, "global_step": 210747, "epoch": 1741} {"train_loss": -41.46588134765625, "global_step": 210748, "epoch": 1741} {"train_loss": -41.506595611572266, "global_step": 210749, "epoch": 1741} {"train_loss": -41.67599105834961, "global_step": 210750, "epoch": 1741} {"train_loss": -41.77628707885742, "global_step": 210751, "epoch": 1741} {"train_loss": -41.507057189941406, "global_step": 210752, "epoch": 1741} {"train_loss": -41.64066696166992, "global_step": 210753, "epoch": 1741} {"train_loss": -39.79745101928711, "global_step": 210754, "epoch": 1741} {"train_loss": -41.50341796875, "global_step": 210755, "epoch": 1741} {"train_loss": -41.52695846557617, "global_step": 210756, "epoch": 1741} {"train_loss": -41.362850189208984, "global_step": 210757, "epoch": 1741} {"train_loss": -42.00624084472656, "global_step": 210758, "epoch": 1741} {"train_loss": -41.53824996948242, "global_step": 210759, "epoch": 1741} {"train_loss": -42.112823486328125, "global_step": 210760, "epoch": 1741} {"train_loss": -41.94391632080078, "global_step": 210761, "epoch": 1741} {"train_loss": -41.631011962890625, "global_step": 210762, "epoch": 1741} {"train_loss": -42.0910758972168, "global_step": 210763, "epoch": 1741} {"train_loss": -41.91646957397461, "global_step": 210764, "epoch": 1741} {"train_loss": -41.835575103759766, "global_step": 210765, "epoch": 1741} {"train_loss": -41.5651969909668, "global_step": 210766, "epoch": 1741} {"train_loss": -41.671443939208984, "global_step": 210767, "epoch": 1741} {"train_loss": -41.202449798583984, "global_step": 210768, "epoch": 1741} {"train_loss": -42.1440544128418, "global_step": 210769, "epoch": 1741} {"train_loss": -41.69792175292969, "global_step": 210770, "epoch": 1741} {"train_loss": -41.6883430480957, "global_step": 210771, "epoch": 1741} {"train_loss": -41.67403793334961, "global_step": 210772, "epoch": 1741} {"train_loss": -42.23295211791992, "global_step": 210773, "epoch": 1741} {"train_loss": -42.11414337158203, "global_step": 210774, "epoch": 1741} {"train_loss": -40.725189208984375, "global_step": 210775, "epoch": 1741} {"train_loss": -40.4952507019043, "global_step": 210776, "epoch": 1741} {"train_loss": -42.140384674072266, "global_step": 210777, "epoch": 1741} {"train_loss": -42.499446868896484, "global_step": 210778, "epoch": 1741} {"train_loss": -41.83231735229492, "global_step": 210779, "epoch": 1741} {"train_loss": -41.102108001708984, "global_step": 210780, "epoch": 1741} {"train_loss": -39.76122169652261, "global_step": 210781, "epoch": 1741, "val_loss": 2473358.5} {"train_loss": -41.59196090698242, "global_step": 210782, "epoch": 1742} {"train_loss": -41.7356071472168, "global_step": 210783, "epoch": 1742} {"train_loss": -41.842803955078125, "global_step": 210784, "epoch": 1742} {"train_loss": -42.07743453979492, "global_step": 210785, "epoch": 1742} {"train_loss": -42.260231018066406, "global_step": 210786, "epoch": 1742} {"train_loss": -42.162811279296875, "global_step": 210787, "epoch": 1742} {"train_loss": -41.82674026489258, "global_step": 210788, "epoch": 1742} {"train_loss": -41.69450759887695, "global_step": 210789, "epoch": 1742} {"train_loss": -40.42022705078125, "global_step": 210790, "epoch": 1742} {"train_loss": -38.912376403808594, "global_step": 210791, "epoch": 1742} {"train_loss": -34.559043884277344, "global_step": 210792, "epoch": 1742} {"train_loss": -33.36788558959961, "global_step": 210793, "epoch": 1742} {"train_loss": -35.160552978515625, "global_step": 210794, "epoch": 1742} {"train_loss": -38.239070892333984, "global_step": 210795, "epoch": 1742} {"train_loss": -39.7138671875, "global_step": 210796, "epoch": 1742} {"train_loss": -36.07914352416992, "global_step": 210797, "epoch": 1742} {"train_loss": -37.60841751098633, "global_step": 210798, "epoch": 1742} {"train_loss": -39.771602630615234, "global_step": 210799, "epoch": 1742} {"train_loss": -37.642147064208984, "global_step": 210800, "epoch": 1742} {"train_loss": -39.52185821533203, "global_step": 210801, "epoch": 1742} {"train_loss": -40.64786911010742, "global_step": 210802, "epoch": 1742} {"train_loss": -39.635013580322266, "global_step": 210803, "epoch": 1742} {"train_loss": -40.3275260925293, "global_step": 210804, "epoch": 1742} {"train_loss": -40.873252868652344, "global_step": 210805, "epoch": 1742} {"train_loss": -41.38610076904297, "global_step": 210806, "epoch": 1742} {"train_loss": -40.33524703979492, "global_step": 210807, "epoch": 1742} {"train_loss": -41.23936080932617, "global_step": 210808, "epoch": 1742} {"train_loss": -41.20730972290039, "global_step": 210809, "epoch": 1742} {"train_loss": -40.905792236328125, "global_step": 210810, "epoch": 1742} {"train_loss": -41.567543029785156, "global_step": 210811, "epoch": 1742} {"train_loss": -41.342220306396484, "global_step": 210812, "epoch": 1742} {"train_loss": -41.257572174072266, "global_step": 210813, "epoch": 1742} {"train_loss": -41.41181182861328, "global_step": 210814, "epoch": 1742} {"train_loss": -41.715675354003906, "global_step": 210815, "epoch": 1742} {"train_loss": -41.31080627441406, "global_step": 210816, "epoch": 1742} {"train_loss": -41.65319061279297, "global_step": 210817, "epoch": 1742} {"train_loss": -41.809661865234375, "global_step": 210818, "epoch": 1742} {"train_loss": -41.778743743896484, "global_step": 210819, "epoch": 1742} {"train_loss": -42.08655548095703, "global_step": 210820, "epoch": 1742} {"train_loss": -41.7532844543457, "global_step": 210821, "epoch": 1742} {"train_loss": -41.369110107421875, "global_step": 210822, "epoch": 1742} {"train_loss": -41.64326095581055, "global_step": 210823, "epoch": 1742} {"train_loss": -41.8199348449707, "global_step": 210824, "epoch": 1742} {"train_loss": -41.89453887939453, "global_step": 210825, "epoch": 1742} {"train_loss": -41.75934600830078, "global_step": 210826, "epoch": 1742} {"train_loss": -42.0084114074707, "global_step": 210827, "epoch": 1742} {"train_loss": -41.97152328491211, "global_step": 210828, "epoch": 1742} {"train_loss": -41.467647552490234, "global_step": 210829, "epoch": 1742} {"train_loss": -40.981170654296875, "global_step": 210830, "epoch": 1742} {"train_loss": -41.71920394897461, "global_step": 210831, "epoch": 1742} {"train_loss": -41.39347457885742, "global_step": 210832, "epoch": 1742} {"train_loss": -41.82915115356445, "global_step": 210833, "epoch": 1742} {"train_loss": -42.1508674621582, "global_step": 210834, "epoch": 1742} {"train_loss": -41.80671691894531, "global_step": 210835, "epoch": 1742} {"train_loss": -41.49375915527344, "global_step": 210836, "epoch": 1742} {"train_loss": -41.86029052734375, "global_step": 210837, "epoch": 1742} {"train_loss": -41.035491943359375, "global_step": 210838, "epoch": 1742} {"train_loss": -41.13715744018555, "global_step": 210839, "epoch": 1742} {"train_loss": -41.86555862426758, "global_step": 210840, "epoch": 1742} {"train_loss": -41.90098190307617, "global_step": 210841, "epoch": 1742} {"train_loss": -42.05250930786133, "global_step": 210842, "epoch": 1742} {"train_loss": -42.21934509277344, "global_step": 210843, "epoch": 1742} {"train_loss": -41.813899993896484, "global_step": 210844, "epoch": 1742} {"train_loss": -41.74930191040039, "global_step": 210845, "epoch": 1742} {"train_loss": -42.132076263427734, "global_step": 210846, "epoch": 1742} {"train_loss": -42.28776168823242, "global_step": 210847, "epoch": 1742} {"train_loss": -41.794734954833984, "global_step": 210848, "epoch": 1742} {"train_loss": -41.810176849365234, "global_step": 210849, "epoch": 1742} {"train_loss": -41.889095306396484, "global_step": 210850, "epoch": 1742} {"train_loss": -42.36849594116211, "global_step": 210851, "epoch": 1742} {"train_loss": -42.103057861328125, "global_step": 210852, "epoch": 1742} {"train_loss": -42.224552154541016, "global_step": 210853, "epoch": 1742} {"train_loss": -42.65865707397461, "global_step": 210854, "epoch": 1742} {"train_loss": -42.38447189331055, "global_step": 210855, "epoch": 1742} {"train_loss": -41.96757507324219, "global_step": 210856, "epoch": 1742} {"train_loss": -41.702301025390625, "global_step": 210857, "epoch": 1742} {"train_loss": -40.95780563354492, "global_step": 210858, "epoch": 1742} {"train_loss": -41.9356575012207, "global_step": 210859, "epoch": 1742} {"train_loss": -42.16144561767578, "global_step": 210860, "epoch": 1742} {"train_loss": -41.53728103637695, "global_step": 210861, "epoch": 1742} {"train_loss": -41.824920654296875, "global_step": 210862, "epoch": 1742} {"train_loss": -42.04179000854492, "global_step": 210863, "epoch": 1742} {"train_loss": -42.033782958984375, "global_step": 210864, "epoch": 1742} {"train_loss": -41.22246551513672, "global_step": 210865, "epoch": 1742} {"train_loss": -41.64829635620117, "global_step": 210866, "epoch": 1742} {"train_loss": -41.673179626464844, "global_step": 210867, "epoch": 1742} {"train_loss": -41.16471481323242, "global_step": 210868, "epoch": 1742} {"train_loss": -42.0213508605957, "global_step": 210869, "epoch": 1742} {"train_loss": -42.42157745361328, "global_step": 210870, "epoch": 1742} {"train_loss": -41.53363037109375, "global_step": 210871, "epoch": 1742} {"train_loss": -41.92258071899414, "global_step": 210872, "epoch": 1742} {"train_loss": -42.64385986328125, "global_step": 210873, "epoch": 1742} {"train_loss": -42.38019943237305, "global_step": 210874, "epoch": 1742} {"train_loss": -41.8905143737793, "global_step": 210875, "epoch": 1742} {"train_loss": -41.9655876159668, "global_step": 210876, "epoch": 1742} {"train_loss": -41.248714447021484, "global_step": 210877, "epoch": 1742} {"train_loss": -41.815757751464844, "global_step": 210878, "epoch": 1742} {"train_loss": -42.410400390625, "global_step": 210879, "epoch": 1742} {"train_loss": -42.30832290649414, "global_step": 210880, "epoch": 1742} {"train_loss": -41.36561965942383, "global_step": 210881, "epoch": 1742} {"train_loss": -42.3626594543457, "global_step": 210882, "epoch": 1742} {"train_loss": -41.20253372192383, "global_step": 210883, "epoch": 1742} {"train_loss": -41.855281829833984, "global_step": 210884, "epoch": 1742} {"train_loss": -41.93562698364258, "global_step": 210885, "epoch": 1742} {"train_loss": -41.852272033691406, "global_step": 210886, "epoch": 1742} {"train_loss": -41.75759506225586, "global_step": 210887, "epoch": 1742} {"train_loss": -41.29008865356445, "global_step": 210888, "epoch": 1742} {"train_loss": -41.96973419189453, "global_step": 210889, "epoch": 1742} {"train_loss": -41.74714660644531, "global_step": 210890, "epoch": 1742} {"train_loss": -41.86452865600586, "global_step": 210891, "epoch": 1742} {"train_loss": -41.70317459106445, "global_step": 210892, "epoch": 1742} {"train_loss": -41.39487838745117, "global_step": 210893, "epoch": 1742} {"train_loss": -39.80485153198242, "global_step": 210894, "epoch": 1742} {"train_loss": -41.22905731201172, "global_step": 210895, "epoch": 1742} {"train_loss": -40.382659912109375, "global_step": 210896, "epoch": 1742} {"train_loss": -41.839656829833984, "global_step": 210897, "epoch": 1742} {"train_loss": -38.00999069213867, "global_step": 210898, "epoch": 1742} {"train_loss": -40.39568328857422, "global_step": 210899, "epoch": 1742} {"train_loss": -39.85322189331055, "global_step": 210900, "epoch": 1742} {"train_loss": -41.03343200683594, "global_step": 210901, "epoch": 1742} {"train_loss": -41.194968073821265, "global_step": 210902, "epoch": 1742, "val_loss": 2566381.25} {"train_loss": -41.034400939941406, "global_step": 210903, "epoch": 1743} {"train_loss": -40.88888168334961, "global_step": 210904, "epoch": 1743} {"train_loss": -41.596107482910156, "global_step": 210905, "epoch": 1743} {"train_loss": -41.84023666381836, "global_step": 210906, "epoch": 1743} {"train_loss": -40.575469970703125, "global_step": 210907, "epoch": 1743} {"train_loss": -41.71744155883789, "global_step": 210908, "epoch": 1743} {"train_loss": -38.87498092651367, "global_step": 210909, "epoch": 1743} {"train_loss": -36.41099166870117, "global_step": 210910, "epoch": 1743} {"train_loss": -37.82074737548828, "global_step": 210911, "epoch": 1743} {"train_loss": -40.45524215698242, "global_step": 210912, "epoch": 1743} {"train_loss": -40.119781494140625, "global_step": 210913, "epoch": 1743} {"train_loss": -41.75193405151367, "global_step": 210914, "epoch": 1743} {"train_loss": -38.284732818603516, "global_step": 210915, "epoch": 1743} {"train_loss": -40.01542282104492, "global_step": 210916, "epoch": 1743} {"train_loss": -41.23645782470703, "global_step": 210917, "epoch": 1743} {"train_loss": -38.06618118286133, "global_step": 210918, "epoch": 1743} {"train_loss": -39.52058029174805, "global_step": 210919, "epoch": 1743} {"train_loss": -38.555965423583984, "global_step": 210920, "epoch": 1743} {"train_loss": -30.989532470703125, "global_step": 210921, "epoch": 1743} {"train_loss": -37.937313079833984, "global_step": 210922, "epoch": 1743} {"train_loss": -40.61641311645508, "global_step": 210923, "epoch": 1743} {"train_loss": -40.48435592651367, "global_step": 210924, "epoch": 1743} {"train_loss": -41.38014602661133, "global_step": 210925, "epoch": 1743} {"train_loss": -40.873653411865234, "global_step": 210926, "epoch": 1743} {"train_loss": -38.546875, "global_step": 210927, "epoch": 1743} {"train_loss": -40.87569046020508, "global_step": 210928, "epoch": 1743} {"train_loss": -40.57807159423828, "global_step": 210929, "epoch": 1743} {"train_loss": -40.31284713745117, "global_step": 210930, "epoch": 1743} {"train_loss": -39.27756881713867, "global_step": 210931, "epoch": 1743} {"train_loss": -41.01749801635742, "global_step": 210932, "epoch": 1743} {"train_loss": -40.403465270996094, "global_step": 210933, "epoch": 1743} {"train_loss": -41.4548225402832, "global_step": 210934, "epoch": 1743} {"train_loss": -40.76192855834961, "global_step": 210935, "epoch": 1743} {"train_loss": -40.69794845581055, "global_step": 210936, "epoch": 1743} {"train_loss": -40.722328186035156, "global_step": 210937, "epoch": 1743} {"train_loss": -41.48704147338867, "global_step": 210938, "epoch": 1743} {"train_loss": -40.08018112182617, "global_step": 210939, "epoch": 1743} {"train_loss": -38.20968246459961, "global_step": 210940, "epoch": 1743} {"train_loss": -40.830440521240234, "global_step": 210941, "epoch": 1743} {"train_loss": -41.00799560546875, "global_step": 210942, "epoch": 1743} {"train_loss": -36.79978561401367, "global_step": 210943, "epoch": 1743} {"train_loss": -40.71732711791992, "global_step": 210944, "epoch": 1743} {"train_loss": -41.225460052490234, "global_step": 210945, "epoch": 1743} {"train_loss": -41.22502517700195, "global_step": 210946, "epoch": 1743} {"train_loss": -41.1667366027832, "global_step": 210947, "epoch": 1743} {"train_loss": -41.74032211303711, "global_step": 210948, "epoch": 1743} {"train_loss": -39.91436767578125, "global_step": 210949, "epoch": 1743} {"train_loss": -41.11439514160156, "global_step": 210950, "epoch": 1743} {"train_loss": -41.49062728881836, "global_step": 210951, "epoch": 1743} {"train_loss": -41.38542556762695, "global_step": 210952, "epoch": 1743} {"train_loss": -39.692256927490234, "global_step": 210953, "epoch": 1743} {"train_loss": -39.26694107055664, "global_step": 210954, "epoch": 1743} {"train_loss": -41.016658782958984, "global_step": 210955, "epoch": 1743} {"train_loss": -40.12972640991211, "global_step": 210956, "epoch": 1743} {"train_loss": -41.803775787353516, "global_step": 210957, "epoch": 1743} {"train_loss": -41.77690505981445, "global_step": 210958, "epoch": 1743} {"train_loss": -41.32916259765625, "global_step": 210959, "epoch": 1743} {"train_loss": -41.384674072265625, "global_step": 210960, "epoch": 1743} {"train_loss": -41.43850326538086, "global_step": 210961, "epoch": 1743} {"train_loss": -42.05554962158203, "global_step": 210962, "epoch": 1743} {"train_loss": -41.42087936401367, "global_step": 210963, "epoch": 1743} {"train_loss": -41.27566146850586, "global_step": 210964, "epoch": 1743} {"train_loss": -41.48762130737305, "global_step": 210965, "epoch": 1743} {"train_loss": -41.997188568115234, "global_step": 210966, "epoch": 1743} {"train_loss": -41.75261306762695, "global_step": 210967, "epoch": 1743} {"train_loss": -42.00252914428711, "global_step": 210968, "epoch": 1743} {"train_loss": -41.31913375854492, "global_step": 210969, "epoch": 1743} {"train_loss": -42.1591796875, "global_step": 210970, "epoch": 1743} {"train_loss": -41.76130676269531, "global_step": 210971, "epoch": 1743} {"train_loss": -42.205501556396484, "global_step": 210972, "epoch": 1743} {"train_loss": -40.84235382080078, "global_step": 210973, "epoch": 1743} {"train_loss": -42.10319137573242, "global_step": 210974, "epoch": 1743} {"train_loss": -42.309879302978516, "global_step": 210975, "epoch": 1743} {"train_loss": -41.82199478149414, "global_step": 210976, "epoch": 1743} {"train_loss": -42.57518768310547, "global_step": 210977, "epoch": 1743} {"train_loss": -41.247413635253906, "global_step": 210978, "epoch": 1743} {"train_loss": -41.659122467041016, "global_step": 210979, "epoch": 1743} {"train_loss": -41.56165313720703, "global_step": 210980, "epoch": 1743} {"train_loss": -41.9338264465332, "global_step": 210981, "epoch": 1743} {"train_loss": -41.291725158691406, "global_step": 210982, "epoch": 1743} {"train_loss": -42.461326599121094, "global_step": 210983, "epoch": 1743} {"train_loss": -35.06757736206055, "global_step": 210984, "epoch": 1743} {"train_loss": -41.40899658203125, "global_step": 210985, "epoch": 1743} {"train_loss": -40.87325668334961, "global_step": 210986, "epoch": 1743} {"train_loss": -41.78974533081055, "global_step": 210987, "epoch": 1743} {"train_loss": -41.38083267211914, "global_step": 210988, "epoch": 1743} {"train_loss": -40.84572982788086, "global_step": 210989, "epoch": 1743} {"train_loss": -38.021541595458984, "global_step": 210990, "epoch": 1743} {"train_loss": -42.169857025146484, "global_step": 210991, "epoch": 1743} {"train_loss": -41.21649932861328, "global_step": 210992, "epoch": 1743} {"train_loss": -39.21529006958008, "global_step": 210993, "epoch": 1743} {"train_loss": -40.66609191894531, "global_step": 210994, "epoch": 1743} {"train_loss": -41.5780029296875, "global_step": 210995, "epoch": 1743} {"train_loss": -41.17986297607422, "global_step": 210996, "epoch": 1743} {"train_loss": -39.74647903442383, "global_step": 210997, "epoch": 1743} {"train_loss": -41.490989685058594, "global_step": 210998, "epoch": 1743} {"train_loss": -40.7772331237793, "global_step": 210999, "epoch": 1743} {"train_loss": -41.77215576171875, "global_step": 211000, "epoch": 1743} {"train_loss": -41.99167251586914, "global_step": 211001, "epoch": 1743} {"train_loss": -41.0933952331543, "global_step": 211002, "epoch": 1743} {"train_loss": -41.073699951171875, "global_step": 211003, "epoch": 1743} {"train_loss": -42.108882904052734, "global_step": 211004, "epoch": 1743} {"train_loss": -41.37964630126953, "global_step": 211005, "epoch": 1743} {"train_loss": -41.00932693481445, "global_step": 211006, "epoch": 1743} {"train_loss": -40.424312591552734, "global_step": 211007, "epoch": 1743} {"train_loss": -41.305538177490234, "global_step": 211008, "epoch": 1743} {"train_loss": -41.478553771972656, "global_step": 211009, "epoch": 1743} {"train_loss": -39.73360824584961, "global_step": 211010, "epoch": 1743} {"train_loss": -39.770992279052734, "global_step": 211011, "epoch": 1743} {"train_loss": -39.58181381225586, "global_step": 211012, "epoch": 1743} {"train_loss": -38.44533920288086, "global_step": 211013, "epoch": 1743} {"train_loss": -40.23920822143555, "global_step": 211014, "epoch": 1743} {"train_loss": -39.16083526611328, "global_step": 211015, "epoch": 1743} {"train_loss": -40.915950775146484, "global_step": 211016, "epoch": 1743} {"train_loss": -38.00271224975586, "global_step": 211017, "epoch": 1743} {"train_loss": -38.4881591796875, "global_step": 211018, "epoch": 1743} {"train_loss": -36.738338470458984, "global_step": 211019, "epoch": 1743} {"train_loss": -35.15822219848633, "global_step": 211020, "epoch": 1743} {"train_loss": -38.510231018066406, "global_step": 211021, "epoch": 1743} {"train_loss": -34.86035919189453, "global_step": 211022, "epoch": 1743} {"train_loss": -40.431695859294294, "global_step": 211023, "epoch": 1743, "val_loss": 2508369.75} {"train_loss": -36.757442474365234, "global_step": 211024, "epoch": 1744} {"train_loss": -40.03521728515625, "global_step": 211025, "epoch": 1744} {"train_loss": -39.64772415161133, "global_step": 211026, "epoch": 1744} {"train_loss": -38.90228271484375, "global_step": 211027, "epoch": 1744} {"train_loss": -40.35558319091797, "global_step": 211028, "epoch": 1744} {"train_loss": -40.85516357421875, "global_step": 211029, "epoch": 1744} {"train_loss": -38.190467834472656, "global_step": 211030, "epoch": 1744} {"train_loss": -39.98271179199219, "global_step": 211031, "epoch": 1744} {"train_loss": -40.55068588256836, "global_step": 211032, "epoch": 1744} {"train_loss": -36.70634078979492, "global_step": 211033, "epoch": 1744} {"train_loss": -41.32078170776367, "global_step": 211034, "epoch": 1744} {"train_loss": -38.668739318847656, "global_step": 211035, "epoch": 1744} {"train_loss": -38.57290267944336, "global_step": 211036, "epoch": 1744} {"train_loss": -41.10568618774414, "global_step": 211037, "epoch": 1744} {"train_loss": -39.448482513427734, "global_step": 211038, "epoch": 1744} {"train_loss": -40.639625549316406, "global_step": 211039, "epoch": 1744} {"train_loss": -40.58501434326172, "global_step": 211040, "epoch": 1744} {"train_loss": -40.813106536865234, "global_step": 211041, "epoch": 1744} {"train_loss": -40.46329116821289, "global_step": 211042, "epoch": 1744} {"train_loss": -39.94206619262695, "global_step": 211043, "epoch": 1744} {"train_loss": -41.004112243652344, "global_step": 211044, "epoch": 1744} {"train_loss": -41.659523010253906, "global_step": 211045, "epoch": 1744} {"train_loss": -41.10334014892578, "global_step": 211046, "epoch": 1744} {"train_loss": -40.608131408691406, "global_step": 211047, "epoch": 1744} {"train_loss": -41.83124923706055, "global_step": 211048, "epoch": 1744} {"train_loss": -41.31072235107422, "global_step": 211049, "epoch": 1744} {"train_loss": -41.47243881225586, "global_step": 211050, "epoch": 1744} {"train_loss": -41.392738342285156, "global_step": 211051, "epoch": 1744} {"train_loss": -41.72594451904297, "global_step": 211052, "epoch": 1744} {"train_loss": -41.63561248779297, "global_step": 211053, "epoch": 1744} {"train_loss": -41.636348724365234, "global_step": 211054, "epoch": 1744} {"train_loss": -42.050350189208984, "global_step": 211055, "epoch": 1744} {"train_loss": -41.68124008178711, "global_step": 211056, "epoch": 1744} {"train_loss": -41.81241989135742, "global_step": 211057, "epoch": 1744} {"train_loss": -41.30036163330078, "global_step": 211058, "epoch": 1744} {"train_loss": -41.699214935302734, "global_step": 211059, "epoch": 1744} {"train_loss": -41.9107666015625, "global_step": 211060, "epoch": 1744} {"train_loss": -42.09999084472656, "global_step": 211061, "epoch": 1744} {"train_loss": -41.960933685302734, "global_step": 211062, "epoch": 1744} {"train_loss": -42.28757858276367, "global_step": 211063, "epoch": 1744} {"train_loss": -41.929718017578125, "global_step": 211064, "epoch": 1744} {"train_loss": -42.27116775512695, "global_step": 211065, "epoch": 1744} {"train_loss": -42.47970199584961, "global_step": 211066, "epoch": 1744} {"train_loss": -42.12618637084961, "global_step": 211067, "epoch": 1744} {"train_loss": -42.140968322753906, "global_step": 211068, "epoch": 1744} {"train_loss": -42.3398323059082, "global_step": 211069, "epoch": 1744} {"train_loss": -42.25429153442383, "global_step": 211070, "epoch": 1744} {"train_loss": -42.5980224609375, "global_step": 211071, "epoch": 1744} {"train_loss": -42.5299186706543, "global_step": 211072, "epoch": 1744} {"train_loss": -42.74688720703125, "global_step": 211073, "epoch": 1744} {"train_loss": -42.772064208984375, "global_step": 211074, "epoch": 1744} {"train_loss": -42.83766174316406, "global_step": 211075, "epoch": 1744} {"train_loss": -42.526039123535156, "global_step": 211076, "epoch": 1744} {"train_loss": -42.20917892456055, "global_step": 211077, "epoch": 1744} {"train_loss": -42.476680755615234, "global_step": 211078, "epoch": 1744} {"train_loss": -42.83662796020508, "global_step": 211079, "epoch": 1744} {"train_loss": -42.45491409301758, "global_step": 211080, "epoch": 1744} {"train_loss": -42.66157150268555, "global_step": 211081, "epoch": 1744} {"train_loss": -41.96515655517578, "global_step": 211082, "epoch": 1744} {"train_loss": -42.85230255126953, "global_step": 211083, "epoch": 1744} {"train_loss": -42.1070671081543, "global_step": 211084, "epoch": 1744} {"train_loss": -42.31901168823242, "global_step": 211085, "epoch": 1744} {"train_loss": -42.77590560913086, "global_step": 211086, "epoch": 1744} {"train_loss": -42.35889434814453, "global_step": 211087, "epoch": 1744} {"train_loss": -42.193023681640625, "global_step": 211088, "epoch": 1744} {"train_loss": -42.05845260620117, "global_step": 211089, "epoch": 1744} {"train_loss": -42.53989791870117, "global_step": 211090, "epoch": 1744} {"train_loss": -42.62683868408203, "global_step": 211091, "epoch": 1744} {"train_loss": -42.48800277709961, "global_step": 211092, "epoch": 1744} {"train_loss": -42.519832611083984, "global_step": 211093, "epoch": 1744} {"train_loss": -42.76436233520508, "global_step": 211094, "epoch": 1744} {"train_loss": -42.42752456665039, "global_step": 211095, "epoch": 1744} {"train_loss": -41.448429107666016, "global_step": 211096, "epoch": 1744} {"train_loss": -40.744468688964844, "global_step": 211097, "epoch": 1744} {"train_loss": -38.49934005737305, "global_step": 211098, "epoch": 1744} {"train_loss": -38.67145538330078, "global_step": 211099, "epoch": 1744} {"train_loss": -40.33721923828125, "global_step": 211100, "epoch": 1744} {"train_loss": -39.881900787353516, "global_step": 211101, "epoch": 1744} {"train_loss": -39.965301513671875, "global_step": 211102, "epoch": 1744} {"train_loss": -39.058284759521484, "global_step": 211103, "epoch": 1744} {"train_loss": -38.74897766113281, "global_step": 211104, "epoch": 1744} {"train_loss": -38.42769241333008, "global_step": 211105, "epoch": 1744} {"train_loss": -40.37195587158203, "global_step": 211106, "epoch": 1744} {"train_loss": -40.33417892456055, "global_step": 211107, "epoch": 1744} {"train_loss": -40.4551887512207, "global_step": 211108, "epoch": 1744} {"train_loss": -40.41807174682617, "global_step": 211109, "epoch": 1744} {"train_loss": -40.28278350830078, "global_step": 211110, "epoch": 1744} {"train_loss": -39.10641860961914, "global_step": 211111, "epoch": 1744} {"train_loss": -39.66138458251953, "global_step": 211112, "epoch": 1744} {"train_loss": -40.75592803955078, "global_step": 211113, "epoch": 1744} {"train_loss": -39.00843811035156, "global_step": 211114, "epoch": 1744} {"train_loss": -39.45657730102539, "global_step": 211115, "epoch": 1744} {"train_loss": -41.104793548583984, "global_step": 211116, "epoch": 1744} {"train_loss": -39.4675407409668, "global_step": 211117, "epoch": 1744} {"train_loss": -41.403289794921875, "global_step": 211118, "epoch": 1744} {"train_loss": -41.31085205078125, "global_step": 211119, "epoch": 1744} {"train_loss": -41.71051025390625, "global_step": 211120, "epoch": 1744} {"train_loss": -41.773738861083984, "global_step": 211121, "epoch": 1744} {"train_loss": -41.22547912597656, "global_step": 211122, "epoch": 1744} {"train_loss": -41.643428802490234, "global_step": 211123, "epoch": 1744} {"train_loss": -41.88047409057617, "global_step": 211124, "epoch": 1744} {"train_loss": -42.07277297973633, "global_step": 211125, "epoch": 1744} {"train_loss": -41.637916564941406, "global_step": 211126, "epoch": 1744} {"train_loss": -41.194942474365234, "global_step": 211127, "epoch": 1744} {"train_loss": -41.85055923461914, "global_step": 211128, "epoch": 1744} {"train_loss": -41.71243667602539, "global_step": 211129, "epoch": 1744} {"train_loss": -42.355010986328125, "global_step": 211130, "epoch": 1744} {"train_loss": -41.391387939453125, "global_step": 211131, "epoch": 1744} {"train_loss": -41.5272331237793, "global_step": 211132, "epoch": 1744} {"train_loss": -40.53017044067383, "global_step": 211133, "epoch": 1744} {"train_loss": -41.28336715698242, "global_step": 211134, "epoch": 1744} {"train_loss": -41.6596794128418, "global_step": 211135, "epoch": 1744} {"train_loss": -42.059242248535156, "global_step": 211136, "epoch": 1744} {"train_loss": -41.367408752441406, "global_step": 211137, "epoch": 1744} {"train_loss": -42.195220947265625, "global_step": 211138, "epoch": 1744} {"train_loss": -41.901458740234375, "global_step": 211139, "epoch": 1744} {"train_loss": -42.348976135253906, "global_step": 211140, "epoch": 1744} {"train_loss": -42.201866149902344, "global_step": 211141, "epoch": 1744} {"train_loss": -42.20414352416992, "global_step": 211142, "epoch": 1744} {"train_loss": -41.805206298828125, "global_step": 211143, "epoch": 1744} {"train_loss": -41.20565698166524, "global_step": 211144, "epoch": 1744, "val_loss": 2540814.75} {"train_loss": -41.249874114990234, "global_step": 211145, "epoch": 1745} {"train_loss": -41.487335205078125, "global_step": 211146, "epoch": 1745} {"train_loss": -41.3504753112793, "global_step": 211147, "epoch": 1745} {"train_loss": -41.84781265258789, "global_step": 211148, "epoch": 1745} {"train_loss": -41.7947998046875, "global_step": 211149, "epoch": 1745} {"train_loss": -42.182708740234375, "global_step": 211150, "epoch": 1745} {"train_loss": -41.31092071533203, "global_step": 211151, "epoch": 1745} {"train_loss": -42.14016342163086, "global_step": 211152, "epoch": 1745} {"train_loss": -41.29836654663086, "global_step": 211153, "epoch": 1745} {"train_loss": -41.8809928894043, "global_step": 211154, "epoch": 1745} {"train_loss": -41.75868606567383, "global_step": 211155, "epoch": 1745} {"train_loss": -42.04375076293945, "global_step": 211156, "epoch": 1745} {"train_loss": -41.839454650878906, "global_step": 211157, "epoch": 1745} {"train_loss": -41.674354553222656, "global_step": 211158, "epoch": 1745} {"train_loss": -41.63777542114258, "global_step": 211159, "epoch": 1745} {"train_loss": -42.197174072265625, "global_step": 211160, "epoch": 1745} {"train_loss": -41.809478759765625, "global_step": 211161, "epoch": 1745} {"train_loss": -42.427894592285156, "global_step": 211162, "epoch": 1745} {"train_loss": -42.05155563354492, "global_step": 211163, "epoch": 1745} {"train_loss": -41.52834701538086, "global_step": 211164, "epoch": 1745} {"train_loss": -40.77631759643555, "global_step": 211165, "epoch": 1745} {"train_loss": -41.52885055541992, "global_step": 211166, "epoch": 1745} {"train_loss": -41.2954216003418, "global_step": 211167, "epoch": 1745} {"train_loss": -41.55381393432617, "global_step": 211168, "epoch": 1745} {"train_loss": -41.92744064331055, "global_step": 211169, "epoch": 1745} {"train_loss": -41.52666091918945, "global_step": 211170, "epoch": 1745} {"train_loss": -41.55775451660156, "global_step": 211171, "epoch": 1745} {"train_loss": -40.953609466552734, "global_step": 211172, "epoch": 1745} {"train_loss": -41.80781936645508, "global_step": 211173, "epoch": 1745} {"train_loss": -42.235591888427734, "global_step": 211174, "epoch": 1745} {"train_loss": -41.55219268798828, "global_step": 211175, "epoch": 1745} {"train_loss": -40.93445587158203, "global_step": 211176, "epoch": 1745} {"train_loss": -41.310394287109375, "global_step": 211177, "epoch": 1745} {"train_loss": -41.39738082885742, "global_step": 211178, "epoch": 1745} {"train_loss": -42.39046096801758, "global_step": 211179, "epoch": 1745} {"train_loss": -40.862213134765625, "global_step": 211180, "epoch": 1745} {"train_loss": -41.39616775512695, "global_step": 211181, "epoch": 1745} {"train_loss": -42.0086784362793, "global_step": 211182, "epoch": 1745} {"train_loss": -42.161128997802734, "global_step": 211183, "epoch": 1745} {"train_loss": -42.46759033203125, "global_step": 211184, "epoch": 1745} {"train_loss": -42.15366744995117, "global_step": 211185, "epoch": 1745} {"train_loss": -42.49953842163086, "global_step": 211186, "epoch": 1745} {"train_loss": -42.04772186279297, "global_step": 211187, "epoch": 1745} {"train_loss": -42.14502716064453, "global_step": 211188, "epoch": 1745} {"train_loss": -42.004737854003906, "global_step": 211189, "epoch": 1745} {"train_loss": -39.908992767333984, "global_step": 211190, "epoch": 1745} {"train_loss": -39.58892059326172, "global_step": 211191, "epoch": 1745} {"train_loss": -40.89741897583008, "global_step": 211192, "epoch": 1745} {"train_loss": -41.081722259521484, "global_step": 211193, "epoch": 1745} {"train_loss": -41.27888107299805, "global_step": 211194, "epoch": 1745} {"train_loss": -42.403785705566406, "global_step": 211195, "epoch": 1745} {"train_loss": -41.950592041015625, "global_step": 211196, "epoch": 1745} {"train_loss": -42.25112533569336, "global_step": 211197, "epoch": 1745} {"train_loss": -42.240020751953125, "global_step": 211198, "epoch": 1745} {"train_loss": -41.84901809692383, "global_step": 211199, "epoch": 1745} {"train_loss": -41.10392379760742, "global_step": 211200, "epoch": 1745} {"train_loss": -41.00089645385742, "global_step": 211201, "epoch": 1745} {"train_loss": -41.72020721435547, "global_step": 211202, "epoch": 1745} {"train_loss": -41.52464294433594, "global_step": 211203, "epoch": 1745} {"train_loss": -41.62295150756836, "global_step": 211204, "epoch": 1745} {"train_loss": -40.9696159362793, "global_step": 211205, "epoch": 1745} {"train_loss": -41.795772552490234, "global_step": 211206, "epoch": 1745} {"train_loss": -42.17673873901367, "global_step": 211207, "epoch": 1745} {"train_loss": -40.944129943847656, "global_step": 211208, "epoch": 1745} {"train_loss": -40.82534408569336, "global_step": 211209, "epoch": 1745} {"train_loss": -41.583251953125, "global_step": 211210, "epoch": 1745} {"train_loss": -41.87132263183594, "global_step": 211211, "epoch": 1745} {"train_loss": -40.843658447265625, "global_step": 211212, "epoch": 1745} {"train_loss": -41.22705078125, "global_step": 211213, "epoch": 1745} {"train_loss": -39.731014251708984, "global_step": 211214, "epoch": 1745} {"train_loss": -40.131385803222656, "global_step": 211215, "epoch": 1745} {"train_loss": -41.76602554321289, "global_step": 211216, "epoch": 1745} {"train_loss": -42.16706466674805, "global_step": 211217, "epoch": 1745} {"train_loss": -40.59199142456055, "global_step": 211218, "epoch": 1745} {"train_loss": -41.05784225463867, "global_step": 211219, "epoch": 1745} {"train_loss": -42.144981384277344, "global_step": 211220, "epoch": 1745} {"train_loss": -41.5566291809082, "global_step": 211221, "epoch": 1745} {"train_loss": -40.91912078857422, "global_step": 211222, "epoch": 1745} {"train_loss": -40.930965423583984, "global_step": 211223, "epoch": 1745} {"train_loss": -41.78083801269531, "global_step": 211224, "epoch": 1745} {"train_loss": -41.58119583129883, "global_step": 211225, "epoch": 1745} {"train_loss": -39.99225616455078, "global_step": 211226, "epoch": 1745} {"train_loss": -41.000240325927734, "global_step": 211227, "epoch": 1745} {"train_loss": -41.459442138671875, "global_step": 211228, "epoch": 1745} {"train_loss": -39.841548919677734, "global_step": 211229, "epoch": 1745} {"train_loss": -40.72403335571289, "global_step": 211230, "epoch": 1745} {"train_loss": -40.578556060791016, "global_step": 211231, "epoch": 1745} {"train_loss": -39.5970344543457, "global_step": 211232, "epoch": 1745} {"train_loss": -40.142147064208984, "global_step": 211233, "epoch": 1745} {"train_loss": -41.4451904296875, "global_step": 211234, "epoch": 1745} {"train_loss": -40.299835205078125, "global_step": 211235, "epoch": 1745} {"train_loss": -39.2740478515625, "global_step": 211236, "epoch": 1745} {"train_loss": -41.4184684753418, "global_step": 211237, "epoch": 1745} {"train_loss": -39.464290618896484, "global_step": 211238, "epoch": 1745} {"train_loss": -40.692359924316406, "global_step": 211239, "epoch": 1745} {"train_loss": -39.76015090942383, "global_step": 211240, "epoch": 1745} {"train_loss": -42.07985305786133, "global_step": 211241, "epoch": 1745} {"train_loss": -40.04134750366211, "global_step": 211242, "epoch": 1745} {"train_loss": -40.71289825439453, "global_step": 211243, "epoch": 1745} {"train_loss": -41.730369567871094, "global_step": 211244, "epoch": 1745} {"train_loss": -40.59568405151367, "global_step": 211245, "epoch": 1745} {"train_loss": -41.128662109375, "global_step": 211246, "epoch": 1745} {"train_loss": -41.468807220458984, "global_step": 211247, "epoch": 1745} {"train_loss": -40.845123291015625, "global_step": 211248, "epoch": 1745} {"train_loss": -41.06096267700195, "global_step": 211249, "epoch": 1745} {"train_loss": -42.260955810546875, "global_step": 211250, "epoch": 1745} {"train_loss": -41.869895935058594, "global_step": 211251, "epoch": 1745} {"train_loss": -41.529788970947266, "global_step": 211252, "epoch": 1745} {"train_loss": -41.65882873535156, "global_step": 211253, "epoch": 1745} {"train_loss": -41.40308380126953, "global_step": 211254, "epoch": 1745} {"train_loss": -40.931243896484375, "global_step": 211255, "epoch": 1745} {"train_loss": -41.96138381958008, "global_step": 211256, "epoch": 1745} {"train_loss": -41.224788665771484, "global_step": 211257, "epoch": 1745} {"train_loss": -41.80896759033203, "global_step": 211258, "epoch": 1745} {"train_loss": -41.88216018676758, "global_step": 211259, "epoch": 1745} {"train_loss": -41.867000579833984, "global_step": 211260, "epoch": 1745} {"train_loss": -41.71923828125, "global_step": 211261, "epoch": 1745} {"train_loss": -41.247920989990234, "global_step": 211262, "epoch": 1745} {"train_loss": -41.77617645263672, "global_step": 211263, "epoch": 1745} {"train_loss": -41.6584587097168, "global_step": 211264, "epoch": 1745} {"train_loss": -41.380381655101935, "global_step": 211265, "epoch": 1745, "val_loss": 2547339.75} {"train_loss": -41.86049270629883, "global_step": 211266, "epoch": 1746} {"train_loss": -42.21722412109375, "global_step": 211267, "epoch": 1746} {"train_loss": -41.083518981933594, "global_step": 211268, "epoch": 1746} {"train_loss": -41.57772445678711, "global_step": 211269, "epoch": 1746} {"train_loss": -41.90449905395508, "global_step": 211270, "epoch": 1746} {"train_loss": -42.008056640625, "global_step": 211271, "epoch": 1746} {"train_loss": -41.98432540893555, "global_step": 211272, "epoch": 1746} {"train_loss": -41.7207145690918, "global_step": 211273, "epoch": 1746} {"train_loss": -41.70607376098633, "global_step": 211274, "epoch": 1746} {"train_loss": -41.629947662353516, "global_step": 211275, "epoch": 1746} {"train_loss": -42.87196731567383, "global_step": 211276, "epoch": 1746} {"train_loss": -41.03984451293945, "global_step": 211277, "epoch": 1746} {"train_loss": -41.78822708129883, "global_step": 211278, "epoch": 1746} {"train_loss": -42.33072280883789, "global_step": 211279, "epoch": 1746} {"train_loss": -41.89019775390625, "global_step": 211280, "epoch": 1746} {"train_loss": -41.557838439941406, "global_step": 211281, "epoch": 1746} {"train_loss": -41.94576644897461, "global_step": 211282, "epoch": 1746} {"train_loss": -41.5254020690918, "global_step": 211283, "epoch": 1746} {"train_loss": -42.18951416015625, "global_step": 211284, "epoch": 1746} {"train_loss": -42.497859954833984, "global_step": 211285, "epoch": 1746} {"train_loss": -42.02444839477539, "global_step": 211286, "epoch": 1746} {"train_loss": -42.38311767578125, "global_step": 211287, "epoch": 1746} {"train_loss": -42.40620040893555, "global_step": 211288, "epoch": 1746} {"train_loss": -42.22429275512695, "global_step": 211289, "epoch": 1746} {"train_loss": -42.38738250732422, "global_step": 211290, "epoch": 1746} {"train_loss": -42.44987869262695, "global_step": 211291, "epoch": 1746} {"train_loss": -42.42939758300781, "global_step": 211292, "epoch": 1746} {"train_loss": -42.69221115112305, "global_step": 211293, "epoch": 1746} {"train_loss": -42.36935806274414, "global_step": 211294, "epoch": 1746} {"train_loss": -42.79358673095703, "global_step": 211295, "epoch": 1746} {"train_loss": -42.88994216918945, "global_step": 211296, "epoch": 1746} {"train_loss": -42.596282958984375, "global_step": 211297, "epoch": 1746} {"train_loss": -41.60430908203125, "global_step": 211298, "epoch": 1746} {"train_loss": -42.288238525390625, "global_step": 211299, "epoch": 1746} {"train_loss": -42.89664840698242, "global_step": 211300, "epoch": 1746} {"train_loss": -42.23545837402344, "global_step": 211301, "epoch": 1746} {"train_loss": -42.0086555480957, "global_step": 211302, "epoch": 1746} {"train_loss": -42.729000091552734, "global_step": 211303, "epoch": 1746} {"train_loss": -42.897926330566406, "global_step": 211304, "epoch": 1746} {"train_loss": -43.014747619628906, "global_step": 211305, "epoch": 1746} {"train_loss": -42.43073654174805, "global_step": 211306, "epoch": 1746} {"train_loss": -41.71579360961914, "global_step": 211307, "epoch": 1746} {"train_loss": -42.681331634521484, "global_step": 211308, "epoch": 1746} {"train_loss": -42.76706314086914, "global_step": 211309, "epoch": 1746} {"train_loss": -42.730140686035156, "global_step": 211310, "epoch": 1746} {"train_loss": -42.60370635986328, "global_step": 211311, "epoch": 1746} {"train_loss": -41.92949295043945, "global_step": 211312, "epoch": 1746} {"train_loss": -41.939605712890625, "global_step": 211313, "epoch": 1746} {"train_loss": -42.39999008178711, "global_step": 211314, "epoch": 1746} {"train_loss": -42.22489547729492, "global_step": 211315, "epoch": 1746} {"train_loss": -41.66604232788086, "global_step": 211316, "epoch": 1746} {"train_loss": -40.804473876953125, "global_step": 211317, "epoch": 1746} {"train_loss": -41.079078674316406, "global_step": 211318, "epoch": 1746} {"train_loss": -41.58675765991211, "global_step": 211319, "epoch": 1746} {"train_loss": -42.32839584350586, "global_step": 211320, "epoch": 1746} {"train_loss": -42.81289291381836, "global_step": 211321, "epoch": 1746} {"train_loss": -42.09569549560547, "global_step": 211322, "epoch": 1746} {"train_loss": -42.3729362487793, "global_step": 211323, "epoch": 1746} {"train_loss": -41.74704360961914, "global_step": 211324, "epoch": 1746} {"train_loss": -41.37976837158203, "global_step": 211325, "epoch": 1746} {"train_loss": -41.694976806640625, "global_step": 211326, "epoch": 1746} {"train_loss": -41.208560943603516, "global_step": 211327, "epoch": 1746} {"train_loss": -42.02999496459961, "global_step": 211328, "epoch": 1746} {"train_loss": -41.93023681640625, "global_step": 211329, "epoch": 1746} {"train_loss": -42.03957748413086, "global_step": 211330, "epoch": 1746} {"train_loss": -41.679603576660156, "global_step": 211331, "epoch": 1746} {"train_loss": -43.00324630737305, "global_step": 211332, "epoch": 1746} {"train_loss": -43.05632019042969, "global_step": 211333, "epoch": 1746} {"train_loss": -42.51473617553711, "global_step": 211334, "epoch": 1746} {"train_loss": -42.26209259033203, "global_step": 211335, "epoch": 1746} {"train_loss": -42.284915924072266, "global_step": 211336, "epoch": 1746} {"train_loss": -42.54188537597656, "global_step": 211337, "epoch": 1746} {"train_loss": -42.75584030151367, "global_step": 211338, "epoch": 1746} {"train_loss": -42.124813079833984, "global_step": 211339, "epoch": 1746} {"train_loss": -42.4902458190918, "global_step": 211340, "epoch": 1746} {"train_loss": -41.093475341796875, "global_step": 211341, "epoch": 1746} {"train_loss": -41.62282943725586, "global_step": 211342, "epoch": 1746} {"train_loss": -42.719417572021484, "global_step": 211343, "epoch": 1746} {"train_loss": -40.20720672607422, "global_step": 211344, "epoch": 1746} {"train_loss": -36.93876266479492, "global_step": 211345, "epoch": 1746} {"train_loss": -38.593868255615234, "global_step": 211346, "epoch": 1746} {"train_loss": -41.81148910522461, "global_step": 211347, "epoch": 1746} {"train_loss": -39.640724182128906, "global_step": 211348, "epoch": 1746} {"train_loss": -38.03971481323242, "global_step": 211349, "epoch": 1746} {"train_loss": -41.458778381347656, "global_step": 211350, "epoch": 1746} {"train_loss": -41.31890869140625, "global_step": 211351, "epoch": 1746} {"train_loss": -37.388301849365234, "global_step": 211352, "epoch": 1746} {"train_loss": -39.09518051147461, "global_step": 211353, "epoch": 1746} {"train_loss": -41.744361877441406, "global_step": 211354, "epoch": 1746} {"train_loss": -40.95641326904297, "global_step": 211355, "epoch": 1746} {"train_loss": -39.69681167602539, "global_step": 211356, "epoch": 1746} {"train_loss": -39.5629997253418, "global_step": 211357, "epoch": 1746} {"train_loss": -41.72039794921875, "global_step": 211358, "epoch": 1746} {"train_loss": -41.21458053588867, "global_step": 211359, "epoch": 1746} {"train_loss": -40.4757194519043, "global_step": 211360, "epoch": 1746} {"train_loss": -42.06816482543945, "global_step": 211361, "epoch": 1746} {"train_loss": -39.496681213378906, "global_step": 211362, "epoch": 1746} {"train_loss": -39.71576690673828, "global_step": 211363, "epoch": 1746} {"train_loss": -40.49689483642578, "global_step": 211364, "epoch": 1746} {"train_loss": -42.002685546875, "global_step": 211365, "epoch": 1746} {"train_loss": -40.420101165771484, "global_step": 211366, "epoch": 1746} {"train_loss": -41.303436279296875, "global_step": 211367, "epoch": 1746} {"train_loss": -42.29621505737305, "global_step": 211368, "epoch": 1746} {"train_loss": -41.32366943359375, "global_step": 211369, "epoch": 1746} {"train_loss": -41.82326889038086, "global_step": 211370, "epoch": 1746} {"train_loss": -41.55568313598633, "global_step": 211371, "epoch": 1746} {"train_loss": -41.80778121948242, "global_step": 211372, "epoch": 1746} {"train_loss": -41.19076156616211, "global_step": 211373, "epoch": 1746} {"train_loss": -41.60014724731445, "global_step": 211374, "epoch": 1746} {"train_loss": -41.66889572143555, "global_step": 211375, "epoch": 1746} {"train_loss": -42.67947006225586, "global_step": 211376, "epoch": 1746} {"train_loss": -41.69990539550781, "global_step": 211377, "epoch": 1746} {"train_loss": -41.76625061035156, "global_step": 211378, "epoch": 1746} {"train_loss": -41.75749969482422, "global_step": 211379, "epoch": 1746} {"train_loss": -42.208770751953125, "global_step": 211380, "epoch": 1746} {"train_loss": -40.89738082885742, "global_step": 211381, "epoch": 1746} {"train_loss": -41.51346969604492, "global_step": 211382, "epoch": 1746} {"train_loss": -42.54250717163086, "global_step": 211383, "epoch": 1746} {"train_loss": -41.2850227355957, "global_step": 211384, "epoch": 1746} {"train_loss": -41.01845932006836, "global_step": 211385, "epoch": 1746} {"train_loss": -41.697844071821734, "global_step": 211386, "epoch": 1746, "val_loss": 2566915.25} {"train_loss": -40.639408111572266, "global_step": 211387, "epoch": 1747} {"train_loss": -41.307952880859375, "global_step": 211388, "epoch": 1747} {"train_loss": -42.15444564819336, "global_step": 211389, "epoch": 1747} {"train_loss": -39.962738037109375, "global_step": 211390, "epoch": 1747} {"train_loss": -41.02479934692383, "global_step": 211391, "epoch": 1747} {"train_loss": -42.2029914855957, "global_step": 211392, "epoch": 1747} {"train_loss": -41.35897445678711, "global_step": 211393, "epoch": 1747} {"train_loss": -41.79492950439453, "global_step": 211394, "epoch": 1747} {"train_loss": -42.008148193359375, "global_step": 211395, "epoch": 1747} {"train_loss": -40.021705627441406, "global_step": 211396, "epoch": 1747} {"train_loss": -41.66305160522461, "global_step": 211397, "epoch": 1747} {"train_loss": -42.206695556640625, "global_step": 211398, "epoch": 1747} {"train_loss": -41.435462951660156, "global_step": 211399, "epoch": 1747} {"train_loss": -42.08065414428711, "global_step": 211400, "epoch": 1747} {"train_loss": -42.128902435302734, "global_step": 211401, "epoch": 1747} {"train_loss": -42.283260345458984, "global_step": 211402, "epoch": 1747} {"train_loss": -41.59092712402344, "global_step": 211403, "epoch": 1747} {"train_loss": -42.60042953491211, "global_step": 211404, "epoch": 1747} {"train_loss": -42.18421173095703, "global_step": 211405, "epoch": 1747} {"train_loss": -41.497230529785156, "global_step": 211406, "epoch": 1747} {"train_loss": -42.23603439331055, "global_step": 211407, "epoch": 1747} {"train_loss": -41.80625534057617, "global_step": 211408, "epoch": 1747} {"train_loss": -41.44245529174805, "global_step": 211409, "epoch": 1747} {"train_loss": -42.13441848754883, "global_step": 211410, "epoch": 1747} {"train_loss": -42.35615539550781, "global_step": 211411, "epoch": 1747} {"train_loss": -41.74036407470703, "global_step": 211412, "epoch": 1747} {"train_loss": -41.573909759521484, "global_step": 211413, "epoch": 1747} {"train_loss": -42.482295989990234, "global_step": 211414, "epoch": 1747} {"train_loss": -42.548213958740234, "global_step": 211415, "epoch": 1747} {"train_loss": -42.4046516418457, "global_step": 211416, "epoch": 1747} {"train_loss": -42.05834197998047, "global_step": 211417, "epoch": 1747} {"train_loss": -42.58654022216797, "global_step": 211418, "epoch": 1747} {"train_loss": -42.26363754272461, "global_step": 211419, "epoch": 1747} {"train_loss": -41.956329345703125, "global_step": 211420, "epoch": 1747} {"train_loss": -42.608612060546875, "global_step": 211421, "epoch": 1747} {"train_loss": -42.448238372802734, "global_step": 211422, "epoch": 1747} {"train_loss": -43.034358978271484, "global_step": 211423, "epoch": 1747} {"train_loss": -42.77762985229492, "global_step": 211424, "epoch": 1747} {"train_loss": -42.1945686340332, "global_step": 211425, "epoch": 1747} {"train_loss": -42.00389099121094, "global_step": 211426, "epoch": 1747} {"train_loss": -42.67878341674805, "global_step": 211427, "epoch": 1747} {"train_loss": -42.75216293334961, "global_step": 211428, "epoch": 1747} {"train_loss": -42.021541595458984, "global_step": 211429, "epoch": 1747} {"train_loss": -42.3154296875, "global_step": 211430, "epoch": 1747} {"train_loss": -42.65497970581055, "global_step": 211431, "epoch": 1747} {"train_loss": -42.5200309753418, "global_step": 211432, "epoch": 1747} {"train_loss": -42.18852996826172, "global_step": 211433, "epoch": 1747} {"train_loss": -42.59511947631836, "global_step": 211434, "epoch": 1747} {"train_loss": -42.481834411621094, "global_step": 211435, "epoch": 1747} {"train_loss": -42.75883865356445, "global_step": 211436, "epoch": 1747} {"train_loss": -42.7998046875, "global_step": 211437, "epoch": 1747} {"train_loss": -42.3424072265625, "global_step": 211438, "epoch": 1747} {"train_loss": -42.62967300415039, "global_step": 211439, "epoch": 1747} {"train_loss": -43.05415344238281, "global_step": 211440, "epoch": 1747} {"train_loss": -42.35520553588867, "global_step": 211441, "epoch": 1747} {"train_loss": -42.33537292480469, "global_step": 211442, "epoch": 1747} {"train_loss": -42.39242172241211, "global_step": 211443, "epoch": 1747} {"train_loss": -42.52846908569336, "global_step": 211444, "epoch": 1747} {"train_loss": -42.621009826660156, "global_step": 211445, "epoch": 1747} {"train_loss": -42.612056732177734, "global_step": 211446, "epoch": 1747} {"train_loss": -43.10798263549805, "global_step": 211447, "epoch": 1747} {"train_loss": -42.54178237915039, "global_step": 211448, "epoch": 1747} {"train_loss": -43.18791580200195, "global_step": 211449, "epoch": 1747} {"train_loss": -42.4896240234375, "global_step": 211450, "epoch": 1747} {"train_loss": -41.951393127441406, "global_step": 211451, "epoch": 1747} {"train_loss": -42.03852462768555, "global_step": 211452, "epoch": 1747} {"train_loss": -41.57863235473633, "global_step": 211453, "epoch": 1747} {"train_loss": -41.687931060791016, "global_step": 211454, "epoch": 1747} {"train_loss": -41.603111267089844, "global_step": 211455, "epoch": 1747} {"train_loss": -42.64142990112305, "global_step": 211456, "epoch": 1747} {"train_loss": -42.51691818237305, "global_step": 211457, "epoch": 1747} {"train_loss": -42.29193878173828, "global_step": 211458, "epoch": 1747} {"train_loss": -36.85445022583008, "global_step": 211459, "epoch": 1747} {"train_loss": -31.48610496520996, "global_step": 211460, "epoch": 1747} {"train_loss": -33.766632080078125, "global_step": 211461, "epoch": 1747} {"train_loss": -38.96769714355469, "global_step": 211462, "epoch": 1747} {"train_loss": -34.161712646484375, "global_step": 211463, "epoch": 1747} {"train_loss": -37.83493423461914, "global_step": 211464, "epoch": 1747} {"train_loss": -40.570228576660156, "global_step": 211465, "epoch": 1747} {"train_loss": -38.84445571899414, "global_step": 211466, "epoch": 1747} {"train_loss": -40.57514572143555, "global_step": 211467, "epoch": 1747} {"train_loss": -38.578853607177734, "global_step": 211468, "epoch": 1747} {"train_loss": -39.624507904052734, "global_step": 211469, "epoch": 1747} {"train_loss": -38.8139762878418, "global_step": 211470, "epoch": 1747} {"train_loss": -37.685523986816406, "global_step": 211471, "epoch": 1747} {"train_loss": -39.375282287597656, "global_step": 211472, "epoch": 1747} {"train_loss": -38.7671012878418, "global_step": 211473, "epoch": 1747} {"train_loss": -39.238155364990234, "global_step": 211474, "epoch": 1747} {"train_loss": -38.61147689819336, "global_step": 211475, "epoch": 1747} {"train_loss": -39.593379974365234, "global_step": 211476, "epoch": 1747} {"train_loss": -39.20681381225586, "global_step": 211477, "epoch": 1747} {"train_loss": -37.45009994506836, "global_step": 211478, "epoch": 1747} {"train_loss": -37.423248291015625, "global_step": 211479, "epoch": 1747} {"train_loss": -39.00047302246094, "global_step": 211480, "epoch": 1747} {"train_loss": -39.21433639526367, "global_step": 211481, "epoch": 1747} {"train_loss": -38.87113571166992, "global_step": 211482, "epoch": 1747} {"train_loss": -38.851707458496094, "global_step": 211483, "epoch": 1747} {"train_loss": -39.23663330078125, "global_step": 211484, "epoch": 1747} {"train_loss": -38.495826721191406, "global_step": 211485, "epoch": 1747} {"train_loss": -40.38154220581055, "global_step": 211486, "epoch": 1747} {"train_loss": -39.229427337646484, "global_step": 211487, "epoch": 1747} {"train_loss": -39.43791580200195, "global_step": 211488, "epoch": 1747} {"train_loss": -40.2159538269043, "global_step": 211489, "epoch": 1747} {"train_loss": -39.79299545288086, "global_step": 211490, "epoch": 1747} {"train_loss": -40.698028564453125, "global_step": 211491, "epoch": 1747} {"train_loss": -39.45138168334961, "global_step": 211492, "epoch": 1747} {"train_loss": -41.311214447021484, "global_step": 211493, "epoch": 1747} {"train_loss": -39.84988021850586, "global_step": 211494, "epoch": 1747} {"train_loss": -40.14897155761719, "global_step": 211495, "epoch": 1747} {"train_loss": -41.33869552612305, "global_step": 211496, "epoch": 1747} {"train_loss": -40.02320861816406, "global_step": 211497, "epoch": 1747} {"train_loss": -41.32832336425781, "global_step": 211498, "epoch": 1747} {"train_loss": -41.03261947631836, "global_step": 211499, "epoch": 1747} {"train_loss": -40.228302001953125, "global_step": 211500, "epoch": 1747} {"train_loss": -41.990901947021484, "global_step": 211501, "epoch": 1747} {"train_loss": -40.74796676635742, "global_step": 211502, "epoch": 1747} {"train_loss": -41.31672286987305, "global_step": 211503, "epoch": 1747} {"train_loss": -41.636024475097656, "global_step": 211504, "epoch": 1747} {"train_loss": -41.31725311279297, "global_step": 211505, "epoch": 1747} {"train_loss": -41.996726989746094, "global_step": 211506, "epoch": 1747} {"train_loss": -41.003544626157144, "global_step": 211507, "epoch": 1747, "val_loss": 2580292.5} {"train_loss": -42.11898422241211, "global_step": 211508, "epoch": 1748} {"train_loss": -41.574981689453125, "global_step": 211509, "epoch": 1748} {"train_loss": -42.278926849365234, "global_step": 211510, "epoch": 1748} {"train_loss": -42.016361236572266, "global_step": 211511, "epoch": 1748} {"train_loss": -42.1128044128418, "global_step": 211512, "epoch": 1748} {"train_loss": -42.31891632080078, "global_step": 211513, "epoch": 1748} {"train_loss": -41.62661361694336, "global_step": 211514, "epoch": 1748} {"train_loss": -41.86835861206055, "global_step": 211515, "epoch": 1748} {"train_loss": -42.38248825073242, "global_step": 211516, "epoch": 1748} {"train_loss": -42.27009963989258, "global_step": 211517, "epoch": 1748} {"train_loss": -42.238006591796875, "global_step": 211518, "epoch": 1748} {"train_loss": -42.55251693725586, "global_step": 211519, "epoch": 1748} {"train_loss": -42.34596633911133, "global_step": 211520, "epoch": 1748} {"train_loss": -42.68825149536133, "global_step": 211521, "epoch": 1748} {"train_loss": -42.138607025146484, "global_step": 211522, "epoch": 1748} {"train_loss": -42.6279411315918, "global_step": 211523, "epoch": 1748} {"train_loss": -42.78581619262695, "global_step": 211524, "epoch": 1748} {"train_loss": -42.59229278564453, "global_step": 211525, "epoch": 1748} {"train_loss": -42.12128829956055, "global_step": 211526, "epoch": 1748} {"train_loss": -42.85698699951172, "global_step": 211527, "epoch": 1748} {"train_loss": -42.82760238647461, "global_step": 211528, "epoch": 1748} {"train_loss": -42.93793487548828, "global_step": 211529, "epoch": 1748} {"train_loss": -42.522369384765625, "global_step": 211530, "epoch": 1748} {"train_loss": -42.90571212768555, "global_step": 211531, "epoch": 1748} {"train_loss": -42.995052337646484, "global_step": 211532, "epoch": 1748} {"train_loss": -42.689918518066406, "global_step": 211533, "epoch": 1748} {"train_loss": -42.92966079711914, "global_step": 211534, "epoch": 1748} {"train_loss": -42.75104522705078, "global_step": 211535, "epoch": 1748} {"train_loss": -42.922916412353516, "global_step": 211536, "epoch": 1748} {"train_loss": -42.357845306396484, "global_step": 211537, "epoch": 1748} {"train_loss": -43.030941009521484, "global_step": 211538, "epoch": 1748} {"train_loss": -42.90701675415039, "global_step": 211539, "epoch": 1748} {"train_loss": -42.89649963378906, "global_step": 211540, "epoch": 1748} {"train_loss": -42.78882598876953, "global_step": 211541, "epoch": 1748} {"train_loss": -42.5975456237793, "global_step": 211542, "epoch": 1748} {"train_loss": -42.85970687866211, "global_step": 211543, "epoch": 1748} {"train_loss": -43.47056579589844, "global_step": 211544, "epoch": 1748} {"train_loss": -43.0998420715332, "global_step": 211545, "epoch": 1748} {"train_loss": -42.801639556884766, "global_step": 211546, "epoch": 1748} {"train_loss": -43.06570053100586, "global_step": 211547, "epoch": 1748} {"train_loss": -43.1993408203125, "global_step": 211548, "epoch": 1748} {"train_loss": -43.010128021240234, "global_step": 211549, "epoch": 1748} {"train_loss": -43.38819122314453, "global_step": 211550, "epoch": 1748} {"train_loss": -43.31438064575195, "global_step": 211551, "epoch": 1748} {"train_loss": -43.38233947753906, "global_step": 211552, "epoch": 1748} {"train_loss": -43.20915222167969, "global_step": 211553, "epoch": 1748} {"train_loss": -42.98769760131836, "global_step": 211554, "epoch": 1748} {"train_loss": -43.306053161621094, "global_step": 211555, "epoch": 1748} {"train_loss": -42.383079528808594, "global_step": 211556, "epoch": 1748} {"train_loss": -41.211360931396484, "global_step": 211557, "epoch": 1748} {"train_loss": -40.03581619262695, "global_step": 211558, "epoch": 1748} {"train_loss": -41.32768630981445, "global_step": 211559, "epoch": 1748} {"train_loss": -43.1914176940918, "global_step": 211560, "epoch": 1748} {"train_loss": -42.550960540771484, "global_step": 211561, "epoch": 1748} {"train_loss": -42.6424674987793, "global_step": 211562, "epoch": 1748} {"train_loss": -42.128326416015625, "global_step": 211563, "epoch": 1748} {"train_loss": -40.96706771850586, "global_step": 211564, "epoch": 1748} {"train_loss": -42.51286315917969, "global_step": 211565, "epoch": 1748} {"train_loss": -42.739498138427734, "global_step": 211566, "epoch": 1748} {"train_loss": -42.4266471862793, "global_step": 211567, "epoch": 1748} {"train_loss": -42.15153884887695, "global_step": 211568, "epoch": 1748} {"train_loss": -42.42019271850586, "global_step": 211569, "epoch": 1748} {"train_loss": -41.996620178222656, "global_step": 211570, "epoch": 1748} {"train_loss": -42.12854766845703, "global_step": 211571, "epoch": 1748} {"train_loss": -42.68268585205078, "global_step": 211572, "epoch": 1748} {"train_loss": -42.118438720703125, "global_step": 211573, "epoch": 1748} {"train_loss": -41.680545806884766, "global_step": 211574, "epoch": 1748} {"train_loss": -41.502227783203125, "global_step": 211575, "epoch": 1748} {"train_loss": -40.03150939941406, "global_step": 211576, "epoch": 1748} {"train_loss": -38.47498321533203, "global_step": 211577, "epoch": 1748} {"train_loss": -39.015560150146484, "global_step": 211578, "epoch": 1748} {"train_loss": -40.87662124633789, "global_step": 211579, "epoch": 1748} {"train_loss": -42.03132247924805, "global_step": 211580, "epoch": 1748} {"train_loss": -40.444461822509766, "global_step": 211581, "epoch": 1748} {"train_loss": -41.12632369995117, "global_step": 211582, "epoch": 1748} {"train_loss": -41.269737243652344, "global_step": 211583, "epoch": 1748} {"train_loss": -41.132808685302734, "global_step": 211584, "epoch": 1748} {"train_loss": -38.814937591552734, "global_step": 211585, "epoch": 1748} {"train_loss": -40.775184631347656, "global_step": 211586, "epoch": 1748} {"train_loss": -41.23176193237305, "global_step": 211587, "epoch": 1748} {"train_loss": -38.835811614990234, "global_step": 211588, "epoch": 1748} {"train_loss": -39.75858688354492, "global_step": 211589, "epoch": 1748} {"train_loss": -40.754573822021484, "global_step": 211590, "epoch": 1748} {"train_loss": -37.96808624267578, "global_step": 211591, "epoch": 1748} {"train_loss": -37.27070617675781, "global_step": 211592, "epoch": 1748} {"train_loss": -41.34730911254883, "global_step": 211593, "epoch": 1748} {"train_loss": -36.58823776245117, "global_step": 211594, "epoch": 1748} {"train_loss": -39.721561431884766, "global_step": 211595, "epoch": 1748} {"train_loss": -35.327369689941406, "global_step": 211596, "epoch": 1748} {"train_loss": -35.31053161621094, "global_step": 211597, "epoch": 1748} {"train_loss": -37.876953125, "global_step": 211598, "epoch": 1748} {"train_loss": -39.1096076965332, "global_step": 211599, "epoch": 1748} {"train_loss": -38.05134963989258, "global_step": 211600, "epoch": 1748} {"train_loss": -39.12104034423828, "global_step": 211601, "epoch": 1748} {"train_loss": -39.44800567626953, "global_step": 211602, "epoch": 1748} {"train_loss": -38.42326736450195, "global_step": 211603, "epoch": 1748} {"train_loss": -39.58943557739258, "global_step": 211604, "epoch": 1748} {"train_loss": -40.07290267944336, "global_step": 211605, "epoch": 1748} {"train_loss": -37.6320915222168, "global_step": 211606, "epoch": 1748} {"train_loss": -40.653724670410156, "global_step": 211607, "epoch": 1748} {"train_loss": -39.2247428894043, "global_step": 211608, "epoch": 1748} {"train_loss": -37.932186126708984, "global_step": 211609, "epoch": 1748} {"train_loss": -39.5567626953125, "global_step": 211610, "epoch": 1748} {"train_loss": -40.621543884277344, "global_step": 211611, "epoch": 1748} {"train_loss": -38.412925720214844, "global_step": 211612, "epoch": 1748} {"train_loss": -39.67267990112305, "global_step": 211613, "epoch": 1748} {"train_loss": -40.54638671875, "global_step": 211614, "epoch": 1748} {"train_loss": -40.354835510253906, "global_step": 211615, "epoch": 1748} {"train_loss": -39.94692611694336, "global_step": 211616, "epoch": 1748} {"train_loss": -40.331939697265625, "global_step": 211617, "epoch": 1748} {"train_loss": -40.698299407958984, "global_step": 211618, "epoch": 1748} {"train_loss": -41.570186614990234, "global_step": 211619, "epoch": 1748} {"train_loss": -39.16518020629883, "global_step": 211620, "epoch": 1748} {"train_loss": -41.12834930419922, "global_step": 211621, "epoch": 1748} {"train_loss": -41.210628509521484, "global_step": 211622, "epoch": 1748} {"train_loss": -40.9652099609375, "global_step": 211623, "epoch": 1748} {"train_loss": -40.77013397216797, "global_step": 211624, "epoch": 1748} {"train_loss": -40.86684799194336, "global_step": 211625, "epoch": 1748} {"train_loss": -41.86021041870117, "global_step": 211626, "epoch": 1748} {"train_loss": -41.49481964111328, "global_step": 211627, "epoch": 1748} {"train_loss": -41.28028983124032, "global_step": 211628, "epoch": 1748, "val_loss": 2569363.75} {"train_loss": -41.72317886352539, "global_step": 211629, "epoch": 1749} {"train_loss": -41.91249465942383, "global_step": 211630, "epoch": 1749} {"train_loss": -41.61831283569336, "global_step": 211631, "epoch": 1749} {"train_loss": -41.893890380859375, "global_step": 211632, "epoch": 1749} {"train_loss": -41.91779708862305, "global_step": 211633, "epoch": 1749} {"train_loss": -41.973480224609375, "global_step": 211634, "epoch": 1749} {"train_loss": -42.13094711303711, "global_step": 211635, "epoch": 1749} {"train_loss": -42.562782287597656, "global_step": 211636, "epoch": 1749} {"train_loss": -41.865692138671875, "global_step": 211637, "epoch": 1749} {"train_loss": -42.45267868041992, "global_step": 211638, "epoch": 1749} {"train_loss": -41.82940673828125, "global_step": 211639, "epoch": 1749} {"train_loss": -42.54657745361328, "global_step": 211640, "epoch": 1749} {"train_loss": -42.07033920288086, "global_step": 211641, "epoch": 1749} {"train_loss": -41.963558197021484, "global_step": 211642, "epoch": 1749} {"train_loss": -42.27532958984375, "global_step": 211643, "epoch": 1749} {"train_loss": -42.210994720458984, "global_step": 211644, "epoch": 1749} {"train_loss": -42.44313430786133, "global_step": 211645, "epoch": 1749} {"train_loss": -42.436866760253906, "global_step": 211646, "epoch": 1749} {"train_loss": -42.5384521484375, "global_step": 211647, "epoch": 1749} {"train_loss": -42.75274658203125, "global_step": 211648, "epoch": 1749} {"train_loss": -42.539669036865234, "global_step": 211649, "epoch": 1749} {"train_loss": -42.405269622802734, "global_step": 211650, "epoch": 1749} {"train_loss": -42.66389465332031, "global_step": 211651, "epoch": 1749} {"train_loss": -42.888153076171875, "global_step": 211652, "epoch": 1749} {"train_loss": -42.796058654785156, "global_step": 211653, "epoch": 1749} {"train_loss": -42.55855941772461, "global_step": 211654, "epoch": 1749} {"train_loss": -42.86213302612305, "global_step": 211655, "epoch": 1749} {"train_loss": -43.06018829345703, "global_step": 211656, "epoch": 1749} {"train_loss": -42.722286224365234, "global_step": 211657, "epoch": 1749} {"train_loss": -43.124446868896484, "global_step": 211658, "epoch": 1749} {"train_loss": -42.943931579589844, "global_step": 211659, "epoch": 1749} {"train_loss": -42.82395553588867, "global_step": 211660, "epoch": 1749} {"train_loss": -42.473018646240234, "global_step": 211661, "epoch": 1749} {"train_loss": -42.54703140258789, "global_step": 211662, "epoch": 1749} {"train_loss": -42.78418731689453, "global_step": 211663, "epoch": 1749} {"train_loss": -42.02683639526367, "global_step": 211664, "epoch": 1749} {"train_loss": -42.74011993408203, "global_step": 211665, "epoch": 1749} {"train_loss": -42.6508674621582, "global_step": 211666, "epoch": 1749} {"train_loss": -41.98566818237305, "global_step": 211667, "epoch": 1749} {"train_loss": -41.617828369140625, "global_step": 211668, "epoch": 1749} {"train_loss": -42.643741607666016, "global_step": 211669, "epoch": 1749} {"train_loss": -43.03365707397461, "global_step": 211670, "epoch": 1749} {"train_loss": -42.977535247802734, "global_step": 211671, "epoch": 1749} {"train_loss": -42.939430236816406, "global_step": 211672, "epoch": 1749} {"train_loss": -43.139625549316406, "global_step": 211673, "epoch": 1749} {"train_loss": -41.8956413269043, "global_step": 211674, "epoch": 1749} {"train_loss": -42.611793518066406, "global_step": 211675, "epoch": 1749} {"train_loss": -42.99802780151367, "global_step": 211676, "epoch": 1749} {"train_loss": -43.082645416259766, "global_step": 211677, "epoch": 1749} {"train_loss": -42.044921875, "global_step": 211678, "epoch": 1749} {"train_loss": -42.17255401611328, "global_step": 211679, "epoch": 1749} {"train_loss": -42.88370895385742, "global_step": 211680, "epoch": 1749} {"train_loss": -42.71033477783203, "global_step": 211681, "epoch": 1749} {"train_loss": -42.30794906616211, "global_step": 211682, "epoch": 1749} {"train_loss": -41.69584274291992, "global_step": 211683, "epoch": 1749} {"train_loss": -41.305057525634766, "global_step": 211684, "epoch": 1749} {"train_loss": -43.02302169799805, "global_step": 211685, "epoch": 1749} {"train_loss": -42.46366500854492, "global_step": 211686, "epoch": 1749} {"train_loss": -40.742183685302734, "global_step": 211687, "epoch": 1749} {"train_loss": -40.27348709106445, "global_step": 211688, "epoch": 1749} {"train_loss": -42.09627151489258, "global_step": 211689, "epoch": 1749} {"train_loss": -42.17833709716797, "global_step": 211690, "epoch": 1749} {"train_loss": -39.31342697143555, "global_step": 211691, "epoch": 1749} {"train_loss": -38.95685577392578, "global_step": 211692, "epoch": 1749} {"train_loss": -39.705989837646484, "global_step": 211693, "epoch": 1749} {"train_loss": -42.072120666503906, "global_step": 211694, "epoch": 1749} {"train_loss": -40.973331451416016, "global_step": 211695, "epoch": 1749} {"train_loss": -41.47126007080078, "global_step": 211696, "epoch": 1749} {"train_loss": -42.22332763671875, "global_step": 211697, "epoch": 1749} {"train_loss": -41.03223419189453, "global_step": 211698, "epoch": 1749} {"train_loss": -40.489356994628906, "global_step": 211699, "epoch": 1749} {"train_loss": -41.916656494140625, "global_step": 211700, "epoch": 1749} {"train_loss": -42.24222946166992, "global_step": 211701, "epoch": 1749} {"train_loss": -40.02326202392578, "global_step": 211702, "epoch": 1749} {"train_loss": -41.601661682128906, "global_step": 211703, "epoch": 1749} {"train_loss": -40.906410217285156, "global_step": 211704, "epoch": 1749} {"train_loss": -37.4352912902832, "global_step": 211705, "epoch": 1749} {"train_loss": -38.644775390625, "global_step": 211706, "epoch": 1749} {"train_loss": -40.80299758911133, "global_step": 211707, "epoch": 1749} {"train_loss": -39.83844757080078, "global_step": 211708, "epoch": 1749} {"train_loss": -40.5584716796875, "global_step": 211709, "epoch": 1749} {"train_loss": -41.56232452392578, "global_step": 211710, "epoch": 1749} {"train_loss": -41.097938537597656, "global_step": 211711, "epoch": 1749} {"train_loss": -41.20524597167969, "global_step": 211712, "epoch": 1749} {"train_loss": -41.84023666381836, "global_step": 211713, "epoch": 1749} {"train_loss": -41.37429428100586, "global_step": 211714, "epoch": 1749} {"train_loss": -40.27529525756836, "global_step": 211715, "epoch": 1749} {"train_loss": -40.28178024291992, "global_step": 211716, "epoch": 1749} {"train_loss": -41.39552688598633, "global_step": 211717, "epoch": 1749} {"train_loss": -42.27303695678711, "global_step": 211718, "epoch": 1749} {"train_loss": -41.742919921875, "global_step": 211719, "epoch": 1749} {"train_loss": -40.99276351928711, "global_step": 211720, "epoch": 1749} {"train_loss": -42.60296630859375, "global_step": 211721, "epoch": 1749} {"train_loss": -41.59438705444336, "global_step": 211722, "epoch": 1749} {"train_loss": -41.83747482299805, "global_step": 211723, "epoch": 1749} {"train_loss": -42.062496185302734, "global_step": 211724, "epoch": 1749} {"train_loss": -41.912315368652344, "global_step": 211725, "epoch": 1749} {"train_loss": -42.14908218383789, "global_step": 211726, "epoch": 1749} {"train_loss": -42.400455474853516, "global_step": 211727, "epoch": 1749} {"train_loss": -41.99803161621094, "global_step": 211728, "epoch": 1749} {"train_loss": -42.32966995239258, "global_step": 211729, "epoch": 1749} {"train_loss": -42.03220748901367, "global_step": 211730, "epoch": 1749} {"train_loss": -42.19401168823242, "global_step": 211731, "epoch": 1749} {"train_loss": -42.233154296875, "global_step": 211732, "epoch": 1749} {"train_loss": -42.36103057861328, "global_step": 211733, "epoch": 1749} {"train_loss": -42.21836853027344, "global_step": 211734, "epoch": 1749} {"train_loss": -41.954383850097656, "global_step": 211735, "epoch": 1749} {"train_loss": -42.12272262573242, "global_step": 211736, "epoch": 1749} {"train_loss": -42.50080108642578, "global_step": 211737, "epoch": 1749} {"train_loss": -42.255218505859375, "global_step": 211738, "epoch": 1749} {"train_loss": -42.430545806884766, "global_step": 211739, "epoch": 1749} {"train_loss": -42.4625129699707, "global_step": 211740, "epoch": 1749} {"train_loss": -42.190914154052734, "global_step": 211741, "epoch": 1749} {"train_loss": -42.563411712646484, "global_step": 211742, "epoch": 1749} {"train_loss": -42.33268356323242, "global_step": 211743, "epoch": 1749} {"train_loss": -42.83452224731445, "global_step": 211744, "epoch": 1749} {"train_loss": -42.67999267578125, "global_step": 211745, "epoch": 1749} {"train_loss": -42.80398941040039, "global_step": 211746, "epoch": 1749} {"train_loss": -42.959590911865234, "global_step": 211747, "epoch": 1749} {"train_loss": -42.99148178100586, "global_step": 211748, "epoch": 1749} {"train_loss": -41.97163561355969, "global_step": 211749, "epoch": 1749, "val_loss": 2570367.25} {"train_loss": -42.9683952331543, "global_step": 211750, "epoch": 1750} {"train_loss": -42.93880081176758, "global_step": 211751, "epoch": 1750} {"train_loss": -43.17356491088867, "global_step": 211752, "epoch": 1750} {"train_loss": -42.86032485961914, "global_step": 211753, "epoch": 1750} {"train_loss": -42.9390754699707, "global_step": 211754, "epoch": 1750} {"train_loss": -42.783546447753906, "global_step": 211755, "epoch": 1750} {"train_loss": -43.09284591674805, "global_step": 211756, "epoch": 1750} {"train_loss": -42.373592376708984, "global_step": 211757, "epoch": 1750} {"train_loss": -42.783687591552734, "global_step": 211758, "epoch": 1750} {"train_loss": -42.906368255615234, "global_step": 211759, "epoch": 1750} {"train_loss": -42.3174934387207, "global_step": 211760, "epoch": 1750} {"train_loss": -42.7232551574707, "global_step": 211761, "epoch": 1750} {"train_loss": -43.22481918334961, "global_step": 211762, "epoch": 1750} {"train_loss": -42.93798828125, "global_step": 211763, "epoch": 1750} {"train_loss": -42.962135314941406, "global_step": 211764, "epoch": 1750} {"train_loss": -42.636138916015625, "global_step": 211765, "epoch": 1750} {"train_loss": -43.249507904052734, "global_step": 211766, "epoch": 1750} {"train_loss": -43.15920639038086, "global_step": 211767, "epoch": 1750} {"train_loss": -43.23996353149414, "global_step": 211768, "epoch": 1750} {"train_loss": -43.22417068481445, "global_step": 211769, "epoch": 1750} {"train_loss": -42.92546463012695, "global_step": 211770, "epoch": 1750} {"train_loss": -42.812255859375, "global_step": 211771, "epoch": 1750} {"train_loss": -42.5076904296875, "global_step": 211772, "epoch": 1750} {"train_loss": -43.032737731933594, "global_step": 211773, "epoch": 1750} {"train_loss": -42.9597282409668, "global_step": 211774, "epoch": 1750} {"train_loss": -42.9770622253418, "global_step": 211775, "epoch": 1750} {"train_loss": -42.78091049194336, "global_step": 211776, "epoch": 1750} {"train_loss": -43.24619674682617, "global_step": 211777, "epoch": 1750} {"train_loss": -42.49723815917969, "global_step": 211778, "epoch": 1750} {"train_loss": -42.66294479370117, "global_step": 211779, "epoch": 1750} {"train_loss": -42.71689987182617, "global_step": 211780, "epoch": 1750} {"train_loss": -42.0418815612793, "global_step": 211781, "epoch": 1750} {"train_loss": -42.22525405883789, "global_step": 211782, "epoch": 1750} {"train_loss": -42.4915885925293, "global_step": 211783, "epoch": 1750} {"train_loss": -41.66735076904297, "global_step": 211784, "epoch": 1750} {"train_loss": -39.88297653198242, "global_step": 211785, "epoch": 1750} {"train_loss": -38.44366455078125, "global_step": 211786, "epoch": 1750} {"train_loss": -38.6346321105957, "global_step": 211787, "epoch": 1750} {"train_loss": -41.03205108642578, "global_step": 211788, "epoch": 1750} {"train_loss": -41.251930236816406, "global_step": 211789, "epoch": 1750} {"train_loss": -38.99163055419922, "global_step": 211790, "epoch": 1750} {"train_loss": -37.534759521484375, "global_step": 211791, "epoch": 1750} {"train_loss": -35.84336853027344, "global_step": 211792, "epoch": 1750} {"train_loss": -37.40430450439453, "global_step": 211793, "epoch": 1750} {"train_loss": -40.940467834472656, "global_step": 211794, "epoch": 1750} {"train_loss": -39.96860885620117, "global_step": 211795, "epoch": 1750} {"train_loss": -36.165828704833984, "global_step": 211796, "epoch": 1750} {"train_loss": -41.470123291015625, "global_step": 211797, "epoch": 1750} {"train_loss": -38.98653030395508, "global_step": 211798, "epoch": 1750} {"train_loss": -39.33770751953125, "global_step": 211799, "epoch": 1750} {"train_loss": -41.00861358642578, "global_step": 211800, "epoch": 1750} {"train_loss": -38.4736442565918, "global_step": 211801, "epoch": 1750} {"train_loss": -40.24911117553711, "global_step": 211802, "epoch": 1750} {"train_loss": -39.97365951538086, "global_step": 211803, "epoch": 1750} {"train_loss": -40.43843078613281, "global_step": 211804, "epoch": 1750} {"train_loss": -41.39200973510742, "global_step": 211805, "epoch": 1750} {"train_loss": -39.98834991455078, "global_step": 211806, "epoch": 1750} {"train_loss": -40.49483108520508, "global_step": 211807, "epoch": 1750} {"train_loss": -40.771942138671875, "global_step": 211808, "epoch": 1750} {"train_loss": -40.023681640625, "global_step": 211809, "epoch": 1750} {"train_loss": -40.54592514038086, "global_step": 211810, "epoch": 1750} {"train_loss": -41.29730224609375, "global_step": 211811, "epoch": 1750} {"train_loss": -41.01731491088867, "global_step": 211812, "epoch": 1750} {"train_loss": -40.93607711791992, "global_step": 211813, "epoch": 1750} {"train_loss": -41.73899459838867, "global_step": 211814, "epoch": 1750} {"train_loss": -40.898433685302734, "global_step": 211815, "epoch": 1750} {"train_loss": -41.8954963684082, "global_step": 211816, "epoch": 1750} {"train_loss": -40.98936462402344, "global_step": 211817, "epoch": 1750} {"train_loss": -42.272457122802734, "global_step": 211818, "epoch": 1750} {"train_loss": -41.36227035522461, "global_step": 211819, "epoch": 1750} {"train_loss": -41.58657455444336, "global_step": 211820, "epoch": 1750} {"train_loss": -42.33515548706055, "global_step": 211821, "epoch": 1750} {"train_loss": -41.707740783691406, "global_step": 211822, "epoch": 1750} {"train_loss": -41.735328674316406, "global_step": 211823, "epoch": 1750} {"train_loss": -41.97827911376953, "global_step": 211824, "epoch": 1750} {"train_loss": -41.722286224365234, "global_step": 211825, "epoch": 1750} {"train_loss": -42.33171463012695, "global_step": 211826, "epoch": 1750} {"train_loss": -42.25358200073242, "global_step": 211827, "epoch": 1750} {"train_loss": -42.07106399536133, "global_step": 211828, "epoch": 1750} {"train_loss": -42.223350524902344, "global_step": 211829, "epoch": 1750} {"train_loss": -42.209232330322266, "global_step": 211830, "epoch": 1750} {"train_loss": -42.21780014038086, "global_step": 211831, "epoch": 1750} {"train_loss": -42.19084548950195, "global_step": 211832, "epoch": 1750} {"train_loss": -42.68060302734375, "global_step": 211833, "epoch": 1750} {"train_loss": -42.6148796081543, "global_step": 211834, "epoch": 1750} {"train_loss": -42.63665771484375, "global_step": 211835, "epoch": 1750} {"train_loss": -42.53874206542969, "global_step": 211836, "epoch": 1750} {"train_loss": -42.9847526550293, "global_step": 211837, "epoch": 1750} {"train_loss": -42.8105583190918, "global_step": 211838, "epoch": 1750} {"train_loss": -42.638545989990234, "global_step": 211839, "epoch": 1750} {"train_loss": -42.5955696105957, "global_step": 211840, "epoch": 1750} {"train_loss": -42.89089584350586, "global_step": 211841, "epoch": 1750} {"train_loss": -42.36851119995117, "global_step": 211842, "epoch": 1750} {"train_loss": -42.92677688598633, "global_step": 211843, "epoch": 1750} {"train_loss": -42.7024040222168, "global_step": 211844, "epoch": 1750} {"train_loss": -43.03644943237305, "global_step": 211845, "epoch": 1750} {"train_loss": -42.66575241088867, "global_step": 211846, "epoch": 1750} {"train_loss": -42.640193939208984, "global_step": 211847, "epoch": 1750} {"train_loss": -42.53895950317383, "global_step": 211848, "epoch": 1750} {"train_loss": -42.3099479675293, "global_step": 211849, "epoch": 1750} {"train_loss": -43.12296676635742, "global_step": 211850, "epoch": 1750} {"train_loss": -42.95914840698242, "global_step": 211851, "epoch": 1750} {"train_loss": -43.07057571411133, "global_step": 211852, "epoch": 1750} {"train_loss": -43.29361343383789, "global_step": 211853, "epoch": 1750} {"train_loss": -43.11581039428711, "global_step": 211854, "epoch": 1750} {"train_loss": -43.38676071166992, "global_step": 211855, "epoch": 1750} {"train_loss": -43.08221435546875, "global_step": 211856, "epoch": 1750} {"train_loss": -42.6091423034668, "global_step": 211857, "epoch": 1750} {"train_loss": -42.94503402709961, "global_step": 211858, "epoch": 1750} {"train_loss": -43.012733459472656, "global_step": 211859, "epoch": 1750} {"train_loss": -42.91972732543945, "global_step": 211860, "epoch": 1750} {"train_loss": -42.635162353515625, "global_step": 211861, "epoch": 1750} {"train_loss": -42.7680778503418, "global_step": 211862, "epoch": 1750} {"train_loss": -43.0174560546875, "global_step": 211863, "epoch": 1750} {"train_loss": -43.218074798583984, "global_step": 211864, "epoch": 1750} {"train_loss": -42.85346603393555, "global_step": 211865, "epoch": 1750} {"train_loss": -43.20458984375, "global_step": 211866, "epoch": 1750} {"train_loss": -42.927650451660156, "global_step": 211867, "epoch": 1750} {"train_loss": -42.79436111450195, "global_step": 211868, "epoch": 1750} {"train_loss": -42.52592086791992, "global_step": 211869, "epoch": 1750} {"train_loss": -41.93645587637405, "global_step": 211870, "epoch": 1750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2531276.0} {"train_loss": -42.98093795776367, "global_step": 211871, "epoch": 1751} {"train_loss": -43.12342071533203, "global_step": 211872, "epoch": 1751} {"train_loss": -41.63652420043945, "global_step": 211873, "epoch": 1751} {"train_loss": -41.9206657409668, "global_step": 211874, "epoch": 1751} {"train_loss": -42.700740814208984, "global_step": 211875, "epoch": 1751} {"train_loss": -41.44783401489258, "global_step": 211876, "epoch": 1751} {"train_loss": -38.505550384521484, "global_step": 211877, "epoch": 1751} {"train_loss": -38.3221549987793, "global_step": 211878, "epoch": 1751} {"train_loss": -40.80353927612305, "global_step": 211879, "epoch": 1751} {"train_loss": -40.17266082763672, "global_step": 211880, "epoch": 1751} {"train_loss": -39.3521614074707, "global_step": 211881, "epoch": 1751} {"train_loss": -42.45345687866211, "global_step": 211882, "epoch": 1751} {"train_loss": -41.02809524536133, "global_step": 211883, "epoch": 1751} {"train_loss": -39.908790588378906, "global_step": 211884, "epoch": 1751} {"train_loss": -42.60464096069336, "global_step": 211885, "epoch": 1751} {"train_loss": -40.61442184448242, "global_step": 211886, "epoch": 1751} {"train_loss": -40.74447250366211, "global_step": 211887, "epoch": 1751} {"train_loss": -42.139915466308594, "global_step": 211888, "epoch": 1751} {"train_loss": -42.23491287231445, "global_step": 211889, "epoch": 1751} {"train_loss": -41.797603607177734, "global_step": 211890, "epoch": 1751} {"train_loss": -40.9267578125, "global_step": 211891, "epoch": 1751} {"train_loss": -41.62644958496094, "global_step": 211892, "epoch": 1751} {"train_loss": -42.19740676879883, "global_step": 211893, "epoch": 1751} {"train_loss": -42.16548538208008, "global_step": 211894, "epoch": 1751} {"train_loss": -40.91223907470703, "global_step": 211895, "epoch": 1751} {"train_loss": -40.97639846801758, "global_step": 211896, "epoch": 1751} {"train_loss": -42.450660705566406, "global_step": 211897, "epoch": 1751} {"train_loss": -41.83891677856445, "global_step": 211898, "epoch": 1751} {"train_loss": -40.98826599121094, "global_step": 211899, "epoch": 1751} {"train_loss": -41.856666564941406, "global_step": 211900, "epoch": 1751} {"train_loss": -42.716217041015625, "global_step": 211901, "epoch": 1751} {"train_loss": -42.13051223754883, "global_step": 211902, "epoch": 1751} {"train_loss": -42.22090530395508, "global_step": 211903, "epoch": 1751} {"train_loss": -42.33633041381836, "global_step": 211904, "epoch": 1751} {"train_loss": -42.389862060546875, "global_step": 211905, "epoch": 1751} {"train_loss": -41.4835205078125, "global_step": 211906, "epoch": 1751} {"train_loss": -42.465354919433594, "global_step": 211907, "epoch": 1751} {"train_loss": -42.64170455932617, "global_step": 211908, "epoch": 1751} {"train_loss": -41.827728271484375, "global_step": 211909, "epoch": 1751} {"train_loss": -42.20542526245117, "global_step": 211910, "epoch": 1751} {"train_loss": -42.56557083129883, "global_step": 211911, "epoch": 1751} {"train_loss": -42.127079010009766, "global_step": 211912, "epoch": 1751} {"train_loss": -42.702754974365234, "global_step": 211913, "epoch": 1751} {"train_loss": -43.00776290893555, "global_step": 211914, "epoch": 1751} {"train_loss": -42.55571365356445, "global_step": 211915, "epoch": 1751} {"train_loss": -42.55605697631836, "global_step": 211916, "epoch": 1751} {"train_loss": -43.03778076171875, "global_step": 211917, "epoch": 1751} {"train_loss": -43.47283172607422, "global_step": 211918, "epoch": 1751} {"train_loss": -42.859466552734375, "global_step": 211919, "epoch": 1751} {"train_loss": -43.03961944580078, "global_step": 211920, "epoch": 1751} {"train_loss": -43.02643585205078, "global_step": 211921, "epoch": 1751} {"train_loss": -43.134090423583984, "global_step": 211922, "epoch": 1751} {"train_loss": -43.1088752746582, "global_step": 211923, "epoch": 1751} {"train_loss": -43.422828674316406, "global_step": 211924, "epoch": 1751} {"train_loss": -43.17292785644531, "global_step": 211925, "epoch": 1751} {"train_loss": -43.347625732421875, "global_step": 211926, "epoch": 1751} {"train_loss": -42.8489990234375, "global_step": 211927, "epoch": 1751} {"train_loss": -43.22612762451172, "global_step": 211928, "epoch": 1751} {"train_loss": -43.22283935546875, "global_step": 211929, "epoch": 1751} {"train_loss": -43.33530044555664, "global_step": 211930, "epoch": 1751} {"train_loss": -43.167911529541016, "global_step": 211931, "epoch": 1751} {"train_loss": -42.92854690551758, "global_step": 211932, "epoch": 1751} {"train_loss": -43.452239990234375, "global_step": 211933, "epoch": 1751} {"train_loss": -42.86846160888672, "global_step": 211934, "epoch": 1751} {"train_loss": -42.734405517578125, "global_step": 211935, "epoch": 1751} {"train_loss": -42.21547317504883, "global_step": 211936, "epoch": 1751} {"train_loss": -41.964420318603516, "global_step": 211937, "epoch": 1751} {"train_loss": -39.604366302490234, "global_step": 211938, "epoch": 1751} {"train_loss": -38.4382209777832, "global_step": 211939, "epoch": 1751} {"train_loss": -40.74793243408203, "global_step": 211940, "epoch": 1751} {"train_loss": -41.66132354736328, "global_step": 211941, "epoch": 1751} {"train_loss": -37.7418327331543, "global_step": 211942, "epoch": 1751} {"train_loss": -40.20566940307617, "global_step": 211943, "epoch": 1751} {"train_loss": -41.25172805786133, "global_step": 211944, "epoch": 1751} {"train_loss": -39.450984954833984, "global_step": 211945, "epoch": 1751} {"train_loss": -39.108551025390625, "global_step": 211946, "epoch": 1751} {"train_loss": -39.356868743896484, "global_step": 211947, "epoch": 1751} {"train_loss": -38.93970489501953, "global_step": 211948, "epoch": 1751} {"train_loss": -40.18075180053711, "global_step": 211949, "epoch": 1751} {"train_loss": -39.22801971435547, "global_step": 211950, "epoch": 1751} {"train_loss": -38.3876838684082, "global_step": 211951, "epoch": 1751} {"train_loss": -41.60136795043945, "global_step": 211952, "epoch": 1751} {"train_loss": -39.81288528442383, "global_step": 211953, "epoch": 1751} {"train_loss": -39.31406784057617, "global_step": 211954, "epoch": 1751} {"train_loss": -41.659664154052734, "global_step": 211955, "epoch": 1751} {"train_loss": -39.11537170410156, "global_step": 211956, "epoch": 1751} {"train_loss": -41.75579833984375, "global_step": 211957, "epoch": 1751} {"train_loss": -40.304195404052734, "global_step": 211958, "epoch": 1751} {"train_loss": -41.31824493408203, "global_step": 211959, "epoch": 1751} {"train_loss": -41.04121017456055, "global_step": 211960, "epoch": 1751} {"train_loss": -40.534053802490234, "global_step": 211961, "epoch": 1751} {"train_loss": -40.32778549194336, "global_step": 211962, "epoch": 1751} {"train_loss": -41.61576461791992, "global_step": 211963, "epoch": 1751} {"train_loss": -40.4755973815918, "global_step": 211964, "epoch": 1751} {"train_loss": -40.9084587097168, "global_step": 211965, "epoch": 1751} {"train_loss": -41.07335662841797, "global_step": 211966, "epoch": 1751} {"train_loss": -40.94429016113281, "global_step": 211967, "epoch": 1751} {"train_loss": -41.46596908569336, "global_step": 211968, "epoch": 1751} {"train_loss": -40.39973068237305, "global_step": 211969, "epoch": 1751} {"train_loss": -42.30360412597656, "global_step": 211970, "epoch": 1751} {"train_loss": -40.245059967041016, "global_step": 211971, "epoch": 1751} {"train_loss": -41.99323654174805, "global_step": 211972, "epoch": 1751} {"train_loss": -41.4721565246582, "global_step": 211973, "epoch": 1751} {"train_loss": -42.06045150756836, "global_step": 211974, "epoch": 1751} {"train_loss": -41.01527786254883, "global_step": 211975, "epoch": 1751} {"train_loss": -42.482173919677734, "global_step": 211976, "epoch": 1751} {"train_loss": -41.19254684448242, "global_step": 211977, "epoch": 1751} {"train_loss": -42.44688415527344, "global_step": 211978, "epoch": 1751} {"train_loss": -42.32673263549805, "global_step": 211979, "epoch": 1751} {"train_loss": -42.012908935546875, "global_step": 211980, "epoch": 1751} {"train_loss": -42.342491149902344, "global_step": 211981, "epoch": 1751} {"train_loss": -42.692108154296875, "global_step": 211982, "epoch": 1751} {"train_loss": -42.21478271484375, "global_step": 211983, "epoch": 1751} {"train_loss": -42.33274841308594, "global_step": 211984, "epoch": 1751} {"train_loss": -41.27132034301758, "global_step": 211985, "epoch": 1751} {"train_loss": -42.75123977661133, "global_step": 211986, "epoch": 1751} {"train_loss": -41.82801055908203, "global_step": 211987, "epoch": 1751} {"train_loss": -42.36035919189453, "global_step": 211988, "epoch": 1751} {"train_loss": -42.4156494140625, "global_step": 211989, "epoch": 1751} {"train_loss": -42.25336837768555, "global_step": 211990, "epoch": 1751} {"train_loss": -41.60536319953351, "global_step": 211991, "epoch": 1751, "val_loss": 2549330.25} {"train_loss": -42.127925872802734, "global_step": 211992, "epoch": 1752} {"train_loss": -41.72259521484375, "global_step": 211993, "epoch": 1752} {"train_loss": -42.35478591918945, "global_step": 211994, "epoch": 1752} {"train_loss": -42.04084396362305, "global_step": 211995, "epoch": 1752} {"train_loss": -42.306861877441406, "global_step": 211996, "epoch": 1752} {"train_loss": -42.92902374267578, "global_step": 211997, "epoch": 1752} {"train_loss": -42.42675018310547, "global_step": 211998, "epoch": 1752} {"train_loss": -42.5269660949707, "global_step": 211999, "epoch": 1752} {"train_loss": -43.200645446777344, "global_step": 212000, "epoch": 1752} {"train_loss": -42.29510498046875, "global_step": 212001, "epoch": 1752} {"train_loss": -42.77293014526367, "global_step": 212002, "epoch": 1752} {"train_loss": -43.205806732177734, "global_step": 212003, "epoch": 1752} {"train_loss": -42.509090423583984, "global_step": 212004, "epoch": 1752} {"train_loss": -42.79079818725586, "global_step": 212005, "epoch": 1752} {"train_loss": -43.157325744628906, "global_step": 212006, "epoch": 1752} {"train_loss": -42.918182373046875, "global_step": 212007, "epoch": 1752} {"train_loss": -43.185272216796875, "global_step": 212008, "epoch": 1752} {"train_loss": -42.9737663269043, "global_step": 212009, "epoch": 1752} {"train_loss": -42.947792053222656, "global_step": 212010, "epoch": 1752} {"train_loss": -43.25957107543945, "global_step": 212011, "epoch": 1752} {"train_loss": -42.301856994628906, "global_step": 212012, "epoch": 1752} {"train_loss": -42.91349411010742, "global_step": 212013, "epoch": 1752} {"train_loss": -43.59919357299805, "global_step": 212014, "epoch": 1752} {"train_loss": -42.16443634033203, "global_step": 212015, "epoch": 1752} {"train_loss": -42.866912841796875, "global_step": 212016, "epoch": 1752} {"train_loss": -42.77124786376953, "global_step": 212017, "epoch": 1752} {"train_loss": -42.272621154785156, "global_step": 212018, "epoch": 1752} {"train_loss": -42.68618392944336, "global_step": 212019, "epoch": 1752} {"train_loss": -42.42485809326172, "global_step": 212020, "epoch": 1752} {"train_loss": -42.619441986083984, "global_step": 212021, "epoch": 1752} {"train_loss": -42.10513687133789, "global_step": 212022, "epoch": 1752} {"train_loss": -42.43882369995117, "global_step": 212023, "epoch": 1752} {"train_loss": -42.03034210205078, "global_step": 212024, "epoch": 1752} {"train_loss": -41.08585739135742, "global_step": 212025, "epoch": 1752} {"train_loss": -42.89720153808594, "global_step": 212026, "epoch": 1752} {"train_loss": -41.9144172668457, "global_step": 212027, "epoch": 1752} {"train_loss": -41.57063674926758, "global_step": 212028, "epoch": 1752} {"train_loss": -40.95676803588867, "global_step": 212029, "epoch": 1752} {"train_loss": -42.43653106689453, "global_step": 212030, "epoch": 1752} {"train_loss": -42.223182678222656, "global_step": 212031, "epoch": 1752} {"train_loss": -41.50786209106445, "global_step": 212032, "epoch": 1752} {"train_loss": -41.20358657836914, "global_step": 212033, "epoch": 1752} {"train_loss": -40.129085540771484, "global_step": 212034, "epoch": 1752} {"train_loss": -38.30104064941406, "global_step": 212035, "epoch": 1752} {"train_loss": -36.783687591552734, "global_step": 212036, "epoch": 1752} {"train_loss": -42.62584686279297, "global_step": 212037, "epoch": 1752} {"train_loss": -41.09939193725586, "global_step": 212038, "epoch": 1752} {"train_loss": -38.22907638549805, "global_step": 212039, "epoch": 1752} {"train_loss": -38.4302978515625, "global_step": 212040, "epoch": 1752} {"train_loss": -40.72478485107422, "global_step": 212041, "epoch": 1752} {"train_loss": -42.178375244140625, "global_step": 212042, "epoch": 1752} {"train_loss": -39.16075897216797, "global_step": 212043, "epoch": 1752} {"train_loss": -35.57760238647461, "global_step": 212044, "epoch": 1752} {"train_loss": -40.691219329833984, "global_step": 212045, "epoch": 1752} {"train_loss": -35.20753860473633, "global_step": 212046, "epoch": 1752} {"train_loss": -40.50507736206055, "global_step": 212047, "epoch": 1752} {"train_loss": -38.25196838378906, "global_step": 212048, "epoch": 1752} {"train_loss": -39.8328971862793, "global_step": 212049, "epoch": 1752} {"train_loss": -41.27077865600586, "global_step": 212050, "epoch": 1752} {"train_loss": -39.52030944824219, "global_step": 212051, "epoch": 1752} {"train_loss": -40.988426208496094, "global_step": 212052, "epoch": 1752} {"train_loss": -40.36373519897461, "global_step": 212053, "epoch": 1752} {"train_loss": -39.95039367675781, "global_step": 212054, "epoch": 1752} {"train_loss": -40.53241729736328, "global_step": 212055, "epoch": 1752} {"train_loss": -40.147369384765625, "global_step": 212056, "epoch": 1752} {"train_loss": -41.73847579956055, "global_step": 212057, "epoch": 1752} {"train_loss": -41.518856048583984, "global_step": 212058, "epoch": 1752} {"train_loss": -42.01335525512695, "global_step": 212059, "epoch": 1752} {"train_loss": -41.92100143432617, "global_step": 212060, "epoch": 1752} {"train_loss": -41.61959457397461, "global_step": 212061, "epoch": 1752} {"train_loss": -42.12754440307617, "global_step": 212062, "epoch": 1752} {"train_loss": -42.37458419799805, "global_step": 212063, "epoch": 1752} {"train_loss": -41.01149368286133, "global_step": 212064, "epoch": 1752} {"train_loss": -41.66695022583008, "global_step": 212065, "epoch": 1752} {"train_loss": -40.571102142333984, "global_step": 212066, "epoch": 1752} {"train_loss": -42.441993713378906, "global_step": 212067, "epoch": 1752} {"train_loss": -41.43832015991211, "global_step": 212068, "epoch": 1752} {"train_loss": -42.110416412353516, "global_step": 212069, "epoch": 1752} {"train_loss": -42.27631378173828, "global_step": 212070, "epoch": 1752} {"train_loss": -42.412227630615234, "global_step": 212071, "epoch": 1752} {"train_loss": -42.409915924072266, "global_step": 212072, "epoch": 1752} {"train_loss": -42.43803024291992, "global_step": 212073, "epoch": 1752} {"train_loss": -42.12235641479492, "global_step": 212074, "epoch": 1752} {"train_loss": -42.720088958740234, "global_step": 212075, "epoch": 1752} {"train_loss": -42.2567138671875, "global_step": 212076, "epoch": 1752} {"train_loss": -42.75921630859375, "global_step": 212077, "epoch": 1752} {"train_loss": -42.76709747314453, "global_step": 212078, "epoch": 1752} {"train_loss": -42.7216911315918, "global_step": 212079, "epoch": 1752} {"train_loss": -42.76516342163086, "global_step": 212080, "epoch": 1752} {"train_loss": -42.893157958984375, "global_step": 212081, "epoch": 1752} {"train_loss": -42.799739837646484, "global_step": 212082, "epoch": 1752} {"train_loss": -42.88164520263672, "global_step": 212083, "epoch": 1752} {"train_loss": -42.63542938232422, "global_step": 212084, "epoch": 1752} {"train_loss": -42.61019515991211, "global_step": 212085, "epoch": 1752} {"train_loss": -43.04978561401367, "global_step": 212086, "epoch": 1752} {"train_loss": -42.37369918823242, "global_step": 212087, "epoch": 1752} {"train_loss": -42.8199577331543, "global_step": 212088, "epoch": 1752} {"train_loss": -42.77293014526367, "global_step": 212089, "epoch": 1752} {"train_loss": -43.006099700927734, "global_step": 212090, "epoch": 1752} {"train_loss": -42.078861236572266, "global_step": 212091, "epoch": 1752} {"train_loss": -42.715972900390625, "global_step": 212092, "epoch": 1752} {"train_loss": -42.803436279296875, "global_step": 212093, "epoch": 1752} {"train_loss": -42.47907638549805, "global_step": 212094, "epoch": 1752} {"train_loss": -42.4525146484375, "global_step": 212095, "epoch": 1752} {"train_loss": -43.04269027709961, "global_step": 212096, "epoch": 1752} {"train_loss": -42.562984466552734, "global_step": 212097, "epoch": 1752} {"train_loss": -42.335968017578125, "global_step": 212098, "epoch": 1752} {"train_loss": -42.40464401245117, "global_step": 212099, "epoch": 1752} {"train_loss": -43.13993835449219, "global_step": 212100, "epoch": 1752} {"train_loss": -43.21571350097656, "global_step": 212101, "epoch": 1752} {"train_loss": -42.10309600830078, "global_step": 212102, "epoch": 1752} {"train_loss": -42.484962463378906, "global_step": 212103, "epoch": 1752} {"train_loss": -42.60497283935547, "global_step": 212104, "epoch": 1752} {"train_loss": -42.46450424194336, "global_step": 212105, "epoch": 1752} {"train_loss": -41.351009368896484, "global_step": 212106, "epoch": 1752} {"train_loss": -41.05272674560547, "global_step": 212107, "epoch": 1752} {"train_loss": -43.01066207885742, "global_step": 212108, "epoch": 1752} {"train_loss": -42.66349411010742, "global_step": 212109, "epoch": 1752} {"train_loss": -41.17576217651367, "global_step": 212110, "epoch": 1752} {"train_loss": -41.778587341308594, "global_step": 212111, "epoch": 1752} {"train_loss": -41.84931882747934, "global_step": 212112, "epoch": 1752, "val_loss": 2565953.75} {"train_loss": -42.84721374511719, "global_step": 212113, "epoch": 1753} {"train_loss": -42.227020263671875, "global_step": 212114, "epoch": 1753} {"train_loss": -42.6911506652832, "global_step": 212115, "epoch": 1753} {"train_loss": -43.143184661865234, "global_step": 212116, "epoch": 1753} {"train_loss": -42.63140869140625, "global_step": 212117, "epoch": 1753} {"train_loss": -42.32609176635742, "global_step": 212118, "epoch": 1753} {"train_loss": -42.448333740234375, "global_step": 212119, "epoch": 1753} {"train_loss": -42.4360466003418, "global_step": 212120, "epoch": 1753} {"train_loss": -41.301631927490234, "global_step": 212121, "epoch": 1753} {"train_loss": -41.70018768310547, "global_step": 212122, "epoch": 1753} {"train_loss": -43.00934982299805, "global_step": 212123, "epoch": 1753} {"train_loss": -42.65735626220703, "global_step": 212124, "epoch": 1753} {"train_loss": -41.631832122802734, "global_step": 212125, "epoch": 1753} {"train_loss": -42.3309326171875, "global_step": 212126, "epoch": 1753} {"train_loss": -42.97658920288086, "global_step": 212127, "epoch": 1753} {"train_loss": -40.69147491455078, "global_step": 212128, "epoch": 1753} {"train_loss": -41.3557014465332, "global_step": 212129, "epoch": 1753} {"train_loss": -42.73391342163086, "global_step": 212130, "epoch": 1753} {"train_loss": -42.07870101928711, "global_step": 212131, "epoch": 1753} {"train_loss": -41.05712890625, "global_step": 212132, "epoch": 1753} {"train_loss": -42.75490951538086, "global_step": 212133, "epoch": 1753} {"train_loss": -41.81636428833008, "global_step": 212134, "epoch": 1753} {"train_loss": -40.67433547973633, "global_step": 212135, "epoch": 1753} {"train_loss": -41.37425994873047, "global_step": 212136, "epoch": 1753} {"train_loss": -42.51180648803711, "global_step": 212137, "epoch": 1753} {"train_loss": -39.777320861816406, "global_step": 212138, "epoch": 1753} {"train_loss": -42.04157638549805, "global_step": 212139, "epoch": 1753} {"train_loss": -42.0564079284668, "global_step": 212140, "epoch": 1753} {"train_loss": -41.28091049194336, "global_step": 212141, "epoch": 1753} {"train_loss": -42.729759216308594, "global_step": 212142, "epoch": 1753} {"train_loss": -41.31134033203125, "global_step": 212143, "epoch": 1753} {"train_loss": -42.2279052734375, "global_step": 212144, "epoch": 1753} {"train_loss": -42.04317092895508, "global_step": 212145, "epoch": 1753} {"train_loss": -41.99859619140625, "global_step": 212146, "epoch": 1753} {"train_loss": -41.16875457763672, "global_step": 212147, "epoch": 1753} {"train_loss": -42.942718505859375, "global_step": 212148, "epoch": 1753} {"train_loss": -42.294368743896484, "global_step": 212149, "epoch": 1753} {"train_loss": -42.274051666259766, "global_step": 212150, "epoch": 1753} {"train_loss": -42.276432037353516, "global_step": 212151, "epoch": 1753} {"train_loss": -42.223873138427734, "global_step": 212152, "epoch": 1753} {"train_loss": -42.50509262084961, "global_step": 212153, "epoch": 1753} {"train_loss": -41.34684371948242, "global_step": 212154, "epoch": 1753} {"train_loss": -41.49135971069336, "global_step": 212155, "epoch": 1753} {"train_loss": -41.729652404785156, "global_step": 212156, "epoch": 1753} {"train_loss": -41.6804084777832, "global_step": 212157, "epoch": 1753} {"train_loss": -41.26850128173828, "global_step": 212158, "epoch": 1753} {"train_loss": -41.6796875, "global_step": 212159, "epoch": 1753} {"train_loss": -41.825401306152344, "global_step": 212160, "epoch": 1753} {"train_loss": -42.04189682006836, "global_step": 212161, "epoch": 1753} {"train_loss": -41.83999252319336, "global_step": 212162, "epoch": 1753} {"train_loss": -41.6150016784668, "global_step": 212163, "epoch": 1753} {"train_loss": -42.00098419189453, "global_step": 212164, "epoch": 1753} {"train_loss": -40.336849212646484, "global_step": 212165, "epoch": 1753} {"train_loss": -40.41457748413086, "global_step": 212166, "epoch": 1753} {"train_loss": -42.39535140991211, "global_step": 212167, "epoch": 1753} {"train_loss": -41.58146286010742, "global_step": 212168, "epoch": 1753} {"train_loss": -39.5277214050293, "global_step": 212169, "epoch": 1753} {"train_loss": -40.774410247802734, "global_step": 212170, "epoch": 1753} {"train_loss": -42.18617630004883, "global_step": 212171, "epoch": 1753} {"train_loss": -41.49371337890625, "global_step": 212172, "epoch": 1753} {"train_loss": -40.962196350097656, "global_step": 212173, "epoch": 1753} {"train_loss": -42.24509811401367, "global_step": 212174, "epoch": 1753} {"train_loss": -41.9721794128418, "global_step": 212175, "epoch": 1753} {"train_loss": -41.35589599609375, "global_step": 212176, "epoch": 1753} {"train_loss": -41.89973831176758, "global_step": 212177, "epoch": 1753} {"train_loss": -42.26123809814453, "global_step": 212178, "epoch": 1753} {"train_loss": -42.06472396850586, "global_step": 212179, "epoch": 1753} {"train_loss": -41.30721664428711, "global_step": 212180, "epoch": 1753} {"train_loss": -41.56787872314453, "global_step": 212181, "epoch": 1753} {"train_loss": -42.581871032714844, "global_step": 212182, "epoch": 1753} {"train_loss": -42.07115173339844, "global_step": 212183, "epoch": 1753} {"train_loss": -42.18678665161133, "global_step": 212184, "epoch": 1753} {"train_loss": -41.36738204956055, "global_step": 212185, "epoch": 1753} {"train_loss": -43.210750579833984, "global_step": 212186, "epoch": 1753} {"train_loss": -42.006412506103516, "global_step": 212187, "epoch": 1753} {"train_loss": -42.19423294067383, "global_step": 212188, "epoch": 1753} {"train_loss": -42.711830139160156, "global_step": 212189, "epoch": 1753} {"train_loss": -41.31410598754883, "global_step": 212190, "epoch": 1753} {"train_loss": -42.68165969848633, "global_step": 212191, "epoch": 1753} {"train_loss": -41.6072883605957, "global_step": 212192, "epoch": 1753} {"train_loss": -42.60189437866211, "global_step": 212193, "epoch": 1753} {"train_loss": -42.239097595214844, "global_step": 212194, "epoch": 1753} {"train_loss": -41.76461410522461, "global_step": 212195, "epoch": 1753} {"train_loss": -42.97176742553711, "global_step": 212196, "epoch": 1753} {"train_loss": -42.43868637084961, "global_step": 212197, "epoch": 1753} {"train_loss": -42.40714645385742, "global_step": 212198, "epoch": 1753} {"train_loss": -42.230525970458984, "global_step": 212199, "epoch": 1753} {"train_loss": -42.89009475708008, "global_step": 212200, "epoch": 1753} {"train_loss": -42.646270751953125, "global_step": 212201, "epoch": 1753} {"train_loss": -42.14262771606445, "global_step": 212202, "epoch": 1753} {"train_loss": -42.80129623413086, "global_step": 212203, "epoch": 1753} {"train_loss": -42.52452850341797, "global_step": 212204, "epoch": 1753} {"train_loss": -42.69023513793945, "global_step": 212205, "epoch": 1753} {"train_loss": -42.510498046875, "global_step": 212206, "epoch": 1753} {"train_loss": -41.814605712890625, "global_step": 212207, "epoch": 1753} {"train_loss": -42.91659164428711, "global_step": 212208, "epoch": 1753} {"train_loss": -42.58516311645508, "global_step": 212209, "epoch": 1753} {"train_loss": -42.4822998046875, "global_step": 212210, "epoch": 1753} {"train_loss": -42.97066879272461, "global_step": 212211, "epoch": 1753} {"train_loss": -42.324703216552734, "global_step": 212212, "epoch": 1753} {"train_loss": -42.82223129272461, "global_step": 212213, "epoch": 1753} {"train_loss": -43.19428253173828, "global_step": 212214, "epoch": 1753} {"train_loss": -42.808712005615234, "global_step": 212215, "epoch": 1753} {"train_loss": -42.45235824584961, "global_step": 212216, "epoch": 1753} {"train_loss": -43.0852165222168, "global_step": 212217, "epoch": 1753} {"train_loss": -42.27267074584961, "global_step": 212218, "epoch": 1753} {"train_loss": -42.35414505004883, "global_step": 212219, "epoch": 1753} {"train_loss": -41.849708557128906, "global_step": 212220, "epoch": 1753} {"train_loss": -42.41970443725586, "global_step": 212221, "epoch": 1753} {"train_loss": -41.5039176940918, "global_step": 212222, "epoch": 1753} {"train_loss": -42.676124572753906, "global_step": 212223, "epoch": 1753} {"train_loss": -42.61599349975586, "global_step": 212224, "epoch": 1753} {"train_loss": -43.027130126953125, "global_step": 212225, "epoch": 1753} {"train_loss": -42.284637451171875, "global_step": 212226, "epoch": 1753} {"train_loss": -43.16782760620117, "global_step": 212227, "epoch": 1753} {"train_loss": -41.812782287597656, "global_step": 212228, "epoch": 1753} {"train_loss": -41.902950286865234, "global_step": 212229, "epoch": 1753} {"train_loss": -42.41267776489258, "global_step": 212230, "epoch": 1753} {"train_loss": -42.96516036987305, "global_step": 212231, "epoch": 1753} {"train_loss": -42.91514205932617, "global_step": 212232, "epoch": 1753} {"train_loss": -42.10001754760742, "global_step": 212233, "epoch": 1753, "val_loss": 2605711.25} {"train_loss": -42.636375427246094, "global_step": 212234, "epoch": 1754} {"train_loss": -42.38554763793945, "global_step": 212235, "epoch": 1754} {"train_loss": -42.366241455078125, "global_step": 212236, "epoch": 1754} {"train_loss": -42.110443115234375, "global_step": 212237, "epoch": 1754} {"train_loss": -43.221317291259766, "global_step": 212238, "epoch": 1754} {"train_loss": -41.06060791015625, "global_step": 212239, "epoch": 1754} {"train_loss": -42.5199089050293, "global_step": 212240, "epoch": 1754} {"train_loss": -42.580596923828125, "global_step": 212241, "epoch": 1754} {"train_loss": -42.260589599609375, "global_step": 212242, "epoch": 1754} {"train_loss": -42.742610931396484, "global_step": 212243, "epoch": 1754} {"train_loss": -42.53083419799805, "global_step": 212244, "epoch": 1754} {"train_loss": -41.736053466796875, "global_step": 212245, "epoch": 1754} {"train_loss": -42.22605514526367, "global_step": 212246, "epoch": 1754} {"train_loss": -42.3563117980957, "global_step": 212247, "epoch": 1754} {"train_loss": -39.879730224609375, "global_step": 212248, "epoch": 1754} {"train_loss": -41.81201934814453, "global_step": 212249, "epoch": 1754} {"train_loss": -40.94963455200195, "global_step": 212250, "epoch": 1754} {"train_loss": -39.3632698059082, "global_step": 212251, "epoch": 1754} {"train_loss": -40.82337951660156, "global_step": 212252, "epoch": 1754} {"train_loss": -41.60778045654297, "global_step": 212253, "epoch": 1754} {"train_loss": -39.685150146484375, "global_step": 212254, "epoch": 1754} {"train_loss": -34.235084533691406, "global_step": 212255, "epoch": 1754} {"train_loss": -40.179752349853516, "global_step": 212256, "epoch": 1754} {"train_loss": -40.336177825927734, "global_step": 212257, "epoch": 1754} {"train_loss": -36.91339111328125, "global_step": 212258, "epoch": 1754} {"train_loss": -38.08901596069336, "global_step": 212259, "epoch": 1754} {"train_loss": -38.01498794555664, "global_step": 212260, "epoch": 1754} {"train_loss": -40.86954879760742, "global_step": 212261, "epoch": 1754} {"train_loss": -37.48881912231445, "global_step": 212262, "epoch": 1754} {"train_loss": -37.756309509277344, "global_step": 212263, "epoch": 1754} {"train_loss": -35.3354606628418, "global_step": 212264, "epoch": 1754} {"train_loss": -38.018882751464844, "global_step": 212265, "epoch": 1754} {"train_loss": -33.33896255493164, "global_step": 212266, "epoch": 1754} {"train_loss": -38.02900314331055, "global_step": 212267, "epoch": 1754} {"train_loss": -37.91511154174805, "global_step": 212268, "epoch": 1754} {"train_loss": -34.35403060913086, "global_step": 212269, "epoch": 1754} {"train_loss": -34.615901947021484, "global_step": 212270, "epoch": 1754} {"train_loss": -36.089542388916016, "global_step": 212271, "epoch": 1754} {"train_loss": -36.17808151245117, "global_step": 212272, "epoch": 1754} {"train_loss": -37.4298210144043, "global_step": 212273, "epoch": 1754} {"train_loss": -36.57689666748047, "global_step": 212274, "epoch": 1754} {"train_loss": -35.02912139892578, "global_step": 212275, "epoch": 1754} {"train_loss": -37.241424560546875, "global_step": 212276, "epoch": 1754} {"train_loss": -32.6478271484375, "global_step": 212277, "epoch": 1754} {"train_loss": -36.74715042114258, "global_step": 212278, "epoch": 1754} {"train_loss": -36.785518646240234, "global_step": 212279, "epoch": 1754} {"train_loss": -37.264801025390625, "global_step": 212280, "epoch": 1754} {"train_loss": -37.0960578918457, "global_step": 212281, "epoch": 1754} {"train_loss": -38.2689208984375, "global_step": 212282, "epoch": 1754} {"train_loss": -36.89129638671875, "global_step": 212283, "epoch": 1754} {"train_loss": -38.2957763671875, "global_step": 212284, "epoch": 1754} {"train_loss": -36.75511932373047, "global_step": 212285, "epoch": 1754} {"train_loss": -38.65193557739258, "global_step": 212286, "epoch": 1754} {"train_loss": -39.326229095458984, "global_step": 212287, "epoch": 1754} {"train_loss": -38.90816879272461, "global_step": 212288, "epoch": 1754} {"train_loss": -39.718170166015625, "global_step": 212289, "epoch": 1754} {"train_loss": -39.81199264526367, "global_step": 212290, "epoch": 1754} {"train_loss": -39.89692306518555, "global_step": 212291, "epoch": 1754} {"train_loss": -39.41938781738281, "global_step": 212292, "epoch": 1754} {"train_loss": -39.8551139831543, "global_step": 212293, "epoch": 1754} {"train_loss": -39.82650375366211, "global_step": 212294, "epoch": 1754} {"train_loss": -40.57035827636719, "global_step": 212295, "epoch": 1754} {"train_loss": -40.595577239990234, "global_step": 212296, "epoch": 1754} {"train_loss": -40.1424446105957, "global_step": 212297, "epoch": 1754} {"train_loss": -40.88127136230469, "global_step": 212298, "epoch": 1754} {"train_loss": -40.799156188964844, "global_step": 212299, "epoch": 1754} {"train_loss": -41.14925765991211, "global_step": 212300, "epoch": 1754} {"train_loss": -40.646366119384766, "global_step": 212301, "epoch": 1754} {"train_loss": -40.75502395629883, "global_step": 212302, "epoch": 1754} {"train_loss": -41.38679122924805, "global_step": 212303, "epoch": 1754} {"train_loss": -41.279293060302734, "global_step": 212304, "epoch": 1754} {"train_loss": -41.21110153198242, "global_step": 212305, "epoch": 1754} {"train_loss": -40.9747314453125, "global_step": 212306, "epoch": 1754} {"train_loss": -41.29927062988281, "global_step": 212307, "epoch": 1754} {"train_loss": -41.22125244140625, "global_step": 212308, "epoch": 1754} {"train_loss": -41.096378326416016, "global_step": 212309, "epoch": 1754} {"train_loss": -41.551841735839844, "global_step": 212310, "epoch": 1754} {"train_loss": -42.01176071166992, "global_step": 212311, "epoch": 1754} {"train_loss": -41.509944915771484, "global_step": 212312, "epoch": 1754} {"train_loss": -40.75202560424805, "global_step": 212313, "epoch": 1754} {"train_loss": -41.17438888549805, "global_step": 212314, "epoch": 1754} {"train_loss": -41.725765228271484, "global_step": 212315, "epoch": 1754} {"train_loss": -41.7234992980957, "global_step": 212316, "epoch": 1754} {"train_loss": -41.84012222290039, "global_step": 212317, "epoch": 1754} {"train_loss": -41.76664352416992, "global_step": 212318, "epoch": 1754} {"train_loss": -42.20867919921875, "global_step": 212319, "epoch": 1754} {"train_loss": -41.63949203491211, "global_step": 212320, "epoch": 1754} {"train_loss": -42.44330978393555, "global_step": 212321, "epoch": 1754} {"train_loss": -42.12886428833008, "global_step": 212322, "epoch": 1754} {"train_loss": -41.903160095214844, "global_step": 212323, "epoch": 1754} {"train_loss": -42.188720703125, "global_step": 212324, "epoch": 1754} {"train_loss": -42.21037673950195, "global_step": 212325, "epoch": 1754} {"train_loss": -42.149330139160156, "global_step": 212326, "epoch": 1754} {"train_loss": -42.23640060424805, "global_step": 212327, "epoch": 1754} {"train_loss": -42.2877197265625, "global_step": 212328, "epoch": 1754} {"train_loss": -42.60062789916992, "global_step": 212329, "epoch": 1754} {"train_loss": -42.4234619140625, "global_step": 212330, "epoch": 1754} {"train_loss": -41.83037567138672, "global_step": 212331, "epoch": 1754} {"train_loss": -41.99802780151367, "global_step": 212332, "epoch": 1754} {"train_loss": -42.56901168823242, "global_step": 212333, "epoch": 1754} {"train_loss": -42.07552719116211, "global_step": 212334, "epoch": 1754} {"train_loss": -42.549171447753906, "global_step": 212335, "epoch": 1754} {"train_loss": -42.122886657714844, "global_step": 212336, "epoch": 1754} {"train_loss": -43.080657958984375, "global_step": 212337, "epoch": 1754} {"train_loss": -42.345672607421875, "global_step": 212338, "epoch": 1754} {"train_loss": -42.18048858642578, "global_step": 212339, "epoch": 1754} {"train_loss": -42.351287841796875, "global_step": 212340, "epoch": 1754} {"train_loss": -42.82168960571289, "global_step": 212341, "epoch": 1754} {"train_loss": -42.6324462890625, "global_step": 212342, "epoch": 1754} {"train_loss": -42.75303268432617, "global_step": 212343, "epoch": 1754} {"train_loss": -42.781028747558594, "global_step": 212344, "epoch": 1754} {"train_loss": -42.34206008911133, "global_step": 212345, "epoch": 1754} {"train_loss": -42.64685821533203, "global_step": 212346, "epoch": 1754} {"train_loss": -42.48183822631836, "global_step": 212347, "epoch": 1754} {"train_loss": -42.123321533203125, "global_step": 212348, "epoch": 1754} {"train_loss": -42.185508728027344, "global_step": 212349, "epoch": 1754} {"train_loss": -42.68706130981445, "global_step": 212350, "epoch": 1754} {"train_loss": -42.352638244628906, "global_step": 212351, "epoch": 1754} {"train_loss": -41.6468620300293, "global_step": 212352, "epoch": 1754} {"train_loss": -42.1627311706543, "global_step": 212353, "epoch": 1754} {"train_loss": -40.4023952641763, "global_step": 212354, "epoch": 1754, "val_loss": 2594422.5} {"train_loss": -42.887813568115234, "global_step": 212355, "epoch": 1755} {"train_loss": -42.645729064941406, "global_step": 212356, "epoch": 1755} {"train_loss": -42.18779373168945, "global_step": 212357, "epoch": 1755} {"train_loss": -42.266231536865234, "global_step": 212358, "epoch": 1755} {"train_loss": -42.94110107421875, "global_step": 212359, "epoch": 1755} {"train_loss": -43.24492263793945, "global_step": 212360, "epoch": 1755} {"train_loss": -43.18532943725586, "global_step": 212361, "epoch": 1755} {"train_loss": -42.8558464050293, "global_step": 212362, "epoch": 1755} {"train_loss": -42.94135665893555, "global_step": 212363, "epoch": 1755} {"train_loss": -43.12824630737305, "global_step": 212364, "epoch": 1755} {"train_loss": -42.72923278808594, "global_step": 212365, "epoch": 1755} {"train_loss": -42.60960388183594, "global_step": 212366, "epoch": 1755} {"train_loss": -42.197662353515625, "global_step": 212367, "epoch": 1755} {"train_loss": -42.255863189697266, "global_step": 212368, "epoch": 1755} {"train_loss": -41.35689163208008, "global_step": 212369, "epoch": 1755} {"train_loss": -41.136104583740234, "global_step": 212370, "epoch": 1755} {"train_loss": -39.73293685913086, "global_step": 212371, "epoch": 1755} {"train_loss": -39.28485870361328, "global_step": 212372, "epoch": 1755} {"train_loss": -39.47700500488281, "global_step": 212373, "epoch": 1755} {"train_loss": -42.907344818115234, "global_step": 212374, "epoch": 1755} {"train_loss": -39.74669647216797, "global_step": 212375, "epoch": 1755} {"train_loss": -37.2110595703125, "global_step": 212376, "epoch": 1755} {"train_loss": -41.526119232177734, "global_step": 212377, "epoch": 1755} {"train_loss": -33.977474212646484, "global_step": 212378, "epoch": 1755} {"train_loss": -36.505062103271484, "global_step": 212379, "epoch": 1755} {"train_loss": -33.236629486083984, "global_step": 212380, "epoch": 1755} {"train_loss": -33.4618034362793, "global_step": 212381, "epoch": 1755} {"train_loss": -23.907333374023438, "global_step": 212382, "epoch": 1755} {"train_loss": -32.477291107177734, "global_step": 212383, "epoch": 1755} {"train_loss": -33.039791107177734, "global_step": 212384, "epoch": 1755} {"train_loss": -32.20937728881836, "global_step": 212385, "epoch": 1755} {"train_loss": -32.771278381347656, "global_step": 212386, "epoch": 1755} {"train_loss": -32.0616455078125, "global_step": 212387, "epoch": 1755} {"train_loss": -34.92770004272461, "global_step": 212388, "epoch": 1755} {"train_loss": -32.24540328979492, "global_step": 212389, "epoch": 1755} {"train_loss": -34.888336181640625, "global_step": 212390, "epoch": 1755} {"train_loss": -33.28147506713867, "global_step": 212391, "epoch": 1755} {"train_loss": -35.34627151489258, "global_step": 212392, "epoch": 1755} {"train_loss": -34.96905517578125, "global_step": 212393, "epoch": 1755} {"train_loss": -35.33724594116211, "global_step": 212394, "epoch": 1755} {"train_loss": -35.57698059082031, "global_step": 212395, "epoch": 1755} {"train_loss": -36.763240814208984, "global_step": 212396, "epoch": 1755} {"train_loss": -37.26201248168945, "global_step": 212397, "epoch": 1755} {"train_loss": -37.531524658203125, "global_step": 212398, "epoch": 1755} {"train_loss": -37.39060592651367, "global_step": 212399, "epoch": 1755} {"train_loss": -37.3472900390625, "global_step": 212400, "epoch": 1755} {"train_loss": -38.249019622802734, "global_step": 212401, "epoch": 1755} {"train_loss": -38.50079345703125, "global_step": 212402, "epoch": 1755} {"train_loss": -38.47943878173828, "global_step": 212403, "epoch": 1755} {"train_loss": -38.54189682006836, "global_step": 212404, "epoch": 1755} {"train_loss": -39.34804153442383, "global_step": 212405, "epoch": 1755} {"train_loss": -39.80763626098633, "global_step": 212406, "epoch": 1755} {"train_loss": -39.938106536865234, "global_step": 212407, "epoch": 1755} {"train_loss": -40.273040771484375, "global_step": 212408, "epoch": 1755} {"train_loss": -40.29032516479492, "global_step": 212409, "epoch": 1755} {"train_loss": -40.394412994384766, "global_step": 212410, "epoch": 1755} {"train_loss": -39.528438568115234, "global_step": 212411, "epoch": 1755} {"train_loss": -41.464847564697266, "global_step": 212412, "epoch": 1755} {"train_loss": -40.63718795776367, "global_step": 212413, "epoch": 1755} {"train_loss": -39.85546875, "global_step": 212414, "epoch": 1755} {"train_loss": -41.44027328491211, "global_step": 212415, "epoch": 1755} {"train_loss": -39.69537353515625, "global_step": 212416, "epoch": 1755} {"train_loss": -41.20013427734375, "global_step": 212417, "epoch": 1755} {"train_loss": -38.9085578918457, "global_step": 212418, "epoch": 1755} {"train_loss": -40.595069885253906, "global_step": 212419, "epoch": 1755} {"train_loss": -39.68217468261719, "global_step": 212420, "epoch": 1755} {"train_loss": -39.83210372924805, "global_step": 212421, "epoch": 1755} {"train_loss": -40.253578186035156, "global_step": 212422, "epoch": 1755} {"train_loss": -39.17713165283203, "global_step": 212423, "epoch": 1755} {"train_loss": -41.07474899291992, "global_step": 212424, "epoch": 1755} {"train_loss": -40.02313995361328, "global_step": 212425, "epoch": 1755} {"train_loss": -40.74241256713867, "global_step": 212426, "epoch": 1755} {"train_loss": -40.40376281738281, "global_step": 212427, "epoch": 1755} {"train_loss": -40.476985931396484, "global_step": 212428, "epoch": 1755} {"train_loss": -41.40617752075195, "global_step": 212429, "epoch": 1755} {"train_loss": -40.36617660522461, "global_step": 212430, "epoch": 1755} {"train_loss": -41.16060256958008, "global_step": 212431, "epoch": 1755} {"train_loss": -40.37537384033203, "global_step": 212432, "epoch": 1755} {"train_loss": -40.50484848022461, "global_step": 212433, "epoch": 1755} {"train_loss": -41.01942825317383, "global_step": 212434, "epoch": 1755} {"train_loss": -41.039161682128906, "global_step": 212435, "epoch": 1755} {"train_loss": -41.44223403930664, "global_step": 212436, "epoch": 1755} {"train_loss": -41.01735305786133, "global_step": 212437, "epoch": 1755} {"train_loss": -41.17615509033203, "global_step": 212438, "epoch": 1755} {"train_loss": -41.173763275146484, "global_step": 212439, "epoch": 1755} {"train_loss": -40.635711669921875, "global_step": 212440, "epoch": 1755} {"train_loss": -41.57249450683594, "global_step": 212441, "epoch": 1755} {"train_loss": -41.35369873046875, "global_step": 212442, "epoch": 1755} {"train_loss": -42.0079231262207, "global_step": 212443, "epoch": 1755} {"train_loss": -41.43949508666992, "global_step": 212444, "epoch": 1755} {"train_loss": -41.80659103393555, "global_step": 212445, "epoch": 1755} {"train_loss": -42.00048065185547, "global_step": 212446, "epoch": 1755} {"train_loss": -42.17806625366211, "global_step": 212447, "epoch": 1755} {"train_loss": -41.80290603637695, "global_step": 212448, "epoch": 1755} {"train_loss": -42.72015380859375, "global_step": 212449, "epoch": 1755} {"train_loss": -41.743465423583984, "global_step": 212450, "epoch": 1755} {"train_loss": -41.878231048583984, "global_step": 212451, "epoch": 1755} {"train_loss": -42.21305465698242, "global_step": 212452, "epoch": 1755} {"train_loss": -42.26710891723633, "global_step": 212453, "epoch": 1755} {"train_loss": -42.715755462646484, "global_step": 212454, "epoch": 1755} {"train_loss": -42.32711410522461, "global_step": 212455, "epoch": 1755} {"train_loss": -42.53898239135742, "global_step": 212456, "epoch": 1755} {"train_loss": -42.58204650878906, "global_step": 212457, "epoch": 1755} {"train_loss": -42.26408004760742, "global_step": 212458, "epoch": 1755} {"train_loss": -42.57169723510742, "global_step": 212459, "epoch": 1755} {"train_loss": -42.631046295166016, "global_step": 212460, "epoch": 1755} {"train_loss": -42.99081039428711, "global_step": 212461, "epoch": 1755} {"train_loss": -42.902862548828125, "global_step": 212462, "epoch": 1755} {"train_loss": -42.24921417236328, "global_step": 212463, "epoch": 1755} {"train_loss": -42.9305534362793, "global_step": 212464, "epoch": 1755} {"train_loss": -42.272335052490234, "global_step": 212465, "epoch": 1755} {"train_loss": -42.90571975708008, "global_step": 212466, "epoch": 1755} {"train_loss": -42.907020568847656, "global_step": 212467, "epoch": 1755} {"train_loss": -42.975040435791016, "global_step": 212468, "epoch": 1755} {"train_loss": -42.52714538574219, "global_step": 212469, "epoch": 1755} {"train_loss": -42.18156814575195, "global_step": 212470, "epoch": 1755} {"train_loss": -42.69352340698242, "global_step": 212471, "epoch": 1755} {"train_loss": -42.92721176147461, "global_step": 212472, "epoch": 1755} {"train_loss": -42.2862663269043, "global_step": 212473, "epoch": 1755} {"train_loss": -42.83770751953125, "global_step": 212474, "epoch": 1755} {"train_loss": -39.996632473527896, "global_step": 212475, "epoch": 1755, "val_loss": 2560558.25} {"train_loss": -40.65449905395508, "global_step": 212476, "epoch": 1756} {"train_loss": -39.41180419921875, "global_step": 212477, "epoch": 1756} {"train_loss": -40.07537078857422, "global_step": 212478, "epoch": 1756} {"train_loss": -42.0999641418457, "global_step": 212479, "epoch": 1756} {"train_loss": -42.41549301147461, "global_step": 212480, "epoch": 1756} {"train_loss": -40.89005661010742, "global_step": 212481, "epoch": 1756} {"train_loss": -40.72818374633789, "global_step": 212482, "epoch": 1756} {"train_loss": -41.357723236083984, "global_step": 212483, "epoch": 1756} {"train_loss": -41.9463996887207, "global_step": 212484, "epoch": 1756} {"train_loss": -42.15464401245117, "global_step": 212485, "epoch": 1756} {"train_loss": -41.66434097290039, "global_step": 212486, "epoch": 1756} {"train_loss": -42.224788665771484, "global_step": 212487, "epoch": 1756} {"train_loss": -42.097408294677734, "global_step": 212488, "epoch": 1756} {"train_loss": -42.64596176147461, "global_step": 212489, "epoch": 1756} {"train_loss": -42.2286376953125, "global_step": 212490, "epoch": 1756} {"train_loss": -42.74617004394531, "global_step": 212491, "epoch": 1756} {"train_loss": -42.9114990234375, "global_step": 212492, "epoch": 1756} {"train_loss": -42.8679313659668, "global_step": 212493, "epoch": 1756} {"train_loss": -43.194091796875, "global_step": 212494, "epoch": 1756} {"train_loss": -42.16126251220703, "global_step": 212495, "epoch": 1756} {"train_loss": -42.30402374267578, "global_step": 212496, "epoch": 1756} {"train_loss": -42.97040939331055, "global_step": 212497, "epoch": 1756} {"train_loss": -42.88814163208008, "global_step": 212498, "epoch": 1756} {"train_loss": -42.51717758178711, "global_step": 212499, "epoch": 1756} {"train_loss": -42.791473388671875, "global_step": 212500, "epoch": 1756} {"train_loss": -42.56834030151367, "global_step": 212501, "epoch": 1756} {"train_loss": -42.21847152709961, "global_step": 212502, "epoch": 1756} {"train_loss": -42.92850875854492, "global_step": 212503, "epoch": 1756} {"train_loss": -42.65980529785156, "global_step": 212504, "epoch": 1756} {"train_loss": -43.14332962036133, "global_step": 212505, "epoch": 1756} {"train_loss": -42.53517532348633, "global_step": 212506, "epoch": 1756} {"train_loss": -42.73286056518555, "global_step": 212507, "epoch": 1756} {"train_loss": -42.807281494140625, "global_step": 212508, "epoch": 1756} {"train_loss": -43.19794464111328, "global_step": 212509, "epoch": 1756} {"train_loss": -42.904232025146484, "global_step": 212510, "epoch": 1756} {"train_loss": -42.634674072265625, "global_step": 212511, "epoch": 1756} {"train_loss": -42.70022201538086, "global_step": 212512, "epoch": 1756} {"train_loss": -43.21220779418945, "global_step": 212513, "epoch": 1756} {"train_loss": -43.08199691772461, "global_step": 212514, "epoch": 1756} {"train_loss": -42.40242385864258, "global_step": 212515, "epoch": 1756} {"train_loss": -42.75392532348633, "global_step": 212516, "epoch": 1756} {"train_loss": -43.212459564208984, "global_step": 212517, "epoch": 1756} {"train_loss": -42.704097747802734, "global_step": 212518, "epoch": 1756} {"train_loss": -42.711116790771484, "global_step": 212519, "epoch": 1756} {"train_loss": -42.785865783691406, "global_step": 212520, "epoch": 1756} {"train_loss": -42.284942626953125, "global_step": 212521, "epoch": 1756} {"train_loss": -42.57905960083008, "global_step": 212522, "epoch": 1756} {"train_loss": -41.548072814941406, "global_step": 212523, "epoch": 1756} {"train_loss": -41.717567443847656, "global_step": 212524, "epoch": 1756} {"train_loss": -41.90178298950195, "global_step": 212525, "epoch": 1756} {"train_loss": -42.2902946472168, "global_step": 212526, "epoch": 1756} {"train_loss": -41.80839920043945, "global_step": 212527, "epoch": 1756} {"train_loss": -41.187660217285156, "global_step": 212528, "epoch": 1756} {"train_loss": -39.62632369995117, "global_step": 212529, "epoch": 1756} {"train_loss": -38.24270248413086, "global_step": 212530, "epoch": 1756} {"train_loss": -40.94889450073242, "global_step": 212531, "epoch": 1756} {"train_loss": -38.035457611083984, "global_step": 212532, "epoch": 1756} {"train_loss": -42.22774887084961, "global_step": 212533, "epoch": 1756} {"train_loss": -37.299903869628906, "global_step": 212534, "epoch": 1756} {"train_loss": -41.45365524291992, "global_step": 212535, "epoch": 1756} {"train_loss": -36.4843635559082, "global_step": 212536, "epoch": 1756} {"train_loss": -35.90509796142578, "global_step": 212537, "epoch": 1756} {"train_loss": -37.499996185302734, "global_step": 212538, "epoch": 1756} {"train_loss": -38.07673645019531, "global_step": 212539, "epoch": 1756} {"train_loss": -35.766048431396484, "global_step": 212540, "epoch": 1756} {"train_loss": -37.78303146362305, "global_step": 212541, "epoch": 1756} {"train_loss": -37.49311065673828, "global_step": 212542, "epoch": 1756} {"train_loss": -36.9338493347168, "global_step": 212543, "epoch": 1756} {"train_loss": -37.984031677246094, "global_step": 212544, "epoch": 1756} {"train_loss": -38.84904479980469, "global_step": 212545, "epoch": 1756} {"train_loss": -37.87972640991211, "global_step": 212546, "epoch": 1756} {"train_loss": -39.91313552856445, "global_step": 212547, "epoch": 1756} {"train_loss": -38.992000579833984, "global_step": 212548, "epoch": 1756} {"train_loss": -38.616607666015625, "global_step": 212549, "epoch": 1756} {"train_loss": -40.12126541137695, "global_step": 212550, "epoch": 1756} {"train_loss": -39.06538772583008, "global_step": 212551, "epoch": 1756} {"train_loss": -40.83917999267578, "global_step": 212552, "epoch": 1756} {"train_loss": -40.7324104309082, "global_step": 212553, "epoch": 1756} {"train_loss": -41.76002502441406, "global_step": 212554, "epoch": 1756} {"train_loss": -41.1905632019043, "global_step": 212555, "epoch": 1756} {"train_loss": -40.903900146484375, "global_step": 212556, "epoch": 1756} {"train_loss": -40.7216682434082, "global_step": 212557, "epoch": 1756} {"train_loss": -41.955745697021484, "global_step": 212558, "epoch": 1756} {"train_loss": -41.60088348388672, "global_step": 212559, "epoch": 1756} {"train_loss": -41.98291778564453, "global_step": 212560, "epoch": 1756} {"train_loss": -41.931060791015625, "global_step": 212561, "epoch": 1756} {"train_loss": -41.93130111694336, "global_step": 212562, "epoch": 1756} {"train_loss": -41.391090393066406, "global_step": 212563, "epoch": 1756} {"train_loss": -41.88552474975586, "global_step": 212564, "epoch": 1756} {"train_loss": -41.83248519897461, "global_step": 212565, "epoch": 1756} {"train_loss": -42.18198776245117, "global_step": 212566, "epoch": 1756} {"train_loss": -41.663658142089844, "global_step": 212567, "epoch": 1756} {"train_loss": -42.15006637573242, "global_step": 212568, "epoch": 1756} {"train_loss": -41.897727966308594, "global_step": 212569, "epoch": 1756} {"train_loss": -41.77959060668945, "global_step": 212570, "epoch": 1756} {"train_loss": -41.580780029296875, "global_step": 212571, "epoch": 1756} {"train_loss": -42.382381439208984, "global_step": 212572, "epoch": 1756} {"train_loss": -42.205230712890625, "global_step": 212573, "epoch": 1756} {"train_loss": -42.19452667236328, "global_step": 212574, "epoch": 1756} {"train_loss": -42.26313400268555, "global_step": 212575, "epoch": 1756} {"train_loss": -41.399169921875, "global_step": 212576, "epoch": 1756} {"train_loss": -42.1981315612793, "global_step": 212577, "epoch": 1756} {"train_loss": -41.5860595703125, "global_step": 212578, "epoch": 1756} {"train_loss": -42.1767692565918, "global_step": 212579, "epoch": 1756} {"train_loss": -41.456443786621094, "global_step": 212580, "epoch": 1756} {"train_loss": -42.064666748046875, "global_step": 212581, "epoch": 1756} {"train_loss": -42.13325500488281, "global_step": 212582, "epoch": 1756} {"train_loss": -41.94367599487305, "global_step": 212583, "epoch": 1756} {"train_loss": -42.15815353393555, "global_step": 212584, "epoch": 1756} {"train_loss": -41.83439254760742, "global_step": 212585, "epoch": 1756} {"train_loss": -41.2490348815918, "global_step": 212586, "epoch": 1756} {"train_loss": -41.24514389038086, "global_step": 212587, "epoch": 1756} {"train_loss": -41.73698043823242, "global_step": 212588, "epoch": 1756} {"train_loss": -41.83353805541992, "global_step": 212589, "epoch": 1756} {"train_loss": -42.43961715698242, "global_step": 212590, "epoch": 1756} {"train_loss": -41.32969284057617, "global_step": 212591, "epoch": 1756} {"train_loss": -40.90618896484375, "global_step": 212592, "epoch": 1756} {"train_loss": -42.45205307006836, "global_step": 212593, "epoch": 1756} {"train_loss": -40.38037109375, "global_step": 212594, "epoch": 1756} {"train_loss": -39.25287628173828, "global_step": 212595, "epoch": 1756} {"train_loss": -41.33059723909236, "global_step": 212596, "epoch": 1756, "val_loss": 2562313.25} {"train_loss": -40.0949592590332, "global_step": 212597, "epoch": 1757} {"train_loss": -41.94639205932617, "global_step": 212598, "epoch": 1757} {"train_loss": -39.86103820800781, "global_step": 212599, "epoch": 1757} {"train_loss": -41.68151092529297, "global_step": 212600, "epoch": 1757} {"train_loss": -41.755157470703125, "global_step": 212601, "epoch": 1757} {"train_loss": -40.65064239501953, "global_step": 212602, "epoch": 1757} {"train_loss": -42.37826156616211, "global_step": 212603, "epoch": 1757} {"train_loss": -40.76673889160156, "global_step": 212604, "epoch": 1757} {"train_loss": -42.41413497924805, "global_step": 212605, "epoch": 1757} {"train_loss": -41.5348014831543, "global_step": 212606, "epoch": 1757} {"train_loss": -41.40141677856445, "global_step": 212607, "epoch": 1757} {"train_loss": -42.32417297363281, "global_step": 212608, "epoch": 1757} {"train_loss": -41.5173225402832, "global_step": 212609, "epoch": 1757} {"train_loss": -43.01127624511719, "global_step": 212610, "epoch": 1757} {"train_loss": -40.20230484008789, "global_step": 212611, "epoch": 1757} {"train_loss": -41.81435775756836, "global_step": 212612, "epoch": 1757} {"train_loss": -41.0595588684082, "global_step": 212613, "epoch": 1757} {"train_loss": -41.922489166259766, "global_step": 212614, "epoch": 1757} {"train_loss": -42.13713455200195, "global_step": 212615, "epoch": 1757} {"train_loss": -42.30009841918945, "global_step": 212616, "epoch": 1757} {"train_loss": -42.37501907348633, "global_step": 212617, "epoch": 1757} {"train_loss": -41.88178253173828, "global_step": 212618, "epoch": 1757} {"train_loss": -42.54800033569336, "global_step": 212619, "epoch": 1757} {"train_loss": -41.95009994506836, "global_step": 212620, "epoch": 1757} {"train_loss": -42.99665069580078, "global_step": 212621, "epoch": 1757} {"train_loss": -41.79536056518555, "global_step": 212622, "epoch": 1757} {"train_loss": -42.59092330932617, "global_step": 212623, "epoch": 1757} {"train_loss": -41.947608947753906, "global_step": 212624, "epoch": 1757} {"train_loss": -41.88458251953125, "global_step": 212625, "epoch": 1757} {"train_loss": -42.62845993041992, "global_step": 212626, "epoch": 1757} {"train_loss": -41.85905075073242, "global_step": 212627, "epoch": 1757} {"train_loss": -41.27483367919922, "global_step": 212628, "epoch": 1757} {"train_loss": -41.50197219848633, "global_step": 212629, "epoch": 1757} {"train_loss": -42.679359436035156, "global_step": 212630, "epoch": 1757} {"train_loss": -42.2261962890625, "global_step": 212631, "epoch": 1757} {"train_loss": -41.74604415893555, "global_step": 212632, "epoch": 1757} {"train_loss": -42.42245101928711, "global_step": 212633, "epoch": 1757} {"train_loss": -41.48725128173828, "global_step": 212634, "epoch": 1757} {"train_loss": -42.3585319519043, "global_step": 212635, "epoch": 1757} {"train_loss": -42.13818359375, "global_step": 212636, "epoch": 1757} {"train_loss": -41.52523422241211, "global_step": 212637, "epoch": 1757} {"train_loss": -40.935909271240234, "global_step": 212638, "epoch": 1757} {"train_loss": -41.7627067565918, "global_step": 212639, "epoch": 1757} {"train_loss": -41.13886642456055, "global_step": 212640, "epoch": 1757} {"train_loss": -42.43166732788086, "global_step": 212641, "epoch": 1757} {"train_loss": -42.35457992553711, "global_step": 212642, "epoch": 1757} {"train_loss": -41.69673538208008, "global_step": 212643, "epoch": 1757} {"train_loss": -41.932613372802734, "global_step": 212644, "epoch": 1757} {"train_loss": -41.51304244995117, "global_step": 212645, "epoch": 1757} {"train_loss": -42.388031005859375, "global_step": 212646, "epoch": 1757} {"train_loss": -42.51569366455078, "global_step": 212647, "epoch": 1757} {"train_loss": -40.80188751220703, "global_step": 212648, "epoch": 1757} {"train_loss": -40.62821578979492, "global_step": 212649, "epoch": 1757} {"train_loss": -42.569740295410156, "global_step": 212650, "epoch": 1757} {"train_loss": -38.239784240722656, "global_step": 212651, "epoch": 1757} {"train_loss": -40.62250900268555, "global_step": 212652, "epoch": 1757} {"train_loss": -41.508636474609375, "global_step": 212653, "epoch": 1757} {"train_loss": -41.085853576660156, "global_step": 212654, "epoch": 1757} {"train_loss": -38.271995544433594, "global_step": 212655, "epoch": 1757} {"train_loss": -42.65705108642578, "global_step": 212656, "epoch": 1757} {"train_loss": -39.86786651611328, "global_step": 212657, "epoch": 1757} {"train_loss": -40.64900588989258, "global_step": 212658, "epoch": 1757} {"train_loss": -42.29931640625, "global_step": 212659, "epoch": 1757} {"train_loss": -41.907470703125, "global_step": 212660, "epoch": 1757} {"train_loss": -41.52798080444336, "global_step": 212661, "epoch": 1757} {"train_loss": -42.377498626708984, "global_step": 212662, "epoch": 1757} {"train_loss": -41.00018310546875, "global_step": 212663, "epoch": 1757} {"train_loss": -41.99345779418945, "global_step": 212664, "epoch": 1757} {"train_loss": -41.699703216552734, "global_step": 212665, "epoch": 1757} {"train_loss": -41.234615325927734, "global_step": 212666, "epoch": 1757} {"train_loss": -42.35279083251953, "global_step": 212667, "epoch": 1757} {"train_loss": -41.97651672363281, "global_step": 212668, "epoch": 1757} {"train_loss": -42.41378402709961, "global_step": 212669, "epoch": 1757} {"train_loss": -41.798194885253906, "global_step": 212670, "epoch": 1757} {"train_loss": -42.556304931640625, "global_step": 212671, "epoch": 1757} {"train_loss": -42.58626174926758, "global_step": 212672, "epoch": 1757} {"train_loss": -42.76913070678711, "global_step": 212673, "epoch": 1757} {"train_loss": -42.70143127441406, "global_step": 212674, "epoch": 1757} {"train_loss": -42.74260711669922, "global_step": 212675, "epoch": 1757} {"train_loss": -42.38469314575195, "global_step": 212676, "epoch": 1757} {"train_loss": -42.63010787963867, "global_step": 212677, "epoch": 1757} {"train_loss": -42.84371566772461, "global_step": 212678, "epoch": 1757} {"train_loss": -43.1633415222168, "global_step": 212679, "epoch": 1757} {"train_loss": -43.0410041809082, "global_step": 212680, "epoch": 1757} {"train_loss": -42.34634780883789, "global_step": 212681, "epoch": 1757} {"train_loss": -42.755615234375, "global_step": 212682, "epoch": 1757} {"train_loss": -42.879268646240234, "global_step": 212683, "epoch": 1757} {"train_loss": -42.16644287109375, "global_step": 212684, "epoch": 1757} {"train_loss": -41.4139518737793, "global_step": 212685, "epoch": 1757} {"train_loss": -42.35504150390625, "global_step": 212686, "epoch": 1757} {"train_loss": -42.75870895385742, "global_step": 212687, "epoch": 1757} {"train_loss": -41.52327346801758, "global_step": 212688, "epoch": 1757} {"train_loss": -41.4803352355957, "global_step": 212689, "epoch": 1757} {"train_loss": -42.98133087158203, "global_step": 212690, "epoch": 1757} {"train_loss": -42.29142761230469, "global_step": 212691, "epoch": 1757} {"train_loss": -42.224308013916016, "global_step": 212692, "epoch": 1757} {"train_loss": -42.91398239135742, "global_step": 212693, "epoch": 1757} {"train_loss": -42.08829879760742, "global_step": 212694, "epoch": 1757} {"train_loss": -41.783199310302734, "global_step": 212695, "epoch": 1757} {"train_loss": -41.27927017211914, "global_step": 212696, "epoch": 1757} {"train_loss": -41.13877868652344, "global_step": 212697, "epoch": 1757} {"train_loss": -41.84102249145508, "global_step": 212698, "epoch": 1757} {"train_loss": -41.622623443603516, "global_step": 212699, "epoch": 1757} {"train_loss": -40.5037841796875, "global_step": 212700, "epoch": 1757} {"train_loss": -42.2160758972168, "global_step": 212701, "epoch": 1757} {"train_loss": -42.79463195800781, "global_step": 212702, "epoch": 1757} {"train_loss": -42.74874496459961, "global_step": 212703, "epoch": 1757} {"train_loss": -42.56936264038086, "global_step": 212704, "epoch": 1757} {"train_loss": -42.4737434387207, "global_step": 212705, "epoch": 1757} {"train_loss": -42.872703552246094, "global_step": 212706, "epoch": 1757} {"train_loss": -42.87201690673828, "global_step": 212707, "epoch": 1757} {"train_loss": -42.004608154296875, "global_step": 212708, "epoch": 1757} {"train_loss": -41.00518035888672, "global_step": 212709, "epoch": 1757} {"train_loss": -41.570491790771484, "global_step": 212710, "epoch": 1757} {"train_loss": -43.01383590698242, "global_step": 212711, "epoch": 1757} {"train_loss": -43.046661376953125, "global_step": 212712, "epoch": 1757} {"train_loss": -40.68962478637695, "global_step": 212713, "epoch": 1757} {"train_loss": -42.43067169189453, "global_step": 212714, "epoch": 1757} {"train_loss": -42.904945373535156, "global_step": 212715, "epoch": 1757} {"train_loss": -41.811588287353516, "global_step": 212716, "epoch": 1757} {"train_loss": -41.88301376468879, "global_step": 212717, "epoch": 1757, "val_loss": 2635673.0} {"train_loss": -40.86548614501953, "global_step": 212718, "epoch": 1758} {"train_loss": -42.6580696105957, "global_step": 212719, "epoch": 1758} {"train_loss": -40.58376693725586, "global_step": 212720, "epoch": 1758} {"train_loss": -40.88505935668945, "global_step": 212721, "epoch": 1758} {"train_loss": -42.6515998840332, "global_step": 212722, "epoch": 1758} {"train_loss": -41.8125114440918, "global_step": 212723, "epoch": 1758} {"train_loss": -42.03580093383789, "global_step": 212724, "epoch": 1758} {"train_loss": -43.018455505371094, "global_step": 212725, "epoch": 1758} {"train_loss": -42.398590087890625, "global_step": 212726, "epoch": 1758} {"train_loss": -42.38359451293945, "global_step": 212727, "epoch": 1758} {"train_loss": -43.16559600830078, "global_step": 212728, "epoch": 1758} {"train_loss": -42.68528747558594, "global_step": 212729, "epoch": 1758} {"train_loss": -42.6503791809082, "global_step": 212730, "epoch": 1758} {"train_loss": -42.755069732666016, "global_step": 212731, "epoch": 1758} {"train_loss": -42.86807632446289, "global_step": 212732, "epoch": 1758} {"train_loss": -42.913246154785156, "global_step": 212733, "epoch": 1758} {"train_loss": -43.20036697387695, "global_step": 212734, "epoch": 1758} {"train_loss": -42.897064208984375, "global_step": 212735, "epoch": 1758} {"train_loss": -42.93061447143555, "global_step": 212736, "epoch": 1758} {"train_loss": -42.66927719116211, "global_step": 212737, "epoch": 1758} {"train_loss": -42.61477279663086, "global_step": 212738, "epoch": 1758} {"train_loss": -42.197452545166016, "global_step": 212739, "epoch": 1758} {"train_loss": -42.479793548583984, "global_step": 212740, "epoch": 1758} {"train_loss": -42.963348388671875, "global_step": 212741, "epoch": 1758} {"train_loss": -42.9293098449707, "global_step": 212742, "epoch": 1758} {"train_loss": -42.71488571166992, "global_step": 212743, "epoch": 1758} {"train_loss": -42.54255676269531, "global_step": 212744, "epoch": 1758} {"train_loss": -43.141090393066406, "global_step": 212745, "epoch": 1758} {"train_loss": -42.943477630615234, "global_step": 212746, "epoch": 1758} {"train_loss": -42.662208557128906, "global_step": 212747, "epoch": 1758} {"train_loss": -42.04203414916992, "global_step": 212748, "epoch": 1758} {"train_loss": -43.107608795166016, "global_step": 212749, "epoch": 1758} {"train_loss": -43.27676773071289, "global_step": 212750, "epoch": 1758} {"train_loss": -42.96372604370117, "global_step": 212751, "epoch": 1758} {"train_loss": -43.02999496459961, "global_step": 212752, "epoch": 1758} {"train_loss": -42.58808517456055, "global_step": 212753, "epoch": 1758} {"train_loss": -43.1881217956543, "global_step": 212754, "epoch": 1758} {"train_loss": -42.83173751831055, "global_step": 212755, "epoch": 1758} {"train_loss": -40.499385833740234, "global_step": 212756, "epoch": 1758} {"train_loss": -41.539276123046875, "global_step": 212757, "epoch": 1758} {"train_loss": -41.74268341064453, "global_step": 212758, "epoch": 1758} {"train_loss": -42.70392990112305, "global_step": 212759, "epoch": 1758} {"train_loss": -43.24894332885742, "global_step": 212760, "epoch": 1758} {"train_loss": -42.3321418762207, "global_step": 212761, "epoch": 1758} {"train_loss": -42.61995315551758, "global_step": 212762, "epoch": 1758} {"train_loss": -43.20682907104492, "global_step": 212763, "epoch": 1758} {"train_loss": -42.479270935058594, "global_step": 212764, "epoch": 1758} {"train_loss": -42.71889114379883, "global_step": 212765, "epoch": 1758} {"train_loss": -42.74757766723633, "global_step": 212766, "epoch": 1758} {"train_loss": -41.2788200378418, "global_step": 212767, "epoch": 1758} {"train_loss": -40.67110824584961, "global_step": 212768, "epoch": 1758} {"train_loss": -42.54764938354492, "global_step": 212769, "epoch": 1758} {"train_loss": -41.887939453125, "global_step": 212770, "epoch": 1758} {"train_loss": -41.49826431274414, "global_step": 212771, "epoch": 1758} {"train_loss": -42.43775177001953, "global_step": 212772, "epoch": 1758} {"train_loss": -42.89452362060547, "global_step": 212773, "epoch": 1758} {"train_loss": -42.591033935546875, "global_step": 212774, "epoch": 1758} {"train_loss": -42.331092834472656, "global_step": 212775, "epoch": 1758} {"train_loss": -42.61180114746094, "global_step": 212776, "epoch": 1758} {"train_loss": -42.68156051635742, "global_step": 212777, "epoch": 1758} {"train_loss": -42.561195373535156, "global_step": 212778, "epoch": 1758} {"train_loss": -42.584686279296875, "global_step": 212779, "epoch": 1758} {"train_loss": -42.8929557800293, "global_step": 212780, "epoch": 1758} {"train_loss": -42.47209548950195, "global_step": 212781, "epoch": 1758} {"train_loss": -42.55507278442383, "global_step": 212782, "epoch": 1758} {"train_loss": -42.978851318359375, "global_step": 212783, "epoch": 1758} {"train_loss": -42.20831298828125, "global_step": 212784, "epoch": 1758} {"train_loss": -42.51118469238281, "global_step": 212785, "epoch": 1758} {"train_loss": -41.73696517944336, "global_step": 212786, "epoch": 1758} {"train_loss": -41.82803726196289, "global_step": 212787, "epoch": 1758} {"train_loss": -42.30963897705078, "global_step": 212788, "epoch": 1758} {"train_loss": -43.03072738647461, "global_step": 212789, "epoch": 1758} {"train_loss": -43.05952835083008, "global_step": 212790, "epoch": 1758} {"train_loss": -41.63116455078125, "global_step": 212791, "epoch": 1758} {"train_loss": -41.11183166503906, "global_step": 212792, "epoch": 1758} {"train_loss": -41.33559799194336, "global_step": 212793, "epoch": 1758} {"train_loss": -40.10737228393555, "global_step": 212794, "epoch": 1758} {"train_loss": -40.531463623046875, "global_step": 212795, "epoch": 1758} {"train_loss": -41.39530563354492, "global_step": 212796, "epoch": 1758} {"train_loss": -42.07123565673828, "global_step": 212797, "epoch": 1758} {"train_loss": -42.08364486694336, "global_step": 212798, "epoch": 1758} {"train_loss": -42.186279296875, "global_step": 212799, "epoch": 1758} {"train_loss": -41.365028381347656, "global_step": 212800, "epoch": 1758} {"train_loss": -40.931514739990234, "global_step": 212801, "epoch": 1758} {"train_loss": -40.127166748046875, "global_step": 212802, "epoch": 1758} {"train_loss": -40.17692565917969, "global_step": 212803, "epoch": 1758} {"train_loss": -40.81986618041992, "global_step": 212804, "epoch": 1758} {"train_loss": -40.480377197265625, "global_step": 212805, "epoch": 1758} {"train_loss": -39.760162353515625, "global_step": 212806, "epoch": 1758} {"train_loss": -40.923011779785156, "global_step": 212807, "epoch": 1758} {"train_loss": -41.11730194091797, "global_step": 212808, "epoch": 1758} {"train_loss": -41.74949264526367, "global_step": 212809, "epoch": 1758} {"train_loss": -38.63325881958008, "global_step": 212810, "epoch": 1758} {"train_loss": -41.63778305053711, "global_step": 212811, "epoch": 1758} {"train_loss": -40.934139251708984, "global_step": 212812, "epoch": 1758} {"train_loss": -38.430633544921875, "global_step": 212813, "epoch": 1758} {"train_loss": -40.56556701660156, "global_step": 212814, "epoch": 1758} {"train_loss": -40.0725212097168, "global_step": 212815, "epoch": 1758} {"train_loss": -39.619606018066406, "global_step": 212816, "epoch": 1758} {"train_loss": -40.97629928588867, "global_step": 212817, "epoch": 1758} {"train_loss": -39.85807418823242, "global_step": 212818, "epoch": 1758} {"train_loss": -41.33916091918945, "global_step": 212819, "epoch": 1758} {"train_loss": -41.58822250366211, "global_step": 212820, "epoch": 1758} {"train_loss": -40.4611930847168, "global_step": 212821, "epoch": 1758} {"train_loss": -42.00856399536133, "global_step": 212822, "epoch": 1758} {"train_loss": -41.032039642333984, "global_step": 212823, "epoch": 1758} {"train_loss": -41.52358627319336, "global_step": 212824, "epoch": 1758} {"train_loss": -42.52651596069336, "global_step": 212825, "epoch": 1758} {"train_loss": -41.1510009765625, "global_step": 212826, "epoch": 1758} {"train_loss": -41.35660934448242, "global_step": 212827, "epoch": 1758} {"train_loss": -41.62647247314453, "global_step": 212828, "epoch": 1758} {"train_loss": -41.0357551574707, "global_step": 212829, "epoch": 1758} {"train_loss": -41.811309814453125, "global_step": 212830, "epoch": 1758} {"train_loss": -42.183902740478516, "global_step": 212831, "epoch": 1758} {"train_loss": -41.9200325012207, "global_step": 212832, "epoch": 1758} {"train_loss": -42.32405471801758, "global_step": 212833, "epoch": 1758} {"train_loss": -42.150394439697266, "global_step": 212834, "epoch": 1758} {"train_loss": -42.82996368408203, "global_step": 212835, "epoch": 1758} {"train_loss": -42.450130462646484, "global_step": 212836, "epoch": 1758} {"train_loss": -43.19169235229492, "global_step": 212837, "epoch": 1758} {"train_loss": -41.97080700456603, "global_step": 212838, "epoch": 1758, "val_loss": 2514518.25} {"train_loss": -43.09202194213867, "global_step": 212839, "epoch": 1759} {"train_loss": -42.75194549560547, "global_step": 212840, "epoch": 1759} {"train_loss": -42.593528747558594, "global_step": 212841, "epoch": 1759} {"train_loss": -43.13261795043945, "global_step": 212842, "epoch": 1759} {"train_loss": -42.17405319213867, "global_step": 212843, "epoch": 1759} {"train_loss": -43.00532913208008, "global_step": 212844, "epoch": 1759} {"train_loss": -42.90243148803711, "global_step": 212845, "epoch": 1759} {"train_loss": -42.70216751098633, "global_step": 212846, "epoch": 1759} {"train_loss": -42.64519500732422, "global_step": 212847, "epoch": 1759} {"train_loss": -43.006385803222656, "global_step": 212848, "epoch": 1759} {"train_loss": -42.95606994628906, "global_step": 212849, "epoch": 1759} {"train_loss": -43.29024887084961, "global_step": 212850, "epoch": 1759} {"train_loss": -42.161983489990234, "global_step": 212851, "epoch": 1759} {"train_loss": -42.572486877441406, "global_step": 212852, "epoch": 1759} {"train_loss": -43.11848068237305, "global_step": 212853, "epoch": 1759} {"train_loss": -42.53422927856445, "global_step": 212854, "epoch": 1759} {"train_loss": -42.708980560302734, "global_step": 212855, "epoch": 1759} {"train_loss": -42.93796920776367, "global_step": 212856, "epoch": 1759} {"train_loss": -43.16009521484375, "global_step": 212857, "epoch": 1759} {"train_loss": -42.556190490722656, "global_step": 212858, "epoch": 1759} {"train_loss": -42.86701202392578, "global_step": 212859, "epoch": 1759} {"train_loss": -43.231021881103516, "global_step": 212860, "epoch": 1759} {"train_loss": -43.36663818359375, "global_step": 212861, "epoch": 1759} {"train_loss": -42.6512336730957, "global_step": 212862, "epoch": 1759} {"train_loss": -42.81925582885742, "global_step": 212863, "epoch": 1759} {"train_loss": -42.639217376708984, "global_step": 212864, "epoch": 1759} {"train_loss": -42.09565353393555, "global_step": 212865, "epoch": 1759} {"train_loss": -42.66796875, "global_step": 212866, "epoch": 1759} {"train_loss": -42.83304214477539, "global_step": 212867, "epoch": 1759} {"train_loss": -43.40995407104492, "global_step": 212868, "epoch": 1759} {"train_loss": -41.20030975341797, "global_step": 212869, "epoch": 1759} {"train_loss": -43.1759147644043, "global_step": 212870, "epoch": 1759} {"train_loss": -42.3437385559082, "global_step": 212871, "epoch": 1759} {"train_loss": -42.05156707763672, "global_step": 212872, "epoch": 1759} {"train_loss": -41.621726989746094, "global_step": 212873, "epoch": 1759} {"train_loss": -41.809017181396484, "global_step": 212874, "epoch": 1759} {"train_loss": -42.788055419921875, "global_step": 212875, "epoch": 1759} {"train_loss": -43.33926773071289, "global_step": 212876, "epoch": 1759} {"train_loss": -42.30831527709961, "global_step": 212877, "epoch": 1759} {"train_loss": -42.19355392456055, "global_step": 212878, "epoch": 1759} {"train_loss": -40.60789108276367, "global_step": 212879, "epoch": 1759} {"train_loss": -42.27769088745117, "global_step": 212880, "epoch": 1759} {"train_loss": -42.6931266784668, "global_step": 212881, "epoch": 1759} {"train_loss": -42.72704315185547, "global_step": 212882, "epoch": 1759} {"train_loss": -42.8184928894043, "global_step": 212883, "epoch": 1759} {"train_loss": -42.15253448486328, "global_step": 212884, "epoch": 1759} {"train_loss": -42.170284271240234, "global_step": 212885, "epoch": 1759} {"train_loss": -41.72568893432617, "global_step": 212886, "epoch": 1759} {"train_loss": -42.54718017578125, "global_step": 212887, "epoch": 1759} {"train_loss": -40.435733795166016, "global_step": 212888, "epoch": 1759} {"train_loss": -39.4060173034668, "global_step": 212889, "epoch": 1759} {"train_loss": -42.36725616455078, "global_step": 212890, "epoch": 1759} {"train_loss": -40.49126434326172, "global_step": 212891, "epoch": 1759} {"train_loss": -37.247039794921875, "global_step": 212892, "epoch": 1759} {"train_loss": -41.04932403564453, "global_step": 212893, "epoch": 1759} {"train_loss": -35.77943801879883, "global_step": 212894, "epoch": 1759} {"train_loss": -38.7959098815918, "global_step": 212895, "epoch": 1759} {"train_loss": -36.41292953491211, "global_step": 212896, "epoch": 1759} {"train_loss": -39.10034942626953, "global_step": 212897, "epoch": 1759} {"train_loss": -38.66428756713867, "global_step": 212898, "epoch": 1759} {"train_loss": -39.6788215637207, "global_step": 212899, "epoch": 1759} {"train_loss": -42.00478744506836, "global_step": 212900, "epoch": 1759} {"train_loss": -37.616432189941406, "global_step": 212901, "epoch": 1759} {"train_loss": -39.80107879638672, "global_step": 212902, "epoch": 1759} {"train_loss": -40.39424514770508, "global_step": 212903, "epoch": 1759} {"train_loss": -40.4371223449707, "global_step": 212904, "epoch": 1759} {"train_loss": -41.275997161865234, "global_step": 212905, "epoch": 1759} {"train_loss": -37.43403625488281, "global_step": 212906, "epoch": 1759} {"train_loss": -39.10581588745117, "global_step": 212907, "epoch": 1759} {"train_loss": -40.56708526611328, "global_step": 212908, "epoch": 1759} {"train_loss": -40.52812576293945, "global_step": 212909, "epoch": 1759} {"train_loss": -40.28337860107422, "global_step": 212910, "epoch": 1759} {"train_loss": -39.76339340209961, "global_step": 212911, "epoch": 1759} {"train_loss": -38.678321838378906, "global_step": 212912, "epoch": 1759} {"train_loss": -38.45232009887695, "global_step": 212913, "epoch": 1759} {"train_loss": -38.929317474365234, "global_step": 212914, "epoch": 1759} {"train_loss": -26.766529083251953, "global_step": 212915, "epoch": 1759} {"train_loss": -38.24392318725586, "global_step": 212916, "epoch": 1759} {"train_loss": -39.989776611328125, "global_step": 212917, "epoch": 1759} {"train_loss": -39.58138656616211, "global_step": 212918, "epoch": 1759} {"train_loss": -39.32217025756836, "global_step": 212919, "epoch": 1759} {"train_loss": -38.14191436767578, "global_step": 212920, "epoch": 1759} {"train_loss": -31.446134567260742, "global_step": 212921, "epoch": 1759} {"train_loss": -37.12349319458008, "global_step": 212922, "epoch": 1759} {"train_loss": -40.90013885498047, "global_step": 212923, "epoch": 1759} {"train_loss": -37.574642181396484, "global_step": 212924, "epoch": 1759} {"train_loss": -39.29119873046875, "global_step": 212925, "epoch": 1759} {"train_loss": -37.74639892578125, "global_step": 212926, "epoch": 1759} {"train_loss": -29.254730224609375, "global_step": 212927, "epoch": 1759} {"train_loss": -35.616981506347656, "global_step": 212928, "epoch": 1759} {"train_loss": -35.898433685302734, "global_step": 212929, "epoch": 1759} {"train_loss": -38.40372848510742, "global_step": 212930, "epoch": 1759} {"train_loss": -40.47489929199219, "global_step": 212931, "epoch": 1759} {"train_loss": -37.5712776184082, "global_step": 212932, "epoch": 1759} {"train_loss": -37.40398406982422, "global_step": 212933, "epoch": 1759} {"train_loss": -36.76481246948242, "global_step": 212934, "epoch": 1759} {"train_loss": -31.633604049682617, "global_step": 212935, "epoch": 1759} {"train_loss": -35.81557846069336, "global_step": 212936, "epoch": 1759} {"train_loss": -39.41809844970703, "global_step": 212937, "epoch": 1759} {"train_loss": -37.849178314208984, "global_step": 212938, "epoch": 1759} {"train_loss": -40.022979736328125, "global_step": 212939, "epoch": 1759} {"train_loss": -40.605255126953125, "global_step": 212940, "epoch": 1759} {"train_loss": -38.98057174682617, "global_step": 212941, "epoch": 1759} {"train_loss": -36.835079193115234, "global_step": 212942, "epoch": 1759} {"train_loss": -40.03764724731445, "global_step": 212943, "epoch": 1759} {"train_loss": -37.895118713378906, "global_step": 212944, "epoch": 1759} {"train_loss": -38.536136627197266, "global_step": 212945, "epoch": 1759} {"train_loss": -37.24766159057617, "global_step": 212946, "epoch": 1759} {"train_loss": -38.21689224243164, "global_step": 212947, "epoch": 1759} {"train_loss": -39.832252502441406, "global_step": 212948, "epoch": 1759} {"train_loss": -40.20633316040039, "global_step": 212949, "epoch": 1759} {"train_loss": -40.548583984375, "global_step": 212950, "epoch": 1759} {"train_loss": -39.343868255615234, "global_step": 212951, "epoch": 1759} {"train_loss": -40.01252365112305, "global_step": 212952, "epoch": 1759} {"train_loss": -39.263397216796875, "global_step": 212953, "epoch": 1759} {"train_loss": -38.64067840576172, "global_step": 212954, "epoch": 1759} {"train_loss": -40.091468811035156, "global_step": 212955, "epoch": 1759} {"train_loss": -40.20329666137695, "global_step": 212956, "epoch": 1759} {"train_loss": -40.242584228515625, "global_step": 212957, "epoch": 1759} {"train_loss": -41.47480010986328, "global_step": 212958, "epoch": 1759} {"train_loss": -40.190012435282554, "global_step": 212959, "epoch": 1759, "val_loss": 2571219.75} {"train_loss": -40.57088088989258, "global_step": 212960, "epoch": 1760} {"train_loss": -39.86316680908203, "global_step": 212961, "epoch": 1760} {"train_loss": -40.940025329589844, "global_step": 212962, "epoch": 1760} {"train_loss": -40.666622161865234, "global_step": 212963, "epoch": 1760} {"train_loss": -40.746490478515625, "global_step": 212964, "epoch": 1760} {"train_loss": -40.3065185546875, "global_step": 212965, "epoch": 1760} {"train_loss": -41.33007049560547, "global_step": 212966, "epoch": 1760} {"train_loss": -41.587345123291016, "global_step": 212967, "epoch": 1760} {"train_loss": -40.378658294677734, "global_step": 212968, "epoch": 1760} {"train_loss": -41.79420852661133, "global_step": 212969, "epoch": 1760} {"train_loss": -41.34836959838867, "global_step": 212970, "epoch": 1760} {"train_loss": -42.05898666381836, "global_step": 212971, "epoch": 1760} {"train_loss": -41.56142807006836, "global_step": 212972, "epoch": 1760} {"train_loss": -41.13661193847656, "global_step": 212973, "epoch": 1760} {"train_loss": -41.657623291015625, "global_step": 212974, "epoch": 1760} {"train_loss": -41.4116096496582, "global_step": 212975, "epoch": 1760} {"train_loss": -42.41917419433594, "global_step": 212976, "epoch": 1760} {"train_loss": -41.96662521362305, "global_step": 212977, "epoch": 1760} {"train_loss": -41.62995910644531, "global_step": 212978, "epoch": 1760} {"train_loss": -41.64409255981445, "global_step": 212979, "epoch": 1760} {"train_loss": -41.807960510253906, "global_step": 212980, "epoch": 1760} {"train_loss": -41.16654586791992, "global_step": 212981, "epoch": 1760} {"train_loss": -42.08259201049805, "global_step": 212982, "epoch": 1760} {"train_loss": -41.641571044921875, "global_step": 212983, "epoch": 1760} {"train_loss": -41.92841339111328, "global_step": 212984, "epoch": 1760} {"train_loss": -41.15808868408203, "global_step": 212985, "epoch": 1760} {"train_loss": -41.70915603637695, "global_step": 212986, "epoch": 1760} {"train_loss": -42.4576416015625, "global_step": 212987, "epoch": 1760} {"train_loss": -42.53538513183594, "global_step": 212988, "epoch": 1760} {"train_loss": -41.93898010253906, "global_step": 212989, "epoch": 1760} {"train_loss": -41.34339141845703, "global_step": 212990, "epoch": 1760} {"train_loss": -42.382774353027344, "global_step": 212991, "epoch": 1760} {"train_loss": -42.43954086303711, "global_step": 212992, "epoch": 1760} {"train_loss": -41.95726776123047, "global_step": 212993, "epoch": 1760} {"train_loss": -42.34295654296875, "global_step": 212994, "epoch": 1760} {"train_loss": -42.351314544677734, "global_step": 212995, "epoch": 1760} {"train_loss": -42.041439056396484, "global_step": 212996, "epoch": 1760} {"train_loss": -42.12482833862305, "global_step": 212997, "epoch": 1760} {"train_loss": -41.85781478881836, "global_step": 212998, "epoch": 1760} {"train_loss": -42.42868423461914, "global_step": 212999, "epoch": 1760} {"train_loss": -42.4384765625, "global_step": 213000, "epoch": 1760} {"train_loss": -42.49335479736328, "global_step": 213001, "epoch": 1760} {"train_loss": -41.925716400146484, "global_step": 213002, "epoch": 1760} {"train_loss": -42.94144058227539, "global_step": 213003, "epoch": 1760} {"train_loss": -42.3855094909668, "global_step": 213004, "epoch": 1760} {"train_loss": -42.7625617980957, "global_step": 213005, "epoch": 1760} {"train_loss": -42.24782180786133, "global_step": 213006, "epoch": 1760} {"train_loss": -42.73971176147461, "global_step": 213007, "epoch": 1760} {"train_loss": -42.26337814331055, "global_step": 213008, "epoch": 1760} {"train_loss": -42.43362045288086, "global_step": 213009, "epoch": 1760} {"train_loss": -42.579227447509766, "global_step": 213010, "epoch": 1760} {"train_loss": -42.7371826171875, "global_step": 213011, "epoch": 1760} {"train_loss": -42.64661407470703, "global_step": 213012, "epoch": 1760} {"train_loss": -42.38203811645508, "global_step": 213013, "epoch": 1760} {"train_loss": -42.00490188598633, "global_step": 213014, "epoch": 1760} {"train_loss": -42.616004943847656, "global_step": 213015, "epoch": 1760} {"train_loss": -42.565025329589844, "global_step": 213016, "epoch": 1760} {"train_loss": -42.14292526245117, "global_step": 213017, "epoch": 1760} {"train_loss": -42.593318939208984, "global_step": 213018, "epoch": 1760} {"train_loss": -42.504150390625, "global_step": 213019, "epoch": 1760} {"train_loss": -42.09035873413086, "global_step": 213020, "epoch": 1760} {"train_loss": -42.51810836791992, "global_step": 213021, "epoch": 1760} {"train_loss": -42.26070785522461, "global_step": 213022, "epoch": 1760} {"train_loss": -42.962581634521484, "global_step": 213023, "epoch": 1760} {"train_loss": -42.45821762084961, "global_step": 213024, "epoch": 1760} {"train_loss": -41.605567932128906, "global_step": 213025, "epoch": 1760} {"train_loss": -42.80992889404297, "global_step": 213026, "epoch": 1760} {"train_loss": -41.147315979003906, "global_step": 213027, "epoch": 1760} {"train_loss": -40.58420181274414, "global_step": 213028, "epoch": 1760} {"train_loss": -41.47877502441406, "global_step": 213029, "epoch": 1760} {"train_loss": -41.221256256103516, "global_step": 213030, "epoch": 1760} {"train_loss": -41.75533676147461, "global_step": 213031, "epoch": 1760} {"train_loss": -39.21102523803711, "global_step": 213032, "epoch": 1760} {"train_loss": -40.74399948120117, "global_step": 213033, "epoch": 1760} {"train_loss": -40.802711486816406, "global_step": 213034, "epoch": 1760} {"train_loss": -40.210716247558594, "global_step": 213035, "epoch": 1760} {"train_loss": -40.59653854370117, "global_step": 213036, "epoch": 1760} {"train_loss": -40.932716369628906, "global_step": 213037, "epoch": 1760} {"train_loss": -42.118194580078125, "global_step": 213038, "epoch": 1760} {"train_loss": -42.01331329345703, "global_step": 213039, "epoch": 1760} {"train_loss": -41.397857666015625, "global_step": 213040, "epoch": 1760} {"train_loss": -40.396636962890625, "global_step": 213041, "epoch": 1760} {"train_loss": -40.13596725463867, "global_step": 213042, "epoch": 1760} {"train_loss": -42.57378005981445, "global_step": 213043, "epoch": 1760} {"train_loss": -40.371578216552734, "global_step": 213044, "epoch": 1760} {"train_loss": -39.01997756958008, "global_step": 213045, "epoch": 1760} {"train_loss": -40.35403060913086, "global_step": 213046, "epoch": 1760} {"train_loss": -40.87221908569336, "global_step": 213047, "epoch": 1760} {"train_loss": -42.115535736083984, "global_step": 213048, "epoch": 1760} {"train_loss": -39.57109451293945, "global_step": 213049, "epoch": 1760} {"train_loss": -40.09836959838867, "global_step": 213050, "epoch": 1760} {"train_loss": -40.849945068359375, "global_step": 213051, "epoch": 1760} {"train_loss": -40.98467254638672, "global_step": 213052, "epoch": 1760} {"train_loss": -41.58144760131836, "global_step": 213053, "epoch": 1760} {"train_loss": -41.7722282409668, "global_step": 213054, "epoch": 1760} {"train_loss": -41.31496810913086, "global_step": 213055, "epoch": 1760} {"train_loss": -40.69920349121094, "global_step": 213056, "epoch": 1760} {"train_loss": -41.82650375366211, "global_step": 213057, "epoch": 1760} {"train_loss": -41.93451690673828, "global_step": 213058, "epoch": 1760} {"train_loss": -40.81289291381836, "global_step": 213059, "epoch": 1760} {"train_loss": -42.23683547973633, "global_step": 213060, "epoch": 1760} {"train_loss": -41.23887634277344, "global_step": 213061, "epoch": 1760} {"train_loss": -41.77063751220703, "global_step": 213062, "epoch": 1760} {"train_loss": -42.01548767089844, "global_step": 213063, "epoch": 1760} {"train_loss": -42.106319427490234, "global_step": 213064, "epoch": 1760} {"train_loss": -41.02925491333008, "global_step": 213065, "epoch": 1760} {"train_loss": -41.76972579956055, "global_step": 213066, "epoch": 1760} {"train_loss": -41.06986999511719, "global_step": 213067, "epoch": 1760} {"train_loss": -40.314491271972656, "global_step": 213068, "epoch": 1760} {"train_loss": -41.81342315673828, "global_step": 213069, "epoch": 1760} {"train_loss": -41.440860748291016, "global_step": 213070, "epoch": 1760} {"train_loss": -42.11289596557617, "global_step": 213071, "epoch": 1760} {"train_loss": -40.9935417175293, "global_step": 213072, "epoch": 1760} {"train_loss": -40.93646240234375, "global_step": 213073, "epoch": 1760} {"train_loss": -41.828819274902344, "global_step": 213074, "epoch": 1760} {"train_loss": -41.35798263549805, "global_step": 213075, "epoch": 1760} {"train_loss": -41.54572677612305, "global_step": 213076, "epoch": 1760} {"train_loss": -41.710044860839844, "global_step": 213077, "epoch": 1760} {"train_loss": -41.3960075378418, "global_step": 213078, "epoch": 1760} {"train_loss": -41.8843879699707, "global_step": 213079, "epoch": 1760} {"train_loss": -41.606888384858436, "global_step": 213080, "epoch": 1760, "val_loss": 2599902.0} {"train_loss": -41.70029830932617, "global_step": 213081, "epoch": 1761} {"train_loss": -41.75327682495117, "global_step": 213082, "epoch": 1761} {"train_loss": -42.41399002075195, "global_step": 213083, "epoch": 1761} {"train_loss": -41.63756561279297, "global_step": 213084, "epoch": 1761} {"train_loss": -42.10978317260742, "global_step": 213085, "epoch": 1761} {"train_loss": -41.70530319213867, "global_step": 213086, "epoch": 1761} {"train_loss": -41.99209213256836, "global_step": 213087, "epoch": 1761} {"train_loss": -42.07860565185547, "global_step": 213088, "epoch": 1761} {"train_loss": -42.23476791381836, "global_step": 213089, "epoch": 1761} {"train_loss": -42.20561218261719, "global_step": 213090, "epoch": 1761} {"train_loss": -42.131954193115234, "global_step": 213091, "epoch": 1761} {"train_loss": -42.10235595703125, "global_step": 213092, "epoch": 1761} {"train_loss": -42.97095489501953, "global_step": 213093, "epoch": 1761} {"train_loss": -42.22369384765625, "global_step": 213094, "epoch": 1761} {"train_loss": -41.95370101928711, "global_step": 213095, "epoch": 1761} {"train_loss": -42.85341262817383, "global_step": 213096, "epoch": 1761} {"train_loss": -42.68910598754883, "global_step": 213097, "epoch": 1761} {"train_loss": -42.50543975830078, "global_step": 213098, "epoch": 1761} {"train_loss": -40.87938690185547, "global_step": 213099, "epoch": 1761} {"train_loss": -42.262115478515625, "global_step": 213100, "epoch": 1761} {"train_loss": -42.89008331298828, "global_step": 213101, "epoch": 1761} {"train_loss": -42.528499603271484, "global_step": 213102, "epoch": 1761} {"train_loss": -42.23236846923828, "global_step": 213103, "epoch": 1761} {"train_loss": -41.965187072753906, "global_step": 213104, "epoch": 1761} {"train_loss": -41.2534294128418, "global_step": 213105, "epoch": 1761} {"train_loss": -42.7070426940918, "global_step": 213106, "epoch": 1761} {"train_loss": -42.30976486206055, "global_step": 213107, "epoch": 1761} {"train_loss": -41.58599853515625, "global_step": 213108, "epoch": 1761} {"train_loss": -42.86267852783203, "global_step": 213109, "epoch": 1761} {"train_loss": -42.45791244506836, "global_step": 213110, "epoch": 1761} {"train_loss": -42.23081588745117, "global_step": 213111, "epoch": 1761} {"train_loss": -42.94277572631836, "global_step": 213112, "epoch": 1761} {"train_loss": -43.00657272338867, "global_step": 213113, "epoch": 1761} {"train_loss": -42.1852912902832, "global_step": 213114, "epoch": 1761} {"train_loss": -41.84608840942383, "global_step": 213115, "epoch": 1761} {"train_loss": -42.81317901611328, "global_step": 213116, "epoch": 1761} {"train_loss": -42.6900634765625, "global_step": 213117, "epoch": 1761} {"train_loss": -42.73765182495117, "global_step": 213118, "epoch": 1761} {"train_loss": -41.87993621826172, "global_step": 213119, "epoch": 1761} {"train_loss": -40.73322677612305, "global_step": 213120, "epoch": 1761} {"train_loss": -42.52488327026367, "global_step": 213121, "epoch": 1761} {"train_loss": -42.82181930541992, "global_step": 213122, "epoch": 1761} {"train_loss": -41.97613525390625, "global_step": 213123, "epoch": 1761} {"train_loss": -39.93486404418945, "global_step": 213124, "epoch": 1761} {"train_loss": -40.909515380859375, "global_step": 213125, "epoch": 1761} {"train_loss": -41.6933708190918, "global_step": 213126, "epoch": 1761} {"train_loss": -41.5838623046875, "global_step": 213127, "epoch": 1761} {"train_loss": -41.807350158691406, "global_step": 213128, "epoch": 1761} {"train_loss": -42.452728271484375, "global_step": 213129, "epoch": 1761} {"train_loss": -42.569644927978516, "global_step": 213130, "epoch": 1761} {"train_loss": -42.20569610595703, "global_step": 213131, "epoch": 1761} {"train_loss": -41.79201889038086, "global_step": 213132, "epoch": 1761} {"train_loss": -42.366050720214844, "global_step": 213133, "epoch": 1761} {"train_loss": -42.39495849609375, "global_step": 213134, "epoch": 1761} {"train_loss": -41.59055709838867, "global_step": 213135, "epoch": 1761} {"train_loss": -41.50368881225586, "global_step": 213136, "epoch": 1761} {"train_loss": -42.24372482299805, "global_step": 213137, "epoch": 1761} {"train_loss": -41.91377639770508, "global_step": 213138, "epoch": 1761} {"train_loss": -40.440521240234375, "global_step": 213139, "epoch": 1761} {"train_loss": -40.422576904296875, "global_step": 213140, "epoch": 1761} {"train_loss": -42.421348571777344, "global_step": 213141, "epoch": 1761} {"train_loss": -41.07877731323242, "global_step": 213142, "epoch": 1761} {"train_loss": -39.649330139160156, "global_step": 213143, "epoch": 1761} {"train_loss": -41.648765563964844, "global_step": 213144, "epoch": 1761} {"train_loss": -40.908504486083984, "global_step": 213145, "epoch": 1761} {"train_loss": -40.97065353393555, "global_step": 213146, "epoch": 1761} {"train_loss": -40.39614486694336, "global_step": 213147, "epoch": 1761} {"train_loss": -40.08698654174805, "global_step": 213148, "epoch": 1761} {"train_loss": -41.314918518066406, "global_step": 213149, "epoch": 1761} {"train_loss": -39.30760192871094, "global_step": 213150, "epoch": 1761} {"train_loss": -41.24116897583008, "global_step": 213151, "epoch": 1761} {"train_loss": -38.32666778564453, "global_step": 213152, "epoch": 1761} {"train_loss": -40.821327209472656, "global_step": 213153, "epoch": 1761} {"train_loss": -38.71537780761719, "global_step": 213154, "epoch": 1761} {"train_loss": -41.200721740722656, "global_step": 213155, "epoch": 1761} {"train_loss": -37.8071403503418, "global_step": 213156, "epoch": 1761} {"train_loss": -41.3985481262207, "global_step": 213157, "epoch": 1761} {"train_loss": -38.34630584716797, "global_step": 213158, "epoch": 1761} {"train_loss": -40.07637405395508, "global_step": 213159, "epoch": 1761} {"train_loss": -39.12961959838867, "global_step": 213160, "epoch": 1761} {"train_loss": -40.625240325927734, "global_step": 213161, "epoch": 1761} {"train_loss": -39.35090255737305, "global_step": 213162, "epoch": 1761} {"train_loss": -41.16011428833008, "global_step": 213163, "epoch": 1761} {"train_loss": -38.60966873168945, "global_step": 213164, "epoch": 1761} {"train_loss": -40.86021423339844, "global_step": 213165, "epoch": 1761} {"train_loss": -39.45539474487305, "global_step": 213166, "epoch": 1761} {"train_loss": -41.10667419433594, "global_step": 213167, "epoch": 1761} {"train_loss": -39.05181884765625, "global_step": 213168, "epoch": 1761} {"train_loss": -40.77394485473633, "global_step": 213169, "epoch": 1761} {"train_loss": -39.98222351074219, "global_step": 213170, "epoch": 1761} {"train_loss": -40.504764556884766, "global_step": 213171, "epoch": 1761} {"train_loss": -40.7852668762207, "global_step": 213172, "epoch": 1761} {"train_loss": -40.870765686035156, "global_step": 213173, "epoch": 1761} {"train_loss": -41.62944412231445, "global_step": 213174, "epoch": 1761} {"train_loss": -40.57016372680664, "global_step": 213175, "epoch": 1761} {"train_loss": -42.23796081542969, "global_step": 213176, "epoch": 1761} {"train_loss": -41.1925163269043, "global_step": 213177, "epoch": 1761} {"train_loss": -42.03730392456055, "global_step": 213178, "epoch": 1761} {"train_loss": -40.85028076171875, "global_step": 213179, "epoch": 1761} {"train_loss": -41.54643630981445, "global_step": 213180, "epoch": 1761} {"train_loss": -41.302894592285156, "global_step": 213181, "epoch": 1761} {"train_loss": -42.0394172668457, "global_step": 213182, "epoch": 1761} {"train_loss": -41.702022552490234, "global_step": 213183, "epoch": 1761} {"train_loss": -41.89522171020508, "global_step": 213184, "epoch": 1761} {"train_loss": -41.47134017944336, "global_step": 213185, "epoch": 1761} {"train_loss": -42.14063262939453, "global_step": 213186, "epoch": 1761} {"train_loss": -42.13920974731445, "global_step": 213187, "epoch": 1761} {"train_loss": -42.42314147949219, "global_step": 213188, "epoch": 1761} {"train_loss": -41.68392562866211, "global_step": 213189, "epoch": 1761} {"train_loss": -42.05078887939453, "global_step": 213190, "epoch": 1761} {"train_loss": -42.24844741821289, "global_step": 213191, "epoch": 1761} {"train_loss": -42.364444732666016, "global_step": 213192, "epoch": 1761} {"train_loss": -42.553646087646484, "global_step": 213193, "epoch": 1761} {"train_loss": -42.40176773071289, "global_step": 213194, "epoch": 1761} {"train_loss": -42.46451950073242, "global_step": 213195, "epoch": 1761} {"train_loss": -42.38631820678711, "global_step": 213196, "epoch": 1761} {"train_loss": -42.19685745239258, "global_step": 213197, "epoch": 1761} {"train_loss": -42.55906295776367, "global_step": 213198, "epoch": 1761} {"train_loss": -42.37638473510742, "global_step": 213199, "epoch": 1761} {"train_loss": -42.8202018737793, "global_step": 213200, "epoch": 1761} {"train_loss": -41.54719565525528, "global_step": 213201, "epoch": 1761, "val_loss": 2488797.75} {"train_loss": -42.859100341796875, "global_step": 213202, "epoch": 1762} {"train_loss": -41.93058395385742, "global_step": 213203, "epoch": 1762} {"train_loss": -42.19903564453125, "global_step": 213204, "epoch": 1762} {"train_loss": -41.48270797729492, "global_step": 213205, "epoch": 1762} {"train_loss": -42.645572662353516, "global_step": 213206, "epoch": 1762} {"train_loss": -42.5211067199707, "global_step": 213207, "epoch": 1762} {"train_loss": -42.5584602355957, "global_step": 213208, "epoch": 1762} {"train_loss": -42.83369064331055, "global_step": 213209, "epoch": 1762} {"train_loss": -43.01750564575195, "global_step": 213210, "epoch": 1762} {"train_loss": -43.02781295776367, "global_step": 213211, "epoch": 1762} {"train_loss": -42.91898727416992, "global_step": 213212, "epoch": 1762} {"train_loss": -42.812252044677734, "global_step": 213213, "epoch": 1762} {"train_loss": -43.118099212646484, "global_step": 213214, "epoch": 1762} {"train_loss": -42.71700668334961, "global_step": 213215, "epoch": 1762} {"train_loss": -42.35563278198242, "global_step": 213216, "epoch": 1762} {"train_loss": -42.98357009887695, "global_step": 213217, "epoch": 1762} {"train_loss": -42.66703414916992, "global_step": 213218, "epoch": 1762} {"train_loss": -42.32650375366211, "global_step": 213219, "epoch": 1762} {"train_loss": -40.54263687133789, "global_step": 213220, "epoch": 1762} {"train_loss": -41.00136947631836, "global_step": 213221, "epoch": 1762} {"train_loss": -41.956199645996094, "global_step": 213222, "epoch": 1762} {"train_loss": -43.20584487915039, "global_step": 213223, "epoch": 1762} {"train_loss": -42.0751953125, "global_step": 213224, "epoch": 1762} {"train_loss": -40.78493881225586, "global_step": 213225, "epoch": 1762} {"train_loss": -41.54671859741211, "global_step": 213226, "epoch": 1762} {"train_loss": -42.969234466552734, "global_step": 213227, "epoch": 1762} {"train_loss": -41.108543395996094, "global_step": 213228, "epoch": 1762} {"train_loss": -38.75960922241211, "global_step": 213229, "epoch": 1762} {"train_loss": -38.45356369018555, "global_step": 213230, "epoch": 1762} {"train_loss": -41.0721435546875, "global_step": 213231, "epoch": 1762} {"train_loss": -41.755062103271484, "global_step": 213232, "epoch": 1762} {"train_loss": -39.65863800048828, "global_step": 213233, "epoch": 1762} {"train_loss": -41.06754684448242, "global_step": 213234, "epoch": 1762} {"train_loss": -42.90032958984375, "global_step": 213235, "epoch": 1762} {"train_loss": -41.28756332397461, "global_step": 213236, "epoch": 1762} {"train_loss": -38.62451934814453, "global_step": 213237, "epoch": 1762} {"train_loss": -41.91408920288086, "global_step": 213238, "epoch": 1762} {"train_loss": -38.384334564208984, "global_step": 213239, "epoch": 1762} {"train_loss": -40.147743225097656, "global_step": 213240, "epoch": 1762} {"train_loss": -41.6528434753418, "global_step": 213241, "epoch": 1762} {"train_loss": -40.7326774597168, "global_step": 213242, "epoch": 1762} {"train_loss": -41.6883544921875, "global_step": 213243, "epoch": 1762} {"train_loss": -40.62673568725586, "global_step": 213244, "epoch": 1762} {"train_loss": -42.48909378051758, "global_step": 213245, "epoch": 1762} {"train_loss": -40.426422119140625, "global_step": 213246, "epoch": 1762} {"train_loss": -39.965911865234375, "global_step": 213247, "epoch": 1762} {"train_loss": -40.028987884521484, "global_step": 213248, "epoch": 1762} {"train_loss": -40.25654983520508, "global_step": 213249, "epoch": 1762} {"train_loss": -41.3368034362793, "global_step": 213250, "epoch": 1762} {"train_loss": -39.15806579589844, "global_step": 213251, "epoch": 1762} {"train_loss": -40.266578674316406, "global_step": 213252, "epoch": 1762} {"train_loss": -41.4051399230957, "global_step": 213253, "epoch": 1762} {"train_loss": -39.12771224975586, "global_step": 213254, "epoch": 1762} {"train_loss": -40.17231369018555, "global_step": 213255, "epoch": 1762} {"train_loss": -41.563968658447266, "global_step": 213256, "epoch": 1762} {"train_loss": -40.4228630065918, "global_step": 213257, "epoch": 1762} {"train_loss": -40.155616760253906, "global_step": 213258, "epoch": 1762} {"train_loss": -40.57715606689453, "global_step": 213259, "epoch": 1762} {"train_loss": -39.97671127319336, "global_step": 213260, "epoch": 1762} {"train_loss": -40.037635803222656, "global_step": 213261, "epoch": 1762} {"train_loss": -40.0137825012207, "global_step": 213262, "epoch": 1762} {"train_loss": -40.99973678588867, "global_step": 213263, "epoch": 1762} {"train_loss": -40.58224105834961, "global_step": 213264, "epoch": 1762} {"train_loss": -41.56132888793945, "global_step": 213265, "epoch": 1762} {"train_loss": -39.91493606567383, "global_step": 213266, "epoch": 1762} {"train_loss": -41.149024963378906, "global_step": 213267, "epoch": 1762} {"train_loss": -41.40032196044922, "global_step": 213268, "epoch": 1762} {"train_loss": -40.76752471923828, "global_step": 213269, "epoch": 1762} {"train_loss": -40.6983757019043, "global_step": 213270, "epoch": 1762} {"train_loss": -41.68900680541992, "global_step": 213271, "epoch": 1762} {"train_loss": -42.09347152709961, "global_step": 213272, "epoch": 1762} {"train_loss": -41.909210205078125, "global_step": 213273, "epoch": 1762} {"train_loss": -41.296199798583984, "global_step": 213274, "epoch": 1762} {"train_loss": -41.91339111328125, "global_step": 213275, "epoch": 1762} {"train_loss": -41.51515579223633, "global_step": 213276, "epoch": 1762} {"train_loss": -41.54056930541992, "global_step": 213277, "epoch": 1762} {"train_loss": -41.71883010864258, "global_step": 213278, "epoch": 1762} {"train_loss": -41.65525436401367, "global_step": 213279, "epoch": 1762} {"train_loss": -41.45738220214844, "global_step": 213280, "epoch": 1762} {"train_loss": -40.93697738647461, "global_step": 213281, "epoch": 1762} {"train_loss": -41.88531494140625, "global_step": 213282, "epoch": 1762} {"train_loss": -42.09318161010742, "global_step": 213283, "epoch": 1762} {"train_loss": -42.133975982666016, "global_step": 213284, "epoch": 1762} {"train_loss": -42.45893859863281, "global_step": 213285, "epoch": 1762} {"train_loss": -41.797401428222656, "global_step": 213286, "epoch": 1762} {"train_loss": -41.615840911865234, "global_step": 213287, "epoch": 1762} {"train_loss": -41.111549377441406, "global_step": 213288, "epoch": 1762} {"train_loss": -41.05181884765625, "global_step": 213289, "epoch": 1762} {"train_loss": -42.0265007019043, "global_step": 213290, "epoch": 1762} {"train_loss": -41.46202087402344, "global_step": 213291, "epoch": 1762} {"train_loss": -41.28879165649414, "global_step": 213292, "epoch": 1762} {"train_loss": -41.068519592285156, "global_step": 213293, "epoch": 1762} {"train_loss": -42.16864013671875, "global_step": 213294, "epoch": 1762} {"train_loss": -41.05173873901367, "global_step": 213295, "epoch": 1762} {"train_loss": -40.63456344604492, "global_step": 213296, "epoch": 1762} {"train_loss": -42.30232620239258, "global_step": 213297, "epoch": 1762} {"train_loss": -40.94253158569336, "global_step": 213298, "epoch": 1762} {"train_loss": -41.46748352050781, "global_step": 213299, "epoch": 1762} {"train_loss": -41.75027084350586, "global_step": 213300, "epoch": 1762} {"train_loss": -42.7176399230957, "global_step": 213301, "epoch": 1762} {"train_loss": -41.682987213134766, "global_step": 213302, "epoch": 1762} {"train_loss": -42.372833251953125, "global_step": 213303, "epoch": 1762} {"train_loss": -42.66497802734375, "global_step": 213304, "epoch": 1762} {"train_loss": -42.5147590637207, "global_step": 213305, "epoch": 1762} {"train_loss": -42.53059768676758, "global_step": 213306, "epoch": 1762} {"train_loss": -42.34917449951172, "global_step": 213307, "epoch": 1762} {"train_loss": -42.71977996826172, "global_step": 213308, "epoch": 1762} {"train_loss": -42.83583450317383, "global_step": 213309, "epoch": 1762} {"train_loss": -42.3372917175293, "global_step": 213310, "epoch": 1762} {"train_loss": -41.89282989501953, "global_step": 213311, "epoch": 1762} {"train_loss": -41.492916107177734, "global_step": 213312, "epoch": 1762} {"train_loss": -41.44579315185547, "global_step": 213313, "epoch": 1762} {"train_loss": -41.55617141723633, "global_step": 213314, "epoch": 1762} {"train_loss": -40.08661651611328, "global_step": 213315, "epoch": 1762} {"train_loss": -41.2795524597168, "global_step": 213316, "epoch": 1762} {"train_loss": -41.316856384277344, "global_step": 213317, "epoch": 1762} {"train_loss": -42.449615478515625, "global_step": 213318, "epoch": 1762} {"train_loss": -42.33012771606445, "global_step": 213319, "epoch": 1762} {"train_loss": -40.819976806640625, "global_step": 213320, "epoch": 1762} {"train_loss": -41.288970947265625, "global_step": 213321, "epoch": 1762} {"train_loss": -41.45486484874379, "global_step": 213322, "epoch": 1762, "val_loss": 2541176.75} {"train_loss": -41.81202697753906, "global_step": 213323, "epoch": 1763} {"train_loss": -38.943206787109375, "global_step": 213324, "epoch": 1763} {"train_loss": -40.14026641845703, "global_step": 213325, "epoch": 1763} {"train_loss": -41.39089584350586, "global_step": 213326, "epoch": 1763} {"train_loss": -40.67287826538086, "global_step": 213327, "epoch": 1763} {"train_loss": -40.7867317199707, "global_step": 213328, "epoch": 1763} {"train_loss": -41.809814453125, "global_step": 213329, "epoch": 1763} {"train_loss": -40.77743148803711, "global_step": 213330, "epoch": 1763} {"train_loss": -41.23854446411133, "global_step": 213331, "epoch": 1763} {"train_loss": -41.94160461425781, "global_step": 213332, "epoch": 1763} {"train_loss": -39.82136917114258, "global_step": 213333, "epoch": 1763} {"train_loss": -42.512977600097656, "global_step": 213334, "epoch": 1763} {"train_loss": -39.599609375, "global_step": 213335, "epoch": 1763} {"train_loss": -42.09661865234375, "global_step": 213336, "epoch": 1763} {"train_loss": -42.41019821166992, "global_step": 213337, "epoch": 1763} {"train_loss": -40.59298324584961, "global_step": 213338, "epoch": 1763} {"train_loss": -42.449737548828125, "global_step": 213339, "epoch": 1763} {"train_loss": -41.12176513671875, "global_step": 213340, "epoch": 1763} {"train_loss": -42.02379608154297, "global_step": 213341, "epoch": 1763} {"train_loss": -43.00221633911133, "global_step": 213342, "epoch": 1763} {"train_loss": -42.08390426635742, "global_step": 213343, "epoch": 1763} {"train_loss": -42.02030563354492, "global_step": 213344, "epoch": 1763} {"train_loss": -42.16262435913086, "global_step": 213345, "epoch": 1763} {"train_loss": -42.173919677734375, "global_step": 213346, "epoch": 1763} {"train_loss": -41.42855453491211, "global_step": 213347, "epoch": 1763} {"train_loss": -42.0953254699707, "global_step": 213348, "epoch": 1763} {"train_loss": -42.570980072021484, "global_step": 213349, "epoch": 1763} {"train_loss": -40.42782211303711, "global_step": 213350, "epoch": 1763} {"train_loss": -42.00751495361328, "global_step": 213351, "epoch": 1763} {"train_loss": -41.96442794799805, "global_step": 213352, "epoch": 1763} {"train_loss": -41.06219482421875, "global_step": 213353, "epoch": 1763} {"train_loss": -41.44792938232422, "global_step": 213354, "epoch": 1763} {"train_loss": -41.11668014526367, "global_step": 213355, "epoch": 1763} {"train_loss": -40.90407943725586, "global_step": 213356, "epoch": 1763} {"train_loss": -42.32108688354492, "global_step": 213357, "epoch": 1763} {"train_loss": -41.015201568603516, "global_step": 213358, "epoch": 1763} {"train_loss": -39.575565338134766, "global_step": 213359, "epoch": 1763} {"train_loss": -40.19401931762695, "global_step": 213360, "epoch": 1763} {"train_loss": -41.83480453491211, "global_step": 213361, "epoch": 1763} {"train_loss": -41.724544525146484, "global_step": 213362, "epoch": 1763} {"train_loss": -41.00325012207031, "global_step": 213363, "epoch": 1763} {"train_loss": -41.8435173034668, "global_step": 213364, "epoch": 1763} {"train_loss": -42.21509552001953, "global_step": 213365, "epoch": 1763} {"train_loss": -40.76070785522461, "global_step": 213366, "epoch": 1763} {"train_loss": -42.42306900024414, "global_step": 213367, "epoch": 1763} {"train_loss": -41.384620666503906, "global_step": 213368, "epoch": 1763} {"train_loss": -42.33445358276367, "global_step": 213369, "epoch": 1763} {"train_loss": -41.496368408203125, "global_step": 213370, "epoch": 1763} {"train_loss": -41.67660140991211, "global_step": 213371, "epoch": 1763} {"train_loss": -42.48102569580078, "global_step": 213372, "epoch": 1763} {"train_loss": -42.01220703125, "global_step": 213373, "epoch": 1763} {"train_loss": -42.15789031982422, "global_step": 213374, "epoch": 1763} {"train_loss": -41.601478576660156, "global_step": 213375, "epoch": 1763} {"train_loss": -41.30976486206055, "global_step": 213376, "epoch": 1763} {"train_loss": -42.53558349609375, "global_step": 213377, "epoch": 1763} {"train_loss": -41.41457748413086, "global_step": 213378, "epoch": 1763} {"train_loss": -42.09627914428711, "global_step": 213379, "epoch": 1763} {"train_loss": -42.112308502197266, "global_step": 213380, "epoch": 1763} {"train_loss": -42.056724548339844, "global_step": 213381, "epoch": 1763} {"train_loss": -41.367340087890625, "global_step": 213382, "epoch": 1763} {"train_loss": -42.53877639770508, "global_step": 213383, "epoch": 1763} {"train_loss": -41.427337646484375, "global_step": 213384, "epoch": 1763} {"train_loss": -41.890316009521484, "global_step": 213385, "epoch": 1763} {"train_loss": -42.596492767333984, "global_step": 213386, "epoch": 1763} {"train_loss": -42.403377532958984, "global_step": 213387, "epoch": 1763} {"train_loss": -41.567543029785156, "global_step": 213388, "epoch": 1763} {"train_loss": -42.23687744140625, "global_step": 213389, "epoch": 1763} {"train_loss": -42.43684387207031, "global_step": 213390, "epoch": 1763} {"train_loss": -42.16716766357422, "global_step": 213391, "epoch": 1763} {"train_loss": -42.53615951538086, "global_step": 213392, "epoch": 1763} {"train_loss": -41.5215950012207, "global_step": 213393, "epoch": 1763} {"train_loss": -42.737117767333984, "global_step": 213394, "epoch": 1763} {"train_loss": -43.028656005859375, "global_step": 213395, "epoch": 1763} {"train_loss": -41.73371505737305, "global_step": 213396, "epoch": 1763} {"train_loss": -42.906158447265625, "global_step": 213397, "epoch": 1763} {"train_loss": -43.029842376708984, "global_step": 213398, "epoch": 1763} {"train_loss": -42.928871154785156, "global_step": 213399, "epoch": 1763} {"train_loss": -42.870574951171875, "global_step": 213400, "epoch": 1763} {"train_loss": -42.10836410522461, "global_step": 213401, "epoch": 1763} {"train_loss": -42.61524963378906, "global_step": 213402, "epoch": 1763} {"train_loss": -42.6505241394043, "global_step": 213403, "epoch": 1763} {"train_loss": -41.7972297668457, "global_step": 213404, "epoch": 1763} {"train_loss": -42.348785400390625, "global_step": 213405, "epoch": 1763} {"train_loss": -41.82882308959961, "global_step": 213406, "epoch": 1763} {"train_loss": -42.34263229370117, "global_step": 213407, "epoch": 1763} {"train_loss": -42.206024169921875, "global_step": 213408, "epoch": 1763} {"train_loss": -42.377357482910156, "global_step": 213409, "epoch": 1763} {"train_loss": -41.103572845458984, "global_step": 213410, "epoch": 1763} {"train_loss": -41.69032669067383, "global_step": 213411, "epoch": 1763} {"train_loss": -42.73698806762695, "global_step": 213412, "epoch": 1763} {"train_loss": -41.774410247802734, "global_step": 213413, "epoch": 1763} {"train_loss": -40.473663330078125, "global_step": 213414, "epoch": 1763} {"train_loss": -39.2739143371582, "global_step": 213415, "epoch": 1763} {"train_loss": -43.095550537109375, "global_step": 213416, "epoch": 1763} {"train_loss": -42.0291862487793, "global_step": 213417, "epoch": 1763} {"train_loss": -41.16401290893555, "global_step": 213418, "epoch": 1763} {"train_loss": -41.857879638671875, "global_step": 213419, "epoch": 1763} {"train_loss": -41.78779220581055, "global_step": 213420, "epoch": 1763} {"train_loss": -39.92920684814453, "global_step": 213421, "epoch": 1763} {"train_loss": -40.1881217956543, "global_step": 213422, "epoch": 1763} {"train_loss": -41.119625091552734, "global_step": 213423, "epoch": 1763} {"train_loss": -41.01593017578125, "global_step": 213424, "epoch": 1763} {"train_loss": -42.48166275024414, "global_step": 213425, "epoch": 1763} {"train_loss": -41.78556823730469, "global_step": 213426, "epoch": 1763} {"train_loss": -41.98171615600586, "global_step": 213427, "epoch": 1763} {"train_loss": -42.18110656738281, "global_step": 213428, "epoch": 1763} {"train_loss": -42.410762786865234, "global_step": 213429, "epoch": 1763} {"train_loss": -41.78889465332031, "global_step": 213430, "epoch": 1763} {"train_loss": -40.03512191772461, "global_step": 213431, "epoch": 1763} {"train_loss": -41.999385833740234, "global_step": 213432, "epoch": 1763} {"train_loss": -40.96015930175781, "global_step": 213433, "epoch": 1763} {"train_loss": -41.979736328125, "global_step": 213434, "epoch": 1763} {"train_loss": -40.44297409057617, "global_step": 213435, "epoch": 1763} {"train_loss": -42.26639938354492, "global_step": 213436, "epoch": 1763} {"train_loss": -41.78450012207031, "global_step": 213437, "epoch": 1763} {"train_loss": -41.554779052734375, "global_step": 213438, "epoch": 1763} {"train_loss": -42.31787109375, "global_step": 213439, "epoch": 1763} {"train_loss": -40.972328186035156, "global_step": 213440, "epoch": 1763} {"train_loss": -41.86433029174805, "global_step": 213441, "epoch": 1763} {"train_loss": -41.061798095703125, "global_step": 213442, "epoch": 1763} {"train_loss": -41.69708103778934, "global_step": 213443, "epoch": 1763, "val_loss": 2510275.75} {"train_loss": -42.419517517089844, "global_step": 213444, "epoch": 1764} {"train_loss": -41.313411712646484, "global_step": 213445, "epoch": 1764} {"train_loss": -40.38349533081055, "global_step": 213446, "epoch": 1764} {"train_loss": -42.05064010620117, "global_step": 213447, "epoch": 1764} {"train_loss": -41.34070587158203, "global_step": 213448, "epoch": 1764} {"train_loss": -41.833099365234375, "global_step": 213449, "epoch": 1764} {"train_loss": -40.747657775878906, "global_step": 213450, "epoch": 1764} {"train_loss": -41.531089782714844, "global_step": 213451, "epoch": 1764} {"train_loss": -41.003902435302734, "global_step": 213452, "epoch": 1764} {"train_loss": -42.27933883666992, "global_step": 213453, "epoch": 1764} {"train_loss": -41.419368743896484, "global_step": 213454, "epoch": 1764} {"train_loss": -41.700199127197266, "global_step": 213455, "epoch": 1764} {"train_loss": -41.43986892700195, "global_step": 213456, "epoch": 1764} {"train_loss": -42.17112731933594, "global_step": 213457, "epoch": 1764} {"train_loss": -41.62952423095703, "global_step": 213458, "epoch": 1764} {"train_loss": -42.08856964111328, "global_step": 213459, "epoch": 1764} {"train_loss": -41.088191986083984, "global_step": 213460, "epoch": 1764} {"train_loss": -42.967472076416016, "global_step": 213461, "epoch": 1764} {"train_loss": -41.297607421875, "global_step": 213462, "epoch": 1764} {"train_loss": -42.68709182739258, "global_step": 213463, "epoch": 1764} {"train_loss": -41.775447845458984, "global_step": 213464, "epoch": 1764} {"train_loss": -42.232322692871094, "global_step": 213465, "epoch": 1764} {"train_loss": -42.78792190551758, "global_step": 213466, "epoch": 1764} {"train_loss": -42.42152404785156, "global_step": 213467, "epoch": 1764} {"train_loss": -42.630550384521484, "global_step": 213468, "epoch": 1764} {"train_loss": -42.295894622802734, "global_step": 213469, "epoch": 1764} {"train_loss": -41.77085876464844, "global_step": 213470, "epoch": 1764} {"train_loss": -42.96714401245117, "global_step": 213471, "epoch": 1764} {"train_loss": -42.75679397583008, "global_step": 213472, "epoch": 1764} {"train_loss": -41.506752014160156, "global_step": 213473, "epoch": 1764} {"train_loss": -42.61555099487305, "global_step": 213474, "epoch": 1764} {"train_loss": -40.76742172241211, "global_step": 213475, "epoch": 1764} {"train_loss": -41.603858947753906, "global_step": 213476, "epoch": 1764} {"train_loss": -41.94407272338867, "global_step": 213477, "epoch": 1764} {"train_loss": -42.27774429321289, "global_step": 213478, "epoch": 1764} {"train_loss": -42.81441116333008, "global_step": 213479, "epoch": 1764} {"train_loss": -42.76274490356445, "global_step": 213480, "epoch": 1764} {"train_loss": -39.686607360839844, "global_step": 213481, "epoch": 1764} {"train_loss": -42.52199935913086, "global_step": 213482, "epoch": 1764} {"train_loss": -42.216678619384766, "global_step": 213483, "epoch": 1764} {"train_loss": -42.47666931152344, "global_step": 213484, "epoch": 1764} {"train_loss": -41.84833526611328, "global_step": 213485, "epoch": 1764} {"train_loss": -42.448909759521484, "global_step": 213486, "epoch": 1764} {"train_loss": -42.14662170410156, "global_step": 213487, "epoch": 1764} {"train_loss": -40.354888916015625, "global_step": 213488, "epoch": 1764} {"train_loss": -42.16753005981445, "global_step": 213489, "epoch": 1764} {"train_loss": -42.16353225708008, "global_step": 213490, "epoch": 1764} {"train_loss": -43.095314025878906, "global_step": 213491, "epoch": 1764} {"train_loss": -42.20965576171875, "global_step": 213492, "epoch": 1764} {"train_loss": -41.3087272644043, "global_step": 213493, "epoch": 1764} {"train_loss": -40.70435333251953, "global_step": 213494, "epoch": 1764} {"train_loss": -40.73112106323242, "global_step": 213495, "epoch": 1764} {"train_loss": -39.83897399902344, "global_step": 213496, "epoch": 1764} {"train_loss": -41.84182357788086, "global_step": 213497, "epoch": 1764} {"train_loss": -41.299964904785156, "global_step": 213498, "epoch": 1764} {"train_loss": -40.658607482910156, "global_step": 213499, "epoch": 1764} {"train_loss": -39.474891662597656, "global_step": 213500, "epoch": 1764} {"train_loss": -38.400238037109375, "global_step": 213501, "epoch": 1764} {"train_loss": -42.005950927734375, "global_step": 213502, "epoch": 1764} {"train_loss": -41.78072738647461, "global_step": 213503, "epoch": 1764} {"train_loss": -39.04874038696289, "global_step": 213504, "epoch": 1764} {"train_loss": -40.89834213256836, "global_step": 213505, "epoch": 1764} {"train_loss": -40.85032272338867, "global_step": 213506, "epoch": 1764} {"train_loss": -40.6983642578125, "global_step": 213507, "epoch": 1764} {"train_loss": -41.45936965942383, "global_step": 213508, "epoch": 1764} {"train_loss": -41.137718200683594, "global_step": 213509, "epoch": 1764} {"train_loss": -41.82279586791992, "global_step": 213510, "epoch": 1764} {"train_loss": -42.64229965209961, "global_step": 213511, "epoch": 1764} {"train_loss": -41.40227508544922, "global_step": 213512, "epoch": 1764} {"train_loss": -41.7159309387207, "global_step": 213513, "epoch": 1764} {"train_loss": -42.08089065551758, "global_step": 213514, "epoch": 1764} {"train_loss": -42.30437088012695, "global_step": 213515, "epoch": 1764} {"train_loss": -41.17648696899414, "global_step": 213516, "epoch": 1764} {"train_loss": -40.77445983886719, "global_step": 213517, "epoch": 1764} {"train_loss": -42.507266998291016, "global_step": 213518, "epoch": 1764} {"train_loss": -42.17310333251953, "global_step": 213519, "epoch": 1764} {"train_loss": -42.097137451171875, "global_step": 213520, "epoch": 1764} {"train_loss": -42.904266357421875, "global_step": 213521, "epoch": 1764} {"train_loss": -42.162540435791016, "global_step": 213522, "epoch": 1764} {"train_loss": -42.866451263427734, "global_step": 213523, "epoch": 1764} {"train_loss": -41.75413131713867, "global_step": 213524, "epoch": 1764} {"train_loss": -41.2920036315918, "global_step": 213525, "epoch": 1764} {"train_loss": -41.629615783691406, "global_step": 213526, "epoch": 1764} {"train_loss": -42.45894241333008, "global_step": 213527, "epoch": 1764} {"train_loss": -43.102455139160156, "global_step": 213528, "epoch": 1764} {"train_loss": -42.653602600097656, "global_step": 213529, "epoch": 1764} {"train_loss": -42.654300689697266, "global_step": 213530, "epoch": 1764} {"train_loss": -40.70590591430664, "global_step": 213531, "epoch": 1764} {"train_loss": -38.08220291137695, "global_step": 213532, "epoch": 1764} {"train_loss": -42.43717956542969, "global_step": 213533, "epoch": 1764} {"train_loss": -41.122047424316406, "global_step": 213534, "epoch": 1764} {"train_loss": -40.4218635559082, "global_step": 213535, "epoch": 1764} {"train_loss": -41.87538528442383, "global_step": 213536, "epoch": 1764} {"train_loss": -42.06168746948242, "global_step": 213537, "epoch": 1764} {"train_loss": -42.348228454589844, "global_step": 213538, "epoch": 1764} {"train_loss": -42.08422088623047, "global_step": 213539, "epoch": 1764} {"train_loss": -41.6111946105957, "global_step": 213540, "epoch": 1764} {"train_loss": -42.41986846923828, "global_step": 213541, "epoch": 1764} {"train_loss": -42.38654708862305, "global_step": 213542, "epoch": 1764} {"train_loss": -42.21925735473633, "global_step": 213543, "epoch": 1764} {"train_loss": -41.62018585205078, "global_step": 213544, "epoch": 1764} {"train_loss": -42.18052291870117, "global_step": 213545, "epoch": 1764} {"train_loss": -41.73701095581055, "global_step": 213546, "epoch": 1764} {"train_loss": -42.263450622558594, "global_step": 213547, "epoch": 1764} {"train_loss": -40.75541305541992, "global_step": 213548, "epoch": 1764} {"train_loss": -41.98097229003906, "global_step": 213549, "epoch": 1764} {"train_loss": -42.71970748901367, "global_step": 213550, "epoch": 1764} {"train_loss": -42.148651123046875, "global_step": 213551, "epoch": 1764} {"train_loss": -41.56482696533203, "global_step": 213552, "epoch": 1764} {"train_loss": -41.32997512817383, "global_step": 213553, "epoch": 1764} {"train_loss": -42.96718978881836, "global_step": 213554, "epoch": 1764} {"train_loss": -42.263755798339844, "global_step": 213555, "epoch": 1764} {"train_loss": -39.44761276245117, "global_step": 213556, "epoch": 1764} {"train_loss": -41.131324768066406, "global_step": 213557, "epoch": 1764} {"train_loss": -42.60400390625, "global_step": 213558, "epoch": 1764} {"train_loss": -41.28688430786133, "global_step": 213559, "epoch": 1764} {"train_loss": -40.80263900756836, "global_step": 213560, "epoch": 1764} {"train_loss": -41.53676986694336, "global_step": 213561, "epoch": 1764} {"train_loss": -41.7880973815918, "global_step": 213562, "epoch": 1764} {"train_loss": -40.66663360595703, "global_step": 213563, "epoch": 1764} {"train_loss": -41.697085640647195, "global_step": 213564, "epoch": 1764, "val_loss": 2676567.75} {"train_loss": -41.16180419921875, "global_step": 213565, "epoch": 1765} {"train_loss": -40.873661041259766, "global_step": 213566, "epoch": 1765} {"train_loss": -41.22187423706055, "global_step": 213567, "epoch": 1765} {"train_loss": -40.24409866333008, "global_step": 213568, "epoch": 1765} {"train_loss": -41.47819137573242, "global_step": 213569, "epoch": 1765} {"train_loss": -41.17919921875, "global_step": 213570, "epoch": 1765} {"train_loss": -41.324676513671875, "global_step": 213571, "epoch": 1765} {"train_loss": -41.15852355957031, "global_step": 213572, "epoch": 1765} {"train_loss": -40.44307327270508, "global_step": 213573, "epoch": 1765} {"train_loss": -41.893184661865234, "global_step": 213574, "epoch": 1765} {"train_loss": -41.228328704833984, "global_step": 213575, "epoch": 1765} {"train_loss": -41.416194915771484, "global_step": 213576, "epoch": 1765} {"train_loss": -41.72422409057617, "global_step": 213577, "epoch": 1765} {"train_loss": -40.0086784362793, "global_step": 213578, "epoch": 1765} {"train_loss": -40.06480026245117, "global_step": 213579, "epoch": 1765} {"train_loss": -42.39680862426758, "global_step": 213580, "epoch": 1765} {"train_loss": -41.5386848449707, "global_step": 213581, "epoch": 1765} {"train_loss": -41.149044036865234, "global_step": 213582, "epoch": 1765} {"train_loss": -42.67939376831055, "global_step": 213583, "epoch": 1765} {"train_loss": -41.23166275024414, "global_step": 213584, "epoch": 1765} {"train_loss": -41.48142623901367, "global_step": 213585, "epoch": 1765} {"train_loss": -42.190128326416016, "global_step": 213586, "epoch": 1765} {"train_loss": -40.58391189575195, "global_step": 213587, "epoch": 1765} {"train_loss": -42.05328369140625, "global_step": 213588, "epoch": 1765} {"train_loss": -42.185787200927734, "global_step": 213589, "epoch": 1765} {"train_loss": -41.201812744140625, "global_step": 213590, "epoch": 1765} {"train_loss": -42.76499557495117, "global_step": 213591, "epoch": 1765} {"train_loss": -41.34824752807617, "global_step": 213592, "epoch": 1765} {"train_loss": -41.20762252807617, "global_step": 213593, "epoch": 1765} {"train_loss": -41.703208923339844, "global_step": 213594, "epoch": 1765} {"train_loss": -41.693016052246094, "global_step": 213595, "epoch": 1765} {"train_loss": -42.14023971557617, "global_step": 213596, "epoch": 1765} {"train_loss": -41.31528854370117, "global_step": 213597, "epoch": 1765} {"train_loss": -42.454280853271484, "global_step": 213598, "epoch": 1765} {"train_loss": -41.521385192871094, "global_step": 213599, "epoch": 1765} {"train_loss": -42.14900207519531, "global_step": 213600, "epoch": 1765} {"train_loss": -41.807960510253906, "global_step": 213601, "epoch": 1765} {"train_loss": -41.9229850769043, "global_step": 213602, "epoch": 1765} {"train_loss": -42.27503204345703, "global_step": 213603, "epoch": 1765} {"train_loss": -42.001888275146484, "global_step": 213604, "epoch": 1765} {"train_loss": -42.96592330932617, "global_step": 213605, "epoch": 1765} {"train_loss": -42.53995132446289, "global_step": 213606, "epoch": 1765} {"train_loss": -42.74892807006836, "global_step": 213607, "epoch": 1765} {"train_loss": -42.58399200439453, "global_step": 213608, "epoch": 1765} {"train_loss": -42.69395065307617, "global_step": 213609, "epoch": 1765} {"train_loss": -42.00236892700195, "global_step": 213610, "epoch": 1765} {"train_loss": -42.113460540771484, "global_step": 213611, "epoch": 1765} {"train_loss": -42.450801849365234, "global_step": 213612, "epoch": 1765} {"train_loss": -42.501522064208984, "global_step": 213613, "epoch": 1765} {"train_loss": -42.945098876953125, "global_step": 213614, "epoch": 1765} {"train_loss": -41.934814453125, "global_step": 213615, "epoch": 1765} {"train_loss": -43.07070541381836, "global_step": 213616, "epoch": 1765} {"train_loss": -42.970191955566406, "global_step": 213617, "epoch": 1765} {"train_loss": -42.40423583984375, "global_step": 213618, "epoch": 1765} {"train_loss": -42.39386749267578, "global_step": 213619, "epoch": 1765} {"train_loss": -42.996490478515625, "global_step": 213620, "epoch": 1765} {"train_loss": -42.7965202331543, "global_step": 213621, "epoch": 1765} {"train_loss": -43.08787536621094, "global_step": 213622, "epoch": 1765} {"train_loss": -42.47406768798828, "global_step": 213623, "epoch": 1765} {"train_loss": -42.71500778198242, "global_step": 213624, "epoch": 1765} {"train_loss": -42.3143424987793, "global_step": 213625, "epoch": 1765} {"train_loss": -42.07733917236328, "global_step": 213626, "epoch": 1765} {"train_loss": -42.73745346069336, "global_step": 213627, "epoch": 1765} {"train_loss": -42.646297454833984, "global_step": 213628, "epoch": 1765} {"train_loss": -42.728424072265625, "global_step": 213629, "epoch": 1765} {"train_loss": -42.146053314208984, "global_step": 213630, "epoch": 1765} {"train_loss": -42.48145294189453, "global_step": 213631, "epoch": 1765} {"train_loss": -41.54213333129883, "global_step": 213632, "epoch": 1765} {"train_loss": -42.605377197265625, "global_step": 213633, "epoch": 1765} {"train_loss": -43.0579833984375, "global_step": 213634, "epoch": 1765} {"train_loss": -42.498748779296875, "global_step": 213635, "epoch": 1765} {"train_loss": -42.839935302734375, "global_step": 213636, "epoch": 1765} {"train_loss": -42.87313461303711, "global_step": 213637, "epoch": 1765} {"train_loss": -42.50732421875, "global_step": 213638, "epoch": 1765} {"train_loss": -42.89976119995117, "global_step": 213639, "epoch": 1765} {"train_loss": -43.19682693481445, "global_step": 213640, "epoch": 1765} {"train_loss": -43.444297790527344, "global_step": 213641, "epoch": 1765} {"train_loss": -43.27797317504883, "global_step": 213642, "epoch": 1765} {"train_loss": -42.60537338256836, "global_step": 213643, "epoch": 1765} {"train_loss": -42.80680465698242, "global_step": 213644, "epoch": 1765} {"train_loss": -43.15592575073242, "global_step": 213645, "epoch": 1765} {"train_loss": -42.31367874145508, "global_step": 213646, "epoch": 1765} {"train_loss": -42.072139739990234, "global_step": 213647, "epoch": 1765} {"train_loss": -40.8232536315918, "global_step": 213648, "epoch": 1765} {"train_loss": -41.22808074951172, "global_step": 213649, "epoch": 1765} {"train_loss": -39.70132064819336, "global_step": 213650, "epoch": 1765} {"train_loss": -42.18031311035156, "global_step": 213651, "epoch": 1765} {"train_loss": -42.53982925415039, "global_step": 213652, "epoch": 1765} {"train_loss": -41.740230560302734, "global_step": 213653, "epoch": 1765} {"train_loss": -40.242244720458984, "global_step": 213654, "epoch": 1765} {"train_loss": -39.803077697753906, "global_step": 213655, "epoch": 1765} {"train_loss": -42.30439376831055, "global_step": 213656, "epoch": 1765} {"train_loss": -38.82343292236328, "global_step": 213657, "epoch": 1765} {"train_loss": -39.728267669677734, "global_step": 213658, "epoch": 1765} {"train_loss": -40.84449005126953, "global_step": 213659, "epoch": 1765} {"train_loss": -38.05884552001953, "global_step": 213660, "epoch": 1765} {"train_loss": -39.88628005981445, "global_step": 213661, "epoch": 1765} {"train_loss": -37.98298263549805, "global_step": 213662, "epoch": 1765} {"train_loss": -36.415985107421875, "global_step": 213663, "epoch": 1765} {"train_loss": -37.07861328125, "global_step": 213664, "epoch": 1765} {"train_loss": -38.075931549072266, "global_step": 213665, "epoch": 1765} {"train_loss": -38.35335159301758, "global_step": 213666, "epoch": 1765} {"train_loss": -37.66000747680664, "global_step": 213667, "epoch": 1765} {"train_loss": -38.6524543762207, "global_step": 213668, "epoch": 1765} {"train_loss": -36.913612365722656, "global_step": 213669, "epoch": 1765} {"train_loss": -39.02715301513672, "global_step": 213670, "epoch": 1765} {"train_loss": -37.72629928588867, "global_step": 213671, "epoch": 1765} {"train_loss": -39.122283935546875, "global_step": 213672, "epoch": 1765} {"train_loss": -39.04823684692383, "global_step": 213673, "epoch": 1765} {"train_loss": -40.94469451904297, "global_step": 213674, "epoch": 1765} {"train_loss": -40.657894134521484, "global_step": 213675, "epoch": 1765} {"train_loss": -41.13715744018555, "global_step": 213676, "epoch": 1765} {"train_loss": -40.30631637573242, "global_step": 213677, "epoch": 1765} {"train_loss": -40.577693939208984, "global_step": 213678, "epoch": 1765} {"train_loss": -41.52295684814453, "global_step": 213679, "epoch": 1765} {"train_loss": -40.87852096557617, "global_step": 213680, "epoch": 1765} {"train_loss": -41.61385726928711, "global_step": 213681, "epoch": 1765} {"train_loss": -40.0005989074707, "global_step": 213682, "epoch": 1765} {"train_loss": -41.7181396484375, "global_step": 213683, "epoch": 1765} {"train_loss": -41.00640869140625, "global_step": 213684, "epoch": 1765} {"train_loss": -41.40110340591305, "global_step": 213685, "epoch": 1765, "val_loss": 2552393.75} {"train_loss": -40.214107513427734, "global_step": 213686, "epoch": 1766} {"train_loss": -40.8883171081543, "global_step": 213687, "epoch": 1766} {"train_loss": -40.44416427612305, "global_step": 213688, "epoch": 1766} {"train_loss": -41.72317886352539, "global_step": 213689, "epoch": 1766} {"train_loss": -40.81051254272461, "global_step": 213690, "epoch": 1766} {"train_loss": -41.394020080566406, "global_step": 213691, "epoch": 1766} {"train_loss": -40.822322845458984, "global_step": 213692, "epoch": 1766} {"train_loss": -39.94890594482422, "global_step": 213693, "epoch": 1766} {"train_loss": -42.513160705566406, "global_step": 213694, "epoch": 1766} {"train_loss": -41.08434295654297, "global_step": 213695, "epoch": 1766} {"train_loss": -42.57343292236328, "global_step": 213696, "epoch": 1766} {"train_loss": -40.157318115234375, "global_step": 213697, "epoch": 1766} {"train_loss": -41.52512741088867, "global_step": 213698, "epoch": 1766} {"train_loss": -41.20013427734375, "global_step": 213699, "epoch": 1766} {"train_loss": -42.229061126708984, "global_step": 213700, "epoch": 1766} {"train_loss": -40.264991760253906, "global_step": 213701, "epoch": 1766} {"train_loss": -40.67939376831055, "global_step": 213702, "epoch": 1766} {"train_loss": -41.228248596191406, "global_step": 213703, "epoch": 1766} {"train_loss": -41.3434944152832, "global_step": 213704, "epoch": 1766} {"train_loss": -39.04608917236328, "global_step": 213705, "epoch": 1766} {"train_loss": -41.7086296081543, "global_step": 213706, "epoch": 1766} {"train_loss": -40.12984085083008, "global_step": 213707, "epoch": 1766} {"train_loss": -39.162349700927734, "global_step": 213708, "epoch": 1766} {"train_loss": -42.36613845825195, "global_step": 213709, "epoch": 1766} {"train_loss": -40.31458282470703, "global_step": 213710, "epoch": 1766} {"train_loss": -41.06682205200195, "global_step": 213711, "epoch": 1766} {"train_loss": -42.70293045043945, "global_step": 213712, "epoch": 1766} {"train_loss": -40.178585052490234, "global_step": 213713, "epoch": 1766} {"train_loss": -42.450679779052734, "global_step": 213714, "epoch": 1766} {"train_loss": -41.429195404052734, "global_step": 213715, "epoch": 1766} {"train_loss": -41.158931732177734, "global_step": 213716, "epoch": 1766} {"train_loss": -42.180259704589844, "global_step": 213717, "epoch": 1766} {"train_loss": -40.565155029296875, "global_step": 213718, "epoch": 1766} {"train_loss": -42.01503372192383, "global_step": 213719, "epoch": 1766} {"train_loss": -41.07865524291992, "global_step": 213720, "epoch": 1766} {"train_loss": -42.72978591918945, "global_step": 213721, "epoch": 1766} {"train_loss": -41.66556930541992, "global_step": 213722, "epoch": 1766} {"train_loss": -43.025550842285156, "global_step": 213723, "epoch": 1766} {"train_loss": -41.38904571533203, "global_step": 213724, "epoch": 1766} {"train_loss": -42.85519027709961, "global_step": 213725, "epoch": 1766} {"train_loss": -42.39651107788086, "global_step": 213726, "epoch": 1766} {"train_loss": -42.71197509765625, "global_step": 213727, "epoch": 1766} {"train_loss": -42.33526611328125, "global_step": 213728, "epoch": 1766} {"train_loss": -42.377071380615234, "global_step": 213729, "epoch": 1766} {"train_loss": -42.70005416870117, "global_step": 213730, "epoch": 1766} {"train_loss": -42.69746398925781, "global_step": 213731, "epoch": 1766} {"train_loss": -42.78655242919922, "global_step": 213732, "epoch": 1766} {"train_loss": -42.64036178588867, "global_step": 213733, "epoch": 1766} {"train_loss": -42.57118606567383, "global_step": 213734, "epoch": 1766} {"train_loss": -42.21857833862305, "global_step": 213735, "epoch": 1766} {"train_loss": -42.83293151855469, "global_step": 213736, "epoch": 1766} {"train_loss": -41.964324951171875, "global_step": 213737, "epoch": 1766} {"train_loss": -42.4581413269043, "global_step": 213738, "epoch": 1766} {"train_loss": -43.02238082885742, "global_step": 213739, "epoch": 1766} {"train_loss": -42.95361328125, "global_step": 213740, "epoch": 1766} {"train_loss": -42.2882080078125, "global_step": 213741, "epoch": 1766} {"train_loss": -42.86411666870117, "global_step": 213742, "epoch": 1766} {"train_loss": -42.01593017578125, "global_step": 213743, "epoch": 1766} {"train_loss": -42.74609375, "global_step": 213744, "epoch": 1766} {"train_loss": -42.47330093383789, "global_step": 213745, "epoch": 1766} {"train_loss": -42.915618896484375, "global_step": 213746, "epoch": 1766} {"train_loss": -41.79902267456055, "global_step": 213747, "epoch": 1766} {"train_loss": -43.22689437866211, "global_step": 213748, "epoch": 1766} {"train_loss": -42.766658782958984, "global_step": 213749, "epoch": 1766} {"train_loss": -42.47761154174805, "global_step": 213750, "epoch": 1766} {"train_loss": -42.730892181396484, "global_step": 213751, "epoch": 1766} {"train_loss": -42.80941390991211, "global_step": 213752, "epoch": 1766} {"train_loss": -41.24834060668945, "global_step": 213753, "epoch": 1766} {"train_loss": -42.503021240234375, "global_step": 213754, "epoch": 1766} {"train_loss": -42.63477325439453, "global_step": 213755, "epoch": 1766} {"train_loss": -42.86176300048828, "global_step": 213756, "epoch": 1766} {"train_loss": -42.559486389160156, "global_step": 213757, "epoch": 1766} {"train_loss": -43.1746940612793, "global_step": 213758, "epoch": 1766} {"train_loss": -43.21702194213867, "global_step": 213759, "epoch": 1766} {"train_loss": -43.00059509277344, "global_step": 213760, "epoch": 1766} {"train_loss": -42.8680534362793, "global_step": 213761, "epoch": 1766} {"train_loss": -43.09149169921875, "global_step": 213762, "epoch": 1766} {"train_loss": -43.17252731323242, "global_step": 213763, "epoch": 1766} {"train_loss": -42.76559066772461, "global_step": 213764, "epoch": 1766} {"train_loss": -42.34543991088867, "global_step": 213765, "epoch": 1766} {"train_loss": -43.16579055786133, "global_step": 213766, "epoch": 1766} {"train_loss": -42.02988815307617, "global_step": 213767, "epoch": 1766} {"train_loss": -41.82145309448242, "global_step": 213768, "epoch": 1766} {"train_loss": -42.912960052490234, "global_step": 213769, "epoch": 1766} {"train_loss": -41.33723068237305, "global_step": 213770, "epoch": 1766} {"train_loss": -39.09147644042969, "global_step": 213771, "epoch": 1766} {"train_loss": -42.630855560302734, "global_step": 213772, "epoch": 1766} {"train_loss": -40.64387893676758, "global_step": 213773, "epoch": 1766} {"train_loss": -41.82496643066406, "global_step": 213774, "epoch": 1766} {"train_loss": -42.02522659301758, "global_step": 213775, "epoch": 1766} {"train_loss": -39.159236907958984, "global_step": 213776, "epoch": 1766} {"train_loss": -42.997276306152344, "global_step": 213777, "epoch": 1766} {"train_loss": -39.54035949707031, "global_step": 213778, "epoch": 1766} {"train_loss": -42.34143829345703, "global_step": 213779, "epoch": 1766} {"train_loss": -41.214698791503906, "global_step": 213780, "epoch": 1766} {"train_loss": -40.79720687866211, "global_step": 213781, "epoch": 1766} {"train_loss": -41.462646484375, "global_step": 213782, "epoch": 1766} {"train_loss": -42.067562103271484, "global_step": 213783, "epoch": 1766} {"train_loss": -40.758766174316406, "global_step": 213784, "epoch": 1766} {"train_loss": -40.96284484863281, "global_step": 213785, "epoch": 1766} {"train_loss": -42.21794509887695, "global_step": 213786, "epoch": 1766} {"train_loss": -39.78621292114258, "global_step": 213787, "epoch": 1766} {"train_loss": -41.927425384521484, "global_step": 213788, "epoch": 1766} {"train_loss": -42.42045974731445, "global_step": 213789, "epoch": 1766} {"train_loss": -41.659141540527344, "global_step": 213790, "epoch": 1766} {"train_loss": -41.65955352783203, "global_step": 213791, "epoch": 1766} {"train_loss": -41.17621994018555, "global_step": 213792, "epoch": 1766} {"train_loss": -41.6181755065918, "global_step": 213793, "epoch": 1766} {"train_loss": -41.91376876831055, "global_step": 213794, "epoch": 1766} {"train_loss": -41.63432312011719, "global_step": 213795, "epoch": 1766} {"train_loss": -42.7391471862793, "global_step": 213796, "epoch": 1766} {"train_loss": -42.04862594604492, "global_step": 213797, "epoch": 1766} {"train_loss": -42.406368255615234, "global_step": 213798, "epoch": 1766} {"train_loss": -42.06155014038086, "global_step": 213799, "epoch": 1766} {"train_loss": -42.112892150878906, "global_step": 213800, "epoch": 1766} {"train_loss": -42.04207992553711, "global_step": 213801, "epoch": 1766} {"train_loss": -42.44792175292969, "global_step": 213802, "epoch": 1766} {"train_loss": -42.241363525390625, "global_step": 213803, "epoch": 1766} {"train_loss": -42.58567810058594, "global_step": 213804, "epoch": 1766} {"train_loss": -42.876888275146484, "global_step": 213805, "epoch": 1766} {"train_loss": -41.86281503724658, "global_step": 213806, "epoch": 1766, "val_loss": 2449259.0} {"train_loss": -41.1710205078125, "global_step": 213807, "epoch": 1767} {"train_loss": -42.837318420410156, "global_step": 213808, "epoch": 1767} {"train_loss": -42.36319351196289, "global_step": 213809, "epoch": 1767} {"train_loss": -41.89236068725586, "global_step": 213810, "epoch": 1767} {"train_loss": -41.28541564941406, "global_step": 213811, "epoch": 1767} {"train_loss": -41.116943359375, "global_step": 213812, "epoch": 1767} {"train_loss": -43.250335693359375, "global_step": 213813, "epoch": 1767} {"train_loss": -42.796260833740234, "global_step": 213814, "epoch": 1767} {"train_loss": -42.56279373168945, "global_step": 213815, "epoch": 1767} {"train_loss": -42.936702728271484, "global_step": 213816, "epoch": 1767} {"train_loss": -42.77470016479492, "global_step": 213817, "epoch": 1767} {"train_loss": -42.76180648803711, "global_step": 213818, "epoch": 1767} {"train_loss": -42.6292724609375, "global_step": 213819, "epoch": 1767} {"train_loss": -42.86420440673828, "global_step": 213820, "epoch": 1767} {"train_loss": -43.48116683959961, "global_step": 213821, "epoch": 1767} {"train_loss": -42.9571647644043, "global_step": 213822, "epoch": 1767} {"train_loss": -42.656192779541016, "global_step": 213823, "epoch": 1767} {"train_loss": -41.919593811035156, "global_step": 213824, "epoch": 1767} {"train_loss": -42.33632278442383, "global_step": 213825, "epoch": 1767} {"train_loss": -42.84590530395508, "global_step": 213826, "epoch": 1767} {"train_loss": -43.21085739135742, "global_step": 213827, "epoch": 1767} {"train_loss": -42.687416076660156, "global_step": 213828, "epoch": 1767} {"train_loss": -42.227542877197266, "global_step": 213829, "epoch": 1767} {"train_loss": -43.51845932006836, "global_step": 213830, "epoch": 1767} {"train_loss": -42.9511604309082, "global_step": 213831, "epoch": 1767} {"train_loss": -43.23603057861328, "global_step": 213832, "epoch": 1767} {"train_loss": -42.32855224609375, "global_step": 213833, "epoch": 1767} {"train_loss": -42.45232009887695, "global_step": 213834, "epoch": 1767} {"train_loss": -43.1903076171875, "global_step": 213835, "epoch": 1767} {"train_loss": -42.530399322509766, "global_step": 213836, "epoch": 1767} {"train_loss": -42.641998291015625, "global_step": 213837, "epoch": 1767} {"train_loss": -42.94402313232422, "global_step": 213838, "epoch": 1767} {"train_loss": -43.27556228637695, "global_step": 213839, "epoch": 1767} {"train_loss": -42.790870666503906, "global_step": 213840, "epoch": 1767} {"train_loss": -41.7327995300293, "global_step": 213841, "epoch": 1767} {"train_loss": -42.26969528198242, "global_step": 213842, "epoch": 1767} {"train_loss": -42.68162155151367, "global_step": 213843, "epoch": 1767} {"train_loss": -42.977298736572266, "global_step": 213844, "epoch": 1767} {"train_loss": -42.553443908691406, "global_step": 213845, "epoch": 1767} {"train_loss": -42.080257415771484, "global_step": 213846, "epoch": 1767} {"train_loss": -42.821327209472656, "global_step": 213847, "epoch": 1767} {"train_loss": -41.965457916259766, "global_step": 213848, "epoch": 1767} {"train_loss": -42.762001037597656, "global_step": 213849, "epoch": 1767} {"train_loss": -42.57706832885742, "global_step": 213850, "epoch": 1767} {"train_loss": -42.06285095214844, "global_step": 213851, "epoch": 1767} {"train_loss": -42.43107223510742, "global_step": 213852, "epoch": 1767} {"train_loss": -42.567413330078125, "global_step": 213853, "epoch": 1767} {"train_loss": -42.122955322265625, "global_step": 213854, "epoch": 1767} {"train_loss": -42.792476654052734, "global_step": 213855, "epoch": 1767} {"train_loss": -41.18679428100586, "global_step": 213856, "epoch": 1767} {"train_loss": -40.128395080566406, "global_step": 213857, "epoch": 1767} {"train_loss": -40.98318099975586, "global_step": 213858, "epoch": 1767} {"train_loss": -40.8320198059082, "global_step": 213859, "epoch": 1767} {"train_loss": -42.66636657714844, "global_step": 213860, "epoch": 1767} {"train_loss": -42.507606506347656, "global_step": 213861, "epoch": 1767} {"train_loss": -41.762447357177734, "global_step": 213862, "epoch": 1767} {"train_loss": -41.82145309448242, "global_step": 213863, "epoch": 1767} {"train_loss": -39.1607666015625, "global_step": 213864, "epoch": 1767} {"train_loss": -39.40367126464844, "global_step": 213865, "epoch": 1767} {"train_loss": -41.33811569213867, "global_step": 213866, "epoch": 1767} {"train_loss": -40.67145919799805, "global_step": 213867, "epoch": 1767} {"train_loss": -40.850372314453125, "global_step": 213868, "epoch": 1767} {"train_loss": -40.43095016479492, "global_step": 213869, "epoch": 1767} {"train_loss": -40.89666748046875, "global_step": 213870, "epoch": 1767} {"train_loss": -42.501556396484375, "global_step": 213871, "epoch": 1767} {"train_loss": -40.077293395996094, "global_step": 213872, "epoch": 1767} {"train_loss": -38.65157699584961, "global_step": 213873, "epoch": 1767} {"train_loss": -41.4693717956543, "global_step": 213874, "epoch": 1767} {"train_loss": -39.27618408203125, "global_step": 213875, "epoch": 1767} {"train_loss": -41.13851547241211, "global_step": 213876, "epoch": 1767} {"train_loss": -40.125484466552734, "global_step": 213877, "epoch": 1767} {"train_loss": -41.04246139526367, "global_step": 213878, "epoch": 1767} {"train_loss": -39.82914352416992, "global_step": 213879, "epoch": 1767} {"train_loss": -41.82949447631836, "global_step": 213880, "epoch": 1767} {"train_loss": -41.116207122802734, "global_step": 213881, "epoch": 1767} {"train_loss": -40.46010208129883, "global_step": 213882, "epoch": 1767} {"train_loss": -41.57988357543945, "global_step": 213883, "epoch": 1767} {"train_loss": -40.991943359375, "global_step": 213884, "epoch": 1767} {"train_loss": -40.18336486816406, "global_step": 213885, "epoch": 1767} {"train_loss": -40.603675842285156, "global_step": 213886, "epoch": 1767} {"train_loss": -41.692901611328125, "global_step": 213887, "epoch": 1767} {"train_loss": -41.89695739746094, "global_step": 213888, "epoch": 1767} {"train_loss": -40.79267501831055, "global_step": 213889, "epoch": 1767} {"train_loss": -42.27528762817383, "global_step": 213890, "epoch": 1767} {"train_loss": -41.089351654052734, "global_step": 213891, "epoch": 1767} {"train_loss": -41.77546310424805, "global_step": 213892, "epoch": 1767} {"train_loss": -41.70225143432617, "global_step": 213893, "epoch": 1767} {"train_loss": -41.39750289916992, "global_step": 213894, "epoch": 1767} {"train_loss": -42.18452072143555, "global_step": 213895, "epoch": 1767} {"train_loss": -41.668190002441406, "global_step": 213896, "epoch": 1767} {"train_loss": -40.65122985839844, "global_step": 213897, "epoch": 1767} {"train_loss": -42.080589294433594, "global_step": 213898, "epoch": 1767} {"train_loss": -41.92245864868164, "global_step": 213899, "epoch": 1767} {"train_loss": -42.461647033691406, "global_step": 213900, "epoch": 1767} {"train_loss": -42.028804779052734, "global_step": 213901, "epoch": 1767} {"train_loss": -41.21711730957031, "global_step": 213902, "epoch": 1767} {"train_loss": -41.45875930786133, "global_step": 213903, "epoch": 1767} {"train_loss": -42.80807113647461, "global_step": 213904, "epoch": 1767} {"train_loss": -38.201656341552734, "global_step": 213905, "epoch": 1767} {"train_loss": -40.06061935424805, "global_step": 213906, "epoch": 1767} {"train_loss": -41.702571868896484, "global_step": 213907, "epoch": 1767} {"train_loss": -40.96685791015625, "global_step": 213908, "epoch": 1767} {"train_loss": -40.37422561645508, "global_step": 213909, "epoch": 1767} {"train_loss": -37.91307067871094, "global_step": 213910, "epoch": 1767} {"train_loss": -40.1273078918457, "global_step": 213911, "epoch": 1767} {"train_loss": -40.05933380126953, "global_step": 213912, "epoch": 1767} {"train_loss": -41.813262939453125, "global_step": 213913, "epoch": 1767} {"train_loss": -40.30997848510742, "global_step": 213914, "epoch": 1767} {"train_loss": -41.54105758666992, "global_step": 213915, "epoch": 1767} {"train_loss": -37.97306442260742, "global_step": 213916, "epoch": 1767} {"train_loss": -41.430213928222656, "global_step": 213917, "epoch": 1767} {"train_loss": -41.81904602050781, "global_step": 213918, "epoch": 1767} {"train_loss": -40.71584701538086, "global_step": 213919, "epoch": 1767} {"train_loss": -39.67228317260742, "global_step": 213920, "epoch": 1767} {"train_loss": -41.01018524169922, "global_step": 213921, "epoch": 1767} {"train_loss": -41.28116989135742, "global_step": 213922, "epoch": 1767} {"train_loss": -41.8393669128418, "global_step": 213923, "epoch": 1767} {"train_loss": -41.72505569458008, "global_step": 213924, "epoch": 1767} {"train_loss": -42.33224105834961, "global_step": 213925, "epoch": 1767} {"train_loss": -40.57954025268555, "global_step": 213926, "epoch": 1767} {"train_loss": -41.63727216484133, "global_step": 213927, "epoch": 1767, "val_loss": 2450042.0} {"train_loss": -40.1234130859375, "global_step": 213928, "epoch": 1768} {"train_loss": -42.30929183959961, "global_step": 213929, "epoch": 1768} {"train_loss": -41.8079948425293, "global_step": 213930, "epoch": 1768} {"train_loss": -41.869903564453125, "global_step": 213931, "epoch": 1768} {"train_loss": -42.140235900878906, "global_step": 213932, "epoch": 1768} {"train_loss": -41.65902328491211, "global_step": 213933, "epoch": 1768} {"train_loss": -39.89458084106445, "global_step": 213934, "epoch": 1768} {"train_loss": -40.6351432800293, "global_step": 213935, "epoch": 1768} {"train_loss": -40.530128479003906, "global_step": 213936, "epoch": 1768} {"train_loss": -42.130592346191406, "global_step": 213937, "epoch": 1768} {"train_loss": -37.4613151550293, "global_step": 213938, "epoch": 1768} {"train_loss": -41.5258674621582, "global_step": 213939, "epoch": 1768} {"train_loss": -40.861175537109375, "global_step": 213940, "epoch": 1768} {"train_loss": -41.26259231567383, "global_step": 213941, "epoch": 1768} {"train_loss": -41.057010650634766, "global_step": 213942, "epoch": 1768} {"train_loss": -41.47512435913086, "global_step": 213943, "epoch": 1768} {"train_loss": -35.11186599731445, "global_step": 213944, "epoch": 1768} {"train_loss": -41.21604537963867, "global_step": 213945, "epoch": 1768} {"train_loss": -37.759986877441406, "global_step": 213946, "epoch": 1768} {"train_loss": -41.057132720947266, "global_step": 213947, "epoch": 1768} {"train_loss": -41.24405288696289, "global_step": 213948, "epoch": 1768} {"train_loss": -40.64337158203125, "global_step": 213949, "epoch": 1768} {"train_loss": -39.90758514404297, "global_step": 213950, "epoch": 1768} {"train_loss": -39.32588577270508, "global_step": 213951, "epoch": 1768} {"train_loss": -40.28498458862305, "global_step": 213952, "epoch": 1768} {"train_loss": -41.88901901245117, "global_step": 213953, "epoch": 1768} {"train_loss": -41.21254348754883, "global_step": 213954, "epoch": 1768} {"train_loss": -40.33543014526367, "global_step": 213955, "epoch": 1768} {"train_loss": -40.99888229370117, "global_step": 213956, "epoch": 1768} {"train_loss": -41.0482177734375, "global_step": 213957, "epoch": 1768} {"train_loss": -41.25091552734375, "global_step": 213958, "epoch": 1768} {"train_loss": -41.55527877807617, "global_step": 213959, "epoch": 1768} {"train_loss": -42.59328842163086, "global_step": 213960, "epoch": 1768} {"train_loss": -34.75478744506836, "global_step": 213961, "epoch": 1768} {"train_loss": -42.526546478271484, "global_step": 213962, "epoch": 1768} {"train_loss": -41.466270446777344, "global_step": 213963, "epoch": 1768} {"train_loss": -41.54665756225586, "global_step": 213964, "epoch": 1768} {"train_loss": -41.80341339111328, "global_step": 213965, "epoch": 1768} {"train_loss": -41.77163314819336, "global_step": 213966, "epoch": 1768} {"train_loss": -41.725826263427734, "global_step": 213967, "epoch": 1768} {"train_loss": -38.58936309814453, "global_step": 213968, "epoch": 1768} {"train_loss": -41.991024017333984, "global_step": 213969, "epoch": 1768} {"train_loss": -42.31474304199219, "global_step": 213970, "epoch": 1768} {"train_loss": -42.22450637817383, "global_step": 213971, "epoch": 1768} {"train_loss": -41.9032096862793, "global_step": 213972, "epoch": 1768} {"train_loss": -40.05585861206055, "global_step": 213973, "epoch": 1768} {"train_loss": -42.34571075439453, "global_step": 213974, "epoch": 1768} {"train_loss": -41.245384216308594, "global_step": 213975, "epoch": 1768} {"train_loss": -42.79172897338867, "global_step": 213976, "epoch": 1768} {"train_loss": -42.06278610229492, "global_step": 213977, "epoch": 1768} {"train_loss": -42.28920364379883, "global_step": 213978, "epoch": 1768} {"train_loss": -42.22372055053711, "global_step": 213979, "epoch": 1768} {"train_loss": -42.13873291015625, "global_step": 213980, "epoch": 1768} {"train_loss": -42.34788131713867, "global_step": 213981, "epoch": 1768} {"train_loss": -40.802127838134766, "global_step": 213982, "epoch": 1768} {"train_loss": -42.842891693115234, "global_step": 213983, "epoch": 1768} {"train_loss": -40.630828857421875, "global_step": 213984, "epoch": 1768} {"train_loss": -42.14488220214844, "global_step": 213985, "epoch": 1768} {"train_loss": -41.51960754394531, "global_step": 213986, "epoch": 1768} {"train_loss": -42.77460861206055, "global_step": 213987, "epoch": 1768} {"train_loss": -43.0499382019043, "global_step": 213988, "epoch": 1768} {"train_loss": -42.92523956298828, "global_step": 213989, "epoch": 1768} {"train_loss": -43.09296798706055, "global_step": 213990, "epoch": 1768} {"train_loss": -42.45525360107422, "global_step": 213991, "epoch": 1768} {"train_loss": -42.97543716430664, "global_step": 213992, "epoch": 1768} {"train_loss": -42.75316619873047, "global_step": 213993, "epoch": 1768} {"train_loss": -42.2468376159668, "global_step": 213994, "epoch": 1768} {"train_loss": -41.40157699584961, "global_step": 213995, "epoch": 1768} {"train_loss": -41.225521087646484, "global_step": 213996, "epoch": 1768} {"train_loss": -40.61151885986328, "global_step": 213997, "epoch": 1768} {"train_loss": -39.138771057128906, "global_step": 213998, "epoch": 1768} {"train_loss": -40.77150344848633, "global_step": 213999, "epoch": 1768} {"train_loss": -42.15324783325195, "global_step": 214000, "epoch": 1768} {"train_loss": -42.26661682128906, "global_step": 214001, "epoch": 1768} {"train_loss": -40.57147979736328, "global_step": 214002, "epoch": 1768} {"train_loss": -38.85822677612305, "global_step": 214003, "epoch": 1768} {"train_loss": -42.411537170410156, "global_step": 214004, "epoch": 1768} {"train_loss": -38.936920166015625, "global_step": 214005, "epoch": 1768} {"train_loss": -38.76169967651367, "global_step": 214006, "epoch": 1768} {"train_loss": -42.67559814453125, "global_step": 214007, "epoch": 1768} {"train_loss": -38.79975128173828, "global_step": 214008, "epoch": 1768} {"train_loss": -41.92566680908203, "global_step": 214009, "epoch": 1768} {"train_loss": -36.31248092651367, "global_step": 214010, "epoch": 1768} {"train_loss": -41.185325622558594, "global_step": 214011, "epoch": 1768} {"train_loss": -37.10157775878906, "global_step": 214012, "epoch": 1768} {"train_loss": -39.476318359375, "global_step": 214013, "epoch": 1768} {"train_loss": -36.83700180053711, "global_step": 214014, "epoch": 1768} {"train_loss": -37.68343734741211, "global_step": 214015, "epoch": 1768} {"train_loss": -39.13335418701172, "global_step": 214016, "epoch": 1768} {"train_loss": -33.64399337768555, "global_step": 214017, "epoch": 1768} {"train_loss": -37.60390853881836, "global_step": 214018, "epoch": 1768} {"train_loss": -38.128658294677734, "global_step": 214019, "epoch": 1768} {"train_loss": -39.046485900878906, "global_step": 214020, "epoch": 1768} {"train_loss": -39.83110809326172, "global_step": 214021, "epoch": 1768} {"train_loss": -37.021114349365234, "global_step": 214022, "epoch": 1768} {"train_loss": -40.35126876831055, "global_step": 214023, "epoch": 1768} {"train_loss": -36.8792839050293, "global_step": 214024, "epoch": 1768} {"train_loss": -39.211463928222656, "global_step": 214025, "epoch": 1768} {"train_loss": -36.469215393066406, "global_step": 214026, "epoch": 1768} {"train_loss": -35.020179748535156, "global_step": 214027, "epoch": 1768} {"train_loss": -35.42888641357422, "global_step": 214028, "epoch": 1768} {"train_loss": -36.28995895385742, "global_step": 214029, "epoch": 1768} {"train_loss": -37.19723129272461, "global_step": 214030, "epoch": 1768} {"train_loss": -38.806861877441406, "global_step": 214031, "epoch": 1768} {"train_loss": -38.778480529785156, "global_step": 214032, "epoch": 1768} {"train_loss": -39.8797492980957, "global_step": 214033, "epoch": 1768} {"train_loss": -39.03910827636719, "global_step": 214034, "epoch": 1768} {"train_loss": -40.200477600097656, "global_step": 214035, "epoch": 1768} {"train_loss": -39.325042724609375, "global_step": 214036, "epoch": 1768} {"train_loss": -38.81134033203125, "global_step": 214037, "epoch": 1768} {"train_loss": -40.66133499145508, "global_step": 214038, "epoch": 1768} {"train_loss": -40.205108642578125, "global_step": 214039, "epoch": 1768} {"train_loss": -40.98543930053711, "global_step": 214040, "epoch": 1768} {"train_loss": -41.04575729370117, "global_step": 214041, "epoch": 1768} {"train_loss": -40.658199310302734, "global_step": 214042, "epoch": 1768} {"train_loss": -40.93434524536133, "global_step": 214043, "epoch": 1768} {"train_loss": -40.60537338256836, "global_step": 214044, "epoch": 1768} {"train_loss": -40.88779830932617, "global_step": 214045, "epoch": 1768} {"train_loss": -41.16514205932617, "global_step": 214046, "epoch": 1768} {"train_loss": -41.02519226074219, "global_step": 214047, "epoch": 1768} {"train_loss": -40.40834943913231, "global_step": 214048, "epoch": 1768, "val_loss": 2577553.25} {"train_loss": -41.424434661865234, "global_step": 214049, "epoch": 1769} {"train_loss": -41.42329788208008, "global_step": 214050, "epoch": 1769} {"train_loss": -41.10410690307617, "global_step": 214051, "epoch": 1769} {"train_loss": -41.49155807495117, "global_step": 214052, "epoch": 1769} {"train_loss": -41.23517608642578, "global_step": 214053, "epoch": 1769} {"train_loss": -41.51522445678711, "global_step": 214054, "epoch": 1769} {"train_loss": -41.49803161621094, "global_step": 214055, "epoch": 1769} {"train_loss": -41.27604293823242, "global_step": 214056, "epoch": 1769} {"train_loss": -41.71488571166992, "global_step": 214057, "epoch": 1769} {"train_loss": -42.18231201171875, "global_step": 214058, "epoch": 1769} {"train_loss": -42.01227951049805, "global_step": 214059, "epoch": 1769} {"train_loss": -42.34669876098633, "global_step": 214060, "epoch": 1769} {"train_loss": -42.204708099365234, "global_step": 214061, "epoch": 1769} {"train_loss": -42.27470397949219, "global_step": 214062, "epoch": 1769} {"train_loss": -41.93709945678711, "global_step": 214063, "epoch": 1769} {"train_loss": -42.49624252319336, "global_step": 214064, "epoch": 1769} {"train_loss": -42.46400833129883, "global_step": 214065, "epoch": 1769} {"train_loss": -42.03788375854492, "global_step": 214066, "epoch": 1769} {"train_loss": -42.41816329956055, "global_step": 214067, "epoch": 1769} {"train_loss": -42.4925537109375, "global_step": 214068, "epoch": 1769} {"train_loss": -42.00288772583008, "global_step": 214069, "epoch": 1769} {"train_loss": -42.27625274658203, "global_step": 214070, "epoch": 1769} {"train_loss": -42.03313064575195, "global_step": 214071, "epoch": 1769} {"train_loss": -42.21747589111328, "global_step": 214072, "epoch": 1769} {"train_loss": -42.245731353759766, "global_step": 214073, "epoch": 1769} {"train_loss": -41.46493911743164, "global_step": 214074, "epoch": 1769} {"train_loss": -42.5454216003418, "global_step": 214075, "epoch": 1769} {"train_loss": -42.046180725097656, "global_step": 214076, "epoch": 1769} {"train_loss": -42.21931838989258, "global_step": 214077, "epoch": 1769} {"train_loss": -42.595951080322266, "global_step": 214078, "epoch": 1769} {"train_loss": -41.45147705078125, "global_step": 214079, "epoch": 1769} {"train_loss": -38.76028060913086, "global_step": 214080, "epoch": 1769} {"train_loss": -35.419776916503906, "global_step": 214081, "epoch": 1769} {"train_loss": -35.33075714111328, "global_step": 214082, "epoch": 1769} {"train_loss": -29.631200790405273, "global_step": 214083, "epoch": 1769} {"train_loss": -30.543567657470703, "global_step": 214084, "epoch": 1769} {"train_loss": -35.58748245239258, "global_step": 214085, "epoch": 1769} {"train_loss": -34.20225143432617, "global_step": 214086, "epoch": 1769} {"train_loss": -34.81138229370117, "global_step": 214087, "epoch": 1769} {"train_loss": -36.72213363647461, "global_step": 214088, "epoch": 1769} {"train_loss": -34.9146614074707, "global_step": 214089, "epoch": 1769} {"train_loss": -36.47922897338867, "global_step": 214090, "epoch": 1769} {"train_loss": -37.2004280090332, "global_step": 214091, "epoch": 1769} {"train_loss": -34.65647506713867, "global_step": 214092, "epoch": 1769} {"train_loss": -35.74795150756836, "global_step": 214093, "epoch": 1769} {"train_loss": -36.27482223510742, "global_step": 214094, "epoch": 1769} {"train_loss": -35.44789123535156, "global_step": 214095, "epoch": 1769} {"train_loss": -37.28290557861328, "global_step": 214096, "epoch": 1769} {"train_loss": -37.13588333129883, "global_step": 214097, "epoch": 1769} {"train_loss": -35.96686935424805, "global_step": 214098, "epoch": 1769} {"train_loss": -37.41120529174805, "global_step": 214099, "epoch": 1769} {"train_loss": -37.289527893066406, "global_step": 214100, "epoch": 1769} {"train_loss": -37.49077606201172, "global_step": 214101, "epoch": 1769} {"train_loss": -37.19881057739258, "global_step": 214102, "epoch": 1769} {"train_loss": -37.82017135620117, "global_step": 214103, "epoch": 1769} {"train_loss": -38.09347152709961, "global_step": 214104, "epoch": 1769} {"train_loss": -38.04228591918945, "global_step": 214105, "epoch": 1769} {"train_loss": -37.79046630859375, "global_step": 214106, "epoch": 1769} {"train_loss": -38.75028610229492, "global_step": 214107, "epoch": 1769} {"train_loss": -38.5436897277832, "global_step": 214108, "epoch": 1769} {"train_loss": -39.14026641845703, "global_step": 214109, "epoch": 1769} {"train_loss": -38.98579025268555, "global_step": 214110, "epoch": 1769} {"train_loss": -38.884010314941406, "global_step": 214111, "epoch": 1769} {"train_loss": -38.8931884765625, "global_step": 214112, "epoch": 1769} {"train_loss": -39.48473358154297, "global_step": 214113, "epoch": 1769} {"train_loss": -40.8453483581543, "global_step": 214114, "epoch": 1769} {"train_loss": -38.878143310546875, "global_step": 214115, "epoch": 1769} {"train_loss": -40.30613327026367, "global_step": 214116, "epoch": 1769} {"train_loss": -39.90208053588867, "global_step": 214117, "epoch": 1769} {"train_loss": -39.61843490600586, "global_step": 214118, "epoch": 1769} {"train_loss": -40.22328186035156, "global_step": 214119, "epoch": 1769} {"train_loss": -40.714752197265625, "global_step": 214120, "epoch": 1769} {"train_loss": -40.08903884887695, "global_step": 214121, "epoch": 1769} {"train_loss": -41.177978515625, "global_step": 214122, "epoch": 1769} {"train_loss": -40.87077713012695, "global_step": 214123, "epoch": 1769} {"train_loss": -41.799251556396484, "global_step": 214124, "epoch": 1769} {"train_loss": -41.33933639526367, "global_step": 214125, "epoch": 1769} {"train_loss": -41.788230895996094, "global_step": 214126, "epoch": 1769} {"train_loss": -41.60746765136719, "global_step": 214127, "epoch": 1769} {"train_loss": -41.677650451660156, "global_step": 214128, "epoch": 1769} {"train_loss": -41.20821762084961, "global_step": 214129, "epoch": 1769} {"train_loss": -42.0769157409668, "global_step": 214130, "epoch": 1769} {"train_loss": -42.25586700439453, "global_step": 214131, "epoch": 1769} {"train_loss": -42.094356536865234, "global_step": 214132, "epoch": 1769} {"train_loss": -42.225433349609375, "global_step": 214133, "epoch": 1769} {"train_loss": -42.063995361328125, "global_step": 214134, "epoch": 1769} {"train_loss": -42.34590148925781, "global_step": 214135, "epoch": 1769} {"train_loss": -42.58864212036133, "global_step": 214136, "epoch": 1769} {"train_loss": -42.87635040283203, "global_step": 214137, "epoch": 1769} {"train_loss": -42.66090393066406, "global_step": 214138, "epoch": 1769} {"train_loss": -42.42135238647461, "global_step": 214139, "epoch": 1769} {"train_loss": -42.35885238647461, "global_step": 214140, "epoch": 1769} {"train_loss": -42.88715744018555, "global_step": 214141, "epoch": 1769} {"train_loss": -41.89352035522461, "global_step": 214142, "epoch": 1769} {"train_loss": -38.90763473510742, "global_step": 214143, "epoch": 1769} {"train_loss": -40.05594253540039, "global_step": 214144, "epoch": 1769} {"train_loss": -37.89617919921875, "global_step": 214145, "epoch": 1769} {"train_loss": -31.75190544128418, "global_step": 214146, "epoch": 1769} {"train_loss": -22.066221237182617, "global_step": 214147, "epoch": 1769} {"train_loss": -35.460750579833984, "global_step": 214148, "epoch": 1769} {"train_loss": -27.445112228393555, "global_step": 214149, "epoch": 1769} {"train_loss": -35.66938400268555, "global_step": 214150, "epoch": 1769} {"train_loss": -31.35736656188965, "global_step": 214151, "epoch": 1769} {"train_loss": -33.853084564208984, "global_step": 214152, "epoch": 1769} {"train_loss": -36.66617965698242, "global_step": 214153, "epoch": 1769} {"train_loss": -33.0851936340332, "global_step": 214154, "epoch": 1769} {"train_loss": -37.233333587646484, "global_step": 214155, "epoch": 1769} {"train_loss": -36.93717575073242, "global_step": 214156, "epoch": 1769} {"train_loss": -34.88982391357422, "global_step": 214157, "epoch": 1769} {"train_loss": -37.48934555053711, "global_step": 214158, "epoch": 1769} {"train_loss": -37.07908248901367, "global_step": 214159, "epoch": 1769} {"train_loss": -36.13014602661133, "global_step": 214160, "epoch": 1769} {"train_loss": -37.365875244140625, "global_step": 214161, "epoch": 1769} {"train_loss": -37.653194427490234, "global_step": 214162, "epoch": 1769} {"train_loss": -37.73236846923828, "global_step": 214163, "epoch": 1769} {"train_loss": -37.9587287902832, "global_step": 214164, "epoch": 1769} {"train_loss": -38.51520919799805, "global_step": 214165, "epoch": 1769} {"train_loss": -38.02408981323242, "global_step": 214166, "epoch": 1769} {"train_loss": -38.69672393798828, "global_step": 214167, "epoch": 1769} {"train_loss": -38.76990509033203, "global_step": 214168, "epoch": 1769} {"train_loss": -38.983246811165294, "global_step": 214169, "epoch": 1769, "val_loss": 2564164.25} {"train_loss": -38.36843490600586, "global_step": 214170, "epoch": 1770} {"train_loss": -38.24384307861328, "global_step": 214171, "epoch": 1770} {"train_loss": -39.061214447021484, "global_step": 214172, "epoch": 1770} {"train_loss": -38.635658264160156, "global_step": 214173, "epoch": 1770} {"train_loss": -38.459259033203125, "global_step": 214174, "epoch": 1770} {"train_loss": -39.166961669921875, "global_step": 214175, "epoch": 1770} {"train_loss": -38.87290954589844, "global_step": 214176, "epoch": 1770} {"train_loss": -38.37575912475586, "global_step": 214177, "epoch": 1770} {"train_loss": -37.41057205200195, "global_step": 214178, "epoch": 1770} {"train_loss": -36.560726165771484, "global_step": 214179, "epoch": 1770} {"train_loss": -38.489009857177734, "global_step": 214180, "epoch": 1770} {"train_loss": -38.949317932128906, "global_step": 214181, "epoch": 1770} {"train_loss": -37.68840408325195, "global_step": 214182, "epoch": 1770} {"train_loss": -39.255767822265625, "global_step": 214183, "epoch": 1770} {"train_loss": -38.50496292114258, "global_step": 214184, "epoch": 1770} {"train_loss": -38.78803634643555, "global_step": 214185, "epoch": 1770} {"train_loss": -39.87691879272461, "global_step": 214186, "epoch": 1770} {"train_loss": -39.304012298583984, "global_step": 214187, "epoch": 1770} {"train_loss": -39.63015365600586, "global_step": 214188, "epoch": 1770} {"train_loss": -39.42800521850586, "global_step": 214189, "epoch": 1770} {"train_loss": -39.946903228759766, "global_step": 214190, "epoch": 1770} {"train_loss": -38.96807861328125, "global_step": 214191, "epoch": 1770} {"train_loss": -38.80784225463867, "global_step": 214192, "epoch": 1770} {"train_loss": -37.63616943359375, "global_step": 214193, "epoch": 1770} {"train_loss": -39.69586181640625, "global_step": 214194, "epoch": 1770} {"train_loss": -39.107421875, "global_step": 214195, "epoch": 1770} {"train_loss": -38.7780876159668, "global_step": 214196, "epoch": 1770} {"train_loss": -39.606292724609375, "global_step": 214197, "epoch": 1770} {"train_loss": -39.11671447753906, "global_step": 214198, "epoch": 1770} {"train_loss": -39.57497787475586, "global_step": 214199, "epoch": 1770} {"train_loss": -40.108760833740234, "global_step": 214200, "epoch": 1770} {"train_loss": -40.31135177612305, "global_step": 214201, "epoch": 1770} {"train_loss": -39.81992721557617, "global_step": 214202, "epoch": 1770} {"train_loss": -39.61245346069336, "global_step": 214203, "epoch": 1770} {"train_loss": -39.73404312133789, "global_step": 214204, "epoch": 1770} {"train_loss": -39.548458099365234, "global_step": 214205, "epoch": 1770} {"train_loss": -39.48179626464844, "global_step": 214206, "epoch": 1770} {"train_loss": -39.4398078918457, "global_step": 214207, "epoch": 1770} {"train_loss": -39.849647521972656, "global_step": 214208, "epoch": 1770} {"train_loss": -40.0288200378418, "global_step": 214209, "epoch": 1770} {"train_loss": -40.21685791015625, "global_step": 214210, "epoch": 1770} {"train_loss": -39.7640266418457, "global_step": 214211, "epoch": 1770} {"train_loss": -40.47980880737305, "global_step": 214212, "epoch": 1770} {"train_loss": -37.895263671875, "global_step": 214213, "epoch": 1770} {"train_loss": -40.313819885253906, "global_step": 214214, "epoch": 1770} {"train_loss": -40.54296875, "global_step": 214215, "epoch": 1770} {"train_loss": -39.958927154541016, "global_step": 214216, "epoch": 1770} {"train_loss": -39.47037887573242, "global_step": 214217, "epoch": 1770} {"train_loss": -40.34479522705078, "global_step": 214218, "epoch": 1770} {"train_loss": -40.20512008666992, "global_step": 214219, "epoch": 1770} {"train_loss": -39.95341110229492, "global_step": 214220, "epoch": 1770} {"train_loss": -40.31585693359375, "global_step": 214221, "epoch": 1770} {"train_loss": -39.18085861206055, "global_step": 214222, "epoch": 1770} {"train_loss": -40.202301025390625, "global_step": 214223, "epoch": 1770} {"train_loss": -40.24491500854492, "global_step": 214224, "epoch": 1770} {"train_loss": -39.978736877441406, "global_step": 214225, "epoch": 1770} {"train_loss": -40.14751052856445, "global_step": 214226, "epoch": 1770} {"train_loss": -39.426116943359375, "global_step": 214227, "epoch": 1770} {"train_loss": -40.9133415222168, "global_step": 214228, "epoch": 1770} {"train_loss": -40.5833854675293, "global_step": 214229, "epoch": 1770} {"train_loss": -40.125091552734375, "global_step": 214230, "epoch": 1770} {"train_loss": -40.59009552001953, "global_step": 214231, "epoch": 1770} {"train_loss": -40.93765640258789, "global_step": 214232, "epoch": 1770} {"train_loss": -40.66384506225586, "global_step": 214233, "epoch": 1770} {"train_loss": -37.466644287109375, "global_step": 214234, "epoch": 1770} {"train_loss": -39.33618927001953, "global_step": 214235, "epoch": 1770} {"train_loss": -39.58804702758789, "global_step": 214236, "epoch": 1770} {"train_loss": -39.80842590332031, "global_step": 214237, "epoch": 1770} {"train_loss": -33.4874267578125, "global_step": 214238, "epoch": 1770} {"train_loss": -37.50313949584961, "global_step": 214239, "epoch": 1770} {"train_loss": -40.02388000488281, "global_step": 214240, "epoch": 1770} {"train_loss": -38.035186767578125, "global_step": 214241, "epoch": 1770} {"train_loss": -36.88019943237305, "global_step": 214242, "epoch": 1770} {"train_loss": -36.050655364990234, "global_step": 214243, "epoch": 1770} {"train_loss": -23.463520050048828, "global_step": 214244, "epoch": 1770} {"train_loss": -37.194419860839844, "global_step": 214245, "epoch": 1770} {"train_loss": -36.4749641418457, "global_step": 214246, "epoch": 1770} {"train_loss": -31.785436630249023, "global_step": 214247, "epoch": 1770} {"train_loss": -34.735530853271484, "global_step": 214248, "epoch": 1770} {"train_loss": -35.436100006103516, "global_step": 214249, "epoch": 1770} {"train_loss": -32.9372673034668, "global_step": 214250, "epoch": 1770} {"train_loss": -35.66205978393555, "global_step": 214251, "epoch": 1770} {"train_loss": -36.530357360839844, "global_step": 214252, "epoch": 1770} {"train_loss": -36.97431564331055, "global_step": 214253, "epoch": 1770} {"train_loss": -37.2232551574707, "global_step": 214254, "epoch": 1770} {"train_loss": -37.33143997192383, "global_step": 214255, "epoch": 1770} {"train_loss": -34.45439910888672, "global_step": 214256, "epoch": 1770} {"train_loss": -38.208309173583984, "global_step": 214257, "epoch": 1770} {"train_loss": -32.506107330322266, "global_step": 214258, "epoch": 1770} {"train_loss": -33.19464874267578, "global_step": 214259, "epoch": 1770} {"train_loss": -37.878273010253906, "global_step": 214260, "epoch": 1770} {"train_loss": -38.01930618286133, "global_step": 214261, "epoch": 1770} {"train_loss": -35.24715042114258, "global_step": 214262, "epoch": 1770} {"train_loss": -37.97151565551758, "global_step": 214263, "epoch": 1770} {"train_loss": -38.35596466064453, "global_step": 214264, "epoch": 1770} {"train_loss": -36.93925476074219, "global_step": 214265, "epoch": 1770} {"train_loss": -37.562862396240234, "global_step": 214266, "epoch": 1770} {"train_loss": -36.65289306640625, "global_step": 214267, "epoch": 1770} {"train_loss": -38.15168380737305, "global_step": 214268, "epoch": 1770} {"train_loss": -38.998531341552734, "global_step": 214269, "epoch": 1770} {"train_loss": -36.78751754760742, "global_step": 214270, "epoch": 1770} {"train_loss": -37.71454620361328, "global_step": 214271, "epoch": 1770} {"train_loss": -39.459835052490234, "global_step": 214272, "epoch": 1770} {"train_loss": -38.40925979614258, "global_step": 214273, "epoch": 1770} {"train_loss": -39.164894104003906, "global_step": 214274, "epoch": 1770} {"train_loss": -38.5601692199707, "global_step": 214275, "epoch": 1770} {"train_loss": -37.72922897338867, "global_step": 214276, "epoch": 1770} {"train_loss": -39.52535629272461, "global_step": 214277, "epoch": 1770} {"train_loss": -37.77971649169922, "global_step": 214278, "epoch": 1770} {"train_loss": -38.255367279052734, "global_step": 214279, "epoch": 1770} {"train_loss": -38.044677734375, "global_step": 214280, "epoch": 1770} {"train_loss": -39.17844772338867, "global_step": 214281, "epoch": 1770} {"train_loss": -39.29039001464844, "global_step": 214282, "epoch": 1770} {"train_loss": -39.66305160522461, "global_step": 214283, "epoch": 1770} {"train_loss": -37.995845794677734, "global_step": 214284, "epoch": 1770} {"train_loss": -39.53260040283203, "global_step": 214285, "epoch": 1770} {"train_loss": -38.988189697265625, "global_step": 214286, "epoch": 1770} {"train_loss": -39.225101470947266, "global_step": 214287, "epoch": 1770} {"train_loss": -37.654335021972656, "global_step": 214288, "epoch": 1770} {"train_loss": -39.10915756225586, "global_step": 214289, "epoch": 1770} {"train_loss": -38.384511064891974, "global_step": 214290, "epoch": 1770, "val_loss": 2557603.0} {"train_loss": -39.120967864990234, "global_step": 214291, "epoch": 1771} {"train_loss": -38.501258850097656, "global_step": 214292, "epoch": 1771} {"train_loss": -38.21609878540039, "global_step": 214293, "epoch": 1771} {"train_loss": -39.236019134521484, "global_step": 214294, "epoch": 1771} {"train_loss": -39.201473236083984, "global_step": 214295, "epoch": 1771} {"train_loss": -39.56303787231445, "global_step": 214296, "epoch": 1771} {"train_loss": -39.28887939453125, "global_step": 214297, "epoch": 1771} {"train_loss": -40.1839714050293, "global_step": 214298, "epoch": 1771} {"train_loss": -38.235595703125, "global_step": 214299, "epoch": 1771} {"train_loss": -39.437103271484375, "global_step": 214300, "epoch": 1771} {"train_loss": -39.90989303588867, "global_step": 214301, "epoch": 1771} {"train_loss": -39.42924880981445, "global_step": 214302, "epoch": 1771} {"train_loss": -39.58054733276367, "global_step": 214303, "epoch": 1771} {"train_loss": -39.46235275268555, "global_step": 214304, "epoch": 1771} {"train_loss": -40.22345733642578, "global_step": 214305, "epoch": 1771} {"train_loss": -39.36276626586914, "global_step": 214306, "epoch": 1771} {"train_loss": -38.55641555786133, "global_step": 214307, "epoch": 1771} {"train_loss": -38.75856399536133, "global_step": 214308, "epoch": 1771} {"train_loss": -39.548763275146484, "global_step": 214309, "epoch": 1771} {"train_loss": -39.604698181152344, "global_step": 214310, "epoch": 1771} {"train_loss": -40.230587005615234, "global_step": 214311, "epoch": 1771} {"train_loss": -40.37905502319336, "global_step": 214312, "epoch": 1771} {"train_loss": -40.57167053222656, "global_step": 214313, "epoch": 1771} {"train_loss": -40.30581283569336, "global_step": 214314, "epoch": 1771} {"train_loss": -40.35288619995117, "global_step": 214315, "epoch": 1771} {"train_loss": -40.26835250854492, "global_step": 214316, "epoch": 1771} {"train_loss": -40.39493179321289, "global_step": 214317, "epoch": 1771} {"train_loss": -40.350772857666016, "global_step": 214318, "epoch": 1771} {"train_loss": -39.4461555480957, "global_step": 214319, "epoch": 1771} {"train_loss": -40.76853561401367, "global_step": 214320, "epoch": 1771} {"train_loss": -39.8538703918457, "global_step": 214321, "epoch": 1771} {"train_loss": -39.860103607177734, "global_step": 214322, "epoch": 1771} {"train_loss": -39.763668060302734, "global_step": 214323, "epoch": 1771} {"train_loss": -40.70036697387695, "global_step": 214324, "epoch": 1771} {"train_loss": -40.57296371459961, "global_step": 214325, "epoch": 1771} {"train_loss": -39.49152755737305, "global_step": 214326, "epoch": 1771} {"train_loss": -40.50587463378906, "global_step": 214327, "epoch": 1771} {"train_loss": -41.14913558959961, "global_step": 214328, "epoch": 1771} {"train_loss": -41.052642822265625, "global_step": 214329, "epoch": 1771} {"train_loss": -40.4059944152832, "global_step": 214330, "epoch": 1771} {"train_loss": -41.12263107299805, "global_step": 214331, "epoch": 1771} {"train_loss": -40.80384063720703, "global_step": 214332, "epoch": 1771} {"train_loss": -41.24525451660156, "global_step": 214333, "epoch": 1771} {"train_loss": -40.35811996459961, "global_step": 214334, "epoch": 1771} {"train_loss": -40.308265686035156, "global_step": 214335, "epoch": 1771} {"train_loss": -39.9568977355957, "global_step": 214336, "epoch": 1771} {"train_loss": -40.449851989746094, "global_step": 214337, "epoch": 1771} {"train_loss": -39.7251091003418, "global_step": 214338, "epoch": 1771} {"train_loss": -40.61813735961914, "global_step": 214339, "epoch": 1771} {"train_loss": -40.510955810546875, "global_step": 214340, "epoch": 1771} {"train_loss": -41.23513412475586, "global_step": 214341, "epoch": 1771} {"train_loss": -40.12730407714844, "global_step": 214342, "epoch": 1771} {"train_loss": -40.521507263183594, "global_step": 214343, "epoch": 1771} {"train_loss": -40.90314865112305, "global_step": 214344, "epoch": 1771} {"train_loss": -40.582149505615234, "global_step": 214345, "epoch": 1771} {"train_loss": -40.00067138671875, "global_step": 214346, "epoch": 1771} {"train_loss": -40.57143020629883, "global_step": 214347, "epoch": 1771} {"train_loss": -41.56266403198242, "global_step": 214348, "epoch": 1771} {"train_loss": -39.383270263671875, "global_step": 214349, "epoch": 1771} {"train_loss": -40.81676483154297, "global_step": 214350, "epoch": 1771} {"train_loss": -41.58369064331055, "global_step": 214351, "epoch": 1771} {"train_loss": -40.24819564819336, "global_step": 214352, "epoch": 1771} {"train_loss": -40.47797393798828, "global_step": 214353, "epoch": 1771} {"train_loss": -41.8445930480957, "global_step": 214354, "epoch": 1771} {"train_loss": -41.348297119140625, "global_step": 214355, "epoch": 1771} {"train_loss": -41.26874923706055, "global_step": 214356, "epoch": 1771} {"train_loss": -40.641605377197266, "global_step": 214357, "epoch": 1771} {"train_loss": -40.92021179199219, "global_step": 214358, "epoch": 1771} {"train_loss": -40.93703079223633, "global_step": 214359, "epoch": 1771} {"train_loss": -40.936153411865234, "global_step": 214360, "epoch": 1771} {"train_loss": -41.38424301147461, "global_step": 214361, "epoch": 1771} {"train_loss": -41.68671798706055, "global_step": 214362, "epoch": 1771} {"train_loss": -39.98934555053711, "global_step": 214363, "epoch": 1771} {"train_loss": -40.71963119506836, "global_step": 214364, "epoch": 1771} {"train_loss": -40.72273635864258, "global_step": 214365, "epoch": 1771} {"train_loss": -37.14760208129883, "global_step": 214366, "epoch": 1771} {"train_loss": -40.500396728515625, "global_step": 214367, "epoch": 1771} {"train_loss": -39.20107650756836, "global_step": 214368, "epoch": 1771} {"train_loss": -37.3524284362793, "global_step": 214369, "epoch": 1771} {"train_loss": -38.82255935668945, "global_step": 214370, "epoch": 1771} {"train_loss": -38.64684295654297, "global_step": 214371, "epoch": 1771} {"train_loss": -40.207794189453125, "global_step": 214372, "epoch": 1771} {"train_loss": -41.32920455932617, "global_step": 214373, "epoch": 1771} {"train_loss": -39.305908203125, "global_step": 214374, "epoch": 1771} {"train_loss": -38.944427490234375, "global_step": 214375, "epoch": 1771} {"train_loss": -40.048221588134766, "global_step": 214376, "epoch": 1771} {"train_loss": -41.193843841552734, "global_step": 214377, "epoch": 1771} {"train_loss": -40.281673431396484, "global_step": 214378, "epoch": 1771} {"train_loss": -40.411033630371094, "global_step": 214379, "epoch": 1771} {"train_loss": -40.97690963745117, "global_step": 214380, "epoch": 1771} {"train_loss": -40.906978607177734, "global_step": 214381, "epoch": 1771} {"train_loss": -40.40598678588867, "global_step": 214382, "epoch": 1771} {"train_loss": -40.99018096923828, "global_step": 214383, "epoch": 1771} {"train_loss": -40.72892379760742, "global_step": 214384, "epoch": 1771} {"train_loss": -40.79743194580078, "global_step": 214385, "epoch": 1771} {"train_loss": -40.930320739746094, "global_step": 214386, "epoch": 1771} {"train_loss": -41.25071334838867, "global_step": 214387, "epoch": 1771} {"train_loss": -41.16493225097656, "global_step": 214388, "epoch": 1771} {"train_loss": -40.975704193115234, "global_step": 214389, "epoch": 1771} {"train_loss": -41.0918083190918, "global_step": 214390, "epoch": 1771} {"train_loss": -41.663177490234375, "global_step": 214391, "epoch": 1771} {"train_loss": -41.74409103393555, "global_step": 214392, "epoch": 1771} {"train_loss": -40.70085906982422, "global_step": 214393, "epoch": 1771} {"train_loss": -40.97962188720703, "global_step": 214394, "epoch": 1771} {"train_loss": -41.310401916503906, "global_step": 214395, "epoch": 1771} {"train_loss": -41.47376251220703, "global_step": 214396, "epoch": 1771} {"train_loss": -41.50246810913086, "global_step": 214397, "epoch": 1771} {"train_loss": -40.704383850097656, "global_step": 214398, "epoch": 1771} {"train_loss": -41.75210189819336, "global_step": 214399, "epoch": 1771} {"train_loss": -41.01520919799805, "global_step": 214400, "epoch": 1771} {"train_loss": -39.996803283691406, "global_step": 214401, "epoch": 1771} {"train_loss": -40.1265869140625, "global_step": 214402, "epoch": 1771} {"train_loss": -40.93440246582031, "global_step": 214403, "epoch": 1771} {"train_loss": -40.75590133666992, "global_step": 214404, "epoch": 1771} {"train_loss": -39.69802474975586, "global_step": 214405, "epoch": 1771} {"train_loss": -41.39752197265625, "global_step": 214406, "epoch": 1771} {"train_loss": -41.5135383605957, "global_step": 214407, "epoch": 1771} {"train_loss": -41.09233856201172, "global_step": 214408, "epoch": 1771} {"train_loss": -41.73601531982422, "global_step": 214409, "epoch": 1771} {"train_loss": -41.464019775390625, "global_step": 214410, "epoch": 1771} {"train_loss": -40.35706704510145, "global_step": 214411, "epoch": 1771, "val_loss": 2665274.0} {"train_loss": -41.4456787109375, "global_step": 214412, "epoch": 1772} {"train_loss": -40.83466339111328, "global_step": 214413, "epoch": 1772} {"train_loss": -39.45471954345703, "global_step": 214414, "epoch": 1772} {"train_loss": -38.79096603393555, "global_step": 214415, "epoch": 1772} {"train_loss": -39.81614303588867, "global_step": 214416, "epoch": 1772} {"train_loss": -41.516456604003906, "global_step": 214417, "epoch": 1772} {"train_loss": -38.5639533996582, "global_step": 214418, "epoch": 1772} {"train_loss": -39.228267669677734, "global_step": 214419, "epoch": 1772} {"train_loss": -41.75522994995117, "global_step": 214420, "epoch": 1772} {"train_loss": -40.659481048583984, "global_step": 214421, "epoch": 1772} {"train_loss": -39.87392044067383, "global_step": 214422, "epoch": 1772} {"train_loss": -41.14113998413086, "global_step": 214423, "epoch": 1772} {"train_loss": -40.47605895996094, "global_step": 214424, "epoch": 1772} {"train_loss": -40.56107711791992, "global_step": 214425, "epoch": 1772} {"train_loss": -41.31781768798828, "global_step": 214426, "epoch": 1772} {"train_loss": -40.755889892578125, "global_step": 214427, "epoch": 1772} {"train_loss": -41.34315872192383, "global_step": 214428, "epoch": 1772} {"train_loss": -41.58121871948242, "global_step": 214429, "epoch": 1772} {"train_loss": -40.45222854614258, "global_step": 214430, "epoch": 1772} {"train_loss": -42.260005950927734, "global_step": 214431, "epoch": 1772} {"train_loss": -41.14814376831055, "global_step": 214432, "epoch": 1772} {"train_loss": -40.93696975708008, "global_step": 214433, "epoch": 1772} {"train_loss": -41.0408935546875, "global_step": 214434, "epoch": 1772} {"train_loss": -41.22279739379883, "global_step": 214435, "epoch": 1772} {"train_loss": -41.566673278808594, "global_step": 214436, "epoch": 1772} {"train_loss": -41.076480865478516, "global_step": 214437, "epoch": 1772} {"train_loss": -41.86305618286133, "global_step": 214438, "epoch": 1772} {"train_loss": -41.209716796875, "global_step": 214439, "epoch": 1772} {"train_loss": -40.73353576660156, "global_step": 214440, "epoch": 1772} {"train_loss": -42.54145431518555, "global_step": 214441, "epoch": 1772} {"train_loss": -40.56716537475586, "global_step": 214442, "epoch": 1772} {"train_loss": -40.38499069213867, "global_step": 214443, "epoch": 1772} {"train_loss": -40.840667724609375, "global_step": 214444, "epoch": 1772} {"train_loss": -41.60404586791992, "global_step": 214445, "epoch": 1772} {"train_loss": -40.82958984375, "global_step": 214446, "epoch": 1772} {"train_loss": -41.3558349609375, "global_step": 214447, "epoch": 1772} {"train_loss": -41.52459716796875, "global_step": 214448, "epoch": 1772} {"train_loss": -41.537593841552734, "global_step": 214449, "epoch": 1772} {"train_loss": -40.904449462890625, "global_step": 214450, "epoch": 1772} {"train_loss": -41.39060592651367, "global_step": 214451, "epoch": 1772} {"train_loss": -40.99873733520508, "global_step": 214452, "epoch": 1772} {"train_loss": -40.43893814086914, "global_step": 214453, "epoch": 1772} {"train_loss": -41.135406494140625, "global_step": 214454, "epoch": 1772} {"train_loss": -40.698707580566406, "global_step": 214455, "epoch": 1772} {"train_loss": -40.946346282958984, "global_step": 214456, "epoch": 1772} {"train_loss": -40.538780212402344, "global_step": 214457, "epoch": 1772} {"train_loss": -41.41858673095703, "global_step": 214458, "epoch": 1772} {"train_loss": -40.939208984375, "global_step": 214459, "epoch": 1772} {"train_loss": -41.942481994628906, "global_step": 214460, "epoch": 1772} {"train_loss": -41.22144317626953, "global_step": 214461, "epoch": 1772} {"train_loss": -39.906314849853516, "global_step": 214462, "epoch": 1772} {"train_loss": -37.668212890625, "global_step": 214463, "epoch": 1772} {"train_loss": -39.85761642456055, "global_step": 214464, "epoch": 1772} {"train_loss": -41.18647766113281, "global_step": 214465, "epoch": 1772} {"train_loss": -40.872982025146484, "global_step": 214466, "epoch": 1772} {"train_loss": -39.27136993408203, "global_step": 214467, "epoch": 1772} {"train_loss": -41.52047348022461, "global_step": 214468, "epoch": 1772} {"train_loss": -41.3922233581543, "global_step": 214469, "epoch": 1772} {"train_loss": -40.595436096191406, "global_step": 214470, "epoch": 1772} {"train_loss": -41.389862060546875, "global_step": 214471, "epoch": 1772} {"train_loss": -41.28481674194336, "global_step": 214472, "epoch": 1772} {"train_loss": -41.32928466796875, "global_step": 214473, "epoch": 1772} {"train_loss": -41.81819534301758, "global_step": 214474, "epoch": 1772} {"train_loss": -41.22844314575195, "global_step": 214475, "epoch": 1772} {"train_loss": -40.83966064453125, "global_step": 214476, "epoch": 1772} {"train_loss": -41.51409912109375, "global_step": 214477, "epoch": 1772} {"train_loss": -41.4433708190918, "global_step": 214478, "epoch": 1772} {"train_loss": -41.10024642944336, "global_step": 214479, "epoch": 1772} {"train_loss": -41.33626174926758, "global_step": 214480, "epoch": 1772} {"train_loss": -41.469242095947266, "global_step": 214481, "epoch": 1772} {"train_loss": -40.9599723815918, "global_step": 214482, "epoch": 1772} {"train_loss": -39.801185607910156, "global_step": 214483, "epoch": 1772} {"train_loss": -40.988346099853516, "global_step": 214484, "epoch": 1772} {"train_loss": -41.71709060668945, "global_step": 214485, "epoch": 1772} {"train_loss": -40.82946014404297, "global_step": 214486, "epoch": 1772} {"train_loss": -41.183799743652344, "global_step": 214487, "epoch": 1772} {"train_loss": -39.85584259033203, "global_step": 214488, "epoch": 1772} {"train_loss": -41.867923736572266, "global_step": 214489, "epoch": 1772} {"train_loss": -41.21096420288086, "global_step": 214490, "epoch": 1772} {"train_loss": -40.85919952392578, "global_step": 214491, "epoch": 1772} {"train_loss": -41.0314826965332, "global_step": 214492, "epoch": 1772} {"train_loss": -42.02461624145508, "global_step": 214493, "epoch": 1772} {"train_loss": -41.20881271362305, "global_step": 214494, "epoch": 1772} {"train_loss": -41.413330078125, "global_step": 214495, "epoch": 1772} {"train_loss": -41.66701889038086, "global_step": 214496, "epoch": 1772} {"train_loss": -40.98130416870117, "global_step": 214497, "epoch": 1772} {"train_loss": -41.405799865722656, "global_step": 214498, "epoch": 1772} {"train_loss": -39.3828010559082, "global_step": 214499, "epoch": 1772} {"train_loss": -41.552268981933594, "global_step": 214500, "epoch": 1772} {"train_loss": -40.74464797973633, "global_step": 214501, "epoch": 1772} {"train_loss": -40.72018814086914, "global_step": 214502, "epoch": 1772} {"train_loss": -38.38255310058594, "global_step": 214503, "epoch": 1772} {"train_loss": -39.56895065307617, "global_step": 214504, "epoch": 1772} {"train_loss": -38.13776779174805, "global_step": 214505, "epoch": 1772} {"train_loss": -36.49649429321289, "global_step": 214506, "epoch": 1772} {"train_loss": -40.02016067504883, "global_step": 214507, "epoch": 1772} {"train_loss": -40.40568923950195, "global_step": 214508, "epoch": 1772} {"train_loss": -35.502254486083984, "global_step": 214509, "epoch": 1772} {"train_loss": -36.95612716674805, "global_step": 214510, "epoch": 1772} {"train_loss": -27.884733200073242, "global_step": 214511, "epoch": 1772} {"train_loss": -34.41032028198242, "global_step": 214512, "epoch": 1772} {"train_loss": -39.13452911376953, "global_step": 214513, "epoch": 1772} {"train_loss": -26.481679916381836, "global_step": 214514, "epoch": 1772} {"train_loss": -35.865943908691406, "global_step": 214515, "epoch": 1772} {"train_loss": -33.25417709350586, "global_step": 214516, "epoch": 1772} {"train_loss": -33.71714401245117, "global_step": 214517, "epoch": 1772} {"train_loss": -34.21440505981445, "global_step": 214518, "epoch": 1772} {"train_loss": -35.972503662109375, "global_step": 214519, "epoch": 1772} {"train_loss": -35.51398468017578, "global_step": 214520, "epoch": 1772} {"train_loss": -35.211421966552734, "global_step": 214521, "epoch": 1772} {"train_loss": -35.24275588989258, "global_step": 214522, "epoch": 1772} {"train_loss": -35.51565170288086, "global_step": 214523, "epoch": 1772} {"train_loss": -27.69368553161621, "global_step": 214524, "epoch": 1772} {"train_loss": -32.660030364990234, "global_step": 214525, "epoch": 1772} {"train_loss": -35.01251220703125, "global_step": 214526, "epoch": 1772} {"train_loss": -31.847143173217773, "global_step": 214527, "epoch": 1772} {"train_loss": -34.1099967956543, "global_step": 214528, "epoch": 1772} {"train_loss": -35.08685302734375, "global_step": 214529, "epoch": 1772} {"train_loss": -29.371997833251953, "global_step": 214530, "epoch": 1772} {"train_loss": -32.04848861694336, "global_step": 214531, "epoch": 1772} {"train_loss": -39.384242380946134, "global_step": 214532, "epoch": 1772, "val_loss": 2595144.25} {"train_loss": -32.625423431396484, "global_step": 214533, "epoch": 1773} {"train_loss": -32.88624954223633, "global_step": 214534, "epoch": 1773} {"train_loss": -35.697906494140625, "global_step": 214535, "epoch": 1773} {"train_loss": -31.906665802001953, "global_step": 214536, "epoch": 1773} {"train_loss": -28.620580673217773, "global_step": 214537, "epoch": 1773} {"train_loss": -34.06736373901367, "global_step": 214538, "epoch": 1773} {"train_loss": -35.045589447021484, "global_step": 214539, "epoch": 1773} {"train_loss": -34.377113342285156, "global_step": 214540, "epoch": 1773} {"train_loss": -36.863861083984375, "global_step": 214541, "epoch": 1773} {"train_loss": -36.97597885131836, "global_step": 214542, "epoch": 1773} {"train_loss": -32.9648551940918, "global_step": 214543, "epoch": 1773} {"train_loss": -36.86328887939453, "global_step": 214544, "epoch": 1773} {"train_loss": -34.427974700927734, "global_step": 214545, "epoch": 1773} {"train_loss": -35.466793060302734, "global_step": 214546, "epoch": 1773} {"train_loss": -34.882102966308594, "global_step": 214547, "epoch": 1773} {"train_loss": -36.11091232299805, "global_step": 214548, "epoch": 1773} {"train_loss": -36.950103759765625, "global_step": 214549, "epoch": 1773} {"train_loss": -37.042152404785156, "global_step": 214550, "epoch": 1773} {"train_loss": -37.99772644042969, "global_step": 214551, "epoch": 1773} {"train_loss": -35.72018051147461, "global_step": 214552, "epoch": 1773} {"train_loss": -37.403499603271484, "global_step": 214553, "epoch": 1773} {"train_loss": -37.55642318725586, "global_step": 214554, "epoch": 1773} {"train_loss": -37.1748046875, "global_step": 214555, "epoch": 1773} {"train_loss": -37.19417190551758, "global_step": 214556, "epoch": 1773} {"train_loss": -37.890586853027344, "global_step": 214557, "epoch": 1773} {"train_loss": -37.539772033691406, "global_step": 214558, "epoch": 1773} {"train_loss": -37.44145584106445, "global_step": 214559, "epoch": 1773} {"train_loss": -38.012420654296875, "global_step": 214560, "epoch": 1773} {"train_loss": -37.45302963256836, "global_step": 214561, "epoch": 1773} {"train_loss": -37.2801399230957, "global_step": 214562, "epoch": 1773} {"train_loss": -37.211822509765625, "global_step": 214563, "epoch": 1773} {"train_loss": -38.042701721191406, "global_step": 214564, "epoch": 1773} {"train_loss": -37.17139434814453, "global_step": 214565, "epoch": 1773} {"train_loss": -38.58106231689453, "global_step": 214566, "epoch": 1773} {"train_loss": -38.62601852416992, "global_step": 214567, "epoch": 1773} {"train_loss": -38.4434928894043, "global_step": 214568, "epoch": 1773} {"train_loss": -38.893653869628906, "global_step": 214569, "epoch": 1773} {"train_loss": -39.134857177734375, "global_step": 214570, "epoch": 1773} {"train_loss": -38.954776763916016, "global_step": 214571, "epoch": 1773} {"train_loss": -38.65315628051758, "global_step": 214572, "epoch": 1773} {"train_loss": -38.536502838134766, "global_step": 214573, "epoch": 1773} {"train_loss": -38.352149963378906, "global_step": 214574, "epoch": 1773} {"train_loss": -38.19111251831055, "global_step": 214575, "epoch": 1773} {"train_loss": -38.578033447265625, "global_step": 214576, "epoch": 1773} {"train_loss": -38.85148239135742, "global_step": 214577, "epoch": 1773} {"train_loss": -38.580230712890625, "global_step": 214578, "epoch": 1773} {"train_loss": -39.082191467285156, "global_step": 214579, "epoch": 1773} {"train_loss": -38.70412826538086, "global_step": 214580, "epoch": 1773} {"train_loss": -39.439170837402344, "global_step": 214581, "epoch": 1773} {"train_loss": -39.360939025878906, "global_step": 214582, "epoch": 1773} {"train_loss": -39.010772705078125, "global_step": 214583, "epoch": 1773} {"train_loss": -39.574134826660156, "global_step": 214584, "epoch": 1773} {"train_loss": -39.16042709350586, "global_step": 214585, "epoch": 1773} {"train_loss": -39.63701248168945, "global_step": 214586, "epoch": 1773} {"train_loss": -39.777915954589844, "global_step": 214587, "epoch": 1773} {"train_loss": -39.57082748413086, "global_step": 214588, "epoch": 1773} {"train_loss": -39.21662139892578, "global_step": 214589, "epoch": 1773} {"train_loss": -39.88987350463867, "global_step": 214590, "epoch": 1773} {"train_loss": -39.05288314819336, "global_step": 214591, "epoch": 1773} {"train_loss": -38.828834533691406, "global_step": 214592, "epoch": 1773} {"train_loss": -39.64107894897461, "global_step": 214593, "epoch": 1773} {"train_loss": -39.629329681396484, "global_step": 214594, "epoch": 1773} {"train_loss": -39.70082473754883, "global_step": 214595, "epoch": 1773} {"train_loss": -39.6454963684082, "global_step": 214596, "epoch": 1773} {"train_loss": -39.513240814208984, "global_step": 214597, "epoch": 1773} {"train_loss": -38.285438537597656, "global_step": 214598, "epoch": 1773} {"train_loss": -39.608558654785156, "global_step": 214599, "epoch": 1773} {"train_loss": -39.62319564819336, "global_step": 214600, "epoch": 1773} {"train_loss": -40.01252365112305, "global_step": 214601, "epoch": 1773} {"train_loss": -38.99993896484375, "global_step": 214602, "epoch": 1773} {"train_loss": -40.17069625854492, "global_step": 214603, "epoch": 1773} {"train_loss": -39.5725212097168, "global_step": 214604, "epoch": 1773} {"train_loss": -40.18850326538086, "global_step": 214605, "epoch": 1773} {"train_loss": -40.23828125, "global_step": 214606, "epoch": 1773} {"train_loss": -40.50381088256836, "global_step": 214607, "epoch": 1773} {"train_loss": -39.23189926147461, "global_step": 214608, "epoch": 1773} {"train_loss": -39.46773910522461, "global_step": 214609, "epoch": 1773} {"train_loss": -40.03976058959961, "global_step": 214610, "epoch": 1773} {"train_loss": -40.15346145629883, "global_step": 214611, "epoch": 1773} {"train_loss": -40.43618392944336, "global_step": 214612, "epoch": 1773} {"train_loss": -40.18532943725586, "global_step": 214613, "epoch": 1773} {"train_loss": -40.26418685913086, "global_step": 214614, "epoch": 1773} {"train_loss": -40.5448112487793, "global_step": 214615, "epoch": 1773} {"train_loss": -40.69073486328125, "global_step": 214616, "epoch": 1773} {"train_loss": -40.460628509521484, "global_step": 214617, "epoch": 1773} {"train_loss": -39.62226867675781, "global_step": 214618, "epoch": 1773} {"train_loss": -40.1870002746582, "global_step": 214619, "epoch": 1773} {"train_loss": -40.7495231628418, "global_step": 214620, "epoch": 1773} {"train_loss": -40.32682418823242, "global_step": 214621, "epoch": 1773} {"train_loss": -40.59307861328125, "global_step": 214622, "epoch": 1773} {"train_loss": -40.30652618408203, "global_step": 214623, "epoch": 1773} {"train_loss": -40.37114715576172, "global_step": 214624, "epoch": 1773} {"train_loss": -40.77598190307617, "global_step": 214625, "epoch": 1773} {"train_loss": -40.12331008911133, "global_step": 214626, "epoch": 1773} {"train_loss": -40.81001663208008, "global_step": 214627, "epoch": 1773} {"train_loss": -41.021339416503906, "global_step": 214628, "epoch": 1773} {"train_loss": -41.076385498046875, "global_step": 214629, "epoch": 1773} {"train_loss": -40.3427848815918, "global_step": 214630, "epoch": 1773} {"train_loss": -40.0536003112793, "global_step": 214631, "epoch": 1773} {"train_loss": -41.064483642578125, "global_step": 214632, "epoch": 1773} {"train_loss": -40.95217514038086, "global_step": 214633, "epoch": 1773} {"train_loss": -40.4775505065918, "global_step": 214634, "epoch": 1773} {"train_loss": -40.693477630615234, "global_step": 214635, "epoch": 1773} {"train_loss": -40.6624755859375, "global_step": 214636, "epoch": 1773} {"train_loss": -40.3375129699707, "global_step": 214637, "epoch": 1773} {"train_loss": -40.80635452270508, "global_step": 214638, "epoch": 1773} {"train_loss": -40.70611572265625, "global_step": 214639, "epoch": 1773} {"train_loss": -40.40676498413086, "global_step": 214640, "epoch": 1773} {"train_loss": -38.112606048583984, "global_step": 214641, "epoch": 1773} {"train_loss": -37.08028793334961, "global_step": 214642, "epoch": 1773} {"train_loss": -37.01894760131836, "global_step": 214643, "epoch": 1773} {"train_loss": -37.70966339111328, "global_step": 214644, "epoch": 1773} {"train_loss": -39.57961654663086, "global_step": 214645, "epoch": 1773} {"train_loss": -40.64958190917969, "global_step": 214646, "epoch": 1773} {"train_loss": -39.79871368408203, "global_step": 214647, "epoch": 1773} {"train_loss": -39.41035842895508, "global_step": 214648, "epoch": 1773} {"train_loss": -39.851348876953125, "global_step": 214649, "epoch": 1773} {"train_loss": -40.904842376708984, "global_step": 214650, "epoch": 1773} {"train_loss": -39.27666091918945, "global_step": 214651, "epoch": 1773} {"train_loss": -38.21990966796875, "global_step": 214652, "epoch": 1773} {"train_loss": -38.63748725386691, "global_step": 214653, "epoch": 1773, "val_loss": 2548342.75} {"train_loss": -40.1860466003418, "global_step": 214654, "epoch": 1774} {"train_loss": -40.18928146362305, "global_step": 214655, "epoch": 1774} {"train_loss": -40.272151947021484, "global_step": 214656, "epoch": 1774} {"train_loss": -40.281253814697266, "global_step": 214657, "epoch": 1774} {"train_loss": -40.736305236816406, "global_step": 214658, "epoch": 1774} {"train_loss": -40.04726028442383, "global_step": 214659, "epoch": 1774} {"train_loss": -40.1055908203125, "global_step": 214660, "epoch": 1774} {"train_loss": -40.49318313598633, "global_step": 214661, "epoch": 1774} {"train_loss": -40.18851089477539, "global_step": 214662, "epoch": 1774} {"train_loss": -39.862762451171875, "global_step": 214663, "epoch": 1774} {"train_loss": -39.52353286743164, "global_step": 214664, "epoch": 1774} {"train_loss": -40.85044479370117, "global_step": 214665, "epoch": 1774} {"train_loss": -40.624122619628906, "global_step": 214666, "epoch": 1774} {"train_loss": -40.291168212890625, "global_step": 214667, "epoch": 1774} {"train_loss": -40.837547302246094, "global_step": 214668, "epoch": 1774} {"train_loss": -41.24436569213867, "global_step": 214669, "epoch": 1774} {"train_loss": -40.84736633300781, "global_step": 214670, "epoch": 1774} {"train_loss": -40.57420349121094, "global_step": 214671, "epoch": 1774} {"train_loss": -40.99114990234375, "global_step": 214672, "epoch": 1774} {"train_loss": -41.21391677856445, "global_step": 214673, "epoch": 1774} {"train_loss": -41.010406494140625, "global_step": 214674, "epoch": 1774} {"train_loss": -40.608428955078125, "global_step": 214675, "epoch": 1774} {"train_loss": -41.65031814575195, "global_step": 214676, "epoch": 1774} {"train_loss": -41.22600173950195, "global_step": 214677, "epoch": 1774} {"train_loss": -41.13557434082031, "global_step": 214678, "epoch": 1774} {"train_loss": -41.03578567504883, "global_step": 214679, "epoch": 1774} {"train_loss": -40.46761703491211, "global_step": 214680, "epoch": 1774} {"train_loss": -40.97703170776367, "global_step": 214681, "epoch": 1774} {"train_loss": -41.177486419677734, "global_step": 214682, "epoch": 1774} {"train_loss": -40.4282112121582, "global_step": 214683, "epoch": 1774} {"train_loss": -39.96952819824219, "global_step": 214684, "epoch": 1774} {"train_loss": -39.5308952331543, "global_step": 214685, "epoch": 1774} {"train_loss": -40.901607513427734, "global_step": 214686, "epoch": 1774} {"train_loss": -41.72809982299805, "global_step": 214687, "epoch": 1774} {"train_loss": -41.05641555786133, "global_step": 214688, "epoch": 1774} {"train_loss": -38.574642181396484, "global_step": 214689, "epoch": 1774} {"train_loss": -40.19393539428711, "global_step": 214690, "epoch": 1774} {"train_loss": -39.87677001953125, "global_step": 214691, "epoch": 1774} {"train_loss": -41.42753219604492, "global_step": 214692, "epoch": 1774} {"train_loss": -40.546356201171875, "global_step": 214693, "epoch": 1774} {"train_loss": -40.37467575073242, "global_step": 214694, "epoch": 1774} {"train_loss": -40.74943161010742, "global_step": 214695, "epoch": 1774} {"train_loss": -41.44956588745117, "global_step": 214696, "epoch": 1774} {"train_loss": -40.17588424682617, "global_step": 214697, "epoch": 1774} {"train_loss": -41.01615905761719, "global_step": 214698, "epoch": 1774} {"train_loss": -41.0181884765625, "global_step": 214699, "epoch": 1774} {"train_loss": -41.497947692871094, "global_step": 214700, "epoch": 1774} {"train_loss": -40.93921661376953, "global_step": 214701, "epoch": 1774} {"train_loss": -41.869354248046875, "global_step": 214702, "epoch": 1774} {"train_loss": -41.8945426940918, "global_step": 214703, "epoch": 1774} {"train_loss": -41.41265869140625, "global_step": 214704, "epoch": 1774} {"train_loss": -41.827693939208984, "global_step": 214705, "epoch": 1774} {"train_loss": -41.91858673095703, "global_step": 214706, "epoch": 1774} {"train_loss": -41.7098274230957, "global_step": 214707, "epoch": 1774} {"train_loss": -41.3607063293457, "global_step": 214708, "epoch": 1774} {"train_loss": -42.18963623046875, "global_step": 214709, "epoch": 1774} {"train_loss": -41.77359390258789, "global_step": 214710, "epoch": 1774} {"train_loss": -41.61970901489258, "global_step": 214711, "epoch": 1774} {"train_loss": -41.3112907409668, "global_step": 214712, "epoch": 1774} {"train_loss": -42.398983001708984, "global_step": 214713, "epoch": 1774} {"train_loss": -41.40250778198242, "global_step": 214714, "epoch": 1774} {"train_loss": -40.996456146240234, "global_step": 214715, "epoch": 1774} {"train_loss": -41.9624137878418, "global_step": 214716, "epoch": 1774} {"train_loss": -41.972267150878906, "global_step": 214717, "epoch": 1774} {"train_loss": -41.39534378051758, "global_step": 214718, "epoch": 1774} {"train_loss": -41.35873031616211, "global_step": 214719, "epoch": 1774} {"train_loss": -41.05965042114258, "global_step": 214720, "epoch": 1774} {"train_loss": -42.33319854736328, "global_step": 214721, "epoch": 1774} {"train_loss": -42.245296478271484, "global_step": 214722, "epoch": 1774} {"train_loss": -40.6228141784668, "global_step": 214723, "epoch": 1774} {"train_loss": -41.572872161865234, "global_step": 214724, "epoch": 1774} {"train_loss": -42.026039123535156, "global_step": 214725, "epoch": 1774} {"train_loss": -41.70695114135742, "global_step": 214726, "epoch": 1774} {"train_loss": -41.877197265625, "global_step": 214727, "epoch": 1774} {"train_loss": -41.53286361694336, "global_step": 214728, "epoch": 1774} {"train_loss": -41.18330001831055, "global_step": 214729, "epoch": 1774} {"train_loss": -41.85992431640625, "global_step": 214730, "epoch": 1774} {"train_loss": -41.1001091003418, "global_step": 214731, "epoch": 1774} {"train_loss": -39.470394134521484, "global_step": 214732, "epoch": 1774} {"train_loss": -39.91021728515625, "global_step": 214733, "epoch": 1774} {"train_loss": -40.19718551635742, "global_step": 214734, "epoch": 1774} {"train_loss": -41.08642578125, "global_step": 214735, "epoch": 1774} {"train_loss": -41.76508331298828, "global_step": 214736, "epoch": 1774} {"train_loss": -40.60075759887695, "global_step": 214737, "epoch": 1774} {"train_loss": -39.56618118286133, "global_step": 214738, "epoch": 1774} {"train_loss": -40.20627975463867, "global_step": 214739, "epoch": 1774} {"train_loss": -39.21050262451172, "global_step": 214740, "epoch": 1774} {"train_loss": -41.317909240722656, "global_step": 214741, "epoch": 1774} {"train_loss": -40.05963897705078, "global_step": 214742, "epoch": 1774} {"train_loss": -41.004119873046875, "global_step": 214743, "epoch": 1774} {"train_loss": -41.294979095458984, "global_step": 214744, "epoch": 1774} {"train_loss": -41.355072021484375, "global_step": 214745, "epoch": 1774} {"train_loss": -42.1052360534668, "global_step": 214746, "epoch": 1774} {"train_loss": -40.525543212890625, "global_step": 214747, "epoch": 1774} {"train_loss": -41.39994430541992, "global_step": 214748, "epoch": 1774} {"train_loss": -41.59846115112305, "global_step": 214749, "epoch": 1774} {"train_loss": -41.629241943359375, "global_step": 214750, "epoch": 1774} {"train_loss": -41.58679962158203, "global_step": 214751, "epoch": 1774} {"train_loss": -41.88671112060547, "global_step": 214752, "epoch": 1774} {"train_loss": -41.860355377197266, "global_step": 214753, "epoch": 1774} {"train_loss": -40.48154830932617, "global_step": 214754, "epoch": 1774} {"train_loss": -40.99484634399414, "global_step": 214755, "epoch": 1774} {"train_loss": -41.36945724487305, "global_step": 214756, "epoch": 1774} {"train_loss": -40.63776779174805, "global_step": 214757, "epoch": 1774} {"train_loss": -41.4088249206543, "global_step": 214758, "epoch": 1774} {"train_loss": -41.7237663269043, "global_step": 214759, "epoch": 1774} {"train_loss": -41.48884582519531, "global_step": 214760, "epoch": 1774} {"train_loss": -40.95463180541992, "global_step": 214761, "epoch": 1774} {"train_loss": -40.41598129272461, "global_step": 214762, "epoch": 1774} {"train_loss": -40.46320724487305, "global_step": 214763, "epoch": 1774} {"train_loss": -39.104434967041016, "global_step": 214764, "epoch": 1774} {"train_loss": -37.75945281982422, "global_step": 214765, "epoch": 1774} {"train_loss": -36.73922348022461, "global_step": 214766, "epoch": 1774} {"train_loss": -36.83052444458008, "global_step": 214767, "epoch": 1774} {"train_loss": -36.75499725341797, "global_step": 214768, "epoch": 1774} {"train_loss": -40.16429901123047, "global_step": 214769, "epoch": 1774} {"train_loss": -41.2900505065918, "global_step": 214770, "epoch": 1774} {"train_loss": -39.420536041259766, "global_step": 214771, "epoch": 1774} {"train_loss": -41.02900314331055, "global_step": 214772, "epoch": 1774} {"train_loss": -40.17292785644531, "global_step": 214773, "epoch": 1774} {"train_loss": -40.79598784643756, "global_step": 214774, "epoch": 1774, "val_loss": 2627784.75} {"train_loss": -38.72682571411133, "global_step": 214775, "epoch": 1775} {"train_loss": -40.73618698120117, "global_step": 214776, "epoch": 1775} {"train_loss": -41.035160064697266, "global_step": 214777, "epoch": 1775} {"train_loss": -40.53828430175781, "global_step": 214778, "epoch": 1775} {"train_loss": -41.0626106262207, "global_step": 214779, "epoch": 1775} {"train_loss": -40.027835845947266, "global_step": 214780, "epoch": 1775} {"train_loss": -39.510955810546875, "global_step": 214781, "epoch": 1775} {"train_loss": -41.25735855102539, "global_step": 214782, "epoch": 1775} {"train_loss": -41.191654205322266, "global_step": 214783, "epoch": 1775} {"train_loss": -40.15186309814453, "global_step": 214784, "epoch": 1775} {"train_loss": -41.12538528442383, "global_step": 214785, "epoch": 1775} {"train_loss": -41.03208923339844, "global_step": 214786, "epoch": 1775} {"train_loss": -40.71133041381836, "global_step": 214787, "epoch": 1775} {"train_loss": -40.599910736083984, "global_step": 214788, "epoch": 1775} {"train_loss": -41.526309967041016, "global_step": 214789, "epoch": 1775} {"train_loss": -37.63933181762695, "global_step": 214790, "epoch": 1775} {"train_loss": -41.31484603881836, "global_step": 214791, "epoch": 1775} {"train_loss": -39.26634979248047, "global_step": 214792, "epoch": 1775} {"train_loss": -41.01308059692383, "global_step": 214793, "epoch": 1775} {"train_loss": -41.42436218261719, "global_step": 214794, "epoch": 1775} {"train_loss": -41.24982833862305, "global_step": 214795, "epoch": 1775} {"train_loss": -41.553890228271484, "global_step": 214796, "epoch": 1775} {"train_loss": -40.98853302001953, "global_step": 214797, "epoch": 1775} {"train_loss": -41.45602035522461, "global_step": 214798, "epoch": 1775} {"train_loss": -40.601402282714844, "global_step": 214799, "epoch": 1775} {"train_loss": -41.515316009521484, "global_step": 214800, "epoch": 1775} {"train_loss": -41.289302825927734, "global_step": 214801, "epoch": 1775} {"train_loss": -41.21912384033203, "global_step": 214802, "epoch": 1775} {"train_loss": -41.523658752441406, "global_step": 214803, "epoch": 1775} {"train_loss": -40.809852600097656, "global_step": 214804, "epoch": 1775} {"train_loss": -41.67234420776367, "global_step": 214805, "epoch": 1775} {"train_loss": -41.38028335571289, "global_step": 214806, "epoch": 1775} {"train_loss": -40.828407287597656, "global_step": 214807, "epoch": 1775} {"train_loss": -40.90010452270508, "global_step": 214808, "epoch": 1775} {"train_loss": -41.5478630065918, "global_step": 214809, "epoch": 1775} {"train_loss": -41.3205680847168, "global_step": 214810, "epoch": 1775} {"train_loss": -39.92586898803711, "global_step": 214811, "epoch": 1775} {"train_loss": -40.08860397338867, "global_step": 214812, "epoch": 1775} {"train_loss": -40.575923919677734, "global_step": 214813, "epoch": 1775} {"train_loss": -39.148738861083984, "global_step": 214814, "epoch": 1775} {"train_loss": -39.23662185668945, "global_step": 214815, "epoch": 1775} {"train_loss": -41.00748062133789, "global_step": 214816, "epoch": 1775} {"train_loss": -39.89719772338867, "global_step": 214817, "epoch": 1775} {"train_loss": -38.226749420166016, "global_step": 214818, "epoch": 1775} {"train_loss": -39.30766296386719, "global_step": 214819, "epoch": 1775} {"train_loss": -41.02661895751953, "global_step": 214820, "epoch": 1775} {"train_loss": -41.14816665649414, "global_step": 214821, "epoch": 1775} {"train_loss": -40.18758773803711, "global_step": 214822, "epoch": 1775} {"train_loss": -40.79771041870117, "global_step": 214823, "epoch": 1775} {"train_loss": -41.0813102722168, "global_step": 214824, "epoch": 1775} {"train_loss": -40.92707443237305, "global_step": 214825, "epoch": 1775} {"train_loss": -41.140724182128906, "global_step": 214826, "epoch": 1775} {"train_loss": -40.347042083740234, "global_step": 214827, "epoch": 1775} {"train_loss": -41.06244659423828, "global_step": 214828, "epoch": 1775} {"train_loss": -41.861446380615234, "global_step": 214829, "epoch": 1775} {"train_loss": -41.20988464355469, "global_step": 214830, "epoch": 1775} {"train_loss": -41.292781829833984, "global_step": 214831, "epoch": 1775} {"train_loss": -41.96452713012695, "global_step": 214832, "epoch": 1775} {"train_loss": -41.15863800048828, "global_step": 214833, "epoch": 1775} {"train_loss": -41.96171188354492, "global_step": 214834, "epoch": 1775} {"train_loss": -42.21814727783203, "global_step": 214835, "epoch": 1775} {"train_loss": -42.095577239990234, "global_step": 214836, "epoch": 1775} {"train_loss": -41.56787872314453, "global_step": 214837, "epoch": 1775} {"train_loss": -42.050201416015625, "global_step": 214838, "epoch": 1775} {"train_loss": -42.092830657958984, "global_step": 214839, "epoch": 1775} {"train_loss": -42.225860595703125, "global_step": 214840, "epoch": 1775} {"train_loss": -41.599239349365234, "global_step": 214841, "epoch": 1775} {"train_loss": -41.88972091674805, "global_step": 214842, "epoch": 1775} {"train_loss": -41.80325698852539, "global_step": 214843, "epoch": 1775} {"train_loss": -41.709102630615234, "global_step": 214844, "epoch": 1775} {"train_loss": -41.733489990234375, "global_step": 214845, "epoch": 1775} {"train_loss": -40.61262130737305, "global_step": 214846, "epoch": 1775} {"train_loss": -40.7708625793457, "global_step": 214847, "epoch": 1775} {"train_loss": -41.09419250488281, "global_step": 214848, "epoch": 1775} {"train_loss": -41.17877197265625, "global_step": 214849, "epoch": 1775} {"train_loss": -41.4011344909668, "global_step": 214850, "epoch": 1775} {"train_loss": -41.8957633972168, "global_step": 214851, "epoch": 1775} {"train_loss": -40.8421745300293, "global_step": 214852, "epoch": 1775} {"train_loss": -40.28406524658203, "global_step": 214853, "epoch": 1775} {"train_loss": -41.72610092163086, "global_step": 214854, "epoch": 1775} {"train_loss": -42.079952239990234, "global_step": 214855, "epoch": 1775} {"train_loss": -39.58795166015625, "global_step": 214856, "epoch": 1775} {"train_loss": -40.13698959350586, "global_step": 214857, "epoch": 1775} {"train_loss": -40.09260177612305, "global_step": 214858, "epoch": 1775} {"train_loss": -41.10348892211914, "global_step": 214859, "epoch": 1775} {"train_loss": -41.95956039428711, "global_step": 214860, "epoch": 1775} {"train_loss": -40.041194915771484, "global_step": 214861, "epoch": 1775} {"train_loss": -41.20204162597656, "global_step": 214862, "epoch": 1775} {"train_loss": -41.2069091796875, "global_step": 214863, "epoch": 1775} {"train_loss": -40.55588912963867, "global_step": 214864, "epoch": 1775} {"train_loss": -40.30408477783203, "global_step": 214865, "epoch": 1775} {"train_loss": -41.524505615234375, "global_step": 214866, "epoch": 1775} {"train_loss": -40.5406608581543, "global_step": 214867, "epoch": 1775} {"train_loss": -41.89347457885742, "global_step": 214868, "epoch": 1775} {"train_loss": -40.68992233276367, "global_step": 214869, "epoch": 1775} {"train_loss": -41.263702392578125, "global_step": 214870, "epoch": 1775} {"train_loss": -40.25688171386719, "global_step": 214871, "epoch": 1775} {"train_loss": -40.75636672973633, "global_step": 214872, "epoch": 1775} {"train_loss": -40.781063079833984, "global_step": 214873, "epoch": 1775} {"train_loss": -38.493072509765625, "global_step": 214874, "epoch": 1775} {"train_loss": -40.72709274291992, "global_step": 214875, "epoch": 1775} {"train_loss": -40.51313018798828, "global_step": 214876, "epoch": 1775} {"train_loss": -40.324764251708984, "global_step": 214877, "epoch": 1775} {"train_loss": -39.715545654296875, "global_step": 214878, "epoch": 1775} {"train_loss": -40.9798469543457, "global_step": 214879, "epoch": 1775} {"train_loss": -40.7321662902832, "global_step": 214880, "epoch": 1775} {"train_loss": -41.025726318359375, "global_step": 214881, "epoch": 1775} {"train_loss": -40.8966178894043, "global_step": 214882, "epoch": 1775} {"train_loss": -41.265655517578125, "global_step": 214883, "epoch": 1775} {"train_loss": -41.496368408203125, "global_step": 214884, "epoch": 1775} {"train_loss": -41.2573127746582, "global_step": 214885, "epoch": 1775} {"train_loss": -41.65644836425781, "global_step": 214886, "epoch": 1775} {"train_loss": -41.66943359375, "global_step": 214887, "epoch": 1775} {"train_loss": -40.850616455078125, "global_step": 214888, "epoch": 1775} {"train_loss": -41.80765914916992, "global_step": 214889, "epoch": 1775} {"train_loss": -40.701900482177734, "global_step": 214890, "epoch": 1775} {"train_loss": -41.33563232421875, "global_step": 214891, "epoch": 1775} {"train_loss": -42.44792556762695, "global_step": 214892, "epoch": 1775} {"train_loss": -41.764183044433594, "global_step": 214893, "epoch": 1775} {"train_loss": -41.052406311035156, "global_step": 214894, "epoch": 1775} {"train_loss": -40.937462546608664, "global_step": 214895, "epoch": 1775, "val_loss": 2632919.0} {"train_loss": -40.87161636352539, "global_step": 214896, "epoch": 1776} {"train_loss": -40.656429290771484, "global_step": 214897, "epoch": 1776} {"train_loss": -41.4864616394043, "global_step": 214898, "epoch": 1776} {"train_loss": -41.79204559326172, "global_step": 214899, "epoch": 1776} {"train_loss": -40.66456604003906, "global_step": 214900, "epoch": 1776} {"train_loss": -40.984249114990234, "global_step": 214901, "epoch": 1776} {"train_loss": -40.066890716552734, "global_step": 214902, "epoch": 1776} {"train_loss": -41.82344055175781, "global_step": 214903, "epoch": 1776} {"train_loss": -41.300445556640625, "global_step": 214904, "epoch": 1776} {"train_loss": -41.318756103515625, "global_step": 214905, "epoch": 1776} {"train_loss": -41.181636810302734, "global_step": 214906, "epoch": 1776} {"train_loss": -41.37598419189453, "global_step": 214907, "epoch": 1776} {"train_loss": -40.3092041015625, "global_step": 214908, "epoch": 1776} {"train_loss": -41.631980895996094, "global_step": 214909, "epoch": 1776} {"train_loss": -41.9931755065918, "global_step": 214910, "epoch": 1776} {"train_loss": -41.18158721923828, "global_step": 214911, "epoch": 1776} {"train_loss": -41.428260803222656, "global_step": 214912, "epoch": 1776} {"train_loss": -41.82717514038086, "global_step": 214913, "epoch": 1776} {"train_loss": -41.749107360839844, "global_step": 214914, "epoch": 1776} {"train_loss": -42.057762145996094, "global_step": 214915, "epoch": 1776} {"train_loss": -41.25008010864258, "global_step": 214916, "epoch": 1776} {"train_loss": -41.841064453125, "global_step": 214917, "epoch": 1776} {"train_loss": -41.7761116027832, "global_step": 214918, "epoch": 1776} {"train_loss": -41.83553695678711, "global_step": 214919, "epoch": 1776} {"train_loss": -42.48923873901367, "global_step": 214920, "epoch": 1776} {"train_loss": -42.04713821411133, "global_step": 214921, "epoch": 1776} {"train_loss": -42.1992301940918, "global_step": 214922, "epoch": 1776} {"train_loss": -42.47062301635742, "global_step": 214923, "epoch": 1776} {"train_loss": -41.6442985534668, "global_step": 214924, "epoch": 1776} {"train_loss": -42.03359603881836, "global_step": 214925, "epoch": 1776} {"train_loss": -41.69775390625, "global_step": 214926, "epoch": 1776} {"train_loss": -41.640987396240234, "global_step": 214927, "epoch": 1776} {"train_loss": -40.60274887084961, "global_step": 214928, "epoch": 1776} {"train_loss": -40.7596435546875, "global_step": 214929, "epoch": 1776} {"train_loss": -41.060184478759766, "global_step": 214930, "epoch": 1776} {"train_loss": -40.70988082885742, "global_step": 214931, "epoch": 1776} {"train_loss": -41.6580696105957, "global_step": 214932, "epoch": 1776} {"train_loss": -41.50215148925781, "global_step": 214933, "epoch": 1776} {"train_loss": -39.46173858642578, "global_step": 214934, "epoch": 1776} {"train_loss": -42.149295806884766, "global_step": 214935, "epoch": 1776} {"train_loss": -41.16660690307617, "global_step": 214936, "epoch": 1776} {"train_loss": -40.84189987182617, "global_step": 214937, "epoch": 1776} {"train_loss": -42.24695587158203, "global_step": 214938, "epoch": 1776} {"train_loss": -41.107887268066406, "global_step": 214939, "epoch": 1776} {"train_loss": -40.9033088684082, "global_step": 214940, "epoch": 1776} {"train_loss": -40.344696044921875, "global_step": 214941, "epoch": 1776} {"train_loss": -41.87343978881836, "global_step": 214942, "epoch": 1776} {"train_loss": -39.98992919921875, "global_step": 214943, "epoch": 1776} {"train_loss": -38.44795608520508, "global_step": 214944, "epoch": 1776} {"train_loss": -39.76303482055664, "global_step": 214945, "epoch": 1776} {"train_loss": -41.70809555053711, "global_step": 214946, "epoch": 1776} {"train_loss": -37.948028564453125, "global_step": 214947, "epoch": 1776} {"train_loss": -38.975589752197266, "global_step": 214948, "epoch": 1776} {"train_loss": -40.58518981933594, "global_step": 214949, "epoch": 1776} {"train_loss": -40.51726150512695, "global_step": 214950, "epoch": 1776} {"train_loss": -39.74943542480469, "global_step": 214951, "epoch": 1776} {"train_loss": -39.87261199951172, "global_step": 214952, "epoch": 1776} {"train_loss": -41.003639221191406, "global_step": 214953, "epoch": 1776} {"train_loss": -39.73578643798828, "global_step": 214954, "epoch": 1776} {"train_loss": -40.91449737548828, "global_step": 214955, "epoch": 1776} {"train_loss": -41.41506576538086, "global_step": 214956, "epoch": 1776} {"train_loss": -38.82061004638672, "global_step": 214957, "epoch": 1776} {"train_loss": -40.98653030395508, "global_step": 214958, "epoch": 1776} {"train_loss": -41.23408889770508, "global_step": 214959, "epoch": 1776} {"train_loss": -39.536109924316406, "global_step": 214960, "epoch": 1776} {"train_loss": -42.16481399536133, "global_step": 214961, "epoch": 1776} {"train_loss": -41.12299346923828, "global_step": 214962, "epoch": 1776} {"train_loss": -41.162025451660156, "global_step": 214963, "epoch": 1776} {"train_loss": -42.046607971191406, "global_step": 214964, "epoch": 1776} {"train_loss": -41.75110626220703, "global_step": 214965, "epoch": 1776} {"train_loss": -41.15519332885742, "global_step": 214966, "epoch": 1776} {"train_loss": -38.5915641784668, "global_step": 214967, "epoch": 1776} {"train_loss": -41.17869186401367, "global_step": 214968, "epoch": 1776} {"train_loss": -40.811241149902344, "global_step": 214969, "epoch": 1776} {"train_loss": -40.62128829956055, "global_step": 214970, "epoch": 1776} {"train_loss": -39.08857345581055, "global_step": 214971, "epoch": 1776} {"train_loss": -39.61227798461914, "global_step": 214972, "epoch": 1776} {"train_loss": -38.870391845703125, "global_step": 214973, "epoch": 1776} {"train_loss": -38.00634765625, "global_step": 214974, "epoch": 1776} {"train_loss": -41.3355598449707, "global_step": 214975, "epoch": 1776} {"train_loss": -37.445350646972656, "global_step": 214976, "epoch": 1776} {"train_loss": -36.463348388671875, "global_step": 214977, "epoch": 1776} {"train_loss": -40.48769760131836, "global_step": 214978, "epoch": 1776} {"train_loss": -38.740867614746094, "global_step": 214979, "epoch": 1776} {"train_loss": -37.525794982910156, "global_step": 214980, "epoch": 1776} {"train_loss": -40.22422790527344, "global_step": 214981, "epoch": 1776} {"train_loss": -37.902557373046875, "global_step": 214982, "epoch": 1776} {"train_loss": -35.705936431884766, "global_step": 214983, "epoch": 1776} {"train_loss": -37.214447021484375, "global_step": 214984, "epoch": 1776} {"train_loss": -37.70638656616211, "global_step": 214985, "epoch": 1776} {"train_loss": -39.9416618347168, "global_step": 214986, "epoch": 1776} {"train_loss": -39.08662414550781, "global_step": 214987, "epoch": 1776} {"train_loss": -37.46477127075195, "global_step": 214988, "epoch": 1776} {"train_loss": -35.87578201293945, "global_step": 214989, "epoch": 1776} {"train_loss": -40.079132080078125, "global_step": 214990, "epoch": 1776} {"train_loss": -34.698341369628906, "global_step": 214991, "epoch": 1776} {"train_loss": -39.29307556152344, "global_step": 214992, "epoch": 1776} {"train_loss": -38.02444076538086, "global_step": 214993, "epoch": 1776} {"train_loss": -39.95277786254883, "global_step": 214994, "epoch": 1776} {"train_loss": -40.19856643676758, "global_step": 214995, "epoch": 1776} {"train_loss": -37.467071533203125, "global_step": 214996, "epoch": 1776} {"train_loss": -37.188961029052734, "global_step": 214997, "epoch": 1776} {"train_loss": -39.06814193725586, "global_step": 214998, "epoch": 1776} {"train_loss": -36.34101104736328, "global_step": 214999, "epoch": 1776} {"train_loss": -34.89204406738281, "global_step": 215000, "epoch": 1776} {"train_loss": -36.48380661010742, "global_step": 215001, "epoch": 1776} {"train_loss": -38.48029708862305, "global_step": 215002, "epoch": 1776} {"train_loss": -39.493587493896484, "global_step": 215003, "epoch": 1776} {"train_loss": -39.19215774536133, "global_step": 215004, "epoch": 1776} {"train_loss": -38.295860290527344, "global_step": 215005, "epoch": 1776} {"train_loss": -36.6515007019043, "global_step": 215006, "epoch": 1776} {"train_loss": -36.317806243896484, "global_step": 215007, "epoch": 1776} {"train_loss": -39.197444915771484, "global_step": 215008, "epoch": 1776} {"train_loss": -39.464576721191406, "global_step": 215009, "epoch": 1776} {"train_loss": -38.624080657958984, "global_step": 215010, "epoch": 1776} {"train_loss": -38.20917510986328, "global_step": 215011, "epoch": 1776} {"train_loss": -39.349666595458984, "global_step": 215012, "epoch": 1776} {"train_loss": -35.888282775878906, "global_step": 215013, "epoch": 1776} {"train_loss": -38.62118148803711, "global_step": 215014, "epoch": 1776} {"train_loss": -39.88716506958008, "global_step": 215015, "epoch": 1776} {"train_loss": -39.97026553823928, "global_step": 215016, "epoch": 1776, "val_loss": 2560409.75} {"train_loss": -37.003326416015625, "global_step": 215017, "epoch": 1777} {"train_loss": -40.066165924072266, "global_step": 215018, "epoch": 1777} {"train_loss": -40.798561096191406, "global_step": 215019, "epoch": 1777} {"train_loss": -39.053279876708984, "global_step": 215020, "epoch": 1777} {"train_loss": -39.69767379760742, "global_step": 215021, "epoch": 1777} {"train_loss": -39.73345184326172, "global_step": 215022, "epoch": 1777} {"train_loss": -34.25160598754883, "global_step": 215023, "epoch": 1777} {"train_loss": -38.7298469543457, "global_step": 215024, "epoch": 1777} {"train_loss": -39.52599334716797, "global_step": 215025, "epoch": 1777} {"train_loss": -39.743690490722656, "global_step": 215026, "epoch": 1777} {"train_loss": -38.52877426147461, "global_step": 215027, "epoch": 1777} {"train_loss": -36.925636291503906, "global_step": 215028, "epoch": 1777} {"train_loss": -40.14617919921875, "global_step": 215029, "epoch": 1777} {"train_loss": -40.22498321533203, "global_step": 215030, "epoch": 1777} {"train_loss": -38.60877990722656, "global_step": 215031, "epoch": 1777} {"train_loss": -39.48682403564453, "global_step": 215032, "epoch": 1777} {"train_loss": -35.82564163208008, "global_step": 215033, "epoch": 1777} {"train_loss": -38.153255462646484, "global_step": 215034, "epoch": 1777} {"train_loss": -38.13096237182617, "global_step": 215035, "epoch": 1777} {"train_loss": -37.99178695678711, "global_step": 215036, "epoch": 1777} {"train_loss": -36.348995208740234, "global_step": 215037, "epoch": 1777} {"train_loss": -39.214229583740234, "global_step": 215038, "epoch": 1777} {"train_loss": -39.58869552612305, "global_step": 215039, "epoch": 1777} {"train_loss": -36.635032653808594, "global_step": 215040, "epoch": 1777} {"train_loss": -38.18404006958008, "global_step": 215041, "epoch": 1777} {"train_loss": -22.742162704467773, "global_step": 215042, "epoch": 1777} {"train_loss": -31.715356826782227, "global_step": 215043, "epoch": 1777} {"train_loss": -39.76214599609375, "global_step": 215044, "epoch": 1777} {"train_loss": -37.54212188720703, "global_step": 215045, "epoch": 1777} {"train_loss": -30.342390060424805, "global_step": 215046, "epoch": 1777} {"train_loss": -15.415826797485352, "global_step": 215047, "epoch": 1777} {"train_loss": -30.266529083251953, "global_step": 215048, "epoch": 1777} {"train_loss": -35.83002853393555, "global_step": 215049, "epoch": 1777} {"train_loss": -33.90047073364258, "global_step": 215050, "epoch": 1777} {"train_loss": -34.59504318237305, "global_step": 215051, "epoch": 1777} {"train_loss": -35.696861267089844, "global_step": 215052, "epoch": 1777} {"train_loss": -35.92478561401367, "global_step": 215053, "epoch": 1777} {"train_loss": -24.498830795288086, "global_step": 215054, "epoch": 1777} {"train_loss": -30.383756637573242, "global_step": 215055, "epoch": 1777} {"train_loss": -35.8082389831543, "global_step": 215056, "epoch": 1777} {"train_loss": -28.450056076049805, "global_step": 215057, "epoch": 1777} {"train_loss": -34.154476165771484, "global_step": 215058, "epoch": 1777} {"train_loss": -33.805755615234375, "global_step": 215059, "epoch": 1777} {"train_loss": -22.545852661132812, "global_step": 215060, "epoch": 1777} {"train_loss": -32.309234619140625, "global_step": 215061, "epoch": 1777} {"train_loss": -36.809364318847656, "global_step": 215062, "epoch": 1777} {"train_loss": -36.674110412597656, "global_step": 215063, "epoch": 1777} {"train_loss": -36.40761184692383, "global_step": 215064, "epoch": 1777} {"train_loss": -33.386539459228516, "global_step": 215065, "epoch": 1777} {"train_loss": -35.1651725769043, "global_step": 215066, "epoch": 1777} {"train_loss": -32.731285095214844, "global_step": 215067, "epoch": 1777} {"train_loss": -35.5728874206543, "global_step": 215068, "epoch": 1777} {"train_loss": -36.428802490234375, "global_step": 215069, "epoch": 1777} {"train_loss": -34.858848571777344, "global_step": 215070, "epoch": 1777} {"train_loss": -36.21442413330078, "global_step": 215071, "epoch": 1777} {"train_loss": -37.14626693725586, "global_step": 215072, "epoch": 1777} {"train_loss": -36.25265121459961, "global_step": 215073, "epoch": 1777} {"train_loss": -35.745174407958984, "global_step": 215074, "epoch": 1777} {"train_loss": -37.00027084350586, "global_step": 215075, "epoch": 1777} {"train_loss": -37.81956100463867, "global_step": 215076, "epoch": 1777} {"train_loss": -36.669071197509766, "global_step": 215077, "epoch": 1777} {"train_loss": -36.2514533996582, "global_step": 215078, "epoch": 1777} {"train_loss": -36.84345626831055, "global_step": 215079, "epoch": 1777} {"train_loss": -38.03921127319336, "global_step": 215080, "epoch": 1777} {"train_loss": -37.66961669921875, "global_step": 215081, "epoch": 1777} {"train_loss": -37.79194259643555, "global_step": 215082, "epoch": 1777} {"train_loss": -37.47690200805664, "global_step": 215083, "epoch": 1777} {"train_loss": -37.25635528564453, "global_step": 215084, "epoch": 1777} {"train_loss": -36.429718017578125, "global_step": 215085, "epoch": 1777} {"train_loss": -37.795745849609375, "global_step": 215086, "epoch": 1777} {"train_loss": -37.97407150268555, "global_step": 215087, "epoch": 1777} {"train_loss": -37.63909912109375, "global_step": 215088, "epoch": 1777} {"train_loss": -38.49824142456055, "global_step": 215089, "epoch": 1777} {"train_loss": -38.394073486328125, "global_step": 215090, "epoch": 1777} {"train_loss": -37.75754928588867, "global_step": 215091, "epoch": 1777} {"train_loss": -38.42884826660156, "global_step": 215092, "epoch": 1777} {"train_loss": -38.60551834106445, "global_step": 215093, "epoch": 1777} {"train_loss": -38.58331298828125, "global_step": 215094, "epoch": 1777} {"train_loss": -38.06254196166992, "global_step": 215095, "epoch": 1777} {"train_loss": -38.75287628173828, "global_step": 215096, "epoch": 1777} {"train_loss": -38.66394805908203, "global_step": 215097, "epoch": 1777} {"train_loss": -39.07685852050781, "global_step": 215098, "epoch": 1777} {"train_loss": -38.9720573425293, "global_step": 215099, "epoch": 1777} {"train_loss": -38.91030502319336, "global_step": 215100, "epoch": 1777} {"train_loss": -38.78038787841797, "global_step": 215101, "epoch": 1777} {"train_loss": -38.49066925048828, "global_step": 215102, "epoch": 1777} {"train_loss": -38.94353103637695, "global_step": 215103, "epoch": 1777} {"train_loss": -38.45658493041992, "global_step": 215104, "epoch": 1777} {"train_loss": -39.02180099487305, "global_step": 215105, "epoch": 1777} {"train_loss": -38.877925872802734, "global_step": 215106, "epoch": 1777} {"train_loss": -38.77941131591797, "global_step": 215107, "epoch": 1777} {"train_loss": -39.52617263793945, "global_step": 215108, "epoch": 1777} {"train_loss": -38.5692253112793, "global_step": 215109, "epoch": 1777} {"train_loss": -39.56719207763672, "global_step": 215110, "epoch": 1777} {"train_loss": -39.16401290893555, "global_step": 215111, "epoch": 1777} {"train_loss": -38.577491760253906, "global_step": 215112, "epoch": 1777} {"train_loss": -38.997581481933594, "global_step": 215113, "epoch": 1777} {"train_loss": -39.24213409423828, "global_step": 215114, "epoch": 1777} {"train_loss": -39.59218978881836, "global_step": 215115, "epoch": 1777} {"train_loss": -39.546722412109375, "global_step": 215116, "epoch": 1777} {"train_loss": -39.47892379760742, "global_step": 215117, "epoch": 1777} {"train_loss": -40.01448059082031, "global_step": 215118, "epoch": 1777} {"train_loss": -39.25409698486328, "global_step": 215119, "epoch": 1777} {"train_loss": -39.5229377746582, "global_step": 215120, "epoch": 1777} {"train_loss": -39.567420959472656, "global_step": 215121, "epoch": 1777} {"train_loss": -39.437904357910156, "global_step": 215122, "epoch": 1777} {"train_loss": -39.05440139770508, "global_step": 215123, "epoch": 1777} {"train_loss": -39.591793060302734, "global_step": 215124, "epoch": 1777} {"train_loss": -40.22190475463867, "global_step": 215125, "epoch": 1777} {"train_loss": -40.18283462524414, "global_step": 215126, "epoch": 1777} {"train_loss": -39.49812698364258, "global_step": 215127, "epoch": 1777} {"train_loss": -39.95046615600586, "global_step": 215128, "epoch": 1777} {"train_loss": -39.54949188232422, "global_step": 215129, "epoch": 1777} {"train_loss": -40.099544525146484, "global_step": 215130, "epoch": 1777} {"train_loss": -39.98427200317383, "global_step": 215131, "epoch": 1777} {"train_loss": -39.84930419921875, "global_step": 215132, "epoch": 1777} {"train_loss": -39.628814697265625, "global_step": 215133, "epoch": 1777} {"train_loss": -40.15338134765625, "global_step": 215134, "epoch": 1777} {"train_loss": -40.12251281738281, "global_step": 215135, "epoch": 1777} {"train_loss": -40.57773971557617, "global_step": 215136, "epoch": 1777} {"train_loss": -37.167911671409925, "global_step": 215137, "epoch": 1777, "val_loss": 2707170.25} {"train_loss": -40.2065315246582, "global_step": 215138, "epoch": 1778} {"train_loss": -40.54879379272461, "global_step": 215139, "epoch": 1778} {"train_loss": -40.87160873413086, "global_step": 215140, "epoch": 1778} {"train_loss": -40.55209732055664, "global_step": 215141, "epoch": 1778} {"train_loss": -40.30137634277344, "global_step": 215142, "epoch": 1778} {"train_loss": -40.59716033935547, "global_step": 215143, "epoch": 1778} {"train_loss": -40.178409576416016, "global_step": 215144, "epoch": 1778} {"train_loss": -40.60383224487305, "global_step": 215145, "epoch": 1778} {"train_loss": -40.78392028808594, "global_step": 215146, "epoch": 1778} {"train_loss": -39.66122055053711, "global_step": 215147, "epoch": 1778} {"train_loss": -40.65005874633789, "global_step": 215148, "epoch": 1778} {"train_loss": -40.28026580810547, "global_step": 215149, "epoch": 1778} {"train_loss": -40.6702880859375, "global_step": 215150, "epoch": 1778} {"train_loss": -40.693180084228516, "global_step": 215151, "epoch": 1778} {"train_loss": -40.99885559082031, "global_step": 215152, "epoch": 1778} {"train_loss": -40.29822540283203, "global_step": 215153, "epoch": 1778} {"train_loss": -41.20327377319336, "global_step": 215154, "epoch": 1778} {"train_loss": -40.934505462646484, "global_step": 215155, "epoch": 1778} {"train_loss": -41.01410675048828, "global_step": 215156, "epoch": 1778} {"train_loss": -40.675540924072266, "global_step": 215157, "epoch": 1778} {"train_loss": -40.545753479003906, "global_step": 215158, "epoch": 1778} {"train_loss": -40.84027862548828, "global_step": 215159, "epoch": 1778} {"train_loss": -40.80692672729492, "global_step": 215160, "epoch": 1778} {"train_loss": -40.443660736083984, "global_step": 215161, "epoch": 1778} {"train_loss": -40.8728141784668, "global_step": 215162, "epoch": 1778} {"train_loss": -41.14760971069336, "global_step": 215163, "epoch": 1778} {"train_loss": -40.99359130859375, "global_step": 215164, "epoch": 1778} {"train_loss": -40.57338333129883, "global_step": 215165, "epoch": 1778} {"train_loss": -40.82595443725586, "global_step": 215166, "epoch": 1778} {"train_loss": -40.84811019897461, "global_step": 215167, "epoch": 1778} {"train_loss": -40.5817985534668, "global_step": 215168, "epoch": 1778} {"train_loss": -40.90591049194336, "global_step": 215169, "epoch": 1778} {"train_loss": -40.74227523803711, "global_step": 215170, "epoch": 1778} {"train_loss": -40.5850944519043, "global_step": 215171, "epoch": 1778} {"train_loss": -40.819435119628906, "global_step": 215172, "epoch": 1778} {"train_loss": -40.834835052490234, "global_step": 215173, "epoch": 1778} {"train_loss": -40.98043441772461, "global_step": 215174, "epoch": 1778} {"train_loss": -40.350704193115234, "global_step": 215175, "epoch": 1778} {"train_loss": -41.36955642700195, "global_step": 215176, "epoch": 1778} {"train_loss": -41.294044494628906, "global_step": 215177, "epoch": 1778} {"train_loss": -40.42167282104492, "global_step": 215178, "epoch": 1778} {"train_loss": -41.08837890625, "global_step": 215179, "epoch": 1778} {"train_loss": -40.502113342285156, "global_step": 215180, "epoch": 1778} {"train_loss": -41.27315902709961, "global_step": 215181, "epoch": 1778} {"train_loss": -40.709625244140625, "global_step": 215182, "epoch": 1778} {"train_loss": -41.30598831176758, "global_step": 215183, "epoch": 1778} {"train_loss": -40.93918991088867, "global_step": 215184, "epoch": 1778} {"train_loss": -41.028507232666016, "global_step": 215185, "epoch": 1778} {"train_loss": -41.16782760620117, "global_step": 215186, "epoch": 1778} {"train_loss": -41.05463409423828, "global_step": 215187, "epoch": 1778} {"train_loss": -40.66625213623047, "global_step": 215188, "epoch": 1778} {"train_loss": -40.3376350402832, "global_step": 215189, "epoch": 1778} {"train_loss": -41.498291015625, "global_step": 215190, "epoch": 1778} {"train_loss": -41.38917541503906, "global_step": 215191, "epoch": 1778} {"train_loss": -40.681983947753906, "global_step": 215192, "epoch": 1778} {"train_loss": -41.323638916015625, "global_step": 215193, "epoch": 1778} {"train_loss": -41.35201644897461, "global_step": 215194, "epoch": 1778} {"train_loss": -39.7585334777832, "global_step": 215195, "epoch": 1778} {"train_loss": -40.71479797363281, "global_step": 215196, "epoch": 1778} {"train_loss": -41.12688064575195, "global_step": 215197, "epoch": 1778} {"train_loss": -41.06171417236328, "global_step": 215198, "epoch": 1778} {"train_loss": -41.423824310302734, "global_step": 215199, "epoch": 1778} {"train_loss": -40.95634078979492, "global_step": 215200, "epoch": 1778} {"train_loss": -41.06313705444336, "global_step": 215201, "epoch": 1778} {"train_loss": -40.4176025390625, "global_step": 215202, "epoch": 1778} {"train_loss": -41.2795524597168, "global_step": 215203, "epoch": 1778} {"train_loss": -41.27297592163086, "global_step": 215204, "epoch": 1778} {"train_loss": -40.749267578125, "global_step": 215205, "epoch": 1778} {"train_loss": -41.121952056884766, "global_step": 215206, "epoch": 1778} {"train_loss": -40.94599533081055, "global_step": 215207, "epoch": 1778} {"train_loss": -41.04825973510742, "global_step": 215208, "epoch": 1778} {"train_loss": -40.463253021240234, "global_step": 215209, "epoch": 1778} {"train_loss": -41.172752380371094, "global_step": 215210, "epoch": 1778} {"train_loss": -40.76763153076172, "global_step": 215211, "epoch": 1778} {"train_loss": -38.29182815551758, "global_step": 215212, "epoch": 1778} {"train_loss": -32.36400604248047, "global_step": 215213, "epoch": 1778} {"train_loss": -32.293304443359375, "global_step": 215214, "epoch": 1778} {"train_loss": -34.6343994140625, "global_step": 215215, "epoch": 1778} {"train_loss": -36.16550064086914, "global_step": 215216, "epoch": 1778} {"train_loss": -38.6014289855957, "global_step": 215217, "epoch": 1778} {"train_loss": -36.65255355834961, "global_step": 215218, "epoch": 1778} {"train_loss": -40.12528610229492, "global_step": 215219, "epoch": 1778} {"train_loss": -39.048797607421875, "global_step": 215220, "epoch": 1778} {"train_loss": -39.92116928100586, "global_step": 215221, "epoch": 1778} {"train_loss": -39.5629997253418, "global_step": 215222, "epoch": 1778} {"train_loss": -38.502315521240234, "global_step": 215223, "epoch": 1778} {"train_loss": -38.75028610229492, "global_step": 215224, "epoch": 1778} {"train_loss": -37.73846435546875, "global_step": 215225, "epoch": 1778} {"train_loss": -39.505859375, "global_step": 215226, "epoch": 1778} {"train_loss": -38.801025390625, "global_step": 215227, "epoch": 1778} {"train_loss": -39.91456604003906, "global_step": 215228, "epoch": 1778} {"train_loss": -38.574493408203125, "global_step": 215229, "epoch": 1778} {"train_loss": -39.99101638793945, "global_step": 215230, "epoch": 1778} {"train_loss": -39.1749382019043, "global_step": 215231, "epoch": 1778} {"train_loss": -39.6660041809082, "global_step": 215232, "epoch": 1778} {"train_loss": -40.49103927612305, "global_step": 215233, "epoch": 1778} {"train_loss": -39.74143600463867, "global_step": 215234, "epoch": 1778} {"train_loss": -40.49293899536133, "global_step": 215235, "epoch": 1778} {"train_loss": -39.86782455444336, "global_step": 215236, "epoch": 1778} {"train_loss": -40.45979690551758, "global_step": 215237, "epoch": 1778} {"train_loss": -39.40994644165039, "global_step": 215238, "epoch": 1778} {"train_loss": -40.53802490234375, "global_step": 215239, "epoch": 1778} {"train_loss": -40.54195022583008, "global_step": 215240, "epoch": 1778} {"train_loss": -39.958282470703125, "global_step": 215241, "epoch": 1778} {"train_loss": -41.11048126220703, "global_step": 215242, "epoch": 1778} {"train_loss": -41.086402893066406, "global_step": 215243, "epoch": 1778} {"train_loss": -40.00978469848633, "global_step": 215244, "epoch": 1778} {"train_loss": -41.176971435546875, "global_step": 215245, "epoch": 1778} {"train_loss": -40.58198928833008, "global_step": 215246, "epoch": 1778} {"train_loss": -39.6383171081543, "global_step": 215247, "epoch": 1778} {"train_loss": -40.8192253112793, "global_step": 215248, "epoch": 1778} {"train_loss": -41.38540267944336, "global_step": 215249, "epoch": 1778} {"train_loss": -39.874794006347656, "global_step": 215250, "epoch": 1778} {"train_loss": -41.019893646240234, "global_step": 215251, "epoch": 1778} {"train_loss": -40.722896575927734, "global_step": 215252, "epoch": 1778} {"train_loss": -40.62858200073242, "global_step": 215253, "epoch": 1778} {"train_loss": -41.414772033691406, "global_step": 215254, "epoch": 1778} {"train_loss": -41.31521224975586, "global_step": 215255, "epoch": 1778} {"train_loss": -41.01268768310547, "global_step": 215256, "epoch": 1778} {"train_loss": -40.977413177490234, "global_step": 215257, "epoch": 1778} {"train_loss": -40.2782970144729, "global_step": 215258, "epoch": 1778, "val_loss": 2599072.0} {"train_loss": -41.21075439453125, "global_step": 215259, "epoch": 1779} {"train_loss": -41.35272979736328, "global_step": 215260, "epoch": 1779} {"train_loss": -41.78072738647461, "global_step": 215261, "epoch": 1779} {"train_loss": -41.999053955078125, "global_step": 215262, "epoch": 1779} {"train_loss": -41.491024017333984, "global_step": 215263, "epoch": 1779} {"train_loss": -41.86890411376953, "global_step": 215264, "epoch": 1779} {"train_loss": -41.91340255737305, "global_step": 215265, "epoch": 1779} {"train_loss": -41.183589935302734, "global_step": 215266, "epoch": 1779} {"train_loss": -41.384403228759766, "global_step": 215267, "epoch": 1779} {"train_loss": -41.461158752441406, "global_step": 215268, "epoch": 1779} {"train_loss": -42.18682861328125, "global_step": 215269, "epoch": 1779} {"train_loss": -41.134700775146484, "global_step": 215270, "epoch": 1779} {"train_loss": -40.60237121582031, "global_step": 215271, "epoch": 1779} {"train_loss": -41.7774772644043, "global_step": 215272, "epoch": 1779} {"train_loss": -41.926876068115234, "global_step": 215273, "epoch": 1779} {"train_loss": -41.22846221923828, "global_step": 215274, "epoch": 1779} {"train_loss": -41.53701400756836, "global_step": 215275, "epoch": 1779} {"train_loss": -41.69756317138672, "global_step": 215276, "epoch": 1779} {"train_loss": -41.69267272949219, "global_step": 215277, "epoch": 1779} {"train_loss": -41.68598175048828, "global_step": 215278, "epoch": 1779} {"train_loss": -42.00751876831055, "global_step": 215279, "epoch": 1779} {"train_loss": -42.1776237487793, "global_step": 215280, "epoch": 1779} {"train_loss": -41.674800872802734, "global_step": 215281, "epoch": 1779} {"train_loss": -41.51695251464844, "global_step": 215282, "epoch": 1779} {"train_loss": -42.15582275390625, "global_step": 215283, "epoch": 1779} {"train_loss": -41.861106872558594, "global_step": 215284, "epoch": 1779} {"train_loss": -41.02376174926758, "global_step": 215285, "epoch": 1779} {"train_loss": -41.56702423095703, "global_step": 215286, "epoch": 1779} {"train_loss": -42.1249885559082, "global_step": 215287, "epoch": 1779} {"train_loss": -42.47917556762695, "global_step": 215288, "epoch": 1779} {"train_loss": -41.450836181640625, "global_step": 215289, "epoch": 1779} {"train_loss": -41.886592864990234, "global_step": 215290, "epoch": 1779} {"train_loss": -41.44646072387695, "global_step": 215291, "epoch": 1779} {"train_loss": -41.38082504272461, "global_step": 215292, "epoch": 1779} {"train_loss": -41.982391357421875, "global_step": 215293, "epoch": 1779} {"train_loss": -42.53211212158203, "global_step": 215294, "epoch": 1779} {"train_loss": -41.99058151245117, "global_step": 215295, "epoch": 1779} {"train_loss": -42.20587921142578, "global_step": 215296, "epoch": 1779} {"train_loss": -42.73708724975586, "global_step": 215297, "epoch": 1779} {"train_loss": -42.53438949584961, "global_step": 215298, "epoch": 1779} {"train_loss": -42.17790603637695, "global_step": 215299, "epoch": 1779} {"train_loss": -41.90913009643555, "global_step": 215300, "epoch": 1779} {"train_loss": -41.497554779052734, "global_step": 215301, "epoch": 1779} {"train_loss": -42.400577545166016, "global_step": 215302, "epoch": 1779} {"train_loss": -42.1652946472168, "global_step": 215303, "epoch": 1779} {"train_loss": -41.94657516479492, "global_step": 215304, "epoch": 1779} {"train_loss": -41.439205169677734, "global_step": 215305, "epoch": 1779} {"train_loss": -41.67033004760742, "global_step": 215306, "epoch": 1779} {"train_loss": -40.898075103759766, "global_step": 215307, "epoch": 1779} {"train_loss": -40.03804397583008, "global_step": 215308, "epoch": 1779} {"train_loss": -41.382694244384766, "global_step": 215309, "epoch": 1779} {"train_loss": -41.688819885253906, "global_step": 215310, "epoch": 1779} {"train_loss": -40.51447296142578, "global_step": 215311, "epoch": 1779} {"train_loss": -37.003135681152344, "global_step": 215312, "epoch": 1779} {"train_loss": -36.71455001831055, "global_step": 215313, "epoch": 1779} {"train_loss": -37.628273010253906, "global_step": 215314, "epoch": 1779} {"train_loss": -37.45449447631836, "global_step": 215315, "epoch": 1779} {"train_loss": -40.4307746887207, "global_step": 215316, "epoch": 1779} {"train_loss": -34.054073333740234, "global_step": 215317, "epoch": 1779} {"train_loss": -34.890899658203125, "global_step": 215318, "epoch": 1779} {"train_loss": -33.01057052612305, "global_step": 215319, "epoch": 1779} {"train_loss": -31.095117568969727, "global_step": 215320, "epoch": 1779} {"train_loss": -39.89234924316406, "global_step": 215321, "epoch": 1779} {"train_loss": -31.763959884643555, "global_step": 215322, "epoch": 1779} {"train_loss": -35.01057434082031, "global_step": 215323, "epoch": 1779} {"train_loss": -32.209957122802734, "global_step": 215324, "epoch": 1779} {"train_loss": -36.62269592285156, "global_step": 215325, "epoch": 1779} {"train_loss": -37.893672943115234, "global_step": 215326, "epoch": 1779} {"train_loss": -33.47306442260742, "global_step": 215327, "epoch": 1779} {"train_loss": -39.6131591796875, "global_step": 215328, "epoch": 1779} {"train_loss": -37.74139404296875, "global_step": 215329, "epoch": 1779} {"train_loss": -35.432682037353516, "global_step": 215330, "epoch": 1779} {"train_loss": -40.25814437866211, "global_step": 215331, "epoch": 1779} {"train_loss": -37.1486930847168, "global_step": 215332, "epoch": 1779} {"train_loss": -38.97565460205078, "global_step": 215333, "epoch": 1779} {"train_loss": -39.393184661865234, "global_step": 215334, "epoch": 1779} {"train_loss": -38.8532600402832, "global_step": 215335, "epoch": 1779} {"train_loss": -38.727203369140625, "global_step": 215336, "epoch": 1779} {"train_loss": -39.495948791503906, "global_step": 215337, "epoch": 1779} {"train_loss": -40.1215934753418, "global_step": 215338, "epoch": 1779} {"train_loss": -38.03082275390625, "global_step": 215339, "epoch": 1779} {"train_loss": -40.33755874633789, "global_step": 215340, "epoch": 1779} {"train_loss": -39.58723449707031, "global_step": 215341, "epoch": 1779} {"train_loss": -39.253448486328125, "global_step": 215342, "epoch": 1779} {"train_loss": -39.380126953125, "global_step": 215343, "epoch": 1779} {"train_loss": -40.6494255065918, "global_step": 215344, "epoch": 1779} {"train_loss": -39.897098541259766, "global_step": 215345, "epoch": 1779} {"train_loss": -39.47876739501953, "global_step": 215346, "epoch": 1779} {"train_loss": -40.669551849365234, "global_step": 215347, "epoch": 1779} {"train_loss": -40.38141632080078, "global_step": 215348, "epoch": 1779} {"train_loss": -40.712921142578125, "global_step": 215349, "epoch": 1779} {"train_loss": -40.78584671020508, "global_step": 215350, "epoch": 1779} {"train_loss": -41.60709762573242, "global_step": 215351, "epoch": 1779} {"train_loss": -40.639217376708984, "global_step": 215352, "epoch": 1779} {"train_loss": -39.74128341674805, "global_step": 215353, "epoch": 1779} {"train_loss": -40.881431579589844, "global_step": 215354, "epoch": 1779} {"train_loss": -40.82472610473633, "global_step": 215355, "epoch": 1779} {"train_loss": -40.64493942260742, "global_step": 215356, "epoch": 1779} {"train_loss": -41.37887191772461, "global_step": 215357, "epoch": 1779} {"train_loss": -40.78618240356445, "global_step": 215358, "epoch": 1779} {"train_loss": -41.278297424316406, "global_step": 215359, "epoch": 1779} {"train_loss": -41.08102035522461, "global_step": 215360, "epoch": 1779} {"train_loss": -41.673980712890625, "global_step": 215361, "epoch": 1779} {"train_loss": -40.57310104370117, "global_step": 215362, "epoch": 1779} {"train_loss": -41.00468826293945, "global_step": 215363, "epoch": 1779} {"train_loss": -40.90460968017578, "global_step": 215364, "epoch": 1779} {"train_loss": -41.38985824584961, "global_step": 215365, "epoch": 1779} {"train_loss": -40.95222091674805, "global_step": 215366, "epoch": 1779} {"train_loss": -41.7586784362793, "global_step": 215367, "epoch": 1779} {"train_loss": -41.55076217651367, "global_step": 215368, "epoch": 1779} {"train_loss": -41.56589889526367, "global_step": 215369, "epoch": 1779} {"train_loss": -41.70437240600586, "global_step": 215370, "epoch": 1779} {"train_loss": -41.67832565307617, "global_step": 215371, "epoch": 1779} {"train_loss": -41.901546478271484, "global_step": 215372, "epoch": 1779} {"train_loss": -41.2512092590332, "global_step": 215373, "epoch": 1779} {"train_loss": -42.03779602050781, "global_step": 215374, "epoch": 1779} {"train_loss": -41.70502471923828, "global_step": 215375, "epoch": 1779} {"train_loss": -41.62284469604492, "global_step": 215376, "epoch": 1779} {"train_loss": -41.709632873535156, "global_step": 215377, "epoch": 1779} {"train_loss": -41.856605529785156, "global_step": 215378, "epoch": 1779} {"train_loss": -40.338611791941744, "global_step": 215379, "epoch": 1779, "val_loss": 2694202.25} {"train_loss": -41.90748596191406, "global_step": 215380, "epoch": 1780} {"train_loss": -42.388179779052734, "global_step": 215381, "epoch": 1780} {"train_loss": -42.00509262084961, "global_step": 215382, "epoch": 1780} {"train_loss": -42.43213653564453, "global_step": 215383, "epoch": 1780} {"train_loss": -42.09047317504883, "global_step": 215384, "epoch": 1780} {"train_loss": -41.96015167236328, "global_step": 215385, "epoch": 1780} {"train_loss": -42.15870666503906, "global_step": 215386, "epoch": 1780} {"train_loss": -41.93539047241211, "global_step": 215387, "epoch": 1780} {"train_loss": -42.277801513671875, "global_step": 215388, "epoch": 1780} {"train_loss": -42.15604782104492, "global_step": 215389, "epoch": 1780} {"train_loss": -42.44933319091797, "global_step": 215390, "epoch": 1780} {"train_loss": -42.294342041015625, "global_step": 215391, "epoch": 1780} {"train_loss": -41.88454055786133, "global_step": 215392, "epoch": 1780} {"train_loss": -42.03786849975586, "global_step": 215393, "epoch": 1780} {"train_loss": -42.18387222290039, "global_step": 215394, "epoch": 1780} {"train_loss": -42.0563850402832, "global_step": 215395, "epoch": 1780} {"train_loss": -42.20627212524414, "global_step": 215396, "epoch": 1780} {"train_loss": -42.283565521240234, "global_step": 215397, "epoch": 1780} {"train_loss": -42.7724609375, "global_step": 215398, "epoch": 1780} {"train_loss": -42.564266204833984, "global_step": 215399, "epoch": 1780} {"train_loss": -42.71683883666992, "global_step": 215400, "epoch": 1780} {"train_loss": -42.5798454284668, "global_step": 215401, "epoch": 1780} {"train_loss": -41.97634506225586, "global_step": 215402, "epoch": 1780} {"train_loss": -41.67155838012695, "global_step": 215403, "epoch": 1780} {"train_loss": -42.24421310424805, "global_step": 215404, "epoch": 1780} {"train_loss": -42.21443557739258, "global_step": 215405, "epoch": 1780} {"train_loss": -42.35387420654297, "global_step": 215406, "epoch": 1780} {"train_loss": -42.78239059448242, "global_step": 215407, "epoch": 1780} {"train_loss": -42.862274169921875, "global_step": 215408, "epoch": 1780} {"train_loss": -42.6790885925293, "global_step": 215409, "epoch": 1780} {"train_loss": -41.71319580078125, "global_step": 215410, "epoch": 1780} {"train_loss": -40.00189208984375, "global_step": 215411, "epoch": 1780} {"train_loss": -36.522090911865234, "global_step": 215412, "epoch": 1780} {"train_loss": -31.62977409362793, "global_step": 215413, "epoch": 1780} {"train_loss": -36.18333053588867, "global_step": 215414, "epoch": 1780} {"train_loss": -40.90485763549805, "global_step": 215415, "epoch": 1780} {"train_loss": -38.667205810546875, "global_step": 215416, "epoch": 1780} {"train_loss": -36.50852584838867, "global_step": 215417, "epoch": 1780} {"train_loss": -41.47636032104492, "global_step": 215418, "epoch": 1780} {"train_loss": -38.65792465209961, "global_step": 215419, "epoch": 1780} {"train_loss": -36.144039154052734, "global_step": 215420, "epoch": 1780} {"train_loss": -40.93854904174805, "global_step": 215421, "epoch": 1780} {"train_loss": -38.01194381713867, "global_step": 215422, "epoch": 1780} {"train_loss": -39.515953063964844, "global_step": 215423, "epoch": 1780} {"train_loss": -38.826351165771484, "global_step": 215424, "epoch": 1780} {"train_loss": -37.654232025146484, "global_step": 215425, "epoch": 1780} {"train_loss": -40.95974349975586, "global_step": 215426, "epoch": 1780} {"train_loss": -39.690711975097656, "global_step": 215427, "epoch": 1780} {"train_loss": -41.87400436401367, "global_step": 215428, "epoch": 1780} {"train_loss": -39.43795394897461, "global_step": 215429, "epoch": 1780} {"train_loss": -41.154476165771484, "global_step": 215430, "epoch": 1780} {"train_loss": -41.41560363769531, "global_step": 215431, "epoch": 1780} {"train_loss": -40.36965560913086, "global_step": 215432, "epoch": 1780} {"train_loss": -41.53103256225586, "global_step": 215433, "epoch": 1780} {"train_loss": -41.0778694152832, "global_step": 215434, "epoch": 1780} {"train_loss": -41.03695297241211, "global_step": 215435, "epoch": 1780} {"train_loss": -41.63190460205078, "global_step": 215436, "epoch": 1780} {"train_loss": -41.46885299682617, "global_step": 215437, "epoch": 1780} {"train_loss": -40.965065002441406, "global_step": 215438, "epoch": 1780} {"train_loss": -41.395084381103516, "global_step": 215439, "epoch": 1780} {"train_loss": -40.523555755615234, "global_step": 215440, "epoch": 1780} {"train_loss": -41.150794982910156, "global_step": 215441, "epoch": 1780} {"train_loss": -41.0480842590332, "global_step": 215442, "epoch": 1780} {"train_loss": -40.95726776123047, "global_step": 215443, "epoch": 1780} {"train_loss": -41.300636291503906, "global_step": 215444, "epoch": 1780} {"train_loss": -41.742977142333984, "global_step": 215445, "epoch": 1780} {"train_loss": -41.666481018066406, "global_step": 215446, "epoch": 1780} {"train_loss": -40.497554779052734, "global_step": 215447, "epoch": 1780} {"train_loss": -41.563228607177734, "global_step": 215448, "epoch": 1780} {"train_loss": -41.75069046020508, "global_step": 215449, "epoch": 1780} {"train_loss": -41.0582275390625, "global_step": 215450, "epoch": 1780} {"train_loss": -41.588584899902344, "global_step": 215451, "epoch": 1780} {"train_loss": -40.587745666503906, "global_step": 215452, "epoch": 1780} {"train_loss": -41.62660217285156, "global_step": 215453, "epoch": 1780} {"train_loss": -41.71541213989258, "global_step": 215454, "epoch": 1780} {"train_loss": -41.53737258911133, "global_step": 215455, "epoch": 1780} {"train_loss": -41.20128631591797, "global_step": 215456, "epoch": 1780} {"train_loss": -41.570350646972656, "global_step": 215457, "epoch": 1780} {"train_loss": -41.56233596801758, "global_step": 215458, "epoch": 1780} {"train_loss": -41.88412857055664, "global_step": 215459, "epoch": 1780} {"train_loss": -41.156639099121094, "global_step": 215460, "epoch": 1780} {"train_loss": -41.90522003173828, "global_step": 215461, "epoch": 1780} {"train_loss": -41.90959930419922, "global_step": 215462, "epoch": 1780} {"train_loss": -41.53103256225586, "global_step": 215463, "epoch": 1780} {"train_loss": -41.1673469543457, "global_step": 215464, "epoch": 1780} {"train_loss": -41.939998626708984, "global_step": 215465, "epoch": 1780} {"train_loss": -42.06543731689453, "global_step": 215466, "epoch": 1780} {"train_loss": -41.83537292480469, "global_step": 215467, "epoch": 1780} {"train_loss": -42.26070785522461, "global_step": 215468, "epoch": 1780} {"train_loss": -41.58607864379883, "global_step": 215469, "epoch": 1780} {"train_loss": -42.229774475097656, "global_step": 215470, "epoch": 1780} {"train_loss": -42.16787338256836, "global_step": 215471, "epoch": 1780} {"train_loss": -41.879661560058594, "global_step": 215472, "epoch": 1780} {"train_loss": -41.84764862060547, "global_step": 215473, "epoch": 1780} {"train_loss": -41.604583740234375, "global_step": 215474, "epoch": 1780} {"train_loss": -41.99530792236328, "global_step": 215475, "epoch": 1780} {"train_loss": -41.84058380126953, "global_step": 215476, "epoch": 1780} {"train_loss": -42.366432189941406, "global_step": 215477, "epoch": 1780} {"train_loss": -42.1065673828125, "global_step": 215478, "epoch": 1780} {"train_loss": -42.49396896362305, "global_step": 215479, "epoch": 1780} {"train_loss": -42.22465515136719, "global_step": 215480, "epoch": 1780} {"train_loss": -42.24555206298828, "global_step": 215481, "epoch": 1780} {"train_loss": -41.78559494018555, "global_step": 215482, "epoch": 1780} {"train_loss": -41.473785400390625, "global_step": 215483, "epoch": 1780} {"train_loss": -39.6254997253418, "global_step": 215484, "epoch": 1780} {"train_loss": -41.20313262939453, "global_step": 215485, "epoch": 1780} {"train_loss": -40.17655563354492, "global_step": 215486, "epoch": 1780} {"train_loss": -40.16231155395508, "global_step": 215487, "epoch": 1780} {"train_loss": -41.331260681152344, "global_step": 215488, "epoch": 1780} {"train_loss": -41.67620849609375, "global_step": 215489, "epoch": 1780} {"train_loss": -40.695247650146484, "global_step": 215490, "epoch": 1780} {"train_loss": -39.5598030090332, "global_step": 215491, "epoch": 1780} {"train_loss": -40.20056915283203, "global_step": 215492, "epoch": 1780} {"train_loss": -40.8339958190918, "global_step": 215493, "epoch": 1780} {"train_loss": -39.75477981567383, "global_step": 215494, "epoch": 1780} {"train_loss": -40.80727005004883, "global_step": 215495, "epoch": 1780} {"train_loss": -41.324317932128906, "global_step": 215496, "epoch": 1780} {"train_loss": -38.04935836791992, "global_step": 215497, "epoch": 1780} {"train_loss": -40.078304290771484, "global_step": 215498, "epoch": 1780} {"train_loss": -41.031219482421875, "global_step": 215499, "epoch": 1780} {"train_loss": -41.10973022397884, "global_step": 215500, "epoch": 1780, "val_loss": 2723302.25} {"train_loss": -40.11396026611328, "global_step": 215501, "epoch": 1781} {"train_loss": -36.785194396972656, "global_step": 215502, "epoch": 1781} {"train_loss": -41.02888107299805, "global_step": 215503, "epoch": 1781} {"train_loss": -40.5611457824707, "global_step": 215504, "epoch": 1781} {"train_loss": -37.75978469848633, "global_step": 215505, "epoch": 1781} {"train_loss": -39.69330596923828, "global_step": 215506, "epoch": 1781} {"train_loss": -38.11574172973633, "global_step": 215507, "epoch": 1781} {"train_loss": -37.828495025634766, "global_step": 215508, "epoch": 1781} {"train_loss": -39.543209075927734, "global_step": 215509, "epoch": 1781} {"train_loss": -38.91461181640625, "global_step": 215510, "epoch": 1781} {"train_loss": -39.37437057495117, "global_step": 215511, "epoch": 1781} {"train_loss": -39.00428009033203, "global_step": 215512, "epoch": 1781} {"train_loss": -38.15016174316406, "global_step": 215513, "epoch": 1781} {"train_loss": -38.825927734375, "global_step": 215514, "epoch": 1781} {"train_loss": -36.98557662963867, "global_step": 215515, "epoch": 1781} {"train_loss": -36.21916961669922, "global_step": 215516, "epoch": 1781} {"train_loss": -37.757972717285156, "global_step": 215517, "epoch": 1781} {"train_loss": -39.2642936706543, "global_step": 215518, "epoch": 1781} {"train_loss": -38.25270462036133, "global_step": 215519, "epoch": 1781} {"train_loss": -38.61550521850586, "global_step": 215520, "epoch": 1781} {"train_loss": -37.00826644897461, "global_step": 215521, "epoch": 1781} {"train_loss": -39.14683151245117, "global_step": 215522, "epoch": 1781} {"train_loss": -40.0062370300293, "global_step": 215523, "epoch": 1781} {"train_loss": -38.37831497192383, "global_step": 215524, "epoch": 1781} {"train_loss": -37.067203521728516, "global_step": 215525, "epoch": 1781} {"train_loss": -38.030757904052734, "global_step": 215526, "epoch": 1781} {"train_loss": -39.72066116333008, "global_step": 215527, "epoch": 1781} {"train_loss": -35.442176818847656, "global_step": 215528, "epoch": 1781} {"train_loss": -40.40829086303711, "global_step": 215529, "epoch": 1781} {"train_loss": -39.1335563659668, "global_step": 215530, "epoch": 1781} {"train_loss": -39.398738861083984, "global_step": 215531, "epoch": 1781} {"train_loss": -40.50098419189453, "global_step": 215532, "epoch": 1781} {"train_loss": -40.13393020629883, "global_step": 215533, "epoch": 1781} {"train_loss": -40.1461067199707, "global_step": 215534, "epoch": 1781} {"train_loss": -37.65283203125, "global_step": 215535, "epoch": 1781} {"train_loss": -39.72043991088867, "global_step": 215536, "epoch": 1781} {"train_loss": -40.05561447143555, "global_step": 215537, "epoch": 1781} {"train_loss": -39.156429290771484, "global_step": 215538, "epoch": 1781} {"train_loss": -37.94241714477539, "global_step": 215539, "epoch": 1781} {"train_loss": -40.38801574707031, "global_step": 215540, "epoch": 1781} {"train_loss": -39.919132232666016, "global_step": 215541, "epoch": 1781} {"train_loss": -40.33586883544922, "global_step": 215542, "epoch": 1781} {"train_loss": -40.16425323486328, "global_step": 215543, "epoch": 1781} {"train_loss": -39.13614273071289, "global_step": 215544, "epoch": 1781} {"train_loss": -37.48604965209961, "global_step": 215545, "epoch": 1781} {"train_loss": -37.2964973449707, "global_step": 215546, "epoch": 1781} {"train_loss": -39.04471969604492, "global_step": 215547, "epoch": 1781} {"train_loss": -40.06745529174805, "global_step": 215548, "epoch": 1781} {"train_loss": -39.907203674316406, "global_step": 215549, "epoch": 1781} {"train_loss": -40.006649017333984, "global_step": 215550, "epoch": 1781} {"train_loss": -39.23012924194336, "global_step": 215551, "epoch": 1781} {"train_loss": -39.75709533691406, "global_step": 215552, "epoch": 1781} {"train_loss": -39.649959564208984, "global_step": 215553, "epoch": 1781} {"train_loss": -40.573646545410156, "global_step": 215554, "epoch": 1781} {"train_loss": -40.014827728271484, "global_step": 215555, "epoch": 1781} {"train_loss": -40.10005187988281, "global_step": 215556, "epoch": 1781} {"train_loss": -38.232276916503906, "global_step": 215557, "epoch": 1781} {"train_loss": -40.36075973510742, "global_step": 215558, "epoch": 1781} {"train_loss": -37.09556579589844, "global_step": 215559, "epoch": 1781} {"train_loss": -39.761837005615234, "global_step": 215560, "epoch": 1781} {"train_loss": -40.74432373046875, "global_step": 215561, "epoch": 1781} {"train_loss": -39.27305603027344, "global_step": 215562, "epoch": 1781} {"train_loss": -39.41598129272461, "global_step": 215563, "epoch": 1781} {"train_loss": -40.01580810546875, "global_step": 215564, "epoch": 1781} {"train_loss": -40.21235275268555, "global_step": 215565, "epoch": 1781} {"train_loss": -40.61255645751953, "global_step": 215566, "epoch": 1781} {"train_loss": -40.05153274536133, "global_step": 215567, "epoch": 1781} {"train_loss": -40.00629806518555, "global_step": 215568, "epoch": 1781} {"train_loss": -40.68308639526367, "global_step": 215569, "epoch": 1781} {"train_loss": -39.27967071533203, "global_step": 215570, "epoch": 1781} {"train_loss": -39.723384857177734, "global_step": 215571, "epoch": 1781} {"train_loss": -37.7951545715332, "global_step": 215572, "epoch": 1781} {"train_loss": -40.8671875, "global_step": 215573, "epoch": 1781} {"train_loss": -41.09857177734375, "global_step": 215574, "epoch": 1781} {"train_loss": -40.865291595458984, "global_step": 215575, "epoch": 1781} {"train_loss": -39.54069137573242, "global_step": 215576, "epoch": 1781} {"train_loss": -40.685333251953125, "global_step": 215577, "epoch": 1781} {"train_loss": -40.77438735961914, "global_step": 215578, "epoch": 1781} {"train_loss": -41.91029739379883, "global_step": 215579, "epoch": 1781} {"train_loss": -41.131683349609375, "global_step": 215580, "epoch": 1781} {"train_loss": -40.24294662475586, "global_step": 215581, "epoch": 1781} {"train_loss": -41.12276840209961, "global_step": 215582, "epoch": 1781} {"train_loss": -41.593360900878906, "global_step": 215583, "epoch": 1781} {"train_loss": -41.04572677612305, "global_step": 215584, "epoch": 1781} {"train_loss": -41.4846305847168, "global_step": 215585, "epoch": 1781} {"train_loss": -41.34278106689453, "global_step": 215586, "epoch": 1781} {"train_loss": -40.03837966918945, "global_step": 215587, "epoch": 1781} {"train_loss": -37.001564025878906, "global_step": 215588, "epoch": 1781} {"train_loss": -39.32976150512695, "global_step": 215589, "epoch": 1781} {"train_loss": -40.5586051940918, "global_step": 215590, "epoch": 1781} {"train_loss": -40.83975601196289, "global_step": 215591, "epoch": 1781} {"train_loss": -41.407859802246094, "global_step": 215592, "epoch": 1781} {"train_loss": -41.55572509765625, "global_step": 215593, "epoch": 1781} {"train_loss": -40.202186584472656, "global_step": 215594, "epoch": 1781} {"train_loss": -41.40299987792969, "global_step": 215595, "epoch": 1781} {"train_loss": -41.669586181640625, "global_step": 215596, "epoch": 1781} {"train_loss": -36.67859649658203, "global_step": 215597, "epoch": 1781} {"train_loss": -41.61906814575195, "global_step": 215598, "epoch": 1781} {"train_loss": -41.4100456237793, "global_step": 215599, "epoch": 1781} {"train_loss": -41.658042907714844, "global_step": 215600, "epoch": 1781} {"train_loss": -41.5324592590332, "global_step": 215601, "epoch": 1781} {"train_loss": -40.83988571166992, "global_step": 215602, "epoch": 1781} {"train_loss": -41.46775436401367, "global_step": 215603, "epoch": 1781} {"train_loss": -41.42744827270508, "global_step": 215604, "epoch": 1781} {"train_loss": -39.73292922973633, "global_step": 215605, "epoch": 1781} {"train_loss": -41.1238899230957, "global_step": 215606, "epoch": 1781} {"train_loss": -39.77568435668945, "global_step": 215607, "epoch": 1781} {"train_loss": -41.9786262512207, "global_step": 215608, "epoch": 1781} {"train_loss": -41.84701156616211, "global_step": 215609, "epoch": 1781} {"train_loss": -41.33815002441406, "global_step": 215610, "epoch": 1781} {"train_loss": -41.9216423034668, "global_step": 215611, "epoch": 1781} {"train_loss": -41.53101348876953, "global_step": 215612, "epoch": 1781} {"train_loss": -41.2601318359375, "global_step": 215613, "epoch": 1781} {"train_loss": -40.442626953125, "global_step": 215614, "epoch": 1781} {"train_loss": -42.000606536865234, "global_step": 215615, "epoch": 1781} {"train_loss": -41.238643646240234, "global_step": 215616, "epoch": 1781} {"train_loss": -39.94622039794922, "global_step": 215617, "epoch": 1781} {"train_loss": -41.91770553588867, "global_step": 215618, "epoch": 1781} {"train_loss": -40.76210403442383, "global_step": 215619, "epoch": 1781} {"train_loss": -40.188350677490234, "global_step": 215620, "epoch": 1781} {"train_loss": -39.81776945256004, "global_step": 215621, "epoch": 1781, "val_loss": 2934662.0} {"train_loss": -40.38308334350586, "global_step": 215622, "epoch": 1782} {"train_loss": -39.98879623413086, "global_step": 215623, "epoch": 1782} {"train_loss": -39.578460693359375, "global_step": 215624, "epoch": 1782} {"train_loss": -41.23246383666992, "global_step": 215625, "epoch": 1782} {"train_loss": -41.3505973815918, "global_step": 215626, "epoch": 1782} {"train_loss": -41.487770080566406, "global_step": 215627, "epoch": 1782} {"train_loss": -39.22207260131836, "global_step": 215628, "epoch": 1782} {"train_loss": -39.304931640625, "global_step": 215629, "epoch": 1782} {"train_loss": -41.220062255859375, "global_step": 215630, "epoch": 1782} {"train_loss": -40.32184982299805, "global_step": 215631, "epoch": 1782} {"train_loss": -35.182838439941406, "global_step": 215632, "epoch": 1782} {"train_loss": -36.955265045166016, "global_step": 215633, "epoch": 1782} {"train_loss": -39.158424377441406, "global_step": 215634, "epoch": 1782} {"train_loss": -40.55934143066406, "global_step": 215635, "epoch": 1782} {"train_loss": -39.14509963989258, "global_step": 215636, "epoch": 1782} {"train_loss": -38.8221549987793, "global_step": 215637, "epoch": 1782} {"train_loss": -39.82481002807617, "global_step": 215638, "epoch": 1782} {"train_loss": -40.76842498779297, "global_step": 215639, "epoch": 1782} {"train_loss": -39.49324417114258, "global_step": 215640, "epoch": 1782} {"train_loss": -39.14100646972656, "global_step": 215641, "epoch": 1782} {"train_loss": -39.55553436279297, "global_step": 215642, "epoch": 1782} {"train_loss": -38.15239334106445, "global_step": 215643, "epoch": 1782} {"train_loss": -37.14791488647461, "global_step": 215644, "epoch": 1782} {"train_loss": -37.8323860168457, "global_step": 215645, "epoch": 1782} {"train_loss": -40.40070724487305, "global_step": 215646, "epoch": 1782} {"train_loss": -40.46452331542969, "global_step": 215647, "epoch": 1782} {"train_loss": -38.841129302978516, "global_step": 215648, "epoch": 1782} {"train_loss": -39.7675666809082, "global_step": 215649, "epoch": 1782} {"train_loss": -39.93959045410156, "global_step": 215650, "epoch": 1782} {"train_loss": -39.6943244934082, "global_step": 215651, "epoch": 1782} {"train_loss": -40.6875114440918, "global_step": 215652, "epoch": 1782} {"train_loss": -39.959083557128906, "global_step": 215653, "epoch": 1782} {"train_loss": -40.116302490234375, "global_step": 215654, "epoch": 1782} {"train_loss": -36.86570358276367, "global_step": 215655, "epoch": 1782} {"train_loss": -41.10580062866211, "global_step": 215656, "epoch": 1782} {"train_loss": -40.50726318359375, "global_step": 215657, "epoch": 1782} {"train_loss": -39.79313278198242, "global_step": 215658, "epoch": 1782} {"train_loss": -39.98612594604492, "global_step": 215659, "epoch": 1782} {"train_loss": -41.20947265625, "global_step": 215660, "epoch": 1782} {"train_loss": -40.34809494018555, "global_step": 215661, "epoch": 1782} {"train_loss": -41.104347229003906, "global_step": 215662, "epoch": 1782} {"train_loss": -41.7392463684082, "global_step": 215663, "epoch": 1782} {"train_loss": -40.39485549926758, "global_step": 215664, "epoch": 1782} {"train_loss": -41.75345993041992, "global_step": 215665, "epoch": 1782} {"train_loss": -41.3813591003418, "global_step": 215666, "epoch": 1782} {"train_loss": -40.36225509643555, "global_step": 215667, "epoch": 1782} {"train_loss": -38.64397048950195, "global_step": 215668, "epoch": 1782} {"train_loss": -41.36809158325195, "global_step": 215669, "epoch": 1782} {"train_loss": -41.311744689941406, "global_step": 215670, "epoch": 1782} {"train_loss": -40.19154357910156, "global_step": 215671, "epoch": 1782} {"train_loss": -40.77678680419922, "global_step": 215672, "epoch": 1782} {"train_loss": -40.903141021728516, "global_step": 215673, "epoch": 1782} {"train_loss": -41.74363708496094, "global_step": 215674, "epoch": 1782} {"train_loss": -41.44850540161133, "global_step": 215675, "epoch": 1782} {"train_loss": -40.670372009277344, "global_step": 215676, "epoch": 1782} {"train_loss": -41.41522979736328, "global_step": 215677, "epoch": 1782} {"train_loss": -41.08945846557617, "global_step": 215678, "epoch": 1782} {"train_loss": -41.5411376953125, "global_step": 215679, "epoch": 1782} {"train_loss": -41.80295944213867, "global_step": 215680, "epoch": 1782} {"train_loss": -40.22145462036133, "global_step": 215681, "epoch": 1782} {"train_loss": -41.370460510253906, "global_step": 215682, "epoch": 1782} {"train_loss": -41.98002243041992, "global_step": 215683, "epoch": 1782} {"train_loss": -41.30891418457031, "global_step": 215684, "epoch": 1782} {"train_loss": -42.09271240234375, "global_step": 215685, "epoch": 1782} {"train_loss": -41.71787643432617, "global_step": 215686, "epoch": 1782} {"train_loss": -42.4001579284668, "global_step": 215687, "epoch": 1782} {"train_loss": -41.22626876831055, "global_step": 215688, "epoch": 1782} {"train_loss": -41.93378829956055, "global_step": 215689, "epoch": 1782} {"train_loss": -41.81550216674805, "global_step": 215690, "epoch": 1782} {"train_loss": -41.833431243896484, "global_step": 215691, "epoch": 1782} {"train_loss": -41.79962921142578, "global_step": 215692, "epoch": 1782} {"train_loss": -41.246028900146484, "global_step": 215693, "epoch": 1782} {"train_loss": -41.8824577331543, "global_step": 215694, "epoch": 1782} {"train_loss": -41.97199630737305, "global_step": 215695, "epoch": 1782} {"train_loss": -41.917633056640625, "global_step": 215696, "epoch": 1782} {"train_loss": -40.640625, "global_step": 215697, "epoch": 1782} {"train_loss": -41.6149787902832, "global_step": 215698, "epoch": 1782} {"train_loss": -41.5571403503418, "global_step": 215699, "epoch": 1782} {"train_loss": -41.6274299621582, "global_step": 215700, "epoch": 1782} {"train_loss": -41.9950065612793, "global_step": 215701, "epoch": 1782} {"train_loss": -41.48494338989258, "global_step": 215702, "epoch": 1782} {"train_loss": -41.732845306396484, "global_step": 215703, "epoch": 1782} {"train_loss": -41.83032989501953, "global_step": 215704, "epoch": 1782} {"train_loss": -41.86177444458008, "global_step": 215705, "epoch": 1782} {"train_loss": -42.107364654541016, "global_step": 215706, "epoch": 1782} {"train_loss": -38.42002868652344, "global_step": 215707, "epoch": 1782} {"train_loss": -41.764495849609375, "global_step": 215708, "epoch": 1782} {"train_loss": -41.53689193725586, "global_step": 215709, "epoch": 1782} {"train_loss": -41.143157958984375, "global_step": 215710, "epoch": 1782} {"train_loss": -40.33826446533203, "global_step": 215711, "epoch": 1782} {"train_loss": -41.05216598510742, "global_step": 215712, "epoch": 1782} {"train_loss": -40.341407775878906, "global_step": 215713, "epoch": 1782} {"train_loss": -40.15910720825195, "global_step": 215714, "epoch": 1782} {"train_loss": -41.95978546142578, "global_step": 215715, "epoch": 1782} {"train_loss": -41.20124053955078, "global_step": 215716, "epoch": 1782} {"train_loss": -39.61721420288086, "global_step": 215717, "epoch": 1782} {"train_loss": -39.83991241455078, "global_step": 215718, "epoch": 1782} {"train_loss": -40.24245834350586, "global_step": 215719, "epoch": 1782} {"train_loss": -40.6989860534668, "global_step": 215720, "epoch": 1782} {"train_loss": -38.20471954345703, "global_step": 215721, "epoch": 1782} {"train_loss": -40.47229766845703, "global_step": 215722, "epoch": 1782} {"train_loss": -41.250240325927734, "global_step": 215723, "epoch": 1782} {"train_loss": -38.1104736328125, "global_step": 215724, "epoch": 1782} {"train_loss": -28.534717559814453, "global_step": 215725, "epoch": 1782} {"train_loss": -36.802406311035156, "global_step": 215726, "epoch": 1782} {"train_loss": -38.4931526184082, "global_step": 215727, "epoch": 1782} {"train_loss": -34.3576545715332, "global_step": 215728, "epoch": 1782} {"train_loss": -19.74553871154785, "global_step": 215729, "epoch": 1782} {"train_loss": -34.151466369628906, "global_step": 215730, "epoch": 1782} {"train_loss": -27.638525009155273, "global_step": 215731, "epoch": 1782} {"train_loss": -27.868314743041992, "global_step": 215732, "epoch": 1782} {"train_loss": -32.91754913330078, "global_step": 215733, "epoch": 1782} {"train_loss": -35.8068962097168, "global_step": 215734, "epoch": 1782} {"train_loss": -30.949228286743164, "global_step": 215735, "epoch": 1782} {"train_loss": -22.63048553466797, "global_step": 215736, "epoch": 1782} {"train_loss": -31.659299850463867, "global_step": 215737, "epoch": 1782} {"train_loss": -36.40020751953125, "global_step": 215738, "epoch": 1782} {"train_loss": -17.849407196044922, "global_step": 215739, "epoch": 1782} {"train_loss": -30.51552391052246, "global_step": 215740, "epoch": 1782} {"train_loss": -37.319374084472656, "global_step": 215741, "epoch": 1782} {"train_loss": -39.127699796818504, "global_step": 215742, "epoch": 1782, "val_loss": 2650621.5} {"train_loss": -29.806293487548828, "global_step": 215743, "epoch": 1783} {"train_loss": -34.567562103271484, "global_step": 215744, "epoch": 1783} {"train_loss": -24.484647750854492, "global_step": 215745, "epoch": 1783} {"train_loss": -36.73436737060547, "global_step": 215746, "epoch": 1783} {"train_loss": -34.56745147705078, "global_step": 215747, "epoch": 1783} {"train_loss": -35.14846420288086, "global_step": 215748, "epoch": 1783} {"train_loss": -31.878904342651367, "global_step": 215749, "epoch": 1783} {"train_loss": -31.99073600769043, "global_step": 215750, "epoch": 1783} {"train_loss": -34.31416320800781, "global_step": 215751, "epoch": 1783} {"train_loss": -34.35909652709961, "global_step": 215752, "epoch": 1783} {"train_loss": -30.201841354370117, "global_step": 215753, "epoch": 1783} {"train_loss": -34.687721252441406, "global_step": 215754, "epoch": 1783} {"train_loss": -31.57220458984375, "global_step": 215755, "epoch": 1783} {"train_loss": -30.887449264526367, "global_step": 215756, "epoch": 1783} {"train_loss": -37.9013671875, "global_step": 215757, "epoch": 1783} {"train_loss": -36.46136474609375, "global_step": 215758, "epoch": 1783} {"train_loss": -35.17229080200195, "global_step": 215759, "epoch": 1783} {"train_loss": -36.30781936645508, "global_step": 215760, "epoch": 1783} {"train_loss": -36.1099853515625, "global_step": 215761, "epoch": 1783} {"train_loss": -37.94540786743164, "global_step": 215762, "epoch": 1783} {"train_loss": -35.28799057006836, "global_step": 215763, "epoch": 1783} {"train_loss": -33.93507766723633, "global_step": 215764, "epoch": 1783} {"train_loss": -36.52392578125, "global_step": 215765, "epoch": 1783} {"train_loss": -37.21682357788086, "global_step": 215766, "epoch": 1783} {"train_loss": -37.99264144897461, "global_step": 215767, "epoch": 1783} {"train_loss": -38.35980224609375, "global_step": 215768, "epoch": 1783} {"train_loss": -36.4715690612793, "global_step": 215769, "epoch": 1783} {"train_loss": -37.39340591430664, "global_step": 215770, "epoch": 1783} {"train_loss": -37.71541976928711, "global_step": 215771, "epoch": 1783} {"train_loss": -37.78298568725586, "global_step": 215772, "epoch": 1783} {"train_loss": -38.84489822387695, "global_step": 215773, "epoch": 1783} {"train_loss": -37.42536544799805, "global_step": 215774, "epoch": 1783} {"train_loss": -38.26008605957031, "global_step": 215775, "epoch": 1783} {"train_loss": -37.59841537475586, "global_step": 215776, "epoch": 1783} {"train_loss": -37.5590934753418, "global_step": 215777, "epoch": 1783} {"train_loss": -36.82802963256836, "global_step": 215778, "epoch": 1783} {"train_loss": -38.49398422241211, "global_step": 215779, "epoch": 1783} {"train_loss": -38.075592041015625, "global_step": 215780, "epoch": 1783} {"train_loss": -38.893035888671875, "global_step": 215781, "epoch": 1783} {"train_loss": -38.48439407348633, "global_step": 215782, "epoch": 1783} {"train_loss": -38.950016021728516, "global_step": 215783, "epoch": 1783} {"train_loss": -39.07802963256836, "global_step": 215784, "epoch": 1783} {"train_loss": -39.29140853881836, "global_step": 215785, "epoch": 1783} {"train_loss": -39.4117431640625, "global_step": 215786, "epoch": 1783} {"train_loss": -39.4558219909668, "global_step": 215787, "epoch": 1783} {"train_loss": -38.573516845703125, "global_step": 215788, "epoch": 1783} {"train_loss": -38.905513763427734, "global_step": 215789, "epoch": 1783} {"train_loss": -38.873226165771484, "global_step": 215790, "epoch": 1783} {"train_loss": -39.26245880126953, "global_step": 215791, "epoch": 1783} {"train_loss": -39.53769302368164, "global_step": 215792, "epoch": 1783} {"train_loss": -38.7822265625, "global_step": 215793, "epoch": 1783} {"train_loss": -39.13166046142578, "global_step": 215794, "epoch": 1783} {"train_loss": -39.045936584472656, "global_step": 215795, "epoch": 1783} {"train_loss": -39.357112884521484, "global_step": 215796, "epoch": 1783} {"train_loss": -39.18677520751953, "global_step": 215797, "epoch": 1783} {"train_loss": -39.236854553222656, "global_step": 215798, "epoch": 1783} {"train_loss": -39.3138313293457, "global_step": 215799, "epoch": 1783} {"train_loss": -39.61167526245117, "global_step": 215800, "epoch": 1783} {"train_loss": -39.482906341552734, "global_step": 215801, "epoch": 1783} {"train_loss": -39.25710678100586, "global_step": 215802, "epoch": 1783} {"train_loss": -40.00188446044922, "global_step": 215803, "epoch": 1783} {"train_loss": -39.65110778808594, "global_step": 215804, "epoch": 1783} {"train_loss": -38.95023727416992, "global_step": 215805, "epoch": 1783} {"train_loss": -40.37644958496094, "global_step": 215806, "epoch": 1783} {"train_loss": -39.33717727661133, "global_step": 215807, "epoch": 1783} {"train_loss": -38.9412956237793, "global_step": 215808, "epoch": 1783} {"train_loss": -39.98996353149414, "global_step": 215809, "epoch": 1783} {"train_loss": -39.995784759521484, "global_step": 215810, "epoch": 1783} {"train_loss": -40.2591667175293, "global_step": 215811, "epoch": 1783} {"train_loss": -39.756343841552734, "global_step": 215812, "epoch": 1783} {"train_loss": -39.54209518432617, "global_step": 215813, "epoch": 1783} {"train_loss": -39.423587799072266, "global_step": 215814, "epoch": 1783} {"train_loss": -39.58555221557617, "global_step": 215815, "epoch": 1783} {"train_loss": -40.22676467895508, "global_step": 215816, "epoch": 1783} {"train_loss": -39.3440055847168, "global_step": 215817, "epoch": 1783} {"train_loss": -40.16940689086914, "global_step": 215818, "epoch": 1783} {"train_loss": -40.28156661987305, "global_step": 215819, "epoch": 1783} {"train_loss": -39.83998489379883, "global_step": 215820, "epoch": 1783} {"train_loss": -40.510459899902344, "global_step": 215821, "epoch": 1783} {"train_loss": -39.8498420715332, "global_step": 215822, "epoch": 1783} {"train_loss": -39.48785400390625, "global_step": 215823, "epoch": 1783} {"train_loss": -39.88727951049805, "global_step": 215824, "epoch": 1783} {"train_loss": -40.03232955932617, "global_step": 215825, "epoch": 1783} {"train_loss": -40.19769287109375, "global_step": 215826, "epoch": 1783} {"train_loss": -40.12955856323242, "global_step": 215827, "epoch": 1783} {"train_loss": -39.1491584777832, "global_step": 215828, "epoch": 1783} {"train_loss": -40.41598129272461, "global_step": 215829, "epoch": 1783} {"train_loss": -40.453033447265625, "global_step": 215830, "epoch": 1783} {"train_loss": -40.31574630737305, "global_step": 215831, "epoch": 1783} {"train_loss": -40.476810455322266, "global_step": 215832, "epoch": 1783} {"train_loss": -39.250465393066406, "global_step": 215833, "epoch": 1783} {"train_loss": -40.421363830566406, "global_step": 215834, "epoch": 1783} {"train_loss": -40.1619873046875, "global_step": 215835, "epoch": 1783} {"train_loss": -40.43138885498047, "global_step": 215836, "epoch": 1783} {"train_loss": -40.553070068359375, "global_step": 215837, "epoch": 1783} {"train_loss": -40.6150016784668, "global_step": 215838, "epoch": 1783} {"train_loss": -40.85874557495117, "global_step": 215839, "epoch": 1783} {"train_loss": -41.01499557495117, "global_step": 215840, "epoch": 1783} {"train_loss": -40.86284255981445, "global_step": 215841, "epoch": 1783} {"train_loss": -40.39741134643555, "global_step": 215842, "epoch": 1783} {"train_loss": -40.34916305541992, "global_step": 215843, "epoch": 1783} {"train_loss": -40.9256591796875, "global_step": 215844, "epoch": 1783} {"train_loss": -40.04063415527344, "global_step": 215845, "epoch": 1783} {"train_loss": -40.592628479003906, "global_step": 215846, "epoch": 1783} {"train_loss": -40.995731353759766, "global_step": 215847, "epoch": 1783} {"train_loss": -40.4063720703125, "global_step": 215848, "epoch": 1783} {"train_loss": -39.903255462646484, "global_step": 215849, "epoch": 1783} {"train_loss": -40.91719055175781, "global_step": 215850, "epoch": 1783} {"train_loss": -40.96101760864258, "global_step": 215851, "epoch": 1783} {"train_loss": -41.10956954956055, "global_step": 215852, "epoch": 1783} {"train_loss": -41.04751968383789, "global_step": 215853, "epoch": 1783} {"train_loss": -40.83689880371094, "global_step": 215854, "epoch": 1783} {"train_loss": -41.15072250366211, "global_step": 215855, "epoch": 1783} {"train_loss": -41.57937240600586, "global_step": 215856, "epoch": 1783} {"train_loss": -41.227474212646484, "global_step": 215857, "epoch": 1783} {"train_loss": -41.42548751831055, "global_step": 215858, "epoch": 1783} {"train_loss": -40.88186264038086, "global_step": 215859, "epoch": 1783} {"train_loss": -39.61831283569336, "global_step": 215860, "epoch": 1783} {"train_loss": -40.94136047363281, "global_step": 215861, "epoch": 1783} {"train_loss": -40.31233596801758, "global_step": 215862, "epoch": 1783} {"train_loss": -38.55770941805248, "global_step": 215863, "epoch": 1783, "val_loss": 2671400.0} {"train_loss": -40.997100830078125, "global_step": 215864, "epoch": 1784} {"train_loss": -40.618412017822266, "global_step": 215865, "epoch": 1784} {"train_loss": -41.24100875854492, "global_step": 215866, "epoch": 1784} {"train_loss": -41.1213493347168, "global_step": 215867, "epoch": 1784} {"train_loss": -41.51373291015625, "global_step": 215868, "epoch": 1784} {"train_loss": -41.075626373291016, "global_step": 215869, "epoch": 1784} {"train_loss": -41.55965805053711, "global_step": 215870, "epoch": 1784} {"train_loss": -41.58474349975586, "global_step": 215871, "epoch": 1784} {"train_loss": -41.08542251586914, "global_step": 215872, "epoch": 1784} {"train_loss": -41.36086654663086, "global_step": 215873, "epoch": 1784} {"train_loss": -41.20139694213867, "global_step": 215874, "epoch": 1784} {"train_loss": -41.86190414428711, "global_step": 215875, "epoch": 1784} {"train_loss": -41.10566329956055, "global_step": 215876, "epoch": 1784} {"train_loss": -41.151527404785156, "global_step": 215877, "epoch": 1784} {"train_loss": -41.024471282958984, "global_step": 215878, "epoch": 1784} {"train_loss": -41.49388885498047, "global_step": 215879, "epoch": 1784} {"train_loss": -41.91028594970703, "global_step": 215880, "epoch": 1784} {"train_loss": -41.32892608642578, "global_step": 215881, "epoch": 1784} {"train_loss": -41.217063903808594, "global_step": 215882, "epoch": 1784} {"train_loss": -41.22233200073242, "global_step": 215883, "epoch": 1784} {"train_loss": -40.94053649902344, "global_step": 215884, "epoch": 1784} {"train_loss": -41.87923049926758, "global_step": 215885, "epoch": 1784} {"train_loss": -41.552860260009766, "global_step": 215886, "epoch": 1784} {"train_loss": -41.61028289794922, "global_step": 215887, "epoch": 1784} {"train_loss": -41.78515625, "global_step": 215888, "epoch": 1784} {"train_loss": -41.69380569458008, "global_step": 215889, "epoch": 1784} {"train_loss": -42.11211013793945, "global_step": 215890, "epoch": 1784} {"train_loss": -41.979591369628906, "global_step": 215891, "epoch": 1784} {"train_loss": -41.93437194824219, "global_step": 215892, "epoch": 1784} {"train_loss": -41.425743103027344, "global_step": 215893, "epoch": 1784} {"train_loss": -41.5456657409668, "global_step": 215894, "epoch": 1784} {"train_loss": -41.30863571166992, "global_step": 215895, "epoch": 1784} {"train_loss": -40.61565399169922, "global_step": 215896, "epoch": 1784} {"train_loss": -40.101722717285156, "global_step": 215897, "epoch": 1784} {"train_loss": -39.606781005859375, "global_step": 215898, "epoch": 1784} {"train_loss": -40.306304931640625, "global_step": 215899, "epoch": 1784} {"train_loss": -39.19701385498047, "global_step": 215900, "epoch": 1784} {"train_loss": -37.23450469970703, "global_step": 215901, "epoch": 1784} {"train_loss": -34.83518600463867, "global_step": 215902, "epoch": 1784} {"train_loss": -37.47819900512695, "global_step": 215903, "epoch": 1784} {"train_loss": -39.44318771362305, "global_step": 215904, "epoch": 1784} {"train_loss": -39.84247589111328, "global_step": 215905, "epoch": 1784} {"train_loss": -40.47529220581055, "global_step": 215906, "epoch": 1784} {"train_loss": -40.56223678588867, "global_step": 215907, "epoch": 1784} {"train_loss": -39.41193771362305, "global_step": 215908, "epoch": 1784} {"train_loss": -40.26980209350586, "global_step": 215909, "epoch": 1784} {"train_loss": -39.87236404418945, "global_step": 215910, "epoch": 1784} {"train_loss": -40.15351486206055, "global_step": 215911, "epoch": 1784} {"train_loss": -40.234474182128906, "global_step": 215912, "epoch": 1784} {"train_loss": -40.02250671386719, "global_step": 215913, "epoch": 1784} {"train_loss": -40.27356719970703, "global_step": 215914, "epoch": 1784} {"train_loss": -39.954627990722656, "global_step": 215915, "epoch": 1784} {"train_loss": -40.75790023803711, "global_step": 215916, "epoch": 1784} {"train_loss": -40.510215759277344, "global_step": 215917, "epoch": 1784} {"train_loss": -39.982879638671875, "global_step": 215918, "epoch": 1784} {"train_loss": -40.482704162597656, "global_step": 215919, "epoch": 1784} {"train_loss": -41.251007080078125, "global_step": 215920, "epoch": 1784} {"train_loss": -41.05304718017578, "global_step": 215921, "epoch": 1784} {"train_loss": -40.8377799987793, "global_step": 215922, "epoch": 1784} {"train_loss": -40.65818405151367, "global_step": 215923, "epoch": 1784} {"train_loss": -40.76797103881836, "global_step": 215924, "epoch": 1784} {"train_loss": -40.95874786376953, "global_step": 215925, "epoch": 1784} {"train_loss": -41.35369110107422, "global_step": 215926, "epoch": 1784} {"train_loss": -41.14013671875, "global_step": 215927, "epoch": 1784} {"train_loss": -41.22939682006836, "global_step": 215928, "epoch": 1784} {"train_loss": -41.640174865722656, "global_step": 215929, "epoch": 1784} {"train_loss": -41.50018310546875, "global_step": 215930, "epoch": 1784} {"train_loss": -41.229488372802734, "global_step": 215931, "epoch": 1784} {"train_loss": -41.25116729736328, "global_step": 215932, "epoch": 1784} {"train_loss": -40.96693801879883, "global_step": 215933, "epoch": 1784} {"train_loss": -41.675533294677734, "global_step": 215934, "epoch": 1784} {"train_loss": -41.34639358520508, "global_step": 215935, "epoch": 1784} {"train_loss": -41.973655700683594, "global_step": 215936, "epoch": 1784} {"train_loss": -41.5601806640625, "global_step": 215937, "epoch": 1784} {"train_loss": -40.826263427734375, "global_step": 215938, "epoch": 1784} {"train_loss": -42.09482955932617, "global_step": 215939, "epoch": 1784} {"train_loss": -41.24740219116211, "global_step": 215940, "epoch": 1784} {"train_loss": -41.92853927612305, "global_step": 215941, "epoch": 1784} {"train_loss": -41.33400344848633, "global_step": 215942, "epoch": 1784} {"train_loss": -40.72284698486328, "global_step": 215943, "epoch": 1784} {"train_loss": -42.18923568725586, "global_step": 215944, "epoch": 1784} {"train_loss": -41.31618881225586, "global_step": 215945, "epoch": 1784} {"train_loss": -41.45220947265625, "global_step": 215946, "epoch": 1784} {"train_loss": -41.20023727416992, "global_step": 215947, "epoch": 1784} {"train_loss": -41.974910736083984, "global_step": 215948, "epoch": 1784} {"train_loss": -41.128665924072266, "global_step": 215949, "epoch": 1784} {"train_loss": -42.31772994995117, "global_step": 215950, "epoch": 1784} {"train_loss": -41.20733642578125, "global_step": 215951, "epoch": 1784} {"train_loss": -41.3591423034668, "global_step": 215952, "epoch": 1784} {"train_loss": -40.672767639160156, "global_step": 215953, "epoch": 1784} {"train_loss": -40.202205657958984, "global_step": 215954, "epoch": 1784} {"train_loss": -41.39704132080078, "global_step": 215955, "epoch": 1784} {"train_loss": -41.2075080871582, "global_step": 215956, "epoch": 1784} {"train_loss": -40.09534454345703, "global_step": 215957, "epoch": 1784} {"train_loss": -38.6258430480957, "global_step": 215958, "epoch": 1784} {"train_loss": -40.05781173706055, "global_step": 215959, "epoch": 1784} {"train_loss": -40.62910842895508, "global_step": 215960, "epoch": 1784} {"train_loss": -41.0617561340332, "global_step": 215961, "epoch": 1784} {"train_loss": -41.36525344848633, "global_step": 215962, "epoch": 1784} {"train_loss": -42.06574630737305, "global_step": 215963, "epoch": 1784} {"train_loss": -40.68232345581055, "global_step": 215964, "epoch": 1784} {"train_loss": -37.84089279174805, "global_step": 215965, "epoch": 1784} {"train_loss": -39.84760665893555, "global_step": 215966, "epoch": 1784} {"train_loss": -39.400596618652344, "global_step": 215967, "epoch": 1784} {"train_loss": -40.45905303955078, "global_step": 215968, "epoch": 1784} {"train_loss": -35.88149642944336, "global_step": 215969, "epoch": 1784} {"train_loss": -34.62970733642578, "global_step": 215970, "epoch": 1784} {"train_loss": -38.57814407348633, "global_step": 215971, "epoch": 1784} {"train_loss": -41.282142639160156, "global_step": 215972, "epoch": 1784} {"train_loss": -39.04799270629883, "global_step": 215973, "epoch": 1784} {"train_loss": -40.9007682800293, "global_step": 215974, "epoch": 1784} {"train_loss": -40.66521072387695, "global_step": 215975, "epoch": 1784} {"train_loss": -39.713287353515625, "global_step": 215976, "epoch": 1784} {"train_loss": -40.58486557006836, "global_step": 215977, "epoch": 1784} {"train_loss": -41.18966293334961, "global_step": 215978, "epoch": 1784} {"train_loss": -39.963863372802734, "global_step": 215979, "epoch": 1784} {"train_loss": -41.394283294677734, "global_step": 215980, "epoch": 1784} {"train_loss": -40.85602569580078, "global_step": 215981, "epoch": 1784} {"train_loss": -39.35667037963867, "global_step": 215982, "epoch": 1784} {"train_loss": -40.83344650268555, "global_step": 215983, "epoch": 1784} {"train_loss": -40.68761131980202, "global_step": 215984, "epoch": 1784, "val_loss": 2672691.5} {"train_loss": -40.49862289428711, "global_step": 215985, "epoch": 1785} {"train_loss": -41.42194747924805, "global_step": 215986, "epoch": 1785} {"train_loss": -41.08710861206055, "global_step": 215987, "epoch": 1785} {"train_loss": -40.997283935546875, "global_step": 215988, "epoch": 1785} {"train_loss": -41.56343460083008, "global_step": 215989, "epoch": 1785} {"train_loss": -41.652992248535156, "global_step": 215990, "epoch": 1785} {"train_loss": -41.78737258911133, "global_step": 215991, "epoch": 1785} {"train_loss": -41.669395446777344, "global_step": 215992, "epoch": 1785} {"train_loss": -41.28215408325195, "global_step": 215993, "epoch": 1785} {"train_loss": -41.194026947021484, "global_step": 215994, "epoch": 1785} {"train_loss": -41.5438346862793, "global_step": 215995, "epoch": 1785} {"train_loss": -41.575439453125, "global_step": 215996, "epoch": 1785} {"train_loss": -41.546451568603516, "global_step": 215997, "epoch": 1785} {"train_loss": -41.4404296875, "global_step": 215998, "epoch": 1785} {"train_loss": -41.80764389038086, "global_step": 215999, "epoch": 1785} {"train_loss": -40.123992919921875, "global_step": 216000, "epoch": 1785} {"train_loss": -41.74892807006836, "global_step": 216001, "epoch": 1785} {"train_loss": -40.93558883666992, "global_step": 216002, "epoch": 1785} {"train_loss": -41.64425277709961, "global_step": 216003, "epoch": 1785} {"train_loss": -40.806800842285156, "global_step": 216004, "epoch": 1785} {"train_loss": -40.2725944519043, "global_step": 216005, "epoch": 1785} {"train_loss": -40.953426361083984, "global_step": 216006, "epoch": 1785} {"train_loss": -40.634010314941406, "global_step": 216007, "epoch": 1785} {"train_loss": -41.05498123168945, "global_step": 216008, "epoch": 1785} {"train_loss": -39.208858489990234, "global_step": 216009, "epoch": 1785} {"train_loss": -41.925071716308594, "global_step": 216010, "epoch": 1785} {"train_loss": -40.379737854003906, "global_step": 216011, "epoch": 1785} {"train_loss": -41.04486846923828, "global_step": 216012, "epoch": 1785} {"train_loss": -40.55164337158203, "global_step": 216013, "epoch": 1785} {"train_loss": -39.60198211669922, "global_step": 216014, "epoch": 1785} {"train_loss": -40.506771087646484, "global_step": 216015, "epoch": 1785} {"train_loss": -41.0128288269043, "global_step": 216016, "epoch": 1785} {"train_loss": -41.033931732177734, "global_step": 216017, "epoch": 1785} {"train_loss": -41.514278411865234, "global_step": 216018, "epoch": 1785} {"train_loss": -41.66736602783203, "global_step": 216019, "epoch": 1785} {"train_loss": -41.55154800415039, "global_step": 216020, "epoch": 1785} {"train_loss": -42.22577667236328, "global_step": 216021, "epoch": 1785} {"train_loss": -41.711124420166016, "global_step": 216022, "epoch": 1785} {"train_loss": -41.83700180053711, "global_step": 216023, "epoch": 1785} {"train_loss": -41.5667839050293, "global_step": 216024, "epoch": 1785} {"train_loss": -41.69530487060547, "global_step": 216025, "epoch": 1785} {"train_loss": -41.62366485595703, "global_step": 216026, "epoch": 1785} {"train_loss": -41.41292190551758, "global_step": 216027, "epoch": 1785} {"train_loss": -40.282554626464844, "global_step": 216028, "epoch": 1785} {"train_loss": -41.6597900390625, "global_step": 216029, "epoch": 1785} {"train_loss": -40.76455307006836, "global_step": 216030, "epoch": 1785} {"train_loss": -40.78013229370117, "global_step": 216031, "epoch": 1785} {"train_loss": -40.98651885986328, "global_step": 216032, "epoch": 1785} {"train_loss": -41.35206985473633, "global_step": 216033, "epoch": 1785} {"train_loss": -40.66291427612305, "global_step": 216034, "epoch": 1785} {"train_loss": -41.56852340698242, "global_step": 216035, "epoch": 1785} {"train_loss": -41.222232818603516, "global_step": 216036, "epoch": 1785} {"train_loss": -41.208003997802734, "global_step": 216037, "epoch": 1785} {"train_loss": -40.86666488647461, "global_step": 216038, "epoch": 1785} {"train_loss": -42.00761795043945, "global_step": 216039, "epoch": 1785} {"train_loss": -41.00469207763672, "global_step": 216040, "epoch": 1785} {"train_loss": -40.431373596191406, "global_step": 216041, "epoch": 1785} {"train_loss": -40.780296325683594, "global_step": 216042, "epoch": 1785} {"train_loss": -42.17507553100586, "global_step": 216043, "epoch": 1785} {"train_loss": -41.776607513427734, "global_step": 216044, "epoch": 1785} {"train_loss": -41.12999725341797, "global_step": 216045, "epoch": 1785} {"train_loss": -40.8385009765625, "global_step": 216046, "epoch": 1785} {"train_loss": -42.0659065246582, "global_step": 216047, "epoch": 1785} {"train_loss": -41.07722091674805, "global_step": 216048, "epoch": 1785} {"train_loss": -42.122802734375, "global_step": 216049, "epoch": 1785} {"train_loss": -41.78261184692383, "global_step": 216050, "epoch": 1785} {"train_loss": -41.37129211425781, "global_step": 216051, "epoch": 1785} {"train_loss": -38.928279876708984, "global_step": 216052, "epoch": 1785} {"train_loss": -40.1113395690918, "global_step": 216053, "epoch": 1785} {"train_loss": -41.044715881347656, "global_step": 216054, "epoch": 1785} {"train_loss": -40.79071044921875, "global_step": 216055, "epoch": 1785} {"train_loss": -42.12260818481445, "global_step": 216056, "epoch": 1785} {"train_loss": -40.908790588378906, "global_step": 216057, "epoch": 1785} {"train_loss": -40.90073776245117, "global_step": 216058, "epoch": 1785} {"train_loss": -41.65768814086914, "global_step": 216059, "epoch": 1785} {"train_loss": -42.08148956298828, "global_step": 216060, "epoch": 1785} {"train_loss": -41.93142318725586, "global_step": 216061, "epoch": 1785} {"train_loss": -40.9846076965332, "global_step": 216062, "epoch": 1785} {"train_loss": -41.94883346557617, "global_step": 216063, "epoch": 1785} {"train_loss": -41.075618743896484, "global_step": 216064, "epoch": 1785} {"train_loss": -41.84172439575195, "global_step": 216065, "epoch": 1785} {"train_loss": -42.61091232299805, "global_step": 216066, "epoch": 1785} {"train_loss": -41.334197998046875, "global_step": 216067, "epoch": 1785} {"train_loss": -41.58027267456055, "global_step": 216068, "epoch": 1785} {"train_loss": -41.839637756347656, "global_step": 216069, "epoch": 1785} {"train_loss": -39.91730880737305, "global_step": 216070, "epoch": 1785} {"train_loss": -40.39773178100586, "global_step": 216071, "epoch": 1785} {"train_loss": -42.41297149658203, "global_step": 216072, "epoch": 1785} {"train_loss": -40.64467239379883, "global_step": 216073, "epoch": 1785} {"train_loss": -38.14705276489258, "global_step": 216074, "epoch": 1785} {"train_loss": -41.7288703918457, "global_step": 216075, "epoch": 1785} {"train_loss": -40.441165924072266, "global_step": 216076, "epoch": 1785} {"train_loss": -40.06227111816406, "global_step": 216077, "epoch": 1785} {"train_loss": -38.1437873840332, "global_step": 216078, "epoch": 1785} {"train_loss": -39.89683151245117, "global_step": 216079, "epoch": 1785} {"train_loss": -40.6077995300293, "global_step": 216080, "epoch": 1785} {"train_loss": -40.35067367553711, "global_step": 216081, "epoch": 1785} {"train_loss": -41.30886459350586, "global_step": 216082, "epoch": 1785} {"train_loss": -40.8005485534668, "global_step": 216083, "epoch": 1785} {"train_loss": -41.17816162109375, "global_step": 216084, "epoch": 1785} {"train_loss": -39.32943344116211, "global_step": 216085, "epoch": 1785} {"train_loss": -40.9550895690918, "global_step": 216086, "epoch": 1785} {"train_loss": -40.19483947753906, "global_step": 216087, "epoch": 1785} {"train_loss": -38.323333740234375, "global_step": 216088, "epoch": 1785} {"train_loss": -38.59778594970703, "global_step": 216089, "epoch": 1785} {"train_loss": -39.94758224487305, "global_step": 216090, "epoch": 1785} {"train_loss": -38.81874084472656, "global_step": 216091, "epoch": 1785} {"train_loss": -39.0160026550293, "global_step": 216092, "epoch": 1785} {"train_loss": -38.7735481262207, "global_step": 216093, "epoch": 1785} {"train_loss": -41.4932861328125, "global_step": 216094, "epoch": 1785} {"train_loss": -34.87018585205078, "global_step": 216095, "epoch": 1785} {"train_loss": -37.55607986450195, "global_step": 216096, "epoch": 1785} {"train_loss": -37.28687286376953, "global_step": 216097, "epoch": 1785} {"train_loss": -39.018890380859375, "global_step": 216098, "epoch": 1785} {"train_loss": -36.81022262573242, "global_step": 216099, "epoch": 1785} {"train_loss": -37.45449447631836, "global_step": 216100, "epoch": 1785} {"train_loss": -38.313270568847656, "global_step": 216101, "epoch": 1785} {"train_loss": -38.98822784423828, "global_step": 216102, "epoch": 1785} {"train_loss": -37.05078125, "global_step": 216103, "epoch": 1785} {"train_loss": -20.779966354370117, "global_step": 216104, "epoch": 1785} {"train_loss": -40.502850698045464, "global_step": 216105, "epoch": 1785, "val_loss": 2660878.75} {"train_loss": -34.46847152709961, "global_step": 216106, "epoch": 1786} {"train_loss": -39.25988006591797, "global_step": 216107, "epoch": 1786} {"train_loss": -37.8758659362793, "global_step": 216108, "epoch": 1786} {"train_loss": -39.20551681518555, "global_step": 216109, "epoch": 1786} {"train_loss": -39.01334762573242, "global_step": 216110, "epoch": 1786} {"train_loss": -38.31428909301758, "global_step": 216111, "epoch": 1786} {"train_loss": -39.886470794677734, "global_step": 216112, "epoch": 1786} {"train_loss": -34.84450912475586, "global_step": 216113, "epoch": 1786} {"train_loss": -37.86357116699219, "global_step": 216114, "epoch": 1786} {"train_loss": -38.47747802734375, "global_step": 216115, "epoch": 1786} {"train_loss": -39.03104782104492, "global_step": 216116, "epoch": 1786} {"train_loss": -38.00456237792969, "global_step": 216117, "epoch": 1786} {"train_loss": -39.99859619140625, "global_step": 216118, "epoch": 1786} {"train_loss": -39.62085723876953, "global_step": 216119, "epoch": 1786} {"train_loss": -39.43670654296875, "global_step": 216120, "epoch": 1786} {"train_loss": -39.92643356323242, "global_step": 216121, "epoch": 1786} {"train_loss": -39.56865310668945, "global_step": 216122, "epoch": 1786} {"train_loss": -38.02993392944336, "global_step": 216123, "epoch": 1786} {"train_loss": -40.151878356933594, "global_step": 216124, "epoch": 1786} {"train_loss": -40.3727912902832, "global_step": 216125, "epoch": 1786} {"train_loss": -35.59029006958008, "global_step": 216126, "epoch": 1786} {"train_loss": -37.989654541015625, "global_step": 216127, "epoch": 1786} {"train_loss": -40.217529296875, "global_step": 216128, "epoch": 1786} {"train_loss": -40.36187744140625, "global_step": 216129, "epoch": 1786} {"train_loss": -39.20023727416992, "global_step": 216130, "epoch": 1786} {"train_loss": -39.91559600830078, "global_step": 216131, "epoch": 1786} {"train_loss": -40.38709259033203, "global_step": 216132, "epoch": 1786} {"train_loss": -39.91071701049805, "global_step": 216133, "epoch": 1786} {"train_loss": -40.523765563964844, "global_step": 216134, "epoch": 1786} {"train_loss": -40.90651321411133, "global_step": 216135, "epoch": 1786} {"train_loss": -40.1191291809082, "global_step": 216136, "epoch": 1786} {"train_loss": -40.42033004760742, "global_step": 216137, "epoch": 1786} {"train_loss": -39.4969596862793, "global_step": 216138, "epoch": 1786} {"train_loss": -40.60836410522461, "global_step": 216139, "epoch": 1786} {"train_loss": -40.00419235229492, "global_step": 216140, "epoch": 1786} {"train_loss": -40.35215377807617, "global_step": 216141, "epoch": 1786} {"train_loss": -40.78620147705078, "global_step": 216142, "epoch": 1786} {"train_loss": -40.40488815307617, "global_step": 216143, "epoch": 1786} {"train_loss": -38.519012451171875, "global_step": 216144, "epoch": 1786} {"train_loss": -39.71407699584961, "global_step": 216145, "epoch": 1786} {"train_loss": -41.14057159423828, "global_step": 216146, "epoch": 1786} {"train_loss": -40.93487548828125, "global_step": 216147, "epoch": 1786} {"train_loss": -39.295101165771484, "global_step": 216148, "epoch": 1786} {"train_loss": -40.41410827636719, "global_step": 216149, "epoch": 1786} {"train_loss": -41.36722946166992, "global_step": 216150, "epoch": 1786} {"train_loss": -41.322418212890625, "global_step": 216151, "epoch": 1786} {"train_loss": -41.35733413696289, "global_step": 216152, "epoch": 1786} {"train_loss": -41.09208297729492, "global_step": 216153, "epoch": 1786} {"train_loss": -39.90876388549805, "global_step": 216154, "epoch": 1786} {"train_loss": -40.20968246459961, "global_step": 216155, "epoch": 1786} {"train_loss": -39.54938888549805, "global_step": 216156, "epoch": 1786} {"train_loss": -41.00529098510742, "global_step": 216157, "epoch": 1786} {"train_loss": -40.76383590698242, "global_step": 216158, "epoch": 1786} {"train_loss": -39.91069030761719, "global_step": 216159, "epoch": 1786} {"train_loss": -41.574951171875, "global_step": 216160, "epoch": 1786} {"train_loss": -40.968318939208984, "global_step": 216161, "epoch": 1786} {"train_loss": -41.20111846923828, "global_step": 216162, "epoch": 1786} {"train_loss": -41.448665618896484, "global_step": 216163, "epoch": 1786} {"train_loss": -40.578407287597656, "global_step": 216164, "epoch": 1786} {"train_loss": -41.799720764160156, "global_step": 216165, "epoch": 1786} {"train_loss": -41.4417839050293, "global_step": 216166, "epoch": 1786} {"train_loss": -40.91103744506836, "global_step": 216167, "epoch": 1786} {"train_loss": -41.162349700927734, "global_step": 216168, "epoch": 1786} {"train_loss": -41.1458854675293, "global_step": 216169, "epoch": 1786} {"train_loss": -41.4334831237793, "global_step": 216170, "epoch": 1786} {"train_loss": -40.90678024291992, "global_step": 216171, "epoch": 1786} {"train_loss": -40.17166519165039, "global_step": 216172, "epoch": 1786} {"train_loss": -41.96335983276367, "global_step": 216173, "epoch": 1786} {"train_loss": -41.71296310424805, "global_step": 216174, "epoch": 1786} {"train_loss": -40.5592155456543, "global_step": 216175, "epoch": 1786} {"train_loss": -38.449859619140625, "global_step": 216176, "epoch": 1786} {"train_loss": -41.474609375, "global_step": 216177, "epoch": 1786} {"train_loss": -40.6044807434082, "global_step": 216178, "epoch": 1786} {"train_loss": -41.721534729003906, "global_step": 216179, "epoch": 1786} {"train_loss": -40.67300033569336, "global_step": 216180, "epoch": 1786} {"train_loss": -41.47652053833008, "global_step": 216181, "epoch": 1786} {"train_loss": -41.54994583129883, "global_step": 216182, "epoch": 1786} {"train_loss": -40.59159469604492, "global_step": 216183, "epoch": 1786} {"train_loss": -42.068233489990234, "global_step": 216184, "epoch": 1786} {"train_loss": -40.97418975830078, "global_step": 216185, "epoch": 1786} {"train_loss": -40.24802780151367, "global_step": 216186, "epoch": 1786} {"train_loss": -41.174896240234375, "global_step": 216187, "epoch": 1786} {"train_loss": -41.98445129394531, "global_step": 216188, "epoch": 1786} {"train_loss": -39.45736312866211, "global_step": 216189, "epoch": 1786} {"train_loss": -42.2681770324707, "global_step": 216190, "epoch": 1786} {"train_loss": -41.624603271484375, "global_step": 216191, "epoch": 1786} {"train_loss": -41.50049591064453, "global_step": 216192, "epoch": 1786} {"train_loss": -39.96403121948242, "global_step": 216193, "epoch": 1786} {"train_loss": -41.726497650146484, "global_step": 216194, "epoch": 1786} {"train_loss": -41.17922592163086, "global_step": 216195, "epoch": 1786} {"train_loss": -41.067657470703125, "global_step": 216196, "epoch": 1786} {"train_loss": -41.47556686401367, "global_step": 216197, "epoch": 1786} {"train_loss": -40.98232650756836, "global_step": 216198, "epoch": 1786} {"train_loss": -40.83668899536133, "global_step": 216199, "epoch": 1786} {"train_loss": -41.31528854370117, "global_step": 216200, "epoch": 1786} {"train_loss": -40.758544921875, "global_step": 216201, "epoch": 1786} {"train_loss": -41.29190444946289, "global_step": 216202, "epoch": 1786} {"train_loss": -40.6254768371582, "global_step": 216203, "epoch": 1786} {"train_loss": -41.661075592041016, "global_step": 216204, "epoch": 1786} {"train_loss": -42.35416030883789, "global_step": 216205, "epoch": 1786} {"train_loss": -41.03336715698242, "global_step": 216206, "epoch": 1786} {"train_loss": -42.086517333984375, "global_step": 216207, "epoch": 1786} {"train_loss": -42.10186767578125, "global_step": 216208, "epoch": 1786} {"train_loss": -40.695003509521484, "global_step": 216209, "epoch": 1786} {"train_loss": -41.34748458862305, "global_step": 216210, "epoch": 1786} {"train_loss": -41.189476013183594, "global_step": 216211, "epoch": 1786} {"train_loss": -39.802127838134766, "global_step": 216212, "epoch": 1786} {"train_loss": -37.24678421020508, "global_step": 216213, "epoch": 1786} {"train_loss": -38.70262908935547, "global_step": 216214, "epoch": 1786} {"train_loss": -41.75356674194336, "global_step": 216215, "epoch": 1786} {"train_loss": -39.25044631958008, "global_step": 216216, "epoch": 1786} {"train_loss": -35.50283432006836, "global_step": 216217, "epoch": 1786} {"train_loss": -39.3718147277832, "global_step": 216218, "epoch": 1786} {"train_loss": -41.4034309387207, "global_step": 216219, "epoch": 1786} {"train_loss": -36.86345291137695, "global_step": 216220, "epoch": 1786} {"train_loss": -38.87777328491211, "global_step": 216221, "epoch": 1786} {"train_loss": -41.21104431152344, "global_step": 216222, "epoch": 1786} {"train_loss": -38.484657287597656, "global_step": 216223, "epoch": 1786} {"train_loss": -39.98584747314453, "global_step": 216224, "epoch": 1786} {"train_loss": -41.79132080078125, "global_step": 216225, "epoch": 1786} {"train_loss": -40.23065462979403, "global_step": 216226, "epoch": 1786, "val_loss": 2655496.5} {"train_loss": -40.412776947021484, "global_step": 216227, "epoch": 1787} {"train_loss": -40.776702880859375, "global_step": 216228, "epoch": 1787} {"train_loss": -41.58159255981445, "global_step": 216229, "epoch": 1787} {"train_loss": -41.49680709838867, "global_step": 216230, "epoch": 1787} {"train_loss": -39.440608978271484, "global_step": 216231, "epoch": 1787} {"train_loss": -39.8985595703125, "global_step": 216232, "epoch": 1787} {"train_loss": -41.19734573364258, "global_step": 216233, "epoch": 1787} {"train_loss": -41.138484954833984, "global_step": 216234, "epoch": 1787} {"train_loss": -40.8852424621582, "global_step": 216235, "epoch": 1787} {"train_loss": -39.38114929199219, "global_step": 216236, "epoch": 1787} {"train_loss": -41.63225555419922, "global_step": 216237, "epoch": 1787} {"train_loss": -41.41825485229492, "global_step": 216238, "epoch": 1787} {"train_loss": -41.63381576538086, "global_step": 216239, "epoch": 1787} {"train_loss": -41.20747756958008, "global_step": 216240, "epoch": 1787} {"train_loss": -41.55899429321289, "global_step": 216241, "epoch": 1787} {"train_loss": -41.40911102294922, "global_step": 216242, "epoch": 1787} {"train_loss": -40.9755859375, "global_step": 216243, "epoch": 1787} {"train_loss": -41.88897705078125, "global_step": 216244, "epoch": 1787} {"train_loss": -40.963958740234375, "global_step": 216245, "epoch": 1787} {"train_loss": -41.00510025024414, "global_step": 216246, "epoch": 1787} {"train_loss": -41.7116813659668, "global_step": 216247, "epoch": 1787} {"train_loss": -40.942012786865234, "global_step": 216248, "epoch": 1787} {"train_loss": -40.477996826171875, "global_step": 216249, "epoch": 1787} {"train_loss": -41.54914474487305, "global_step": 216250, "epoch": 1787} {"train_loss": -41.77875900268555, "global_step": 216251, "epoch": 1787} {"train_loss": -40.9285888671875, "global_step": 216252, "epoch": 1787} {"train_loss": -41.89427185058594, "global_step": 216253, "epoch": 1787} {"train_loss": -41.931427001953125, "global_step": 216254, "epoch": 1787} {"train_loss": -41.89009475708008, "global_step": 216255, "epoch": 1787} {"train_loss": -42.44231414794922, "global_step": 216256, "epoch": 1787} {"train_loss": -41.61617660522461, "global_step": 216257, "epoch": 1787} {"train_loss": -41.99983596801758, "global_step": 216258, "epoch": 1787} {"train_loss": -42.181392669677734, "global_step": 216259, "epoch": 1787} {"train_loss": -41.74270248413086, "global_step": 216260, "epoch": 1787} {"train_loss": -42.365509033203125, "global_step": 216261, "epoch": 1787} {"train_loss": -42.4459342956543, "global_step": 216262, "epoch": 1787} {"train_loss": -42.310630798339844, "global_step": 216263, "epoch": 1787} {"train_loss": -42.385887145996094, "global_step": 216264, "epoch": 1787} {"train_loss": -42.047218322753906, "global_step": 216265, "epoch": 1787} {"train_loss": -42.40253448486328, "global_step": 216266, "epoch": 1787} {"train_loss": -41.8350830078125, "global_step": 216267, "epoch": 1787} {"train_loss": -41.76700210571289, "global_step": 216268, "epoch": 1787} {"train_loss": -42.36470413208008, "global_step": 216269, "epoch": 1787} {"train_loss": -42.07649230957031, "global_step": 216270, "epoch": 1787} {"train_loss": -42.51132583618164, "global_step": 216271, "epoch": 1787} {"train_loss": -42.388973236083984, "global_step": 216272, "epoch": 1787} {"train_loss": -40.97939682006836, "global_step": 216273, "epoch": 1787} {"train_loss": -41.85670471191406, "global_step": 216274, "epoch": 1787} {"train_loss": -42.3920783996582, "global_step": 216275, "epoch": 1787} {"train_loss": -42.22388458251953, "global_step": 216276, "epoch": 1787} {"train_loss": -42.4042854309082, "global_step": 216277, "epoch": 1787} {"train_loss": -41.202571868896484, "global_step": 216278, "epoch": 1787} {"train_loss": -40.33941650390625, "global_step": 216279, "epoch": 1787} {"train_loss": -41.452388763427734, "global_step": 216280, "epoch": 1787} {"train_loss": -41.42348098754883, "global_step": 216281, "epoch": 1787} {"train_loss": -41.92519760131836, "global_step": 216282, "epoch": 1787} {"train_loss": -41.0510139465332, "global_step": 216283, "epoch": 1787} {"train_loss": -41.229827880859375, "global_step": 216284, "epoch": 1787} {"train_loss": -42.02492904663086, "global_step": 216285, "epoch": 1787} {"train_loss": -41.18911361694336, "global_step": 216286, "epoch": 1787} {"train_loss": -41.28916549682617, "global_step": 216287, "epoch": 1787} {"train_loss": -39.20595169067383, "global_step": 216288, "epoch": 1787} {"train_loss": -38.46820831298828, "global_step": 216289, "epoch": 1787} {"train_loss": -39.774471282958984, "global_step": 216290, "epoch": 1787} {"train_loss": -38.80125045776367, "global_step": 216291, "epoch": 1787} {"train_loss": -41.02150344848633, "global_step": 216292, "epoch": 1787} {"train_loss": -41.916229248046875, "global_step": 216293, "epoch": 1787} {"train_loss": -40.88208770751953, "global_step": 216294, "epoch": 1787} {"train_loss": -40.52027130126953, "global_step": 216295, "epoch": 1787} {"train_loss": -36.08502197265625, "global_step": 216296, "epoch": 1787} {"train_loss": -38.0051155090332, "global_step": 216297, "epoch": 1787} {"train_loss": -38.353511810302734, "global_step": 216298, "epoch": 1787} {"train_loss": -40.26496887207031, "global_step": 216299, "epoch": 1787} {"train_loss": -38.53154373168945, "global_step": 216300, "epoch": 1787} {"train_loss": -38.55464553833008, "global_step": 216301, "epoch": 1787} {"train_loss": -40.04762649536133, "global_step": 216302, "epoch": 1787} {"train_loss": -39.233577728271484, "global_step": 216303, "epoch": 1787} {"train_loss": -39.89657211303711, "global_step": 216304, "epoch": 1787} {"train_loss": -39.4581184387207, "global_step": 216305, "epoch": 1787} {"train_loss": -39.78743362426758, "global_step": 216306, "epoch": 1787} {"train_loss": -40.977577209472656, "global_step": 216307, "epoch": 1787} {"train_loss": -40.91181564331055, "global_step": 216308, "epoch": 1787} {"train_loss": -39.2672119140625, "global_step": 216309, "epoch": 1787} {"train_loss": -40.98826217651367, "global_step": 216310, "epoch": 1787} {"train_loss": -40.65778732299805, "global_step": 216311, "epoch": 1787} {"train_loss": -40.08185577392578, "global_step": 216312, "epoch": 1787} {"train_loss": -40.96433639526367, "global_step": 216313, "epoch": 1787} {"train_loss": -39.34843826293945, "global_step": 216314, "epoch": 1787} {"train_loss": -40.13163375854492, "global_step": 216315, "epoch": 1787} {"train_loss": -41.5884895324707, "global_step": 216316, "epoch": 1787} {"train_loss": -41.12140655517578, "global_step": 216317, "epoch": 1787} {"train_loss": -41.504825592041016, "global_step": 216318, "epoch": 1787} {"train_loss": -41.4986457824707, "global_step": 216319, "epoch": 1787} {"train_loss": -41.64894485473633, "global_step": 216320, "epoch": 1787} {"train_loss": -41.34082794189453, "global_step": 216321, "epoch": 1787} {"train_loss": -40.392704010009766, "global_step": 216322, "epoch": 1787} {"train_loss": -42.00759506225586, "global_step": 216323, "epoch": 1787} {"train_loss": -41.25303268432617, "global_step": 216324, "epoch": 1787} {"train_loss": -41.4798583984375, "global_step": 216325, "epoch": 1787} {"train_loss": -41.43716812133789, "global_step": 216326, "epoch": 1787} {"train_loss": -41.1236572265625, "global_step": 216327, "epoch": 1787} {"train_loss": -41.04457092285156, "global_step": 216328, "epoch": 1787} {"train_loss": -41.74917221069336, "global_step": 216329, "epoch": 1787} {"train_loss": -41.78033447265625, "global_step": 216330, "epoch": 1787} {"train_loss": -41.41862869262695, "global_step": 216331, "epoch": 1787} {"train_loss": -41.665771484375, "global_step": 216332, "epoch": 1787} {"train_loss": -41.09243392944336, "global_step": 216333, "epoch": 1787} {"train_loss": -40.79999542236328, "global_step": 216334, "epoch": 1787} {"train_loss": -41.652732849121094, "global_step": 216335, "epoch": 1787} {"train_loss": -41.78208923339844, "global_step": 216336, "epoch": 1787} {"train_loss": -42.17312240600586, "global_step": 216337, "epoch": 1787} {"train_loss": -41.99443435668945, "global_step": 216338, "epoch": 1787} {"train_loss": -42.34768295288086, "global_step": 216339, "epoch": 1787} {"train_loss": -41.645172119140625, "global_step": 216340, "epoch": 1787} {"train_loss": -40.235469818115234, "global_step": 216341, "epoch": 1787} {"train_loss": -42.18760299682617, "global_step": 216342, "epoch": 1787} {"train_loss": -41.7649040222168, "global_step": 216343, "epoch": 1787} {"train_loss": -41.808937072753906, "global_step": 216344, "epoch": 1787} {"train_loss": -42.25529098510742, "global_step": 216345, "epoch": 1787} {"train_loss": -40.246253967285156, "global_step": 216346, "epoch": 1787} {"train_loss": -41.096981647586034, "global_step": 216347, "epoch": 1787, "val_loss": 2833507.25} {"train_loss": -42.2108154296875, "global_step": 216348, "epoch": 1788} {"train_loss": -42.642147064208984, "global_step": 216349, "epoch": 1788} {"train_loss": -39.562843322753906, "global_step": 216350, "epoch": 1788} {"train_loss": -40.6233024597168, "global_step": 216351, "epoch": 1788} {"train_loss": -41.71383285522461, "global_step": 216352, "epoch": 1788} {"train_loss": -42.047698974609375, "global_step": 216353, "epoch": 1788} {"train_loss": -42.18224334716797, "global_step": 216354, "epoch": 1788} {"train_loss": -41.9087028503418, "global_step": 216355, "epoch": 1788} {"train_loss": -40.38236999511719, "global_step": 216356, "epoch": 1788} {"train_loss": -42.01308822631836, "global_step": 216357, "epoch": 1788} {"train_loss": -41.35432434082031, "global_step": 216358, "epoch": 1788} {"train_loss": -41.41372299194336, "global_step": 216359, "epoch": 1788} {"train_loss": -41.9515495300293, "global_step": 216360, "epoch": 1788} {"train_loss": -41.66278839111328, "global_step": 216361, "epoch": 1788} {"train_loss": -41.770599365234375, "global_step": 216362, "epoch": 1788} {"train_loss": -42.100433349609375, "global_step": 216363, "epoch": 1788} {"train_loss": -41.1009635925293, "global_step": 216364, "epoch": 1788} {"train_loss": -42.30720138549805, "global_step": 216365, "epoch": 1788} {"train_loss": -42.47732162475586, "global_step": 216366, "epoch": 1788} {"train_loss": -41.56997299194336, "global_step": 216367, "epoch": 1788} {"train_loss": -42.02802276611328, "global_step": 216368, "epoch": 1788} {"train_loss": -41.236541748046875, "global_step": 216369, "epoch": 1788} {"train_loss": -42.53037643432617, "global_step": 216370, "epoch": 1788} {"train_loss": -42.04667282104492, "global_step": 216371, "epoch": 1788} {"train_loss": -41.575469970703125, "global_step": 216372, "epoch": 1788} {"train_loss": -42.16584396362305, "global_step": 216373, "epoch": 1788} {"train_loss": -40.724395751953125, "global_step": 216374, "epoch": 1788} {"train_loss": -38.75820541381836, "global_step": 216375, "epoch": 1788} {"train_loss": -41.29050827026367, "global_step": 216376, "epoch": 1788} {"train_loss": -42.04460525512695, "global_step": 216377, "epoch": 1788} {"train_loss": -41.52651596069336, "global_step": 216378, "epoch": 1788} {"train_loss": -41.009193420410156, "global_step": 216379, "epoch": 1788} {"train_loss": -42.07457733154297, "global_step": 216380, "epoch": 1788} {"train_loss": -41.86306381225586, "global_step": 216381, "epoch": 1788} {"train_loss": -41.58431625366211, "global_step": 216382, "epoch": 1788} {"train_loss": -41.25532913208008, "global_step": 216383, "epoch": 1788} {"train_loss": -40.89360809326172, "global_step": 216384, "epoch": 1788} {"train_loss": -41.695343017578125, "global_step": 216385, "epoch": 1788} {"train_loss": -41.24253463745117, "global_step": 216386, "epoch": 1788} {"train_loss": -40.48224639892578, "global_step": 216387, "epoch": 1788} {"train_loss": -38.938720703125, "global_step": 216388, "epoch": 1788} {"train_loss": -40.47377014160156, "global_step": 216389, "epoch": 1788} {"train_loss": -41.49763107299805, "global_step": 216390, "epoch": 1788} {"train_loss": -42.0685920715332, "global_step": 216391, "epoch": 1788} {"train_loss": -42.03487014770508, "global_step": 216392, "epoch": 1788} {"train_loss": -41.06948471069336, "global_step": 216393, "epoch": 1788} {"train_loss": -41.594268798828125, "global_step": 216394, "epoch": 1788} {"train_loss": -41.476863861083984, "global_step": 216395, "epoch": 1788} {"train_loss": -40.55436325073242, "global_step": 216396, "epoch": 1788} {"train_loss": -40.59937286376953, "global_step": 216397, "epoch": 1788} {"train_loss": -41.822601318359375, "global_step": 216398, "epoch": 1788} {"train_loss": -38.74671173095703, "global_step": 216399, "epoch": 1788} {"train_loss": -40.64229965209961, "global_step": 216400, "epoch": 1788} {"train_loss": -40.685546875, "global_step": 216401, "epoch": 1788} {"train_loss": -42.1078987121582, "global_step": 216402, "epoch": 1788} {"train_loss": -40.162940979003906, "global_step": 216403, "epoch": 1788} {"train_loss": -40.99994659423828, "global_step": 216404, "epoch": 1788} {"train_loss": -42.373497009277344, "global_step": 216405, "epoch": 1788} {"train_loss": -41.71535873413086, "global_step": 216406, "epoch": 1788} {"train_loss": -41.71060562133789, "global_step": 216407, "epoch": 1788} {"train_loss": -41.3818359375, "global_step": 216408, "epoch": 1788} {"train_loss": -40.3924560546875, "global_step": 216409, "epoch": 1788} {"train_loss": -41.84401321411133, "global_step": 216410, "epoch": 1788} {"train_loss": -40.961212158203125, "global_step": 216411, "epoch": 1788} {"train_loss": -41.83378219604492, "global_step": 216412, "epoch": 1788} {"train_loss": -41.31078338623047, "global_step": 216413, "epoch": 1788} {"train_loss": -41.33726119995117, "global_step": 216414, "epoch": 1788} {"train_loss": -41.95589065551758, "global_step": 216415, "epoch": 1788} {"train_loss": -40.9605598449707, "global_step": 216416, "epoch": 1788} {"train_loss": -41.62553024291992, "global_step": 216417, "epoch": 1788} {"train_loss": -41.93367385864258, "global_step": 216418, "epoch": 1788} {"train_loss": -42.25021743774414, "global_step": 216419, "epoch": 1788} {"train_loss": -41.944252014160156, "global_step": 216420, "epoch": 1788} {"train_loss": -41.036983489990234, "global_step": 216421, "epoch": 1788} {"train_loss": -41.50602340698242, "global_step": 216422, "epoch": 1788} {"train_loss": -41.91347122192383, "global_step": 216423, "epoch": 1788} {"train_loss": -41.24451446533203, "global_step": 216424, "epoch": 1788} {"train_loss": -41.42301940917969, "global_step": 216425, "epoch": 1788} {"train_loss": -41.455467224121094, "global_step": 216426, "epoch": 1788} {"train_loss": -42.24399185180664, "global_step": 216427, "epoch": 1788} {"train_loss": -41.644935607910156, "global_step": 216428, "epoch": 1788} {"train_loss": -41.874664306640625, "global_step": 216429, "epoch": 1788} {"train_loss": -42.25367736816406, "global_step": 216430, "epoch": 1788} {"train_loss": -41.7524299621582, "global_step": 216431, "epoch": 1788} {"train_loss": -41.930721282958984, "global_step": 216432, "epoch": 1788} {"train_loss": -41.82886505126953, "global_step": 216433, "epoch": 1788} {"train_loss": -41.724063873291016, "global_step": 216434, "epoch": 1788} {"train_loss": -41.8186149597168, "global_step": 216435, "epoch": 1788} {"train_loss": -42.18146514892578, "global_step": 216436, "epoch": 1788} {"train_loss": -41.975337982177734, "global_step": 216437, "epoch": 1788} {"train_loss": -40.518802642822266, "global_step": 216438, "epoch": 1788} {"train_loss": -40.97201156616211, "global_step": 216439, "epoch": 1788} {"train_loss": -38.63045120239258, "global_step": 216440, "epoch": 1788} {"train_loss": -40.284942626953125, "global_step": 216441, "epoch": 1788} {"train_loss": -40.21409225463867, "global_step": 216442, "epoch": 1788} {"train_loss": -39.64547348022461, "global_step": 216443, "epoch": 1788} {"train_loss": -39.79221725463867, "global_step": 216444, "epoch": 1788} {"train_loss": -41.271759033203125, "global_step": 216445, "epoch": 1788} {"train_loss": -38.735713958740234, "global_step": 216446, "epoch": 1788} {"train_loss": -39.67441177368164, "global_step": 216447, "epoch": 1788} {"train_loss": -35.44092559814453, "global_step": 216448, "epoch": 1788} {"train_loss": -38.49026107788086, "global_step": 216449, "epoch": 1788} {"train_loss": -39.89594650268555, "global_step": 216450, "epoch": 1788} {"train_loss": -41.884342193603516, "global_step": 216451, "epoch": 1788} {"train_loss": -40.31144332885742, "global_step": 216452, "epoch": 1788} {"train_loss": -39.253475189208984, "global_step": 216453, "epoch": 1788} {"train_loss": -42.05156707763672, "global_step": 216454, "epoch": 1788} {"train_loss": -40.07207107543945, "global_step": 216455, "epoch": 1788} {"train_loss": -41.75386428833008, "global_step": 216456, "epoch": 1788} {"train_loss": -41.48093795776367, "global_step": 216457, "epoch": 1788} {"train_loss": -39.848140716552734, "global_step": 216458, "epoch": 1788} {"train_loss": -41.4161491394043, "global_step": 216459, "epoch": 1788} {"train_loss": -41.691986083984375, "global_step": 216460, "epoch": 1788} {"train_loss": -31.099218368530273, "global_step": 216461, "epoch": 1788} {"train_loss": -40.5316047668457, "global_step": 216462, "epoch": 1788} {"train_loss": -40.75056076049805, "global_step": 216463, "epoch": 1788} {"train_loss": -39.47684860229492, "global_step": 216464, "epoch": 1788} {"train_loss": -41.310935974121094, "global_step": 216465, "epoch": 1788} {"train_loss": -39.74021530151367, "global_step": 216466, "epoch": 1788} {"train_loss": -40.977359771728516, "global_step": 216467, "epoch": 1788} {"train_loss": -41.06490254993281, "global_step": 216468, "epoch": 1788, "val_loss": 2779511.0} {"train_loss": -39.47674560546875, "global_step": 216469, "epoch": 1789} {"train_loss": -40.7526741027832, "global_step": 216470, "epoch": 1789} {"train_loss": -31.8066349029541, "global_step": 216471, "epoch": 1789} {"train_loss": -41.182044982910156, "global_step": 216472, "epoch": 1789} {"train_loss": -38.83284378051758, "global_step": 216473, "epoch": 1789} {"train_loss": -41.07550811767578, "global_step": 216474, "epoch": 1789} {"train_loss": -39.60556411743164, "global_step": 216475, "epoch": 1789} {"train_loss": -41.501888275146484, "global_step": 216476, "epoch": 1789} {"train_loss": -41.84003829956055, "global_step": 216477, "epoch": 1789} {"train_loss": -40.69968795776367, "global_step": 216478, "epoch": 1789} {"train_loss": -37.77293014526367, "global_step": 216479, "epoch": 1789} {"train_loss": -40.668121337890625, "global_step": 216480, "epoch": 1789} {"train_loss": -41.17308807373047, "global_step": 216481, "epoch": 1789} {"train_loss": -40.08894729614258, "global_step": 216482, "epoch": 1789} {"train_loss": -39.37478256225586, "global_step": 216483, "epoch": 1789} {"train_loss": -40.17335891723633, "global_step": 216484, "epoch": 1789} {"train_loss": -41.55852127075195, "global_step": 216485, "epoch": 1789} {"train_loss": -35.166259765625, "global_step": 216486, "epoch": 1789} {"train_loss": -41.018768310546875, "global_step": 216487, "epoch": 1789} {"train_loss": -41.802032470703125, "global_step": 216488, "epoch": 1789} {"train_loss": -39.6116828918457, "global_step": 216489, "epoch": 1789} {"train_loss": -40.29510498046875, "global_step": 216490, "epoch": 1789} {"train_loss": -40.14253234863281, "global_step": 216491, "epoch": 1789} {"train_loss": -40.30887985229492, "global_step": 216492, "epoch": 1789} {"train_loss": -41.75339889526367, "global_step": 216493, "epoch": 1789} {"train_loss": -40.78480529785156, "global_step": 216494, "epoch": 1789} {"train_loss": -41.51848602294922, "global_step": 216495, "epoch": 1789} {"train_loss": -41.374488830566406, "global_step": 216496, "epoch": 1789} {"train_loss": -37.42477035522461, "global_step": 216497, "epoch": 1789} {"train_loss": -38.089195251464844, "global_step": 216498, "epoch": 1789} {"train_loss": -37.91312026977539, "global_step": 216499, "epoch": 1789} {"train_loss": -41.48698806762695, "global_step": 216500, "epoch": 1789} {"train_loss": -41.90760040283203, "global_step": 216501, "epoch": 1789} {"train_loss": -40.12281036376953, "global_step": 216502, "epoch": 1789} {"train_loss": -39.3109130859375, "global_step": 216503, "epoch": 1789} {"train_loss": -41.748409271240234, "global_step": 216504, "epoch": 1789} {"train_loss": -35.39265441894531, "global_step": 216505, "epoch": 1789} {"train_loss": -40.98968505859375, "global_step": 216506, "epoch": 1789} {"train_loss": -41.12629699707031, "global_step": 216507, "epoch": 1789} {"train_loss": -41.09647750854492, "global_step": 216508, "epoch": 1789} {"train_loss": -40.68293380737305, "global_step": 216509, "epoch": 1789} {"train_loss": -39.40226364135742, "global_step": 216510, "epoch": 1789} {"train_loss": -41.09623336791992, "global_step": 216511, "epoch": 1789} {"train_loss": -41.01522445678711, "global_step": 216512, "epoch": 1789} {"train_loss": -40.870277404785156, "global_step": 216513, "epoch": 1789} {"train_loss": -41.25068283081055, "global_step": 216514, "epoch": 1789} {"train_loss": -41.09074401855469, "global_step": 216515, "epoch": 1789} {"train_loss": -40.65644454956055, "global_step": 216516, "epoch": 1789} {"train_loss": -41.40145492553711, "global_step": 216517, "epoch": 1789} {"train_loss": -39.773075103759766, "global_step": 216518, "epoch": 1789} {"train_loss": -40.106346130371094, "global_step": 216519, "epoch": 1789} {"train_loss": -40.46413803100586, "global_step": 216520, "epoch": 1789} {"train_loss": -41.881324768066406, "global_step": 216521, "epoch": 1789} {"train_loss": -41.65361404418945, "global_step": 216522, "epoch": 1789} {"train_loss": -41.672359466552734, "global_step": 216523, "epoch": 1789} {"train_loss": -41.975067138671875, "global_step": 216524, "epoch": 1789} {"train_loss": -41.990394592285156, "global_step": 216525, "epoch": 1789} {"train_loss": -42.16099166870117, "global_step": 216526, "epoch": 1789} {"train_loss": -41.11261749267578, "global_step": 216527, "epoch": 1789} {"train_loss": -38.638153076171875, "global_step": 216528, "epoch": 1789} {"train_loss": -41.826416015625, "global_step": 216529, "epoch": 1789} {"train_loss": -41.423439025878906, "global_step": 216530, "epoch": 1789} {"train_loss": -41.97108840942383, "global_step": 216531, "epoch": 1789} {"train_loss": -42.115360260009766, "global_step": 216532, "epoch": 1789} {"train_loss": -41.67861557006836, "global_step": 216533, "epoch": 1789} {"train_loss": -41.408660888671875, "global_step": 216534, "epoch": 1789} {"train_loss": -41.22806167602539, "global_step": 216535, "epoch": 1789} {"train_loss": -41.74142837524414, "global_step": 216536, "epoch": 1789} {"train_loss": -37.72967529296875, "global_step": 216537, "epoch": 1789} {"train_loss": -41.4603157043457, "global_step": 216538, "epoch": 1789} {"train_loss": -41.93047332763672, "global_step": 216539, "epoch": 1789} {"train_loss": -41.678504943847656, "global_step": 216540, "epoch": 1789} {"train_loss": -41.705352783203125, "global_step": 216541, "epoch": 1789} {"train_loss": -41.911006927490234, "global_step": 216542, "epoch": 1789} {"train_loss": -41.45974349975586, "global_step": 216543, "epoch": 1789} {"train_loss": -42.273773193359375, "global_step": 216544, "epoch": 1789} {"train_loss": -41.02543640136719, "global_step": 216545, "epoch": 1789} {"train_loss": -41.10757064819336, "global_step": 216546, "epoch": 1789} {"train_loss": -41.49050521850586, "global_step": 216547, "epoch": 1789} {"train_loss": -42.28594207763672, "global_step": 216548, "epoch": 1789} {"train_loss": -40.69865036010742, "global_step": 216549, "epoch": 1789} {"train_loss": -41.576778411865234, "global_step": 216550, "epoch": 1789} {"train_loss": -41.54263687133789, "global_step": 216551, "epoch": 1789} {"train_loss": -42.194664001464844, "global_step": 216552, "epoch": 1789} {"train_loss": -41.04315185546875, "global_step": 216553, "epoch": 1789} {"train_loss": -41.432403564453125, "global_step": 216554, "epoch": 1789} {"train_loss": -41.3990592956543, "global_step": 216555, "epoch": 1789} {"train_loss": -42.078102111816406, "global_step": 216556, "epoch": 1789} {"train_loss": -41.59870529174805, "global_step": 216557, "epoch": 1789} {"train_loss": -42.14781188964844, "global_step": 216558, "epoch": 1789} {"train_loss": -41.979736328125, "global_step": 216559, "epoch": 1789} {"train_loss": -41.599365234375, "global_step": 216560, "epoch": 1789} {"train_loss": -42.3416862487793, "global_step": 216561, "epoch": 1789} {"train_loss": -42.010650634765625, "global_step": 216562, "epoch": 1789} {"train_loss": -42.33443069458008, "global_step": 216563, "epoch": 1789} {"train_loss": -42.288143157958984, "global_step": 216564, "epoch": 1789} {"train_loss": -41.14467239379883, "global_step": 216565, "epoch": 1789} {"train_loss": -42.1371955871582, "global_step": 216566, "epoch": 1789} {"train_loss": -42.39421463012695, "global_step": 216567, "epoch": 1789} {"train_loss": -42.332149505615234, "global_step": 216568, "epoch": 1789} {"train_loss": -42.677772521972656, "global_step": 216569, "epoch": 1789} {"train_loss": -42.091182708740234, "global_step": 216570, "epoch": 1789} {"train_loss": -42.548954010009766, "global_step": 216571, "epoch": 1789} {"train_loss": -42.552284240722656, "global_step": 216572, "epoch": 1789} {"train_loss": -41.5256462097168, "global_step": 216573, "epoch": 1789} {"train_loss": -41.650630950927734, "global_step": 216574, "epoch": 1789} {"train_loss": -42.117671966552734, "global_step": 216575, "epoch": 1789} {"train_loss": -42.16554641723633, "global_step": 216576, "epoch": 1789} {"train_loss": -41.36541748046875, "global_step": 216577, "epoch": 1789} {"train_loss": -42.350799560546875, "global_step": 216578, "epoch": 1789} {"train_loss": -42.11691665649414, "global_step": 216579, "epoch": 1789} {"train_loss": -41.80080032348633, "global_step": 216580, "epoch": 1789} {"train_loss": -41.45457077026367, "global_step": 216581, "epoch": 1789} {"train_loss": -41.96165084838867, "global_step": 216582, "epoch": 1789} {"train_loss": -41.26066970825195, "global_step": 216583, "epoch": 1789} {"train_loss": -41.188232421875, "global_step": 216584, "epoch": 1789} {"train_loss": -41.42744827270508, "global_step": 216585, "epoch": 1789} {"train_loss": -40.52788543701172, "global_step": 216586, "epoch": 1789} {"train_loss": -42.10559844970703, "global_step": 216587, "epoch": 1789} {"train_loss": -41.69725799560547, "global_step": 216588, "epoch": 1789} {"train_loss": -40.99608913137893, "global_step": 216589, "epoch": 1789, "val_loss": 2678930.25} {"train_loss": -41.828182220458984, "global_step": 216590, "epoch": 1790} {"train_loss": -41.18171310424805, "global_step": 216591, "epoch": 1790} {"train_loss": -40.74309158325195, "global_step": 216592, "epoch": 1790} {"train_loss": -39.94028091430664, "global_step": 216593, "epoch": 1790} {"train_loss": -41.30881118774414, "global_step": 216594, "epoch": 1790} {"train_loss": -41.0411262512207, "global_step": 216595, "epoch": 1790} {"train_loss": -39.746212005615234, "global_step": 216596, "epoch": 1790} {"train_loss": -37.51866912841797, "global_step": 216597, "epoch": 1790} {"train_loss": -37.258182525634766, "global_step": 216598, "epoch": 1790} {"train_loss": -39.544898986816406, "global_step": 216599, "epoch": 1790} {"train_loss": -40.85353469848633, "global_step": 216600, "epoch": 1790} {"train_loss": -36.915374755859375, "global_step": 216601, "epoch": 1790} {"train_loss": -39.78464889526367, "global_step": 216602, "epoch": 1790} {"train_loss": -39.451351165771484, "global_step": 216603, "epoch": 1790} {"train_loss": -38.64613342285156, "global_step": 216604, "epoch": 1790} {"train_loss": -40.503475189208984, "global_step": 216605, "epoch": 1790} {"train_loss": -41.49778366088867, "global_step": 216606, "epoch": 1790} {"train_loss": -39.86165237426758, "global_step": 216607, "epoch": 1790} {"train_loss": -40.099483489990234, "global_step": 216608, "epoch": 1790} {"train_loss": -39.859954833984375, "global_step": 216609, "epoch": 1790} {"train_loss": -40.71108627319336, "global_step": 216610, "epoch": 1790} {"train_loss": -40.67434310913086, "global_step": 216611, "epoch": 1790} {"train_loss": -41.70390701293945, "global_step": 216612, "epoch": 1790} {"train_loss": -40.349090576171875, "global_step": 216613, "epoch": 1790} {"train_loss": -40.34187698364258, "global_step": 216614, "epoch": 1790} {"train_loss": -40.92856979370117, "global_step": 216615, "epoch": 1790} {"train_loss": -39.73527908325195, "global_step": 216616, "epoch": 1790} {"train_loss": -39.6991081237793, "global_step": 216617, "epoch": 1790} {"train_loss": -39.92413330078125, "global_step": 216618, "epoch": 1790} {"train_loss": -40.21989059448242, "global_step": 216619, "epoch": 1790} {"train_loss": -40.63683319091797, "global_step": 216620, "epoch": 1790} {"train_loss": -40.27748489379883, "global_step": 216621, "epoch": 1790} {"train_loss": -40.106143951416016, "global_step": 216622, "epoch": 1790} {"train_loss": -40.204017639160156, "global_step": 216623, "epoch": 1790} {"train_loss": -40.795223236083984, "global_step": 216624, "epoch": 1790} {"train_loss": -40.79359817504883, "global_step": 216625, "epoch": 1790} {"train_loss": -37.86970901489258, "global_step": 216626, "epoch": 1790} {"train_loss": -39.93697738647461, "global_step": 216627, "epoch": 1790} {"train_loss": -41.370235443115234, "global_step": 216628, "epoch": 1790} {"train_loss": -37.25417709350586, "global_step": 216629, "epoch": 1790} {"train_loss": -37.28813934326172, "global_step": 216630, "epoch": 1790} {"train_loss": -41.15165328979492, "global_step": 216631, "epoch": 1790} {"train_loss": -38.4669075012207, "global_step": 216632, "epoch": 1790} {"train_loss": -36.5106201171875, "global_step": 216633, "epoch": 1790} {"train_loss": -40.51844024658203, "global_step": 216634, "epoch": 1790} {"train_loss": -37.12318801879883, "global_step": 216635, "epoch": 1790} {"train_loss": -40.284461975097656, "global_step": 216636, "epoch": 1790} {"train_loss": -38.52378463745117, "global_step": 216637, "epoch": 1790} {"train_loss": -39.95806121826172, "global_step": 216638, "epoch": 1790} {"train_loss": -39.73833465576172, "global_step": 216639, "epoch": 1790} {"train_loss": -39.800594329833984, "global_step": 216640, "epoch": 1790} {"train_loss": -40.39013671875, "global_step": 216641, "epoch": 1790} {"train_loss": -40.67606735229492, "global_step": 216642, "epoch": 1790} {"train_loss": -40.916412353515625, "global_step": 216643, "epoch": 1790} {"train_loss": -41.282997131347656, "global_step": 216644, "epoch": 1790} {"train_loss": -40.969905853271484, "global_step": 216645, "epoch": 1790} {"train_loss": -40.813011169433594, "global_step": 216646, "epoch": 1790} {"train_loss": -41.173458099365234, "global_step": 216647, "epoch": 1790} {"train_loss": -40.80086898803711, "global_step": 216648, "epoch": 1790} {"train_loss": -41.382789611816406, "global_step": 216649, "epoch": 1790} {"train_loss": -40.846858978271484, "global_step": 216650, "epoch": 1790} {"train_loss": -41.44065475463867, "global_step": 216651, "epoch": 1790} {"train_loss": -41.89106369018555, "global_step": 216652, "epoch": 1790} {"train_loss": -41.68769454956055, "global_step": 216653, "epoch": 1790} {"train_loss": -41.94654083251953, "global_step": 216654, "epoch": 1790} {"train_loss": -41.75926208496094, "global_step": 216655, "epoch": 1790} {"train_loss": -41.84659957885742, "global_step": 216656, "epoch": 1790} {"train_loss": -41.76359176635742, "global_step": 216657, "epoch": 1790} {"train_loss": -41.9998664855957, "global_step": 216658, "epoch": 1790} {"train_loss": -42.30610275268555, "global_step": 216659, "epoch": 1790} {"train_loss": -42.27651596069336, "global_step": 216660, "epoch": 1790} {"train_loss": -42.207679748535156, "global_step": 216661, "epoch": 1790} {"train_loss": -41.84125900268555, "global_step": 216662, "epoch": 1790} {"train_loss": -42.42366409301758, "global_step": 216663, "epoch": 1790} {"train_loss": -41.93978500366211, "global_step": 216664, "epoch": 1790} {"train_loss": -42.211387634277344, "global_step": 216665, "epoch": 1790} {"train_loss": -42.431678771972656, "global_step": 216666, "epoch": 1790} {"train_loss": -42.18874740600586, "global_step": 216667, "epoch": 1790} {"train_loss": -41.55325698852539, "global_step": 216668, "epoch": 1790} {"train_loss": -42.233272552490234, "global_step": 216669, "epoch": 1790} {"train_loss": -42.22184371948242, "global_step": 216670, "epoch": 1790} {"train_loss": -41.5120735168457, "global_step": 216671, "epoch": 1790} {"train_loss": -42.09737777709961, "global_step": 216672, "epoch": 1790} {"train_loss": -42.20451736450195, "global_step": 216673, "epoch": 1790} {"train_loss": -42.21187210083008, "global_step": 216674, "epoch": 1790} {"train_loss": -42.38246536254883, "global_step": 216675, "epoch": 1790} {"train_loss": -41.04179382324219, "global_step": 216676, "epoch": 1790} {"train_loss": -40.495174407958984, "global_step": 216677, "epoch": 1790} {"train_loss": -41.80748748779297, "global_step": 216678, "epoch": 1790} {"train_loss": -42.54702377319336, "global_step": 216679, "epoch": 1790} {"train_loss": -42.020050048828125, "global_step": 216680, "epoch": 1790} {"train_loss": -42.140419006347656, "global_step": 216681, "epoch": 1790} {"train_loss": -42.17934799194336, "global_step": 216682, "epoch": 1790} {"train_loss": -42.260982513427734, "global_step": 216683, "epoch": 1790} {"train_loss": -42.49006271362305, "global_step": 216684, "epoch": 1790} {"train_loss": -42.3006591796875, "global_step": 216685, "epoch": 1790} {"train_loss": -42.39241409301758, "global_step": 216686, "epoch": 1790} {"train_loss": -42.617855072021484, "global_step": 216687, "epoch": 1790} {"train_loss": -41.64992904663086, "global_step": 216688, "epoch": 1790} {"train_loss": -40.95685958862305, "global_step": 216689, "epoch": 1790} {"train_loss": -42.20381546020508, "global_step": 216690, "epoch": 1790} {"train_loss": -41.210872650146484, "global_step": 216691, "epoch": 1790} {"train_loss": -42.17905807495117, "global_step": 216692, "epoch": 1790} {"train_loss": -42.43172836303711, "global_step": 216693, "epoch": 1790} {"train_loss": -42.196990966796875, "global_step": 216694, "epoch": 1790} {"train_loss": -42.34059143066406, "global_step": 216695, "epoch": 1790} {"train_loss": -42.808563232421875, "global_step": 216696, "epoch": 1790} {"train_loss": -42.38082504272461, "global_step": 216697, "epoch": 1790} {"train_loss": -42.49113082885742, "global_step": 216698, "epoch": 1790} {"train_loss": -41.29183578491211, "global_step": 216699, "epoch": 1790} {"train_loss": -42.11201858520508, "global_step": 216700, "epoch": 1790} {"train_loss": -41.931697845458984, "global_step": 216701, "epoch": 1790} {"train_loss": -42.017791748046875, "global_step": 216702, "epoch": 1790} {"train_loss": -42.563194274902344, "global_step": 216703, "epoch": 1790} {"train_loss": -42.7504997253418, "global_step": 216704, "epoch": 1790} {"train_loss": -42.03144073486328, "global_step": 216705, "epoch": 1790} {"train_loss": -42.2805061340332, "global_step": 216706, "epoch": 1790} {"train_loss": -42.403297424316406, "global_step": 216707, "epoch": 1790} {"train_loss": -42.778167724609375, "global_step": 216708, "epoch": 1790} {"train_loss": -42.11185836791992, "global_step": 216709, "epoch": 1790} {"train_loss": -41.02595242587003, "global_step": 216710, "epoch": 1790, "val_loss": 2677107.0} {"train_loss": -40.507320404052734, "global_step": 216711, "epoch": 1791} {"train_loss": -41.34642028808594, "global_step": 216712, "epoch": 1791} {"train_loss": -41.14686584472656, "global_step": 216713, "epoch": 1791} {"train_loss": -42.57262420654297, "global_step": 216714, "epoch": 1791} {"train_loss": -41.88062286376953, "global_step": 216715, "epoch": 1791} {"train_loss": -41.97823715209961, "global_step": 216716, "epoch": 1791} {"train_loss": -41.37832260131836, "global_step": 216717, "epoch": 1791} {"train_loss": -41.72938919067383, "global_step": 216718, "epoch": 1791} {"train_loss": -41.083560943603516, "global_step": 216719, "epoch": 1791} {"train_loss": -40.95426559448242, "global_step": 216720, "epoch": 1791} {"train_loss": -40.48788070678711, "global_step": 216721, "epoch": 1791} {"train_loss": -41.07674026489258, "global_step": 216722, "epoch": 1791} {"train_loss": -41.334571838378906, "global_step": 216723, "epoch": 1791} {"train_loss": -40.14558029174805, "global_step": 216724, "epoch": 1791} {"train_loss": -41.17769241333008, "global_step": 216725, "epoch": 1791} {"train_loss": -41.16572189331055, "global_step": 216726, "epoch": 1791} {"train_loss": -40.84938430786133, "global_step": 216727, "epoch": 1791} {"train_loss": -41.019195556640625, "global_step": 216728, "epoch": 1791} {"train_loss": -41.973140716552734, "global_step": 216729, "epoch": 1791} {"train_loss": -40.10909652709961, "global_step": 216730, "epoch": 1791} {"train_loss": -40.5608024597168, "global_step": 216731, "epoch": 1791} {"train_loss": -41.521480560302734, "global_step": 216732, "epoch": 1791} {"train_loss": -40.588600158691406, "global_step": 216733, "epoch": 1791} {"train_loss": -41.522239685058594, "global_step": 216734, "epoch": 1791} {"train_loss": -41.53418731689453, "global_step": 216735, "epoch": 1791} {"train_loss": -40.79288101196289, "global_step": 216736, "epoch": 1791} {"train_loss": -41.940887451171875, "global_step": 216737, "epoch": 1791} {"train_loss": -40.275386810302734, "global_step": 216738, "epoch": 1791} {"train_loss": -41.40745162963867, "global_step": 216739, "epoch": 1791} {"train_loss": -42.055641174316406, "global_step": 216740, "epoch": 1791} {"train_loss": -40.88277816772461, "global_step": 216741, "epoch": 1791} {"train_loss": -41.154441833496094, "global_step": 216742, "epoch": 1791} {"train_loss": -41.00413513183594, "global_step": 216743, "epoch": 1791} {"train_loss": -40.90961837768555, "global_step": 216744, "epoch": 1791} {"train_loss": -40.295989990234375, "global_step": 216745, "epoch": 1791} {"train_loss": -40.45913314819336, "global_step": 216746, "epoch": 1791} {"train_loss": -41.225372314453125, "global_step": 216747, "epoch": 1791} {"train_loss": -41.02444839477539, "global_step": 216748, "epoch": 1791} {"train_loss": -40.17084503173828, "global_step": 216749, "epoch": 1791} {"train_loss": -41.1032829284668, "global_step": 216750, "epoch": 1791} {"train_loss": -41.83970260620117, "global_step": 216751, "epoch": 1791} {"train_loss": -41.450965881347656, "global_step": 216752, "epoch": 1791} {"train_loss": -42.196998596191406, "global_step": 216753, "epoch": 1791} {"train_loss": -41.79872512817383, "global_step": 216754, "epoch": 1791} {"train_loss": -41.970428466796875, "global_step": 216755, "epoch": 1791} {"train_loss": -41.618743896484375, "global_step": 216756, "epoch": 1791} {"train_loss": -42.373046875, "global_step": 216757, "epoch": 1791} {"train_loss": -41.232513427734375, "global_step": 216758, "epoch": 1791} {"train_loss": -41.447784423828125, "global_step": 216759, "epoch": 1791} {"train_loss": -42.033653259277344, "global_step": 216760, "epoch": 1791} {"train_loss": -41.87263488769531, "global_step": 216761, "epoch": 1791} {"train_loss": -41.382808685302734, "global_step": 216762, "epoch": 1791} {"train_loss": -42.02788162231445, "global_step": 216763, "epoch": 1791} {"train_loss": -41.531307220458984, "global_step": 216764, "epoch": 1791} {"train_loss": -40.75749969482422, "global_step": 216765, "epoch": 1791} {"train_loss": -42.25971221923828, "global_step": 216766, "epoch": 1791} {"train_loss": -42.61820983886719, "global_step": 216767, "epoch": 1791} {"train_loss": -42.21653747558594, "global_step": 216768, "epoch": 1791} {"train_loss": -42.23169708251953, "global_step": 216769, "epoch": 1791} {"train_loss": -41.543941497802734, "global_step": 216770, "epoch": 1791} {"train_loss": -41.69184494018555, "global_step": 216771, "epoch": 1791} {"train_loss": -41.98944854736328, "global_step": 216772, "epoch": 1791} {"train_loss": -41.242156982421875, "global_step": 216773, "epoch": 1791} {"train_loss": -41.75933837890625, "global_step": 216774, "epoch": 1791} {"train_loss": -41.71309280395508, "global_step": 216775, "epoch": 1791} {"train_loss": -39.59060287475586, "global_step": 216776, "epoch": 1791} {"train_loss": -39.14622116088867, "global_step": 216777, "epoch": 1791} {"train_loss": -41.01171112060547, "global_step": 216778, "epoch": 1791} {"train_loss": -38.0924186706543, "global_step": 216779, "epoch": 1791} {"train_loss": -36.59918212890625, "global_step": 216780, "epoch": 1791} {"train_loss": -38.8341178894043, "global_step": 216781, "epoch": 1791} {"train_loss": -40.61133575439453, "global_step": 216782, "epoch": 1791} {"train_loss": -41.0913200378418, "global_step": 216783, "epoch": 1791} {"train_loss": -38.06131362915039, "global_step": 216784, "epoch": 1791} {"train_loss": -39.65208053588867, "global_step": 216785, "epoch": 1791} {"train_loss": -40.592681884765625, "global_step": 216786, "epoch": 1791} {"train_loss": -39.33327865600586, "global_step": 216787, "epoch": 1791} {"train_loss": -41.43976593017578, "global_step": 216788, "epoch": 1791} {"train_loss": -40.25397491455078, "global_step": 216789, "epoch": 1791} {"train_loss": -40.521209716796875, "global_step": 216790, "epoch": 1791} {"train_loss": -41.61720657348633, "global_step": 216791, "epoch": 1791} {"train_loss": -40.17972946166992, "global_step": 216792, "epoch": 1791} {"train_loss": -41.392181396484375, "global_step": 216793, "epoch": 1791} {"train_loss": -41.03724670410156, "global_step": 216794, "epoch": 1791} {"train_loss": -41.49456787109375, "global_step": 216795, "epoch": 1791} {"train_loss": -41.73017120361328, "global_step": 216796, "epoch": 1791} {"train_loss": -41.1876335144043, "global_step": 216797, "epoch": 1791} {"train_loss": -41.60648727416992, "global_step": 216798, "epoch": 1791} {"train_loss": -41.8597526550293, "global_step": 216799, "epoch": 1791} {"train_loss": -41.75587844848633, "global_step": 216800, "epoch": 1791} {"train_loss": -41.31158447265625, "global_step": 216801, "epoch": 1791} {"train_loss": -40.786373138427734, "global_step": 216802, "epoch": 1791} {"train_loss": -41.889686584472656, "global_step": 216803, "epoch": 1791} {"train_loss": -41.17109680175781, "global_step": 216804, "epoch": 1791} {"train_loss": -42.37458038330078, "global_step": 216805, "epoch": 1791} {"train_loss": -41.995262145996094, "global_step": 216806, "epoch": 1791} {"train_loss": -41.605323791503906, "global_step": 216807, "epoch": 1791} {"train_loss": -41.93441390991211, "global_step": 216808, "epoch": 1791} {"train_loss": -41.75373458862305, "global_step": 216809, "epoch": 1791} {"train_loss": -41.92041015625, "global_step": 216810, "epoch": 1791} {"train_loss": -41.769012451171875, "global_step": 216811, "epoch": 1791} {"train_loss": -41.60919952392578, "global_step": 216812, "epoch": 1791} {"train_loss": -41.87977600097656, "global_step": 216813, "epoch": 1791} {"train_loss": -42.33195877075195, "global_step": 216814, "epoch": 1791} {"train_loss": -41.31167984008789, "global_step": 216815, "epoch": 1791} {"train_loss": -41.90067672729492, "global_step": 216816, "epoch": 1791} {"train_loss": -40.833152770996094, "global_step": 216817, "epoch": 1791} {"train_loss": -41.80710983276367, "global_step": 216818, "epoch": 1791} {"train_loss": -42.409732818603516, "global_step": 216819, "epoch": 1791} {"train_loss": -42.32198715209961, "global_step": 216820, "epoch": 1791} {"train_loss": -42.30206298828125, "global_step": 216821, "epoch": 1791} {"train_loss": -42.54248809814453, "global_step": 216822, "epoch": 1791} {"train_loss": -42.19659423828125, "global_step": 216823, "epoch": 1791} {"train_loss": -41.74270248413086, "global_step": 216824, "epoch": 1791} {"train_loss": -42.0942497253418, "global_step": 216825, "epoch": 1791} {"train_loss": -42.253143310546875, "global_step": 216826, "epoch": 1791} {"train_loss": -42.51484680175781, "global_step": 216827, "epoch": 1791} {"train_loss": -41.230472564697266, "global_step": 216828, "epoch": 1791} {"train_loss": -42.19963455200195, "global_step": 216829, "epoch": 1791} {"train_loss": -41.982364654541016, "global_step": 216830, "epoch": 1791} {"train_loss": -41.2831181928146, "global_step": 216831, "epoch": 1791, "val_loss": 2593312.25} {"train_loss": -41.321800231933594, "global_step": 216832, "epoch": 1792} {"train_loss": -42.23142623901367, "global_step": 216833, "epoch": 1792} {"train_loss": -41.269020080566406, "global_step": 216834, "epoch": 1792} {"train_loss": -42.518638610839844, "global_step": 216835, "epoch": 1792} {"train_loss": -41.41111373901367, "global_step": 216836, "epoch": 1792} {"train_loss": -41.92228317260742, "global_step": 216837, "epoch": 1792} {"train_loss": -41.96942901611328, "global_step": 216838, "epoch": 1792} {"train_loss": -41.781280517578125, "global_step": 216839, "epoch": 1792} {"train_loss": -41.97809982299805, "global_step": 216840, "epoch": 1792} {"train_loss": -41.674495697021484, "global_step": 216841, "epoch": 1792} {"train_loss": -41.53642654418945, "global_step": 216842, "epoch": 1792} {"train_loss": -42.18329620361328, "global_step": 216843, "epoch": 1792} {"train_loss": -41.69990158081055, "global_step": 216844, "epoch": 1792} {"train_loss": -41.272315979003906, "global_step": 216845, "epoch": 1792} {"train_loss": -42.79850387573242, "global_step": 216846, "epoch": 1792} {"train_loss": -42.24883270263672, "global_step": 216847, "epoch": 1792} {"train_loss": -42.23551940917969, "global_step": 216848, "epoch": 1792} {"train_loss": -42.385894775390625, "global_step": 216849, "epoch": 1792} {"train_loss": -42.51401901245117, "global_step": 216850, "epoch": 1792} {"train_loss": -42.858821868896484, "global_step": 216851, "epoch": 1792} {"train_loss": -42.73355484008789, "global_step": 216852, "epoch": 1792} {"train_loss": -42.26118850708008, "global_step": 216853, "epoch": 1792} {"train_loss": -42.61606979370117, "global_step": 216854, "epoch": 1792} {"train_loss": -42.56410598754883, "global_step": 216855, "epoch": 1792} {"train_loss": -42.90817642211914, "global_step": 216856, "epoch": 1792} {"train_loss": -42.813148498535156, "global_step": 216857, "epoch": 1792} {"train_loss": -42.55390548706055, "global_step": 216858, "epoch": 1792} {"train_loss": -42.39588165283203, "global_step": 216859, "epoch": 1792} {"train_loss": -42.87054443359375, "global_step": 216860, "epoch": 1792} {"train_loss": -43.0528678894043, "global_step": 216861, "epoch": 1792} {"train_loss": -42.592037200927734, "global_step": 216862, "epoch": 1792} {"train_loss": -42.84346389770508, "global_step": 216863, "epoch": 1792} {"train_loss": -42.62194061279297, "global_step": 216864, "epoch": 1792} {"train_loss": -42.703590393066406, "global_step": 216865, "epoch": 1792} {"train_loss": -41.58700180053711, "global_step": 216866, "epoch": 1792} {"train_loss": -41.007110595703125, "global_step": 216867, "epoch": 1792} {"train_loss": -38.17936325073242, "global_step": 216868, "epoch": 1792} {"train_loss": -31.92721939086914, "global_step": 216869, "epoch": 1792} {"train_loss": -28.124868392944336, "global_step": 216870, "epoch": 1792} {"train_loss": -24.745498657226562, "global_step": 216871, "epoch": 1792} {"train_loss": -35.20923614501953, "global_step": 216872, "epoch": 1792} {"train_loss": -41.845306396484375, "global_step": 216873, "epoch": 1792} {"train_loss": -33.195953369140625, "global_step": 216874, "epoch": 1792} {"train_loss": -37.96734619140625, "global_step": 216875, "epoch": 1792} {"train_loss": -41.270503997802734, "global_step": 216876, "epoch": 1792} {"train_loss": -39.6505241394043, "global_step": 216877, "epoch": 1792} {"train_loss": -39.560394287109375, "global_step": 216878, "epoch": 1792} {"train_loss": -39.268856048583984, "global_step": 216879, "epoch": 1792} {"train_loss": -41.05275344848633, "global_step": 216880, "epoch": 1792} {"train_loss": -40.493682861328125, "global_step": 216881, "epoch": 1792} {"train_loss": -41.83683395385742, "global_step": 216882, "epoch": 1792} {"train_loss": -40.7377815246582, "global_step": 216883, "epoch": 1792} {"train_loss": -41.502742767333984, "global_step": 216884, "epoch": 1792} {"train_loss": -41.486759185791016, "global_step": 216885, "epoch": 1792} {"train_loss": -41.948204040527344, "global_step": 216886, "epoch": 1792} {"train_loss": -41.05482482910156, "global_step": 216887, "epoch": 1792} {"train_loss": -41.93227767944336, "global_step": 216888, "epoch": 1792} {"train_loss": -41.517486572265625, "global_step": 216889, "epoch": 1792} {"train_loss": -41.974178314208984, "global_step": 216890, "epoch": 1792} {"train_loss": -41.15521240234375, "global_step": 216891, "epoch": 1792} {"train_loss": -41.65833282470703, "global_step": 216892, "epoch": 1792} {"train_loss": -41.78559112548828, "global_step": 216893, "epoch": 1792} {"train_loss": -41.68997573852539, "global_step": 216894, "epoch": 1792} {"train_loss": -41.442317962646484, "global_step": 216895, "epoch": 1792} {"train_loss": -41.791629791259766, "global_step": 216896, "epoch": 1792} {"train_loss": -41.63725662231445, "global_step": 216897, "epoch": 1792} {"train_loss": -41.91189193725586, "global_step": 216898, "epoch": 1792} {"train_loss": -41.28497314453125, "global_step": 216899, "epoch": 1792} {"train_loss": -42.33982849121094, "global_step": 216900, "epoch": 1792} {"train_loss": -41.92135238647461, "global_step": 216901, "epoch": 1792} {"train_loss": -42.18841552734375, "global_step": 216902, "epoch": 1792} {"train_loss": -42.01455307006836, "global_step": 216903, "epoch": 1792} {"train_loss": -40.8089485168457, "global_step": 216904, "epoch": 1792} {"train_loss": -42.114994049072266, "global_step": 216905, "epoch": 1792} {"train_loss": -41.42294692993164, "global_step": 216906, "epoch": 1792} {"train_loss": -42.3486328125, "global_step": 216907, "epoch": 1792} {"train_loss": -42.287818908691406, "global_step": 216908, "epoch": 1792} {"train_loss": -42.275672912597656, "global_step": 216909, "epoch": 1792} {"train_loss": -42.28668212890625, "global_step": 216910, "epoch": 1792} {"train_loss": -42.32261276245117, "global_step": 216911, "epoch": 1792} {"train_loss": -42.37351989746094, "global_step": 216912, "epoch": 1792} {"train_loss": -42.355403900146484, "global_step": 216913, "epoch": 1792} {"train_loss": -42.6909294128418, "global_step": 216914, "epoch": 1792} {"train_loss": -42.1786994934082, "global_step": 216915, "epoch": 1792} {"train_loss": -42.309791564941406, "global_step": 216916, "epoch": 1792} {"train_loss": -42.062740325927734, "global_step": 216917, "epoch": 1792} {"train_loss": -42.15220260620117, "global_step": 216918, "epoch": 1792} {"train_loss": -42.39815139770508, "global_step": 216919, "epoch": 1792} {"train_loss": -42.120277404785156, "global_step": 216920, "epoch": 1792} {"train_loss": -42.62746810913086, "global_step": 216921, "epoch": 1792} {"train_loss": -42.34394454956055, "global_step": 216922, "epoch": 1792} {"train_loss": -42.452850341796875, "global_step": 216923, "epoch": 1792} {"train_loss": -42.54629135131836, "global_step": 216924, "epoch": 1792} {"train_loss": -42.795440673828125, "global_step": 216925, "epoch": 1792} {"train_loss": -43.00692367553711, "global_step": 216926, "epoch": 1792} {"train_loss": -42.550445556640625, "global_step": 216927, "epoch": 1792} {"train_loss": -42.646846771240234, "global_step": 216928, "epoch": 1792} {"train_loss": -42.79834747314453, "global_step": 216929, "epoch": 1792} {"train_loss": -42.513710021972656, "global_step": 216930, "epoch": 1792} {"train_loss": -42.76369857788086, "global_step": 216931, "epoch": 1792} {"train_loss": -43.050804138183594, "global_step": 216932, "epoch": 1792} {"train_loss": -42.922821044921875, "global_step": 216933, "epoch": 1792} {"train_loss": -42.23057556152344, "global_step": 216934, "epoch": 1792} {"train_loss": -42.7595329284668, "global_step": 216935, "epoch": 1792} {"train_loss": -42.7736930847168, "global_step": 216936, "epoch": 1792} {"train_loss": -42.7351188659668, "global_step": 216937, "epoch": 1792} {"train_loss": -42.63842010498047, "global_step": 216938, "epoch": 1792} {"train_loss": -42.43943786621094, "global_step": 216939, "epoch": 1792} {"train_loss": -42.57589340209961, "global_step": 216940, "epoch": 1792} {"train_loss": -43.34814453125, "global_step": 216941, "epoch": 1792} {"train_loss": -43.130611419677734, "global_step": 216942, "epoch": 1792} {"train_loss": -42.46041488647461, "global_step": 216943, "epoch": 1792} {"train_loss": -42.27719497680664, "global_step": 216944, "epoch": 1792} {"train_loss": -42.73781967163086, "global_step": 216945, "epoch": 1792} {"train_loss": -42.50785446166992, "global_step": 216946, "epoch": 1792} {"train_loss": -43.36519241333008, "global_step": 216947, "epoch": 1792} {"train_loss": -43.362281799316406, "global_step": 216948, "epoch": 1792} {"train_loss": -42.430633544921875, "global_step": 216949, "epoch": 1792} {"train_loss": -42.87881088256836, "global_step": 216950, "epoch": 1792} {"train_loss": -42.64040756225586, "global_step": 216951, "epoch": 1792} {"train_loss": -41.594750286133824, "global_step": 216952, "epoch": 1792, "val_loss": 2627015.25} {"train_loss": -42.51560592651367, "global_step": 216953, "epoch": 1793} {"train_loss": -42.474365234375, "global_step": 216954, "epoch": 1793} {"train_loss": -41.87030792236328, "global_step": 216955, "epoch": 1793} {"train_loss": -42.070472717285156, "global_step": 216956, "epoch": 1793} {"train_loss": -40.48630905151367, "global_step": 216957, "epoch": 1793} {"train_loss": -37.23150634765625, "global_step": 216958, "epoch": 1793} {"train_loss": -36.393470764160156, "global_step": 216959, "epoch": 1793} {"train_loss": -39.38604736328125, "global_step": 216960, "epoch": 1793} {"train_loss": -40.187801361083984, "global_step": 216961, "epoch": 1793} {"train_loss": -39.362667083740234, "global_step": 216962, "epoch": 1793} {"train_loss": -40.29067611694336, "global_step": 216963, "epoch": 1793} {"train_loss": -41.10853958129883, "global_step": 216964, "epoch": 1793} {"train_loss": -40.691585540771484, "global_step": 216965, "epoch": 1793} {"train_loss": -41.57587814331055, "global_step": 216966, "epoch": 1793} {"train_loss": -41.880977630615234, "global_step": 216967, "epoch": 1793} {"train_loss": -41.81806182861328, "global_step": 216968, "epoch": 1793} {"train_loss": -39.80654525756836, "global_step": 216969, "epoch": 1793} {"train_loss": -40.0748405456543, "global_step": 216970, "epoch": 1793} {"train_loss": -41.6613655090332, "global_step": 216971, "epoch": 1793} {"train_loss": -40.768245697021484, "global_step": 216972, "epoch": 1793} {"train_loss": -42.158992767333984, "global_step": 216973, "epoch": 1793} {"train_loss": -41.35485076904297, "global_step": 216974, "epoch": 1793} {"train_loss": -41.6447639465332, "global_step": 216975, "epoch": 1793} {"train_loss": -41.20041275024414, "global_step": 216976, "epoch": 1793} {"train_loss": -41.46118927001953, "global_step": 216977, "epoch": 1793} {"train_loss": -42.40452194213867, "global_step": 216978, "epoch": 1793} {"train_loss": -41.50669479370117, "global_step": 216979, "epoch": 1793} {"train_loss": -40.00161361694336, "global_step": 216980, "epoch": 1793} {"train_loss": -41.177425384521484, "global_step": 216981, "epoch": 1793} {"train_loss": -41.005523681640625, "global_step": 216982, "epoch": 1793} {"train_loss": -40.645381927490234, "global_step": 216983, "epoch": 1793} {"train_loss": -40.62389373779297, "global_step": 216984, "epoch": 1793} {"train_loss": -40.76115036010742, "global_step": 216985, "epoch": 1793} {"train_loss": -40.78558349609375, "global_step": 216986, "epoch": 1793} {"train_loss": -40.610572814941406, "global_step": 216987, "epoch": 1793} {"train_loss": -39.92104721069336, "global_step": 216988, "epoch": 1793} {"train_loss": -41.442344665527344, "global_step": 216989, "epoch": 1793} {"train_loss": -41.10155487060547, "global_step": 216990, "epoch": 1793} {"train_loss": -40.68442916870117, "global_step": 216991, "epoch": 1793} {"train_loss": -42.16647720336914, "global_step": 216992, "epoch": 1793} {"train_loss": -40.3872184753418, "global_step": 216993, "epoch": 1793} {"train_loss": -41.184688568115234, "global_step": 216994, "epoch": 1793} {"train_loss": -41.207942962646484, "global_step": 216995, "epoch": 1793} {"train_loss": -41.2246208190918, "global_step": 216996, "epoch": 1793} {"train_loss": -40.67717742919922, "global_step": 216997, "epoch": 1793} {"train_loss": -41.78702926635742, "global_step": 216998, "epoch": 1793} {"train_loss": -40.33784103393555, "global_step": 216999, "epoch": 1793} {"train_loss": -38.9600715637207, "global_step": 217000, "epoch": 1793} {"train_loss": -41.90381622314453, "global_step": 217001, "epoch": 1793} {"train_loss": -38.635047912597656, "global_step": 217002, "epoch": 1793} {"train_loss": -38.64247131347656, "global_step": 217003, "epoch": 1793} {"train_loss": -40.88052749633789, "global_step": 217004, "epoch": 1793} {"train_loss": -39.566287994384766, "global_step": 217005, "epoch": 1793} {"train_loss": -40.254554748535156, "global_step": 217006, "epoch": 1793} {"train_loss": -39.98114013671875, "global_step": 217007, "epoch": 1793} {"train_loss": -39.95417022705078, "global_step": 217008, "epoch": 1793} {"train_loss": -40.31159591674805, "global_step": 217009, "epoch": 1793} {"train_loss": -40.49793243408203, "global_step": 217010, "epoch": 1793} {"train_loss": -40.940338134765625, "global_step": 217011, "epoch": 1793} {"train_loss": -40.15715408325195, "global_step": 217012, "epoch": 1793} {"train_loss": -41.379337310791016, "global_step": 217013, "epoch": 1793} {"train_loss": -40.827613830566406, "global_step": 217014, "epoch": 1793} {"train_loss": -40.302467346191406, "global_step": 217015, "epoch": 1793} {"train_loss": -41.44459533691406, "global_step": 217016, "epoch": 1793} {"train_loss": -41.16053009033203, "global_step": 217017, "epoch": 1793} {"train_loss": -40.36608123779297, "global_step": 217018, "epoch": 1793} {"train_loss": -40.44252014160156, "global_step": 217019, "epoch": 1793} {"train_loss": -40.487911224365234, "global_step": 217020, "epoch": 1793} {"train_loss": -40.83156967163086, "global_step": 217021, "epoch": 1793} {"train_loss": -41.854068756103516, "global_step": 217022, "epoch": 1793} {"train_loss": -41.1196403503418, "global_step": 217023, "epoch": 1793} {"train_loss": -41.42085647583008, "global_step": 217024, "epoch": 1793} {"train_loss": -41.96467971801758, "global_step": 217025, "epoch": 1793} {"train_loss": -41.69529342651367, "global_step": 217026, "epoch": 1793} {"train_loss": -41.47983932495117, "global_step": 217027, "epoch": 1793} {"train_loss": -41.678524017333984, "global_step": 217028, "epoch": 1793} {"train_loss": -41.903987884521484, "global_step": 217029, "epoch": 1793} {"train_loss": -41.70599365234375, "global_step": 217030, "epoch": 1793} {"train_loss": -41.843624114990234, "global_step": 217031, "epoch": 1793} {"train_loss": -41.974342346191406, "global_step": 217032, "epoch": 1793} {"train_loss": -41.863704681396484, "global_step": 217033, "epoch": 1793} {"train_loss": -42.69499969482422, "global_step": 217034, "epoch": 1793} {"train_loss": -42.272281646728516, "global_step": 217035, "epoch": 1793} {"train_loss": -42.13644027709961, "global_step": 217036, "epoch": 1793} {"train_loss": -42.34526443481445, "global_step": 217037, "epoch": 1793} {"train_loss": -41.97637939453125, "global_step": 217038, "epoch": 1793} {"train_loss": -42.55919647216797, "global_step": 217039, "epoch": 1793} {"train_loss": -42.59418869018555, "global_step": 217040, "epoch": 1793} {"train_loss": -42.294578552246094, "global_step": 217041, "epoch": 1793} {"train_loss": -42.91852951049805, "global_step": 217042, "epoch": 1793} {"train_loss": -42.28623962402344, "global_step": 217043, "epoch": 1793} {"train_loss": -42.543121337890625, "global_step": 217044, "epoch": 1793} {"train_loss": -42.4356689453125, "global_step": 217045, "epoch": 1793} {"train_loss": -42.68635177612305, "global_step": 217046, "epoch": 1793} {"train_loss": -42.24102783203125, "global_step": 217047, "epoch": 1793} {"train_loss": -42.22785186767578, "global_step": 217048, "epoch": 1793} {"train_loss": -42.91538619995117, "global_step": 217049, "epoch": 1793} {"train_loss": -42.6971435546875, "global_step": 217050, "epoch": 1793} {"train_loss": -42.371070861816406, "global_step": 217051, "epoch": 1793} {"train_loss": -42.49483108520508, "global_step": 217052, "epoch": 1793} {"train_loss": -43.04056930541992, "global_step": 217053, "epoch": 1793} {"train_loss": -42.37441635131836, "global_step": 217054, "epoch": 1793} {"train_loss": -42.01020050048828, "global_step": 217055, "epoch": 1793} {"train_loss": -43.0796012878418, "global_step": 217056, "epoch": 1793} {"train_loss": -42.92755126953125, "global_step": 217057, "epoch": 1793} {"train_loss": -42.89950180053711, "global_step": 217058, "epoch": 1793} {"train_loss": -43.13950729370117, "global_step": 217059, "epoch": 1793} {"train_loss": -43.17442321777344, "global_step": 217060, "epoch": 1793} {"train_loss": -43.270263671875, "global_step": 217061, "epoch": 1793} {"train_loss": -42.968536376953125, "global_step": 217062, "epoch": 1793} {"train_loss": -43.18333053588867, "global_step": 217063, "epoch": 1793} {"train_loss": -43.1494255065918, "global_step": 217064, "epoch": 1793} {"train_loss": -43.11328887939453, "global_step": 217065, "epoch": 1793} {"train_loss": -42.11732482910156, "global_step": 217066, "epoch": 1793} {"train_loss": -43.28181076049805, "global_step": 217067, "epoch": 1793} {"train_loss": -43.47418212890625, "global_step": 217068, "epoch": 1793} {"train_loss": -43.317787170410156, "global_step": 217069, "epoch": 1793} {"train_loss": -43.372432708740234, "global_step": 217070, "epoch": 1793} {"train_loss": -43.282772064208984, "global_step": 217071, "epoch": 1793} {"train_loss": -42.82685852050781, "global_step": 217072, "epoch": 1793} {"train_loss": -41.48588256205409, "global_step": 217073, "epoch": 1793, "val_loss": 2742603.75} {"train_loss": -43.0543098449707, "global_step": 217074, "epoch": 1794} {"train_loss": -42.139278411865234, "global_step": 217075, "epoch": 1794} {"train_loss": -41.00928497314453, "global_step": 217076, "epoch": 1794} {"train_loss": -41.33524703979492, "global_step": 217077, "epoch": 1794} {"train_loss": -42.782073974609375, "global_step": 217078, "epoch": 1794} {"train_loss": -43.51066970825195, "global_step": 217079, "epoch": 1794} {"train_loss": -40.3758430480957, "global_step": 217080, "epoch": 1794} {"train_loss": -35.76839828491211, "global_step": 217081, "epoch": 1794} {"train_loss": -33.11415481567383, "global_step": 217082, "epoch": 1794} {"train_loss": -37.351322174072266, "global_step": 217083, "epoch": 1794} {"train_loss": -39.95638656616211, "global_step": 217084, "epoch": 1794} {"train_loss": -34.855098724365234, "global_step": 217085, "epoch": 1794} {"train_loss": -24.75066566467285, "global_step": 217086, "epoch": 1794} {"train_loss": -23.62314224243164, "global_step": 217087, "epoch": 1794} {"train_loss": -34.82019805908203, "global_step": 217088, "epoch": 1794} {"train_loss": -30.94257926940918, "global_step": 217089, "epoch": 1794} {"train_loss": -33.2050666809082, "global_step": 217090, "epoch": 1794} {"train_loss": -37.14888381958008, "global_step": 217091, "epoch": 1794} {"train_loss": -36.01212692260742, "global_step": 217092, "epoch": 1794} {"train_loss": -37.492576599121094, "global_step": 217093, "epoch": 1794} {"train_loss": -34.40458297729492, "global_step": 217094, "epoch": 1794} {"train_loss": -39.92615509033203, "global_step": 217095, "epoch": 1794} {"train_loss": -37.44408416748047, "global_step": 217096, "epoch": 1794} {"train_loss": -38.8152961730957, "global_step": 217097, "epoch": 1794} {"train_loss": -39.88423538208008, "global_step": 217098, "epoch": 1794} {"train_loss": -39.041595458984375, "global_step": 217099, "epoch": 1794} {"train_loss": -39.3143310546875, "global_step": 217100, "epoch": 1794} {"train_loss": -37.0186767578125, "global_step": 217101, "epoch": 1794} {"train_loss": -39.9369010925293, "global_step": 217102, "epoch": 1794} {"train_loss": -39.61897659301758, "global_step": 217103, "epoch": 1794} {"train_loss": -40.256282806396484, "global_step": 217104, "epoch": 1794} {"train_loss": -39.5574836730957, "global_step": 217105, "epoch": 1794} {"train_loss": -40.59158706665039, "global_step": 217106, "epoch": 1794} {"train_loss": -40.51800537109375, "global_step": 217107, "epoch": 1794} {"train_loss": -41.02804183959961, "global_step": 217108, "epoch": 1794} {"train_loss": -40.03799057006836, "global_step": 217109, "epoch": 1794} {"train_loss": -41.23982620239258, "global_step": 217110, "epoch": 1794} {"train_loss": -40.499244689941406, "global_step": 217111, "epoch": 1794} {"train_loss": -38.08686447143555, "global_step": 217112, "epoch": 1794} {"train_loss": -40.55567932128906, "global_step": 217113, "epoch": 1794} {"train_loss": -40.553741455078125, "global_step": 217114, "epoch": 1794} {"train_loss": -39.613216400146484, "global_step": 217115, "epoch": 1794} {"train_loss": -41.40021896362305, "global_step": 217116, "epoch": 1794} {"train_loss": -40.95681381225586, "global_step": 217117, "epoch": 1794} {"train_loss": -40.994659423828125, "global_step": 217118, "epoch": 1794} {"train_loss": -40.896324157714844, "global_step": 217119, "epoch": 1794} {"train_loss": -40.88447952270508, "global_step": 217120, "epoch": 1794} {"train_loss": -40.77191162109375, "global_step": 217121, "epoch": 1794} {"train_loss": -40.5640983581543, "global_step": 217122, "epoch": 1794} {"train_loss": -40.97948455810547, "global_step": 217123, "epoch": 1794} {"train_loss": -41.583553314208984, "global_step": 217124, "epoch": 1794} {"train_loss": -40.94474411010742, "global_step": 217125, "epoch": 1794} {"train_loss": -41.09406280517578, "global_step": 217126, "epoch": 1794} {"train_loss": -41.53533935546875, "global_step": 217127, "epoch": 1794} {"train_loss": -41.63121795654297, "global_step": 217128, "epoch": 1794} {"train_loss": -41.661739349365234, "global_step": 217129, "epoch": 1794} {"train_loss": -40.95370101928711, "global_step": 217130, "epoch": 1794} {"train_loss": -40.0463981628418, "global_step": 217131, "epoch": 1794} {"train_loss": -41.51158905029297, "global_step": 217132, "epoch": 1794} {"train_loss": -40.68499755859375, "global_step": 217133, "epoch": 1794} {"train_loss": -41.2054328918457, "global_step": 217134, "epoch": 1794} {"train_loss": -41.99027633666992, "global_step": 217135, "epoch": 1794} {"train_loss": -41.9171028137207, "global_step": 217136, "epoch": 1794} {"train_loss": -41.26765823364258, "global_step": 217137, "epoch": 1794} {"train_loss": -42.2115478515625, "global_step": 217138, "epoch": 1794} {"train_loss": -41.7884635925293, "global_step": 217139, "epoch": 1794} {"train_loss": -41.99312210083008, "global_step": 217140, "epoch": 1794} {"train_loss": -42.30320358276367, "global_step": 217141, "epoch": 1794} {"train_loss": -40.85304641723633, "global_step": 217142, "epoch": 1794} {"train_loss": -42.131996154785156, "global_step": 217143, "epoch": 1794} {"train_loss": -42.270626068115234, "global_step": 217144, "epoch": 1794} {"train_loss": -42.361846923828125, "global_step": 217145, "epoch": 1794} {"train_loss": -41.93821334838867, "global_step": 217146, "epoch": 1794} {"train_loss": -42.295814514160156, "global_step": 217147, "epoch": 1794} {"train_loss": -42.08478927612305, "global_step": 217148, "epoch": 1794} {"train_loss": -42.47501754760742, "global_step": 217149, "epoch": 1794} {"train_loss": -42.12550735473633, "global_step": 217150, "epoch": 1794} {"train_loss": -42.30729675292969, "global_step": 217151, "epoch": 1794} {"train_loss": -42.17607498168945, "global_step": 217152, "epoch": 1794} {"train_loss": -42.63975524902344, "global_step": 217153, "epoch": 1794} {"train_loss": -42.44340515136719, "global_step": 217154, "epoch": 1794} {"train_loss": -42.36574172973633, "global_step": 217155, "epoch": 1794} {"train_loss": -42.6292724609375, "global_step": 217156, "epoch": 1794} {"train_loss": -42.963069915771484, "global_step": 217157, "epoch": 1794} {"train_loss": -42.41998291015625, "global_step": 217158, "epoch": 1794} {"train_loss": -42.7164306640625, "global_step": 217159, "epoch": 1794} {"train_loss": -42.40199661254883, "global_step": 217160, "epoch": 1794} {"train_loss": -43.05469512939453, "global_step": 217161, "epoch": 1794} {"train_loss": -42.49137496948242, "global_step": 217162, "epoch": 1794} {"train_loss": -42.63471603393555, "global_step": 217163, "epoch": 1794} {"train_loss": -43.1105842590332, "global_step": 217164, "epoch": 1794} {"train_loss": -42.4177360534668, "global_step": 217165, "epoch": 1794} {"train_loss": -42.94617462158203, "global_step": 217166, "epoch": 1794} {"train_loss": -42.84781265258789, "global_step": 217167, "epoch": 1794} {"train_loss": -42.27604293823242, "global_step": 217168, "epoch": 1794} {"train_loss": -42.54828643798828, "global_step": 217169, "epoch": 1794} {"train_loss": -42.849609375, "global_step": 217170, "epoch": 1794} {"train_loss": -42.64646530151367, "global_step": 217171, "epoch": 1794} {"train_loss": -42.72486114501953, "global_step": 217172, "epoch": 1794} {"train_loss": -42.58130645751953, "global_step": 217173, "epoch": 1794} {"train_loss": -42.88434600830078, "global_step": 217174, "epoch": 1794} {"train_loss": -42.58353042602539, "global_step": 217175, "epoch": 1794} {"train_loss": -43.132686614990234, "global_step": 217176, "epoch": 1794} {"train_loss": -42.72730255126953, "global_step": 217177, "epoch": 1794} {"train_loss": -42.953182220458984, "global_step": 217178, "epoch": 1794} {"train_loss": -42.81859588623047, "global_step": 217179, "epoch": 1794} {"train_loss": -42.59489059448242, "global_step": 217180, "epoch": 1794} {"train_loss": -42.596961975097656, "global_step": 217181, "epoch": 1794} {"train_loss": -43.040260314941406, "global_step": 217182, "epoch": 1794} {"train_loss": -43.27897262573242, "global_step": 217183, "epoch": 1794} {"train_loss": -43.04021072387695, "global_step": 217184, "epoch": 1794} {"train_loss": -43.15204620361328, "global_step": 217185, "epoch": 1794} {"train_loss": -43.249549865722656, "global_step": 217186, "epoch": 1794} {"train_loss": -42.25443649291992, "global_step": 217187, "epoch": 1794} {"train_loss": -42.79355239868164, "global_step": 217188, "epoch": 1794} {"train_loss": -43.1287727355957, "global_step": 217189, "epoch": 1794} {"train_loss": -43.19641876220703, "global_step": 217190, "epoch": 1794} {"train_loss": -42.4461669921875, "global_step": 217191, "epoch": 1794} {"train_loss": -41.990535736083984, "global_step": 217192, "epoch": 1794} {"train_loss": -42.0206298828125, "global_step": 217193, "epoch": 1794} {"train_loss": -40.76368659783986, "global_step": 217194, "epoch": 1794, "val_loss": 2660744.25} {"train_loss": -43.14289093017578, "global_step": 217195, "epoch": 1795} {"train_loss": -41.77531814575195, "global_step": 217196, "epoch": 1795} {"train_loss": -41.576080322265625, "global_step": 217197, "epoch": 1795} {"train_loss": -42.60276412963867, "global_step": 217198, "epoch": 1795} {"train_loss": -42.53377914428711, "global_step": 217199, "epoch": 1795} {"train_loss": -42.51716613769531, "global_step": 217200, "epoch": 1795} {"train_loss": -42.169647216796875, "global_step": 217201, "epoch": 1795} {"train_loss": -42.48955535888672, "global_step": 217202, "epoch": 1795} {"train_loss": -42.5180778503418, "global_step": 217203, "epoch": 1795} {"train_loss": -42.06992721557617, "global_step": 217204, "epoch": 1795} {"train_loss": -42.42002487182617, "global_step": 217205, "epoch": 1795} {"train_loss": -42.80153274536133, "global_step": 217206, "epoch": 1795} {"train_loss": -41.897701263427734, "global_step": 217207, "epoch": 1795} {"train_loss": -42.14195251464844, "global_step": 217208, "epoch": 1795} {"train_loss": -42.55876922607422, "global_step": 217209, "epoch": 1795} {"train_loss": -42.02283477783203, "global_step": 217210, "epoch": 1795} {"train_loss": -42.208343505859375, "global_step": 217211, "epoch": 1795} {"train_loss": -42.44465255737305, "global_step": 217212, "epoch": 1795} {"train_loss": -43.19651412963867, "global_step": 217213, "epoch": 1795} {"train_loss": -41.84556198120117, "global_step": 217214, "epoch": 1795} {"train_loss": -41.811153411865234, "global_step": 217215, "epoch": 1795} {"train_loss": -42.5988655090332, "global_step": 217216, "epoch": 1795} {"train_loss": -42.44404983520508, "global_step": 217217, "epoch": 1795} {"train_loss": -43.023616790771484, "global_step": 217218, "epoch": 1795} {"train_loss": -41.98512649536133, "global_step": 217219, "epoch": 1795} {"train_loss": -41.891387939453125, "global_step": 217220, "epoch": 1795} {"train_loss": -42.29359817504883, "global_step": 217221, "epoch": 1795} {"train_loss": -41.14448928833008, "global_step": 217222, "epoch": 1795} {"train_loss": -41.37453842163086, "global_step": 217223, "epoch": 1795} {"train_loss": -41.82598876953125, "global_step": 217224, "epoch": 1795} {"train_loss": -39.977291107177734, "global_step": 217225, "epoch": 1795} {"train_loss": -40.56843185424805, "global_step": 217226, "epoch": 1795} {"train_loss": -41.470699310302734, "global_step": 217227, "epoch": 1795} {"train_loss": -39.04665756225586, "global_step": 217228, "epoch": 1795} {"train_loss": -42.63367462158203, "global_step": 217229, "epoch": 1795} {"train_loss": -40.48822021484375, "global_step": 217230, "epoch": 1795} {"train_loss": -41.9290657043457, "global_step": 217231, "epoch": 1795} {"train_loss": -36.572818756103516, "global_step": 217232, "epoch": 1795} {"train_loss": -37.696022033691406, "global_step": 217233, "epoch": 1795} {"train_loss": -39.99876403808594, "global_step": 217234, "epoch": 1795} {"train_loss": -38.80780792236328, "global_step": 217235, "epoch": 1795} {"train_loss": -38.66123962402344, "global_step": 217236, "epoch": 1795} {"train_loss": -41.11876678466797, "global_step": 217237, "epoch": 1795} {"train_loss": -38.19131088256836, "global_step": 217238, "epoch": 1795} {"train_loss": -40.578285217285156, "global_step": 217239, "epoch": 1795} {"train_loss": -39.68838119506836, "global_step": 217240, "epoch": 1795} {"train_loss": -38.66266632080078, "global_step": 217241, "epoch": 1795} {"train_loss": -40.670166015625, "global_step": 217242, "epoch": 1795} {"train_loss": -40.59843826293945, "global_step": 217243, "epoch": 1795} {"train_loss": -40.454708099365234, "global_step": 217244, "epoch": 1795} {"train_loss": -38.59086227416992, "global_step": 217245, "epoch": 1795} {"train_loss": -37.349037170410156, "global_step": 217246, "epoch": 1795} {"train_loss": -40.9527587890625, "global_step": 217247, "epoch": 1795} {"train_loss": -40.463287353515625, "global_step": 217248, "epoch": 1795} {"train_loss": -39.11069869995117, "global_step": 217249, "epoch": 1795} {"train_loss": -39.95087814331055, "global_step": 217250, "epoch": 1795} {"train_loss": -41.05494689941406, "global_step": 217251, "epoch": 1795} {"train_loss": -39.125267028808594, "global_step": 217252, "epoch": 1795} {"train_loss": -39.8116455078125, "global_step": 217253, "epoch": 1795} {"train_loss": -40.98023223876953, "global_step": 217254, "epoch": 1795} {"train_loss": -37.77126693725586, "global_step": 217255, "epoch": 1795} {"train_loss": -41.00305938720703, "global_step": 217256, "epoch": 1795} {"train_loss": -41.08070755004883, "global_step": 217257, "epoch": 1795} {"train_loss": -41.356170654296875, "global_step": 217258, "epoch": 1795} {"train_loss": -41.323726654052734, "global_step": 217259, "epoch": 1795} {"train_loss": -41.29400634765625, "global_step": 217260, "epoch": 1795} {"train_loss": -41.73283004760742, "global_step": 217261, "epoch": 1795} {"train_loss": -41.2945671081543, "global_step": 217262, "epoch": 1795} {"train_loss": -40.219940185546875, "global_step": 217263, "epoch": 1795} {"train_loss": -42.06112289428711, "global_step": 217264, "epoch": 1795} {"train_loss": -41.85285186767578, "global_step": 217265, "epoch": 1795} {"train_loss": -41.71017074584961, "global_step": 217266, "epoch": 1795} {"train_loss": -41.549293518066406, "global_step": 217267, "epoch": 1795} {"train_loss": -41.754417419433594, "global_step": 217268, "epoch": 1795} {"train_loss": -42.20893096923828, "global_step": 217269, "epoch": 1795} {"train_loss": -41.9604606628418, "global_step": 217270, "epoch": 1795} {"train_loss": -42.19375991821289, "global_step": 217271, "epoch": 1795} {"train_loss": -40.63898468017578, "global_step": 217272, "epoch": 1795} {"train_loss": -41.79567337036133, "global_step": 217273, "epoch": 1795} {"train_loss": -42.230079650878906, "global_step": 217274, "epoch": 1795} {"train_loss": -42.19964599609375, "global_step": 217275, "epoch": 1795} {"train_loss": -41.39178466796875, "global_step": 217276, "epoch": 1795} {"train_loss": -42.26898193359375, "global_step": 217277, "epoch": 1795} {"train_loss": -42.39425277709961, "global_step": 217278, "epoch": 1795} {"train_loss": -42.563812255859375, "global_step": 217279, "epoch": 1795} {"train_loss": -42.541534423828125, "global_step": 217280, "epoch": 1795} {"train_loss": -42.42947006225586, "global_step": 217281, "epoch": 1795} {"train_loss": -42.52383041381836, "global_step": 217282, "epoch": 1795} {"train_loss": -42.39567184448242, "global_step": 217283, "epoch": 1795} {"train_loss": -41.91019058227539, "global_step": 217284, "epoch": 1795} {"train_loss": -42.46540451049805, "global_step": 217285, "epoch": 1795} {"train_loss": -42.92558670043945, "global_step": 217286, "epoch": 1795} {"train_loss": -42.25613021850586, "global_step": 217287, "epoch": 1795} {"train_loss": -42.00069046020508, "global_step": 217288, "epoch": 1795} {"train_loss": -41.364479064941406, "global_step": 217289, "epoch": 1795} {"train_loss": -40.79882049560547, "global_step": 217290, "epoch": 1795} {"train_loss": -42.98102569580078, "global_step": 217291, "epoch": 1795} {"train_loss": -42.148311614990234, "global_step": 217292, "epoch": 1795} {"train_loss": -41.6069450378418, "global_step": 217293, "epoch": 1795} {"train_loss": -42.362667083740234, "global_step": 217294, "epoch": 1795} {"train_loss": -42.10455322265625, "global_step": 217295, "epoch": 1795} {"train_loss": -40.5703239440918, "global_step": 217296, "epoch": 1795} {"train_loss": -41.831092834472656, "global_step": 217297, "epoch": 1795} {"train_loss": -42.51951599121094, "global_step": 217298, "epoch": 1795} {"train_loss": -41.558250427246094, "global_step": 217299, "epoch": 1795} {"train_loss": -42.4647216796875, "global_step": 217300, "epoch": 1795} {"train_loss": -39.76177215576172, "global_step": 217301, "epoch": 1795} {"train_loss": -41.18375778198242, "global_step": 217302, "epoch": 1795} {"train_loss": -43.185394287109375, "global_step": 217303, "epoch": 1795} {"train_loss": -42.092010498046875, "global_step": 217304, "epoch": 1795} {"train_loss": -41.75027084350586, "global_step": 217305, "epoch": 1795} {"train_loss": -42.91168212890625, "global_step": 217306, "epoch": 1795} {"train_loss": -42.0528678894043, "global_step": 217307, "epoch": 1795} {"train_loss": -42.44747543334961, "global_step": 217308, "epoch": 1795} {"train_loss": -42.83274841308594, "global_step": 217309, "epoch": 1795} {"train_loss": -42.40559768676758, "global_step": 217310, "epoch": 1795} {"train_loss": -42.6682243347168, "global_step": 217311, "epoch": 1795} {"train_loss": -42.59617233276367, "global_step": 217312, "epoch": 1795} {"train_loss": -40.56807327270508, "global_step": 217313, "epoch": 1795} {"train_loss": -42.747676849365234, "global_step": 217314, "epoch": 1795} {"train_loss": -41.44807115665152, "global_step": 217315, "epoch": 1795, "val_loss": 2485049.25} {"train_loss": -42.80733871459961, "global_step": 217316, "epoch": 1796} {"train_loss": -43.103458404541016, "global_step": 217317, "epoch": 1796} {"train_loss": -42.34612274169922, "global_step": 217318, "epoch": 1796} {"train_loss": -41.489105224609375, "global_step": 217319, "epoch": 1796} {"train_loss": -42.773494720458984, "global_step": 217320, "epoch": 1796} {"train_loss": -42.35898971557617, "global_step": 217321, "epoch": 1796} {"train_loss": -42.332847595214844, "global_step": 217322, "epoch": 1796} {"train_loss": -43.17668151855469, "global_step": 217323, "epoch": 1796} {"train_loss": -41.98674392700195, "global_step": 217324, "epoch": 1796} {"train_loss": -42.69452667236328, "global_step": 217325, "epoch": 1796} {"train_loss": -42.705440521240234, "global_step": 217326, "epoch": 1796} {"train_loss": -41.538814544677734, "global_step": 217327, "epoch": 1796} {"train_loss": -41.95284652709961, "global_step": 217328, "epoch": 1796} {"train_loss": -43.1898307800293, "global_step": 217329, "epoch": 1796} {"train_loss": -43.098453521728516, "global_step": 217330, "epoch": 1796} {"train_loss": -41.44316482543945, "global_step": 217331, "epoch": 1796} {"train_loss": -43.309207916259766, "global_step": 217332, "epoch": 1796} {"train_loss": -42.17938232421875, "global_step": 217333, "epoch": 1796} {"train_loss": -42.40024948120117, "global_step": 217334, "epoch": 1796} {"train_loss": -41.70273971557617, "global_step": 217335, "epoch": 1796} {"train_loss": -41.9083366394043, "global_step": 217336, "epoch": 1796} {"train_loss": -43.12049865722656, "global_step": 217337, "epoch": 1796} {"train_loss": -41.79872131347656, "global_step": 217338, "epoch": 1796} {"train_loss": -41.690242767333984, "global_step": 217339, "epoch": 1796} {"train_loss": -41.88724899291992, "global_step": 217340, "epoch": 1796} {"train_loss": -43.1845817565918, "global_step": 217341, "epoch": 1796} {"train_loss": -40.18450927734375, "global_step": 217342, "epoch": 1796} {"train_loss": -42.09876251220703, "global_step": 217343, "epoch": 1796} {"train_loss": -42.74639892578125, "global_step": 217344, "epoch": 1796} {"train_loss": -42.084651947021484, "global_step": 217345, "epoch": 1796} {"train_loss": -41.99357604980469, "global_step": 217346, "epoch": 1796} {"train_loss": -42.54639434814453, "global_step": 217347, "epoch": 1796} {"train_loss": -42.24728012084961, "global_step": 217348, "epoch": 1796} {"train_loss": -42.65609359741211, "global_step": 217349, "epoch": 1796} {"train_loss": -30.33186149597168, "global_step": 217350, "epoch": 1796} {"train_loss": -41.9931755065918, "global_step": 217351, "epoch": 1796} {"train_loss": -42.108009338378906, "global_step": 217352, "epoch": 1796} {"train_loss": -42.47795486450195, "global_step": 217353, "epoch": 1796} {"train_loss": -42.215087890625, "global_step": 217354, "epoch": 1796} {"train_loss": -41.70853805541992, "global_step": 217355, "epoch": 1796} {"train_loss": -41.59934997558594, "global_step": 217356, "epoch": 1796} {"train_loss": -42.41393280029297, "global_step": 217357, "epoch": 1796} {"train_loss": -42.35443878173828, "global_step": 217358, "epoch": 1796} {"train_loss": -41.63483810424805, "global_step": 217359, "epoch": 1796} {"train_loss": -42.3016357421875, "global_step": 217360, "epoch": 1796} {"train_loss": -42.29500198364258, "global_step": 217361, "epoch": 1796} {"train_loss": -42.107810974121094, "global_step": 217362, "epoch": 1796} {"train_loss": -42.062400817871094, "global_step": 217363, "epoch": 1796} {"train_loss": -41.86652374267578, "global_step": 217364, "epoch": 1796} {"train_loss": -42.165069580078125, "global_step": 217365, "epoch": 1796} {"train_loss": -42.97434616088867, "global_step": 217366, "epoch": 1796} {"train_loss": -42.38956069946289, "global_step": 217367, "epoch": 1796} {"train_loss": -42.767818450927734, "global_step": 217368, "epoch": 1796} {"train_loss": -41.6838493347168, "global_step": 217369, "epoch": 1796} {"train_loss": -42.02535629272461, "global_step": 217370, "epoch": 1796} {"train_loss": -42.0712776184082, "global_step": 217371, "epoch": 1796} {"train_loss": -41.353973388671875, "global_step": 217372, "epoch": 1796} {"train_loss": -42.9220085144043, "global_step": 217373, "epoch": 1796} {"train_loss": -42.361724853515625, "global_step": 217374, "epoch": 1796} {"train_loss": -42.4140510559082, "global_step": 217375, "epoch": 1796} {"train_loss": -42.75046157836914, "global_step": 217376, "epoch": 1796} {"train_loss": -42.599063873291016, "global_step": 217377, "epoch": 1796} {"train_loss": -42.88324737548828, "global_step": 217378, "epoch": 1796} {"train_loss": -43.0011100769043, "global_step": 217379, "epoch": 1796} {"train_loss": -42.400238037109375, "global_step": 217380, "epoch": 1796} {"train_loss": -42.82790756225586, "global_step": 217381, "epoch": 1796} {"train_loss": -41.341060638427734, "global_step": 217382, "epoch": 1796} {"train_loss": -42.72883224487305, "global_step": 217383, "epoch": 1796} {"train_loss": -41.75133514404297, "global_step": 217384, "epoch": 1796} {"train_loss": -42.63840866088867, "global_step": 217385, "epoch": 1796} {"train_loss": -42.342010498046875, "global_step": 217386, "epoch": 1796} {"train_loss": -43.10341262817383, "global_step": 217387, "epoch": 1796} {"train_loss": -43.030025482177734, "global_step": 217388, "epoch": 1796} {"train_loss": -41.66066360473633, "global_step": 217389, "epoch": 1796} {"train_loss": -41.61745071411133, "global_step": 217390, "epoch": 1796} {"train_loss": -40.90945053100586, "global_step": 217391, "epoch": 1796} {"train_loss": -40.7872314453125, "global_step": 217392, "epoch": 1796} {"train_loss": -40.583892822265625, "global_step": 217393, "epoch": 1796} {"train_loss": -41.12104034423828, "global_step": 217394, "epoch": 1796} {"train_loss": -42.758544921875, "global_step": 217395, "epoch": 1796} {"train_loss": -42.52934646606445, "global_step": 217396, "epoch": 1796} {"train_loss": -41.76142120361328, "global_step": 217397, "epoch": 1796} {"train_loss": -39.34246826171875, "global_step": 217398, "epoch": 1796} {"train_loss": -41.52107620239258, "global_step": 217399, "epoch": 1796} {"train_loss": -42.249202728271484, "global_step": 217400, "epoch": 1796} {"train_loss": -41.34932327270508, "global_step": 217401, "epoch": 1796} {"train_loss": -40.9847526550293, "global_step": 217402, "epoch": 1796} {"train_loss": -42.077781677246094, "global_step": 217403, "epoch": 1796} {"train_loss": -42.2505989074707, "global_step": 217404, "epoch": 1796} {"train_loss": -41.6775016784668, "global_step": 217405, "epoch": 1796} {"train_loss": -41.60689926147461, "global_step": 217406, "epoch": 1796} {"train_loss": -42.07932662963867, "global_step": 217407, "epoch": 1796} {"train_loss": -41.86167526245117, "global_step": 217408, "epoch": 1796} {"train_loss": -42.669349670410156, "global_step": 217409, "epoch": 1796} {"train_loss": -42.31388473510742, "global_step": 217410, "epoch": 1796} {"train_loss": -41.1263427734375, "global_step": 217411, "epoch": 1796} {"train_loss": -42.0091667175293, "global_step": 217412, "epoch": 1796} {"train_loss": -42.21841049194336, "global_step": 217413, "epoch": 1796} {"train_loss": -40.98804473876953, "global_step": 217414, "epoch": 1796} {"train_loss": -41.5179443359375, "global_step": 217415, "epoch": 1796} {"train_loss": -41.819061279296875, "global_step": 217416, "epoch": 1796} {"train_loss": -41.393829345703125, "global_step": 217417, "epoch": 1796} {"train_loss": -42.516990661621094, "global_step": 217418, "epoch": 1796} {"train_loss": -41.620967864990234, "global_step": 217419, "epoch": 1796} {"train_loss": -41.324127197265625, "global_step": 217420, "epoch": 1796} {"train_loss": -42.55465316772461, "global_step": 217421, "epoch": 1796} {"train_loss": -41.2528190612793, "global_step": 217422, "epoch": 1796} {"train_loss": -39.61689376831055, "global_step": 217423, "epoch": 1796} {"train_loss": -40.17332077026367, "global_step": 217424, "epoch": 1796} {"train_loss": -41.415870666503906, "global_step": 217425, "epoch": 1796} {"train_loss": -40.44305419921875, "global_step": 217426, "epoch": 1796} {"train_loss": -42.15646743774414, "global_step": 217427, "epoch": 1796} {"train_loss": -40.63886260986328, "global_step": 217428, "epoch": 1796} {"train_loss": -38.70523452758789, "global_step": 217429, "epoch": 1796} {"train_loss": -34.63471221923828, "global_step": 217430, "epoch": 1796} {"train_loss": -41.60248947143555, "global_step": 217431, "epoch": 1796} {"train_loss": -35.64321517944336, "global_step": 217432, "epoch": 1796} {"train_loss": -39.63386917114258, "global_step": 217433, "epoch": 1796} {"train_loss": -40.94211196899414, "global_step": 217434, "epoch": 1796} {"train_loss": -39.62949752807617, "global_step": 217435, "epoch": 1796} {"train_loss": -41.709348899273834, "global_step": 217436, "epoch": 1796, "val_loss": 3025183.0} {"train_loss": -40.52320098876953, "global_step": 217437, "epoch": 1797} {"train_loss": -37.778358459472656, "global_step": 217438, "epoch": 1797} {"train_loss": -17.6527099609375, "global_step": 217439, "epoch": 1797} {"train_loss": -36.873023986816406, "global_step": 217440, "epoch": 1797} {"train_loss": -34.69684600830078, "global_step": 217441, "epoch": 1797} {"train_loss": -27.68098258972168, "global_step": 217442, "epoch": 1797} {"train_loss": -16.110280990600586, "global_step": 217443, "epoch": 1797} {"train_loss": -28.45271110534668, "global_step": 217444, "epoch": 1797} {"train_loss": -34.67830276489258, "global_step": 217445, "epoch": 1797} {"train_loss": -24.588403701782227, "global_step": 217446, "epoch": 1797} {"train_loss": -8.08232307434082, "global_step": 217447, "epoch": 1797} {"train_loss": -20.653667449951172, "global_step": 217448, "epoch": 1797} {"train_loss": -29.386152267456055, "global_step": 217449, "epoch": 1797} {"train_loss": -11.83066463470459, "global_step": 217450, "epoch": 1797} {"train_loss": -32.01201629638672, "global_step": 217451, "epoch": 1797} {"train_loss": -26.07710075378418, "global_step": 217452, "epoch": 1797} {"train_loss": -20.091632843017578, "global_step": 217453, "epoch": 1797} {"train_loss": -25.159883499145508, "global_step": 217454, "epoch": 1797} {"train_loss": -30.976016998291016, "global_step": 217455, "epoch": 1797} {"train_loss": -33.20838165283203, "global_step": 217456, "epoch": 1797} {"train_loss": -27.149250030517578, "global_step": 217457, "epoch": 1797} {"train_loss": -30.96821403503418, "global_step": 217458, "epoch": 1797} {"train_loss": -31.796493530273438, "global_step": 217459, "epoch": 1797} {"train_loss": -32.986366271972656, "global_step": 217460, "epoch": 1797} {"train_loss": -35.228057861328125, "global_step": 217461, "epoch": 1797} {"train_loss": -35.389827728271484, "global_step": 217462, "epoch": 1797} {"train_loss": -32.367122650146484, "global_step": 217463, "epoch": 1797} {"train_loss": -35.746395111083984, "global_step": 217464, "epoch": 1797} {"train_loss": -32.98725509643555, "global_step": 217465, "epoch": 1797} {"train_loss": -35.57334518432617, "global_step": 217466, "epoch": 1797} {"train_loss": -34.87885284423828, "global_step": 217467, "epoch": 1797} {"train_loss": -37.22005844116211, "global_step": 217468, "epoch": 1797} {"train_loss": -35.98270797729492, "global_step": 217469, "epoch": 1797} {"train_loss": -37.1853141784668, "global_step": 217470, "epoch": 1797} {"train_loss": -34.21550369262695, "global_step": 217471, "epoch": 1797} {"train_loss": -35.64683151245117, "global_step": 217472, "epoch": 1797} {"train_loss": -35.874481201171875, "global_step": 217473, "epoch": 1797} {"train_loss": -36.03186798095703, "global_step": 217474, "epoch": 1797} {"train_loss": -35.40949249267578, "global_step": 217475, "epoch": 1797} {"train_loss": -34.859230041503906, "global_step": 217476, "epoch": 1797} {"train_loss": -36.88038635253906, "global_step": 217477, "epoch": 1797} {"train_loss": -36.43513107299805, "global_step": 217478, "epoch": 1797} {"train_loss": -35.190284729003906, "global_step": 217479, "epoch": 1797} {"train_loss": -36.380706787109375, "global_step": 217480, "epoch": 1797} {"train_loss": -37.51972198486328, "global_step": 217481, "epoch": 1797} {"train_loss": -37.04370880126953, "global_step": 217482, "epoch": 1797} {"train_loss": -36.77522277832031, "global_step": 217483, "epoch": 1797} {"train_loss": -37.23964309692383, "global_step": 217484, "epoch": 1797} {"train_loss": -37.10541915893555, "global_step": 217485, "epoch": 1797} {"train_loss": -37.175594329833984, "global_step": 217486, "epoch": 1797} {"train_loss": -36.41768264770508, "global_step": 217487, "epoch": 1797} {"train_loss": -36.494415283203125, "global_step": 217488, "epoch": 1797} {"train_loss": -36.912452697753906, "global_step": 217489, "epoch": 1797} {"train_loss": -37.2878532409668, "global_step": 217490, "epoch": 1797} {"train_loss": -37.082733154296875, "global_step": 217491, "epoch": 1797} {"train_loss": -36.9964485168457, "global_step": 217492, "epoch": 1797} {"train_loss": -37.02708053588867, "global_step": 217493, "epoch": 1797} {"train_loss": -37.18256759643555, "global_step": 217494, "epoch": 1797} {"train_loss": -36.966312408447266, "global_step": 217495, "epoch": 1797} {"train_loss": -37.33994674682617, "global_step": 217496, "epoch": 1797} {"train_loss": -37.29518127441406, "global_step": 217497, "epoch": 1797} {"train_loss": -37.90639114379883, "global_step": 217498, "epoch": 1797} {"train_loss": -38.46826171875, "global_step": 217499, "epoch": 1797} {"train_loss": -38.67499923706055, "global_step": 217500, "epoch": 1797} {"train_loss": -37.3145866394043, "global_step": 217501, "epoch": 1797} {"train_loss": -38.41510772705078, "global_step": 217502, "epoch": 1797} {"train_loss": -38.8306884765625, "global_step": 217503, "epoch": 1797} {"train_loss": -38.875823974609375, "global_step": 217504, "epoch": 1797} {"train_loss": -38.166194915771484, "global_step": 217505, "epoch": 1797} {"train_loss": -37.7840461730957, "global_step": 217506, "epoch": 1797} {"train_loss": -37.327388763427734, "global_step": 217507, "epoch": 1797} {"train_loss": -38.18335723876953, "global_step": 217508, "epoch": 1797} {"train_loss": -38.36386489868164, "global_step": 217509, "epoch": 1797} {"train_loss": -38.48792266845703, "global_step": 217510, "epoch": 1797} {"train_loss": -38.87866973876953, "global_step": 217511, "epoch": 1797} {"train_loss": -39.09211349487305, "global_step": 217512, "epoch": 1797} {"train_loss": -39.05109405517578, "global_step": 217513, "epoch": 1797} {"train_loss": -38.7304801940918, "global_step": 217514, "epoch": 1797} {"train_loss": -38.78468322753906, "global_step": 217515, "epoch": 1797} {"train_loss": -38.72758865356445, "global_step": 217516, "epoch": 1797} {"train_loss": -38.41498947143555, "global_step": 217517, "epoch": 1797} {"train_loss": -39.21516799926758, "global_step": 217518, "epoch": 1797} {"train_loss": -38.852508544921875, "global_step": 217519, "epoch": 1797} {"train_loss": -38.72201156616211, "global_step": 217520, "epoch": 1797} {"train_loss": -39.06950759887695, "global_step": 217521, "epoch": 1797} {"train_loss": -37.81051254272461, "global_step": 217522, "epoch": 1797} {"train_loss": -39.06913375854492, "global_step": 217523, "epoch": 1797} {"train_loss": -38.73828887939453, "global_step": 217524, "epoch": 1797} {"train_loss": -39.332923889160156, "global_step": 217525, "epoch": 1797} {"train_loss": -39.1673583984375, "global_step": 217526, "epoch": 1797} {"train_loss": -38.272857666015625, "global_step": 217527, "epoch": 1797} {"train_loss": -38.378292083740234, "global_step": 217528, "epoch": 1797} {"train_loss": -39.48493194580078, "global_step": 217529, "epoch": 1797} {"train_loss": -40.021358489990234, "global_step": 217530, "epoch": 1797} {"train_loss": -39.69834518432617, "global_step": 217531, "epoch": 1797} {"train_loss": -39.06421661376953, "global_step": 217532, "epoch": 1797} {"train_loss": -38.67711639404297, "global_step": 217533, "epoch": 1797} {"train_loss": -38.76929473876953, "global_step": 217534, "epoch": 1797} {"train_loss": -39.25808334350586, "global_step": 217535, "epoch": 1797} {"train_loss": -38.39459228515625, "global_step": 217536, "epoch": 1797} {"train_loss": -40.077388763427734, "global_step": 217537, "epoch": 1797} {"train_loss": -39.410465240478516, "global_step": 217538, "epoch": 1797} {"train_loss": -39.239662170410156, "global_step": 217539, "epoch": 1797} {"train_loss": -39.470211029052734, "global_step": 217540, "epoch": 1797} {"train_loss": -38.82552719116211, "global_step": 217541, "epoch": 1797} {"train_loss": -39.309814453125, "global_step": 217542, "epoch": 1797} {"train_loss": -39.711456298828125, "global_step": 217543, "epoch": 1797} {"train_loss": -39.42289733886719, "global_step": 217544, "epoch": 1797} {"train_loss": -39.74949264526367, "global_step": 217545, "epoch": 1797} {"train_loss": -40.101806640625, "global_step": 217546, "epoch": 1797} {"train_loss": -40.29977035522461, "global_step": 217547, "epoch": 1797} {"train_loss": -40.6920280456543, "global_step": 217548, "epoch": 1797} {"train_loss": -39.30599594116211, "global_step": 217549, "epoch": 1797} {"train_loss": -39.76655960083008, "global_step": 217550, "epoch": 1797} {"train_loss": -40.08368682861328, "global_step": 217551, "epoch": 1797} {"train_loss": -40.24761962890625, "global_step": 217552, "epoch": 1797} {"train_loss": -39.80592727661133, "global_step": 217553, "epoch": 1797} {"train_loss": -39.33674240112305, "global_step": 217554, "epoch": 1797} {"train_loss": -39.029380798339844, "global_step": 217555, "epoch": 1797} {"train_loss": -39.59151840209961, "global_step": 217556, "epoch": 1797} {"train_loss": -35.88033437334801, "global_step": 217557, "epoch": 1797, "val_loss": 2758629.75} {"train_loss": -39.07061767578125, "global_step": 217558, "epoch": 1798} {"train_loss": -39.64680099487305, "global_step": 217559, "epoch": 1798} {"train_loss": -40.689674377441406, "global_step": 217560, "epoch": 1798} {"train_loss": -40.20117950439453, "global_step": 217561, "epoch": 1798} {"train_loss": -40.44295883178711, "global_step": 217562, "epoch": 1798} {"train_loss": -40.6323127746582, "global_step": 217563, "epoch": 1798} {"train_loss": -40.26588821411133, "global_step": 217564, "epoch": 1798} {"train_loss": -39.557281494140625, "global_step": 217565, "epoch": 1798} {"train_loss": -40.586097717285156, "global_step": 217566, "epoch": 1798} {"train_loss": -40.748226165771484, "global_step": 217567, "epoch": 1798} {"train_loss": -40.54767608642578, "global_step": 217568, "epoch": 1798} {"train_loss": -40.31880569458008, "global_step": 217569, "epoch": 1798} {"train_loss": -40.60002517700195, "global_step": 217570, "epoch": 1798} {"train_loss": -40.397727966308594, "global_step": 217571, "epoch": 1798} {"train_loss": -40.217315673828125, "global_step": 217572, "epoch": 1798} {"train_loss": -39.22579574584961, "global_step": 217573, "epoch": 1798} {"train_loss": -40.58336639404297, "global_step": 217574, "epoch": 1798} {"train_loss": -41.322147369384766, "global_step": 217575, "epoch": 1798} {"train_loss": -40.01641845703125, "global_step": 217576, "epoch": 1798} {"train_loss": -40.62351608276367, "global_step": 217577, "epoch": 1798} {"train_loss": -40.76628494262695, "global_step": 217578, "epoch": 1798} {"train_loss": -40.66572952270508, "global_step": 217579, "epoch": 1798} {"train_loss": -40.49598693847656, "global_step": 217580, "epoch": 1798} {"train_loss": -41.1504020690918, "global_step": 217581, "epoch": 1798} {"train_loss": -40.8521842956543, "global_step": 217582, "epoch": 1798} {"train_loss": -40.71257781982422, "global_step": 217583, "epoch": 1798} {"train_loss": -41.07521057128906, "global_step": 217584, "epoch": 1798} {"train_loss": -41.132659912109375, "global_step": 217585, "epoch": 1798} {"train_loss": -40.691505432128906, "global_step": 217586, "epoch": 1798} {"train_loss": -41.422218322753906, "global_step": 217587, "epoch": 1798} {"train_loss": -39.9468994140625, "global_step": 217588, "epoch": 1798} {"train_loss": -40.52216339111328, "global_step": 217589, "epoch": 1798} {"train_loss": -41.07493209838867, "global_step": 217590, "epoch": 1798} {"train_loss": -40.779048919677734, "global_step": 217591, "epoch": 1798} {"train_loss": -41.52457046508789, "global_step": 217592, "epoch": 1798} {"train_loss": -40.49418640136719, "global_step": 217593, "epoch": 1798} {"train_loss": -40.794189453125, "global_step": 217594, "epoch": 1798} {"train_loss": -40.75532913208008, "global_step": 217595, "epoch": 1798} {"train_loss": -41.275978088378906, "global_step": 217596, "epoch": 1798} {"train_loss": -41.34489059448242, "global_step": 217597, "epoch": 1798} {"train_loss": -41.149742126464844, "global_step": 217598, "epoch": 1798} {"train_loss": -40.00318145751953, "global_step": 217599, "epoch": 1798} {"train_loss": -42.09598922729492, "global_step": 217600, "epoch": 1798} {"train_loss": -41.64997482299805, "global_step": 217601, "epoch": 1798} {"train_loss": -41.81940841674805, "global_step": 217602, "epoch": 1798} {"train_loss": -40.35856628417969, "global_step": 217603, "epoch": 1798} {"train_loss": -40.92295455932617, "global_step": 217604, "epoch": 1798} {"train_loss": -40.852237701416016, "global_step": 217605, "epoch": 1798} {"train_loss": -41.05522537231445, "global_step": 217606, "epoch": 1798} {"train_loss": -41.817630767822266, "global_step": 217607, "epoch": 1798} {"train_loss": -40.362815856933594, "global_step": 217608, "epoch": 1798} {"train_loss": -41.06905746459961, "global_step": 217609, "epoch": 1798} {"train_loss": -41.14992904663086, "global_step": 217610, "epoch": 1798} {"train_loss": -40.88649368286133, "global_step": 217611, "epoch": 1798} {"train_loss": -40.33669662475586, "global_step": 217612, "epoch": 1798} {"train_loss": -40.0541877746582, "global_step": 217613, "epoch": 1798} {"train_loss": -40.76980209350586, "global_step": 217614, "epoch": 1798} {"train_loss": -41.1868896484375, "global_step": 217615, "epoch": 1798} {"train_loss": -39.163265228271484, "global_step": 217616, "epoch": 1798} {"train_loss": -40.07480239868164, "global_step": 217617, "epoch": 1798} {"train_loss": -41.37519073486328, "global_step": 217618, "epoch": 1798} {"train_loss": -40.186031341552734, "global_step": 217619, "epoch": 1798} {"train_loss": -39.840084075927734, "global_step": 217620, "epoch": 1798} {"train_loss": -40.77735900878906, "global_step": 217621, "epoch": 1798} {"train_loss": -41.18927001953125, "global_step": 217622, "epoch": 1798} {"train_loss": -39.82855224609375, "global_step": 217623, "epoch": 1798} {"train_loss": -40.218929290771484, "global_step": 217624, "epoch": 1798} {"train_loss": -41.40707778930664, "global_step": 217625, "epoch": 1798} {"train_loss": -37.49017333984375, "global_step": 217626, "epoch": 1798} {"train_loss": -39.785186767578125, "global_step": 217627, "epoch": 1798} {"train_loss": -39.99925231933594, "global_step": 217628, "epoch": 1798} {"train_loss": -39.221221923828125, "global_step": 217629, "epoch": 1798} {"train_loss": -39.049739837646484, "global_step": 217630, "epoch": 1798} {"train_loss": -40.679176330566406, "global_step": 217631, "epoch": 1798} {"train_loss": -38.95177459716797, "global_step": 217632, "epoch": 1798} {"train_loss": -40.79879379272461, "global_step": 217633, "epoch": 1798} {"train_loss": -40.697757720947266, "global_step": 217634, "epoch": 1798} {"train_loss": -40.21004867553711, "global_step": 217635, "epoch": 1798} {"train_loss": -40.903804779052734, "global_step": 217636, "epoch": 1798} {"train_loss": -40.868309020996094, "global_step": 217637, "epoch": 1798} {"train_loss": -40.180721282958984, "global_step": 217638, "epoch": 1798} {"train_loss": -41.10649871826172, "global_step": 217639, "epoch": 1798} {"train_loss": -40.65670394897461, "global_step": 217640, "epoch": 1798} {"train_loss": -40.68296432495117, "global_step": 217641, "epoch": 1798} {"train_loss": -39.56925582885742, "global_step": 217642, "epoch": 1798} {"train_loss": -40.391090393066406, "global_step": 217643, "epoch": 1798} {"train_loss": -40.7833251953125, "global_step": 217644, "epoch": 1798} {"train_loss": -40.529205322265625, "global_step": 217645, "epoch": 1798} {"train_loss": -41.28370666503906, "global_step": 217646, "epoch": 1798} {"train_loss": -41.26316452026367, "global_step": 217647, "epoch": 1798} {"train_loss": -41.56721878051758, "global_step": 217648, "epoch": 1798} {"train_loss": -41.268184661865234, "global_step": 217649, "epoch": 1798} {"train_loss": -41.57306671142578, "global_step": 217650, "epoch": 1798} {"train_loss": -40.97496795654297, "global_step": 217651, "epoch": 1798} {"train_loss": -41.08325958251953, "global_step": 217652, "epoch": 1798} {"train_loss": -41.002567291259766, "global_step": 217653, "epoch": 1798} {"train_loss": -40.76799011230469, "global_step": 217654, "epoch": 1798} {"train_loss": -41.496986389160156, "global_step": 217655, "epoch": 1798} {"train_loss": -41.6645393371582, "global_step": 217656, "epoch": 1798} {"train_loss": -41.64164352416992, "global_step": 217657, "epoch": 1798} {"train_loss": -41.721187591552734, "global_step": 217658, "epoch": 1798} {"train_loss": -40.82095718383789, "global_step": 217659, "epoch": 1798} {"train_loss": -41.842041015625, "global_step": 217660, "epoch": 1798} {"train_loss": -41.756954193115234, "global_step": 217661, "epoch": 1798} {"train_loss": -41.890625, "global_step": 217662, "epoch": 1798} {"train_loss": -41.993736267089844, "global_step": 217663, "epoch": 1798} {"train_loss": -41.142486572265625, "global_step": 217664, "epoch": 1798} {"train_loss": -41.24104690551758, "global_step": 217665, "epoch": 1798} {"train_loss": -41.30622863769531, "global_step": 217666, "epoch": 1798} {"train_loss": -42.26422119140625, "global_step": 217667, "epoch": 1798} {"train_loss": -41.01282501220703, "global_step": 217668, "epoch": 1798} {"train_loss": -41.8428840637207, "global_step": 217669, "epoch": 1798} {"train_loss": -40.91236877441406, "global_step": 217670, "epoch": 1798} {"train_loss": -41.87922286987305, "global_step": 217671, "epoch": 1798} {"train_loss": -42.00564193725586, "global_step": 217672, "epoch": 1798} {"train_loss": -41.672393798828125, "global_step": 217673, "epoch": 1798} {"train_loss": -42.03853988647461, "global_step": 217674, "epoch": 1798} {"train_loss": -41.177371978759766, "global_step": 217675, "epoch": 1798} {"train_loss": -41.500205993652344, "global_step": 217676, "epoch": 1798} {"train_loss": -41.6108283996582, "global_step": 217677, "epoch": 1798} {"train_loss": -40.79763708823968, "global_step": 217678, "epoch": 1798, "val_loss": 2587642.0} {"train_loss": -41.84259033203125, "global_step": 217679, "epoch": 1799} {"train_loss": -42.011959075927734, "global_step": 217680, "epoch": 1799} {"train_loss": -41.61594772338867, "global_step": 217681, "epoch": 1799} {"train_loss": -42.036476135253906, "global_step": 217682, "epoch": 1799} {"train_loss": -42.11613082885742, "global_step": 217683, "epoch": 1799} {"train_loss": -41.61888885498047, "global_step": 217684, "epoch": 1799} {"train_loss": -42.226165771484375, "global_step": 217685, "epoch": 1799} {"train_loss": -42.438629150390625, "global_step": 217686, "epoch": 1799} {"train_loss": -42.429683685302734, "global_step": 217687, "epoch": 1799} {"train_loss": -42.179927825927734, "global_step": 217688, "epoch": 1799} {"train_loss": -42.101470947265625, "global_step": 217689, "epoch": 1799} {"train_loss": -42.01628494262695, "global_step": 217690, "epoch": 1799} {"train_loss": -41.67623519897461, "global_step": 217691, "epoch": 1799} {"train_loss": -42.458065032958984, "global_step": 217692, "epoch": 1799} {"train_loss": -42.2586784362793, "global_step": 217693, "epoch": 1799} {"train_loss": -42.32816696166992, "global_step": 217694, "epoch": 1799} {"train_loss": -40.68647384643555, "global_step": 217695, "epoch": 1799} {"train_loss": -42.09619903564453, "global_step": 217696, "epoch": 1799} {"train_loss": -40.864505767822266, "global_step": 217697, "epoch": 1799} {"train_loss": -40.11379623413086, "global_step": 217698, "epoch": 1799} {"train_loss": -37.632076263427734, "global_step": 217699, "epoch": 1799} {"train_loss": -36.08771514892578, "global_step": 217700, "epoch": 1799} {"train_loss": -37.12070083618164, "global_step": 217701, "epoch": 1799} {"train_loss": -38.88762283325195, "global_step": 217702, "epoch": 1799} {"train_loss": -39.15157699584961, "global_step": 217703, "epoch": 1799} {"train_loss": -36.15170669555664, "global_step": 217704, "epoch": 1799} {"train_loss": -34.404632568359375, "global_step": 217705, "epoch": 1799} {"train_loss": -37.45570755004883, "global_step": 217706, "epoch": 1799} {"train_loss": -40.830322265625, "global_step": 217707, "epoch": 1799} {"train_loss": -38.8383903503418, "global_step": 217708, "epoch": 1799} {"train_loss": -39.32429122924805, "global_step": 217709, "epoch": 1799} {"train_loss": -37.998626708984375, "global_step": 217710, "epoch": 1799} {"train_loss": -40.399654388427734, "global_step": 217711, "epoch": 1799} {"train_loss": -39.54922103881836, "global_step": 217712, "epoch": 1799} {"train_loss": -40.01227951049805, "global_step": 217713, "epoch": 1799} {"train_loss": -39.07822036743164, "global_step": 217714, "epoch": 1799} {"train_loss": -40.05803298950195, "global_step": 217715, "epoch": 1799} {"train_loss": -40.55351257324219, "global_step": 217716, "epoch": 1799} {"train_loss": -39.100852966308594, "global_step": 217717, "epoch": 1799} {"train_loss": -41.4929313659668, "global_step": 217718, "epoch": 1799} {"train_loss": -38.92220687866211, "global_step": 217719, "epoch": 1799} {"train_loss": -40.84455490112305, "global_step": 217720, "epoch": 1799} {"train_loss": -40.250362396240234, "global_step": 217721, "epoch": 1799} {"train_loss": -41.161617279052734, "global_step": 217722, "epoch": 1799} {"train_loss": -39.56560134887695, "global_step": 217723, "epoch": 1799} {"train_loss": -40.92417526245117, "global_step": 217724, "epoch": 1799} {"train_loss": -40.70087432861328, "global_step": 217725, "epoch": 1799} {"train_loss": -40.6141471862793, "global_step": 217726, "epoch": 1799} {"train_loss": -41.330501556396484, "global_step": 217727, "epoch": 1799} {"train_loss": -40.49607467651367, "global_step": 217728, "epoch": 1799} {"train_loss": -41.19979476928711, "global_step": 217729, "epoch": 1799} {"train_loss": -41.51646041870117, "global_step": 217730, "epoch": 1799} {"train_loss": -41.838478088378906, "global_step": 217731, "epoch": 1799} {"train_loss": -41.407161712646484, "global_step": 217732, "epoch": 1799} {"train_loss": -41.646812438964844, "global_step": 217733, "epoch": 1799} {"train_loss": -41.99778366088867, "global_step": 217734, "epoch": 1799} {"train_loss": -42.07094955444336, "global_step": 217735, "epoch": 1799} {"train_loss": -41.443485260009766, "global_step": 217736, "epoch": 1799} {"train_loss": -41.13905334472656, "global_step": 217737, "epoch": 1799} {"train_loss": -41.35845947265625, "global_step": 217738, "epoch": 1799} {"train_loss": -41.8393669128418, "global_step": 217739, "epoch": 1799} {"train_loss": -41.7094841003418, "global_step": 217740, "epoch": 1799} {"train_loss": -41.51777267456055, "global_step": 217741, "epoch": 1799} {"train_loss": -40.987728118896484, "global_step": 217742, "epoch": 1799} {"train_loss": -42.31155014038086, "global_step": 217743, "epoch": 1799} {"train_loss": -42.61845397949219, "global_step": 217744, "epoch": 1799} {"train_loss": -40.18557357788086, "global_step": 217745, "epoch": 1799} {"train_loss": -42.16714859008789, "global_step": 217746, "epoch": 1799} {"train_loss": -41.291690826416016, "global_step": 217747, "epoch": 1799} {"train_loss": -41.71097183227539, "global_step": 217748, "epoch": 1799} {"train_loss": -42.019927978515625, "global_step": 217749, "epoch": 1799} {"train_loss": -42.1990852355957, "global_step": 217750, "epoch": 1799} {"train_loss": -42.35720443725586, "global_step": 217751, "epoch": 1799} {"train_loss": -42.006866455078125, "global_step": 217752, "epoch": 1799} {"train_loss": -42.09858322143555, "global_step": 217753, "epoch": 1799} {"train_loss": -42.2746696472168, "global_step": 217754, "epoch": 1799} {"train_loss": -41.97919845581055, "global_step": 217755, "epoch": 1799} {"train_loss": -41.91238784790039, "global_step": 217756, "epoch": 1799} {"train_loss": -42.58002853393555, "global_step": 217757, "epoch": 1799} {"train_loss": -42.0420036315918, "global_step": 217758, "epoch": 1799} {"train_loss": -41.865966796875, "global_step": 217759, "epoch": 1799} {"train_loss": -41.609230041503906, "global_step": 217760, "epoch": 1799} {"train_loss": -42.14170837402344, "global_step": 217761, "epoch": 1799} {"train_loss": -42.33530044555664, "global_step": 217762, "epoch": 1799} {"train_loss": -41.908931732177734, "global_step": 217763, "epoch": 1799} {"train_loss": -42.265960693359375, "global_step": 217764, "epoch": 1799} {"train_loss": -41.90953826904297, "global_step": 217765, "epoch": 1799} {"train_loss": -42.081390380859375, "global_step": 217766, "epoch": 1799} {"train_loss": -42.176055908203125, "global_step": 217767, "epoch": 1799} {"train_loss": -42.11455154418945, "global_step": 217768, "epoch": 1799} {"train_loss": -41.65021514892578, "global_step": 217769, "epoch": 1799} {"train_loss": -41.72020721435547, "global_step": 217770, "epoch": 1799} {"train_loss": -42.251708984375, "global_step": 217771, "epoch": 1799} {"train_loss": -40.473182678222656, "global_step": 217772, "epoch": 1799} {"train_loss": -41.45899200439453, "global_step": 217773, "epoch": 1799} {"train_loss": -42.37449264526367, "global_step": 217774, "epoch": 1799} {"train_loss": -41.653160095214844, "global_step": 217775, "epoch": 1799} {"train_loss": -41.934810638427734, "global_step": 217776, "epoch": 1799} {"train_loss": -42.30466842651367, "global_step": 217777, "epoch": 1799} {"train_loss": -41.678192138671875, "global_step": 217778, "epoch": 1799} {"train_loss": -42.02424240112305, "global_step": 217779, "epoch": 1799} {"train_loss": -41.69121170043945, "global_step": 217780, "epoch": 1799} {"train_loss": -41.65377426147461, "global_step": 217781, "epoch": 1799} {"train_loss": -42.21399688720703, "global_step": 217782, "epoch": 1799} {"train_loss": -41.28281784057617, "global_step": 217783, "epoch": 1799} {"train_loss": -41.668453216552734, "global_step": 217784, "epoch": 1799} {"train_loss": -40.77437973022461, "global_step": 217785, "epoch": 1799} {"train_loss": -41.26693344116211, "global_step": 217786, "epoch": 1799} {"train_loss": -41.0358772277832, "global_step": 217787, "epoch": 1799} {"train_loss": -42.07062530517578, "global_step": 217788, "epoch": 1799} {"train_loss": -41.29961013793945, "global_step": 217789, "epoch": 1799} {"train_loss": -41.379886627197266, "global_step": 217790, "epoch": 1799} {"train_loss": -41.24419403076172, "global_step": 217791, "epoch": 1799} {"train_loss": -40.93273162841797, "global_step": 217792, "epoch": 1799} {"train_loss": -42.636451721191406, "global_step": 217793, "epoch": 1799} {"train_loss": -41.73218536376953, "global_step": 217794, "epoch": 1799} {"train_loss": -41.18168258666992, "global_step": 217795, "epoch": 1799} {"train_loss": -42.52851486206055, "global_step": 217796, "epoch": 1799} {"train_loss": -40.60911178588867, "global_step": 217797, "epoch": 1799} {"train_loss": -41.03671646118164, "global_step": 217798, "epoch": 1799} {"train_loss": -41.14499948044454, "global_step": 217799, "epoch": 1799, "val_loss": 2694485.0} {"train_loss": -41.321712493896484, "global_step": 217800, "epoch": 1800} {"train_loss": -41.233699798583984, "global_step": 217801, "epoch": 1800} {"train_loss": -41.01459503173828, "global_step": 217802, "epoch": 1800} {"train_loss": -40.88507080078125, "global_step": 217803, "epoch": 1800} {"train_loss": -40.61609649658203, "global_step": 217804, "epoch": 1800} {"train_loss": -41.03037643432617, "global_step": 217805, "epoch": 1800} {"train_loss": -38.874568939208984, "global_step": 217806, "epoch": 1800} {"train_loss": -36.01275634765625, "global_step": 217807, "epoch": 1800} {"train_loss": -31.248737335205078, "global_step": 217808, "epoch": 1800} {"train_loss": -27.464706420898438, "global_step": 217809, "epoch": 1800} {"train_loss": -33.62240219116211, "global_step": 217810, "epoch": 1800} {"train_loss": -39.0943489074707, "global_step": 217811, "epoch": 1800} {"train_loss": -37.49311447143555, "global_step": 217812, "epoch": 1800} {"train_loss": -40.156558990478516, "global_step": 217813, "epoch": 1800} {"train_loss": -37.26961898803711, "global_step": 217814, "epoch": 1800} {"train_loss": -37.9854621887207, "global_step": 217815, "epoch": 1800} {"train_loss": -40.286678314208984, "global_step": 217816, "epoch": 1800} {"train_loss": -37.2340087890625, "global_step": 217817, "epoch": 1800} {"train_loss": -37.793663024902344, "global_step": 217818, "epoch": 1800} {"train_loss": -40.94370651245117, "global_step": 217819, "epoch": 1800} {"train_loss": -36.658966064453125, "global_step": 217820, "epoch": 1800} {"train_loss": -39.419166564941406, "global_step": 217821, "epoch": 1800} {"train_loss": -39.64495086669922, "global_step": 217822, "epoch": 1800} {"train_loss": -38.02260971069336, "global_step": 217823, "epoch": 1800} {"train_loss": -39.76240921020508, "global_step": 217824, "epoch": 1800} {"train_loss": -38.51861572265625, "global_step": 217825, "epoch": 1800} {"train_loss": -39.028846740722656, "global_step": 217826, "epoch": 1800} {"train_loss": -39.79226303100586, "global_step": 217827, "epoch": 1800} {"train_loss": -37.22772979736328, "global_step": 217828, "epoch": 1800} {"train_loss": -40.389244079589844, "global_step": 217829, "epoch": 1800} {"train_loss": -40.093929290771484, "global_step": 217830, "epoch": 1800} {"train_loss": -39.897701263427734, "global_step": 217831, "epoch": 1800} {"train_loss": -40.94355392456055, "global_step": 217832, "epoch": 1800} {"train_loss": -40.084049224853516, "global_step": 217833, "epoch": 1800} {"train_loss": -40.96467971801758, "global_step": 217834, "epoch": 1800} {"train_loss": -41.4515380859375, "global_step": 217835, "epoch": 1800} {"train_loss": -40.702632904052734, "global_step": 217836, "epoch": 1800} {"train_loss": -41.56913375854492, "global_step": 217837, "epoch": 1800} {"train_loss": -40.841461181640625, "global_step": 217838, "epoch": 1800} {"train_loss": -41.418331146240234, "global_step": 217839, "epoch": 1800} {"train_loss": -42.136199951171875, "global_step": 217840, "epoch": 1800} {"train_loss": -41.189971923828125, "global_step": 217841, "epoch": 1800} {"train_loss": -42.29464340209961, "global_step": 217842, "epoch": 1800} {"train_loss": -41.16209030151367, "global_step": 217843, "epoch": 1800} {"train_loss": -41.1701545715332, "global_step": 217844, "epoch": 1800} {"train_loss": -41.63093948364258, "global_step": 217845, "epoch": 1800} {"train_loss": -41.6551628112793, "global_step": 217846, "epoch": 1800} {"train_loss": -41.832618713378906, "global_step": 217847, "epoch": 1800} {"train_loss": -41.56908416748047, "global_step": 217848, "epoch": 1800} {"train_loss": -42.045074462890625, "global_step": 217849, "epoch": 1800} {"train_loss": -41.128265380859375, "global_step": 217850, "epoch": 1800} {"train_loss": -41.37413787841797, "global_step": 217851, "epoch": 1800} {"train_loss": -41.144649505615234, "global_step": 217852, "epoch": 1800} {"train_loss": -41.88259506225586, "global_step": 217853, "epoch": 1800} {"train_loss": -41.44270706176758, "global_step": 217854, "epoch": 1800} {"train_loss": -41.59955596923828, "global_step": 217855, "epoch": 1800} {"train_loss": -40.37568664550781, "global_step": 217856, "epoch": 1800} {"train_loss": -41.671260833740234, "global_step": 217857, "epoch": 1800} {"train_loss": -41.70962905883789, "global_step": 217858, "epoch": 1800} {"train_loss": -41.87291717529297, "global_step": 217859, "epoch": 1800} {"train_loss": -42.065330505371094, "global_step": 217860, "epoch": 1800} {"train_loss": -42.03286361694336, "global_step": 217861, "epoch": 1800} {"train_loss": -42.471099853515625, "global_step": 217862, "epoch": 1800} {"train_loss": -41.66228103637695, "global_step": 217863, "epoch": 1800} {"train_loss": -42.397911071777344, "global_step": 217864, "epoch": 1800} {"train_loss": -41.77372360229492, "global_step": 217865, "epoch": 1800} {"train_loss": -41.9830322265625, "global_step": 217866, "epoch": 1800} {"train_loss": -41.88916778564453, "global_step": 217867, "epoch": 1800} {"train_loss": -41.5891227722168, "global_step": 217868, "epoch": 1800} {"train_loss": -42.430641174316406, "global_step": 217869, "epoch": 1800} {"train_loss": -42.03152847290039, "global_step": 217870, "epoch": 1800} {"train_loss": -42.222686767578125, "global_step": 217871, "epoch": 1800} {"train_loss": -41.90652084350586, "global_step": 217872, "epoch": 1800} {"train_loss": -42.35401153564453, "global_step": 217873, "epoch": 1800} {"train_loss": -42.338436126708984, "global_step": 217874, "epoch": 1800} {"train_loss": -42.381263732910156, "global_step": 217875, "epoch": 1800} {"train_loss": -42.16402816772461, "global_step": 217876, "epoch": 1800} {"train_loss": -41.10850143432617, "global_step": 217877, "epoch": 1800} {"train_loss": -42.54339599609375, "global_step": 217878, "epoch": 1800} {"train_loss": -41.02979278564453, "global_step": 217879, "epoch": 1800} {"train_loss": -41.86407470703125, "global_step": 217880, "epoch": 1800} {"train_loss": -42.68679428100586, "global_step": 217881, "epoch": 1800} {"train_loss": -42.07184982299805, "global_step": 217882, "epoch": 1800} {"train_loss": -42.55447006225586, "global_step": 217883, "epoch": 1800} {"train_loss": -42.32952117919922, "global_step": 217884, "epoch": 1800} {"train_loss": -42.3868293762207, "global_step": 217885, "epoch": 1800} {"train_loss": -42.115848541259766, "global_step": 217886, "epoch": 1800} {"train_loss": -42.429073333740234, "global_step": 217887, "epoch": 1800} {"train_loss": -42.62907028198242, "global_step": 217888, "epoch": 1800} {"train_loss": -38.85889434814453, "global_step": 217889, "epoch": 1800} {"train_loss": -42.71097946166992, "global_step": 217890, "epoch": 1800} {"train_loss": -41.8480224609375, "global_step": 217891, "epoch": 1800} {"train_loss": -42.502864837646484, "global_step": 217892, "epoch": 1800} {"train_loss": -42.78013229370117, "global_step": 217893, "epoch": 1800} {"train_loss": -42.24851608276367, "global_step": 217894, "epoch": 1800} {"train_loss": -42.02105712890625, "global_step": 217895, "epoch": 1800} {"train_loss": -41.96192169189453, "global_step": 217896, "epoch": 1800} {"train_loss": -42.205989837646484, "global_step": 217897, "epoch": 1800} {"train_loss": -41.82944107055664, "global_step": 217898, "epoch": 1800} {"train_loss": -41.842613220214844, "global_step": 217899, "epoch": 1800} {"train_loss": -42.46791458129883, "global_step": 217900, "epoch": 1800} {"train_loss": -42.31009292602539, "global_step": 217901, "epoch": 1800} {"train_loss": -41.59881591796875, "global_step": 217902, "epoch": 1800} {"train_loss": -42.35897445678711, "global_step": 217903, "epoch": 1800} {"train_loss": -41.71241760253906, "global_step": 217904, "epoch": 1800} {"train_loss": -42.4415397644043, "global_step": 217905, "epoch": 1800} {"train_loss": -42.14982223510742, "global_step": 217906, "epoch": 1800} {"train_loss": -41.692527770996094, "global_step": 217907, "epoch": 1800} {"train_loss": -42.12245559692383, "global_step": 217908, "epoch": 1800} {"train_loss": -42.778656005859375, "global_step": 217909, "epoch": 1800} {"train_loss": -42.47968673706055, "global_step": 217910, "epoch": 1800} {"train_loss": -41.10995864868164, "global_step": 217911, "epoch": 1800} {"train_loss": -41.39008712768555, "global_step": 217912, "epoch": 1800} {"train_loss": -42.044769287109375, "global_step": 217913, "epoch": 1800} {"train_loss": -42.73566818237305, "global_step": 217914, "epoch": 1800} {"train_loss": -41.6578369140625, "global_step": 217915, "epoch": 1800} {"train_loss": -42.02971649169922, "global_step": 217916, "epoch": 1800} {"train_loss": -41.576683044433594, "global_step": 217917, "epoch": 1800} {"train_loss": -42.853919982910156, "global_step": 217918, "epoch": 1800} {"train_loss": -40.833740234375, "global_step": 217919, "epoch": 1800} {"train_loss": -40.94309392251259, "global_step": 217920, "epoch": 1800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2660589.75} {"train_loss": -42.17322540283203, "global_step": 217921, "epoch": 1801} {"train_loss": -40.48768615722656, "global_step": 217922, "epoch": 1801} {"train_loss": -41.98748016357422, "global_step": 217923, "epoch": 1801} {"train_loss": -42.40726852416992, "global_step": 217924, "epoch": 1801} {"train_loss": -42.06048583984375, "global_step": 217925, "epoch": 1801} {"train_loss": -40.87644577026367, "global_step": 217926, "epoch": 1801} {"train_loss": -42.19367599487305, "global_step": 217927, "epoch": 1801} {"train_loss": -42.0780029296875, "global_step": 217928, "epoch": 1801} {"train_loss": -41.70573043823242, "global_step": 217929, "epoch": 1801} {"train_loss": -40.17954635620117, "global_step": 217930, "epoch": 1801} {"train_loss": -42.179290771484375, "global_step": 217931, "epoch": 1801} {"train_loss": -40.642452239990234, "global_step": 217932, "epoch": 1801} {"train_loss": -41.39634704589844, "global_step": 217933, "epoch": 1801} {"train_loss": -41.544586181640625, "global_step": 217934, "epoch": 1801} {"train_loss": -41.69767379760742, "global_step": 217935, "epoch": 1801} {"train_loss": -41.4823112487793, "global_step": 217936, "epoch": 1801} {"train_loss": -40.843196868896484, "global_step": 217937, "epoch": 1801} {"train_loss": -42.22353744506836, "global_step": 217938, "epoch": 1801} {"train_loss": -41.79807662963867, "global_step": 217939, "epoch": 1801} {"train_loss": -41.795631408691406, "global_step": 217940, "epoch": 1801} {"train_loss": -38.076866149902344, "global_step": 217941, "epoch": 1801} {"train_loss": -40.916629791259766, "global_step": 217942, "epoch": 1801} {"train_loss": -41.28799057006836, "global_step": 217943, "epoch": 1801} {"train_loss": -41.21342086791992, "global_step": 217944, "epoch": 1801} {"train_loss": -41.52354049682617, "global_step": 217945, "epoch": 1801} {"train_loss": -41.450904846191406, "global_step": 217946, "epoch": 1801} {"train_loss": -41.90042495727539, "global_step": 217947, "epoch": 1801} {"train_loss": -41.25600051879883, "global_step": 217948, "epoch": 1801} {"train_loss": -42.179656982421875, "global_step": 217949, "epoch": 1801} {"train_loss": -41.77090072631836, "global_step": 217950, "epoch": 1801} {"train_loss": -41.59115219116211, "global_step": 217951, "epoch": 1801} {"train_loss": -41.171451568603516, "global_step": 217952, "epoch": 1801} {"train_loss": -41.7526969909668, "global_step": 217953, "epoch": 1801} {"train_loss": -42.195030212402344, "global_step": 217954, "epoch": 1801} {"train_loss": -40.678768157958984, "global_step": 217955, "epoch": 1801} {"train_loss": -41.8758430480957, "global_step": 217956, "epoch": 1801} {"train_loss": -41.654396057128906, "global_step": 217957, "epoch": 1801} {"train_loss": -41.13010025024414, "global_step": 217958, "epoch": 1801} {"train_loss": -41.43799591064453, "global_step": 217959, "epoch": 1801} {"train_loss": -41.712154388427734, "global_step": 217960, "epoch": 1801} {"train_loss": -40.25556182861328, "global_step": 217961, "epoch": 1801} {"train_loss": -39.88605880737305, "global_step": 217962, "epoch": 1801} {"train_loss": -39.688255310058594, "global_step": 217963, "epoch": 1801} {"train_loss": -40.56307601928711, "global_step": 217964, "epoch": 1801} {"train_loss": -42.565589904785156, "global_step": 217965, "epoch": 1801} {"train_loss": -41.668800354003906, "global_step": 217966, "epoch": 1801} {"train_loss": -39.7459831237793, "global_step": 217967, "epoch": 1801} {"train_loss": -41.079811096191406, "global_step": 217968, "epoch": 1801} {"train_loss": -41.25273895263672, "global_step": 217969, "epoch": 1801} {"train_loss": -40.38621139526367, "global_step": 217970, "epoch": 1801} {"train_loss": -41.948848724365234, "global_step": 217971, "epoch": 1801} {"train_loss": -40.900733947753906, "global_step": 217972, "epoch": 1801} {"train_loss": -40.04645538330078, "global_step": 217973, "epoch": 1801} {"train_loss": -40.767127990722656, "global_step": 217974, "epoch": 1801} {"train_loss": -41.9726448059082, "global_step": 217975, "epoch": 1801} {"train_loss": -39.977027893066406, "global_step": 217976, "epoch": 1801} {"train_loss": -38.57268142700195, "global_step": 217977, "epoch": 1801} {"train_loss": -39.83108901977539, "global_step": 217978, "epoch": 1801} {"train_loss": -41.9746208190918, "global_step": 217979, "epoch": 1801} {"train_loss": -41.310401916503906, "global_step": 217980, "epoch": 1801} {"train_loss": -40.882015228271484, "global_step": 217981, "epoch": 1801} {"train_loss": -42.11654281616211, "global_step": 217982, "epoch": 1801} {"train_loss": -42.07966995239258, "global_step": 217983, "epoch": 1801} {"train_loss": -42.94306182861328, "global_step": 217984, "epoch": 1801} {"train_loss": -42.24599075317383, "global_step": 217985, "epoch": 1801} {"train_loss": -42.44108581542969, "global_step": 217986, "epoch": 1801} {"train_loss": -42.54485321044922, "global_step": 217987, "epoch": 1801} {"train_loss": -41.941097259521484, "global_step": 217988, "epoch": 1801} {"train_loss": -42.2437629699707, "global_step": 217989, "epoch": 1801} {"train_loss": -41.284420013427734, "global_step": 217990, "epoch": 1801} {"train_loss": -42.06966781616211, "global_step": 217991, "epoch": 1801} {"train_loss": -40.86359786987305, "global_step": 217992, "epoch": 1801} {"train_loss": -42.23629379272461, "global_step": 217993, "epoch": 1801} {"train_loss": -41.71683883666992, "global_step": 217994, "epoch": 1801} {"train_loss": -41.96426010131836, "global_step": 217995, "epoch": 1801} {"train_loss": -42.130733489990234, "global_step": 217996, "epoch": 1801} {"train_loss": -40.823158264160156, "global_step": 217997, "epoch": 1801} {"train_loss": -42.09580993652344, "global_step": 217998, "epoch": 1801} {"train_loss": -42.55508041381836, "global_step": 217999, "epoch": 1801} {"train_loss": -42.0200080871582, "global_step": 218000, "epoch": 1801} {"train_loss": -42.105587005615234, "global_step": 218001, "epoch": 1801} {"train_loss": -42.4001579284668, "global_step": 218002, "epoch": 1801} {"train_loss": -42.42069625854492, "global_step": 218003, "epoch": 1801} {"train_loss": -42.67840576171875, "global_step": 218004, "epoch": 1801} {"train_loss": -42.039127349853516, "global_step": 218005, "epoch": 1801} {"train_loss": -42.109310150146484, "global_step": 218006, "epoch": 1801} {"train_loss": -41.952693939208984, "global_step": 218007, "epoch": 1801} {"train_loss": -41.718143463134766, "global_step": 218008, "epoch": 1801} {"train_loss": -41.016143798828125, "global_step": 218009, "epoch": 1801} {"train_loss": -42.078468322753906, "global_step": 218010, "epoch": 1801} {"train_loss": -41.01209259033203, "global_step": 218011, "epoch": 1801} {"train_loss": -42.396663665771484, "global_step": 218012, "epoch": 1801} {"train_loss": -40.24644088745117, "global_step": 218013, "epoch": 1801} {"train_loss": -42.00340270996094, "global_step": 218014, "epoch": 1801} {"train_loss": -37.69118118286133, "global_step": 218015, "epoch": 1801} {"train_loss": -41.34853744506836, "global_step": 218016, "epoch": 1801} {"train_loss": -40.574378967285156, "global_step": 218017, "epoch": 1801} {"train_loss": -39.49064254760742, "global_step": 218018, "epoch": 1801} {"train_loss": -36.627933502197266, "global_step": 218019, "epoch": 1801} {"train_loss": -42.0496826171875, "global_step": 218020, "epoch": 1801} {"train_loss": -40.99617385864258, "global_step": 218021, "epoch": 1801} {"train_loss": -40.49969482421875, "global_step": 218022, "epoch": 1801} {"train_loss": -39.06604766845703, "global_step": 218023, "epoch": 1801} {"train_loss": -39.975433349609375, "global_step": 218024, "epoch": 1801} {"train_loss": -39.80533981323242, "global_step": 218025, "epoch": 1801} {"train_loss": -35.149757385253906, "global_step": 218026, "epoch": 1801} {"train_loss": -39.065284729003906, "global_step": 218027, "epoch": 1801} {"train_loss": -39.04144287109375, "global_step": 218028, "epoch": 1801} {"train_loss": -38.2547492980957, "global_step": 218029, "epoch": 1801} {"train_loss": -36.077369689941406, "global_step": 218030, "epoch": 1801} {"train_loss": -40.191917419433594, "global_step": 218031, "epoch": 1801} {"train_loss": -36.9796257019043, "global_step": 218032, "epoch": 1801} {"train_loss": -37.736297607421875, "global_step": 218033, "epoch": 1801} {"train_loss": -40.30170822143555, "global_step": 218034, "epoch": 1801} {"train_loss": -38.80318832397461, "global_step": 218035, "epoch": 1801} {"train_loss": -39.24620056152344, "global_step": 218036, "epoch": 1801} {"train_loss": -36.21669006347656, "global_step": 218037, "epoch": 1801} {"train_loss": -39.55471420288086, "global_step": 218038, "epoch": 1801} {"train_loss": -38.22340393066406, "global_step": 218039, "epoch": 1801} {"train_loss": -39.494140625, "global_step": 218040, "epoch": 1801} {"train_loss": -40.917086230821845, "global_step": 218041, "epoch": 1801, "val_loss": 2719616.75} {"train_loss": -38.95363235473633, "global_step": 218042, "epoch": 1802} {"train_loss": -39.59864044189453, "global_step": 218043, "epoch": 1802} {"train_loss": -41.178829193115234, "global_step": 218044, "epoch": 1802} {"train_loss": -40.73523712158203, "global_step": 218045, "epoch": 1802} {"train_loss": -40.435081481933594, "global_step": 218046, "epoch": 1802} {"train_loss": -41.18367004394531, "global_step": 218047, "epoch": 1802} {"train_loss": -40.811065673828125, "global_step": 218048, "epoch": 1802} {"train_loss": -41.00954818725586, "global_step": 218049, "epoch": 1802} {"train_loss": -41.313716888427734, "global_step": 218050, "epoch": 1802} {"train_loss": -41.095123291015625, "global_step": 218051, "epoch": 1802} {"train_loss": -40.87866973876953, "global_step": 218052, "epoch": 1802} {"train_loss": -41.54631423950195, "global_step": 218053, "epoch": 1802} {"train_loss": -41.25410842895508, "global_step": 218054, "epoch": 1802} {"train_loss": -41.728126525878906, "global_step": 218055, "epoch": 1802} {"train_loss": -40.42701721191406, "global_step": 218056, "epoch": 1802} {"train_loss": -42.01670455932617, "global_step": 218057, "epoch": 1802} {"train_loss": -41.77458572387695, "global_step": 218058, "epoch": 1802} {"train_loss": -41.840492248535156, "global_step": 218059, "epoch": 1802} {"train_loss": -42.22420883178711, "global_step": 218060, "epoch": 1802} {"train_loss": -42.076271057128906, "global_step": 218061, "epoch": 1802} {"train_loss": -41.422340393066406, "global_step": 218062, "epoch": 1802} {"train_loss": -40.5076904296875, "global_step": 218063, "epoch": 1802} {"train_loss": -41.177406311035156, "global_step": 218064, "epoch": 1802} {"train_loss": -41.11338424682617, "global_step": 218065, "epoch": 1802} {"train_loss": -41.87632369995117, "global_step": 218066, "epoch": 1802} {"train_loss": -41.14957809448242, "global_step": 218067, "epoch": 1802} {"train_loss": -42.224430084228516, "global_step": 218068, "epoch": 1802} {"train_loss": -40.79159164428711, "global_step": 218069, "epoch": 1802} {"train_loss": -40.99630355834961, "global_step": 218070, "epoch": 1802} {"train_loss": -42.43827438354492, "global_step": 218071, "epoch": 1802} {"train_loss": -42.27891159057617, "global_step": 218072, "epoch": 1802} {"train_loss": -42.30134201049805, "global_step": 218073, "epoch": 1802} {"train_loss": -41.83942794799805, "global_step": 218074, "epoch": 1802} {"train_loss": -42.14759063720703, "global_step": 218075, "epoch": 1802} {"train_loss": -41.71253204345703, "global_step": 218076, "epoch": 1802} {"train_loss": -42.45428466796875, "global_step": 218077, "epoch": 1802} {"train_loss": -42.5695915222168, "global_step": 218078, "epoch": 1802} {"train_loss": -42.013275146484375, "global_step": 218079, "epoch": 1802} {"train_loss": -42.864437103271484, "global_step": 218080, "epoch": 1802} {"train_loss": -42.181434631347656, "global_step": 218081, "epoch": 1802} {"train_loss": -42.232147216796875, "global_step": 218082, "epoch": 1802} {"train_loss": -42.18258285522461, "global_step": 218083, "epoch": 1802} {"train_loss": -41.92700958251953, "global_step": 218084, "epoch": 1802} {"train_loss": -42.11228561401367, "global_step": 218085, "epoch": 1802} {"train_loss": -41.80036544799805, "global_step": 218086, "epoch": 1802} {"train_loss": -42.22392654418945, "global_step": 218087, "epoch": 1802} {"train_loss": -42.78843307495117, "global_step": 218088, "epoch": 1802} {"train_loss": -42.51839828491211, "global_step": 218089, "epoch": 1802} {"train_loss": -42.96211242675781, "global_step": 218090, "epoch": 1802} {"train_loss": -42.50677490234375, "global_step": 218091, "epoch": 1802} {"train_loss": -42.251644134521484, "global_step": 218092, "epoch": 1802} {"train_loss": -42.67389678955078, "global_step": 218093, "epoch": 1802} {"train_loss": -42.52048110961914, "global_step": 218094, "epoch": 1802} {"train_loss": -42.690948486328125, "global_step": 218095, "epoch": 1802} {"train_loss": -42.08065414428711, "global_step": 218096, "epoch": 1802} {"train_loss": -42.820098876953125, "global_step": 218097, "epoch": 1802} {"train_loss": -42.428627014160156, "global_step": 218098, "epoch": 1802} {"train_loss": -41.896812438964844, "global_step": 218099, "epoch": 1802} {"train_loss": -42.827205657958984, "global_step": 218100, "epoch": 1802} {"train_loss": -42.31074142456055, "global_step": 218101, "epoch": 1802} {"train_loss": -42.37628936767578, "global_step": 218102, "epoch": 1802} {"train_loss": -42.526119232177734, "global_step": 218103, "epoch": 1802} {"train_loss": -42.83644485473633, "global_step": 218104, "epoch": 1802} {"train_loss": -41.80439758300781, "global_step": 218105, "epoch": 1802} {"train_loss": -42.8404655456543, "global_step": 218106, "epoch": 1802} {"train_loss": -42.904598236083984, "global_step": 218107, "epoch": 1802} {"train_loss": -42.45166015625, "global_step": 218108, "epoch": 1802} {"train_loss": -41.829524993896484, "global_step": 218109, "epoch": 1802} {"train_loss": -42.91856384277344, "global_step": 218110, "epoch": 1802} {"train_loss": -42.9520378112793, "global_step": 218111, "epoch": 1802} {"train_loss": -40.92584991455078, "global_step": 218112, "epoch": 1802} {"train_loss": -40.45085906982422, "global_step": 218113, "epoch": 1802} {"train_loss": -41.374481201171875, "global_step": 218114, "epoch": 1802} {"train_loss": -42.244171142578125, "global_step": 218115, "epoch": 1802} {"train_loss": -42.62675094604492, "global_step": 218116, "epoch": 1802} {"train_loss": -40.85575485229492, "global_step": 218117, "epoch": 1802} {"train_loss": -41.6171875, "global_step": 218118, "epoch": 1802} {"train_loss": -41.504859924316406, "global_step": 218119, "epoch": 1802} {"train_loss": -42.252498626708984, "global_step": 218120, "epoch": 1802} {"train_loss": -41.02009201049805, "global_step": 218121, "epoch": 1802} {"train_loss": -40.6407356262207, "global_step": 218122, "epoch": 1802} {"train_loss": -41.45389938354492, "global_step": 218123, "epoch": 1802} {"train_loss": -42.531829833984375, "global_step": 218124, "epoch": 1802} {"train_loss": -41.6616096496582, "global_step": 218125, "epoch": 1802} {"train_loss": -41.14713668823242, "global_step": 218126, "epoch": 1802} {"train_loss": -42.40006637573242, "global_step": 218127, "epoch": 1802} {"train_loss": -42.165687561035156, "global_step": 218128, "epoch": 1802} {"train_loss": -39.611122131347656, "global_step": 218129, "epoch": 1802} {"train_loss": -39.82866668701172, "global_step": 218130, "epoch": 1802} {"train_loss": -37.16626739501953, "global_step": 218131, "epoch": 1802} {"train_loss": -42.00969314575195, "global_step": 218132, "epoch": 1802} {"train_loss": -40.5245246887207, "global_step": 218133, "epoch": 1802} {"train_loss": -40.21668243408203, "global_step": 218134, "epoch": 1802} {"train_loss": -42.0704460144043, "global_step": 218135, "epoch": 1802} {"train_loss": -40.41603469848633, "global_step": 218136, "epoch": 1802} {"train_loss": -40.720333099365234, "global_step": 218137, "epoch": 1802} {"train_loss": -40.39821243286133, "global_step": 218138, "epoch": 1802} {"train_loss": -40.43433380126953, "global_step": 218139, "epoch": 1802} {"train_loss": -40.03080368041992, "global_step": 218140, "epoch": 1802} {"train_loss": -39.48445129394531, "global_step": 218141, "epoch": 1802} {"train_loss": -40.33929443359375, "global_step": 218142, "epoch": 1802} {"train_loss": -39.81919860839844, "global_step": 218143, "epoch": 1802} {"train_loss": -40.01334762573242, "global_step": 218144, "epoch": 1802} {"train_loss": -40.933807373046875, "global_step": 218145, "epoch": 1802} {"train_loss": -41.8131217956543, "global_step": 218146, "epoch": 1802} {"train_loss": -40.56318283081055, "global_step": 218147, "epoch": 1802} {"train_loss": -41.351009368896484, "global_step": 218148, "epoch": 1802} {"train_loss": -41.67718505859375, "global_step": 218149, "epoch": 1802} {"train_loss": -41.59605026245117, "global_step": 218150, "epoch": 1802} {"train_loss": -41.20200729370117, "global_step": 218151, "epoch": 1802} {"train_loss": -41.251930236816406, "global_step": 218152, "epoch": 1802} {"train_loss": -41.6540641784668, "global_step": 218153, "epoch": 1802} {"train_loss": -40.813262939453125, "global_step": 218154, "epoch": 1802} {"train_loss": -40.7785758972168, "global_step": 218155, "epoch": 1802} {"train_loss": -40.09455871582031, "global_step": 218156, "epoch": 1802} {"train_loss": -41.75381851196289, "global_step": 218157, "epoch": 1802} {"train_loss": -40.66865158081055, "global_step": 218158, "epoch": 1802} {"train_loss": -41.03651428222656, "global_step": 218159, "epoch": 1802} {"train_loss": -41.09711837768555, "global_step": 218160, "epoch": 1802} {"train_loss": -40.28515625, "global_step": 218161, "epoch": 1802} {"train_loss": -41.48878791115501, "global_step": 218162, "epoch": 1802, "val_loss": 2692066.75} {"train_loss": -41.1717643737793, "global_step": 218163, "epoch": 1803} {"train_loss": -40.294673919677734, "global_step": 218164, "epoch": 1803} {"train_loss": -40.80666732788086, "global_step": 218165, "epoch": 1803} {"train_loss": -40.06684494018555, "global_step": 218166, "epoch": 1803} {"train_loss": -41.128662109375, "global_step": 218167, "epoch": 1803} {"train_loss": -41.355716705322266, "global_step": 218168, "epoch": 1803} {"train_loss": -41.85566329956055, "global_step": 218169, "epoch": 1803} {"train_loss": -41.91719436645508, "global_step": 218170, "epoch": 1803} {"train_loss": -41.4326286315918, "global_step": 218171, "epoch": 1803} {"train_loss": -39.52278137207031, "global_step": 218172, "epoch": 1803} {"train_loss": -41.976158142089844, "global_step": 218173, "epoch": 1803} {"train_loss": -41.381282806396484, "global_step": 218174, "epoch": 1803} {"train_loss": -40.636226654052734, "global_step": 218175, "epoch": 1803} {"train_loss": -40.503353118896484, "global_step": 218176, "epoch": 1803} {"train_loss": -41.51188278198242, "global_step": 218177, "epoch": 1803} {"train_loss": -40.791927337646484, "global_step": 218178, "epoch": 1803} {"train_loss": -41.359954833984375, "global_step": 218179, "epoch": 1803} {"train_loss": -42.34853744506836, "global_step": 218180, "epoch": 1803} {"train_loss": -40.754085540771484, "global_step": 218181, "epoch": 1803} {"train_loss": -38.83830642700195, "global_step": 218182, "epoch": 1803} {"train_loss": -39.826534271240234, "global_step": 218183, "epoch": 1803} {"train_loss": -41.38040542602539, "global_step": 218184, "epoch": 1803} {"train_loss": -40.78425216674805, "global_step": 218185, "epoch": 1803} {"train_loss": -41.559627532958984, "global_step": 218186, "epoch": 1803} {"train_loss": -40.007781982421875, "global_step": 218187, "epoch": 1803} {"train_loss": -41.27815628051758, "global_step": 218188, "epoch": 1803} {"train_loss": -42.184722900390625, "global_step": 218189, "epoch": 1803} {"train_loss": -41.45260238647461, "global_step": 218190, "epoch": 1803} {"train_loss": -41.60742950439453, "global_step": 218191, "epoch": 1803} {"train_loss": -39.19691848754883, "global_step": 218192, "epoch": 1803} {"train_loss": -40.795188903808594, "global_step": 218193, "epoch": 1803} {"train_loss": -41.878883361816406, "global_step": 218194, "epoch": 1803} {"train_loss": -39.92139434814453, "global_step": 218195, "epoch": 1803} {"train_loss": -41.61857223510742, "global_step": 218196, "epoch": 1803} {"train_loss": -40.123924255371094, "global_step": 218197, "epoch": 1803} {"train_loss": -41.240196228027344, "global_step": 218198, "epoch": 1803} {"train_loss": -41.942054748535156, "global_step": 218199, "epoch": 1803} {"train_loss": -41.396236419677734, "global_step": 218200, "epoch": 1803} {"train_loss": -35.36701583862305, "global_step": 218201, "epoch": 1803} {"train_loss": -31.89875602722168, "global_step": 218202, "epoch": 1803} {"train_loss": -40.245094299316406, "global_step": 218203, "epoch": 1803} {"train_loss": -40.9769401550293, "global_step": 218204, "epoch": 1803} {"train_loss": -40.550758361816406, "global_step": 218205, "epoch": 1803} {"train_loss": -40.34555435180664, "global_step": 218206, "epoch": 1803} {"train_loss": -39.64494323730469, "global_step": 218207, "epoch": 1803} {"train_loss": -34.824501037597656, "global_step": 218208, "epoch": 1803} {"train_loss": -26.8602352142334, "global_step": 218209, "epoch": 1803} {"train_loss": -37.55961990356445, "global_step": 218210, "epoch": 1803} {"train_loss": -39.866058349609375, "global_step": 218211, "epoch": 1803} {"train_loss": -34.181617736816406, "global_step": 218212, "epoch": 1803} {"train_loss": -13.155047416687012, "global_step": 218213, "epoch": 1803} {"train_loss": -34.4738883972168, "global_step": 218214, "epoch": 1803} {"train_loss": -37.05595779418945, "global_step": 218215, "epoch": 1803} {"train_loss": -37.60844802856445, "global_step": 218216, "epoch": 1803} {"train_loss": -36.67255783081055, "global_step": 218217, "epoch": 1803} {"train_loss": -33.40242385864258, "global_step": 218218, "epoch": 1803} {"train_loss": -34.522987365722656, "global_step": 218219, "epoch": 1803} {"train_loss": -32.48476791381836, "global_step": 218220, "epoch": 1803} {"train_loss": -36.555694580078125, "global_step": 218221, "epoch": 1803} {"train_loss": -35.299922943115234, "global_step": 218222, "epoch": 1803} {"train_loss": -38.118377685546875, "global_step": 218223, "epoch": 1803} {"train_loss": -33.25638961791992, "global_step": 218224, "epoch": 1803} {"train_loss": -36.36007308959961, "global_step": 218225, "epoch": 1803} {"train_loss": -35.94092559814453, "global_step": 218226, "epoch": 1803} {"train_loss": -38.01951217651367, "global_step": 218227, "epoch": 1803} {"train_loss": -36.98260498046875, "global_step": 218228, "epoch": 1803} {"train_loss": -37.56671905517578, "global_step": 218229, "epoch": 1803} {"train_loss": -36.172725677490234, "global_step": 218230, "epoch": 1803} {"train_loss": -38.874488830566406, "global_step": 218231, "epoch": 1803} {"train_loss": -34.737178802490234, "global_step": 218232, "epoch": 1803} {"train_loss": -38.91495895385742, "global_step": 218233, "epoch": 1803} {"train_loss": -34.69028854370117, "global_step": 218234, "epoch": 1803} {"train_loss": -38.506446838378906, "global_step": 218235, "epoch": 1803} {"train_loss": -37.19552993774414, "global_step": 218236, "epoch": 1803} {"train_loss": -37.84613037109375, "global_step": 218237, "epoch": 1803} {"train_loss": -37.31437683105469, "global_step": 218238, "epoch": 1803} {"train_loss": -38.03976058959961, "global_step": 218239, "epoch": 1803} {"train_loss": -36.01679229736328, "global_step": 218240, "epoch": 1803} {"train_loss": -38.00279235839844, "global_step": 218241, "epoch": 1803} {"train_loss": -38.75759506225586, "global_step": 218242, "epoch": 1803} {"train_loss": -37.96242904663086, "global_step": 218243, "epoch": 1803} {"train_loss": -37.2639274597168, "global_step": 218244, "epoch": 1803} {"train_loss": -39.25168228149414, "global_step": 218245, "epoch": 1803} {"train_loss": -39.023406982421875, "global_step": 218246, "epoch": 1803} {"train_loss": -38.252140045166016, "global_step": 218247, "epoch": 1803} {"train_loss": -39.66305160522461, "global_step": 218248, "epoch": 1803} {"train_loss": -38.918704986572266, "global_step": 218249, "epoch": 1803} {"train_loss": -39.69293212890625, "global_step": 218250, "epoch": 1803} {"train_loss": -40.23110580444336, "global_step": 218251, "epoch": 1803} {"train_loss": -38.282894134521484, "global_step": 218252, "epoch": 1803} {"train_loss": -39.3547477722168, "global_step": 218253, "epoch": 1803} {"train_loss": -40.60886764526367, "global_step": 218254, "epoch": 1803} {"train_loss": -37.93397903442383, "global_step": 218255, "epoch": 1803} {"train_loss": -39.983009338378906, "global_step": 218256, "epoch": 1803} {"train_loss": -39.91550827026367, "global_step": 218257, "epoch": 1803} {"train_loss": -39.3489990234375, "global_step": 218258, "epoch": 1803} {"train_loss": -39.72747802734375, "global_step": 218259, "epoch": 1803} {"train_loss": -40.27321243286133, "global_step": 218260, "epoch": 1803} {"train_loss": -39.778743743896484, "global_step": 218261, "epoch": 1803} {"train_loss": -39.76194763183594, "global_step": 218262, "epoch": 1803} {"train_loss": -38.937618255615234, "global_step": 218263, "epoch": 1803} {"train_loss": -38.78628158569336, "global_step": 218264, "epoch": 1803} {"train_loss": -40.336273193359375, "global_step": 218265, "epoch": 1803} {"train_loss": -38.9284782409668, "global_step": 218266, "epoch": 1803} {"train_loss": -40.25796127319336, "global_step": 218267, "epoch": 1803} {"train_loss": -39.42909240722656, "global_step": 218268, "epoch": 1803} {"train_loss": -39.792625427246094, "global_step": 218269, "epoch": 1803} {"train_loss": -41.12565994262695, "global_step": 218270, "epoch": 1803} {"train_loss": -39.75590133666992, "global_step": 218271, "epoch": 1803} {"train_loss": -40.76674270629883, "global_step": 218272, "epoch": 1803} {"train_loss": -40.3400993347168, "global_step": 218273, "epoch": 1803} {"train_loss": -40.17885971069336, "global_step": 218274, "epoch": 1803} {"train_loss": -39.56351852416992, "global_step": 218275, "epoch": 1803} {"train_loss": -39.935970306396484, "global_step": 218276, "epoch": 1803} {"train_loss": -40.67390060424805, "global_step": 218277, "epoch": 1803} {"train_loss": -41.291378021240234, "global_step": 218278, "epoch": 1803} {"train_loss": -38.61235427856445, "global_step": 218279, "epoch": 1803} {"train_loss": -41.16141891479492, "global_step": 218280, "epoch": 1803} {"train_loss": -40.17184066772461, "global_step": 218281, "epoch": 1803} {"train_loss": -41.13853073120117, "global_step": 218282, "epoch": 1803} {"train_loss": -38.844106713602365, "global_step": 218283, "epoch": 1803, "val_loss": 2625813.0} {"train_loss": -40.47886657714844, "global_step": 218284, "epoch": 1804} {"train_loss": -40.25493240356445, "global_step": 218285, "epoch": 1804} {"train_loss": -40.67600631713867, "global_step": 218286, "epoch": 1804} {"train_loss": -41.050846099853516, "global_step": 218287, "epoch": 1804} {"train_loss": -41.02104568481445, "global_step": 218288, "epoch": 1804} {"train_loss": -41.60466384887695, "global_step": 218289, "epoch": 1804} {"train_loss": -41.29375457763672, "global_step": 218290, "epoch": 1804} {"train_loss": -40.68316650390625, "global_step": 218291, "epoch": 1804} {"train_loss": -41.02903366088867, "global_step": 218292, "epoch": 1804} {"train_loss": -40.74342727661133, "global_step": 218293, "epoch": 1804} {"train_loss": -40.05522155761719, "global_step": 218294, "epoch": 1804} {"train_loss": -41.07168960571289, "global_step": 218295, "epoch": 1804} {"train_loss": -41.325069427490234, "global_step": 218296, "epoch": 1804} {"train_loss": -41.01868438720703, "global_step": 218297, "epoch": 1804} {"train_loss": -41.2984619140625, "global_step": 218298, "epoch": 1804} {"train_loss": -41.447750091552734, "global_step": 218299, "epoch": 1804} {"train_loss": -40.95170211791992, "global_step": 218300, "epoch": 1804} {"train_loss": -41.1413688659668, "global_step": 218301, "epoch": 1804} {"train_loss": -41.411537170410156, "global_step": 218302, "epoch": 1804} {"train_loss": -41.19548034667969, "global_step": 218303, "epoch": 1804} {"train_loss": -41.41010665893555, "global_step": 218304, "epoch": 1804} {"train_loss": -42.12430953979492, "global_step": 218305, "epoch": 1804} {"train_loss": -41.510658264160156, "global_step": 218306, "epoch": 1804} {"train_loss": -41.45585632324219, "global_step": 218307, "epoch": 1804} {"train_loss": -40.999732971191406, "global_step": 218308, "epoch": 1804} {"train_loss": -41.32485580444336, "global_step": 218309, "epoch": 1804} {"train_loss": -42.361328125, "global_step": 218310, "epoch": 1804} {"train_loss": -41.62481689453125, "global_step": 218311, "epoch": 1804} {"train_loss": -42.05879211425781, "global_step": 218312, "epoch": 1804} {"train_loss": -41.59739303588867, "global_step": 218313, "epoch": 1804} {"train_loss": -41.207740783691406, "global_step": 218314, "epoch": 1804} {"train_loss": -41.98598861694336, "global_step": 218315, "epoch": 1804} {"train_loss": -40.79285430908203, "global_step": 218316, "epoch": 1804} {"train_loss": -41.28449630737305, "global_step": 218317, "epoch": 1804} {"train_loss": -42.4661750793457, "global_step": 218318, "epoch": 1804} {"train_loss": -40.891273498535156, "global_step": 218319, "epoch": 1804} {"train_loss": -41.63188171386719, "global_step": 218320, "epoch": 1804} {"train_loss": -42.10502243041992, "global_step": 218321, "epoch": 1804} {"train_loss": -41.38710403442383, "global_step": 218322, "epoch": 1804} {"train_loss": -41.52674102783203, "global_step": 218323, "epoch": 1804} {"train_loss": -41.655887603759766, "global_step": 218324, "epoch": 1804} {"train_loss": -40.624061584472656, "global_step": 218325, "epoch": 1804} {"train_loss": -41.85404968261719, "global_step": 218326, "epoch": 1804} {"train_loss": -42.391788482666016, "global_step": 218327, "epoch": 1804} {"train_loss": -41.865150451660156, "global_step": 218328, "epoch": 1804} {"train_loss": -42.62179183959961, "global_step": 218329, "epoch": 1804} {"train_loss": -42.0507926940918, "global_step": 218330, "epoch": 1804} {"train_loss": -42.337249755859375, "global_step": 218331, "epoch": 1804} {"train_loss": -41.6179313659668, "global_step": 218332, "epoch": 1804} {"train_loss": -42.3204345703125, "global_step": 218333, "epoch": 1804} {"train_loss": -41.942909240722656, "global_step": 218334, "epoch": 1804} {"train_loss": -42.342742919921875, "global_step": 218335, "epoch": 1804} {"train_loss": -42.4072151184082, "global_step": 218336, "epoch": 1804} {"train_loss": -42.469512939453125, "global_step": 218337, "epoch": 1804} {"train_loss": -41.30170822143555, "global_step": 218338, "epoch": 1804} {"train_loss": -42.15133285522461, "global_step": 218339, "epoch": 1804} {"train_loss": -41.9792366027832, "global_step": 218340, "epoch": 1804} {"train_loss": -42.173458099365234, "global_step": 218341, "epoch": 1804} {"train_loss": -42.39272689819336, "global_step": 218342, "epoch": 1804} {"train_loss": -41.90461349487305, "global_step": 218343, "epoch": 1804} {"train_loss": -42.56059646606445, "global_step": 218344, "epoch": 1804} {"train_loss": -42.224056243896484, "global_step": 218345, "epoch": 1804} {"train_loss": -41.68546676635742, "global_step": 218346, "epoch": 1804} {"train_loss": -41.356502532958984, "global_step": 218347, "epoch": 1804} {"train_loss": -40.23054885864258, "global_step": 218348, "epoch": 1804} {"train_loss": -41.1517219543457, "global_step": 218349, "epoch": 1804} {"train_loss": -41.887203216552734, "global_step": 218350, "epoch": 1804} {"train_loss": -42.0536003112793, "global_step": 218351, "epoch": 1804} {"train_loss": -42.449302673339844, "global_step": 218352, "epoch": 1804} {"train_loss": -41.60892868041992, "global_step": 218353, "epoch": 1804} {"train_loss": -40.9255256652832, "global_step": 218354, "epoch": 1804} {"train_loss": -41.71882247924805, "global_step": 218355, "epoch": 1804} {"train_loss": -39.65370559692383, "global_step": 218356, "epoch": 1804} {"train_loss": -41.052276611328125, "global_step": 218357, "epoch": 1804} {"train_loss": -38.98153305053711, "global_step": 218358, "epoch": 1804} {"train_loss": -35.76455307006836, "global_step": 218359, "epoch": 1804} {"train_loss": -38.127498626708984, "global_step": 218360, "epoch": 1804} {"train_loss": -39.591732025146484, "global_step": 218361, "epoch": 1804} {"train_loss": -39.45558547973633, "global_step": 218362, "epoch": 1804} {"train_loss": -41.84495544433594, "global_step": 218363, "epoch": 1804} {"train_loss": -40.66446304321289, "global_step": 218364, "epoch": 1804} {"train_loss": -40.507755279541016, "global_step": 218365, "epoch": 1804} {"train_loss": -40.43090057373047, "global_step": 218366, "epoch": 1804} {"train_loss": -41.626487731933594, "global_step": 218367, "epoch": 1804} {"train_loss": -41.76225662231445, "global_step": 218368, "epoch": 1804} {"train_loss": -41.15102767944336, "global_step": 218369, "epoch": 1804} {"train_loss": -41.62232208251953, "global_step": 218370, "epoch": 1804} {"train_loss": -40.97963333129883, "global_step": 218371, "epoch": 1804} {"train_loss": -40.05282974243164, "global_step": 218372, "epoch": 1804} {"train_loss": -41.289527893066406, "global_step": 218373, "epoch": 1804} {"train_loss": -41.774044036865234, "global_step": 218374, "epoch": 1804} {"train_loss": -41.43459701538086, "global_step": 218375, "epoch": 1804} {"train_loss": -40.880409240722656, "global_step": 218376, "epoch": 1804} {"train_loss": -40.169429779052734, "global_step": 218377, "epoch": 1804} {"train_loss": -39.49857711791992, "global_step": 218378, "epoch": 1804} {"train_loss": -41.38716506958008, "global_step": 218379, "epoch": 1804} {"train_loss": -42.30902099609375, "global_step": 218380, "epoch": 1804} {"train_loss": -41.28665542602539, "global_step": 218381, "epoch": 1804} {"train_loss": -39.94968795776367, "global_step": 218382, "epoch": 1804} {"train_loss": -39.90693283081055, "global_step": 218383, "epoch": 1804} {"train_loss": -40.53382110595703, "global_step": 218384, "epoch": 1804} {"train_loss": -42.13627243041992, "global_step": 218385, "epoch": 1804} {"train_loss": -42.3727912902832, "global_step": 218386, "epoch": 1804} {"train_loss": -41.2351188659668, "global_step": 218387, "epoch": 1804} {"train_loss": -40.00136184692383, "global_step": 218388, "epoch": 1804} {"train_loss": -41.5057258605957, "global_step": 218389, "epoch": 1804} {"train_loss": -41.4124641418457, "global_step": 218390, "epoch": 1804} {"train_loss": -41.676002502441406, "global_step": 218391, "epoch": 1804} {"train_loss": -41.85308837890625, "global_step": 218392, "epoch": 1804} {"train_loss": -41.624549865722656, "global_step": 218393, "epoch": 1804} {"train_loss": -42.332061767578125, "global_step": 218394, "epoch": 1804} {"train_loss": -41.44154739379883, "global_step": 218395, "epoch": 1804} {"train_loss": -40.89899444580078, "global_step": 218396, "epoch": 1804} {"train_loss": -40.74251937866211, "global_step": 218397, "epoch": 1804} {"train_loss": -41.836822509765625, "global_step": 218398, "epoch": 1804} {"train_loss": -40.84192657470703, "global_step": 218399, "epoch": 1804} {"train_loss": -40.7932014465332, "global_step": 218400, "epoch": 1804} {"train_loss": -41.3533821105957, "global_step": 218401, "epoch": 1804} {"train_loss": -42.232704162597656, "global_step": 218402, "epoch": 1804} {"train_loss": -40.93471908569336, "global_step": 218403, "epoch": 1804} {"train_loss": -41.26574801610521, "global_step": 218404, "epoch": 1804, "val_loss": 2622542.5} {"train_loss": -41.510074615478516, "global_step": 218405, "epoch": 1805} {"train_loss": -42.316184997558594, "global_step": 218406, "epoch": 1805} {"train_loss": -40.14217758178711, "global_step": 218407, "epoch": 1805} {"train_loss": -39.0191535949707, "global_step": 218408, "epoch": 1805} {"train_loss": -41.2155876159668, "global_step": 218409, "epoch": 1805} {"train_loss": -41.62434768676758, "global_step": 218410, "epoch": 1805} {"train_loss": -39.63377380371094, "global_step": 218411, "epoch": 1805} {"train_loss": -38.39698028564453, "global_step": 218412, "epoch": 1805} {"train_loss": -41.20432662963867, "global_step": 218413, "epoch": 1805} {"train_loss": -41.09740447998047, "global_step": 218414, "epoch": 1805} {"train_loss": -40.23627471923828, "global_step": 218415, "epoch": 1805} {"train_loss": -41.23714828491211, "global_step": 218416, "epoch": 1805} {"train_loss": -41.39650344848633, "global_step": 218417, "epoch": 1805} {"train_loss": -40.713592529296875, "global_step": 218418, "epoch": 1805} {"train_loss": -42.186119079589844, "global_step": 218419, "epoch": 1805} {"train_loss": -41.466224670410156, "global_step": 218420, "epoch": 1805} {"train_loss": -40.873451232910156, "global_step": 218421, "epoch": 1805} {"train_loss": -41.64912796020508, "global_step": 218422, "epoch": 1805} {"train_loss": -42.117164611816406, "global_step": 218423, "epoch": 1805} {"train_loss": -41.4892692565918, "global_step": 218424, "epoch": 1805} {"train_loss": -41.83673095703125, "global_step": 218425, "epoch": 1805} {"train_loss": -42.00136947631836, "global_step": 218426, "epoch": 1805} {"train_loss": -41.52370071411133, "global_step": 218427, "epoch": 1805} {"train_loss": -42.4029655456543, "global_step": 218428, "epoch": 1805} {"train_loss": -41.153133392333984, "global_step": 218429, "epoch": 1805} {"train_loss": -40.92562484741211, "global_step": 218430, "epoch": 1805} {"train_loss": -41.85572052001953, "global_step": 218431, "epoch": 1805} {"train_loss": -42.02838897705078, "global_step": 218432, "epoch": 1805} {"train_loss": -42.01470947265625, "global_step": 218433, "epoch": 1805} {"train_loss": -40.829307556152344, "global_step": 218434, "epoch": 1805} {"train_loss": -41.563194274902344, "global_step": 218435, "epoch": 1805} {"train_loss": -41.99152755737305, "global_step": 218436, "epoch": 1805} {"train_loss": -42.269813537597656, "global_step": 218437, "epoch": 1805} {"train_loss": -42.16852951049805, "global_step": 218438, "epoch": 1805} {"train_loss": -41.89179611206055, "global_step": 218439, "epoch": 1805} {"train_loss": -42.17466354370117, "global_step": 218440, "epoch": 1805} {"train_loss": -42.35809326171875, "global_step": 218441, "epoch": 1805} {"train_loss": -41.51909255981445, "global_step": 218442, "epoch": 1805} {"train_loss": -41.5260124206543, "global_step": 218443, "epoch": 1805} {"train_loss": -42.266902923583984, "global_step": 218444, "epoch": 1805} {"train_loss": -42.52417755126953, "global_step": 218445, "epoch": 1805} {"train_loss": -41.93312454223633, "global_step": 218446, "epoch": 1805} {"train_loss": -42.06616973876953, "global_step": 218447, "epoch": 1805} {"train_loss": -42.15108108520508, "global_step": 218448, "epoch": 1805} {"train_loss": -42.354793548583984, "global_step": 218449, "epoch": 1805} {"train_loss": -41.73322296142578, "global_step": 218450, "epoch": 1805} {"train_loss": -41.539363861083984, "global_step": 218451, "epoch": 1805} {"train_loss": -42.510555267333984, "global_step": 218452, "epoch": 1805} {"train_loss": -42.14826202392578, "global_step": 218453, "epoch": 1805} {"train_loss": -41.53828048706055, "global_step": 218454, "epoch": 1805} {"train_loss": -42.215816497802734, "global_step": 218455, "epoch": 1805} {"train_loss": -42.070960998535156, "global_step": 218456, "epoch": 1805} {"train_loss": -42.59853744506836, "global_step": 218457, "epoch": 1805} {"train_loss": -41.513553619384766, "global_step": 218458, "epoch": 1805} {"train_loss": -42.684661865234375, "global_step": 218459, "epoch": 1805} {"train_loss": -43.25087356567383, "global_step": 218460, "epoch": 1805} {"train_loss": -42.0741081237793, "global_step": 218461, "epoch": 1805} {"train_loss": -42.36497497558594, "global_step": 218462, "epoch": 1805} {"train_loss": -42.01689147949219, "global_step": 218463, "epoch": 1805} {"train_loss": -42.63729476928711, "global_step": 218464, "epoch": 1805} {"train_loss": -41.5921745300293, "global_step": 218465, "epoch": 1805} {"train_loss": -42.699867248535156, "global_step": 218466, "epoch": 1805} {"train_loss": -41.34785842895508, "global_step": 218467, "epoch": 1805} {"train_loss": -41.38893508911133, "global_step": 218468, "epoch": 1805} {"train_loss": -42.402984619140625, "global_step": 218469, "epoch": 1805} {"train_loss": -41.42838668823242, "global_step": 218470, "epoch": 1805} {"train_loss": -41.559661865234375, "global_step": 218471, "epoch": 1805} {"train_loss": -42.1089973449707, "global_step": 218472, "epoch": 1805} {"train_loss": -41.08252716064453, "global_step": 218473, "epoch": 1805} {"train_loss": -40.71207046508789, "global_step": 218474, "epoch": 1805} {"train_loss": -41.7464599609375, "global_step": 218475, "epoch": 1805} {"train_loss": -41.67478561401367, "global_step": 218476, "epoch": 1805} {"train_loss": -39.40087890625, "global_step": 218477, "epoch": 1805} {"train_loss": -38.88645553588867, "global_step": 218478, "epoch": 1805} {"train_loss": -40.51735305786133, "global_step": 218479, "epoch": 1805} {"train_loss": -40.83330154418945, "global_step": 218480, "epoch": 1805} {"train_loss": -40.05231857299805, "global_step": 218481, "epoch": 1805} {"train_loss": -39.31464767456055, "global_step": 218482, "epoch": 1805} {"train_loss": -41.26945877075195, "global_step": 218483, "epoch": 1805} {"train_loss": -40.30039978027344, "global_step": 218484, "epoch": 1805} {"train_loss": -41.564693450927734, "global_step": 218485, "epoch": 1805} {"train_loss": -41.07430648803711, "global_step": 218486, "epoch": 1805} {"train_loss": -40.42934799194336, "global_step": 218487, "epoch": 1805} {"train_loss": -41.8799934387207, "global_step": 218488, "epoch": 1805} {"train_loss": -41.49140930175781, "global_step": 218489, "epoch": 1805} {"train_loss": -41.56425476074219, "global_step": 218490, "epoch": 1805} {"train_loss": -41.24463653564453, "global_step": 218491, "epoch": 1805} {"train_loss": -41.42761993408203, "global_step": 218492, "epoch": 1805} {"train_loss": -41.928016662597656, "global_step": 218493, "epoch": 1805} {"train_loss": -40.61918258666992, "global_step": 218494, "epoch": 1805} {"train_loss": -41.64631271362305, "global_step": 218495, "epoch": 1805} {"train_loss": -40.761077880859375, "global_step": 218496, "epoch": 1805} {"train_loss": -41.03827667236328, "global_step": 218497, "epoch": 1805} {"train_loss": -41.41508102416992, "global_step": 218498, "epoch": 1805} {"train_loss": -40.787269592285156, "global_step": 218499, "epoch": 1805} {"train_loss": -40.85978317260742, "global_step": 218500, "epoch": 1805} {"train_loss": -39.40398025512695, "global_step": 218501, "epoch": 1805} {"train_loss": -35.664161682128906, "global_step": 218502, "epoch": 1805} {"train_loss": -34.34194564819336, "global_step": 218503, "epoch": 1805} {"train_loss": -36.41740798950195, "global_step": 218504, "epoch": 1805} {"train_loss": -40.41473388671875, "global_step": 218505, "epoch": 1805} {"train_loss": -37.099430084228516, "global_step": 218506, "epoch": 1805} {"train_loss": -38.914154052734375, "global_step": 218507, "epoch": 1805} {"train_loss": -39.960201263427734, "global_step": 218508, "epoch": 1805} {"train_loss": -37.79962158203125, "global_step": 218509, "epoch": 1805} {"train_loss": -39.78530502319336, "global_step": 218510, "epoch": 1805} {"train_loss": -40.687721252441406, "global_step": 218511, "epoch": 1805} {"train_loss": -39.754798889160156, "global_step": 218512, "epoch": 1805} {"train_loss": -41.2839469909668, "global_step": 218513, "epoch": 1805} {"train_loss": -41.28562545776367, "global_step": 218514, "epoch": 1805} {"train_loss": -41.652557373046875, "global_step": 218515, "epoch": 1805} {"train_loss": -41.66270065307617, "global_step": 218516, "epoch": 1805} {"train_loss": -41.775943756103516, "global_step": 218517, "epoch": 1805} {"train_loss": -41.795921325683594, "global_step": 218518, "epoch": 1805} {"train_loss": -41.7095947265625, "global_step": 218519, "epoch": 1805} {"train_loss": -42.4189453125, "global_step": 218520, "epoch": 1805} {"train_loss": -42.23147201538086, "global_step": 218521, "epoch": 1805} {"train_loss": -42.37250900268555, "global_step": 218522, "epoch": 1805} {"train_loss": -41.948570251464844, "global_step": 218523, "epoch": 1805} {"train_loss": -41.97800064086914, "global_step": 218524, "epoch": 1805} {"train_loss": -41.19163818989904, "global_step": 218525, "epoch": 1805, "val_loss": 2556500.5} {"train_loss": -42.32183074951172, "global_step": 218526, "epoch": 1806} {"train_loss": -42.02517318725586, "global_step": 218527, "epoch": 1806} {"train_loss": -42.395729064941406, "global_step": 218528, "epoch": 1806} {"train_loss": -42.00163650512695, "global_step": 218529, "epoch": 1806} {"train_loss": -42.003021240234375, "global_step": 218530, "epoch": 1806} {"train_loss": -42.490203857421875, "global_step": 218531, "epoch": 1806} {"train_loss": -41.383056640625, "global_step": 218532, "epoch": 1806} {"train_loss": -42.17586898803711, "global_step": 218533, "epoch": 1806} {"train_loss": -42.65850830078125, "global_step": 218534, "epoch": 1806} {"train_loss": -42.283077239990234, "global_step": 218535, "epoch": 1806} {"train_loss": -42.66917037963867, "global_step": 218536, "epoch": 1806} {"train_loss": -42.24589157104492, "global_step": 218537, "epoch": 1806} {"train_loss": -42.762874603271484, "global_step": 218538, "epoch": 1806} {"train_loss": -42.47434997558594, "global_step": 218539, "epoch": 1806} {"train_loss": -41.61882781982422, "global_step": 218540, "epoch": 1806} {"train_loss": -42.863380432128906, "global_step": 218541, "epoch": 1806} {"train_loss": -42.47010040283203, "global_step": 218542, "epoch": 1806} {"train_loss": -42.6126823425293, "global_step": 218543, "epoch": 1806} {"train_loss": -42.25642776489258, "global_step": 218544, "epoch": 1806} {"train_loss": -42.649085998535156, "global_step": 218545, "epoch": 1806} {"train_loss": -42.76963424682617, "global_step": 218546, "epoch": 1806} {"train_loss": -42.53715515136719, "global_step": 218547, "epoch": 1806} {"train_loss": -42.85956954956055, "global_step": 218548, "epoch": 1806} {"train_loss": -42.24724197387695, "global_step": 218549, "epoch": 1806} {"train_loss": -42.502376556396484, "global_step": 218550, "epoch": 1806} {"train_loss": -42.38856506347656, "global_step": 218551, "epoch": 1806} {"train_loss": -42.59963607788086, "global_step": 218552, "epoch": 1806} {"train_loss": -42.01045608520508, "global_step": 218553, "epoch": 1806} {"train_loss": -42.707275390625, "global_step": 218554, "epoch": 1806} {"train_loss": -42.49367904663086, "global_step": 218555, "epoch": 1806} {"train_loss": -41.98415756225586, "global_step": 218556, "epoch": 1806} {"train_loss": -41.553367614746094, "global_step": 218557, "epoch": 1806} {"train_loss": -41.50114059448242, "global_step": 218558, "epoch": 1806} {"train_loss": -41.18362045288086, "global_step": 218559, "epoch": 1806} {"train_loss": -42.934051513671875, "global_step": 218560, "epoch": 1806} {"train_loss": -42.296443939208984, "global_step": 218561, "epoch": 1806} {"train_loss": -41.156124114990234, "global_step": 218562, "epoch": 1806} {"train_loss": -41.89543533325195, "global_step": 218563, "epoch": 1806} {"train_loss": -42.83472442626953, "global_step": 218564, "epoch": 1806} {"train_loss": -41.39731979370117, "global_step": 218565, "epoch": 1806} {"train_loss": -40.40328598022461, "global_step": 218566, "epoch": 1806} {"train_loss": -41.15207290649414, "global_step": 218567, "epoch": 1806} {"train_loss": -42.83759307861328, "global_step": 218568, "epoch": 1806} {"train_loss": -42.40924072265625, "global_step": 218569, "epoch": 1806} {"train_loss": -42.08552169799805, "global_step": 218570, "epoch": 1806} {"train_loss": -42.42811965942383, "global_step": 218571, "epoch": 1806} {"train_loss": -43.01927185058594, "global_step": 218572, "epoch": 1806} {"train_loss": -42.5675163269043, "global_step": 218573, "epoch": 1806} {"train_loss": -43.14738845825195, "global_step": 218574, "epoch": 1806} {"train_loss": -42.2509651184082, "global_step": 218575, "epoch": 1806} {"train_loss": -42.504295349121094, "global_step": 218576, "epoch": 1806} {"train_loss": -43.05158233642578, "global_step": 218577, "epoch": 1806} {"train_loss": -42.58600997924805, "global_step": 218578, "epoch": 1806} {"train_loss": -41.38047790527344, "global_step": 218579, "epoch": 1806} {"train_loss": -40.80634307861328, "global_step": 218580, "epoch": 1806} {"train_loss": -41.650367736816406, "global_step": 218581, "epoch": 1806} {"train_loss": -41.91378402709961, "global_step": 218582, "epoch": 1806} {"train_loss": -42.4481086730957, "global_step": 218583, "epoch": 1806} {"train_loss": -41.67932891845703, "global_step": 218584, "epoch": 1806} {"train_loss": -42.96720886230469, "global_step": 218585, "epoch": 1806} {"train_loss": -42.519866943359375, "global_step": 218586, "epoch": 1806} {"train_loss": -42.47084426879883, "global_step": 218587, "epoch": 1806} {"train_loss": -43.44941329956055, "global_step": 218588, "epoch": 1806} {"train_loss": -42.606407165527344, "global_step": 218589, "epoch": 1806} {"train_loss": -42.57546615600586, "global_step": 218590, "epoch": 1806} {"train_loss": -42.665584564208984, "global_step": 218591, "epoch": 1806} {"train_loss": -42.64625930786133, "global_step": 218592, "epoch": 1806} {"train_loss": -41.7317008972168, "global_step": 218593, "epoch": 1806} {"train_loss": -43.316314697265625, "global_step": 218594, "epoch": 1806} {"train_loss": -43.17037582397461, "global_step": 218595, "epoch": 1806} {"train_loss": -42.90069580078125, "global_step": 218596, "epoch": 1806} {"train_loss": -42.47473907470703, "global_step": 218597, "epoch": 1806} {"train_loss": -42.454647064208984, "global_step": 218598, "epoch": 1806} {"train_loss": -42.34505081176758, "global_step": 218599, "epoch": 1806} {"train_loss": -42.74405288696289, "global_step": 218600, "epoch": 1806} {"train_loss": -42.68143844604492, "global_step": 218601, "epoch": 1806} {"train_loss": -42.82230758666992, "global_step": 218602, "epoch": 1806} {"train_loss": -42.71796417236328, "global_step": 218603, "epoch": 1806} {"train_loss": -42.90629196166992, "global_step": 218604, "epoch": 1806} {"train_loss": -43.114219665527344, "global_step": 218605, "epoch": 1806} {"train_loss": -42.485389709472656, "global_step": 218606, "epoch": 1806} {"train_loss": -42.65788269042969, "global_step": 218607, "epoch": 1806} {"train_loss": -43.082313537597656, "global_step": 218608, "epoch": 1806} {"train_loss": -42.2325439453125, "global_step": 218609, "epoch": 1806} {"train_loss": -42.651912689208984, "global_step": 218610, "epoch": 1806} {"train_loss": -42.84248352050781, "global_step": 218611, "epoch": 1806} {"train_loss": -42.97246551513672, "global_step": 218612, "epoch": 1806} {"train_loss": -40.915679931640625, "global_step": 218613, "epoch": 1806} {"train_loss": -41.336421966552734, "global_step": 218614, "epoch": 1806} {"train_loss": -42.034324645996094, "global_step": 218615, "epoch": 1806} {"train_loss": -42.18598556518555, "global_step": 218616, "epoch": 1806} {"train_loss": -38.88648986816406, "global_step": 218617, "epoch": 1806} {"train_loss": -35.19761276245117, "global_step": 218618, "epoch": 1806} {"train_loss": -36.91829299926758, "global_step": 218619, "epoch": 1806} {"train_loss": -39.70117950439453, "global_step": 218620, "epoch": 1806} {"train_loss": -29.839941024780273, "global_step": 218621, "epoch": 1806} {"train_loss": -34.89802169799805, "global_step": 218622, "epoch": 1806} {"train_loss": -41.38143539428711, "global_step": 218623, "epoch": 1806} {"train_loss": -36.498897552490234, "global_step": 218624, "epoch": 1806} {"train_loss": -39.30150604248047, "global_step": 218625, "epoch": 1806} {"train_loss": -40.790225982666016, "global_step": 218626, "epoch": 1806} {"train_loss": -38.90603256225586, "global_step": 218627, "epoch": 1806} {"train_loss": -36.7816047668457, "global_step": 218628, "epoch": 1806} {"train_loss": -39.4891471862793, "global_step": 218629, "epoch": 1806} {"train_loss": -39.409027099609375, "global_step": 218630, "epoch": 1806} {"train_loss": -39.561790466308594, "global_step": 218631, "epoch": 1806} {"train_loss": -39.75680160522461, "global_step": 218632, "epoch": 1806} {"train_loss": -39.14130401611328, "global_step": 218633, "epoch": 1806} {"train_loss": -38.52136993408203, "global_step": 218634, "epoch": 1806} {"train_loss": -39.97966003417969, "global_step": 218635, "epoch": 1806} {"train_loss": -38.47256088256836, "global_step": 218636, "epoch": 1806} {"train_loss": -38.46071243286133, "global_step": 218637, "epoch": 1806} {"train_loss": -40.17374801635742, "global_step": 218638, "epoch": 1806} {"train_loss": -37.79352569580078, "global_step": 218639, "epoch": 1806} {"train_loss": -40.21281814575195, "global_step": 218640, "epoch": 1806} {"train_loss": -39.48629379272461, "global_step": 218641, "epoch": 1806} {"train_loss": -40.28065490722656, "global_step": 218642, "epoch": 1806} {"train_loss": -40.4130744934082, "global_step": 218643, "epoch": 1806} {"train_loss": -39.82548522949219, "global_step": 218644, "epoch": 1806} {"train_loss": -40.77947998046875, "global_step": 218645, "epoch": 1806} {"train_loss": -41.437151049779466, "global_step": 218646, "epoch": 1806, "val_loss": 2620865.75} {"train_loss": -41.410438537597656, "global_step": 218647, "epoch": 1807} {"train_loss": -39.33315658569336, "global_step": 218648, "epoch": 1807} {"train_loss": -41.482215881347656, "global_step": 218649, "epoch": 1807} {"train_loss": -41.25782012939453, "global_step": 218650, "epoch": 1807} {"train_loss": -40.76179885864258, "global_step": 218651, "epoch": 1807} {"train_loss": -42.12351989746094, "global_step": 218652, "epoch": 1807} {"train_loss": -41.08395004272461, "global_step": 218653, "epoch": 1807} {"train_loss": -41.2182731628418, "global_step": 218654, "epoch": 1807} {"train_loss": -41.35445785522461, "global_step": 218655, "epoch": 1807} {"train_loss": -41.44166564941406, "global_step": 218656, "epoch": 1807} {"train_loss": -40.88820266723633, "global_step": 218657, "epoch": 1807} {"train_loss": -41.97991943359375, "global_step": 218658, "epoch": 1807} {"train_loss": -41.762359619140625, "global_step": 218659, "epoch": 1807} {"train_loss": -41.73591232299805, "global_step": 218660, "epoch": 1807} {"train_loss": -41.85334396362305, "global_step": 218661, "epoch": 1807} {"train_loss": -41.76721954345703, "global_step": 218662, "epoch": 1807} {"train_loss": -42.11640167236328, "global_step": 218663, "epoch": 1807} {"train_loss": -42.470947265625, "global_step": 218664, "epoch": 1807} {"train_loss": -42.050052642822266, "global_step": 218665, "epoch": 1807} {"train_loss": -41.81678009033203, "global_step": 218666, "epoch": 1807} {"train_loss": -42.64946365356445, "global_step": 218667, "epoch": 1807} {"train_loss": -42.20417022705078, "global_step": 218668, "epoch": 1807} {"train_loss": -42.371585845947266, "global_step": 218669, "epoch": 1807} {"train_loss": -42.4670295715332, "global_step": 218670, "epoch": 1807} {"train_loss": -42.70676803588867, "global_step": 218671, "epoch": 1807} {"train_loss": -42.312583923339844, "global_step": 218672, "epoch": 1807} {"train_loss": -42.67490005493164, "global_step": 218673, "epoch": 1807} {"train_loss": -42.77002716064453, "global_step": 218674, "epoch": 1807} {"train_loss": -42.73488235473633, "global_step": 218675, "epoch": 1807} {"train_loss": -42.76716232299805, "global_step": 218676, "epoch": 1807} {"train_loss": -42.48347091674805, "global_step": 218677, "epoch": 1807} {"train_loss": -42.48127365112305, "global_step": 218678, "epoch": 1807} {"train_loss": -42.642822265625, "global_step": 218679, "epoch": 1807} {"train_loss": -42.40622329711914, "global_step": 218680, "epoch": 1807} {"train_loss": -42.954036712646484, "global_step": 218681, "epoch": 1807} {"train_loss": -42.83125305175781, "global_step": 218682, "epoch": 1807} {"train_loss": -42.994014739990234, "global_step": 218683, "epoch": 1807} {"train_loss": -43.31245040893555, "global_step": 218684, "epoch": 1807} {"train_loss": -42.968109130859375, "global_step": 218685, "epoch": 1807} {"train_loss": -42.7118034362793, "global_step": 218686, "epoch": 1807} {"train_loss": -43.02558135986328, "global_step": 218687, "epoch": 1807} {"train_loss": -42.54289627075195, "global_step": 218688, "epoch": 1807} {"train_loss": -42.79981994628906, "global_step": 218689, "epoch": 1807} {"train_loss": -43.192256927490234, "global_step": 218690, "epoch": 1807} {"train_loss": -43.20933151245117, "global_step": 218691, "epoch": 1807} {"train_loss": -42.56429672241211, "global_step": 218692, "epoch": 1807} {"train_loss": -43.309959411621094, "global_step": 218693, "epoch": 1807} {"train_loss": -43.25474166870117, "global_step": 218694, "epoch": 1807} {"train_loss": -42.95228576660156, "global_step": 218695, "epoch": 1807} {"train_loss": -43.15711212158203, "global_step": 218696, "epoch": 1807} {"train_loss": -43.235328674316406, "global_step": 218697, "epoch": 1807} {"train_loss": -42.73103332519531, "global_step": 218698, "epoch": 1807} {"train_loss": -42.98519515991211, "global_step": 218699, "epoch": 1807} {"train_loss": -42.79975509643555, "global_step": 218700, "epoch": 1807} {"train_loss": -43.080909729003906, "global_step": 218701, "epoch": 1807} {"train_loss": -43.286590576171875, "global_step": 218702, "epoch": 1807} {"train_loss": -43.33313751220703, "global_step": 218703, "epoch": 1807} {"train_loss": -43.41730880737305, "global_step": 218704, "epoch": 1807} {"train_loss": -43.1402473449707, "global_step": 218705, "epoch": 1807} {"train_loss": -42.56485366821289, "global_step": 218706, "epoch": 1807} {"train_loss": -42.93076705932617, "global_step": 218707, "epoch": 1807} {"train_loss": -43.13048553466797, "global_step": 218708, "epoch": 1807} {"train_loss": -42.48209762573242, "global_step": 218709, "epoch": 1807} {"train_loss": -42.18679428100586, "global_step": 218710, "epoch": 1807} {"train_loss": -42.2028923034668, "global_step": 218711, "epoch": 1807} {"train_loss": -41.66781234741211, "global_step": 218712, "epoch": 1807} {"train_loss": -41.156494140625, "global_step": 218713, "epoch": 1807} {"train_loss": -41.4783821105957, "global_step": 218714, "epoch": 1807} {"train_loss": -39.105281829833984, "global_step": 218715, "epoch": 1807} {"train_loss": -32.748382568359375, "global_step": 218716, "epoch": 1807} {"train_loss": -18.08363914489746, "global_step": 218717, "epoch": 1807} {"train_loss": -9.207133293151855, "global_step": 218718, "epoch": 1807} {"train_loss": 5.6246747970581055, "global_step": 218719, "epoch": 1807} {"train_loss": -13.744699478149414, "global_step": 218720, "epoch": 1807} {"train_loss": -30.651508331298828, "global_step": 218721, "epoch": 1807} {"train_loss": -16.498138427734375, "global_step": 218722, "epoch": 1807} {"train_loss": -29.573877334594727, "global_step": 218723, "epoch": 1807} {"train_loss": -24.063312530517578, "global_step": 218724, "epoch": 1807} {"train_loss": -31.718297958374023, "global_step": 218725, "epoch": 1807} {"train_loss": -33.1825065612793, "global_step": 218726, "epoch": 1807} {"train_loss": -34.306129455566406, "global_step": 218727, "epoch": 1807} {"train_loss": -34.36789321899414, "global_step": 218728, "epoch": 1807} {"train_loss": -35.45016098022461, "global_step": 218729, "epoch": 1807} {"train_loss": -36.44974136352539, "global_step": 218730, "epoch": 1807} {"train_loss": -35.022315979003906, "global_step": 218731, "epoch": 1807} {"train_loss": -37.99907302856445, "global_step": 218732, "epoch": 1807} {"train_loss": -35.430999755859375, "global_step": 218733, "epoch": 1807} {"train_loss": -37.54705810546875, "global_step": 218734, "epoch": 1807} {"train_loss": -35.98069381713867, "global_step": 218735, "epoch": 1807} {"train_loss": -38.46741485595703, "global_step": 218736, "epoch": 1807} {"train_loss": -38.822078704833984, "global_step": 218737, "epoch": 1807} {"train_loss": -37.66695022583008, "global_step": 218738, "epoch": 1807} {"train_loss": -39.53301239013672, "global_step": 218739, "epoch": 1807} {"train_loss": -39.83523941040039, "global_step": 218740, "epoch": 1807} {"train_loss": -38.68510055541992, "global_step": 218741, "epoch": 1807} {"train_loss": -39.04193878173828, "global_step": 218742, "epoch": 1807} {"train_loss": -39.571563720703125, "global_step": 218743, "epoch": 1807} {"train_loss": -39.86628341674805, "global_step": 218744, "epoch": 1807} {"train_loss": -39.50357437133789, "global_step": 218745, "epoch": 1807} {"train_loss": -39.55747604370117, "global_step": 218746, "epoch": 1807} {"train_loss": -39.856266021728516, "global_step": 218747, "epoch": 1807} {"train_loss": -40.39284896850586, "global_step": 218748, "epoch": 1807} {"train_loss": -40.8286247253418, "global_step": 218749, "epoch": 1807} {"train_loss": -39.853759765625, "global_step": 218750, "epoch": 1807} {"train_loss": -40.46738815307617, "global_step": 218751, "epoch": 1807} {"train_loss": -40.30207061767578, "global_step": 218752, "epoch": 1807} {"train_loss": -40.73809814453125, "global_step": 218753, "epoch": 1807} {"train_loss": -40.59776306152344, "global_step": 218754, "epoch": 1807} {"train_loss": -40.12378692626953, "global_step": 218755, "epoch": 1807} {"train_loss": -40.58930587768555, "global_step": 218756, "epoch": 1807} {"train_loss": -40.84126663208008, "global_step": 218757, "epoch": 1807} {"train_loss": -40.64756393432617, "global_step": 218758, "epoch": 1807} {"train_loss": -40.719642639160156, "global_step": 218759, "epoch": 1807} {"train_loss": -41.19975662231445, "global_step": 218760, "epoch": 1807} {"train_loss": -40.91714096069336, "global_step": 218761, "epoch": 1807} {"train_loss": -40.84354782104492, "global_step": 218762, "epoch": 1807} {"train_loss": -41.16050338745117, "global_step": 218763, "epoch": 1807} {"train_loss": -41.272212982177734, "global_step": 218764, "epoch": 1807} {"train_loss": -40.98322677612305, "global_step": 218765, "epoch": 1807} {"train_loss": -41.22294235229492, "global_step": 218766, "epoch": 1807} {"train_loss": -39.35506123944747, "global_step": 218767, "epoch": 1807, "val_loss": 2533632.0} {"train_loss": -41.69667434692383, "global_step": 218768, "epoch": 1808} {"train_loss": -40.98103713989258, "global_step": 218769, "epoch": 1808} {"train_loss": -41.485870361328125, "global_step": 218770, "epoch": 1808} {"train_loss": -41.7650260925293, "global_step": 218771, "epoch": 1808} {"train_loss": -41.304134368896484, "global_step": 218772, "epoch": 1808} {"train_loss": -41.769901275634766, "global_step": 218773, "epoch": 1808} {"train_loss": -41.6625862121582, "global_step": 218774, "epoch": 1808} {"train_loss": -41.52519607543945, "global_step": 218775, "epoch": 1808} {"train_loss": -41.91584396362305, "global_step": 218776, "epoch": 1808} {"train_loss": -41.71699523925781, "global_step": 218777, "epoch": 1808} {"train_loss": -41.92245101928711, "global_step": 218778, "epoch": 1808} {"train_loss": -42.16292953491211, "global_step": 218779, "epoch": 1808} {"train_loss": -42.036128997802734, "global_step": 218780, "epoch": 1808} {"train_loss": -41.91341781616211, "global_step": 218781, "epoch": 1808} {"train_loss": -42.317596435546875, "global_step": 218782, "epoch": 1808} {"train_loss": -41.920265197753906, "global_step": 218783, "epoch": 1808} {"train_loss": -42.140052795410156, "global_step": 218784, "epoch": 1808} {"train_loss": -42.19808578491211, "global_step": 218785, "epoch": 1808} {"train_loss": -42.04215621948242, "global_step": 218786, "epoch": 1808} {"train_loss": -42.0809440612793, "global_step": 218787, "epoch": 1808} {"train_loss": -42.251441955566406, "global_step": 218788, "epoch": 1808} {"train_loss": -41.78961181640625, "global_step": 218789, "epoch": 1808} {"train_loss": -42.22880172729492, "global_step": 218790, "epoch": 1808} {"train_loss": -42.33887481689453, "global_step": 218791, "epoch": 1808} {"train_loss": -42.3036003112793, "global_step": 218792, "epoch": 1808} {"train_loss": -42.33807373046875, "global_step": 218793, "epoch": 1808} {"train_loss": -42.48016357421875, "global_step": 218794, "epoch": 1808} {"train_loss": -42.15239334106445, "global_step": 218795, "epoch": 1808} {"train_loss": -42.31473922729492, "global_step": 218796, "epoch": 1808} {"train_loss": -42.516937255859375, "global_step": 218797, "epoch": 1808} {"train_loss": -42.32711410522461, "global_step": 218798, "epoch": 1808} {"train_loss": -42.819374084472656, "global_step": 218799, "epoch": 1808} {"train_loss": -42.49055862426758, "global_step": 218800, "epoch": 1808} {"train_loss": -42.60152053833008, "global_step": 218801, "epoch": 1808} {"train_loss": -42.52481460571289, "global_step": 218802, "epoch": 1808} {"train_loss": -42.63875961303711, "global_step": 218803, "epoch": 1808} {"train_loss": -42.4422492980957, "global_step": 218804, "epoch": 1808} {"train_loss": -42.63452911376953, "global_step": 218805, "epoch": 1808} {"train_loss": -42.72469711303711, "global_step": 218806, "epoch": 1808} {"train_loss": -42.505348205566406, "global_step": 218807, "epoch": 1808} {"train_loss": -42.47710037231445, "global_step": 218808, "epoch": 1808} {"train_loss": -43.12539291381836, "global_step": 218809, "epoch": 1808} {"train_loss": -42.203399658203125, "global_step": 218810, "epoch": 1808} {"train_loss": -42.738468170166016, "global_step": 218811, "epoch": 1808} {"train_loss": -42.74188232421875, "global_step": 218812, "epoch": 1808} {"train_loss": -43.01603698730469, "global_step": 218813, "epoch": 1808} {"train_loss": -42.86790084838867, "global_step": 218814, "epoch": 1808} {"train_loss": -42.4776496887207, "global_step": 218815, "epoch": 1808} {"train_loss": -42.89491653442383, "global_step": 218816, "epoch": 1808} {"train_loss": -42.90642166137695, "global_step": 218817, "epoch": 1808} {"train_loss": -42.65583419799805, "global_step": 218818, "epoch": 1808} {"train_loss": -43.02635192871094, "global_step": 218819, "epoch": 1808} {"train_loss": -43.282440185546875, "global_step": 218820, "epoch": 1808} {"train_loss": -42.6829948425293, "global_step": 218821, "epoch": 1808} {"train_loss": -43.1800422668457, "global_step": 218822, "epoch": 1808} {"train_loss": -42.86578369140625, "global_step": 218823, "epoch": 1808} {"train_loss": -43.18560028076172, "global_step": 218824, "epoch": 1808} {"train_loss": -43.19120407104492, "global_step": 218825, "epoch": 1808} {"train_loss": -42.792999267578125, "global_step": 218826, "epoch": 1808} {"train_loss": -42.91374588012695, "global_step": 218827, "epoch": 1808} {"train_loss": -43.28545379638672, "global_step": 218828, "epoch": 1808} {"train_loss": -42.82807159423828, "global_step": 218829, "epoch": 1808} {"train_loss": -43.20963668823242, "global_step": 218830, "epoch": 1808} {"train_loss": -43.144412994384766, "global_step": 218831, "epoch": 1808} {"train_loss": -43.04179763793945, "global_step": 218832, "epoch": 1808} {"train_loss": -43.385292053222656, "global_step": 218833, "epoch": 1808} {"train_loss": -43.50674057006836, "global_step": 218834, "epoch": 1808} {"train_loss": -42.95927047729492, "global_step": 218835, "epoch": 1808} {"train_loss": -43.411773681640625, "global_step": 218836, "epoch": 1808} {"train_loss": -43.03506088256836, "global_step": 218837, "epoch": 1808} {"train_loss": -43.543514251708984, "global_step": 218838, "epoch": 1808} {"train_loss": -43.3211669921875, "global_step": 218839, "epoch": 1808} {"train_loss": -43.45136260986328, "global_step": 218840, "epoch": 1808} {"train_loss": -43.038055419921875, "global_step": 218841, "epoch": 1808} {"train_loss": -43.279109954833984, "global_step": 218842, "epoch": 1808} {"train_loss": -42.78939437866211, "global_step": 218843, "epoch": 1808} {"train_loss": -43.34771728515625, "global_step": 218844, "epoch": 1808} {"train_loss": -42.865196228027344, "global_step": 218845, "epoch": 1808} {"train_loss": -42.914302825927734, "global_step": 218846, "epoch": 1808} {"train_loss": -43.024784088134766, "global_step": 218847, "epoch": 1808} {"train_loss": -43.05549240112305, "global_step": 218848, "epoch": 1808} {"train_loss": -43.34562301635742, "global_step": 218849, "epoch": 1808} {"train_loss": -42.12188720703125, "global_step": 218850, "epoch": 1808} {"train_loss": -42.88612747192383, "global_step": 218851, "epoch": 1808} {"train_loss": -43.7586555480957, "global_step": 218852, "epoch": 1808} {"train_loss": -43.00794219970703, "global_step": 218853, "epoch": 1808} {"train_loss": -42.9337272644043, "global_step": 218854, "epoch": 1808} {"train_loss": -43.236263275146484, "global_step": 218855, "epoch": 1808} {"train_loss": -42.45051193237305, "global_step": 218856, "epoch": 1808} {"train_loss": -42.98220443725586, "global_step": 218857, "epoch": 1808} {"train_loss": -42.960201263427734, "global_step": 218858, "epoch": 1808} {"train_loss": -42.5863151550293, "global_step": 218859, "epoch": 1808} {"train_loss": -42.08686447143555, "global_step": 218860, "epoch": 1808} {"train_loss": -42.734928131103516, "global_step": 218861, "epoch": 1808} {"train_loss": -42.2932014465332, "global_step": 218862, "epoch": 1808} {"train_loss": -42.01844024658203, "global_step": 218863, "epoch": 1808} {"train_loss": -41.52392578125, "global_step": 218864, "epoch": 1808} {"train_loss": -40.051361083984375, "global_step": 218865, "epoch": 1808} {"train_loss": -41.49592590332031, "global_step": 218866, "epoch": 1808} {"train_loss": -42.8409309387207, "global_step": 218867, "epoch": 1808} {"train_loss": -41.53495788574219, "global_step": 218868, "epoch": 1808} {"train_loss": -39.68648147583008, "global_step": 218869, "epoch": 1808} {"train_loss": -39.139556884765625, "global_step": 218870, "epoch": 1808} {"train_loss": -40.85505294799805, "global_step": 218871, "epoch": 1808} {"train_loss": -41.5064582824707, "global_step": 218872, "epoch": 1808} {"train_loss": -41.27244186401367, "global_step": 218873, "epoch": 1808} {"train_loss": -40.268428802490234, "global_step": 218874, "epoch": 1808} {"train_loss": -41.36682891845703, "global_step": 218875, "epoch": 1808} {"train_loss": -41.4855842590332, "global_step": 218876, "epoch": 1808} {"train_loss": -40.66259765625, "global_step": 218877, "epoch": 1808} {"train_loss": -42.02225112915039, "global_step": 218878, "epoch": 1808} {"train_loss": -41.35531234741211, "global_step": 218879, "epoch": 1808} {"train_loss": -42.0322265625, "global_step": 218880, "epoch": 1808} {"train_loss": -40.19157028198242, "global_step": 218881, "epoch": 1808} {"train_loss": -42.04494857788086, "global_step": 218882, "epoch": 1808} {"train_loss": -41.77523422241211, "global_step": 218883, "epoch": 1808} {"train_loss": -41.17129135131836, "global_step": 218884, "epoch": 1808} {"train_loss": -41.2513542175293, "global_step": 218885, "epoch": 1808} {"train_loss": -41.770320892333984, "global_step": 218886, "epoch": 1808} {"train_loss": -41.504756927490234, "global_step": 218887, "epoch": 1808} {"train_loss": -42.31168261441317, "global_step": 218888, "epoch": 1808, "val_loss": 2528016.0} {"train_loss": -41.994178771972656, "global_step": 218889, "epoch": 1809} {"train_loss": -42.822845458984375, "global_step": 218890, "epoch": 1809} {"train_loss": -42.029449462890625, "global_step": 218891, "epoch": 1809} {"train_loss": -42.46476364135742, "global_step": 218892, "epoch": 1809} {"train_loss": -42.45839309692383, "global_step": 218893, "epoch": 1809} {"train_loss": -42.64554977416992, "global_step": 218894, "epoch": 1809} {"train_loss": -42.00712203979492, "global_step": 218895, "epoch": 1809} {"train_loss": -43.052913665771484, "global_step": 218896, "epoch": 1809} {"train_loss": -42.633419036865234, "global_step": 218897, "epoch": 1809} {"train_loss": -42.38947677612305, "global_step": 218898, "epoch": 1809} {"train_loss": -42.60854721069336, "global_step": 218899, "epoch": 1809} {"train_loss": -42.685020446777344, "global_step": 218900, "epoch": 1809} {"train_loss": -42.502967834472656, "global_step": 218901, "epoch": 1809} {"train_loss": -41.77777099609375, "global_step": 218902, "epoch": 1809} {"train_loss": -42.16358947753906, "global_step": 218903, "epoch": 1809} {"train_loss": -42.94624328613281, "global_step": 218904, "epoch": 1809} {"train_loss": -42.943458557128906, "global_step": 218905, "epoch": 1809} {"train_loss": -42.74912643432617, "global_step": 218906, "epoch": 1809} {"train_loss": -43.095733642578125, "global_step": 218907, "epoch": 1809} {"train_loss": -42.64421463012695, "global_step": 218908, "epoch": 1809} {"train_loss": -42.467071533203125, "global_step": 218909, "epoch": 1809} {"train_loss": -42.981624603271484, "global_step": 218910, "epoch": 1809} {"train_loss": -42.69084548950195, "global_step": 218911, "epoch": 1809} {"train_loss": -42.39323043823242, "global_step": 218912, "epoch": 1809} {"train_loss": -42.1567497253418, "global_step": 218913, "epoch": 1809} {"train_loss": -41.65784454345703, "global_step": 218914, "epoch": 1809} {"train_loss": -42.26392364501953, "global_step": 218915, "epoch": 1809} {"train_loss": -41.41340255737305, "global_step": 218916, "epoch": 1809} {"train_loss": -41.783058166503906, "global_step": 218917, "epoch": 1809} {"train_loss": -42.058250427246094, "global_step": 218918, "epoch": 1809} {"train_loss": -41.9499397277832, "global_step": 218919, "epoch": 1809} {"train_loss": -42.9504508972168, "global_step": 218920, "epoch": 1809} {"train_loss": -41.520816802978516, "global_step": 218921, "epoch": 1809} {"train_loss": -40.824947357177734, "global_step": 218922, "epoch": 1809} {"train_loss": -42.84028244018555, "global_step": 218923, "epoch": 1809} {"train_loss": -42.63169479370117, "global_step": 218924, "epoch": 1809} {"train_loss": -41.72694778442383, "global_step": 218925, "epoch": 1809} {"train_loss": -42.337547302246094, "global_step": 218926, "epoch": 1809} {"train_loss": -42.58335494995117, "global_step": 218927, "epoch": 1809} {"train_loss": -42.92165756225586, "global_step": 218928, "epoch": 1809} {"train_loss": -42.1129035949707, "global_step": 218929, "epoch": 1809} {"train_loss": -41.866268157958984, "global_step": 218930, "epoch": 1809} {"train_loss": -42.87807083129883, "global_step": 218931, "epoch": 1809} {"train_loss": -42.51312255859375, "global_step": 218932, "epoch": 1809} {"train_loss": -42.558876037597656, "global_step": 218933, "epoch": 1809} {"train_loss": -42.809539794921875, "global_step": 218934, "epoch": 1809} {"train_loss": -43.11529541015625, "global_step": 218935, "epoch": 1809} {"train_loss": -43.36063766479492, "global_step": 218936, "epoch": 1809} {"train_loss": -42.96395492553711, "global_step": 218937, "epoch": 1809} {"train_loss": -43.27957534790039, "global_step": 218938, "epoch": 1809} {"train_loss": -43.093379974365234, "global_step": 218939, "epoch": 1809} {"train_loss": -43.37801742553711, "global_step": 218940, "epoch": 1809} {"train_loss": -42.74466323852539, "global_step": 218941, "epoch": 1809} {"train_loss": -43.22713851928711, "global_step": 218942, "epoch": 1809} {"train_loss": -43.47382736206055, "global_step": 218943, "epoch": 1809} {"train_loss": -43.06885528564453, "global_step": 218944, "epoch": 1809} {"train_loss": -42.46097946166992, "global_step": 218945, "epoch": 1809} {"train_loss": -42.54465866088867, "global_step": 218946, "epoch": 1809} {"train_loss": -42.32698440551758, "global_step": 218947, "epoch": 1809} {"train_loss": -42.736358642578125, "global_step": 218948, "epoch": 1809} {"train_loss": -41.8889274597168, "global_step": 218949, "epoch": 1809} {"train_loss": -41.657325744628906, "global_step": 218950, "epoch": 1809} {"train_loss": -42.34006881713867, "global_step": 218951, "epoch": 1809} {"train_loss": -42.0057258605957, "global_step": 218952, "epoch": 1809} {"train_loss": -42.63546371459961, "global_step": 218953, "epoch": 1809} {"train_loss": -42.18118667602539, "global_step": 218954, "epoch": 1809} {"train_loss": -42.99520492553711, "global_step": 218955, "epoch": 1809} {"train_loss": -41.53974151611328, "global_step": 218956, "epoch": 1809} {"train_loss": -41.061073303222656, "global_step": 218957, "epoch": 1809} {"train_loss": -42.021461486816406, "global_step": 218958, "epoch": 1809} {"train_loss": -42.656063079833984, "global_step": 218959, "epoch": 1809} {"train_loss": -41.46928405761719, "global_step": 218960, "epoch": 1809} {"train_loss": -40.47951126098633, "global_step": 218961, "epoch": 1809} {"train_loss": -41.63618469238281, "global_step": 218962, "epoch": 1809} {"train_loss": -41.261966705322266, "global_step": 218963, "epoch": 1809} {"train_loss": -40.51792526245117, "global_step": 218964, "epoch": 1809} {"train_loss": -40.52296447753906, "global_step": 218965, "epoch": 1809} {"train_loss": -42.05302429199219, "global_step": 218966, "epoch": 1809} {"train_loss": -42.54453659057617, "global_step": 218967, "epoch": 1809} {"train_loss": -40.35992431640625, "global_step": 218968, "epoch": 1809} {"train_loss": -39.92207336425781, "global_step": 218969, "epoch": 1809} {"train_loss": -40.64734649658203, "global_step": 218970, "epoch": 1809} {"train_loss": -39.119850158691406, "global_step": 218971, "epoch": 1809} {"train_loss": -41.00443649291992, "global_step": 218972, "epoch": 1809} {"train_loss": -42.370849609375, "global_step": 218973, "epoch": 1809} {"train_loss": -41.35413360595703, "global_step": 218974, "epoch": 1809} {"train_loss": -41.76015853881836, "global_step": 218975, "epoch": 1809} {"train_loss": -42.03261184692383, "global_step": 218976, "epoch": 1809} {"train_loss": -42.04854202270508, "global_step": 218977, "epoch": 1809} {"train_loss": -40.74180221557617, "global_step": 218978, "epoch": 1809} {"train_loss": -38.23761749267578, "global_step": 218979, "epoch": 1809} {"train_loss": -37.081275939941406, "global_step": 218980, "epoch": 1809} {"train_loss": -36.80448913574219, "global_step": 218981, "epoch": 1809} {"train_loss": -40.28117752075195, "global_step": 218982, "epoch": 1809} {"train_loss": -40.630496978759766, "global_step": 218983, "epoch": 1809} {"train_loss": -38.0941162109375, "global_step": 218984, "epoch": 1809} {"train_loss": -39.36956787109375, "global_step": 218985, "epoch": 1809} {"train_loss": -42.34754180908203, "global_step": 218986, "epoch": 1809} {"train_loss": -36.77562713623047, "global_step": 218987, "epoch": 1809} {"train_loss": -38.55331039428711, "global_step": 218988, "epoch": 1809} {"train_loss": -41.83952713012695, "global_step": 218989, "epoch": 1809} {"train_loss": -39.9509391784668, "global_step": 218990, "epoch": 1809} {"train_loss": -40.010704040527344, "global_step": 218991, "epoch": 1809} {"train_loss": -41.393306732177734, "global_step": 218992, "epoch": 1809} {"train_loss": -40.184486389160156, "global_step": 218993, "epoch": 1809} {"train_loss": -41.279823303222656, "global_step": 218994, "epoch": 1809} {"train_loss": -41.74057388305664, "global_step": 218995, "epoch": 1809} {"train_loss": -38.83677291870117, "global_step": 218996, "epoch": 1809} {"train_loss": -41.27299880981445, "global_step": 218997, "epoch": 1809} {"train_loss": -40.784584045410156, "global_step": 218998, "epoch": 1809} {"train_loss": -39.887428283691406, "global_step": 218999, "epoch": 1809} {"train_loss": -41.25248718261719, "global_step": 219000, "epoch": 1809} {"train_loss": -41.37109375, "global_step": 219001, "epoch": 1809} {"train_loss": -42.14815902709961, "global_step": 219002, "epoch": 1809} {"train_loss": -41.04136276245117, "global_step": 219003, "epoch": 1809} {"train_loss": -41.30036544799805, "global_step": 219004, "epoch": 1809} {"train_loss": -41.86088562011719, "global_step": 219005, "epoch": 1809} {"train_loss": -42.29877853393555, "global_step": 219006, "epoch": 1809} {"train_loss": -42.059226989746094, "global_step": 219007, "epoch": 1809} {"train_loss": -41.925758361816406, "global_step": 219008, "epoch": 1809} {"train_loss": -41.72376679980065, "global_step": 219009, "epoch": 1809, "val_loss": 2541588.0} {"train_loss": -42.23094177246094, "global_step": 219010, "epoch": 1810} {"train_loss": -42.026912689208984, "global_step": 219011, "epoch": 1810} {"train_loss": -41.709877014160156, "global_step": 219012, "epoch": 1810} {"train_loss": -42.3958854675293, "global_step": 219013, "epoch": 1810} {"train_loss": -42.72629165649414, "global_step": 219014, "epoch": 1810} {"train_loss": -42.74338912963867, "global_step": 219015, "epoch": 1810} {"train_loss": -42.746864318847656, "global_step": 219016, "epoch": 1810} {"train_loss": -42.96406555175781, "global_step": 219017, "epoch": 1810} {"train_loss": -43.13691329956055, "global_step": 219018, "epoch": 1810} {"train_loss": -42.817501068115234, "global_step": 219019, "epoch": 1810} {"train_loss": -42.86631774902344, "global_step": 219020, "epoch": 1810} {"train_loss": -43.115596771240234, "global_step": 219021, "epoch": 1810} {"train_loss": -42.79385757446289, "global_step": 219022, "epoch": 1810} {"train_loss": -42.92109680175781, "global_step": 219023, "epoch": 1810} {"train_loss": -42.52934265136719, "global_step": 219024, "epoch": 1810} {"train_loss": -43.18880081176758, "global_step": 219025, "epoch": 1810} {"train_loss": -42.35505294799805, "global_step": 219026, "epoch": 1810} {"train_loss": -42.890777587890625, "global_step": 219027, "epoch": 1810} {"train_loss": -42.98169708251953, "global_step": 219028, "epoch": 1810} {"train_loss": -42.67647933959961, "global_step": 219029, "epoch": 1810} {"train_loss": -42.96992874145508, "global_step": 219030, "epoch": 1810} {"train_loss": -43.01605987548828, "global_step": 219031, "epoch": 1810} {"train_loss": -43.515506744384766, "global_step": 219032, "epoch": 1810} {"train_loss": -43.0986328125, "global_step": 219033, "epoch": 1810} {"train_loss": -43.44861602783203, "global_step": 219034, "epoch": 1810} {"train_loss": -43.373844146728516, "global_step": 219035, "epoch": 1810} {"train_loss": -42.972164154052734, "global_step": 219036, "epoch": 1810} {"train_loss": -43.09684371948242, "global_step": 219037, "epoch": 1810} {"train_loss": -43.76179122924805, "global_step": 219038, "epoch": 1810} {"train_loss": -43.781978607177734, "global_step": 219039, "epoch": 1810} {"train_loss": -43.34890365600586, "global_step": 219040, "epoch": 1810} {"train_loss": -42.99958038330078, "global_step": 219041, "epoch": 1810} {"train_loss": -43.30284118652344, "global_step": 219042, "epoch": 1810} {"train_loss": -43.045257568359375, "global_step": 219043, "epoch": 1810} {"train_loss": -43.33110427856445, "global_step": 219044, "epoch": 1810} {"train_loss": -42.573089599609375, "global_step": 219045, "epoch": 1810} {"train_loss": -43.083168029785156, "global_step": 219046, "epoch": 1810} {"train_loss": -42.81344223022461, "global_step": 219047, "epoch": 1810} {"train_loss": -42.495967864990234, "global_step": 219048, "epoch": 1810} {"train_loss": -42.808040618896484, "global_step": 219049, "epoch": 1810} {"train_loss": -42.457515716552734, "global_step": 219050, "epoch": 1810} {"train_loss": -42.60757064819336, "global_step": 219051, "epoch": 1810} {"train_loss": -43.470237731933594, "global_step": 219052, "epoch": 1810} {"train_loss": -42.889400482177734, "global_step": 219053, "epoch": 1810} {"train_loss": -42.7033576965332, "global_step": 219054, "epoch": 1810} {"train_loss": -40.521278381347656, "global_step": 219055, "epoch": 1810} {"train_loss": -42.60830307006836, "global_step": 219056, "epoch": 1810} {"train_loss": -42.70777130126953, "global_step": 219057, "epoch": 1810} {"train_loss": -43.37763214111328, "global_step": 219058, "epoch": 1810} {"train_loss": -42.747493743896484, "global_step": 219059, "epoch": 1810} {"train_loss": -42.64048385620117, "global_step": 219060, "epoch": 1810} {"train_loss": -41.3266716003418, "global_step": 219061, "epoch": 1810} {"train_loss": -42.60811233520508, "global_step": 219062, "epoch": 1810} {"train_loss": -41.60352325439453, "global_step": 219063, "epoch": 1810} {"train_loss": -42.80084228515625, "global_step": 219064, "epoch": 1810} {"train_loss": -42.30521774291992, "global_step": 219065, "epoch": 1810} {"train_loss": -42.4985466003418, "global_step": 219066, "epoch": 1810} {"train_loss": -43.11542510986328, "global_step": 219067, "epoch": 1810} {"train_loss": -38.75606918334961, "global_step": 219068, "epoch": 1810} {"train_loss": -42.28934860229492, "global_step": 219069, "epoch": 1810} {"train_loss": -41.40118408203125, "global_step": 219070, "epoch": 1810} {"train_loss": -43.01130294799805, "global_step": 219071, "epoch": 1810} {"train_loss": -41.99911117553711, "global_step": 219072, "epoch": 1810} {"train_loss": -35.586544036865234, "global_step": 219073, "epoch": 1810} {"train_loss": -34.292579650878906, "global_step": 219074, "epoch": 1810} {"train_loss": -37.283565521240234, "global_step": 219075, "epoch": 1810} {"train_loss": -40.172542572021484, "global_step": 219076, "epoch": 1810} {"train_loss": -40.35665512084961, "global_step": 219077, "epoch": 1810} {"train_loss": -37.95158004760742, "global_step": 219078, "epoch": 1810} {"train_loss": -41.08079147338867, "global_step": 219079, "epoch": 1810} {"train_loss": -38.95404815673828, "global_step": 219080, "epoch": 1810} {"train_loss": -39.793880462646484, "global_step": 219081, "epoch": 1810} {"train_loss": -38.47050857543945, "global_step": 219082, "epoch": 1810} {"train_loss": -38.78351593017578, "global_step": 219083, "epoch": 1810} {"train_loss": -40.83748245239258, "global_step": 219084, "epoch": 1810} {"train_loss": -41.05567169189453, "global_step": 219085, "epoch": 1810} {"train_loss": -40.68678283691406, "global_step": 219086, "epoch": 1810} {"train_loss": -40.69382858276367, "global_step": 219087, "epoch": 1810} {"train_loss": -41.31431198120117, "global_step": 219088, "epoch": 1810} {"train_loss": -41.34569549560547, "global_step": 219089, "epoch": 1810} {"train_loss": -39.8213996887207, "global_step": 219090, "epoch": 1810} {"train_loss": -41.44350051879883, "global_step": 219091, "epoch": 1810} {"train_loss": -41.919342041015625, "global_step": 219092, "epoch": 1810} {"train_loss": -41.40056228637695, "global_step": 219093, "epoch": 1810} {"train_loss": -39.9810791015625, "global_step": 219094, "epoch": 1810} {"train_loss": -41.52409362792969, "global_step": 219095, "epoch": 1810} {"train_loss": -42.18952941894531, "global_step": 219096, "epoch": 1810} {"train_loss": -41.983612060546875, "global_step": 219097, "epoch": 1810} {"train_loss": -41.526973724365234, "global_step": 219098, "epoch": 1810} {"train_loss": -38.745540618896484, "global_step": 219099, "epoch": 1810} {"train_loss": -41.52814483642578, "global_step": 219100, "epoch": 1810} {"train_loss": -39.406551361083984, "global_step": 219101, "epoch": 1810} {"train_loss": -40.81412887573242, "global_step": 219102, "epoch": 1810} {"train_loss": -41.59810256958008, "global_step": 219103, "epoch": 1810} {"train_loss": -41.515960693359375, "global_step": 219104, "epoch": 1810} {"train_loss": -38.50094223022461, "global_step": 219105, "epoch": 1810} {"train_loss": -40.636634826660156, "global_step": 219106, "epoch": 1810} {"train_loss": -39.76531219482422, "global_step": 219107, "epoch": 1810} {"train_loss": -41.41815185546875, "global_step": 219108, "epoch": 1810} {"train_loss": -41.521148681640625, "global_step": 219109, "epoch": 1810} {"train_loss": -39.06510543823242, "global_step": 219110, "epoch": 1810} {"train_loss": -40.66382598876953, "global_step": 219111, "epoch": 1810} {"train_loss": -42.14542770385742, "global_step": 219112, "epoch": 1810} {"train_loss": -40.6647834777832, "global_step": 219113, "epoch": 1810} {"train_loss": -38.379844665527344, "global_step": 219114, "epoch": 1810} {"train_loss": -41.19807815551758, "global_step": 219115, "epoch": 1810} {"train_loss": -38.258514404296875, "global_step": 219116, "epoch": 1810} {"train_loss": -41.59341812133789, "global_step": 219117, "epoch": 1810} {"train_loss": -40.078773498535156, "global_step": 219118, "epoch": 1810} {"train_loss": -41.06987380981445, "global_step": 219119, "epoch": 1810} {"train_loss": -40.79533767700195, "global_step": 219120, "epoch": 1810} {"train_loss": -40.85590362548828, "global_step": 219121, "epoch": 1810} {"train_loss": -40.25809860229492, "global_step": 219122, "epoch": 1810} {"train_loss": -40.24052810668945, "global_step": 219123, "epoch": 1810} {"train_loss": -39.774505615234375, "global_step": 219124, "epoch": 1810} {"train_loss": -41.93251037597656, "global_step": 219125, "epoch": 1810} {"train_loss": -40.21369171142578, "global_step": 219126, "epoch": 1810} {"train_loss": -41.84559631347656, "global_step": 219127, "epoch": 1810} {"train_loss": -41.798458099365234, "global_step": 219128, "epoch": 1810} {"train_loss": -42.40092849731445, "global_step": 219129, "epoch": 1810} {"train_loss": -41.57069110082201, "global_step": 219130, "epoch": 1810, "val_loss": 2443994.25} {"train_loss": -40.97362518310547, "global_step": 219131, "epoch": 1811} {"train_loss": -38.892784118652344, "global_step": 219132, "epoch": 1811} {"train_loss": -41.307350158691406, "global_step": 219133, "epoch": 1811} {"train_loss": -41.30355453491211, "global_step": 219134, "epoch": 1811} {"train_loss": -40.895240783691406, "global_step": 219135, "epoch": 1811} {"train_loss": -41.2133674621582, "global_step": 219136, "epoch": 1811} {"train_loss": -42.514366149902344, "global_step": 219137, "epoch": 1811} {"train_loss": -40.369510650634766, "global_step": 219138, "epoch": 1811} {"train_loss": -42.132259368896484, "global_step": 219139, "epoch": 1811} {"train_loss": -40.7535514831543, "global_step": 219140, "epoch": 1811} {"train_loss": -41.3787956237793, "global_step": 219141, "epoch": 1811} {"train_loss": -40.7192497253418, "global_step": 219142, "epoch": 1811} {"train_loss": -40.90617752075195, "global_step": 219143, "epoch": 1811} {"train_loss": -40.498409271240234, "global_step": 219144, "epoch": 1811} {"train_loss": -41.48991394042969, "global_step": 219145, "epoch": 1811} {"train_loss": -40.51777267456055, "global_step": 219146, "epoch": 1811} {"train_loss": -40.5822639465332, "global_step": 219147, "epoch": 1811} {"train_loss": -41.59332275390625, "global_step": 219148, "epoch": 1811} {"train_loss": -41.65079879760742, "global_step": 219149, "epoch": 1811} {"train_loss": -41.60285568237305, "global_step": 219150, "epoch": 1811} {"train_loss": -42.36503219604492, "global_step": 219151, "epoch": 1811} {"train_loss": -41.407649993896484, "global_step": 219152, "epoch": 1811} {"train_loss": -40.991580963134766, "global_step": 219153, "epoch": 1811} {"train_loss": -41.43083953857422, "global_step": 219154, "epoch": 1811} {"train_loss": -40.94314193725586, "global_step": 219155, "epoch": 1811} {"train_loss": -41.45081329345703, "global_step": 219156, "epoch": 1811} {"train_loss": -41.324520111083984, "global_step": 219157, "epoch": 1811} {"train_loss": -41.511661529541016, "global_step": 219158, "epoch": 1811} {"train_loss": -42.24233627319336, "global_step": 219159, "epoch": 1811} {"train_loss": -40.65120315551758, "global_step": 219160, "epoch": 1811} {"train_loss": -41.80950927734375, "global_step": 219161, "epoch": 1811} {"train_loss": -41.28346633911133, "global_step": 219162, "epoch": 1811} {"train_loss": -35.261775970458984, "global_step": 219163, "epoch": 1811} {"train_loss": -41.09973907470703, "global_step": 219164, "epoch": 1811} {"train_loss": -39.59437942504883, "global_step": 219165, "epoch": 1811} {"train_loss": -37.73151779174805, "global_step": 219166, "epoch": 1811} {"train_loss": -42.08485794067383, "global_step": 219167, "epoch": 1811} {"train_loss": -40.57849884033203, "global_step": 219168, "epoch": 1811} {"train_loss": -38.81610107421875, "global_step": 219169, "epoch": 1811} {"train_loss": -41.56081008911133, "global_step": 219170, "epoch": 1811} {"train_loss": -37.17473220825195, "global_step": 219171, "epoch": 1811} {"train_loss": -41.049922943115234, "global_step": 219172, "epoch": 1811} {"train_loss": -35.341552734375, "global_step": 219173, "epoch": 1811} {"train_loss": -38.43854522705078, "global_step": 219174, "epoch": 1811} {"train_loss": -41.34444808959961, "global_step": 219175, "epoch": 1811} {"train_loss": -41.6460075378418, "global_step": 219176, "epoch": 1811} {"train_loss": -40.370201110839844, "global_step": 219177, "epoch": 1811} {"train_loss": -23.96768569946289, "global_step": 219178, "epoch": 1811} {"train_loss": -35.09120559692383, "global_step": 219179, "epoch": 1811} {"train_loss": -40.8201904296875, "global_step": 219180, "epoch": 1811} {"train_loss": -34.65425491333008, "global_step": 219181, "epoch": 1811} {"train_loss": -37.895851135253906, "global_step": 219182, "epoch": 1811} {"train_loss": -40.62281036376953, "global_step": 219183, "epoch": 1811} {"train_loss": -41.319915771484375, "global_step": 219184, "epoch": 1811} {"train_loss": -38.726253509521484, "global_step": 219185, "epoch": 1811} {"train_loss": -41.04947280883789, "global_step": 219186, "epoch": 1811} {"train_loss": -39.48173522949219, "global_step": 219187, "epoch": 1811} {"train_loss": -37.92159652709961, "global_step": 219188, "epoch": 1811} {"train_loss": -38.32474899291992, "global_step": 219189, "epoch": 1811} {"train_loss": -37.341854095458984, "global_step": 219190, "epoch": 1811} {"train_loss": -40.9085578918457, "global_step": 219191, "epoch": 1811} {"train_loss": -41.01263427734375, "global_step": 219192, "epoch": 1811} {"train_loss": -38.03574752807617, "global_step": 219193, "epoch": 1811} {"train_loss": -39.704654693603516, "global_step": 219194, "epoch": 1811} {"train_loss": -38.0267333984375, "global_step": 219195, "epoch": 1811} {"train_loss": -39.30036544799805, "global_step": 219196, "epoch": 1811} {"train_loss": -39.46371078491211, "global_step": 219197, "epoch": 1811} {"train_loss": -37.81941604614258, "global_step": 219198, "epoch": 1811} {"train_loss": -37.3983268737793, "global_step": 219199, "epoch": 1811} {"train_loss": -40.27075958251953, "global_step": 219200, "epoch": 1811} {"train_loss": -38.06934356689453, "global_step": 219201, "epoch": 1811} {"train_loss": -41.16564178466797, "global_step": 219202, "epoch": 1811} {"train_loss": -40.03013229370117, "global_step": 219203, "epoch": 1811} {"train_loss": -38.71834182739258, "global_step": 219204, "epoch": 1811} {"train_loss": -40.660518646240234, "global_step": 219205, "epoch": 1811} {"train_loss": -39.74641036987305, "global_step": 219206, "epoch": 1811} {"train_loss": -37.49916458129883, "global_step": 219207, "epoch": 1811} {"train_loss": -39.599098205566406, "global_step": 219208, "epoch": 1811} {"train_loss": -41.293853759765625, "global_step": 219209, "epoch": 1811} {"train_loss": -38.179439544677734, "global_step": 219210, "epoch": 1811} {"train_loss": -40.23933029174805, "global_step": 219211, "epoch": 1811} {"train_loss": -39.21147537231445, "global_step": 219212, "epoch": 1811} {"train_loss": -38.65329360961914, "global_step": 219213, "epoch": 1811} {"train_loss": -40.32586669921875, "global_step": 219214, "epoch": 1811} {"train_loss": -40.1427001953125, "global_step": 219215, "epoch": 1811} {"train_loss": -37.93727111816406, "global_step": 219216, "epoch": 1811} {"train_loss": -40.09202194213867, "global_step": 219217, "epoch": 1811} {"train_loss": -41.15260696411133, "global_step": 219218, "epoch": 1811} {"train_loss": -39.94086456298828, "global_step": 219219, "epoch": 1811} {"train_loss": -40.132259368896484, "global_step": 219220, "epoch": 1811} {"train_loss": -40.973960876464844, "global_step": 219221, "epoch": 1811} {"train_loss": -40.1739616394043, "global_step": 219222, "epoch": 1811} {"train_loss": -40.33013916015625, "global_step": 219223, "epoch": 1811} {"train_loss": -40.75457763671875, "global_step": 219224, "epoch": 1811} {"train_loss": -41.07683181762695, "global_step": 219225, "epoch": 1811} {"train_loss": -40.91910934448242, "global_step": 219226, "epoch": 1811} {"train_loss": -40.96692657470703, "global_step": 219227, "epoch": 1811} {"train_loss": -40.6309814453125, "global_step": 219228, "epoch": 1811} {"train_loss": -39.10615921020508, "global_step": 219229, "epoch": 1811} {"train_loss": -40.62618637084961, "global_step": 219230, "epoch": 1811} {"train_loss": -40.72417449951172, "global_step": 219231, "epoch": 1811} {"train_loss": -41.339412689208984, "global_step": 219232, "epoch": 1811} {"train_loss": -41.35892868041992, "global_step": 219233, "epoch": 1811} {"train_loss": -41.17418670654297, "global_step": 219234, "epoch": 1811} {"train_loss": -41.60215759277344, "global_step": 219235, "epoch": 1811} {"train_loss": -40.20454025268555, "global_step": 219236, "epoch": 1811} {"train_loss": -41.973487854003906, "global_step": 219237, "epoch": 1811} {"train_loss": -41.95246505737305, "global_step": 219238, "epoch": 1811} {"train_loss": -41.55388641357422, "global_step": 219239, "epoch": 1811} {"train_loss": -40.67850875854492, "global_step": 219240, "epoch": 1811} {"train_loss": -41.207183837890625, "global_step": 219241, "epoch": 1811} {"train_loss": -41.21904754638672, "global_step": 219242, "epoch": 1811} {"train_loss": -41.81937789916992, "global_step": 219243, "epoch": 1811} {"train_loss": -41.69540023803711, "global_step": 219244, "epoch": 1811} {"train_loss": -41.998504638671875, "global_step": 219245, "epoch": 1811} {"train_loss": -42.10396957397461, "global_step": 219246, "epoch": 1811} {"train_loss": -41.4152946472168, "global_step": 219247, "epoch": 1811} {"train_loss": -41.610897064208984, "global_step": 219248, "epoch": 1811} {"train_loss": -41.9868049621582, "global_step": 219249, "epoch": 1811} {"train_loss": -41.11371994018555, "global_step": 219250, "epoch": 1811} {"train_loss": -40.157556707208805, "global_step": 219251, "epoch": 1811, "val_loss": 2505139.5} {"train_loss": -41.59193801879883, "global_step": 219252, "epoch": 1812} {"train_loss": -41.97084426879883, "global_step": 219253, "epoch": 1812} {"train_loss": -42.78436279296875, "global_step": 219254, "epoch": 1812} {"train_loss": -41.35823440551758, "global_step": 219255, "epoch": 1812} {"train_loss": -41.82516098022461, "global_step": 219256, "epoch": 1812} {"train_loss": -41.38167953491211, "global_step": 219257, "epoch": 1812} {"train_loss": -42.44181442260742, "global_step": 219258, "epoch": 1812} {"train_loss": -41.953670501708984, "global_step": 219259, "epoch": 1812} {"train_loss": -42.17501449584961, "global_step": 219260, "epoch": 1812} {"train_loss": -41.667564392089844, "global_step": 219261, "epoch": 1812} {"train_loss": -41.50078201293945, "global_step": 219262, "epoch": 1812} {"train_loss": -42.578975677490234, "global_step": 219263, "epoch": 1812} {"train_loss": -42.448604583740234, "global_step": 219264, "epoch": 1812} {"train_loss": -42.70310974121094, "global_step": 219265, "epoch": 1812} {"train_loss": -42.802642822265625, "global_step": 219266, "epoch": 1812} {"train_loss": -42.07026290893555, "global_step": 219267, "epoch": 1812} {"train_loss": -41.94112777709961, "global_step": 219268, "epoch": 1812} {"train_loss": -42.35366439819336, "global_step": 219269, "epoch": 1812} {"train_loss": -42.4271125793457, "global_step": 219270, "epoch": 1812} {"train_loss": -42.216644287109375, "global_step": 219271, "epoch": 1812} {"train_loss": -42.46853256225586, "global_step": 219272, "epoch": 1812} {"train_loss": -42.513912200927734, "global_step": 219273, "epoch": 1812} {"train_loss": -41.86178207397461, "global_step": 219274, "epoch": 1812} {"train_loss": -42.91177749633789, "global_step": 219275, "epoch": 1812} {"train_loss": -41.87226104736328, "global_step": 219276, "epoch": 1812} {"train_loss": -42.064544677734375, "global_step": 219277, "epoch": 1812} {"train_loss": -42.308773040771484, "global_step": 219278, "epoch": 1812} {"train_loss": -42.62754440307617, "global_step": 219279, "epoch": 1812} {"train_loss": -42.15791320800781, "global_step": 219280, "epoch": 1812} {"train_loss": -42.193233489990234, "global_step": 219281, "epoch": 1812} {"train_loss": -42.70772171020508, "global_step": 219282, "epoch": 1812} {"train_loss": -42.74219512939453, "global_step": 219283, "epoch": 1812} {"train_loss": -42.1663932800293, "global_step": 219284, "epoch": 1812} {"train_loss": -42.431488037109375, "global_step": 219285, "epoch": 1812} {"train_loss": -42.75484085083008, "global_step": 219286, "epoch": 1812} {"train_loss": -42.27194595336914, "global_step": 219287, "epoch": 1812} {"train_loss": -42.436012268066406, "global_step": 219288, "epoch": 1812} {"train_loss": -42.50230026245117, "global_step": 219289, "epoch": 1812} {"train_loss": -40.97819137573242, "global_step": 219290, "epoch": 1812} {"train_loss": -41.587581634521484, "global_step": 219291, "epoch": 1812} {"train_loss": -40.165645599365234, "global_step": 219292, "epoch": 1812} {"train_loss": -39.874053955078125, "global_step": 219293, "epoch": 1812} {"train_loss": -41.53633499145508, "global_step": 219294, "epoch": 1812} {"train_loss": -42.14272689819336, "global_step": 219295, "epoch": 1812} {"train_loss": -40.53769302368164, "global_step": 219296, "epoch": 1812} {"train_loss": -42.4222412109375, "global_step": 219297, "epoch": 1812} {"train_loss": -40.20949935913086, "global_step": 219298, "epoch": 1812} {"train_loss": -41.34806442260742, "global_step": 219299, "epoch": 1812} {"train_loss": -42.079383850097656, "global_step": 219300, "epoch": 1812} {"train_loss": -41.33296585083008, "global_step": 219301, "epoch": 1812} {"train_loss": -42.280086517333984, "global_step": 219302, "epoch": 1812} {"train_loss": -41.65378189086914, "global_step": 219303, "epoch": 1812} {"train_loss": -41.717689514160156, "global_step": 219304, "epoch": 1812} {"train_loss": -40.86300277709961, "global_step": 219305, "epoch": 1812} {"train_loss": -41.65909194946289, "global_step": 219306, "epoch": 1812} {"train_loss": -41.26647186279297, "global_step": 219307, "epoch": 1812} {"train_loss": -41.79659652709961, "global_step": 219308, "epoch": 1812} {"train_loss": -41.75228500366211, "global_step": 219309, "epoch": 1812} {"train_loss": -42.34785842895508, "global_step": 219310, "epoch": 1812} {"train_loss": -40.68674850463867, "global_step": 219311, "epoch": 1812} {"train_loss": -41.432411193847656, "global_step": 219312, "epoch": 1812} {"train_loss": -41.58740234375, "global_step": 219313, "epoch": 1812} {"train_loss": -40.869903564453125, "global_step": 219314, "epoch": 1812} {"train_loss": -41.1254997253418, "global_step": 219315, "epoch": 1812} {"train_loss": -41.47220993041992, "global_step": 219316, "epoch": 1812} {"train_loss": -39.24247360229492, "global_step": 219317, "epoch": 1812} {"train_loss": -39.26802062988281, "global_step": 219318, "epoch": 1812} {"train_loss": -41.38613510131836, "global_step": 219319, "epoch": 1812} {"train_loss": -39.11731719970703, "global_step": 219320, "epoch": 1812} {"train_loss": -38.59734344482422, "global_step": 219321, "epoch": 1812} {"train_loss": -39.93427276611328, "global_step": 219322, "epoch": 1812} {"train_loss": -40.20884704589844, "global_step": 219323, "epoch": 1812} {"train_loss": -41.35700607299805, "global_step": 219324, "epoch": 1812} {"train_loss": -39.4357795715332, "global_step": 219325, "epoch": 1812} {"train_loss": -37.58649444580078, "global_step": 219326, "epoch": 1812} {"train_loss": -39.13373947143555, "global_step": 219327, "epoch": 1812} {"train_loss": -38.2024040222168, "global_step": 219328, "epoch": 1812} {"train_loss": -41.1383056640625, "global_step": 219329, "epoch": 1812} {"train_loss": -37.285667419433594, "global_step": 219330, "epoch": 1812} {"train_loss": -40.869083404541016, "global_step": 219331, "epoch": 1812} {"train_loss": -37.515777587890625, "global_step": 219332, "epoch": 1812} {"train_loss": -37.97196578979492, "global_step": 219333, "epoch": 1812} {"train_loss": -34.25844192504883, "global_step": 219334, "epoch": 1812} {"train_loss": -39.82645797729492, "global_step": 219335, "epoch": 1812} {"train_loss": -37.92305374145508, "global_step": 219336, "epoch": 1812} {"train_loss": -38.956295013427734, "global_step": 219337, "epoch": 1812} {"train_loss": -38.39168930053711, "global_step": 219338, "epoch": 1812} {"train_loss": -41.02447509765625, "global_step": 219339, "epoch": 1812} {"train_loss": -40.31261444091797, "global_step": 219340, "epoch": 1812} {"train_loss": -40.93069076538086, "global_step": 219341, "epoch": 1812} {"train_loss": -40.1573371887207, "global_step": 219342, "epoch": 1812} {"train_loss": -40.389251708984375, "global_step": 219343, "epoch": 1812} {"train_loss": -41.8193244934082, "global_step": 219344, "epoch": 1812} {"train_loss": -40.67573928833008, "global_step": 219345, "epoch": 1812} {"train_loss": -41.65617752075195, "global_step": 219346, "epoch": 1812} {"train_loss": -41.284629821777344, "global_step": 219347, "epoch": 1812} {"train_loss": -42.10076904296875, "global_step": 219348, "epoch": 1812} {"train_loss": -41.39447021484375, "global_step": 219349, "epoch": 1812} {"train_loss": -42.356048583984375, "global_step": 219350, "epoch": 1812} {"train_loss": -42.02579879760742, "global_step": 219351, "epoch": 1812} {"train_loss": -41.41115951538086, "global_step": 219352, "epoch": 1812} {"train_loss": -42.17307662963867, "global_step": 219353, "epoch": 1812} {"train_loss": -41.78243637084961, "global_step": 219354, "epoch": 1812} {"train_loss": -42.18031692504883, "global_step": 219355, "epoch": 1812} {"train_loss": -42.293731689453125, "global_step": 219356, "epoch": 1812} {"train_loss": -42.155025482177734, "global_step": 219357, "epoch": 1812} {"train_loss": -42.479244232177734, "global_step": 219358, "epoch": 1812} {"train_loss": -42.527252197265625, "global_step": 219359, "epoch": 1812} {"train_loss": -43.201995849609375, "global_step": 219360, "epoch": 1812} {"train_loss": -42.823787689208984, "global_step": 219361, "epoch": 1812} {"train_loss": -42.27067947387695, "global_step": 219362, "epoch": 1812} {"train_loss": -42.36050033569336, "global_step": 219363, "epoch": 1812} {"train_loss": -42.49985885620117, "global_step": 219364, "epoch": 1812} {"train_loss": -42.83041000366211, "global_step": 219365, "epoch": 1812} {"train_loss": -43.198055267333984, "global_step": 219366, "epoch": 1812} {"train_loss": -42.59525680541992, "global_step": 219367, "epoch": 1812} {"train_loss": -43.15754318237305, "global_step": 219368, "epoch": 1812} {"train_loss": -42.96500778198242, "global_step": 219369, "epoch": 1812} {"train_loss": -43.019710540771484, "global_step": 219370, "epoch": 1812} {"train_loss": -42.51129150390625, "global_step": 219371, "epoch": 1812} {"train_loss": -41.399194260274086, "global_step": 219372, "epoch": 1812, "val_loss": 2622342.75} {"train_loss": -42.24235153198242, "global_step": 219373, "epoch": 1813} {"train_loss": -42.91357421875, "global_step": 219374, "epoch": 1813} {"train_loss": -42.81966781616211, "global_step": 219375, "epoch": 1813} {"train_loss": -42.9370002746582, "global_step": 219376, "epoch": 1813} {"train_loss": -42.815467834472656, "global_step": 219377, "epoch": 1813} {"train_loss": -42.86949157714844, "global_step": 219378, "epoch": 1813} {"train_loss": -43.141204833984375, "global_step": 219379, "epoch": 1813} {"train_loss": -42.77976989746094, "global_step": 219380, "epoch": 1813} {"train_loss": -42.82227325439453, "global_step": 219381, "epoch": 1813} {"train_loss": -43.08760452270508, "global_step": 219382, "epoch": 1813} {"train_loss": -43.27745819091797, "global_step": 219383, "epoch": 1813} {"train_loss": -42.97831344604492, "global_step": 219384, "epoch": 1813} {"train_loss": -42.501869201660156, "global_step": 219385, "epoch": 1813} {"train_loss": -42.87543869018555, "global_step": 219386, "epoch": 1813} {"train_loss": -43.289520263671875, "global_step": 219387, "epoch": 1813} {"train_loss": -41.88566207885742, "global_step": 219388, "epoch": 1813} {"train_loss": -43.13119125366211, "global_step": 219389, "epoch": 1813} {"train_loss": -43.49768829345703, "global_step": 219390, "epoch": 1813} {"train_loss": -43.212074279785156, "global_step": 219391, "epoch": 1813} {"train_loss": -43.05637741088867, "global_step": 219392, "epoch": 1813} {"train_loss": -43.41604232788086, "global_step": 219393, "epoch": 1813} {"train_loss": -42.63134002685547, "global_step": 219394, "epoch": 1813} {"train_loss": -43.0938835144043, "global_step": 219395, "epoch": 1813} {"train_loss": -43.15034103393555, "global_step": 219396, "epoch": 1813} {"train_loss": -42.76056671142578, "global_step": 219397, "epoch": 1813} {"train_loss": -42.84261703491211, "global_step": 219398, "epoch": 1813} {"train_loss": -42.48545455932617, "global_step": 219399, "epoch": 1813} {"train_loss": -42.42585372924805, "global_step": 219400, "epoch": 1813} {"train_loss": -42.703861236572266, "global_step": 219401, "epoch": 1813} {"train_loss": -43.042232513427734, "global_step": 219402, "epoch": 1813} {"train_loss": -42.54890823364258, "global_step": 219403, "epoch": 1813} {"train_loss": -42.0164909362793, "global_step": 219404, "epoch": 1813} {"train_loss": -42.63592529296875, "global_step": 219405, "epoch": 1813} {"train_loss": -43.419960021972656, "global_step": 219406, "epoch": 1813} {"train_loss": -42.91802978515625, "global_step": 219407, "epoch": 1813} {"train_loss": -40.94340896606445, "global_step": 219408, "epoch": 1813} {"train_loss": -42.801055908203125, "global_step": 219409, "epoch": 1813} {"train_loss": -43.4582405090332, "global_step": 219410, "epoch": 1813} {"train_loss": -42.09383010864258, "global_step": 219411, "epoch": 1813} {"train_loss": -41.3690185546875, "global_step": 219412, "epoch": 1813} {"train_loss": -42.617279052734375, "global_step": 219413, "epoch": 1813} {"train_loss": -42.964778900146484, "global_step": 219414, "epoch": 1813} {"train_loss": -43.21769332885742, "global_step": 219415, "epoch": 1813} {"train_loss": -41.42041015625, "global_step": 219416, "epoch": 1813} {"train_loss": -41.365482330322266, "global_step": 219417, "epoch": 1813} {"train_loss": -37.76038360595703, "global_step": 219418, "epoch": 1813} {"train_loss": -42.40217208862305, "global_step": 219419, "epoch": 1813} {"train_loss": -43.33515930175781, "global_step": 219420, "epoch": 1813} {"train_loss": -42.820899963378906, "global_step": 219421, "epoch": 1813} {"train_loss": -42.579471588134766, "global_step": 219422, "epoch": 1813} {"train_loss": -43.0639762878418, "global_step": 219423, "epoch": 1813} {"train_loss": -43.159271240234375, "global_step": 219424, "epoch": 1813} {"train_loss": -43.48884201049805, "global_step": 219425, "epoch": 1813} {"train_loss": -42.981998443603516, "global_step": 219426, "epoch": 1813} {"train_loss": -41.30367660522461, "global_step": 219427, "epoch": 1813} {"train_loss": -43.42511749267578, "global_step": 219428, "epoch": 1813} {"train_loss": -42.87739181518555, "global_step": 219429, "epoch": 1813} {"train_loss": -41.936668395996094, "global_step": 219430, "epoch": 1813} {"train_loss": -41.83963394165039, "global_step": 219431, "epoch": 1813} {"train_loss": -42.896053314208984, "global_step": 219432, "epoch": 1813} {"train_loss": -43.02204132080078, "global_step": 219433, "epoch": 1813} {"train_loss": -42.3351936340332, "global_step": 219434, "epoch": 1813} {"train_loss": -42.94865798950195, "global_step": 219435, "epoch": 1813} {"train_loss": -43.494422912597656, "global_step": 219436, "epoch": 1813} {"train_loss": -41.96651840209961, "global_step": 219437, "epoch": 1813} {"train_loss": -42.610599517822266, "global_step": 219438, "epoch": 1813} {"train_loss": -42.6587028503418, "global_step": 219439, "epoch": 1813} {"train_loss": -41.94801712036133, "global_step": 219440, "epoch": 1813} {"train_loss": -41.53334045410156, "global_step": 219441, "epoch": 1813} {"train_loss": -41.4417724609375, "global_step": 219442, "epoch": 1813} {"train_loss": -42.030738830566406, "global_step": 219443, "epoch": 1813} {"train_loss": -42.100494384765625, "global_step": 219444, "epoch": 1813} {"train_loss": -41.914398193359375, "global_step": 219445, "epoch": 1813} {"train_loss": -39.696197509765625, "global_step": 219446, "epoch": 1813} {"train_loss": -38.12150955200195, "global_step": 219447, "epoch": 1813} {"train_loss": -40.11796951293945, "global_step": 219448, "epoch": 1813} {"train_loss": -40.24417495727539, "global_step": 219449, "epoch": 1813} {"train_loss": -38.977203369140625, "global_step": 219450, "epoch": 1813} {"train_loss": -40.4347038269043, "global_step": 219451, "epoch": 1813} {"train_loss": -42.31136703491211, "global_step": 219452, "epoch": 1813} {"train_loss": -40.655147552490234, "global_step": 219453, "epoch": 1813} {"train_loss": -38.85317611694336, "global_step": 219454, "epoch": 1813} {"train_loss": -40.46220016479492, "global_step": 219455, "epoch": 1813} {"train_loss": -41.28231430053711, "global_step": 219456, "epoch": 1813} {"train_loss": -42.2615852355957, "global_step": 219457, "epoch": 1813} {"train_loss": -40.92879104614258, "global_step": 219458, "epoch": 1813} {"train_loss": -40.59759521484375, "global_step": 219459, "epoch": 1813} {"train_loss": -41.47176742553711, "global_step": 219460, "epoch": 1813} {"train_loss": -41.7306022644043, "global_step": 219461, "epoch": 1813} {"train_loss": -41.70599365234375, "global_step": 219462, "epoch": 1813} {"train_loss": -39.926795959472656, "global_step": 219463, "epoch": 1813} {"train_loss": -38.37565231323242, "global_step": 219464, "epoch": 1813} {"train_loss": -42.511329650878906, "global_step": 219465, "epoch": 1813} {"train_loss": -38.445560455322266, "global_step": 219466, "epoch": 1813} {"train_loss": -39.96595001220703, "global_step": 219467, "epoch": 1813} {"train_loss": -41.50471115112305, "global_step": 219468, "epoch": 1813} {"train_loss": -40.45266342163086, "global_step": 219469, "epoch": 1813} {"train_loss": -37.17169189453125, "global_step": 219470, "epoch": 1813} {"train_loss": -40.25776290893555, "global_step": 219471, "epoch": 1813} {"train_loss": -40.54191970825195, "global_step": 219472, "epoch": 1813} {"train_loss": -38.812522888183594, "global_step": 219473, "epoch": 1813} {"train_loss": -40.99226760864258, "global_step": 219474, "epoch": 1813} {"train_loss": -39.598873138427734, "global_step": 219475, "epoch": 1813} {"train_loss": -40.33919143676758, "global_step": 219476, "epoch": 1813} {"train_loss": -42.204158782958984, "global_step": 219477, "epoch": 1813} {"train_loss": -37.51783752441406, "global_step": 219478, "epoch": 1813} {"train_loss": -39.76040267944336, "global_step": 219479, "epoch": 1813} {"train_loss": -41.454219818115234, "global_step": 219480, "epoch": 1813} {"train_loss": -39.732025146484375, "global_step": 219481, "epoch": 1813} {"train_loss": -42.09867477416992, "global_step": 219482, "epoch": 1813} {"train_loss": -39.20618438720703, "global_step": 219483, "epoch": 1813} {"train_loss": -39.9296760559082, "global_step": 219484, "epoch": 1813} {"train_loss": -40.631195068359375, "global_step": 219485, "epoch": 1813} {"train_loss": -37.35329055786133, "global_step": 219486, "epoch": 1813} {"train_loss": -41.70025634765625, "global_step": 219487, "epoch": 1813} {"train_loss": -39.77540588378906, "global_step": 219488, "epoch": 1813} {"train_loss": -41.42988967895508, "global_step": 219489, "epoch": 1813} {"train_loss": -40.028968811035156, "global_step": 219490, "epoch": 1813} {"train_loss": -41.48979949951172, "global_step": 219491, "epoch": 1813} {"train_loss": -41.42207717895508, "global_step": 219492, "epoch": 1813} {"train_loss": -41.686985488765494, "global_step": 219493, "epoch": 1813, "val_loss": 2621454.75} {"train_loss": -42.207149505615234, "global_step": 219494, "epoch": 1814} {"train_loss": -40.177459716796875, "global_step": 219495, "epoch": 1814} {"train_loss": -42.45608901977539, "global_step": 219496, "epoch": 1814} {"train_loss": -40.4102897644043, "global_step": 219497, "epoch": 1814} {"train_loss": -42.67161560058594, "global_step": 219498, "epoch": 1814} {"train_loss": -39.644596099853516, "global_step": 219499, "epoch": 1814} {"train_loss": -41.14095687866211, "global_step": 219500, "epoch": 1814} {"train_loss": -41.73891067504883, "global_step": 219501, "epoch": 1814} {"train_loss": -40.76431655883789, "global_step": 219502, "epoch": 1814} {"train_loss": -41.56536865234375, "global_step": 219503, "epoch": 1814} {"train_loss": -40.20112991333008, "global_step": 219504, "epoch": 1814} {"train_loss": -41.33232498168945, "global_step": 219505, "epoch": 1814} {"train_loss": -41.50242614746094, "global_step": 219506, "epoch": 1814} {"train_loss": -42.25149154663086, "global_step": 219507, "epoch": 1814} {"train_loss": -41.03157424926758, "global_step": 219508, "epoch": 1814} {"train_loss": -41.26158142089844, "global_step": 219509, "epoch": 1814} {"train_loss": -40.30778884887695, "global_step": 219510, "epoch": 1814} {"train_loss": -41.62660598754883, "global_step": 219511, "epoch": 1814} {"train_loss": -42.019832611083984, "global_step": 219512, "epoch": 1814} {"train_loss": -41.23893356323242, "global_step": 219513, "epoch": 1814} {"train_loss": -41.527130126953125, "global_step": 219514, "epoch": 1814} {"train_loss": -41.623836517333984, "global_step": 219515, "epoch": 1814} {"train_loss": -41.896114349365234, "global_step": 219516, "epoch": 1814} {"train_loss": -41.769535064697266, "global_step": 219517, "epoch": 1814} {"train_loss": -41.88800048828125, "global_step": 219518, "epoch": 1814} {"train_loss": -41.11442184448242, "global_step": 219519, "epoch": 1814} {"train_loss": -42.06580352783203, "global_step": 219520, "epoch": 1814} {"train_loss": -41.233070373535156, "global_step": 219521, "epoch": 1814} {"train_loss": -42.568946838378906, "global_step": 219522, "epoch": 1814} {"train_loss": -41.598121643066406, "global_step": 219523, "epoch": 1814} {"train_loss": -41.710018157958984, "global_step": 219524, "epoch": 1814} {"train_loss": -42.13581466674805, "global_step": 219525, "epoch": 1814} {"train_loss": -42.210018157958984, "global_step": 219526, "epoch": 1814} {"train_loss": -42.058677673339844, "global_step": 219527, "epoch": 1814} {"train_loss": -42.863685607910156, "global_step": 219528, "epoch": 1814} {"train_loss": -42.01216506958008, "global_step": 219529, "epoch": 1814} {"train_loss": -42.86769485473633, "global_step": 219530, "epoch": 1814} {"train_loss": -42.796791076660156, "global_step": 219531, "epoch": 1814} {"train_loss": -43.441226959228516, "global_step": 219532, "epoch": 1814} {"train_loss": -42.7780876159668, "global_step": 219533, "epoch": 1814} {"train_loss": -42.99187088012695, "global_step": 219534, "epoch": 1814} {"train_loss": -43.08061599731445, "global_step": 219535, "epoch": 1814} {"train_loss": -42.961177825927734, "global_step": 219536, "epoch": 1814} {"train_loss": -42.45002365112305, "global_step": 219537, "epoch": 1814} {"train_loss": -43.14397430419922, "global_step": 219538, "epoch": 1814} {"train_loss": -43.28652572631836, "global_step": 219539, "epoch": 1814} {"train_loss": -42.87209701538086, "global_step": 219540, "epoch": 1814} {"train_loss": -42.98361587524414, "global_step": 219541, "epoch": 1814} {"train_loss": -42.50397872924805, "global_step": 219542, "epoch": 1814} {"train_loss": -42.66697311401367, "global_step": 219543, "epoch": 1814} {"train_loss": -43.088356018066406, "global_step": 219544, "epoch": 1814} {"train_loss": -42.619747161865234, "global_step": 219545, "epoch": 1814} {"train_loss": -40.371986389160156, "global_step": 219546, "epoch": 1814} {"train_loss": -42.08054733276367, "global_step": 219547, "epoch": 1814} {"train_loss": -43.33187484741211, "global_step": 219548, "epoch": 1814} {"train_loss": -42.81868362426758, "global_step": 219549, "epoch": 1814} {"train_loss": -42.146114349365234, "global_step": 219550, "epoch": 1814} {"train_loss": -40.5816764831543, "global_step": 219551, "epoch": 1814} {"train_loss": -39.50172805786133, "global_step": 219552, "epoch": 1814} {"train_loss": -39.495479583740234, "global_step": 219553, "epoch": 1814} {"train_loss": -42.53255844116211, "global_step": 219554, "epoch": 1814} {"train_loss": -42.31129837036133, "global_step": 219555, "epoch": 1814} {"train_loss": -41.80561065673828, "global_step": 219556, "epoch": 1814} {"train_loss": -40.368099212646484, "global_step": 219557, "epoch": 1814} {"train_loss": -42.06898880004883, "global_step": 219558, "epoch": 1814} {"train_loss": -42.74294662475586, "global_step": 219559, "epoch": 1814} {"train_loss": -41.7061653137207, "global_step": 219560, "epoch": 1814} {"train_loss": -42.2194938659668, "global_step": 219561, "epoch": 1814} {"train_loss": -42.65258026123047, "global_step": 219562, "epoch": 1814} {"train_loss": -39.84840774536133, "global_step": 219563, "epoch": 1814} {"train_loss": -41.81501007080078, "global_step": 219564, "epoch": 1814} {"train_loss": -42.018733978271484, "global_step": 219565, "epoch": 1814} {"train_loss": -41.487159729003906, "global_step": 219566, "epoch": 1814} {"train_loss": -40.23295974731445, "global_step": 219567, "epoch": 1814} {"train_loss": -41.26386642456055, "global_step": 219568, "epoch": 1814} {"train_loss": -41.62037658691406, "global_step": 219569, "epoch": 1814} {"train_loss": -41.13771438598633, "global_step": 219570, "epoch": 1814} {"train_loss": -41.59973907470703, "global_step": 219571, "epoch": 1814} {"train_loss": -41.05120086669922, "global_step": 219572, "epoch": 1814} {"train_loss": -41.16538619995117, "global_step": 219573, "epoch": 1814} {"train_loss": -41.26060104370117, "global_step": 219574, "epoch": 1814} {"train_loss": -39.39352035522461, "global_step": 219575, "epoch": 1814} {"train_loss": -41.09810256958008, "global_step": 219576, "epoch": 1814} {"train_loss": -42.18351364135742, "global_step": 219577, "epoch": 1814} {"train_loss": -38.944759368896484, "global_step": 219578, "epoch": 1814} {"train_loss": -41.051395416259766, "global_step": 219579, "epoch": 1814} {"train_loss": -40.4503288269043, "global_step": 219580, "epoch": 1814} {"train_loss": -36.74565505981445, "global_step": 219581, "epoch": 1814} {"train_loss": -36.08751678466797, "global_step": 219582, "epoch": 1814} {"train_loss": -32.2025146484375, "global_step": 219583, "epoch": 1814} {"train_loss": -21.427276611328125, "global_step": 219584, "epoch": 1814} {"train_loss": -31.859272003173828, "global_step": 219585, "epoch": 1814} {"train_loss": -27.626636505126953, "global_step": 219586, "epoch": 1814} {"train_loss": -34.50093460083008, "global_step": 219587, "epoch": 1814} {"train_loss": -30.258264541625977, "global_step": 219588, "epoch": 1814} {"train_loss": -31.00640296936035, "global_step": 219589, "epoch": 1814} {"train_loss": -34.82790756225586, "global_step": 219590, "epoch": 1814} {"train_loss": -33.57233428955078, "global_step": 219591, "epoch": 1814} {"train_loss": -33.6545524597168, "global_step": 219592, "epoch": 1814} {"train_loss": -34.744327545166016, "global_step": 219593, "epoch": 1814} {"train_loss": -34.8839111328125, "global_step": 219594, "epoch": 1814} {"train_loss": -37.6273307800293, "global_step": 219595, "epoch": 1814} {"train_loss": -33.99117660522461, "global_step": 219596, "epoch": 1814} {"train_loss": -37.84114456176758, "global_step": 219597, "epoch": 1814} {"train_loss": -37.37067794799805, "global_step": 219598, "epoch": 1814} {"train_loss": -35.77727127075195, "global_step": 219599, "epoch": 1814} {"train_loss": -39.7819709777832, "global_step": 219600, "epoch": 1814} {"train_loss": -37.13935089111328, "global_step": 219601, "epoch": 1814} {"train_loss": -38.888954162597656, "global_step": 219602, "epoch": 1814} {"train_loss": -39.54549789428711, "global_step": 219603, "epoch": 1814} {"train_loss": -39.3148307800293, "global_step": 219604, "epoch": 1814} {"train_loss": -39.300899505615234, "global_step": 219605, "epoch": 1814} {"train_loss": -40.63242721557617, "global_step": 219606, "epoch": 1814} {"train_loss": -38.7080192565918, "global_step": 219607, "epoch": 1814} {"train_loss": -38.6121711730957, "global_step": 219608, "epoch": 1814} {"train_loss": -40.34259796142578, "global_step": 219609, "epoch": 1814} {"train_loss": -39.92263412475586, "global_step": 219610, "epoch": 1814} {"train_loss": -39.8626823425293, "global_step": 219611, "epoch": 1814} {"train_loss": -40.69607162475586, "global_step": 219612, "epoch": 1814} {"train_loss": -40.60152816772461, "global_step": 219613, "epoch": 1814} {"train_loss": -40.15885285306568, "global_step": 219614, "epoch": 1814, "val_loss": 2528805.0} {"train_loss": -39.920188903808594, "global_step": 219615, "epoch": 1815} {"train_loss": -41.19868087768555, "global_step": 219616, "epoch": 1815} {"train_loss": -40.68593978881836, "global_step": 219617, "epoch": 1815} {"train_loss": -40.24064254760742, "global_step": 219618, "epoch": 1815} {"train_loss": -40.83772659301758, "global_step": 219619, "epoch": 1815} {"train_loss": -40.9719123840332, "global_step": 219620, "epoch": 1815} {"train_loss": -41.067630767822266, "global_step": 219621, "epoch": 1815} {"train_loss": -40.242881774902344, "global_step": 219622, "epoch": 1815} {"train_loss": -41.42171859741211, "global_step": 219623, "epoch": 1815} {"train_loss": -41.09048080444336, "global_step": 219624, "epoch": 1815} {"train_loss": -41.358795166015625, "global_step": 219625, "epoch": 1815} {"train_loss": -42.06534957885742, "global_step": 219626, "epoch": 1815} {"train_loss": -41.087623596191406, "global_step": 219627, "epoch": 1815} {"train_loss": -40.74876022338867, "global_step": 219628, "epoch": 1815} {"train_loss": -40.853389739990234, "global_step": 219629, "epoch": 1815} {"train_loss": -41.50789260864258, "global_step": 219630, "epoch": 1815} {"train_loss": -41.65113067626953, "global_step": 219631, "epoch": 1815} {"train_loss": -41.33069610595703, "global_step": 219632, "epoch": 1815} {"train_loss": -41.50144577026367, "global_step": 219633, "epoch": 1815} {"train_loss": -41.89535903930664, "global_step": 219634, "epoch": 1815} {"train_loss": -41.04008102416992, "global_step": 219635, "epoch": 1815} {"train_loss": -41.75569534301758, "global_step": 219636, "epoch": 1815} {"train_loss": -41.79053497314453, "global_step": 219637, "epoch": 1815} {"train_loss": -41.41764450073242, "global_step": 219638, "epoch": 1815} {"train_loss": -38.93824005126953, "global_step": 219639, "epoch": 1815} {"train_loss": -41.7879524230957, "global_step": 219640, "epoch": 1815} {"train_loss": -41.98893356323242, "global_step": 219641, "epoch": 1815} {"train_loss": -41.846858978271484, "global_step": 219642, "epoch": 1815} {"train_loss": -41.789642333984375, "global_step": 219643, "epoch": 1815} {"train_loss": -42.0466194152832, "global_step": 219644, "epoch": 1815} {"train_loss": -41.78373336791992, "global_step": 219645, "epoch": 1815} {"train_loss": -42.09739303588867, "global_step": 219646, "epoch": 1815} {"train_loss": -42.078243255615234, "global_step": 219647, "epoch": 1815} {"train_loss": -42.363616943359375, "global_step": 219648, "epoch": 1815} {"train_loss": -42.006710052490234, "global_step": 219649, "epoch": 1815} {"train_loss": -42.31486511230469, "global_step": 219650, "epoch": 1815} {"train_loss": -41.7124137878418, "global_step": 219651, "epoch": 1815} {"train_loss": -42.43817901611328, "global_step": 219652, "epoch": 1815} {"train_loss": -42.54411315917969, "global_step": 219653, "epoch": 1815} {"train_loss": -42.145755767822266, "global_step": 219654, "epoch": 1815} {"train_loss": -42.403663635253906, "global_step": 219655, "epoch": 1815} {"train_loss": -42.706565856933594, "global_step": 219656, "epoch": 1815} {"train_loss": -42.842342376708984, "global_step": 219657, "epoch": 1815} {"train_loss": -42.54909133911133, "global_step": 219658, "epoch": 1815} {"train_loss": -41.472694396972656, "global_step": 219659, "epoch": 1815} {"train_loss": -42.627044677734375, "global_step": 219660, "epoch": 1815} {"train_loss": -42.35540008544922, "global_step": 219661, "epoch": 1815} {"train_loss": -41.39177322387695, "global_step": 219662, "epoch": 1815} {"train_loss": -42.63931655883789, "global_step": 219663, "epoch": 1815} {"train_loss": -42.53620147705078, "global_step": 219664, "epoch": 1815} {"train_loss": -41.46161651611328, "global_step": 219665, "epoch": 1815} {"train_loss": -42.9871711730957, "global_step": 219666, "epoch": 1815} {"train_loss": -41.54221725463867, "global_step": 219667, "epoch": 1815} {"train_loss": -41.578495025634766, "global_step": 219668, "epoch": 1815} {"train_loss": -41.15134811401367, "global_step": 219669, "epoch": 1815} {"train_loss": -40.224586486816406, "global_step": 219670, "epoch": 1815} {"train_loss": -41.890567779541016, "global_step": 219671, "epoch": 1815} {"train_loss": -42.794227600097656, "global_step": 219672, "epoch": 1815} {"train_loss": -41.05617904663086, "global_step": 219673, "epoch": 1815} {"train_loss": -41.056758880615234, "global_step": 219674, "epoch": 1815} {"train_loss": -39.75543975830078, "global_step": 219675, "epoch": 1815} {"train_loss": -42.591529846191406, "global_step": 219676, "epoch": 1815} {"train_loss": -40.55686569213867, "global_step": 219677, "epoch": 1815} {"train_loss": -42.25918197631836, "global_step": 219678, "epoch": 1815} {"train_loss": -40.66177749633789, "global_step": 219679, "epoch": 1815} {"train_loss": -39.089881896972656, "global_step": 219680, "epoch": 1815} {"train_loss": -37.33523178100586, "global_step": 219681, "epoch": 1815} {"train_loss": -41.77180099487305, "global_step": 219682, "epoch": 1815} {"train_loss": -41.17932891845703, "global_step": 219683, "epoch": 1815} {"train_loss": -42.18555450439453, "global_step": 219684, "epoch": 1815} {"train_loss": -41.281558990478516, "global_step": 219685, "epoch": 1815} {"train_loss": -38.53363037109375, "global_step": 219686, "epoch": 1815} {"train_loss": -41.63712692260742, "global_step": 219687, "epoch": 1815} {"train_loss": -39.3889274597168, "global_step": 219688, "epoch": 1815} {"train_loss": -40.239463806152344, "global_step": 219689, "epoch": 1815} {"train_loss": -41.80434036254883, "global_step": 219690, "epoch": 1815} {"train_loss": -40.5352897644043, "global_step": 219691, "epoch": 1815} {"train_loss": -42.15610885620117, "global_step": 219692, "epoch": 1815} {"train_loss": -41.829341888427734, "global_step": 219693, "epoch": 1815} {"train_loss": -41.875831604003906, "global_step": 219694, "epoch": 1815} {"train_loss": -42.38818359375, "global_step": 219695, "epoch": 1815} {"train_loss": -41.529029846191406, "global_step": 219696, "epoch": 1815} {"train_loss": -42.776283264160156, "global_step": 219697, "epoch": 1815} {"train_loss": -41.748939514160156, "global_step": 219698, "epoch": 1815} {"train_loss": -42.27827072143555, "global_step": 219699, "epoch": 1815} {"train_loss": -42.61347579956055, "global_step": 219700, "epoch": 1815} {"train_loss": -42.133174896240234, "global_step": 219701, "epoch": 1815} {"train_loss": -42.136138916015625, "global_step": 219702, "epoch": 1815} {"train_loss": -42.65449142456055, "global_step": 219703, "epoch": 1815} {"train_loss": -42.38075637817383, "global_step": 219704, "epoch": 1815} {"train_loss": -42.13761520385742, "global_step": 219705, "epoch": 1815} {"train_loss": -42.45589828491211, "global_step": 219706, "epoch": 1815} {"train_loss": -42.269630432128906, "global_step": 219707, "epoch": 1815} {"train_loss": -42.11589050292969, "global_step": 219708, "epoch": 1815} {"train_loss": -42.32188415527344, "global_step": 219709, "epoch": 1815} {"train_loss": -42.4000244140625, "global_step": 219710, "epoch": 1815} {"train_loss": -42.64729690551758, "global_step": 219711, "epoch": 1815} {"train_loss": -42.172237396240234, "global_step": 219712, "epoch": 1815} {"train_loss": -42.506187438964844, "global_step": 219713, "epoch": 1815} {"train_loss": -43.157936096191406, "global_step": 219714, "epoch": 1815} {"train_loss": -42.41354751586914, "global_step": 219715, "epoch": 1815} {"train_loss": -42.86457824707031, "global_step": 219716, "epoch": 1815} {"train_loss": -42.60444259643555, "global_step": 219717, "epoch": 1815} {"train_loss": -42.95313262939453, "global_step": 219718, "epoch": 1815} {"train_loss": -42.576499938964844, "global_step": 219719, "epoch": 1815} {"train_loss": -43.0455207824707, "global_step": 219720, "epoch": 1815} {"train_loss": -42.41929244995117, "global_step": 219721, "epoch": 1815} {"train_loss": -42.17387390136719, "global_step": 219722, "epoch": 1815} {"train_loss": -42.4697265625, "global_step": 219723, "epoch": 1815} {"train_loss": -41.986244201660156, "global_step": 219724, "epoch": 1815} {"train_loss": -42.479427337646484, "global_step": 219725, "epoch": 1815} {"train_loss": -42.4716911315918, "global_step": 219726, "epoch": 1815} {"train_loss": -42.02998352050781, "global_step": 219727, "epoch": 1815} {"train_loss": -42.443267822265625, "global_step": 219728, "epoch": 1815} {"train_loss": -42.62446975708008, "global_step": 219729, "epoch": 1815} {"train_loss": -42.0808219909668, "global_step": 219730, "epoch": 1815} {"train_loss": -42.91227722167969, "global_step": 219731, "epoch": 1815} {"train_loss": -42.78947830200195, "global_step": 219732, "epoch": 1815} {"train_loss": -42.86035919189453, "global_step": 219733, "epoch": 1815} {"train_loss": -42.41838836669922, "global_step": 219734, "epoch": 1815} {"train_loss": -41.76714753710534, "global_step": 219735, "epoch": 1815, "val_loss": 2527751.75} {"train_loss": -43.174678802490234, "global_step": 219736, "epoch": 1816} {"train_loss": -40.763275146484375, "global_step": 219737, "epoch": 1816} {"train_loss": -42.80507278442383, "global_step": 219738, "epoch": 1816} {"train_loss": -41.68611526489258, "global_step": 219739, "epoch": 1816} {"train_loss": -42.31888961791992, "global_step": 219740, "epoch": 1816} {"train_loss": -43.13719940185547, "global_step": 219741, "epoch": 1816} {"train_loss": -42.203338623046875, "global_step": 219742, "epoch": 1816} {"train_loss": -41.62711715698242, "global_step": 219743, "epoch": 1816} {"train_loss": -42.70720291137695, "global_step": 219744, "epoch": 1816} {"train_loss": -42.087764739990234, "global_step": 219745, "epoch": 1816} {"train_loss": -41.543190002441406, "global_step": 219746, "epoch": 1816} {"train_loss": -41.47349166870117, "global_step": 219747, "epoch": 1816} {"train_loss": -42.52703857421875, "global_step": 219748, "epoch": 1816} {"train_loss": -41.68408203125, "global_step": 219749, "epoch": 1816} {"train_loss": -41.493289947509766, "global_step": 219750, "epoch": 1816} {"train_loss": -42.144264221191406, "global_step": 219751, "epoch": 1816} {"train_loss": -41.73850631713867, "global_step": 219752, "epoch": 1816} {"train_loss": -42.14707565307617, "global_step": 219753, "epoch": 1816} {"train_loss": -42.59229278564453, "global_step": 219754, "epoch": 1816} {"train_loss": -43.07387161254883, "global_step": 219755, "epoch": 1816} {"train_loss": -42.349761962890625, "global_step": 219756, "epoch": 1816} {"train_loss": -42.44973373413086, "global_step": 219757, "epoch": 1816} {"train_loss": -41.8945198059082, "global_step": 219758, "epoch": 1816} {"train_loss": -41.926082611083984, "global_step": 219759, "epoch": 1816} {"train_loss": -42.066402435302734, "global_step": 219760, "epoch": 1816} {"train_loss": -40.6473503112793, "global_step": 219761, "epoch": 1816} {"train_loss": -39.399906158447266, "global_step": 219762, "epoch": 1816} {"train_loss": -39.449703216552734, "global_step": 219763, "epoch": 1816} {"train_loss": -39.913875579833984, "global_step": 219764, "epoch": 1816} {"train_loss": -41.08465576171875, "global_step": 219765, "epoch": 1816} {"train_loss": -40.01961898803711, "global_step": 219766, "epoch": 1816} {"train_loss": -41.17867660522461, "global_step": 219767, "epoch": 1816} {"train_loss": -41.33658981323242, "global_step": 219768, "epoch": 1816} {"train_loss": -42.12982940673828, "global_step": 219769, "epoch": 1816} {"train_loss": -42.501705169677734, "global_step": 219770, "epoch": 1816} {"train_loss": -42.141693115234375, "global_step": 219771, "epoch": 1816} {"train_loss": -41.81462478637695, "global_step": 219772, "epoch": 1816} {"train_loss": -42.49259567260742, "global_step": 219773, "epoch": 1816} {"train_loss": -41.5155029296875, "global_step": 219774, "epoch": 1816} {"train_loss": -42.1409912109375, "global_step": 219775, "epoch": 1816} {"train_loss": -41.790889739990234, "global_step": 219776, "epoch": 1816} {"train_loss": -40.949501037597656, "global_step": 219777, "epoch": 1816} {"train_loss": -39.290077209472656, "global_step": 219778, "epoch": 1816} {"train_loss": -42.287513732910156, "global_step": 219779, "epoch": 1816} {"train_loss": -41.66301345825195, "global_step": 219780, "epoch": 1816} {"train_loss": -40.1776123046875, "global_step": 219781, "epoch": 1816} {"train_loss": -40.420570373535156, "global_step": 219782, "epoch": 1816} {"train_loss": -39.966278076171875, "global_step": 219783, "epoch": 1816} {"train_loss": -38.01869583129883, "global_step": 219784, "epoch": 1816} {"train_loss": -40.6071662902832, "global_step": 219785, "epoch": 1816} {"train_loss": -39.05424118041992, "global_step": 219786, "epoch": 1816} {"train_loss": -38.9512939453125, "global_step": 219787, "epoch": 1816} {"train_loss": -39.45954513549805, "global_step": 219788, "epoch": 1816} {"train_loss": -39.75230407714844, "global_step": 219789, "epoch": 1816} {"train_loss": -38.829524993896484, "global_step": 219790, "epoch": 1816} {"train_loss": -39.79456329345703, "global_step": 219791, "epoch": 1816} {"train_loss": -36.217681884765625, "global_step": 219792, "epoch": 1816} {"train_loss": -39.81328201293945, "global_step": 219793, "epoch": 1816} {"train_loss": -40.640968322753906, "global_step": 219794, "epoch": 1816} {"train_loss": -39.920448303222656, "global_step": 219795, "epoch": 1816} {"train_loss": -41.064571380615234, "global_step": 219796, "epoch": 1816} {"train_loss": -39.850433349609375, "global_step": 219797, "epoch": 1816} {"train_loss": -38.56986618041992, "global_step": 219798, "epoch": 1816} {"train_loss": -41.13127517700195, "global_step": 219799, "epoch": 1816} {"train_loss": -41.68585968017578, "global_step": 219800, "epoch": 1816} {"train_loss": -41.92528533935547, "global_step": 219801, "epoch": 1816} {"train_loss": -42.184242248535156, "global_step": 219802, "epoch": 1816} {"train_loss": -42.318275451660156, "global_step": 219803, "epoch": 1816} {"train_loss": -42.40034866333008, "global_step": 219804, "epoch": 1816} {"train_loss": -42.086517333984375, "global_step": 219805, "epoch": 1816} {"train_loss": -41.61853790283203, "global_step": 219806, "epoch": 1816} {"train_loss": -42.34566879272461, "global_step": 219807, "epoch": 1816} {"train_loss": -41.510372161865234, "global_step": 219808, "epoch": 1816} {"train_loss": -38.47900390625, "global_step": 219809, "epoch": 1816} {"train_loss": -41.60376739501953, "global_step": 219810, "epoch": 1816} {"train_loss": -42.15724182128906, "global_step": 219811, "epoch": 1816} {"train_loss": -41.849796295166016, "global_step": 219812, "epoch": 1816} {"train_loss": -41.83770751953125, "global_step": 219813, "epoch": 1816} {"train_loss": -41.135128021240234, "global_step": 219814, "epoch": 1816} {"train_loss": -39.03866195678711, "global_step": 219815, "epoch": 1816} {"train_loss": -42.18692398071289, "global_step": 219816, "epoch": 1816} {"train_loss": -40.8711051940918, "global_step": 219817, "epoch": 1816} {"train_loss": -42.082820892333984, "global_step": 219818, "epoch": 1816} {"train_loss": -41.80863571166992, "global_step": 219819, "epoch": 1816} {"train_loss": -42.01535415649414, "global_step": 219820, "epoch": 1816} {"train_loss": -42.27492904663086, "global_step": 219821, "epoch": 1816} {"train_loss": -41.9418830871582, "global_step": 219822, "epoch": 1816} {"train_loss": -41.88887023925781, "global_step": 219823, "epoch": 1816} {"train_loss": -42.02626419067383, "global_step": 219824, "epoch": 1816} {"train_loss": -41.949710845947266, "global_step": 219825, "epoch": 1816} {"train_loss": -42.35593795776367, "global_step": 219826, "epoch": 1816} {"train_loss": -42.56199264526367, "global_step": 219827, "epoch": 1816} {"train_loss": -41.26121520996094, "global_step": 219828, "epoch": 1816} {"train_loss": -42.14942169189453, "global_step": 219829, "epoch": 1816} {"train_loss": -42.66766357421875, "global_step": 219830, "epoch": 1816} {"train_loss": -42.71177673339844, "global_step": 219831, "epoch": 1816} {"train_loss": -42.19573974609375, "global_step": 219832, "epoch": 1816} {"train_loss": -39.99870681762695, "global_step": 219833, "epoch": 1816} {"train_loss": -42.07316207885742, "global_step": 219834, "epoch": 1816} {"train_loss": -41.061370849609375, "global_step": 219835, "epoch": 1816} {"train_loss": -42.29413986206055, "global_step": 219836, "epoch": 1816} {"train_loss": -43.17210388183594, "global_step": 219837, "epoch": 1816} {"train_loss": -42.54083251953125, "global_step": 219838, "epoch": 1816} {"train_loss": -43.12318420410156, "global_step": 219839, "epoch": 1816} {"train_loss": -43.05973434448242, "global_step": 219840, "epoch": 1816} {"train_loss": -40.07073974609375, "global_step": 219841, "epoch": 1816} {"train_loss": -42.007598876953125, "global_step": 219842, "epoch": 1816} {"train_loss": -42.73415756225586, "global_step": 219843, "epoch": 1816} {"train_loss": -42.69061279296875, "global_step": 219844, "epoch": 1816} {"train_loss": -42.285003662109375, "global_step": 219845, "epoch": 1816} {"train_loss": -42.90452575683594, "global_step": 219846, "epoch": 1816} {"train_loss": -43.01816940307617, "global_step": 219847, "epoch": 1816} {"train_loss": -42.9487190246582, "global_step": 219848, "epoch": 1816} {"train_loss": -42.755348205566406, "global_step": 219849, "epoch": 1816} {"train_loss": -42.969459533691406, "global_step": 219850, "epoch": 1816} {"train_loss": -42.51298141479492, "global_step": 219851, "epoch": 1816} {"train_loss": -42.79249954223633, "global_step": 219852, "epoch": 1816} {"train_loss": -42.854000091552734, "global_step": 219853, "epoch": 1816} {"train_loss": -43.277122497558594, "global_step": 219854, "epoch": 1816} {"train_loss": -42.83564376831055, "global_step": 219855, "epoch": 1816} {"train_loss": -41.55032153168985, "global_step": 219856, "epoch": 1816, "val_loss": 2538957.75} {"train_loss": -42.611427307128906, "global_step": 219857, "epoch": 1817} {"train_loss": -43.24598693847656, "global_step": 219858, "epoch": 1817} {"train_loss": -42.7991828918457, "global_step": 219859, "epoch": 1817} {"train_loss": -43.16481399536133, "global_step": 219860, "epoch": 1817} {"train_loss": -42.3690299987793, "global_step": 219861, "epoch": 1817} {"train_loss": -42.154197692871094, "global_step": 219862, "epoch": 1817} {"train_loss": -43.249576568603516, "global_step": 219863, "epoch": 1817} {"train_loss": -42.76715850830078, "global_step": 219864, "epoch": 1817} {"train_loss": -43.0208625793457, "global_step": 219865, "epoch": 1817} {"train_loss": -43.09024429321289, "global_step": 219866, "epoch": 1817} {"train_loss": -43.10539245605469, "global_step": 219867, "epoch": 1817} {"train_loss": -42.80244827270508, "global_step": 219868, "epoch": 1817} {"train_loss": -43.09711456298828, "global_step": 219869, "epoch": 1817} {"train_loss": -42.5303840637207, "global_step": 219870, "epoch": 1817} {"train_loss": -42.759708404541016, "global_step": 219871, "epoch": 1817} {"train_loss": -42.77140426635742, "global_step": 219872, "epoch": 1817} {"train_loss": -43.32708740234375, "global_step": 219873, "epoch": 1817} {"train_loss": -42.1397590637207, "global_step": 219874, "epoch": 1817} {"train_loss": -42.41806411743164, "global_step": 219875, "epoch": 1817} {"train_loss": -41.961647033691406, "global_step": 219876, "epoch": 1817} {"train_loss": -42.760799407958984, "global_step": 219877, "epoch": 1817} {"train_loss": -42.376136779785156, "global_step": 219878, "epoch": 1817} {"train_loss": -42.738624572753906, "global_step": 219879, "epoch": 1817} {"train_loss": -42.921974182128906, "global_step": 219880, "epoch": 1817} {"train_loss": -43.36874008178711, "global_step": 219881, "epoch": 1817} {"train_loss": -42.36952590942383, "global_step": 219882, "epoch": 1817} {"train_loss": -43.23827362060547, "global_step": 219883, "epoch": 1817} {"train_loss": -42.54232406616211, "global_step": 219884, "epoch": 1817} {"train_loss": -42.99176025390625, "global_step": 219885, "epoch": 1817} {"train_loss": -43.01752853393555, "global_step": 219886, "epoch": 1817} {"train_loss": -42.5015869140625, "global_step": 219887, "epoch": 1817} {"train_loss": -41.8908576965332, "global_step": 219888, "epoch": 1817} {"train_loss": -41.576454162597656, "global_step": 219889, "epoch": 1817} {"train_loss": -42.334381103515625, "global_step": 219890, "epoch": 1817} {"train_loss": -41.22657012939453, "global_step": 219891, "epoch": 1817} {"train_loss": -39.74819564819336, "global_step": 219892, "epoch": 1817} {"train_loss": -39.03923416137695, "global_step": 219893, "epoch": 1817} {"train_loss": -39.4637336730957, "global_step": 219894, "epoch": 1817} {"train_loss": -42.217098236083984, "global_step": 219895, "epoch": 1817} {"train_loss": -42.153499603271484, "global_step": 219896, "epoch": 1817} {"train_loss": -38.5062255859375, "global_step": 219897, "epoch": 1817} {"train_loss": -42.162353515625, "global_step": 219898, "epoch": 1817} {"train_loss": -42.60663986206055, "global_step": 219899, "epoch": 1817} {"train_loss": -41.985939025878906, "global_step": 219900, "epoch": 1817} {"train_loss": -41.62969970703125, "global_step": 219901, "epoch": 1817} {"train_loss": -41.96533966064453, "global_step": 219902, "epoch": 1817} {"train_loss": -42.233394622802734, "global_step": 219903, "epoch": 1817} {"train_loss": -41.17667770385742, "global_step": 219904, "epoch": 1817} {"train_loss": -42.019535064697266, "global_step": 219905, "epoch": 1817} {"train_loss": -42.775657653808594, "global_step": 219906, "epoch": 1817} {"train_loss": -42.13426971435547, "global_step": 219907, "epoch": 1817} {"train_loss": -39.03483581542969, "global_step": 219908, "epoch": 1817} {"train_loss": -41.46009063720703, "global_step": 219909, "epoch": 1817} {"train_loss": -41.69428253173828, "global_step": 219910, "epoch": 1817} {"train_loss": -39.60854721069336, "global_step": 219911, "epoch": 1817} {"train_loss": -42.24760818481445, "global_step": 219912, "epoch": 1817} {"train_loss": -41.82509231567383, "global_step": 219913, "epoch": 1817} {"train_loss": -40.7391471862793, "global_step": 219914, "epoch": 1817} {"train_loss": -42.22478103637695, "global_step": 219915, "epoch": 1817} {"train_loss": -42.0860595703125, "global_step": 219916, "epoch": 1817} {"train_loss": -41.915748596191406, "global_step": 219917, "epoch": 1817} {"train_loss": -41.671810150146484, "global_step": 219918, "epoch": 1817} {"train_loss": -40.27344512939453, "global_step": 219919, "epoch": 1817} {"train_loss": -41.1413459777832, "global_step": 219920, "epoch": 1817} {"train_loss": -42.40022659301758, "global_step": 219921, "epoch": 1817} {"train_loss": -41.94710922241211, "global_step": 219922, "epoch": 1817} {"train_loss": -42.045257568359375, "global_step": 219923, "epoch": 1817} {"train_loss": -41.04219436645508, "global_step": 219924, "epoch": 1817} {"train_loss": -42.97500228881836, "global_step": 219925, "epoch": 1817} {"train_loss": -41.48221969604492, "global_step": 219926, "epoch": 1817} {"train_loss": -42.40148162841797, "global_step": 219927, "epoch": 1817} {"train_loss": -42.78544235229492, "global_step": 219928, "epoch": 1817} {"train_loss": -42.13633346557617, "global_step": 219929, "epoch": 1817} {"train_loss": -42.988521575927734, "global_step": 219930, "epoch": 1817} {"train_loss": -42.009639739990234, "global_step": 219931, "epoch": 1817} {"train_loss": -40.7891845703125, "global_step": 219932, "epoch": 1817} {"train_loss": -40.85684585571289, "global_step": 219933, "epoch": 1817} {"train_loss": -41.229793548583984, "global_step": 219934, "epoch": 1817} {"train_loss": -41.9502067565918, "global_step": 219935, "epoch": 1817} {"train_loss": -42.433162689208984, "global_step": 219936, "epoch": 1817} {"train_loss": -42.4953498840332, "global_step": 219937, "epoch": 1817} {"train_loss": -42.096534729003906, "global_step": 219938, "epoch": 1817} {"train_loss": -42.8098258972168, "global_step": 219939, "epoch": 1817} {"train_loss": -42.68787384033203, "global_step": 219940, "epoch": 1817} {"train_loss": -42.2484016418457, "global_step": 219941, "epoch": 1817} {"train_loss": -42.80638122558594, "global_step": 219942, "epoch": 1817} {"train_loss": -42.39413070678711, "global_step": 219943, "epoch": 1817} {"train_loss": -41.70425033569336, "global_step": 219944, "epoch": 1817} {"train_loss": -40.06705856323242, "global_step": 219945, "epoch": 1817} {"train_loss": -40.55813217163086, "global_step": 219946, "epoch": 1817} {"train_loss": -42.21982955932617, "global_step": 219947, "epoch": 1817} {"train_loss": -40.73306655883789, "global_step": 219948, "epoch": 1817} {"train_loss": -38.56498336791992, "global_step": 219949, "epoch": 1817} {"train_loss": -39.6584358215332, "global_step": 219950, "epoch": 1817} {"train_loss": -41.46795654296875, "global_step": 219951, "epoch": 1817} {"train_loss": -39.99254608154297, "global_step": 219952, "epoch": 1817} {"train_loss": -42.212886810302734, "global_step": 219953, "epoch": 1817} {"train_loss": -41.12562942504883, "global_step": 219954, "epoch": 1817} {"train_loss": -39.90517807006836, "global_step": 219955, "epoch": 1817} {"train_loss": -42.398372650146484, "global_step": 219956, "epoch": 1817} {"train_loss": -39.801910400390625, "global_step": 219957, "epoch": 1817} {"train_loss": -40.0385627746582, "global_step": 219958, "epoch": 1817} {"train_loss": -41.077110290527344, "global_step": 219959, "epoch": 1817} {"train_loss": -38.82023239135742, "global_step": 219960, "epoch": 1817} {"train_loss": -40.576148986816406, "global_step": 219961, "epoch": 1817} {"train_loss": -36.419036865234375, "global_step": 219962, "epoch": 1817} {"train_loss": -38.08974838256836, "global_step": 219963, "epoch": 1817} {"train_loss": -39.982704162597656, "global_step": 219964, "epoch": 1817} {"train_loss": -34.49072265625, "global_step": 219965, "epoch": 1817} {"train_loss": -40.02935791015625, "global_step": 219966, "epoch": 1817} {"train_loss": -36.57808303833008, "global_step": 219967, "epoch": 1817} {"train_loss": -34.689090728759766, "global_step": 219968, "epoch": 1817} {"train_loss": -35.60390853881836, "global_step": 219969, "epoch": 1817} {"train_loss": -36.27981185913086, "global_step": 219970, "epoch": 1817} {"train_loss": -35.69755172729492, "global_step": 219971, "epoch": 1817} {"train_loss": -36.95734786987305, "global_step": 219972, "epoch": 1817} {"train_loss": -37.73537826538086, "global_step": 219973, "epoch": 1817} {"train_loss": -37.31437301635742, "global_step": 219974, "epoch": 1817} {"train_loss": -37.05322265625, "global_step": 219975, "epoch": 1817} {"train_loss": -38.27500534057617, "global_step": 219976, "epoch": 1817} {"train_loss": -41.198388123315226, "global_step": 219977, "epoch": 1817, "val_loss": 2538278.25} {"train_loss": -39.1706428527832, "global_step": 219978, "epoch": 1818} {"train_loss": -38.57546615600586, "global_step": 219979, "epoch": 1818} {"train_loss": -39.254215240478516, "global_step": 219980, "epoch": 1818} {"train_loss": -39.83982467651367, "global_step": 219981, "epoch": 1818} {"train_loss": -39.621456146240234, "global_step": 219982, "epoch": 1818} {"train_loss": -40.94662094116211, "global_step": 219983, "epoch": 1818} {"train_loss": -40.90787887573242, "global_step": 219984, "epoch": 1818} {"train_loss": -40.06053161621094, "global_step": 219985, "epoch": 1818} {"train_loss": -40.91328811645508, "global_step": 219986, "epoch": 1818} {"train_loss": -41.414215087890625, "global_step": 219987, "epoch": 1818} {"train_loss": -41.162235260009766, "global_step": 219988, "epoch": 1818} {"train_loss": -41.237361907958984, "global_step": 219989, "epoch": 1818} {"train_loss": -41.30083465576172, "global_step": 219990, "epoch": 1818} {"train_loss": -40.628173828125, "global_step": 219991, "epoch": 1818} {"train_loss": -40.492008209228516, "global_step": 219992, "epoch": 1818} {"train_loss": -40.720733642578125, "global_step": 219993, "epoch": 1818} {"train_loss": -41.755348205566406, "global_step": 219994, "epoch": 1818} {"train_loss": -40.75771713256836, "global_step": 219995, "epoch": 1818} {"train_loss": -40.63070297241211, "global_step": 219996, "epoch": 1818} {"train_loss": -40.634422302246094, "global_step": 219997, "epoch": 1818} {"train_loss": -39.810791015625, "global_step": 219998, "epoch": 1818} {"train_loss": -41.646095275878906, "global_step": 219999, "epoch": 1818} {"train_loss": -40.41036605834961, "global_step": 220000, "epoch": 1818} {"train_loss": -41.46847152709961, "global_step": 220001, "epoch": 1818} {"train_loss": -41.25404357910156, "global_step": 220002, "epoch": 1818} {"train_loss": -40.884437561035156, "global_step": 220003, "epoch": 1818} {"train_loss": -42.2595329284668, "global_step": 220004, "epoch": 1818} {"train_loss": -40.209266662597656, "global_step": 220005, "epoch": 1818} {"train_loss": -41.98164749145508, "global_step": 220006, "epoch": 1818} {"train_loss": -41.794761657714844, "global_step": 220007, "epoch": 1818} {"train_loss": -41.077449798583984, "global_step": 220008, "epoch": 1818} {"train_loss": -42.90945816040039, "global_step": 220009, "epoch": 1818} {"train_loss": -40.47654342651367, "global_step": 220010, "epoch": 1818} {"train_loss": -41.68804931640625, "global_step": 220011, "epoch": 1818} {"train_loss": -42.12163543701172, "global_step": 220012, "epoch": 1818} {"train_loss": -41.2850341796875, "global_step": 220013, "epoch": 1818} {"train_loss": -42.254817962646484, "global_step": 220014, "epoch": 1818} {"train_loss": -41.77775192260742, "global_step": 220015, "epoch": 1818} {"train_loss": -41.49850082397461, "global_step": 220016, "epoch": 1818} {"train_loss": -42.691253662109375, "global_step": 220017, "epoch": 1818} {"train_loss": -42.15108108520508, "global_step": 220018, "epoch": 1818} {"train_loss": -42.28670120239258, "global_step": 220019, "epoch": 1818} {"train_loss": -42.83211898803711, "global_step": 220020, "epoch": 1818} {"train_loss": -42.472450256347656, "global_step": 220021, "epoch": 1818} {"train_loss": -42.89459991455078, "global_step": 220022, "epoch": 1818} {"train_loss": -41.877864837646484, "global_step": 220023, "epoch": 1818} {"train_loss": -42.678829193115234, "global_step": 220024, "epoch": 1818} {"train_loss": -42.55580139160156, "global_step": 220025, "epoch": 1818} {"train_loss": -43.0786018371582, "global_step": 220026, "epoch": 1818} {"train_loss": -42.661537170410156, "global_step": 220027, "epoch": 1818} {"train_loss": -42.97798538208008, "global_step": 220028, "epoch": 1818} {"train_loss": -41.436248779296875, "global_step": 220029, "epoch": 1818} {"train_loss": -43.16988754272461, "global_step": 220030, "epoch": 1818} {"train_loss": -42.13620376586914, "global_step": 220031, "epoch": 1818} {"train_loss": -42.92569351196289, "global_step": 220032, "epoch": 1818} {"train_loss": -43.1081428527832, "global_step": 220033, "epoch": 1818} {"train_loss": -42.17608642578125, "global_step": 220034, "epoch": 1818} {"train_loss": -42.730987548828125, "global_step": 220035, "epoch": 1818} {"train_loss": -43.10661697387695, "global_step": 220036, "epoch": 1818} {"train_loss": -42.60503387451172, "global_step": 220037, "epoch": 1818} {"train_loss": -43.10297393798828, "global_step": 220038, "epoch": 1818} {"train_loss": -43.04122543334961, "global_step": 220039, "epoch": 1818} {"train_loss": -43.46387481689453, "global_step": 220040, "epoch": 1818} {"train_loss": -43.13494873046875, "global_step": 220041, "epoch": 1818} {"train_loss": -43.07087707519531, "global_step": 220042, "epoch": 1818} {"train_loss": -43.39127731323242, "global_step": 220043, "epoch": 1818} {"train_loss": -42.95161056518555, "global_step": 220044, "epoch": 1818} {"train_loss": -43.5447998046875, "global_step": 220045, "epoch": 1818} {"train_loss": -43.69065856933594, "global_step": 220046, "epoch": 1818} {"train_loss": -43.658660888671875, "global_step": 220047, "epoch": 1818} {"train_loss": -43.5625114440918, "global_step": 220048, "epoch": 1818} {"train_loss": -43.17112350463867, "global_step": 220049, "epoch": 1818} {"train_loss": -43.34352493286133, "global_step": 220050, "epoch": 1818} {"train_loss": -43.6649169921875, "global_step": 220051, "epoch": 1818} {"train_loss": -43.498477935791016, "global_step": 220052, "epoch": 1818} {"train_loss": -43.05863571166992, "global_step": 220053, "epoch": 1818} {"train_loss": -43.77252197265625, "global_step": 220054, "epoch": 1818} {"train_loss": -43.81313705444336, "global_step": 220055, "epoch": 1818} {"train_loss": -43.79757308959961, "global_step": 220056, "epoch": 1818} {"train_loss": -43.5196647644043, "global_step": 220057, "epoch": 1818} {"train_loss": -43.8117790222168, "global_step": 220058, "epoch": 1818} {"train_loss": -43.92449188232422, "global_step": 220059, "epoch": 1818} {"train_loss": -43.44330978393555, "global_step": 220060, "epoch": 1818} {"train_loss": -43.40943908691406, "global_step": 220061, "epoch": 1818} {"train_loss": -43.863643646240234, "global_step": 220062, "epoch": 1818} {"train_loss": -43.30854034423828, "global_step": 220063, "epoch": 1818} {"train_loss": -43.41663360595703, "global_step": 220064, "epoch": 1818} {"train_loss": -43.441837310791016, "global_step": 220065, "epoch": 1818} {"train_loss": -43.12935256958008, "global_step": 220066, "epoch": 1818} {"train_loss": -43.79862594604492, "global_step": 220067, "epoch": 1818} {"train_loss": -43.63258743286133, "global_step": 220068, "epoch": 1818} {"train_loss": -43.98643493652344, "global_step": 220069, "epoch": 1818} {"train_loss": -43.541927337646484, "global_step": 220070, "epoch": 1818} {"train_loss": -41.8203125, "global_step": 220071, "epoch": 1818} {"train_loss": -39.9658088684082, "global_step": 220072, "epoch": 1818} {"train_loss": -39.569149017333984, "global_step": 220073, "epoch": 1818} {"train_loss": -38.88338088989258, "global_step": 220074, "epoch": 1818} {"train_loss": -39.72307205200195, "global_step": 220075, "epoch": 1818} {"train_loss": -40.34904098510742, "global_step": 220076, "epoch": 1818} {"train_loss": -42.0673942565918, "global_step": 220077, "epoch": 1818} {"train_loss": -39.779903411865234, "global_step": 220078, "epoch": 1818} {"train_loss": -40.01784133911133, "global_step": 220079, "epoch": 1818} {"train_loss": -40.04220199584961, "global_step": 220080, "epoch": 1818} {"train_loss": -40.305755615234375, "global_step": 220081, "epoch": 1818} {"train_loss": -40.91268539428711, "global_step": 220082, "epoch": 1818} {"train_loss": -41.37348175048828, "global_step": 220083, "epoch": 1818} {"train_loss": -40.40364074707031, "global_step": 220084, "epoch": 1818} {"train_loss": -40.717952728271484, "global_step": 220085, "epoch": 1818} {"train_loss": -41.52621078491211, "global_step": 220086, "epoch": 1818} {"train_loss": -42.5028076171875, "global_step": 220087, "epoch": 1818} {"train_loss": -42.858375549316406, "global_step": 220088, "epoch": 1818} {"train_loss": -40.823974609375, "global_step": 220089, "epoch": 1818} {"train_loss": -38.99431610107422, "global_step": 220090, "epoch": 1818} {"train_loss": -42.45591354370117, "global_step": 220091, "epoch": 1818} {"train_loss": -39.64311981201172, "global_step": 220092, "epoch": 1818} {"train_loss": -42.49555587768555, "global_step": 220093, "epoch": 1818} {"train_loss": -39.56059646606445, "global_step": 220094, "epoch": 1818} {"train_loss": -42.4782829284668, "global_step": 220095, "epoch": 1818} {"train_loss": -39.24931716918945, "global_step": 220096, "epoch": 1818} {"train_loss": -40.03084182739258, "global_step": 220097, "epoch": 1818} {"train_loss": -41.87412693874895, "global_step": 220098, "epoch": 1818, "val_loss": 2609644.25} {"train_loss": -38.86933517456055, "global_step": 220099, "epoch": 1819} {"train_loss": -37.527076721191406, "global_step": 220100, "epoch": 1819} {"train_loss": -41.49240493774414, "global_step": 220101, "epoch": 1819} {"train_loss": -36.697349548339844, "global_step": 220102, "epoch": 1819} {"train_loss": -41.27035140991211, "global_step": 220103, "epoch": 1819} {"train_loss": -38.21274948120117, "global_step": 220104, "epoch": 1819} {"train_loss": -41.715396881103516, "global_step": 220105, "epoch": 1819} {"train_loss": -40.183250427246094, "global_step": 220106, "epoch": 1819} {"train_loss": -40.67084884643555, "global_step": 220107, "epoch": 1819} {"train_loss": -39.958213806152344, "global_step": 220108, "epoch": 1819} {"train_loss": -41.049495697021484, "global_step": 220109, "epoch": 1819} {"train_loss": -41.161067962646484, "global_step": 220110, "epoch": 1819} {"train_loss": -40.239418029785156, "global_step": 220111, "epoch": 1819} {"train_loss": -40.87877655029297, "global_step": 220112, "epoch": 1819} {"train_loss": -40.05705642700195, "global_step": 220113, "epoch": 1819} {"train_loss": -40.859153747558594, "global_step": 220114, "epoch": 1819} {"train_loss": -41.14039611816406, "global_step": 220115, "epoch": 1819} {"train_loss": -40.13625717163086, "global_step": 220116, "epoch": 1819} {"train_loss": -40.864288330078125, "global_step": 220117, "epoch": 1819} {"train_loss": -40.692989349365234, "global_step": 220118, "epoch": 1819} {"train_loss": -40.78213119506836, "global_step": 220119, "epoch": 1819} {"train_loss": -39.622947692871094, "global_step": 220120, "epoch": 1819} {"train_loss": -40.1735725402832, "global_step": 220121, "epoch": 1819} {"train_loss": -40.837738037109375, "global_step": 220122, "epoch": 1819} {"train_loss": -41.65214157104492, "global_step": 220123, "epoch": 1819} {"train_loss": -40.87919998168945, "global_step": 220124, "epoch": 1819} {"train_loss": -40.99519729614258, "global_step": 220125, "epoch": 1819} {"train_loss": -40.69709777832031, "global_step": 220126, "epoch": 1819} {"train_loss": -41.62457275390625, "global_step": 220127, "epoch": 1819} {"train_loss": -41.12058639526367, "global_step": 220128, "epoch": 1819} {"train_loss": -41.702571868896484, "global_step": 220129, "epoch": 1819} {"train_loss": -40.13095474243164, "global_step": 220130, "epoch": 1819} {"train_loss": -42.25777053833008, "global_step": 220131, "epoch": 1819} {"train_loss": -40.21116256713867, "global_step": 220132, "epoch": 1819} {"train_loss": -41.79312515258789, "global_step": 220133, "epoch": 1819} {"train_loss": -42.87288284301758, "global_step": 220134, "epoch": 1819} {"train_loss": -41.24628448486328, "global_step": 220135, "epoch": 1819} {"train_loss": -42.889251708984375, "global_step": 220136, "epoch": 1819} {"train_loss": -42.61308670043945, "global_step": 220137, "epoch": 1819} {"train_loss": -42.00956344604492, "global_step": 220138, "epoch": 1819} {"train_loss": -42.801025390625, "global_step": 220139, "epoch": 1819} {"train_loss": -42.79745864868164, "global_step": 220140, "epoch": 1819} {"train_loss": -42.19179916381836, "global_step": 220141, "epoch": 1819} {"train_loss": -42.58849334716797, "global_step": 220142, "epoch": 1819} {"train_loss": -42.449310302734375, "global_step": 220143, "epoch": 1819} {"train_loss": -42.16627883911133, "global_step": 220144, "epoch": 1819} {"train_loss": -43.2784423828125, "global_step": 220145, "epoch": 1819} {"train_loss": -42.20127868652344, "global_step": 220146, "epoch": 1819} {"train_loss": -42.86336898803711, "global_step": 220147, "epoch": 1819} {"train_loss": -43.075469970703125, "global_step": 220148, "epoch": 1819} {"train_loss": -42.553890228271484, "global_step": 220149, "epoch": 1819} {"train_loss": -43.0423698425293, "global_step": 220150, "epoch": 1819} {"train_loss": -43.02008819580078, "global_step": 220151, "epoch": 1819} {"train_loss": -42.80335235595703, "global_step": 220152, "epoch": 1819} {"train_loss": -43.07358932495117, "global_step": 220153, "epoch": 1819} {"train_loss": -42.93605041503906, "global_step": 220154, "epoch": 1819} {"train_loss": -43.0290641784668, "global_step": 220155, "epoch": 1819} {"train_loss": -42.97614669799805, "global_step": 220156, "epoch": 1819} {"train_loss": -43.363155364990234, "global_step": 220157, "epoch": 1819} {"train_loss": -42.80177688598633, "global_step": 220158, "epoch": 1819} {"train_loss": -43.37708282470703, "global_step": 220159, "epoch": 1819} {"train_loss": -43.62234115600586, "global_step": 220160, "epoch": 1819} {"train_loss": -43.38778305053711, "global_step": 220161, "epoch": 1819} {"train_loss": -42.785125732421875, "global_step": 220162, "epoch": 1819} {"train_loss": -43.463375091552734, "global_step": 220163, "epoch": 1819} {"train_loss": -43.28960037231445, "global_step": 220164, "epoch": 1819} {"train_loss": -41.66823959350586, "global_step": 220165, "epoch": 1819} {"train_loss": -42.16455078125, "global_step": 220166, "epoch": 1819} {"train_loss": -43.12297058105469, "global_step": 220167, "epoch": 1819} {"train_loss": -42.28496170043945, "global_step": 220168, "epoch": 1819} {"train_loss": -42.545833587646484, "global_step": 220169, "epoch": 1819} {"train_loss": -43.0297737121582, "global_step": 220170, "epoch": 1819} {"train_loss": -43.1938591003418, "global_step": 220171, "epoch": 1819} {"train_loss": -42.63433074951172, "global_step": 220172, "epoch": 1819} {"train_loss": -43.47845458984375, "global_step": 220173, "epoch": 1819} {"train_loss": -43.45466232299805, "global_step": 220174, "epoch": 1819} {"train_loss": -42.99497604370117, "global_step": 220175, "epoch": 1819} {"train_loss": -42.793575286865234, "global_step": 220176, "epoch": 1819} {"train_loss": -42.983375549316406, "global_step": 220177, "epoch": 1819} {"train_loss": -43.217201232910156, "global_step": 220178, "epoch": 1819} {"train_loss": -43.32514953613281, "global_step": 220179, "epoch": 1819} {"train_loss": -43.878868103027344, "global_step": 220180, "epoch": 1819} {"train_loss": -43.3997688293457, "global_step": 220181, "epoch": 1819} {"train_loss": -43.46189498901367, "global_step": 220182, "epoch": 1819} {"train_loss": -43.16205978393555, "global_step": 220183, "epoch": 1819} {"train_loss": -42.773250579833984, "global_step": 220184, "epoch": 1819} {"train_loss": -42.055416107177734, "global_step": 220185, "epoch": 1819} {"train_loss": -40.99220275878906, "global_step": 220186, "epoch": 1819} {"train_loss": -43.59208297729492, "global_step": 220187, "epoch": 1819} {"train_loss": -42.300472259521484, "global_step": 220188, "epoch": 1819} {"train_loss": -39.409053802490234, "global_step": 220189, "epoch": 1819} {"train_loss": -43.21027755737305, "global_step": 220190, "epoch": 1819} {"train_loss": -41.03377914428711, "global_step": 220191, "epoch": 1819} {"train_loss": -40.069454193115234, "global_step": 220192, "epoch": 1819} {"train_loss": -43.19157791137695, "global_step": 220193, "epoch": 1819} {"train_loss": -37.50703048706055, "global_step": 220194, "epoch": 1819} {"train_loss": -40.99910354614258, "global_step": 220195, "epoch": 1819} {"train_loss": -35.259822845458984, "global_step": 220196, "epoch": 1819} {"train_loss": -33.99296951293945, "global_step": 220197, "epoch": 1819} {"train_loss": -31.780460357666016, "global_step": 220198, "epoch": 1819} {"train_loss": -32.97987365722656, "global_step": 220199, "epoch": 1819} {"train_loss": -35.59743881225586, "global_step": 220200, "epoch": 1819} {"train_loss": -34.08928680419922, "global_step": 220201, "epoch": 1819} {"train_loss": -37.05824661254883, "global_step": 220202, "epoch": 1819} {"train_loss": -35.91021728515625, "global_step": 220203, "epoch": 1819} {"train_loss": -37.742794036865234, "global_step": 220204, "epoch": 1819} {"train_loss": -37.82854461669922, "global_step": 220205, "epoch": 1819} {"train_loss": -36.09822082519531, "global_step": 220206, "epoch": 1819} {"train_loss": -36.799217224121094, "global_step": 220207, "epoch": 1819} {"train_loss": -37.55149459838867, "global_step": 220208, "epoch": 1819} {"train_loss": -38.89982986450195, "global_step": 220209, "epoch": 1819} {"train_loss": -39.01688766479492, "global_step": 220210, "epoch": 1819} {"train_loss": -38.27581024169922, "global_step": 220211, "epoch": 1819} {"train_loss": -38.837432861328125, "global_step": 220212, "epoch": 1819} {"train_loss": -38.27022933959961, "global_step": 220213, "epoch": 1819} {"train_loss": -39.71123504638672, "global_step": 220214, "epoch": 1819} {"train_loss": -39.997066497802734, "global_step": 220215, "epoch": 1819} {"train_loss": -39.77679443359375, "global_step": 220216, "epoch": 1819} {"train_loss": -40.277313232421875, "global_step": 220217, "epoch": 1819} {"train_loss": -40.9765510559082, "global_step": 220218, "epoch": 1819} {"train_loss": -40.9606298651577, "global_step": 220219, "epoch": 1819, "val_loss": 2534771.75} {"train_loss": -40.6987419128418, "global_step": 220220, "epoch": 1820} {"train_loss": -39.6919059753418, "global_step": 220221, "epoch": 1820} {"train_loss": -41.05602264404297, "global_step": 220222, "epoch": 1820} {"train_loss": -40.40289306640625, "global_step": 220223, "epoch": 1820} {"train_loss": -41.003143310546875, "global_step": 220224, "epoch": 1820} {"train_loss": -41.04592514038086, "global_step": 220225, "epoch": 1820} {"train_loss": -41.364986419677734, "global_step": 220226, "epoch": 1820} {"train_loss": -41.50239181518555, "global_step": 220227, "epoch": 1820} {"train_loss": -41.43147659301758, "global_step": 220228, "epoch": 1820} {"train_loss": -42.24935531616211, "global_step": 220229, "epoch": 1820} {"train_loss": -40.81702423095703, "global_step": 220230, "epoch": 1820} {"train_loss": -41.3707275390625, "global_step": 220231, "epoch": 1820} {"train_loss": -42.617042541503906, "global_step": 220232, "epoch": 1820} {"train_loss": -42.19790267944336, "global_step": 220233, "epoch": 1820} {"train_loss": -41.87080001831055, "global_step": 220234, "epoch": 1820} {"train_loss": -41.463661193847656, "global_step": 220235, "epoch": 1820} {"train_loss": -42.60110855102539, "global_step": 220236, "epoch": 1820} {"train_loss": -42.44504928588867, "global_step": 220237, "epoch": 1820} {"train_loss": -41.833961486816406, "global_step": 220238, "epoch": 1820} {"train_loss": -41.991085052490234, "global_step": 220239, "epoch": 1820} {"train_loss": -42.54158401489258, "global_step": 220240, "epoch": 1820} {"train_loss": -42.721656799316406, "global_step": 220241, "epoch": 1820} {"train_loss": -42.1531982421875, "global_step": 220242, "epoch": 1820} {"train_loss": -41.86903762817383, "global_step": 220243, "epoch": 1820} {"train_loss": -42.0463981628418, "global_step": 220244, "epoch": 1820} {"train_loss": -42.88166427612305, "global_step": 220245, "epoch": 1820} {"train_loss": -41.500770568847656, "global_step": 220246, "epoch": 1820} {"train_loss": -42.48989486694336, "global_step": 220247, "epoch": 1820} {"train_loss": -42.52912139892578, "global_step": 220248, "epoch": 1820} {"train_loss": -41.93463897705078, "global_step": 220249, "epoch": 1820} {"train_loss": -42.40394592285156, "global_step": 220250, "epoch": 1820} {"train_loss": -42.94886779785156, "global_step": 220251, "epoch": 1820} {"train_loss": -42.981056213378906, "global_step": 220252, "epoch": 1820} {"train_loss": -42.78733825683594, "global_step": 220253, "epoch": 1820} {"train_loss": -42.49242401123047, "global_step": 220254, "epoch": 1820} {"train_loss": -42.81109619140625, "global_step": 220255, "epoch": 1820} {"train_loss": -43.21759796142578, "global_step": 220256, "epoch": 1820} {"train_loss": -42.99739456176758, "global_step": 220257, "epoch": 1820} {"train_loss": -43.24813461303711, "global_step": 220258, "epoch": 1820} {"train_loss": -43.72336959838867, "global_step": 220259, "epoch": 1820} {"train_loss": -42.836952209472656, "global_step": 220260, "epoch": 1820} {"train_loss": -42.36738204956055, "global_step": 220261, "epoch": 1820} {"train_loss": -42.97707748413086, "global_step": 220262, "epoch": 1820} {"train_loss": -43.33530807495117, "global_step": 220263, "epoch": 1820} {"train_loss": -43.58027648925781, "global_step": 220264, "epoch": 1820} {"train_loss": -42.817161560058594, "global_step": 220265, "epoch": 1820} {"train_loss": -43.31593704223633, "global_step": 220266, "epoch": 1820} {"train_loss": -43.87908172607422, "global_step": 220267, "epoch": 1820} {"train_loss": -43.61149978637695, "global_step": 220268, "epoch": 1820} {"train_loss": -43.28504180908203, "global_step": 220269, "epoch": 1820} {"train_loss": -43.07666778564453, "global_step": 220270, "epoch": 1820} {"train_loss": -43.63167190551758, "global_step": 220271, "epoch": 1820} {"train_loss": -43.61515426635742, "global_step": 220272, "epoch": 1820} {"train_loss": -43.46448516845703, "global_step": 220273, "epoch": 1820} {"train_loss": -43.539302825927734, "global_step": 220274, "epoch": 1820} {"train_loss": -43.47414779663086, "global_step": 220275, "epoch": 1820} {"train_loss": -43.41138458251953, "global_step": 220276, "epoch": 1820} {"train_loss": -43.127647399902344, "global_step": 220277, "epoch": 1820} {"train_loss": -42.80898666381836, "global_step": 220278, "epoch": 1820} {"train_loss": -43.812286376953125, "global_step": 220279, "epoch": 1820} {"train_loss": -43.949241638183594, "global_step": 220280, "epoch": 1820} {"train_loss": -43.19112014770508, "global_step": 220281, "epoch": 1820} {"train_loss": -42.931495666503906, "global_step": 220282, "epoch": 1820} {"train_loss": -42.758663177490234, "global_step": 220283, "epoch": 1820} {"train_loss": -43.0117301940918, "global_step": 220284, "epoch": 1820} {"train_loss": -43.2718505859375, "global_step": 220285, "epoch": 1820} {"train_loss": -43.337520599365234, "global_step": 220286, "epoch": 1820} {"train_loss": -43.07916259765625, "global_step": 220287, "epoch": 1820} {"train_loss": -42.836605072021484, "global_step": 220288, "epoch": 1820} {"train_loss": -42.904296875, "global_step": 220289, "epoch": 1820} {"train_loss": -43.40038299560547, "global_step": 220290, "epoch": 1820} {"train_loss": -43.43418884277344, "global_step": 220291, "epoch": 1820} {"train_loss": -43.06499481201172, "global_step": 220292, "epoch": 1820} {"train_loss": -42.170589447021484, "global_step": 220293, "epoch": 1820} {"train_loss": -40.15339279174805, "global_step": 220294, "epoch": 1820} {"train_loss": -43.156402587890625, "global_step": 220295, "epoch": 1820} {"train_loss": -42.073707580566406, "global_step": 220296, "epoch": 1820} {"train_loss": -39.67665481567383, "global_step": 220297, "epoch": 1820} {"train_loss": -42.9138298034668, "global_step": 220298, "epoch": 1820} {"train_loss": -40.0161018371582, "global_step": 220299, "epoch": 1820} {"train_loss": -41.7347526550293, "global_step": 220300, "epoch": 1820} {"train_loss": -41.60889434814453, "global_step": 220301, "epoch": 1820} {"train_loss": -41.0314826965332, "global_step": 220302, "epoch": 1820} {"train_loss": -41.34806442260742, "global_step": 220303, "epoch": 1820} {"train_loss": -42.039058685302734, "global_step": 220304, "epoch": 1820} {"train_loss": -41.61079788208008, "global_step": 220305, "epoch": 1820} {"train_loss": -40.867061614990234, "global_step": 220306, "epoch": 1820} {"train_loss": -42.554405212402344, "global_step": 220307, "epoch": 1820} {"train_loss": -39.93160629272461, "global_step": 220308, "epoch": 1820} {"train_loss": -41.110816955566406, "global_step": 220309, "epoch": 1820} {"train_loss": -43.29246520996094, "global_step": 220310, "epoch": 1820} {"train_loss": -40.590023040771484, "global_step": 220311, "epoch": 1820} {"train_loss": -43.171173095703125, "global_step": 220312, "epoch": 1820} {"train_loss": -41.154396057128906, "global_step": 220313, "epoch": 1820} {"train_loss": -41.555137634277344, "global_step": 220314, "epoch": 1820} {"train_loss": -42.953956604003906, "global_step": 220315, "epoch": 1820} {"train_loss": -41.968475341796875, "global_step": 220316, "epoch": 1820} {"train_loss": -42.98090744018555, "global_step": 220317, "epoch": 1820} {"train_loss": -42.48316192626953, "global_step": 220318, "epoch": 1820} {"train_loss": -43.24552536010742, "global_step": 220319, "epoch": 1820} {"train_loss": -43.0386962890625, "global_step": 220320, "epoch": 1820} {"train_loss": -42.33083724975586, "global_step": 220321, "epoch": 1820} {"train_loss": -42.704856872558594, "global_step": 220322, "epoch": 1820} {"train_loss": -42.87919235229492, "global_step": 220323, "epoch": 1820} {"train_loss": -41.29755401611328, "global_step": 220324, "epoch": 1820} {"train_loss": -42.19279861450195, "global_step": 220325, "epoch": 1820} {"train_loss": -41.90546417236328, "global_step": 220326, "epoch": 1820} {"train_loss": -43.45469284057617, "global_step": 220327, "epoch": 1820} {"train_loss": -42.28372573852539, "global_step": 220328, "epoch": 1820} {"train_loss": -41.3427619934082, "global_step": 220329, "epoch": 1820} {"train_loss": -41.733154296875, "global_step": 220330, "epoch": 1820} {"train_loss": -41.99146270751953, "global_step": 220331, "epoch": 1820} {"train_loss": -42.22379684448242, "global_step": 220332, "epoch": 1820} {"train_loss": -42.59843063354492, "global_step": 220333, "epoch": 1820} {"train_loss": -43.2686882019043, "global_step": 220334, "epoch": 1820} {"train_loss": -42.21611404418945, "global_step": 220335, "epoch": 1820} {"train_loss": -41.58129119873047, "global_step": 220336, "epoch": 1820} {"train_loss": -40.44540023803711, "global_step": 220337, "epoch": 1820} {"train_loss": -41.250885009765625, "global_step": 220338, "epoch": 1820} {"train_loss": -38.35189437866211, "global_step": 220339, "epoch": 1820} {"train_loss": -42.2734267179631, "global_step": 220340, "epoch": 1820, "val_loss": 2536029.25} {"train_loss": -42.28479766845703, "global_step": 220341, "epoch": 1821} {"train_loss": -40.598915100097656, "global_step": 220342, "epoch": 1821} {"train_loss": -40.53358840942383, "global_step": 220343, "epoch": 1821} {"train_loss": -40.62033462524414, "global_step": 220344, "epoch": 1821} {"train_loss": -41.6219482421875, "global_step": 220345, "epoch": 1821} {"train_loss": -40.89514923095703, "global_step": 220346, "epoch": 1821} {"train_loss": -41.50664138793945, "global_step": 220347, "epoch": 1821} {"train_loss": -42.39070510864258, "global_step": 220348, "epoch": 1821} {"train_loss": -42.36643600463867, "global_step": 220349, "epoch": 1821} {"train_loss": -42.954097747802734, "global_step": 220350, "epoch": 1821} {"train_loss": -42.48988723754883, "global_step": 220351, "epoch": 1821} {"train_loss": -42.660377502441406, "global_step": 220352, "epoch": 1821} {"train_loss": -41.840633392333984, "global_step": 220353, "epoch": 1821} {"train_loss": -42.608726501464844, "global_step": 220354, "epoch": 1821} {"train_loss": -41.92716979980469, "global_step": 220355, "epoch": 1821} {"train_loss": -41.29413604736328, "global_step": 220356, "epoch": 1821} {"train_loss": -42.17499542236328, "global_step": 220357, "epoch": 1821} {"train_loss": -42.267608642578125, "global_step": 220358, "epoch": 1821} {"train_loss": -41.72994613647461, "global_step": 220359, "epoch": 1821} {"train_loss": -42.27750015258789, "global_step": 220360, "epoch": 1821} {"train_loss": -42.096519470214844, "global_step": 220361, "epoch": 1821} {"train_loss": -41.5225830078125, "global_step": 220362, "epoch": 1821} {"train_loss": -42.3934326171875, "global_step": 220363, "epoch": 1821} {"train_loss": -42.60738754272461, "global_step": 220364, "epoch": 1821} {"train_loss": -42.07563781738281, "global_step": 220365, "epoch": 1821} {"train_loss": -41.617713928222656, "global_step": 220366, "epoch": 1821} {"train_loss": -42.013084411621094, "global_step": 220367, "epoch": 1821} {"train_loss": -40.117645263671875, "global_step": 220368, "epoch": 1821} {"train_loss": -42.18844223022461, "global_step": 220369, "epoch": 1821} {"train_loss": -41.782779693603516, "global_step": 220370, "epoch": 1821} {"train_loss": -40.967769622802734, "global_step": 220371, "epoch": 1821} {"train_loss": -41.46525192260742, "global_step": 220372, "epoch": 1821} {"train_loss": -40.865596771240234, "global_step": 220373, "epoch": 1821} {"train_loss": -42.59243392944336, "global_step": 220374, "epoch": 1821} {"train_loss": -41.95695495605469, "global_step": 220375, "epoch": 1821} {"train_loss": -41.59349822998047, "global_step": 220376, "epoch": 1821} {"train_loss": -41.81916427612305, "global_step": 220377, "epoch": 1821} {"train_loss": -40.85527420043945, "global_step": 220378, "epoch": 1821} {"train_loss": -42.417049407958984, "global_step": 220379, "epoch": 1821} {"train_loss": -42.77362823486328, "global_step": 220380, "epoch": 1821} {"train_loss": -41.438812255859375, "global_step": 220381, "epoch": 1821} {"train_loss": -42.93129348754883, "global_step": 220382, "epoch": 1821} {"train_loss": -42.42332458496094, "global_step": 220383, "epoch": 1821} {"train_loss": -42.1225700378418, "global_step": 220384, "epoch": 1821} {"train_loss": -42.31355667114258, "global_step": 220385, "epoch": 1821} {"train_loss": -42.54059600830078, "global_step": 220386, "epoch": 1821} {"train_loss": -42.49245071411133, "global_step": 220387, "epoch": 1821} {"train_loss": -41.4306755065918, "global_step": 220388, "epoch": 1821} {"train_loss": -42.52809143066406, "global_step": 220389, "epoch": 1821} {"train_loss": -43.39215087890625, "global_step": 220390, "epoch": 1821} {"train_loss": -42.732643127441406, "global_step": 220391, "epoch": 1821} {"train_loss": -42.97266387939453, "global_step": 220392, "epoch": 1821} {"train_loss": -43.41645431518555, "global_step": 220393, "epoch": 1821} {"train_loss": -42.45380401611328, "global_step": 220394, "epoch": 1821} {"train_loss": -42.72412872314453, "global_step": 220395, "epoch": 1821} {"train_loss": -43.24152755737305, "global_step": 220396, "epoch": 1821} {"train_loss": -43.25631332397461, "global_step": 220397, "epoch": 1821} {"train_loss": -43.3059196472168, "global_step": 220398, "epoch": 1821} {"train_loss": -42.90934371948242, "global_step": 220399, "epoch": 1821} {"train_loss": -43.61696243286133, "global_step": 220400, "epoch": 1821} {"train_loss": -43.005348205566406, "global_step": 220401, "epoch": 1821} {"train_loss": -43.135009765625, "global_step": 220402, "epoch": 1821} {"train_loss": -42.82908630371094, "global_step": 220403, "epoch": 1821} {"train_loss": -42.676551818847656, "global_step": 220404, "epoch": 1821} {"train_loss": -43.192073822021484, "global_step": 220405, "epoch": 1821} {"train_loss": -43.42915725708008, "global_step": 220406, "epoch": 1821} {"train_loss": -42.86007308959961, "global_step": 220407, "epoch": 1821} {"train_loss": -43.09952926635742, "global_step": 220408, "epoch": 1821} {"train_loss": -43.62153244018555, "global_step": 220409, "epoch": 1821} {"train_loss": -43.11997604370117, "global_step": 220410, "epoch": 1821} {"train_loss": -42.95115661621094, "global_step": 220411, "epoch": 1821} {"train_loss": -43.75676345825195, "global_step": 220412, "epoch": 1821} {"train_loss": -42.8745002746582, "global_step": 220413, "epoch": 1821} {"train_loss": -42.96025085449219, "global_step": 220414, "epoch": 1821} {"train_loss": -43.2552604675293, "global_step": 220415, "epoch": 1821} {"train_loss": -41.972354888916016, "global_step": 220416, "epoch": 1821} {"train_loss": -42.67132568359375, "global_step": 220417, "epoch": 1821} {"train_loss": -43.339900970458984, "global_step": 220418, "epoch": 1821} {"train_loss": -42.33976364135742, "global_step": 220419, "epoch": 1821} {"train_loss": -42.68314743041992, "global_step": 220420, "epoch": 1821} {"train_loss": -41.971195220947266, "global_step": 220421, "epoch": 1821} {"train_loss": -41.7288818359375, "global_step": 220422, "epoch": 1821} {"train_loss": -42.908504486083984, "global_step": 220423, "epoch": 1821} {"train_loss": -41.540287017822266, "global_step": 220424, "epoch": 1821} {"train_loss": -42.560359954833984, "global_step": 220425, "epoch": 1821} {"train_loss": -41.794490814208984, "global_step": 220426, "epoch": 1821} {"train_loss": -41.058895111083984, "global_step": 220427, "epoch": 1821} {"train_loss": -41.84769058227539, "global_step": 220428, "epoch": 1821} {"train_loss": -40.389198303222656, "global_step": 220429, "epoch": 1821} {"train_loss": -41.50935363769531, "global_step": 220430, "epoch": 1821} {"train_loss": -41.75606918334961, "global_step": 220431, "epoch": 1821} {"train_loss": -41.781436920166016, "global_step": 220432, "epoch": 1821} {"train_loss": -42.27824783325195, "global_step": 220433, "epoch": 1821} {"train_loss": -41.98843002319336, "global_step": 220434, "epoch": 1821} {"train_loss": -41.18525695800781, "global_step": 220435, "epoch": 1821} {"train_loss": -42.39606475830078, "global_step": 220436, "epoch": 1821} {"train_loss": -42.25346755981445, "global_step": 220437, "epoch": 1821} {"train_loss": -40.71523666381836, "global_step": 220438, "epoch": 1821} {"train_loss": -42.204036712646484, "global_step": 220439, "epoch": 1821} {"train_loss": -39.60139083862305, "global_step": 220440, "epoch": 1821} {"train_loss": -41.683589935302734, "global_step": 220441, "epoch": 1821} {"train_loss": -41.24169158935547, "global_step": 220442, "epoch": 1821} {"train_loss": -38.77204513549805, "global_step": 220443, "epoch": 1821} {"train_loss": -40.54433822631836, "global_step": 220444, "epoch": 1821} {"train_loss": -38.77494430541992, "global_step": 220445, "epoch": 1821} {"train_loss": -41.215370178222656, "global_step": 220446, "epoch": 1821} {"train_loss": -39.65664291381836, "global_step": 220447, "epoch": 1821} {"train_loss": -41.21571731567383, "global_step": 220448, "epoch": 1821} {"train_loss": -40.03342819213867, "global_step": 220449, "epoch": 1821} {"train_loss": -42.22576904296875, "global_step": 220450, "epoch": 1821} {"train_loss": -40.3841438293457, "global_step": 220451, "epoch": 1821} {"train_loss": -42.12714767456055, "global_step": 220452, "epoch": 1821} {"train_loss": -40.40776824951172, "global_step": 220453, "epoch": 1821} {"train_loss": -42.35724639892578, "global_step": 220454, "epoch": 1821} {"train_loss": -40.28101348876953, "global_step": 220455, "epoch": 1821} {"train_loss": -42.67594528198242, "global_step": 220456, "epoch": 1821} {"train_loss": -40.08834457397461, "global_step": 220457, "epoch": 1821} {"train_loss": -43.22896194458008, "global_step": 220458, "epoch": 1821} {"train_loss": -41.32155227661133, "global_step": 220459, "epoch": 1821} {"train_loss": -42.22886276245117, "global_step": 220460, "epoch": 1821} {"train_loss": -42.00599831194917, "global_step": 220461, "epoch": 1821, "val_loss": 2619619.0} {"train_loss": -42.48679733276367, "global_step": 220462, "epoch": 1822} {"train_loss": -42.2479133605957, "global_step": 220463, "epoch": 1822} {"train_loss": -43.036773681640625, "global_step": 220464, "epoch": 1822} {"train_loss": -42.21125030517578, "global_step": 220465, "epoch": 1822} {"train_loss": -42.20170211791992, "global_step": 220466, "epoch": 1822} {"train_loss": -41.90095901489258, "global_step": 220467, "epoch": 1822} {"train_loss": -42.58549118041992, "global_step": 220468, "epoch": 1822} {"train_loss": -42.84474563598633, "global_step": 220469, "epoch": 1822} {"train_loss": -42.08636474609375, "global_step": 220470, "epoch": 1822} {"train_loss": -42.192989349365234, "global_step": 220471, "epoch": 1822} {"train_loss": -42.96889877319336, "global_step": 220472, "epoch": 1822} {"train_loss": -42.5953483581543, "global_step": 220473, "epoch": 1822} {"train_loss": -42.93239212036133, "global_step": 220474, "epoch": 1822} {"train_loss": -43.003231048583984, "global_step": 220475, "epoch": 1822} {"train_loss": -43.165836334228516, "global_step": 220476, "epoch": 1822} {"train_loss": -42.019351959228516, "global_step": 220477, "epoch": 1822} {"train_loss": -42.751895904541016, "global_step": 220478, "epoch": 1822} {"train_loss": -42.22402572631836, "global_step": 220479, "epoch": 1822} {"train_loss": -42.717071533203125, "global_step": 220480, "epoch": 1822} {"train_loss": -42.718055725097656, "global_step": 220481, "epoch": 1822} {"train_loss": -42.24304962158203, "global_step": 220482, "epoch": 1822} {"train_loss": -41.681114196777344, "global_step": 220483, "epoch": 1822} {"train_loss": -40.21900939941406, "global_step": 220484, "epoch": 1822} {"train_loss": -41.54643630981445, "global_step": 220485, "epoch": 1822} {"train_loss": -42.309661865234375, "global_step": 220486, "epoch": 1822} {"train_loss": -41.56867980957031, "global_step": 220487, "epoch": 1822} {"train_loss": -41.63569259643555, "global_step": 220488, "epoch": 1822} {"train_loss": -42.80473709106445, "global_step": 220489, "epoch": 1822} {"train_loss": -40.68042755126953, "global_step": 220490, "epoch": 1822} {"train_loss": -41.77532958984375, "global_step": 220491, "epoch": 1822} {"train_loss": -41.37827682495117, "global_step": 220492, "epoch": 1822} {"train_loss": -41.501216888427734, "global_step": 220493, "epoch": 1822} {"train_loss": -40.592735290527344, "global_step": 220494, "epoch": 1822} {"train_loss": -41.46770477294922, "global_step": 220495, "epoch": 1822} {"train_loss": -41.063941955566406, "global_step": 220496, "epoch": 1822} {"train_loss": -42.548641204833984, "global_step": 220497, "epoch": 1822} {"train_loss": -42.05097198486328, "global_step": 220498, "epoch": 1822} {"train_loss": -41.06103515625, "global_step": 220499, "epoch": 1822} {"train_loss": -42.37034606933594, "global_step": 220500, "epoch": 1822} {"train_loss": -42.7416877746582, "global_step": 220501, "epoch": 1822} {"train_loss": -42.50040817260742, "global_step": 220502, "epoch": 1822} {"train_loss": -42.090023040771484, "global_step": 220503, "epoch": 1822} {"train_loss": -42.18684005737305, "global_step": 220504, "epoch": 1822} {"train_loss": -42.77627182006836, "global_step": 220505, "epoch": 1822} {"train_loss": -42.66355895996094, "global_step": 220506, "epoch": 1822} {"train_loss": -42.146331787109375, "global_step": 220507, "epoch": 1822} {"train_loss": -43.211952209472656, "global_step": 220508, "epoch": 1822} {"train_loss": -42.12784957885742, "global_step": 220509, "epoch": 1822} {"train_loss": -41.37078857421875, "global_step": 220510, "epoch": 1822} {"train_loss": -42.72511672973633, "global_step": 220511, "epoch": 1822} {"train_loss": -40.697509765625, "global_step": 220512, "epoch": 1822} {"train_loss": -41.00932693481445, "global_step": 220513, "epoch": 1822} {"train_loss": -43.040618896484375, "global_step": 220514, "epoch": 1822} {"train_loss": -39.79677200317383, "global_step": 220515, "epoch": 1822} {"train_loss": -43.10681915283203, "global_step": 220516, "epoch": 1822} {"train_loss": -38.7560920715332, "global_step": 220517, "epoch": 1822} {"train_loss": -42.4398193359375, "global_step": 220518, "epoch": 1822} {"train_loss": -37.82910919189453, "global_step": 220519, "epoch": 1822} {"train_loss": -41.5863037109375, "global_step": 220520, "epoch": 1822} {"train_loss": -36.238826751708984, "global_step": 220521, "epoch": 1822} {"train_loss": -37.75665283203125, "global_step": 220522, "epoch": 1822} {"train_loss": -35.67197799682617, "global_step": 220523, "epoch": 1822} {"train_loss": -34.47855758666992, "global_step": 220524, "epoch": 1822} {"train_loss": -37.307403564453125, "global_step": 220525, "epoch": 1822} {"train_loss": -35.325252532958984, "global_step": 220526, "epoch": 1822} {"train_loss": -37.985198974609375, "global_step": 220527, "epoch": 1822} {"train_loss": -36.5754508972168, "global_step": 220528, "epoch": 1822} {"train_loss": -37.21584701538086, "global_step": 220529, "epoch": 1822} {"train_loss": -36.23722457885742, "global_step": 220530, "epoch": 1822} {"train_loss": -36.07453155517578, "global_step": 220531, "epoch": 1822} {"train_loss": -37.499210357666016, "global_step": 220532, "epoch": 1822} {"train_loss": -37.941917419433594, "global_step": 220533, "epoch": 1822} {"train_loss": -37.3170280456543, "global_step": 220534, "epoch": 1822} {"train_loss": -37.65900802612305, "global_step": 220535, "epoch": 1822} {"train_loss": -37.73665237426758, "global_step": 220536, "epoch": 1822} {"train_loss": -38.18284225463867, "global_step": 220537, "epoch": 1822} {"train_loss": -37.44013214111328, "global_step": 220538, "epoch": 1822} {"train_loss": -37.7310905456543, "global_step": 220539, "epoch": 1822} {"train_loss": -38.30353546142578, "global_step": 220540, "epoch": 1822} {"train_loss": -37.70396041870117, "global_step": 220541, "epoch": 1822} {"train_loss": -38.48202133178711, "global_step": 220542, "epoch": 1822} {"train_loss": -38.657920837402344, "global_step": 220543, "epoch": 1822} {"train_loss": -38.07863998413086, "global_step": 220544, "epoch": 1822} {"train_loss": -38.063926696777344, "global_step": 220545, "epoch": 1822} {"train_loss": -38.62146759033203, "global_step": 220546, "epoch": 1822} {"train_loss": -39.18564987182617, "global_step": 220547, "epoch": 1822} {"train_loss": -38.288612365722656, "global_step": 220548, "epoch": 1822} {"train_loss": -39.14884567260742, "global_step": 220549, "epoch": 1822} {"train_loss": -39.09857177734375, "global_step": 220550, "epoch": 1822} {"train_loss": -39.57905197143555, "global_step": 220551, "epoch": 1822} {"train_loss": -39.19424057006836, "global_step": 220552, "epoch": 1822} {"train_loss": -39.20822525024414, "global_step": 220553, "epoch": 1822} {"train_loss": -39.3062858581543, "global_step": 220554, "epoch": 1822} {"train_loss": -39.84355545043945, "global_step": 220555, "epoch": 1822} {"train_loss": -39.281585693359375, "global_step": 220556, "epoch": 1822} {"train_loss": -39.103363037109375, "global_step": 220557, "epoch": 1822} {"train_loss": -40.358638763427734, "global_step": 220558, "epoch": 1822} {"train_loss": -39.687660217285156, "global_step": 220559, "epoch": 1822} {"train_loss": -40.06644821166992, "global_step": 220560, "epoch": 1822} {"train_loss": -40.389949798583984, "global_step": 220561, "epoch": 1822} {"train_loss": -39.955108642578125, "global_step": 220562, "epoch": 1822} {"train_loss": -39.35211181640625, "global_step": 220563, "epoch": 1822} {"train_loss": -40.1394157409668, "global_step": 220564, "epoch": 1822} {"train_loss": -37.78547286987305, "global_step": 220565, "epoch": 1822} {"train_loss": -39.45918655395508, "global_step": 220566, "epoch": 1822} {"train_loss": -40.04450607299805, "global_step": 220567, "epoch": 1822} {"train_loss": -40.397300720214844, "global_step": 220568, "epoch": 1822} {"train_loss": -38.85658645629883, "global_step": 220569, "epoch": 1822} {"train_loss": -27.24183464050293, "global_step": 220570, "epoch": 1822} {"train_loss": -40.22785186767578, "global_step": 220571, "epoch": 1822} {"train_loss": -36.46001052856445, "global_step": 220572, "epoch": 1822} {"train_loss": -38.36196517944336, "global_step": 220573, "epoch": 1822} {"train_loss": -39.20884323120117, "global_step": 220574, "epoch": 1822} {"train_loss": -40.33925247192383, "global_step": 220575, "epoch": 1822} {"train_loss": -39.36526870727539, "global_step": 220576, "epoch": 1822} {"train_loss": -39.90125274658203, "global_step": 220577, "epoch": 1822} {"train_loss": -39.93012619018555, "global_step": 220578, "epoch": 1822} {"train_loss": -40.223060607910156, "global_step": 220579, "epoch": 1822} {"train_loss": -36.378456115722656, "global_step": 220580, "epoch": 1822} {"train_loss": -38.02335739135742, "global_step": 220581, "epoch": 1822} {"train_loss": -40.08583287956301, "global_step": 220582, "epoch": 1822, "val_loss": 2569776.75} {"train_loss": -36.27914047241211, "global_step": 220583, "epoch": 1823} {"train_loss": -41.54535675048828, "global_step": 220584, "epoch": 1823} {"train_loss": -40.61116409301758, "global_step": 220585, "epoch": 1823} {"train_loss": -36.67316436767578, "global_step": 220586, "epoch": 1823} {"train_loss": -39.58034896850586, "global_step": 220587, "epoch": 1823} {"train_loss": -38.929439544677734, "global_step": 220588, "epoch": 1823} {"train_loss": -38.503963470458984, "global_step": 220589, "epoch": 1823} {"train_loss": -39.2555046081543, "global_step": 220590, "epoch": 1823} {"train_loss": -38.953487396240234, "global_step": 220591, "epoch": 1823} {"train_loss": -36.677398681640625, "global_step": 220592, "epoch": 1823} {"train_loss": -39.51374435424805, "global_step": 220593, "epoch": 1823} {"train_loss": -37.83718490600586, "global_step": 220594, "epoch": 1823} {"train_loss": -38.7082405090332, "global_step": 220595, "epoch": 1823} {"train_loss": -36.129150390625, "global_step": 220596, "epoch": 1823} {"train_loss": -39.20382308959961, "global_step": 220597, "epoch": 1823} {"train_loss": -40.0395393371582, "global_step": 220598, "epoch": 1823} {"train_loss": -40.25640869140625, "global_step": 220599, "epoch": 1823} {"train_loss": -29.90650749206543, "global_step": 220600, "epoch": 1823} {"train_loss": -36.113380432128906, "global_step": 220601, "epoch": 1823} {"train_loss": -40.26470947265625, "global_step": 220602, "epoch": 1823} {"train_loss": -40.50974655151367, "global_step": 220603, "epoch": 1823} {"train_loss": -37.944091796875, "global_step": 220604, "epoch": 1823} {"train_loss": -37.27980422973633, "global_step": 220605, "epoch": 1823} {"train_loss": -39.68610382080078, "global_step": 220606, "epoch": 1823} {"train_loss": -39.11314010620117, "global_step": 220607, "epoch": 1823} {"train_loss": -38.75291061401367, "global_step": 220608, "epoch": 1823} {"train_loss": -40.23659896850586, "global_step": 220609, "epoch": 1823} {"train_loss": -39.35509490966797, "global_step": 220610, "epoch": 1823} {"train_loss": -40.37311553955078, "global_step": 220611, "epoch": 1823} {"train_loss": -39.947181701660156, "global_step": 220612, "epoch": 1823} {"train_loss": -40.24923324584961, "global_step": 220613, "epoch": 1823} {"train_loss": -40.23563766479492, "global_step": 220614, "epoch": 1823} {"train_loss": -40.393959045410156, "global_step": 220615, "epoch": 1823} {"train_loss": -39.53212356567383, "global_step": 220616, "epoch": 1823} {"train_loss": -38.88804244995117, "global_step": 220617, "epoch": 1823} {"train_loss": -41.71862030029297, "global_step": 220618, "epoch": 1823} {"train_loss": -40.51833724975586, "global_step": 220619, "epoch": 1823} {"train_loss": -40.92798614501953, "global_step": 220620, "epoch": 1823} {"train_loss": -40.65216827392578, "global_step": 220621, "epoch": 1823} {"train_loss": -40.219337463378906, "global_step": 220622, "epoch": 1823} {"train_loss": -41.24998092651367, "global_step": 220623, "epoch": 1823} {"train_loss": -40.536537170410156, "global_step": 220624, "epoch": 1823} {"train_loss": -41.457088470458984, "global_step": 220625, "epoch": 1823} {"train_loss": -41.70493698120117, "global_step": 220626, "epoch": 1823} {"train_loss": -40.78505325317383, "global_step": 220627, "epoch": 1823} {"train_loss": -41.55369186401367, "global_step": 220628, "epoch": 1823} {"train_loss": -41.22761154174805, "global_step": 220629, "epoch": 1823} {"train_loss": -41.364803314208984, "global_step": 220630, "epoch": 1823} {"train_loss": -41.43178939819336, "global_step": 220631, "epoch": 1823} {"train_loss": -41.418949127197266, "global_step": 220632, "epoch": 1823} {"train_loss": -41.6998405456543, "global_step": 220633, "epoch": 1823} {"train_loss": -42.03396987915039, "global_step": 220634, "epoch": 1823} {"train_loss": -41.922096252441406, "global_step": 220635, "epoch": 1823} {"train_loss": -41.89494705200195, "global_step": 220636, "epoch": 1823} {"train_loss": -41.7456169128418, "global_step": 220637, "epoch": 1823} {"train_loss": -41.908363342285156, "global_step": 220638, "epoch": 1823} {"train_loss": -42.3432731628418, "global_step": 220639, "epoch": 1823} {"train_loss": -42.160858154296875, "global_step": 220640, "epoch": 1823} {"train_loss": -42.62043380737305, "global_step": 220641, "epoch": 1823} {"train_loss": -42.372249603271484, "global_step": 220642, "epoch": 1823} {"train_loss": -42.04717254638672, "global_step": 220643, "epoch": 1823} {"train_loss": -42.216835021972656, "global_step": 220644, "epoch": 1823} {"train_loss": -42.51123046875, "global_step": 220645, "epoch": 1823} {"train_loss": -42.15664291381836, "global_step": 220646, "epoch": 1823} {"train_loss": -42.869834899902344, "global_step": 220647, "epoch": 1823} {"train_loss": -42.356380462646484, "global_step": 220648, "epoch": 1823} {"train_loss": -42.322120666503906, "global_step": 220649, "epoch": 1823} {"train_loss": -42.26479721069336, "global_step": 220650, "epoch": 1823} {"train_loss": -42.29688262939453, "global_step": 220651, "epoch": 1823} {"train_loss": -42.21944808959961, "global_step": 220652, "epoch": 1823} {"train_loss": -41.976112365722656, "global_step": 220653, "epoch": 1823} {"train_loss": -42.2321662902832, "global_step": 220654, "epoch": 1823} {"train_loss": -42.71391677856445, "global_step": 220655, "epoch": 1823} {"train_loss": -42.6699333190918, "global_step": 220656, "epoch": 1823} {"train_loss": -41.97216796875, "global_step": 220657, "epoch": 1823} {"train_loss": -42.804931640625, "global_step": 220658, "epoch": 1823} {"train_loss": -41.967098236083984, "global_step": 220659, "epoch": 1823} {"train_loss": -42.60200119018555, "global_step": 220660, "epoch": 1823} {"train_loss": -42.32061767578125, "global_step": 220661, "epoch": 1823} {"train_loss": -43.206947326660156, "global_step": 220662, "epoch": 1823} {"train_loss": -42.44831085205078, "global_step": 220663, "epoch": 1823} {"train_loss": -42.77432632446289, "global_step": 220664, "epoch": 1823} {"train_loss": -43.34963607788086, "global_step": 220665, "epoch": 1823} {"train_loss": -42.78857421875, "global_step": 220666, "epoch": 1823} {"train_loss": -42.88045883178711, "global_step": 220667, "epoch": 1823} {"train_loss": -42.453643798828125, "global_step": 220668, "epoch": 1823} {"train_loss": -42.37694549560547, "global_step": 220669, "epoch": 1823} {"train_loss": -42.91714096069336, "global_step": 220670, "epoch": 1823} {"train_loss": -43.34817123413086, "global_step": 220671, "epoch": 1823} {"train_loss": -43.09956741333008, "global_step": 220672, "epoch": 1823} {"train_loss": -42.79900360107422, "global_step": 220673, "epoch": 1823} {"train_loss": -42.6439094543457, "global_step": 220674, "epoch": 1823} {"train_loss": -42.19057846069336, "global_step": 220675, "epoch": 1823} {"train_loss": -42.01652145385742, "global_step": 220676, "epoch": 1823} {"train_loss": -42.3792610168457, "global_step": 220677, "epoch": 1823} {"train_loss": -43.07453536987305, "global_step": 220678, "epoch": 1823} {"train_loss": -43.122589111328125, "global_step": 220679, "epoch": 1823} {"train_loss": -41.04366683959961, "global_step": 220680, "epoch": 1823} {"train_loss": -42.3403434753418, "global_step": 220681, "epoch": 1823} {"train_loss": -42.723567962646484, "global_step": 220682, "epoch": 1823} {"train_loss": -40.95961380004883, "global_step": 220683, "epoch": 1823} {"train_loss": -42.338985443115234, "global_step": 220684, "epoch": 1823} {"train_loss": -42.64101791381836, "global_step": 220685, "epoch": 1823} {"train_loss": -40.04928207397461, "global_step": 220686, "epoch": 1823} {"train_loss": -41.28779220581055, "global_step": 220687, "epoch": 1823} {"train_loss": -42.27294921875, "global_step": 220688, "epoch": 1823} {"train_loss": -40.88459396362305, "global_step": 220689, "epoch": 1823} {"train_loss": -42.35687255859375, "global_step": 220690, "epoch": 1823} {"train_loss": -39.214900970458984, "global_step": 220691, "epoch": 1823} {"train_loss": -39.59891891479492, "global_step": 220692, "epoch": 1823} {"train_loss": -41.36882019042969, "global_step": 220693, "epoch": 1823} {"train_loss": -40.96753692626953, "global_step": 220694, "epoch": 1823} {"train_loss": -36.612266540527344, "global_step": 220695, "epoch": 1823} {"train_loss": -41.297393798828125, "global_step": 220696, "epoch": 1823} {"train_loss": -36.591346740722656, "global_step": 220697, "epoch": 1823} {"train_loss": -41.7554931640625, "global_step": 220698, "epoch": 1823} {"train_loss": -40.593963623046875, "global_step": 220699, "epoch": 1823} {"train_loss": -40.64936065673828, "global_step": 220700, "epoch": 1823} {"train_loss": -40.99730682373047, "global_step": 220701, "epoch": 1823} {"train_loss": -40.36012268066406, "global_step": 220702, "epoch": 1823} {"train_loss": -40.908520012847646, "global_step": 220703, "epoch": 1823, "val_loss": 2608622.25} {"train_loss": -40.28580856323242, "global_step": 220704, "epoch": 1824} {"train_loss": -41.110530853271484, "global_step": 220705, "epoch": 1824} {"train_loss": -41.5496711730957, "global_step": 220706, "epoch": 1824} {"train_loss": -40.5310173034668, "global_step": 220707, "epoch": 1824} {"train_loss": -41.58146286010742, "global_step": 220708, "epoch": 1824} {"train_loss": -41.702266693115234, "global_step": 220709, "epoch": 1824} {"train_loss": -39.93656539916992, "global_step": 220710, "epoch": 1824} {"train_loss": -41.36948776245117, "global_step": 220711, "epoch": 1824} {"train_loss": -38.12543487548828, "global_step": 220712, "epoch": 1824} {"train_loss": -40.06593704223633, "global_step": 220713, "epoch": 1824} {"train_loss": -39.93025588989258, "global_step": 220714, "epoch": 1824} {"train_loss": -41.08681869506836, "global_step": 220715, "epoch": 1824} {"train_loss": -40.254417419433594, "global_step": 220716, "epoch": 1824} {"train_loss": -39.39692306518555, "global_step": 220717, "epoch": 1824} {"train_loss": -40.369537353515625, "global_step": 220718, "epoch": 1824} {"train_loss": -41.47724533081055, "global_step": 220719, "epoch": 1824} {"train_loss": -39.50193405151367, "global_step": 220720, "epoch": 1824} {"train_loss": -38.14243698120117, "global_step": 220721, "epoch": 1824} {"train_loss": -41.024539947509766, "global_step": 220722, "epoch": 1824} {"train_loss": -40.587825775146484, "global_step": 220723, "epoch": 1824} {"train_loss": -40.171321868896484, "global_step": 220724, "epoch": 1824} {"train_loss": -40.794219970703125, "global_step": 220725, "epoch": 1824} {"train_loss": -40.0726318359375, "global_step": 220726, "epoch": 1824} {"train_loss": -42.12836837768555, "global_step": 220727, "epoch": 1824} {"train_loss": -40.04502487182617, "global_step": 220728, "epoch": 1824} {"train_loss": -41.4537467956543, "global_step": 220729, "epoch": 1824} {"train_loss": -38.96671676635742, "global_step": 220730, "epoch": 1824} {"train_loss": -39.51521301269531, "global_step": 220731, "epoch": 1824} {"train_loss": -41.22853469848633, "global_step": 220732, "epoch": 1824} {"train_loss": -39.0658073425293, "global_step": 220733, "epoch": 1824} {"train_loss": -40.03030776977539, "global_step": 220734, "epoch": 1824} {"train_loss": -40.55685043334961, "global_step": 220735, "epoch": 1824} {"train_loss": -39.623390197753906, "global_step": 220736, "epoch": 1824} {"train_loss": -42.112857818603516, "global_step": 220737, "epoch": 1824} {"train_loss": -40.58103561401367, "global_step": 220738, "epoch": 1824} {"train_loss": -41.015132904052734, "global_step": 220739, "epoch": 1824} {"train_loss": -40.82770919799805, "global_step": 220740, "epoch": 1824} {"train_loss": -40.081451416015625, "global_step": 220741, "epoch": 1824} {"train_loss": -42.393917083740234, "global_step": 220742, "epoch": 1824} {"train_loss": -40.781612396240234, "global_step": 220743, "epoch": 1824} {"train_loss": -42.26008224487305, "global_step": 220744, "epoch": 1824} {"train_loss": -41.157230377197266, "global_step": 220745, "epoch": 1824} {"train_loss": -41.324771881103516, "global_step": 220746, "epoch": 1824} {"train_loss": -41.22797393798828, "global_step": 220747, "epoch": 1824} {"train_loss": -41.958702087402344, "global_step": 220748, "epoch": 1824} {"train_loss": -40.865150451660156, "global_step": 220749, "epoch": 1824} {"train_loss": -42.07429504394531, "global_step": 220750, "epoch": 1824} {"train_loss": -41.14476013183594, "global_step": 220751, "epoch": 1824} {"train_loss": -41.73905563354492, "global_step": 220752, "epoch": 1824} {"train_loss": -41.23427963256836, "global_step": 220753, "epoch": 1824} {"train_loss": -42.209232330322266, "global_step": 220754, "epoch": 1824} {"train_loss": -41.957275390625, "global_step": 220755, "epoch": 1824} {"train_loss": -42.049957275390625, "global_step": 220756, "epoch": 1824} {"train_loss": -42.67162322998047, "global_step": 220757, "epoch": 1824} {"train_loss": -42.41887664794922, "global_step": 220758, "epoch": 1824} {"train_loss": -42.0993537902832, "global_step": 220759, "epoch": 1824} {"train_loss": -42.1010627746582, "global_step": 220760, "epoch": 1824} {"train_loss": -41.92345428466797, "global_step": 220761, "epoch": 1824} {"train_loss": -41.902992248535156, "global_step": 220762, "epoch": 1824} {"train_loss": -42.58652114868164, "global_step": 220763, "epoch": 1824} {"train_loss": -42.31046676635742, "global_step": 220764, "epoch": 1824} {"train_loss": -42.208961486816406, "global_step": 220765, "epoch": 1824} {"train_loss": -41.68724060058594, "global_step": 220766, "epoch": 1824} {"train_loss": -42.023956298828125, "global_step": 220767, "epoch": 1824} {"train_loss": -42.42049026489258, "global_step": 220768, "epoch": 1824} {"train_loss": -42.40668487548828, "global_step": 220769, "epoch": 1824} {"train_loss": -42.653289794921875, "global_step": 220770, "epoch": 1824} {"train_loss": -42.75389862060547, "global_step": 220771, "epoch": 1824} {"train_loss": -42.77000045776367, "global_step": 220772, "epoch": 1824} {"train_loss": -41.92734909057617, "global_step": 220773, "epoch": 1824} {"train_loss": -42.56007766723633, "global_step": 220774, "epoch": 1824} {"train_loss": -42.94038772583008, "global_step": 220775, "epoch": 1824} {"train_loss": -42.50754928588867, "global_step": 220776, "epoch": 1824} {"train_loss": -43.30259704589844, "global_step": 220777, "epoch": 1824} {"train_loss": -42.231380462646484, "global_step": 220778, "epoch": 1824} {"train_loss": -41.44588851928711, "global_step": 220779, "epoch": 1824} {"train_loss": -41.914093017578125, "global_step": 220780, "epoch": 1824} {"train_loss": -43.21236801147461, "global_step": 220781, "epoch": 1824} {"train_loss": -41.346195220947266, "global_step": 220782, "epoch": 1824} {"train_loss": -41.56428146362305, "global_step": 220783, "epoch": 1824} {"train_loss": -43.1248893737793, "global_step": 220784, "epoch": 1824} {"train_loss": -41.5837516784668, "global_step": 220785, "epoch": 1824} {"train_loss": -42.31116485595703, "global_step": 220786, "epoch": 1824} {"train_loss": -42.636444091796875, "global_step": 220787, "epoch": 1824} {"train_loss": -42.26527786254883, "global_step": 220788, "epoch": 1824} {"train_loss": -42.50251388549805, "global_step": 220789, "epoch": 1824} {"train_loss": -43.01823043823242, "global_step": 220790, "epoch": 1824} {"train_loss": -40.56317901611328, "global_step": 220791, "epoch": 1824} {"train_loss": -43.34529495239258, "global_step": 220792, "epoch": 1824} {"train_loss": -41.40976333618164, "global_step": 220793, "epoch": 1824} {"train_loss": -41.63657760620117, "global_step": 220794, "epoch": 1824} {"train_loss": -41.69572830200195, "global_step": 220795, "epoch": 1824} {"train_loss": -41.88943099975586, "global_step": 220796, "epoch": 1824} {"train_loss": -42.43172073364258, "global_step": 220797, "epoch": 1824} {"train_loss": -42.560611724853516, "global_step": 220798, "epoch": 1824} {"train_loss": -41.296356201171875, "global_step": 220799, "epoch": 1824} {"train_loss": -42.68915939331055, "global_step": 220800, "epoch": 1824} {"train_loss": -42.62003707885742, "global_step": 220801, "epoch": 1824} {"train_loss": -42.834449768066406, "global_step": 220802, "epoch": 1824} {"train_loss": -41.65999221801758, "global_step": 220803, "epoch": 1824} {"train_loss": -42.20367431640625, "global_step": 220804, "epoch": 1824} {"train_loss": -41.785675048828125, "global_step": 220805, "epoch": 1824} {"train_loss": -42.614463806152344, "global_step": 220806, "epoch": 1824} {"train_loss": -41.16880416870117, "global_step": 220807, "epoch": 1824} {"train_loss": -41.035709381103516, "global_step": 220808, "epoch": 1824} {"train_loss": -42.717620849609375, "global_step": 220809, "epoch": 1824} {"train_loss": -41.458255767822266, "global_step": 220810, "epoch": 1824} {"train_loss": -41.993141174316406, "global_step": 220811, "epoch": 1824} {"train_loss": -40.91748046875, "global_step": 220812, "epoch": 1824} {"train_loss": -42.281837463378906, "global_step": 220813, "epoch": 1824} {"train_loss": -42.035400390625, "global_step": 220814, "epoch": 1824} {"train_loss": -41.372528076171875, "global_step": 220815, "epoch": 1824} {"train_loss": -42.29140853881836, "global_step": 220816, "epoch": 1824} {"train_loss": -40.86619567871094, "global_step": 220817, "epoch": 1824} {"train_loss": -42.29754638671875, "global_step": 220818, "epoch": 1824} {"train_loss": -42.41485595703125, "global_step": 220819, "epoch": 1824} {"train_loss": -41.891441345214844, "global_step": 220820, "epoch": 1824} {"train_loss": -41.665592193603516, "global_step": 220821, "epoch": 1824} {"train_loss": -40.96156692504883, "global_step": 220822, "epoch": 1824} {"train_loss": -41.49068069458008, "global_step": 220823, "epoch": 1824} {"train_loss": -41.51960953011, "global_step": 220824, "epoch": 1824, "val_loss": 2612342.75} {"train_loss": -42.47101974487305, "global_step": 220825, "epoch": 1825} {"train_loss": -41.672569274902344, "global_step": 220826, "epoch": 1825} {"train_loss": -40.11309051513672, "global_step": 220827, "epoch": 1825} {"train_loss": -41.989131927490234, "global_step": 220828, "epoch": 1825} {"train_loss": -42.28120803833008, "global_step": 220829, "epoch": 1825} {"train_loss": -41.86008834838867, "global_step": 220830, "epoch": 1825} {"train_loss": -42.3886833190918, "global_step": 220831, "epoch": 1825} {"train_loss": -41.86439895629883, "global_step": 220832, "epoch": 1825} {"train_loss": -42.3792724609375, "global_step": 220833, "epoch": 1825} {"train_loss": -42.71616744995117, "global_step": 220834, "epoch": 1825} {"train_loss": -42.24261474609375, "global_step": 220835, "epoch": 1825} {"train_loss": -42.14198684692383, "global_step": 220836, "epoch": 1825} {"train_loss": -42.62531280517578, "global_step": 220837, "epoch": 1825} {"train_loss": -43.12483215332031, "global_step": 220838, "epoch": 1825} {"train_loss": -42.05572509765625, "global_step": 220839, "epoch": 1825} {"train_loss": -42.24782180786133, "global_step": 220840, "epoch": 1825} {"train_loss": -42.858428955078125, "global_step": 220841, "epoch": 1825} {"train_loss": -42.39274215698242, "global_step": 220842, "epoch": 1825} {"train_loss": -42.20972442626953, "global_step": 220843, "epoch": 1825} {"train_loss": -42.099422454833984, "global_step": 220844, "epoch": 1825} {"train_loss": -41.9843864440918, "global_step": 220845, "epoch": 1825} {"train_loss": -40.722923278808594, "global_step": 220846, "epoch": 1825} {"train_loss": -41.38530731201172, "global_step": 220847, "epoch": 1825} {"train_loss": -42.21865463256836, "global_step": 220848, "epoch": 1825} {"train_loss": -42.77395248413086, "global_step": 220849, "epoch": 1825} {"train_loss": -40.421966552734375, "global_step": 220850, "epoch": 1825} {"train_loss": -41.65788650512695, "global_step": 220851, "epoch": 1825} {"train_loss": -42.25138473510742, "global_step": 220852, "epoch": 1825} {"train_loss": -41.76428985595703, "global_step": 220853, "epoch": 1825} {"train_loss": -41.08660888671875, "global_step": 220854, "epoch": 1825} {"train_loss": -42.71433639526367, "global_step": 220855, "epoch": 1825} {"train_loss": -42.15393829345703, "global_step": 220856, "epoch": 1825} {"train_loss": -41.24717330932617, "global_step": 220857, "epoch": 1825} {"train_loss": -41.85931396484375, "global_step": 220858, "epoch": 1825} {"train_loss": -42.428932189941406, "global_step": 220859, "epoch": 1825} {"train_loss": -41.804012298583984, "global_step": 220860, "epoch": 1825} {"train_loss": -42.41689682006836, "global_step": 220861, "epoch": 1825} {"train_loss": -42.407020568847656, "global_step": 220862, "epoch": 1825} {"train_loss": -42.25045394897461, "global_step": 220863, "epoch": 1825} {"train_loss": -42.823909759521484, "global_step": 220864, "epoch": 1825} {"train_loss": -43.002193450927734, "global_step": 220865, "epoch": 1825} {"train_loss": -42.720035552978516, "global_step": 220866, "epoch": 1825} {"train_loss": -43.57410430908203, "global_step": 220867, "epoch": 1825} {"train_loss": -42.438270568847656, "global_step": 220868, "epoch": 1825} {"train_loss": -42.908912658691406, "global_step": 220869, "epoch": 1825} {"train_loss": -42.993839263916016, "global_step": 220870, "epoch": 1825} {"train_loss": -42.174461364746094, "global_step": 220871, "epoch": 1825} {"train_loss": -42.42811965942383, "global_step": 220872, "epoch": 1825} {"train_loss": -42.12508773803711, "global_step": 220873, "epoch": 1825} {"train_loss": -43.20745086669922, "global_step": 220874, "epoch": 1825} {"train_loss": -41.950748443603516, "global_step": 220875, "epoch": 1825} {"train_loss": -42.11507797241211, "global_step": 220876, "epoch": 1825} {"train_loss": -43.04974365234375, "global_step": 220877, "epoch": 1825} {"train_loss": -43.24785232543945, "global_step": 220878, "epoch": 1825} {"train_loss": -42.90430450439453, "global_step": 220879, "epoch": 1825} {"train_loss": -42.465476989746094, "global_step": 220880, "epoch": 1825} {"train_loss": -42.58051300048828, "global_step": 220881, "epoch": 1825} {"train_loss": -42.95337677001953, "global_step": 220882, "epoch": 1825} {"train_loss": -43.14931869506836, "global_step": 220883, "epoch": 1825} {"train_loss": -43.08537673950195, "global_step": 220884, "epoch": 1825} {"train_loss": -43.07755661010742, "global_step": 220885, "epoch": 1825} {"train_loss": -42.560997009277344, "global_step": 220886, "epoch": 1825} {"train_loss": -43.32271194458008, "global_step": 220887, "epoch": 1825} {"train_loss": -43.635528564453125, "global_step": 220888, "epoch": 1825} {"train_loss": -42.876529693603516, "global_step": 220889, "epoch": 1825} {"train_loss": -43.62491989135742, "global_step": 220890, "epoch": 1825} {"train_loss": -43.014400482177734, "global_step": 220891, "epoch": 1825} {"train_loss": -43.450191497802734, "global_step": 220892, "epoch": 1825} {"train_loss": -43.648963928222656, "global_step": 220893, "epoch": 1825} {"train_loss": -43.25572967529297, "global_step": 220894, "epoch": 1825} {"train_loss": -42.7858772277832, "global_step": 220895, "epoch": 1825} {"train_loss": -42.64602279663086, "global_step": 220896, "epoch": 1825} {"train_loss": -43.21725845336914, "global_step": 220897, "epoch": 1825} {"train_loss": -42.98926544189453, "global_step": 220898, "epoch": 1825} {"train_loss": -41.508419036865234, "global_step": 220899, "epoch": 1825} {"train_loss": -42.82869338989258, "global_step": 220900, "epoch": 1825} {"train_loss": -42.630104064941406, "global_step": 220901, "epoch": 1825} {"train_loss": -43.36552810668945, "global_step": 220902, "epoch": 1825} {"train_loss": -42.677093505859375, "global_step": 220903, "epoch": 1825} {"train_loss": -42.16252517700195, "global_step": 220904, "epoch": 1825} {"train_loss": -42.8247184753418, "global_step": 220905, "epoch": 1825} {"train_loss": -42.98849868774414, "global_step": 220906, "epoch": 1825} {"train_loss": -41.342872619628906, "global_step": 220907, "epoch": 1825} {"train_loss": -43.06490707397461, "global_step": 220908, "epoch": 1825} {"train_loss": -42.33084487915039, "global_step": 220909, "epoch": 1825} {"train_loss": -41.4189567565918, "global_step": 220910, "epoch": 1825} {"train_loss": -42.6615104675293, "global_step": 220911, "epoch": 1825} {"train_loss": -42.73189926147461, "global_step": 220912, "epoch": 1825} {"train_loss": -42.62539291381836, "global_step": 220913, "epoch": 1825} {"train_loss": -41.503692626953125, "global_step": 220914, "epoch": 1825} {"train_loss": -40.944496154785156, "global_step": 220915, "epoch": 1825} {"train_loss": -42.79970932006836, "global_step": 220916, "epoch": 1825} {"train_loss": -40.970550537109375, "global_step": 220917, "epoch": 1825} {"train_loss": -40.80169677734375, "global_step": 220918, "epoch": 1825} {"train_loss": -41.77525329589844, "global_step": 220919, "epoch": 1825} {"train_loss": -38.34773635864258, "global_step": 220920, "epoch": 1825} {"train_loss": -38.9576530456543, "global_step": 220921, "epoch": 1825} {"train_loss": -41.27851104736328, "global_step": 220922, "epoch": 1825} {"train_loss": -33.04360580444336, "global_step": 220923, "epoch": 1825} {"train_loss": -37.11522674560547, "global_step": 220924, "epoch": 1825} {"train_loss": -39.68599319458008, "global_step": 220925, "epoch": 1825} {"train_loss": -36.444549560546875, "global_step": 220926, "epoch": 1825} {"train_loss": -41.71232223510742, "global_step": 220927, "epoch": 1825} {"train_loss": -38.548805236816406, "global_step": 220928, "epoch": 1825} {"train_loss": -40.65998458862305, "global_step": 220929, "epoch": 1825} {"train_loss": -40.2234001159668, "global_step": 220930, "epoch": 1825} {"train_loss": -38.809349060058594, "global_step": 220931, "epoch": 1825} {"train_loss": -39.24560546875, "global_step": 220932, "epoch": 1825} {"train_loss": -41.18340301513672, "global_step": 220933, "epoch": 1825} {"train_loss": -39.882843017578125, "global_step": 220934, "epoch": 1825} {"train_loss": -40.995849609375, "global_step": 220935, "epoch": 1825} {"train_loss": -40.20986557006836, "global_step": 220936, "epoch": 1825} {"train_loss": -41.53678512573242, "global_step": 220937, "epoch": 1825} {"train_loss": -41.058074951171875, "global_step": 220938, "epoch": 1825} {"train_loss": -41.565860748291016, "global_step": 220939, "epoch": 1825} {"train_loss": -40.979496002197266, "global_step": 220940, "epoch": 1825} {"train_loss": -41.37540817260742, "global_step": 220941, "epoch": 1825} {"train_loss": -41.280338287353516, "global_step": 220942, "epoch": 1825} {"train_loss": -42.263397216796875, "global_step": 220943, "epoch": 1825} {"train_loss": -42.1036491394043, "global_step": 220944, "epoch": 1825} {"train_loss": -41.879780729940116, "global_step": 220945, "epoch": 1825, "val_loss": 2629210.75} {"train_loss": -42.35615158081055, "global_step": 220946, "epoch": 1826} {"train_loss": -42.4552116394043, "global_step": 220947, "epoch": 1826} {"train_loss": -42.125797271728516, "global_step": 220948, "epoch": 1826} {"train_loss": -42.29022216796875, "global_step": 220949, "epoch": 1826} {"train_loss": -41.58749008178711, "global_step": 220950, "epoch": 1826} {"train_loss": -42.05583572387695, "global_step": 220951, "epoch": 1826} {"train_loss": -42.65639877319336, "global_step": 220952, "epoch": 1826} {"train_loss": -41.841373443603516, "global_step": 220953, "epoch": 1826} {"train_loss": -42.09728240966797, "global_step": 220954, "epoch": 1826} {"train_loss": -42.72898483276367, "global_step": 220955, "epoch": 1826} {"train_loss": -42.785789489746094, "global_step": 220956, "epoch": 1826} {"train_loss": -42.39670944213867, "global_step": 220957, "epoch": 1826} {"train_loss": -41.631099700927734, "global_step": 220958, "epoch": 1826} {"train_loss": -41.645442962646484, "global_step": 220959, "epoch": 1826} {"train_loss": -42.8383674621582, "global_step": 220960, "epoch": 1826} {"train_loss": -42.342041015625, "global_step": 220961, "epoch": 1826} {"train_loss": -42.90847396850586, "global_step": 220962, "epoch": 1826} {"train_loss": -42.18404769897461, "global_step": 220963, "epoch": 1826} {"train_loss": -42.6372184753418, "global_step": 220964, "epoch": 1826} {"train_loss": -42.905250549316406, "global_step": 220965, "epoch": 1826} {"train_loss": -43.02482223510742, "global_step": 220966, "epoch": 1826} {"train_loss": -42.487098693847656, "global_step": 220967, "epoch": 1826} {"train_loss": -42.45465850830078, "global_step": 220968, "epoch": 1826} {"train_loss": -42.877586364746094, "global_step": 220969, "epoch": 1826} {"train_loss": -42.72970962524414, "global_step": 220970, "epoch": 1826} {"train_loss": -42.85331344604492, "global_step": 220971, "epoch": 1826} {"train_loss": -42.554744720458984, "global_step": 220972, "epoch": 1826} {"train_loss": -42.84904098510742, "global_step": 220973, "epoch": 1826} {"train_loss": -42.99407958984375, "global_step": 220974, "epoch": 1826} {"train_loss": -42.60665512084961, "global_step": 220975, "epoch": 1826} {"train_loss": -43.40631103515625, "global_step": 220976, "epoch": 1826} {"train_loss": -43.4872932434082, "global_step": 220977, "epoch": 1826} {"train_loss": -43.5973014831543, "global_step": 220978, "epoch": 1826} {"train_loss": -42.837799072265625, "global_step": 220979, "epoch": 1826} {"train_loss": -43.093299865722656, "global_step": 220980, "epoch": 1826} {"train_loss": -42.8853645324707, "global_step": 220981, "epoch": 1826} {"train_loss": -43.168418884277344, "global_step": 220982, "epoch": 1826} {"train_loss": -43.15033721923828, "global_step": 220983, "epoch": 1826} {"train_loss": -43.1968879699707, "global_step": 220984, "epoch": 1826} {"train_loss": -43.95881271362305, "global_step": 220985, "epoch": 1826} {"train_loss": -43.007667541503906, "global_step": 220986, "epoch": 1826} {"train_loss": -42.82514190673828, "global_step": 220987, "epoch": 1826} {"train_loss": -42.180908203125, "global_step": 220988, "epoch": 1826} {"train_loss": -42.18769073486328, "global_step": 220989, "epoch": 1826} {"train_loss": -42.936893463134766, "global_step": 220990, "epoch": 1826} {"train_loss": -43.152748107910156, "global_step": 220991, "epoch": 1826} {"train_loss": -43.46320343017578, "global_step": 220992, "epoch": 1826} {"train_loss": -43.30125045776367, "global_step": 220993, "epoch": 1826} {"train_loss": -42.954864501953125, "global_step": 220994, "epoch": 1826} {"train_loss": -43.53156661987305, "global_step": 220995, "epoch": 1826} {"train_loss": -42.34061813354492, "global_step": 220996, "epoch": 1826} {"train_loss": -42.40857696533203, "global_step": 220997, "epoch": 1826} {"train_loss": -42.949947357177734, "global_step": 220998, "epoch": 1826} {"train_loss": -43.10606002807617, "global_step": 220999, "epoch": 1826} {"train_loss": -42.355438232421875, "global_step": 221000, "epoch": 1826} {"train_loss": -42.373756408691406, "global_step": 221001, "epoch": 1826} {"train_loss": -42.6497917175293, "global_step": 221002, "epoch": 1826} {"train_loss": -42.03120040893555, "global_step": 221003, "epoch": 1826} {"train_loss": -41.42649459838867, "global_step": 221004, "epoch": 1826} {"train_loss": -42.35630416870117, "global_step": 221005, "epoch": 1826} {"train_loss": -42.852840423583984, "global_step": 221006, "epoch": 1826} {"train_loss": -41.57833480834961, "global_step": 221007, "epoch": 1826} {"train_loss": -41.90001678466797, "global_step": 221008, "epoch": 1826} {"train_loss": -43.139381408691406, "global_step": 221009, "epoch": 1826} {"train_loss": -41.61997604370117, "global_step": 221010, "epoch": 1826} {"train_loss": -41.4842643737793, "global_step": 221011, "epoch": 1826} {"train_loss": -43.39925765991211, "global_step": 221012, "epoch": 1826} {"train_loss": -42.87826919555664, "global_step": 221013, "epoch": 1826} {"train_loss": -42.43082809448242, "global_step": 221014, "epoch": 1826} {"train_loss": -41.641109466552734, "global_step": 221015, "epoch": 1826} {"train_loss": -42.056400299072266, "global_step": 221016, "epoch": 1826} {"train_loss": -41.6822509765625, "global_step": 221017, "epoch": 1826} {"train_loss": -39.722740173339844, "global_step": 221018, "epoch": 1826} {"train_loss": -42.47233200073242, "global_step": 221019, "epoch": 1826} {"train_loss": -38.1113166809082, "global_step": 221020, "epoch": 1826} {"train_loss": -39.57863998413086, "global_step": 221021, "epoch": 1826} {"train_loss": -36.32406234741211, "global_step": 221022, "epoch": 1826} {"train_loss": -31.443603515625, "global_step": 221023, "epoch": 1826} {"train_loss": -35.476661682128906, "global_step": 221024, "epoch": 1826} {"train_loss": -35.92024612426758, "global_step": 221025, "epoch": 1826} {"train_loss": -33.2124137878418, "global_step": 221026, "epoch": 1826} {"train_loss": -33.244747161865234, "global_step": 221027, "epoch": 1826} {"train_loss": -40.93291091918945, "global_step": 221028, "epoch": 1826} {"train_loss": -38.72638702392578, "global_step": 221029, "epoch": 1826} {"train_loss": -40.45118713378906, "global_step": 221030, "epoch": 1826} {"train_loss": -41.26177978515625, "global_step": 221031, "epoch": 1826} {"train_loss": -41.14557647705078, "global_step": 221032, "epoch": 1826} {"train_loss": -40.27802276611328, "global_step": 221033, "epoch": 1826} {"train_loss": -41.5237922668457, "global_step": 221034, "epoch": 1826} {"train_loss": -40.73659133911133, "global_step": 221035, "epoch": 1826} {"train_loss": -40.47916030883789, "global_step": 221036, "epoch": 1826} {"train_loss": -40.69868087768555, "global_step": 221037, "epoch": 1826} {"train_loss": -41.287967681884766, "global_step": 221038, "epoch": 1826} {"train_loss": -40.33754348754883, "global_step": 221039, "epoch": 1826} {"train_loss": -41.614166259765625, "global_step": 221040, "epoch": 1826} {"train_loss": -40.52241897583008, "global_step": 221041, "epoch": 1826} {"train_loss": -41.28664779663086, "global_step": 221042, "epoch": 1826} {"train_loss": -41.209800720214844, "global_step": 221043, "epoch": 1826} {"train_loss": -41.521278381347656, "global_step": 221044, "epoch": 1826} {"train_loss": -41.40839767456055, "global_step": 221045, "epoch": 1826} {"train_loss": -41.75651931762695, "global_step": 221046, "epoch": 1826} {"train_loss": -41.689971923828125, "global_step": 221047, "epoch": 1826} {"train_loss": -42.4066162109375, "global_step": 221048, "epoch": 1826} {"train_loss": -41.457847595214844, "global_step": 221049, "epoch": 1826} {"train_loss": -41.970802307128906, "global_step": 221050, "epoch": 1826} {"train_loss": -42.190853118896484, "global_step": 221051, "epoch": 1826} {"train_loss": -42.01499938964844, "global_step": 221052, "epoch": 1826} {"train_loss": -42.433650970458984, "global_step": 221053, "epoch": 1826} {"train_loss": -41.858978271484375, "global_step": 221054, "epoch": 1826} {"train_loss": -42.120361328125, "global_step": 221055, "epoch": 1826} {"train_loss": -42.06732940673828, "global_step": 221056, "epoch": 1826} {"train_loss": -42.08085250854492, "global_step": 221057, "epoch": 1826} {"train_loss": -41.77881622314453, "global_step": 221058, "epoch": 1826} {"train_loss": -42.13142776489258, "global_step": 221059, "epoch": 1826} {"train_loss": -42.294185638427734, "global_step": 221060, "epoch": 1826} {"train_loss": -42.39530944824219, "global_step": 221061, "epoch": 1826} {"train_loss": -42.40965270996094, "global_step": 221062, "epoch": 1826} {"train_loss": -42.70058822631836, "global_step": 221063, "epoch": 1826} {"train_loss": -42.59494400024414, "global_step": 221064, "epoch": 1826} {"train_loss": -43.02555465698242, "global_step": 221065, "epoch": 1826} {"train_loss": -41.76456697322121, "global_step": 221066, "epoch": 1826, "val_loss": 2591782.0} {"train_loss": -43.197322845458984, "global_step": 221067, "epoch": 1827} {"train_loss": -42.638710021972656, "global_step": 221068, "epoch": 1827} {"train_loss": -43.46101760864258, "global_step": 221069, "epoch": 1827} {"train_loss": -43.44762420654297, "global_step": 221070, "epoch": 1827} {"train_loss": -43.244441986083984, "global_step": 221071, "epoch": 1827} {"train_loss": -43.00635528564453, "global_step": 221072, "epoch": 1827} {"train_loss": -43.020111083984375, "global_step": 221073, "epoch": 1827} {"train_loss": -43.70665740966797, "global_step": 221074, "epoch": 1827} {"train_loss": -42.81132888793945, "global_step": 221075, "epoch": 1827} {"train_loss": -43.06843948364258, "global_step": 221076, "epoch": 1827} {"train_loss": -42.65408706665039, "global_step": 221077, "epoch": 1827} {"train_loss": -43.6557731628418, "global_step": 221078, "epoch": 1827} {"train_loss": -43.314510345458984, "global_step": 221079, "epoch": 1827} {"train_loss": -43.237403869628906, "global_step": 221080, "epoch": 1827} {"train_loss": -43.636898040771484, "global_step": 221081, "epoch": 1827} {"train_loss": -43.40861892700195, "global_step": 221082, "epoch": 1827} {"train_loss": -43.31471633911133, "global_step": 221083, "epoch": 1827} {"train_loss": -43.54385757446289, "global_step": 221084, "epoch": 1827} {"train_loss": -42.62165451049805, "global_step": 221085, "epoch": 1827} {"train_loss": -43.33697509765625, "global_step": 221086, "epoch": 1827} {"train_loss": -43.66495132446289, "global_step": 221087, "epoch": 1827} {"train_loss": -43.22699737548828, "global_step": 221088, "epoch": 1827} {"train_loss": -43.803672790527344, "global_step": 221089, "epoch": 1827} {"train_loss": -42.91182327270508, "global_step": 221090, "epoch": 1827} {"train_loss": -42.66851806640625, "global_step": 221091, "epoch": 1827} {"train_loss": -43.01072311401367, "global_step": 221092, "epoch": 1827} {"train_loss": -43.077369689941406, "global_step": 221093, "epoch": 1827} {"train_loss": -42.37272262573242, "global_step": 221094, "epoch": 1827} {"train_loss": -43.40645217895508, "global_step": 221095, "epoch": 1827} {"train_loss": -41.31525802612305, "global_step": 221096, "epoch": 1827} {"train_loss": -43.11368942260742, "global_step": 221097, "epoch": 1827} {"train_loss": -43.089195251464844, "global_step": 221098, "epoch": 1827} {"train_loss": -43.02298355102539, "global_step": 221099, "epoch": 1827} {"train_loss": -42.02577590942383, "global_step": 221100, "epoch": 1827} {"train_loss": -41.58576583862305, "global_step": 221101, "epoch": 1827} {"train_loss": -43.29793167114258, "global_step": 221102, "epoch": 1827} {"train_loss": -43.47570037841797, "global_step": 221103, "epoch": 1827} {"train_loss": -42.676780700683594, "global_step": 221104, "epoch": 1827} {"train_loss": -42.342140197753906, "global_step": 221105, "epoch": 1827} {"train_loss": -43.70454788208008, "global_step": 221106, "epoch": 1827} {"train_loss": -42.161563873291016, "global_step": 221107, "epoch": 1827} {"train_loss": -40.54874801635742, "global_step": 221108, "epoch": 1827} {"train_loss": -42.8437614440918, "global_step": 221109, "epoch": 1827} {"train_loss": -41.47723388671875, "global_step": 221110, "epoch": 1827} {"train_loss": -41.5157585144043, "global_step": 221111, "epoch": 1827} {"train_loss": -42.927059173583984, "global_step": 221112, "epoch": 1827} {"train_loss": -41.510433197021484, "global_step": 221113, "epoch": 1827} {"train_loss": -39.513702392578125, "global_step": 221114, "epoch": 1827} {"train_loss": -42.36870193481445, "global_step": 221115, "epoch": 1827} {"train_loss": -39.79622268676758, "global_step": 221116, "epoch": 1827} {"train_loss": -42.03017807006836, "global_step": 221117, "epoch": 1827} {"train_loss": -41.674930572509766, "global_step": 221118, "epoch": 1827} {"train_loss": -42.065467834472656, "global_step": 221119, "epoch": 1827} {"train_loss": -42.94453048706055, "global_step": 221120, "epoch": 1827} {"train_loss": -41.33559799194336, "global_step": 221121, "epoch": 1827} {"train_loss": -42.509918212890625, "global_step": 221122, "epoch": 1827} {"train_loss": -42.805572509765625, "global_step": 221123, "epoch": 1827} {"train_loss": -42.558082580566406, "global_step": 221124, "epoch": 1827} {"train_loss": -41.15087890625, "global_step": 221125, "epoch": 1827} {"train_loss": -43.0876579284668, "global_step": 221126, "epoch": 1827} {"train_loss": -42.30208206176758, "global_step": 221127, "epoch": 1827} {"train_loss": -41.25814437866211, "global_step": 221128, "epoch": 1827} {"train_loss": -41.32941436767578, "global_step": 221129, "epoch": 1827} {"train_loss": -42.20866012573242, "global_step": 221130, "epoch": 1827} {"train_loss": -40.67607498168945, "global_step": 221131, "epoch": 1827} {"train_loss": -40.57854461669922, "global_step": 221132, "epoch": 1827} {"train_loss": -42.221710205078125, "global_step": 221133, "epoch": 1827} {"train_loss": -39.784488677978516, "global_step": 221134, "epoch": 1827} {"train_loss": -41.45060348510742, "global_step": 221135, "epoch": 1827} {"train_loss": -41.514801025390625, "global_step": 221136, "epoch": 1827} {"train_loss": -42.310081481933594, "global_step": 221137, "epoch": 1827} {"train_loss": -42.699119567871094, "global_step": 221138, "epoch": 1827} {"train_loss": -41.471370697021484, "global_step": 221139, "epoch": 1827} {"train_loss": -42.17030715942383, "global_step": 221140, "epoch": 1827} {"train_loss": -40.785823822021484, "global_step": 221141, "epoch": 1827} {"train_loss": -41.76109313964844, "global_step": 221142, "epoch": 1827} {"train_loss": -41.86931228637695, "global_step": 221143, "epoch": 1827} {"train_loss": -39.7796745300293, "global_step": 221144, "epoch": 1827} {"train_loss": -41.921051025390625, "global_step": 221145, "epoch": 1827} {"train_loss": -40.71984100341797, "global_step": 221146, "epoch": 1827} {"train_loss": -42.056556701660156, "global_step": 221147, "epoch": 1827} {"train_loss": -41.412227630615234, "global_step": 221148, "epoch": 1827} {"train_loss": -41.921512603759766, "global_step": 221149, "epoch": 1827} {"train_loss": -41.35591506958008, "global_step": 221150, "epoch": 1827} {"train_loss": -41.31915283203125, "global_step": 221151, "epoch": 1827} {"train_loss": -42.126708984375, "global_step": 221152, "epoch": 1827} {"train_loss": -41.20038604736328, "global_step": 221153, "epoch": 1827} {"train_loss": -41.73032760620117, "global_step": 221154, "epoch": 1827} {"train_loss": -42.48604965209961, "global_step": 221155, "epoch": 1827} {"train_loss": -42.096221923828125, "global_step": 221156, "epoch": 1827} {"train_loss": -42.88944625854492, "global_step": 221157, "epoch": 1827} {"train_loss": -42.302894592285156, "global_step": 221158, "epoch": 1827} {"train_loss": -41.653289794921875, "global_step": 221159, "epoch": 1827} {"train_loss": -42.176513671875, "global_step": 221160, "epoch": 1827} {"train_loss": -42.4664421081543, "global_step": 221161, "epoch": 1827} {"train_loss": -41.06412124633789, "global_step": 221162, "epoch": 1827} {"train_loss": -42.62492752075195, "global_step": 221163, "epoch": 1827} {"train_loss": -42.12919998168945, "global_step": 221164, "epoch": 1827} {"train_loss": -42.24042510986328, "global_step": 221165, "epoch": 1827} {"train_loss": -41.98431396484375, "global_step": 221166, "epoch": 1827} {"train_loss": -41.97446823120117, "global_step": 221167, "epoch": 1827} {"train_loss": -41.53940200805664, "global_step": 221168, "epoch": 1827} {"train_loss": -42.5672607421875, "global_step": 221169, "epoch": 1827} {"train_loss": -42.20402908325195, "global_step": 221170, "epoch": 1827} {"train_loss": -42.6882209777832, "global_step": 221171, "epoch": 1827} {"train_loss": -42.33519744873047, "global_step": 221172, "epoch": 1827} {"train_loss": -42.595638275146484, "global_step": 221173, "epoch": 1827} {"train_loss": -43.010738372802734, "global_step": 221174, "epoch": 1827} {"train_loss": -42.980186462402344, "global_step": 221175, "epoch": 1827} {"train_loss": -42.73478317260742, "global_step": 221176, "epoch": 1827} {"train_loss": -42.81705856323242, "global_step": 221177, "epoch": 1827} {"train_loss": -42.87774658203125, "global_step": 221178, "epoch": 1827} {"train_loss": -42.97589111328125, "global_step": 221179, "epoch": 1827} {"train_loss": -43.450191497802734, "global_step": 221180, "epoch": 1827} {"train_loss": -43.183589935302734, "global_step": 221181, "epoch": 1827} {"train_loss": -43.10051345825195, "global_step": 221182, "epoch": 1827} {"train_loss": -42.9178581237793, "global_step": 221183, "epoch": 1827} {"train_loss": -43.393672943115234, "global_step": 221184, "epoch": 1827} {"train_loss": -43.12506866455078, "global_step": 221185, "epoch": 1827} {"train_loss": -43.300865173339844, "global_step": 221186, "epoch": 1827} {"train_loss": -42.35600230319441, "global_step": 221187, "epoch": 1827, "val_loss": 2620856.25} {"train_loss": -42.72553634643555, "global_step": 221188, "epoch": 1828} {"train_loss": -42.603267669677734, "global_step": 221189, "epoch": 1828} {"train_loss": -42.6971321105957, "global_step": 221190, "epoch": 1828} {"train_loss": -43.09798812866211, "global_step": 221191, "epoch": 1828} {"train_loss": -43.59682083129883, "global_step": 221192, "epoch": 1828} {"train_loss": -42.16043472290039, "global_step": 221193, "epoch": 1828} {"train_loss": -40.373809814453125, "global_step": 221194, "epoch": 1828} {"train_loss": -40.36406326293945, "global_step": 221195, "epoch": 1828} {"train_loss": -42.499977111816406, "global_step": 221196, "epoch": 1828} {"train_loss": -42.85969161987305, "global_step": 221197, "epoch": 1828} {"train_loss": -41.792449951171875, "global_step": 221198, "epoch": 1828} {"train_loss": -40.46698760986328, "global_step": 221199, "epoch": 1828} {"train_loss": -41.1685791015625, "global_step": 221200, "epoch": 1828} {"train_loss": -42.68003463745117, "global_step": 221201, "epoch": 1828} {"train_loss": -41.21077346801758, "global_step": 221202, "epoch": 1828} {"train_loss": -40.78984451293945, "global_step": 221203, "epoch": 1828} {"train_loss": -42.38857650756836, "global_step": 221204, "epoch": 1828} {"train_loss": -39.50956344604492, "global_step": 221205, "epoch": 1828} {"train_loss": -41.4851188659668, "global_step": 221206, "epoch": 1828} {"train_loss": -38.51288986206055, "global_step": 221207, "epoch": 1828} {"train_loss": -39.91770553588867, "global_step": 221208, "epoch": 1828} {"train_loss": -42.275840759277344, "global_step": 221209, "epoch": 1828} {"train_loss": -41.3730583190918, "global_step": 221210, "epoch": 1828} {"train_loss": -39.602108001708984, "global_step": 221211, "epoch": 1828} {"train_loss": -41.04548263549805, "global_step": 221212, "epoch": 1828} {"train_loss": -41.819278717041016, "global_step": 221213, "epoch": 1828} {"train_loss": -39.66106414794922, "global_step": 221214, "epoch": 1828} {"train_loss": -41.535888671875, "global_step": 221215, "epoch": 1828} {"train_loss": -42.64297866821289, "global_step": 221216, "epoch": 1828} {"train_loss": -40.53534698486328, "global_step": 221217, "epoch": 1828} {"train_loss": -41.45404052734375, "global_step": 221218, "epoch": 1828} {"train_loss": -42.32627487182617, "global_step": 221219, "epoch": 1828} {"train_loss": -40.55115509033203, "global_step": 221220, "epoch": 1828} {"train_loss": -42.78157424926758, "global_step": 221221, "epoch": 1828} {"train_loss": -41.167144775390625, "global_step": 221222, "epoch": 1828} {"train_loss": -41.8272819519043, "global_step": 221223, "epoch": 1828} {"train_loss": -41.341732025146484, "global_step": 221224, "epoch": 1828} {"train_loss": -39.8637580871582, "global_step": 221225, "epoch": 1828} {"train_loss": -40.97488021850586, "global_step": 221226, "epoch": 1828} {"train_loss": -41.88676071166992, "global_step": 221227, "epoch": 1828} {"train_loss": -43.021766662597656, "global_step": 221228, "epoch": 1828} {"train_loss": -42.3038444519043, "global_step": 221229, "epoch": 1828} {"train_loss": -39.74997329711914, "global_step": 221230, "epoch": 1828} {"train_loss": -41.18445587158203, "global_step": 221231, "epoch": 1828} {"train_loss": -42.753292083740234, "global_step": 221232, "epoch": 1828} {"train_loss": -42.488258361816406, "global_step": 221233, "epoch": 1828} {"train_loss": -41.7057991027832, "global_step": 221234, "epoch": 1828} {"train_loss": -41.795989990234375, "global_step": 221235, "epoch": 1828} {"train_loss": -42.65798568725586, "global_step": 221236, "epoch": 1828} {"train_loss": -39.866031646728516, "global_step": 221237, "epoch": 1828} {"train_loss": -41.399574279785156, "global_step": 221238, "epoch": 1828} {"train_loss": -40.940853118896484, "global_step": 221239, "epoch": 1828} {"train_loss": -39.108253479003906, "global_step": 221240, "epoch": 1828} {"train_loss": -42.230289459228516, "global_step": 221241, "epoch": 1828} {"train_loss": -40.35497283935547, "global_step": 221242, "epoch": 1828} {"train_loss": -39.56632614135742, "global_step": 221243, "epoch": 1828} {"train_loss": -42.582767486572266, "global_step": 221244, "epoch": 1828} {"train_loss": -38.23468017578125, "global_step": 221245, "epoch": 1828} {"train_loss": -37.72636795043945, "global_step": 221246, "epoch": 1828} {"train_loss": -38.681922912597656, "global_step": 221247, "epoch": 1828} {"train_loss": -38.3586540222168, "global_step": 221248, "epoch": 1828} {"train_loss": -39.112220764160156, "global_step": 221249, "epoch": 1828} {"train_loss": -41.05623245239258, "global_step": 221250, "epoch": 1828} {"train_loss": -40.34825134277344, "global_step": 221251, "epoch": 1828} {"train_loss": -40.083961486816406, "global_step": 221252, "epoch": 1828} {"train_loss": -40.22040939331055, "global_step": 221253, "epoch": 1828} {"train_loss": -41.475582122802734, "global_step": 221254, "epoch": 1828} {"train_loss": -41.44704055786133, "global_step": 221255, "epoch": 1828} {"train_loss": -40.714691162109375, "global_step": 221256, "epoch": 1828} {"train_loss": -41.98320388793945, "global_step": 221257, "epoch": 1828} {"train_loss": -40.15636444091797, "global_step": 221258, "epoch": 1828} {"train_loss": -40.80126953125, "global_step": 221259, "epoch": 1828} {"train_loss": -41.180641174316406, "global_step": 221260, "epoch": 1828} {"train_loss": -42.2351188659668, "global_step": 221261, "epoch": 1828} {"train_loss": -42.35968780517578, "global_step": 221262, "epoch": 1828} {"train_loss": -41.36058044433594, "global_step": 221263, "epoch": 1828} {"train_loss": -42.91105270385742, "global_step": 221264, "epoch": 1828} {"train_loss": -42.0521125793457, "global_step": 221265, "epoch": 1828} {"train_loss": -42.42217254638672, "global_step": 221266, "epoch": 1828} {"train_loss": -42.21078109741211, "global_step": 221267, "epoch": 1828} {"train_loss": -41.68906784057617, "global_step": 221268, "epoch": 1828} {"train_loss": -42.78086471557617, "global_step": 221269, "epoch": 1828} {"train_loss": -42.39177322387695, "global_step": 221270, "epoch": 1828} {"train_loss": -41.61738204956055, "global_step": 221271, "epoch": 1828} {"train_loss": -42.227394104003906, "global_step": 221272, "epoch": 1828} {"train_loss": -42.899932861328125, "global_step": 221273, "epoch": 1828} {"train_loss": -42.475215911865234, "global_step": 221274, "epoch": 1828} {"train_loss": -42.613426208496094, "global_step": 221275, "epoch": 1828} {"train_loss": -43.052974700927734, "global_step": 221276, "epoch": 1828} {"train_loss": -42.68086624145508, "global_step": 221277, "epoch": 1828} {"train_loss": -43.00764465332031, "global_step": 221278, "epoch": 1828} {"train_loss": -42.1833381652832, "global_step": 221279, "epoch": 1828} {"train_loss": -43.41799545288086, "global_step": 221280, "epoch": 1828} {"train_loss": -42.196414947509766, "global_step": 221281, "epoch": 1828} {"train_loss": -42.9493522644043, "global_step": 221282, "epoch": 1828} {"train_loss": -42.516815185546875, "global_step": 221283, "epoch": 1828} {"train_loss": -43.008949279785156, "global_step": 221284, "epoch": 1828} {"train_loss": -42.8338623046875, "global_step": 221285, "epoch": 1828} {"train_loss": -42.70414733886719, "global_step": 221286, "epoch": 1828} {"train_loss": -42.822479248046875, "global_step": 221287, "epoch": 1828} {"train_loss": -43.31913375854492, "global_step": 221288, "epoch": 1828} {"train_loss": -42.992183685302734, "global_step": 221289, "epoch": 1828} {"train_loss": -42.69211196899414, "global_step": 221290, "epoch": 1828} {"train_loss": -42.999935150146484, "global_step": 221291, "epoch": 1828} {"train_loss": -43.12017822265625, "global_step": 221292, "epoch": 1828} {"train_loss": -42.613887786865234, "global_step": 221293, "epoch": 1828} {"train_loss": -43.090858459472656, "global_step": 221294, "epoch": 1828} {"train_loss": -42.668331146240234, "global_step": 221295, "epoch": 1828} {"train_loss": -42.765010833740234, "global_step": 221296, "epoch": 1828} {"train_loss": -43.346763610839844, "global_step": 221297, "epoch": 1828} {"train_loss": -42.996463775634766, "global_step": 221298, "epoch": 1828} {"train_loss": -42.6335563659668, "global_step": 221299, "epoch": 1828} {"train_loss": -43.40752029418945, "global_step": 221300, "epoch": 1828} {"train_loss": -42.59469223022461, "global_step": 221301, "epoch": 1828} {"train_loss": -42.65760803222656, "global_step": 221302, "epoch": 1828} {"train_loss": -41.981658935546875, "global_step": 221303, "epoch": 1828} {"train_loss": -41.2740364074707, "global_step": 221304, "epoch": 1828} {"train_loss": -41.35976791381836, "global_step": 221305, "epoch": 1828} {"train_loss": -42.84354782104492, "global_step": 221306, "epoch": 1828} {"train_loss": -41.47730255126953, "global_step": 221307, "epoch": 1828} {"train_loss": -41.68349214033647, "global_step": 221308, "epoch": 1828, "val_loss": 2561122.25} {"train_loss": -40.56411361694336, "global_step": 221309, "epoch": 1829} {"train_loss": -42.26359176635742, "global_step": 221310, "epoch": 1829} {"train_loss": -39.52881622314453, "global_step": 221311, "epoch": 1829} {"train_loss": -42.89350509643555, "global_step": 221312, "epoch": 1829} {"train_loss": -40.3765983581543, "global_step": 221313, "epoch": 1829} {"train_loss": -42.16029739379883, "global_step": 221314, "epoch": 1829} {"train_loss": -40.92441940307617, "global_step": 221315, "epoch": 1829} {"train_loss": -40.880096435546875, "global_step": 221316, "epoch": 1829} {"train_loss": -42.27614974975586, "global_step": 221317, "epoch": 1829} {"train_loss": -41.78457260131836, "global_step": 221318, "epoch": 1829} {"train_loss": -40.50430679321289, "global_step": 221319, "epoch": 1829} {"train_loss": -42.92063522338867, "global_step": 221320, "epoch": 1829} {"train_loss": -40.653377532958984, "global_step": 221321, "epoch": 1829} {"train_loss": -40.71335983276367, "global_step": 221322, "epoch": 1829} {"train_loss": -41.685272216796875, "global_step": 221323, "epoch": 1829} {"train_loss": -41.70156478881836, "global_step": 221324, "epoch": 1829} {"train_loss": -41.791622161865234, "global_step": 221325, "epoch": 1829} {"train_loss": -41.3511848449707, "global_step": 221326, "epoch": 1829} {"train_loss": -39.39704513549805, "global_step": 221327, "epoch": 1829} {"train_loss": -41.6198616027832, "global_step": 221328, "epoch": 1829} {"train_loss": -40.8423957824707, "global_step": 221329, "epoch": 1829} {"train_loss": -41.90505599975586, "global_step": 221330, "epoch": 1829} {"train_loss": -39.50641632080078, "global_step": 221331, "epoch": 1829} {"train_loss": -43.144287109375, "global_step": 221332, "epoch": 1829} {"train_loss": -39.017452239990234, "global_step": 221333, "epoch": 1829} {"train_loss": -41.7043342590332, "global_step": 221334, "epoch": 1829} {"train_loss": -40.60039520263672, "global_step": 221335, "epoch": 1829} {"train_loss": -41.3657341003418, "global_step": 221336, "epoch": 1829} {"train_loss": -41.536109924316406, "global_step": 221337, "epoch": 1829} {"train_loss": -41.05428695678711, "global_step": 221338, "epoch": 1829} {"train_loss": -40.783748626708984, "global_step": 221339, "epoch": 1829} {"train_loss": -42.57951354980469, "global_step": 221340, "epoch": 1829} {"train_loss": -40.276790618896484, "global_step": 221341, "epoch": 1829} {"train_loss": -42.45819091796875, "global_step": 221342, "epoch": 1829} {"train_loss": -40.6175422668457, "global_step": 221343, "epoch": 1829} {"train_loss": -42.0763053894043, "global_step": 221344, "epoch": 1829} {"train_loss": -41.42792510986328, "global_step": 221345, "epoch": 1829} {"train_loss": -41.99496078491211, "global_step": 221346, "epoch": 1829} {"train_loss": -41.92973327636719, "global_step": 221347, "epoch": 1829} {"train_loss": -42.90554428100586, "global_step": 221348, "epoch": 1829} {"train_loss": -41.823341369628906, "global_step": 221349, "epoch": 1829} {"train_loss": -42.70115280151367, "global_step": 221350, "epoch": 1829} {"train_loss": -42.37947463989258, "global_step": 221351, "epoch": 1829} {"train_loss": -42.3511848449707, "global_step": 221352, "epoch": 1829} {"train_loss": -42.449275970458984, "global_step": 221353, "epoch": 1829} {"train_loss": -42.516727447509766, "global_step": 221354, "epoch": 1829} {"train_loss": -42.3836669921875, "global_step": 221355, "epoch": 1829} {"train_loss": -42.50984573364258, "global_step": 221356, "epoch": 1829} {"train_loss": -42.73428726196289, "global_step": 221357, "epoch": 1829} {"train_loss": -42.40985107421875, "global_step": 221358, "epoch": 1829} {"train_loss": -41.91569519042969, "global_step": 221359, "epoch": 1829} {"train_loss": -43.35003662109375, "global_step": 221360, "epoch": 1829} {"train_loss": -42.09965133666992, "global_step": 221361, "epoch": 1829} {"train_loss": -42.60554122924805, "global_step": 221362, "epoch": 1829} {"train_loss": -42.70985412597656, "global_step": 221363, "epoch": 1829} {"train_loss": -42.660247802734375, "global_step": 221364, "epoch": 1829} {"train_loss": -42.77845764160156, "global_step": 221365, "epoch": 1829} {"train_loss": -43.19286346435547, "global_step": 221366, "epoch": 1829} {"train_loss": -43.021846771240234, "global_step": 221367, "epoch": 1829} {"train_loss": -42.91325759887695, "global_step": 221368, "epoch": 1829} {"train_loss": -43.65999221801758, "global_step": 221369, "epoch": 1829} {"train_loss": -43.212947845458984, "global_step": 221370, "epoch": 1829} {"train_loss": -43.130428314208984, "global_step": 221371, "epoch": 1829} {"train_loss": -42.7530517578125, "global_step": 221372, "epoch": 1829} {"train_loss": -43.41802215576172, "global_step": 221373, "epoch": 1829} {"train_loss": -43.490997314453125, "global_step": 221374, "epoch": 1829} {"train_loss": -43.308834075927734, "global_step": 221375, "epoch": 1829} {"train_loss": -43.606746673583984, "global_step": 221376, "epoch": 1829} {"train_loss": -43.61798858642578, "global_step": 221377, "epoch": 1829} {"train_loss": -43.5638313293457, "global_step": 221378, "epoch": 1829} {"train_loss": -43.558773040771484, "global_step": 221379, "epoch": 1829} {"train_loss": -43.47736358642578, "global_step": 221380, "epoch": 1829} {"train_loss": -42.18609619140625, "global_step": 221381, "epoch": 1829} {"train_loss": -42.2985954284668, "global_step": 221382, "epoch": 1829} {"train_loss": -42.825103759765625, "global_step": 221383, "epoch": 1829} {"train_loss": -42.59017562866211, "global_step": 221384, "epoch": 1829} {"train_loss": -42.03341293334961, "global_step": 221385, "epoch": 1829} {"train_loss": -42.85198974609375, "global_step": 221386, "epoch": 1829} {"train_loss": -42.20036697387695, "global_step": 221387, "epoch": 1829} {"train_loss": -41.87350082397461, "global_step": 221388, "epoch": 1829} {"train_loss": -42.659400939941406, "global_step": 221389, "epoch": 1829} {"train_loss": -42.14435577392578, "global_step": 221390, "epoch": 1829} {"train_loss": -43.17584991455078, "global_step": 221391, "epoch": 1829} {"train_loss": -42.54634475708008, "global_step": 221392, "epoch": 1829} {"train_loss": -41.61930847167969, "global_step": 221393, "epoch": 1829} {"train_loss": -43.154144287109375, "global_step": 221394, "epoch": 1829} {"train_loss": -43.03900909423828, "global_step": 221395, "epoch": 1829} {"train_loss": -42.930904388427734, "global_step": 221396, "epoch": 1829} {"train_loss": -43.22026443481445, "global_step": 221397, "epoch": 1829} {"train_loss": -42.678802490234375, "global_step": 221398, "epoch": 1829} {"train_loss": -42.3591423034668, "global_step": 221399, "epoch": 1829} {"train_loss": -42.85492706298828, "global_step": 221400, "epoch": 1829} {"train_loss": -43.244022369384766, "global_step": 221401, "epoch": 1829} {"train_loss": -41.79753875732422, "global_step": 221402, "epoch": 1829} {"train_loss": -42.41533279418945, "global_step": 221403, "epoch": 1829} {"train_loss": -42.40251541137695, "global_step": 221404, "epoch": 1829} {"train_loss": -42.68031311035156, "global_step": 221405, "epoch": 1829} {"train_loss": -42.604434967041016, "global_step": 221406, "epoch": 1829} {"train_loss": -42.4963493347168, "global_step": 221407, "epoch": 1829} {"train_loss": -43.37926483154297, "global_step": 221408, "epoch": 1829} {"train_loss": -42.014190673828125, "global_step": 221409, "epoch": 1829} {"train_loss": -41.49213409423828, "global_step": 221410, "epoch": 1829} {"train_loss": -43.37675094604492, "global_step": 221411, "epoch": 1829} {"train_loss": -42.83538818359375, "global_step": 221412, "epoch": 1829} {"train_loss": -43.2152214050293, "global_step": 221413, "epoch": 1829} {"train_loss": -42.423973083496094, "global_step": 221414, "epoch": 1829} {"train_loss": -42.349822998046875, "global_step": 221415, "epoch": 1829} {"train_loss": -41.960445404052734, "global_step": 221416, "epoch": 1829} {"train_loss": -42.639827728271484, "global_step": 221417, "epoch": 1829} {"train_loss": -43.188411712646484, "global_step": 221418, "epoch": 1829} {"train_loss": -42.09041976928711, "global_step": 221419, "epoch": 1829} {"train_loss": -43.483402252197266, "global_step": 221420, "epoch": 1829} {"train_loss": -42.869789123535156, "global_step": 221421, "epoch": 1829} {"train_loss": -43.15726089477539, "global_step": 221422, "epoch": 1829} {"train_loss": -43.78047561645508, "global_step": 221423, "epoch": 1829} {"train_loss": -42.99385070800781, "global_step": 221424, "epoch": 1829} {"train_loss": -43.39614486694336, "global_step": 221425, "epoch": 1829} {"train_loss": -43.4720458984375, "global_step": 221426, "epoch": 1829} {"train_loss": -43.41633987426758, "global_step": 221427, "epoch": 1829} {"train_loss": -43.055721282958984, "global_step": 221428, "epoch": 1829} {"train_loss": -42.298540446383896, "global_step": 221429, "epoch": 1829, "val_loss": 2585096.25} {"train_loss": -42.745033264160156, "global_step": 221430, "epoch": 1830} {"train_loss": -42.7229118347168, "global_step": 221431, "epoch": 1830} {"train_loss": -42.718475341796875, "global_step": 221432, "epoch": 1830} {"train_loss": -43.1099739074707, "global_step": 221433, "epoch": 1830} {"train_loss": -42.88462448120117, "global_step": 221434, "epoch": 1830} {"train_loss": -42.990447998046875, "global_step": 221435, "epoch": 1830} {"train_loss": -43.22246170043945, "global_step": 221436, "epoch": 1830} {"train_loss": -43.67509841918945, "global_step": 221437, "epoch": 1830} {"train_loss": -43.5863037109375, "global_step": 221438, "epoch": 1830} {"train_loss": -44.09867477416992, "global_step": 221439, "epoch": 1830} {"train_loss": -43.794647216796875, "global_step": 221440, "epoch": 1830} {"train_loss": -43.55559158325195, "global_step": 221441, "epoch": 1830} {"train_loss": -43.59780502319336, "global_step": 221442, "epoch": 1830} {"train_loss": -44.036415100097656, "global_step": 221443, "epoch": 1830} {"train_loss": -43.372310638427734, "global_step": 221444, "epoch": 1830} {"train_loss": -43.417510986328125, "global_step": 221445, "epoch": 1830} {"train_loss": -42.134437561035156, "global_step": 221446, "epoch": 1830} {"train_loss": -40.565040588378906, "global_step": 221447, "epoch": 1830} {"train_loss": -43.37847137451172, "global_step": 221448, "epoch": 1830} {"train_loss": -42.574520111083984, "global_step": 221449, "epoch": 1830} {"train_loss": -41.3065185546875, "global_step": 221450, "epoch": 1830} {"train_loss": -41.15474319458008, "global_step": 221451, "epoch": 1830} {"train_loss": -42.22397232055664, "global_step": 221452, "epoch": 1830} {"train_loss": -42.84196090698242, "global_step": 221453, "epoch": 1830} {"train_loss": -40.151527404785156, "global_step": 221454, "epoch": 1830} {"train_loss": -43.050636291503906, "global_step": 221455, "epoch": 1830} {"train_loss": -43.22883987426758, "global_step": 221456, "epoch": 1830} {"train_loss": -42.719215393066406, "global_step": 221457, "epoch": 1830} {"train_loss": -42.30924606323242, "global_step": 221458, "epoch": 1830} {"train_loss": -42.09310531616211, "global_step": 221459, "epoch": 1830} {"train_loss": -43.03047180175781, "global_step": 221460, "epoch": 1830} {"train_loss": -42.67351150512695, "global_step": 221461, "epoch": 1830} {"train_loss": -41.74839401245117, "global_step": 221462, "epoch": 1830} {"train_loss": -43.11655807495117, "global_step": 221463, "epoch": 1830} {"train_loss": -42.624935150146484, "global_step": 221464, "epoch": 1830} {"train_loss": -42.358497619628906, "global_step": 221465, "epoch": 1830} {"train_loss": -41.39393997192383, "global_step": 221466, "epoch": 1830} {"train_loss": -40.456356048583984, "global_step": 221467, "epoch": 1830} {"train_loss": -43.06120681762695, "global_step": 221468, "epoch": 1830} {"train_loss": -41.60236358642578, "global_step": 221469, "epoch": 1830} {"train_loss": -41.324127197265625, "global_step": 221470, "epoch": 1830} {"train_loss": -42.61109161376953, "global_step": 221471, "epoch": 1830} {"train_loss": -41.215904235839844, "global_step": 221472, "epoch": 1830} {"train_loss": -41.627349853515625, "global_step": 221473, "epoch": 1830} {"train_loss": -41.92289352416992, "global_step": 221474, "epoch": 1830} {"train_loss": -40.13261795043945, "global_step": 221475, "epoch": 1830} {"train_loss": -41.20928955078125, "global_step": 221476, "epoch": 1830} {"train_loss": -42.569942474365234, "global_step": 221477, "epoch": 1830} {"train_loss": -42.66239547729492, "global_step": 221478, "epoch": 1830} {"train_loss": -41.37826156616211, "global_step": 221479, "epoch": 1830} {"train_loss": -40.41904830932617, "global_step": 221480, "epoch": 1830} {"train_loss": -42.33155822753906, "global_step": 221481, "epoch": 1830} {"train_loss": -42.203975677490234, "global_step": 221482, "epoch": 1830} {"train_loss": -41.118709564208984, "global_step": 221483, "epoch": 1830} {"train_loss": -42.02960968017578, "global_step": 221484, "epoch": 1830} {"train_loss": -39.52339172363281, "global_step": 221485, "epoch": 1830} {"train_loss": -43.04041290283203, "global_step": 221486, "epoch": 1830} {"train_loss": -41.873046875, "global_step": 221487, "epoch": 1830} {"train_loss": -42.103614807128906, "global_step": 221488, "epoch": 1830} {"train_loss": -41.42757797241211, "global_step": 221489, "epoch": 1830} {"train_loss": -41.271663665771484, "global_step": 221490, "epoch": 1830} {"train_loss": -41.79265213012695, "global_step": 221491, "epoch": 1830} {"train_loss": -43.29471969604492, "global_step": 221492, "epoch": 1830} {"train_loss": -42.11854934692383, "global_step": 221493, "epoch": 1830} {"train_loss": -41.27105712890625, "global_step": 221494, "epoch": 1830} {"train_loss": -39.72317123413086, "global_step": 221495, "epoch": 1830} {"train_loss": -41.428348541259766, "global_step": 221496, "epoch": 1830} {"train_loss": -42.190528869628906, "global_step": 221497, "epoch": 1830} {"train_loss": -40.76784133911133, "global_step": 221498, "epoch": 1830} {"train_loss": -39.690956115722656, "global_step": 221499, "epoch": 1830} {"train_loss": -39.98867416381836, "global_step": 221500, "epoch": 1830} {"train_loss": -42.930870056152344, "global_step": 221501, "epoch": 1830} {"train_loss": -39.832271575927734, "global_step": 221502, "epoch": 1830} {"train_loss": -40.093597412109375, "global_step": 221503, "epoch": 1830} {"train_loss": -42.53535842895508, "global_step": 221504, "epoch": 1830} {"train_loss": -40.020389556884766, "global_step": 221505, "epoch": 1830} {"train_loss": -39.75708770751953, "global_step": 221506, "epoch": 1830} {"train_loss": -42.2318229675293, "global_step": 221507, "epoch": 1830} {"train_loss": -37.67205810546875, "global_step": 221508, "epoch": 1830} {"train_loss": -38.467384338378906, "global_step": 221509, "epoch": 1830} {"train_loss": -40.62763214111328, "global_step": 221510, "epoch": 1830} {"train_loss": -40.73715591430664, "global_step": 221511, "epoch": 1830} {"train_loss": -39.6068229675293, "global_step": 221512, "epoch": 1830} {"train_loss": -40.795711517333984, "global_step": 221513, "epoch": 1830} {"train_loss": -41.32368850708008, "global_step": 221514, "epoch": 1830} {"train_loss": -39.40581512451172, "global_step": 221515, "epoch": 1830} {"train_loss": -42.171756744384766, "global_step": 221516, "epoch": 1830} {"train_loss": -40.86198043823242, "global_step": 221517, "epoch": 1830} {"train_loss": -41.91485595703125, "global_step": 221518, "epoch": 1830} {"train_loss": -41.353816986083984, "global_step": 221519, "epoch": 1830} {"train_loss": -41.59857177734375, "global_step": 221520, "epoch": 1830} {"train_loss": -41.836814880371094, "global_step": 221521, "epoch": 1830} {"train_loss": -40.99555587768555, "global_step": 221522, "epoch": 1830} {"train_loss": -42.00962448120117, "global_step": 221523, "epoch": 1830} {"train_loss": -42.27883529663086, "global_step": 221524, "epoch": 1830} {"train_loss": -42.36110305786133, "global_step": 221525, "epoch": 1830} {"train_loss": -42.74065017700195, "global_step": 221526, "epoch": 1830} {"train_loss": -42.194026947021484, "global_step": 221527, "epoch": 1830} {"train_loss": -42.811798095703125, "global_step": 221528, "epoch": 1830} {"train_loss": -42.32351303100586, "global_step": 221529, "epoch": 1830} {"train_loss": -42.06423568725586, "global_step": 221530, "epoch": 1830} {"train_loss": -42.79749298095703, "global_step": 221531, "epoch": 1830} {"train_loss": -41.53826904296875, "global_step": 221532, "epoch": 1830} {"train_loss": -42.574100494384766, "global_step": 221533, "epoch": 1830} {"train_loss": -42.17448425292969, "global_step": 221534, "epoch": 1830} {"train_loss": -42.95094299316406, "global_step": 221535, "epoch": 1830} {"train_loss": -42.83209991455078, "global_step": 221536, "epoch": 1830} {"train_loss": -42.98194122314453, "global_step": 221537, "epoch": 1830} {"train_loss": -43.0516471862793, "global_step": 221538, "epoch": 1830} {"train_loss": -42.6633415222168, "global_step": 221539, "epoch": 1830} {"train_loss": -43.26960372924805, "global_step": 221540, "epoch": 1830} {"train_loss": -42.73152160644531, "global_step": 221541, "epoch": 1830} {"train_loss": -42.975215911865234, "global_step": 221542, "epoch": 1830} {"train_loss": -42.9656867980957, "global_step": 221543, "epoch": 1830} {"train_loss": -43.0561637878418, "global_step": 221544, "epoch": 1830} {"train_loss": -43.10906982421875, "global_step": 221545, "epoch": 1830} {"train_loss": -43.0191764831543, "global_step": 221546, "epoch": 1830} {"train_loss": -43.03931427001953, "global_step": 221547, "epoch": 1830} {"train_loss": -43.194541931152344, "global_step": 221548, "epoch": 1830} {"train_loss": -42.73340606689453, "global_step": 221549, "epoch": 1830} {"train_loss": -42.0143109786609, "global_step": 221550, "epoch": 1830, "val_loss": 2484091.75} {"train_loss": -43.33687210083008, "global_step": 221551, "epoch": 1831} {"train_loss": -42.987892150878906, "global_step": 221552, "epoch": 1831} {"train_loss": -43.37337112426758, "global_step": 221553, "epoch": 1831} {"train_loss": -43.71525955200195, "global_step": 221554, "epoch": 1831} {"train_loss": -43.196022033691406, "global_step": 221555, "epoch": 1831} {"train_loss": -43.15604019165039, "global_step": 221556, "epoch": 1831} {"train_loss": -43.28524398803711, "global_step": 221557, "epoch": 1831} {"train_loss": -43.07511520385742, "global_step": 221558, "epoch": 1831} {"train_loss": -42.968780517578125, "global_step": 221559, "epoch": 1831} {"train_loss": -43.73733901977539, "global_step": 221560, "epoch": 1831} {"train_loss": -43.73482894897461, "global_step": 221561, "epoch": 1831} {"train_loss": -43.778045654296875, "global_step": 221562, "epoch": 1831} {"train_loss": -43.65279769897461, "global_step": 221563, "epoch": 1831} {"train_loss": -43.28719711303711, "global_step": 221564, "epoch": 1831} {"train_loss": -43.190673828125, "global_step": 221565, "epoch": 1831} {"train_loss": -43.20309066772461, "global_step": 221566, "epoch": 1831} {"train_loss": -43.10852813720703, "global_step": 221567, "epoch": 1831} {"train_loss": -42.18870162963867, "global_step": 221568, "epoch": 1831} {"train_loss": -43.51095962524414, "global_step": 221569, "epoch": 1831} {"train_loss": -43.84299850463867, "global_step": 221570, "epoch": 1831} {"train_loss": -43.374237060546875, "global_step": 221571, "epoch": 1831} {"train_loss": -43.59150314331055, "global_step": 221572, "epoch": 1831} {"train_loss": -43.920936584472656, "global_step": 221573, "epoch": 1831} {"train_loss": -43.12581253051758, "global_step": 221574, "epoch": 1831} {"train_loss": -42.455848693847656, "global_step": 221575, "epoch": 1831} {"train_loss": -42.50368881225586, "global_step": 221576, "epoch": 1831} {"train_loss": -43.35619354248047, "global_step": 221577, "epoch": 1831} {"train_loss": -42.70660400390625, "global_step": 221578, "epoch": 1831} {"train_loss": -42.23460006713867, "global_step": 221579, "epoch": 1831} {"train_loss": -42.404659271240234, "global_step": 221580, "epoch": 1831} {"train_loss": -42.93996810913086, "global_step": 221581, "epoch": 1831} {"train_loss": -43.45134353637695, "global_step": 221582, "epoch": 1831} {"train_loss": -42.066062927246094, "global_step": 221583, "epoch": 1831} {"train_loss": -42.57378005981445, "global_step": 221584, "epoch": 1831} {"train_loss": -43.108638763427734, "global_step": 221585, "epoch": 1831} {"train_loss": -42.942291259765625, "global_step": 221586, "epoch": 1831} {"train_loss": -43.2121696472168, "global_step": 221587, "epoch": 1831} {"train_loss": -42.61611557006836, "global_step": 221588, "epoch": 1831} {"train_loss": -42.099300384521484, "global_step": 221589, "epoch": 1831} {"train_loss": -42.47274398803711, "global_step": 221590, "epoch": 1831} {"train_loss": -42.645320892333984, "global_step": 221591, "epoch": 1831} {"train_loss": -41.98453140258789, "global_step": 221592, "epoch": 1831} {"train_loss": -41.84626007080078, "global_step": 221593, "epoch": 1831} {"train_loss": -40.34016799926758, "global_step": 221594, "epoch": 1831} {"train_loss": -34.226829528808594, "global_step": 221595, "epoch": 1831} {"train_loss": -26.69736099243164, "global_step": 221596, "epoch": 1831} {"train_loss": -26.87908363342285, "global_step": 221597, "epoch": 1831} {"train_loss": -33.66980743408203, "global_step": 221598, "epoch": 1831} {"train_loss": -38.39424514770508, "global_step": 221599, "epoch": 1831} {"train_loss": -34.246028900146484, "global_step": 221600, "epoch": 1831} {"train_loss": -36.549468994140625, "global_step": 221601, "epoch": 1831} {"train_loss": -39.315853118896484, "global_step": 221602, "epoch": 1831} {"train_loss": -36.969181060791016, "global_step": 221603, "epoch": 1831} {"train_loss": -40.84334182739258, "global_step": 221604, "epoch": 1831} {"train_loss": -36.219627380371094, "global_step": 221605, "epoch": 1831} {"train_loss": -41.11245346069336, "global_step": 221606, "epoch": 1831} {"train_loss": -38.278656005859375, "global_step": 221607, "epoch": 1831} {"train_loss": -40.065673828125, "global_step": 221608, "epoch": 1831} {"train_loss": -40.74758529663086, "global_step": 221609, "epoch": 1831} {"train_loss": -40.91025161743164, "global_step": 221610, "epoch": 1831} {"train_loss": -40.87226486206055, "global_step": 221611, "epoch": 1831} {"train_loss": -40.941200256347656, "global_step": 221612, "epoch": 1831} {"train_loss": -40.85572814941406, "global_step": 221613, "epoch": 1831} {"train_loss": -41.37221908569336, "global_step": 221614, "epoch": 1831} {"train_loss": -40.308502197265625, "global_step": 221615, "epoch": 1831} {"train_loss": -41.53629684448242, "global_step": 221616, "epoch": 1831} {"train_loss": -40.80278778076172, "global_step": 221617, "epoch": 1831} {"train_loss": -41.65168380737305, "global_step": 221618, "epoch": 1831} {"train_loss": -41.362548828125, "global_step": 221619, "epoch": 1831} {"train_loss": -41.66823959350586, "global_step": 221620, "epoch": 1831} {"train_loss": -40.97060775756836, "global_step": 221621, "epoch": 1831} {"train_loss": -41.944339752197266, "global_step": 221622, "epoch": 1831} {"train_loss": -41.280757904052734, "global_step": 221623, "epoch": 1831} {"train_loss": -41.82455062866211, "global_step": 221624, "epoch": 1831} {"train_loss": -41.42002487182617, "global_step": 221625, "epoch": 1831} {"train_loss": -41.38686752319336, "global_step": 221626, "epoch": 1831} {"train_loss": -42.0866813659668, "global_step": 221627, "epoch": 1831} {"train_loss": -41.399959564208984, "global_step": 221628, "epoch": 1831} {"train_loss": -41.77495574951172, "global_step": 221629, "epoch": 1831} {"train_loss": -41.71375274658203, "global_step": 221630, "epoch": 1831} {"train_loss": -42.34450149536133, "global_step": 221631, "epoch": 1831} {"train_loss": -41.742332458496094, "global_step": 221632, "epoch": 1831} {"train_loss": -42.40177917480469, "global_step": 221633, "epoch": 1831} {"train_loss": -41.37449264526367, "global_step": 221634, "epoch": 1831} {"train_loss": -41.398216247558594, "global_step": 221635, "epoch": 1831} {"train_loss": -42.825653076171875, "global_step": 221636, "epoch": 1831} {"train_loss": -41.25444412231445, "global_step": 221637, "epoch": 1831} {"train_loss": -43.0479736328125, "global_step": 221638, "epoch": 1831} {"train_loss": -42.00168991088867, "global_step": 221639, "epoch": 1831} {"train_loss": -42.58297348022461, "global_step": 221640, "epoch": 1831} {"train_loss": -43.09540557861328, "global_step": 221641, "epoch": 1831} {"train_loss": -42.32328414916992, "global_step": 221642, "epoch": 1831} {"train_loss": -43.09515380859375, "global_step": 221643, "epoch": 1831} {"train_loss": -42.34535598754883, "global_step": 221644, "epoch": 1831} {"train_loss": -42.474063873291016, "global_step": 221645, "epoch": 1831} {"train_loss": -43.228614807128906, "global_step": 221646, "epoch": 1831} {"train_loss": -42.66366195678711, "global_step": 221647, "epoch": 1831} {"train_loss": -42.910743713378906, "global_step": 221648, "epoch": 1831} {"train_loss": -42.97862243652344, "global_step": 221649, "epoch": 1831} {"train_loss": -43.02729415893555, "global_step": 221650, "epoch": 1831} {"train_loss": -43.39878845214844, "global_step": 221651, "epoch": 1831} {"train_loss": -42.81757736206055, "global_step": 221652, "epoch": 1831} {"train_loss": -43.2958869934082, "global_step": 221653, "epoch": 1831} {"train_loss": -43.3046760559082, "global_step": 221654, "epoch": 1831} {"train_loss": -43.369258880615234, "global_step": 221655, "epoch": 1831} {"train_loss": -43.352413177490234, "global_step": 221656, "epoch": 1831} {"train_loss": -43.403743743896484, "global_step": 221657, "epoch": 1831} {"train_loss": -43.39186477661133, "global_step": 221658, "epoch": 1831} {"train_loss": -43.4892578125, "global_step": 221659, "epoch": 1831} {"train_loss": -43.27777862548828, "global_step": 221660, "epoch": 1831} {"train_loss": -43.4909553527832, "global_step": 221661, "epoch": 1831} {"train_loss": -43.760772705078125, "global_step": 221662, "epoch": 1831} {"train_loss": -43.50586700439453, "global_step": 221663, "epoch": 1831} {"train_loss": -42.98907470703125, "global_step": 221664, "epoch": 1831} {"train_loss": -39.98835754394531, "global_step": 221665, "epoch": 1831} {"train_loss": -43.30170440673828, "global_step": 221666, "epoch": 1831} {"train_loss": -43.528926849365234, "global_step": 221667, "epoch": 1831} {"train_loss": -43.670101165771484, "global_step": 221668, "epoch": 1831} {"train_loss": -43.383522033691406, "global_step": 221669, "epoch": 1831} {"train_loss": -43.07118225097656, "global_step": 221670, "epoch": 1831} {"train_loss": -41.80812985443872, "global_step": 221671, "epoch": 1831, "val_loss": 2658026.0} {"train_loss": -43.71079635620117, "global_step": 221672, "epoch": 1832} {"train_loss": -43.392982482910156, "global_step": 221673, "epoch": 1832} {"train_loss": -43.40581130981445, "global_step": 221674, "epoch": 1832} {"train_loss": -43.584529876708984, "global_step": 221675, "epoch": 1832} {"train_loss": -43.08415985107422, "global_step": 221676, "epoch": 1832} {"train_loss": -32.70988082885742, "global_step": 221677, "epoch": 1832} {"train_loss": -42.6952018737793, "global_step": 221678, "epoch": 1832} {"train_loss": -42.03156280517578, "global_step": 221679, "epoch": 1832} {"train_loss": -42.3543815612793, "global_step": 221680, "epoch": 1832} {"train_loss": -43.24360275268555, "global_step": 221681, "epoch": 1832} {"train_loss": -43.22929000854492, "global_step": 221682, "epoch": 1832} {"train_loss": -41.868621826171875, "global_step": 221683, "epoch": 1832} {"train_loss": -40.834590911865234, "global_step": 221684, "epoch": 1832} {"train_loss": -40.801124572753906, "global_step": 221685, "epoch": 1832} {"train_loss": -41.859901428222656, "global_step": 221686, "epoch": 1832} {"train_loss": -41.094783782958984, "global_step": 221687, "epoch": 1832} {"train_loss": -41.445777893066406, "global_step": 221688, "epoch": 1832} {"train_loss": -40.21045684814453, "global_step": 221689, "epoch": 1832} {"train_loss": -41.08197021484375, "global_step": 221690, "epoch": 1832} {"train_loss": -41.7097053527832, "global_step": 221691, "epoch": 1832} {"train_loss": -39.443843841552734, "global_step": 221692, "epoch": 1832} {"train_loss": -41.179168701171875, "global_step": 221693, "epoch": 1832} {"train_loss": -41.85818099975586, "global_step": 221694, "epoch": 1832} {"train_loss": -39.28432846069336, "global_step": 221695, "epoch": 1832} {"train_loss": -39.287166595458984, "global_step": 221696, "epoch": 1832} {"train_loss": -40.577911376953125, "global_step": 221697, "epoch": 1832} {"train_loss": -36.24671936035156, "global_step": 221698, "epoch": 1832} {"train_loss": -41.691802978515625, "global_step": 221699, "epoch": 1832} {"train_loss": -39.65851974487305, "global_step": 221700, "epoch": 1832} {"train_loss": -40.856536865234375, "global_step": 221701, "epoch": 1832} {"train_loss": -39.556427001953125, "global_step": 221702, "epoch": 1832} {"train_loss": -40.1204833984375, "global_step": 221703, "epoch": 1832} {"train_loss": -38.11127853393555, "global_step": 221704, "epoch": 1832} {"train_loss": -40.7291374206543, "global_step": 221705, "epoch": 1832} {"train_loss": -41.00790023803711, "global_step": 221706, "epoch": 1832} {"train_loss": -37.34200668334961, "global_step": 221707, "epoch": 1832} {"train_loss": -40.20764923095703, "global_step": 221708, "epoch": 1832} {"train_loss": -38.2957878112793, "global_step": 221709, "epoch": 1832} {"train_loss": -40.70308303833008, "global_step": 221710, "epoch": 1832} {"train_loss": -40.61480712890625, "global_step": 221711, "epoch": 1832} {"train_loss": -40.575347900390625, "global_step": 221712, "epoch": 1832} {"train_loss": -38.69552230834961, "global_step": 221713, "epoch": 1832} {"train_loss": -40.82154846191406, "global_step": 221714, "epoch": 1832} {"train_loss": -41.36357879638672, "global_step": 221715, "epoch": 1832} {"train_loss": -41.71902084350586, "global_step": 221716, "epoch": 1832} {"train_loss": -41.819881439208984, "global_step": 221717, "epoch": 1832} {"train_loss": -40.56898498535156, "global_step": 221718, "epoch": 1832} {"train_loss": -41.548744201660156, "global_step": 221719, "epoch": 1832} {"train_loss": -40.876277923583984, "global_step": 221720, "epoch": 1832} {"train_loss": -41.53006362915039, "global_step": 221721, "epoch": 1832} {"train_loss": -42.076805114746094, "global_step": 221722, "epoch": 1832} {"train_loss": -41.7645378112793, "global_step": 221723, "epoch": 1832} {"train_loss": -41.32758712768555, "global_step": 221724, "epoch": 1832} {"train_loss": -41.042938232421875, "global_step": 221725, "epoch": 1832} {"train_loss": -40.50138473510742, "global_step": 221726, "epoch": 1832} {"train_loss": -40.13389205932617, "global_step": 221727, "epoch": 1832} {"train_loss": -41.5136604309082, "global_step": 221728, "epoch": 1832} {"train_loss": -39.001136779785156, "global_step": 221729, "epoch": 1832} {"train_loss": -36.62207794189453, "global_step": 221730, "epoch": 1832} {"train_loss": -41.127017974853516, "global_step": 221731, "epoch": 1832} {"train_loss": -41.17551040649414, "global_step": 221732, "epoch": 1832} {"train_loss": -39.79933547973633, "global_step": 221733, "epoch": 1832} {"train_loss": -41.59159469604492, "global_step": 221734, "epoch": 1832} {"train_loss": -41.36027145385742, "global_step": 221735, "epoch": 1832} {"train_loss": -41.27860641479492, "global_step": 221736, "epoch": 1832} {"train_loss": -41.606529235839844, "global_step": 221737, "epoch": 1832} {"train_loss": -41.982818603515625, "global_step": 221738, "epoch": 1832} {"train_loss": -42.44039535522461, "global_step": 221739, "epoch": 1832} {"train_loss": -41.69160079956055, "global_step": 221740, "epoch": 1832} {"train_loss": -41.805641174316406, "global_step": 221741, "epoch": 1832} {"train_loss": -42.075782775878906, "global_step": 221742, "epoch": 1832} {"train_loss": -42.57108688354492, "global_step": 221743, "epoch": 1832} {"train_loss": -41.78052520751953, "global_step": 221744, "epoch": 1832} {"train_loss": -41.40541458129883, "global_step": 221745, "epoch": 1832} {"train_loss": -42.168941497802734, "global_step": 221746, "epoch": 1832} {"train_loss": -42.488441467285156, "global_step": 221747, "epoch": 1832} {"train_loss": -42.83258819580078, "global_step": 221748, "epoch": 1832} {"train_loss": -42.45277404785156, "global_step": 221749, "epoch": 1832} {"train_loss": -42.3446159362793, "global_step": 221750, "epoch": 1832} {"train_loss": -42.01263427734375, "global_step": 221751, "epoch": 1832} {"train_loss": -42.840755462646484, "global_step": 221752, "epoch": 1832} {"train_loss": -42.129066467285156, "global_step": 221753, "epoch": 1832} {"train_loss": -42.46901321411133, "global_step": 221754, "epoch": 1832} {"train_loss": -42.56103515625, "global_step": 221755, "epoch": 1832} {"train_loss": -42.9407844543457, "global_step": 221756, "epoch": 1832} {"train_loss": -42.40641403198242, "global_step": 221757, "epoch": 1832} {"train_loss": -42.581912994384766, "global_step": 221758, "epoch": 1832} {"train_loss": -42.994056701660156, "global_step": 221759, "epoch": 1832} {"train_loss": -42.569087982177734, "global_step": 221760, "epoch": 1832} {"train_loss": -43.31480026245117, "global_step": 221761, "epoch": 1832} {"train_loss": -42.0583381652832, "global_step": 221762, "epoch": 1832} {"train_loss": -42.1041145324707, "global_step": 221763, "epoch": 1832} {"train_loss": -42.03093338012695, "global_step": 221764, "epoch": 1832} {"train_loss": -43.09450912475586, "global_step": 221765, "epoch": 1832} {"train_loss": -42.85011291503906, "global_step": 221766, "epoch": 1832} {"train_loss": -42.73199462890625, "global_step": 221767, "epoch": 1832} {"train_loss": -43.12428665161133, "global_step": 221768, "epoch": 1832} {"train_loss": -43.067176818847656, "global_step": 221769, "epoch": 1832} {"train_loss": -42.619136810302734, "global_step": 221770, "epoch": 1832} {"train_loss": -42.78969192504883, "global_step": 221771, "epoch": 1832} {"train_loss": -43.29103088378906, "global_step": 221772, "epoch": 1832} {"train_loss": -42.59412384033203, "global_step": 221773, "epoch": 1832} {"train_loss": -43.206050872802734, "global_step": 221774, "epoch": 1832} {"train_loss": -42.91566848754883, "global_step": 221775, "epoch": 1832} {"train_loss": -42.97036361694336, "global_step": 221776, "epoch": 1832} {"train_loss": -42.02632522583008, "global_step": 221777, "epoch": 1832} {"train_loss": -41.94005584716797, "global_step": 221778, "epoch": 1832} {"train_loss": -41.48935317993164, "global_step": 221779, "epoch": 1832} {"train_loss": -42.309913635253906, "global_step": 221780, "epoch": 1832} {"train_loss": -43.1474609375, "global_step": 221781, "epoch": 1832} {"train_loss": -41.66511917114258, "global_step": 221782, "epoch": 1832} {"train_loss": -41.15065383911133, "global_step": 221783, "epoch": 1832} {"train_loss": -40.67879867553711, "global_step": 221784, "epoch": 1832} {"train_loss": -40.43488311767578, "global_step": 221785, "epoch": 1832} {"train_loss": -42.0208854675293, "global_step": 221786, "epoch": 1832} {"train_loss": -42.43272399902344, "global_step": 221787, "epoch": 1832} {"train_loss": -38.92234802246094, "global_step": 221788, "epoch": 1832} {"train_loss": -42.53312683105469, "global_step": 221789, "epoch": 1832} {"train_loss": -38.10728073120117, "global_step": 221790, "epoch": 1832} {"train_loss": -39.474159240722656, "global_step": 221791, "epoch": 1832} {"train_loss": -41.38234862020193, "global_step": 221792, "epoch": 1832, "val_loss": 2573970.75} {"train_loss": -40.08986282348633, "global_step": 221793, "epoch": 1833} {"train_loss": -39.40985107421875, "global_step": 221794, "epoch": 1833} {"train_loss": -40.84198760986328, "global_step": 221795, "epoch": 1833} {"train_loss": -38.06692886352539, "global_step": 221796, "epoch": 1833} {"train_loss": -42.0576057434082, "global_step": 221797, "epoch": 1833} {"train_loss": -38.19199752807617, "global_step": 221798, "epoch": 1833} {"train_loss": -41.61062240600586, "global_step": 221799, "epoch": 1833} {"train_loss": -39.21273422241211, "global_step": 221800, "epoch": 1833} {"train_loss": -36.09101104736328, "global_step": 221801, "epoch": 1833} {"train_loss": -35.96644592285156, "global_step": 221802, "epoch": 1833} {"train_loss": -39.811824798583984, "global_step": 221803, "epoch": 1833} {"train_loss": -41.97629928588867, "global_step": 221804, "epoch": 1833} {"train_loss": -38.89204788208008, "global_step": 221805, "epoch": 1833} {"train_loss": -37.62577438354492, "global_step": 221806, "epoch": 1833} {"train_loss": -40.05584716796875, "global_step": 221807, "epoch": 1833} {"train_loss": -41.860267639160156, "global_step": 221808, "epoch": 1833} {"train_loss": -40.18561553955078, "global_step": 221809, "epoch": 1833} {"train_loss": -40.5445556640625, "global_step": 221810, "epoch": 1833} {"train_loss": -41.393096923828125, "global_step": 221811, "epoch": 1833} {"train_loss": -41.60655212402344, "global_step": 221812, "epoch": 1833} {"train_loss": -41.06525421142578, "global_step": 221813, "epoch": 1833} {"train_loss": -41.71052551269531, "global_step": 221814, "epoch": 1833} {"train_loss": -41.98681640625, "global_step": 221815, "epoch": 1833} {"train_loss": -40.820858001708984, "global_step": 221816, "epoch": 1833} {"train_loss": -41.884090423583984, "global_step": 221817, "epoch": 1833} {"train_loss": -41.889183044433594, "global_step": 221818, "epoch": 1833} {"train_loss": -41.386383056640625, "global_step": 221819, "epoch": 1833} {"train_loss": -42.459503173828125, "global_step": 221820, "epoch": 1833} {"train_loss": -41.4764518737793, "global_step": 221821, "epoch": 1833} {"train_loss": -42.113948822021484, "global_step": 221822, "epoch": 1833} {"train_loss": -42.53998565673828, "global_step": 221823, "epoch": 1833} {"train_loss": -41.30784225463867, "global_step": 221824, "epoch": 1833} {"train_loss": -42.37102508544922, "global_step": 221825, "epoch": 1833} {"train_loss": -42.2714729309082, "global_step": 221826, "epoch": 1833} {"train_loss": -41.53936767578125, "global_step": 221827, "epoch": 1833} {"train_loss": -42.149147033691406, "global_step": 221828, "epoch": 1833} {"train_loss": -41.9173698425293, "global_step": 221829, "epoch": 1833} {"train_loss": -41.056915283203125, "global_step": 221830, "epoch": 1833} {"train_loss": -42.604217529296875, "global_step": 221831, "epoch": 1833} {"train_loss": -43.07353591918945, "global_step": 221832, "epoch": 1833} {"train_loss": -41.892513275146484, "global_step": 221833, "epoch": 1833} {"train_loss": -42.17695236206055, "global_step": 221834, "epoch": 1833} {"train_loss": -41.801475524902344, "global_step": 221835, "epoch": 1833} {"train_loss": -42.878902435302734, "global_step": 221836, "epoch": 1833} {"train_loss": -42.01918411254883, "global_step": 221837, "epoch": 1833} {"train_loss": -42.66123580932617, "global_step": 221838, "epoch": 1833} {"train_loss": -42.42115020751953, "global_step": 221839, "epoch": 1833} {"train_loss": -41.78050994873047, "global_step": 221840, "epoch": 1833} {"train_loss": -42.84096145629883, "global_step": 221841, "epoch": 1833} {"train_loss": -42.28664016723633, "global_step": 221842, "epoch": 1833} {"train_loss": -42.89160919189453, "global_step": 221843, "epoch": 1833} {"train_loss": -42.69690704345703, "global_step": 221844, "epoch": 1833} {"train_loss": -42.48931884765625, "global_step": 221845, "epoch": 1833} {"train_loss": -42.61080551147461, "global_step": 221846, "epoch": 1833} {"train_loss": -42.90339660644531, "global_step": 221847, "epoch": 1833} {"train_loss": -42.705989837646484, "global_step": 221848, "epoch": 1833} {"train_loss": -42.59275436401367, "global_step": 221849, "epoch": 1833} {"train_loss": -42.6022834777832, "global_step": 221850, "epoch": 1833} {"train_loss": -42.572662353515625, "global_step": 221851, "epoch": 1833} {"train_loss": -42.23716354370117, "global_step": 221852, "epoch": 1833} {"train_loss": -41.99897384643555, "global_step": 221853, "epoch": 1833} {"train_loss": -42.76180648803711, "global_step": 221854, "epoch": 1833} {"train_loss": -42.80671310424805, "global_step": 221855, "epoch": 1833} {"train_loss": -41.74560546875, "global_step": 221856, "epoch": 1833} {"train_loss": -43.04368209838867, "global_step": 221857, "epoch": 1833} {"train_loss": -42.215370178222656, "global_step": 221858, "epoch": 1833} {"train_loss": -43.372684478759766, "global_step": 221859, "epoch": 1833} {"train_loss": -43.25104904174805, "global_step": 221860, "epoch": 1833} {"train_loss": -42.841400146484375, "global_step": 221861, "epoch": 1833} {"train_loss": -41.87174606323242, "global_step": 221862, "epoch": 1833} {"train_loss": -42.88359069824219, "global_step": 221863, "epoch": 1833} {"train_loss": -43.02903366088867, "global_step": 221864, "epoch": 1833} {"train_loss": -41.822628021240234, "global_step": 221865, "epoch": 1833} {"train_loss": -41.922698974609375, "global_step": 221866, "epoch": 1833} {"train_loss": -42.74345397949219, "global_step": 221867, "epoch": 1833} {"train_loss": -42.27851104736328, "global_step": 221868, "epoch": 1833} {"train_loss": -43.04513168334961, "global_step": 221869, "epoch": 1833} {"train_loss": -42.5416259765625, "global_step": 221870, "epoch": 1833} {"train_loss": -41.76858139038086, "global_step": 221871, "epoch": 1833} {"train_loss": -42.99260330200195, "global_step": 221872, "epoch": 1833} {"train_loss": -43.085296630859375, "global_step": 221873, "epoch": 1833} {"train_loss": -43.369972229003906, "global_step": 221874, "epoch": 1833} {"train_loss": -43.13054275512695, "global_step": 221875, "epoch": 1833} {"train_loss": -42.12766647338867, "global_step": 221876, "epoch": 1833} {"train_loss": -42.96024703979492, "global_step": 221877, "epoch": 1833} {"train_loss": -42.56296157836914, "global_step": 221878, "epoch": 1833} {"train_loss": -42.48934555053711, "global_step": 221879, "epoch": 1833} {"train_loss": -43.555213928222656, "global_step": 221880, "epoch": 1833} {"train_loss": -42.981727600097656, "global_step": 221881, "epoch": 1833} {"train_loss": -42.162986755371094, "global_step": 221882, "epoch": 1833} {"train_loss": -43.31513595581055, "global_step": 221883, "epoch": 1833} {"train_loss": -43.0977668762207, "global_step": 221884, "epoch": 1833} {"train_loss": -43.4099235534668, "global_step": 221885, "epoch": 1833} {"train_loss": -42.7199821472168, "global_step": 221886, "epoch": 1833} {"train_loss": -43.25162124633789, "global_step": 221887, "epoch": 1833} {"train_loss": -43.1910514831543, "global_step": 221888, "epoch": 1833} {"train_loss": -42.436641693115234, "global_step": 221889, "epoch": 1833} {"train_loss": -42.62392044067383, "global_step": 221890, "epoch": 1833} {"train_loss": -42.88520431518555, "global_step": 221891, "epoch": 1833} {"train_loss": -42.530391693115234, "global_step": 221892, "epoch": 1833} {"train_loss": -42.54230499267578, "global_step": 221893, "epoch": 1833} {"train_loss": -43.265625, "global_step": 221894, "epoch": 1833} {"train_loss": -41.9576530456543, "global_step": 221895, "epoch": 1833} {"train_loss": -42.80703353881836, "global_step": 221896, "epoch": 1833} {"train_loss": -41.807369232177734, "global_step": 221897, "epoch": 1833} {"train_loss": -43.05712127685547, "global_step": 221898, "epoch": 1833} {"train_loss": -42.84098815917969, "global_step": 221899, "epoch": 1833} {"train_loss": -42.747920989990234, "global_step": 221900, "epoch": 1833} {"train_loss": -42.45842361450195, "global_step": 221901, "epoch": 1833} {"train_loss": -42.61341094970703, "global_step": 221902, "epoch": 1833} {"train_loss": -42.01825714111328, "global_step": 221903, "epoch": 1833} {"train_loss": -42.8277587890625, "global_step": 221904, "epoch": 1833} {"train_loss": -42.597408294677734, "global_step": 221905, "epoch": 1833} {"train_loss": -43.419490814208984, "global_step": 221906, "epoch": 1833} {"train_loss": -42.39616012573242, "global_step": 221907, "epoch": 1833} {"train_loss": -43.19585418701172, "global_step": 221908, "epoch": 1833} {"train_loss": -42.720558166503906, "global_step": 221909, "epoch": 1833} {"train_loss": -43.44779968261719, "global_step": 221910, "epoch": 1833} {"train_loss": -42.321659088134766, "global_step": 221911, "epoch": 1833} {"train_loss": -43.3916015625, "global_step": 221912, "epoch": 1833} {"train_loss": -42.04613794374072, "global_step": 221913, "epoch": 1833, "val_loss": 2486461.75} {"train_loss": -42.783546447753906, "global_step": 221914, "epoch": 1834} {"train_loss": -42.304290771484375, "global_step": 221915, "epoch": 1834} {"train_loss": -41.319698333740234, "global_step": 221916, "epoch": 1834} {"train_loss": -39.976993560791016, "global_step": 221917, "epoch": 1834} {"train_loss": -42.844818115234375, "global_step": 221918, "epoch": 1834} {"train_loss": -41.3848876953125, "global_step": 221919, "epoch": 1834} {"train_loss": -41.783233642578125, "global_step": 221920, "epoch": 1834} {"train_loss": -42.08932113647461, "global_step": 221921, "epoch": 1834} {"train_loss": -40.07981872558594, "global_step": 221922, "epoch": 1834} {"train_loss": -42.15253829956055, "global_step": 221923, "epoch": 1834} {"train_loss": -42.77620315551758, "global_step": 221924, "epoch": 1834} {"train_loss": -42.22163772583008, "global_step": 221925, "epoch": 1834} {"train_loss": -42.937034606933594, "global_step": 221926, "epoch": 1834} {"train_loss": -41.05982208251953, "global_step": 221927, "epoch": 1834} {"train_loss": -42.48012924194336, "global_step": 221928, "epoch": 1834} {"train_loss": -41.0981330871582, "global_step": 221929, "epoch": 1834} {"train_loss": -40.92031478881836, "global_step": 221930, "epoch": 1834} {"train_loss": -42.43796920776367, "global_step": 221931, "epoch": 1834} {"train_loss": -39.89814376831055, "global_step": 221932, "epoch": 1834} {"train_loss": -41.73179244995117, "global_step": 221933, "epoch": 1834} {"train_loss": -41.13554000854492, "global_step": 221934, "epoch": 1834} {"train_loss": -41.466854095458984, "global_step": 221935, "epoch": 1834} {"train_loss": -38.55126953125, "global_step": 221936, "epoch": 1834} {"train_loss": -42.34138488769531, "global_step": 221937, "epoch": 1834} {"train_loss": -36.371456146240234, "global_step": 221938, "epoch": 1834} {"train_loss": -37.538604736328125, "global_step": 221939, "epoch": 1834} {"train_loss": -38.6479377746582, "global_step": 221940, "epoch": 1834} {"train_loss": -39.34096908569336, "global_step": 221941, "epoch": 1834} {"train_loss": -40.5959358215332, "global_step": 221942, "epoch": 1834} {"train_loss": -40.577266693115234, "global_step": 221943, "epoch": 1834} {"train_loss": -36.68703842163086, "global_step": 221944, "epoch": 1834} {"train_loss": -41.81753158569336, "global_step": 221945, "epoch": 1834} {"train_loss": -39.678977966308594, "global_step": 221946, "epoch": 1834} {"train_loss": -38.17702865600586, "global_step": 221947, "epoch": 1834} {"train_loss": -40.73967361450195, "global_step": 221948, "epoch": 1834} {"train_loss": -41.7402458190918, "global_step": 221949, "epoch": 1834} {"train_loss": -37.94465255737305, "global_step": 221950, "epoch": 1834} {"train_loss": -42.423919677734375, "global_step": 221951, "epoch": 1834} {"train_loss": -40.02667999267578, "global_step": 221952, "epoch": 1834} {"train_loss": -41.10850524902344, "global_step": 221953, "epoch": 1834} {"train_loss": -40.50649642944336, "global_step": 221954, "epoch": 1834} {"train_loss": -39.0452995300293, "global_step": 221955, "epoch": 1834} {"train_loss": -42.34224319458008, "global_step": 221956, "epoch": 1834} {"train_loss": -39.5599479675293, "global_step": 221957, "epoch": 1834} {"train_loss": -40.72288131713867, "global_step": 221958, "epoch": 1834} {"train_loss": -41.10512161254883, "global_step": 221959, "epoch": 1834} {"train_loss": -41.03731155395508, "global_step": 221960, "epoch": 1834} {"train_loss": -42.3346061706543, "global_step": 221961, "epoch": 1834} {"train_loss": -41.36862564086914, "global_step": 221962, "epoch": 1834} {"train_loss": -41.9614143371582, "global_step": 221963, "epoch": 1834} {"train_loss": -41.75396728515625, "global_step": 221964, "epoch": 1834} {"train_loss": -41.63291549682617, "global_step": 221965, "epoch": 1834} {"train_loss": -41.86724853515625, "global_step": 221966, "epoch": 1834} {"train_loss": -41.14974594116211, "global_step": 221967, "epoch": 1834} {"train_loss": -41.487361907958984, "global_step": 221968, "epoch": 1834} {"train_loss": -42.015174865722656, "global_step": 221969, "epoch": 1834} {"train_loss": -42.27118682861328, "global_step": 221970, "epoch": 1834} {"train_loss": -42.51862716674805, "global_step": 221971, "epoch": 1834} {"train_loss": -42.19282150268555, "global_step": 221972, "epoch": 1834} {"train_loss": -42.629695892333984, "global_step": 221973, "epoch": 1834} {"train_loss": -41.59550857543945, "global_step": 221974, "epoch": 1834} {"train_loss": -42.455162048339844, "global_step": 221975, "epoch": 1834} {"train_loss": -41.582916259765625, "global_step": 221976, "epoch": 1834} {"train_loss": -41.71540832519531, "global_step": 221977, "epoch": 1834} {"train_loss": -42.3332405090332, "global_step": 221978, "epoch": 1834} {"train_loss": -42.54642105102539, "global_step": 221979, "epoch": 1834} {"train_loss": -42.38467025756836, "global_step": 221980, "epoch": 1834} {"train_loss": -43.050601959228516, "global_step": 221981, "epoch": 1834} {"train_loss": -42.54293441772461, "global_step": 221982, "epoch": 1834} {"train_loss": -42.86320114135742, "global_step": 221983, "epoch": 1834} {"train_loss": -43.40797805786133, "global_step": 221984, "epoch": 1834} {"train_loss": -43.155181884765625, "global_step": 221985, "epoch": 1834} {"train_loss": -42.877933502197266, "global_step": 221986, "epoch": 1834} {"train_loss": -43.73550033569336, "global_step": 221987, "epoch": 1834} {"train_loss": -43.14389419555664, "global_step": 221988, "epoch": 1834} {"train_loss": -42.8526611328125, "global_step": 221989, "epoch": 1834} {"train_loss": -43.210548400878906, "global_step": 221990, "epoch": 1834} {"train_loss": -43.59421920776367, "global_step": 221991, "epoch": 1834} {"train_loss": -42.694461822509766, "global_step": 221992, "epoch": 1834} {"train_loss": -43.38255310058594, "global_step": 221993, "epoch": 1834} {"train_loss": -43.66694259643555, "global_step": 221994, "epoch": 1834} {"train_loss": -43.1023063659668, "global_step": 221995, "epoch": 1834} {"train_loss": -43.694671630859375, "global_step": 221996, "epoch": 1834} {"train_loss": -43.473201751708984, "global_step": 221997, "epoch": 1834} {"train_loss": -43.49346160888672, "global_step": 221998, "epoch": 1834} {"train_loss": -43.72197341918945, "global_step": 221999, "epoch": 1834} {"train_loss": -43.75461959838867, "global_step": 222000, "epoch": 1834} {"train_loss": -43.355552673339844, "global_step": 222001, "epoch": 1834} {"train_loss": -43.62758255004883, "global_step": 222002, "epoch": 1834} {"train_loss": -43.57841110229492, "global_step": 222003, "epoch": 1834} {"train_loss": -43.76570129394531, "global_step": 222004, "epoch": 1834} {"train_loss": -43.557796478271484, "global_step": 222005, "epoch": 1834} {"train_loss": -44.162784576416016, "global_step": 222006, "epoch": 1834} {"train_loss": -43.90528106689453, "global_step": 222007, "epoch": 1834} {"train_loss": -43.44919967651367, "global_step": 222008, "epoch": 1834} {"train_loss": -43.52751541137695, "global_step": 222009, "epoch": 1834} {"train_loss": -43.779293060302734, "global_step": 222010, "epoch": 1834} {"train_loss": -43.29956817626953, "global_step": 222011, "epoch": 1834} {"train_loss": -43.66904830932617, "global_step": 222012, "epoch": 1834} {"train_loss": -43.871334075927734, "global_step": 222013, "epoch": 1834} {"train_loss": -43.88871383666992, "global_step": 222014, "epoch": 1834} {"train_loss": -43.75702667236328, "global_step": 222015, "epoch": 1834} {"train_loss": -43.203365325927734, "global_step": 222016, "epoch": 1834} {"train_loss": -42.963592529296875, "global_step": 222017, "epoch": 1834} {"train_loss": -43.830169677734375, "global_step": 222018, "epoch": 1834} {"train_loss": -43.14802169799805, "global_step": 222019, "epoch": 1834} {"train_loss": -42.90848922729492, "global_step": 222020, "epoch": 1834} {"train_loss": -42.51789855957031, "global_step": 222021, "epoch": 1834} {"train_loss": -41.7440299987793, "global_step": 222022, "epoch": 1834} {"train_loss": -42.66920471191406, "global_step": 222023, "epoch": 1834} {"train_loss": -43.23942947387695, "global_step": 222024, "epoch": 1834} {"train_loss": -43.516754150390625, "global_step": 222025, "epoch": 1834} {"train_loss": -43.6932487487793, "global_step": 222026, "epoch": 1834} {"train_loss": -42.801578521728516, "global_step": 222027, "epoch": 1834} {"train_loss": -42.79856872558594, "global_step": 222028, "epoch": 1834} {"train_loss": -42.395301818847656, "global_step": 222029, "epoch": 1834} {"train_loss": -41.98068618774414, "global_step": 222030, "epoch": 1834} {"train_loss": -42.156429290771484, "global_step": 222031, "epoch": 1834} {"train_loss": -41.69913864135742, "global_step": 222032, "epoch": 1834} {"train_loss": -40.93986511230469, "global_step": 222033, "epoch": 1834} {"train_loss": -42.028228759765625, "global_step": 222034, "epoch": 1834, "val_loss": 2523760.75} {"train_loss": -43.29658126831055, "global_step": 222035, "epoch": 1835} {"train_loss": -40.232093811035156, "global_step": 222036, "epoch": 1835} {"train_loss": -41.05224609375, "global_step": 222037, "epoch": 1835} {"train_loss": -42.9480094909668, "global_step": 222038, "epoch": 1835} {"train_loss": -42.114532470703125, "global_step": 222039, "epoch": 1835} {"train_loss": -40.86026382446289, "global_step": 222040, "epoch": 1835} {"train_loss": -40.96235275268555, "global_step": 222041, "epoch": 1835} {"train_loss": -41.479373931884766, "global_step": 222042, "epoch": 1835} {"train_loss": -42.350345611572266, "global_step": 222043, "epoch": 1835} {"train_loss": -42.5748176574707, "global_step": 222044, "epoch": 1835} {"train_loss": -41.008541107177734, "global_step": 222045, "epoch": 1835} {"train_loss": -39.96236038208008, "global_step": 222046, "epoch": 1835} {"train_loss": -41.914310455322266, "global_step": 222047, "epoch": 1835} {"train_loss": -39.02535629272461, "global_step": 222048, "epoch": 1835} {"train_loss": -40.27628707885742, "global_step": 222049, "epoch": 1835} {"train_loss": -41.19834899902344, "global_step": 222050, "epoch": 1835} {"train_loss": -40.851863861083984, "global_step": 222051, "epoch": 1835} {"train_loss": -41.42527389526367, "global_step": 222052, "epoch": 1835} {"train_loss": -41.98800277709961, "global_step": 222053, "epoch": 1835} {"train_loss": -42.40829086303711, "global_step": 222054, "epoch": 1835} {"train_loss": -42.14113998413086, "global_step": 222055, "epoch": 1835} {"train_loss": -41.388458251953125, "global_step": 222056, "epoch": 1835} {"train_loss": -41.90549850463867, "global_step": 222057, "epoch": 1835} {"train_loss": -42.32732009887695, "global_step": 222058, "epoch": 1835} {"train_loss": -42.29116439819336, "global_step": 222059, "epoch": 1835} {"train_loss": -41.93304443359375, "global_step": 222060, "epoch": 1835} {"train_loss": -42.42644119262695, "global_step": 222061, "epoch": 1835} {"train_loss": -43.34510803222656, "global_step": 222062, "epoch": 1835} {"train_loss": -41.16645431518555, "global_step": 222063, "epoch": 1835} {"train_loss": -42.94703674316406, "global_step": 222064, "epoch": 1835} {"train_loss": -41.89022445678711, "global_step": 222065, "epoch": 1835} {"train_loss": -41.754058837890625, "global_step": 222066, "epoch": 1835} {"train_loss": -41.8712272644043, "global_step": 222067, "epoch": 1835} {"train_loss": -42.552162170410156, "global_step": 222068, "epoch": 1835} {"train_loss": -43.02756881713867, "global_step": 222069, "epoch": 1835} {"train_loss": -41.564208984375, "global_step": 222070, "epoch": 1835} {"train_loss": -43.0987548828125, "global_step": 222071, "epoch": 1835} {"train_loss": -42.013771057128906, "global_step": 222072, "epoch": 1835} {"train_loss": -42.042869567871094, "global_step": 222073, "epoch": 1835} {"train_loss": -42.145206451416016, "global_step": 222074, "epoch": 1835} {"train_loss": -42.453285217285156, "global_step": 222075, "epoch": 1835} {"train_loss": -43.168880462646484, "global_step": 222076, "epoch": 1835} {"train_loss": -42.924285888671875, "global_step": 222077, "epoch": 1835} {"train_loss": -42.766597747802734, "global_step": 222078, "epoch": 1835} {"train_loss": -43.54269027709961, "global_step": 222079, "epoch": 1835} {"train_loss": -42.5751838684082, "global_step": 222080, "epoch": 1835} {"train_loss": -42.35862350463867, "global_step": 222081, "epoch": 1835} {"train_loss": -43.188720703125, "global_step": 222082, "epoch": 1835} {"train_loss": -43.23641586303711, "global_step": 222083, "epoch": 1835} {"train_loss": -43.28098678588867, "global_step": 222084, "epoch": 1835} {"train_loss": -43.24897766113281, "global_step": 222085, "epoch": 1835} {"train_loss": -42.7607536315918, "global_step": 222086, "epoch": 1835} {"train_loss": -42.403106689453125, "global_step": 222087, "epoch": 1835} {"train_loss": -42.663326263427734, "global_step": 222088, "epoch": 1835} {"train_loss": -42.99807357788086, "global_step": 222089, "epoch": 1835} {"train_loss": -42.7894287109375, "global_step": 222090, "epoch": 1835} {"train_loss": -41.47054672241211, "global_step": 222091, "epoch": 1835} {"train_loss": -42.13303756713867, "global_step": 222092, "epoch": 1835} {"train_loss": -43.591278076171875, "global_step": 222093, "epoch": 1835} {"train_loss": -41.58005905151367, "global_step": 222094, "epoch": 1835} {"train_loss": -43.24169921875, "global_step": 222095, "epoch": 1835} {"train_loss": -42.122066497802734, "global_step": 222096, "epoch": 1835} {"train_loss": -42.9604606628418, "global_step": 222097, "epoch": 1835} {"train_loss": -43.06504821777344, "global_step": 222098, "epoch": 1835} {"train_loss": -42.99724578857422, "global_step": 222099, "epoch": 1835} {"train_loss": -42.84298324584961, "global_step": 222100, "epoch": 1835} {"train_loss": -43.05918502807617, "global_step": 222101, "epoch": 1835} {"train_loss": -42.94002151489258, "global_step": 222102, "epoch": 1835} {"train_loss": -42.28884506225586, "global_step": 222103, "epoch": 1835} {"train_loss": -43.37744140625, "global_step": 222104, "epoch": 1835} {"train_loss": -43.14323043823242, "global_step": 222105, "epoch": 1835} {"train_loss": -42.86530685424805, "global_step": 222106, "epoch": 1835} {"train_loss": -42.085716247558594, "global_step": 222107, "epoch": 1835} {"train_loss": -41.47390365600586, "global_step": 222108, "epoch": 1835} {"train_loss": -42.42118453979492, "global_step": 222109, "epoch": 1835} {"train_loss": -43.059844970703125, "global_step": 222110, "epoch": 1835} {"train_loss": -41.613685607910156, "global_step": 222111, "epoch": 1835} {"train_loss": -40.69887924194336, "global_step": 222112, "epoch": 1835} {"train_loss": -41.92451477050781, "global_step": 222113, "epoch": 1835} {"train_loss": -40.706172943115234, "global_step": 222114, "epoch": 1835} {"train_loss": -41.691192626953125, "global_step": 222115, "epoch": 1835} {"train_loss": -41.252750396728516, "global_step": 222116, "epoch": 1835} {"train_loss": -42.04815673828125, "global_step": 222117, "epoch": 1835} {"train_loss": -41.450618743896484, "global_step": 222118, "epoch": 1835} {"train_loss": -40.67945098876953, "global_step": 222119, "epoch": 1835} {"train_loss": -42.32859420776367, "global_step": 222120, "epoch": 1835} {"train_loss": -41.21242904663086, "global_step": 222121, "epoch": 1835} {"train_loss": -41.441864013671875, "global_step": 222122, "epoch": 1835} {"train_loss": -41.85920715332031, "global_step": 222123, "epoch": 1835} {"train_loss": -41.55971908569336, "global_step": 222124, "epoch": 1835} {"train_loss": -41.57048797607422, "global_step": 222125, "epoch": 1835} {"train_loss": -41.891475677490234, "global_step": 222126, "epoch": 1835} {"train_loss": -41.90847396850586, "global_step": 222127, "epoch": 1835} {"train_loss": -42.741268157958984, "global_step": 222128, "epoch": 1835} {"train_loss": -42.30234146118164, "global_step": 222129, "epoch": 1835} {"train_loss": -43.13054275512695, "global_step": 222130, "epoch": 1835} {"train_loss": -42.82513427734375, "global_step": 222131, "epoch": 1835} {"train_loss": -42.798458099365234, "global_step": 222132, "epoch": 1835} {"train_loss": -41.990699768066406, "global_step": 222133, "epoch": 1835} {"train_loss": -42.36031723022461, "global_step": 222134, "epoch": 1835} {"train_loss": -42.91457748413086, "global_step": 222135, "epoch": 1835} {"train_loss": -42.76129150390625, "global_step": 222136, "epoch": 1835} {"train_loss": -43.20234298706055, "global_step": 222137, "epoch": 1835} {"train_loss": -42.3874626159668, "global_step": 222138, "epoch": 1835} {"train_loss": -42.53107833862305, "global_step": 222139, "epoch": 1835} {"train_loss": -43.336483001708984, "global_step": 222140, "epoch": 1835} {"train_loss": -42.86959457397461, "global_step": 222141, "epoch": 1835} {"train_loss": -42.9771728515625, "global_step": 222142, "epoch": 1835} {"train_loss": -43.284339904785156, "global_step": 222143, "epoch": 1835} {"train_loss": -42.320594787597656, "global_step": 222144, "epoch": 1835} {"train_loss": -43.098751068115234, "global_step": 222145, "epoch": 1835} {"train_loss": -42.56715774536133, "global_step": 222146, "epoch": 1835} {"train_loss": -41.76356506347656, "global_step": 222147, "epoch": 1835} {"train_loss": -42.81816101074219, "global_step": 222148, "epoch": 1835} {"train_loss": -40.93210983276367, "global_step": 222149, "epoch": 1835} {"train_loss": -42.0619010925293, "global_step": 222150, "epoch": 1835} {"train_loss": -41.852230072021484, "global_step": 222151, "epoch": 1835} {"train_loss": -40.58498001098633, "global_step": 222152, "epoch": 1835} {"train_loss": -42.48756408691406, "global_step": 222153, "epoch": 1835} {"train_loss": -40.8000602722168, "global_step": 222154, "epoch": 1835} {"train_loss": -42.19248946639132, "global_step": 222155, "epoch": 1835, "val_loss": 2569623.75} {"train_loss": -40.1850471496582, "global_step": 222156, "epoch": 1836} {"train_loss": -42.987335205078125, "global_step": 222157, "epoch": 1836} {"train_loss": -41.748409271240234, "global_step": 222158, "epoch": 1836} {"train_loss": -42.5274772644043, "global_step": 222159, "epoch": 1836} {"train_loss": -41.64052200317383, "global_step": 222160, "epoch": 1836} {"train_loss": -42.519317626953125, "global_step": 222161, "epoch": 1836} {"train_loss": -40.56379699707031, "global_step": 222162, "epoch": 1836} {"train_loss": -42.705440521240234, "global_step": 222163, "epoch": 1836} {"train_loss": -41.98348617553711, "global_step": 222164, "epoch": 1836} {"train_loss": -42.7315673828125, "global_step": 222165, "epoch": 1836} {"train_loss": -42.255977630615234, "global_step": 222166, "epoch": 1836} {"train_loss": -42.77372360229492, "global_step": 222167, "epoch": 1836} {"train_loss": -42.76505661010742, "global_step": 222168, "epoch": 1836} {"train_loss": -42.18976974487305, "global_step": 222169, "epoch": 1836} {"train_loss": -43.018402099609375, "global_step": 222170, "epoch": 1836} {"train_loss": -42.7353630065918, "global_step": 222171, "epoch": 1836} {"train_loss": -42.37276840209961, "global_step": 222172, "epoch": 1836} {"train_loss": -42.68696975708008, "global_step": 222173, "epoch": 1836} {"train_loss": -41.83415222167969, "global_step": 222174, "epoch": 1836} {"train_loss": -42.82538986206055, "global_step": 222175, "epoch": 1836} {"train_loss": -42.33954620361328, "global_step": 222176, "epoch": 1836} {"train_loss": -42.64522933959961, "global_step": 222177, "epoch": 1836} {"train_loss": -41.920501708984375, "global_step": 222178, "epoch": 1836} {"train_loss": -42.9787483215332, "global_step": 222179, "epoch": 1836} {"train_loss": -42.88339614868164, "global_step": 222180, "epoch": 1836} {"train_loss": -41.901344299316406, "global_step": 222181, "epoch": 1836} {"train_loss": -43.13842010498047, "global_step": 222182, "epoch": 1836} {"train_loss": -42.26375961303711, "global_step": 222183, "epoch": 1836} {"train_loss": -41.81088638305664, "global_step": 222184, "epoch": 1836} {"train_loss": -42.2074089050293, "global_step": 222185, "epoch": 1836} {"train_loss": -42.388816833496094, "global_step": 222186, "epoch": 1836} {"train_loss": -42.992034912109375, "global_step": 222187, "epoch": 1836} {"train_loss": -43.58610153198242, "global_step": 222188, "epoch": 1836} {"train_loss": -43.1756591796875, "global_step": 222189, "epoch": 1836} {"train_loss": -42.790802001953125, "global_step": 222190, "epoch": 1836} {"train_loss": -41.90271759033203, "global_step": 222191, "epoch": 1836} {"train_loss": -42.29706954956055, "global_step": 222192, "epoch": 1836} {"train_loss": -40.501522064208984, "global_step": 222193, "epoch": 1836} {"train_loss": -42.95533752441406, "global_step": 222194, "epoch": 1836} {"train_loss": -43.04349899291992, "global_step": 222195, "epoch": 1836} {"train_loss": -42.82969284057617, "global_step": 222196, "epoch": 1836} {"train_loss": -42.41694259643555, "global_step": 222197, "epoch": 1836} {"train_loss": -42.08121871948242, "global_step": 222198, "epoch": 1836} {"train_loss": -42.81999206542969, "global_step": 222199, "epoch": 1836} {"train_loss": -43.01618576049805, "global_step": 222200, "epoch": 1836} {"train_loss": -43.06978988647461, "global_step": 222201, "epoch": 1836} {"train_loss": -42.92376708984375, "global_step": 222202, "epoch": 1836} {"train_loss": -43.153079986572266, "global_step": 222203, "epoch": 1836} {"train_loss": -43.384681701660156, "global_step": 222204, "epoch": 1836} {"train_loss": -43.244422912597656, "global_step": 222205, "epoch": 1836} {"train_loss": -43.808753967285156, "global_step": 222206, "epoch": 1836} {"train_loss": -43.1715202331543, "global_step": 222207, "epoch": 1836} {"train_loss": -43.0205192565918, "global_step": 222208, "epoch": 1836} {"train_loss": -43.55888366699219, "global_step": 222209, "epoch": 1836} {"train_loss": -43.13188934326172, "global_step": 222210, "epoch": 1836} {"train_loss": -43.683631896972656, "global_step": 222211, "epoch": 1836} {"train_loss": -43.295265197753906, "global_step": 222212, "epoch": 1836} {"train_loss": -42.99219512939453, "global_step": 222213, "epoch": 1836} {"train_loss": -43.75654220581055, "global_step": 222214, "epoch": 1836} {"train_loss": -43.415504455566406, "global_step": 222215, "epoch": 1836} {"train_loss": -43.60652542114258, "global_step": 222216, "epoch": 1836} {"train_loss": -43.63479995727539, "global_step": 222217, "epoch": 1836} {"train_loss": -43.71169662475586, "global_step": 222218, "epoch": 1836} {"train_loss": -43.38351058959961, "global_step": 222219, "epoch": 1836} {"train_loss": -43.201194763183594, "global_step": 222220, "epoch": 1836} {"train_loss": -43.62989807128906, "global_step": 222221, "epoch": 1836} {"train_loss": -43.01069259643555, "global_step": 222222, "epoch": 1836} {"train_loss": -43.901885986328125, "global_step": 222223, "epoch": 1836} {"train_loss": -43.6629524230957, "global_step": 222224, "epoch": 1836} {"train_loss": -42.524810791015625, "global_step": 222225, "epoch": 1836} {"train_loss": -43.262611389160156, "global_step": 222226, "epoch": 1836} {"train_loss": -42.625186920166016, "global_step": 222227, "epoch": 1836} {"train_loss": -43.1409797668457, "global_step": 222228, "epoch": 1836} {"train_loss": -42.56827163696289, "global_step": 222229, "epoch": 1836} {"train_loss": -42.94208908081055, "global_step": 222230, "epoch": 1836} {"train_loss": -43.599037170410156, "global_step": 222231, "epoch": 1836} {"train_loss": -43.63215637207031, "global_step": 222232, "epoch": 1836} {"train_loss": -43.17499542236328, "global_step": 222233, "epoch": 1836} {"train_loss": -42.42206954956055, "global_step": 222234, "epoch": 1836} {"train_loss": -42.17950439453125, "global_step": 222235, "epoch": 1836} {"train_loss": -42.68415451049805, "global_step": 222236, "epoch": 1836} {"train_loss": -43.34340286254883, "global_step": 222237, "epoch": 1836} {"train_loss": -42.35580825805664, "global_step": 222238, "epoch": 1836} {"train_loss": -43.414283752441406, "global_step": 222239, "epoch": 1836} {"train_loss": -42.10106658935547, "global_step": 222240, "epoch": 1836} {"train_loss": -39.73456954956055, "global_step": 222241, "epoch": 1836} {"train_loss": -41.30373764038086, "global_step": 222242, "epoch": 1836} {"train_loss": -43.44581985473633, "global_step": 222243, "epoch": 1836} {"train_loss": -41.329429626464844, "global_step": 222244, "epoch": 1836} {"train_loss": -39.74018478393555, "global_step": 222245, "epoch": 1836} {"train_loss": -43.337257385253906, "global_step": 222246, "epoch": 1836} {"train_loss": -39.919593811035156, "global_step": 222247, "epoch": 1836} {"train_loss": -37.352256774902344, "global_step": 222248, "epoch": 1836} {"train_loss": -36.28615951538086, "global_step": 222249, "epoch": 1836} {"train_loss": -32.6234016418457, "global_step": 222250, "epoch": 1836} {"train_loss": -36.96918869018555, "global_step": 222251, "epoch": 1836} {"train_loss": -38.00432205200195, "global_step": 222252, "epoch": 1836} {"train_loss": -34.56163024902344, "global_step": 222253, "epoch": 1836} {"train_loss": -40.25936508178711, "global_step": 222254, "epoch": 1836} {"train_loss": -37.24654006958008, "global_step": 222255, "epoch": 1836} {"train_loss": -39.61432647705078, "global_step": 222256, "epoch": 1836} {"train_loss": -39.157325744628906, "global_step": 222257, "epoch": 1836} {"train_loss": -38.795143127441406, "global_step": 222258, "epoch": 1836} {"train_loss": -37.98768615722656, "global_step": 222259, "epoch": 1836} {"train_loss": -39.135860443115234, "global_step": 222260, "epoch": 1836} {"train_loss": -37.75874328613281, "global_step": 222261, "epoch": 1836} {"train_loss": -40.04891586303711, "global_step": 222262, "epoch": 1836} {"train_loss": -38.25880813598633, "global_step": 222263, "epoch": 1836} {"train_loss": -36.93726348876953, "global_step": 222264, "epoch": 1836} {"train_loss": -42.16819763183594, "global_step": 222265, "epoch": 1836} {"train_loss": -39.46149826049805, "global_step": 222266, "epoch": 1836} {"train_loss": -38.78166198730469, "global_step": 222267, "epoch": 1836} {"train_loss": -41.34911346435547, "global_step": 222268, "epoch": 1836} {"train_loss": -38.26557159423828, "global_step": 222269, "epoch": 1836} {"train_loss": -36.80915451049805, "global_step": 222270, "epoch": 1836} {"train_loss": -40.735172271728516, "global_step": 222271, "epoch": 1836} {"train_loss": -39.96562957763672, "global_step": 222272, "epoch": 1836} {"train_loss": -39.07616424560547, "global_step": 222273, "epoch": 1836} {"train_loss": -39.411102294921875, "global_step": 222274, "epoch": 1836} {"train_loss": -40.65900421142578, "global_step": 222275, "epoch": 1836} {"train_loss": -41.67451082970485, "global_step": 222276, "epoch": 1836, "val_loss": 2626552.0} {"train_loss": -41.042205810546875, "global_step": 222277, "epoch": 1837} {"train_loss": -40.78218460083008, "global_step": 222278, "epoch": 1837} {"train_loss": -40.41666793823242, "global_step": 222279, "epoch": 1837} {"train_loss": -41.516510009765625, "global_step": 222280, "epoch": 1837} {"train_loss": -41.26406478881836, "global_step": 222281, "epoch": 1837} {"train_loss": -41.49314498901367, "global_step": 222282, "epoch": 1837} {"train_loss": -41.020416259765625, "global_step": 222283, "epoch": 1837} {"train_loss": -41.73631286621094, "global_step": 222284, "epoch": 1837} {"train_loss": -41.74135208129883, "global_step": 222285, "epoch": 1837} {"train_loss": -42.23309326171875, "global_step": 222286, "epoch": 1837} {"train_loss": -41.499427795410156, "global_step": 222287, "epoch": 1837} {"train_loss": -42.170570373535156, "global_step": 222288, "epoch": 1837} {"train_loss": -42.58208084106445, "global_step": 222289, "epoch": 1837} {"train_loss": -42.22703170776367, "global_step": 222290, "epoch": 1837} {"train_loss": -42.09193801879883, "global_step": 222291, "epoch": 1837} {"train_loss": -42.54288864135742, "global_step": 222292, "epoch": 1837} {"train_loss": -42.457420349121094, "global_step": 222293, "epoch": 1837} {"train_loss": -42.65961456298828, "global_step": 222294, "epoch": 1837} {"train_loss": -42.62150573730469, "global_step": 222295, "epoch": 1837} {"train_loss": -42.5546989440918, "global_step": 222296, "epoch": 1837} {"train_loss": -42.84794235229492, "global_step": 222297, "epoch": 1837} {"train_loss": -42.514949798583984, "global_step": 222298, "epoch": 1837} {"train_loss": -42.659088134765625, "global_step": 222299, "epoch": 1837} {"train_loss": -42.38918685913086, "global_step": 222300, "epoch": 1837} {"train_loss": -43.00423049926758, "global_step": 222301, "epoch": 1837} {"train_loss": -42.49631881713867, "global_step": 222302, "epoch": 1837} {"train_loss": -43.11920166015625, "global_step": 222303, "epoch": 1837} {"train_loss": -42.768280029296875, "global_step": 222304, "epoch": 1837} {"train_loss": -43.19606399536133, "global_step": 222305, "epoch": 1837} {"train_loss": -42.54348373413086, "global_step": 222306, "epoch": 1837} {"train_loss": -42.270198822021484, "global_step": 222307, "epoch": 1837} {"train_loss": -43.44862365722656, "global_step": 222308, "epoch": 1837} {"train_loss": -43.330902099609375, "global_step": 222309, "epoch": 1837} {"train_loss": -42.932315826416016, "global_step": 222310, "epoch": 1837} {"train_loss": -43.15993881225586, "global_step": 222311, "epoch": 1837} {"train_loss": -43.06831359863281, "global_step": 222312, "epoch": 1837} {"train_loss": -43.55149459838867, "global_step": 222313, "epoch": 1837} {"train_loss": -43.18324661254883, "global_step": 222314, "epoch": 1837} {"train_loss": -43.16645050048828, "global_step": 222315, "epoch": 1837} {"train_loss": -42.322383880615234, "global_step": 222316, "epoch": 1837} {"train_loss": -43.75847244262695, "global_step": 222317, "epoch": 1837} {"train_loss": -43.438724517822266, "global_step": 222318, "epoch": 1837} {"train_loss": -42.80986404418945, "global_step": 222319, "epoch": 1837} {"train_loss": -43.38741683959961, "global_step": 222320, "epoch": 1837} {"train_loss": -43.305233001708984, "global_step": 222321, "epoch": 1837} {"train_loss": -43.2927360534668, "global_step": 222322, "epoch": 1837} {"train_loss": -43.28557586669922, "global_step": 222323, "epoch": 1837} {"train_loss": -43.01422882080078, "global_step": 222324, "epoch": 1837} {"train_loss": -43.640289306640625, "global_step": 222325, "epoch": 1837} {"train_loss": -42.94215393066406, "global_step": 222326, "epoch": 1837} {"train_loss": -43.2506217956543, "global_step": 222327, "epoch": 1837} {"train_loss": -43.48482131958008, "global_step": 222328, "epoch": 1837} {"train_loss": -43.86471176147461, "global_step": 222329, "epoch": 1837} {"train_loss": -42.35737991333008, "global_step": 222330, "epoch": 1837} {"train_loss": -43.172447204589844, "global_step": 222331, "epoch": 1837} {"train_loss": -43.80353927612305, "global_step": 222332, "epoch": 1837} {"train_loss": -43.00259017944336, "global_step": 222333, "epoch": 1837} {"train_loss": -43.48159408569336, "global_step": 222334, "epoch": 1837} {"train_loss": -43.576107025146484, "global_step": 222335, "epoch": 1837} {"train_loss": -42.875553131103516, "global_step": 222336, "epoch": 1837} {"train_loss": -42.673492431640625, "global_step": 222337, "epoch": 1837} {"train_loss": -42.32664489746094, "global_step": 222338, "epoch": 1837} {"train_loss": -43.1694450378418, "global_step": 222339, "epoch": 1837} {"train_loss": -43.98720169067383, "global_step": 222340, "epoch": 1837} {"train_loss": -43.21689987182617, "global_step": 222341, "epoch": 1837} {"train_loss": -40.950618743896484, "global_step": 222342, "epoch": 1837} {"train_loss": -39.39590072631836, "global_step": 222343, "epoch": 1837} {"train_loss": -42.401092529296875, "global_step": 222344, "epoch": 1837} {"train_loss": -42.54450225830078, "global_step": 222345, "epoch": 1837} {"train_loss": -39.704864501953125, "global_step": 222346, "epoch": 1837} {"train_loss": -43.17106246948242, "global_step": 222347, "epoch": 1837} {"train_loss": -39.98029327392578, "global_step": 222348, "epoch": 1837} {"train_loss": -41.05678176879883, "global_step": 222349, "epoch": 1837} {"train_loss": -42.826290130615234, "global_step": 222350, "epoch": 1837} {"train_loss": -41.52944564819336, "global_step": 222351, "epoch": 1837} {"train_loss": -40.748233795166016, "global_step": 222352, "epoch": 1837} {"train_loss": -41.285240173339844, "global_step": 222353, "epoch": 1837} {"train_loss": -42.06427001953125, "global_step": 222354, "epoch": 1837} {"train_loss": -39.89560317993164, "global_step": 222355, "epoch": 1837} {"train_loss": -41.58441162109375, "global_step": 222356, "epoch": 1837} {"train_loss": -42.0718994140625, "global_step": 222357, "epoch": 1837} {"train_loss": -42.044158935546875, "global_step": 222358, "epoch": 1837} {"train_loss": -42.226192474365234, "global_step": 222359, "epoch": 1837} {"train_loss": -41.828548431396484, "global_step": 222360, "epoch": 1837} {"train_loss": -41.89215850830078, "global_step": 222361, "epoch": 1837} {"train_loss": -41.86115264892578, "global_step": 222362, "epoch": 1837} {"train_loss": -41.57325744628906, "global_step": 222363, "epoch": 1837} {"train_loss": -41.7066764831543, "global_step": 222364, "epoch": 1837} {"train_loss": -41.140926361083984, "global_step": 222365, "epoch": 1837} {"train_loss": -41.99258041381836, "global_step": 222366, "epoch": 1837} {"train_loss": -41.52836608886719, "global_step": 222367, "epoch": 1837} {"train_loss": -39.83888626098633, "global_step": 222368, "epoch": 1837} {"train_loss": -40.80039596557617, "global_step": 222369, "epoch": 1837} {"train_loss": -39.80031967163086, "global_step": 222370, "epoch": 1837} {"train_loss": -40.60536575317383, "global_step": 222371, "epoch": 1837} {"train_loss": -41.6011962890625, "global_step": 222372, "epoch": 1837} {"train_loss": -40.87685012817383, "global_step": 222373, "epoch": 1837} {"train_loss": -42.548274993896484, "global_step": 222374, "epoch": 1837} {"train_loss": -40.37800979614258, "global_step": 222375, "epoch": 1837} {"train_loss": -39.64338302612305, "global_step": 222376, "epoch": 1837} {"train_loss": -38.624507904052734, "global_step": 222377, "epoch": 1837} {"train_loss": -37.1417121887207, "global_step": 222378, "epoch": 1837} {"train_loss": -40.12156295776367, "global_step": 222379, "epoch": 1837} {"train_loss": -41.872554779052734, "global_step": 222380, "epoch": 1837} {"train_loss": -38.05875778198242, "global_step": 222381, "epoch": 1837} {"train_loss": -40.458580017089844, "global_step": 222382, "epoch": 1837} {"train_loss": -36.6341438293457, "global_step": 222383, "epoch": 1837} {"train_loss": -40.34861373901367, "global_step": 222384, "epoch": 1837} {"train_loss": -36.80177688598633, "global_step": 222385, "epoch": 1837} {"train_loss": -37.366512298583984, "global_step": 222386, "epoch": 1837} {"train_loss": -30.022674560546875, "global_step": 222387, "epoch": 1837} {"train_loss": -38.070064544677734, "global_step": 222388, "epoch": 1837} {"train_loss": -38.302982330322266, "global_step": 222389, "epoch": 1837} {"train_loss": -39.477779388427734, "global_step": 222390, "epoch": 1837} {"train_loss": -37.37665557861328, "global_step": 222391, "epoch": 1837} {"train_loss": -36.53631591796875, "global_step": 222392, "epoch": 1837} {"train_loss": -36.59675216674805, "global_step": 222393, "epoch": 1837} {"train_loss": -37.04037094116211, "global_step": 222394, "epoch": 1837} {"train_loss": -37.555362701416016, "global_step": 222395, "epoch": 1837} {"train_loss": -38.82367706298828, "global_step": 222396, "epoch": 1837} {"train_loss": -41.473348727896195, "global_step": 222397, "epoch": 1837, "val_loss": 3011256.0} {"train_loss": -38.72584915161133, "global_step": 222398, "epoch": 1838} {"train_loss": -37.571895599365234, "global_step": 222399, "epoch": 1838} {"train_loss": -37.264156341552734, "global_step": 222400, "epoch": 1838} {"train_loss": -39.452789306640625, "global_step": 222401, "epoch": 1838} {"train_loss": -40.04365158081055, "global_step": 222402, "epoch": 1838} {"train_loss": -37.799251556396484, "global_step": 222403, "epoch": 1838} {"train_loss": -35.67852020263672, "global_step": 222404, "epoch": 1838} {"train_loss": -37.30615234375, "global_step": 222405, "epoch": 1838} {"train_loss": -36.37506866455078, "global_step": 222406, "epoch": 1838} {"train_loss": -37.13214874267578, "global_step": 222407, "epoch": 1838} {"train_loss": -38.4306640625, "global_step": 222408, "epoch": 1838} {"train_loss": -38.509803771972656, "global_step": 222409, "epoch": 1838} {"train_loss": -38.398597717285156, "global_step": 222410, "epoch": 1838} {"train_loss": -40.14541244506836, "global_step": 222411, "epoch": 1838} {"train_loss": -41.174617767333984, "global_step": 222412, "epoch": 1838} {"train_loss": -40.08095932006836, "global_step": 222413, "epoch": 1838} {"train_loss": -37.446624755859375, "global_step": 222414, "epoch": 1838} {"train_loss": -39.05381393432617, "global_step": 222415, "epoch": 1838} {"train_loss": -38.73627853393555, "global_step": 222416, "epoch": 1838} {"train_loss": -39.07453155517578, "global_step": 222417, "epoch": 1838} {"train_loss": -40.93717575073242, "global_step": 222418, "epoch": 1838} {"train_loss": -39.380367279052734, "global_step": 222419, "epoch": 1838} {"train_loss": -39.12446212768555, "global_step": 222420, "epoch": 1838} {"train_loss": -37.54973602294922, "global_step": 222421, "epoch": 1838} {"train_loss": -41.211708068847656, "global_step": 222422, "epoch": 1838} {"train_loss": -40.07802963256836, "global_step": 222423, "epoch": 1838} {"train_loss": -40.89213943481445, "global_step": 222424, "epoch": 1838} {"train_loss": -41.05202865600586, "global_step": 222425, "epoch": 1838} {"train_loss": -41.16010665893555, "global_step": 222426, "epoch": 1838} {"train_loss": -40.34638977050781, "global_step": 222427, "epoch": 1838} {"train_loss": -39.79220199584961, "global_step": 222428, "epoch": 1838} {"train_loss": -40.061832427978516, "global_step": 222429, "epoch": 1838} {"train_loss": -41.17971420288086, "global_step": 222430, "epoch": 1838} {"train_loss": -40.82453536987305, "global_step": 222431, "epoch": 1838} {"train_loss": -41.23444366455078, "global_step": 222432, "epoch": 1838} {"train_loss": -41.4483757019043, "global_step": 222433, "epoch": 1838} {"train_loss": -41.45023727416992, "global_step": 222434, "epoch": 1838} {"train_loss": -41.01227569580078, "global_step": 222435, "epoch": 1838} {"train_loss": -41.64805221557617, "global_step": 222436, "epoch": 1838} {"train_loss": -41.1218376159668, "global_step": 222437, "epoch": 1838} {"train_loss": -40.875240325927734, "global_step": 222438, "epoch": 1838} {"train_loss": -41.719058990478516, "global_step": 222439, "epoch": 1838} {"train_loss": -41.33830642700195, "global_step": 222440, "epoch": 1838} {"train_loss": -41.153018951416016, "global_step": 222441, "epoch": 1838} {"train_loss": -41.7557373046875, "global_step": 222442, "epoch": 1838} {"train_loss": -41.66231918334961, "global_step": 222443, "epoch": 1838} {"train_loss": -41.475032806396484, "global_step": 222444, "epoch": 1838} {"train_loss": -42.44929885864258, "global_step": 222445, "epoch": 1838} {"train_loss": -41.25271224975586, "global_step": 222446, "epoch": 1838} {"train_loss": -40.76799011230469, "global_step": 222447, "epoch": 1838} {"train_loss": -41.298519134521484, "global_step": 222448, "epoch": 1838} {"train_loss": -41.1550407409668, "global_step": 222449, "epoch": 1838} {"train_loss": -41.94791030883789, "global_step": 222450, "epoch": 1838} {"train_loss": -41.4841194152832, "global_step": 222451, "epoch": 1838} {"train_loss": -42.2875862121582, "global_step": 222452, "epoch": 1838} {"train_loss": -42.37546920776367, "global_step": 222453, "epoch": 1838} {"train_loss": -41.758235931396484, "global_step": 222454, "epoch": 1838} {"train_loss": -41.64915466308594, "global_step": 222455, "epoch": 1838} {"train_loss": -41.61689376831055, "global_step": 222456, "epoch": 1838} {"train_loss": -42.25053787231445, "global_step": 222457, "epoch": 1838} {"train_loss": -42.055843353271484, "global_step": 222458, "epoch": 1838} {"train_loss": -41.437713623046875, "global_step": 222459, "epoch": 1838} {"train_loss": -42.343650817871094, "global_step": 222460, "epoch": 1838} {"train_loss": -40.20497512817383, "global_step": 222461, "epoch": 1838} {"train_loss": -41.68330383300781, "global_step": 222462, "epoch": 1838} {"train_loss": -42.2850456237793, "global_step": 222463, "epoch": 1838} {"train_loss": -41.58393478393555, "global_step": 222464, "epoch": 1838} {"train_loss": -41.189308166503906, "global_step": 222465, "epoch": 1838} {"train_loss": -43.142066955566406, "global_step": 222466, "epoch": 1838} {"train_loss": -41.7545280456543, "global_step": 222467, "epoch": 1838} {"train_loss": -41.884300231933594, "global_step": 222468, "epoch": 1838} {"train_loss": -42.6715202331543, "global_step": 222469, "epoch": 1838} {"train_loss": -41.684364318847656, "global_step": 222470, "epoch": 1838} {"train_loss": -42.12025833129883, "global_step": 222471, "epoch": 1838} {"train_loss": -42.12457275390625, "global_step": 222472, "epoch": 1838} {"train_loss": -41.572181701660156, "global_step": 222473, "epoch": 1838} {"train_loss": -42.70492935180664, "global_step": 222474, "epoch": 1838} {"train_loss": -42.783233642578125, "global_step": 222475, "epoch": 1838} {"train_loss": -41.745548248291016, "global_step": 222476, "epoch": 1838} {"train_loss": -42.80535888671875, "global_step": 222477, "epoch": 1838} {"train_loss": -41.63102340698242, "global_step": 222478, "epoch": 1838} {"train_loss": -41.764225006103516, "global_step": 222479, "epoch": 1838} {"train_loss": -42.60152816772461, "global_step": 222480, "epoch": 1838} {"train_loss": -42.424964904785156, "global_step": 222481, "epoch": 1838} {"train_loss": -42.11442184448242, "global_step": 222482, "epoch": 1838} {"train_loss": -42.58474349975586, "global_step": 222483, "epoch": 1838} {"train_loss": -41.9353141784668, "global_step": 222484, "epoch": 1838} {"train_loss": -42.94318771362305, "global_step": 222485, "epoch": 1838} {"train_loss": -42.222225189208984, "global_step": 222486, "epoch": 1838} {"train_loss": -42.18205642700195, "global_step": 222487, "epoch": 1838} {"train_loss": -42.00625228881836, "global_step": 222488, "epoch": 1838} {"train_loss": -42.5661506652832, "global_step": 222489, "epoch": 1838} {"train_loss": -40.91951370239258, "global_step": 222490, "epoch": 1838} {"train_loss": -41.56045150756836, "global_step": 222491, "epoch": 1838} {"train_loss": -41.895565032958984, "global_step": 222492, "epoch": 1838} {"train_loss": -42.168975830078125, "global_step": 222493, "epoch": 1838} {"train_loss": -42.09862518310547, "global_step": 222494, "epoch": 1838} {"train_loss": -42.29931640625, "global_step": 222495, "epoch": 1838} {"train_loss": -41.90774154663086, "global_step": 222496, "epoch": 1838} {"train_loss": -41.4650764465332, "global_step": 222497, "epoch": 1838} {"train_loss": -42.76294708251953, "global_step": 222498, "epoch": 1838} {"train_loss": -42.520179748535156, "global_step": 222499, "epoch": 1838} {"train_loss": -41.24156951904297, "global_step": 222500, "epoch": 1838} {"train_loss": -43.02587890625, "global_step": 222501, "epoch": 1838} {"train_loss": -42.55518341064453, "global_step": 222502, "epoch": 1838} {"train_loss": -41.572505950927734, "global_step": 222503, "epoch": 1838} {"train_loss": -42.417816162109375, "global_step": 222504, "epoch": 1838} {"train_loss": -42.469364166259766, "global_step": 222505, "epoch": 1838} {"train_loss": -41.336368560791016, "global_step": 222506, "epoch": 1838} {"train_loss": -41.8867073059082, "global_step": 222507, "epoch": 1838} {"train_loss": -42.130470275878906, "global_step": 222508, "epoch": 1838} {"train_loss": -42.201141357421875, "global_step": 222509, "epoch": 1838} {"train_loss": -41.75181198120117, "global_step": 222510, "epoch": 1838} {"train_loss": -42.091461181640625, "global_step": 222511, "epoch": 1838} {"train_loss": -42.03006362915039, "global_step": 222512, "epoch": 1838} {"train_loss": -42.85758590698242, "global_step": 222513, "epoch": 1838} {"train_loss": -42.54718780517578, "global_step": 222514, "epoch": 1838} {"train_loss": -41.89018630981445, "global_step": 222515, "epoch": 1838} {"train_loss": -42.13578414916992, "global_step": 222516, "epoch": 1838} {"train_loss": -42.187522888183594, "global_step": 222517, "epoch": 1838} {"train_loss": -41.14753360590659, "global_step": 222518, "epoch": 1838, "val_loss": 2535659.0} {"train_loss": -42.13358688354492, "global_step": 222519, "epoch": 1839} {"train_loss": -41.548091888427734, "global_step": 222520, "epoch": 1839} {"train_loss": -42.366519927978516, "global_step": 222521, "epoch": 1839} {"train_loss": -41.72724533081055, "global_step": 222522, "epoch": 1839} {"train_loss": -41.223270416259766, "global_step": 222523, "epoch": 1839} {"train_loss": -42.783447265625, "global_step": 222524, "epoch": 1839} {"train_loss": -42.281272888183594, "global_step": 222525, "epoch": 1839} {"train_loss": -41.17741012573242, "global_step": 222526, "epoch": 1839} {"train_loss": -40.78451156616211, "global_step": 222527, "epoch": 1839} {"train_loss": -41.14432907104492, "global_step": 222528, "epoch": 1839} {"train_loss": -42.009422302246094, "global_step": 222529, "epoch": 1839} {"train_loss": -42.461669921875, "global_step": 222530, "epoch": 1839} {"train_loss": -41.24540328979492, "global_step": 222531, "epoch": 1839} {"train_loss": -41.20396041870117, "global_step": 222532, "epoch": 1839} {"train_loss": -42.61622619628906, "global_step": 222533, "epoch": 1839} {"train_loss": -41.926509857177734, "global_step": 222534, "epoch": 1839} {"train_loss": -42.17164993286133, "global_step": 222535, "epoch": 1839} {"train_loss": -41.60456085205078, "global_step": 222536, "epoch": 1839} {"train_loss": -40.73755645751953, "global_step": 222537, "epoch": 1839} {"train_loss": -43.06168746948242, "global_step": 222538, "epoch": 1839} {"train_loss": -41.7810173034668, "global_step": 222539, "epoch": 1839} {"train_loss": -40.54256057739258, "global_step": 222540, "epoch": 1839} {"train_loss": -42.38840103149414, "global_step": 222541, "epoch": 1839} {"train_loss": -42.9488410949707, "global_step": 222542, "epoch": 1839} {"train_loss": -42.35870361328125, "global_step": 222543, "epoch": 1839} {"train_loss": -41.608734130859375, "global_step": 222544, "epoch": 1839} {"train_loss": -42.543521881103516, "global_step": 222545, "epoch": 1839} {"train_loss": -42.67984390258789, "global_step": 222546, "epoch": 1839} {"train_loss": -42.69727325439453, "global_step": 222547, "epoch": 1839} {"train_loss": -42.839874267578125, "global_step": 222548, "epoch": 1839} {"train_loss": -43.26328659057617, "global_step": 222549, "epoch": 1839} {"train_loss": -42.75547409057617, "global_step": 222550, "epoch": 1839} {"train_loss": -42.491790771484375, "global_step": 222551, "epoch": 1839} {"train_loss": -42.7006950378418, "global_step": 222552, "epoch": 1839} {"train_loss": -42.596187591552734, "global_step": 222553, "epoch": 1839} {"train_loss": -42.87324142456055, "global_step": 222554, "epoch": 1839} {"train_loss": -41.83449172973633, "global_step": 222555, "epoch": 1839} {"train_loss": -42.2955207824707, "global_step": 222556, "epoch": 1839} {"train_loss": -42.53485870361328, "global_step": 222557, "epoch": 1839} {"train_loss": -41.26279830932617, "global_step": 222558, "epoch": 1839} {"train_loss": -42.13230514526367, "global_step": 222559, "epoch": 1839} {"train_loss": -42.328609466552734, "global_step": 222560, "epoch": 1839} {"train_loss": -41.35693359375, "global_step": 222561, "epoch": 1839} {"train_loss": -42.16736602783203, "global_step": 222562, "epoch": 1839} {"train_loss": -41.32731628417969, "global_step": 222563, "epoch": 1839} {"train_loss": -41.27126693725586, "global_step": 222564, "epoch": 1839} {"train_loss": -42.76840591430664, "global_step": 222565, "epoch": 1839} {"train_loss": -41.80532455444336, "global_step": 222566, "epoch": 1839} {"train_loss": -41.522457122802734, "global_step": 222567, "epoch": 1839} {"train_loss": -40.72161102294922, "global_step": 222568, "epoch": 1839} {"train_loss": -40.63393020629883, "global_step": 222569, "epoch": 1839} {"train_loss": -42.53737258911133, "global_step": 222570, "epoch": 1839} {"train_loss": -42.6347541809082, "global_step": 222571, "epoch": 1839} {"train_loss": -42.80892562866211, "global_step": 222572, "epoch": 1839} {"train_loss": -42.700679779052734, "global_step": 222573, "epoch": 1839} {"train_loss": -42.06026840209961, "global_step": 222574, "epoch": 1839} {"train_loss": -42.24392318725586, "global_step": 222575, "epoch": 1839} {"train_loss": -42.36558532714844, "global_step": 222576, "epoch": 1839} {"train_loss": -42.926876068115234, "global_step": 222577, "epoch": 1839} {"train_loss": -41.8568229675293, "global_step": 222578, "epoch": 1839} {"train_loss": -42.20956802368164, "global_step": 222579, "epoch": 1839} {"train_loss": -42.65829086303711, "global_step": 222580, "epoch": 1839} {"train_loss": -43.112552642822266, "global_step": 222581, "epoch": 1839} {"train_loss": -43.13069152832031, "global_step": 222582, "epoch": 1839} {"train_loss": -43.22386169433594, "global_step": 222583, "epoch": 1839} {"train_loss": -42.7027473449707, "global_step": 222584, "epoch": 1839} {"train_loss": -42.68015670776367, "global_step": 222585, "epoch": 1839} {"train_loss": -43.05112838745117, "global_step": 222586, "epoch": 1839} {"train_loss": -42.44725799560547, "global_step": 222587, "epoch": 1839} {"train_loss": -42.13032150268555, "global_step": 222588, "epoch": 1839} {"train_loss": -42.56379699707031, "global_step": 222589, "epoch": 1839} {"train_loss": -43.22007369995117, "global_step": 222590, "epoch": 1839} {"train_loss": -42.73828125, "global_step": 222591, "epoch": 1839} {"train_loss": -42.518165588378906, "global_step": 222592, "epoch": 1839} {"train_loss": -41.50431442260742, "global_step": 222593, "epoch": 1839} {"train_loss": -41.94175338745117, "global_step": 222594, "epoch": 1839} {"train_loss": -42.276573181152344, "global_step": 222595, "epoch": 1839} {"train_loss": -42.832305908203125, "global_step": 222596, "epoch": 1839} {"train_loss": -43.02888488769531, "global_step": 222597, "epoch": 1839} {"train_loss": -43.141265869140625, "global_step": 222598, "epoch": 1839} {"train_loss": -43.06303787231445, "global_step": 222599, "epoch": 1839} {"train_loss": -42.050960540771484, "global_step": 222600, "epoch": 1839} {"train_loss": -41.5913200378418, "global_step": 222601, "epoch": 1839} {"train_loss": -41.978370666503906, "global_step": 222602, "epoch": 1839} {"train_loss": -40.428001403808594, "global_step": 222603, "epoch": 1839} {"train_loss": -41.70200729370117, "global_step": 222604, "epoch": 1839} {"train_loss": -42.62812042236328, "global_step": 222605, "epoch": 1839} {"train_loss": -42.48710250854492, "global_step": 222606, "epoch": 1839} {"train_loss": -42.34710693359375, "global_step": 222607, "epoch": 1839} {"train_loss": -42.593841552734375, "global_step": 222608, "epoch": 1839} {"train_loss": -41.65922164916992, "global_step": 222609, "epoch": 1839} {"train_loss": -42.25373077392578, "global_step": 222610, "epoch": 1839} {"train_loss": -42.22843933105469, "global_step": 222611, "epoch": 1839} {"train_loss": -41.86739730834961, "global_step": 222612, "epoch": 1839} {"train_loss": -41.67755889892578, "global_step": 222613, "epoch": 1839} {"train_loss": -42.00673294067383, "global_step": 222614, "epoch": 1839} {"train_loss": -41.76762771606445, "global_step": 222615, "epoch": 1839} {"train_loss": -41.67009735107422, "global_step": 222616, "epoch": 1839} {"train_loss": -41.960506439208984, "global_step": 222617, "epoch": 1839} {"train_loss": -41.98140335083008, "global_step": 222618, "epoch": 1839} {"train_loss": -41.858665466308594, "global_step": 222619, "epoch": 1839} {"train_loss": -42.23645782470703, "global_step": 222620, "epoch": 1839} {"train_loss": -42.13948059082031, "global_step": 222621, "epoch": 1839} {"train_loss": -41.434852600097656, "global_step": 222622, "epoch": 1839} {"train_loss": -42.20103073120117, "global_step": 222623, "epoch": 1839} {"train_loss": -42.9374885559082, "global_step": 222624, "epoch": 1839} {"train_loss": -42.327186584472656, "global_step": 222625, "epoch": 1839} {"train_loss": -42.28131103515625, "global_step": 222626, "epoch": 1839} {"train_loss": -40.0609130859375, "global_step": 222627, "epoch": 1839} {"train_loss": -40.87326431274414, "global_step": 222628, "epoch": 1839} {"train_loss": -41.47565460205078, "global_step": 222629, "epoch": 1839} {"train_loss": -40.39160919189453, "global_step": 222630, "epoch": 1839} {"train_loss": -39.23595428466797, "global_step": 222631, "epoch": 1839} {"train_loss": -38.711116790771484, "global_step": 222632, "epoch": 1839} {"train_loss": -40.4197883605957, "global_step": 222633, "epoch": 1839} {"train_loss": -37.92463302612305, "global_step": 222634, "epoch": 1839} {"train_loss": -36.140296936035156, "global_step": 222635, "epoch": 1839} {"train_loss": -39.62583541870117, "global_step": 222636, "epoch": 1839} {"train_loss": -34.84126663208008, "global_step": 222637, "epoch": 1839} {"train_loss": -39.66054153442383, "global_step": 222638, "epoch": 1839} {"train_loss": -41.79935017104977, "global_step": 222639, "epoch": 1839, "val_loss": 2538123.0} {"train_loss": -42.607906341552734, "global_step": 222640, "epoch": 1840} {"train_loss": -36.651527404785156, "global_step": 222641, "epoch": 1840} {"train_loss": -37.513946533203125, "global_step": 222642, "epoch": 1840} {"train_loss": -39.68313217163086, "global_step": 222643, "epoch": 1840} {"train_loss": -39.24281692504883, "global_step": 222644, "epoch": 1840} {"train_loss": -38.630733489990234, "global_step": 222645, "epoch": 1840} {"train_loss": -41.72564697265625, "global_step": 222646, "epoch": 1840} {"train_loss": -38.601890563964844, "global_step": 222647, "epoch": 1840} {"train_loss": -40.632598876953125, "global_step": 222648, "epoch": 1840} {"train_loss": -41.334808349609375, "global_step": 222649, "epoch": 1840} {"train_loss": -39.484256744384766, "global_step": 222650, "epoch": 1840} {"train_loss": -41.065650939941406, "global_step": 222651, "epoch": 1840} {"train_loss": -39.67826461791992, "global_step": 222652, "epoch": 1840} {"train_loss": -40.36248779296875, "global_step": 222653, "epoch": 1840} {"train_loss": -39.37516403198242, "global_step": 222654, "epoch": 1840} {"train_loss": -41.05021286010742, "global_step": 222655, "epoch": 1840} {"train_loss": -41.73588180541992, "global_step": 222656, "epoch": 1840} {"train_loss": -41.722591400146484, "global_step": 222657, "epoch": 1840} {"train_loss": -41.1125373840332, "global_step": 222658, "epoch": 1840} {"train_loss": -42.08881378173828, "global_step": 222659, "epoch": 1840} {"train_loss": -42.443572998046875, "global_step": 222660, "epoch": 1840} {"train_loss": -41.55607986450195, "global_step": 222661, "epoch": 1840} {"train_loss": -42.185157775878906, "global_step": 222662, "epoch": 1840} {"train_loss": -41.904518127441406, "global_step": 222663, "epoch": 1840} {"train_loss": -41.9633903503418, "global_step": 222664, "epoch": 1840} {"train_loss": -42.46248245239258, "global_step": 222665, "epoch": 1840} {"train_loss": -41.90436935424805, "global_step": 222666, "epoch": 1840} {"train_loss": -42.4530143737793, "global_step": 222667, "epoch": 1840} {"train_loss": -42.19569396972656, "global_step": 222668, "epoch": 1840} {"train_loss": -42.62356185913086, "global_step": 222669, "epoch": 1840} {"train_loss": -42.75127410888672, "global_step": 222670, "epoch": 1840} {"train_loss": -42.41617965698242, "global_step": 222671, "epoch": 1840} {"train_loss": -42.64124298095703, "global_step": 222672, "epoch": 1840} {"train_loss": -42.42061233520508, "global_step": 222673, "epoch": 1840} {"train_loss": -42.83189392089844, "global_step": 222674, "epoch": 1840} {"train_loss": -42.75333786010742, "global_step": 222675, "epoch": 1840} {"train_loss": -42.072933197021484, "global_step": 222676, "epoch": 1840} {"train_loss": -42.557655334472656, "global_step": 222677, "epoch": 1840} {"train_loss": -43.08563232421875, "global_step": 222678, "epoch": 1840} {"train_loss": -43.07780456542969, "global_step": 222679, "epoch": 1840} {"train_loss": -42.43116760253906, "global_step": 222680, "epoch": 1840} {"train_loss": -42.39287185668945, "global_step": 222681, "epoch": 1840} {"train_loss": -43.113582611083984, "global_step": 222682, "epoch": 1840} {"train_loss": -41.1981315612793, "global_step": 222683, "epoch": 1840} {"train_loss": -41.14370346069336, "global_step": 222684, "epoch": 1840} {"train_loss": -43.031436920166016, "global_step": 222685, "epoch": 1840} {"train_loss": -42.06496047973633, "global_step": 222686, "epoch": 1840} {"train_loss": -42.14830780029297, "global_step": 222687, "epoch": 1840} {"train_loss": -42.506038665771484, "global_step": 222688, "epoch": 1840} {"train_loss": -42.65505599975586, "global_step": 222689, "epoch": 1840} {"train_loss": -41.79658126831055, "global_step": 222690, "epoch": 1840} {"train_loss": -42.65780258178711, "global_step": 222691, "epoch": 1840} {"train_loss": -42.41538619995117, "global_step": 222692, "epoch": 1840} {"train_loss": -42.11735916137695, "global_step": 222693, "epoch": 1840} {"train_loss": -42.682769775390625, "global_step": 222694, "epoch": 1840} {"train_loss": -42.55585861206055, "global_step": 222695, "epoch": 1840} {"train_loss": -42.26691818237305, "global_step": 222696, "epoch": 1840} {"train_loss": -42.43555450439453, "global_step": 222697, "epoch": 1840} {"train_loss": -41.8632926940918, "global_step": 222698, "epoch": 1840} {"train_loss": -40.48224639892578, "global_step": 222699, "epoch": 1840} {"train_loss": -37.51723861694336, "global_step": 222700, "epoch": 1840} {"train_loss": -39.80514144897461, "global_step": 222701, "epoch": 1840} {"train_loss": -33.96995162963867, "global_step": 222702, "epoch": 1840} {"train_loss": -21.701913833618164, "global_step": 222703, "epoch": 1840} {"train_loss": -31.2442684173584, "global_step": 222704, "epoch": 1840} {"train_loss": -28.347143173217773, "global_step": 222705, "epoch": 1840} {"train_loss": -33.62875747680664, "global_step": 222706, "epoch": 1840} {"train_loss": -25.32111167907715, "global_step": 222707, "epoch": 1840} {"train_loss": -34.55667495727539, "global_step": 222708, "epoch": 1840} {"train_loss": -28.97710609436035, "global_step": 222709, "epoch": 1840} {"train_loss": -33.27790451049805, "global_step": 222710, "epoch": 1840} {"train_loss": -33.811805725097656, "global_step": 222711, "epoch": 1840} {"train_loss": -32.1524658203125, "global_step": 222712, "epoch": 1840} {"train_loss": -34.594337463378906, "global_step": 222713, "epoch": 1840} {"train_loss": -34.38140869140625, "global_step": 222714, "epoch": 1840} {"train_loss": -33.2446403503418, "global_step": 222715, "epoch": 1840} {"train_loss": -35.31126022338867, "global_step": 222716, "epoch": 1840} {"train_loss": -35.39720153808594, "global_step": 222717, "epoch": 1840} {"train_loss": -34.5930290222168, "global_step": 222718, "epoch": 1840} {"train_loss": -35.283451080322266, "global_step": 222719, "epoch": 1840} {"train_loss": -36.18158721923828, "global_step": 222720, "epoch": 1840} {"train_loss": -34.958099365234375, "global_step": 222721, "epoch": 1840} {"train_loss": -35.4481086730957, "global_step": 222722, "epoch": 1840} {"train_loss": -35.76994705200195, "global_step": 222723, "epoch": 1840} {"train_loss": -36.02242660522461, "global_step": 222724, "epoch": 1840} {"train_loss": -36.1180419921875, "global_step": 222725, "epoch": 1840} {"train_loss": -35.90468215942383, "global_step": 222726, "epoch": 1840} {"train_loss": -36.23354721069336, "global_step": 222727, "epoch": 1840} {"train_loss": -37.12095642089844, "global_step": 222728, "epoch": 1840} {"train_loss": -36.70455551147461, "global_step": 222729, "epoch": 1840} {"train_loss": -37.83302688598633, "global_step": 222730, "epoch": 1840} {"train_loss": -36.86968994140625, "global_step": 222731, "epoch": 1840} {"train_loss": -36.592159271240234, "global_step": 222732, "epoch": 1840} {"train_loss": -36.88724899291992, "global_step": 222733, "epoch": 1840} {"train_loss": -37.10697937011719, "global_step": 222734, "epoch": 1840} {"train_loss": -37.0189208984375, "global_step": 222735, "epoch": 1840} {"train_loss": -37.22969436645508, "global_step": 222736, "epoch": 1840} {"train_loss": -37.14604568481445, "global_step": 222737, "epoch": 1840} {"train_loss": -37.29179000854492, "global_step": 222738, "epoch": 1840} {"train_loss": -36.854888916015625, "global_step": 222739, "epoch": 1840} {"train_loss": -35.6639289855957, "global_step": 222740, "epoch": 1840} {"train_loss": -36.92734909057617, "global_step": 222741, "epoch": 1840} {"train_loss": -37.476585388183594, "global_step": 222742, "epoch": 1840} {"train_loss": -36.38383102416992, "global_step": 222743, "epoch": 1840} {"train_loss": -35.49570846557617, "global_step": 222744, "epoch": 1840} {"train_loss": -37.95123291015625, "global_step": 222745, "epoch": 1840} {"train_loss": -37.05744171142578, "global_step": 222746, "epoch": 1840} {"train_loss": -37.06269454956055, "global_step": 222747, "epoch": 1840} {"train_loss": -38.286441802978516, "global_step": 222748, "epoch": 1840} {"train_loss": -37.20850372314453, "global_step": 222749, "epoch": 1840} {"train_loss": -38.34823226928711, "global_step": 222750, "epoch": 1840} {"train_loss": -37.81315994262695, "global_step": 222751, "epoch": 1840} {"train_loss": -38.19294357299805, "global_step": 222752, "epoch": 1840} {"train_loss": -38.06238555908203, "global_step": 222753, "epoch": 1840} {"train_loss": -38.503570556640625, "global_step": 222754, "epoch": 1840} {"train_loss": -38.28152084350586, "global_step": 222755, "epoch": 1840} {"train_loss": -38.07914352416992, "global_step": 222756, "epoch": 1840} {"train_loss": -38.90517807006836, "global_step": 222757, "epoch": 1840} {"train_loss": -38.7663688659668, "global_step": 222758, "epoch": 1840} {"train_loss": -39.08738327026367, "global_step": 222759, "epoch": 1840} {"train_loss": -38.65467930628248, "global_step": 222760, "epoch": 1840, "val_loss": 2556047.25} {"train_loss": -39.003135681152344, "global_step": 222761, "epoch": 1841} {"train_loss": -39.122222900390625, "global_step": 222762, "epoch": 1841} {"train_loss": -39.119590759277344, "global_step": 222763, "epoch": 1841} {"train_loss": -39.2159538269043, "global_step": 222764, "epoch": 1841} {"train_loss": -38.878238677978516, "global_step": 222765, "epoch": 1841} {"train_loss": -39.066768646240234, "global_step": 222766, "epoch": 1841} {"train_loss": -39.70023727416992, "global_step": 222767, "epoch": 1841} {"train_loss": -39.33931350708008, "global_step": 222768, "epoch": 1841} {"train_loss": -39.36884689331055, "global_step": 222769, "epoch": 1841} {"train_loss": -39.59292221069336, "global_step": 222770, "epoch": 1841} {"train_loss": -39.52787399291992, "global_step": 222771, "epoch": 1841} {"train_loss": -40.2276611328125, "global_step": 222772, "epoch": 1841} {"train_loss": -39.6319694519043, "global_step": 222773, "epoch": 1841} {"train_loss": -39.119537353515625, "global_step": 222774, "epoch": 1841} {"train_loss": -38.3337287902832, "global_step": 222775, "epoch": 1841} {"train_loss": -39.21281051635742, "global_step": 222776, "epoch": 1841} {"train_loss": -39.30543518066406, "global_step": 222777, "epoch": 1841} {"train_loss": -39.17856979370117, "global_step": 222778, "epoch": 1841} {"train_loss": -39.3059196472168, "global_step": 222779, "epoch": 1841} {"train_loss": -39.67435073852539, "global_step": 222780, "epoch": 1841} {"train_loss": -39.18119430541992, "global_step": 222781, "epoch": 1841} {"train_loss": -39.043739318847656, "global_step": 222782, "epoch": 1841} {"train_loss": -40.11162185668945, "global_step": 222783, "epoch": 1841} {"train_loss": -39.74235916137695, "global_step": 222784, "epoch": 1841} {"train_loss": -40.382144927978516, "global_step": 222785, "epoch": 1841} {"train_loss": -40.102359771728516, "global_step": 222786, "epoch": 1841} {"train_loss": -40.073211669921875, "global_step": 222787, "epoch": 1841} {"train_loss": -40.58041000366211, "global_step": 222788, "epoch": 1841} {"train_loss": -39.81756591796875, "global_step": 222789, "epoch": 1841} {"train_loss": -39.911136627197266, "global_step": 222790, "epoch": 1841} {"train_loss": -39.716529846191406, "global_step": 222791, "epoch": 1841} {"train_loss": -40.06974411010742, "global_step": 222792, "epoch": 1841} {"train_loss": -40.38961410522461, "global_step": 222793, "epoch": 1841} {"train_loss": -39.88145065307617, "global_step": 222794, "epoch": 1841} {"train_loss": -39.94312286376953, "global_step": 222795, "epoch": 1841} {"train_loss": -39.87733840942383, "global_step": 222796, "epoch": 1841} {"train_loss": -40.682613372802734, "global_step": 222797, "epoch": 1841} {"train_loss": -40.9011344909668, "global_step": 222798, "epoch": 1841} {"train_loss": -40.88187789916992, "global_step": 222799, "epoch": 1841} {"train_loss": -40.49428939819336, "global_step": 222800, "epoch": 1841} {"train_loss": -40.95096969604492, "global_step": 222801, "epoch": 1841} {"train_loss": -40.730430603027344, "global_step": 222802, "epoch": 1841} {"train_loss": -40.22422409057617, "global_step": 222803, "epoch": 1841} {"train_loss": -40.84391403198242, "global_step": 222804, "epoch": 1841} {"train_loss": -40.11650466918945, "global_step": 222805, "epoch": 1841} {"train_loss": -39.941036224365234, "global_step": 222806, "epoch": 1841} {"train_loss": -40.45219802856445, "global_step": 222807, "epoch": 1841} {"train_loss": -40.273189544677734, "global_step": 222808, "epoch": 1841} {"train_loss": -40.38786697387695, "global_step": 222809, "epoch": 1841} {"train_loss": -40.876747131347656, "global_step": 222810, "epoch": 1841} {"train_loss": -39.88044357299805, "global_step": 222811, "epoch": 1841} {"train_loss": -40.85129928588867, "global_step": 222812, "epoch": 1841} {"train_loss": -40.37604522705078, "global_step": 222813, "epoch": 1841} {"train_loss": -40.37470626831055, "global_step": 222814, "epoch": 1841} {"train_loss": -40.26548385620117, "global_step": 222815, "epoch": 1841} {"train_loss": -39.66643142700195, "global_step": 222816, "epoch": 1841} {"train_loss": -40.32744216918945, "global_step": 222817, "epoch": 1841} {"train_loss": -39.968475341796875, "global_step": 222818, "epoch": 1841} {"train_loss": -39.899139404296875, "global_step": 222819, "epoch": 1841} {"train_loss": -38.42596435546875, "global_step": 222820, "epoch": 1841} {"train_loss": -38.79221725463867, "global_step": 222821, "epoch": 1841} {"train_loss": -40.0509033203125, "global_step": 222822, "epoch": 1841} {"train_loss": -39.838287353515625, "global_step": 222823, "epoch": 1841} {"train_loss": -39.04090118408203, "global_step": 222824, "epoch": 1841} {"train_loss": -38.74628829956055, "global_step": 222825, "epoch": 1841} {"train_loss": -39.49618148803711, "global_step": 222826, "epoch": 1841} {"train_loss": -40.52822494506836, "global_step": 222827, "epoch": 1841} {"train_loss": -39.29047775268555, "global_step": 222828, "epoch": 1841} {"train_loss": -38.884037017822266, "global_step": 222829, "epoch": 1841} {"train_loss": -41.05413818359375, "global_step": 222830, "epoch": 1841} {"train_loss": -40.133140563964844, "global_step": 222831, "epoch": 1841} {"train_loss": -40.599117279052734, "global_step": 222832, "epoch": 1841} {"train_loss": -40.173316955566406, "global_step": 222833, "epoch": 1841} {"train_loss": -39.98285675048828, "global_step": 222834, "epoch": 1841} {"train_loss": -39.93093490600586, "global_step": 222835, "epoch": 1841} {"train_loss": -40.345184326171875, "global_step": 222836, "epoch": 1841} {"train_loss": -40.12180709838867, "global_step": 222837, "epoch": 1841} {"train_loss": -39.98337936401367, "global_step": 222838, "epoch": 1841} {"train_loss": -40.07659149169922, "global_step": 222839, "epoch": 1841} {"train_loss": -39.24596405029297, "global_step": 222840, "epoch": 1841} {"train_loss": -38.27854537963867, "global_step": 222841, "epoch": 1841} {"train_loss": -39.39081954956055, "global_step": 222842, "epoch": 1841} {"train_loss": -38.47444152832031, "global_step": 222843, "epoch": 1841} {"train_loss": -40.146705627441406, "global_step": 222844, "epoch": 1841} {"train_loss": -39.17861557006836, "global_step": 222845, "epoch": 1841} {"train_loss": -38.506103515625, "global_step": 222846, "epoch": 1841} {"train_loss": -39.29722213745117, "global_step": 222847, "epoch": 1841} {"train_loss": -39.25295639038086, "global_step": 222848, "epoch": 1841} {"train_loss": -40.39408874511719, "global_step": 222849, "epoch": 1841} {"train_loss": -40.53889846801758, "global_step": 222850, "epoch": 1841} {"train_loss": -40.563262939453125, "global_step": 222851, "epoch": 1841} {"train_loss": -40.94559097290039, "global_step": 222852, "epoch": 1841} {"train_loss": -40.335731506347656, "global_step": 222853, "epoch": 1841} {"train_loss": -41.05411911010742, "global_step": 222854, "epoch": 1841} {"train_loss": -40.826786041259766, "global_step": 222855, "epoch": 1841} {"train_loss": -40.726383209228516, "global_step": 222856, "epoch": 1841} {"train_loss": -40.88494873046875, "global_step": 222857, "epoch": 1841} {"train_loss": -40.86605453491211, "global_step": 222858, "epoch": 1841} {"train_loss": -39.81678009033203, "global_step": 222859, "epoch": 1841} {"train_loss": -40.37295150756836, "global_step": 222860, "epoch": 1841} {"train_loss": -40.928035736083984, "global_step": 222861, "epoch": 1841} {"train_loss": -41.365081787109375, "global_step": 222862, "epoch": 1841} {"train_loss": -40.864376068115234, "global_step": 222863, "epoch": 1841} {"train_loss": -41.24570846557617, "global_step": 222864, "epoch": 1841} {"train_loss": -40.8498420715332, "global_step": 222865, "epoch": 1841} {"train_loss": -41.65225601196289, "global_step": 222866, "epoch": 1841} {"train_loss": -41.14101791381836, "global_step": 222867, "epoch": 1841} {"train_loss": -41.08009719848633, "global_step": 222868, "epoch": 1841} {"train_loss": -41.10103225708008, "global_step": 222869, "epoch": 1841} {"train_loss": -41.11100387573242, "global_step": 222870, "epoch": 1841} {"train_loss": -41.05184555053711, "global_step": 222871, "epoch": 1841} {"train_loss": -40.08577346801758, "global_step": 222872, "epoch": 1841} {"train_loss": -40.78184127807617, "global_step": 222873, "epoch": 1841} {"train_loss": -40.63071823120117, "global_step": 222874, "epoch": 1841} {"train_loss": -41.048614501953125, "global_step": 222875, "epoch": 1841} {"train_loss": -41.511810302734375, "global_step": 222876, "epoch": 1841} {"train_loss": -41.312782287597656, "global_step": 222877, "epoch": 1841} {"train_loss": -41.020259857177734, "global_step": 222878, "epoch": 1841} {"train_loss": -40.380889892578125, "global_step": 222879, "epoch": 1841} {"train_loss": -40.664058685302734, "global_step": 222880, "epoch": 1841} {"train_loss": -40.08381602389753, "global_step": 222881, "epoch": 1841, "val_loss": 2546463.5} {"train_loss": -41.10501480102539, "global_step": 222882, "epoch": 1842} {"train_loss": -40.84870529174805, "global_step": 222883, "epoch": 1842} {"train_loss": -40.71712112426758, "global_step": 222884, "epoch": 1842} {"train_loss": -39.92876052856445, "global_step": 222885, "epoch": 1842} {"train_loss": -40.923011779785156, "global_step": 222886, "epoch": 1842} {"train_loss": -40.31329345703125, "global_step": 222887, "epoch": 1842} {"train_loss": -41.175201416015625, "global_step": 222888, "epoch": 1842} {"train_loss": -41.89265060424805, "global_step": 222889, "epoch": 1842} {"train_loss": -41.13833999633789, "global_step": 222890, "epoch": 1842} {"train_loss": -41.924072265625, "global_step": 222891, "epoch": 1842} {"train_loss": -40.703712463378906, "global_step": 222892, "epoch": 1842} {"train_loss": -40.69453811645508, "global_step": 222893, "epoch": 1842} {"train_loss": -41.19416427612305, "global_step": 222894, "epoch": 1842} {"train_loss": -41.78875732421875, "global_step": 222895, "epoch": 1842} {"train_loss": -40.485530853271484, "global_step": 222896, "epoch": 1842} {"train_loss": -40.05216598510742, "global_step": 222897, "epoch": 1842} {"train_loss": -38.73622131347656, "global_step": 222898, "epoch": 1842} {"train_loss": -40.446372985839844, "global_step": 222899, "epoch": 1842} {"train_loss": -39.25575256347656, "global_step": 222900, "epoch": 1842} {"train_loss": -37.85075759887695, "global_step": 222901, "epoch": 1842} {"train_loss": -38.880157470703125, "global_step": 222902, "epoch": 1842} {"train_loss": -39.62131881713867, "global_step": 222903, "epoch": 1842} {"train_loss": -39.66695785522461, "global_step": 222904, "epoch": 1842} {"train_loss": -39.814697265625, "global_step": 222905, "epoch": 1842} {"train_loss": -40.33528137207031, "global_step": 222906, "epoch": 1842} {"train_loss": -40.460811614990234, "global_step": 222907, "epoch": 1842} {"train_loss": -40.88035202026367, "global_step": 222908, "epoch": 1842} {"train_loss": -38.53927230834961, "global_step": 222909, "epoch": 1842} {"train_loss": -40.45547103881836, "global_step": 222910, "epoch": 1842} {"train_loss": -40.2025032043457, "global_step": 222911, "epoch": 1842} {"train_loss": -40.372344970703125, "global_step": 222912, "epoch": 1842} {"train_loss": -40.893314361572266, "global_step": 222913, "epoch": 1842} {"train_loss": -41.34816360473633, "global_step": 222914, "epoch": 1842} {"train_loss": -41.15825271606445, "global_step": 222915, "epoch": 1842} {"train_loss": -38.159969329833984, "global_step": 222916, "epoch": 1842} {"train_loss": -39.293914794921875, "global_step": 222917, "epoch": 1842} {"train_loss": -40.457244873046875, "global_step": 222918, "epoch": 1842} {"train_loss": -41.445858001708984, "global_step": 222919, "epoch": 1842} {"train_loss": -40.1771125793457, "global_step": 222920, "epoch": 1842} {"train_loss": -41.38494873046875, "global_step": 222921, "epoch": 1842} {"train_loss": -40.56239700317383, "global_step": 222922, "epoch": 1842} {"train_loss": -40.41950988769531, "global_step": 222923, "epoch": 1842} {"train_loss": -38.78448486328125, "global_step": 222924, "epoch": 1842} {"train_loss": -39.62716293334961, "global_step": 222925, "epoch": 1842} {"train_loss": -41.04819869995117, "global_step": 222926, "epoch": 1842} {"train_loss": -40.253273010253906, "global_step": 222927, "epoch": 1842} {"train_loss": -38.58443832397461, "global_step": 222928, "epoch": 1842} {"train_loss": -39.82666015625, "global_step": 222929, "epoch": 1842} {"train_loss": -41.003353118896484, "global_step": 222930, "epoch": 1842} {"train_loss": -40.79256057739258, "global_step": 222931, "epoch": 1842} {"train_loss": -40.43949890136719, "global_step": 222932, "epoch": 1842} {"train_loss": -40.43195724487305, "global_step": 222933, "epoch": 1842} {"train_loss": -39.07084655761719, "global_step": 222934, "epoch": 1842} {"train_loss": -39.456573486328125, "global_step": 222935, "epoch": 1842} {"train_loss": -40.64667892456055, "global_step": 222936, "epoch": 1842} {"train_loss": -40.35540771484375, "global_step": 222937, "epoch": 1842} {"train_loss": -41.280033111572266, "global_step": 222938, "epoch": 1842} {"train_loss": -39.999141693115234, "global_step": 222939, "epoch": 1842} {"train_loss": -38.17271423339844, "global_step": 222940, "epoch": 1842} {"train_loss": -39.244422912597656, "global_step": 222941, "epoch": 1842} {"train_loss": -39.056819915771484, "global_step": 222942, "epoch": 1842} {"train_loss": -39.80570602416992, "global_step": 222943, "epoch": 1842} {"train_loss": -40.064849853515625, "global_step": 222944, "epoch": 1842} {"train_loss": -39.535465240478516, "global_step": 222945, "epoch": 1842} {"train_loss": -39.036773681640625, "global_step": 222946, "epoch": 1842} {"train_loss": -41.13222885131836, "global_step": 222947, "epoch": 1842} {"train_loss": -40.1389045715332, "global_step": 222948, "epoch": 1842} {"train_loss": -39.44635009765625, "global_step": 222949, "epoch": 1842} {"train_loss": -40.5428581237793, "global_step": 222950, "epoch": 1842} {"train_loss": -40.9096565246582, "global_step": 222951, "epoch": 1842} {"train_loss": -41.41721725463867, "global_step": 222952, "epoch": 1842} {"train_loss": -39.73848342895508, "global_step": 222953, "epoch": 1842} {"train_loss": -40.70939636230469, "global_step": 222954, "epoch": 1842} {"train_loss": -38.81201171875, "global_step": 222955, "epoch": 1842} {"train_loss": -40.05656814575195, "global_step": 222956, "epoch": 1842} {"train_loss": -39.458152770996094, "global_step": 222957, "epoch": 1842} {"train_loss": -40.986080169677734, "global_step": 222958, "epoch": 1842} {"train_loss": -39.451969146728516, "global_step": 222959, "epoch": 1842} {"train_loss": -40.450843811035156, "global_step": 222960, "epoch": 1842} {"train_loss": -40.217445373535156, "global_step": 222961, "epoch": 1842} {"train_loss": -40.477046966552734, "global_step": 222962, "epoch": 1842} {"train_loss": -40.44420623779297, "global_step": 222963, "epoch": 1842} {"train_loss": -40.56785202026367, "global_step": 222964, "epoch": 1842} {"train_loss": -39.91449737548828, "global_step": 222965, "epoch": 1842} {"train_loss": -40.375396728515625, "global_step": 222966, "epoch": 1842} {"train_loss": -40.24796676635742, "global_step": 222967, "epoch": 1842} {"train_loss": -41.338165283203125, "global_step": 222968, "epoch": 1842} {"train_loss": -40.38156509399414, "global_step": 222969, "epoch": 1842} {"train_loss": -40.531436920166016, "global_step": 222970, "epoch": 1842} {"train_loss": -39.713008880615234, "global_step": 222971, "epoch": 1842} {"train_loss": -38.83290100097656, "global_step": 222972, "epoch": 1842} {"train_loss": -40.434059143066406, "global_step": 222973, "epoch": 1842} {"train_loss": -39.75352096557617, "global_step": 222974, "epoch": 1842} {"train_loss": -40.743587493896484, "global_step": 222975, "epoch": 1842} {"train_loss": -40.21527099609375, "global_step": 222976, "epoch": 1842} {"train_loss": -41.38877487182617, "global_step": 222977, "epoch": 1842} {"train_loss": -40.85683059692383, "global_step": 222978, "epoch": 1842} {"train_loss": -41.71376419067383, "global_step": 222979, "epoch": 1842} {"train_loss": -40.6671028137207, "global_step": 222980, "epoch": 1842} {"train_loss": -40.25809860229492, "global_step": 222981, "epoch": 1842} {"train_loss": -40.698577880859375, "global_step": 222982, "epoch": 1842} {"train_loss": -38.897621154785156, "global_step": 222983, "epoch": 1842} {"train_loss": -40.82268524169922, "global_step": 222984, "epoch": 1842} {"train_loss": -40.52573776245117, "global_step": 222985, "epoch": 1842} {"train_loss": -39.355281829833984, "global_step": 222986, "epoch": 1842} {"train_loss": -40.123573303222656, "global_step": 222987, "epoch": 1842} {"train_loss": -37.102230072021484, "global_step": 222988, "epoch": 1842} {"train_loss": -39.88298416137695, "global_step": 222989, "epoch": 1842} {"train_loss": -41.04475021362305, "global_step": 222990, "epoch": 1842} {"train_loss": -39.88803482055664, "global_step": 222991, "epoch": 1842} {"train_loss": -40.16069412231445, "global_step": 222992, "epoch": 1842} {"train_loss": -41.055908203125, "global_step": 222993, "epoch": 1842} {"train_loss": -39.29243850708008, "global_step": 222994, "epoch": 1842} {"train_loss": -37.50432205200195, "global_step": 222995, "epoch": 1842} {"train_loss": -34.99028396606445, "global_step": 222996, "epoch": 1842} {"train_loss": -34.28840255737305, "global_step": 222997, "epoch": 1842} {"train_loss": -39.61734390258789, "global_step": 222998, "epoch": 1842} {"train_loss": -36.2904167175293, "global_step": 222999, "epoch": 1842} {"train_loss": -31.213104248046875, "global_step": 223000, "epoch": 1842} {"train_loss": -38.9476318359375, "global_step": 223001, "epoch": 1842} {"train_loss": -39.93509809635887, "global_step": 223002, "epoch": 1842, "val_loss": 3165907.25} {"train_loss": -35.463531494140625, "global_step": 223003, "epoch": 1843} {"train_loss": -39.683040618896484, "global_step": 223004, "epoch": 1843} {"train_loss": -33.75164794921875, "global_step": 223005, "epoch": 1843} {"train_loss": -37.880184173583984, "global_step": 223006, "epoch": 1843} {"train_loss": -38.9152946472168, "global_step": 223007, "epoch": 1843} {"train_loss": -38.547237396240234, "global_step": 223008, "epoch": 1843} {"train_loss": -38.3116455078125, "global_step": 223009, "epoch": 1843} {"train_loss": -38.695343017578125, "global_step": 223010, "epoch": 1843} {"train_loss": -37.740684509277344, "global_step": 223011, "epoch": 1843} {"train_loss": -40.1655387878418, "global_step": 223012, "epoch": 1843} {"train_loss": -39.159446716308594, "global_step": 223013, "epoch": 1843} {"train_loss": -39.91127014160156, "global_step": 223014, "epoch": 1843} {"train_loss": -37.98867416381836, "global_step": 223015, "epoch": 1843} {"train_loss": -38.6713981628418, "global_step": 223016, "epoch": 1843} {"train_loss": -40.04594039916992, "global_step": 223017, "epoch": 1843} {"train_loss": -37.7277946472168, "global_step": 223018, "epoch": 1843} {"train_loss": -39.207550048828125, "global_step": 223019, "epoch": 1843} {"train_loss": -39.050167083740234, "global_step": 223020, "epoch": 1843} {"train_loss": -40.151878356933594, "global_step": 223021, "epoch": 1843} {"train_loss": -37.812801361083984, "global_step": 223022, "epoch": 1843} {"train_loss": -37.007606506347656, "global_step": 223023, "epoch": 1843} {"train_loss": -36.08778762817383, "global_step": 223024, "epoch": 1843} {"train_loss": -39.39571762084961, "global_step": 223025, "epoch": 1843} {"train_loss": -37.42930603027344, "global_step": 223026, "epoch": 1843} {"train_loss": -39.32852554321289, "global_step": 223027, "epoch": 1843} {"train_loss": -38.55678939819336, "global_step": 223028, "epoch": 1843} {"train_loss": -39.48003005981445, "global_step": 223029, "epoch": 1843} {"train_loss": -38.2954216003418, "global_step": 223030, "epoch": 1843} {"train_loss": -39.202110290527344, "global_step": 223031, "epoch": 1843} {"train_loss": -37.43667221069336, "global_step": 223032, "epoch": 1843} {"train_loss": -38.78990173339844, "global_step": 223033, "epoch": 1843} {"train_loss": -38.515682220458984, "global_step": 223034, "epoch": 1843} {"train_loss": -39.66041946411133, "global_step": 223035, "epoch": 1843} {"train_loss": -40.26763916015625, "global_step": 223036, "epoch": 1843} {"train_loss": -40.229454040527344, "global_step": 223037, "epoch": 1843} {"train_loss": -39.973018646240234, "global_step": 223038, "epoch": 1843} {"train_loss": -37.97990036010742, "global_step": 223039, "epoch": 1843} {"train_loss": -39.51356887817383, "global_step": 223040, "epoch": 1843} {"train_loss": -39.84967803955078, "global_step": 223041, "epoch": 1843} {"train_loss": -39.7113151550293, "global_step": 223042, "epoch": 1843} {"train_loss": -40.23301696777344, "global_step": 223043, "epoch": 1843} {"train_loss": -38.331764221191406, "global_step": 223044, "epoch": 1843} {"train_loss": -38.546302795410156, "global_step": 223045, "epoch": 1843} {"train_loss": -39.877742767333984, "global_step": 223046, "epoch": 1843} {"train_loss": -39.64688491821289, "global_step": 223047, "epoch": 1843} {"train_loss": -39.908016204833984, "global_step": 223048, "epoch": 1843} {"train_loss": -39.23733139038086, "global_step": 223049, "epoch": 1843} {"train_loss": -38.586055755615234, "global_step": 223050, "epoch": 1843} {"train_loss": -39.32168960571289, "global_step": 223051, "epoch": 1843} {"train_loss": -40.46472930908203, "global_step": 223052, "epoch": 1843} {"train_loss": -38.66541290283203, "global_step": 223053, "epoch": 1843} {"train_loss": -39.633087158203125, "global_step": 223054, "epoch": 1843} {"train_loss": -40.62443161010742, "global_step": 223055, "epoch": 1843} {"train_loss": -39.474395751953125, "global_step": 223056, "epoch": 1843} {"train_loss": -39.621337890625, "global_step": 223057, "epoch": 1843} {"train_loss": -40.517337799072266, "global_step": 223058, "epoch": 1843} {"train_loss": -40.30010986328125, "global_step": 223059, "epoch": 1843} {"train_loss": -39.816314697265625, "global_step": 223060, "epoch": 1843} {"train_loss": -40.62990188598633, "global_step": 223061, "epoch": 1843} {"train_loss": -39.977455139160156, "global_step": 223062, "epoch": 1843} {"train_loss": -41.06661605834961, "global_step": 223063, "epoch": 1843} {"train_loss": -41.23298263549805, "global_step": 223064, "epoch": 1843} {"train_loss": -40.173561096191406, "global_step": 223065, "epoch": 1843} {"train_loss": -38.255531311035156, "global_step": 223066, "epoch": 1843} {"train_loss": -40.3729133605957, "global_step": 223067, "epoch": 1843} {"train_loss": -40.589351654052734, "global_step": 223068, "epoch": 1843} {"train_loss": -38.409271240234375, "global_step": 223069, "epoch": 1843} {"train_loss": -41.02162551879883, "global_step": 223070, "epoch": 1843} {"train_loss": -40.8970832824707, "global_step": 223071, "epoch": 1843} {"train_loss": -40.71331787109375, "global_step": 223072, "epoch": 1843} {"train_loss": -41.32969665527344, "global_step": 223073, "epoch": 1843} {"train_loss": -40.72591781616211, "global_step": 223074, "epoch": 1843} {"train_loss": -40.124324798583984, "global_step": 223075, "epoch": 1843} {"train_loss": -40.7313117980957, "global_step": 223076, "epoch": 1843} {"train_loss": -39.8066291809082, "global_step": 223077, "epoch": 1843} {"train_loss": -40.64004135131836, "global_step": 223078, "epoch": 1843} {"train_loss": -39.22450637817383, "global_step": 223079, "epoch": 1843} {"train_loss": -41.22096633911133, "global_step": 223080, "epoch": 1843} {"train_loss": -41.08837890625, "global_step": 223081, "epoch": 1843} {"train_loss": -40.97139358520508, "global_step": 223082, "epoch": 1843} {"train_loss": -40.78774642944336, "global_step": 223083, "epoch": 1843} {"train_loss": -41.44458770751953, "global_step": 223084, "epoch": 1843} {"train_loss": -41.12282180786133, "global_step": 223085, "epoch": 1843} {"train_loss": -41.15920639038086, "global_step": 223086, "epoch": 1843} {"train_loss": -41.117774963378906, "global_step": 223087, "epoch": 1843} {"train_loss": -38.84708786010742, "global_step": 223088, "epoch": 1843} {"train_loss": -41.13571548461914, "global_step": 223089, "epoch": 1843} {"train_loss": -41.21687316894531, "global_step": 223090, "epoch": 1843} {"train_loss": -40.27983474731445, "global_step": 223091, "epoch": 1843} {"train_loss": -40.69356155395508, "global_step": 223092, "epoch": 1843} {"train_loss": -40.354488372802734, "global_step": 223093, "epoch": 1843} {"train_loss": -41.565826416015625, "global_step": 223094, "epoch": 1843} {"train_loss": -40.9378776550293, "global_step": 223095, "epoch": 1843} {"train_loss": -41.05745315551758, "global_step": 223096, "epoch": 1843} {"train_loss": -40.34464645385742, "global_step": 223097, "epoch": 1843} {"train_loss": -41.53968048095703, "global_step": 223098, "epoch": 1843} {"train_loss": -41.184242248535156, "global_step": 223099, "epoch": 1843} {"train_loss": -41.387245178222656, "global_step": 223100, "epoch": 1843} {"train_loss": -38.872005462646484, "global_step": 223101, "epoch": 1843} {"train_loss": -38.54920196533203, "global_step": 223102, "epoch": 1843} {"train_loss": -40.8758430480957, "global_step": 223103, "epoch": 1843} {"train_loss": -41.702659606933594, "global_step": 223104, "epoch": 1843} {"train_loss": -40.93660354614258, "global_step": 223105, "epoch": 1843} {"train_loss": -39.55721664428711, "global_step": 223106, "epoch": 1843} {"train_loss": -39.736122131347656, "global_step": 223107, "epoch": 1843} {"train_loss": -41.513431549072266, "global_step": 223108, "epoch": 1843} {"train_loss": -40.74187469482422, "global_step": 223109, "epoch": 1843} {"train_loss": -39.212890625, "global_step": 223110, "epoch": 1843} {"train_loss": -36.209964752197266, "global_step": 223111, "epoch": 1843} {"train_loss": -40.653926849365234, "global_step": 223112, "epoch": 1843} {"train_loss": -40.305152893066406, "global_step": 223113, "epoch": 1843} {"train_loss": -41.06332015991211, "global_step": 223114, "epoch": 1843} {"train_loss": -37.13871765136719, "global_step": 223115, "epoch": 1843} {"train_loss": -38.67800521850586, "global_step": 223116, "epoch": 1843} {"train_loss": -41.19092559814453, "global_step": 223117, "epoch": 1843} {"train_loss": -39.12106704711914, "global_step": 223118, "epoch": 1843} {"train_loss": -36.2841682434082, "global_step": 223119, "epoch": 1843} {"train_loss": -40.07513427734375, "global_step": 223120, "epoch": 1843} {"train_loss": -39.14686965942383, "global_step": 223121, "epoch": 1843} {"train_loss": -36.255489349365234, "global_step": 223122, "epoch": 1843} {"train_loss": -39.5557012006271, "global_step": 223123, "epoch": 1843, "val_loss": 2672620.25} {"train_loss": -38.04547119140625, "global_step": 223124, "epoch": 1844} {"train_loss": -36.136993408203125, "global_step": 223125, "epoch": 1844} {"train_loss": -38.23690414428711, "global_step": 223126, "epoch": 1844} {"train_loss": -39.07158279418945, "global_step": 223127, "epoch": 1844} {"train_loss": -39.08662796020508, "global_step": 223128, "epoch": 1844} {"train_loss": -35.32197189331055, "global_step": 223129, "epoch": 1844} {"train_loss": -40.33968734741211, "global_step": 223130, "epoch": 1844} {"train_loss": -35.95608139038086, "global_step": 223131, "epoch": 1844} {"train_loss": -38.72245407104492, "global_step": 223132, "epoch": 1844} {"train_loss": -40.302242279052734, "global_step": 223133, "epoch": 1844} {"train_loss": -37.90658187866211, "global_step": 223134, "epoch": 1844} {"train_loss": -40.817604064941406, "global_step": 223135, "epoch": 1844} {"train_loss": -40.29437255859375, "global_step": 223136, "epoch": 1844} {"train_loss": -40.16485595703125, "global_step": 223137, "epoch": 1844} {"train_loss": -40.869415283203125, "global_step": 223138, "epoch": 1844} {"train_loss": -40.23168182373047, "global_step": 223139, "epoch": 1844} {"train_loss": -37.087764739990234, "global_step": 223140, "epoch": 1844} {"train_loss": -39.56675338745117, "global_step": 223141, "epoch": 1844} {"train_loss": -39.264381408691406, "global_step": 223142, "epoch": 1844} {"train_loss": -39.709495544433594, "global_step": 223143, "epoch": 1844} {"train_loss": -40.60036087036133, "global_step": 223144, "epoch": 1844} {"train_loss": -38.76691436767578, "global_step": 223145, "epoch": 1844} {"train_loss": -40.803428649902344, "global_step": 223146, "epoch": 1844} {"train_loss": -40.02164840698242, "global_step": 223147, "epoch": 1844} {"train_loss": -40.49333572387695, "global_step": 223148, "epoch": 1844} {"train_loss": -41.465755462646484, "global_step": 223149, "epoch": 1844} {"train_loss": -39.344688415527344, "global_step": 223150, "epoch": 1844} {"train_loss": -40.517425537109375, "global_step": 223151, "epoch": 1844} {"train_loss": -41.41901397705078, "global_step": 223152, "epoch": 1844} {"train_loss": -40.70259094238281, "global_step": 223153, "epoch": 1844} {"train_loss": -40.692020416259766, "global_step": 223154, "epoch": 1844} {"train_loss": -40.73479080200195, "global_step": 223155, "epoch": 1844} {"train_loss": -41.12439727783203, "global_step": 223156, "epoch": 1844} {"train_loss": -41.131202697753906, "global_step": 223157, "epoch": 1844} {"train_loss": -39.52740478515625, "global_step": 223158, "epoch": 1844} {"train_loss": -40.34613800048828, "global_step": 223159, "epoch": 1844} {"train_loss": -41.60174560546875, "global_step": 223160, "epoch": 1844} {"train_loss": -41.064666748046875, "global_step": 223161, "epoch": 1844} {"train_loss": -41.440032958984375, "global_step": 223162, "epoch": 1844} {"train_loss": -41.278438568115234, "global_step": 223163, "epoch": 1844} {"train_loss": -40.7381706237793, "global_step": 223164, "epoch": 1844} {"train_loss": -40.14902877807617, "global_step": 223165, "epoch": 1844} {"train_loss": -41.10371780395508, "global_step": 223166, "epoch": 1844} {"train_loss": -41.675106048583984, "global_step": 223167, "epoch": 1844} {"train_loss": -40.931884765625, "global_step": 223168, "epoch": 1844} {"train_loss": -41.07191467285156, "global_step": 223169, "epoch": 1844} {"train_loss": -41.35136032104492, "global_step": 223170, "epoch": 1844} {"train_loss": -41.115089416503906, "global_step": 223171, "epoch": 1844} {"train_loss": -41.45835494995117, "global_step": 223172, "epoch": 1844} {"train_loss": -41.40068435668945, "global_step": 223173, "epoch": 1844} {"train_loss": -41.61110305786133, "global_step": 223174, "epoch": 1844} {"train_loss": -41.6822395324707, "global_step": 223175, "epoch": 1844} {"train_loss": -41.249298095703125, "global_step": 223176, "epoch": 1844} {"train_loss": -38.98780059814453, "global_step": 223177, "epoch": 1844} {"train_loss": -41.372467041015625, "global_step": 223178, "epoch": 1844} {"train_loss": -41.22208786010742, "global_step": 223179, "epoch": 1844} {"train_loss": -41.06990432739258, "global_step": 223180, "epoch": 1844} {"train_loss": -41.008140563964844, "global_step": 223181, "epoch": 1844} {"train_loss": -37.75765609741211, "global_step": 223182, "epoch": 1844} {"train_loss": -40.329341888427734, "global_step": 223183, "epoch": 1844} {"train_loss": -42.0699462890625, "global_step": 223184, "epoch": 1844} {"train_loss": -39.256019592285156, "global_step": 223185, "epoch": 1844} {"train_loss": -40.951332092285156, "global_step": 223186, "epoch": 1844} {"train_loss": -41.756500244140625, "global_step": 223187, "epoch": 1844} {"train_loss": -39.95010757446289, "global_step": 223188, "epoch": 1844} {"train_loss": -41.42018508911133, "global_step": 223189, "epoch": 1844} {"train_loss": -40.728614807128906, "global_step": 223190, "epoch": 1844} {"train_loss": -41.16619110107422, "global_step": 223191, "epoch": 1844} {"train_loss": -40.27307891845703, "global_step": 223192, "epoch": 1844} {"train_loss": -41.7627067565918, "global_step": 223193, "epoch": 1844} {"train_loss": -41.14191436767578, "global_step": 223194, "epoch": 1844} {"train_loss": -41.41267013549805, "global_step": 223195, "epoch": 1844} {"train_loss": -42.32841110229492, "global_step": 223196, "epoch": 1844} {"train_loss": -40.70275115966797, "global_step": 223197, "epoch": 1844} {"train_loss": -41.8082389831543, "global_step": 223198, "epoch": 1844} {"train_loss": -41.397212982177734, "global_step": 223199, "epoch": 1844} {"train_loss": -41.38948440551758, "global_step": 223200, "epoch": 1844} {"train_loss": -40.650550842285156, "global_step": 223201, "epoch": 1844} {"train_loss": -42.04688262939453, "global_step": 223202, "epoch": 1844} {"train_loss": -41.948665618896484, "global_step": 223203, "epoch": 1844} {"train_loss": -40.465396881103516, "global_step": 223204, "epoch": 1844} {"train_loss": -40.908660888671875, "global_step": 223205, "epoch": 1844} {"train_loss": -41.8680419921875, "global_step": 223206, "epoch": 1844} {"train_loss": -41.681373596191406, "global_step": 223207, "epoch": 1844} {"train_loss": -41.09161376953125, "global_step": 223208, "epoch": 1844} {"train_loss": -41.13663864135742, "global_step": 223209, "epoch": 1844} {"train_loss": -41.84471893310547, "global_step": 223210, "epoch": 1844} {"train_loss": -41.53487014770508, "global_step": 223211, "epoch": 1844} {"train_loss": -42.055999755859375, "global_step": 223212, "epoch": 1844} {"train_loss": -41.79316711425781, "global_step": 223213, "epoch": 1844} {"train_loss": -42.133113861083984, "global_step": 223214, "epoch": 1844} {"train_loss": -42.1917610168457, "global_step": 223215, "epoch": 1844} {"train_loss": -41.98846435546875, "global_step": 223216, "epoch": 1844} {"train_loss": -42.080726623535156, "global_step": 223217, "epoch": 1844} {"train_loss": -42.21123504638672, "global_step": 223218, "epoch": 1844} {"train_loss": -41.21210479736328, "global_step": 223219, "epoch": 1844} {"train_loss": -41.54352569580078, "global_step": 223220, "epoch": 1844} {"train_loss": -39.18510055541992, "global_step": 223221, "epoch": 1844} {"train_loss": -41.7635498046875, "global_step": 223222, "epoch": 1844} {"train_loss": -41.74011993408203, "global_step": 223223, "epoch": 1844} {"train_loss": -40.764892578125, "global_step": 223224, "epoch": 1844} {"train_loss": -39.653141021728516, "global_step": 223225, "epoch": 1844} {"train_loss": -38.066524505615234, "global_step": 223226, "epoch": 1844} {"train_loss": -37.21005630493164, "global_step": 223227, "epoch": 1844} {"train_loss": -39.29679870605469, "global_step": 223228, "epoch": 1844} {"train_loss": -36.687965393066406, "global_step": 223229, "epoch": 1844} {"train_loss": -34.676002502441406, "global_step": 223230, "epoch": 1844} {"train_loss": -36.13896560668945, "global_step": 223231, "epoch": 1844} {"train_loss": -38.60335922241211, "global_step": 223232, "epoch": 1844} {"train_loss": -41.391963958740234, "global_step": 223233, "epoch": 1844} {"train_loss": -35.978050231933594, "global_step": 223234, "epoch": 1844} {"train_loss": -39.21697235107422, "global_step": 223235, "epoch": 1844} {"train_loss": -39.32375717163086, "global_step": 223236, "epoch": 1844} {"train_loss": -40.19601058959961, "global_step": 223237, "epoch": 1844} {"train_loss": -40.284523010253906, "global_step": 223238, "epoch": 1844} {"train_loss": -41.06781768798828, "global_step": 223239, "epoch": 1844} {"train_loss": -40.80811309814453, "global_step": 223240, "epoch": 1844} {"train_loss": -38.986175537109375, "global_step": 223241, "epoch": 1844} {"train_loss": -40.733219146728516, "global_step": 223242, "epoch": 1844} {"train_loss": -40.08699035644531, "global_step": 223243, "epoch": 1844} {"train_loss": -40.33938554495819, "global_step": 223244, "epoch": 1844, "val_loss": 2533982.75} {"train_loss": -41.47874069213867, "global_step": 223245, "epoch": 1845} {"train_loss": -40.355899810791016, "global_step": 223246, "epoch": 1845} {"train_loss": -40.804988861083984, "global_step": 223247, "epoch": 1845} {"train_loss": -41.0923957824707, "global_step": 223248, "epoch": 1845} {"train_loss": -40.73595428466797, "global_step": 223249, "epoch": 1845} {"train_loss": -40.49241256713867, "global_step": 223250, "epoch": 1845} {"train_loss": -40.18378829956055, "global_step": 223251, "epoch": 1845} {"train_loss": -39.96551513671875, "global_step": 223252, "epoch": 1845} {"train_loss": -40.5488395690918, "global_step": 223253, "epoch": 1845} {"train_loss": -40.63640594482422, "global_step": 223254, "epoch": 1845} {"train_loss": -40.79690170288086, "global_step": 223255, "epoch": 1845} {"train_loss": -41.552608489990234, "global_step": 223256, "epoch": 1845} {"train_loss": -41.71857833862305, "global_step": 223257, "epoch": 1845} {"train_loss": -41.301265716552734, "global_step": 223258, "epoch": 1845} {"train_loss": -41.269737243652344, "global_step": 223259, "epoch": 1845} {"train_loss": -40.92049026489258, "global_step": 223260, "epoch": 1845} {"train_loss": -41.82229232788086, "global_step": 223261, "epoch": 1845} {"train_loss": -40.51133346557617, "global_step": 223262, "epoch": 1845} {"train_loss": -41.85251998901367, "global_step": 223263, "epoch": 1845} {"train_loss": -41.346771240234375, "global_step": 223264, "epoch": 1845} {"train_loss": -41.50208282470703, "global_step": 223265, "epoch": 1845} {"train_loss": -41.213680267333984, "global_step": 223266, "epoch": 1845} {"train_loss": -40.623809814453125, "global_step": 223267, "epoch": 1845} {"train_loss": -41.37358474731445, "global_step": 223268, "epoch": 1845} {"train_loss": -39.97321701049805, "global_step": 223269, "epoch": 1845} {"train_loss": -34.69978713989258, "global_step": 223270, "epoch": 1845} {"train_loss": -40.79547119140625, "global_step": 223271, "epoch": 1845} {"train_loss": -40.918487548828125, "global_step": 223272, "epoch": 1845} {"train_loss": -40.27720642089844, "global_step": 223273, "epoch": 1845} {"train_loss": -41.3741569519043, "global_step": 223274, "epoch": 1845} {"train_loss": -38.91995620727539, "global_step": 223275, "epoch": 1845} {"train_loss": -40.41481399536133, "global_step": 223276, "epoch": 1845} {"train_loss": -39.872283935546875, "global_step": 223277, "epoch": 1845} {"train_loss": -41.49796676635742, "global_step": 223278, "epoch": 1845} {"train_loss": -41.207183837890625, "global_step": 223279, "epoch": 1845} {"train_loss": -39.45022201538086, "global_step": 223280, "epoch": 1845} {"train_loss": -39.60192108154297, "global_step": 223281, "epoch": 1845} {"train_loss": -38.36975860595703, "global_step": 223282, "epoch": 1845} {"train_loss": -40.46223831176758, "global_step": 223283, "epoch": 1845} {"train_loss": -40.90253829956055, "global_step": 223284, "epoch": 1845} {"train_loss": -37.37480163574219, "global_step": 223285, "epoch": 1845} {"train_loss": -41.035614013671875, "global_step": 223286, "epoch": 1845} {"train_loss": -41.45596694946289, "global_step": 223287, "epoch": 1845} {"train_loss": -41.013885498046875, "global_step": 223288, "epoch": 1845} {"train_loss": -40.759559631347656, "global_step": 223289, "epoch": 1845} {"train_loss": -40.5720100402832, "global_step": 223290, "epoch": 1845} {"train_loss": -41.50431442260742, "global_step": 223291, "epoch": 1845} {"train_loss": -39.38876724243164, "global_step": 223292, "epoch": 1845} {"train_loss": -40.825111389160156, "global_step": 223293, "epoch": 1845} {"train_loss": -39.70880889892578, "global_step": 223294, "epoch": 1845} {"train_loss": -41.33094787597656, "global_step": 223295, "epoch": 1845} {"train_loss": -39.83644104003906, "global_step": 223296, "epoch": 1845} {"train_loss": -39.35343551635742, "global_step": 223297, "epoch": 1845} {"train_loss": -37.434566497802734, "global_step": 223298, "epoch": 1845} {"train_loss": -38.593013763427734, "global_step": 223299, "epoch": 1845} {"train_loss": -40.19719314575195, "global_step": 223300, "epoch": 1845} {"train_loss": -25.373870849609375, "global_step": 223301, "epoch": 1845} {"train_loss": -39.48670196533203, "global_step": 223302, "epoch": 1845} {"train_loss": -39.431209564208984, "global_step": 223303, "epoch": 1845} {"train_loss": -37.35761642456055, "global_step": 223304, "epoch": 1845} {"train_loss": -31.463403701782227, "global_step": 223305, "epoch": 1845} {"train_loss": -39.80390548706055, "global_step": 223306, "epoch": 1845} {"train_loss": -38.93632125854492, "global_step": 223307, "epoch": 1845} {"train_loss": -38.90357971191406, "global_step": 223308, "epoch": 1845} {"train_loss": -35.880035400390625, "global_step": 223309, "epoch": 1845} {"train_loss": -38.35425567626953, "global_step": 223310, "epoch": 1845} {"train_loss": -32.35421371459961, "global_step": 223311, "epoch": 1845} {"train_loss": -32.582733154296875, "global_step": 223312, "epoch": 1845} {"train_loss": -34.28827667236328, "global_step": 223313, "epoch": 1845} {"train_loss": -38.6637077331543, "global_step": 223314, "epoch": 1845} {"train_loss": -38.04578399658203, "global_step": 223315, "epoch": 1845} {"train_loss": -34.42204666137695, "global_step": 223316, "epoch": 1845} {"train_loss": -35.41657638549805, "global_step": 223317, "epoch": 1845} {"train_loss": -35.4044303894043, "global_step": 223318, "epoch": 1845} {"train_loss": -37.899227142333984, "global_step": 223319, "epoch": 1845} {"train_loss": -36.91810607910156, "global_step": 223320, "epoch": 1845} {"train_loss": -37.408203125, "global_step": 223321, "epoch": 1845} {"train_loss": -37.722816467285156, "global_step": 223322, "epoch": 1845} {"train_loss": -38.96528625488281, "global_step": 223323, "epoch": 1845} {"train_loss": -38.336673736572266, "global_step": 223324, "epoch": 1845} {"train_loss": -39.305999755859375, "global_step": 223325, "epoch": 1845} {"train_loss": -35.04597091674805, "global_step": 223326, "epoch": 1845} {"train_loss": -36.38483810424805, "global_step": 223327, "epoch": 1845} {"train_loss": -37.82012176513672, "global_step": 223328, "epoch": 1845} {"train_loss": -36.488399505615234, "global_step": 223329, "epoch": 1845} {"train_loss": -38.61427307128906, "global_step": 223330, "epoch": 1845} {"train_loss": -37.219051361083984, "global_step": 223331, "epoch": 1845} {"train_loss": -36.750091552734375, "global_step": 223332, "epoch": 1845} {"train_loss": -39.75533676147461, "global_step": 223333, "epoch": 1845} {"train_loss": -38.678585052490234, "global_step": 223334, "epoch": 1845} {"train_loss": -38.73299789428711, "global_step": 223335, "epoch": 1845} {"train_loss": -38.88200378417969, "global_step": 223336, "epoch": 1845} {"train_loss": -36.47563171386719, "global_step": 223337, "epoch": 1845} {"train_loss": -39.057899475097656, "global_step": 223338, "epoch": 1845} {"train_loss": -39.84467315673828, "global_step": 223339, "epoch": 1845} {"train_loss": -37.317970275878906, "global_step": 223340, "epoch": 1845} {"train_loss": -40.09755325317383, "global_step": 223341, "epoch": 1845} {"train_loss": -38.63039016723633, "global_step": 223342, "epoch": 1845} {"train_loss": -36.580135345458984, "global_step": 223343, "epoch": 1845} {"train_loss": -40.31650924682617, "global_step": 223344, "epoch": 1845} {"train_loss": -37.07529830932617, "global_step": 223345, "epoch": 1845} {"train_loss": -36.177635192871094, "global_step": 223346, "epoch": 1845} {"train_loss": -39.48270797729492, "global_step": 223347, "epoch": 1845} {"train_loss": -37.13956069946289, "global_step": 223348, "epoch": 1845} {"train_loss": -38.54230880737305, "global_step": 223349, "epoch": 1845} {"train_loss": -39.85810089111328, "global_step": 223350, "epoch": 1845} {"train_loss": -38.701515197753906, "global_step": 223351, "epoch": 1845} {"train_loss": -39.107112884521484, "global_step": 223352, "epoch": 1845} {"train_loss": -39.364013671875, "global_step": 223353, "epoch": 1845} {"train_loss": -40.47507858276367, "global_step": 223354, "epoch": 1845} {"train_loss": -39.776851654052734, "global_step": 223355, "epoch": 1845} {"train_loss": -39.89496994018555, "global_step": 223356, "epoch": 1845} {"train_loss": -39.49135971069336, "global_step": 223357, "epoch": 1845} {"train_loss": -40.1908073425293, "global_step": 223358, "epoch": 1845} {"train_loss": -39.75983810424805, "global_step": 223359, "epoch": 1845} {"train_loss": -39.679443359375, "global_step": 223360, "epoch": 1845} {"train_loss": -40.703216552734375, "global_step": 223361, "epoch": 1845} {"train_loss": -39.507720947265625, "global_step": 223362, "epoch": 1845} {"train_loss": -39.317508697509766, "global_step": 223363, "epoch": 1845} {"train_loss": -40.63572692871094, "global_step": 223364, "epoch": 1845} {"train_loss": -39.04354185309292, "global_step": 223365, "epoch": 1845, "val_loss": 2795086.0} {"train_loss": -40.702396392822266, "global_step": 223366, "epoch": 1846} {"train_loss": -40.88486862182617, "global_step": 223367, "epoch": 1846} {"train_loss": -40.778812408447266, "global_step": 223368, "epoch": 1846} {"train_loss": -41.011627197265625, "global_step": 223369, "epoch": 1846} {"train_loss": -40.246456146240234, "global_step": 223370, "epoch": 1846} {"train_loss": -40.41862487792969, "global_step": 223371, "epoch": 1846} {"train_loss": -40.68953323364258, "global_step": 223372, "epoch": 1846} {"train_loss": -40.50883102416992, "global_step": 223373, "epoch": 1846} {"train_loss": -40.998626708984375, "global_step": 223374, "epoch": 1846} {"train_loss": -40.44511795043945, "global_step": 223375, "epoch": 1846} {"train_loss": -40.42179489135742, "global_step": 223376, "epoch": 1846} {"train_loss": -41.24789810180664, "global_step": 223377, "epoch": 1846} {"train_loss": -40.1744270324707, "global_step": 223378, "epoch": 1846} {"train_loss": -40.42013931274414, "global_step": 223379, "epoch": 1846} {"train_loss": -40.639923095703125, "global_step": 223380, "epoch": 1846} {"train_loss": -40.46354293823242, "global_step": 223381, "epoch": 1846} {"train_loss": -41.09500503540039, "global_step": 223382, "epoch": 1846} {"train_loss": -40.624794006347656, "global_step": 223383, "epoch": 1846} {"train_loss": -40.97477722167969, "global_step": 223384, "epoch": 1846} {"train_loss": -40.68501663208008, "global_step": 223385, "epoch": 1846} {"train_loss": -40.067996978759766, "global_step": 223386, "epoch": 1846} {"train_loss": -40.613582611083984, "global_step": 223387, "epoch": 1846} {"train_loss": -41.3480339050293, "global_step": 223388, "epoch": 1846} {"train_loss": -40.12964630126953, "global_step": 223389, "epoch": 1846} {"train_loss": -41.85108184814453, "global_step": 223390, "epoch": 1846} {"train_loss": -40.60028839111328, "global_step": 223391, "epoch": 1846} {"train_loss": -39.900115966796875, "global_step": 223392, "epoch": 1846} {"train_loss": -40.92666244506836, "global_step": 223393, "epoch": 1846} {"train_loss": -41.12076950073242, "global_step": 223394, "epoch": 1846} {"train_loss": -41.232337951660156, "global_step": 223395, "epoch": 1846} {"train_loss": -40.868289947509766, "global_step": 223396, "epoch": 1846} {"train_loss": -40.82501220703125, "global_step": 223397, "epoch": 1846} {"train_loss": -41.49267578125, "global_step": 223398, "epoch": 1846} {"train_loss": -41.0361328125, "global_step": 223399, "epoch": 1846} {"train_loss": -40.8974609375, "global_step": 223400, "epoch": 1846} {"train_loss": -40.77979278564453, "global_step": 223401, "epoch": 1846} {"train_loss": -41.086708068847656, "global_step": 223402, "epoch": 1846} {"train_loss": -41.56781768798828, "global_step": 223403, "epoch": 1846} {"train_loss": -41.039710998535156, "global_step": 223404, "epoch": 1846} {"train_loss": -41.10301208496094, "global_step": 223405, "epoch": 1846} {"train_loss": -41.85451889038086, "global_step": 223406, "epoch": 1846} {"train_loss": -41.089759826660156, "global_step": 223407, "epoch": 1846} {"train_loss": -41.5909538269043, "global_step": 223408, "epoch": 1846} {"train_loss": -40.60701370239258, "global_step": 223409, "epoch": 1846} {"train_loss": -41.854217529296875, "global_step": 223410, "epoch": 1846} {"train_loss": -41.69757080078125, "global_step": 223411, "epoch": 1846} {"train_loss": -41.96486282348633, "global_step": 223412, "epoch": 1846} {"train_loss": -41.83637619018555, "global_step": 223413, "epoch": 1846} {"train_loss": -41.8067741394043, "global_step": 223414, "epoch": 1846} {"train_loss": -41.266387939453125, "global_step": 223415, "epoch": 1846} {"train_loss": -41.12393569946289, "global_step": 223416, "epoch": 1846} {"train_loss": -41.7982292175293, "global_step": 223417, "epoch": 1846} {"train_loss": -41.51617431640625, "global_step": 223418, "epoch": 1846} {"train_loss": -41.322608947753906, "global_step": 223419, "epoch": 1846} {"train_loss": -40.70015335083008, "global_step": 223420, "epoch": 1846} {"train_loss": -41.71042251586914, "global_step": 223421, "epoch": 1846} {"train_loss": -41.97291946411133, "global_step": 223422, "epoch": 1846} {"train_loss": -40.624202728271484, "global_step": 223423, "epoch": 1846} {"train_loss": -42.06779861450195, "global_step": 223424, "epoch": 1846} {"train_loss": -40.4771614074707, "global_step": 223425, "epoch": 1846} {"train_loss": -40.52180099487305, "global_step": 223426, "epoch": 1846} {"train_loss": -41.15810775756836, "global_step": 223427, "epoch": 1846} {"train_loss": -40.514766693115234, "global_step": 223428, "epoch": 1846} {"train_loss": -40.86921310424805, "global_step": 223429, "epoch": 1846} {"train_loss": -38.81992721557617, "global_step": 223430, "epoch": 1846} {"train_loss": -33.437374114990234, "global_step": 223431, "epoch": 1846} {"train_loss": -29.742023468017578, "global_step": 223432, "epoch": 1846} {"train_loss": -33.222869873046875, "global_step": 223433, "epoch": 1846} {"train_loss": -37.294281005859375, "global_step": 223434, "epoch": 1846} {"train_loss": -37.23011016845703, "global_step": 223435, "epoch": 1846} {"train_loss": -35.39675521850586, "global_step": 223436, "epoch": 1846} {"train_loss": -31.194263458251953, "global_step": 223437, "epoch": 1846} {"train_loss": -34.10866928100586, "global_step": 223438, "epoch": 1846} {"train_loss": -24.763065338134766, "global_step": 223439, "epoch": 1846} {"train_loss": -23.141847610473633, "global_step": 223440, "epoch": 1846} {"train_loss": -34.1898193359375, "global_step": 223441, "epoch": 1846} {"train_loss": -37.6337890625, "global_step": 223442, "epoch": 1846} {"train_loss": -32.106658935546875, "global_step": 223443, "epoch": 1846} {"train_loss": -34.72199630737305, "global_step": 223444, "epoch": 1846} {"train_loss": -38.428863525390625, "global_step": 223445, "epoch": 1846} {"train_loss": -28.246103286743164, "global_step": 223446, "epoch": 1846} {"train_loss": -37.24280548095703, "global_step": 223447, "epoch": 1846} {"train_loss": -36.71158218383789, "global_step": 223448, "epoch": 1846} {"train_loss": -33.961421966552734, "global_step": 223449, "epoch": 1846} {"train_loss": -35.634796142578125, "global_step": 223450, "epoch": 1846} {"train_loss": -38.329383850097656, "global_step": 223451, "epoch": 1846} {"train_loss": -35.26177978515625, "global_step": 223452, "epoch": 1846} {"train_loss": -34.648033142089844, "global_step": 223453, "epoch": 1846} {"train_loss": -37.82133102416992, "global_step": 223454, "epoch": 1846} {"train_loss": -38.83238983154297, "global_step": 223455, "epoch": 1846} {"train_loss": -38.2510871887207, "global_step": 223456, "epoch": 1846} {"train_loss": -37.15727233886719, "global_step": 223457, "epoch": 1846} {"train_loss": -38.771724700927734, "global_step": 223458, "epoch": 1846} {"train_loss": -37.5223388671875, "global_step": 223459, "epoch": 1846} {"train_loss": -38.746803283691406, "global_step": 223460, "epoch": 1846} {"train_loss": -38.08885192871094, "global_step": 223461, "epoch": 1846} {"train_loss": -39.34843063354492, "global_step": 223462, "epoch": 1846} {"train_loss": -38.87329864501953, "global_step": 223463, "epoch": 1846} {"train_loss": -39.72690963745117, "global_step": 223464, "epoch": 1846} {"train_loss": -40.20331954956055, "global_step": 223465, "epoch": 1846} {"train_loss": -39.62162780761719, "global_step": 223466, "epoch": 1846} {"train_loss": -39.268428802490234, "global_step": 223467, "epoch": 1846} {"train_loss": -39.54330062866211, "global_step": 223468, "epoch": 1846} {"train_loss": -39.926666259765625, "global_step": 223469, "epoch": 1846} {"train_loss": -39.805843353271484, "global_step": 223470, "epoch": 1846} {"train_loss": -39.59690475463867, "global_step": 223471, "epoch": 1846} {"train_loss": -39.350032806396484, "global_step": 223472, "epoch": 1846} {"train_loss": -40.31588363647461, "global_step": 223473, "epoch": 1846} {"train_loss": -39.099117279052734, "global_step": 223474, "epoch": 1846} {"train_loss": -39.69203567504883, "global_step": 223475, "epoch": 1846} {"train_loss": -40.26332473754883, "global_step": 223476, "epoch": 1846} {"train_loss": -39.71084213256836, "global_step": 223477, "epoch": 1846} {"train_loss": -39.97737503051758, "global_step": 223478, "epoch": 1846} {"train_loss": -40.24431228637695, "global_step": 223479, "epoch": 1846} {"train_loss": -40.073463439941406, "global_step": 223480, "epoch": 1846} {"train_loss": -40.67973709106445, "global_step": 223481, "epoch": 1846} {"train_loss": -40.64187240600586, "global_step": 223482, "epoch": 1846} {"train_loss": -40.192623138427734, "global_step": 223483, "epoch": 1846} {"train_loss": -40.200538635253906, "global_step": 223484, "epoch": 1846} {"train_loss": -40.24708938598633, "global_step": 223485, "epoch": 1846} {"train_loss": -39.19022873807545, "global_step": 223486, "epoch": 1846, "val_loss": 2615025.75} {"train_loss": -40.2364501953125, "global_step": 223487, "epoch": 1847} {"train_loss": -40.94472122192383, "global_step": 223488, "epoch": 1847} {"train_loss": -40.2959098815918, "global_step": 223489, "epoch": 1847} {"train_loss": -40.66718292236328, "global_step": 223490, "epoch": 1847} {"train_loss": -40.78618240356445, "global_step": 223491, "epoch": 1847} {"train_loss": -40.49605178833008, "global_step": 223492, "epoch": 1847} {"train_loss": -40.959529876708984, "global_step": 223493, "epoch": 1847} {"train_loss": -39.91316604614258, "global_step": 223494, "epoch": 1847} {"train_loss": -41.09357452392578, "global_step": 223495, "epoch": 1847} {"train_loss": -40.786163330078125, "global_step": 223496, "epoch": 1847} {"train_loss": -40.89054489135742, "global_step": 223497, "epoch": 1847} {"train_loss": -41.41957092285156, "global_step": 223498, "epoch": 1847} {"train_loss": -41.14863204956055, "global_step": 223499, "epoch": 1847} {"train_loss": -41.48577880859375, "global_step": 223500, "epoch": 1847} {"train_loss": -41.21139144897461, "global_step": 223501, "epoch": 1847} {"train_loss": -41.30467987060547, "global_step": 223502, "epoch": 1847} {"train_loss": -41.43036651611328, "global_step": 223503, "epoch": 1847} {"train_loss": -41.538509368896484, "global_step": 223504, "epoch": 1847} {"train_loss": -40.7634162902832, "global_step": 223505, "epoch": 1847} {"train_loss": -41.61553192138672, "global_step": 223506, "epoch": 1847} {"train_loss": -41.2081184387207, "global_step": 223507, "epoch": 1847} {"train_loss": -41.7395133972168, "global_step": 223508, "epoch": 1847} {"train_loss": -41.27880859375, "global_step": 223509, "epoch": 1847} {"train_loss": -41.78902816772461, "global_step": 223510, "epoch": 1847} {"train_loss": -41.61861801147461, "global_step": 223511, "epoch": 1847} {"train_loss": -41.50703430175781, "global_step": 223512, "epoch": 1847} {"train_loss": -41.938507080078125, "global_step": 223513, "epoch": 1847} {"train_loss": -41.904090881347656, "global_step": 223514, "epoch": 1847} {"train_loss": -41.96706008911133, "global_step": 223515, "epoch": 1847} {"train_loss": -41.9857292175293, "global_step": 223516, "epoch": 1847} {"train_loss": -41.6324462890625, "global_step": 223517, "epoch": 1847} {"train_loss": -41.74971008300781, "global_step": 223518, "epoch": 1847} {"train_loss": -42.20615005493164, "global_step": 223519, "epoch": 1847} {"train_loss": -41.7653694152832, "global_step": 223520, "epoch": 1847} {"train_loss": -41.6452751159668, "global_step": 223521, "epoch": 1847} {"train_loss": -40.127986907958984, "global_step": 223522, "epoch": 1847} {"train_loss": -41.63523864746094, "global_step": 223523, "epoch": 1847} {"train_loss": -41.86550521850586, "global_step": 223524, "epoch": 1847} {"train_loss": -40.40642547607422, "global_step": 223525, "epoch": 1847} {"train_loss": -41.36110305786133, "global_step": 223526, "epoch": 1847} {"train_loss": -41.01790237426758, "global_step": 223527, "epoch": 1847} {"train_loss": -41.02546310424805, "global_step": 223528, "epoch": 1847} {"train_loss": -37.1823844909668, "global_step": 223529, "epoch": 1847} {"train_loss": -41.9650764465332, "global_step": 223530, "epoch": 1847} {"train_loss": -42.06235885620117, "global_step": 223531, "epoch": 1847} {"train_loss": -40.9953498840332, "global_step": 223532, "epoch": 1847} {"train_loss": -40.152565002441406, "global_step": 223533, "epoch": 1847} {"train_loss": -40.09929275512695, "global_step": 223534, "epoch": 1847} {"train_loss": -41.685665130615234, "global_step": 223535, "epoch": 1847} {"train_loss": -41.00710678100586, "global_step": 223536, "epoch": 1847} {"train_loss": -41.31964111328125, "global_step": 223537, "epoch": 1847} {"train_loss": -41.710140228271484, "global_step": 223538, "epoch": 1847} {"train_loss": -40.61478805541992, "global_step": 223539, "epoch": 1847} {"train_loss": -41.74531173706055, "global_step": 223540, "epoch": 1847} {"train_loss": -41.47673416137695, "global_step": 223541, "epoch": 1847} {"train_loss": -42.09051513671875, "global_step": 223542, "epoch": 1847} {"train_loss": -41.36256790161133, "global_step": 223543, "epoch": 1847} {"train_loss": -41.55143356323242, "global_step": 223544, "epoch": 1847} {"train_loss": -41.7648811340332, "global_step": 223545, "epoch": 1847} {"train_loss": -41.913787841796875, "global_step": 223546, "epoch": 1847} {"train_loss": -40.50088119506836, "global_step": 223547, "epoch": 1847} {"train_loss": -30.717121124267578, "global_step": 223548, "epoch": 1847} {"train_loss": -41.6643180847168, "global_step": 223549, "epoch": 1847} {"train_loss": -41.0648078918457, "global_step": 223550, "epoch": 1847} {"train_loss": -39.107460021972656, "global_step": 223551, "epoch": 1847} {"train_loss": -41.37671661376953, "global_step": 223552, "epoch": 1847} {"train_loss": -41.907772064208984, "global_step": 223553, "epoch": 1847} {"train_loss": -41.24448776245117, "global_step": 223554, "epoch": 1847} {"train_loss": -37.73805236816406, "global_step": 223555, "epoch": 1847} {"train_loss": -27.77411460876465, "global_step": 223556, "epoch": 1847} {"train_loss": -40.87665939331055, "global_step": 223557, "epoch": 1847} {"train_loss": -41.157772064208984, "global_step": 223558, "epoch": 1847} {"train_loss": -36.86459732055664, "global_step": 223559, "epoch": 1847} {"train_loss": -37.81524658203125, "global_step": 223560, "epoch": 1847} {"train_loss": -37.997833251953125, "global_step": 223561, "epoch": 1847} {"train_loss": -33.30279541015625, "global_step": 223562, "epoch": 1847} {"train_loss": -34.64805221557617, "global_step": 223563, "epoch": 1847} {"train_loss": -39.278011322021484, "global_step": 223564, "epoch": 1847} {"train_loss": -40.0127067565918, "global_step": 223565, "epoch": 1847} {"train_loss": -38.346900939941406, "global_step": 223566, "epoch": 1847} {"train_loss": -39.930381774902344, "global_step": 223567, "epoch": 1847} {"train_loss": -38.4718132019043, "global_step": 223568, "epoch": 1847} {"train_loss": -39.07767105102539, "global_step": 223569, "epoch": 1847} {"train_loss": -40.21528244018555, "global_step": 223570, "epoch": 1847} {"train_loss": -38.203861236572266, "global_step": 223571, "epoch": 1847} {"train_loss": -38.87568664550781, "global_step": 223572, "epoch": 1847} {"train_loss": -40.13065719604492, "global_step": 223573, "epoch": 1847} {"train_loss": -39.566261291503906, "global_step": 223574, "epoch": 1847} {"train_loss": -40.61465072631836, "global_step": 223575, "epoch": 1847} {"train_loss": -36.639041900634766, "global_step": 223576, "epoch": 1847} {"train_loss": -38.228511810302734, "global_step": 223577, "epoch": 1847} {"train_loss": -40.84100341796875, "global_step": 223578, "epoch": 1847} {"train_loss": -40.87617111206055, "global_step": 223579, "epoch": 1847} {"train_loss": -36.86176681518555, "global_step": 223580, "epoch": 1847} {"train_loss": -39.9937629699707, "global_step": 223581, "epoch": 1847} {"train_loss": -38.88270950317383, "global_step": 223582, "epoch": 1847} {"train_loss": -40.6576042175293, "global_step": 223583, "epoch": 1847} {"train_loss": -40.61591720581055, "global_step": 223584, "epoch": 1847} {"train_loss": -40.052581787109375, "global_step": 223585, "epoch": 1847} {"train_loss": -39.37457275390625, "global_step": 223586, "epoch": 1847} {"train_loss": -39.84465408325195, "global_step": 223587, "epoch": 1847} {"train_loss": -40.47124099731445, "global_step": 223588, "epoch": 1847} {"train_loss": -40.12313461303711, "global_step": 223589, "epoch": 1847} {"train_loss": -40.58740234375, "global_step": 223590, "epoch": 1847} {"train_loss": -39.49064636230469, "global_step": 223591, "epoch": 1847} {"train_loss": -35.827999114990234, "global_step": 223592, "epoch": 1847} {"train_loss": -40.59996795654297, "global_step": 223593, "epoch": 1847} {"train_loss": -40.58546447753906, "global_step": 223594, "epoch": 1847} {"train_loss": -40.08332061767578, "global_step": 223595, "epoch": 1847} {"train_loss": -39.7548828125, "global_step": 223596, "epoch": 1847} {"train_loss": -40.5728759765625, "global_step": 223597, "epoch": 1847} {"train_loss": -40.8825569152832, "global_step": 223598, "epoch": 1847} {"train_loss": -40.968021392822266, "global_step": 223599, "epoch": 1847} {"train_loss": -40.833839416503906, "global_step": 223600, "epoch": 1847} {"train_loss": -41.28731918334961, "global_step": 223601, "epoch": 1847} {"train_loss": -41.27962875366211, "global_step": 223602, "epoch": 1847} {"train_loss": -40.22602462768555, "global_step": 223603, "epoch": 1847} {"train_loss": -40.622920989990234, "global_step": 223604, "epoch": 1847} {"train_loss": -39.77183151245117, "global_step": 223605, "epoch": 1847} {"train_loss": -39.257537841796875, "global_step": 223606, "epoch": 1847} {"train_loss": -40.238913528190174, "global_step": 223607, "epoch": 1847, "val_loss": 2454545.75} {"train_loss": -39.329833984375, "global_step": 223608, "epoch": 1848} {"train_loss": -41.58783721923828, "global_step": 223609, "epoch": 1848} {"train_loss": -39.056880950927734, "global_step": 223610, "epoch": 1848} {"train_loss": -41.55222702026367, "global_step": 223611, "epoch": 1848} {"train_loss": -41.2015266418457, "global_step": 223612, "epoch": 1848} {"train_loss": -41.13554763793945, "global_step": 223613, "epoch": 1848} {"train_loss": -41.10380935668945, "global_step": 223614, "epoch": 1848} {"train_loss": -41.538124084472656, "global_step": 223615, "epoch": 1848} {"train_loss": -40.57718276977539, "global_step": 223616, "epoch": 1848} {"train_loss": -40.411964416503906, "global_step": 223617, "epoch": 1848} {"train_loss": -39.83797073364258, "global_step": 223618, "epoch": 1848} {"train_loss": -40.9732551574707, "global_step": 223619, "epoch": 1848} {"train_loss": -41.3953742980957, "global_step": 223620, "epoch": 1848} {"train_loss": -41.049293518066406, "global_step": 223621, "epoch": 1848} {"train_loss": -40.95571517944336, "global_step": 223622, "epoch": 1848} {"train_loss": -40.99254608154297, "global_step": 223623, "epoch": 1848} {"train_loss": -41.72391891479492, "global_step": 223624, "epoch": 1848} {"train_loss": -40.926937103271484, "global_step": 223625, "epoch": 1848} {"train_loss": -41.70003128051758, "global_step": 223626, "epoch": 1848} {"train_loss": -40.9441032409668, "global_step": 223627, "epoch": 1848} {"train_loss": -41.608882904052734, "global_step": 223628, "epoch": 1848} {"train_loss": -41.430908203125, "global_step": 223629, "epoch": 1848} {"train_loss": -38.45455551147461, "global_step": 223630, "epoch": 1848} {"train_loss": -41.22298049926758, "global_step": 223631, "epoch": 1848} {"train_loss": -41.252716064453125, "global_step": 223632, "epoch": 1848} {"train_loss": -40.20211410522461, "global_step": 223633, "epoch": 1848} {"train_loss": -40.6939697265625, "global_step": 223634, "epoch": 1848} {"train_loss": -40.755435943603516, "global_step": 223635, "epoch": 1848} {"train_loss": -40.47419357299805, "global_step": 223636, "epoch": 1848} {"train_loss": -40.532936096191406, "global_step": 223637, "epoch": 1848} {"train_loss": -40.382057189941406, "global_step": 223638, "epoch": 1848} {"train_loss": -41.371238708496094, "global_step": 223639, "epoch": 1848} {"train_loss": -39.490596771240234, "global_step": 223640, "epoch": 1848} {"train_loss": -40.139286041259766, "global_step": 223641, "epoch": 1848} {"train_loss": -40.576148986816406, "global_step": 223642, "epoch": 1848} {"train_loss": -42.058868408203125, "global_step": 223643, "epoch": 1848} {"train_loss": -41.078704833984375, "global_step": 223644, "epoch": 1848} {"train_loss": -38.199344635009766, "global_step": 223645, "epoch": 1848} {"train_loss": -41.85921096801758, "global_step": 223646, "epoch": 1848} {"train_loss": -41.83810806274414, "global_step": 223647, "epoch": 1848} {"train_loss": -41.5118522644043, "global_step": 223648, "epoch": 1848} {"train_loss": -41.63441848754883, "global_step": 223649, "epoch": 1848} {"train_loss": -41.10246658325195, "global_step": 223650, "epoch": 1848} {"train_loss": -41.8171501159668, "global_step": 223651, "epoch": 1848} {"train_loss": -40.65917205810547, "global_step": 223652, "epoch": 1848} {"train_loss": -41.70343780517578, "global_step": 223653, "epoch": 1848} {"train_loss": -41.917022705078125, "global_step": 223654, "epoch": 1848} {"train_loss": -41.25912857055664, "global_step": 223655, "epoch": 1848} {"train_loss": -41.487098693847656, "global_step": 223656, "epoch": 1848} {"train_loss": -40.48695755004883, "global_step": 223657, "epoch": 1848} {"train_loss": -41.41671371459961, "global_step": 223658, "epoch": 1848} {"train_loss": -40.65278625488281, "global_step": 223659, "epoch": 1848} {"train_loss": -38.885841369628906, "global_step": 223660, "epoch": 1848} {"train_loss": -41.38496780395508, "global_step": 223661, "epoch": 1848} {"train_loss": -40.53739547729492, "global_step": 223662, "epoch": 1848} {"train_loss": -40.18805694580078, "global_step": 223663, "epoch": 1848} {"train_loss": -39.52119064331055, "global_step": 223664, "epoch": 1848} {"train_loss": -40.79888916015625, "global_step": 223665, "epoch": 1848} {"train_loss": -41.57021713256836, "global_step": 223666, "epoch": 1848} {"train_loss": -41.457862854003906, "global_step": 223667, "epoch": 1848} {"train_loss": -40.60089111328125, "global_step": 223668, "epoch": 1848} {"train_loss": -40.3267822265625, "global_step": 223669, "epoch": 1848} {"train_loss": -40.058345794677734, "global_step": 223670, "epoch": 1848} {"train_loss": -39.25503921508789, "global_step": 223671, "epoch": 1848} {"train_loss": -38.59275436401367, "global_step": 223672, "epoch": 1848} {"train_loss": -38.76312255859375, "global_step": 223673, "epoch": 1848} {"train_loss": -40.4467887878418, "global_step": 223674, "epoch": 1848} {"train_loss": -40.526920318603516, "global_step": 223675, "epoch": 1848} {"train_loss": -38.44449234008789, "global_step": 223676, "epoch": 1848} {"train_loss": -39.753456115722656, "global_step": 223677, "epoch": 1848} {"train_loss": -41.20711135864258, "global_step": 223678, "epoch": 1848} {"train_loss": -41.1928596496582, "global_step": 223679, "epoch": 1848} {"train_loss": -38.6613655090332, "global_step": 223680, "epoch": 1848} {"train_loss": -40.20785140991211, "global_step": 223681, "epoch": 1848} {"train_loss": -41.1518669128418, "global_step": 223682, "epoch": 1848} {"train_loss": -40.13658142089844, "global_step": 223683, "epoch": 1848} {"train_loss": -38.73030090332031, "global_step": 223684, "epoch": 1848} {"train_loss": -41.06882858276367, "global_step": 223685, "epoch": 1848} {"train_loss": -39.577796936035156, "global_step": 223686, "epoch": 1848} {"train_loss": -39.94584655761719, "global_step": 223687, "epoch": 1848} {"train_loss": -40.38446044921875, "global_step": 223688, "epoch": 1848} {"train_loss": -40.0673713684082, "global_step": 223689, "epoch": 1848} {"train_loss": -40.09304428100586, "global_step": 223690, "epoch": 1848} {"train_loss": -41.18686294555664, "global_step": 223691, "epoch": 1848} {"train_loss": -40.289039611816406, "global_step": 223692, "epoch": 1848} {"train_loss": -40.18915939331055, "global_step": 223693, "epoch": 1848} {"train_loss": -40.191192626953125, "global_step": 223694, "epoch": 1848} {"train_loss": -40.165348052978516, "global_step": 223695, "epoch": 1848} {"train_loss": -40.89043045043945, "global_step": 223696, "epoch": 1848} {"train_loss": -40.24034881591797, "global_step": 223697, "epoch": 1848} {"train_loss": -40.96464920043945, "global_step": 223698, "epoch": 1848} {"train_loss": -40.32814407348633, "global_step": 223699, "epoch": 1848} {"train_loss": -40.61281967163086, "global_step": 223700, "epoch": 1848} {"train_loss": -41.477325439453125, "global_step": 223701, "epoch": 1848} {"train_loss": -40.8884391784668, "global_step": 223702, "epoch": 1848} {"train_loss": -40.76176452636719, "global_step": 223703, "epoch": 1848} {"train_loss": -40.994327545166016, "global_step": 223704, "epoch": 1848} {"train_loss": -39.38556671142578, "global_step": 223705, "epoch": 1848} {"train_loss": -41.361602783203125, "global_step": 223706, "epoch": 1848} {"train_loss": -40.60438919067383, "global_step": 223707, "epoch": 1848} {"train_loss": -41.22285842895508, "global_step": 223708, "epoch": 1848} {"train_loss": -41.18959426879883, "global_step": 223709, "epoch": 1848} {"train_loss": -41.352115631103516, "global_step": 223710, "epoch": 1848} {"train_loss": -41.68922424316406, "global_step": 223711, "epoch": 1848} {"train_loss": -41.19424057006836, "global_step": 223712, "epoch": 1848} {"train_loss": -40.731048583984375, "global_step": 223713, "epoch": 1848} {"train_loss": -41.51375961303711, "global_step": 223714, "epoch": 1848} {"train_loss": -41.602561950683594, "global_step": 223715, "epoch": 1848} {"train_loss": -41.438819885253906, "global_step": 223716, "epoch": 1848} {"train_loss": -41.69569778442383, "global_step": 223717, "epoch": 1848} {"train_loss": -41.406307220458984, "global_step": 223718, "epoch": 1848} {"train_loss": -41.45241928100586, "global_step": 223719, "epoch": 1848} {"train_loss": -41.92538070678711, "global_step": 223720, "epoch": 1848} {"train_loss": -41.06099319458008, "global_step": 223721, "epoch": 1848} {"train_loss": -41.895408630371094, "global_step": 223722, "epoch": 1848} {"train_loss": -42.211212158203125, "global_step": 223723, "epoch": 1848} {"train_loss": -41.634883880615234, "global_step": 223724, "epoch": 1848} {"train_loss": -42.318092346191406, "global_step": 223725, "epoch": 1848} {"train_loss": -42.04667282104492, "global_step": 223726, "epoch": 1848} {"train_loss": -41.970272064208984, "global_step": 223727, "epoch": 1848} {"train_loss": -40.78701693952576, "global_step": 223728, "epoch": 1848, "val_loss": 2466877.25} {"train_loss": -41.76464080810547, "global_step": 223729, "epoch": 1849} {"train_loss": -42.14045333862305, "global_step": 223730, "epoch": 1849} {"train_loss": -41.927978515625, "global_step": 223731, "epoch": 1849} {"train_loss": -41.41953659057617, "global_step": 223732, "epoch": 1849} {"train_loss": -42.37409591674805, "global_step": 223733, "epoch": 1849} {"train_loss": -41.006771087646484, "global_step": 223734, "epoch": 1849} {"train_loss": -41.22519302368164, "global_step": 223735, "epoch": 1849} {"train_loss": -42.440895080566406, "global_step": 223736, "epoch": 1849} {"train_loss": -41.764827728271484, "global_step": 223737, "epoch": 1849} {"train_loss": -41.50517272949219, "global_step": 223738, "epoch": 1849} {"train_loss": -41.46625900268555, "global_step": 223739, "epoch": 1849} {"train_loss": -41.69545364379883, "global_step": 223740, "epoch": 1849} {"train_loss": -41.41980743408203, "global_step": 223741, "epoch": 1849} {"train_loss": -38.905784606933594, "global_step": 223742, "epoch": 1849} {"train_loss": -39.438392639160156, "global_step": 223743, "epoch": 1849} {"train_loss": -40.76241683959961, "global_step": 223744, "epoch": 1849} {"train_loss": -40.74564743041992, "global_step": 223745, "epoch": 1849} {"train_loss": -41.674922943115234, "global_step": 223746, "epoch": 1849} {"train_loss": -39.38656997680664, "global_step": 223747, "epoch": 1849} {"train_loss": -36.6848030090332, "global_step": 223748, "epoch": 1849} {"train_loss": -24.13882827758789, "global_step": 223749, "epoch": 1849} {"train_loss": -22.179248809814453, "global_step": 223750, "epoch": 1849} {"train_loss": -38.44573974609375, "global_step": 223751, "epoch": 1849} {"train_loss": -35.22787094116211, "global_step": 223752, "epoch": 1849} {"train_loss": -28.8437442779541, "global_step": 223753, "epoch": 1849} {"train_loss": -40.53407287597656, "global_step": 223754, "epoch": 1849} {"train_loss": -30.471899032592773, "global_step": 223755, "epoch": 1849} {"train_loss": -35.09461212158203, "global_step": 223756, "epoch": 1849} {"train_loss": -33.42860794067383, "global_step": 223757, "epoch": 1849} {"train_loss": -32.96497344970703, "global_step": 223758, "epoch": 1849} {"train_loss": -35.46736145019531, "global_step": 223759, "epoch": 1849} {"train_loss": -32.26134490966797, "global_step": 223760, "epoch": 1849} {"train_loss": -37.4130859375, "global_step": 223761, "epoch": 1849} {"train_loss": -37.86789321899414, "global_step": 223762, "epoch": 1849} {"train_loss": -35.46803283691406, "global_step": 223763, "epoch": 1849} {"train_loss": -39.229331970214844, "global_step": 223764, "epoch": 1849} {"train_loss": -36.9958381652832, "global_step": 223765, "epoch": 1849} {"train_loss": -39.442176818847656, "global_step": 223766, "epoch": 1849} {"train_loss": -38.06940841674805, "global_step": 223767, "epoch": 1849} {"train_loss": -38.074134826660156, "global_step": 223768, "epoch": 1849} {"train_loss": -38.718605041503906, "global_step": 223769, "epoch": 1849} {"train_loss": -38.4736442565918, "global_step": 223770, "epoch": 1849} {"train_loss": -38.777408599853516, "global_step": 223771, "epoch": 1849} {"train_loss": -39.03280258178711, "global_step": 223772, "epoch": 1849} {"train_loss": -39.7540283203125, "global_step": 223773, "epoch": 1849} {"train_loss": -39.73038101196289, "global_step": 223774, "epoch": 1849} {"train_loss": -40.412879943847656, "global_step": 223775, "epoch": 1849} {"train_loss": -39.075775146484375, "global_step": 223776, "epoch": 1849} {"train_loss": -40.05585861206055, "global_step": 223777, "epoch": 1849} {"train_loss": -40.1132926940918, "global_step": 223778, "epoch": 1849} {"train_loss": -39.8526611328125, "global_step": 223779, "epoch": 1849} {"train_loss": -40.80638122558594, "global_step": 223780, "epoch": 1849} {"train_loss": -40.022579193115234, "global_step": 223781, "epoch": 1849} {"train_loss": -40.244293212890625, "global_step": 223782, "epoch": 1849} {"train_loss": -40.767860412597656, "global_step": 223783, "epoch": 1849} {"train_loss": -40.61202621459961, "global_step": 223784, "epoch": 1849} {"train_loss": -40.728153228759766, "global_step": 223785, "epoch": 1849} {"train_loss": -40.56809616088867, "global_step": 223786, "epoch": 1849} {"train_loss": -41.31672286987305, "global_step": 223787, "epoch": 1849} {"train_loss": -41.067073822021484, "global_step": 223788, "epoch": 1849} {"train_loss": -41.15440368652344, "global_step": 223789, "epoch": 1849} {"train_loss": -41.085853576660156, "global_step": 223790, "epoch": 1849} {"train_loss": -39.53614807128906, "global_step": 223791, "epoch": 1849} {"train_loss": -40.82583236694336, "global_step": 223792, "epoch": 1849} {"train_loss": -41.4955940246582, "global_step": 223793, "epoch": 1849} {"train_loss": -41.25175857543945, "global_step": 223794, "epoch": 1849} {"train_loss": -40.458736419677734, "global_step": 223795, "epoch": 1849} {"train_loss": -40.56050109863281, "global_step": 223796, "epoch": 1849} {"train_loss": -41.20111083984375, "global_step": 223797, "epoch": 1849} {"train_loss": -41.349788665771484, "global_step": 223798, "epoch": 1849} {"train_loss": -40.694515228271484, "global_step": 223799, "epoch": 1849} {"train_loss": -40.54624557495117, "global_step": 223800, "epoch": 1849} {"train_loss": -41.41411590576172, "global_step": 223801, "epoch": 1849} {"train_loss": -41.02849197387695, "global_step": 223802, "epoch": 1849} {"train_loss": -41.250118255615234, "global_step": 223803, "epoch": 1849} {"train_loss": -41.22041702270508, "global_step": 223804, "epoch": 1849} {"train_loss": -41.05027389526367, "global_step": 223805, "epoch": 1849} {"train_loss": -41.84657669067383, "global_step": 223806, "epoch": 1849} {"train_loss": -41.38186264038086, "global_step": 223807, "epoch": 1849} {"train_loss": -41.9073371887207, "global_step": 223808, "epoch": 1849} {"train_loss": -41.95893478393555, "global_step": 223809, "epoch": 1849} {"train_loss": -41.84131622314453, "global_step": 223810, "epoch": 1849} {"train_loss": -42.04895782470703, "global_step": 223811, "epoch": 1849} {"train_loss": -41.877418518066406, "global_step": 223812, "epoch": 1849} {"train_loss": -41.78118896484375, "global_step": 223813, "epoch": 1849} {"train_loss": -41.523799896240234, "global_step": 223814, "epoch": 1849} {"train_loss": -42.040138244628906, "global_step": 223815, "epoch": 1849} {"train_loss": -41.229740142822266, "global_step": 223816, "epoch": 1849} {"train_loss": -41.71672439575195, "global_step": 223817, "epoch": 1849} {"train_loss": -41.9659309387207, "global_step": 223818, "epoch": 1849} {"train_loss": -42.03225326538086, "global_step": 223819, "epoch": 1849} {"train_loss": -40.32612228393555, "global_step": 223820, "epoch": 1849} {"train_loss": -41.8104248046875, "global_step": 223821, "epoch": 1849} {"train_loss": -41.88301467895508, "global_step": 223822, "epoch": 1849} {"train_loss": -41.67979049682617, "global_step": 223823, "epoch": 1849} {"train_loss": -37.79286575317383, "global_step": 223824, "epoch": 1849} {"train_loss": -41.39199447631836, "global_step": 223825, "epoch": 1849} {"train_loss": -41.75838851928711, "global_step": 223826, "epoch": 1849} {"train_loss": -40.675010681152344, "global_step": 223827, "epoch": 1849} {"train_loss": -39.29603576660156, "global_step": 223828, "epoch": 1849} {"train_loss": -40.15079879760742, "global_step": 223829, "epoch": 1849} {"train_loss": -40.808746337890625, "global_step": 223830, "epoch": 1849} {"train_loss": -41.3609619140625, "global_step": 223831, "epoch": 1849} {"train_loss": -40.79697799682617, "global_step": 223832, "epoch": 1849} {"train_loss": -39.63463592529297, "global_step": 223833, "epoch": 1849} {"train_loss": -40.870174407958984, "global_step": 223834, "epoch": 1849} {"train_loss": -41.13411331176758, "global_step": 223835, "epoch": 1849} {"train_loss": -40.801361083984375, "global_step": 223836, "epoch": 1849} {"train_loss": -38.85413360595703, "global_step": 223837, "epoch": 1849} {"train_loss": -41.30198287963867, "global_step": 223838, "epoch": 1849} {"train_loss": -38.901424407958984, "global_step": 223839, "epoch": 1849} {"train_loss": -35.6529655456543, "global_step": 223840, "epoch": 1849} {"train_loss": -39.78238296508789, "global_step": 223841, "epoch": 1849} {"train_loss": -33.84940719604492, "global_step": 223842, "epoch": 1849} {"train_loss": -40.48196029663086, "global_step": 223843, "epoch": 1849} {"train_loss": -31.49595069885254, "global_step": 223844, "epoch": 1849} {"train_loss": -33.994529724121094, "global_step": 223845, "epoch": 1849} {"train_loss": -35.2374382019043, "global_step": 223846, "epoch": 1849} {"train_loss": -33.96309280395508, "global_step": 223847, "epoch": 1849} {"train_loss": -27.134449005126953, "global_step": 223848, "epoch": 1849} {"train_loss": -39.2431068262778, "global_step": 223849, "epoch": 1849, "val_loss": 2491399.25} {"train_loss": -37.49612808227539, "global_step": 223850, "epoch": 1850} {"train_loss": -27.6716251373291, "global_step": 223851, "epoch": 1850} {"train_loss": -28.91731071472168, "global_step": 223852, "epoch": 1850} {"train_loss": -28.590057373046875, "global_step": 223853, "epoch": 1850} {"train_loss": -37.074161529541016, "global_step": 223854, "epoch": 1850} {"train_loss": -35.237098693847656, "global_step": 223855, "epoch": 1850} {"train_loss": -34.313480377197266, "global_step": 223856, "epoch": 1850} {"train_loss": -33.98756790161133, "global_step": 223857, "epoch": 1850} {"train_loss": -34.372623443603516, "global_step": 223858, "epoch": 1850} {"train_loss": -31.5369815826416, "global_step": 223859, "epoch": 1850} {"train_loss": -34.49188232421875, "global_step": 223860, "epoch": 1850} {"train_loss": -34.249088287353516, "global_step": 223861, "epoch": 1850} {"train_loss": -35.93052291870117, "global_step": 223862, "epoch": 1850} {"train_loss": -36.0258903503418, "global_step": 223863, "epoch": 1850} {"train_loss": -35.730506896972656, "global_step": 223864, "epoch": 1850} {"train_loss": -35.16366195678711, "global_step": 223865, "epoch": 1850} {"train_loss": -35.68606948852539, "global_step": 223866, "epoch": 1850} {"train_loss": -31.51727867126465, "global_step": 223867, "epoch": 1850} {"train_loss": -36.60441970825195, "global_step": 223868, "epoch": 1850} {"train_loss": -33.727630615234375, "global_step": 223869, "epoch": 1850} {"train_loss": -35.57244873046875, "global_step": 223870, "epoch": 1850} {"train_loss": -37.06352615356445, "global_step": 223871, "epoch": 1850} {"train_loss": -37.18323516845703, "global_step": 223872, "epoch": 1850} {"train_loss": -36.73726272583008, "global_step": 223873, "epoch": 1850} {"train_loss": -36.91249465942383, "global_step": 223874, "epoch": 1850} {"train_loss": -37.21876907348633, "global_step": 223875, "epoch": 1850} {"train_loss": -38.099674224853516, "global_step": 223876, "epoch": 1850} {"train_loss": -37.86334228515625, "global_step": 223877, "epoch": 1850} {"train_loss": -37.18886184692383, "global_step": 223878, "epoch": 1850} {"train_loss": -37.90840530395508, "global_step": 223879, "epoch": 1850} {"train_loss": -37.37015914916992, "global_step": 223880, "epoch": 1850} {"train_loss": -38.9525032043457, "global_step": 223881, "epoch": 1850} {"train_loss": -38.71855545043945, "global_step": 223882, "epoch": 1850} {"train_loss": -38.30312728881836, "global_step": 223883, "epoch": 1850} {"train_loss": -38.908599853515625, "global_step": 223884, "epoch": 1850} {"train_loss": -38.960933685302734, "global_step": 223885, "epoch": 1850} {"train_loss": -38.9066276550293, "global_step": 223886, "epoch": 1850} {"train_loss": -38.40704345703125, "global_step": 223887, "epoch": 1850} {"train_loss": -38.335906982421875, "global_step": 223888, "epoch": 1850} {"train_loss": -37.8554573059082, "global_step": 223889, "epoch": 1850} {"train_loss": -38.448944091796875, "global_step": 223890, "epoch": 1850} {"train_loss": -39.19125747680664, "global_step": 223891, "epoch": 1850} {"train_loss": -38.88800811767578, "global_step": 223892, "epoch": 1850} {"train_loss": -38.34572982788086, "global_step": 223893, "epoch": 1850} {"train_loss": -39.94916534423828, "global_step": 223894, "epoch": 1850} {"train_loss": -39.42991256713867, "global_step": 223895, "epoch": 1850} {"train_loss": -38.75954818725586, "global_step": 223896, "epoch": 1850} {"train_loss": -39.379032135009766, "global_step": 223897, "epoch": 1850} {"train_loss": -39.332603454589844, "global_step": 223898, "epoch": 1850} {"train_loss": -38.93044662475586, "global_step": 223899, "epoch": 1850} {"train_loss": -39.095314025878906, "global_step": 223900, "epoch": 1850} {"train_loss": -39.177711486816406, "global_step": 223901, "epoch": 1850} {"train_loss": -39.154624938964844, "global_step": 223902, "epoch": 1850} {"train_loss": -38.704524993896484, "global_step": 223903, "epoch": 1850} {"train_loss": -38.8736686706543, "global_step": 223904, "epoch": 1850} {"train_loss": -39.68467330932617, "global_step": 223905, "epoch": 1850} {"train_loss": -39.034698486328125, "global_step": 223906, "epoch": 1850} {"train_loss": -39.413387298583984, "global_step": 223907, "epoch": 1850} {"train_loss": -39.56809616088867, "global_step": 223908, "epoch": 1850} {"train_loss": -39.69426345825195, "global_step": 223909, "epoch": 1850} {"train_loss": -38.40777587890625, "global_step": 223910, "epoch": 1850} {"train_loss": -39.57722854614258, "global_step": 223911, "epoch": 1850} {"train_loss": -40.36134338378906, "global_step": 223912, "epoch": 1850} {"train_loss": -39.9537353515625, "global_step": 223913, "epoch": 1850} {"train_loss": -39.468563079833984, "global_step": 223914, "epoch": 1850} {"train_loss": -38.94398880004883, "global_step": 223915, "epoch": 1850} {"train_loss": -39.1087646484375, "global_step": 223916, "epoch": 1850} {"train_loss": -39.93336486816406, "global_step": 223917, "epoch": 1850} {"train_loss": -39.81229782104492, "global_step": 223918, "epoch": 1850} {"train_loss": -40.013427734375, "global_step": 223919, "epoch": 1850} {"train_loss": -39.90007781982422, "global_step": 223920, "epoch": 1850} {"train_loss": -39.68048858642578, "global_step": 223921, "epoch": 1850} {"train_loss": -39.59806442260742, "global_step": 223922, "epoch": 1850} {"train_loss": -40.252498626708984, "global_step": 223923, "epoch": 1850} {"train_loss": -39.92485046386719, "global_step": 223924, "epoch": 1850} {"train_loss": -40.20471954345703, "global_step": 223925, "epoch": 1850} {"train_loss": -40.40127944946289, "global_step": 223926, "epoch": 1850} {"train_loss": -40.45541000366211, "global_step": 223927, "epoch": 1850} {"train_loss": -39.80717468261719, "global_step": 223928, "epoch": 1850} {"train_loss": -40.61979675292969, "global_step": 223929, "epoch": 1850} {"train_loss": -40.33354949951172, "global_step": 223930, "epoch": 1850} {"train_loss": -39.82229232788086, "global_step": 223931, "epoch": 1850} {"train_loss": -38.44140625, "global_step": 223932, "epoch": 1850} {"train_loss": -40.78428268432617, "global_step": 223933, "epoch": 1850} {"train_loss": -37.19920349121094, "global_step": 223934, "epoch": 1850} {"train_loss": -39.558502197265625, "global_step": 223935, "epoch": 1850} {"train_loss": -39.89319610595703, "global_step": 223936, "epoch": 1850} {"train_loss": -39.88041305541992, "global_step": 223937, "epoch": 1850} {"train_loss": -38.73471450805664, "global_step": 223938, "epoch": 1850} {"train_loss": -38.729217529296875, "global_step": 223939, "epoch": 1850} {"train_loss": -39.92224884033203, "global_step": 223940, "epoch": 1850} {"train_loss": -39.18184280395508, "global_step": 223941, "epoch": 1850} {"train_loss": -39.1240119934082, "global_step": 223942, "epoch": 1850} {"train_loss": -40.287837982177734, "global_step": 223943, "epoch": 1850} {"train_loss": -39.799739837646484, "global_step": 223944, "epoch": 1850} {"train_loss": -40.37929916381836, "global_step": 223945, "epoch": 1850} {"train_loss": -39.96822738647461, "global_step": 223946, "epoch": 1850} {"train_loss": -39.665008544921875, "global_step": 223947, "epoch": 1850} {"train_loss": -38.22211837768555, "global_step": 223948, "epoch": 1850} {"train_loss": -40.00476837158203, "global_step": 223949, "epoch": 1850} {"train_loss": -40.256263732910156, "global_step": 223950, "epoch": 1850} {"train_loss": -40.820491790771484, "global_step": 223951, "epoch": 1850} {"train_loss": -38.218841552734375, "global_step": 223952, "epoch": 1850} {"train_loss": -39.33127975463867, "global_step": 223953, "epoch": 1850} {"train_loss": -40.552772521972656, "global_step": 223954, "epoch": 1850} {"train_loss": -40.19691848754883, "global_step": 223955, "epoch": 1850} {"train_loss": -39.7642936706543, "global_step": 223956, "epoch": 1850} {"train_loss": -40.38079071044922, "global_step": 223957, "epoch": 1850} {"train_loss": -40.25265121459961, "global_step": 223958, "epoch": 1850} {"train_loss": -40.13608932495117, "global_step": 223959, "epoch": 1850} {"train_loss": -40.48670196533203, "global_step": 223960, "epoch": 1850} {"train_loss": -40.27739334106445, "global_step": 223961, "epoch": 1850} {"train_loss": -40.236572265625, "global_step": 223962, "epoch": 1850} {"train_loss": -40.573570251464844, "global_step": 223963, "epoch": 1850} {"train_loss": -40.8509635925293, "global_step": 223964, "epoch": 1850} {"train_loss": -40.369136810302734, "global_step": 223965, "epoch": 1850} {"train_loss": -40.176734924316406, "global_step": 223966, "epoch": 1850} {"train_loss": -40.73860549926758, "global_step": 223967, "epoch": 1850} {"train_loss": -40.231754302978516, "global_step": 223968, "epoch": 1850} {"train_loss": -41.11046600341797, "global_step": 223969, "epoch": 1850} {"train_loss": -38.42613478731518, "global_step": 223970, "epoch": 1850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 0.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2481249.0} {"train_loss": -41.1396598815918, "global_step": 223971, "epoch": 1851} {"train_loss": -41.1947135925293, "global_step": 223972, "epoch": 1851} {"train_loss": -40.476654052734375, "global_step": 223973, "epoch": 1851} {"train_loss": -40.858638763427734, "global_step": 223974, "epoch": 1851} {"train_loss": -40.427581787109375, "global_step": 223975, "epoch": 1851} {"train_loss": -40.785091400146484, "global_step": 223976, "epoch": 1851} {"train_loss": -40.97126007080078, "global_step": 223977, "epoch": 1851} {"train_loss": -39.86643981933594, "global_step": 223978, "epoch": 1851} {"train_loss": -40.61124801635742, "global_step": 223979, "epoch": 1851} {"train_loss": -40.81354904174805, "global_step": 223980, "epoch": 1851} {"train_loss": -39.757991790771484, "global_step": 223981, "epoch": 1851} {"train_loss": -39.84001159667969, "global_step": 223982, "epoch": 1851} {"train_loss": -40.574241638183594, "global_step": 223983, "epoch": 1851} {"train_loss": -41.637001037597656, "global_step": 223984, "epoch": 1851} {"train_loss": -39.76429748535156, "global_step": 223985, "epoch": 1851} {"train_loss": -40.463016510009766, "global_step": 223986, "epoch": 1851} {"train_loss": -40.447509765625, "global_step": 223987, "epoch": 1851} {"train_loss": -40.98685836791992, "global_step": 223988, "epoch": 1851} {"train_loss": -40.82625961303711, "global_step": 223989, "epoch": 1851} {"train_loss": -41.26005172729492, "global_step": 223990, "epoch": 1851} {"train_loss": -40.943702697753906, "global_step": 223991, "epoch": 1851} {"train_loss": -41.171260833740234, "global_step": 223992, "epoch": 1851} {"train_loss": -40.40948486328125, "global_step": 223993, "epoch": 1851} {"train_loss": -40.71181106567383, "global_step": 223994, "epoch": 1851} {"train_loss": -41.26296615600586, "global_step": 223995, "epoch": 1851} {"train_loss": -40.377960205078125, "global_step": 223996, "epoch": 1851} {"train_loss": -41.375179290771484, "global_step": 223997, "epoch": 1851} {"train_loss": -41.211544036865234, "global_step": 223998, "epoch": 1851} {"train_loss": -41.85964584350586, "global_step": 223999, "epoch": 1851} {"train_loss": -41.0091438293457, "global_step": 224000, "epoch": 1851} {"train_loss": -41.590389251708984, "global_step": 224001, "epoch": 1851} {"train_loss": -41.8590087890625, "global_step": 224002, "epoch": 1851} {"train_loss": -41.517696380615234, "global_step": 224003, "epoch": 1851} {"train_loss": -41.52248764038086, "global_step": 224004, "epoch": 1851} {"train_loss": -40.434364318847656, "global_step": 224005, "epoch": 1851} {"train_loss": -40.20752716064453, "global_step": 224006, "epoch": 1851} {"train_loss": -41.41975021362305, "global_step": 224007, "epoch": 1851} {"train_loss": -41.94948959350586, "global_step": 224008, "epoch": 1851} {"train_loss": -41.24176025390625, "global_step": 224009, "epoch": 1851} {"train_loss": -41.39142990112305, "global_step": 224010, "epoch": 1851} {"train_loss": -40.932613372802734, "global_step": 224011, "epoch": 1851} {"train_loss": -41.868736267089844, "global_step": 224012, "epoch": 1851} {"train_loss": -41.22716522216797, "global_step": 224013, "epoch": 1851} {"train_loss": -42.056400299072266, "global_step": 224014, "epoch": 1851} {"train_loss": -41.925533294677734, "global_step": 224015, "epoch": 1851} {"train_loss": -40.6683464050293, "global_step": 224016, "epoch": 1851} {"train_loss": -41.0267219543457, "global_step": 224017, "epoch": 1851} {"train_loss": -40.392906188964844, "global_step": 224018, "epoch": 1851} {"train_loss": -40.17220687866211, "global_step": 224019, "epoch": 1851} {"train_loss": -37.94132995605469, "global_step": 224020, "epoch": 1851} {"train_loss": -38.36887741088867, "global_step": 224021, "epoch": 1851} {"train_loss": -37.662933349609375, "global_step": 224022, "epoch": 1851} {"train_loss": -39.15132522583008, "global_step": 224023, "epoch": 1851} {"train_loss": -40.9896125793457, "global_step": 224024, "epoch": 1851} {"train_loss": -40.47652053833008, "global_step": 224025, "epoch": 1851} {"train_loss": -40.659080505371094, "global_step": 224026, "epoch": 1851} {"train_loss": -41.12340545654297, "global_step": 224027, "epoch": 1851} {"train_loss": -41.049861907958984, "global_step": 224028, "epoch": 1851} {"train_loss": -40.430747985839844, "global_step": 224029, "epoch": 1851} {"train_loss": -40.462711334228516, "global_step": 224030, "epoch": 1851} {"train_loss": -41.80900955200195, "global_step": 224031, "epoch": 1851} {"train_loss": -40.50067901611328, "global_step": 224032, "epoch": 1851} {"train_loss": -39.472469329833984, "global_step": 224033, "epoch": 1851} {"train_loss": -41.21453094482422, "global_step": 224034, "epoch": 1851} {"train_loss": -41.43778610229492, "global_step": 224035, "epoch": 1851} {"train_loss": -40.0169792175293, "global_step": 224036, "epoch": 1851} {"train_loss": -40.55757522583008, "global_step": 224037, "epoch": 1851} {"train_loss": -40.88100814819336, "global_step": 224038, "epoch": 1851} {"train_loss": -39.65486145019531, "global_step": 224039, "epoch": 1851} {"train_loss": -41.27425765991211, "global_step": 224040, "epoch": 1851} {"train_loss": -41.382049560546875, "global_step": 224041, "epoch": 1851} {"train_loss": -38.98320770263672, "global_step": 224042, "epoch": 1851} {"train_loss": -40.141700744628906, "global_step": 224043, "epoch": 1851} {"train_loss": -40.82648849487305, "global_step": 224044, "epoch": 1851} {"train_loss": -39.494171142578125, "global_step": 224045, "epoch": 1851} {"train_loss": -40.34617614746094, "global_step": 224046, "epoch": 1851} {"train_loss": -40.69324493408203, "global_step": 224047, "epoch": 1851} {"train_loss": -40.75636672973633, "global_step": 224048, "epoch": 1851} {"train_loss": -40.620338439941406, "global_step": 224049, "epoch": 1851} {"train_loss": -40.591487884521484, "global_step": 224050, "epoch": 1851} {"train_loss": -41.08280563354492, "global_step": 224051, "epoch": 1851} {"train_loss": -41.61898422241211, "global_step": 224052, "epoch": 1851} {"train_loss": -41.89112854003906, "global_step": 224053, "epoch": 1851} {"train_loss": -41.53407669067383, "global_step": 224054, "epoch": 1851} {"train_loss": -41.2009162902832, "global_step": 224055, "epoch": 1851} {"train_loss": -41.60370635986328, "global_step": 224056, "epoch": 1851} {"train_loss": -41.51149368286133, "global_step": 224057, "epoch": 1851} {"train_loss": -37.979427337646484, "global_step": 224058, "epoch": 1851} {"train_loss": -42.132110595703125, "global_step": 224059, "epoch": 1851} {"train_loss": -41.42060089111328, "global_step": 224060, "epoch": 1851} {"train_loss": -40.937679290771484, "global_step": 224061, "epoch": 1851} {"train_loss": -41.26930618286133, "global_step": 224062, "epoch": 1851} {"train_loss": -41.17333984375, "global_step": 224063, "epoch": 1851} {"train_loss": -41.077335357666016, "global_step": 224064, "epoch": 1851} {"train_loss": -40.865028381347656, "global_step": 224065, "epoch": 1851} {"train_loss": -41.2216796875, "global_step": 224066, "epoch": 1851} {"train_loss": -40.828304290771484, "global_step": 224067, "epoch": 1851} {"train_loss": -41.6816520690918, "global_step": 224068, "epoch": 1851} {"train_loss": -41.82011795043945, "global_step": 224069, "epoch": 1851} {"train_loss": -41.95723342895508, "global_step": 224070, "epoch": 1851} {"train_loss": -40.26809310913086, "global_step": 224071, "epoch": 1851} {"train_loss": -41.308998107910156, "global_step": 224072, "epoch": 1851} {"train_loss": -41.289764404296875, "global_step": 224073, "epoch": 1851} {"train_loss": -38.56907272338867, "global_step": 224074, "epoch": 1851} {"train_loss": -37.77128219604492, "global_step": 224075, "epoch": 1851} {"train_loss": -41.60700607299805, "global_step": 224076, "epoch": 1851} {"train_loss": -41.52791976928711, "global_step": 224077, "epoch": 1851} {"train_loss": -40.46650314331055, "global_step": 224078, "epoch": 1851} {"train_loss": -40.22397994995117, "global_step": 224079, "epoch": 1851} {"train_loss": -39.60407638549805, "global_step": 224080, "epoch": 1851} {"train_loss": -42.03933334350586, "global_step": 224081, "epoch": 1851} {"train_loss": -40.897361755371094, "global_step": 224082, "epoch": 1851} {"train_loss": -40.61322784423828, "global_step": 224083, "epoch": 1851} {"train_loss": -40.84933090209961, "global_step": 224084, "epoch": 1851} {"train_loss": -40.66611862182617, "global_step": 224085, "epoch": 1851} {"train_loss": -41.50527572631836, "global_step": 224086, "epoch": 1851} {"train_loss": -41.17812728881836, "global_step": 224087, "epoch": 1851} {"train_loss": -40.51835632324219, "global_step": 224088, "epoch": 1851} {"train_loss": -42.198482513427734, "global_step": 224089, "epoch": 1851} {"train_loss": -40.10349655151367, "global_step": 224090, "epoch": 1851} {"train_loss": -40.78357270926483, "global_step": 224091, "epoch": 1851, "val_loss": 2548621.0} {"train_loss": -42.17405319213867, "global_step": 224092, "epoch": 1852} {"train_loss": -41.80343246459961, "global_step": 224093, "epoch": 1852} {"train_loss": -41.27457809448242, "global_step": 224094, "epoch": 1852} {"train_loss": -41.09623336791992, "global_step": 224095, "epoch": 1852} {"train_loss": -41.80859375, "global_step": 224096, "epoch": 1852} {"train_loss": -41.85906982421875, "global_step": 224097, "epoch": 1852} {"train_loss": -41.176963806152344, "global_step": 224098, "epoch": 1852} {"train_loss": -41.4821891784668, "global_step": 224099, "epoch": 1852} {"train_loss": -42.410377502441406, "global_step": 224100, "epoch": 1852} {"train_loss": -41.25169372558594, "global_step": 224101, "epoch": 1852} {"train_loss": -42.40594482421875, "global_step": 224102, "epoch": 1852} {"train_loss": -42.289276123046875, "global_step": 224103, "epoch": 1852} {"train_loss": -42.34114456176758, "global_step": 224104, "epoch": 1852} {"train_loss": -42.05708694458008, "global_step": 224105, "epoch": 1852} {"train_loss": -42.185115814208984, "global_step": 224106, "epoch": 1852} {"train_loss": -42.5752067565918, "global_step": 224107, "epoch": 1852} {"train_loss": -42.562530517578125, "global_step": 224108, "epoch": 1852} {"train_loss": -42.01277160644531, "global_step": 224109, "epoch": 1852} {"train_loss": -41.30031204223633, "global_step": 224110, "epoch": 1852} {"train_loss": -40.9874382019043, "global_step": 224111, "epoch": 1852} {"train_loss": -42.555904388427734, "global_step": 224112, "epoch": 1852} {"train_loss": -42.38895797729492, "global_step": 224113, "epoch": 1852} {"train_loss": -42.23729705810547, "global_step": 224114, "epoch": 1852} {"train_loss": -42.029052734375, "global_step": 224115, "epoch": 1852} {"train_loss": -42.256595611572266, "global_step": 224116, "epoch": 1852} {"train_loss": -42.029354095458984, "global_step": 224117, "epoch": 1852} {"train_loss": -42.24106979370117, "global_step": 224118, "epoch": 1852} {"train_loss": -42.55538558959961, "global_step": 224119, "epoch": 1852} {"train_loss": -41.82141876220703, "global_step": 224120, "epoch": 1852} {"train_loss": -42.3498420715332, "global_step": 224121, "epoch": 1852} {"train_loss": -42.26664352416992, "global_step": 224122, "epoch": 1852} {"train_loss": -42.498191833496094, "global_step": 224123, "epoch": 1852} {"train_loss": -41.46440505981445, "global_step": 224124, "epoch": 1852} {"train_loss": -42.74237060546875, "global_step": 224125, "epoch": 1852} {"train_loss": -42.515419006347656, "global_step": 224126, "epoch": 1852} {"train_loss": -42.88051223754883, "global_step": 224127, "epoch": 1852} {"train_loss": -42.696189880371094, "global_step": 224128, "epoch": 1852} {"train_loss": -42.824501037597656, "global_step": 224129, "epoch": 1852} {"train_loss": -42.466102600097656, "global_step": 224130, "epoch": 1852} {"train_loss": -42.506927490234375, "global_step": 224131, "epoch": 1852} {"train_loss": -42.4926872253418, "global_step": 224132, "epoch": 1852} {"train_loss": -41.612789154052734, "global_step": 224133, "epoch": 1852} {"train_loss": -42.26374435424805, "global_step": 224134, "epoch": 1852} {"train_loss": -42.88936996459961, "global_step": 224135, "epoch": 1852} {"train_loss": -42.8101692199707, "global_step": 224136, "epoch": 1852} {"train_loss": -42.75593185424805, "global_step": 224137, "epoch": 1852} {"train_loss": -42.755306243896484, "global_step": 224138, "epoch": 1852} {"train_loss": -41.522132873535156, "global_step": 224139, "epoch": 1852} {"train_loss": -41.75651931762695, "global_step": 224140, "epoch": 1852} {"train_loss": -40.50220489501953, "global_step": 224141, "epoch": 1852} {"train_loss": -37.64418411254883, "global_step": 224142, "epoch": 1852} {"train_loss": -37.88450622558594, "global_step": 224143, "epoch": 1852} {"train_loss": -39.45964431762695, "global_step": 224144, "epoch": 1852} {"train_loss": -41.32969284057617, "global_step": 224145, "epoch": 1852} {"train_loss": -39.241844177246094, "global_step": 224146, "epoch": 1852} {"train_loss": -34.46208572387695, "global_step": 224147, "epoch": 1852} {"train_loss": -37.558956146240234, "global_step": 224148, "epoch": 1852} {"train_loss": -39.29133987426758, "global_step": 224149, "epoch": 1852} {"train_loss": -37.39385986328125, "global_step": 224150, "epoch": 1852} {"train_loss": -40.184730529785156, "global_step": 224151, "epoch": 1852} {"train_loss": -39.46049499511719, "global_step": 224152, "epoch": 1852} {"train_loss": -35.894287109375, "global_step": 224153, "epoch": 1852} {"train_loss": -38.89503860473633, "global_step": 224154, "epoch": 1852} {"train_loss": -40.7376823425293, "global_step": 224155, "epoch": 1852} {"train_loss": -37.720157623291016, "global_step": 224156, "epoch": 1852} {"train_loss": -41.41958236694336, "global_step": 224157, "epoch": 1852} {"train_loss": -39.41752243041992, "global_step": 224158, "epoch": 1852} {"train_loss": -40.127357482910156, "global_step": 224159, "epoch": 1852} {"train_loss": -40.017513275146484, "global_step": 224160, "epoch": 1852} {"train_loss": -39.83028793334961, "global_step": 224161, "epoch": 1852} {"train_loss": -41.20452117919922, "global_step": 224162, "epoch": 1852} {"train_loss": -40.47309112548828, "global_step": 224163, "epoch": 1852} {"train_loss": -39.8423957824707, "global_step": 224164, "epoch": 1852} {"train_loss": -41.709171295166016, "global_step": 224165, "epoch": 1852} {"train_loss": -39.360260009765625, "global_step": 224166, "epoch": 1852} {"train_loss": -41.126747131347656, "global_step": 224167, "epoch": 1852} {"train_loss": -41.164791107177734, "global_step": 224168, "epoch": 1852} {"train_loss": -41.297943115234375, "global_step": 224169, "epoch": 1852} {"train_loss": -41.232513427734375, "global_step": 224170, "epoch": 1852} {"train_loss": -41.534603118896484, "global_step": 224171, "epoch": 1852} {"train_loss": -41.65187454223633, "global_step": 224172, "epoch": 1852} {"train_loss": -41.600990295410156, "global_step": 224173, "epoch": 1852} {"train_loss": -41.84641647338867, "global_step": 224174, "epoch": 1852} {"train_loss": -41.705238342285156, "global_step": 224175, "epoch": 1852} {"train_loss": -41.11362838745117, "global_step": 224176, "epoch": 1852} {"train_loss": -41.60333251953125, "global_step": 224177, "epoch": 1852} {"train_loss": -41.59599685668945, "global_step": 224178, "epoch": 1852} {"train_loss": -42.04448318481445, "global_step": 224179, "epoch": 1852} {"train_loss": -42.10128402709961, "global_step": 224180, "epoch": 1852} {"train_loss": -41.8487663269043, "global_step": 224181, "epoch": 1852} {"train_loss": -41.797340393066406, "global_step": 224182, "epoch": 1852} {"train_loss": -41.788291931152344, "global_step": 224183, "epoch": 1852} {"train_loss": -42.01806640625, "global_step": 224184, "epoch": 1852} {"train_loss": -41.55636978149414, "global_step": 224185, "epoch": 1852} {"train_loss": -41.99431228637695, "global_step": 224186, "epoch": 1852} {"train_loss": -42.2264518737793, "global_step": 224187, "epoch": 1852} {"train_loss": -42.004798889160156, "global_step": 224188, "epoch": 1852} {"train_loss": -42.22356033325195, "global_step": 224189, "epoch": 1852} {"train_loss": -41.745086669921875, "global_step": 224190, "epoch": 1852} {"train_loss": -41.78083038330078, "global_step": 224191, "epoch": 1852} {"train_loss": -39.952762603759766, "global_step": 224192, "epoch": 1852} {"train_loss": -39.3609504699707, "global_step": 224193, "epoch": 1852} {"train_loss": -39.46165084838867, "global_step": 224194, "epoch": 1852} {"train_loss": -41.87017822265625, "global_step": 224195, "epoch": 1852} {"train_loss": -41.55369186401367, "global_step": 224196, "epoch": 1852} {"train_loss": -40.509132385253906, "global_step": 224197, "epoch": 1852} {"train_loss": -41.187469482421875, "global_step": 224198, "epoch": 1852} {"train_loss": -41.28544616699219, "global_step": 224199, "epoch": 1852} {"train_loss": -38.676265716552734, "global_step": 224200, "epoch": 1852} {"train_loss": -41.52605438232422, "global_step": 224201, "epoch": 1852} {"train_loss": -40.764671325683594, "global_step": 224202, "epoch": 1852} {"train_loss": -41.07528305053711, "global_step": 224203, "epoch": 1852} {"train_loss": -41.680171966552734, "global_step": 224204, "epoch": 1852} {"train_loss": -40.93824768066406, "global_step": 224205, "epoch": 1852} {"train_loss": -40.72625732421875, "global_step": 224206, "epoch": 1852} {"train_loss": -40.87410354614258, "global_step": 224207, "epoch": 1852} {"train_loss": -41.68477249145508, "global_step": 224208, "epoch": 1852} {"train_loss": -40.217674255371094, "global_step": 224209, "epoch": 1852} {"train_loss": -41.60197830200195, "global_step": 224210, "epoch": 1852} {"train_loss": -42.24789047241211, "global_step": 224211, "epoch": 1852} {"train_loss": -41.216205849135214, "global_step": 224212, "epoch": 1852, "val_loss": 2489562.75} {"train_loss": -41.85451889038086, "global_step": 224213, "epoch": 1853} {"train_loss": -41.840450286865234, "global_step": 224214, "epoch": 1853} {"train_loss": -41.596885681152344, "global_step": 224215, "epoch": 1853} {"train_loss": -40.7900505065918, "global_step": 224216, "epoch": 1853} {"train_loss": -41.68832015991211, "global_step": 224217, "epoch": 1853} {"train_loss": -42.3908576965332, "global_step": 224218, "epoch": 1853} {"train_loss": -41.81492233276367, "global_step": 224219, "epoch": 1853} {"train_loss": -41.94882583618164, "global_step": 224220, "epoch": 1853} {"train_loss": -42.269100189208984, "global_step": 224221, "epoch": 1853} {"train_loss": -41.82802963256836, "global_step": 224222, "epoch": 1853} {"train_loss": -42.34326934814453, "global_step": 224223, "epoch": 1853} {"train_loss": -42.66837692260742, "global_step": 224224, "epoch": 1853} {"train_loss": -41.9824104309082, "global_step": 224225, "epoch": 1853} {"train_loss": -42.418575286865234, "global_step": 224226, "epoch": 1853} {"train_loss": -41.13068771362305, "global_step": 224227, "epoch": 1853} {"train_loss": -41.147708892822266, "global_step": 224228, "epoch": 1853} {"train_loss": -42.72940444946289, "global_step": 224229, "epoch": 1853} {"train_loss": -42.10436248779297, "global_step": 224230, "epoch": 1853} {"train_loss": -41.89674758911133, "global_step": 224231, "epoch": 1853} {"train_loss": -42.21628952026367, "global_step": 224232, "epoch": 1853} {"train_loss": -42.047420501708984, "global_step": 224233, "epoch": 1853} {"train_loss": -42.543636322021484, "global_step": 224234, "epoch": 1853} {"train_loss": -41.99112319946289, "global_step": 224235, "epoch": 1853} {"train_loss": -42.25484848022461, "global_step": 224236, "epoch": 1853} {"train_loss": -42.65262985229492, "global_step": 224237, "epoch": 1853} {"train_loss": -42.62005615234375, "global_step": 224238, "epoch": 1853} {"train_loss": -42.12238311767578, "global_step": 224239, "epoch": 1853} {"train_loss": -41.32529830932617, "global_step": 224240, "epoch": 1853} {"train_loss": -42.57643508911133, "global_step": 224241, "epoch": 1853} {"train_loss": -42.54610824584961, "global_step": 224242, "epoch": 1853} {"train_loss": -40.96201705932617, "global_step": 224243, "epoch": 1853} {"train_loss": -41.361610412597656, "global_step": 224244, "epoch": 1853} {"train_loss": -42.77234649658203, "global_step": 224245, "epoch": 1853} {"train_loss": -41.3912467956543, "global_step": 224246, "epoch": 1853} {"train_loss": -42.230079650878906, "global_step": 224247, "epoch": 1853} {"train_loss": -41.946346282958984, "global_step": 224248, "epoch": 1853} {"train_loss": -40.05998611450195, "global_step": 224249, "epoch": 1853} {"train_loss": -41.673858642578125, "global_step": 224250, "epoch": 1853} {"train_loss": -41.870582580566406, "global_step": 224251, "epoch": 1853} {"train_loss": -41.28791046142578, "global_step": 224252, "epoch": 1853} {"train_loss": -40.32168197631836, "global_step": 224253, "epoch": 1853} {"train_loss": -41.98826599121094, "global_step": 224254, "epoch": 1853} {"train_loss": -40.10081100463867, "global_step": 224255, "epoch": 1853} {"train_loss": -40.80110549926758, "global_step": 224256, "epoch": 1853} {"train_loss": -39.631038665771484, "global_step": 224257, "epoch": 1853} {"train_loss": -40.536617279052734, "global_step": 224258, "epoch": 1853} {"train_loss": -40.402198791503906, "global_step": 224259, "epoch": 1853} {"train_loss": -41.68516540527344, "global_step": 224260, "epoch": 1853} {"train_loss": -40.52988815307617, "global_step": 224261, "epoch": 1853} {"train_loss": -34.61930465698242, "global_step": 224262, "epoch": 1853} {"train_loss": -40.21167755126953, "global_step": 224263, "epoch": 1853} {"train_loss": -41.51906204223633, "global_step": 224264, "epoch": 1853} {"train_loss": -42.186763763427734, "global_step": 224265, "epoch": 1853} {"train_loss": -40.936519622802734, "global_step": 224266, "epoch": 1853} {"train_loss": -41.38798904418945, "global_step": 224267, "epoch": 1853} {"train_loss": -40.91938018798828, "global_step": 224268, "epoch": 1853} {"train_loss": -40.46648406982422, "global_step": 224269, "epoch": 1853} {"train_loss": -41.57587814331055, "global_step": 224270, "epoch": 1853} {"train_loss": -40.589481353759766, "global_step": 224271, "epoch": 1853} {"train_loss": -40.21321105957031, "global_step": 224272, "epoch": 1853} {"train_loss": -41.76266098022461, "global_step": 224273, "epoch": 1853} {"train_loss": -40.65966796875, "global_step": 224274, "epoch": 1853} {"train_loss": -42.3486328125, "global_step": 224275, "epoch": 1853} {"train_loss": -41.0079460144043, "global_step": 224276, "epoch": 1853} {"train_loss": -41.18958282470703, "global_step": 224277, "epoch": 1853} {"train_loss": -41.32918930053711, "global_step": 224278, "epoch": 1853} {"train_loss": -36.86541748046875, "global_step": 224279, "epoch": 1853} {"train_loss": -41.224056243896484, "global_step": 224280, "epoch": 1853} {"train_loss": -41.416358947753906, "global_step": 224281, "epoch": 1853} {"train_loss": -41.084720611572266, "global_step": 224282, "epoch": 1853} {"train_loss": -39.934627532958984, "global_step": 224283, "epoch": 1853} {"train_loss": -41.7775993347168, "global_step": 224284, "epoch": 1853} {"train_loss": -38.86484909057617, "global_step": 224285, "epoch": 1853} {"train_loss": -37.91907501220703, "global_step": 224286, "epoch": 1853} {"train_loss": -40.426212310791016, "global_step": 224287, "epoch": 1853} {"train_loss": -35.84060287475586, "global_step": 224288, "epoch": 1853} {"train_loss": -39.92307662963867, "global_step": 224289, "epoch": 1853} {"train_loss": -33.057552337646484, "global_step": 224290, "epoch": 1853} {"train_loss": -35.48073196411133, "global_step": 224291, "epoch": 1853} {"train_loss": -37.4029426574707, "global_step": 224292, "epoch": 1853} {"train_loss": -37.58026123046875, "global_step": 224293, "epoch": 1853} {"train_loss": -31.67988395690918, "global_step": 224294, "epoch": 1853} {"train_loss": -36.03993606567383, "global_step": 224295, "epoch": 1853} {"train_loss": -36.34547805786133, "global_step": 224296, "epoch": 1853} {"train_loss": -39.349552154541016, "global_step": 224297, "epoch": 1853} {"train_loss": -39.46012496948242, "global_step": 224298, "epoch": 1853} {"train_loss": -37.016273498535156, "global_step": 224299, "epoch": 1853} {"train_loss": -38.4520263671875, "global_step": 224300, "epoch": 1853} {"train_loss": -39.3284797668457, "global_step": 224301, "epoch": 1853} {"train_loss": -37.72461700439453, "global_step": 224302, "epoch": 1853} {"train_loss": -33.332881927490234, "global_step": 224303, "epoch": 1853} {"train_loss": -35.995948791503906, "global_step": 224304, "epoch": 1853} {"train_loss": -38.10164260864258, "global_step": 224305, "epoch": 1853} {"train_loss": -37.628265380859375, "global_step": 224306, "epoch": 1853} {"train_loss": -38.842525482177734, "global_step": 224307, "epoch": 1853} {"train_loss": -41.03761672973633, "global_step": 224308, "epoch": 1853} {"train_loss": -37.43330001831055, "global_step": 224309, "epoch": 1853} {"train_loss": -40.18699264526367, "global_step": 224310, "epoch": 1853} {"train_loss": -35.2652702331543, "global_step": 224311, "epoch": 1853} {"train_loss": -40.0516471862793, "global_step": 224312, "epoch": 1853} {"train_loss": -38.718849182128906, "global_step": 224313, "epoch": 1853} {"train_loss": -37.390586853027344, "global_step": 224314, "epoch": 1853} {"train_loss": -40.20648193359375, "global_step": 224315, "epoch": 1853} {"train_loss": -38.346492767333984, "global_step": 224316, "epoch": 1853} {"train_loss": -39.46220779418945, "global_step": 224317, "epoch": 1853} {"train_loss": -37.38502883911133, "global_step": 224318, "epoch": 1853} {"train_loss": -40.011348724365234, "global_step": 224319, "epoch": 1853} {"train_loss": -37.18706512451172, "global_step": 224320, "epoch": 1853} {"train_loss": -38.854061126708984, "global_step": 224321, "epoch": 1853} {"train_loss": -39.541080474853516, "global_step": 224322, "epoch": 1853} {"train_loss": -37.925045013427734, "global_step": 224323, "epoch": 1853} {"train_loss": -40.17953109741211, "global_step": 224324, "epoch": 1853} {"train_loss": -38.292274475097656, "global_step": 224325, "epoch": 1853} {"train_loss": -40.051570892333984, "global_step": 224326, "epoch": 1853} {"train_loss": -34.9338264465332, "global_step": 224327, "epoch": 1853} {"train_loss": -38.6242561340332, "global_step": 224328, "epoch": 1853} {"train_loss": -39.97273254394531, "global_step": 224329, "epoch": 1853} {"train_loss": -39.92012405395508, "global_step": 224330, "epoch": 1853} {"train_loss": -37.709468841552734, "global_step": 224331, "epoch": 1853} {"train_loss": -40.46516799926758, "global_step": 224332, "epoch": 1853} {"train_loss": -40.02981127589202, "global_step": 224333, "epoch": 1853, "val_loss": 2578112.25} {"train_loss": -40.688453674316406, "global_step": 224334, "epoch": 1854} {"train_loss": -39.26907730102539, "global_step": 224335, "epoch": 1854} {"train_loss": -39.4538459777832, "global_step": 224336, "epoch": 1854} {"train_loss": -40.670654296875, "global_step": 224337, "epoch": 1854} {"train_loss": -39.02036666870117, "global_step": 224338, "epoch": 1854} {"train_loss": -40.327518463134766, "global_step": 224339, "epoch": 1854} {"train_loss": -40.32554244995117, "global_step": 224340, "epoch": 1854} {"train_loss": -40.21173095703125, "global_step": 224341, "epoch": 1854} {"train_loss": -40.6953125, "global_step": 224342, "epoch": 1854} {"train_loss": -40.66947555541992, "global_step": 224343, "epoch": 1854} {"train_loss": -40.1178092956543, "global_step": 224344, "epoch": 1854} {"train_loss": -40.75260925292969, "global_step": 224345, "epoch": 1854} {"train_loss": -40.235572814941406, "global_step": 224346, "epoch": 1854} {"train_loss": -40.85213088989258, "global_step": 224347, "epoch": 1854} {"train_loss": -39.67594909667969, "global_step": 224348, "epoch": 1854} {"train_loss": -40.76771926879883, "global_step": 224349, "epoch": 1854} {"train_loss": -38.88127136230469, "global_step": 224350, "epoch": 1854} {"train_loss": -39.4768180847168, "global_step": 224351, "epoch": 1854} {"train_loss": -40.16132354736328, "global_step": 224352, "epoch": 1854} {"train_loss": -41.279388427734375, "global_step": 224353, "epoch": 1854} {"train_loss": -41.25065612792969, "global_step": 224354, "epoch": 1854} {"train_loss": -41.36722946166992, "global_step": 224355, "epoch": 1854} {"train_loss": -41.4803352355957, "global_step": 224356, "epoch": 1854} {"train_loss": -40.87263107299805, "global_step": 224357, "epoch": 1854} {"train_loss": -40.45065689086914, "global_step": 224358, "epoch": 1854} {"train_loss": -41.2016716003418, "global_step": 224359, "epoch": 1854} {"train_loss": -41.37446212768555, "global_step": 224360, "epoch": 1854} {"train_loss": -41.44185256958008, "global_step": 224361, "epoch": 1854} {"train_loss": -39.5641975402832, "global_step": 224362, "epoch": 1854} {"train_loss": -40.61273193359375, "global_step": 224363, "epoch": 1854} {"train_loss": -40.913021087646484, "global_step": 224364, "epoch": 1854} {"train_loss": -41.48356246948242, "global_step": 224365, "epoch": 1854} {"train_loss": -41.8818473815918, "global_step": 224366, "epoch": 1854} {"train_loss": -41.431339263916016, "global_step": 224367, "epoch": 1854} {"train_loss": -41.932247161865234, "global_step": 224368, "epoch": 1854} {"train_loss": -41.25783920288086, "global_step": 224369, "epoch": 1854} {"train_loss": -41.61613845825195, "global_step": 224370, "epoch": 1854} {"train_loss": -41.47085189819336, "global_step": 224371, "epoch": 1854} {"train_loss": -41.81620407104492, "global_step": 224372, "epoch": 1854} {"train_loss": -40.36928176879883, "global_step": 224373, "epoch": 1854} {"train_loss": -41.53498458862305, "global_step": 224374, "epoch": 1854} {"train_loss": -42.11150360107422, "global_step": 224375, "epoch": 1854} {"train_loss": -41.4735221862793, "global_step": 224376, "epoch": 1854} {"train_loss": -41.34882736206055, "global_step": 224377, "epoch": 1854} {"train_loss": -42.14260482788086, "global_step": 224378, "epoch": 1854} {"train_loss": -41.960296630859375, "global_step": 224379, "epoch": 1854} {"train_loss": -41.841758728027344, "global_step": 224380, "epoch": 1854} {"train_loss": -42.035560607910156, "global_step": 224381, "epoch": 1854} {"train_loss": -41.81620407104492, "global_step": 224382, "epoch": 1854} {"train_loss": -42.046356201171875, "global_step": 224383, "epoch": 1854} {"train_loss": -41.84346008300781, "global_step": 224384, "epoch": 1854} {"train_loss": -40.39192199707031, "global_step": 224385, "epoch": 1854} {"train_loss": -39.139503479003906, "global_step": 224386, "epoch": 1854} {"train_loss": -41.954750061035156, "global_step": 224387, "epoch": 1854} {"train_loss": -41.854393005371094, "global_step": 224388, "epoch": 1854} {"train_loss": -41.40284729003906, "global_step": 224389, "epoch": 1854} {"train_loss": -42.287437438964844, "global_step": 224390, "epoch": 1854} {"train_loss": -41.734107971191406, "global_step": 224391, "epoch": 1854} {"train_loss": -42.24363327026367, "global_step": 224392, "epoch": 1854} {"train_loss": -42.02231216430664, "global_step": 224393, "epoch": 1854} {"train_loss": -42.04697799682617, "global_step": 224394, "epoch": 1854} {"train_loss": -41.80356979370117, "global_step": 224395, "epoch": 1854} {"train_loss": -41.41391372680664, "global_step": 224396, "epoch": 1854} {"train_loss": -42.04526901245117, "global_step": 224397, "epoch": 1854} {"train_loss": -41.91435623168945, "global_step": 224398, "epoch": 1854} {"train_loss": -41.02724838256836, "global_step": 224399, "epoch": 1854} {"train_loss": -42.327796936035156, "global_step": 224400, "epoch": 1854} {"train_loss": -41.57758712768555, "global_step": 224401, "epoch": 1854} {"train_loss": -42.02790069580078, "global_step": 224402, "epoch": 1854} {"train_loss": -42.14507293701172, "global_step": 224403, "epoch": 1854} {"train_loss": -41.604366302490234, "global_step": 224404, "epoch": 1854} {"train_loss": -41.47608947753906, "global_step": 224405, "epoch": 1854} {"train_loss": -40.999847412109375, "global_step": 224406, "epoch": 1854} {"train_loss": -40.57393264770508, "global_step": 224407, "epoch": 1854} {"train_loss": -41.77180099487305, "global_step": 224408, "epoch": 1854} {"train_loss": -42.3101692199707, "global_step": 224409, "epoch": 1854} {"train_loss": -41.065528869628906, "global_step": 224410, "epoch": 1854} {"train_loss": -40.432701110839844, "global_step": 224411, "epoch": 1854} {"train_loss": -41.646339416503906, "global_step": 224412, "epoch": 1854} {"train_loss": -41.02853012084961, "global_step": 224413, "epoch": 1854} {"train_loss": -41.83840560913086, "global_step": 224414, "epoch": 1854} {"train_loss": -41.63895034790039, "global_step": 224415, "epoch": 1854} {"train_loss": -40.670997619628906, "global_step": 224416, "epoch": 1854} {"train_loss": -41.69165802001953, "global_step": 224417, "epoch": 1854} {"train_loss": -42.084991455078125, "global_step": 224418, "epoch": 1854} {"train_loss": -41.5460319519043, "global_step": 224419, "epoch": 1854} {"train_loss": -42.46480941772461, "global_step": 224420, "epoch": 1854} {"train_loss": -42.23647689819336, "global_step": 224421, "epoch": 1854} {"train_loss": -42.076534271240234, "global_step": 224422, "epoch": 1854} {"train_loss": -42.16643142700195, "global_step": 224423, "epoch": 1854} {"train_loss": -41.58045959472656, "global_step": 224424, "epoch": 1854} {"train_loss": -42.046974182128906, "global_step": 224425, "epoch": 1854} {"train_loss": -42.47831344604492, "global_step": 224426, "epoch": 1854} {"train_loss": -42.20634078979492, "global_step": 224427, "epoch": 1854} {"train_loss": -41.857688903808594, "global_step": 224428, "epoch": 1854} {"train_loss": -42.413970947265625, "global_step": 224429, "epoch": 1854} {"train_loss": -41.09883499145508, "global_step": 224430, "epoch": 1854} {"train_loss": -40.26363754272461, "global_step": 224431, "epoch": 1854} {"train_loss": -38.47243118286133, "global_step": 224432, "epoch": 1854} {"train_loss": -35.36503982543945, "global_step": 224433, "epoch": 1854} {"train_loss": -34.247100830078125, "global_step": 224434, "epoch": 1854} {"train_loss": -38.952301025390625, "global_step": 224435, "epoch": 1854} {"train_loss": -41.25825881958008, "global_step": 224436, "epoch": 1854} {"train_loss": -39.920711517333984, "global_step": 224437, "epoch": 1854} {"train_loss": -39.13578414916992, "global_step": 224438, "epoch": 1854} {"train_loss": -40.230201721191406, "global_step": 224439, "epoch": 1854} {"train_loss": -40.79670715332031, "global_step": 224440, "epoch": 1854} {"train_loss": -40.904476165771484, "global_step": 224441, "epoch": 1854} {"train_loss": -39.3650016784668, "global_step": 224442, "epoch": 1854} {"train_loss": -40.58950424194336, "global_step": 224443, "epoch": 1854} {"train_loss": -39.47540283203125, "global_step": 224444, "epoch": 1854} {"train_loss": -40.61716842651367, "global_step": 224445, "epoch": 1854} {"train_loss": -40.7860107421875, "global_step": 224446, "epoch": 1854} {"train_loss": -41.78664779663086, "global_step": 224447, "epoch": 1854} {"train_loss": -40.90324783325195, "global_step": 224448, "epoch": 1854} {"train_loss": -41.52030563354492, "global_step": 224449, "epoch": 1854} {"train_loss": -41.335411071777344, "global_step": 224450, "epoch": 1854} {"train_loss": -40.01374435424805, "global_step": 224451, "epoch": 1854} {"train_loss": -40.781124114990234, "global_step": 224452, "epoch": 1854} {"train_loss": -40.811744689941406, "global_step": 224453, "epoch": 1854} {"train_loss": -41.010365005367056, "global_step": 224454, "epoch": 1854, "val_loss": 2627568.75} {"train_loss": -41.20181655883789, "global_step": 224455, "epoch": 1855} {"train_loss": -40.78179931640625, "global_step": 224456, "epoch": 1855} {"train_loss": -40.01789093017578, "global_step": 224457, "epoch": 1855} {"train_loss": -41.05002975463867, "global_step": 224458, "epoch": 1855} {"train_loss": -40.8967170715332, "global_step": 224459, "epoch": 1855} {"train_loss": -41.38906478881836, "global_step": 224460, "epoch": 1855} {"train_loss": -41.82503890991211, "global_step": 224461, "epoch": 1855} {"train_loss": -41.57796859741211, "global_step": 224462, "epoch": 1855} {"train_loss": -41.81306076049805, "global_step": 224463, "epoch": 1855} {"train_loss": -41.08340072631836, "global_step": 224464, "epoch": 1855} {"train_loss": -41.6661491394043, "global_step": 224465, "epoch": 1855} {"train_loss": -42.00010681152344, "global_step": 224466, "epoch": 1855} {"train_loss": -41.9760856628418, "global_step": 224467, "epoch": 1855} {"train_loss": -41.62049102783203, "global_step": 224468, "epoch": 1855} {"train_loss": -41.257904052734375, "global_step": 224469, "epoch": 1855} {"train_loss": -41.728759765625, "global_step": 224470, "epoch": 1855} {"train_loss": -41.77162551879883, "global_step": 224471, "epoch": 1855} {"train_loss": -41.932979583740234, "global_step": 224472, "epoch": 1855} {"train_loss": -41.188961029052734, "global_step": 224473, "epoch": 1855} {"train_loss": -41.61841583251953, "global_step": 224474, "epoch": 1855} {"train_loss": -41.87439727783203, "global_step": 224475, "epoch": 1855} {"train_loss": -41.63557434082031, "global_step": 224476, "epoch": 1855} {"train_loss": -41.42743682861328, "global_step": 224477, "epoch": 1855} {"train_loss": -42.10802459716797, "global_step": 224478, "epoch": 1855} {"train_loss": -41.34247589111328, "global_step": 224479, "epoch": 1855} {"train_loss": -42.37623977661133, "global_step": 224480, "epoch": 1855} {"train_loss": -42.06722640991211, "global_step": 224481, "epoch": 1855} {"train_loss": -41.68928909301758, "global_step": 224482, "epoch": 1855} {"train_loss": -40.87895202636719, "global_step": 224483, "epoch": 1855} {"train_loss": -42.150882720947266, "global_step": 224484, "epoch": 1855} {"train_loss": -42.18478012084961, "global_step": 224485, "epoch": 1855} {"train_loss": -42.69231414794922, "global_step": 224486, "epoch": 1855} {"train_loss": -42.6124267578125, "global_step": 224487, "epoch": 1855} {"train_loss": -41.66432571411133, "global_step": 224488, "epoch": 1855} {"train_loss": -42.37638473510742, "global_step": 224489, "epoch": 1855} {"train_loss": -42.25765609741211, "global_step": 224490, "epoch": 1855} {"train_loss": -41.54023361206055, "global_step": 224491, "epoch": 1855} {"train_loss": -42.11652374267578, "global_step": 224492, "epoch": 1855} {"train_loss": -42.47321701049805, "global_step": 224493, "epoch": 1855} {"train_loss": -41.926509857177734, "global_step": 224494, "epoch": 1855} {"train_loss": -41.913795471191406, "global_step": 224495, "epoch": 1855} {"train_loss": -41.705535888671875, "global_step": 224496, "epoch": 1855} {"train_loss": -42.04777145385742, "global_step": 224497, "epoch": 1855} {"train_loss": -42.288246154785156, "global_step": 224498, "epoch": 1855} {"train_loss": -42.026039123535156, "global_step": 224499, "epoch": 1855} {"train_loss": -42.49360275268555, "global_step": 224500, "epoch": 1855} {"train_loss": -42.04998779296875, "global_step": 224501, "epoch": 1855} {"train_loss": -42.432464599609375, "global_step": 224502, "epoch": 1855} {"train_loss": -42.337371826171875, "global_step": 224503, "epoch": 1855} {"train_loss": -42.50437545776367, "global_step": 224504, "epoch": 1855} {"train_loss": -42.31483840942383, "global_step": 224505, "epoch": 1855} {"train_loss": -41.86184310913086, "global_step": 224506, "epoch": 1855} {"train_loss": -41.61603927612305, "global_step": 224507, "epoch": 1855} {"train_loss": -42.668678283691406, "global_step": 224508, "epoch": 1855} {"train_loss": -42.1252326965332, "global_step": 224509, "epoch": 1855} {"train_loss": -43.052467346191406, "global_step": 224510, "epoch": 1855} {"train_loss": -42.828060150146484, "global_step": 224511, "epoch": 1855} {"train_loss": -41.8372917175293, "global_step": 224512, "epoch": 1855} {"train_loss": -42.92681884765625, "global_step": 224513, "epoch": 1855} {"train_loss": -42.813262939453125, "global_step": 224514, "epoch": 1855} {"train_loss": -42.25852584838867, "global_step": 224515, "epoch": 1855} {"train_loss": -42.60504913330078, "global_step": 224516, "epoch": 1855} {"train_loss": -41.793514251708984, "global_step": 224517, "epoch": 1855} {"train_loss": -41.52769088745117, "global_step": 224518, "epoch": 1855} {"train_loss": -41.28242111206055, "global_step": 224519, "epoch": 1855} {"train_loss": -41.69989776611328, "global_step": 224520, "epoch": 1855} {"train_loss": -42.464141845703125, "global_step": 224521, "epoch": 1855} {"train_loss": -42.779354095458984, "global_step": 224522, "epoch": 1855} {"train_loss": -43.03804397583008, "global_step": 224523, "epoch": 1855} {"train_loss": -42.85512161254883, "global_step": 224524, "epoch": 1855} {"train_loss": -42.806880950927734, "global_step": 224525, "epoch": 1855} {"train_loss": -42.97553634643555, "global_step": 224526, "epoch": 1855} {"train_loss": -42.891902923583984, "global_step": 224527, "epoch": 1855} {"train_loss": -42.481624603271484, "global_step": 224528, "epoch": 1855} {"train_loss": -42.12263107299805, "global_step": 224529, "epoch": 1855} {"train_loss": -41.86981201171875, "global_step": 224530, "epoch": 1855} {"train_loss": -40.0184440612793, "global_step": 224531, "epoch": 1855} {"train_loss": -36.41410446166992, "global_step": 224532, "epoch": 1855} {"train_loss": -30.78150749206543, "global_step": 224533, "epoch": 1855} {"train_loss": -33.14324951171875, "global_step": 224534, "epoch": 1855} {"train_loss": -40.2147216796875, "global_step": 224535, "epoch": 1855} {"train_loss": -37.88434600830078, "global_step": 224536, "epoch": 1855} {"train_loss": -35.15595245361328, "global_step": 224537, "epoch": 1855} {"train_loss": -40.37660217285156, "global_step": 224538, "epoch": 1855} {"train_loss": -39.579830169677734, "global_step": 224539, "epoch": 1855} {"train_loss": -39.54108428955078, "global_step": 224540, "epoch": 1855} {"train_loss": -40.50460433959961, "global_step": 224541, "epoch": 1855} {"train_loss": -39.36238098144531, "global_step": 224542, "epoch": 1855} {"train_loss": -40.85243606567383, "global_step": 224543, "epoch": 1855} {"train_loss": -38.47708511352539, "global_step": 224544, "epoch": 1855} {"train_loss": -41.547462463378906, "global_step": 224545, "epoch": 1855} {"train_loss": -39.59315872192383, "global_step": 224546, "epoch": 1855} {"train_loss": -41.54505157470703, "global_step": 224547, "epoch": 1855} {"train_loss": -39.2302131652832, "global_step": 224548, "epoch": 1855} {"train_loss": -41.6353759765625, "global_step": 224549, "epoch": 1855} {"train_loss": -40.9709587097168, "global_step": 224550, "epoch": 1855} {"train_loss": -42.15147018432617, "global_step": 224551, "epoch": 1855} {"train_loss": -41.25004196166992, "global_step": 224552, "epoch": 1855} {"train_loss": -41.7071418762207, "global_step": 224553, "epoch": 1855} {"train_loss": -41.41584777832031, "global_step": 224554, "epoch": 1855} {"train_loss": -40.851314544677734, "global_step": 224555, "epoch": 1855} {"train_loss": -42.31861114501953, "global_step": 224556, "epoch": 1855} {"train_loss": -40.96051025390625, "global_step": 224557, "epoch": 1855} {"train_loss": -40.80874252319336, "global_step": 224558, "epoch": 1855} {"train_loss": -41.54329299926758, "global_step": 224559, "epoch": 1855} {"train_loss": -41.111934661865234, "global_step": 224560, "epoch": 1855} {"train_loss": -40.6854362487793, "global_step": 224561, "epoch": 1855} {"train_loss": -41.6893196105957, "global_step": 224562, "epoch": 1855} {"train_loss": -40.398414611816406, "global_step": 224563, "epoch": 1855} {"train_loss": -41.14931869506836, "global_step": 224564, "epoch": 1855} {"train_loss": -41.154212951660156, "global_step": 224565, "epoch": 1855} {"train_loss": -40.25297927856445, "global_step": 224566, "epoch": 1855} {"train_loss": -41.96046829223633, "global_step": 224567, "epoch": 1855} {"train_loss": -40.83152770996094, "global_step": 224568, "epoch": 1855} {"train_loss": -42.448246002197266, "global_step": 224569, "epoch": 1855} {"train_loss": -41.54473876953125, "global_step": 224570, "epoch": 1855} {"train_loss": -41.747161865234375, "global_step": 224571, "epoch": 1855} {"train_loss": -42.12371826171875, "global_step": 224572, "epoch": 1855} {"train_loss": -41.910423278808594, "global_step": 224573, "epoch": 1855} {"train_loss": -41.43986129760742, "global_step": 224574, "epoch": 1855} {"train_loss": -41.349648767266395, "global_step": 224575, "epoch": 1855, "val_loss": 2824484.75} {"train_loss": -40.961029052734375, "global_step": 224576, "epoch": 1856} {"train_loss": -41.59971618652344, "global_step": 224577, "epoch": 1856} {"train_loss": -41.345035552978516, "global_step": 224578, "epoch": 1856} {"train_loss": -40.751522064208984, "global_step": 224579, "epoch": 1856} {"train_loss": -42.0491943359375, "global_step": 224580, "epoch": 1856} {"train_loss": -41.50850296020508, "global_step": 224581, "epoch": 1856} {"train_loss": -40.42924118041992, "global_step": 224582, "epoch": 1856} {"train_loss": -41.905757904052734, "global_step": 224583, "epoch": 1856} {"train_loss": -41.898345947265625, "global_step": 224584, "epoch": 1856} {"train_loss": -41.38636779785156, "global_step": 224585, "epoch": 1856} {"train_loss": -41.75059127807617, "global_step": 224586, "epoch": 1856} {"train_loss": -41.526302337646484, "global_step": 224587, "epoch": 1856} {"train_loss": -41.41079330444336, "global_step": 224588, "epoch": 1856} {"train_loss": -41.64649200439453, "global_step": 224589, "epoch": 1856} {"train_loss": -41.38283920288086, "global_step": 224590, "epoch": 1856} {"train_loss": -42.01189041137695, "global_step": 224591, "epoch": 1856} {"train_loss": -41.26060104370117, "global_step": 224592, "epoch": 1856} {"train_loss": -41.90537643432617, "global_step": 224593, "epoch": 1856} {"train_loss": -41.84751892089844, "global_step": 224594, "epoch": 1856} {"train_loss": -41.539031982421875, "global_step": 224595, "epoch": 1856} {"train_loss": -42.185340881347656, "global_step": 224596, "epoch": 1856} {"train_loss": -41.84231185913086, "global_step": 224597, "epoch": 1856} {"train_loss": -41.8813591003418, "global_step": 224598, "epoch": 1856} {"train_loss": -41.82741165161133, "global_step": 224599, "epoch": 1856} {"train_loss": -42.15442657470703, "global_step": 224600, "epoch": 1856} {"train_loss": -42.031333923339844, "global_step": 224601, "epoch": 1856} {"train_loss": -41.761756896972656, "global_step": 224602, "epoch": 1856} {"train_loss": -42.21855163574219, "global_step": 224603, "epoch": 1856} {"train_loss": -42.028076171875, "global_step": 224604, "epoch": 1856} {"train_loss": -42.257484436035156, "global_step": 224605, "epoch": 1856} {"train_loss": -41.5661506652832, "global_step": 224606, "epoch": 1856} {"train_loss": -42.06888961791992, "global_step": 224607, "epoch": 1856} {"train_loss": -42.53510284423828, "global_step": 224608, "epoch": 1856} {"train_loss": -42.36305236816406, "global_step": 224609, "epoch": 1856} {"train_loss": -41.92301559448242, "global_step": 224610, "epoch": 1856} {"train_loss": -42.55998611450195, "global_step": 224611, "epoch": 1856} {"train_loss": -42.921390533447266, "global_step": 224612, "epoch": 1856} {"train_loss": -42.2368278503418, "global_step": 224613, "epoch": 1856} {"train_loss": -42.15700149536133, "global_step": 224614, "epoch": 1856} {"train_loss": -42.34989929199219, "global_step": 224615, "epoch": 1856} {"train_loss": -42.03510665893555, "global_step": 224616, "epoch": 1856} {"train_loss": -42.685298919677734, "global_step": 224617, "epoch": 1856} {"train_loss": -41.4378776550293, "global_step": 224618, "epoch": 1856} {"train_loss": -41.84916305541992, "global_step": 224619, "epoch": 1856} {"train_loss": -41.738922119140625, "global_step": 224620, "epoch": 1856} {"train_loss": -42.40667724609375, "global_step": 224621, "epoch": 1856} {"train_loss": -42.5930061340332, "global_step": 224622, "epoch": 1856} {"train_loss": -41.045101165771484, "global_step": 224623, "epoch": 1856} {"train_loss": -41.514156341552734, "global_step": 224624, "epoch": 1856} {"train_loss": -41.45420455932617, "global_step": 224625, "epoch": 1856} {"train_loss": -40.54846954345703, "global_step": 224626, "epoch": 1856} {"train_loss": -42.175113677978516, "global_step": 224627, "epoch": 1856} {"train_loss": -34.947818756103516, "global_step": 224628, "epoch": 1856} {"train_loss": -39.42008590698242, "global_step": 224629, "epoch": 1856} {"train_loss": -39.57255172729492, "global_step": 224630, "epoch": 1856} {"train_loss": -42.3186149597168, "global_step": 224631, "epoch": 1856} {"train_loss": -41.0452766418457, "global_step": 224632, "epoch": 1856} {"train_loss": -39.58625030517578, "global_step": 224633, "epoch": 1856} {"train_loss": -37.79098892211914, "global_step": 224634, "epoch": 1856} {"train_loss": -40.23531723022461, "global_step": 224635, "epoch": 1856} {"train_loss": -39.38054275512695, "global_step": 224636, "epoch": 1856} {"train_loss": -37.01411437988281, "global_step": 224637, "epoch": 1856} {"train_loss": -35.79106903076172, "global_step": 224638, "epoch": 1856} {"train_loss": -40.533477783203125, "global_step": 224639, "epoch": 1856} {"train_loss": -38.11750793457031, "global_step": 224640, "epoch": 1856} {"train_loss": -35.338104248046875, "global_step": 224641, "epoch": 1856} {"train_loss": -39.6427116394043, "global_step": 224642, "epoch": 1856} {"train_loss": -39.979923248291016, "global_step": 224643, "epoch": 1856} {"train_loss": -36.325374603271484, "global_step": 224644, "epoch": 1856} {"train_loss": -38.63298797607422, "global_step": 224645, "epoch": 1856} {"train_loss": -40.45901107788086, "global_step": 224646, "epoch": 1856} {"train_loss": -38.352813720703125, "global_step": 224647, "epoch": 1856} {"train_loss": -40.84537887573242, "global_step": 224648, "epoch": 1856} {"train_loss": -39.63405227661133, "global_step": 224649, "epoch": 1856} {"train_loss": -35.587432861328125, "global_step": 224650, "epoch": 1856} {"train_loss": -38.00542449951172, "global_step": 224651, "epoch": 1856} {"train_loss": -39.86911392211914, "global_step": 224652, "epoch": 1856} {"train_loss": -40.648799896240234, "global_step": 224653, "epoch": 1856} {"train_loss": -38.013858795166016, "global_step": 224654, "epoch": 1856} {"train_loss": -40.606781005859375, "global_step": 224655, "epoch": 1856} {"train_loss": -39.66339874267578, "global_step": 224656, "epoch": 1856} {"train_loss": -39.73863220214844, "global_step": 224657, "epoch": 1856} {"train_loss": -41.2723503112793, "global_step": 224658, "epoch": 1856} {"train_loss": -39.84782409667969, "global_step": 224659, "epoch": 1856} {"train_loss": -41.5174674987793, "global_step": 224660, "epoch": 1856} {"train_loss": -40.71107864379883, "global_step": 224661, "epoch": 1856} {"train_loss": -41.2324333190918, "global_step": 224662, "epoch": 1856} {"train_loss": -36.30281066894531, "global_step": 224663, "epoch": 1856} {"train_loss": -41.47133255004883, "global_step": 224664, "epoch": 1856} {"train_loss": -38.306922912597656, "global_step": 224665, "epoch": 1856} {"train_loss": -41.47422790527344, "global_step": 224666, "epoch": 1856} {"train_loss": -40.836204528808594, "global_step": 224667, "epoch": 1856} {"train_loss": -41.21796798706055, "global_step": 224668, "epoch": 1856} {"train_loss": -40.45303726196289, "global_step": 224669, "epoch": 1856} {"train_loss": -40.66317367553711, "global_step": 224670, "epoch": 1856} {"train_loss": -40.72822952270508, "global_step": 224671, "epoch": 1856} {"train_loss": -41.79146194458008, "global_step": 224672, "epoch": 1856} {"train_loss": -40.17240524291992, "global_step": 224673, "epoch": 1856} {"train_loss": -40.295867919921875, "global_step": 224674, "epoch": 1856} {"train_loss": -42.027923583984375, "global_step": 224675, "epoch": 1856} {"train_loss": -41.44550323486328, "global_step": 224676, "epoch": 1856} {"train_loss": -41.76298141479492, "global_step": 224677, "epoch": 1856} {"train_loss": -41.97231674194336, "global_step": 224678, "epoch": 1856} {"train_loss": -41.53971481323242, "global_step": 224679, "epoch": 1856} {"train_loss": -41.878395080566406, "global_step": 224680, "epoch": 1856} {"train_loss": -41.91679382324219, "global_step": 224681, "epoch": 1856} {"train_loss": -41.52941131591797, "global_step": 224682, "epoch": 1856} {"train_loss": -41.98588180541992, "global_step": 224683, "epoch": 1856} {"train_loss": -40.38174057006836, "global_step": 224684, "epoch": 1856} {"train_loss": -41.07447814941406, "global_step": 224685, "epoch": 1856} {"train_loss": -41.38473892211914, "global_step": 224686, "epoch": 1856} {"train_loss": -42.04026412963867, "global_step": 224687, "epoch": 1856} {"train_loss": -42.41134262084961, "global_step": 224688, "epoch": 1856} {"train_loss": -41.67210388183594, "global_step": 224689, "epoch": 1856} {"train_loss": -42.360694885253906, "global_step": 224690, "epoch": 1856} {"train_loss": -41.958831787109375, "global_step": 224691, "epoch": 1856} {"train_loss": -42.05411911010742, "global_step": 224692, "epoch": 1856} {"train_loss": -41.624267578125, "global_step": 224693, "epoch": 1856} {"train_loss": -41.860939025878906, "global_step": 224694, "epoch": 1856} {"train_loss": -42.673458099365234, "global_step": 224695, "epoch": 1856} {"train_loss": -40.8720026883212, "global_step": 224696, "epoch": 1856, "val_loss": 2744411.0} {"train_loss": -42.19777297973633, "global_step": 224697, "epoch": 1857} {"train_loss": -41.09889602661133, "global_step": 224698, "epoch": 1857} {"train_loss": -41.620582580566406, "global_step": 224699, "epoch": 1857} {"train_loss": -41.787288665771484, "global_step": 224700, "epoch": 1857} {"train_loss": -42.16168975830078, "global_step": 224701, "epoch": 1857} {"train_loss": -41.351844787597656, "global_step": 224702, "epoch": 1857} {"train_loss": -42.544063568115234, "global_step": 224703, "epoch": 1857} {"train_loss": -42.25350570678711, "global_step": 224704, "epoch": 1857} {"train_loss": -42.25153732299805, "global_step": 224705, "epoch": 1857} {"train_loss": -41.3754768371582, "global_step": 224706, "epoch": 1857} {"train_loss": -42.483665466308594, "global_step": 224707, "epoch": 1857} {"train_loss": -40.414424896240234, "global_step": 224708, "epoch": 1857} {"train_loss": -41.66521072387695, "global_step": 224709, "epoch": 1857} {"train_loss": -42.02676773071289, "global_step": 224710, "epoch": 1857} {"train_loss": -42.85992431640625, "global_step": 224711, "epoch": 1857} {"train_loss": -39.954654693603516, "global_step": 224712, "epoch": 1857} {"train_loss": -42.602108001708984, "global_step": 224713, "epoch": 1857} {"train_loss": -41.79879379272461, "global_step": 224714, "epoch": 1857} {"train_loss": -39.80758285522461, "global_step": 224715, "epoch": 1857} {"train_loss": -41.71208572387695, "global_step": 224716, "epoch": 1857} {"train_loss": -42.78721237182617, "global_step": 224717, "epoch": 1857} {"train_loss": -39.8487548828125, "global_step": 224718, "epoch": 1857} {"train_loss": -41.53779602050781, "global_step": 224719, "epoch": 1857} {"train_loss": -42.156044006347656, "global_step": 224720, "epoch": 1857} {"train_loss": -40.267433166503906, "global_step": 224721, "epoch": 1857} {"train_loss": -40.7867317199707, "global_step": 224722, "epoch": 1857} {"train_loss": -41.3286247253418, "global_step": 224723, "epoch": 1857} {"train_loss": -41.85702133178711, "global_step": 224724, "epoch": 1857} {"train_loss": -40.95991516113281, "global_step": 224725, "epoch": 1857} {"train_loss": -41.7335319519043, "global_step": 224726, "epoch": 1857} {"train_loss": -41.39254379272461, "global_step": 224727, "epoch": 1857} {"train_loss": -41.363582611083984, "global_step": 224728, "epoch": 1857} {"train_loss": -41.98173904418945, "global_step": 224729, "epoch": 1857} {"train_loss": -41.20659255981445, "global_step": 224730, "epoch": 1857} {"train_loss": -41.38455581665039, "global_step": 224731, "epoch": 1857} {"train_loss": -41.489707946777344, "global_step": 224732, "epoch": 1857} {"train_loss": -41.51480484008789, "global_step": 224733, "epoch": 1857} {"train_loss": -41.62662124633789, "global_step": 224734, "epoch": 1857} {"train_loss": -41.14297103881836, "global_step": 224735, "epoch": 1857} {"train_loss": -41.916255950927734, "global_step": 224736, "epoch": 1857} {"train_loss": -40.9886589050293, "global_step": 224737, "epoch": 1857} {"train_loss": -41.96915817260742, "global_step": 224738, "epoch": 1857} {"train_loss": -40.1674690246582, "global_step": 224739, "epoch": 1857} {"train_loss": -39.998687744140625, "global_step": 224740, "epoch": 1857} {"train_loss": -40.582740783691406, "global_step": 224741, "epoch": 1857} {"train_loss": -38.18748474121094, "global_step": 224742, "epoch": 1857} {"train_loss": -40.855010986328125, "global_step": 224743, "epoch": 1857} {"train_loss": -40.834693908691406, "global_step": 224744, "epoch": 1857} {"train_loss": -39.94502639770508, "global_step": 224745, "epoch": 1857} {"train_loss": -41.204612731933594, "global_step": 224746, "epoch": 1857} {"train_loss": -41.71025085449219, "global_step": 224747, "epoch": 1857} {"train_loss": -40.69050216674805, "global_step": 224748, "epoch": 1857} {"train_loss": -42.157936096191406, "global_step": 224749, "epoch": 1857} {"train_loss": -41.22504425048828, "global_step": 224750, "epoch": 1857} {"train_loss": -40.900691986083984, "global_step": 224751, "epoch": 1857} {"train_loss": -42.26881408691406, "global_step": 224752, "epoch": 1857} {"train_loss": -41.4307975769043, "global_step": 224753, "epoch": 1857} {"train_loss": -41.97214889526367, "global_step": 224754, "epoch": 1857} {"train_loss": -41.51104736328125, "global_step": 224755, "epoch": 1857} {"train_loss": -41.43171691894531, "global_step": 224756, "epoch": 1857} {"train_loss": -42.10210037231445, "global_step": 224757, "epoch": 1857} {"train_loss": -42.580108642578125, "global_step": 224758, "epoch": 1857} {"train_loss": -42.20478439331055, "global_step": 224759, "epoch": 1857} {"train_loss": -42.142086029052734, "global_step": 224760, "epoch": 1857} {"train_loss": -42.25039291381836, "global_step": 224761, "epoch": 1857} {"train_loss": -39.58182907104492, "global_step": 224762, "epoch": 1857} {"train_loss": -42.09632873535156, "global_step": 224763, "epoch": 1857} {"train_loss": -42.34477615356445, "global_step": 224764, "epoch": 1857} {"train_loss": -41.44508743286133, "global_step": 224765, "epoch": 1857} {"train_loss": -40.563758850097656, "global_step": 224766, "epoch": 1857} {"train_loss": -41.249237060546875, "global_step": 224767, "epoch": 1857} {"train_loss": -42.19395065307617, "global_step": 224768, "epoch": 1857} {"train_loss": -41.764339447021484, "global_step": 224769, "epoch": 1857} {"train_loss": -41.9568977355957, "global_step": 224770, "epoch": 1857} {"train_loss": -41.79808807373047, "global_step": 224771, "epoch": 1857} {"train_loss": -40.90653610229492, "global_step": 224772, "epoch": 1857} {"train_loss": -41.41168975830078, "global_step": 224773, "epoch": 1857} {"train_loss": -42.36494064331055, "global_step": 224774, "epoch": 1857} {"train_loss": -42.03770065307617, "global_step": 224775, "epoch": 1857} {"train_loss": -41.51249313354492, "global_step": 224776, "epoch": 1857} {"train_loss": -41.54049301147461, "global_step": 224777, "epoch": 1857} {"train_loss": -41.1157341003418, "global_step": 224778, "epoch": 1857} {"train_loss": -41.73838424682617, "global_step": 224779, "epoch": 1857} {"train_loss": -42.032535552978516, "global_step": 224780, "epoch": 1857} {"train_loss": -40.5281867980957, "global_step": 224781, "epoch": 1857} {"train_loss": -42.51999282836914, "global_step": 224782, "epoch": 1857} {"train_loss": -41.654266357421875, "global_step": 224783, "epoch": 1857} {"train_loss": -42.405086517333984, "global_step": 224784, "epoch": 1857} {"train_loss": -42.02004623413086, "global_step": 224785, "epoch": 1857} {"train_loss": -42.1455192565918, "global_step": 224786, "epoch": 1857} {"train_loss": -41.29795837402344, "global_step": 224787, "epoch": 1857} {"train_loss": -41.463802337646484, "global_step": 224788, "epoch": 1857} {"train_loss": -38.448646545410156, "global_step": 224789, "epoch": 1857} {"train_loss": -42.52764892578125, "global_step": 224790, "epoch": 1857} {"train_loss": -40.904781341552734, "global_step": 224791, "epoch": 1857} {"train_loss": -42.58146286010742, "global_step": 224792, "epoch": 1857} {"train_loss": -41.75079345703125, "global_step": 224793, "epoch": 1857} {"train_loss": -41.44430160522461, "global_step": 224794, "epoch": 1857} {"train_loss": -42.124454498291016, "global_step": 224795, "epoch": 1857} {"train_loss": -41.5086555480957, "global_step": 224796, "epoch": 1857} {"train_loss": -41.77292251586914, "global_step": 224797, "epoch": 1857} {"train_loss": -41.99763870239258, "global_step": 224798, "epoch": 1857} {"train_loss": -41.35095977783203, "global_step": 224799, "epoch": 1857} {"train_loss": -42.2890625, "global_step": 224800, "epoch": 1857} {"train_loss": -42.36511993408203, "global_step": 224801, "epoch": 1857} {"train_loss": -42.2219123840332, "global_step": 224802, "epoch": 1857} {"train_loss": -41.74180221557617, "global_step": 224803, "epoch": 1857} {"train_loss": -42.377113342285156, "global_step": 224804, "epoch": 1857} {"train_loss": -42.33956527709961, "global_step": 224805, "epoch": 1857} {"train_loss": -42.08577346801758, "global_step": 224806, "epoch": 1857} {"train_loss": -42.21200180053711, "global_step": 224807, "epoch": 1857} {"train_loss": -42.745513916015625, "global_step": 224808, "epoch": 1857} {"train_loss": -42.52938461303711, "global_step": 224809, "epoch": 1857} {"train_loss": -42.22508239746094, "global_step": 224810, "epoch": 1857} {"train_loss": -42.0712890625, "global_step": 224811, "epoch": 1857} {"train_loss": -42.534698486328125, "global_step": 224812, "epoch": 1857} {"train_loss": -41.69640350341797, "global_step": 224813, "epoch": 1857} {"train_loss": -42.22945785522461, "global_step": 224814, "epoch": 1857} {"train_loss": -41.978145599365234, "global_step": 224815, "epoch": 1857} {"train_loss": -42.2178840637207, "global_step": 224816, "epoch": 1857} {"train_loss": -41.605353773132826, "global_step": 224817, "epoch": 1857, "val_loss": 2626878.25} {"train_loss": -42.27910232543945, "global_step": 224818, "epoch": 1858} {"train_loss": -42.07767868041992, "global_step": 224819, "epoch": 1858} {"train_loss": -42.07052230834961, "global_step": 224820, "epoch": 1858} {"train_loss": -42.36213302612305, "global_step": 224821, "epoch": 1858} {"train_loss": -42.377899169921875, "global_step": 224822, "epoch": 1858} {"train_loss": -41.955013275146484, "global_step": 224823, "epoch": 1858} {"train_loss": -42.27924728393555, "global_step": 224824, "epoch": 1858} {"train_loss": -41.64692306518555, "global_step": 224825, "epoch": 1858} {"train_loss": -41.785709381103516, "global_step": 224826, "epoch": 1858} {"train_loss": -42.5888786315918, "global_step": 224827, "epoch": 1858} {"train_loss": -42.65146255493164, "global_step": 224828, "epoch": 1858} {"train_loss": -42.98103713989258, "global_step": 224829, "epoch": 1858} {"train_loss": -41.48335647583008, "global_step": 224830, "epoch": 1858} {"train_loss": -41.91264724731445, "global_step": 224831, "epoch": 1858} {"train_loss": -42.3437614440918, "global_step": 224832, "epoch": 1858} {"train_loss": -42.75776672363281, "global_step": 224833, "epoch": 1858} {"train_loss": -42.2546501159668, "global_step": 224834, "epoch": 1858} {"train_loss": -41.67596435546875, "global_step": 224835, "epoch": 1858} {"train_loss": -42.74762725830078, "global_step": 224836, "epoch": 1858} {"train_loss": -42.629180908203125, "global_step": 224837, "epoch": 1858} {"train_loss": -42.285518646240234, "global_step": 224838, "epoch": 1858} {"train_loss": -42.867584228515625, "global_step": 224839, "epoch": 1858} {"train_loss": -40.98897933959961, "global_step": 224840, "epoch": 1858} {"train_loss": -42.71086883544922, "global_step": 224841, "epoch": 1858} {"train_loss": -43.022743225097656, "global_step": 224842, "epoch": 1858} {"train_loss": -42.04585647583008, "global_step": 224843, "epoch": 1858} {"train_loss": -41.34226608276367, "global_step": 224844, "epoch": 1858} {"train_loss": -41.645118713378906, "global_step": 224845, "epoch": 1858} {"train_loss": -41.43747329711914, "global_step": 224846, "epoch": 1858} {"train_loss": -41.67180252075195, "global_step": 224847, "epoch": 1858} {"train_loss": -42.072608947753906, "global_step": 224848, "epoch": 1858} {"train_loss": -42.17384719848633, "global_step": 224849, "epoch": 1858} {"train_loss": -39.32184600830078, "global_step": 224850, "epoch": 1858} {"train_loss": -39.38740158081055, "global_step": 224851, "epoch": 1858} {"train_loss": -36.80768966674805, "global_step": 224852, "epoch": 1858} {"train_loss": -39.99241256713867, "global_step": 224853, "epoch": 1858} {"train_loss": -40.25941848754883, "global_step": 224854, "epoch": 1858} {"train_loss": -38.90989303588867, "global_step": 224855, "epoch": 1858} {"train_loss": -41.95368576049805, "global_step": 224856, "epoch": 1858} {"train_loss": -41.291542053222656, "global_step": 224857, "epoch": 1858} {"train_loss": -40.263607025146484, "global_step": 224858, "epoch": 1858} {"train_loss": -39.21786880493164, "global_step": 224859, "epoch": 1858} {"train_loss": -41.4449577331543, "global_step": 224860, "epoch": 1858} {"train_loss": -40.664424896240234, "global_step": 224861, "epoch": 1858} {"train_loss": -41.001338958740234, "global_step": 224862, "epoch": 1858} {"train_loss": -41.33350372314453, "global_step": 224863, "epoch": 1858} {"train_loss": -22.547256469726562, "global_step": 224864, "epoch": 1858} {"train_loss": -40.47787857055664, "global_step": 224865, "epoch": 1858} {"train_loss": -40.82550048828125, "global_step": 224866, "epoch": 1858} {"train_loss": -40.5194206237793, "global_step": 224867, "epoch": 1858} {"train_loss": -40.52376937866211, "global_step": 224868, "epoch": 1858} {"train_loss": -40.53237533569336, "global_step": 224869, "epoch": 1858} {"train_loss": -39.54500961303711, "global_step": 224870, "epoch": 1858} {"train_loss": -40.76032257080078, "global_step": 224871, "epoch": 1858} {"train_loss": -39.33098602294922, "global_step": 224872, "epoch": 1858} {"train_loss": -41.139984130859375, "global_step": 224873, "epoch": 1858} {"train_loss": -40.02622985839844, "global_step": 224874, "epoch": 1858} {"train_loss": -40.18263244628906, "global_step": 224875, "epoch": 1858} {"train_loss": -38.720882415771484, "global_step": 224876, "epoch": 1858} {"train_loss": -37.12200927734375, "global_step": 224877, "epoch": 1858} {"train_loss": -40.80329513549805, "global_step": 224878, "epoch": 1858} {"train_loss": -41.558162689208984, "global_step": 224879, "epoch": 1858} {"train_loss": -39.49662399291992, "global_step": 224880, "epoch": 1858} {"train_loss": -40.96749496459961, "global_step": 224881, "epoch": 1858} {"train_loss": -41.75166702270508, "global_step": 224882, "epoch": 1858} {"train_loss": -40.765384674072266, "global_step": 224883, "epoch": 1858} {"train_loss": -38.303794860839844, "global_step": 224884, "epoch": 1858} {"train_loss": -41.8576545715332, "global_step": 224885, "epoch": 1858} {"train_loss": -40.59429931640625, "global_step": 224886, "epoch": 1858} {"train_loss": -41.59981155395508, "global_step": 224887, "epoch": 1858} {"train_loss": -40.922847747802734, "global_step": 224888, "epoch": 1858} {"train_loss": -40.29522705078125, "global_step": 224889, "epoch": 1858} {"train_loss": -40.71260452270508, "global_step": 224890, "epoch": 1858} {"train_loss": -39.537994384765625, "global_step": 224891, "epoch": 1858} {"train_loss": -38.69383239746094, "global_step": 224892, "epoch": 1858} {"train_loss": -39.00657272338867, "global_step": 224893, "epoch": 1858} {"train_loss": -39.022151947021484, "global_step": 224894, "epoch": 1858} {"train_loss": -41.44314193725586, "global_step": 224895, "epoch": 1858} {"train_loss": -40.07941818237305, "global_step": 224896, "epoch": 1858} {"train_loss": -40.65497970581055, "global_step": 224897, "epoch": 1858} {"train_loss": -40.681705474853516, "global_step": 224898, "epoch": 1858} {"train_loss": -39.4069709777832, "global_step": 224899, "epoch": 1858} {"train_loss": -40.18302536010742, "global_step": 224900, "epoch": 1858} {"train_loss": -38.61161422729492, "global_step": 224901, "epoch": 1858} {"train_loss": -38.565147399902344, "global_step": 224902, "epoch": 1858} {"train_loss": -40.51249313354492, "global_step": 224903, "epoch": 1858} {"train_loss": -40.789100646972656, "global_step": 224904, "epoch": 1858} {"train_loss": -39.43461990356445, "global_step": 224905, "epoch": 1858} {"train_loss": -40.10039138793945, "global_step": 224906, "epoch": 1858} {"train_loss": -40.22586441040039, "global_step": 224907, "epoch": 1858} {"train_loss": -39.87336349487305, "global_step": 224908, "epoch": 1858} {"train_loss": -38.00672149658203, "global_step": 224909, "epoch": 1858} {"train_loss": -40.983642578125, "global_step": 224910, "epoch": 1858} {"train_loss": -40.791168212890625, "global_step": 224911, "epoch": 1858} {"train_loss": -38.20917510986328, "global_step": 224912, "epoch": 1858} {"train_loss": -40.65909957885742, "global_step": 224913, "epoch": 1858} {"train_loss": -40.9302978515625, "global_step": 224914, "epoch": 1858} {"train_loss": -40.6652717590332, "global_step": 224915, "epoch": 1858} {"train_loss": -41.24630355834961, "global_step": 224916, "epoch": 1858} {"train_loss": -40.33152389526367, "global_step": 224917, "epoch": 1858} {"train_loss": -41.62855529785156, "global_step": 224918, "epoch": 1858} {"train_loss": -41.65789794921875, "global_step": 224919, "epoch": 1858} {"train_loss": -41.12884521484375, "global_step": 224920, "epoch": 1858} {"train_loss": -41.83100509643555, "global_step": 224921, "epoch": 1858} {"train_loss": -37.84641647338867, "global_step": 224922, "epoch": 1858} {"train_loss": -41.57501983642578, "global_step": 224923, "epoch": 1858} {"train_loss": -41.832069396972656, "global_step": 224924, "epoch": 1858} {"train_loss": -41.304439544677734, "global_step": 224925, "epoch": 1858} {"train_loss": -41.79812240600586, "global_step": 224926, "epoch": 1858} {"train_loss": -41.305049896240234, "global_step": 224927, "epoch": 1858} {"train_loss": -38.53984451293945, "global_step": 224928, "epoch": 1858} {"train_loss": -40.14540481567383, "global_step": 224929, "epoch": 1858} {"train_loss": -41.521610260009766, "global_step": 224930, "epoch": 1858} {"train_loss": -41.42534255981445, "global_step": 224931, "epoch": 1858} {"train_loss": -41.563087463378906, "global_step": 224932, "epoch": 1858} {"train_loss": -41.332271575927734, "global_step": 224933, "epoch": 1858} {"train_loss": -40.285301208496094, "global_step": 224934, "epoch": 1858} {"train_loss": -40.73354721069336, "global_step": 224935, "epoch": 1858} {"train_loss": -41.43073654174805, "global_step": 224936, "epoch": 1858} {"train_loss": -36.529476165771484, "global_step": 224937, "epoch": 1858} {"train_loss": -40.64705594906137, "global_step": 224938, "epoch": 1858, "val_loss": 2749577.25} {"train_loss": -42.042110443115234, "global_step": 224939, "epoch": 1859} {"train_loss": -41.55670928955078, "global_step": 224940, "epoch": 1859} {"train_loss": -23.594690322875977, "global_step": 224941, "epoch": 1859} {"train_loss": -40.67192459106445, "global_step": 224942, "epoch": 1859} {"train_loss": -39.179168701171875, "global_step": 224943, "epoch": 1859} {"train_loss": -39.38619613647461, "global_step": 224944, "epoch": 1859} {"train_loss": -36.97743606567383, "global_step": 224945, "epoch": 1859} {"train_loss": -36.812435150146484, "global_step": 224946, "epoch": 1859} {"train_loss": -38.62456130981445, "global_step": 224947, "epoch": 1859} {"train_loss": -22.262880325317383, "global_step": 224948, "epoch": 1859} {"train_loss": -37.3725471496582, "global_step": 224949, "epoch": 1859} {"train_loss": -40.092308044433594, "global_step": 224950, "epoch": 1859} {"train_loss": -25.546255111694336, "global_step": 224951, "epoch": 1859} {"train_loss": -39.92608642578125, "global_step": 224952, "epoch": 1859} {"train_loss": -38.98751449584961, "global_step": 224953, "epoch": 1859} {"train_loss": -37.96613311767578, "global_step": 224954, "epoch": 1859} {"train_loss": -35.98025894165039, "global_step": 224955, "epoch": 1859} {"train_loss": -37.40083694458008, "global_step": 224956, "epoch": 1859} {"train_loss": -36.13883590698242, "global_step": 224957, "epoch": 1859} {"train_loss": -37.736671447753906, "global_step": 224958, "epoch": 1859} {"train_loss": -31.73797607421875, "global_step": 224959, "epoch": 1859} {"train_loss": -36.9259147644043, "global_step": 224960, "epoch": 1859} {"train_loss": -35.444793701171875, "global_step": 224961, "epoch": 1859} {"train_loss": -39.6146125793457, "global_step": 224962, "epoch": 1859} {"train_loss": -39.95680618286133, "global_step": 224963, "epoch": 1859} {"train_loss": -38.70857620239258, "global_step": 224964, "epoch": 1859} {"train_loss": -37.75686264038086, "global_step": 224965, "epoch": 1859} {"train_loss": -36.550994873046875, "global_step": 224966, "epoch": 1859} {"train_loss": -39.47391891479492, "global_step": 224967, "epoch": 1859} {"train_loss": -38.33879852294922, "global_step": 224968, "epoch": 1859} {"train_loss": -40.599082946777344, "global_step": 224969, "epoch": 1859} {"train_loss": -40.33823776245117, "global_step": 224970, "epoch": 1859} {"train_loss": -39.44767761230469, "global_step": 224971, "epoch": 1859} {"train_loss": -40.6264533996582, "global_step": 224972, "epoch": 1859} {"train_loss": -39.65058135986328, "global_step": 224973, "epoch": 1859} {"train_loss": -40.24332809448242, "global_step": 224974, "epoch": 1859} {"train_loss": -40.527931213378906, "global_step": 224975, "epoch": 1859} {"train_loss": -40.388816833496094, "global_step": 224976, "epoch": 1859} {"train_loss": -38.70475387573242, "global_step": 224977, "epoch": 1859} {"train_loss": -39.116363525390625, "global_step": 224978, "epoch": 1859} {"train_loss": -37.78868865966797, "global_step": 224979, "epoch": 1859} {"train_loss": -40.15930938720703, "global_step": 224980, "epoch": 1859} {"train_loss": -39.80436325073242, "global_step": 224981, "epoch": 1859} {"train_loss": -38.63186264038086, "global_step": 224982, "epoch": 1859} {"train_loss": -39.65964126586914, "global_step": 224983, "epoch": 1859} {"train_loss": -39.890254974365234, "global_step": 224984, "epoch": 1859} {"train_loss": -40.68656539916992, "global_step": 224985, "epoch": 1859} {"train_loss": -40.3233528137207, "global_step": 224986, "epoch": 1859} {"train_loss": -40.61759567260742, "global_step": 224987, "epoch": 1859} {"train_loss": -40.37856674194336, "global_step": 224988, "epoch": 1859} {"train_loss": -40.57725143432617, "global_step": 224989, "epoch": 1859} {"train_loss": -40.5875358581543, "global_step": 224990, "epoch": 1859} {"train_loss": -41.07447814941406, "global_step": 224991, "epoch": 1859} {"train_loss": -40.6722526550293, "global_step": 224992, "epoch": 1859} {"train_loss": -40.72776412963867, "global_step": 224993, "epoch": 1859} {"train_loss": -40.71294021606445, "global_step": 224994, "epoch": 1859} {"train_loss": -41.65371322631836, "global_step": 224995, "epoch": 1859} {"train_loss": -41.113037109375, "global_step": 224996, "epoch": 1859} {"train_loss": -40.808074951171875, "global_step": 224997, "epoch": 1859} {"train_loss": -41.626625061035156, "global_step": 224998, "epoch": 1859} {"train_loss": -40.57132339477539, "global_step": 224999, "epoch": 1859} {"train_loss": -39.696041107177734, "global_step": 225000, "epoch": 1859} {"train_loss": -41.54621887207031, "global_step": 225001, "epoch": 1859} {"train_loss": -38.58914566040039, "global_step": 225002, "epoch": 1859} {"train_loss": -40.77927780151367, "global_step": 225003, "epoch": 1859} {"train_loss": -41.03813552856445, "global_step": 225004, "epoch": 1859} {"train_loss": -41.30833053588867, "global_step": 225005, "epoch": 1859} {"train_loss": -40.941932678222656, "global_step": 225006, "epoch": 1859} {"train_loss": -41.0827751159668, "global_step": 225007, "epoch": 1859} {"train_loss": -41.220951080322266, "global_step": 225008, "epoch": 1859} {"train_loss": -40.993038177490234, "global_step": 225009, "epoch": 1859} {"train_loss": -40.971126556396484, "global_step": 225010, "epoch": 1859} {"train_loss": -41.050018310546875, "global_step": 225011, "epoch": 1859} {"train_loss": -40.74160385131836, "global_step": 225012, "epoch": 1859} {"train_loss": -41.5712776184082, "global_step": 225013, "epoch": 1859} {"train_loss": -41.771759033203125, "global_step": 225014, "epoch": 1859} {"train_loss": -40.74147415161133, "global_step": 225015, "epoch": 1859} {"train_loss": -41.73295974731445, "global_step": 225016, "epoch": 1859} {"train_loss": -42.21375274658203, "global_step": 225017, "epoch": 1859} {"train_loss": -42.35207748413086, "global_step": 225018, "epoch": 1859} {"train_loss": -41.19777297973633, "global_step": 225019, "epoch": 1859} {"train_loss": -41.848236083984375, "global_step": 225020, "epoch": 1859} {"train_loss": -41.029850006103516, "global_step": 225021, "epoch": 1859} {"train_loss": -41.862239837646484, "global_step": 225022, "epoch": 1859} {"train_loss": -42.083251953125, "global_step": 225023, "epoch": 1859} {"train_loss": -41.976741790771484, "global_step": 225024, "epoch": 1859} {"train_loss": -42.067264556884766, "global_step": 225025, "epoch": 1859} {"train_loss": -41.93233108520508, "global_step": 225026, "epoch": 1859} {"train_loss": -40.89796829223633, "global_step": 225027, "epoch": 1859} {"train_loss": -40.12382125854492, "global_step": 225028, "epoch": 1859} {"train_loss": -41.141754150390625, "global_step": 225029, "epoch": 1859} {"train_loss": -41.85649490356445, "global_step": 225030, "epoch": 1859} {"train_loss": -39.67312240600586, "global_step": 225031, "epoch": 1859} {"train_loss": -41.66554641723633, "global_step": 225032, "epoch": 1859} {"train_loss": -41.91001510620117, "global_step": 225033, "epoch": 1859} {"train_loss": -41.7984504699707, "global_step": 225034, "epoch": 1859} {"train_loss": -41.93940734863281, "global_step": 225035, "epoch": 1859} {"train_loss": -42.17444610595703, "global_step": 225036, "epoch": 1859} {"train_loss": -41.01426315307617, "global_step": 225037, "epoch": 1859} {"train_loss": -42.01994705200195, "global_step": 225038, "epoch": 1859} {"train_loss": -41.392208099365234, "global_step": 225039, "epoch": 1859} {"train_loss": -41.63739013671875, "global_step": 225040, "epoch": 1859} {"train_loss": -41.8310432434082, "global_step": 225041, "epoch": 1859} {"train_loss": -42.69526290893555, "global_step": 225042, "epoch": 1859} {"train_loss": -42.07612991333008, "global_step": 225043, "epoch": 1859} {"train_loss": -41.44261932373047, "global_step": 225044, "epoch": 1859} {"train_loss": -41.95707702636719, "global_step": 225045, "epoch": 1859} {"train_loss": -40.87750244140625, "global_step": 225046, "epoch": 1859} {"train_loss": -41.33454132080078, "global_step": 225047, "epoch": 1859} {"train_loss": -42.0174446105957, "global_step": 225048, "epoch": 1859} {"train_loss": -41.666194915771484, "global_step": 225049, "epoch": 1859} {"train_loss": -42.562965393066406, "global_step": 225050, "epoch": 1859} {"train_loss": -42.1453971862793, "global_step": 225051, "epoch": 1859} {"train_loss": -42.36883544921875, "global_step": 225052, "epoch": 1859} {"train_loss": -41.5472297668457, "global_step": 225053, "epoch": 1859} {"train_loss": -42.249061584472656, "global_step": 225054, "epoch": 1859} {"train_loss": -42.44050979614258, "global_step": 225055, "epoch": 1859} {"train_loss": -41.839168548583984, "global_step": 225056, "epoch": 1859} {"train_loss": -41.57477951049805, "global_step": 225057, "epoch": 1859} {"train_loss": -41.88175582885742, "global_step": 225058, "epoch": 1859} {"train_loss": -40.00198819814635, "global_step": 225059, "epoch": 1859, "val_loss": 2693191.0} {"train_loss": -41.593299865722656, "global_step": 225060, "epoch": 1860} {"train_loss": -41.047576904296875, "global_step": 225061, "epoch": 1860} {"train_loss": -40.99064254760742, "global_step": 225062, "epoch": 1860} {"train_loss": -40.86830520629883, "global_step": 225063, "epoch": 1860} {"train_loss": -40.47321319580078, "global_step": 225064, "epoch": 1860} {"train_loss": -40.64829635620117, "global_step": 225065, "epoch": 1860} {"train_loss": -41.10774612426758, "global_step": 225066, "epoch": 1860} {"train_loss": -38.37981033325195, "global_step": 225067, "epoch": 1860} {"train_loss": -35.4814453125, "global_step": 225068, "epoch": 1860} {"train_loss": -37.1369743347168, "global_step": 225069, "epoch": 1860} {"train_loss": -40.87590789794922, "global_step": 225070, "epoch": 1860} {"train_loss": -35.703643798828125, "global_step": 225071, "epoch": 1860} {"train_loss": -34.55928421020508, "global_step": 225072, "epoch": 1860} {"train_loss": -38.91215133666992, "global_step": 225073, "epoch": 1860} {"train_loss": -38.670894622802734, "global_step": 225074, "epoch": 1860} {"train_loss": -36.792457580566406, "global_step": 225075, "epoch": 1860} {"train_loss": -38.588356018066406, "global_step": 225076, "epoch": 1860} {"train_loss": -38.15916442871094, "global_step": 225077, "epoch": 1860} {"train_loss": -34.2687873840332, "global_step": 225078, "epoch": 1860} {"train_loss": -38.87667465209961, "global_step": 225079, "epoch": 1860} {"train_loss": -37.184810638427734, "global_step": 225080, "epoch": 1860} {"train_loss": -34.399749755859375, "global_step": 225081, "epoch": 1860} {"train_loss": -37.15358352661133, "global_step": 225082, "epoch": 1860} {"train_loss": -37.23289489746094, "global_step": 225083, "epoch": 1860} {"train_loss": -38.087406158447266, "global_step": 225084, "epoch": 1860} {"train_loss": -38.767578125, "global_step": 225085, "epoch": 1860} {"train_loss": -39.539058685302734, "global_step": 225086, "epoch": 1860} {"train_loss": -40.10896301269531, "global_step": 225087, "epoch": 1860} {"train_loss": -39.4373779296875, "global_step": 225088, "epoch": 1860} {"train_loss": -40.20008087158203, "global_step": 225089, "epoch": 1860} {"train_loss": -39.299964904785156, "global_step": 225090, "epoch": 1860} {"train_loss": -40.3084831237793, "global_step": 225091, "epoch": 1860} {"train_loss": -40.92428207397461, "global_step": 225092, "epoch": 1860} {"train_loss": -40.787940979003906, "global_step": 225093, "epoch": 1860} {"train_loss": -40.87228012084961, "global_step": 225094, "epoch": 1860} {"train_loss": -40.14730453491211, "global_step": 225095, "epoch": 1860} {"train_loss": -41.00360107421875, "global_step": 225096, "epoch": 1860} {"train_loss": -40.071048736572266, "global_step": 225097, "epoch": 1860} {"train_loss": -41.111324310302734, "global_step": 225098, "epoch": 1860} {"train_loss": -40.4874153137207, "global_step": 225099, "epoch": 1860} {"train_loss": -41.16067123413086, "global_step": 225100, "epoch": 1860} {"train_loss": -40.79977035522461, "global_step": 225101, "epoch": 1860} {"train_loss": -40.70817184448242, "global_step": 225102, "epoch": 1860} {"train_loss": -41.46979522705078, "global_step": 225103, "epoch": 1860} {"train_loss": -39.182533264160156, "global_step": 225104, "epoch": 1860} {"train_loss": -41.04289627075195, "global_step": 225105, "epoch": 1860} {"train_loss": -41.124610900878906, "global_step": 225106, "epoch": 1860} {"train_loss": -40.90713882446289, "global_step": 225107, "epoch": 1860} {"train_loss": -41.43500900268555, "global_step": 225108, "epoch": 1860} {"train_loss": -40.62925338745117, "global_step": 225109, "epoch": 1860} {"train_loss": -41.22536849975586, "global_step": 225110, "epoch": 1860} {"train_loss": -40.840118408203125, "global_step": 225111, "epoch": 1860} {"train_loss": -41.14878845214844, "global_step": 225112, "epoch": 1860} {"train_loss": -41.62343215942383, "global_step": 225113, "epoch": 1860} {"train_loss": -41.5800895690918, "global_step": 225114, "epoch": 1860} {"train_loss": -41.078269958496094, "global_step": 225115, "epoch": 1860} {"train_loss": -41.03062057495117, "global_step": 225116, "epoch": 1860} {"train_loss": -40.42112350463867, "global_step": 225117, "epoch": 1860} {"train_loss": -41.173484802246094, "global_step": 225118, "epoch": 1860} {"train_loss": -41.99406433105469, "global_step": 225119, "epoch": 1860} {"train_loss": -41.46991729736328, "global_step": 225120, "epoch": 1860} {"train_loss": -41.460594177246094, "global_step": 225121, "epoch": 1860} {"train_loss": -41.90037155151367, "global_step": 225122, "epoch": 1860} {"train_loss": -40.869869232177734, "global_step": 225123, "epoch": 1860} {"train_loss": -41.92930603027344, "global_step": 225124, "epoch": 1860} {"train_loss": -41.566341400146484, "global_step": 225125, "epoch": 1860} {"train_loss": -41.309017181396484, "global_step": 225126, "epoch": 1860} {"train_loss": -41.69979476928711, "global_step": 225127, "epoch": 1860} {"train_loss": -41.916080474853516, "global_step": 225128, "epoch": 1860} {"train_loss": -41.89918899536133, "global_step": 225129, "epoch": 1860} {"train_loss": -42.23203659057617, "global_step": 225130, "epoch": 1860} {"train_loss": -42.13786697387695, "global_step": 225131, "epoch": 1860} {"train_loss": -41.33439254760742, "global_step": 225132, "epoch": 1860} {"train_loss": -42.45132064819336, "global_step": 225133, "epoch": 1860} {"train_loss": -41.98930358886719, "global_step": 225134, "epoch": 1860} {"train_loss": -42.016822814941406, "global_step": 225135, "epoch": 1860} {"train_loss": -42.56155014038086, "global_step": 225136, "epoch": 1860} {"train_loss": -41.89884567260742, "global_step": 225137, "epoch": 1860} {"train_loss": -41.56917190551758, "global_step": 225138, "epoch": 1860} {"train_loss": -42.121620178222656, "global_step": 225139, "epoch": 1860} {"train_loss": -41.87626266479492, "global_step": 225140, "epoch": 1860} {"train_loss": -41.989410400390625, "global_step": 225141, "epoch": 1860} {"train_loss": -42.28657913208008, "global_step": 225142, "epoch": 1860} {"train_loss": -42.54933547973633, "global_step": 225143, "epoch": 1860} {"train_loss": -42.2242431640625, "global_step": 225144, "epoch": 1860} {"train_loss": -42.3754768371582, "global_step": 225145, "epoch": 1860} {"train_loss": -42.239479064941406, "global_step": 225146, "epoch": 1860} {"train_loss": -42.146236419677734, "global_step": 225147, "epoch": 1860} {"train_loss": -41.518951416015625, "global_step": 225148, "epoch": 1860} {"train_loss": -42.75577926635742, "global_step": 225149, "epoch": 1860} {"train_loss": -42.662445068359375, "global_step": 225150, "epoch": 1860} {"train_loss": -41.97231674194336, "global_step": 225151, "epoch": 1860} {"train_loss": -42.53489303588867, "global_step": 225152, "epoch": 1860} {"train_loss": -42.17513656616211, "global_step": 225153, "epoch": 1860} {"train_loss": -41.09824752807617, "global_step": 225154, "epoch": 1860} {"train_loss": -42.06182861328125, "global_step": 225155, "epoch": 1860} {"train_loss": -42.611419677734375, "global_step": 225156, "epoch": 1860} {"train_loss": -42.94521713256836, "global_step": 225157, "epoch": 1860} {"train_loss": -42.6922492980957, "global_step": 225158, "epoch": 1860} {"train_loss": -42.44130325317383, "global_step": 225159, "epoch": 1860} {"train_loss": -42.05375289916992, "global_step": 225160, "epoch": 1860} {"train_loss": -42.332698822021484, "global_step": 225161, "epoch": 1860} {"train_loss": -41.80281448364258, "global_step": 225162, "epoch": 1860} {"train_loss": -42.8621940612793, "global_step": 225163, "epoch": 1860} {"train_loss": -42.13734436035156, "global_step": 225164, "epoch": 1860} {"train_loss": -42.7441520690918, "global_step": 225165, "epoch": 1860} {"train_loss": -42.93672561645508, "global_step": 225166, "epoch": 1860} {"train_loss": -42.518104553222656, "global_step": 225167, "epoch": 1860} {"train_loss": -42.77683639526367, "global_step": 225168, "epoch": 1860} {"train_loss": -42.64046859741211, "global_step": 225169, "epoch": 1860} {"train_loss": -42.78680419921875, "global_step": 225170, "epoch": 1860} {"train_loss": -41.23143768310547, "global_step": 225171, "epoch": 1860} {"train_loss": -41.7823486328125, "global_step": 225172, "epoch": 1860} {"train_loss": -40.365840911865234, "global_step": 225173, "epoch": 1860} {"train_loss": -42.06482696533203, "global_step": 225174, "epoch": 1860} {"train_loss": -42.683265686035156, "global_step": 225175, "epoch": 1860} {"train_loss": -42.180843353271484, "global_step": 225176, "epoch": 1860} {"train_loss": -42.17414474487305, "global_step": 225177, "epoch": 1860} {"train_loss": -42.552371978759766, "global_step": 225178, "epoch": 1860} {"train_loss": -42.594581604003906, "global_step": 225179, "epoch": 1860} {"train_loss": -40.91238305588399, "global_step": 225180, "epoch": 1860, "val_loss": 2586894.75} {"train_loss": -43.013790130615234, "global_step": 225181, "epoch": 1861} {"train_loss": -42.636199951171875, "global_step": 225182, "epoch": 1861} {"train_loss": -43.01533126831055, "global_step": 225183, "epoch": 1861} {"train_loss": -42.25978469848633, "global_step": 225184, "epoch": 1861} {"train_loss": -42.782264709472656, "global_step": 225185, "epoch": 1861} {"train_loss": -42.85729217529297, "global_step": 225186, "epoch": 1861} {"train_loss": -42.51975631713867, "global_step": 225187, "epoch": 1861} {"train_loss": -42.95814895629883, "global_step": 225188, "epoch": 1861} {"train_loss": -42.68428039550781, "global_step": 225189, "epoch": 1861} {"train_loss": -42.86643600463867, "global_step": 225190, "epoch": 1861} {"train_loss": -42.791141510009766, "global_step": 225191, "epoch": 1861} {"train_loss": -41.32126998901367, "global_step": 225192, "epoch": 1861} {"train_loss": -40.92543411254883, "global_step": 225193, "epoch": 1861} {"train_loss": -42.224727630615234, "global_step": 225194, "epoch": 1861} {"train_loss": -41.18735885620117, "global_step": 225195, "epoch": 1861} {"train_loss": -39.9958610534668, "global_step": 225196, "epoch": 1861} {"train_loss": -42.64444351196289, "global_step": 225197, "epoch": 1861} {"train_loss": -40.240684509277344, "global_step": 225198, "epoch": 1861} {"train_loss": -40.84955978393555, "global_step": 225199, "epoch": 1861} {"train_loss": -42.20284652709961, "global_step": 225200, "epoch": 1861} {"train_loss": -41.274776458740234, "global_step": 225201, "epoch": 1861} {"train_loss": -42.20479202270508, "global_step": 225202, "epoch": 1861} {"train_loss": -42.257747650146484, "global_step": 225203, "epoch": 1861} {"train_loss": -41.98220443725586, "global_step": 225204, "epoch": 1861} {"train_loss": -42.345855712890625, "global_step": 225205, "epoch": 1861} {"train_loss": -41.55743408203125, "global_step": 225206, "epoch": 1861} {"train_loss": -41.79941940307617, "global_step": 225207, "epoch": 1861} {"train_loss": -42.050392150878906, "global_step": 225208, "epoch": 1861} {"train_loss": -41.22990798950195, "global_step": 225209, "epoch": 1861} {"train_loss": -42.25880813598633, "global_step": 225210, "epoch": 1861} {"train_loss": -42.44503402709961, "global_step": 225211, "epoch": 1861} {"train_loss": -41.09465026855469, "global_step": 225212, "epoch": 1861} {"train_loss": -39.38262176513672, "global_step": 225213, "epoch": 1861} {"train_loss": -37.93040084838867, "global_step": 225214, "epoch": 1861} {"train_loss": -39.38583755493164, "global_step": 225215, "epoch": 1861} {"train_loss": -40.5718994140625, "global_step": 225216, "epoch": 1861} {"train_loss": -41.1630973815918, "global_step": 225217, "epoch": 1861} {"train_loss": -38.607967376708984, "global_step": 225218, "epoch": 1861} {"train_loss": -38.237545013427734, "global_step": 225219, "epoch": 1861} {"train_loss": -40.447383880615234, "global_step": 225220, "epoch": 1861} {"train_loss": -40.47458267211914, "global_step": 225221, "epoch": 1861} {"train_loss": -39.854087829589844, "global_step": 225222, "epoch": 1861} {"train_loss": -40.34241485595703, "global_step": 225223, "epoch": 1861} {"train_loss": -40.29948425292969, "global_step": 225224, "epoch": 1861} {"train_loss": -40.32875061035156, "global_step": 225225, "epoch": 1861} {"train_loss": -40.604400634765625, "global_step": 225226, "epoch": 1861} {"train_loss": -40.5561408996582, "global_step": 225227, "epoch": 1861} {"train_loss": -41.040367126464844, "global_step": 225228, "epoch": 1861} {"train_loss": -38.48580551147461, "global_step": 225229, "epoch": 1861} {"train_loss": -39.35288619995117, "global_step": 225230, "epoch": 1861} {"train_loss": -25.234907150268555, "global_step": 225231, "epoch": 1861} {"train_loss": -41.06364822387695, "global_step": 225232, "epoch": 1861} {"train_loss": -39.66085433959961, "global_step": 225233, "epoch": 1861} {"train_loss": -38.84556579589844, "global_step": 225234, "epoch": 1861} {"train_loss": -41.371551513671875, "global_step": 225235, "epoch": 1861} {"train_loss": -39.91077423095703, "global_step": 225236, "epoch": 1861} {"train_loss": -40.728981018066406, "global_step": 225237, "epoch": 1861} {"train_loss": -39.60393142700195, "global_step": 225238, "epoch": 1861} {"train_loss": -37.958438873291016, "global_step": 225239, "epoch": 1861} {"train_loss": -35.22406005859375, "global_step": 225240, "epoch": 1861} {"train_loss": -38.872093200683594, "global_step": 225241, "epoch": 1861} {"train_loss": -32.824859619140625, "global_step": 225242, "epoch": 1861} {"train_loss": -41.12248229980469, "global_step": 225243, "epoch": 1861} {"train_loss": -38.83881378173828, "global_step": 225244, "epoch": 1861} {"train_loss": -35.00368881225586, "global_step": 225245, "epoch": 1861} {"train_loss": -31.864866256713867, "global_step": 225246, "epoch": 1861} {"train_loss": -33.675289154052734, "global_step": 225247, "epoch": 1861} {"train_loss": -37.05438232421875, "global_step": 225248, "epoch": 1861} {"train_loss": -35.83452606201172, "global_step": 225249, "epoch": 1861} {"train_loss": -36.103233337402344, "global_step": 225250, "epoch": 1861} {"train_loss": -39.38389205932617, "global_step": 225251, "epoch": 1861} {"train_loss": -39.15409469604492, "global_step": 225252, "epoch": 1861} {"train_loss": -30.148483276367188, "global_step": 225253, "epoch": 1861} {"train_loss": -38.62335968017578, "global_step": 225254, "epoch": 1861} {"train_loss": -38.82625961303711, "global_step": 225255, "epoch": 1861} {"train_loss": -37.48514175415039, "global_step": 225256, "epoch": 1861} {"train_loss": -20.834150314331055, "global_step": 225257, "epoch": 1861} {"train_loss": -36.3421630859375, "global_step": 225258, "epoch": 1861} {"train_loss": -34.18595504760742, "global_step": 225259, "epoch": 1861} {"train_loss": -37.364376068115234, "global_step": 225260, "epoch": 1861} {"train_loss": -33.73492431640625, "global_step": 225261, "epoch": 1861} {"train_loss": -38.33153533935547, "global_step": 225262, "epoch": 1861} {"train_loss": -32.21451950073242, "global_step": 225263, "epoch": 1861} {"train_loss": -39.561859130859375, "global_step": 225264, "epoch": 1861} {"train_loss": -35.46198272705078, "global_step": 225265, "epoch": 1861} {"train_loss": -38.4688720703125, "global_step": 225266, "epoch": 1861} {"train_loss": -38.75040817260742, "global_step": 225267, "epoch": 1861} {"train_loss": -36.113094329833984, "global_step": 225268, "epoch": 1861} {"train_loss": -39.070289611816406, "global_step": 225269, "epoch": 1861} {"train_loss": -33.647090911865234, "global_step": 225270, "epoch": 1861} {"train_loss": -37.125118255615234, "global_step": 225271, "epoch": 1861} {"train_loss": -37.189308166503906, "global_step": 225272, "epoch": 1861} {"train_loss": -39.09066390991211, "global_step": 225273, "epoch": 1861} {"train_loss": -39.274776458740234, "global_step": 225274, "epoch": 1861} {"train_loss": -36.79370880126953, "global_step": 225275, "epoch": 1861} {"train_loss": -31.173730850219727, "global_step": 225276, "epoch": 1861} {"train_loss": -37.77927017211914, "global_step": 225277, "epoch": 1861} {"train_loss": -36.65536117553711, "global_step": 225278, "epoch": 1861} {"train_loss": -38.261348724365234, "global_step": 225279, "epoch": 1861} {"train_loss": -38.92318344116211, "global_step": 225280, "epoch": 1861} {"train_loss": -38.427162170410156, "global_step": 225281, "epoch": 1861} {"train_loss": -36.83127975463867, "global_step": 225282, "epoch": 1861} {"train_loss": -40.0534782409668, "global_step": 225283, "epoch": 1861} {"train_loss": -39.2347412109375, "global_step": 225284, "epoch": 1861} {"train_loss": -38.621543884277344, "global_step": 225285, "epoch": 1861} {"train_loss": -39.045387268066406, "global_step": 225286, "epoch": 1861} {"train_loss": -40.6118278503418, "global_step": 225287, "epoch": 1861} {"train_loss": -39.95620346069336, "global_step": 225288, "epoch": 1861} {"train_loss": -39.5803108215332, "global_step": 225289, "epoch": 1861} {"train_loss": -40.276710510253906, "global_step": 225290, "epoch": 1861} {"train_loss": -39.950496673583984, "global_step": 225291, "epoch": 1861} {"train_loss": -40.317073822021484, "global_step": 225292, "epoch": 1861} {"train_loss": -39.84770584106445, "global_step": 225293, "epoch": 1861} {"train_loss": -39.6472053527832, "global_step": 225294, "epoch": 1861} {"train_loss": -40.18550491333008, "global_step": 225295, "epoch": 1861} {"train_loss": -39.84364700317383, "global_step": 225296, "epoch": 1861} {"train_loss": -39.74943923950195, "global_step": 225297, "epoch": 1861} {"train_loss": -37.80826950073242, "global_step": 225298, "epoch": 1861} {"train_loss": -40.97112274169922, "global_step": 225299, "epoch": 1861} {"train_loss": -40.43703842163086, "global_step": 225300, "epoch": 1861} {"train_loss": -39.0428072716579, "global_step": 225301, "epoch": 1861, "val_loss": 2647592.75} {"train_loss": -40.34013366699219, "global_step": 225302, "epoch": 1862} {"train_loss": -40.6363410949707, "global_step": 225303, "epoch": 1862} {"train_loss": -40.30825424194336, "global_step": 225304, "epoch": 1862} {"train_loss": -40.232120513916016, "global_step": 225305, "epoch": 1862} {"train_loss": -40.890899658203125, "global_step": 225306, "epoch": 1862} {"train_loss": -40.55792236328125, "global_step": 225307, "epoch": 1862} {"train_loss": -40.747779846191406, "global_step": 225308, "epoch": 1862} {"train_loss": -40.583251953125, "global_step": 225309, "epoch": 1862} {"train_loss": -40.001373291015625, "global_step": 225310, "epoch": 1862} {"train_loss": -40.90126419067383, "global_step": 225311, "epoch": 1862} {"train_loss": -40.8434944152832, "global_step": 225312, "epoch": 1862} {"train_loss": -40.913082122802734, "global_step": 225313, "epoch": 1862} {"train_loss": -40.26350784301758, "global_step": 225314, "epoch": 1862} {"train_loss": -41.27073287963867, "global_step": 225315, "epoch": 1862} {"train_loss": -40.89596176147461, "global_step": 225316, "epoch": 1862} {"train_loss": -41.38640213012695, "global_step": 225317, "epoch": 1862} {"train_loss": -39.839393615722656, "global_step": 225318, "epoch": 1862} {"train_loss": -40.26667404174805, "global_step": 225319, "epoch": 1862} {"train_loss": -40.67229080200195, "global_step": 225320, "epoch": 1862} {"train_loss": -41.09505081176758, "global_step": 225321, "epoch": 1862} {"train_loss": -40.91315841674805, "global_step": 225322, "epoch": 1862} {"train_loss": -40.189308166503906, "global_step": 225323, "epoch": 1862} {"train_loss": -41.39889144897461, "global_step": 225324, "epoch": 1862} {"train_loss": -41.01268768310547, "global_step": 225325, "epoch": 1862} {"train_loss": -40.9663200378418, "global_step": 225326, "epoch": 1862} {"train_loss": -41.15731430053711, "global_step": 225327, "epoch": 1862} {"train_loss": -41.38490295410156, "global_step": 225328, "epoch": 1862} {"train_loss": -41.472469329833984, "global_step": 225329, "epoch": 1862} {"train_loss": -41.703495025634766, "global_step": 225330, "epoch": 1862} {"train_loss": -41.93770980834961, "global_step": 225331, "epoch": 1862} {"train_loss": -41.824729919433594, "global_step": 225332, "epoch": 1862} {"train_loss": -41.02100372314453, "global_step": 225333, "epoch": 1862} {"train_loss": -40.9693603515625, "global_step": 225334, "epoch": 1862} {"train_loss": -41.3228874206543, "global_step": 225335, "epoch": 1862} {"train_loss": -41.226318359375, "global_step": 225336, "epoch": 1862} {"train_loss": -41.064422607421875, "global_step": 225337, "epoch": 1862} {"train_loss": -41.79792404174805, "global_step": 225338, "epoch": 1862} {"train_loss": -41.172786712646484, "global_step": 225339, "epoch": 1862} {"train_loss": -42.2208251953125, "global_step": 225340, "epoch": 1862} {"train_loss": -41.197879791259766, "global_step": 225341, "epoch": 1862} {"train_loss": -41.69358444213867, "global_step": 225342, "epoch": 1862} {"train_loss": -42.031124114990234, "global_step": 225343, "epoch": 1862} {"train_loss": -41.717044830322266, "global_step": 225344, "epoch": 1862} {"train_loss": -42.06629180908203, "global_step": 225345, "epoch": 1862} {"train_loss": -41.774253845214844, "global_step": 225346, "epoch": 1862} {"train_loss": -42.10503387451172, "global_step": 225347, "epoch": 1862} {"train_loss": -41.9054069519043, "global_step": 225348, "epoch": 1862} {"train_loss": -42.31965637207031, "global_step": 225349, "epoch": 1862} {"train_loss": -42.52069854736328, "global_step": 225350, "epoch": 1862} {"train_loss": -41.98675537109375, "global_step": 225351, "epoch": 1862} {"train_loss": -42.371826171875, "global_step": 225352, "epoch": 1862} {"train_loss": -42.3338737487793, "global_step": 225353, "epoch": 1862} {"train_loss": -42.42676544189453, "global_step": 225354, "epoch": 1862} {"train_loss": -41.75596237182617, "global_step": 225355, "epoch": 1862} {"train_loss": -42.47418212890625, "global_step": 225356, "epoch": 1862} {"train_loss": -41.944000244140625, "global_step": 225357, "epoch": 1862} {"train_loss": -42.12620162963867, "global_step": 225358, "epoch": 1862} {"train_loss": -42.45196533203125, "global_step": 225359, "epoch": 1862} {"train_loss": -42.43268585205078, "global_step": 225360, "epoch": 1862} {"train_loss": -41.77701950073242, "global_step": 225361, "epoch": 1862} {"train_loss": -41.925045013427734, "global_step": 225362, "epoch": 1862} {"train_loss": -42.60643005371094, "global_step": 225363, "epoch": 1862} {"train_loss": -42.35923767089844, "global_step": 225364, "epoch": 1862} {"train_loss": -42.40263748168945, "global_step": 225365, "epoch": 1862} {"train_loss": -42.680702209472656, "global_step": 225366, "epoch": 1862} {"train_loss": -42.611907958984375, "global_step": 225367, "epoch": 1862} {"train_loss": -42.76826858520508, "global_step": 225368, "epoch": 1862} {"train_loss": -41.81439971923828, "global_step": 225369, "epoch": 1862} {"train_loss": -42.29817581176758, "global_step": 225370, "epoch": 1862} {"train_loss": -42.607666015625, "global_step": 225371, "epoch": 1862} {"train_loss": -42.7484130859375, "global_step": 225372, "epoch": 1862} {"train_loss": -42.27614974975586, "global_step": 225373, "epoch": 1862} {"train_loss": -42.582027435302734, "global_step": 225374, "epoch": 1862} {"train_loss": -41.85897445678711, "global_step": 225375, "epoch": 1862} {"train_loss": -42.35762405395508, "global_step": 225376, "epoch": 1862} {"train_loss": -42.792232513427734, "global_step": 225377, "epoch": 1862} {"train_loss": -41.12202835083008, "global_step": 225378, "epoch": 1862} {"train_loss": -41.35267639160156, "global_step": 225379, "epoch": 1862} {"train_loss": -40.032989501953125, "global_step": 225380, "epoch": 1862} {"train_loss": -38.93449783325195, "global_step": 225381, "epoch": 1862} {"train_loss": -33.031803131103516, "global_step": 225382, "epoch": 1862} {"train_loss": -26.68549919128418, "global_step": 225383, "epoch": 1862} {"train_loss": -19.553436279296875, "global_step": 225384, "epoch": 1862} {"train_loss": -37.452178955078125, "global_step": 225385, "epoch": 1862} {"train_loss": -34.7484130859375, "global_step": 225386, "epoch": 1862} {"train_loss": -16.837602615356445, "global_step": 225387, "epoch": 1862} {"train_loss": -33.042110443115234, "global_step": 225388, "epoch": 1862} {"train_loss": -36.0011100769043, "global_step": 225389, "epoch": 1862} {"train_loss": -30.675323486328125, "global_step": 225390, "epoch": 1862} {"train_loss": -32.11661148071289, "global_step": 225391, "epoch": 1862} {"train_loss": -32.011695861816406, "global_step": 225392, "epoch": 1862} {"train_loss": -28.951696395874023, "global_step": 225393, "epoch": 1862} {"train_loss": -28.970539093017578, "global_step": 225394, "epoch": 1862} {"train_loss": -30.238367080688477, "global_step": 225395, "epoch": 1862} {"train_loss": -25.10982322692871, "global_step": 225396, "epoch": 1862} {"train_loss": -32.11865997314453, "global_step": 225397, "epoch": 1862} {"train_loss": -18.85968780517578, "global_step": 225398, "epoch": 1862} {"train_loss": -33.52782440185547, "global_step": 225399, "epoch": 1862} {"train_loss": -33.114906311035156, "global_step": 225400, "epoch": 1862} {"train_loss": -28.935773849487305, "global_step": 225401, "epoch": 1862} {"train_loss": -35.36820602416992, "global_step": 225402, "epoch": 1862} {"train_loss": -34.11695098876953, "global_step": 225403, "epoch": 1862} {"train_loss": -37.0310173034668, "global_step": 225404, "epoch": 1862} {"train_loss": -33.65606689453125, "global_step": 225405, "epoch": 1862} {"train_loss": -37.24253463745117, "global_step": 225406, "epoch": 1862} {"train_loss": -39.34613800048828, "global_step": 225407, "epoch": 1862} {"train_loss": -37.425628662109375, "global_step": 225408, "epoch": 1862} {"train_loss": -36.864131927490234, "global_step": 225409, "epoch": 1862} {"train_loss": -38.627197265625, "global_step": 225410, "epoch": 1862} {"train_loss": -38.53705978393555, "global_step": 225411, "epoch": 1862} {"train_loss": -38.745113372802734, "global_step": 225412, "epoch": 1862} {"train_loss": -38.224395751953125, "global_step": 225413, "epoch": 1862} {"train_loss": -38.28871536254883, "global_step": 225414, "epoch": 1862} {"train_loss": -39.11320495605469, "global_step": 225415, "epoch": 1862} {"train_loss": -38.906070709228516, "global_step": 225416, "epoch": 1862} {"train_loss": -39.298118591308594, "global_step": 225417, "epoch": 1862} {"train_loss": -39.13105392456055, "global_step": 225418, "epoch": 1862} {"train_loss": -38.16995620727539, "global_step": 225419, "epoch": 1862} {"train_loss": -38.65498352050781, "global_step": 225420, "epoch": 1862} {"train_loss": -38.96135330200195, "global_step": 225421, "epoch": 1862} {"train_loss": -38.91310261497813, "global_step": 225422, "epoch": 1862, "val_loss": 2588640.75} {"train_loss": -39.8004035949707, "global_step": 225423, "epoch": 1863} {"train_loss": -39.17625045776367, "global_step": 225424, "epoch": 1863} {"train_loss": -39.666847229003906, "global_step": 225425, "epoch": 1863} {"train_loss": -40.18347930908203, "global_step": 225426, "epoch": 1863} {"train_loss": -39.982276916503906, "global_step": 225427, "epoch": 1863} {"train_loss": -39.45755386352539, "global_step": 225428, "epoch": 1863} {"train_loss": -40.145591735839844, "global_step": 225429, "epoch": 1863} {"train_loss": -39.60934066772461, "global_step": 225430, "epoch": 1863} {"train_loss": -40.34464645385742, "global_step": 225431, "epoch": 1863} {"train_loss": -40.128700256347656, "global_step": 225432, "epoch": 1863} {"train_loss": -40.406097412109375, "global_step": 225433, "epoch": 1863} {"train_loss": -40.239288330078125, "global_step": 225434, "epoch": 1863} {"train_loss": -40.29789352416992, "global_step": 225435, "epoch": 1863} {"train_loss": -40.614376068115234, "global_step": 225436, "epoch": 1863} {"train_loss": -40.13367462158203, "global_step": 225437, "epoch": 1863} {"train_loss": -40.7299919128418, "global_step": 225438, "epoch": 1863} {"train_loss": -40.27505111694336, "global_step": 225439, "epoch": 1863} {"train_loss": -40.163673400878906, "global_step": 225440, "epoch": 1863} {"train_loss": -40.949703216552734, "global_step": 225441, "epoch": 1863} {"train_loss": -40.38386917114258, "global_step": 225442, "epoch": 1863} {"train_loss": -40.78017807006836, "global_step": 225443, "epoch": 1863} {"train_loss": -40.153072357177734, "global_step": 225444, "epoch": 1863} {"train_loss": -41.31171798706055, "global_step": 225445, "epoch": 1863} {"train_loss": -40.865108489990234, "global_step": 225446, "epoch": 1863} {"train_loss": -40.31361389160156, "global_step": 225447, "epoch": 1863} {"train_loss": -40.940250396728516, "global_step": 225448, "epoch": 1863} {"train_loss": -41.37459182739258, "global_step": 225449, "epoch": 1863} {"train_loss": -40.098655700683594, "global_step": 225450, "epoch": 1863} {"train_loss": -41.11479568481445, "global_step": 225451, "epoch": 1863} {"train_loss": -40.59917449951172, "global_step": 225452, "epoch": 1863} {"train_loss": -41.32748031616211, "global_step": 225453, "epoch": 1863} {"train_loss": -41.147674560546875, "global_step": 225454, "epoch": 1863} {"train_loss": -41.43390655517578, "global_step": 225455, "epoch": 1863} {"train_loss": -41.16131591796875, "global_step": 225456, "epoch": 1863} {"train_loss": -41.29574203491211, "global_step": 225457, "epoch": 1863} {"train_loss": -41.34502029418945, "global_step": 225458, "epoch": 1863} {"train_loss": -40.858619689941406, "global_step": 225459, "epoch": 1863} {"train_loss": -41.071739196777344, "global_step": 225460, "epoch": 1863} {"train_loss": -41.577125549316406, "global_step": 225461, "epoch": 1863} {"train_loss": -41.45820999145508, "global_step": 225462, "epoch": 1863} {"train_loss": -41.40764236450195, "global_step": 225463, "epoch": 1863} {"train_loss": -41.72101593017578, "global_step": 225464, "epoch": 1863} {"train_loss": -41.53288269042969, "global_step": 225465, "epoch": 1863} {"train_loss": -41.42730712890625, "global_step": 225466, "epoch": 1863} {"train_loss": -41.58066940307617, "global_step": 225467, "epoch": 1863} {"train_loss": -41.35091781616211, "global_step": 225468, "epoch": 1863} {"train_loss": -41.59560775756836, "global_step": 225469, "epoch": 1863} {"train_loss": -41.94625473022461, "global_step": 225470, "epoch": 1863} {"train_loss": -42.061763763427734, "global_step": 225471, "epoch": 1863} {"train_loss": -41.53139877319336, "global_step": 225472, "epoch": 1863} {"train_loss": -42.126792907714844, "global_step": 225473, "epoch": 1863} {"train_loss": -41.253414154052734, "global_step": 225474, "epoch": 1863} {"train_loss": -42.145389556884766, "global_step": 225475, "epoch": 1863} {"train_loss": -41.70134735107422, "global_step": 225476, "epoch": 1863} {"train_loss": -41.47100830078125, "global_step": 225477, "epoch": 1863} {"train_loss": -41.99046325683594, "global_step": 225478, "epoch": 1863} {"train_loss": -42.2062873840332, "global_step": 225479, "epoch": 1863} {"train_loss": -41.85725021362305, "global_step": 225480, "epoch": 1863} {"train_loss": -42.01987075805664, "global_step": 225481, "epoch": 1863} {"train_loss": -42.31357955932617, "global_step": 225482, "epoch": 1863} {"train_loss": -41.5832633972168, "global_step": 225483, "epoch": 1863} {"train_loss": -42.26796340942383, "global_step": 225484, "epoch": 1863} {"train_loss": -41.84473419189453, "global_step": 225485, "epoch": 1863} {"train_loss": -42.463008880615234, "global_step": 225486, "epoch": 1863} {"train_loss": -42.048011779785156, "global_step": 225487, "epoch": 1863} {"train_loss": -42.634925842285156, "global_step": 225488, "epoch": 1863} {"train_loss": -42.33405685424805, "global_step": 225489, "epoch": 1863} {"train_loss": -42.40678787231445, "global_step": 225490, "epoch": 1863} {"train_loss": -41.447017669677734, "global_step": 225491, "epoch": 1863} {"train_loss": -42.26677322387695, "global_step": 225492, "epoch": 1863} {"train_loss": -42.0106315612793, "global_step": 225493, "epoch": 1863} {"train_loss": -42.578975677490234, "global_step": 225494, "epoch": 1863} {"train_loss": -42.34382247924805, "global_step": 225495, "epoch": 1863} {"train_loss": -42.63651657104492, "global_step": 225496, "epoch": 1863} {"train_loss": -42.28315734863281, "global_step": 225497, "epoch": 1863} {"train_loss": -42.30673599243164, "global_step": 225498, "epoch": 1863} {"train_loss": -42.59633255004883, "global_step": 225499, "epoch": 1863} {"train_loss": -41.96492004394531, "global_step": 225500, "epoch": 1863} {"train_loss": -42.7579231262207, "global_step": 225501, "epoch": 1863} {"train_loss": -41.8577995300293, "global_step": 225502, "epoch": 1863} {"train_loss": -42.29879379272461, "global_step": 225503, "epoch": 1863} {"train_loss": -42.418758392333984, "global_step": 225504, "epoch": 1863} {"train_loss": -42.50847244262695, "global_step": 225505, "epoch": 1863} {"train_loss": -42.42635726928711, "global_step": 225506, "epoch": 1863} {"train_loss": -42.455474853515625, "global_step": 225507, "epoch": 1863} {"train_loss": -42.10653305053711, "global_step": 225508, "epoch": 1863} {"train_loss": -42.61284255981445, "global_step": 225509, "epoch": 1863} {"train_loss": -42.395145416259766, "global_step": 225510, "epoch": 1863} {"train_loss": -42.67665100097656, "global_step": 225511, "epoch": 1863} {"train_loss": -42.86813735961914, "global_step": 225512, "epoch": 1863} {"train_loss": -42.75516891479492, "global_step": 225513, "epoch": 1863} {"train_loss": -42.199275970458984, "global_step": 225514, "epoch": 1863} {"train_loss": -42.676063537597656, "global_step": 225515, "epoch": 1863} {"train_loss": -41.588436126708984, "global_step": 225516, "epoch": 1863} {"train_loss": -42.62248992919922, "global_step": 225517, "epoch": 1863} {"train_loss": -42.56394958496094, "global_step": 225518, "epoch": 1863} {"train_loss": -42.141517639160156, "global_step": 225519, "epoch": 1863} {"train_loss": -42.552486419677734, "global_step": 225520, "epoch": 1863} {"train_loss": -42.599510192871094, "global_step": 225521, "epoch": 1863} {"train_loss": -42.13621139526367, "global_step": 225522, "epoch": 1863} {"train_loss": -41.35372543334961, "global_step": 225523, "epoch": 1863} {"train_loss": -39.14053726196289, "global_step": 225524, "epoch": 1863} {"train_loss": -37.39848709106445, "global_step": 225525, "epoch": 1863} {"train_loss": -39.253257751464844, "global_step": 225526, "epoch": 1863} {"train_loss": -38.935970306396484, "global_step": 225527, "epoch": 1863} {"train_loss": -34.11466979980469, "global_step": 225528, "epoch": 1863} {"train_loss": -17.52596092224121, "global_step": 225529, "epoch": 1863} {"train_loss": -3.5304715633392334, "global_step": 225530, "epoch": 1863} {"train_loss": -13.832262992858887, "global_step": 225531, "epoch": 1863} {"train_loss": -35.32465744018555, "global_step": 225532, "epoch": 1863} {"train_loss": -23.195093154907227, "global_step": 225533, "epoch": 1863} {"train_loss": -29.236896514892578, "global_step": 225534, "epoch": 1863} {"train_loss": -30.0966796875, "global_step": 225535, "epoch": 1863} {"train_loss": -32.77167510986328, "global_step": 225536, "epoch": 1863} {"train_loss": -33.1054573059082, "global_step": 225537, "epoch": 1863} {"train_loss": -32.5230712890625, "global_step": 225538, "epoch": 1863} {"train_loss": -35.097259521484375, "global_step": 225539, "epoch": 1863} {"train_loss": -35.68080520629883, "global_step": 225540, "epoch": 1863} {"train_loss": -36.50214767456055, "global_step": 225541, "epoch": 1863} {"train_loss": -33.4498176574707, "global_step": 225542, "epoch": 1863} {"train_loss": -39.75229634332263, "global_step": 225543, "epoch": 1863, "val_loss": 2527043.25} {"train_loss": -34.4001579284668, "global_step": 225544, "epoch": 1864} {"train_loss": -37.863746643066406, "global_step": 225545, "epoch": 1864} {"train_loss": -37.913570404052734, "global_step": 225546, "epoch": 1864} {"train_loss": -36.72883224487305, "global_step": 225547, "epoch": 1864} {"train_loss": -38.55526351928711, "global_step": 225548, "epoch": 1864} {"train_loss": -38.05916976928711, "global_step": 225549, "epoch": 1864} {"train_loss": -39.094539642333984, "global_step": 225550, "epoch": 1864} {"train_loss": -39.23484420776367, "global_step": 225551, "epoch": 1864} {"train_loss": -38.56630325317383, "global_step": 225552, "epoch": 1864} {"train_loss": -39.80470657348633, "global_step": 225553, "epoch": 1864} {"train_loss": -38.12783432006836, "global_step": 225554, "epoch": 1864} {"train_loss": -39.10554885864258, "global_step": 225555, "epoch": 1864} {"train_loss": -39.62069320678711, "global_step": 225556, "epoch": 1864} {"train_loss": -39.02436828613281, "global_step": 225557, "epoch": 1864} {"train_loss": -39.137786865234375, "global_step": 225558, "epoch": 1864} {"train_loss": -39.923805236816406, "global_step": 225559, "epoch": 1864} {"train_loss": -39.76615524291992, "global_step": 225560, "epoch": 1864} {"train_loss": -39.79716873168945, "global_step": 225561, "epoch": 1864} {"train_loss": -39.37974548339844, "global_step": 225562, "epoch": 1864} {"train_loss": -39.66184616088867, "global_step": 225563, "epoch": 1864} {"train_loss": -39.8236083984375, "global_step": 225564, "epoch": 1864} {"train_loss": -40.17747116088867, "global_step": 225565, "epoch": 1864} {"train_loss": -40.58182907104492, "global_step": 225566, "epoch": 1864} {"train_loss": -40.5362663269043, "global_step": 225567, "epoch": 1864} {"train_loss": -40.2421989440918, "global_step": 225568, "epoch": 1864} {"train_loss": -39.16763687133789, "global_step": 225569, "epoch": 1864} {"train_loss": -40.59475326538086, "global_step": 225570, "epoch": 1864} {"train_loss": -40.60979461669922, "global_step": 225571, "epoch": 1864} {"train_loss": -40.68343734741211, "global_step": 225572, "epoch": 1864} {"train_loss": -40.7980842590332, "global_step": 225573, "epoch": 1864} {"train_loss": -40.72128677368164, "global_step": 225574, "epoch": 1864} {"train_loss": -40.5236701965332, "global_step": 225575, "epoch": 1864} {"train_loss": -40.792449951171875, "global_step": 225576, "epoch": 1864} {"train_loss": -40.943607330322266, "global_step": 225577, "epoch": 1864} {"train_loss": -40.919307708740234, "global_step": 225578, "epoch": 1864} {"train_loss": -40.873863220214844, "global_step": 225579, "epoch": 1864} {"train_loss": -40.8764762878418, "global_step": 225580, "epoch": 1864} {"train_loss": -41.0938835144043, "global_step": 225581, "epoch": 1864} {"train_loss": -41.18941116333008, "global_step": 225582, "epoch": 1864} {"train_loss": -39.289459228515625, "global_step": 225583, "epoch": 1864} {"train_loss": -40.998409271240234, "global_step": 225584, "epoch": 1864} {"train_loss": -41.27675247192383, "global_step": 225585, "epoch": 1864} {"train_loss": -41.365901947021484, "global_step": 225586, "epoch": 1864} {"train_loss": -41.117042541503906, "global_step": 225587, "epoch": 1864} {"train_loss": -41.21278762817383, "global_step": 225588, "epoch": 1864} {"train_loss": -41.1875, "global_step": 225589, "epoch": 1864} {"train_loss": -40.90067672729492, "global_step": 225590, "epoch": 1864} {"train_loss": -41.205074310302734, "global_step": 225591, "epoch": 1864} {"train_loss": -41.1759033203125, "global_step": 225592, "epoch": 1864} {"train_loss": -41.28181457519531, "global_step": 225593, "epoch": 1864} {"train_loss": -41.600135803222656, "global_step": 225594, "epoch": 1864} {"train_loss": -41.63077926635742, "global_step": 225595, "epoch": 1864} {"train_loss": -41.6601676940918, "global_step": 225596, "epoch": 1864} {"train_loss": -39.68408966064453, "global_step": 225597, "epoch": 1864} {"train_loss": -41.62240219116211, "global_step": 225598, "epoch": 1864} {"train_loss": -41.539859771728516, "global_step": 225599, "epoch": 1864} {"train_loss": -41.6741943359375, "global_step": 225600, "epoch": 1864} {"train_loss": -41.46561813354492, "global_step": 225601, "epoch": 1864} {"train_loss": -41.4813346862793, "global_step": 225602, "epoch": 1864} {"train_loss": -41.552154541015625, "global_step": 225603, "epoch": 1864} {"train_loss": -41.41012191772461, "global_step": 225604, "epoch": 1864} {"train_loss": -41.74065017700195, "global_step": 225605, "epoch": 1864} {"train_loss": -41.58051300048828, "global_step": 225606, "epoch": 1864} {"train_loss": -41.92666244506836, "global_step": 225607, "epoch": 1864} {"train_loss": -41.62275695800781, "global_step": 225608, "epoch": 1864} {"train_loss": -41.63955307006836, "global_step": 225609, "epoch": 1864} {"train_loss": -41.93191146850586, "global_step": 225610, "epoch": 1864} {"train_loss": -41.85173416137695, "global_step": 225611, "epoch": 1864} {"train_loss": -42.04707717895508, "global_step": 225612, "epoch": 1864} {"train_loss": -41.92641067504883, "global_step": 225613, "epoch": 1864} {"train_loss": -42.08038330078125, "global_step": 225614, "epoch": 1864} {"train_loss": -39.99296188354492, "global_step": 225615, "epoch": 1864} {"train_loss": -41.887298583984375, "global_step": 225616, "epoch": 1864} {"train_loss": -42.112159729003906, "global_step": 225617, "epoch": 1864} {"train_loss": -42.15172576904297, "global_step": 225618, "epoch": 1864} {"train_loss": -42.4675178527832, "global_step": 225619, "epoch": 1864} {"train_loss": -42.20927047729492, "global_step": 225620, "epoch": 1864} {"train_loss": -42.372989654541016, "global_step": 225621, "epoch": 1864} {"train_loss": -42.07398223876953, "global_step": 225622, "epoch": 1864} {"train_loss": -40.19712448120117, "global_step": 225623, "epoch": 1864} {"train_loss": -41.77545928955078, "global_step": 225624, "epoch": 1864} {"train_loss": -42.48020553588867, "global_step": 225625, "epoch": 1864} {"train_loss": -41.856788635253906, "global_step": 225626, "epoch": 1864} {"train_loss": -41.6805534362793, "global_step": 225627, "epoch": 1864} {"train_loss": -42.48012924194336, "global_step": 225628, "epoch": 1864} {"train_loss": -42.38210678100586, "global_step": 225629, "epoch": 1864} {"train_loss": -42.576515197753906, "global_step": 225630, "epoch": 1864} {"train_loss": -41.548091888427734, "global_step": 225631, "epoch": 1864} {"train_loss": -42.67256546020508, "global_step": 225632, "epoch": 1864} {"train_loss": -42.41996383666992, "global_step": 225633, "epoch": 1864} {"train_loss": -42.180599212646484, "global_step": 225634, "epoch": 1864} {"train_loss": -42.7271728515625, "global_step": 225635, "epoch": 1864} {"train_loss": -42.32050704956055, "global_step": 225636, "epoch": 1864} {"train_loss": -42.501800537109375, "global_step": 225637, "epoch": 1864} {"train_loss": -42.23307418823242, "global_step": 225638, "epoch": 1864} {"train_loss": -42.47227096557617, "global_step": 225639, "epoch": 1864} {"train_loss": -42.528316497802734, "global_step": 225640, "epoch": 1864} {"train_loss": -42.800262451171875, "global_step": 225641, "epoch": 1864} {"train_loss": -42.0590934753418, "global_step": 225642, "epoch": 1864} {"train_loss": -42.37752914428711, "global_step": 225643, "epoch": 1864} {"train_loss": -42.306339263916016, "global_step": 225644, "epoch": 1864} {"train_loss": -42.23002243041992, "global_step": 225645, "epoch": 1864} {"train_loss": -42.52980422973633, "global_step": 225646, "epoch": 1864} {"train_loss": -42.10600280761719, "global_step": 225647, "epoch": 1864} {"train_loss": -42.20664596557617, "global_step": 225648, "epoch": 1864} {"train_loss": -40.70122146606445, "global_step": 225649, "epoch": 1864} {"train_loss": -42.800289154052734, "global_step": 225650, "epoch": 1864} {"train_loss": -41.87495040893555, "global_step": 225651, "epoch": 1864} {"train_loss": -42.96238327026367, "global_step": 225652, "epoch": 1864} {"train_loss": -42.7855339050293, "global_step": 225653, "epoch": 1864} {"train_loss": -42.78888702392578, "global_step": 225654, "epoch": 1864} {"train_loss": -42.656063079833984, "global_step": 225655, "epoch": 1864} {"train_loss": -43.24744415283203, "global_step": 225656, "epoch": 1864} {"train_loss": -42.5782585144043, "global_step": 225657, "epoch": 1864} {"train_loss": -42.53718566894531, "global_step": 225658, "epoch": 1864} {"train_loss": -43.30024337768555, "global_step": 225659, "epoch": 1864} {"train_loss": -42.9513053894043, "global_step": 225660, "epoch": 1864} {"train_loss": -42.756961822509766, "global_step": 225661, "epoch": 1864} {"train_loss": -43.04206085205078, "global_step": 225662, "epoch": 1864} {"train_loss": -42.46316146850586, "global_step": 225663, "epoch": 1864} {"train_loss": -41.19243230898518, "global_step": 225664, "epoch": 1864, "val_loss": 2666061.75} {"train_loss": -42.785465240478516, "global_step": 225665, "epoch": 1865} {"train_loss": -42.411922454833984, "global_step": 225666, "epoch": 1865} {"train_loss": -43.172523498535156, "global_step": 225667, "epoch": 1865} {"train_loss": -42.567970275878906, "global_step": 225668, "epoch": 1865} {"train_loss": -43.07821273803711, "global_step": 225669, "epoch": 1865} {"train_loss": -42.24181365966797, "global_step": 225670, "epoch": 1865} {"train_loss": -40.80083465576172, "global_step": 225671, "epoch": 1865} {"train_loss": -42.77161407470703, "global_step": 225672, "epoch": 1865} {"train_loss": -41.996360778808594, "global_step": 225673, "epoch": 1865} {"train_loss": -42.0779914855957, "global_step": 225674, "epoch": 1865} {"train_loss": -42.70457077026367, "global_step": 225675, "epoch": 1865} {"train_loss": -42.27752685546875, "global_step": 225676, "epoch": 1865} {"train_loss": -42.22983932495117, "global_step": 225677, "epoch": 1865} {"train_loss": -43.35073471069336, "global_step": 225678, "epoch": 1865} {"train_loss": -42.8143424987793, "global_step": 225679, "epoch": 1865} {"train_loss": -41.38416290283203, "global_step": 225680, "epoch": 1865} {"train_loss": -43.08319091796875, "global_step": 225681, "epoch": 1865} {"train_loss": -42.40082931518555, "global_step": 225682, "epoch": 1865} {"train_loss": -43.17341232299805, "global_step": 225683, "epoch": 1865} {"train_loss": -42.66798782348633, "global_step": 225684, "epoch": 1865} {"train_loss": -43.21556091308594, "global_step": 225685, "epoch": 1865} {"train_loss": -42.696929931640625, "global_step": 225686, "epoch": 1865} {"train_loss": -42.1098747253418, "global_step": 225687, "epoch": 1865} {"train_loss": -42.07551574707031, "global_step": 225688, "epoch": 1865} {"train_loss": -42.50484848022461, "global_step": 225689, "epoch": 1865} {"train_loss": -42.70345687866211, "global_step": 225690, "epoch": 1865} {"train_loss": -42.3946647644043, "global_step": 225691, "epoch": 1865} {"train_loss": -42.67037582397461, "global_step": 225692, "epoch": 1865} {"train_loss": -42.689002990722656, "global_step": 225693, "epoch": 1865} {"train_loss": -42.21922302246094, "global_step": 225694, "epoch": 1865} {"train_loss": -41.96670150756836, "global_step": 225695, "epoch": 1865} {"train_loss": -42.62363052368164, "global_step": 225696, "epoch": 1865} {"train_loss": -42.38282775878906, "global_step": 225697, "epoch": 1865} {"train_loss": -42.23090362548828, "global_step": 225698, "epoch": 1865} {"train_loss": -42.56170654296875, "global_step": 225699, "epoch": 1865} {"train_loss": -42.205223083496094, "global_step": 225700, "epoch": 1865} {"train_loss": -42.59601974487305, "global_step": 225701, "epoch": 1865} {"train_loss": -42.161651611328125, "global_step": 225702, "epoch": 1865} {"train_loss": -41.454586029052734, "global_step": 225703, "epoch": 1865} {"train_loss": -38.35646438598633, "global_step": 225704, "epoch": 1865} {"train_loss": -42.3443489074707, "global_step": 225705, "epoch": 1865} {"train_loss": -40.49150848388672, "global_step": 225706, "epoch": 1865} {"train_loss": -42.54917526245117, "global_step": 225707, "epoch": 1865} {"train_loss": -42.42060470581055, "global_step": 225708, "epoch": 1865} {"train_loss": -41.98646926879883, "global_step": 225709, "epoch": 1865} {"train_loss": -38.518882751464844, "global_step": 225710, "epoch": 1865} {"train_loss": -40.74663162231445, "global_step": 225711, "epoch": 1865} {"train_loss": -39.81842041015625, "global_step": 225712, "epoch": 1865} {"train_loss": -32.4665641784668, "global_step": 225713, "epoch": 1865} {"train_loss": -39.80805587768555, "global_step": 225714, "epoch": 1865} {"train_loss": -41.066890716552734, "global_step": 225715, "epoch": 1865} {"train_loss": -41.378143310546875, "global_step": 225716, "epoch": 1865} {"train_loss": -37.91338348388672, "global_step": 225717, "epoch": 1865} {"train_loss": -34.5335693359375, "global_step": 225718, "epoch": 1865} {"train_loss": -36.578834533691406, "global_step": 225719, "epoch": 1865} {"train_loss": -40.29435348510742, "global_step": 225720, "epoch": 1865} {"train_loss": -39.984439849853516, "global_step": 225721, "epoch": 1865} {"train_loss": -40.0836296081543, "global_step": 225722, "epoch": 1865} {"train_loss": -37.97943115234375, "global_step": 225723, "epoch": 1865} {"train_loss": -38.06443786621094, "global_step": 225724, "epoch": 1865} {"train_loss": -39.839393615722656, "global_step": 225725, "epoch": 1865} {"train_loss": -39.22032928466797, "global_step": 225726, "epoch": 1865} {"train_loss": -39.53178024291992, "global_step": 225727, "epoch": 1865} {"train_loss": -40.16969680786133, "global_step": 225728, "epoch": 1865} {"train_loss": -41.7646369934082, "global_step": 225729, "epoch": 1865} {"train_loss": -38.14150619506836, "global_step": 225730, "epoch": 1865} {"train_loss": -41.67097091674805, "global_step": 225731, "epoch": 1865} {"train_loss": -39.17024612426758, "global_step": 225732, "epoch": 1865} {"train_loss": -39.73687744140625, "global_step": 225733, "epoch": 1865} {"train_loss": -38.58407211303711, "global_step": 225734, "epoch": 1865} {"train_loss": -40.74945831298828, "global_step": 225735, "epoch": 1865} {"train_loss": -40.43192672729492, "global_step": 225736, "epoch": 1865} {"train_loss": -41.809993743896484, "global_step": 225737, "epoch": 1865} {"train_loss": -36.01108932495117, "global_step": 225738, "epoch": 1865} {"train_loss": -30.575271606445312, "global_step": 225739, "epoch": 1865} {"train_loss": -38.80323791503906, "global_step": 225740, "epoch": 1865} {"train_loss": -37.791290283203125, "global_step": 225741, "epoch": 1865} {"train_loss": -39.69267272949219, "global_step": 225742, "epoch": 1865} {"train_loss": -39.27998733520508, "global_step": 225743, "epoch": 1865} {"train_loss": -38.40128707885742, "global_step": 225744, "epoch": 1865} {"train_loss": -40.93943786621094, "global_step": 225745, "epoch": 1865} {"train_loss": -41.502742767333984, "global_step": 225746, "epoch": 1865} {"train_loss": -40.57595443725586, "global_step": 225747, "epoch": 1865} {"train_loss": -41.30269241333008, "global_step": 225748, "epoch": 1865} {"train_loss": -40.25756072998047, "global_step": 225749, "epoch": 1865} {"train_loss": -39.04606628417969, "global_step": 225750, "epoch": 1865} {"train_loss": -39.373046875, "global_step": 225751, "epoch": 1865} {"train_loss": -40.34128952026367, "global_step": 225752, "epoch": 1865} {"train_loss": -40.951663970947266, "global_step": 225753, "epoch": 1865} {"train_loss": -40.67423629760742, "global_step": 225754, "epoch": 1865} {"train_loss": -37.52043914794922, "global_step": 225755, "epoch": 1865} {"train_loss": -37.985939025878906, "global_step": 225756, "epoch": 1865} {"train_loss": -39.60601806640625, "global_step": 225757, "epoch": 1865} {"train_loss": -35.68288040161133, "global_step": 225758, "epoch": 1865} {"train_loss": -41.05460739135742, "global_step": 225759, "epoch": 1865} {"train_loss": -41.07110595703125, "global_step": 225760, "epoch": 1865} {"train_loss": -41.2946662902832, "global_step": 225761, "epoch": 1865} {"train_loss": -40.96511459350586, "global_step": 225762, "epoch": 1865} {"train_loss": -40.59981155395508, "global_step": 225763, "epoch": 1865} {"train_loss": -39.21034240722656, "global_step": 225764, "epoch": 1865} {"train_loss": -37.693389892578125, "global_step": 225765, "epoch": 1865} {"train_loss": -39.19443130493164, "global_step": 225766, "epoch": 1865} {"train_loss": -39.442344665527344, "global_step": 225767, "epoch": 1865} {"train_loss": -40.97311019897461, "global_step": 225768, "epoch": 1865} {"train_loss": -38.27462387084961, "global_step": 225769, "epoch": 1865} {"train_loss": -40.14814376831055, "global_step": 225770, "epoch": 1865} {"train_loss": -40.90994644165039, "global_step": 225771, "epoch": 1865} {"train_loss": -41.499629974365234, "global_step": 225772, "epoch": 1865} {"train_loss": -41.707515716552734, "global_step": 225773, "epoch": 1865} {"train_loss": -40.089447021484375, "global_step": 225774, "epoch": 1865} {"train_loss": -39.69561767578125, "global_step": 225775, "epoch": 1865} {"train_loss": -40.885719299316406, "global_step": 225776, "epoch": 1865} {"train_loss": -40.890953063964844, "global_step": 225777, "epoch": 1865} {"train_loss": -41.49936294555664, "global_step": 225778, "epoch": 1865} {"train_loss": -42.158931732177734, "global_step": 225779, "epoch": 1865} {"train_loss": -41.8631591796875, "global_step": 225780, "epoch": 1865} {"train_loss": -41.93168258666992, "global_step": 225781, "epoch": 1865} {"train_loss": -41.7940673828125, "global_step": 225782, "epoch": 1865} {"train_loss": -41.760581970214844, "global_step": 225783, "epoch": 1865} {"train_loss": -41.63125228881836, "global_step": 225784, "epoch": 1865} {"train_loss": -40.65874777549554, "global_step": 225785, "epoch": 1865, "val_loss": 2702829.25} {"train_loss": -37.80471420288086, "global_step": 225786, "epoch": 1866} {"train_loss": -41.82602310180664, "global_step": 225787, "epoch": 1866} {"train_loss": -41.581932067871094, "global_step": 225788, "epoch": 1866} {"train_loss": -40.10977554321289, "global_step": 225789, "epoch": 1866} {"train_loss": -41.02548599243164, "global_step": 225790, "epoch": 1866} {"train_loss": -41.446590423583984, "global_step": 225791, "epoch": 1866} {"train_loss": -41.91705322265625, "global_step": 225792, "epoch": 1866} {"train_loss": -41.79411697387695, "global_step": 225793, "epoch": 1866} {"train_loss": -41.45050811767578, "global_step": 225794, "epoch": 1866} {"train_loss": -40.218196868896484, "global_step": 225795, "epoch": 1866} {"train_loss": -41.89860153198242, "global_step": 225796, "epoch": 1866} {"train_loss": -42.52018356323242, "global_step": 225797, "epoch": 1866} {"train_loss": -42.02303695678711, "global_step": 225798, "epoch": 1866} {"train_loss": -41.42564010620117, "global_step": 225799, "epoch": 1866} {"train_loss": -41.61476516723633, "global_step": 225800, "epoch": 1866} {"train_loss": -40.76605987548828, "global_step": 225801, "epoch": 1866} {"train_loss": -41.70806121826172, "global_step": 225802, "epoch": 1866} {"train_loss": -41.61801528930664, "global_step": 225803, "epoch": 1866} {"train_loss": -40.56604766845703, "global_step": 225804, "epoch": 1866} {"train_loss": -41.71306610107422, "global_step": 225805, "epoch": 1866} {"train_loss": -41.67548751831055, "global_step": 225806, "epoch": 1866} {"train_loss": -42.31132125854492, "global_step": 225807, "epoch": 1866} {"train_loss": -42.2289924621582, "global_step": 225808, "epoch": 1866} {"train_loss": -42.54146957397461, "global_step": 225809, "epoch": 1866} {"train_loss": -42.27171325683594, "global_step": 225810, "epoch": 1866} {"train_loss": -41.38557434082031, "global_step": 225811, "epoch": 1866} {"train_loss": -42.97719955444336, "global_step": 225812, "epoch": 1866} {"train_loss": -42.41823959350586, "global_step": 225813, "epoch": 1866} {"train_loss": -42.19715118408203, "global_step": 225814, "epoch": 1866} {"train_loss": -42.0589485168457, "global_step": 225815, "epoch": 1866} {"train_loss": -42.51572799682617, "global_step": 225816, "epoch": 1866} {"train_loss": -40.61421585083008, "global_step": 225817, "epoch": 1866} {"train_loss": -42.702423095703125, "global_step": 225818, "epoch": 1866} {"train_loss": -42.10836410522461, "global_step": 225819, "epoch": 1866} {"train_loss": -42.67729568481445, "global_step": 225820, "epoch": 1866} {"train_loss": -42.30611801147461, "global_step": 225821, "epoch": 1866} {"train_loss": -42.45661163330078, "global_step": 225822, "epoch": 1866} {"train_loss": -42.434749603271484, "global_step": 225823, "epoch": 1866} {"train_loss": -42.04464340209961, "global_step": 225824, "epoch": 1866} {"train_loss": -42.483211517333984, "global_step": 225825, "epoch": 1866} {"train_loss": -42.85016632080078, "global_step": 225826, "epoch": 1866} {"train_loss": -42.924171447753906, "global_step": 225827, "epoch": 1866} {"train_loss": -42.62674331665039, "global_step": 225828, "epoch": 1866} {"train_loss": -42.57732009887695, "global_step": 225829, "epoch": 1866} {"train_loss": -42.645179748535156, "global_step": 225830, "epoch": 1866} {"train_loss": -42.789283752441406, "global_step": 225831, "epoch": 1866} {"train_loss": -43.26471710205078, "global_step": 225832, "epoch": 1866} {"train_loss": -42.116519927978516, "global_step": 225833, "epoch": 1866} {"train_loss": -42.811676025390625, "global_step": 225834, "epoch": 1866} {"train_loss": -40.130767822265625, "global_step": 225835, "epoch": 1866} {"train_loss": -42.85443878173828, "global_step": 225836, "epoch": 1866} {"train_loss": -42.621307373046875, "global_step": 225837, "epoch": 1866} {"train_loss": -41.465576171875, "global_step": 225838, "epoch": 1866} {"train_loss": -41.82135772705078, "global_step": 225839, "epoch": 1866} {"train_loss": -41.58722686767578, "global_step": 225840, "epoch": 1866} {"train_loss": -42.75605010986328, "global_step": 225841, "epoch": 1866} {"train_loss": -42.10586166381836, "global_step": 225842, "epoch": 1866} {"train_loss": -42.52197265625, "global_step": 225843, "epoch": 1866} {"train_loss": -43.0426025390625, "global_step": 225844, "epoch": 1866} {"train_loss": -41.72024154663086, "global_step": 225845, "epoch": 1866} {"train_loss": -41.782432556152344, "global_step": 225846, "epoch": 1866} {"train_loss": -42.179744720458984, "global_step": 225847, "epoch": 1866} {"train_loss": -42.315372467041016, "global_step": 225848, "epoch": 1866} {"train_loss": -42.12836456298828, "global_step": 225849, "epoch": 1866} {"train_loss": -41.15267562866211, "global_step": 225850, "epoch": 1866} {"train_loss": -41.59148406982422, "global_step": 225851, "epoch": 1866} {"train_loss": -41.73881912231445, "global_step": 225852, "epoch": 1866} {"train_loss": -41.76975631713867, "global_step": 225853, "epoch": 1866} {"train_loss": -41.54146957397461, "global_step": 225854, "epoch": 1866} {"train_loss": -42.0629997253418, "global_step": 225855, "epoch": 1866} {"train_loss": -41.86151885986328, "global_step": 225856, "epoch": 1866} {"train_loss": -42.38216781616211, "global_step": 225857, "epoch": 1866} {"train_loss": -42.6596794128418, "global_step": 225858, "epoch": 1866} {"train_loss": -41.92829895019531, "global_step": 225859, "epoch": 1866} {"train_loss": -42.0653190612793, "global_step": 225860, "epoch": 1866} {"train_loss": -41.8912239074707, "global_step": 225861, "epoch": 1866} {"train_loss": -41.9558219909668, "global_step": 225862, "epoch": 1866} {"train_loss": -42.29954528808594, "global_step": 225863, "epoch": 1866} {"train_loss": -41.8823356628418, "global_step": 225864, "epoch": 1866} {"train_loss": -42.51577377319336, "global_step": 225865, "epoch": 1866} {"train_loss": -42.162593841552734, "global_step": 225866, "epoch": 1866} {"train_loss": -42.01821517944336, "global_step": 225867, "epoch": 1866} {"train_loss": -40.95381546020508, "global_step": 225868, "epoch": 1866} {"train_loss": -41.864295959472656, "global_step": 225869, "epoch": 1866} {"train_loss": -42.073890686035156, "global_step": 225870, "epoch": 1866} {"train_loss": -41.98234558105469, "global_step": 225871, "epoch": 1866} {"train_loss": -40.49869918823242, "global_step": 225872, "epoch": 1866} {"train_loss": -43.6246337890625, "global_step": 225873, "epoch": 1866} {"train_loss": -42.08964920043945, "global_step": 225874, "epoch": 1866} {"train_loss": -41.692237854003906, "global_step": 225875, "epoch": 1866} {"train_loss": -42.01652145385742, "global_step": 225876, "epoch": 1866} {"train_loss": -39.21647262573242, "global_step": 225877, "epoch": 1866} {"train_loss": -40.990516662597656, "global_step": 225878, "epoch": 1866} {"train_loss": -40.9954948425293, "global_step": 225879, "epoch": 1866} {"train_loss": -41.44554901123047, "global_step": 225880, "epoch": 1866} {"train_loss": -39.60591506958008, "global_step": 225881, "epoch": 1866} {"train_loss": -41.916046142578125, "global_step": 225882, "epoch": 1866} {"train_loss": -42.18400192260742, "global_step": 225883, "epoch": 1866} {"train_loss": -42.215511322021484, "global_step": 225884, "epoch": 1866} {"train_loss": -40.5793571472168, "global_step": 225885, "epoch": 1866} {"train_loss": -41.69009017944336, "global_step": 225886, "epoch": 1866} {"train_loss": -40.59269332885742, "global_step": 225887, "epoch": 1866} {"train_loss": -41.727325439453125, "global_step": 225888, "epoch": 1866} {"train_loss": -42.450042724609375, "global_step": 225889, "epoch": 1866} {"train_loss": -40.09214401245117, "global_step": 225890, "epoch": 1866} {"train_loss": -41.6991081237793, "global_step": 225891, "epoch": 1866} {"train_loss": -40.24809646606445, "global_step": 225892, "epoch": 1866} {"train_loss": -41.48740768432617, "global_step": 225893, "epoch": 1866} {"train_loss": -40.79789352416992, "global_step": 225894, "epoch": 1866} {"train_loss": -35.29764175415039, "global_step": 225895, "epoch": 1866} {"train_loss": -38.72811508178711, "global_step": 225896, "epoch": 1866} {"train_loss": -37.34624099731445, "global_step": 225897, "epoch": 1866} {"train_loss": -39.88093948364258, "global_step": 225898, "epoch": 1866} {"train_loss": -41.66486358642578, "global_step": 225899, "epoch": 1866} {"train_loss": -40.99311065673828, "global_step": 225900, "epoch": 1866} {"train_loss": -40.77729034423828, "global_step": 225901, "epoch": 1866} {"train_loss": -39.67649841308594, "global_step": 225902, "epoch": 1866} {"train_loss": -40.496517181396484, "global_step": 225903, "epoch": 1866} {"train_loss": -40.97843933105469, "global_step": 225904, "epoch": 1866} {"train_loss": -41.86552429199219, "global_step": 225905, "epoch": 1866} {"train_loss": -41.62998971860271, "global_step": 225906, "epoch": 1866, "val_loss": 2638553.5} {"train_loss": -42.14569091796875, "global_step": 225907, "epoch": 1867} {"train_loss": -42.08205795288086, "global_step": 225908, "epoch": 1867} {"train_loss": -41.562618255615234, "global_step": 225909, "epoch": 1867} {"train_loss": -40.01271438598633, "global_step": 225910, "epoch": 1867} {"train_loss": -42.302242279052734, "global_step": 225911, "epoch": 1867} {"train_loss": -40.5531005859375, "global_step": 225912, "epoch": 1867} {"train_loss": -41.44240951538086, "global_step": 225913, "epoch": 1867} {"train_loss": -41.64675521850586, "global_step": 225914, "epoch": 1867} {"train_loss": -40.50568389892578, "global_step": 225915, "epoch": 1867} {"train_loss": -41.40273666381836, "global_step": 225916, "epoch": 1867} {"train_loss": -40.55575180053711, "global_step": 225917, "epoch": 1867} {"train_loss": -41.669795989990234, "global_step": 225918, "epoch": 1867} {"train_loss": -41.88357162475586, "global_step": 225919, "epoch": 1867} {"train_loss": -41.03416061401367, "global_step": 225920, "epoch": 1867} {"train_loss": -41.44927978515625, "global_step": 225921, "epoch": 1867} {"train_loss": -41.212120056152344, "global_step": 225922, "epoch": 1867} {"train_loss": -41.32217025756836, "global_step": 225923, "epoch": 1867} {"train_loss": -41.686824798583984, "global_step": 225924, "epoch": 1867} {"train_loss": -41.973209381103516, "global_step": 225925, "epoch": 1867} {"train_loss": -42.097747802734375, "global_step": 225926, "epoch": 1867} {"train_loss": -40.8537712097168, "global_step": 225927, "epoch": 1867} {"train_loss": -41.12005615234375, "global_step": 225928, "epoch": 1867} {"train_loss": -33.67338180541992, "global_step": 225929, "epoch": 1867} {"train_loss": -39.97813415527344, "global_step": 225930, "epoch": 1867} {"train_loss": -40.251991271972656, "global_step": 225931, "epoch": 1867} {"train_loss": -40.9918212890625, "global_step": 225932, "epoch": 1867} {"train_loss": -39.061256408691406, "global_step": 225933, "epoch": 1867} {"train_loss": -40.86025619506836, "global_step": 225934, "epoch": 1867} {"train_loss": -42.013938903808594, "global_step": 225935, "epoch": 1867} {"train_loss": -39.906517028808594, "global_step": 225936, "epoch": 1867} {"train_loss": -41.06943893432617, "global_step": 225937, "epoch": 1867} {"train_loss": -41.368228912353516, "global_step": 225938, "epoch": 1867} {"train_loss": -41.36042404174805, "global_step": 225939, "epoch": 1867} {"train_loss": -41.1749382019043, "global_step": 225940, "epoch": 1867} {"train_loss": -40.65700912475586, "global_step": 225941, "epoch": 1867} {"train_loss": -40.419429779052734, "global_step": 225942, "epoch": 1867} {"train_loss": -41.57503890991211, "global_step": 225943, "epoch": 1867} {"train_loss": -36.23846435546875, "global_step": 225944, "epoch": 1867} {"train_loss": -40.6200065612793, "global_step": 225945, "epoch": 1867} {"train_loss": -41.665679931640625, "global_step": 225946, "epoch": 1867} {"train_loss": -41.528446197509766, "global_step": 225947, "epoch": 1867} {"train_loss": -42.108028411865234, "global_step": 225948, "epoch": 1867} {"train_loss": -40.703792572021484, "global_step": 225949, "epoch": 1867} {"train_loss": -42.16301345825195, "global_step": 225950, "epoch": 1867} {"train_loss": -40.927242279052734, "global_step": 225951, "epoch": 1867} {"train_loss": -41.68317794799805, "global_step": 225952, "epoch": 1867} {"train_loss": -40.47279739379883, "global_step": 225953, "epoch": 1867} {"train_loss": -40.7150993347168, "global_step": 225954, "epoch": 1867} {"train_loss": -39.20703887939453, "global_step": 225955, "epoch": 1867} {"train_loss": -39.94002151489258, "global_step": 225956, "epoch": 1867} {"train_loss": -40.78220748901367, "global_step": 225957, "epoch": 1867} {"train_loss": -34.33218765258789, "global_step": 225958, "epoch": 1867} {"train_loss": -37.82509994506836, "global_step": 225959, "epoch": 1867} {"train_loss": -41.44546127319336, "global_step": 225960, "epoch": 1867} {"train_loss": -41.7050895690918, "global_step": 225961, "epoch": 1867} {"train_loss": -40.57123947143555, "global_step": 225962, "epoch": 1867} {"train_loss": -39.7108154296875, "global_step": 225963, "epoch": 1867} {"train_loss": -40.36857223510742, "global_step": 225964, "epoch": 1867} {"train_loss": -39.146240234375, "global_step": 225965, "epoch": 1867} {"train_loss": -40.82038116455078, "global_step": 225966, "epoch": 1867} {"train_loss": -39.038082122802734, "global_step": 225967, "epoch": 1867} {"train_loss": -40.618099212646484, "global_step": 225968, "epoch": 1867} {"train_loss": -36.93841552734375, "global_step": 225969, "epoch": 1867} {"train_loss": -36.95003128051758, "global_step": 225970, "epoch": 1867} {"train_loss": -40.307716369628906, "global_step": 225971, "epoch": 1867} {"train_loss": -38.91062545776367, "global_step": 225972, "epoch": 1867} {"train_loss": -40.390193939208984, "global_step": 225973, "epoch": 1867} {"train_loss": -38.29448318481445, "global_step": 225974, "epoch": 1867} {"train_loss": -32.585689544677734, "global_step": 225975, "epoch": 1867} {"train_loss": -36.11275863647461, "global_step": 225976, "epoch": 1867} {"train_loss": -37.93888473510742, "global_step": 225977, "epoch": 1867} {"train_loss": -37.069915771484375, "global_step": 225978, "epoch": 1867} {"train_loss": -30.884387969970703, "global_step": 225979, "epoch": 1867} {"train_loss": -35.32185745239258, "global_step": 225980, "epoch": 1867} {"train_loss": -35.40006637573242, "global_step": 225981, "epoch": 1867} {"train_loss": -35.4119987487793, "global_step": 225982, "epoch": 1867} {"train_loss": -33.21220779418945, "global_step": 225983, "epoch": 1867} {"train_loss": -35.14026641845703, "global_step": 225984, "epoch": 1867} {"train_loss": -6.95202112197876, "global_step": 225985, "epoch": 1867} {"train_loss": -27.676095962524414, "global_step": 225986, "epoch": 1867} {"train_loss": -33.25117111206055, "global_step": 225987, "epoch": 1867} {"train_loss": -35.25239181518555, "global_step": 225988, "epoch": 1867} {"train_loss": -28.864648818969727, "global_step": 225989, "epoch": 1867} {"train_loss": -33.640838623046875, "global_step": 225990, "epoch": 1867} {"train_loss": -30.526824951171875, "global_step": 225991, "epoch": 1867} {"train_loss": -32.24933624267578, "global_step": 225992, "epoch": 1867} {"train_loss": -17.42592430114746, "global_step": 225993, "epoch": 1867} {"train_loss": -32.80219268798828, "global_step": 225994, "epoch": 1867} {"train_loss": -26.137189865112305, "global_step": 225995, "epoch": 1867} {"train_loss": -32.348453521728516, "global_step": 225996, "epoch": 1867} {"train_loss": -32.739418029785156, "global_step": 225997, "epoch": 1867} {"train_loss": -32.23981857299805, "global_step": 225998, "epoch": 1867} {"train_loss": -35.099151611328125, "global_step": 225999, "epoch": 1867} {"train_loss": -34.190372467041016, "global_step": 226000, "epoch": 1867} {"train_loss": -36.20403289794922, "global_step": 226001, "epoch": 1867} {"train_loss": -35.72943115234375, "global_step": 226002, "epoch": 1867} {"train_loss": -36.07754898071289, "global_step": 226003, "epoch": 1867} {"train_loss": -36.26377487182617, "global_step": 226004, "epoch": 1867} {"train_loss": -32.11436080932617, "global_step": 226005, "epoch": 1867} {"train_loss": -32.91856384277344, "global_step": 226006, "epoch": 1867} {"train_loss": -29.630462646484375, "global_step": 226007, "epoch": 1867} {"train_loss": -36.31545639038086, "global_step": 226008, "epoch": 1867} {"train_loss": -35.895591735839844, "global_step": 226009, "epoch": 1867} {"train_loss": -37.46148681640625, "global_step": 226010, "epoch": 1867} {"train_loss": -37.54624557495117, "global_step": 226011, "epoch": 1867} {"train_loss": -36.6867790222168, "global_step": 226012, "epoch": 1867} {"train_loss": -37.03754425048828, "global_step": 226013, "epoch": 1867} {"train_loss": -37.39313888549805, "global_step": 226014, "epoch": 1867} {"train_loss": -35.84589767456055, "global_step": 226015, "epoch": 1867} {"train_loss": -37.047969818115234, "global_step": 226016, "epoch": 1867} {"train_loss": -37.142330169677734, "global_step": 226017, "epoch": 1867} {"train_loss": -35.0980224609375, "global_step": 226018, "epoch": 1867} {"train_loss": -37.83978271484375, "global_step": 226019, "epoch": 1867} {"train_loss": -37.527015686035156, "global_step": 226020, "epoch": 1867} {"train_loss": -37.21604537963867, "global_step": 226021, "epoch": 1867} {"train_loss": -38.2431755065918, "global_step": 226022, "epoch": 1867} {"train_loss": -37.64240646362305, "global_step": 226023, "epoch": 1867} {"train_loss": -36.08087921142578, "global_step": 226024, "epoch": 1867} {"train_loss": -38.49088668823242, "global_step": 226025, "epoch": 1867} {"train_loss": -37.33413314819336, "global_step": 226026, "epoch": 1867} {"train_loss": -37.606477331524054, "global_step": 226027, "epoch": 1867, "val_loss": 2616693.75} {"train_loss": -37.20407485961914, "global_step": 226028, "epoch": 1868} {"train_loss": -38.0654296875, "global_step": 226029, "epoch": 1868} {"train_loss": -38.271419525146484, "global_step": 226030, "epoch": 1868} {"train_loss": -37.51913833618164, "global_step": 226031, "epoch": 1868} {"train_loss": -37.706966400146484, "global_step": 226032, "epoch": 1868} {"train_loss": -38.34553909301758, "global_step": 226033, "epoch": 1868} {"train_loss": -38.24783706665039, "global_step": 226034, "epoch": 1868} {"train_loss": -38.27920913696289, "global_step": 226035, "epoch": 1868} {"train_loss": -37.940773010253906, "global_step": 226036, "epoch": 1868} {"train_loss": -38.32638168334961, "global_step": 226037, "epoch": 1868} {"train_loss": -38.004913330078125, "global_step": 226038, "epoch": 1868} {"train_loss": -38.7137451171875, "global_step": 226039, "epoch": 1868} {"train_loss": -37.50440216064453, "global_step": 226040, "epoch": 1868} {"train_loss": -37.88459396362305, "global_step": 226041, "epoch": 1868} {"train_loss": -38.013275146484375, "global_step": 226042, "epoch": 1868} {"train_loss": -38.85567855834961, "global_step": 226043, "epoch": 1868} {"train_loss": -38.92686080932617, "global_step": 226044, "epoch": 1868} {"train_loss": -38.88732147216797, "global_step": 226045, "epoch": 1868} {"train_loss": -39.005985260009766, "global_step": 226046, "epoch": 1868} {"train_loss": -38.66329574584961, "global_step": 226047, "epoch": 1868} {"train_loss": -39.43909454345703, "global_step": 226048, "epoch": 1868} {"train_loss": -39.071380615234375, "global_step": 226049, "epoch": 1868} {"train_loss": -39.52513885498047, "global_step": 226050, "epoch": 1868} {"train_loss": -39.29389190673828, "global_step": 226051, "epoch": 1868} {"train_loss": -39.71017837524414, "global_step": 226052, "epoch": 1868} {"train_loss": -39.29121398925781, "global_step": 226053, "epoch": 1868} {"train_loss": -37.13551712036133, "global_step": 226054, "epoch": 1868} {"train_loss": -38.953887939453125, "global_step": 226055, "epoch": 1868} {"train_loss": -39.31589889526367, "global_step": 226056, "epoch": 1868} {"train_loss": -39.827980041503906, "global_step": 226057, "epoch": 1868} {"train_loss": -39.3143424987793, "global_step": 226058, "epoch": 1868} {"train_loss": -38.82261276245117, "global_step": 226059, "epoch": 1868} {"train_loss": -39.45398712158203, "global_step": 226060, "epoch": 1868} {"train_loss": -39.19057846069336, "global_step": 226061, "epoch": 1868} {"train_loss": -39.60374069213867, "global_step": 226062, "epoch": 1868} {"train_loss": -39.42168045043945, "global_step": 226063, "epoch": 1868} {"train_loss": -39.94301986694336, "global_step": 226064, "epoch": 1868} {"train_loss": -39.57805633544922, "global_step": 226065, "epoch": 1868} {"train_loss": -39.90833282470703, "global_step": 226066, "epoch": 1868} {"train_loss": -39.56916427612305, "global_step": 226067, "epoch": 1868} {"train_loss": -39.22502517700195, "global_step": 226068, "epoch": 1868} {"train_loss": -40.22793197631836, "global_step": 226069, "epoch": 1868} {"train_loss": -40.226898193359375, "global_step": 226070, "epoch": 1868} {"train_loss": -40.319580078125, "global_step": 226071, "epoch": 1868} {"train_loss": -39.984397888183594, "global_step": 226072, "epoch": 1868} {"train_loss": -40.565006256103516, "global_step": 226073, "epoch": 1868} {"train_loss": -40.55870056152344, "global_step": 226074, "epoch": 1868} {"train_loss": -39.13302230834961, "global_step": 226075, "epoch": 1868} {"train_loss": -39.976654052734375, "global_step": 226076, "epoch": 1868} {"train_loss": -39.001625061035156, "global_step": 226077, "epoch": 1868} {"train_loss": -39.73347091674805, "global_step": 226078, "epoch": 1868} {"train_loss": -40.286312103271484, "global_step": 226079, "epoch": 1868} {"train_loss": -40.09452819824219, "global_step": 226080, "epoch": 1868} {"train_loss": -40.19694137573242, "global_step": 226081, "epoch": 1868} {"train_loss": -39.799537658691406, "global_step": 226082, "epoch": 1868} {"train_loss": -39.82451248168945, "global_step": 226083, "epoch": 1868} {"train_loss": -40.1179084777832, "global_step": 226084, "epoch": 1868} {"train_loss": -40.75376892089844, "global_step": 226085, "epoch": 1868} {"train_loss": -40.824886322021484, "global_step": 226086, "epoch": 1868} {"train_loss": -39.683082580566406, "global_step": 226087, "epoch": 1868} {"train_loss": -40.43332290649414, "global_step": 226088, "epoch": 1868} {"train_loss": -40.74869155883789, "global_step": 226089, "epoch": 1868} {"train_loss": -41.16144561767578, "global_step": 226090, "epoch": 1868} {"train_loss": -40.1488037109375, "global_step": 226091, "epoch": 1868} {"train_loss": -40.778072357177734, "global_step": 226092, "epoch": 1868} {"train_loss": -39.894161224365234, "global_step": 226093, "epoch": 1868} {"train_loss": -39.631587982177734, "global_step": 226094, "epoch": 1868} {"train_loss": -40.90089797973633, "global_step": 226095, "epoch": 1868} {"train_loss": -40.54329299926758, "global_step": 226096, "epoch": 1868} {"train_loss": -40.4051513671875, "global_step": 226097, "epoch": 1868} {"train_loss": -40.403987884521484, "global_step": 226098, "epoch": 1868} {"train_loss": -40.00046920776367, "global_step": 226099, "epoch": 1868} {"train_loss": -41.353111267089844, "global_step": 226100, "epoch": 1868} {"train_loss": -41.296546936035156, "global_step": 226101, "epoch": 1868} {"train_loss": -41.01210403442383, "global_step": 226102, "epoch": 1868} {"train_loss": -41.21756362915039, "global_step": 226103, "epoch": 1868} {"train_loss": -41.00436019897461, "global_step": 226104, "epoch": 1868} {"train_loss": -39.85995101928711, "global_step": 226105, "epoch": 1868} {"train_loss": -40.854366302490234, "global_step": 226106, "epoch": 1868} {"train_loss": -41.426021575927734, "global_step": 226107, "epoch": 1868} {"train_loss": -41.37907028198242, "global_step": 226108, "epoch": 1868} {"train_loss": -40.68357467651367, "global_step": 226109, "epoch": 1868} {"train_loss": -41.09143829345703, "global_step": 226110, "epoch": 1868} {"train_loss": -40.68166732788086, "global_step": 226111, "epoch": 1868} {"train_loss": -41.89571762084961, "global_step": 226112, "epoch": 1868} {"train_loss": -40.99951171875, "global_step": 226113, "epoch": 1868} {"train_loss": -41.769935607910156, "global_step": 226114, "epoch": 1868} {"train_loss": -41.24656295776367, "global_step": 226115, "epoch": 1868} {"train_loss": -41.2901496887207, "global_step": 226116, "epoch": 1868} {"train_loss": -41.07407760620117, "global_step": 226117, "epoch": 1868} {"train_loss": -41.56759262084961, "global_step": 226118, "epoch": 1868} {"train_loss": -41.6158561706543, "global_step": 226119, "epoch": 1868} {"train_loss": -41.5400390625, "global_step": 226120, "epoch": 1868} {"train_loss": -40.981319427490234, "global_step": 226121, "epoch": 1868} {"train_loss": -41.36491012573242, "global_step": 226122, "epoch": 1868} {"train_loss": -41.72789001464844, "global_step": 226123, "epoch": 1868} {"train_loss": -41.733882904052734, "global_step": 226124, "epoch": 1868} {"train_loss": -40.69680404663086, "global_step": 226125, "epoch": 1868} {"train_loss": -41.00959396362305, "global_step": 226126, "epoch": 1868} {"train_loss": -41.24086380004883, "global_step": 226127, "epoch": 1868} {"train_loss": -41.4424934387207, "global_step": 226128, "epoch": 1868} {"train_loss": -41.568782806396484, "global_step": 226129, "epoch": 1868} {"train_loss": -41.49229049682617, "global_step": 226130, "epoch": 1868} {"train_loss": -40.75641632080078, "global_step": 226131, "epoch": 1868} {"train_loss": -41.15395736694336, "global_step": 226132, "epoch": 1868} {"train_loss": -41.059326171875, "global_step": 226133, "epoch": 1868} {"train_loss": -41.30019760131836, "global_step": 226134, "epoch": 1868} {"train_loss": -41.19561767578125, "global_step": 226135, "epoch": 1868} {"train_loss": -41.1829833984375, "global_step": 226136, "epoch": 1868} {"train_loss": -40.92464828491211, "global_step": 226137, "epoch": 1868} {"train_loss": -41.69470977783203, "global_step": 226138, "epoch": 1868} {"train_loss": -41.249088287353516, "global_step": 226139, "epoch": 1868} {"train_loss": -41.86187744140625, "global_step": 226140, "epoch": 1868} {"train_loss": -41.71438217163086, "global_step": 226141, "epoch": 1868} {"train_loss": -41.6807975769043, "global_step": 226142, "epoch": 1868} {"train_loss": -41.8477668762207, "global_step": 226143, "epoch": 1868} {"train_loss": -41.780059814453125, "global_step": 226144, "epoch": 1868} {"train_loss": -41.2598991394043, "global_step": 226145, "epoch": 1868} {"train_loss": -41.63939666748047, "global_step": 226146, "epoch": 1868} {"train_loss": -41.73073959350586, "global_step": 226147, "epoch": 1868} {"train_loss": -40.1706129026807, "global_step": 226148, "epoch": 1868, "val_loss": 2585885.75} {"train_loss": -41.509883880615234, "global_step": 226149, "epoch": 1869} {"train_loss": -41.7171516418457, "global_step": 226150, "epoch": 1869} {"train_loss": -40.96023178100586, "global_step": 226151, "epoch": 1869} {"train_loss": -40.66939163208008, "global_step": 226152, "epoch": 1869} {"train_loss": -41.46600341796875, "global_step": 226153, "epoch": 1869} {"train_loss": -41.70743179321289, "global_step": 226154, "epoch": 1869} {"train_loss": -42.056617736816406, "global_step": 226155, "epoch": 1869} {"train_loss": -41.62667465209961, "global_step": 226156, "epoch": 1869} {"train_loss": -41.95436096191406, "global_step": 226157, "epoch": 1869} {"train_loss": -41.77424240112305, "global_step": 226158, "epoch": 1869} {"train_loss": -41.8363037109375, "global_step": 226159, "epoch": 1869} {"train_loss": -42.29768753051758, "global_step": 226160, "epoch": 1869} {"train_loss": -41.76119613647461, "global_step": 226161, "epoch": 1869} {"train_loss": -41.98450469970703, "global_step": 226162, "epoch": 1869} {"train_loss": -42.31269073486328, "global_step": 226163, "epoch": 1869} {"train_loss": -41.820655822753906, "global_step": 226164, "epoch": 1869} {"train_loss": -42.328765869140625, "global_step": 226165, "epoch": 1869} {"train_loss": -42.06272888183594, "global_step": 226166, "epoch": 1869} {"train_loss": -42.07915115356445, "global_step": 226167, "epoch": 1869} {"train_loss": -41.363555908203125, "global_step": 226168, "epoch": 1869} {"train_loss": -41.31476974487305, "global_step": 226169, "epoch": 1869} {"train_loss": -41.08051300048828, "global_step": 226170, "epoch": 1869} {"train_loss": -40.68569564819336, "global_step": 226171, "epoch": 1869} {"train_loss": -40.700653076171875, "global_step": 226172, "epoch": 1869} {"train_loss": -39.4775390625, "global_step": 226173, "epoch": 1869} {"train_loss": -38.22261047363281, "global_step": 226174, "epoch": 1869} {"train_loss": -37.865291595458984, "global_step": 226175, "epoch": 1869} {"train_loss": -40.47135925292969, "global_step": 226176, "epoch": 1869} {"train_loss": -41.852027893066406, "global_step": 226177, "epoch": 1869} {"train_loss": -40.213111877441406, "global_step": 226178, "epoch": 1869} {"train_loss": -37.2691764831543, "global_step": 226179, "epoch": 1869} {"train_loss": -37.38801193237305, "global_step": 226180, "epoch": 1869} {"train_loss": -39.8373908996582, "global_step": 226181, "epoch": 1869} {"train_loss": -41.60715103149414, "global_step": 226182, "epoch": 1869} {"train_loss": -41.269081115722656, "global_step": 226183, "epoch": 1869} {"train_loss": -39.50332260131836, "global_step": 226184, "epoch": 1869} {"train_loss": -40.763763427734375, "global_step": 226185, "epoch": 1869} {"train_loss": -40.54912185668945, "global_step": 226186, "epoch": 1869} {"train_loss": -40.844295501708984, "global_step": 226187, "epoch": 1869} {"train_loss": -40.00204849243164, "global_step": 226188, "epoch": 1869} {"train_loss": -40.22443771362305, "global_step": 226189, "epoch": 1869} {"train_loss": -41.44791793823242, "global_step": 226190, "epoch": 1869} {"train_loss": -40.69730758666992, "global_step": 226191, "epoch": 1869} {"train_loss": -40.52352523803711, "global_step": 226192, "epoch": 1869} {"train_loss": -40.66392517089844, "global_step": 226193, "epoch": 1869} {"train_loss": -41.356903076171875, "global_step": 226194, "epoch": 1869} {"train_loss": -41.61046600341797, "global_step": 226195, "epoch": 1869} {"train_loss": -40.99835968017578, "global_step": 226196, "epoch": 1869} {"train_loss": -41.42585754394531, "global_step": 226197, "epoch": 1869} {"train_loss": -41.63187789916992, "global_step": 226198, "epoch": 1869} {"train_loss": -42.076229095458984, "global_step": 226199, "epoch": 1869} {"train_loss": -42.13214874267578, "global_step": 226200, "epoch": 1869} {"train_loss": -41.34488296508789, "global_step": 226201, "epoch": 1869} {"train_loss": -41.898902893066406, "global_step": 226202, "epoch": 1869} {"train_loss": -42.191627502441406, "global_step": 226203, "epoch": 1869} {"train_loss": -42.01877975463867, "global_step": 226204, "epoch": 1869} {"train_loss": -42.15277862548828, "global_step": 226205, "epoch": 1869} {"train_loss": -40.88233184814453, "global_step": 226206, "epoch": 1869} {"train_loss": -41.88468551635742, "global_step": 226207, "epoch": 1869} {"train_loss": -41.91995620727539, "global_step": 226208, "epoch": 1869} {"train_loss": -41.487178802490234, "global_step": 226209, "epoch": 1869} {"train_loss": -42.12561798095703, "global_step": 226210, "epoch": 1869} {"train_loss": -41.4267692565918, "global_step": 226211, "epoch": 1869} {"train_loss": -41.980098724365234, "global_step": 226212, "epoch": 1869} {"train_loss": -41.37479782104492, "global_step": 226213, "epoch": 1869} {"train_loss": -41.649024963378906, "global_step": 226214, "epoch": 1869} {"train_loss": -40.97990798950195, "global_step": 226215, "epoch": 1869} {"train_loss": -41.93328094482422, "global_step": 226216, "epoch": 1869} {"train_loss": -41.67822265625, "global_step": 226217, "epoch": 1869} {"train_loss": -42.04164505004883, "global_step": 226218, "epoch": 1869} {"train_loss": -41.590667724609375, "global_step": 226219, "epoch": 1869} {"train_loss": -41.89219284057617, "global_step": 226220, "epoch": 1869} {"train_loss": -41.76109313964844, "global_step": 226221, "epoch": 1869} {"train_loss": -42.12411117553711, "global_step": 226222, "epoch": 1869} {"train_loss": -41.98794174194336, "global_step": 226223, "epoch": 1869} {"train_loss": -40.717445373535156, "global_step": 226224, "epoch": 1869} {"train_loss": -42.5071907043457, "global_step": 226225, "epoch": 1869} {"train_loss": -41.68574523925781, "global_step": 226226, "epoch": 1869} {"train_loss": -42.243865966796875, "global_step": 226227, "epoch": 1869} {"train_loss": -41.80621337890625, "global_step": 226228, "epoch": 1869} {"train_loss": -42.25856399536133, "global_step": 226229, "epoch": 1869} {"train_loss": -41.68171691894531, "global_step": 226230, "epoch": 1869} {"train_loss": -39.134639739990234, "global_step": 226231, "epoch": 1869} {"train_loss": -41.094520568847656, "global_step": 226232, "epoch": 1869} {"train_loss": -41.452022552490234, "global_step": 226233, "epoch": 1869} {"train_loss": -41.23501205444336, "global_step": 226234, "epoch": 1869} {"train_loss": -41.82725524902344, "global_step": 226235, "epoch": 1869} {"train_loss": -41.41858673095703, "global_step": 226236, "epoch": 1869} {"train_loss": -42.01678466796875, "global_step": 226237, "epoch": 1869} {"train_loss": -41.9398193359375, "global_step": 226238, "epoch": 1869} {"train_loss": -41.55301284790039, "global_step": 226239, "epoch": 1869} {"train_loss": -41.32252883911133, "global_step": 226240, "epoch": 1869} {"train_loss": -41.82822799682617, "global_step": 226241, "epoch": 1869} {"train_loss": -42.19248580932617, "global_step": 226242, "epoch": 1869} {"train_loss": -42.02262496948242, "global_step": 226243, "epoch": 1869} {"train_loss": -41.68777084350586, "global_step": 226244, "epoch": 1869} {"train_loss": -42.01699447631836, "global_step": 226245, "epoch": 1869} {"train_loss": -41.95576095581055, "global_step": 226246, "epoch": 1869} {"train_loss": -38.95018768310547, "global_step": 226247, "epoch": 1869} {"train_loss": -41.679222106933594, "global_step": 226248, "epoch": 1869} {"train_loss": -41.84757614135742, "global_step": 226249, "epoch": 1869} {"train_loss": -40.396175384521484, "global_step": 226250, "epoch": 1869} {"train_loss": -40.548397064208984, "global_step": 226251, "epoch": 1869} {"train_loss": -40.27614212036133, "global_step": 226252, "epoch": 1869} {"train_loss": -42.24131393432617, "global_step": 226253, "epoch": 1869} {"train_loss": -41.805572509765625, "global_step": 226254, "epoch": 1869} {"train_loss": -40.89120101928711, "global_step": 226255, "epoch": 1869} {"train_loss": -41.80363845825195, "global_step": 226256, "epoch": 1869} {"train_loss": -41.749977111816406, "global_step": 226257, "epoch": 1869} {"train_loss": -41.658607482910156, "global_step": 226258, "epoch": 1869} {"train_loss": -42.11566925048828, "global_step": 226259, "epoch": 1869} {"train_loss": -42.15831756591797, "global_step": 226260, "epoch": 1869} {"train_loss": -41.61286544799805, "global_step": 226261, "epoch": 1869} {"train_loss": -35.79655456542969, "global_step": 226262, "epoch": 1869} {"train_loss": -41.59048080444336, "global_step": 226263, "epoch": 1869} {"train_loss": -41.11359786987305, "global_step": 226264, "epoch": 1869} {"train_loss": -42.42111587524414, "global_step": 226265, "epoch": 1869} {"train_loss": -41.27003860473633, "global_step": 226266, "epoch": 1869} {"train_loss": -40.9102897644043, "global_step": 226267, "epoch": 1869} {"train_loss": -42.0709228515625, "global_step": 226268, "epoch": 1869} {"train_loss": -41.25628554919535, "global_step": 226269, "epoch": 1869, "val_loss": 2602083.75} {"train_loss": -41.16761016845703, "global_step": 226270, "epoch": 1870} {"train_loss": -41.10682678222656, "global_step": 226271, "epoch": 1870} {"train_loss": -40.08565139770508, "global_step": 226272, "epoch": 1870} {"train_loss": -41.8834342956543, "global_step": 226273, "epoch": 1870} {"train_loss": -41.18959045410156, "global_step": 226274, "epoch": 1870} {"train_loss": -40.93726348876953, "global_step": 226275, "epoch": 1870} {"train_loss": -41.01710510253906, "global_step": 226276, "epoch": 1870} {"train_loss": -41.04753494262695, "global_step": 226277, "epoch": 1870} {"train_loss": -41.9346923828125, "global_step": 226278, "epoch": 1870} {"train_loss": -40.68550109863281, "global_step": 226279, "epoch": 1870} {"train_loss": -39.997432708740234, "global_step": 226280, "epoch": 1870} {"train_loss": -41.7070198059082, "global_step": 226281, "epoch": 1870} {"train_loss": -39.825462341308594, "global_step": 226282, "epoch": 1870} {"train_loss": -41.34992980957031, "global_step": 226283, "epoch": 1870} {"train_loss": -41.65446472167969, "global_step": 226284, "epoch": 1870} {"train_loss": -40.79157638549805, "global_step": 226285, "epoch": 1870} {"train_loss": -41.01436996459961, "global_step": 226286, "epoch": 1870} {"train_loss": -41.97243881225586, "global_step": 226287, "epoch": 1870} {"train_loss": -40.5456428527832, "global_step": 226288, "epoch": 1870} {"train_loss": -40.43611526489258, "global_step": 226289, "epoch": 1870} {"train_loss": -41.12306594848633, "global_step": 226290, "epoch": 1870} {"train_loss": -39.062355041503906, "global_step": 226291, "epoch": 1870} {"train_loss": -40.63027572631836, "global_step": 226292, "epoch": 1870} {"train_loss": -40.09749984741211, "global_step": 226293, "epoch": 1870} {"train_loss": -39.362754821777344, "global_step": 226294, "epoch": 1870} {"train_loss": -41.032875061035156, "global_step": 226295, "epoch": 1870} {"train_loss": -39.71638488769531, "global_step": 226296, "epoch": 1870} {"train_loss": -41.12582015991211, "global_step": 226297, "epoch": 1870} {"train_loss": -41.22570037841797, "global_step": 226298, "epoch": 1870} {"train_loss": -41.00745391845703, "global_step": 226299, "epoch": 1870} {"train_loss": -39.8301887512207, "global_step": 226300, "epoch": 1870} {"train_loss": -41.2755126953125, "global_step": 226301, "epoch": 1870} {"train_loss": -40.607662200927734, "global_step": 226302, "epoch": 1870} {"train_loss": -40.965003967285156, "global_step": 226303, "epoch": 1870} {"train_loss": -39.5891227722168, "global_step": 226304, "epoch": 1870} {"train_loss": -41.746742248535156, "global_step": 226305, "epoch": 1870} {"train_loss": -40.7971305847168, "global_step": 226306, "epoch": 1870} {"train_loss": -41.018455505371094, "global_step": 226307, "epoch": 1870} {"train_loss": -41.2224006652832, "global_step": 226308, "epoch": 1870} {"train_loss": -40.79069519042969, "global_step": 226309, "epoch": 1870} {"train_loss": -40.913246154785156, "global_step": 226310, "epoch": 1870} {"train_loss": -41.71167755126953, "global_step": 226311, "epoch": 1870} {"train_loss": -39.851741790771484, "global_step": 226312, "epoch": 1870} {"train_loss": -39.939361572265625, "global_step": 226313, "epoch": 1870} {"train_loss": -42.10018539428711, "global_step": 226314, "epoch": 1870} {"train_loss": -40.479225158691406, "global_step": 226315, "epoch": 1870} {"train_loss": -40.20549774169922, "global_step": 226316, "epoch": 1870} {"train_loss": -41.616695404052734, "global_step": 226317, "epoch": 1870} {"train_loss": -39.00692367553711, "global_step": 226318, "epoch": 1870} {"train_loss": -38.75428009033203, "global_step": 226319, "epoch": 1870} {"train_loss": -41.51676940917969, "global_step": 226320, "epoch": 1870} {"train_loss": -39.954559326171875, "global_step": 226321, "epoch": 1870} {"train_loss": -40.251644134521484, "global_step": 226322, "epoch": 1870} {"train_loss": -41.62199020385742, "global_step": 226323, "epoch": 1870} {"train_loss": -37.52057647705078, "global_step": 226324, "epoch": 1870} {"train_loss": -39.4223747253418, "global_step": 226325, "epoch": 1870} {"train_loss": -40.93207550048828, "global_step": 226326, "epoch": 1870} {"train_loss": -38.52163314819336, "global_step": 226327, "epoch": 1870} {"train_loss": -41.700035095214844, "global_step": 226328, "epoch": 1870} {"train_loss": -38.89435958862305, "global_step": 226329, "epoch": 1870} {"train_loss": -40.54367446899414, "global_step": 226330, "epoch": 1870} {"train_loss": -40.8620719909668, "global_step": 226331, "epoch": 1870} {"train_loss": -41.06410598754883, "global_step": 226332, "epoch": 1870} {"train_loss": -41.60697937011719, "global_step": 226333, "epoch": 1870} {"train_loss": -41.048011779785156, "global_step": 226334, "epoch": 1870} {"train_loss": -41.82765579223633, "global_step": 226335, "epoch": 1870} {"train_loss": -41.90511703491211, "global_step": 226336, "epoch": 1870} {"train_loss": -41.59442138671875, "global_step": 226337, "epoch": 1870} {"train_loss": -42.38045883178711, "global_step": 226338, "epoch": 1870} {"train_loss": -42.05576705932617, "global_step": 226339, "epoch": 1870} {"train_loss": -42.11928939819336, "global_step": 226340, "epoch": 1870} {"train_loss": -41.31037521362305, "global_step": 226341, "epoch": 1870} {"train_loss": -42.24058151245117, "global_step": 226342, "epoch": 1870} {"train_loss": -42.25372314453125, "global_step": 226343, "epoch": 1870} {"train_loss": -42.43462371826172, "global_step": 226344, "epoch": 1870} {"train_loss": -41.73916244506836, "global_step": 226345, "epoch": 1870} {"train_loss": -42.39992904663086, "global_step": 226346, "epoch": 1870} {"train_loss": -42.04909896850586, "global_step": 226347, "epoch": 1870} {"train_loss": -41.62333679199219, "global_step": 226348, "epoch": 1870} {"train_loss": -42.34088134765625, "global_step": 226349, "epoch": 1870} {"train_loss": -41.77576446533203, "global_step": 226350, "epoch": 1870} {"train_loss": -42.192562103271484, "global_step": 226351, "epoch": 1870} {"train_loss": -42.31588363647461, "global_step": 226352, "epoch": 1870} {"train_loss": -42.21137619018555, "global_step": 226353, "epoch": 1870} {"train_loss": -43.0164680480957, "global_step": 226354, "epoch": 1870} {"train_loss": -42.33948516845703, "global_step": 226355, "epoch": 1870} {"train_loss": -42.412410736083984, "global_step": 226356, "epoch": 1870} {"train_loss": -42.53679275512695, "global_step": 226357, "epoch": 1870} {"train_loss": -42.6112060546875, "global_step": 226358, "epoch": 1870} {"train_loss": -42.49868392944336, "global_step": 226359, "epoch": 1870} {"train_loss": -42.50149154663086, "global_step": 226360, "epoch": 1870} {"train_loss": -42.79702377319336, "global_step": 226361, "epoch": 1870} {"train_loss": -42.65708923339844, "global_step": 226362, "epoch": 1870} {"train_loss": -42.54473876953125, "global_step": 226363, "epoch": 1870} {"train_loss": -42.61356735229492, "global_step": 226364, "epoch": 1870} {"train_loss": -42.56238555908203, "global_step": 226365, "epoch": 1870} {"train_loss": -42.84850311279297, "global_step": 226366, "epoch": 1870} {"train_loss": -42.79038619995117, "global_step": 226367, "epoch": 1870} {"train_loss": -42.71067428588867, "global_step": 226368, "epoch": 1870} {"train_loss": -42.878780364990234, "global_step": 226369, "epoch": 1870} {"train_loss": -43.03667068481445, "global_step": 226370, "epoch": 1870} {"train_loss": -42.7390251159668, "global_step": 226371, "epoch": 1870} {"train_loss": -43.0972900390625, "global_step": 226372, "epoch": 1870} {"train_loss": -42.5560302734375, "global_step": 226373, "epoch": 1870} {"train_loss": -42.157283782958984, "global_step": 226374, "epoch": 1870} {"train_loss": -43.2846794128418, "global_step": 226375, "epoch": 1870} {"train_loss": -42.844844818115234, "global_step": 226376, "epoch": 1870} {"train_loss": -43.06550216674805, "global_step": 226377, "epoch": 1870} {"train_loss": -43.04757308959961, "global_step": 226378, "epoch": 1870} {"train_loss": -42.623687744140625, "global_step": 226379, "epoch": 1870} {"train_loss": -43.00148391723633, "global_step": 226380, "epoch": 1870} {"train_loss": -42.847774505615234, "global_step": 226381, "epoch": 1870} {"train_loss": -43.12876510620117, "global_step": 226382, "epoch": 1870} {"train_loss": -43.21562576293945, "global_step": 226383, "epoch": 1870} {"train_loss": -42.69164276123047, "global_step": 226384, "epoch": 1870} {"train_loss": -42.019561767578125, "global_step": 226385, "epoch": 1870} {"train_loss": -42.41370391845703, "global_step": 226386, "epoch": 1870} {"train_loss": -42.22446060180664, "global_step": 226387, "epoch": 1870} {"train_loss": -41.7067756652832, "global_step": 226388, "epoch": 1870} {"train_loss": -42.5255126953125, "global_step": 226389, "epoch": 1870} {"train_loss": -41.484994021329015, "global_step": 226390, "epoch": 1870, "val_loss": 2606138.75} {"train_loss": -42.230133056640625, "global_step": 226391, "epoch": 1871} {"train_loss": -42.2711296081543, "global_step": 226392, "epoch": 1871} {"train_loss": -41.42897415161133, "global_step": 226393, "epoch": 1871} {"train_loss": -39.59865951538086, "global_step": 226394, "epoch": 1871} {"train_loss": -32.24787139892578, "global_step": 226395, "epoch": 1871} {"train_loss": -17.221393585205078, "global_step": 226396, "epoch": 1871} {"train_loss": -10.401389122009277, "global_step": 226397, "epoch": 1871} {"train_loss": -24.841785430908203, "global_step": 226398, "epoch": 1871} {"train_loss": -38.65963363647461, "global_step": 226399, "epoch": 1871} {"train_loss": -14.795187950134277, "global_step": 226400, "epoch": 1871} {"train_loss": -32.295650482177734, "global_step": 226401, "epoch": 1871} {"train_loss": -30.144025802612305, "global_step": 226402, "epoch": 1871} {"train_loss": -27.20912742614746, "global_step": 226403, "epoch": 1871} {"train_loss": -36.28829574584961, "global_step": 226404, "epoch": 1871} {"train_loss": -29.759153366088867, "global_step": 226405, "epoch": 1871} {"train_loss": -35.0565185546875, "global_step": 226406, "epoch": 1871} {"train_loss": -34.69189453125, "global_step": 226407, "epoch": 1871} {"train_loss": -33.2720947265625, "global_step": 226408, "epoch": 1871} {"train_loss": -37.33580780029297, "global_step": 226409, "epoch": 1871} {"train_loss": -34.89472198486328, "global_step": 226410, "epoch": 1871} {"train_loss": -38.45111846923828, "global_step": 226411, "epoch": 1871} {"train_loss": -36.77802658081055, "global_step": 226412, "epoch": 1871} {"train_loss": -37.2639274597168, "global_step": 226413, "epoch": 1871} {"train_loss": -39.536231994628906, "global_step": 226414, "epoch": 1871} {"train_loss": -38.18495559692383, "global_step": 226415, "epoch": 1871} {"train_loss": -38.5049934387207, "global_step": 226416, "epoch": 1871} {"train_loss": -39.731239318847656, "global_step": 226417, "epoch": 1871} {"train_loss": -38.688941955566406, "global_step": 226418, "epoch": 1871} {"train_loss": -38.15849685668945, "global_step": 226419, "epoch": 1871} {"train_loss": -40.32960891723633, "global_step": 226420, "epoch": 1871} {"train_loss": -39.2082633972168, "global_step": 226421, "epoch": 1871} {"train_loss": -39.88658142089844, "global_step": 226422, "epoch": 1871} {"train_loss": -40.812355041503906, "global_step": 226423, "epoch": 1871} {"train_loss": -39.850807189941406, "global_step": 226424, "epoch": 1871} {"train_loss": -40.15044021606445, "global_step": 226425, "epoch": 1871} {"train_loss": -41.404884338378906, "global_step": 226426, "epoch": 1871} {"train_loss": -40.252201080322266, "global_step": 226427, "epoch": 1871} {"train_loss": -40.60554885864258, "global_step": 226428, "epoch": 1871} {"train_loss": -40.819122314453125, "global_step": 226429, "epoch": 1871} {"train_loss": -40.763427734375, "global_step": 226430, "epoch": 1871} {"train_loss": -40.8525276184082, "global_step": 226431, "epoch": 1871} {"train_loss": -41.39472579956055, "global_step": 226432, "epoch": 1871} {"train_loss": -40.96550369262695, "global_step": 226433, "epoch": 1871} {"train_loss": -40.76274490356445, "global_step": 226434, "epoch": 1871} {"train_loss": -40.98553466796875, "global_step": 226435, "epoch": 1871} {"train_loss": -40.910823822021484, "global_step": 226436, "epoch": 1871} {"train_loss": -40.97802734375, "global_step": 226437, "epoch": 1871} {"train_loss": -41.68939208984375, "global_step": 226438, "epoch": 1871} {"train_loss": -41.4022216796875, "global_step": 226439, "epoch": 1871} {"train_loss": -41.20198059082031, "global_step": 226440, "epoch": 1871} {"train_loss": -41.547119140625, "global_step": 226441, "epoch": 1871} {"train_loss": -41.5977783203125, "global_step": 226442, "epoch": 1871} {"train_loss": -41.4015998840332, "global_step": 226443, "epoch": 1871} {"train_loss": -41.64342498779297, "global_step": 226444, "epoch": 1871} {"train_loss": -41.599056243896484, "global_step": 226445, "epoch": 1871} {"train_loss": -41.886592864990234, "global_step": 226446, "epoch": 1871} {"train_loss": -42.03864669799805, "global_step": 226447, "epoch": 1871} {"train_loss": -42.11838912963867, "global_step": 226448, "epoch": 1871} {"train_loss": -41.53074264526367, "global_step": 226449, "epoch": 1871} {"train_loss": -41.80947494506836, "global_step": 226450, "epoch": 1871} {"train_loss": -41.91849899291992, "global_step": 226451, "epoch": 1871} {"train_loss": -41.954715728759766, "global_step": 226452, "epoch": 1871} {"train_loss": -42.26177978515625, "global_step": 226453, "epoch": 1871} {"train_loss": -42.14842987060547, "global_step": 226454, "epoch": 1871} {"train_loss": -42.189632415771484, "global_step": 226455, "epoch": 1871} {"train_loss": -41.9971923828125, "global_step": 226456, "epoch": 1871} {"train_loss": -42.030494689941406, "global_step": 226457, "epoch": 1871} {"train_loss": -41.99660873413086, "global_step": 226458, "epoch": 1871} {"train_loss": -41.59174728393555, "global_step": 226459, "epoch": 1871} {"train_loss": -42.01995849609375, "global_step": 226460, "epoch": 1871} {"train_loss": -42.761505126953125, "global_step": 226461, "epoch": 1871} {"train_loss": -42.25354766845703, "global_step": 226462, "epoch": 1871} {"train_loss": -42.11338806152344, "global_step": 226463, "epoch": 1871} {"train_loss": -42.097049713134766, "global_step": 226464, "epoch": 1871} {"train_loss": -42.64413070678711, "global_step": 226465, "epoch": 1871} {"train_loss": -41.974483489990234, "global_step": 226466, "epoch": 1871} {"train_loss": -42.15958786010742, "global_step": 226467, "epoch": 1871} {"train_loss": -42.54645538330078, "global_step": 226468, "epoch": 1871} {"train_loss": -42.590293884277344, "global_step": 226469, "epoch": 1871} {"train_loss": -42.34084701538086, "global_step": 226470, "epoch": 1871} {"train_loss": -42.535186767578125, "global_step": 226471, "epoch": 1871} {"train_loss": -42.434017181396484, "global_step": 226472, "epoch": 1871} {"train_loss": -42.25943374633789, "global_step": 226473, "epoch": 1871} {"train_loss": -42.39607238769531, "global_step": 226474, "epoch": 1871} {"train_loss": -42.40580749511719, "global_step": 226475, "epoch": 1871} {"train_loss": -42.577083587646484, "global_step": 226476, "epoch": 1871} {"train_loss": -42.075477600097656, "global_step": 226477, "epoch": 1871} {"train_loss": -42.61774444580078, "global_step": 226478, "epoch": 1871} {"train_loss": -42.81134796142578, "global_step": 226479, "epoch": 1871} {"train_loss": -42.394405364990234, "global_step": 226480, "epoch": 1871} {"train_loss": -43.282920837402344, "global_step": 226481, "epoch": 1871} {"train_loss": -42.54030227661133, "global_step": 226482, "epoch": 1871} {"train_loss": -42.85615539550781, "global_step": 226483, "epoch": 1871} {"train_loss": -42.590919494628906, "global_step": 226484, "epoch": 1871} {"train_loss": -42.997982025146484, "global_step": 226485, "epoch": 1871} {"train_loss": -42.63106155395508, "global_step": 226486, "epoch": 1871} {"train_loss": -42.948299407958984, "global_step": 226487, "epoch": 1871} {"train_loss": -42.952762603759766, "global_step": 226488, "epoch": 1871} {"train_loss": -42.39510726928711, "global_step": 226489, "epoch": 1871} {"train_loss": -42.6699104309082, "global_step": 226490, "epoch": 1871} {"train_loss": -43.12042999267578, "global_step": 226491, "epoch": 1871} {"train_loss": -42.80632400512695, "global_step": 226492, "epoch": 1871} {"train_loss": -43.13825607299805, "global_step": 226493, "epoch": 1871} {"train_loss": -42.80293273925781, "global_step": 226494, "epoch": 1871} {"train_loss": -42.69474411010742, "global_step": 226495, "epoch": 1871} {"train_loss": -43.1839714050293, "global_step": 226496, "epoch": 1871} {"train_loss": -42.798866271972656, "global_step": 226497, "epoch": 1871} {"train_loss": -42.89508819580078, "global_step": 226498, "epoch": 1871} {"train_loss": -42.72589111328125, "global_step": 226499, "epoch": 1871} {"train_loss": -43.03612518310547, "global_step": 226500, "epoch": 1871} {"train_loss": -42.56275177001953, "global_step": 226501, "epoch": 1871} {"train_loss": -42.29372024536133, "global_step": 226502, "epoch": 1871} {"train_loss": -42.01365280151367, "global_step": 226503, "epoch": 1871} {"train_loss": -42.58058547973633, "global_step": 226504, "epoch": 1871} {"train_loss": -42.3471794128418, "global_step": 226505, "epoch": 1871} {"train_loss": -42.90199661254883, "global_step": 226506, "epoch": 1871} {"train_loss": -42.513648986816406, "global_step": 226507, "epoch": 1871} {"train_loss": -42.13236618041992, "global_step": 226508, "epoch": 1871} {"train_loss": -42.07481384277344, "global_step": 226509, "epoch": 1871} {"train_loss": -41.96267318725586, "global_step": 226510, "epoch": 1871} {"train_loss": -40.01863013023187, "global_step": 226511, "epoch": 1871, "val_loss": 2580969.25} {"train_loss": -40.79962921142578, "global_step": 226512, "epoch": 1872} {"train_loss": -40.21154022216797, "global_step": 226513, "epoch": 1872} {"train_loss": -39.814002990722656, "global_step": 226514, "epoch": 1872} {"train_loss": -36.18190002441406, "global_step": 226515, "epoch": 1872} {"train_loss": -32.54111862182617, "global_step": 226516, "epoch": 1872} {"train_loss": -34.38612747192383, "global_step": 226517, "epoch": 1872} {"train_loss": -40.43647766113281, "global_step": 226518, "epoch": 1872} {"train_loss": -41.97329330444336, "global_step": 226519, "epoch": 1872} {"train_loss": -38.058773040771484, "global_step": 226520, "epoch": 1872} {"train_loss": -40.88515090942383, "global_step": 226521, "epoch": 1872} {"train_loss": -40.83942794799805, "global_step": 226522, "epoch": 1872} {"train_loss": -35.21133041381836, "global_step": 226523, "epoch": 1872} {"train_loss": -39.416175842285156, "global_step": 226524, "epoch": 1872} {"train_loss": -39.545814514160156, "global_step": 226525, "epoch": 1872} {"train_loss": -39.94621658325195, "global_step": 226526, "epoch": 1872} {"train_loss": -40.88286590576172, "global_step": 226527, "epoch": 1872} {"train_loss": -41.130096435546875, "global_step": 226528, "epoch": 1872} {"train_loss": -41.320716857910156, "global_step": 226529, "epoch": 1872} {"train_loss": -40.6026725769043, "global_step": 226530, "epoch": 1872} {"train_loss": -41.19590377807617, "global_step": 226531, "epoch": 1872} {"train_loss": -40.481964111328125, "global_step": 226532, "epoch": 1872} {"train_loss": -41.484676361083984, "global_step": 226533, "epoch": 1872} {"train_loss": -41.12351608276367, "global_step": 226534, "epoch": 1872} {"train_loss": -40.88718795776367, "global_step": 226535, "epoch": 1872} {"train_loss": -41.42818832397461, "global_step": 226536, "epoch": 1872} {"train_loss": -41.903560638427734, "global_step": 226537, "epoch": 1872} {"train_loss": -41.11800003051758, "global_step": 226538, "epoch": 1872} {"train_loss": -40.90140914916992, "global_step": 226539, "epoch": 1872} {"train_loss": -42.41339111328125, "global_step": 226540, "epoch": 1872} {"train_loss": -41.64057540893555, "global_step": 226541, "epoch": 1872} {"train_loss": -41.35930252075195, "global_step": 226542, "epoch": 1872} {"train_loss": -41.100555419921875, "global_step": 226543, "epoch": 1872} {"train_loss": -42.07633590698242, "global_step": 226544, "epoch": 1872} {"train_loss": -41.054908752441406, "global_step": 226545, "epoch": 1872} {"train_loss": -41.10931396484375, "global_step": 226546, "epoch": 1872} {"train_loss": -42.108428955078125, "global_step": 226547, "epoch": 1872} {"train_loss": -41.15727615356445, "global_step": 226548, "epoch": 1872} {"train_loss": -41.823707580566406, "global_step": 226549, "epoch": 1872} {"train_loss": -41.72896957397461, "global_step": 226550, "epoch": 1872} {"train_loss": -41.3740348815918, "global_step": 226551, "epoch": 1872} {"train_loss": -41.594642639160156, "global_step": 226552, "epoch": 1872} {"train_loss": -41.85422897338867, "global_step": 226553, "epoch": 1872} {"train_loss": -42.36420822143555, "global_step": 226554, "epoch": 1872} {"train_loss": -41.02793884277344, "global_step": 226555, "epoch": 1872} {"train_loss": -42.21446228027344, "global_step": 226556, "epoch": 1872} {"train_loss": -42.227760314941406, "global_step": 226557, "epoch": 1872} {"train_loss": -41.970855712890625, "global_step": 226558, "epoch": 1872} {"train_loss": -42.40354537963867, "global_step": 226559, "epoch": 1872} {"train_loss": -40.81556701660156, "global_step": 226560, "epoch": 1872} {"train_loss": -41.5356559753418, "global_step": 226561, "epoch": 1872} {"train_loss": -41.64558029174805, "global_step": 226562, "epoch": 1872} {"train_loss": -42.39553451538086, "global_step": 226563, "epoch": 1872} {"train_loss": -41.984718322753906, "global_step": 226564, "epoch": 1872} {"train_loss": -41.906185150146484, "global_step": 226565, "epoch": 1872} {"train_loss": -42.262733459472656, "global_step": 226566, "epoch": 1872} {"train_loss": -42.531105041503906, "global_step": 226567, "epoch": 1872} {"train_loss": -42.3766975402832, "global_step": 226568, "epoch": 1872} {"train_loss": -42.17057418823242, "global_step": 226569, "epoch": 1872} {"train_loss": -42.89390182495117, "global_step": 226570, "epoch": 1872} {"train_loss": -42.457271575927734, "global_step": 226571, "epoch": 1872} {"train_loss": -42.47724533081055, "global_step": 226572, "epoch": 1872} {"train_loss": -42.546390533447266, "global_step": 226573, "epoch": 1872} {"train_loss": -42.384765625, "global_step": 226574, "epoch": 1872} {"train_loss": -41.97634506225586, "global_step": 226575, "epoch": 1872} {"train_loss": -42.84589767456055, "global_step": 226576, "epoch": 1872} {"train_loss": -42.34892654418945, "global_step": 226577, "epoch": 1872} {"train_loss": -42.697872161865234, "global_step": 226578, "epoch": 1872} {"train_loss": -42.582801818847656, "global_step": 226579, "epoch": 1872} {"train_loss": -42.724918365478516, "global_step": 226580, "epoch": 1872} {"train_loss": -42.86086654663086, "global_step": 226581, "epoch": 1872} {"train_loss": -42.73188018798828, "global_step": 226582, "epoch": 1872} {"train_loss": -42.538028717041016, "global_step": 226583, "epoch": 1872} {"train_loss": -43.156524658203125, "global_step": 226584, "epoch": 1872} {"train_loss": -43.009639739990234, "global_step": 226585, "epoch": 1872} {"train_loss": -42.844966888427734, "global_step": 226586, "epoch": 1872} {"train_loss": -42.903751373291016, "global_step": 226587, "epoch": 1872} {"train_loss": -43.052223205566406, "global_step": 226588, "epoch": 1872} {"train_loss": -43.14856719970703, "global_step": 226589, "epoch": 1872} {"train_loss": -43.146846771240234, "global_step": 226590, "epoch": 1872} {"train_loss": -42.94224166870117, "global_step": 226591, "epoch": 1872} {"train_loss": -43.453853607177734, "global_step": 226592, "epoch": 1872} {"train_loss": -42.63554763793945, "global_step": 226593, "epoch": 1872} {"train_loss": -42.99215316772461, "global_step": 226594, "epoch": 1872} {"train_loss": -42.35888671875, "global_step": 226595, "epoch": 1872} {"train_loss": -42.59369659423828, "global_step": 226596, "epoch": 1872} {"train_loss": -42.88172149658203, "global_step": 226597, "epoch": 1872} {"train_loss": -43.113006591796875, "global_step": 226598, "epoch": 1872} {"train_loss": -41.779048919677734, "global_step": 226599, "epoch": 1872} {"train_loss": -40.2609748840332, "global_step": 226600, "epoch": 1872} {"train_loss": -40.062068939208984, "global_step": 226601, "epoch": 1872} {"train_loss": -42.64681625366211, "global_step": 226602, "epoch": 1872} {"train_loss": -42.6710319519043, "global_step": 226603, "epoch": 1872} {"train_loss": -41.9497184753418, "global_step": 226604, "epoch": 1872} {"train_loss": -42.48075485229492, "global_step": 226605, "epoch": 1872} {"train_loss": -42.48258590698242, "global_step": 226606, "epoch": 1872} {"train_loss": -42.375038146972656, "global_step": 226607, "epoch": 1872} {"train_loss": -42.037471771240234, "global_step": 226608, "epoch": 1872} {"train_loss": -41.46617889404297, "global_step": 226609, "epoch": 1872} {"train_loss": -41.707313537597656, "global_step": 226610, "epoch": 1872} {"train_loss": -40.833290100097656, "global_step": 226611, "epoch": 1872} {"train_loss": -39.529354095458984, "global_step": 226612, "epoch": 1872} {"train_loss": -39.81184005737305, "global_step": 226613, "epoch": 1872} {"train_loss": -40.618141174316406, "global_step": 226614, "epoch": 1872} {"train_loss": -41.666358947753906, "global_step": 226615, "epoch": 1872} {"train_loss": -41.34678268432617, "global_step": 226616, "epoch": 1872} {"train_loss": -41.96043395996094, "global_step": 226617, "epoch": 1872} {"train_loss": -40.85451126098633, "global_step": 226618, "epoch": 1872} {"train_loss": -40.4205207824707, "global_step": 226619, "epoch": 1872} {"train_loss": -42.74407958984375, "global_step": 226620, "epoch": 1872} {"train_loss": -42.296730041503906, "global_step": 226621, "epoch": 1872} {"train_loss": -41.2239990234375, "global_step": 226622, "epoch": 1872} {"train_loss": -41.0461540222168, "global_step": 226623, "epoch": 1872} {"train_loss": -41.766902923583984, "global_step": 226624, "epoch": 1872} {"train_loss": -42.2696533203125, "global_step": 226625, "epoch": 1872} {"train_loss": -42.06935501098633, "global_step": 226626, "epoch": 1872} {"train_loss": -41.75047302246094, "global_step": 226627, "epoch": 1872} {"train_loss": -42.22060012817383, "global_step": 226628, "epoch": 1872} {"train_loss": -41.31926345825195, "global_step": 226629, "epoch": 1872} {"train_loss": -41.09339141845703, "global_step": 226630, "epoch": 1872} {"train_loss": -41.22105026245117, "global_step": 226631, "epoch": 1872} {"train_loss": -41.48837567163893, "global_step": 226632, "epoch": 1872, "val_loss": 2716884.0} {"train_loss": -40.71656036376953, "global_step": 226633, "epoch": 1873} {"train_loss": -40.891151428222656, "global_step": 226634, "epoch": 1873} {"train_loss": -41.683624267578125, "global_step": 226635, "epoch": 1873} {"train_loss": -41.62421798706055, "global_step": 226636, "epoch": 1873} {"train_loss": -41.63994216918945, "global_step": 226637, "epoch": 1873} {"train_loss": -41.71632766723633, "global_step": 226638, "epoch": 1873} {"train_loss": -41.351173400878906, "global_step": 226639, "epoch": 1873} {"train_loss": -41.13926315307617, "global_step": 226640, "epoch": 1873} {"train_loss": -41.651058197021484, "global_step": 226641, "epoch": 1873} {"train_loss": -40.13173294067383, "global_step": 226642, "epoch": 1873} {"train_loss": -40.48230743408203, "global_step": 226643, "epoch": 1873} {"train_loss": -41.965545654296875, "global_step": 226644, "epoch": 1873} {"train_loss": -41.98213577270508, "global_step": 226645, "epoch": 1873} {"train_loss": -41.471187591552734, "global_step": 226646, "epoch": 1873} {"train_loss": -41.04355239868164, "global_step": 226647, "epoch": 1873} {"train_loss": -42.22539138793945, "global_step": 226648, "epoch": 1873} {"train_loss": -41.3066291809082, "global_step": 226649, "epoch": 1873} {"train_loss": -41.56742858886719, "global_step": 226650, "epoch": 1873} {"train_loss": -41.98637008666992, "global_step": 226651, "epoch": 1873} {"train_loss": -40.21158218383789, "global_step": 226652, "epoch": 1873} {"train_loss": -41.02396774291992, "global_step": 226653, "epoch": 1873} {"train_loss": -41.68593215942383, "global_step": 226654, "epoch": 1873} {"train_loss": -38.35134506225586, "global_step": 226655, "epoch": 1873} {"train_loss": -40.856048583984375, "global_step": 226656, "epoch": 1873} {"train_loss": -41.732337951660156, "global_step": 226657, "epoch": 1873} {"train_loss": -39.96128463745117, "global_step": 226658, "epoch": 1873} {"train_loss": -39.55283737182617, "global_step": 226659, "epoch": 1873} {"train_loss": -41.439208984375, "global_step": 226660, "epoch": 1873} {"train_loss": -40.89286422729492, "global_step": 226661, "epoch": 1873} {"train_loss": -39.068031311035156, "global_step": 226662, "epoch": 1873} {"train_loss": -41.44401931762695, "global_step": 226663, "epoch": 1873} {"train_loss": -40.415096282958984, "global_step": 226664, "epoch": 1873} {"train_loss": -38.560359954833984, "global_step": 226665, "epoch": 1873} {"train_loss": -41.301368713378906, "global_step": 226666, "epoch": 1873} {"train_loss": -41.7854118347168, "global_step": 226667, "epoch": 1873} {"train_loss": -39.60736083984375, "global_step": 226668, "epoch": 1873} {"train_loss": -42.5086784362793, "global_step": 226669, "epoch": 1873} {"train_loss": -41.054317474365234, "global_step": 226670, "epoch": 1873} {"train_loss": -41.22464370727539, "global_step": 226671, "epoch": 1873} {"train_loss": -42.01529312133789, "global_step": 226672, "epoch": 1873} {"train_loss": -41.21159744262695, "global_step": 226673, "epoch": 1873} {"train_loss": -42.01485061645508, "global_step": 226674, "epoch": 1873} {"train_loss": -40.575035095214844, "global_step": 226675, "epoch": 1873} {"train_loss": -41.27543258666992, "global_step": 226676, "epoch": 1873} {"train_loss": -42.65216064453125, "global_step": 226677, "epoch": 1873} {"train_loss": -41.43115997314453, "global_step": 226678, "epoch": 1873} {"train_loss": -41.7802848815918, "global_step": 226679, "epoch": 1873} {"train_loss": -41.13322830200195, "global_step": 226680, "epoch": 1873} {"train_loss": -42.33064651489258, "global_step": 226681, "epoch": 1873} {"train_loss": -41.75244903564453, "global_step": 226682, "epoch": 1873} {"train_loss": -42.504756927490234, "global_step": 226683, "epoch": 1873} {"train_loss": -42.16522979736328, "global_step": 226684, "epoch": 1873} {"train_loss": -41.838600158691406, "global_step": 226685, "epoch": 1873} {"train_loss": -42.1132698059082, "global_step": 226686, "epoch": 1873} {"train_loss": -41.79410934448242, "global_step": 226687, "epoch": 1873} {"train_loss": -42.25709915161133, "global_step": 226688, "epoch": 1873} {"train_loss": -42.341796875, "global_step": 226689, "epoch": 1873} {"train_loss": -42.279510498046875, "global_step": 226690, "epoch": 1873} {"train_loss": -43.0977783203125, "global_step": 226691, "epoch": 1873} {"train_loss": -41.421600341796875, "global_step": 226692, "epoch": 1873} {"train_loss": -42.2213020324707, "global_step": 226693, "epoch": 1873} {"train_loss": -42.75715255737305, "global_step": 226694, "epoch": 1873} {"train_loss": -42.449642181396484, "global_step": 226695, "epoch": 1873} {"train_loss": -42.4455680847168, "global_step": 226696, "epoch": 1873} {"train_loss": -42.66938018798828, "global_step": 226697, "epoch": 1873} {"train_loss": -42.96847152709961, "global_step": 226698, "epoch": 1873} {"train_loss": -43.16838455200195, "global_step": 226699, "epoch": 1873} {"train_loss": -42.43290710449219, "global_step": 226700, "epoch": 1873} {"train_loss": -42.64822769165039, "global_step": 226701, "epoch": 1873} {"train_loss": -43.275394439697266, "global_step": 226702, "epoch": 1873} {"train_loss": -43.04425048828125, "global_step": 226703, "epoch": 1873} {"train_loss": -42.698516845703125, "global_step": 226704, "epoch": 1873} {"train_loss": -42.378501892089844, "global_step": 226705, "epoch": 1873} {"train_loss": -42.584285736083984, "global_step": 226706, "epoch": 1873} {"train_loss": -42.116371154785156, "global_step": 226707, "epoch": 1873} {"train_loss": -42.547332763671875, "global_step": 226708, "epoch": 1873} {"train_loss": -42.73374557495117, "global_step": 226709, "epoch": 1873} {"train_loss": -42.57487106323242, "global_step": 226710, "epoch": 1873} {"train_loss": -42.86118698120117, "global_step": 226711, "epoch": 1873} {"train_loss": -41.79171371459961, "global_step": 226712, "epoch": 1873} {"train_loss": -41.81551742553711, "global_step": 226713, "epoch": 1873} {"train_loss": -42.876338958740234, "global_step": 226714, "epoch": 1873} {"train_loss": -42.13296127319336, "global_step": 226715, "epoch": 1873} {"train_loss": -41.30060958862305, "global_step": 226716, "epoch": 1873} {"train_loss": -42.77838134765625, "global_step": 226717, "epoch": 1873} {"train_loss": -42.1351432800293, "global_step": 226718, "epoch": 1873} {"train_loss": -42.744903564453125, "global_step": 226719, "epoch": 1873} {"train_loss": -42.17518997192383, "global_step": 226720, "epoch": 1873} {"train_loss": -42.65620803833008, "global_step": 226721, "epoch": 1873} {"train_loss": -42.341922760009766, "global_step": 226722, "epoch": 1873} {"train_loss": -41.80961227416992, "global_step": 226723, "epoch": 1873} {"train_loss": -42.40644073486328, "global_step": 226724, "epoch": 1873} {"train_loss": -42.37550735473633, "global_step": 226725, "epoch": 1873} {"train_loss": -41.93217086791992, "global_step": 226726, "epoch": 1873} {"train_loss": -42.1377067565918, "global_step": 226727, "epoch": 1873} {"train_loss": -42.50107955932617, "global_step": 226728, "epoch": 1873} {"train_loss": -42.41426086425781, "global_step": 226729, "epoch": 1873} {"train_loss": -40.47309494018555, "global_step": 226730, "epoch": 1873} {"train_loss": -41.678585052490234, "global_step": 226731, "epoch": 1873} {"train_loss": -42.28731918334961, "global_step": 226732, "epoch": 1873} {"train_loss": -41.496028900146484, "global_step": 226733, "epoch": 1873} {"train_loss": -42.23604965209961, "global_step": 226734, "epoch": 1873} {"train_loss": -42.39646530151367, "global_step": 226735, "epoch": 1873} {"train_loss": -42.1546630859375, "global_step": 226736, "epoch": 1873} {"train_loss": -42.399269104003906, "global_step": 226737, "epoch": 1873} {"train_loss": -42.54914474487305, "global_step": 226738, "epoch": 1873} {"train_loss": -42.3115348815918, "global_step": 226739, "epoch": 1873} {"train_loss": -42.55398178100586, "global_step": 226740, "epoch": 1873} {"train_loss": -42.02452850341797, "global_step": 226741, "epoch": 1873} {"train_loss": -42.4420280456543, "global_step": 226742, "epoch": 1873} {"train_loss": -42.100257873535156, "global_step": 226743, "epoch": 1873} {"train_loss": -42.44392395019531, "global_step": 226744, "epoch": 1873} {"train_loss": -42.47857666015625, "global_step": 226745, "epoch": 1873} {"train_loss": -41.97294235229492, "global_step": 226746, "epoch": 1873} {"train_loss": -42.125648498535156, "global_step": 226747, "epoch": 1873} {"train_loss": -42.33687973022461, "global_step": 226748, "epoch": 1873} {"train_loss": -41.943145751953125, "global_step": 226749, "epoch": 1873} {"train_loss": -42.383419036865234, "global_step": 226750, "epoch": 1873} {"train_loss": -42.95490264892578, "global_step": 226751, "epoch": 1873} {"train_loss": -41.50022506713867, "global_step": 226752, "epoch": 1873} {"train_loss": -41.823579961603336, "global_step": 226753, "epoch": 1873, "val_loss": 2603104.25} {"train_loss": -41.96725845336914, "global_step": 226754, "epoch": 1874} {"train_loss": -40.680267333984375, "global_step": 226755, "epoch": 1874} {"train_loss": -42.26904296875, "global_step": 226756, "epoch": 1874} {"train_loss": -41.99123001098633, "global_step": 226757, "epoch": 1874} {"train_loss": -42.00116729736328, "global_step": 226758, "epoch": 1874} {"train_loss": -42.07926559448242, "global_step": 226759, "epoch": 1874} {"train_loss": -40.92203903198242, "global_step": 226760, "epoch": 1874} {"train_loss": -40.94922637939453, "global_step": 226761, "epoch": 1874} {"train_loss": -41.082393646240234, "global_step": 226762, "epoch": 1874} {"train_loss": -41.73187255859375, "global_step": 226763, "epoch": 1874} {"train_loss": -40.714664459228516, "global_step": 226764, "epoch": 1874} {"train_loss": -41.57381820678711, "global_step": 226765, "epoch": 1874} {"train_loss": -40.69500732421875, "global_step": 226766, "epoch": 1874} {"train_loss": -42.1638069152832, "global_step": 226767, "epoch": 1874} {"train_loss": -41.85274124145508, "global_step": 226768, "epoch": 1874} {"train_loss": -40.785362243652344, "global_step": 226769, "epoch": 1874} {"train_loss": -41.52421569824219, "global_step": 226770, "epoch": 1874} {"train_loss": -41.0763053894043, "global_step": 226771, "epoch": 1874} {"train_loss": -41.724029541015625, "global_step": 226772, "epoch": 1874} {"train_loss": -42.986053466796875, "global_step": 226773, "epoch": 1874} {"train_loss": -41.6216926574707, "global_step": 226774, "epoch": 1874} {"train_loss": -39.9520263671875, "global_step": 226775, "epoch": 1874} {"train_loss": -39.31018829345703, "global_step": 226776, "epoch": 1874} {"train_loss": -40.871334075927734, "global_step": 226777, "epoch": 1874} {"train_loss": -41.23014450073242, "global_step": 226778, "epoch": 1874} {"train_loss": -42.29761505126953, "global_step": 226779, "epoch": 1874} {"train_loss": -38.84368133544922, "global_step": 226780, "epoch": 1874} {"train_loss": -42.31367874145508, "global_step": 226781, "epoch": 1874} {"train_loss": -41.37788009643555, "global_step": 226782, "epoch": 1874} {"train_loss": -41.7192497253418, "global_step": 226783, "epoch": 1874} {"train_loss": -40.61552047729492, "global_step": 226784, "epoch": 1874} {"train_loss": -40.847320556640625, "global_step": 226785, "epoch": 1874} {"train_loss": -39.81207275390625, "global_step": 226786, "epoch": 1874} {"train_loss": -41.87276840209961, "global_step": 226787, "epoch": 1874} {"train_loss": -38.73200607299805, "global_step": 226788, "epoch": 1874} {"train_loss": -41.51130294799805, "global_step": 226789, "epoch": 1874} {"train_loss": -41.996219635009766, "global_step": 226790, "epoch": 1874} {"train_loss": -41.25551986694336, "global_step": 226791, "epoch": 1874} {"train_loss": -41.636756896972656, "global_step": 226792, "epoch": 1874} {"train_loss": -40.07427215576172, "global_step": 226793, "epoch": 1874} {"train_loss": -42.43802261352539, "global_step": 226794, "epoch": 1874} {"train_loss": -40.78736877441406, "global_step": 226795, "epoch": 1874} {"train_loss": -38.8363037109375, "global_step": 226796, "epoch": 1874} {"train_loss": -40.49307632446289, "global_step": 226797, "epoch": 1874} {"train_loss": -41.173828125, "global_step": 226798, "epoch": 1874} {"train_loss": -40.9802131652832, "global_step": 226799, "epoch": 1874} {"train_loss": -40.490333557128906, "global_step": 226800, "epoch": 1874} {"train_loss": -40.38044357299805, "global_step": 226801, "epoch": 1874} {"train_loss": -41.99613571166992, "global_step": 226802, "epoch": 1874} {"train_loss": -41.20531463623047, "global_step": 226803, "epoch": 1874} {"train_loss": -38.07285690307617, "global_step": 226804, "epoch": 1874} {"train_loss": -40.31746292114258, "global_step": 226805, "epoch": 1874} {"train_loss": -40.375030517578125, "global_step": 226806, "epoch": 1874} {"train_loss": -41.11698532104492, "global_step": 226807, "epoch": 1874} {"train_loss": -41.294368743896484, "global_step": 226808, "epoch": 1874} {"train_loss": -40.610107421875, "global_step": 226809, "epoch": 1874} {"train_loss": -42.01581954956055, "global_step": 226810, "epoch": 1874} {"train_loss": -42.09809112548828, "global_step": 226811, "epoch": 1874} {"train_loss": -41.0882682800293, "global_step": 226812, "epoch": 1874} {"train_loss": -41.22846221923828, "global_step": 226813, "epoch": 1874} {"train_loss": -41.7620849609375, "global_step": 226814, "epoch": 1874} {"train_loss": -40.93451690673828, "global_step": 226815, "epoch": 1874} {"train_loss": -41.734615325927734, "global_step": 226816, "epoch": 1874} {"train_loss": -42.02779006958008, "global_step": 226817, "epoch": 1874} {"train_loss": -41.13599395751953, "global_step": 226818, "epoch": 1874} {"train_loss": -39.43189239501953, "global_step": 226819, "epoch": 1874} {"train_loss": -42.09876251220703, "global_step": 226820, "epoch": 1874} {"train_loss": -37.26546859741211, "global_step": 226821, "epoch": 1874} {"train_loss": -40.53961181640625, "global_step": 226822, "epoch": 1874} {"train_loss": -41.51832962036133, "global_step": 226823, "epoch": 1874} {"train_loss": -42.03909683227539, "global_step": 226824, "epoch": 1874} {"train_loss": -42.05036163330078, "global_step": 226825, "epoch": 1874} {"train_loss": -40.41168975830078, "global_step": 226826, "epoch": 1874} {"train_loss": -41.776336669921875, "global_step": 226827, "epoch": 1874} {"train_loss": -42.214996337890625, "global_step": 226828, "epoch": 1874} {"train_loss": -40.09943389892578, "global_step": 226829, "epoch": 1874} {"train_loss": -40.85421371459961, "global_step": 226830, "epoch": 1874} {"train_loss": -40.9121208190918, "global_step": 226831, "epoch": 1874} {"train_loss": -41.80961990356445, "global_step": 226832, "epoch": 1874} {"train_loss": -41.3647346496582, "global_step": 226833, "epoch": 1874} {"train_loss": -42.55611038208008, "global_step": 226834, "epoch": 1874} {"train_loss": -41.81324005126953, "global_step": 226835, "epoch": 1874} {"train_loss": -41.70363235473633, "global_step": 226836, "epoch": 1874} {"train_loss": -42.52061080932617, "global_step": 226837, "epoch": 1874} {"train_loss": -41.92524719238281, "global_step": 226838, "epoch": 1874} {"train_loss": -40.744056701660156, "global_step": 226839, "epoch": 1874} {"train_loss": -40.04978561401367, "global_step": 226840, "epoch": 1874} {"train_loss": -41.19800567626953, "global_step": 226841, "epoch": 1874} {"train_loss": -40.843143463134766, "global_step": 226842, "epoch": 1874} {"train_loss": -41.60767364501953, "global_step": 226843, "epoch": 1874} {"train_loss": -41.99416732788086, "global_step": 226844, "epoch": 1874} {"train_loss": -38.5948600769043, "global_step": 226845, "epoch": 1874} {"train_loss": -40.16935348510742, "global_step": 226846, "epoch": 1874} {"train_loss": -40.99345779418945, "global_step": 226847, "epoch": 1874} {"train_loss": -34.363441467285156, "global_step": 226848, "epoch": 1874} {"train_loss": -41.4676628112793, "global_step": 226849, "epoch": 1874} {"train_loss": -32.34371566772461, "global_step": 226850, "epoch": 1874} {"train_loss": -40.784332275390625, "global_step": 226851, "epoch": 1874} {"train_loss": -41.46786880493164, "global_step": 226852, "epoch": 1874} {"train_loss": -38.222694396972656, "global_step": 226853, "epoch": 1874} {"train_loss": -39.87470245361328, "global_step": 226854, "epoch": 1874} {"train_loss": -37.84189987182617, "global_step": 226855, "epoch": 1874} {"train_loss": -41.655818939208984, "global_step": 226856, "epoch": 1874} {"train_loss": -41.84797286987305, "global_step": 226857, "epoch": 1874} {"train_loss": -40.820289611816406, "global_step": 226858, "epoch": 1874} {"train_loss": -40.42975997924805, "global_step": 226859, "epoch": 1874} {"train_loss": -41.997474670410156, "global_step": 226860, "epoch": 1874} {"train_loss": -40.64127731323242, "global_step": 226861, "epoch": 1874} {"train_loss": -41.69300079345703, "global_step": 226862, "epoch": 1874} {"train_loss": -41.55713653564453, "global_step": 226863, "epoch": 1874} {"train_loss": -41.65205764770508, "global_step": 226864, "epoch": 1874} {"train_loss": -41.344364166259766, "global_step": 226865, "epoch": 1874} {"train_loss": -37.65116500854492, "global_step": 226866, "epoch": 1874} {"train_loss": -40.393558502197266, "global_step": 226867, "epoch": 1874} {"train_loss": -41.232879638671875, "global_step": 226868, "epoch": 1874} {"train_loss": -36.63352584838867, "global_step": 226869, "epoch": 1874} {"train_loss": -40.78384017944336, "global_step": 226870, "epoch": 1874} {"train_loss": -38.23469924926758, "global_step": 226871, "epoch": 1874} {"train_loss": -39.846405029296875, "global_step": 226872, "epoch": 1874} {"train_loss": -40.58574295043945, "global_step": 226873, "epoch": 1874} {"train_loss": -40.83680346780572, "global_step": 226874, "epoch": 1874, "val_loss": 2679305.25} {"train_loss": -40.385467529296875, "global_step": 226875, "epoch": 1875} {"train_loss": -41.89848709106445, "global_step": 226876, "epoch": 1875} {"train_loss": -39.348602294921875, "global_step": 226877, "epoch": 1875} {"train_loss": -40.3661994934082, "global_step": 226878, "epoch": 1875} {"train_loss": -37.06533432006836, "global_step": 226879, "epoch": 1875} {"train_loss": -40.304229736328125, "global_step": 226880, "epoch": 1875} {"train_loss": -34.11708450317383, "global_step": 226881, "epoch": 1875} {"train_loss": -39.73942184448242, "global_step": 226882, "epoch": 1875} {"train_loss": -41.5269775390625, "global_step": 226883, "epoch": 1875} {"train_loss": -41.963348388671875, "global_step": 226884, "epoch": 1875} {"train_loss": -41.30510330200195, "global_step": 226885, "epoch": 1875} {"train_loss": -38.98219299316406, "global_step": 226886, "epoch": 1875} {"train_loss": -28.541488647460938, "global_step": 226887, "epoch": 1875} {"train_loss": -34.922882080078125, "global_step": 226888, "epoch": 1875} {"train_loss": -39.26607131958008, "global_step": 226889, "epoch": 1875} {"train_loss": -40.273616790771484, "global_step": 226890, "epoch": 1875} {"train_loss": -38.257293701171875, "global_step": 226891, "epoch": 1875} {"train_loss": -35.36353302001953, "global_step": 226892, "epoch": 1875} {"train_loss": -38.82024002075195, "global_step": 226893, "epoch": 1875} {"train_loss": -39.91718292236328, "global_step": 226894, "epoch": 1875} {"train_loss": -40.17500686645508, "global_step": 226895, "epoch": 1875} {"train_loss": -41.008235931396484, "global_step": 226896, "epoch": 1875} {"train_loss": -37.90507125854492, "global_step": 226897, "epoch": 1875} {"train_loss": -41.457000732421875, "global_step": 226898, "epoch": 1875} {"train_loss": -38.130069732666016, "global_step": 226899, "epoch": 1875} {"train_loss": -40.05918502807617, "global_step": 226900, "epoch": 1875} {"train_loss": -38.652435302734375, "global_step": 226901, "epoch": 1875} {"train_loss": -39.374977111816406, "global_step": 226902, "epoch": 1875} {"train_loss": -36.11817169189453, "global_step": 226903, "epoch": 1875} {"train_loss": -40.29579162597656, "global_step": 226904, "epoch": 1875} {"train_loss": -39.81840515136719, "global_step": 226905, "epoch": 1875} {"train_loss": -39.86589813232422, "global_step": 226906, "epoch": 1875} {"train_loss": -40.48630142211914, "global_step": 226907, "epoch": 1875} {"train_loss": -39.26282501220703, "global_step": 226908, "epoch": 1875} {"train_loss": -40.24549102783203, "global_step": 226909, "epoch": 1875} {"train_loss": -40.431495666503906, "global_step": 226910, "epoch": 1875} {"train_loss": -40.43227767944336, "global_step": 226911, "epoch": 1875} {"train_loss": -40.81533432006836, "global_step": 226912, "epoch": 1875} {"train_loss": -41.2227897644043, "global_step": 226913, "epoch": 1875} {"train_loss": -41.298927307128906, "global_step": 226914, "epoch": 1875} {"train_loss": -40.642757415771484, "global_step": 226915, "epoch": 1875} {"train_loss": -40.137855529785156, "global_step": 226916, "epoch": 1875} {"train_loss": -41.29964828491211, "global_step": 226917, "epoch": 1875} {"train_loss": -39.70259475708008, "global_step": 226918, "epoch": 1875} {"train_loss": -40.87559509277344, "global_step": 226919, "epoch": 1875} {"train_loss": -41.34186935424805, "global_step": 226920, "epoch": 1875} {"train_loss": -40.499481201171875, "global_step": 226921, "epoch": 1875} {"train_loss": -40.71001434326172, "global_step": 226922, "epoch": 1875} {"train_loss": -38.67153549194336, "global_step": 226923, "epoch": 1875} {"train_loss": -40.99599075317383, "global_step": 226924, "epoch": 1875} {"train_loss": -41.306514739990234, "global_step": 226925, "epoch": 1875} {"train_loss": -41.3836784362793, "global_step": 226926, "epoch": 1875} {"train_loss": -40.09584426879883, "global_step": 226927, "epoch": 1875} {"train_loss": -42.03014373779297, "global_step": 226928, "epoch": 1875} {"train_loss": -41.10248947143555, "global_step": 226929, "epoch": 1875} {"train_loss": -41.8558464050293, "global_step": 226930, "epoch": 1875} {"train_loss": -41.73896408081055, "global_step": 226931, "epoch": 1875} {"train_loss": -40.60426712036133, "global_step": 226932, "epoch": 1875} {"train_loss": -41.875343322753906, "global_step": 226933, "epoch": 1875} {"train_loss": -41.47755813598633, "global_step": 226934, "epoch": 1875} {"train_loss": -41.610267639160156, "global_step": 226935, "epoch": 1875} {"train_loss": -40.760986328125, "global_step": 226936, "epoch": 1875} {"train_loss": -41.718971252441406, "global_step": 226937, "epoch": 1875} {"train_loss": -41.6799430847168, "global_step": 226938, "epoch": 1875} {"train_loss": -40.790035247802734, "global_step": 226939, "epoch": 1875} {"train_loss": -42.01198959350586, "global_step": 226940, "epoch": 1875} {"train_loss": -40.489925384521484, "global_step": 226941, "epoch": 1875} {"train_loss": -41.46356964111328, "global_step": 226942, "epoch": 1875} {"train_loss": -42.238800048828125, "global_step": 226943, "epoch": 1875} {"train_loss": -41.57263946533203, "global_step": 226944, "epoch": 1875} {"train_loss": -41.520870208740234, "global_step": 226945, "epoch": 1875} {"train_loss": -42.22632598876953, "global_step": 226946, "epoch": 1875} {"train_loss": -41.37391662597656, "global_step": 226947, "epoch": 1875} {"train_loss": -41.74921798706055, "global_step": 226948, "epoch": 1875} {"train_loss": -41.81685256958008, "global_step": 226949, "epoch": 1875} {"train_loss": -42.32670211791992, "global_step": 226950, "epoch": 1875} {"train_loss": -42.230079650878906, "global_step": 226951, "epoch": 1875} {"train_loss": -41.629066467285156, "global_step": 226952, "epoch": 1875} {"train_loss": -41.93487548828125, "global_step": 226953, "epoch": 1875} {"train_loss": -42.70622253417969, "global_step": 226954, "epoch": 1875} {"train_loss": -42.0091667175293, "global_step": 226955, "epoch": 1875} {"train_loss": -40.66610336303711, "global_step": 226956, "epoch": 1875} {"train_loss": -42.15128707885742, "global_step": 226957, "epoch": 1875} {"train_loss": -41.61506271362305, "global_step": 226958, "epoch": 1875} {"train_loss": -42.2588996887207, "global_step": 226959, "epoch": 1875} {"train_loss": -41.96718978881836, "global_step": 226960, "epoch": 1875} {"train_loss": -42.030311584472656, "global_step": 226961, "epoch": 1875} {"train_loss": -42.54762649536133, "global_step": 226962, "epoch": 1875} {"train_loss": -42.487972259521484, "global_step": 226963, "epoch": 1875} {"train_loss": -41.811927795410156, "global_step": 226964, "epoch": 1875} {"train_loss": -42.315650939941406, "global_step": 226965, "epoch": 1875} {"train_loss": -42.23293685913086, "global_step": 226966, "epoch": 1875} {"train_loss": -42.1142463684082, "global_step": 226967, "epoch": 1875} {"train_loss": -42.150634765625, "global_step": 226968, "epoch": 1875} {"train_loss": -42.33599090576172, "global_step": 226969, "epoch": 1875} {"train_loss": -42.233455657958984, "global_step": 226970, "epoch": 1875} {"train_loss": -41.800777435302734, "global_step": 226971, "epoch": 1875} {"train_loss": -42.43646240234375, "global_step": 226972, "epoch": 1875} {"train_loss": -42.52981185913086, "global_step": 226973, "epoch": 1875} {"train_loss": -42.605384826660156, "global_step": 226974, "epoch": 1875} {"train_loss": -42.85466003417969, "global_step": 226975, "epoch": 1875} {"train_loss": -42.6969108581543, "global_step": 226976, "epoch": 1875} {"train_loss": -42.310638427734375, "global_step": 226977, "epoch": 1875} {"train_loss": -42.47556686401367, "global_step": 226978, "epoch": 1875} {"train_loss": -42.24919891357422, "global_step": 226979, "epoch": 1875} {"train_loss": -42.38202667236328, "global_step": 226980, "epoch": 1875} {"train_loss": -42.73555374145508, "global_step": 226981, "epoch": 1875} {"train_loss": -42.48801040649414, "global_step": 226982, "epoch": 1875} {"train_loss": -42.05161666870117, "global_step": 226983, "epoch": 1875} {"train_loss": -41.430294036865234, "global_step": 226984, "epoch": 1875} {"train_loss": -42.145076751708984, "global_step": 226985, "epoch": 1875} {"train_loss": -42.84134292602539, "global_step": 226986, "epoch": 1875} {"train_loss": -41.6746711730957, "global_step": 226987, "epoch": 1875} {"train_loss": -42.25567626953125, "global_step": 226988, "epoch": 1875} {"train_loss": -42.52293014526367, "global_step": 226989, "epoch": 1875} {"train_loss": -41.19973373413086, "global_step": 226990, "epoch": 1875} {"train_loss": -41.09659957885742, "global_step": 226991, "epoch": 1875} {"train_loss": -42.49046325683594, "global_step": 226992, "epoch": 1875} {"train_loss": -42.42086410522461, "global_step": 226993, "epoch": 1875} {"train_loss": -42.098812103271484, "global_step": 226994, "epoch": 1875} {"train_loss": -40.91521302530588, "global_step": 226995, "epoch": 1875, "val_loss": 2556185.75} {"train_loss": -42.378292083740234, "global_step": 226996, "epoch": 1876} {"train_loss": -41.560909271240234, "global_step": 226997, "epoch": 1876} {"train_loss": -40.978126525878906, "global_step": 226998, "epoch": 1876} {"train_loss": -41.594276428222656, "global_step": 226999, "epoch": 1876} {"train_loss": -40.51879119873047, "global_step": 227000, "epoch": 1876} {"train_loss": -39.954498291015625, "global_step": 227001, "epoch": 1876} {"train_loss": -41.13505172729492, "global_step": 227002, "epoch": 1876} {"train_loss": -42.13591384887695, "global_step": 227003, "epoch": 1876} {"train_loss": -41.301795959472656, "global_step": 227004, "epoch": 1876} {"train_loss": -42.06426239013672, "global_step": 227005, "epoch": 1876} {"train_loss": -39.979408264160156, "global_step": 227006, "epoch": 1876} {"train_loss": -40.11669921875, "global_step": 227007, "epoch": 1876} {"train_loss": -41.14316940307617, "global_step": 227008, "epoch": 1876} {"train_loss": -41.20503616333008, "global_step": 227009, "epoch": 1876} {"train_loss": -38.424476623535156, "global_step": 227010, "epoch": 1876} {"train_loss": -39.498470306396484, "global_step": 227011, "epoch": 1876} {"train_loss": -40.01955032348633, "global_step": 227012, "epoch": 1876} {"train_loss": -40.87014389038086, "global_step": 227013, "epoch": 1876} {"train_loss": -40.73213577270508, "global_step": 227014, "epoch": 1876} {"train_loss": -41.55012130737305, "global_step": 227015, "epoch": 1876} {"train_loss": -39.324459075927734, "global_step": 227016, "epoch": 1876} {"train_loss": -38.25701904296875, "global_step": 227017, "epoch": 1876} {"train_loss": -39.609920501708984, "global_step": 227018, "epoch": 1876} {"train_loss": -39.7997932434082, "global_step": 227019, "epoch": 1876} {"train_loss": -41.48011016845703, "global_step": 227020, "epoch": 1876} {"train_loss": -40.914485931396484, "global_step": 227021, "epoch": 1876} {"train_loss": -40.38571548461914, "global_step": 227022, "epoch": 1876} {"train_loss": -41.2684440612793, "global_step": 227023, "epoch": 1876} {"train_loss": -40.46477127075195, "global_step": 227024, "epoch": 1876} {"train_loss": -39.871673583984375, "global_step": 227025, "epoch": 1876} {"train_loss": -41.18897247314453, "global_step": 227026, "epoch": 1876} {"train_loss": -40.71773147583008, "global_step": 227027, "epoch": 1876} {"train_loss": -41.542903900146484, "global_step": 227028, "epoch": 1876} {"train_loss": -41.586753845214844, "global_step": 227029, "epoch": 1876} {"train_loss": -41.874000549316406, "global_step": 227030, "epoch": 1876} {"train_loss": -41.57465362548828, "global_step": 227031, "epoch": 1876} {"train_loss": -41.87372589111328, "global_step": 227032, "epoch": 1876} {"train_loss": -42.40924072265625, "global_step": 227033, "epoch": 1876} {"train_loss": -41.94301223754883, "global_step": 227034, "epoch": 1876} {"train_loss": -42.560813903808594, "global_step": 227035, "epoch": 1876} {"train_loss": -42.3634033203125, "global_step": 227036, "epoch": 1876} {"train_loss": -42.063270568847656, "global_step": 227037, "epoch": 1876} {"train_loss": -41.836788177490234, "global_step": 227038, "epoch": 1876} {"train_loss": -42.13585662841797, "global_step": 227039, "epoch": 1876} {"train_loss": -40.73141098022461, "global_step": 227040, "epoch": 1876} {"train_loss": -42.15216064453125, "global_step": 227041, "epoch": 1876} {"train_loss": -25.30280876159668, "global_step": 227042, "epoch": 1876} {"train_loss": -41.70095443725586, "global_step": 227043, "epoch": 1876} {"train_loss": -41.725528717041016, "global_step": 227044, "epoch": 1876} {"train_loss": -40.084712982177734, "global_step": 227045, "epoch": 1876} {"train_loss": -40.025543212890625, "global_step": 227046, "epoch": 1876} {"train_loss": -38.98940658569336, "global_step": 227047, "epoch": 1876} {"train_loss": -40.45621871948242, "global_step": 227048, "epoch": 1876} {"train_loss": -33.39131164550781, "global_step": 227049, "epoch": 1876} {"train_loss": -40.77525329589844, "global_step": 227050, "epoch": 1876} {"train_loss": -40.09507369995117, "global_step": 227051, "epoch": 1876} {"train_loss": -41.20783233642578, "global_step": 227052, "epoch": 1876} {"train_loss": -41.122650146484375, "global_step": 227053, "epoch": 1876} {"train_loss": -40.26166534423828, "global_step": 227054, "epoch": 1876} {"train_loss": -41.49479293823242, "global_step": 227055, "epoch": 1876} {"train_loss": -41.576751708984375, "global_step": 227056, "epoch": 1876} {"train_loss": -41.83308792114258, "global_step": 227057, "epoch": 1876} {"train_loss": -40.60569381713867, "global_step": 227058, "epoch": 1876} {"train_loss": -41.2872428894043, "global_step": 227059, "epoch": 1876} {"train_loss": -42.03647994995117, "global_step": 227060, "epoch": 1876} {"train_loss": -41.26465606689453, "global_step": 227061, "epoch": 1876} {"train_loss": -39.5643424987793, "global_step": 227062, "epoch": 1876} {"train_loss": -41.353633880615234, "global_step": 227063, "epoch": 1876} {"train_loss": -40.98458480834961, "global_step": 227064, "epoch": 1876} {"train_loss": -42.096195220947266, "global_step": 227065, "epoch": 1876} {"train_loss": -41.83989334106445, "global_step": 227066, "epoch": 1876} {"train_loss": -41.17342758178711, "global_step": 227067, "epoch": 1876} {"train_loss": -39.92190170288086, "global_step": 227068, "epoch": 1876} {"train_loss": -39.87618637084961, "global_step": 227069, "epoch": 1876} {"train_loss": -41.06740188598633, "global_step": 227070, "epoch": 1876} {"train_loss": -41.8137092590332, "global_step": 227071, "epoch": 1876} {"train_loss": -41.318092346191406, "global_step": 227072, "epoch": 1876} {"train_loss": -41.3489875793457, "global_step": 227073, "epoch": 1876} {"train_loss": -41.9131965637207, "global_step": 227074, "epoch": 1876} {"train_loss": -41.353309631347656, "global_step": 227075, "epoch": 1876} {"train_loss": -39.14773178100586, "global_step": 227076, "epoch": 1876} {"train_loss": -40.98800277709961, "global_step": 227077, "epoch": 1876} {"train_loss": -41.1527214050293, "global_step": 227078, "epoch": 1876} {"train_loss": -41.90570068359375, "global_step": 227079, "epoch": 1876} {"train_loss": -41.84798049926758, "global_step": 227080, "epoch": 1876} {"train_loss": -42.36524200439453, "global_step": 227081, "epoch": 1876} {"train_loss": -42.28440475463867, "global_step": 227082, "epoch": 1876} {"train_loss": -41.23799514770508, "global_step": 227083, "epoch": 1876} {"train_loss": -41.55022048950195, "global_step": 227084, "epoch": 1876} {"train_loss": -41.10856246948242, "global_step": 227085, "epoch": 1876} {"train_loss": -41.811378479003906, "global_step": 227086, "epoch": 1876} {"train_loss": -42.2650260925293, "global_step": 227087, "epoch": 1876} {"train_loss": -42.39118957519531, "global_step": 227088, "epoch": 1876} {"train_loss": -42.346187591552734, "global_step": 227089, "epoch": 1876} {"train_loss": -40.12846374511719, "global_step": 227090, "epoch": 1876} {"train_loss": -42.2779541015625, "global_step": 227091, "epoch": 1876} {"train_loss": -38.99137496948242, "global_step": 227092, "epoch": 1876} {"train_loss": -40.66140365600586, "global_step": 227093, "epoch": 1876} {"train_loss": -41.99147415161133, "global_step": 227094, "epoch": 1876} {"train_loss": -42.46006393432617, "global_step": 227095, "epoch": 1876} {"train_loss": -40.91915512084961, "global_step": 227096, "epoch": 1876} {"train_loss": -41.25559616088867, "global_step": 227097, "epoch": 1876} {"train_loss": -41.61137771606445, "global_step": 227098, "epoch": 1876} {"train_loss": -41.95246887207031, "global_step": 227099, "epoch": 1876} {"train_loss": -41.52809524536133, "global_step": 227100, "epoch": 1876} {"train_loss": -41.84479904174805, "global_step": 227101, "epoch": 1876} {"train_loss": -42.25763702392578, "global_step": 227102, "epoch": 1876} {"train_loss": -41.77056121826172, "global_step": 227103, "epoch": 1876} {"train_loss": -40.599853515625, "global_step": 227104, "epoch": 1876} {"train_loss": -42.518165588378906, "global_step": 227105, "epoch": 1876} {"train_loss": -40.275428771972656, "global_step": 227106, "epoch": 1876} {"train_loss": -40.605098724365234, "global_step": 227107, "epoch": 1876} {"train_loss": -40.08568572998047, "global_step": 227108, "epoch": 1876} {"train_loss": -41.39675521850586, "global_step": 227109, "epoch": 1876} {"train_loss": -41.061058044433594, "global_step": 227110, "epoch": 1876} {"train_loss": -42.2928581237793, "global_step": 227111, "epoch": 1876} {"train_loss": -42.07909393310547, "global_step": 227112, "epoch": 1876} {"train_loss": -41.63112258911133, "global_step": 227113, "epoch": 1876} {"train_loss": -40.43412780761719, "global_step": 227114, "epoch": 1876} {"train_loss": -41.908180236816406, "global_step": 227115, "epoch": 1876} {"train_loss": -40.96971056283998, "global_step": 227116, "epoch": 1876, "val_loss": 2631553.5} {"train_loss": -40.9254035949707, "global_step": 227117, "epoch": 1877} {"train_loss": -40.96583938598633, "global_step": 227118, "epoch": 1877} {"train_loss": -41.42948532104492, "global_step": 227119, "epoch": 1877} {"train_loss": -41.62522506713867, "global_step": 227120, "epoch": 1877} {"train_loss": -40.870643615722656, "global_step": 227121, "epoch": 1877} {"train_loss": -42.251953125, "global_step": 227122, "epoch": 1877} {"train_loss": -39.10966491699219, "global_step": 227123, "epoch": 1877} {"train_loss": -41.26850891113281, "global_step": 227124, "epoch": 1877} {"train_loss": -41.45501708984375, "global_step": 227125, "epoch": 1877} {"train_loss": -41.0350227355957, "global_step": 227126, "epoch": 1877} {"train_loss": -41.88322830200195, "global_step": 227127, "epoch": 1877} {"train_loss": -41.675384521484375, "global_step": 227128, "epoch": 1877} {"train_loss": -40.93137741088867, "global_step": 227129, "epoch": 1877} {"train_loss": -41.72364807128906, "global_step": 227130, "epoch": 1877} {"train_loss": -42.630245208740234, "global_step": 227131, "epoch": 1877} {"train_loss": -40.68752670288086, "global_step": 227132, "epoch": 1877} {"train_loss": -41.701534271240234, "global_step": 227133, "epoch": 1877} {"train_loss": -42.25605392456055, "global_step": 227134, "epoch": 1877} {"train_loss": -40.36286544799805, "global_step": 227135, "epoch": 1877} {"train_loss": -41.37584686279297, "global_step": 227136, "epoch": 1877} {"train_loss": -42.39336013793945, "global_step": 227137, "epoch": 1877} {"train_loss": -42.16428756713867, "global_step": 227138, "epoch": 1877} {"train_loss": -42.473506927490234, "global_step": 227139, "epoch": 1877} {"train_loss": -41.72446823120117, "global_step": 227140, "epoch": 1877} {"train_loss": -42.37946701049805, "global_step": 227141, "epoch": 1877} {"train_loss": -34.608673095703125, "global_step": 227142, "epoch": 1877} {"train_loss": -42.0789680480957, "global_step": 227143, "epoch": 1877} {"train_loss": -41.58039474487305, "global_step": 227144, "epoch": 1877} {"train_loss": -41.24471664428711, "global_step": 227145, "epoch": 1877} {"train_loss": -41.603145599365234, "global_step": 227146, "epoch": 1877} {"train_loss": -41.06454086303711, "global_step": 227147, "epoch": 1877} {"train_loss": -38.61550521850586, "global_step": 227148, "epoch": 1877} {"train_loss": -40.1098518371582, "global_step": 227149, "epoch": 1877} {"train_loss": -39.68893051147461, "global_step": 227150, "epoch": 1877} {"train_loss": -40.33050537109375, "global_step": 227151, "epoch": 1877} {"train_loss": -40.493736267089844, "global_step": 227152, "epoch": 1877} {"train_loss": -29.863691329956055, "global_step": 227153, "epoch": 1877} {"train_loss": -37.75691604614258, "global_step": 227154, "epoch": 1877} {"train_loss": -40.985145568847656, "global_step": 227155, "epoch": 1877} {"train_loss": -40.5008544921875, "global_step": 227156, "epoch": 1877} {"train_loss": -40.6942024230957, "global_step": 227157, "epoch": 1877} {"train_loss": -39.001583099365234, "global_step": 227158, "epoch": 1877} {"train_loss": -41.16201400756836, "global_step": 227159, "epoch": 1877} {"train_loss": -39.93406677246094, "global_step": 227160, "epoch": 1877} {"train_loss": -39.25950241088867, "global_step": 227161, "epoch": 1877} {"train_loss": -39.6704216003418, "global_step": 227162, "epoch": 1877} {"train_loss": -40.49806594848633, "global_step": 227163, "epoch": 1877} {"train_loss": -38.66254806518555, "global_step": 227164, "epoch": 1877} {"train_loss": -38.958858489990234, "global_step": 227165, "epoch": 1877} {"train_loss": -29.546049118041992, "global_step": 227166, "epoch": 1877} {"train_loss": -38.15219497680664, "global_step": 227167, "epoch": 1877} {"train_loss": -40.26826095581055, "global_step": 227168, "epoch": 1877} {"train_loss": -38.53058624267578, "global_step": 227169, "epoch": 1877} {"train_loss": -39.885902404785156, "global_step": 227170, "epoch": 1877} {"train_loss": -35.21255111694336, "global_step": 227171, "epoch": 1877} {"train_loss": -37.926734924316406, "global_step": 227172, "epoch": 1877} {"train_loss": -38.16091537475586, "global_step": 227173, "epoch": 1877} {"train_loss": -36.35840606689453, "global_step": 227174, "epoch": 1877} {"train_loss": -40.24563217163086, "global_step": 227175, "epoch": 1877} {"train_loss": -33.254913330078125, "global_step": 227176, "epoch": 1877} {"train_loss": -37.37498092651367, "global_step": 227177, "epoch": 1877} {"train_loss": -35.28597640991211, "global_step": 227178, "epoch": 1877} {"train_loss": -39.36519241333008, "global_step": 227179, "epoch": 1877} {"train_loss": -38.68712615966797, "global_step": 227180, "epoch": 1877} {"train_loss": -31.843326568603516, "global_step": 227181, "epoch": 1877} {"train_loss": -40.19027328491211, "global_step": 227182, "epoch": 1877} {"train_loss": -36.58835983276367, "global_step": 227183, "epoch": 1877} {"train_loss": -36.363624572753906, "global_step": 227184, "epoch": 1877} {"train_loss": -37.1415901184082, "global_step": 227185, "epoch": 1877} {"train_loss": -39.19281768798828, "global_step": 227186, "epoch": 1877} {"train_loss": -38.739925384521484, "global_step": 227187, "epoch": 1877} {"train_loss": -37.48055648803711, "global_step": 227188, "epoch": 1877} {"train_loss": -38.32655715942383, "global_step": 227189, "epoch": 1877} {"train_loss": -37.71841049194336, "global_step": 227190, "epoch": 1877} {"train_loss": -37.656734466552734, "global_step": 227191, "epoch": 1877} {"train_loss": -38.21525192260742, "global_step": 227192, "epoch": 1877} {"train_loss": -39.2725715637207, "global_step": 227193, "epoch": 1877} {"train_loss": -40.06686019897461, "global_step": 227194, "epoch": 1877} {"train_loss": -40.71171188354492, "global_step": 227195, "epoch": 1877} {"train_loss": -40.7603874206543, "global_step": 227196, "epoch": 1877} {"train_loss": -40.952537536621094, "global_step": 227197, "epoch": 1877} {"train_loss": -40.82938003540039, "global_step": 227198, "epoch": 1877} {"train_loss": -40.36479187011719, "global_step": 227199, "epoch": 1877} {"train_loss": -40.820045471191406, "global_step": 227200, "epoch": 1877} {"train_loss": -40.94639205932617, "global_step": 227201, "epoch": 1877} {"train_loss": -40.520423889160156, "global_step": 227202, "epoch": 1877} {"train_loss": -40.86024856567383, "global_step": 227203, "epoch": 1877} {"train_loss": -41.02578353881836, "global_step": 227204, "epoch": 1877} {"train_loss": -40.31808853149414, "global_step": 227205, "epoch": 1877} {"train_loss": -40.5352668762207, "global_step": 227206, "epoch": 1877} {"train_loss": -41.36873245239258, "global_step": 227207, "epoch": 1877} {"train_loss": -40.11870193481445, "global_step": 227208, "epoch": 1877} {"train_loss": -40.71159744262695, "global_step": 227209, "epoch": 1877} {"train_loss": -40.156959533691406, "global_step": 227210, "epoch": 1877} {"train_loss": -41.264068603515625, "global_step": 227211, "epoch": 1877} {"train_loss": -41.029964447021484, "global_step": 227212, "epoch": 1877} {"train_loss": -41.71022415161133, "global_step": 227213, "epoch": 1877} {"train_loss": -38.403873443603516, "global_step": 227214, "epoch": 1877} {"train_loss": -39.65414047241211, "global_step": 227215, "epoch": 1877} {"train_loss": -41.36227035522461, "global_step": 227216, "epoch": 1877} {"train_loss": -41.32229232788086, "global_step": 227217, "epoch": 1877} {"train_loss": -41.229705810546875, "global_step": 227218, "epoch": 1877} {"train_loss": -41.879940032958984, "global_step": 227219, "epoch": 1877} {"train_loss": -40.72298812866211, "global_step": 227220, "epoch": 1877} {"train_loss": -40.915340423583984, "global_step": 227221, "epoch": 1877} {"train_loss": -41.462459564208984, "global_step": 227222, "epoch": 1877} {"train_loss": -41.34194564819336, "global_step": 227223, "epoch": 1877} {"train_loss": -41.14951705932617, "global_step": 227224, "epoch": 1877} {"train_loss": -41.63920211791992, "global_step": 227225, "epoch": 1877} {"train_loss": -41.72138595581055, "global_step": 227226, "epoch": 1877} {"train_loss": -41.786800384521484, "global_step": 227227, "epoch": 1877} {"train_loss": -39.62665557861328, "global_step": 227228, "epoch": 1877} {"train_loss": -40.512245178222656, "global_step": 227229, "epoch": 1877} {"train_loss": -40.904136657714844, "global_step": 227230, "epoch": 1877} {"train_loss": -41.18229293823242, "global_step": 227231, "epoch": 1877} {"train_loss": -41.71340560913086, "global_step": 227232, "epoch": 1877} {"train_loss": -40.83759307861328, "global_step": 227233, "epoch": 1877} {"train_loss": -41.61280059814453, "global_step": 227234, "epoch": 1877} {"train_loss": -41.478878021240234, "global_step": 227235, "epoch": 1877} {"train_loss": -41.62990188598633, "global_step": 227236, "epoch": 1877} {"train_loss": -39.94589327977709, "global_step": 227237, "epoch": 1877, "val_loss": 2578625.0} {"train_loss": -41.22119140625, "global_step": 227238, "epoch": 1878} {"train_loss": -42.17682647705078, "global_step": 227239, "epoch": 1878} {"train_loss": -41.76057815551758, "global_step": 227240, "epoch": 1878} {"train_loss": -40.7246208190918, "global_step": 227241, "epoch": 1878} {"train_loss": -41.896728515625, "global_step": 227242, "epoch": 1878} {"train_loss": -41.23781967163086, "global_step": 227243, "epoch": 1878} {"train_loss": -42.30637741088867, "global_step": 227244, "epoch": 1878} {"train_loss": -41.490882873535156, "global_step": 227245, "epoch": 1878} {"train_loss": -42.197052001953125, "global_step": 227246, "epoch": 1878} {"train_loss": -41.87200927734375, "global_step": 227247, "epoch": 1878} {"train_loss": -41.581451416015625, "global_step": 227248, "epoch": 1878} {"train_loss": -42.50886535644531, "global_step": 227249, "epoch": 1878} {"train_loss": -41.26195526123047, "global_step": 227250, "epoch": 1878} {"train_loss": -41.2295036315918, "global_step": 227251, "epoch": 1878} {"train_loss": -42.223148345947266, "global_step": 227252, "epoch": 1878} {"train_loss": -41.84807205200195, "global_step": 227253, "epoch": 1878} {"train_loss": -40.59598922729492, "global_step": 227254, "epoch": 1878} {"train_loss": -42.284889221191406, "global_step": 227255, "epoch": 1878} {"train_loss": -41.99370193481445, "global_step": 227256, "epoch": 1878} {"train_loss": -41.932044982910156, "global_step": 227257, "epoch": 1878} {"train_loss": -41.88017272949219, "global_step": 227258, "epoch": 1878} {"train_loss": -39.70097732543945, "global_step": 227259, "epoch": 1878} {"train_loss": -41.978492736816406, "global_step": 227260, "epoch": 1878} {"train_loss": -42.136512756347656, "global_step": 227261, "epoch": 1878} {"train_loss": -41.148284912109375, "global_step": 227262, "epoch": 1878} {"train_loss": -41.708953857421875, "global_step": 227263, "epoch": 1878} {"train_loss": -40.164161682128906, "global_step": 227264, "epoch": 1878} {"train_loss": -40.61222457885742, "global_step": 227265, "epoch": 1878} {"train_loss": -42.407676696777344, "global_step": 227266, "epoch": 1878} {"train_loss": -42.05938720703125, "global_step": 227267, "epoch": 1878} {"train_loss": -42.541439056396484, "global_step": 227268, "epoch": 1878} {"train_loss": -42.098907470703125, "global_step": 227269, "epoch": 1878} {"train_loss": -42.53181838989258, "global_step": 227270, "epoch": 1878} {"train_loss": -39.74101638793945, "global_step": 227271, "epoch": 1878} {"train_loss": -41.66097640991211, "global_step": 227272, "epoch": 1878} {"train_loss": -38.54906463623047, "global_step": 227273, "epoch": 1878} {"train_loss": -41.914642333984375, "global_step": 227274, "epoch": 1878} {"train_loss": -41.736507415771484, "global_step": 227275, "epoch": 1878} {"train_loss": -42.21609115600586, "global_step": 227276, "epoch": 1878} {"train_loss": -39.768184661865234, "global_step": 227277, "epoch": 1878} {"train_loss": -41.98391342163086, "global_step": 227278, "epoch": 1878} {"train_loss": -41.770912170410156, "global_step": 227279, "epoch": 1878} {"train_loss": -41.058902740478516, "global_step": 227280, "epoch": 1878} {"train_loss": -42.4532585144043, "global_step": 227281, "epoch": 1878} {"train_loss": -42.125274658203125, "global_step": 227282, "epoch": 1878} {"train_loss": -41.762760162353516, "global_step": 227283, "epoch": 1878} {"train_loss": -41.77912521362305, "global_step": 227284, "epoch": 1878} {"train_loss": -41.67280960083008, "global_step": 227285, "epoch": 1878} {"train_loss": -41.37101364135742, "global_step": 227286, "epoch": 1878} {"train_loss": -36.005592346191406, "global_step": 227287, "epoch": 1878} {"train_loss": -41.84025192260742, "global_step": 227288, "epoch": 1878} {"train_loss": -41.417640686035156, "global_step": 227289, "epoch": 1878} {"train_loss": -41.99972152709961, "global_step": 227290, "epoch": 1878} {"train_loss": -42.319366455078125, "global_step": 227291, "epoch": 1878} {"train_loss": -39.09619903564453, "global_step": 227292, "epoch": 1878} {"train_loss": -39.4752082824707, "global_step": 227293, "epoch": 1878} {"train_loss": -41.0530891418457, "global_step": 227294, "epoch": 1878} {"train_loss": -41.67686080932617, "global_step": 227295, "epoch": 1878} {"train_loss": -41.832061767578125, "global_step": 227296, "epoch": 1878} {"train_loss": -41.383113861083984, "global_step": 227297, "epoch": 1878} {"train_loss": -38.216590881347656, "global_step": 227298, "epoch": 1878} {"train_loss": -41.02092361450195, "global_step": 227299, "epoch": 1878} {"train_loss": -40.57925033569336, "global_step": 227300, "epoch": 1878} {"train_loss": -41.19070053100586, "global_step": 227301, "epoch": 1878} {"train_loss": -40.64967727661133, "global_step": 227302, "epoch": 1878} {"train_loss": -39.35321807861328, "global_step": 227303, "epoch": 1878} {"train_loss": -41.2297248840332, "global_step": 227304, "epoch": 1878} {"train_loss": -40.94755935668945, "global_step": 227305, "epoch": 1878} {"train_loss": -40.94626998901367, "global_step": 227306, "epoch": 1878} {"train_loss": -38.89463424682617, "global_step": 227307, "epoch": 1878} {"train_loss": -41.29291915893555, "global_step": 227308, "epoch": 1878} {"train_loss": -40.65105056762695, "global_step": 227309, "epoch": 1878} {"train_loss": -39.9071159362793, "global_step": 227310, "epoch": 1878} {"train_loss": -40.55120849609375, "global_step": 227311, "epoch": 1878} {"train_loss": -40.430484771728516, "global_step": 227312, "epoch": 1878} {"train_loss": -41.5318717956543, "global_step": 227313, "epoch": 1878} {"train_loss": -37.3922119140625, "global_step": 227314, "epoch": 1878} {"train_loss": -40.79097366333008, "global_step": 227315, "epoch": 1878} {"train_loss": -39.961849212646484, "global_step": 227316, "epoch": 1878} {"train_loss": -37.07338333129883, "global_step": 227317, "epoch": 1878} {"train_loss": -38.91660690307617, "global_step": 227318, "epoch": 1878} {"train_loss": -39.319061279296875, "global_step": 227319, "epoch": 1878} {"train_loss": -40.62679672241211, "global_step": 227320, "epoch": 1878} {"train_loss": -40.80282211303711, "global_step": 227321, "epoch": 1878} {"train_loss": -40.789791107177734, "global_step": 227322, "epoch": 1878} {"train_loss": -41.25749588012695, "global_step": 227323, "epoch": 1878} {"train_loss": -41.195125579833984, "global_step": 227324, "epoch": 1878} {"train_loss": -39.98975372314453, "global_step": 227325, "epoch": 1878} {"train_loss": -41.49735641479492, "global_step": 227326, "epoch": 1878} {"train_loss": -39.62570571899414, "global_step": 227327, "epoch": 1878} {"train_loss": -40.351863861083984, "global_step": 227328, "epoch": 1878} {"train_loss": -40.67967224121094, "global_step": 227329, "epoch": 1878} {"train_loss": -40.74989318847656, "global_step": 227330, "epoch": 1878} {"train_loss": -41.33689498901367, "global_step": 227331, "epoch": 1878} {"train_loss": -40.49253463745117, "global_step": 227332, "epoch": 1878} {"train_loss": -40.78121566772461, "global_step": 227333, "epoch": 1878} {"train_loss": -41.64906311035156, "global_step": 227334, "epoch": 1878} {"train_loss": -40.45479965209961, "global_step": 227335, "epoch": 1878} {"train_loss": -39.04755783081055, "global_step": 227336, "epoch": 1878} {"train_loss": -40.7867317199707, "global_step": 227337, "epoch": 1878} {"train_loss": -39.27366256713867, "global_step": 227338, "epoch": 1878} {"train_loss": -41.371089935302734, "global_step": 227339, "epoch": 1878} {"train_loss": -41.55475997924805, "global_step": 227340, "epoch": 1878} {"train_loss": -40.3254280090332, "global_step": 227341, "epoch": 1878} {"train_loss": -41.59737777709961, "global_step": 227342, "epoch": 1878} {"train_loss": -41.15745162963867, "global_step": 227343, "epoch": 1878} {"train_loss": -40.22536849975586, "global_step": 227344, "epoch": 1878} {"train_loss": -41.89617156982422, "global_step": 227345, "epoch": 1878} {"train_loss": -42.07849884033203, "global_step": 227346, "epoch": 1878} {"train_loss": -41.37390899658203, "global_step": 227347, "epoch": 1878} {"train_loss": -42.26774597167969, "global_step": 227348, "epoch": 1878} {"train_loss": -41.430423736572266, "global_step": 227349, "epoch": 1878} {"train_loss": -42.157100677490234, "global_step": 227350, "epoch": 1878} {"train_loss": -42.3406867980957, "global_step": 227351, "epoch": 1878} {"train_loss": -42.470176696777344, "global_step": 227352, "epoch": 1878} {"train_loss": -42.17134094238281, "global_step": 227353, "epoch": 1878} {"train_loss": -41.9886360168457, "global_step": 227354, "epoch": 1878} {"train_loss": -41.681007385253906, "global_step": 227355, "epoch": 1878} {"train_loss": -41.40718460083008, "global_step": 227356, "epoch": 1878} {"train_loss": -41.451202392578125, "global_step": 227357, "epoch": 1878} {"train_loss": -41.06346322682278, "global_step": 227358, "epoch": 1878, "val_loss": 2572694.25} {"train_loss": -41.63420486450195, "global_step": 227359, "epoch": 1879} {"train_loss": -42.42774200439453, "global_step": 227360, "epoch": 1879} {"train_loss": -41.847694396972656, "global_step": 227361, "epoch": 1879} {"train_loss": -41.667110443115234, "global_step": 227362, "epoch": 1879} {"train_loss": -42.90535354614258, "global_step": 227363, "epoch": 1879} {"train_loss": -41.93317794799805, "global_step": 227364, "epoch": 1879} {"train_loss": -41.560176849365234, "global_step": 227365, "epoch": 1879} {"train_loss": -41.418296813964844, "global_step": 227366, "epoch": 1879} {"train_loss": -41.2648811340332, "global_step": 227367, "epoch": 1879} {"train_loss": -42.274452209472656, "global_step": 227368, "epoch": 1879} {"train_loss": -42.39987564086914, "global_step": 227369, "epoch": 1879} {"train_loss": -42.0012321472168, "global_step": 227370, "epoch": 1879} {"train_loss": -42.81060791015625, "global_step": 227371, "epoch": 1879} {"train_loss": -42.33846664428711, "global_step": 227372, "epoch": 1879} {"train_loss": -41.90351486206055, "global_step": 227373, "epoch": 1879} {"train_loss": -41.27671432495117, "global_step": 227374, "epoch": 1879} {"train_loss": -41.733421325683594, "global_step": 227375, "epoch": 1879} {"train_loss": -42.30009460449219, "global_step": 227376, "epoch": 1879} {"train_loss": -42.63124084472656, "global_step": 227377, "epoch": 1879} {"train_loss": -43.182315826416016, "global_step": 227378, "epoch": 1879} {"train_loss": -42.59618377685547, "global_step": 227379, "epoch": 1879} {"train_loss": -42.892669677734375, "global_step": 227380, "epoch": 1879} {"train_loss": -41.09497833251953, "global_step": 227381, "epoch": 1879} {"train_loss": -42.52525329589844, "global_step": 227382, "epoch": 1879} {"train_loss": -40.845420837402344, "global_step": 227383, "epoch": 1879} {"train_loss": -40.32794189453125, "global_step": 227384, "epoch": 1879} {"train_loss": -41.67479705810547, "global_step": 227385, "epoch": 1879} {"train_loss": -41.15897750854492, "global_step": 227386, "epoch": 1879} {"train_loss": -42.20881271362305, "global_step": 227387, "epoch": 1879} {"train_loss": -35.53627014160156, "global_step": 227388, "epoch": 1879} {"train_loss": -42.082984924316406, "global_step": 227389, "epoch": 1879} {"train_loss": -41.95160675048828, "global_step": 227390, "epoch": 1879} {"train_loss": -39.85261917114258, "global_step": 227391, "epoch": 1879} {"train_loss": -40.8901481628418, "global_step": 227392, "epoch": 1879} {"train_loss": -40.73214340209961, "global_step": 227393, "epoch": 1879} {"train_loss": -40.33809280395508, "global_step": 227394, "epoch": 1879} {"train_loss": -39.17081832885742, "global_step": 227395, "epoch": 1879} {"train_loss": -40.440765380859375, "global_step": 227396, "epoch": 1879} {"train_loss": -39.539398193359375, "global_step": 227397, "epoch": 1879} {"train_loss": -38.48733139038086, "global_step": 227398, "epoch": 1879} {"train_loss": -40.43056106567383, "global_step": 227399, "epoch": 1879} {"train_loss": -36.242549896240234, "global_step": 227400, "epoch": 1879} {"train_loss": -36.77621078491211, "global_step": 227401, "epoch": 1879} {"train_loss": -38.54402542114258, "global_step": 227402, "epoch": 1879} {"train_loss": -39.61232376098633, "global_step": 227403, "epoch": 1879} {"train_loss": -33.431671142578125, "global_step": 227404, "epoch": 1879} {"train_loss": -37.65164566040039, "global_step": 227405, "epoch": 1879} {"train_loss": -33.58344268798828, "global_step": 227406, "epoch": 1879} {"train_loss": -39.70667266845703, "global_step": 227407, "epoch": 1879} {"train_loss": -35.51578903198242, "global_step": 227408, "epoch": 1879} {"train_loss": -36.340999603271484, "global_step": 227409, "epoch": 1879} {"train_loss": -39.58372116088867, "global_step": 227410, "epoch": 1879} {"train_loss": -35.613555908203125, "global_step": 227411, "epoch": 1879} {"train_loss": -38.293907165527344, "global_step": 227412, "epoch": 1879} {"train_loss": -38.97993469238281, "global_step": 227413, "epoch": 1879} {"train_loss": -37.755306243896484, "global_step": 227414, "epoch": 1879} {"train_loss": -38.77476501464844, "global_step": 227415, "epoch": 1879} {"train_loss": -39.93851852416992, "global_step": 227416, "epoch": 1879} {"train_loss": -39.94517135620117, "global_step": 227417, "epoch": 1879} {"train_loss": -38.06960678100586, "global_step": 227418, "epoch": 1879} {"train_loss": -39.80009078979492, "global_step": 227419, "epoch": 1879} {"train_loss": -40.41394805908203, "global_step": 227420, "epoch": 1879} {"train_loss": -40.19493103027344, "global_step": 227421, "epoch": 1879} {"train_loss": -40.584556579589844, "global_step": 227422, "epoch": 1879} {"train_loss": -40.3255500793457, "global_step": 227423, "epoch": 1879} {"train_loss": -41.09395217895508, "global_step": 227424, "epoch": 1879} {"train_loss": -39.77589797973633, "global_step": 227425, "epoch": 1879} {"train_loss": -39.498905181884766, "global_step": 227426, "epoch": 1879} {"train_loss": -40.34088897705078, "global_step": 227427, "epoch": 1879} {"train_loss": -40.831031799316406, "global_step": 227428, "epoch": 1879} {"train_loss": -40.01349639892578, "global_step": 227429, "epoch": 1879} {"train_loss": -40.56324768066406, "global_step": 227430, "epoch": 1879} {"train_loss": -40.98423385620117, "global_step": 227431, "epoch": 1879} {"train_loss": -40.901527404785156, "global_step": 227432, "epoch": 1879} {"train_loss": -40.89083480834961, "global_step": 227433, "epoch": 1879} {"train_loss": -41.42441940307617, "global_step": 227434, "epoch": 1879} {"train_loss": -40.7189826965332, "global_step": 227435, "epoch": 1879} {"train_loss": -40.8577880859375, "global_step": 227436, "epoch": 1879} {"train_loss": -41.043514251708984, "global_step": 227437, "epoch": 1879} {"train_loss": -41.172298431396484, "global_step": 227438, "epoch": 1879} {"train_loss": -40.915462493896484, "global_step": 227439, "epoch": 1879} {"train_loss": -40.49149703979492, "global_step": 227440, "epoch": 1879} {"train_loss": -41.238948822021484, "global_step": 227441, "epoch": 1879} {"train_loss": -40.92280960083008, "global_step": 227442, "epoch": 1879} {"train_loss": -42.01078414916992, "global_step": 227443, "epoch": 1879} {"train_loss": -41.60236740112305, "global_step": 227444, "epoch": 1879} {"train_loss": -40.97482681274414, "global_step": 227445, "epoch": 1879} {"train_loss": -41.96038055419922, "global_step": 227446, "epoch": 1879} {"train_loss": -40.66897964477539, "global_step": 227447, "epoch": 1879} {"train_loss": -41.43429183959961, "global_step": 227448, "epoch": 1879} {"train_loss": -39.15155792236328, "global_step": 227449, "epoch": 1879} {"train_loss": -40.691558837890625, "global_step": 227450, "epoch": 1879} {"train_loss": -41.82094955444336, "global_step": 227451, "epoch": 1879} {"train_loss": -34.75224685668945, "global_step": 227452, "epoch": 1879} {"train_loss": -41.46980285644531, "global_step": 227453, "epoch": 1879} {"train_loss": -41.48262405395508, "global_step": 227454, "epoch": 1879} {"train_loss": -41.11883544921875, "global_step": 227455, "epoch": 1879} {"train_loss": -40.98773193359375, "global_step": 227456, "epoch": 1879} {"train_loss": -41.505836486816406, "global_step": 227457, "epoch": 1879} {"train_loss": -41.101966857910156, "global_step": 227458, "epoch": 1879} {"train_loss": -42.05302047729492, "global_step": 227459, "epoch": 1879} {"train_loss": -40.54008483886719, "global_step": 227460, "epoch": 1879} {"train_loss": -40.69001007080078, "global_step": 227461, "epoch": 1879} {"train_loss": -40.92399215698242, "global_step": 227462, "epoch": 1879} {"train_loss": -41.24933624267578, "global_step": 227463, "epoch": 1879} {"train_loss": -41.38939666748047, "global_step": 227464, "epoch": 1879} {"train_loss": -40.11006546020508, "global_step": 227465, "epoch": 1879} {"train_loss": -42.322784423828125, "global_step": 227466, "epoch": 1879} {"train_loss": -40.12548828125, "global_step": 227467, "epoch": 1879} {"train_loss": -42.74081039428711, "global_step": 227468, "epoch": 1879} {"train_loss": -39.84782028198242, "global_step": 227469, "epoch": 1879} {"train_loss": -40.203304290771484, "global_step": 227470, "epoch": 1879} {"train_loss": -41.731056213378906, "global_step": 227471, "epoch": 1879} {"train_loss": -40.448387145996094, "global_step": 227472, "epoch": 1879} {"train_loss": -41.52285385131836, "global_step": 227473, "epoch": 1879} {"train_loss": -42.19574737548828, "global_step": 227474, "epoch": 1879} {"train_loss": -42.2733268737793, "global_step": 227475, "epoch": 1879} {"train_loss": -42.0085563659668, "global_step": 227476, "epoch": 1879} {"train_loss": -42.25251770019531, "global_step": 227477, "epoch": 1879} {"train_loss": -41.96150207519531, "global_step": 227478, "epoch": 1879} {"train_loss": -40.556524765392965, "global_step": 227479, "epoch": 1879, "val_loss": 2591929.0} {"train_loss": -42.26887130737305, "global_step": 227480, "epoch": 1880} {"train_loss": -42.04127883911133, "global_step": 227481, "epoch": 1880} {"train_loss": -41.53132247924805, "global_step": 227482, "epoch": 1880} {"train_loss": -41.06244659423828, "global_step": 227483, "epoch": 1880} {"train_loss": -41.88235092163086, "global_step": 227484, "epoch": 1880} {"train_loss": -42.6180419921875, "global_step": 227485, "epoch": 1880} {"train_loss": -42.33674621582031, "global_step": 227486, "epoch": 1880} {"train_loss": -42.88900375366211, "global_step": 227487, "epoch": 1880} {"train_loss": -42.03916931152344, "global_step": 227488, "epoch": 1880} {"train_loss": -42.48301696777344, "global_step": 227489, "epoch": 1880} {"train_loss": -42.36629867553711, "global_step": 227490, "epoch": 1880} {"train_loss": -41.428321838378906, "global_step": 227491, "epoch": 1880} {"train_loss": -42.53366470336914, "global_step": 227492, "epoch": 1880} {"train_loss": -42.652374267578125, "global_step": 227493, "epoch": 1880} {"train_loss": -42.21588134765625, "global_step": 227494, "epoch": 1880} {"train_loss": -42.52651596069336, "global_step": 227495, "epoch": 1880} {"train_loss": -42.948421478271484, "global_step": 227496, "epoch": 1880} {"train_loss": -42.739105224609375, "global_step": 227497, "epoch": 1880} {"train_loss": -42.41254425048828, "global_step": 227498, "epoch": 1880} {"train_loss": -42.2574577331543, "global_step": 227499, "epoch": 1880} {"train_loss": -42.653053283691406, "global_step": 227500, "epoch": 1880} {"train_loss": -42.25843048095703, "global_step": 227501, "epoch": 1880} {"train_loss": -42.700008392333984, "global_step": 227502, "epoch": 1880} {"train_loss": -41.463356018066406, "global_step": 227503, "epoch": 1880} {"train_loss": -42.334835052490234, "global_step": 227504, "epoch": 1880} {"train_loss": -41.8317756652832, "global_step": 227505, "epoch": 1880} {"train_loss": -41.639259338378906, "global_step": 227506, "epoch": 1880} {"train_loss": -42.013893127441406, "global_step": 227507, "epoch": 1880} {"train_loss": -42.54425811767578, "global_step": 227508, "epoch": 1880} {"train_loss": -42.04949951171875, "global_step": 227509, "epoch": 1880} {"train_loss": -37.2761344909668, "global_step": 227510, "epoch": 1880} {"train_loss": -41.761085510253906, "global_step": 227511, "epoch": 1880} {"train_loss": -41.3508186340332, "global_step": 227512, "epoch": 1880} {"train_loss": -40.48140335083008, "global_step": 227513, "epoch": 1880} {"train_loss": -40.647274017333984, "global_step": 227514, "epoch": 1880} {"train_loss": -40.37550735473633, "global_step": 227515, "epoch": 1880} {"train_loss": -40.70463180541992, "global_step": 227516, "epoch": 1880} {"train_loss": -42.106319427490234, "global_step": 227517, "epoch": 1880} {"train_loss": -42.470855712890625, "global_step": 227518, "epoch": 1880} {"train_loss": -41.4715461730957, "global_step": 227519, "epoch": 1880} {"train_loss": -39.87897872924805, "global_step": 227520, "epoch": 1880} {"train_loss": -40.745628356933594, "global_step": 227521, "epoch": 1880} {"train_loss": -42.2602424621582, "global_step": 227522, "epoch": 1880} {"train_loss": -40.97917556762695, "global_step": 227523, "epoch": 1880} {"train_loss": -40.875423431396484, "global_step": 227524, "epoch": 1880} {"train_loss": -38.729095458984375, "global_step": 227525, "epoch": 1880} {"train_loss": -39.35235595703125, "global_step": 227526, "epoch": 1880} {"train_loss": -40.29085922241211, "global_step": 227527, "epoch": 1880} {"train_loss": -40.00820541381836, "global_step": 227528, "epoch": 1880} {"train_loss": -35.710018157958984, "global_step": 227529, "epoch": 1880} {"train_loss": -30.004072189331055, "global_step": 227530, "epoch": 1880} {"train_loss": -31.7659912109375, "global_step": 227531, "epoch": 1880} {"train_loss": -36.00384521484375, "global_step": 227532, "epoch": 1880} {"train_loss": -38.729331970214844, "global_step": 227533, "epoch": 1880} {"train_loss": -37.07722473144531, "global_step": 227534, "epoch": 1880} {"train_loss": -38.269649505615234, "global_step": 227535, "epoch": 1880} {"train_loss": -37.250885009765625, "global_step": 227536, "epoch": 1880} {"train_loss": -36.98763656616211, "global_step": 227537, "epoch": 1880} {"train_loss": -39.689552307128906, "global_step": 227538, "epoch": 1880} {"train_loss": -36.28375244140625, "global_step": 227539, "epoch": 1880} {"train_loss": -38.822906494140625, "global_step": 227540, "epoch": 1880} {"train_loss": -38.90861129760742, "global_step": 227541, "epoch": 1880} {"train_loss": -37.7311897277832, "global_step": 227542, "epoch": 1880} {"train_loss": -39.40180206298828, "global_step": 227543, "epoch": 1880} {"train_loss": -35.71995544433594, "global_step": 227544, "epoch": 1880} {"train_loss": -38.865535736083984, "global_step": 227545, "epoch": 1880} {"train_loss": -37.10584259033203, "global_step": 227546, "epoch": 1880} {"train_loss": -39.90171432495117, "global_step": 227547, "epoch": 1880} {"train_loss": -36.79328536987305, "global_step": 227548, "epoch": 1880} {"train_loss": -40.15555191040039, "global_step": 227549, "epoch": 1880} {"train_loss": -37.323856353759766, "global_step": 227550, "epoch": 1880} {"train_loss": -41.02545928955078, "global_step": 227551, "epoch": 1880} {"train_loss": -37.641265869140625, "global_step": 227552, "epoch": 1880} {"train_loss": -40.63534164428711, "global_step": 227553, "epoch": 1880} {"train_loss": -37.53666305541992, "global_step": 227554, "epoch": 1880} {"train_loss": -40.486690521240234, "global_step": 227555, "epoch": 1880} {"train_loss": -38.622352600097656, "global_step": 227556, "epoch": 1880} {"train_loss": -40.2870979309082, "global_step": 227557, "epoch": 1880} {"train_loss": -39.45656204223633, "global_step": 227558, "epoch": 1880} {"train_loss": -40.195430755615234, "global_step": 227559, "epoch": 1880} {"train_loss": -40.28312683105469, "global_step": 227560, "epoch": 1880} {"train_loss": -40.254302978515625, "global_step": 227561, "epoch": 1880} {"train_loss": -41.012359619140625, "global_step": 227562, "epoch": 1880} {"train_loss": -40.70092010498047, "global_step": 227563, "epoch": 1880} {"train_loss": -41.18207550048828, "global_step": 227564, "epoch": 1880} {"train_loss": -40.899898529052734, "global_step": 227565, "epoch": 1880} {"train_loss": -40.74004364013672, "global_step": 227566, "epoch": 1880} {"train_loss": -41.32331466674805, "global_step": 227567, "epoch": 1880} {"train_loss": -41.0438346862793, "global_step": 227568, "epoch": 1880} {"train_loss": -41.5828857421875, "global_step": 227569, "epoch": 1880} {"train_loss": -41.13117218017578, "global_step": 227570, "epoch": 1880} {"train_loss": -41.37568283081055, "global_step": 227571, "epoch": 1880} {"train_loss": -41.237449645996094, "global_step": 227572, "epoch": 1880} {"train_loss": -41.35055923461914, "global_step": 227573, "epoch": 1880} {"train_loss": -41.16151809692383, "global_step": 227574, "epoch": 1880} {"train_loss": -41.59798049926758, "global_step": 227575, "epoch": 1880} {"train_loss": -41.53780746459961, "global_step": 227576, "epoch": 1880} {"train_loss": -41.42776107788086, "global_step": 227577, "epoch": 1880} {"train_loss": -41.72249221801758, "global_step": 227578, "epoch": 1880} {"train_loss": -41.49336624145508, "global_step": 227579, "epoch": 1880} {"train_loss": -41.64384078979492, "global_step": 227580, "epoch": 1880} {"train_loss": -41.66157913208008, "global_step": 227581, "epoch": 1880} {"train_loss": -41.13496017456055, "global_step": 227582, "epoch": 1880} {"train_loss": -41.447078704833984, "global_step": 227583, "epoch": 1880} {"train_loss": -41.9698600769043, "global_step": 227584, "epoch": 1880} {"train_loss": -40.95963668823242, "global_step": 227585, "epoch": 1880} {"train_loss": -41.88557052612305, "global_step": 227586, "epoch": 1880} {"train_loss": -42.00433349609375, "global_step": 227587, "epoch": 1880} {"train_loss": -41.71963119506836, "global_step": 227588, "epoch": 1880} {"train_loss": -41.90272903442383, "global_step": 227589, "epoch": 1880} {"train_loss": -42.08492660522461, "global_step": 227590, "epoch": 1880} {"train_loss": -41.43770980834961, "global_step": 227591, "epoch": 1880} {"train_loss": -42.23044967651367, "global_step": 227592, "epoch": 1880} {"train_loss": -41.637237548828125, "global_step": 227593, "epoch": 1880} {"train_loss": -42.175289154052734, "global_step": 227594, "epoch": 1880} {"train_loss": -42.07011032104492, "global_step": 227595, "epoch": 1880} {"train_loss": -41.974857330322266, "global_step": 227596, "epoch": 1880} {"train_loss": -42.365352630615234, "global_step": 227597, "epoch": 1880} {"train_loss": -41.60463333129883, "global_step": 227598, "epoch": 1880} {"train_loss": -42.38533401489258, "global_step": 227599, "epoch": 1880} {"train_loss": -40.61020126027509, "global_step": 227600, "epoch": 1880, "val_loss": 2539223.0} {"train_loss": -42.53310775756836, "global_step": 227601, "epoch": 1881} {"train_loss": -41.76013946533203, "global_step": 227602, "epoch": 1881} {"train_loss": -42.561283111572266, "global_step": 227603, "epoch": 1881} {"train_loss": -41.84872055053711, "global_step": 227604, "epoch": 1881} {"train_loss": -42.65877151489258, "global_step": 227605, "epoch": 1881} {"train_loss": -42.2349739074707, "global_step": 227606, "epoch": 1881} {"train_loss": -42.4462890625, "global_step": 227607, "epoch": 1881} {"train_loss": -42.16508865356445, "global_step": 227608, "epoch": 1881} {"train_loss": -42.35567855834961, "global_step": 227609, "epoch": 1881} {"train_loss": -42.08769607543945, "global_step": 227610, "epoch": 1881} {"train_loss": -42.17057800292969, "global_step": 227611, "epoch": 1881} {"train_loss": -42.84159851074219, "global_step": 227612, "epoch": 1881} {"train_loss": -42.175533294677734, "global_step": 227613, "epoch": 1881} {"train_loss": -43.109596252441406, "global_step": 227614, "epoch": 1881} {"train_loss": -41.69259262084961, "global_step": 227615, "epoch": 1881} {"train_loss": -42.56943893432617, "global_step": 227616, "epoch": 1881} {"train_loss": -42.29497528076172, "global_step": 227617, "epoch": 1881} {"train_loss": -42.469207763671875, "global_step": 227618, "epoch": 1881} {"train_loss": -42.95656967163086, "global_step": 227619, "epoch": 1881} {"train_loss": -42.64419174194336, "global_step": 227620, "epoch": 1881} {"train_loss": -42.77568435668945, "global_step": 227621, "epoch": 1881} {"train_loss": -42.75106430053711, "global_step": 227622, "epoch": 1881} {"train_loss": -42.93423843383789, "global_step": 227623, "epoch": 1881} {"train_loss": -41.69034957885742, "global_step": 227624, "epoch": 1881} {"train_loss": -41.821102142333984, "global_step": 227625, "epoch": 1881} {"train_loss": -42.87149429321289, "global_step": 227626, "epoch": 1881} {"train_loss": -42.54888916015625, "global_step": 227627, "epoch": 1881} {"train_loss": -42.9796142578125, "global_step": 227628, "epoch": 1881} {"train_loss": -42.43167495727539, "global_step": 227629, "epoch": 1881} {"train_loss": -41.533634185791016, "global_step": 227630, "epoch": 1881} {"train_loss": -41.120948791503906, "global_step": 227631, "epoch": 1881} {"train_loss": -40.83020782470703, "global_step": 227632, "epoch": 1881} {"train_loss": -41.8317756652832, "global_step": 227633, "epoch": 1881} {"train_loss": -42.23245620727539, "global_step": 227634, "epoch": 1881} {"train_loss": -42.60638427734375, "global_step": 227635, "epoch": 1881} {"train_loss": -41.2186164855957, "global_step": 227636, "epoch": 1881} {"train_loss": -40.631465911865234, "global_step": 227637, "epoch": 1881} {"train_loss": -41.19816589355469, "global_step": 227638, "epoch": 1881} {"train_loss": -42.26467514038086, "global_step": 227639, "epoch": 1881} {"train_loss": -36.910675048828125, "global_step": 227640, "epoch": 1881} {"train_loss": -34.64013671875, "global_step": 227641, "epoch": 1881} {"train_loss": -39.246334075927734, "global_step": 227642, "epoch": 1881} {"train_loss": -41.69962692260742, "global_step": 227643, "epoch": 1881} {"train_loss": -38.223876953125, "global_step": 227644, "epoch": 1881} {"train_loss": -36.75, "global_step": 227645, "epoch": 1881} {"train_loss": -40.339202880859375, "global_step": 227646, "epoch": 1881} {"train_loss": -41.819091796875, "global_step": 227647, "epoch": 1881} {"train_loss": -40.676937103271484, "global_step": 227648, "epoch": 1881} {"train_loss": -39.003353118896484, "global_step": 227649, "epoch": 1881} {"train_loss": -42.208675384521484, "global_step": 227650, "epoch": 1881} {"train_loss": -40.36416244506836, "global_step": 227651, "epoch": 1881} {"train_loss": -41.502540588378906, "global_step": 227652, "epoch": 1881} {"train_loss": -39.76234436035156, "global_step": 227653, "epoch": 1881} {"train_loss": -41.13247299194336, "global_step": 227654, "epoch": 1881} {"train_loss": -41.03123092651367, "global_step": 227655, "epoch": 1881} {"train_loss": -40.554054260253906, "global_step": 227656, "epoch": 1881} {"train_loss": -41.043697357177734, "global_step": 227657, "epoch": 1881} {"train_loss": -40.263057708740234, "global_step": 227658, "epoch": 1881} {"train_loss": -40.78432846069336, "global_step": 227659, "epoch": 1881} {"train_loss": -41.5262565612793, "global_step": 227660, "epoch": 1881} {"train_loss": -41.252803802490234, "global_step": 227661, "epoch": 1881} {"train_loss": -40.82316207885742, "global_step": 227662, "epoch": 1881} {"train_loss": -40.58842849731445, "global_step": 227663, "epoch": 1881} {"train_loss": -40.73480987548828, "global_step": 227664, "epoch": 1881} {"train_loss": -42.4964714050293, "global_step": 227665, "epoch": 1881} {"train_loss": -41.21752166748047, "global_step": 227666, "epoch": 1881} {"train_loss": -42.168373107910156, "global_step": 227667, "epoch": 1881} {"train_loss": -39.583892822265625, "global_step": 227668, "epoch": 1881} {"train_loss": -41.155555725097656, "global_step": 227669, "epoch": 1881} {"train_loss": -41.400203704833984, "global_step": 227670, "epoch": 1881} {"train_loss": -41.822731018066406, "global_step": 227671, "epoch": 1881} {"train_loss": -42.411556243896484, "global_step": 227672, "epoch": 1881} {"train_loss": -42.18895721435547, "global_step": 227673, "epoch": 1881} {"train_loss": -41.6114387512207, "global_step": 227674, "epoch": 1881} {"train_loss": -42.05598068237305, "global_step": 227675, "epoch": 1881} {"train_loss": -40.44085693359375, "global_step": 227676, "epoch": 1881} {"train_loss": -42.040794372558594, "global_step": 227677, "epoch": 1881} {"train_loss": -42.10818099975586, "global_step": 227678, "epoch": 1881} {"train_loss": -39.665687561035156, "global_step": 227679, "epoch": 1881} {"train_loss": -41.52836227416992, "global_step": 227680, "epoch": 1881} {"train_loss": -41.773616790771484, "global_step": 227681, "epoch": 1881} {"train_loss": -41.85770797729492, "global_step": 227682, "epoch": 1881} {"train_loss": -41.542030334472656, "global_step": 227683, "epoch": 1881} {"train_loss": -41.807552337646484, "global_step": 227684, "epoch": 1881} {"train_loss": -42.164249420166016, "global_step": 227685, "epoch": 1881} {"train_loss": -42.17787551879883, "global_step": 227686, "epoch": 1881} {"train_loss": -41.87342071533203, "global_step": 227687, "epoch": 1881} {"train_loss": -41.58199691772461, "global_step": 227688, "epoch": 1881} {"train_loss": -42.1121826171875, "global_step": 227689, "epoch": 1881} {"train_loss": -41.789947509765625, "global_step": 227690, "epoch": 1881} {"train_loss": -42.20314025878906, "global_step": 227691, "epoch": 1881} {"train_loss": -42.52212142944336, "global_step": 227692, "epoch": 1881} {"train_loss": -41.913265228271484, "global_step": 227693, "epoch": 1881} {"train_loss": -39.48383712768555, "global_step": 227694, "epoch": 1881} {"train_loss": -42.21940612792969, "global_step": 227695, "epoch": 1881} {"train_loss": -42.4984245300293, "global_step": 227696, "epoch": 1881} {"train_loss": -40.21192169189453, "global_step": 227697, "epoch": 1881} {"train_loss": -42.58443832397461, "global_step": 227698, "epoch": 1881} {"train_loss": -42.26503372192383, "global_step": 227699, "epoch": 1881} {"train_loss": -42.46515655517578, "global_step": 227700, "epoch": 1881} {"train_loss": -40.63932418823242, "global_step": 227701, "epoch": 1881} {"train_loss": -38.282867431640625, "global_step": 227702, "epoch": 1881} {"train_loss": -41.30820846557617, "global_step": 227703, "epoch": 1881} {"train_loss": -33.0421142578125, "global_step": 227704, "epoch": 1881} {"train_loss": -34.17167282104492, "global_step": 227705, "epoch": 1881} {"train_loss": -34.836280822753906, "global_step": 227706, "epoch": 1881} {"train_loss": -36.873653411865234, "global_step": 227707, "epoch": 1881} {"train_loss": -39.066864013671875, "global_step": 227708, "epoch": 1881} {"train_loss": -29.246923446655273, "global_step": 227709, "epoch": 1881} {"train_loss": -37.865447998046875, "global_step": 227710, "epoch": 1881} {"train_loss": -35.75279998779297, "global_step": 227711, "epoch": 1881} {"train_loss": -40.228397369384766, "global_step": 227712, "epoch": 1881} {"train_loss": -37.55741500854492, "global_step": 227713, "epoch": 1881} {"train_loss": -39.431373596191406, "global_step": 227714, "epoch": 1881} {"train_loss": -39.71448516845703, "global_step": 227715, "epoch": 1881} {"train_loss": -39.39457321166992, "global_step": 227716, "epoch": 1881} {"train_loss": -38.47008514404297, "global_step": 227717, "epoch": 1881} {"train_loss": -39.8818473815918, "global_step": 227718, "epoch": 1881} {"train_loss": -37.41013717651367, "global_step": 227719, "epoch": 1881} {"train_loss": -40.36709213256836, "global_step": 227720, "epoch": 1881} {"train_loss": -40.86020283659628, "global_step": 227721, "epoch": 1881, "val_loss": 2627939.0} {"train_loss": -39.4596061706543, "global_step": 227722, "epoch": 1882} {"train_loss": -40.076847076416016, "global_step": 227723, "epoch": 1882} {"train_loss": -39.646392822265625, "global_step": 227724, "epoch": 1882} {"train_loss": -39.76561737060547, "global_step": 227725, "epoch": 1882} {"train_loss": -40.111976623535156, "global_step": 227726, "epoch": 1882} {"train_loss": -40.791255950927734, "global_step": 227727, "epoch": 1882} {"train_loss": -41.11152648925781, "global_step": 227728, "epoch": 1882} {"train_loss": -39.276878356933594, "global_step": 227729, "epoch": 1882} {"train_loss": -40.06136703491211, "global_step": 227730, "epoch": 1882} {"train_loss": -40.210655212402344, "global_step": 227731, "epoch": 1882} {"train_loss": -40.30446243286133, "global_step": 227732, "epoch": 1882} {"train_loss": -39.77815246582031, "global_step": 227733, "epoch": 1882} {"train_loss": -40.987998962402344, "global_step": 227734, "epoch": 1882} {"train_loss": -40.21114730834961, "global_step": 227735, "epoch": 1882} {"train_loss": -40.72089767456055, "global_step": 227736, "epoch": 1882} {"train_loss": -40.33631134033203, "global_step": 227737, "epoch": 1882} {"train_loss": -40.38072204589844, "global_step": 227738, "epoch": 1882} {"train_loss": -39.78902053833008, "global_step": 227739, "epoch": 1882} {"train_loss": -40.23793029785156, "global_step": 227740, "epoch": 1882} {"train_loss": -39.64234161376953, "global_step": 227741, "epoch": 1882} {"train_loss": -40.6207160949707, "global_step": 227742, "epoch": 1882} {"train_loss": -41.35357666015625, "global_step": 227743, "epoch": 1882} {"train_loss": -41.42414474487305, "global_step": 227744, "epoch": 1882} {"train_loss": -40.33779525756836, "global_step": 227745, "epoch": 1882} {"train_loss": -40.56110763549805, "global_step": 227746, "epoch": 1882} {"train_loss": -40.74568176269531, "global_step": 227747, "epoch": 1882} {"train_loss": -41.60577392578125, "global_step": 227748, "epoch": 1882} {"train_loss": -40.787933349609375, "global_step": 227749, "epoch": 1882} {"train_loss": -40.10000228881836, "global_step": 227750, "epoch": 1882} {"train_loss": -39.54305648803711, "global_step": 227751, "epoch": 1882} {"train_loss": -40.745052337646484, "global_step": 227752, "epoch": 1882} {"train_loss": -40.63821029663086, "global_step": 227753, "epoch": 1882} {"train_loss": -41.096614837646484, "global_step": 227754, "epoch": 1882} {"train_loss": -41.0257682800293, "global_step": 227755, "epoch": 1882} {"train_loss": -41.6983757019043, "global_step": 227756, "epoch": 1882} {"train_loss": -41.155548095703125, "global_step": 227757, "epoch": 1882} {"train_loss": -40.50720977783203, "global_step": 227758, "epoch": 1882} {"train_loss": -41.8675651550293, "global_step": 227759, "epoch": 1882} {"train_loss": -40.956729888916016, "global_step": 227760, "epoch": 1882} {"train_loss": -41.307838439941406, "global_step": 227761, "epoch": 1882} {"train_loss": -41.34958267211914, "global_step": 227762, "epoch": 1882} {"train_loss": -41.67616271972656, "global_step": 227763, "epoch": 1882} {"train_loss": -40.85728073120117, "global_step": 227764, "epoch": 1882} {"train_loss": -41.97530746459961, "global_step": 227765, "epoch": 1882} {"train_loss": -41.7673225402832, "global_step": 227766, "epoch": 1882} {"train_loss": -40.45530319213867, "global_step": 227767, "epoch": 1882} {"train_loss": -41.62173080444336, "global_step": 227768, "epoch": 1882} {"train_loss": -41.76654815673828, "global_step": 227769, "epoch": 1882} {"train_loss": -41.46158981323242, "global_step": 227770, "epoch": 1882} {"train_loss": -41.44522476196289, "global_step": 227771, "epoch": 1882} {"train_loss": -42.669918060302734, "global_step": 227772, "epoch": 1882} {"train_loss": -42.18775177001953, "global_step": 227773, "epoch": 1882} {"train_loss": -42.30683135986328, "global_step": 227774, "epoch": 1882} {"train_loss": -41.97956085205078, "global_step": 227775, "epoch": 1882} {"train_loss": -41.65703582763672, "global_step": 227776, "epoch": 1882} {"train_loss": -42.480712890625, "global_step": 227777, "epoch": 1882} {"train_loss": -42.37916946411133, "global_step": 227778, "epoch": 1882} {"train_loss": -42.0689582824707, "global_step": 227779, "epoch": 1882} {"train_loss": -42.04773712158203, "global_step": 227780, "epoch": 1882} {"train_loss": -42.904212951660156, "global_step": 227781, "epoch": 1882} {"train_loss": -42.19508743286133, "global_step": 227782, "epoch": 1882} {"train_loss": -42.316566467285156, "global_step": 227783, "epoch": 1882} {"train_loss": -40.86686325073242, "global_step": 227784, "epoch": 1882} {"train_loss": -42.11387634277344, "global_step": 227785, "epoch": 1882} {"train_loss": -42.1165657043457, "global_step": 227786, "epoch": 1882} {"train_loss": -42.148983001708984, "global_step": 227787, "epoch": 1882} {"train_loss": -42.13246154785156, "global_step": 227788, "epoch": 1882} {"train_loss": -42.2526741027832, "global_step": 227789, "epoch": 1882} {"train_loss": -40.97488021850586, "global_step": 227790, "epoch": 1882} {"train_loss": -42.16013717651367, "global_step": 227791, "epoch": 1882} {"train_loss": -42.25856399536133, "global_step": 227792, "epoch": 1882} {"train_loss": -42.674522399902344, "global_step": 227793, "epoch": 1882} {"train_loss": -42.22872543334961, "global_step": 227794, "epoch": 1882} {"train_loss": -42.30720138549805, "global_step": 227795, "epoch": 1882} {"train_loss": -42.403682708740234, "global_step": 227796, "epoch": 1882} {"train_loss": -42.1403694152832, "global_step": 227797, "epoch": 1882} {"train_loss": -42.86845779418945, "global_step": 227798, "epoch": 1882} {"train_loss": -42.689308166503906, "global_step": 227799, "epoch": 1882} {"train_loss": -42.526123046875, "global_step": 227800, "epoch": 1882} {"train_loss": -42.49453353881836, "global_step": 227801, "epoch": 1882} {"train_loss": -43.0805549621582, "global_step": 227802, "epoch": 1882} {"train_loss": -42.478668212890625, "global_step": 227803, "epoch": 1882} {"train_loss": -42.47291946411133, "global_step": 227804, "epoch": 1882} {"train_loss": -42.80060958862305, "global_step": 227805, "epoch": 1882} {"train_loss": -42.809120178222656, "global_step": 227806, "epoch": 1882} {"train_loss": -41.75263595581055, "global_step": 227807, "epoch": 1882} {"train_loss": -42.691162109375, "global_step": 227808, "epoch": 1882} {"train_loss": -43.550411224365234, "global_step": 227809, "epoch": 1882} {"train_loss": -42.243194580078125, "global_step": 227810, "epoch": 1882} {"train_loss": -42.187232971191406, "global_step": 227811, "epoch": 1882} {"train_loss": -42.372127532958984, "global_step": 227812, "epoch": 1882} {"train_loss": -42.399940490722656, "global_step": 227813, "epoch": 1882} {"train_loss": -41.3626823425293, "global_step": 227814, "epoch": 1882} {"train_loss": -39.97310256958008, "global_step": 227815, "epoch": 1882} {"train_loss": -42.62679672241211, "global_step": 227816, "epoch": 1882} {"train_loss": -40.69797897338867, "global_step": 227817, "epoch": 1882} {"train_loss": -39.72221755981445, "global_step": 227818, "epoch": 1882} {"train_loss": -40.94740676879883, "global_step": 227819, "epoch": 1882} {"train_loss": -40.1164436340332, "global_step": 227820, "epoch": 1882} {"train_loss": -40.256187438964844, "global_step": 227821, "epoch": 1882} {"train_loss": -41.74946975708008, "global_step": 227822, "epoch": 1882} {"train_loss": -39.954463958740234, "global_step": 227823, "epoch": 1882} {"train_loss": -36.73264694213867, "global_step": 227824, "epoch": 1882} {"train_loss": -39.93531799316406, "global_step": 227825, "epoch": 1882} {"train_loss": -39.70134735107422, "global_step": 227826, "epoch": 1882} {"train_loss": -34.48142623901367, "global_step": 227827, "epoch": 1882} {"train_loss": -29.041234970092773, "global_step": 227828, "epoch": 1882} {"train_loss": -36.636940002441406, "global_step": 227829, "epoch": 1882} {"train_loss": -29.183713912963867, "global_step": 227830, "epoch": 1882} {"train_loss": -34.360687255859375, "global_step": 227831, "epoch": 1882} {"train_loss": -33.7130241394043, "global_step": 227832, "epoch": 1882} {"train_loss": -37.3632698059082, "global_step": 227833, "epoch": 1882} {"train_loss": -33.23904037475586, "global_step": 227834, "epoch": 1882} {"train_loss": -38.41840362548828, "global_step": 227835, "epoch": 1882} {"train_loss": -34.66846466064453, "global_step": 227836, "epoch": 1882} {"train_loss": -37.51617431640625, "global_step": 227837, "epoch": 1882} {"train_loss": -38.07345199584961, "global_step": 227838, "epoch": 1882} {"train_loss": -38.90855026245117, "global_step": 227839, "epoch": 1882} {"train_loss": -38.60076904296875, "global_step": 227840, "epoch": 1882} {"train_loss": -39.03420639038086, "global_step": 227841, "epoch": 1882} {"train_loss": -40.577808979129, "global_step": 227842, "epoch": 1882, "val_loss": 2506976.25} {"train_loss": -38.8684196472168, "global_step": 227843, "epoch": 1883} {"train_loss": -38.438472747802734, "global_step": 227844, "epoch": 1883} {"train_loss": -39.956172943115234, "global_step": 227845, "epoch": 1883} {"train_loss": -38.74911880493164, "global_step": 227846, "epoch": 1883} {"train_loss": -38.75262451171875, "global_step": 227847, "epoch": 1883} {"train_loss": -41.11070251464844, "global_step": 227848, "epoch": 1883} {"train_loss": -40.11354446411133, "global_step": 227849, "epoch": 1883} {"train_loss": -40.02570724487305, "global_step": 227850, "epoch": 1883} {"train_loss": -39.49453353881836, "global_step": 227851, "epoch": 1883} {"train_loss": -41.184383392333984, "global_step": 227852, "epoch": 1883} {"train_loss": -40.04209899902344, "global_step": 227853, "epoch": 1883} {"train_loss": -38.458045959472656, "global_step": 227854, "epoch": 1883} {"train_loss": -40.65909957885742, "global_step": 227855, "epoch": 1883} {"train_loss": -40.235633850097656, "global_step": 227856, "epoch": 1883} {"train_loss": -40.57918167114258, "global_step": 227857, "epoch": 1883} {"train_loss": -40.15150833129883, "global_step": 227858, "epoch": 1883} {"train_loss": -40.63608932495117, "global_step": 227859, "epoch": 1883} {"train_loss": -38.57835006713867, "global_step": 227860, "epoch": 1883} {"train_loss": -39.4907341003418, "global_step": 227861, "epoch": 1883} {"train_loss": -39.96054458618164, "global_step": 227862, "epoch": 1883} {"train_loss": -36.83049011230469, "global_step": 227863, "epoch": 1883} {"train_loss": -40.447662353515625, "global_step": 227864, "epoch": 1883} {"train_loss": -40.296146392822266, "global_step": 227865, "epoch": 1883} {"train_loss": -41.226924896240234, "global_step": 227866, "epoch": 1883} {"train_loss": -41.14454650878906, "global_step": 227867, "epoch": 1883} {"train_loss": -40.692413330078125, "global_step": 227868, "epoch": 1883} {"train_loss": -40.829830169677734, "global_step": 227869, "epoch": 1883} {"train_loss": -39.69800567626953, "global_step": 227870, "epoch": 1883} {"train_loss": -41.37077713012695, "global_step": 227871, "epoch": 1883} {"train_loss": -40.91387939453125, "global_step": 227872, "epoch": 1883} {"train_loss": -41.240135192871094, "global_step": 227873, "epoch": 1883} {"train_loss": -41.61318588256836, "global_step": 227874, "epoch": 1883} {"train_loss": -41.151424407958984, "global_step": 227875, "epoch": 1883} {"train_loss": -41.153358459472656, "global_step": 227876, "epoch": 1883} {"train_loss": -40.65224075317383, "global_step": 227877, "epoch": 1883} {"train_loss": -41.36586380004883, "global_step": 227878, "epoch": 1883} {"train_loss": -39.279693603515625, "global_step": 227879, "epoch": 1883} {"train_loss": -40.564205169677734, "global_step": 227880, "epoch": 1883} {"train_loss": -41.62990188598633, "global_step": 227881, "epoch": 1883} {"train_loss": -41.43014144897461, "global_step": 227882, "epoch": 1883} {"train_loss": -41.14509201049805, "global_step": 227883, "epoch": 1883} {"train_loss": -41.13808822631836, "global_step": 227884, "epoch": 1883} {"train_loss": -41.61579132080078, "global_step": 227885, "epoch": 1883} {"train_loss": -41.29741668701172, "global_step": 227886, "epoch": 1883} {"train_loss": -36.435638427734375, "global_step": 227887, "epoch": 1883} {"train_loss": -41.36564254760742, "global_step": 227888, "epoch": 1883} {"train_loss": -41.62156295776367, "global_step": 227889, "epoch": 1883} {"train_loss": -42.14524459838867, "global_step": 227890, "epoch": 1883} {"train_loss": -41.17878341674805, "global_step": 227891, "epoch": 1883} {"train_loss": -40.961727142333984, "global_step": 227892, "epoch": 1883} {"train_loss": -41.40139389038086, "global_step": 227893, "epoch": 1883} {"train_loss": -41.83523178100586, "global_step": 227894, "epoch": 1883} {"train_loss": -40.738868713378906, "global_step": 227895, "epoch": 1883} {"train_loss": -41.87739944458008, "global_step": 227896, "epoch": 1883} {"train_loss": -41.37276840209961, "global_step": 227897, "epoch": 1883} {"train_loss": -41.58247756958008, "global_step": 227898, "epoch": 1883} {"train_loss": -38.417694091796875, "global_step": 227899, "epoch": 1883} {"train_loss": -41.54319381713867, "global_step": 227900, "epoch": 1883} {"train_loss": -41.5406608581543, "global_step": 227901, "epoch": 1883} {"train_loss": -42.07646560668945, "global_step": 227902, "epoch": 1883} {"train_loss": -41.754695892333984, "global_step": 227903, "epoch": 1883} {"train_loss": -41.33026885986328, "global_step": 227904, "epoch": 1883} {"train_loss": -42.28379440307617, "global_step": 227905, "epoch": 1883} {"train_loss": -41.831233978271484, "global_step": 227906, "epoch": 1883} {"train_loss": -42.434608459472656, "global_step": 227907, "epoch": 1883} {"train_loss": -40.237239837646484, "global_step": 227908, "epoch": 1883} {"train_loss": -40.1720085144043, "global_step": 227909, "epoch": 1883} {"train_loss": -41.3824577331543, "global_step": 227910, "epoch": 1883} {"train_loss": -42.206695556640625, "global_step": 227911, "epoch": 1883} {"train_loss": -42.38152313232422, "global_step": 227912, "epoch": 1883} {"train_loss": -41.70542526245117, "global_step": 227913, "epoch": 1883} {"train_loss": -41.293392181396484, "global_step": 227914, "epoch": 1883} {"train_loss": -42.26420974731445, "global_step": 227915, "epoch": 1883} {"train_loss": -39.900299072265625, "global_step": 227916, "epoch": 1883} {"train_loss": -42.01528549194336, "global_step": 227917, "epoch": 1883} {"train_loss": -41.65509033203125, "global_step": 227918, "epoch": 1883} {"train_loss": -42.58795928955078, "global_step": 227919, "epoch": 1883} {"train_loss": -42.8802604675293, "global_step": 227920, "epoch": 1883} {"train_loss": -41.878326416015625, "global_step": 227921, "epoch": 1883} {"train_loss": -41.67323303222656, "global_step": 227922, "epoch": 1883} {"train_loss": -42.06477737426758, "global_step": 227923, "epoch": 1883} {"train_loss": -41.71077346801758, "global_step": 227924, "epoch": 1883} {"train_loss": -42.365631103515625, "global_step": 227925, "epoch": 1883} {"train_loss": -42.33552169799805, "global_step": 227926, "epoch": 1883} {"train_loss": -42.82981491088867, "global_step": 227927, "epoch": 1883} {"train_loss": -41.48823928833008, "global_step": 227928, "epoch": 1883} {"train_loss": -40.91199493408203, "global_step": 227929, "epoch": 1883} {"train_loss": -41.505496978759766, "global_step": 227930, "epoch": 1883} {"train_loss": -42.86649703979492, "global_step": 227931, "epoch": 1883} {"train_loss": -41.41917037963867, "global_step": 227932, "epoch": 1883} {"train_loss": -38.44179153442383, "global_step": 227933, "epoch": 1883} {"train_loss": -40.74898910522461, "global_step": 227934, "epoch": 1883} {"train_loss": -41.94633102416992, "global_step": 227935, "epoch": 1883} {"train_loss": -39.40752029418945, "global_step": 227936, "epoch": 1883} {"train_loss": -40.423580169677734, "global_step": 227937, "epoch": 1883} {"train_loss": -42.11994552612305, "global_step": 227938, "epoch": 1883} {"train_loss": -39.78878402709961, "global_step": 227939, "epoch": 1883} {"train_loss": -39.974365234375, "global_step": 227940, "epoch": 1883} {"train_loss": -40.23796844482422, "global_step": 227941, "epoch": 1883} {"train_loss": -41.598602294921875, "global_step": 227942, "epoch": 1883} {"train_loss": -41.05641174316406, "global_step": 227943, "epoch": 1883} {"train_loss": -40.48275375366211, "global_step": 227944, "epoch": 1883} {"train_loss": -41.154640197753906, "global_step": 227945, "epoch": 1883} {"train_loss": -41.43598175048828, "global_step": 227946, "epoch": 1883} {"train_loss": -39.62995529174805, "global_step": 227947, "epoch": 1883} {"train_loss": -41.058082580566406, "global_step": 227948, "epoch": 1883} {"train_loss": -42.2504768371582, "global_step": 227949, "epoch": 1883} {"train_loss": -40.29868698120117, "global_step": 227950, "epoch": 1883} {"train_loss": -41.93877029418945, "global_step": 227951, "epoch": 1883} {"train_loss": -41.843238830566406, "global_step": 227952, "epoch": 1883} {"train_loss": -41.225711822509766, "global_step": 227953, "epoch": 1883} {"train_loss": -41.73908615112305, "global_step": 227954, "epoch": 1883} {"train_loss": -42.47883987426758, "global_step": 227955, "epoch": 1883} {"train_loss": -41.36299514770508, "global_step": 227956, "epoch": 1883} {"train_loss": -42.44099044799805, "global_step": 227957, "epoch": 1883} {"train_loss": -42.765289306640625, "global_step": 227958, "epoch": 1883} {"train_loss": -42.4318733215332, "global_step": 227959, "epoch": 1883} {"train_loss": -41.98857498168945, "global_step": 227960, "epoch": 1883} {"train_loss": -42.73908615112305, "global_step": 227961, "epoch": 1883} {"train_loss": -39.078392028808594, "global_step": 227962, "epoch": 1883} {"train_loss": -40.99092212393264, "global_step": 227963, "epoch": 1883, "val_loss": 2555246.25} {"train_loss": -42.5556640625, "global_step": 227964, "epoch": 1884} {"train_loss": -42.03533172607422, "global_step": 227965, "epoch": 1884} {"train_loss": -42.146217346191406, "global_step": 227966, "epoch": 1884} {"train_loss": -42.19179916381836, "global_step": 227967, "epoch": 1884} {"train_loss": -42.45318603515625, "global_step": 227968, "epoch": 1884} {"train_loss": -40.23634719848633, "global_step": 227969, "epoch": 1884} {"train_loss": -40.98957443237305, "global_step": 227970, "epoch": 1884} {"train_loss": -42.01859664916992, "global_step": 227971, "epoch": 1884} {"train_loss": -42.3842887878418, "global_step": 227972, "epoch": 1884} {"train_loss": -41.856075286865234, "global_step": 227973, "epoch": 1884} {"train_loss": -41.49795150756836, "global_step": 227974, "epoch": 1884} {"train_loss": -41.80373001098633, "global_step": 227975, "epoch": 1884} {"train_loss": -42.34834671020508, "global_step": 227976, "epoch": 1884} {"train_loss": -41.65816879272461, "global_step": 227977, "epoch": 1884} {"train_loss": -42.53057861328125, "global_step": 227978, "epoch": 1884} {"train_loss": -41.509010314941406, "global_step": 227979, "epoch": 1884} {"train_loss": -42.70394515991211, "global_step": 227980, "epoch": 1884} {"train_loss": -41.79038619995117, "global_step": 227981, "epoch": 1884} {"train_loss": -42.457923889160156, "global_step": 227982, "epoch": 1884} {"train_loss": -42.4804801940918, "global_step": 227983, "epoch": 1884} {"train_loss": -39.4653434753418, "global_step": 227984, "epoch": 1884} {"train_loss": -41.49898910522461, "global_step": 227985, "epoch": 1884} {"train_loss": -41.84894561767578, "global_step": 227986, "epoch": 1884} {"train_loss": -41.597686767578125, "global_step": 227987, "epoch": 1884} {"train_loss": -41.53215408325195, "global_step": 227988, "epoch": 1884} {"train_loss": -40.968746185302734, "global_step": 227989, "epoch": 1884} {"train_loss": -41.577972412109375, "global_step": 227990, "epoch": 1884} {"train_loss": -41.26533126831055, "global_step": 227991, "epoch": 1884} {"train_loss": -42.03426742553711, "global_step": 227992, "epoch": 1884} {"train_loss": -40.835262298583984, "global_step": 227993, "epoch": 1884} {"train_loss": -42.2496452331543, "global_step": 227994, "epoch": 1884} {"train_loss": -42.17201232910156, "global_step": 227995, "epoch": 1884} {"train_loss": -41.5013542175293, "global_step": 227996, "epoch": 1884} {"train_loss": -42.61347579956055, "global_step": 227997, "epoch": 1884} {"train_loss": -41.51115036010742, "global_step": 227998, "epoch": 1884} {"train_loss": -42.029518127441406, "global_step": 227999, "epoch": 1884} {"train_loss": -42.387264251708984, "global_step": 228000, "epoch": 1884} {"train_loss": -41.899505615234375, "global_step": 228001, "epoch": 1884} {"train_loss": -42.21519088745117, "global_step": 228002, "epoch": 1884} {"train_loss": -42.189083099365234, "global_step": 228003, "epoch": 1884} {"train_loss": -41.890625, "global_step": 228004, "epoch": 1884} {"train_loss": -42.0892219543457, "global_step": 228005, "epoch": 1884} {"train_loss": -41.76356887817383, "global_step": 228006, "epoch": 1884} {"train_loss": -40.63007736206055, "global_step": 228007, "epoch": 1884} {"train_loss": -40.08890914916992, "global_step": 228008, "epoch": 1884} {"train_loss": -41.43158721923828, "global_step": 228009, "epoch": 1884} {"train_loss": -42.12112045288086, "global_step": 228010, "epoch": 1884} {"train_loss": -41.72819137573242, "global_step": 228011, "epoch": 1884} {"train_loss": -40.899288177490234, "global_step": 228012, "epoch": 1884} {"train_loss": -41.09334945678711, "global_step": 228013, "epoch": 1884} {"train_loss": -41.96107482910156, "global_step": 228014, "epoch": 1884} {"train_loss": -42.41282653808594, "global_step": 228015, "epoch": 1884} {"train_loss": -41.514400482177734, "global_step": 228016, "epoch": 1884} {"train_loss": -42.07487106323242, "global_step": 228017, "epoch": 1884} {"train_loss": -41.9571647644043, "global_step": 228018, "epoch": 1884} {"train_loss": -41.000118255615234, "global_step": 228019, "epoch": 1884} {"train_loss": -40.77459716796875, "global_step": 228020, "epoch": 1884} {"train_loss": -41.231327056884766, "global_step": 228021, "epoch": 1884} {"train_loss": -40.8310661315918, "global_step": 228022, "epoch": 1884} {"train_loss": -41.680076599121094, "global_step": 228023, "epoch": 1884} {"train_loss": -40.09824752807617, "global_step": 228024, "epoch": 1884} {"train_loss": -40.66694259643555, "global_step": 228025, "epoch": 1884} {"train_loss": -41.92120361328125, "global_step": 228026, "epoch": 1884} {"train_loss": -41.63978958129883, "global_step": 228027, "epoch": 1884} {"train_loss": -40.78593826293945, "global_step": 228028, "epoch": 1884} {"train_loss": -40.18257522583008, "global_step": 228029, "epoch": 1884} {"train_loss": -41.19776916503906, "global_step": 228030, "epoch": 1884} {"train_loss": -40.131935119628906, "global_step": 228031, "epoch": 1884} {"train_loss": -41.78836441040039, "global_step": 228032, "epoch": 1884} {"train_loss": -41.04301071166992, "global_step": 228033, "epoch": 1884} {"train_loss": -41.43810272216797, "global_step": 228034, "epoch": 1884} {"train_loss": -42.629417419433594, "global_step": 228035, "epoch": 1884} {"train_loss": -41.77206039428711, "global_step": 228036, "epoch": 1884} {"train_loss": -40.61653137207031, "global_step": 228037, "epoch": 1884} {"train_loss": -42.368019104003906, "global_step": 228038, "epoch": 1884} {"train_loss": -41.85918426513672, "global_step": 228039, "epoch": 1884} {"train_loss": -41.67484664916992, "global_step": 228040, "epoch": 1884} {"train_loss": -42.76235580444336, "global_step": 228041, "epoch": 1884} {"train_loss": -41.42119216918945, "global_step": 228042, "epoch": 1884} {"train_loss": -41.64851760864258, "global_step": 228043, "epoch": 1884} {"train_loss": -42.39773178100586, "global_step": 228044, "epoch": 1884} {"train_loss": -41.537322998046875, "global_step": 228045, "epoch": 1884} {"train_loss": -41.74606704711914, "global_step": 228046, "epoch": 1884} {"train_loss": -33.561519622802734, "global_step": 228047, "epoch": 1884} {"train_loss": -41.80012130737305, "global_step": 228048, "epoch": 1884} {"train_loss": -41.46513366699219, "global_step": 228049, "epoch": 1884} {"train_loss": -42.40373611450195, "global_step": 228050, "epoch": 1884} {"train_loss": -41.19725036621094, "global_step": 228051, "epoch": 1884} {"train_loss": -41.14299392700195, "global_step": 228052, "epoch": 1884} {"train_loss": -42.35795974731445, "global_step": 228053, "epoch": 1884} {"train_loss": -42.14956283569336, "global_step": 228054, "epoch": 1884} {"train_loss": -41.501953125, "global_step": 228055, "epoch": 1884} {"train_loss": -42.427616119384766, "global_step": 228056, "epoch": 1884} {"train_loss": -38.870269775390625, "global_step": 228057, "epoch": 1884} {"train_loss": -41.6154670715332, "global_step": 228058, "epoch": 1884} {"train_loss": -42.265682220458984, "global_step": 228059, "epoch": 1884} {"train_loss": -40.35226058959961, "global_step": 228060, "epoch": 1884} {"train_loss": -41.63259506225586, "global_step": 228061, "epoch": 1884} {"train_loss": -41.281063079833984, "global_step": 228062, "epoch": 1884} {"train_loss": -40.326271057128906, "global_step": 228063, "epoch": 1884} {"train_loss": -41.79548263549805, "global_step": 228064, "epoch": 1884} {"train_loss": -41.16162872314453, "global_step": 228065, "epoch": 1884} {"train_loss": -42.21574020385742, "global_step": 228066, "epoch": 1884} {"train_loss": -41.39251708984375, "global_step": 228067, "epoch": 1884} {"train_loss": -42.16535568237305, "global_step": 228068, "epoch": 1884} {"train_loss": -40.94577407836914, "global_step": 228069, "epoch": 1884} {"train_loss": -41.71786117553711, "global_step": 228070, "epoch": 1884} {"train_loss": -42.37891387939453, "global_step": 228071, "epoch": 1884} {"train_loss": -42.297706604003906, "global_step": 228072, "epoch": 1884} {"train_loss": -41.72711181640625, "global_step": 228073, "epoch": 1884} {"train_loss": -41.93671417236328, "global_step": 228074, "epoch": 1884} {"train_loss": -42.167266845703125, "global_step": 228075, "epoch": 1884} {"train_loss": -42.392574310302734, "global_step": 228076, "epoch": 1884} {"train_loss": -41.777652740478516, "global_step": 228077, "epoch": 1884} {"train_loss": -42.620113372802734, "global_step": 228078, "epoch": 1884} {"train_loss": -41.84968185424805, "global_step": 228079, "epoch": 1884} {"train_loss": -42.25931930541992, "global_step": 228080, "epoch": 1884} {"train_loss": -41.2653923034668, "global_step": 228081, "epoch": 1884} {"train_loss": -42.036781311035156, "global_step": 228082, "epoch": 1884} {"train_loss": -42.38507080078125, "global_step": 228083, "epoch": 1884} {"train_loss": -41.588222030765756, "global_step": 228084, "epoch": 1884, "val_loss": 2674414.75} {"train_loss": -42.40487289428711, "global_step": 228085, "epoch": 1885} {"train_loss": -41.655120849609375, "global_step": 228086, "epoch": 1885} {"train_loss": -42.8079948425293, "global_step": 228087, "epoch": 1885} {"train_loss": -42.11249923706055, "global_step": 228088, "epoch": 1885} {"train_loss": -42.678314208984375, "global_step": 228089, "epoch": 1885} {"train_loss": -41.68882751464844, "global_step": 228090, "epoch": 1885} {"train_loss": -42.13941192626953, "global_step": 228091, "epoch": 1885} {"train_loss": -42.21235275268555, "global_step": 228092, "epoch": 1885} {"train_loss": -42.37258529663086, "global_step": 228093, "epoch": 1885} {"train_loss": -42.90189743041992, "global_step": 228094, "epoch": 1885} {"train_loss": -41.9505615234375, "global_step": 228095, "epoch": 1885} {"train_loss": -42.62064743041992, "global_step": 228096, "epoch": 1885} {"train_loss": -42.19009017944336, "global_step": 228097, "epoch": 1885} {"train_loss": -42.22025680541992, "global_step": 228098, "epoch": 1885} {"train_loss": -42.083003997802734, "global_step": 228099, "epoch": 1885} {"train_loss": -41.72140121459961, "global_step": 228100, "epoch": 1885} {"train_loss": -41.986820220947266, "global_step": 228101, "epoch": 1885} {"train_loss": -41.870235443115234, "global_step": 228102, "epoch": 1885} {"train_loss": -40.762550354003906, "global_step": 228103, "epoch": 1885} {"train_loss": -41.38843536376953, "global_step": 228104, "epoch": 1885} {"train_loss": -42.53089904785156, "global_step": 228105, "epoch": 1885} {"train_loss": -42.525611877441406, "global_step": 228106, "epoch": 1885} {"train_loss": -42.25339889526367, "global_step": 228107, "epoch": 1885} {"train_loss": -39.90363693237305, "global_step": 228108, "epoch": 1885} {"train_loss": -38.4593620300293, "global_step": 228109, "epoch": 1885} {"train_loss": -40.75248336791992, "global_step": 228110, "epoch": 1885} {"train_loss": -39.30452346801758, "global_step": 228111, "epoch": 1885} {"train_loss": -40.676029205322266, "global_step": 228112, "epoch": 1885} {"train_loss": -39.742549896240234, "global_step": 228113, "epoch": 1885} {"train_loss": -41.5348014831543, "global_step": 228114, "epoch": 1885} {"train_loss": -39.554473876953125, "global_step": 228115, "epoch": 1885} {"train_loss": -40.56118392944336, "global_step": 228116, "epoch": 1885} {"train_loss": -38.90240478515625, "global_step": 228117, "epoch": 1885} {"train_loss": -41.3348503112793, "global_step": 228118, "epoch": 1885} {"train_loss": -41.32148742675781, "global_step": 228119, "epoch": 1885} {"train_loss": -42.096771240234375, "global_step": 228120, "epoch": 1885} {"train_loss": -39.58061599731445, "global_step": 228121, "epoch": 1885} {"train_loss": -40.5128288269043, "global_step": 228122, "epoch": 1885} {"train_loss": -39.62587356567383, "global_step": 228123, "epoch": 1885} {"train_loss": -39.20448684692383, "global_step": 228124, "epoch": 1885} {"train_loss": -41.49688720703125, "global_step": 228125, "epoch": 1885} {"train_loss": -41.2086067199707, "global_step": 228126, "epoch": 1885} {"train_loss": -40.97840118408203, "global_step": 228127, "epoch": 1885} {"train_loss": -40.0557746887207, "global_step": 228128, "epoch": 1885} {"train_loss": -41.049591064453125, "global_step": 228129, "epoch": 1885} {"train_loss": -41.75813674926758, "global_step": 228130, "epoch": 1885} {"train_loss": -39.99835205078125, "global_step": 228131, "epoch": 1885} {"train_loss": -41.351104736328125, "global_step": 228132, "epoch": 1885} {"train_loss": -41.42216110229492, "global_step": 228133, "epoch": 1885} {"train_loss": -40.90528106689453, "global_step": 228134, "epoch": 1885} {"train_loss": -41.41732406616211, "global_step": 228135, "epoch": 1885} {"train_loss": -36.664337158203125, "global_step": 228136, "epoch": 1885} {"train_loss": -40.71181106567383, "global_step": 228137, "epoch": 1885} {"train_loss": -41.518611907958984, "global_step": 228138, "epoch": 1885} {"train_loss": -39.4111442565918, "global_step": 228139, "epoch": 1885} {"train_loss": -39.89028549194336, "global_step": 228140, "epoch": 1885} {"train_loss": -41.29103469848633, "global_step": 228141, "epoch": 1885} {"train_loss": -40.30588150024414, "global_step": 228142, "epoch": 1885} {"train_loss": -41.68760299682617, "global_step": 228143, "epoch": 1885} {"train_loss": -41.77103042602539, "global_step": 228144, "epoch": 1885} {"train_loss": -42.1552619934082, "global_step": 228145, "epoch": 1885} {"train_loss": -41.8034782409668, "global_step": 228146, "epoch": 1885} {"train_loss": -40.177734375, "global_step": 228147, "epoch": 1885} {"train_loss": -40.8773307800293, "global_step": 228148, "epoch": 1885} {"train_loss": -40.10405731201172, "global_step": 228149, "epoch": 1885} {"train_loss": -40.0899543762207, "global_step": 228150, "epoch": 1885} {"train_loss": -40.15767288208008, "global_step": 228151, "epoch": 1885} {"train_loss": -39.71566390991211, "global_step": 228152, "epoch": 1885} {"train_loss": -39.975460052490234, "global_step": 228153, "epoch": 1885} {"train_loss": -41.995826721191406, "global_step": 228154, "epoch": 1885} {"train_loss": -42.11804962158203, "global_step": 228155, "epoch": 1885} {"train_loss": -42.088775634765625, "global_step": 228156, "epoch": 1885} {"train_loss": -41.06818389892578, "global_step": 228157, "epoch": 1885} {"train_loss": -40.01309585571289, "global_step": 228158, "epoch": 1885} {"train_loss": -42.77899169921875, "global_step": 228159, "epoch": 1885} {"train_loss": -42.39219284057617, "global_step": 228160, "epoch": 1885} {"train_loss": -42.03483963012695, "global_step": 228161, "epoch": 1885} {"train_loss": -39.244510650634766, "global_step": 228162, "epoch": 1885} {"train_loss": -41.92829513549805, "global_step": 228163, "epoch": 1885} {"train_loss": -41.327728271484375, "global_step": 228164, "epoch": 1885} {"train_loss": -42.5704345703125, "global_step": 228165, "epoch": 1885} {"train_loss": -33.60134506225586, "global_step": 228166, "epoch": 1885} {"train_loss": -37.84403610229492, "global_step": 228167, "epoch": 1885} {"train_loss": -33.98276901245117, "global_step": 228168, "epoch": 1885} {"train_loss": -40.89239501953125, "global_step": 228169, "epoch": 1885} {"train_loss": -39.73776626586914, "global_step": 228170, "epoch": 1885} {"train_loss": -39.58087158203125, "global_step": 228171, "epoch": 1885} {"train_loss": -40.9638557434082, "global_step": 228172, "epoch": 1885} {"train_loss": -39.305721282958984, "global_step": 228173, "epoch": 1885} {"train_loss": -42.08308792114258, "global_step": 228174, "epoch": 1885} {"train_loss": -40.058570861816406, "global_step": 228175, "epoch": 1885} {"train_loss": -40.16978073120117, "global_step": 228176, "epoch": 1885} {"train_loss": -40.360164642333984, "global_step": 228177, "epoch": 1885} {"train_loss": -39.75059127807617, "global_step": 228178, "epoch": 1885} {"train_loss": -41.47111129760742, "global_step": 228179, "epoch": 1885} {"train_loss": -40.904632568359375, "global_step": 228180, "epoch": 1885} {"train_loss": -40.98424530029297, "global_step": 228181, "epoch": 1885} {"train_loss": -40.02497863769531, "global_step": 228182, "epoch": 1885} {"train_loss": -40.42188262939453, "global_step": 228183, "epoch": 1885} {"train_loss": -40.733524322509766, "global_step": 228184, "epoch": 1885} {"train_loss": -40.16085433959961, "global_step": 228185, "epoch": 1885} {"train_loss": -39.3929557800293, "global_step": 228186, "epoch": 1885} {"train_loss": -41.372222900390625, "global_step": 228187, "epoch": 1885} {"train_loss": -40.76034164428711, "global_step": 228188, "epoch": 1885} {"train_loss": -37.932003021240234, "global_step": 228189, "epoch": 1885} {"train_loss": -40.57950210571289, "global_step": 228190, "epoch": 1885} {"train_loss": -41.95601272583008, "global_step": 228191, "epoch": 1885} {"train_loss": -42.34481430053711, "global_step": 228192, "epoch": 1885} {"train_loss": -41.86616897583008, "global_step": 228193, "epoch": 1885} {"train_loss": -40.896053314208984, "global_step": 228194, "epoch": 1885} {"train_loss": -39.5606803894043, "global_step": 228195, "epoch": 1885} {"train_loss": -41.23817825317383, "global_step": 228196, "epoch": 1885} {"train_loss": -40.55725860595703, "global_step": 228197, "epoch": 1885} {"train_loss": -41.89940643310547, "global_step": 228198, "epoch": 1885} {"train_loss": -41.88179397583008, "global_step": 228199, "epoch": 1885} {"train_loss": -41.86233901977539, "global_step": 228200, "epoch": 1885} {"train_loss": -42.19866943359375, "global_step": 228201, "epoch": 1885} {"train_loss": -41.37759780883789, "global_step": 228202, "epoch": 1885} {"train_loss": -41.95976638793945, "global_step": 228203, "epoch": 1885} {"train_loss": -41.5294303894043, "global_step": 228204, "epoch": 1885} {"train_loss": -40.89155209754124, "global_step": 228205, "epoch": 1885, "val_loss": 2541533.25} {"train_loss": -40.779720306396484, "global_step": 228206, "epoch": 1886} {"train_loss": -42.01543045043945, "global_step": 228207, "epoch": 1886} {"train_loss": -42.10173797607422, "global_step": 228208, "epoch": 1886} {"train_loss": -41.9542236328125, "global_step": 228209, "epoch": 1886} {"train_loss": -40.400634765625, "global_step": 228210, "epoch": 1886} {"train_loss": -42.70994186401367, "global_step": 228211, "epoch": 1886} {"train_loss": -42.234127044677734, "global_step": 228212, "epoch": 1886} {"train_loss": -40.43058395385742, "global_step": 228213, "epoch": 1886} {"train_loss": -42.099647521972656, "global_step": 228214, "epoch": 1886} {"train_loss": -41.120784759521484, "global_step": 228215, "epoch": 1886} {"train_loss": -41.348602294921875, "global_step": 228216, "epoch": 1886} {"train_loss": -41.871559143066406, "global_step": 228217, "epoch": 1886} {"train_loss": -42.42128372192383, "global_step": 228218, "epoch": 1886} {"train_loss": -43.03524398803711, "global_step": 228219, "epoch": 1886} {"train_loss": -42.154693603515625, "global_step": 228220, "epoch": 1886} {"train_loss": -42.242183685302734, "global_step": 228221, "epoch": 1886} {"train_loss": -42.0110969543457, "global_step": 228222, "epoch": 1886} {"train_loss": -40.775203704833984, "global_step": 228223, "epoch": 1886} {"train_loss": -42.736297607421875, "global_step": 228224, "epoch": 1886} {"train_loss": -42.4248161315918, "global_step": 228225, "epoch": 1886} {"train_loss": -41.665828704833984, "global_step": 228226, "epoch": 1886} {"train_loss": -42.13356399536133, "global_step": 228227, "epoch": 1886} {"train_loss": -42.23398971557617, "global_step": 228228, "epoch": 1886} {"train_loss": -42.03913116455078, "global_step": 228229, "epoch": 1886} {"train_loss": -41.5818977355957, "global_step": 228230, "epoch": 1886} {"train_loss": -42.745086669921875, "global_step": 228231, "epoch": 1886} {"train_loss": -41.935909271240234, "global_step": 228232, "epoch": 1886} {"train_loss": -42.9667854309082, "global_step": 228233, "epoch": 1886} {"train_loss": -41.38297653198242, "global_step": 228234, "epoch": 1886} {"train_loss": -42.37051010131836, "global_step": 228235, "epoch": 1886} {"train_loss": -40.10029602050781, "global_step": 228236, "epoch": 1886} {"train_loss": -41.75557327270508, "global_step": 228237, "epoch": 1886} {"train_loss": -41.6169319152832, "global_step": 228238, "epoch": 1886} {"train_loss": -42.175880432128906, "global_step": 228239, "epoch": 1886} {"train_loss": -40.68791580200195, "global_step": 228240, "epoch": 1886} {"train_loss": -42.38794708251953, "global_step": 228241, "epoch": 1886} {"train_loss": -42.679351806640625, "global_step": 228242, "epoch": 1886} {"train_loss": -42.113399505615234, "global_step": 228243, "epoch": 1886} {"train_loss": -42.019264221191406, "global_step": 228244, "epoch": 1886} {"train_loss": -38.6007080078125, "global_step": 228245, "epoch": 1886} {"train_loss": -42.5040397644043, "global_step": 228246, "epoch": 1886} {"train_loss": -38.524471282958984, "global_step": 228247, "epoch": 1886} {"train_loss": -42.26726150512695, "global_step": 228248, "epoch": 1886} {"train_loss": -42.60379409790039, "global_step": 228249, "epoch": 1886} {"train_loss": -42.61967849731445, "global_step": 228250, "epoch": 1886} {"train_loss": -41.38102340698242, "global_step": 228251, "epoch": 1886} {"train_loss": -33.57502365112305, "global_step": 228252, "epoch": 1886} {"train_loss": -31.880523681640625, "global_step": 228253, "epoch": 1886} {"train_loss": -40.68362045288086, "global_step": 228254, "epoch": 1886} {"train_loss": -35.862464904785156, "global_step": 228255, "epoch": 1886} {"train_loss": -41.918617248535156, "global_step": 228256, "epoch": 1886} {"train_loss": -40.184181213378906, "global_step": 228257, "epoch": 1886} {"train_loss": -36.21171188354492, "global_step": 228258, "epoch": 1886} {"train_loss": -35.2435188293457, "global_step": 228259, "epoch": 1886} {"train_loss": -36.93954086303711, "global_step": 228260, "epoch": 1886} {"train_loss": -35.25054168701172, "global_step": 228261, "epoch": 1886} {"train_loss": -36.75343704223633, "global_step": 228262, "epoch": 1886} {"train_loss": -36.143131256103516, "global_step": 228263, "epoch": 1886} {"train_loss": -40.29413986206055, "global_step": 228264, "epoch": 1886} {"train_loss": -39.204891204833984, "global_step": 228265, "epoch": 1886} {"train_loss": -39.666561126708984, "global_step": 228266, "epoch": 1886} {"train_loss": -36.453346252441406, "global_step": 228267, "epoch": 1886} {"train_loss": -36.94652557373047, "global_step": 228268, "epoch": 1886} {"train_loss": -39.10948944091797, "global_step": 228269, "epoch": 1886} {"train_loss": -26.21494483947754, "global_step": 228270, "epoch": 1886} {"train_loss": -38.26845169067383, "global_step": 228271, "epoch": 1886} {"train_loss": -35.399898529052734, "global_step": 228272, "epoch": 1886} {"train_loss": -39.87146759033203, "global_step": 228273, "epoch": 1886} {"train_loss": -38.854408264160156, "global_step": 228274, "epoch": 1886} {"train_loss": -37.416351318359375, "global_step": 228275, "epoch": 1886} {"train_loss": -39.04952621459961, "global_step": 228276, "epoch": 1886} {"train_loss": -34.01576232910156, "global_step": 228277, "epoch": 1886} {"train_loss": -38.38903045654297, "global_step": 228278, "epoch": 1886} {"train_loss": -34.054500579833984, "global_step": 228279, "epoch": 1886} {"train_loss": -35.71625900268555, "global_step": 228280, "epoch": 1886} {"train_loss": -38.64780807495117, "global_step": 228281, "epoch": 1886} {"train_loss": -40.19855880737305, "global_step": 228282, "epoch": 1886} {"train_loss": -38.149349212646484, "global_step": 228283, "epoch": 1886} {"train_loss": -40.45120620727539, "global_step": 228284, "epoch": 1886} {"train_loss": -36.905426025390625, "global_step": 228285, "epoch": 1886} {"train_loss": -38.40248107910156, "global_step": 228286, "epoch": 1886} {"train_loss": -39.98960494995117, "global_step": 228287, "epoch": 1886} {"train_loss": -38.41755294799805, "global_step": 228288, "epoch": 1886} {"train_loss": -39.02202224731445, "global_step": 228289, "epoch": 1886} {"train_loss": -38.790767669677734, "global_step": 228290, "epoch": 1886} {"train_loss": -40.178279876708984, "global_step": 228291, "epoch": 1886} {"train_loss": -32.35838317871094, "global_step": 228292, "epoch": 1886} {"train_loss": -40.228240966796875, "global_step": 228293, "epoch": 1886} {"train_loss": -37.408973693847656, "global_step": 228294, "epoch": 1886} {"train_loss": -39.882080078125, "global_step": 228295, "epoch": 1886} {"train_loss": -39.5885124206543, "global_step": 228296, "epoch": 1886} {"train_loss": -38.88581466674805, "global_step": 228297, "epoch": 1886} {"train_loss": -36.53511428833008, "global_step": 228298, "epoch": 1886} {"train_loss": -40.30955123901367, "global_step": 228299, "epoch": 1886} {"train_loss": -40.11896514892578, "global_step": 228300, "epoch": 1886} {"train_loss": -40.765380859375, "global_step": 228301, "epoch": 1886} {"train_loss": -37.08136749267578, "global_step": 228302, "epoch": 1886} {"train_loss": -40.59741973876953, "global_step": 228303, "epoch": 1886} {"train_loss": -40.135009765625, "global_step": 228304, "epoch": 1886} {"train_loss": -41.38174819946289, "global_step": 228305, "epoch": 1886} {"train_loss": -39.440032958984375, "global_step": 228306, "epoch": 1886} {"train_loss": -41.21219253540039, "global_step": 228307, "epoch": 1886} {"train_loss": -40.7568244934082, "global_step": 228308, "epoch": 1886} {"train_loss": -40.4626350402832, "global_step": 228309, "epoch": 1886} {"train_loss": -40.63438034057617, "global_step": 228310, "epoch": 1886} {"train_loss": -40.58956527709961, "global_step": 228311, "epoch": 1886} {"train_loss": -40.83259582519531, "global_step": 228312, "epoch": 1886} {"train_loss": -40.576351165771484, "global_step": 228313, "epoch": 1886} {"train_loss": -40.82210922241211, "global_step": 228314, "epoch": 1886} {"train_loss": -40.5760498046875, "global_step": 228315, "epoch": 1886} {"train_loss": -41.10308837890625, "global_step": 228316, "epoch": 1886} {"train_loss": -40.84092330932617, "global_step": 228317, "epoch": 1886} {"train_loss": -40.66298294067383, "global_step": 228318, "epoch": 1886} {"train_loss": -40.96022415161133, "global_step": 228319, "epoch": 1886} {"train_loss": -40.586204528808594, "global_step": 228320, "epoch": 1886} {"train_loss": -40.497955322265625, "global_step": 228321, "epoch": 1886} {"train_loss": -39.63801956176758, "global_step": 228322, "epoch": 1886} {"train_loss": -40.91713333129883, "global_step": 228323, "epoch": 1886} {"train_loss": -39.67179489135742, "global_step": 228324, "epoch": 1886} {"train_loss": -41.53279495239258, "global_step": 228325, "epoch": 1886} {"train_loss": -39.82041983170943, "global_step": 228326, "epoch": 1886, "val_loss": 2596560.25} {"train_loss": -41.19265365600586, "global_step": 228327, "epoch": 1887} {"train_loss": -41.944580078125, "global_step": 228328, "epoch": 1887} {"train_loss": -41.0797119140625, "global_step": 228329, "epoch": 1887} {"train_loss": -41.02602005004883, "global_step": 228330, "epoch": 1887} {"train_loss": -41.301300048828125, "global_step": 228331, "epoch": 1887} {"train_loss": -41.709556579589844, "global_step": 228332, "epoch": 1887} {"train_loss": -41.56953811645508, "global_step": 228333, "epoch": 1887} {"train_loss": -41.82282638549805, "global_step": 228334, "epoch": 1887} {"train_loss": -41.634605407714844, "global_step": 228335, "epoch": 1887} {"train_loss": -41.643409729003906, "global_step": 228336, "epoch": 1887} {"train_loss": -41.716487884521484, "global_step": 228337, "epoch": 1887} {"train_loss": -41.46355056762695, "global_step": 228338, "epoch": 1887} {"train_loss": -41.169498443603516, "global_step": 228339, "epoch": 1887} {"train_loss": -41.349483489990234, "global_step": 228340, "epoch": 1887} {"train_loss": -40.760475158691406, "global_step": 228341, "epoch": 1887} {"train_loss": -41.57886505126953, "global_step": 228342, "epoch": 1887} {"train_loss": -41.771968841552734, "global_step": 228343, "epoch": 1887} {"train_loss": -42.1921501159668, "global_step": 228344, "epoch": 1887} {"train_loss": -42.14190673828125, "global_step": 228345, "epoch": 1887} {"train_loss": -41.634246826171875, "global_step": 228346, "epoch": 1887} {"train_loss": -41.37360763549805, "global_step": 228347, "epoch": 1887} {"train_loss": -41.8176383972168, "global_step": 228348, "epoch": 1887} {"train_loss": -42.264705657958984, "global_step": 228349, "epoch": 1887} {"train_loss": -42.261512756347656, "global_step": 228350, "epoch": 1887} {"train_loss": -42.451507568359375, "global_step": 228351, "epoch": 1887} {"train_loss": -41.537452697753906, "global_step": 228352, "epoch": 1887} {"train_loss": -41.56060791015625, "global_step": 228353, "epoch": 1887} {"train_loss": -42.42346954345703, "global_step": 228354, "epoch": 1887} {"train_loss": -42.41412353515625, "global_step": 228355, "epoch": 1887} {"train_loss": -41.83433151245117, "global_step": 228356, "epoch": 1887} {"train_loss": -42.149322509765625, "global_step": 228357, "epoch": 1887} {"train_loss": -42.15479278564453, "global_step": 228358, "epoch": 1887} {"train_loss": -41.9058952331543, "global_step": 228359, "epoch": 1887} {"train_loss": -42.2967529296875, "global_step": 228360, "epoch": 1887} {"train_loss": -41.988887786865234, "global_step": 228361, "epoch": 1887} {"train_loss": -42.22224426269531, "global_step": 228362, "epoch": 1887} {"train_loss": -41.9215087890625, "global_step": 228363, "epoch": 1887} {"train_loss": -41.80310821533203, "global_step": 228364, "epoch": 1887} {"train_loss": -41.47260284423828, "global_step": 228365, "epoch": 1887} {"train_loss": -42.545387268066406, "global_step": 228366, "epoch": 1887} {"train_loss": -42.3493766784668, "global_step": 228367, "epoch": 1887} {"train_loss": -42.36564254760742, "global_step": 228368, "epoch": 1887} {"train_loss": -42.502471923828125, "global_step": 228369, "epoch": 1887} {"train_loss": -42.67433547973633, "global_step": 228370, "epoch": 1887} {"train_loss": -42.3564453125, "global_step": 228371, "epoch": 1887} {"train_loss": -42.60380935668945, "global_step": 228372, "epoch": 1887} {"train_loss": -42.16779327392578, "global_step": 228373, "epoch": 1887} {"train_loss": -42.64677047729492, "global_step": 228374, "epoch": 1887} {"train_loss": -42.333961486816406, "global_step": 228375, "epoch": 1887} {"train_loss": -40.42477035522461, "global_step": 228376, "epoch": 1887} {"train_loss": -42.05308151245117, "global_step": 228377, "epoch": 1887} {"train_loss": -41.679168701171875, "global_step": 228378, "epoch": 1887} {"train_loss": -40.83522415161133, "global_step": 228379, "epoch": 1887} {"train_loss": -39.365577697753906, "global_step": 228380, "epoch": 1887} {"train_loss": -40.465450286865234, "global_step": 228381, "epoch": 1887} {"train_loss": -42.46079635620117, "global_step": 228382, "epoch": 1887} {"train_loss": -41.93531036376953, "global_step": 228383, "epoch": 1887} {"train_loss": -40.54047393798828, "global_step": 228384, "epoch": 1887} {"train_loss": -40.57737731933594, "global_step": 228385, "epoch": 1887} {"train_loss": -38.770782470703125, "global_step": 228386, "epoch": 1887} {"train_loss": -40.009761810302734, "global_step": 228387, "epoch": 1887} {"train_loss": -42.16993713378906, "global_step": 228388, "epoch": 1887} {"train_loss": -40.91379928588867, "global_step": 228389, "epoch": 1887} {"train_loss": -39.54462814331055, "global_step": 228390, "epoch": 1887} {"train_loss": -41.51905059814453, "global_step": 228391, "epoch": 1887} {"train_loss": -41.92859649658203, "global_step": 228392, "epoch": 1887} {"train_loss": -40.704158782958984, "global_step": 228393, "epoch": 1887} {"train_loss": -41.692115783691406, "global_step": 228394, "epoch": 1887} {"train_loss": -41.94523239135742, "global_step": 228395, "epoch": 1887} {"train_loss": -40.70298385620117, "global_step": 228396, "epoch": 1887} {"train_loss": -41.7318229675293, "global_step": 228397, "epoch": 1887} {"train_loss": -41.93941879272461, "global_step": 228398, "epoch": 1887} {"train_loss": -40.60892868041992, "global_step": 228399, "epoch": 1887} {"train_loss": -39.89647674560547, "global_step": 228400, "epoch": 1887} {"train_loss": -38.40592575073242, "global_step": 228401, "epoch": 1887} {"train_loss": -39.78365707397461, "global_step": 228402, "epoch": 1887} {"train_loss": -41.894710540771484, "global_step": 228403, "epoch": 1887} {"train_loss": -41.14616012573242, "global_step": 228404, "epoch": 1887} {"train_loss": -39.92648696899414, "global_step": 228405, "epoch": 1887} {"train_loss": -41.251041412353516, "global_step": 228406, "epoch": 1887} {"train_loss": -39.91920852661133, "global_step": 228407, "epoch": 1887} {"train_loss": -39.051570892333984, "global_step": 228408, "epoch": 1887} {"train_loss": -40.66523361206055, "global_step": 228409, "epoch": 1887} {"train_loss": -40.86750030517578, "global_step": 228410, "epoch": 1887} {"train_loss": -40.88543701171875, "global_step": 228411, "epoch": 1887} {"train_loss": -40.310787200927734, "global_step": 228412, "epoch": 1887} {"train_loss": -41.19267272949219, "global_step": 228413, "epoch": 1887} {"train_loss": -41.732276916503906, "global_step": 228414, "epoch": 1887} {"train_loss": -40.85091781616211, "global_step": 228415, "epoch": 1887} {"train_loss": -42.42709732055664, "global_step": 228416, "epoch": 1887} {"train_loss": -42.26823425292969, "global_step": 228417, "epoch": 1887} {"train_loss": -41.59587860107422, "global_step": 228418, "epoch": 1887} {"train_loss": -41.70453643798828, "global_step": 228419, "epoch": 1887} {"train_loss": -41.92207336425781, "global_step": 228420, "epoch": 1887} {"train_loss": -41.3011474609375, "global_step": 228421, "epoch": 1887} {"train_loss": -41.83320999145508, "global_step": 228422, "epoch": 1887} {"train_loss": -41.723384857177734, "global_step": 228423, "epoch": 1887} {"train_loss": -41.56586837768555, "global_step": 228424, "epoch": 1887} {"train_loss": -41.90282440185547, "global_step": 228425, "epoch": 1887} {"train_loss": -42.240665435791016, "global_step": 228426, "epoch": 1887} {"train_loss": -42.3661994934082, "global_step": 228427, "epoch": 1887} {"train_loss": -41.90918731689453, "global_step": 228428, "epoch": 1887} {"train_loss": -42.202125549316406, "global_step": 228429, "epoch": 1887} {"train_loss": -42.31136703491211, "global_step": 228430, "epoch": 1887} {"train_loss": -42.30582046508789, "global_step": 228431, "epoch": 1887} {"train_loss": -40.766014099121094, "global_step": 228432, "epoch": 1887} {"train_loss": -41.925533294677734, "global_step": 228433, "epoch": 1887} {"train_loss": -41.98472595214844, "global_step": 228434, "epoch": 1887} {"train_loss": -42.1427001953125, "global_step": 228435, "epoch": 1887} {"train_loss": -41.23505401611328, "global_step": 228436, "epoch": 1887} {"train_loss": -42.40922927856445, "global_step": 228437, "epoch": 1887} {"train_loss": -41.38687515258789, "global_step": 228438, "epoch": 1887} {"train_loss": -42.020389556884766, "global_step": 228439, "epoch": 1887} {"train_loss": -41.08370590209961, "global_step": 228440, "epoch": 1887} {"train_loss": -41.41219711303711, "global_step": 228441, "epoch": 1887} {"train_loss": -40.279659271240234, "global_step": 228442, "epoch": 1887} {"train_loss": -40.66572952270508, "global_step": 228443, "epoch": 1887} {"train_loss": -39.9763069152832, "global_step": 228444, "epoch": 1887} {"train_loss": -40.51362991333008, "global_step": 228445, "epoch": 1887} {"train_loss": -39.7049446105957, "global_step": 228446, "epoch": 1887} {"train_loss": -41.46229449185458, "global_step": 228447, "epoch": 1887, "val_loss": 2580446.25} {"train_loss": -40.8667106628418, "global_step": 228448, "epoch": 1888} {"train_loss": -41.375858306884766, "global_step": 228449, "epoch": 1888} {"train_loss": -42.199649810791016, "global_step": 228450, "epoch": 1888} {"train_loss": -42.463050842285156, "global_step": 228451, "epoch": 1888} {"train_loss": -40.63241195678711, "global_step": 228452, "epoch": 1888} {"train_loss": -39.937828063964844, "global_step": 228453, "epoch": 1888} {"train_loss": -38.522586822509766, "global_step": 228454, "epoch": 1888} {"train_loss": -41.96961975097656, "global_step": 228455, "epoch": 1888} {"train_loss": -41.06504440307617, "global_step": 228456, "epoch": 1888} {"train_loss": -39.70795440673828, "global_step": 228457, "epoch": 1888} {"train_loss": -41.3017692565918, "global_step": 228458, "epoch": 1888} {"train_loss": -41.510414123535156, "global_step": 228459, "epoch": 1888} {"train_loss": -39.91685104370117, "global_step": 228460, "epoch": 1888} {"train_loss": -42.026580810546875, "global_step": 228461, "epoch": 1888} {"train_loss": -41.29574203491211, "global_step": 228462, "epoch": 1888} {"train_loss": -39.15903854370117, "global_step": 228463, "epoch": 1888} {"train_loss": -42.19904327392578, "global_step": 228464, "epoch": 1888} {"train_loss": -40.56187057495117, "global_step": 228465, "epoch": 1888} {"train_loss": -39.410884857177734, "global_step": 228466, "epoch": 1888} {"train_loss": -41.06325149536133, "global_step": 228467, "epoch": 1888} {"train_loss": -41.10260009765625, "global_step": 228468, "epoch": 1888} {"train_loss": -41.91964340209961, "global_step": 228469, "epoch": 1888} {"train_loss": -42.077884674072266, "global_step": 228470, "epoch": 1888} {"train_loss": -41.8484001159668, "global_step": 228471, "epoch": 1888} {"train_loss": -41.84818649291992, "global_step": 228472, "epoch": 1888} {"train_loss": -42.01106643676758, "global_step": 228473, "epoch": 1888} {"train_loss": -42.185001373291016, "global_step": 228474, "epoch": 1888} {"train_loss": -41.82350158691406, "global_step": 228475, "epoch": 1888} {"train_loss": -42.35602569580078, "global_step": 228476, "epoch": 1888} {"train_loss": -41.79751205444336, "global_step": 228477, "epoch": 1888} {"train_loss": -40.72050857543945, "global_step": 228478, "epoch": 1888} {"train_loss": -42.4768180847168, "global_step": 228479, "epoch": 1888} {"train_loss": -40.51125717163086, "global_step": 228480, "epoch": 1888} {"train_loss": -41.7730712890625, "global_step": 228481, "epoch": 1888} {"train_loss": -40.10098648071289, "global_step": 228482, "epoch": 1888} {"train_loss": -42.08496856689453, "global_step": 228483, "epoch": 1888} {"train_loss": -41.82371139526367, "global_step": 228484, "epoch": 1888} {"train_loss": -41.841468811035156, "global_step": 228485, "epoch": 1888} {"train_loss": -41.406097412109375, "global_step": 228486, "epoch": 1888} {"train_loss": -41.24282455444336, "global_step": 228487, "epoch": 1888} {"train_loss": -42.71290969848633, "global_step": 228488, "epoch": 1888} {"train_loss": -42.67755126953125, "global_step": 228489, "epoch": 1888} {"train_loss": -42.201908111572266, "global_step": 228490, "epoch": 1888} {"train_loss": -42.28994369506836, "global_step": 228491, "epoch": 1888} {"train_loss": -40.52322769165039, "global_step": 228492, "epoch": 1888} {"train_loss": -41.82731246948242, "global_step": 228493, "epoch": 1888} {"train_loss": -42.867244720458984, "global_step": 228494, "epoch": 1888} {"train_loss": -43.00870895385742, "global_step": 228495, "epoch": 1888} {"train_loss": -41.553802490234375, "global_step": 228496, "epoch": 1888} {"train_loss": -42.826473236083984, "global_step": 228497, "epoch": 1888} {"train_loss": -42.6975212097168, "global_step": 228498, "epoch": 1888} {"train_loss": -39.91126251220703, "global_step": 228499, "epoch": 1888} {"train_loss": -42.534908294677734, "global_step": 228500, "epoch": 1888} {"train_loss": -42.57526779174805, "global_step": 228501, "epoch": 1888} {"train_loss": -42.51668930053711, "global_step": 228502, "epoch": 1888} {"train_loss": -38.636024475097656, "global_step": 228503, "epoch": 1888} {"train_loss": -41.92054748535156, "global_step": 228504, "epoch": 1888} {"train_loss": -42.58675765991211, "global_step": 228505, "epoch": 1888} {"train_loss": -42.830726623535156, "global_step": 228506, "epoch": 1888} {"train_loss": -43.116973876953125, "global_step": 228507, "epoch": 1888} {"train_loss": -42.56455612182617, "global_step": 228508, "epoch": 1888} {"train_loss": -41.89227294921875, "global_step": 228509, "epoch": 1888} {"train_loss": -42.132747650146484, "global_step": 228510, "epoch": 1888} {"train_loss": -42.81189727783203, "global_step": 228511, "epoch": 1888} {"train_loss": -41.25849533081055, "global_step": 228512, "epoch": 1888} {"train_loss": -40.877479553222656, "global_step": 228513, "epoch": 1888} {"train_loss": -41.576416015625, "global_step": 228514, "epoch": 1888} {"train_loss": -42.03426742553711, "global_step": 228515, "epoch": 1888} {"train_loss": -42.82683181762695, "global_step": 228516, "epoch": 1888} {"train_loss": -33.6890754699707, "global_step": 228517, "epoch": 1888} {"train_loss": -41.33738327026367, "global_step": 228518, "epoch": 1888} {"train_loss": -35.1429557800293, "global_step": 228519, "epoch": 1888} {"train_loss": -41.202980041503906, "global_step": 228520, "epoch": 1888} {"train_loss": -41.98549270629883, "global_step": 228521, "epoch": 1888} {"train_loss": -41.78695297241211, "global_step": 228522, "epoch": 1888} {"train_loss": -41.357295989990234, "global_step": 228523, "epoch": 1888} {"train_loss": -41.75698471069336, "global_step": 228524, "epoch": 1888} {"train_loss": -35.959896087646484, "global_step": 228525, "epoch": 1888} {"train_loss": -41.69172668457031, "global_step": 228526, "epoch": 1888} {"train_loss": -42.030025482177734, "global_step": 228527, "epoch": 1888} {"train_loss": -40.82073974609375, "global_step": 228528, "epoch": 1888} {"train_loss": -40.73390579223633, "global_step": 228529, "epoch": 1888} {"train_loss": -40.67458724975586, "global_step": 228530, "epoch": 1888} {"train_loss": -41.3118782043457, "global_step": 228531, "epoch": 1888} {"train_loss": -41.38685607910156, "global_step": 228532, "epoch": 1888} {"train_loss": -41.83245849609375, "global_step": 228533, "epoch": 1888} {"train_loss": -41.32011032104492, "global_step": 228534, "epoch": 1888} {"train_loss": -41.44602584838867, "global_step": 228535, "epoch": 1888} {"train_loss": -42.032283782958984, "global_step": 228536, "epoch": 1888} {"train_loss": -40.367191314697266, "global_step": 228537, "epoch": 1888} {"train_loss": -40.2510871887207, "global_step": 228538, "epoch": 1888} {"train_loss": -41.90040969848633, "global_step": 228539, "epoch": 1888} {"train_loss": -40.62046813964844, "global_step": 228540, "epoch": 1888} {"train_loss": -41.00434112548828, "global_step": 228541, "epoch": 1888} {"train_loss": -34.94989776611328, "global_step": 228542, "epoch": 1888} {"train_loss": -40.4992790222168, "global_step": 228543, "epoch": 1888} {"train_loss": -40.40798568725586, "global_step": 228544, "epoch": 1888} {"train_loss": -42.156314849853516, "global_step": 228545, "epoch": 1888} {"train_loss": -40.64536666870117, "global_step": 228546, "epoch": 1888} {"train_loss": -39.72187423706055, "global_step": 228547, "epoch": 1888} {"train_loss": -41.4868278503418, "global_step": 228548, "epoch": 1888} {"train_loss": -42.156612396240234, "global_step": 228549, "epoch": 1888} {"train_loss": -40.217498779296875, "global_step": 228550, "epoch": 1888} {"train_loss": -42.14132308959961, "global_step": 228551, "epoch": 1888} {"train_loss": -41.53193283081055, "global_step": 228552, "epoch": 1888} {"train_loss": -41.449520111083984, "global_step": 228553, "epoch": 1888} {"train_loss": -41.065494537353516, "global_step": 228554, "epoch": 1888} {"train_loss": -41.716304779052734, "global_step": 228555, "epoch": 1888} {"train_loss": -41.390220642089844, "global_step": 228556, "epoch": 1888} {"train_loss": -40.731937408447266, "global_step": 228557, "epoch": 1888} {"train_loss": -37.214141845703125, "global_step": 228558, "epoch": 1888} {"train_loss": -41.063907623291016, "global_step": 228559, "epoch": 1888} {"train_loss": -40.602760314941406, "global_step": 228560, "epoch": 1888} {"train_loss": -39.323883056640625, "global_step": 228561, "epoch": 1888} {"train_loss": -39.85163497924805, "global_step": 228562, "epoch": 1888} {"train_loss": -41.62025451660156, "global_step": 228563, "epoch": 1888} {"train_loss": -39.77722930908203, "global_step": 228564, "epoch": 1888} {"train_loss": -39.41004943847656, "global_step": 228565, "epoch": 1888} {"train_loss": -39.168148040771484, "global_step": 228566, "epoch": 1888} {"train_loss": -39.263240814208984, "global_step": 228567, "epoch": 1888} {"train_loss": -41.11159509075575, "global_step": 228568, "epoch": 1888, "val_loss": 2685637.0} {"train_loss": -39.593505859375, "global_step": 228569, "epoch": 1889} {"train_loss": -40.81559371948242, "global_step": 228570, "epoch": 1889} {"train_loss": -42.083961486816406, "global_step": 228571, "epoch": 1889} {"train_loss": -39.03972244262695, "global_step": 228572, "epoch": 1889} {"train_loss": -40.93701934814453, "global_step": 228573, "epoch": 1889} {"train_loss": -41.383880615234375, "global_step": 228574, "epoch": 1889} {"train_loss": -42.382022857666016, "global_step": 228575, "epoch": 1889} {"train_loss": -41.91993713378906, "global_step": 228576, "epoch": 1889} {"train_loss": -41.84331512451172, "global_step": 228577, "epoch": 1889} {"train_loss": -37.371158599853516, "global_step": 228578, "epoch": 1889} {"train_loss": -41.69865036010742, "global_step": 228579, "epoch": 1889} {"train_loss": -41.697566986083984, "global_step": 228580, "epoch": 1889} {"train_loss": -38.39653778076172, "global_step": 228581, "epoch": 1889} {"train_loss": -42.000526428222656, "global_step": 228582, "epoch": 1889} {"train_loss": -39.02997970581055, "global_step": 228583, "epoch": 1889} {"train_loss": -40.01183319091797, "global_step": 228584, "epoch": 1889} {"train_loss": -41.418365478515625, "global_step": 228585, "epoch": 1889} {"train_loss": -41.121334075927734, "global_step": 228586, "epoch": 1889} {"train_loss": -42.130470275878906, "global_step": 228587, "epoch": 1889} {"train_loss": -42.07536697387695, "global_step": 228588, "epoch": 1889} {"train_loss": -40.38945007324219, "global_step": 228589, "epoch": 1889} {"train_loss": -40.99872970581055, "global_step": 228590, "epoch": 1889} {"train_loss": -41.43548583984375, "global_step": 228591, "epoch": 1889} {"train_loss": -41.840206146240234, "global_step": 228592, "epoch": 1889} {"train_loss": -42.14942169189453, "global_step": 228593, "epoch": 1889} {"train_loss": -42.08652877807617, "global_step": 228594, "epoch": 1889} {"train_loss": -41.822540283203125, "global_step": 228595, "epoch": 1889} {"train_loss": -40.74345779418945, "global_step": 228596, "epoch": 1889} {"train_loss": -40.775634765625, "global_step": 228597, "epoch": 1889} {"train_loss": -40.8092155456543, "global_step": 228598, "epoch": 1889} {"train_loss": -42.16346740722656, "global_step": 228599, "epoch": 1889} {"train_loss": -42.27570724487305, "global_step": 228600, "epoch": 1889} {"train_loss": -41.75535202026367, "global_step": 228601, "epoch": 1889} {"train_loss": -41.9202995300293, "global_step": 228602, "epoch": 1889} {"train_loss": -41.544471740722656, "global_step": 228603, "epoch": 1889} {"train_loss": -41.89323425292969, "global_step": 228604, "epoch": 1889} {"train_loss": -42.00761795043945, "global_step": 228605, "epoch": 1889} {"train_loss": -40.98960876464844, "global_step": 228606, "epoch": 1889} {"train_loss": -42.22300720214844, "global_step": 228607, "epoch": 1889} {"train_loss": -41.25105667114258, "global_step": 228608, "epoch": 1889} {"train_loss": -40.90449142456055, "global_step": 228609, "epoch": 1889} {"train_loss": -40.887725830078125, "global_step": 228610, "epoch": 1889} {"train_loss": -40.972877502441406, "global_step": 228611, "epoch": 1889} {"train_loss": -41.913333892822266, "global_step": 228612, "epoch": 1889} {"train_loss": -42.31917190551758, "global_step": 228613, "epoch": 1889} {"train_loss": -40.07685470581055, "global_step": 228614, "epoch": 1889} {"train_loss": -40.93135452270508, "global_step": 228615, "epoch": 1889} {"train_loss": -41.86396408081055, "global_step": 228616, "epoch": 1889} {"train_loss": -40.10860824584961, "global_step": 228617, "epoch": 1889} {"train_loss": -40.613037109375, "global_step": 228618, "epoch": 1889} {"train_loss": -40.724544525146484, "global_step": 228619, "epoch": 1889} {"train_loss": -42.20331573486328, "global_step": 228620, "epoch": 1889} {"train_loss": -41.17849349975586, "global_step": 228621, "epoch": 1889} {"train_loss": -39.73584747314453, "global_step": 228622, "epoch": 1889} {"train_loss": -40.95276641845703, "global_step": 228623, "epoch": 1889} {"train_loss": -42.26814651489258, "global_step": 228624, "epoch": 1889} {"train_loss": -39.50425338745117, "global_step": 228625, "epoch": 1889} {"train_loss": -39.44118118286133, "global_step": 228626, "epoch": 1889} {"train_loss": -40.29156494140625, "global_step": 228627, "epoch": 1889} {"train_loss": -41.720054626464844, "global_step": 228628, "epoch": 1889} {"train_loss": -38.56986618041992, "global_step": 228629, "epoch": 1889} {"train_loss": -38.867305755615234, "global_step": 228630, "epoch": 1889} {"train_loss": -42.13070297241211, "global_step": 228631, "epoch": 1889} {"train_loss": -41.04706573486328, "global_step": 228632, "epoch": 1889} {"train_loss": -41.62224197387695, "global_step": 228633, "epoch": 1889} {"train_loss": -42.00384521484375, "global_step": 228634, "epoch": 1889} {"train_loss": -42.139503479003906, "global_step": 228635, "epoch": 1889} {"train_loss": -39.92641067504883, "global_step": 228636, "epoch": 1889} {"train_loss": -41.448463439941406, "global_step": 228637, "epoch": 1889} {"train_loss": -41.696380615234375, "global_step": 228638, "epoch": 1889} {"train_loss": -42.51198196411133, "global_step": 228639, "epoch": 1889} {"train_loss": -41.72265625, "global_step": 228640, "epoch": 1889} {"train_loss": -41.831878662109375, "global_step": 228641, "epoch": 1889} {"train_loss": -41.788944244384766, "global_step": 228642, "epoch": 1889} {"train_loss": -41.86983871459961, "global_step": 228643, "epoch": 1889} {"train_loss": -42.23414611816406, "global_step": 228644, "epoch": 1889} {"train_loss": -41.24211502075195, "global_step": 228645, "epoch": 1889} {"train_loss": -40.96119689941406, "global_step": 228646, "epoch": 1889} {"train_loss": -41.67744445800781, "global_step": 228647, "epoch": 1889} {"train_loss": -41.34939193725586, "global_step": 228648, "epoch": 1889} {"train_loss": -41.52854919433594, "global_step": 228649, "epoch": 1889} {"train_loss": -41.34287643432617, "global_step": 228650, "epoch": 1889} {"train_loss": -41.67692184448242, "global_step": 228651, "epoch": 1889} {"train_loss": -42.22062301635742, "global_step": 228652, "epoch": 1889} {"train_loss": -41.87653350830078, "global_step": 228653, "epoch": 1889} {"train_loss": -41.989967346191406, "global_step": 228654, "epoch": 1889} {"train_loss": -42.25665283203125, "global_step": 228655, "epoch": 1889} {"train_loss": -42.05283737182617, "global_step": 228656, "epoch": 1889} {"train_loss": -42.0267448425293, "global_step": 228657, "epoch": 1889} {"train_loss": -42.67869567871094, "global_step": 228658, "epoch": 1889} {"train_loss": -41.695682525634766, "global_step": 228659, "epoch": 1889} {"train_loss": -41.00638961791992, "global_step": 228660, "epoch": 1889} {"train_loss": -42.117958068847656, "global_step": 228661, "epoch": 1889} {"train_loss": -41.56982421875, "global_step": 228662, "epoch": 1889} {"train_loss": -41.574371337890625, "global_step": 228663, "epoch": 1889} {"train_loss": -41.100624084472656, "global_step": 228664, "epoch": 1889} {"train_loss": -41.34914779663086, "global_step": 228665, "epoch": 1889} {"train_loss": -42.0494499206543, "global_step": 228666, "epoch": 1889} {"train_loss": -42.125213623046875, "global_step": 228667, "epoch": 1889} {"train_loss": -42.3614616394043, "global_step": 228668, "epoch": 1889} {"train_loss": -41.93701934814453, "global_step": 228669, "epoch": 1889} {"train_loss": -40.86566162109375, "global_step": 228670, "epoch": 1889} {"train_loss": -39.3106689453125, "global_step": 228671, "epoch": 1889} {"train_loss": -41.99380111694336, "global_step": 228672, "epoch": 1889} {"train_loss": -40.509796142578125, "global_step": 228673, "epoch": 1889} {"train_loss": -41.565731048583984, "global_step": 228674, "epoch": 1889} {"train_loss": -40.1987419128418, "global_step": 228675, "epoch": 1889} {"train_loss": -41.23320388793945, "global_step": 228676, "epoch": 1889} {"train_loss": -41.39337158203125, "global_step": 228677, "epoch": 1889} {"train_loss": -41.6077880859375, "global_step": 228678, "epoch": 1889} {"train_loss": -41.890625, "global_step": 228679, "epoch": 1889} {"train_loss": -40.91062545776367, "global_step": 228680, "epoch": 1889} {"train_loss": -41.2983283996582, "global_step": 228681, "epoch": 1889} {"train_loss": -41.42177200317383, "global_step": 228682, "epoch": 1889} {"train_loss": -41.771087646484375, "global_step": 228683, "epoch": 1889} {"train_loss": -42.290435791015625, "global_step": 228684, "epoch": 1889} {"train_loss": -41.49302291870117, "global_step": 228685, "epoch": 1889} {"train_loss": -42.29549789428711, "global_step": 228686, "epoch": 1889} {"train_loss": -41.71780014038086, "global_step": 228687, "epoch": 1889} {"train_loss": -41.690677642822266, "global_step": 228688, "epoch": 1889} {"train_loss": -41.317489056547814, "global_step": 228689, "epoch": 1889, "val_loss": 2516502.25} {"train_loss": -42.3801383972168, "global_step": 228690, "epoch": 1890} {"train_loss": -42.323150634765625, "global_step": 228691, "epoch": 1890} {"train_loss": -41.4198112487793, "global_step": 228692, "epoch": 1890} {"train_loss": -41.93058776855469, "global_step": 228693, "epoch": 1890} {"train_loss": -42.1126708984375, "global_step": 228694, "epoch": 1890} {"train_loss": -40.733787536621094, "global_step": 228695, "epoch": 1890} {"train_loss": -42.09657669067383, "global_step": 228696, "epoch": 1890} {"train_loss": -42.071285247802734, "global_step": 228697, "epoch": 1890} {"train_loss": -42.28773498535156, "global_step": 228698, "epoch": 1890} {"train_loss": -42.51631164550781, "global_step": 228699, "epoch": 1890} {"train_loss": -41.22877883911133, "global_step": 228700, "epoch": 1890} {"train_loss": -41.41123962402344, "global_step": 228701, "epoch": 1890} {"train_loss": -42.09035873413086, "global_step": 228702, "epoch": 1890} {"train_loss": -42.07716369628906, "global_step": 228703, "epoch": 1890} {"train_loss": -41.62771224975586, "global_step": 228704, "epoch": 1890} {"train_loss": -42.11532974243164, "global_step": 228705, "epoch": 1890} {"train_loss": -42.53375244140625, "global_step": 228706, "epoch": 1890} {"train_loss": -42.823638916015625, "global_step": 228707, "epoch": 1890} {"train_loss": -42.34196853637695, "global_step": 228708, "epoch": 1890} {"train_loss": -42.4239501953125, "global_step": 228709, "epoch": 1890} {"train_loss": -43.2821159362793, "global_step": 228710, "epoch": 1890} {"train_loss": -41.55193328857422, "global_step": 228711, "epoch": 1890} {"train_loss": -42.39480972290039, "global_step": 228712, "epoch": 1890} {"train_loss": -42.36138916015625, "global_step": 228713, "epoch": 1890} {"train_loss": -43.31549835205078, "global_step": 228714, "epoch": 1890} {"train_loss": -42.492828369140625, "global_step": 228715, "epoch": 1890} {"train_loss": -42.7665901184082, "global_step": 228716, "epoch": 1890} {"train_loss": -42.3248291015625, "global_step": 228717, "epoch": 1890} {"train_loss": -41.566078186035156, "global_step": 228718, "epoch": 1890} {"train_loss": -41.11377716064453, "global_step": 228719, "epoch": 1890} {"train_loss": -41.77785873413086, "global_step": 228720, "epoch": 1890} {"train_loss": -42.86782455444336, "global_step": 228721, "epoch": 1890} {"train_loss": -41.360164642333984, "global_step": 228722, "epoch": 1890} {"train_loss": -37.98676300048828, "global_step": 228723, "epoch": 1890} {"train_loss": -38.934322357177734, "global_step": 228724, "epoch": 1890} {"train_loss": -41.47941970825195, "global_step": 228725, "epoch": 1890} {"train_loss": -40.67363357543945, "global_step": 228726, "epoch": 1890} {"train_loss": -38.77711486816406, "global_step": 228727, "epoch": 1890} {"train_loss": -41.28373336791992, "global_step": 228728, "epoch": 1890} {"train_loss": -42.09951400756836, "global_step": 228729, "epoch": 1890} {"train_loss": -40.683834075927734, "global_step": 228730, "epoch": 1890} {"train_loss": -40.68233871459961, "global_step": 228731, "epoch": 1890} {"train_loss": -36.936866760253906, "global_step": 228732, "epoch": 1890} {"train_loss": -39.307167053222656, "global_step": 228733, "epoch": 1890} {"train_loss": -41.075279235839844, "global_step": 228734, "epoch": 1890} {"train_loss": -41.207275390625, "global_step": 228735, "epoch": 1890} {"train_loss": -38.635162353515625, "global_step": 228736, "epoch": 1890} {"train_loss": -39.0463981628418, "global_step": 228737, "epoch": 1890} {"train_loss": -41.88485336303711, "global_step": 228738, "epoch": 1890} {"train_loss": -38.32392120361328, "global_step": 228739, "epoch": 1890} {"train_loss": -32.41847610473633, "global_step": 228740, "epoch": 1890} {"train_loss": -39.6701545715332, "global_step": 228741, "epoch": 1890} {"train_loss": -39.48580551147461, "global_step": 228742, "epoch": 1890} {"train_loss": -32.12186050415039, "global_step": 228743, "epoch": 1890} {"train_loss": -40.58007049560547, "global_step": 228744, "epoch": 1890} {"train_loss": -36.99019241333008, "global_step": 228745, "epoch": 1890} {"train_loss": -37.33032989501953, "global_step": 228746, "epoch": 1890} {"train_loss": -40.42325973510742, "global_step": 228747, "epoch": 1890} {"train_loss": -37.10054016113281, "global_step": 228748, "epoch": 1890} {"train_loss": -39.980857849121094, "global_step": 228749, "epoch": 1890} {"train_loss": -39.8928108215332, "global_step": 228750, "epoch": 1890} {"train_loss": -40.59831619262695, "global_step": 228751, "epoch": 1890} {"train_loss": -40.63662338256836, "global_step": 228752, "epoch": 1890} {"train_loss": -40.59507369995117, "global_step": 228753, "epoch": 1890} {"train_loss": -40.5202751159668, "global_step": 228754, "epoch": 1890} {"train_loss": -40.477596282958984, "global_step": 228755, "epoch": 1890} {"train_loss": -41.27439498901367, "global_step": 228756, "epoch": 1890} {"train_loss": -40.08169174194336, "global_step": 228757, "epoch": 1890} {"train_loss": -41.51638412475586, "global_step": 228758, "epoch": 1890} {"train_loss": -40.56025314331055, "global_step": 228759, "epoch": 1890} {"train_loss": -40.840423583984375, "global_step": 228760, "epoch": 1890} {"train_loss": -40.841835021972656, "global_step": 228761, "epoch": 1890} {"train_loss": -40.96394729614258, "global_step": 228762, "epoch": 1890} {"train_loss": -41.33089065551758, "global_step": 228763, "epoch": 1890} {"train_loss": -41.02817153930664, "global_step": 228764, "epoch": 1890} {"train_loss": -41.15952682495117, "global_step": 228765, "epoch": 1890} {"train_loss": -41.766632080078125, "global_step": 228766, "epoch": 1890} {"train_loss": -40.8481559753418, "global_step": 228767, "epoch": 1890} {"train_loss": -42.07670974731445, "global_step": 228768, "epoch": 1890} {"train_loss": -41.36955261230469, "global_step": 228769, "epoch": 1890} {"train_loss": -42.25741195678711, "global_step": 228770, "epoch": 1890} {"train_loss": -41.17377853393555, "global_step": 228771, "epoch": 1890} {"train_loss": -42.539894104003906, "global_step": 228772, "epoch": 1890} {"train_loss": -41.34603500366211, "global_step": 228773, "epoch": 1890} {"train_loss": -42.302207946777344, "global_step": 228774, "epoch": 1890} {"train_loss": -41.551090240478516, "global_step": 228775, "epoch": 1890} {"train_loss": -41.97624206542969, "global_step": 228776, "epoch": 1890} {"train_loss": -42.139190673828125, "global_step": 228777, "epoch": 1890} {"train_loss": -42.00162887573242, "global_step": 228778, "epoch": 1890} {"train_loss": -42.322505950927734, "global_step": 228779, "epoch": 1890} {"train_loss": -42.36957931518555, "global_step": 228780, "epoch": 1890} {"train_loss": -42.424068450927734, "global_step": 228781, "epoch": 1890} {"train_loss": -42.38738250732422, "global_step": 228782, "epoch": 1890} {"train_loss": -42.08203125, "global_step": 228783, "epoch": 1890} {"train_loss": -42.53156280517578, "global_step": 228784, "epoch": 1890} {"train_loss": -42.520572662353516, "global_step": 228785, "epoch": 1890} {"train_loss": -42.924888610839844, "global_step": 228786, "epoch": 1890} {"train_loss": -42.449581146240234, "global_step": 228787, "epoch": 1890} {"train_loss": -42.80410385131836, "global_step": 228788, "epoch": 1890} {"train_loss": -42.749427795410156, "global_step": 228789, "epoch": 1890} {"train_loss": -42.25220489501953, "global_step": 228790, "epoch": 1890} {"train_loss": -42.617835998535156, "global_step": 228791, "epoch": 1890} {"train_loss": -42.91304397583008, "global_step": 228792, "epoch": 1890} {"train_loss": -42.93247604370117, "global_step": 228793, "epoch": 1890} {"train_loss": -42.71734619140625, "global_step": 228794, "epoch": 1890} {"train_loss": -42.84151840209961, "global_step": 228795, "epoch": 1890} {"train_loss": -43.32278060913086, "global_step": 228796, "epoch": 1890} {"train_loss": -42.344703674316406, "global_step": 228797, "epoch": 1890} {"train_loss": -42.344337463378906, "global_step": 228798, "epoch": 1890} {"train_loss": -42.18400192260742, "global_step": 228799, "epoch": 1890} {"train_loss": -43.19649887084961, "global_step": 228800, "epoch": 1890} {"train_loss": -43.0434455871582, "global_step": 228801, "epoch": 1890} {"train_loss": -42.70897674560547, "global_step": 228802, "epoch": 1890} {"train_loss": -43.193817138671875, "global_step": 228803, "epoch": 1890} {"train_loss": -42.81095504760742, "global_step": 228804, "epoch": 1890} {"train_loss": -43.16365432739258, "global_step": 228805, "epoch": 1890} {"train_loss": -43.06689453125, "global_step": 228806, "epoch": 1890} {"train_loss": -43.02289962768555, "global_step": 228807, "epoch": 1890} {"train_loss": -42.89142990112305, "global_step": 228808, "epoch": 1890} {"train_loss": -42.46247482299805, "global_step": 228809, "epoch": 1890} {"train_loss": -41.37906854802912, "global_step": 228810, "epoch": 1890, "val_loss": 2554850.75} {"train_loss": -42.504150390625, "global_step": 228811, "epoch": 1891} {"train_loss": -42.993797302246094, "global_step": 228812, "epoch": 1891} {"train_loss": -42.589813232421875, "global_step": 228813, "epoch": 1891} {"train_loss": -43.10813522338867, "global_step": 228814, "epoch": 1891} {"train_loss": -43.28057861328125, "global_step": 228815, "epoch": 1891} {"train_loss": -43.396278381347656, "global_step": 228816, "epoch": 1891} {"train_loss": -42.51443099975586, "global_step": 228817, "epoch": 1891} {"train_loss": -43.29471206665039, "global_step": 228818, "epoch": 1891} {"train_loss": -42.62234115600586, "global_step": 228819, "epoch": 1891} {"train_loss": -42.4948844909668, "global_step": 228820, "epoch": 1891} {"train_loss": -43.18112564086914, "global_step": 228821, "epoch": 1891} {"train_loss": -42.352928161621094, "global_step": 228822, "epoch": 1891} {"train_loss": -43.09129333496094, "global_step": 228823, "epoch": 1891} {"train_loss": -42.837615966796875, "global_step": 228824, "epoch": 1891} {"train_loss": -43.08361053466797, "global_step": 228825, "epoch": 1891} {"train_loss": -42.92490768432617, "global_step": 228826, "epoch": 1891} {"train_loss": -42.53456497192383, "global_step": 228827, "epoch": 1891} {"train_loss": -41.935665130615234, "global_step": 228828, "epoch": 1891} {"train_loss": -41.36274337768555, "global_step": 228829, "epoch": 1891} {"train_loss": -41.587528228759766, "global_step": 228830, "epoch": 1891} {"train_loss": -42.379638671875, "global_step": 228831, "epoch": 1891} {"train_loss": -42.23368453979492, "global_step": 228832, "epoch": 1891} {"train_loss": -43.215335845947266, "global_step": 228833, "epoch": 1891} {"train_loss": -42.109283447265625, "global_step": 228834, "epoch": 1891} {"train_loss": -41.736270904541016, "global_step": 228835, "epoch": 1891} {"train_loss": -42.25942611694336, "global_step": 228836, "epoch": 1891} {"train_loss": -42.32623291015625, "global_step": 228837, "epoch": 1891} {"train_loss": -42.38994216918945, "global_step": 228838, "epoch": 1891} {"train_loss": -41.988399505615234, "global_step": 228839, "epoch": 1891} {"train_loss": -42.65061569213867, "global_step": 228840, "epoch": 1891} {"train_loss": -41.90022659301758, "global_step": 228841, "epoch": 1891} {"train_loss": -41.71158981323242, "global_step": 228842, "epoch": 1891} {"train_loss": -42.057586669921875, "global_step": 228843, "epoch": 1891} {"train_loss": -41.68509292602539, "global_step": 228844, "epoch": 1891} {"train_loss": -41.986793518066406, "global_step": 228845, "epoch": 1891} {"train_loss": -42.78001403808594, "global_step": 228846, "epoch": 1891} {"train_loss": -42.26191329956055, "global_step": 228847, "epoch": 1891} {"train_loss": -41.5039176940918, "global_step": 228848, "epoch": 1891} {"train_loss": -41.76157760620117, "global_step": 228849, "epoch": 1891} {"train_loss": -41.078731536865234, "global_step": 228850, "epoch": 1891} {"train_loss": -41.83552932739258, "global_step": 228851, "epoch": 1891} {"train_loss": -42.84135437011719, "global_step": 228852, "epoch": 1891} {"train_loss": -42.053070068359375, "global_step": 228853, "epoch": 1891} {"train_loss": -41.18935012817383, "global_step": 228854, "epoch": 1891} {"train_loss": -42.40290451049805, "global_step": 228855, "epoch": 1891} {"train_loss": -41.93045425415039, "global_step": 228856, "epoch": 1891} {"train_loss": -42.50837326049805, "global_step": 228857, "epoch": 1891} {"train_loss": -42.32508087158203, "global_step": 228858, "epoch": 1891} {"train_loss": -41.78818893432617, "global_step": 228859, "epoch": 1891} {"train_loss": -41.28150939941406, "global_step": 228860, "epoch": 1891} {"train_loss": -41.54698944091797, "global_step": 228861, "epoch": 1891} {"train_loss": -42.18880844116211, "global_step": 228862, "epoch": 1891} {"train_loss": -41.202613830566406, "global_step": 228863, "epoch": 1891} {"train_loss": -41.09136962890625, "global_step": 228864, "epoch": 1891} {"train_loss": -42.050968170166016, "global_step": 228865, "epoch": 1891} {"train_loss": -42.300289154052734, "global_step": 228866, "epoch": 1891} {"train_loss": -42.392940521240234, "global_step": 228867, "epoch": 1891} {"train_loss": -41.81958770751953, "global_step": 228868, "epoch": 1891} {"train_loss": -40.87260437011719, "global_step": 228869, "epoch": 1891} {"train_loss": -41.6317253112793, "global_step": 228870, "epoch": 1891} {"train_loss": -41.155487060546875, "global_step": 228871, "epoch": 1891} {"train_loss": -42.319976806640625, "global_step": 228872, "epoch": 1891} {"train_loss": -41.475074768066406, "global_step": 228873, "epoch": 1891} {"train_loss": -40.87097930908203, "global_step": 228874, "epoch": 1891} {"train_loss": -41.75576400756836, "global_step": 228875, "epoch": 1891} {"train_loss": -41.536808013916016, "global_step": 228876, "epoch": 1891} {"train_loss": -40.789039611816406, "global_step": 228877, "epoch": 1891} {"train_loss": -39.65058517456055, "global_step": 228878, "epoch": 1891} {"train_loss": -40.96718215942383, "global_step": 228879, "epoch": 1891} {"train_loss": -41.28731155395508, "global_step": 228880, "epoch": 1891} {"train_loss": -40.77985763549805, "global_step": 228881, "epoch": 1891} {"train_loss": -42.01459884643555, "global_step": 228882, "epoch": 1891} {"train_loss": -41.908016204833984, "global_step": 228883, "epoch": 1891} {"train_loss": -41.96792221069336, "global_step": 228884, "epoch": 1891} {"train_loss": -41.6469841003418, "global_step": 228885, "epoch": 1891} {"train_loss": -41.53514099121094, "global_step": 228886, "epoch": 1891} {"train_loss": -41.63459014892578, "global_step": 228887, "epoch": 1891} {"train_loss": -42.81529235839844, "global_step": 228888, "epoch": 1891} {"train_loss": -41.02790069580078, "global_step": 228889, "epoch": 1891} {"train_loss": -41.230831146240234, "global_step": 228890, "epoch": 1891} {"train_loss": -42.690425872802734, "global_step": 228891, "epoch": 1891} {"train_loss": -41.23153305053711, "global_step": 228892, "epoch": 1891} {"train_loss": -41.04084014892578, "global_step": 228893, "epoch": 1891} {"train_loss": -42.49503707885742, "global_step": 228894, "epoch": 1891} {"train_loss": -41.712703704833984, "global_step": 228895, "epoch": 1891} {"train_loss": -40.598079681396484, "global_step": 228896, "epoch": 1891} {"train_loss": -42.24506759643555, "global_step": 228897, "epoch": 1891} {"train_loss": -42.63165283203125, "global_step": 228898, "epoch": 1891} {"train_loss": -41.36149215698242, "global_step": 228899, "epoch": 1891} {"train_loss": -41.9259147644043, "global_step": 228900, "epoch": 1891} {"train_loss": -41.297462463378906, "global_step": 228901, "epoch": 1891} {"train_loss": -41.00453567504883, "global_step": 228902, "epoch": 1891} {"train_loss": -43.026912689208984, "global_step": 228903, "epoch": 1891} {"train_loss": -41.311744689941406, "global_step": 228904, "epoch": 1891} {"train_loss": -41.505855560302734, "global_step": 228905, "epoch": 1891} {"train_loss": -42.58285903930664, "global_step": 228906, "epoch": 1891} {"train_loss": -41.96473693847656, "global_step": 228907, "epoch": 1891} {"train_loss": -41.94791793823242, "global_step": 228908, "epoch": 1891} {"train_loss": -42.4222412109375, "global_step": 228909, "epoch": 1891} {"train_loss": -42.60917663574219, "global_step": 228910, "epoch": 1891} {"train_loss": -42.86956787109375, "global_step": 228911, "epoch": 1891} {"train_loss": -41.6162223815918, "global_step": 228912, "epoch": 1891} {"train_loss": -42.5046272277832, "global_step": 228913, "epoch": 1891} {"train_loss": -42.419490814208984, "global_step": 228914, "epoch": 1891} {"train_loss": -41.885345458984375, "global_step": 228915, "epoch": 1891} {"train_loss": -42.128170013427734, "global_step": 228916, "epoch": 1891} {"train_loss": -42.56673812866211, "global_step": 228917, "epoch": 1891} {"train_loss": -42.65752029418945, "global_step": 228918, "epoch": 1891} {"train_loss": -42.303436279296875, "global_step": 228919, "epoch": 1891} {"train_loss": -42.51655578613281, "global_step": 228920, "epoch": 1891} {"train_loss": -43.28187942504883, "global_step": 228921, "epoch": 1891} {"train_loss": -42.81010818481445, "global_step": 228922, "epoch": 1891} {"train_loss": -42.865135192871094, "global_step": 228923, "epoch": 1891} {"train_loss": -42.131710052490234, "global_step": 228924, "epoch": 1891} {"train_loss": -42.544349670410156, "global_step": 228925, "epoch": 1891} {"train_loss": -42.87700653076172, "global_step": 228926, "epoch": 1891} {"train_loss": -42.656288146972656, "global_step": 228927, "epoch": 1891} {"train_loss": -42.57705307006836, "global_step": 228928, "epoch": 1891} {"train_loss": -43.18156051635742, "global_step": 228929, "epoch": 1891} {"train_loss": -43.029640197753906, "global_step": 228930, "epoch": 1891} {"train_loss": -42.095247158334274, "global_step": 228931, "epoch": 1891, "val_loss": 2552235.25} {"train_loss": -42.83871078491211, "global_step": 228932, "epoch": 1892} {"train_loss": -42.816280364990234, "global_step": 228933, "epoch": 1892} {"train_loss": -43.27080154418945, "global_step": 228934, "epoch": 1892} {"train_loss": -42.47631072998047, "global_step": 228935, "epoch": 1892} {"train_loss": -42.49232864379883, "global_step": 228936, "epoch": 1892} {"train_loss": -42.78667068481445, "global_step": 228937, "epoch": 1892} {"train_loss": -43.23764419555664, "global_step": 228938, "epoch": 1892} {"train_loss": -42.72694396972656, "global_step": 228939, "epoch": 1892} {"train_loss": -43.320045471191406, "global_step": 228940, "epoch": 1892} {"train_loss": -42.44147872924805, "global_step": 228941, "epoch": 1892} {"train_loss": -41.86065673828125, "global_step": 228942, "epoch": 1892} {"train_loss": -41.16889953613281, "global_step": 228943, "epoch": 1892} {"train_loss": -42.970252990722656, "global_step": 228944, "epoch": 1892} {"train_loss": -42.86274337768555, "global_step": 228945, "epoch": 1892} {"train_loss": -41.34280014038086, "global_step": 228946, "epoch": 1892} {"train_loss": -41.962127685546875, "global_step": 228947, "epoch": 1892} {"train_loss": -42.2235107421875, "global_step": 228948, "epoch": 1892} {"train_loss": -43.06847381591797, "global_step": 228949, "epoch": 1892} {"train_loss": -41.450660705566406, "global_step": 228950, "epoch": 1892} {"train_loss": -38.71338653564453, "global_step": 228951, "epoch": 1892} {"train_loss": -37.10187911987305, "global_step": 228952, "epoch": 1892} {"train_loss": -41.10041809082031, "global_step": 228953, "epoch": 1892} {"train_loss": -40.88917541503906, "global_step": 228954, "epoch": 1892} {"train_loss": -41.16482162475586, "global_step": 228955, "epoch": 1892} {"train_loss": -39.95994186401367, "global_step": 228956, "epoch": 1892} {"train_loss": -36.21345138549805, "global_step": 228957, "epoch": 1892} {"train_loss": -40.98782730102539, "global_step": 228958, "epoch": 1892} {"train_loss": -39.98344039916992, "global_step": 228959, "epoch": 1892} {"train_loss": -39.667762756347656, "global_step": 228960, "epoch": 1892} {"train_loss": -40.605289459228516, "global_step": 228961, "epoch": 1892} {"train_loss": -40.73259735107422, "global_step": 228962, "epoch": 1892} {"train_loss": -40.902801513671875, "global_step": 228963, "epoch": 1892} {"train_loss": -42.28896713256836, "global_step": 228964, "epoch": 1892} {"train_loss": -41.04087448120117, "global_step": 228965, "epoch": 1892} {"train_loss": -41.150386810302734, "global_step": 228966, "epoch": 1892} {"train_loss": -41.987789154052734, "global_step": 228967, "epoch": 1892} {"train_loss": -41.78944778442383, "global_step": 228968, "epoch": 1892} {"train_loss": -42.08323287963867, "global_step": 228969, "epoch": 1892} {"train_loss": -41.568092346191406, "global_step": 228970, "epoch": 1892} {"train_loss": -42.4452018737793, "global_step": 228971, "epoch": 1892} {"train_loss": -39.14498519897461, "global_step": 228972, "epoch": 1892} {"train_loss": -42.43758773803711, "global_step": 228973, "epoch": 1892} {"train_loss": -41.38916778564453, "global_step": 228974, "epoch": 1892} {"train_loss": -42.27106857299805, "global_step": 228975, "epoch": 1892} {"train_loss": -41.09856033325195, "global_step": 228976, "epoch": 1892} {"train_loss": -41.4048957824707, "global_step": 228977, "epoch": 1892} {"train_loss": -42.25136947631836, "global_step": 228978, "epoch": 1892} {"train_loss": -42.36556625366211, "global_step": 228979, "epoch": 1892} {"train_loss": -38.12651443481445, "global_step": 228980, "epoch": 1892} {"train_loss": -41.39323806762695, "global_step": 228981, "epoch": 1892} {"train_loss": -41.05744171142578, "global_step": 228982, "epoch": 1892} {"train_loss": -40.270565032958984, "global_step": 228983, "epoch": 1892} {"train_loss": -40.333858489990234, "global_step": 228984, "epoch": 1892} {"train_loss": -41.353553771972656, "global_step": 228985, "epoch": 1892} {"train_loss": -41.36043930053711, "global_step": 228986, "epoch": 1892} {"train_loss": -41.242164611816406, "global_step": 228987, "epoch": 1892} {"train_loss": -40.6141357421875, "global_step": 228988, "epoch": 1892} {"train_loss": -40.12275314331055, "global_step": 228989, "epoch": 1892} {"train_loss": -40.67708206176758, "global_step": 228990, "epoch": 1892} {"train_loss": -40.7994499206543, "global_step": 228991, "epoch": 1892} {"train_loss": -39.96511459350586, "global_step": 228992, "epoch": 1892} {"train_loss": -39.27545166015625, "global_step": 228993, "epoch": 1892} {"train_loss": -37.082313537597656, "global_step": 228994, "epoch": 1892} {"train_loss": -39.819087982177734, "global_step": 228995, "epoch": 1892} {"train_loss": -41.19768142700195, "global_step": 228996, "epoch": 1892} {"train_loss": -38.616329193115234, "global_step": 228997, "epoch": 1892} {"train_loss": -39.494022369384766, "global_step": 228998, "epoch": 1892} {"train_loss": -40.31106185913086, "global_step": 228999, "epoch": 1892} {"train_loss": -38.9806022644043, "global_step": 229000, "epoch": 1892} {"train_loss": -39.34402084350586, "global_step": 229001, "epoch": 1892} {"train_loss": -39.76939392089844, "global_step": 229002, "epoch": 1892} {"train_loss": -40.84663009643555, "global_step": 229003, "epoch": 1892} {"train_loss": -38.02004623413086, "global_step": 229004, "epoch": 1892} {"train_loss": -39.0539665222168, "global_step": 229005, "epoch": 1892} {"train_loss": -39.263187408447266, "global_step": 229006, "epoch": 1892} {"train_loss": -36.967159271240234, "global_step": 229007, "epoch": 1892} {"train_loss": -36.60834884643555, "global_step": 229008, "epoch": 1892} {"train_loss": -39.299556732177734, "global_step": 229009, "epoch": 1892} {"train_loss": -38.26980209350586, "global_step": 229010, "epoch": 1892} {"train_loss": -40.45625305175781, "global_step": 229011, "epoch": 1892} {"train_loss": -36.568363189697266, "global_step": 229012, "epoch": 1892} {"train_loss": -38.72076416015625, "global_step": 229013, "epoch": 1892} {"train_loss": -40.631385803222656, "global_step": 229014, "epoch": 1892} {"train_loss": -38.81222152709961, "global_step": 229015, "epoch": 1892} {"train_loss": -39.723487854003906, "global_step": 229016, "epoch": 1892} {"train_loss": -31.228086471557617, "global_step": 229017, "epoch": 1892} {"train_loss": -36.42133331298828, "global_step": 229018, "epoch": 1892} {"train_loss": -32.45295333862305, "global_step": 229019, "epoch": 1892} {"train_loss": -39.73683547973633, "global_step": 229020, "epoch": 1892} {"train_loss": -39.23280715942383, "global_step": 229021, "epoch": 1892} {"train_loss": -34.994441986083984, "global_step": 229022, "epoch": 1892} {"train_loss": -32.93319320678711, "global_step": 229023, "epoch": 1892} {"train_loss": -27.37052345275879, "global_step": 229024, "epoch": 1892} {"train_loss": -37.078155517578125, "global_step": 229025, "epoch": 1892} {"train_loss": -36.213722229003906, "global_step": 229026, "epoch": 1892} {"train_loss": -29.565275192260742, "global_step": 229027, "epoch": 1892} {"train_loss": -38.66242218017578, "global_step": 229028, "epoch": 1892} {"train_loss": -34.14691925048828, "global_step": 229029, "epoch": 1892} {"train_loss": -36.9828987121582, "global_step": 229030, "epoch": 1892} {"train_loss": -38.49188232421875, "global_step": 229031, "epoch": 1892} {"train_loss": -36.93993377685547, "global_step": 229032, "epoch": 1892} {"train_loss": -33.747066497802734, "global_step": 229033, "epoch": 1892} {"train_loss": -35.92448806762695, "global_step": 229034, "epoch": 1892} {"train_loss": -36.438961029052734, "global_step": 229035, "epoch": 1892} {"train_loss": -33.68483352661133, "global_step": 229036, "epoch": 1892} {"train_loss": -34.6843376159668, "global_step": 229037, "epoch": 1892} {"train_loss": -33.63047409057617, "global_step": 229038, "epoch": 1892} {"train_loss": -39.7396354675293, "global_step": 229039, "epoch": 1892} {"train_loss": -35.949806213378906, "global_step": 229040, "epoch": 1892} {"train_loss": -35.81109619140625, "global_step": 229041, "epoch": 1892} {"train_loss": -38.86470413208008, "global_step": 229042, "epoch": 1892} {"train_loss": -36.33525848388672, "global_step": 229043, "epoch": 1892} {"train_loss": -35.35908126831055, "global_step": 229044, "epoch": 1892} {"train_loss": -38.47678756713867, "global_step": 229045, "epoch": 1892} {"train_loss": -38.31166458129883, "global_step": 229046, "epoch": 1892} {"train_loss": -38.69773483276367, "global_step": 229047, "epoch": 1892} {"train_loss": -35.171791076660156, "global_step": 229048, "epoch": 1892} {"train_loss": -37.31843185424805, "global_step": 229049, "epoch": 1892} {"train_loss": -38.91586685180664, "global_step": 229050, "epoch": 1892} {"train_loss": -38.04679870605469, "global_step": 229051, "epoch": 1892} {"train_loss": -39.28108610988649, "global_step": 229052, "epoch": 1892, "val_loss": 2563790.0} {"train_loss": -38.03371810913086, "global_step": 229053, "epoch": 1893} {"train_loss": -38.65594482421875, "global_step": 229054, "epoch": 1893} {"train_loss": -39.22405242919922, "global_step": 229055, "epoch": 1893} {"train_loss": -38.7895393371582, "global_step": 229056, "epoch": 1893} {"train_loss": -39.39353561401367, "global_step": 229057, "epoch": 1893} {"train_loss": -38.35908126831055, "global_step": 229058, "epoch": 1893} {"train_loss": -39.77037048339844, "global_step": 229059, "epoch": 1893} {"train_loss": -40.32612228393555, "global_step": 229060, "epoch": 1893} {"train_loss": -38.497493743896484, "global_step": 229061, "epoch": 1893} {"train_loss": -39.17945098876953, "global_step": 229062, "epoch": 1893} {"train_loss": -40.35873031616211, "global_step": 229063, "epoch": 1893} {"train_loss": -40.31146240234375, "global_step": 229064, "epoch": 1893} {"train_loss": -40.157588958740234, "global_step": 229065, "epoch": 1893} {"train_loss": -40.316070556640625, "global_step": 229066, "epoch": 1893} {"train_loss": -40.11197280883789, "global_step": 229067, "epoch": 1893} {"train_loss": -39.955196380615234, "global_step": 229068, "epoch": 1893} {"train_loss": -40.428279876708984, "global_step": 229069, "epoch": 1893} {"train_loss": -40.42864227294922, "global_step": 229070, "epoch": 1893} {"train_loss": -40.44062423706055, "global_step": 229071, "epoch": 1893} {"train_loss": -40.094661712646484, "global_step": 229072, "epoch": 1893} {"train_loss": -39.8067741394043, "global_step": 229073, "epoch": 1893} {"train_loss": -39.95130920410156, "global_step": 229074, "epoch": 1893} {"train_loss": -39.59396743774414, "global_step": 229075, "epoch": 1893} {"train_loss": -40.41352844238281, "global_step": 229076, "epoch": 1893} {"train_loss": -40.93574142456055, "global_step": 229077, "epoch": 1893} {"train_loss": -41.10956573486328, "global_step": 229078, "epoch": 1893} {"train_loss": -39.66290283203125, "global_step": 229079, "epoch": 1893} {"train_loss": -41.067386627197266, "global_step": 229080, "epoch": 1893} {"train_loss": -41.21908187866211, "global_step": 229081, "epoch": 1893} {"train_loss": -40.938812255859375, "global_step": 229082, "epoch": 1893} {"train_loss": -41.121002197265625, "global_step": 229083, "epoch": 1893} {"train_loss": -40.77485275268555, "global_step": 229084, "epoch": 1893} {"train_loss": -40.19790267944336, "global_step": 229085, "epoch": 1893} {"train_loss": -40.78725814819336, "global_step": 229086, "epoch": 1893} {"train_loss": -40.519107818603516, "global_step": 229087, "epoch": 1893} {"train_loss": -40.93083953857422, "global_step": 229088, "epoch": 1893} {"train_loss": -40.75489044189453, "global_step": 229089, "epoch": 1893} {"train_loss": -41.08468246459961, "global_step": 229090, "epoch": 1893} {"train_loss": -40.4130859375, "global_step": 229091, "epoch": 1893} {"train_loss": -39.94035720825195, "global_step": 229092, "epoch": 1893} {"train_loss": -41.66215896606445, "global_step": 229093, "epoch": 1893} {"train_loss": -41.057552337646484, "global_step": 229094, "epoch": 1893} {"train_loss": -40.837196350097656, "global_step": 229095, "epoch": 1893} {"train_loss": -41.49267578125, "global_step": 229096, "epoch": 1893} {"train_loss": -41.63783645629883, "global_step": 229097, "epoch": 1893} {"train_loss": -41.41931915283203, "global_step": 229098, "epoch": 1893} {"train_loss": -40.546199798583984, "global_step": 229099, "epoch": 1893} {"train_loss": -40.67189407348633, "global_step": 229100, "epoch": 1893} {"train_loss": -41.54611587524414, "global_step": 229101, "epoch": 1893} {"train_loss": -41.574798583984375, "global_step": 229102, "epoch": 1893} {"train_loss": -41.01913070678711, "global_step": 229103, "epoch": 1893} {"train_loss": -41.2231330871582, "global_step": 229104, "epoch": 1893} {"train_loss": -41.34239959716797, "global_step": 229105, "epoch": 1893} {"train_loss": -41.18536376953125, "global_step": 229106, "epoch": 1893} {"train_loss": -41.420745849609375, "global_step": 229107, "epoch": 1893} {"train_loss": -41.775550842285156, "global_step": 229108, "epoch": 1893} {"train_loss": -41.93160629272461, "global_step": 229109, "epoch": 1893} {"train_loss": -41.6894416809082, "global_step": 229110, "epoch": 1893} {"train_loss": -41.31229019165039, "global_step": 229111, "epoch": 1893} {"train_loss": -40.79717254638672, "global_step": 229112, "epoch": 1893} {"train_loss": -41.1555290222168, "global_step": 229113, "epoch": 1893} {"train_loss": -42.1735954284668, "global_step": 229114, "epoch": 1893} {"train_loss": -40.276180267333984, "global_step": 229115, "epoch": 1893} {"train_loss": -42.00104522705078, "global_step": 229116, "epoch": 1893} {"train_loss": -41.346405029296875, "global_step": 229117, "epoch": 1893} {"train_loss": -41.8237419128418, "global_step": 229118, "epoch": 1893} {"train_loss": -42.102718353271484, "global_step": 229119, "epoch": 1893} {"train_loss": -41.61662673950195, "global_step": 229120, "epoch": 1893} {"train_loss": -41.346256256103516, "global_step": 229121, "epoch": 1893} {"train_loss": -41.48161315917969, "global_step": 229122, "epoch": 1893} {"train_loss": -41.52299118041992, "global_step": 229123, "epoch": 1893} {"train_loss": -42.266841888427734, "global_step": 229124, "epoch": 1893} {"train_loss": -41.890079498291016, "global_step": 229125, "epoch": 1893} {"train_loss": -41.56776428222656, "global_step": 229126, "epoch": 1893} {"train_loss": -41.00237274169922, "global_step": 229127, "epoch": 1893} {"train_loss": -41.07976150512695, "global_step": 229128, "epoch": 1893} {"train_loss": -41.50992965698242, "global_step": 229129, "epoch": 1893} {"train_loss": -42.13181686401367, "global_step": 229130, "epoch": 1893} {"train_loss": -42.32712936401367, "global_step": 229131, "epoch": 1893} {"train_loss": -41.96816635131836, "global_step": 229132, "epoch": 1893} {"train_loss": -40.92182922363281, "global_step": 229133, "epoch": 1893} {"train_loss": -41.63701248168945, "global_step": 229134, "epoch": 1893} {"train_loss": -41.553340911865234, "global_step": 229135, "epoch": 1893} {"train_loss": -40.730262756347656, "global_step": 229136, "epoch": 1893} {"train_loss": -41.0352668762207, "global_step": 229137, "epoch": 1893} {"train_loss": -40.32428741455078, "global_step": 229138, "epoch": 1893} {"train_loss": -41.85868453979492, "global_step": 229139, "epoch": 1893} {"train_loss": -41.77592849731445, "global_step": 229140, "epoch": 1893} {"train_loss": -41.754207611083984, "global_step": 229141, "epoch": 1893} {"train_loss": -41.347076416015625, "global_step": 229142, "epoch": 1893} {"train_loss": -41.70109939575195, "global_step": 229143, "epoch": 1893} {"train_loss": -41.913543701171875, "global_step": 229144, "epoch": 1893} {"train_loss": -41.78642272949219, "global_step": 229145, "epoch": 1893} {"train_loss": -40.5982551574707, "global_step": 229146, "epoch": 1893} {"train_loss": -42.52727508544922, "global_step": 229147, "epoch": 1893} {"train_loss": -39.8121337890625, "global_step": 229148, "epoch": 1893} {"train_loss": -41.900630950927734, "global_step": 229149, "epoch": 1893} {"train_loss": -42.276161193847656, "global_step": 229150, "epoch": 1893} {"train_loss": -40.640254974365234, "global_step": 229151, "epoch": 1893} {"train_loss": -42.19674301147461, "global_step": 229152, "epoch": 1893} {"train_loss": -42.26140213012695, "global_step": 229153, "epoch": 1893} {"train_loss": -41.63400650024414, "global_step": 229154, "epoch": 1893} {"train_loss": -40.92728805541992, "global_step": 229155, "epoch": 1893} {"train_loss": -40.359737396240234, "global_step": 229156, "epoch": 1893} {"train_loss": -40.93270492553711, "global_step": 229157, "epoch": 1893} {"train_loss": -41.693599700927734, "global_step": 229158, "epoch": 1893} {"train_loss": -40.7353515625, "global_step": 229159, "epoch": 1893} {"train_loss": -40.24958419799805, "global_step": 229160, "epoch": 1893} {"train_loss": -39.86433792114258, "global_step": 229161, "epoch": 1893} {"train_loss": -41.90542221069336, "global_step": 229162, "epoch": 1893} {"train_loss": -41.09304428100586, "global_step": 229163, "epoch": 1893} {"train_loss": -41.165802001953125, "global_step": 229164, "epoch": 1893} {"train_loss": -40.128265380859375, "global_step": 229165, "epoch": 1893} {"train_loss": -39.59552001953125, "global_step": 229166, "epoch": 1893} {"train_loss": -41.554107666015625, "global_step": 229167, "epoch": 1893} {"train_loss": -41.885921478271484, "global_step": 229168, "epoch": 1893} {"train_loss": -41.38740158081055, "global_step": 229169, "epoch": 1893} {"train_loss": -41.068721771240234, "global_step": 229170, "epoch": 1893} {"train_loss": -41.31699752807617, "global_step": 229171, "epoch": 1893} {"train_loss": -41.72711181640625, "global_step": 229172, "epoch": 1893} {"train_loss": -40.94181943530879, "global_step": 229173, "epoch": 1893, "val_loss": 2611183.75} {"train_loss": -41.27765655517578, "global_step": 229174, "epoch": 1894} {"train_loss": -40.93376159667969, "global_step": 229175, "epoch": 1894} {"train_loss": -41.032981872558594, "global_step": 229176, "epoch": 1894} {"train_loss": -41.38134765625, "global_step": 229177, "epoch": 1894} {"train_loss": -41.315818786621094, "global_step": 229178, "epoch": 1894} {"train_loss": -40.20808792114258, "global_step": 229179, "epoch": 1894} {"train_loss": -41.5141487121582, "global_step": 229180, "epoch": 1894} {"train_loss": -40.998268127441406, "global_step": 229181, "epoch": 1894} {"train_loss": -40.258358001708984, "global_step": 229182, "epoch": 1894} {"train_loss": -41.695526123046875, "global_step": 229183, "epoch": 1894} {"train_loss": -41.3193473815918, "global_step": 229184, "epoch": 1894} {"train_loss": -41.93265151977539, "global_step": 229185, "epoch": 1894} {"train_loss": -41.349674224853516, "global_step": 229186, "epoch": 1894} {"train_loss": -41.30030822753906, "global_step": 229187, "epoch": 1894} {"train_loss": -41.737369537353516, "global_step": 229188, "epoch": 1894} {"train_loss": -41.16714096069336, "global_step": 229189, "epoch": 1894} {"train_loss": -41.074039459228516, "global_step": 229190, "epoch": 1894} {"train_loss": -41.384971618652344, "global_step": 229191, "epoch": 1894} {"train_loss": -40.68060302734375, "global_step": 229192, "epoch": 1894} {"train_loss": -41.04232406616211, "global_step": 229193, "epoch": 1894} {"train_loss": -41.23733139038086, "global_step": 229194, "epoch": 1894} {"train_loss": -41.941932678222656, "global_step": 229195, "epoch": 1894} {"train_loss": -40.696556091308594, "global_step": 229196, "epoch": 1894} {"train_loss": -40.750816345214844, "global_step": 229197, "epoch": 1894} {"train_loss": -41.56983947753906, "global_step": 229198, "epoch": 1894} {"train_loss": -40.6948356628418, "global_step": 229199, "epoch": 1894} {"train_loss": -41.38806915283203, "global_step": 229200, "epoch": 1894} {"train_loss": -40.10907745361328, "global_step": 229201, "epoch": 1894} {"train_loss": -41.80741500854492, "global_step": 229202, "epoch": 1894} {"train_loss": -41.347557067871094, "global_step": 229203, "epoch": 1894} {"train_loss": -41.45499801635742, "global_step": 229204, "epoch": 1894} {"train_loss": -41.12715148925781, "global_step": 229205, "epoch": 1894} {"train_loss": -40.73755645751953, "global_step": 229206, "epoch": 1894} {"train_loss": -41.79353713989258, "global_step": 229207, "epoch": 1894} {"train_loss": -41.28181076049805, "global_step": 229208, "epoch": 1894} {"train_loss": -41.67490005493164, "global_step": 229209, "epoch": 1894} {"train_loss": -41.22001266479492, "global_step": 229210, "epoch": 1894} {"train_loss": -42.32404708862305, "global_step": 229211, "epoch": 1894} {"train_loss": -41.82400131225586, "global_step": 229212, "epoch": 1894} {"train_loss": -41.370277404785156, "global_step": 229213, "epoch": 1894} {"train_loss": -41.42823028564453, "global_step": 229214, "epoch": 1894} {"train_loss": -42.24225616455078, "global_step": 229215, "epoch": 1894} {"train_loss": -41.67608642578125, "global_step": 229216, "epoch": 1894} {"train_loss": -42.14573287963867, "global_step": 229217, "epoch": 1894} {"train_loss": -40.95635986328125, "global_step": 229218, "epoch": 1894} {"train_loss": -42.08638000488281, "global_step": 229219, "epoch": 1894} {"train_loss": -42.07074737548828, "global_step": 229220, "epoch": 1894} {"train_loss": -42.336395263671875, "global_step": 229221, "epoch": 1894} {"train_loss": -42.13898849487305, "global_step": 229222, "epoch": 1894} {"train_loss": -42.18058395385742, "global_step": 229223, "epoch": 1894} {"train_loss": -41.619171142578125, "global_step": 229224, "epoch": 1894} {"train_loss": -41.57304763793945, "global_step": 229225, "epoch": 1894} {"train_loss": -42.52565383911133, "global_step": 229226, "epoch": 1894} {"train_loss": -41.549095153808594, "global_step": 229227, "epoch": 1894} {"train_loss": -41.87472152709961, "global_step": 229228, "epoch": 1894} {"train_loss": -42.260738372802734, "global_step": 229229, "epoch": 1894} {"train_loss": -42.67485809326172, "global_step": 229230, "epoch": 1894} {"train_loss": -41.317440032958984, "global_step": 229231, "epoch": 1894} {"train_loss": -42.25469970703125, "global_step": 229232, "epoch": 1894} {"train_loss": -42.08010482788086, "global_step": 229233, "epoch": 1894} {"train_loss": -41.64996337890625, "global_step": 229234, "epoch": 1894} {"train_loss": -40.7152214050293, "global_step": 229235, "epoch": 1894} {"train_loss": -42.32015609741211, "global_step": 229236, "epoch": 1894} {"train_loss": -41.8771858215332, "global_step": 229237, "epoch": 1894} {"train_loss": -41.994991302490234, "global_step": 229238, "epoch": 1894} {"train_loss": -42.14680099487305, "global_step": 229239, "epoch": 1894} {"train_loss": -41.86152267456055, "global_step": 229240, "epoch": 1894} {"train_loss": -41.9803581237793, "global_step": 229241, "epoch": 1894} {"train_loss": -40.521480560302734, "global_step": 229242, "epoch": 1894} {"train_loss": -42.39767074584961, "global_step": 229243, "epoch": 1894} {"train_loss": -42.38069534301758, "global_step": 229244, "epoch": 1894} {"train_loss": -41.69451904296875, "global_step": 229245, "epoch": 1894} {"train_loss": -42.1491584777832, "global_step": 229246, "epoch": 1894} {"train_loss": -41.59259033203125, "global_step": 229247, "epoch": 1894} {"train_loss": -42.32399368286133, "global_step": 229248, "epoch": 1894} {"train_loss": -41.19977569580078, "global_step": 229249, "epoch": 1894} {"train_loss": -42.18873977661133, "global_step": 229250, "epoch": 1894} {"train_loss": -41.744873046875, "global_step": 229251, "epoch": 1894} {"train_loss": -40.349159240722656, "global_step": 229252, "epoch": 1894} {"train_loss": -41.83579635620117, "global_step": 229253, "epoch": 1894} {"train_loss": -41.838478088378906, "global_step": 229254, "epoch": 1894} {"train_loss": -41.25165557861328, "global_step": 229255, "epoch": 1894} {"train_loss": -42.03896713256836, "global_step": 229256, "epoch": 1894} {"train_loss": -41.02610397338867, "global_step": 229257, "epoch": 1894} {"train_loss": -39.1558837890625, "global_step": 229258, "epoch": 1894} {"train_loss": -38.66335678100586, "global_step": 229259, "epoch": 1894} {"train_loss": -41.163204193115234, "global_step": 229260, "epoch": 1894} {"train_loss": -41.42146682739258, "global_step": 229261, "epoch": 1894} {"train_loss": -41.203399658203125, "global_step": 229262, "epoch": 1894} {"train_loss": -38.91786575317383, "global_step": 229263, "epoch": 1894} {"train_loss": -40.044898986816406, "global_step": 229264, "epoch": 1894} {"train_loss": -41.08913803100586, "global_step": 229265, "epoch": 1894} {"train_loss": -40.59798812866211, "global_step": 229266, "epoch": 1894} {"train_loss": -38.89509201049805, "global_step": 229267, "epoch": 1894} {"train_loss": -39.83816146850586, "global_step": 229268, "epoch": 1894} {"train_loss": -41.856117248535156, "global_step": 229269, "epoch": 1894} {"train_loss": -38.473541259765625, "global_step": 229270, "epoch": 1894} {"train_loss": -38.750301361083984, "global_step": 229271, "epoch": 1894} {"train_loss": -41.314613342285156, "global_step": 229272, "epoch": 1894} {"train_loss": -40.73339080810547, "global_step": 229273, "epoch": 1894} {"train_loss": -40.55884552001953, "global_step": 229274, "epoch": 1894} {"train_loss": -41.071903228759766, "global_step": 229275, "epoch": 1894} {"train_loss": -39.989681243896484, "global_step": 229276, "epoch": 1894} {"train_loss": -39.0224723815918, "global_step": 229277, "epoch": 1894} {"train_loss": -39.915618896484375, "global_step": 229278, "epoch": 1894} {"train_loss": -39.22197341918945, "global_step": 229279, "epoch": 1894} {"train_loss": -40.75047302246094, "global_step": 229280, "epoch": 1894} {"train_loss": -38.86491775512695, "global_step": 229281, "epoch": 1894} {"train_loss": -40.04328918457031, "global_step": 229282, "epoch": 1894} {"train_loss": -35.93141555786133, "global_step": 229283, "epoch": 1894} {"train_loss": -39.44089889526367, "global_step": 229284, "epoch": 1894} {"train_loss": -35.5003776550293, "global_step": 229285, "epoch": 1894} {"train_loss": -39.943992614746094, "global_step": 229286, "epoch": 1894} {"train_loss": -35.124420166015625, "global_step": 229287, "epoch": 1894} {"train_loss": -40.79290771484375, "global_step": 229288, "epoch": 1894} {"train_loss": -35.94990921020508, "global_step": 229289, "epoch": 1894} {"train_loss": -39.546932220458984, "global_step": 229290, "epoch": 1894} {"train_loss": -39.564788818359375, "global_step": 229291, "epoch": 1894} {"train_loss": -38.2027702331543, "global_step": 229292, "epoch": 1894} {"train_loss": -40.73576736450195, "global_step": 229293, "epoch": 1894} {"train_loss": -40.934624443369465, "global_step": 229294, "epoch": 1894, "val_loss": 2598410.75} {"train_loss": -41.10497283935547, "global_step": 229295, "epoch": 1895} {"train_loss": -40.288753509521484, "global_step": 229296, "epoch": 1895} {"train_loss": -41.132476806640625, "global_step": 229297, "epoch": 1895} {"train_loss": -41.35744857788086, "global_step": 229298, "epoch": 1895} {"train_loss": -41.27194595336914, "global_step": 229299, "epoch": 1895} {"train_loss": -40.408721923828125, "global_step": 229300, "epoch": 1895} {"train_loss": -40.5789680480957, "global_step": 229301, "epoch": 1895} {"train_loss": -41.1578483581543, "global_step": 229302, "epoch": 1895} {"train_loss": -40.39157485961914, "global_step": 229303, "epoch": 1895} {"train_loss": -39.995689392089844, "global_step": 229304, "epoch": 1895} {"train_loss": -41.29475402832031, "global_step": 229305, "epoch": 1895} {"train_loss": -40.3714599609375, "global_step": 229306, "epoch": 1895} {"train_loss": -41.35546875, "global_step": 229307, "epoch": 1895} {"train_loss": -41.2643928527832, "global_step": 229308, "epoch": 1895} {"train_loss": -41.3299446105957, "global_step": 229309, "epoch": 1895} {"train_loss": -41.05486297607422, "global_step": 229310, "epoch": 1895} {"train_loss": -41.537574768066406, "global_step": 229311, "epoch": 1895} {"train_loss": -42.22957229614258, "global_step": 229312, "epoch": 1895} {"train_loss": -41.5623664855957, "global_step": 229313, "epoch": 1895} {"train_loss": -41.77709197998047, "global_step": 229314, "epoch": 1895} {"train_loss": -41.289119720458984, "global_step": 229315, "epoch": 1895} {"train_loss": -41.581390380859375, "global_step": 229316, "epoch": 1895} {"train_loss": -42.26976013183594, "global_step": 229317, "epoch": 1895} {"train_loss": -41.423397064208984, "global_step": 229318, "epoch": 1895} {"train_loss": -42.57576370239258, "global_step": 229319, "epoch": 1895} {"train_loss": -41.9058952331543, "global_step": 229320, "epoch": 1895} {"train_loss": -41.37258529663086, "global_step": 229321, "epoch": 1895} {"train_loss": -42.08198165893555, "global_step": 229322, "epoch": 1895} {"train_loss": -42.15790557861328, "global_step": 229323, "epoch": 1895} {"train_loss": -41.869178771972656, "global_step": 229324, "epoch": 1895} {"train_loss": -42.05601119995117, "global_step": 229325, "epoch": 1895} {"train_loss": -42.347869873046875, "global_step": 229326, "epoch": 1895} {"train_loss": -42.32512283325195, "global_step": 229327, "epoch": 1895} {"train_loss": -42.211578369140625, "global_step": 229328, "epoch": 1895} {"train_loss": -42.28411102294922, "global_step": 229329, "epoch": 1895} {"train_loss": -42.19610595703125, "global_step": 229330, "epoch": 1895} {"train_loss": -42.311920166015625, "global_step": 229331, "epoch": 1895} {"train_loss": -41.704833984375, "global_step": 229332, "epoch": 1895} {"train_loss": -42.48163604736328, "global_step": 229333, "epoch": 1895} {"train_loss": -42.167110443115234, "global_step": 229334, "epoch": 1895} {"train_loss": -41.40210723876953, "global_step": 229335, "epoch": 1895} {"train_loss": -42.39528274536133, "global_step": 229336, "epoch": 1895} {"train_loss": -42.59914779663086, "global_step": 229337, "epoch": 1895} {"train_loss": -42.14543533325195, "global_step": 229338, "epoch": 1895} {"train_loss": -42.179718017578125, "global_step": 229339, "epoch": 1895} {"train_loss": -40.724830627441406, "global_step": 229340, "epoch": 1895} {"train_loss": -42.14921188354492, "global_step": 229341, "epoch": 1895} {"train_loss": -42.68970489501953, "global_step": 229342, "epoch": 1895} {"train_loss": -42.33433151245117, "global_step": 229343, "epoch": 1895} {"train_loss": -42.51564407348633, "global_step": 229344, "epoch": 1895} {"train_loss": -42.87223815917969, "global_step": 229345, "epoch": 1895} {"train_loss": -42.518131256103516, "global_step": 229346, "epoch": 1895} {"train_loss": -42.20013427734375, "global_step": 229347, "epoch": 1895} {"train_loss": -42.162418365478516, "global_step": 229348, "epoch": 1895} {"train_loss": -42.94838333129883, "global_step": 229349, "epoch": 1895} {"train_loss": -42.891937255859375, "global_step": 229350, "epoch": 1895} {"train_loss": -42.4865837097168, "global_step": 229351, "epoch": 1895} {"train_loss": -41.40091323852539, "global_step": 229352, "epoch": 1895} {"train_loss": -40.08034133911133, "global_step": 229353, "epoch": 1895} {"train_loss": -39.21596908569336, "global_step": 229354, "epoch": 1895} {"train_loss": -39.84160614013672, "global_step": 229355, "epoch": 1895} {"train_loss": -41.88357925415039, "global_step": 229356, "epoch": 1895} {"train_loss": -42.6954460144043, "global_step": 229357, "epoch": 1895} {"train_loss": -41.88285446166992, "global_step": 229358, "epoch": 1895} {"train_loss": -41.33063507080078, "global_step": 229359, "epoch": 1895} {"train_loss": -41.35490798950195, "global_step": 229360, "epoch": 1895} {"train_loss": -42.044864654541016, "global_step": 229361, "epoch": 1895} {"train_loss": -41.559051513671875, "global_step": 229362, "epoch": 1895} {"train_loss": -41.11207962036133, "global_step": 229363, "epoch": 1895} {"train_loss": -41.7951545715332, "global_step": 229364, "epoch": 1895} {"train_loss": -43.083641052246094, "global_step": 229365, "epoch": 1895} {"train_loss": -41.78660202026367, "global_step": 229366, "epoch": 1895} {"train_loss": -40.74674606323242, "global_step": 229367, "epoch": 1895} {"train_loss": -40.85614013671875, "global_step": 229368, "epoch": 1895} {"train_loss": -42.88307571411133, "global_step": 229369, "epoch": 1895} {"train_loss": -40.86037063598633, "global_step": 229370, "epoch": 1895} {"train_loss": -41.61725616455078, "global_step": 229371, "epoch": 1895} {"train_loss": -40.951900482177734, "global_step": 229372, "epoch": 1895} {"train_loss": -41.8992805480957, "global_step": 229373, "epoch": 1895} {"train_loss": -41.15461349487305, "global_step": 229374, "epoch": 1895} {"train_loss": -38.2286262512207, "global_step": 229375, "epoch": 1895} {"train_loss": -36.701393127441406, "global_step": 229376, "epoch": 1895} {"train_loss": -40.82351303100586, "global_step": 229377, "epoch": 1895} {"train_loss": -40.83058166503906, "global_step": 229378, "epoch": 1895} {"train_loss": -39.533721923828125, "global_step": 229379, "epoch": 1895} {"train_loss": -41.29217529296875, "global_step": 229380, "epoch": 1895} {"train_loss": -40.99945068359375, "global_step": 229381, "epoch": 1895} {"train_loss": -40.023040771484375, "global_step": 229382, "epoch": 1895} {"train_loss": -39.2489013671875, "global_step": 229383, "epoch": 1895} {"train_loss": -41.32693099975586, "global_step": 229384, "epoch": 1895} {"train_loss": -41.14689636230469, "global_step": 229385, "epoch": 1895} {"train_loss": -40.1422233581543, "global_step": 229386, "epoch": 1895} {"train_loss": -41.228878021240234, "global_step": 229387, "epoch": 1895} {"train_loss": -41.212432861328125, "global_step": 229388, "epoch": 1895} {"train_loss": -40.613555908203125, "global_step": 229389, "epoch": 1895} {"train_loss": -41.91379928588867, "global_step": 229390, "epoch": 1895} {"train_loss": -40.620758056640625, "global_step": 229391, "epoch": 1895} {"train_loss": -41.2287712097168, "global_step": 229392, "epoch": 1895} {"train_loss": -41.74081039428711, "global_step": 229393, "epoch": 1895} {"train_loss": -40.55836868286133, "global_step": 229394, "epoch": 1895} {"train_loss": -41.41503143310547, "global_step": 229395, "epoch": 1895} {"train_loss": -39.661094665527344, "global_step": 229396, "epoch": 1895} {"train_loss": -41.105316162109375, "global_step": 229397, "epoch": 1895} {"train_loss": -41.103450775146484, "global_step": 229398, "epoch": 1895} {"train_loss": -39.8655891418457, "global_step": 229399, "epoch": 1895} {"train_loss": -42.06032943725586, "global_step": 229400, "epoch": 1895} {"train_loss": -40.99788284301758, "global_step": 229401, "epoch": 1895} {"train_loss": -42.27762222290039, "global_step": 229402, "epoch": 1895} {"train_loss": -41.139705657958984, "global_step": 229403, "epoch": 1895} {"train_loss": -41.58625411987305, "global_step": 229404, "epoch": 1895} {"train_loss": -41.7136116027832, "global_step": 229405, "epoch": 1895} {"train_loss": -41.167667388916016, "global_step": 229406, "epoch": 1895} {"train_loss": -41.61772537231445, "global_step": 229407, "epoch": 1895} {"train_loss": -41.45769119262695, "global_step": 229408, "epoch": 1895} {"train_loss": -40.43756866455078, "global_step": 229409, "epoch": 1895} {"train_loss": -41.28316116333008, "global_step": 229410, "epoch": 1895} {"train_loss": -40.58295440673828, "global_step": 229411, "epoch": 1895} {"train_loss": -41.972312927246094, "global_step": 229412, "epoch": 1895} {"train_loss": -40.854248046875, "global_step": 229413, "epoch": 1895} {"train_loss": -41.361270904541016, "global_step": 229414, "epoch": 1895} {"train_loss": -41.38669166880206, "global_step": 229415, "epoch": 1895, "val_loss": 2597022.0} {"train_loss": -41.566200256347656, "global_step": 229416, "epoch": 1896} {"train_loss": -42.22492599487305, "global_step": 229417, "epoch": 1896} {"train_loss": -42.13300323486328, "global_step": 229418, "epoch": 1896} {"train_loss": -41.949222564697266, "global_step": 229419, "epoch": 1896} {"train_loss": -41.29136657714844, "global_step": 229420, "epoch": 1896} {"train_loss": -41.85512924194336, "global_step": 229421, "epoch": 1896} {"train_loss": -42.33171844482422, "global_step": 229422, "epoch": 1896} {"train_loss": -41.953914642333984, "global_step": 229423, "epoch": 1896} {"train_loss": -42.55552291870117, "global_step": 229424, "epoch": 1896} {"train_loss": -42.257869720458984, "global_step": 229425, "epoch": 1896} {"train_loss": -42.04338455200195, "global_step": 229426, "epoch": 1896} {"train_loss": -42.27370071411133, "global_step": 229427, "epoch": 1896} {"train_loss": -42.123924255371094, "global_step": 229428, "epoch": 1896} {"train_loss": -42.595664978027344, "global_step": 229429, "epoch": 1896} {"train_loss": -41.829952239990234, "global_step": 229430, "epoch": 1896} {"train_loss": -42.19222640991211, "global_step": 229431, "epoch": 1896} {"train_loss": -41.82828140258789, "global_step": 229432, "epoch": 1896} {"train_loss": -42.50910568237305, "global_step": 229433, "epoch": 1896} {"train_loss": -42.49302291870117, "global_step": 229434, "epoch": 1896} {"train_loss": -42.61686706542969, "global_step": 229435, "epoch": 1896} {"train_loss": -42.76264190673828, "global_step": 229436, "epoch": 1896} {"train_loss": -42.207374572753906, "global_step": 229437, "epoch": 1896} {"train_loss": -42.531715393066406, "global_step": 229438, "epoch": 1896} {"train_loss": -42.35275650024414, "global_step": 229439, "epoch": 1896} {"train_loss": -42.73299789428711, "global_step": 229440, "epoch": 1896} {"train_loss": -42.97490310668945, "global_step": 229441, "epoch": 1896} {"train_loss": -43.07253646850586, "global_step": 229442, "epoch": 1896} {"train_loss": -42.40848922729492, "global_step": 229443, "epoch": 1896} {"train_loss": -42.77265548706055, "global_step": 229444, "epoch": 1896} {"train_loss": -43.14155197143555, "global_step": 229445, "epoch": 1896} {"train_loss": -43.03766632080078, "global_step": 229446, "epoch": 1896} {"train_loss": -42.81064987182617, "global_step": 229447, "epoch": 1896} {"train_loss": -42.89211654663086, "global_step": 229448, "epoch": 1896} {"train_loss": -43.065608978271484, "global_step": 229449, "epoch": 1896} {"train_loss": -42.84562301635742, "global_step": 229450, "epoch": 1896} {"train_loss": -43.001338958740234, "global_step": 229451, "epoch": 1896} {"train_loss": -42.92873001098633, "global_step": 229452, "epoch": 1896} {"train_loss": -42.59838104248047, "global_step": 229453, "epoch": 1896} {"train_loss": -42.76546859741211, "global_step": 229454, "epoch": 1896} {"train_loss": -42.12089157104492, "global_step": 229455, "epoch": 1896} {"train_loss": -42.642093658447266, "global_step": 229456, "epoch": 1896} {"train_loss": -42.406654357910156, "global_step": 229457, "epoch": 1896} {"train_loss": -41.8441276550293, "global_step": 229458, "epoch": 1896} {"train_loss": -42.503597259521484, "global_step": 229459, "epoch": 1896} {"train_loss": -43.02356719970703, "global_step": 229460, "epoch": 1896} {"train_loss": -42.37577438354492, "global_step": 229461, "epoch": 1896} {"train_loss": -42.0482292175293, "global_step": 229462, "epoch": 1896} {"train_loss": -41.60691452026367, "global_step": 229463, "epoch": 1896} {"train_loss": -42.29780960083008, "global_step": 229464, "epoch": 1896} {"train_loss": -41.764320373535156, "global_step": 229465, "epoch": 1896} {"train_loss": -41.10100173950195, "global_step": 229466, "epoch": 1896} {"train_loss": -41.270904541015625, "global_step": 229467, "epoch": 1896} {"train_loss": -39.64008712768555, "global_step": 229468, "epoch": 1896} {"train_loss": -39.55460739135742, "global_step": 229469, "epoch": 1896} {"train_loss": -38.77523422241211, "global_step": 229470, "epoch": 1896} {"train_loss": -38.76365280151367, "global_step": 229471, "epoch": 1896} {"train_loss": -36.11127471923828, "global_step": 229472, "epoch": 1896} {"train_loss": -36.42120361328125, "global_step": 229473, "epoch": 1896} {"train_loss": -40.89298629760742, "global_step": 229474, "epoch": 1896} {"train_loss": -40.407386779785156, "global_step": 229475, "epoch": 1896} {"train_loss": -34.344173431396484, "global_step": 229476, "epoch": 1896} {"train_loss": -32.81039047241211, "global_step": 229477, "epoch": 1896} {"train_loss": -40.060794830322266, "global_step": 229478, "epoch": 1896} {"train_loss": -36.943603515625, "global_step": 229479, "epoch": 1896} {"train_loss": -38.37008285522461, "global_step": 229480, "epoch": 1896} {"train_loss": -41.760372161865234, "global_step": 229481, "epoch": 1896} {"train_loss": -39.873619079589844, "global_step": 229482, "epoch": 1896} {"train_loss": -41.817378997802734, "global_step": 229483, "epoch": 1896} {"train_loss": -40.62717819213867, "global_step": 229484, "epoch": 1896} {"train_loss": -41.100337982177734, "global_step": 229485, "epoch": 1896} {"train_loss": -41.62088394165039, "global_step": 229486, "epoch": 1896} {"train_loss": -40.50603103637695, "global_step": 229487, "epoch": 1896} {"train_loss": -41.37966537475586, "global_step": 229488, "epoch": 1896} {"train_loss": -41.96887969970703, "global_step": 229489, "epoch": 1896} {"train_loss": -40.965293884277344, "global_step": 229490, "epoch": 1896} {"train_loss": -42.3839111328125, "global_step": 229491, "epoch": 1896} {"train_loss": -41.6081657409668, "global_step": 229492, "epoch": 1896} {"train_loss": -41.796234130859375, "global_step": 229493, "epoch": 1896} {"train_loss": -42.27275466918945, "global_step": 229494, "epoch": 1896} {"train_loss": -41.886104583740234, "global_step": 229495, "epoch": 1896} {"train_loss": -42.45355987548828, "global_step": 229496, "epoch": 1896} {"train_loss": -41.57328414916992, "global_step": 229497, "epoch": 1896} {"train_loss": -42.4257926940918, "global_step": 229498, "epoch": 1896} {"train_loss": -41.962825775146484, "global_step": 229499, "epoch": 1896} {"train_loss": -42.44076919555664, "global_step": 229500, "epoch": 1896} {"train_loss": -42.0228157043457, "global_step": 229501, "epoch": 1896} {"train_loss": -42.092037200927734, "global_step": 229502, "epoch": 1896} {"train_loss": -42.48025131225586, "global_step": 229503, "epoch": 1896} {"train_loss": -41.33073043823242, "global_step": 229504, "epoch": 1896} {"train_loss": -41.890865325927734, "global_step": 229505, "epoch": 1896} {"train_loss": -41.922054290771484, "global_step": 229506, "epoch": 1896} {"train_loss": -42.694190979003906, "global_step": 229507, "epoch": 1896} {"train_loss": -41.980525970458984, "global_step": 229508, "epoch": 1896} {"train_loss": -41.26554489135742, "global_step": 229509, "epoch": 1896} {"train_loss": -41.33259201049805, "global_step": 229510, "epoch": 1896} {"train_loss": -42.43889617919922, "global_step": 229511, "epoch": 1896} {"train_loss": -42.501007080078125, "global_step": 229512, "epoch": 1896} {"train_loss": -41.58386993408203, "global_step": 229513, "epoch": 1896} {"train_loss": -42.13942337036133, "global_step": 229514, "epoch": 1896} {"train_loss": -42.29913330078125, "global_step": 229515, "epoch": 1896} {"train_loss": -41.42649459838867, "global_step": 229516, "epoch": 1896} {"train_loss": -36.894371032714844, "global_step": 229517, "epoch": 1896} {"train_loss": -41.65659713745117, "global_step": 229518, "epoch": 1896} {"train_loss": -38.506160736083984, "global_step": 229519, "epoch": 1896} {"train_loss": -41.29060363769531, "global_step": 229520, "epoch": 1896} {"train_loss": -39.415557861328125, "global_step": 229521, "epoch": 1896} {"train_loss": -40.28512191772461, "global_step": 229522, "epoch": 1896} {"train_loss": -41.07602310180664, "global_step": 229523, "epoch": 1896} {"train_loss": -41.480812072753906, "global_step": 229524, "epoch": 1896} {"train_loss": -37.833431243896484, "global_step": 229525, "epoch": 1896} {"train_loss": -40.36593246459961, "global_step": 229526, "epoch": 1896} {"train_loss": -40.713226318359375, "global_step": 229527, "epoch": 1896} {"train_loss": -40.69808578491211, "global_step": 229528, "epoch": 1896} {"train_loss": -40.08112335205078, "global_step": 229529, "epoch": 1896} {"train_loss": -38.560665130615234, "global_step": 229530, "epoch": 1896} {"train_loss": -40.96613311767578, "global_step": 229531, "epoch": 1896} {"train_loss": -36.86137008666992, "global_step": 229532, "epoch": 1896} {"train_loss": -39.673561096191406, "global_step": 229533, "epoch": 1896} {"train_loss": -36.823158264160156, "global_step": 229534, "epoch": 1896} {"train_loss": -39.67672348022461, "global_step": 229535, "epoch": 1896} {"train_loss": -41.25732267395524, "global_step": 229536, "epoch": 1896, "val_loss": 2560006.25} {"train_loss": -41.15648651123047, "global_step": 229537, "epoch": 1897} {"train_loss": -40.45747375488281, "global_step": 229538, "epoch": 1897} {"train_loss": -33.4234733581543, "global_step": 229539, "epoch": 1897} {"train_loss": -38.94116973876953, "global_step": 229540, "epoch": 1897} {"train_loss": -34.11762237548828, "global_step": 229541, "epoch": 1897} {"train_loss": -34.90666198730469, "global_step": 229542, "epoch": 1897} {"train_loss": -38.0415153503418, "global_step": 229543, "epoch": 1897} {"train_loss": -32.89817428588867, "global_step": 229544, "epoch": 1897} {"train_loss": -35.75811767578125, "global_step": 229545, "epoch": 1897} {"train_loss": -35.97396469116211, "global_step": 229546, "epoch": 1897} {"train_loss": -38.528839111328125, "global_step": 229547, "epoch": 1897} {"train_loss": -35.56377029418945, "global_step": 229548, "epoch": 1897} {"train_loss": -37.12294387817383, "global_step": 229549, "epoch": 1897} {"train_loss": -38.45940017700195, "global_step": 229550, "epoch": 1897} {"train_loss": -35.23507308959961, "global_step": 229551, "epoch": 1897} {"train_loss": -38.36684799194336, "global_step": 229552, "epoch": 1897} {"train_loss": -39.4822998046875, "global_step": 229553, "epoch": 1897} {"train_loss": -38.67417526245117, "global_step": 229554, "epoch": 1897} {"train_loss": -39.231666564941406, "global_step": 229555, "epoch": 1897} {"train_loss": -38.39196014404297, "global_step": 229556, "epoch": 1897} {"train_loss": -39.38890075683594, "global_step": 229557, "epoch": 1897} {"train_loss": -37.834537506103516, "global_step": 229558, "epoch": 1897} {"train_loss": -37.9151725769043, "global_step": 229559, "epoch": 1897} {"train_loss": -38.79118728637695, "global_step": 229560, "epoch": 1897} {"train_loss": -39.10780715942383, "global_step": 229561, "epoch": 1897} {"train_loss": -36.286643981933594, "global_step": 229562, "epoch": 1897} {"train_loss": -39.864540100097656, "global_step": 229563, "epoch": 1897} {"train_loss": -39.78882598876953, "global_step": 229564, "epoch": 1897} {"train_loss": -39.616233825683594, "global_step": 229565, "epoch": 1897} {"train_loss": -39.02924346923828, "global_step": 229566, "epoch": 1897} {"train_loss": -37.85712432861328, "global_step": 229567, "epoch": 1897} {"train_loss": -38.86745834350586, "global_step": 229568, "epoch": 1897} {"train_loss": -39.86530685424805, "global_step": 229569, "epoch": 1897} {"train_loss": -40.45122146606445, "global_step": 229570, "epoch": 1897} {"train_loss": -39.730281829833984, "global_step": 229571, "epoch": 1897} {"train_loss": -40.006587982177734, "global_step": 229572, "epoch": 1897} {"train_loss": -39.28181838989258, "global_step": 229573, "epoch": 1897} {"train_loss": -40.38975143432617, "global_step": 229574, "epoch": 1897} {"train_loss": -40.97697067260742, "global_step": 229575, "epoch": 1897} {"train_loss": -39.78486251831055, "global_step": 229576, "epoch": 1897} {"train_loss": -40.89347457885742, "global_step": 229577, "epoch": 1897} {"train_loss": -39.86505889892578, "global_step": 229578, "epoch": 1897} {"train_loss": -40.966339111328125, "global_step": 229579, "epoch": 1897} {"train_loss": -41.14857864379883, "global_step": 229580, "epoch": 1897} {"train_loss": -40.81681442260742, "global_step": 229581, "epoch": 1897} {"train_loss": -40.6584587097168, "global_step": 229582, "epoch": 1897} {"train_loss": -40.16976547241211, "global_step": 229583, "epoch": 1897} {"train_loss": -40.68722152709961, "global_step": 229584, "epoch": 1897} {"train_loss": -40.985145568847656, "global_step": 229585, "epoch": 1897} {"train_loss": -40.914554595947266, "global_step": 229586, "epoch": 1897} {"train_loss": -41.35723876953125, "global_step": 229587, "epoch": 1897} {"train_loss": -41.526363372802734, "global_step": 229588, "epoch": 1897} {"train_loss": -39.99782180786133, "global_step": 229589, "epoch": 1897} {"train_loss": -41.41374588012695, "global_step": 229590, "epoch": 1897} {"train_loss": -41.39893341064453, "global_step": 229591, "epoch": 1897} {"train_loss": -41.34934997558594, "global_step": 229592, "epoch": 1897} {"train_loss": -41.36539077758789, "global_step": 229593, "epoch": 1897} {"train_loss": -41.35095977783203, "global_step": 229594, "epoch": 1897} {"train_loss": -39.825496673583984, "global_step": 229595, "epoch": 1897} {"train_loss": -41.02360153198242, "global_step": 229596, "epoch": 1897} {"train_loss": -41.74140548706055, "global_step": 229597, "epoch": 1897} {"train_loss": -41.04803466796875, "global_step": 229598, "epoch": 1897} {"train_loss": -41.10831832885742, "global_step": 229599, "epoch": 1897} {"train_loss": -41.33736038208008, "global_step": 229600, "epoch": 1897} {"train_loss": -41.6452751159668, "global_step": 229601, "epoch": 1897} {"train_loss": -40.98706817626953, "global_step": 229602, "epoch": 1897} {"train_loss": -40.582462310791016, "global_step": 229603, "epoch": 1897} {"train_loss": -41.459136962890625, "global_step": 229604, "epoch": 1897} {"train_loss": -41.67481231689453, "global_step": 229605, "epoch": 1897} {"train_loss": -42.13227462768555, "global_step": 229606, "epoch": 1897} {"train_loss": -42.09489059448242, "global_step": 229607, "epoch": 1897} {"train_loss": -41.38572692871094, "global_step": 229608, "epoch": 1897} {"train_loss": -41.841400146484375, "global_step": 229609, "epoch": 1897} {"train_loss": -41.997657775878906, "global_step": 229610, "epoch": 1897} {"train_loss": -41.7701301574707, "global_step": 229611, "epoch": 1897} {"train_loss": -41.77983474731445, "global_step": 229612, "epoch": 1897} {"train_loss": -41.467891693115234, "global_step": 229613, "epoch": 1897} {"train_loss": -41.383880615234375, "global_step": 229614, "epoch": 1897} {"train_loss": -41.3376350402832, "global_step": 229615, "epoch": 1897} {"train_loss": -42.19199752807617, "global_step": 229616, "epoch": 1897} {"train_loss": -42.27907943725586, "global_step": 229617, "epoch": 1897} {"train_loss": -41.752620697021484, "global_step": 229618, "epoch": 1897} {"train_loss": -42.25779342651367, "global_step": 229619, "epoch": 1897} {"train_loss": -42.03693771362305, "global_step": 229620, "epoch": 1897} {"train_loss": -42.33999252319336, "global_step": 229621, "epoch": 1897} {"train_loss": -41.831703186035156, "global_step": 229622, "epoch": 1897} {"train_loss": -41.78829574584961, "global_step": 229623, "epoch": 1897} {"train_loss": -41.977115631103516, "global_step": 229624, "epoch": 1897} {"train_loss": -42.590904235839844, "global_step": 229625, "epoch": 1897} {"train_loss": -41.98256301879883, "global_step": 229626, "epoch": 1897} {"train_loss": -42.1821403503418, "global_step": 229627, "epoch": 1897} {"train_loss": -41.93256378173828, "global_step": 229628, "epoch": 1897} {"train_loss": -42.09986877441406, "global_step": 229629, "epoch": 1897} {"train_loss": -42.497718811035156, "global_step": 229630, "epoch": 1897} {"train_loss": -42.15095901489258, "global_step": 229631, "epoch": 1897} {"train_loss": -42.14802169799805, "global_step": 229632, "epoch": 1897} {"train_loss": -42.53802490234375, "global_step": 229633, "epoch": 1897} {"train_loss": -42.36858367919922, "global_step": 229634, "epoch": 1897} {"train_loss": -41.6925163269043, "global_step": 229635, "epoch": 1897} {"train_loss": -42.138790130615234, "global_step": 229636, "epoch": 1897} {"train_loss": -42.56765365600586, "global_step": 229637, "epoch": 1897} {"train_loss": -42.30518341064453, "global_step": 229638, "epoch": 1897} {"train_loss": -41.94199752807617, "global_step": 229639, "epoch": 1897} {"train_loss": -42.85333251953125, "global_step": 229640, "epoch": 1897} {"train_loss": -42.270240783691406, "global_step": 229641, "epoch": 1897} {"train_loss": -42.17213821411133, "global_step": 229642, "epoch": 1897} {"train_loss": -42.13179397583008, "global_step": 229643, "epoch": 1897} {"train_loss": -42.56886291503906, "global_step": 229644, "epoch": 1897} {"train_loss": -42.247371673583984, "global_step": 229645, "epoch": 1897} {"train_loss": -41.45860290527344, "global_step": 229646, "epoch": 1897} {"train_loss": -42.34051513671875, "global_step": 229647, "epoch": 1897} {"train_loss": -42.39267349243164, "global_step": 229648, "epoch": 1897} {"train_loss": -41.790733337402344, "global_step": 229649, "epoch": 1897} {"train_loss": -42.49453353881836, "global_step": 229650, "epoch": 1897} {"train_loss": -42.44538497924805, "global_step": 229651, "epoch": 1897} {"train_loss": -42.925315856933594, "global_step": 229652, "epoch": 1897} {"train_loss": -42.066341400146484, "global_step": 229653, "epoch": 1897} {"train_loss": -42.66162109375, "global_step": 229654, "epoch": 1897} {"train_loss": -41.93368148803711, "global_step": 229655, "epoch": 1897} {"train_loss": -42.01787185668945, "global_step": 229656, "epoch": 1897} {"train_loss": -40.569944964952704, "global_step": 229657, "epoch": 1897, "val_loss": 2488951.0} {"train_loss": -42.27322006225586, "global_step": 229658, "epoch": 1898} {"train_loss": -42.457611083984375, "global_step": 229659, "epoch": 1898} {"train_loss": -42.612545013427734, "global_step": 229660, "epoch": 1898} {"train_loss": -42.2391471862793, "global_step": 229661, "epoch": 1898} {"train_loss": -42.90117645263672, "global_step": 229662, "epoch": 1898} {"train_loss": -41.80819320678711, "global_step": 229663, "epoch": 1898} {"train_loss": -41.94791793823242, "global_step": 229664, "epoch": 1898} {"train_loss": -41.90586471557617, "global_step": 229665, "epoch": 1898} {"train_loss": -41.16107177734375, "global_step": 229666, "epoch": 1898} {"train_loss": -39.2309684753418, "global_step": 229667, "epoch": 1898} {"train_loss": -37.66730499267578, "global_step": 229668, "epoch": 1898} {"train_loss": -40.5417594909668, "global_step": 229669, "epoch": 1898} {"train_loss": -42.477333068847656, "global_step": 229670, "epoch": 1898} {"train_loss": -42.17140579223633, "global_step": 229671, "epoch": 1898} {"train_loss": -41.725181579589844, "global_step": 229672, "epoch": 1898} {"train_loss": -41.29966354370117, "global_step": 229673, "epoch": 1898} {"train_loss": -42.114017486572266, "global_step": 229674, "epoch": 1898} {"train_loss": -42.21139144897461, "global_step": 229675, "epoch": 1898} {"train_loss": -42.68973159790039, "global_step": 229676, "epoch": 1898} {"train_loss": -42.74311447143555, "global_step": 229677, "epoch": 1898} {"train_loss": -42.061866760253906, "global_step": 229678, "epoch": 1898} {"train_loss": -42.43979263305664, "global_step": 229679, "epoch": 1898} {"train_loss": -42.80060577392578, "global_step": 229680, "epoch": 1898} {"train_loss": -42.21307373046875, "global_step": 229681, "epoch": 1898} {"train_loss": -42.73929977416992, "global_step": 229682, "epoch": 1898} {"train_loss": -42.56960678100586, "global_step": 229683, "epoch": 1898} {"train_loss": -42.38322067260742, "global_step": 229684, "epoch": 1898} {"train_loss": -42.1850700378418, "global_step": 229685, "epoch": 1898} {"train_loss": -41.83987045288086, "global_step": 229686, "epoch": 1898} {"train_loss": -41.828147888183594, "global_step": 229687, "epoch": 1898} {"train_loss": -42.78645706176758, "global_step": 229688, "epoch": 1898} {"train_loss": -42.38041305541992, "global_step": 229689, "epoch": 1898} {"train_loss": -42.14344787597656, "global_step": 229690, "epoch": 1898} {"train_loss": -42.7701301574707, "global_step": 229691, "epoch": 1898} {"train_loss": -42.83596420288086, "global_step": 229692, "epoch": 1898} {"train_loss": -42.54150390625, "global_step": 229693, "epoch": 1898} {"train_loss": -42.473995208740234, "global_step": 229694, "epoch": 1898} {"train_loss": -42.299800872802734, "global_step": 229695, "epoch": 1898} {"train_loss": -42.1252555847168, "global_step": 229696, "epoch": 1898} {"train_loss": -42.17024612426758, "global_step": 229697, "epoch": 1898} {"train_loss": -42.121665954589844, "global_step": 229698, "epoch": 1898} {"train_loss": -42.25281524658203, "global_step": 229699, "epoch": 1898} {"train_loss": -41.4222526550293, "global_step": 229700, "epoch": 1898} {"train_loss": -40.650543212890625, "global_step": 229701, "epoch": 1898} {"train_loss": -40.95493698120117, "global_step": 229702, "epoch": 1898} {"train_loss": -40.627254486083984, "global_step": 229703, "epoch": 1898} {"train_loss": -39.79060363769531, "global_step": 229704, "epoch": 1898} {"train_loss": -39.73564147949219, "global_step": 229705, "epoch": 1898} {"train_loss": -41.45089340209961, "global_step": 229706, "epoch": 1898} {"train_loss": -42.571998596191406, "global_step": 229707, "epoch": 1898} {"train_loss": -41.84768295288086, "global_step": 229708, "epoch": 1898} {"train_loss": -38.95994186401367, "global_step": 229709, "epoch": 1898} {"train_loss": -39.6899299621582, "global_step": 229710, "epoch": 1898} {"train_loss": -42.40757369995117, "global_step": 229711, "epoch": 1898} {"train_loss": -42.04734420776367, "global_step": 229712, "epoch": 1898} {"train_loss": -41.96282196044922, "global_step": 229713, "epoch": 1898} {"train_loss": -41.257381439208984, "global_step": 229714, "epoch": 1898} {"train_loss": -42.089210510253906, "global_step": 229715, "epoch": 1898} {"train_loss": -41.74790573120117, "global_step": 229716, "epoch": 1898} {"train_loss": -42.14836883544922, "global_step": 229717, "epoch": 1898} {"train_loss": -41.622947692871094, "global_step": 229718, "epoch": 1898} {"train_loss": -42.244659423828125, "global_step": 229719, "epoch": 1898} {"train_loss": -42.864585876464844, "global_step": 229720, "epoch": 1898} {"train_loss": -41.006690979003906, "global_step": 229721, "epoch": 1898} {"train_loss": -42.14908981323242, "global_step": 229722, "epoch": 1898} {"train_loss": -41.721595764160156, "global_step": 229723, "epoch": 1898} {"train_loss": -42.47450637817383, "global_step": 229724, "epoch": 1898} {"train_loss": -32.164649963378906, "global_step": 229725, "epoch": 1898} {"train_loss": -40.31527328491211, "global_step": 229726, "epoch": 1898} {"train_loss": -41.08079528808594, "global_step": 229727, "epoch": 1898} {"train_loss": -37.4610710144043, "global_step": 229728, "epoch": 1898} {"train_loss": -35.797157287597656, "global_step": 229729, "epoch": 1898} {"train_loss": -39.475341796875, "global_step": 229730, "epoch": 1898} {"train_loss": -41.1340217590332, "global_step": 229731, "epoch": 1898} {"train_loss": -39.376197814941406, "global_step": 229732, "epoch": 1898} {"train_loss": -40.31093978881836, "global_step": 229733, "epoch": 1898} {"train_loss": -41.68680953979492, "global_step": 229734, "epoch": 1898} {"train_loss": -37.512176513671875, "global_step": 229735, "epoch": 1898} {"train_loss": -38.90571212768555, "global_step": 229736, "epoch": 1898} {"train_loss": -41.100643157958984, "global_step": 229737, "epoch": 1898} {"train_loss": -41.312198638916016, "global_step": 229738, "epoch": 1898} {"train_loss": -39.58681869506836, "global_step": 229739, "epoch": 1898} {"train_loss": -41.450843811035156, "global_step": 229740, "epoch": 1898} {"train_loss": -37.47282028198242, "global_step": 229741, "epoch": 1898} {"train_loss": -40.93242645263672, "global_step": 229742, "epoch": 1898} {"train_loss": -37.19376754760742, "global_step": 229743, "epoch": 1898} {"train_loss": -37.927276611328125, "global_step": 229744, "epoch": 1898} {"train_loss": -41.2039680480957, "global_step": 229745, "epoch": 1898} {"train_loss": -39.93441390991211, "global_step": 229746, "epoch": 1898} {"train_loss": -40.70990753173828, "global_step": 229747, "epoch": 1898} {"train_loss": -41.68158721923828, "global_step": 229748, "epoch": 1898} {"train_loss": -40.992305755615234, "global_step": 229749, "epoch": 1898} {"train_loss": -40.815277099609375, "global_step": 229750, "epoch": 1898} {"train_loss": -39.59012985229492, "global_step": 229751, "epoch": 1898} {"train_loss": -38.942176818847656, "global_step": 229752, "epoch": 1898} {"train_loss": -40.05198669433594, "global_step": 229753, "epoch": 1898} {"train_loss": -41.67997741699219, "global_step": 229754, "epoch": 1898} {"train_loss": -38.9762077331543, "global_step": 229755, "epoch": 1898} {"train_loss": -41.26856231689453, "global_step": 229756, "epoch": 1898} {"train_loss": -41.286964416503906, "global_step": 229757, "epoch": 1898} {"train_loss": -41.64519119262695, "global_step": 229758, "epoch": 1898} {"train_loss": -41.31398010253906, "global_step": 229759, "epoch": 1898} {"train_loss": -40.90699005126953, "global_step": 229760, "epoch": 1898} {"train_loss": -41.82434844970703, "global_step": 229761, "epoch": 1898} {"train_loss": -40.88785934448242, "global_step": 229762, "epoch": 1898} {"train_loss": -40.376766204833984, "global_step": 229763, "epoch": 1898} {"train_loss": -40.431087493896484, "global_step": 229764, "epoch": 1898} {"train_loss": -40.06575393676758, "global_step": 229765, "epoch": 1898} {"train_loss": -41.67210006713867, "global_step": 229766, "epoch": 1898} {"train_loss": -39.94758224487305, "global_step": 229767, "epoch": 1898} {"train_loss": -41.046424865722656, "global_step": 229768, "epoch": 1898} {"train_loss": -42.17923355102539, "global_step": 229769, "epoch": 1898} {"train_loss": -40.375057220458984, "global_step": 229770, "epoch": 1898} {"train_loss": -41.88026428222656, "global_step": 229771, "epoch": 1898} {"train_loss": -40.899009704589844, "global_step": 229772, "epoch": 1898} {"train_loss": -41.25004196166992, "global_step": 229773, "epoch": 1898} {"train_loss": -40.63700485229492, "global_step": 229774, "epoch": 1898} {"train_loss": -41.67220687866211, "global_step": 229775, "epoch": 1898} {"train_loss": -40.46109390258789, "global_step": 229776, "epoch": 1898} {"train_loss": -41.65023422241211, "global_step": 229777, "epoch": 1898} {"train_loss": -41.099582230749206, "global_step": 229778, "epoch": 1898, "val_loss": 2822851.25} {"train_loss": -41.959320068359375, "global_step": 229779, "epoch": 1899} {"train_loss": -41.35834884643555, "global_step": 229780, "epoch": 1899} {"train_loss": -42.49668502807617, "global_step": 229781, "epoch": 1899} {"train_loss": -42.07035446166992, "global_step": 229782, "epoch": 1899} {"train_loss": -40.30915451049805, "global_step": 229783, "epoch": 1899} {"train_loss": -40.77971267700195, "global_step": 229784, "epoch": 1899} {"train_loss": -41.089393615722656, "global_step": 229785, "epoch": 1899} {"train_loss": -41.84765625, "global_step": 229786, "epoch": 1899} {"train_loss": -40.313228607177734, "global_step": 229787, "epoch": 1899} {"train_loss": -41.41117858886719, "global_step": 229788, "epoch": 1899} {"train_loss": -41.2443962097168, "global_step": 229789, "epoch": 1899} {"train_loss": -40.38542938232422, "global_step": 229790, "epoch": 1899} {"train_loss": -41.72940444946289, "global_step": 229791, "epoch": 1899} {"train_loss": -38.486488342285156, "global_step": 229792, "epoch": 1899} {"train_loss": -41.126949310302734, "global_step": 229793, "epoch": 1899} {"train_loss": -41.93117904663086, "global_step": 229794, "epoch": 1899} {"train_loss": -41.485755920410156, "global_step": 229795, "epoch": 1899} {"train_loss": -41.26148223876953, "global_step": 229796, "epoch": 1899} {"train_loss": -41.36790466308594, "global_step": 229797, "epoch": 1899} {"train_loss": -41.69863510131836, "global_step": 229798, "epoch": 1899} {"train_loss": -41.43810272216797, "global_step": 229799, "epoch": 1899} {"train_loss": -40.68006134033203, "global_step": 229800, "epoch": 1899} {"train_loss": -39.72200012207031, "global_step": 229801, "epoch": 1899} {"train_loss": -39.060890197753906, "global_step": 229802, "epoch": 1899} {"train_loss": -40.08280563354492, "global_step": 229803, "epoch": 1899} {"train_loss": -40.472965240478516, "global_step": 229804, "epoch": 1899} {"train_loss": -36.71427917480469, "global_step": 229805, "epoch": 1899} {"train_loss": -40.849605560302734, "global_step": 229806, "epoch": 1899} {"train_loss": -40.07028579711914, "global_step": 229807, "epoch": 1899} {"train_loss": -35.7114372253418, "global_step": 229808, "epoch": 1899} {"train_loss": -35.6780891418457, "global_step": 229809, "epoch": 1899} {"train_loss": -39.1139030456543, "global_step": 229810, "epoch": 1899} {"train_loss": -34.94392776489258, "global_step": 229811, "epoch": 1899} {"train_loss": -37.658382415771484, "global_step": 229812, "epoch": 1899} {"train_loss": -37.94258499145508, "global_step": 229813, "epoch": 1899} {"train_loss": -35.39626693725586, "global_step": 229814, "epoch": 1899} {"train_loss": -39.60722732543945, "global_step": 229815, "epoch": 1899} {"train_loss": -39.87150573730469, "global_step": 229816, "epoch": 1899} {"train_loss": -39.44805908203125, "global_step": 229817, "epoch": 1899} {"train_loss": -39.97945785522461, "global_step": 229818, "epoch": 1899} {"train_loss": -38.94971466064453, "global_step": 229819, "epoch": 1899} {"train_loss": -40.82422637939453, "global_step": 229820, "epoch": 1899} {"train_loss": -38.42759323120117, "global_step": 229821, "epoch": 1899} {"train_loss": -41.65603256225586, "global_step": 229822, "epoch": 1899} {"train_loss": -38.543094635009766, "global_step": 229823, "epoch": 1899} {"train_loss": -38.84000778198242, "global_step": 229824, "epoch": 1899} {"train_loss": -39.480342864990234, "global_step": 229825, "epoch": 1899} {"train_loss": -40.58106231689453, "global_step": 229826, "epoch": 1899} {"train_loss": -39.85022735595703, "global_step": 229827, "epoch": 1899} {"train_loss": -39.74922180175781, "global_step": 229828, "epoch": 1899} {"train_loss": -40.36731719970703, "global_step": 229829, "epoch": 1899} {"train_loss": -40.201904296875, "global_step": 229830, "epoch": 1899} {"train_loss": -39.65907287597656, "global_step": 229831, "epoch": 1899} {"train_loss": -41.895259857177734, "global_step": 229832, "epoch": 1899} {"train_loss": -40.516170501708984, "global_step": 229833, "epoch": 1899} {"train_loss": -41.229583740234375, "global_step": 229834, "epoch": 1899} {"train_loss": -40.658878326416016, "global_step": 229835, "epoch": 1899} {"train_loss": -40.765846252441406, "global_step": 229836, "epoch": 1899} {"train_loss": -41.33744430541992, "global_step": 229837, "epoch": 1899} {"train_loss": -41.084716796875, "global_step": 229838, "epoch": 1899} {"train_loss": -40.7536735534668, "global_step": 229839, "epoch": 1899} {"train_loss": -40.74068832397461, "global_step": 229840, "epoch": 1899} {"train_loss": -41.64461135864258, "global_step": 229841, "epoch": 1899} {"train_loss": -40.16590881347656, "global_step": 229842, "epoch": 1899} {"train_loss": -40.815895080566406, "global_step": 229843, "epoch": 1899} {"train_loss": -40.81379699707031, "global_step": 229844, "epoch": 1899} {"train_loss": -41.259517669677734, "global_step": 229845, "epoch": 1899} {"train_loss": -41.49678039550781, "global_step": 229846, "epoch": 1899} {"train_loss": -40.69935607910156, "global_step": 229847, "epoch": 1899} {"train_loss": -41.6588134765625, "global_step": 229848, "epoch": 1899} {"train_loss": -41.77016830444336, "global_step": 229849, "epoch": 1899} {"train_loss": -41.6858024597168, "global_step": 229850, "epoch": 1899} {"train_loss": -42.068519592285156, "global_step": 229851, "epoch": 1899} {"train_loss": -41.261260986328125, "global_step": 229852, "epoch": 1899} {"train_loss": -41.78770065307617, "global_step": 229853, "epoch": 1899} {"train_loss": -41.732147216796875, "global_step": 229854, "epoch": 1899} {"train_loss": -42.12117385864258, "global_step": 229855, "epoch": 1899} {"train_loss": -40.57265853881836, "global_step": 229856, "epoch": 1899} {"train_loss": -42.3673095703125, "global_step": 229857, "epoch": 1899} {"train_loss": -42.25531005859375, "global_step": 229858, "epoch": 1899} {"train_loss": -40.82554244995117, "global_step": 229859, "epoch": 1899} {"train_loss": -42.02412033081055, "global_step": 229860, "epoch": 1899} {"train_loss": -42.293697357177734, "global_step": 229861, "epoch": 1899} {"train_loss": -42.13850021362305, "global_step": 229862, "epoch": 1899} {"train_loss": -42.33624267578125, "global_step": 229863, "epoch": 1899} {"train_loss": -41.39349365234375, "global_step": 229864, "epoch": 1899} {"train_loss": -40.35651779174805, "global_step": 229865, "epoch": 1899} {"train_loss": -42.08639144897461, "global_step": 229866, "epoch": 1899} {"train_loss": -42.3382453918457, "global_step": 229867, "epoch": 1899} {"train_loss": -41.728023529052734, "global_step": 229868, "epoch": 1899} {"train_loss": -42.09099578857422, "global_step": 229869, "epoch": 1899} {"train_loss": -42.070396423339844, "global_step": 229870, "epoch": 1899} {"train_loss": -42.05350875854492, "global_step": 229871, "epoch": 1899} {"train_loss": -41.093292236328125, "global_step": 229872, "epoch": 1899} {"train_loss": -42.066139221191406, "global_step": 229873, "epoch": 1899} {"train_loss": -42.05882263183594, "global_step": 229874, "epoch": 1899} {"train_loss": -42.22983932495117, "global_step": 229875, "epoch": 1899} {"train_loss": -41.858272552490234, "global_step": 229876, "epoch": 1899} {"train_loss": -42.37934112548828, "global_step": 229877, "epoch": 1899} {"train_loss": -40.38656997680664, "global_step": 229878, "epoch": 1899} {"train_loss": -42.13239288330078, "global_step": 229879, "epoch": 1899} {"train_loss": -42.0993766784668, "global_step": 229880, "epoch": 1899} {"train_loss": -42.65800857543945, "global_step": 229881, "epoch": 1899} {"train_loss": -40.85470962524414, "global_step": 229882, "epoch": 1899} {"train_loss": -42.645687103271484, "global_step": 229883, "epoch": 1899} {"train_loss": -42.38033676147461, "global_step": 229884, "epoch": 1899} {"train_loss": -38.90450668334961, "global_step": 229885, "epoch": 1899} {"train_loss": -42.695411682128906, "global_step": 229886, "epoch": 1899} {"train_loss": -42.237979888916016, "global_step": 229887, "epoch": 1899} {"train_loss": -39.76736831665039, "global_step": 229888, "epoch": 1899} {"train_loss": -41.8321533203125, "global_step": 229889, "epoch": 1899} {"train_loss": -39.900875091552734, "global_step": 229890, "epoch": 1899} {"train_loss": -17.21375846862793, "global_step": 229891, "epoch": 1899} {"train_loss": -39.57170486450195, "global_step": 229892, "epoch": 1899} {"train_loss": -41.77324676513672, "global_step": 229893, "epoch": 1899} {"train_loss": -32.654232025146484, "global_step": 229894, "epoch": 1899} {"train_loss": -38.08538055419922, "global_step": 229895, "epoch": 1899} {"train_loss": -28.59095573425293, "global_step": 229896, "epoch": 1899} {"train_loss": -38.45856475830078, "global_step": 229897, "epoch": 1899} {"train_loss": -40.834171295166016, "global_step": 229898, "epoch": 1899} {"train_loss": -40.34307104693956, "global_step": 229899, "epoch": 1899, "val_loss": 3435737.75} {"train_loss": -38.42681884765625, "global_step": 229900, "epoch": 1900} {"train_loss": -39.17720413208008, "global_step": 229901, "epoch": 1900} {"train_loss": -36.8684196472168, "global_step": 229902, "epoch": 1900} {"train_loss": -38.9580078125, "global_step": 229903, "epoch": 1900} {"train_loss": -34.72014236450195, "global_step": 229904, "epoch": 1900} {"train_loss": -39.6875114440918, "global_step": 229905, "epoch": 1900} {"train_loss": -41.078914642333984, "global_step": 229906, "epoch": 1900} {"train_loss": -37.76607894897461, "global_step": 229907, "epoch": 1900} {"train_loss": -37.56258773803711, "global_step": 229908, "epoch": 1900} {"train_loss": -37.061248779296875, "global_step": 229909, "epoch": 1900} {"train_loss": -38.14125442504883, "global_step": 229910, "epoch": 1900} {"train_loss": -38.864967346191406, "global_step": 229911, "epoch": 1900} {"train_loss": -40.644691467285156, "global_step": 229912, "epoch": 1900} {"train_loss": -39.370513916015625, "global_step": 229913, "epoch": 1900} {"train_loss": -40.414512634277344, "global_step": 229914, "epoch": 1900} {"train_loss": -40.836666107177734, "global_step": 229915, "epoch": 1900} {"train_loss": -40.126075744628906, "global_step": 229916, "epoch": 1900} {"train_loss": -39.87250900268555, "global_step": 229917, "epoch": 1900} {"train_loss": -40.64226150512695, "global_step": 229918, "epoch": 1900} {"train_loss": -40.215667724609375, "global_step": 229919, "epoch": 1900} {"train_loss": -36.132476806640625, "global_step": 229920, "epoch": 1900} {"train_loss": -39.669097900390625, "global_step": 229921, "epoch": 1900} {"train_loss": -39.60662841796875, "global_step": 229922, "epoch": 1900} {"train_loss": -39.59054183959961, "global_step": 229923, "epoch": 1900} {"train_loss": -39.50723648071289, "global_step": 229924, "epoch": 1900} {"train_loss": -39.17499923706055, "global_step": 229925, "epoch": 1900} {"train_loss": -39.218055725097656, "global_step": 229926, "epoch": 1900} {"train_loss": -37.927608489990234, "global_step": 229927, "epoch": 1900} {"train_loss": -39.40478515625, "global_step": 229928, "epoch": 1900} {"train_loss": -39.383583068847656, "global_step": 229929, "epoch": 1900} {"train_loss": -39.8291130065918, "global_step": 229930, "epoch": 1900} {"train_loss": -39.41398239135742, "global_step": 229931, "epoch": 1900} {"train_loss": -38.187843322753906, "global_step": 229932, "epoch": 1900} {"train_loss": -40.89704513549805, "global_step": 229933, "epoch": 1900} {"train_loss": -39.13178634643555, "global_step": 229934, "epoch": 1900} {"train_loss": -40.91306686401367, "global_step": 229935, "epoch": 1900} {"train_loss": -40.315948486328125, "global_step": 229936, "epoch": 1900} {"train_loss": -38.727935791015625, "global_step": 229937, "epoch": 1900} {"train_loss": -41.2562141418457, "global_step": 229938, "epoch": 1900} {"train_loss": -41.55195236206055, "global_step": 229939, "epoch": 1900} {"train_loss": -40.94784164428711, "global_step": 229940, "epoch": 1900} {"train_loss": -41.015968322753906, "global_step": 229941, "epoch": 1900} {"train_loss": -41.013343811035156, "global_step": 229942, "epoch": 1900} {"train_loss": -39.93019485473633, "global_step": 229943, "epoch": 1900} {"train_loss": -40.31929397583008, "global_step": 229944, "epoch": 1900} {"train_loss": -39.90774154663086, "global_step": 229945, "epoch": 1900} {"train_loss": -38.63725280761719, "global_step": 229946, "epoch": 1900} {"train_loss": -39.2618522644043, "global_step": 229947, "epoch": 1900} {"train_loss": -41.07141876220703, "global_step": 229948, "epoch": 1900} {"train_loss": -41.736080169677734, "global_step": 229949, "epoch": 1900} {"train_loss": -40.821407318115234, "global_step": 229950, "epoch": 1900} {"train_loss": -41.12496566772461, "global_step": 229951, "epoch": 1900} {"train_loss": -40.822025299072266, "global_step": 229952, "epoch": 1900} {"train_loss": -40.66156768798828, "global_step": 229953, "epoch": 1900} {"train_loss": -41.24459457397461, "global_step": 229954, "epoch": 1900} {"train_loss": -40.75215148925781, "global_step": 229955, "epoch": 1900} {"train_loss": -41.40407180786133, "global_step": 229956, "epoch": 1900} {"train_loss": -41.44511032104492, "global_step": 229957, "epoch": 1900} {"train_loss": -40.62589645385742, "global_step": 229958, "epoch": 1900} {"train_loss": -40.802371978759766, "global_step": 229959, "epoch": 1900} {"train_loss": -39.62002182006836, "global_step": 229960, "epoch": 1900} {"train_loss": -41.53641891479492, "global_step": 229961, "epoch": 1900} {"train_loss": -38.82230758666992, "global_step": 229962, "epoch": 1900} {"train_loss": -40.48917770385742, "global_step": 229963, "epoch": 1900} {"train_loss": -41.70393753051758, "global_step": 229964, "epoch": 1900} {"train_loss": -40.66122055053711, "global_step": 229965, "epoch": 1900} {"train_loss": -39.813472747802734, "global_step": 229966, "epoch": 1900} {"train_loss": -41.24978256225586, "global_step": 229967, "epoch": 1900} {"train_loss": -41.70222854614258, "global_step": 229968, "epoch": 1900} {"train_loss": -41.19721603393555, "global_step": 229969, "epoch": 1900} {"train_loss": -40.120216369628906, "global_step": 229970, "epoch": 1900} {"train_loss": -41.098575592041016, "global_step": 229971, "epoch": 1900} {"train_loss": -41.11885452270508, "global_step": 229972, "epoch": 1900} {"train_loss": -40.417510986328125, "global_step": 229973, "epoch": 1900} {"train_loss": -42.42481231689453, "global_step": 229974, "epoch": 1900} {"train_loss": -40.23586654663086, "global_step": 229975, "epoch": 1900} {"train_loss": -41.69106674194336, "global_step": 229976, "epoch": 1900} {"train_loss": -41.636505126953125, "global_step": 229977, "epoch": 1900} {"train_loss": -41.650390625, "global_step": 229978, "epoch": 1900} {"train_loss": -41.28144454956055, "global_step": 229979, "epoch": 1900} {"train_loss": -41.788795471191406, "global_step": 229980, "epoch": 1900} {"train_loss": -42.33604049682617, "global_step": 229981, "epoch": 1900} {"train_loss": -40.93524169921875, "global_step": 229982, "epoch": 1900} {"train_loss": -40.88838577270508, "global_step": 229983, "epoch": 1900} {"train_loss": -41.1840934753418, "global_step": 229984, "epoch": 1900} {"train_loss": -41.90745162963867, "global_step": 229985, "epoch": 1900} {"train_loss": -41.970314025878906, "global_step": 229986, "epoch": 1900} {"train_loss": -42.171661376953125, "global_step": 229987, "epoch": 1900} {"train_loss": -41.4693489074707, "global_step": 229988, "epoch": 1900} {"train_loss": -42.1415901184082, "global_step": 229989, "epoch": 1900} {"train_loss": -42.37654113769531, "global_step": 229990, "epoch": 1900} {"train_loss": -42.435298919677734, "global_step": 229991, "epoch": 1900} {"train_loss": -41.73468017578125, "global_step": 229992, "epoch": 1900} {"train_loss": -41.67673873901367, "global_step": 229993, "epoch": 1900} {"train_loss": -41.2052001953125, "global_step": 229994, "epoch": 1900} {"train_loss": -40.655235290527344, "global_step": 229995, "epoch": 1900} {"train_loss": -42.10618209838867, "global_step": 229996, "epoch": 1900} {"train_loss": -42.62260055541992, "global_step": 229997, "epoch": 1900} {"train_loss": -42.50807189941406, "global_step": 229998, "epoch": 1900} {"train_loss": -42.26172637939453, "global_step": 229999, "epoch": 1900} {"train_loss": -42.17662048339844, "global_step": 230000, "epoch": 1900} {"train_loss": -42.46010208129883, "global_step": 230001, "epoch": 1900} {"train_loss": -42.20820236206055, "global_step": 230002, "epoch": 1900} {"train_loss": -41.84798812866211, "global_step": 230003, "epoch": 1900} {"train_loss": -41.51686477661133, "global_step": 230004, "epoch": 1900} {"train_loss": -42.206851959228516, "global_step": 230005, "epoch": 1900} {"train_loss": -42.27950668334961, "global_step": 230006, "epoch": 1900} {"train_loss": -41.98281478881836, "global_step": 230007, "epoch": 1900} {"train_loss": -42.657161712646484, "global_step": 230008, "epoch": 1900} {"train_loss": -41.86484909057617, "global_step": 230009, "epoch": 1900} {"train_loss": -42.18001937866211, "global_step": 230010, "epoch": 1900} {"train_loss": -41.4058837890625, "global_step": 230011, "epoch": 1900} {"train_loss": -42.18874740600586, "global_step": 230012, "epoch": 1900} {"train_loss": -41.63946533203125, "global_step": 230013, "epoch": 1900} {"train_loss": -40.901790618896484, "global_step": 230014, "epoch": 1900} {"train_loss": -41.50416946411133, "global_step": 230015, "epoch": 1900} {"train_loss": -41.621337890625, "global_step": 230016, "epoch": 1900} {"train_loss": -41.49372482299805, "global_step": 230017, "epoch": 1900} {"train_loss": -41.7848014831543, "global_step": 230018, "epoch": 1900} {"train_loss": -41.42253494262695, "global_step": 230019, "epoch": 1900} {"train_loss": -40.645103454589844, "global_step": 230020, "epoch": 1900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 2683892.0} {"train_loss": -39.53562545776367, "global_step": 230021, "epoch": 1901} {"train_loss": -40.65778350830078, "global_step": 230022, "epoch": 1901} {"train_loss": -41.08687973022461, "global_step": 230023, "epoch": 1901} {"train_loss": -39.514808654785156, "global_step": 230024, "epoch": 1901} {"train_loss": -40.88422393798828, "global_step": 230025, "epoch": 1901} {"train_loss": -40.183143615722656, "global_step": 230026, "epoch": 1901} {"train_loss": -40.474788665771484, "global_step": 230027, "epoch": 1901} {"train_loss": -42.031856536865234, "global_step": 230028, "epoch": 1901} {"train_loss": -41.114376068115234, "global_step": 230029, "epoch": 1901} {"train_loss": -41.70326232910156, "global_step": 230030, "epoch": 1901} {"train_loss": -41.54127883911133, "global_step": 230031, "epoch": 1901} {"train_loss": -41.06507110595703, "global_step": 230032, "epoch": 1901} {"train_loss": -39.51315689086914, "global_step": 230033, "epoch": 1901} {"train_loss": -41.84381866455078, "global_step": 230034, "epoch": 1901} {"train_loss": -42.23134231567383, "global_step": 230035, "epoch": 1901} {"train_loss": -41.46232223510742, "global_step": 230036, "epoch": 1901} {"train_loss": -41.23486328125, "global_step": 230037, "epoch": 1901} {"train_loss": -41.01826095581055, "global_step": 230038, "epoch": 1901} {"train_loss": -41.798011779785156, "global_step": 230039, "epoch": 1901} {"train_loss": -40.559852600097656, "global_step": 230040, "epoch": 1901} {"train_loss": -41.22929000854492, "global_step": 230041, "epoch": 1901} {"train_loss": -41.708229064941406, "global_step": 230042, "epoch": 1901} {"train_loss": -42.030174255371094, "global_step": 230043, "epoch": 1901} {"train_loss": -41.736244201660156, "global_step": 230044, "epoch": 1901} {"train_loss": -42.46785354614258, "global_step": 230045, "epoch": 1901} {"train_loss": -41.4026985168457, "global_step": 230046, "epoch": 1901} {"train_loss": -40.87221908569336, "global_step": 230047, "epoch": 1901} {"train_loss": -41.3797492980957, "global_step": 230048, "epoch": 1901} {"train_loss": -42.219383239746094, "global_step": 230049, "epoch": 1901} {"train_loss": -41.141170501708984, "global_step": 230050, "epoch": 1901} {"train_loss": -39.18656539916992, "global_step": 230051, "epoch": 1901} {"train_loss": -39.892234802246094, "global_step": 230052, "epoch": 1901} {"train_loss": -40.30323791503906, "global_step": 230053, "epoch": 1901} {"train_loss": -42.200355529785156, "global_step": 230054, "epoch": 1901} {"train_loss": -42.138973236083984, "global_step": 230055, "epoch": 1901} {"train_loss": -41.074928283691406, "global_step": 230056, "epoch": 1901} {"train_loss": -41.831138610839844, "global_step": 230057, "epoch": 1901} {"train_loss": -42.42743682861328, "global_step": 230058, "epoch": 1901} {"train_loss": -42.46288299560547, "global_step": 230059, "epoch": 1901} {"train_loss": -41.01344680786133, "global_step": 230060, "epoch": 1901} {"train_loss": -41.9377555847168, "global_step": 230061, "epoch": 1901} {"train_loss": -42.401363372802734, "global_step": 230062, "epoch": 1901} {"train_loss": -42.77678298950195, "global_step": 230063, "epoch": 1901} {"train_loss": -41.430931091308594, "global_step": 230064, "epoch": 1901} {"train_loss": -42.657630920410156, "global_step": 230065, "epoch": 1901} {"train_loss": -42.00980758666992, "global_step": 230066, "epoch": 1901} {"train_loss": -41.56987762451172, "global_step": 230067, "epoch": 1901} {"train_loss": -41.867713928222656, "global_step": 230068, "epoch": 1901} {"train_loss": -41.612022399902344, "global_step": 230069, "epoch": 1901} {"train_loss": -40.674434661865234, "global_step": 230070, "epoch": 1901} {"train_loss": -39.83589553833008, "global_step": 230071, "epoch": 1901} {"train_loss": -39.87915802001953, "global_step": 230072, "epoch": 1901} {"train_loss": -40.354244232177734, "global_step": 230073, "epoch": 1901} {"train_loss": -41.831146240234375, "global_step": 230074, "epoch": 1901} {"train_loss": -40.5537109375, "global_step": 230075, "epoch": 1901} {"train_loss": -40.848114013671875, "global_step": 230076, "epoch": 1901} {"train_loss": -42.26933288574219, "global_step": 230077, "epoch": 1901} {"train_loss": -41.357269287109375, "global_step": 230078, "epoch": 1901} {"train_loss": -41.81428527832031, "global_step": 230079, "epoch": 1901} {"train_loss": -41.35299301147461, "global_step": 230080, "epoch": 1901} {"train_loss": -39.58210372924805, "global_step": 230081, "epoch": 1901} {"train_loss": -37.952205657958984, "global_step": 230082, "epoch": 1901} {"train_loss": -38.952003479003906, "global_step": 230083, "epoch": 1901} {"train_loss": -41.37722396850586, "global_step": 230084, "epoch": 1901} {"train_loss": -39.890716552734375, "global_step": 230085, "epoch": 1901} {"train_loss": -41.25470733642578, "global_step": 230086, "epoch": 1901} {"train_loss": -41.099552154541016, "global_step": 230087, "epoch": 1901} {"train_loss": -41.394004821777344, "global_step": 230088, "epoch": 1901} {"train_loss": -41.09649658203125, "global_step": 230089, "epoch": 1901} {"train_loss": -40.05328369140625, "global_step": 230090, "epoch": 1901} {"train_loss": -40.47734832763672, "global_step": 230091, "epoch": 1901} {"train_loss": -41.72367858886719, "global_step": 230092, "epoch": 1901} {"train_loss": -41.8148078918457, "global_step": 230093, "epoch": 1901} {"train_loss": -42.061702728271484, "global_step": 230094, "epoch": 1901} {"train_loss": -41.695899963378906, "global_step": 230095, "epoch": 1901} {"train_loss": -42.10502624511719, "global_step": 230096, "epoch": 1901} {"train_loss": -42.31544876098633, "global_step": 230097, "epoch": 1901} {"train_loss": -40.91167068481445, "global_step": 230098, "epoch": 1901} {"train_loss": -40.65234375, "global_step": 230099, "epoch": 1901} {"train_loss": -41.790428161621094, "global_step": 230100, "epoch": 1901} {"train_loss": -41.802494049072266, "global_step": 230101, "epoch": 1901} {"train_loss": -42.10429382324219, "global_step": 230102, "epoch": 1901} {"train_loss": -40.72684860229492, "global_step": 230103, "epoch": 1901} {"train_loss": -42.27696990966797, "global_step": 230104, "epoch": 1901} {"train_loss": -42.03733444213867, "global_step": 230105, "epoch": 1901} {"train_loss": -41.89003372192383, "global_step": 230106, "epoch": 1901} {"train_loss": -40.63882064819336, "global_step": 230107, "epoch": 1901} {"train_loss": -39.74881362915039, "global_step": 230108, "epoch": 1901} {"train_loss": -38.83496856689453, "global_step": 230109, "epoch": 1901} {"train_loss": -40.73129653930664, "global_step": 230110, "epoch": 1901} {"train_loss": -40.90635681152344, "global_step": 230111, "epoch": 1901} {"train_loss": -41.29652786254883, "global_step": 230112, "epoch": 1901} {"train_loss": -39.77212142944336, "global_step": 230113, "epoch": 1901} {"train_loss": -39.50741958618164, "global_step": 230114, "epoch": 1901} {"train_loss": -39.06997299194336, "global_step": 230115, "epoch": 1901} {"train_loss": -39.99208450317383, "global_step": 230116, "epoch": 1901} {"train_loss": -40.80625534057617, "global_step": 230117, "epoch": 1901} {"train_loss": -40.53127670288086, "global_step": 230118, "epoch": 1901} {"train_loss": -41.742156982421875, "global_step": 230119, "epoch": 1901} {"train_loss": -40.20632553100586, "global_step": 230120, "epoch": 1901} {"train_loss": -40.54497146606445, "global_step": 230121, "epoch": 1901} {"train_loss": -41.1612663269043, "global_step": 230122, "epoch": 1901} {"train_loss": -40.701534271240234, "global_step": 230123, "epoch": 1901} {"train_loss": -41.64409637451172, "global_step": 230124, "epoch": 1901} {"train_loss": -41.10912322998047, "global_step": 230125, "epoch": 1901} {"train_loss": -40.15812301635742, "global_step": 230126, "epoch": 1901} {"train_loss": -40.49312973022461, "global_step": 230127, "epoch": 1901} {"train_loss": -40.230873107910156, "global_step": 230128, "epoch": 1901} {"train_loss": -40.56281280517578, "global_step": 230129, "epoch": 1901} {"train_loss": -41.48830032348633, "global_step": 230130, "epoch": 1901} {"train_loss": -40.73566818237305, "global_step": 230131, "epoch": 1901} {"train_loss": -41.138877868652344, "global_step": 230132, "epoch": 1901} {"train_loss": -39.6297492980957, "global_step": 230133, "epoch": 1901} {"train_loss": -41.237728118896484, "global_step": 230134, "epoch": 1901} {"train_loss": -40.07029342651367, "global_step": 230135, "epoch": 1901} {"train_loss": -41.704132080078125, "global_step": 230136, "epoch": 1901} {"train_loss": -40.97916793823242, "global_step": 230137, "epoch": 1901} {"train_loss": -39.317440032958984, "global_step": 230138, "epoch": 1901} {"train_loss": -41.92329788208008, "global_step": 230139, "epoch": 1901} {"train_loss": -39.688838958740234, "global_step": 230140, "epoch": 1901} {"train_loss": -41.03613612277449, "global_step": 230141, "epoch": 1901, "val_loss": 2674765.25} {"train_loss": -41.07107162475586, "global_step": 230142, "epoch": 1902} {"train_loss": -40.58586883544922, "global_step": 230143, "epoch": 1902} {"train_loss": -41.321346282958984, "global_step": 230144, "epoch": 1902} {"train_loss": -40.47336196899414, "global_step": 230145, "epoch": 1902} {"train_loss": -42.19042205810547, "global_step": 230146, "epoch": 1902} {"train_loss": -39.500267028808594, "global_step": 230147, "epoch": 1902} {"train_loss": -39.75413131713867, "global_step": 230148, "epoch": 1902} {"train_loss": -41.89376449584961, "global_step": 230149, "epoch": 1902} {"train_loss": -39.00625228881836, "global_step": 230150, "epoch": 1902} {"train_loss": -41.40068054199219, "global_step": 230151, "epoch": 1902} {"train_loss": -40.041133880615234, "global_step": 230152, "epoch": 1902} {"train_loss": -40.30862045288086, "global_step": 230153, "epoch": 1902} {"train_loss": -40.10494613647461, "global_step": 230154, "epoch": 1902} {"train_loss": -38.80558395385742, "global_step": 230155, "epoch": 1902} {"train_loss": -39.87412643432617, "global_step": 230156, "epoch": 1902} {"train_loss": -41.0462532043457, "global_step": 230157, "epoch": 1902} {"train_loss": -40.02252197265625, "global_step": 230158, "epoch": 1902} {"train_loss": -42.19441604614258, "global_step": 230159, "epoch": 1902} {"train_loss": -41.087860107421875, "global_step": 230160, "epoch": 1902} {"train_loss": -41.30906295776367, "global_step": 230161, "epoch": 1902} {"train_loss": -41.046775817871094, "global_step": 230162, "epoch": 1902} {"train_loss": -41.79743576049805, "global_step": 230163, "epoch": 1902} {"train_loss": -41.6057243347168, "global_step": 230164, "epoch": 1902} {"train_loss": -42.389137268066406, "global_step": 230165, "epoch": 1902} {"train_loss": -41.69569778442383, "global_step": 230166, "epoch": 1902} {"train_loss": -41.93315505981445, "global_step": 230167, "epoch": 1902} {"train_loss": -41.501068115234375, "global_step": 230168, "epoch": 1902} {"train_loss": -41.953853607177734, "global_step": 230169, "epoch": 1902} {"train_loss": -41.788734436035156, "global_step": 230170, "epoch": 1902} {"train_loss": -42.444313049316406, "global_step": 230171, "epoch": 1902} {"train_loss": -41.928009033203125, "global_step": 230172, "epoch": 1902} {"train_loss": -41.22888946533203, "global_step": 230173, "epoch": 1902} {"train_loss": -41.78457260131836, "global_step": 230174, "epoch": 1902} {"train_loss": -42.55497360229492, "global_step": 230175, "epoch": 1902} {"train_loss": -41.94140625, "global_step": 230176, "epoch": 1902} {"train_loss": -42.08089828491211, "global_step": 230177, "epoch": 1902} {"train_loss": -42.066497802734375, "global_step": 230178, "epoch": 1902} {"train_loss": -41.93901824951172, "global_step": 230179, "epoch": 1902} {"train_loss": -41.948646545410156, "global_step": 230180, "epoch": 1902} {"train_loss": -42.24562454223633, "global_step": 230181, "epoch": 1902} {"train_loss": -41.89618682861328, "global_step": 230182, "epoch": 1902} {"train_loss": -42.396541595458984, "global_step": 230183, "epoch": 1902} {"train_loss": -42.66215133666992, "global_step": 230184, "epoch": 1902} {"train_loss": -42.074676513671875, "global_step": 230185, "epoch": 1902} {"train_loss": -42.44171905517578, "global_step": 230186, "epoch": 1902} {"train_loss": -41.59163284301758, "global_step": 230187, "epoch": 1902} {"train_loss": -42.16632080078125, "global_step": 230188, "epoch": 1902} {"train_loss": -41.739498138427734, "global_step": 230189, "epoch": 1902} {"train_loss": -42.806331634521484, "global_step": 230190, "epoch": 1902} {"train_loss": -42.29556655883789, "global_step": 230191, "epoch": 1902} {"train_loss": -41.8979606628418, "global_step": 230192, "epoch": 1902} {"train_loss": -41.3805046081543, "global_step": 230193, "epoch": 1902} {"train_loss": -42.629112243652344, "global_step": 230194, "epoch": 1902} {"train_loss": -42.673030853271484, "global_step": 230195, "epoch": 1902} {"train_loss": -42.6973876953125, "global_step": 230196, "epoch": 1902} {"train_loss": -42.67654037475586, "global_step": 230197, "epoch": 1902} {"train_loss": -43.10836410522461, "global_step": 230198, "epoch": 1902} {"train_loss": -42.708717346191406, "global_step": 230199, "epoch": 1902} {"train_loss": -42.32209014892578, "global_step": 230200, "epoch": 1902} {"train_loss": -41.22785186767578, "global_step": 230201, "epoch": 1902} {"train_loss": -38.73836898803711, "global_step": 230202, "epoch": 1902} {"train_loss": -42.20576477050781, "global_step": 230203, "epoch": 1902} {"train_loss": -42.68877029418945, "global_step": 230204, "epoch": 1902} {"train_loss": -42.36222457885742, "global_step": 230205, "epoch": 1902} {"train_loss": -39.77141571044922, "global_step": 230206, "epoch": 1902} {"train_loss": -40.9410514831543, "global_step": 230207, "epoch": 1902} {"train_loss": -42.558631896972656, "global_step": 230208, "epoch": 1902} {"train_loss": -42.73994064331055, "global_step": 230209, "epoch": 1902} {"train_loss": -42.70166015625, "global_step": 230210, "epoch": 1902} {"train_loss": -42.259361267089844, "global_step": 230211, "epoch": 1902} {"train_loss": -42.9942512512207, "global_step": 230212, "epoch": 1902} {"train_loss": -41.716285705566406, "global_step": 230213, "epoch": 1902} {"train_loss": -42.56538772583008, "global_step": 230214, "epoch": 1902} {"train_loss": -42.74078369140625, "global_step": 230215, "epoch": 1902} {"train_loss": -42.81111145019531, "global_step": 230216, "epoch": 1902} {"train_loss": -42.70553207397461, "global_step": 230217, "epoch": 1902} {"train_loss": -40.83518600463867, "global_step": 230218, "epoch": 1902} {"train_loss": -42.2330436706543, "global_step": 230219, "epoch": 1902} {"train_loss": -42.06385040283203, "global_step": 230220, "epoch": 1902} {"train_loss": -42.341365814208984, "global_step": 230221, "epoch": 1902} {"train_loss": -40.14441680908203, "global_step": 230222, "epoch": 1902} {"train_loss": -38.162200927734375, "global_step": 230223, "epoch": 1902} {"train_loss": -42.804256439208984, "global_step": 230224, "epoch": 1902} {"train_loss": -41.1141471862793, "global_step": 230225, "epoch": 1902} {"train_loss": -40.800907135009766, "global_step": 230226, "epoch": 1902} {"train_loss": -42.845458984375, "global_step": 230227, "epoch": 1902} {"train_loss": -42.403446197509766, "global_step": 230228, "epoch": 1902} {"train_loss": -42.22544860839844, "global_step": 230229, "epoch": 1902} {"train_loss": -42.581825256347656, "global_step": 230230, "epoch": 1902} {"train_loss": -41.520652770996094, "global_step": 230231, "epoch": 1902} {"train_loss": -41.79752731323242, "global_step": 230232, "epoch": 1902} {"train_loss": -41.96042251586914, "global_step": 230233, "epoch": 1902} {"train_loss": -38.77653121948242, "global_step": 230234, "epoch": 1902} {"train_loss": -41.460853576660156, "global_step": 230235, "epoch": 1902} {"train_loss": -40.86695098876953, "global_step": 230236, "epoch": 1902} {"train_loss": -39.1758918762207, "global_step": 230237, "epoch": 1902} {"train_loss": -40.23368453979492, "global_step": 230238, "epoch": 1902} {"train_loss": -41.24434280395508, "global_step": 230239, "epoch": 1902} {"train_loss": -40.54104232788086, "global_step": 230240, "epoch": 1902} {"train_loss": -40.99727249145508, "global_step": 230241, "epoch": 1902} {"train_loss": -40.363014221191406, "global_step": 230242, "epoch": 1902} {"train_loss": -42.05180740356445, "global_step": 230243, "epoch": 1902} {"train_loss": -40.82501220703125, "global_step": 230244, "epoch": 1902} {"train_loss": -41.75959777832031, "global_step": 230245, "epoch": 1902} {"train_loss": -41.60549545288086, "global_step": 230246, "epoch": 1902} {"train_loss": -40.3408203125, "global_step": 230247, "epoch": 1902} {"train_loss": -39.886287689208984, "global_step": 230248, "epoch": 1902} {"train_loss": -40.89630126953125, "global_step": 230249, "epoch": 1902} {"train_loss": -37.994686126708984, "global_step": 230250, "epoch": 1902} {"train_loss": -38.60547637939453, "global_step": 230251, "epoch": 1902} {"train_loss": -39.688812255859375, "global_step": 230252, "epoch": 1902} {"train_loss": -39.70469284057617, "global_step": 230253, "epoch": 1902} {"train_loss": -39.38323974609375, "global_step": 230254, "epoch": 1902} {"train_loss": -41.286964416503906, "global_step": 230255, "epoch": 1902} {"train_loss": -40.804908752441406, "global_step": 230256, "epoch": 1902} {"train_loss": -41.77315902709961, "global_step": 230257, "epoch": 1902} {"train_loss": -40.969844818115234, "global_step": 230258, "epoch": 1902} {"train_loss": -41.255531311035156, "global_step": 230259, "epoch": 1902} {"train_loss": -41.61836624145508, "global_step": 230260, "epoch": 1902} {"train_loss": -41.2767333984375, "global_step": 230261, "epoch": 1902} {"train_loss": -41.414928152541485, "global_step": 230262, "epoch": 1902, "val_loss": 2601530.5} {"train_loss": -41.92119598388672, "global_step": 230263, "epoch": 1903} {"train_loss": -41.56483840942383, "global_step": 230264, "epoch": 1903} {"train_loss": -41.98472213745117, "global_step": 230265, "epoch": 1903} {"train_loss": -41.02988815307617, "global_step": 230266, "epoch": 1903} {"train_loss": -42.35575866699219, "global_step": 230267, "epoch": 1903} {"train_loss": -40.65901565551758, "global_step": 230268, "epoch": 1903} {"train_loss": -41.2994384765625, "global_step": 230269, "epoch": 1903} {"train_loss": -41.88424301147461, "global_step": 230270, "epoch": 1903} {"train_loss": -38.93988800048828, "global_step": 230271, "epoch": 1903} {"train_loss": -41.65065002441406, "global_step": 230272, "epoch": 1903} {"train_loss": -42.08212661743164, "global_step": 230273, "epoch": 1903} {"train_loss": -42.49909210205078, "global_step": 230274, "epoch": 1903} {"train_loss": -41.919620513916016, "global_step": 230275, "epoch": 1903} {"train_loss": -39.79571533203125, "global_step": 230276, "epoch": 1903} {"train_loss": -41.956398010253906, "global_step": 230277, "epoch": 1903} {"train_loss": -42.178707122802734, "global_step": 230278, "epoch": 1903} {"train_loss": -42.53200912475586, "global_step": 230279, "epoch": 1903} {"train_loss": -42.181671142578125, "global_step": 230280, "epoch": 1903} {"train_loss": -42.48369598388672, "global_step": 230281, "epoch": 1903} {"train_loss": -36.35368347167969, "global_step": 230282, "epoch": 1903} {"train_loss": -41.11185836791992, "global_step": 230283, "epoch": 1903} {"train_loss": -41.25416946411133, "global_step": 230284, "epoch": 1903} {"train_loss": -38.04768371582031, "global_step": 230285, "epoch": 1903} {"train_loss": -41.55762481689453, "global_step": 230286, "epoch": 1903} {"train_loss": -41.47126007080078, "global_step": 230287, "epoch": 1903} {"train_loss": -39.97333908081055, "global_step": 230288, "epoch": 1903} {"train_loss": -42.100704193115234, "global_step": 230289, "epoch": 1903} {"train_loss": -41.71137237548828, "global_step": 230290, "epoch": 1903} {"train_loss": -41.6147575378418, "global_step": 230291, "epoch": 1903} {"train_loss": -42.32707595825195, "global_step": 230292, "epoch": 1903} {"train_loss": -41.71512985229492, "global_step": 230293, "epoch": 1903} {"train_loss": -41.11098098754883, "global_step": 230294, "epoch": 1903} {"train_loss": -42.10907745361328, "global_step": 230295, "epoch": 1903} {"train_loss": -40.24402618408203, "global_step": 230296, "epoch": 1903} {"train_loss": -42.74318313598633, "global_step": 230297, "epoch": 1903} {"train_loss": -41.5060920715332, "global_step": 230298, "epoch": 1903} {"train_loss": -41.26852035522461, "global_step": 230299, "epoch": 1903} {"train_loss": -41.699642181396484, "global_step": 230300, "epoch": 1903} {"train_loss": -41.87395095825195, "global_step": 230301, "epoch": 1903} {"train_loss": -41.980220794677734, "global_step": 230302, "epoch": 1903} {"train_loss": -41.59552001953125, "global_step": 230303, "epoch": 1903} {"train_loss": -41.79436111450195, "global_step": 230304, "epoch": 1903} {"train_loss": -42.17130661010742, "global_step": 230305, "epoch": 1903} {"train_loss": -39.3735466003418, "global_step": 230306, "epoch": 1903} {"train_loss": -42.00669479370117, "global_step": 230307, "epoch": 1903} {"train_loss": -42.604122161865234, "global_step": 230308, "epoch": 1903} {"train_loss": -42.71696853637695, "global_step": 230309, "epoch": 1903} {"train_loss": -42.332366943359375, "global_step": 230310, "epoch": 1903} {"train_loss": -41.156951904296875, "global_step": 230311, "epoch": 1903} {"train_loss": -41.506446838378906, "global_step": 230312, "epoch": 1903} {"train_loss": -42.23102569580078, "global_step": 230313, "epoch": 1903} {"train_loss": -42.49711990356445, "global_step": 230314, "epoch": 1903} {"train_loss": -41.053707122802734, "global_step": 230315, "epoch": 1903} {"train_loss": -40.86240768432617, "global_step": 230316, "epoch": 1903} {"train_loss": -39.40447998046875, "global_step": 230317, "epoch": 1903} {"train_loss": -41.777584075927734, "global_step": 230318, "epoch": 1903} {"train_loss": -42.19269943237305, "global_step": 230319, "epoch": 1903} {"train_loss": -42.44721603393555, "global_step": 230320, "epoch": 1903} {"train_loss": -42.43879318237305, "global_step": 230321, "epoch": 1903} {"train_loss": -40.42008972167969, "global_step": 230322, "epoch": 1903} {"train_loss": -41.13764572143555, "global_step": 230323, "epoch": 1903} {"train_loss": -41.86600112915039, "global_step": 230324, "epoch": 1903} {"train_loss": -41.58817672729492, "global_step": 230325, "epoch": 1903} {"train_loss": -42.5704345703125, "global_step": 230326, "epoch": 1903} {"train_loss": -39.131961822509766, "global_step": 230327, "epoch": 1903} {"train_loss": -39.37587356567383, "global_step": 230328, "epoch": 1903} {"train_loss": -39.04369354248047, "global_step": 230329, "epoch": 1903} {"train_loss": -40.22858810424805, "global_step": 230330, "epoch": 1903} {"train_loss": -40.64839553833008, "global_step": 230331, "epoch": 1903} {"train_loss": -38.19984817504883, "global_step": 230332, "epoch": 1903} {"train_loss": -35.8304443359375, "global_step": 230333, "epoch": 1903} {"train_loss": -33.81853103637695, "global_step": 230334, "epoch": 1903} {"train_loss": -40.300140380859375, "global_step": 230335, "epoch": 1903} {"train_loss": -39.21870803833008, "global_step": 230336, "epoch": 1903} {"train_loss": -37.11991500854492, "global_step": 230337, "epoch": 1903} {"train_loss": -41.475955963134766, "global_step": 230338, "epoch": 1903} {"train_loss": -37.732330322265625, "global_step": 230339, "epoch": 1903} {"train_loss": -39.1175537109375, "global_step": 230340, "epoch": 1903} {"train_loss": -40.266536712646484, "global_step": 230341, "epoch": 1903} {"train_loss": -38.125328063964844, "global_step": 230342, "epoch": 1903} {"train_loss": -40.15525436401367, "global_step": 230343, "epoch": 1903} {"train_loss": -38.783363342285156, "global_step": 230344, "epoch": 1903} {"train_loss": -41.6448974609375, "global_step": 230345, "epoch": 1903} {"train_loss": -38.454952239990234, "global_step": 230346, "epoch": 1903} {"train_loss": -40.640472412109375, "global_step": 230347, "epoch": 1903} {"train_loss": -39.31293487548828, "global_step": 230348, "epoch": 1903} {"train_loss": -41.22319030761719, "global_step": 230349, "epoch": 1903} {"train_loss": -39.662498474121094, "global_step": 230350, "epoch": 1903} {"train_loss": -42.00788497924805, "global_step": 230351, "epoch": 1903} {"train_loss": -40.664154052734375, "global_step": 230352, "epoch": 1903} {"train_loss": -41.92920684814453, "global_step": 230353, "epoch": 1903} {"train_loss": -40.5886116027832, "global_step": 230354, "epoch": 1903} {"train_loss": -41.088802337646484, "global_step": 230355, "epoch": 1903} {"train_loss": -40.45078659057617, "global_step": 230356, "epoch": 1903} {"train_loss": -41.68086242675781, "global_step": 230357, "epoch": 1903} {"train_loss": -39.31407165527344, "global_step": 230358, "epoch": 1903} {"train_loss": -40.715576171875, "global_step": 230359, "epoch": 1903} {"train_loss": -40.9296875, "global_step": 230360, "epoch": 1903} {"train_loss": -41.9654655456543, "global_step": 230361, "epoch": 1903} {"train_loss": -41.33210372924805, "global_step": 230362, "epoch": 1903} {"train_loss": -41.357818603515625, "global_step": 230363, "epoch": 1903} {"train_loss": -41.26164627075195, "global_step": 230364, "epoch": 1903} {"train_loss": -42.007423400878906, "global_step": 230365, "epoch": 1903} {"train_loss": -41.769771575927734, "global_step": 230366, "epoch": 1903} {"train_loss": -41.86838912963867, "global_step": 230367, "epoch": 1903} {"train_loss": -41.8403205871582, "global_step": 230368, "epoch": 1903} {"train_loss": -41.89620590209961, "global_step": 230369, "epoch": 1903} {"train_loss": -42.33710479736328, "global_step": 230370, "epoch": 1903} {"train_loss": -42.48739242553711, "global_step": 230371, "epoch": 1903} {"train_loss": -41.82887649536133, "global_step": 230372, "epoch": 1903} {"train_loss": -42.06270217895508, "global_step": 230373, "epoch": 1903} {"train_loss": -40.970550537109375, "global_step": 230374, "epoch": 1903} {"train_loss": -42.219390869140625, "global_step": 230375, "epoch": 1903} {"train_loss": -42.437774658203125, "global_step": 230376, "epoch": 1903} {"train_loss": -42.108314514160156, "global_step": 230377, "epoch": 1903} {"train_loss": -41.88618087768555, "global_step": 230378, "epoch": 1903} {"train_loss": -41.79435348510742, "global_step": 230379, "epoch": 1903} {"train_loss": -41.71826934814453, "global_step": 230380, "epoch": 1903} {"train_loss": -40.119964599609375, "global_step": 230381, "epoch": 1903} {"train_loss": -42.50263214111328, "global_step": 230382, "epoch": 1903} {"train_loss": -41.03270749809328, "global_step": 230383, "epoch": 1903, "val_loss": 3690638.0} {"train_loss": -40.87651824951172, "global_step": 230384, "epoch": 1904} {"train_loss": -40.35317611694336, "global_step": 230385, "epoch": 1904} {"train_loss": -40.74583053588867, "global_step": 230386, "epoch": 1904} {"train_loss": -38.08183288574219, "global_step": 230387, "epoch": 1904} {"train_loss": -42.10770797729492, "global_step": 230388, "epoch": 1904} {"train_loss": -42.185821533203125, "global_step": 230389, "epoch": 1904} {"train_loss": -41.25566482543945, "global_step": 230390, "epoch": 1904} {"train_loss": -40.0348014831543, "global_step": 230391, "epoch": 1904} {"train_loss": -35.75413131713867, "global_step": 230392, "epoch": 1904} {"train_loss": -42.039215087890625, "global_step": 230393, "epoch": 1904} {"train_loss": -41.47701644897461, "global_step": 230394, "epoch": 1904} {"train_loss": -42.49745559692383, "global_step": 230395, "epoch": 1904} {"train_loss": -41.599185943603516, "global_step": 230396, "epoch": 1904} {"train_loss": -41.990840911865234, "global_step": 230397, "epoch": 1904} {"train_loss": -42.31373977661133, "global_step": 230398, "epoch": 1904} {"train_loss": -39.777496337890625, "global_step": 230399, "epoch": 1904} {"train_loss": -36.78581619262695, "global_step": 230400, "epoch": 1904} {"train_loss": -38.7377815246582, "global_step": 230401, "epoch": 1904} {"train_loss": -41.92641067504883, "global_step": 230402, "epoch": 1904} {"train_loss": -40.791316986083984, "global_step": 230403, "epoch": 1904} {"train_loss": -37.64033889770508, "global_step": 230404, "epoch": 1904} {"train_loss": -41.98539352416992, "global_step": 230405, "epoch": 1904} {"train_loss": -40.52913284301758, "global_step": 230406, "epoch": 1904} {"train_loss": -40.482059478759766, "global_step": 230407, "epoch": 1904} {"train_loss": -37.06251525878906, "global_step": 230408, "epoch": 1904} {"train_loss": -39.11274337768555, "global_step": 230409, "epoch": 1904} {"train_loss": -41.157691955566406, "global_step": 230410, "epoch": 1904} {"train_loss": -40.5181884765625, "global_step": 230411, "epoch": 1904} {"train_loss": -40.10718536376953, "global_step": 230412, "epoch": 1904} {"train_loss": -40.732845306396484, "global_step": 230413, "epoch": 1904} {"train_loss": -38.00238037109375, "global_step": 230414, "epoch": 1904} {"train_loss": -39.87612533569336, "global_step": 230415, "epoch": 1904} {"train_loss": -41.872798919677734, "global_step": 230416, "epoch": 1904} {"train_loss": -40.890838623046875, "global_step": 230417, "epoch": 1904} {"train_loss": -40.68525314331055, "global_step": 230418, "epoch": 1904} {"train_loss": -41.91379165649414, "global_step": 230419, "epoch": 1904} {"train_loss": -40.25838851928711, "global_step": 230420, "epoch": 1904} {"train_loss": -39.87868881225586, "global_step": 230421, "epoch": 1904} {"train_loss": -37.74467849731445, "global_step": 230422, "epoch": 1904} {"train_loss": -38.96366500854492, "global_step": 230423, "epoch": 1904} {"train_loss": -37.4798698425293, "global_step": 230424, "epoch": 1904} {"train_loss": -39.32741928100586, "global_step": 230425, "epoch": 1904} {"train_loss": -40.488441467285156, "global_step": 230426, "epoch": 1904} {"train_loss": -35.25002670288086, "global_step": 230427, "epoch": 1904} {"train_loss": -37.989532470703125, "global_step": 230428, "epoch": 1904} {"train_loss": -40.344215393066406, "global_step": 230429, "epoch": 1904} {"train_loss": -40.9688606262207, "global_step": 230430, "epoch": 1904} {"train_loss": -41.48087692260742, "global_step": 230431, "epoch": 1904} {"train_loss": -41.702144622802734, "global_step": 230432, "epoch": 1904} {"train_loss": -41.692012786865234, "global_step": 230433, "epoch": 1904} {"train_loss": -40.47893524169922, "global_step": 230434, "epoch": 1904} {"train_loss": -40.72758102416992, "global_step": 230435, "epoch": 1904} {"train_loss": -38.45792770385742, "global_step": 230436, "epoch": 1904} {"train_loss": -40.361454010009766, "global_step": 230437, "epoch": 1904} {"train_loss": -37.72172546386719, "global_step": 230438, "epoch": 1904} {"train_loss": -41.64030075073242, "global_step": 230439, "epoch": 1904} {"train_loss": -40.15592956542969, "global_step": 230440, "epoch": 1904} {"train_loss": -40.693885803222656, "global_step": 230441, "epoch": 1904} {"train_loss": -40.14208984375, "global_step": 230442, "epoch": 1904} {"train_loss": -39.763275146484375, "global_step": 230443, "epoch": 1904} {"train_loss": -41.64576721191406, "global_step": 230444, "epoch": 1904} {"train_loss": -38.99821090698242, "global_step": 230445, "epoch": 1904} {"train_loss": -39.88338851928711, "global_step": 230446, "epoch": 1904} {"train_loss": -40.05161666870117, "global_step": 230447, "epoch": 1904} {"train_loss": -41.70650863647461, "global_step": 230448, "epoch": 1904} {"train_loss": -41.638092041015625, "global_step": 230449, "epoch": 1904} {"train_loss": -41.47896194458008, "global_step": 230450, "epoch": 1904} {"train_loss": -41.3846549987793, "global_step": 230451, "epoch": 1904} {"train_loss": -40.52460861206055, "global_step": 230452, "epoch": 1904} {"train_loss": -39.88962936401367, "global_step": 230453, "epoch": 1904} {"train_loss": -40.3328971862793, "global_step": 230454, "epoch": 1904} {"train_loss": -37.65712356567383, "global_step": 230455, "epoch": 1904} {"train_loss": -42.00740051269531, "global_step": 230456, "epoch": 1904} {"train_loss": -39.720333099365234, "global_step": 230457, "epoch": 1904} {"train_loss": -41.90848922729492, "global_step": 230458, "epoch": 1904} {"train_loss": -42.093605041503906, "global_step": 230459, "epoch": 1904} {"train_loss": -41.33683395385742, "global_step": 230460, "epoch": 1904} {"train_loss": -40.22713088989258, "global_step": 230461, "epoch": 1904} {"train_loss": -41.79461669921875, "global_step": 230462, "epoch": 1904} {"train_loss": -41.876216888427734, "global_step": 230463, "epoch": 1904} {"train_loss": -41.564781188964844, "global_step": 230464, "epoch": 1904} {"train_loss": -40.36586380004883, "global_step": 230465, "epoch": 1904} {"train_loss": -41.707637786865234, "global_step": 230466, "epoch": 1904} {"train_loss": -42.353092193603516, "global_step": 230467, "epoch": 1904} {"train_loss": -41.900089263916016, "global_step": 230468, "epoch": 1904} {"train_loss": -41.640968322753906, "global_step": 230469, "epoch": 1904} {"train_loss": -41.61470413208008, "global_step": 230470, "epoch": 1904} {"train_loss": -41.29170608520508, "global_step": 230471, "epoch": 1904} {"train_loss": -42.08401107788086, "global_step": 230472, "epoch": 1904} {"train_loss": -40.732032775878906, "global_step": 230473, "epoch": 1904} {"train_loss": -40.913570404052734, "global_step": 230474, "epoch": 1904} {"train_loss": -40.452850341796875, "global_step": 230475, "epoch": 1904} {"train_loss": -41.650718688964844, "global_step": 230476, "epoch": 1904} {"train_loss": -41.82883834838867, "global_step": 230477, "epoch": 1904} {"train_loss": -40.7032585144043, "global_step": 230478, "epoch": 1904} {"train_loss": -41.94926834106445, "global_step": 230479, "epoch": 1904} {"train_loss": -41.530975341796875, "global_step": 230480, "epoch": 1904} {"train_loss": -41.13059997558594, "global_step": 230481, "epoch": 1904} {"train_loss": -41.29185104370117, "global_step": 230482, "epoch": 1904} {"train_loss": -41.344154357910156, "global_step": 230483, "epoch": 1904} {"train_loss": -40.12352752685547, "global_step": 230484, "epoch": 1904} {"train_loss": -42.11310577392578, "global_step": 230485, "epoch": 1904} {"train_loss": -41.46173858642578, "global_step": 230486, "epoch": 1904} {"train_loss": -41.428096771240234, "global_step": 230487, "epoch": 1904} {"train_loss": -41.754024505615234, "global_step": 230488, "epoch": 1904} {"train_loss": -42.0518684387207, "global_step": 230489, "epoch": 1904} {"train_loss": -41.3013916015625, "global_step": 230490, "epoch": 1904} {"train_loss": -41.95200729370117, "global_step": 230491, "epoch": 1904} {"train_loss": -41.95392990112305, "global_step": 230492, "epoch": 1904} {"train_loss": -41.70371627807617, "global_step": 230493, "epoch": 1904} {"train_loss": -41.77936553955078, "global_step": 230494, "epoch": 1904} {"train_loss": -42.0587272644043, "global_step": 230495, "epoch": 1904} {"train_loss": -42.689029693603516, "global_step": 230496, "epoch": 1904} {"train_loss": -41.56336212158203, "global_step": 230497, "epoch": 1904} {"train_loss": -42.14793014526367, "global_step": 230498, "epoch": 1904} {"train_loss": -40.962337493896484, "global_step": 230499, "epoch": 1904} {"train_loss": -41.17287063598633, "global_step": 230500, "epoch": 1904} {"train_loss": -42.16876983642578, "global_step": 230501, "epoch": 1904} {"train_loss": -41.71620559692383, "global_step": 230502, "epoch": 1904} {"train_loss": -41.33786392211914, "global_step": 230503, "epoch": 1904} {"train_loss": -40.724863572554156, "global_step": 230504, "epoch": 1904, "val_loss": 2694640.5} {"train_loss": -41.75194549560547, "global_step": 230505, "epoch": 1905} {"train_loss": -42.0414924621582, "global_step": 230506, "epoch": 1905} {"train_loss": -42.20088195800781, "global_step": 230507, "epoch": 1905} {"train_loss": -42.14484405517578, "global_step": 230508, "epoch": 1905} {"train_loss": -41.68782424926758, "global_step": 230509, "epoch": 1905} {"train_loss": -41.73743438720703, "global_step": 230510, "epoch": 1905} {"train_loss": -42.22200012207031, "global_step": 230511, "epoch": 1905} {"train_loss": -42.19358444213867, "global_step": 230512, "epoch": 1905} {"train_loss": -42.60797119140625, "global_step": 230513, "epoch": 1905} {"train_loss": -42.69265365600586, "global_step": 230514, "epoch": 1905} {"train_loss": -41.85628128051758, "global_step": 230515, "epoch": 1905} {"train_loss": -40.93825912475586, "global_step": 230516, "epoch": 1905} {"train_loss": -42.463253021240234, "global_step": 230517, "epoch": 1905} {"train_loss": -42.28493881225586, "global_step": 230518, "epoch": 1905} {"train_loss": -42.4663200378418, "global_step": 230519, "epoch": 1905} {"train_loss": -42.09064865112305, "global_step": 230520, "epoch": 1905} {"train_loss": -42.411285400390625, "global_step": 230521, "epoch": 1905} {"train_loss": -42.19722366333008, "global_step": 230522, "epoch": 1905} {"train_loss": -41.73163986206055, "global_step": 230523, "epoch": 1905} {"train_loss": -42.141380310058594, "global_step": 230524, "epoch": 1905} {"train_loss": -42.26168441772461, "global_step": 230525, "epoch": 1905} {"train_loss": -42.20501708984375, "global_step": 230526, "epoch": 1905} {"train_loss": -42.64332962036133, "global_step": 230527, "epoch": 1905} {"train_loss": -41.85268783569336, "global_step": 230528, "epoch": 1905} {"train_loss": -40.9987678527832, "global_step": 230529, "epoch": 1905} {"train_loss": -42.5394401550293, "global_step": 230530, "epoch": 1905} {"train_loss": -42.54561233520508, "global_step": 230531, "epoch": 1905} {"train_loss": -41.80995559692383, "global_step": 230532, "epoch": 1905} {"train_loss": -42.60341262817383, "global_step": 230533, "epoch": 1905} {"train_loss": -41.1967658996582, "global_step": 230534, "epoch": 1905} {"train_loss": -41.29001998901367, "global_step": 230535, "epoch": 1905} {"train_loss": -41.192623138427734, "global_step": 230536, "epoch": 1905} {"train_loss": -42.24628448486328, "global_step": 230537, "epoch": 1905} {"train_loss": -41.34846115112305, "global_step": 230538, "epoch": 1905} {"train_loss": -41.2153434753418, "global_step": 230539, "epoch": 1905} {"train_loss": -38.124244689941406, "global_step": 230540, "epoch": 1905} {"train_loss": -41.33222198486328, "global_step": 230541, "epoch": 1905} {"train_loss": -41.25593948364258, "global_step": 230542, "epoch": 1905} {"train_loss": -40.78779220581055, "global_step": 230543, "epoch": 1905} {"train_loss": -38.67287826538086, "global_step": 230544, "epoch": 1905} {"train_loss": -40.79377365112305, "global_step": 230545, "epoch": 1905} {"train_loss": -41.403564453125, "global_step": 230546, "epoch": 1905} {"train_loss": -39.700862884521484, "global_step": 230547, "epoch": 1905} {"train_loss": -41.147369384765625, "global_step": 230548, "epoch": 1905} {"train_loss": -40.532936096191406, "global_step": 230549, "epoch": 1905} {"train_loss": -41.467994689941406, "global_step": 230550, "epoch": 1905} {"train_loss": -40.516414642333984, "global_step": 230551, "epoch": 1905} {"train_loss": -40.91276550292969, "global_step": 230552, "epoch": 1905} {"train_loss": -41.740882873535156, "global_step": 230553, "epoch": 1905} {"train_loss": -41.16856002807617, "global_step": 230554, "epoch": 1905} {"train_loss": -41.07444763183594, "global_step": 230555, "epoch": 1905} {"train_loss": -40.06460189819336, "global_step": 230556, "epoch": 1905} {"train_loss": -42.205047607421875, "global_step": 230557, "epoch": 1905} {"train_loss": -41.04364776611328, "global_step": 230558, "epoch": 1905} {"train_loss": -41.609222412109375, "global_step": 230559, "epoch": 1905} {"train_loss": -41.062408447265625, "global_step": 230560, "epoch": 1905} {"train_loss": -41.613155364990234, "global_step": 230561, "epoch": 1905} {"train_loss": -41.78788375854492, "global_step": 230562, "epoch": 1905} {"train_loss": -41.00119400024414, "global_step": 230563, "epoch": 1905} {"train_loss": -41.6254997253418, "global_step": 230564, "epoch": 1905} {"train_loss": -42.2474250793457, "global_step": 230565, "epoch": 1905} {"train_loss": -41.990413665771484, "global_step": 230566, "epoch": 1905} {"train_loss": -41.063026428222656, "global_step": 230567, "epoch": 1905} {"train_loss": -42.018924713134766, "global_step": 230568, "epoch": 1905} {"train_loss": -41.66584396362305, "global_step": 230569, "epoch": 1905} {"train_loss": -41.50640869140625, "global_step": 230570, "epoch": 1905} {"train_loss": -41.350746154785156, "global_step": 230571, "epoch": 1905} {"train_loss": -41.059513092041016, "global_step": 230572, "epoch": 1905} {"train_loss": -41.218780517578125, "global_step": 230573, "epoch": 1905} {"train_loss": -42.18603515625, "global_step": 230574, "epoch": 1905} {"train_loss": -42.86360549926758, "global_step": 230575, "epoch": 1905} {"train_loss": -41.635982513427734, "global_step": 230576, "epoch": 1905} {"train_loss": -42.1684455871582, "global_step": 230577, "epoch": 1905} {"train_loss": -42.03361129760742, "global_step": 230578, "epoch": 1905} {"train_loss": -41.64414596557617, "global_step": 230579, "epoch": 1905} {"train_loss": -42.41266632080078, "global_step": 230580, "epoch": 1905} {"train_loss": -42.81726837158203, "global_step": 230581, "epoch": 1905} {"train_loss": -41.43132019042969, "global_step": 230582, "epoch": 1905} {"train_loss": -41.43185043334961, "global_step": 230583, "epoch": 1905} {"train_loss": -42.77356719970703, "global_step": 230584, "epoch": 1905} {"train_loss": -41.32143783569336, "global_step": 230585, "epoch": 1905} {"train_loss": -42.10499954223633, "global_step": 230586, "epoch": 1905} {"train_loss": -42.13478469848633, "global_step": 230587, "epoch": 1905} {"train_loss": -42.42109298706055, "global_step": 230588, "epoch": 1905} {"train_loss": -42.58893966674805, "global_step": 230589, "epoch": 1905} {"train_loss": -42.768165588378906, "global_step": 230590, "epoch": 1905} {"train_loss": -43.121070861816406, "global_step": 230591, "epoch": 1905} {"train_loss": -42.78031539916992, "global_step": 230592, "epoch": 1905} {"train_loss": -42.363075256347656, "global_step": 230593, "epoch": 1905} {"train_loss": -42.472633361816406, "global_step": 230594, "epoch": 1905} {"train_loss": -42.310604095458984, "global_step": 230595, "epoch": 1905} {"train_loss": -41.81230926513672, "global_step": 230596, "epoch": 1905} {"train_loss": -41.70874786376953, "global_step": 230597, "epoch": 1905} {"train_loss": -41.88175582885742, "global_step": 230598, "epoch": 1905} {"train_loss": -41.2889289855957, "global_step": 230599, "epoch": 1905} {"train_loss": -42.0341796875, "global_step": 230600, "epoch": 1905} {"train_loss": -42.771854400634766, "global_step": 230601, "epoch": 1905} {"train_loss": -41.219390869140625, "global_step": 230602, "epoch": 1905} {"train_loss": -42.58809280395508, "global_step": 230603, "epoch": 1905} {"train_loss": -41.03388595581055, "global_step": 230604, "epoch": 1905} {"train_loss": -42.38578796386719, "global_step": 230605, "epoch": 1905} {"train_loss": -42.716915130615234, "global_step": 230606, "epoch": 1905} {"train_loss": -41.00260543823242, "global_step": 230607, "epoch": 1905} {"train_loss": -41.201839447021484, "global_step": 230608, "epoch": 1905} {"train_loss": -42.68711853027344, "global_step": 230609, "epoch": 1905} {"train_loss": -39.9426155090332, "global_step": 230610, "epoch": 1905} {"train_loss": -41.288997650146484, "global_step": 230611, "epoch": 1905} {"train_loss": -41.51124572753906, "global_step": 230612, "epoch": 1905} {"train_loss": -42.0030403137207, "global_step": 230613, "epoch": 1905} {"train_loss": -41.1717414855957, "global_step": 230614, "epoch": 1905} {"train_loss": -39.01243209838867, "global_step": 230615, "epoch": 1905} {"train_loss": -39.4748649597168, "global_step": 230616, "epoch": 1905} {"train_loss": -41.56373977661133, "global_step": 230617, "epoch": 1905} {"train_loss": -41.86960983276367, "global_step": 230618, "epoch": 1905} {"train_loss": -41.61297607421875, "global_step": 230619, "epoch": 1905} {"train_loss": -39.47541046142578, "global_step": 230620, "epoch": 1905} {"train_loss": -38.31196212768555, "global_step": 230621, "epoch": 1905} {"train_loss": -41.609596252441406, "global_step": 230622, "epoch": 1905} {"train_loss": -42.32884979248047, "global_step": 230623, "epoch": 1905} {"train_loss": -41.67544174194336, "global_step": 230624, "epoch": 1905} {"train_loss": -41.618656063867995, "global_step": 230625, "epoch": 1905, "val_loss": 2611159.25} {"train_loss": -42.2012939453125, "global_step": 230626, "epoch": 1906} {"train_loss": -42.04045486450195, "global_step": 230627, "epoch": 1906} {"train_loss": -41.8671760559082, "global_step": 230628, "epoch": 1906} {"train_loss": -41.60915756225586, "global_step": 230629, "epoch": 1906} {"train_loss": -38.90053176879883, "global_step": 230630, "epoch": 1906} {"train_loss": -41.52680206298828, "global_step": 230631, "epoch": 1906} {"train_loss": -40.39638900756836, "global_step": 230632, "epoch": 1906} {"train_loss": -41.091243743896484, "global_step": 230633, "epoch": 1906} {"train_loss": -42.12791061401367, "global_step": 230634, "epoch": 1906} {"train_loss": -39.77642822265625, "global_step": 230635, "epoch": 1906} {"train_loss": -40.74300765991211, "global_step": 230636, "epoch": 1906} {"train_loss": -41.17326736450195, "global_step": 230637, "epoch": 1906} {"train_loss": -39.74879837036133, "global_step": 230638, "epoch": 1906} {"train_loss": -41.543701171875, "global_step": 230639, "epoch": 1906} {"train_loss": -40.520652770996094, "global_step": 230640, "epoch": 1906} {"train_loss": -41.042572021484375, "global_step": 230641, "epoch": 1906} {"train_loss": -41.7287483215332, "global_step": 230642, "epoch": 1906} {"train_loss": -40.92792510986328, "global_step": 230643, "epoch": 1906} {"train_loss": -39.967506408691406, "global_step": 230644, "epoch": 1906} {"train_loss": -41.1389274597168, "global_step": 230645, "epoch": 1906} {"train_loss": -40.45413589477539, "global_step": 230646, "epoch": 1906} {"train_loss": -41.089149475097656, "global_step": 230647, "epoch": 1906} {"train_loss": -41.2923583984375, "global_step": 230648, "epoch": 1906} {"train_loss": -41.03107833862305, "global_step": 230649, "epoch": 1906} {"train_loss": -41.446285247802734, "global_step": 230650, "epoch": 1906} {"train_loss": -42.1392936706543, "global_step": 230651, "epoch": 1906} {"train_loss": -41.43513107299805, "global_step": 230652, "epoch": 1906} {"train_loss": -42.11301803588867, "global_step": 230653, "epoch": 1906} {"train_loss": -42.052032470703125, "global_step": 230654, "epoch": 1906} {"train_loss": -42.17063903808594, "global_step": 230655, "epoch": 1906} {"train_loss": -42.41754150390625, "global_step": 230656, "epoch": 1906} {"train_loss": -41.752906799316406, "global_step": 230657, "epoch": 1906} {"train_loss": -42.18612289428711, "global_step": 230658, "epoch": 1906} {"train_loss": -42.50257110595703, "global_step": 230659, "epoch": 1906} {"train_loss": -41.52745819091797, "global_step": 230660, "epoch": 1906} {"train_loss": -41.62897491455078, "global_step": 230661, "epoch": 1906} {"train_loss": -42.0944938659668, "global_step": 230662, "epoch": 1906} {"train_loss": -41.256309509277344, "global_step": 230663, "epoch": 1906} {"train_loss": -42.0103759765625, "global_step": 230664, "epoch": 1906} {"train_loss": -41.96281814575195, "global_step": 230665, "epoch": 1906} {"train_loss": -42.4107780456543, "global_step": 230666, "epoch": 1906} {"train_loss": -41.34091567993164, "global_step": 230667, "epoch": 1906} {"train_loss": -42.63736343383789, "global_step": 230668, "epoch": 1906} {"train_loss": -42.68042755126953, "global_step": 230669, "epoch": 1906} {"train_loss": -41.84914779663086, "global_step": 230670, "epoch": 1906} {"train_loss": -41.06404113769531, "global_step": 230671, "epoch": 1906} {"train_loss": -42.41132736206055, "global_step": 230672, "epoch": 1906} {"train_loss": -42.8543815612793, "global_step": 230673, "epoch": 1906} {"train_loss": -41.968135833740234, "global_step": 230674, "epoch": 1906} {"train_loss": -42.35647201538086, "global_step": 230675, "epoch": 1906} {"train_loss": -42.68059539794922, "global_step": 230676, "epoch": 1906} {"train_loss": -42.405242919921875, "global_step": 230677, "epoch": 1906} {"train_loss": -42.853633880615234, "global_step": 230678, "epoch": 1906} {"train_loss": -41.79119873046875, "global_step": 230679, "epoch": 1906} {"train_loss": -42.03147506713867, "global_step": 230680, "epoch": 1906} {"train_loss": -41.377079010009766, "global_step": 230681, "epoch": 1906} {"train_loss": -42.06520462036133, "global_step": 230682, "epoch": 1906} {"train_loss": -42.02090072631836, "global_step": 230683, "epoch": 1906} {"train_loss": -42.283782958984375, "global_step": 230684, "epoch": 1906} {"train_loss": -42.26433181762695, "global_step": 230685, "epoch": 1906} {"train_loss": -42.661128997802734, "global_step": 230686, "epoch": 1906} {"train_loss": -41.972145080566406, "global_step": 230687, "epoch": 1906} {"train_loss": -41.744266510009766, "global_step": 230688, "epoch": 1906} {"train_loss": -42.42431640625, "global_step": 230689, "epoch": 1906} {"train_loss": -41.80963897705078, "global_step": 230690, "epoch": 1906} {"train_loss": -42.36430358886719, "global_step": 230691, "epoch": 1906} {"train_loss": -42.67952346801758, "global_step": 230692, "epoch": 1906} {"train_loss": -42.33651351928711, "global_step": 230693, "epoch": 1906} {"train_loss": -42.23011016845703, "global_step": 230694, "epoch": 1906} {"train_loss": -42.118621826171875, "global_step": 230695, "epoch": 1906} {"train_loss": -41.965572357177734, "global_step": 230696, "epoch": 1906} {"train_loss": -42.27006149291992, "global_step": 230697, "epoch": 1906} {"train_loss": -40.59756088256836, "global_step": 230698, "epoch": 1906} {"train_loss": -38.96076583862305, "global_step": 230699, "epoch": 1906} {"train_loss": -41.45563888549805, "global_step": 230700, "epoch": 1906} {"train_loss": -42.19329071044922, "global_step": 230701, "epoch": 1906} {"train_loss": -41.41012954711914, "global_step": 230702, "epoch": 1906} {"train_loss": -40.643531799316406, "global_step": 230703, "epoch": 1906} {"train_loss": -39.90403366088867, "global_step": 230704, "epoch": 1906} {"train_loss": -41.76493453979492, "global_step": 230705, "epoch": 1906} {"train_loss": -41.07229232788086, "global_step": 230706, "epoch": 1906} {"train_loss": -38.72022247314453, "global_step": 230707, "epoch": 1906} {"train_loss": -41.32661437988281, "global_step": 230708, "epoch": 1906} {"train_loss": -41.06417465209961, "global_step": 230709, "epoch": 1906} {"train_loss": -37.9350471496582, "global_step": 230710, "epoch": 1906} {"train_loss": -41.491390228271484, "global_step": 230711, "epoch": 1906} {"train_loss": -41.055789947509766, "global_step": 230712, "epoch": 1906} {"train_loss": -40.88616180419922, "global_step": 230713, "epoch": 1906} {"train_loss": -38.510528564453125, "global_step": 230714, "epoch": 1906} {"train_loss": -41.59108352661133, "global_step": 230715, "epoch": 1906} {"train_loss": -41.267982482910156, "global_step": 230716, "epoch": 1906} {"train_loss": -40.37089157104492, "global_step": 230717, "epoch": 1906} {"train_loss": -41.60108184814453, "global_step": 230718, "epoch": 1906} {"train_loss": -39.47854232788086, "global_step": 230719, "epoch": 1906} {"train_loss": -41.88231658935547, "global_step": 230720, "epoch": 1906} {"train_loss": -40.49348831176758, "global_step": 230721, "epoch": 1906} {"train_loss": -40.65092086791992, "global_step": 230722, "epoch": 1906} {"train_loss": -40.148780822753906, "global_step": 230723, "epoch": 1906} {"train_loss": -39.05353927612305, "global_step": 230724, "epoch": 1906} {"train_loss": -40.51198196411133, "global_step": 230725, "epoch": 1906} {"train_loss": -40.799041748046875, "global_step": 230726, "epoch": 1906} {"train_loss": -41.40599822998047, "global_step": 230727, "epoch": 1906} {"train_loss": -41.7791748046875, "global_step": 230728, "epoch": 1906} {"train_loss": -37.530860900878906, "global_step": 230729, "epoch": 1906} {"train_loss": -39.44448471069336, "global_step": 230730, "epoch": 1906} {"train_loss": -42.17333984375, "global_step": 230731, "epoch": 1906} {"train_loss": -41.7325553894043, "global_step": 230732, "epoch": 1906} {"train_loss": -40.6771354675293, "global_step": 230733, "epoch": 1906} {"train_loss": -41.025028228759766, "global_step": 230734, "epoch": 1906} {"train_loss": -40.125484466552734, "global_step": 230735, "epoch": 1906} {"train_loss": -40.72175216674805, "global_step": 230736, "epoch": 1906} {"train_loss": -38.40834045410156, "global_step": 230737, "epoch": 1906} {"train_loss": -39.90550994873047, "global_step": 230738, "epoch": 1906} {"train_loss": -41.22869110107422, "global_step": 230739, "epoch": 1906} {"train_loss": -41.20753479003906, "global_step": 230740, "epoch": 1906} {"train_loss": -41.62800979614258, "global_step": 230741, "epoch": 1906} {"train_loss": -40.78337860107422, "global_step": 230742, "epoch": 1906} {"train_loss": -41.8830451965332, "global_step": 230743, "epoch": 1906} {"train_loss": -41.9196891784668, "global_step": 230744, "epoch": 1906} {"train_loss": -41.332122802734375, "global_step": 230745, "epoch": 1906} {"train_loss": -41.30599723374548, "global_step": 230746, "epoch": 1906, "val_loss": 2648730.5} {"train_loss": -40.768524169921875, "global_step": 230747, "epoch": 1907} {"train_loss": -38.52614212036133, "global_step": 230748, "epoch": 1907} {"train_loss": -41.17915725708008, "global_step": 230749, "epoch": 1907} {"train_loss": -41.77293014526367, "global_step": 230750, "epoch": 1907} {"train_loss": -33.51690673828125, "global_step": 230751, "epoch": 1907} {"train_loss": -38.056209564208984, "global_step": 230752, "epoch": 1907} {"train_loss": -39.24538040161133, "global_step": 230753, "epoch": 1907} {"train_loss": -39.01285934448242, "global_step": 230754, "epoch": 1907} {"train_loss": -38.628177642822266, "global_step": 230755, "epoch": 1907} {"train_loss": -39.57709884643555, "global_step": 230756, "epoch": 1907} {"train_loss": -38.735511779785156, "global_step": 230757, "epoch": 1907} {"train_loss": -37.74016189575195, "global_step": 230758, "epoch": 1907} {"train_loss": -38.83675003051758, "global_step": 230759, "epoch": 1907} {"train_loss": -37.48407745361328, "global_step": 230760, "epoch": 1907} {"train_loss": -37.91887283325195, "global_step": 230761, "epoch": 1907} {"train_loss": -40.03347396850586, "global_step": 230762, "epoch": 1907} {"train_loss": -19.922042846679688, "global_step": 230763, "epoch": 1907} {"train_loss": -38.93235397338867, "global_step": 230764, "epoch": 1907} {"train_loss": -39.591583251953125, "global_step": 230765, "epoch": 1907} {"train_loss": -38.620086669921875, "global_step": 230766, "epoch": 1907} {"train_loss": -39.63460159301758, "global_step": 230767, "epoch": 1907} {"train_loss": -39.553871154785156, "global_step": 230768, "epoch": 1907} {"train_loss": -37.69033432006836, "global_step": 230769, "epoch": 1907} {"train_loss": -39.20073318481445, "global_step": 230770, "epoch": 1907} {"train_loss": -39.13302230834961, "global_step": 230771, "epoch": 1907} {"train_loss": -39.08488845825195, "global_step": 230772, "epoch": 1907} {"train_loss": -39.438480377197266, "global_step": 230773, "epoch": 1907} {"train_loss": -39.699398040771484, "global_step": 230774, "epoch": 1907} {"train_loss": -35.954647064208984, "global_step": 230775, "epoch": 1907} {"train_loss": -39.9830436706543, "global_step": 230776, "epoch": 1907} {"train_loss": -37.10879135131836, "global_step": 230777, "epoch": 1907} {"train_loss": -39.548675537109375, "global_step": 230778, "epoch": 1907} {"train_loss": -39.35414123535156, "global_step": 230779, "epoch": 1907} {"train_loss": -40.43564987182617, "global_step": 230780, "epoch": 1907} {"train_loss": -39.32135009765625, "global_step": 230781, "epoch": 1907} {"train_loss": -40.43589401245117, "global_step": 230782, "epoch": 1907} {"train_loss": -39.377716064453125, "global_step": 230783, "epoch": 1907} {"train_loss": -40.58713912963867, "global_step": 230784, "epoch": 1907} {"train_loss": -40.43191146850586, "global_step": 230785, "epoch": 1907} {"train_loss": -40.92462158203125, "global_step": 230786, "epoch": 1907} {"train_loss": -39.90815353393555, "global_step": 230787, "epoch": 1907} {"train_loss": -41.30408477783203, "global_step": 230788, "epoch": 1907} {"train_loss": -41.47005844116211, "global_step": 230789, "epoch": 1907} {"train_loss": -40.9060173034668, "global_step": 230790, "epoch": 1907} {"train_loss": -39.898250579833984, "global_step": 230791, "epoch": 1907} {"train_loss": -39.621150970458984, "global_step": 230792, "epoch": 1907} {"train_loss": -41.32627487182617, "global_step": 230793, "epoch": 1907} {"train_loss": -40.03779983520508, "global_step": 230794, "epoch": 1907} {"train_loss": -41.56033706665039, "global_step": 230795, "epoch": 1907} {"train_loss": -41.16585922241211, "global_step": 230796, "epoch": 1907} {"train_loss": -41.81523513793945, "global_step": 230797, "epoch": 1907} {"train_loss": -40.902950286865234, "global_step": 230798, "epoch": 1907} {"train_loss": -40.8757209777832, "global_step": 230799, "epoch": 1907} {"train_loss": -41.444435119628906, "global_step": 230800, "epoch": 1907} {"train_loss": -40.36637878417969, "global_step": 230801, "epoch": 1907} {"train_loss": -41.30725860595703, "global_step": 230802, "epoch": 1907} {"train_loss": -41.54603576660156, "global_step": 230803, "epoch": 1907} {"train_loss": -40.42162322998047, "global_step": 230804, "epoch": 1907} {"train_loss": -41.153377532958984, "global_step": 230805, "epoch": 1907} {"train_loss": -40.66211700439453, "global_step": 230806, "epoch": 1907} {"train_loss": -41.1555061340332, "global_step": 230807, "epoch": 1907} {"train_loss": -41.28904724121094, "global_step": 230808, "epoch": 1907} {"train_loss": -42.29497146606445, "global_step": 230809, "epoch": 1907} {"train_loss": -41.269100189208984, "global_step": 230810, "epoch": 1907} {"train_loss": -41.509063720703125, "global_step": 230811, "epoch": 1907} {"train_loss": -41.9588623046875, "global_step": 230812, "epoch": 1907} {"train_loss": -41.1926155090332, "global_step": 230813, "epoch": 1907} {"train_loss": -41.942169189453125, "global_step": 230814, "epoch": 1907} {"train_loss": -42.02531051635742, "global_step": 230815, "epoch": 1907} {"train_loss": -41.28847122192383, "global_step": 230816, "epoch": 1907} {"train_loss": -41.85279083251953, "global_step": 230817, "epoch": 1907} {"train_loss": -42.48643112182617, "global_step": 230818, "epoch": 1907} {"train_loss": -41.7017936706543, "global_step": 230819, "epoch": 1907} {"train_loss": -41.71476745605469, "global_step": 230820, "epoch": 1907} {"train_loss": -41.929683685302734, "global_step": 230821, "epoch": 1907} {"train_loss": -42.322052001953125, "global_step": 230822, "epoch": 1907} {"train_loss": -41.9482421875, "global_step": 230823, "epoch": 1907} {"train_loss": -41.91770553588867, "global_step": 230824, "epoch": 1907} {"train_loss": -42.16051483154297, "global_step": 230825, "epoch": 1907} {"train_loss": -42.34774398803711, "global_step": 230826, "epoch": 1907} {"train_loss": -40.830169677734375, "global_step": 230827, "epoch": 1907} {"train_loss": -42.550960540771484, "global_step": 230828, "epoch": 1907} {"train_loss": -42.181819915771484, "global_step": 230829, "epoch": 1907} {"train_loss": -41.6248893737793, "global_step": 230830, "epoch": 1907} {"train_loss": -42.392940521240234, "global_step": 230831, "epoch": 1907} {"train_loss": -40.54987335205078, "global_step": 230832, "epoch": 1907} {"train_loss": -42.54506301879883, "global_step": 230833, "epoch": 1907} {"train_loss": -42.29404067993164, "global_step": 230834, "epoch": 1907} {"train_loss": -41.77253723144531, "global_step": 230835, "epoch": 1907} {"train_loss": -42.62089157104492, "global_step": 230836, "epoch": 1907} {"train_loss": -41.790096282958984, "global_step": 230837, "epoch": 1907} {"train_loss": -42.68427276611328, "global_step": 230838, "epoch": 1907} {"train_loss": -42.3173828125, "global_step": 230839, "epoch": 1907} {"train_loss": -42.19607162475586, "global_step": 230840, "epoch": 1907} {"train_loss": -41.557960510253906, "global_step": 230841, "epoch": 1907} {"train_loss": -41.699066162109375, "global_step": 230842, "epoch": 1907} {"train_loss": -42.29266357421875, "global_step": 230843, "epoch": 1907} {"train_loss": -42.03696823120117, "global_step": 230844, "epoch": 1907} {"train_loss": -41.99941635131836, "global_step": 230845, "epoch": 1907} {"train_loss": -41.86711502075195, "global_step": 230846, "epoch": 1907} {"train_loss": -41.82905197143555, "global_step": 230847, "epoch": 1907} {"train_loss": -42.15717315673828, "global_step": 230848, "epoch": 1907} {"train_loss": -42.067604064941406, "global_step": 230849, "epoch": 1907} {"train_loss": -41.909366607666016, "global_step": 230850, "epoch": 1907} {"train_loss": -42.32052230834961, "global_step": 230851, "epoch": 1907} {"train_loss": -42.89017105102539, "global_step": 230852, "epoch": 1907} {"train_loss": -42.671485900878906, "global_step": 230853, "epoch": 1907} {"train_loss": -42.387550354003906, "global_step": 230854, "epoch": 1907} {"train_loss": -42.6813850402832, "global_step": 230855, "epoch": 1907} {"train_loss": -42.4973030090332, "global_step": 230856, "epoch": 1907} {"train_loss": -41.75798416137695, "global_step": 230857, "epoch": 1907} {"train_loss": -38.055816650390625, "global_step": 230858, "epoch": 1907} {"train_loss": -31.2352294921875, "global_step": 230859, "epoch": 1907} {"train_loss": -31.498905181884766, "global_step": 230860, "epoch": 1907} {"train_loss": -38.381160736083984, "global_step": 230861, "epoch": 1907} {"train_loss": -40.839271545410156, "global_step": 230862, "epoch": 1907} {"train_loss": -41.64211654663086, "global_step": 230863, "epoch": 1907} {"train_loss": -39.83966064453125, "global_step": 230864, "epoch": 1907} {"train_loss": -40.04570388793945, "global_step": 230865, "epoch": 1907} {"train_loss": -42.10423278808594, "global_step": 230866, "epoch": 1907} {"train_loss": -40.40227940456926, "global_step": 230867, "epoch": 1907, "val_loss": 2594086.75} {"train_loss": -40.53461456298828, "global_step": 230868, "epoch": 1908} {"train_loss": -42.5999755859375, "global_step": 230869, "epoch": 1908} {"train_loss": -41.03725051879883, "global_step": 230870, "epoch": 1908} {"train_loss": -41.22945785522461, "global_step": 230871, "epoch": 1908} {"train_loss": -41.8171272277832, "global_step": 230872, "epoch": 1908} {"train_loss": -40.5269889831543, "global_step": 230873, "epoch": 1908} {"train_loss": -42.11227035522461, "global_step": 230874, "epoch": 1908} {"train_loss": -41.23843002319336, "global_step": 230875, "epoch": 1908} {"train_loss": -42.21476364135742, "global_step": 230876, "epoch": 1908} {"train_loss": -40.94275665283203, "global_step": 230877, "epoch": 1908} {"train_loss": -40.64754867553711, "global_step": 230878, "epoch": 1908} {"train_loss": -41.699806213378906, "global_step": 230879, "epoch": 1908} {"train_loss": -40.4156608581543, "global_step": 230880, "epoch": 1908} {"train_loss": -40.866729736328125, "global_step": 230881, "epoch": 1908} {"train_loss": -40.455806732177734, "global_step": 230882, "epoch": 1908} {"train_loss": -42.232460021972656, "global_step": 230883, "epoch": 1908} {"train_loss": -40.555564880371094, "global_step": 230884, "epoch": 1908} {"train_loss": -41.91231918334961, "global_step": 230885, "epoch": 1908} {"train_loss": -40.645721435546875, "global_step": 230886, "epoch": 1908} {"train_loss": -41.743919372558594, "global_step": 230887, "epoch": 1908} {"train_loss": -41.20436477661133, "global_step": 230888, "epoch": 1908} {"train_loss": -40.78506088256836, "global_step": 230889, "epoch": 1908} {"train_loss": -40.49442672729492, "global_step": 230890, "epoch": 1908} {"train_loss": -41.62375259399414, "global_step": 230891, "epoch": 1908} {"train_loss": -41.1777229309082, "global_step": 230892, "epoch": 1908} {"train_loss": -42.4882926940918, "global_step": 230893, "epoch": 1908} {"train_loss": -41.2691535949707, "global_step": 230894, "epoch": 1908} {"train_loss": -42.19049835205078, "global_step": 230895, "epoch": 1908} {"train_loss": -40.903541564941406, "global_step": 230896, "epoch": 1908} {"train_loss": -42.23311233520508, "global_step": 230897, "epoch": 1908} {"train_loss": -42.36463165283203, "global_step": 230898, "epoch": 1908} {"train_loss": -42.48286819458008, "global_step": 230899, "epoch": 1908} {"train_loss": -42.66885757446289, "global_step": 230900, "epoch": 1908} {"train_loss": -42.34373092651367, "global_step": 230901, "epoch": 1908} {"train_loss": -42.10177230834961, "global_step": 230902, "epoch": 1908} {"train_loss": -42.052459716796875, "global_step": 230903, "epoch": 1908} {"train_loss": -42.35617446899414, "global_step": 230904, "epoch": 1908} {"train_loss": -42.395572662353516, "global_step": 230905, "epoch": 1908} {"train_loss": -40.85984420776367, "global_step": 230906, "epoch": 1908} {"train_loss": -41.75881576538086, "global_step": 230907, "epoch": 1908} {"train_loss": -41.541954040527344, "global_step": 230908, "epoch": 1908} {"train_loss": -41.61652755737305, "global_step": 230909, "epoch": 1908} {"train_loss": -42.6851806640625, "global_step": 230910, "epoch": 1908} {"train_loss": -41.65627670288086, "global_step": 230911, "epoch": 1908} {"train_loss": -36.54194259643555, "global_step": 230912, "epoch": 1908} {"train_loss": -40.16297149658203, "global_step": 230913, "epoch": 1908} {"train_loss": -41.576148986816406, "global_step": 230914, "epoch": 1908} {"train_loss": -41.79740524291992, "global_step": 230915, "epoch": 1908} {"train_loss": -41.8160285949707, "global_step": 230916, "epoch": 1908} {"train_loss": -41.659366607666016, "global_step": 230917, "epoch": 1908} {"train_loss": -42.033363342285156, "global_step": 230918, "epoch": 1908} {"train_loss": -42.055233001708984, "global_step": 230919, "epoch": 1908} {"train_loss": -38.816890716552734, "global_step": 230920, "epoch": 1908} {"train_loss": -40.728851318359375, "global_step": 230921, "epoch": 1908} {"train_loss": -41.425811767578125, "global_step": 230922, "epoch": 1908} {"train_loss": -42.52392578125, "global_step": 230923, "epoch": 1908} {"train_loss": -41.01581573486328, "global_step": 230924, "epoch": 1908} {"train_loss": -41.145931243896484, "global_step": 230925, "epoch": 1908} {"train_loss": -40.92481231689453, "global_step": 230926, "epoch": 1908} {"train_loss": -41.50865936279297, "global_step": 230927, "epoch": 1908} {"train_loss": -41.35467529296875, "global_step": 230928, "epoch": 1908} {"train_loss": -41.14495849609375, "global_step": 230929, "epoch": 1908} {"train_loss": -37.4092903137207, "global_step": 230930, "epoch": 1908} {"train_loss": -39.62586212158203, "global_step": 230931, "epoch": 1908} {"train_loss": -39.83767318725586, "global_step": 230932, "epoch": 1908} {"train_loss": -37.17555618286133, "global_step": 230933, "epoch": 1908} {"train_loss": -33.648582458496094, "global_step": 230934, "epoch": 1908} {"train_loss": -19.43375587463379, "global_step": 230935, "epoch": 1908} {"train_loss": -38.3739128112793, "global_step": 230936, "epoch": 1908} {"train_loss": -36.180171966552734, "global_step": 230937, "epoch": 1908} {"train_loss": -31.6685791015625, "global_step": 230938, "epoch": 1908} {"train_loss": -36.541961669921875, "global_step": 230939, "epoch": 1908} {"train_loss": -35.868873596191406, "global_step": 230940, "epoch": 1908} {"train_loss": -35.14735794067383, "global_step": 230941, "epoch": 1908} {"train_loss": -36.777992248535156, "global_step": 230942, "epoch": 1908} {"train_loss": -37.331050872802734, "global_step": 230943, "epoch": 1908} {"train_loss": -37.546630859375, "global_step": 230944, "epoch": 1908} {"train_loss": -37.25905227661133, "global_step": 230945, "epoch": 1908} {"train_loss": -39.57289505004883, "global_step": 230946, "epoch": 1908} {"train_loss": -35.31401443481445, "global_step": 230947, "epoch": 1908} {"train_loss": -34.165157318115234, "global_step": 230948, "epoch": 1908} {"train_loss": -37.26814270019531, "global_step": 230949, "epoch": 1908} {"train_loss": -37.20277786254883, "global_step": 230950, "epoch": 1908} {"train_loss": -34.60280227661133, "global_step": 230951, "epoch": 1908} {"train_loss": -21.782751083374023, "global_step": 230952, "epoch": 1908} {"train_loss": -30.732946395874023, "global_step": 230953, "epoch": 1908} {"train_loss": -37.7457160949707, "global_step": 230954, "epoch": 1908} {"train_loss": -39.47250747680664, "global_step": 230955, "epoch": 1908} {"train_loss": -37.874977111816406, "global_step": 230956, "epoch": 1908} {"train_loss": -36.79104232788086, "global_step": 230957, "epoch": 1908} {"train_loss": -35.98584747314453, "global_step": 230958, "epoch": 1908} {"train_loss": -36.94773483276367, "global_step": 230959, "epoch": 1908} {"train_loss": -35.52661895751953, "global_step": 230960, "epoch": 1908} {"train_loss": -36.80320358276367, "global_step": 230961, "epoch": 1908} {"train_loss": -32.507545471191406, "global_step": 230962, "epoch": 1908} {"train_loss": -37.117835998535156, "global_step": 230963, "epoch": 1908} {"train_loss": -37.27644729614258, "global_step": 230964, "epoch": 1908} {"train_loss": -36.614315032958984, "global_step": 230965, "epoch": 1908} {"train_loss": -34.70677947998047, "global_step": 230966, "epoch": 1908} {"train_loss": -37.955020904541016, "global_step": 230967, "epoch": 1908} {"train_loss": -37.14484405517578, "global_step": 230968, "epoch": 1908} {"train_loss": -34.195068359375, "global_step": 230969, "epoch": 1908} {"train_loss": -39.05414581298828, "global_step": 230970, "epoch": 1908} {"train_loss": -38.70417404174805, "global_step": 230971, "epoch": 1908} {"train_loss": -36.5439338684082, "global_step": 230972, "epoch": 1908} {"train_loss": -38.62372970581055, "global_step": 230973, "epoch": 1908} {"train_loss": -39.262718200683594, "global_step": 230974, "epoch": 1908} {"train_loss": -38.37691879272461, "global_step": 230975, "epoch": 1908} {"train_loss": -38.32842254638672, "global_step": 230976, "epoch": 1908} {"train_loss": -39.02128219604492, "global_step": 230977, "epoch": 1908} {"train_loss": -37.72124099731445, "global_step": 230978, "epoch": 1908} {"train_loss": -36.77431869506836, "global_step": 230979, "epoch": 1908} {"train_loss": -39.65627670288086, "global_step": 230980, "epoch": 1908} {"train_loss": -37.51898956298828, "global_step": 230981, "epoch": 1908} {"train_loss": -38.84416580200195, "global_step": 230982, "epoch": 1908} {"train_loss": -39.57973098754883, "global_step": 230983, "epoch": 1908} {"train_loss": -39.14666748046875, "global_step": 230984, "epoch": 1908} {"train_loss": -39.264957427978516, "global_step": 230985, "epoch": 1908} {"train_loss": -39.0968132019043, "global_step": 230986, "epoch": 1908} {"train_loss": -39.36944580078125, "global_step": 230987, "epoch": 1908} {"train_loss": -39.05899301639273, "global_step": 230988, "epoch": 1908, "val_loss": 2512943.75} {"train_loss": -39.52136993408203, "global_step": 230989, "epoch": 1909} {"train_loss": -39.143836975097656, "global_step": 230990, "epoch": 1909} {"train_loss": -39.71471405029297, "global_step": 230991, "epoch": 1909} {"train_loss": -40.5148811340332, "global_step": 230992, "epoch": 1909} {"train_loss": -39.50981903076172, "global_step": 230993, "epoch": 1909} {"train_loss": -40.036651611328125, "global_step": 230994, "epoch": 1909} {"train_loss": -39.393768310546875, "global_step": 230995, "epoch": 1909} {"train_loss": -39.42432403564453, "global_step": 230996, "epoch": 1909} {"train_loss": -40.79282760620117, "global_step": 230997, "epoch": 1909} {"train_loss": -40.30684280395508, "global_step": 230998, "epoch": 1909} {"train_loss": -40.151634216308594, "global_step": 230999, "epoch": 1909} {"train_loss": -39.9883918762207, "global_step": 231000, "epoch": 1909} {"train_loss": -40.287532806396484, "global_step": 231001, "epoch": 1909} {"train_loss": -40.595245361328125, "global_step": 231002, "epoch": 1909} {"train_loss": -39.91094970703125, "global_step": 231003, "epoch": 1909} {"train_loss": -40.20933151245117, "global_step": 231004, "epoch": 1909} {"train_loss": -40.557796478271484, "global_step": 231005, "epoch": 1909} {"train_loss": -40.368682861328125, "global_step": 231006, "epoch": 1909} {"train_loss": -40.30753707885742, "global_step": 231007, "epoch": 1909} {"train_loss": -41.0440559387207, "global_step": 231008, "epoch": 1909} {"train_loss": -40.10693359375, "global_step": 231009, "epoch": 1909} {"train_loss": -39.7463493347168, "global_step": 231010, "epoch": 1909} {"train_loss": -40.37032699584961, "global_step": 231011, "epoch": 1909} {"train_loss": -40.18855285644531, "global_step": 231012, "epoch": 1909} {"train_loss": -39.97875213623047, "global_step": 231013, "epoch": 1909} {"train_loss": -41.39729690551758, "global_step": 231014, "epoch": 1909} {"train_loss": -39.71375274658203, "global_step": 231015, "epoch": 1909} {"train_loss": -40.18836212158203, "global_step": 231016, "epoch": 1909} {"train_loss": -40.857215881347656, "global_step": 231017, "epoch": 1909} {"train_loss": -41.190147399902344, "global_step": 231018, "epoch": 1909} {"train_loss": -40.9190673828125, "global_step": 231019, "epoch": 1909} {"train_loss": -40.053035736083984, "global_step": 231020, "epoch": 1909} {"train_loss": -41.156978607177734, "global_step": 231021, "epoch": 1909} {"train_loss": -41.44404220581055, "global_step": 231022, "epoch": 1909} {"train_loss": -41.133663177490234, "global_step": 231023, "epoch": 1909} {"train_loss": -40.906532287597656, "global_step": 231024, "epoch": 1909} {"train_loss": -40.89838409423828, "global_step": 231025, "epoch": 1909} {"train_loss": -41.05344772338867, "global_step": 231026, "epoch": 1909} {"train_loss": -41.079769134521484, "global_step": 231027, "epoch": 1909} {"train_loss": -41.07236862182617, "global_step": 231028, "epoch": 1909} {"train_loss": -40.83600997924805, "global_step": 231029, "epoch": 1909} {"train_loss": -40.2464485168457, "global_step": 231030, "epoch": 1909} {"train_loss": -40.295745849609375, "global_step": 231031, "epoch": 1909} {"train_loss": -41.27045822143555, "global_step": 231032, "epoch": 1909} {"train_loss": -41.4967155456543, "global_step": 231033, "epoch": 1909} {"train_loss": -40.82950973510742, "global_step": 231034, "epoch": 1909} {"train_loss": -41.75071334838867, "global_step": 231035, "epoch": 1909} {"train_loss": -41.28395462036133, "global_step": 231036, "epoch": 1909} {"train_loss": -41.818416595458984, "global_step": 231037, "epoch": 1909} {"train_loss": -41.767818450927734, "global_step": 231038, "epoch": 1909} {"train_loss": -41.152320861816406, "global_step": 231039, "epoch": 1909} {"train_loss": -40.26081466674805, "global_step": 231040, "epoch": 1909} {"train_loss": -41.916133880615234, "global_step": 231041, "epoch": 1909} {"train_loss": -41.97028350830078, "global_step": 231042, "epoch": 1909} {"train_loss": -40.387428283691406, "global_step": 231043, "epoch": 1909} {"train_loss": -40.884883880615234, "global_step": 231044, "epoch": 1909} {"train_loss": -41.705406188964844, "global_step": 231045, "epoch": 1909} {"train_loss": -41.584068298339844, "global_step": 231046, "epoch": 1909} {"train_loss": -41.85038375854492, "global_step": 231047, "epoch": 1909} {"train_loss": -41.90153884887695, "global_step": 231048, "epoch": 1909} {"train_loss": -41.26255416870117, "global_step": 231049, "epoch": 1909} {"train_loss": -41.406063079833984, "global_step": 231050, "epoch": 1909} {"train_loss": -41.885223388671875, "global_step": 231051, "epoch": 1909} {"train_loss": -41.496498107910156, "global_step": 231052, "epoch": 1909} {"train_loss": -42.24072265625, "global_step": 231053, "epoch": 1909} {"train_loss": -41.96194076538086, "global_step": 231054, "epoch": 1909} {"train_loss": -41.9397087097168, "global_step": 231055, "epoch": 1909} {"train_loss": -41.81568145751953, "global_step": 231056, "epoch": 1909} {"train_loss": -41.58837127685547, "global_step": 231057, "epoch": 1909} {"train_loss": -41.8248405456543, "global_step": 231058, "epoch": 1909} {"train_loss": -42.03355026245117, "global_step": 231059, "epoch": 1909} {"train_loss": -42.13235855102539, "global_step": 231060, "epoch": 1909} {"train_loss": -40.6259880065918, "global_step": 231061, "epoch": 1909} {"train_loss": -42.02912139892578, "global_step": 231062, "epoch": 1909} {"train_loss": -41.93233871459961, "global_step": 231063, "epoch": 1909} {"train_loss": -41.51715850830078, "global_step": 231064, "epoch": 1909} {"train_loss": -42.31355667114258, "global_step": 231065, "epoch": 1909} {"train_loss": -40.17367172241211, "global_step": 231066, "epoch": 1909} {"train_loss": -38.50251388549805, "global_step": 231067, "epoch": 1909} {"train_loss": -41.11685562133789, "global_step": 231068, "epoch": 1909} {"train_loss": -37.840389251708984, "global_step": 231069, "epoch": 1909} {"train_loss": -41.394248962402344, "global_step": 231070, "epoch": 1909} {"train_loss": -39.91240310668945, "global_step": 231071, "epoch": 1909} {"train_loss": -40.217403411865234, "global_step": 231072, "epoch": 1909} {"train_loss": -40.84278106689453, "global_step": 231073, "epoch": 1909} {"train_loss": -39.23773193359375, "global_step": 231074, "epoch": 1909} {"train_loss": -40.777099609375, "global_step": 231075, "epoch": 1909} {"train_loss": -39.047481536865234, "global_step": 231076, "epoch": 1909} {"train_loss": -41.64686965942383, "global_step": 231077, "epoch": 1909} {"train_loss": -40.337005615234375, "global_step": 231078, "epoch": 1909} {"train_loss": -41.09492874145508, "global_step": 231079, "epoch": 1909} {"train_loss": -41.212677001953125, "global_step": 231080, "epoch": 1909} {"train_loss": -40.728023529052734, "global_step": 231081, "epoch": 1909} {"train_loss": -40.938392639160156, "global_step": 231082, "epoch": 1909} {"train_loss": -41.330753326416016, "global_step": 231083, "epoch": 1909} {"train_loss": -39.8654670715332, "global_step": 231084, "epoch": 1909} {"train_loss": -41.015296936035156, "global_step": 231085, "epoch": 1909} {"train_loss": -41.06620407104492, "global_step": 231086, "epoch": 1909} {"train_loss": -40.400787353515625, "global_step": 231087, "epoch": 1909} {"train_loss": -40.68447494506836, "global_step": 231088, "epoch": 1909} {"train_loss": -40.78382110595703, "global_step": 231089, "epoch": 1909} {"train_loss": -41.247005462646484, "global_step": 231090, "epoch": 1909} {"train_loss": -40.29690170288086, "global_step": 231091, "epoch": 1909} {"train_loss": -41.30814743041992, "global_step": 231092, "epoch": 1909} {"train_loss": -41.5939826965332, "global_step": 231093, "epoch": 1909} {"train_loss": -41.214839935302734, "global_step": 231094, "epoch": 1909} {"train_loss": -41.333168029785156, "global_step": 231095, "epoch": 1909} {"train_loss": -40.54930877685547, "global_step": 231096, "epoch": 1909} {"train_loss": -40.99409103393555, "global_step": 231097, "epoch": 1909} {"train_loss": -41.255008697509766, "global_step": 231098, "epoch": 1909} {"train_loss": -40.908931732177734, "global_step": 231099, "epoch": 1909} {"train_loss": -39.959224700927734, "global_step": 231100, "epoch": 1909} {"train_loss": -41.41933822631836, "global_step": 231101, "epoch": 1909} {"train_loss": -40.960792541503906, "global_step": 231102, "epoch": 1909} {"train_loss": -40.48795700073242, "global_step": 231103, "epoch": 1909} {"train_loss": -40.15092849731445, "global_step": 231104, "epoch": 1909} {"train_loss": -40.562469482421875, "global_step": 231105, "epoch": 1909} {"train_loss": -41.0389518737793, "global_step": 231106, "epoch": 1909} {"train_loss": -41.32118606567383, "global_step": 231107, "epoch": 1909} {"train_loss": -41.3217887878418, "global_step": 231108, "epoch": 1909} {"train_loss": -40.81848352605646, "global_step": 231109, "epoch": 1909, "val_loss": 2494857.75} {"train_loss": -41.74509811401367, "global_step": 231110, "epoch": 1910} {"train_loss": -41.68397521972656, "global_step": 231111, "epoch": 1910} {"train_loss": -41.27240753173828, "global_step": 231112, "epoch": 1910} {"train_loss": -41.338600158691406, "global_step": 231113, "epoch": 1910} {"train_loss": -41.49567794799805, "global_step": 231114, "epoch": 1910} {"train_loss": -41.094085693359375, "global_step": 231115, "epoch": 1910} {"train_loss": -41.15827178955078, "global_step": 231116, "epoch": 1910} {"train_loss": -41.80241775512695, "global_step": 231117, "epoch": 1910} {"train_loss": -40.338314056396484, "global_step": 231118, "epoch": 1910} {"train_loss": -41.64787673950195, "global_step": 231119, "epoch": 1910} {"train_loss": -40.284908294677734, "global_step": 231120, "epoch": 1910} {"train_loss": -41.22450637817383, "global_step": 231121, "epoch": 1910} {"train_loss": -42.22014617919922, "global_step": 231122, "epoch": 1910} {"train_loss": -41.63212203979492, "global_step": 231123, "epoch": 1910} {"train_loss": -40.992042541503906, "global_step": 231124, "epoch": 1910} {"train_loss": -41.45782470703125, "global_step": 231125, "epoch": 1910} {"train_loss": -40.61161804199219, "global_step": 231126, "epoch": 1910} {"train_loss": -42.10712814331055, "global_step": 231127, "epoch": 1910} {"train_loss": -41.5404052734375, "global_step": 231128, "epoch": 1910} {"train_loss": -41.99115753173828, "global_step": 231129, "epoch": 1910} {"train_loss": -41.56370544433594, "global_step": 231130, "epoch": 1910} {"train_loss": -41.4176139831543, "global_step": 231131, "epoch": 1910} {"train_loss": -42.03998947143555, "global_step": 231132, "epoch": 1910} {"train_loss": -41.7121696472168, "global_step": 231133, "epoch": 1910} {"train_loss": -41.105098724365234, "global_step": 231134, "epoch": 1910} {"train_loss": -42.26494216918945, "global_step": 231135, "epoch": 1910} {"train_loss": -42.0659294128418, "global_step": 231136, "epoch": 1910} {"train_loss": -42.1251335144043, "global_step": 231137, "epoch": 1910} {"train_loss": -41.761783599853516, "global_step": 231138, "epoch": 1910} {"train_loss": -41.9904899597168, "global_step": 231139, "epoch": 1910} {"train_loss": -41.51668167114258, "global_step": 231140, "epoch": 1910} {"train_loss": -42.431827545166016, "global_step": 231141, "epoch": 1910} {"train_loss": -42.251522064208984, "global_step": 231142, "epoch": 1910} {"train_loss": -42.21392059326172, "global_step": 231143, "epoch": 1910} {"train_loss": -40.35824966430664, "global_step": 231144, "epoch": 1910} {"train_loss": -42.28124237060547, "global_step": 231145, "epoch": 1910} {"train_loss": -41.183074951171875, "global_step": 231146, "epoch": 1910} {"train_loss": -42.228633880615234, "global_step": 231147, "epoch": 1910} {"train_loss": -40.49980545043945, "global_step": 231148, "epoch": 1910} {"train_loss": -42.518733978271484, "global_step": 231149, "epoch": 1910} {"train_loss": -42.0703239440918, "global_step": 231150, "epoch": 1910} {"train_loss": -42.36125946044922, "global_step": 231151, "epoch": 1910} {"train_loss": -42.4345817565918, "global_step": 231152, "epoch": 1910} {"train_loss": -42.30316162109375, "global_step": 231153, "epoch": 1910} {"train_loss": -41.15261459350586, "global_step": 231154, "epoch": 1910} {"train_loss": -42.790435791015625, "global_step": 231155, "epoch": 1910} {"train_loss": -41.94523239135742, "global_step": 231156, "epoch": 1910} {"train_loss": -41.52846908569336, "global_step": 231157, "epoch": 1910} {"train_loss": -42.439544677734375, "global_step": 231158, "epoch": 1910} {"train_loss": -41.611873626708984, "global_step": 231159, "epoch": 1910} {"train_loss": -42.1507453918457, "global_step": 231160, "epoch": 1910} {"train_loss": -42.023616790771484, "global_step": 231161, "epoch": 1910} {"train_loss": -41.312435150146484, "global_step": 231162, "epoch": 1910} {"train_loss": -40.52260971069336, "global_step": 231163, "epoch": 1910} {"train_loss": -41.64217758178711, "global_step": 231164, "epoch": 1910} {"train_loss": -40.72562026977539, "global_step": 231165, "epoch": 1910} {"train_loss": -41.822566986083984, "global_step": 231166, "epoch": 1910} {"train_loss": -40.026554107666016, "global_step": 231167, "epoch": 1910} {"train_loss": -41.32655334472656, "global_step": 231168, "epoch": 1910} {"train_loss": -39.06736373901367, "global_step": 231169, "epoch": 1910} {"train_loss": -41.1220588684082, "global_step": 231170, "epoch": 1910} {"train_loss": -39.540706634521484, "global_step": 231171, "epoch": 1910} {"train_loss": -39.206974029541016, "global_step": 231172, "epoch": 1910} {"train_loss": -42.247169494628906, "global_step": 231173, "epoch": 1910} {"train_loss": -40.907745361328125, "global_step": 231174, "epoch": 1910} {"train_loss": -40.32300567626953, "global_step": 231175, "epoch": 1910} {"train_loss": -40.087703704833984, "global_step": 231176, "epoch": 1910} {"train_loss": -41.81958770751953, "global_step": 231177, "epoch": 1910} {"train_loss": -40.78627395629883, "global_step": 231178, "epoch": 1910} {"train_loss": -41.374996185302734, "global_step": 231179, "epoch": 1910} {"train_loss": -41.55448532104492, "global_step": 231180, "epoch": 1910} {"train_loss": -38.93272018432617, "global_step": 231181, "epoch": 1910} {"train_loss": -39.93498611450195, "global_step": 231182, "epoch": 1910} {"train_loss": -37.949066162109375, "global_step": 231183, "epoch": 1910} {"train_loss": -38.23017501831055, "global_step": 231184, "epoch": 1910} {"train_loss": -13.353294372558594, "global_step": 231185, "epoch": 1910} {"train_loss": -40.572418212890625, "global_step": 231186, "epoch": 1910} {"train_loss": -39.8519172668457, "global_step": 231187, "epoch": 1910} {"train_loss": -39.80063247680664, "global_step": 231188, "epoch": 1910} {"train_loss": -18.427593231201172, "global_step": 231189, "epoch": 1910} {"train_loss": -37.45756149291992, "global_step": 231190, "epoch": 1910} {"train_loss": -35.68211364746094, "global_step": 231191, "epoch": 1910} {"train_loss": -38.12514877319336, "global_step": 231192, "epoch": 1910} {"train_loss": -26.094207763671875, "global_step": 231193, "epoch": 1910} {"train_loss": 13.130072593688965, "global_step": 231194, "epoch": 1910} {"train_loss": -32.58137893676758, "global_step": 231195, "epoch": 1910} {"train_loss": -35.002437591552734, "global_step": 231196, "epoch": 1910} {"train_loss": -28.400846481323242, "global_step": 231197, "epoch": 1910} {"train_loss": -31.156896591186523, "global_step": 231198, "epoch": 1910} {"train_loss": -12.214746475219727, "global_step": 231199, "epoch": 1910} {"train_loss": -27.864002227783203, "global_step": 231200, "epoch": 1910} {"train_loss": -29.395587921142578, "global_step": 231201, "epoch": 1910} {"train_loss": -36.44900894165039, "global_step": 231202, "epoch": 1910} {"train_loss": -36.16339874267578, "global_step": 231203, "epoch": 1910} {"train_loss": -34.63481521606445, "global_step": 231204, "epoch": 1910} {"train_loss": -35.19823455810547, "global_step": 231205, "epoch": 1910} {"train_loss": -35.6585807800293, "global_step": 231206, "epoch": 1910} {"train_loss": -36.17897415161133, "global_step": 231207, "epoch": 1910} {"train_loss": -35.50455093383789, "global_step": 231208, "epoch": 1910} {"train_loss": -35.348106384277344, "global_step": 231209, "epoch": 1910} {"train_loss": -35.05269241333008, "global_step": 231210, "epoch": 1910} {"train_loss": -37.0927734375, "global_step": 231211, "epoch": 1910} {"train_loss": -35.80514144897461, "global_step": 231212, "epoch": 1910} {"train_loss": -37.22430419921875, "global_step": 231213, "epoch": 1910} {"train_loss": -37.763832092285156, "global_step": 231214, "epoch": 1910} {"train_loss": -36.367000579833984, "global_step": 231215, "epoch": 1910} {"train_loss": -36.237361907958984, "global_step": 231216, "epoch": 1910} {"train_loss": -37.39596176147461, "global_step": 231217, "epoch": 1910} {"train_loss": -37.378204345703125, "global_step": 231218, "epoch": 1910} {"train_loss": -37.434322357177734, "global_step": 231219, "epoch": 1910} {"train_loss": -38.3643684387207, "global_step": 231220, "epoch": 1910} {"train_loss": -38.071346282958984, "global_step": 231221, "epoch": 1910} {"train_loss": -37.55414581298828, "global_step": 231222, "epoch": 1910} {"train_loss": -37.402748107910156, "global_step": 231223, "epoch": 1910} {"train_loss": -37.13291549682617, "global_step": 231224, "epoch": 1910} {"train_loss": -37.46882247924805, "global_step": 231225, "epoch": 1910} {"train_loss": -38.29047393798828, "global_step": 231226, "epoch": 1910} {"train_loss": -37.102901458740234, "global_step": 231227, "epoch": 1910} {"train_loss": -38.19533157348633, "global_step": 231228, "epoch": 1910} {"train_loss": -37.25967025756836, "global_step": 231229, "epoch": 1910} {"train_loss": -38.344518574801356, "global_step": 231230, "epoch": 1910, "val_loss": 2651747.0} {"train_loss": -37.70991897583008, "global_step": 231231, "epoch": 1911} {"train_loss": -37.99123764038086, "global_step": 231232, "epoch": 1911} {"train_loss": -37.94621658325195, "global_step": 231233, "epoch": 1911} {"train_loss": -38.63848114013672, "global_step": 231234, "epoch": 1911} {"train_loss": -37.37388229370117, "global_step": 231235, "epoch": 1911} {"train_loss": -38.67304611206055, "global_step": 231236, "epoch": 1911} {"train_loss": -38.15235137939453, "global_step": 231237, "epoch": 1911} {"train_loss": -38.77024841308594, "global_step": 231238, "epoch": 1911} {"train_loss": -38.34462356567383, "global_step": 231239, "epoch": 1911} {"train_loss": -38.63822555541992, "global_step": 231240, "epoch": 1911} {"train_loss": -38.45703125, "global_step": 231241, "epoch": 1911} {"train_loss": -39.1739616394043, "global_step": 231242, "epoch": 1911} {"train_loss": -38.59415817260742, "global_step": 231243, "epoch": 1911} {"train_loss": -38.54850387573242, "global_step": 231244, "epoch": 1911} {"train_loss": -39.19725799560547, "global_step": 231245, "epoch": 1911} {"train_loss": -38.840980529785156, "global_step": 231246, "epoch": 1911} {"train_loss": -39.35000228881836, "global_step": 231247, "epoch": 1911} {"train_loss": -38.57839584350586, "global_step": 231248, "epoch": 1911} {"train_loss": -39.38395309448242, "global_step": 231249, "epoch": 1911} {"train_loss": -40.0764274597168, "global_step": 231250, "epoch": 1911} {"train_loss": -39.79557418823242, "global_step": 231251, "epoch": 1911} {"train_loss": -39.23908996582031, "global_step": 231252, "epoch": 1911} {"train_loss": -38.92115020751953, "global_step": 231253, "epoch": 1911} {"train_loss": -39.829315185546875, "global_step": 231254, "epoch": 1911} {"train_loss": -39.470027923583984, "global_step": 231255, "epoch": 1911} {"train_loss": -39.49406814575195, "global_step": 231256, "epoch": 1911} {"train_loss": -38.94727325439453, "global_step": 231257, "epoch": 1911} {"train_loss": -39.75954818725586, "global_step": 231258, "epoch": 1911} {"train_loss": -39.916473388671875, "global_step": 231259, "epoch": 1911} {"train_loss": -39.92017364501953, "global_step": 231260, "epoch": 1911} {"train_loss": -39.22367858886719, "global_step": 231261, "epoch": 1911} {"train_loss": -39.635711669921875, "global_step": 231262, "epoch": 1911} {"train_loss": -40.113155364990234, "global_step": 231263, "epoch": 1911} {"train_loss": -39.94038009643555, "global_step": 231264, "epoch": 1911} {"train_loss": -40.02675247192383, "global_step": 231265, "epoch": 1911} {"train_loss": -40.133026123046875, "global_step": 231266, "epoch": 1911} {"train_loss": -39.703453063964844, "global_step": 231267, "epoch": 1911} {"train_loss": -39.866249084472656, "global_step": 231268, "epoch": 1911} {"train_loss": -39.3940315246582, "global_step": 231269, "epoch": 1911} {"train_loss": -40.356689453125, "global_step": 231270, "epoch": 1911} {"train_loss": -40.215065002441406, "global_step": 231271, "epoch": 1911} {"train_loss": -40.018672943115234, "global_step": 231272, "epoch": 1911} {"train_loss": -40.46315383911133, "global_step": 231273, "epoch": 1911} {"train_loss": -40.46649169921875, "global_step": 231274, "epoch": 1911} {"train_loss": -39.85017013549805, "global_step": 231275, "epoch": 1911} {"train_loss": -40.004093170166016, "global_step": 231276, "epoch": 1911} {"train_loss": -40.287811279296875, "global_step": 231277, "epoch": 1911} {"train_loss": -40.90979766845703, "global_step": 231278, "epoch": 1911} {"train_loss": -40.74770736694336, "global_step": 231279, "epoch": 1911} {"train_loss": -40.39399337768555, "global_step": 231280, "epoch": 1911} {"train_loss": -40.165489196777344, "global_step": 231281, "epoch": 1911} {"train_loss": -41.13213348388672, "global_step": 231282, "epoch": 1911} {"train_loss": -40.907012939453125, "global_step": 231283, "epoch": 1911} {"train_loss": -40.07178497314453, "global_step": 231284, "epoch": 1911} {"train_loss": -39.82045364379883, "global_step": 231285, "epoch": 1911} {"train_loss": -41.2420768737793, "global_step": 231286, "epoch": 1911} {"train_loss": -40.812652587890625, "global_step": 231287, "epoch": 1911} {"train_loss": -40.88393783569336, "global_step": 231288, "epoch": 1911} {"train_loss": -40.915679931640625, "global_step": 231289, "epoch": 1911} {"train_loss": -41.05495834350586, "global_step": 231290, "epoch": 1911} {"train_loss": -39.69867706298828, "global_step": 231291, "epoch": 1911} {"train_loss": -40.00045394897461, "global_step": 231292, "epoch": 1911} {"train_loss": -41.590206146240234, "global_step": 231293, "epoch": 1911} {"train_loss": -41.25849914550781, "global_step": 231294, "epoch": 1911} {"train_loss": -40.859519958496094, "global_step": 231295, "epoch": 1911} {"train_loss": -41.36331558227539, "global_step": 231296, "epoch": 1911} {"train_loss": -41.07909393310547, "global_step": 231297, "epoch": 1911} {"train_loss": -41.48450469970703, "global_step": 231298, "epoch": 1911} {"train_loss": -40.576725006103516, "global_step": 231299, "epoch": 1911} {"train_loss": -40.85095977783203, "global_step": 231300, "epoch": 1911} {"train_loss": -41.106842041015625, "global_step": 231301, "epoch": 1911} {"train_loss": -40.787899017333984, "global_step": 231302, "epoch": 1911} {"train_loss": -41.389190673828125, "global_step": 231303, "epoch": 1911} {"train_loss": -40.88650894165039, "global_step": 231304, "epoch": 1911} {"train_loss": -41.8209342956543, "global_step": 231305, "epoch": 1911} {"train_loss": -40.055885314941406, "global_step": 231306, "epoch": 1911} {"train_loss": -41.83203887939453, "global_step": 231307, "epoch": 1911} {"train_loss": -41.231239318847656, "global_step": 231308, "epoch": 1911} {"train_loss": -41.98529815673828, "global_step": 231309, "epoch": 1911} {"train_loss": -41.36613845825195, "global_step": 231310, "epoch": 1911} {"train_loss": -40.89456558227539, "global_step": 231311, "epoch": 1911} {"train_loss": -41.79278564453125, "global_step": 231312, "epoch": 1911} {"train_loss": -41.1009635925293, "global_step": 231313, "epoch": 1911} {"train_loss": -41.5733528137207, "global_step": 231314, "epoch": 1911} {"train_loss": -40.868751525878906, "global_step": 231315, "epoch": 1911} {"train_loss": -41.05012893676758, "global_step": 231316, "epoch": 1911} {"train_loss": -41.49922561645508, "global_step": 231317, "epoch": 1911} {"train_loss": -42.11664962768555, "global_step": 231318, "epoch": 1911} {"train_loss": -41.034332275390625, "global_step": 231319, "epoch": 1911} {"train_loss": -42.080318450927734, "global_step": 231320, "epoch": 1911} {"train_loss": -41.61219787597656, "global_step": 231321, "epoch": 1911} {"train_loss": -40.44193649291992, "global_step": 231322, "epoch": 1911} {"train_loss": -41.36358642578125, "global_step": 231323, "epoch": 1911} {"train_loss": -40.90958786010742, "global_step": 231324, "epoch": 1911} {"train_loss": -40.888179779052734, "global_step": 231325, "epoch": 1911} {"train_loss": -42.52540969848633, "global_step": 231326, "epoch": 1911} {"train_loss": -42.459144592285156, "global_step": 231327, "epoch": 1911} {"train_loss": -41.73357009887695, "global_step": 231328, "epoch": 1911} {"train_loss": -40.9686393737793, "global_step": 231329, "epoch": 1911} {"train_loss": -41.0350456237793, "global_step": 231330, "epoch": 1911} {"train_loss": -41.30344772338867, "global_step": 231331, "epoch": 1911} {"train_loss": -41.91969680786133, "global_step": 231332, "epoch": 1911} {"train_loss": -41.99924850463867, "global_step": 231333, "epoch": 1911} {"train_loss": -40.54985427856445, "global_step": 231334, "epoch": 1911} {"train_loss": -40.741207122802734, "global_step": 231335, "epoch": 1911} {"train_loss": -41.35706329345703, "global_step": 231336, "epoch": 1911} {"train_loss": -41.13949203491211, "global_step": 231337, "epoch": 1911} {"train_loss": -39.800838470458984, "global_step": 231338, "epoch": 1911} {"train_loss": -40.701019287109375, "global_step": 231339, "epoch": 1911} {"train_loss": -40.9384765625, "global_step": 231340, "epoch": 1911} {"train_loss": -41.25035858154297, "global_step": 231341, "epoch": 1911} {"train_loss": -39.800350189208984, "global_step": 231342, "epoch": 1911} {"train_loss": -39.34770965576172, "global_step": 231343, "epoch": 1911} {"train_loss": -40.40125274658203, "global_step": 231344, "epoch": 1911} {"train_loss": -41.65818405151367, "global_step": 231345, "epoch": 1911} {"train_loss": -39.74597930908203, "global_step": 231346, "epoch": 1911} {"train_loss": -41.14418029785156, "global_step": 231347, "epoch": 1911} {"train_loss": -41.20597457885742, "global_step": 231348, "epoch": 1911} {"train_loss": -39.67829132080078, "global_step": 231349, "epoch": 1911} {"train_loss": -40.017822265625, "global_step": 231350, "epoch": 1911} {"train_loss": -40.33777590034422, "global_step": 231351, "epoch": 1911, "val_loss": 2627594.0} {"train_loss": -40.8456916809082, "global_step": 231352, "epoch": 1912} {"train_loss": -41.39616775512695, "global_step": 231353, "epoch": 1912} {"train_loss": -40.95840072631836, "global_step": 231354, "epoch": 1912} {"train_loss": -38.99803161621094, "global_step": 231355, "epoch": 1912} {"train_loss": -40.41021728515625, "global_step": 231356, "epoch": 1912} {"train_loss": -40.19468307495117, "global_step": 231357, "epoch": 1912} {"train_loss": -41.015560150146484, "global_step": 231358, "epoch": 1912} {"train_loss": -40.0262336730957, "global_step": 231359, "epoch": 1912} {"train_loss": -39.67635726928711, "global_step": 231360, "epoch": 1912} {"train_loss": -39.85200119018555, "global_step": 231361, "epoch": 1912} {"train_loss": -41.44198989868164, "global_step": 231362, "epoch": 1912} {"train_loss": -39.95904541015625, "global_step": 231363, "epoch": 1912} {"train_loss": -40.17827224731445, "global_step": 231364, "epoch": 1912} {"train_loss": -40.9133186340332, "global_step": 231365, "epoch": 1912} {"train_loss": -40.33308029174805, "global_step": 231366, "epoch": 1912} {"train_loss": -40.40629959106445, "global_step": 231367, "epoch": 1912} {"train_loss": -41.45686721801758, "global_step": 231368, "epoch": 1912} {"train_loss": -40.105281829833984, "global_step": 231369, "epoch": 1912} {"train_loss": -41.04841613769531, "global_step": 231370, "epoch": 1912} {"train_loss": -40.71782684326172, "global_step": 231371, "epoch": 1912} {"train_loss": -40.50537109375, "global_step": 231372, "epoch": 1912} {"train_loss": -40.07052993774414, "global_step": 231373, "epoch": 1912} {"train_loss": -41.80550003051758, "global_step": 231374, "epoch": 1912} {"train_loss": -41.012718200683594, "global_step": 231375, "epoch": 1912} {"train_loss": -40.69953536987305, "global_step": 231376, "epoch": 1912} {"train_loss": -41.56067657470703, "global_step": 231377, "epoch": 1912} {"train_loss": -40.78076934814453, "global_step": 231378, "epoch": 1912} {"train_loss": -42.21172332763672, "global_step": 231379, "epoch": 1912} {"train_loss": -41.160709381103516, "global_step": 231380, "epoch": 1912} {"train_loss": -41.60869216918945, "global_step": 231381, "epoch": 1912} {"train_loss": -40.8372688293457, "global_step": 231382, "epoch": 1912} {"train_loss": -41.75503158569336, "global_step": 231383, "epoch": 1912} {"train_loss": -40.42755889892578, "global_step": 231384, "epoch": 1912} {"train_loss": -40.543975830078125, "global_step": 231385, "epoch": 1912} {"train_loss": -41.24425506591797, "global_step": 231386, "epoch": 1912} {"train_loss": -41.80337142944336, "global_step": 231387, "epoch": 1912} {"train_loss": -41.274044036865234, "global_step": 231388, "epoch": 1912} {"train_loss": -41.390235900878906, "global_step": 231389, "epoch": 1912} {"train_loss": -41.25447082519531, "global_step": 231390, "epoch": 1912} {"train_loss": -40.734764099121094, "global_step": 231391, "epoch": 1912} {"train_loss": -41.11984634399414, "global_step": 231392, "epoch": 1912} {"train_loss": -39.943843841552734, "global_step": 231393, "epoch": 1912} {"train_loss": -40.5109977722168, "global_step": 231394, "epoch": 1912} {"train_loss": -41.45155715942383, "global_step": 231395, "epoch": 1912} {"train_loss": -41.58396530151367, "global_step": 231396, "epoch": 1912} {"train_loss": -39.600826263427734, "global_step": 231397, "epoch": 1912} {"train_loss": -40.57156753540039, "global_step": 231398, "epoch": 1912} {"train_loss": -40.61285400390625, "global_step": 231399, "epoch": 1912} {"train_loss": -40.60611343383789, "global_step": 231400, "epoch": 1912} {"train_loss": -42.0446891784668, "global_step": 231401, "epoch": 1912} {"train_loss": -41.44746017456055, "global_step": 231402, "epoch": 1912} {"train_loss": -39.50069046020508, "global_step": 231403, "epoch": 1912} {"train_loss": -41.26433181762695, "global_step": 231404, "epoch": 1912} {"train_loss": -41.1890869140625, "global_step": 231405, "epoch": 1912} {"train_loss": -40.87702941894531, "global_step": 231406, "epoch": 1912} {"train_loss": -39.67576599121094, "global_step": 231407, "epoch": 1912} {"train_loss": -38.160343170166016, "global_step": 231408, "epoch": 1912} {"train_loss": -38.7985725402832, "global_step": 231409, "epoch": 1912} {"train_loss": -39.81223678588867, "global_step": 231410, "epoch": 1912} {"train_loss": -41.96026611328125, "global_step": 231411, "epoch": 1912} {"train_loss": -40.466617584228516, "global_step": 231412, "epoch": 1912} {"train_loss": -40.62656784057617, "global_step": 231413, "epoch": 1912} {"train_loss": -41.11566162109375, "global_step": 231414, "epoch": 1912} {"train_loss": -40.91094970703125, "global_step": 231415, "epoch": 1912} {"train_loss": -40.88068389892578, "global_step": 231416, "epoch": 1912} {"train_loss": -41.45779800415039, "global_step": 231417, "epoch": 1912} {"train_loss": -40.90976333618164, "global_step": 231418, "epoch": 1912} {"train_loss": -41.788082122802734, "global_step": 231419, "epoch": 1912} {"train_loss": -41.210731506347656, "global_step": 231420, "epoch": 1912} {"train_loss": -41.9389762878418, "global_step": 231421, "epoch": 1912} {"train_loss": -41.38902282714844, "global_step": 231422, "epoch": 1912} {"train_loss": -41.317378997802734, "global_step": 231423, "epoch": 1912} {"train_loss": -41.62910079956055, "global_step": 231424, "epoch": 1912} {"train_loss": -40.72037887573242, "global_step": 231425, "epoch": 1912} {"train_loss": -41.3609619140625, "global_step": 231426, "epoch": 1912} {"train_loss": -41.334632873535156, "global_step": 231427, "epoch": 1912} {"train_loss": -41.71662521362305, "global_step": 231428, "epoch": 1912} {"train_loss": -41.80366897583008, "global_step": 231429, "epoch": 1912} {"train_loss": -41.60587692260742, "global_step": 231430, "epoch": 1912} {"train_loss": -42.000423431396484, "global_step": 231431, "epoch": 1912} {"train_loss": -41.5566520690918, "global_step": 231432, "epoch": 1912} {"train_loss": -42.61384963989258, "global_step": 231433, "epoch": 1912} {"train_loss": -41.7743034362793, "global_step": 231434, "epoch": 1912} {"train_loss": -41.65113067626953, "global_step": 231435, "epoch": 1912} {"train_loss": -41.96187210083008, "global_step": 231436, "epoch": 1912} {"train_loss": -41.63985824584961, "global_step": 231437, "epoch": 1912} {"train_loss": -42.3015251159668, "global_step": 231438, "epoch": 1912} {"train_loss": -42.05752182006836, "global_step": 231439, "epoch": 1912} {"train_loss": -42.24094772338867, "global_step": 231440, "epoch": 1912} {"train_loss": -42.126548767089844, "global_step": 231441, "epoch": 1912} {"train_loss": -40.72465133666992, "global_step": 231442, "epoch": 1912} {"train_loss": -42.28318405151367, "global_step": 231443, "epoch": 1912} {"train_loss": -41.897552490234375, "global_step": 231444, "epoch": 1912} {"train_loss": -41.47105407714844, "global_step": 231445, "epoch": 1912} {"train_loss": -41.32033920288086, "global_step": 231446, "epoch": 1912} {"train_loss": -41.89408493041992, "global_step": 231447, "epoch": 1912} {"train_loss": -41.91475296020508, "global_step": 231448, "epoch": 1912} {"train_loss": -41.12014389038086, "global_step": 231449, "epoch": 1912} {"train_loss": -40.644229888916016, "global_step": 231450, "epoch": 1912} {"train_loss": -39.98543930053711, "global_step": 231451, "epoch": 1912} {"train_loss": -41.47544479370117, "global_step": 231452, "epoch": 1912} {"train_loss": -42.477569580078125, "global_step": 231453, "epoch": 1912} {"train_loss": -42.12651062011719, "global_step": 231454, "epoch": 1912} {"train_loss": -42.371238708496094, "global_step": 231455, "epoch": 1912} {"train_loss": -41.31804275512695, "global_step": 231456, "epoch": 1912} {"train_loss": -40.91475296020508, "global_step": 231457, "epoch": 1912} {"train_loss": -41.806915283203125, "global_step": 231458, "epoch": 1912} {"train_loss": -41.00962448120117, "global_step": 231459, "epoch": 1912} {"train_loss": -42.082191467285156, "global_step": 231460, "epoch": 1912} {"train_loss": -41.57532501220703, "global_step": 231461, "epoch": 1912} {"train_loss": -42.27546310424805, "global_step": 231462, "epoch": 1912} {"train_loss": -41.1949577331543, "global_step": 231463, "epoch": 1912} {"train_loss": -41.45327377319336, "global_step": 231464, "epoch": 1912} {"train_loss": -42.36701583862305, "global_step": 231465, "epoch": 1912} {"train_loss": -41.87092208862305, "global_step": 231466, "epoch": 1912} {"train_loss": -42.08332061767578, "global_step": 231467, "epoch": 1912} {"train_loss": -42.2394905090332, "global_step": 231468, "epoch": 1912} {"train_loss": -41.24137496948242, "global_step": 231469, "epoch": 1912} {"train_loss": -42.6124382019043, "global_step": 231470, "epoch": 1912} {"train_loss": -40.9419059753418, "global_step": 231471, "epoch": 1912} {"train_loss": -41.16156195017917, "global_step": 231472, "epoch": 1912, "val_loss": 2705425.25} {"train_loss": -41.11130905151367, "global_step": 231473, "epoch": 1913} {"train_loss": -40.074588775634766, "global_step": 231474, "epoch": 1913} {"train_loss": -41.82072448730469, "global_step": 231475, "epoch": 1913} {"train_loss": -41.31124496459961, "global_step": 231476, "epoch": 1913} {"train_loss": -39.951412200927734, "global_step": 231477, "epoch": 1913} {"train_loss": -40.030601501464844, "global_step": 231478, "epoch": 1913} {"train_loss": -40.72285842895508, "global_step": 231479, "epoch": 1913} {"train_loss": -40.8978385925293, "global_step": 231480, "epoch": 1913} {"train_loss": -40.91947555541992, "global_step": 231481, "epoch": 1913} {"train_loss": -40.7358512878418, "global_step": 231482, "epoch": 1913} {"train_loss": -40.21438217163086, "global_step": 231483, "epoch": 1913} {"train_loss": -39.30227279663086, "global_step": 231484, "epoch": 1913} {"train_loss": -41.497093200683594, "global_step": 231485, "epoch": 1913} {"train_loss": -41.67906951904297, "global_step": 231486, "epoch": 1913} {"train_loss": -37.127925872802734, "global_step": 231487, "epoch": 1913} {"train_loss": -39.1723518371582, "global_step": 231488, "epoch": 1913} {"train_loss": -39.33507537841797, "global_step": 231489, "epoch": 1913} {"train_loss": -38.99554443359375, "global_step": 231490, "epoch": 1913} {"train_loss": -40.827754974365234, "global_step": 231491, "epoch": 1913} {"train_loss": -38.08620071411133, "global_step": 231492, "epoch": 1913} {"train_loss": -38.34566879272461, "global_step": 231493, "epoch": 1913} {"train_loss": -40.783782958984375, "global_step": 231494, "epoch": 1913} {"train_loss": -40.10193634033203, "global_step": 231495, "epoch": 1913} {"train_loss": -40.963043212890625, "global_step": 231496, "epoch": 1913} {"train_loss": -40.00579833984375, "global_step": 231497, "epoch": 1913} {"train_loss": -39.7309455871582, "global_step": 231498, "epoch": 1913} {"train_loss": -41.1907958984375, "global_step": 231499, "epoch": 1913} {"train_loss": -40.170928955078125, "global_step": 231500, "epoch": 1913} {"train_loss": -41.24671173095703, "global_step": 231501, "epoch": 1913} {"train_loss": -40.47718048095703, "global_step": 231502, "epoch": 1913} {"train_loss": -41.66993713378906, "global_step": 231503, "epoch": 1913} {"train_loss": -41.45542526245117, "global_step": 231504, "epoch": 1913} {"train_loss": -40.920047760009766, "global_step": 231505, "epoch": 1913} {"train_loss": -40.91652297973633, "global_step": 231506, "epoch": 1913} {"train_loss": -38.801116943359375, "global_step": 231507, "epoch": 1913} {"train_loss": -40.231689453125, "global_step": 231508, "epoch": 1913} {"train_loss": -40.81793975830078, "global_step": 231509, "epoch": 1913} {"train_loss": -41.47529220581055, "global_step": 231510, "epoch": 1913} {"train_loss": -41.37466812133789, "global_step": 231511, "epoch": 1913} {"train_loss": -42.10516357421875, "global_step": 231512, "epoch": 1913} {"train_loss": -41.5306282043457, "global_step": 231513, "epoch": 1913} {"train_loss": -41.64243698120117, "global_step": 231514, "epoch": 1913} {"train_loss": -42.126747131347656, "global_step": 231515, "epoch": 1913} {"train_loss": -41.3538703918457, "global_step": 231516, "epoch": 1913} {"train_loss": -39.17020797729492, "global_step": 231517, "epoch": 1913} {"train_loss": -40.80365753173828, "global_step": 231518, "epoch": 1913} {"train_loss": -41.84522247314453, "global_step": 231519, "epoch": 1913} {"train_loss": -40.7523078918457, "global_step": 231520, "epoch": 1913} {"train_loss": -39.865108489990234, "global_step": 231521, "epoch": 1913} {"train_loss": -40.34128952026367, "global_step": 231522, "epoch": 1913} {"train_loss": -40.381343841552734, "global_step": 231523, "epoch": 1913} {"train_loss": -40.4275016784668, "global_step": 231524, "epoch": 1913} {"train_loss": -40.537166595458984, "global_step": 231525, "epoch": 1913} {"train_loss": -40.677284240722656, "global_step": 231526, "epoch": 1913} {"train_loss": -41.199337005615234, "global_step": 231527, "epoch": 1913} {"train_loss": -41.269287109375, "global_step": 231528, "epoch": 1913} {"train_loss": -41.23982238769531, "global_step": 231529, "epoch": 1913} {"train_loss": -39.38772201538086, "global_step": 231530, "epoch": 1913} {"train_loss": -41.51186752319336, "global_step": 231531, "epoch": 1913} {"train_loss": -41.2208366394043, "global_step": 231532, "epoch": 1913} {"train_loss": -41.008697509765625, "global_step": 231533, "epoch": 1913} {"train_loss": -39.806556701660156, "global_step": 231534, "epoch": 1913} {"train_loss": -41.452880859375, "global_step": 231535, "epoch": 1913} {"train_loss": -41.6401481628418, "global_step": 231536, "epoch": 1913} {"train_loss": -41.129981994628906, "global_step": 231537, "epoch": 1913} {"train_loss": -40.96685791015625, "global_step": 231538, "epoch": 1913} {"train_loss": -41.12966537475586, "global_step": 231539, "epoch": 1913} {"train_loss": -41.77704620361328, "global_step": 231540, "epoch": 1913} {"train_loss": -40.94388961791992, "global_step": 231541, "epoch": 1913} {"train_loss": -40.60818862915039, "global_step": 231542, "epoch": 1913} {"train_loss": -39.48804473876953, "global_step": 231543, "epoch": 1913} {"train_loss": -37.1294059753418, "global_step": 231544, "epoch": 1913} {"train_loss": -39.420467376708984, "global_step": 231545, "epoch": 1913} {"train_loss": -41.11415100097656, "global_step": 231546, "epoch": 1913} {"train_loss": -40.292789459228516, "global_step": 231547, "epoch": 1913} {"train_loss": -37.94306182861328, "global_step": 231548, "epoch": 1913} {"train_loss": -41.12075424194336, "global_step": 231549, "epoch": 1913} {"train_loss": -34.98220443725586, "global_step": 231550, "epoch": 1913} {"train_loss": -39.08785629272461, "global_step": 231551, "epoch": 1913} {"train_loss": -35.60061264038086, "global_step": 231552, "epoch": 1913} {"train_loss": -38.47019577026367, "global_step": 231553, "epoch": 1913} {"train_loss": -35.9882698059082, "global_step": 231554, "epoch": 1913} {"train_loss": -34.15937805175781, "global_step": 231555, "epoch": 1913} {"train_loss": -35.679988861083984, "global_step": 231556, "epoch": 1913} {"train_loss": -39.295166015625, "global_step": 231557, "epoch": 1913} {"train_loss": -38.03083038330078, "global_step": 231558, "epoch": 1913} {"train_loss": -34.51481628417969, "global_step": 231559, "epoch": 1913} {"train_loss": -34.95366287231445, "global_step": 231560, "epoch": 1913} {"train_loss": -36.94972610473633, "global_step": 231561, "epoch": 1913} {"train_loss": -38.23300552368164, "global_step": 231562, "epoch": 1913} {"train_loss": -35.18819808959961, "global_step": 231563, "epoch": 1913} {"train_loss": -37.53225326538086, "global_step": 231564, "epoch": 1913} {"train_loss": -32.234893798828125, "global_step": 231565, "epoch": 1913} {"train_loss": -38.7008056640625, "global_step": 231566, "epoch": 1913} {"train_loss": -33.54840850830078, "global_step": 231567, "epoch": 1913} {"train_loss": -35.785552978515625, "global_step": 231568, "epoch": 1913} {"train_loss": -38.996341705322266, "global_step": 231569, "epoch": 1913} {"train_loss": -38.680999755859375, "global_step": 231570, "epoch": 1913} {"train_loss": -35.800472259521484, "global_step": 231571, "epoch": 1913} {"train_loss": -34.074317932128906, "global_step": 231572, "epoch": 1913} {"train_loss": -38.69198226928711, "global_step": 231573, "epoch": 1913} {"train_loss": -34.62628173828125, "global_step": 231574, "epoch": 1913} {"train_loss": -36.719993591308594, "global_step": 231575, "epoch": 1913} {"train_loss": -34.42623519897461, "global_step": 231576, "epoch": 1913} {"train_loss": -39.36833953857422, "global_step": 231577, "epoch": 1913} {"train_loss": -36.75681686401367, "global_step": 231578, "epoch": 1913} {"train_loss": -37.335052490234375, "global_step": 231579, "epoch": 1913} {"train_loss": -36.23887252807617, "global_step": 231580, "epoch": 1913} {"train_loss": -36.77031707763672, "global_step": 231581, "epoch": 1913} {"train_loss": -36.45954513549805, "global_step": 231582, "epoch": 1913} {"train_loss": -37.209712982177734, "global_step": 231583, "epoch": 1913} {"train_loss": -39.30532455444336, "global_step": 231584, "epoch": 1913} {"train_loss": -37.86833572387695, "global_step": 231585, "epoch": 1913} {"train_loss": -37.807735443115234, "global_step": 231586, "epoch": 1913} {"train_loss": -38.436126708984375, "global_step": 231587, "epoch": 1913} {"train_loss": -38.927947998046875, "global_step": 231588, "epoch": 1913} {"train_loss": -38.19387435913086, "global_step": 231589, "epoch": 1913} {"train_loss": -38.57249450683594, "global_step": 231590, "epoch": 1913} {"train_loss": -38.58223342895508, "global_step": 231591, "epoch": 1913} {"train_loss": -36.81618118286133, "global_step": 231592, "epoch": 1913} {"train_loss": -39.20872920012671, "global_step": 231593, "epoch": 1913, "val_loss": 2761711.75} {"train_loss": -39.37678527832031, "global_step": 231594, "epoch": 1914} {"train_loss": -39.53241729736328, "global_step": 231595, "epoch": 1914} {"train_loss": -38.858489990234375, "global_step": 231596, "epoch": 1914} {"train_loss": -39.91008758544922, "global_step": 231597, "epoch": 1914} {"train_loss": -39.454586029052734, "global_step": 231598, "epoch": 1914} {"train_loss": -40.45104217529297, "global_step": 231599, "epoch": 1914} {"train_loss": -39.91286849975586, "global_step": 231600, "epoch": 1914} {"train_loss": -39.55234909057617, "global_step": 231601, "epoch": 1914} {"train_loss": -39.35802459716797, "global_step": 231602, "epoch": 1914} {"train_loss": -38.63776397705078, "global_step": 231603, "epoch": 1914} {"train_loss": -38.530601501464844, "global_step": 231604, "epoch": 1914} {"train_loss": -38.789161682128906, "global_step": 231605, "epoch": 1914} {"train_loss": -39.400264739990234, "global_step": 231606, "epoch": 1914} {"train_loss": -39.40127182006836, "global_step": 231607, "epoch": 1914} {"train_loss": -40.10839080810547, "global_step": 231608, "epoch": 1914} {"train_loss": -40.083595275878906, "global_step": 231609, "epoch": 1914} {"train_loss": -40.19306564331055, "global_step": 231610, "epoch": 1914} {"train_loss": -40.31083297729492, "global_step": 231611, "epoch": 1914} {"train_loss": -40.13227081298828, "global_step": 231612, "epoch": 1914} {"train_loss": -40.96401596069336, "global_step": 231613, "epoch": 1914} {"train_loss": -38.6367301940918, "global_step": 231614, "epoch": 1914} {"train_loss": -40.23923873901367, "global_step": 231615, "epoch": 1914} {"train_loss": -39.57978057861328, "global_step": 231616, "epoch": 1914} {"train_loss": -40.37042999267578, "global_step": 231617, "epoch": 1914} {"train_loss": -40.59579849243164, "global_step": 231618, "epoch": 1914} {"train_loss": -40.930912017822266, "global_step": 231619, "epoch": 1914} {"train_loss": -40.050209045410156, "global_step": 231620, "epoch": 1914} {"train_loss": -39.55242919921875, "global_step": 231621, "epoch": 1914} {"train_loss": -41.063819885253906, "global_step": 231622, "epoch": 1914} {"train_loss": -41.05973815917969, "global_step": 231623, "epoch": 1914} {"train_loss": -40.43326187133789, "global_step": 231624, "epoch": 1914} {"train_loss": -40.76245880126953, "global_step": 231625, "epoch": 1914} {"train_loss": -40.961456298828125, "global_step": 231626, "epoch": 1914} {"train_loss": -40.8229866027832, "global_step": 231627, "epoch": 1914} {"train_loss": -40.6926383972168, "global_step": 231628, "epoch": 1914} {"train_loss": -41.23456954956055, "global_step": 231629, "epoch": 1914} {"train_loss": -41.430728912353516, "global_step": 231630, "epoch": 1914} {"train_loss": -41.010498046875, "global_step": 231631, "epoch": 1914} {"train_loss": -41.41827392578125, "global_step": 231632, "epoch": 1914} {"train_loss": -41.24811553955078, "global_step": 231633, "epoch": 1914} {"train_loss": -41.187984466552734, "global_step": 231634, "epoch": 1914} {"train_loss": -40.4874382019043, "global_step": 231635, "epoch": 1914} {"train_loss": -41.490638732910156, "global_step": 231636, "epoch": 1914} {"train_loss": -41.79859924316406, "global_step": 231637, "epoch": 1914} {"train_loss": -41.60409164428711, "global_step": 231638, "epoch": 1914} {"train_loss": -41.6727409362793, "global_step": 231639, "epoch": 1914} {"train_loss": -41.69331741333008, "global_step": 231640, "epoch": 1914} {"train_loss": -41.02490997314453, "global_step": 231641, "epoch": 1914} {"train_loss": -41.56963348388672, "global_step": 231642, "epoch": 1914} {"train_loss": -41.607696533203125, "global_step": 231643, "epoch": 1914} {"train_loss": -40.982948303222656, "global_step": 231644, "epoch": 1914} {"train_loss": -40.97551345825195, "global_step": 231645, "epoch": 1914} {"train_loss": -41.647254943847656, "global_step": 231646, "epoch": 1914} {"train_loss": -41.17715835571289, "global_step": 231647, "epoch": 1914} {"train_loss": -41.9964485168457, "global_step": 231648, "epoch": 1914} {"train_loss": -41.91202163696289, "global_step": 231649, "epoch": 1914} {"train_loss": -42.28763961791992, "global_step": 231650, "epoch": 1914} {"train_loss": -41.19032669067383, "global_step": 231651, "epoch": 1914} {"train_loss": -41.77953338623047, "global_step": 231652, "epoch": 1914} {"train_loss": -41.77962875366211, "global_step": 231653, "epoch": 1914} {"train_loss": -41.5444450378418, "global_step": 231654, "epoch": 1914} {"train_loss": -41.92746353149414, "global_step": 231655, "epoch": 1914} {"train_loss": -41.62293243408203, "global_step": 231656, "epoch": 1914} {"train_loss": -41.873023986816406, "global_step": 231657, "epoch": 1914} {"train_loss": -42.2970085144043, "global_step": 231658, "epoch": 1914} {"train_loss": -42.063232421875, "global_step": 231659, "epoch": 1914} {"train_loss": -42.00542068481445, "global_step": 231660, "epoch": 1914} {"train_loss": -42.11975860595703, "global_step": 231661, "epoch": 1914} {"train_loss": -41.1650505065918, "global_step": 231662, "epoch": 1914} {"train_loss": -42.42985916137695, "global_step": 231663, "epoch": 1914} {"train_loss": -42.06074142456055, "global_step": 231664, "epoch": 1914} {"train_loss": -42.37245178222656, "global_step": 231665, "epoch": 1914} {"train_loss": -41.09585952758789, "global_step": 231666, "epoch": 1914} {"train_loss": -41.66426467895508, "global_step": 231667, "epoch": 1914} {"train_loss": -42.31053924560547, "global_step": 231668, "epoch": 1914} {"train_loss": -42.19160461425781, "global_step": 231669, "epoch": 1914} {"train_loss": -41.90684127807617, "global_step": 231670, "epoch": 1914} {"train_loss": -42.00355911254883, "global_step": 231671, "epoch": 1914} {"train_loss": -41.926456451416016, "global_step": 231672, "epoch": 1914} {"train_loss": -42.130615234375, "global_step": 231673, "epoch": 1914} {"train_loss": -42.253047943115234, "global_step": 231674, "epoch": 1914} {"train_loss": -41.6502685546875, "global_step": 231675, "epoch": 1914} {"train_loss": -41.47402572631836, "global_step": 231676, "epoch": 1914} {"train_loss": -42.11935043334961, "global_step": 231677, "epoch": 1914} {"train_loss": -41.481204986572266, "global_step": 231678, "epoch": 1914} {"train_loss": -42.46942901611328, "global_step": 231679, "epoch": 1914} {"train_loss": -42.603477478027344, "global_step": 231680, "epoch": 1914} {"train_loss": -41.9554443359375, "global_step": 231681, "epoch": 1914} {"train_loss": -42.47154998779297, "global_step": 231682, "epoch": 1914} {"train_loss": -41.59663009643555, "global_step": 231683, "epoch": 1914} {"train_loss": -42.446815490722656, "global_step": 231684, "epoch": 1914} {"train_loss": -41.530330657958984, "global_step": 231685, "epoch": 1914} {"train_loss": -41.0654296875, "global_step": 231686, "epoch": 1914} {"train_loss": -41.99257278442383, "global_step": 231687, "epoch": 1914} {"train_loss": -42.379817962646484, "global_step": 231688, "epoch": 1914} {"train_loss": -41.1910285949707, "global_step": 231689, "epoch": 1914} {"train_loss": -42.26386260986328, "global_step": 231690, "epoch": 1914} {"train_loss": -42.475406646728516, "global_step": 231691, "epoch": 1914} {"train_loss": -42.792205810546875, "global_step": 231692, "epoch": 1914} {"train_loss": -42.1104621887207, "global_step": 231693, "epoch": 1914} {"train_loss": -42.59855651855469, "global_step": 231694, "epoch": 1914} {"train_loss": -41.63245391845703, "global_step": 231695, "epoch": 1914} {"train_loss": -42.7015266418457, "global_step": 231696, "epoch": 1914} {"train_loss": -41.97249221801758, "global_step": 231697, "epoch": 1914} {"train_loss": -42.499027252197266, "global_step": 231698, "epoch": 1914} {"train_loss": -42.73706817626953, "global_step": 231699, "epoch": 1914} {"train_loss": -41.94449996948242, "global_step": 231700, "epoch": 1914} {"train_loss": -42.31118392944336, "global_step": 231701, "epoch": 1914} {"train_loss": -42.3864860534668, "global_step": 231702, "epoch": 1914} {"train_loss": -42.8194694519043, "global_step": 231703, "epoch": 1914} {"train_loss": -41.984962463378906, "global_step": 231704, "epoch": 1914} {"train_loss": -41.7490119934082, "global_step": 231705, "epoch": 1914} {"train_loss": -41.5353889465332, "global_step": 231706, "epoch": 1914} {"train_loss": -41.31508255004883, "global_step": 231707, "epoch": 1914} {"train_loss": -40.811378479003906, "global_step": 231708, "epoch": 1914} {"train_loss": -41.45936965942383, "global_step": 231709, "epoch": 1914} {"train_loss": -40.93507766723633, "global_step": 231710, "epoch": 1914} {"train_loss": -41.92902755737305, "global_step": 231711, "epoch": 1914} {"train_loss": -41.53245162963867, "global_step": 231712, "epoch": 1914} {"train_loss": -40.53242874145508, "global_step": 231713, "epoch": 1914} {"train_loss": -41.25777551950502, "global_step": 231714, "epoch": 1914, "val_loss": 2592019.5} {"train_loss": -40.903316497802734, "global_step": 231715, "epoch": 1915} {"train_loss": -41.928829193115234, "global_step": 231716, "epoch": 1915} {"train_loss": -39.017982482910156, "global_step": 231717, "epoch": 1915} {"train_loss": -39.988346099853516, "global_step": 231718, "epoch": 1915} {"train_loss": -37.84035110473633, "global_step": 231719, "epoch": 1915} {"train_loss": -38.6058349609375, "global_step": 231720, "epoch": 1915} {"train_loss": -40.56571578979492, "global_step": 231721, "epoch": 1915} {"train_loss": -41.050140380859375, "global_step": 231722, "epoch": 1915} {"train_loss": -41.237056732177734, "global_step": 231723, "epoch": 1915} {"train_loss": -39.997066497802734, "global_step": 231724, "epoch": 1915} {"train_loss": -40.50012969970703, "global_step": 231725, "epoch": 1915} {"train_loss": -41.314788818359375, "global_step": 231726, "epoch": 1915} {"train_loss": -40.632240295410156, "global_step": 231727, "epoch": 1915} {"train_loss": -41.30795669555664, "global_step": 231728, "epoch": 1915} {"train_loss": -40.81209182739258, "global_step": 231729, "epoch": 1915} {"train_loss": -39.93309020996094, "global_step": 231730, "epoch": 1915} {"train_loss": -40.79104995727539, "global_step": 231731, "epoch": 1915} {"train_loss": -39.078651428222656, "global_step": 231732, "epoch": 1915} {"train_loss": -36.116695404052734, "global_step": 231733, "epoch": 1915} {"train_loss": -40.40780258178711, "global_step": 231734, "epoch": 1915} {"train_loss": -40.025123596191406, "global_step": 231735, "epoch": 1915} {"train_loss": -36.66158676147461, "global_step": 231736, "epoch": 1915} {"train_loss": -40.207618713378906, "global_step": 231737, "epoch": 1915} {"train_loss": -38.52241134643555, "global_step": 231738, "epoch": 1915} {"train_loss": -41.627655029296875, "global_step": 231739, "epoch": 1915} {"train_loss": -38.2457275390625, "global_step": 231740, "epoch": 1915} {"train_loss": -39.4290885925293, "global_step": 231741, "epoch": 1915} {"train_loss": -40.16743087768555, "global_step": 231742, "epoch": 1915} {"train_loss": -40.51847839355469, "global_step": 231743, "epoch": 1915} {"train_loss": -39.68464660644531, "global_step": 231744, "epoch": 1915} {"train_loss": -40.2060661315918, "global_step": 231745, "epoch": 1915} {"train_loss": -40.81988525390625, "global_step": 231746, "epoch": 1915} {"train_loss": -39.210784912109375, "global_step": 231747, "epoch": 1915} {"train_loss": -41.41377639770508, "global_step": 231748, "epoch": 1915} {"train_loss": -38.73280715942383, "global_step": 231749, "epoch": 1915} {"train_loss": -41.7615852355957, "global_step": 231750, "epoch": 1915} {"train_loss": -41.07917785644531, "global_step": 231751, "epoch": 1915} {"train_loss": -39.76852035522461, "global_step": 231752, "epoch": 1915} {"train_loss": -41.10992431640625, "global_step": 231753, "epoch": 1915} {"train_loss": -40.8343505859375, "global_step": 231754, "epoch": 1915} {"train_loss": -40.33751678466797, "global_step": 231755, "epoch": 1915} {"train_loss": -41.42574691772461, "global_step": 231756, "epoch": 1915} {"train_loss": -38.255577087402344, "global_step": 231757, "epoch": 1915} {"train_loss": -42.01899337768555, "global_step": 231758, "epoch": 1915} {"train_loss": -40.409053802490234, "global_step": 231759, "epoch": 1915} {"train_loss": -39.988433837890625, "global_step": 231760, "epoch": 1915} {"train_loss": -41.80933380126953, "global_step": 231761, "epoch": 1915} {"train_loss": -40.237064361572266, "global_step": 231762, "epoch": 1915} {"train_loss": -39.26240158081055, "global_step": 231763, "epoch": 1915} {"train_loss": -40.901458740234375, "global_step": 231764, "epoch": 1915} {"train_loss": -41.906036376953125, "global_step": 231765, "epoch": 1915} {"train_loss": -40.22808837890625, "global_step": 231766, "epoch": 1915} {"train_loss": -41.673274993896484, "global_step": 231767, "epoch": 1915} {"train_loss": -41.376930236816406, "global_step": 231768, "epoch": 1915} {"train_loss": -41.36127853393555, "global_step": 231769, "epoch": 1915} {"train_loss": -41.376197814941406, "global_step": 231770, "epoch": 1915} {"train_loss": -41.68240737915039, "global_step": 231771, "epoch": 1915} {"train_loss": -41.89605712890625, "global_step": 231772, "epoch": 1915} {"train_loss": -40.9004020690918, "global_step": 231773, "epoch": 1915} {"train_loss": -41.252254486083984, "global_step": 231774, "epoch": 1915} {"train_loss": -41.6971549987793, "global_step": 231775, "epoch": 1915} {"train_loss": -41.3709831237793, "global_step": 231776, "epoch": 1915} {"train_loss": -40.80381393432617, "global_step": 231777, "epoch": 1915} {"train_loss": -42.26678466796875, "global_step": 231778, "epoch": 1915} {"train_loss": -42.320823669433594, "global_step": 231779, "epoch": 1915} {"train_loss": -40.821292877197266, "global_step": 231780, "epoch": 1915} {"train_loss": -41.688507080078125, "global_step": 231781, "epoch": 1915} {"train_loss": -42.06626510620117, "global_step": 231782, "epoch": 1915} {"train_loss": -41.389835357666016, "global_step": 231783, "epoch": 1915} {"train_loss": -39.897518157958984, "global_step": 231784, "epoch": 1915} {"train_loss": -41.53019332885742, "global_step": 231785, "epoch": 1915} {"train_loss": -42.00198745727539, "global_step": 231786, "epoch": 1915} {"train_loss": -41.03215789794922, "global_step": 231787, "epoch": 1915} {"train_loss": -40.86514663696289, "global_step": 231788, "epoch": 1915} {"train_loss": -42.38859939575195, "global_step": 231789, "epoch": 1915} {"train_loss": -41.37793731689453, "global_step": 231790, "epoch": 1915} {"train_loss": -41.28865051269531, "global_step": 231791, "epoch": 1915} {"train_loss": -42.71108627319336, "global_step": 231792, "epoch": 1915} {"train_loss": -41.90770721435547, "global_step": 231793, "epoch": 1915} {"train_loss": -41.89207077026367, "global_step": 231794, "epoch": 1915} {"train_loss": -41.901607513427734, "global_step": 231795, "epoch": 1915} {"train_loss": -42.795047760009766, "global_step": 231796, "epoch": 1915} {"train_loss": -42.08905029296875, "global_step": 231797, "epoch": 1915} {"train_loss": -42.29030990600586, "global_step": 231798, "epoch": 1915} {"train_loss": -42.955078125, "global_step": 231799, "epoch": 1915} {"train_loss": -42.62259292602539, "global_step": 231800, "epoch": 1915} {"train_loss": -42.59827423095703, "global_step": 231801, "epoch": 1915} {"train_loss": -42.9245719909668, "global_step": 231802, "epoch": 1915} {"train_loss": -43.08137512207031, "global_step": 231803, "epoch": 1915} {"train_loss": -42.64180374145508, "global_step": 231804, "epoch": 1915} {"train_loss": -42.198848724365234, "global_step": 231805, "epoch": 1915} {"train_loss": -41.80898666381836, "global_step": 231806, "epoch": 1915} {"train_loss": -42.13941192626953, "global_step": 231807, "epoch": 1915} {"train_loss": -42.67999267578125, "global_step": 231808, "epoch": 1915} {"train_loss": -41.977935791015625, "global_step": 231809, "epoch": 1915} {"train_loss": -42.63660430908203, "global_step": 231810, "epoch": 1915} {"train_loss": -42.794158935546875, "global_step": 231811, "epoch": 1915} {"train_loss": -42.105133056640625, "global_step": 231812, "epoch": 1915} {"train_loss": -41.3141975402832, "global_step": 231813, "epoch": 1915} {"train_loss": -41.217681884765625, "global_step": 231814, "epoch": 1915} {"train_loss": -41.97739791870117, "global_step": 231815, "epoch": 1915} {"train_loss": -42.62424850463867, "global_step": 231816, "epoch": 1915} {"train_loss": -41.77577590942383, "global_step": 231817, "epoch": 1915} {"train_loss": -42.663185119628906, "global_step": 231818, "epoch": 1915} {"train_loss": -41.02788162231445, "global_step": 231819, "epoch": 1915} {"train_loss": -37.95633316040039, "global_step": 231820, "epoch": 1915} {"train_loss": -35.289485931396484, "global_step": 231821, "epoch": 1915} {"train_loss": -31.326364517211914, "global_step": 231822, "epoch": 1915} {"train_loss": -40.329341888427734, "global_step": 231823, "epoch": 1915} {"train_loss": -39.53865051269531, "global_step": 231824, "epoch": 1915} {"train_loss": -31.644514083862305, "global_step": 231825, "epoch": 1915} {"train_loss": -32.48683547973633, "global_step": 231826, "epoch": 1915} {"train_loss": -36.487361907958984, "global_step": 231827, "epoch": 1915} {"train_loss": -37.21318435668945, "global_step": 231828, "epoch": 1915} {"train_loss": -37.62646484375, "global_step": 231829, "epoch": 1915} {"train_loss": -38.57343673706055, "global_step": 231830, "epoch": 1915} {"train_loss": -38.19942092895508, "global_step": 231831, "epoch": 1915} {"train_loss": -39.31782531738281, "global_step": 231832, "epoch": 1915} {"train_loss": -38.24735641479492, "global_step": 231833, "epoch": 1915} {"train_loss": -38.61708068847656, "global_step": 231834, "epoch": 1915} {"train_loss": -40.49192075492922, "global_step": 231835, "epoch": 1915, "val_loss": 2579014.75} {"train_loss": -40.29852294921875, "global_step": 231836, "epoch": 1916} {"train_loss": -38.87944030761719, "global_step": 231837, "epoch": 1916} {"train_loss": -40.72823715209961, "global_step": 231838, "epoch": 1916} {"train_loss": -39.14792251586914, "global_step": 231839, "epoch": 1916} {"train_loss": -38.93614959716797, "global_step": 231840, "epoch": 1916} {"train_loss": -40.93949508666992, "global_step": 231841, "epoch": 1916} {"train_loss": -39.527984619140625, "global_step": 231842, "epoch": 1916} {"train_loss": -41.58319854736328, "global_step": 231843, "epoch": 1916} {"train_loss": -39.78257369995117, "global_step": 231844, "epoch": 1916} {"train_loss": -40.976531982421875, "global_step": 231845, "epoch": 1916} {"train_loss": -41.285091400146484, "global_step": 231846, "epoch": 1916} {"train_loss": -40.75142288208008, "global_step": 231847, "epoch": 1916} {"train_loss": -41.37144088745117, "global_step": 231848, "epoch": 1916} {"train_loss": -40.794368743896484, "global_step": 231849, "epoch": 1916} {"train_loss": -40.94783401489258, "global_step": 231850, "epoch": 1916} {"train_loss": -41.114139556884766, "global_step": 231851, "epoch": 1916} {"train_loss": -41.296993255615234, "global_step": 231852, "epoch": 1916} {"train_loss": -41.24396514892578, "global_step": 231853, "epoch": 1916} {"train_loss": -41.721832275390625, "global_step": 231854, "epoch": 1916} {"train_loss": -41.87146759033203, "global_step": 231855, "epoch": 1916} {"train_loss": -41.359920501708984, "global_step": 231856, "epoch": 1916} {"train_loss": -42.37843322753906, "global_step": 231857, "epoch": 1916} {"train_loss": -41.37043380737305, "global_step": 231858, "epoch": 1916} {"train_loss": -42.2457389831543, "global_step": 231859, "epoch": 1916} {"train_loss": -41.75556182861328, "global_step": 231860, "epoch": 1916} {"train_loss": -41.898155212402344, "global_step": 231861, "epoch": 1916} {"train_loss": -41.58369064331055, "global_step": 231862, "epoch": 1916} {"train_loss": -41.77581787109375, "global_step": 231863, "epoch": 1916} {"train_loss": -41.87791061401367, "global_step": 231864, "epoch": 1916} {"train_loss": -41.58644485473633, "global_step": 231865, "epoch": 1916} {"train_loss": -42.35713577270508, "global_step": 231866, "epoch": 1916} {"train_loss": -41.17869567871094, "global_step": 231867, "epoch": 1916} {"train_loss": -42.03901290893555, "global_step": 231868, "epoch": 1916} {"train_loss": -40.852298736572266, "global_step": 231869, "epoch": 1916} {"train_loss": -42.043304443359375, "global_step": 231870, "epoch": 1916} {"train_loss": -42.048095703125, "global_step": 231871, "epoch": 1916} {"train_loss": -42.42818832397461, "global_step": 231872, "epoch": 1916} {"train_loss": -42.15348434448242, "global_step": 231873, "epoch": 1916} {"train_loss": -41.30984115600586, "global_step": 231874, "epoch": 1916} {"train_loss": -42.768917083740234, "global_step": 231875, "epoch": 1916} {"train_loss": -41.269615173339844, "global_step": 231876, "epoch": 1916} {"train_loss": -41.85710144042969, "global_step": 231877, "epoch": 1916} {"train_loss": -41.93443298339844, "global_step": 231878, "epoch": 1916} {"train_loss": -42.171852111816406, "global_step": 231879, "epoch": 1916} {"train_loss": -42.07087707519531, "global_step": 231880, "epoch": 1916} {"train_loss": -41.86829376220703, "global_step": 231881, "epoch": 1916} {"train_loss": -42.34952163696289, "global_step": 231882, "epoch": 1916} {"train_loss": -41.79841995239258, "global_step": 231883, "epoch": 1916} {"train_loss": -42.321285247802734, "global_step": 231884, "epoch": 1916} {"train_loss": -42.09839630126953, "global_step": 231885, "epoch": 1916} {"train_loss": -42.125755310058594, "global_step": 231886, "epoch": 1916} {"train_loss": -42.508338928222656, "global_step": 231887, "epoch": 1916} {"train_loss": -42.00689697265625, "global_step": 231888, "epoch": 1916} {"train_loss": -42.806087493896484, "global_step": 231889, "epoch": 1916} {"train_loss": -42.01870346069336, "global_step": 231890, "epoch": 1916} {"train_loss": -42.3236083984375, "global_step": 231891, "epoch": 1916} {"train_loss": -42.932804107666016, "global_step": 231892, "epoch": 1916} {"train_loss": -42.611385345458984, "global_step": 231893, "epoch": 1916} {"train_loss": -42.47822189331055, "global_step": 231894, "epoch": 1916} {"train_loss": -42.85036087036133, "global_step": 231895, "epoch": 1916} {"train_loss": -42.633602142333984, "global_step": 231896, "epoch": 1916} {"train_loss": -42.65043258666992, "global_step": 231897, "epoch": 1916} {"train_loss": -42.55867004394531, "global_step": 231898, "epoch": 1916} {"train_loss": -42.640899658203125, "global_step": 231899, "epoch": 1916} {"train_loss": -43.02555847167969, "global_step": 231900, "epoch": 1916} {"train_loss": -42.93209457397461, "global_step": 231901, "epoch": 1916} {"train_loss": -42.29348373413086, "global_step": 231902, "epoch": 1916} {"train_loss": -42.81819152832031, "global_step": 231903, "epoch": 1916} {"train_loss": -42.540626525878906, "global_step": 231904, "epoch": 1916} {"train_loss": -42.8079833984375, "global_step": 231905, "epoch": 1916} {"train_loss": -42.0211296081543, "global_step": 231906, "epoch": 1916} {"train_loss": -42.8311653137207, "global_step": 231907, "epoch": 1916} {"train_loss": -42.661529541015625, "global_step": 231908, "epoch": 1916} {"train_loss": -42.880123138427734, "global_step": 231909, "epoch": 1916} {"train_loss": -42.613338470458984, "global_step": 231910, "epoch": 1916} {"train_loss": -42.685543060302734, "global_step": 231911, "epoch": 1916} {"train_loss": -43.010005950927734, "global_step": 231912, "epoch": 1916} {"train_loss": -42.99546813964844, "global_step": 231913, "epoch": 1916} {"train_loss": -42.37096405029297, "global_step": 231914, "epoch": 1916} {"train_loss": -42.45231246948242, "global_step": 231915, "epoch": 1916} {"train_loss": -41.01568603515625, "global_step": 231916, "epoch": 1916} {"train_loss": -41.99396514892578, "global_step": 231917, "epoch": 1916} {"train_loss": -42.21210861206055, "global_step": 231918, "epoch": 1916} {"train_loss": -42.96087646484375, "global_step": 231919, "epoch": 1916} {"train_loss": -42.33748245239258, "global_step": 231920, "epoch": 1916} {"train_loss": -42.731624603271484, "global_step": 231921, "epoch": 1916} {"train_loss": -42.19580078125, "global_step": 231922, "epoch": 1916} {"train_loss": -42.687843322753906, "global_step": 231923, "epoch": 1916} {"train_loss": -42.31748580932617, "global_step": 231924, "epoch": 1916} {"train_loss": -42.01963424682617, "global_step": 231925, "epoch": 1916} {"train_loss": -42.15036392211914, "global_step": 231926, "epoch": 1916} {"train_loss": -42.707881927490234, "global_step": 231927, "epoch": 1916} {"train_loss": -42.55633544921875, "global_step": 231928, "epoch": 1916} {"train_loss": -41.993648529052734, "global_step": 231929, "epoch": 1916} {"train_loss": -40.84151840209961, "global_step": 231930, "epoch": 1916} {"train_loss": -41.43352508544922, "global_step": 231931, "epoch": 1916} {"train_loss": -41.80994415283203, "global_step": 231932, "epoch": 1916} {"train_loss": -42.65913009643555, "global_step": 231933, "epoch": 1916} {"train_loss": -41.658302307128906, "global_step": 231934, "epoch": 1916} {"train_loss": -40.17950439453125, "global_step": 231935, "epoch": 1916} {"train_loss": -40.4692268371582, "global_step": 231936, "epoch": 1916} {"train_loss": -40.9822998046875, "global_step": 231937, "epoch": 1916} {"train_loss": -40.65864944458008, "global_step": 231938, "epoch": 1916} {"train_loss": -40.96403121948242, "global_step": 231939, "epoch": 1916} {"train_loss": -40.29899215698242, "global_step": 231940, "epoch": 1916} {"train_loss": -41.555171966552734, "global_step": 231941, "epoch": 1916} {"train_loss": -41.919273376464844, "global_step": 231942, "epoch": 1916} {"train_loss": -39.63535690307617, "global_step": 231943, "epoch": 1916} {"train_loss": -38.35503387451172, "global_step": 231944, "epoch": 1916} {"train_loss": -41.39943313598633, "global_step": 231945, "epoch": 1916} {"train_loss": -42.12141036987305, "global_step": 231946, "epoch": 1916} {"train_loss": -39.890689849853516, "global_step": 231947, "epoch": 1916} {"train_loss": -42.07936477661133, "global_step": 231948, "epoch": 1916} {"train_loss": -41.81950378417969, "global_step": 231949, "epoch": 1916} {"train_loss": -41.26846694946289, "global_step": 231950, "epoch": 1916} {"train_loss": -42.107479095458984, "global_step": 231951, "epoch": 1916} {"train_loss": -42.206634521484375, "global_step": 231952, "epoch": 1916} {"train_loss": -41.97800827026367, "global_step": 231953, "epoch": 1916} {"train_loss": -42.500728607177734, "global_step": 231954, "epoch": 1916} {"train_loss": -42.48894119262695, "global_step": 231955, "epoch": 1916} {"train_loss": -41.7845166103899, "global_step": 231956, "epoch": 1916, "val_loss": 2565984.75} {"train_loss": -42.79171371459961, "global_step": 231957, "epoch": 1917} {"train_loss": -42.03815841674805, "global_step": 231958, "epoch": 1917} {"train_loss": -41.79429244995117, "global_step": 231959, "epoch": 1917} {"train_loss": -42.46647262573242, "global_step": 231960, "epoch": 1917} {"train_loss": -42.55707931518555, "global_step": 231961, "epoch": 1917} {"train_loss": -42.02964401245117, "global_step": 231962, "epoch": 1917} {"train_loss": -42.65252685546875, "global_step": 231963, "epoch": 1917} {"train_loss": -42.30039596557617, "global_step": 231964, "epoch": 1917} {"train_loss": -42.17334747314453, "global_step": 231965, "epoch": 1917} {"train_loss": -42.12946701049805, "global_step": 231966, "epoch": 1917} {"train_loss": -42.57046127319336, "global_step": 231967, "epoch": 1917} {"train_loss": -41.86246871948242, "global_step": 231968, "epoch": 1917} {"train_loss": -42.41150665283203, "global_step": 231969, "epoch": 1917} {"train_loss": -42.74905014038086, "global_step": 231970, "epoch": 1917} {"train_loss": -41.94100570678711, "global_step": 231971, "epoch": 1917} {"train_loss": -41.52385330200195, "global_step": 231972, "epoch": 1917} {"train_loss": -42.76901626586914, "global_step": 231973, "epoch": 1917} {"train_loss": -41.05696487426758, "global_step": 231974, "epoch": 1917} {"train_loss": -42.290985107421875, "global_step": 231975, "epoch": 1917} {"train_loss": -43.03916549682617, "global_step": 231976, "epoch": 1917} {"train_loss": -42.12343978881836, "global_step": 231977, "epoch": 1917} {"train_loss": -41.80086898803711, "global_step": 231978, "epoch": 1917} {"train_loss": -41.61466598510742, "global_step": 231979, "epoch": 1917} {"train_loss": -41.62726974487305, "global_step": 231980, "epoch": 1917} {"train_loss": -41.51850128173828, "global_step": 231981, "epoch": 1917} {"train_loss": -42.58673858642578, "global_step": 231982, "epoch": 1917} {"train_loss": -41.56230926513672, "global_step": 231983, "epoch": 1917} {"train_loss": -40.72462844848633, "global_step": 231984, "epoch": 1917} {"train_loss": -41.05147171020508, "global_step": 231985, "epoch": 1917} {"train_loss": -41.39711380004883, "global_step": 231986, "epoch": 1917} {"train_loss": -42.58716583251953, "global_step": 231987, "epoch": 1917} {"train_loss": -40.225765228271484, "global_step": 231988, "epoch": 1917} {"train_loss": -38.777191162109375, "global_step": 231989, "epoch": 1917} {"train_loss": -41.274635314941406, "global_step": 231990, "epoch": 1917} {"train_loss": -40.61457061767578, "global_step": 231991, "epoch": 1917} {"train_loss": -39.19161605834961, "global_step": 231992, "epoch": 1917} {"train_loss": -36.634334564208984, "global_step": 231993, "epoch": 1917} {"train_loss": -40.56004333496094, "global_step": 231994, "epoch": 1917} {"train_loss": -42.07770538330078, "global_step": 231995, "epoch": 1917} {"train_loss": -39.25593948364258, "global_step": 231996, "epoch": 1917} {"train_loss": -38.64310836791992, "global_step": 231997, "epoch": 1917} {"train_loss": -41.09840774536133, "global_step": 231998, "epoch": 1917} {"train_loss": -40.50889587402344, "global_step": 231999, "epoch": 1917} {"train_loss": -38.70527267456055, "global_step": 232000, "epoch": 1917} {"train_loss": -41.050567626953125, "global_step": 232001, "epoch": 1917} {"train_loss": -39.40121078491211, "global_step": 232002, "epoch": 1917} {"train_loss": -37.50070571899414, "global_step": 232003, "epoch": 1917} {"train_loss": -41.052520751953125, "global_step": 232004, "epoch": 1917} {"train_loss": -40.03335189819336, "global_step": 232005, "epoch": 1917} {"train_loss": -39.61346435546875, "global_step": 232006, "epoch": 1917} {"train_loss": -41.41847610473633, "global_step": 232007, "epoch": 1917} {"train_loss": -40.17544174194336, "global_step": 232008, "epoch": 1917} {"train_loss": -40.90083312988281, "global_step": 232009, "epoch": 1917} {"train_loss": -41.099666595458984, "global_step": 232010, "epoch": 1917} {"train_loss": -38.64350509643555, "global_step": 232011, "epoch": 1917} {"train_loss": -40.811431884765625, "global_step": 232012, "epoch": 1917} {"train_loss": -41.041358947753906, "global_step": 232013, "epoch": 1917} {"train_loss": -39.994537353515625, "global_step": 232014, "epoch": 1917} {"train_loss": -41.296966552734375, "global_step": 232015, "epoch": 1917} {"train_loss": -40.433902740478516, "global_step": 232016, "epoch": 1917} {"train_loss": -41.50168228149414, "global_step": 232017, "epoch": 1917} {"train_loss": -41.2736930847168, "global_step": 232018, "epoch": 1917} {"train_loss": -41.78955841064453, "global_step": 232019, "epoch": 1917} {"train_loss": -40.7502555847168, "global_step": 232020, "epoch": 1917} {"train_loss": -42.02378463745117, "global_step": 232021, "epoch": 1917} {"train_loss": -41.14873123168945, "global_step": 232022, "epoch": 1917} {"train_loss": -41.988155364990234, "global_step": 232023, "epoch": 1917} {"train_loss": -41.93924331665039, "global_step": 232024, "epoch": 1917} {"train_loss": -41.35079574584961, "global_step": 232025, "epoch": 1917} {"train_loss": -41.72376251220703, "global_step": 232026, "epoch": 1917} {"train_loss": -42.21649932861328, "global_step": 232027, "epoch": 1917} {"train_loss": -41.753292083740234, "global_step": 232028, "epoch": 1917} {"train_loss": -42.19232177734375, "global_step": 232029, "epoch": 1917} {"train_loss": -41.11562728881836, "global_step": 232030, "epoch": 1917} {"train_loss": -41.89970779418945, "global_step": 232031, "epoch": 1917} {"train_loss": -42.02513885498047, "global_step": 232032, "epoch": 1917} {"train_loss": -41.83688735961914, "global_step": 232033, "epoch": 1917} {"train_loss": -42.06348419189453, "global_step": 232034, "epoch": 1917} {"train_loss": -42.25661849975586, "global_step": 232035, "epoch": 1917} {"train_loss": -42.53983688354492, "global_step": 232036, "epoch": 1917} {"train_loss": -42.05587387084961, "global_step": 232037, "epoch": 1917} {"train_loss": -42.35233688354492, "global_step": 232038, "epoch": 1917} {"train_loss": -42.202552795410156, "global_step": 232039, "epoch": 1917} {"train_loss": -42.45847702026367, "global_step": 232040, "epoch": 1917} {"train_loss": -42.484352111816406, "global_step": 232041, "epoch": 1917} {"train_loss": -42.7251091003418, "global_step": 232042, "epoch": 1917} {"train_loss": -42.63649368286133, "global_step": 232043, "epoch": 1917} {"train_loss": -42.22350311279297, "global_step": 232044, "epoch": 1917} {"train_loss": -42.74911117553711, "global_step": 232045, "epoch": 1917} {"train_loss": -42.92995834350586, "global_step": 232046, "epoch": 1917} {"train_loss": -42.65814208984375, "global_step": 232047, "epoch": 1917} {"train_loss": -42.75642013549805, "global_step": 232048, "epoch": 1917} {"train_loss": -42.02431106567383, "global_step": 232049, "epoch": 1917} {"train_loss": -42.447383880615234, "global_step": 232050, "epoch": 1917} {"train_loss": -42.3681755065918, "global_step": 232051, "epoch": 1917} {"train_loss": -42.36143112182617, "global_step": 232052, "epoch": 1917} {"train_loss": -42.54189682006836, "global_step": 232053, "epoch": 1917} {"train_loss": -42.209869384765625, "global_step": 232054, "epoch": 1917} {"train_loss": -42.8411979675293, "global_step": 232055, "epoch": 1917} {"train_loss": -43.014217376708984, "global_step": 232056, "epoch": 1917} {"train_loss": -42.51736068725586, "global_step": 232057, "epoch": 1917} {"train_loss": -42.77621078491211, "global_step": 232058, "epoch": 1917} {"train_loss": -43.019012451171875, "global_step": 232059, "epoch": 1917} {"train_loss": -42.374996185302734, "global_step": 232060, "epoch": 1917} {"train_loss": -42.690425872802734, "global_step": 232061, "epoch": 1917} {"train_loss": -42.36770248413086, "global_step": 232062, "epoch": 1917} {"train_loss": -41.52085876464844, "global_step": 232063, "epoch": 1917} {"train_loss": -41.273712158203125, "global_step": 232064, "epoch": 1917} {"train_loss": -43.20563888549805, "global_step": 232065, "epoch": 1917} {"train_loss": -41.75972366333008, "global_step": 232066, "epoch": 1917} {"train_loss": -42.358882904052734, "global_step": 232067, "epoch": 1917} {"train_loss": -41.73524856567383, "global_step": 232068, "epoch": 1917} {"train_loss": -42.603206634521484, "global_step": 232069, "epoch": 1917} {"train_loss": -42.39511489868164, "global_step": 232070, "epoch": 1917} {"train_loss": -42.494232177734375, "global_step": 232071, "epoch": 1917} {"train_loss": -42.68197250366211, "global_step": 232072, "epoch": 1917} {"train_loss": -42.8504524230957, "global_step": 232073, "epoch": 1917} {"train_loss": -43.46421813964844, "global_step": 232074, "epoch": 1917} {"train_loss": -42.41093444824219, "global_step": 232075, "epoch": 1917} {"train_loss": -42.026607513427734, "global_step": 232076, "epoch": 1917} {"train_loss": -41.67046163889987, "global_step": 232077, "epoch": 1917, "val_loss": 2638092.25} {"train_loss": -42.1364860534668, "global_step": 232078, "epoch": 1918} {"train_loss": -40.21024703979492, "global_step": 232079, "epoch": 1918} {"train_loss": -41.8458366394043, "global_step": 232080, "epoch": 1918} {"train_loss": -41.72508239746094, "global_step": 232081, "epoch": 1918} {"train_loss": -41.3573112487793, "global_step": 232082, "epoch": 1918} {"train_loss": -40.61738586425781, "global_step": 232083, "epoch": 1918} {"train_loss": -42.22298049926758, "global_step": 232084, "epoch": 1918} {"train_loss": -40.87532424926758, "global_step": 232085, "epoch": 1918} {"train_loss": -40.485652923583984, "global_step": 232086, "epoch": 1918} {"train_loss": -40.50707244873047, "global_step": 232087, "epoch": 1918} {"train_loss": -42.24760055541992, "global_step": 232088, "epoch": 1918} {"train_loss": -40.187408447265625, "global_step": 232089, "epoch": 1918} {"train_loss": -39.838130950927734, "global_step": 232090, "epoch": 1918} {"train_loss": -41.83798599243164, "global_step": 232091, "epoch": 1918} {"train_loss": -38.77714157104492, "global_step": 232092, "epoch": 1918} {"train_loss": -40.0307731628418, "global_step": 232093, "epoch": 1918} {"train_loss": -42.12667465209961, "global_step": 232094, "epoch": 1918} {"train_loss": -37.946678161621094, "global_step": 232095, "epoch": 1918} {"train_loss": -41.37200164794922, "global_step": 232096, "epoch": 1918} {"train_loss": -40.6907844543457, "global_step": 232097, "epoch": 1918} {"train_loss": -40.5247917175293, "global_step": 232098, "epoch": 1918} {"train_loss": -41.46699523925781, "global_step": 232099, "epoch": 1918} {"train_loss": -41.53691864013672, "global_step": 232100, "epoch": 1918} {"train_loss": -41.00514221191406, "global_step": 232101, "epoch": 1918} {"train_loss": -42.1500358581543, "global_step": 232102, "epoch": 1918} {"train_loss": -41.11787414550781, "global_step": 232103, "epoch": 1918} {"train_loss": -42.13411331176758, "global_step": 232104, "epoch": 1918} {"train_loss": -41.71604537963867, "global_step": 232105, "epoch": 1918} {"train_loss": -41.1388053894043, "global_step": 232106, "epoch": 1918} {"train_loss": -42.75739669799805, "global_step": 232107, "epoch": 1918} {"train_loss": -41.801517486572266, "global_step": 232108, "epoch": 1918} {"train_loss": -39.7887077331543, "global_step": 232109, "epoch": 1918} {"train_loss": -42.03252410888672, "global_step": 232110, "epoch": 1918} {"train_loss": -41.8771858215332, "global_step": 232111, "epoch": 1918} {"train_loss": -42.198707580566406, "global_step": 232112, "epoch": 1918} {"train_loss": -41.69570541381836, "global_step": 232113, "epoch": 1918} {"train_loss": -42.25726318359375, "global_step": 232114, "epoch": 1918} {"train_loss": -42.11601638793945, "global_step": 232115, "epoch": 1918} {"train_loss": -41.55976104736328, "global_step": 232116, "epoch": 1918} {"train_loss": -41.1847038269043, "global_step": 232117, "epoch": 1918} {"train_loss": -41.78266143798828, "global_step": 232118, "epoch": 1918} {"train_loss": -39.71781921386719, "global_step": 232119, "epoch": 1918} {"train_loss": -41.09389877319336, "global_step": 232120, "epoch": 1918} {"train_loss": -41.7054557800293, "global_step": 232121, "epoch": 1918} {"train_loss": -42.234718322753906, "global_step": 232122, "epoch": 1918} {"train_loss": -37.3922119140625, "global_step": 232123, "epoch": 1918} {"train_loss": -40.741485595703125, "global_step": 232124, "epoch": 1918} {"train_loss": -42.542327880859375, "global_step": 232125, "epoch": 1918} {"train_loss": -41.67764663696289, "global_step": 232126, "epoch": 1918} {"train_loss": -41.57950973510742, "global_step": 232127, "epoch": 1918} {"train_loss": -41.88300704956055, "global_step": 232128, "epoch": 1918} {"train_loss": -42.253536224365234, "global_step": 232129, "epoch": 1918} {"train_loss": -40.812992095947266, "global_step": 232130, "epoch": 1918} {"train_loss": -40.87506103515625, "global_step": 232131, "epoch": 1918} {"train_loss": -40.805973052978516, "global_step": 232132, "epoch": 1918} {"train_loss": -39.55792236328125, "global_step": 232133, "epoch": 1918} {"train_loss": -41.34978103637695, "global_step": 232134, "epoch": 1918} {"train_loss": -42.798828125, "global_step": 232135, "epoch": 1918} {"train_loss": -42.03782272338867, "global_step": 232136, "epoch": 1918} {"train_loss": -41.966217041015625, "global_step": 232137, "epoch": 1918} {"train_loss": -42.01701736450195, "global_step": 232138, "epoch": 1918} {"train_loss": -40.693031311035156, "global_step": 232139, "epoch": 1918} {"train_loss": -41.651302337646484, "global_step": 232140, "epoch": 1918} {"train_loss": -42.46100616455078, "global_step": 232141, "epoch": 1918} {"train_loss": -41.65673828125, "global_step": 232142, "epoch": 1918} {"train_loss": -40.59583282470703, "global_step": 232143, "epoch": 1918} {"train_loss": -41.53993606567383, "global_step": 232144, "epoch": 1918} {"train_loss": -42.59385299682617, "global_step": 232145, "epoch": 1918} {"train_loss": -42.6408805847168, "global_step": 232146, "epoch": 1918} {"train_loss": -40.9107780456543, "global_step": 232147, "epoch": 1918} {"train_loss": -40.01255798339844, "global_step": 232148, "epoch": 1918} {"train_loss": -41.63471603393555, "global_step": 232149, "epoch": 1918} {"train_loss": -40.51211929321289, "global_step": 232150, "epoch": 1918} {"train_loss": -41.508216857910156, "global_step": 232151, "epoch": 1918} {"train_loss": -41.95253372192383, "global_step": 232152, "epoch": 1918} {"train_loss": -41.94014358520508, "global_step": 232153, "epoch": 1918} {"train_loss": -41.59450149536133, "global_step": 232154, "epoch": 1918} {"train_loss": -41.383392333984375, "global_step": 232155, "epoch": 1918} {"train_loss": -41.575706481933594, "global_step": 232156, "epoch": 1918} {"train_loss": -41.202178955078125, "global_step": 232157, "epoch": 1918} {"train_loss": -41.925716400146484, "global_step": 232158, "epoch": 1918} {"train_loss": -41.82169723510742, "global_step": 232159, "epoch": 1918} {"train_loss": -37.52808380126953, "global_step": 232160, "epoch": 1918} {"train_loss": -42.35784912109375, "global_step": 232161, "epoch": 1918} {"train_loss": -42.65522766113281, "global_step": 232162, "epoch": 1918} {"train_loss": -42.0157470703125, "global_step": 232163, "epoch": 1918} {"train_loss": -41.84475326538086, "global_step": 232164, "epoch": 1918} {"train_loss": -35.00150680541992, "global_step": 232165, "epoch": 1918} {"train_loss": -41.335567474365234, "global_step": 232166, "epoch": 1918} {"train_loss": -41.14796829223633, "global_step": 232167, "epoch": 1918} {"train_loss": -42.30879211425781, "global_step": 232168, "epoch": 1918} {"train_loss": -41.74900436401367, "global_step": 232169, "epoch": 1918} {"train_loss": -41.997859954833984, "global_step": 232170, "epoch": 1918} {"train_loss": -41.879310607910156, "global_step": 232171, "epoch": 1918} {"train_loss": -41.19924545288086, "global_step": 232172, "epoch": 1918} {"train_loss": -42.00575637817383, "global_step": 232173, "epoch": 1918} {"train_loss": -41.748626708984375, "global_step": 232174, "epoch": 1918} {"train_loss": -39.07243728637695, "global_step": 232175, "epoch": 1918} {"train_loss": -41.18430709838867, "global_step": 232176, "epoch": 1918} {"train_loss": -34.86261749267578, "global_step": 232177, "epoch": 1918} {"train_loss": -38.75388717651367, "global_step": 232178, "epoch": 1918} {"train_loss": -40.4792594909668, "global_step": 232179, "epoch": 1918} {"train_loss": -36.55576705932617, "global_step": 232180, "epoch": 1918} {"train_loss": -38.5246696472168, "global_step": 232181, "epoch": 1918} {"train_loss": -41.379756927490234, "global_step": 232182, "epoch": 1918} {"train_loss": -34.57263946533203, "global_step": 232183, "epoch": 1918} {"train_loss": -39.69157409667969, "global_step": 232184, "epoch": 1918} {"train_loss": -37.15207290649414, "global_step": 232185, "epoch": 1918} {"train_loss": -41.398738861083984, "global_step": 232186, "epoch": 1918} {"train_loss": -37.05748748779297, "global_step": 232187, "epoch": 1918} {"train_loss": -40.51524353027344, "global_step": 232188, "epoch": 1918} {"train_loss": -39.190486907958984, "global_step": 232189, "epoch": 1918} {"train_loss": -40.5986442565918, "global_step": 232190, "epoch": 1918} {"train_loss": -40.51640701293945, "global_step": 232191, "epoch": 1918} {"train_loss": -39.06557846069336, "global_step": 232192, "epoch": 1918} {"train_loss": -40.643795013427734, "global_step": 232193, "epoch": 1918} {"train_loss": -40.979766845703125, "global_step": 232194, "epoch": 1918} {"train_loss": -38.48142623901367, "global_step": 232195, "epoch": 1918} {"train_loss": -41.39204406738281, "global_step": 232196, "epoch": 1918} {"train_loss": -40.200408935546875, "global_step": 232197, "epoch": 1918} {"train_loss": -40.88857250371255, "global_step": 232198, "epoch": 1918, "val_loss": 2597138.0} {"train_loss": -39.9283332824707, "global_step": 232199, "epoch": 1919} {"train_loss": -41.64274215698242, "global_step": 232200, "epoch": 1919} {"train_loss": -40.8213005065918, "global_step": 232201, "epoch": 1919} {"train_loss": -39.735652923583984, "global_step": 232202, "epoch": 1919} {"train_loss": -40.306880950927734, "global_step": 232203, "epoch": 1919} {"train_loss": -41.06919479370117, "global_step": 232204, "epoch": 1919} {"train_loss": -41.2005500793457, "global_step": 232205, "epoch": 1919} {"train_loss": -41.30107116699219, "global_step": 232206, "epoch": 1919} {"train_loss": -41.63386154174805, "global_step": 232207, "epoch": 1919} {"train_loss": -41.755409240722656, "global_step": 232208, "epoch": 1919} {"train_loss": -41.51673889160156, "global_step": 232209, "epoch": 1919} {"train_loss": -41.65047073364258, "global_step": 232210, "epoch": 1919} {"train_loss": -40.47853088378906, "global_step": 232211, "epoch": 1919} {"train_loss": -41.641441345214844, "global_step": 232212, "epoch": 1919} {"train_loss": -41.820953369140625, "global_step": 232213, "epoch": 1919} {"train_loss": -42.20563888549805, "global_step": 232214, "epoch": 1919} {"train_loss": -41.04216384887695, "global_step": 232215, "epoch": 1919} {"train_loss": -41.578460693359375, "global_step": 232216, "epoch": 1919} {"train_loss": -42.35976791381836, "global_step": 232217, "epoch": 1919} {"train_loss": -41.86518478393555, "global_step": 232218, "epoch": 1919} {"train_loss": -42.572608947753906, "global_step": 232219, "epoch": 1919} {"train_loss": -41.198055267333984, "global_step": 232220, "epoch": 1919} {"train_loss": -41.74338912963867, "global_step": 232221, "epoch": 1919} {"train_loss": -42.3216667175293, "global_step": 232222, "epoch": 1919} {"train_loss": -42.0773811340332, "global_step": 232223, "epoch": 1919} {"train_loss": -42.52702713012695, "global_step": 232224, "epoch": 1919} {"train_loss": -41.914058685302734, "global_step": 232225, "epoch": 1919} {"train_loss": -42.48433303833008, "global_step": 232226, "epoch": 1919} {"train_loss": -42.82218551635742, "global_step": 232227, "epoch": 1919} {"train_loss": -41.66472625732422, "global_step": 232228, "epoch": 1919} {"train_loss": -42.520294189453125, "global_step": 232229, "epoch": 1919} {"train_loss": -42.1224479675293, "global_step": 232230, "epoch": 1919} {"train_loss": -42.46128463745117, "global_step": 232231, "epoch": 1919} {"train_loss": -42.12548065185547, "global_step": 232232, "epoch": 1919} {"train_loss": -42.56476593017578, "global_step": 232233, "epoch": 1919} {"train_loss": -42.33707809448242, "global_step": 232234, "epoch": 1919} {"train_loss": -41.6265983581543, "global_step": 232235, "epoch": 1919} {"train_loss": -41.54395294189453, "global_step": 232236, "epoch": 1919} {"train_loss": -42.1622428894043, "global_step": 232237, "epoch": 1919} {"train_loss": -40.65065002441406, "global_step": 232238, "epoch": 1919} {"train_loss": -42.49699783325195, "global_step": 232239, "epoch": 1919} {"train_loss": -41.65714645385742, "global_step": 232240, "epoch": 1919} {"train_loss": -40.9349250793457, "global_step": 232241, "epoch": 1919} {"train_loss": -41.68233871459961, "global_step": 232242, "epoch": 1919} {"train_loss": -41.34168243408203, "global_step": 232243, "epoch": 1919} {"train_loss": -40.340511322021484, "global_step": 232244, "epoch": 1919} {"train_loss": -42.41218948364258, "global_step": 232245, "epoch": 1919} {"train_loss": -40.518455505371094, "global_step": 232246, "epoch": 1919} {"train_loss": -42.244911193847656, "global_step": 232247, "epoch": 1919} {"train_loss": -41.51223373413086, "global_step": 232248, "epoch": 1919} {"train_loss": -42.14652633666992, "global_step": 232249, "epoch": 1919} {"train_loss": -41.66227340698242, "global_step": 232250, "epoch": 1919} {"train_loss": -42.011383056640625, "global_step": 232251, "epoch": 1919} {"train_loss": -42.142330169677734, "global_step": 232252, "epoch": 1919} {"train_loss": -41.27016067504883, "global_step": 232253, "epoch": 1919} {"train_loss": -41.08063888549805, "global_step": 232254, "epoch": 1919} {"train_loss": -41.15664291381836, "global_step": 232255, "epoch": 1919} {"train_loss": -41.101192474365234, "global_step": 232256, "epoch": 1919} {"train_loss": -41.44804000854492, "global_step": 232257, "epoch": 1919} {"train_loss": -41.25234603881836, "global_step": 232258, "epoch": 1919} {"train_loss": -38.92573928833008, "global_step": 232259, "epoch": 1919} {"train_loss": -41.47466278076172, "global_step": 232260, "epoch": 1919} {"train_loss": -40.51610565185547, "global_step": 232261, "epoch": 1919} {"train_loss": -40.89078903198242, "global_step": 232262, "epoch": 1919} {"train_loss": -40.603023529052734, "global_step": 232263, "epoch": 1919} {"train_loss": -41.19125747680664, "global_step": 232264, "epoch": 1919} {"train_loss": -36.015045166015625, "global_step": 232265, "epoch": 1919} {"train_loss": -40.85311508178711, "global_step": 232266, "epoch": 1919} {"train_loss": -40.501277923583984, "global_step": 232267, "epoch": 1919} {"train_loss": -41.46294021606445, "global_step": 232268, "epoch": 1919} {"train_loss": -41.19028091430664, "global_step": 232269, "epoch": 1919} {"train_loss": -40.749267578125, "global_step": 232270, "epoch": 1919} {"train_loss": -41.4008903503418, "global_step": 232271, "epoch": 1919} {"train_loss": -41.795135498046875, "global_step": 232272, "epoch": 1919} {"train_loss": -40.11742401123047, "global_step": 232273, "epoch": 1919} {"train_loss": -39.524532318115234, "global_step": 232274, "epoch": 1919} {"train_loss": -41.112178802490234, "global_step": 232275, "epoch": 1919} {"train_loss": -41.40313720703125, "global_step": 232276, "epoch": 1919} {"train_loss": -41.100921630859375, "global_step": 232277, "epoch": 1919} {"train_loss": -40.37183380126953, "global_step": 232278, "epoch": 1919} {"train_loss": -42.08916091918945, "global_step": 232279, "epoch": 1919} {"train_loss": -40.375946044921875, "global_step": 232280, "epoch": 1919} {"train_loss": -41.17911148071289, "global_step": 232281, "epoch": 1919} {"train_loss": -40.05216598510742, "global_step": 232282, "epoch": 1919} {"train_loss": -42.177154541015625, "global_step": 232283, "epoch": 1919} {"train_loss": -41.53899383544922, "global_step": 232284, "epoch": 1919} {"train_loss": -39.72053909301758, "global_step": 232285, "epoch": 1919} {"train_loss": -40.2651481628418, "global_step": 232286, "epoch": 1919} {"train_loss": -41.83814239501953, "global_step": 232287, "epoch": 1919} {"train_loss": -41.29543685913086, "global_step": 232288, "epoch": 1919} {"train_loss": -38.653865814208984, "global_step": 232289, "epoch": 1919} {"train_loss": -39.94601821899414, "global_step": 232290, "epoch": 1919} {"train_loss": -40.240779876708984, "global_step": 232291, "epoch": 1919} {"train_loss": -40.82599639892578, "global_step": 232292, "epoch": 1919} {"train_loss": -40.89768600463867, "global_step": 232293, "epoch": 1919} {"train_loss": -40.865169525146484, "global_step": 232294, "epoch": 1919} {"train_loss": -39.46942138671875, "global_step": 232295, "epoch": 1919} {"train_loss": -41.16401290893555, "global_step": 232296, "epoch": 1919} {"train_loss": -40.923309326171875, "global_step": 232297, "epoch": 1919} {"train_loss": -40.65877914428711, "global_step": 232298, "epoch": 1919} {"train_loss": -40.288448333740234, "global_step": 232299, "epoch": 1919} {"train_loss": -41.64542770385742, "global_step": 232300, "epoch": 1919} {"train_loss": -41.5370979309082, "global_step": 232301, "epoch": 1919} {"train_loss": -42.54767990112305, "global_step": 232302, "epoch": 1919} {"train_loss": -42.21349334716797, "global_step": 232303, "epoch": 1919} {"train_loss": -36.39608383178711, "global_step": 232304, "epoch": 1919} {"train_loss": -40.074581146240234, "global_step": 232305, "epoch": 1919} {"train_loss": -41.91950225830078, "global_step": 232306, "epoch": 1919} {"train_loss": -41.74861145019531, "global_step": 232307, "epoch": 1919} {"train_loss": -38.631893157958984, "global_step": 232308, "epoch": 1919} {"train_loss": -40.91581344604492, "global_step": 232309, "epoch": 1919} {"train_loss": -40.58839797973633, "global_step": 232310, "epoch": 1919} {"train_loss": -34.59358596801758, "global_step": 232311, "epoch": 1919} {"train_loss": -41.17892074584961, "global_step": 232312, "epoch": 1919} {"train_loss": -40.70931625366211, "global_step": 232313, "epoch": 1919} {"train_loss": -40.184505462646484, "global_step": 232314, "epoch": 1919} {"train_loss": -40.9520263671875, "global_step": 232315, "epoch": 1919} {"train_loss": -39.08979797363281, "global_step": 232316, "epoch": 1919} {"train_loss": -31.428979873657227, "global_step": 232317, "epoch": 1919} {"train_loss": -40.2861213684082, "global_step": 232318, "epoch": 1919} {"train_loss": -40.95896131342108, "global_step": 232319, "epoch": 1919, "val_loss": 2597291.25} {"train_loss": -38.411094665527344, "global_step": 232320, "epoch": 1920} {"train_loss": -36.924983978271484, "global_step": 232321, "epoch": 1920} {"train_loss": -40.1644401550293, "global_step": 232322, "epoch": 1920} {"train_loss": -38.05107498168945, "global_step": 232323, "epoch": 1920} {"train_loss": -37.71805953979492, "global_step": 232324, "epoch": 1920} {"train_loss": -39.59204864501953, "global_step": 232325, "epoch": 1920} {"train_loss": -30.8337459564209, "global_step": 232326, "epoch": 1920} {"train_loss": -34.514827728271484, "global_step": 232327, "epoch": 1920} {"train_loss": -39.661529541015625, "global_step": 232328, "epoch": 1920} {"train_loss": -38.047752380371094, "global_step": 232329, "epoch": 1920} {"train_loss": -38.963619232177734, "global_step": 232330, "epoch": 1920} {"train_loss": -40.905181884765625, "global_step": 232331, "epoch": 1920} {"train_loss": -33.596336364746094, "global_step": 232332, "epoch": 1920} {"train_loss": -33.02850341796875, "global_step": 232333, "epoch": 1920} {"train_loss": -40.56814956665039, "global_step": 232334, "epoch": 1920} {"train_loss": -37.76633071899414, "global_step": 232335, "epoch": 1920} {"train_loss": -38.95397186279297, "global_step": 232336, "epoch": 1920} {"train_loss": -38.089996337890625, "global_step": 232337, "epoch": 1920} {"train_loss": -39.36923599243164, "global_step": 232338, "epoch": 1920} {"train_loss": -40.39292526245117, "global_step": 232339, "epoch": 1920} {"train_loss": -34.971519470214844, "global_step": 232340, "epoch": 1920} {"train_loss": -40.42564010620117, "global_step": 232341, "epoch": 1920} {"train_loss": -39.363094329833984, "global_step": 232342, "epoch": 1920} {"train_loss": -39.722869873046875, "global_step": 232343, "epoch": 1920} {"train_loss": -41.228973388671875, "global_step": 232344, "epoch": 1920} {"train_loss": -40.37582778930664, "global_step": 232345, "epoch": 1920} {"train_loss": -39.76949691772461, "global_step": 232346, "epoch": 1920} {"train_loss": -39.914405822753906, "global_step": 232347, "epoch": 1920} {"train_loss": -40.46196746826172, "global_step": 232348, "epoch": 1920} {"train_loss": -40.18360137939453, "global_step": 232349, "epoch": 1920} {"train_loss": -40.509891510009766, "global_step": 232350, "epoch": 1920} {"train_loss": -40.6085090637207, "global_step": 232351, "epoch": 1920} {"train_loss": -39.94987106323242, "global_step": 232352, "epoch": 1920} {"train_loss": -40.06061935424805, "global_step": 232353, "epoch": 1920} {"train_loss": -40.36338424682617, "global_step": 232354, "epoch": 1920} {"train_loss": -40.34223175048828, "global_step": 232355, "epoch": 1920} {"train_loss": -40.60540771484375, "global_step": 232356, "epoch": 1920} {"train_loss": -38.815731048583984, "global_step": 232357, "epoch": 1920} {"train_loss": -39.81929397583008, "global_step": 232358, "epoch": 1920} {"train_loss": -41.2482795715332, "global_step": 232359, "epoch": 1920} {"train_loss": -40.4010124206543, "global_step": 232360, "epoch": 1920} {"train_loss": -41.748504638671875, "global_step": 232361, "epoch": 1920} {"train_loss": -41.46355438232422, "global_step": 232362, "epoch": 1920} {"train_loss": -40.97629928588867, "global_step": 232363, "epoch": 1920} {"train_loss": -40.35844039916992, "global_step": 232364, "epoch": 1920} {"train_loss": -41.91572570800781, "global_step": 232365, "epoch": 1920} {"train_loss": -39.81913375854492, "global_step": 232366, "epoch": 1920} {"train_loss": -41.31570053100586, "global_step": 232367, "epoch": 1920} {"train_loss": -41.04462432861328, "global_step": 232368, "epoch": 1920} {"train_loss": -41.86322021484375, "global_step": 232369, "epoch": 1920} {"train_loss": -41.60602951049805, "global_step": 232370, "epoch": 1920} {"train_loss": -41.83411407470703, "global_step": 232371, "epoch": 1920} {"train_loss": -40.21780014038086, "global_step": 232372, "epoch": 1920} {"train_loss": -40.898887634277344, "global_step": 232373, "epoch": 1920} {"train_loss": -41.928829193115234, "global_step": 232374, "epoch": 1920} {"train_loss": -41.14541244506836, "global_step": 232375, "epoch": 1920} {"train_loss": -41.33246994018555, "global_step": 232376, "epoch": 1920} {"train_loss": -40.67681884765625, "global_step": 232377, "epoch": 1920} {"train_loss": -41.56892013549805, "global_step": 232378, "epoch": 1920} {"train_loss": -41.9387321472168, "global_step": 232379, "epoch": 1920} {"train_loss": -41.67856216430664, "global_step": 232380, "epoch": 1920} {"train_loss": -40.1366081237793, "global_step": 232381, "epoch": 1920} {"train_loss": -41.58270263671875, "global_step": 232382, "epoch": 1920} {"train_loss": -40.51829528808594, "global_step": 232383, "epoch": 1920} {"train_loss": -41.11412811279297, "global_step": 232384, "epoch": 1920} {"train_loss": -41.99451446533203, "global_step": 232385, "epoch": 1920} {"train_loss": -42.15595245361328, "global_step": 232386, "epoch": 1920} {"train_loss": -41.71002960205078, "global_step": 232387, "epoch": 1920} {"train_loss": -41.76800537109375, "global_step": 232388, "epoch": 1920} {"train_loss": -39.41019821166992, "global_step": 232389, "epoch": 1920} {"train_loss": -39.49123001098633, "global_step": 232390, "epoch": 1920} {"train_loss": -40.51241683959961, "global_step": 232391, "epoch": 1920} {"train_loss": -42.023345947265625, "global_step": 232392, "epoch": 1920} {"train_loss": -40.3982048034668, "global_step": 232393, "epoch": 1920} {"train_loss": -40.123687744140625, "global_step": 232394, "epoch": 1920} {"train_loss": -41.78596115112305, "global_step": 232395, "epoch": 1920} {"train_loss": -41.79251480102539, "global_step": 232396, "epoch": 1920} {"train_loss": -41.692230224609375, "global_step": 232397, "epoch": 1920} {"train_loss": -41.16196823120117, "global_step": 232398, "epoch": 1920} {"train_loss": -40.14957046508789, "global_step": 232399, "epoch": 1920} {"train_loss": -42.068519592285156, "global_step": 232400, "epoch": 1920} {"train_loss": -41.943363189697266, "global_step": 232401, "epoch": 1920} {"train_loss": -41.810943603515625, "global_step": 232402, "epoch": 1920} {"train_loss": -41.4372444152832, "global_step": 232403, "epoch": 1920} {"train_loss": -42.451534271240234, "global_step": 232404, "epoch": 1920} {"train_loss": -40.13676071166992, "global_step": 232405, "epoch": 1920} {"train_loss": -41.67072296142578, "global_step": 232406, "epoch": 1920} {"train_loss": -37.42304611206055, "global_step": 232407, "epoch": 1920} {"train_loss": -42.007606506347656, "global_step": 232408, "epoch": 1920} {"train_loss": -42.1305046081543, "global_step": 232409, "epoch": 1920} {"train_loss": -41.967342376708984, "global_step": 232410, "epoch": 1920} {"train_loss": -41.987274169921875, "global_step": 232411, "epoch": 1920} {"train_loss": -42.46024703979492, "global_step": 232412, "epoch": 1920} {"train_loss": -40.056121826171875, "global_step": 232413, "epoch": 1920} {"train_loss": -39.4857063293457, "global_step": 232414, "epoch": 1920} {"train_loss": -42.51947021484375, "global_step": 232415, "epoch": 1920} {"train_loss": -40.30703353881836, "global_step": 232416, "epoch": 1920} {"train_loss": -41.632965087890625, "global_step": 232417, "epoch": 1920} {"train_loss": -40.80154037475586, "global_step": 232418, "epoch": 1920} {"train_loss": -40.27244186401367, "global_step": 232419, "epoch": 1920} {"train_loss": -41.90203857421875, "global_step": 232420, "epoch": 1920} {"train_loss": -42.03281784057617, "global_step": 232421, "epoch": 1920} {"train_loss": -41.537357330322266, "global_step": 232422, "epoch": 1920} {"train_loss": -41.8968505859375, "global_step": 232423, "epoch": 1920} {"train_loss": -39.743648529052734, "global_step": 232424, "epoch": 1920} {"train_loss": -41.18803787231445, "global_step": 232425, "epoch": 1920} {"train_loss": -40.5771484375, "global_step": 232426, "epoch": 1920} {"train_loss": -40.61428451538086, "global_step": 232427, "epoch": 1920} {"train_loss": -41.48101806640625, "global_step": 232428, "epoch": 1920} {"train_loss": -39.27956008911133, "global_step": 232429, "epoch": 1920} {"train_loss": -41.68534469604492, "global_step": 232430, "epoch": 1920} {"train_loss": -39.03242111206055, "global_step": 232431, "epoch": 1920} {"train_loss": -41.46455383300781, "global_step": 232432, "epoch": 1920} {"train_loss": -41.36732864379883, "global_step": 232433, "epoch": 1920} {"train_loss": -40.471736907958984, "global_step": 232434, "epoch": 1920} {"train_loss": -39.528114318847656, "global_step": 232435, "epoch": 1920} {"train_loss": -41.01020050048828, "global_step": 232436, "epoch": 1920} {"train_loss": -40.7462158203125, "global_step": 232437, "epoch": 1920} {"train_loss": -40.57136154174805, "global_step": 232438, "epoch": 1920} {"train_loss": -40.8856201171875, "global_step": 232439, "epoch": 1920} {"train_loss": -40.341031807513275, "global_step": 232440, "epoch": 1920, "val_loss": 2660108.25} {"train_loss": -41.367855072021484, "global_step": 232441, "epoch": 1921} {"train_loss": -41.845733642578125, "global_step": 232442, "epoch": 1921} {"train_loss": -41.27611541748047, "global_step": 232443, "epoch": 1921} {"train_loss": -39.965118408203125, "global_step": 232444, "epoch": 1921} {"train_loss": -41.84279251098633, "global_step": 232445, "epoch": 1921} {"train_loss": -41.680721282958984, "global_step": 232446, "epoch": 1921} {"train_loss": -39.646915435791016, "global_step": 232447, "epoch": 1921} {"train_loss": -37.90901565551758, "global_step": 232448, "epoch": 1921} {"train_loss": -40.45778274536133, "global_step": 232449, "epoch": 1921} {"train_loss": -38.79177474975586, "global_step": 232450, "epoch": 1921} {"train_loss": -37.86129379272461, "global_step": 232451, "epoch": 1921} {"train_loss": -37.28359603881836, "global_step": 232452, "epoch": 1921} {"train_loss": -37.87843704223633, "global_step": 232453, "epoch": 1921} {"train_loss": -42.191650390625, "global_step": 232454, "epoch": 1921} {"train_loss": -39.02476119995117, "global_step": 232455, "epoch": 1921} {"train_loss": -39.12131881713867, "global_step": 232456, "epoch": 1921} {"train_loss": -41.06013870239258, "global_step": 232457, "epoch": 1921} {"train_loss": -40.35000228881836, "global_step": 232458, "epoch": 1921} {"train_loss": -40.5627555847168, "global_step": 232459, "epoch": 1921} {"train_loss": -39.99166488647461, "global_step": 232460, "epoch": 1921} {"train_loss": -41.76031494140625, "global_step": 232461, "epoch": 1921} {"train_loss": -41.44333267211914, "global_step": 232462, "epoch": 1921} {"train_loss": -41.20786666870117, "global_step": 232463, "epoch": 1921} {"train_loss": -41.33203125, "global_step": 232464, "epoch": 1921} {"train_loss": -41.875823974609375, "global_step": 232465, "epoch": 1921} {"train_loss": -42.067535400390625, "global_step": 232466, "epoch": 1921} {"train_loss": -42.23017120361328, "global_step": 232467, "epoch": 1921} {"train_loss": -41.63640594482422, "global_step": 232468, "epoch": 1921} {"train_loss": -41.8536262512207, "global_step": 232469, "epoch": 1921} {"train_loss": -41.78937530517578, "global_step": 232470, "epoch": 1921} {"train_loss": -41.815704345703125, "global_step": 232471, "epoch": 1921} {"train_loss": -41.60047912597656, "global_step": 232472, "epoch": 1921} {"train_loss": -41.8909797668457, "global_step": 232473, "epoch": 1921} {"train_loss": -42.27747344970703, "global_step": 232474, "epoch": 1921} {"train_loss": -40.90842819213867, "global_step": 232475, "epoch": 1921} {"train_loss": -41.92197799682617, "global_step": 232476, "epoch": 1921} {"train_loss": -41.142372131347656, "global_step": 232477, "epoch": 1921} {"train_loss": -40.55637741088867, "global_step": 232478, "epoch": 1921} {"train_loss": -42.04999542236328, "global_step": 232479, "epoch": 1921} {"train_loss": -41.88459777832031, "global_step": 232480, "epoch": 1921} {"train_loss": -41.87693405151367, "global_step": 232481, "epoch": 1921} {"train_loss": -42.52753829956055, "global_step": 232482, "epoch": 1921} {"train_loss": -42.29508590698242, "global_step": 232483, "epoch": 1921} {"train_loss": -42.313941955566406, "global_step": 232484, "epoch": 1921} {"train_loss": -41.50064468383789, "global_step": 232485, "epoch": 1921} {"train_loss": -42.36867141723633, "global_step": 232486, "epoch": 1921} {"train_loss": -41.20410919189453, "global_step": 232487, "epoch": 1921} {"train_loss": -41.849388122558594, "global_step": 232488, "epoch": 1921} {"train_loss": -39.57484817504883, "global_step": 232489, "epoch": 1921} {"train_loss": -41.923038482666016, "global_step": 232490, "epoch": 1921} {"train_loss": -42.0082893371582, "global_step": 232491, "epoch": 1921} {"train_loss": -42.335060119628906, "global_step": 232492, "epoch": 1921} {"train_loss": -42.0857048034668, "global_step": 232493, "epoch": 1921} {"train_loss": -41.71906661987305, "global_step": 232494, "epoch": 1921} {"train_loss": -42.4733772277832, "global_step": 232495, "epoch": 1921} {"train_loss": -42.208377838134766, "global_step": 232496, "epoch": 1921} {"train_loss": -41.94150924682617, "global_step": 232497, "epoch": 1921} {"train_loss": -42.020301818847656, "global_step": 232498, "epoch": 1921} {"train_loss": -41.439208984375, "global_step": 232499, "epoch": 1921} {"train_loss": -42.53907775878906, "global_step": 232500, "epoch": 1921} {"train_loss": -42.48577117919922, "global_step": 232501, "epoch": 1921} {"train_loss": -42.96786117553711, "global_step": 232502, "epoch": 1921} {"train_loss": -42.364715576171875, "global_step": 232503, "epoch": 1921} {"train_loss": -42.19415283203125, "global_step": 232504, "epoch": 1921} {"train_loss": -42.64563751220703, "global_step": 232505, "epoch": 1921} {"train_loss": -42.42302322387695, "global_step": 232506, "epoch": 1921} {"train_loss": -42.58022689819336, "global_step": 232507, "epoch": 1921} {"train_loss": -42.723846435546875, "global_step": 232508, "epoch": 1921} {"train_loss": -41.08638000488281, "global_step": 232509, "epoch": 1921} {"train_loss": -41.937843322753906, "global_step": 232510, "epoch": 1921} {"train_loss": -42.786983489990234, "global_step": 232511, "epoch": 1921} {"train_loss": -40.56548309326172, "global_step": 232512, "epoch": 1921} {"train_loss": -40.53443145751953, "global_step": 232513, "epoch": 1921} {"train_loss": -42.46778106689453, "global_step": 232514, "epoch": 1921} {"train_loss": -42.4190673828125, "global_step": 232515, "epoch": 1921} {"train_loss": -42.42885208129883, "global_step": 232516, "epoch": 1921} {"train_loss": -42.459938049316406, "global_step": 232517, "epoch": 1921} {"train_loss": -42.26166534423828, "global_step": 232518, "epoch": 1921} {"train_loss": -41.782508850097656, "global_step": 232519, "epoch": 1921} {"train_loss": -42.9597053527832, "global_step": 232520, "epoch": 1921} {"train_loss": -41.688087463378906, "global_step": 232521, "epoch": 1921} {"train_loss": -41.34980392456055, "global_step": 232522, "epoch": 1921} {"train_loss": -41.4362907409668, "global_step": 232523, "epoch": 1921} {"train_loss": -40.8011474609375, "global_step": 232524, "epoch": 1921} {"train_loss": -41.73601150512695, "global_step": 232525, "epoch": 1921} {"train_loss": -39.492923736572266, "global_step": 232526, "epoch": 1921} {"train_loss": -39.89775466918945, "global_step": 232527, "epoch": 1921} {"train_loss": -38.80109786987305, "global_step": 232528, "epoch": 1921} {"train_loss": -40.92910385131836, "global_step": 232529, "epoch": 1921} {"train_loss": -39.72749328613281, "global_step": 232530, "epoch": 1921} {"train_loss": -41.07172775268555, "global_step": 232531, "epoch": 1921} {"train_loss": -38.386451721191406, "global_step": 232532, "epoch": 1921} {"train_loss": -40.21217346191406, "global_step": 232533, "epoch": 1921} {"train_loss": -38.202362060546875, "global_step": 232534, "epoch": 1921} {"train_loss": -39.2301139831543, "global_step": 232535, "epoch": 1921} {"train_loss": -40.087646484375, "global_step": 232536, "epoch": 1921} {"train_loss": -37.8033561706543, "global_step": 232537, "epoch": 1921} {"train_loss": -39.77128219604492, "global_step": 232538, "epoch": 1921} {"train_loss": -38.297637939453125, "global_step": 232539, "epoch": 1921} {"train_loss": -40.64725875854492, "global_step": 232540, "epoch": 1921} {"train_loss": -39.75490188598633, "global_step": 232541, "epoch": 1921} {"train_loss": -40.19094467163086, "global_step": 232542, "epoch": 1921} {"train_loss": -37.46691131591797, "global_step": 232543, "epoch": 1921} {"train_loss": -39.76772689819336, "global_step": 232544, "epoch": 1921} {"train_loss": -40.79557800292969, "global_step": 232545, "epoch": 1921} {"train_loss": -37.129051208496094, "global_step": 232546, "epoch": 1921} {"train_loss": -40.89246368408203, "global_step": 232547, "epoch": 1921} {"train_loss": -40.357818603515625, "global_step": 232548, "epoch": 1921} {"train_loss": -40.88418197631836, "global_step": 232549, "epoch": 1921} {"train_loss": -40.54777145385742, "global_step": 232550, "epoch": 1921} {"train_loss": -39.835262298583984, "global_step": 232551, "epoch": 1921} {"train_loss": -40.77649688720703, "global_step": 232552, "epoch": 1921} {"train_loss": -39.560638427734375, "global_step": 232553, "epoch": 1921} {"train_loss": -40.824092864990234, "global_step": 232554, "epoch": 1921} {"train_loss": -40.95685577392578, "global_step": 232555, "epoch": 1921} {"train_loss": -41.354591369628906, "global_step": 232556, "epoch": 1921} {"train_loss": -40.466827392578125, "global_step": 232557, "epoch": 1921} {"train_loss": -42.38059616088867, "global_step": 232558, "epoch": 1921} {"train_loss": -41.36075973510742, "global_step": 232559, "epoch": 1921} {"train_loss": -39.90138626098633, "global_step": 232560, "epoch": 1921} {"train_loss": -41.01070306320821, "global_step": 232561, "epoch": 1921, "val_loss": 2621750.25} {"train_loss": -40.81508255004883, "global_step": 232562, "epoch": 1922} {"train_loss": -41.324893951416016, "global_step": 232563, "epoch": 1922} {"train_loss": -41.425350189208984, "global_step": 232564, "epoch": 1922} {"train_loss": -41.94004821777344, "global_step": 232565, "epoch": 1922} {"train_loss": -40.556697845458984, "global_step": 232566, "epoch": 1922} {"train_loss": -41.35820388793945, "global_step": 232567, "epoch": 1922} {"train_loss": -40.842018127441406, "global_step": 232568, "epoch": 1922} {"train_loss": -41.81845474243164, "global_step": 232569, "epoch": 1922} {"train_loss": -41.492252349853516, "global_step": 232570, "epoch": 1922} {"train_loss": -41.117794036865234, "global_step": 232571, "epoch": 1922} {"train_loss": -41.772850036621094, "global_step": 232572, "epoch": 1922} {"train_loss": -42.333831787109375, "global_step": 232573, "epoch": 1922} {"train_loss": -41.641422271728516, "global_step": 232574, "epoch": 1922} {"train_loss": -41.75858688354492, "global_step": 232575, "epoch": 1922} {"train_loss": -40.85903549194336, "global_step": 232576, "epoch": 1922} {"train_loss": -42.4652214050293, "global_step": 232577, "epoch": 1922} {"train_loss": -41.73487854003906, "global_step": 232578, "epoch": 1922} {"train_loss": -41.98380661010742, "global_step": 232579, "epoch": 1922} {"train_loss": -42.171016693115234, "global_step": 232580, "epoch": 1922} {"train_loss": -42.258155822753906, "global_step": 232581, "epoch": 1922} {"train_loss": -41.99092483520508, "global_step": 232582, "epoch": 1922} {"train_loss": -41.081634521484375, "global_step": 232583, "epoch": 1922} {"train_loss": -42.557376861572266, "global_step": 232584, "epoch": 1922} {"train_loss": -42.2787971496582, "global_step": 232585, "epoch": 1922} {"train_loss": -41.359859466552734, "global_step": 232586, "epoch": 1922} {"train_loss": -40.62948989868164, "global_step": 232587, "epoch": 1922} {"train_loss": -42.505332946777344, "global_step": 232588, "epoch": 1922} {"train_loss": -41.9508171081543, "global_step": 232589, "epoch": 1922} {"train_loss": -42.3016357421875, "global_step": 232590, "epoch": 1922} {"train_loss": -42.01820755004883, "global_step": 232591, "epoch": 1922} {"train_loss": -42.36192321777344, "global_step": 232592, "epoch": 1922} {"train_loss": -42.96956253051758, "global_step": 232593, "epoch": 1922} {"train_loss": -37.889381408691406, "global_step": 232594, "epoch": 1922} {"train_loss": -42.65277862548828, "global_step": 232595, "epoch": 1922} {"train_loss": -42.4139518737793, "global_step": 232596, "epoch": 1922} {"train_loss": -42.303253173828125, "global_step": 232597, "epoch": 1922} {"train_loss": -42.86524200439453, "global_step": 232598, "epoch": 1922} {"train_loss": -42.87176513671875, "global_step": 232599, "epoch": 1922} {"train_loss": -42.407588958740234, "global_step": 232600, "epoch": 1922} {"train_loss": -42.67204284667969, "global_step": 232601, "epoch": 1922} {"train_loss": -42.37986373901367, "global_step": 232602, "epoch": 1922} {"train_loss": -41.89359664916992, "global_step": 232603, "epoch": 1922} {"train_loss": -42.81332015991211, "global_step": 232604, "epoch": 1922} {"train_loss": -42.7363395690918, "global_step": 232605, "epoch": 1922} {"train_loss": -42.042598724365234, "global_step": 232606, "epoch": 1922} {"train_loss": -42.90925979614258, "global_step": 232607, "epoch": 1922} {"train_loss": -42.36585998535156, "global_step": 232608, "epoch": 1922} {"train_loss": -41.88832473754883, "global_step": 232609, "epoch": 1922} {"train_loss": -42.33694076538086, "global_step": 232610, "epoch": 1922} {"train_loss": -42.520233154296875, "global_step": 232611, "epoch": 1922} {"train_loss": -41.19926071166992, "global_step": 232612, "epoch": 1922} {"train_loss": -41.3945426940918, "global_step": 232613, "epoch": 1922} {"train_loss": -40.24534606933594, "global_step": 232614, "epoch": 1922} {"train_loss": -41.13444900512695, "global_step": 232615, "epoch": 1922} {"train_loss": -42.44251251220703, "global_step": 232616, "epoch": 1922} {"train_loss": -42.398494720458984, "global_step": 232617, "epoch": 1922} {"train_loss": -42.35700607299805, "global_step": 232618, "epoch": 1922} {"train_loss": -40.30353927612305, "global_step": 232619, "epoch": 1922} {"train_loss": -41.728050231933594, "global_step": 232620, "epoch": 1922} {"train_loss": -41.38041305541992, "global_step": 232621, "epoch": 1922} {"train_loss": -39.0745964050293, "global_step": 232622, "epoch": 1922} {"train_loss": -39.555450439453125, "global_step": 232623, "epoch": 1922} {"train_loss": -41.08102035522461, "global_step": 232624, "epoch": 1922} {"train_loss": -41.533912658691406, "global_step": 232625, "epoch": 1922} {"train_loss": -41.4345817565918, "global_step": 232626, "epoch": 1922} {"train_loss": -40.63557052612305, "global_step": 232627, "epoch": 1922} {"train_loss": -41.280921936035156, "global_step": 232628, "epoch": 1922} {"train_loss": -42.81431198120117, "global_step": 232629, "epoch": 1922} {"train_loss": -41.82717514038086, "global_step": 232630, "epoch": 1922} {"train_loss": -41.6129150390625, "global_step": 232631, "epoch": 1922} {"train_loss": -41.6207275390625, "global_step": 232632, "epoch": 1922} {"train_loss": -42.09855270385742, "global_step": 232633, "epoch": 1922} {"train_loss": -41.68351745605469, "global_step": 232634, "epoch": 1922} {"train_loss": -42.116371154785156, "global_step": 232635, "epoch": 1922} {"train_loss": -42.41730499267578, "global_step": 232636, "epoch": 1922} {"train_loss": -42.11642837524414, "global_step": 232637, "epoch": 1922} {"train_loss": -42.72321319580078, "global_step": 232638, "epoch": 1922} {"train_loss": -42.28456115722656, "global_step": 232639, "epoch": 1922} {"train_loss": -41.794158935546875, "global_step": 232640, "epoch": 1922} {"train_loss": -42.15959548950195, "global_step": 232641, "epoch": 1922} {"train_loss": -40.565155029296875, "global_step": 232642, "epoch": 1922} {"train_loss": -40.279151916503906, "global_step": 232643, "epoch": 1922} {"train_loss": -38.3934440612793, "global_step": 232644, "epoch": 1922} {"train_loss": -34.369754791259766, "global_step": 232645, "epoch": 1922} {"train_loss": -31.16936683654785, "global_step": 232646, "epoch": 1922} {"train_loss": -32.905487060546875, "global_step": 232647, "epoch": 1922} {"train_loss": -39.7974967956543, "global_step": 232648, "epoch": 1922} {"train_loss": -41.65972900390625, "global_step": 232649, "epoch": 1922} {"train_loss": -38.60248947143555, "global_step": 232650, "epoch": 1922} {"train_loss": -41.28725051879883, "global_step": 232651, "epoch": 1922} {"train_loss": -39.576873779296875, "global_step": 232652, "epoch": 1922} {"train_loss": -38.469329833984375, "global_step": 232653, "epoch": 1922} {"train_loss": -41.833709716796875, "global_step": 232654, "epoch": 1922} {"train_loss": -40.6222038269043, "global_step": 232655, "epoch": 1922} {"train_loss": -40.16558074951172, "global_step": 232656, "epoch": 1922} {"train_loss": -41.03260040283203, "global_step": 232657, "epoch": 1922} {"train_loss": -40.98977279663086, "global_step": 232658, "epoch": 1922} {"train_loss": -41.09196472167969, "global_step": 232659, "epoch": 1922} {"train_loss": -41.26921844482422, "global_step": 232660, "epoch": 1922} {"train_loss": -42.000728607177734, "global_step": 232661, "epoch": 1922} {"train_loss": -41.596900939941406, "global_step": 232662, "epoch": 1922} {"train_loss": -41.081268310546875, "global_step": 232663, "epoch": 1922} {"train_loss": -41.83589553833008, "global_step": 232664, "epoch": 1922} {"train_loss": -41.77326965332031, "global_step": 232665, "epoch": 1922} {"train_loss": -41.74945831298828, "global_step": 232666, "epoch": 1922} {"train_loss": -42.35026931762695, "global_step": 232667, "epoch": 1922} {"train_loss": -41.57678985595703, "global_step": 232668, "epoch": 1922} {"train_loss": -41.80825424194336, "global_step": 232669, "epoch": 1922} {"train_loss": -41.501033782958984, "global_step": 232670, "epoch": 1922} {"train_loss": -41.89931869506836, "global_step": 232671, "epoch": 1922} {"train_loss": -41.7021598815918, "global_step": 232672, "epoch": 1922} {"train_loss": -41.013885498046875, "global_step": 232673, "epoch": 1922} {"train_loss": -41.442928314208984, "global_step": 232674, "epoch": 1922} {"train_loss": -42.56943893432617, "global_step": 232675, "epoch": 1922} {"train_loss": -42.06952667236328, "global_step": 232676, "epoch": 1922} {"train_loss": -41.84493637084961, "global_step": 232677, "epoch": 1922} {"train_loss": -42.23366928100586, "global_step": 232678, "epoch": 1922} {"train_loss": -42.02415084838867, "global_step": 232679, "epoch": 1922} {"train_loss": -42.05705642700195, "global_step": 232680, "epoch": 1922} {"train_loss": -42.60157012939453, "global_step": 232681, "epoch": 1922} {"train_loss": -41.38129429777792, "global_step": 232682, "epoch": 1922, "val_loss": 2658928.75} {"train_loss": -42.63900375366211, "global_step": 232683, "epoch": 1923} {"train_loss": -42.19956588745117, "global_step": 232684, "epoch": 1923} {"train_loss": -42.33438491821289, "global_step": 232685, "epoch": 1923} {"train_loss": -42.27920150756836, "global_step": 232686, "epoch": 1923} {"train_loss": -42.13705825805664, "global_step": 232687, "epoch": 1923} {"train_loss": -42.774959564208984, "global_step": 232688, "epoch": 1923} {"train_loss": -42.43341827392578, "global_step": 232689, "epoch": 1923} {"train_loss": -42.03976058959961, "global_step": 232690, "epoch": 1923} {"train_loss": -42.068355560302734, "global_step": 232691, "epoch": 1923} {"train_loss": -41.921791076660156, "global_step": 232692, "epoch": 1923} {"train_loss": -41.56446075439453, "global_step": 232693, "epoch": 1923} {"train_loss": -41.699676513671875, "global_step": 232694, "epoch": 1923} {"train_loss": -42.729976654052734, "global_step": 232695, "epoch": 1923} {"train_loss": -42.124786376953125, "global_step": 232696, "epoch": 1923} {"train_loss": -41.60721969604492, "global_step": 232697, "epoch": 1923} {"train_loss": -43.03458786010742, "global_step": 232698, "epoch": 1923} {"train_loss": -42.45499801635742, "global_step": 232699, "epoch": 1923} {"train_loss": -41.346038818359375, "global_step": 232700, "epoch": 1923} {"train_loss": -42.49279022216797, "global_step": 232701, "epoch": 1923} {"train_loss": -41.65773391723633, "global_step": 232702, "epoch": 1923} {"train_loss": -42.657020568847656, "global_step": 232703, "epoch": 1923} {"train_loss": -41.68781661987305, "global_step": 232704, "epoch": 1923} {"train_loss": -40.86592483520508, "global_step": 232705, "epoch": 1923} {"train_loss": -42.45252227783203, "global_step": 232706, "epoch": 1923} {"train_loss": -43.11917495727539, "global_step": 232707, "epoch": 1923} {"train_loss": -42.78373336791992, "global_step": 232708, "epoch": 1923} {"train_loss": -42.66553497314453, "global_step": 232709, "epoch": 1923} {"train_loss": -42.85537338256836, "global_step": 232710, "epoch": 1923} {"train_loss": -42.56039047241211, "global_step": 232711, "epoch": 1923} {"train_loss": -42.88347244262695, "global_step": 232712, "epoch": 1923} {"train_loss": -42.756954193115234, "global_step": 232713, "epoch": 1923} {"train_loss": -42.149349212646484, "global_step": 232714, "epoch": 1923} {"train_loss": -42.575801849365234, "global_step": 232715, "epoch": 1923} {"train_loss": -42.36098861694336, "global_step": 232716, "epoch": 1923} {"train_loss": -42.83750534057617, "global_step": 232717, "epoch": 1923} {"train_loss": -41.69984817504883, "global_step": 232718, "epoch": 1923} {"train_loss": -41.35993194580078, "global_step": 232719, "epoch": 1923} {"train_loss": -43.119754791259766, "global_step": 232720, "epoch": 1923} {"train_loss": -42.601444244384766, "global_step": 232721, "epoch": 1923} {"train_loss": -42.49190139770508, "global_step": 232722, "epoch": 1923} {"train_loss": -42.07624053955078, "global_step": 232723, "epoch": 1923} {"train_loss": -42.56620407104492, "global_step": 232724, "epoch": 1923} {"train_loss": -42.353328704833984, "global_step": 232725, "epoch": 1923} {"train_loss": -42.94771194458008, "global_step": 232726, "epoch": 1923} {"train_loss": -40.28341293334961, "global_step": 232727, "epoch": 1923} {"train_loss": -42.82329177856445, "global_step": 232728, "epoch": 1923} {"train_loss": -42.47890853881836, "global_step": 232729, "epoch": 1923} {"train_loss": -42.63859176635742, "global_step": 232730, "epoch": 1923} {"train_loss": -43.02950668334961, "global_step": 232731, "epoch": 1923} {"train_loss": -41.868995666503906, "global_step": 232732, "epoch": 1923} {"train_loss": -40.04424285888672, "global_step": 232733, "epoch": 1923} {"train_loss": -38.621639251708984, "global_step": 232734, "epoch": 1923} {"train_loss": -39.654083251953125, "global_step": 232735, "epoch": 1923} {"train_loss": -41.036312103271484, "global_step": 232736, "epoch": 1923} {"train_loss": -40.4169807434082, "global_step": 232737, "epoch": 1923} {"train_loss": -39.206478118896484, "global_step": 232738, "epoch": 1923} {"train_loss": -39.07476043701172, "global_step": 232739, "epoch": 1923} {"train_loss": -40.8740119934082, "global_step": 232740, "epoch": 1923} {"train_loss": -40.14396286010742, "global_step": 232741, "epoch": 1923} {"train_loss": -39.10124588012695, "global_step": 232742, "epoch": 1923} {"train_loss": -40.78950119018555, "global_step": 232743, "epoch": 1923} {"train_loss": -40.00136947631836, "global_step": 232744, "epoch": 1923} {"train_loss": -40.73053741455078, "global_step": 232745, "epoch": 1923} {"train_loss": -40.716651916503906, "global_step": 232746, "epoch": 1923} {"train_loss": -42.227386474609375, "global_step": 232747, "epoch": 1923} {"train_loss": -40.9278450012207, "global_step": 232748, "epoch": 1923} {"train_loss": -41.599639892578125, "global_step": 232749, "epoch": 1923} {"train_loss": -41.9813346862793, "global_step": 232750, "epoch": 1923} {"train_loss": -38.406612396240234, "global_step": 232751, "epoch": 1923} {"train_loss": -40.90943145751953, "global_step": 232752, "epoch": 1923} {"train_loss": -40.43646240234375, "global_step": 232753, "epoch": 1923} {"train_loss": -39.616424560546875, "global_step": 232754, "epoch": 1923} {"train_loss": -41.062984466552734, "global_step": 232755, "epoch": 1923} {"train_loss": -39.875091552734375, "global_step": 232756, "epoch": 1923} {"train_loss": -41.8313102722168, "global_step": 232757, "epoch": 1923} {"train_loss": -40.547855377197266, "global_step": 232758, "epoch": 1923} {"train_loss": -40.957088470458984, "global_step": 232759, "epoch": 1923} {"train_loss": -41.0947151184082, "global_step": 232760, "epoch": 1923} {"train_loss": -41.32493591308594, "global_step": 232761, "epoch": 1923} {"train_loss": -41.42369842529297, "global_step": 232762, "epoch": 1923} {"train_loss": -41.65141677856445, "global_step": 232763, "epoch": 1923} {"train_loss": -41.53923797607422, "global_step": 232764, "epoch": 1923} {"train_loss": -42.369686126708984, "global_step": 232765, "epoch": 1923} {"train_loss": -41.72856903076172, "global_step": 232766, "epoch": 1923} {"train_loss": -40.57442855834961, "global_step": 232767, "epoch": 1923} {"train_loss": -41.79061508178711, "global_step": 232768, "epoch": 1923} {"train_loss": -41.760223388671875, "global_step": 232769, "epoch": 1923} {"train_loss": -42.288917541503906, "global_step": 232770, "epoch": 1923} {"train_loss": -41.50600814819336, "global_step": 232771, "epoch": 1923} {"train_loss": -41.97724914550781, "global_step": 232772, "epoch": 1923} {"train_loss": -42.48107147216797, "global_step": 232773, "epoch": 1923} {"train_loss": -41.21503829956055, "global_step": 232774, "epoch": 1923} {"train_loss": -42.05996322631836, "global_step": 232775, "epoch": 1923} {"train_loss": -41.205360412597656, "global_step": 232776, "epoch": 1923} {"train_loss": -41.53821563720703, "global_step": 232777, "epoch": 1923} {"train_loss": -41.93958282470703, "global_step": 232778, "epoch": 1923} {"train_loss": -41.984901428222656, "global_step": 232779, "epoch": 1923} {"train_loss": -42.387752532958984, "global_step": 232780, "epoch": 1923} {"train_loss": -41.24755859375, "global_step": 232781, "epoch": 1923} {"train_loss": -42.23159408569336, "global_step": 232782, "epoch": 1923} {"train_loss": -42.16621398925781, "global_step": 232783, "epoch": 1923} {"train_loss": -42.0966911315918, "global_step": 232784, "epoch": 1923} {"train_loss": -42.042842864990234, "global_step": 232785, "epoch": 1923} {"train_loss": -41.8609733581543, "global_step": 232786, "epoch": 1923} {"train_loss": -42.09869384765625, "global_step": 232787, "epoch": 1923} {"train_loss": -42.825069427490234, "global_step": 232788, "epoch": 1923} {"train_loss": -42.395118713378906, "global_step": 232789, "epoch": 1923} {"train_loss": -42.587337493896484, "global_step": 232790, "epoch": 1923} {"train_loss": -41.79897689819336, "global_step": 232791, "epoch": 1923} {"train_loss": -41.38788986206055, "global_step": 232792, "epoch": 1923} {"train_loss": -42.296180725097656, "global_step": 232793, "epoch": 1923} {"train_loss": -42.384185791015625, "global_step": 232794, "epoch": 1923} {"train_loss": -42.020240783691406, "global_step": 232795, "epoch": 1923} {"train_loss": -42.34208297729492, "global_step": 232796, "epoch": 1923} {"train_loss": -40.9844856262207, "global_step": 232797, "epoch": 1923} {"train_loss": -42.27377700805664, "global_step": 232798, "epoch": 1923} {"train_loss": -42.62042999267578, "global_step": 232799, "epoch": 1923} {"train_loss": -42.47411346435547, "global_step": 232800, "epoch": 1923} {"train_loss": -43.04244613647461, "global_step": 232801, "epoch": 1923} {"train_loss": -42.69855880737305, "global_step": 232802, "epoch": 1923} {"train_loss": -41.754297619023596, "global_step": 232803, "epoch": 1923, "val_loss": 2658005.0} {"train_loss": -42.16101837158203, "global_step": 232804, "epoch": 1924} {"train_loss": -41.93410873413086, "global_step": 232805, "epoch": 1924} {"train_loss": -43.04536056518555, "global_step": 232806, "epoch": 1924} {"train_loss": -42.48386764526367, "global_step": 232807, "epoch": 1924} {"train_loss": -43.11980056762695, "global_step": 232808, "epoch": 1924} {"train_loss": -43.215816497802734, "global_step": 232809, "epoch": 1924} {"train_loss": -42.329872131347656, "global_step": 232810, "epoch": 1924} {"train_loss": -42.89754867553711, "global_step": 232811, "epoch": 1924} {"train_loss": -42.51070022583008, "global_step": 232812, "epoch": 1924} {"train_loss": -42.343502044677734, "global_step": 232813, "epoch": 1924} {"train_loss": -42.60691452026367, "global_step": 232814, "epoch": 1924} {"train_loss": -41.68199920654297, "global_step": 232815, "epoch": 1924} {"train_loss": -43.61343765258789, "global_step": 232816, "epoch": 1924} {"train_loss": -42.454833984375, "global_step": 232817, "epoch": 1924} {"train_loss": -42.64128494262695, "global_step": 232818, "epoch": 1924} {"train_loss": -43.479209899902344, "global_step": 232819, "epoch": 1924} {"train_loss": -41.91925048828125, "global_step": 232820, "epoch": 1924} {"train_loss": -42.59623336791992, "global_step": 232821, "epoch": 1924} {"train_loss": -43.47712326049805, "global_step": 232822, "epoch": 1924} {"train_loss": -42.31283187866211, "global_step": 232823, "epoch": 1924} {"train_loss": -43.66123580932617, "global_step": 232824, "epoch": 1924} {"train_loss": -43.55654525756836, "global_step": 232825, "epoch": 1924} {"train_loss": -42.9309196472168, "global_step": 232826, "epoch": 1924} {"train_loss": -42.71791458129883, "global_step": 232827, "epoch": 1924} {"train_loss": -42.69143295288086, "global_step": 232828, "epoch": 1924} {"train_loss": -42.75029373168945, "global_step": 232829, "epoch": 1924} {"train_loss": -42.42536163330078, "global_step": 232830, "epoch": 1924} {"train_loss": -43.076114654541016, "global_step": 232831, "epoch": 1924} {"train_loss": -42.75487518310547, "global_step": 232832, "epoch": 1924} {"train_loss": -42.8395881652832, "global_step": 232833, "epoch": 1924} {"train_loss": -43.50321578979492, "global_step": 232834, "epoch": 1924} {"train_loss": -43.42464828491211, "global_step": 232835, "epoch": 1924} {"train_loss": -43.1038932800293, "global_step": 232836, "epoch": 1924} {"train_loss": -43.36912536621094, "global_step": 232837, "epoch": 1924} {"train_loss": -42.2458381652832, "global_step": 232838, "epoch": 1924} {"train_loss": -42.61042404174805, "global_step": 232839, "epoch": 1924} {"train_loss": -42.48177719116211, "global_step": 232840, "epoch": 1924} {"train_loss": -42.67695999145508, "global_step": 232841, "epoch": 1924} {"train_loss": -42.85322189331055, "global_step": 232842, "epoch": 1924} {"train_loss": -42.99607467651367, "global_step": 232843, "epoch": 1924} {"train_loss": -42.718475341796875, "global_step": 232844, "epoch": 1924} {"train_loss": -43.336448669433594, "global_step": 232845, "epoch": 1924} {"train_loss": -42.5421028137207, "global_step": 232846, "epoch": 1924} {"train_loss": -42.81196212768555, "global_step": 232847, "epoch": 1924} {"train_loss": -42.73308181762695, "global_step": 232848, "epoch": 1924} {"train_loss": -41.744991302490234, "global_step": 232849, "epoch": 1924} {"train_loss": -42.663448333740234, "global_step": 232850, "epoch": 1924} {"train_loss": -42.2009391784668, "global_step": 232851, "epoch": 1924} {"train_loss": -42.535770416259766, "global_step": 232852, "epoch": 1924} {"train_loss": -43.47620391845703, "global_step": 232853, "epoch": 1924} {"train_loss": -42.01850509643555, "global_step": 232854, "epoch": 1924} {"train_loss": -41.808780670166016, "global_step": 232855, "epoch": 1924} {"train_loss": -42.47599411010742, "global_step": 232856, "epoch": 1924} {"train_loss": -41.74197769165039, "global_step": 232857, "epoch": 1924} {"train_loss": -40.412696838378906, "global_step": 232858, "epoch": 1924} {"train_loss": -42.74816131591797, "global_step": 232859, "epoch": 1924} {"train_loss": -41.0153923034668, "global_step": 232860, "epoch": 1924} {"train_loss": -39.595638275146484, "global_step": 232861, "epoch": 1924} {"train_loss": -35.7050666809082, "global_step": 232862, "epoch": 1924} {"train_loss": -24.54788589477539, "global_step": 232863, "epoch": 1924} {"train_loss": -15.041259765625, "global_step": 232864, "epoch": 1924} {"train_loss": -26.661176681518555, "global_step": 232865, "epoch": 1924} {"train_loss": -39.256263732910156, "global_step": 232866, "epoch": 1924} {"train_loss": -37.1499137878418, "global_step": 232867, "epoch": 1924} {"train_loss": -32.783363342285156, "global_step": 232868, "epoch": 1924} {"train_loss": -40.483009338378906, "global_step": 232869, "epoch": 1924} {"train_loss": -34.33826446533203, "global_step": 232870, "epoch": 1924} {"train_loss": -38.344993591308594, "global_step": 232871, "epoch": 1924} {"train_loss": -36.164093017578125, "global_step": 232872, "epoch": 1924} {"train_loss": -37.206539154052734, "global_step": 232873, "epoch": 1924} {"train_loss": -38.15342712402344, "global_step": 232874, "epoch": 1924} {"train_loss": -35.71958541870117, "global_step": 232875, "epoch": 1924} {"train_loss": -37.839881896972656, "global_step": 232876, "epoch": 1924} {"train_loss": -36.15584945678711, "global_step": 232877, "epoch": 1924} {"train_loss": -39.670013427734375, "global_step": 232878, "epoch": 1924} {"train_loss": -37.51422882080078, "global_step": 232879, "epoch": 1924} {"train_loss": -39.4714241027832, "global_step": 232880, "epoch": 1924} {"train_loss": -38.0001106262207, "global_step": 232881, "epoch": 1924} {"train_loss": -40.40788650512695, "global_step": 232882, "epoch": 1924} {"train_loss": -38.835487365722656, "global_step": 232883, "epoch": 1924} {"train_loss": -40.077030181884766, "global_step": 232884, "epoch": 1924} {"train_loss": -40.3582878112793, "global_step": 232885, "epoch": 1924} {"train_loss": -39.68532943725586, "global_step": 232886, "epoch": 1924} {"train_loss": -40.29830551147461, "global_step": 232887, "epoch": 1924} {"train_loss": -40.615535736083984, "global_step": 232888, "epoch": 1924} {"train_loss": -41.58504867553711, "global_step": 232889, "epoch": 1924} {"train_loss": -39.857967376708984, "global_step": 232890, "epoch": 1924} {"train_loss": -39.93364334106445, "global_step": 232891, "epoch": 1924} {"train_loss": -40.69130325317383, "global_step": 232892, "epoch": 1924} {"train_loss": -41.21961212158203, "global_step": 232893, "epoch": 1924} {"train_loss": -41.154632568359375, "global_step": 232894, "epoch": 1924} {"train_loss": -41.198421478271484, "global_step": 232895, "epoch": 1924} {"train_loss": -41.18836212158203, "global_step": 232896, "epoch": 1924} {"train_loss": -40.68825912475586, "global_step": 232897, "epoch": 1924} {"train_loss": -40.5356330871582, "global_step": 232898, "epoch": 1924} {"train_loss": -40.99302291870117, "global_step": 232899, "epoch": 1924} {"train_loss": -40.28357696533203, "global_step": 232900, "epoch": 1924} {"train_loss": -41.20729446411133, "global_step": 232901, "epoch": 1924} {"train_loss": -41.60988998413086, "global_step": 232902, "epoch": 1924} {"train_loss": -41.427486419677734, "global_step": 232903, "epoch": 1924} {"train_loss": -41.1967887878418, "global_step": 232904, "epoch": 1924} {"train_loss": -41.87807083129883, "global_step": 232905, "epoch": 1924} {"train_loss": -41.83665084838867, "global_step": 232906, "epoch": 1924} {"train_loss": -41.67845916748047, "global_step": 232907, "epoch": 1924} {"train_loss": -41.69417953491211, "global_step": 232908, "epoch": 1924} {"train_loss": -42.22582244873047, "global_step": 232909, "epoch": 1924} {"train_loss": -41.38986587524414, "global_step": 232910, "epoch": 1924} {"train_loss": -42.203609466552734, "global_step": 232911, "epoch": 1924} {"train_loss": -41.8641357421875, "global_step": 232912, "epoch": 1924} {"train_loss": -42.41533660888672, "global_step": 232913, "epoch": 1924} {"train_loss": -38.48237991333008, "global_step": 232914, "epoch": 1924} {"train_loss": -42.20286178588867, "global_step": 232915, "epoch": 1924} {"train_loss": -41.632938385009766, "global_step": 232916, "epoch": 1924} {"train_loss": -40.864742279052734, "global_step": 232917, "epoch": 1924} {"train_loss": -40.67573928833008, "global_step": 232918, "epoch": 1924} {"train_loss": -41.59535217285156, "global_step": 232919, "epoch": 1924} {"train_loss": -38.58204650878906, "global_step": 232920, "epoch": 1924} {"train_loss": -40.4511833190918, "global_step": 232921, "epoch": 1924} {"train_loss": -42.05530548095703, "global_step": 232922, "epoch": 1924} {"train_loss": -41.2945671081543, "global_step": 232923, "epoch": 1924} {"train_loss": -40.75707296891646, "global_step": 232924, "epoch": 1924, "val_loss": 2752056.0} {"train_loss": -40.023292541503906, "global_step": 232925, "epoch": 1925} {"train_loss": -37.98470687866211, "global_step": 232926, "epoch": 1925} {"train_loss": -41.32557678222656, "global_step": 232927, "epoch": 1925} {"train_loss": -40.66356658935547, "global_step": 232928, "epoch": 1925} {"train_loss": -39.72554016113281, "global_step": 232929, "epoch": 1925} {"train_loss": -41.338043212890625, "global_step": 232930, "epoch": 1925} {"train_loss": -39.20601272583008, "global_step": 232931, "epoch": 1925} {"train_loss": -39.006622314453125, "global_step": 232932, "epoch": 1925} {"train_loss": -39.69214630126953, "global_step": 232933, "epoch": 1925} {"train_loss": -39.848663330078125, "global_step": 232934, "epoch": 1925} {"train_loss": -38.4382209777832, "global_step": 232935, "epoch": 1925} {"train_loss": -37.811641693115234, "global_step": 232936, "epoch": 1925} {"train_loss": -40.478477478027344, "global_step": 232937, "epoch": 1925} {"train_loss": -41.298133850097656, "global_step": 232938, "epoch": 1925} {"train_loss": -38.86747360229492, "global_step": 232939, "epoch": 1925} {"train_loss": -40.98496627807617, "global_step": 232940, "epoch": 1925} {"train_loss": -38.91055679321289, "global_step": 232941, "epoch": 1925} {"train_loss": -19.49408531188965, "global_step": 232942, "epoch": 1925} {"train_loss": -38.71318435668945, "global_step": 232943, "epoch": 1925} {"train_loss": -39.85637283325195, "global_step": 232944, "epoch": 1925} {"train_loss": -37.22944259643555, "global_step": 232945, "epoch": 1925} {"train_loss": -40.51587677001953, "global_step": 232946, "epoch": 1925} {"train_loss": -40.884559631347656, "global_step": 232947, "epoch": 1925} {"train_loss": -40.225975036621094, "global_step": 232948, "epoch": 1925} {"train_loss": -37.98408889770508, "global_step": 232949, "epoch": 1925} {"train_loss": -40.386749267578125, "global_step": 232950, "epoch": 1925} {"train_loss": -40.15998840332031, "global_step": 232951, "epoch": 1925} {"train_loss": -40.90250778198242, "global_step": 232952, "epoch": 1925} {"train_loss": -39.9827880859375, "global_step": 232953, "epoch": 1925} {"train_loss": -37.603302001953125, "global_step": 232954, "epoch": 1925} {"train_loss": -39.56423568725586, "global_step": 232955, "epoch": 1925} {"train_loss": -38.7880973815918, "global_step": 232956, "epoch": 1925} {"train_loss": -39.71295166015625, "global_step": 232957, "epoch": 1925} {"train_loss": -37.8876838684082, "global_step": 232958, "epoch": 1925} {"train_loss": -38.180301666259766, "global_step": 232959, "epoch": 1925} {"train_loss": -39.999446868896484, "global_step": 232960, "epoch": 1925} {"train_loss": -39.77150344848633, "global_step": 232961, "epoch": 1925} {"train_loss": -41.4210319519043, "global_step": 232962, "epoch": 1925} {"train_loss": -40.2105827331543, "global_step": 232963, "epoch": 1925} {"train_loss": -40.09718322753906, "global_step": 232964, "epoch": 1925} {"train_loss": -40.79792404174805, "global_step": 232965, "epoch": 1925} {"train_loss": -40.72365188598633, "global_step": 232966, "epoch": 1925} {"train_loss": -40.30503845214844, "global_step": 232967, "epoch": 1925} {"train_loss": -41.18867111206055, "global_step": 232968, "epoch": 1925} {"train_loss": -40.617610931396484, "global_step": 232969, "epoch": 1925} {"train_loss": -40.86604690551758, "global_step": 232970, "epoch": 1925} {"train_loss": -40.56642532348633, "global_step": 232971, "epoch": 1925} {"train_loss": -41.51176071166992, "global_step": 232972, "epoch": 1925} {"train_loss": -40.5089225769043, "global_step": 232973, "epoch": 1925} {"train_loss": -38.971893310546875, "global_step": 232974, "epoch": 1925} {"train_loss": -41.60783767700195, "global_step": 232975, "epoch": 1925} {"train_loss": -41.25083541870117, "global_step": 232976, "epoch": 1925} {"train_loss": -41.271297454833984, "global_step": 232977, "epoch": 1925} {"train_loss": -41.513607025146484, "global_step": 232978, "epoch": 1925} {"train_loss": -38.28458786010742, "global_step": 232979, "epoch": 1925} {"train_loss": -40.783447265625, "global_step": 232980, "epoch": 1925} {"train_loss": -42.02451705932617, "global_step": 232981, "epoch": 1925} {"train_loss": -40.954586029052734, "global_step": 232982, "epoch": 1925} {"train_loss": -41.29262924194336, "global_step": 232983, "epoch": 1925} {"train_loss": -41.51042938232422, "global_step": 232984, "epoch": 1925} {"train_loss": -41.20823287963867, "global_step": 232985, "epoch": 1925} {"train_loss": -42.003726959228516, "global_step": 232986, "epoch": 1925} {"train_loss": -41.27568435668945, "global_step": 232987, "epoch": 1925} {"train_loss": -41.21589279174805, "global_step": 232988, "epoch": 1925} {"train_loss": -41.555049896240234, "global_step": 232989, "epoch": 1925} {"train_loss": -39.35427474975586, "global_step": 232990, "epoch": 1925} {"train_loss": -41.60752487182617, "global_step": 232991, "epoch": 1925} {"train_loss": -42.0842399597168, "global_step": 232992, "epoch": 1925} {"train_loss": -41.230682373046875, "global_step": 232993, "epoch": 1925} {"train_loss": -41.458126068115234, "global_step": 232994, "epoch": 1925} {"train_loss": -41.57364273071289, "global_step": 232995, "epoch": 1925} {"train_loss": -40.72927474975586, "global_step": 232996, "epoch": 1925} {"train_loss": -41.847618103027344, "global_step": 232997, "epoch": 1925} {"train_loss": -41.1278076171875, "global_step": 232998, "epoch": 1925} {"train_loss": -40.50492477416992, "global_step": 232999, "epoch": 1925} {"train_loss": -40.011165618896484, "global_step": 233000, "epoch": 1925} {"train_loss": -39.32878112792969, "global_step": 233001, "epoch": 1925} {"train_loss": -41.9110107421875, "global_step": 233002, "epoch": 1925} {"train_loss": -41.564754486083984, "global_step": 233003, "epoch": 1925} {"train_loss": -40.69968795776367, "global_step": 233004, "epoch": 1925} {"train_loss": -41.57453536987305, "global_step": 233005, "epoch": 1925} {"train_loss": -41.23069381713867, "global_step": 233006, "epoch": 1925} {"train_loss": -42.023040771484375, "global_step": 233007, "epoch": 1925} {"train_loss": -41.94112014770508, "global_step": 233008, "epoch": 1925} {"train_loss": -41.053993225097656, "global_step": 233009, "epoch": 1925} {"train_loss": -41.83049392700195, "global_step": 233010, "epoch": 1925} {"train_loss": -41.4251823425293, "global_step": 233011, "epoch": 1925} {"train_loss": -42.5873908996582, "global_step": 233012, "epoch": 1925} {"train_loss": -42.09627151489258, "global_step": 233013, "epoch": 1925} {"train_loss": -42.62066650390625, "global_step": 233014, "epoch": 1925} {"train_loss": -41.29113006591797, "global_step": 233015, "epoch": 1925} {"train_loss": -42.39030075073242, "global_step": 233016, "epoch": 1925} {"train_loss": -42.04530715942383, "global_step": 233017, "epoch": 1925} {"train_loss": -42.011260986328125, "global_step": 233018, "epoch": 1925} {"train_loss": -42.388633728027344, "global_step": 233019, "epoch": 1925} {"train_loss": -41.87171936035156, "global_step": 233020, "epoch": 1925} {"train_loss": -42.56267166137695, "global_step": 233021, "epoch": 1925} {"train_loss": -42.9351692199707, "global_step": 233022, "epoch": 1925} {"train_loss": -42.15532302856445, "global_step": 233023, "epoch": 1925} {"train_loss": -42.276729583740234, "global_step": 233024, "epoch": 1925} {"train_loss": -41.67157745361328, "global_step": 233025, "epoch": 1925} {"train_loss": -42.337276458740234, "global_step": 233026, "epoch": 1925} {"train_loss": -42.2227783203125, "global_step": 233027, "epoch": 1925} {"train_loss": -42.266719818115234, "global_step": 233028, "epoch": 1925} {"train_loss": -42.08618927001953, "global_step": 233029, "epoch": 1925} {"train_loss": -42.49433517456055, "global_step": 233030, "epoch": 1925} {"train_loss": -42.74656295776367, "global_step": 233031, "epoch": 1925} {"train_loss": -42.90460968017578, "global_step": 233032, "epoch": 1925} {"train_loss": -41.453033447265625, "global_step": 233033, "epoch": 1925} {"train_loss": -42.4947624206543, "global_step": 233034, "epoch": 1925} {"train_loss": -42.71525192260742, "global_step": 233035, "epoch": 1925} {"train_loss": -42.26516342163086, "global_step": 233036, "epoch": 1925} {"train_loss": -42.32929229736328, "global_step": 233037, "epoch": 1925} {"train_loss": -43.007137298583984, "global_step": 233038, "epoch": 1925} {"train_loss": -42.65160369873047, "global_step": 233039, "epoch": 1925} {"train_loss": -42.33561325073242, "global_step": 233040, "epoch": 1925} {"train_loss": -42.27858352661133, "global_step": 233041, "epoch": 1925} {"train_loss": -41.850486755371094, "global_step": 233042, "epoch": 1925} {"train_loss": -42.634681701660156, "global_step": 233043, "epoch": 1925} {"train_loss": -42.59843826293945, "global_step": 233044, "epoch": 1925} {"train_loss": -40.77917545097919, "global_step": 233045, "epoch": 1925, "val_loss": 2719709.75} {"train_loss": -42.823944091796875, "global_step": 233046, "epoch": 1926} {"train_loss": -43.18459701538086, "global_step": 233047, "epoch": 1926} {"train_loss": -42.747230529785156, "global_step": 233048, "epoch": 1926} {"train_loss": -42.53575897216797, "global_step": 233049, "epoch": 1926} {"train_loss": -42.679473876953125, "global_step": 233050, "epoch": 1926} {"train_loss": -42.823360443115234, "global_step": 233051, "epoch": 1926} {"train_loss": -42.877197265625, "global_step": 233052, "epoch": 1926} {"train_loss": -42.59920120239258, "global_step": 233053, "epoch": 1926} {"train_loss": -42.75718307495117, "global_step": 233054, "epoch": 1926} {"train_loss": -42.23846435546875, "global_step": 233055, "epoch": 1926} {"train_loss": -41.499141693115234, "global_step": 233056, "epoch": 1926} {"train_loss": -42.5577507019043, "global_step": 233057, "epoch": 1926} {"train_loss": -41.81942367553711, "global_step": 233058, "epoch": 1926} {"train_loss": -41.35563278198242, "global_step": 233059, "epoch": 1926} {"train_loss": -41.504512786865234, "global_step": 233060, "epoch": 1926} {"train_loss": -41.21083068847656, "global_step": 233061, "epoch": 1926} {"train_loss": -40.548404693603516, "global_step": 233062, "epoch": 1926} {"train_loss": -41.5212287902832, "global_step": 233063, "epoch": 1926} {"train_loss": -42.3550910949707, "global_step": 233064, "epoch": 1926} {"train_loss": -42.520320892333984, "global_step": 233065, "epoch": 1926} {"train_loss": -42.22842025756836, "global_step": 233066, "epoch": 1926} {"train_loss": -41.074851989746094, "global_step": 233067, "epoch": 1926} {"train_loss": -40.415645599365234, "global_step": 233068, "epoch": 1926} {"train_loss": -40.88029098510742, "global_step": 233069, "epoch": 1926} {"train_loss": -42.0153923034668, "global_step": 233070, "epoch": 1926} {"train_loss": -42.963985443115234, "global_step": 233071, "epoch": 1926} {"train_loss": -41.00624465942383, "global_step": 233072, "epoch": 1926} {"train_loss": -41.06974792480469, "global_step": 233073, "epoch": 1926} {"train_loss": -41.59443283081055, "global_step": 233074, "epoch": 1926} {"train_loss": -41.70759582519531, "global_step": 233075, "epoch": 1926} {"train_loss": -38.17695617675781, "global_step": 233076, "epoch": 1926} {"train_loss": -38.42064666748047, "global_step": 233077, "epoch": 1926} {"train_loss": -41.1628532409668, "global_step": 233078, "epoch": 1926} {"train_loss": -38.00269317626953, "global_step": 233079, "epoch": 1926} {"train_loss": -31.342941284179688, "global_step": 233080, "epoch": 1926} {"train_loss": -37.85745620727539, "global_step": 233081, "epoch": 1926} {"train_loss": -41.045040130615234, "global_step": 233082, "epoch": 1926} {"train_loss": -36.3355712890625, "global_step": 233083, "epoch": 1926} {"train_loss": -38.247039794921875, "global_step": 233084, "epoch": 1926} {"train_loss": -40.1209716796875, "global_step": 233085, "epoch": 1926} {"train_loss": -39.22089767456055, "global_step": 233086, "epoch": 1926} {"train_loss": -40.51861572265625, "global_step": 233087, "epoch": 1926} {"train_loss": -38.99250411987305, "global_step": 233088, "epoch": 1926} {"train_loss": -36.47783279418945, "global_step": 233089, "epoch": 1926} {"train_loss": -39.700103759765625, "global_step": 233090, "epoch": 1926} {"train_loss": -39.29542922973633, "global_step": 233091, "epoch": 1926} {"train_loss": -38.891578674316406, "global_step": 233092, "epoch": 1926} {"train_loss": -40.04372024536133, "global_step": 233093, "epoch": 1926} {"train_loss": -39.94763946533203, "global_step": 233094, "epoch": 1926} {"train_loss": -39.89961242675781, "global_step": 233095, "epoch": 1926} {"train_loss": -40.311275482177734, "global_step": 233096, "epoch": 1926} {"train_loss": -39.53567123413086, "global_step": 233097, "epoch": 1926} {"train_loss": -40.963409423828125, "global_step": 233098, "epoch": 1926} {"train_loss": -39.49552536010742, "global_step": 233099, "epoch": 1926} {"train_loss": -40.02233123779297, "global_step": 233100, "epoch": 1926} {"train_loss": -40.68097686767578, "global_step": 233101, "epoch": 1926} {"train_loss": -41.503841400146484, "global_step": 233102, "epoch": 1926} {"train_loss": -40.635841369628906, "global_step": 233103, "epoch": 1926} {"train_loss": -40.86286544799805, "global_step": 233104, "epoch": 1926} {"train_loss": -40.912288665771484, "global_step": 233105, "epoch": 1926} {"train_loss": -41.437435150146484, "global_step": 233106, "epoch": 1926} {"train_loss": -41.038848876953125, "global_step": 233107, "epoch": 1926} {"train_loss": -41.099220275878906, "global_step": 233108, "epoch": 1926} {"train_loss": -41.58189010620117, "global_step": 233109, "epoch": 1926} {"train_loss": -41.5873908996582, "global_step": 233110, "epoch": 1926} {"train_loss": -41.65747833251953, "global_step": 233111, "epoch": 1926} {"train_loss": -41.41343688964844, "global_step": 233112, "epoch": 1926} {"train_loss": -41.60783004760742, "global_step": 233113, "epoch": 1926} {"train_loss": -41.69500732421875, "global_step": 233114, "epoch": 1926} {"train_loss": -41.30221176147461, "global_step": 233115, "epoch": 1926} {"train_loss": -41.73645782470703, "global_step": 233116, "epoch": 1926} {"train_loss": -41.72929000854492, "global_step": 233117, "epoch": 1926} {"train_loss": -40.752647399902344, "global_step": 233118, "epoch": 1926} {"train_loss": -42.49467086791992, "global_step": 233119, "epoch": 1926} {"train_loss": -41.986549377441406, "global_step": 233120, "epoch": 1926} {"train_loss": -42.13513946533203, "global_step": 233121, "epoch": 1926} {"train_loss": -42.13758087158203, "global_step": 233122, "epoch": 1926} {"train_loss": -42.50545883178711, "global_step": 233123, "epoch": 1926} {"train_loss": -41.724151611328125, "global_step": 233124, "epoch": 1926} {"train_loss": -41.759437561035156, "global_step": 233125, "epoch": 1926} {"train_loss": -42.4073600769043, "global_step": 233126, "epoch": 1926} {"train_loss": -42.33345413208008, "global_step": 233127, "epoch": 1926} {"train_loss": -42.49796676635742, "global_step": 233128, "epoch": 1926} {"train_loss": -42.14775466918945, "global_step": 233129, "epoch": 1926} {"train_loss": -41.983577728271484, "global_step": 233130, "epoch": 1926} {"train_loss": -42.49007797241211, "global_step": 233131, "epoch": 1926} {"train_loss": -42.65336990356445, "global_step": 233132, "epoch": 1926} {"train_loss": -42.43722152709961, "global_step": 233133, "epoch": 1926} {"train_loss": -42.16901397705078, "global_step": 233134, "epoch": 1926} {"train_loss": -42.526363372802734, "global_step": 233135, "epoch": 1926} {"train_loss": -42.864051818847656, "global_step": 233136, "epoch": 1926} {"train_loss": -42.45933151245117, "global_step": 233137, "epoch": 1926} {"train_loss": -42.593177795410156, "global_step": 233138, "epoch": 1926} {"train_loss": -42.747989654541016, "global_step": 233139, "epoch": 1926} {"train_loss": -42.48057174682617, "global_step": 233140, "epoch": 1926} {"train_loss": -42.53167724609375, "global_step": 233141, "epoch": 1926} {"train_loss": -42.91535949707031, "global_step": 233142, "epoch": 1926} {"train_loss": -42.25385665893555, "global_step": 233143, "epoch": 1926} {"train_loss": -42.824462890625, "global_step": 233144, "epoch": 1926} {"train_loss": -42.607852935791016, "global_step": 233145, "epoch": 1926} {"train_loss": -42.63672637939453, "global_step": 233146, "epoch": 1926} {"train_loss": -42.94683837890625, "global_step": 233147, "epoch": 1926} {"train_loss": -42.87017822265625, "global_step": 233148, "epoch": 1926} {"train_loss": -42.95640182495117, "global_step": 233149, "epoch": 1926} {"train_loss": -43.09299850463867, "global_step": 233150, "epoch": 1926} {"train_loss": -42.92210006713867, "global_step": 233151, "epoch": 1926} {"train_loss": -42.708736419677734, "global_step": 233152, "epoch": 1926} {"train_loss": -42.767391204833984, "global_step": 233153, "epoch": 1926} {"train_loss": -42.85734558105469, "global_step": 233154, "epoch": 1926} {"train_loss": -42.69110870361328, "global_step": 233155, "epoch": 1926} {"train_loss": -42.85639190673828, "global_step": 233156, "epoch": 1926} {"train_loss": -42.53889465332031, "global_step": 233157, "epoch": 1926} {"train_loss": -43.40222930908203, "global_step": 233158, "epoch": 1926} {"train_loss": -42.809688568115234, "global_step": 233159, "epoch": 1926} {"train_loss": -43.28986358642578, "global_step": 233160, "epoch": 1926} {"train_loss": -42.36473083496094, "global_step": 233161, "epoch": 1926} {"train_loss": -42.91101837158203, "global_step": 233162, "epoch": 1926} {"train_loss": -43.094581604003906, "global_step": 233163, "epoch": 1926} {"train_loss": -42.76608657836914, "global_step": 233164, "epoch": 1926} {"train_loss": -42.02178955078125, "global_step": 233165, "epoch": 1926} {"train_loss": -41.495490996305605, "global_step": 233166, "epoch": 1926, "val_loss": 2772137.25} {"train_loss": -40.856197357177734, "global_step": 233167, "epoch": 1927} {"train_loss": -42.0787467956543, "global_step": 233168, "epoch": 1927} {"train_loss": -43.60235595703125, "global_step": 233169, "epoch": 1927} {"train_loss": -41.65139389038086, "global_step": 233170, "epoch": 1927} {"train_loss": -42.78413009643555, "global_step": 233171, "epoch": 1927} {"train_loss": -42.58251953125, "global_step": 233172, "epoch": 1927} {"train_loss": -42.142738342285156, "global_step": 233173, "epoch": 1927} {"train_loss": -42.96650314331055, "global_step": 233174, "epoch": 1927} {"train_loss": -41.5604248046875, "global_step": 233175, "epoch": 1927} {"train_loss": -41.25837326049805, "global_step": 233176, "epoch": 1927} {"train_loss": -41.762264251708984, "global_step": 233177, "epoch": 1927} {"train_loss": -40.88814926147461, "global_step": 233178, "epoch": 1927} {"train_loss": -41.78115463256836, "global_step": 233179, "epoch": 1927} {"train_loss": -41.471858978271484, "global_step": 233180, "epoch": 1927} {"train_loss": -41.01161193847656, "global_step": 233181, "epoch": 1927} {"train_loss": -42.10441207885742, "global_step": 233182, "epoch": 1927} {"train_loss": -42.06573486328125, "global_step": 233183, "epoch": 1927} {"train_loss": -41.15972137451172, "global_step": 233184, "epoch": 1927} {"train_loss": -42.60398483276367, "global_step": 233185, "epoch": 1927} {"train_loss": -42.158382415771484, "global_step": 233186, "epoch": 1927} {"train_loss": -41.905738830566406, "global_step": 233187, "epoch": 1927} {"train_loss": -40.91834259033203, "global_step": 233188, "epoch": 1927} {"train_loss": -31.571847915649414, "global_step": 233189, "epoch": 1927} {"train_loss": -37.49250030517578, "global_step": 233190, "epoch": 1927} {"train_loss": -38.21864318847656, "global_step": 233191, "epoch": 1927} {"train_loss": -40.52106857299805, "global_step": 233192, "epoch": 1927} {"train_loss": -41.066314697265625, "global_step": 233193, "epoch": 1927} {"train_loss": -38.606563568115234, "global_step": 233194, "epoch": 1927} {"train_loss": -40.12434005737305, "global_step": 233195, "epoch": 1927} {"train_loss": -40.016815185546875, "global_step": 233196, "epoch": 1927} {"train_loss": -34.02522659301758, "global_step": 233197, "epoch": 1927} {"train_loss": -35.13875961303711, "global_step": 233198, "epoch": 1927} {"train_loss": -12.090510368347168, "global_step": 233199, "epoch": 1927} {"train_loss": -27.228515625, "global_step": 233200, "epoch": 1927} {"train_loss": -34.620216369628906, "global_step": 233201, "epoch": 1927} {"train_loss": -31.1219482421875, "global_step": 233202, "epoch": 1927} {"train_loss": -20.732236862182617, "global_step": 233203, "epoch": 1927} {"train_loss": -36.2702751159668, "global_step": 233204, "epoch": 1927} {"train_loss": -28.069990158081055, "global_step": 233205, "epoch": 1927} {"train_loss": -38.23739242553711, "global_step": 233206, "epoch": 1927} {"train_loss": -30.73653221130371, "global_step": 233207, "epoch": 1927} {"train_loss": -34.47297286987305, "global_step": 233208, "epoch": 1927} {"train_loss": -33.169612884521484, "global_step": 233209, "epoch": 1927} {"train_loss": -36.84804916381836, "global_step": 233210, "epoch": 1927} {"train_loss": -36.627288818359375, "global_step": 233211, "epoch": 1927} {"train_loss": -34.7612419128418, "global_step": 233212, "epoch": 1927} {"train_loss": -32.477020263671875, "global_step": 233213, "epoch": 1927} {"train_loss": -38.218257904052734, "global_step": 233214, "epoch": 1927} {"train_loss": -36.906341552734375, "global_step": 233215, "epoch": 1927} {"train_loss": -36.888309478759766, "global_step": 233216, "epoch": 1927} {"train_loss": -37.776458740234375, "global_step": 233217, "epoch": 1927} {"train_loss": -36.86695098876953, "global_step": 233218, "epoch": 1927} {"train_loss": -39.15619659423828, "global_step": 233219, "epoch": 1927} {"train_loss": -38.740821838378906, "global_step": 233220, "epoch": 1927} {"train_loss": -38.35508728027344, "global_step": 233221, "epoch": 1927} {"train_loss": -39.345096588134766, "global_step": 233222, "epoch": 1927} {"train_loss": -37.80021286010742, "global_step": 233223, "epoch": 1927} {"train_loss": -38.03104019165039, "global_step": 233224, "epoch": 1927} {"train_loss": -39.56474685668945, "global_step": 233225, "epoch": 1927} {"train_loss": -38.03512191772461, "global_step": 233226, "epoch": 1927} {"train_loss": -37.79935836791992, "global_step": 233227, "epoch": 1927} {"train_loss": -37.980709075927734, "global_step": 233228, "epoch": 1927} {"train_loss": -39.2415771484375, "global_step": 233229, "epoch": 1927} {"train_loss": -39.45011520385742, "global_step": 233230, "epoch": 1927} {"train_loss": -39.92797088623047, "global_step": 233231, "epoch": 1927} {"train_loss": -39.789764404296875, "global_step": 233232, "epoch": 1927} {"train_loss": -39.1192741394043, "global_step": 233233, "epoch": 1927} {"train_loss": -39.16436767578125, "global_step": 233234, "epoch": 1927} {"train_loss": -38.60774612426758, "global_step": 233235, "epoch": 1927} {"train_loss": -39.9328727722168, "global_step": 233236, "epoch": 1927} {"train_loss": -38.77799987792969, "global_step": 233237, "epoch": 1927} {"train_loss": -40.17171859741211, "global_step": 233238, "epoch": 1927} {"train_loss": -38.20692825317383, "global_step": 233239, "epoch": 1927} {"train_loss": -39.84012222290039, "global_step": 233240, "epoch": 1927} {"train_loss": -40.174495697021484, "global_step": 233241, "epoch": 1927} {"train_loss": -39.53145980834961, "global_step": 233242, "epoch": 1927} {"train_loss": -37.998470306396484, "global_step": 233243, "epoch": 1927} {"train_loss": -39.04191207885742, "global_step": 233244, "epoch": 1927} {"train_loss": -39.93128204345703, "global_step": 233245, "epoch": 1927} {"train_loss": -40.1578483581543, "global_step": 233246, "epoch": 1927} {"train_loss": -40.77531814575195, "global_step": 233247, "epoch": 1927} {"train_loss": -39.72285461425781, "global_step": 233248, "epoch": 1927} {"train_loss": -40.602169036865234, "global_step": 233249, "epoch": 1927} {"train_loss": -40.24885940551758, "global_step": 233250, "epoch": 1927} {"train_loss": -40.22791290283203, "global_step": 233251, "epoch": 1927} {"train_loss": -40.487972259521484, "global_step": 233252, "epoch": 1927} {"train_loss": -40.16981887817383, "global_step": 233253, "epoch": 1927} {"train_loss": -40.81049728393555, "global_step": 233254, "epoch": 1927} {"train_loss": -40.96809768676758, "global_step": 233255, "epoch": 1927} {"train_loss": -40.429969787597656, "global_step": 233256, "epoch": 1927} {"train_loss": -40.12089920043945, "global_step": 233257, "epoch": 1927} {"train_loss": -40.64406967163086, "global_step": 233258, "epoch": 1927} {"train_loss": -41.01528549194336, "global_step": 233259, "epoch": 1927} {"train_loss": -41.22964096069336, "global_step": 233260, "epoch": 1927} {"train_loss": -40.57357406616211, "global_step": 233261, "epoch": 1927} {"train_loss": -40.898128509521484, "global_step": 233262, "epoch": 1927} {"train_loss": -40.613521575927734, "global_step": 233263, "epoch": 1927} {"train_loss": -40.4207763671875, "global_step": 233264, "epoch": 1927} {"train_loss": -41.46485900878906, "global_step": 233265, "epoch": 1927} {"train_loss": -41.4779052734375, "global_step": 233266, "epoch": 1927} {"train_loss": -40.27541732788086, "global_step": 233267, "epoch": 1927} {"train_loss": -40.96440887451172, "global_step": 233268, "epoch": 1927} {"train_loss": -41.166927337646484, "global_step": 233269, "epoch": 1927} {"train_loss": -41.010379791259766, "global_step": 233270, "epoch": 1927} {"train_loss": -41.1641960144043, "global_step": 233271, "epoch": 1927} {"train_loss": -41.06757354736328, "global_step": 233272, "epoch": 1927} {"train_loss": -41.626220703125, "global_step": 233273, "epoch": 1927} {"train_loss": -41.54438400268555, "global_step": 233274, "epoch": 1927} {"train_loss": -41.40291213989258, "global_step": 233275, "epoch": 1927} {"train_loss": -40.887481689453125, "global_step": 233276, "epoch": 1927} {"train_loss": -41.272132873535156, "global_step": 233277, "epoch": 1927} {"train_loss": -41.62164306640625, "global_step": 233278, "epoch": 1927} {"train_loss": -41.211788177490234, "global_step": 233279, "epoch": 1927} {"train_loss": -40.116024017333984, "global_step": 233280, "epoch": 1927} {"train_loss": -41.408233642578125, "global_step": 233281, "epoch": 1927} {"train_loss": -41.82838821411133, "global_step": 233282, "epoch": 1927} {"train_loss": -41.66532516479492, "global_step": 233283, "epoch": 1927} {"train_loss": -41.79708480834961, "global_step": 233284, "epoch": 1927} {"train_loss": -40.9423942565918, "global_step": 233285, "epoch": 1927} {"train_loss": -41.948394775390625, "global_step": 233286, "epoch": 1927} {"train_loss": -39.05300152203268, "global_step": 233287, "epoch": 1927, "val_loss": 2665815.75} {"train_loss": -41.89993667602539, "global_step": 233288, "epoch": 1928} {"train_loss": -41.830650329589844, "global_step": 233289, "epoch": 1928} {"train_loss": -41.21585464477539, "global_step": 233290, "epoch": 1928} {"train_loss": -41.89627456665039, "global_step": 233291, "epoch": 1928} {"train_loss": -41.38724899291992, "global_step": 233292, "epoch": 1928} {"train_loss": -41.54343795776367, "global_step": 233293, "epoch": 1928} {"train_loss": -42.33071517944336, "global_step": 233294, "epoch": 1928} {"train_loss": -41.80495834350586, "global_step": 233295, "epoch": 1928} {"train_loss": -41.992645263671875, "global_step": 233296, "epoch": 1928} {"train_loss": -42.12661361694336, "global_step": 233297, "epoch": 1928} {"train_loss": -42.113983154296875, "global_step": 233298, "epoch": 1928} {"train_loss": -42.049720764160156, "global_step": 233299, "epoch": 1928} {"train_loss": -42.29522705078125, "global_step": 233300, "epoch": 1928} {"train_loss": -42.600765228271484, "global_step": 233301, "epoch": 1928} {"train_loss": -41.7379035949707, "global_step": 233302, "epoch": 1928} {"train_loss": -42.21198654174805, "global_step": 233303, "epoch": 1928} {"train_loss": -41.78169631958008, "global_step": 233304, "epoch": 1928} {"train_loss": -42.35113525390625, "global_step": 233305, "epoch": 1928} {"train_loss": -41.89385223388672, "global_step": 233306, "epoch": 1928} {"train_loss": -41.72592544555664, "global_step": 233307, "epoch": 1928} {"train_loss": -42.1572380065918, "global_step": 233308, "epoch": 1928} {"train_loss": -41.472164154052734, "global_step": 233309, "epoch": 1928} {"train_loss": -42.2199592590332, "global_step": 233310, "epoch": 1928} {"train_loss": -41.4764289855957, "global_step": 233311, "epoch": 1928} {"train_loss": -42.59187698364258, "global_step": 233312, "epoch": 1928} {"train_loss": -41.864540100097656, "global_step": 233313, "epoch": 1928} {"train_loss": -42.89599609375, "global_step": 233314, "epoch": 1928} {"train_loss": -42.36383819580078, "global_step": 233315, "epoch": 1928} {"train_loss": -42.481422424316406, "global_step": 233316, "epoch": 1928} {"train_loss": -42.791500091552734, "global_step": 233317, "epoch": 1928} {"train_loss": -41.2828483581543, "global_step": 233318, "epoch": 1928} {"train_loss": -41.93282699584961, "global_step": 233319, "epoch": 1928} {"train_loss": -42.24631881713867, "global_step": 233320, "epoch": 1928} {"train_loss": -41.963050842285156, "global_step": 233321, "epoch": 1928} {"train_loss": -42.56881332397461, "global_step": 233322, "epoch": 1928} {"train_loss": -42.17729949951172, "global_step": 233323, "epoch": 1928} {"train_loss": -42.53566360473633, "global_step": 233324, "epoch": 1928} {"train_loss": -43.08179473876953, "global_step": 233325, "epoch": 1928} {"train_loss": -42.2083740234375, "global_step": 233326, "epoch": 1928} {"train_loss": -42.199703216552734, "global_step": 233327, "epoch": 1928} {"train_loss": -41.80579376220703, "global_step": 233328, "epoch": 1928} {"train_loss": -41.77032470703125, "global_step": 233329, "epoch": 1928} {"train_loss": -42.7442626953125, "global_step": 233330, "epoch": 1928} {"train_loss": -42.73491668701172, "global_step": 233331, "epoch": 1928} {"train_loss": -42.4106559753418, "global_step": 233332, "epoch": 1928} {"train_loss": -43.05859375, "global_step": 233333, "epoch": 1928} {"train_loss": -42.775543212890625, "global_step": 233334, "epoch": 1928} {"train_loss": -42.64613723754883, "global_step": 233335, "epoch": 1928} {"train_loss": -41.93992233276367, "global_step": 233336, "epoch": 1928} {"train_loss": -41.47001647949219, "global_step": 233337, "epoch": 1928} {"train_loss": -41.033599853515625, "global_step": 233338, "epoch": 1928} {"train_loss": -39.887752532958984, "global_step": 233339, "epoch": 1928} {"train_loss": -38.379207611083984, "global_step": 233340, "epoch": 1928} {"train_loss": -38.69977951049805, "global_step": 233341, "epoch": 1928} {"train_loss": -42.01759719848633, "global_step": 233342, "epoch": 1928} {"train_loss": -42.41512680053711, "global_step": 233343, "epoch": 1928} {"train_loss": -40.28663635253906, "global_step": 233344, "epoch": 1928} {"train_loss": -40.20306396484375, "global_step": 233345, "epoch": 1928} {"train_loss": -39.857276916503906, "global_step": 233346, "epoch": 1928} {"train_loss": -41.658565521240234, "global_step": 233347, "epoch": 1928} {"train_loss": -41.54838943481445, "global_step": 233348, "epoch": 1928} {"train_loss": -42.09614944458008, "global_step": 233349, "epoch": 1928} {"train_loss": -39.994667053222656, "global_step": 233350, "epoch": 1928} {"train_loss": -41.72566604614258, "global_step": 233351, "epoch": 1928} {"train_loss": -41.17548751831055, "global_step": 233352, "epoch": 1928} {"train_loss": -39.701229095458984, "global_step": 233353, "epoch": 1928} {"train_loss": -37.891021728515625, "global_step": 233354, "epoch": 1928} {"train_loss": -40.743011474609375, "global_step": 233355, "epoch": 1928} {"train_loss": -41.632869720458984, "global_step": 233356, "epoch": 1928} {"train_loss": -40.00366973876953, "global_step": 233357, "epoch": 1928} {"train_loss": -40.50872039794922, "global_step": 233358, "epoch": 1928} {"train_loss": -39.97669982910156, "global_step": 233359, "epoch": 1928} {"train_loss": -38.883453369140625, "global_step": 233360, "epoch": 1928} {"train_loss": -41.780189514160156, "global_step": 233361, "epoch": 1928} {"train_loss": -40.66917037963867, "global_step": 233362, "epoch": 1928} {"train_loss": -41.47690963745117, "global_step": 233363, "epoch": 1928} {"train_loss": -40.40482711791992, "global_step": 233364, "epoch": 1928} {"train_loss": -41.823822021484375, "global_step": 233365, "epoch": 1928} {"train_loss": -41.52248001098633, "global_step": 233366, "epoch": 1928} {"train_loss": -41.65006637573242, "global_step": 233367, "epoch": 1928} {"train_loss": -40.370941162109375, "global_step": 233368, "epoch": 1928} {"train_loss": -42.1673583984375, "global_step": 233369, "epoch": 1928} {"train_loss": -40.009578704833984, "global_step": 233370, "epoch": 1928} {"train_loss": -42.33824157714844, "global_step": 233371, "epoch": 1928} {"train_loss": -40.27813720703125, "global_step": 233372, "epoch": 1928} {"train_loss": -42.22541809082031, "global_step": 233373, "epoch": 1928} {"train_loss": -40.41217803955078, "global_step": 233374, "epoch": 1928} {"train_loss": -40.79555130004883, "global_step": 233375, "epoch": 1928} {"train_loss": -40.983253479003906, "global_step": 233376, "epoch": 1928} {"train_loss": -41.972434997558594, "global_step": 233377, "epoch": 1928} {"train_loss": -41.88581848144531, "global_step": 233378, "epoch": 1928} {"train_loss": -41.82761764526367, "global_step": 233379, "epoch": 1928} {"train_loss": -42.20389175415039, "global_step": 233380, "epoch": 1928} {"train_loss": -42.49503707885742, "global_step": 233381, "epoch": 1928} {"train_loss": -41.65675354003906, "global_step": 233382, "epoch": 1928} {"train_loss": -41.1248779296875, "global_step": 233383, "epoch": 1928} {"train_loss": -42.37310028076172, "global_step": 233384, "epoch": 1928} {"train_loss": -41.84282302856445, "global_step": 233385, "epoch": 1928} {"train_loss": -41.27912902832031, "global_step": 233386, "epoch": 1928} {"train_loss": -42.299068450927734, "global_step": 233387, "epoch": 1928} {"train_loss": -42.65351104736328, "global_step": 233388, "epoch": 1928} {"train_loss": -42.042388916015625, "global_step": 233389, "epoch": 1928} {"train_loss": -42.42440414428711, "global_step": 233390, "epoch": 1928} {"train_loss": -42.200191497802734, "global_step": 233391, "epoch": 1928} {"train_loss": -40.63359451293945, "global_step": 233392, "epoch": 1928} {"train_loss": -41.32191848754883, "global_step": 233393, "epoch": 1928} {"train_loss": -41.71685791015625, "global_step": 233394, "epoch": 1928} {"train_loss": -41.269683837890625, "global_step": 233395, "epoch": 1928} {"train_loss": -41.80033493041992, "global_step": 233396, "epoch": 1928} {"train_loss": -41.76643371582031, "global_step": 233397, "epoch": 1928} {"train_loss": -41.274784088134766, "global_step": 233398, "epoch": 1928} {"train_loss": -40.75457763671875, "global_step": 233399, "epoch": 1928} {"train_loss": -42.279823303222656, "global_step": 233400, "epoch": 1928} {"train_loss": -41.82465744018555, "global_step": 233401, "epoch": 1928} {"train_loss": -41.725250244140625, "global_step": 233402, "epoch": 1928} {"train_loss": -40.83306121826172, "global_step": 233403, "epoch": 1928} {"train_loss": -41.953033447265625, "global_step": 233404, "epoch": 1928} {"train_loss": -40.151695251464844, "global_step": 233405, "epoch": 1928} {"train_loss": -39.854461669921875, "global_step": 233406, "epoch": 1928} {"train_loss": -40.13204574584961, "global_step": 233407, "epoch": 1928} {"train_loss": -41.550623081932386, "global_step": 233408, "epoch": 1928, "val_loss": 2733107.25} {"train_loss": -40.87681198120117, "global_step": 233409, "epoch": 1929} {"train_loss": -41.9616584777832, "global_step": 233410, "epoch": 1929} {"train_loss": -41.26775360107422, "global_step": 233411, "epoch": 1929} {"train_loss": -41.66292190551758, "global_step": 233412, "epoch": 1929} {"train_loss": -42.2744140625, "global_step": 233413, "epoch": 1929} {"train_loss": -42.18415069580078, "global_step": 233414, "epoch": 1929} {"train_loss": -42.19503402709961, "global_step": 233415, "epoch": 1929} {"train_loss": -42.27897262573242, "global_step": 233416, "epoch": 1929} {"train_loss": -41.85017395019531, "global_step": 233417, "epoch": 1929} {"train_loss": -41.978004455566406, "global_step": 233418, "epoch": 1929} {"train_loss": -41.69066619873047, "global_step": 233419, "epoch": 1929} {"train_loss": -41.778663635253906, "global_step": 233420, "epoch": 1929} {"train_loss": -41.296905517578125, "global_step": 233421, "epoch": 1929} {"train_loss": -42.50457000732422, "global_step": 233422, "epoch": 1929} {"train_loss": -41.15353012084961, "global_step": 233423, "epoch": 1929} {"train_loss": -42.636592864990234, "global_step": 233424, "epoch": 1929} {"train_loss": -42.368804931640625, "global_step": 233425, "epoch": 1929} {"train_loss": -41.44801712036133, "global_step": 233426, "epoch": 1929} {"train_loss": -41.63185501098633, "global_step": 233427, "epoch": 1929} {"train_loss": -42.04597091674805, "global_step": 233428, "epoch": 1929} {"train_loss": -42.050575256347656, "global_step": 233429, "epoch": 1929} {"train_loss": -41.52392578125, "global_step": 233430, "epoch": 1929} {"train_loss": -41.15830612182617, "global_step": 233431, "epoch": 1929} {"train_loss": -41.22783279418945, "global_step": 233432, "epoch": 1929} {"train_loss": -41.737300872802734, "global_step": 233433, "epoch": 1929} {"train_loss": -41.633174896240234, "global_step": 233434, "epoch": 1929} {"train_loss": -42.16825866699219, "global_step": 233435, "epoch": 1929} {"train_loss": -41.59058380126953, "global_step": 233436, "epoch": 1929} {"train_loss": -42.93815231323242, "global_step": 233437, "epoch": 1929} {"train_loss": -41.75974655151367, "global_step": 233438, "epoch": 1929} {"train_loss": -42.57686233520508, "global_step": 233439, "epoch": 1929} {"train_loss": -42.35614013671875, "global_step": 233440, "epoch": 1929} {"train_loss": -42.47549819946289, "global_step": 233441, "epoch": 1929} {"train_loss": -42.25894546508789, "global_step": 233442, "epoch": 1929} {"train_loss": -42.88604736328125, "global_step": 233443, "epoch": 1929} {"train_loss": -42.379615783691406, "global_step": 233444, "epoch": 1929} {"train_loss": -42.18368148803711, "global_step": 233445, "epoch": 1929} {"train_loss": -42.6499137878418, "global_step": 233446, "epoch": 1929} {"train_loss": -41.40740966796875, "global_step": 233447, "epoch": 1929} {"train_loss": -41.79021453857422, "global_step": 233448, "epoch": 1929} {"train_loss": -41.50029373168945, "global_step": 233449, "epoch": 1929} {"train_loss": -42.12424850463867, "global_step": 233450, "epoch": 1929} {"train_loss": -41.390541076660156, "global_step": 233451, "epoch": 1929} {"train_loss": -41.7319450378418, "global_step": 233452, "epoch": 1929} {"train_loss": -42.56527328491211, "global_step": 233453, "epoch": 1929} {"train_loss": -41.79478073120117, "global_step": 233454, "epoch": 1929} {"train_loss": -42.37587356567383, "global_step": 233455, "epoch": 1929} {"train_loss": -42.641212463378906, "global_step": 233456, "epoch": 1929} {"train_loss": -42.785125732421875, "global_step": 233457, "epoch": 1929} {"train_loss": -41.67976760864258, "global_step": 233458, "epoch": 1929} {"train_loss": -41.1180305480957, "global_step": 233459, "epoch": 1929} {"train_loss": -39.92841720581055, "global_step": 233460, "epoch": 1929} {"train_loss": -40.65790557861328, "global_step": 233461, "epoch": 1929} {"train_loss": -41.63343811035156, "global_step": 233462, "epoch": 1929} {"train_loss": -42.578834533691406, "global_step": 233463, "epoch": 1929} {"train_loss": -41.89238357543945, "global_step": 233464, "epoch": 1929} {"train_loss": -41.94853973388672, "global_step": 233465, "epoch": 1929} {"train_loss": -42.848594665527344, "global_step": 233466, "epoch": 1929} {"train_loss": -43.159095764160156, "global_step": 233467, "epoch": 1929} {"train_loss": -42.369667053222656, "global_step": 233468, "epoch": 1929} {"train_loss": -41.50732421875, "global_step": 233469, "epoch": 1929} {"train_loss": -42.32019805908203, "global_step": 233470, "epoch": 1929} {"train_loss": -42.739906311035156, "global_step": 233471, "epoch": 1929} {"train_loss": -42.230552673339844, "global_step": 233472, "epoch": 1929} {"train_loss": -41.75178146362305, "global_step": 233473, "epoch": 1929} {"train_loss": -40.119876861572266, "global_step": 233474, "epoch": 1929} {"train_loss": -41.26045608520508, "global_step": 233475, "epoch": 1929} {"train_loss": -41.75221252441406, "global_step": 233476, "epoch": 1929} {"train_loss": -40.21455001831055, "global_step": 233477, "epoch": 1929} {"train_loss": -39.57504653930664, "global_step": 233478, "epoch": 1929} {"train_loss": -39.38234329223633, "global_step": 233479, "epoch": 1929} {"train_loss": -42.42037582397461, "global_step": 233480, "epoch": 1929} {"train_loss": -40.715660095214844, "global_step": 233481, "epoch": 1929} {"train_loss": -39.52912139892578, "global_step": 233482, "epoch": 1929} {"train_loss": -41.15645217895508, "global_step": 233483, "epoch": 1929} {"train_loss": -41.24508285522461, "global_step": 233484, "epoch": 1929} {"train_loss": -36.930171966552734, "global_step": 233485, "epoch": 1929} {"train_loss": -41.48594284057617, "global_step": 233486, "epoch": 1929} {"train_loss": -41.378604888916016, "global_step": 233487, "epoch": 1929} {"train_loss": -40.31834411621094, "global_step": 233488, "epoch": 1929} {"train_loss": -41.12186813354492, "global_step": 233489, "epoch": 1929} {"train_loss": -42.555606842041016, "global_step": 233490, "epoch": 1929} {"train_loss": -41.85551071166992, "global_step": 233491, "epoch": 1929} {"train_loss": -41.9619140625, "global_step": 233492, "epoch": 1929} {"train_loss": -41.64085006713867, "global_step": 233493, "epoch": 1929} {"train_loss": -42.469905853271484, "global_step": 233494, "epoch": 1929} {"train_loss": -42.120723724365234, "global_step": 233495, "epoch": 1929} {"train_loss": -41.59601974487305, "global_step": 233496, "epoch": 1929} {"train_loss": -42.45232009887695, "global_step": 233497, "epoch": 1929} {"train_loss": -41.89931106567383, "global_step": 233498, "epoch": 1929} {"train_loss": -41.83736801147461, "global_step": 233499, "epoch": 1929} {"train_loss": -42.344642639160156, "global_step": 233500, "epoch": 1929} {"train_loss": -42.13216781616211, "global_step": 233501, "epoch": 1929} {"train_loss": -41.299468994140625, "global_step": 233502, "epoch": 1929} {"train_loss": -42.38714599609375, "global_step": 233503, "epoch": 1929} {"train_loss": -42.16352462768555, "global_step": 233504, "epoch": 1929} {"train_loss": -42.518272399902344, "global_step": 233505, "epoch": 1929} {"train_loss": -42.67619705200195, "global_step": 233506, "epoch": 1929} {"train_loss": -41.67652130126953, "global_step": 233507, "epoch": 1929} {"train_loss": -42.22309875488281, "global_step": 233508, "epoch": 1929} {"train_loss": -42.17190933227539, "global_step": 233509, "epoch": 1929} {"train_loss": -42.54658126831055, "global_step": 233510, "epoch": 1929} {"train_loss": -42.3540153503418, "global_step": 233511, "epoch": 1929} {"train_loss": -42.7193489074707, "global_step": 233512, "epoch": 1929} {"train_loss": -42.799171447753906, "global_step": 233513, "epoch": 1929} {"train_loss": -42.295406341552734, "global_step": 233514, "epoch": 1929} {"train_loss": -42.53257369995117, "global_step": 233515, "epoch": 1929} {"train_loss": -43.13232421875, "global_step": 233516, "epoch": 1929} {"train_loss": -42.32354736328125, "global_step": 233517, "epoch": 1929} {"train_loss": -42.557918548583984, "global_step": 233518, "epoch": 1929} {"train_loss": -43.254695892333984, "global_step": 233519, "epoch": 1929} {"train_loss": -42.727027893066406, "global_step": 233520, "epoch": 1929} {"train_loss": -42.759639739990234, "global_step": 233521, "epoch": 1929} {"train_loss": -42.80535125732422, "global_step": 233522, "epoch": 1929} {"train_loss": -42.600677490234375, "global_step": 233523, "epoch": 1929} {"train_loss": -42.930110931396484, "global_step": 233524, "epoch": 1929} {"train_loss": -43.3358039855957, "global_step": 233525, "epoch": 1929} {"train_loss": -43.33137893676758, "global_step": 233526, "epoch": 1929} {"train_loss": -43.46159744262695, "global_step": 233527, "epoch": 1929} {"train_loss": -43.038902282714844, "global_step": 233528, "epoch": 1929} {"train_loss": -41.930747670575606, "global_step": 233529, "epoch": 1929, "val_loss": 2736980.5} {"train_loss": -43.069068908691406, "global_step": 233530, "epoch": 1930} {"train_loss": -43.002662658691406, "global_step": 233531, "epoch": 1930} {"train_loss": -42.240638732910156, "global_step": 233532, "epoch": 1930} {"train_loss": -42.52302932739258, "global_step": 233533, "epoch": 1930} {"train_loss": -42.87617111206055, "global_step": 233534, "epoch": 1930} {"train_loss": -42.43007278442383, "global_step": 233535, "epoch": 1930} {"train_loss": -42.13869857788086, "global_step": 233536, "epoch": 1930} {"train_loss": -42.59251022338867, "global_step": 233537, "epoch": 1930} {"train_loss": -42.39744567871094, "global_step": 233538, "epoch": 1930} {"train_loss": -42.349212646484375, "global_step": 233539, "epoch": 1930} {"train_loss": -42.400917053222656, "global_step": 233540, "epoch": 1930} {"train_loss": -42.551673889160156, "global_step": 233541, "epoch": 1930} {"train_loss": -42.08847427368164, "global_step": 233542, "epoch": 1930} {"train_loss": -41.67288589477539, "global_step": 233543, "epoch": 1930} {"train_loss": -42.6281623840332, "global_step": 233544, "epoch": 1930} {"train_loss": -42.46686935424805, "global_step": 233545, "epoch": 1930} {"train_loss": -41.65580749511719, "global_step": 233546, "epoch": 1930} {"train_loss": -42.19547653198242, "global_step": 233547, "epoch": 1930} {"train_loss": -42.505271911621094, "global_step": 233548, "epoch": 1930} {"train_loss": -42.050594329833984, "global_step": 233549, "epoch": 1930} {"train_loss": -41.764617919921875, "global_step": 233550, "epoch": 1930} {"train_loss": -41.94485855102539, "global_step": 233551, "epoch": 1930} {"train_loss": -41.478981018066406, "global_step": 233552, "epoch": 1930} {"train_loss": -40.773338317871094, "global_step": 233553, "epoch": 1930} {"train_loss": -40.52688217163086, "global_step": 233554, "epoch": 1930} {"train_loss": -37.812103271484375, "global_step": 233555, "epoch": 1930} {"train_loss": -34.804901123046875, "global_step": 233556, "epoch": 1930} {"train_loss": -38.043975830078125, "global_step": 233557, "epoch": 1930} {"train_loss": -36.54340744018555, "global_step": 233558, "epoch": 1930} {"train_loss": -29.69534683227539, "global_step": 233559, "epoch": 1930} {"train_loss": -36.17987823486328, "global_step": 233560, "epoch": 1930} {"train_loss": -35.604576110839844, "global_step": 233561, "epoch": 1930} {"train_loss": -28.76356315612793, "global_step": 233562, "epoch": 1930} {"train_loss": -31.838565826416016, "global_step": 233563, "epoch": 1930} {"train_loss": -34.56987380981445, "global_step": 233564, "epoch": 1930} {"train_loss": -31.473526000976562, "global_step": 233565, "epoch": 1930} {"train_loss": -37.6602668762207, "global_step": 233566, "epoch": 1930} {"train_loss": -33.88229751586914, "global_step": 233567, "epoch": 1930} {"train_loss": -38.79920196533203, "global_step": 233568, "epoch": 1930} {"train_loss": -32.987789154052734, "global_step": 233569, "epoch": 1930} {"train_loss": -39.83487319946289, "global_step": 233570, "epoch": 1930} {"train_loss": -36.46116638183594, "global_step": 233571, "epoch": 1930} {"train_loss": -39.40920639038086, "global_step": 233572, "epoch": 1930} {"train_loss": -36.269073486328125, "global_step": 233573, "epoch": 1930} {"train_loss": -39.1859016418457, "global_step": 233574, "epoch": 1930} {"train_loss": -36.464778900146484, "global_step": 233575, "epoch": 1930} {"train_loss": -39.717384338378906, "global_step": 233576, "epoch": 1930} {"train_loss": -35.28815460205078, "global_step": 233577, "epoch": 1930} {"train_loss": -40.451873779296875, "global_step": 233578, "epoch": 1930} {"train_loss": -37.14129638671875, "global_step": 233579, "epoch": 1930} {"train_loss": -40.20809555053711, "global_step": 233580, "epoch": 1930} {"train_loss": -39.46354293823242, "global_step": 233581, "epoch": 1930} {"train_loss": -40.18682861328125, "global_step": 233582, "epoch": 1930} {"train_loss": -40.24638366699219, "global_step": 233583, "epoch": 1930} {"train_loss": -40.270301818847656, "global_step": 233584, "epoch": 1930} {"train_loss": -40.5160026550293, "global_step": 233585, "epoch": 1930} {"train_loss": -40.79671096801758, "global_step": 233586, "epoch": 1930} {"train_loss": -40.25409698486328, "global_step": 233587, "epoch": 1930} {"train_loss": -40.27398681640625, "global_step": 233588, "epoch": 1930} {"train_loss": -40.3786735534668, "global_step": 233589, "epoch": 1930} {"train_loss": -40.89863204956055, "global_step": 233590, "epoch": 1930} {"train_loss": -41.020164489746094, "global_step": 233591, "epoch": 1930} {"train_loss": -40.512847900390625, "global_step": 233592, "epoch": 1930} {"train_loss": -40.6703987121582, "global_step": 233593, "epoch": 1930} {"train_loss": -41.071388244628906, "global_step": 233594, "epoch": 1930} {"train_loss": -41.11730194091797, "global_step": 233595, "epoch": 1930} {"train_loss": -41.04262161254883, "global_step": 233596, "epoch": 1930} {"train_loss": -41.261390686035156, "global_step": 233597, "epoch": 1930} {"train_loss": -41.32794952392578, "global_step": 233598, "epoch": 1930} {"train_loss": -41.18090057373047, "global_step": 233599, "epoch": 1930} {"train_loss": -41.53371047973633, "global_step": 233600, "epoch": 1930} {"train_loss": -41.59051513671875, "global_step": 233601, "epoch": 1930} {"train_loss": -41.57267761230469, "global_step": 233602, "epoch": 1930} {"train_loss": -41.330718994140625, "global_step": 233603, "epoch": 1930} {"train_loss": -42.1741828918457, "global_step": 233604, "epoch": 1930} {"train_loss": -41.59368133544922, "global_step": 233605, "epoch": 1930} {"train_loss": -41.64766311645508, "global_step": 233606, "epoch": 1930} {"train_loss": -41.123355865478516, "global_step": 233607, "epoch": 1930} {"train_loss": -42.02530288696289, "global_step": 233608, "epoch": 1930} {"train_loss": -41.38751983642578, "global_step": 233609, "epoch": 1930} {"train_loss": -41.995418548583984, "global_step": 233610, "epoch": 1930} {"train_loss": -41.72431182861328, "global_step": 233611, "epoch": 1930} {"train_loss": -41.79174041748047, "global_step": 233612, "epoch": 1930} {"train_loss": -41.241329193115234, "global_step": 233613, "epoch": 1930} {"train_loss": -41.72039031982422, "global_step": 233614, "epoch": 1930} {"train_loss": -42.04169845581055, "global_step": 233615, "epoch": 1930} {"train_loss": -42.16689682006836, "global_step": 233616, "epoch": 1930} {"train_loss": -42.37797927856445, "global_step": 233617, "epoch": 1930} {"train_loss": -41.87955093383789, "global_step": 233618, "epoch": 1930} {"train_loss": -41.98628616333008, "global_step": 233619, "epoch": 1930} {"train_loss": -42.006256103515625, "global_step": 233620, "epoch": 1930} {"train_loss": -42.4129638671875, "global_step": 233621, "epoch": 1930} {"train_loss": -42.75585174560547, "global_step": 233622, "epoch": 1930} {"train_loss": -42.11912155151367, "global_step": 233623, "epoch": 1930} {"train_loss": -41.74872970581055, "global_step": 233624, "epoch": 1930} {"train_loss": -42.61586380004883, "global_step": 233625, "epoch": 1930} {"train_loss": -42.13663864135742, "global_step": 233626, "epoch": 1930} {"train_loss": -42.380775451660156, "global_step": 233627, "epoch": 1930} {"train_loss": -42.8458251953125, "global_step": 233628, "epoch": 1930} {"train_loss": -42.639129638671875, "global_step": 233629, "epoch": 1930} {"train_loss": -42.57819747924805, "global_step": 233630, "epoch": 1930} {"train_loss": -42.63983917236328, "global_step": 233631, "epoch": 1930} {"train_loss": -42.55353546142578, "global_step": 233632, "epoch": 1930} {"train_loss": -42.41719436645508, "global_step": 233633, "epoch": 1930} {"train_loss": -42.617801666259766, "global_step": 233634, "epoch": 1930} {"train_loss": -42.34677505493164, "global_step": 233635, "epoch": 1930} {"train_loss": -42.02305221557617, "global_step": 233636, "epoch": 1930} {"train_loss": -42.55596923828125, "global_step": 233637, "epoch": 1930} {"train_loss": -42.44169616699219, "global_step": 233638, "epoch": 1930} {"train_loss": -42.6148567199707, "global_step": 233639, "epoch": 1930} {"train_loss": -42.401878356933594, "global_step": 233640, "epoch": 1930} {"train_loss": -43.24866485595703, "global_step": 233641, "epoch": 1930} {"train_loss": -42.68956756591797, "global_step": 233642, "epoch": 1930} {"train_loss": -42.52413558959961, "global_step": 233643, "epoch": 1930} {"train_loss": -42.95878219604492, "global_step": 233644, "epoch": 1930} {"train_loss": -43.3231315612793, "global_step": 233645, "epoch": 1930} {"train_loss": -42.64004135131836, "global_step": 233646, "epoch": 1930} {"train_loss": -42.84821701049805, "global_step": 233647, "epoch": 1930} {"train_loss": -42.65660858154297, "global_step": 233648, "epoch": 1930} {"train_loss": -43.785369873046875, "global_step": 233649, "epoch": 1930} {"train_loss": -40.67233552223395, "global_step": 233650, "epoch": 1930, "val_loss": 2727211.25} {"train_loss": -43.05869674682617, "global_step": 233651, "epoch": 1931} {"train_loss": -42.798980712890625, "global_step": 233652, "epoch": 1931} {"train_loss": -43.114376068115234, "global_step": 233653, "epoch": 1931} {"train_loss": -42.981117248535156, "global_step": 233654, "epoch": 1931} {"train_loss": -43.27157211303711, "global_step": 233655, "epoch": 1931} {"train_loss": -42.976348876953125, "global_step": 233656, "epoch": 1931} {"train_loss": -43.11016082763672, "global_step": 233657, "epoch": 1931} {"train_loss": -41.60242462158203, "global_step": 233658, "epoch": 1931} {"train_loss": -43.26810836791992, "global_step": 233659, "epoch": 1931} {"train_loss": -42.3325080871582, "global_step": 233660, "epoch": 1931} {"train_loss": -42.26357650756836, "global_step": 233661, "epoch": 1931} {"train_loss": -42.290061950683594, "global_step": 233662, "epoch": 1931} {"train_loss": -39.022945404052734, "global_step": 233663, "epoch": 1931} {"train_loss": -36.152645111083984, "global_step": 233664, "epoch": 1931} {"train_loss": -22.986736297607422, "global_step": 233665, "epoch": 1931} {"train_loss": -19.162460327148438, "global_step": 233666, "epoch": 1931} {"train_loss": -31.96109390258789, "global_step": 233667, "epoch": 1931} {"train_loss": -40.496131896972656, "global_step": 233668, "epoch": 1931} {"train_loss": -30.575149536132812, "global_step": 233669, "epoch": 1931} {"train_loss": -35.28571701049805, "global_step": 233670, "epoch": 1931} {"train_loss": -38.8596305847168, "global_step": 233671, "epoch": 1931} {"train_loss": -29.290021896362305, "global_step": 233672, "epoch": 1931} {"train_loss": -40.47272491455078, "global_step": 233673, "epoch": 1931} {"train_loss": -32.227996826171875, "global_step": 233674, "epoch": 1931} {"train_loss": -40.639095306396484, "global_step": 233675, "epoch": 1931} {"train_loss": -33.5888786315918, "global_step": 233676, "epoch": 1931} {"train_loss": -40.53948974609375, "global_step": 233677, "epoch": 1931} {"train_loss": -36.13932418823242, "global_step": 233678, "epoch": 1931} {"train_loss": -40.39371871948242, "global_step": 233679, "epoch": 1931} {"train_loss": -36.15022659301758, "global_step": 233680, "epoch": 1931} {"train_loss": -40.73861312866211, "global_step": 233681, "epoch": 1931} {"train_loss": -38.68068313598633, "global_step": 233682, "epoch": 1931} {"train_loss": -41.171348571777344, "global_step": 233683, "epoch": 1931} {"train_loss": -39.519100189208984, "global_step": 233684, "epoch": 1931} {"train_loss": -39.97856521606445, "global_step": 233685, "epoch": 1931} {"train_loss": -40.81903076171875, "global_step": 233686, "epoch": 1931} {"train_loss": -40.07441329956055, "global_step": 233687, "epoch": 1931} {"train_loss": -41.42885971069336, "global_step": 233688, "epoch": 1931} {"train_loss": -40.293983459472656, "global_step": 233689, "epoch": 1931} {"train_loss": -40.41312789916992, "global_step": 233690, "epoch": 1931} {"train_loss": -41.77241134643555, "global_step": 233691, "epoch": 1931} {"train_loss": -40.28791427612305, "global_step": 233692, "epoch": 1931} {"train_loss": -41.69009017944336, "global_step": 233693, "epoch": 1931} {"train_loss": -41.089210510253906, "global_step": 233694, "epoch": 1931} {"train_loss": -41.220211029052734, "global_step": 233695, "epoch": 1931} {"train_loss": -42.05723190307617, "global_step": 233696, "epoch": 1931} {"train_loss": -41.31782150268555, "global_step": 233697, "epoch": 1931} {"train_loss": -41.88053512573242, "global_step": 233698, "epoch": 1931} {"train_loss": -41.88845443725586, "global_step": 233699, "epoch": 1931} {"train_loss": -41.37764358520508, "global_step": 233700, "epoch": 1931} {"train_loss": -41.76190948486328, "global_step": 233701, "epoch": 1931} {"train_loss": -41.50129318237305, "global_step": 233702, "epoch": 1931} {"train_loss": -42.29048538208008, "global_step": 233703, "epoch": 1931} {"train_loss": -41.86967849731445, "global_step": 233704, "epoch": 1931} {"train_loss": -41.42749786376953, "global_step": 233705, "epoch": 1931} {"train_loss": -42.45562744140625, "global_step": 233706, "epoch": 1931} {"train_loss": -41.812435150146484, "global_step": 233707, "epoch": 1931} {"train_loss": -42.183921813964844, "global_step": 233708, "epoch": 1931} {"train_loss": -42.392799377441406, "global_step": 233709, "epoch": 1931} {"train_loss": -41.71393966674805, "global_step": 233710, "epoch": 1931} {"train_loss": -42.176849365234375, "global_step": 233711, "epoch": 1931} {"train_loss": -42.148948669433594, "global_step": 233712, "epoch": 1931} {"train_loss": -41.77457809448242, "global_step": 233713, "epoch": 1931} {"train_loss": -42.46949768066406, "global_step": 233714, "epoch": 1931} {"train_loss": -42.30049514770508, "global_step": 233715, "epoch": 1931} {"train_loss": -42.59724807739258, "global_step": 233716, "epoch": 1931} {"train_loss": -42.653934478759766, "global_step": 233717, "epoch": 1931} {"train_loss": -42.60918045043945, "global_step": 233718, "epoch": 1931} {"train_loss": -42.9527473449707, "global_step": 233719, "epoch": 1931} {"train_loss": -42.708011627197266, "global_step": 233720, "epoch": 1931} {"train_loss": -42.872249603271484, "global_step": 233721, "epoch": 1931} {"train_loss": -42.497257232666016, "global_step": 233722, "epoch": 1931} {"train_loss": -43.09566879272461, "global_step": 233723, "epoch": 1931} {"train_loss": -42.400875091552734, "global_step": 233724, "epoch": 1931} {"train_loss": -43.19629669189453, "global_step": 233725, "epoch": 1931} {"train_loss": -42.57150650024414, "global_step": 233726, "epoch": 1931} {"train_loss": -42.57451248168945, "global_step": 233727, "epoch": 1931} {"train_loss": -42.92806625366211, "global_step": 233728, "epoch": 1931} {"train_loss": -43.1719970703125, "global_step": 233729, "epoch": 1931} {"train_loss": -42.68490219116211, "global_step": 233730, "epoch": 1931} {"train_loss": -43.23088455200195, "global_step": 233731, "epoch": 1931} {"train_loss": -43.15866470336914, "global_step": 233732, "epoch": 1931} {"train_loss": -42.6026611328125, "global_step": 233733, "epoch": 1931} {"train_loss": -42.842002868652344, "global_step": 233734, "epoch": 1931} {"train_loss": -43.25307083129883, "global_step": 233735, "epoch": 1931} {"train_loss": -43.009521484375, "global_step": 233736, "epoch": 1931} {"train_loss": -43.21992111206055, "global_step": 233737, "epoch": 1931} {"train_loss": -43.419189453125, "global_step": 233738, "epoch": 1931} {"train_loss": -43.589141845703125, "global_step": 233739, "epoch": 1931} {"train_loss": -42.88874435424805, "global_step": 233740, "epoch": 1931} {"train_loss": -43.56830978393555, "global_step": 233741, "epoch": 1931} {"train_loss": -42.74555587768555, "global_step": 233742, "epoch": 1931} {"train_loss": -43.1054573059082, "global_step": 233743, "epoch": 1931} {"train_loss": -43.393550872802734, "global_step": 233744, "epoch": 1931} {"train_loss": -43.6113166809082, "global_step": 233745, "epoch": 1931} {"train_loss": -43.70327377319336, "global_step": 233746, "epoch": 1931} {"train_loss": -43.35175704956055, "global_step": 233747, "epoch": 1931} {"train_loss": -43.5267333984375, "global_step": 233748, "epoch": 1931} {"train_loss": -43.953853607177734, "global_step": 233749, "epoch": 1931} {"train_loss": -43.19611358642578, "global_step": 233750, "epoch": 1931} {"train_loss": -41.62750244140625, "global_step": 233751, "epoch": 1931} {"train_loss": -43.714080810546875, "global_step": 233752, "epoch": 1931} {"train_loss": -43.16083526611328, "global_step": 233753, "epoch": 1931} {"train_loss": -43.491783142089844, "global_step": 233754, "epoch": 1931} {"train_loss": -43.36274337768555, "global_step": 233755, "epoch": 1931} {"train_loss": -42.72498321533203, "global_step": 233756, "epoch": 1931} {"train_loss": -43.25946807861328, "global_step": 233757, "epoch": 1931} {"train_loss": -43.96485137939453, "global_step": 233758, "epoch": 1931} {"train_loss": -43.05499267578125, "global_step": 233759, "epoch": 1931} {"train_loss": -42.54075622558594, "global_step": 233760, "epoch": 1931} {"train_loss": -41.9738655090332, "global_step": 233761, "epoch": 1931} {"train_loss": -42.160614013671875, "global_step": 233762, "epoch": 1931} {"train_loss": -43.391090393066406, "global_step": 233763, "epoch": 1931} {"train_loss": -41.61716842651367, "global_step": 233764, "epoch": 1931} {"train_loss": -39.87557601928711, "global_step": 233765, "epoch": 1931} {"train_loss": -38.95871353149414, "global_step": 233766, "epoch": 1931} {"train_loss": -40.85770797729492, "global_step": 233767, "epoch": 1931} {"train_loss": -42.79954147338867, "global_step": 233768, "epoch": 1931} {"train_loss": -41.881561279296875, "global_step": 233769, "epoch": 1931} {"train_loss": -38.56563949584961, "global_step": 233770, "epoch": 1931} {"train_loss": -41.11416964885617, "global_step": 233771, "epoch": 1931, "val_loss": 2674815.25} {"train_loss": -41.348201751708984, "global_step": 233772, "epoch": 1932} {"train_loss": -42.27499008178711, "global_step": 233773, "epoch": 1932} {"train_loss": -41.430782318115234, "global_step": 233774, "epoch": 1932} {"train_loss": -40.64088821411133, "global_step": 233775, "epoch": 1932} {"train_loss": -42.31844711303711, "global_step": 233776, "epoch": 1932} {"train_loss": -43.08096694946289, "global_step": 233777, "epoch": 1932} {"train_loss": -41.08612823486328, "global_step": 233778, "epoch": 1932} {"train_loss": -42.0733757019043, "global_step": 233779, "epoch": 1932} {"train_loss": -42.361446380615234, "global_step": 233780, "epoch": 1932} {"train_loss": -40.8748664855957, "global_step": 233781, "epoch": 1932} {"train_loss": -41.23286056518555, "global_step": 233782, "epoch": 1932} {"train_loss": -42.306068420410156, "global_step": 233783, "epoch": 1932} {"train_loss": -42.60308837890625, "global_step": 233784, "epoch": 1932} {"train_loss": -41.78453063964844, "global_step": 233785, "epoch": 1932} {"train_loss": -42.541603088378906, "global_step": 233786, "epoch": 1932} {"train_loss": -42.60178756713867, "global_step": 233787, "epoch": 1932} {"train_loss": -42.59833908081055, "global_step": 233788, "epoch": 1932} {"train_loss": -42.86106491088867, "global_step": 233789, "epoch": 1932} {"train_loss": -42.63630294799805, "global_step": 233790, "epoch": 1932} {"train_loss": -40.93353271484375, "global_step": 233791, "epoch": 1932} {"train_loss": -41.674373626708984, "global_step": 233792, "epoch": 1932} {"train_loss": -40.962005615234375, "global_step": 233793, "epoch": 1932} {"train_loss": -42.44942092895508, "global_step": 233794, "epoch": 1932} {"train_loss": -41.39929962158203, "global_step": 233795, "epoch": 1932} {"train_loss": -41.975162506103516, "global_step": 233796, "epoch": 1932} {"train_loss": -40.938594818115234, "global_step": 233797, "epoch": 1932} {"train_loss": -41.38511276245117, "global_step": 233798, "epoch": 1932} {"train_loss": -42.07902908325195, "global_step": 233799, "epoch": 1932} {"train_loss": -42.240108489990234, "global_step": 233800, "epoch": 1932} {"train_loss": -40.685096740722656, "global_step": 233801, "epoch": 1932} {"train_loss": -42.81426239013672, "global_step": 233802, "epoch": 1932} {"train_loss": -42.113983154296875, "global_step": 233803, "epoch": 1932} {"train_loss": -41.486995697021484, "global_step": 233804, "epoch": 1932} {"train_loss": -41.1339111328125, "global_step": 233805, "epoch": 1932} {"train_loss": -41.74528121948242, "global_step": 233806, "epoch": 1932} {"train_loss": -41.290252685546875, "global_step": 233807, "epoch": 1932} {"train_loss": -42.07863998413086, "global_step": 233808, "epoch": 1932} {"train_loss": -42.34039306640625, "global_step": 233809, "epoch": 1932} {"train_loss": -40.793373107910156, "global_step": 233810, "epoch": 1932} {"train_loss": -42.67852783203125, "global_step": 233811, "epoch": 1932} {"train_loss": -40.527587890625, "global_step": 233812, "epoch": 1932} {"train_loss": -40.53193283081055, "global_step": 233813, "epoch": 1932} {"train_loss": -43.10527420043945, "global_step": 233814, "epoch": 1932} {"train_loss": -42.01161575317383, "global_step": 233815, "epoch": 1932} {"train_loss": -40.355159759521484, "global_step": 233816, "epoch": 1932} {"train_loss": -43.024417877197266, "global_step": 233817, "epoch": 1932} {"train_loss": -42.01841354370117, "global_step": 233818, "epoch": 1932} {"train_loss": -41.47958755493164, "global_step": 233819, "epoch": 1932} {"train_loss": -42.14673614501953, "global_step": 233820, "epoch": 1932} {"train_loss": -41.67555618286133, "global_step": 233821, "epoch": 1932} {"train_loss": -41.598384857177734, "global_step": 233822, "epoch": 1932} {"train_loss": -42.52431106567383, "global_step": 233823, "epoch": 1932} {"train_loss": -41.163326263427734, "global_step": 233824, "epoch": 1932} {"train_loss": -41.284645080566406, "global_step": 233825, "epoch": 1932} {"train_loss": -39.69000244140625, "global_step": 233826, "epoch": 1932} {"train_loss": -40.15188217163086, "global_step": 233827, "epoch": 1932} {"train_loss": -43.081817626953125, "global_step": 233828, "epoch": 1932} {"train_loss": -40.415584564208984, "global_step": 233829, "epoch": 1932} {"train_loss": -39.44343185424805, "global_step": 233830, "epoch": 1932} {"train_loss": -38.538734436035156, "global_step": 233831, "epoch": 1932} {"train_loss": -40.508331298828125, "global_step": 233832, "epoch": 1932} {"train_loss": -41.61234664916992, "global_step": 233833, "epoch": 1932} {"train_loss": -41.30318832397461, "global_step": 233834, "epoch": 1932} {"train_loss": -41.28859329223633, "global_step": 233835, "epoch": 1932} {"train_loss": -41.1718864440918, "global_step": 233836, "epoch": 1932} {"train_loss": -42.537654876708984, "global_step": 233837, "epoch": 1932} {"train_loss": -41.02567672729492, "global_step": 233838, "epoch": 1932} {"train_loss": -42.466407775878906, "global_step": 233839, "epoch": 1932} {"train_loss": -42.05208969116211, "global_step": 233840, "epoch": 1932} {"train_loss": -41.59904098510742, "global_step": 233841, "epoch": 1932} {"train_loss": -41.60829544067383, "global_step": 233842, "epoch": 1932} {"train_loss": -41.621578216552734, "global_step": 233843, "epoch": 1932} {"train_loss": -42.57598876953125, "global_step": 233844, "epoch": 1932} {"train_loss": -41.804420471191406, "global_step": 233845, "epoch": 1932} {"train_loss": -41.85475158691406, "global_step": 233846, "epoch": 1932} {"train_loss": -41.65167236328125, "global_step": 233847, "epoch": 1932} {"train_loss": -41.94547653198242, "global_step": 233848, "epoch": 1932} {"train_loss": -42.134613037109375, "global_step": 233849, "epoch": 1932} {"train_loss": -42.78573226928711, "global_step": 233850, "epoch": 1932} {"train_loss": -41.6911735534668, "global_step": 233851, "epoch": 1932} {"train_loss": -42.62942123413086, "global_step": 233852, "epoch": 1932} {"train_loss": -42.41923141479492, "global_step": 233853, "epoch": 1932} {"train_loss": -42.18642044067383, "global_step": 233854, "epoch": 1932} {"train_loss": -43.18204116821289, "global_step": 233855, "epoch": 1932} {"train_loss": -42.7567253112793, "global_step": 233856, "epoch": 1932} {"train_loss": -42.77668762207031, "global_step": 233857, "epoch": 1932} {"train_loss": -43.270511627197266, "global_step": 233858, "epoch": 1932} {"train_loss": -42.82278060913086, "global_step": 233859, "epoch": 1932} {"train_loss": -42.907649993896484, "global_step": 233860, "epoch": 1932} {"train_loss": -42.89439010620117, "global_step": 233861, "epoch": 1932} {"train_loss": -42.440162658691406, "global_step": 233862, "epoch": 1932} {"train_loss": -42.57843017578125, "global_step": 233863, "epoch": 1932} {"train_loss": -40.528419494628906, "global_step": 233864, "epoch": 1932} {"train_loss": -42.53457260131836, "global_step": 233865, "epoch": 1932} {"train_loss": -42.89311599731445, "global_step": 233866, "epoch": 1932} {"train_loss": -42.88552474975586, "global_step": 233867, "epoch": 1932} {"train_loss": -42.45466232299805, "global_step": 233868, "epoch": 1932} {"train_loss": -43.05875778198242, "global_step": 233869, "epoch": 1932} {"train_loss": -42.510467529296875, "global_step": 233870, "epoch": 1932} {"train_loss": -42.412879943847656, "global_step": 233871, "epoch": 1932} {"train_loss": -43.2559928894043, "global_step": 233872, "epoch": 1932} {"train_loss": -42.5098991394043, "global_step": 233873, "epoch": 1932} {"train_loss": -42.78682327270508, "global_step": 233874, "epoch": 1932} {"train_loss": -42.91729736328125, "global_step": 233875, "epoch": 1932} {"train_loss": -41.94111251831055, "global_step": 233876, "epoch": 1932} {"train_loss": -42.45759963989258, "global_step": 233877, "epoch": 1932} {"train_loss": -41.82999801635742, "global_step": 233878, "epoch": 1932} {"train_loss": -40.7487678527832, "global_step": 233879, "epoch": 1932} {"train_loss": -43.05595779418945, "global_step": 233880, "epoch": 1932} {"train_loss": -41.5856819152832, "global_step": 233881, "epoch": 1932} {"train_loss": -42.81355667114258, "global_step": 233882, "epoch": 1932} {"train_loss": -41.6194953918457, "global_step": 233883, "epoch": 1932} {"train_loss": -41.842838287353516, "global_step": 233884, "epoch": 1932} {"train_loss": -41.5301513671875, "global_step": 233885, "epoch": 1932} {"train_loss": -41.247840881347656, "global_step": 233886, "epoch": 1932} {"train_loss": -41.59503936767578, "global_step": 233887, "epoch": 1932} {"train_loss": -41.00075149536133, "global_step": 233888, "epoch": 1932} {"train_loss": -41.04884338378906, "global_step": 233889, "epoch": 1932} {"train_loss": -42.10317611694336, "global_step": 233890, "epoch": 1932} {"train_loss": -41.807308197021484, "global_step": 233891, "epoch": 1932} {"train_loss": -41.882346003508765, "global_step": 233892, "epoch": 1932, "val_loss": 2557050.0} {"train_loss": -42.54568099975586, "global_step": 233893, "epoch": 1933} {"train_loss": -42.0002326965332, "global_step": 233894, "epoch": 1933} {"train_loss": -42.589508056640625, "global_step": 233895, "epoch": 1933} {"train_loss": -42.1035270690918, "global_step": 233896, "epoch": 1933} {"train_loss": -41.80985641479492, "global_step": 233897, "epoch": 1933} {"train_loss": -42.497493743896484, "global_step": 233898, "epoch": 1933} {"train_loss": -42.147403717041016, "global_step": 233899, "epoch": 1933} {"train_loss": -40.82773971557617, "global_step": 233900, "epoch": 1933} {"train_loss": -41.593910217285156, "global_step": 233901, "epoch": 1933} {"train_loss": -42.44019317626953, "global_step": 233902, "epoch": 1933} {"train_loss": -41.68082809448242, "global_step": 233903, "epoch": 1933} {"train_loss": -41.67877960205078, "global_step": 233904, "epoch": 1933} {"train_loss": -42.79731369018555, "global_step": 233905, "epoch": 1933} {"train_loss": -42.25843048095703, "global_step": 233906, "epoch": 1933} {"train_loss": -42.080257415771484, "global_step": 233907, "epoch": 1933} {"train_loss": -41.38413619995117, "global_step": 233908, "epoch": 1933} {"train_loss": -39.82913589477539, "global_step": 233909, "epoch": 1933} {"train_loss": -42.869667053222656, "global_step": 233910, "epoch": 1933} {"train_loss": -43.16859817504883, "global_step": 233911, "epoch": 1933} {"train_loss": -41.273475646972656, "global_step": 233912, "epoch": 1933} {"train_loss": -40.6234130859375, "global_step": 233913, "epoch": 1933} {"train_loss": -42.9499626159668, "global_step": 233914, "epoch": 1933} {"train_loss": -42.206146240234375, "global_step": 233915, "epoch": 1933} {"train_loss": -39.6448860168457, "global_step": 233916, "epoch": 1933} {"train_loss": -41.5117301940918, "global_step": 233917, "epoch": 1933} {"train_loss": -42.569236755371094, "global_step": 233918, "epoch": 1933} {"train_loss": -41.866092681884766, "global_step": 233919, "epoch": 1933} {"train_loss": -40.93851852416992, "global_step": 233920, "epoch": 1933} {"train_loss": -41.55767822265625, "global_step": 233921, "epoch": 1933} {"train_loss": -42.333580017089844, "global_step": 233922, "epoch": 1933} {"train_loss": -40.8679313659668, "global_step": 233923, "epoch": 1933} {"train_loss": -39.6602668762207, "global_step": 233924, "epoch": 1933} {"train_loss": -41.519832611083984, "global_step": 233925, "epoch": 1933} {"train_loss": -42.241546630859375, "global_step": 233926, "epoch": 1933} {"train_loss": -40.72488021850586, "global_step": 233927, "epoch": 1933} {"train_loss": -42.34473419189453, "global_step": 233928, "epoch": 1933} {"train_loss": -42.39780044555664, "global_step": 233929, "epoch": 1933} {"train_loss": -42.79413986206055, "global_step": 233930, "epoch": 1933} {"train_loss": -42.348690032958984, "global_step": 233931, "epoch": 1933} {"train_loss": -43.136714935302734, "global_step": 233932, "epoch": 1933} {"train_loss": -41.676597595214844, "global_step": 233933, "epoch": 1933} {"train_loss": -41.242340087890625, "global_step": 233934, "epoch": 1933} {"train_loss": -42.8909797668457, "global_step": 233935, "epoch": 1933} {"train_loss": -42.224178314208984, "global_step": 233936, "epoch": 1933} {"train_loss": -41.389583587646484, "global_step": 233937, "epoch": 1933} {"train_loss": -42.45576095581055, "global_step": 233938, "epoch": 1933} {"train_loss": -42.28012466430664, "global_step": 233939, "epoch": 1933} {"train_loss": -41.464874267578125, "global_step": 233940, "epoch": 1933} {"train_loss": -42.29719543457031, "global_step": 233941, "epoch": 1933} {"train_loss": -42.475582122802734, "global_step": 233942, "epoch": 1933} {"train_loss": -41.468849182128906, "global_step": 233943, "epoch": 1933} {"train_loss": -42.39646530151367, "global_step": 233944, "epoch": 1933} {"train_loss": -41.60751724243164, "global_step": 233945, "epoch": 1933} {"train_loss": -43.17731857299805, "global_step": 233946, "epoch": 1933} {"train_loss": -43.13225173950195, "global_step": 233947, "epoch": 1933} {"train_loss": -42.598392486572266, "global_step": 233948, "epoch": 1933} {"train_loss": -42.983760833740234, "global_step": 233949, "epoch": 1933} {"train_loss": -41.54323959350586, "global_step": 233950, "epoch": 1933} {"train_loss": -42.00596237182617, "global_step": 233951, "epoch": 1933} {"train_loss": -43.38352584838867, "global_step": 233952, "epoch": 1933} {"train_loss": -42.228309631347656, "global_step": 233953, "epoch": 1933} {"train_loss": -42.04735565185547, "global_step": 233954, "epoch": 1933} {"train_loss": -42.40482711791992, "global_step": 233955, "epoch": 1933} {"train_loss": -42.981605529785156, "global_step": 233956, "epoch": 1933} {"train_loss": -42.41744613647461, "global_step": 233957, "epoch": 1933} {"train_loss": -41.75413131713867, "global_step": 233958, "epoch": 1933} {"train_loss": -42.97949981689453, "global_step": 233959, "epoch": 1933} {"train_loss": -40.41764831542969, "global_step": 233960, "epoch": 1933} {"train_loss": -39.00128936767578, "global_step": 233961, "epoch": 1933} {"train_loss": -40.3181037902832, "global_step": 233962, "epoch": 1933} {"train_loss": -42.68425369262695, "global_step": 233963, "epoch": 1933} {"train_loss": -42.30143737792969, "global_step": 233964, "epoch": 1933} {"train_loss": -38.561195373535156, "global_step": 233965, "epoch": 1933} {"train_loss": -42.769989013671875, "global_step": 233966, "epoch": 1933} {"train_loss": -42.3726921081543, "global_step": 233967, "epoch": 1933} {"train_loss": -41.741188049316406, "global_step": 233968, "epoch": 1933} {"train_loss": -39.8770751953125, "global_step": 233969, "epoch": 1933} {"train_loss": -42.34159469604492, "global_step": 233970, "epoch": 1933} {"train_loss": -42.074867248535156, "global_step": 233971, "epoch": 1933} {"train_loss": -40.676212310791016, "global_step": 233972, "epoch": 1933} {"train_loss": -42.083824157714844, "global_step": 233973, "epoch": 1933} {"train_loss": -31.8485107421875, "global_step": 233974, "epoch": 1933} {"train_loss": -40.25564193725586, "global_step": 233975, "epoch": 1933} {"train_loss": -41.107234954833984, "global_step": 233976, "epoch": 1933} {"train_loss": -39.413124084472656, "global_step": 233977, "epoch": 1933} {"train_loss": -40.32737350463867, "global_step": 233978, "epoch": 1933} {"train_loss": -41.459083557128906, "global_step": 233979, "epoch": 1933} {"train_loss": -42.31829071044922, "global_step": 233980, "epoch": 1933} {"train_loss": -41.79411697387695, "global_step": 233981, "epoch": 1933} {"train_loss": -42.45662307739258, "global_step": 233982, "epoch": 1933} {"train_loss": -37.713844299316406, "global_step": 233983, "epoch": 1933} {"train_loss": -40.97368240356445, "global_step": 233984, "epoch": 1933} {"train_loss": -42.44446563720703, "global_step": 233985, "epoch": 1933} {"train_loss": -40.464927673339844, "global_step": 233986, "epoch": 1933} {"train_loss": -38.09672164916992, "global_step": 233987, "epoch": 1933} {"train_loss": -39.28144454956055, "global_step": 233988, "epoch": 1933} {"train_loss": -42.16594696044922, "global_step": 233989, "epoch": 1933} {"train_loss": -41.3392219543457, "global_step": 233990, "epoch": 1933} {"train_loss": -41.55268859863281, "global_step": 233991, "epoch": 1933} {"train_loss": -40.252986907958984, "global_step": 233992, "epoch": 1933} {"train_loss": -35.23423385620117, "global_step": 233993, "epoch": 1933} {"train_loss": -32.12312316894531, "global_step": 233994, "epoch": 1933} {"train_loss": -40.198936462402344, "global_step": 233995, "epoch": 1933} {"train_loss": -39.324951171875, "global_step": 233996, "epoch": 1933} {"train_loss": -36.26192855834961, "global_step": 233997, "epoch": 1933} {"train_loss": -37.59522247314453, "global_step": 233998, "epoch": 1933} {"train_loss": -41.3852424621582, "global_step": 233999, "epoch": 1933} {"train_loss": -39.63837814331055, "global_step": 234000, "epoch": 1933} {"train_loss": -41.43075180053711, "global_step": 234001, "epoch": 1933} {"train_loss": -34.89193344116211, "global_step": 234002, "epoch": 1933} {"train_loss": -39.18500900268555, "global_step": 234003, "epoch": 1933} {"train_loss": -40.857872009277344, "global_step": 234004, "epoch": 1933} {"train_loss": -39.624366760253906, "global_step": 234005, "epoch": 1933} {"train_loss": -40.68357467651367, "global_step": 234006, "epoch": 1933} {"train_loss": -37.91935729980469, "global_step": 234007, "epoch": 1933} {"train_loss": -40.70249938964844, "global_step": 234008, "epoch": 1933} {"train_loss": -41.697994232177734, "global_step": 234009, "epoch": 1933} {"train_loss": -40.94950485229492, "global_step": 234010, "epoch": 1933} {"train_loss": -41.67158126831055, "global_step": 234011, "epoch": 1933} {"train_loss": -38.89127731323242, "global_step": 234012, "epoch": 1933} {"train_loss": -41.14883280982656, "global_step": 234013, "epoch": 1933, "val_loss": 2606331.5} {"train_loss": -39.174842834472656, "global_step": 234014, "epoch": 1934} {"train_loss": -40.82981491088867, "global_step": 234015, "epoch": 1934} {"train_loss": -40.22965621948242, "global_step": 234016, "epoch": 1934} {"train_loss": -40.065616607666016, "global_step": 234017, "epoch": 1934} {"train_loss": -39.44680404663086, "global_step": 234018, "epoch": 1934} {"train_loss": -40.310359954833984, "global_step": 234019, "epoch": 1934} {"train_loss": -41.22665023803711, "global_step": 234020, "epoch": 1934} {"train_loss": -40.81686782836914, "global_step": 234021, "epoch": 1934} {"train_loss": -40.771629333496094, "global_step": 234022, "epoch": 1934} {"train_loss": -41.84891128540039, "global_step": 234023, "epoch": 1934} {"train_loss": -40.79215621948242, "global_step": 234024, "epoch": 1934} {"train_loss": -40.35702133178711, "global_step": 234025, "epoch": 1934} {"train_loss": -41.217708587646484, "global_step": 234026, "epoch": 1934} {"train_loss": -41.30393981933594, "global_step": 234027, "epoch": 1934} {"train_loss": -39.70178985595703, "global_step": 234028, "epoch": 1934} {"train_loss": -42.28186798095703, "global_step": 234029, "epoch": 1934} {"train_loss": -40.775142669677734, "global_step": 234030, "epoch": 1934} {"train_loss": -41.031280517578125, "global_step": 234031, "epoch": 1934} {"train_loss": -41.567848205566406, "global_step": 234032, "epoch": 1934} {"train_loss": -40.88651657104492, "global_step": 234033, "epoch": 1934} {"train_loss": -41.80750274658203, "global_step": 234034, "epoch": 1934} {"train_loss": -42.032257080078125, "global_step": 234035, "epoch": 1934} {"train_loss": -41.9625358581543, "global_step": 234036, "epoch": 1934} {"train_loss": -41.907623291015625, "global_step": 234037, "epoch": 1934} {"train_loss": -42.078453063964844, "global_step": 234038, "epoch": 1934} {"train_loss": -41.68928146362305, "global_step": 234039, "epoch": 1934} {"train_loss": -42.1504020690918, "global_step": 234040, "epoch": 1934} {"train_loss": -41.54665756225586, "global_step": 234041, "epoch": 1934} {"train_loss": -42.19951248168945, "global_step": 234042, "epoch": 1934} {"train_loss": -42.079833984375, "global_step": 234043, "epoch": 1934} {"train_loss": -42.47969055175781, "global_step": 234044, "epoch": 1934} {"train_loss": -41.44965362548828, "global_step": 234045, "epoch": 1934} {"train_loss": -42.21525192260742, "global_step": 234046, "epoch": 1934} {"train_loss": -41.77704620361328, "global_step": 234047, "epoch": 1934} {"train_loss": -42.35680389404297, "global_step": 234048, "epoch": 1934} {"train_loss": -42.78767013549805, "global_step": 234049, "epoch": 1934} {"train_loss": -42.33927536010742, "global_step": 234050, "epoch": 1934} {"train_loss": -40.234432220458984, "global_step": 234051, "epoch": 1934} {"train_loss": -41.290435791015625, "global_step": 234052, "epoch": 1934} {"train_loss": -42.1260871887207, "global_step": 234053, "epoch": 1934} {"train_loss": -42.91979217529297, "global_step": 234054, "epoch": 1934} {"train_loss": -42.37710189819336, "global_step": 234055, "epoch": 1934} {"train_loss": -41.88431930541992, "global_step": 234056, "epoch": 1934} {"train_loss": -42.290687561035156, "global_step": 234057, "epoch": 1934} {"train_loss": -42.909446716308594, "global_step": 234058, "epoch": 1934} {"train_loss": -42.782989501953125, "global_step": 234059, "epoch": 1934} {"train_loss": -42.53915786743164, "global_step": 234060, "epoch": 1934} {"train_loss": -42.51594161987305, "global_step": 234061, "epoch": 1934} {"train_loss": -42.163143157958984, "global_step": 234062, "epoch": 1934} {"train_loss": -42.38836669921875, "global_step": 234063, "epoch": 1934} {"train_loss": -42.61623001098633, "global_step": 234064, "epoch": 1934} {"train_loss": -42.764617919921875, "global_step": 234065, "epoch": 1934} {"train_loss": -42.20992660522461, "global_step": 234066, "epoch": 1934} {"train_loss": -42.47772979736328, "global_step": 234067, "epoch": 1934} {"train_loss": -42.3796501159668, "global_step": 234068, "epoch": 1934} {"train_loss": -42.740699768066406, "global_step": 234069, "epoch": 1934} {"train_loss": -42.41707992553711, "global_step": 234070, "epoch": 1934} {"train_loss": -42.498958587646484, "global_step": 234071, "epoch": 1934} {"train_loss": -42.9455680847168, "global_step": 234072, "epoch": 1934} {"train_loss": -41.448944091796875, "global_step": 234073, "epoch": 1934} {"train_loss": -40.24067306518555, "global_step": 234074, "epoch": 1934} {"train_loss": -42.33376693725586, "global_step": 234075, "epoch": 1934} {"train_loss": -42.93866729736328, "global_step": 234076, "epoch": 1934} {"train_loss": -42.023441314697266, "global_step": 234077, "epoch": 1934} {"train_loss": -40.647823333740234, "global_step": 234078, "epoch": 1934} {"train_loss": -42.242958068847656, "global_step": 234079, "epoch": 1934} {"train_loss": -42.74702072143555, "global_step": 234080, "epoch": 1934} {"train_loss": -42.282344818115234, "global_step": 234081, "epoch": 1934} {"train_loss": -41.04745864868164, "global_step": 234082, "epoch": 1934} {"train_loss": -41.86698532104492, "global_step": 234083, "epoch": 1934} {"train_loss": -42.17849349975586, "global_step": 234084, "epoch": 1934} {"train_loss": -42.93388366699219, "global_step": 234085, "epoch": 1934} {"train_loss": -42.2597770690918, "global_step": 234086, "epoch": 1934} {"train_loss": -42.877174377441406, "global_step": 234087, "epoch": 1934} {"train_loss": -43.11209487915039, "global_step": 234088, "epoch": 1934} {"train_loss": -42.5387077331543, "global_step": 234089, "epoch": 1934} {"train_loss": -42.859710693359375, "global_step": 234090, "epoch": 1934} {"train_loss": -43.379520416259766, "global_step": 234091, "epoch": 1934} {"train_loss": -42.64109802246094, "global_step": 234092, "epoch": 1934} {"train_loss": -42.57520294189453, "global_step": 234093, "epoch": 1934} {"train_loss": -42.78983688354492, "global_step": 234094, "epoch": 1934} {"train_loss": -42.83990478515625, "global_step": 234095, "epoch": 1934} {"train_loss": -42.6977424621582, "global_step": 234096, "epoch": 1934} {"train_loss": -43.134864807128906, "global_step": 234097, "epoch": 1934} {"train_loss": -42.94081115722656, "global_step": 234098, "epoch": 1934} {"train_loss": -43.17257308959961, "global_step": 234099, "epoch": 1934} {"train_loss": -43.16036605834961, "global_step": 234100, "epoch": 1934} {"train_loss": -42.47127914428711, "global_step": 234101, "epoch": 1934} {"train_loss": -42.61472702026367, "global_step": 234102, "epoch": 1934} {"train_loss": -43.05550003051758, "global_step": 234103, "epoch": 1934} {"train_loss": -42.28280258178711, "global_step": 234104, "epoch": 1934} {"train_loss": -42.89779281616211, "global_step": 234105, "epoch": 1934} {"train_loss": -42.1723747253418, "global_step": 234106, "epoch": 1934} {"train_loss": -41.905799865722656, "global_step": 234107, "epoch": 1934} {"train_loss": -41.37173080444336, "global_step": 234108, "epoch": 1934} {"train_loss": -41.091461181640625, "global_step": 234109, "epoch": 1934} {"train_loss": -41.048492431640625, "global_step": 234110, "epoch": 1934} {"train_loss": -42.35783004760742, "global_step": 234111, "epoch": 1934} {"train_loss": -42.51750946044922, "global_step": 234112, "epoch": 1934} {"train_loss": -42.40107727050781, "global_step": 234113, "epoch": 1934} {"train_loss": -41.615718841552734, "global_step": 234114, "epoch": 1934} {"train_loss": -42.43192672729492, "global_step": 234115, "epoch": 1934} {"train_loss": -42.606544494628906, "global_step": 234116, "epoch": 1934} {"train_loss": -42.270294189453125, "global_step": 234117, "epoch": 1934} {"train_loss": -40.8099250793457, "global_step": 234118, "epoch": 1934} {"train_loss": -41.09926986694336, "global_step": 234119, "epoch": 1934} {"train_loss": -43.01935577392578, "global_step": 234120, "epoch": 1934} {"train_loss": -40.91255569458008, "global_step": 234121, "epoch": 1934} {"train_loss": -41.06538391113281, "global_step": 234122, "epoch": 1934} {"train_loss": -41.551910400390625, "global_step": 234123, "epoch": 1934} {"train_loss": -42.986629486083984, "global_step": 234124, "epoch": 1934} {"train_loss": -41.44661331176758, "global_step": 234125, "epoch": 1934} {"train_loss": -41.78451156616211, "global_step": 234126, "epoch": 1934} {"train_loss": -42.308692932128906, "global_step": 234127, "epoch": 1934} {"train_loss": -41.021766662597656, "global_step": 234128, "epoch": 1934} {"train_loss": -42.44245147705078, "global_step": 234129, "epoch": 1934} {"train_loss": -42.496192932128906, "global_step": 234130, "epoch": 1934} {"train_loss": -42.44704818725586, "global_step": 234131, "epoch": 1934} {"train_loss": -42.008575439453125, "global_step": 234132, "epoch": 1934} {"train_loss": -39.5643424987793, "global_step": 234133, "epoch": 1934} {"train_loss": -41.942241542595475, "global_step": 234134, "epoch": 1934, "val_loss": 2614700.75} {"train_loss": -41.731685638427734, "global_step": 234135, "epoch": 1935} {"train_loss": -41.35965347290039, "global_step": 234136, "epoch": 1935} {"train_loss": -42.663856506347656, "global_step": 234137, "epoch": 1935} {"train_loss": -42.09089279174805, "global_step": 234138, "epoch": 1935} {"train_loss": -42.43992233276367, "global_step": 234139, "epoch": 1935} {"train_loss": -41.96586227416992, "global_step": 234140, "epoch": 1935} {"train_loss": -41.71682357788086, "global_step": 234141, "epoch": 1935} {"train_loss": -42.42499923706055, "global_step": 234142, "epoch": 1935} {"train_loss": -41.47072982788086, "global_step": 234143, "epoch": 1935} {"train_loss": -42.018089294433594, "global_step": 234144, "epoch": 1935} {"train_loss": -42.925994873046875, "global_step": 234145, "epoch": 1935} {"train_loss": -42.59477615356445, "global_step": 234146, "epoch": 1935} {"train_loss": -42.6242561340332, "global_step": 234147, "epoch": 1935} {"train_loss": -40.85315704345703, "global_step": 234148, "epoch": 1935} {"train_loss": -41.55874252319336, "global_step": 234149, "epoch": 1935} {"train_loss": -42.013301849365234, "global_step": 234150, "epoch": 1935} {"train_loss": -42.09100341796875, "global_step": 234151, "epoch": 1935} {"train_loss": -41.85371017456055, "global_step": 234152, "epoch": 1935} {"train_loss": -42.35175323486328, "global_step": 234153, "epoch": 1935} {"train_loss": -42.73820114135742, "global_step": 234154, "epoch": 1935} {"train_loss": -40.4863395690918, "global_step": 234155, "epoch": 1935} {"train_loss": -40.3700065612793, "global_step": 234156, "epoch": 1935} {"train_loss": -40.784088134765625, "global_step": 234157, "epoch": 1935} {"train_loss": -37.68081283569336, "global_step": 234158, "epoch": 1935} {"train_loss": -40.73099899291992, "global_step": 234159, "epoch": 1935} {"train_loss": -41.984920501708984, "global_step": 234160, "epoch": 1935} {"train_loss": -41.5646858215332, "global_step": 234161, "epoch": 1935} {"train_loss": -40.61867904663086, "global_step": 234162, "epoch": 1935} {"train_loss": -40.027652740478516, "global_step": 234163, "epoch": 1935} {"train_loss": -40.65180206298828, "global_step": 234164, "epoch": 1935} {"train_loss": -42.22191619873047, "global_step": 234165, "epoch": 1935} {"train_loss": -40.714839935302734, "global_step": 234166, "epoch": 1935} {"train_loss": -35.897804260253906, "global_step": 234167, "epoch": 1935} {"train_loss": -41.92329025268555, "global_step": 234168, "epoch": 1935} {"train_loss": -41.26822280883789, "global_step": 234169, "epoch": 1935} {"train_loss": -39.559757232666016, "global_step": 234170, "epoch": 1935} {"train_loss": -41.212646484375, "global_step": 234171, "epoch": 1935} {"train_loss": -40.45089340209961, "global_step": 234172, "epoch": 1935} {"train_loss": -39.51536560058594, "global_step": 234173, "epoch": 1935} {"train_loss": -39.29248046875, "global_step": 234174, "epoch": 1935} {"train_loss": -37.815670013427734, "global_step": 234175, "epoch": 1935} {"train_loss": -39.14579391479492, "global_step": 234176, "epoch": 1935} {"train_loss": -39.39166259765625, "global_step": 234177, "epoch": 1935} {"train_loss": -41.26163864135742, "global_step": 234178, "epoch": 1935} {"train_loss": -38.26910400390625, "global_step": 234179, "epoch": 1935} {"train_loss": -39.832088470458984, "global_step": 234180, "epoch": 1935} {"train_loss": -39.03679275512695, "global_step": 234181, "epoch": 1935} {"train_loss": -38.43547439575195, "global_step": 234182, "epoch": 1935} {"train_loss": -40.237037658691406, "global_step": 234183, "epoch": 1935} {"train_loss": -40.64308166503906, "global_step": 234184, "epoch": 1935} {"train_loss": -41.181854248046875, "global_step": 234185, "epoch": 1935} {"train_loss": -7.388993740081787, "global_step": 234186, "epoch": 1935} {"train_loss": -39.53836441040039, "global_step": 234187, "epoch": 1935} {"train_loss": -37.507362365722656, "global_step": 234188, "epoch": 1935} {"train_loss": -33.12275314331055, "global_step": 234189, "epoch": 1935} {"train_loss": -22.672286987304688, "global_step": 234190, "epoch": 1935} {"train_loss": -33.13460159301758, "global_step": 234191, "epoch": 1935} {"train_loss": -27.80600357055664, "global_step": 234192, "epoch": 1935} {"train_loss": -38.707244873046875, "global_step": 234193, "epoch": 1935} {"train_loss": -37.884552001953125, "global_step": 234194, "epoch": 1935} {"train_loss": -35.55295181274414, "global_step": 234195, "epoch": 1935} {"train_loss": -36.2271842956543, "global_step": 234196, "epoch": 1935} {"train_loss": -39.00433349609375, "global_step": 234197, "epoch": 1935} {"train_loss": -36.23162078857422, "global_step": 234198, "epoch": 1935} {"train_loss": -39.31136703491211, "global_step": 234199, "epoch": 1935} {"train_loss": -36.913818359375, "global_step": 234200, "epoch": 1935} {"train_loss": -35.01460266113281, "global_step": 234201, "epoch": 1935} {"train_loss": -39.632598876953125, "global_step": 234202, "epoch": 1935} {"train_loss": -38.75072479248047, "global_step": 234203, "epoch": 1935} {"train_loss": -38.25129699707031, "global_step": 234204, "epoch": 1935} {"train_loss": -38.19100570678711, "global_step": 234205, "epoch": 1935} {"train_loss": -37.616302490234375, "global_step": 234206, "epoch": 1935} {"train_loss": -38.564754486083984, "global_step": 234207, "epoch": 1935} {"train_loss": -39.230682373046875, "global_step": 234208, "epoch": 1935} {"train_loss": -40.4989128112793, "global_step": 234209, "epoch": 1935} {"train_loss": -39.7042350769043, "global_step": 234210, "epoch": 1935} {"train_loss": -38.234554290771484, "global_step": 234211, "epoch": 1935} {"train_loss": -39.11989974975586, "global_step": 234212, "epoch": 1935} {"train_loss": -40.44255447387695, "global_step": 234213, "epoch": 1935} {"train_loss": -40.12860107421875, "global_step": 234214, "epoch": 1935} {"train_loss": -38.9419059753418, "global_step": 234215, "epoch": 1935} {"train_loss": -40.832054138183594, "global_step": 234216, "epoch": 1935} {"train_loss": -40.910499572753906, "global_step": 234217, "epoch": 1935} {"train_loss": -40.251014709472656, "global_step": 234218, "epoch": 1935} {"train_loss": -40.922428131103516, "global_step": 234219, "epoch": 1935} {"train_loss": -39.21507263183594, "global_step": 234220, "epoch": 1935} {"train_loss": -40.902732849121094, "global_step": 234221, "epoch": 1935} {"train_loss": -40.886104583740234, "global_step": 234222, "epoch": 1935} {"train_loss": -40.1894416809082, "global_step": 234223, "epoch": 1935} {"train_loss": -40.708675384521484, "global_step": 234224, "epoch": 1935} {"train_loss": -40.32362747192383, "global_step": 234225, "epoch": 1935} {"train_loss": -39.35637664794922, "global_step": 234226, "epoch": 1935} {"train_loss": -40.81669998168945, "global_step": 234227, "epoch": 1935} {"train_loss": -41.592525482177734, "global_step": 234228, "epoch": 1935} {"train_loss": -41.22269058227539, "global_step": 234229, "epoch": 1935} {"train_loss": -40.97343063354492, "global_step": 234230, "epoch": 1935} {"train_loss": -41.37466812133789, "global_step": 234231, "epoch": 1935} {"train_loss": -41.713409423828125, "global_step": 234232, "epoch": 1935} {"train_loss": -40.97616195678711, "global_step": 234233, "epoch": 1935} {"train_loss": -41.155452728271484, "global_step": 234234, "epoch": 1935} {"train_loss": -41.555233001708984, "global_step": 234235, "epoch": 1935} {"train_loss": -41.39564895629883, "global_step": 234236, "epoch": 1935} {"train_loss": -41.24048614501953, "global_step": 234237, "epoch": 1935} {"train_loss": -41.53351593017578, "global_step": 234238, "epoch": 1935} {"train_loss": -41.609886169433594, "global_step": 234239, "epoch": 1935} {"train_loss": -41.41141891479492, "global_step": 234240, "epoch": 1935} {"train_loss": -41.654232025146484, "global_step": 234241, "epoch": 1935} {"train_loss": -41.15562057495117, "global_step": 234242, "epoch": 1935} {"train_loss": -41.27735137939453, "global_step": 234243, "epoch": 1935} {"train_loss": -42.00861740112305, "global_step": 234244, "epoch": 1935} {"train_loss": -41.43380355834961, "global_step": 234245, "epoch": 1935} {"train_loss": -41.753726959228516, "global_step": 234246, "epoch": 1935} {"train_loss": -41.2840576171875, "global_step": 234247, "epoch": 1935} {"train_loss": -41.47747802734375, "global_step": 234248, "epoch": 1935} {"train_loss": -42.0330696105957, "global_step": 234249, "epoch": 1935} {"train_loss": -41.5863037109375, "global_step": 234250, "epoch": 1935} {"train_loss": -42.320770263671875, "global_step": 234251, "epoch": 1935} {"train_loss": -41.384273529052734, "global_step": 234252, "epoch": 1935} {"train_loss": -41.987239837646484, "global_step": 234253, "epoch": 1935} {"train_loss": -42.05938720703125, "global_step": 234254, "epoch": 1935} {"train_loss": -39.79876899325158, "global_step": 234255, "epoch": 1935, "val_loss": 2670319.25} {"train_loss": -42.45966339111328, "global_step": 234256, "epoch": 1936} {"train_loss": -41.33439254760742, "global_step": 234257, "epoch": 1936} {"train_loss": -42.458858489990234, "global_step": 234258, "epoch": 1936} {"train_loss": -42.135589599609375, "global_step": 234259, "epoch": 1936} {"train_loss": -42.3701057434082, "global_step": 234260, "epoch": 1936} {"train_loss": -43.0177001953125, "global_step": 234261, "epoch": 1936} {"train_loss": -42.107948303222656, "global_step": 234262, "epoch": 1936} {"train_loss": -42.17995834350586, "global_step": 234263, "epoch": 1936} {"train_loss": -42.81011962890625, "global_step": 234264, "epoch": 1936} {"train_loss": -41.984806060791016, "global_step": 234265, "epoch": 1936} {"train_loss": -42.68888473510742, "global_step": 234266, "epoch": 1936} {"train_loss": -42.45985794067383, "global_step": 234267, "epoch": 1936} {"train_loss": -42.759239196777344, "global_step": 234268, "epoch": 1936} {"train_loss": -42.027130126953125, "global_step": 234269, "epoch": 1936} {"train_loss": -41.5922737121582, "global_step": 234270, "epoch": 1936} {"train_loss": -42.297664642333984, "global_step": 234271, "epoch": 1936} {"train_loss": -41.59647750854492, "global_step": 234272, "epoch": 1936} {"train_loss": -42.84931182861328, "global_step": 234273, "epoch": 1936} {"train_loss": -41.821529388427734, "global_step": 234274, "epoch": 1936} {"train_loss": -41.938148498535156, "global_step": 234275, "epoch": 1936} {"train_loss": -42.377925872802734, "global_step": 234276, "epoch": 1936} {"train_loss": -41.45848083496094, "global_step": 234277, "epoch": 1936} {"train_loss": -41.96771240234375, "global_step": 234278, "epoch": 1936} {"train_loss": -42.46720504760742, "global_step": 234279, "epoch": 1936} {"train_loss": -41.992977142333984, "global_step": 234280, "epoch": 1936} {"train_loss": -40.90090560913086, "global_step": 234281, "epoch": 1936} {"train_loss": -41.62824249267578, "global_step": 234282, "epoch": 1936} {"train_loss": -41.97772216796875, "global_step": 234283, "epoch": 1936} {"train_loss": -41.33230972290039, "global_step": 234284, "epoch": 1936} {"train_loss": -41.94566345214844, "global_step": 234285, "epoch": 1936} {"train_loss": -41.668087005615234, "global_step": 234286, "epoch": 1936} {"train_loss": -40.93280029296875, "global_step": 234287, "epoch": 1936} {"train_loss": -42.551307678222656, "global_step": 234288, "epoch": 1936} {"train_loss": -42.36344528198242, "global_step": 234289, "epoch": 1936} {"train_loss": -42.115699768066406, "global_step": 234290, "epoch": 1936} {"train_loss": -42.54330825805664, "global_step": 234291, "epoch": 1936} {"train_loss": -42.441341400146484, "global_step": 234292, "epoch": 1936} {"train_loss": -41.59406280517578, "global_step": 234293, "epoch": 1936} {"train_loss": -41.40528106689453, "global_step": 234294, "epoch": 1936} {"train_loss": -43.00239944458008, "global_step": 234295, "epoch": 1936} {"train_loss": -42.21950149536133, "global_step": 234296, "epoch": 1936} {"train_loss": -41.32383346557617, "global_step": 234297, "epoch": 1936} {"train_loss": -42.56371307373047, "global_step": 234298, "epoch": 1936} {"train_loss": -41.96173095703125, "global_step": 234299, "epoch": 1936} {"train_loss": -42.30522537231445, "global_step": 234300, "epoch": 1936} {"train_loss": -41.48076248168945, "global_step": 234301, "epoch": 1936} {"train_loss": -41.797760009765625, "global_step": 234302, "epoch": 1936} {"train_loss": -41.84360885620117, "global_step": 234303, "epoch": 1936} {"train_loss": -40.43278884887695, "global_step": 234304, "epoch": 1936} {"train_loss": -39.93088150024414, "global_step": 234305, "epoch": 1936} {"train_loss": -38.83028793334961, "global_step": 234306, "epoch": 1936} {"train_loss": -42.83543014526367, "global_step": 234307, "epoch": 1936} {"train_loss": -41.218929290771484, "global_step": 234308, "epoch": 1936} {"train_loss": -40.07844161987305, "global_step": 234309, "epoch": 1936} {"train_loss": -39.72126388549805, "global_step": 234310, "epoch": 1936} {"train_loss": -41.20319747924805, "global_step": 234311, "epoch": 1936} {"train_loss": -41.29132080078125, "global_step": 234312, "epoch": 1936} {"train_loss": -41.16891098022461, "global_step": 234313, "epoch": 1936} {"train_loss": -41.39493942260742, "global_step": 234314, "epoch": 1936} {"train_loss": -39.3040885925293, "global_step": 234315, "epoch": 1936} {"train_loss": -41.58073806762695, "global_step": 234316, "epoch": 1936} {"train_loss": -40.2939567565918, "global_step": 234317, "epoch": 1936} {"train_loss": -40.59419631958008, "global_step": 234318, "epoch": 1936} {"train_loss": -41.43000030517578, "global_step": 234319, "epoch": 1936} {"train_loss": -41.28011703491211, "global_step": 234320, "epoch": 1936} {"train_loss": -41.66591262817383, "global_step": 234321, "epoch": 1936} {"train_loss": -41.95589065551758, "global_step": 234322, "epoch": 1936} {"train_loss": -40.27035903930664, "global_step": 234323, "epoch": 1936} {"train_loss": -41.37192153930664, "global_step": 234324, "epoch": 1936} {"train_loss": -41.42656326293945, "global_step": 234325, "epoch": 1936} {"train_loss": -41.54620361328125, "global_step": 234326, "epoch": 1936} {"train_loss": -41.11518096923828, "global_step": 234327, "epoch": 1936} {"train_loss": -42.069862365722656, "global_step": 234328, "epoch": 1936} {"train_loss": -41.377197265625, "global_step": 234329, "epoch": 1936} {"train_loss": -42.19562530517578, "global_step": 234330, "epoch": 1936} {"train_loss": -41.430335998535156, "global_step": 234331, "epoch": 1936} {"train_loss": -40.90644073486328, "global_step": 234332, "epoch": 1936} {"train_loss": -42.21103286743164, "global_step": 234333, "epoch": 1936} {"train_loss": -41.28571701049805, "global_step": 234334, "epoch": 1936} {"train_loss": -41.233551025390625, "global_step": 234335, "epoch": 1936} {"train_loss": -41.25761032104492, "global_step": 234336, "epoch": 1936} {"train_loss": -40.93947982788086, "global_step": 234337, "epoch": 1936} {"train_loss": -41.888031005859375, "global_step": 234338, "epoch": 1936} {"train_loss": -42.11079406738281, "global_step": 234339, "epoch": 1936} {"train_loss": -41.41804504394531, "global_step": 234340, "epoch": 1936} {"train_loss": -42.18311309814453, "global_step": 234341, "epoch": 1936} {"train_loss": -41.324928283691406, "global_step": 234342, "epoch": 1936} {"train_loss": -41.75331497192383, "global_step": 234343, "epoch": 1936} {"train_loss": -41.59593200683594, "global_step": 234344, "epoch": 1936} {"train_loss": -40.96566390991211, "global_step": 234345, "epoch": 1936} {"train_loss": -42.13563919067383, "global_step": 234346, "epoch": 1936} {"train_loss": -40.090572357177734, "global_step": 234347, "epoch": 1936} {"train_loss": -40.975894927978516, "global_step": 234348, "epoch": 1936} {"train_loss": -40.282691955566406, "global_step": 234349, "epoch": 1936} {"train_loss": -42.046104431152344, "global_step": 234350, "epoch": 1936} {"train_loss": -40.26729965209961, "global_step": 234351, "epoch": 1936} {"train_loss": -41.05323028564453, "global_step": 234352, "epoch": 1936} {"train_loss": -42.13595199584961, "global_step": 234353, "epoch": 1936} {"train_loss": -40.278900146484375, "global_step": 234354, "epoch": 1936} {"train_loss": -41.83774185180664, "global_step": 234355, "epoch": 1936} {"train_loss": -41.177345275878906, "global_step": 234356, "epoch": 1936} {"train_loss": -41.257320404052734, "global_step": 234357, "epoch": 1936} {"train_loss": -41.71653366088867, "global_step": 234358, "epoch": 1936} {"train_loss": -41.425010681152344, "global_step": 234359, "epoch": 1936} {"train_loss": -41.145137786865234, "global_step": 234360, "epoch": 1936} {"train_loss": -42.440067291259766, "global_step": 234361, "epoch": 1936} {"train_loss": -41.672542572021484, "global_step": 234362, "epoch": 1936} {"train_loss": -41.33652114868164, "global_step": 234363, "epoch": 1936} {"train_loss": -41.793251037597656, "global_step": 234364, "epoch": 1936} {"train_loss": -42.22467803955078, "global_step": 234365, "epoch": 1936} {"train_loss": -42.06623077392578, "global_step": 234366, "epoch": 1936} {"train_loss": -42.03196716308594, "global_step": 234367, "epoch": 1936} {"train_loss": -41.69014358520508, "global_step": 234368, "epoch": 1936} {"train_loss": -42.488365173339844, "global_step": 234369, "epoch": 1936} {"train_loss": -42.12470626831055, "global_step": 234370, "epoch": 1936} {"train_loss": -41.852664947509766, "global_step": 234371, "epoch": 1936} {"train_loss": -41.86693572998047, "global_step": 234372, "epoch": 1936} {"train_loss": -42.84334945678711, "global_step": 234373, "epoch": 1936} {"train_loss": -42.71913528442383, "global_step": 234374, "epoch": 1936} {"train_loss": -42.313621520996094, "global_step": 234375, "epoch": 1936} {"train_loss": -41.66149527179308, "global_step": 234376, "epoch": 1936, "val_loss": 2715170.25} {"train_loss": -43.179378509521484, "global_step": 234377, "epoch": 1937} {"train_loss": -42.59528732299805, "global_step": 234378, "epoch": 1937} {"train_loss": -42.34988021850586, "global_step": 234379, "epoch": 1937} {"train_loss": -41.77994918823242, "global_step": 234380, "epoch": 1937} {"train_loss": -42.18477249145508, "global_step": 234381, "epoch": 1937} {"train_loss": -41.95846176147461, "global_step": 234382, "epoch": 1937} {"train_loss": -42.44036865234375, "global_step": 234383, "epoch": 1937} {"train_loss": -42.486412048339844, "global_step": 234384, "epoch": 1937} {"train_loss": -42.49283981323242, "global_step": 234385, "epoch": 1937} {"train_loss": -42.14619064331055, "global_step": 234386, "epoch": 1937} {"train_loss": -40.002349853515625, "global_step": 234387, "epoch": 1937} {"train_loss": -41.86719512939453, "global_step": 234388, "epoch": 1937} {"train_loss": -41.567665100097656, "global_step": 234389, "epoch": 1937} {"train_loss": -41.258174896240234, "global_step": 234390, "epoch": 1937} {"train_loss": -39.82087326049805, "global_step": 234391, "epoch": 1937} {"train_loss": -39.63789367675781, "global_step": 234392, "epoch": 1937} {"train_loss": -37.68160629272461, "global_step": 234393, "epoch": 1937} {"train_loss": -42.17680740356445, "global_step": 234394, "epoch": 1937} {"train_loss": -40.18622589111328, "global_step": 234395, "epoch": 1937} {"train_loss": -39.29187774658203, "global_step": 234396, "epoch": 1937} {"train_loss": -37.614315032958984, "global_step": 234397, "epoch": 1937} {"train_loss": -37.338951110839844, "global_step": 234398, "epoch": 1937} {"train_loss": -39.11982345581055, "global_step": 234399, "epoch": 1937} {"train_loss": -41.45939254760742, "global_step": 234400, "epoch": 1937} {"train_loss": -35.765193939208984, "global_step": 234401, "epoch": 1937} {"train_loss": -38.67502975463867, "global_step": 234402, "epoch": 1937} {"train_loss": -39.30312728881836, "global_step": 234403, "epoch": 1937} {"train_loss": -41.00275421142578, "global_step": 234404, "epoch": 1937} {"train_loss": -38.07206344604492, "global_step": 234405, "epoch": 1937} {"train_loss": -34.55232620239258, "global_step": 234406, "epoch": 1937} {"train_loss": -38.40314483642578, "global_step": 234407, "epoch": 1937} {"train_loss": -40.75782012939453, "global_step": 234408, "epoch": 1937} {"train_loss": -37.95866775512695, "global_step": 234409, "epoch": 1937} {"train_loss": -39.07611083984375, "global_step": 234410, "epoch": 1937} {"train_loss": -37.87571334838867, "global_step": 234411, "epoch": 1937} {"train_loss": -35.67356872558594, "global_step": 234412, "epoch": 1937} {"train_loss": -37.88126754760742, "global_step": 234413, "epoch": 1937} {"train_loss": -40.387046813964844, "global_step": 234414, "epoch": 1937} {"train_loss": -39.184383392333984, "global_step": 234415, "epoch": 1937} {"train_loss": -40.77049255371094, "global_step": 234416, "epoch": 1937} {"train_loss": -40.7965202331543, "global_step": 234417, "epoch": 1937} {"train_loss": -39.765811920166016, "global_step": 234418, "epoch": 1937} {"train_loss": -40.997676849365234, "global_step": 234419, "epoch": 1937} {"train_loss": -40.103755950927734, "global_step": 234420, "epoch": 1937} {"train_loss": -40.765193939208984, "global_step": 234421, "epoch": 1937} {"train_loss": -40.465728759765625, "global_step": 234422, "epoch": 1937} {"train_loss": -41.70343017578125, "global_step": 234423, "epoch": 1937} {"train_loss": -41.04994201660156, "global_step": 234424, "epoch": 1937} {"train_loss": -41.799827575683594, "global_step": 234425, "epoch": 1937} {"train_loss": -40.02793502807617, "global_step": 234426, "epoch": 1937} {"train_loss": -39.29193878173828, "global_step": 234427, "epoch": 1937} {"train_loss": -39.93311309814453, "global_step": 234428, "epoch": 1937} {"train_loss": -41.1124267578125, "global_step": 234429, "epoch": 1937} {"train_loss": -41.412391662597656, "global_step": 234430, "epoch": 1937} {"train_loss": -39.2633171081543, "global_step": 234431, "epoch": 1937} {"train_loss": -41.0175895690918, "global_step": 234432, "epoch": 1937} {"train_loss": -41.5058479309082, "global_step": 234433, "epoch": 1937} {"train_loss": -41.74431610107422, "global_step": 234434, "epoch": 1937} {"train_loss": -41.18939971923828, "global_step": 234435, "epoch": 1937} {"train_loss": -41.64605712890625, "global_step": 234436, "epoch": 1937} {"train_loss": -41.84357833862305, "global_step": 234437, "epoch": 1937} {"train_loss": -41.258460998535156, "global_step": 234438, "epoch": 1937} {"train_loss": -41.576942443847656, "global_step": 234439, "epoch": 1937} {"train_loss": -41.772037506103516, "global_step": 234440, "epoch": 1937} {"train_loss": -41.60715866088867, "global_step": 234441, "epoch": 1937} {"train_loss": -40.71709442138672, "global_step": 234442, "epoch": 1937} {"train_loss": -41.88604736328125, "global_step": 234443, "epoch": 1937} {"train_loss": -41.65365219116211, "global_step": 234444, "epoch": 1937} {"train_loss": -41.29584503173828, "global_step": 234445, "epoch": 1937} {"train_loss": -40.83740234375, "global_step": 234446, "epoch": 1937} {"train_loss": -42.156707763671875, "global_step": 234447, "epoch": 1937} {"train_loss": -41.55518341064453, "global_step": 234448, "epoch": 1937} {"train_loss": -42.17343521118164, "global_step": 234449, "epoch": 1937} {"train_loss": -42.500362396240234, "global_step": 234450, "epoch": 1937} {"train_loss": -42.27153778076172, "global_step": 234451, "epoch": 1937} {"train_loss": -41.68416213989258, "global_step": 234452, "epoch": 1937} {"train_loss": -42.18333053588867, "global_step": 234453, "epoch": 1937} {"train_loss": -41.89247131347656, "global_step": 234454, "epoch": 1937} {"train_loss": -33.54197311401367, "global_step": 234455, "epoch": 1937} {"train_loss": -42.11758041381836, "global_step": 234456, "epoch": 1937} {"train_loss": -42.55423355102539, "global_step": 234457, "epoch": 1937} {"train_loss": -41.934059143066406, "global_step": 234458, "epoch": 1937} {"train_loss": -36.073638916015625, "global_step": 234459, "epoch": 1937} {"train_loss": -42.74573516845703, "global_step": 234460, "epoch": 1937} {"train_loss": -42.29365158081055, "global_step": 234461, "epoch": 1937} {"train_loss": -42.37606430053711, "global_step": 234462, "epoch": 1937} {"train_loss": -40.8170166015625, "global_step": 234463, "epoch": 1937} {"train_loss": -42.55424118041992, "global_step": 234464, "epoch": 1937} {"train_loss": -41.16155242919922, "global_step": 234465, "epoch": 1937} {"train_loss": -41.58845138549805, "global_step": 234466, "epoch": 1937} {"train_loss": -40.179561614990234, "global_step": 234467, "epoch": 1937} {"train_loss": -40.45713424682617, "global_step": 234468, "epoch": 1937} {"train_loss": -42.23974609375, "global_step": 234469, "epoch": 1937} {"train_loss": -42.634952545166016, "global_step": 234470, "epoch": 1937} {"train_loss": -41.12599563598633, "global_step": 234471, "epoch": 1937} {"train_loss": -42.134742736816406, "global_step": 234472, "epoch": 1937} {"train_loss": -41.132015228271484, "global_step": 234473, "epoch": 1937} {"train_loss": -42.04240798950195, "global_step": 234474, "epoch": 1937} {"train_loss": -42.54160690307617, "global_step": 234475, "epoch": 1937} {"train_loss": -41.7413330078125, "global_step": 234476, "epoch": 1937} {"train_loss": -42.327877044677734, "global_step": 234477, "epoch": 1937} {"train_loss": -42.4598503112793, "global_step": 234478, "epoch": 1937} {"train_loss": -42.372108459472656, "global_step": 234479, "epoch": 1937} {"train_loss": -42.5003776550293, "global_step": 234480, "epoch": 1937} {"train_loss": -42.40143585205078, "global_step": 234481, "epoch": 1937} {"train_loss": -42.33207702636719, "global_step": 234482, "epoch": 1937} {"train_loss": -42.41771697998047, "global_step": 234483, "epoch": 1937} {"train_loss": -41.991268157958984, "global_step": 234484, "epoch": 1937} {"train_loss": -41.62507629394531, "global_step": 234485, "epoch": 1937} {"train_loss": -42.688167572021484, "global_step": 234486, "epoch": 1937} {"train_loss": -43.190799713134766, "global_step": 234487, "epoch": 1937} {"train_loss": -42.19804000854492, "global_step": 234488, "epoch": 1937} {"train_loss": -43.04544448852539, "global_step": 234489, "epoch": 1937} {"train_loss": -42.56953811645508, "global_step": 234490, "epoch": 1937} {"train_loss": -42.8619499206543, "global_step": 234491, "epoch": 1937} {"train_loss": -41.953426361083984, "global_step": 234492, "epoch": 1937} {"train_loss": -42.452667236328125, "global_step": 234493, "epoch": 1937} {"train_loss": -42.63863754272461, "global_step": 234494, "epoch": 1937} {"train_loss": -41.58066940307617, "global_step": 234495, "epoch": 1937} {"train_loss": -42.36525344848633, "global_step": 234496, "epoch": 1937} {"train_loss": -41.00223326880084, "global_step": 234497, "epoch": 1937, "val_loss": 2666250.25} {"train_loss": -42.75761795043945, "global_step": 234498, "epoch": 1938} {"train_loss": -42.82001495361328, "global_step": 234499, "epoch": 1938} {"train_loss": -42.98454666137695, "global_step": 234500, "epoch": 1938} {"train_loss": -41.92179489135742, "global_step": 234501, "epoch": 1938} {"train_loss": -42.55855178833008, "global_step": 234502, "epoch": 1938} {"train_loss": -42.63243865966797, "global_step": 234503, "epoch": 1938} {"train_loss": -42.28440475463867, "global_step": 234504, "epoch": 1938} {"train_loss": -42.33570861816406, "global_step": 234505, "epoch": 1938} {"train_loss": -42.611793518066406, "global_step": 234506, "epoch": 1938} {"train_loss": -42.37111282348633, "global_step": 234507, "epoch": 1938} {"train_loss": -42.44049072265625, "global_step": 234508, "epoch": 1938} {"train_loss": -42.89569091796875, "global_step": 234509, "epoch": 1938} {"train_loss": -43.041385650634766, "global_step": 234510, "epoch": 1938} {"train_loss": -42.18955612182617, "global_step": 234511, "epoch": 1938} {"train_loss": -42.739837646484375, "global_step": 234512, "epoch": 1938} {"train_loss": -42.39927291870117, "global_step": 234513, "epoch": 1938} {"train_loss": -41.82997512817383, "global_step": 234514, "epoch": 1938} {"train_loss": -43.02366256713867, "global_step": 234515, "epoch": 1938} {"train_loss": -43.45265197753906, "global_step": 234516, "epoch": 1938} {"train_loss": -43.1709098815918, "global_step": 234517, "epoch": 1938} {"train_loss": -42.893226623535156, "global_step": 234518, "epoch": 1938} {"train_loss": -42.95099639892578, "global_step": 234519, "epoch": 1938} {"train_loss": -42.01218032836914, "global_step": 234520, "epoch": 1938} {"train_loss": -41.099666595458984, "global_step": 234521, "epoch": 1938} {"train_loss": -41.7956428527832, "global_step": 234522, "epoch": 1938} {"train_loss": -42.6972541809082, "global_step": 234523, "epoch": 1938} {"train_loss": -42.35194778442383, "global_step": 234524, "epoch": 1938} {"train_loss": -43.035675048828125, "global_step": 234525, "epoch": 1938} {"train_loss": -42.44196701049805, "global_step": 234526, "epoch": 1938} {"train_loss": -42.96376419067383, "global_step": 234527, "epoch": 1938} {"train_loss": -42.2159423828125, "global_step": 234528, "epoch": 1938} {"train_loss": -42.08393478393555, "global_step": 234529, "epoch": 1938} {"train_loss": -42.705379486083984, "global_step": 234530, "epoch": 1938} {"train_loss": -41.8494758605957, "global_step": 234531, "epoch": 1938} {"train_loss": -41.55632400512695, "global_step": 234532, "epoch": 1938} {"train_loss": -42.773311614990234, "global_step": 234533, "epoch": 1938} {"train_loss": -42.385250091552734, "global_step": 234534, "epoch": 1938} {"train_loss": -42.45802688598633, "global_step": 234535, "epoch": 1938} {"train_loss": -43.202396392822266, "global_step": 234536, "epoch": 1938} {"train_loss": -42.2728385925293, "global_step": 234537, "epoch": 1938} {"train_loss": -43.19093704223633, "global_step": 234538, "epoch": 1938} {"train_loss": -42.65926742553711, "global_step": 234539, "epoch": 1938} {"train_loss": -42.36444091796875, "global_step": 234540, "epoch": 1938} {"train_loss": -43.2917594909668, "global_step": 234541, "epoch": 1938} {"train_loss": -42.52748489379883, "global_step": 234542, "epoch": 1938} {"train_loss": -42.81514358520508, "global_step": 234543, "epoch": 1938} {"train_loss": -42.173194885253906, "global_step": 234544, "epoch": 1938} {"train_loss": -42.849300384521484, "global_step": 234545, "epoch": 1938} {"train_loss": -42.75345993041992, "global_step": 234546, "epoch": 1938} {"train_loss": -42.978023529052734, "global_step": 234547, "epoch": 1938} {"train_loss": -41.86796951293945, "global_step": 234548, "epoch": 1938} {"train_loss": -41.8648796081543, "global_step": 234549, "epoch": 1938} {"train_loss": -41.690860748291016, "global_step": 234550, "epoch": 1938} {"train_loss": -42.163997650146484, "global_step": 234551, "epoch": 1938} {"train_loss": -42.06360626220703, "global_step": 234552, "epoch": 1938} {"train_loss": -42.738765716552734, "global_step": 234553, "epoch": 1938} {"train_loss": -42.49956512451172, "global_step": 234554, "epoch": 1938} {"train_loss": -41.284183502197266, "global_step": 234555, "epoch": 1938} {"train_loss": -40.9640998840332, "global_step": 234556, "epoch": 1938} {"train_loss": -41.06772994995117, "global_step": 234557, "epoch": 1938} {"train_loss": -40.07432556152344, "global_step": 234558, "epoch": 1938} {"train_loss": -42.3299446105957, "global_step": 234559, "epoch": 1938} {"train_loss": -42.254215240478516, "global_step": 234560, "epoch": 1938} {"train_loss": -42.63407516479492, "global_step": 234561, "epoch": 1938} {"train_loss": -42.74810791015625, "global_step": 234562, "epoch": 1938} {"train_loss": -41.38051986694336, "global_step": 234563, "epoch": 1938} {"train_loss": -41.09005355834961, "global_step": 234564, "epoch": 1938} {"train_loss": -42.0474967956543, "global_step": 234565, "epoch": 1938} {"train_loss": -42.19208526611328, "global_step": 234566, "epoch": 1938} {"train_loss": -40.97060012817383, "global_step": 234567, "epoch": 1938} {"train_loss": -42.67076873779297, "global_step": 234568, "epoch": 1938} {"train_loss": -41.91455078125, "global_step": 234569, "epoch": 1938} {"train_loss": -38.82793045043945, "global_step": 234570, "epoch": 1938} {"train_loss": -41.640174865722656, "global_step": 234571, "epoch": 1938} {"train_loss": -41.785240173339844, "global_step": 234572, "epoch": 1938} {"train_loss": -41.9206657409668, "global_step": 234573, "epoch": 1938} {"train_loss": -40.88362503051758, "global_step": 234574, "epoch": 1938} {"train_loss": -38.93435287475586, "global_step": 234575, "epoch": 1938} {"train_loss": -40.69797897338867, "global_step": 234576, "epoch": 1938} {"train_loss": -42.3515739440918, "global_step": 234577, "epoch": 1938} {"train_loss": -40.7615966796875, "global_step": 234578, "epoch": 1938} {"train_loss": -40.65742492675781, "global_step": 234579, "epoch": 1938} {"train_loss": -40.96767807006836, "global_step": 234580, "epoch": 1938} {"train_loss": -42.45476150512695, "global_step": 234581, "epoch": 1938} {"train_loss": -41.74416732788086, "global_step": 234582, "epoch": 1938} {"train_loss": -40.45985794067383, "global_step": 234583, "epoch": 1938} {"train_loss": -41.741817474365234, "global_step": 234584, "epoch": 1938} {"train_loss": -41.733924865722656, "global_step": 234585, "epoch": 1938} {"train_loss": -39.909393310546875, "global_step": 234586, "epoch": 1938} {"train_loss": -40.01388931274414, "global_step": 234587, "epoch": 1938} {"train_loss": -42.37717819213867, "global_step": 234588, "epoch": 1938} {"train_loss": -40.843788146972656, "global_step": 234589, "epoch": 1938} {"train_loss": -39.99576950073242, "global_step": 234590, "epoch": 1938} {"train_loss": -41.771575927734375, "global_step": 234591, "epoch": 1938} {"train_loss": -41.25640106201172, "global_step": 234592, "epoch": 1938} {"train_loss": -41.06989669799805, "global_step": 234593, "epoch": 1938} {"train_loss": -42.61281204223633, "global_step": 234594, "epoch": 1938} {"train_loss": -37.623165130615234, "global_step": 234595, "epoch": 1938} {"train_loss": -42.55125045776367, "global_step": 234596, "epoch": 1938} {"train_loss": -38.47298812866211, "global_step": 234597, "epoch": 1938} {"train_loss": -40.00470733642578, "global_step": 234598, "epoch": 1938} {"train_loss": -41.31535720825195, "global_step": 234599, "epoch": 1938} {"train_loss": -37.28630828857422, "global_step": 234600, "epoch": 1938} {"train_loss": -40.176551818847656, "global_step": 234601, "epoch": 1938} {"train_loss": -36.474666595458984, "global_step": 234602, "epoch": 1938} {"train_loss": -42.053409576416016, "global_step": 234603, "epoch": 1938} {"train_loss": -37.919883728027344, "global_step": 234604, "epoch": 1938} {"train_loss": -40.68504333496094, "global_step": 234605, "epoch": 1938} {"train_loss": -40.482295989990234, "global_step": 234606, "epoch": 1938} {"train_loss": -39.10980224609375, "global_step": 234607, "epoch": 1938} {"train_loss": -42.23482894897461, "global_step": 234608, "epoch": 1938} {"train_loss": -40.023590087890625, "global_step": 234609, "epoch": 1938} {"train_loss": -40.84697341918945, "global_step": 234610, "epoch": 1938} {"train_loss": -41.829158782958984, "global_step": 234611, "epoch": 1938} {"train_loss": -40.82884979248047, "global_step": 234612, "epoch": 1938} {"train_loss": -41.177249908447266, "global_step": 234613, "epoch": 1938} {"train_loss": -42.28205490112305, "global_step": 234614, "epoch": 1938} {"train_loss": -41.69404220581055, "global_step": 234615, "epoch": 1938} {"train_loss": -41.87334060668945, "global_step": 234616, "epoch": 1938} {"train_loss": -41.98798370361328, "global_step": 234617, "epoch": 1938} {"train_loss": -41.71342654267618, "global_step": 234618, "epoch": 1938, "val_loss": 2641014.5} {"train_loss": -42.01837158203125, "global_step": 234619, "epoch": 1939} {"train_loss": -41.98759078979492, "global_step": 234620, "epoch": 1939} {"train_loss": -42.40262985229492, "global_step": 234621, "epoch": 1939} {"train_loss": -42.092071533203125, "global_step": 234622, "epoch": 1939} {"train_loss": -42.40044021606445, "global_step": 234623, "epoch": 1939} {"train_loss": -42.396507263183594, "global_step": 234624, "epoch": 1939} {"train_loss": -42.22372055053711, "global_step": 234625, "epoch": 1939} {"train_loss": -42.241485595703125, "global_step": 234626, "epoch": 1939} {"train_loss": -42.078853607177734, "global_step": 234627, "epoch": 1939} {"train_loss": -42.50349044799805, "global_step": 234628, "epoch": 1939} {"train_loss": -43.003013610839844, "global_step": 234629, "epoch": 1939} {"train_loss": -42.580562591552734, "global_step": 234630, "epoch": 1939} {"train_loss": -41.83146667480469, "global_step": 234631, "epoch": 1939} {"train_loss": -42.38058090209961, "global_step": 234632, "epoch": 1939} {"train_loss": -42.88731002807617, "global_step": 234633, "epoch": 1939} {"train_loss": -41.58236312866211, "global_step": 234634, "epoch": 1939} {"train_loss": -42.97488784790039, "global_step": 234635, "epoch": 1939} {"train_loss": -42.06121826171875, "global_step": 234636, "epoch": 1939} {"train_loss": -42.94188690185547, "global_step": 234637, "epoch": 1939} {"train_loss": -42.18679428100586, "global_step": 234638, "epoch": 1939} {"train_loss": -41.99592590332031, "global_step": 234639, "epoch": 1939} {"train_loss": -42.391448974609375, "global_step": 234640, "epoch": 1939} {"train_loss": -42.35429382324219, "global_step": 234641, "epoch": 1939} {"train_loss": -42.464202880859375, "global_step": 234642, "epoch": 1939} {"train_loss": -40.88203048706055, "global_step": 234643, "epoch": 1939} {"train_loss": -41.682491302490234, "global_step": 234644, "epoch": 1939} {"train_loss": -41.75666809082031, "global_step": 234645, "epoch": 1939} {"train_loss": -42.29923629760742, "global_step": 234646, "epoch": 1939} {"train_loss": -40.929622650146484, "global_step": 234647, "epoch": 1939} {"train_loss": -42.721431732177734, "global_step": 234648, "epoch": 1939} {"train_loss": -41.027748107910156, "global_step": 234649, "epoch": 1939} {"train_loss": -40.38288497924805, "global_step": 234650, "epoch": 1939} {"train_loss": -41.10270309448242, "global_step": 234651, "epoch": 1939} {"train_loss": -42.49799346923828, "global_step": 234652, "epoch": 1939} {"train_loss": -41.861846923828125, "global_step": 234653, "epoch": 1939} {"train_loss": -41.06937789916992, "global_step": 234654, "epoch": 1939} {"train_loss": -42.76894760131836, "global_step": 234655, "epoch": 1939} {"train_loss": -42.03263473510742, "global_step": 234656, "epoch": 1939} {"train_loss": -42.43885040283203, "global_step": 234657, "epoch": 1939} {"train_loss": -42.71210861206055, "global_step": 234658, "epoch": 1939} {"train_loss": -42.663997650146484, "global_step": 234659, "epoch": 1939} {"train_loss": -42.35374450683594, "global_step": 234660, "epoch": 1939} {"train_loss": -42.75019454956055, "global_step": 234661, "epoch": 1939} {"train_loss": -42.38652420043945, "global_step": 234662, "epoch": 1939} {"train_loss": -42.27170944213867, "global_step": 234663, "epoch": 1939} {"train_loss": -43.472110748291016, "global_step": 234664, "epoch": 1939} {"train_loss": -42.26765060424805, "global_step": 234665, "epoch": 1939} {"train_loss": -42.5599479675293, "global_step": 234666, "epoch": 1939} {"train_loss": -42.68257141113281, "global_step": 234667, "epoch": 1939} {"train_loss": -42.87362289428711, "global_step": 234668, "epoch": 1939} {"train_loss": -42.78345489501953, "global_step": 234669, "epoch": 1939} {"train_loss": -42.964290618896484, "global_step": 234670, "epoch": 1939} {"train_loss": -43.71169662475586, "global_step": 234671, "epoch": 1939} {"train_loss": -41.37910079956055, "global_step": 234672, "epoch": 1939} {"train_loss": -42.665184020996094, "global_step": 234673, "epoch": 1939} {"train_loss": -42.1126823425293, "global_step": 234674, "epoch": 1939} {"train_loss": -42.889488220214844, "global_step": 234675, "epoch": 1939} {"train_loss": -42.67352294921875, "global_step": 234676, "epoch": 1939} {"train_loss": -42.59828567504883, "global_step": 234677, "epoch": 1939} {"train_loss": -43.500640869140625, "global_step": 234678, "epoch": 1939} {"train_loss": -42.691070556640625, "global_step": 234679, "epoch": 1939} {"train_loss": -42.67881393432617, "global_step": 234680, "epoch": 1939} {"train_loss": -43.217926025390625, "global_step": 234681, "epoch": 1939} {"train_loss": -41.96051025390625, "global_step": 234682, "epoch": 1939} {"train_loss": -42.243343353271484, "global_step": 234683, "epoch": 1939} {"train_loss": -42.627891540527344, "global_step": 234684, "epoch": 1939} {"train_loss": -41.45716094970703, "global_step": 234685, "epoch": 1939} {"train_loss": -41.90924072265625, "global_step": 234686, "epoch": 1939} {"train_loss": -42.514957427978516, "global_step": 234687, "epoch": 1939} {"train_loss": -42.57265853881836, "global_step": 234688, "epoch": 1939} {"train_loss": -39.4726676940918, "global_step": 234689, "epoch": 1939} {"train_loss": -41.369300842285156, "global_step": 234690, "epoch": 1939} {"train_loss": -43.351783752441406, "global_step": 234691, "epoch": 1939} {"train_loss": -42.27889633178711, "global_step": 234692, "epoch": 1939} {"train_loss": -42.5013313293457, "global_step": 234693, "epoch": 1939} {"train_loss": -43.4931755065918, "global_step": 234694, "epoch": 1939} {"train_loss": -43.184051513671875, "global_step": 234695, "epoch": 1939} {"train_loss": -41.75948715209961, "global_step": 234696, "epoch": 1939} {"train_loss": -42.26717758178711, "global_step": 234697, "epoch": 1939} {"train_loss": -42.718597412109375, "global_step": 234698, "epoch": 1939} {"train_loss": -42.63665771484375, "global_step": 234699, "epoch": 1939} {"train_loss": -42.38763427734375, "global_step": 234700, "epoch": 1939} {"train_loss": -40.811073303222656, "global_step": 234701, "epoch": 1939} {"train_loss": -41.1279411315918, "global_step": 234702, "epoch": 1939} {"train_loss": -42.7952995300293, "global_step": 234703, "epoch": 1939} {"train_loss": -41.824798583984375, "global_step": 234704, "epoch": 1939} {"train_loss": -41.903133392333984, "global_step": 234705, "epoch": 1939} {"train_loss": -41.76932144165039, "global_step": 234706, "epoch": 1939} {"train_loss": -41.66962814331055, "global_step": 234707, "epoch": 1939} {"train_loss": -42.278594970703125, "global_step": 234708, "epoch": 1939} {"train_loss": -41.990665435791016, "global_step": 234709, "epoch": 1939} {"train_loss": -41.8028678894043, "global_step": 234710, "epoch": 1939} {"train_loss": -41.7077522277832, "global_step": 234711, "epoch": 1939} {"train_loss": -41.43561935424805, "global_step": 234712, "epoch": 1939} {"train_loss": -42.53342819213867, "global_step": 234713, "epoch": 1939} {"train_loss": -42.31008529663086, "global_step": 234714, "epoch": 1939} {"train_loss": -42.05491256713867, "global_step": 234715, "epoch": 1939} {"train_loss": -42.12790298461914, "global_step": 234716, "epoch": 1939} {"train_loss": -43.00858688354492, "global_step": 234717, "epoch": 1939} {"train_loss": -41.91266632080078, "global_step": 234718, "epoch": 1939} {"train_loss": -42.16645431518555, "global_step": 234719, "epoch": 1939} {"train_loss": -42.449066162109375, "global_step": 234720, "epoch": 1939} {"train_loss": -41.990596771240234, "global_step": 234721, "epoch": 1939} {"train_loss": -42.677223205566406, "global_step": 234722, "epoch": 1939} {"train_loss": -42.05217361450195, "global_step": 234723, "epoch": 1939} {"train_loss": -40.30012130737305, "global_step": 234724, "epoch": 1939} {"train_loss": -42.30297088623047, "global_step": 234725, "epoch": 1939} {"train_loss": -42.3195686340332, "global_step": 234726, "epoch": 1939} {"train_loss": -41.05841064453125, "global_step": 234727, "epoch": 1939} {"train_loss": -41.96140670776367, "global_step": 234728, "epoch": 1939} {"train_loss": -42.8261833190918, "global_step": 234729, "epoch": 1939} {"train_loss": -42.464317321777344, "global_step": 234730, "epoch": 1939} {"train_loss": -42.26650619506836, "global_step": 234731, "epoch": 1939} {"train_loss": -41.2224235534668, "global_step": 234732, "epoch": 1939} {"train_loss": -42.886837005615234, "global_step": 234733, "epoch": 1939} {"train_loss": -42.392601013183594, "global_step": 234734, "epoch": 1939} {"train_loss": -42.554439544677734, "global_step": 234735, "epoch": 1939} {"train_loss": -42.8579216003418, "global_step": 234736, "epoch": 1939} {"train_loss": -42.671875, "global_step": 234737, "epoch": 1939} {"train_loss": -41.4806022644043, "global_step": 234738, "epoch": 1939} {"train_loss": -42.23352564661956, "global_step": 234739, "epoch": 1939, "val_loss": 2691984.0} {"train_loss": -43.10969924926758, "global_step": 234740, "epoch": 1940} {"train_loss": -42.73392105102539, "global_step": 234741, "epoch": 1940} {"train_loss": -43.081356048583984, "global_step": 234742, "epoch": 1940} {"train_loss": -42.94691848754883, "global_step": 234743, "epoch": 1940} {"train_loss": -43.4380989074707, "global_step": 234744, "epoch": 1940} {"train_loss": -42.89762496948242, "global_step": 234745, "epoch": 1940} {"train_loss": -43.062923431396484, "global_step": 234746, "epoch": 1940} {"train_loss": -42.633094787597656, "global_step": 234747, "epoch": 1940} {"train_loss": -43.04476547241211, "global_step": 234748, "epoch": 1940} {"train_loss": -43.3161735534668, "global_step": 234749, "epoch": 1940} {"train_loss": -43.04302215576172, "global_step": 234750, "epoch": 1940} {"train_loss": -42.93410110473633, "global_step": 234751, "epoch": 1940} {"train_loss": -42.53404235839844, "global_step": 234752, "epoch": 1940} {"train_loss": -43.25667190551758, "global_step": 234753, "epoch": 1940} {"train_loss": -42.575111389160156, "global_step": 234754, "epoch": 1940} {"train_loss": -43.10911178588867, "global_step": 234755, "epoch": 1940} {"train_loss": -42.43693923950195, "global_step": 234756, "epoch": 1940} {"train_loss": -41.663818359375, "global_step": 234757, "epoch": 1940} {"train_loss": -42.529945373535156, "global_step": 234758, "epoch": 1940} {"train_loss": -41.698848724365234, "global_step": 234759, "epoch": 1940} {"train_loss": -41.07734680175781, "global_step": 234760, "epoch": 1940} {"train_loss": -42.24772262573242, "global_step": 234761, "epoch": 1940} {"train_loss": -42.78825759887695, "global_step": 234762, "epoch": 1940} {"train_loss": -41.84112548828125, "global_step": 234763, "epoch": 1940} {"train_loss": -42.6151237487793, "global_step": 234764, "epoch": 1940} {"train_loss": -41.3160400390625, "global_step": 234765, "epoch": 1940} {"train_loss": -41.965118408203125, "global_step": 234766, "epoch": 1940} {"train_loss": -41.07558059692383, "global_step": 234767, "epoch": 1940} {"train_loss": -41.695003509521484, "global_step": 234768, "epoch": 1940} {"train_loss": -41.19060134887695, "global_step": 234769, "epoch": 1940} {"train_loss": -39.626502990722656, "global_step": 234770, "epoch": 1940} {"train_loss": -39.613922119140625, "global_step": 234771, "epoch": 1940} {"train_loss": -38.894630432128906, "global_step": 234772, "epoch": 1940} {"train_loss": -36.8999137878418, "global_step": 234773, "epoch": 1940} {"train_loss": -40.12411117553711, "global_step": 234774, "epoch": 1940} {"train_loss": -36.91980743408203, "global_step": 234775, "epoch": 1940} {"train_loss": -39.30482864379883, "global_step": 234776, "epoch": 1940} {"train_loss": -40.42045211791992, "global_step": 234777, "epoch": 1940} {"train_loss": -40.96947479248047, "global_step": 234778, "epoch": 1940} {"train_loss": -39.790611267089844, "global_step": 234779, "epoch": 1940} {"train_loss": -42.00689697265625, "global_step": 234780, "epoch": 1940} {"train_loss": -39.373329162597656, "global_step": 234781, "epoch": 1940} {"train_loss": -42.6969108581543, "global_step": 234782, "epoch": 1940} {"train_loss": -39.752071380615234, "global_step": 234783, "epoch": 1940} {"train_loss": -39.07711410522461, "global_step": 234784, "epoch": 1940} {"train_loss": -41.33176040649414, "global_step": 234785, "epoch": 1940} {"train_loss": -40.780731201171875, "global_step": 234786, "epoch": 1940} {"train_loss": -37.817745208740234, "global_step": 234787, "epoch": 1940} {"train_loss": -41.83414840698242, "global_step": 234788, "epoch": 1940} {"train_loss": -38.60475158691406, "global_step": 234789, "epoch": 1940} {"train_loss": -40.431884765625, "global_step": 234790, "epoch": 1940} {"train_loss": -40.49116134643555, "global_step": 234791, "epoch": 1940} {"train_loss": -40.455318450927734, "global_step": 234792, "epoch": 1940} {"train_loss": -40.20466613769531, "global_step": 234793, "epoch": 1940} {"train_loss": -40.20772933959961, "global_step": 234794, "epoch": 1940} {"train_loss": -40.86861801147461, "global_step": 234795, "epoch": 1940} {"train_loss": -40.3604736328125, "global_step": 234796, "epoch": 1940} {"train_loss": -41.748329162597656, "global_step": 234797, "epoch": 1940} {"train_loss": -40.56681442260742, "global_step": 234798, "epoch": 1940} {"train_loss": -41.47322463989258, "global_step": 234799, "epoch": 1940} {"train_loss": -40.94488525390625, "global_step": 234800, "epoch": 1940} {"train_loss": -41.22444152832031, "global_step": 234801, "epoch": 1940} {"train_loss": -41.18148422241211, "global_step": 234802, "epoch": 1940} {"train_loss": -42.23488235473633, "global_step": 234803, "epoch": 1940} {"train_loss": -41.29212188720703, "global_step": 234804, "epoch": 1940} {"train_loss": -41.52814483642578, "global_step": 234805, "epoch": 1940} {"train_loss": -41.509857177734375, "global_step": 234806, "epoch": 1940} {"train_loss": -42.051578521728516, "global_step": 234807, "epoch": 1940} {"train_loss": -41.96623611450195, "global_step": 234808, "epoch": 1940} {"train_loss": -41.91189956665039, "global_step": 234809, "epoch": 1940} {"train_loss": -41.50612258911133, "global_step": 234810, "epoch": 1940} {"train_loss": -42.06565475463867, "global_step": 234811, "epoch": 1940} {"train_loss": -41.694393157958984, "global_step": 234812, "epoch": 1940} {"train_loss": -43.078041076660156, "global_step": 234813, "epoch": 1940} {"train_loss": -41.721248626708984, "global_step": 234814, "epoch": 1940} {"train_loss": -42.77598571777344, "global_step": 234815, "epoch": 1940} {"train_loss": -42.165283203125, "global_step": 234816, "epoch": 1940} {"train_loss": -42.19560623168945, "global_step": 234817, "epoch": 1940} {"train_loss": -43.04026412963867, "global_step": 234818, "epoch": 1940} {"train_loss": -42.4835319519043, "global_step": 234819, "epoch": 1940} {"train_loss": -42.65230941772461, "global_step": 234820, "epoch": 1940} {"train_loss": -42.68025588989258, "global_step": 234821, "epoch": 1940} {"train_loss": -42.22703552246094, "global_step": 234822, "epoch": 1940} {"train_loss": -42.66420364379883, "global_step": 234823, "epoch": 1940} {"train_loss": -42.211524963378906, "global_step": 234824, "epoch": 1940} {"train_loss": -41.44962692260742, "global_step": 234825, "epoch": 1940} {"train_loss": -42.81245422363281, "global_step": 234826, "epoch": 1940} {"train_loss": -42.67824935913086, "global_step": 234827, "epoch": 1940} {"train_loss": -42.243892669677734, "global_step": 234828, "epoch": 1940} {"train_loss": -42.614803314208984, "global_step": 234829, "epoch": 1940} {"train_loss": -43.329505920410156, "global_step": 234830, "epoch": 1940} {"train_loss": -42.7952766418457, "global_step": 234831, "epoch": 1940} {"train_loss": -42.84762954711914, "global_step": 234832, "epoch": 1940} {"train_loss": -42.4361686706543, "global_step": 234833, "epoch": 1940} {"train_loss": -42.8689079284668, "global_step": 234834, "epoch": 1940} {"train_loss": -42.11882400512695, "global_step": 234835, "epoch": 1940} {"train_loss": -43.076576232910156, "global_step": 234836, "epoch": 1940} {"train_loss": -42.462093353271484, "global_step": 234837, "epoch": 1940} {"train_loss": -42.209835052490234, "global_step": 234838, "epoch": 1940} {"train_loss": -41.95634078979492, "global_step": 234839, "epoch": 1940} {"train_loss": -42.622276306152344, "global_step": 234840, "epoch": 1940} {"train_loss": -43.03571319580078, "global_step": 234841, "epoch": 1940} {"train_loss": -42.91550827026367, "global_step": 234842, "epoch": 1940} {"train_loss": -43.157989501953125, "global_step": 234843, "epoch": 1940} {"train_loss": -43.30780792236328, "global_step": 234844, "epoch": 1940} {"train_loss": -42.94842529296875, "global_step": 234845, "epoch": 1940} {"train_loss": -43.090858459472656, "global_step": 234846, "epoch": 1940} {"train_loss": -42.9568977355957, "global_step": 234847, "epoch": 1940} {"train_loss": -42.80665969848633, "global_step": 234848, "epoch": 1940} {"train_loss": -43.35247802734375, "global_step": 234849, "epoch": 1940} {"train_loss": -43.226863861083984, "global_step": 234850, "epoch": 1940} {"train_loss": -43.40119934082031, "global_step": 234851, "epoch": 1940} {"train_loss": -43.05387496948242, "global_step": 234852, "epoch": 1940} {"train_loss": -43.15544509887695, "global_step": 234853, "epoch": 1940} {"train_loss": -43.63471221923828, "global_step": 234854, "epoch": 1940} {"train_loss": -43.399940490722656, "global_step": 234855, "epoch": 1940} {"train_loss": -42.79484176635742, "global_step": 234856, "epoch": 1940} {"train_loss": -43.150638580322266, "global_step": 234857, "epoch": 1940} {"train_loss": -43.68319320678711, "global_step": 234858, "epoch": 1940} {"train_loss": -43.42545700073242, "global_step": 234859, "epoch": 1940} {"train_loss": -41.91718970054437, "global_step": 234860, "epoch": 1940, "val_loss": 2711879.25} {"train_loss": -43.264156341552734, "global_step": 234861, "epoch": 1941} {"train_loss": -43.49311065673828, "global_step": 234862, "epoch": 1941} {"train_loss": -42.87731170654297, "global_step": 234863, "epoch": 1941} {"train_loss": -42.55245590209961, "global_step": 234864, "epoch": 1941} {"train_loss": -42.47827911376953, "global_step": 234865, "epoch": 1941} {"train_loss": -42.67198181152344, "global_step": 234866, "epoch": 1941} {"train_loss": -42.418121337890625, "global_step": 234867, "epoch": 1941} {"train_loss": -41.94307327270508, "global_step": 234868, "epoch": 1941} {"train_loss": -43.02290725708008, "global_step": 234869, "epoch": 1941} {"train_loss": -41.841915130615234, "global_step": 234870, "epoch": 1941} {"train_loss": -39.86420822143555, "global_step": 234871, "epoch": 1941} {"train_loss": -35.0768928527832, "global_step": 234872, "epoch": 1941} {"train_loss": -30.135168075561523, "global_step": 234873, "epoch": 1941} {"train_loss": -37.587249755859375, "global_step": 234874, "epoch": 1941} {"train_loss": -32.541439056396484, "global_step": 234875, "epoch": 1941} {"train_loss": -35.5899543762207, "global_step": 234876, "epoch": 1941} {"train_loss": -27.780242919921875, "global_step": 234877, "epoch": 1941} {"train_loss": -35.8065299987793, "global_step": 234878, "epoch": 1941} {"train_loss": -32.14318084716797, "global_step": 234879, "epoch": 1941} {"train_loss": -34.21182632446289, "global_step": 234880, "epoch": 1941} {"train_loss": -37.692779541015625, "global_step": 234881, "epoch": 1941} {"train_loss": -32.94266891479492, "global_step": 234882, "epoch": 1941} {"train_loss": -32.36553955078125, "global_step": 234883, "epoch": 1941} {"train_loss": -35.69158172607422, "global_step": 234884, "epoch": 1941} {"train_loss": -38.35554122924805, "global_step": 234885, "epoch": 1941} {"train_loss": -34.4493522644043, "global_step": 234886, "epoch": 1941} {"train_loss": -35.86225509643555, "global_step": 234887, "epoch": 1941} {"train_loss": -38.71577072143555, "global_step": 234888, "epoch": 1941} {"train_loss": -38.7425537109375, "global_step": 234889, "epoch": 1941} {"train_loss": -38.935359954833984, "global_step": 234890, "epoch": 1941} {"train_loss": -38.467376708984375, "global_step": 234891, "epoch": 1941} {"train_loss": -40.53041458129883, "global_step": 234892, "epoch": 1941} {"train_loss": -39.00225830078125, "global_step": 234893, "epoch": 1941} {"train_loss": -38.15726852416992, "global_step": 234894, "epoch": 1941} {"train_loss": -40.35974884033203, "global_step": 234895, "epoch": 1941} {"train_loss": -40.6984977722168, "global_step": 234896, "epoch": 1941} {"train_loss": -40.924468994140625, "global_step": 234897, "epoch": 1941} {"train_loss": -40.33360290527344, "global_step": 234898, "epoch": 1941} {"train_loss": -40.52177047729492, "global_step": 234899, "epoch": 1941} {"train_loss": -40.828575134277344, "global_step": 234900, "epoch": 1941} {"train_loss": -40.81854248046875, "global_step": 234901, "epoch": 1941} {"train_loss": -40.4654426574707, "global_step": 234902, "epoch": 1941} {"train_loss": -40.9405403137207, "global_step": 234903, "epoch": 1941} {"train_loss": -41.794551849365234, "global_step": 234904, "epoch": 1941} {"train_loss": -41.39390563964844, "global_step": 234905, "epoch": 1941} {"train_loss": -41.91669845581055, "global_step": 234906, "epoch": 1941} {"train_loss": -40.84646987915039, "global_step": 234907, "epoch": 1941} {"train_loss": -41.478729248046875, "global_step": 234908, "epoch": 1941} {"train_loss": -41.67999267578125, "global_step": 234909, "epoch": 1941} {"train_loss": -41.78031921386719, "global_step": 234910, "epoch": 1941} {"train_loss": -41.81596755981445, "global_step": 234911, "epoch": 1941} {"train_loss": -41.910743713378906, "global_step": 234912, "epoch": 1941} {"train_loss": -41.86570358276367, "global_step": 234913, "epoch": 1941} {"train_loss": -41.41555404663086, "global_step": 234914, "epoch": 1941} {"train_loss": -42.4006233215332, "global_step": 234915, "epoch": 1941} {"train_loss": -41.96058654785156, "global_step": 234916, "epoch": 1941} {"train_loss": -42.07318878173828, "global_step": 234917, "epoch": 1941} {"train_loss": -41.658809661865234, "global_step": 234918, "epoch": 1941} {"train_loss": -41.96583938598633, "global_step": 234919, "epoch": 1941} {"train_loss": -42.27454376220703, "global_step": 234920, "epoch": 1941} {"train_loss": -42.48460006713867, "global_step": 234921, "epoch": 1941} {"train_loss": -42.343421936035156, "global_step": 234922, "epoch": 1941} {"train_loss": -42.40139389038086, "global_step": 234923, "epoch": 1941} {"train_loss": -42.46699142456055, "global_step": 234924, "epoch": 1941} {"train_loss": -41.869720458984375, "global_step": 234925, "epoch": 1941} {"train_loss": -42.8060417175293, "global_step": 234926, "epoch": 1941} {"train_loss": -42.686641693115234, "global_step": 234927, "epoch": 1941} {"train_loss": -42.575645446777344, "global_step": 234928, "epoch": 1941} {"train_loss": -42.439613342285156, "global_step": 234929, "epoch": 1941} {"train_loss": -42.37727737426758, "global_step": 234930, "epoch": 1941} {"train_loss": -42.418861389160156, "global_step": 234931, "epoch": 1941} {"train_loss": -42.19059371948242, "global_step": 234932, "epoch": 1941} {"train_loss": -42.45170211791992, "global_step": 234933, "epoch": 1941} {"train_loss": -42.48090362548828, "global_step": 234934, "epoch": 1941} {"train_loss": -42.511714935302734, "global_step": 234935, "epoch": 1941} {"train_loss": -42.864315032958984, "global_step": 234936, "epoch": 1941} {"train_loss": -42.60451889038086, "global_step": 234937, "epoch": 1941} {"train_loss": -43.029781341552734, "global_step": 234938, "epoch": 1941} {"train_loss": -43.37372970581055, "global_step": 234939, "epoch": 1941} {"train_loss": -43.00288009643555, "global_step": 234940, "epoch": 1941} {"train_loss": -43.1770133972168, "global_step": 234941, "epoch": 1941} {"train_loss": -43.09797286987305, "global_step": 234942, "epoch": 1941} {"train_loss": -43.16874694824219, "global_step": 234943, "epoch": 1941} {"train_loss": -43.06339645385742, "global_step": 234944, "epoch": 1941} {"train_loss": -43.405757904052734, "global_step": 234945, "epoch": 1941} {"train_loss": -43.297664642333984, "global_step": 234946, "epoch": 1941} {"train_loss": -43.2693977355957, "global_step": 234947, "epoch": 1941} {"train_loss": -43.35947799682617, "global_step": 234948, "epoch": 1941} {"train_loss": -42.89574432373047, "global_step": 234949, "epoch": 1941} {"train_loss": -43.190921783447266, "global_step": 234950, "epoch": 1941} {"train_loss": -43.2187614440918, "global_step": 234951, "epoch": 1941} {"train_loss": -43.39645004272461, "global_step": 234952, "epoch": 1941} {"train_loss": -43.19393539428711, "global_step": 234953, "epoch": 1941} {"train_loss": -43.6773681640625, "global_step": 234954, "epoch": 1941} {"train_loss": -42.91936111450195, "global_step": 234955, "epoch": 1941} {"train_loss": -43.544246673583984, "global_step": 234956, "epoch": 1941} {"train_loss": -43.291015625, "global_step": 234957, "epoch": 1941} {"train_loss": -43.28684616088867, "global_step": 234958, "epoch": 1941} {"train_loss": -42.691768646240234, "global_step": 234959, "epoch": 1941} {"train_loss": -42.2684440612793, "global_step": 234960, "epoch": 1941} {"train_loss": -42.28989791870117, "global_step": 234961, "epoch": 1941} {"train_loss": -42.72147750854492, "global_step": 234962, "epoch": 1941} {"train_loss": -43.72362518310547, "global_step": 234963, "epoch": 1941} {"train_loss": -43.835723876953125, "global_step": 234964, "epoch": 1941} {"train_loss": -43.18649673461914, "global_step": 234965, "epoch": 1941} {"train_loss": -43.32784652709961, "global_step": 234966, "epoch": 1941} {"train_loss": -43.131404876708984, "global_step": 234967, "epoch": 1941} {"train_loss": -43.46280288696289, "global_step": 234968, "epoch": 1941} {"train_loss": -43.40336227416992, "global_step": 234969, "epoch": 1941} {"train_loss": -43.748260498046875, "global_step": 234970, "epoch": 1941} {"train_loss": -43.57048416137695, "global_step": 234971, "epoch": 1941} {"train_loss": -43.32198715209961, "global_step": 234972, "epoch": 1941} {"train_loss": -43.29119873046875, "global_step": 234973, "epoch": 1941} {"train_loss": -43.618961334228516, "global_step": 234974, "epoch": 1941} {"train_loss": -43.62758255004883, "global_step": 234975, "epoch": 1941} {"train_loss": -43.757179260253906, "global_step": 234976, "epoch": 1941} {"train_loss": -43.34611892700195, "global_step": 234977, "epoch": 1941} {"train_loss": -43.60931396484375, "global_step": 234978, "epoch": 1941} {"train_loss": -43.62700271606445, "global_step": 234979, "epoch": 1941} {"train_loss": -42.66933822631836, "global_step": 234980, "epoch": 1941} {"train_loss": -41.22309542884511, "global_step": 234981, "epoch": 1941, "val_loss": 2696218.25} {"train_loss": -42.5626335144043, "global_step": 234982, "epoch": 1942} {"train_loss": -42.43721008300781, "global_step": 234983, "epoch": 1942} {"train_loss": -42.65299606323242, "global_step": 234984, "epoch": 1942} {"train_loss": -43.52675247192383, "global_step": 234985, "epoch": 1942} {"train_loss": -40.7833366394043, "global_step": 234986, "epoch": 1942} {"train_loss": -40.23800277709961, "global_step": 234987, "epoch": 1942} {"train_loss": -40.47361755371094, "global_step": 234988, "epoch": 1942} {"train_loss": -39.08669662475586, "global_step": 234989, "epoch": 1942} {"train_loss": -39.41720199584961, "global_step": 234990, "epoch": 1942} {"train_loss": -41.80917739868164, "global_step": 234991, "epoch": 1942} {"train_loss": -42.15675735473633, "global_step": 234992, "epoch": 1942} {"train_loss": -41.25496292114258, "global_step": 234993, "epoch": 1942} {"train_loss": -40.48612594604492, "global_step": 234994, "epoch": 1942} {"train_loss": -41.77417755126953, "global_step": 234995, "epoch": 1942} {"train_loss": -41.02412796020508, "global_step": 234996, "epoch": 1942} {"train_loss": -42.58749008178711, "global_step": 234997, "epoch": 1942} {"train_loss": -41.13718795776367, "global_step": 234998, "epoch": 1942} {"train_loss": -39.58745193481445, "global_step": 234999, "epoch": 1942} {"train_loss": -41.858882904052734, "global_step": 235000, "epoch": 1942} {"train_loss": -40.86762619018555, "global_step": 235001, "epoch": 1942} {"train_loss": -41.6049919128418, "global_step": 235002, "epoch": 1942} {"train_loss": -41.37677001953125, "global_step": 235003, "epoch": 1942} {"train_loss": -41.16962432861328, "global_step": 235004, "epoch": 1942} {"train_loss": -42.51675033569336, "global_step": 235005, "epoch": 1942} {"train_loss": -40.28672790527344, "global_step": 235006, "epoch": 1942} {"train_loss": -41.08463668823242, "global_step": 235007, "epoch": 1942} {"train_loss": -40.809669494628906, "global_step": 235008, "epoch": 1942} {"train_loss": -41.90304183959961, "global_step": 235009, "epoch": 1942} {"train_loss": -40.09098434448242, "global_step": 235010, "epoch": 1942} {"train_loss": -41.00801086425781, "global_step": 235011, "epoch": 1942} {"train_loss": -40.87661361694336, "global_step": 235012, "epoch": 1942} {"train_loss": -42.46757888793945, "global_step": 235013, "epoch": 1942} {"train_loss": -40.51313781738281, "global_step": 235014, "epoch": 1942} {"train_loss": -40.78501510620117, "global_step": 235015, "epoch": 1942} {"train_loss": -40.55105209350586, "global_step": 235016, "epoch": 1942} {"train_loss": -40.487491607666016, "global_step": 235017, "epoch": 1942} {"train_loss": -39.990447998046875, "global_step": 235018, "epoch": 1942} {"train_loss": -40.91767883300781, "global_step": 235019, "epoch": 1942} {"train_loss": -40.42726516723633, "global_step": 235020, "epoch": 1942} {"train_loss": -41.94474411010742, "global_step": 235021, "epoch": 1942} {"train_loss": -41.2313117980957, "global_step": 235022, "epoch": 1942} {"train_loss": -41.464229583740234, "global_step": 235023, "epoch": 1942} {"train_loss": -40.97623062133789, "global_step": 235024, "epoch": 1942} {"train_loss": -41.87115478515625, "global_step": 235025, "epoch": 1942} {"train_loss": -41.7728385925293, "global_step": 235026, "epoch": 1942} {"train_loss": -42.03364944458008, "global_step": 235027, "epoch": 1942} {"train_loss": -41.82072830200195, "global_step": 235028, "epoch": 1942} {"train_loss": -41.916343688964844, "global_step": 235029, "epoch": 1942} {"train_loss": -41.9728889465332, "global_step": 235030, "epoch": 1942} {"train_loss": -42.28300857543945, "global_step": 235031, "epoch": 1942} {"train_loss": -41.52695846557617, "global_step": 235032, "epoch": 1942} {"train_loss": -41.61997604370117, "global_step": 235033, "epoch": 1942} {"train_loss": -42.37116622924805, "global_step": 235034, "epoch": 1942} {"train_loss": -43.02354431152344, "global_step": 235035, "epoch": 1942} {"train_loss": -42.873138427734375, "global_step": 235036, "epoch": 1942} {"train_loss": -42.39071273803711, "global_step": 235037, "epoch": 1942} {"train_loss": -42.760066986083984, "global_step": 235038, "epoch": 1942} {"train_loss": -42.76972579956055, "global_step": 235039, "epoch": 1942} {"train_loss": -42.07624435424805, "global_step": 235040, "epoch": 1942} {"train_loss": -42.983917236328125, "global_step": 235041, "epoch": 1942} {"train_loss": -42.6292839050293, "global_step": 235042, "epoch": 1942} {"train_loss": -43.0485725402832, "global_step": 235043, "epoch": 1942} {"train_loss": -42.684837341308594, "global_step": 235044, "epoch": 1942} {"train_loss": -43.58740997314453, "global_step": 235045, "epoch": 1942} {"train_loss": -42.96653366088867, "global_step": 235046, "epoch": 1942} {"train_loss": -42.5133056640625, "global_step": 235047, "epoch": 1942} {"train_loss": -43.52653884887695, "global_step": 235048, "epoch": 1942} {"train_loss": -42.79974365234375, "global_step": 235049, "epoch": 1942} {"train_loss": -42.714115142822266, "global_step": 235050, "epoch": 1942} {"train_loss": -42.735321044921875, "global_step": 235051, "epoch": 1942} {"train_loss": -42.63795471191406, "global_step": 235052, "epoch": 1942} {"train_loss": -43.763179779052734, "global_step": 235053, "epoch": 1942} {"train_loss": -42.709381103515625, "global_step": 235054, "epoch": 1942} {"train_loss": -43.04243850708008, "global_step": 235055, "epoch": 1942} {"train_loss": -43.01540756225586, "global_step": 235056, "epoch": 1942} {"train_loss": -43.021461486816406, "global_step": 235057, "epoch": 1942} {"train_loss": -43.463253021240234, "global_step": 235058, "epoch": 1942} {"train_loss": -42.94301986694336, "global_step": 235059, "epoch": 1942} {"train_loss": -43.752197265625, "global_step": 235060, "epoch": 1942} {"train_loss": -43.45484924316406, "global_step": 235061, "epoch": 1942} {"train_loss": -42.45305252075195, "global_step": 235062, "epoch": 1942} {"train_loss": -43.32143783569336, "global_step": 235063, "epoch": 1942} {"train_loss": -42.69499206542969, "global_step": 235064, "epoch": 1942} {"train_loss": -43.02413558959961, "global_step": 235065, "epoch": 1942} {"train_loss": -42.6495361328125, "global_step": 235066, "epoch": 1942} {"train_loss": -42.52564239501953, "global_step": 235067, "epoch": 1942} {"train_loss": -42.978668212890625, "global_step": 235068, "epoch": 1942} {"train_loss": -43.1827392578125, "global_step": 235069, "epoch": 1942} {"train_loss": -43.16264343261719, "global_step": 235070, "epoch": 1942} {"train_loss": -43.3353271484375, "global_step": 235071, "epoch": 1942} {"train_loss": -43.189613342285156, "global_step": 235072, "epoch": 1942} {"train_loss": -43.23335647583008, "global_step": 235073, "epoch": 1942} {"train_loss": -43.36693572998047, "global_step": 235074, "epoch": 1942} {"train_loss": -43.49776840209961, "global_step": 235075, "epoch": 1942} {"train_loss": -43.638580322265625, "global_step": 235076, "epoch": 1942} {"train_loss": -43.099998474121094, "global_step": 235077, "epoch": 1942} {"train_loss": -43.7130012512207, "global_step": 235078, "epoch": 1942} {"train_loss": -43.99507141113281, "global_step": 235079, "epoch": 1942} {"train_loss": -43.31026840209961, "global_step": 235080, "epoch": 1942} {"train_loss": -43.421016693115234, "global_step": 235081, "epoch": 1942} {"train_loss": -43.47406768798828, "global_step": 235082, "epoch": 1942} {"train_loss": -43.52506637573242, "global_step": 235083, "epoch": 1942} {"train_loss": -43.100791931152344, "global_step": 235084, "epoch": 1942} {"train_loss": -42.87398910522461, "global_step": 235085, "epoch": 1942} {"train_loss": -42.49394226074219, "global_step": 235086, "epoch": 1942} {"train_loss": -41.44614791870117, "global_step": 235087, "epoch": 1942} {"train_loss": -40.52892303466797, "global_step": 235088, "epoch": 1942} {"train_loss": -39.180824279785156, "global_step": 235089, "epoch": 1942} {"train_loss": -41.585540771484375, "global_step": 235090, "epoch": 1942} {"train_loss": -42.71519088745117, "global_step": 235091, "epoch": 1942} {"train_loss": -42.386714935302734, "global_step": 235092, "epoch": 1942} {"train_loss": -40.740474700927734, "global_step": 235093, "epoch": 1942} {"train_loss": -36.57881164550781, "global_step": 235094, "epoch": 1942} {"train_loss": -42.60722351074219, "global_step": 235095, "epoch": 1942} {"train_loss": -36.572505950927734, "global_step": 235096, "epoch": 1942} {"train_loss": -39.44449996948242, "global_step": 235097, "epoch": 1942} {"train_loss": -40.522884368896484, "global_step": 235098, "epoch": 1942} {"train_loss": -33.635101318359375, "global_step": 235099, "epoch": 1942} {"train_loss": -37.7315559387207, "global_step": 235100, "epoch": 1942} {"train_loss": -40.31169509887695, "global_step": 235101, "epoch": 1942} {"train_loss": -41.83853616005133, "global_step": 235102, "epoch": 1942, "val_loss": 2716018.0} {"train_loss": -39.40707778930664, "global_step": 235103, "epoch": 1943} {"train_loss": -39.92112350463867, "global_step": 235104, "epoch": 1943} {"train_loss": -37.855369567871094, "global_step": 235105, "epoch": 1943} {"train_loss": -38.84648513793945, "global_step": 235106, "epoch": 1943} {"train_loss": -40.600494384765625, "global_step": 235107, "epoch": 1943} {"train_loss": -40.86336898803711, "global_step": 235108, "epoch": 1943} {"train_loss": -39.97199630737305, "global_step": 235109, "epoch": 1943} {"train_loss": -40.40997314453125, "global_step": 235110, "epoch": 1943} {"train_loss": -41.24088668823242, "global_step": 235111, "epoch": 1943} {"train_loss": -39.6671142578125, "global_step": 235112, "epoch": 1943} {"train_loss": -38.38242721557617, "global_step": 235113, "epoch": 1943} {"train_loss": -40.237876892089844, "global_step": 235114, "epoch": 1943} {"train_loss": -41.80812072753906, "global_step": 235115, "epoch": 1943} {"train_loss": -40.1513786315918, "global_step": 235116, "epoch": 1943} {"train_loss": -41.686344146728516, "global_step": 235117, "epoch": 1943} {"train_loss": -40.85248947143555, "global_step": 235118, "epoch": 1943} {"train_loss": -40.10232162475586, "global_step": 235119, "epoch": 1943} {"train_loss": -41.5576286315918, "global_step": 235120, "epoch": 1943} {"train_loss": -41.24917221069336, "global_step": 235121, "epoch": 1943} {"train_loss": -40.3630485534668, "global_step": 235122, "epoch": 1943} {"train_loss": -40.95928955078125, "global_step": 235123, "epoch": 1943} {"train_loss": -40.78333282470703, "global_step": 235124, "epoch": 1943} {"train_loss": -41.12225341796875, "global_step": 235125, "epoch": 1943} {"train_loss": -41.572845458984375, "global_step": 235126, "epoch": 1943} {"train_loss": -41.222900390625, "global_step": 235127, "epoch": 1943} {"train_loss": -40.617225646972656, "global_step": 235128, "epoch": 1943} {"train_loss": -41.57220458984375, "global_step": 235129, "epoch": 1943} {"train_loss": -41.0677490234375, "global_step": 235130, "epoch": 1943} {"train_loss": -41.14271926879883, "global_step": 235131, "epoch": 1943} {"train_loss": -42.045772552490234, "global_step": 235132, "epoch": 1943} {"train_loss": -41.42177200317383, "global_step": 235133, "epoch": 1943} {"train_loss": -40.81037521362305, "global_step": 235134, "epoch": 1943} {"train_loss": -42.00541305541992, "global_step": 235135, "epoch": 1943} {"train_loss": -41.320980072021484, "global_step": 235136, "epoch": 1943} {"train_loss": -42.159759521484375, "global_step": 235137, "epoch": 1943} {"train_loss": -42.31130599975586, "global_step": 235138, "epoch": 1943} {"train_loss": -41.98578643798828, "global_step": 235139, "epoch": 1943} {"train_loss": -41.82990646362305, "global_step": 235140, "epoch": 1943} {"train_loss": -42.42706298828125, "global_step": 235141, "epoch": 1943} {"train_loss": -42.30852508544922, "global_step": 235142, "epoch": 1943} {"train_loss": -42.37752914428711, "global_step": 235143, "epoch": 1943} {"train_loss": -42.293392181396484, "global_step": 235144, "epoch": 1943} {"train_loss": -42.610107421875, "global_step": 235145, "epoch": 1943} {"train_loss": -42.693634033203125, "global_step": 235146, "epoch": 1943} {"train_loss": -43.03706359863281, "global_step": 235147, "epoch": 1943} {"train_loss": -42.77659225463867, "global_step": 235148, "epoch": 1943} {"train_loss": -42.65018081665039, "global_step": 235149, "epoch": 1943} {"train_loss": -42.5665397644043, "global_step": 235150, "epoch": 1943} {"train_loss": -43.0720100402832, "global_step": 235151, "epoch": 1943} {"train_loss": -43.31641387939453, "global_step": 235152, "epoch": 1943} {"train_loss": -42.851348876953125, "global_step": 235153, "epoch": 1943} {"train_loss": -43.550228118896484, "global_step": 235154, "epoch": 1943} {"train_loss": -42.636592864990234, "global_step": 235155, "epoch": 1943} {"train_loss": -43.170166015625, "global_step": 235156, "epoch": 1943} {"train_loss": -42.83168411254883, "global_step": 235157, "epoch": 1943} {"train_loss": -43.066524505615234, "global_step": 235158, "epoch": 1943} {"train_loss": -43.16215133666992, "global_step": 235159, "epoch": 1943} {"train_loss": -42.89683151245117, "global_step": 235160, "epoch": 1943} {"train_loss": -43.166873931884766, "global_step": 235161, "epoch": 1943} {"train_loss": -43.114070892333984, "global_step": 235162, "epoch": 1943} {"train_loss": -43.08451461791992, "global_step": 235163, "epoch": 1943} {"train_loss": -43.372982025146484, "global_step": 235164, "epoch": 1943} {"train_loss": -43.212032318115234, "global_step": 235165, "epoch": 1943} {"train_loss": -42.8791389465332, "global_step": 235166, "epoch": 1943} {"train_loss": -43.551185607910156, "global_step": 235167, "epoch": 1943} {"train_loss": -43.73493576049805, "global_step": 235168, "epoch": 1943} {"train_loss": -43.22311019897461, "global_step": 235169, "epoch": 1943} {"train_loss": -43.5416145324707, "global_step": 235170, "epoch": 1943} {"train_loss": -43.209754943847656, "global_step": 235171, "epoch": 1943} {"train_loss": -43.24258804321289, "global_step": 235172, "epoch": 1943} {"train_loss": -43.423133850097656, "global_step": 235173, "epoch": 1943} {"train_loss": -42.693214416503906, "global_step": 235174, "epoch": 1943} {"train_loss": -43.232887268066406, "global_step": 235175, "epoch": 1943} {"train_loss": -43.104225158691406, "global_step": 235176, "epoch": 1943} {"train_loss": -43.738739013671875, "global_step": 235177, "epoch": 1943} {"train_loss": -43.78306198120117, "global_step": 235178, "epoch": 1943} {"train_loss": -43.596229553222656, "global_step": 235179, "epoch": 1943} {"train_loss": -43.92047882080078, "global_step": 235180, "epoch": 1943} {"train_loss": -43.407920837402344, "global_step": 235181, "epoch": 1943} {"train_loss": -44.08515548706055, "global_step": 235182, "epoch": 1943} {"train_loss": -43.35518264770508, "global_step": 235183, "epoch": 1943} {"train_loss": -44.072235107421875, "global_step": 235184, "epoch": 1943} {"train_loss": -43.74556350708008, "global_step": 235185, "epoch": 1943} {"train_loss": -43.90690994262695, "global_step": 235186, "epoch": 1943} {"train_loss": -44.05585861206055, "global_step": 235187, "epoch": 1943} {"train_loss": -44.03493881225586, "global_step": 235188, "epoch": 1943} {"train_loss": -44.120811462402344, "global_step": 235189, "epoch": 1943} {"train_loss": -43.51700973510742, "global_step": 235190, "epoch": 1943} {"train_loss": -44.176021575927734, "global_step": 235191, "epoch": 1943} {"train_loss": -43.5239143371582, "global_step": 235192, "epoch": 1943} {"train_loss": -43.84267807006836, "global_step": 235193, "epoch": 1943} {"train_loss": -44.01498031616211, "global_step": 235194, "epoch": 1943} {"train_loss": -43.8103141784668, "global_step": 235195, "epoch": 1943} {"train_loss": -43.878658294677734, "global_step": 235196, "epoch": 1943} {"train_loss": -43.878170013427734, "global_step": 235197, "epoch": 1943} {"train_loss": -43.94353103637695, "global_step": 235198, "epoch": 1943} {"train_loss": -43.861534118652344, "global_step": 235199, "epoch": 1943} {"train_loss": -43.32026290893555, "global_step": 235200, "epoch": 1943} {"train_loss": -43.93788528442383, "global_step": 235201, "epoch": 1943} {"train_loss": -43.756683349609375, "global_step": 235202, "epoch": 1943} {"train_loss": -43.6454963684082, "global_step": 235203, "epoch": 1943} {"train_loss": -43.772254943847656, "global_step": 235204, "epoch": 1943} {"train_loss": -43.507469177246094, "global_step": 235205, "epoch": 1943} {"train_loss": -43.65520095825195, "global_step": 235206, "epoch": 1943} {"train_loss": -43.7180290222168, "global_step": 235207, "epoch": 1943} {"train_loss": -43.30058670043945, "global_step": 235208, "epoch": 1943} {"train_loss": -43.20515060424805, "global_step": 235209, "epoch": 1943} {"train_loss": -43.74648666381836, "global_step": 235210, "epoch": 1943} {"train_loss": -42.88190841674805, "global_step": 235211, "epoch": 1943} {"train_loss": -40.96906661987305, "global_step": 235212, "epoch": 1943} {"train_loss": -39.456668853759766, "global_step": 235213, "epoch": 1943} {"train_loss": -43.12106704711914, "global_step": 235214, "epoch": 1943} {"train_loss": -42.99197006225586, "global_step": 235215, "epoch": 1943} {"train_loss": -42.06827163696289, "global_step": 235216, "epoch": 1943} {"train_loss": -40.71128463745117, "global_step": 235217, "epoch": 1943} {"train_loss": -41.92393112182617, "global_step": 235218, "epoch": 1943} {"train_loss": -42.7125244140625, "global_step": 235219, "epoch": 1943} {"train_loss": -41.734832763671875, "global_step": 235220, "epoch": 1943} {"train_loss": -42.454524993896484, "global_step": 235221, "epoch": 1943} {"train_loss": -42.26259994506836, "global_step": 235222, "epoch": 1943} {"train_loss": -42.41131437317399, "global_step": 235223, "epoch": 1943, "val_loss": 2687240.75} {"train_loss": -41.04639434814453, "global_step": 235224, "epoch": 1944} {"train_loss": -40.289588928222656, "global_step": 235225, "epoch": 1944} {"train_loss": -42.762115478515625, "global_step": 235226, "epoch": 1944} {"train_loss": -41.27203369140625, "global_step": 235227, "epoch": 1944} {"train_loss": -39.173377990722656, "global_step": 235228, "epoch": 1944} {"train_loss": -39.72058868408203, "global_step": 235229, "epoch": 1944} {"train_loss": -41.5030632019043, "global_step": 235230, "epoch": 1944} {"train_loss": -40.399078369140625, "global_step": 235231, "epoch": 1944} {"train_loss": -41.57434844970703, "global_step": 235232, "epoch": 1944} {"train_loss": -41.909847259521484, "global_step": 235233, "epoch": 1944} {"train_loss": -41.668148040771484, "global_step": 235234, "epoch": 1944} {"train_loss": -41.552207946777344, "global_step": 235235, "epoch": 1944} {"train_loss": -42.09466552734375, "global_step": 235236, "epoch": 1944} {"train_loss": -41.44919967651367, "global_step": 235237, "epoch": 1944} {"train_loss": -41.66115951538086, "global_step": 235238, "epoch": 1944} {"train_loss": -41.7849235534668, "global_step": 235239, "epoch": 1944} {"train_loss": -41.830787658691406, "global_step": 235240, "epoch": 1944} {"train_loss": -40.940895080566406, "global_step": 235241, "epoch": 1944} {"train_loss": -39.94013214111328, "global_step": 235242, "epoch": 1944} {"train_loss": -40.89813995361328, "global_step": 235243, "epoch": 1944} {"train_loss": -43.0204963684082, "global_step": 235244, "epoch": 1944} {"train_loss": -41.708831787109375, "global_step": 235245, "epoch": 1944} {"train_loss": -41.018978118896484, "global_step": 235246, "epoch": 1944} {"train_loss": -41.56171417236328, "global_step": 235247, "epoch": 1944} {"train_loss": -41.725276947021484, "global_step": 235248, "epoch": 1944} {"train_loss": -42.93396759033203, "global_step": 235249, "epoch": 1944} {"train_loss": -42.77663803100586, "global_step": 235250, "epoch": 1944} {"train_loss": -42.14442825317383, "global_step": 235251, "epoch": 1944} {"train_loss": -42.67848587036133, "global_step": 235252, "epoch": 1944} {"train_loss": -42.392696380615234, "global_step": 235253, "epoch": 1944} {"train_loss": -42.09526062011719, "global_step": 235254, "epoch": 1944} {"train_loss": -42.28158950805664, "global_step": 235255, "epoch": 1944} {"train_loss": -42.98272705078125, "global_step": 235256, "epoch": 1944} {"train_loss": -42.410858154296875, "global_step": 235257, "epoch": 1944} {"train_loss": -42.443077087402344, "global_step": 235258, "epoch": 1944} {"train_loss": -42.77073287963867, "global_step": 235259, "epoch": 1944} {"train_loss": -43.05037307739258, "global_step": 235260, "epoch": 1944} {"train_loss": -42.463924407958984, "global_step": 235261, "epoch": 1944} {"train_loss": -43.183082580566406, "global_step": 235262, "epoch": 1944} {"train_loss": -43.25407409667969, "global_step": 235263, "epoch": 1944} {"train_loss": -42.43988037109375, "global_step": 235264, "epoch": 1944} {"train_loss": -43.20562744140625, "global_step": 235265, "epoch": 1944} {"train_loss": -43.2120475769043, "global_step": 235266, "epoch": 1944} {"train_loss": -43.37382888793945, "global_step": 235267, "epoch": 1944} {"train_loss": -42.0625114440918, "global_step": 235268, "epoch": 1944} {"train_loss": -42.19609069824219, "global_step": 235269, "epoch": 1944} {"train_loss": -42.62717056274414, "global_step": 235270, "epoch": 1944} {"train_loss": -41.30537033081055, "global_step": 235271, "epoch": 1944} {"train_loss": -41.11971664428711, "global_step": 235272, "epoch": 1944} {"train_loss": -42.52901840209961, "global_step": 235273, "epoch": 1944} {"train_loss": -41.85444259643555, "global_step": 235274, "epoch": 1944} {"train_loss": -41.7514762878418, "global_step": 235275, "epoch": 1944} {"train_loss": -42.932350158691406, "global_step": 235276, "epoch": 1944} {"train_loss": -42.70135498046875, "global_step": 235277, "epoch": 1944} {"train_loss": -42.78506088256836, "global_step": 235278, "epoch": 1944} {"train_loss": -42.13835906982422, "global_step": 235279, "epoch": 1944} {"train_loss": -42.477752685546875, "global_step": 235280, "epoch": 1944} {"train_loss": -43.38578414916992, "global_step": 235281, "epoch": 1944} {"train_loss": -42.4244270324707, "global_step": 235282, "epoch": 1944} {"train_loss": -41.96258544921875, "global_step": 235283, "epoch": 1944} {"train_loss": -42.450199127197266, "global_step": 235284, "epoch": 1944} {"train_loss": -42.78936004638672, "global_step": 235285, "epoch": 1944} {"train_loss": -43.24037551879883, "global_step": 235286, "epoch": 1944} {"train_loss": -43.42854690551758, "global_step": 235287, "epoch": 1944} {"train_loss": -42.948421478271484, "global_step": 235288, "epoch": 1944} {"train_loss": -42.58012771606445, "global_step": 235289, "epoch": 1944} {"train_loss": -42.52062225341797, "global_step": 235290, "epoch": 1944} {"train_loss": -42.85650634765625, "global_step": 235291, "epoch": 1944} {"train_loss": -43.754390716552734, "global_step": 235292, "epoch": 1944} {"train_loss": -42.61709213256836, "global_step": 235293, "epoch": 1944} {"train_loss": -42.56296920776367, "global_step": 235294, "epoch": 1944} {"train_loss": -42.15859603881836, "global_step": 235295, "epoch": 1944} {"train_loss": -42.90796661376953, "global_step": 235296, "epoch": 1944} {"train_loss": -43.338443756103516, "global_step": 235297, "epoch": 1944} {"train_loss": -43.135169982910156, "global_step": 235298, "epoch": 1944} {"train_loss": -43.058258056640625, "global_step": 235299, "epoch": 1944} {"train_loss": -42.39128494262695, "global_step": 235300, "epoch": 1944} {"train_loss": -42.94265365600586, "global_step": 235301, "epoch": 1944} {"train_loss": -43.5518798828125, "global_step": 235302, "epoch": 1944} {"train_loss": -42.95057678222656, "global_step": 235303, "epoch": 1944} {"train_loss": -41.670509338378906, "global_step": 235304, "epoch": 1944} {"train_loss": -42.21971130371094, "global_step": 235305, "epoch": 1944} {"train_loss": -43.03356170654297, "global_step": 235306, "epoch": 1944} {"train_loss": -43.48664093017578, "global_step": 235307, "epoch": 1944} {"train_loss": -42.8049430847168, "global_step": 235308, "epoch": 1944} {"train_loss": -41.7717170715332, "global_step": 235309, "epoch": 1944} {"train_loss": -41.96450424194336, "global_step": 235310, "epoch": 1944} {"train_loss": -43.251399993896484, "global_step": 235311, "epoch": 1944} {"train_loss": -43.095367431640625, "global_step": 235312, "epoch": 1944} {"train_loss": -42.449913024902344, "global_step": 235313, "epoch": 1944} {"train_loss": -42.212989807128906, "global_step": 235314, "epoch": 1944} {"train_loss": -42.9195671081543, "global_step": 235315, "epoch": 1944} {"train_loss": -42.612709045410156, "global_step": 235316, "epoch": 1944} {"train_loss": -42.91789627075195, "global_step": 235317, "epoch": 1944} {"train_loss": -42.821990966796875, "global_step": 235318, "epoch": 1944} {"train_loss": -43.346317291259766, "global_step": 235319, "epoch": 1944} {"train_loss": -43.40367126464844, "global_step": 235320, "epoch": 1944} {"train_loss": -42.14223861694336, "global_step": 235321, "epoch": 1944} {"train_loss": -40.72483825683594, "global_step": 235322, "epoch": 1944} {"train_loss": -43.51704788208008, "global_step": 235323, "epoch": 1944} {"train_loss": -41.59053421020508, "global_step": 235324, "epoch": 1944} {"train_loss": -39.66046142578125, "global_step": 235325, "epoch": 1944} {"train_loss": -40.882850646972656, "global_step": 235326, "epoch": 1944} {"train_loss": -43.63210678100586, "global_step": 235327, "epoch": 1944} {"train_loss": -42.623165130615234, "global_step": 235328, "epoch": 1944} {"train_loss": -41.24617385864258, "global_step": 235329, "epoch": 1944} {"train_loss": -40.176753997802734, "global_step": 235330, "epoch": 1944} {"train_loss": -42.92897415161133, "global_step": 235331, "epoch": 1944} {"train_loss": -42.4952278137207, "global_step": 235332, "epoch": 1944} {"train_loss": -42.93335723876953, "global_step": 235333, "epoch": 1944} {"train_loss": -41.45407485961914, "global_step": 235334, "epoch": 1944} {"train_loss": -41.60299301147461, "global_step": 235335, "epoch": 1944} {"train_loss": -42.6908073425293, "global_step": 235336, "epoch": 1944} {"train_loss": -43.2336540222168, "global_step": 235337, "epoch": 1944} {"train_loss": -41.87459182739258, "global_step": 235338, "epoch": 1944} {"train_loss": -41.76301193237305, "global_step": 235339, "epoch": 1944} {"train_loss": -43.305416107177734, "global_step": 235340, "epoch": 1944} {"train_loss": -42.26753234863281, "global_step": 235341, "epoch": 1944} {"train_loss": -43.42217254638672, "global_step": 235342, "epoch": 1944} {"train_loss": -42.94728469848633, "global_step": 235343, "epoch": 1944} {"train_loss": -42.284945117540595, "global_step": 235344, "epoch": 1944, "val_loss": 2662265.0} {"train_loss": -43.429256439208984, "global_step": 235345, "epoch": 1945} {"train_loss": -43.21470642089844, "global_step": 235346, "epoch": 1945} {"train_loss": -43.3551139831543, "global_step": 235347, "epoch": 1945} {"train_loss": -43.26127243041992, "global_step": 235348, "epoch": 1945} {"train_loss": -42.95071792602539, "global_step": 235349, "epoch": 1945} {"train_loss": -43.10834884643555, "global_step": 235350, "epoch": 1945} {"train_loss": -41.8126106262207, "global_step": 235351, "epoch": 1945} {"train_loss": -41.525691986083984, "global_step": 235352, "epoch": 1945} {"train_loss": -42.07737731933594, "global_step": 235353, "epoch": 1945} {"train_loss": -42.70039367675781, "global_step": 235354, "epoch": 1945} {"train_loss": -43.18826675415039, "global_step": 235355, "epoch": 1945} {"train_loss": -43.17983627319336, "global_step": 235356, "epoch": 1945} {"train_loss": -43.5059814453125, "global_step": 235357, "epoch": 1945} {"train_loss": -42.93305587768555, "global_step": 235358, "epoch": 1945} {"train_loss": -43.29937744140625, "global_step": 235359, "epoch": 1945} {"train_loss": -43.55867004394531, "global_step": 235360, "epoch": 1945} {"train_loss": -43.27570724487305, "global_step": 235361, "epoch": 1945} {"train_loss": -42.862972259521484, "global_step": 235362, "epoch": 1945} {"train_loss": -43.24690628051758, "global_step": 235363, "epoch": 1945} {"train_loss": -43.407833099365234, "global_step": 235364, "epoch": 1945} {"train_loss": -42.741539001464844, "global_step": 235365, "epoch": 1945} {"train_loss": -42.99982833862305, "global_step": 235366, "epoch": 1945} {"train_loss": -43.28219985961914, "global_step": 235367, "epoch": 1945} {"train_loss": -42.412681579589844, "global_step": 235368, "epoch": 1945} {"train_loss": -41.79811096191406, "global_step": 235369, "epoch": 1945} {"train_loss": -41.56698226928711, "global_step": 235370, "epoch": 1945} {"train_loss": -43.474342346191406, "global_step": 235371, "epoch": 1945} {"train_loss": -42.09815216064453, "global_step": 235372, "epoch": 1945} {"train_loss": -41.736080169677734, "global_step": 235373, "epoch": 1945} {"train_loss": -43.5361328125, "global_step": 235374, "epoch": 1945} {"train_loss": -42.45844650268555, "global_step": 235375, "epoch": 1945} {"train_loss": -42.058589935302734, "global_step": 235376, "epoch": 1945} {"train_loss": -42.800411224365234, "global_step": 235377, "epoch": 1945} {"train_loss": -42.359466552734375, "global_step": 235378, "epoch": 1945} {"train_loss": -42.45054244995117, "global_step": 235379, "epoch": 1945} {"train_loss": -42.155914306640625, "global_step": 235380, "epoch": 1945} {"train_loss": -42.498199462890625, "global_step": 235381, "epoch": 1945} {"train_loss": -42.50644302368164, "global_step": 235382, "epoch": 1945} {"train_loss": -42.93164825439453, "global_step": 235383, "epoch": 1945} {"train_loss": -42.216060638427734, "global_step": 235384, "epoch": 1945} {"train_loss": -42.651710510253906, "global_step": 235385, "epoch": 1945} {"train_loss": -42.62385940551758, "global_step": 235386, "epoch": 1945} {"train_loss": -42.816650390625, "global_step": 235387, "epoch": 1945} {"train_loss": -42.2043571472168, "global_step": 235388, "epoch": 1945} {"train_loss": -42.7525520324707, "global_step": 235389, "epoch": 1945} {"train_loss": -42.724422454833984, "global_step": 235390, "epoch": 1945} {"train_loss": -43.18049240112305, "global_step": 235391, "epoch": 1945} {"train_loss": -42.74464416503906, "global_step": 235392, "epoch": 1945} {"train_loss": -42.66183090209961, "global_step": 235393, "epoch": 1945} {"train_loss": -42.99131393432617, "global_step": 235394, "epoch": 1945} {"train_loss": -42.283599853515625, "global_step": 235395, "epoch": 1945} {"train_loss": -43.52310562133789, "global_step": 235396, "epoch": 1945} {"train_loss": -43.031978607177734, "global_step": 235397, "epoch": 1945} {"train_loss": -43.39826583862305, "global_step": 235398, "epoch": 1945} {"train_loss": -43.01142120361328, "global_step": 235399, "epoch": 1945} {"train_loss": -41.48942947387695, "global_step": 235400, "epoch": 1945} {"train_loss": -42.71870803833008, "global_step": 235401, "epoch": 1945} {"train_loss": -42.83695602416992, "global_step": 235402, "epoch": 1945} {"train_loss": -42.176673889160156, "global_step": 235403, "epoch": 1945} {"train_loss": -40.51850509643555, "global_step": 235404, "epoch": 1945} {"train_loss": -41.69834518432617, "global_step": 235405, "epoch": 1945} {"train_loss": -43.08382797241211, "global_step": 235406, "epoch": 1945} {"train_loss": -42.660614013671875, "global_step": 235407, "epoch": 1945} {"train_loss": -41.1618766784668, "global_step": 235408, "epoch": 1945} {"train_loss": -42.54392623901367, "global_step": 235409, "epoch": 1945} {"train_loss": -43.902488708496094, "global_step": 235410, "epoch": 1945} {"train_loss": -42.0887565612793, "global_step": 235411, "epoch": 1945} {"train_loss": -42.32002258300781, "global_step": 235412, "epoch": 1945} {"train_loss": -42.799747467041016, "global_step": 235413, "epoch": 1945} {"train_loss": -43.409217834472656, "global_step": 235414, "epoch": 1945} {"train_loss": -43.442626953125, "global_step": 235415, "epoch": 1945} {"train_loss": -43.63385772705078, "global_step": 235416, "epoch": 1945} {"train_loss": -43.2856559753418, "global_step": 235417, "epoch": 1945} {"train_loss": -43.79673767089844, "global_step": 235418, "epoch": 1945} {"train_loss": -43.54005432128906, "global_step": 235419, "epoch": 1945} {"train_loss": -43.36192321777344, "global_step": 235420, "epoch": 1945} {"train_loss": -43.762939453125, "global_step": 235421, "epoch": 1945} {"train_loss": -43.75994110107422, "global_step": 235422, "epoch": 1945} {"train_loss": -43.197235107421875, "global_step": 235423, "epoch": 1945} {"train_loss": -43.17141342163086, "global_step": 235424, "epoch": 1945} {"train_loss": -42.7361946105957, "global_step": 235425, "epoch": 1945} {"train_loss": -43.1073112487793, "global_step": 235426, "epoch": 1945} {"train_loss": -44.04511260986328, "global_step": 235427, "epoch": 1945} {"train_loss": -42.23788070678711, "global_step": 235428, "epoch": 1945} {"train_loss": -40.40242385864258, "global_step": 235429, "epoch": 1945} {"train_loss": -40.72675704956055, "global_step": 235430, "epoch": 1945} {"train_loss": -42.38767623901367, "global_step": 235431, "epoch": 1945} {"train_loss": -42.05168533325195, "global_step": 235432, "epoch": 1945} {"train_loss": -39.7417106628418, "global_step": 235433, "epoch": 1945} {"train_loss": -42.95449447631836, "global_step": 235434, "epoch": 1945} {"train_loss": -41.3701286315918, "global_step": 235435, "epoch": 1945} {"train_loss": -39.43085861206055, "global_step": 235436, "epoch": 1945} {"train_loss": -42.72825241088867, "global_step": 235437, "epoch": 1945} {"train_loss": -40.59785842895508, "global_step": 235438, "epoch": 1945} {"train_loss": -40.49799346923828, "global_step": 235439, "epoch": 1945} {"train_loss": -42.715938568115234, "global_step": 235440, "epoch": 1945} {"train_loss": -41.09782028198242, "global_step": 235441, "epoch": 1945} {"train_loss": -41.1292724609375, "global_step": 235442, "epoch": 1945} {"train_loss": -42.4937629699707, "global_step": 235443, "epoch": 1945} {"train_loss": -41.56609344482422, "global_step": 235444, "epoch": 1945} {"train_loss": -41.74454879760742, "global_step": 235445, "epoch": 1945} {"train_loss": -42.74343490600586, "global_step": 235446, "epoch": 1945} {"train_loss": -41.65529251098633, "global_step": 235447, "epoch": 1945} {"train_loss": -43.49605941772461, "global_step": 235448, "epoch": 1945} {"train_loss": -42.18398666381836, "global_step": 235449, "epoch": 1945} {"train_loss": -40.87886047363281, "global_step": 235450, "epoch": 1945} {"train_loss": -41.45450973510742, "global_step": 235451, "epoch": 1945} {"train_loss": -42.40875244140625, "global_step": 235452, "epoch": 1945} {"train_loss": -41.616371154785156, "global_step": 235453, "epoch": 1945} {"train_loss": -41.080543518066406, "global_step": 235454, "epoch": 1945} {"train_loss": -42.580074310302734, "global_step": 235455, "epoch": 1945} {"train_loss": -42.55747604370117, "global_step": 235456, "epoch": 1945} {"train_loss": -42.54191970825195, "global_step": 235457, "epoch": 1945} {"train_loss": -42.228790283203125, "global_step": 235458, "epoch": 1945} {"train_loss": -42.56560516357422, "global_step": 235459, "epoch": 1945} {"train_loss": -42.01435089111328, "global_step": 235460, "epoch": 1945} {"train_loss": -42.40407180786133, "global_step": 235461, "epoch": 1945} {"train_loss": -42.758056640625, "global_step": 235462, "epoch": 1945} {"train_loss": -42.27960205078125, "global_step": 235463, "epoch": 1945} {"train_loss": -42.015472412109375, "global_step": 235464, "epoch": 1945} {"train_loss": -42.50260509144176, "global_step": 235465, "epoch": 1945, "val_loss": 2623490.25} {"train_loss": -42.41328811645508, "global_step": 235466, "epoch": 1946} {"train_loss": -40.96156692504883, "global_step": 235467, "epoch": 1946} {"train_loss": -41.48353958129883, "global_step": 235468, "epoch": 1946} {"train_loss": -40.028934478759766, "global_step": 235469, "epoch": 1946} {"train_loss": -41.2110710144043, "global_step": 235470, "epoch": 1946} {"train_loss": -41.94948959350586, "global_step": 235471, "epoch": 1946} {"train_loss": -38.406829833984375, "global_step": 235472, "epoch": 1946} {"train_loss": -32.431514739990234, "global_step": 235473, "epoch": 1946} {"train_loss": -40.985565185546875, "global_step": 235474, "epoch": 1946} {"train_loss": -34.499935150146484, "global_step": 235475, "epoch": 1946} {"train_loss": -39.55814743041992, "global_step": 235476, "epoch": 1946} {"train_loss": -37.36582565307617, "global_step": 235477, "epoch": 1946} {"train_loss": -38.81600570678711, "global_step": 235478, "epoch": 1946} {"train_loss": -39.44950866699219, "global_step": 235479, "epoch": 1946} {"train_loss": -33.816741943359375, "global_step": 235480, "epoch": 1946} {"train_loss": -34.0842170715332, "global_step": 235481, "epoch": 1946} {"train_loss": -38.903709411621094, "global_step": 235482, "epoch": 1946} {"train_loss": -37.91450119018555, "global_step": 235483, "epoch": 1946} {"train_loss": -37.10296630859375, "global_step": 235484, "epoch": 1946} {"train_loss": -37.198150634765625, "global_step": 235485, "epoch": 1946} {"train_loss": -35.23064041137695, "global_step": 235486, "epoch": 1946} {"train_loss": -36.2209587097168, "global_step": 235487, "epoch": 1946} {"train_loss": -34.830204010009766, "global_step": 235488, "epoch": 1946} {"train_loss": -37.0914421081543, "global_step": 235489, "epoch": 1946} {"train_loss": -33.2588996887207, "global_step": 235490, "epoch": 1946} {"train_loss": -38.79822540283203, "global_step": 235491, "epoch": 1946} {"train_loss": -39.0957145690918, "global_step": 235492, "epoch": 1946} {"train_loss": -37.01081466674805, "global_step": 235493, "epoch": 1946} {"train_loss": -32.55545425415039, "global_step": 235494, "epoch": 1946} {"train_loss": -36.26577377319336, "global_step": 235495, "epoch": 1946} {"train_loss": -38.31691360473633, "global_step": 235496, "epoch": 1946} {"train_loss": -40.19460678100586, "global_step": 235497, "epoch": 1946} {"train_loss": -39.16422653198242, "global_step": 235498, "epoch": 1946} {"train_loss": -39.85425567626953, "global_step": 235499, "epoch": 1946} {"train_loss": -37.872459411621094, "global_step": 235500, "epoch": 1946} {"train_loss": -38.37290573120117, "global_step": 235501, "epoch": 1946} {"train_loss": -39.62205505371094, "global_step": 235502, "epoch": 1946} {"train_loss": -39.15729904174805, "global_step": 235503, "epoch": 1946} {"train_loss": -39.7955322265625, "global_step": 235504, "epoch": 1946} {"train_loss": -40.70094680786133, "global_step": 235505, "epoch": 1946} {"train_loss": -40.90447998046875, "global_step": 235506, "epoch": 1946} {"train_loss": -40.49782943725586, "global_step": 235507, "epoch": 1946} {"train_loss": -37.84239196777344, "global_step": 235508, "epoch": 1946} {"train_loss": -40.05567169189453, "global_step": 235509, "epoch": 1946} {"train_loss": -39.13276672363281, "global_step": 235510, "epoch": 1946} {"train_loss": -40.79927444458008, "global_step": 235511, "epoch": 1946} {"train_loss": -40.3464469909668, "global_step": 235512, "epoch": 1946} {"train_loss": -39.35355758666992, "global_step": 235513, "epoch": 1946} {"train_loss": -41.0752067565918, "global_step": 235514, "epoch": 1946} {"train_loss": -41.607215881347656, "global_step": 235515, "epoch": 1946} {"train_loss": -41.67961502075195, "global_step": 235516, "epoch": 1946} {"train_loss": -41.116756439208984, "global_step": 235517, "epoch": 1946} {"train_loss": -41.294986724853516, "global_step": 235518, "epoch": 1946} {"train_loss": -40.951454162597656, "global_step": 235519, "epoch": 1946} {"train_loss": -41.09400177001953, "global_step": 235520, "epoch": 1946} {"train_loss": -41.77252960205078, "global_step": 235521, "epoch": 1946} {"train_loss": -40.79840087890625, "global_step": 235522, "epoch": 1946} {"train_loss": -41.56817626953125, "global_step": 235523, "epoch": 1946} {"train_loss": -41.66303253173828, "global_step": 235524, "epoch": 1946} {"train_loss": -41.90164566040039, "global_step": 235525, "epoch": 1946} {"train_loss": -41.29104232788086, "global_step": 235526, "epoch": 1946} {"train_loss": -41.987464904785156, "global_step": 235527, "epoch": 1946} {"train_loss": -41.6562385559082, "global_step": 235528, "epoch": 1946} {"train_loss": -41.41263961791992, "global_step": 235529, "epoch": 1946} {"train_loss": -41.46996307373047, "global_step": 235530, "epoch": 1946} {"train_loss": -41.82114791870117, "global_step": 235531, "epoch": 1946} {"train_loss": -42.06874465942383, "global_step": 235532, "epoch": 1946} {"train_loss": -42.2149543762207, "global_step": 235533, "epoch": 1946} {"train_loss": -41.89475631713867, "global_step": 235534, "epoch": 1946} {"train_loss": -41.81473922729492, "global_step": 235535, "epoch": 1946} {"train_loss": -40.84664535522461, "global_step": 235536, "epoch": 1946} {"train_loss": -42.124183654785156, "global_step": 235537, "epoch": 1946} {"train_loss": -41.61128616333008, "global_step": 235538, "epoch": 1946} {"train_loss": -41.9340934753418, "global_step": 235539, "epoch": 1946} {"train_loss": -41.714935302734375, "global_step": 235540, "epoch": 1946} {"train_loss": -42.643768310546875, "global_step": 235541, "epoch": 1946} {"train_loss": -42.638362884521484, "global_step": 235542, "epoch": 1946} {"train_loss": -42.21537399291992, "global_step": 235543, "epoch": 1946} {"train_loss": -41.93996810913086, "global_step": 235544, "epoch": 1946} {"train_loss": -42.66677474975586, "global_step": 235545, "epoch": 1946} {"train_loss": -42.37732696533203, "global_step": 235546, "epoch": 1946} {"train_loss": -42.235145568847656, "global_step": 235547, "epoch": 1946} {"train_loss": -42.718902587890625, "global_step": 235548, "epoch": 1946} {"train_loss": -42.577335357666016, "global_step": 235549, "epoch": 1946} {"train_loss": -43.430023193359375, "global_step": 235550, "epoch": 1946} {"train_loss": -42.93986129760742, "global_step": 235551, "epoch": 1946} {"train_loss": -42.49669647216797, "global_step": 235552, "epoch": 1946} {"train_loss": -42.11557388305664, "global_step": 235553, "epoch": 1946} {"train_loss": -42.923274993896484, "global_step": 235554, "epoch": 1946} {"train_loss": -42.47930145263672, "global_step": 235555, "epoch": 1946} {"train_loss": -43.433204650878906, "global_step": 235556, "epoch": 1946} {"train_loss": -42.54522705078125, "global_step": 235557, "epoch": 1946} {"train_loss": -43.170108795166016, "global_step": 235558, "epoch": 1946} {"train_loss": -43.213844299316406, "global_step": 235559, "epoch": 1946} {"train_loss": -42.75901412963867, "global_step": 235560, "epoch": 1946} {"train_loss": -42.92234420776367, "global_step": 235561, "epoch": 1946} {"train_loss": -42.498573303222656, "global_step": 235562, "epoch": 1946} {"train_loss": -42.33348083496094, "global_step": 235563, "epoch": 1946} {"train_loss": -42.88922119140625, "global_step": 235564, "epoch": 1946} {"train_loss": -42.41883850097656, "global_step": 235565, "epoch": 1946} {"train_loss": -43.56257247924805, "global_step": 235566, "epoch": 1946} {"train_loss": -43.17043685913086, "global_step": 235567, "epoch": 1946} {"train_loss": -43.10201644897461, "global_step": 235568, "epoch": 1946} {"train_loss": -43.65279769897461, "global_step": 235569, "epoch": 1946} {"train_loss": -42.92246627807617, "global_step": 235570, "epoch": 1946} {"train_loss": -42.91823959350586, "global_step": 235571, "epoch": 1946} {"train_loss": -42.82163619995117, "global_step": 235572, "epoch": 1946} {"train_loss": -42.46989822387695, "global_step": 235573, "epoch": 1946} {"train_loss": -42.71198272705078, "global_step": 235574, "epoch": 1946} {"train_loss": -43.31637191772461, "global_step": 235575, "epoch": 1946} {"train_loss": -42.989723205566406, "global_step": 235576, "epoch": 1946} {"train_loss": -42.990848541259766, "global_step": 235577, "epoch": 1946} {"train_loss": -43.07147979736328, "global_step": 235578, "epoch": 1946} {"train_loss": -42.54891586303711, "global_step": 235579, "epoch": 1946} {"train_loss": -42.541378021240234, "global_step": 235580, "epoch": 1946} {"train_loss": -41.58269119262695, "global_step": 235581, "epoch": 1946} {"train_loss": -41.891143798828125, "global_step": 235582, "epoch": 1946} {"train_loss": -41.3916015625, "global_step": 235583, "epoch": 1946} {"train_loss": -40.59054183959961, "global_step": 235584, "epoch": 1946} {"train_loss": -38.89069366455078, "global_step": 235585, "epoch": 1946} {"train_loss": -40.664236210594495, "global_step": 235586, "epoch": 1946, "val_loss": 2605585.25} {"train_loss": -41.20750045776367, "global_step": 235587, "epoch": 1947} {"train_loss": -36.049041748046875, "global_step": 235588, "epoch": 1947} {"train_loss": -42.12502670288086, "global_step": 235589, "epoch": 1947} {"train_loss": -33.980831146240234, "global_step": 235590, "epoch": 1947} {"train_loss": -34.38985824584961, "global_step": 235591, "epoch": 1947} {"train_loss": -37.26382064819336, "global_step": 235592, "epoch": 1947} {"train_loss": -37.9102668762207, "global_step": 235593, "epoch": 1947} {"train_loss": -35.123470306396484, "global_step": 235594, "epoch": 1947} {"train_loss": -38.459136962890625, "global_step": 235595, "epoch": 1947} {"train_loss": -37.50038528442383, "global_step": 235596, "epoch": 1947} {"train_loss": -38.31623077392578, "global_step": 235597, "epoch": 1947} {"train_loss": -40.046424865722656, "global_step": 235598, "epoch": 1947} {"train_loss": -38.491764068603516, "global_step": 235599, "epoch": 1947} {"train_loss": -40.47541427612305, "global_step": 235600, "epoch": 1947} {"train_loss": -38.0698356628418, "global_step": 235601, "epoch": 1947} {"train_loss": -39.40473556518555, "global_step": 235602, "epoch": 1947} {"train_loss": -39.3968505859375, "global_step": 235603, "epoch": 1947} {"train_loss": -39.73651885986328, "global_step": 235604, "epoch": 1947} {"train_loss": -37.95014190673828, "global_step": 235605, "epoch": 1947} {"train_loss": -40.7663459777832, "global_step": 235606, "epoch": 1947} {"train_loss": -40.0599479675293, "global_step": 235607, "epoch": 1947} {"train_loss": -41.11735153198242, "global_step": 235608, "epoch": 1947} {"train_loss": -40.0471305847168, "global_step": 235609, "epoch": 1947} {"train_loss": -40.15808868408203, "global_step": 235610, "epoch": 1947} {"train_loss": -41.51032257080078, "global_step": 235611, "epoch": 1947} {"train_loss": -40.511199951171875, "global_step": 235612, "epoch": 1947} {"train_loss": -41.71085739135742, "global_step": 235613, "epoch": 1947} {"train_loss": -40.75016784667969, "global_step": 235614, "epoch": 1947} {"train_loss": -41.87679672241211, "global_step": 235615, "epoch": 1947} {"train_loss": -40.9099006652832, "global_step": 235616, "epoch": 1947} {"train_loss": -42.37869644165039, "global_step": 235617, "epoch": 1947} {"train_loss": -41.53516387939453, "global_step": 235618, "epoch": 1947} {"train_loss": -41.4832763671875, "global_step": 235619, "epoch": 1947} {"train_loss": -41.79301071166992, "global_step": 235620, "epoch": 1947} {"train_loss": -42.1419792175293, "global_step": 235621, "epoch": 1947} {"train_loss": -42.14097595214844, "global_step": 235622, "epoch": 1947} {"train_loss": -42.17366409301758, "global_step": 235623, "epoch": 1947} {"train_loss": -41.69503402709961, "global_step": 235624, "epoch": 1947} {"train_loss": -42.22840118408203, "global_step": 235625, "epoch": 1947} {"train_loss": -42.2191047668457, "global_step": 235626, "epoch": 1947} {"train_loss": -42.47984313964844, "global_step": 235627, "epoch": 1947} {"train_loss": -42.12662887573242, "global_step": 235628, "epoch": 1947} {"train_loss": -42.35586166381836, "global_step": 235629, "epoch": 1947} {"train_loss": -42.81667709350586, "global_step": 235630, "epoch": 1947} {"train_loss": -42.21156692504883, "global_step": 235631, "epoch": 1947} {"train_loss": -42.910919189453125, "global_step": 235632, "epoch": 1947} {"train_loss": -42.39752960205078, "global_step": 235633, "epoch": 1947} {"train_loss": -42.62288284301758, "global_step": 235634, "epoch": 1947} {"train_loss": -42.19767761230469, "global_step": 235635, "epoch": 1947} {"train_loss": -42.433868408203125, "global_step": 235636, "epoch": 1947} {"train_loss": -42.895015716552734, "global_step": 235637, "epoch": 1947} {"train_loss": -42.649383544921875, "global_step": 235638, "epoch": 1947} {"train_loss": -42.427303314208984, "global_step": 235639, "epoch": 1947} {"train_loss": -42.83820724487305, "global_step": 235640, "epoch": 1947} {"train_loss": -43.13808822631836, "global_step": 235641, "epoch": 1947} {"train_loss": -42.78693771362305, "global_step": 235642, "epoch": 1947} {"train_loss": -42.315589904785156, "global_step": 235643, "epoch": 1947} {"train_loss": -42.7576789855957, "global_step": 235644, "epoch": 1947} {"train_loss": -42.98124694824219, "global_step": 235645, "epoch": 1947} {"train_loss": -42.5226936340332, "global_step": 235646, "epoch": 1947} {"train_loss": -42.98163986206055, "global_step": 235647, "epoch": 1947} {"train_loss": -42.843990325927734, "global_step": 235648, "epoch": 1947} {"train_loss": -43.51449203491211, "global_step": 235649, "epoch": 1947} {"train_loss": -42.80048370361328, "global_step": 235650, "epoch": 1947} {"train_loss": -43.1962890625, "global_step": 235651, "epoch": 1947} {"train_loss": -42.748931884765625, "global_step": 235652, "epoch": 1947} {"train_loss": -42.846248626708984, "global_step": 235653, "epoch": 1947} {"train_loss": -42.05447006225586, "global_step": 235654, "epoch": 1947} {"train_loss": -43.24835205078125, "global_step": 235655, "epoch": 1947} {"train_loss": -42.24824905395508, "global_step": 235656, "epoch": 1947} {"train_loss": -43.08838653564453, "global_step": 235657, "epoch": 1947} {"train_loss": -42.96088409423828, "global_step": 235658, "epoch": 1947} {"train_loss": -42.44941329956055, "global_step": 235659, "epoch": 1947} {"train_loss": -41.3420524597168, "global_step": 235660, "epoch": 1947} {"train_loss": -39.111690521240234, "global_step": 235661, "epoch": 1947} {"train_loss": -39.45100021362305, "global_step": 235662, "epoch": 1947} {"train_loss": -42.40010452270508, "global_step": 235663, "epoch": 1947} {"train_loss": -39.41190719604492, "global_step": 235664, "epoch": 1947} {"train_loss": -38.99946212768555, "global_step": 235665, "epoch": 1947} {"train_loss": -41.595314025878906, "global_step": 235666, "epoch": 1947} {"train_loss": -39.097564697265625, "global_step": 235667, "epoch": 1947} {"train_loss": -41.67112350463867, "global_step": 235668, "epoch": 1947} {"train_loss": -41.924922943115234, "global_step": 235669, "epoch": 1947} {"train_loss": -40.52564239501953, "global_step": 235670, "epoch": 1947} {"train_loss": -41.56532287597656, "global_step": 235671, "epoch": 1947} {"train_loss": -41.83233642578125, "global_step": 235672, "epoch": 1947} {"train_loss": -38.82332229614258, "global_step": 235673, "epoch": 1947} {"train_loss": -41.947967529296875, "global_step": 235674, "epoch": 1947} {"train_loss": -41.16171646118164, "global_step": 235675, "epoch": 1947} {"train_loss": -40.53606033325195, "global_step": 235676, "epoch": 1947} {"train_loss": -42.266693115234375, "global_step": 235677, "epoch": 1947} {"train_loss": -36.92005157470703, "global_step": 235678, "epoch": 1947} {"train_loss": -42.225772857666016, "global_step": 235679, "epoch": 1947} {"train_loss": -38.28616714477539, "global_step": 235680, "epoch": 1947} {"train_loss": -41.38947677612305, "global_step": 235681, "epoch": 1947} {"train_loss": -39.89506912231445, "global_step": 235682, "epoch": 1947} {"train_loss": -40.95574951171875, "global_step": 235683, "epoch": 1947} {"train_loss": -39.19668197631836, "global_step": 235684, "epoch": 1947} {"train_loss": -40.09476852416992, "global_step": 235685, "epoch": 1947} {"train_loss": -40.31131362915039, "global_step": 235686, "epoch": 1947} {"train_loss": -40.75714874267578, "global_step": 235687, "epoch": 1947} {"train_loss": -41.064884185791016, "global_step": 235688, "epoch": 1947} {"train_loss": -39.1262321472168, "global_step": 235689, "epoch": 1947} {"train_loss": -41.28460693359375, "global_step": 235690, "epoch": 1947} {"train_loss": -41.23040771484375, "global_step": 235691, "epoch": 1947} {"train_loss": -42.00600814819336, "global_step": 235692, "epoch": 1947} {"train_loss": -41.68641662597656, "global_step": 235693, "epoch": 1947} {"train_loss": -41.6450080871582, "global_step": 235694, "epoch": 1947} {"train_loss": -41.104278564453125, "global_step": 235695, "epoch": 1947} {"train_loss": -41.73548126220703, "global_step": 235696, "epoch": 1947} {"train_loss": -42.47364044189453, "global_step": 235697, "epoch": 1947} {"train_loss": -41.09259796142578, "global_step": 235698, "epoch": 1947} {"train_loss": -41.424373626708984, "global_step": 235699, "epoch": 1947} {"train_loss": -41.78745651245117, "global_step": 235700, "epoch": 1947} {"train_loss": -43.034881591796875, "global_step": 235701, "epoch": 1947} {"train_loss": -42.6309928894043, "global_step": 235702, "epoch": 1947} {"train_loss": -42.4891357421875, "global_step": 235703, "epoch": 1947} {"train_loss": -41.43837356567383, "global_step": 235704, "epoch": 1947} {"train_loss": -41.99898910522461, "global_step": 235705, "epoch": 1947} {"train_loss": -42.73289108276367, "global_step": 235706, "epoch": 1947} {"train_loss": -41.08647877716821, "global_step": 235707, "epoch": 1947, "val_loss": 2620197.25} {"train_loss": -42.261898040771484, "global_step": 235708, "epoch": 1948} {"train_loss": -40.348201751708984, "global_step": 235709, "epoch": 1948} {"train_loss": -40.83198165893555, "global_step": 235710, "epoch": 1948} {"train_loss": -42.3426513671875, "global_step": 235711, "epoch": 1948} {"train_loss": -42.43449401855469, "global_step": 235712, "epoch": 1948} {"train_loss": -41.41815948486328, "global_step": 235713, "epoch": 1948} {"train_loss": -40.84899139404297, "global_step": 235714, "epoch": 1948} {"train_loss": -42.70291519165039, "global_step": 235715, "epoch": 1948} {"train_loss": -41.24178695678711, "global_step": 235716, "epoch": 1948} {"train_loss": -39.58244323730469, "global_step": 235717, "epoch": 1948} {"train_loss": -41.89040756225586, "global_step": 235718, "epoch": 1948} {"train_loss": -42.11458969116211, "global_step": 235719, "epoch": 1948} {"train_loss": -41.318016052246094, "global_step": 235720, "epoch": 1948} {"train_loss": -39.843746185302734, "global_step": 235721, "epoch": 1948} {"train_loss": -40.62754440307617, "global_step": 235722, "epoch": 1948} {"train_loss": -41.985877990722656, "global_step": 235723, "epoch": 1948} {"train_loss": -41.26722717285156, "global_step": 235724, "epoch": 1948} {"train_loss": -40.18878173828125, "global_step": 235725, "epoch": 1948} {"train_loss": -41.5081672668457, "global_step": 235726, "epoch": 1948} {"train_loss": -41.31109619140625, "global_step": 235727, "epoch": 1948} {"train_loss": -39.409950256347656, "global_step": 235728, "epoch": 1948} {"train_loss": -42.39593505859375, "global_step": 235729, "epoch": 1948} {"train_loss": -37.63697052001953, "global_step": 235730, "epoch": 1948} {"train_loss": -42.008670806884766, "global_step": 235731, "epoch": 1948} {"train_loss": -39.35915756225586, "global_step": 235732, "epoch": 1948} {"train_loss": -39.465267181396484, "global_step": 235733, "epoch": 1948} {"train_loss": -41.32059860229492, "global_step": 235734, "epoch": 1948} {"train_loss": -40.31928253173828, "global_step": 235735, "epoch": 1948} {"train_loss": -41.46234130859375, "global_step": 235736, "epoch": 1948} {"train_loss": -40.50798416137695, "global_step": 235737, "epoch": 1948} {"train_loss": -41.366939544677734, "global_step": 235738, "epoch": 1948} {"train_loss": -40.45353317260742, "global_step": 235739, "epoch": 1948} {"train_loss": -41.62569808959961, "global_step": 235740, "epoch": 1948} {"train_loss": -40.9332160949707, "global_step": 235741, "epoch": 1948} {"train_loss": -40.30586242675781, "global_step": 235742, "epoch": 1948} {"train_loss": -41.41789627075195, "global_step": 235743, "epoch": 1948} {"train_loss": -40.678245544433594, "global_step": 235744, "epoch": 1948} {"train_loss": -40.51389694213867, "global_step": 235745, "epoch": 1948} {"train_loss": -41.13264083862305, "global_step": 235746, "epoch": 1948} {"train_loss": -40.46976089477539, "global_step": 235747, "epoch": 1948} {"train_loss": -41.221107482910156, "global_step": 235748, "epoch": 1948} {"train_loss": -40.649696350097656, "global_step": 235749, "epoch": 1948} {"train_loss": -41.69114685058594, "global_step": 235750, "epoch": 1948} {"train_loss": -41.03971481323242, "global_step": 235751, "epoch": 1948} {"train_loss": -42.061614990234375, "global_step": 235752, "epoch": 1948} {"train_loss": -41.242828369140625, "global_step": 235753, "epoch": 1948} {"train_loss": -41.82857894897461, "global_step": 235754, "epoch": 1948} {"train_loss": -40.95827865600586, "global_step": 235755, "epoch": 1948} {"train_loss": -41.90786361694336, "global_step": 235756, "epoch": 1948} {"train_loss": -41.74768829345703, "global_step": 235757, "epoch": 1948} {"train_loss": -41.21617889404297, "global_step": 235758, "epoch": 1948} {"train_loss": -42.065406799316406, "global_step": 235759, "epoch": 1948} {"train_loss": -41.817256927490234, "global_step": 235760, "epoch": 1948} {"train_loss": -41.1672248840332, "global_step": 235761, "epoch": 1948} {"train_loss": -41.548709869384766, "global_step": 235762, "epoch": 1948} {"train_loss": -42.5757942199707, "global_step": 235763, "epoch": 1948} {"train_loss": -42.03196334838867, "global_step": 235764, "epoch": 1948} {"train_loss": -42.050472259521484, "global_step": 235765, "epoch": 1948} {"train_loss": -42.802162170410156, "global_step": 235766, "epoch": 1948} {"train_loss": -41.87322998046875, "global_step": 235767, "epoch": 1948} {"train_loss": -42.63268280029297, "global_step": 235768, "epoch": 1948} {"train_loss": -41.92525100708008, "global_step": 235769, "epoch": 1948} {"train_loss": -42.137977600097656, "global_step": 235770, "epoch": 1948} {"train_loss": -42.24019241333008, "global_step": 235771, "epoch": 1948} {"train_loss": -42.392757415771484, "global_step": 235772, "epoch": 1948} {"train_loss": -41.925384521484375, "global_step": 235773, "epoch": 1948} {"train_loss": -42.68996047973633, "global_step": 235774, "epoch": 1948} {"train_loss": -42.889644622802734, "global_step": 235775, "epoch": 1948} {"train_loss": -42.58803939819336, "global_step": 235776, "epoch": 1948} {"train_loss": -42.65266418457031, "global_step": 235777, "epoch": 1948} {"train_loss": -42.967613220214844, "global_step": 235778, "epoch": 1948} {"train_loss": -42.2806510925293, "global_step": 235779, "epoch": 1948} {"train_loss": -43.18046188354492, "global_step": 235780, "epoch": 1948} {"train_loss": -42.92897415161133, "global_step": 235781, "epoch": 1948} {"train_loss": -42.571800231933594, "global_step": 235782, "epoch": 1948} {"train_loss": -42.728755950927734, "global_step": 235783, "epoch": 1948} {"train_loss": -42.981056213378906, "global_step": 235784, "epoch": 1948} {"train_loss": -42.816749572753906, "global_step": 235785, "epoch": 1948} {"train_loss": -43.37105178833008, "global_step": 235786, "epoch": 1948} {"train_loss": -43.15715026855469, "global_step": 235787, "epoch": 1948} {"train_loss": -43.07405090332031, "global_step": 235788, "epoch": 1948} {"train_loss": -43.1712532043457, "global_step": 235789, "epoch": 1948} {"train_loss": -43.337425231933594, "global_step": 235790, "epoch": 1948} {"train_loss": -43.469295501708984, "global_step": 235791, "epoch": 1948} {"train_loss": -43.22440719604492, "global_step": 235792, "epoch": 1948} {"train_loss": -43.38465118408203, "global_step": 235793, "epoch": 1948} {"train_loss": -43.54594802856445, "global_step": 235794, "epoch": 1948} {"train_loss": -43.52089309692383, "global_step": 235795, "epoch": 1948} {"train_loss": -43.33388900756836, "global_step": 235796, "epoch": 1948} {"train_loss": -43.491432189941406, "global_step": 235797, "epoch": 1948} {"train_loss": -43.705078125, "global_step": 235798, "epoch": 1948} {"train_loss": -42.33521270751953, "global_step": 235799, "epoch": 1948} {"train_loss": -43.301700592041016, "global_step": 235800, "epoch": 1948} {"train_loss": -43.313690185546875, "global_step": 235801, "epoch": 1948} {"train_loss": -43.55245590209961, "global_step": 235802, "epoch": 1948} {"train_loss": -42.68528366088867, "global_step": 235803, "epoch": 1948} {"train_loss": -43.23054122924805, "global_step": 235804, "epoch": 1948} {"train_loss": -43.412479400634766, "global_step": 235805, "epoch": 1948} {"train_loss": -42.6336669921875, "global_step": 235806, "epoch": 1948} {"train_loss": -42.68943786621094, "global_step": 235807, "epoch": 1948} {"train_loss": -43.23398971557617, "global_step": 235808, "epoch": 1948} {"train_loss": -42.180362701416016, "global_step": 235809, "epoch": 1948} {"train_loss": -42.632232666015625, "global_step": 235810, "epoch": 1948} {"train_loss": -43.537010192871094, "global_step": 235811, "epoch": 1948} {"train_loss": -42.4608268737793, "global_step": 235812, "epoch": 1948} {"train_loss": -42.57265853881836, "global_step": 235813, "epoch": 1948} {"train_loss": -43.31663131713867, "global_step": 235814, "epoch": 1948} {"train_loss": -43.22481918334961, "global_step": 235815, "epoch": 1948} {"train_loss": -42.70437240600586, "global_step": 235816, "epoch": 1948} {"train_loss": -43.33112335205078, "global_step": 235817, "epoch": 1948} {"train_loss": -42.9518928527832, "global_step": 235818, "epoch": 1948} {"train_loss": -42.620723724365234, "global_step": 235819, "epoch": 1948} {"train_loss": -42.764854431152344, "global_step": 235820, "epoch": 1948} {"train_loss": -42.53175735473633, "global_step": 235821, "epoch": 1948} {"train_loss": -41.484130859375, "global_step": 235822, "epoch": 1948} {"train_loss": -41.946807861328125, "global_step": 235823, "epoch": 1948} {"train_loss": -42.52582550048828, "global_step": 235824, "epoch": 1948} {"train_loss": -42.82254409790039, "global_step": 235825, "epoch": 1948} {"train_loss": -41.564456939697266, "global_step": 235826, "epoch": 1948} {"train_loss": -41.14210891723633, "global_step": 235827, "epoch": 1948} {"train_loss": -42.015869109098574, "global_step": 235828, "epoch": 1948, "val_loss": 2642094.25} {"train_loss": -41.78194808959961, "global_step": 235829, "epoch": 1949} {"train_loss": -40.87084197998047, "global_step": 235830, "epoch": 1949} {"train_loss": -41.04456329345703, "global_step": 235831, "epoch": 1949} {"train_loss": -41.32094192504883, "global_step": 235832, "epoch": 1949} {"train_loss": -40.71493911743164, "global_step": 235833, "epoch": 1949} {"train_loss": -42.1139030456543, "global_step": 235834, "epoch": 1949} {"train_loss": -43.19013595581055, "global_step": 235835, "epoch": 1949} {"train_loss": -41.0860481262207, "global_step": 235836, "epoch": 1949} {"train_loss": -39.557281494140625, "global_step": 235837, "epoch": 1949} {"train_loss": -41.6596794128418, "global_step": 235838, "epoch": 1949} {"train_loss": -42.714454650878906, "global_step": 235839, "epoch": 1949} {"train_loss": -42.138755798339844, "global_step": 235840, "epoch": 1949} {"train_loss": -42.2049560546875, "global_step": 235841, "epoch": 1949} {"train_loss": -43.020381927490234, "global_step": 235842, "epoch": 1949} {"train_loss": -41.733577728271484, "global_step": 235843, "epoch": 1949} {"train_loss": -41.72217559814453, "global_step": 235844, "epoch": 1949} {"train_loss": -42.94987869262695, "global_step": 235845, "epoch": 1949} {"train_loss": -42.02682113647461, "global_step": 235846, "epoch": 1949} {"train_loss": -42.34687423706055, "global_step": 235847, "epoch": 1949} {"train_loss": -42.84650802612305, "global_step": 235848, "epoch": 1949} {"train_loss": -41.987483978271484, "global_step": 235849, "epoch": 1949} {"train_loss": -41.29280471801758, "global_step": 235850, "epoch": 1949} {"train_loss": -42.977901458740234, "global_step": 235851, "epoch": 1949} {"train_loss": -42.775474548339844, "global_step": 235852, "epoch": 1949} {"train_loss": -42.523773193359375, "global_step": 235853, "epoch": 1949} {"train_loss": -43.16571807861328, "global_step": 235854, "epoch": 1949} {"train_loss": -42.98580551147461, "global_step": 235855, "epoch": 1949} {"train_loss": -43.0003662109375, "global_step": 235856, "epoch": 1949} {"train_loss": -43.283607482910156, "global_step": 235857, "epoch": 1949} {"train_loss": -42.22932052612305, "global_step": 235858, "epoch": 1949} {"train_loss": -42.8791618347168, "global_step": 235859, "epoch": 1949} {"train_loss": -42.350589752197266, "global_step": 235860, "epoch": 1949} {"train_loss": -41.992305755615234, "global_step": 235861, "epoch": 1949} {"train_loss": -43.07257080078125, "global_step": 235862, "epoch": 1949} {"train_loss": -42.84864807128906, "global_step": 235863, "epoch": 1949} {"train_loss": -42.135223388671875, "global_step": 235864, "epoch": 1949} {"train_loss": -42.32716751098633, "global_step": 235865, "epoch": 1949} {"train_loss": -42.7433967590332, "global_step": 235866, "epoch": 1949} {"train_loss": -42.82046127319336, "global_step": 235867, "epoch": 1949} {"train_loss": -42.5871467590332, "global_step": 235868, "epoch": 1949} {"train_loss": -42.47874069213867, "global_step": 235869, "epoch": 1949} {"train_loss": -42.645538330078125, "global_step": 235870, "epoch": 1949} {"train_loss": -43.07488250732422, "global_step": 235871, "epoch": 1949} {"train_loss": -43.09609603881836, "global_step": 235872, "epoch": 1949} {"train_loss": -42.96894454956055, "global_step": 235873, "epoch": 1949} {"train_loss": -43.284515380859375, "global_step": 235874, "epoch": 1949} {"train_loss": -43.464759826660156, "global_step": 235875, "epoch": 1949} {"train_loss": -43.38655090332031, "global_step": 235876, "epoch": 1949} {"train_loss": -43.43085861206055, "global_step": 235877, "epoch": 1949} {"train_loss": -43.52838897705078, "global_step": 235878, "epoch": 1949} {"train_loss": -43.77759552001953, "global_step": 235879, "epoch": 1949} {"train_loss": -43.38124084472656, "global_step": 235880, "epoch": 1949} {"train_loss": -42.102779388427734, "global_step": 235881, "epoch": 1949} {"train_loss": -43.52607727050781, "global_step": 235882, "epoch": 1949} {"train_loss": -43.64193344116211, "global_step": 235883, "epoch": 1949} {"train_loss": -43.0566520690918, "global_step": 235884, "epoch": 1949} {"train_loss": -43.639564514160156, "global_step": 235885, "epoch": 1949} {"train_loss": -43.138885498046875, "global_step": 235886, "epoch": 1949} {"train_loss": -42.16718292236328, "global_step": 235887, "epoch": 1949} {"train_loss": -42.686397552490234, "global_step": 235888, "epoch": 1949} {"train_loss": -43.327415466308594, "global_step": 235889, "epoch": 1949} {"train_loss": -43.39805221557617, "global_step": 235890, "epoch": 1949} {"train_loss": -43.48887252807617, "global_step": 235891, "epoch": 1949} {"train_loss": -43.43931198120117, "global_step": 235892, "epoch": 1949} {"train_loss": -43.23472595214844, "global_step": 235893, "epoch": 1949} {"train_loss": -43.21450424194336, "global_step": 235894, "epoch": 1949} {"train_loss": -42.968910217285156, "global_step": 235895, "epoch": 1949} {"train_loss": -43.604217529296875, "global_step": 235896, "epoch": 1949} {"train_loss": -43.775718688964844, "global_step": 235897, "epoch": 1949} {"train_loss": -43.05550003051758, "global_step": 235898, "epoch": 1949} {"train_loss": -43.37642288208008, "global_step": 235899, "epoch": 1949} {"train_loss": -43.431400299072266, "global_step": 235900, "epoch": 1949} {"train_loss": -43.062644958496094, "global_step": 235901, "epoch": 1949} {"train_loss": -43.08106231689453, "global_step": 235902, "epoch": 1949} {"train_loss": -42.83783721923828, "global_step": 235903, "epoch": 1949} {"train_loss": -42.37881088256836, "global_step": 235904, "epoch": 1949} {"train_loss": -41.3072395324707, "global_step": 235905, "epoch": 1949} {"train_loss": -42.42516326904297, "global_step": 235906, "epoch": 1949} {"train_loss": -43.102500915527344, "global_step": 235907, "epoch": 1949} {"train_loss": -42.251922607421875, "global_step": 235908, "epoch": 1949} {"train_loss": -42.60956954956055, "global_step": 235909, "epoch": 1949} {"train_loss": -41.4825439453125, "global_step": 235910, "epoch": 1949} {"train_loss": -41.78258514404297, "global_step": 235911, "epoch": 1949} {"train_loss": -42.73027420043945, "global_step": 235912, "epoch": 1949} {"train_loss": -41.127376556396484, "global_step": 235913, "epoch": 1949} {"train_loss": -42.26359176635742, "global_step": 235914, "epoch": 1949} {"train_loss": -42.85015869140625, "global_step": 235915, "epoch": 1949} {"train_loss": -42.93842697143555, "global_step": 235916, "epoch": 1949} {"train_loss": -42.236236572265625, "global_step": 235917, "epoch": 1949} {"train_loss": -42.73591995239258, "global_step": 235918, "epoch": 1949} {"train_loss": -41.27345275878906, "global_step": 235919, "epoch": 1949} {"train_loss": -42.27348709106445, "global_step": 235920, "epoch": 1949} {"train_loss": -43.094970703125, "global_step": 235921, "epoch": 1949} {"train_loss": -42.49394607543945, "global_step": 235922, "epoch": 1949} {"train_loss": -42.33278274536133, "global_step": 235923, "epoch": 1949} {"train_loss": -43.13481140136719, "global_step": 235924, "epoch": 1949} {"train_loss": -42.23545837402344, "global_step": 235925, "epoch": 1949} {"train_loss": -42.5404167175293, "global_step": 235926, "epoch": 1949} {"train_loss": -42.96440505981445, "global_step": 235927, "epoch": 1949} {"train_loss": -42.820899963378906, "global_step": 235928, "epoch": 1949} {"train_loss": -43.50407028198242, "global_step": 235929, "epoch": 1949} {"train_loss": -43.20063400268555, "global_step": 235930, "epoch": 1949} {"train_loss": -41.62146759033203, "global_step": 235931, "epoch": 1949} {"train_loss": -42.60508346557617, "global_step": 235932, "epoch": 1949} {"train_loss": -40.91100311279297, "global_step": 235933, "epoch": 1949} {"train_loss": -42.08662796020508, "global_step": 235934, "epoch": 1949} {"train_loss": -41.757972717285156, "global_step": 235935, "epoch": 1949} {"train_loss": -42.0113525390625, "global_step": 235936, "epoch": 1949} {"train_loss": -41.51857376098633, "global_step": 235937, "epoch": 1949} {"train_loss": -42.33798599243164, "global_step": 235938, "epoch": 1949} {"train_loss": -42.8148078918457, "global_step": 235939, "epoch": 1949} {"train_loss": -41.45939254760742, "global_step": 235940, "epoch": 1949} {"train_loss": -41.911407470703125, "global_step": 235941, "epoch": 1949} {"train_loss": -43.458126068115234, "global_step": 235942, "epoch": 1949} {"train_loss": -42.06947708129883, "global_step": 235943, "epoch": 1949} {"train_loss": -42.780452728271484, "global_step": 235944, "epoch": 1949} {"train_loss": -42.74979782104492, "global_step": 235945, "epoch": 1949} {"train_loss": -42.296875, "global_step": 235946, "epoch": 1949} {"train_loss": -42.268733978271484, "global_step": 235947, "epoch": 1949} {"train_loss": -43.30824279785156, "global_step": 235948, "epoch": 1949} {"train_loss": -42.557840142368285, "global_step": 235949, "epoch": 1949, "val_loss": 2579363.0} {"train_loss": -40.90790557861328, "global_step": 235950, "epoch": 1950} {"train_loss": -41.73173141479492, "global_step": 235951, "epoch": 1950} {"train_loss": -42.614501953125, "global_step": 235952, "epoch": 1950} {"train_loss": -42.51510238647461, "global_step": 235953, "epoch": 1950} {"train_loss": -42.72817611694336, "global_step": 235954, "epoch": 1950} {"train_loss": -42.49542236328125, "global_step": 235955, "epoch": 1950} {"train_loss": -42.422237396240234, "global_step": 235956, "epoch": 1950} {"train_loss": -42.42745590209961, "global_step": 235957, "epoch": 1950} {"train_loss": -42.73778533935547, "global_step": 235958, "epoch": 1950} {"train_loss": -41.907711029052734, "global_step": 235959, "epoch": 1950} {"train_loss": -42.60492706298828, "global_step": 235960, "epoch": 1950} {"train_loss": -42.978939056396484, "global_step": 235961, "epoch": 1950} {"train_loss": -41.4434928894043, "global_step": 235962, "epoch": 1950} {"train_loss": -41.718719482421875, "global_step": 235963, "epoch": 1950} {"train_loss": -41.35250473022461, "global_step": 235964, "epoch": 1950} {"train_loss": -43.39207077026367, "global_step": 235965, "epoch": 1950} {"train_loss": -43.103694915771484, "global_step": 235966, "epoch": 1950} {"train_loss": -42.8213005065918, "global_step": 235967, "epoch": 1950} {"train_loss": -42.624481201171875, "global_step": 235968, "epoch": 1950} {"train_loss": -42.999168395996094, "global_step": 235969, "epoch": 1950} {"train_loss": -41.936336517333984, "global_step": 235970, "epoch": 1950} {"train_loss": -42.61807632446289, "global_step": 235971, "epoch": 1950} {"train_loss": -42.15719223022461, "global_step": 235972, "epoch": 1950} {"train_loss": -42.54397201538086, "global_step": 235973, "epoch": 1950} {"train_loss": -43.48331832885742, "global_step": 235974, "epoch": 1950} {"train_loss": -40.7132682800293, "global_step": 235975, "epoch": 1950} {"train_loss": -41.065216064453125, "global_step": 235976, "epoch": 1950} {"train_loss": -41.65897750854492, "global_step": 235977, "epoch": 1950} {"train_loss": -42.140663146972656, "global_step": 235978, "epoch": 1950} {"train_loss": -41.518245697021484, "global_step": 235979, "epoch": 1950} {"train_loss": -41.40008544921875, "global_step": 235980, "epoch": 1950} {"train_loss": -40.97856140136719, "global_step": 235981, "epoch": 1950} {"train_loss": -41.89752960205078, "global_step": 235982, "epoch": 1950} {"train_loss": -41.821022033691406, "global_step": 235983, "epoch": 1950} {"train_loss": -40.85419464111328, "global_step": 235984, "epoch": 1950} {"train_loss": -41.43292236328125, "global_step": 235985, "epoch": 1950} {"train_loss": -42.63643264770508, "global_step": 235986, "epoch": 1950} {"train_loss": -41.25004196166992, "global_step": 235987, "epoch": 1950} {"train_loss": -41.75474166870117, "global_step": 235988, "epoch": 1950} {"train_loss": -39.8314094543457, "global_step": 235989, "epoch": 1950} {"train_loss": -41.69628143310547, "global_step": 235990, "epoch": 1950} {"train_loss": -41.36532211303711, "global_step": 235991, "epoch": 1950} {"train_loss": -41.3362922668457, "global_step": 235992, "epoch": 1950} {"train_loss": -42.9807014465332, "global_step": 235993, "epoch": 1950} {"train_loss": -42.4089469909668, "global_step": 235994, "epoch": 1950} {"train_loss": -41.41078567504883, "global_step": 235995, "epoch": 1950} {"train_loss": -41.370540618896484, "global_step": 235996, "epoch": 1950} {"train_loss": -42.505165100097656, "global_step": 235997, "epoch": 1950} {"train_loss": -42.551273345947266, "global_step": 235998, "epoch": 1950} {"train_loss": -42.65200424194336, "global_step": 235999, "epoch": 1950} {"train_loss": -42.97465896606445, "global_step": 236000, "epoch": 1950} {"train_loss": -43.23979568481445, "global_step": 236001, "epoch": 1950} {"train_loss": -41.80465316772461, "global_step": 236002, "epoch": 1950} {"train_loss": -41.971534729003906, "global_step": 236003, "epoch": 1950} {"train_loss": -42.482723236083984, "global_step": 236004, "epoch": 1950} {"train_loss": -40.94298553466797, "global_step": 236005, "epoch": 1950} {"train_loss": -40.813323974609375, "global_step": 236006, "epoch": 1950} {"train_loss": -42.37276840209961, "global_step": 236007, "epoch": 1950} {"train_loss": -42.71955108642578, "global_step": 236008, "epoch": 1950} {"train_loss": -42.79248809814453, "global_step": 236009, "epoch": 1950} {"train_loss": -42.78536605834961, "global_step": 236010, "epoch": 1950} {"train_loss": -42.029762268066406, "global_step": 236011, "epoch": 1950} {"train_loss": -42.5643424987793, "global_step": 236012, "epoch": 1950} {"train_loss": -42.739803314208984, "global_step": 236013, "epoch": 1950} {"train_loss": -42.60905838012695, "global_step": 236014, "epoch": 1950} {"train_loss": -42.5893440246582, "global_step": 236015, "epoch": 1950} {"train_loss": -42.783538818359375, "global_step": 236016, "epoch": 1950} {"train_loss": -42.44754409790039, "global_step": 236017, "epoch": 1950} {"train_loss": -42.60920333862305, "global_step": 236018, "epoch": 1950} {"train_loss": -42.59579086303711, "global_step": 236019, "epoch": 1950} {"train_loss": -42.835182189941406, "global_step": 236020, "epoch": 1950} {"train_loss": -42.746429443359375, "global_step": 236021, "epoch": 1950} {"train_loss": -42.670555114746094, "global_step": 236022, "epoch": 1950} {"train_loss": -42.66013717651367, "global_step": 236023, "epoch": 1950} {"train_loss": -42.929317474365234, "global_step": 236024, "epoch": 1950} {"train_loss": -42.493072509765625, "global_step": 236025, "epoch": 1950} {"train_loss": -42.55564880371094, "global_step": 236026, "epoch": 1950} {"train_loss": -43.0142707824707, "global_step": 236027, "epoch": 1950} {"train_loss": -43.0826530456543, "global_step": 236028, "epoch": 1950} {"train_loss": -42.539241790771484, "global_step": 236029, "epoch": 1950} {"train_loss": -41.39220428466797, "global_step": 236030, "epoch": 1950} {"train_loss": -40.283199310302734, "global_step": 236031, "epoch": 1950} {"train_loss": -42.7034797668457, "global_step": 236032, "epoch": 1950} {"train_loss": -41.135650634765625, "global_step": 236033, "epoch": 1950} {"train_loss": -39.612972259521484, "global_step": 236034, "epoch": 1950} {"train_loss": -40.55488204956055, "global_step": 236035, "epoch": 1950} {"train_loss": -42.3920783996582, "global_step": 236036, "epoch": 1950} {"train_loss": -41.719459533691406, "global_step": 236037, "epoch": 1950} {"train_loss": -40.42348861694336, "global_step": 236038, "epoch": 1950} {"train_loss": -41.546600341796875, "global_step": 236039, "epoch": 1950} {"train_loss": -41.756263732910156, "global_step": 236040, "epoch": 1950} {"train_loss": -41.52423858642578, "global_step": 236041, "epoch": 1950} {"train_loss": -41.7921028137207, "global_step": 236042, "epoch": 1950} {"train_loss": -42.048187255859375, "global_step": 236043, "epoch": 1950} {"train_loss": -42.15018081665039, "global_step": 236044, "epoch": 1950} {"train_loss": -42.26006317138672, "global_step": 236045, "epoch": 1950} {"train_loss": -42.129512786865234, "global_step": 236046, "epoch": 1950} {"train_loss": -42.630611419677734, "global_step": 236047, "epoch": 1950} {"train_loss": -42.61481857299805, "global_step": 236048, "epoch": 1950} {"train_loss": -41.932769775390625, "global_step": 236049, "epoch": 1950} {"train_loss": -41.94191360473633, "global_step": 236050, "epoch": 1950} {"train_loss": -42.20595932006836, "global_step": 236051, "epoch": 1950} {"train_loss": -41.819095611572266, "global_step": 236052, "epoch": 1950} {"train_loss": -42.39436721801758, "global_step": 236053, "epoch": 1950} {"train_loss": -41.42808151245117, "global_step": 236054, "epoch": 1950} {"train_loss": -42.654327392578125, "global_step": 236055, "epoch": 1950} {"train_loss": -42.36491394042969, "global_step": 236056, "epoch": 1950} {"train_loss": -42.78115463256836, "global_step": 236057, "epoch": 1950} {"train_loss": -42.065059661865234, "global_step": 236058, "epoch": 1950} {"train_loss": -42.332332611083984, "global_step": 236059, "epoch": 1950} {"train_loss": -42.7510871887207, "global_step": 236060, "epoch": 1950} {"train_loss": -42.18687057495117, "global_step": 236061, "epoch": 1950} {"train_loss": -43.210811614990234, "global_step": 236062, "epoch": 1950} {"train_loss": -42.3933219909668, "global_step": 236063, "epoch": 1950} {"train_loss": -43.00078582763672, "global_step": 236064, "epoch": 1950} {"train_loss": -43.283992767333984, "global_step": 236065, "epoch": 1950} {"train_loss": -43.27079391479492, "global_step": 236066, "epoch": 1950} {"train_loss": -43.36021423339844, "global_step": 236067, "epoch": 1950} {"train_loss": -43.25023651123047, "global_step": 236068, "epoch": 1950} {"train_loss": -43.2472038269043, "global_step": 236069, "epoch": 1950} {"train_loss": -42.188043011121515, "global_step": 236070, "epoch": 1950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2606937.25} {"train_loss": -43.43793869018555, "global_step": 236071, "epoch": 1951} {"train_loss": -43.52181625366211, "global_step": 236072, "epoch": 1951} {"train_loss": -43.4109992980957, "global_step": 236073, "epoch": 1951} {"train_loss": -43.40068435668945, "global_step": 236074, "epoch": 1951} {"train_loss": -43.84904098510742, "global_step": 236075, "epoch": 1951} {"train_loss": -43.323204040527344, "global_step": 236076, "epoch": 1951} {"train_loss": -43.07588195800781, "global_step": 236077, "epoch": 1951} {"train_loss": -43.53084945678711, "global_step": 236078, "epoch": 1951} {"train_loss": -43.42436218261719, "global_step": 236079, "epoch": 1951} {"train_loss": -43.77706527709961, "global_step": 236080, "epoch": 1951} {"train_loss": -43.43545150756836, "global_step": 236081, "epoch": 1951} {"train_loss": -43.6944694519043, "global_step": 236082, "epoch": 1951} {"train_loss": -43.78289794921875, "global_step": 236083, "epoch": 1951} {"train_loss": -43.761077880859375, "global_step": 236084, "epoch": 1951} {"train_loss": -43.361427307128906, "global_step": 236085, "epoch": 1951} {"train_loss": -43.4217643737793, "global_step": 236086, "epoch": 1951} {"train_loss": -43.792572021484375, "global_step": 236087, "epoch": 1951} {"train_loss": -42.80577850341797, "global_step": 236088, "epoch": 1951} {"train_loss": -42.66179275512695, "global_step": 236089, "epoch": 1951} {"train_loss": -43.97101593017578, "global_step": 236090, "epoch": 1951} {"train_loss": -43.23698043823242, "global_step": 236091, "epoch": 1951} {"train_loss": -42.76152420043945, "global_step": 236092, "epoch": 1951} {"train_loss": -41.89311981201172, "global_step": 236093, "epoch": 1951} {"train_loss": -42.449092864990234, "global_step": 236094, "epoch": 1951} {"train_loss": -42.61438751220703, "global_step": 236095, "epoch": 1951} {"train_loss": -42.35200881958008, "global_step": 236096, "epoch": 1951} {"train_loss": -40.37016677856445, "global_step": 236097, "epoch": 1951} {"train_loss": -42.6660270690918, "global_step": 236098, "epoch": 1951} {"train_loss": -43.28778076171875, "global_step": 236099, "epoch": 1951} {"train_loss": -42.973304748535156, "global_step": 236100, "epoch": 1951} {"train_loss": -41.4983024597168, "global_step": 236101, "epoch": 1951} {"train_loss": -41.23848342895508, "global_step": 236102, "epoch": 1951} {"train_loss": -42.246517181396484, "global_step": 236103, "epoch": 1951} {"train_loss": -43.02775573730469, "global_step": 236104, "epoch": 1951} {"train_loss": -41.90861511230469, "global_step": 236105, "epoch": 1951} {"train_loss": -39.92156219482422, "global_step": 236106, "epoch": 1951} {"train_loss": -41.41067123413086, "global_step": 236107, "epoch": 1951} {"train_loss": -43.193992614746094, "global_step": 236108, "epoch": 1951} {"train_loss": -42.961483001708984, "global_step": 236109, "epoch": 1951} {"train_loss": -43.19175338745117, "global_step": 236110, "epoch": 1951} {"train_loss": -42.08056640625, "global_step": 236111, "epoch": 1951} {"train_loss": -42.08692169189453, "global_step": 236112, "epoch": 1951} {"train_loss": -43.01639938354492, "global_step": 236113, "epoch": 1951} {"train_loss": -41.244449615478516, "global_step": 236114, "epoch": 1951} {"train_loss": -42.462242126464844, "global_step": 236115, "epoch": 1951} {"train_loss": -43.004798889160156, "global_step": 236116, "epoch": 1951} {"train_loss": -42.87470626831055, "global_step": 236117, "epoch": 1951} {"train_loss": -42.7877197265625, "global_step": 236118, "epoch": 1951} {"train_loss": -42.841827392578125, "global_step": 236119, "epoch": 1951} {"train_loss": -43.33091354370117, "global_step": 236120, "epoch": 1951} {"train_loss": -43.03304672241211, "global_step": 236121, "epoch": 1951} {"train_loss": -43.33086013793945, "global_step": 236122, "epoch": 1951} {"train_loss": -43.47600173950195, "global_step": 236123, "epoch": 1951} {"train_loss": -42.42790603637695, "global_step": 236124, "epoch": 1951} {"train_loss": -43.56417465209961, "global_step": 236125, "epoch": 1951} {"train_loss": -42.7255744934082, "global_step": 236126, "epoch": 1951} {"train_loss": -43.26336669921875, "global_step": 236127, "epoch": 1951} {"train_loss": -41.963409423828125, "global_step": 236128, "epoch": 1951} {"train_loss": -42.09275436401367, "global_step": 236129, "epoch": 1951} {"train_loss": -41.768798828125, "global_step": 236130, "epoch": 1951} {"train_loss": -42.64007568359375, "global_step": 236131, "epoch": 1951} {"train_loss": -42.293922424316406, "global_step": 236132, "epoch": 1951} {"train_loss": -42.682621002197266, "global_step": 236133, "epoch": 1951} {"train_loss": -41.550933837890625, "global_step": 236134, "epoch": 1951} {"train_loss": -43.342323303222656, "global_step": 236135, "epoch": 1951} {"train_loss": -42.124183654785156, "global_step": 236136, "epoch": 1951} {"train_loss": -41.22216796875, "global_step": 236137, "epoch": 1951} {"train_loss": -42.45181655883789, "global_step": 236138, "epoch": 1951} {"train_loss": -42.0825080871582, "global_step": 236139, "epoch": 1951} {"train_loss": -41.761558532714844, "global_step": 236140, "epoch": 1951} {"train_loss": -40.988677978515625, "global_step": 236141, "epoch": 1951} {"train_loss": -41.46931838989258, "global_step": 236142, "epoch": 1951} {"train_loss": -42.194313049316406, "global_step": 236143, "epoch": 1951} {"train_loss": -42.721435546875, "global_step": 236144, "epoch": 1951} {"train_loss": -41.666847229003906, "global_step": 236145, "epoch": 1951} {"train_loss": -41.68202590942383, "global_step": 236146, "epoch": 1951} {"train_loss": -40.58592987060547, "global_step": 236147, "epoch": 1951} {"train_loss": -38.14007568359375, "global_step": 236148, "epoch": 1951} {"train_loss": -41.756080627441406, "global_step": 236149, "epoch": 1951} {"train_loss": -41.95515060424805, "global_step": 236150, "epoch": 1951} {"train_loss": -42.194671630859375, "global_step": 236151, "epoch": 1951} {"train_loss": -41.66976547241211, "global_step": 236152, "epoch": 1951} {"train_loss": -41.74129104614258, "global_step": 236153, "epoch": 1951} {"train_loss": -42.7026481628418, "global_step": 236154, "epoch": 1951} {"train_loss": -41.44196701049805, "global_step": 236155, "epoch": 1951} {"train_loss": -41.4649658203125, "global_step": 236156, "epoch": 1951} {"train_loss": -41.25141525268555, "global_step": 236157, "epoch": 1951} {"train_loss": -43.15360641479492, "global_step": 236158, "epoch": 1951} {"train_loss": -41.75080490112305, "global_step": 236159, "epoch": 1951} {"train_loss": -40.30112838745117, "global_step": 236160, "epoch": 1951} {"train_loss": -42.195220947265625, "global_step": 236161, "epoch": 1951} {"train_loss": -43.443267822265625, "global_step": 236162, "epoch": 1951} {"train_loss": -42.45030975341797, "global_step": 236163, "epoch": 1951} {"train_loss": -42.45307159423828, "global_step": 236164, "epoch": 1951} {"train_loss": -41.70907211303711, "global_step": 236165, "epoch": 1951} {"train_loss": -42.35859680175781, "global_step": 236166, "epoch": 1951} {"train_loss": -42.05137252807617, "global_step": 236167, "epoch": 1951} {"train_loss": -42.467529296875, "global_step": 236168, "epoch": 1951} {"train_loss": -42.117462158203125, "global_step": 236169, "epoch": 1951} {"train_loss": -42.80940246582031, "global_step": 236170, "epoch": 1951} {"train_loss": -41.028018951416016, "global_step": 236171, "epoch": 1951} {"train_loss": -42.137672424316406, "global_step": 236172, "epoch": 1951} {"train_loss": -42.434288024902344, "global_step": 236173, "epoch": 1951} {"train_loss": -41.85551834106445, "global_step": 236174, "epoch": 1951} {"train_loss": -42.20022201538086, "global_step": 236175, "epoch": 1951} {"train_loss": -42.744693756103516, "global_step": 236176, "epoch": 1951} {"train_loss": -41.597652435302734, "global_step": 236177, "epoch": 1951} {"train_loss": -42.056392669677734, "global_step": 236178, "epoch": 1951} {"train_loss": -43.28711700439453, "global_step": 236179, "epoch": 1951} {"train_loss": -42.29350662231445, "global_step": 236180, "epoch": 1951} {"train_loss": -42.68132400512695, "global_step": 236181, "epoch": 1951} {"train_loss": -42.50059509277344, "global_step": 236182, "epoch": 1951} {"train_loss": -39.17424392700195, "global_step": 236183, "epoch": 1951} {"train_loss": -41.58428955078125, "global_step": 236184, "epoch": 1951} {"train_loss": -41.71308135986328, "global_step": 236185, "epoch": 1951} {"train_loss": -39.30093002319336, "global_step": 236186, "epoch": 1951} {"train_loss": -41.85517501831055, "global_step": 236187, "epoch": 1951} {"train_loss": -38.94125747680664, "global_step": 236188, "epoch": 1951} {"train_loss": -43.00773239135742, "global_step": 236189, "epoch": 1951} {"train_loss": -38.99928665161133, "global_step": 236190, "epoch": 1951} {"train_loss": -42.30430845780806, "global_step": 236191, "epoch": 1951, "val_loss": 2571765.75} {"train_loss": -39.45103454589844, "global_step": 236192, "epoch": 1952} {"train_loss": -41.71464538574219, "global_step": 236193, "epoch": 1952} {"train_loss": -41.63837432861328, "global_step": 236194, "epoch": 1952} {"train_loss": -39.68245315551758, "global_step": 236195, "epoch": 1952} {"train_loss": -42.6317024230957, "global_step": 236196, "epoch": 1952} {"train_loss": -39.05202865600586, "global_step": 236197, "epoch": 1952} {"train_loss": -42.563968658447266, "global_step": 236198, "epoch": 1952} {"train_loss": -40.71747970581055, "global_step": 236199, "epoch": 1952} {"train_loss": -41.557125091552734, "global_step": 236200, "epoch": 1952} {"train_loss": -41.45283889770508, "global_step": 236201, "epoch": 1952} {"train_loss": -42.25922775268555, "global_step": 236202, "epoch": 1952} {"train_loss": -42.19425582885742, "global_step": 236203, "epoch": 1952} {"train_loss": -42.17476272583008, "global_step": 236204, "epoch": 1952} {"train_loss": -42.17893981933594, "global_step": 236205, "epoch": 1952} {"train_loss": -42.03428268432617, "global_step": 236206, "epoch": 1952} {"train_loss": -42.008819580078125, "global_step": 236207, "epoch": 1952} {"train_loss": -42.120357513427734, "global_step": 236208, "epoch": 1952} {"train_loss": -42.34113693237305, "global_step": 236209, "epoch": 1952} {"train_loss": -42.7113151550293, "global_step": 236210, "epoch": 1952} {"train_loss": -42.4429931640625, "global_step": 236211, "epoch": 1952} {"train_loss": -42.912960052490234, "global_step": 236212, "epoch": 1952} {"train_loss": -42.78084945678711, "global_step": 236213, "epoch": 1952} {"train_loss": -43.07167434692383, "global_step": 236214, "epoch": 1952} {"train_loss": -42.988983154296875, "global_step": 236215, "epoch": 1952} {"train_loss": -43.110877990722656, "global_step": 236216, "epoch": 1952} {"train_loss": -42.70504379272461, "global_step": 236217, "epoch": 1952} {"train_loss": -42.98031234741211, "global_step": 236218, "epoch": 1952} {"train_loss": -42.9030876159668, "global_step": 236219, "epoch": 1952} {"train_loss": -43.19696807861328, "global_step": 236220, "epoch": 1952} {"train_loss": -42.767478942871094, "global_step": 236221, "epoch": 1952} {"train_loss": -43.179481506347656, "global_step": 236222, "epoch": 1952} {"train_loss": -43.268184661865234, "global_step": 236223, "epoch": 1952} {"train_loss": -43.0323371887207, "global_step": 236224, "epoch": 1952} {"train_loss": -43.320953369140625, "global_step": 236225, "epoch": 1952} {"train_loss": -43.2496337890625, "global_step": 236226, "epoch": 1952} {"train_loss": -43.61163330078125, "global_step": 236227, "epoch": 1952} {"train_loss": -42.84024429321289, "global_step": 236228, "epoch": 1952} {"train_loss": -43.99506759643555, "global_step": 236229, "epoch": 1952} {"train_loss": -43.24233627319336, "global_step": 236230, "epoch": 1952} {"train_loss": -43.87931823730469, "global_step": 236231, "epoch": 1952} {"train_loss": -43.69721221923828, "global_step": 236232, "epoch": 1952} {"train_loss": -43.13300704956055, "global_step": 236233, "epoch": 1952} {"train_loss": -43.32497787475586, "global_step": 236234, "epoch": 1952} {"train_loss": -43.68913650512695, "global_step": 236235, "epoch": 1952} {"train_loss": -43.305397033691406, "global_step": 236236, "epoch": 1952} {"train_loss": -43.48875045776367, "global_step": 236237, "epoch": 1952} {"train_loss": -43.32984161376953, "global_step": 236238, "epoch": 1952} {"train_loss": -43.636592864990234, "global_step": 236239, "epoch": 1952} {"train_loss": -43.505306243896484, "global_step": 236240, "epoch": 1952} {"train_loss": -43.48747634887695, "global_step": 236241, "epoch": 1952} {"train_loss": -43.62699508666992, "global_step": 236242, "epoch": 1952} {"train_loss": -42.97418212890625, "global_step": 236243, "epoch": 1952} {"train_loss": -42.098304748535156, "global_step": 236244, "epoch": 1952} {"train_loss": -42.045745849609375, "global_step": 236245, "epoch": 1952} {"train_loss": -40.87971878051758, "global_step": 236246, "epoch": 1952} {"train_loss": -39.46075439453125, "global_step": 236247, "epoch": 1952} {"train_loss": -43.23693084716797, "global_step": 236248, "epoch": 1952} {"train_loss": -40.85121154785156, "global_step": 236249, "epoch": 1952} {"train_loss": -38.12741470336914, "global_step": 236250, "epoch": 1952} {"train_loss": -42.060909271240234, "global_step": 236251, "epoch": 1952} {"train_loss": -36.247798919677734, "global_step": 236252, "epoch": 1952} {"train_loss": -36.15534210205078, "global_step": 236253, "epoch": 1952} {"train_loss": -40.6536979675293, "global_step": 236254, "epoch": 1952} {"train_loss": -37.59684371948242, "global_step": 236255, "epoch": 1952} {"train_loss": -39.65296936035156, "global_step": 236256, "epoch": 1952} {"train_loss": -37.538761138916016, "global_step": 236257, "epoch": 1952} {"train_loss": -39.66911697387695, "global_step": 236258, "epoch": 1952} {"train_loss": -38.14472961425781, "global_step": 236259, "epoch": 1952} {"train_loss": -41.93508529663086, "global_step": 236260, "epoch": 1952} {"train_loss": -39.52186965942383, "global_step": 236261, "epoch": 1952} {"train_loss": -40.65133285522461, "global_step": 236262, "epoch": 1952} {"train_loss": -40.50593185424805, "global_step": 236263, "epoch": 1952} {"train_loss": -40.03606033325195, "global_step": 236264, "epoch": 1952} {"train_loss": -41.947906494140625, "global_step": 236265, "epoch": 1952} {"train_loss": -39.921688079833984, "global_step": 236266, "epoch": 1952} {"train_loss": -40.7603645324707, "global_step": 236267, "epoch": 1952} {"train_loss": -41.30416488647461, "global_step": 236268, "epoch": 1952} {"train_loss": -41.342403411865234, "global_step": 236269, "epoch": 1952} {"train_loss": -41.985992431640625, "global_step": 236270, "epoch": 1952} {"train_loss": -41.894771575927734, "global_step": 236271, "epoch": 1952} {"train_loss": -41.848388671875, "global_step": 236272, "epoch": 1952} {"train_loss": -41.74589920043945, "global_step": 236273, "epoch": 1952} {"train_loss": -41.960411071777344, "global_step": 236274, "epoch": 1952} {"train_loss": -42.45684814453125, "global_step": 236275, "epoch": 1952} {"train_loss": -42.181575775146484, "global_step": 236276, "epoch": 1952} {"train_loss": -42.737667083740234, "global_step": 236277, "epoch": 1952} {"train_loss": -42.46124267578125, "global_step": 236278, "epoch": 1952} {"train_loss": -42.56737518310547, "global_step": 236279, "epoch": 1952} {"train_loss": -42.1417121887207, "global_step": 236280, "epoch": 1952} {"train_loss": -42.24756622314453, "global_step": 236281, "epoch": 1952} {"train_loss": -42.682918548583984, "global_step": 236282, "epoch": 1952} {"train_loss": -41.722381591796875, "global_step": 236283, "epoch": 1952} {"train_loss": -42.456905364990234, "global_step": 236284, "epoch": 1952} {"train_loss": -40.9454460144043, "global_step": 236285, "epoch": 1952} {"train_loss": -42.563232421875, "global_step": 236286, "epoch": 1952} {"train_loss": -40.326168060302734, "global_step": 236287, "epoch": 1952} {"train_loss": -42.819068908691406, "global_step": 236288, "epoch": 1952} {"train_loss": -40.88509750366211, "global_step": 236289, "epoch": 1952} {"train_loss": -42.50416564941406, "global_step": 236290, "epoch": 1952} {"train_loss": -40.90729522705078, "global_step": 236291, "epoch": 1952} {"train_loss": -43.42676544189453, "global_step": 236292, "epoch": 1952} {"train_loss": -41.9483642578125, "global_step": 236293, "epoch": 1952} {"train_loss": -43.0806884765625, "global_step": 236294, "epoch": 1952} {"train_loss": -42.58588790893555, "global_step": 236295, "epoch": 1952} {"train_loss": -42.81256866455078, "global_step": 236296, "epoch": 1952} {"train_loss": -42.29502487182617, "global_step": 236297, "epoch": 1952} {"train_loss": -43.03863525390625, "global_step": 236298, "epoch": 1952} {"train_loss": -42.789894104003906, "global_step": 236299, "epoch": 1952} {"train_loss": -43.133487701416016, "global_step": 236300, "epoch": 1952} {"train_loss": -43.16365051269531, "global_step": 236301, "epoch": 1952} {"train_loss": -42.56997299194336, "global_step": 236302, "epoch": 1952} {"train_loss": -43.33846664428711, "global_step": 236303, "epoch": 1952} {"train_loss": -43.11174011230469, "global_step": 236304, "epoch": 1952} {"train_loss": -43.07952880859375, "global_step": 236305, "epoch": 1952} {"train_loss": -42.872013092041016, "global_step": 236306, "epoch": 1952} {"train_loss": -43.68323516845703, "global_step": 236307, "epoch": 1952} {"train_loss": -43.20290756225586, "global_step": 236308, "epoch": 1952} {"train_loss": -43.14900207519531, "global_step": 236309, "epoch": 1952} {"train_loss": -43.37868881225586, "global_step": 236310, "epoch": 1952} {"train_loss": -43.309661865234375, "global_step": 236311, "epoch": 1952} {"train_loss": -42.02799855381989, "global_step": 236312, "epoch": 1952, "val_loss": 2635180.25} {"train_loss": -42.59524154663086, "global_step": 236313, "epoch": 1953} {"train_loss": -43.526817321777344, "global_step": 236314, "epoch": 1953} {"train_loss": -42.208492279052734, "global_step": 236315, "epoch": 1953} {"train_loss": -41.852352142333984, "global_step": 236316, "epoch": 1953} {"train_loss": -41.80927276611328, "global_step": 236317, "epoch": 1953} {"train_loss": -41.62019729614258, "global_step": 236318, "epoch": 1953} {"train_loss": -41.93857955932617, "global_step": 236319, "epoch": 1953} {"train_loss": -42.85618209838867, "global_step": 236320, "epoch": 1953} {"train_loss": -43.32355880737305, "global_step": 236321, "epoch": 1953} {"train_loss": -42.75788116455078, "global_step": 236322, "epoch": 1953} {"train_loss": -42.951698303222656, "global_step": 236323, "epoch": 1953} {"train_loss": -42.7476921081543, "global_step": 236324, "epoch": 1953} {"train_loss": -43.129608154296875, "global_step": 236325, "epoch": 1953} {"train_loss": -42.91215133666992, "global_step": 236326, "epoch": 1953} {"train_loss": -42.6995964050293, "global_step": 236327, "epoch": 1953} {"train_loss": -42.830318450927734, "global_step": 236328, "epoch": 1953} {"train_loss": -42.431610107421875, "global_step": 236329, "epoch": 1953} {"train_loss": -41.91675567626953, "global_step": 236330, "epoch": 1953} {"train_loss": -43.21666717529297, "global_step": 236331, "epoch": 1953} {"train_loss": -42.76884841918945, "global_step": 236332, "epoch": 1953} {"train_loss": -41.009334564208984, "global_step": 236333, "epoch": 1953} {"train_loss": -42.585933685302734, "global_step": 236334, "epoch": 1953} {"train_loss": -43.21430587768555, "global_step": 236335, "epoch": 1953} {"train_loss": -41.64073181152344, "global_step": 236336, "epoch": 1953} {"train_loss": -41.98636245727539, "global_step": 236337, "epoch": 1953} {"train_loss": -43.18839645385742, "global_step": 236338, "epoch": 1953} {"train_loss": -41.84566116333008, "global_step": 236339, "epoch": 1953} {"train_loss": -39.85345458984375, "global_step": 236340, "epoch": 1953} {"train_loss": -41.84304428100586, "global_step": 236341, "epoch": 1953} {"train_loss": -42.4513053894043, "global_step": 236342, "epoch": 1953} {"train_loss": -42.012245178222656, "global_step": 236343, "epoch": 1953} {"train_loss": -42.37104415893555, "global_step": 236344, "epoch": 1953} {"train_loss": -41.277191162109375, "global_step": 236345, "epoch": 1953} {"train_loss": -40.00105285644531, "global_step": 236346, "epoch": 1953} {"train_loss": -42.84939193725586, "global_step": 236347, "epoch": 1953} {"train_loss": -41.08454132080078, "global_step": 236348, "epoch": 1953} {"train_loss": -41.702392578125, "global_step": 236349, "epoch": 1953} {"train_loss": -43.19301223754883, "global_step": 236350, "epoch": 1953} {"train_loss": -42.65140914916992, "global_step": 236351, "epoch": 1953} {"train_loss": -42.61362838745117, "global_step": 236352, "epoch": 1953} {"train_loss": -43.64875030517578, "global_step": 236353, "epoch": 1953} {"train_loss": -42.637489318847656, "global_step": 236354, "epoch": 1953} {"train_loss": -41.78517532348633, "global_step": 236355, "epoch": 1953} {"train_loss": -43.32428741455078, "global_step": 236356, "epoch": 1953} {"train_loss": -43.58583450317383, "global_step": 236357, "epoch": 1953} {"train_loss": -42.82304763793945, "global_step": 236358, "epoch": 1953} {"train_loss": -43.07624435424805, "global_step": 236359, "epoch": 1953} {"train_loss": -43.330928802490234, "global_step": 236360, "epoch": 1953} {"train_loss": -42.79410934448242, "global_step": 236361, "epoch": 1953} {"train_loss": -42.7482795715332, "global_step": 236362, "epoch": 1953} {"train_loss": -42.91415023803711, "global_step": 236363, "epoch": 1953} {"train_loss": -42.86426544189453, "global_step": 236364, "epoch": 1953} {"train_loss": -43.13962936401367, "global_step": 236365, "epoch": 1953} {"train_loss": -43.51616287231445, "global_step": 236366, "epoch": 1953} {"train_loss": -42.39309310913086, "global_step": 236367, "epoch": 1953} {"train_loss": -43.510860443115234, "global_step": 236368, "epoch": 1953} {"train_loss": -43.09626770019531, "global_step": 236369, "epoch": 1953} {"train_loss": -43.12548828125, "global_step": 236370, "epoch": 1953} {"train_loss": -43.319637298583984, "global_step": 236371, "epoch": 1953} {"train_loss": -43.06646728515625, "global_step": 236372, "epoch": 1953} {"train_loss": -43.073543548583984, "global_step": 236373, "epoch": 1953} {"train_loss": -43.37655258178711, "global_step": 236374, "epoch": 1953} {"train_loss": -43.16396713256836, "global_step": 236375, "epoch": 1953} {"train_loss": -43.727718353271484, "global_step": 236376, "epoch": 1953} {"train_loss": -43.975284576416016, "global_step": 236377, "epoch": 1953} {"train_loss": -43.06760787963867, "global_step": 236378, "epoch": 1953} {"train_loss": -43.49348068237305, "global_step": 236379, "epoch": 1953} {"train_loss": -43.474945068359375, "global_step": 236380, "epoch": 1953} {"train_loss": -42.917823791503906, "global_step": 236381, "epoch": 1953} {"train_loss": -43.40303421020508, "global_step": 236382, "epoch": 1953} {"train_loss": -42.73530197143555, "global_step": 236383, "epoch": 1953} {"train_loss": -42.193641662597656, "global_step": 236384, "epoch": 1953} {"train_loss": -43.77589416503906, "global_step": 236385, "epoch": 1953} {"train_loss": -41.37485885620117, "global_step": 236386, "epoch": 1953} {"train_loss": -43.379676818847656, "global_step": 236387, "epoch": 1953} {"train_loss": -41.48927688598633, "global_step": 236388, "epoch": 1953} {"train_loss": -41.823421478271484, "global_step": 236389, "epoch": 1953} {"train_loss": -41.724857330322266, "global_step": 236390, "epoch": 1953} {"train_loss": -40.71757507324219, "global_step": 236391, "epoch": 1953} {"train_loss": -42.1577262878418, "global_step": 236392, "epoch": 1953} {"train_loss": -42.06208038330078, "global_step": 236393, "epoch": 1953} {"train_loss": -41.30427932739258, "global_step": 236394, "epoch": 1953} {"train_loss": -40.91368865966797, "global_step": 236395, "epoch": 1953} {"train_loss": -38.96236801147461, "global_step": 236396, "epoch": 1953} {"train_loss": -42.577877044677734, "global_step": 236397, "epoch": 1953} {"train_loss": -42.09004211425781, "global_step": 236398, "epoch": 1953} {"train_loss": -42.32902145385742, "global_step": 236399, "epoch": 1953} {"train_loss": -42.82593536376953, "global_step": 236400, "epoch": 1953} {"train_loss": -42.408775329589844, "global_step": 236401, "epoch": 1953} {"train_loss": -42.281986236572266, "global_step": 236402, "epoch": 1953} {"train_loss": -42.55403137207031, "global_step": 236403, "epoch": 1953} {"train_loss": -42.90351486206055, "global_step": 236404, "epoch": 1953} {"train_loss": -42.73159408569336, "global_step": 236405, "epoch": 1953} {"train_loss": -42.73072052001953, "global_step": 236406, "epoch": 1953} {"train_loss": -42.58351516723633, "global_step": 236407, "epoch": 1953} {"train_loss": -43.197322845458984, "global_step": 236408, "epoch": 1953} {"train_loss": -42.24622344970703, "global_step": 236409, "epoch": 1953} {"train_loss": -42.55373764038086, "global_step": 236410, "epoch": 1953} {"train_loss": -42.830787658691406, "global_step": 236411, "epoch": 1953} {"train_loss": -42.38111114501953, "global_step": 236412, "epoch": 1953} {"train_loss": -42.73295211791992, "global_step": 236413, "epoch": 1953} {"train_loss": -42.42698669433594, "global_step": 236414, "epoch": 1953} {"train_loss": -42.94104766845703, "global_step": 236415, "epoch": 1953} {"train_loss": -41.44462203979492, "global_step": 236416, "epoch": 1953} {"train_loss": -41.19989776611328, "global_step": 236417, "epoch": 1953} {"train_loss": -41.89509963989258, "global_step": 236418, "epoch": 1953} {"train_loss": -41.6391487121582, "global_step": 236419, "epoch": 1953} {"train_loss": -42.000892639160156, "global_step": 236420, "epoch": 1953} {"train_loss": -42.637752532958984, "global_step": 236421, "epoch": 1953} {"train_loss": -42.55869674682617, "global_step": 236422, "epoch": 1953} {"train_loss": -41.48997497558594, "global_step": 236423, "epoch": 1953} {"train_loss": -41.8674430847168, "global_step": 236424, "epoch": 1953} {"train_loss": -42.763771057128906, "global_step": 236425, "epoch": 1953} {"train_loss": -41.16717529296875, "global_step": 236426, "epoch": 1953} {"train_loss": -40.57448959350586, "global_step": 236427, "epoch": 1953} {"train_loss": -42.39565658569336, "global_step": 236428, "epoch": 1953} {"train_loss": -42.067100524902344, "global_step": 236429, "epoch": 1953} {"train_loss": -40.8773307800293, "global_step": 236430, "epoch": 1953} {"train_loss": -42.849124908447266, "global_step": 236431, "epoch": 1953} {"train_loss": -42.37407684326172, "global_step": 236432, "epoch": 1953} {"train_loss": -42.41337352153683, "global_step": 236433, "epoch": 1953, "val_loss": 2710855.0} {"train_loss": -42.20791244506836, "global_step": 236434, "epoch": 1954} {"train_loss": -41.935997009277344, "global_step": 236435, "epoch": 1954} {"train_loss": -41.956451416015625, "global_step": 236436, "epoch": 1954} {"train_loss": -42.847511291503906, "global_step": 236437, "epoch": 1954} {"train_loss": -40.7203369140625, "global_step": 236438, "epoch": 1954} {"train_loss": -42.053192138671875, "global_step": 236439, "epoch": 1954} {"train_loss": -42.393463134765625, "global_step": 236440, "epoch": 1954} {"train_loss": -41.17267608642578, "global_step": 236441, "epoch": 1954} {"train_loss": -43.04106521606445, "global_step": 236442, "epoch": 1954} {"train_loss": -41.56282424926758, "global_step": 236443, "epoch": 1954} {"train_loss": -43.1278190612793, "global_step": 236444, "epoch": 1954} {"train_loss": -41.77585983276367, "global_step": 236445, "epoch": 1954} {"train_loss": -41.86524963378906, "global_step": 236446, "epoch": 1954} {"train_loss": -42.04676055908203, "global_step": 236447, "epoch": 1954} {"train_loss": -41.8524284362793, "global_step": 236448, "epoch": 1954} {"train_loss": -42.842952728271484, "global_step": 236449, "epoch": 1954} {"train_loss": -42.813106536865234, "global_step": 236450, "epoch": 1954} {"train_loss": -41.024024963378906, "global_step": 236451, "epoch": 1954} {"train_loss": -41.78776931762695, "global_step": 236452, "epoch": 1954} {"train_loss": -42.13067626953125, "global_step": 236453, "epoch": 1954} {"train_loss": -42.667701721191406, "global_step": 236454, "epoch": 1954} {"train_loss": -43.034725189208984, "global_step": 236455, "epoch": 1954} {"train_loss": -42.962459564208984, "global_step": 236456, "epoch": 1954} {"train_loss": -42.2420768737793, "global_step": 236457, "epoch": 1954} {"train_loss": -43.18251037597656, "global_step": 236458, "epoch": 1954} {"train_loss": -41.01076889038086, "global_step": 236459, "epoch": 1954} {"train_loss": -42.20322799682617, "global_step": 236460, "epoch": 1954} {"train_loss": -43.257930755615234, "global_step": 236461, "epoch": 1954} {"train_loss": -42.24058151245117, "global_step": 236462, "epoch": 1954} {"train_loss": -42.0308837890625, "global_step": 236463, "epoch": 1954} {"train_loss": -42.50812911987305, "global_step": 236464, "epoch": 1954} {"train_loss": -42.92983627319336, "global_step": 236465, "epoch": 1954} {"train_loss": -42.70463180541992, "global_step": 236466, "epoch": 1954} {"train_loss": -42.380409240722656, "global_step": 236467, "epoch": 1954} {"train_loss": -42.5948600769043, "global_step": 236468, "epoch": 1954} {"train_loss": -42.66645812988281, "global_step": 236469, "epoch": 1954} {"train_loss": -43.24772262573242, "global_step": 236470, "epoch": 1954} {"train_loss": -42.32058334350586, "global_step": 236471, "epoch": 1954} {"train_loss": -42.819862365722656, "global_step": 236472, "epoch": 1954} {"train_loss": -42.44013977050781, "global_step": 236473, "epoch": 1954} {"train_loss": -42.839229583740234, "global_step": 236474, "epoch": 1954} {"train_loss": -42.37333297729492, "global_step": 236475, "epoch": 1954} {"train_loss": -42.82501220703125, "global_step": 236476, "epoch": 1954} {"train_loss": -42.54945755004883, "global_step": 236477, "epoch": 1954} {"train_loss": -43.37500762939453, "global_step": 236478, "epoch": 1954} {"train_loss": -42.42269515991211, "global_step": 236479, "epoch": 1954} {"train_loss": -43.497291564941406, "global_step": 236480, "epoch": 1954} {"train_loss": -43.008113861083984, "global_step": 236481, "epoch": 1954} {"train_loss": -42.356719970703125, "global_step": 236482, "epoch": 1954} {"train_loss": -42.86140441894531, "global_step": 236483, "epoch": 1954} {"train_loss": -43.0296630859375, "global_step": 236484, "epoch": 1954} {"train_loss": -41.84291458129883, "global_step": 236485, "epoch": 1954} {"train_loss": -42.87083053588867, "global_step": 236486, "epoch": 1954} {"train_loss": -42.529850006103516, "global_step": 236487, "epoch": 1954} {"train_loss": -42.288570404052734, "global_step": 236488, "epoch": 1954} {"train_loss": -42.58424758911133, "global_step": 236489, "epoch": 1954} {"train_loss": -43.336639404296875, "global_step": 236490, "epoch": 1954} {"train_loss": -42.399192810058594, "global_step": 236491, "epoch": 1954} {"train_loss": -43.11477279663086, "global_step": 236492, "epoch": 1954} {"train_loss": -43.31925582885742, "global_step": 236493, "epoch": 1954} {"train_loss": -42.24860382080078, "global_step": 236494, "epoch": 1954} {"train_loss": -42.844749450683594, "global_step": 236495, "epoch": 1954} {"train_loss": -42.1548957824707, "global_step": 236496, "epoch": 1954} {"train_loss": -43.23112106323242, "global_step": 236497, "epoch": 1954} {"train_loss": -42.47539520263672, "global_step": 236498, "epoch": 1954} {"train_loss": -43.4697380065918, "global_step": 236499, "epoch": 1954} {"train_loss": -43.73154830932617, "global_step": 236500, "epoch": 1954} {"train_loss": -43.731353759765625, "global_step": 236501, "epoch": 1954} {"train_loss": -43.45587158203125, "global_step": 236502, "epoch": 1954} {"train_loss": -43.56132507324219, "global_step": 236503, "epoch": 1954} {"train_loss": -43.28911590576172, "global_step": 236504, "epoch": 1954} {"train_loss": -43.31124496459961, "global_step": 236505, "epoch": 1954} {"train_loss": -43.43703842163086, "global_step": 236506, "epoch": 1954} {"train_loss": -43.40201950073242, "global_step": 236507, "epoch": 1954} {"train_loss": -43.888118743896484, "global_step": 236508, "epoch": 1954} {"train_loss": -43.795013427734375, "global_step": 236509, "epoch": 1954} {"train_loss": -43.80641174316406, "global_step": 236510, "epoch": 1954} {"train_loss": -43.64763641357422, "global_step": 236511, "epoch": 1954} {"train_loss": -43.31257247924805, "global_step": 236512, "epoch": 1954} {"train_loss": -43.73308181762695, "global_step": 236513, "epoch": 1954} {"train_loss": -43.73765563964844, "global_step": 236514, "epoch": 1954} {"train_loss": -43.7092399597168, "global_step": 236515, "epoch": 1954} {"train_loss": -44.086055755615234, "global_step": 236516, "epoch": 1954} {"train_loss": -43.2630615234375, "global_step": 236517, "epoch": 1954} {"train_loss": -43.75753402709961, "global_step": 236518, "epoch": 1954} {"train_loss": -43.76283645629883, "global_step": 236519, "epoch": 1954} {"train_loss": -42.916622161865234, "global_step": 236520, "epoch": 1954} {"train_loss": -43.27141189575195, "global_step": 236521, "epoch": 1954} {"train_loss": -44.03375244140625, "global_step": 236522, "epoch": 1954} {"train_loss": -43.68603515625, "global_step": 236523, "epoch": 1954} {"train_loss": -43.653770446777344, "global_step": 236524, "epoch": 1954} {"train_loss": -43.231971740722656, "global_step": 236525, "epoch": 1954} {"train_loss": -44.00124740600586, "global_step": 236526, "epoch": 1954} {"train_loss": -44.090538024902344, "global_step": 236527, "epoch": 1954} {"train_loss": -44.08403396606445, "global_step": 236528, "epoch": 1954} {"train_loss": -43.79343795776367, "global_step": 236529, "epoch": 1954} {"train_loss": -44.0640869140625, "global_step": 236530, "epoch": 1954} {"train_loss": -43.42765426635742, "global_step": 236531, "epoch": 1954} {"train_loss": -44.01716995239258, "global_step": 236532, "epoch": 1954} {"train_loss": -43.6938362121582, "global_step": 236533, "epoch": 1954} {"train_loss": -43.55039596557617, "global_step": 236534, "epoch": 1954} {"train_loss": -42.9140739440918, "global_step": 236535, "epoch": 1954} {"train_loss": -41.03446578979492, "global_step": 236536, "epoch": 1954} {"train_loss": -41.8288459777832, "global_step": 236537, "epoch": 1954} {"train_loss": -43.862518310546875, "global_step": 236538, "epoch": 1954} {"train_loss": -41.46687316894531, "global_step": 236539, "epoch": 1954} {"train_loss": -40.202999114990234, "global_step": 236540, "epoch": 1954} {"train_loss": -41.446224212646484, "global_step": 236541, "epoch": 1954} {"train_loss": -43.29955291748047, "global_step": 236542, "epoch": 1954} {"train_loss": -39.973052978515625, "global_step": 236543, "epoch": 1954} {"train_loss": -39.516300201416016, "global_step": 236544, "epoch": 1954} {"train_loss": -41.76441192626953, "global_step": 236545, "epoch": 1954} {"train_loss": -42.75093078613281, "global_step": 236546, "epoch": 1954} {"train_loss": -41.178279876708984, "global_step": 236547, "epoch": 1954} {"train_loss": -41.05881881713867, "global_step": 236548, "epoch": 1954} {"train_loss": -41.596046447753906, "global_step": 236549, "epoch": 1954} {"train_loss": -40.115020751953125, "global_step": 236550, "epoch": 1954} {"train_loss": -41.15209197998047, "global_step": 236551, "epoch": 1954} {"train_loss": -41.299312591552734, "global_step": 236552, "epoch": 1954} {"train_loss": -38.58912658691406, "global_step": 236553, "epoch": 1954} {"train_loss": -42.64343867026085, "global_step": 236554, "epoch": 1954, "val_loss": 2594341.25} {"train_loss": -39.782958984375, "global_step": 236555, "epoch": 1955} {"train_loss": -39.74930953979492, "global_step": 236556, "epoch": 1955} {"train_loss": -42.503173828125, "global_step": 236557, "epoch": 1955} {"train_loss": -40.49381637573242, "global_step": 236558, "epoch": 1955} {"train_loss": -40.850765228271484, "global_step": 236559, "epoch": 1955} {"train_loss": -40.990074157714844, "global_step": 236560, "epoch": 1955} {"train_loss": -42.15303039550781, "global_step": 236561, "epoch": 1955} {"train_loss": -42.65443420410156, "global_step": 236562, "epoch": 1955} {"train_loss": -42.06460189819336, "global_step": 236563, "epoch": 1955} {"train_loss": -42.81688690185547, "global_step": 236564, "epoch": 1955} {"train_loss": -42.38881301879883, "global_step": 236565, "epoch": 1955} {"train_loss": -41.72043991088867, "global_step": 236566, "epoch": 1955} {"train_loss": -42.96916580200195, "global_step": 236567, "epoch": 1955} {"train_loss": -42.96759796142578, "global_step": 236568, "epoch": 1955} {"train_loss": -42.92232131958008, "global_step": 236569, "epoch": 1955} {"train_loss": -42.77972412109375, "global_step": 236570, "epoch": 1955} {"train_loss": -42.15890121459961, "global_step": 236571, "epoch": 1955} {"train_loss": -42.76859664916992, "global_step": 236572, "epoch": 1955} {"train_loss": -42.23660659790039, "global_step": 236573, "epoch": 1955} {"train_loss": -41.82746124267578, "global_step": 236574, "epoch": 1955} {"train_loss": -42.68643569946289, "global_step": 236575, "epoch": 1955} {"train_loss": -43.049930572509766, "global_step": 236576, "epoch": 1955} {"train_loss": -42.57651901245117, "global_step": 236577, "epoch": 1955} {"train_loss": -42.35536575317383, "global_step": 236578, "epoch": 1955} {"train_loss": -43.007659912109375, "global_step": 236579, "epoch": 1955} {"train_loss": -43.85519790649414, "global_step": 236580, "epoch": 1955} {"train_loss": -42.7823600769043, "global_step": 236581, "epoch": 1955} {"train_loss": -42.73236846923828, "global_step": 236582, "epoch": 1955} {"train_loss": -42.80290603637695, "global_step": 236583, "epoch": 1955} {"train_loss": -42.25095748901367, "global_step": 236584, "epoch": 1955} {"train_loss": -42.333465576171875, "global_step": 236585, "epoch": 1955} {"train_loss": -42.415767669677734, "global_step": 236586, "epoch": 1955} {"train_loss": -41.501338958740234, "global_step": 236587, "epoch": 1955} {"train_loss": -43.13827133178711, "global_step": 236588, "epoch": 1955} {"train_loss": -42.724021911621094, "global_step": 236589, "epoch": 1955} {"train_loss": -42.94063949584961, "global_step": 236590, "epoch": 1955} {"train_loss": -42.35846710205078, "global_step": 236591, "epoch": 1955} {"train_loss": -42.23265075683594, "global_step": 236592, "epoch": 1955} {"train_loss": -43.35371780395508, "global_step": 236593, "epoch": 1955} {"train_loss": -42.81022262573242, "global_step": 236594, "epoch": 1955} {"train_loss": -42.065433502197266, "global_step": 236595, "epoch": 1955} {"train_loss": -41.85991668701172, "global_step": 236596, "epoch": 1955} {"train_loss": -43.45551681518555, "global_step": 236597, "epoch": 1955} {"train_loss": -43.034847259521484, "global_step": 236598, "epoch": 1955} {"train_loss": -42.58628845214844, "global_step": 236599, "epoch": 1955} {"train_loss": -43.27901840209961, "global_step": 236600, "epoch": 1955} {"train_loss": -42.53667068481445, "global_step": 236601, "epoch": 1955} {"train_loss": -40.16577911376953, "global_step": 236602, "epoch": 1955} {"train_loss": -41.02400588989258, "global_step": 236603, "epoch": 1955} {"train_loss": -43.10243225097656, "global_step": 236604, "epoch": 1955} {"train_loss": -41.6775016784668, "global_step": 236605, "epoch": 1955} {"train_loss": -41.88617706298828, "global_step": 236606, "epoch": 1955} {"train_loss": -42.15049743652344, "global_step": 236607, "epoch": 1955} {"train_loss": -42.96998977661133, "global_step": 236608, "epoch": 1955} {"train_loss": -43.015830993652344, "global_step": 236609, "epoch": 1955} {"train_loss": -42.10325241088867, "global_step": 236610, "epoch": 1955} {"train_loss": -42.230289459228516, "global_step": 236611, "epoch": 1955} {"train_loss": -43.02191162109375, "global_step": 236612, "epoch": 1955} {"train_loss": -41.72779083251953, "global_step": 236613, "epoch": 1955} {"train_loss": -41.6210823059082, "global_step": 236614, "epoch": 1955} {"train_loss": -42.865455627441406, "global_step": 236615, "epoch": 1955} {"train_loss": -42.04667282104492, "global_step": 236616, "epoch": 1955} {"train_loss": -42.30139923095703, "global_step": 236617, "epoch": 1955} {"train_loss": -43.01692581176758, "global_step": 236618, "epoch": 1955} {"train_loss": -42.28755187988281, "global_step": 236619, "epoch": 1955} {"train_loss": -42.917545318603516, "global_step": 236620, "epoch": 1955} {"train_loss": -43.00580596923828, "global_step": 236621, "epoch": 1955} {"train_loss": -42.745662689208984, "global_step": 236622, "epoch": 1955} {"train_loss": -42.57314682006836, "global_step": 236623, "epoch": 1955} {"train_loss": -42.67938232421875, "global_step": 236624, "epoch": 1955} {"train_loss": -42.42606735229492, "global_step": 236625, "epoch": 1955} {"train_loss": -42.20522689819336, "global_step": 236626, "epoch": 1955} {"train_loss": -43.048011779785156, "global_step": 236627, "epoch": 1955} {"train_loss": -42.73031234741211, "global_step": 236628, "epoch": 1955} {"train_loss": -43.074440002441406, "global_step": 236629, "epoch": 1955} {"train_loss": -42.31364059448242, "global_step": 236630, "epoch": 1955} {"train_loss": -43.02398681640625, "global_step": 236631, "epoch": 1955} {"train_loss": -42.74070358276367, "global_step": 236632, "epoch": 1955} {"train_loss": -42.38099670410156, "global_step": 236633, "epoch": 1955} {"train_loss": -42.504905700683594, "global_step": 236634, "epoch": 1955} {"train_loss": -42.730831146240234, "global_step": 236635, "epoch": 1955} {"train_loss": -43.88873291015625, "global_step": 236636, "epoch": 1955} {"train_loss": -42.53538131713867, "global_step": 236637, "epoch": 1955} {"train_loss": -43.08420944213867, "global_step": 236638, "epoch": 1955} {"train_loss": -43.14840316772461, "global_step": 236639, "epoch": 1955} {"train_loss": -42.86641311645508, "global_step": 236640, "epoch": 1955} {"train_loss": -43.17800521850586, "global_step": 236641, "epoch": 1955} {"train_loss": -42.73258590698242, "global_step": 236642, "epoch": 1955} {"train_loss": -43.18732452392578, "global_step": 236643, "epoch": 1955} {"train_loss": -42.808265686035156, "global_step": 236644, "epoch": 1955} {"train_loss": -43.19175338745117, "global_step": 236645, "epoch": 1955} {"train_loss": -43.431087493896484, "global_step": 236646, "epoch": 1955} {"train_loss": -43.454715728759766, "global_step": 236647, "epoch": 1955} {"train_loss": -43.34077072143555, "global_step": 236648, "epoch": 1955} {"train_loss": -42.72726058959961, "global_step": 236649, "epoch": 1955} {"train_loss": -42.88654708862305, "global_step": 236650, "epoch": 1955} {"train_loss": -43.395416259765625, "global_step": 236651, "epoch": 1955} {"train_loss": -43.7584342956543, "global_step": 236652, "epoch": 1955} {"train_loss": -43.49636459350586, "global_step": 236653, "epoch": 1955} {"train_loss": -43.7903938293457, "global_step": 236654, "epoch": 1955} {"train_loss": -43.69182205200195, "global_step": 236655, "epoch": 1955} {"train_loss": -43.820743560791016, "global_step": 236656, "epoch": 1955} {"train_loss": -43.89534378051758, "global_step": 236657, "epoch": 1955} {"train_loss": -43.798828125, "global_step": 236658, "epoch": 1955} {"train_loss": -43.83689498901367, "global_step": 236659, "epoch": 1955} {"train_loss": -43.931190490722656, "global_step": 236660, "epoch": 1955} {"train_loss": -43.96199035644531, "global_step": 236661, "epoch": 1955} {"train_loss": -43.83533477783203, "global_step": 236662, "epoch": 1955} {"train_loss": -44.08973693847656, "global_step": 236663, "epoch": 1955} {"train_loss": -43.91376876831055, "global_step": 236664, "epoch": 1955} {"train_loss": -43.52299880981445, "global_step": 236665, "epoch": 1955} {"train_loss": -43.17938232421875, "global_step": 236666, "epoch": 1955} {"train_loss": -43.669002532958984, "global_step": 236667, "epoch": 1955} {"train_loss": -43.47306442260742, "global_step": 236668, "epoch": 1955} {"train_loss": -43.641273498535156, "global_step": 236669, "epoch": 1955} {"train_loss": -43.60776901245117, "global_step": 236670, "epoch": 1955} {"train_loss": -43.797489166259766, "global_step": 236671, "epoch": 1955} {"train_loss": -43.23183822631836, "global_step": 236672, "epoch": 1955} {"train_loss": -42.26483917236328, "global_step": 236673, "epoch": 1955} {"train_loss": -43.033241271972656, "global_step": 236674, "epoch": 1955} {"train_loss": -42.72370942170955, "global_step": 236675, "epoch": 1955, "val_loss": 2642022.25} {"train_loss": -41.413818359375, "global_step": 236676, "epoch": 1956} {"train_loss": -42.04597091674805, "global_step": 236677, "epoch": 1956} {"train_loss": -41.51780319213867, "global_step": 236678, "epoch": 1956} {"train_loss": -42.261390686035156, "global_step": 236679, "epoch": 1956} {"train_loss": -42.6335563659668, "global_step": 236680, "epoch": 1956} {"train_loss": -41.96799850463867, "global_step": 236681, "epoch": 1956} {"train_loss": -40.42742156982422, "global_step": 236682, "epoch": 1956} {"train_loss": -42.39632797241211, "global_step": 236683, "epoch": 1956} {"train_loss": -42.229801177978516, "global_step": 236684, "epoch": 1956} {"train_loss": -41.70228958129883, "global_step": 236685, "epoch": 1956} {"train_loss": -41.188880920410156, "global_step": 236686, "epoch": 1956} {"train_loss": -41.87779235839844, "global_step": 236687, "epoch": 1956} {"train_loss": -42.24681854248047, "global_step": 236688, "epoch": 1956} {"train_loss": -39.08808898925781, "global_step": 236689, "epoch": 1956} {"train_loss": -39.60295486450195, "global_step": 236690, "epoch": 1956} {"train_loss": -42.74321746826172, "global_step": 236691, "epoch": 1956} {"train_loss": -41.79487991333008, "global_step": 236692, "epoch": 1956} {"train_loss": -41.616912841796875, "global_step": 236693, "epoch": 1956} {"train_loss": -42.34421157836914, "global_step": 236694, "epoch": 1956} {"train_loss": -41.27504348754883, "global_step": 236695, "epoch": 1956} {"train_loss": -41.686981201171875, "global_step": 236696, "epoch": 1956} {"train_loss": -42.67632293701172, "global_step": 236697, "epoch": 1956} {"train_loss": -40.92369079589844, "global_step": 236698, "epoch": 1956} {"train_loss": -41.46843338012695, "global_step": 236699, "epoch": 1956} {"train_loss": -42.41428756713867, "global_step": 236700, "epoch": 1956} {"train_loss": -40.71909713745117, "global_step": 236701, "epoch": 1956} {"train_loss": -42.8461799621582, "global_step": 236702, "epoch": 1956} {"train_loss": -42.32241439819336, "global_step": 236703, "epoch": 1956} {"train_loss": -41.846370697021484, "global_step": 236704, "epoch": 1956} {"train_loss": -42.84437561035156, "global_step": 236705, "epoch": 1956} {"train_loss": -42.21699142456055, "global_step": 236706, "epoch": 1956} {"train_loss": -42.46735382080078, "global_step": 236707, "epoch": 1956} {"train_loss": -42.77724075317383, "global_step": 236708, "epoch": 1956} {"train_loss": -41.664608001708984, "global_step": 236709, "epoch": 1956} {"train_loss": -42.446632385253906, "global_step": 236710, "epoch": 1956} {"train_loss": -42.78214645385742, "global_step": 236711, "epoch": 1956} {"train_loss": -41.67586135864258, "global_step": 236712, "epoch": 1956} {"train_loss": -43.01779556274414, "global_step": 236713, "epoch": 1956} {"train_loss": -41.974578857421875, "global_step": 236714, "epoch": 1956} {"train_loss": -42.794586181640625, "global_step": 236715, "epoch": 1956} {"train_loss": -41.99579620361328, "global_step": 236716, "epoch": 1956} {"train_loss": -42.166542053222656, "global_step": 236717, "epoch": 1956} {"train_loss": -42.74150848388672, "global_step": 236718, "epoch": 1956} {"train_loss": -42.18278503417969, "global_step": 236719, "epoch": 1956} {"train_loss": -41.68462371826172, "global_step": 236720, "epoch": 1956} {"train_loss": -43.54085922241211, "global_step": 236721, "epoch": 1956} {"train_loss": -41.72860336303711, "global_step": 236722, "epoch": 1956} {"train_loss": -43.01240158081055, "global_step": 236723, "epoch": 1956} {"train_loss": -42.417049407958984, "global_step": 236724, "epoch": 1956} {"train_loss": -43.2605094909668, "global_step": 236725, "epoch": 1956} {"train_loss": -43.038185119628906, "global_step": 236726, "epoch": 1956} {"train_loss": -42.42189407348633, "global_step": 236727, "epoch": 1956} {"train_loss": -43.160858154296875, "global_step": 236728, "epoch": 1956} {"train_loss": -43.08845901489258, "global_step": 236729, "epoch": 1956} {"train_loss": -43.452728271484375, "global_step": 236730, "epoch": 1956} {"train_loss": -42.94669723510742, "global_step": 236731, "epoch": 1956} {"train_loss": -43.09709167480469, "global_step": 236732, "epoch": 1956} {"train_loss": -43.10238265991211, "global_step": 236733, "epoch": 1956} {"train_loss": -42.637271881103516, "global_step": 236734, "epoch": 1956} {"train_loss": -43.69721603393555, "global_step": 236735, "epoch": 1956} {"train_loss": -42.241573333740234, "global_step": 236736, "epoch": 1956} {"train_loss": -43.62299728393555, "global_step": 236737, "epoch": 1956} {"train_loss": -43.435760498046875, "global_step": 236738, "epoch": 1956} {"train_loss": -42.4364128112793, "global_step": 236739, "epoch": 1956} {"train_loss": -43.47435760498047, "global_step": 236740, "epoch": 1956} {"train_loss": -43.41360092163086, "global_step": 236741, "epoch": 1956} {"train_loss": -43.037471771240234, "global_step": 236742, "epoch": 1956} {"train_loss": -42.91813278198242, "global_step": 236743, "epoch": 1956} {"train_loss": -43.5533447265625, "global_step": 236744, "epoch": 1956} {"train_loss": -43.549373626708984, "global_step": 236745, "epoch": 1956} {"train_loss": -43.505714416503906, "global_step": 236746, "epoch": 1956} {"train_loss": -42.82391357421875, "global_step": 236747, "epoch": 1956} {"train_loss": -43.70595169067383, "global_step": 236748, "epoch": 1956} {"train_loss": -43.498016357421875, "global_step": 236749, "epoch": 1956} {"train_loss": -43.10983657836914, "global_step": 236750, "epoch": 1956} {"train_loss": -43.401790618896484, "global_step": 236751, "epoch": 1956} {"train_loss": -43.88926315307617, "global_step": 236752, "epoch": 1956} {"train_loss": -43.87822341918945, "global_step": 236753, "epoch": 1956} {"train_loss": -43.116615295410156, "global_step": 236754, "epoch": 1956} {"train_loss": -42.85563659667969, "global_step": 236755, "epoch": 1956} {"train_loss": -40.9552116394043, "global_step": 236756, "epoch": 1956} {"train_loss": -41.97675704956055, "global_step": 236757, "epoch": 1956} {"train_loss": -42.68860626220703, "global_step": 236758, "epoch": 1956} {"train_loss": -43.502708435058594, "global_step": 236759, "epoch": 1956} {"train_loss": -43.386966705322266, "global_step": 236760, "epoch": 1956} {"train_loss": -40.922271728515625, "global_step": 236761, "epoch": 1956} {"train_loss": -40.43782424926758, "global_step": 236762, "epoch": 1956} {"train_loss": -42.18019104003906, "global_step": 236763, "epoch": 1956} {"train_loss": -42.41545486450195, "global_step": 236764, "epoch": 1956} {"train_loss": -43.533058166503906, "global_step": 236765, "epoch": 1956} {"train_loss": -42.43679428100586, "global_step": 236766, "epoch": 1956} {"train_loss": -42.15621566772461, "global_step": 236767, "epoch": 1956} {"train_loss": -43.24309158325195, "global_step": 236768, "epoch": 1956} {"train_loss": -42.978912353515625, "global_step": 236769, "epoch": 1956} {"train_loss": -43.57554244995117, "global_step": 236770, "epoch": 1956} {"train_loss": -42.338111877441406, "global_step": 236771, "epoch": 1956} {"train_loss": -43.10480880737305, "global_step": 236772, "epoch": 1956} {"train_loss": -42.66009521484375, "global_step": 236773, "epoch": 1956} {"train_loss": -43.36623001098633, "global_step": 236774, "epoch": 1956} {"train_loss": -42.665130615234375, "global_step": 236775, "epoch": 1956} {"train_loss": -42.818172454833984, "global_step": 236776, "epoch": 1956} {"train_loss": -43.28883743286133, "global_step": 236777, "epoch": 1956} {"train_loss": -42.44538497924805, "global_step": 236778, "epoch": 1956} {"train_loss": -42.969635009765625, "global_step": 236779, "epoch": 1956} {"train_loss": -43.625301361083984, "global_step": 236780, "epoch": 1956} {"train_loss": -42.81376266479492, "global_step": 236781, "epoch": 1956} {"train_loss": -42.210628509521484, "global_step": 236782, "epoch": 1956} {"train_loss": -42.47031784057617, "global_step": 236783, "epoch": 1956} {"train_loss": -43.10920333862305, "global_step": 236784, "epoch": 1956} {"train_loss": -43.644161224365234, "global_step": 236785, "epoch": 1956} {"train_loss": -42.12385559082031, "global_step": 236786, "epoch": 1956} {"train_loss": -41.6488037109375, "global_step": 236787, "epoch": 1956} {"train_loss": -42.54319381713867, "global_step": 236788, "epoch": 1956} {"train_loss": -41.999149322509766, "global_step": 236789, "epoch": 1956} {"train_loss": -43.24197006225586, "global_step": 236790, "epoch": 1956} {"train_loss": -43.185455322265625, "global_step": 236791, "epoch": 1956} {"train_loss": -41.9090576171875, "global_step": 236792, "epoch": 1956} {"train_loss": -42.76261520385742, "global_step": 236793, "epoch": 1956} {"train_loss": -43.3975830078125, "global_step": 236794, "epoch": 1956} {"train_loss": -42.46027374267578, "global_step": 236795, "epoch": 1956} {"train_loss": -42.52182473427008, "global_step": 236796, "epoch": 1956, "val_loss": 2700575.75} {"train_loss": -42.891197204589844, "global_step": 236797, "epoch": 1957} {"train_loss": -41.724239349365234, "global_step": 236798, "epoch": 1957} {"train_loss": -42.10244369506836, "global_step": 236799, "epoch": 1957} {"train_loss": -42.90019607543945, "global_step": 236800, "epoch": 1957} {"train_loss": -41.69320297241211, "global_step": 236801, "epoch": 1957} {"train_loss": -41.763702392578125, "global_step": 236802, "epoch": 1957} {"train_loss": -43.316158294677734, "global_step": 236803, "epoch": 1957} {"train_loss": -42.67737579345703, "global_step": 236804, "epoch": 1957} {"train_loss": -41.22190475463867, "global_step": 236805, "epoch": 1957} {"train_loss": -40.85756301879883, "global_step": 236806, "epoch": 1957} {"train_loss": -41.049964904785156, "global_step": 236807, "epoch": 1957} {"train_loss": -42.199954986572266, "global_step": 236808, "epoch": 1957} {"train_loss": -42.50269317626953, "global_step": 236809, "epoch": 1957} {"train_loss": -41.553348541259766, "global_step": 236810, "epoch": 1957} {"train_loss": -39.99030685424805, "global_step": 236811, "epoch": 1957} {"train_loss": -42.76286315917969, "global_step": 236812, "epoch": 1957} {"train_loss": -41.08924102783203, "global_step": 236813, "epoch": 1957} {"train_loss": -41.890625, "global_step": 236814, "epoch": 1957} {"train_loss": -41.73167037963867, "global_step": 236815, "epoch": 1957} {"train_loss": -42.205299377441406, "global_step": 236816, "epoch": 1957} {"train_loss": -41.728492736816406, "global_step": 236817, "epoch": 1957} {"train_loss": -42.7426872253418, "global_step": 236818, "epoch": 1957} {"train_loss": -41.64342498779297, "global_step": 236819, "epoch": 1957} {"train_loss": -41.561744689941406, "global_step": 236820, "epoch": 1957} {"train_loss": -41.09674835205078, "global_step": 236821, "epoch": 1957} {"train_loss": -41.90363693237305, "global_step": 236822, "epoch": 1957} {"train_loss": -41.52997589111328, "global_step": 236823, "epoch": 1957} {"train_loss": -42.810123443603516, "global_step": 236824, "epoch": 1957} {"train_loss": -41.41926956176758, "global_step": 236825, "epoch": 1957} {"train_loss": -43.03862762451172, "global_step": 236826, "epoch": 1957} {"train_loss": -41.1556510925293, "global_step": 236827, "epoch": 1957} {"train_loss": -41.866127014160156, "global_step": 236828, "epoch": 1957} {"train_loss": -42.64421463012695, "global_step": 236829, "epoch": 1957} {"train_loss": -42.84391403198242, "global_step": 236830, "epoch": 1957} {"train_loss": -41.13710021972656, "global_step": 236831, "epoch": 1957} {"train_loss": -42.77732467651367, "global_step": 236832, "epoch": 1957} {"train_loss": -41.926937103271484, "global_step": 236833, "epoch": 1957} {"train_loss": -41.5968132019043, "global_step": 236834, "epoch": 1957} {"train_loss": -41.754634857177734, "global_step": 236835, "epoch": 1957} {"train_loss": -40.625728607177734, "global_step": 236836, "epoch": 1957} {"train_loss": -41.44630813598633, "global_step": 236837, "epoch": 1957} {"train_loss": -42.42774963378906, "global_step": 236838, "epoch": 1957} {"train_loss": -42.121585845947266, "global_step": 236839, "epoch": 1957} {"train_loss": -42.298583984375, "global_step": 236840, "epoch": 1957} {"train_loss": -42.376426696777344, "global_step": 236841, "epoch": 1957} {"train_loss": -42.05506134033203, "global_step": 236842, "epoch": 1957} {"train_loss": -41.867462158203125, "global_step": 236843, "epoch": 1957} {"train_loss": -42.28371810913086, "global_step": 236844, "epoch": 1957} {"train_loss": -43.27640151977539, "global_step": 236845, "epoch": 1957} {"train_loss": -42.72199249267578, "global_step": 236846, "epoch": 1957} {"train_loss": -42.908267974853516, "global_step": 236847, "epoch": 1957} {"train_loss": -42.70292282104492, "global_step": 236848, "epoch": 1957} {"train_loss": -42.75240707397461, "global_step": 236849, "epoch": 1957} {"train_loss": -42.020286560058594, "global_step": 236850, "epoch": 1957} {"train_loss": -43.27753829956055, "global_step": 236851, "epoch": 1957} {"train_loss": -43.16523361206055, "global_step": 236852, "epoch": 1957} {"train_loss": -43.42097091674805, "global_step": 236853, "epoch": 1957} {"train_loss": -43.432220458984375, "global_step": 236854, "epoch": 1957} {"train_loss": -42.96200180053711, "global_step": 236855, "epoch": 1957} {"train_loss": -43.27772903442383, "global_step": 236856, "epoch": 1957} {"train_loss": -43.20408248901367, "global_step": 236857, "epoch": 1957} {"train_loss": -43.553924560546875, "global_step": 236858, "epoch": 1957} {"train_loss": -43.23853302001953, "global_step": 236859, "epoch": 1957} {"train_loss": -42.380126953125, "global_step": 236860, "epoch": 1957} {"train_loss": -43.47121810913086, "global_step": 236861, "epoch": 1957} {"train_loss": -42.50685501098633, "global_step": 236862, "epoch": 1957} {"train_loss": -43.61481475830078, "global_step": 236863, "epoch": 1957} {"train_loss": -43.614776611328125, "global_step": 236864, "epoch": 1957} {"train_loss": -42.698951721191406, "global_step": 236865, "epoch": 1957} {"train_loss": -41.72578048706055, "global_step": 236866, "epoch": 1957} {"train_loss": -42.16975402832031, "global_step": 236867, "epoch": 1957} {"train_loss": -43.10542678833008, "global_step": 236868, "epoch": 1957} {"train_loss": -42.793697357177734, "global_step": 236869, "epoch": 1957} {"train_loss": -41.293216705322266, "global_step": 236870, "epoch": 1957} {"train_loss": -41.32914352416992, "global_step": 236871, "epoch": 1957} {"train_loss": -42.962642669677734, "global_step": 236872, "epoch": 1957} {"train_loss": -43.594093322753906, "global_step": 236873, "epoch": 1957} {"train_loss": -43.923797607421875, "global_step": 236874, "epoch": 1957} {"train_loss": -42.66603469848633, "global_step": 236875, "epoch": 1957} {"train_loss": -42.62544631958008, "global_step": 236876, "epoch": 1957} {"train_loss": -43.74151611328125, "global_step": 236877, "epoch": 1957} {"train_loss": -43.08149337768555, "global_step": 236878, "epoch": 1957} {"train_loss": -42.64012145996094, "global_step": 236879, "epoch": 1957} {"train_loss": -42.026031494140625, "global_step": 236880, "epoch": 1957} {"train_loss": -43.15958786010742, "global_step": 236881, "epoch": 1957} {"train_loss": -43.289581298828125, "global_step": 236882, "epoch": 1957} {"train_loss": -43.26625442504883, "global_step": 236883, "epoch": 1957} {"train_loss": -42.03300094604492, "global_step": 236884, "epoch": 1957} {"train_loss": -42.51121139526367, "global_step": 236885, "epoch": 1957} {"train_loss": -43.49100875854492, "global_step": 236886, "epoch": 1957} {"train_loss": -41.52969741821289, "global_step": 236887, "epoch": 1957} {"train_loss": -40.88111114501953, "global_step": 236888, "epoch": 1957} {"train_loss": -43.23911666870117, "global_step": 236889, "epoch": 1957} {"train_loss": -42.85269546508789, "global_step": 236890, "epoch": 1957} {"train_loss": -42.89136505126953, "global_step": 236891, "epoch": 1957} {"train_loss": -43.66194534301758, "global_step": 236892, "epoch": 1957} {"train_loss": -42.04173278808594, "global_step": 236893, "epoch": 1957} {"train_loss": -42.70167922973633, "global_step": 236894, "epoch": 1957} {"train_loss": -43.721839904785156, "global_step": 236895, "epoch": 1957} {"train_loss": -42.25735092163086, "global_step": 236896, "epoch": 1957} {"train_loss": -42.44974899291992, "global_step": 236897, "epoch": 1957} {"train_loss": -43.36507034301758, "global_step": 236898, "epoch": 1957} {"train_loss": -42.96734619140625, "global_step": 236899, "epoch": 1957} {"train_loss": -43.95109939575195, "global_step": 236900, "epoch": 1957} {"train_loss": -42.98275375366211, "global_step": 236901, "epoch": 1957} {"train_loss": -43.46438217163086, "global_step": 236902, "epoch": 1957} {"train_loss": -43.695430755615234, "global_step": 236903, "epoch": 1957} {"train_loss": -42.71158981323242, "global_step": 236904, "epoch": 1957} {"train_loss": -43.67497634887695, "global_step": 236905, "epoch": 1957} {"train_loss": -43.164337158203125, "global_step": 236906, "epoch": 1957} {"train_loss": -43.5251579284668, "global_step": 236907, "epoch": 1957} {"train_loss": -43.54671859741211, "global_step": 236908, "epoch": 1957} {"train_loss": -43.167564392089844, "global_step": 236909, "epoch": 1957} {"train_loss": -43.81597900390625, "global_step": 236910, "epoch": 1957} {"train_loss": -43.18325424194336, "global_step": 236911, "epoch": 1957} {"train_loss": -42.60298538208008, "global_step": 236912, "epoch": 1957} {"train_loss": -43.16070556640625, "global_step": 236913, "epoch": 1957} {"train_loss": -42.859344482421875, "global_step": 236914, "epoch": 1957} {"train_loss": -43.73337173461914, "global_step": 236915, "epoch": 1957} {"train_loss": -42.64418411254883, "global_step": 236916, "epoch": 1957} {"train_loss": -42.54353877926661, "global_step": 236917, "epoch": 1957, "val_loss": 2612429.25} {"train_loss": -44.11333084106445, "global_step": 236918, "epoch": 1958} {"train_loss": -43.316551208496094, "global_step": 236919, "epoch": 1958} {"train_loss": -43.693904876708984, "global_step": 236920, "epoch": 1958} {"train_loss": -42.69150924682617, "global_step": 236921, "epoch": 1958} {"train_loss": -43.541526794433594, "global_step": 236922, "epoch": 1958} {"train_loss": -42.73119354248047, "global_step": 236923, "epoch": 1958} {"train_loss": -43.50724411010742, "global_step": 236924, "epoch": 1958} {"train_loss": -43.52016067504883, "global_step": 236925, "epoch": 1958} {"train_loss": -43.19899368286133, "global_step": 236926, "epoch": 1958} {"train_loss": -42.08365249633789, "global_step": 236927, "epoch": 1958} {"train_loss": -42.224891662597656, "global_step": 236928, "epoch": 1958} {"train_loss": -43.300899505615234, "global_step": 236929, "epoch": 1958} {"train_loss": -43.672950744628906, "global_step": 236930, "epoch": 1958} {"train_loss": -43.29533004760742, "global_step": 236931, "epoch": 1958} {"train_loss": -43.46030044555664, "global_step": 236932, "epoch": 1958} {"train_loss": -43.1735954284668, "global_step": 236933, "epoch": 1958} {"train_loss": -43.59589385986328, "global_step": 236934, "epoch": 1958} {"train_loss": -43.99367904663086, "global_step": 236935, "epoch": 1958} {"train_loss": -43.122314453125, "global_step": 236936, "epoch": 1958} {"train_loss": -43.11890411376953, "global_step": 236937, "epoch": 1958} {"train_loss": -41.300445556640625, "global_step": 236938, "epoch": 1958} {"train_loss": -39.81509017944336, "global_step": 236939, "epoch": 1958} {"train_loss": -42.834442138671875, "global_step": 236940, "epoch": 1958} {"train_loss": -42.85920333862305, "global_step": 236941, "epoch": 1958} {"train_loss": -41.55123519897461, "global_step": 236942, "epoch": 1958} {"train_loss": -37.4094352722168, "global_step": 236943, "epoch": 1958} {"train_loss": -43.11515426635742, "global_step": 236944, "epoch": 1958} {"train_loss": -35.2706298828125, "global_step": 236945, "epoch": 1958} {"train_loss": -25.34208106994629, "global_step": 236946, "epoch": 1958} {"train_loss": -38.5156364440918, "global_step": 236947, "epoch": 1958} {"train_loss": -41.5186767578125, "global_step": 236948, "epoch": 1958} {"train_loss": -37.25208282470703, "global_step": 236949, "epoch": 1958} {"train_loss": -40.91811752319336, "global_step": 236950, "epoch": 1958} {"train_loss": -40.113563537597656, "global_step": 236951, "epoch": 1958} {"train_loss": -37.92558288574219, "global_step": 236952, "epoch": 1958} {"train_loss": -40.49323654174805, "global_step": 236953, "epoch": 1958} {"train_loss": -41.36175537109375, "global_step": 236954, "epoch": 1958} {"train_loss": -40.74055862426758, "global_step": 236955, "epoch": 1958} {"train_loss": -40.584774017333984, "global_step": 236956, "epoch": 1958} {"train_loss": -40.708213806152344, "global_step": 236957, "epoch": 1958} {"train_loss": -41.425437927246094, "global_step": 236958, "epoch": 1958} {"train_loss": -41.87110900878906, "global_step": 236959, "epoch": 1958} {"train_loss": -41.57527542114258, "global_step": 236960, "epoch": 1958} {"train_loss": -40.975563049316406, "global_step": 236961, "epoch": 1958} {"train_loss": -41.22040557861328, "global_step": 236962, "epoch": 1958} {"train_loss": -41.637672424316406, "global_step": 236963, "epoch": 1958} {"train_loss": -42.5472526550293, "global_step": 236964, "epoch": 1958} {"train_loss": -42.384124755859375, "global_step": 236965, "epoch": 1958} {"train_loss": -42.459259033203125, "global_step": 236966, "epoch": 1958} {"train_loss": -42.0370979309082, "global_step": 236967, "epoch": 1958} {"train_loss": -42.904815673828125, "global_step": 236968, "epoch": 1958} {"train_loss": -41.70158767700195, "global_step": 236969, "epoch": 1958} {"train_loss": -42.16524887084961, "global_step": 236970, "epoch": 1958} {"train_loss": -42.45863723754883, "global_step": 236971, "epoch": 1958} {"train_loss": -41.90853500366211, "global_step": 236972, "epoch": 1958} {"train_loss": -42.79229736328125, "global_step": 236973, "epoch": 1958} {"train_loss": -42.53154373168945, "global_step": 236974, "epoch": 1958} {"train_loss": -42.518611907958984, "global_step": 236975, "epoch": 1958} {"train_loss": -42.277565002441406, "global_step": 236976, "epoch": 1958} {"train_loss": -42.86959457397461, "global_step": 236977, "epoch": 1958} {"train_loss": -41.91074752807617, "global_step": 236978, "epoch": 1958} {"train_loss": -42.80271530151367, "global_step": 236979, "epoch": 1958} {"train_loss": -43.28184509277344, "global_step": 236980, "epoch": 1958} {"train_loss": -43.1114387512207, "global_step": 236981, "epoch": 1958} {"train_loss": -42.8048210144043, "global_step": 236982, "epoch": 1958} {"train_loss": -42.94326400756836, "global_step": 236983, "epoch": 1958} {"train_loss": -43.47389221191406, "global_step": 236984, "epoch": 1958} {"train_loss": -43.38979721069336, "global_step": 236985, "epoch": 1958} {"train_loss": -43.400428771972656, "global_step": 236986, "epoch": 1958} {"train_loss": -43.33173370361328, "global_step": 236987, "epoch": 1958} {"train_loss": -43.2750244140625, "global_step": 236988, "epoch": 1958} {"train_loss": -43.5341796875, "global_step": 236989, "epoch": 1958} {"train_loss": -43.67726135253906, "global_step": 236990, "epoch": 1958} {"train_loss": -43.65583038330078, "global_step": 236991, "epoch": 1958} {"train_loss": -43.648921966552734, "global_step": 236992, "epoch": 1958} {"train_loss": -43.58572006225586, "global_step": 236993, "epoch": 1958} {"train_loss": -43.638458251953125, "global_step": 236994, "epoch": 1958} {"train_loss": -43.585784912109375, "global_step": 236995, "epoch": 1958} {"train_loss": -43.9516716003418, "global_step": 236996, "epoch": 1958} {"train_loss": -43.16501235961914, "global_step": 236997, "epoch": 1958} {"train_loss": -43.096736907958984, "global_step": 236998, "epoch": 1958} {"train_loss": -43.76925277709961, "global_step": 236999, "epoch": 1958} {"train_loss": -43.557918548583984, "global_step": 237000, "epoch": 1958} {"train_loss": -43.69123458862305, "global_step": 237001, "epoch": 1958} {"train_loss": -43.62054443359375, "global_step": 237002, "epoch": 1958} {"train_loss": -43.33352279663086, "global_step": 237003, "epoch": 1958} {"train_loss": -44.137054443359375, "global_step": 237004, "epoch": 1958} {"train_loss": -43.946990966796875, "global_step": 237005, "epoch": 1958} {"train_loss": -43.524532318115234, "global_step": 237006, "epoch": 1958} {"train_loss": -43.425289154052734, "global_step": 237007, "epoch": 1958} {"train_loss": -43.68036651611328, "global_step": 237008, "epoch": 1958} {"train_loss": -43.77919387817383, "global_step": 237009, "epoch": 1958} {"train_loss": -43.93357467651367, "global_step": 237010, "epoch": 1958} {"train_loss": -43.51107406616211, "global_step": 237011, "epoch": 1958} {"train_loss": -43.39564895629883, "global_step": 237012, "epoch": 1958} {"train_loss": -43.886383056640625, "global_step": 237013, "epoch": 1958} {"train_loss": -43.61477279663086, "global_step": 237014, "epoch": 1958} {"train_loss": -43.440757751464844, "global_step": 237015, "epoch": 1958} {"train_loss": -43.74037551879883, "global_step": 237016, "epoch": 1958} {"train_loss": -44.22943115234375, "global_step": 237017, "epoch": 1958} {"train_loss": -43.99483871459961, "global_step": 237018, "epoch": 1958} {"train_loss": -44.3121223449707, "global_step": 237019, "epoch": 1958} {"train_loss": -42.72092819213867, "global_step": 237020, "epoch": 1958} {"train_loss": -42.743446350097656, "global_step": 237021, "epoch": 1958} {"train_loss": -43.72391891479492, "global_step": 237022, "epoch": 1958} {"train_loss": -44.070255279541016, "global_step": 237023, "epoch": 1958} {"train_loss": -42.53375244140625, "global_step": 237024, "epoch": 1958} {"train_loss": -43.12000274658203, "global_step": 237025, "epoch": 1958} {"train_loss": -43.06856155395508, "global_step": 237026, "epoch": 1958} {"train_loss": -41.35065841674805, "global_step": 237027, "epoch": 1958} {"train_loss": -40.84173583984375, "global_step": 237028, "epoch": 1958} {"train_loss": -41.96684646606445, "global_step": 237029, "epoch": 1958} {"train_loss": -42.512664794921875, "global_step": 237030, "epoch": 1958} {"train_loss": -41.936866760253906, "global_step": 237031, "epoch": 1958} {"train_loss": -42.19566345214844, "global_step": 237032, "epoch": 1958} {"train_loss": -42.589988708496094, "global_step": 237033, "epoch": 1958} {"train_loss": -42.494972229003906, "global_step": 237034, "epoch": 1958} {"train_loss": -40.380062103271484, "global_step": 237035, "epoch": 1958} {"train_loss": -43.01036071777344, "global_step": 237036, "epoch": 1958} {"train_loss": -42.18927764892578, "global_step": 237037, "epoch": 1958} {"train_loss": -42.39995122546992, "global_step": 237038, "epoch": 1958, "val_loss": 2635333.0} {"train_loss": -43.20670700073242, "global_step": 237039, "epoch": 1959} {"train_loss": -42.9050178527832, "global_step": 237040, "epoch": 1959} {"train_loss": -42.06959915161133, "global_step": 237041, "epoch": 1959} {"train_loss": -43.368080139160156, "global_step": 237042, "epoch": 1959} {"train_loss": -41.090545654296875, "global_step": 237043, "epoch": 1959} {"train_loss": -42.88019561767578, "global_step": 237044, "epoch": 1959} {"train_loss": -40.81295394897461, "global_step": 237045, "epoch": 1959} {"train_loss": -42.20595169067383, "global_step": 237046, "epoch": 1959} {"train_loss": -41.507080078125, "global_step": 237047, "epoch": 1959} {"train_loss": -40.95652770996094, "global_step": 237048, "epoch": 1959} {"train_loss": -42.209503173828125, "global_step": 237049, "epoch": 1959} {"train_loss": -40.41841506958008, "global_step": 237050, "epoch": 1959} {"train_loss": -41.33686447143555, "global_step": 237051, "epoch": 1959} {"train_loss": -41.53778076171875, "global_step": 237052, "epoch": 1959} {"train_loss": -38.17873764038086, "global_step": 237053, "epoch": 1959} {"train_loss": -41.42760467529297, "global_step": 237054, "epoch": 1959} {"train_loss": -40.96666717529297, "global_step": 237055, "epoch": 1959} {"train_loss": -42.075130462646484, "global_step": 237056, "epoch": 1959} {"train_loss": -41.86737823486328, "global_step": 237057, "epoch": 1959} {"train_loss": -35.91032028198242, "global_step": 237058, "epoch": 1959} {"train_loss": -41.09847640991211, "global_step": 237059, "epoch": 1959} {"train_loss": -38.69575119018555, "global_step": 237060, "epoch": 1959} {"train_loss": -39.467185974121094, "global_step": 237061, "epoch": 1959} {"train_loss": -41.60310745239258, "global_step": 237062, "epoch": 1959} {"train_loss": -26.075336456298828, "global_step": 237063, "epoch": 1959} {"train_loss": -37.77523422241211, "global_step": 237064, "epoch": 1959} {"train_loss": -31.2056884765625, "global_step": 237065, "epoch": 1959} {"train_loss": -38.85912322998047, "global_step": 237066, "epoch": 1959} {"train_loss": -37.450775146484375, "global_step": 237067, "epoch": 1959} {"train_loss": -33.80384063720703, "global_step": 237068, "epoch": 1959} {"train_loss": -36.23533248901367, "global_step": 237069, "epoch": 1959} {"train_loss": -37.723609924316406, "global_step": 237070, "epoch": 1959} {"train_loss": -38.95378112792969, "global_step": 237071, "epoch": 1959} {"train_loss": -38.90480422973633, "global_step": 237072, "epoch": 1959} {"train_loss": -34.1119499206543, "global_step": 237073, "epoch": 1959} {"train_loss": -38.28192138671875, "global_step": 237074, "epoch": 1959} {"train_loss": -35.3985710144043, "global_step": 237075, "epoch": 1959} {"train_loss": -38.25930404663086, "global_step": 237076, "epoch": 1959} {"train_loss": -38.400047302246094, "global_step": 237077, "epoch": 1959} {"train_loss": -38.596797943115234, "global_step": 237078, "epoch": 1959} {"train_loss": -38.31366729736328, "global_step": 237079, "epoch": 1959} {"train_loss": -38.40522384643555, "global_step": 237080, "epoch": 1959} {"train_loss": -37.6707649230957, "global_step": 237081, "epoch": 1959} {"train_loss": -37.5283317565918, "global_step": 237082, "epoch": 1959} {"train_loss": -38.10171127319336, "global_step": 237083, "epoch": 1959} {"train_loss": -37.08119583129883, "global_step": 237084, "epoch": 1959} {"train_loss": -38.492164611816406, "global_step": 237085, "epoch": 1959} {"train_loss": -39.558013916015625, "global_step": 237086, "epoch": 1959} {"train_loss": -40.380760192871094, "global_step": 237087, "epoch": 1959} {"train_loss": -39.72206497192383, "global_step": 237088, "epoch": 1959} {"train_loss": -40.529762268066406, "global_step": 237089, "epoch": 1959} {"train_loss": -38.79655075073242, "global_step": 237090, "epoch": 1959} {"train_loss": -39.70368576049805, "global_step": 237091, "epoch": 1959} {"train_loss": -40.007179260253906, "global_step": 237092, "epoch": 1959} {"train_loss": -37.30574417114258, "global_step": 237093, "epoch": 1959} {"train_loss": -40.20750045776367, "global_step": 237094, "epoch": 1959} {"train_loss": -40.15100860595703, "global_step": 237095, "epoch": 1959} {"train_loss": -40.139827728271484, "global_step": 237096, "epoch": 1959} {"train_loss": -40.524044036865234, "global_step": 237097, "epoch": 1959} {"train_loss": -40.38348388671875, "global_step": 237098, "epoch": 1959} {"train_loss": -40.35603713989258, "global_step": 237099, "epoch": 1959} {"train_loss": -40.94866180419922, "global_step": 237100, "epoch": 1959} {"train_loss": -39.81877136230469, "global_step": 237101, "epoch": 1959} {"train_loss": -40.37856674194336, "global_step": 237102, "epoch": 1959} {"train_loss": -40.80733108520508, "global_step": 237103, "epoch": 1959} {"train_loss": -40.327632904052734, "global_step": 237104, "epoch": 1959} {"train_loss": -41.69429397583008, "global_step": 237105, "epoch": 1959} {"train_loss": -40.826629638671875, "global_step": 237106, "epoch": 1959} {"train_loss": -41.302669525146484, "global_step": 237107, "epoch": 1959} {"train_loss": -41.37499237060547, "global_step": 237108, "epoch": 1959} {"train_loss": -41.81680679321289, "global_step": 237109, "epoch": 1959} {"train_loss": -41.51710510253906, "global_step": 237110, "epoch": 1959} {"train_loss": -41.42820358276367, "global_step": 237111, "epoch": 1959} {"train_loss": -41.567134857177734, "global_step": 237112, "epoch": 1959} {"train_loss": -41.84468460083008, "global_step": 237113, "epoch": 1959} {"train_loss": -40.67966842651367, "global_step": 237114, "epoch": 1959} {"train_loss": -41.471771240234375, "global_step": 237115, "epoch": 1959} {"train_loss": -41.46721649169922, "global_step": 237116, "epoch": 1959} {"train_loss": -41.241817474365234, "global_step": 237117, "epoch": 1959} {"train_loss": -41.74039840698242, "global_step": 237118, "epoch": 1959} {"train_loss": -41.792049407958984, "global_step": 237119, "epoch": 1959} {"train_loss": -41.60441970825195, "global_step": 237120, "epoch": 1959} {"train_loss": -42.32252502441406, "global_step": 237121, "epoch": 1959} {"train_loss": -41.94763946533203, "global_step": 237122, "epoch": 1959} {"train_loss": -41.541072845458984, "global_step": 237123, "epoch": 1959} {"train_loss": -42.30892562866211, "global_step": 237124, "epoch": 1959} {"train_loss": -41.71371078491211, "global_step": 237125, "epoch": 1959} {"train_loss": -42.51909255981445, "global_step": 237126, "epoch": 1959} {"train_loss": -41.522010803222656, "global_step": 237127, "epoch": 1959} {"train_loss": -41.68697738647461, "global_step": 237128, "epoch": 1959} {"train_loss": -42.614200592041016, "global_step": 237129, "epoch": 1959} {"train_loss": -41.72774887084961, "global_step": 237130, "epoch": 1959} {"train_loss": -42.4976692199707, "global_step": 237131, "epoch": 1959} {"train_loss": -42.44219970703125, "global_step": 237132, "epoch": 1959} {"train_loss": -42.530330657958984, "global_step": 237133, "epoch": 1959} {"train_loss": -43.137367248535156, "global_step": 237134, "epoch": 1959} {"train_loss": -42.5114860534668, "global_step": 237135, "epoch": 1959} {"train_loss": -42.79419708251953, "global_step": 237136, "epoch": 1959} {"train_loss": -42.62512969970703, "global_step": 237137, "epoch": 1959} {"train_loss": -42.55781936645508, "global_step": 237138, "epoch": 1959} {"train_loss": -42.85205841064453, "global_step": 237139, "epoch": 1959} {"train_loss": -42.38497543334961, "global_step": 237140, "epoch": 1959} {"train_loss": -43.01998519897461, "global_step": 237141, "epoch": 1959} {"train_loss": -42.96399688720703, "global_step": 237142, "epoch": 1959} {"train_loss": -42.88823699951172, "global_step": 237143, "epoch": 1959} {"train_loss": -43.27781295776367, "global_step": 237144, "epoch": 1959} {"train_loss": -43.12441635131836, "global_step": 237145, "epoch": 1959} {"train_loss": -43.236183166503906, "global_step": 237146, "epoch": 1959} {"train_loss": -42.66598129272461, "global_step": 237147, "epoch": 1959} {"train_loss": -42.205928802490234, "global_step": 237148, "epoch": 1959} {"train_loss": -43.432735443115234, "global_step": 237149, "epoch": 1959} {"train_loss": -43.02640914916992, "global_step": 237150, "epoch": 1959} {"train_loss": -42.7216911315918, "global_step": 237151, "epoch": 1959} {"train_loss": -42.323970794677734, "global_step": 237152, "epoch": 1959} {"train_loss": -42.48845291137695, "global_step": 237153, "epoch": 1959} {"train_loss": -43.176734924316406, "global_step": 237154, "epoch": 1959} {"train_loss": -42.860382080078125, "global_step": 237155, "epoch": 1959} {"train_loss": -42.67130661010742, "global_step": 237156, "epoch": 1959} {"train_loss": -42.24812316894531, "global_step": 237157, "epoch": 1959} {"train_loss": -43.04268264770508, "global_step": 237158, "epoch": 1959} {"train_loss": -40.637787653394966, "global_step": 237159, "epoch": 1959, "val_loss": 2714136.75} {"train_loss": -43.087890625, "global_step": 237160, "epoch": 1960} {"train_loss": -43.37534713745117, "global_step": 237161, "epoch": 1960} {"train_loss": -41.810054779052734, "global_step": 237162, "epoch": 1960} {"train_loss": -43.335426330566406, "global_step": 237163, "epoch": 1960} {"train_loss": -44.00366973876953, "global_step": 237164, "epoch": 1960} {"train_loss": -42.674800872802734, "global_step": 237165, "epoch": 1960} {"train_loss": -43.08018112182617, "global_step": 237166, "epoch": 1960} {"train_loss": -42.985511779785156, "global_step": 237167, "epoch": 1960} {"train_loss": -41.28443908691406, "global_step": 237168, "epoch": 1960} {"train_loss": -37.83479690551758, "global_step": 237169, "epoch": 1960} {"train_loss": -37.07123947143555, "global_step": 237170, "epoch": 1960} {"train_loss": -39.749847412109375, "global_step": 237171, "epoch": 1960} {"train_loss": -38.39156723022461, "global_step": 237172, "epoch": 1960} {"train_loss": -39.09481430053711, "global_step": 237173, "epoch": 1960} {"train_loss": -38.646148681640625, "global_step": 237174, "epoch": 1960} {"train_loss": -38.63969039916992, "global_step": 237175, "epoch": 1960} {"train_loss": -41.21117401123047, "global_step": 237176, "epoch": 1960} {"train_loss": -39.18803024291992, "global_step": 237177, "epoch": 1960} {"train_loss": -36.565040588378906, "global_step": 237178, "epoch": 1960} {"train_loss": -40.181617736816406, "global_step": 237179, "epoch": 1960} {"train_loss": -40.262413024902344, "global_step": 237180, "epoch": 1960} {"train_loss": -40.407630920410156, "global_step": 237181, "epoch": 1960} {"train_loss": -41.662166595458984, "global_step": 237182, "epoch": 1960} {"train_loss": -42.072181701660156, "global_step": 237183, "epoch": 1960} {"train_loss": -41.23999786376953, "global_step": 237184, "epoch": 1960} {"train_loss": -40.79610824584961, "global_step": 237185, "epoch": 1960} {"train_loss": -39.831661224365234, "global_step": 237186, "epoch": 1960} {"train_loss": -41.782527923583984, "global_step": 237187, "epoch": 1960} {"train_loss": -42.28033447265625, "global_step": 237188, "epoch": 1960} {"train_loss": -41.946468353271484, "global_step": 237189, "epoch": 1960} {"train_loss": -41.986270904541016, "global_step": 237190, "epoch": 1960} {"train_loss": -42.4036750793457, "global_step": 237191, "epoch": 1960} {"train_loss": -41.175167083740234, "global_step": 237192, "epoch": 1960} {"train_loss": -42.19569778442383, "global_step": 237193, "epoch": 1960} {"train_loss": -42.87264633178711, "global_step": 237194, "epoch": 1960} {"train_loss": -41.26277160644531, "global_step": 237195, "epoch": 1960} {"train_loss": -42.765499114990234, "global_step": 237196, "epoch": 1960} {"train_loss": -41.33248519897461, "global_step": 237197, "epoch": 1960} {"train_loss": -41.71993637084961, "global_step": 237198, "epoch": 1960} {"train_loss": -41.85665512084961, "global_step": 237199, "epoch": 1960} {"train_loss": -40.441307067871094, "global_step": 237200, "epoch": 1960} {"train_loss": -41.4071159362793, "global_step": 237201, "epoch": 1960} {"train_loss": -42.638999938964844, "global_step": 237202, "epoch": 1960} {"train_loss": -42.45876693725586, "global_step": 237203, "epoch": 1960} {"train_loss": -42.69283676147461, "global_step": 237204, "epoch": 1960} {"train_loss": -42.47365951538086, "global_step": 237205, "epoch": 1960} {"train_loss": -41.31978988647461, "global_step": 237206, "epoch": 1960} {"train_loss": -42.0672721862793, "global_step": 237207, "epoch": 1960} {"train_loss": -40.0037956237793, "global_step": 237208, "epoch": 1960} {"train_loss": -41.57863998413086, "global_step": 237209, "epoch": 1960} {"train_loss": -41.402347564697266, "global_step": 237210, "epoch": 1960} {"train_loss": -41.151546478271484, "global_step": 237211, "epoch": 1960} {"train_loss": -41.79008102416992, "global_step": 237212, "epoch": 1960} {"train_loss": -42.18424606323242, "global_step": 237213, "epoch": 1960} {"train_loss": -40.398555755615234, "global_step": 237214, "epoch": 1960} {"train_loss": -41.25703811645508, "global_step": 237215, "epoch": 1960} {"train_loss": -32.1890983581543, "global_step": 237216, "epoch": 1960} {"train_loss": -42.538238525390625, "global_step": 237217, "epoch": 1960} {"train_loss": -41.84248733520508, "global_step": 237218, "epoch": 1960} {"train_loss": -34.28151321411133, "global_step": 237219, "epoch": 1960} {"train_loss": -38.99796676635742, "global_step": 237220, "epoch": 1960} {"train_loss": -39.5606803894043, "global_step": 237221, "epoch": 1960} {"train_loss": -41.45868682861328, "global_step": 237222, "epoch": 1960} {"train_loss": -41.30038070678711, "global_step": 237223, "epoch": 1960} {"train_loss": -36.352020263671875, "global_step": 237224, "epoch": 1960} {"train_loss": -32.44940948486328, "global_step": 237225, "epoch": 1960} {"train_loss": -38.8255500793457, "global_step": 237226, "epoch": 1960} {"train_loss": -40.50693893432617, "global_step": 237227, "epoch": 1960} {"train_loss": -39.48209762573242, "global_step": 237228, "epoch": 1960} {"train_loss": -39.39701461791992, "global_step": 237229, "epoch": 1960} {"train_loss": -40.30017852783203, "global_step": 237230, "epoch": 1960} {"train_loss": -39.88433837890625, "global_step": 237231, "epoch": 1960} {"train_loss": -39.87747573852539, "global_step": 237232, "epoch": 1960} {"train_loss": -37.2887077331543, "global_step": 237233, "epoch": 1960} {"train_loss": -41.31698226928711, "global_step": 237234, "epoch": 1960} {"train_loss": -42.44660949707031, "global_step": 237235, "epoch": 1960} {"train_loss": -40.29198455810547, "global_step": 237236, "epoch": 1960} {"train_loss": -41.23187255859375, "global_step": 237237, "epoch": 1960} {"train_loss": -41.45961380004883, "global_step": 237238, "epoch": 1960} {"train_loss": -39.30758285522461, "global_step": 237239, "epoch": 1960} {"train_loss": -41.32594299316406, "global_step": 237240, "epoch": 1960} {"train_loss": -42.4835090637207, "global_step": 237241, "epoch": 1960} {"train_loss": -41.992164611816406, "global_step": 237242, "epoch": 1960} {"train_loss": -41.497093200683594, "global_step": 237243, "epoch": 1960} {"train_loss": -41.1477165222168, "global_step": 237244, "epoch": 1960} {"train_loss": -42.1955680847168, "global_step": 237245, "epoch": 1960} {"train_loss": -41.142757415771484, "global_step": 237246, "epoch": 1960} {"train_loss": -42.46900939941406, "global_step": 237247, "epoch": 1960} {"train_loss": -41.53736114501953, "global_step": 237248, "epoch": 1960} {"train_loss": -42.66923904418945, "global_step": 237249, "epoch": 1960} {"train_loss": -42.3568000793457, "global_step": 237250, "epoch": 1960} {"train_loss": -42.45493698120117, "global_step": 237251, "epoch": 1960} {"train_loss": -40.94478988647461, "global_step": 237252, "epoch": 1960} {"train_loss": -38.102474212646484, "global_step": 237253, "epoch": 1960} {"train_loss": -42.67688751220703, "global_step": 237254, "epoch": 1960} {"train_loss": -41.994659423828125, "global_step": 237255, "epoch": 1960} {"train_loss": -42.01023483276367, "global_step": 237256, "epoch": 1960} {"train_loss": -42.27549362182617, "global_step": 237257, "epoch": 1960} {"train_loss": -41.62702178955078, "global_step": 237258, "epoch": 1960} {"train_loss": -41.436336517333984, "global_step": 237259, "epoch": 1960} {"train_loss": -42.20823287963867, "global_step": 237260, "epoch": 1960} {"train_loss": -38.74192428588867, "global_step": 237261, "epoch": 1960} {"train_loss": -42.3154296875, "global_step": 237262, "epoch": 1960} {"train_loss": -41.06842803955078, "global_step": 237263, "epoch": 1960} {"train_loss": -42.35007858276367, "global_step": 237264, "epoch": 1960} {"train_loss": -39.31134796142578, "global_step": 237265, "epoch": 1960} {"train_loss": -41.840179443359375, "global_step": 237266, "epoch": 1960} {"train_loss": -41.77389907836914, "global_step": 237267, "epoch": 1960} {"train_loss": -42.514339447021484, "global_step": 237268, "epoch": 1960} {"train_loss": -42.28831100463867, "global_step": 237269, "epoch": 1960} {"train_loss": -43.00333786010742, "global_step": 237270, "epoch": 1960} {"train_loss": -42.505855560302734, "global_step": 237271, "epoch": 1960} {"train_loss": -41.800228118896484, "global_step": 237272, "epoch": 1960} {"train_loss": -42.05970001220703, "global_step": 237273, "epoch": 1960} {"train_loss": -42.61540603637695, "global_step": 237274, "epoch": 1960} {"train_loss": -41.915199279785156, "global_step": 237275, "epoch": 1960} {"train_loss": -43.32705307006836, "global_step": 237276, "epoch": 1960} {"train_loss": -42.949581146240234, "global_step": 237277, "epoch": 1960} {"train_loss": -42.63627243041992, "global_step": 237278, "epoch": 1960} {"train_loss": -42.695343017578125, "global_step": 237279, "epoch": 1960} {"train_loss": -41.05278768618245, "global_step": 237280, "epoch": 1960, "val_loss": 2594773.25} {"train_loss": -42.92145538330078, "global_step": 237281, "epoch": 1961} {"train_loss": -43.0220947265625, "global_step": 237282, "epoch": 1961} {"train_loss": -42.376258850097656, "global_step": 237283, "epoch": 1961} {"train_loss": -42.569580078125, "global_step": 237284, "epoch": 1961} {"train_loss": -41.968048095703125, "global_step": 237285, "epoch": 1961} {"train_loss": -40.81512451171875, "global_step": 237286, "epoch": 1961} {"train_loss": -42.265228271484375, "global_step": 237287, "epoch": 1961} {"train_loss": -42.63066101074219, "global_step": 237288, "epoch": 1961} {"train_loss": -42.33587646484375, "global_step": 237289, "epoch": 1961} {"train_loss": -43.21165084838867, "global_step": 237290, "epoch": 1961} {"train_loss": -41.8203125, "global_step": 237291, "epoch": 1961} {"train_loss": -41.22589111328125, "global_step": 237292, "epoch": 1961} {"train_loss": -41.788753509521484, "global_step": 237293, "epoch": 1961} {"train_loss": -41.580909729003906, "global_step": 237294, "epoch": 1961} {"train_loss": -41.16312789916992, "global_step": 237295, "epoch": 1961} {"train_loss": -42.251590728759766, "global_step": 237296, "epoch": 1961} {"train_loss": -41.04780960083008, "global_step": 237297, "epoch": 1961} {"train_loss": -41.76726150512695, "global_step": 237298, "epoch": 1961} {"train_loss": -42.67506790161133, "global_step": 237299, "epoch": 1961} {"train_loss": -41.68885803222656, "global_step": 237300, "epoch": 1961} {"train_loss": -40.4699592590332, "global_step": 237301, "epoch": 1961} {"train_loss": -41.030155181884766, "global_step": 237302, "epoch": 1961} {"train_loss": -41.10128402709961, "global_step": 237303, "epoch": 1961} {"train_loss": -42.326080322265625, "global_step": 237304, "epoch": 1961} {"train_loss": -42.508636474609375, "global_step": 237305, "epoch": 1961} {"train_loss": -41.15904235839844, "global_step": 237306, "epoch": 1961} {"train_loss": -42.375423431396484, "global_step": 237307, "epoch": 1961} {"train_loss": -40.2015266418457, "global_step": 237308, "epoch": 1961} {"train_loss": -36.846038818359375, "global_step": 237309, "epoch": 1961} {"train_loss": -41.26784896850586, "global_step": 237310, "epoch": 1961} {"train_loss": -39.469154357910156, "global_step": 237311, "epoch": 1961} {"train_loss": -40.33797073364258, "global_step": 237312, "epoch": 1961} {"train_loss": -36.92070388793945, "global_step": 237313, "epoch": 1961} {"train_loss": -39.865753173828125, "global_step": 237314, "epoch": 1961} {"train_loss": -39.14448165893555, "global_step": 237315, "epoch": 1961} {"train_loss": -40.74924850463867, "global_step": 237316, "epoch": 1961} {"train_loss": -40.14884948730469, "global_step": 237317, "epoch": 1961} {"train_loss": -39.22410583496094, "global_step": 237318, "epoch": 1961} {"train_loss": -39.86397933959961, "global_step": 237319, "epoch": 1961} {"train_loss": -41.365028381347656, "global_step": 237320, "epoch": 1961} {"train_loss": -41.62009811401367, "global_step": 237321, "epoch": 1961} {"train_loss": -40.470088958740234, "global_step": 237322, "epoch": 1961} {"train_loss": -41.70939254760742, "global_step": 237323, "epoch": 1961} {"train_loss": -40.735782623291016, "global_step": 237324, "epoch": 1961} {"train_loss": -41.637542724609375, "global_step": 237325, "epoch": 1961} {"train_loss": -40.948150634765625, "global_step": 237326, "epoch": 1961} {"train_loss": -41.26066589355469, "global_step": 237327, "epoch": 1961} {"train_loss": -41.15073013305664, "global_step": 237328, "epoch": 1961} {"train_loss": -41.984840393066406, "global_step": 237329, "epoch": 1961} {"train_loss": -40.852394104003906, "global_step": 237330, "epoch": 1961} {"train_loss": -41.4567756652832, "global_step": 237331, "epoch": 1961} {"train_loss": -42.26316833496094, "global_step": 237332, "epoch": 1961} {"train_loss": -42.4232177734375, "global_step": 237333, "epoch": 1961} {"train_loss": -41.88460922241211, "global_step": 237334, "epoch": 1961} {"train_loss": -42.21888732910156, "global_step": 237335, "epoch": 1961} {"train_loss": -41.382972717285156, "global_step": 237336, "epoch": 1961} {"train_loss": -42.052181243896484, "global_step": 237337, "epoch": 1961} {"train_loss": -42.55574417114258, "global_step": 237338, "epoch": 1961} {"train_loss": -42.45951461791992, "global_step": 237339, "epoch": 1961} {"train_loss": -41.94282150268555, "global_step": 237340, "epoch": 1961} {"train_loss": -43.249427795410156, "global_step": 237341, "epoch": 1961} {"train_loss": -42.22488021850586, "global_step": 237342, "epoch": 1961} {"train_loss": -43.000221252441406, "global_step": 237343, "epoch": 1961} {"train_loss": -42.45366287231445, "global_step": 237344, "epoch": 1961} {"train_loss": -42.480140686035156, "global_step": 237345, "epoch": 1961} {"train_loss": -42.4865837097168, "global_step": 237346, "epoch": 1961} {"train_loss": -41.96964645385742, "global_step": 237347, "epoch": 1961} {"train_loss": -41.97336959838867, "global_step": 237348, "epoch": 1961} {"train_loss": -41.578739166259766, "global_step": 237349, "epoch": 1961} {"train_loss": -41.71210861206055, "global_step": 237350, "epoch": 1961} {"train_loss": -41.885597229003906, "global_step": 237351, "epoch": 1961} {"train_loss": -42.19857406616211, "global_step": 237352, "epoch": 1961} {"train_loss": -42.0575065612793, "global_step": 237353, "epoch": 1961} {"train_loss": -42.733673095703125, "global_step": 237354, "epoch": 1961} {"train_loss": -41.87173080444336, "global_step": 237355, "epoch": 1961} {"train_loss": -41.833106994628906, "global_step": 237356, "epoch": 1961} {"train_loss": -41.613014221191406, "global_step": 237357, "epoch": 1961} {"train_loss": -42.825294494628906, "global_step": 237358, "epoch": 1961} {"train_loss": -41.71906280517578, "global_step": 237359, "epoch": 1961} {"train_loss": -41.494197845458984, "global_step": 237360, "epoch": 1961} {"train_loss": -41.30796432495117, "global_step": 237361, "epoch": 1961} {"train_loss": -42.322303771972656, "global_step": 237362, "epoch": 1961} {"train_loss": -41.79539108276367, "global_step": 237363, "epoch": 1961} {"train_loss": -39.46409225463867, "global_step": 237364, "epoch": 1961} {"train_loss": -39.75514602661133, "global_step": 237365, "epoch": 1961} {"train_loss": -41.92129898071289, "global_step": 237366, "epoch": 1961} {"train_loss": -42.36452865600586, "global_step": 237367, "epoch": 1961} {"train_loss": -40.02485656738281, "global_step": 237368, "epoch": 1961} {"train_loss": -41.590267181396484, "global_step": 237369, "epoch": 1961} {"train_loss": -41.84748458862305, "global_step": 237370, "epoch": 1961} {"train_loss": -40.829627990722656, "global_step": 237371, "epoch": 1961} {"train_loss": -40.67461013793945, "global_step": 237372, "epoch": 1961} {"train_loss": -41.691463470458984, "global_step": 237373, "epoch": 1961} {"train_loss": -42.1216926574707, "global_step": 237374, "epoch": 1961} {"train_loss": -40.3372802734375, "global_step": 237375, "epoch": 1961} {"train_loss": -41.27492141723633, "global_step": 237376, "epoch": 1961} {"train_loss": -42.725467681884766, "global_step": 237377, "epoch": 1961} {"train_loss": -42.9018440246582, "global_step": 237378, "epoch": 1961} {"train_loss": -40.574668884277344, "global_step": 237379, "epoch": 1961} {"train_loss": -40.128936767578125, "global_step": 237380, "epoch": 1961} {"train_loss": -42.88229751586914, "global_step": 237381, "epoch": 1961} {"train_loss": -40.268211364746094, "global_step": 237382, "epoch": 1961} {"train_loss": -42.10310363769531, "global_step": 237383, "epoch": 1961} {"train_loss": -42.13401412963867, "global_step": 237384, "epoch": 1961} {"train_loss": -41.23927307128906, "global_step": 237385, "epoch": 1961} {"train_loss": -42.5413703918457, "global_step": 237386, "epoch": 1961} {"train_loss": -40.71232986450195, "global_step": 237387, "epoch": 1961} {"train_loss": -41.37546920776367, "global_step": 237388, "epoch": 1961} {"train_loss": -42.411006927490234, "global_step": 237389, "epoch": 1961} {"train_loss": -40.84450912475586, "global_step": 237390, "epoch": 1961} {"train_loss": -42.86470413208008, "global_step": 237391, "epoch": 1961} {"train_loss": -42.770851135253906, "global_step": 237392, "epoch": 1961} {"train_loss": -41.65195846557617, "global_step": 237393, "epoch": 1961} {"train_loss": -42.3255615234375, "global_step": 237394, "epoch": 1961} {"train_loss": -42.17411804199219, "global_step": 237395, "epoch": 1961} {"train_loss": -42.46363067626953, "global_step": 237396, "epoch": 1961} {"train_loss": -42.75584030151367, "global_step": 237397, "epoch": 1961} {"train_loss": -42.7659912109375, "global_step": 237398, "epoch": 1961} {"train_loss": -42.296607971191406, "global_step": 237399, "epoch": 1961} {"train_loss": -42.86224365234375, "global_step": 237400, "epoch": 1961} {"train_loss": -41.60286183002567, "global_step": 237401, "epoch": 1961, "val_loss": 2526185.0} {"train_loss": -42.13204574584961, "global_step": 237402, "epoch": 1962} {"train_loss": -43.08599853515625, "global_step": 237403, "epoch": 1962} {"train_loss": -42.44091796875, "global_step": 237404, "epoch": 1962} {"train_loss": -42.265201568603516, "global_step": 237405, "epoch": 1962} {"train_loss": -42.58517074584961, "global_step": 237406, "epoch": 1962} {"train_loss": -42.97626495361328, "global_step": 237407, "epoch": 1962} {"train_loss": -42.45172119140625, "global_step": 237408, "epoch": 1962} {"train_loss": -42.880001068115234, "global_step": 237409, "epoch": 1962} {"train_loss": -43.053749084472656, "global_step": 237410, "epoch": 1962} {"train_loss": -42.660888671875, "global_step": 237411, "epoch": 1962} {"train_loss": -42.75474166870117, "global_step": 237412, "epoch": 1962} {"train_loss": -42.28607177734375, "global_step": 237413, "epoch": 1962} {"train_loss": -43.06637191772461, "global_step": 237414, "epoch": 1962} {"train_loss": -42.830177307128906, "global_step": 237415, "epoch": 1962} {"train_loss": -42.88603591918945, "global_step": 237416, "epoch": 1962} {"train_loss": -43.23857116699219, "global_step": 237417, "epoch": 1962} {"train_loss": -42.71220779418945, "global_step": 237418, "epoch": 1962} {"train_loss": -43.071807861328125, "global_step": 237419, "epoch": 1962} {"train_loss": -43.55485153198242, "global_step": 237420, "epoch": 1962} {"train_loss": -43.1719970703125, "global_step": 237421, "epoch": 1962} {"train_loss": -43.084774017333984, "global_step": 237422, "epoch": 1962} {"train_loss": -43.31757354736328, "global_step": 237423, "epoch": 1962} {"train_loss": -43.01691436767578, "global_step": 237424, "epoch": 1962} {"train_loss": -43.32783126831055, "global_step": 237425, "epoch": 1962} {"train_loss": -41.68955612182617, "global_step": 237426, "epoch": 1962} {"train_loss": -43.71083068847656, "global_step": 237427, "epoch": 1962} {"train_loss": -43.72392654418945, "global_step": 237428, "epoch": 1962} {"train_loss": -43.607749938964844, "global_step": 237429, "epoch": 1962} {"train_loss": -43.69247055053711, "global_step": 237430, "epoch": 1962} {"train_loss": -43.07839584350586, "global_step": 237431, "epoch": 1962} {"train_loss": -43.27499008178711, "global_step": 237432, "epoch": 1962} {"train_loss": -43.786651611328125, "global_step": 237433, "epoch": 1962} {"train_loss": -43.781429290771484, "global_step": 237434, "epoch": 1962} {"train_loss": -43.90354537963867, "global_step": 237435, "epoch": 1962} {"train_loss": -43.21395492553711, "global_step": 237436, "epoch": 1962} {"train_loss": -43.05892562866211, "global_step": 237437, "epoch": 1962} {"train_loss": -42.547096252441406, "global_step": 237438, "epoch": 1962} {"train_loss": -42.757205963134766, "global_step": 237439, "epoch": 1962} {"train_loss": -43.48787307739258, "global_step": 237440, "epoch": 1962} {"train_loss": -42.862308502197266, "global_step": 237441, "epoch": 1962} {"train_loss": -42.83390426635742, "global_step": 237442, "epoch": 1962} {"train_loss": -42.20055389404297, "global_step": 237443, "epoch": 1962} {"train_loss": -43.32573318481445, "global_step": 237444, "epoch": 1962} {"train_loss": -41.95000457763672, "global_step": 237445, "epoch": 1962} {"train_loss": -39.352203369140625, "global_step": 237446, "epoch": 1962} {"train_loss": -41.322635650634766, "global_step": 237447, "epoch": 1962} {"train_loss": -42.99433898925781, "global_step": 237448, "epoch": 1962} {"train_loss": -41.744991302490234, "global_step": 237449, "epoch": 1962} {"train_loss": -41.8014030456543, "global_step": 237450, "epoch": 1962} {"train_loss": -42.77545928955078, "global_step": 237451, "epoch": 1962} {"train_loss": -42.27828598022461, "global_step": 237452, "epoch": 1962} {"train_loss": -40.05660629272461, "global_step": 237453, "epoch": 1962} {"train_loss": -40.32680130004883, "global_step": 237454, "epoch": 1962} {"train_loss": -37.139320373535156, "global_step": 237455, "epoch": 1962} {"train_loss": -41.82249069213867, "global_step": 237456, "epoch": 1962} {"train_loss": -40.785858154296875, "global_step": 237457, "epoch": 1962} {"train_loss": -39.162391662597656, "global_step": 237458, "epoch": 1962} {"train_loss": -42.42763900756836, "global_step": 237459, "epoch": 1962} {"train_loss": -39.495880126953125, "global_step": 237460, "epoch": 1962} {"train_loss": -40.145103454589844, "global_step": 237461, "epoch": 1962} {"train_loss": -40.564022064208984, "global_step": 237462, "epoch": 1962} {"train_loss": -41.625244140625, "global_step": 237463, "epoch": 1962} {"train_loss": -41.204219818115234, "global_step": 237464, "epoch": 1962} {"train_loss": -39.361297607421875, "global_step": 237465, "epoch": 1962} {"train_loss": -41.59232711791992, "global_step": 237466, "epoch": 1962} {"train_loss": -41.88124465942383, "global_step": 237467, "epoch": 1962} {"train_loss": -39.24506759643555, "global_step": 237468, "epoch": 1962} {"train_loss": -42.18645095825195, "global_step": 237469, "epoch": 1962} {"train_loss": -41.29392623901367, "global_step": 237470, "epoch": 1962} {"train_loss": -40.834747314453125, "global_step": 237471, "epoch": 1962} {"train_loss": -41.843868255615234, "global_step": 237472, "epoch": 1962} {"train_loss": -41.317771911621094, "global_step": 237473, "epoch": 1962} {"train_loss": -40.634273529052734, "global_step": 237474, "epoch": 1962} {"train_loss": -42.5594596862793, "global_step": 237475, "epoch": 1962} {"train_loss": -40.67261505126953, "global_step": 237476, "epoch": 1962} {"train_loss": -40.50887680053711, "global_step": 237477, "epoch": 1962} {"train_loss": -42.41334915161133, "global_step": 237478, "epoch": 1962} {"train_loss": -40.82059860229492, "global_step": 237479, "epoch": 1962} {"train_loss": -41.917659759521484, "global_step": 237480, "epoch": 1962} {"train_loss": -42.91921615600586, "global_step": 237481, "epoch": 1962} {"train_loss": -42.454315185546875, "global_step": 237482, "epoch": 1962} {"train_loss": -42.861305236816406, "global_step": 237483, "epoch": 1962} {"train_loss": -41.9800910949707, "global_step": 237484, "epoch": 1962} {"train_loss": -42.71339797973633, "global_step": 237485, "epoch": 1962} {"train_loss": -42.5523681640625, "global_step": 237486, "epoch": 1962} {"train_loss": -42.32784652709961, "global_step": 237487, "epoch": 1962} {"train_loss": -42.94161605834961, "global_step": 237488, "epoch": 1962} {"train_loss": -43.1721305847168, "global_step": 237489, "epoch": 1962} {"train_loss": -42.938106536865234, "global_step": 237490, "epoch": 1962} {"train_loss": -43.49306869506836, "global_step": 237491, "epoch": 1962} {"train_loss": -43.60390090942383, "global_step": 237492, "epoch": 1962} {"train_loss": -42.85810852050781, "global_step": 237493, "epoch": 1962} {"train_loss": -42.8958740234375, "global_step": 237494, "epoch": 1962} {"train_loss": -43.099849700927734, "global_step": 237495, "epoch": 1962} {"train_loss": -43.47307205200195, "global_step": 237496, "epoch": 1962} {"train_loss": -43.43499755859375, "global_step": 237497, "epoch": 1962} {"train_loss": -43.18889236450195, "global_step": 237498, "epoch": 1962} {"train_loss": -43.437564849853516, "global_step": 237499, "epoch": 1962} {"train_loss": -43.383056640625, "global_step": 237500, "epoch": 1962} {"train_loss": -43.57345199584961, "global_step": 237501, "epoch": 1962} {"train_loss": -43.41514205932617, "global_step": 237502, "epoch": 1962} {"train_loss": -42.91443634033203, "global_step": 237503, "epoch": 1962} {"train_loss": -42.87726974487305, "global_step": 237504, "epoch": 1962} {"train_loss": -42.41032028198242, "global_step": 237505, "epoch": 1962} {"train_loss": -43.56926345825195, "global_step": 237506, "epoch": 1962} {"train_loss": -43.208160400390625, "global_step": 237507, "epoch": 1962} {"train_loss": -42.959285736083984, "global_step": 237508, "epoch": 1962} {"train_loss": -42.72833251953125, "global_step": 237509, "epoch": 1962} {"train_loss": -42.42427062988281, "global_step": 237510, "epoch": 1962} {"train_loss": -43.31789779663086, "global_step": 237511, "epoch": 1962} {"train_loss": -43.45797348022461, "global_step": 237512, "epoch": 1962} {"train_loss": -43.643924713134766, "global_step": 237513, "epoch": 1962} {"train_loss": -43.66608810424805, "global_step": 237514, "epoch": 1962} {"train_loss": -44.080467224121094, "global_step": 237515, "epoch": 1962} {"train_loss": -42.969764709472656, "global_step": 237516, "epoch": 1962} {"train_loss": -43.39263153076172, "global_step": 237517, "epoch": 1962} {"train_loss": -43.491912841796875, "global_step": 237518, "epoch": 1962} {"train_loss": -42.813045501708984, "global_step": 237519, "epoch": 1962} {"train_loss": -43.16878890991211, "global_step": 237520, "epoch": 1962} {"train_loss": -43.612693786621094, "global_step": 237521, "epoch": 1962} {"train_loss": -42.46990550648082, "global_step": 237522, "epoch": 1962, "val_loss": 2579414.0} {"train_loss": -43.49177169799805, "global_step": 237523, "epoch": 1963} {"train_loss": -43.48356246948242, "global_step": 237524, "epoch": 1963} {"train_loss": -42.51385498046875, "global_step": 237525, "epoch": 1963} {"train_loss": -41.08026123046875, "global_step": 237526, "epoch": 1963} {"train_loss": -39.94601058959961, "global_step": 237527, "epoch": 1963} {"train_loss": -42.558807373046875, "global_step": 237528, "epoch": 1963} {"train_loss": -43.31438064575195, "global_step": 237529, "epoch": 1963} {"train_loss": -38.771053314208984, "global_step": 237530, "epoch": 1963} {"train_loss": -34.51040267944336, "global_step": 237531, "epoch": 1963} {"train_loss": -32.133575439453125, "global_step": 237532, "epoch": 1963} {"train_loss": -26.263351440429688, "global_step": 237533, "epoch": 1963} {"train_loss": -32.01974105834961, "global_step": 237534, "epoch": 1963} {"train_loss": -36.748191833496094, "global_step": 237535, "epoch": 1963} {"train_loss": -28.172758102416992, "global_step": 237536, "epoch": 1963} {"train_loss": -36.3236198425293, "global_step": 237537, "epoch": 1963} {"train_loss": -34.03695297241211, "global_step": 237538, "epoch": 1963} {"train_loss": -35.35511016845703, "global_step": 237539, "epoch": 1963} {"train_loss": -38.1098518371582, "global_step": 237540, "epoch": 1963} {"train_loss": -35.77705383300781, "global_step": 237541, "epoch": 1963} {"train_loss": -37.9068717956543, "global_step": 237542, "epoch": 1963} {"train_loss": -35.84462356567383, "global_step": 237543, "epoch": 1963} {"train_loss": -39.552520751953125, "global_step": 237544, "epoch": 1963} {"train_loss": -36.88611602783203, "global_step": 237545, "epoch": 1963} {"train_loss": -37.310359954833984, "global_step": 237546, "epoch": 1963} {"train_loss": -36.87531661987305, "global_step": 237547, "epoch": 1963} {"train_loss": -39.24752426147461, "global_step": 237548, "epoch": 1963} {"train_loss": -37.81767654418945, "global_step": 237549, "epoch": 1963} {"train_loss": -40.26886749267578, "global_step": 237550, "epoch": 1963} {"train_loss": -38.744712829589844, "global_step": 237551, "epoch": 1963} {"train_loss": -40.28291702270508, "global_step": 237552, "epoch": 1963} {"train_loss": -39.2091064453125, "global_step": 237553, "epoch": 1963} {"train_loss": -40.4525032043457, "global_step": 237554, "epoch": 1963} {"train_loss": -39.99372100830078, "global_step": 237555, "epoch": 1963} {"train_loss": -40.164119720458984, "global_step": 237556, "epoch": 1963} {"train_loss": -41.13248825073242, "global_step": 237557, "epoch": 1963} {"train_loss": -40.09552001953125, "global_step": 237558, "epoch": 1963} {"train_loss": -40.88837432861328, "global_step": 237559, "epoch": 1963} {"train_loss": -41.117034912109375, "global_step": 237560, "epoch": 1963} {"train_loss": -41.62194061279297, "global_step": 237561, "epoch": 1963} {"train_loss": -41.31174850463867, "global_step": 237562, "epoch": 1963} {"train_loss": -41.805274963378906, "global_step": 237563, "epoch": 1963} {"train_loss": -41.558101654052734, "global_step": 237564, "epoch": 1963} {"train_loss": -41.656005859375, "global_step": 237565, "epoch": 1963} {"train_loss": -41.98072052001953, "global_step": 237566, "epoch": 1963} {"train_loss": -41.54438400268555, "global_step": 237567, "epoch": 1963} {"train_loss": -41.62263870239258, "global_step": 237568, "epoch": 1963} {"train_loss": -41.78547286987305, "global_step": 237569, "epoch": 1963} {"train_loss": -41.92597579956055, "global_step": 237570, "epoch": 1963} {"train_loss": -42.5106086730957, "global_step": 237571, "epoch": 1963} {"train_loss": -41.7336311340332, "global_step": 237572, "epoch": 1963} {"train_loss": -42.57847595214844, "global_step": 237573, "epoch": 1963} {"train_loss": -42.53921127319336, "global_step": 237574, "epoch": 1963} {"train_loss": -42.540950775146484, "global_step": 237575, "epoch": 1963} {"train_loss": -42.48055648803711, "global_step": 237576, "epoch": 1963} {"train_loss": -42.96866226196289, "global_step": 237577, "epoch": 1963} {"train_loss": -42.68315887451172, "global_step": 237578, "epoch": 1963} {"train_loss": -42.570858001708984, "global_step": 237579, "epoch": 1963} {"train_loss": -43.04779815673828, "global_step": 237580, "epoch": 1963} {"train_loss": -42.8996467590332, "global_step": 237581, "epoch": 1963} {"train_loss": -42.706512451171875, "global_step": 237582, "epoch": 1963} {"train_loss": -42.5550422668457, "global_step": 237583, "epoch": 1963} {"train_loss": -42.9650993347168, "global_step": 237584, "epoch": 1963} {"train_loss": -43.431880950927734, "global_step": 237585, "epoch": 1963} {"train_loss": -42.490413665771484, "global_step": 237586, "epoch": 1963} {"train_loss": -43.2536506652832, "global_step": 237587, "epoch": 1963} {"train_loss": -42.97837448120117, "global_step": 237588, "epoch": 1963} {"train_loss": -43.11436080932617, "global_step": 237589, "epoch": 1963} {"train_loss": -43.174163818359375, "global_step": 237590, "epoch": 1963} {"train_loss": -43.37732696533203, "global_step": 237591, "epoch": 1963} {"train_loss": -43.15227127075195, "global_step": 237592, "epoch": 1963} {"train_loss": -42.95321273803711, "global_step": 237593, "epoch": 1963} {"train_loss": -43.3367919921875, "global_step": 237594, "epoch": 1963} {"train_loss": -43.9302978515625, "global_step": 237595, "epoch": 1963} {"train_loss": -42.18987274169922, "global_step": 237596, "epoch": 1963} {"train_loss": -42.675567626953125, "global_step": 237597, "epoch": 1963} {"train_loss": -43.1041374206543, "global_step": 237598, "epoch": 1963} {"train_loss": -42.25386428833008, "global_step": 237599, "epoch": 1963} {"train_loss": -43.40412521362305, "global_step": 237600, "epoch": 1963} {"train_loss": -43.34452819824219, "global_step": 237601, "epoch": 1963} {"train_loss": -42.83384704589844, "global_step": 237602, "epoch": 1963} {"train_loss": -43.524227142333984, "global_step": 237603, "epoch": 1963} {"train_loss": -43.65566635131836, "global_step": 237604, "epoch": 1963} {"train_loss": -43.7587890625, "global_step": 237605, "epoch": 1963} {"train_loss": -43.27680587768555, "global_step": 237606, "epoch": 1963} {"train_loss": -43.50145721435547, "global_step": 237607, "epoch": 1963} {"train_loss": -43.65367126464844, "global_step": 237608, "epoch": 1963} {"train_loss": -43.41130065917969, "global_step": 237609, "epoch": 1963} {"train_loss": -43.7014045715332, "global_step": 237610, "epoch": 1963} {"train_loss": -43.92555618286133, "global_step": 237611, "epoch": 1963} {"train_loss": -43.74385070800781, "global_step": 237612, "epoch": 1963} {"train_loss": -43.76925277709961, "global_step": 237613, "epoch": 1963} {"train_loss": -44.06819534301758, "global_step": 237614, "epoch": 1963} {"train_loss": -44.03178787231445, "global_step": 237615, "epoch": 1963} {"train_loss": -43.7325553894043, "global_step": 237616, "epoch": 1963} {"train_loss": -43.5643424987793, "global_step": 237617, "epoch": 1963} {"train_loss": -43.09834671020508, "global_step": 237618, "epoch": 1963} {"train_loss": -43.188568115234375, "global_step": 237619, "epoch": 1963} {"train_loss": -43.72076416015625, "global_step": 237620, "epoch": 1963} {"train_loss": -43.941375732421875, "global_step": 237621, "epoch": 1963} {"train_loss": -43.85968780517578, "global_step": 237622, "epoch": 1963} {"train_loss": -43.37420654296875, "global_step": 237623, "epoch": 1963} {"train_loss": -43.44514846801758, "global_step": 237624, "epoch": 1963} {"train_loss": -43.337703704833984, "global_step": 237625, "epoch": 1963} {"train_loss": -43.51416015625, "global_step": 237626, "epoch": 1963} {"train_loss": -43.802547454833984, "global_step": 237627, "epoch": 1963} {"train_loss": -43.21466064453125, "global_step": 237628, "epoch": 1963} {"train_loss": -41.8856315612793, "global_step": 237629, "epoch": 1963} {"train_loss": -41.978363037109375, "global_step": 237630, "epoch": 1963} {"train_loss": -40.19641876220703, "global_step": 237631, "epoch": 1963} {"train_loss": -42.559444427490234, "global_step": 237632, "epoch": 1963} {"train_loss": -42.44404983520508, "global_step": 237633, "epoch": 1963} {"train_loss": -42.3524055480957, "global_step": 237634, "epoch": 1963} {"train_loss": -40.624549865722656, "global_step": 237635, "epoch": 1963} {"train_loss": -39.51369857788086, "global_step": 237636, "epoch": 1963} {"train_loss": -42.50823974609375, "global_step": 237637, "epoch": 1963} {"train_loss": -43.746795654296875, "global_step": 237638, "epoch": 1963} {"train_loss": -41.635074615478516, "global_step": 237639, "epoch": 1963} {"train_loss": -38.889163970947266, "global_step": 237640, "epoch": 1963} {"train_loss": -38.62295150756836, "global_step": 237641, "epoch": 1963} {"train_loss": -38.359283447265625, "global_step": 237642, "epoch": 1963} {"train_loss": -41.22303675817064, "global_step": 237643, "epoch": 1963, "val_loss": 2627314.75} {"train_loss": -41.134403228759766, "global_step": 237644, "epoch": 1964} {"train_loss": -40.04738998413086, "global_step": 237645, "epoch": 1964} {"train_loss": -42.50164031982422, "global_step": 237646, "epoch": 1964} {"train_loss": -42.26289749145508, "global_step": 237647, "epoch": 1964} {"train_loss": -40.0264778137207, "global_step": 237648, "epoch": 1964} {"train_loss": -40.52942657470703, "global_step": 237649, "epoch": 1964} {"train_loss": -42.42665100097656, "global_step": 237650, "epoch": 1964} {"train_loss": -41.03956985473633, "global_step": 237651, "epoch": 1964} {"train_loss": -39.75394821166992, "global_step": 237652, "epoch": 1964} {"train_loss": -43.28239822387695, "global_step": 237653, "epoch": 1964} {"train_loss": -40.39406204223633, "global_step": 237654, "epoch": 1964} {"train_loss": -41.345245361328125, "global_step": 237655, "epoch": 1964} {"train_loss": -42.26167678833008, "global_step": 237656, "epoch": 1964} {"train_loss": -41.83662033081055, "global_step": 237657, "epoch": 1964} {"train_loss": -41.422298431396484, "global_step": 237658, "epoch": 1964} {"train_loss": -42.63395690917969, "global_step": 237659, "epoch": 1964} {"train_loss": -42.328922271728516, "global_step": 237660, "epoch": 1964} {"train_loss": -42.45197677612305, "global_step": 237661, "epoch": 1964} {"train_loss": -42.84000015258789, "global_step": 237662, "epoch": 1964} {"train_loss": -41.90366744995117, "global_step": 237663, "epoch": 1964} {"train_loss": -42.259639739990234, "global_step": 237664, "epoch": 1964} {"train_loss": -42.82075119018555, "global_step": 237665, "epoch": 1964} {"train_loss": -42.190284729003906, "global_step": 237666, "epoch": 1964} {"train_loss": -42.81245803833008, "global_step": 237667, "epoch": 1964} {"train_loss": -42.92421340942383, "global_step": 237668, "epoch": 1964} {"train_loss": -43.11375045776367, "global_step": 237669, "epoch": 1964} {"train_loss": -43.03329086303711, "global_step": 237670, "epoch": 1964} {"train_loss": -42.56420135498047, "global_step": 237671, "epoch": 1964} {"train_loss": -43.18777084350586, "global_step": 237672, "epoch": 1964} {"train_loss": -43.1976318359375, "global_step": 237673, "epoch": 1964} {"train_loss": -43.20469284057617, "global_step": 237674, "epoch": 1964} {"train_loss": -42.50360870361328, "global_step": 237675, "epoch": 1964} {"train_loss": -42.4399528503418, "global_step": 237676, "epoch": 1964} {"train_loss": -42.84251022338867, "global_step": 237677, "epoch": 1964} {"train_loss": -42.10441589355469, "global_step": 237678, "epoch": 1964} {"train_loss": -42.972930908203125, "global_step": 237679, "epoch": 1964} {"train_loss": -43.23749542236328, "global_step": 237680, "epoch": 1964} {"train_loss": -43.32942581176758, "global_step": 237681, "epoch": 1964} {"train_loss": -43.081478118896484, "global_step": 237682, "epoch": 1964} {"train_loss": -43.65987777709961, "global_step": 237683, "epoch": 1964} {"train_loss": -43.36908721923828, "global_step": 237684, "epoch": 1964} {"train_loss": -43.20704650878906, "global_step": 237685, "epoch": 1964} {"train_loss": -43.02225112915039, "global_step": 237686, "epoch": 1964} {"train_loss": -43.148563385009766, "global_step": 237687, "epoch": 1964} {"train_loss": -41.755062103271484, "global_step": 237688, "epoch": 1964} {"train_loss": -43.00445556640625, "global_step": 237689, "epoch": 1964} {"train_loss": -44.02421951293945, "global_step": 237690, "epoch": 1964} {"train_loss": -43.414649963378906, "global_step": 237691, "epoch": 1964} {"train_loss": -42.911190032958984, "global_step": 237692, "epoch": 1964} {"train_loss": -43.539466857910156, "global_step": 237693, "epoch": 1964} {"train_loss": -42.644287109375, "global_step": 237694, "epoch": 1964} {"train_loss": -42.43762969970703, "global_step": 237695, "epoch": 1964} {"train_loss": -42.56711959838867, "global_step": 237696, "epoch": 1964} {"train_loss": -43.983306884765625, "global_step": 237697, "epoch": 1964} {"train_loss": -43.47259521484375, "global_step": 237698, "epoch": 1964} {"train_loss": -41.88135528564453, "global_step": 237699, "epoch": 1964} {"train_loss": -43.14760971069336, "global_step": 237700, "epoch": 1964} {"train_loss": -40.799617767333984, "global_step": 237701, "epoch": 1964} {"train_loss": -40.66996383666992, "global_step": 237702, "epoch": 1964} {"train_loss": -42.301055908203125, "global_step": 237703, "epoch": 1964} {"train_loss": -42.30717086791992, "global_step": 237704, "epoch": 1964} {"train_loss": -43.21207809448242, "global_step": 237705, "epoch": 1964} {"train_loss": -42.479610443115234, "global_step": 237706, "epoch": 1964} {"train_loss": -41.64781188964844, "global_step": 237707, "epoch": 1964} {"train_loss": -43.18477249145508, "global_step": 237708, "epoch": 1964} {"train_loss": -42.58906173706055, "global_step": 237709, "epoch": 1964} {"train_loss": -43.56681442260742, "global_step": 237710, "epoch": 1964} {"train_loss": -42.13875961303711, "global_step": 237711, "epoch": 1964} {"train_loss": -43.40023422241211, "global_step": 237712, "epoch": 1964} {"train_loss": -41.88447952270508, "global_step": 237713, "epoch": 1964} {"train_loss": -42.50563049316406, "global_step": 237714, "epoch": 1964} {"train_loss": -42.23496627807617, "global_step": 237715, "epoch": 1964} {"train_loss": -38.57028579711914, "global_step": 237716, "epoch": 1964} {"train_loss": -42.69245147705078, "global_step": 237717, "epoch": 1964} {"train_loss": -42.35188674926758, "global_step": 237718, "epoch": 1964} {"train_loss": -43.2601432800293, "global_step": 237719, "epoch": 1964} {"train_loss": -42.6729621887207, "global_step": 237720, "epoch": 1964} {"train_loss": -43.12205123901367, "global_step": 237721, "epoch": 1964} {"train_loss": -42.180213928222656, "global_step": 237722, "epoch": 1964} {"train_loss": -42.702693939208984, "global_step": 237723, "epoch": 1964} {"train_loss": -40.30723571777344, "global_step": 237724, "epoch": 1964} {"train_loss": -42.72884750366211, "global_step": 237725, "epoch": 1964} {"train_loss": -42.157283782958984, "global_step": 237726, "epoch": 1964} {"train_loss": -42.64013671875, "global_step": 237727, "epoch": 1964} {"train_loss": -41.67525863647461, "global_step": 237728, "epoch": 1964} {"train_loss": -43.32416915893555, "global_step": 237729, "epoch": 1964} {"train_loss": -41.872047424316406, "global_step": 237730, "epoch": 1964} {"train_loss": -42.57950210571289, "global_step": 237731, "epoch": 1964} {"train_loss": -40.96961975097656, "global_step": 237732, "epoch": 1964} {"train_loss": -42.555110931396484, "global_step": 237733, "epoch": 1964} {"train_loss": -41.032772064208984, "global_step": 237734, "epoch": 1964} {"train_loss": -39.5399284362793, "global_step": 237735, "epoch": 1964} {"train_loss": -38.5297966003418, "global_step": 237736, "epoch": 1964} {"train_loss": -39.71942901611328, "global_step": 237737, "epoch": 1964} {"train_loss": -41.76691818237305, "global_step": 237738, "epoch": 1964} {"train_loss": -41.05631637573242, "global_step": 237739, "epoch": 1964} {"train_loss": -42.95747375488281, "global_step": 237740, "epoch": 1964} {"train_loss": -40.48582077026367, "global_step": 237741, "epoch": 1964} {"train_loss": -41.07495880126953, "global_step": 237742, "epoch": 1964} {"train_loss": -42.253414154052734, "global_step": 237743, "epoch": 1964} {"train_loss": -40.79240036010742, "global_step": 237744, "epoch": 1964} {"train_loss": -41.69955062866211, "global_step": 237745, "epoch": 1964} {"train_loss": -41.10024642944336, "global_step": 237746, "epoch": 1964} {"train_loss": -41.36872482299805, "global_step": 237747, "epoch": 1964} {"train_loss": -42.32912826538086, "global_step": 237748, "epoch": 1964} {"train_loss": -39.35095977783203, "global_step": 237749, "epoch": 1964} {"train_loss": -42.476932525634766, "global_step": 237750, "epoch": 1964} {"train_loss": -40.95990753173828, "global_step": 237751, "epoch": 1964} {"train_loss": -41.1351432800293, "global_step": 237752, "epoch": 1964} {"train_loss": -41.14219284057617, "global_step": 237753, "epoch": 1964} {"train_loss": -42.258018493652344, "global_step": 237754, "epoch": 1964} {"train_loss": -41.351341247558594, "global_step": 237755, "epoch": 1964} {"train_loss": -40.06653594970703, "global_step": 237756, "epoch": 1964} {"train_loss": -41.429134368896484, "global_step": 237757, "epoch": 1964} {"train_loss": -41.934593200683594, "global_step": 237758, "epoch": 1964} {"train_loss": -39.938575744628906, "global_step": 237759, "epoch": 1964} {"train_loss": -40.519744873046875, "global_step": 237760, "epoch": 1964} {"train_loss": -42.244964599609375, "global_step": 237761, "epoch": 1964} {"train_loss": -42.1381721496582, "global_step": 237762, "epoch": 1964} {"train_loss": -42.31685256958008, "global_step": 237763, "epoch": 1964} {"train_loss": -42.08178152919801, "global_step": 237764, "epoch": 1964, "val_loss": 2682378.5} {"train_loss": -42.27699661254883, "global_step": 237765, "epoch": 1965} {"train_loss": -42.1418571472168, "global_step": 237766, "epoch": 1965} {"train_loss": -43.02934646606445, "global_step": 237767, "epoch": 1965} {"train_loss": -40.66650390625, "global_step": 237768, "epoch": 1965} {"train_loss": -42.31435012817383, "global_step": 237769, "epoch": 1965} {"train_loss": -43.008052825927734, "global_step": 237770, "epoch": 1965} {"train_loss": -42.35321807861328, "global_step": 237771, "epoch": 1965} {"train_loss": -42.471004486083984, "global_step": 237772, "epoch": 1965} {"train_loss": -42.42888641357422, "global_step": 237773, "epoch": 1965} {"train_loss": -43.156768798828125, "global_step": 237774, "epoch": 1965} {"train_loss": -42.413368225097656, "global_step": 237775, "epoch": 1965} {"train_loss": -42.18303298950195, "global_step": 237776, "epoch": 1965} {"train_loss": -43.04006576538086, "global_step": 237777, "epoch": 1965} {"train_loss": -42.86139678955078, "global_step": 237778, "epoch": 1965} {"train_loss": -43.399261474609375, "global_step": 237779, "epoch": 1965} {"train_loss": -43.090736389160156, "global_step": 237780, "epoch": 1965} {"train_loss": -43.556236267089844, "global_step": 237781, "epoch": 1965} {"train_loss": -42.809810638427734, "global_step": 237782, "epoch": 1965} {"train_loss": -42.25786209106445, "global_step": 237783, "epoch": 1965} {"train_loss": -41.95064926147461, "global_step": 237784, "epoch": 1965} {"train_loss": -42.0148811340332, "global_step": 237785, "epoch": 1965} {"train_loss": -40.87601089477539, "global_step": 237786, "epoch": 1965} {"train_loss": -41.0606803894043, "global_step": 237787, "epoch": 1965} {"train_loss": -42.716949462890625, "global_step": 237788, "epoch": 1965} {"train_loss": -42.88959503173828, "global_step": 237789, "epoch": 1965} {"train_loss": -41.79374313354492, "global_step": 237790, "epoch": 1965} {"train_loss": -42.96702575683594, "global_step": 237791, "epoch": 1965} {"train_loss": -42.785255432128906, "global_step": 237792, "epoch": 1965} {"train_loss": -42.08979797363281, "global_step": 237793, "epoch": 1965} {"train_loss": -43.3614616394043, "global_step": 237794, "epoch": 1965} {"train_loss": -42.34389877319336, "global_step": 237795, "epoch": 1965} {"train_loss": -43.36982345581055, "global_step": 237796, "epoch": 1965} {"train_loss": -43.456024169921875, "global_step": 237797, "epoch": 1965} {"train_loss": -42.494625091552734, "global_step": 237798, "epoch": 1965} {"train_loss": -43.453857421875, "global_step": 237799, "epoch": 1965} {"train_loss": -42.30891036987305, "global_step": 237800, "epoch": 1965} {"train_loss": -43.12139129638672, "global_step": 237801, "epoch": 1965} {"train_loss": -43.277740478515625, "global_step": 237802, "epoch": 1965} {"train_loss": -43.293575286865234, "global_step": 237803, "epoch": 1965} {"train_loss": -43.29790496826172, "global_step": 237804, "epoch": 1965} {"train_loss": -41.969825744628906, "global_step": 237805, "epoch": 1965} {"train_loss": -40.923065185546875, "global_step": 237806, "epoch": 1965} {"train_loss": -42.01195526123047, "global_step": 237807, "epoch": 1965} {"train_loss": -42.55625534057617, "global_step": 237808, "epoch": 1965} {"train_loss": -43.52357482910156, "global_step": 237809, "epoch": 1965} {"train_loss": -42.71181869506836, "global_step": 237810, "epoch": 1965} {"train_loss": -43.33669662475586, "global_step": 237811, "epoch": 1965} {"train_loss": -43.340999603271484, "global_step": 237812, "epoch": 1965} {"train_loss": -42.719337463378906, "global_step": 237813, "epoch": 1965} {"train_loss": -43.385799407958984, "global_step": 237814, "epoch": 1965} {"train_loss": -43.91233444213867, "global_step": 237815, "epoch": 1965} {"train_loss": -43.18589782714844, "global_step": 237816, "epoch": 1965} {"train_loss": -43.80012512207031, "global_step": 237817, "epoch": 1965} {"train_loss": -42.885860443115234, "global_step": 237818, "epoch": 1965} {"train_loss": -43.18899154663086, "global_step": 237819, "epoch": 1965} {"train_loss": -43.27952194213867, "global_step": 237820, "epoch": 1965} {"train_loss": -43.611175537109375, "global_step": 237821, "epoch": 1965} {"train_loss": -43.59165573120117, "global_step": 237822, "epoch": 1965} {"train_loss": -43.30584716796875, "global_step": 237823, "epoch": 1965} {"train_loss": -43.555946350097656, "global_step": 237824, "epoch": 1965} {"train_loss": -43.051509857177734, "global_step": 237825, "epoch": 1965} {"train_loss": -42.569496154785156, "global_step": 237826, "epoch": 1965} {"train_loss": -43.382991790771484, "global_step": 237827, "epoch": 1965} {"train_loss": -43.29079818725586, "global_step": 237828, "epoch": 1965} {"train_loss": -43.11506271362305, "global_step": 237829, "epoch": 1965} {"train_loss": -43.4515380859375, "global_step": 237830, "epoch": 1965} {"train_loss": -43.27207565307617, "global_step": 237831, "epoch": 1965} {"train_loss": -43.71268844604492, "global_step": 237832, "epoch": 1965} {"train_loss": -42.88998794555664, "global_step": 237833, "epoch": 1965} {"train_loss": -42.5398063659668, "global_step": 237834, "epoch": 1965} {"train_loss": -42.21781539916992, "global_step": 237835, "epoch": 1965} {"train_loss": -42.66227340698242, "global_step": 237836, "epoch": 1965} {"train_loss": -42.61943054199219, "global_step": 237837, "epoch": 1965} {"train_loss": -43.215938568115234, "global_step": 237838, "epoch": 1965} {"train_loss": -43.21368408203125, "global_step": 237839, "epoch": 1965} {"train_loss": -42.571075439453125, "global_step": 237840, "epoch": 1965} {"train_loss": -42.35846710205078, "global_step": 237841, "epoch": 1965} {"train_loss": -40.9799690246582, "global_step": 237842, "epoch": 1965} {"train_loss": -41.99160385131836, "global_step": 237843, "epoch": 1965} {"train_loss": -42.640960693359375, "global_step": 237844, "epoch": 1965} {"train_loss": -42.193912506103516, "global_step": 237845, "epoch": 1965} {"train_loss": -41.238677978515625, "global_step": 237846, "epoch": 1965} {"train_loss": -42.04418182373047, "global_step": 237847, "epoch": 1965} {"train_loss": -42.85773468017578, "global_step": 237848, "epoch": 1965} {"train_loss": -42.981868743896484, "global_step": 237849, "epoch": 1965} {"train_loss": -42.338592529296875, "global_step": 237850, "epoch": 1965} {"train_loss": -42.553321838378906, "global_step": 237851, "epoch": 1965} {"train_loss": -41.95292282104492, "global_step": 237852, "epoch": 1965} {"train_loss": -42.798866271972656, "global_step": 237853, "epoch": 1965} {"train_loss": -42.441490173339844, "global_step": 237854, "epoch": 1965} {"train_loss": -42.6393928527832, "global_step": 237855, "epoch": 1965} {"train_loss": -42.01335525512695, "global_step": 237856, "epoch": 1965} {"train_loss": -41.2673225402832, "global_step": 237857, "epoch": 1965} {"train_loss": -41.15721130371094, "global_step": 237858, "epoch": 1965} {"train_loss": -42.1275634765625, "global_step": 237859, "epoch": 1965} {"train_loss": -43.02927780151367, "global_step": 237860, "epoch": 1965} {"train_loss": -41.9027214050293, "global_step": 237861, "epoch": 1965} {"train_loss": -42.56035232543945, "global_step": 237862, "epoch": 1965} {"train_loss": -40.88640213012695, "global_step": 237863, "epoch": 1965} {"train_loss": -39.28375244140625, "global_step": 237864, "epoch": 1965} {"train_loss": -43.086490631103516, "global_step": 237865, "epoch": 1965} {"train_loss": -38.92218017578125, "global_step": 237866, "epoch": 1965} {"train_loss": -41.76859664916992, "global_step": 237867, "epoch": 1965} {"train_loss": -42.76295852661133, "global_step": 237868, "epoch": 1965} {"train_loss": -41.82780075073242, "global_step": 237869, "epoch": 1965} {"train_loss": -40.705806732177734, "global_step": 237870, "epoch": 1965} {"train_loss": -42.31000518798828, "global_step": 237871, "epoch": 1965} {"train_loss": -42.553619384765625, "global_step": 237872, "epoch": 1965} {"train_loss": -42.04337692260742, "global_step": 237873, "epoch": 1965} {"train_loss": -42.587738037109375, "global_step": 237874, "epoch": 1965} {"train_loss": -43.04966735839844, "global_step": 237875, "epoch": 1965} {"train_loss": -40.53550338745117, "global_step": 237876, "epoch": 1965} {"train_loss": -41.05418014526367, "global_step": 237877, "epoch": 1965} {"train_loss": -42.6952018737793, "global_step": 237878, "epoch": 1965} {"train_loss": -39.10299301147461, "global_step": 237879, "epoch": 1965} {"train_loss": -40.02675247192383, "global_step": 237880, "epoch": 1965} {"train_loss": -41.058990478515625, "global_step": 237881, "epoch": 1965} {"train_loss": -41.64433670043945, "global_step": 237882, "epoch": 1965} {"train_loss": -42.0139274597168, "global_step": 237883, "epoch": 1965} {"train_loss": -41.903804779052734, "global_step": 237884, "epoch": 1965} {"train_loss": -42.435944896098995, "global_step": 237885, "epoch": 1965, "val_loss": 2643157.75} {"train_loss": -43.174530029296875, "global_step": 237886, "epoch": 1966} {"train_loss": -41.760372161865234, "global_step": 237887, "epoch": 1966} {"train_loss": -43.20856857299805, "global_step": 237888, "epoch": 1966} {"train_loss": -42.11030960083008, "global_step": 237889, "epoch": 1966} {"train_loss": -42.76312255859375, "global_step": 237890, "epoch": 1966} {"train_loss": -42.202552795410156, "global_step": 237891, "epoch": 1966} {"train_loss": -43.134613037109375, "global_step": 237892, "epoch": 1966} {"train_loss": -42.729042053222656, "global_step": 237893, "epoch": 1966} {"train_loss": -42.20374298095703, "global_step": 237894, "epoch": 1966} {"train_loss": -43.26975631713867, "global_step": 237895, "epoch": 1966} {"train_loss": -41.33620071411133, "global_step": 237896, "epoch": 1966} {"train_loss": -41.18630599975586, "global_step": 237897, "epoch": 1966} {"train_loss": -42.737281799316406, "global_step": 237898, "epoch": 1966} {"train_loss": -42.534664154052734, "global_step": 237899, "epoch": 1966} {"train_loss": -42.10870361328125, "global_step": 237900, "epoch": 1966} {"train_loss": -42.69246292114258, "global_step": 237901, "epoch": 1966} {"train_loss": -42.61080551147461, "global_step": 237902, "epoch": 1966} {"train_loss": -42.97102737426758, "global_step": 237903, "epoch": 1966} {"train_loss": -43.262393951416016, "global_step": 237904, "epoch": 1966} {"train_loss": -42.97023391723633, "global_step": 237905, "epoch": 1966} {"train_loss": -42.030982971191406, "global_step": 237906, "epoch": 1966} {"train_loss": -42.70035934448242, "global_step": 237907, "epoch": 1966} {"train_loss": -42.246925354003906, "global_step": 237908, "epoch": 1966} {"train_loss": -42.16960525512695, "global_step": 237909, "epoch": 1966} {"train_loss": -42.83273696899414, "global_step": 237910, "epoch": 1966} {"train_loss": -41.980377197265625, "global_step": 237911, "epoch": 1966} {"train_loss": -43.31414794921875, "global_step": 237912, "epoch": 1966} {"train_loss": -42.95104217529297, "global_step": 237913, "epoch": 1966} {"train_loss": -43.0711669921875, "global_step": 237914, "epoch": 1966} {"train_loss": -42.75685501098633, "global_step": 237915, "epoch": 1966} {"train_loss": -42.4639892578125, "global_step": 237916, "epoch": 1966} {"train_loss": -42.711280822753906, "global_step": 237917, "epoch": 1966} {"train_loss": -42.950782775878906, "global_step": 237918, "epoch": 1966} {"train_loss": -42.720088958740234, "global_step": 237919, "epoch": 1966} {"train_loss": -42.65149688720703, "global_step": 237920, "epoch": 1966} {"train_loss": -42.821407318115234, "global_step": 237921, "epoch": 1966} {"train_loss": -42.59343338012695, "global_step": 237922, "epoch": 1966} {"train_loss": -43.132301330566406, "global_step": 237923, "epoch": 1966} {"train_loss": -43.35714340209961, "global_step": 237924, "epoch": 1966} {"train_loss": -43.054527282714844, "global_step": 237925, "epoch": 1966} {"train_loss": -42.559959411621094, "global_step": 237926, "epoch": 1966} {"train_loss": -43.579566955566406, "global_step": 237927, "epoch": 1966} {"train_loss": -42.828338623046875, "global_step": 237928, "epoch": 1966} {"train_loss": -44.03390121459961, "global_step": 237929, "epoch": 1966} {"train_loss": -42.893917083740234, "global_step": 237930, "epoch": 1966} {"train_loss": -43.46851348876953, "global_step": 237931, "epoch": 1966} {"train_loss": -43.1776123046875, "global_step": 237932, "epoch": 1966} {"train_loss": -43.70429229736328, "global_step": 237933, "epoch": 1966} {"train_loss": -43.35111618041992, "global_step": 237934, "epoch": 1966} {"train_loss": -42.75837707519531, "global_step": 237935, "epoch": 1966} {"train_loss": -43.10858154296875, "global_step": 237936, "epoch": 1966} {"train_loss": -42.6241569519043, "global_step": 237937, "epoch": 1966} {"train_loss": -42.383243560791016, "global_step": 237938, "epoch": 1966} {"train_loss": -43.85728073120117, "global_step": 237939, "epoch": 1966} {"train_loss": -42.5766716003418, "global_step": 237940, "epoch": 1966} {"train_loss": -42.24198532104492, "global_step": 237941, "epoch": 1966} {"train_loss": -43.16358947753906, "global_step": 237942, "epoch": 1966} {"train_loss": -41.91962814331055, "global_step": 237943, "epoch": 1966} {"train_loss": -41.6177864074707, "global_step": 237944, "epoch": 1966} {"train_loss": -40.86226272583008, "global_step": 237945, "epoch": 1966} {"train_loss": -41.33820343017578, "global_step": 237946, "epoch": 1966} {"train_loss": -42.21885299682617, "global_step": 237947, "epoch": 1966} {"train_loss": -40.81507110595703, "global_step": 237948, "epoch": 1966} {"train_loss": -41.920711517333984, "global_step": 237949, "epoch": 1966} {"train_loss": -40.68634796142578, "global_step": 237950, "epoch": 1966} {"train_loss": -42.565486907958984, "global_step": 237951, "epoch": 1966} {"train_loss": -41.904170989990234, "global_step": 237952, "epoch": 1966} {"train_loss": -42.09086990356445, "global_step": 237953, "epoch": 1966} {"train_loss": -42.5594596862793, "global_step": 237954, "epoch": 1966} {"train_loss": -41.56734085083008, "global_step": 237955, "epoch": 1966} {"train_loss": -42.095924377441406, "global_step": 237956, "epoch": 1966} {"train_loss": -40.43635177612305, "global_step": 237957, "epoch": 1966} {"train_loss": -41.5308723449707, "global_step": 237958, "epoch": 1966} {"train_loss": -40.355682373046875, "global_step": 237959, "epoch": 1966} {"train_loss": -42.00680160522461, "global_step": 237960, "epoch": 1966} {"train_loss": -40.12380599975586, "global_step": 237961, "epoch": 1966} {"train_loss": -41.329166412353516, "global_step": 237962, "epoch": 1966} {"train_loss": -41.565032958984375, "global_step": 237963, "epoch": 1966} {"train_loss": -41.735076904296875, "global_step": 237964, "epoch": 1966} {"train_loss": -42.04999542236328, "global_step": 237965, "epoch": 1966} {"train_loss": -41.121299743652344, "global_step": 237966, "epoch": 1966} {"train_loss": -41.846961975097656, "global_step": 237967, "epoch": 1966} {"train_loss": -42.76882553100586, "global_step": 237968, "epoch": 1966} {"train_loss": -41.981422424316406, "global_step": 237969, "epoch": 1966} {"train_loss": -41.9995002746582, "global_step": 237970, "epoch": 1966} {"train_loss": -42.279632568359375, "global_step": 237971, "epoch": 1966} {"train_loss": -42.08679962158203, "global_step": 237972, "epoch": 1966} {"train_loss": -41.01054000854492, "global_step": 237973, "epoch": 1966} {"train_loss": -42.43974685668945, "global_step": 237974, "epoch": 1966} {"train_loss": -42.721351623535156, "global_step": 237975, "epoch": 1966} {"train_loss": -42.08907699584961, "global_step": 237976, "epoch": 1966} {"train_loss": -40.912986755371094, "global_step": 237977, "epoch": 1966} {"train_loss": -42.92158126831055, "global_step": 237978, "epoch": 1966} {"train_loss": -42.66520309448242, "global_step": 237979, "epoch": 1966} {"train_loss": -40.6923713684082, "global_step": 237980, "epoch": 1966} {"train_loss": -42.880218505859375, "global_step": 237981, "epoch": 1966} {"train_loss": -41.996402740478516, "global_step": 237982, "epoch": 1966} {"train_loss": -42.58749008178711, "global_step": 237983, "epoch": 1966} {"train_loss": -41.85824203491211, "global_step": 237984, "epoch": 1966} {"train_loss": -42.0321044921875, "global_step": 237985, "epoch": 1966} {"train_loss": -42.978271484375, "global_step": 237986, "epoch": 1966} {"train_loss": -42.46310043334961, "global_step": 237987, "epoch": 1966} {"train_loss": -42.16831588745117, "global_step": 237988, "epoch": 1966} {"train_loss": -42.992733001708984, "global_step": 237989, "epoch": 1966} {"train_loss": -42.94321060180664, "global_step": 237990, "epoch": 1966} {"train_loss": -43.635005950927734, "global_step": 237991, "epoch": 1966} {"train_loss": -42.53644943237305, "global_step": 237992, "epoch": 1966} {"train_loss": -43.49199295043945, "global_step": 237993, "epoch": 1966} {"train_loss": -43.164058685302734, "global_step": 237994, "epoch": 1966} {"train_loss": -43.881710052490234, "global_step": 237995, "epoch": 1966} {"train_loss": -42.63798141479492, "global_step": 237996, "epoch": 1966} {"train_loss": -43.77093505859375, "global_step": 237997, "epoch": 1966} {"train_loss": -43.309879302978516, "global_step": 237998, "epoch": 1966} {"train_loss": -43.284912109375, "global_step": 237999, "epoch": 1966} {"train_loss": -43.36320495605469, "global_step": 238000, "epoch": 1966} {"train_loss": -43.37997817993164, "global_step": 238001, "epoch": 1966} {"train_loss": -43.559326171875, "global_step": 238002, "epoch": 1966} {"train_loss": -43.6934700012207, "global_step": 238003, "epoch": 1966} {"train_loss": -43.938236236572266, "global_step": 238004, "epoch": 1966} {"train_loss": -43.44464874267578, "global_step": 238005, "epoch": 1966} {"train_loss": -42.49996856815559, "global_step": 238006, "epoch": 1966, "val_loss": 2624439.5} {"train_loss": -43.48856735229492, "global_step": 238007, "epoch": 1967} {"train_loss": -44.07594680786133, "global_step": 238008, "epoch": 1967} {"train_loss": -43.44870376586914, "global_step": 238009, "epoch": 1967} {"train_loss": -43.394283294677734, "global_step": 238010, "epoch": 1967} {"train_loss": -44.12629318237305, "global_step": 238011, "epoch": 1967} {"train_loss": -43.970523834228516, "global_step": 238012, "epoch": 1967} {"train_loss": -43.78679275512695, "global_step": 238013, "epoch": 1967} {"train_loss": -43.83585739135742, "global_step": 238014, "epoch": 1967} {"train_loss": -44.15353775024414, "global_step": 238015, "epoch": 1967} {"train_loss": -44.136653900146484, "global_step": 238016, "epoch": 1967} {"train_loss": -43.43409729003906, "global_step": 238017, "epoch": 1967} {"train_loss": -42.16930389404297, "global_step": 238018, "epoch": 1967} {"train_loss": -41.397579193115234, "global_step": 238019, "epoch": 1967} {"train_loss": -42.81827163696289, "global_step": 238020, "epoch": 1967} {"train_loss": -43.51310729980469, "global_step": 238021, "epoch": 1967} {"train_loss": -43.1894416809082, "global_step": 238022, "epoch": 1967} {"train_loss": -43.87744140625, "global_step": 238023, "epoch": 1967} {"train_loss": -43.72856521606445, "global_step": 238024, "epoch": 1967} {"train_loss": -43.74321746826172, "global_step": 238025, "epoch": 1967} {"train_loss": -43.05135726928711, "global_step": 238026, "epoch": 1967} {"train_loss": -42.745052337646484, "global_step": 238027, "epoch": 1967} {"train_loss": -43.677772521972656, "global_step": 238028, "epoch": 1967} {"train_loss": -43.9136962890625, "global_step": 238029, "epoch": 1967} {"train_loss": -43.0889892578125, "global_step": 238030, "epoch": 1967} {"train_loss": -43.14700698852539, "global_step": 238031, "epoch": 1967} {"train_loss": -43.90357208251953, "global_step": 238032, "epoch": 1967} {"train_loss": -43.8552360534668, "global_step": 238033, "epoch": 1967} {"train_loss": -43.51822280883789, "global_step": 238034, "epoch": 1967} {"train_loss": -43.36369705200195, "global_step": 238035, "epoch": 1967} {"train_loss": -43.80107879638672, "global_step": 238036, "epoch": 1967} {"train_loss": -43.96574783325195, "global_step": 238037, "epoch": 1967} {"train_loss": -43.26361083984375, "global_step": 238038, "epoch": 1967} {"train_loss": -43.87816619873047, "global_step": 238039, "epoch": 1967} {"train_loss": -43.42838668823242, "global_step": 238040, "epoch": 1967} {"train_loss": -43.6456413269043, "global_step": 238041, "epoch": 1967} {"train_loss": -43.618465423583984, "global_step": 238042, "epoch": 1967} {"train_loss": -43.726593017578125, "global_step": 238043, "epoch": 1967} {"train_loss": -42.91285705566406, "global_step": 238044, "epoch": 1967} {"train_loss": -42.99927520751953, "global_step": 238045, "epoch": 1967} {"train_loss": -41.07725524902344, "global_step": 238046, "epoch": 1967} {"train_loss": -40.725521087646484, "global_step": 238047, "epoch": 1967} {"train_loss": -42.52469253540039, "global_step": 238048, "epoch": 1967} {"train_loss": -43.07754135131836, "global_step": 238049, "epoch": 1967} {"train_loss": -42.33712387084961, "global_step": 238050, "epoch": 1967} {"train_loss": -37.72724151611328, "global_step": 238051, "epoch": 1967} {"train_loss": -36.83613204956055, "global_step": 238052, "epoch": 1967} {"train_loss": -40.98067855834961, "global_step": 238053, "epoch": 1967} {"train_loss": -38.32166290283203, "global_step": 238054, "epoch": 1967} {"train_loss": -37.597408294677734, "global_step": 238055, "epoch": 1967} {"train_loss": -38.195159912109375, "global_step": 238056, "epoch": 1967} {"train_loss": -37.14295196533203, "global_step": 238057, "epoch": 1967} {"train_loss": -37.65523147583008, "global_step": 238058, "epoch": 1967} {"train_loss": -37.90550231933594, "global_step": 238059, "epoch": 1967} {"train_loss": -38.24256896972656, "global_step": 238060, "epoch": 1967} {"train_loss": -37.997093200683594, "global_step": 238061, "epoch": 1967} {"train_loss": -39.916316986083984, "global_step": 238062, "epoch": 1967} {"train_loss": -40.53666305541992, "global_step": 238063, "epoch": 1967} {"train_loss": -40.51410675048828, "global_step": 238064, "epoch": 1967} {"train_loss": -40.3875617980957, "global_step": 238065, "epoch": 1967} {"train_loss": -40.61613845825195, "global_step": 238066, "epoch": 1967} {"train_loss": -38.56338119506836, "global_step": 238067, "epoch": 1967} {"train_loss": -41.056575775146484, "global_step": 238068, "epoch": 1967} {"train_loss": -39.23353958129883, "global_step": 238069, "epoch": 1967} {"train_loss": -40.67617416381836, "global_step": 238070, "epoch": 1967} {"train_loss": -41.85994338989258, "global_step": 238071, "epoch": 1967} {"train_loss": -41.555519104003906, "global_step": 238072, "epoch": 1967} {"train_loss": -42.37113952636719, "global_step": 238073, "epoch": 1967} {"train_loss": -41.2698860168457, "global_step": 238074, "epoch": 1967} {"train_loss": -40.3466682434082, "global_step": 238075, "epoch": 1967} {"train_loss": -41.09130859375, "global_step": 238076, "epoch": 1967} {"train_loss": -40.776649475097656, "global_step": 238077, "epoch": 1967} {"train_loss": -41.85394287109375, "global_step": 238078, "epoch": 1967} {"train_loss": -42.870845794677734, "global_step": 238079, "epoch": 1967} {"train_loss": -41.390098571777344, "global_step": 238080, "epoch": 1967} {"train_loss": -42.496978759765625, "global_step": 238081, "epoch": 1967} {"train_loss": -42.01980209350586, "global_step": 238082, "epoch": 1967} {"train_loss": -42.65592575073242, "global_step": 238083, "epoch": 1967} {"train_loss": -42.17327880859375, "global_step": 238084, "epoch": 1967} {"train_loss": -43.42323684692383, "global_step": 238085, "epoch": 1967} {"train_loss": -42.802364349365234, "global_step": 238086, "epoch": 1967} {"train_loss": -43.49332046508789, "global_step": 238087, "epoch": 1967} {"train_loss": -42.41261291503906, "global_step": 238088, "epoch": 1967} {"train_loss": -43.71434783935547, "global_step": 238089, "epoch": 1967} {"train_loss": -42.79807662963867, "global_step": 238090, "epoch": 1967} {"train_loss": -43.17812728881836, "global_step": 238091, "epoch": 1967} {"train_loss": -42.84345626831055, "global_step": 238092, "epoch": 1967} {"train_loss": -42.55258560180664, "global_step": 238093, "epoch": 1967} {"train_loss": -42.68507766723633, "global_step": 238094, "epoch": 1967} {"train_loss": -41.61824417114258, "global_step": 238095, "epoch": 1967} {"train_loss": -40.14221954345703, "global_step": 238096, "epoch": 1967} {"train_loss": -42.1591682434082, "global_step": 238097, "epoch": 1967} {"train_loss": -42.872318267822266, "global_step": 238098, "epoch": 1967} {"train_loss": -43.39945602416992, "global_step": 238099, "epoch": 1967} {"train_loss": -43.11775207519531, "global_step": 238100, "epoch": 1967} {"train_loss": -43.1801872253418, "global_step": 238101, "epoch": 1967} {"train_loss": -43.33781433105469, "global_step": 238102, "epoch": 1967} {"train_loss": -42.92180252075195, "global_step": 238103, "epoch": 1967} {"train_loss": -37.382144927978516, "global_step": 238104, "epoch": 1967} {"train_loss": -40.90970993041992, "global_step": 238105, "epoch": 1967} {"train_loss": -42.9705924987793, "global_step": 238106, "epoch": 1967} {"train_loss": -43.018943786621094, "global_step": 238107, "epoch": 1967} {"train_loss": -42.970916748046875, "global_step": 238108, "epoch": 1967} {"train_loss": -42.12559509277344, "global_step": 238109, "epoch": 1967} {"train_loss": -42.081119537353516, "global_step": 238110, "epoch": 1967} {"train_loss": -41.75825119018555, "global_step": 238111, "epoch": 1967} {"train_loss": -41.18752670288086, "global_step": 238112, "epoch": 1967} {"train_loss": -41.69407272338867, "global_step": 238113, "epoch": 1967} {"train_loss": -41.121517181396484, "global_step": 238114, "epoch": 1967} {"train_loss": -41.016658782958984, "global_step": 238115, "epoch": 1967} {"train_loss": -41.62410354614258, "global_step": 238116, "epoch": 1967} {"train_loss": -41.51118850708008, "global_step": 238117, "epoch": 1967} {"train_loss": -37.741485595703125, "global_step": 238118, "epoch": 1967} {"train_loss": -39.632537841796875, "global_step": 238119, "epoch": 1967} {"train_loss": -40.70111083984375, "global_step": 238120, "epoch": 1967} {"train_loss": -36.18132400512695, "global_step": 238121, "epoch": 1967} {"train_loss": -41.16079330444336, "global_step": 238122, "epoch": 1967} {"train_loss": -40.81990051269531, "global_step": 238123, "epoch": 1967} {"train_loss": -41.771297454833984, "global_step": 238124, "epoch": 1967} {"train_loss": -41.00545120239258, "global_step": 238125, "epoch": 1967} {"train_loss": -41.41585159301758, "global_step": 238126, "epoch": 1967} {"train_loss": -41.86981579488959, "global_step": 238127, "epoch": 1967, "val_loss": 2507351.75} {"train_loss": -42.058616638183594, "global_step": 238128, "epoch": 1968} {"train_loss": -40.48808288574219, "global_step": 238129, "epoch": 1968} {"train_loss": -40.257076263427734, "global_step": 238130, "epoch": 1968} {"train_loss": -41.497825622558594, "global_step": 238131, "epoch": 1968} {"train_loss": -42.133365631103516, "global_step": 238132, "epoch": 1968} {"train_loss": -41.5428466796875, "global_step": 238133, "epoch": 1968} {"train_loss": -39.593658447265625, "global_step": 238134, "epoch": 1968} {"train_loss": -42.571632385253906, "global_step": 238135, "epoch": 1968} {"train_loss": -37.665157318115234, "global_step": 238136, "epoch": 1968} {"train_loss": -41.825775146484375, "global_step": 238137, "epoch": 1968} {"train_loss": -40.522369384765625, "global_step": 238138, "epoch": 1968} {"train_loss": -41.650081634521484, "global_step": 238139, "epoch": 1968} {"train_loss": -41.796932220458984, "global_step": 238140, "epoch": 1968} {"train_loss": -42.4960823059082, "global_step": 238141, "epoch": 1968} {"train_loss": -40.332271575927734, "global_step": 238142, "epoch": 1968} {"train_loss": -40.37561798095703, "global_step": 238143, "epoch": 1968} {"train_loss": -41.421810150146484, "global_step": 238144, "epoch": 1968} {"train_loss": -42.04195022583008, "global_step": 238145, "epoch": 1968} {"train_loss": -41.3084831237793, "global_step": 238146, "epoch": 1968} {"train_loss": -40.65877151489258, "global_step": 238147, "epoch": 1968} {"train_loss": -42.18613815307617, "global_step": 238148, "epoch": 1968} {"train_loss": -42.81533432006836, "global_step": 238149, "epoch": 1968} {"train_loss": -42.34525680541992, "global_step": 238150, "epoch": 1968} {"train_loss": -39.6689567565918, "global_step": 238151, "epoch": 1968} {"train_loss": -41.20835494995117, "global_step": 238152, "epoch": 1968} {"train_loss": -42.59849166870117, "global_step": 238153, "epoch": 1968} {"train_loss": -41.86082077026367, "global_step": 238154, "epoch": 1968} {"train_loss": -42.155757904052734, "global_step": 238155, "epoch": 1968} {"train_loss": -42.46108627319336, "global_step": 238156, "epoch": 1968} {"train_loss": -42.68212890625, "global_step": 238157, "epoch": 1968} {"train_loss": -42.663421630859375, "global_step": 238158, "epoch": 1968} {"train_loss": -42.94700241088867, "global_step": 238159, "epoch": 1968} {"train_loss": -42.05059814453125, "global_step": 238160, "epoch": 1968} {"train_loss": -41.8995475769043, "global_step": 238161, "epoch": 1968} {"train_loss": -42.93566131591797, "global_step": 238162, "epoch": 1968} {"train_loss": -41.97699737548828, "global_step": 238163, "epoch": 1968} {"train_loss": -42.37146759033203, "global_step": 238164, "epoch": 1968} {"train_loss": -43.1331672668457, "global_step": 238165, "epoch": 1968} {"train_loss": -42.516666412353516, "global_step": 238166, "epoch": 1968} {"train_loss": -41.6875114440918, "global_step": 238167, "epoch": 1968} {"train_loss": -42.70100784301758, "global_step": 238168, "epoch": 1968} {"train_loss": -42.769615173339844, "global_step": 238169, "epoch": 1968} {"train_loss": -42.507179260253906, "global_step": 238170, "epoch": 1968} {"train_loss": -41.305450439453125, "global_step": 238171, "epoch": 1968} {"train_loss": -43.19169998168945, "global_step": 238172, "epoch": 1968} {"train_loss": -41.93225860595703, "global_step": 238173, "epoch": 1968} {"train_loss": -42.980770111083984, "global_step": 238174, "epoch": 1968} {"train_loss": -42.24528884887695, "global_step": 238175, "epoch": 1968} {"train_loss": -42.69527053833008, "global_step": 238176, "epoch": 1968} {"train_loss": -42.77676010131836, "global_step": 238177, "epoch": 1968} {"train_loss": -43.00648880004883, "global_step": 238178, "epoch": 1968} {"train_loss": -42.63948059082031, "global_step": 238179, "epoch": 1968} {"train_loss": -42.9914665222168, "global_step": 238180, "epoch": 1968} {"train_loss": -42.62434005737305, "global_step": 238181, "epoch": 1968} {"train_loss": -41.50096893310547, "global_step": 238182, "epoch": 1968} {"train_loss": -43.100013732910156, "global_step": 238183, "epoch": 1968} {"train_loss": -42.992286682128906, "global_step": 238184, "epoch": 1968} {"train_loss": -43.56052780151367, "global_step": 238185, "epoch": 1968} {"train_loss": -41.817562103271484, "global_step": 238186, "epoch": 1968} {"train_loss": -42.12686538696289, "global_step": 238187, "epoch": 1968} {"train_loss": -43.02314376831055, "global_step": 238188, "epoch": 1968} {"train_loss": -43.23945236206055, "global_step": 238189, "epoch": 1968} {"train_loss": -42.729835510253906, "global_step": 238190, "epoch": 1968} {"train_loss": -43.15517807006836, "global_step": 238191, "epoch": 1968} {"train_loss": -42.67397689819336, "global_step": 238192, "epoch": 1968} {"train_loss": -43.47867965698242, "global_step": 238193, "epoch": 1968} {"train_loss": -43.106666564941406, "global_step": 238194, "epoch": 1968} {"train_loss": -43.16542434692383, "global_step": 238195, "epoch": 1968} {"train_loss": -42.773799896240234, "global_step": 238196, "epoch": 1968} {"train_loss": -43.4111328125, "global_step": 238197, "epoch": 1968} {"train_loss": -43.13411331176758, "global_step": 238198, "epoch": 1968} {"train_loss": -42.068572998046875, "global_step": 238199, "epoch": 1968} {"train_loss": -42.856788635253906, "global_step": 238200, "epoch": 1968} {"train_loss": -43.379737854003906, "global_step": 238201, "epoch": 1968} {"train_loss": -43.329681396484375, "global_step": 238202, "epoch": 1968} {"train_loss": -43.24977111816406, "global_step": 238203, "epoch": 1968} {"train_loss": -42.77252197265625, "global_step": 238204, "epoch": 1968} {"train_loss": -43.256568908691406, "global_step": 238205, "epoch": 1968} {"train_loss": -43.8228759765625, "global_step": 238206, "epoch": 1968} {"train_loss": -42.7829704284668, "global_step": 238207, "epoch": 1968} {"train_loss": -42.71866989135742, "global_step": 238208, "epoch": 1968} {"train_loss": -42.72943878173828, "global_step": 238209, "epoch": 1968} {"train_loss": -42.64313507080078, "global_step": 238210, "epoch": 1968} {"train_loss": -42.92539978027344, "global_step": 238211, "epoch": 1968} {"train_loss": -42.24287796020508, "global_step": 238212, "epoch": 1968} {"train_loss": -41.98529052734375, "global_step": 238213, "epoch": 1968} {"train_loss": -42.71001434326172, "global_step": 238214, "epoch": 1968} {"train_loss": -43.39225387573242, "global_step": 238215, "epoch": 1968} {"train_loss": -43.76838302612305, "global_step": 238216, "epoch": 1968} {"train_loss": -42.69989013671875, "global_step": 238217, "epoch": 1968} {"train_loss": -42.53681564331055, "global_step": 238218, "epoch": 1968} {"train_loss": -42.9693717956543, "global_step": 238219, "epoch": 1968} {"train_loss": -41.54744338989258, "global_step": 238220, "epoch": 1968} {"train_loss": -42.0161018371582, "global_step": 238221, "epoch": 1968} {"train_loss": -42.31901931762695, "global_step": 238222, "epoch": 1968} {"train_loss": -42.43549346923828, "global_step": 238223, "epoch": 1968} {"train_loss": -42.715885162353516, "global_step": 238224, "epoch": 1968} {"train_loss": -42.29452133178711, "global_step": 238225, "epoch": 1968} {"train_loss": -42.241249084472656, "global_step": 238226, "epoch": 1968} {"train_loss": -39.42201614379883, "global_step": 238227, "epoch": 1968} {"train_loss": -39.458858489990234, "global_step": 238228, "epoch": 1968} {"train_loss": -41.32217788696289, "global_step": 238229, "epoch": 1968} {"train_loss": -42.781124114990234, "global_step": 238230, "epoch": 1968} {"train_loss": -40.202125549316406, "global_step": 238231, "epoch": 1968} {"train_loss": -41.5616569519043, "global_step": 238232, "epoch": 1968} {"train_loss": -42.637847900390625, "global_step": 238233, "epoch": 1968} {"train_loss": -41.97791290283203, "global_step": 238234, "epoch": 1968} {"train_loss": -43.093894958496094, "global_step": 238235, "epoch": 1968} {"train_loss": -42.36662673950195, "global_step": 238236, "epoch": 1968} {"train_loss": -42.459999084472656, "global_step": 238237, "epoch": 1968} {"train_loss": -42.69074630737305, "global_step": 238238, "epoch": 1968} {"train_loss": -43.287803649902344, "global_step": 238239, "epoch": 1968} {"train_loss": -42.50706100463867, "global_step": 238240, "epoch": 1968} {"train_loss": -42.96964645385742, "global_step": 238241, "epoch": 1968} {"train_loss": -42.72605514526367, "global_step": 238242, "epoch": 1968} {"train_loss": -43.37945556640625, "global_step": 238243, "epoch": 1968} {"train_loss": -42.917781829833984, "global_step": 238244, "epoch": 1968} {"train_loss": -42.244449615478516, "global_step": 238245, "epoch": 1968} {"train_loss": -41.57662582397461, "global_step": 238246, "epoch": 1968} {"train_loss": -42.68620681762695, "global_step": 238247, "epoch": 1968} {"train_loss": -42.27610857624653, "global_step": 238248, "epoch": 1968, "val_loss": 2616750.25} {"train_loss": -42.76384353637695, "global_step": 238249, "epoch": 1969} {"train_loss": -42.9007453918457, "global_step": 238250, "epoch": 1969} {"train_loss": -43.07469177246094, "global_step": 238251, "epoch": 1969} {"train_loss": -43.049774169921875, "global_step": 238252, "epoch": 1969} {"train_loss": -43.2965202331543, "global_step": 238253, "epoch": 1969} {"train_loss": -42.11014175415039, "global_step": 238254, "epoch": 1969} {"train_loss": -42.870113372802734, "global_step": 238255, "epoch": 1969} {"train_loss": -42.54990768432617, "global_step": 238256, "epoch": 1969} {"train_loss": -42.99091720581055, "global_step": 238257, "epoch": 1969} {"train_loss": -42.541114807128906, "global_step": 238258, "epoch": 1969} {"train_loss": -43.439083099365234, "global_step": 238259, "epoch": 1969} {"train_loss": -43.348262786865234, "global_step": 238260, "epoch": 1969} {"train_loss": -42.796958923339844, "global_step": 238261, "epoch": 1969} {"train_loss": -43.08388900756836, "global_step": 238262, "epoch": 1969} {"train_loss": -42.98389434814453, "global_step": 238263, "epoch": 1969} {"train_loss": -43.5310173034668, "global_step": 238264, "epoch": 1969} {"train_loss": -42.98341751098633, "global_step": 238265, "epoch": 1969} {"train_loss": -41.69361114501953, "global_step": 238266, "epoch": 1969} {"train_loss": -43.66118240356445, "global_step": 238267, "epoch": 1969} {"train_loss": -43.24467849731445, "global_step": 238268, "epoch": 1969} {"train_loss": -42.82143783569336, "global_step": 238269, "epoch": 1969} {"train_loss": -43.16959762573242, "global_step": 238270, "epoch": 1969} {"train_loss": -43.611454010009766, "global_step": 238271, "epoch": 1969} {"train_loss": -43.155357360839844, "global_step": 238272, "epoch": 1969} {"train_loss": -42.98956298828125, "global_step": 238273, "epoch": 1969} {"train_loss": -43.21645736694336, "global_step": 238274, "epoch": 1969} {"train_loss": -43.76937484741211, "global_step": 238275, "epoch": 1969} {"train_loss": -42.52553176879883, "global_step": 238276, "epoch": 1969} {"train_loss": -41.99006271362305, "global_step": 238277, "epoch": 1969} {"train_loss": -40.5971794128418, "global_step": 238278, "epoch": 1969} {"train_loss": -40.69480514526367, "global_step": 238279, "epoch": 1969} {"train_loss": -38.46645736694336, "global_step": 238280, "epoch": 1969} {"train_loss": -41.78337860107422, "global_step": 238281, "epoch": 1969} {"train_loss": -42.654598236083984, "global_step": 238282, "epoch": 1969} {"train_loss": -40.39689254760742, "global_step": 238283, "epoch": 1969} {"train_loss": -37.84037399291992, "global_step": 238284, "epoch": 1969} {"train_loss": -40.92428207397461, "global_step": 238285, "epoch": 1969} {"train_loss": -41.101173400878906, "global_step": 238286, "epoch": 1969} {"train_loss": -38.285465240478516, "global_step": 238287, "epoch": 1969} {"train_loss": -39.378883361816406, "global_step": 238288, "epoch": 1969} {"train_loss": -37.84949493408203, "global_step": 238289, "epoch": 1969} {"train_loss": -40.25934982299805, "global_step": 238290, "epoch": 1969} {"train_loss": -39.66452407836914, "global_step": 238291, "epoch": 1969} {"train_loss": -39.021724700927734, "global_step": 238292, "epoch": 1969} {"train_loss": -41.89496612548828, "global_step": 238293, "epoch": 1969} {"train_loss": -40.352195739746094, "global_step": 238294, "epoch": 1969} {"train_loss": -42.48666000366211, "global_step": 238295, "epoch": 1969} {"train_loss": -39.958709716796875, "global_step": 238296, "epoch": 1969} {"train_loss": -41.10152053833008, "global_step": 238297, "epoch": 1969} {"train_loss": -41.342689514160156, "global_step": 238298, "epoch": 1969} {"train_loss": -42.350440979003906, "global_step": 238299, "epoch": 1969} {"train_loss": -41.53306198120117, "global_step": 238300, "epoch": 1969} {"train_loss": -41.873104095458984, "global_step": 238301, "epoch": 1969} {"train_loss": -42.02885055541992, "global_step": 238302, "epoch": 1969} {"train_loss": -42.196556091308594, "global_step": 238303, "epoch": 1969} {"train_loss": -42.24363327026367, "global_step": 238304, "epoch": 1969} {"train_loss": -42.47951889038086, "global_step": 238305, "epoch": 1969} {"train_loss": -42.77534103393555, "global_step": 238306, "epoch": 1969} {"train_loss": -42.37367630004883, "global_step": 238307, "epoch": 1969} {"train_loss": -40.4832878112793, "global_step": 238308, "epoch": 1969} {"train_loss": -40.6558952331543, "global_step": 238309, "epoch": 1969} {"train_loss": -41.656761169433594, "global_step": 238310, "epoch": 1969} {"train_loss": -42.78702163696289, "global_step": 238311, "epoch": 1969} {"train_loss": -41.75399398803711, "global_step": 238312, "epoch": 1969} {"train_loss": -43.062965393066406, "global_step": 238313, "epoch": 1969} {"train_loss": -42.648345947265625, "global_step": 238314, "epoch": 1969} {"train_loss": -42.88727951049805, "global_step": 238315, "epoch": 1969} {"train_loss": -42.39065170288086, "global_step": 238316, "epoch": 1969} {"train_loss": -42.76063537597656, "global_step": 238317, "epoch": 1969} {"train_loss": -42.75048065185547, "global_step": 238318, "epoch": 1969} {"train_loss": -42.20246887207031, "global_step": 238319, "epoch": 1969} {"train_loss": -43.40956115722656, "global_step": 238320, "epoch": 1969} {"train_loss": -42.47335433959961, "global_step": 238321, "epoch": 1969} {"train_loss": -42.87765121459961, "global_step": 238322, "epoch": 1969} {"train_loss": -42.345375061035156, "global_step": 238323, "epoch": 1969} {"train_loss": -43.11613845825195, "global_step": 238324, "epoch": 1969} {"train_loss": -42.71799087524414, "global_step": 238325, "epoch": 1969} {"train_loss": -43.34324264526367, "global_step": 238326, "epoch": 1969} {"train_loss": -42.56230545043945, "global_step": 238327, "epoch": 1969} {"train_loss": -42.77798080444336, "global_step": 238328, "epoch": 1969} {"train_loss": -41.983455657958984, "global_step": 238329, "epoch": 1969} {"train_loss": -42.03920364379883, "global_step": 238330, "epoch": 1969} {"train_loss": -43.46052169799805, "global_step": 238331, "epoch": 1969} {"train_loss": -42.957489013671875, "global_step": 238332, "epoch": 1969} {"train_loss": -43.02006530761719, "global_step": 238333, "epoch": 1969} {"train_loss": -42.333160400390625, "global_step": 238334, "epoch": 1969} {"train_loss": -42.4872932434082, "global_step": 238335, "epoch": 1969} {"train_loss": -43.287471771240234, "global_step": 238336, "epoch": 1969} {"train_loss": -42.72052764892578, "global_step": 238337, "epoch": 1969} {"train_loss": -42.82282257080078, "global_step": 238338, "epoch": 1969} {"train_loss": -43.246002197265625, "global_step": 238339, "epoch": 1969} {"train_loss": -43.37147903442383, "global_step": 238340, "epoch": 1969} {"train_loss": -42.31476593017578, "global_step": 238341, "epoch": 1969} {"train_loss": -42.9450798034668, "global_step": 238342, "epoch": 1969} {"train_loss": -43.16168212890625, "global_step": 238343, "epoch": 1969} {"train_loss": -43.307769775390625, "global_step": 238344, "epoch": 1969} {"train_loss": -43.137451171875, "global_step": 238345, "epoch": 1969} {"train_loss": -42.89976119995117, "global_step": 238346, "epoch": 1969} {"train_loss": -43.1075439453125, "global_step": 238347, "epoch": 1969} {"train_loss": -43.44807815551758, "global_step": 238348, "epoch": 1969} {"train_loss": -43.292701721191406, "global_step": 238349, "epoch": 1969} {"train_loss": -43.92253875732422, "global_step": 238350, "epoch": 1969} {"train_loss": -43.390724182128906, "global_step": 238351, "epoch": 1969} {"train_loss": -42.16048812866211, "global_step": 238352, "epoch": 1969} {"train_loss": -42.97311019897461, "global_step": 238353, "epoch": 1969} {"train_loss": -42.999813079833984, "global_step": 238354, "epoch": 1969} {"train_loss": -41.256717681884766, "global_step": 238355, "epoch": 1969} {"train_loss": -42.65536117553711, "global_step": 238356, "epoch": 1969} {"train_loss": -43.02974319458008, "global_step": 238357, "epoch": 1969} {"train_loss": -42.586368560791016, "global_step": 238358, "epoch": 1969} {"train_loss": -43.0984001159668, "global_step": 238359, "epoch": 1969} {"train_loss": -43.15683364868164, "global_step": 238360, "epoch": 1969} {"train_loss": -41.90433883666992, "global_step": 238361, "epoch": 1969} {"train_loss": -41.970909118652344, "global_step": 238362, "epoch": 1969} {"train_loss": -43.0263671875, "global_step": 238363, "epoch": 1969} {"train_loss": -43.72694778442383, "global_step": 238364, "epoch": 1969} {"train_loss": -42.701393127441406, "global_step": 238365, "epoch": 1969} {"train_loss": -41.2894401550293, "global_step": 238366, "epoch": 1969} {"train_loss": -40.37177658081055, "global_step": 238367, "epoch": 1969} {"train_loss": -42.028072357177734, "global_step": 238368, "epoch": 1969} {"train_loss": -42.26491073734504, "global_step": 238369, "epoch": 1969, "val_loss": 2703124.0} {"train_loss": -39.26556396484375, "global_step": 238370, "epoch": 1970} {"train_loss": -41.40094757080078, "global_step": 238371, "epoch": 1970} {"train_loss": -37.345523834228516, "global_step": 238372, "epoch": 1970} {"train_loss": -38.668453216552734, "global_step": 238373, "epoch": 1970} {"train_loss": -36.55351638793945, "global_step": 238374, "epoch": 1970} {"train_loss": -38.80537796020508, "global_step": 238375, "epoch": 1970} {"train_loss": -39.92884826660156, "global_step": 238376, "epoch": 1970} {"train_loss": -38.90385055541992, "global_step": 238377, "epoch": 1970} {"train_loss": -42.076019287109375, "global_step": 238378, "epoch": 1970} {"train_loss": -38.481781005859375, "global_step": 238379, "epoch": 1970} {"train_loss": -40.6304817199707, "global_step": 238380, "epoch": 1970} {"train_loss": -37.91086959838867, "global_step": 238381, "epoch": 1970} {"train_loss": -39.19404220581055, "global_step": 238382, "epoch": 1970} {"train_loss": -41.27777862548828, "global_step": 238383, "epoch": 1970} {"train_loss": -38.455810546875, "global_step": 238384, "epoch": 1970} {"train_loss": -41.5550651550293, "global_step": 238385, "epoch": 1970} {"train_loss": -38.10255813598633, "global_step": 238386, "epoch": 1970} {"train_loss": -41.5622673034668, "global_step": 238387, "epoch": 1970} {"train_loss": -39.59504318237305, "global_step": 238388, "epoch": 1970} {"train_loss": -40.771507263183594, "global_step": 238389, "epoch": 1970} {"train_loss": -41.545135498046875, "global_step": 238390, "epoch": 1970} {"train_loss": -40.565608978271484, "global_step": 238391, "epoch": 1970} {"train_loss": -42.38570022583008, "global_step": 238392, "epoch": 1970} {"train_loss": -39.78940200805664, "global_step": 238393, "epoch": 1970} {"train_loss": -41.71096420288086, "global_step": 238394, "epoch": 1970} {"train_loss": -41.24116897583008, "global_step": 238395, "epoch": 1970} {"train_loss": -40.408756256103516, "global_step": 238396, "epoch": 1970} {"train_loss": -40.6102294921875, "global_step": 238397, "epoch": 1970} {"train_loss": -41.67475128173828, "global_step": 238398, "epoch": 1970} {"train_loss": -41.85004806518555, "global_step": 238399, "epoch": 1970} {"train_loss": -41.147212982177734, "global_step": 238400, "epoch": 1970} {"train_loss": -42.00244903564453, "global_step": 238401, "epoch": 1970} {"train_loss": -42.46151351928711, "global_step": 238402, "epoch": 1970} {"train_loss": -41.87407302856445, "global_step": 238403, "epoch": 1970} {"train_loss": -42.131954193115234, "global_step": 238404, "epoch": 1970} {"train_loss": -42.46382522583008, "global_step": 238405, "epoch": 1970} {"train_loss": -42.443050384521484, "global_step": 238406, "epoch": 1970} {"train_loss": -43.27471923828125, "global_step": 238407, "epoch": 1970} {"train_loss": -42.50844955444336, "global_step": 238408, "epoch": 1970} {"train_loss": -42.652610778808594, "global_step": 238409, "epoch": 1970} {"train_loss": -42.557064056396484, "global_step": 238410, "epoch": 1970} {"train_loss": -43.421688079833984, "global_step": 238411, "epoch": 1970} {"train_loss": -42.1572151184082, "global_step": 238412, "epoch": 1970} {"train_loss": -43.16839599609375, "global_step": 238413, "epoch": 1970} {"train_loss": -42.77126693725586, "global_step": 238414, "epoch": 1970} {"train_loss": -43.11940002441406, "global_step": 238415, "epoch": 1970} {"train_loss": -43.162227630615234, "global_step": 238416, "epoch": 1970} {"train_loss": -43.23334884643555, "global_step": 238417, "epoch": 1970} {"train_loss": -43.72993087768555, "global_step": 238418, "epoch": 1970} {"train_loss": -43.626312255859375, "global_step": 238419, "epoch": 1970} {"train_loss": -42.91176986694336, "global_step": 238420, "epoch": 1970} {"train_loss": -43.63249588012695, "global_step": 238421, "epoch": 1970} {"train_loss": -43.42767333984375, "global_step": 238422, "epoch": 1970} {"train_loss": -42.890926361083984, "global_step": 238423, "epoch": 1970} {"train_loss": -43.7210693359375, "global_step": 238424, "epoch": 1970} {"train_loss": -43.661800384521484, "global_step": 238425, "epoch": 1970} {"train_loss": -43.599220275878906, "global_step": 238426, "epoch": 1970} {"train_loss": -43.63767623901367, "global_step": 238427, "epoch": 1970} {"train_loss": -43.5927619934082, "global_step": 238428, "epoch": 1970} {"train_loss": -43.593021392822266, "global_step": 238429, "epoch": 1970} {"train_loss": -43.419921875, "global_step": 238430, "epoch": 1970} {"train_loss": -43.62451934814453, "global_step": 238431, "epoch": 1970} {"train_loss": -43.73421859741211, "global_step": 238432, "epoch": 1970} {"train_loss": -43.48870086669922, "global_step": 238433, "epoch": 1970} {"train_loss": -43.537960052490234, "global_step": 238434, "epoch": 1970} {"train_loss": -43.188262939453125, "global_step": 238435, "epoch": 1970} {"train_loss": -43.36977767944336, "global_step": 238436, "epoch": 1970} {"train_loss": -43.25770950317383, "global_step": 238437, "epoch": 1970} {"train_loss": -42.9456672668457, "global_step": 238438, "epoch": 1970} {"train_loss": -43.42231369018555, "global_step": 238439, "epoch": 1970} {"train_loss": -43.48586654663086, "global_step": 238440, "epoch": 1970} {"train_loss": -43.3382682800293, "global_step": 238441, "epoch": 1970} {"train_loss": -43.70159912109375, "global_step": 238442, "epoch": 1970} {"train_loss": -43.02981185913086, "global_step": 238443, "epoch": 1970} {"train_loss": -43.04536056518555, "global_step": 238444, "epoch": 1970} {"train_loss": -43.118690490722656, "global_step": 238445, "epoch": 1970} {"train_loss": -42.94486618041992, "global_step": 238446, "epoch": 1970} {"train_loss": -43.34931182861328, "global_step": 238447, "epoch": 1970} {"train_loss": -42.35871505737305, "global_step": 238448, "epoch": 1970} {"train_loss": -42.661319732666016, "global_step": 238449, "epoch": 1970} {"train_loss": -42.8316650390625, "global_step": 238450, "epoch": 1970} {"train_loss": -43.241172790527344, "global_step": 238451, "epoch": 1970} {"train_loss": -41.545501708984375, "global_step": 238452, "epoch": 1970} {"train_loss": -41.57479476928711, "global_step": 238453, "epoch": 1970} {"train_loss": -40.87770462036133, "global_step": 238454, "epoch": 1970} {"train_loss": -41.09487533569336, "global_step": 238455, "epoch": 1970} {"train_loss": -42.03254699707031, "global_step": 238456, "epoch": 1970} {"train_loss": -42.79829025268555, "global_step": 238457, "epoch": 1970} {"train_loss": -41.88166427612305, "global_step": 238458, "epoch": 1970} {"train_loss": -42.29587936401367, "global_step": 238459, "epoch": 1970} {"train_loss": -42.54351806640625, "global_step": 238460, "epoch": 1970} {"train_loss": -43.308746337890625, "global_step": 238461, "epoch": 1970} {"train_loss": -42.670875549316406, "global_step": 238462, "epoch": 1970} {"train_loss": -41.7183952331543, "global_step": 238463, "epoch": 1970} {"train_loss": -42.095821380615234, "global_step": 238464, "epoch": 1970} {"train_loss": -43.58422088623047, "global_step": 238465, "epoch": 1970} {"train_loss": -41.69279479980469, "global_step": 238466, "epoch": 1970} {"train_loss": -40.33463668823242, "global_step": 238467, "epoch": 1970} {"train_loss": -41.224334716796875, "global_step": 238468, "epoch": 1970} {"train_loss": -43.16190719604492, "global_step": 238469, "epoch": 1970} {"train_loss": -40.80649948120117, "global_step": 238470, "epoch": 1970} {"train_loss": -41.85553741455078, "global_step": 238471, "epoch": 1970} {"train_loss": -42.07450485229492, "global_step": 238472, "epoch": 1970} {"train_loss": -40.99319076538086, "global_step": 238473, "epoch": 1970} {"train_loss": -41.11903762817383, "global_step": 238474, "epoch": 1970} {"train_loss": -42.36159133911133, "global_step": 238475, "epoch": 1970} {"train_loss": -42.341033935546875, "global_step": 238476, "epoch": 1970} {"train_loss": -42.15705108642578, "global_step": 238477, "epoch": 1970} {"train_loss": -42.20710372924805, "global_step": 238478, "epoch": 1970} {"train_loss": -41.77793884277344, "global_step": 238479, "epoch": 1970} {"train_loss": -42.41096115112305, "global_step": 238480, "epoch": 1970} {"train_loss": -41.90150833129883, "global_step": 238481, "epoch": 1970} {"train_loss": -42.75861358642578, "global_step": 238482, "epoch": 1970} {"train_loss": -42.4663200378418, "global_step": 238483, "epoch": 1970} {"train_loss": -42.33921432495117, "global_step": 238484, "epoch": 1970} {"train_loss": -41.229671478271484, "global_step": 238485, "epoch": 1970} {"train_loss": -41.663673400878906, "global_step": 238486, "epoch": 1970} {"train_loss": -42.2214469909668, "global_step": 238487, "epoch": 1970} {"train_loss": -42.50613021850586, "global_step": 238488, "epoch": 1970} {"train_loss": -41.0882568359375, "global_step": 238489, "epoch": 1970} {"train_loss": -41.95383806465086, "global_step": 238490, "epoch": 1970, "val_loss": 2630455.0} {"train_loss": -42.17013168334961, "global_step": 238491, "epoch": 1971} {"train_loss": -42.73933792114258, "global_step": 238492, "epoch": 1971} {"train_loss": -40.635128021240234, "global_step": 238493, "epoch": 1971} {"train_loss": -41.69617462158203, "global_step": 238494, "epoch": 1971} {"train_loss": -42.76344299316406, "global_step": 238495, "epoch": 1971} {"train_loss": -41.41988754272461, "global_step": 238496, "epoch": 1971} {"train_loss": -42.5712890625, "global_step": 238497, "epoch": 1971} {"train_loss": -41.58348083496094, "global_step": 238498, "epoch": 1971} {"train_loss": -41.684913635253906, "global_step": 238499, "epoch": 1971} {"train_loss": -41.706966400146484, "global_step": 238500, "epoch": 1971} {"train_loss": -40.958580017089844, "global_step": 238501, "epoch": 1971} {"train_loss": -41.88651657104492, "global_step": 238502, "epoch": 1971} {"train_loss": -41.096588134765625, "global_step": 238503, "epoch": 1971} {"train_loss": -41.57286071777344, "global_step": 238504, "epoch": 1971} {"train_loss": -42.32243728637695, "global_step": 238505, "epoch": 1971} {"train_loss": -41.98032760620117, "global_step": 238506, "epoch": 1971} {"train_loss": -41.9550666809082, "global_step": 238507, "epoch": 1971} {"train_loss": -42.80141830444336, "global_step": 238508, "epoch": 1971} {"train_loss": -42.630332946777344, "global_step": 238509, "epoch": 1971} {"train_loss": -42.32611846923828, "global_step": 238510, "epoch": 1971} {"train_loss": -42.20821762084961, "global_step": 238511, "epoch": 1971} {"train_loss": -42.74123764038086, "global_step": 238512, "epoch": 1971} {"train_loss": -42.6974983215332, "global_step": 238513, "epoch": 1971} {"train_loss": -43.3310432434082, "global_step": 238514, "epoch": 1971} {"train_loss": -42.27801513671875, "global_step": 238515, "epoch": 1971} {"train_loss": -43.12617874145508, "global_step": 238516, "epoch": 1971} {"train_loss": -42.725337982177734, "global_step": 238517, "epoch": 1971} {"train_loss": -43.009178161621094, "global_step": 238518, "epoch": 1971} {"train_loss": -43.37434005737305, "global_step": 238519, "epoch": 1971} {"train_loss": -43.2766227722168, "global_step": 238520, "epoch": 1971} {"train_loss": -43.311241149902344, "global_step": 238521, "epoch": 1971} {"train_loss": -43.030452728271484, "global_step": 238522, "epoch": 1971} {"train_loss": -43.634334564208984, "global_step": 238523, "epoch": 1971} {"train_loss": -43.67020034790039, "global_step": 238524, "epoch": 1971} {"train_loss": -43.600337982177734, "global_step": 238525, "epoch": 1971} {"train_loss": -43.306549072265625, "global_step": 238526, "epoch": 1971} {"train_loss": -43.658687591552734, "global_step": 238527, "epoch": 1971} {"train_loss": -43.87821578979492, "global_step": 238528, "epoch": 1971} {"train_loss": -43.71548080444336, "global_step": 238529, "epoch": 1971} {"train_loss": -43.99203109741211, "global_step": 238530, "epoch": 1971} {"train_loss": -43.86017608642578, "global_step": 238531, "epoch": 1971} {"train_loss": -43.14604949951172, "global_step": 238532, "epoch": 1971} {"train_loss": -43.639122009277344, "global_step": 238533, "epoch": 1971} {"train_loss": -43.87457275390625, "global_step": 238534, "epoch": 1971} {"train_loss": -44.04795455932617, "global_step": 238535, "epoch": 1971} {"train_loss": -43.84676742553711, "global_step": 238536, "epoch": 1971} {"train_loss": -43.812198638916016, "global_step": 238537, "epoch": 1971} {"train_loss": -44.214935302734375, "global_step": 238538, "epoch": 1971} {"train_loss": -43.954227447509766, "global_step": 238539, "epoch": 1971} {"train_loss": -44.204811096191406, "global_step": 238540, "epoch": 1971} {"train_loss": -43.5924186706543, "global_step": 238541, "epoch": 1971} {"train_loss": -44.1912956237793, "global_step": 238542, "epoch": 1971} {"train_loss": -43.76412582397461, "global_step": 238543, "epoch": 1971} {"train_loss": -44.281044006347656, "global_step": 238544, "epoch": 1971} {"train_loss": -43.99698257446289, "global_step": 238545, "epoch": 1971} {"train_loss": -44.17988967895508, "global_step": 238546, "epoch": 1971} {"train_loss": -43.97469711303711, "global_step": 238547, "epoch": 1971} {"train_loss": -44.45552062988281, "global_step": 238548, "epoch": 1971} {"train_loss": -43.798980712890625, "global_step": 238549, "epoch": 1971} {"train_loss": -43.84882736206055, "global_step": 238550, "epoch": 1971} {"train_loss": -44.289100646972656, "global_step": 238551, "epoch": 1971} {"train_loss": -44.331417083740234, "global_step": 238552, "epoch": 1971} {"train_loss": -44.349464416503906, "global_step": 238553, "epoch": 1971} {"train_loss": -44.478363037109375, "global_step": 238554, "epoch": 1971} {"train_loss": -44.043495178222656, "global_step": 238555, "epoch": 1971} {"train_loss": -43.956966400146484, "global_step": 238556, "epoch": 1971} {"train_loss": -43.83982467651367, "global_step": 238557, "epoch": 1971} {"train_loss": -43.73971176147461, "global_step": 238558, "epoch": 1971} {"train_loss": -44.41559982299805, "global_step": 238559, "epoch": 1971} {"train_loss": -44.02144241333008, "global_step": 238560, "epoch": 1971} {"train_loss": -44.50148010253906, "global_step": 238561, "epoch": 1971} {"train_loss": -43.796260833740234, "global_step": 238562, "epoch": 1971} {"train_loss": -42.50706100463867, "global_step": 238563, "epoch": 1971} {"train_loss": -43.6004753112793, "global_step": 238564, "epoch": 1971} {"train_loss": -44.2438850402832, "global_step": 238565, "epoch": 1971} {"train_loss": -44.44477462768555, "global_step": 238566, "epoch": 1971} {"train_loss": -44.161354064941406, "global_step": 238567, "epoch": 1971} {"train_loss": -42.93193435668945, "global_step": 238568, "epoch": 1971} {"train_loss": -41.42205810546875, "global_step": 238569, "epoch": 1971} {"train_loss": -42.26103591918945, "global_step": 238570, "epoch": 1971} {"train_loss": -42.39988708496094, "global_step": 238571, "epoch": 1971} {"train_loss": -43.119651794433594, "global_step": 238572, "epoch": 1971} {"train_loss": -44.0810546875, "global_step": 238573, "epoch": 1971} {"train_loss": -44.03505325317383, "global_step": 238574, "epoch": 1971} {"train_loss": -43.2809944152832, "global_step": 238575, "epoch": 1971} {"train_loss": -43.95803451538086, "global_step": 238576, "epoch": 1971} {"train_loss": -43.55768966674805, "global_step": 238577, "epoch": 1971} {"train_loss": -42.800254821777344, "global_step": 238578, "epoch": 1971} {"train_loss": -42.054054260253906, "global_step": 238579, "epoch": 1971} {"train_loss": -42.22266387939453, "global_step": 238580, "epoch": 1971} {"train_loss": -42.12276840209961, "global_step": 238581, "epoch": 1971} {"train_loss": -41.73828125, "global_step": 238582, "epoch": 1971} {"train_loss": -42.49784851074219, "global_step": 238583, "epoch": 1971} {"train_loss": -42.9539909362793, "global_step": 238584, "epoch": 1971} {"train_loss": -43.201412200927734, "global_step": 238585, "epoch": 1971} {"train_loss": -42.17433547973633, "global_step": 238586, "epoch": 1971} {"train_loss": -40.131385803222656, "global_step": 238587, "epoch": 1971} {"train_loss": -40.05987548828125, "global_step": 238588, "epoch": 1971} {"train_loss": -42.257076263427734, "global_step": 238589, "epoch": 1971} {"train_loss": -41.78352355957031, "global_step": 238590, "epoch": 1971} {"train_loss": -40.90595626831055, "global_step": 238591, "epoch": 1971} {"train_loss": -40.7000846862793, "global_step": 238592, "epoch": 1971} {"train_loss": -41.79341506958008, "global_step": 238593, "epoch": 1971} {"train_loss": -42.50927734375, "global_step": 238594, "epoch": 1971} {"train_loss": -41.51523208618164, "global_step": 238595, "epoch": 1971} {"train_loss": -41.3133659362793, "global_step": 238596, "epoch": 1971} {"train_loss": -42.90737533569336, "global_step": 238597, "epoch": 1971} {"train_loss": -42.75598907470703, "global_step": 238598, "epoch": 1971} {"train_loss": -41.859718322753906, "global_step": 238599, "epoch": 1971} {"train_loss": -42.37938690185547, "global_step": 238600, "epoch": 1971} {"train_loss": -42.895381927490234, "global_step": 238601, "epoch": 1971} {"train_loss": -42.63719940185547, "global_step": 238602, "epoch": 1971} {"train_loss": -41.21677780151367, "global_step": 238603, "epoch": 1971} {"train_loss": -41.13176345825195, "global_step": 238604, "epoch": 1971} {"train_loss": -41.324195861816406, "global_step": 238605, "epoch": 1971} {"train_loss": -43.40623092651367, "global_step": 238606, "epoch": 1971} {"train_loss": -41.946529388427734, "global_step": 238607, "epoch": 1971} {"train_loss": -42.708160400390625, "global_step": 238608, "epoch": 1971} {"train_loss": -43.37260818481445, "global_step": 238609, "epoch": 1971} {"train_loss": -41.37159729003906, "global_step": 238610, "epoch": 1971} {"train_loss": -42.891280056031285, "global_step": 238611, "epoch": 1971, "val_loss": 2570128.0} {"train_loss": -42.01278305053711, "global_step": 238612, "epoch": 1972} {"train_loss": -42.01212692260742, "global_step": 238613, "epoch": 1972} {"train_loss": -42.7251091003418, "global_step": 238614, "epoch": 1972} {"train_loss": -41.85991287231445, "global_step": 238615, "epoch": 1972} {"train_loss": -42.82157897949219, "global_step": 238616, "epoch": 1972} {"train_loss": -41.42047119140625, "global_step": 238617, "epoch": 1972} {"train_loss": -41.79695510864258, "global_step": 238618, "epoch": 1972} {"train_loss": -42.559078216552734, "global_step": 238619, "epoch": 1972} {"train_loss": -41.283241271972656, "global_step": 238620, "epoch": 1972} {"train_loss": -42.21280288696289, "global_step": 238621, "epoch": 1972} {"train_loss": -41.5051383972168, "global_step": 238622, "epoch": 1972} {"train_loss": -42.86141586303711, "global_step": 238623, "epoch": 1972} {"train_loss": -41.15224075317383, "global_step": 238624, "epoch": 1972} {"train_loss": -42.08396530151367, "global_step": 238625, "epoch": 1972} {"train_loss": -42.106563568115234, "global_step": 238626, "epoch": 1972} {"train_loss": -42.26802444458008, "global_step": 238627, "epoch": 1972} {"train_loss": -40.99677276611328, "global_step": 238628, "epoch": 1972} {"train_loss": -40.653560638427734, "global_step": 238629, "epoch": 1972} {"train_loss": -42.7789192199707, "global_step": 238630, "epoch": 1972} {"train_loss": -41.92112350463867, "global_step": 238631, "epoch": 1972} {"train_loss": -41.23789596557617, "global_step": 238632, "epoch": 1972} {"train_loss": -41.66496276855469, "global_step": 238633, "epoch": 1972} {"train_loss": -40.20813751220703, "global_step": 238634, "epoch": 1972} {"train_loss": -41.327125549316406, "global_step": 238635, "epoch": 1972} {"train_loss": -39.81245422363281, "global_step": 238636, "epoch": 1972} {"train_loss": -42.33711624145508, "global_step": 238637, "epoch": 1972} {"train_loss": -40.97682571411133, "global_step": 238638, "epoch": 1972} {"train_loss": -42.210506439208984, "global_step": 238639, "epoch": 1972} {"train_loss": -41.72929763793945, "global_step": 238640, "epoch": 1972} {"train_loss": -42.63485336303711, "global_step": 238641, "epoch": 1972} {"train_loss": -42.440208435058594, "global_step": 238642, "epoch": 1972} {"train_loss": -41.57909393310547, "global_step": 238643, "epoch": 1972} {"train_loss": -41.78792190551758, "global_step": 238644, "epoch": 1972} {"train_loss": -42.63199996948242, "global_step": 238645, "epoch": 1972} {"train_loss": -42.46955108642578, "global_step": 238646, "epoch": 1972} {"train_loss": -41.874507904052734, "global_step": 238647, "epoch": 1972} {"train_loss": -42.76771545410156, "global_step": 238648, "epoch": 1972} {"train_loss": -40.741790771484375, "global_step": 238649, "epoch": 1972} {"train_loss": -41.86106491088867, "global_step": 238650, "epoch": 1972} {"train_loss": -41.257625579833984, "global_step": 238651, "epoch": 1972} {"train_loss": -42.449256896972656, "global_step": 238652, "epoch": 1972} {"train_loss": -40.8157958984375, "global_step": 238653, "epoch": 1972} {"train_loss": -42.56687545776367, "global_step": 238654, "epoch": 1972} {"train_loss": -41.219478607177734, "global_step": 238655, "epoch": 1972} {"train_loss": -43.23774337768555, "global_step": 238656, "epoch": 1972} {"train_loss": -42.8064079284668, "global_step": 238657, "epoch": 1972} {"train_loss": -42.796836853027344, "global_step": 238658, "epoch": 1972} {"train_loss": -43.428260803222656, "global_step": 238659, "epoch": 1972} {"train_loss": -42.90663528442383, "global_step": 238660, "epoch": 1972} {"train_loss": -42.595455169677734, "global_step": 238661, "epoch": 1972} {"train_loss": -43.31705856323242, "global_step": 238662, "epoch": 1972} {"train_loss": -42.656829833984375, "global_step": 238663, "epoch": 1972} {"train_loss": -43.48369598388672, "global_step": 238664, "epoch": 1972} {"train_loss": -43.2852668762207, "global_step": 238665, "epoch": 1972} {"train_loss": -43.540618896484375, "global_step": 238666, "epoch": 1972} {"train_loss": -43.4543342590332, "global_step": 238667, "epoch": 1972} {"train_loss": -43.90713119506836, "global_step": 238668, "epoch": 1972} {"train_loss": -42.96112060546875, "global_step": 238669, "epoch": 1972} {"train_loss": -43.856014251708984, "global_step": 238670, "epoch": 1972} {"train_loss": -43.72847366333008, "global_step": 238671, "epoch": 1972} {"train_loss": -43.5886116027832, "global_step": 238672, "epoch": 1972} {"train_loss": -43.67252731323242, "global_step": 238673, "epoch": 1972} {"train_loss": -43.76994705200195, "global_step": 238674, "epoch": 1972} {"train_loss": -42.762237548828125, "global_step": 238675, "epoch": 1972} {"train_loss": -43.81499099731445, "global_step": 238676, "epoch": 1972} {"train_loss": -43.09912109375, "global_step": 238677, "epoch": 1972} {"train_loss": -43.38150405883789, "global_step": 238678, "epoch": 1972} {"train_loss": -43.796207427978516, "global_step": 238679, "epoch": 1972} {"train_loss": -43.688899993896484, "global_step": 238680, "epoch": 1972} {"train_loss": -42.95029830932617, "global_step": 238681, "epoch": 1972} {"train_loss": -43.2764778137207, "global_step": 238682, "epoch": 1972} {"train_loss": -42.164581298828125, "global_step": 238683, "epoch": 1972} {"train_loss": -40.940826416015625, "global_step": 238684, "epoch": 1972} {"train_loss": -42.64004135131836, "global_step": 238685, "epoch": 1972} {"train_loss": -40.50432586669922, "global_step": 238686, "epoch": 1972} {"train_loss": -39.71158218383789, "global_step": 238687, "epoch": 1972} {"train_loss": -42.51945114135742, "global_step": 238688, "epoch": 1972} {"train_loss": -41.865081787109375, "global_step": 238689, "epoch": 1972} {"train_loss": -39.64764404296875, "global_step": 238690, "epoch": 1972} {"train_loss": -41.66313171386719, "global_step": 238691, "epoch": 1972} {"train_loss": -40.79716491699219, "global_step": 238692, "epoch": 1972} {"train_loss": -40.98087692260742, "global_step": 238693, "epoch": 1972} {"train_loss": -41.7702751159668, "global_step": 238694, "epoch": 1972} {"train_loss": -39.995277404785156, "global_step": 238695, "epoch": 1972} {"train_loss": -38.92477035522461, "global_step": 238696, "epoch": 1972} {"train_loss": -41.315547943115234, "global_step": 238697, "epoch": 1972} {"train_loss": -39.48219299316406, "global_step": 238698, "epoch": 1972} {"train_loss": -41.801109313964844, "global_step": 238699, "epoch": 1972} {"train_loss": -40.444488525390625, "global_step": 238700, "epoch": 1972} {"train_loss": -39.20150375366211, "global_step": 238701, "epoch": 1972} {"train_loss": -42.2724723815918, "global_step": 238702, "epoch": 1972} {"train_loss": -38.51106262207031, "global_step": 238703, "epoch": 1972} {"train_loss": -42.051143646240234, "global_step": 238704, "epoch": 1972} {"train_loss": -41.53982162475586, "global_step": 238705, "epoch": 1972} {"train_loss": -40.67414474487305, "global_step": 238706, "epoch": 1972} {"train_loss": -42.80995178222656, "global_step": 238707, "epoch": 1972} {"train_loss": -39.12065505981445, "global_step": 238708, "epoch": 1972} {"train_loss": -41.31600570678711, "global_step": 238709, "epoch": 1972} {"train_loss": -41.0846061706543, "global_step": 238710, "epoch": 1972} {"train_loss": -41.32725524902344, "global_step": 238711, "epoch": 1972} {"train_loss": -41.828826904296875, "global_step": 238712, "epoch": 1972} {"train_loss": -41.05500411987305, "global_step": 238713, "epoch": 1972} {"train_loss": -40.6133918762207, "global_step": 238714, "epoch": 1972} {"train_loss": -41.92484664916992, "global_step": 238715, "epoch": 1972} {"train_loss": -41.984474182128906, "global_step": 238716, "epoch": 1972} {"train_loss": -42.02653503417969, "global_step": 238717, "epoch": 1972} {"train_loss": -38.4119758605957, "global_step": 238718, "epoch": 1972} {"train_loss": -42.7708740234375, "global_step": 238719, "epoch": 1972} {"train_loss": -41.1684455871582, "global_step": 238720, "epoch": 1972} {"train_loss": -41.7405891418457, "global_step": 238721, "epoch": 1972} {"train_loss": -42.199623107910156, "global_step": 238722, "epoch": 1972} {"train_loss": -41.44862747192383, "global_step": 238723, "epoch": 1972} {"train_loss": -42.19025421142578, "global_step": 238724, "epoch": 1972} {"train_loss": -41.15595626831055, "global_step": 238725, "epoch": 1972} {"train_loss": -42.89973831176758, "global_step": 238726, "epoch": 1972} {"train_loss": -42.45305252075195, "global_step": 238727, "epoch": 1972} {"train_loss": -42.989620208740234, "global_step": 238728, "epoch": 1972} {"train_loss": -42.36049270629883, "global_step": 238729, "epoch": 1972} {"train_loss": -42.51839828491211, "global_step": 238730, "epoch": 1972} {"train_loss": -42.599220275878906, "global_step": 238731, "epoch": 1972} {"train_loss": -41.95029238235852, "global_step": 238732, "epoch": 1972, "val_loss": 2573305.0} {"train_loss": -43.33819580078125, "global_step": 238733, "epoch": 1973} {"train_loss": -42.8065071105957, "global_step": 238734, "epoch": 1973} {"train_loss": -42.95465850830078, "global_step": 238735, "epoch": 1973} {"train_loss": -43.43008804321289, "global_step": 238736, "epoch": 1973} {"train_loss": -43.440704345703125, "global_step": 238737, "epoch": 1973} {"train_loss": -43.19679641723633, "global_step": 238738, "epoch": 1973} {"train_loss": -42.97262954711914, "global_step": 238739, "epoch": 1973} {"train_loss": -42.66178512573242, "global_step": 238740, "epoch": 1973} {"train_loss": -42.86730194091797, "global_step": 238741, "epoch": 1973} {"train_loss": -43.475643157958984, "global_step": 238742, "epoch": 1973} {"train_loss": -42.70463180541992, "global_step": 238743, "epoch": 1973} {"train_loss": -43.165714263916016, "global_step": 238744, "epoch": 1973} {"train_loss": -43.74355697631836, "global_step": 238745, "epoch": 1973} {"train_loss": -42.64567184448242, "global_step": 238746, "epoch": 1973} {"train_loss": -43.338619232177734, "global_step": 238747, "epoch": 1973} {"train_loss": -43.462989807128906, "global_step": 238748, "epoch": 1973} {"train_loss": -43.5472412109375, "global_step": 238749, "epoch": 1973} {"train_loss": -43.162410736083984, "global_step": 238750, "epoch": 1973} {"train_loss": -43.50770568847656, "global_step": 238751, "epoch": 1973} {"train_loss": -43.37150955200195, "global_step": 238752, "epoch": 1973} {"train_loss": -43.40861892700195, "global_step": 238753, "epoch": 1973} {"train_loss": -41.60260772705078, "global_step": 238754, "epoch": 1973} {"train_loss": -42.198036193847656, "global_step": 238755, "epoch": 1973} {"train_loss": -43.470314025878906, "global_step": 238756, "epoch": 1973} {"train_loss": -43.60141372680664, "global_step": 238757, "epoch": 1973} {"train_loss": -43.49973678588867, "global_step": 238758, "epoch": 1973} {"train_loss": -42.27548599243164, "global_step": 238759, "epoch": 1973} {"train_loss": -42.29553985595703, "global_step": 238760, "epoch": 1973} {"train_loss": -43.50568389892578, "global_step": 238761, "epoch": 1973} {"train_loss": -43.54153060913086, "global_step": 238762, "epoch": 1973} {"train_loss": -42.11660385131836, "global_step": 238763, "epoch": 1973} {"train_loss": -42.66062545776367, "global_step": 238764, "epoch": 1973} {"train_loss": -43.76182174682617, "global_step": 238765, "epoch": 1973} {"train_loss": -42.739986419677734, "global_step": 238766, "epoch": 1973} {"train_loss": -42.294158935546875, "global_step": 238767, "epoch": 1973} {"train_loss": -42.23244857788086, "global_step": 238768, "epoch": 1973} {"train_loss": -43.48807907104492, "global_step": 238769, "epoch": 1973} {"train_loss": -42.3600959777832, "global_step": 238770, "epoch": 1973} {"train_loss": -41.3336296081543, "global_step": 238771, "epoch": 1973} {"train_loss": -43.04326629638672, "global_step": 238772, "epoch": 1973} {"train_loss": -41.79572677612305, "global_step": 238773, "epoch": 1973} {"train_loss": -41.343482971191406, "global_step": 238774, "epoch": 1973} {"train_loss": -43.2995719909668, "global_step": 238775, "epoch": 1973} {"train_loss": -43.02175521850586, "global_step": 238776, "epoch": 1973} {"train_loss": -42.84245300292969, "global_step": 238777, "epoch": 1973} {"train_loss": -43.57615280151367, "global_step": 238778, "epoch": 1973} {"train_loss": -42.158546447753906, "global_step": 238779, "epoch": 1973} {"train_loss": -41.1104850769043, "global_step": 238780, "epoch": 1973} {"train_loss": -41.73276901245117, "global_step": 238781, "epoch": 1973} {"train_loss": -42.6204719543457, "global_step": 238782, "epoch": 1973} {"train_loss": -43.466835021972656, "global_step": 238783, "epoch": 1973} {"train_loss": -40.30413818359375, "global_step": 238784, "epoch": 1973} {"train_loss": -41.72478485107422, "global_step": 238785, "epoch": 1973} {"train_loss": -43.215309143066406, "global_step": 238786, "epoch": 1973} {"train_loss": -41.01015090942383, "global_step": 238787, "epoch": 1973} {"train_loss": -42.45478439331055, "global_step": 238788, "epoch": 1973} {"train_loss": -43.2211799621582, "global_step": 238789, "epoch": 1973} {"train_loss": -41.40892028808594, "global_step": 238790, "epoch": 1973} {"train_loss": -42.8176155090332, "global_step": 238791, "epoch": 1973} {"train_loss": -41.86823654174805, "global_step": 238792, "epoch": 1973} {"train_loss": -42.54586410522461, "global_step": 238793, "epoch": 1973} {"train_loss": -42.954750061035156, "global_step": 238794, "epoch": 1973} {"train_loss": -36.59316635131836, "global_step": 238795, "epoch": 1973} {"train_loss": -42.52294158935547, "global_step": 238796, "epoch": 1973} {"train_loss": -36.01396560668945, "global_step": 238797, "epoch": 1973} {"train_loss": -40.031917572021484, "global_step": 238798, "epoch": 1973} {"train_loss": -42.4254150390625, "global_step": 238799, "epoch": 1973} {"train_loss": -41.93621063232422, "global_step": 238800, "epoch": 1973} {"train_loss": -40.79009246826172, "global_step": 238801, "epoch": 1973} {"train_loss": -38.664085388183594, "global_step": 238802, "epoch": 1973} {"train_loss": -41.205013275146484, "global_step": 238803, "epoch": 1973} {"train_loss": -33.848854064941406, "global_step": 238804, "epoch": 1973} {"train_loss": -33.701412200927734, "global_step": 238805, "epoch": 1973} {"train_loss": -35.30866622924805, "global_step": 238806, "epoch": 1973} {"train_loss": -39.60247802734375, "global_step": 238807, "epoch": 1973} {"train_loss": -38.87385177612305, "global_step": 238808, "epoch": 1973} {"train_loss": -39.674102783203125, "global_step": 238809, "epoch": 1973} {"train_loss": -35.712093353271484, "global_step": 238810, "epoch": 1973} {"train_loss": -33.880733489990234, "global_step": 238811, "epoch": 1973} {"train_loss": -41.0693473815918, "global_step": 238812, "epoch": 1973} {"train_loss": -39.8438720703125, "global_step": 238813, "epoch": 1973} {"train_loss": -37.6001091003418, "global_step": 238814, "epoch": 1973} {"train_loss": -40.239864349365234, "global_step": 238815, "epoch": 1973} {"train_loss": -41.316707611083984, "global_step": 238816, "epoch": 1973} {"train_loss": -39.81355667114258, "global_step": 238817, "epoch": 1973} {"train_loss": -38.958309173583984, "global_step": 238818, "epoch": 1973} {"train_loss": -36.03654098510742, "global_step": 238819, "epoch": 1973} {"train_loss": -40.8907356262207, "global_step": 238820, "epoch": 1973} {"train_loss": -40.73427963256836, "global_step": 238821, "epoch": 1973} {"train_loss": -39.76664352416992, "global_step": 238822, "epoch": 1973} {"train_loss": -40.215877532958984, "global_step": 238823, "epoch": 1973} {"train_loss": -39.49319076538086, "global_step": 238824, "epoch": 1973} {"train_loss": -39.975486755371094, "global_step": 238825, "epoch": 1973} {"train_loss": -40.927978515625, "global_step": 238826, "epoch": 1973} {"train_loss": -38.63088607788086, "global_step": 238827, "epoch": 1973} {"train_loss": -39.64069747924805, "global_step": 238828, "epoch": 1973} {"train_loss": -39.391693115234375, "global_step": 238829, "epoch": 1973} {"train_loss": -40.6962776184082, "global_step": 238830, "epoch": 1973} {"train_loss": -40.024147033691406, "global_step": 238831, "epoch": 1973} {"train_loss": -38.219329833984375, "global_step": 238832, "epoch": 1973} {"train_loss": -41.88165283203125, "global_step": 238833, "epoch": 1973} {"train_loss": -38.85293197631836, "global_step": 238834, "epoch": 1973} {"train_loss": -39.67833709716797, "global_step": 238835, "epoch": 1973} {"train_loss": -41.17460250854492, "global_step": 238836, "epoch": 1973} {"train_loss": -39.82744216918945, "global_step": 238837, "epoch": 1973} {"train_loss": -39.7926025390625, "global_step": 238838, "epoch": 1973} {"train_loss": -41.48786163330078, "global_step": 238839, "epoch": 1973} {"train_loss": -41.167484283447266, "global_step": 238840, "epoch": 1973} {"train_loss": -39.72405242919922, "global_step": 238841, "epoch": 1973} {"train_loss": -41.885746002197266, "global_step": 238842, "epoch": 1973} {"train_loss": -41.05791091918945, "global_step": 238843, "epoch": 1973} {"train_loss": -41.772090911865234, "global_step": 238844, "epoch": 1973} {"train_loss": -41.27817916870117, "global_step": 238845, "epoch": 1973} {"train_loss": -41.34237289428711, "global_step": 238846, "epoch": 1973} {"train_loss": -40.893341064453125, "global_step": 238847, "epoch": 1973} {"train_loss": -41.73711013793945, "global_step": 238848, "epoch": 1973} {"train_loss": -41.69422912597656, "global_step": 238849, "epoch": 1973} {"train_loss": -42.25215148925781, "global_step": 238850, "epoch": 1973} {"train_loss": -41.08588790893555, "global_step": 238851, "epoch": 1973} {"train_loss": -41.7016716003418, "global_step": 238852, "epoch": 1973} {"train_loss": -41.29037882276803, "global_step": 238853, "epoch": 1973, "val_loss": 2720846.25} {"train_loss": -40.82346725463867, "global_step": 238854, "epoch": 1974} {"train_loss": -42.09312057495117, "global_step": 238855, "epoch": 1974} {"train_loss": -42.15056228637695, "global_step": 238856, "epoch": 1974} {"train_loss": -41.947731018066406, "global_step": 238857, "epoch": 1974} {"train_loss": -41.90827560424805, "global_step": 238858, "epoch": 1974} {"train_loss": -41.830413818359375, "global_step": 238859, "epoch": 1974} {"train_loss": -42.59836196899414, "global_step": 238860, "epoch": 1974} {"train_loss": -40.83327865600586, "global_step": 238861, "epoch": 1974} {"train_loss": -42.28371047973633, "global_step": 238862, "epoch": 1974} {"train_loss": -42.4795036315918, "global_step": 238863, "epoch": 1974} {"train_loss": -41.69694137573242, "global_step": 238864, "epoch": 1974} {"train_loss": -41.895050048828125, "global_step": 238865, "epoch": 1974} {"train_loss": -42.47538375854492, "global_step": 238866, "epoch": 1974} {"train_loss": -42.260597229003906, "global_step": 238867, "epoch": 1974} {"train_loss": -41.65020751953125, "global_step": 238868, "epoch": 1974} {"train_loss": -42.06571578979492, "global_step": 238869, "epoch": 1974} {"train_loss": -41.94199752807617, "global_step": 238870, "epoch": 1974} {"train_loss": -42.563411712646484, "global_step": 238871, "epoch": 1974} {"train_loss": -42.26426315307617, "global_step": 238872, "epoch": 1974} {"train_loss": -41.98223876953125, "global_step": 238873, "epoch": 1974} {"train_loss": -42.9487419128418, "global_step": 238874, "epoch": 1974} {"train_loss": -41.901031494140625, "global_step": 238875, "epoch": 1974} {"train_loss": -42.73115539550781, "global_step": 238876, "epoch": 1974} {"train_loss": -42.412567138671875, "global_step": 238877, "epoch": 1974} {"train_loss": -42.953914642333984, "global_step": 238878, "epoch": 1974} {"train_loss": -43.43826675415039, "global_step": 238879, "epoch": 1974} {"train_loss": -42.81752014160156, "global_step": 238880, "epoch": 1974} {"train_loss": -43.905616760253906, "global_step": 238881, "epoch": 1974} {"train_loss": -42.612709045410156, "global_step": 238882, "epoch": 1974} {"train_loss": -43.43450927734375, "global_step": 238883, "epoch": 1974} {"train_loss": -43.26886749267578, "global_step": 238884, "epoch": 1974} {"train_loss": -42.85042953491211, "global_step": 238885, "epoch": 1974} {"train_loss": -43.0347900390625, "global_step": 238886, "epoch": 1974} {"train_loss": -42.62335205078125, "global_step": 238887, "epoch": 1974} {"train_loss": -43.646949768066406, "global_step": 238888, "epoch": 1974} {"train_loss": -43.185787200927734, "global_step": 238889, "epoch": 1974} {"train_loss": -42.748409271240234, "global_step": 238890, "epoch": 1974} {"train_loss": -42.93741989135742, "global_step": 238891, "epoch": 1974} {"train_loss": -43.33549118041992, "global_step": 238892, "epoch": 1974} {"train_loss": -44.00264358520508, "global_step": 238893, "epoch": 1974} {"train_loss": -43.14536666870117, "global_step": 238894, "epoch": 1974} {"train_loss": -42.76742172241211, "global_step": 238895, "epoch": 1974} {"train_loss": -43.44696044921875, "global_step": 238896, "epoch": 1974} {"train_loss": -42.77439498901367, "global_step": 238897, "epoch": 1974} {"train_loss": -43.11967086791992, "global_step": 238898, "epoch": 1974} {"train_loss": -43.93074417114258, "global_step": 238899, "epoch": 1974} {"train_loss": -42.652706146240234, "global_step": 238900, "epoch": 1974} {"train_loss": -42.56598663330078, "global_step": 238901, "epoch": 1974} {"train_loss": -43.060302734375, "global_step": 238902, "epoch": 1974} {"train_loss": -43.21736145019531, "global_step": 238903, "epoch": 1974} {"train_loss": -43.21555709838867, "global_step": 238904, "epoch": 1974} {"train_loss": -43.917205810546875, "global_step": 238905, "epoch": 1974} {"train_loss": -43.316070556640625, "global_step": 238906, "epoch": 1974} {"train_loss": -42.56447219848633, "global_step": 238907, "epoch": 1974} {"train_loss": -42.03760528564453, "global_step": 238908, "epoch": 1974} {"train_loss": -43.11049270629883, "global_step": 238909, "epoch": 1974} {"train_loss": -43.581363677978516, "global_step": 238910, "epoch": 1974} {"train_loss": -42.687313079833984, "global_step": 238911, "epoch": 1974} {"train_loss": -42.64579391479492, "global_step": 238912, "epoch": 1974} {"train_loss": -42.847286224365234, "global_step": 238913, "epoch": 1974} {"train_loss": -42.62147521972656, "global_step": 238914, "epoch": 1974} {"train_loss": -43.59450149536133, "global_step": 238915, "epoch": 1974} {"train_loss": -42.36698913574219, "global_step": 238916, "epoch": 1974} {"train_loss": -42.041133880615234, "global_step": 238917, "epoch": 1974} {"train_loss": -43.217044830322266, "global_step": 238918, "epoch": 1974} {"train_loss": -42.548404693603516, "global_step": 238919, "epoch": 1974} {"train_loss": -42.82474899291992, "global_step": 238920, "epoch": 1974} {"train_loss": -43.55282211303711, "global_step": 238921, "epoch": 1974} {"train_loss": -42.9214973449707, "global_step": 238922, "epoch": 1974} {"train_loss": -42.396888732910156, "global_step": 238923, "epoch": 1974} {"train_loss": -42.718135833740234, "global_step": 238924, "epoch": 1974} {"train_loss": -42.63628005981445, "global_step": 238925, "epoch": 1974} {"train_loss": -42.12150955200195, "global_step": 238926, "epoch": 1974} {"train_loss": -41.770050048828125, "global_step": 238927, "epoch": 1974} {"train_loss": -42.0654411315918, "global_step": 238928, "epoch": 1974} {"train_loss": -42.29806900024414, "global_step": 238929, "epoch": 1974} {"train_loss": -42.97597885131836, "global_step": 238930, "epoch": 1974} {"train_loss": -42.37183380126953, "global_step": 238931, "epoch": 1974} {"train_loss": -42.8458251953125, "global_step": 238932, "epoch": 1974} {"train_loss": -43.31442642211914, "global_step": 238933, "epoch": 1974} {"train_loss": -42.7248420715332, "global_step": 238934, "epoch": 1974} {"train_loss": -41.9206657409668, "global_step": 238935, "epoch": 1974} {"train_loss": -41.6074333190918, "global_step": 238936, "epoch": 1974} {"train_loss": -42.966339111328125, "global_step": 238937, "epoch": 1974} {"train_loss": -43.29413986206055, "global_step": 238938, "epoch": 1974} {"train_loss": -40.657073974609375, "global_step": 238939, "epoch": 1974} {"train_loss": -39.179664611816406, "global_step": 238940, "epoch": 1974} {"train_loss": -38.38044357299805, "global_step": 238941, "epoch": 1974} {"train_loss": -41.476226806640625, "global_step": 238942, "epoch": 1974} {"train_loss": -41.507591247558594, "global_step": 238943, "epoch": 1974} {"train_loss": -40.448883056640625, "global_step": 238944, "epoch": 1974} {"train_loss": -39.747413635253906, "global_step": 238945, "epoch": 1974} {"train_loss": -40.387725830078125, "global_step": 238946, "epoch": 1974} {"train_loss": -38.622867584228516, "global_step": 238947, "epoch": 1974} {"train_loss": -41.15700912475586, "global_step": 238948, "epoch": 1974} {"train_loss": -42.085018157958984, "global_step": 238949, "epoch": 1974} {"train_loss": -40.0117073059082, "global_step": 238950, "epoch": 1974} {"train_loss": -41.803340911865234, "global_step": 238951, "epoch": 1974} {"train_loss": -40.087982177734375, "global_step": 238952, "epoch": 1974} {"train_loss": -40.32767868041992, "global_step": 238953, "epoch": 1974} {"train_loss": -41.07556915283203, "global_step": 238954, "epoch": 1974} {"train_loss": -39.85962677001953, "global_step": 238955, "epoch": 1974} {"train_loss": -41.83060836791992, "global_step": 238956, "epoch": 1974} {"train_loss": -38.90546417236328, "global_step": 238957, "epoch": 1974} {"train_loss": -42.5776481628418, "global_step": 238958, "epoch": 1974} {"train_loss": -40.512481689453125, "global_step": 238959, "epoch": 1974} {"train_loss": -40.64593505859375, "global_step": 238960, "epoch": 1974} {"train_loss": -40.76201629638672, "global_step": 238961, "epoch": 1974} {"train_loss": -41.7056770324707, "global_step": 238962, "epoch": 1974} {"train_loss": -40.62682342529297, "global_step": 238963, "epoch": 1974} {"train_loss": -39.6987419128418, "global_step": 238964, "epoch": 1974} {"train_loss": -41.662879943847656, "global_step": 238965, "epoch": 1974} {"train_loss": -40.46502685546875, "global_step": 238966, "epoch": 1974} {"train_loss": -40.62397003173828, "global_step": 238967, "epoch": 1974} {"train_loss": -40.80881881713867, "global_step": 238968, "epoch": 1974} {"train_loss": -41.37464904785156, "global_step": 238969, "epoch": 1974} {"train_loss": -41.02295684814453, "global_step": 238970, "epoch": 1974} {"train_loss": -41.546226501464844, "global_step": 238971, "epoch": 1974} {"train_loss": -41.81142807006836, "global_step": 238972, "epoch": 1974} {"train_loss": -41.1732292175293, "global_step": 238973, "epoch": 1974} {"train_loss": -42.07981503699437, "global_step": 238974, "epoch": 1974, "val_loss": 2673987.75} {"train_loss": -42.29909896850586, "global_step": 238975, "epoch": 1975} {"train_loss": -40.25992965698242, "global_step": 238976, "epoch": 1975} {"train_loss": -41.4059944152832, "global_step": 238977, "epoch": 1975} {"train_loss": -41.19945526123047, "global_step": 238978, "epoch": 1975} {"train_loss": -40.33222198486328, "global_step": 238979, "epoch": 1975} {"train_loss": -41.978172302246094, "global_step": 238980, "epoch": 1975} {"train_loss": -41.71242904663086, "global_step": 238981, "epoch": 1975} {"train_loss": -41.131431579589844, "global_step": 238982, "epoch": 1975} {"train_loss": -42.80047607421875, "global_step": 238983, "epoch": 1975} {"train_loss": -41.2539176940918, "global_step": 238984, "epoch": 1975} {"train_loss": -41.83852767944336, "global_step": 238985, "epoch": 1975} {"train_loss": -43.35579299926758, "global_step": 238986, "epoch": 1975} {"train_loss": -41.75019073486328, "global_step": 238987, "epoch": 1975} {"train_loss": -42.1058349609375, "global_step": 238988, "epoch": 1975} {"train_loss": -42.319496154785156, "global_step": 238989, "epoch": 1975} {"train_loss": -41.6303596496582, "global_step": 238990, "epoch": 1975} {"train_loss": -43.06793212890625, "global_step": 238991, "epoch": 1975} {"train_loss": -41.83443832397461, "global_step": 238992, "epoch": 1975} {"train_loss": -42.06515884399414, "global_step": 238993, "epoch": 1975} {"train_loss": -42.22793197631836, "global_step": 238994, "epoch": 1975} {"train_loss": -42.20241165161133, "global_step": 238995, "epoch": 1975} {"train_loss": -42.73102569580078, "global_step": 238996, "epoch": 1975} {"train_loss": -41.53266525268555, "global_step": 238997, "epoch": 1975} {"train_loss": -42.41365051269531, "global_step": 238998, "epoch": 1975} {"train_loss": -42.80908966064453, "global_step": 238999, "epoch": 1975} {"train_loss": -41.876853942871094, "global_step": 239000, "epoch": 1975} {"train_loss": -42.8529052734375, "global_step": 239001, "epoch": 1975} {"train_loss": -41.773460388183594, "global_step": 239002, "epoch": 1975} {"train_loss": -43.11707305908203, "global_step": 239003, "epoch": 1975} {"train_loss": -42.84383773803711, "global_step": 239004, "epoch": 1975} {"train_loss": -42.74521255493164, "global_step": 239005, "epoch": 1975} {"train_loss": -42.596275329589844, "global_step": 239006, "epoch": 1975} {"train_loss": -43.44071578979492, "global_step": 239007, "epoch": 1975} {"train_loss": -42.0413932800293, "global_step": 239008, "epoch": 1975} {"train_loss": -43.0604362487793, "global_step": 239009, "epoch": 1975} {"train_loss": -42.30430221557617, "global_step": 239010, "epoch": 1975} {"train_loss": -42.820796966552734, "global_step": 239011, "epoch": 1975} {"train_loss": -43.1092414855957, "global_step": 239012, "epoch": 1975} {"train_loss": -43.304344177246094, "global_step": 239013, "epoch": 1975} {"train_loss": -43.53605270385742, "global_step": 239014, "epoch": 1975} {"train_loss": -43.67094039916992, "global_step": 239015, "epoch": 1975} {"train_loss": -43.27903747558594, "global_step": 239016, "epoch": 1975} {"train_loss": -43.32794952392578, "global_step": 239017, "epoch": 1975} {"train_loss": -43.519771575927734, "global_step": 239018, "epoch": 1975} {"train_loss": -43.641231536865234, "global_step": 239019, "epoch": 1975} {"train_loss": -43.71229553222656, "global_step": 239020, "epoch": 1975} {"train_loss": -43.78852462768555, "global_step": 239021, "epoch": 1975} {"train_loss": -43.624149322509766, "global_step": 239022, "epoch": 1975} {"train_loss": -42.670467376708984, "global_step": 239023, "epoch": 1975} {"train_loss": -43.399208068847656, "global_step": 239024, "epoch": 1975} {"train_loss": -43.75315475463867, "global_step": 239025, "epoch": 1975} {"train_loss": -43.573448181152344, "global_step": 239026, "epoch": 1975} {"train_loss": -43.984092712402344, "global_step": 239027, "epoch": 1975} {"train_loss": -44.075740814208984, "global_step": 239028, "epoch": 1975} {"train_loss": -43.225582122802734, "global_step": 239029, "epoch": 1975} {"train_loss": -43.41013717651367, "global_step": 239030, "epoch": 1975} {"train_loss": -42.97101974487305, "global_step": 239031, "epoch": 1975} {"train_loss": -44.28193283081055, "global_step": 239032, "epoch": 1975} {"train_loss": -43.12694549560547, "global_step": 239033, "epoch": 1975} {"train_loss": -43.316104888916016, "global_step": 239034, "epoch": 1975} {"train_loss": -42.011077880859375, "global_step": 239035, "epoch": 1975} {"train_loss": -43.678470611572266, "global_step": 239036, "epoch": 1975} {"train_loss": -43.6327018737793, "global_step": 239037, "epoch": 1975} {"train_loss": -42.878822326660156, "global_step": 239038, "epoch": 1975} {"train_loss": -42.75638961791992, "global_step": 239039, "epoch": 1975} {"train_loss": -43.36919403076172, "global_step": 239040, "epoch": 1975} {"train_loss": -40.97930145263672, "global_step": 239041, "epoch": 1975} {"train_loss": -40.14797592163086, "global_step": 239042, "epoch": 1975} {"train_loss": -37.88078689575195, "global_step": 239043, "epoch": 1975} {"train_loss": -39.421722412109375, "global_step": 239044, "epoch": 1975} {"train_loss": -40.818817138671875, "global_step": 239045, "epoch": 1975} {"train_loss": -39.783721923828125, "global_step": 239046, "epoch": 1975} {"train_loss": -40.565486907958984, "global_step": 239047, "epoch": 1975} {"train_loss": -41.572750091552734, "global_step": 239048, "epoch": 1975} {"train_loss": -39.15509796142578, "global_step": 239049, "epoch": 1975} {"train_loss": -42.445037841796875, "global_step": 239050, "epoch": 1975} {"train_loss": -42.30271530151367, "global_step": 239051, "epoch": 1975} {"train_loss": -41.018409729003906, "global_step": 239052, "epoch": 1975} {"train_loss": -40.7697868347168, "global_step": 239053, "epoch": 1975} {"train_loss": -41.228790283203125, "global_step": 239054, "epoch": 1975} {"train_loss": -40.71108627319336, "global_step": 239055, "epoch": 1975} {"train_loss": -41.473854064941406, "global_step": 239056, "epoch": 1975} {"train_loss": -40.14658737182617, "global_step": 239057, "epoch": 1975} {"train_loss": -41.515625, "global_step": 239058, "epoch": 1975} {"train_loss": -41.2348518371582, "global_step": 239059, "epoch": 1975} {"train_loss": -42.31521224975586, "global_step": 239060, "epoch": 1975} {"train_loss": -42.04118728637695, "global_step": 239061, "epoch": 1975} {"train_loss": -41.602081298828125, "global_step": 239062, "epoch": 1975} {"train_loss": -42.316070556640625, "global_step": 239063, "epoch": 1975} {"train_loss": -42.20673370361328, "global_step": 239064, "epoch": 1975} {"train_loss": -41.80961990356445, "global_step": 239065, "epoch": 1975} {"train_loss": -41.720577239990234, "global_step": 239066, "epoch": 1975} {"train_loss": -42.927764892578125, "global_step": 239067, "epoch": 1975} {"train_loss": -41.46964645385742, "global_step": 239068, "epoch": 1975} {"train_loss": -40.38068771362305, "global_step": 239069, "epoch": 1975} {"train_loss": -41.69611740112305, "global_step": 239070, "epoch": 1975} {"train_loss": -41.8221549987793, "global_step": 239071, "epoch": 1975} {"train_loss": -42.5307502746582, "global_step": 239072, "epoch": 1975} {"train_loss": -42.53106689453125, "global_step": 239073, "epoch": 1975} {"train_loss": -42.42557144165039, "global_step": 239074, "epoch": 1975} {"train_loss": -42.682838439941406, "global_step": 239075, "epoch": 1975} {"train_loss": -43.209529876708984, "global_step": 239076, "epoch": 1975} {"train_loss": -42.46944046020508, "global_step": 239077, "epoch": 1975} {"train_loss": -42.487728118896484, "global_step": 239078, "epoch": 1975} {"train_loss": -42.52021789550781, "global_step": 239079, "epoch": 1975} {"train_loss": -43.26479721069336, "global_step": 239080, "epoch": 1975} {"train_loss": -43.092220306396484, "global_step": 239081, "epoch": 1975} {"train_loss": -42.78985595703125, "global_step": 239082, "epoch": 1975} {"train_loss": -43.17385482788086, "global_step": 239083, "epoch": 1975} {"train_loss": -43.29941940307617, "global_step": 239084, "epoch": 1975} {"train_loss": -42.82034683227539, "global_step": 239085, "epoch": 1975} {"train_loss": -43.46519088745117, "global_step": 239086, "epoch": 1975} {"train_loss": -43.09420394897461, "global_step": 239087, "epoch": 1975} {"train_loss": -43.659786224365234, "global_step": 239088, "epoch": 1975} {"train_loss": -43.42445755004883, "global_step": 239089, "epoch": 1975} {"train_loss": -43.19268798828125, "global_step": 239090, "epoch": 1975} {"train_loss": -43.209251403808594, "global_step": 239091, "epoch": 1975} {"train_loss": -42.73429489135742, "global_step": 239092, "epoch": 1975} {"train_loss": -43.4881706237793, "global_step": 239093, "epoch": 1975} {"train_loss": -43.898799896240234, "global_step": 239094, "epoch": 1975} {"train_loss": -42.371443031247985, "global_step": 239095, "epoch": 1975, "val_loss": 2685010.0} {"train_loss": -43.16592025756836, "global_step": 239096, "epoch": 1976} {"train_loss": -43.862098693847656, "global_step": 239097, "epoch": 1976} {"train_loss": -43.11135482788086, "global_step": 239098, "epoch": 1976} {"train_loss": -43.26311111450195, "global_step": 239099, "epoch": 1976} {"train_loss": -42.773311614990234, "global_step": 239100, "epoch": 1976} {"train_loss": -43.38493347167969, "global_step": 239101, "epoch": 1976} {"train_loss": -43.101985931396484, "global_step": 239102, "epoch": 1976} {"train_loss": -43.09677505493164, "global_step": 239103, "epoch": 1976} {"train_loss": -42.85338592529297, "global_step": 239104, "epoch": 1976} {"train_loss": -43.55121612548828, "global_step": 239105, "epoch": 1976} {"train_loss": -43.483882904052734, "global_step": 239106, "epoch": 1976} {"train_loss": -43.4023551940918, "global_step": 239107, "epoch": 1976} {"train_loss": -43.51747512817383, "global_step": 239108, "epoch": 1976} {"train_loss": -43.5869026184082, "global_step": 239109, "epoch": 1976} {"train_loss": -43.263362884521484, "global_step": 239110, "epoch": 1976} {"train_loss": -43.80608367919922, "global_step": 239111, "epoch": 1976} {"train_loss": -43.868412017822266, "global_step": 239112, "epoch": 1976} {"train_loss": -43.86753845214844, "global_step": 239113, "epoch": 1976} {"train_loss": -43.81874465942383, "global_step": 239114, "epoch": 1976} {"train_loss": -43.68620681762695, "global_step": 239115, "epoch": 1976} {"train_loss": -44.3460693359375, "global_step": 239116, "epoch": 1976} {"train_loss": -43.831024169921875, "global_step": 239117, "epoch": 1976} {"train_loss": -43.687599182128906, "global_step": 239118, "epoch": 1976} {"train_loss": -43.41831588745117, "global_step": 239119, "epoch": 1976} {"train_loss": -42.83051300048828, "global_step": 239120, "epoch": 1976} {"train_loss": -43.46285629272461, "global_step": 239121, "epoch": 1976} {"train_loss": -42.47227478027344, "global_step": 239122, "epoch": 1976} {"train_loss": -43.81708526611328, "global_step": 239123, "epoch": 1976} {"train_loss": -44.284969329833984, "global_step": 239124, "epoch": 1976} {"train_loss": -43.784584045410156, "global_step": 239125, "epoch": 1976} {"train_loss": -41.731300354003906, "global_step": 239126, "epoch": 1976} {"train_loss": -39.34579086303711, "global_step": 239127, "epoch": 1976} {"train_loss": -43.062774658203125, "global_step": 239128, "epoch": 1976} {"train_loss": -42.179012298583984, "global_step": 239129, "epoch": 1976} {"train_loss": -42.133277893066406, "global_step": 239130, "epoch": 1976} {"train_loss": -40.219482421875, "global_step": 239131, "epoch": 1976} {"train_loss": -41.73262405395508, "global_step": 239132, "epoch": 1976} {"train_loss": -43.21833419799805, "global_step": 239133, "epoch": 1976} {"train_loss": -42.20270919799805, "global_step": 239134, "epoch": 1976} {"train_loss": -41.23920822143555, "global_step": 239135, "epoch": 1976} {"train_loss": -40.59746551513672, "global_step": 239136, "epoch": 1976} {"train_loss": -42.25614547729492, "global_step": 239137, "epoch": 1976} {"train_loss": -42.334205627441406, "global_step": 239138, "epoch": 1976} {"train_loss": -42.17791748046875, "global_step": 239139, "epoch": 1976} {"train_loss": -41.357662200927734, "global_step": 239140, "epoch": 1976} {"train_loss": -42.01102828979492, "global_step": 239141, "epoch": 1976} {"train_loss": -41.298519134521484, "global_step": 239142, "epoch": 1976} {"train_loss": -41.150115966796875, "global_step": 239143, "epoch": 1976} {"train_loss": -39.50712966918945, "global_step": 239144, "epoch": 1976} {"train_loss": -42.213661193847656, "global_step": 239145, "epoch": 1976} {"train_loss": -40.769775390625, "global_step": 239146, "epoch": 1976} {"train_loss": -39.17165756225586, "global_step": 239147, "epoch": 1976} {"train_loss": -42.78832244873047, "global_step": 239148, "epoch": 1976} {"train_loss": -39.518821716308594, "global_step": 239149, "epoch": 1976} {"train_loss": -40.960304260253906, "global_step": 239150, "epoch": 1976} {"train_loss": -42.586185455322266, "global_step": 239151, "epoch": 1976} {"train_loss": -40.9829216003418, "global_step": 239152, "epoch": 1976} {"train_loss": -40.81895446777344, "global_step": 239153, "epoch": 1976} {"train_loss": -42.957115173339844, "global_step": 239154, "epoch": 1976} {"train_loss": -39.84956741333008, "global_step": 239155, "epoch": 1976} {"train_loss": -42.065433502197266, "global_step": 239156, "epoch": 1976} {"train_loss": -41.05540084838867, "global_step": 239157, "epoch": 1976} {"train_loss": -41.815731048583984, "global_step": 239158, "epoch": 1976} {"train_loss": -41.51631164550781, "global_step": 239159, "epoch": 1976} {"train_loss": -42.3825798034668, "global_step": 239160, "epoch": 1976} {"train_loss": -41.24308395385742, "global_step": 239161, "epoch": 1976} {"train_loss": -42.278564453125, "global_step": 239162, "epoch": 1976} {"train_loss": -41.7017707824707, "global_step": 239163, "epoch": 1976} {"train_loss": -40.97910690307617, "global_step": 239164, "epoch": 1976} {"train_loss": -42.13804626464844, "global_step": 239165, "epoch": 1976} {"train_loss": -41.655765533447266, "global_step": 239166, "epoch": 1976} {"train_loss": -42.178871154785156, "global_step": 239167, "epoch": 1976} {"train_loss": -42.31599044799805, "global_step": 239168, "epoch": 1976} {"train_loss": -41.77901077270508, "global_step": 239169, "epoch": 1976} {"train_loss": -42.43301010131836, "global_step": 239170, "epoch": 1976} {"train_loss": -42.02036666870117, "global_step": 239171, "epoch": 1976} {"train_loss": -42.57917404174805, "global_step": 239172, "epoch": 1976} {"train_loss": -43.17527770996094, "global_step": 239173, "epoch": 1976} {"train_loss": -42.687408447265625, "global_step": 239174, "epoch": 1976} {"train_loss": -41.66559600830078, "global_step": 239175, "epoch": 1976} {"train_loss": -42.4342041015625, "global_step": 239176, "epoch": 1976} {"train_loss": -42.635231018066406, "global_step": 239177, "epoch": 1976} {"train_loss": -42.74609375, "global_step": 239178, "epoch": 1976} {"train_loss": -42.291439056396484, "global_step": 239179, "epoch": 1976} {"train_loss": -42.1128044128418, "global_step": 239180, "epoch": 1976} {"train_loss": -42.9713020324707, "global_step": 239181, "epoch": 1976} {"train_loss": -43.022705078125, "global_step": 239182, "epoch": 1976} {"train_loss": -42.881011962890625, "global_step": 239183, "epoch": 1976} {"train_loss": -43.166481018066406, "global_step": 239184, "epoch": 1976} {"train_loss": -43.03580856323242, "global_step": 239185, "epoch": 1976} {"train_loss": -43.40907669067383, "global_step": 239186, "epoch": 1976} {"train_loss": -43.337310791015625, "global_step": 239187, "epoch": 1976} {"train_loss": -42.72214889526367, "global_step": 239188, "epoch": 1976} {"train_loss": -43.369468688964844, "global_step": 239189, "epoch": 1976} {"train_loss": -42.526336669921875, "global_step": 239190, "epoch": 1976} {"train_loss": -42.86576843261719, "global_step": 239191, "epoch": 1976} {"train_loss": -43.62872314453125, "global_step": 239192, "epoch": 1976} {"train_loss": -42.817970275878906, "global_step": 239193, "epoch": 1976} {"train_loss": -43.59933090209961, "global_step": 239194, "epoch": 1976} {"train_loss": -43.38851547241211, "global_step": 239195, "epoch": 1976} {"train_loss": -43.412784576416016, "global_step": 239196, "epoch": 1976} {"train_loss": -43.71321487426758, "global_step": 239197, "epoch": 1976} {"train_loss": -43.816097259521484, "global_step": 239198, "epoch": 1976} {"train_loss": -43.08716583251953, "global_step": 239199, "epoch": 1976} {"train_loss": -43.9774284362793, "global_step": 239200, "epoch": 1976} {"train_loss": -43.0422248840332, "global_step": 239201, "epoch": 1976} {"train_loss": -43.78159713745117, "global_step": 239202, "epoch": 1976} {"train_loss": -43.237213134765625, "global_step": 239203, "epoch": 1976} {"train_loss": -43.758968353271484, "global_step": 239204, "epoch": 1976} {"train_loss": -43.825679779052734, "global_step": 239205, "epoch": 1976} {"train_loss": -42.646820068359375, "global_step": 239206, "epoch": 1976} {"train_loss": -43.80335235595703, "global_step": 239207, "epoch": 1976} {"train_loss": -43.55614471435547, "global_step": 239208, "epoch": 1976} {"train_loss": -43.747108459472656, "global_step": 239209, "epoch": 1976} {"train_loss": -43.93146896362305, "global_step": 239210, "epoch": 1976} {"train_loss": -43.70510482788086, "global_step": 239211, "epoch": 1976} {"train_loss": -43.9588737487793, "global_step": 239212, "epoch": 1976} {"train_loss": -44.310123443603516, "global_step": 239213, "epoch": 1976} {"train_loss": -43.870967864990234, "global_step": 239214, "epoch": 1976} {"train_loss": -44.14992904663086, "global_step": 239215, "epoch": 1976} {"train_loss": -42.663641464611715, "global_step": 239216, "epoch": 1976, "val_loss": 2677819.25} {"train_loss": -43.78547286987305, "global_step": 239217, "epoch": 1977} {"train_loss": -43.700714111328125, "global_step": 239218, "epoch": 1977} {"train_loss": -43.54960250854492, "global_step": 239219, "epoch": 1977} {"train_loss": -42.74379348754883, "global_step": 239220, "epoch": 1977} {"train_loss": -43.60935592651367, "global_step": 239221, "epoch": 1977} {"train_loss": -43.543251037597656, "global_step": 239222, "epoch": 1977} {"train_loss": -44.4426155090332, "global_step": 239223, "epoch": 1977} {"train_loss": -43.8543815612793, "global_step": 239224, "epoch": 1977} {"train_loss": -43.66896438598633, "global_step": 239225, "epoch": 1977} {"train_loss": -43.75723648071289, "global_step": 239226, "epoch": 1977} {"train_loss": -42.445335388183594, "global_step": 239227, "epoch": 1977} {"train_loss": -39.673763275146484, "global_step": 239228, "epoch": 1977} {"train_loss": -39.68699264526367, "global_step": 239229, "epoch": 1977} {"train_loss": -42.203834533691406, "global_step": 239230, "epoch": 1977} {"train_loss": -43.00828552246094, "global_step": 239231, "epoch": 1977} {"train_loss": -41.06687927246094, "global_step": 239232, "epoch": 1977} {"train_loss": -40.50799560546875, "global_step": 239233, "epoch": 1977} {"train_loss": -42.31211471557617, "global_step": 239234, "epoch": 1977} {"train_loss": -43.971961975097656, "global_step": 239235, "epoch": 1977} {"train_loss": -42.37781524658203, "global_step": 239236, "epoch": 1977} {"train_loss": -42.38149642944336, "global_step": 239237, "epoch": 1977} {"train_loss": -41.97571563720703, "global_step": 239238, "epoch": 1977} {"train_loss": -43.36384201049805, "global_step": 239239, "epoch": 1977} {"train_loss": -42.5937614440918, "global_step": 239240, "epoch": 1977} {"train_loss": -42.8714485168457, "global_step": 239241, "epoch": 1977} {"train_loss": -43.054744720458984, "global_step": 239242, "epoch": 1977} {"train_loss": -42.54950714111328, "global_step": 239243, "epoch": 1977} {"train_loss": -42.575950622558594, "global_step": 239244, "epoch": 1977} {"train_loss": -42.82350540161133, "global_step": 239245, "epoch": 1977} {"train_loss": -43.03358840942383, "global_step": 239246, "epoch": 1977} {"train_loss": -42.73051452636719, "global_step": 239247, "epoch": 1977} {"train_loss": -41.94735336303711, "global_step": 239248, "epoch": 1977} {"train_loss": -39.328426361083984, "global_step": 239249, "epoch": 1977} {"train_loss": -41.540706634521484, "global_step": 239250, "epoch": 1977} {"train_loss": -41.862945556640625, "global_step": 239251, "epoch": 1977} {"train_loss": -41.84308624267578, "global_step": 239252, "epoch": 1977} {"train_loss": -40.945884704589844, "global_step": 239253, "epoch": 1977} {"train_loss": -42.42781448364258, "global_step": 239254, "epoch": 1977} {"train_loss": -42.71250534057617, "global_step": 239255, "epoch": 1977} {"train_loss": -40.58657455444336, "global_step": 239256, "epoch": 1977} {"train_loss": -41.474727630615234, "global_step": 239257, "epoch": 1977} {"train_loss": -40.091854095458984, "global_step": 239258, "epoch": 1977} {"train_loss": -42.65810775756836, "global_step": 239259, "epoch": 1977} {"train_loss": -40.290714263916016, "global_step": 239260, "epoch": 1977} {"train_loss": -42.118709564208984, "global_step": 239261, "epoch": 1977} {"train_loss": -41.355712890625, "global_step": 239262, "epoch": 1977} {"train_loss": -41.80713653564453, "global_step": 239263, "epoch": 1977} {"train_loss": -42.80110549926758, "global_step": 239264, "epoch": 1977} {"train_loss": -41.002079010009766, "global_step": 239265, "epoch": 1977} {"train_loss": -42.568763732910156, "global_step": 239266, "epoch": 1977} {"train_loss": -42.170467376708984, "global_step": 239267, "epoch": 1977} {"train_loss": -42.30780029296875, "global_step": 239268, "epoch": 1977} {"train_loss": -43.538246154785156, "global_step": 239269, "epoch": 1977} {"train_loss": -42.47370529174805, "global_step": 239270, "epoch": 1977} {"train_loss": -41.824092864990234, "global_step": 239271, "epoch": 1977} {"train_loss": -43.47636032104492, "global_step": 239272, "epoch": 1977} {"train_loss": -42.82129669189453, "global_step": 239273, "epoch": 1977} {"train_loss": -42.38213348388672, "global_step": 239274, "epoch": 1977} {"train_loss": -44.2652587890625, "global_step": 239275, "epoch": 1977} {"train_loss": -42.49980926513672, "global_step": 239276, "epoch": 1977} {"train_loss": -42.773170471191406, "global_step": 239277, "epoch": 1977} {"train_loss": -41.8868522644043, "global_step": 239278, "epoch": 1977} {"train_loss": -41.5275764465332, "global_step": 239279, "epoch": 1977} {"train_loss": -43.14963150024414, "global_step": 239280, "epoch": 1977} {"train_loss": -43.07448959350586, "global_step": 239281, "epoch": 1977} {"train_loss": -42.54408645629883, "global_step": 239282, "epoch": 1977} {"train_loss": -42.9387321472168, "global_step": 239283, "epoch": 1977} {"train_loss": -43.05732345581055, "global_step": 239284, "epoch": 1977} {"train_loss": -43.150211334228516, "global_step": 239285, "epoch": 1977} {"train_loss": -43.205928802490234, "global_step": 239286, "epoch": 1977} {"train_loss": -42.90940475463867, "global_step": 239287, "epoch": 1977} {"train_loss": -42.41530990600586, "global_step": 239288, "epoch": 1977} {"train_loss": -43.1285400390625, "global_step": 239289, "epoch": 1977} {"train_loss": -43.557106018066406, "global_step": 239290, "epoch": 1977} {"train_loss": -42.71745681762695, "global_step": 239291, "epoch": 1977} {"train_loss": -43.636375427246094, "global_step": 239292, "epoch": 1977} {"train_loss": -42.997474670410156, "global_step": 239293, "epoch": 1977} {"train_loss": -43.585601806640625, "global_step": 239294, "epoch": 1977} {"train_loss": -43.32958221435547, "global_step": 239295, "epoch": 1977} {"train_loss": -43.111141204833984, "global_step": 239296, "epoch": 1977} {"train_loss": -42.34711837768555, "global_step": 239297, "epoch": 1977} {"train_loss": -42.88396453857422, "global_step": 239298, "epoch": 1977} {"train_loss": -43.32820510864258, "global_step": 239299, "epoch": 1977} {"train_loss": -43.179527282714844, "global_step": 239300, "epoch": 1977} {"train_loss": -42.81145095825195, "global_step": 239301, "epoch": 1977} {"train_loss": -42.754634857177734, "global_step": 239302, "epoch": 1977} {"train_loss": -43.27260971069336, "global_step": 239303, "epoch": 1977} {"train_loss": -42.573829650878906, "global_step": 239304, "epoch": 1977} {"train_loss": -42.55862045288086, "global_step": 239305, "epoch": 1977} {"train_loss": -42.91605758666992, "global_step": 239306, "epoch": 1977} {"train_loss": -43.20716857910156, "global_step": 239307, "epoch": 1977} {"train_loss": -43.11397933959961, "global_step": 239308, "epoch": 1977} {"train_loss": -43.65243148803711, "global_step": 239309, "epoch": 1977} {"train_loss": -42.93815231323242, "global_step": 239310, "epoch": 1977} {"train_loss": -42.963523864746094, "global_step": 239311, "epoch": 1977} {"train_loss": -43.887550354003906, "global_step": 239312, "epoch": 1977} {"train_loss": -43.4753532409668, "global_step": 239313, "epoch": 1977} {"train_loss": -41.51539611816406, "global_step": 239314, "epoch": 1977} {"train_loss": -42.77374267578125, "global_step": 239315, "epoch": 1977} {"train_loss": -42.83464431762695, "global_step": 239316, "epoch": 1977} {"train_loss": -40.98104476928711, "global_step": 239317, "epoch": 1977} {"train_loss": -41.225154876708984, "global_step": 239318, "epoch": 1977} {"train_loss": -42.096534729003906, "global_step": 239319, "epoch": 1977} {"train_loss": -40.59077835083008, "global_step": 239320, "epoch": 1977} {"train_loss": -40.752376556396484, "global_step": 239321, "epoch": 1977} {"train_loss": -40.19894027709961, "global_step": 239322, "epoch": 1977} {"train_loss": -42.891448974609375, "global_step": 239323, "epoch": 1977} {"train_loss": -40.40982437133789, "global_step": 239324, "epoch": 1977} {"train_loss": -42.68351364135742, "global_step": 239325, "epoch": 1977} {"train_loss": -41.385005950927734, "global_step": 239326, "epoch": 1977} {"train_loss": -41.6672477722168, "global_step": 239327, "epoch": 1977} {"train_loss": -42.79783248901367, "global_step": 239328, "epoch": 1977} {"train_loss": -41.306488037109375, "global_step": 239329, "epoch": 1977} {"train_loss": -42.6496467590332, "global_step": 239330, "epoch": 1977} {"train_loss": -42.38076400756836, "global_step": 239331, "epoch": 1977} {"train_loss": -42.401275634765625, "global_step": 239332, "epoch": 1977} {"train_loss": -43.41575241088867, "global_step": 239333, "epoch": 1977} {"train_loss": -42.06626510620117, "global_step": 239334, "epoch": 1977} {"train_loss": -42.047203063964844, "global_step": 239335, "epoch": 1977} {"train_loss": -41.85128402709961, "global_step": 239336, "epoch": 1977} {"train_loss": -42.453875833306434, "global_step": 239337, "epoch": 1977, "val_loss": 2662603.0} {"train_loss": -43.251625061035156, "global_step": 239338, "epoch": 1978} {"train_loss": -42.27386474609375, "global_step": 239339, "epoch": 1978} {"train_loss": -42.49061965942383, "global_step": 239340, "epoch": 1978} {"train_loss": -42.15439987182617, "global_step": 239341, "epoch": 1978} {"train_loss": -42.27754592895508, "global_step": 239342, "epoch": 1978} {"train_loss": -42.85862350463867, "global_step": 239343, "epoch": 1978} {"train_loss": -42.2531852722168, "global_step": 239344, "epoch": 1978} {"train_loss": -42.53799057006836, "global_step": 239345, "epoch": 1978} {"train_loss": -42.907203674316406, "global_step": 239346, "epoch": 1978} {"train_loss": -42.56882858276367, "global_step": 239347, "epoch": 1978} {"train_loss": -43.34931564331055, "global_step": 239348, "epoch": 1978} {"train_loss": -43.0534782409668, "global_step": 239349, "epoch": 1978} {"train_loss": -43.19160079956055, "global_step": 239350, "epoch": 1978} {"train_loss": -43.12993240356445, "global_step": 239351, "epoch": 1978} {"train_loss": -43.423797607421875, "global_step": 239352, "epoch": 1978} {"train_loss": -43.403228759765625, "global_step": 239353, "epoch": 1978} {"train_loss": -43.504180908203125, "global_step": 239354, "epoch": 1978} {"train_loss": -43.01005172729492, "global_step": 239355, "epoch": 1978} {"train_loss": -44.023738861083984, "global_step": 239356, "epoch": 1978} {"train_loss": -43.49972915649414, "global_step": 239357, "epoch": 1978} {"train_loss": -43.984169006347656, "global_step": 239358, "epoch": 1978} {"train_loss": -43.4746208190918, "global_step": 239359, "epoch": 1978} {"train_loss": -43.090087890625, "global_step": 239360, "epoch": 1978} {"train_loss": -42.855159759521484, "global_step": 239361, "epoch": 1978} {"train_loss": -43.75204086303711, "global_step": 239362, "epoch": 1978} {"train_loss": -43.6085319519043, "global_step": 239363, "epoch": 1978} {"train_loss": -42.78645706176758, "global_step": 239364, "epoch": 1978} {"train_loss": -43.4915885925293, "global_step": 239365, "epoch": 1978} {"train_loss": -43.58948516845703, "global_step": 239366, "epoch": 1978} {"train_loss": -43.68276596069336, "global_step": 239367, "epoch": 1978} {"train_loss": -43.48244094848633, "global_step": 239368, "epoch": 1978} {"train_loss": -42.93821334838867, "global_step": 239369, "epoch": 1978} {"train_loss": -43.62429428100586, "global_step": 239370, "epoch": 1978} {"train_loss": -43.289058685302734, "global_step": 239371, "epoch": 1978} {"train_loss": -42.3082389831543, "global_step": 239372, "epoch": 1978} {"train_loss": -42.71662902832031, "global_step": 239373, "epoch": 1978} {"train_loss": -43.475337982177734, "global_step": 239374, "epoch": 1978} {"train_loss": -42.34043884277344, "global_step": 239375, "epoch": 1978} {"train_loss": -42.7100715637207, "global_step": 239376, "epoch": 1978} {"train_loss": -43.28559494018555, "global_step": 239377, "epoch": 1978} {"train_loss": -43.01005935668945, "global_step": 239378, "epoch": 1978} {"train_loss": -42.30619430541992, "global_step": 239379, "epoch": 1978} {"train_loss": -43.09214782714844, "global_step": 239380, "epoch": 1978} {"train_loss": -41.88142776489258, "global_step": 239381, "epoch": 1978} {"train_loss": -42.48809051513672, "global_step": 239382, "epoch": 1978} {"train_loss": -42.672203063964844, "global_step": 239383, "epoch": 1978} {"train_loss": -43.10813903808594, "global_step": 239384, "epoch": 1978} {"train_loss": -43.22495651245117, "global_step": 239385, "epoch": 1978} {"train_loss": -42.57078552246094, "global_step": 239386, "epoch": 1978} {"train_loss": -42.27342224121094, "global_step": 239387, "epoch": 1978} {"train_loss": -43.153934478759766, "global_step": 239388, "epoch": 1978} {"train_loss": -41.442359924316406, "global_step": 239389, "epoch": 1978} {"train_loss": -43.21424102783203, "global_step": 239390, "epoch": 1978} {"train_loss": -41.76493835449219, "global_step": 239391, "epoch": 1978} {"train_loss": -42.608314514160156, "global_step": 239392, "epoch": 1978} {"train_loss": -43.315975189208984, "global_step": 239393, "epoch": 1978} {"train_loss": -41.820343017578125, "global_step": 239394, "epoch": 1978} {"train_loss": -43.298423767089844, "global_step": 239395, "epoch": 1978} {"train_loss": -43.17822265625, "global_step": 239396, "epoch": 1978} {"train_loss": -43.22627639770508, "global_step": 239397, "epoch": 1978} {"train_loss": -43.3654670715332, "global_step": 239398, "epoch": 1978} {"train_loss": -43.71214294433594, "global_step": 239399, "epoch": 1978} {"train_loss": -43.151424407958984, "global_step": 239400, "epoch": 1978} {"train_loss": -43.22210693359375, "global_step": 239401, "epoch": 1978} {"train_loss": -43.24583053588867, "global_step": 239402, "epoch": 1978} {"train_loss": -43.394859313964844, "global_step": 239403, "epoch": 1978} {"train_loss": -43.68941879272461, "global_step": 239404, "epoch": 1978} {"train_loss": -44.1331901550293, "global_step": 239405, "epoch": 1978} {"train_loss": -43.59600067138672, "global_step": 239406, "epoch": 1978} {"train_loss": -43.387569427490234, "global_step": 239407, "epoch": 1978} {"train_loss": -43.845375061035156, "global_step": 239408, "epoch": 1978} {"train_loss": -43.55344772338867, "global_step": 239409, "epoch": 1978} {"train_loss": -44.14427947998047, "global_step": 239410, "epoch": 1978} {"train_loss": -44.094905853271484, "global_step": 239411, "epoch": 1978} {"train_loss": -43.81437683105469, "global_step": 239412, "epoch": 1978} {"train_loss": -43.76215362548828, "global_step": 239413, "epoch": 1978} {"train_loss": -44.1272087097168, "global_step": 239414, "epoch": 1978} {"train_loss": -43.8095703125, "global_step": 239415, "epoch": 1978} {"train_loss": -44.340789794921875, "global_step": 239416, "epoch": 1978} {"train_loss": -44.39778137207031, "global_step": 239417, "epoch": 1978} {"train_loss": -43.51431655883789, "global_step": 239418, "epoch": 1978} {"train_loss": -42.65004348754883, "global_step": 239419, "epoch": 1978} {"train_loss": -41.26740646362305, "global_step": 239420, "epoch": 1978} {"train_loss": -41.710689544677734, "global_step": 239421, "epoch": 1978} {"train_loss": -43.39214324951172, "global_step": 239422, "epoch": 1978} {"train_loss": -43.21040725708008, "global_step": 239423, "epoch": 1978} {"train_loss": -41.74359130859375, "global_step": 239424, "epoch": 1978} {"train_loss": -43.0120849609375, "global_step": 239425, "epoch": 1978} {"train_loss": -43.20418930053711, "global_step": 239426, "epoch": 1978} {"train_loss": -42.72895431518555, "global_step": 239427, "epoch": 1978} {"train_loss": -43.120216369628906, "global_step": 239428, "epoch": 1978} {"train_loss": -42.986629486083984, "global_step": 239429, "epoch": 1978} {"train_loss": -41.766963958740234, "global_step": 239430, "epoch": 1978} {"train_loss": -43.45276641845703, "global_step": 239431, "epoch": 1978} {"train_loss": -43.04061508178711, "global_step": 239432, "epoch": 1978} {"train_loss": -41.65041732788086, "global_step": 239433, "epoch": 1978} {"train_loss": -42.460731506347656, "global_step": 239434, "epoch": 1978} {"train_loss": -43.22005844116211, "global_step": 239435, "epoch": 1978} {"train_loss": -43.07082748413086, "global_step": 239436, "epoch": 1978} {"train_loss": -41.944828033447266, "global_step": 239437, "epoch": 1978} {"train_loss": -42.08573913574219, "global_step": 239438, "epoch": 1978} {"train_loss": -42.95679473876953, "global_step": 239439, "epoch": 1978} {"train_loss": -43.2745361328125, "global_step": 239440, "epoch": 1978} {"train_loss": -42.16582107543945, "global_step": 239441, "epoch": 1978} {"train_loss": -42.33036804199219, "global_step": 239442, "epoch": 1978} {"train_loss": -42.74434280395508, "global_step": 239443, "epoch": 1978} {"train_loss": -43.85781478881836, "global_step": 239444, "epoch": 1978} {"train_loss": -41.97245788574219, "global_step": 239445, "epoch": 1978} {"train_loss": -38.612266540527344, "global_step": 239446, "epoch": 1978} {"train_loss": -43.49946975708008, "global_step": 239447, "epoch": 1978} {"train_loss": -41.421043395996094, "global_step": 239448, "epoch": 1978} {"train_loss": -39.50374984741211, "global_step": 239449, "epoch": 1978} {"train_loss": -42.00049591064453, "global_step": 239450, "epoch": 1978} {"train_loss": -41.93772506713867, "global_step": 239451, "epoch": 1978} {"train_loss": -42.274417877197266, "global_step": 239452, "epoch": 1978} {"train_loss": -41.031349182128906, "global_step": 239453, "epoch": 1978} {"train_loss": -40.79551696777344, "global_step": 239454, "epoch": 1978} {"train_loss": -40.85906982421875, "global_step": 239455, "epoch": 1978} {"train_loss": -42.59414291381836, "global_step": 239456, "epoch": 1978} {"train_loss": -39.99251937866211, "global_step": 239457, "epoch": 1978} {"train_loss": -42.834570388163414, "global_step": 239458, "epoch": 1978, "val_loss": 2646079.0} {"train_loss": -39.931251525878906, "global_step": 239459, "epoch": 1979} {"train_loss": -42.482173919677734, "global_step": 239460, "epoch": 1979} {"train_loss": -40.024200439453125, "global_step": 239461, "epoch": 1979} {"train_loss": -40.547611236572266, "global_step": 239462, "epoch": 1979} {"train_loss": -41.62239456176758, "global_step": 239463, "epoch": 1979} {"train_loss": -38.078575134277344, "global_step": 239464, "epoch": 1979} {"train_loss": -40.258506774902344, "global_step": 239465, "epoch": 1979} {"train_loss": -37.31663513183594, "global_step": 239466, "epoch": 1979} {"train_loss": -39.2352294921875, "global_step": 239467, "epoch": 1979} {"train_loss": -38.4937858581543, "global_step": 239468, "epoch": 1979} {"train_loss": -40.04068374633789, "global_step": 239469, "epoch": 1979} {"train_loss": -38.617393493652344, "global_step": 239470, "epoch": 1979} {"train_loss": -39.17978286743164, "global_step": 239471, "epoch": 1979} {"train_loss": -40.17216110229492, "global_step": 239472, "epoch": 1979} {"train_loss": -38.88446807861328, "global_step": 239473, "epoch": 1979} {"train_loss": -41.54815673828125, "global_step": 239474, "epoch": 1979} {"train_loss": -38.1269645690918, "global_step": 239475, "epoch": 1979} {"train_loss": -42.758113861083984, "global_step": 239476, "epoch": 1979} {"train_loss": -40.705196380615234, "global_step": 239477, "epoch": 1979} {"train_loss": -41.7411994934082, "global_step": 239478, "epoch": 1979} {"train_loss": -41.46721267700195, "global_step": 239479, "epoch": 1979} {"train_loss": -41.39059066772461, "global_step": 239480, "epoch": 1979} {"train_loss": -42.38019561767578, "global_step": 239481, "epoch": 1979} {"train_loss": -41.260494232177734, "global_step": 239482, "epoch": 1979} {"train_loss": -42.42885208129883, "global_step": 239483, "epoch": 1979} {"train_loss": -41.54221725463867, "global_step": 239484, "epoch": 1979} {"train_loss": -42.25605392456055, "global_step": 239485, "epoch": 1979} {"train_loss": -43.04023361206055, "global_step": 239486, "epoch": 1979} {"train_loss": -41.84566879272461, "global_step": 239487, "epoch": 1979} {"train_loss": -42.8939323425293, "global_step": 239488, "epoch": 1979} {"train_loss": -42.864192962646484, "global_step": 239489, "epoch": 1979} {"train_loss": -42.328121185302734, "global_step": 239490, "epoch": 1979} {"train_loss": -42.90311813354492, "global_step": 239491, "epoch": 1979} {"train_loss": -42.697872161865234, "global_step": 239492, "epoch": 1979} {"train_loss": -43.03892135620117, "global_step": 239493, "epoch": 1979} {"train_loss": -42.675777435302734, "global_step": 239494, "epoch": 1979} {"train_loss": -43.04814529418945, "global_step": 239495, "epoch": 1979} {"train_loss": -43.00437545776367, "global_step": 239496, "epoch": 1979} {"train_loss": -42.78069305419922, "global_step": 239497, "epoch": 1979} {"train_loss": -43.95203399658203, "global_step": 239498, "epoch": 1979} {"train_loss": -43.36328887939453, "global_step": 239499, "epoch": 1979} {"train_loss": -43.247005462646484, "global_step": 239500, "epoch": 1979} {"train_loss": -43.20539093017578, "global_step": 239501, "epoch": 1979} {"train_loss": -43.822391510009766, "global_step": 239502, "epoch": 1979} {"train_loss": -43.160152435302734, "global_step": 239503, "epoch": 1979} {"train_loss": -43.79779052734375, "global_step": 239504, "epoch": 1979} {"train_loss": -43.4112663269043, "global_step": 239505, "epoch": 1979} {"train_loss": -43.616065979003906, "global_step": 239506, "epoch": 1979} {"train_loss": -43.268375396728516, "global_step": 239507, "epoch": 1979} {"train_loss": -43.65139389038086, "global_step": 239508, "epoch": 1979} {"train_loss": -43.842403411865234, "global_step": 239509, "epoch": 1979} {"train_loss": -43.46210479736328, "global_step": 239510, "epoch": 1979} {"train_loss": -43.883811950683594, "global_step": 239511, "epoch": 1979} {"train_loss": -43.95297622680664, "global_step": 239512, "epoch": 1979} {"train_loss": -43.42120361328125, "global_step": 239513, "epoch": 1979} {"train_loss": -43.76567840576172, "global_step": 239514, "epoch": 1979} {"train_loss": -43.99818420410156, "global_step": 239515, "epoch": 1979} {"train_loss": -43.97239685058594, "global_step": 239516, "epoch": 1979} {"train_loss": -43.835693359375, "global_step": 239517, "epoch": 1979} {"train_loss": -44.54132843017578, "global_step": 239518, "epoch": 1979} {"train_loss": -43.93479537963867, "global_step": 239519, "epoch": 1979} {"train_loss": -44.19846725463867, "global_step": 239520, "epoch": 1979} {"train_loss": -43.9005126953125, "global_step": 239521, "epoch": 1979} {"train_loss": -44.21100997924805, "global_step": 239522, "epoch": 1979} {"train_loss": -44.186710357666016, "global_step": 239523, "epoch": 1979} {"train_loss": -44.05758285522461, "global_step": 239524, "epoch": 1979} {"train_loss": -44.24292755126953, "global_step": 239525, "epoch": 1979} {"train_loss": -43.80149459838867, "global_step": 239526, "epoch": 1979} {"train_loss": -43.8693962097168, "global_step": 239527, "epoch": 1979} {"train_loss": -43.975738525390625, "global_step": 239528, "epoch": 1979} {"train_loss": -44.5190544128418, "global_step": 239529, "epoch": 1979} {"train_loss": -44.329341888427734, "global_step": 239530, "epoch": 1979} {"train_loss": -43.74574661254883, "global_step": 239531, "epoch": 1979} {"train_loss": -43.59823989868164, "global_step": 239532, "epoch": 1979} {"train_loss": -43.822265625, "global_step": 239533, "epoch": 1979} {"train_loss": -44.3287239074707, "global_step": 239534, "epoch": 1979} {"train_loss": -43.9054069519043, "global_step": 239535, "epoch": 1979} {"train_loss": -43.024497985839844, "global_step": 239536, "epoch": 1979} {"train_loss": -43.798004150390625, "global_step": 239537, "epoch": 1979} {"train_loss": -41.7542724609375, "global_step": 239538, "epoch": 1979} {"train_loss": -40.286861419677734, "global_step": 239539, "epoch": 1979} {"train_loss": -42.039608001708984, "global_step": 239540, "epoch": 1979} {"train_loss": -41.67518997192383, "global_step": 239541, "epoch": 1979} {"train_loss": -42.55840301513672, "global_step": 239542, "epoch": 1979} {"train_loss": -43.47198486328125, "global_step": 239543, "epoch": 1979} {"train_loss": -42.97797393798828, "global_step": 239544, "epoch": 1979} {"train_loss": -42.58049011230469, "global_step": 239545, "epoch": 1979} {"train_loss": -42.172889709472656, "global_step": 239546, "epoch": 1979} {"train_loss": -43.25296401977539, "global_step": 239547, "epoch": 1979} {"train_loss": -42.25141525268555, "global_step": 239548, "epoch": 1979} {"train_loss": -39.61943435668945, "global_step": 239549, "epoch": 1979} {"train_loss": -42.9518928527832, "global_step": 239550, "epoch": 1979} {"train_loss": -40.254150390625, "global_step": 239551, "epoch": 1979} {"train_loss": -40.15946578979492, "global_step": 239552, "epoch": 1979} {"train_loss": -41.639122009277344, "global_step": 239553, "epoch": 1979} {"train_loss": -41.32766342163086, "global_step": 239554, "epoch": 1979} {"train_loss": -41.32786178588867, "global_step": 239555, "epoch": 1979} {"train_loss": -40.951107025146484, "global_step": 239556, "epoch": 1979} {"train_loss": -41.07093048095703, "global_step": 239557, "epoch": 1979} {"train_loss": -41.896995544433594, "global_step": 239558, "epoch": 1979} {"train_loss": -36.968082427978516, "global_step": 239559, "epoch": 1979} {"train_loss": -35.92139434814453, "global_step": 239560, "epoch": 1979} {"train_loss": -29.089468002319336, "global_step": 239561, "epoch": 1979} {"train_loss": -18.539464950561523, "global_step": 239562, "epoch": 1979} {"train_loss": -35.218849182128906, "global_step": 239563, "epoch": 1979} {"train_loss": -28.621994018554688, "global_step": 239564, "epoch": 1979} {"train_loss": -30.57146644592285, "global_step": 239565, "epoch": 1979} {"train_loss": -32.0635986328125, "global_step": 239566, "epoch": 1979} {"train_loss": -37.22476577758789, "global_step": 239567, "epoch": 1979} {"train_loss": -37.64298629760742, "global_step": 239568, "epoch": 1979} {"train_loss": -38.72479248046875, "global_step": 239569, "epoch": 1979} {"train_loss": -37.2282829284668, "global_step": 239570, "epoch": 1979} {"train_loss": -39.594966888427734, "global_step": 239571, "epoch": 1979} {"train_loss": -40.14448928833008, "global_step": 239572, "epoch": 1979} {"train_loss": -39.514766693115234, "global_step": 239573, "epoch": 1979} {"train_loss": -40.13441848754883, "global_step": 239574, "epoch": 1979} {"train_loss": -40.46510696411133, "global_step": 239575, "epoch": 1979} {"train_loss": -40.112388610839844, "global_step": 239576, "epoch": 1979} {"train_loss": -39.78219223022461, "global_step": 239577, "epoch": 1979} {"train_loss": -41.98929977416992, "global_step": 239578, "epoch": 1979} {"train_loss": -41.28704107300309, "global_step": 239579, "epoch": 1979, "val_loss": 2573622.75} {"train_loss": -41.656185150146484, "global_step": 239580, "epoch": 1980} {"train_loss": -40.14576721191406, "global_step": 239581, "epoch": 1980} {"train_loss": -40.8470573425293, "global_step": 239582, "epoch": 1980} {"train_loss": -41.04268264770508, "global_step": 239583, "epoch": 1980} {"train_loss": -41.10191345214844, "global_step": 239584, "epoch": 1980} {"train_loss": -41.8040657043457, "global_step": 239585, "epoch": 1980} {"train_loss": -41.36678695678711, "global_step": 239586, "epoch": 1980} {"train_loss": -41.80645751953125, "global_step": 239587, "epoch": 1980} {"train_loss": -41.71271514892578, "global_step": 239588, "epoch": 1980} {"train_loss": -42.106849670410156, "global_step": 239589, "epoch": 1980} {"train_loss": -42.12067794799805, "global_step": 239590, "epoch": 1980} {"train_loss": -41.335716247558594, "global_step": 239591, "epoch": 1980} {"train_loss": -42.18278503417969, "global_step": 239592, "epoch": 1980} {"train_loss": -41.741943359375, "global_step": 239593, "epoch": 1980} {"train_loss": -42.3813591003418, "global_step": 239594, "epoch": 1980} {"train_loss": -41.90547561645508, "global_step": 239595, "epoch": 1980} {"train_loss": -42.23466110229492, "global_step": 239596, "epoch": 1980} {"train_loss": -41.728275299072266, "global_step": 239597, "epoch": 1980} {"train_loss": -42.35543441772461, "global_step": 239598, "epoch": 1980} {"train_loss": -42.5003547668457, "global_step": 239599, "epoch": 1980} {"train_loss": -42.244056701660156, "global_step": 239600, "epoch": 1980} {"train_loss": -42.656978607177734, "global_step": 239601, "epoch": 1980} {"train_loss": -42.335262298583984, "global_step": 239602, "epoch": 1980} {"train_loss": -42.92995071411133, "global_step": 239603, "epoch": 1980} {"train_loss": -42.45737838745117, "global_step": 239604, "epoch": 1980} {"train_loss": -42.53558349609375, "global_step": 239605, "epoch": 1980} {"train_loss": -42.94336700439453, "global_step": 239606, "epoch": 1980} {"train_loss": -42.784576416015625, "global_step": 239607, "epoch": 1980} {"train_loss": -43.326534271240234, "global_step": 239608, "epoch": 1980} {"train_loss": -43.013824462890625, "global_step": 239609, "epoch": 1980} {"train_loss": -43.514713287353516, "global_step": 239610, "epoch": 1980} {"train_loss": -43.172794342041016, "global_step": 239611, "epoch": 1980} {"train_loss": -43.094417572021484, "global_step": 239612, "epoch": 1980} {"train_loss": -43.131710052490234, "global_step": 239613, "epoch": 1980} {"train_loss": -43.1704216003418, "global_step": 239614, "epoch": 1980} {"train_loss": -42.36322021484375, "global_step": 239615, "epoch": 1980} {"train_loss": -43.47283935546875, "global_step": 239616, "epoch": 1980} {"train_loss": -42.421993255615234, "global_step": 239617, "epoch": 1980} {"train_loss": -42.56891632080078, "global_step": 239618, "epoch": 1980} {"train_loss": -43.41788864135742, "global_step": 239619, "epoch": 1980} {"train_loss": -42.671443939208984, "global_step": 239620, "epoch": 1980} {"train_loss": -43.54249572753906, "global_step": 239621, "epoch": 1980} {"train_loss": -43.22441864013672, "global_step": 239622, "epoch": 1980} {"train_loss": -43.599185943603516, "global_step": 239623, "epoch": 1980} {"train_loss": -43.21839141845703, "global_step": 239624, "epoch": 1980} {"train_loss": -43.6663932800293, "global_step": 239625, "epoch": 1980} {"train_loss": -43.733638763427734, "global_step": 239626, "epoch": 1980} {"train_loss": -43.28203201293945, "global_step": 239627, "epoch": 1980} {"train_loss": -42.98179244995117, "global_step": 239628, "epoch": 1980} {"train_loss": -43.99799728393555, "global_step": 239629, "epoch": 1980} {"train_loss": -43.19953155517578, "global_step": 239630, "epoch": 1980} {"train_loss": -42.69175338745117, "global_step": 239631, "epoch": 1980} {"train_loss": -43.72395706176758, "global_step": 239632, "epoch": 1980} {"train_loss": -43.249053955078125, "global_step": 239633, "epoch": 1980} {"train_loss": -43.21208572387695, "global_step": 239634, "epoch": 1980} {"train_loss": -43.83570861816406, "global_step": 239635, "epoch": 1980} {"train_loss": -43.33273696899414, "global_step": 239636, "epoch": 1980} {"train_loss": -42.8792839050293, "global_step": 239637, "epoch": 1980} {"train_loss": -43.85482406616211, "global_step": 239638, "epoch": 1980} {"train_loss": -43.81580352783203, "global_step": 239639, "epoch": 1980} {"train_loss": -43.26108932495117, "global_step": 239640, "epoch": 1980} {"train_loss": -43.05036163330078, "global_step": 239641, "epoch": 1980} {"train_loss": -43.928218841552734, "global_step": 239642, "epoch": 1980} {"train_loss": -43.30979537963867, "global_step": 239643, "epoch": 1980} {"train_loss": -43.26008987426758, "global_step": 239644, "epoch": 1980} {"train_loss": -44.051483154296875, "global_step": 239645, "epoch": 1980} {"train_loss": -43.97847366333008, "global_step": 239646, "epoch": 1980} {"train_loss": -43.582088470458984, "global_step": 239647, "epoch": 1980} {"train_loss": -44.153350830078125, "global_step": 239648, "epoch": 1980} {"train_loss": -43.898101806640625, "global_step": 239649, "epoch": 1980} {"train_loss": -43.761104583740234, "global_step": 239650, "epoch": 1980} {"train_loss": -43.981929779052734, "global_step": 239651, "epoch": 1980} {"train_loss": -44.536251068115234, "global_step": 239652, "epoch": 1980} {"train_loss": -43.462703704833984, "global_step": 239653, "epoch": 1980} {"train_loss": -43.794376373291016, "global_step": 239654, "epoch": 1980} {"train_loss": -43.62430191040039, "global_step": 239655, "epoch": 1980} {"train_loss": -43.92021179199219, "global_step": 239656, "epoch": 1980} {"train_loss": -43.740787506103516, "global_step": 239657, "epoch": 1980} {"train_loss": -43.39524459838867, "global_step": 239658, "epoch": 1980} {"train_loss": -44.0211296081543, "global_step": 239659, "epoch": 1980} {"train_loss": -43.16145706176758, "global_step": 239660, "epoch": 1980} {"train_loss": -41.98379135131836, "global_step": 239661, "epoch": 1980} {"train_loss": -43.20540237426758, "global_step": 239662, "epoch": 1980} {"train_loss": -43.39030075073242, "global_step": 239663, "epoch": 1980} {"train_loss": -44.21228790283203, "global_step": 239664, "epoch": 1980} {"train_loss": -44.2034912109375, "global_step": 239665, "epoch": 1980} {"train_loss": -43.60222244262695, "global_step": 239666, "epoch": 1980} {"train_loss": -41.325233459472656, "global_step": 239667, "epoch": 1980} {"train_loss": -37.54939651489258, "global_step": 239668, "epoch": 1980} {"train_loss": -34.32110595703125, "global_step": 239669, "epoch": 1980} {"train_loss": -42.458534240722656, "global_step": 239670, "epoch": 1980} {"train_loss": -40.59271240234375, "global_step": 239671, "epoch": 1980} {"train_loss": -35.44682693481445, "global_step": 239672, "epoch": 1980} {"train_loss": -41.884742736816406, "global_step": 239673, "epoch": 1980} {"train_loss": -34.46821975708008, "global_step": 239674, "epoch": 1980} {"train_loss": -40.68125534057617, "global_step": 239675, "epoch": 1980} {"train_loss": -41.38005065917969, "global_step": 239676, "epoch": 1980} {"train_loss": -34.2284049987793, "global_step": 239677, "epoch": 1980} {"train_loss": -41.25410079956055, "global_step": 239678, "epoch": 1980} {"train_loss": -38.792484283447266, "global_step": 239679, "epoch": 1980} {"train_loss": -38.61103439331055, "global_step": 239680, "epoch": 1980} {"train_loss": -38.51641845703125, "global_step": 239681, "epoch": 1980} {"train_loss": -38.356319427490234, "global_step": 239682, "epoch": 1980} {"train_loss": -38.64517593383789, "global_step": 239683, "epoch": 1980} {"train_loss": -40.544132232666016, "global_step": 239684, "epoch": 1980} {"train_loss": -38.768585205078125, "global_step": 239685, "epoch": 1980} {"train_loss": -40.51227951049805, "global_step": 239686, "epoch": 1980} {"train_loss": -40.3106575012207, "global_step": 239687, "epoch": 1980} {"train_loss": -40.57133483886719, "global_step": 239688, "epoch": 1980} {"train_loss": -41.40703201293945, "global_step": 239689, "epoch": 1980} {"train_loss": -40.66776657104492, "global_step": 239690, "epoch": 1980} {"train_loss": -39.32172775268555, "global_step": 239691, "epoch": 1980} {"train_loss": -41.545814514160156, "global_step": 239692, "epoch": 1980} {"train_loss": -40.88121032714844, "global_step": 239693, "epoch": 1980} {"train_loss": -42.25444793701172, "global_step": 239694, "epoch": 1980} {"train_loss": -40.58536911010742, "global_step": 239695, "epoch": 1980} {"train_loss": -42.26107406616211, "global_step": 239696, "epoch": 1980} {"train_loss": -38.95841979980469, "global_step": 239697, "epoch": 1980} {"train_loss": -39.68788146972656, "global_step": 239698, "epoch": 1980} {"train_loss": -40.1495475769043, "global_step": 239699, "epoch": 1980} {"train_loss": -42.04247523536367, "global_step": 239700, "epoch": 1980, "val_loss": 2529587.75} {"train_loss": -40.7796745300293, "global_step": 239701, "epoch": 1981} {"train_loss": -41.27082061767578, "global_step": 239702, "epoch": 1981} {"train_loss": -39.39988327026367, "global_step": 239703, "epoch": 1981} {"train_loss": -41.51795196533203, "global_step": 239704, "epoch": 1981} {"train_loss": -41.431331634521484, "global_step": 239705, "epoch": 1981} {"train_loss": -41.25465393066406, "global_step": 239706, "epoch": 1981} {"train_loss": -41.023006439208984, "global_step": 239707, "epoch": 1981} {"train_loss": -42.281578063964844, "global_step": 239708, "epoch": 1981} {"train_loss": -42.353172302246094, "global_step": 239709, "epoch": 1981} {"train_loss": -42.22346115112305, "global_step": 239710, "epoch": 1981} {"train_loss": -40.874576568603516, "global_step": 239711, "epoch": 1981} {"train_loss": -41.83529281616211, "global_step": 239712, "epoch": 1981} {"train_loss": -42.10490798950195, "global_step": 239713, "epoch": 1981} {"train_loss": -42.09027862548828, "global_step": 239714, "epoch": 1981} {"train_loss": -42.64218521118164, "global_step": 239715, "epoch": 1981} {"train_loss": -41.05111312866211, "global_step": 239716, "epoch": 1981} {"train_loss": -42.02503204345703, "global_step": 239717, "epoch": 1981} {"train_loss": -42.01835250854492, "global_step": 239718, "epoch": 1981} {"train_loss": -41.63770294189453, "global_step": 239719, "epoch": 1981} {"train_loss": -42.66938400268555, "global_step": 239720, "epoch": 1981} {"train_loss": -40.147857666015625, "global_step": 239721, "epoch": 1981} {"train_loss": -41.68526077270508, "global_step": 239722, "epoch": 1981} {"train_loss": -37.943294525146484, "global_step": 239723, "epoch": 1981} {"train_loss": -42.100868225097656, "global_step": 239724, "epoch": 1981} {"train_loss": -42.428985595703125, "global_step": 239725, "epoch": 1981} {"train_loss": -41.49405288696289, "global_step": 239726, "epoch": 1981} {"train_loss": -43.111541748046875, "global_step": 239727, "epoch": 1981} {"train_loss": -42.65456008911133, "global_step": 239728, "epoch": 1981} {"train_loss": -41.93729782104492, "global_step": 239729, "epoch": 1981} {"train_loss": -43.32014083862305, "global_step": 239730, "epoch": 1981} {"train_loss": -41.70209884643555, "global_step": 239731, "epoch": 1981} {"train_loss": -42.62876510620117, "global_step": 239732, "epoch": 1981} {"train_loss": -41.7702751159668, "global_step": 239733, "epoch": 1981} {"train_loss": -43.254207611083984, "global_step": 239734, "epoch": 1981} {"train_loss": -42.61371994018555, "global_step": 239735, "epoch": 1981} {"train_loss": -43.08515167236328, "global_step": 239736, "epoch": 1981} {"train_loss": -43.09454345703125, "global_step": 239737, "epoch": 1981} {"train_loss": -42.306114196777344, "global_step": 239738, "epoch": 1981} {"train_loss": -42.64385986328125, "global_step": 239739, "epoch": 1981} {"train_loss": -43.34564971923828, "global_step": 239740, "epoch": 1981} {"train_loss": -43.13351058959961, "global_step": 239741, "epoch": 1981} {"train_loss": -43.07658004760742, "global_step": 239742, "epoch": 1981} {"train_loss": -43.57329177856445, "global_step": 239743, "epoch": 1981} {"train_loss": -43.531368255615234, "global_step": 239744, "epoch": 1981} {"train_loss": -43.25083541870117, "global_step": 239745, "epoch": 1981} {"train_loss": -43.49761962890625, "global_step": 239746, "epoch": 1981} {"train_loss": -42.415584564208984, "global_step": 239747, "epoch": 1981} {"train_loss": -43.40900802612305, "global_step": 239748, "epoch": 1981} {"train_loss": -43.46082305908203, "global_step": 239749, "epoch": 1981} {"train_loss": -43.15213394165039, "global_step": 239750, "epoch": 1981} {"train_loss": -42.8306999206543, "global_step": 239751, "epoch": 1981} {"train_loss": -43.142127990722656, "global_step": 239752, "epoch": 1981} {"train_loss": -43.50667190551758, "global_step": 239753, "epoch": 1981} {"train_loss": -43.8801383972168, "global_step": 239754, "epoch": 1981} {"train_loss": -43.436946868896484, "global_step": 239755, "epoch": 1981} {"train_loss": -43.146202087402344, "global_step": 239756, "epoch": 1981} {"train_loss": -43.97890853881836, "global_step": 239757, "epoch": 1981} {"train_loss": -43.75684356689453, "global_step": 239758, "epoch": 1981} {"train_loss": -44.3615837097168, "global_step": 239759, "epoch": 1981} {"train_loss": -43.552650451660156, "global_step": 239760, "epoch": 1981} {"train_loss": -44.2646484375, "global_step": 239761, "epoch": 1981} {"train_loss": -44.49646759033203, "global_step": 239762, "epoch": 1981} {"train_loss": -43.63871383666992, "global_step": 239763, "epoch": 1981} {"train_loss": -44.15711975097656, "global_step": 239764, "epoch": 1981} {"train_loss": -43.84858322143555, "global_step": 239765, "epoch": 1981} {"train_loss": -43.390926361083984, "global_step": 239766, "epoch": 1981} {"train_loss": -43.94702911376953, "global_step": 239767, "epoch": 1981} {"train_loss": -44.2030143737793, "global_step": 239768, "epoch": 1981} {"train_loss": -44.635711669921875, "global_step": 239769, "epoch": 1981} {"train_loss": -43.45078659057617, "global_step": 239770, "epoch": 1981} {"train_loss": -44.15190124511719, "global_step": 239771, "epoch": 1981} {"train_loss": -44.26764678955078, "global_step": 239772, "epoch": 1981} {"train_loss": -43.6772575378418, "global_step": 239773, "epoch": 1981} {"train_loss": -44.02809524536133, "global_step": 239774, "epoch": 1981} {"train_loss": -44.06623077392578, "global_step": 239775, "epoch": 1981} {"train_loss": -44.71563720703125, "global_step": 239776, "epoch": 1981} {"train_loss": -44.094329833984375, "global_step": 239777, "epoch": 1981} {"train_loss": -43.55356979370117, "global_step": 239778, "epoch": 1981} {"train_loss": -42.87354278564453, "global_step": 239779, "epoch": 1981} {"train_loss": -43.3757438659668, "global_step": 239780, "epoch": 1981} {"train_loss": -41.69987106323242, "global_step": 239781, "epoch": 1981} {"train_loss": -42.61907196044922, "global_step": 239782, "epoch": 1981} {"train_loss": -43.22258377075195, "global_step": 239783, "epoch": 1981} {"train_loss": -43.3203010559082, "global_step": 239784, "epoch": 1981} {"train_loss": -43.3472785949707, "global_step": 239785, "epoch": 1981} {"train_loss": -43.632503509521484, "global_step": 239786, "epoch": 1981} {"train_loss": -43.53568649291992, "global_step": 239787, "epoch": 1981} {"train_loss": -43.38867950439453, "global_step": 239788, "epoch": 1981} {"train_loss": -43.229034423828125, "global_step": 239789, "epoch": 1981} {"train_loss": -43.3437614440918, "global_step": 239790, "epoch": 1981} {"train_loss": -42.314754486083984, "global_step": 239791, "epoch": 1981} {"train_loss": -42.03425216674805, "global_step": 239792, "epoch": 1981} {"train_loss": -39.15544509887695, "global_step": 239793, "epoch": 1981} {"train_loss": -41.33359146118164, "global_step": 239794, "epoch": 1981} {"train_loss": -41.0345573425293, "global_step": 239795, "epoch": 1981} {"train_loss": -39.17665481567383, "global_step": 239796, "epoch": 1981} {"train_loss": -42.13060760498047, "global_step": 239797, "epoch": 1981} {"train_loss": -39.768890380859375, "global_step": 239798, "epoch": 1981} {"train_loss": -41.67366027832031, "global_step": 239799, "epoch": 1981} {"train_loss": -40.84465026855469, "global_step": 239800, "epoch": 1981} {"train_loss": -40.06182861328125, "global_step": 239801, "epoch": 1981} {"train_loss": -42.1404914855957, "global_step": 239802, "epoch": 1981} {"train_loss": -41.75690841674805, "global_step": 239803, "epoch": 1981} {"train_loss": -41.570735931396484, "global_step": 239804, "epoch": 1981} {"train_loss": -41.29381561279297, "global_step": 239805, "epoch": 1981} {"train_loss": -40.8836669921875, "global_step": 239806, "epoch": 1981} {"train_loss": -38.94808578491211, "global_step": 239807, "epoch": 1981} {"train_loss": -41.468074798583984, "global_step": 239808, "epoch": 1981} {"train_loss": -39.6170768737793, "global_step": 239809, "epoch": 1981} {"train_loss": -41.515235900878906, "global_step": 239810, "epoch": 1981} {"train_loss": -40.188026428222656, "global_step": 239811, "epoch": 1981} {"train_loss": -38.50491714477539, "global_step": 239812, "epoch": 1981} {"train_loss": -42.28886795043945, "global_step": 239813, "epoch": 1981} {"train_loss": -38.4099235534668, "global_step": 239814, "epoch": 1981} {"train_loss": -37.92608642578125, "global_step": 239815, "epoch": 1981} {"train_loss": -40.23856735229492, "global_step": 239816, "epoch": 1981} {"train_loss": -38.803672790527344, "global_step": 239817, "epoch": 1981} {"train_loss": -40.45952224731445, "global_step": 239818, "epoch": 1981} {"train_loss": -40.704254150390625, "global_step": 239819, "epoch": 1981} {"train_loss": -40.40203857421875, "global_step": 239820, "epoch": 1981} {"train_loss": -42.23978487125113, "global_step": 239821, "epoch": 1981, "val_loss": 2664778.25} {"train_loss": -41.55526351928711, "global_step": 239822, "epoch": 1982} {"train_loss": -41.02204895019531, "global_step": 239823, "epoch": 1982} {"train_loss": -41.92084884643555, "global_step": 239824, "epoch": 1982} {"train_loss": -41.728309631347656, "global_step": 239825, "epoch": 1982} {"train_loss": -42.017982482910156, "global_step": 239826, "epoch": 1982} {"train_loss": -41.827091217041016, "global_step": 239827, "epoch": 1982} {"train_loss": -41.86361312866211, "global_step": 239828, "epoch": 1982} {"train_loss": -42.393089294433594, "global_step": 239829, "epoch": 1982} {"train_loss": -42.47372055053711, "global_step": 239830, "epoch": 1982} {"train_loss": -41.81374740600586, "global_step": 239831, "epoch": 1982} {"train_loss": -41.378623962402344, "global_step": 239832, "epoch": 1982} {"train_loss": -41.867408752441406, "global_step": 239833, "epoch": 1982} {"train_loss": -42.99519729614258, "global_step": 239834, "epoch": 1982} {"train_loss": -42.18449783325195, "global_step": 239835, "epoch": 1982} {"train_loss": -42.64761734008789, "global_step": 239836, "epoch": 1982} {"train_loss": -42.75031280517578, "global_step": 239837, "epoch": 1982} {"train_loss": -42.5118408203125, "global_step": 239838, "epoch": 1982} {"train_loss": -42.53199005126953, "global_step": 239839, "epoch": 1982} {"train_loss": -42.90843963623047, "global_step": 239840, "epoch": 1982} {"train_loss": -42.39142990112305, "global_step": 239841, "epoch": 1982} {"train_loss": -42.06895065307617, "global_step": 239842, "epoch": 1982} {"train_loss": -42.71998596191406, "global_step": 239843, "epoch": 1982} {"train_loss": -42.382930755615234, "global_step": 239844, "epoch": 1982} {"train_loss": -42.066585540771484, "global_step": 239845, "epoch": 1982} {"train_loss": -43.00825881958008, "global_step": 239846, "epoch": 1982} {"train_loss": -42.52516174316406, "global_step": 239847, "epoch": 1982} {"train_loss": -43.10171890258789, "global_step": 239848, "epoch": 1982} {"train_loss": -43.258392333984375, "global_step": 239849, "epoch": 1982} {"train_loss": -41.63503646850586, "global_step": 239850, "epoch": 1982} {"train_loss": -42.8634147644043, "global_step": 239851, "epoch": 1982} {"train_loss": -43.26675033569336, "global_step": 239852, "epoch": 1982} {"train_loss": -43.10498809814453, "global_step": 239853, "epoch": 1982} {"train_loss": -43.6959342956543, "global_step": 239854, "epoch": 1982} {"train_loss": -42.45413589477539, "global_step": 239855, "epoch": 1982} {"train_loss": -43.27120590209961, "global_step": 239856, "epoch": 1982} {"train_loss": -43.3053092956543, "global_step": 239857, "epoch": 1982} {"train_loss": -42.55440139770508, "global_step": 239858, "epoch": 1982} {"train_loss": -42.858787536621094, "global_step": 239859, "epoch": 1982} {"train_loss": -43.617958068847656, "global_step": 239860, "epoch": 1982} {"train_loss": -43.344295501708984, "global_step": 239861, "epoch": 1982} {"train_loss": -43.096099853515625, "global_step": 239862, "epoch": 1982} {"train_loss": -43.4920539855957, "global_step": 239863, "epoch": 1982} {"train_loss": -43.85879898071289, "global_step": 239864, "epoch": 1982} {"train_loss": -42.94126892089844, "global_step": 239865, "epoch": 1982} {"train_loss": -42.90742492675781, "global_step": 239866, "epoch": 1982} {"train_loss": -43.70585250854492, "global_step": 239867, "epoch": 1982} {"train_loss": -43.285396575927734, "global_step": 239868, "epoch": 1982} {"train_loss": -43.301239013671875, "global_step": 239869, "epoch": 1982} {"train_loss": -42.93327713012695, "global_step": 239870, "epoch": 1982} {"train_loss": -43.072811126708984, "global_step": 239871, "epoch": 1982} {"train_loss": -43.563079833984375, "global_step": 239872, "epoch": 1982} {"train_loss": -43.5262565612793, "global_step": 239873, "epoch": 1982} {"train_loss": -43.65346145629883, "global_step": 239874, "epoch": 1982} {"train_loss": -43.653114318847656, "global_step": 239875, "epoch": 1982} {"train_loss": -44.028114318847656, "global_step": 239876, "epoch": 1982} {"train_loss": -43.89980697631836, "global_step": 239877, "epoch": 1982} {"train_loss": -43.26504898071289, "global_step": 239878, "epoch": 1982} {"train_loss": -43.28807067871094, "global_step": 239879, "epoch": 1982} {"train_loss": -43.515289306640625, "global_step": 239880, "epoch": 1982} {"train_loss": -43.9465446472168, "global_step": 239881, "epoch": 1982} {"train_loss": -44.0915412902832, "global_step": 239882, "epoch": 1982} {"train_loss": -43.840087890625, "global_step": 239883, "epoch": 1982} {"train_loss": -43.77204132080078, "global_step": 239884, "epoch": 1982} {"train_loss": -43.85670852661133, "global_step": 239885, "epoch": 1982} {"train_loss": -44.020687103271484, "global_step": 239886, "epoch": 1982} {"train_loss": -44.03326416015625, "global_step": 239887, "epoch": 1982} {"train_loss": -43.240901947021484, "global_step": 239888, "epoch": 1982} {"train_loss": -44.04642105102539, "global_step": 239889, "epoch": 1982} {"train_loss": -44.17482376098633, "global_step": 239890, "epoch": 1982} {"train_loss": -43.408958435058594, "global_step": 239891, "epoch": 1982} {"train_loss": -44.41366958618164, "global_step": 239892, "epoch": 1982} {"train_loss": -44.00471115112305, "global_step": 239893, "epoch": 1982} {"train_loss": -43.632110595703125, "global_step": 239894, "epoch": 1982} {"train_loss": -44.29914093017578, "global_step": 239895, "epoch": 1982} {"train_loss": -44.257911682128906, "global_step": 239896, "epoch": 1982} {"train_loss": -44.38252258300781, "global_step": 239897, "epoch": 1982} {"train_loss": -43.8285026550293, "global_step": 239898, "epoch": 1982} {"train_loss": -44.51025390625, "global_step": 239899, "epoch": 1982} {"train_loss": -43.857826232910156, "global_step": 239900, "epoch": 1982} {"train_loss": -44.21860122680664, "global_step": 239901, "epoch": 1982} {"train_loss": -43.65224838256836, "global_step": 239902, "epoch": 1982} {"train_loss": -44.885108947753906, "global_step": 239903, "epoch": 1982} {"train_loss": -44.385353088378906, "global_step": 239904, "epoch": 1982} {"train_loss": -44.2985725402832, "global_step": 239905, "epoch": 1982} {"train_loss": -43.66823959350586, "global_step": 239906, "epoch": 1982} {"train_loss": -40.35161209106445, "global_step": 239907, "epoch": 1982} {"train_loss": -39.21990966796875, "global_step": 239908, "epoch": 1982} {"train_loss": -37.0203857421875, "global_step": 239909, "epoch": 1982} {"train_loss": -43.91427230834961, "global_step": 239910, "epoch": 1982} {"train_loss": -40.95689010620117, "global_step": 239911, "epoch": 1982} {"train_loss": -35.845855712890625, "global_step": 239912, "epoch": 1982} {"train_loss": -33.96932601928711, "global_step": 239913, "epoch": 1982} {"train_loss": -31.194503784179688, "global_step": 239914, "epoch": 1982} {"train_loss": -34.79157638549805, "global_step": 239915, "epoch": 1982} {"train_loss": -33.647335052490234, "global_step": 239916, "epoch": 1982} {"train_loss": -35.250606536865234, "global_step": 239917, "epoch": 1982} {"train_loss": -33.53060531616211, "global_step": 239918, "epoch": 1982} {"train_loss": -35.2604866027832, "global_step": 239919, "epoch": 1982} {"train_loss": -33.46202087402344, "global_step": 239920, "epoch": 1982} {"train_loss": -35.53999710083008, "global_step": 239921, "epoch": 1982} {"train_loss": -36.731842041015625, "global_step": 239922, "epoch": 1982} {"train_loss": -35.46662139892578, "global_step": 239923, "epoch": 1982} {"train_loss": -36.517356872558594, "global_step": 239924, "epoch": 1982} {"train_loss": -35.58241653442383, "global_step": 239925, "epoch": 1982} {"train_loss": -34.41265106201172, "global_step": 239926, "epoch": 1982} {"train_loss": -37.859310150146484, "global_step": 239927, "epoch": 1982} {"train_loss": -37.07551574707031, "global_step": 239928, "epoch": 1982} {"train_loss": -36.8758659362793, "global_step": 239929, "epoch": 1982} {"train_loss": -37.63277816772461, "global_step": 239930, "epoch": 1982} {"train_loss": -36.970123291015625, "global_step": 239931, "epoch": 1982} {"train_loss": -37.44502639770508, "global_step": 239932, "epoch": 1982} {"train_loss": -37.65272903442383, "global_step": 239933, "epoch": 1982} {"train_loss": -37.869232177734375, "global_step": 239934, "epoch": 1982} {"train_loss": -38.947017669677734, "global_step": 239935, "epoch": 1982} {"train_loss": -39.166786193847656, "global_step": 239936, "epoch": 1982} {"train_loss": -39.17951202392578, "global_step": 239937, "epoch": 1982} {"train_loss": -39.31040573120117, "global_step": 239938, "epoch": 1982} {"train_loss": -40.39319610595703, "global_step": 239939, "epoch": 1982} {"train_loss": -39.166202545166016, "global_step": 239940, "epoch": 1982} {"train_loss": -41.576656341552734, "global_step": 239941, "epoch": 1982} {"train_loss": -41.39394930374524, "global_step": 239942, "epoch": 1982, "val_loss": 2689962.25} {"train_loss": -39.995479583740234, "global_step": 239943, "epoch": 1983} {"train_loss": -39.77640914916992, "global_step": 239944, "epoch": 1983} {"train_loss": -40.233245849609375, "global_step": 239945, "epoch": 1983} {"train_loss": -39.297607421875, "global_step": 239946, "epoch": 1983} {"train_loss": -40.488067626953125, "global_step": 239947, "epoch": 1983} {"train_loss": -40.110713958740234, "global_step": 239948, "epoch": 1983} {"train_loss": -40.7519645690918, "global_step": 239949, "epoch": 1983} {"train_loss": -40.331886291503906, "global_step": 239950, "epoch": 1983} {"train_loss": -41.12291717529297, "global_step": 239951, "epoch": 1983} {"train_loss": -40.18221664428711, "global_step": 239952, "epoch": 1983} {"train_loss": -40.453975677490234, "global_step": 239953, "epoch": 1983} {"train_loss": -40.90033721923828, "global_step": 239954, "epoch": 1983} {"train_loss": -40.55765914916992, "global_step": 239955, "epoch": 1983} {"train_loss": -42.143733978271484, "global_step": 239956, "epoch": 1983} {"train_loss": -38.22471237182617, "global_step": 239957, "epoch": 1983} {"train_loss": -41.01646041870117, "global_step": 239958, "epoch": 1983} {"train_loss": -41.809513092041016, "global_step": 239959, "epoch": 1983} {"train_loss": -41.775508880615234, "global_step": 239960, "epoch": 1983} {"train_loss": -41.921966552734375, "global_step": 239961, "epoch": 1983} {"train_loss": -42.178077697753906, "global_step": 239962, "epoch": 1983} {"train_loss": -41.65997314453125, "global_step": 239963, "epoch": 1983} {"train_loss": -40.51755905151367, "global_step": 239964, "epoch": 1983} {"train_loss": -41.198421478271484, "global_step": 239965, "epoch": 1983} {"train_loss": -42.513519287109375, "global_step": 239966, "epoch": 1983} {"train_loss": -41.1866569519043, "global_step": 239967, "epoch": 1983} {"train_loss": -40.35600662231445, "global_step": 239968, "epoch": 1983} {"train_loss": -42.369380950927734, "global_step": 239969, "epoch": 1983} {"train_loss": -42.46211624145508, "global_step": 239970, "epoch": 1983} {"train_loss": -41.72986602783203, "global_step": 239971, "epoch": 1983} {"train_loss": -42.925209045410156, "global_step": 239972, "epoch": 1983} {"train_loss": -42.07524871826172, "global_step": 239973, "epoch": 1983} {"train_loss": -41.816165924072266, "global_step": 239974, "epoch": 1983} {"train_loss": -41.06031036376953, "global_step": 239975, "epoch": 1983} {"train_loss": -43.05916213989258, "global_step": 239976, "epoch": 1983} {"train_loss": -42.62438201904297, "global_step": 239977, "epoch": 1983} {"train_loss": -43.04511260986328, "global_step": 239978, "epoch": 1983} {"train_loss": -41.84925842285156, "global_step": 239979, "epoch": 1983} {"train_loss": -42.805782318115234, "global_step": 239980, "epoch": 1983} {"train_loss": -42.37281036376953, "global_step": 239981, "epoch": 1983} {"train_loss": -43.05162048339844, "global_step": 239982, "epoch": 1983} {"train_loss": -42.86955642700195, "global_step": 239983, "epoch": 1983} {"train_loss": -42.95594024658203, "global_step": 239984, "epoch": 1983} {"train_loss": -42.35539627075195, "global_step": 239985, "epoch": 1983} {"train_loss": -41.60466384887695, "global_step": 239986, "epoch": 1983} {"train_loss": -43.007869720458984, "global_step": 239987, "epoch": 1983} {"train_loss": -42.379371643066406, "global_step": 239988, "epoch": 1983} {"train_loss": -41.98789978027344, "global_step": 239989, "epoch": 1983} {"train_loss": -43.374114990234375, "global_step": 239990, "epoch": 1983} {"train_loss": -42.786190032958984, "global_step": 239991, "epoch": 1983} {"train_loss": -42.1311149597168, "global_step": 239992, "epoch": 1983} {"train_loss": -43.27560806274414, "global_step": 239993, "epoch": 1983} {"train_loss": -42.5750732421875, "global_step": 239994, "epoch": 1983} {"train_loss": -42.735755920410156, "global_step": 239995, "epoch": 1983} {"train_loss": -42.90757751464844, "global_step": 239996, "epoch": 1983} {"train_loss": -42.4449348449707, "global_step": 239997, "epoch": 1983} {"train_loss": -41.708648681640625, "global_step": 239998, "epoch": 1983} {"train_loss": -42.10726547241211, "global_step": 239999, "epoch": 1983} {"train_loss": -43.162872314453125, "global_step": 240000, "epoch": 1983} {"train_loss": -43.38446807861328, "global_step": 240001, "epoch": 1983} {"train_loss": -42.80570983886719, "global_step": 240002, "epoch": 1983} {"train_loss": -43.200984954833984, "global_step": 240003, "epoch": 1983} {"train_loss": -42.388668060302734, "global_step": 240004, "epoch": 1983} {"train_loss": -43.08849334716797, "global_step": 240005, "epoch": 1983} {"train_loss": -43.2845344543457, "global_step": 240006, "epoch": 1983} {"train_loss": -42.43616485595703, "global_step": 240007, "epoch": 1983} {"train_loss": -43.658485412597656, "global_step": 240008, "epoch": 1983} {"train_loss": -43.24274826049805, "global_step": 240009, "epoch": 1983} {"train_loss": -42.81177520751953, "global_step": 240010, "epoch": 1983} {"train_loss": -43.197914123535156, "global_step": 240011, "epoch": 1983} {"train_loss": -43.27976608276367, "global_step": 240012, "epoch": 1983} {"train_loss": -43.41347885131836, "global_step": 240013, "epoch": 1983} {"train_loss": -43.470542907714844, "global_step": 240014, "epoch": 1983} {"train_loss": -43.153804779052734, "global_step": 240015, "epoch": 1983} {"train_loss": -43.33590316772461, "global_step": 240016, "epoch": 1983} {"train_loss": -42.207454681396484, "global_step": 240017, "epoch": 1983} {"train_loss": -42.57221221923828, "global_step": 240018, "epoch": 1983} {"train_loss": -43.22406768798828, "global_step": 240019, "epoch": 1983} {"train_loss": -43.556419372558594, "global_step": 240020, "epoch": 1983} {"train_loss": -43.42508316040039, "global_step": 240021, "epoch": 1983} {"train_loss": -42.72949981689453, "global_step": 240022, "epoch": 1983} {"train_loss": -40.63370895385742, "global_step": 240023, "epoch": 1983} {"train_loss": -40.55555725097656, "global_step": 240024, "epoch": 1983} {"train_loss": -41.863346099853516, "global_step": 240025, "epoch": 1983} {"train_loss": -40.7846794128418, "global_step": 240026, "epoch": 1983} {"train_loss": -39.513614654541016, "global_step": 240027, "epoch": 1983} {"train_loss": -38.89104080200195, "global_step": 240028, "epoch": 1983} {"train_loss": -39.819549560546875, "global_step": 240029, "epoch": 1983} {"train_loss": -39.579376220703125, "global_step": 240030, "epoch": 1983} {"train_loss": -40.09657669067383, "global_step": 240031, "epoch": 1983} {"train_loss": -39.67007064819336, "global_step": 240032, "epoch": 1983} {"train_loss": -40.94636154174805, "global_step": 240033, "epoch": 1983} {"train_loss": -40.70454025268555, "global_step": 240034, "epoch": 1983} {"train_loss": -40.12335205078125, "global_step": 240035, "epoch": 1983} {"train_loss": -40.315330505371094, "global_step": 240036, "epoch": 1983} {"train_loss": -40.4587287902832, "global_step": 240037, "epoch": 1983} {"train_loss": -41.21828079223633, "global_step": 240038, "epoch": 1983} {"train_loss": -41.416927337646484, "global_step": 240039, "epoch": 1983} {"train_loss": -41.863407135009766, "global_step": 240040, "epoch": 1983} {"train_loss": -40.4720573425293, "global_step": 240041, "epoch": 1983} {"train_loss": -41.03766632080078, "global_step": 240042, "epoch": 1983} {"train_loss": -41.907752990722656, "global_step": 240043, "epoch": 1983} {"train_loss": -41.84858322143555, "global_step": 240044, "epoch": 1983} {"train_loss": -42.21694564819336, "global_step": 240045, "epoch": 1983} {"train_loss": -41.2363395690918, "global_step": 240046, "epoch": 1983} {"train_loss": -42.4962158203125, "global_step": 240047, "epoch": 1983} {"train_loss": -41.34859848022461, "global_step": 240048, "epoch": 1983} {"train_loss": -42.43212890625, "global_step": 240049, "epoch": 1983} {"train_loss": -42.368408203125, "global_step": 240050, "epoch": 1983} {"train_loss": -42.54573440551758, "global_step": 240051, "epoch": 1983} {"train_loss": -42.61804962158203, "global_step": 240052, "epoch": 1983} {"train_loss": -42.49991226196289, "global_step": 240053, "epoch": 1983} {"train_loss": -42.44602966308594, "global_step": 240054, "epoch": 1983} {"train_loss": -42.64188766479492, "global_step": 240055, "epoch": 1983} {"train_loss": -43.30282211303711, "global_step": 240056, "epoch": 1983} {"train_loss": -42.93739318847656, "global_step": 240057, "epoch": 1983} {"train_loss": -42.286766052246094, "global_step": 240058, "epoch": 1983} {"train_loss": -42.758785247802734, "global_step": 240059, "epoch": 1983} {"train_loss": -42.3153076171875, "global_step": 240060, "epoch": 1983} {"train_loss": -41.68348693847656, "global_step": 240061, "epoch": 1983} {"train_loss": -42.51108932495117, "global_step": 240062, "epoch": 1983} {"train_loss": -41.866195899395905, "global_step": 240063, "epoch": 1983, "val_loss": 2538270.25} {"train_loss": -41.51078414916992, "global_step": 240064, "epoch": 1984} {"train_loss": -42.06222152709961, "global_step": 240065, "epoch": 1984} {"train_loss": -42.175048828125, "global_step": 240066, "epoch": 1984} {"train_loss": -42.03792953491211, "global_step": 240067, "epoch": 1984} {"train_loss": -41.96259689331055, "global_step": 240068, "epoch": 1984} {"train_loss": -42.28948974609375, "global_step": 240069, "epoch": 1984} {"train_loss": -41.45260238647461, "global_step": 240070, "epoch": 1984} {"train_loss": -42.6780891418457, "global_step": 240071, "epoch": 1984} {"train_loss": -42.53044891357422, "global_step": 240072, "epoch": 1984} {"train_loss": -42.45634078979492, "global_step": 240073, "epoch": 1984} {"train_loss": -42.38510513305664, "global_step": 240074, "epoch": 1984} {"train_loss": -41.44343566894531, "global_step": 240075, "epoch": 1984} {"train_loss": -42.96328353881836, "global_step": 240076, "epoch": 1984} {"train_loss": -41.98246383666992, "global_step": 240077, "epoch": 1984} {"train_loss": -42.7817497253418, "global_step": 240078, "epoch": 1984} {"train_loss": -43.136959075927734, "global_step": 240079, "epoch": 1984} {"train_loss": -42.58124923706055, "global_step": 240080, "epoch": 1984} {"train_loss": -42.80778503417969, "global_step": 240081, "epoch": 1984} {"train_loss": -42.621280670166016, "global_step": 240082, "epoch": 1984} {"train_loss": -43.20671844482422, "global_step": 240083, "epoch": 1984} {"train_loss": -42.67094039916992, "global_step": 240084, "epoch": 1984} {"train_loss": -43.20442199707031, "global_step": 240085, "epoch": 1984} {"train_loss": -42.98994445800781, "global_step": 240086, "epoch": 1984} {"train_loss": -43.5031623840332, "global_step": 240087, "epoch": 1984} {"train_loss": -43.27181625366211, "global_step": 240088, "epoch": 1984} {"train_loss": -43.20893096923828, "global_step": 240089, "epoch": 1984} {"train_loss": -43.318965911865234, "global_step": 240090, "epoch": 1984} {"train_loss": -43.62675094604492, "global_step": 240091, "epoch": 1984} {"train_loss": -43.167320251464844, "global_step": 240092, "epoch": 1984} {"train_loss": -43.65786361694336, "global_step": 240093, "epoch": 1984} {"train_loss": -43.38824462890625, "global_step": 240094, "epoch": 1984} {"train_loss": -43.57973098754883, "global_step": 240095, "epoch": 1984} {"train_loss": -43.08026885986328, "global_step": 240096, "epoch": 1984} {"train_loss": -42.69926452636719, "global_step": 240097, "epoch": 1984} {"train_loss": -41.17633819580078, "global_step": 240098, "epoch": 1984} {"train_loss": -42.049564361572266, "global_step": 240099, "epoch": 1984} {"train_loss": -43.04194641113281, "global_step": 240100, "epoch": 1984} {"train_loss": -42.558895111083984, "global_step": 240101, "epoch": 1984} {"train_loss": -43.24860382080078, "global_step": 240102, "epoch": 1984} {"train_loss": -43.26582717895508, "global_step": 240103, "epoch": 1984} {"train_loss": -43.911964416503906, "global_step": 240104, "epoch": 1984} {"train_loss": -41.949195861816406, "global_step": 240105, "epoch": 1984} {"train_loss": -43.06667709350586, "global_step": 240106, "epoch": 1984} {"train_loss": -43.687652587890625, "global_step": 240107, "epoch": 1984} {"train_loss": -43.550148010253906, "global_step": 240108, "epoch": 1984} {"train_loss": -42.77926254272461, "global_step": 240109, "epoch": 1984} {"train_loss": -43.115848541259766, "global_step": 240110, "epoch": 1984} {"train_loss": -43.175716400146484, "global_step": 240111, "epoch": 1984} {"train_loss": -43.59617614746094, "global_step": 240112, "epoch": 1984} {"train_loss": -42.95595932006836, "global_step": 240113, "epoch": 1984} {"train_loss": -43.60158157348633, "global_step": 240114, "epoch": 1984} {"train_loss": -43.636207580566406, "global_step": 240115, "epoch": 1984} {"train_loss": -42.78096389770508, "global_step": 240116, "epoch": 1984} {"train_loss": -43.41654586791992, "global_step": 240117, "epoch": 1984} {"train_loss": -43.682098388671875, "global_step": 240118, "epoch": 1984} {"train_loss": -43.3754997253418, "global_step": 240119, "epoch": 1984} {"train_loss": -43.654273986816406, "global_step": 240120, "epoch": 1984} {"train_loss": -42.699825286865234, "global_step": 240121, "epoch": 1984} {"train_loss": -43.549808502197266, "global_step": 240122, "epoch": 1984} {"train_loss": -43.89802169799805, "global_step": 240123, "epoch": 1984} {"train_loss": -42.947574615478516, "global_step": 240124, "epoch": 1984} {"train_loss": -43.0512809753418, "global_step": 240125, "epoch": 1984} {"train_loss": -42.9062614440918, "global_step": 240126, "epoch": 1984} {"train_loss": -42.70022964477539, "global_step": 240127, "epoch": 1984} {"train_loss": -42.85190963745117, "global_step": 240128, "epoch": 1984} {"train_loss": -43.38252258300781, "global_step": 240129, "epoch": 1984} {"train_loss": -44.15770721435547, "global_step": 240130, "epoch": 1984} {"train_loss": -42.04403305053711, "global_step": 240131, "epoch": 1984} {"train_loss": -41.93727493286133, "global_step": 240132, "epoch": 1984} {"train_loss": -42.816402435302734, "global_step": 240133, "epoch": 1984} {"train_loss": -43.29385757446289, "global_step": 240134, "epoch": 1984} {"train_loss": -41.89421081542969, "global_step": 240135, "epoch": 1984} {"train_loss": -43.102691650390625, "global_step": 240136, "epoch": 1984} {"train_loss": -41.58140182495117, "global_step": 240137, "epoch": 1984} {"train_loss": -42.45212936401367, "global_step": 240138, "epoch": 1984} {"train_loss": -42.956851959228516, "global_step": 240139, "epoch": 1984} {"train_loss": -43.87800216674805, "global_step": 240140, "epoch": 1984} {"train_loss": -42.67142868041992, "global_step": 240141, "epoch": 1984} {"train_loss": -42.21627426147461, "global_step": 240142, "epoch": 1984} {"train_loss": -42.96692657470703, "global_step": 240143, "epoch": 1984} {"train_loss": -43.22170639038086, "global_step": 240144, "epoch": 1984} {"train_loss": -42.49134826660156, "global_step": 240145, "epoch": 1984} {"train_loss": -42.082489013671875, "global_step": 240146, "epoch": 1984} {"train_loss": -42.87176513671875, "global_step": 240147, "epoch": 1984} {"train_loss": -42.092254638671875, "global_step": 240148, "epoch": 1984} {"train_loss": -43.21222686767578, "global_step": 240149, "epoch": 1984} {"train_loss": -41.43708419799805, "global_step": 240150, "epoch": 1984} {"train_loss": -42.86427688598633, "global_step": 240151, "epoch": 1984} {"train_loss": -42.544830322265625, "global_step": 240152, "epoch": 1984} {"train_loss": -41.966712951660156, "global_step": 240153, "epoch": 1984} {"train_loss": -41.189945220947266, "global_step": 240154, "epoch": 1984} {"train_loss": -41.625301361083984, "global_step": 240155, "epoch": 1984} {"train_loss": -41.273067474365234, "global_step": 240156, "epoch": 1984} {"train_loss": -40.90586853027344, "global_step": 240157, "epoch": 1984} {"train_loss": -41.17324447631836, "global_step": 240158, "epoch": 1984} {"train_loss": -42.90719223022461, "global_step": 240159, "epoch": 1984} {"train_loss": -43.00422668457031, "global_step": 240160, "epoch": 1984} {"train_loss": -41.1787109375, "global_step": 240161, "epoch": 1984} {"train_loss": -42.008480072021484, "global_step": 240162, "epoch": 1984} {"train_loss": -41.81797409057617, "global_step": 240163, "epoch": 1984} {"train_loss": -39.17678451538086, "global_step": 240164, "epoch": 1984} {"train_loss": -41.617515563964844, "global_step": 240165, "epoch": 1984} {"train_loss": -41.10691452026367, "global_step": 240166, "epoch": 1984} {"train_loss": -41.693538665771484, "global_step": 240167, "epoch": 1984} {"train_loss": -41.22287368774414, "global_step": 240168, "epoch": 1984} {"train_loss": -40.541961669921875, "global_step": 240169, "epoch": 1984} {"train_loss": -39.2811164855957, "global_step": 240170, "epoch": 1984} {"train_loss": -40.418460845947266, "global_step": 240171, "epoch": 1984} {"train_loss": -41.958797454833984, "global_step": 240172, "epoch": 1984} {"train_loss": -40.7884521484375, "global_step": 240173, "epoch": 1984} {"train_loss": -42.20905685424805, "global_step": 240174, "epoch": 1984} {"train_loss": -41.880409240722656, "global_step": 240175, "epoch": 1984} {"train_loss": -41.133949279785156, "global_step": 240176, "epoch": 1984} {"train_loss": -41.43284606933594, "global_step": 240177, "epoch": 1984} {"train_loss": -41.774269104003906, "global_step": 240178, "epoch": 1984} {"train_loss": -35.217525482177734, "global_step": 240179, "epoch": 1984} {"train_loss": -41.1256103515625, "global_step": 240180, "epoch": 1984} {"train_loss": -41.47745132446289, "global_step": 240181, "epoch": 1984} {"train_loss": -40.26066589355469, "global_step": 240182, "epoch": 1984} {"train_loss": -41.23286056518555, "global_step": 240183, "epoch": 1984} {"train_loss": -42.37416577930293, "global_step": 240184, "epoch": 1984, "val_loss": 2586262.5} {"train_loss": -39.966793060302734, "global_step": 240185, "epoch": 1985} {"train_loss": -42.25547409057617, "global_step": 240186, "epoch": 1985} {"train_loss": -38.1313362121582, "global_step": 240187, "epoch": 1985} {"train_loss": -40.170284271240234, "global_step": 240188, "epoch": 1985} {"train_loss": -40.69355010986328, "global_step": 240189, "epoch": 1985} {"train_loss": -38.636959075927734, "global_step": 240190, "epoch": 1985} {"train_loss": -42.814117431640625, "global_step": 240191, "epoch": 1985} {"train_loss": -39.30389404296875, "global_step": 240192, "epoch": 1985} {"train_loss": -42.223731994628906, "global_step": 240193, "epoch": 1985} {"train_loss": -40.93491744995117, "global_step": 240194, "epoch": 1985} {"train_loss": -40.302547454833984, "global_step": 240195, "epoch": 1985} {"train_loss": -42.581932067871094, "global_step": 240196, "epoch": 1985} {"train_loss": -39.14997482299805, "global_step": 240197, "epoch": 1985} {"train_loss": -41.437782287597656, "global_step": 240198, "epoch": 1985} {"train_loss": -41.066375732421875, "global_step": 240199, "epoch": 1985} {"train_loss": -41.560482025146484, "global_step": 240200, "epoch": 1985} {"train_loss": -41.43502426147461, "global_step": 240201, "epoch": 1985} {"train_loss": -40.70028305053711, "global_step": 240202, "epoch": 1985} {"train_loss": -42.04433059692383, "global_step": 240203, "epoch": 1985} {"train_loss": -41.1136589050293, "global_step": 240204, "epoch": 1985} {"train_loss": -42.04912185668945, "global_step": 240205, "epoch": 1985} {"train_loss": -42.43365478515625, "global_step": 240206, "epoch": 1985} {"train_loss": -42.47914123535156, "global_step": 240207, "epoch": 1985} {"train_loss": -42.280494689941406, "global_step": 240208, "epoch": 1985} {"train_loss": -41.13426208496094, "global_step": 240209, "epoch": 1985} {"train_loss": -42.81228256225586, "global_step": 240210, "epoch": 1985} {"train_loss": -39.47636032104492, "global_step": 240211, "epoch": 1985} {"train_loss": -42.523712158203125, "global_step": 240212, "epoch": 1985} {"train_loss": -42.44324493408203, "global_step": 240213, "epoch": 1985} {"train_loss": -42.93315505981445, "global_step": 240214, "epoch": 1985} {"train_loss": -43.31306076049805, "global_step": 240215, "epoch": 1985} {"train_loss": -42.59174728393555, "global_step": 240216, "epoch": 1985} {"train_loss": -42.558624267578125, "global_step": 240217, "epoch": 1985} {"train_loss": -42.71527862548828, "global_step": 240218, "epoch": 1985} {"train_loss": -42.42036056518555, "global_step": 240219, "epoch": 1985} {"train_loss": -43.013362884521484, "global_step": 240220, "epoch": 1985} {"train_loss": -42.602760314941406, "global_step": 240221, "epoch": 1985} {"train_loss": -43.12392044067383, "global_step": 240222, "epoch": 1985} {"train_loss": -43.22495651245117, "global_step": 240223, "epoch": 1985} {"train_loss": -43.01470184326172, "global_step": 240224, "epoch": 1985} {"train_loss": -42.86017990112305, "global_step": 240225, "epoch": 1985} {"train_loss": -43.00362777709961, "global_step": 240226, "epoch": 1985} {"train_loss": -43.283180236816406, "global_step": 240227, "epoch": 1985} {"train_loss": -42.80601119995117, "global_step": 240228, "epoch": 1985} {"train_loss": -42.8697509765625, "global_step": 240229, "epoch": 1985} {"train_loss": -43.191749572753906, "global_step": 240230, "epoch": 1985} {"train_loss": -43.012977600097656, "global_step": 240231, "epoch": 1985} {"train_loss": -43.10308837890625, "global_step": 240232, "epoch": 1985} {"train_loss": -43.29254913330078, "global_step": 240233, "epoch": 1985} {"train_loss": -43.57543182373047, "global_step": 240234, "epoch": 1985} {"train_loss": -43.364532470703125, "global_step": 240235, "epoch": 1985} {"train_loss": -43.1640625, "global_step": 240236, "epoch": 1985} {"train_loss": -43.83019256591797, "global_step": 240237, "epoch": 1985} {"train_loss": -43.85012435913086, "global_step": 240238, "epoch": 1985} {"train_loss": -43.75301742553711, "global_step": 240239, "epoch": 1985} {"train_loss": -40.10125732421875, "global_step": 240240, "epoch": 1985} {"train_loss": -42.52634048461914, "global_step": 240241, "epoch": 1985} {"train_loss": -42.71073532104492, "global_step": 240242, "epoch": 1985} {"train_loss": -43.92561340332031, "global_step": 240243, "epoch": 1985} {"train_loss": -43.658199310302734, "global_step": 240244, "epoch": 1985} {"train_loss": -43.49606704711914, "global_step": 240245, "epoch": 1985} {"train_loss": -43.04314041137695, "global_step": 240246, "epoch": 1985} {"train_loss": -42.91225814819336, "global_step": 240247, "epoch": 1985} {"train_loss": -43.37469482421875, "global_step": 240248, "epoch": 1985} {"train_loss": -43.21796417236328, "global_step": 240249, "epoch": 1985} {"train_loss": -42.234554290771484, "global_step": 240250, "epoch": 1985} {"train_loss": -43.214839935302734, "global_step": 240251, "epoch": 1985} {"train_loss": -43.61353302001953, "global_step": 240252, "epoch": 1985} {"train_loss": -43.653778076171875, "global_step": 240253, "epoch": 1985} {"train_loss": -43.580020904541016, "global_step": 240254, "epoch": 1985} {"train_loss": -41.32794952392578, "global_step": 240255, "epoch": 1985} {"train_loss": -43.144691467285156, "global_step": 240256, "epoch": 1985} {"train_loss": -43.07291793823242, "global_step": 240257, "epoch": 1985} {"train_loss": -43.64711380004883, "global_step": 240258, "epoch": 1985} {"train_loss": -43.793697357177734, "global_step": 240259, "epoch": 1985} {"train_loss": -42.04008102416992, "global_step": 240260, "epoch": 1985} {"train_loss": -42.50959396362305, "global_step": 240261, "epoch": 1985} {"train_loss": -41.505123138427734, "global_step": 240262, "epoch": 1985} {"train_loss": -41.82106018066406, "global_step": 240263, "epoch": 1985} {"train_loss": -41.127803802490234, "global_step": 240264, "epoch": 1985} {"train_loss": -42.60757064819336, "global_step": 240265, "epoch": 1985} {"train_loss": -43.503028869628906, "global_step": 240266, "epoch": 1985} {"train_loss": -43.66669845581055, "global_step": 240267, "epoch": 1985} {"train_loss": -43.328731536865234, "global_step": 240268, "epoch": 1985} {"train_loss": -43.14091110229492, "global_step": 240269, "epoch": 1985} {"train_loss": -42.91352462768555, "global_step": 240270, "epoch": 1985} {"train_loss": -43.74492263793945, "global_step": 240271, "epoch": 1985} {"train_loss": -43.42559814453125, "global_step": 240272, "epoch": 1985} {"train_loss": -42.09213638305664, "global_step": 240273, "epoch": 1985} {"train_loss": -44.17165756225586, "global_step": 240274, "epoch": 1985} {"train_loss": -44.182796478271484, "global_step": 240275, "epoch": 1985} {"train_loss": -44.03229522705078, "global_step": 240276, "epoch": 1985} {"train_loss": -43.64552688598633, "global_step": 240277, "epoch": 1985} {"train_loss": -44.25083541870117, "global_step": 240278, "epoch": 1985} {"train_loss": -43.56535720825195, "global_step": 240279, "epoch": 1985} {"train_loss": -43.285057067871094, "global_step": 240280, "epoch": 1985} {"train_loss": -42.30619430541992, "global_step": 240281, "epoch": 1985} {"train_loss": -43.22819900512695, "global_step": 240282, "epoch": 1985} {"train_loss": -43.256771087646484, "global_step": 240283, "epoch": 1985} {"train_loss": -43.64168930053711, "global_step": 240284, "epoch": 1985} {"train_loss": -42.81565856933594, "global_step": 240285, "epoch": 1985} {"train_loss": -42.40797805786133, "global_step": 240286, "epoch": 1985} {"train_loss": -43.23493194580078, "global_step": 240287, "epoch": 1985} {"train_loss": -42.950965881347656, "global_step": 240288, "epoch": 1985} {"train_loss": -42.78030014038086, "global_step": 240289, "epoch": 1985} {"train_loss": -42.23384094238281, "global_step": 240290, "epoch": 1985} {"train_loss": -43.28341293334961, "global_step": 240291, "epoch": 1985} {"train_loss": -43.98360061645508, "global_step": 240292, "epoch": 1985} {"train_loss": -42.8103141784668, "global_step": 240293, "epoch": 1985} {"train_loss": -42.92408752441406, "global_step": 240294, "epoch": 1985} {"train_loss": -42.078041076660156, "global_step": 240295, "epoch": 1985} {"train_loss": -41.723690032958984, "global_step": 240296, "epoch": 1985} {"train_loss": -42.314327239990234, "global_step": 240297, "epoch": 1985} {"train_loss": -41.31951904296875, "global_step": 240298, "epoch": 1985} {"train_loss": -41.45573043823242, "global_step": 240299, "epoch": 1985} {"train_loss": -41.960723876953125, "global_step": 240300, "epoch": 1985} {"train_loss": -41.782527923583984, "global_step": 240301, "epoch": 1985} {"train_loss": -43.989410400390625, "global_step": 240302, "epoch": 1985} {"train_loss": -42.5594482421875, "global_step": 240303, "epoch": 1985} {"train_loss": -42.022377014160156, "global_step": 240304, "epoch": 1985} {"train_loss": -42.52673778061039, "global_step": 240305, "epoch": 1985, "val_loss": 2545521.25} {"train_loss": -42.580787658691406, "global_step": 240306, "epoch": 1986} {"train_loss": -43.35383987426758, "global_step": 240307, "epoch": 1986} {"train_loss": -43.41762924194336, "global_step": 240308, "epoch": 1986} {"train_loss": -43.52092361450195, "global_step": 240309, "epoch": 1986} {"train_loss": -43.005653381347656, "global_step": 240310, "epoch": 1986} {"train_loss": -43.485557556152344, "global_step": 240311, "epoch": 1986} {"train_loss": -43.06978988647461, "global_step": 240312, "epoch": 1986} {"train_loss": -42.871185302734375, "global_step": 240313, "epoch": 1986} {"train_loss": -42.1492805480957, "global_step": 240314, "epoch": 1986} {"train_loss": -43.49502182006836, "global_step": 240315, "epoch": 1986} {"train_loss": -42.72845458984375, "global_step": 240316, "epoch": 1986} {"train_loss": -42.33637237548828, "global_step": 240317, "epoch": 1986} {"train_loss": -43.58802795410156, "global_step": 240318, "epoch": 1986} {"train_loss": -43.6515007019043, "global_step": 240319, "epoch": 1986} {"train_loss": -43.12287521362305, "global_step": 240320, "epoch": 1986} {"train_loss": -42.434810638427734, "global_step": 240321, "epoch": 1986} {"train_loss": -42.19990921020508, "global_step": 240322, "epoch": 1986} {"train_loss": -42.55326461791992, "global_step": 240323, "epoch": 1986} {"train_loss": -43.01859664916992, "global_step": 240324, "epoch": 1986} {"train_loss": -42.86149978637695, "global_step": 240325, "epoch": 1986} {"train_loss": -42.89226150512695, "global_step": 240326, "epoch": 1986} {"train_loss": -41.94883346557617, "global_step": 240327, "epoch": 1986} {"train_loss": -42.743797302246094, "global_step": 240328, "epoch": 1986} {"train_loss": -42.85665512084961, "global_step": 240329, "epoch": 1986} {"train_loss": -42.698482513427734, "global_step": 240330, "epoch": 1986} {"train_loss": -41.68644714355469, "global_step": 240331, "epoch": 1986} {"train_loss": -41.872982025146484, "global_step": 240332, "epoch": 1986} {"train_loss": -42.777156829833984, "global_step": 240333, "epoch": 1986} {"train_loss": -42.817684173583984, "global_step": 240334, "epoch": 1986} {"train_loss": -41.93087387084961, "global_step": 240335, "epoch": 1986} {"train_loss": -41.36845779418945, "global_step": 240336, "epoch": 1986} {"train_loss": -42.14811706542969, "global_step": 240337, "epoch": 1986} {"train_loss": -42.13349533081055, "global_step": 240338, "epoch": 1986} {"train_loss": -41.11962890625, "global_step": 240339, "epoch": 1986} {"train_loss": -40.59352493286133, "global_step": 240340, "epoch": 1986} {"train_loss": -43.26527404785156, "global_step": 240341, "epoch": 1986} {"train_loss": -42.92316818237305, "global_step": 240342, "epoch": 1986} {"train_loss": -41.293922424316406, "global_step": 240343, "epoch": 1986} {"train_loss": -43.45659255981445, "global_step": 240344, "epoch": 1986} {"train_loss": -43.13330078125, "global_step": 240345, "epoch": 1986} {"train_loss": -42.50074005126953, "global_step": 240346, "epoch": 1986} {"train_loss": -42.356117248535156, "global_step": 240347, "epoch": 1986} {"train_loss": -41.91526412963867, "global_step": 240348, "epoch": 1986} {"train_loss": -42.97859573364258, "global_step": 240349, "epoch": 1986} {"train_loss": -42.84263229370117, "global_step": 240350, "epoch": 1986} {"train_loss": -42.45318603515625, "global_step": 240351, "epoch": 1986} {"train_loss": -43.75136947631836, "global_step": 240352, "epoch": 1986} {"train_loss": -42.640769958496094, "global_step": 240353, "epoch": 1986} {"train_loss": -42.96196365356445, "global_step": 240354, "epoch": 1986} {"train_loss": -43.48612594604492, "global_step": 240355, "epoch": 1986} {"train_loss": -41.93904113769531, "global_step": 240356, "epoch": 1986} {"train_loss": -41.66489791870117, "global_step": 240357, "epoch": 1986} {"train_loss": -43.04691696166992, "global_step": 240358, "epoch": 1986} {"train_loss": -43.19440460205078, "global_step": 240359, "epoch": 1986} {"train_loss": -42.383453369140625, "global_step": 240360, "epoch": 1986} {"train_loss": -42.58968734741211, "global_step": 240361, "epoch": 1986} {"train_loss": -43.3365364074707, "global_step": 240362, "epoch": 1986} {"train_loss": -43.136470794677734, "global_step": 240363, "epoch": 1986} {"train_loss": -43.02605438232422, "global_step": 240364, "epoch": 1986} {"train_loss": -43.52406692504883, "global_step": 240365, "epoch": 1986} {"train_loss": -43.27511215209961, "global_step": 240366, "epoch": 1986} {"train_loss": -42.751220703125, "global_step": 240367, "epoch": 1986} {"train_loss": -43.20335388183594, "global_step": 240368, "epoch": 1986} {"train_loss": -43.87249755859375, "global_step": 240369, "epoch": 1986} {"train_loss": -43.98495101928711, "global_step": 240370, "epoch": 1986} {"train_loss": -43.13264846801758, "global_step": 240371, "epoch": 1986} {"train_loss": -43.24149703979492, "global_step": 240372, "epoch": 1986} {"train_loss": -42.844696044921875, "global_step": 240373, "epoch": 1986} {"train_loss": -42.93758773803711, "global_step": 240374, "epoch": 1986} {"train_loss": -42.9169807434082, "global_step": 240375, "epoch": 1986} {"train_loss": -43.106441497802734, "global_step": 240376, "epoch": 1986} {"train_loss": -44.09047317504883, "global_step": 240377, "epoch": 1986} {"train_loss": -38.88307571411133, "global_step": 240378, "epoch": 1986} {"train_loss": -41.883052825927734, "global_step": 240379, "epoch": 1986} {"train_loss": -40.79876708984375, "global_step": 240380, "epoch": 1986} {"train_loss": -40.46091842651367, "global_step": 240381, "epoch": 1986} {"train_loss": -42.290313720703125, "global_step": 240382, "epoch": 1986} {"train_loss": -40.45596694946289, "global_step": 240383, "epoch": 1986} {"train_loss": -39.383155822753906, "global_step": 240384, "epoch": 1986} {"train_loss": -41.620452880859375, "global_step": 240385, "epoch": 1986} {"train_loss": -40.35148239135742, "global_step": 240386, "epoch": 1986} {"train_loss": -39.25811767578125, "global_step": 240387, "epoch": 1986} {"train_loss": -41.580902099609375, "global_step": 240388, "epoch": 1986} {"train_loss": -38.70425033569336, "global_step": 240389, "epoch": 1986} {"train_loss": -40.18436813354492, "global_step": 240390, "epoch": 1986} {"train_loss": -41.67378616333008, "global_step": 240391, "epoch": 1986} {"train_loss": -40.5679931640625, "global_step": 240392, "epoch": 1986} {"train_loss": -42.042720794677734, "global_step": 240393, "epoch": 1986} {"train_loss": -41.691253662109375, "global_step": 240394, "epoch": 1986} {"train_loss": -41.59100341796875, "global_step": 240395, "epoch": 1986} {"train_loss": -41.20116424560547, "global_step": 240396, "epoch": 1986} {"train_loss": -40.990726470947266, "global_step": 240397, "epoch": 1986} {"train_loss": -43.01808547973633, "global_step": 240398, "epoch": 1986} {"train_loss": -41.199684143066406, "global_step": 240399, "epoch": 1986} {"train_loss": -41.278682708740234, "global_step": 240400, "epoch": 1986} {"train_loss": -41.764766693115234, "global_step": 240401, "epoch": 1986} {"train_loss": -42.00018310546875, "global_step": 240402, "epoch": 1986} {"train_loss": -41.67798614501953, "global_step": 240403, "epoch": 1986} {"train_loss": -40.3674430847168, "global_step": 240404, "epoch": 1986} {"train_loss": -41.6640510559082, "global_step": 240405, "epoch": 1986} {"train_loss": -41.7931022644043, "global_step": 240406, "epoch": 1986} {"train_loss": -40.26480484008789, "global_step": 240407, "epoch": 1986} {"train_loss": -40.18679428100586, "global_step": 240408, "epoch": 1986} {"train_loss": -41.88674545288086, "global_step": 240409, "epoch": 1986} {"train_loss": -40.20119857788086, "global_step": 240410, "epoch": 1986} {"train_loss": -40.9197883605957, "global_step": 240411, "epoch": 1986} {"train_loss": -42.15264892578125, "global_step": 240412, "epoch": 1986} {"train_loss": -41.34126663208008, "global_step": 240413, "epoch": 1986} {"train_loss": -42.154232025146484, "global_step": 240414, "epoch": 1986} {"train_loss": -41.568092346191406, "global_step": 240415, "epoch": 1986} {"train_loss": -41.98952865600586, "global_step": 240416, "epoch": 1986} {"train_loss": -41.9975471496582, "global_step": 240417, "epoch": 1986} {"train_loss": -41.993499755859375, "global_step": 240418, "epoch": 1986} {"train_loss": -41.29266357421875, "global_step": 240419, "epoch": 1986} {"train_loss": -42.430633544921875, "global_step": 240420, "epoch": 1986} {"train_loss": -42.366065979003906, "global_step": 240421, "epoch": 1986} {"train_loss": -41.8563232421875, "global_step": 240422, "epoch": 1986} {"train_loss": -42.76716995239258, "global_step": 240423, "epoch": 1986} {"train_loss": -42.581024169921875, "global_step": 240424, "epoch": 1986} {"train_loss": -42.07188415527344, "global_step": 240425, "epoch": 1986} {"train_loss": -42.190225995276585, "global_step": 240426, "epoch": 1986, "val_loss": 2488807.0} {"train_loss": -42.6095085144043, "global_step": 240427, "epoch": 1987} {"train_loss": -42.91848373413086, "global_step": 240428, "epoch": 1987} {"train_loss": -42.464942932128906, "global_step": 240429, "epoch": 1987} {"train_loss": -43.00104522705078, "global_step": 240430, "epoch": 1987} {"train_loss": -42.928489685058594, "global_step": 240431, "epoch": 1987} {"train_loss": -42.19856643676758, "global_step": 240432, "epoch": 1987} {"train_loss": -43.20774459838867, "global_step": 240433, "epoch": 1987} {"train_loss": -43.37934494018555, "global_step": 240434, "epoch": 1987} {"train_loss": -42.93256378173828, "global_step": 240435, "epoch": 1987} {"train_loss": -43.21416091918945, "global_step": 240436, "epoch": 1987} {"train_loss": -42.717411041259766, "global_step": 240437, "epoch": 1987} {"train_loss": -42.620723724365234, "global_step": 240438, "epoch": 1987} {"train_loss": -42.50919723510742, "global_step": 240439, "epoch": 1987} {"train_loss": -42.076622009277344, "global_step": 240440, "epoch": 1987} {"train_loss": -42.75489044189453, "global_step": 240441, "epoch": 1987} {"train_loss": -43.13334274291992, "global_step": 240442, "epoch": 1987} {"train_loss": -43.106895446777344, "global_step": 240443, "epoch": 1987} {"train_loss": -42.66581726074219, "global_step": 240444, "epoch": 1987} {"train_loss": -44.01581573486328, "global_step": 240445, "epoch": 1987} {"train_loss": -43.103397369384766, "global_step": 240446, "epoch": 1987} {"train_loss": -43.39730453491211, "global_step": 240447, "epoch": 1987} {"train_loss": -43.3157844543457, "global_step": 240448, "epoch": 1987} {"train_loss": -42.979427337646484, "global_step": 240449, "epoch": 1987} {"train_loss": -41.4869270324707, "global_step": 240450, "epoch": 1987} {"train_loss": -42.24345016479492, "global_step": 240451, "epoch": 1987} {"train_loss": -43.38751983642578, "global_step": 240452, "epoch": 1987} {"train_loss": -42.45375442504883, "global_step": 240453, "epoch": 1987} {"train_loss": -42.39695358276367, "global_step": 240454, "epoch": 1987} {"train_loss": -43.30373001098633, "global_step": 240455, "epoch": 1987} {"train_loss": -43.0860710144043, "global_step": 240456, "epoch": 1987} {"train_loss": -42.640865325927734, "global_step": 240457, "epoch": 1987} {"train_loss": -43.47646713256836, "global_step": 240458, "epoch": 1987} {"train_loss": -43.49921798706055, "global_step": 240459, "epoch": 1987} {"train_loss": -42.903953552246094, "global_step": 240460, "epoch": 1987} {"train_loss": -41.7376594543457, "global_step": 240461, "epoch": 1987} {"train_loss": -43.460540771484375, "global_step": 240462, "epoch": 1987} {"train_loss": -42.76134490966797, "global_step": 240463, "epoch": 1987} {"train_loss": -42.45551300048828, "global_step": 240464, "epoch": 1987} {"train_loss": -43.155067443847656, "global_step": 240465, "epoch": 1987} {"train_loss": -43.300079345703125, "global_step": 240466, "epoch": 1987} {"train_loss": -42.80058670043945, "global_step": 240467, "epoch": 1987} {"train_loss": -42.442378997802734, "global_step": 240468, "epoch": 1987} {"train_loss": -43.139827728271484, "global_step": 240469, "epoch": 1987} {"train_loss": -43.068084716796875, "global_step": 240470, "epoch": 1987} {"train_loss": -42.85840606689453, "global_step": 240471, "epoch": 1987} {"train_loss": -43.34652328491211, "global_step": 240472, "epoch": 1987} {"train_loss": -43.4697265625, "global_step": 240473, "epoch": 1987} {"train_loss": -42.39764404296875, "global_step": 240474, "epoch": 1987} {"train_loss": -42.874691009521484, "global_step": 240475, "epoch": 1987} {"train_loss": -43.04193115234375, "global_step": 240476, "epoch": 1987} {"train_loss": -41.45168685913086, "global_step": 240477, "epoch": 1987} {"train_loss": -43.721248626708984, "global_step": 240478, "epoch": 1987} {"train_loss": -43.00175094604492, "global_step": 240479, "epoch": 1987} {"train_loss": -42.746944427490234, "global_step": 240480, "epoch": 1987} {"train_loss": -42.88688278198242, "global_step": 240481, "epoch": 1987} {"train_loss": -42.82381820678711, "global_step": 240482, "epoch": 1987} {"train_loss": -42.74428176879883, "global_step": 240483, "epoch": 1987} {"train_loss": -43.05518341064453, "global_step": 240484, "epoch": 1987} {"train_loss": -42.71913528442383, "global_step": 240485, "epoch": 1987} {"train_loss": -42.73647689819336, "global_step": 240486, "epoch": 1987} {"train_loss": -42.46138000488281, "global_step": 240487, "epoch": 1987} {"train_loss": -43.55506134033203, "global_step": 240488, "epoch": 1987} {"train_loss": -43.40338134765625, "global_step": 240489, "epoch": 1987} {"train_loss": -42.95003890991211, "global_step": 240490, "epoch": 1987} {"train_loss": -42.983978271484375, "global_step": 240491, "epoch": 1987} {"train_loss": -43.12662887573242, "global_step": 240492, "epoch": 1987} {"train_loss": -44.03786849975586, "global_step": 240493, "epoch": 1987} {"train_loss": -43.3390007019043, "global_step": 240494, "epoch": 1987} {"train_loss": -43.00944137573242, "global_step": 240495, "epoch": 1987} {"train_loss": -43.01752471923828, "global_step": 240496, "epoch": 1987} {"train_loss": -44.02460861206055, "global_step": 240497, "epoch": 1987} {"train_loss": -42.34416580200195, "global_step": 240498, "epoch": 1987} {"train_loss": -43.589839935302734, "global_step": 240499, "epoch": 1987} {"train_loss": -43.13743209838867, "global_step": 240500, "epoch": 1987} {"train_loss": -43.731075286865234, "global_step": 240501, "epoch": 1987} {"train_loss": -43.722015380859375, "global_step": 240502, "epoch": 1987} {"train_loss": -44.2894287109375, "global_step": 240503, "epoch": 1987} {"train_loss": -43.9406852722168, "global_step": 240504, "epoch": 1987} {"train_loss": -43.60833740234375, "global_step": 240505, "epoch": 1987} {"train_loss": -42.18253707885742, "global_step": 240506, "epoch": 1987} {"train_loss": -44.12152099609375, "global_step": 240507, "epoch": 1987} {"train_loss": -43.666751861572266, "global_step": 240508, "epoch": 1987} {"train_loss": -42.54692459106445, "global_step": 240509, "epoch": 1987} {"train_loss": -43.0351448059082, "global_step": 240510, "epoch": 1987} {"train_loss": -43.83277893066406, "global_step": 240511, "epoch": 1987} {"train_loss": -43.84877395629883, "global_step": 240512, "epoch": 1987} {"train_loss": -42.85289001464844, "global_step": 240513, "epoch": 1987} {"train_loss": -42.59619140625, "global_step": 240514, "epoch": 1987} {"train_loss": -43.14896774291992, "global_step": 240515, "epoch": 1987} {"train_loss": -43.704769134521484, "global_step": 240516, "epoch": 1987} {"train_loss": -44.304386138916016, "global_step": 240517, "epoch": 1987} {"train_loss": -43.39652633666992, "global_step": 240518, "epoch": 1987} {"train_loss": -43.35067367553711, "global_step": 240519, "epoch": 1987} {"train_loss": -43.40493392944336, "global_step": 240520, "epoch": 1987} {"train_loss": -41.957496643066406, "global_step": 240521, "epoch": 1987} {"train_loss": -41.0218391418457, "global_step": 240522, "epoch": 1987} {"train_loss": -40.11311340332031, "global_step": 240523, "epoch": 1987} {"train_loss": -41.02627182006836, "global_step": 240524, "epoch": 1987} {"train_loss": -40.1800422668457, "global_step": 240525, "epoch": 1987} {"train_loss": -38.92206573486328, "global_step": 240526, "epoch": 1987} {"train_loss": -40.80522155761719, "global_step": 240527, "epoch": 1987} {"train_loss": -37.98421859741211, "global_step": 240528, "epoch": 1987} {"train_loss": -40.3179817199707, "global_step": 240529, "epoch": 1987} {"train_loss": -39.11468505859375, "global_step": 240530, "epoch": 1987} {"train_loss": -41.84638977050781, "global_step": 240531, "epoch": 1987} {"train_loss": -35.16718292236328, "global_step": 240532, "epoch": 1987} {"train_loss": -34.98125076293945, "global_step": 240533, "epoch": 1987} {"train_loss": -38.141117095947266, "global_step": 240534, "epoch": 1987} {"train_loss": -37.4378776550293, "global_step": 240535, "epoch": 1987} {"train_loss": -38.509178161621094, "global_step": 240536, "epoch": 1987} {"train_loss": -36.857269287109375, "global_step": 240537, "epoch": 1987} {"train_loss": -39.251136779785156, "global_step": 240538, "epoch": 1987} {"train_loss": -40.31956100463867, "global_step": 240539, "epoch": 1987} {"train_loss": -40.38587951660156, "global_step": 240540, "epoch": 1987} {"train_loss": -41.394832611083984, "global_step": 240541, "epoch": 1987} {"train_loss": -39.39939498901367, "global_step": 240542, "epoch": 1987} {"train_loss": -40.33610153198242, "global_step": 240543, "epoch": 1987} {"train_loss": -41.9810676574707, "global_step": 240544, "epoch": 1987} {"train_loss": -40.78103256225586, "global_step": 240545, "epoch": 1987} {"train_loss": -40.46439743041992, "global_step": 240546, "epoch": 1987} {"train_loss": -42.29327424104549, "global_step": 240547, "epoch": 1987, "val_loss": 2547017.75} {"train_loss": -39.10737228393555, "global_step": 240548, "epoch": 1988} {"train_loss": -40.24470520019531, "global_step": 240549, "epoch": 1988} {"train_loss": -41.46615219116211, "global_step": 240550, "epoch": 1988} {"train_loss": -41.920196533203125, "global_step": 240551, "epoch": 1988} {"train_loss": -41.66848373413086, "global_step": 240552, "epoch": 1988} {"train_loss": -41.917232513427734, "global_step": 240553, "epoch": 1988} {"train_loss": -42.018367767333984, "global_step": 240554, "epoch": 1988} {"train_loss": -42.30121612548828, "global_step": 240555, "epoch": 1988} {"train_loss": -41.18568801879883, "global_step": 240556, "epoch": 1988} {"train_loss": -41.036441802978516, "global_step": 240557, "epoch": 1988} {"train_loss": -42.89978790283203, "global_step": 240558, "epoch": 1988} {"train_loss": -41.62895584106445, "global_step": 240559, "epoch": 1988} {"train_loss": -41.50822448730469, "global_step": 240560, "epoch": 1988} {"train_loss": -42.09135818481445, "global_step": 240561, "epoch": 1988} {"train_loss": -41.60707092285156, "global_step": 240562, "epoch": 1988} {"train_loss": -42.926124572753906, "global_step": 240563, "epoch": 1988} {"train_loss": -42.8216667175293, "global_step": 240564, "epoch": 1988} {"train_loss": -41.085540771484375, "global_step": 240565, "epoch": 1988} {"train_loss": -41.94660186767578, "global_step": 240566, "epoch": 1988} {"train_loss": -42.53399658203125, "global_step": 240567, "epoch": 1988} {"train_loss": -42.153236389160156, "global_step": 240568, "epoch": 1988} {"train_loss": -43.33600997924805, "global_step": 240569, "epoch": 1988} {"train_loss": -42.294002532958984, "global_step": 240570, "epoch": 1988} {"train_loss": -42.32699203491211, "global_step": 240571, "epoch": 1988} {"train_loss": -43.12592697143555, "global_step": 240572, "epoch": 1988} {"train_loss": -41.5963020324707, "global_step": 240573, "epoch": 1988} {"train_loss": -42.8790283203125, "global_step": 240574, "epoch": 1988} {"train_loss": -42.784481048583984, "global_step": 240575, "epoch": 1988} {"train_loss": -42.47117614746094, "global_step": 240576, "epoch": 1988} {"train_loss": -42.14101791381836, "global_step": 240577, "epoch": 1988} {"train_loss": -43.488765716552734, "global_step": 240578, "epoch": 1988} {"train_loss": -42.15807342529297, "global_step": 240579, "epoch": 1988} {"train_loss": -42.84497833251953, "global_step": 240580, "epoch": 1988} {"train_loss": -43.086021423339844, "global_step": 240581, "epoch": 1988} {"train_loss": -42.29792404174805, "global_step": 240582, "epoch": 1988} {"train_loss": -43.031715393066406, "global_step": 240583, "epoch": 1988} {"train_loss": -41.850830078125, "global_step": 240584, "epoch": 1988} {"train_loss": -41.939353942871094, "global_step": 240585, "epoch": 1988} {"train_loss": -42.697635650634766, "global_step": 240586, "epoch": 1988} {"train_loss": -43.027000427246094, "global_step": 240587, "epoch": 1988} {"train_loss": -41.726253509521484, "global_step": 240588, "epoch": 1988} {"train_loss": -42.11617660522461, "global_step": 240589, "epoch": 1988} {"train_loss": -41.414974212646484, "global_step": 240590, "epoch": 1988} {"train_loss": -42.137874603271484, "global_step": 240591, "epoch": 1988} {"train_loss": -42.48869323730469, "global_step": 240592, "epoch": 1988} {"train_loss": -43.03391647338867, "global_step": 240593, "epoch": 1988} {"train_loss": -42.60004806518555, "global_step": 240594, "epoch": 1988} {"train_loss": -40.55720138549805, "global_step": 240595, "epoch": 1988} {"train_loss": -41.32804489135742, "global_step": 240596, "epoch": 1988} {"train_loss": -43.266822814941406, "global_step": 240597, "epoch": 1988} {"train_loss": -42.636512756347656, "global_step": 240598, "epoch": 1988} {"train_loss": -41.270198822021484, "global_step": 240599, "epoch": 1988} {"train_loss": -42.67351531982422, "global_step": 240600, "epoch": 1988} {"train_loss": -42.02339553833008, "global_step": 240601, "epoch": 1988} {"train_loss": -40.85622024536133, "global_step": 240602, "epoch": 1988} {"train_loss": -41.201927185058594, "global_step": 240603, "epoch": 1988} {"train_loss": -43.206687927246094, "global_step": 240604, "epoch": 1988} {"train_loss": -40.690956115722656, "global_step": 240605, "epoch": 1988} {"train_loss": -42.1623649597168, "global_step": 240606, "epoch": 1988} {"train_loss": -42.70133590698242, "global_step": 240607, "epoch": 1988} {"train_loss": -39.87519454956055, "global_step": 240608, "epoch": 1988} {"train_loss": -42.2769775390625, "global_step": 240609, "epoch": 1988} {"train_loss": -42.752925872802734, "global_step": 240610, "epoch": 1988} {"train_loss": -42.165428161621094, "global_step": 240611, "epoch": 1988} {"train_loss": -43.11933135986328, "global_step": 240612, "epoch": 1988} {"train_loss": -41.63100051879883, "global_step": 240613, "epoch": 1988} {"train_loss": -41.88331985473633, "global_step": 240614, "epoch": 1988} {"train_loss": -42.949493408203125, "global_step": 240615, "epoch": 1988} {"train_loss": -42.472164154052734, "global_step": 240616, "epoch": 1988} {"train_loss": -42.45441818237305, "global_step": 240617, "epoch": 1988} {"train_loss": -42.93803024291992, "global_step": 240618, "epoch": 1988} {"train_loss": -42.53116226196289, "global_step": 240619, "epoch": 1988} {"train_loss": -42.888885498046875, "global_step": 240620, "epoch": 1988} {"train_loss": -42.85578536987305, "global_step": 240621, "epoch": 1988} {"train_loss": -42.93331527709961, "global_step": 240622, "epoch": 1988} {"train_loss": -42.940185546875, "global_step": 240623, "epoch": 1988} {"train_loss": -43.51107406616211, "global_step": 240624, "epoch": 1988} {"train_loss": -43.369197845458984, "global_step": 240625, "epoch": 1988} {"train_loss": -43.41021728515625, "global_step": 240626, "epoch": 1988} {"train_loss": -42.815521240234375, "global_step": 240627, "epoch": 1988} {"train_loss": -42.89583206176758, "global_step": 240628, "epoch": 1988} {"train_loss": -43.89276885986328, "global_step": 240629, "epoch": 1988} {"train_loss": -43.2362174987793, "global_step": 240630, "epoch": 1988} {"train_loss": -42.97022247314453, "global_step": 240631, "epoch": 1988} {"train_loss": -43.159759521484375, "global_step": 240632, "epoch": 1988} {"train_loss": -43.63539123535156, "global_step": 240633, "epoch": 1988} {"train_loss": -43.066871643066406, "global_step": 240634, "epoch": 1988} {"train_loss": -43.6211051940918, "global_step": 240635, "epoch": 1988} {"train_loss": -43.90425109863281, "global_step": 240636, "epoch": 1988} {"train_loss": -43.28244400024414, "global_step": 240637, "epoch": 1988} {"train_loss": -42.70840835571289, "global_step": 240638, "epoch": 1988} {"train_loss": -42.803932189941406, "global_step": 240639, "epoch": 1988} {"train_loss": -42.669612884521484, "global_step": 240640, "epoch": 1988} {"train_loss": -43.30479049682617, "global_step": 240641, "epoch": 1988} {"train_loss": -42.66896057128906, "global_step": 240642, "epoch": 1988} {"train_loss": -42.842166900634766, "global_step": 240643, "epoch": 1988} {"train_loss": -42.85908126831055, "global_step": 240644, "epoch": 1988} {"train_loss": -43.541507720947266, "global_step": 240645, "epoch": 1988} {"train_loss": -44.57436752319336, "global_step": 240646, "epoch": 1988} {"train_loss": -43.55078887939453, "global_step": 240647, "epoch": 1988} {"train_loss": -43.35831832885742, "global_step": 240648, "epoch": 1988} {"train_loss": -43.5256462097168, "global_step": 240649, "epoch": 1988} {"train_loss": -43.9565315246582, "global_step": 240650, "epoch": 1988} {"train_loss": -43.31301498413086, "global_step": 240651, "epoch": 1988} {"train_loss": -42.632904052734375, "global_step": 240652, "epoch": 1988} {"train_loss": -41.402587890625, "global_step": 240653, "epoch": 1988} {"train_loss": -40.76313018798828, "global_step": 240654, "epoch": 1988} {"train_loss": -42.34596633911133, "global_step": 240655, "epoch": 1988} {"train_loss": -42.55576705932617, "global_step": 240656, "epoch": 1988} {"train_loss": -42.22538375854492, "global_step": 240657, "epoch": 1988} {"train_loss": -41.86064529418945, "global_step": 240658, "epoch": 1988} {"train_loss": -40.52870559692383, "global_step": 240659, "epoch": 1988} {"train_loss": -40.23359680175781, "global_step": 240660, "epoch": 1988} {"train_loss": -43.14925765991211, "global_step": 240661, "epoch": 1988} {"train_loss": -38.76491928100586, "global_step": 240662, "epoch": 1988} {"train_loss": -43.11422348022461, "global_step": 240663, "epoch": 1988} {"train_loss": -38.2026481628418, "global_step": 240664, "epoch": 1988} {"train_loss": -41.57076644897461, "global_step": 240665, "epoch": 1988} {"train_loss": -35.33876037597656, "global_step": 240666, "epoch": 1988} {"train_loss": -36.13130569458008, "global_step": 240667, "epoch": 1988} {"train_loss": -42.16478332015109, "global_step": 240668, "epoch": 1988, "val_loss": 2577964.25} {"train_loss": -38.63179397583008, "global_step": 240669, "epoch": 1989} {"train_loss": -38.81624984741211, "global_step": 240670, "epoch": 1989} {"train_loss": -37.41065979003906, "global_step": 240671, "epoch": 1989} {"train_loss": -39.80558395385742, "global_step": 240672, "epoch": 1989} {"train_loss": -39.6697998046875, "global_step": 240673, "epoch": 1989} {"train_loss": -38.939483642578125, "global_step": 240674, "epoch": 1989} {"train_loss": -40.203041076660156, "global_step": 240675, "epoch": 1989} {"train_loss": -40.2296028137207, "global_step": 240676, "epoch": 1989} {"train_loss": -41.51783752441406, "global_step": 240677, "epoch": 1989} {"train_loss": -39.614315032958984, "global_step": 240678, "epoch": 1989} {"train_loss": -39.40478515625, "global_step": 240679, "epoch": 1989} {"train_loss": -41.74451446533203, "global_step": 240680, "epoch": 1989} {"train_loss": -40.3542594909668, "global_step": 240681, "epoch": 1989} {"train_loss": -41.513431549072266, "global_step": 240682, "epoch": 1989} {"train_loss": -39.90812301635742, "global_step": 240683, "epoch": 1989} {"train_loss": -40.9083251953125, "global_step": 240684, "epoch": 1989} {"train_loss": -41.09904098510742, "global_step": 240685, "epoch": 1989} {"train_loss": -41.447689056396484, "global_step": 240686, "epoch": 1989} {"train_loss": -42.13841247558594, "global_step": 240687, "epoch": 1989} {"train_loss": -42.32600021362305, "global_step": 240688, "epoch": 1989} {"train_loss": -41.69761276245117, "global_step": 240689, "epoch": 1989} {"train_loss": -41.648895263671875, "global_step": 240690, "epoch": 1989} {"train_loss": -41.51534652709961, "global_step": 240691, "epoch": 1989} {"train_loss": -42.167781829833984, "global_step": 240692, "epoch": 1989} {"train_loss": -42.19057846069336, "global_step": 240693, "epoch": 1989} {"train_loss": -41.75965118408203, "global_step": 240694, "epoch": 1989} {"train_loss": -42.16513442993164, "global_step": 240695, "epoch": 1989} {"train_loss": -42.686702728271484, "global_step": 240696, "epoch": 1989} {"train_loss": -41.714210510253906, "global_step": 240697, "epoch": 1989} {"train_loss": -41.7783088684082, "global_step": 240698, "epoch": 1989} {"train_loss": -42.71163558959961, "global_step": 240699, "epoch": 1989} {"train_loss": -43.427337646484375, "global_step": 240700, "epoch": 1989} {"train_loss": -41.36531448364258, "global_step": 240701, "epoch": 1989} {"train_loss": -42.39532470703125, "global_step": 240702, "epoch": 1989} {"train_loss": -43.195526123046875, "global_step": 240703, "epoch": 1989} {"train_loss": -42.88881301879883, "global_step": 240704, "epoch": 1989} {"train_loss": -42.88790512084961, "global_step": 240705, "epoch": 1989} {"train_loss": -42.87986373901367, "global_step": 240706, "epoch": 1989} {"train_loss": -42.75042724609375, "global_step": 240707, "epoch": 1989} {"train_loss": -43.16571807861328, "global_step": 240708, "epoch": 1989} {"train_loss": -42.7791862487793, "global_step": 240709, "epoch": 1989} {"train_loss": -43.06471633911133, "global_step": 240710, "epoch": 1989} {"train_loss": -41.76754379272461, "global_step": 240711, "epoch": 1989} {"train_loss": -42.76983642578125, "global_step": 240712, "epoch": 1989} {"train_loss": -42.59101486206055, "global_step": 240713, "epoch": 1989} {"train_loss": -42.760379791259766, "global_step": 240714, "epoch": 1989} {"train_loss": -42.58781051635742, "global_step": 240715, "epoch": 1989} {"train_loss": -42.63975143432617, "global_step": 240716, "epoch": 1989} {"train_loss": -43.67649459838867, "global_step": 240717, "epoch": 1989} {"train_loss": -42.92527389526367, "global_step": 240718, "epoch": 1989} {"train_loss": -42.29777526855469, "global_step": 240719, "epoch": 1989} {"train_loss": -42.12003707885742, "global_step": 240720, "epoch": 1989} {"train_loss": -43.35346603393555, "global_step": 240721, "epoch": 1989} {"train_loss": -43.6824836730957, "global_step": 240722, "epoch": 1989} {"train_loss": -42.620845794677734, "global_step": 240723, "epoch": 1989} {"train_loss": -42.250972747802734, "global_step": 240724, "epoch": 1989} {"train_loss": -43.00420379638672, "global_step": 240725, "epoch": 1989} {"train_loss": -43.59736251831055, "global_step": 240726, "epoch": 1989} {"train_loss": -43.40036392211914, "global_step": 240727, "epoch": 1989} {"train_loss": -40.92574691772461, "global_step": 240728, "epoch": 1989} {"train_loss": -42.7645378112793, "global_step": 240729, "epoch": 1989} {"train_loss": -43.50798416137695, "global_step": 240730, "epoch": 1989} {"train_loss": -42.727760314941406, "global_step": 240731, "epoch": 1989} {"train_loss": -42.18104934692383, "global_step": 240732, "epoch": 1989} {"train_loss": -41.4669075012207, "global_step": 240733, "epoch": 1989} {"train_loss": -41.9376106262207, "global_step": 240734, "epoch": 1989} {"train_loss": -42.352638244628906, "global_step": 240735, "epoch": 1989} {"train_loss": -41.38768005371094, "global_step": 240736, "epoch": 1989} {"train_loss": -41.295021057128906, "global_step": 240737, "epoch": 1989} {"train_loss": -42.0223274230957, "global_step": 240738, "epoch": 1989} {"train_loss": -43.75797653198242, "global_step": 240739, "epoch": 1989} {"train_loss": -42.44590377807617, "global_step": 240740, "epoch": 1989} {"train_loss": -41.892845153808594, "global_step": 240741, "epoch": 1989} {"train_loss": -43.38037109375, "global_step": 240742, "epoch": 1989} {"train_loss": -42.35427474975586, "global_step": 240743, "epoch": 1989} {"train_loss": -38.95119857788086, "global_step": 240744, "epoch": 1989} {"train_loss": -42.339046478271484, "global_step": 240745, "epoch": 1989} {"train_loss": -43.122657775878906, "global_step": 240746, "epoch": 1989} {"train_loss": -43.362545013427734, "global_step": 240747, "epoch": 1989} {"train_loss": -42.302913665771484, "global_step": 240748, "epoch": 1989} {"train_loss": -42.9986572265625, "global_step": 240749, "epoch": 1989} {"train_loss": -42.82851791381836, "global_step": 240750, "epoch": 1989} {"train_loss": -41.355098724365234, "global_step": 240751, "epoch": 1989} {"train_loss": -41.56903076171875, "global_step": 240752, "epoch": 1989} {"train_loss": -42.81232833862305, "global_step": 240753, "epoch": 1989} {"train_loss": -43.17316436767578, "global_step": 240754, "epoch": 1989} {"train_loss": -42.84209060668945, "global_step": 240755, "epoch": 1989} {"train_loss": -43.40108871459961, "global_step": 240756, "epoch": 1989} {"train_loss": -42.509761810302734, "global_step": 240757, "epoch": 1989} {"train_loss": -43.10496139526367, "global_step": 240758, "epoch": 1989} {"train_loss": -43.46226119995117, "global_step": 240759, "epoch": 1989} {"train_loss": -42.933712005615234, "global_step": 240760, "epoch": 1989} {"train_loss": -43.2256965637207, "global_step": 240761, "epoch": 1989} {"train_loss": -43.375030517578125, "global_step": 240762, "epoch": 1989} {"train_loss": -41.30239486694336, "global_step": 240763, "epoch": 1989} {"train_loss": -43.259944915771484, "global_step": 240764, "epoch": 1989} {"train_loss": -42.58846664428711, "global_step": 240765, "epoch": 1989} {"train_loss": -42.71169662475586, "global_step": 240766, "epoch": 1989} {"train_loss": -42.8569221496582, "global_step": 240767, "epoch": 1989} {"train_loss": -43.15716552734375, "global_step": 240768, "epoch": 1989} {"train_loss": -42.70452880859375, "global_step": 240769, "epoch": 1989} {"train_loss": -43.030086517333984, "global_step": 240770, "epoch": 1989} {"train_loss": -42.44765853881836, "global_step": 240771, "epoch": 1989} {"train_loss": -43.29022979736328, "global_step": 240772, "epoch": 1989} {"train_loss": -41.94343948364258, "global_step": 240773, "epoch": 1989} {"train_loss": -43.13301467895508, "global_step": 240774, "epoch": 1989} {"train_loss": -41.5346794128418, "global_step": 240775, "epoch": 1989} {"train_loss": -43.58504867553711, "global_step": 240776, "epoch": 1989} {"train_loss": -43.098968505859375, "global_step": 240777, "epoch": 1989} {"train_loss": -40.197357177734375, "global_step": 240778, "epoch": 1989} {"train_loss": -42.6693000793457, "global_step": 240779, "epoch": 1989} {"train_loss": -42.10481643676758, "global_step": 240780, "epoch": 1989} {"train_loss": -42.96270751953125, "global_step": 240781, "epoch": 1989} {"train_loss": -42.750911712646484, "global_step": 240782, "epoch": 1989} {"train_loss": -42.68958282470703, "global_step": 240783, "epoch": 1989} {"train_loss": -42.05463790893555, "global_step": 240784, "epoch": 1989} {"train_loss": -41.59675216674805, "global_step": 240785, "epoch": 1989} {"train_loss": -42.06631088256836, "global_step": 240786, "epoch": 1989} {"train_loss": -39.39693069458008, "global_step": 240787, "epoch": 1989} {"train_loss": -39.45444869995117, "global_step": 240788, "epoch": 1989} {"train_loss": -42.05120130806915, "global_step": 240789, "epoch": 1989, "val_loss": 2780772.25} {"train_loss": -34.52982711791992, "global_step": 240790, "epoch": 1990} {"train_loss": -32.38302230834961, "global_step": 240791, "epoch": 1990} {"train_loss": -37.541717529296875, "global_step": 240792, "epoch": 1990} {"train_loss": -37.89722442626953, "global_step": 240793, "epoch": 1990} {"train_loss": -37.76619338989258, "global_step": 240794, "epoch": 1990} {"train_loss": -38.28793716430664, "global_step": 240795, "epoch": 1990} {"train_loss": -38.91164016723633, "global_step": 240796, "epoch": 1990} {"train_loss": -34.722259521484375, "global_step": 240797, "epoch": 1990} {"train_loss": -39.637874603271484, "global_step": 240798, "epoch": 1990} {"train_loss": -35.523738861083984, "global_step": 240799, "epoch": 1990} {"train_loss": -38.664306640625, "global_step": 240800, "epoch": 1990} {"train_loss": -34.90501022338867, "global_step": 240801, "epoch": 1990} {"train_loss": -37.37522506713867, "global_step": 240802, "epoch": 1990} {"train_loss": -39.181922912597656, "global_step": 240803, "epoch": 1990} {"train_loss": -36.56565856933594, "global_step": 240804, "epoch": 1990} {"train_loss": -36.63112258911133, "global_step": 240805, "epoch": 1990} {"train_loss": -38.75481033325195, "global_step": 240806, "epoch": 1990} {"train_loss": -38.46144485473633, "global_step": 240807, "epoch": 1990} {"train_loss": -39.351314544677734, "global_step": 240808, "epoch": 1990} {"train_loss": -39.803279876708984, "global_step": 240809, "epoch": 1990} {"train_loss": -39.374752044677734, "global_step": 240810, "epoch": 1990} {"train_loss": -40.67509841918945, "global_step": 240811, "epoch": 1990} {"train_loss": -40.82924270629883, "global_step": 240812, "epoch": 1990} {"train_loss": -40.28232955932617, "global_step": 240813, "epoch": 1990} {"train_loss": -40.661354064941406, "global_step": 240814, "epoch": 1990} {"train_loss": -40.88569259643555, "global_step": 240815, "epoch": 1990} {"train_loss": -40.57209396362305, "global_step": 240816, "epoch": 1990} {"train_loss": -39.92343521118164, "global_step": 240817, "epoch": 1990} {"train_loss": -40.638267517089844, "global_step": 240818, "epoch": 1990} {"train_loss": -41.8226318359375, "global_step": 240819, "epoch": 1990} {"train_loss": -41.16550827026367, "global_step": 240820, "epoch": 1990} {"train_loss": -40.022274017333984, "global_step": 240821, "epoch": 1990} {"train_loss": -41.8104248046875, "global_step": 240822, "epoch": 1990} {"train_loss": -41.81344223022461, "global_step": 240823, "epoch": 1990} {"train_loss": -41.649471282958984, "global_step": 240824, "epoch": 1990} {"train_loss": -41.995849609375, "global_step": 240825, "epoch": 1990} {"train_loss": -41.3834114074707, "global_step": 240826, "epoch": 1990} {"train_loss": -42.15392303466797, "global_step": 240827, "epoch": 1990} {"train_loss": -40.87419891357422, "global_step": 240828, "epoch": 1990} {"train_loss": -41.841102600097656, "global_step": 240829, "epoch": 1990} {"train_loss": -42.022613525390625, "global_step": 240830, "epoch": 1990} {"train_loss": -42.02243423461914, "global_step": 240831, "epoch": 1990} {"train_loss": -42.02068328857422, "global_step": 240832, "epoch": 1990} {"train_loss": -41.58126449584961, "global_step": 240833, "epoch": 1990} {"train_loss": -42.7763671875, "global_step": 240834, "epoch": 1990} {"train_loss": -41.77294921875, "global_step": 240835, "epoch": 1990} {"train_loss": -42.291534423828125, "global_step": 240836, "epoch": 1990} {"train_loss": -42.41799545288086, "global_step": 240837, "epoch": 1990} {"train_loss": -42.14164352416992, "global_step": 240838, "epoch": 1990} {"train_loss": -42.2364501953125, "global_step": 240839, "epoch": 1990} {"train_loss": -42.97024154663086, "global_step": 240840, "epoch": 1990} {"train_loss": -42.490333557128906, "global_step": 240841, "epoch": 1990} {"train_loss": -42.778629302978516, "global_step": 240842, "epoch": 1990} {"train_loss": -42.908843994140625, "global_step": 240843, "epoch": 1990} {"train_loss": -43.04510498046875, "global_step": 240844, "epoch": 1990} {"train_loss": -42.23305130004883, "global_step": 240845, "epoch": 1990} {"train_loss": -42.96570587158203, "global_step": 240846, "epoch": 1990} {"train_loss": -43.012481689453125, "global_step": 240847, "epoch": 1990} {"train_loss": -42.61140823364258, "global_step": 240848, "epoch": 1990} {"train_loss": -43.45242691040039, "global_step": 240849, "epoch": 1990} {"train_loss": -43.175209045410156, "global_step": 240850, "epoch": 1990} {"train_loss": -43.34102249145508, "global_step": 240851, "epoch": 1990} {"train_loss": -42.69654083251953, "global_step": 240852, "epoch": 1990} {"train_loss": -42.85713195800781, "global_step": 240853, "epoch": 1990} {"train_loss": -43.01282501220703, "global_step": 240854, "epoch": 1990} {"train_loss": -43.10388946533203, "global_step": 240855, "epoch": 1990} {"train_loss": -43.162322998046875, "global_step": 240856, "epoch": 1990} {"train_loss": -43.0826530456543, "global_step": 240857, "epoch": 1990} {"train_loss": -42.72443771362305, "global_step": 240858, "epoch": 1990} {"train_loss": -42.6800651550293, "global_step": 240859, "epoch": 1990} {"train_loss": -42.934688568115234, "global_step": 240860, "epoch": 1990} {"train_loss": -42.33652877807617, "global_step": 240861, "epoch": 1990} {"train_loss": -42.54719161987305, "global_step": 240862, "epoch": 1990} {"train_loss": -43.58767318725586, "global_step": 240863, "epoch": 1990} {"train_loss": -42.13092803955078, "global_step": 240864, "epoch": 1990} {"train_loss": -42.860511779785156, "global_step": 240865, "epoch": 1990} {"train_loss": -43.3707160949707, "global_step": 240866, "epoch": 1990} {"train_loss": -43.22825622558594, "global_step": 240867, "epoch": 1990} {"train_loss": -43.24872970581055, "global_step": 240868, "epoch": 1990} {"train_loss": -43.598445892333984, "global_step": 240869, "epoch": 1990} {"train_loss": -43.36451721191406, "global_step": 240870, "epoch": 1990} {"train_loss": -43.012020111083984, "global_step": 240871, "epoch": 1990} {"train_loss": -43.453834533691406, "global_step": 240872, "epoch": 1990} {"train_loss": -43.13274002075195, "global_step": 240873, "epoch": 1990} {"train_loss": -43.81743240356445, "global_step": 240874, "epoch": 1990} {"train_loss": -43.79880905151367, "global_step": 240875, "epoch": 1990} {"train_loss": -42.51156234741211, "global_step": 240876, "epoch": 1990} {"train_loss": -42.55647659301758, "global_step": 240877, "epoch": 1990} {"train_loss": -43.198394775390625, "global_step": 240878, "epoch": 1990} {"train_loss": -43.68447494506836, "global_step": 240879, "epoch": 1990} {"train_loss": -43.10976791381836, "global_step": 240880, "epoch": 1990} {"train_loss": -43.1780891418457, "global_step": 240881, "epoch": 1990} {"train_loss": -43.15037155151367, "global_step": 240882, "epoch": 1990} {"train_loss": -43.39945602416992, "global_step": 240883, "epoch": 1990} {"train_loss": -43.62295150756836, "global_step": 240884, "epoch": 1990} {"train_loss": -43.166954040527344, "global_step": 240885, "epoch": 1990} {"train_loss": -42.775787353515625, "global_step": 240886, "epoch": 1990} {"train_loss": -42.63606262207031, "global_step": 240887, "epoch": 1990} {"train_loss": -43.68781280517578, "global_step": 240888, "epoch": 1990} {"train_loss": -43.39842987060547, "global_step": 240889, "epoch": 1990} {"train_loss": -42.06116485595703, "global_step": 240890, "epoch": 1990} {"train_loss": -42.05868148803711, "global_step": 240891, "epoch": 1990} {"train_loss": -42.213218688964844, "global_step": 240892, "epoch": 1990} {"train_loss": -43.57828140258789, "global_step": 240893, "epoch": 1990} {"train_loss": -43.17055130004883, "global_step": 240894, "epoch": 1990} {"train_loss": -41.72780227661133, "global_step": 240895, "epoch": 1990} {"train_loss": -41.84058380126953, "global_step": 240896, "epoch": 1990} {"train_loss": -41.731693267822266, "global_step": 240897, "epoch": 1990} {"train_loss": -42.968544006347656, "global_step": 240898, "epoch": 1990} {"train_loss": -43.40876388549805, "global_step": 240899, "epoch": 1990} {"train_loss": -42.94609451293945, "global_step": 240900, "epoch": 1990} {"train_loss": -41.964210510253906, "global_step": 240901, "epoch": 1990} {"train_loss": -42.15955352783203, "global_step": 240902, "epoch": 1990} {"train_loss": -42.96291732788086, "global_step": 240903, "epoch": 1990} {"train_loss": -43.15250778198242, "global_step": 240904, "epoch": 1990} {"train_loss": -43.029720306396484, "global_step": 240905, "epoch": 1990} {"train_loss": -41.60032272338867, "global_step": 240906, "epoch": 1990} {"train_loss": -42.33469772338867, "global_step": 240907, "epoch": 1990} {"train_loss": -43.48024368286133, "global_step": 240908, "epoch": 1990} {"train_loss": -43.54429626464844, "global_step": 240909, "epoch": 1990} {"train_loss": -41.627381695203546, "global_step": 240910, "epoch": 1990, "val_loss": 2525597.5} {"train_loss": -42.93146896362305, "global_step": 240911, "epoch": 1991} {"train_loss": -43.65598678588867, "global_step": 240912, "epoch": 1991} {"train_loss": -42.375762939453125, "global_step": 240913, "epoch": 1991} {"train_loss": -42.13456344604492, "global_step": 240914, "epoch": 1991} {"train_loss": -42.64968490600586, "global_step": 240915, "epoch": 1991} {"train_loss": -43.12055969238281, "global_step": 240916, "epoch": 1991} {"train_loss": -43.296539306640625, "global_step": 240917, "epoch": 1991} {"train_loss": -43.632198333740234, "global_step": 240918, "epoch": 1991} {"train_loss": -41.8304328918457, "global_step": 240919, "epoch": 1991} {"train_loss": -41.795188903808594, "global_step": 240920, "epoch": 1991} {"train_loss": -42.01350784301758, "global_step": 240921, "epoch": 1991} {"train_loss": -42.92647933959961, "global_step": 240922, "epoch": 1991} {"train_loss": -41.56089401245117, "global_step": 240923, "epoch": 1991} {"train_loss": -41.85205841064453, "global_step": 240924, "epoch": 1991} {"train_loss": -43.629920959472656, "global_step": 240925, "epoch": 1991} {"train_loss": -41.8907470703125, "global_step": 240926, "epoch": 1991} {"train_loss": -42.40814208984375, "global_step": 240927, "epoch": 1991} {"train_loss": -43.25297164916992, "global_step": 240928, "epoch": 1991} {"train_loss": -42.15793991088867, "global_step": 240929, "epoch": 1991} {"train_loss": -42.7386474609375, "global_step": 240930, "epoch": 1991} {"train_loss": -42.63888168334961, "global_step": 240931, "epoch": 1991} {"train_loss": -42.4921875, "global_step": 240932, "epoch": 1991} {"train_loss": -41.65665817260742, "global_step": 240933, "epoch": 1991} {"train_loss": -43.71909713745117, "global_step": 240934, "epoch": 1991} {"train_loss": -43.37922286987305, "global_step": 240935, "epoch": 1991} {"train_loss": -41.91124725341797, "global_step": 240936, "epoch": 1991} {"train_loss": -38.27736282348633, "global_step": 240937, "epoch": 1991} {"train_loss": -42.58056640625, "global_step": 240938, "epoch": 1991} {"train_loss": -36.899105072021484, "global_step": 240939, "epoch": 1991} {"train_loss": -36.24692153930664, "global_step": 240940, "epoch": 1991} {"train_loss": -36.30036163330078, "global_step": 240941, "epoch": 1991} {"train_loss": -36.22555160522461, "global_step": 240942, "epoch": 1991} {"train_loss": -35.517333984375, "global_step": 240943, "epoch": 1991} {"train_loss": -35.96621322631836, "global_step": 240944, "epoch": 1991} {"train_loss": -36.948795318603516, "global_step": 240945, "epoch": 1991} {"train_loss": -36.24460220336914, "global_step": 240946, "epoch": 1991} {"train_loss": -37.15445327758789, "global_step": 240947, "epoch": 1991} {"train_loss": -36.170928955078125, "global_step": 240948, "epoch": 1991} {"train_loss": -36.62421417236328, "global_step": 240949, "epoch": 1991} {"train_loss": -35.922218322753906, "global_step": 240950, "epoch": 1991} {"train_loss": -36.83286666870117, "global_step": 240951, "epoch": 1991} {"train_loss": -36.84206771850586, "global_step": 240952, "epoch": 1991} {"train_loss": -36.27956771850586, "global_step": 240953, "epoch": 1991} {"train_loss": -36.364356994628906, "global_step": 240954, "epoch": 1991} {"train_loss": -36.697120666503906, "global_step": 240955, "epoch": 1991} {"train_loss": -37.1187858581543, "global_step": 240956, "epoch": 1991} {"train_loss": -37.21503448486328, "global_step": 240957, "epoch": 1991} {"train_loss": -37.73660659790039, "global_step": 240958, "epoch": 1991} {"train_loss": -37.52687454223633, "global_step": 240959, "epoch": 1991} {"train_loss": -37.477272033691406, "global_step": 240960, "epoch": 1991} {"train_loss": -37.884212493896484, "global_step": 240961, "epoch": 1991} {"train_loss": -37.21417236328125, "global_step": 240962, "epoch": 1991} {"train_loss": -37.73134994506836, "global_step": 240963, "epoch": 1991} {"train_loss": -38.5482177734375, "global_step": 240964, "epoch": 1991} {"train_loss": -38.11545944213867, "global_step": 240965, "epoch": 1991} {"train_loss": -38.193294525146484, "global_step": 240966, "epoch": 1991} {"train_loss": -38.311676025390625, "global_step": 240967, "epoch": 1991} {"train_loss": -37.73124313354492, "global_step": 240968, "epoch": 1991} {"train_loss": -37.766475677490234, "global_step": 240969, "epoch": 1991} {"train_loss": -37.6633415222168, "global_step": 240970, "epoch": 1991} {"train_loss": -38.051239013671875, "global_step": 240971, "epoch": 1991} {"train_loss": -37.09014892578125, "global_step": 240972, "epoch": 1991} {"train_loss": -36.20939254760742, "global_step": 240973, "epoch": 1991} {"train_loss": -38.375816345214844, "global_step": 240974, "epoch": 1991} {"train_loss": -38.2003288269043, "global_step": 240975, "epoch": 1991} {"train_loss": -37.2779655456543, "global_step": 240976, "epoch": 1991} {"train_loss": -38.255157470703125, "global_step": 240977, "epoch": 1991} {"train_loss": -36.173423767089844, "global_step": 240978, "epoch": 1991} {"train_loss": -36.81632614135742, "global_step": 240979, "epoch": 1991} {"train_loss": -37.90842819213867, "global_step": 240980, "epoch": 1991} {"train_loss": -36.90275955200195, "global_step": 240981, "epoch": 1991} {"train_loss": -38.433162689208984, "global_step": 240982, "epoch": 1991} {"train_loss": -38.00749969482422, "global_step": 240983, "epoch": 1991} {"train_loss": -37.54975128173828, "global_step": 240984, "epoch": 1991} {"train_loss": -39.263668060302734, "global_step": 240985, "epoch": 1991} {"train_loss": -37.996212005615234, "global_step": 240986, "epoch": 1991} {"train_loss": -38.887630462646484, "global_step": 240987, "epoch": 1991} {"train_loss": -38.58024978637695, "global_step": 240988, "epoch": 1991} {"train_loss": -38.78156661987305, "global_step": 240989, "epoch": 1991} {"train_loss": -39.085506439208984, "global_step": 240990, "epoch": 1991} {"train_loss": -38.19633865356445, "global_step": 240991, "epoch": 1991} {"train_loss": -38.70832061767578, "global_step": 240992, "epoch": 1991} {"train_loss": -38.3907470703125, "global_step": 240993, "epoch": 1991} {"train_loss": -39.3604621887207, "global_step": 240994, "epoch": 1991} {"train_loss": -38.21957778930664, "global_step": 240995, "epoch": 1991} {"train_loss": -39.76975631713867, "global_step": 240996, "epoch": 1991} {"train_loss": -38.86186599731445, "global_step": 240997, "epoch": 1991} {"train_loss": -38.58405303955078, "global_step": 240998, "epoch": 1991} {"train_loss": -39.11140823364258, "global_step": 240999, "epoch": 1991} {"train_loss": -38.51709747314453, "global_step": 241000, "epoch": 1991} {"train_loss": -38.985408782958984, "global_step": 241001, "epoch": 1991} {"train_loss": -38.8735466003418, "global_step": 241002, "epoch": 1991} {"train_loss": -39.05176544189453, "global_step": 241003, "epoch": 1991} {"train_loss": -39.47469711303711, "global_step": 241004, "epoch": 1991} {"train_loss": -39.61313247680664, "global_step": 241005, "epoch": 1991} {"train_loss": -39.784603118896484, "global_step": 241006, "epoch": 1991} {"train_loss": -39.36928939819336, "global_step": 241007, "epoch": 1991} {"train_loss": -40.299137115478516, "global_step": 241008, "epoch": 1991} {"train_loss": -39.38880920410156, "global_step": 241009, "epoch": 1991} {"train_loss": -39.75529098510742, "global_step": 241010, "epoch": 1991} {"train_loss": -39.056880950927734, "global_step": 241011, "epoch": 1991} {"train_loss": -38.84678649902344, "global_step": 241012, "epoch": 1991} {"train_loss": -39.861846923828125, "global_step": 241013, "epoch": 1991} {"train_loss": -39.730262756347656, "global_step": 241014, "epoch": 1991} {"train_loss": -39.74547576904297, "global_step": 241015, "epoch": 1991} {"train_loss": -39.59114456176758, "global_step": 241016, "epoch": 1991} {"train_loss": -38.6784782409668, "global_step": 241017, "epoch": 1991} {"train_loss": -38.79372024536133, "global_step": 241018, "epoch": 1991} {"train_loss": -39.07593536376953, "global_step": 241019, "epoch": 1991} {"train_loss": -40.25613784790039, "global_step": 241020, "epoch": 1991} {"train_loss": -39.38867950439453, "global_step": 241021, "epoch": 1991} {"train_loss": -39.1072998046875, "global_step": 241022, "epoch": 1991} {"train_loss": -38.977264404296875, "global_step": 241023, "epoch": 1991} {"train_loss": -39.980403900146484, "global_step": 241024, "epoch": 1991} {"train_loss": -39.868446350097656, "global_step": 241025, "epoch": 1991} {"train_loss": -39.9061279296875, "global_step": 241026, "epoch": 1991} {"train_loss": -40.332340240478516, "global_step": 241027, "epoch": 1991} {"train_loss": -40.121986389160156, "global_step": 241028, "epoch": 1991} {"train_loss": -40.54993438720703, "global_step": 241029, "epoch": 1991} {"train_loss": -39.47483444213867, "global_step": 241030, "epoch": 1991} {"train_loss": -39.21749543749596, "global_step": 241031, "epoch": 1991, "val_loss": 2521643.25} {"train_loss": -39.98346710205078, "global_step": 241032, "epoch": 1992} {"train_loss": -40.755062103271484, "global_step": 241033, "epoch": 1992} {"train_loss": -40.376888275146484, "global_step": 241034, "epoch": 1992} {"train_loss": -40.395484924316406, "global_step": 241035, "epoch": 1992} {"train_loss": -40.6395378112793, "global_step": 241036, "epoch": 1992} {"train_loss": -40.806209564208984, "global_step": 241037, "epoch": 1992} {"train_loss": -39.96713638305664, "global_step": 241038, "epoch": 1992} {"train_loss": -40.650299072265625, "global_step": 241039, "epoch": 1992} {"train_loss": -40.352264404296875, "global_step": 241040, "epoch": 1992} {"train_loss": -41.13434982299805, "global_step": 241041, "epoch": 1992} {"train_loss": -40.883419036865234, "global_step": 241042, "epoch": 1992} {"train_loss": -41.24969482421875, "global_step": 241043, "epoch": 1992} {"train_loss": -40.883174896240234, "global_step": 241044, "epoch": 1992} {"train_loss": -41.37485885620117, "global_step": 241045, "epoch": 1992} {"train_loss": -41.43645477294922, "global_step": 241046, "epoch": 1992} {"train_loss": -41.15547561645508, "global_step": 241047, "epoch": 1992} {"train_loss": -41.37567138671875, "global_step": 241048, "epoch": 1992} {"train_loss": -40.929649353027344, "global_step": 241049, "epoch": 1992} {"train_loss": -40.78717041015625, "global_step": 241050, "epoch": 1992} {"train_loss": -40.85291290283203, "global_step": 241051, "epoch": 1992} {"train_loss": -39.74684143066406, "global_step": 241052, "epoch": 1992} {"train_loss": -40.70286178588867, "global_step": 241053, "epoch": 1992} {"train_loss": -40.98733901977539, "global_step": 241054, "epoch": 1992} {"train_loss": -40.36624526977539, "global_step": 241055, "epoch": 1992} {"train_loss": -40.48798370361328, "global_step": 241056, "epoch": 1992} {"train_loss": -40.95622634887695, "global_step": 241057, "epoch": 1992} {"train_loss": -40.8670539855957, "global_step": 241058, "epoch": 1992} {"train_loss": -40.49705123901367, "global_step": 241059, "epoch": 1992} {"train_loss": -41.29395294189453, "global_step": 241060, "epoch": 1992} {"train_loss": -40.65735626220703, "global_step": 241061, "epoch": 1992} {"train_loss": -40.49281692504883, "global_step": 241062, "epoch": 1992} {"train_loss": -38.99000930786133, "global_step": 241063, "epoch": 1992} {"train_loss": -36.49589920043945, "global_step": 241064, "epoch": 1992} {"train_loss": -37.494815826416016, "global_step": 241065, "epoch": 1992} {"train_loss": -41.4713249206543, "global_step": 241066, "epoch": 1992} {"train_loss": -40.11735153198242, "global_step": 241067, "epoch": 1992} {"train_loss": -37.60133361816406, "global_step": 241068, "epoch": 1992} {"train_loss": -40.9578971862793, "global_step": 241069, "epoch": 1992} {"train_loss": -39.83803176879883, "global_step": 241070, "epoch": 1992} {"train_loss": -39.60093307495117, "global_step": 241071, "epoch": 1992} {"train_loss": -41.82231521606445, "global_step": 241072, "epoch": 1992} {"train_loss": -40.69550323486328, "global_step": 241073, "epoch": 1992} {"train_loss": -41.04848098754883, "global_step": 241074, "epoch": 1992} {"train_loss": -41.477840423583984, "global_step": 241075, "epoch": 1992} {"train_loss": -40.898799896240234, "global_step": 241076, "epoch": 1992} {"train_loss": -41.75825881958008, "global_step": 241077, "epoch": 1992} {"train_loss": -40.81509017944336, "global_step": 241078, "epoch": 1992} {"train_loss": -41.50632095336914, "global_step": 241079, "epoch": 1992} {"train_loss": -41.30278396606445, "global_step": 241080, "epoch": 1992} {"train_loss": -41.4657096862793, "global_step": 241081, "epoch": 1992} {"train_loss": -42.073036193847656, "global_step": 241082, "epoch": 1992} {"train_loss": -41.25536346435547, "global_step": 241083, "epoch": 1992} {"train_loss": -41.77205276489258, "global_step": 241084, "epoch": 1992} {"train_loss": -41.86172866821289, "global_step": 241085, "epoch": 1992} {"train_loss": -41.22610092163086, "global_step": 241086, "epoch": 1992} {"train_loss": -41.62792205810547, "global_step": 241087, "epoch": 1992} {"train_loss": -40.564788818359375, "global_step": 241088, "epoch": 1992} {"train_loss": -40.7744255065918, "global_step": 241089, "epoch": 1992} {"train_loss": -41.562171936035156, "global_step": 241090, "epoch": 1992} {"train_loss": -40.8631706237793, "global_step": 241091, "epoch": 1992} {"train_loss": -40.55908203125, "global_step": 241092, "epoch": 1992} {"train_loss": -40.570491790771484, "global_step": 241093, "epoch": 1992} {"train_loss": -41.938716888427734, "global_step": 241094, "epoch": 1992} {"train_loss": -41.910152435302734, "global_step": 241095, "epoch": 1992} {"train_loss": -41.92985916137695, "global_step": 241096, "epoch": 1992} {"train_loss": -42.091339111328125, "global_step": 241097, "epoch": 1992} {"train_loss": -41.99079513549805, "global_step": 241098, "epoch": 1992} {"train_loss": -40.219356536865234, "global_step": 241099, "epoch": 1992} {"train_loss": -41.9224967956543, "global_step": 241100, "epoch": 1992} {"train_loss": -42.21172332763672, "global_step": 241101, "epoch": 1992} {"train_loss": -42.015926361083984, "global_step": 241102, "epoch": 1992} {"train_loss": -41.8634147644043, "global_step": 241103, "epoch": 1992} {"train_loss": -35.80587387084961, "global_step": 241104, "epoch": 1992} {"train_loss": -41.38131332397461, "global_step": 241105, "epoch": 1992} {"train_loss": 35.40922164916992, "global_step": 241106, "epoch": 1992} {"train_loss": -31.71967887878418, "global_step": 241107, "epoch": 1992} {"train_loss": -18.91071319580078, "global_step": 241108, "epoch": 1992} {"train_loss": 58.13906478881836, "global_step": 241109, "epoch": 1992} {"train_loss": -9.469320297241211, "global_step": 241110, "epoch": 1992} {"train_loss": 32.4668083190918, "global_step": 241111, "epoch": 1992} {"train_loss": 5.311984539031982, "global_step": 241112, "epoch": 1992} {"train_loss": -16.6259822845459, "global_step": 241113, "epoch": 1992} {"train_loss": -20.86531639099121, "global_step": 241114, "epoch": 1992} {"train_loss": -7.940377712249756, "global_step": 241115, "epoch": 1992} {"train_loss": -17.549701690673828, "global_step": 241116, "epoch": 1992} {"train_loss": -8.513495445251465, "global_step": 241117, "epoch": 1992} {"train_loss": -21.829702377319336, "global_step": 241118, "epoch": 1992} {"train_loss": -27.31753921508789, "global_step": 241119, "epoch": 1992} {"train_loss": -24.420948028564453, "global_step": 241120, "epoch": 1992} {"train_loss": -22.9284725189209, "global_step": 241121, "epoch": 1992} {"train_loss": -28.104211807250977, "global_step": 241122, "epoch": 1992} {"train_loss": -31.150287628173828, "global_step": 241123, "epoch": 1992} {"train_loss": -32.076087951660156, "global_step": 241124, "epoch": 1992} {"train_loss": -30.992273330688477, "global_step": 241125, "epoch": 1992} {"train_loss": -32.24868392944336, "global_step": 241126, "epoch": 1992} {"train_loss": -32.59883117675781, "global_step": 241127, "epoch": 1992} {"train_loss": -32.853118896484375, "global_step": 241128, "epoch": 1992} {"train_loss": -32.66938781738281, "global_step": 241129, "epoch": 1992} {"train_loss": -32.68122863769531, "global_step": 241130, "epoch": 1992} {"train_loss": -34.38887023925781, "global_step": 241131, "epoch": 1992} {"train_loss": -33.26988983154297, "global_step": 241132, "epoch": 1992} {"train_loss": -32.41004180908203, "global_step": 241133, "epoch": 1992} {"train_loss": -33.16639709472656, "global_step": 241134, "epoch": 1992} {"train_loss": -34.03050994873047, "global_step": 241135, "epoch": 1992} {"train_loss": -34.08930206298828, "global_step": 241136, "epoch": 1992} {"train_loss": -33.580657958984375, "global_step": 241137, "epoch": 1992} {"train_loss": -33.33671188354492, "global_step": 241138, "epoch": 1992} {"train_loss": -32.79411697387695, "global_step": 241139, "epoch": 1992} {"train_loss": -32.93464660644531, "global_step": 241140, "epoch": 1992} {"train_loss": -34.05133819580078, "global_step": 241141, "epoch": 1992} {"train_loss": -34.43862533569336, "global_step": 241142, "epoch": 1992} {"train_loss": -34.568511962890625, "global_step": 241143, "epoch": 1992} {"train_loss": -34.97992706298828, "global_step": 241144, "epoch": 1992} {"train_loss": -34.3847770690918, "global_step": 241145, "epoch": 1992} {"train_loss": -34.02669906616211, "global_step": 241146, "epoch": 1992} {"train_loss": -33.508033752441406, "global_step": 241147, "epoch": 1992} {"train_loss": -34.9777946472168, "global_step": 241148, "epoch": 1992} {"train_loss": -34.460540771484375, "global_step": 241149, "epoch": 1992} {"train_loss": -35.186885833740234, "global_step": 241150, "epoch": 1992} {"train_loss": -34.77057647705078, "global_step": 241151, "epoch": 1992} {"train_loss": -34.29513903688793, "global_step": 241152, "epoch": 1992, "val_loss": 2533703.25} {"train_loss": -34.41490936279297, "global_step": 241153, "epoch": 1993} {"train_loss": -34.283905029296875, "global_step": 241154, "epoch": 1993} {"train_loss": -34.97654342651367, "global_step": 241155, "epoch": 1993} {"train_loss": -34.311222076416016, "global_step": 241156, "epoch": 1993} {"train_loss": -35.52668380737305, "global_step": 241157, "epoch": 1993} {"train_loss": -35.80876541137695, "global_step": 241158, "epoch": 1993} {"train_loss": -35.21273422241211, "global_step": 241159, "epoch": 1993} {"train_loss": -35.448486328125, "global_step": 241160, "epoch": 1993} {"train_loss": -35.53499984741211, "global_step": 241161, "epoch": 1993} {"train_loss": -34.23755645751953, "global_step": 241162, "epoch": 1993} {"train_loss": -35.34583282470703, "global_step": 241163, "epoch": 1993} {"train_loss": -35.36137008666992, "global_step": 241164, "epoch": 1993} {"train_loss": -36.35124206542969, "global_step": 241165, "epoch": 1993} {"train_loss": -36.40062713623047, "global_step": 241166, "epoch": 1993} {"train_loss": -36.61940383911133, "global_step": 241167, "epoch": 1993} {"train_loss": -36.34419250488281, "global_step": 241168, "epoch": 1993} {"train_loss": -36.5450553894043, "global_step": 241169, "epoch": 1993} {"train_loss": -36.73274612426758, "global_step": 241170, "epoch": 1993} {"train_loss": -36.645503997802734, "global_step": 241171, "epoch": 1993} {"train_loss": -36.730751037597656, "global_step": 241172, "epoch": 1993} {"train_loss": -36.46944808959961, "global_step": 241173, "epoch": 1993} {"train_loss": -37.08049392700195, "global_step": 241174, "epoch": 1993} {"train_loss": -35.55259323120117, "global_step": 241175, "epoch": 1993} {"train_loss": -36.99597930908203, "global_step": 241176, "epoch": 1993} {"train_loss": -36.42751693725586, "global_step": 241177, "epoch": 1993} {"train_loss": -36.332923889160156, "global_step": 241178, "epoch": 1993} {"train_loss": -35.88337326049805, "global_step": 241179, "epoch": 1993} {"train_loss": -36.847442626953125, "global_step": 241180, "epoch": 1993} {"train_loss": -36.737239837646484, "global_step": 241181, "epoch": 1993} {"train_loss": -36.46466827392578, "global_step": 241182, "epoch": 1993} {"train_loss": -36.642906188964844, "global_step": 241183, "epoch": 1993} {"train_loss": -37.07355880737305, "global_step": 241184, "epoch": 1993} {"train_loss": -36.32131576538086, "global_step": 241185, "epoch": 1993} {"train_loss": -36.5419807434082, "global_step": 241186, "epoch": 1993} {"train_loss": -36.68293380737305, "global_step": 241187, "epoch": 1993} {"train_loss": -36.669246673583984, "global_step": 241188, "epoch": 1993} {"train_loss": -38.12801742553711, "global_step": 241189, "epoch": 1993} {"train_loss": -36.9980354309082, "global_step": 241190, "epoch": 1993} {"train_loss": -36.71586990356445, "global_step": 241191, "epoch": 1993} {"train_loss": -37.130027770996094, "global_step": 241192, "epoch": 1993} {"train_loss": -36.5200080871582, "global_step": 241193, "epoch": 1993} {"train_loss": -37.03963088989258, "global_step": 241194, "epoch": 1993} {"train_loss": -37.44259262084961, "global_step": 241195, "epoch": 1993} {"train_loss": -36.88385009765625, "global_step": 241196, "epoch": 1993} {"train_loss": -37.29557418823242, "global_step": 241197, "epoch": 1993} {"train_loss": -37.40357208251953, "global_step": 241198, "epoch": 1993} {"train_loss": -37.135311126708984, "global_step": 241199, "epoch": 1993} {"train_loss": -37.789730072021484, "global_step": 241200, "epoch": 1993} {"train_loss": -36.84621810913086, "global_step": 241201, "epoch": 1993} {"train_loss": -37.073951721191406, "global_step": 241202, "epoch": 1993} {"train_loss": -36.882694244384766, "global_step": 241203, "epoch": 1993} {"train_loss": -38.37689208984375, "global_step": 241204, "epoch": 1993} {"train_loss": -37.80225372314453, "global_step": 241205, "epoch": 1993} {"train_loss": -37.230804443359375, "global_step": 241206, "epoch": 1993} {"train_loss": -36.994140625, "global_step": 241207, "epoch": 1993} {"train_loss": -37.70615768432617, "global_step": 241208, "epoch": 1993} {"train_loss": -37.8671875, "global_step": 241209, "epoch": 1993} {"train_loss": -37.17975997924805, "global_step": 241210, "epoch": 1993} {"train_loss": -37.35518264770508, "global_step": 241211, "epoch": 1993} {"train_loss": -37.57131576538086, "global_step": 241212, "epoch": 1993} {"train_loss": -37.63243865966797, "global_step": 241213, "epoch": 1993} {"train_loss": -37.7443733215332, "global_step": 241214, "epoch": 1993} {"train_loss": -37.83321762084961, "global_step": 241215, "epoch": 1993} {"train_loss": -36.60649490356445, "global_step": 241216, "epoch": 1993} {"train_loss": -37.975372314453125, "global_step": 241217, "epoch": 1993} {"train_loss": -37.93619918823242, "global_step": 241218, "epoch": 1993} {"train_loss": -37.49212646484375, "global_step": 241219, "epoch": 1993} {"train_loss": -38.1583137512207, "global_step": 241220, "epoch": 1993} {"train_loss": -37.945960998535156, "global_step": 241221, "epoch": 1993} {"train_loss": -38.11396408081055, "global_step": 241222, "epoch": 1993} {"train_loss": -37.98830795288086, "global_step": 241223, "epoch": 1993} {"train_loss": -37.28142166137695, "global_step": 241224, "epoch": 1993} {"train_loss": -37.86103057861328, "global_step": 241225, "epoch": 1993} {"train_loss": -38.288204193115234, "global_step": 241226, "epoch": 1993} {"train_loss": -37.199039459228516, "global_step": 241227, "epoch": 1993} {"train_loss": -39.002864837646484, "global_step": 241228, "epoch": 1993} {"train_loss": -38.9157829284668, "global_step": 241229, "epoch": 1993} {"train_loss": -38.5022087097168, "global_step": 241230, "epoch": 1993} {"train_loss": -38.19361114501953, "global_step": 241231, "epoch": 1993} {"train_loss": -38.458126068115234, "global_step": 241232, "epoch": 1993} {"train_loss": -38.470733642578125, "global_step": 241233, "epoch": 1993} {"train_loss": -38.18860626220703, "global_step": 241234, "epoch": 1993} {"train_loss": -39.301856994628906, "global_step": 241235, "epoch": 1993} {"train_loss": -38.05025863647461, "global_step": 241236, "epoch": 1993} {"train_loss": -37.83168411254883, "global_step": 241237, "epoch": 1993} {"train_loss": -37.8338737487793, "global_step": 241238, "epoch": 1993} {"train_loss": -39.039215087890625, "global_step": 241239, "epoch": 1993} {"train_loss": -39.275665283203125, "global_step": 241240, "epoch": 1993} {"train_loss": -38.34627151489258, "global_step": 241241, "epoch": 1993} {"train_loss": -39.271934509277344, "global_step": 241242, "epoch": 1993} {"train_loss": -38.14305877685547, "global_step": 241243, "epoch": 1993} {"train_loss": -38.89075469970703, "global_step": 241244, "epoch": 1993} {"train_loss": -39.17988204956055, "global_step": 241245, "epoch": 1993} {"train_loss": -38.62605285644531, "global_step": 241246, "epoch": 1993} {"train_loss": -39.07147216796875, "global_step": 241247, "epoch": 1993} {"train_loss": -38.33437728881836, "global_step": 241248, "epoch": 1993} {"train_loss": -37.40910339355469, "global_step": 241249, "epoch": 1993} {"train_loss": -39.08169174194336, "global_step": 241250, "epoch": 1993} {"train_loss": -39.283931732177734, "global_step": 241251, "epoch": 1993} {"train_loss": -38.42475128173828, "global_step": 241252, "epoch": 1993} {"train_loss": -39.108638763427734, "global_step": 241253, "epoch": 1993} {"train_loss": -39.09861373901367, "global_step": 241254, "epoch": 1993} {"train_loss": -38.436492919921875, "global_step": 241255, "epoch": 1993} {"train_loss": -39.65996170043945, "global_step": 241256, "epoch": 1993} {"train_loss": -38.33095169067383, "global_step": 241257, "epoch": 1993} {"train_loss": -39.27488327026367, "global_step": 241258, "epoch": 1993} {"train_loss": -39.446319580078125, "global_step": 241259, "epoch": 1993} {"train_loss": -38.894222259521484, "global_step": 241260, "epoch": 1993} {"train_loss": -38.45485305786133, "global_step": 241261, "epoch": 1993} {"train_loss": -39.04594039916992, "global_step": 241262, "epoch": 1993} {"train_loss": -39.89081573486328, "global_step": 241263, "epoch": 1993} {"train_loss": -38.9588623046875, "global_step": 241264, "epoch": 1993} {"train_loss": -39.98982620239258, "global_step": 241265, "epoch": 1993} {"train_loss": -38.76912307739258, "global_step": 241266, "epoch": 1993} {"train_loss": -38.82363510131836, "global_step": 241267, "epoch": 1993} {"train_loss": -38.72065353393555, "global_step": 241268, "epoch": 1993} {"train_loss": -38.91473388671875, "global_step": 241269, "epoch": 1993} {"train_loss": -39.18690872192383, "global_step": 241270, "epoch": 1993} {"train_loss": -39.58888626098633, "global_step": 241271, "epoch": 1993} {"train_loss": -39.590675354003906, "global_step": 241272, "epoch": 1993} {"train_loss": -37.56403054481696, "global_step": 241273, "epoch": 1993, "val_loss": 2548783.25} {"train_loss": -38.581459045410156, "global_step": 241274, "epoch": 1994} {"train_loss": -39.2805290222168, "global_step": 241275, "epoch": 1994} {"train_loss": -39.44940185546875, "global_step": 241276, "epoch": 1994} {"train_loss": -40.54905319213867, "global_step": 241277, "epoch": 1994} {"train_loss": -40.25014877319336, "global_step": 241278, "epoch": 1994} {"train_loss": -38.727420806884766, "global_step": 241279, "epoch": 1994} {"train_loss": -39.97831344604492, "global_step": 241280, "epoch": 1994} {"train_loss": -39.39512252807617, "global_step": 241281, "epoch": 1994} {"train_loss": -38.98612594604492, "global_step": 241282, "epoch": 1994} {"train_loss": -38.09035873413086, "global_step": 241283, "epoch": 1994} {"train_loss": -39.70728302001953, "global_step": 241284, "epoch": 1994} {"train_loss": -39.09394454956055, "global_step": 241285, "epoch": 1994} {"train_loss": -37.59641647338867, "global_step": 241286, "epoch": 1994} {"train_loss": -35.353816986083984, "global_step": 241287, "epoch": 1994} {"train_loss": -39.59331130981445, "global_step": 241288, "epoch": 1994} {"train_loss": -38.0078125, "global_step": 241289, "epoch": 1994} {"train_loss": -36.39433288574219, "global_step": 241290, "epoch": 1994} {"train_loss": -39.040191650390625, "global_step": 241291, "epoch": 1994} {"train_loss": -38.823299407958984, "global_step": 241292, "epoch": 1994} {"train_loss": -37.692955017089844, "global_step": 241293, "epoch": 1994} {"train_loss": -39.353328704833984, "global_step": 241294, "epoch": 1994} {"train_loss": -38.437896728515625, "global_step": 241295, "epoch": 1994} {"train_loss": -39.22029495239258, "global_step": 241296, "epoch": 1994} {"train_loss": -39.52701950073242, "global_step": 241297, "epoch": 1994} {"train_loss": -39.234657287597656, "global_step": 241298, "epoch": 1994} {"train_loss": -40.213130950927734, "global_step": 241299, "epoch": 1994} {"train_loss": -38.623287200927734, "global_step": 241300, "epoch": 1994} {"train_loss": -39.63920593261719, "global_step": 241301, "epoch": 1994} {"train_loss": -38.49969482421875, "global_step": 241302, "epoch": 1994} {"train_loss": -39.960906982421875, "global_step": 241303, "epoch": 1994} {"train_loss": -38.91008377075195, "global_step": 241304, "epoch": 1994} {"train_loss": -38.57632064819336, "global_step": 241305, "epoch": 1994} {"train_loss": -38.33539962768555, "global_step": 241306, "epoch": 1994} {"train_loss": -39.14895248413086, "global_step": 241307, "epoch": 1994} {"train_loss": -39.33394241333008, "global_step": 241308, "epoch": 1994} {"train_loss": -39.349544525146484, "global_step": 241309, "epoch": 1994} {"train_loss": -38.48482894897461, "global_step": 241310, "epoch": 1994} {"train_loss": -39.81720733642578, "global_step": 241311, "epoch": 1994} {"train_loss": -38.72703170776367, "global_step": 241312, "epoch": 1994} {"train_loss": -39.35012435913086, "global_step": 241313, "epoch": 1994} {"train_loss": -39.91817092895508, "global_step": 241314, "epoch": 1994} {"train_loss": -40.156776428222656, "global_step": 241315, "epoch": 1994} {"train_loss": -38.6408576965332, "global_step": 241316, "epoch": 1994} {"train_loss": -40.10909652709961, "global_step": 241317, "epoch": 1994} {"train_loss": -40.27146530151367, "global_step": 241318, "epoch": 1994} {"train_loss": -39.95447540283203, "global_step": 241319, "epoch": 1994} {"train_loss": -39.30116653442383, "global_step": 241320, "epoch": 1994} {"train_loss": -39.24492263793945, "global_step": 241321, "epoch": 1994} {"train_loss": -40.783138275146484, "global_step": 241322, "epoch": 1994} {"train_loss": -40.161293029785156, "global_step": 241323, "epoch": 1994} {"train_loss": -40.36499786376953, "global_step": 241324, "epoch": 1994} {"train_loss": -40.209163665771484, "global_step": 241325, "epoch": 1994} {"train_loss": -39.630035400390625, "global_step": 241326, "epoch": 1994} {"train_loss": -40.549835205078125, "global_step": 241327, "epoch": 1994} {"train_loss": -40.59794998168945, "global_step": 241328, "epoch": 1994} {"train_loss": -39.879615783691406, "global_step": 241329, "epoch": 1994} {"train_loss": -40.09405517578125, "global_step": 241330, "epoch": 1994} {"train_loss": -40.54934310913086, "global_step": 241331, "epoch": 1994} {"train_loss": -39.87565231323242, "global_step": 241332, "epoch": 1994} {"train_loss": -39.90348434448242, "global_step": 241333, "epoch": 1994} {"train_loss": -40.79606246948242, "global_step": 241334, "epoch": 1994} {"train_loss": -39.983558654785156, "global_step": 241335, "epoch": 1994} {"train_loss": -40.30677032470703, "global_step": 241336, "epoch": 1994} {"train_loss": -39.56608200073242, "global_step": 241337, "epoch": 1994} {"train_loss": -40.343177795410156, "global_step": 241338, "epoch": 1994} {"train_loss": -39.5910530090332, "global_step": 241339, "epoch": 1994} {"train_loss": -41.26978302001953, "global_step": 241340, "epoch": 1994} {"train_loss": -40.19778823852539, "global_step": 241341, "epoch": 1994} {"train_loss": -40.75358200073242, "global_step": 241342, "epoch": 1994} {"train_loss": -40.506351470947266, "global_step": 241343, "epoch": 1994} {"train_loss": -40.71976852416992, "global_step": 241344, "epoch": 1994} {"train_loss": -40.83669662475586, "global_step": 241345, "epoch": 1994} {"train_loss": -41.566898345947266, "global_step": 241346, "epoch": 1994} {"train_loss": -41.11124801635742, "global_step": 241347, "epoch": 1994} {"train_loss": -40.827484130859375, "global_step": 241348, "epoch": 1994} {"train_loss": -41.918479919433594, "global_step": 241349, "epoch": 1994} {"train_loss": -41.108741760253906, "global_step": 241350, "epoch": 1994} {"train_loss": -41.55287170410156, "global_step": 241351, "epoch": 1994} {"train_loss": -41.24354553222656, "global_step": 241352, "epoch": 1994} {"train_loss": -41.18726348876953, "global_step": 241353, "epoch": 1994} {"train_loss": -40.792579650878906, "global_step": 241354, "epoch": 1994} {"train_loss": -40.689029693603516, "global_step": 241355, "epoch": 1994} {"train_loss": -41.495540618896484, "global_step": 241356, "epoch": 1994} {"train_loss": -40.58552932739258, "global_step": 241357, "epoch": 1994} {"train_loss": -41.54266357421875, "global_step": 241358, "epoch": 1994} {"train_loss": -41.51747512817383, "global_step": 241359, "epoch": 1994} {"train_loss": -41.646034240722656, "global_step": 241360, "epoch": 1994} {"train_loss": -40.8947868347168, "global_step": 241361, "epoch": 1994} {"train_loss": -41.675357818603516, "global_step": 241362, "epoch": 1994} {"train_loss": -41.909149169921875, "global_step": 241363, "epoch": 1994} {"train_loss": -40.944515228271484, "global_step": 241364, "epoch": 1994} {"train_loss": -42.0387077331543, "global_step": 241365, "epoch": 1994} {"train_loss": -41.8631477355957, "global_step": 241366, "epoch": 1994} {"train_loss": -41.454925537109375, "global_step": 241367, "epoch": 1994} {"train_loss": -41.21132278442383, "global_step": 241368, "epoch": 1994} {"train_loss": -40.95772171020508, "global_step": 241369, "epoch": 1994} {"train_loss": -41.20235824584961, "global_step": 241370, "epoch": 1994} {"train_loss": -41.34121322631836, "global_step": 241371, "epoch": 1994} {"train_loss": -40.86127853393555, "global_step": 241372, "epoch": 1994} {"train_loss": -41.69108581542969, "global_step": 241373, "epoch": 1994} {"train_loss": -41.478755950927734, "global_step": 241374, "epoch": 1994} {"train_loss": -41.24884796142578, "global_step": 241375, "epoch": 1994} {"train_loss": -41.5361442565918, "global_step": 241376, "epoch": 1994} {"train_loss": -41.14017868041992, "global_step": 241377, "epoch": 1994} {"train_loss": -40.4774169921875, "global_step": 241378, "epoch": 1994} {"train_loss": -41.74264144897461, "global_step": 241379, "epoch": 1994} {"train_loss": -40.979427337646484, "global_step": 241380, "epoch": 1994} {"train_loss": -41.03933334350586, "global_step": 241381, "epoch": 1994} {"train_loss": -41.237815856933594, "global_step": 241382, "epoch": 1994} {"train_loss": -40.82788848876953, "global_step": 241383, "epoch": 1994} {"train_loss": -41.46562957763672, "global_step": 241384, "epoch": 1994} {"train_loss": -40.86933517456055, "global_step": 241385, "epoch": 1994} {"train_loss": -41.2918815612793, "global_step": 241386, "epoch": 1994} {"train_loss": -41.142581939697266, "global_step": 241387, "epoch": 1994} {"train_loss": -41.29902267456055, "global_step": 241388, "epoch": 1994} {"train_loss": -41.06181716918945, "global_step": 241389, "epoch": 1994} {"train_loss": -40.409908294677734, "global_step": 241390, "epoch": 1994} {"train_loss": -40.492706298828125, "global_step": 241391, "epoch": 1994} {"train_loss": -41.0442008972168, "global_step": 241392, "epoch": 1994} {"train_loss": -40.49570846557617, "global_step": 241393, "epoch": 1994} {"train_loss": -40.18617617394313, "global_step": 241394, "epoch": 1994, "val_loss": 2592820.25} {"train_loss": -41.35762405395508, "global_step": 241395, "epoch": 1995} {"train_loss": -41.3826904296875, "global_step": 241396, "epoch": 1995} {"train_loss": -41.89502716064453, "global_step": 241397, "epoch": 1995} {"train_loss": -41.51403045654297, "global_step": 241398, "epoch": 1995} {"train_loss": -41.75914764404297, "global_step": 241399, "epoch": 1995} {"train_loss": -40.694602966308594, "global_step": 241400, "epoch": 1995} {"train_loss": -40.60964584350586, "global_step": 241401, "epoch": 1995} {"train_loss": -42.16168975830078, "global_step": 241402, "epoch": 1995} {"train_loss": -41.00740432739258, "global_step": 241403, "epoch": 1995} {"train_loss": -40.61496353149414, "global_step": 241404, "epoch": 1995} {"train_loss": -40.29789352416992, "global_step": 241405, "epoch": 1995} {"train_loss": -41.513771057128906, "global_step": 241406, "epoch": 1995} {"train_loss": -41.10022735595703, "global_step": 241407, "epoch": 1995} {"train_loss": -40.42658233642578, "global_step": 241408, "epoch": 1995} {"train_loss": -40.56156539916992, "global_step": 241409, "epoch": 1995} {"train_loss": -40.483428955078125, "global_step": 241410, "epoch": 1995} {"train_loss": -38.31856155395508, "global_step": 241411, "epoch": 1995} {"train_loss": -39.16743850708008, "global_step": 241412, "epoch": 1995} {"train_loss": -41.11703109741211, "global_step": 241413, "epoch": 1995} {"train_loss": -40.0813102722168, "global_step": 241414, "epoch": 1995} {"train_loss": -39.33024215698242, "global_step": 241415, "epoch": 1995} {"train_loss": -40.34703826904297, "global_step": 241416, "epoch": 1995} {"train_loss": -40.830810546875, "global_step": 241417, "epoch": 1995} {"train_loss": -39.891963958740234, "global_step": 241418, "epoch": 1995} {"train_loss": -40.10646438598633, "global_step": 241419, "epoch": 1995} {"train_loss": -40.291168212890625, "global_step": 241420, "epoch": 1995} {"train_loss": -40.22705078125, "global_step": 241421, "epoch": 1995} {"train_loss": -40.94507598876953, "global_step": 241422, "epoch": 1995} {"train_loss": -40.60749053955078, "global_step": 241423, "epoch": 1995} {"train_loss": -40.794708251953125, "global_step": 241424, "epoch": 1995} {"train_loss": -41.0625114440918, "global_step": 241425, "epoch": 1995} {"train_loss": -40.82748031616211, "global_step": 241426, "epoch": 1995} {"train_loss": -40.26594161987305, "global_step": 241427, "epoch": 1995} {"train_loss": -41.16838455200195, "global_step": 241428, "epoch": 1995} {"train_loss": -41.17074203491211, "global_step": 241429, "epoch": 1995} {"train_loss": -40.59811019897461, "global_step": 241430, "epoch": 1995} {"train_loss": -40.283164978027344, "global_step": 241431, "epoch": 1995} {"train_loss": -38.9210090637207, "global_step": 241432, "epoch": 1995} {"train_loss": -36.40812301635742, "global_step": 241433, "epoch": 1995} {"train_loss": -32.72675704956055, "global_step": 241434, "epoch": 1995} {"train_loss": -34.707275390625, "global_step": 241435, "epoch": 1995} {"train_loss": -15.075332641601562, "global_step": 241436, "epoch": 1995} {"train_loss": -12.113212585449219, "global_step": 241437, "epoch": 1995} {"train_loss": -13.97027587890625, "global_step": 241438, "epoch": 1995} {"train_loss": -29.726964950561523, "global_step": 241439, "epoch": 1995} {"train_loss": -22.620311737060547, "global_step": 241440, "epoch": 1995} {"train_loss": -30.727405548095703, "global_step": 241441, "epoch": 1995} {"train_loss": -24.965795516967773, "global_step": 241442, "epoch": 1995} {"train_loss": -34.97601318359375, "global_step": 241443, "epoch": 1995} {"train_loss": -28.114887237548828, "global_step": 241444, "epoch": 1995} {"train_loss": -37.022705078125, "global_step": 241445, "epoch": 1995} {"train_loss": -31.646015167236328, "global_step": 241446, "epoch": 1995} {"train_loss": -35.813720703125, "global_step": 241447, "epoch": 1995} {"train_loss": -34.44197463989258, "global_step": 241448, "epoch": 1995} {"train_loss": -35.27701950073242, "global_step": 241449, "epoch": 1995} {"train_loss": -37.49846267700195, "global_step": 241450, "epoch": 1995} {"train_loss": -36.46946334838867, "global_step": 241451, "epoch": 1995} {"train_loss": -38.2322998046875, "global_step": 241452, "epoch": 1995} {"train_loss": -37.16899490356445, "global_step": 241453, "epoch": 1995} {"train_loss": -36.77010726928711, "global_step": 241454, "epoch": 1995} {"train_loss": -38.586090087890625, "global_step": 241455, "epoch": 1995} {"train_loss": -38.328346252441406, "global_step": 241456, "epoch": 1995} {"train_loss": -37.785797119140625, "global_step": 241457, "epoch": 1995} {"train_loss": -39.0537109375, "global_step": 241458, "epoch": 1995} {"train_loss": -38.997291564941406, "global_step": 241459, "epoch": 1995} {"train_loss": -37.68790817260742, "global_step": 241460, "epoch": 1995} {"train_loss": -38.51095199584961, "global_step": 241461, "epoch": 1995} {"train_loss": -39.09588623046875, "global_step": 241462, "epoch": 1995} {"train_loss": -38.51151657104492, "global_step": 241463, "epoch": 1995} {"train_loss": -39.2518196105957, "global_step": 241464, "epoch": 1995} {"train_loss": -39.18759536743164, "global_step": 241465, "epoch": 1995} {"train_loss": -38.850982666015625, "global_step": 241466, "epoch": 1995} {"train_loss": -38.79389190673828, "global_step": 241467, "epoch": 1995} {"train_loss": -40.13959503173828, "global_step": 241468, "epoch": 1995} {"train_loss": -38.190460205078125, "global_step": 241469, "epoch": 1995} {"train_loss": -39.61380386352539, "global_step": 241470, "epoch": 1995} {"train_loss": -39.33552932739258, "global_step": 241471, "epoch": 1995} {"train_loss": -39.303916931152344, "global_step": 241472, "epoch": 1995} {"train_loss": -39.574588775634766, "global_step": 241473, "epoch": 1995} {"train_loss": -40.28662109375, "global_step": 241474, "epoch": 1995} {"train_loss": -39.67015838623047, "global_step": 241475, "epoch": 1995} {"train_loss": -39.9393424987793, "global_step": 241476, "epoch": 1995} {"train_loss": -40.108428955078125, "global_step": 241477, "epoch": 1995} {"train_loss": -40.06098556518555, "global_step": 241478, "epoch": 1995} {"train_loss": -39.99150466918945, "global_step": 241479, "epoch": 1995} {"train_loss": -39.51884078979492, "global_step": 241480, "epoch": 1995} {"train_loss": -40.29237365722656, "global_step": 241481, "epoch": 1995} {"train_loss": -40.5327033996582, "global_step": 241482, "epoch": 1995} {"train_loss": -39.10197830200195, "global_step": 241483, "epoch": 1995} {"train_loss": -40.525428771972656, "global_step": 241484, "epoch": 1995} {"train_loss": -40.12051010131836, "global_step": 241485, "epoch": 1995} {"train_loss": -40.83360290527344, "global_step": 241486, "epoch": 1995} {"train_loss": -40.939998626708984, "global_step": 241487, "epoch": 1995} {"train_loss": -40.4133186340332, "global_step": 241488, "epoch": 1995} {"train_loss": -40.990478515625, "global_step": 241489, "epoch": 1995} {"train_loss": -39.72146224975586, "global_step": 241490, "epoch": 1995} {"train_loss": -40.3187255859375, "global_step": 241491, "epoch": 1995} {"train_loss": -40.546852111816406, "global_step": 241492, "epoch": 1995} {"train_loss": -40.56484603881836, "global_step": 241493, "epoch": 1995} {"train_loss": -40.918426513671875, "global_step": 241494, "epoch": 1995} {"train_loss": -40.493690490722656, "global_step": 241495, "epoch": 1995} {"train_loss": -40.54803466796875, "global_step": 241496, "epoch": 1995} {"train_loss": -40.28990936279297, "global_step": 241497, "epoch": 1995} {"train_loss": -40.98330307006836, "global_step": 241498, "epoch": 1995} {"train_loss": -41.224815368652344, "global_step": 241499, "epoch": 1995} {"train_loss": -41.1834831237793, "global_step": 241500, "epoch": 1995} {"train_loss": -41.22509765625, "global_step": 241501, "epoch": 1995} {"train_loss": -38.50454330444336, "global_step": 241502, "epoch": 1995} {"train_loss": -41.08036422729492, "global_step": 241503, "epoch": 1995} {"train_loss": -41.28924560546875, "global_step": 241504, "epoch": 1995} {"train_loss": -41.531898498535156, "global_step": 241505, "epoch": 1995} {"train_loss": -41.51637649536133, "global_step": 241506, "epoch": 1995} {"train_loss": -41.1764030456543, "global_step": 241507, "epoch": 1995} {"train_loss": -40.270782470703125, "global_step": 241508, "epoch": 1995} {"train_loss": -40.35374069213867, "global_step": 241509, "epoch": 1995} {"train_loss": -40.9649772644043, "global_step": 241510, "epoch": 1995} {"train_loss": -41.317848205566406, "global_step": 241511, "epoch": 1995} {"train_loss": -41.64667510986328, "global_step": 241512, "epoch": 1995} {"train_loss": -41.31600570678711, "global_step": 241513, "epoch": 1995} {"train_loss": -40.79338836669922, "global_step": 241514, "epoch": 1995} {"train_loss": -38.53574629854565, "global_step": 241515, "epoch": 1995, "val_loss": 2613310.25} {"train_loss": -40.91181182861328, "global_step": 241516, "epoch": 1996} {"train_loss": -38.59029769897461, "global_step": 241517, "epoch": 1996} {"train_loss": -40.497406005859375, "global_step": 241518, "epoch": 1996} {"train_loss": -35.724552154541016, "global_step": 241519, "epoch": 1996} {"train_loss": -40.97945022583008, "global_step": 241520, "epoch": 1996} {"train_loss": -40.75345993041992, "global_step": 241521, "epoch": 1996} {"train_loss": -41.35569381713867, "global_step": 241522, "epoch": 1996} {"train_loss": -39.951812744140625, "global_step": 241523, "epoch": 1996} {"train_loss": -39.281856536865234, "global_step": 241524, "epoch": 1996} {"train_loss": -34.48244094848633, "global_step": 241525, "epoch": 1996} {"train_loss": -35.55410385131836, "global_step": 241526, "epoch": 1996} {"train_loss": -37.87032699584961, "global_step": 241527, "epoch": 1996} {"train_loss": -41.14878463745117, "global_step": 241528, "epoch": 1996} {"train_loss": -40.774085998535156, "global_step": 241529, "epoch": 1996} {"train_loss": -37.40959548950195, "global_step": 241530, "epoch": 1996} {"train_loss": -29.335126876831055, "global_step": 241531, "epoch": 1996} {"train_loss": -34.55670928955078, "global_step": 241532, "epoch": 1996} {"train_loss": -35.35042953491211, "global_step": 241533, "epoch": 1996} {"train_loss": -38.86210250854492, "global_step": 241534, "epoch": 1996} {"train_loss": -30.381122589111328, "global_step": 241535, "epoch": 1996} {"train_loss": -27.92850685119629, "global_step": 241536, "epoch": 1996} {"train_loss": -17.466962814331055, "global_step": 241537, "epoch": 1996} {"train_loss": -11.728911399841309, "global_step": 241538, "epoch": 1996} {"train_loss": -34.55965042114258, "global_step": 241539, "epoch": 1996} {"train_loss": -34.054100036621094, "global_step": 241540, "epoch": 1996} {"train_loss": -28.130537033081055, "global_step": 241541, "epoch": 1996} {"train_loss": -28.062763214111328, "global_step": 241542, "epoch": 1996} {"train_loss": -26.0573673248291, "global_step": 241543, "epoch": 1996} {"train_loss": -17.284147262573242, "global_step": 241544, "epoch": 1996} {"train_loss": -35.19482421875, "global_step": 241545, "epoch": 1996} {"train_loss": -33.866310119628906, "global_step": 241546, "epoch": 1996} {"train_loss": -33.85990524291992, "global_step": 241547, "epoch": 1996} {"train_loss": -31.65337562561035, "global_step": 241548, "epoch": 1996} {"train_loss": -37.0618782043457, "global_step": 241549, "epoch": 1996} {"train_loss": -34.612220764160156, "global_step": 241550, "epoch": 1996} {"train_loss": -33.47693634033203, "global_step": 241551, "epoch": 1996} {"train_loss": -33.104915618896484, "global_step": 241552, "epoch": 1996} {"train_loss": -37.22285079956055, "global_step": 241553, "epoch": 1996} {"train_loss": -36.22344207763672, "global_step": 241554, "epoch": 1996} {"train_loss": -33.74390411376953, "global_step": 241555, "epoch": 1996} {"train_loss": -36.72298049926758, "global_step": 241556, "epoch": 1996} {"train_loss": -33.37600326538086, "global_step": 241557, "epoch": 1996} {"train_loss": -34.620887756347656, "global_step": 241558, "epoch": 1996} {"train_loss": -33.37322998046875, "global_step": 241559, "epoch": 1996} {"train_loss": -32.904911041259766, "global_step": 241560, "epoch": 1996} {"train_loss": -36.819271087646484, "global_step": 241561, "epoch": 1996} {"train_loss": -34.96015548706055, "global_step": 241562, "epoch": 1996} {"train_loss": -36.49001693725586, "global_step": 241563, "epoch": 1996} {"train_loss": -37.728023529052734, "global_step": 241564, "epoch": 1996} {"train_loss": -35.638179779052734, "global_step": 241565, "epoch": 1996} {"train_loss": -35.6916389465332, "global_step": 241566, "epoch": 1996} {"train_loss": -35.58100891113281, "global_step": 241567, "epoch": 1996} {"train_loss": -37.4939079284668, "global_step": 241568, "epoch": 1996} {"train_loss": -37.9704704284668, "global_step": 241569, "epoch": 1996} {"train_loss": -35.62483215332031, "global_step": 241570, "epoch": 1996} {"train_loss": -37.65956497192383, "global_step": 241571, "epoch": 1996} {"train_loss": -36.36865997314453, "global_step": 241572, "epoch": 1996} {"train_loss": -37.83183670043945, "global_step": 241573, "epoch": 1996} {"train_loss": -37.56641387939453, "global_step": 241574, "epoch": 1996} {"train_loss": -38.713706970214844, "global_step": 241575, "epoch": 1996} {"train_loss": -37.871883392333984, "global_step": 241576, "epoch": 1996} {"train_loss": -38.01699447631836, "global_step": 241577, "epoch": 1996} {"train_loss": -37.85176467895508, "global_step": 241578, "epoch": 1996} {"train_loss": -38.4764518737793, "global_step": 241579, "epoch": 1996} {"train_loss": -38.42579650878906, "global_step": 241580, "epoch": 1996} {"train_loss": -37.11507034301758, "global_step": 241581, "epoch": 1996} {"train_loss": -37.68729782104492, "global_step": 241582, "epoch": 1996} {"train_loss": -38.3848876953125, "global_step": 241583, "epoch": 1996} {"train_loss": -38.808345794677734, "global_step": 241584, "epoch": 1996} {"train_loss": -38.76509094238281, "global_step": 241585, "epoch": 1996} {"train_loss": -38.73051071166992, "global_step": 241586, "epoch": 1996} {"train_loss": -38.5899772644043, "global_step": 241587, "epoch": 1996} {"train_loss": -38.78437423706055, "global_step": 241588, "epoch": 1996} {"train_loss": -36.85093307495117, "global_step": 241589, "epoch": 1996} {"train_loss": -38.419960021972656, "global_step": 241590, "epoch": 1996} {"train_loss": -38.2385368347168, "global_step": 241591, "epoch": 1996} {"train_loss": -37.944026947021484, "global_step": 241592, "epoch": 1996} {"train_loss": -37.949371337890625, "global_step": 241593, "epoch": 1996} {"train_loss": -39.237979888916016, "global_step": 241594, "epoch": 1996} {"train_loss": -38.930641174316406, "global_step": 241595, "epoch": 1996} {"train_loss": -39.17091751098633, "global_step": 241596, "epoch": 1996} {"train_loss": -38.925941467285156, "global_step": 241597, "epoch": 1996} {"train_loss": -39.0386848449707, "global_step": 241598, "epoch": 1996} {"train_loss": -38.77456283569336, "global_step": 241599, "epoch": 1996} {"train_loss": -38.46240997314453, "global_step": 241600, "epoch": 1996} {"train_loss": -38.74134826660156, "global_step": 241601, "epoch": 1996} {"train_loss": -39.66908645629883, "global_step": 241602, "epoch": 1996} {"train_loss": -38.5047492980957, "global_step": 241603, "epoch": 1996} {"train_loss": -39.446014404296875, "global_step": 241604, "epoch": 1996} {"train_loss": -38.84817886352539, "global_step": 241605, "epoch": 1996} {"train_loss": -39.320552825927734, "global_step": 241606, "epoch": 1996} {"train_loss": -39.044063568115234, "global_step": 241607, "epoch": 1996} {"train_loss": -38.645301818847656, "global_step": 241608, "epoch": 1996} {"train_loss": -39.620361328125, "global_step": 241609, "epoch": 1996} {"train_loss": -39.40757751464844, "global_step": 241610, "epoch": 1996} {"train_loss": -39.27210235595703, "global_step": 241611, "epoch": 1996} {"train_loss": -39.79768753051758, "global_step": 241612, "epoch": 1996} {"train_loss": -39.74241256713867, "global_step": 241613, "epoch": 1996} {"train_loss": -40.3571662902832, "global_step": 241614, "epoch": 1996} {"train_loss": -39.49839782714844, "global_step": 241615, "epoch": 1996} {"train_loss": -39.18048858642578, "global_step": 241616, "epoch": 1996} {"train_loss": -39.89933395385742, "global_step": 241617, "epoch": 1996} {"train_loss": -39.17285919189453, "global_step": 241618, "epoch": 1996} {"train_loss": -40.15593338012695, "global_step": 241619, "epoch": 1996} {"train_loss": -40.45356750488281, "global_step": 241620, "epoch": 1996} {"train_loss": -39.888824462890625, "global_step": 241621, "epoch": 1996} {"train_loss": -39.225406646728516, "global_step": 241622, "epoch": 1996} {"train_loss": -40.41652297973633, "global_step": 241623, "epoch": 1996} {"train_loss": -40.47687530517578, "global_step": 241624, "epoch": 1996} {"train_loss": -40.36692810058594, "global_step": 241625, "epoch": 1996} {"train_loss": -40.445648193359375, "global_step": 241626, "epoch": 1996} {"train_loss": -40.07059860229492, "global_step": 241627, "epoch": 1996} {"train_loss": -40.30570602416992, "global_step": 241628, "epoch": 1996} {"train_loss": -40.63190841674805, "global_step": 241629, "epoch": 1996} {"train_loss": -39.872650146484375, "global_step": 241630, "epoch": 1996} {"train_loss": -39.68546676635742, "global_step": 241631, "epoch": 1996} {"train_loss": -40.37797164916992, "global_step": 241632, "epoch": 1996} {"train_loss": -39.91511154174805, "global_step": 241633, "epoch": 1996} {"train_loss": -39.92509841918945, "global_step": 241634, "epoch": 1996} {"train_loss": -40.458648681640625, "global_step": 241635, "epoch": 1996} {"train_loss": -36.96355747979535, "global_step": 241636, "epoch": 1996, "val_loss": 2679342.0} {"train_loss": -40.94033432006836, "global_step": 241637, "epoch": 1997} {"train_loss": -40.618560791015625, "global_step": 241638, "epoch": 1997} {"train_loss": -40.78202438354492, "global_step": 241639, "epoch": 1997} {"train_loss": -40.611602783203125, "global_step": 241640, "epoch": 1997} {"train_loss": -39.95229721069336, "global_step": 241641, "epoch": 1997} {"train_loss": -40.0577507019043, "global_step": 241642, "epoch": 1997} {"train_loss": -40.81714630126953, "global_step": 241643, "epoch": 1997} {"train_loss": -40.675228118896484, "global_step": 241644, "epoch": 1997} {"train_loss": -40.54629898071289, "global_step": 241645, "epoch": 1997} {"train_loss": -40.98073959350586, "global_step": 241646, "epoch": 1997} {"train_loss": -40.49598693847656, "global_step": 241647, "epoch": 1997} {"train_loss": -40.978240966796875, "global_step": 241648, "epoch": 1997} {"train_loss": -41.08651351928711, "global_step": 241649, "epoch": 1997} {"train_loss": -40.11088180541992, "global_step": 241650, "epoch": 1997} {"train_loss": -41.22176742553711, "global_step": 241651, "epoch": 1997} {"train_loss": -40.18642807006836, "global_step": 241652, "epoch": 1997} {"train_loss": -40.38142776489258, "global_step": 241653, "epoch": 1997} {"train_loss": -41.57451629638672, "global_step": 241654, "epoch": 1997} {"train_loss": -40.18416213989258, "global_step": 241655, "epoch": 1997} {"train_loss": -41.0431022644043, "global_step": 241656, "epoch": 1997} {"train_loss": -41.332061767578125, "global_step": 241657, "epoch": 1997} {"train_loss": -41.29438400268555, "global_step": 241658, "epoch": 1997} {"train_loss": -40.80625534057617, "global_step": 241659, "epoch": 1997} {"train_loss": -40.85459899902344, "global_step": 241660, "epoch": 1997} {"train_loss": -40.5561408996582, "global_step": 241661, "epoch": 1997} {"train_loss": -41.040626525878906, "global_step": 241662, "epoch": 1997} {"train_loss": -41.11454772949219, "global_step": 241663, "epoch": 1997} {"train_loss": -40.88875961303711, "global_step": 241664, "epoch": 1997} {"train_loss": -41.515316009521484, "global_step": 241665, "epoch": 1997} {"train_loss": -41.11225128173828, "global_step": 241666, "epoch": 1997} {"train_loss": -41.76707077026367, "global_step": 241667, "epoch": 1997} {"train_loss": -41.26572799682617, "global_step": 241668, "epoch": 1997} {"train_loss": -42.03239822387695, "global_step": 241669, "epoch": 1997} {"train_loss": -41.682308197021484, "global_step": 241670, "epoch": 1997} {"train_loss": -41.111324310302734, "global_step": 241671, "epoch": 1997} {"train_loss": -40.563289642333984, "global_step": 241672, "epoch": 1997} {"train_loss": -40.54055404663086, "global_step": 241673, "epoch": 1997} {"train_loss": -41.48850631713867, "global_step": 241674, "epoch": 1997} {"train_loss": -41.25539779663086, "global_step": 241675, "epoch": 1997} {"train_loss": -41.43846130371094, "global_step": 241676, "epoch": 1997} {"train_loss": -40.22282028198242, "global_step": 241677, "epoch": 1997} {"train_loss": -40.35805130004883, "global_step": 241678, "epoch": 1997} {"train_loss": -41.03278350830078, "global_step": 241679, "epoch": 1997} {"train_loss": -40.14210891723633, "global_step": 241680, "epoch": 1997} {"train_loss": -40.40400314331055, "global_step": 241681, "epoch": 1997} {"train_loss": -39.08493423461914, "global_step": 241682, "epoch": 1997} {"train_loss": -39.05622482299805, "global_step": 241683, "epoch": 1997} {"train_loss": -41.295654296875, "global_step": 241684, "epoch": 1997} {"train_loss": -41.56822204589844, "global_step": 241685, "epoch": 1997} {"train_loss": -41.04695129394531, "global_step": 241686, "epoch": 1997} {"train_loss": -39.24691390991211, "global_step": 241687, "epoch": 1997} {"train_loss": -41.296016693115234, "global_step": 241688, "epoch": 1997} {"train_loss": -41.20439147949219, "global_step": 241689, "epoch": 1997} {"train_loss": -39.65586471557617, "global_step": 241690, "epoch": 1997} {"train_loss": -39.726314544677734, "global_step": 241691, "epoch": 1997} {"train_loss": -41.24978256225586, "global_step": 241692, "epoch": 1997} {"train_loss": -40.45774459838867, "global_step": 241693, "epoch": 1997} {"train_loss": -40.36372375488281, "global_step": 241694, "epoch": 1997} {"train_loss": -41.034584045410156, "global_step": 241695, "epoch": 1997} {"train_loss": -39.8575325012207, "global_step": 241696, "epoch": 1997} {"train_loss": -39.09942626953125, "global_step": 241697, "epoch": 1997} {"train_loss": -41.16288757324219, "global_step": 241698, "epoch": 1997} {"train_loss": -40.64569854736328, "global_step": 241699, "epoch": 1997} {"train_loss": -40.5219841003418, "global_step": 241700, "epoch": 1997} {"train_loss": -41.3597412109375, "global_step": 241701, "epoch": 1997} {"train_loss": -39.767086029052734, "global_step": 241702, "epoch": 1997} {"train_loss": -40.51652145385742, "global_step": 241703, "epoch": 1997} {"train_loss": -41.684730529785156, "global_step": 241704, "epoch": 1997} {"train_loss": -41.34510040283203, "global_step": 241705, "epoch": 1997} {"train_loss": -41.150760650634766, "global_step": 241706, "epoch": 1997} {"train_loss": -41.09527587890625, "global_step": 241707, "epoch": 1997} {"train_loss": -40.63444900512695, "global_step": 241708, "epoch": 1997} {"train_loss": -40.05874252319336, "global_step": 241709, "epoch": 1997} {"train_loss": -41.026424407958984, "global_step": 241710, "epoch": 1997} {"train_loss": -40.70720672607422, "global_step": 241711, "epoch": 1997} {"train_loss": -41.331295013427734, "global_step": 241712, "epoch": 1997} {"train_loss": -41.82781982421875, "global_step": 241713, "epoch": 1997} {"train_loss": -40.80793762207031, "global_step": 241714, "epoch": 1997} {"train_loss": -41.53163528442383, "global_step": 241715, "epoch": 1997} {"train_loss": -39.42128372192383, "global_step": 241716, "epoch": 1997} {"train_loss": -41.55917739868164, "global_step": 241717, "epoch": 1997} {"train_loss": -41.25822830200195, "global_step": 241718, "epoch": 1997} {"train_loss": -41.04005432128906, "global_step": 241719, "epoch": 1997} {"train_loss": -41.288143157958984, "global_step": 241720, "epoch": 1997} {"train_loss": -41.68838119506836, "global_step": 241721, "epoch": 1997} {"train_loss": -41.599853515625, "global_step": 241722, "epoch": 1997} {"train_loss": -41.59882736206055, "global_step": 241723, "epoch": 1997} {"train_loss": -41.10913848876953, "global_step": 241724, "epoch": 1997} {"train_loss": -41.2874641418457, "global_step": 241725, "epoch": 1997} {"train_loss": -41.05698013305664, "global_step": 241726, "epoch": 1997} {"train_loss": -41.0700569152832, "global_step": 241727, "epoch": 1997} {"train_loss": -41.636138916015625, "global_step": 241728, "epoch": 1997} {"train_loss": -41.91596603393555, "global_step": 241729, "epoch": 1997} {"train_loss": -41.74532699584961, "global_step": 241730, "epoch": 1997} {"train_loss": -41.16916275024414, "global_step": 241731, "epoch": 1997} {"train_loss": -41.54811477661133, "global_step": 241732, "epoch": 1997} {"train_loss": -41.62466049194336, "global_step": 241733, "epoch": 1997} {"train_loss": -41.733272552490234, "global_step": 241734, "epoch": 1997} {"train_loss": -41.96586227416992, "global_step": 241735, "epoch": 1997} {"train_loss": -42.01002883911133, "global_step": 241736, "epoch": 1997} {"train_loss": -42.5670280456543, "global_step": 241737, "epoch": 1997} {"train_loss": -41.584808349609375, "global_step": 241738, "epoch": 1997} {"train_loss": -39.788570404052734, "global_step": 241739, "epoch": 1997} {"train_loss": -40.84067153930664, "global_step": 241740, "epoch": 1997} {"train_loss": -42.151973724365234, "global_step": 241741, "epoch": 1997} {"train_loss": -41.74079513549805, "global_step": 241742, "epoch": 1997} {"train_loss": -41.24151611328125, "global_step": 241743, "epoch": 1997} {"train_loss": -39.90485763549805, "global_step": 241744, "epoch": 1997} {"train_loss": -37.68044662475586, "global_step": 241745, "epoch": 1997} {"train_loss": -39.42628860473633, "global_step": 241746, "epoch": 1997} {"train_loss": -41.546382904052734, "global_step": 241747, "epoch": 1997} {"train_loss": -40.17442321777344, "global_step": 241748, "epoch": 1997} {"train_loss": -38.735511779785156, "global_step": 241749, "epoch": 1997} {"train_loss": -40.026485443115234, "global_step": 241750, "epoch": 1997} {"train_loss": -41.259620666503906, "global_step": 241751, "epoch": 1997} {"train_loss": -41.126827239990234, "global_step": 241752, "epoch": 1997} {"train_loss": -41.0609016418457, "global_step": 241753, "epoch": 1997} {"train_loss": -40.36480712890625, "global_step": 241754, "epoch": 1997} {"train_loss": -41.615901947021484, "global_step": 241755, "epoch": 1997} {"train_loss": -41.433876037597656, "global_step": 241756, "epoch": 1997} {"train_loss": -40.868080202213, "global_step": 241757, "epoch": 1997, "val_loss": 2661206.75} {"train_loss": -40.25332260131836, "global_step": 241758, "epoch": 1998} {"train_loss": -42.04804229736328, "global_step": 241759, "epoch": 1998} {"train_loss": -38.66328811645508, "global_step": 241760, "epoch": 1998} {"train_loss": -41.362525939941406, "global_step": 241761, "epoch": 1998} {"train_loss": -42.015380859375, "global_step": 241762, "epoch": 1998} {"train_loss": -40.994232177734375, "global_step": 241763, "epoch": 1998} {"train_loss": -41.6057014465332, "global_step": 241764, "epoch": 1998} {"train_loss": -40.71074295043945, "global_step": 241765, "epoch": 1998} {"train_loss": -39.97650146484375, "global_step": 241766, "epoch": 1998} {"train_loss": -41.4847526550293, "global_step": 241767, "epoch": 1998} {"train_loss": -40.840633392333984, "global_step": 241768, "epoch": 1998} {"train_loss": -40.070552825927734, "global_step": 241769, "epoch": 1998} {"train_loss": -41.7427978515625, "global_step": 241770, "epoch": 1998} {"train_loss": -40.5794792175293, "global_step": 241771, "epoch": 1998} {"train_loss": -41.065242767333984, "global_step": 241772, "epoch": 1998} {"train_loss": -41.8468132019043, "global_step": 241773, "epoch": 1998} {"train_loss": -41.57148361206055, "global_step": 241774, "epoch": 1998} {"train_loss": -41.517757415771484, "global_step": 241775, "epoch": 1998} {"train_loss": -42.142791748046875, "global_step": 241776, "epoch": 1998} {"train_loss": -41.720882415771484, "global_step": 241777, "epoch": 1998} {"train_loss": -42.12594223022461, "global_step": 241778, "epoch": 1998} {"train_loss": -41.59048843383789, "global_step": 241779, "epoch": 1998} {"train_loss": -41.31264114379883, "global_step": 241780, "epoch": 1998} {"train_loss": -42.27665710449219, "global_step": 241781, "epoch": 1998} {"train_loss": -41.18506622314453, "global_step": 241782, "epoch": 1998} {"train_loss": -42.616973876953125, "global_step": 241783, "epoch": 1998} {"train_loss": -42.111576080322266, "global_step": 241784, "epoch": 1998} {"train_loss": -42.37038803100586, "global_step": 241785, "epoch": 1998} {"train_loss": -42.48408126831055, "global_step": 241786, "epoch": 1998} {"train_loss": -42.151790618896484, "global_step": 241787, "epoch": 1998} {"train_loss": -41.62966537475586, "global_step": 241788, "epoch": 1998} {"train_loss": -42.42534637451172, "global_step": 241789, "epoch": 1998} {"train_loss": -42.297096252441406, "global_step": 241790, "epoch": 1998} {"train_loss": -41.824378967285156, "global_step": 241791, "epoch": 1998} {"train_loss": -42.388607025146484, "global_step": 241792, "epoch": 1998} {"train_loss": -41.86231231689453, "global_step": 241793, "epoch": 1998} {"train_loss": -41.49586868286133, "global_step": 241794, "epoch": 1998} {"train_loss": -41.336692810058594, "global_step": 241795, "epoch": 1998} {"train_loss": -42.7503547668457, "global_step": 241796, "epoch": 1998} {"train_loss": -41.62691116333008, "global_step": 241797, "epoch": 1998} {"train_loss": -42.5029411315918, "global_step": 241798, "epoch": 1998} {"train_loss": -42.19002914428711, "global_step": 241799, "epoch": 1998} {"train_loss": -42.63514709472656, "global_step": 241800, "epoch": 1998} {"train_loss": -42.39741134643555, "global_step": 241801, "epoch": 1998} {"train_loss": -42.84458923339844, "global_step": 241802, "epoch": 1998} {"train_loss": -42.40606689453125, "global_step": 241803, "epoch": 1998} {"train_loss": -42.65322494506836, "global_step": 241804, "epoch": 1998} {"train_loss": -42.79597473144531, "global_step": 241805, "epoch": 1998} {"train_loss": -42.327571868896484, "global_step": 241806, "epoch": 1998} {"train_loss": -42.69906234741211, "global_step": 241807, "epoch": 1998} {"train_loss": -42.90178680419922, "global_step": 241808, "epoch": 1998} {"train_loss": -42.42782211303711, "global_step": 241809, "epoch": 1998} {"train_loss": -42.95331573486328, "global_step": 241810, "epoch": 1998} {"train_loss": -41.85388946533203, "global_step": 241811, "epoch": 1998} {"train_loss": -41.92010498046875, "global_step": 241812, "epoch": 1998} {"train_loss": -42.37327194213867, "global_step": 241813, "epoch": 1998} {"train_loss": -42.634395599365234, "global_step": 241814, "epoch": 1998} {"train_loss": -42.62313461303711, "global_step": 241815, "epoch": 1998} {"train_loss": -42.322174072265625, "global_step": 241816, "epoch": 1998} {"train_loss": -42.14604949951172, "global_step": 241817, "epoch": 1998} {"train_loss": -42.533348083496094, "global_step": 241818, "epoch": 1998} {"train_loss": -42.292877197265625, "global_step": 241819, "epoch": 1998} {"train_loss": -42.69478225708008, "global_step": 241820, "epoch": 1998} {"train_loss": -43.18907165527344, "global_step": 241821, "epoch": 1998} {"train_loss": -42.54711151123047, "global_step": 241822, "epoch": 1998} {"train_loss": -41.383296966552734, "global_step": 241823, "epoch": 1998} {"train_loss": -41.643653869628906, "global_step": 241824, "epoch": 1998} {"train_loss": -42.594932556152344, "global_step": 241825, "epoch": 1998} {"train_loss": -43.01504135131836, "global_step": 241826, "epoch": 1998} {"train_loss": -42.588130950927734, "global_step": 241827, "epoch": 1998} {"train_loss": -42.47333526611328, "global_step": 241828, "epoch": 1998} {"train_loss": -41.93375778198242, "global_step": 241829, "epoch": 1998} {"train_loss": -42.516780853271484, "global_step": 241830, "epoch": 1998} {"train_loss": -41.90694808959961, "global_step": 241831, "epoch": 1998} {"train_loss": -41.68787384033203, "global_step": 241832, "epoch": 1998} {"train_loss": -42.96566390991211, "global_step": 241833, "epoch": 1998} {"train_loss": -41.65632247924805, "global_step": 241834, "epoch": 1998} {"train_loss": -42.592994689941406, "global_step": 241835, "epoch": 1998} {"train_loss": -42.63627243041992, "global_step": 241836, "epoch": 1998} {"train_loss": -42.97506332397461, "global_step": 241837, "epoch": 1998} {"train_loss": -42.445491790771484, "global_step": 241838, "epoch": 1998} {"train_loss": -43.122657775878906, "global_step": 241839, "epoch": 1998} {"train_loss": -41.80810546875, "global_step": 241840, "epoch": 1998} {"train_loss": -40.925987243652344, "global_step": 241841, "epoch": 1998} {"train_loss": -39.503944396972656, "global_step": 241842, "epoch": 1998} {"train_loss": -39.836585998535156, "global_step": 241843, "epoch": 1998} {"train_loss": -40.8847770690918, "global_step": 241844, "epoch": 1998} {"train_loss": -42.002037048339844, "global_step": 241845, "epoch": 1998} {"train_loss": -41.08887481689453, "global_step": 241846, "epoch": 1998} {"train_loss": -40.40327072143555, "global_step": 241847, "epoch": 1998} {"train_loss": -40.479637145996094, "global_step": 241848, "epoch": 1998} {"train_loss": -42.04288864135742, "global_step": 241849, "epoch": 1998} {"train_loss": -39.56968307495117, "global_step": 241850, "epoch": 1998} {"train_loss": -38.94551086425781, "global_step": 241851, "epoch": 1998} {"train_loss": -42.31355285644531, "global_step": 241852, "epoch": 1998} {"train_loss": -38.83932113647461, "global_step": 241853, "epoch": 1998} {"train_loss": -41.3062629699707, "global_step": 241854, "epoch": 1998} {"train_loss": -39.838623046875, "global_step": 241855, "epoch": 1998} {"train_loss": -40.00750732421875, "global_step": 241856, "epoch": 1998} {"train_loss": -41.031280517578125, "global_step": 241857, "epoch": 1998} {"train_loss": -41.3734016418457, "global_step": 241858, "epoch": 1998} {"train_loss": -41.201847076416016, "global_step": 241859, "epoch": 1998} {"train_loss": -41.51386642456055, "global_step": 241860, "epoch": 1998} {"train_loss": -41.627044677734375, "global_step": 241861, "epoch": 1998} {"train_loss": -42.207435607910156, "global_step": 241862, "epoch": 1998} {"train_loss": -42.963600158691406, "global_step": 241863, "epoch": 1998} {"train_loss": -42.11236572265625, "global_step": 241864, "epoch": 1998} {"train_loss": -42.29631423950195, "global_step": 241865, "epoch": 1998} {"train_loss": -40.757930755615234, "global_step": 241866, "epoch": 1998} {"train_loss": -40.39785385131836, "global_step": 241867, "epoch": 1998} {"train_loss": -40.39585876464844, "global_step": 241868, "epoch": 1998} {"train_loss": -40.6556282043457, "global_step": 241869, "epoch": 1998} {"train_loss": -40.80515670776367, "global_step": 241870, "epoch": 1998} {"train_loss": -40.53892135620117, "global_step": 241871, "epoch": 1998} {"train_loss": -40.87491989135742, "global_step": 241872, "epoch": 1998} {"train_loss": -41.20427703857422, "global_step": 241873, "epoch": 1998} {"train_loss": -41.13633346557617, "global_step": 241874, "epoch": 1998} {"train_loss": -40.77107620239258, "global_step": 241875, "epoch": 1998} {"train_loss": -41.47483444213867, "global_step": 241876, "epoch": 1998} {"train_loss": -40.897457122802734, "global_step": 241877, "epoch": 1998} {"train_loss": -41.66482874972761, "global_step": 241878, "epoch": 1998, "val_loss": 2651654.25} {"train_loss": -42.521297454833984, "global_step": 241879, "epoch": 1999} {"train_loss": -40.71873092651367, "global_step": 241880, "epoch": 1999} {"train_loss": -41.780921936035156, "global_step": 241881, "epoch": 1999} {"train_loss": -42.054107666015625, "global_step": 241882, "epoch": 1999} {"train_loss": -40.69404220581055, "global_step": 241883, "epoch": 1999} {"train_loss": -40.66624450683594, "global_step": 241884, "epoch": 1999} {"train_loss": -41.981143951416016, "global_step": 241885, "epoch": 1999} {"train_loss": -40.35030746459961, "global_step": 241886, "epoch": 1999} {"train_loss": -41.85251998901367, "global_step": 241887, "epoch": 1999} {"train_loss": -39.93333053588867, "global_step": 241888, "epoch": 1999} {"train_loss": -40.345638275146484, "global_step": 241889, "epoch": 1999} {"train_loss": -42.05077362060547, "global_step": 241890, "epoch": 1999} {"train_loss": -41.8935432434082, "global_step": 241891, "epoch": 1999} {"train_loss": -42.00613021850586, "global_step": 241892, "epoch": 1999} {"train_loss": -41.43867492675781, "global_step": 241893, "epoch": 1999} {"train_loss": -41.48531723022461, "global_step": 241894, "epoch": 1999} {"train_loss": -41.361148834228516, "global_step": 241895, "epoch": 1999} {"train_loss": -41.7417106628418, "global_step": 241896, "epoch": 1999} {"train_loss": -40.53462600708008, "global_step": 241897, "epoch": 1999} {"train_loss": -41.44027328491211, "global_step": 241898, "epoch": 1999} {"train_loss": -41.8067512512207, "global_step": 241899, "epoch": 1999} {"train_loss": -42.36614990234375, "global_step": 241900, "epoch": 1999} {"train_loss": -41.95027542114258, "global_step": 241901, "epoch": 1999} {"train_loss": -42.344112396240234, "global_step": 241902, "epoch": 1999} {"train_loss": -42.08238220214844, "global_step": 241903, "epoch": 1999} {"train_loss": -42.600341796875, "global_step": 241904, "epoch": 1999} {"train_loss": -42.76210403442383, "global_step": 241905, "epoch": 1999} {"train_loss": -41.824462890625, "global_step": 241906, "epoch": 1999} {"train_loss": -42.54194641113281, "global_step": 241907, "epoch": 1999} {"train_loss": -42.55741500854492, "global_step": 241908, "epoch": 1999} {"train_loss": -42.385009765625, "global_step": 241909, "epoch": 1999} {"train_loss": -42.485862731933594, "global_step": 241910, "epoch": 1999} {"train_loss": -42.4985237121582, "global_step": 241911, "epoch": 1999} {"train_loss": -42.2370719909668, "global_step": 241912, "epoch": 1999} {"train_loss": -42.29633712768555, "global_step": 241913, "epoch": 1999} {"train_loss": -42.81256866455078, "global_step": 241914, "epoch": 1999} {"train_loss": -42.30979919433594, "global_step": 241915, "epoch": 1999} {"train_loss": -42.882930755615234, "global_step": 241916, "epoch": 1999} {"train_loss": -42.75038146972656, "global_step": 241917, "epoch": 1999} {"train_loss": -42.61844253540039, "global_step": 241918, "epoch": 1999} {"train_loss": -41.75664138793945, "global_step": 241919, "epoch": 1999} {"train_loss": -42.643218994140625, "global_step": 241920, "epoch": 1999} {"train_loss": -43.2703857421875, "global_step": 241921, "epoch": 1999} {"train_loss": -42.578163146972656, "global_step": 241922, "epoch": 1999} {"train_loss": -42.76054000854492, "global_step": 241923, "epoch": 1999} {"train_loss": -43.042903900146484, "global_step": 241924, "epoch": 1999} {"train_loss": -42.503170013427734, "global_step": 241925, "epoch": 1999} {"train_loss": -43.38041305541992, "global_step": 241926, "epoch": 1999} {"train_loss": -42.84807205200195, "global_step": 241927, "epoch": 1999} {"train_loss": -42.851566314697266, "global_step": 241928, "epoch": 1999} {"train_loss": -42.879638671875, "global_step": 241929, "epoch": 1999} {"train_loss": -43.518795013427734, "global_step": 241930, "epoch": 1999} {"train_loss": -42.901363372802734, "global_step": 241931, "epoch": 1999} {"train_loss": -43.55126953125, "global_step": 241932, "epoch": 1999} {"train_loss": -43.2748908996582, "global_step": 241933, "epoch": 1999} {"train_loss": -43.1573486328125, "global_step": 241934, "epoch": 1999} {"train_loss": -43.7558708190918, "global_step": 241935, "epoch": 1999} {"train_loss": -43.586387634277344, "global_step": 241936, "epoch": 1999} {"train_loss": -43.45966339111328, "global_step": 241937, "epoch": 1999} {"train_loss": -43.59514236450195, "global_step": 241938, "epoch": 1999} {"train_loss": -43.1932487487793, "global_step": 241939, "epoch": 1999} {"train_loss": -43.415557861328125, "global_step": 241940, "epoch": 1999} {"train_loss": -43.37272644042969, "global_step": 241941, "epoch": 1999} {"train_loss": -43.482879638671875, "global_step": 241942, "epoch": 1999} {"train_loss": -43.03070068359375, "global_step": 241943, "epoch": 1999} {"train_loss": -43.6920280456543, "global_step": 241944, "epoch": 1999} {"train_loss": -43.862789154052734, "global_step": 241945, "epoch": 1999} {"train_loss": -43.2207145690918, "global_step": 241946, "epoch": 1999} {"train_loss": -42.618919372558594, "global_step": 241947, "epoch": 1999} {"train_loss": -42.3407096862793, "global_step": 241948, "epoch": 1999} {"train_loss": -43.27248764038086, "global_step": 241949, "epoch": 1999} {"train_loss": -42.448570251464844, "global_step": 241950, "epoch": 1999} {"train_loss": -41.35703659057617, "global_step": 241951, "epoch": 1999} {"train_loss": -42.516815185546875, "global_step": 241952, "epoch": 1999} {"train_loss": -42.51112365722656, "global_step": 241953, "epoch": 1999} {"train_loss": -41.84139633178711, "global_step": 241954, "epoch": 1999} {"train_loss": -43.213565826416016, "global_step": 241955, "epoch": 1999} {"train_loss": -42.86480712890625, "global_step": 241956, "epoch": 1999} {"train_loss": -41.34721755981445, "global_step": 241957, "epoch": 1999} {"train_loss": -40.72103500366211, "global_step": 241958, "epoch": 1999} {"train_loss": -41.527835845947266, "global_step": 241959, "epoch": 1999} {"train_loss": -42.413848876953125, "global_step": 241960, "epoch": 1999} {"train_loss": -41.8420295715332, "global_step": 241961, "epoch": 1999} {"train_loss": -42.53486251831055, "global_step": 241962, "epoch": 1999} {"train_loss": -42.43807601928711, "global_step": 241963, "epoch": 1999} {"train_loss": -41.3303337097168, "global_step": 241964, "epoch": 1999} {"train_loss": -42.99434280395508, "global_step": 241965, "epoch": 1999} {"train_loss": -43.40815353393555, "global_step": 241966, "epoch": 1999} {"train_loss": -42.35960006713867, "global_step": 241967, "epoch": 1999} {"train_loss": -43.42316818237305, "global_step": 241968, "epoch": 1999} {"train_loss": -42.98335266113281, "global_step": 241969, "epoch": 1999} {"train_loss": -43.09221267700195, "global_step": 241970, "epoch": 1999} {"train_loss": -43.1063346862793, "global_step": 241971, "epoch": 1999} {"train_loss": -43.272705078125, "global_step": 241972, "epoch": 1999} {"train_loss": -42.83477020263672, "global_step": 241973, "epoch": 1999} {"train_loss": -41.77678298950195, "global_step": 241974, "epoch": 1999} {"train_loss": -41.65555953979492, "global_step": 241975, "epoch": 1999} {"train_loss": -41.896095275878906, "global_step": 241976, "epoch": 1999} {"train_loss": -43.14337921142578, "global_step": 241977, "epoch": 1999} {"train_loss": -42.68398666381836, "global_step": 241978, "epoch": 1999} {"train_loss": -41.55575180053711, "global_step": 241979, "epoch": 1999} {"train_loss": -41.99874496459961, "global_step": 241980, "epoch": 1999} {"train_loss": -43.04001998901367, "global_step": 241981, "epoch": 1999} {"train_loss": -43.16053009033203, "global_step": 241982, "epoch": 1999} {"train_loss": -42.81682205200195, "global_step": 241983, "epoch": 1999} {"train_loss": -42.2633171081543, "global_step": 241984, "epoch": 1999} {"train_loss": -42.712520599365234, "global_step": 241985, "epoch": 1999} {"train_loss": -42.730037689208984, "global_step": 241986, "epoch": 1999} {"train_loss": -42.604095458984375, "global_step": 241987, "epoch": 1999} {"train_loss": -42.20842742919922, "global_step": 241988, "epoch": 1999} {"train_loss": -40.34718704223633, "global_step": 241989, "epoch": 1999} {"train_loss": -41.792625427246094, "global_step": 241990, "epoch": 1999} {"train_loss": -42.39484786987305, "global_step": 241991, "epoch": 1999} {"train_loss": -42.42220687866211, "global_step": 241992, "epoch": 1999} {"train_loss": -42.20075607299805, "global_step": 241993, "epoch": 1999} {"train_loss": -42.280113220214844, "global_step": 241994, "epoch": 1999} {"train_loss": -40.420745849609375, "global_step": 241995, "epoch": 1999} {"train_loss": -40.83979415893555, "global_step": 241996, "epoch": 1999} {"train_loss": -41.320220947265625, "global_step": 241997, "epoch": 1999} {"train_loss": -42.3961067199707, "global_step": 241998, "epoch": 1999} {"train_loss": -42.35933792492575, "global_step": 241999, "epoch": 1999, "val_loss": 2678677.0} {"train_loss": -41.973594665527344, "global_step": 242000, "epoch": 2000} {"train_loss": -42.06507110595703, "global_step": 242001, "epoch": 2000} {"train_loss": -41.3068962097168, "global_step": 242002, "epoch": 2000} {"train_loss": -42.765472412109375, "global_step": 242003, "epoch": 2000} {"train_loss": -41.41587829589844, "global_step": 242004, "epoch": 2000} {"train_loss": -41.6744499206543, "global_step": 242005, "epoch": 2000} {"train_loss": -42.480403900146484, "global_step": 242006, "epoch": 2000} {"train_loss": -41.80147933959961, "global_step": 242007, "epoch": 2000} {"train_loss": -40.51066207885742, "global_step": 242008, "epoch": 2000} {"train_loss": -42.52632141113281, "global_step": 242009, "epoch": 2000} {"train_loss": -40.06180953979492, "global_step": 242010, "epoch": 2000} {"train_loss": -39.055213928222656, "global_step": 242011, "epoch": 2000} {"train_loss": -42.27216339111328, "global_step": 242012, "epoch": 2000} {"train_loss": -38.80167770385742, "global_step": 242013, "epoch": 2000} {"train_loss": -41.22968292236328, "global_step": 242014, "epoch": 2000} {"train_loss": -38.50032424926758, "global_step": 242015, "epoch": 2000} {"train_loss": -37.093868255615234, "global_step": 242016, "epoch": 2000} {"train_loss": -39.02426528930664, "global_step": 242017, "epoch": 2000} {"train_loss": -38.509212493896484, "global_step": 242018, "epoch": 2000} {"train_loss": -39.87725830078125, "global_step": 242019, "epoch": 2000} {"train_loss": -39.978878021240234, "global_step": 242020, "epoch": 2000} {"train_loss": -40.468502044677734, "global_step": 242021, "epoch": 2000} {"train_loss": -40.141483306884766, "global_step": 242022, "epoch": 2000} {"train_loss": -40.89441680908203, "global_step": 242023, "epoch": 2000} {"train_loss": -41.67987060546875, "global_step": 242024, "epoch": 2000} {"train_loss": -38.58572006225586, "global_step": 242025, "epoch": 2000} {"train_loss": -40.23490524291992, "global_step": 242026, "epoch": 2000} {"train_loss": -40.77275085449219, "global_step": 242027, "epoch": 2000} {"train_loss": -39.941036224365234, "global_step": 242028, "epoch": 2000} {"train_loss": -39.870880126953125, "global_step": 242029, "epoch": 2000} {"train_loss": -40.98127365112305, "global_step": 242030, "epoch": 2000} {"train_loss": -40.811214447021484, "global_step": 242031, "epoch": 2000} {"train_loss": -41.3447265625, "global_step": 242032, "epoch": 2000} {"train_loss": -40.1169548034668, "global_step": 242033, "epoch": 2000} {"train_loss": -41.15864944458008, "global_step": 242034, "epoch": 2000} {"train_loss": -40.83742904663086, "global_step": 242035, "epoch": 2000} {"train_loss": -40.198421478271484, "global_step": 242036, "epoch": 2000} {"train_loss": -41.40870666503906, "global_step": 242037, "epoch": 2000} {"train_loss": -41.002479553222656, "global_step": 242038, "epoch": 2000} {"train_loss": -41.56789779663086, "global_step": 242039, "epoch": 2000} {"train_loss": -41.846763610839844, "global_step": 242040, "epoch": 2000} {"train_loss": -41.16943359375, "global_step": 242041, "epoch": 2000} {"train_loss": -42.18932342529297, "global_step": 242042, "epoch": 2000} {"train_loss": -42.441226959228516, "global_step": 242043, "epoch": 2000} {"train_loss": -41.53593826293945, "global_step": 242044, "epoch": 2000} {"train_loss": -41.47698211669922, "global_step": 242045, "epoch": 2000} {"train_loss": -42.739280700683594, "global_step": 242046, "epoch": 2000} {"train_loss": -41.79066467285156, "global_step": 242047, "epoch": 2000} {"train_loss": -41.932518005371094, "global_step": 242048, "epoch": 2000} {"train_loss": -42.14583969116211, "global_step": 242049, "epoch": 2000} {"train_loss": -42.51693344116211, "global_step": 242050, "epoch": 2000} {"train_loss": -42.62327194213867, "global_step": 242051, "epoch": 2000} {"train_loss": -42.24775695800781, "global_step": 242052, "epoch": 2000} {"train_loss": -42.83182907104492, "global_step": 242053, "epoch": 2000} {"train_loss": -42.50174331665039, "global_step": 242054, "epoch": 2000} {"train_loss": -42.476444244384766, "global_step": 242055, "epoch": 2000} {"train_loss": -43.08330154418945, "global_step": 242056, "epoch": 2000} {"train_loss": -42.13539123535156, "global_step": 242057, "epoch": 2000} {"train_loss": -43.07548522949219, "global_step": 242058, "epoch": 2000} {"train_loss": -42.74912643432617, "global_step": 242059, "epoch": 2000} {"train_loss": -42.925254821777344, "global_step": 242060, "epoch": 2000} {"train_loss": -43.67631149291992, "global_step": 242061, "epoch": 2000} {"train_loss": -42.66047286987305, "global_step": 242062, "epoch": 2000} {"train_loss": -43.01609420776367, "global_step": 242063, "epoch": 2000} {"train_loss": -43.166988372802734, "global_step": 242064, "epoch": 2000} {"train_loss": -43.54213333129883, "global_step": 242065, "epoch": 2000} {"train_loss": -43.22174072265625, "global_step": 242066, "epoch": 2000} {"train_loss": -43.62583541870117, "global_step": 242067, "epoch": 2000} {"train_loss": -43.11198425292969, "global_step": 242068, "epoch": 2000} {"train_loss": -43.38317108154297, "global_step": 242069, "epoch": 2000} {"train_loss": -43.00698471069336, "global_step": 242070, "epoch": 2000} {"train_loss": -43.485713958740234, "global_step": 242071, "epoch": 2000} {"train_loss": -43.16935348510742, "global_step": 242072, "epoch": 2000} {"train_loss": -43.180355072021484, "global_step": 242073, "epoch": 2000} {"train_loss": -43.3931884765625, "global_step": 242074, "epoch": 2000} {"train_loss": -43.37779235839844, "global_step": 242075, "epoch": 2000} {"train_loss": -42.89118576049805, "global_step": 242076, "epoch": 2000} {"train_loss": -43.35608673095703, "global_step": 242077, "epoch": 2000} {"train_loss": -43.503082275390625, "global_step": 242078, "epoch": 2000} {"train_loss": -43.54861068725586, "global_step": 242079, "epoch": 2000} {"train_loss": -43.6890983581543, "global_step": 242080, "epoch": 2000} {"train_loss": -43.7201042175293, "global_step": 242081, "epoch": 2000} {"train_loss": -43.57381057739258, "global_step": 242082, "epoch": 2000} {"train_loss": -42.827266693115234, "global_step": 242083, "epoch": 2000} {"train_loss": -41.91938400268555, "global_step": 242084, "epoch": 2000} {"train_loss": -43.68571090698242, "global_step": 242085, "epoch": 2000} {"train_loss": -43.2125129699707, "global_step": 242086, "epoch": 2000} {"train_loss": -42.916786193847656, "global_step": 242087, "epoch": 2000} {"train_loss": -41.96474838256836, "global_step": 242088, "epoch": 2000} {"train_loss": -43.657379150390625, "global_step": 242089, "epoch": 2000} {"train_loss": -43.51539993286133, "global_step": 242090, "epoch": 2000} {"train_loss": -43.13752365112305, "global_step": 242091, "epoch": 2000} {"train_loss": -43.27800750732422, "global_step": 242092, "epoch": 2000} {"train_loss": -43.257537841796875, "global_step": 242093, "epoch": 2000} {"train_loss": -42.4167594909668, "global_step": 242094, "epoch": 2000} {"train_loss": -42.0376091003418, "global_step": 242095, "epoch": 2000} {"train_loss": -43.463218688964844, "global_step": 242096, "epoch": 2000} {"train_loss": -42.56965255737305, "global_step": 242097, "epoch": 2000} {"train_loss": -41.98260498046875, "global_step": 242098, "epoch": 2000} {"train_loss": -42.443275451660156, "global_step": 242099, "epoch": 2000} {"train_loss": -40.2128791809082, "global_step": 242100, "epoch": 2000} {"train_loss": -43.6268424987793, "global_step": 242101, "epoch": 2000} {"train_loss": -41.060821533203125, "global_step": 242102, "epoch": 2000} {"train_loss": -40.12601852416992, "global_step": 242103, "epoch": 2000} {"train_loss": -42.161155700683594, "global_step": 242104, "epoch": 2000} {"train_loss": -38.133968353271484, "global_step": 242105, "epoch": 2000} {"train_loss": -39.80265808105469, "global_step": 242106, "epoch": 2000} {"train_loss": -40.81406021118164, "global_step": 242107, "epoch": 2000} {"train_loss": -38.65034103393555, "global_step": 242108, "epoch": 2000} {"train_loss": -41.14912796020508, "global_step": 242109, "epoch": 2000} {"train_loss": -38.35787582397461, "global_step": 242110, "epoch": 2000} {"train_loss": -40.835445404052734, "global_step": 242111, "epoch": 2000} {"train_loss": -39.069549560546875, "global_step": 242112, "epoch": 2000} {"train_loss": -40.33062744140625, "global_step": 242113, "epoch": 2000} {"train_loss": -39.89276885986328, "global_step": 242114, "epoch": 2000} {"train_loss": -41.322235107421875, "global_step": 242115, "epoch": 2000} {"train_loss": -38.69927215576172, "global_step": 242116, "epoch": 2000} {"train_loss": -41.470703125, "global_step": 242117, "epoch": 2000} {"train_loss": -40.269527435302734, "global_step": 242118, "epoch": 2000} {"train_loss": -41.19386672973633, "global_step": 242119, "epoch": 2000} {"train_loss": -41.67715280706232, "global_step": 242120, "epoch": 2000, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2685722.75} {"train_loss": -42.567386627197266, "global_step": 242121, "epoch": 2001} {"train_loss": -39.79996871948242, "global_step": 242122, "epoch": 2001} {"train_loss": -41.15690994262695, "global_step": 242123, "epoch": 2001} {"train_loss": -41.49047088623047, "global_step": 242124, "epoch": 2001} {"train_loss": -41.695465087890625, "global_step": 242125, "epoch": 2001} {"train_loss": -40.14750289916992, "global_step": 242126, "epoch": 2001} {"train_loss": -42.087493896484375, "global_step": 242127, "epoch": 2001} {"train_loss": -40.83291244506836, "global_step": 242128, "epoch": 2001} {"train_loss": -41.405879974365234, "global_step": 242129, "epoch": 2001} {"train_loss": -41.6912956237793, "global_step": 242130, "epoch": 2001} {"train_loss": -40.86357116699219, "global_step": 242131, "epoch": 2001} {"train_loss": -42.05839157104492, "global_step": 242132, "epoch": 2001} {"train_loss": -40.83649826049805, "global_step": 242133, "epoch": 2001} {"train_loss": -41.38216018676758, "global_step": 242134, "epoch": 2001} {"train_loss": -41.70621871948242, "global_step": 242135, "epoch": 2001} {"train_loss": -41.56351089477539, "global_step": 242136, "epoch": 2001} {"train_loss": -40.087303161621094, "global_step": 242137, "epoch": 2001} {"train_loss": -41.50648880004883, "global_step": 242138, "epoch": 2001} {"train_loss": -38.86224365234375, "global_step": 242139, "epoch": 2001} {"train_loss": -41.759185791015625, "global_step": 242140, "epoch": 2001} {"train_loss": -37.6700325012207, "global_step": 242141, "epoch": 2001} {"train_loss": -41.19418716430664, "global_step": 242142, "epoch": 2001} {"train_loss": -36.42694091796875, "global_step": 242143, "epoch": 2001} {"train_loss": -41.759517669677734, "global_step": 242144, "epoch": 2001} {"train_loss": -38.05107879638672, "global_step": 242145, "epoch": 2001} {"train_loss": -40.49613571166992, "global_step": 242146, "epoch": 2001} {"train_loss": -38.259620666503906, "global_step": 242147, "epoch": 2001} {"train_loss": -40.24306869506836, "global_step": 242148, "epoch": 2001} {"train_loss": -39.30559158325195, "global_step": 242149, "epoch": 2001} {"train_loss": -41.39169692993164, "global_step": 242150, "epoch": 2001} {"train_loss": -40.288814544677734, "global_step": 242151, "epoch": 2001} {"train_loss": -41.514766693115234, "global_step": 242152, "epoch": 2001} {"train_loss": -40.166107177734375, "global_step": 242153, "epoch": 2001} {"train_loss": -41.99674606323242, "global_step": 242154, "epoch": 2001} {"train_loss": -40.42057418823242, "global_step": 242155, "epoch": 2001} {"train_loss": -41.740570068359375, "global_step": 242156, "epoch": 2001} {"train_loss": -41.86198043823242, "global_step": 242157, "epoch": 2001} {"train_loss": -42.48189926147461, "global_step": 242158, "epoch": 2001} {"train_loss": -41.76966857910156, "global_step": 242159, "epoch": 2001} {"train_loss": -42.73918533325195, "global_step": 242160, "epoch": 2001} {"train_loss": -41.19614791870117, "global_step": 242161, "epoch": 2001} {"train_loss": -42.72693634033203, "global_step": 242162, "epoch": 2001} {"train_loss": -41.713958740234375, "global_step": 242163, "epoch": 2001} {"train_loss": -42.791603088378906, "global_step": 242164, "epoch": 2001} {"train_loss": -42.0663948059082, "global_step": 242165, "epoch": 2001} {"train_loss": -42.39959716796875, "global_step": 242166, "epoch": 2001} {"train_loss": -42.15461349487305, "global_step": 242167, "epoch": 2001} {"train_loss": -42.14248275756836, "global_step": 242168, "epoch": 2001} {"train_loss": -42.69399642944336, "global_step": 242169, "epoch": 2001} {"train_loss": -42.27821731567383, "global_step": 242170, "epoch": 2001} {"train_loss": -42.66378402709961, "global_step": 242171, "epoch": 2001} {"train_loss": -42.54644012451172, "global_step": 242172, "epoch": 2001} {"train_loss": -42.99873352050781, "global_step": 242173, "epoch": 2001} {"train_loss": -42.80303955078125, "global_step": 242174, "epoch": 2001} {"train_loss": -42.77019119262695, "global_step": 242175, "epoch": 2001} {"train_loss": -43.200984954833984, "global_step": 242176, "epoch": 2001} {"train_loss": -42.5523796081543, "global_step": 242177, "epoch": 2001} {"train_loss": -43.33079147338867, "global_step": 242178, "epoch": 2001} {"train_loss": -42.910072326660156, "global_step": 242179, "epoch": 2001} {"train_loss": -42.509986877441406, "global_step": 242180, "epoch": 2001} {"train_loss": -43.267208099365234, "global_step": 242181, "epoch": 2001} {"train_loss": -42.61905288696289, "global_step": 242182, "epoch": 2001} {"train_loss": -43.159889221191406, "global_step": 242183, "epoch": 2001} {"train_loss": -42.54933547973633, "global_step": 242184, "epoch": 2001} {"train_loss": -43.349273681640625, "global_step": 242185, "epoch": 2001} {"train_loss": -42.34260177612305, "global_step": 242186, "epoch": 2001} {"train_loss": -42.564552307128906, "global_step": 242187, "epoch": 2001} {"train_loss": -42.931419372558594, "global_step": 242188, "epoch": 2001} {"train_loss": -41.529781341552734, "global_step": 242189, "epoch": 2001} {"train_loss": -42.6960334777832, "global_step": 242190, "epoch": 2001} {"train_loss": -43.453712463378906, "global_step": 242191, "epoch": 2001} {"train_loss": -43.37512969970703, "global_step": 242192, "epoch": 2001} {"train_loss": -42.8277702331543, "global_step": 242193, "epoch": 2001} {"train_loss": -42.8096923828125, "global_step": 242194, "epoch": 2001} {"train_loss": -43.053592681884766, "global_step": 242195, "epoch": 2001} {"train_loss": -43.48189926147461, "global_step": 242196, "epoch": 2001} {"train_loss": -43.55546188354492, "global_step": 242197, "epoch": 2001} {"train_loss": -43.84003448486328, "global_step": 242198, "epoch": 2001} {"train_loss": -43.32166290283203, "global_step": 242199, "epoch": 2001} {"train_loss": -42.98828887939453, "global_step": 242200, "epoch": 2001} {"train_loss": -43.087398529052734, "global_step": 242201, "epoch": 2001} {"train_loss": -42.86618423461914, "global_step": 242202, "epoch": 2001} {"train_loss": -42.64611053466797, "global_step": 242203, "epoch": 2001} {"train_loss": -43.1083869934082, "global_step": 242204, "epoch": 2001} {"train_loss": -43.417415618896484, "global_step": 242205, "epoch": 2001} {"train_loss": -43.80634689331055, "global_step": 242206, "epoch": 2001} {"train_loss": -42.940006256103516, "global_step": 242207, "epoch": 2001} {"train_loss": -41.746212005615234, "global_step": 242208, "epoch": 2001} {"train_loss": -43.02517318725586, "global_step": 242209, "epoch": 2001} {"train_loss": -44.03070068359375, "global_step": 242210, "epoch": 2001} {"train_loss": -43.840579986572266, "global_step": 242211, "epoch": 2001} {"train_loss": -43.53742218017578, "global_step": 242212, "epoch": 2001} {"train_loss": -40.898983001708984, "global_step": 242213, "epoch": 2001} {"train_loss": -41.059722900390625, "global_step": 242214, "epoch": 2001} {"train_loss": -43.6193962097168, "global_step": 242215, "epoch": 2001} {"train_loss": -40.475128173828125, "global_step": 242216, "epoch": 2001} {"train_loss": -42.75747299194336, "global_step": 242217, "epoch": 2001} {"train_loss": -42.497901916503906, "global_step": 242218, "epoch": 2001} {"train_loss": -40.49811935424805, "global_step": 242219, "epoch": 2001} {"train_loss": -43.67692184448242, "global_step": 242220, "epoch": 2001} {"train_loss": -41.31840896606445, "global_step": 242221, "epoch": 2001} {"train_loss": -41.24828338623047, "global_step": 242222, "epoch": 2001} {"train_loss": -42.88283920288086, "global_step": 242223, "epoch": 2001} {"train_loss": -41.437225341796875, "global_step": 242224, "epoch": 2001} {"train_loss": -42.27663040161133, "global_step": 242225, "epoch": 2001} {"train_loss": -43.53566360473633, "global_step": 242226, "epoch": 2001} {"train_loss": -42.116153717041016, "global_step": 242227, "epoch": 2001} {"train_loss": -42.12932586669922, "global_step": 242228, "epoch": 2001} {"train_loss": -42.87580490112305, "global_step": 242229, "epoch": 2001} {"train_loss": -41.494384765625, "global_step": 242230, "epoch": 2001} {"train_loss": -42.982460021972656, "global_step": 242231, "epoch": 2001} {"train_loss": -41.530643463134766, "global_step": 242232, "epoch": 2001} {"train_loss": -43.316497802734375, "global_step": 242233, "epoch": 2001} {"train_loss": -42.470455169677734, "global_step": 242234, "epoch": 2001} {"train_loss": -42.17094421386719, "global_step": 242235, "epoch": 2001} {"train_loss": -43.18606948852539, "global_step": 242236, "epoch": 2001} {"train_loss": -42.14832305908203, "global_step": 242237, "epoch": 2001} {"train_loss": -41.77800369262695, "global_step": 242238, "epoch": 2001} {"train_loss": -41.92512893676758, "global_step": 242239, "epoch": 2001} {"train_loss": -41.85106658935547, "global_step": 242240, "epoch": 2001} {"train_loss": -42.02237285267223, "global_step": 242241, "epoch": 2001, "val_loss": 2677328.75} {"train_loss": -42.57241439819336, "global_step": 242242, "epoch": 2002} {"train_loss": -40.76450729370117, "global_step": 242243, "epoch": 2002} {"train_loss": -42.676265716552734, "global_step": 242244, "epoch": 2002} {"train_loss": -42.020198822021484, "global_step": 242245, "epoch": 2002} {"train_loss": -40.95390701293945, "global_step": 242246, "epoch": 2002} {"train_loss": -42.11448287963867, "global_step": 242247, "epoch": 2002} {"train_loss": -41.421199798583984, "global_step": 242248, "epoch": 2002} {"train_loss": -41.17239761352539, "global_step": 242249, "epoch": 2002} {"train_loss": -41.682350158691406, "global_step": 242250, "epoch": 2002} {"train_loss": -41.0594367980957, "global_step": 242251, "epoch": 2002} {"train_loss": -42.577144622802734, "global_step": 242252, "epoch": 2002} {"train_loss": -41.37870407104492, "global_step": 242253, "epoch": 2002} {"train_loss": -41.86163330078125, "global_step": 242254, "epoch": 2002} {"train_loss": -40.112510681152344, "global_step": 242255, "epoch": 2002} {"train_loss": -42.192562103271484, "global_step": 242256, "epoch": 2002} {"train_loss": -40.08833694458008, "global_step": 242257, "epoch": 2002} {"train_loss": -41.70586013793945, "global_step": 242258, "epoch": 2002} {"train_loss": -42.32339096069336, "global_step": 242259, "epoch": 2002} {"train_loss": -40.35223388671875, "global_step": 242260, "epoch": 2002} {"train_loss": -42.08389663696289, "global_step": 242261, "epoch": 2002} {"train_loss": -37.84175491333008, "global_step": 242262, "epoch": 2002} {"train_loss": -42.69492721557617, "global_step": 242263, "epoch": 2002} {"train_loss": -40.55790710449219, "global_step": 242264, "epoch": 2002} {"train_loss": -42.097373962402344, "global_step": 242265, "epoch": 2002} {"train_loss": -42.02617645263672, "global_step": 242266, "epoch": 2002} {"train_loss": -40.697906494140625, "global_step": 242267, "epoch": 2002} {"train_loss": -42.12662887573242, "global_step": 242268, "epoch": 2002} {"train_loss": -42.308143615722656, "global_step": 242269, "epoch": 2002} {"train_loss": -42.074981689453125, "global_step": 242270, "epoch": 2002} {"train_loss": -42.428123474121094, "global_step": 242271, "epoch": 2002} {"train_loss": -41.30814743041992, "global_step": 242272, "epoch": 2002} {"train_loss": -42.385475158691406, "global_step": 242273, "epoch": 2002} {"train_loss": -41.616981506347656, "global_step": 242274, "epoch": 2002} {"train_loss": -41.927001953125, "global_step": 242275, "epoch": 2002} {"train_loss": -40.896419525146484, "global_step": 242276, "epoch": 2002} {"train_loss": -42.16147994995117, "global_step": 242277, "epoch": 2002} {"train_loss": -40.70969772338867, "global_step": 242278, "epoch": 2002} {"train_loss": -41.47282791137695, "global_step": 242279, "epoch": 2002} {"train_loss": -42.02933883666992, "global_step": 242280, "epoch": 2002} {"train_loss": -41.16481399536133, "global_step": 242281, "epoch": 2002} {"train_loss": -41.96371841430664, "global_step": 242282, "epoch": 2002} {"train_loss": -42.65966796875, "global_step": 242283, "epoch": 2002} {"train_loss": -42.342681884765625, "global_step": 242284, "epoch": 2002} {"train_loss": -42.993812561035156, "global_step": 242285, "epoch": 2002} {"train_loss": -42.7947998046875, "global_step": 242286, "epoch": 2002} {"train_loss": -43.35590362548828, "global_step": 242287, "epoch": 2002} {"train_loss": -42.73672866821289, "global_step": 242288, "epoch": 2002} {"train_loss": -42.72761917114258, "global_step": 242289, "epoch": 2002} {"train_loss": -43.00055694580078, "global_step": 242290, "epoch": 2002} {"train_loss": -43.2118034362793, "global_step": 242291, "epoch": 2002} {"train_loss": -42.69122314453125, "global_step": 242292, "epoch": 2002} {"train_loss": -42.98960876464844, "global_step": 242293, "epoch": 2002} {"train_loss": -43.14448165893555, "global_step": 242294, "epoch": 2002} {"train_loss": -42.29403305053711, "global_step": 242295, "epoch": 2002} {"train_loss": -42.911319732666016, "global_step": 242296, "epoch": 2002} {"train_loss": -43.767486572265625, "global_step": 242297, "epoch": 2002} {"train_loss": -41.888771057128906, "global_step": 242298, "epoch": 2002} {"train_loss": -43.12059783935547, "global_step": 242299, "epoch": 2002} {"train_loss": -41.73442459106445, "global_step": 242300, "epoch": 2002} {"train_loss": -43.144317626953125, "global_step": 242301, "epoch": 2002} {"train_loss": -43.09221267700195, "global_step": 242302, "epoch": 2002} {"train_loss": -42.60059356689453, "global_step": 242303, "epoch": 2002} {"train_loss": -42.541770935058594, "global_step": 242304, "epoch": 2002} {"train_loss": -43.62998580932617, "global_step": 242305, "epoch": 2002} {"train_loss": -42.18278121948242, "global_step": 242306, "epoch": 2002} {"train_loss": -42.800296783447266, "global_step": 242307, "epoch": 2002} {"train_loss": -41.73221969604492, "global_step": 242308, "epoch": 2002} {"train_loss": -42.518104553222656, "global_step": 242309, "epoch": 2002} {"train_loss": -43.08077621459961, "global_step": 242310, "epoch": 2002} {"train_loss": -42.12690353393555, "global_step": 242311, "epoch": 2002} {"train_loss": -41.90995407104492, "global_step": 242312, "epoch": 2002} {"train_loss": -43.11985778808594, "global_step": 242313, "epoch": 2002} {"train_loss": -41.802886962890625, "global_step": 242314, "epoch": 2002} {"train_loss": -42.80903244018555, "global_step": 242315, "epoch": 2002} {"train_loss": -42.91357421875, "global_step": 242316, "epoch": 2002} {"train_loss": -41.539119720458984, "global_step": 242317, "epoch": 2002} {"train_loss": -42.88653564453125, "global_step": 242318, "epoch": 2002} {"train_loss": -43.71049880981445, "global_step": 242319, "epoch": 2002} {"train_loss": -42.75838088989258, "global_step": 242320, "epoch": 2002} {"train_loss": -43.56631088256836, "global_step": 242321, "epoch": 2002} {"train_loss": -42.863319396972656, "global_step": 242322, "epoch": 2002} {"train_loss": -42.416996002197266, "global_step": 242323, "epoch": 2002} {"train_loss": -43.227882385253906, "global_step": 242324, "epoch": 2002} {"train_loss": -43.12859344482422, "global_step": 242325, "epoch": 2002} {"train_loss": -42.73041534423828, "global_step": 242326, "epoch": 2002} {"train_loss": -43.384918212890625, "global_step": 242327, "epoch": 2002} {"train_loss": -43.29897689819336, "global_step": 242328, "epoch": 2002} {"train_loss": -43.23067092895508, "global_step": 242329, "epoch": 2002} {"train_loss": -43.90087890625, "global_step": 242330, "epoch": 2002} {"train_loss": -43.075408935546875, "global_step": 242331, "epoch": 2002} {"train_loss": -43.06846618652344, "global_step": 242332, "epoch": 2002} {"train_loss": -43.25263214111328, "global_step": 242333, "epoch": 2002} {"train_loss": -43.836212158203125, "global_step": 242334, "epoch": 2002} {"train_loss": -43.357521057128906, "global_step": 242335, "epoch": 2002} {"train_loss": -43.7004280090332, "global_step": 242336, "epoch": 2002} {"train_loss": -43.58219528198242, "global_step": 242337, "epoch": 2002} {"train_loss": -43.482025146484375, "global_step": 242338, "epoch": 2002} {"train_loss": -42.908729553222656, "global_step": 242339, "epoch": 2002} {"train_loss": -42.98362350463867, "global_step": 242340, "epoch": 2002} {"train_loss": -43.15462875366211, "global_step": 242341, "epoch": 2002} {"train_loss": -42.465511322021484, "global_step": 242342, "epoch": 2002} {"train_loss": -42.80428695678711, "global_step": 242343, "epoch": 2002} {"train_loss": -43.52734375, "global_step": 242344, "epoch": 2002} {"train_loss": -43.13763427734375, "global_step": 242345, "epoch": 2002} {"train_loss": -43.03974533081055, "global_step": 242346, "epoch": 2002} {"train_loss": -43.37295150756836, "global_step": 242347, "epoch": 2002} {"train_loss": -42.26408767700195, "global_step": 242348, "epoch": 2002} {"train_loss": -42.623626708984375, "global_step": 242349, "epoch": 2002} {"train_loss": -43.38346481323242, "global_step": 242350, "epoch": 2002} {"train_loss": -42.810035705566406, "global_step": 242351, "epoch": 2002} {"train_loss": -41.941471099853516, "global_step": 242352, "epoch": 2002} {"train_loss": -43.53425216674805, "global_step": 242353, "epoch": 2002} {"train_loss": -43.27405548095703, "global_step": 242354, "epoch": 2002} {"train_loss": -42.710933685302734, "global_step": 242355, "epoch": 2002} {"train_loss": -41.1053466796875, "global_step": 242356, "epoch": 2002} {"train_loss": -42.37385177612305, "global_step": 242357, "epoch": 2002} {"train_loss": -43.5988655090332, "global_step": 242358, "epoch": 2002} {"train_loss": -42.88532257080078, "global_step": 242359, "epoch": 2002} {"train_loss": -41.723541259765625, "global_step": 242360, "epoch": 2002} {"train_loss": -43.60608673095703, "global_step": 242361, "epoch": 2002} {"train_loss": -42.42830405747595, "global_step": 242362, "epoch": 2002, "val_loss": 2665675.5} {"train_loss": -42.14689254760742, "global_step": 242363, "epoch": 2003} {"train_loss": -43.06073760986328, "global_step": 242364, "epoch": 2003} {"train_loss": -42.10164260864258, "global_step": 242365, "epoch": 2003} {"train_loss": -42.00249099731445, "global_step": 242366, "epoch": 2003} {"train_loss": -43.01668167114258, "global_step": 242367, "epoch": 2003} {"train_loss": -41.19720458984375, "global_step": 242368, "epoch": 2003} {"train_loss": -41.64730453491211, "global_step": 242369, "epoch": 2003} {"train_loss": -43.23036575317383, "global_step": 242370, "epoch": 2003} {"train_loss": -42.1963005065918, "global_step": 242371, "epoch": 2003} {"train_loss": -40.81633758544922, "global_step": 242372, "epoch": 2003} {"train_loss": -42.6202278137207, "global_step": 242373, "epoch": 2003} {"train_loss": -42.353431701660156, "global_step": 242374, "epoch": 2003} {"train_loss": -42.846839904785156, "global_step": 242375, "epoch": 2003} {"train_loss": -42.96210861206055, "global_step": 242376, "epoch": 2003} {"train_loss": -42.48898696899414, "global_step": 242377, "epoch": 2003} {"train_loss": -42.59708786010742, "global_step": 242378, "epoch": 2003} {"train_loss": -40.99567413330078, "global_step": 242379, "epoch": 2003} {"train_loss": -43.26251983642578, "global_step": 242380, "epoch": 2003} {"train_loss": -41.542110443115234, "global_step": 242381, "epoch": 2003} {"train_loss": -41.92441177368164, "global_step": 242382, "epoch": 2003} {"train_loss": -43.0152587890625, "global_step": 242383, "epoch": 2003} {"train_loss": -40.55532455444336, "global_step": 242384, "epoch": 2003} {"train_loss": -41.29916000366211, "global_step": 242385, "epoch": 2003} {"train_loss": -42.39381790161133, "global_step": 242386, "epoch": 2003} {"train_loss": -41.55194854736328, "global_step": 242387, "epoch": 2003} {"train_loss": -42.163570404052734, "global_step": 242388, "epoch": 2003} {"train_loss": -38.624507904052734, "global_step": 242389, "epoch": 2003} {"train_loss": -39.30683517456055, "global_step": 242390, "epoch": 2003} {"train_loss": -41.05659103393555, "global_step": 242391, "epoch": 2003} {"train_loss": -38.6685905456543, "global_step": 242392, "epoch": 2003} {"train_loss": -40.87691879272461, "global_step": 242393, "epoch": 2003} {"train_loss": -37.3856086730957, "global_step": 242394, "epoch": 2003} {"train_loss": -41.195289611816406, "global_step": 242395, "epoch": 2003} {"train_loss": -38.9354362487793, "global_step": 242396, "epoch": 2003} {"train_loss": -32.5056266784668, "global_step": 242397, "epoch": 2003} {"train_loss": -37.77992630004883, "global_step": 242398, "epoch": 2003} {"train_loss": -38.12174987792969, "global_step": 242399, "epoch": 2003} {"train_loss": -35.6348762512207, "global_step": 242400, "epoch": 2003} {"train_loss": -37.34908676147461, "global_step": 242401, "epoch": 2003} {"train_loss": -37.151451110839844, "global_step": 242402, "epoch": 2003} {"train_loss": -39.169734954833984, "global_step": 242403, "epoch": 2003} {"train_loss": -38.328853607177734, "global_step": 242404, "epoch": 2003} {"train_loss": -40.47956466674805, "global_step": 242405, "epoch": 2003} {"train_loss": -38.460792541503906, "global_step": 242406, "epoch": 2003} {"train_loss": -36.6527099609375, "global_step": 242407, "epoch": 2003} {"train_loss": -39.11208724975586, "global_step": 242408, "epoch": 2003} {"train_loss": -37.68186569213867, "global_step": 242409, "epoch": 2003} {"train_loss": -39.05070114135742, "global_step": 242410, "epoch": 2003} {"train_loss": -39.54366683959961, "global_step": 242411, "epoch": 2003} {"train_loss": -39.509822845458984, "global_step": 242412, "epoch": 2003} {"train_loss": -40.28363800048828, "global_step": 242413, "epoch": 2003} {"train_loss": -38.706539154052734, "global_step": 242414, "epoch": 2003} {"train_loss": -41.76564407348633, "global_step": 242415, "epoch": 2003} {"train_loss": -40.43012619018555, "global_step": 242416, "epoch": 2003} {"train_loss": -41.69747543334961, "global_step": 242417, "epoch": 2003} {"train_loss": -40.43792724609375, "global_step": 242418, "epoch": 2003} {"train_loss": -41.53469467163086, "global_step": 242419, "epoch": 2003} {"train_loss": -39.554500579833984, "global_step": 242420, "epoch": 2003} {"train_loss": -40.4915885925293, "global_step": 242421, "epoch": 2003} {"train_loss": -41.343711853027344, "global_step": 242422, "epoch": 2003} {"train_loss": -40.73908615112305, "global_step": 242423, "epoch": 2003} {"train_loss": -41.751277923583984, "global_step": 242424, "epoch": 2003} {"train_loss": -41.338260650634766, "global_step": 242425, "epoch": 2003} {"train_loss": -41.81074905395508, "global_step": 242426, "epoch": 2003} {"train_loss": -42.186767578125, "global_step": 242427, "epoch": 2003} {"train_loss": -41.864559173583984, "global_step": 242428, "epoch": 2003} {"train_loss": -41.93693542480469, "global_step": 242429, "epoch": 2003} {"train_loss": -41.51226043701172, "global_step": 242430, "epoch": 2003} {"train_loss": -41.9180908203125, "global_step": 242431, "epoch": 2003} {"train_loss": -41.911651611328125, "global_step": 242432, "epoch": 2003} {"train_loss": -41.8266487121582, "global_step": 242433, "epoch": 2003} {"train_loss": -42.84008026123047, "global_step": 242434, "epoch": 2003} {"train_loss": -42.377681732177734, "global_step": 242435, "epoch": 2003} {"train_loss": -42.648597717285156, "global_step": 242436, "epoch": 2003} {"train_loss": -41.44318771362305, "global_step": 242437, "epoch": 2003} {"train_loss": -42.24787139892578, "global_step": 242438, "epoch": 2003} {"train_loss": -42.11698532104492, "global_step": 242439, "epoch": 2003} {"train_loss": -42.272212982177734, "global_step": 242440, "epoch": 2003} {"train_loss": -42.64997100830078, "global_step": 242441, "epoch": 2003} {"train_loss": -42.51969909667969, "global_step": 242442, "epoch": 2003} {"train_loss": -42.58115768432617, "global_step": 242443, "epoch": 2003} {"train_loss": -42.31908416748047, "global_step": 242444, "epoch": 2003} {"train_loss": -42.95218276977539, "global_step": 242445, "epoch": 2003} {"train_loss": -42.34275436401367, "global_step": 242446, "epoch": 2003} {"train_loss": -42.8140754699707, "global_step": 242447, "epoch": 2003} {"train_loss": -42.59623336791992, "global_step": 242448, "epoch": 2003} {"train_loss": -42.50669479370117, "global_step": 242449, "epoch": 2003} {"train_loss": -43.07863998413086, "global_step": 242450, "epoch": 2003} {"train_loss": -43.42438507080078, "global_step": 242451, "epoch": 2003} {"train_loss": -42.679805755615234, "global_step": 242452, "epoch": 2003} {"train_loss": -42.83565139770508, "global_step": 242453, "epoch": 2003} {"train_loss": -42.56466293334961, "global_step": 242454, "epoch": 2003} {"train_loss": -43.0238037109375, "global_step": 242455, "epoch": 2003} {"train_loss": -43.263858795166016, "global_step": 242456, "epoch": 2003} {"train_loss": -43.10163497924805, "global_step": 242457, "epoch": 2003} {"train_loss": -42.111820220947266, "global_step": 242458, "epoch": 2003} {"train_loss": -43.46854782104492, "global_step": 242459, "epoch": 2003} {"train_loss": -43.08927536010742, "global_step": 242460, "epoch": 2003} {"train_loss": -43.175384521484375, "global_step": 242461, "epoch": 2003} {"train_loss": -43.678070068359375, "global_step": 242462, "epoch": 2003} {"train_loss": -43.4588623046875, "global_step": 242463, "epoch": 2003} {"train_loss": -43.19376754760742, "global_step": 242464, "epoch": 2003} {"train_loss": -43.35107421875, "global_step": 242465, "epoch": 2003} {"train_loss": -41.687835693359375, "global_step": 242466, "epoch": 2003} {"train_loss": -42.90155792236328, "global_step": 242467, "epoch": 2003} {"train_loss": -43.810630798339844, "global_step": 242468, "epoch": 2003} {"train_loss": -42.864837646484375, "global_step": 242469, "epoch": 2003} {"train_loss": -42.553951263427734, "global_step": 242470, "epoch": 2003} {"train_loss": -43.2833366394043, "global_step": 242471, "epoch": 2003} {"train_loss": -43.34627151489258, "global_step": 242472, "epoch": 2003} {"train_loss": -43.768489837646484, "global_step": 242473, "epoch": 2003} {"train_loss": -43.22946548461914, "global_step": 242474, "epoch": 2003} {"train_loss": -43.32787322998047, "global_step": 242475, "epoch": 2003} {"train_loss": -43.82697677612305, "global_step": 242476, "epoch": 2003} {"train_loss": -43.915706634521484, "global_step": 242477, "epoch": 2003} {"train_loss": -43.33334732055664, "global_step": 242478, "epoch": 2003} {"train_loss": -43.57698059082031, "global_step": 242479, "epoch": 2003} {"train_loss": -43.38650894165039, "global_step": 242480, "epoch": 2003} {"train_loss": -43.90187454223633, "global_step": 242481, "epoch": 2003} {"train_loss": -42.59892654418945, "global_step": 242482, "epoch": 2003} {"train_loss": -41.575386520259634, "global_step": 242483, "epoch": 2003, "val_loss": 2676173.75} {"train_loss": -43.65045166015625, "global_step": 242484, "epoch": 2004} {"train_loss": -43.305294036865234, "global_step": 242485, "epoch": 2004} {"train_loss": -42.602474212646484, "global_step": 242486, "epoch": 2004} {"train_loss": -43.00404739379883, "global_step": 242487, "epoch": 2004} {"train_loss": -43.56608581542969, "global_step": 242488, "epoch": 2004} {"train_loss": -42.3968505859375, "global_step": 242489, "epoch": 2004} {"train_loss": -40.584205627441406, "global_step": 242490, "epoch": 2004} {"train_loss": -39.414241790771484, "global_step": 242491, "epoch": 2004} {"train_loss": -42.5156364440918, "global_step": 242492, "epoch": 2004} {"train_loss": -43.3264274597168, "global_step": 242493, "epoch": 2004} {"train_loss": -43.361629486083984, "global_step": 242494, "epoch": 2004} {"train_loss": -42.79973220825195, "global_step": 242495, "epoch": 2004} {"train_loss": -42.99622344970703, "global_step": 242496, "epoch": 2004} {"train_loss": -41.93989181518555, "global_step": 242497, "epoch": 2004} {"train_loss": -43.37190628051758, "global_step": 242498, "epoch": 2004} {"train_loss": -42.53413009643555, "global_step": 242499, "epoch": 2004} {"train_loss": -40.785640716552734, "global_step": 242500, "epoch": 2004} {"train_loss": -36.67560958862305, "global_step": 242501, "epoch": 2004} {"train_loss": -37.32259750366211, "global_step": 242502, "epoch": 2004} {"train_loss": -38.32636260986328, "global_step": 242503, "epoch": 2004} {"train_loss": -38.23116683959961, "global_step": 242504, "epoch": 2004} {"train_loss": -38.437896728515625, "global_step": 242505, "epoch": 2004} {"train_loss": -39.00734329223633, "global_step": 242506, "epoch": 2004} {"train_loss": -38.080238342285156, "global_step": 242507, "epoch": 2004} {"train_loss": -38.94277572631836, "global_step": 242508, "epoch": 2004} {"train_loss": -39.524169921875, "global_step": 242509, "epoch": 2004} {"train_loss": -38.37065505981445, "global_step": 242510, "epoch": 2004} {"train_loss": -39.025997161865234, "global_step": 242511, "epoch": 2004} {"train_loss": -39.296138763427734, "global_step": 242512, "epoch": 2004} {"train_loss": -39.93679428100586, "global_step": 242513, "epoch": 2004} {"train_loss": -41.514705657958984, "global_step": 242514, "epoch": 2004} {"train_loss": -39.63725280761719, "global_step": 242515, "epoch": 2004} {"train_loss": -40.71734619140625, "global_step": 242516, "epoch": 2004} {"train_loss": -41.3082275390625, "global_step": 242517, "epoch": 2004} {"train_loss": -41.56511688232422, "global_step": 242518, "epoch": 2004} {"train_loss": -42.645015716552734, "global_step": 242519, "epoch": 2004} {"train_loss": -41.99482345581055, "global_step": 242520, "epoch": 2004} {"train_loss": -41.70448684692383, "global_step": 242521, "epoch": 2004} {"train_loss": -42.29067611694336, "global_step": 242522, "epoch": 2004} {"train_loss": -42.086605072021484, "global_step": 242523, "epoch": 2004} {"train_loss": -41.74079132080078, "global_step": 242524, "epoch": 2004} {"train_loss": -41.24956130981445, "global_step": 242525, "epoch": 2004} {"train_loss": -41.607421875, "global_step": 242526, "epoch": 2004} {"train_loss": -42.908447265625, "global_step": 242527, "epoch": 2004} {"train_loss": -41.96918869018555, "global_step": 242528, "epoch": 2004} {"train_loss": -38.940093994140625, "global_step": 242529, "epoch": 2004} {"train_loss": -42.084510803222656, "global_step": 242530, "epoch": 2004} {"train_loss": -37.572723388671875, "global_step": 242531, "epoch": 2004} {"train_loss": -40.98340606689453, "global_step": 242532, "epoch": 2004} {"train_loss": -41.6078987121582, "global_step": 242533, "epoch": 2004} {"train_loss": -38.90277099609375, "global_step": 242534, "epoch": 2004} {"train_loss": -40.72014617919922, "global_step": 242535, "epoch": 2004} {"train_loss": -38.760536193847656, "global_step": 242536, "epoch": 2004} {"train_loss": -39.85602569580078, "global_step": 242537, "epoch": 2004} {"train_loss": -39.670013427734375, "global_step": 242538, "epoch": 2004} {"train_loss": -40.58295440673828, "global_step": 242539, "epoch": 2004} {"train_loss": -42.012447357177734, "global_step": 242540, "epoch": 2004} {"train_loss": -40.37424850463867, "global_step": 242541, "epoch": 2004} {"train_loss": -41.899391174316406, "global_step": 242542, "epoch": 2004} {"train_loss": -41.772579193115234, "global_step": 242543, "epoch": 2004} {"train_loss": -42.52476119995117, "global_step": 242544, "epoch": 2004} {"train_loss": -41.549285888671875, "global_step": 242545, "epoch": 2004} {"train_loss": -42.90129470825195, "global_step": 242546, "epoch": 2004} {"train_loss": -41.64386749267578, "global_step": 242547, "epoch": 2004} {"train_loss": -41.13143539428711, "global_step": 242548, "epoch": 2004} {"train_loss": -42.13666915893555, "global_step": 242549, "epoch": 2004} {"train_loss": -42.081966400146484, "global_step": 242550, "epoch": 2004} {"train_loss": -40.712196350097656, "global_step": 242551, "epoch": 2004} {"train_loss": -42.388309478759766, "global_step": 242552, "epoch": 2004} {"train_loss": -41.18292236328125, "global_step": 242553, "epoch": 2004} {"train_loss": -42.75692367553711, "global_step": 242554, "epoch": 2004} {"train_loss": -40.4099235534668, "global_step": 242555, "epoch": 2004} {"train_loss": -42.338661193847656, "global_step": 242556, "epoch": 2004} {"train_loss": -40.907379150390625, "global_step": 242557, "epoch": 2004} {"train_loss": -42.11288070678711, "global_step": 242558, "epoch": 2004} {"train_loss": -42.55411911010742, "global_step": 242559, "epoch": 2004} {"train_loss": -41.9771842956543, "global_step": 242560, "epoch": 2004} {"train_loss": -42.891326904296875, "global_step": 242561, "epoch": 2004} {"train_loss": -42.098201751708984, "global_step": 242562, "epoch": 2004} {"train_loss": -43.077701568603516, "global_step": 242563, "epoch": 2004} {"train_loss": -42.73963928222656, "global_step": 242564, "epoch": 2004} {"train_loss": -43.22359848022461, "global_step": 242565, "epoch": 2004} {"train_loss": -42.73243713378906, "global_step": 242566, "epoch": 2004} {"train_loss": -43.06853103637695, "global_step": 242567, "epoch": 2004} {"train_loss": -43.50217056274414, "global_step": 242568, "epoch": 2004} {"train_loss": -43.82232666015625, "global_step": 242569, "epoch": 2004} {"train_loss": -43.33070755004883, "global_step": 242570, "epoch": 2004} {"train_loss": -42.56121826171875, "global_step": 242571, "epoch": 2004} {"train_loss": -42.99382400512695, "global_step": 242572, "epoch": 2004} {"train_loss": -43.58362579345703, "global_step": 242573, "epoch": 2004} {"train_loss": -43.2855110168457, "global_step": 242574, "epoch": 2004} {"train_loss": -42.4938850402832, "global_step": 242575, "epoch": 2004} {"train_loss": -42.576942443847656, "global_step": 242576, "epoch": 2004} {"train_loss": -43.37141036987305, "global_step": 242577, "epoch": 2004} {"train_loss": -42.68479537963867, "global_step": 242578, "epoch": 2004} {"train_loss": -42.939002990722656, "global_step": 242579, "epoch": 2004} {"train_loss": -43.149349212646484, "global_step": 242580, "epoch": 2004} {"train_loss": -43.21505355834961, "global_step": 242581, "epoch": 2004} {"train_loss": -42.92467498779297, "global_step": 242582, "epoch": 2004} {"train_loss": -43.100154876708984, "global_step": 242583, "epoch": 2004} {"train_loss": -43.344642639160156, "global_step": 242584, "epoch": 2004} {"train_loss": -42.063289642333984, "global_step": 242585, "epoch": 2004} {"train_loss": -42.27953338623047, "global_step": 242586, "epoch": 2004} {"train_loss": -42.30292510986328, "global_step": 242587, "epoch": 2004} {"train_loss": -42.94063949584961, "global_step": 242588, "epoch": 2004} {"train_loss": -41.772430419921875, "global_step": 242589, "epoch": 2004} {"train_loss": -41.003204345703125, "global_step": 242590, "epoch": 2004} {"train_loss": -41.656951904296875, "global_step": 242591, "epoch": 2004} {"train_loss": -41.07172393798828, "global_step": 242592, "epoch": 2004} {"train_loss": -42.20162582397461, "global_step": 242593, "epoch": 2004} {"train_loss": -40.99407958984375, "global_step": 242594, "epoch": 2004} {"train_loss": -41.832305908203125, "global_step": 242595, "epoch": 2004} {"train_loss": -42.353633880615234, "global_step": 242596, "epoch": 2004} {"train_loss": -42.50307846069336, "global_step": 242597, "epoch": 2004} {"train_loss": -42.5490608215332, "global_step": 242598, "epoch": 2004} {"train_loss": -42.9044303894043, "global_step": 242599, "epoch": 2004} {"train_loss": -41.87665557861328, "global_step": 242600, "epoch": 2004} {"train_loss": -43.319271087646484, "global_step": 242601, "epoch": 2004} {"train_loss": -42.248287200927734, "global_step": 242602, "epoch": 2004} {"train_loss": -41.06545639038086, "global_step": 242603, "epoch": 2004} {"train_loss": -41.63250436073493, "global_step": 242604, "epoch": 2004, "val_loss": 2701086.75} {"train_loss": -41.512481689453125, "global_step": 242605, "epoch": 2005} {"train_loss": -42.70376968383789, "global_step": 242606, "epoch": 2005} {"train_loss": -42.447120666503906, "global_step": 242607, "epoch": 2005} {"train_loss": -41.847408294677734, "global_step": 242608, "epoch": 2005} {"train_loss": -42.99708938598633, "global_step": 242609, "epoch": 2005} {"train_loss": -42.38457107543945, "global_step": 242610, "epoch": 2005} {"train_loss": -40.442138671875, "global_step": 242611, "epoch": 2005} {"train_loss": -43.56929397583008, "global_step": 242612, "epoch": 2005} {"train_loss": -41.82114028930664, "global_step": 242613, "epoch": 2005} {"train_loss": -42.96784591674805, "global_step": 242614, "epoch": 2005} {"train_loss": -42.30669021606445, "global_step": 242615, "epoch": 2005} {"train_loss": -43.39046859741211, "global_step": 242616, "epoch": 2005} {"train_loss": -42.581817626953125, "global_step": 242617, "epoch": 2005} {"train_loss": -41.50413131713867, "global_step": 242618, "epoch": 2005} {"train_loss": -42.447349548339844, "global_step": 242619, "epoch": 2005} {"train_loss": -41.46027755737305, "global_step": 242620, "epoch": 2005} {"train_loss": -43.0389404296875, "global_step": 242621, "epoch": 2005} {"train_loss": -42.464935302734375, "global_step": 242622, "epoch": 2005} {"train_loss": -42.16652297973633, "global_step": 242623, "epoch": 2005} {"train_loss": -42.08280563354492, "global_step": 242624, "epoch": 2005} {"train_loss": -42.72739791870117, "global_step": 242625, "epoch": 2005} {"train_loss": -42.1093635559082, "global_step": 242626, "epoch": 2005} {"train_loss": -41.37236785888672, "global_step": 242627, "epoch": 2005} {"train_loss": -42.42710876464844, "global_step": 242628, "epoch": 2005} {"train_loss": -42.996829986572266, "global_step": 242629, "epoch": 2005} {"train_loss": -42.51178741455078, "global_step": 242630, "epoch": 2005} {"train_loss": -41.8316535949707, "global_step": 242631, "epoch": 2005} {"train_loss": -42.970924377441406, "global_step": 242632, "epoch": 2005} {"train_loss": -40.55704879760742, "global_step": 242633, "epoch": 2005} {"train_loss": -42.62664031982422, "global_step": 242634, "epoch": 2005} {"train_loss": -40.475685119628906, "global_step": 242635, "epoch": 2005} {"train_loss": -42.04281234741211, "global_step": 242636, "epoch": 2005} {"train_loss": -40.486305236816406, "global_step": 242637, "epoch": 2005} {"train_loss": -41.15839767456055, "global_step": 242638, "epoch": 2005} {"train_loss": -41.59429168701172, "global_step": 242639, "epoch": 2005} {"train_loss": -42.49956130981445, "global_step": 242640, "epoch": 2005} {"train_loss": -42.2054443359375, "global_step": 242641, "epoch": 2005} {"train_loss": -42.45379638671875, "global_step": 242642, "epoch": 2005} {"train_loss": -41.752044677734375, "global_step": 242643, "epoch": 2005} {"train_loss": -43.07126998901367, "global_step": 242644, "epoch": 2005} {"train_loss": -42.666622161865234, "global_step": 242645, "epoch": 2005} {"train_loss": -42.667266845703125, "global_step": 242646, "epoch": 2005} {"train_loss": -42.7327766418457, "global_step": 242647, "epoch": 2005} {"train_loss": -43.2647705078125, "global_step": 242648, "epoch": 2005} {"train_loss": -42.217376708984375, "global_step": 242649, "epoch": 2005} {"train_loss": -42.559661865234375, "global_step": 242650, "epoch": 2005} {"train_loss": -41.421363830566406, "global_step": 242651, "epoch": 2005} {"train_loss": -42.607967376708984, "global_step": 242652, "epoch": 2005} {"train_loss": -41.931915283203125, "global_step": 242653, "epoch": 2005} {"train_loss": -42.659812927246094, "global_step": 242654, "epoch": 2005} {"train_loss": -42.892486572265625, "global_step": 242655, "epoch": 2005} {"train_loss": -41.98261642456055, "global_step": 242656, "epoch": 2005} {"train_loss": -41.94388961791992, "global_step": 242657, "epoch": 2005} {"train_loss": -43.081207275390625, "global_step": 242658, "epoch": 2005} {"train_loss": -43.07318878173828, "global_step": 242659, "epoch": 2005} {"train_loss": -42.8105354309082, "global_step": 242660, "epoch": 2005} {"train_loss": -42.95872116088867, "global_step": 242661, "epoch": 2005} {"train_loss": -43.516082763671875, "global_step": 242662, "epoch": 2005} {"train_loss": -42.65548324584961, "global_step": 242663, "epoch": 2005} {"train_loss": -42.99569320678711, "global_step": 242664, "epoch": 2005} {"train_loss": -43.25423812866211, "global_step": 242665, "epoch": 2005} {"train_loss": -42.813079833984375, "global_step": 242666, "epoch": 2005} {"train_loss": -43.139137268066406, "global_step": 242667, "epoch": 2005} {"train_loss": -42.729671478271484, "global_step": 242668, "epoch": 2005} {"train_loss": -43.59928512573242, "global_step": 242669, "epoch": 2005} {"train_loss": -43.3056640625, "global_step": 242670, "epoch": 2005} {"train_loss": -43.27450180053711, "global_step": 242671, "epoch": 2005} {"train_loss": -42.67934799194336, "global_step": 242672, "epoch": 2005} {"train_loss": -43.441585540771484, "global_step": 242673, "epoch": 2005} {"train_loss": -43.674659729003906, "global_step": 242674, "epoch": 2005} {"train_loss": -43.158973693847656, "global_step": 242675, "epoch": 2005} {"train_loss": -43.0988883972168, "global_step": 242676, "epoch": 2005} {"train_loss": -42.25202178955078, "global_step": 242677, "epoch": 2005} {"train_loss": -40.41103744506836, "global_step": 242678, "epoch": 2005} {"train_loss": -43.07856750488281, "global_step": 242679, "epoch": 2005} {"train_loss": -42.92698669433594, "global_step": 242680, "epoch": 2005} {"train_loss": -41.94770431518555, "global_step": 242681, "epoch": 2005} {"train_loss": -43.3962287902832, "global_step": 242682, "epoch": 2005} {"train_loss": -42.88855743408203, "global_step": 242683, "epoch": 2005} {"train_loss": -42.181209564208984, "global_step": 242684, "epoch": 2005} {"train_loss": -42.358978271484375, "global_step": 242685, "epoch": 2005} {"train_loss": -43.018489837646484, "global_step": 242686, "epoch": 2005} {"train_loss": -41.40928268432617, "global_step": 242687, "epoch": 2005} {"train_loss": -42.26646423339844, "global_step": 242688, "epoch": 2005} {"train_loss": -42.44682693481445, "global_step": 242689, "epoch": 2005} {"train_loss": -42.124351501464844, "global_step": 242690, "epoch": 2005} {"train_loss": -42.71976852416992, "global_step": 242691, "epoch": 2005} {"train_loss": -42.220558166503906, "global_step": 242692, "epoch": 2005} {"train_loss": -42.9837760925293, "global_step": 242693, "epoch": 2005} {"train_loss": -41.69689178466797, "global_step": 242694, "epoch": 2005} {"train_loss": -43.03959274291992, "global_step": 242695, "epoch": 2005} {"train_loss": -43.11204147338867, "global_step": 242696, "epoch": 2005} {"train_loss": -41.87538528442383, "global_step": 242697, "epoch": 2005} {"train_loss": -42.126686096191406, "global_step": 242698, "epoch": 2005} {"train_loss": -43.0187873840332, "global_step": 242699, "epoch": 2005} {"train_loss": -43.59785079956055, "global_step": 242700, "epoch": 2005} {"train_loss": -44.063167572021484, "global_step": 242701, "epoch": 2005} {"train_loss": -43.2684211730957, "global_step": 242702, "epoch": 2005} {"train_loss": -42.998470306396484, "global_step": 242703, "epoch": 2005} {"train_loss": -42.917850494384766, "global_step": 242704, "epoch": 2005} {"train_loss": -43.611305236816406, "global_step": 242705, "epoch": 2005} {"train_loss": -43.36698913574219, "global_step": 242706, "epoch": 2005} {"train_loss": -43.1850700378418, "global_step": 242707, "epoch": 2005} {"train_loss": -44.2767219543457, "global_step": 242708, "epoch": 2005} {"train_loss": -43.772804260253906, "global_step": 242709, "epoch": 2005} {"train_loss": -43.38206100463867, "global_step": 242710, "epoch": 2005} {"train_loss": -43.67348861694336, "global_step": 242711, "epoch": 2005} {"train_loss": -43.816123962402344, "global_step": 242712, "epoch": 2005} {"train_loss": -43.23213195800781, "global_step": 242713, "epoch": 2005} {"train_loss": -42.947669982910156, "global_step": 242714, "epoch": 2005} {"train_loss": -43.98838806152344, "global_step": 242715, "epoch": 2005} {"train_loss": -43.68479537963867, "global_step": 242716, "epoch": 2005} {"train_loss": -42.42322540283203, "global_step": 242717, "epoch": 2005} {"train_loss": -40.83732223510742, "global_step": 242718, "epoch": 2005} {"train_loss": -42.93347930908203, "global_step": 242719, "epoch": 2005} {"train_loss": -39.809654235839844, "global_step": 242720, "epoch": 2005} {"train_loss": -42.776649475097656, "global_step": 242721, "epoch": 2005} {"train_loss": -37.104103088378906, "global_step": 242722, "epoch": 2005} {"train_loss": -37.440101623535156, "global_step": 242723, "epoch": 2005} {"train_loss": -38.42362594604492, "global_step": 242724, "epoch": 2005} {"train_loss": -42.40106866379415, "global_step": 242725, "epoch": 2005, "val_loss": 2652043.0} {"train_loss": -35.04743576049805, "global_step": 242726, "epoch": 2006} {"train_loss": -37.0624885559082, "global_step": 242727, "epoch": 2006} {"train_loss": -37.370941162109375, "global_step": 242728, "epoch": 2006} {"train_loss": -38.2492790222168, "global_step": 242729, "epoch": 2006} {"train_loss": -37.341793060302734, "global_step": 242730, "epoch": 2006} {"train_loss": -37.418312072753906, "global_step": 242731, "epoch": 2006} {"train_loss": -37.296024322509766, "global_step": 242732, "epoch": 2006} {"train_loss": -36.95344161987305, "global_step": 242733, "epoch": 2006} {"train_loss": -38.01139831542969, "global_step": 242734, "epoch": 2006} {"train_loss": -37.50210189819336, "global_step": 242735, "epoch": 2006} {"train_loss": -38.14309310913086, "global_step": 242736, "epoch": 2006} {"train_loss": -37.9307861328125, "global_step": 242737, "epoch": 2006} {"train_loss": -35.654319763183594, "global_step": 242738, "epoch": 2006} {"train_loss": -36.032283782958984, "global_step": 242739, "epoch": 2006} {"train_loss": -38.40489196777344, "global_step": 242740, "epoch": 2006} {"train_loss": -38.245819091796875, "global_step": 242741, "epoch": 2006} {"train_loss": -37.4538459777832, "global_step": 242742, "epoch": 2006} {"train_loss": -37.96146774291992, "global_step": 242743, "epoch": 2006} {"train_loss": -37.6132926940918, "global_step": 242744, "epoch": 2006} {"train_loss": -38.607521057128906, "global_step": 242745, "epoch": 2006} {"train_loss": -38.581214904785156, "global_step": 242746, "epoch": 2006} {"train_loss": -38.113094329833984, "global_step": 242747, "epoch": 2006} {"train_loss": -38.43617630004883, "global_step": 242748, "epoch": 2006} {"train_loss": -38.93699264526367, "global_step": 242749, "epoch": 2006} {"train_loss": -38.44881820678711, "global_step": 242750, "epoch": 2006} {"train_loss": -38.3675651550293, "global_step": 242751, "epoch": 2006} {"train_loss": -38.52392578125, "global_step": 242752, "epoch": 2006} {"train_loss": -38.61358642578125, "global_step": 242753, "epoch": 2006} {"train_loss": -39.32048797607422, "global_step": 242754, "epoch": 2006} {"train_loss": -39.210140228271484, "global_step": 242755, "epoch": 2006} {"train_loss": -37.15367889404297, "global_step": 242756, "epoch": 2006} {"train_loss": -39.70785140991211, "global_step": 242757, "epoch": 2006} {"train_loss": -38.968055725097656, "global_step": 242758, "epoch": 2006} {"train_loss": -38.89589309692383, "global_step": 242759, "epoch": 2006} {"train_loss": -39.1933479309082, "global_step": 242760, "epoch": 2006} {"train_loss": -39.58842086791992, "global_step": 242761, "epoch": 2006} {"train_loss": -39.64982223510742, "global_step": 242762, "epoch": 2006} {"train_loss": -39.312355041503906, "global_step": 242763, "epoch": 2006} {"train_loss": -39.11202621459961, "global_step": 242764, "epoch": 2006} {"train_loss": -38.87339401245117, "global_step": 242765, "epoch": 2006} {"train_loss": -38.72397994995117, "global_step": 242766, "epoch": 2006} {"train_loss": -39.214210510253906, "global_step": 242767, "epoch": 2006} {"train_loss": -40.3541259765625, "global_step": 242768, "epoch": 2006} {"train_loss": -38.48357391357422, "global_step": 242769, "epoch": 2006} {"train_loss": -38.0167236328125, "global_step": 242770, "epoch": 2006} {"train_loss": -39.484554290771484, "global_step": 242771, "epoch": 2006} {"train_loss": -39.64324188232422, "global_step": 242772, "epoch": 2006} {"train_loss": -38.16739273071289, "global_step": 242773, "epoch": 2006} {"train_loss": -39.401527404785156, "global_step": 242774, "epoch": 2006} {"train_loss": -39.92512893676758, "global_step": 242775, "epoch": 2006} {"train_loss": -39.034297943115234, "global_step": 242776, "epoch": 2006} {"train_loss": -40.205265045166016, "global_step": 242777, "epoch": 2006} {"train_loss": -39.82468795776367, "global_step": 242778, "epoch": 2006} {"train_loss": -39.94158935546875, "global_step": 242779, "epoch": 2006} {"train_loss": -40.382320404052734, "global_step": 242780, "epoch": 2006} {"train_loss": -39.94593048095703, "global_step": 242781, "epoch": 2006} {"train_loss": -40.53963851928711, "global_step": 242782, "epoch": 2006} {"train_loss": -39.995845794677734, "global_step": 242783, "epoch": 2006} {"train_loss": -40.09098434448242, "global_step": 242784, "epoch": 2006} {"train_loss": -40.3393669128418, "global_step": 242785, "epoch": 2006} {"train_loss": -40.10279083251953, "global_step": 242786, "epoch": 2006} {"train_loss": -40.4262580871582, "global_step": 242787, "epoch": 2006} {"train_loss": -40.75461196899414, "global_step": 242788, "epoch": 2006} {"train_loss": -40.851898193359375, "global_step": 242789, "epoch": 2006} {"train_loss": -40.50002670288086, "global_step": 242790, "epoch": 2006} {"train_loss": -39.8122444152832, "global_step": 242791, "epoch": 2006} {"train_loss": -40.71406173706055, "global_step": 242792, "epoch": 2006} {"train_loss": -40.072021484375, "global_step": 242793, "epoch": 2006} {"train_loss": -40.79404830932617, "global_step": 242794, "epoch": 2006} {"train_loss": -40.1453742980957, "global_step": 242795, "epoch": 2006} {"train_loss": -39.4190788269043, "global_step": 242796, "epoch": 2006} {"train_loss": -37.933040618896484, "global_step": 242797, "epoch": 2006} {"train_loss": -38.09321975708008, "global_step": 242798, "epoch": 2006} {"train_loss": -38.98141098022461, "global_step": 242799, "epoch": 2006} {"train_loss": -39.96773910522461, "global_step": 242800, "epoch": 2006} {"train_loss": -39.7411003112793, "global_step": 242801, "epoch": 2006} {"train_loss": -40.46255111694336, "global_step": 242802, "epoch": 2006} {"train_loss": -40.36558151245117, "global_step": 242803, "epoch": 2006} {"train_loss": -37.706947326660156, "global_step": 242804, "epoch": 2006} {"train_loss": -38.859859466552734, "global_step": 242805, "epoch": 2006} {"train_loss": -14.582423210144043, "global_step": 242806, "epoch": 2006} {"train_loss": -35.9641227722168, "global_step": 242807, "epoch": 2006} {"train_loss": -39.60322189331055, "global_step": 242808, "epoch": 2006} {"train_loss": -38.150245666503906, "global_step": 242809, "epoch": 2006} {"train_loss": -37.65462112426758, "global_step": 242810, "epoch": 2006} {"train_loss": -5.938172817230225, "global_step": 242811, "epoch": 2006} {"train_loss": -32.222042083740234, "global_step": 242812, "epoch": 2006} {"train_loss": -35.874752044677734, "global_step": 242813, "epoch": 2006} {"train_loss": -30.31243324279785, "global_step": 242814, "epoch": 2006} {"train_loss": -33.99082946777344, "global_step": 242815, "epoch": 2006} {"train_loss": -36.04061508178711, "global_step": 242816, "epoch": 2006} {"train_loss": -35.75448226928711, "global_step": 242817, "epoch": 2006} {"train_loss": -34.02997970581055, "global_step": 242818, "epoch": 2006} {"train_loss": -17.76404571533203, "global_step": 242819, "epoch": 2006} {"train_loss": -21.32262420654297, "global_step": 242820, "epoch": 2006} {"train_loss": -31.80959129333496, "global_step": 242821, "epoch": 2006} {"train_loss": -33.9920654296875, "global_step": 242822, "epoch": 2006} {"train_loss": -10.665289878845215, "global_step": 242823, "epoch": 2006} {"train_loss": -27.4136962890625, "global_step": 242824, "epoch": 2006} {"train_loss": -32.29320526123047, "global_step": 242825, "epoch": 2006} {"train_loss": -34.67856979370117, "global_step": 242826, "epoch": 2006} {"train_loss": -34.00458908081055, "global_step": 242827, "epoch": 2006} {"train_loss": -34.0904541015625, "global_step": 242828, "epoch": 2006} {"train_loss": -28.584091186523438, "global_step": 242829, "epoch": 2006} {"train_loss": -34.70782470703125, "global_step": 242830, "epoch": 2006} {"train_loss": -32.523250579833984, "global_step": 242831, "epoch": 2006} {"train_loss": -36.57732391357422, "global_step": 242832, "epoch": 2006} {"train_loss": -34.680538177490234, "global_step": 242833, "epoch": 2006} {"train_loss": -31.730670928955078, "global_step": 242834, "epoch": 2006} {"train_loss": -34.986446380615234, "global_step": 242835, "epoch": 2006} {"train_loss": -35.03723907470703, "global_step": 242836, "epoch": 2006} {"train_loss": -34.365421295166016, "global_step": 242837, "epoch": 2006} {"train_loss": -36.4145393371582, "global_step": 242838, "epoch": 2006} {"train_loss": -36.68617630004883, "global_step": 242839, "epoch": 2006} {"train_loss": -34.39694595336914, "global_step": 242840, "epoch": 2006} {"train_loss": -36.293392181396484, "global_step": 242841, "epoch": 2006} {"train_loss": -36.30558395385742, "global_step": 242842, "epoch": 2006} {"train_loss": -36.17100143432617, "global_step": 242843, "epoch": 2006} {"train_loss": -37.20305252075195, "global_step": 242844, "epoch": 2006} {"train_loss": -36.5999755859375, "global_step": 242845, "epoch": 2006} {"train_loss": -36.62174968483034, "global_step": 242846, "epoch": 2006, "val_loss": 2654341.25} {"train_loss": -37.75068283081055, "global_step": 242847, "epoch": 2007} {"train_loss": -36.7820930480957, "global_step": 242848, "epoch": 2007} {"train_loss": -35.91842269897461, "global_step": 242849, "epoch": 2007} {"train_loss": -36.438411712646484, "global_step": 242850, "epoch": 2007} {"train_loss": -37.22418975830078, "global_step": 242851, "epoch": 2007} {"train_loss": -37.365413665771484, "global_step": 242852, "epoch": 2007} {"train_loss": -37.49310302734375, "global_step": 242853, "epoch": 2007} {"train_loss": -37.566253662109375, "global_step": 242854, "epoch": 2007} {"train_loss": -37.47256088256836, "global_step": 242855, "epoch": 2007} {"train_loss": -38.2747917175293, "global_step": 242856, "epoch": 2007} {"train_loss": -36.664669036865234, "global_step": 242857, "epoch": 2007} {"train_loss": -37.741607666015625, "global_step": 242858, "epoch": 2007} {"train_loss": -37.57645797729492, "global_step": 242859, "epoch": 2007} {"train_loss": -38.015953063964844, "global_step": 242860, "epoch": 2007} {"train_loss": -38.244380950927734, "global_step": 242861, "epoch": 2007} {"train_loss": -37.6455078125, "global_step": 242862, "epoch": 2007} {"train_loss": -37.95908737182617, "global_step": 242863, "epoch": 2007} {"train_loss": -38.16080856323242, "global_step": 242864, "epoch": 2007} {"train_loss": -37.96881103515625, "global_step": 242865, "epoch": 2007} {"train_loss": -38.020538330078125, "global_step": 242866, "epoch": 2007} {"train_loss": -38.70675277709961, "global_step": 242867, "epoch": 2007} {"train_loss": -39.06324005126953, "global_step": 242868, "epoch": 2007} {"train_loss": -38.08756637573242, "global_step": 242869, "epoch": 2007} {"train_loss": -38.44919967651367, "global_step": 242870, "epoch": 2007} {"train_loss": -38.44294357299805, "global_step": 242871, "epoch": 2007} {"train_loss": -38.798336029052734, "global_step": 242872, "epoch": 2007} {"train_loss": -39.19289779663086, "global_step": 242873, "epoch": 2007} {"train_loss": -38.529842376708984, "global_step": 242874, "epoch": 2007} {"train_loss": -39.02240753173828, "global_step": 242875, "epoch": 2007} {"train_loss": -38.27579879760742, "global_step": 242876, "epoch": 2007} {"train_loss": -39.47646713256836, "global_step": 242877, "epoch": 2007} {"train_loss": -39.34771728515625, "global_step": 242878, "epoch": 2007} {"train_loss": -39.1286506652832, "global_step": 242879, "epoch": 2007} {"train_loss": -39.4669303894043, "global_step": 242880, "epoch": 2007} {"train_loss": -39.20662307739258, "global_step": 242881, "epoch": 2007} {"train_loss": -39.47114181518555, "global_step": 242882, "epoch": 2007} {"train_loss": -38.785621643066406, "global_step": 242883, "epoch": 2007} {"train_loss": -39.81846237182617, "global_step": 242884, "epoch": 2007} {"train_loss": -39.64053726196289, "global_step": 242885, "epoch": 2007} {"train_loss": -40.60625457763672, "global_step": 242886, "epoch": 2007} {"train_loss": -40.451416015625, "global_step": 242887, "epoch": 2007} {"train_loss": -39.37541580200195, "global_step": 242888, "epoch": 2007} {"train_loss": -40.80910873413086, "global_step": 242889, "epoch": 2007} {"train_loss": -39.88563919067383, "global_step": 242890, "epoch": 2007} {"train_loss": -41.002017974853516, "global_step": 242891, "epoch": 2007} {"train_loss": -40.714515686035156, "global_step": 242892, "epoch": 2007} {"train_loss": -41.22579574584961, "global_step": 242893, "epoch": 2007} {"train_loss": -40.37044906616211, "global_step": 242894, "epoch": 2007} {"train_loss": -41.498077392578125, "global_step": 242895, "epoch": 2007} {"train_loss": -40.77457809448242, "global_step": 242896, "epoch": 2007} {"train_loss": -41.510353088378906, "global_step": 242897, "epoch": 2007} {"train_loss": -41.00325393676758, "global_step": 242898, "epoch": 2007} {"train_loss": -41.67238235473633, "global_step": 242899, "epoch": 2007} {"train_loss": -41.04163360595703, "global_step": 242900, "epoch": 2007} {"train_loss": -40.9548454284668, "global_step": 242901, "epoch": 2007} {"train_loss": -41.0998649597168, "global_step": 242902, "epoch": 2007} {"train_loss": -41.343605041503906, "global_step": 242903, "epoch": 2007} {"train_loss": -41.537445068359375, "global_step": 242904, "epoch": 2007} {"train_loss": -41.479148864746094, "global_step": 242905, "epoch": 2007} {"train_loss": -41.39546585083008, "global_step": 242906, "epoch": 2007} {"train_loss": -41.291500091552734, "global_step": 242907, "epoch": 2007} {"train_loss": -41.102813720703125, "global_step": 242908, "epoch": 2007} {"train_loss": -41.33197021484375, "global_step": 242909, "epoch": 2007} {"train_loss": -42.21323776245117, "global_step": 242910, "epoch": 2007} {"train_loss": -42.056026458740234, "global_step": 242911, "epoch": 2007} {"train_loss": -42.146907806396484, "global_step": 242912, "epoch": 2007} {"train_loss": -41.55073165893555, "global_step": 242913, "epoch": 2007} {"train_loss": -41.11735916137695, "global_step": 242914, "epoch": 2007} {"train_loss": -42.256103515625, "global_step": 242915, "epoch": 2007} {"train_loss": -42.18807601928711, "global_step": 242916, "epoch": 2007} {"train_loss": -42.0982551574707, "global_step": 242917, "epoch": 2007} {"train_loss": -41.51902389526367, "global_step": 242918, "epoch": 2007} {"train_loss": -41.92992401123047, "global_step": 242919, "epoch": 2007} {"train_loss": -41.99555206298828, "global_step": 242920, "epoch": 2007} {"train_loss": -42.659088134765625, "global_step": 242921, "epoch": 2007} {"train_loss": -41.944007873535156, "global_step": 242922, "epoch": 2007} {"train_loss": -41.72214126586914, "global_step": 242923, "epoch": 2007} {"train_loss": -41.89460372924805, "global_step": 242924, "epoch": 2007} {"train_loss": -40.978450775146484, "global_step": 242925, "epoch": 2007} {"train_loss": -42.1645393371582, "global_step": 242926, "epoch": 2007} {"train_loss": -41.55378723144531, "global_step": 242927, "epoch": 2007} {"train_loss": -42.16737747192383, "global_step": 242928, "epoch": 2007} {"train_loss": -41.75083541870117, "global_step": 242929, "epoch": 2007} {"train_loss": -41.73777770996094, "global_step": 242930, "epoch": 2007} {"train_loss": -41.95534896850586, "global_step": 242931, "epoch": 2007} {"train_loss": -41.87420654296875, "global_step": 242932, "epoch": 2007} {"train_loss": -42.56947326660156, "global_step": 242933, "epoch": 2007} {"train_loss": -41.97913360595703, "global_step": 242934, "epoch": 2007} {"train_loss": -42.4700927734375, "global_step": 242935, "epoch": 2007} {"train_loss": -41.488712310791016, "global_step": 242936, "epoch": 2007} {"train_loss": -42.71747970581055, "global_step": 242937, "epoch": 2007} {"train_loss": -41.764984130859375, "global_step": 242938, "epoch": 2007} {"train_loss": -42.453521728515625, "global_step": 242939, "epoch": 2007} {"train_loss": -41.9010124206543, "global_step": 242940, "epoch": 2007} {"train_loss": -42.26173782348633, "global_step": 242941, "epoch": 2007} {"train_loss": -41.530635833740234, "global_step": 242942, "epoch": 2007} {"train_loss": -42.3759765625, "global_step": 242943, "epoch": 2007} {"train_loss": -42.340877532958984, "global_step": 242944, "epoch": 2007} {"train_loss": -41.223751068115234, "global_step": 242945, "epoch": 2007} {"train_loss": -42.905635833740234, "global_step": 242946, "epoch": 2007} {"train_loss": -40.7115364074707, "global_step": 242947, "epoch": 2007} {"train_loss": -39.932525634765625, "global_step": 242948, "epoch": 2007} {"train_loss": -41.6385612487793, "global_step": 242949, "epoch": 2007} {"train_loss": -40.62529373168945, "global_step": 242950, "epoch": 2007} {"train_loss": -41.22530746459961, "global_step": 242951, "epoch": 2007} {"train_loss": -41.290428161621094, "global_step": 242952, "epoch": 2007} {"train_loss": -40.88689041137695, "global_step": 242953, "epoch": 2007} {"train_loss": -41.885921478271484, "global_step": 242954, "epoch": 2007} {"train_loss": -40.43310546875, "global_step": 242955, "epoch": 2007} {"train_loss": -41.273162841796875, "global_step": 242956, "epoch": 2007} {"train_loss": -40.32111358642578, "global_step": 242957, "epoch": 2007} {"train_loss": -39.745182037353516, "global_step": 242958, "epoch": 2007} {"train_loss": -40.6532096862793, "global_step": 242959, "epoch": 2007} {"train_loss": -37.63373947143555, "global_step": 242960, "epoch": 2007} {"train_loss": -36.65013885498047, "global_step": 242961, "epoch": 2007} {"train_loss": -25.807636260986328, "global_step": 242962, "epoch": 2007} {"train_loss": -28.790124893188477, "global_step": 242963, "epoch": 2007} {"train_loss": -25.76190757751465, "global_step": 242964, "epoch": 2007} {"train_loss": -27.846832275390625, "global_step": 242965, "epoch": 2007} {"train_loss": -38.56987380981445, "global_step": 242966, "epoch": 2007} {"train_loss": -39.75614301823387, "global_step": 242967, "epoch": 2007, "val_loss": 2668888.75} {"train_loss": -37.810218811035156, "global_step": 242968, "epoch": 2008} {"train_loss": -35.61747360229492, "global_step": 242969, "epoch": 2008} {"train_loss": -38.04110336303711, "global_step": 242970, "epoch": 2008} {"train_loss": -36.027130126953125, "global_step": 242971, "epoch": 2008} {"train_loss": -38.193241119384766, "global_step": 242972, "epoch": 2008} {"train_loss": -37.52138900756836, "global_step": 242973, "epoch": 2008} {"train_loss": -38.50532150268555, "global_step": 242974, "epoch": 2008} {"train_loss": -37.93064498901367, "global_step": 242975, "epoch": 2008} {"train_loss": -38.49563980102539, "global_step": 242976, "epoch": 2008} {"train_loss": -38.75551223754883, "global_step": 242977, "epoch": 2008} {"train_loss": -38.481231689453125, "global_step": 242978, "epoch": 2008} {"train_loss": -38.895652770996094, "global_step": 242979, "epoch": 2008} {"train_loss": -38.75505447387695, "global_step": 242980, "epoch": 2008} {"train_loss": -39.23098373413086, "global_step": 242981, "epoch": 2008} {"train_loss": -39.166927337646484, "global_step": 242982, "epoch": 2008} {"train_loss": -39.317909240722656, "global_step": 242983, "epoch": 2008} {"train_loss": -39.16799545288086, "global_step": 242984, "epoch": 2008} {"train_loss": -38.92628860473633, "global_step": 242985, "epoch": 2008} {"train_loss": -39.583858489990234, "global_step": 242986, "epoch": 2008} {"train_loss": -39.512386322021484, "global_step": 242987, "epoch": 2008} {"train_loss": -39.53290557861328, "global_step": 242988, "epoch": 2008} {"train_loss": -39.73117446899414, "global_step": 242989, "epoch": 2008} {"train_loss": -39.2594108581543, "global_step": 242990, "epoch": 2008} {"train_loss": -39.434051513671875, "global_step": 242991, "epoch": 2008} {"train_loss": -39.78680419921875, "global_step": 242992, "epoch": 2008} {"train_loss": -39.271942138671875, "global_step": 242993, "epoch": 2008} {"train_loss": -39.48020553588867, "global_step": 242994, "epoch": 2008} {"train_loss": -39.95668411254883, "global_step": 242995, "epoch": 2008} {"train_loss": -39.96216583251953, "global_step": 242996, "epoch": 2008} {"train_loss": -40.04884719848633, "global_step": 242997, "epoch": 2008} {"train_loss": -40.40616989135742, "global_step": 242998, "epoch": 2008} {"train_loss": -40.151344299316406, "global_step": 242999, "epoch": 2008} {"train_loss": -39.911617279052734, "global_step": 243000, "epoch": 2008} {"train_loss": -40.28115463256836, "global_step": 243001, "epoch": 2008} {"train_loss": -39.87348556518555, "global_step": 243002, "epoch": 2008} {"train_loss": -40.00380325317383, "global_step": 243003, "epoch": 2008} {"train_loss": -40.11832809448242, "global_step": 243004, "epoch": 2008} {"train_loss": -40.23502731323242, "global_step": 243005, "epoch": 2008} {"train_loss": -40.01505661010742, "global_step": 243006, "epoch": 2008} {"train_loss": -40.452606201171875, "global_step": 243007, "epoch": 2008} {"train_loss": -40.700347900390625, "global_step": 243008, "epoch": 2008} {"train_loss": -39.987117767333984, "global_step": 243009, "epoch": 2008} {"train_loss": -40.61650466918945, "global_step": 243010, "epoch": 2008} {"train_loss": -39.84955978393555, "global_step": 243011, "epoch": 2008} {"train_loss": -40.47628402709961, "global_step": 243012, "epoch": 2008} {"train_loss": -40.851173400878906, "global_step": 243013, "epoch": 2008} {"train_loss": -40.67055130004883, "global_step": 243014, "epoch": 2008} {"train_loss": -40.90081787109375, "global_step": 243015, "epoch": 2008} {"train_loss": -40.998085021972656, "global_step": 243016, "epoch": 2008} {"train_loss": -40.75780487060547, "global_step": 243017, "epoch": 2008} {"train_loss": -40.2192497253418, "global_step": 243018, "epoch": 2008} {"train_loss": -41.07451248168945, "global_step": 243019, "epoch": 2008} {"train_loss": -40.400089263916016, "global_step": 243020, "epoch": 2008} {"train_loss": -40.97963333129883, "global_step": 243021, "epoch": 2008} {"train_loss": -40.94981002807617, "global_step": 243022, "epoch": 2008} {"train_loss": -40.99732971191406, "global_step": 243023, "epoch": 2008} {"train_loss": -41.04781723022461, "global_step": 243024, "epoch": 2008} {"train_loss": -41.035369873046875, "global_step": 243025, "epoch": 2008} {"train_loss": -40.782649993896484, "global_step": 243026, "epoch": 2008} {"train_loss": -40.89852523803711, "global_step": 243027, "epoch": 2008} {"train_loss": -41.14866256713867, "global_step": 243028, "epoch": 2008} {"train_loss": -40.740962982177734, "global_step": 243029, "epoch": 2008} {"train_loss": -41.289100646972656, "global_step": 243030, "epoch": 2008} {"train_loss": -41.00202560424805, "global_step": 243031, "epoch": 2008} {"train_loss": -41.45355987548828, "global_step": 243032, "epoch": 2008} {"train_loss": -41.44472885131836, "global_step": 243033, "epoch": 2008} {"train_loss": -41.224422454833984, "global_step": 243034, "epoch": 2008} {"train_loss": -40.8454475402832, "global_step": 243035, "epoch": 2008} {"train_loss": -41.21063232421875, "global_step": 243036, "epoch": 2008} {"train_loss": -40.271846771240234, "global_step": 243037, "epoch": 2008} {"train_loss": -36.3964958190918, "global_step": 243038, "epoch": 2008} {"train_loss": -25.32855987548828, "global_step": 243039, "epoch": 2008} {"train_loss": -5.436976909637451, "global_step": 243040, "epoch": 2008} {"train_loss": -27.504560470581055, "global_step": 243041, "epoch": 2008} {"train_loss": -36.65409469604492, "global_step": 243042, "epoch": 2008} {"train_loss": -25.557424545288086, "global_step": 243043, "epoch": 2008} {"train_loss": -38.52583694458008, "global_step": 243044, "epoch": 2008} {"train_loss": -29.312955856323242, "global_step": 243045, "epoch": 2008} {"train_loss": -37.65167236328125, "global_step": 243046, "epoch": 2008} {"train_loss": -33.1949348449707, "global_step": 243047, "epoch": 2008} {"train_loss": -38.33122634887695, "global_step": 243048, "epoch": 2008} {"train_loss": -38.36798858642578, "global_step": 243049, "epoch": 2008} {"train_loss": -35.91054916381836, "global_step": 243050, "epoch": 2008} {"train_loss": -39.050682067871094, "global_step": 243051, "epoch": 2008} {"train_loss": -37.55885696411133, "global_step": 243052, "epoch": 2008} {"train_loss": -36.1767463684082, "global_step": 243053, "epoch": 2008} {"train_loss": -39.085838317871094, "global_step": 243054, "epoch": 2008} {"train_loss": -37.50476837158203, "global_step": 243055, "epoch": 2008} {"train_loss": -38.89582061767578, "global_step": 243056, "epoch": 2008} {"train_loss": -39.38325119018555, "global_step": 243057, "epoch": 2008} {"train_loss": -38.2498779296875, "global_step": 243058, "epoch": 2008} {"train_loss": -39.06816864013672, "global_step": 243059, "epoch": 2008} {"train_loss": -39.055694580078125, "global_step": 243060, "epoch": 2008} {"train_loss": -39.50447463989258, "global_step": 243061, "epoch": 2008} {"train_loss": -39.767860412597656, "global_step": 243062, "epoch": 2008} {"train_loss": -40.38715744018555, "global_step": 243063, "epoch": 2008} {"train_loss": -39.81919860839844, "global_step": 243064, "epoch": 2008} {"train_loss": -40.33127975463867, "global_step": 243065, "epoch": 2008} {"train_loss": -39.95505142211914, "global_step": 243066, "epoch": 2008} {"train_loss": -40.248111724853516, "global_step": 243067, "epoch": 2008} {"train_loss": -40.12649917602539, "global_step": 243068, "epoch": 2008} {"train_loss": -40.29450225830078, "global_step": 243069, "epoch": 2008} {"train_loss": -40.47229766845703, "global_step": 243070, "epoch": 2008} {"train_loss": -40.01347732543945, "global_step": 243071, "epoch": 2008} {"train_loss": -40.82540512084961, "global_step": 243072, "epoch": 2008} {"train_loss": -40.638179779052734, "global_step": 243073, "epoch": 2008} {"train_loss": -40.28339767456055, "global_step": 243074, "epoch": 2008} {"train_loss": -40.48482894897461, "global_step": 243075, "epoch": 2008} {"train_loss": -40.653480529785156, "global_step": 243076, "epoch": 2008} {"train_loss": -40.7459716796875, "global_step": 243077, "epoch": 2008} {"train_loss": -40.81330108642578, "global_step": 243078, "epoch": 2008} {"train_loss": -40.417144775390625, "global_step": 243079, "epoch": 2008} {"train_loss": -40.81459426879883, "global_step": 243080, "epoch": 2008} {"train_loss": -40.70396041870117, "global_step": 243081, "epoch": 2008} {"train_loss": -40.797340393066406, "global_step": 243082, "epoch": 2008} {"train_loss": -40.9387321472168, "global_step": 243083, "epoch": 2008} {"train_loss": -41.2569694519043, "global_step": 243084, "epoch": 2008} {"train_loss": -41.0890998840332, "global_step": 243085, "epoch": 2008} {"train_loss": -41.41810989379883, "global_step": 243086, "epoch": 2008} {"train_loss": -40.4002799987793, "global_step": 243087, "epoch": 2008} {"train_loss": -38.98572002363599, "global_step": 243088, "epoch": 2008, "val_loss": 2674316.5} {"train_loss": -41.41465759277344, "global_step": 243089, "epoch": 2009} {"train_loss": -41.17735290527344, "global_step": 243090, "epoch": 2009} {"train_loss": -41.555946350097656, "global_step": 243091, "epoch": 2009} {"train_loss": -41.57777404785156, "global_step": 243092, "epoch": 2009} {"train_loss": -41.09478759765625, "global_step": 243093, "epoch": 2009} {"train_loss": -41.11585235595703, "global_step": 243094, "epoch": 2009} {"train_loss": -41.2363395690918, "global_step": 243095, "epoch": 2009} {"train_loss": -41.1707878112793, "global_step": 243096, "epoch": 2009} {"train_loss": -41.48218536376953, "global_step": 243097, "epoch": 2009} {"train_loss": -40.87964630126953, "global_step": 243098, "epoch": 2009} {"train_loss": -41.160011291503906, "global_step": 243099, "epoch": 2009} {"train_loss": -41.47539138793945, "global_step": 243100, "epoch": 2009} {"train_loss": -41.70569610595703, "global_step": 243101, "epoch": 2009} {"train_loss": -41.61963653564453, "global_step": 243102, "epoch": 2009} {"train_loss": -41.3844108581543, "global_step": 243103, "epoch": 2009} {"train_loss": -41.92934036254883, "global_step": 243104, "epoch": 2009} {"train_loss": -41.19887924194336, "global_step": 243105, "epoch": 2009} {"train_loss": -41.517581939697266, "global_step": 243106, "epoch": 2009} {"train_loss": -41.52151870727539, "global_step": 243107, "epoch": 2009} {"train_loss": -41.41117858886719, "global_step": 243108, "epoch": 2009} {"train_loss": -38.12418746948242, "global_step": 243109, "epoch": 2009} {"train_loss": -41.45115280151367, "global_step": 243110, "epoch": 2009} {"train_loss": -41.87913513183594, "global_step": 243111, "epoch": 2009} {"train_loss": -40.99287796020508, "global_step": 243112, "epoch": 2009} {"train_loss": -41.361907958984375, "global_step": 243113, "epoch": 2009} {"train_loss": -41.54165267944336, "global_step": 243114, "epoch": 2009} {"train_loss": -40.2538948059082, "global_step": 243115, "epoch": 2009} {"train_loss": -41.4648551940918, "global_step": 243116, "epoch": 2009} {"train_loss": -41.59043502807617, "global_step": 243117, "epoch": 2009} {"train_loss": -41.01974868774414, "global_step": 243118, "epoch": 2009} {"train_loss": -41.822120666503906, "global_step": 243119, "epoch": 2009} {"train_loss": -41.72062301635742, "global_step": 243120, "epoch": 2009} {"train_loss": -40.70841598510742, "global_step": 243121, "epoch": 2009} {"train_loss": -42.26047897338867, "global_step": 243122, "epoch": 2009} {"train_loss": -39.884883880615234, "global_step": 243123, "epoch": 2009} {"train_loss": -40.352657318115234, "global_step": 243124, "epoch": 2009} {"train_loss": -41.63269805908203, "global_step": 243125, "epoch": 2009} {"train_loss": -41.87349319458008, "global_step": 243126, "epoch": 2009} {"train_loss": -41.17533874511719, "global_step": 243127, "epoch": 2009} {"train_loss": -41.782508850097656, "global_step": 243128, "epoch": 2009} {"train_loss": -39.808502197265625, "global_step": 243129, "epoch": 2009} {"train_loss": -40.9753303527832, "global_step": 243130, "epoch": 2009} {"train_loss": -39.745208740234375, "global_step": 243131, "epoch": 2009} {"train_loss": -41.23379898071289, "global_step": 243132, "epoch": 2009} {"train_loss": -41.328922271728516, "global_step": 243133, "epoch": 2009} {"train_loss": -41.49463653564453, "global_step": 243134, "epoch": 2009} {"train_loss": -41.432090759277344, "global_step": 243135, "epoch": 2009} {"train_loss": -42.010459899902344, "global_step": 243136, "epoch": 2009} {"train_loss": -41.6269645690918, "global_step": 243137, "epoch": 2009} {"train_loss": -41.22701644897461, "global_step": 243138, "epoch": 2009} {"train_loss": -42.015628814697266, "global_step": 243139, "epoch": 2009} {"train_loss": -41.94739532470703, "global_step": 243140, "epoch": 2009} {"train_loss": -42.028255462646484, "global_step": 243141, "epoch": 2009} {"train_loss": -41.42417526245117, "global_step": 243142, "epoch": 2009} {"train_loss": -41.23727035522461, "global_step": 243143, "epoch": 2009} {"train_loss": -42.166351318359375, "global_step": 243144, "epoch": 2009} {"train_loss": -41.80437088012695, "global_step": 243145, "epoch": 2009} {"train_loss": -40.47139358520508, "global_step": 243146, "epoch": 2009} {"train_loss": -42.012481689453125, "global_step": 243147, "epoch": 2009} {"train_loss": -41.405086517333984, "global_step": 243148, "epoch": 2009} {"train_loss": -41.88916778564453, "global_step": 243149, "epoch": 2009} {"train_loss": -41.994564056396484, "global_step": 243150, "epoch": 2009} {"train_loss": -41.9647331237793, "global_step": 243151, "epoch": 2009} {"train_loss": -41.91694259643555, "global_step": 243152, "epoch": 2009} {"train_loss": -42.22274398803711, "global_step": 243153, "epoch": 2009} {"train_loss": -42.136741638183594, "global_step": 243154, "epoch": 2009} {"train_loss": -42.102874755859375, "global_step": 243155, "epoch": 2009} {"train_loss": -42.04990768432617, "global_step": 243156, "epoch": 2009} {"train_loss": -41.74264144897461, "global_step": 243157, "epoch": 2009} {"train_loss": -42.171043395996094, "global_step": 243158, "epoch": 2009} {"train_loss": -41.826385498046875, "global_step": 243159, "epoch": 2009} {"train_loss": -41.383766174316406, "global_step": 243160, "epoch": 2009} {"train_loss": -40.69139099121094, "global_step": 243161, "epoch": 2009} {"train_loss": -40.04788589477539, "global_step": 243162, "epoch": 2009} {"train_loss": -38.58241653442383, "global_step": 243163, "epoch": 2009} {"train_loss": -40.1953010559082, "global_step": 243164, "epoch": 2009} {"train_loss": -40.068721771240234, "global_step": 243165, "epoch": 2009} {"train_loss": -42.27596664428711, "global_step": 243166, "epoch": 2009} {"train_loss": -41.7911262512207, "global_step": 243167, "epoch": 2009} {"train_loss": -39.77208709716797, "global_step": 243168, "epoch": 2009} {"train_loss": -38.006866455078125, "global_step": 243169, "epoch": 2009} {"train_loss": -36.66463088989258, "global_step": 243170, "epoch": 2009} {"train_loss": -39.09523391723633, "global_step": 243171, "epoch": 2009} {"train_loss": -40.72052001953125, "global_step": 243172, "epoch": 2009} {"train_loss": -39.88743209838867, "global_step": 243173, "epoch": 2009} {"train_loss": -40.416927337646484, "global_step": 243174, "epoch": 2009} {"train_loss": -39.90803527832031, "global_step": 243175, "epoch": 2009} {"train_loss": -39.57319259643555, "global_step": 243176, "epoch": 2009} {"train_loss": -40.25138473510742, "global_step": 243177, "epoch": 2009} {"train_loss": -40.747493743896484, "global_step": 243178, "epoch": 2009} {"train_loss": -39.983612060546875, "global_step": 243179, "epoch": 2009} {"train_loss": -40.441349029541016, "global_step": 243180, "epoch": 2009} {"train_loss": -40.366607666015625, "global_step": 243181, "epoch": 2009} {"train_loss": -40.12171936035156, "global_step": 243182, "epoch": 2009} {"train_loss": -40.50321578979492, "global_step": 243183, "epoch": 2009} {"train_loss": -40.38979721069336, "global_step": 243184, "epoch": 2009} {"train_loss": -40.35334014892578, "global_step": 243185, "epoch": 2009} {"train_loss": -41.220863342285156, "global_step": 243186, "epoch": 2009} {"train_loss": -38.98173904418945, "global_step": 243187, "epoch": 2009} {"train_loss": -38.19082260131836, "global_step": 243188, "epoch": 2009} {"train_loss": -38.42788314819336, "global_step": 243189, "epoch": 2009} {"train_loss": -41.14387130737305, "global_step": 243190, "epoch": 2009} {"train_loss": -41.478004455566406, "global_step": 243191, "epoch": 2009} {"train_loss": -40.84016418457031, "global_step": 243192, "epoch": 2009} {"train_loss": -39.990760803222656, "global_step": 243193, "epoch": 2009} {"train_loss": -40.72200393676758, "global_step": 243194, "epoch": 2009} {"train_loss": -41.105953216552734, "global_step": 243195, "epoch": 2009} {"train_loss": -41.458492279052734, "global_step": 243196, "epoch": 2009} {"train_loss": -40.60767364501953, "global_step": 243197, "epoch": 2009} {"train_loss": -41.121089935302734, "global_step": 243198, "epoch": 2009} {"train_loss": -41.05799102783203, "global_step": 243199, "epoch": 2009} {"train_loss": -42.142295837402344, "global_step": 243200, "epoch": 2009} {"train_loss": -41.02926254272461, "global_step": 243201, "epoch": 2009} {"train_loss": -41.458492279052734, "global_step": 243202, "epoch": 2009} {"train_loss": -41.24880599975586, "global_step": 243203, "epoch": 2009} {"train_loss": -40.29168701171875, "global_step": 243204, "epoch": 2009} {"train_loss": -40.414363861083984, "global_step": 243205, "epoch": 2009} {"train_loss": -41.42750930786133, "global_step": 243206, "epoch": 2009} {"train_loss": -41.179969787597656, "global_step": 243207, "epoch": 2009} {"train_loss": -38.695594787597656, "global_step": 243208, "epoch": 2009} {"train_loss": -40.975117360264804, "global_step": 243209, "epoch": 2009, "val_loss": 2712409.0} {"train_loss": -41.066864013671875, "global_step": 243210, "epoch": 2010} {"train_loss": -41.894500732421875, "global_step": 243211, "epoch": 2010} {"train_loss": -41.90087890625, "global_step": 243212, "epoch": 2010} {"train_loss": -40.32174301147461, "global_step": 243213, "epoch": 2010} {"train_loss": -42.14989471435547, "global_step": 243214, "epoch": 2010} {"train_loss": -42.052852630615234, "global_step": 243215, "epoch": 2010} {"train_loss": -42.046966552734375, "global_step": 243216, "epoch": 2010} {"train_loss": -41.85832595825195, "global_step": 243217, "epoch": 2010} {"train_loss": -42.50007247924805, "global_step": 243218, "epoch": 2010} {"train_loss": -42.310791015625, "global_step": 243219, "epoch": 2010} {"train_loss": -42.15459060668945, "global_step": 243220, "epoch": 2010} {"train_loss": -42.08441925048828, "global_step": 243221, "epoch": 2010} {"train_loss": -41.45452880859375, "global_step": 243222, "epoch": 2010} {"train_loss": -42.19086837768555, "global_step": 243223, "epoch": 2010} {"train_loss": -42.190284729003906, "global_step": 243224, "epoch": 2010} {"train_loss": -42.13240051269531, "global_step": 243225, "epoch": 2010} {"train_loss": -41.33817672729492, "global_step": 243226, "epoch": 2010} {"train_loss": -42.12655258178711, "global_step": 243227, "epoch": 2010} {"train_loss": -41.92243576049805, "global_step": 243228, "epoch": 2010} {"train_loss": -40.96610641479492, "global_step": 243229, "epoch": 2010} {"train_loss": -41.821319580078125, "global_step": 243230, "epoch": 2010} {"train_loss": -41.51675033569336, "global_step": 243231, "epoch": 2010} {"train_loss": -40.95663070678711, "global_step": 243232, "epoch": 2010} {"train_loss": -41.711360931396484, "global_step": 243233, "epoch": 2010} {"train_loss": -41.75940704345703, "global_step": 243234, "epoch": 2010} {"train_loss": -42.15751266479492, "global_step": 243235, "epoch": 2010} {"train_loss": -41.96305465698242, "global_step": 243236, "epoch": 2010} {"train_loss": -41.36227035522461, "global_step": 243237, "epoch": 2010} {"train_loss": -42.42951202392578, "global_step": 243238, "epoch": 2010} {"train_loss": -42.557701110839844, "global_step": 243239, "epoch": 2010} {"train_loss": -42.47393798828125, "global_step": 243240, "epoch": 2010} {"train_loss": -42.47378158569336, "global_step": 243241, "epoch": 2010} {"train_loss": -42.075050354003906, "global_step": 243242, "epoch": 2010} {"train_loss": -42.15330123901367, "global_step": 243243, "epoch": 2010} {"train_loss": -41.771240234375, "global_step": 243244, "epoch": 2010} {"train_loss": -42.46342468261719, "global_step": 243245, "epoch": 2010} {"train_loss": -42.38572311401367, "global_step": 243246, "epoch": 2010} {"train_loss": -42.25089645385742, "global_step": 243247, "epoch": 2010} {"train_loss": -42.61862564086914, "global_step": 243248, "epoch": 2010} {"train_loss": -42.12137985229492, "global_step": 243249, "epoch": 2010} {"train_loss": -42.228614807128906, "global_step": 243250, "epoch": 2010} {"train_loss": -39.793392181396484, "global_step": 243251, "epoch": 2010} {"train_loss": -40.5135498046875, "global_step": 243252, "epoch": 2010} {"train_loss": -41.86666488647461, "global_step": 243253, "epoch": 2010} {"train_loss": -41.24822998046875, "global_step": 243254, "epoch": 2010} {"train_loss": -42.29844284057617, "global_step": 243255, "epoch": 2010} {"train_loss": -41.04218673706055, "global_step": 243256, "epoch": 2010} {"train_loss": -41.35702133178711, "global_step": 243257, "epoch": 2010} {"train_loss": -41.35908508300781, "global_step": 243258, "epoch": 2010} {"train_loss": -42.062721252441406, "global_step": 243259, "epoch": 2010} {"train_loss": -38.81700897216797, "global_step": 243260, "epoch": 2010} {"train_loss": -37.844173431396484, "global_step": 243261, "epoch": 2010} {"train_loss": -32.9543342590332, "global_step": 243262, "epoch": 2010} {"train_loss": -36.08467102050781, "global_step": 243263, "epoch": 2010} {"train_loss": -31.764968872070312, "global_step": 243264, "epoch": 2010} {"train_loss": -40.677001953125, "global_step": 243265, "epoch": 2010} {"train_loss": -41.201290130615234, "global_step": 243266, "epoch": 2010} {"train_loss": -38.19333267211914, "global_step": 243267, "epoch": 2010} {"train_loss": -41.426143646240234, "global_step": 243268, "epoch": 2010} {"train_loss": -37.1386604309082, "global_step": 243269, "epoch": 2010} {"train_loss": -37.00934600830078, "global_step": 243270, "epoch": 2010} {"train_loss": -40.287208557128906, "global_step": 243271, "epoch": 2010} {"train_loss": -40.0543098449707, "global_step": 243272, "epoch": 2010} {"train_loss": -39.35728073120117, "global_step": 243273, "epoch": 2010} {"train_loss": -40.555877685546875, "global_step": 243274, "epoch": 2010} {"train_loss": -40.72233963012695, "global_step": 243275, "epoch": 2010} {"train_loss": -35.99898910522461, "global_step": 243276, "epoch": 2010} {"train_loss": -40.003028869628906, "global_step": 243277, "epoch": 2010} {"train_loss": -37.3242301940918, "global_step": 243278, "epoch": 2010} {"train_loss": -37.361480712890625, "global_step": 243279, "epoch": 2010} {"train_loss": -39.787757873535156, "global_step": 243280, "epoch": 2010} {"train_loss": -39.227447509765625, "global_step": 243281, "epoch": 2010} {"train_loss": -41.065189361572266, "global_step": 243282, "epoch": 2010} {"train_loss": -39.875885009765625, "global_step": 243283, "epoch": 2010} {"train_loss": -40.681941986083984, "global_step": 243284, "epoch": 2010} {"train_loss": -38.10947799682617, "global_step": 243285, "epoch": 2010} {"train_loss": -38.799137115478516, "global_step": 243286, "epoch": 2010} {"train_loss": -39.8133659362793, "global_step": 243287, "epoch": 2010} {"train_loss": -39.861549377441406, "global_step": 243288, "epoch": 2010} {"train_loss": -40.073970794677734, "global_step": 243289, "epoch": 2010} {"train_loss": -40.09389877319336, "global_step": 243290, "epoch": 2010} {"train_loss": -40.0044059753418, "global_step": 243291, "epoch": 2010} {"train_loss": -39.95526123046875, "global_step": 243292, "epoch": 2010} {"train_loss": -41.310245513916016, "global_step": 243293, "epoch": 2010} {"train_loss": -37.478607177734375, "global_step": 243294, "epoch": 2010} {"train_loss": -36.88850021362305, "global_step": 243295, "epoch": 2010} {"train_loss": -35.655662536621094, "global_step": 243296, "epoch": 2010} {"train_loss": -39.07264709472656, "global_step": 243297, "epoch": 2010} {"train_loss": -39.78193283081055, "global_step": 243298, "epoch": 2010} {"train_loss": -40.16976547241211, "global_step": 243299, "epoch": 2010} {"train_loss": -40.54451370239258, "global_step": 243300, "epoch": 2010} {"train_loss": -38.66341018676758, "global_step": 243301, "epoch": 2010} {"train_loss": -40.828060150146484, "global_step": 243302, "epoch": 2010} {"train_loss": -40.54526901245117, "global_step": 243303, "epoch": 2010} {"train_loss": -40.918365478515625, "global_step": 243304, "epoch": 2010} {"train_loss": -39.20155715942383, "global_step": 243305, "epoch": 2010} {"train_loss": -41.3924560546875, "global_step": 243306, "epoch": 2010} {"train_loss": -40.7739143371582, "global_step": 243307, "epoch": 2010} {"train_loss": -39.717987060546875, "global_step": 243308, "epoch": 2010} {"train_loss": -41.19357681274414, "global_step": 243309, "epoch": 2010} {"train_loss": -40.23701858520508, "global_step": 243310, "epoch": 2010} {"train_loss": -40.79164123535156, "global_step": 243311, "epoch": 2010} {"train_loss": -39.609092712402344, "global_step": 243312, "epoch": 2010} {"train_loss": -40.078224182128906, "global_step": 243313, "epoch": 2010} {"train_loss": -40.3349723815918, "global_step": 243314, "epoch": 2010} {"train_loss": -40.39162826538086, "global_step": 243315, "epoch": 2010} {"train_loss": -41.09418487548828, "global_step": 243316, "epoch": 2010} {"train_loss": -40.155208587646484, "global_step": 243317, "epoch": 2010} {"train_loss": -41.32487869262695, "global_step": 243318, "epoch": 2010} {"train_loss": -41.57072067260742, "global_step": 243319, "epoch": 2010} {"train_loss": -39.88874435424805, "global_step": 243320, "epoch": 2010} {"train_loss": -39.45161056518555, "global_step": 243321, "epoch": 2010} {"train_loss": -41.27973556518555, "global_step": 243322, "epoch": 2010} {"train_loss": -39.24448776245117, "global_step": 243323, "epoch": 2010} {"train_loss": -40.36790084838867, "global_step": 243324, "epoch": 2010} {"train_loss": -40.22304153442383, "global_step": 243325, "epoch": 2010} {"train_loss": -41.658775329589844, "global_step": 243326, "epoch": 2010} {"train_loss": -41.61146545410156, "global_step": 243327, "epoch": 2010} {"train_loss": -40.41261672973633, "global_step": 243328, "epoch": 2010} {"train_loss": -41.162899017333984, "global_step": 243329, "epoch": 2010} {"train_loss": -40.48273685549901, "global_step": 243330, "epoch": 2010, "val_loss": 2611045.75} {"train_loss": -39.78825759887695, "global_step": 243331, "epoch": 2011} {"train_loss": -40.079280853271484, "global_step": 243332, "epoch": 2011} {"train_loss": -41.039466857910156, "global_step": 243333, "epoch": 2011} {"train_loss": -40.97520065307617, "global_step": 243334, "epoch": 2011} {"train_loss": -41.385704040527344, "global_step": 243335, "epoch": 2011} {"train_loss": -41.41215133666992, "global_step": 243336, "epoch": 2011} {"train_loss": -41.60929489135742, "global_step": 243337, "epoch": 2011} {"train_loss": -41.2127571105957, "global_step": 243338, "epoch": 2011} {"train_loss": -41.770751953125, "global_step": 243339, "epoch": 2011} {"train_loss": -41.2098388671875, "global_step": 243340, "epoch": 2011} {"train_loss": -41.16679763793945, "global_step": 243341, "epoch": 2011} {"train_loss": -41.17284393310547, "global_step": 243342, "epoch": 2011} {"train_loss": -42.18059158325195, "global_step": 243343, "epoch": 2011} {"train_loss": -41.6506462097168, "global_step": 243344, "epoch": 2011} {"train_loss": -41.3305549621582, "global_step": 243345, "epoch": 2011} {"train_loss": -41.49431228637695, "global_step": 243346, "epoch": 2011} {"train_loss": -40.38846969604492, "global_step": 243347, "epoch": 2011} {"train_loss": -41.85805130004883, "global_step": 243348, "epoch": 2011} {"train_loss": -40.990455627441406, "global_step": 243349, "epoch": 2011} {"train_loss": -41.05373001098633, "global_step": 243350, "epoch": 2011} {"train_loss": -42.439735412597656, "global_step": 243351, "epoch": 2011} {"train_loss": -41.53190994262695, "global_step": 243352, "epoch": 2011} {"train_loss": -41.41579055786133, "global_step": 243353, "epoch": 2011} {"train_loss": -41.14258575439453, "global_step": 243354, "epoch": 2011} {"train_loss": -41.85699462890625, "global_step": 243355, "epoch": 2011} {"train_loss": -42.426979064941406, "global_step": 243356, "epoch": 2011} {"train_loss": -41.695919036865234, "global_step": 243357, "epoch": 2011} {"train_loss": -41.561798095703125, "global_step": 243358, "epoch": 2011} {"train_loss": -41.874446868896484, "global_step": 243359, "epoch": 2011} {"train_loss": -40.07837677001953, "global_step": 243360, "epoch": 2011} {"train_loss": -42.23737335205078, "global_step": 243361, "epoch": 2011} {"train_loss": -42.41630172729492, "global_step": 243362, "epoch": 2011} {"train_loss": -41.5499382019043, "global_step": 243363, "epoch": 2011} {"train_loss": -42.1967887878418, "global_step": 243364, "epoch": 2011} {"train_loss": -41.716487884521484, "global_step": 243365, "epoch": 2011} {"train_loss": -41.92570114135742, "global_step": 243366, "epoch": 2011} {"train_loss": -41.65732192993164, "global_step": 243367, "epoch": 2011} {"train_loss": -41.916717529296875, "global_step": 243368, "epoch": 2011} {"train_loss": -42.135902404785156, "global_step": 243369, "epoch": 2011} {"train_loss": -42.4647331237793, "global_step": 243370, "epoch": 2011} {"train_loss": -42.40513229370117, "global_step": 243371, "epoch": 2011} {"train_loss": -41.77634811401367, "global_step": 243372, "epoch": 2011} {"train_loss": -42.19118118286133, "global_step": 243373, "epoch": 2011} {"train_loss": -42.111534118652344, "global_step": 243374, "epoch": 2011} {"train_loss": -42.024139404296875, "global_step": 243375, "epoch": 2011} {"train_loss": -42.036685943603516, "global_step": 243376, "epoch": 2011} {"train_loss": -42.1678466796875, "global_step": 243377, "epoch": 2011} {"train_loss": -42.671417236328125, "global_step": 243378, "epoch": 2011} {"train_loss": -42.55635452270508, "global_step": 243379, "epoch": 2011} {"train_loss": -42.13019561767578, "global_step": 243380, "epoch": 2011} {"train_loss": -42.44655990600586, "global_step": 243381, "epoch": 2011} {"train_loss": -42.69497299194336, "global_step": 243382, "epoch": 2011} {"train_loss": -43.139923095703125, "global_step": 243383, "epoch": 2011} {"train_loss": -42.720611572265625, "global_step": 243384, "epoch": 2011} {"train_loss": -41.793758392333984, "global_step": 243385, "epoch": 2011} {"train_loss": -41.826534271240234, "global_step": 243386, "epoch": 2011} {"train_loss": -42.142513275146484, "global_step": 243387, "epoch": 2011} {"train_loss": -40.52699661254883, "global_step": 243388, "epoch": 2011} {"train_loss": -41.73381042480469, "global_step": 243389, "epoch": 2011} {"train_loss": -39.849910736083984, "global_step": 243390, "epoch": 2011} {"train_loss": -40.64945602416992, "global_step": 243391, "epoch": 2011} {"train_loss": -38.73346710205078, "global_step": 243392, "epoch": 2011} {"train_loss": -39.557647705078125, "global_step": 243393, "epoch": 2011} {"train_loss": -41.87432861328125, "global_step": 243394, "epoch": 2011} {"train_loss": -41.4726676940918, "global_step": 243395, "epoch": 2011} {"train_loss": -39.56904983520508, "global_step": 243396, "epoch": 2011} {"train_loss": -39.1890754699707, "global_step": 243397, "epoch": 2011} {"train_loss": -38.30267333984375, "global_step": 243398, "epoch": 2011} {"train_loss": -39.751888275146484, "global_step": 243399, "epoch": 2011} {"train_loss": -38.12895584106445, "global_step": 243400, "epoch": 2011} {"train_loss": -39.52695846557617, "global_step": 243401, "epoch": 2011} {"train_loss": -39.943782806396484, "global_step": 243402, "epoch": 2011} {"train_loss": -38.26652908325195, "global_step": 243403, "epoch": 2011} {"train_loss": -40.32891082763672, "global_step": 243404, "epoch": 2011} {"train_loss": -40.63656234741211, "global_step": 243405, "epoch": 2011} {"train_loss": -37.19367599487305, "global_step": 243406, "epoch": 2011} {"train_loss": -40.75309371948242, "global_step": 243407, "epoch": 2011} {"train_loss": -39.65605163574219, "global_step": 243408, "epoch": 2011} {"train_loss": -40.46096420288086, "global_step": 243409, "epoch": 2011} {"train_loss": -40.7357292175293, "global_step": 243410, "epoch": 2011} {"train_loss": -40.36149978637695, "global_step": 243411, "epoch": 2011} {"train_loss": -41.61884689331055, "global_step": 243412, "epoch": 2011} {"train_loss": -41.143463134765625, "global_step": 243413, "epoch": 2011} {"train_loss": -40.996498107910156, "global_step": 243414, "epoch": 2011} {"train_loss": -41.69697189331055, "global_step": 243415, "epoch": 2011} {"train_loss": -40.83393096923828, "global_step": 243416, "epoch": 2011} {"train_loss": -41.10762405395508, "global_step": 243417, "epoch": 2011} {"train_loss": -40.43634796142578, "global_step": 243418, "epoch": 2011} {"train_loss": -42.42585372924805, "global_step": 243419, "epoch": 2011} {"train_loss": -40.31752395629883, "global_step": 243420, "epoch": 2011} {"train_loss": -41.18959045410156, "global_step": 243421, "epoch": 2011} {"train_loss": -41.791847229003906, "global_step": 243422, "epoch": 2011} {"train_loss": -42.123165130615234, "global_step": 243423, "epoch": 2011} {"train_loss": -42.35064697265625, "global_step": 243424, "epoch": 2011} {"train_loss": -40.57575225830078, "global_step": 243425, "epoch": 2011} {"train_loss": -41.412940979003906, "global_step": 243426, "epoch": 2011} {"train_loss": -40.6513557434082, "global_step": 243427, "epoch": 2011} {"train_loss": -41.778175354003906, "global_step": 243428, "epoch": 2011} {"train_loss": -41.390106201171875, "global_step": 243429, "epoch": 2011} {"train_loss": -41.40549850463867, "global_step": 243430, "epoch": 2011} {"train_loss": -40.65739822387695, "global_step": 243431, "epoch": 2011} {"train_loss": -41.81837463378906, "global_step": 243432, "epoch": 2011} {"train_loss": -41.383766174316406, "global_step": 243433, "epoch": 2011} {"train_loss": -41.660362243652344, "global_step": 243434, "epoch": 2011} {"train_loss": -42.27033615112305, "global_step": 243435, "epoch": 2011} {"train_loss": -41.79552459716797, "global_step": 243436, "epoch": 2011} {"train_loss": -42.191123962402344, "global_step": 243437, "epoch": 2011} {"train_loss": -42.2049446105957, "global_step": 243438, "epoch": 2011} {"train_loss": -41.951904296875, "global_step": 243439, "epoch": 2011} {"train_loss": -41.541847229003906, "global_step": 243440, "epoch": 2011} {"train_loss": -42.0120964050293, "global_step": 243441, "epoch": 2011} {"train_loss": -42.04096603393555, "global_step": 243442, "epoch": 2011} {"train_loss": -41.523338317871094, "global_step": 243443, "epoch": 2011} {"train_loss": -41.93247604370117, "global_step": 243444, "epoch": 2011} {"train_loss": -41.11763000488281, "global_step": 243445, "epoch": 2011} {"train_loss": -41.73023223876953, "global_step": 243446, "epoch": 2011} {"train_loss": -42.105255126953125, "global_step": 243447, "epoch": 2011} {"train_loss": -42.644771575927734, "global_step": 243448, "epoch": 2011} {"train_loss": -42.31554412841797, "global_step": 243449, "epoch": 2011} {"train_loss": -42.47309112548828, "global_step": 243450, "epoch": 2011} {"train_loss": -41.332718084666354, "global_step": 243451, "epoch": 2011, "val_loss": 2535025.0} {"train_loss": -42.1530647277832, "global_step": 243452, "epoch": 2012} {"train_loss": -42.429115295410156, "global_step": 243453, "epoch": 2012} {"train_loss": -42.74222946166992, "global_step": 243454, "epoch": 2012} {"train_loss": -42.458641052246094, "global_step": 243455, "epoch": 2012} {"train_loss": -42.01691818237305, "global_step": 243456, "epoch": 2012} {"train_loss": -42.60622024536133, "global_step": 243457, "epoch": 2012} {"train_loss": -42.23696517944336, "global_step": 243458, "epoch": 2012} {"train_loss": -42.28477096557617, "global_step": 243459, "epoch": 2012} {"train_loss": -43.04280471801758, "global_step": 243460, "epoch": 2012} {"train_loss": -42.77327346801758, "global_step": 243461, "epoch": 2012} {"train_loss": -42.892425537109375, "global_step": 243462, "epoch": 2012} {"train_loss": -42.80479049682617, "global_step": 243463, "epoch": 2012} {"train_loss": -42.97715377807617, "global_step": 243464, "epoch": 2012} {"train_loss": -41.69468307495117, "global_step": 243465, "epoch": 2012} {"train_loss": -42.35304641723633, "global_step": 243466, "epoch": 2012} {"train_loss": -42.7852897644043, "global_step": 243467, "epoch": 2012} {"train_loss": -42.445838928222656, "global_step": 243468, "epoch": 2012} {"train_loss": -42.93310546875, "global_step": 243469, "epoch": 2012} {"train_loss": -40.757591247558594, "global_step": 243470, "epoch": 2012} {"train_loss": -42.406494140625, "global_step": 243471, "epoch": 2012} {"train_loss": -42.32503890991211, "global_step": 243472, "epoch": 2012} {"train_loss": -42.29969787597656, "global_step": 243473, "epoch": 2012} {"train_loss": -42.09629440307617, "global_step": 243474, "epoch": 2012} {"train_loss": -42.85898971557617, "global_step": 243475, "epoch": 2012} {"train_loss": -42.5105094909668, "global_step": 243476, "epoch": 2012} {"train_loss": -41.919944763183594, "global_step": 243477, "epoch": 2012} {"train_loss": -42.26249313354492, "global_step": 243478, "epoch": 2012} {"train_loss": -41.64347457885742, "global_step": 243479, "epoch": 2012} {"train_loss": -41.7684440612793, "global_step": 243480, "epoch": 2012} {"train_loss": -41.72947692871094, "global_step": 243481, "epoch": 2012} {"train_loss": -42.068824768066406, "global_step": 243482, "epoch": 2012} {"train_loss": -41.60024642944336, "global_step": 243483, "epoch": 2012} {"train_loss": -41.35883712768555, "global_step": 243484, "epoch": 2012} {"train_loss": -42.392425537109375, "global_step": 243485, "epoch": 2012} {"train_loss": -39.74345397949219, "global_step": 243486, "epoch": 2012} {"train_loss": -38.48775863647461, "global_step": 243487, "epoch": 2012} {"train_loss": -41.28401565551758, "global_step": 243488, "epoch": 2012} {"train_loss": -35.490543365478516, "global_step": 243489, "epoch": 2012} {"train_loss": -28.6854305267334, "global_step": 243490, "epoch": 2012} {"train_loss": -37.36135482788086, "global_step": 243491, "epoch": 2012} {"train_loss": -40.471431732177734, "global_step": 243492, "epoch": 2012} {"train_loss": -36.6839714050293, "global_step": 243493, "epoch": 2012} {"train_loss": -38.7054328918457, "global_step": 243494, "epoch": 2012} {"train_loss": -37.69050979614258, "global_step": 243495, "epoch": 2012} {"train_loss": -39.46185302734375, "global_step": 243496, "epoch": 2012} {"train_loss": -41.2124137878418, "global_step": 243497, "epoch": 2012} {"train_loss": -40.49158477783203, "global_step": 243498, "epoch": 2012} {"train_loss": -40.20908737182617, "global_step": 243499, "epoch": 2012} {"train_loss": -39.78471755981445, "global_step": 243500, "epoch": 2012} {"train_loss": -40.908851623535156, "global_step": 243501, "epoch": 2012} {"train_loss": -40.42570877075195, "global_step": 243502, "epoch": 2012} {"train_loss": -40.11222457885742, "global_step": 243503, "epoch": 2012} {"train_loss": -40.25010299682617, "global_step": 243504, "epoch": 2012} {"train_loss": -38.1839714050293, "global_step": 243505, "epoch": 2012} {"train_loss": -40.81714630126953, "global_step": 243506, "epoch": 2012} {"train_loss": -40.41770553588867, "global_step": 243507, "epoch": 2012} {"train_loss": -41.86249542236328, "global_step": 243508, "epoch": 2012} {"train_loss": -41.09647750854492, "global_step": 243509, "epoch": 2012} {"train_loss": -39.90330123901367, "global_step": 243510, "epoch": 2012} {"train_loss": -41.594207763671875, "global_step": 243511, "epoch": 2012} {"train_loss": -38.46696090698242, "global_step": 243512, "epoch": 2012} {"train_loss": -41.57929611206055, "global_step": 243513, "epoch": 2012} {"train_loss": -41.39360427856445, "global_step": 243514, "epoch": 2012} {"train_loss": -42.01321792602539, "global_step": 243515, "epoch": 2012} {"train_loss": -41.245243072509766, "global_step": 243516, "epoch": 2012} {"train_loss": -41.555206298828125, "global_step": 243517, "epoch": 2012} {"train_loss": -41.54894256591797, "global_step": 243518, "epoch": 2012} {"train_loss": -42.41766357421875, "global_step": 243519, "epoch": 2012} {"train_loss": -41.750762939453125, "global_step": 243520, "epoch": 2012} {"train_loss": -42.212989807128906, "global_step": 243521, "epoch": 2012} {"train_loss": -42.30641555786133, "global_step": 243522, "epoch": 2012} {"train_loss": -41.50560760498047, "global_step": 243523, "epoch": 2012} {"train_loss": -42.02655792236328, "global_step": 243524, "epoch": 2012} {"train_loss": -41.8770866394043, "global_step": 243525, "epoch": 2012} {"train_loss": -42.6034049987793, "global_step": 243526, "epoch": 2012} {"train_loss": -42.341182708740234, "global_step": 243527, "epoch": 2012} {"train_loss": -41.846038818359375, "global_step": 243528, "epoch": 2012} {"train_loss": -42.156898498535156, "global_step": 243529, "epoch": 2012} {"train_loss": -41.786277770996094, "global_step": 243530, "epoch": 2012} {"train_loss": -42.26913070678711, "global_step": 243531, "epoch": 2012} {"train_loss": -42.55577850341797, "global_step": 243532, "epoch": 2012} {"train_loss": -41.949974060058594, "global_step": 243533, "epoch": 2012} {"train_loss": -42.2938346862793, "global_step": 243534, "epoch": 2012} {"train_loss": -42.40692901611328, "global_step": 243535, "epoch": 2012} {"train_loss": -42.655906677246094, "global_step": 243536, "epoch": 2012} {"train_loss": -42.221012115478516, "global_step": 243537, "epoch": 2012} {"train_loss": -42.57728958129883, "global_step": 243538, "epoch": 2012} {"train_loss": -42.504878997802734, "global_step": 243539, "epoch": 2012} {"train_loss": -42.781288146972656, "global_step": 243540, "epoch": 2012} {"train_loss": -42.7073974609375, "global_step": 243541, "epoch": 2012} {"train_loss": -42.535884857177734, "global_step": 243542, "epoch": 2012} {"train_loss": -42.711463928222656, "global_step": 243543, "epoch": 2012} {"train_loss": -42.103736877441406, "global_step": 243544, "epoch": 2012} {"train_loss": -42.08004379272461, "global_step": 243545, "epoch": 2012} {"train_loss": -42.484413146972656, "global_step": 243546, "epoch": 2012} {"train_loss": -42.69775390625, "global_step": 243547, "epoch": 2012} {"train_loss": -43.19093704223633, "global_step": 243548, "epoch": 2012} {"train_loss": -42.771392822265625, "global_step": 243549, "epoch": 2012} {"train_loss": -42.51417922973633, "global_step": 243550, "epoch": 2012} {"train_loss": -42.365596771240234, "global_step": 243551, "epoch": 2012} {"train_loss": -41.872840881347656, "global_step": 243552, "epoch": 2012} {"train_loss": -41.79972457885742, "global_step": 243553, "epoch": 2012} {"train_loss": -41.9458122253418, "global_step": 243554, "epoch": 2012} {"train_loss": -42.43697738647461, "global_step": 243555, "epoch": 2012} {"train_loss": -43.0147819519043, "global_step": 243556, "epoch": 2012} {"train_loss": -42.31089782714844, "global_step": 243557, "epoch": 2012} {"train_loss": -42.605281829833984, "global_step": 243558, "epoch": 2012} {"train_loss": -42.45920944213867, "global_step": 243559, "epoch": 2012} {"train_loss": -42.929840087890625, "global_step": 243560, "epoch": 2012} {"train_loss": -42.28884506225586, "global_step": 243561, "epoch": 2012} {"train_loss": -42.54307174682617, "global_step": 243562, "epoch": 2012} {"train_loss": -42.15055847167969, "global_step": 243563, "epoch": 2012} {"train_loss": -42.46772003173828, "global_step": 243564, "epoch": 2012} {"train_loss": -42.81534957885742, "global_step": 243565, "epoch": 2012} {"train_loss": -41.94104766845703, "global_step": 243566, "epoch": 2012} {"train_loss": -42.7302360534668, "global_step": 243567, "epoch": 2012} {"train_loss": -42.81684112548828, "global_step": 243568, "epoch": 2012} {"train_loss": -42.20368194580078, "global_step": 243569, "epoch": 2012} {"train_loss": -42.9455680847168, "global_step": 243570, "epoch": 2012} {"train_loss": -42.218807220458984, "global_step": 243571, "epoch": 2012} {"train_loss": -41.61499340278058, "global_step": 243572, "epoch": 2012, "val_loss": 2585099.75} {"train_loss": -41.67683792114258, "global_step": 243573, "epoch": 2013} {"train_loss": -42.86626434326172, "global_step": 243574, "epoch": 2013} {"train_loss": -42.1353759765625, "global_step": 243575, "epoch": 2013} {"train_loss": -42.88816452026367, "global_step": 243576, "epoch": 2013} {"train_loss": -42.318729400634766, "global_step": 243577, "epoch": 2013} {"train_loss": -42.39960861206055, "global_step": 243578, "epoch": 2013} {"train_loss": -42.17215347290039, "global_step": 243579, "epoch": 2013} {"train_loss": -42.603309631347656, "global_step": 243580, "epoch": 2013} {"train_loss": -43.2710075378418, "global_step": 243581, "epoch": 2013} {"train_loss": -42.95493698120117, "global_step": 243582, "epoch": 2013} {"train_loss": -42.28738021850586, "global_step": 243583, "epoch": 2013} {"train_loss": -41.9081916809082, "global_step": 243584, "epoch": 2013} {"train_loss": -42.70387649536133, "global_step": 243585, "epoch": 2013} {"train_loss": -42.26909637451172, "global_step": 243586, "epoch": 2013} {"train_loss": -41.806392669677734, "global_step": 243587, "epoch": 2013} {"train_loss": -41.58260726928711, "global_step": 243588, "epoch": 2013} {"train_loss": -42.082969665527344, "global_step": 243589, "epoch": 2013} {"train_loss": -42.88889694213867, "global_step": 243590, "epoch": 2013} {"train_loss": -41.97445297241211, "global_step": 243591, "epoch": 2013} {"train_loss": -43.11714172363281, "global_step": 243592, "epoch": 2013} {"train_loss": -42.05620574951172, "global_step": 243593, "epoch": 2013} {"train_loss": -41.08381271362305, "global_step": 243594, "epoch": 2013} {"train_loss": -42.13669204711914, "global_step": 243595, "epoch": 2013} {"train_loss": -41.92116165161133, "global_step": 243596, "epoch": 2013} {"train_loss": -41.52865982055664, "global_step": 243597, "epoch": 2013} {"train_loss": -43.06515121459961, "global_step": 243598, "epoch": 2013} {"train_loss": -41.29179763793945, "global_step": 243599, "epoch": 2013} {"train_loss": -41.9118537902832, "global_step": 243600, "epoch": 2013} {"train_loss": -42.641292572021484, "global_step": 243601, "epoch": 2013} {"train_loss": -41.87504196166992, "global_step": 243602, "epoch": 2013} {"train_loss": -41.700069427490234, "global_step": 243603, "epoch": 2013} {"train_loss": -42.514198303222656, "global_step": 243604, "epoch": 2013} {"train_loss": -41.0296630859375, "global_step": 243605, "epoch": 2013} {"train_loss": -40.35651397705078, "global_step": 243606, "epoch": 2013} {"train_loss": -35.878570556640625, "global_step": 243607, "epoch": 2013} {"train_loss": -42.0372314453125, "global_step": 243608, "epoch": 2013} {"train_loss": -40.05134201049805, "global_step": 243609, "epoch": 2013} {"train_loss": -37.95603561401367, "global_step": 243610, "epoch": 2013} {"train_loss": -40.773651123046875, "global_step": 243611, "epoch": 2013} {"train_loss": -41.230384826660156, "global_step": 243612, "epoch": 2013} {"train_loss": -37.240108489990234, "global_step": 243613, "epoch": 2013} {"train_loss": -33.365421295166016, "global_step": 243614, "epoch": 2013} {"train_loss": -37.749515533447266, "global_step": 243615, "epoch": 2013} {"train_loss": -38.24172592163086, "global_step": 243616, "epoch": 2013} {"train_loss": -40.437469482421875, "global_step": 243617, "epoch": 2013} {"train_loss": -39.53758239746094, "global_step": 243618, "epoch": 2013} {"train_loss": -39.837799072265625, "global_step": 243619, "epoch": 2013} {"train_loss": -40.11348342895508, "global_step": 243620, "epoch": 2013} {"train_loss": -40.240234375, "global_step": 243621, "epoch": 2013} {"train_loss": -34.186614990234375, "global_step": 243622, "epoch": 2013} {"train_loss": -34.901851654052734, "global_step": 243623, "epoch": 2013} {"train_loss": -34.079341888427734, "global_step": 243624, "epoch": 2013} {"train_loss": -39.813289642333984, "global_step": 243625, "epoch": 2013} {"train_loss": -35.187171936035156, "global_step": 243626, "epoch": 2013} {"train_loss": -40.665767669677734, "global_step": 243627, "epoch": 2013} {"train_loss": -40.20207595825195, "global_step": 243628, "epoch": 2013} {"train_loss": -25.623441696166992, "global_step": 243629, "epoch": 2013} {"train_loss": -37.85731887817383, "global_step": 243630, "epoch": 2013} {"train_loss": -37.76829147338867, "global_step": 243631, "epoch": 2013} {"train_loss": -40.45014190673828, "global_step": 243632, "epoch": 2013} {"train_loss": -38.12403869628906, "global_step": 243633, "epoch": 2013} {"train_loss": -37.446258544921875, "global_step": 243634, "epoch": 2013} {"train_loss": -26.666187286376953, "global_step": 243635, "epoch": 2013} {"train_loss": -39.368953704833984, "global_step": 243636, "epoch": 2013} {"train_loss": -38.10352325439453, "global_step": 243637, "epoch": 2013} {"train_loss": -37.74363327026367, "global_step": 243638, "epoch": 2013} {"train_loss": -32.26015853881836, "global_step": 243639, "epoch": 2013} {"train_loss": -20.262752532958984, "global_step": 243640, "epoch": 2013} {"train_loss": -32.3569221496582, "global_step": 243641, "epoch": 2013} {"train_loss": -38.050071716308594, "global_step": 243642, "epoch": 2013} {"train_loss": -35.61188507080078, "global_step": 243643, "epoch": 2013} {"train_loss": -32.79411697387695, "global_step": 243644, "epoch": 2013} {"train_loss": -39.17871856689453, "global_step": 243645, "epoch": 2013} {"train_loss": -30.681379318237305, "global_step": 243646, "epoch": 2013} {"train_loss": -36.74808883666992, "global_step": 243647, "epoch": 2013} {"train_loss": -38.681209564208984, "global_step": 243648, "epoch": 2013} {"train_loss": -36.77859115600586, "global_step": 243649, "epoch": 2013} {"train_loss": -38.57301330566406, "global_step": 243650, "epoch": 2013} {"train_loss": -39.291133880615234, "global_step": 243651, "epoch": 2013} {"train_loss": -38.71318054199219, "global_step": 243652, "epoch": 2013} {"train_loss": -34.88711166381836, "global_step": 243653, "epoch": 2013} {"train_loss": -37.43715286254883, "global_step": 243654, "epoch": 2013} {"train_loss": -34.10595703125, "global_step": 243655, "epoch": 2013} {"train_loss": -35.965667724609375, "global_step": 243656, "epoch": 2013} {"train_loss": -38.4769401550293, "global_step": 243657, "epoch": 2013} {"train_loss": -37.44111633300781, "global_step": 243658, "epoch": 2013} {"train_loss": -39.24631881713867, "global_step": 243659, "epoch": 2013} {"train_loss": -35.165443420410156, "global_step": 243660, "epoch": 2013} {"train_loss": -39.04072189331055, "global_step": 243661, "epoch": 2013} {"train_loss": -37.00898742675781, "global_step": 243662, "epoch": 2013} {"train_loss": -39.49924850463867, "global_step": 243663, "epoch": 2013} {"train_loss": -39.49006271362305, "global_step": 243664, "epoch": 2013} {"train_loss": -35.900691986083984, "global_step": 243665, "epoch": 2013} {"train_loss": -39.6730842590332, "global_step": 243666, "epoch": 2013} {"train_loss": -39.7162971496582, "global_step": 243667, "epoch": 2013} {"train_loss": -39.54436492919922, "global_step": 243668, "epoch": 2013} {"train_loss": -39.06932067871094, "global_step": 243669, "epoch": 2013} {"train_loss": -39.47525405883789, "global_step": 243670, "epoch": 2013} {"train_loss": -39.890777587890625, "global_step": 243671, "epoch": 2013} {"train_loss": -38.851070404052734, "global_step": 243672, "epoch": 2013} {"train_loss": -39.8449821472168, "global_step": 243673, "epoch": 2013} {"train_loss": -40.062042236328125, "global_step": 243674, "epoch": 2013} {"train_loss": -38.88824462890625, "global_step": 243675, "epoch": 2013} {"train_loss": -38.84832763671875, "global_step": 243676, "epoch": 2013} {"train_loss": -40.69178771972656, "global_step": 243677, "epoch": 2013} {"train_loss": -40.53986358642578, "global_step": 243678, "epoch": 2013} {"train_loss": -39.67839050292969, "global_step": 243679, "epoch": 2013} {"train_loss": -40.26375961303711, "global_step": 243680, "epoch": 2013} {"train_loss": -40.75587844848633, "global_step": 243681, "epoch": 2013} {"train_loss": -40.3565788269043, "global_step": 243682, "epoch": 2013} {"train_loss": -38.47123336791992, "global_step": 243683, "epoch": 2013} {"train_loss": -40.660343170166016, "global_step": 243684, "epoch": 2013} {"train_loss": -40.27871322631836, "global_step": 243685, "epoch": 2013} {"train_loss": -40.6895866394043, "global_step": 243686, "epoch": 2013} {"train_loss": -40.683128356933594, "global_step": 243687, "epoch": 2013} {"train_loss": -40.07442092895508, "global_step": 243688, "epoch": 2013} {"train_loss": -41.075904846191406, "global_step": 243689, "epoch": 2013} {"train_loss": -41.12826156616211, "global_step": 243690, "epoch": 2013} {"train_loss": -41.16402053833008, "global_step": 243691, "epoch": 2013} {"train_loss": -41.156211853027344, "global_step": 243692, "epoch": 2013} {"train_loss": -39.0994862327891, "global_step": 243693, "epoch": 2013, "val_loss": 2607985.75} {"train_loss": -40.14175033569336, "global_step": 243694, "epoch": 2014} {"train_loss": -40.31351852416992, "global_step": 243695, "epoch": 2014} {"train_loss": -41.63267135620117, "global_step": 243696, "epoch": 2014} {"train_loss": -41.25181198120117, "global_step": 243697, "epoch": 2014} {"train_loss": -41.158084869384766, "global_step": 243698, "epoch": 2014} {"train_loss": -40.89411544799805, "global_step": 243699, "epoch": 2014} {"train_loss": -41.320396423339844, "global_step": 243700, "epoch": 2014} {"train_loss": -41.476776123046875, "global_step": 243701, "epoch": 2014} {"train_loss": -41.416175842285156, "global_step": 243702, "epoch": 2014} {"train_loss": -41.04655075073242, "global_step": 243703, "epoch": 2014} {"train_loss": -41.095211029052734, "global_step": 243704, "epoch": 2014} {"train_loss": -41.2588005065918, "global_step": 243705, "epoch": 2014} {"train_loss": -40.89094924926758, "global_step": 243706, "epoch": 2014} {"train_loss": -41.66935729980469, "global_step": 243707, "epoch": 2014} {"train_loss": -41.38154983520508, "global_step": 243708, "epoch": 2014} {"train_loss": -41.71436309814453, "global_step": 243709, "epoch": 2014} {"train_loss": -41.586727142333984, "global_step": 243710, "epoch": 2014} {"train_loss": -41.687049865722656, "global_step": 243711, "epoch": 2014} {"train_loss": -41.97237014770508, "global_step": 243712, "epoch": 2014} {"train_loss": -40.60780334472656, "global_step": 243713, "epoch": 2014} {"train_loss": -41.3004264831543, "global_step": 243714, "epoch": 2014} {"train_loss": -39.88964080810547, "global_step": 243715, "epoch": 2014} {"train_loss": -41.36043930053711, "global_step": 243716, "epoch": 2014} {"train_loss": -41.861671447753906, "global_step": 243717, "epoch": 2014} {"train_loss": -40.81299591064453, "global_step": 243718, "epoch": 2014} {"train_loss": -41.75041961669922, "global_step": 243719, "epoch": 2014} {"train_loss": -41.07253646850586, "global_step": 243720, "epoch": 2014} {"train_loss": -41.40346908569336, "global_step": 243721, "epoch": 2014} {"train_loss": -41.59597396850586, "global_step": 243722, "epoch": 2014} {"train_loss": -41.241817474365234, "global_step": 243723, "epoch": 2014} {"train_loss": -41.33930587768555, "global_step": 243724, "epoch": 2014} {"train_loss": -40.81694412231445, "global_step": 243725, "epoch": 2014} {"train_loss": -42.29542922973633, "global_step": 243726, "epoch": 2014} {"train_loss": -42.42226028442383, "global_step": 243727, "epoch": 2014} {"train_loss": -42.11871337890625, "global_step": 243728, "epoch": 2014} {"train_loss": -42.32215118408203, "global_step": 243729, "epoch": 2014} {"train_loss": -39.916725158691406, "global_step": 243730, "epoch": 2014} {"train_loss": -41.8283805847168, "global_step": 243731, "epoch": 2014} {"train_loss": -42.29063034057617, "global_step": 243732, "epoch": 2014} {"train_loss": -41.13322830200195, "global_step": 243733, "epoch": 2014} {"train_loss": -41.550445556640625, "global_step": 243734, "epoch": 2014} {"train_loss": -41.95309829711914, "global_step": 243735, "epoch": 2014} {"train_loss": -41.84973907470703, "global_step": 243736, "epoch": 2014} {"train_loss": -41.42885971069336, "global_step": 243737, "epoch": 2014} {"train_loss": -42.11794662475586, "global_step": 243738, "epoch": 2014} {"train_loss": -41.53956985473633, "global_step": 243739, "epoch": 2014} {"train_loss": -40.9975471496582, "global_step": 243740, "epoch": 2014} {"train_loss": -41.980712890625, "global_step": 243741, "epoch": 2014} {"train_loss": -41.9751091003418, "global_step": 243742, "epoch": 2014} {"train_loss": -42.1293830871582, "global_step": 243743, "epoch": 2014} {"train_loss": -41.38051223754883, "global_step": 243744, "epoch": 2014} {"train_loss": -41.861507415771484, "global_step": 243745, "epoch": 2014} {"train_loss": -41.029666900634766, "global_step": 243746, "epoch": 2014} {"train_loss": -41.59546661376953, "global_step": 243747, "epoch": 2014} {"train_loss": -42.29180908203125, "global_step": 243748, "epoch": 2014} {"train_loss": -42.46760177612305, "global_step": 243749, "epoch": 2014} {"train_loss": -42.207855224609375, "global_step": 243750, "epoch": 2014} {"train_loss": -42.1424560546875, "global_step": 243751, "epoch": 2014} {"train_loss": -42.23177719116211, "global_step": 243752, "epoch": 2014} {"train_loss": -41.793067932128906, "global_step": 243753, "epoch": 2014} {"train_loss": -42.336669921875, "global_step": 243754, "epoch": 2014} {"train_loss": -42.12648391723633, "global_step": 243755, "epoch": 2014} {"train_loss": -42.666160583496094, "global_step": 243756, "epoch": 2014} {"train_loss": -41.84821319580078, "global_step": 243757, "epoch": 2014} {"train_loss": -42.32011032104492, "global_step": 243758, "epoch": 2014} {"train_loss": -42.512054443359375, "global_step": 243759, "epoch": 2014} {"train_loss": -42.48325729370117, "global_step": 243760, "epoch": 2014} {"train_loss": -42.15641403198242, "global_step": 243761, "epoch": 2014} {"train_loss": -41.50132369995117, "global_step": 243762, "epoch": 2014} {"train_loss": -42.0974235534668, "global_step": 243763, "epoch": 2014} {"train_loss": -42.46272659301758, "global_step": 243764, "epoch": 2014} {"train_loss": -41.145652770996094, "global_step": 243765, "epoch": 2014} {"train_loss": -42.4552116394043, "global_step": 243766, "epoch": 2014} {"train_loss": -42.402008056640625, "global_step": 243767, "epoch": 2014} {"train_loss": -42.38066864013672, "global_step": 243768, "epoch": 2014} {"train_loss": -42.335018157958984, "global_step": 243769, "epoch": 2014} {"train_loss": -42.40729522705078, "global_step": 243770, "epoch": 2014} {"train_loss": -43.022212982177734, "global_step": 243771, "epoch": 2014} {"train_loss": -41.988319396972656, "global_step": 243772, "epoch": 2014} {"train_loss": -42.38490676879883, "global_step": 243773, "epoch": 2014} {"train_loss": -41.73480987548828, "global_step": 243774, "epoch": 2014} {"train_loss": -41.555850982666016, "global_step": 243775, "epoch": 2014} {"train_loss": -42.3382682800293, "global_step": 243776, "epoch": 2014} {"train_loss": -42.1906852722168, "global_step": 243777, "epoch": 2014} {"train_loss": -41.38322067260742, "global_step": 243778, "epoch": 2014} {"train_loss": -38.47175216674805, "global_step": 243779, "epoch": 2014} {"train_loss": -39.11875534057617, "global_step": 243780, "epoch": 2014} {"train_loss": -41.03126907348633, "global_step": 243781, "epoch": 2014} {"train_loss": -42.105491638183594, "global_step": 243782, "epoch": 2014} {"train_loss": -40.11908721923828, "global_step": 243783, "epoch": 2014} {"train_loss": -39.40036392211914, "global_step": 243784, "epoch": 2014} {"train_loss": -41.2146110534668, "global_step": 243785, "epoch": 2014} {"train_loss": -42.23806381225586, "global_step": 243786, "epoch": 2014} {"train_loss": -41.99546432495117, "global_step": 243787, "epoch": 2014} {"train_loss": -40.81022262573242, "global_step": 243788, "epoch": 2014} {"train_loss": -41.796783447265625, "global_step": 243789, "epoch": 2014} {"train_loss": -42.19552230834961, "global_step": 243790, "epoch": 2014} {"train_loss": -41.806148529052734, "global_step": 243791, "epoch": 2014} {"train_loss": -41.112823486328125, "global_step": 243792, "epoch": 2014} {"train_loss": -41.47047805786133, "global_step": 243793, "epoch": 2014} {"train_loss": -41.74232864379883, "global_step": 243794, "epoch": 2014} {"train_loss": -42.8360481262207, "global_step": 243795, "epoch": 2014} {"train_loss": -42.529335021972656, "global_step": 243796, "epoch": 2014} {"train_loss": -42.28793716430664, "global_step": 243797, "epoch": 2014} {"train_loss": -42.31182098388672, "global_step": 243798, "epoch": 2014} {"train_loss": -42.06673812866211, "global_step": 243799, "epoch": 2014} {"train_loss": -42.29545974731445, "global_step": 243800, "epoch": 2014} {"train_loss": -41.903724670410156, "global_step": 243801, "epoch": 2014} {"train_loss": -42.254119873046875, "global_step": 243802, "epoch": 2014} {"train_loss": -42.382179260253906, "global_step": 243803, "epoch": 2014} {"train_loss": -42.55512237548828, "global_step": 243804, "epoch": 2014} {"train_loss": -42.498138427734375, "global_step": 243805, "epoch": 2014} {"train_loss": -42.444129943847656, "global_step": 243806, "epoch": 2014} {"train_loss": -42.5662727355957, "global_step": 243807, "epoch": 2014} {"train_loss": -42.357845306396484, "global_step": 243808, "epoch": 2014} {"train_loss": -41.28957748413086, "global_step": 243809, "epoch": 2014} {"train_loss": -42.53849411010742, "global_step": 243810, "epoch": 2014} {"train_loss": -42.257171630859375, "global_step": 243811, "epoch": 2014} {"train_loss": -42.91361618041992, "global_step": 243812, "epoch": 2014} {"train_loss": -42.746925354003906, "global_step": 243813, "epoch": 2014} {"train_loss": -41.72113818964682, "global_step": 243814, "epoch": 2014, "val_loss": 2554971.75} {"train_loss": -43.263423919677734, "global_step": 243815, "epoch": 2015} {"train_loss": -42.91009521484375, "global_step": 243816, "epoch": 2015} {"train_loss": -42.0798225402832, "global_step": 243817, "epoch": 2015} {"train_loss": -42.0560417175293, "global_step": 243818, "epoch": 2015} {"train_loss": -41.153072357177734, "global_step": 243819, "epoch": 2015} {"train_loss": -41.622188568115234, "global_step": 243820, "epoch": 2015} {"train_loss": -41.1993293762207, "global_step": 243821, "epoch": 2015} {"train_loss": -41.5127067565918, "global_step": 243822, "epoch": 2015} {"train_loss": -42.233741760253906, "global_step": 243823, "epoch": 2015} {"train_loss": -42.0017204284668, "global_step": 243824, "epoch": 2015} {"train_loss": -42.517208099365234, "global_step": 243825, "epoch": 2015} {"train_loss": -41.84134292602539, "global_step": 243826, "epoch": 2015} {"train_loss": -41.48789596557617, "global_step": 243827, "epoch": 2015} {"train_loss": -42.37457275390625, "global_step": 243828, "epoch": 2015} {"train_loss": -40.78666305541992, "global_step": 243829, "epoch": 2015} {"train_loss": -42.676795959472656, "global_step": 243830, "epoch": 2015} {"train_loss": -40.39918899536133, "global_step": 243831, "epoch": 2015} {"train_loss": -40.49161911010742, "global_step": 243832, "epoch": 2015} {"train_loss": -39.0482177734375, "global_step": 243833, "epoch": 2015} {"train_loss": -41.4307975769043, "global_step": 243834, "epoch": 2015} {"train_loss": -40.63493728637695, "global_step": 243835, "epoch": 2015} {"train_loss": -40.4602165222168, "global_step": 243836, "epoch": 2015} {"train_loss": -42.261451721191406, "global_step": 243837, "epoch": 2015} {"train_loss": -42.42616653442383, "global_step": 243838, "epoch": 2015} {"train_loss": -42.046810150146484, "global_step": 243839, "epoch": 2015} {"train_loss": -40.73781967163086, "global_step": 243840, "epoch": 2015} {"train_loss": -41.049190521240234, "global_step": 243841, "epoch": 2015} {"train_loss": -39.31914138793945, "global_step": 243842, "epoch": 2015} {"train_loss": -39.88475036621094, "global_step": 243843, "epoch": 2015} {"train_loss": -36.129295349121094, "global_step": 243844, "epoch": 2015} {"train_loss": -41.479488372802734, "global_step": 243845, "epoch": 2015} {"train_loss": -38.75704574584961, "global_step": 243846, "epoch": 2015} {"train_loss": -39.76554489135742, "global_step": 243847, "epoch": 2015} {"train_loss": -39.55349349975586, "global_step": 243848, "epoch": 2015} {"train_loss": -40.84957504272461, "global_step": 243849, "epoch": 2015} {"train_loss": -38.55631637573242, "global_step": 243850, "epoch": 2015} {"train_loss": -40.69343948364258, "global_step": 243851, "epoch": 2015} {"train_loss": -40.50141525268555, "global_step": 243852, "epoch": 2015} {"train_loss": -38.950439453125, "global_step": 243853, "epoch": 2015} {"train_loss": -39.601593017578125, "global_step": 243854, "epoch": 2015} {"train_loss": -41.030921936035156, "global_step": 243855, "epoch": 2015} {"train_loss": -40.46311569213867, "global_step": 243856, "epoch": 2015} {"train_loss": -42.1079216003418, "global_step": 243857, "epoch": 2015} {"train_loss": -39.514503479003906, "global_step": 243858, "epoch": 2015} {"train_loss": -40.69692611694336, "global_step": 243859, "epoch": 2015} {"train_loss": -41.1638298034668, "global_step": 243860, "epoch": 2015} {"train_loss": -38.165931701660156, "global_step": 243861, "epoch": 2015} {"train_loss": -41.3060302734375, "global_step": 243862, "epoch": 2015} {"train_loss": -39.3228874206543, "global_step": 243863, "epoch": 2015} {"train_loss": -42.30030059814453, "global_step": 243864, "epoch": 2015} {"train_loss": -39.579803466796875, "global_step": 243865, "epoch": 2015} {"train_loss": -42.1099853515625, "global_step": 243866, "epoch": 2015} {"train_loss": -41.3281364440918, "global_step": 243867, "epoch": 2015} {"train_loss": -40.46352767944336, "global_step": 243868, "epoch": 2015} {"train_loss": -41.219417572021484, "global_step": 243869, "epoch": 2015} {"train_loss": -40.6898307800293, "global_step": 243870, "epoch": 2015} {"train_loss": -41.38694381713867, "global_step": 243871, "epoch": 2015} {"train_loss": -41.21077346801758, "global_step": 243872, "epoch": 2015} {"train_loss": -40.43600082397461, "global_step": 243873, "epoch": 2015} {"train_loss": -40.74139404296875, "global_step": 243874, "epoch": 2015} {"train_loss": -42.20600891113281, "global_step": 243875, "epoch": 2015} {"train_loss": -41.3261833190918, "global_step": 243876, "epoch": 2015} {"train_loss": -41.67435836791992, "global_step": 243877, "epoch": 2015} {"train_loss": -41.96725082397461, "global_step": 243878, "epoch": 2015} {"train_loss": -42.012474060058594, "global_step": 243879, "epoch": 2015} {"train_loss": -41.5465087890625, "global_step": 243880, "epoch": 2015} {"train_loss": -42.10938262939453, "global_step": 243881, "epoch": 2015} {"train_loss": -42.01583480834961, "global_step": 243882, "epoch": 2015} {"train_loss": -41.93825149536133, "global_step": 243883, "epoch": 2015} {"train_loss": -41.83956527709961, "global_step": 243884, "epoch": 2015} {"train_loss": -41.881465911865234, "global_step": 243885, "epoch": 2015} {"train_loss": -41.628150939941406, "global_step": 243886, "epoch": 2015} {"train_loss": -41.40128707885742, "global_step": 243887, "epoch": 2015} {"train_loss": -41.88764190673828, "global_step": 243888, "epoch": 2015} {"train_loss": -41.85100555419922, "global_step": 243889, "epoch": 2015} {"train_loss": -41.76935577392578, "global_step": 243890, "epoch": 2015} {"train_loss": -42.33836364746094, "global_step": 243891, "epoch": 2015} {"train_loss": -41.72519302368164, "global_step": 243892, "epoch": 2015} {"train_loss": -41.74103546142578, "global_step": 243893, "epoch": 2015} {"train_loss": -42.62852096557617, "global_step": 243894, "epoch": 2015} {"train_loss": -40.915462493896484, "global_step": 243895, "epoch": 2015} {"train_loss": -39.82757568359375, "global_step": 243896, "epoch": 2015} {"train_loss": -42.20479202270508, "global_step": 243897, "epoch": 2015} {"train_loss": -42.188270568847656, "global_step": 243898, "epoch": 2015} {"train_loss": -40.965572357177734, "global_step": 243899, "epoch": 2015} {"train_loss": -42.63365173339844, "global_step": 243900, "epoch": 2015} {"train_loss": -41.562652587890625, "global_step": 243901, "epoch": 2015} {"train_loss": -40.692012786865234, "global_step": 243902, "epoch": 2015} {"train_loss": -41.83477783203125, "global_step": 243903, "epoch": 2015} {"train_loss": -41.65635299682617, "global_step": 243904, "epoch": 2015} {"train_loss": -41.645835876464844, "global_step": 243905, "epoch": 2015} {"train_loss": -42.32109451293945, "global_step": 243906, "epoch": 2015} {"train_loss": -42.327396392822266, "global_step": 243907, "epoch": 2015} {"train_loss": -41.68461990356445, "global_step": 243908, "epoch": 2015} {"train_loss": -42.08125686645508, "global_step": 243909, "epoch": 2015} {"train_loss": -41.979679107666016, "global_step": 243910, "epoch": 2015} {"train_loss": -41.116973876953125, "global_step": 243911, "epoch": 2015} {"train_loss": -41.927894592285156, "global_step": 243912, "epoch": 2015} {"train_loss": -42.281837463378906, "global_step": 243913, "epoch": 2015} {"train_loss": -42.556251525878906, "global_step": 243914, "epoch": 2015} {"train_loss": -42.664146423339844, "global_step": 243915, "epoch": 2015} {"train_loss": -42.605323791503906, "global_step": 243916, "epoch": 2015} {"train_loss": -41.342987060546875, "global_step": 243917, "epoch": 2015} {"train_loss": -41.20973587036133, "global_step": 243918, "epoch": 2015} {"train_loss": -42.87093734741211, "global_step": 243919, "epoch": 2015} {"train_loss": -42.175384521484375, "global_step": 243920, "epoch": 2015} {"train_loss": -42.3966064453125, "global_step": 243921, "epoch": 2015} {"train_loss": -42.8188362121582, "global_step": 243922, "epoch": 2015} {"train_loss": -42.62749481201172, "global_step": 243923, "epoch": 2015} {"train_loss": -42.55948257446289, "global_step": 243924, "epoch": 2015} {"train_loss": -42.37936782836914, "global_step": 243925, "epoch": 2015} {"train_loss": -42.750301361083984, "global_step": 243926, "epoch": 2015} {"train_loss": -43.0323371887207, "global_step": 243927, "epoch": 2015} {"train_loss": -43.061012268066406, "global_step": 243928, "epoch": 2015} {"train_loss": -42.576141357421875, "global_step": 243929, "epoch": 2015} {"train_loss": -42.959930419921875, "global_step": 243930, "epoch": 2015} {"train_loss": -34.938289642333984, "global_step": 243931, "epoch": 2015} {"train_loss": -42.72699737548828, "global_step": 243932, "epoch": 2015} {"train_loss": -42.328895568847656, "global_step": 243933, "epoch": 2015} {"train_loss": -42.11174392700195, "global_step": 243934, "epoch": 2015} {"train_loss": -41.38940587319618, "global_step": 243935, "epoch": 2015, "val_loss": 2580879.0} {"train_loss": -42.140174865722656, "global_step": 243936, "epoch": 2016} {"train_loss": -42.563232421875, "global_step": 243937, "epoch": 2016} {"train_loss": -42.71259307861328, "global_step": 243938, "epoch": 2016} {"train_loss": -41.763484954833984, "global_step": 243939, "epoch": 2016} {"train_loss": -41.57770919799805, "global_step": 243940, "epoch": 2016} {"train_loss": -42.85392379760742, "global_step": 243941, "epoch": 2016} {"train_loss": -42.5576171875, "global_step": 243942, "epoch": 2016} {"train_loss": -42.72422409057617, "global_step": 243943, "epoch": 2016} {"train_loss": -41.732337951660156, "global_step": 243944, "epoch": 2016} {"train_loss": -39.88381576538086, "global_step": 243945, "epoch": 2016} {"train_loss": -38.36611557006836, "global_step": 243946, "epoch": 2016} {"train_loss": -38.91646957397461, "global_step": 243947, "epoch": 2016} {"train_loss": -38.86245346069336, "global_step": 243948, "epoch": 2016} {"train_loss": -38.24612045288086, "global_step": 243949, "epoch": 2016} {"train_loss": -42.802513122558594, "global_step": 243950, "epoch": 2016} {"train_loss": -41.48949432373047, "global_step": 243951, "epoch": 2016} {"train_loss": -34.338626861572266, "global_step": 243952, "epoch": 2016} {"train_loss": -30.786123275756836, "global_step": 243953, "epoch": 2016} {"train_loss": -40.585968017578125, "global_step": 243954, "epoch": 2016} {"train_loss": -40.0822639465332, "global_step": 243955, "epoch": 2016} {"train_loss": -37.377681732177734, "global_step": 243956, "epoch": 2016} {"train_loss": -40.165122985839844, "global_step": 243957, "epoch": 2016} {"train_loss": -39.980106353759766, "global_step": 243958, "epoch": 2016} {"train_loss": -39.151763916015625, "global_step": 243959, "epoch": 2016} {"train_loss": -40.74055862426758, "global_step": 243960, "epoch": 2016} {"train_loss": -40.447265625, "global_step": 243961, "epoch": 2016} {"train_loss": -39.5823974609375, "global_step": 243962, "epoch": 2016} {"train_loss": -41.870487213134766, "global_step": 243963, "epoch": 2016} {"train_loss": -39.666290283203125, "global_step": 243964, "epoch": 2016} {"train_loss": -41.70187759399414, "global_step": 243965, "epoch": 2016} {"train_loss": -41.34788131713867, "global_step": 243966, "epoch": 2016} {"train_loss": -39.491424560546875, "global_step": 243967, "epoch": 2016} {"train_loss": -40.961238861083984, "global_step": 243968, "epoch": 2016} {"train_loss": -39.62545394897461, "global_step": 243969, "epoch": 2016} {"train_loss": -35.4090461730957, "global_step": 243970, "epoch": 2016} {"train_loss": -38.74311065673828, "global_step": 243971, "epoch": 2016} {"train_loss": -31.066953659057617, "global_step": 243972, "epoch": 2016} {"train_loss": -41.10969161987305, "global_step": 243973, "epoch": 2016} {"train_loss": -40.54606246948242, "global_step": 243974, "epoch": 2016} {"train_loss": -39.169551849365234, "global_step": 243975, "epoch": 2016} {"train_loss": -39.0972900390625, "global_step": 243976, "epoch": 2016} {"train_loss": -39.61288070678711, "global_step": 243977, "epoch": 2016} {"train_loss": -40.00481033325195, "global_step": 243978, "epoch": 2016} {"train_loss": -40.9613151550293, "global_step": 243979, "epoch": 2016} {"train_loss": -39.96533966064453, "global_step": 243980, "epoch": 2016} {"train_loss": -41.50800704956055, "global_step": 243981, "epoch": 2016} {"train_loss": -41.2907600402832, "global_step": 243982, "epoch": 2016} {"train_loss": -40.27486038208008, "global_step": 243983, "epoch": 2016} {"train_loss": -40.06658935546875, "global_step": 243984, "epoch": 2016} {"train_loss": -39.26873779296875, "global_step": 243985, "epoch": 2016} {"train_loss": -26.14114761352539, "global_step": 243986, "epoch": 2016} {"train_loss": -41.66665267944336, "global_step": 243987, "epoch": 2016} {"train_loss": -39.63569641113281, "global_step": 243988, "epoch": 2016} {"train_loss": -37.75094223022461, "global_step": 243989, "epoch": 2016} {"train_loss": -36.48794174194336, "global_step": 243990, "epoch": 2016} {"train_loss": -40.27848434448242, "global_step": 243991, "epoch": 2016} {"train_loss": -39.6485481262207, "global_step": 243992, "epoch": 2016} {"train_loss": -37.601924896240234, "global_step": 243993, "epoch": 2016} {"train_loss": -39.117919921875, "global_step": 243994, "epoch": 2016} {"train_loss": -41.39701461791992, "global_step": 243995, "epoch": 2016} {"train_loss": -31.740768432617188, "global_step": 243996, "epoch": 2016} {"train_loss": -39.35160446166992, "global_step": 243997, "epoch": 2016} {"train_loss": -40.530433654785156, "global_step": 243998, "epoch": 2016} {"train_loss": -40.458473205566406, "global_step": 243999, "epoch": 2016} {"train_loss": -39.88827133178711, "global_step": 244000, "epoch": 2016} {"train_loss": -41.47549057006836, "global_step": 244001, "epoch": 2016} {"train_loss": -40.90361785888672, "global_step": 244002, "epoch": 2016} {"train_loss": -40.592769622802734, "global_step": 244003, "epoch": 2016} {"train_loss": -36.642791748046875, "global_step": 244004, "epoch": 2016} {"train_loss": -39.8870735168457, "global_step": 244005, "epoch": 2016} {"train_loss": -39.91044998168945, "global_step": 244006, "epoch": 2016} {"train_loss": -40.4634895324707, "global_step": 244007, "epoch": 2016} {"train_loss": -36.553340911865234, "global_step": 244008, "epoch": 2016} {"train_loss": -40.9574089050293, "global_step": 244009, "epoch": 2016} {"train_loss": -39.6923942565918, "global_step": 244010, "epoch": 2016} {"train_loss": -40.218379974365234, "global_step": 244011, "epoch": 2016} {"train_loss": -41.265228271484375, "global_step": 244012, "epoch": 2016} {"train_loss": -41.11422348022461, "global_step": 244013, "epoch": 2016} {"train_loss": -40.7585563659668, "global_step": 244014, "epoch": 2016} {"train_loss": -39.97531509399414, "global_step": 244015, "epoch": 2016} {"train_loss": -41.32407760620117, "global_step": 244016, "epoch": 2016} {"train_loss": -41.04352951049805, "global_step": 244017, "epoch": 2016} {"train_loss": -40.95664978027344, "global_step": 244018, "epoch": 2016} {"train_loss": -40.99272155761719, "global_step": 244019, "epoch": 2016} {"train_loss": -39.9609260559082, "global_step": 244020, "epoch": 2016} {"train_loss": -40.56712341308594, "global_step": 244021, "epoch": 2016} {"train_loss": -41.292274475097656, "global_step": 244022, "epoch": 2016} {"train_loss": -41.51721954345703, "global_step": 244023, "epoch": 2016} {"train_loss": -40.42045211791992, "global_step": 244024, "epoch": 2016} {"train_loss": -41.10798263549805, "global_step": 244025, "epoch": 2016} {"train_loss": -41.197174072265625, "global_step": 244026, "epoch": 2016} {"train_loss": -39.37826156616211, "global_step": 244027, "epoch": 2016} {"train_loss": -41.74090576171875, "global_step": 244028, "epoch": 2016} {"train_loss": -40.14723587036133, "global_step": 244029, "epoch": 2016} {"train_loss": -41.164222717285156, "global_step": 244030, "epoch": 2016} {"train_loss": -40.72869873046875, "global_step": 244031, "epoch": 2016} {"train_loss": -41.49024963378906, "global_step": 244032, "epoch": 2016} {"train_loss": -40.786434173583984, "global_step": 244033, "epoch": 2016} {"train_loss": -41.40718078613281, "global_step": 244034, "epoch": 2016} {"train_loss": -41.92924880981445, "global_step": 244035, "epoch": 2016} {"train_loss": -40.9398193359375, "global_step": 244036, "epoch": 2016} {"train_loss": -41.725921630859375, "global_step": 244037, "epoch": 2016} {"train_loss": -41.43374252319336, "global_step": 244038, "epoch": 2016} {"train_loss": -41.24176788330078, "global_step": 244039, "epoch": 2016} {"train_loss": -41.81764602661133, "global_step": 244040, "epoch": 2016} {"train_loss": -40.40714645385742, "global_step": 244041, "epoch": 2016} {"train_loss": -42.267486572265625, "global_step": 244042, "epoch": 2016} {"train_loss": -41.75756072998047, "global_step": 244043, "epoch": 2016} {"train_loss": -41.75799560546875, "global_step": 244044, "epoch": 2016} {"train_loss": -42.07673263549805, "global_step": 244045, "epoch": 2016} {"train_loss": -41.55551528930664, "global_step": 244046, "epoch": 2016} {"train_loss": -41.80988693237305, "global_step": 244047, "epoch": 2016} {"train_loss": -40.79854202270508, "global_step": 244048, "epoch": 2016} {"train_loss": -41.137969970703125, "global_step": 244049, "epoch": 2016} {"train_loss": -41.01939010620117, "global_step": 244050, "epoch": 2016} {"train_loss": -42.087825775146484, "global_step": 244051, "epoch": 2016} {"train_loss": -42.369667053222656, "global_step": 244052, "epoch": 2016} {"train_loss": -41.64925765991211, "global_step": 244053, "epoch": 2016} {"train_loss": -42.45960235595703, "global_step": 244054, "epoch": 2016} {"train_loss": -42.51244354248047, "global_step": 244055, "epoch": 2016} {"train_loss": -40.17932176195885, "global_step": 244056, "epoch": 2016, "val_loss": 2596275.0} {"train_loss": -42.40174865722656, "global_step": 244057, "epoch": 2017} {"train_loss": -42.68679428100586, "global_step": 244058, "epoch": 2017} {"train_loss": -42.979366302490234, "global_step": 244059, "epoch": 2017} {"train_loss": -41.589778900146484, "global_step": 244060, "epoch": 2017} {"train_loss": -42.60859298706055, "global_step": 244061, "epoch": 2017} {"train_loss": -41.84343719482422, "global_step": 244062, "epoch": 2017} {"train_loss": -41.924373626708984, "global_step": 244063, "epoch": 2017} {"train_loss": -41.77760696411133, "global_step": 244064, "epoch": 2017} {"train_loss": -42.750205993652344, "global_step": 244065, "epoch": 2017} {"train_loss": -42.96795654296875, "global_step": 244066, "epoch": 2017} {"train_loss": -42.63458251953125, "global_step": 244067, "epoch": 2017} {"train_loss": -42.80203628540039, "global_step": 244068, "epoch": 2017} {"train_loss": -42.30295944213867, "global_step": 244069, "epoch": 2017} {"train_loss": -41.840389251708984, "global_step": 244070, "epoch": 2017} {"train_loss": -42.72346878051758, "global_step": 244071, "epoch": 2017} {"train_loss": -41.94973373413086, "global_step": 244072, "epoch": 2017} {"train_loss": -42.571163177490234, "global_step": 244073, "epoch": 2017} {"train_loss": -42.89556884765625, "global_step": 244074, "epoch": 2017} {"train_loss": -42.69686508178711, "global_step": 244075, "epoch": 2017} {"train_loss": -42.14068603515625, "global_step": 244076, "epoch": 2017} {"train_loss": -41.32037353515625, "global_step": 244077, "epoch": 2017} {"train_loss": -41.334197998046875, "global_step": 244078, "epoch": 2017} {"train_loss": -42.54826736450195, "global_step": 244079, "epoch": 2017} {"train_loss": -42.33575439453125, "global_step": 244080, "epoch": 2017} {"train_loss": -43.12067413330078, "global_step": 244081, "epoch": 2017} {"train_loss": -42.306148529052734, "global_step": 244082, "epoch": 2017} {"train_loss": -41.50354766845703, "global_step": 244083, "epoch": 2017} {"train_loss": -42.2108039855957, "global_step": 244084, "epoch": 2017} {"train_loss": -41.445709228515625, "global_step": 244085, "epoch": 2017} {"train_loss": -42.812652587890625, "global_step": 244086, "epoch": 2017} {"train_loss": -41.99049758911133, "global_step": 244087, "epoch": 2017} {"train_loss": -42.5831184387207, "global_step": 244088, "epoch": 2017} {"train_loss": -43.2072639465332, "global_step": 244089, "epoch": 2017} {"train_loss": -42.68354797363281, "global_step": 244090, "epoch": 2017} {"train_loss": -43.07307052612305, "global_step": 244091, "epoch": 2017} {"train_loss": -41.81155014038086, "global_step": 244092, "epoch": 2017} {"train_loss": -42.87471008300781, "global_step": 244093, "epoch": 2017} {"train_loss": -43.113460540771484, "global_step": 244094, "epoch": 2017} {"train_loss": -41.0566291809082, "global_step": 244095, "epoch": 2017} {"train_loss": -42.195003509521484, "global_step": 244096, "epoch": 2017} {"train_loss": -42.954010009765625, "global_step": 244097, "epoch": 2017} {"train_loss": -42.77903366088867, "global_step": 244098, "epoch": 2017} {"train_loss": -43.034725189208984, "global_step": 244099, "epoch": 2017} {"train_loss": -41.74942398071289, "global_step": 244100, "epoch": 2017} {"train_loss": -43.00484848022461, "global_step": 244101, "epoch": 2017} {"train_loss": -42.6075553894043, "global_step": 244102, "epoch": 2017} {"train_loss": -42.49598693847656, "global_step": 244103, "epoch": 2017} {"train_loss": -42.18611526489258, "global_step": 244104, "epoch": 2017} {"train_loss": -41.19150924682617, "global_step": 244105, "epoch": 2017} {"train_loss": -43.32953643798828, "global_step": 244106, "epoch": 2017} {"train_loss": -41.84846496582031, "global_step": 244107, "epoch": 2017} {"train_loss": -35.72746658325195, "global_step": 244108, "epoch": 2017} {"train_loss": -41.73929977416992, "global_step": 244109, "epoch": 2017} {"train_loss": -38.89973068237305, "global_step": 244110, "epoch": 2017} {"train_loss": -36.687049865722656, "global_step": 244111, "epoch": 2017} {"train_loss": -38.448036193847656, "global_step": 244112, "epoch": 2017} {"train_loss": -41.95917510986328, "global_step": 244113, "epoch": 2017} {"train_loss": -38.05994415283203, "global_step": 244114, "epoch": 2017} {"train_loss": -32.61173629760742, "global_step": 244115, "epoch": 2017} {"train_loss": -39.75505447387695, "global_step": 244116, "epoch": 2017} {"train_loss": -39.789833068847656, "global_step": 244117, "epoch": 2017} {"train_loss": -39.60301208496094, "global_step": 244118, "epoch": 2017} {"train_loss": -40.66274642944336, "global_step": 244119, "epoch": 2017} {"train_loss": -40.769615173339844, "global_step": 244120, "epoch": 2017} {"train_loss": -37.26766586303711, "global_step": 244121, "epoch": 2017} {"train_loss": -35.7689094543457, "global_step": 244122, "epoch": 2017} {"train_loss": -39.28525161743164, "global_step": 244123, "epoch": 2017} {"train_loss": -38.50075149536133, "global_step": 244124, "epoch": 2017} {"train_loss": -37.9428825378418, "global_step": 244125, "epoch": 2017} {"train_loss": -38.06697082519531, "global_step": 244126, "epoch": 2017} {"train_loss": -40.56365966796875, "global_step": 244127, "epoch": 2017} {"train_loss": -36.487464904785156, "global_step": 244128, "epoch": 2017} {"train_loss": -33.600826263427734, "global_step": 244129, "epoch": 2017} {"train_loss": -37.167572021484375, "global_step": 244130, "epoch": 2017} {"train_loss": -36.15261459350586, "global_step": 244131, "epoch": 2017} {"train_loss": -32.6409797668457, "global_step": 244132, "epoch": 2017} {"train_loss": -39.84782791137695, "global_step": 244133, "epoch": 2017} {"train_loss": -36.63715744018555, "global_step": 244134, "epoch": 2017} {"train_loss": -38.358985900878906, "global_step": 244135, "epoch": 2017} {"train_loss": -38.595516204833984, "global_step": 244136, "epoch": 2017} {"train_loss": -39.22029495239258, "global_step": 244137, "epoch": 2017} {"train_loss": -39.24615478515625, "global_step": 244138, "epoch": 2017} {"train_loss": -40.08354568481445, "global_step": 244139, "epoch": 2017} {"train_loss": -38.91170883178711, "global_step": 244140, "epoch": 2017} {"train_loss": -37.69126510620117, "global_step": 244141, "epoch": 2017} {"train_loss": -38.24492645263672, "global_step": 244142, "epoch": 2017} {"train_loss": -40.827362060546875, "global_step": 244143, "epoch": 2017} {"train_loss": -37.09270095825195, "global_step": 244144, "epoch": 2017} {"train_loss": -39.763118743896484, "global_step": 244145, "epoch": 2017} {"train_loss": -39.12775421142578, "global_step": 244146, "epoch": 2017} {"train_loss": -39.7583122253418, "global_step": 244147, "epoch": 2017} {"train_loss": -38.09711837768555, "global_step": 244148, "epoch": 2017} {"train_loss": -39.54836654663086, "global_step": 244149, "epoch": 2017} {"train_loss": -39.17813491821289, "global_step": 244150, "epoch": 2017} {"train_loss": -40.41615295410156, "global_step": 244151, "epoch": 2017} {"train_loss": -40.5098991394043, "global_step": 244152, "epoch": 2017} {"train_loss": -41.10960006713867, "global_step": 244153, "epoch": 2017} {"train_loss": -40.72732925415039, "global_step": 244154, "epoch": 2017} {"train_loss": -39.57106018066406, "global_step": 244155, "epoch": 2017} {"train_loss": -41.05305099487305, "global_step": 244156, "epoch": 2017} {"train_loss": -39.624568939208984, "global_step": 244157, "epoch": 2017} {"train_loss": -40.4547004699707, "global_step": 244158, "epoch": 2017} {"train_loss": -40.618839263916016, "global_step": 244159, "epoch": 2017} {"train_loss": -40.23130416870117, "global_step": 244160, "epoch": 2017} {"train_loss": -41.38629150390625, "global_step": 244161, "epoch": 2017} {"train_loss": -40.00362014770508, "global_step": 244162, "epoch": 2017} {"train_loss": -40.649349212646484, "global_step": 244163, "epoch": 2017} {"train_loss": -40.868953704833984, "global_step": 244164, "epoch": 2017} {"train_loss": -39.94818878173828, "global_step": 244165, "epoch": 2017} {"train_loss": -40.8466796875, "global_step": 244166, "epoch": 2017} {"train_loss": -41.230743408203125, "global_step": 244167, "epoch": 2017} {"train_loss": -39.72976303100586, "global_step": 244168, "epoch": 2017} {"train_loss": -40.8473014831543, "global_step": 244169, "epoch": 2017} {"train_loss": -40.639469146728516, "global_step": 244170, "epoch": 2017} {"train_loss": -41.48830795288086, "global_step": 244171, "epoch": 2017} {"train_loss": -41.24052047729492, "global_step": 244172, "epoch": 2017} {"train_loss": -41.72760009765625, "global_step": 244173, "epoch": 2017} {"train_loss": -40.58708572387695, "global_step": 244174, "epoch": 2017} {"train_loss": -41.19854736328125, "global_step": 244175, "epoch": 2017} {"train_loss": -41.68537521362305, "global_step": 244176, "epoch": 2017} {"train_loss": -40.57047615366534, "global_step": 244177, "epoch": 2017, "val_loss": 2597939.25} {"train_loss": -41.98097229003906, "global_step": 244178, "epoch": 2018} {"train_loss": -40.87101364135742, "global_step": 244179, "epoch": 2018} {"train_loss": -41.813720703125, "global_step": 244180, "epoch": 2018} {"train_loss": -41.89735794067383, "global_step": 244181, "epoch": 2018} {"train_loss": -41.866004943847656, "global_step": 244182, "epoch": 2018} {"train_loss": -42.1257438659668, "global_step": 244183, "epoch": 2018} {"train_loss": -42.06588363647461, "global_step": 244184, "epoch": 2018} {"train_loss": -41.91086196899414, "global_step": 244185, "epoch": 2018} {"train_loss": -42.32167434692383, "global_step": 244186, "epoch": 2018} {"train_loss": -42.00997543334961, "global_step": 244187, "epoch": 2018} {"train_loss": -41.257389068603516, "global_step": 244188, "epoch": 2018} {"train_loss": -42.65458297729492, "global_step": 244189, "epoch": 2018} {"train_loss": -42.01914596557617, "global_step": 244190, "epoch": 2018} {"train_loss": -41.66160202026367, "global_step": 244191, "epoch": 2018} {"train_loss": -41.80033493041992, "global_step": 244192, "epoch": 2018} {"train_loss": -42.11055374145508, "global_step": 244193, "epoch": 2018} {"train_loss": -42.55884552001953, "global_step": 244194, "epoch": 2018} {"train_loss": -42.43310546875, "global_step": 244195, "epoch": 2018} {"train_loss": -42.65873336791992, "global_step": 244196, "epoch": 2018} {"train_loss": -42.52921676635742, "global_step": 244197, "epoch": 2018} {"train_loss": -41.62007141113281, "global_step": 244198, "epoch": 2018} {"train_loss": -42.36427307128906, "global_step": 244199, "epoch": 2018} {"train_loss": -42.55929183959961, "global_step": 244200, "epoch": 2018} {"train_loss": -42.59767532348633, "global_step": 244201, "epoch": 2018} {"train_loss": -40.72356033325195, "global_step": 244202, "epoch": 2018} {"train_loss": -41.442935943603516, "global_step": 244203, "epoch": 2018} {"train_loss": -42.389984130859375, "global_step": 244204, "epoch": 2018} {"train_loss": -42.58769607543945, "global_step": 244205, "epoch": 2018} {"train_loss": -42.212310791015625, "global_step": 244206, "epoch": 2018} {"train_loss": -42.09259033203125, "global_step": 244207, "epoch": 2018} {"train_loss": -42.64583969116211, "global_step": 244208, "epoch": 2018} {"train_loss": -42.841705322265625, "global_step": 244209, "epoch": 2018} {"train_loss": -42.14125061035156, "global_step": 244210, "epoch": 2018} {"train_loss": -42.88918685913086, "global_step": 244211, "epoch": 2018} {"train_loss": -42.8752326965332, "global_step": 244212, "epoch": 2018} {"train_loss": -42.88513946533203, "global_step": 244213, "epoch": 2018} {"train_loss": -42.72361755371094, "global_step": 244214, "epoch": 2018} {"train_loss": -43.14485168457031, "global_step": 244215, "epoch": 2018} {"train_loss": -43.083831787109375, "global_step": 244216, "epoch": 2018} {"train_loss": -42.50027084350586, "global_step": 244217, "epoch": 2018} {"train_loss": -42.71041488647461, "global_step": 244218, "epoch": 2018} {"train_loss": -43.154659271240234, "global_step": 244219, "epoch": 2018} {"train_loss": -43.374568939208984, "global_step": 244220, "epoch": 2018} {"train_loss": -43.22454833984375, "global_step": 244221, "epoch": 2018} {"train_loss": -43.22874069213867, "global_step": 244222, "epoch": 2018} {"train_loss": -43.20022201538086, "global_step": 244223, "epoch": 2018} {"train_loss": -43.01776885986328, "global_step": 244224, "epoch": 2018} {"train_loss": -42.5750846862793, "global_step": 244225, "epoch": 2018} {"train_loss": -43.035762786865234, "global_step": 244226, "epoch": 2018} {"train_loss": -43.16868591308594, "global_step": 244227, "epoch": 2018} {"train_loss": -42.77173614501953, "global_step": 244228, "epoch": 2018} {"train_loss": -43.36408233642578, "global_step": 244229, "epoch": 2018} {"train_loss": -43.33244705200195, "global_step": 244230, "epoch": 2018} {"train_loss": -43.051239013671875, "global_step": 244231, "epoch": 2018} {"train_loss": -43.22218322753906, "global_step": 244232, "epoch": 2018} {"train_loss": -43.042755126953125, "global_step": 244233, "epoch": 2018} {"train_loss": -40.708335876464844, "global_step": 244234, "epoch": 2018} {"train_loss": -41.9826774597168, "global_step": 244235, "epoch": 2018} {"train_loss": -43.19015121459961, "global_step": 244236, "epoch": 2018} {"train_loss": -42.294734954833984, "global_step": 244237, "epoch": 2018} {"train_loss": -42.882041931152344, "global_step": 244238, "epoch": 2018} {"train_loss": -42.718624114990234, "global_step": 244239, "epoch": 2018} {"train_loss": -42.860591888427734, "global_step": 244240, "epoch": 2018} {"train_loss": -43.26027297973633, "global_step": 244241, "epoch": 2018} {"train_loss": -43.18233871459961, "global_step": 244242, "epoch": 2018} {"train_loss": -42.72279357910156, "global_step": 244243, "epoch": 2018} {"train_loss": -43.2501335144043, "global_step": 244244, "epoch": 2018} {"train_loss": -42.383949279785156, "global_step": 244245, "epoch": 2018} {"train_loss": -42.32926559448242, "global_step": 244246, "epoch": 2018} {"train_loss": -42.44794845581055, "global_step": 244247, "epoch": 2018} {"train_loss": -42.06424331665039, "global_step": 244248, "epoch": 2018} {"train_loss": -41.241634368896484, "global_step": 244249, "epoch": 2018} {"train_loss": -41.59010314941406, "global_step": 244250, "epoch": 2018} {"train_loss": -41.351619720458984, "global_step": 244251, "epoch": 2018} {"train_loss": -38.926856994628906, "global_step": 244252, "epoch": 2018} {"train_loss": -42.04193115234375, "global_step": 244253, "epoch": 2018} {"train_loss": -42.75112533569336, "global_step": 244254, "epoch": 2018} {"train_loss": -42.25836944580078, "global_step": 244255, "epoch": 2018} {"train_loss": -41.5888557434082, "global_step": 244256, "epoch": 2018} {"train_loss": -42.388118743896484, "global_step": 244257, "epoch": 2018} {"train_loss": -40.74042892456055, "global_step": 244258, "epoch": 2018} {"train_loss": -41.51130294799805, "global_step": 244259, "epoch": 2018} {"train_loss": -42.2020263671875, "global_step": 244260, "epoch": 2018} {"train_loss": -41.950679779052734, "global_step": 244261, "epoch": 2018} {"train_loss": -42.02047348022461, "global_step": 244262, "epoch": 2018} {"train_loss": -42.13179397583008, "global_step": 244263, "epoch": 2018} {"train_loss": -41.61212158203125, "global_step": 244264, "epoch": 2018} {"train_loss": -42.347835540771484, "global_step": 244265, "epoch": 2018} {"train_loss": -42.46947479248047, "global_step": 244266, "epoch": 2018} {"train_loss": -42.14994430541992, "global_step": 244267, "epoch": 2018} {"train_loss": -42.485984802246094, "global_step": 244268, "epoch": 2018} {"train_loss": -40.446815490722656, "global_step": 244269, "epoch": 2018} {"train_loss": -42.14466094970703, "global_step": 244270, "epoch": 2018} {"train_loss": -42.58736801147461, "global_step": 244271, "epoch": 2018} {"train_loss": -42.2807731628418, "global_step": 244272, "epoch": 2018} {"train_loss": -41.83492660522461, "global_step": 244273, "epoch": 2018} {"train_loss": -41.720985412597656, "global_step": 244274, "epoch": 2018} {"train_loss": -42.413326263427734, "global_step": 244275, "epoch": 2018} {"train_loss": -42.702266693115234, "global_step": 244276, "epoch": 2018} {"train_loss": -40.889896392822266, "global_step": 244277, "epoch": 2018} {"train_loss": -40.83614730834961, "global_step": 244278, "epoch": 2018} {"train_loss": -41.42325973510742, "global_step": 244279, "epoch": 2018} {"train_loss": -41.07659912109375, "global_step": 244280, "epoch": 2018} {"train_loss": -40.826393127441406, "global_step": 244281, "epoch": 2018} {"train_loss": -42.772857666015625, "global_step": 244282, "epoch": 2018} {"train_loss": -40.4737548828125, "global_step": 244283, "epoch": 2018} {"train_loss": -41.48567581176758, "global_step": 244284, "epoch": 2018} {"train_loss": -41.94361877441406, "global_step": 244285, "epoch": 2018} {"train_loss": -40.706050872802734, "global_step": 244286, "epoch": 2018} {"train_loss": -39.948909759521484, "global_step": 244287, "epoch": 2018} {"train_loss": -39.97267532348633, "global_step": 244288, "epoch": 2018} {"train_loss": -41.98774337768555, "global_step": 244289, "epoch": 2018} {"train_loss": -41.75230026245117, "global_step": 244290, "epoch": 2018} {"train_loss": -39.083282470703125, "global_step": 244291, "epoch": 2018} {"train_loss": -41.00629425048828, "global_step": 244292, "epoch": 2018} {"train_loss": -42.10893630981445, "global_step": 244293, "epoch": 2018} {"train_loss": -40.99483871459961, "global_step": 244294, "epoch": 2018} {"train_loss": -38.55397415161133, "global_step": 244295, "epoch": 2018} {"train_loss": -36.535396575927734, "global_step": 244296, "epoch": 2018} {"train_loss": -38.46869659423828, "global_step": 244297, "epoch": 2018} {"train_loss": -41.995144142592245, "global_step": 244298, "epoch": 2018, "val_loss": 2596309.0} {"train_loss": -40.890907287597656, "global_step": 244299, "epoch": 2019} {"train_loss": -38.44409942626953, "global_step": 244300, "epoch": 2019} {"train_loss": -38.04560089111328, "global_step": 244301, "epoch": 2019} {"train_loss": -41.537410736083984, "global_step": 244302, "epoch": 2019} {"train_loss": -40.32611083984375, "global_step": 244303, "epoch": 2019} {"train_loss": -39.778717041015625, "global_step": 244304, "epoch": 2019} {"train_loss": -38.658050537109375, "global_step": 244305, "epoch": 2019} {"train_loss": -41.53396224975586, "global_step": 244306, "epoch": 2019} {"train_loss": -40.175506591796875, "global_step": 244307, "epoch": 2019} {"train_loss": -40.448646545410156, "global_step": 244308, "epoch": 2019} {"train_loss": -41.40897750854492, "global_step": 244309, "epoch": 2019} {"train_loss": -41.59046173095703, "global_step": 244310, "epoch": 2019} {"train_loss": -41.17952346801758, "global_step": 244311, "epoch": 2019} {"train_loss": -41.90883255004883, "global_step": 244312, "epoch": 2019} {"train_loss": -41.244720458984375, "global_step": 244313, "epoch": 2019} {"train_loss": -40.16827392578125, "global_step": 244314, "epoch": 2019} {"train_loss": -41.272315979003906, "global_step": 244315, "epoch": 2019} {"train_loss": -41.70610046386719, "global_step": 244316, "epoch": 2019} {"train_loss": -39.99644470214844, "global_step": 244317, "epoch": 2019} {"train_loss": -42.16766357421875, "global_step": 244318, "epoch": 2019} {"train_loss": -40.9619026184082, "global_step": 244319, "epoch": 2019} {"train_loss": -42.084564208984375, "global_step": 244320, "epoch": 2019} {"train_loss": -41.10056686401367, "global_step": 244321, "epoch": 2019} {"train_loss": -42.585731506347656, "global_step": 244322, "epoch": 2019} {"train_loss": -42.032955169677734, "global_step": 244323, "epoch": 2019} {"train_loss": -40.87612533569336, "global_step": 244324, "epoch": 2019} {"train_loss": -40.84463119506836, "global_step": 244325, "epoch": 2019} {"train_loss": -40.45416259765625, "global_step": 244326, "epoch": 2019} {"train_loss": -41.577144622802734, "global_step": 244327, "epoch": 2019} {"train_loss": -40.880428314208984, "global_step": 244328, "epoch": 2019} {"train_loss": -41.89571762084961, "global_step": 244329, "epoch": 2019} {"train_loss": -41.34266662597656, "global_step": 244330, "epoch": 2019} {"train_loss": -42.34310531616211, "global_step": 244331, "epoch": 2019} {"train_loss": -41.1336555480957, "global_step": 244332, "epoch": 2019} {"train_loss": -41.21795654296875, "global_step": 244333, "epoch": 2019} {"train_loss": -41.04572296142578, "global_step": 244334, "epoch": 2019} {"train_loss": -41.805625915527344, "global_step": 244335, "epoch": 2019} {"train_loss": -40.36127853393555, "global_step": 244336, "epoch": 2019} {"train_loss": -42.2481575012207, "global_step": 244337, "epoch": 2019} {"train_loss": -41.231590270996094, "global_step": 244338, "epoch": 2019} {"train_loss": -40.95978546142578, "global_step": 244339, "epoch": 2019} {"train_loss": -42.7465934753418, "global_step": 244340, "epoch": 2019} {"train_loss": -41.81585693359375, "global_step": 244341, "epoch": 2019} {"train_loss": -40.5706787109375, "global_step": 244342, "epoch": 2019} {"train_loss": -42.16746520996094, "global_step": 244343, "epoch": 2019} {"train_loss": -39.78889846801758, "global_step": 244344, "epoch": 2019} {"train_loss": -42.095916748046875, "global_step": 244345, "epoch": 2019} {"train_loss": -41.63039779663086, "global_step": 244346, "epoch": 2019} {"train_loss": -42.13137435913086, "global_step": 244347, "epoch": 2019} {"train_loss": -41.480506896972656, "global_step": 244348, "epoch": 2019} {"train_loss": -40.79092788696289, "global_step": 244349, "epoch": 2019} {"train_loss": -41.968318939208984, "global_step": 244350, "epoch": 2019} {"train_loss": -41.403297424316406, "global_step": 244351, "epoch": 2019} {"train_loss": -42.02649688720703, "global_step": 244352, "epoch": 2019} {"train_loss": -41.62482833862305, "global_step": 244353, "epoch": 2019} {"train_loss": -41.4859733581543, "global_step": 244354, "epoch": 2019} {"train_loss": -42.43742752075195, "global_step": 244355, "epoch": 2019} {"train_loss": -41.55989456176758, "global_step": 244356, "epoch": 2019} {"train_loss": -42.80247116088867, "global_step": 244357, "epoch": 2019} {"train_loss": -42.09482955932617, "global_step": 244358, "epoch": 2019} {"train_loss": -41.09134292602539, "global_step": 244359, "epoch": 2019} {"train_loss": -42.184688568115234, "global_step": 244360, "epoch": 2019} {"train_loss": -42.25594711303711, "global_step": 244361, "epoch": 2019} {"train_loss": -41.93040084838867, "global_step": 244362, "epoch": 2019} {"train_loss": -42.57755661010742, "global_step": 244363, "epoch": 2019} {"train_loss": -38.348793029785156, "global_step": 244364, "epoch": 2019} {"train_loss": -42.17148971557617, "global_step": 244365, "epoch": 2019} {"train_loss": -41.383174896240234, "global_step": 244366, "epoch": 2019} {"train_loss": -42.380306243896484, "global_step": 244367, "epoch": 2019} {"train_loss": -40.5335807800293, "global_step": 244368, "epoch": 2019} {"train_loss": -42.565608978271484, "global_step": 244369, "epoch": 2019} {"train_loss": -42.94999694824219, "global_step": 244370, "epoch": 2019} {"train_loss": -42.5651741027832, "global_step": 244371, "epoch": 2019} {"train_loss": -41.55094528198242, "global_step": 244372, "epoch": 2019} {"train_loss": -41.53723907470703, "global_step": 244373, "epoch": 2019} {"train_loss": -41.085243225097656, "global_step": 244374, "epoch": 2019} {"train_loss": -41.005126953125, "global_step": 244375, "epoch": 2019} {"train_loss": -42.646968841552734, "global_step": 244376, "epoch": 2019} {"train_loss": -42.572166442871094, "global_step": 244377, "epoch": 2019} {"train_loss": -40.001522064208984, "global_step": 244378, "epoch": 2019} {"train_loss": -42.394630432128906, "global_step": 244379, "epoch": 2019} {"train_loss": -42.22237014770508, "global_step": 244380, "epoch": 2019} {"train_loss": -42.12423324584961, "global_step": 244381, "epoch": 2019} {"train_loss": -42.620086669921875, "global_step": 244382, "epoch": 2019} {"train_loss": -40.291683197021484, "global_step": 244383, "epoch": 2019} {"train_loss": -42.3762321472168, "global_step": 244384, "epoch": 2019} {"train_loss": -42.571102142333984, "global_step": 244385, "epoch": 2019} {"train_loss": -42.119014739990234, "global_step": 244386, "epoch": 2019} {"train_loss": -42.61275863647461, "global_step": 244387, "epoch": 2019} {"train_loss": -40.621551513671875, "global_step": 244388, "epoch": 2019} {"train_loss": -42.641136169433594, "global_step": 244389, "epoch": 2019} {"train_loss": -41.282981872558594, "global_step": 244390, "epoch": 2019} {"train_loss": -42.101043701171875, "global_step": 244391, "epoch": 2019} {"train_loss": -41.51192092895508, "global_step": 244392, "epoch": 2019} {"train_loss": -41.82297897338867, "global_step": 244393, "epoch": 2019} {"train_loss": -41.30091094970703, "global_step": 244394, "epoch": 2019} {"train_loss": -40.42938232421875, "global_step": 244395, "epoch": 2019} {"train_loss": -41.09785461425781, "global_step": 244396, "epoch": 2019} {"train_loss": -42.72051239013672, "global_step": 244397, "epoch": 2019} {"train_loss": -40.34698486328125, "global_step": 244398, "epoch": 2019} {"train_loss": -39.858524322509766, "global_step": 244399, "epoch": 2019} {"train_loss": -39.53098678588867, "global_step": 244400, "epoch": 2019} {"train_loss": -42.50116729736328, "global_step": 244401, "epoch": 2019} {"train_loss": -40.1187858581543, "global_step": 244402, "epoch": 2019} {"train_loss": -39.104854583740234, "global_step": 244403, "epoch": 2019} {"train_loss": -41.22597885131836, "global_step": 244404, "epoch": 2019} {"train_loss": -40.50995635986328, "global_step": 244405, "epoch": 2019} {"train_loss": -39.762577056884766, "global_step": 244406, "epoch": 2019} {"train_loss": -42.02119445800781, "global_step": 244407, "epoch": 2019} {"train_loss": -41.1091194152832, "global_step": 244408, "epoch": 2019} {"train_loss": -38.39925003051758, "global_step": 244409, "epoch": 2019} {"train_loss": -40.286067962646484, "global_step": 244410, "epoch": 2019} {"train_loss": -39.62441635131836, "global_step": 244411, "epoch": 2019} {"train_loss": -35.957550048828125, "global_step": 244412, "epoch": 2019} {"train_loss": -39.32582473754883, "global_step": 244413, "epoch": 2019} {"train_loss": -40.72724914550781, "global_step": 244414, "epoch": 2019} {"train_loss": -39.21392822265625, "global_step": 244415, "epoch": 2019} {"train_loss": -41.51316833496094, "global_step": 244416, "epoch": 2019} {"train_loss": -40.81510543823242, "global_step": 244417, "epoch": 2019} {"train_loss": -41.66239547729492, "global_step": 244418, "epoch": 2019} {"train_loss": -41.21235968849876, "global_step": 244419, "epoch": 2019, "val_loss": 2739526.75} {"train_loss": -41.552547454833984, "global_step": 244420, "epoch": 2020} {"train_loss": -36.24834060668945, "global_step": 244421, "epoch": 2020} {"train_loss": -41.7061882019043, "global_step": 244422, "epoch": 2020} {"train_loss": -40.6072883605957, "global_step": 244423, "epoch": 2020} {"train_loss": -41.34577178955078, "global_step": 244424, "epoch": 2020} {"train_loss": -40.83977508544922, "global_step": 244425, "epoch": 2020} {"train_loss": -42.26900100708008, "global_step": 244426, "epoch": 2020} {"train_loss": -40.1298713684082, "global_step": 244427, "epoch": 2020} {"train_loss": -40.82685470581055, "global_step": 244428, "epoch": 2020} {"train_loss": -40.50227355957031, "global_step": 244429, "epoch": 2020} {"train_loss": -41.807960510253906, "global_step": 244430, "epoch": 2020} {"train_loss": -40.232784271240234, "global_step": 244431, "epoch": 2020} {"train_loss": -41.287132263183594, "global_step": 244432, "epoch": 2020} {"train_loss": -41.44869613647461, "global_step": 244433, "epoch": 2020} {"train_loss": -41.687744140625, "global_step": 244434, "epoch": 2020} {"train_loss": -41.48133850097656, "global_step": 244435, "epoch": 2020} {"train_loss": -41.267520904541016, "global_step": 244436, "epoch": 2020} {"train_loss": -42.249488830566406, "global_step": 244437, "epoch": 2020} {"train_loss": -41.3556022644043, "global_step": 244438, "epoch": 2020} {"train_loss": -41.472957611083984, "global_step": 244439, "epoch": 2020} {"train_loss": -40.513526916503906, "global_step": 244440, "epoch": 2020} {"train_loss": -38.60514450073242, "global_step": 244441, "epoch": 2020} {"train_loss": -40.30900955200195, "global_step": 244442, "epoch": 2020} {"train_loss": -39.9124755859375, "global_step": 244443, "epoch": 2020} {"train_loss": -40.27167892456055, "global_step": 244444, "epoch": 2020} {"train_loss": -39.88552474975586, "global_step": 244445, "epoch": 2020} {"train_loss": -42.23109817504883, "global_step": 244446, "epoch": 2020} {"train_loss": -40.462310791015625, "global_step": 244447, "epoch": 2020} {"train_loss": -41.18206787109375, "global_step": 244448, "epoch": 2020} {"train_loss": -42.47636795043945, "global_step": 244449, "epoch": 2020} {"train_loss": -40.59564971923828, "global_step": 244450, "epoch": 2020} {"train_loss": -42.29076385498047, "global_step": 244451, "epoch": 2020} {"train_loss": -42.19851303100586, "global_step": 244452, "epoch": 2020} {"train_loss": -42.82767105102539, "global_step": 244453, "epoch": 2020} {"train_loss": -41.71397018432617, "global_step": 244454, "epoch": 2020} {"train_loss": -41.86735153198242, "global_step": 244455, "epoch": 2020} {"train_loss": -42.950477600097656, "global_step": 244456, "epoch": 2020} {"train_loss": -42.82351303100586, "global_step": 244457, "epoch": 2020} {"train_loss": -42.515869140625, "global_step": 244458, "epoch": 2020} {"train_loss": -41.933380126953125, "global_step": 244459, "epoch": 2020} {"train_loss": -41.4781608581543, "global_step": 244460, "epoch": 2020} {"train_loss": -40.16813278198242, "global_step": 244461, "epoch": 2020} {"train_loss": -42.734107971191406, "global_step": 244462, "epoch": 2020} {"train_loss": -42.562828063964844, "global_step": 244463, "epoch": 2020} {"train_loss": -42.24523162841797, "global_step": 244464, "epoch": 2020} {"train_loss": -42.15563201904297, "global_step": 244465, "epoch": 2020} {"train_loss": -42.3273811340332, "global_step": 244466, "epoch": 2020} {"train_loss": -41.499874114990234, "global_step": 244467, "epoch": 2020} {"train_loss": -42.17075729370117, "global_step": 244468, "epoch": 2020} {"train_loss": -42.90189743041992, "global_step": 244469, "epoch": 2020} {"train_loss": -41.22830581665039, "global_step": 244470, "epoch": 2020} {"train_loss": -42.93623352050781, "global_step": 244471, "epoch": 2020} {"train_loss": -42.52345657348633, "global_step": 244472, "epoch": 2020} {"train_loss": -41.56917953491211, "global_step": 244473, "epoch": 2020} {"train_loss": -41.86879348754883, "global_step": 244474, "epoch": 2020} {"train_loss": -42.959014892578125, "global_step": 244475, "epoch": 2020} {"train_loss": -42.306819915771484, "global_step": 244476, "epoch": 2020} {"train_loss": -42.53135681152344, "global_step": 244477, "epoch": 2020} {"train_loss": -42.11220932006836, "global_step": 244478, "epoch": 2020} {"train_loss": -42.5739631652832, "global_step": 244479, "epoch": 2020} {"train_loss": -42.86783981323242, "global_step": 244480, "epoch": 2020} {"train_loss": -41.82334899902344, "global_step": 244481, "epoch": 2020} {"train_loss": -42.634647369384766, "global_step": 244482, "epoch": 2020} {"train_loss": -42.75226593017578, "global_step": 244483, "epoch": 2020} {"train_loss": -42.206687927246094, "global_step": 244484, "epoch": 2020} {"train_loss": -42.041316986083984, "global_step": 244485, "epoch": 2020} {"train_loss": -42.97133255004883, "global_step": 244486, "epoch": 2020} {"train_loss": -41.77375030517578, "global_step": 244487, "epoch": 2020} {"train_loss": -42.9775390625, "global_step": 244488, "epoch": 2020} {"train_loss": -42.80020523071289, "global_step": 244489, "epoch": 2020} {"train_loss": -42.2609977722168, "global_step": 244490, "epoch": 2020} {"train_loss": -42.933135986328125, "global_step": 244491, "epoch": 2020} {"train_loss": -42.84968185424805, "global_step": 244492, "epoch": 2020} {"train_loss": -42.213050842285156, "global_step": 244493, "epoch": 2020} {"train_loss": -42.4884147644043, "global_step": 244494, "epoch": 2020} {"train_loss": -42.27573013305664, "global_step": 244495, "epoch": 2020} {"train_loss": -42.68218231201172, "global_step": 244496, "epoch": 2020} {"train_loss": -42.99147415161133, "global_step": 244497, "epoch": 2020} {"train_loss": -42.49724197387695, "global_step": 244498, "epoch": 2020} {"train_loss": -42.16215133666992, "global_step": 244499, "epoch": 2020} {"train_loss": -42.537574768066406, "global_step": 244500, "epoch": 2020} {"train_loss": -43.216617584228516, "global_step": 244501, "epoch": 2020} {"train_loss": -42.55565643310547, "global_step": 244502, "epoch": 2020} {"train_loss": -42.832611083984375, "global_step": 244503, "epoch": 2020} {"train_loss": -42.282588958740234, "global_step": 244504, "epoch": 2020} {"train_loss": -43.08762741088867, "global_step": 244505, "epoch": 2020} {"train_loss": -42.4471549987793, "global_step": 244506, "epoch": 2020} {"train_loss": -42.49636459350586, "global_step": 244507, "epoch": 2020} {"train_loss": -43.38601303100586, "global_step": 244508, "epoch": 2020} {"train_loss": -42.7181396484375, "global_step": 244509, "epoch": 2020} {"train_loss": -42.16436767578125, "global_step": 244510, "epoch": 2020} {"train_loss": -42.72473907470703, "global_step": 244511, "epoch": 2020} {"train_loss": -43.06624221801758, "global_step": 244512, "epoch": 2020} {"train_loss": -42.97038269042969, "global_step": 244513, "epoch": 2020} {"train_loss": -42.43011474609375, "global_step": 244514, "epoch": 2020} {"train_loss": -42.8292236328125, "global_step": 244515, "epoch": 2020} {"train_loss": -42.85247039794922, "global_step": 244516, "epoch": 2020} {"train_loss": -42.718746185302734, "global_step": 244517, "epoch": 2020} {"train_loss": -42.96601104736328, "global_step": 244518, "epoch": 2020} {"train_loss": -42.78194808959961, "global_step": 244519, "epoch": 2020} {"train_loss": -42.89197540283203, "global_step": 244520, "epoch": 2020} {"train_loss": -42.608795166015625, "global_step": 244521, "epoch": 2020} {"train_loss": -42.24695587158203, "global_step": 244522, "epoch": 2020} {"train_loss": -42.1988525390625, "global_step": 244523, "epoch": 2020} {"train_loss": -42.21713638305664, "global_step": 244524, "epoch": 2020} {"train_loss": -42.238014221191406, "global_step": 244525, "epoch": 2020} {"train_loss": -41.728511810302734, "global_step": 244526, "epoch": 2020} {"train_loss": -41.82076644897461, "global_step": 244527, "epoch": 2020} {"train_loss": -41.01422882080078, "global_step": 244528, "epoch": 2020} {"train_loss": -41.70908737182617, "global_step": 244529, "epoch": 2020} {"train_loss": -39.98492431640625, "global_step": 244530, "epoch": 2020} {"train_loss": -40.33503341674805, "global_step": 244531, "epoch": 2020} {"train_loss": -40.4419059753418, "global_step": 244532, "epoch": 2020} {"train_loss": -40.77177810668945, "global_step": 244533, "epoch": 2020} {"train_loss": -39.373321533203125, "global_step": 244534, "epoch": 2020} {"train_loss": -39.457115173339844, "global_step": 244535, "epoch": 2020} {"train_loss": -42.343055725097656, "global_step": 244536, "epoch": 2020} {"train_loss": -40.278316497802734, "global_step": 244537, "epoch": 2020} {"train_loss": -39.05044937133789, "global_step": 244538, "epoch": 2020} {"train_loss": -40.862037658691406, "global_step": 244539, "epoch": 2020} {"train_loss": -41.80048855868253, "global_step": 244540, "epoch": 2020, "val_loss": 2561693.0} {"train_loss": -42.12583541870117, "global_step": 244541, "epoch": 2021} {"train_loss": -41.0510139465332, "global_step": 244542, "epoch": 2021} {"train_loss": -40.30495834350586, "global_step": 244543, "epoch": 2021} {"train_loss": -42.72076416015625, "global_step": 244544, "epoch": 2021} {"train_loss": -40.99954605102539, "global_step": 244545, "epoch": 2021} {"train_loss": -40.12543487548828, "global_step": 244546, "epoch": 2021} {"train_loss": -41.81300735473633, "global_step": 244547, "epoch": 2021} {"train_loss": -41.304988861083984, "global_step": 244548, "epoch": 2021} {"train_loss": -41.65241241455078, "global_step": 244549, "epoch": 2021} {"train_loss": -42.323360443115234, "global_step": 244550, "epoch": 2021} {"train_loss": -41.570919036865234, "global_step": 244551, "epoch": 2021} {"train_loss": -41.693092346191406, "global_step": 244552, "epoch": 2021} {"train_loss": -42.5035285949707, "global_step": 244553, "epoch": 2021} {"train_loss": -42.3349609375, "global_step": 244554, "epoch": 2021} {"train_loss": -40.922950744628906, "global_step": 244555, "epoch": 2021} {"train_loss": -41.76953125, "global_step": 244556, "epoch": 2021} {"train_loss": -42.46061325073242, "global_step": 244557, "epoch": 2021} {"train_loss": -40.83864974975586, "global_step": 244558, "epoch": 2021} {"train_loss": -42.03474807739258, "global_step": 244559, "epoch": 2021} {"train_loss": -41.68183898925781, "global_step": 244560, "epoch": 2021} {"train_loss": -41.74349594116211, "global_step": 244561, "epoch": 2021} {"train_loss": -42.60633087158203, "global_step": 244562, "epoch": 2021} {"train_loss": -40.30927276611328, "global_step": 244563, "epoch": 2021} {"train_loss": -42.226478576660156, "global_step": 244564, "epoch": 2021} {"train_loss": -40.21714401245117, "global_step": 244565, "epoch": 2021} {"train_loss": -42.146087646484375, "global_step": 244566, "epoch": 2021} {"train_loss": -41.28734588623047, "global_step": 244567, "epoch": 2021} {"train_loss": -41.69407272338867, "global_step": 244568, "epoch": 2021} {"train_loss": -42.400264739990234, "global_step": 244569, "epoch": 2021} {"train_loss": -42.161376953125, "global_step": 244570, "epoch": 2021} {"train_loss": -42.37617111206055, "global_step": 244571, "epoch": 2021} {"train_loss": -41.64973831176758, "global_step": 244572, "epoch": 2021} {"train_loss": -42.45790100097656, "global_step": 244573, "epoch": 2021} {"train_loss": -42.55782699584961, "global_step": 244574, "epoch": 2021} {"train_loss": -41.53713607788086, "global_step": 244575, "epoch": 2021} {"train_loss": -42.469364166259766, "global_step": 244576, "epoch": 2021} {"train_loss": -42.87714767456055, "global_step": 244577, "epoch": 2021} {"train_loss": -41.84820556640625, "global_step": 244578, "epoch": 2021} {"train_loss": -42.13975143432617, "global_step": 244579, "epoch": 2021} {"train_loss": -42.308349609375, "global_step": 244580, "epoch": 2021} {"train_loss": -42.30440902709961, "global_step": 244581, "epoch": 2021} {"train_loss": -41.46538543701172, "global_step": 244582, "epoch": 2021} {"train_loss": -43.1739616394043, "global_step": 244583, "epoch": 2021} {"train_loss": -42.68159866333008, "global_step": 244584, "epoch": 2021} {"train_loss": -41.47136306762695, "global_step": 244585, "epoch": 2021} {"train_loss": -40.8422737121582, "global_step": 244586, "epoch": 2021} {"train_loss": -42.83538818359375, "global_step": 244587, "epoch": 2021} {"train_loss": -40.796810150146484, "global_step": 244588, "epoch": 2021} {"train_loss": -42.288818359375, "global_step": 244589, "epoch": 2021} {"train_loss": -41.66004943847656, "global_step": 244590, "epoch": 2021} {"train_loss": -41.468135833740234, "global_step": 244591, "epoch": 2021} {"train_loss": -42.57318878173828, "global_step": 244592, "epoch": 2021} {"train_loss": -42.44965362548828, "global_step": 244593, "epoch": 2021} {"train_loss": -42.14467239379883, "global_step": 244594, "epoch": 2021} {"train_loss": -41.15542221069336, "global_step": 244595, "epoch": 2021} {"train_loss": -41.863277435302734, "global_step": 244596, "epoch": 2021} {"train_loss": -42.032257080078125, "global_step": 244597, "epoch": 2021} {"train_loss": -42.86909866333008, "global_step": 244598, "epoch": 2021} {"train_loss": -42.5261344909668, "global_step": 244599, "epoch": 2021} {"train_loss": -41.22602081298828, "global_step": 244600, "epoch": 2021} {"train_loss": -42.88669967651367, "global_step": 244601, "epoch": 2021} {"train_loss": -42.18498992919922, "global_step": 244602, "epoch": 2021} {"train_loss": -42.12812423706055, "global_step": 244603, "epoch": 2021} {"train_loss": -42.400245666503906, "global_step": 244604, "epoch": 2021} {"train_loss": -42.305999755859375, "global_step": 244605, "epoch": 2021} {"train_loss": -42.8148307800293, "global_step": 244606, "epoch": 2021} {"train_loss": -42.00136184692383, "global_step": 244607, "epoch": 2021} {"train_loss": -41.38855743408203, "global_step": 244608, "epoch": 2021} {"train_loss": -42.958282470703125, "global_step": 244609, "epoch": 2021} {"train_loss": -42.78255081176758, "global_step": 244610, "epoch": 2021} {"train_loss": -42.527923583984375, "global_step": 244611, "epoch": 2021} {"train_loss": -41.903564453125, "global_step": 244612, "epoch": 2021} {"train_loss": -42.99120330810547, "global_step": 244613, "epoch": 2021} {"train_loss": -42.06850051879883, "global_step": 244614, "epoch": 2021} {"train_loss": -41.000404357910156, "global_step": 244615, "epoch": 2021} {"train_loss": -41.99555206298828, "global_step": 244616, "epoch": 2021} {"train_loss": -42.00715255737305, "global_step": 244617, "epoch": 2021} {"train_loss": -42.110267639160156, "global_step": 244618, "epoch": 2021} {"train_loss": -41.84232711791992, "global_step": 244619, "epoch": 2021} {"train_loss": -40.8066520690918, "global_step": 244620, "epoch": 2021} {"train_loss": -42.5296630859375, "global_step": 244621, "epoch": 2021} {"train_loss": -42.65597152709961, "global_step": 244622, "epoch": 2021} {"train_loss": -41.68977737426758, "global_step": 244623, "epoch": 2021} {"train_loss": -41.610958099365234, "global_step": 244624, "epoch": 2021} {"train_loss": -42.49464797973633, "global_step": 244625, "epoch": 2021} {"train_loss": -42.51324462890625, "global_step": 244626, "epoch": 2021} {"train_loss": -42.16633224487305, "global_step": 244627, "epoch": 2021} {"train_loss": -42.12354278564453, "global_step": 244628, "epoch": 2021} {"train_loss": -42.63442611694336, "global_step": 244629, "epoch": 2021} {"train_loss": -41.717281341552734, "global_step": 244630, "epoch": 2021} {"train_loss": -42.103172302246094, "global_step": 244631, "epoch": 2021} {"train_loss": -42.04266357421875, "global_step": 244632, "epoch": 2021} {"train_loss": -41.76115798950195, "global_step": 244633, "epoch": 2021} {"train_loss": -40.0069465637207, "global_step": 244634, "epoch": 2021} {"train_loss": -41.19902801513672, "global_step": 244635, "epoch": 2021} {"train_loss": -41.375667572021484, "global_step": 244636, "epoch": 2021} {"train_loss": -41.176395416259766, "global_step": 244637, "epoch": 2021} {"train_loss": -42.325191497802734, "global_step": 244638, "epoch": 2021} {"train_loss": -42.55063247680664, "global_step": 244639, "epoch": 2021} {"train_loss": -41.55268478393555, "global_step": 244640, "epoch": 2021} {"train_loss": -40.389278411865234, "global_step": 244641, "epoch": 2021} {"train_loss": -42.11152648925781, "global_step": 244642, "epoch": 2021} {"train_loss": -42.16082763671875, "global_step": 244643, "epoch": 2021} {"train_loss": -40.26648712158203, "global_step": 244644, "epoch": 2021} {"train_loss": -42.208003997802734, "global_step": 244645, "epoch": 2021} {"train_loss": -41.052223205566406, "global_step": 244646, "epoch": 2021} {"train_loss": -41.22113037109375, "global_step": 244647, "epoch": 2021} {"train_loss": -42.79230880737305, "global_step": 244648, "epoch": 2021} {"train_loss": -42.09011459350586, "global_step": 244649, "epoch": 2021} {"train_loss": -41.505516052246094, "global_step": 244650, "epoch": 2021} {"train_loss": -42.306549072265625, "global_step": 244651, "epoch": 2021} {"train_loss": -42.33604049682617, "global_step": 244652, "epoch": 2021} {"train_loss": -41.69736862182617, "global_step": 244653, "epoch": 2021} {"train_loss": -43.055389404296875, "global_step": 244654, "epoch": 2021} {"train_loss": -42.14759063720703, "global_step": 244655, "epoch": 2021} {"train_loss": -42.89864730834961, "global_step": 244656, "epoch": 2021} {"train_loss": -42.90715408325195, "global_step": 244657, "epoch": 2021} {"train_loss": -43.01193618774414, "global_step": 244658, "epoch": 2021} {"train_loss": -40.360206604003906, "global_step": 244659, "epoch": 2021} {"train_loss": -42.501522064208984, "global_step": 244660, "epoch": 2021} {"train_loss": -41.93668141640907, "global_step": 244661, "epoch": 2021, "val_loss": 2622520.75} {"train_loss": -43.10929489135742, "global_step": 244662, "epoch": 2022} {"train_loss": -42.80782699584961, "global_step": 244663, "epoch": 2022} {"train_loss": -43.1412353515625, "global_step": 244664, "epoch": 2022} {"train_loss": -43.09495544433594, "global_step": 244665, "epoch": 2022} {"train_loss": -42.84387969970703, "global_step": 244666, "epoch": 2022} {"train_loss": -42.7128791809082, "global_step": 244667, "epoch": 2022} {"train_loss": -43.39127731323242, "global_step": 244668, "epoch": 2022} {"train_loss": -43.64860534667969, "global_step": 244669, "epoch": 2022} {"train_loss": -43.56319808959961, "global_step": 244670, "epoch": 2022} {"train_loss": -43.119083404541016, "global_step": 244671, "epoch": 2022} {"train_loss": -43.540584564208984, "global_step": 244672, "epoch": 2022} {"train_loss": -43.380462646484375, "global_step": 244673, "epoch": 2022} {"train_loss": -43.32578659057617, "global_step": 244674, "epoch": 2022} {"train_loss": -42.72597122192383, "global_step": 244675, "epoch": 2022} {"train_loss": -43.7443733215332, "global_step": 244676, "epoch": 2022} {"train_loss": -43.69082260131836, "global_step": 244677, "epoch": 2022} {"train_loss": -42.93876266479492, "global_step": 244678, "epoch": 2022} {"train_loss": -43.312435150146484, "global_step": 244679, "epoch": 2022} {"train_loss": -43.5788688659668, "global_step": 244680, "epoch": 2022} {"train_loss": -42.8870735168457, "global_step": 244681, "epoch": 2022} {"train_loss": -42.1275749206543, "global_step": 244682, "epoch": 2022} {"train_loss": -43.08058547973633, "global_step": 244683, "epoch": 2022} {"train_loss": -43.49904251098633, "global_step": 244684, "epoch": 2022} {"train_loss": -43.0601692199707, "global_step": 244685, "epoch": 2022} {"train_loss": -42.630714416503906, "global_step": 244686, "epoch": 2022} {"train_loss": -43.06590270996094, "global_step": 244687, "epoch": 2022} {"train_loss": -43.51662063598633, "global_step": 244688, "epoch": 2022} {"train_loss": -42.137245178222656, "global_step": 244689, "epoch": 2022} {"train_loss": -36.247894287109375, "global_step": 244690, "epoch": 2022} {"train_loss": -37.654232025146484, "global_step": 244691, "epoch": 2022} {"train_loss": -41.84047317504883, "global_step": 244692, "epoch": 2022} {"train_loss": -40.91060256958008, "global_step": 244693, "epoch": 2022} {"train_loss": -40.91313552856445, "global_step": 244694, "epoch": 2022} {"train_loss": -41.78717803955078, "global_step": 244695, "epoch": 2022} {"train_loss": -41.85076904296875, "global_step": 244696, "epoch": 2022} {"train_loss": -40.896881103515625, "global_step": 244697, "epoch": 2022} {"train_loss": -41.27682113647461, "global_step": 244698, "epoch": 2022} {"train_loss": -41.59364700317383, "global_step": 244699, "epoch": 2022} {"train_loss": -41.637062072753906, "global_step": 244700, "epoch": 2022} {"train_loss": -41.239925384521484, "global_step": 244701, "epoch": 2022} {"train_loss": -41.57167434692383, "global_step": 244702, "epoch": 2022} {"train_loss": -41.37833786010742, "global_step": 244703, "epoch": 2022} {"train_loss": -39.46221923828125, "global_step": 244704, "epoch": 2022} {"train_loss": -42.050514221191406, "global_step": 244705, "epoch": 2022} {"train_loss": -38.7902717590332, "global_step": 244706, "epoch": 2022} {"train_loss": -35.35026168823242, "global_step": 244707, "epoch": 2022} {"train_loss": -40.87020492553711, "global_step": 244708, "epoch": 2022} {"train_loss": -40.758602142333984, "global_step": 244709, "epoch": 2022} {"train_loss": -41.448760986328125, "global_step": 244710, "epoch": 2022} {"train_loss": -40.28681564331055, "global_step": 244711, "epoch": 2022} {"train_loss": -40.54279708862305, "global_step": 244712, "epoch": 2022} {"train_loss": -41.54191207885742, "global_step": 244713, "epoch": 2022} {"train_loss": -39.5712890625, "global_step": 244714, "epoch": 2022} {"train_loss": -41.72737503051758, "global_step": 244715, "epoch": 2022} {"train_loss": -40.30816650390625, "global_step": 244716, "epoch": 2022} {"train_loss": -40.359710693359375, "global_step": 244717, "epoch": 2022} {"train_loss": -41.57221221923828, "global_step": 244718, "epoch": 2022} {"train_loss": -38.55073165893555, "global_step": 244719, "epoch": 2022} {"train_loss": -39.17998504638672, "global_step": 244720, "epoch": 2022} {"train_loss": -39.75398635864258, "global_step": 244721, "epoch": 2022} {"train_loss": -40.255550384521484, "global_step": 244722, "epoch": 2022} {"train_loss": -40.338375091552734, "global_step": 244723, "epoch": 2022} {"train_loss": -39.75343704223633, "global_step": 244724, "epoch": 2022} {"train_loss": -40.3262825012207, "global_step": 244725, "epoch": 2022} {"train_loss": -40.14545440673828, "global_step": 244726, "epoch": 2022} {"train_loss": -37.959434509277344, "global_step": 244727, "epoch": 2022} {"train_loss": -38.33761978149414, "global_step": 244728, "epoch": 2022} {"train_loss": -40.51839828491211, "global_step": 244729, "epoch": 2022} {"train_loss": -41.10889434814453, "global_step": 244730, "epoch": 2022} {"train_loss": -37.98847961425781, "global_step": 244731, "epoch": 2022} {"train_loss": -40.26969528198242, "global_step": 244732, "epoch": 2022} {"train_loss": -41.922969818115234, "global_step": 244733, "epoch": 2022} {"train_loss": -40.947113037109375, "global_step": 244734, "epoch": 2022} {"train_loss": -40.73525619506836, "global_step": 244735, "epoch": 2022} {"train_loss": -40.6449089050293, "global_step": 244736, "epoch": 2022} {"train_loss": -40.6463737487793, "global_step": 244737, "epoch": 2022} {"train_loss": -41.161651611328125, "global_step": 244738, "epoch": 2022} {"train_loss": -41.90121078491211, "global_step": 244739, "epoch": 2022} {"train_loss": -41.4879150390625, "global_step": 244740, "epoch": 2022} {"train_loss": -38.71486282348633, "global_step": 244741, "epoch": 2022} {"train_loss": -41.71722412109375, "global_step": 244742, "epoch": 2022} {"train_loss": -39.942440032958984, "global_step": 244743, "epoch": 2022} {"train_loss": -39.709938049316406, "global_step": 244744, "epoch": 2022} {"train_loss": -40.82958984375, "global_step": 244745, "epoch": 2022} {"train_loss": -40.84870147705078, "global_step": 244746, "epoch": 2022} {"train_loss": -41.96879959106445, "global_step": 244747, "epoch": 2022} {"train_loss": -41.08725357055664, "global_step": 244748, "epoch": 2022} {"train_loss": -40.79596710205078, "global_step": 244749, "epoch": 2022} {"train_loss": -39.550376892089844, "global_step": 244750, "epoch": 2022} {"train_loss": -39.43009567260742, "global_step": 244751, "epoch": 2022} {"train_loss": -41.31477737426758, "global_step": 244752, "epoch": 2022} {"train_loss": -41.49720001220703, "global_step": 244753, "epoch": 2022} {"train_loss": -42.250370025634766, "global_step": 244754, "epoch": 2022} {"train_loss": -42.674110412597656, "global_step": 244755, "epoch": 2022} {"train_loss": -42.319976806640625, "global_step": 244756, "epoch": 2022} {"train_loss": -41.91157913208008, "global_step": 244757, "epoch": 2022} {"train_loss": -42.0890007019043, "global_step": 244758, "epoch": 2022} {"train_loss": -42.014766693115234, "global_step": 244759, "epoch": 2022} {"train_loss": -42.18656539916992, "global_step": 244760, "epoch": 2022} {"train_loss": -42.673248291015625, "global_step": 244761, "epoch": 2022} {"train_loss": -41.420143127441406, "global_step": 244762, "epoch": 2022} {"train_loss": -42.296875, "global_step": 244763, "epoch": 2022} {"train_loss": -42.14091110229492, "global_step": 244764, "epoch": 2022} {"train_loss": -42.70296859741211, "global_step": 244765, "epoch": 2022} {"train_loss": -42.8220329284668, "global_step": 244766, "epoch": 2022} {"train_loss": -41.95471954345703, "global_step": 244767, "epoch": 2022} {"train_loss": -42.25514602661133, "global_step": 244768, "epoch": 2022} {"train_loss": -42.69245529174805, "global_step": 244769, "epoch": 2022} {"train_loss": -42.82372283935547, "global_step": 244770, "epoch": 2022} {"train_loss": -41.3621940612793, "global_step": 244771, "epoch": 2022} {"train_loss": -43.15301513671875, "global_step": 244772, "epoch": 2022} {"train_loss": -42.57987594604492, "global_step": 244773, "epoch": 2022} {"train_loss": -41.9686279296875, "global_step": 244774, "epoch": 2022} {"train_loss": -42.296058654785156, "global_step": 244775, "epoch": 2022} {"train_loss": -42.71218490600586, "global_step": 244776, "epoch": 2022} {"train_loss": -43.034912109375, "global_step": 244777, "epoch": 2022} {"train_loss": -42.86953353881836, "global_step": 244778, "epoch": 2022} {"train_loss": -43.203975677490234, "global_step": 244779, "epoch": 2022} {"train_loss": -42.77168273925781, "global_step": 244780, "epoch": 2022} {"train_loss": -42.08153533935547, "global_step": 244781, "epoch": 2022} {"train_loss": -41.526052648370914, "global_step": 244782, "epoch": 2022, "val_loss": 2670535.25} {"train_loss": -42.5985107421875, "global_step": 244783, "epoch": 2023} {"train_loss": -42.81660079956055, "global_step": 244784, "epoch": 2023} {"train_loss": -43.10810470581055, "global_step": 244785, "epoch": 2023} {"train_loss": -42.915008544921875, "global_step": 244786, "epoch": 2023} {"train_loss": -43.29495620727539, "global_step": 244787, "epoch": 2023} {"train_loss": -43.185577392578125, "global_step": 244788, "epoch": 2023} {"train_loss": -42.808834075927734, "global_step": 244789, "epoch": 2023} {"train_loss": -43.16962432861328, "global_step": 244790, "epoch": 2023} {"train_loss": -42.67355728149414, "global_step": 244791, "epoch": 2023} {"train_loss": -43.34196090698242, "global_step": 244792, "epoch": 2023} {"train_loss": -43.19173812866211, "global_step": 244793, "epoch": 2023} {"train_loss": -42.30541229248047, "global_step": 244794, "epoch": 2023} {"train_loss": -43.179786682128906, "global_step": 244795, "epoch": 2023} {"train_loss": -43.152320861816406, "global_step": 244796, "epoch": 2023} {"train_loss": -41.60324478149414, "global_step": 244797, "epoch": 2023} {"train_loss": -42.237525939941406, "global_step": 244798, "epoch": 2023} {"train_loss": -42.55436706542969, "global_step": 244799, "epoch": 2023} {"train_loss": -43.8420524597168, "global_step": 244800, "epoch": 2023} {"train_loss": -43.13836669921875, "global_step": 244801, "epoch": 2023} {"train_loss": -42.21940994262695, "global_step": 244802, "epoch": 2023} {"train_loss": -40.423519134521484, "global_step": 244803, "epoch": 2023} {"train_loss": -40.87246322631836, "global_step": 244804, "epoch": 2023} {"train_loss": -41.172607421875, "global_step": 244805, "epoch": 2023} {"train_loss": -39.430206298828125, "global_step": 244806, "epoch": 2023} {"train_loss": -36.818946838378906, "global_step": 244807, "epoch": 2023} {"train_loss": -38.35371017456055, "global_step": 244808, "epoch": 2023} {"train_loss": -36.53165817260742, "global_step": 244809, "epoch": 2023} {"train_loss": -34.72267532348633, "global_step": 244810, "epoch": 2023} {"train_loss": -39.43918991088867, "global_step": 244811, "epoch": 2023} {"train_loss": -40.462215423583984, "global_step": 244812, "epoch": 2023} {"train_loss": -39.728248596191406, "global_step": 244813, "epoch": 2023} {"train_loss": -40.53116226196289, "global_step": 244814, "epoch": 2023} {"train_loss": -37.55606460571289, "global_step": 244815, "epoch": 2023} {"train_loss": -39.89962387084961, "global_step": 244816, "epoch": 2023} {"train_loss": -41.44524383544922, "global_step": 244817, "epoch": 2023} {"train_loss": -40.07584762573242, "global_step": 244818, "epoch": 2023} {"train_loss": -42.05955123901367, "global_step": 244819, "epoch": 2023} {"train_loss": -41.909156799316406, "global_step": 244820, "epoch": 2023} {"train_loss": -41.67308807373047, "global_step": 244821, "epoch": 2023} {"train_loss": -41.76585006713867, "global_step": 244822, "epoch": 2023} {"train_loss": -41.265377044677734, "global_step": 244823, "epoch": 2023} {"train_loss": -42.183929443359375, "global_step": 244824, "epoch": 2023} {"train_loss": -41.29803466796875, "global_step": 244825, "epoch": 2023} {"train_loss": -42.007843017578125, "global_step": 244826, "epoch": 2023} {"train_loss": -40.27313232421875, "global_step": 244827, "epoch": 2023} {"train_loss": -41.34787368774414, "global_step": 244828, "epoch": 2023} {"train_loss": -41.70652389526367, "global_step": 244829, "epoch": 2023} {"train_loss": -40.56539535522461, "global_step": 244830, "epoch": 2023} {"train_loss": -41.983333587646484, "global_step": 244831, "epoch": 2023} {"train_loss": -39.97593307495117, "global_step": 244832, "epoch": 2023} {"train_loss": -40.607784271240234, "global_step": 244833, "epoch": 2023} {"train_loss": -41.673927307128906, "global_step": 244834, "epoch": 2023} {"train_loss": -40.458229064941406, "global_step": 244835, "epoch": 2023} {"train_loss": -42.083404541015625, "global_step": 244836, "epoch": 2023} {"train_loss": -40.875457763671875, "global_step": 244837, "epoch": 2023} {"train_loss": -42.53245162963867, "global_step": 244838, "epoch": 2023} {"train_loss": -41.22907257080078, "global_step": 244839, "epoch": 2023} {"train_loss": -42.5380859375, "global_step": 244840, "epoch": 2023} {"train_loss": -41.368892669677734, "global_step": 244841, "epoch": 2023} {"train_loss": -42.116939544677734, "global_step": 244842, "epoch": 2023} {"train_loss": -42.34403610229492, "global_step": 244843, "epoch": 2023} {"train_loss": -42.06682205200195, "global_step": 244844, "epoch": 2023} {"train_loss": -40.14854431152344, "global_step": 244845, "epoch": 2023} {"train_loss": -42.35775375366211, "global_step": 244846, "epoch": 2023} {"train_loss": -41.83053207397461, "global_step": 244847, "epoch": 2023} {"train_loss": -41.90663528442383, "global_step": 244848, "epoch": 2023} {"train_loss": -41.98225784301758, "global_step": 244849, "epoch": 2023} {"train_loss": -42.41899108886719, "global_step": 244850, "epoch": 2023} {"train_loss": -39.96819305419922, "global_step": 244851, "epoch": 2023} {"train_loss": -39.91121292114258, "global_step": 244852, "epoch": 2023} {"train_loss": -42.62786102294922, "global_step": 244853, "epoch": 2023} {"train_loss": -42.148162841796875, "global_step": 244854, "epoch": 2023} {"train_loss": -42.954185485839844, "global_step": 244855, "epoch": 2023} {"train_loss": -40.260467529296875, "global_step": 244856, "epoch": 2023} {"train_loss": -42.480751037597656, "global_step": 244857, "epoch": 2023} {"train_loss": -39.565460205078125, "global_step": 244858, "epoch": 2023} {"train_loss": -40.27348709106445, "global_step": 244859, "epoch": 2023} {"train_loss": -40.71206283569336, "global_step": 244860, "epoch": 2023} {"train_loss": -40.7736930847168, "global_step": 244861, "epoch": 2023} {"train_loss": -39.73384475708008, "global_step": 244862, "epoch": 2023} {"train_loss": -42.03461837768555, "global_step": 244863, "epoch": 2023} {"train_loss": -41.681068420410156, "global_step": 244864, "epoch": 2023} {"train_loss": -40.1678352355957, "global_step": 244865, "epoch": 2023} {"train_loss": -40.79788589477539, "global_step": 244866, "epoch": 2023} {"train_loss": -41.72675323486328, "global_step": 244867, "epoch": 2023} {"train_loss": -39.80253982543945, "global_step": 244868, "epoch": 2023} {"train_loss": -36.3840446472168, "global_step": 244869, "epoch": 2023} {"train_loss": -42.472023010253906, "global_step": 244870, "epoch": 2023} {"train_loss": -41.713409423828125, "global_step": 244871, "epoch": 2023} {"train_loss": -41.74355697631836, "global_step": 244872, "epoch": 2023} {"train_loss": -40.71126174926758, "global_step": 244873, "epoch": 2023} {"train_loss": -42.2313117980957, "global_step": 244874, "epoch": 2023} {"train_loss": -37.49280548095703, "global_step": 244875, "epoch": 2023} {"train_loss": -38.37533187866211, "global_step": 244876, "epoch": 2023} {"train_loss": -42.31464767456055, "global_step": 244877, "epoch": 2023} {"train_loss": -40.66093063354492, "global_step": 244878, "epoch": 2023} {"train_loss": -40.400691986083984, "global_step": 244879, "epoch": 2023} {"train_loss": -42.35688400268555, "global_step": 244880, "epoch": 2023} {"train_loss": -41.96482467651367, "global_step": 244881, "epoch": 2023} {"train_loss": -39.05083084106445, "global_step": 244882, "epoch": 2023} {"train_loss": -41.597023010253906, "global_step": 244883, "epoch": 2023} {"train_loss": -41.550716400146484, "global_step": 244884, "epoch": 2023} {"train_loss": -40.81505584716797, "global_step": 244885, "epoch": 2023} {"train_loss": -37.30660629272461, "global_step": 244886, "epoch": 2023} {"train_loss": -40.50138473510742, "global_step": 244887, "epoch": 2023} {"train_loss": -39.5455436706543, "global_step": 244888, "epoch": 2023} {"train_loss": -39.80118942260742, "global_step": 244889, "epoch": 2023} {"train_loss": -34.95713424682617, "global_step": 244890, "epoch": 2023} {"train_loss": -37.36420822143555, "global_step": 244891, "epoch": 2023} {"train_loss": -41.1600341796875, "global_step": 244892, "epoch": 2023} {"train_loss": -39.52521896362305, "global_step": 244893, "epoch": 2023} {"train_loss": -36.88304901123047, "global_step": 244894, "epoch": 2023} {"train_loss": -39.568302154541016, "global_step": 244895, "epoch": 2023} {"train_loss": -40.531368255615234, "global_step": 244896, "epoch": 2023} {"train_loss": -40.47269058227539, "global_step": 244897, "epoch": 2023} {"train_loss": -38.374874114990234, "global_step": 244898, "epoch": 2023} {"train_loss": -36.616432189941406, "global_step": 244899, "epoch": 2023} {"train_loss": -38.965606689453125, "global_step": 244900, "epoch": 2023} {"train_loss": -36.64823913574219, "global_step": 244901, "epoch": 2023} {"train_loss": -31.303625106811523, "global_step": 244902, "epoch": 2023} {"train_loss": -40.70813380785225, "global_step": 244903, "epoch": 2023, "val_loss": 2686853.0} {"train_loss": -39.12714767456055, "global_step": 244904, "epoch": 2024} {"train_loss": -40.52892303466797, "global_step": 244905, "epoch": 2024} {"train_loss": -33.7475700378418, "global_step": 244906, "epoch": 2024} {"train_loss": -38.05295944213867, "global_step": 244907, "epoch": 2024} {"train_loss": -38.739654541015625, "global_step": 244908, "epoch": 2024} {"train_loss": -39.056640625, "global_step": 244909, "epoch": 2024} {"train_loss": -32.90696716308594, "global_step": 244910, "epoch": 2024} {"train_loss": -38.02498245239258, "global_step": 244911, "epoch": 2024} {"train_loss": -37.27732467651367, "global_step": 244912, "epoch": 2024} {"train_loss": -39.82685852050781, "global_step": 244913, "epoch": 2024} {"train_loss": -37.753353118896484, "global_step": 244914, "epoch": 2024} {"train_loss": -35.83850860595703, "global_step": 244915, "epoch": 2024} {"train_loss": -39.43309783935547, "global_step": 244916, "epoch": 2024} {"train_loss": -39.33388900756836, "global_step": 244917, "epoch": 2024} {"train_loss": -39.09341049194336, "global_step": 244918, "epoch": 2024} {"train_loss": -39.37767791748047, "global_step": 244919, "epoch": 2024} {"train_loss": -32.20879364013672, "global_step": 244920, "epoch": 2024} {"train_loss": -38.56747055053711, "global_step": 244921, "epoch": 2024} {"train_loss": -38.58454895019531, "global_step": 244922, "epoch": 2024} {"train_loss": -40.53390121459961, "global_step": 244923, "epoch": 2024} {"train_loss": -36.65357208251953, "global_step": 244924, "epoch": 2024} {"train_loss": -38.89042282104492, "global_step": 244925, "epoch": 2024} {"train_loss": -37.78458786010742, "global_step": 244926, "epoch": 2024} {"train_loss": -39.570987701416016, "global_step": 244927, "epoch": 2024} {"train_loss": -40.15496063232422, "global_step": 244928, "epoch": 2024} {"train_loss": -38.16616439819336, "global_step": 244929, "epoch": 2024} {"train_loss": -38.750431060791016, "global_step": 244930, "epoch": 2024} {"train_loss": -38.19334030151367, "global_step": 244931, "epoch": 2024} {"train_loss": -39.16938400268555, "global_step": 244932, "epoch": 2024} {"train_loss": -39.69655990600586, "global_step": 244933, "epoch": 2024} {"train_loss": -38.8267936706543, "global_step": 244934, "epoch": 2024} {"train_loss": -38.12746047973633, "global_step": 244935, "epoch": 2024} {"train_loss": -39.58932113647461, "global_step": 244936, "epoch": 2024} {"train_loss": -40.39785385131836, "global_step": 244937, "epoch": 2024} {"train_loss": -40.818904876708984, "global_step": 244938, "epoch": 2024} {"train_loss": -40.26765823364258, "global_step": 244939, "epoch": 2024} {"train_loss": -39.13973617553711, "global_step": 244940, "epoch": 2024} {"train_loss": -40.43124008178711, "global_step": 244941, "epoch": 2024} {"train_loss": -40.656715393066406, "global_step": 244942, "epoch": 2024} {"train_loss": -39.957305908203125, "global_step": 244943, "epoch": 2024} {"train_loss": -40.97553253173828, "global_step": 244944, "epoch": 2024} {"train_loss": -41.0411376953125, "global_step": 244945, "epoch": 2024} {"train_loss": -39.81161117553711, "global_step": 244946, "epoch": 2024} {"train_loss": -39.56754684448242, "global_step": 244947, "epoch": 2024} {"train_loss": -40.957862854003906, "global_step": 244948, "epoch": 2024} {"train_loss": -39.867103576660156, "global_step": 244949, "epoch": 2024} {"train_loss": -39.633480072021484, "global_step": 244950, "epoch": 2024} {"train_loss": -40.80060577392578, "global_step": 244951, "epoch": 2024} {"train_loss": -40.30442428588867, "global_step": 244952, "epoch": 2024} {"train_loss": -40.89303207397461, "global_step": 244953, "epoch": 2024} {"train_loss": -40.24551010131836, "global_step": 244954, "epoch": 2024} {"train_loss": -40.545589447021484, "global_step": 244955, "epoch": 2024} {"train_loss": -40.49100112915039, "global_step": 244956, "epoch": 2024} {"train_loss": -40.85868453979492, "global_step": 244957, "epoch": 2024} {"train_loss": -41.1586799621582, "global_step": 244958, "epoch": 2024} {"train_loss": -41.02745819091797, "global_step": 244959, "epoch": 2024} {"train_loss": -40.23125076293945, "global_step": 244960, "epoch": 2024} {"train_loss": -41.39686965942383, "global_step": 244961, "epoch": 2024} {"train_loss": -41.177734375, "global_step": 244962, "epoch": 2024} {"train_loss": -41.08791732788086, "global_step": 244963, "epoch": 2024} {"train_loss": -39.274051666259766, "global_step": 244964, "epoch": 2024} {"train_loss": -41.334869384765625, "global_step": 244965, "epoch": 2024} {"train_loss": -41.07818603515625, "global_step": 244966, "epoch": 2024} {"train_loss": -41.550411224365234, "global_step": 244967, "epoch": 2024} {"train_loss": -41.8216552734375, "global_step": 244968, "epoch": 2024} {"train_loss": -41.20869064331055, "global_step": 244969, "epoch": 2024} {"train_loss": -41.55524826049805, "global_step": 244970, "epoch": 2024} {"train_loss": -41.26858901977539, "global_step": 244971, "epoch": 2024} {"train_loss": -41.03591537475586, "global_step": 244972, "epoch": 2024} {"train_loss": -41.10261154174805, "global_step": 244973, "epoch": 2024} {"train_loss": -41.113216400146484, "global_step": 244974, "epoch": 2024} {"train_loss": -41.13800811767578, "global_step": 244975, "epoch": 2024} {"train_loss": -42.3520393371582, "global_step": 244976, "epoch": 2024} {"train_loss": -41.10569381713867, "global_step": 244977, "epoch": 2024} {"train_loss": -41.4086799621582, "global_step": 244978, "epoch": 2024} {"train_loss": -40.38883972167969, "global_step": 244979, "epoch": 2024} {"train_loss": -41.96514892578125, "global_step": 244980, "epoch": 2024} {"train_loss": -41.12836456298828, "global_step": 244981, "epoch": 2024} {"train_loss": -41.63007736206055, "global_step": 244982, "epoch": 2024} {"train_loss": -41.673336029052734, "global_step": 244983, "epoch": 2024} {"train_loss": -41.57722854614258, "global_step": 244984, "epoch": 2024} {"train_loss": -41.72899627685547, "global_step": 244985, "epoch": 2024} {"train_loss": -41.77541732788086, "global_step": 244986, "epoch": 2024} {"train_loss": -41.88035202026367, "global_step": 244987, "epoch": 2024} {"train_loss": -41.360538482666016, "global_step": 244988, "epoch": 2024} {"train_loss": -41.81474685668945, "global_step": 244989, "epoch": 2024} {"train_loss": -41.73773956298828, "global_step": 244990, "epoch": 2024} {"train_loss": -42.2579345703125, "global_step": 244991, "epoch": 2024} {"train_loss": -41.7960319519043, "global_step": 244992, "epoch": 2024} {"train_loss": -41.64712142944336, "global_step": 244993, "epoch": 2024} {"train_loss": -41.082942962646484, "global_step": 244994, "epoch": 2024} {"train_loss": -42.552486419677734, "global_step": 244995, "epoch": 2024} {"train_loss": -40.00349807739258, "global_step": 244996, "epoch": 2024} {"train_loss": -41.56071090698242, "global_step": 244997, "epoch": 2024} {"train_loss": -41.565547943115234, "global_step": 244998, "epoch": 2024} {"train_loss": -41.24513244628906, "global_step": 244999, "epoch": 2024} {"train_loss": -41.285579681396484, "global_step": 245000, "epoch": 2024} {"train_loss": -41.97969436645508, "global_step": 245001, "epoch": 2024} {"train_loss": -41.14057540893555, "global_step": 245002, "epoch": 2024} {"train_loss": -40.74983215332031, "global_step": 245003, "epoch": 2024} {"train_loss": -42.06573486328125, "global_step": 245004, "epoch": 2024} {"train_loss": -41.80945587158203, "global_step": 245005, "epoch": 2024} {"train_loss": -41.926876068115234, "global_step": 245006, "epoch": 2024} {"train_loss": -42.161224365234375, "global_step": 245007, "epoch": 2024} {"train_loss": -42.09343719482422, "global_step": 245008, "epoch": 2024} {"train_loss": -41.24471664428711, "global_step": 245009, "epoch": 2024} {"train_loss": -40.949947357177734, "global_step": 245010, "epoch": 2024} {"train_loss": -42.02619552612305, "global_step": 245011, "epoch": 2024} {"train_loss": -40.947998046875, "global_step": 245012, "epoch": 2024} {"train_loss": -42.02035140991211, "global_step": 245013, "epoch": 2024} {"train_loss": -42.43282699584961, "global_step": 245014, "epoch": 2024} {"train_loss": -41.46200180053711, "global_step": 245015, "epoch": 2024} {"train_loss": -42.34842300415039, "global_step": 245016, "epoch": 2024} {"train_loss": -42.19308853149414, "global_step": 245017, "epoch": 2024} {"train_loss": -41.84203338623047, "global_step": 245018, "epoch": 2024} {"train_loss": -42.12936019897461, "global_step": 245019, "epoch": 2024} {"train_loss": -42.00269317626953, "global_step": 245020, "epoch": 2024} {"train_loss": -41.42926788330078, "global_step": 245021, "epoch": 2024} {"train_loss": -41.59638977050781, "global_step": 245022, "epoch": 2024} {"train_loss": -41.98575973510742, "global_step": 245023, "epoch": 2024} {"train_loss": -40.41924947943569, "global_step": 245024, "epoch": 2024, "val_loss": 2585519.0} {"train_loss": -41.74216842651367, "global_step": 245025, "epoch": 2025} {"train_loss": -42.05049514770508, "global_step": 245026, "epoch": 2025} {"train_loss": -42.590145111083984, "global_step": 245027, "epoch": 2025} {"train_loss": -42.416778564453125, "global_step": 245028, "epoch": 2025} {"train_loss": -42.30978012084961, "global_step": 245029, "epoch": 2025} {"train_loss": -41.10324478149414, "global_step": 245030, "epoch": 2025} {"train_loss": -42.78194046020508, "global_step": 245031, "epoch": 2025} {"train_loss": -42.0875129699707, "global_step": 245032, "epoch": 2025} {"train_loss": -42.756256103515625, "global_step": 245033, "epoch": 2025} {"train_loss": -42.39460372924805, "global_step": 245034, "epoch": 2025} {"train_loss": -41.816322326660156, "global_step": 245035, "epoch": 2025} {"train_loss": -42.74150848388672, "global_step": 245036, "epoch": 2025} {"train_loss": -42.47657775878906, "global_step": 245037, "epoch": 2025} {"train_loss": -42.5736198425293, "global_step": 245038, "epoch": 2025} {"train_loss": -42.481693267822266, "global_step": 245039, "epoch": 2025} {"train_loss": -41.82618713378906, "global_step": 245040, "epoch": 2025} {"train_loss": -41.523075103759766, "global_step": 245041, "epoch": 2025} {"train_loss": -42.50632858276367, "global_step": 245042, "epoch": 2025} {"train_loss": -43.30842590332031, "global_step": 245043, "epoch": 2025} {"train_loss": -42.26260757446289, "global_step": 245044, "epoch": 2025} {"train_loss": -42.466033935546875, "global_step": 245045, "epoch": 2025} {"train_loss": -42.34743881225586, "global_step": 245046, "epoch": 2025} {"train_loss": -42.450653076171875, "global_step": 245047, "epoch": 2025} {"train_loss": -42.37936019897461, "global_step": 245048, "epoch": 2025} {"train_loss": -42.05929946899414, "global_step": 245049, "epoch": 2025} {"train_loss": -42.75106430053711, "global_step": 245050, "epoch": 2025} {"train_loss": -41.7126350402832, "global_step": 245051, "epoch": 2025} {"train_loss": -41.58706283569336, "global_step": 245052, "epoch": 2025} {"train_loss": -43.0374641418457, "global_step": 245053, "epoch": 2025} {"train_loss": -42.18537139892578, "global_step": 245054, "epoch": 2025} {"train_loss": -42.164276123046875, "global_step": 245055, "epoch": 2025} {"train_loss": -41.00095748901367, "global_step": 245056, "epoch": 2025} {"train_loss": -40.52827072143555, "global_step": 245057, "epoch": 2025} {"train_loss": -39.291259765625, "global_step": 245058, "epoch": 2025} {"train_loss": -38.16823196411133, "global_step": 245059, "epoch": 2025} {"train_loss": -39.18408966064453, "global_step": 245060, "epoch": 2025} {"train_loss": -36.558380126953125, "global_step": 245061, "epoch": 2025} {"train_loss": -36.84672927856445, "global_step": 245062, "epoch": 2025} {"train_loss": -39.22200012207031, "global_step": 245063, "epoch": 2025} {"train_loss": -40.124183654785156, "global_step": 245064, "epoch": 2025} {"train_loss": -40.90324020385742, "global_step": 245065, "epoch": 2025} {"train_loss": -39.31145095825195, "global_step": 245066, "epoch": 2025} {"train_loss": -39.2328987121582, "global_step": 245067, "epoch": 2025} {"train_loss": -41.404293060302734, "global_step": 245068, "epoch": 2025} {"train_loss": -37.443214416503906, "global_step": 245069, "epoch": 2025} {"train_loss": -39.93044662475586, "global_step": 245070, "epoch": 2025} {"train_loss": -38.54346466064453, "global_step": 245071, "epoch": 2025} {"train_loss": -37.93782424926758, "global_step": 245072, "epoch": 2025} {"train_loss": -40.50979232788086, "global_step": 245073, "epoch": 2025} {"train_loss": -40.46474838256836, "global_step": 245074, "epoch": 2025} {"train_loss": -39.54459762573242, "global_step": 245075, "epoch": 2025} {"train_loss": -41.3349494934082, "global_step": 245076, "epoch": 2025} {"train_loss": -40.34070587158203, "global_step": 245077, "epoch": 2025} {"train_loss": -40.5836067199707, "global_step": 245078, "epoch": 2025} {"train_loss": -40.84735870361328, "global_step": 245079, "epoch": 2025} {"train_loss": -40.94482421875, "global_step": 245080, "epoch": 2025} {"train_loss": -40.287498474121094, "global_step": 245081, "epoch": 2025} {"train_loss": -37.31219482421875, "global_step": 245082, "epoch": 2025} {"train_loss": -40.56330108642578, "global_step": 245083, "epoch": 2025} {"train_loss": -41.08359909057617, "global_step": 245084, "epoch": 2025} {"train_loss": -40.246150970458984, "global_step": 245085, "epoch": 2025} {"train_loss": -41.58414840698242, "global_step": 245086, "epoch": 2025} {"train_loss": -40.89039993286133, "global_step": 245087, "epoch": 2025} {"train_loss": -41.29874801635742, "global_step": 245088, "epoch": 2025} {"train_loss": -40.887569427490234, "global_step": 245089, "epoch": 2025} {"train_loss": -41.76381301879883, "global_step": 245090, "epoch": 2025} {"train_loss": -41.7558708190918, "global_step": 245091, "epoch": 2025} {"train_loss": -40.87331771850586, "global_step": 245092, "epoch": 2025} {"train_loss": -41.41713333129883, "global_step": 245093, "epoch": 2025} {"train_loss": -41.8818473815918, "global_step": 245094, "epoch": 2025} {"train_loss": -41.571895599365234, "global_step": 245095, "epoch": 2025} {"train_loss": -42.2059211730957, "global_step": 245096, "epoch": 2025} {"train_loss": -41.472251892089844, "global_step": 245097, "epoch": 2025} {"train_loss": -42.14787673950195, "global_step": 245098, "epoch": 2025} {"train_loss": -41.69143295288086, "global_step": 245099, "epoch": 2025} {"train_loss": -42.24477005004883, "global_step": 245100, "epoch": 2025} {"train_loss": -42.70872497558594, "global_step": 245101, "epoch": 2025} {"train_loss": -41.83407211303711, "global_step": 245102, "epoch": 2025} {"train_loss": -42.3709602355957, "global_step": 245103, "epoch": 2025} {"train_loss": -42.18552780151367, "global_step": 245104, "epoch": 2025} {"train_loss": -42.5496940612793, "global_step": 245105, "epoch": 2025} {"train_loss": -42.47901153564453, "global_step": 245106, "epoch": 2025} {"train_loss": -42.6363639831543, "global_step": 245107, "epoch": 2025} {"train_loss": -42.703182220458984, "global_step": 245108, "epoch": 2025} {"train_loss": -42.35061264038086, "global_step": 245109, "epoch": 2025} {"train_loss": -42.54174041748047, "global_step": 245110, "epoch": 2025} {"train_loss": -42.54803466796875, "global_step": 245111, "epoch": 2025} {"train_loss": -40.99577713012695, "global_step": 245112, "epoch": 2025} {"train_loss": -42.777198791503906, "global_step": 245113, "epoch": 2025} {"train_loss": -42.06354522705078, "global_step": 245114, "epoch": 2025} {"train_loss": -42.188812255859375, "global_step": 245115, "epoch": 2025} {"train_loss": -42.516456604003906, "global_step": 245116, "epoch": 2025} {"train_loss": -42.78721237182617, "global_step": 245117, "epoch": 2025} {"train_loss": -41.47852325439453, "global_step": 245118, "epoch": 2025} {"train_loss": -42.311641693115234, "global_step": 245119, "epoch": 2025} {"train_loss": -42.370418548583984, "global_step": 245120, "epoch": 2025} {"train_loss": -42.17927932739258, "global_step": 245121, "epoch": 2025} {"train_loss": -41.85301208496094, "global_step": 245122, "epoch": 2025} {"train_loss": -41.77295684814453, "global_step": 245123, "epoch": 2025} {"train_loss": -41.55375289916992, "global_step": 245124, "epoch": 2025} {"train_loss": -42.329891204833984, "global_step": 245125, "epoch": 2025} {"train_loss": -41.684173583984375, "global_step": 245126, "epoch": 2025} {"train_loss": -41.40328598022461, "global_step": 245127, "epoch": 2025} {"train_loss": -42.94448471069336, "global_step": 245128, "epoch": 2025} {"train_loss": -41.59980392456055, "global_step": 245129, "epoch": 2025} {"train_loss": -42.80319595336914, "global_step": 245130, "epoch": 2025} {"train_loss": -42.20844268798828, "global_step": 245131, "epoch": 2025} {"train_loss": -41.423927307128906, "global_step": 245132, "epoch": 2025} {"train_loss": -42.37132263183594, "global_step": 245133, "epoch": 2025} {"train_loss": -42.75831985473633, "global_step": 245134, "epoch": 2025} {"train_loss": -42.78327178955078, "global_step": 245135, "epoch": 2025} {"train_loss": -43.06264114379883, "global_step": 245136, "epoch": 2025} {"train_loss": -41.664764404296875, "global_step": 245137, "epoch": 2025} {"train_loss": -43.00813293457031, "global_step": 245138, "epoch": 2025} {"train_loss": -41.99155044555664, "global_step": 245139, "epoch": 2025} {"train_loss": -41.91987609863281, "global_step": 245140, "epoch": 2025} {"train_loss": -42.33728790283203, "global_step": 245141, "epoch": 2025} {"train_loss": -42.10146713256836, "global_step": 245142, "epoch": 2025} {"train_loss": -42.688411712646484, "global_step": 245143, "epoch": 2025} {"train_loss": -42.62565231323242, "global_step": 245144, "epoch": 2025} {"train_loss": -41.54290475135993, "global_step": 245145, "epoch": 2025, "val_loss": 2618021.75} {"train_loss": -42.69010543823242, "global_step": 245146, "epoch": 2026} {"train_loss": -41.80147933959961, "global_step": 245147, "epoch": 2026} {"train_loss": -42.66432571411133, "global_step": 245148, "epoch": 2026} {"train_loss": -41.83510971069336, "global_step": 245149, "epoch": 2026} {"train_loss": -41.84117889404297, "global_step": 245150, "epoch": 2026} {"train_loss": -42.345829010009766, "global_step": 245151, "epoch": 2026} {"train_loss": -41.55475616455078, "global_step": 245152, "epoch": 2026} {"train_loss": -42.672298431396484, "global_step": 245153, "epoch": 2026} {"train_loss": -42.632652282714844, "global_step": 245154, "epoch": 2026} {"train_loss": -41.9211311340332, "global_step": 245155, "epoch": 2026} {"train_loss": -41.859291076660156, "global_step": 245156, "epoch": 2026} {"train_loss": -42.761146545410156, "global_step": 245157, "epoch": 2026} {"train_loss": -41.84794235229492, "global_step": 245158, "epoch": 2026} {"train_loss": -41.72564697265625, "global_step": 245159, "epoch": 2026} {"train_loss": -42.480384826660156, "global_step": 245160, "epoch": 2026} {"train_loss": -41.752777099609375, "global_step": 245161, "epoch": 2026} {"train_loss": -42.49111557006836, "global_step": 245162, "epoch": 2026} {"train_loss": -39.870330810546875, "global_step": 245163, "epoch": 2026} {"train_loss": -42.857582092285156, "global_step": 245164, "epoch": 2026} {"train_loss": -42.07792663574219, "global_step": 245165, "epoch": 2026} {"train_loss": -42.47439956665039, "global_step": 245166, "epoch": 2026} {"train_loss": -41.00709915161133, "global_step": 245167, "epoch": 2026} {"train_loss": -41.3000373840332, "global_step": 245168, "epoch": 2026} {"train_loss": -42.090572357177734, "global_step": 245169, "epoch": 2026} {"train_loss": -41.99595260620117, "global_step": 245170, "epoch": 2026} {"train_loss": -42.52571487426758, "global_step": 245171, "epoch": 2026} {"train_loss": -43.2298583984375, "global_step": 245172, "epoch": 2026} {"train_loss": -41.06135940551758, "global_step": 245173, "epoch": 2026} {"train_loss": -41.982967376708984, "global_step": 245174, "epoch": 2026} {"train_loss": -42.62758255004883, "global_step": 245175, "epoch": 2026} {"train_loss": -40.867713928222656, "global_step": 245176, "epoch": 2026} {"train_loss": -42.23104476928711, "global_step": 245177, "epoch": 2026} {"train_loss": -41.56654739379883, "global_step": 245178, "epoch": 2026} {"train_loss": -41.5376091003418, "global_step": 245179, "epoch": 2026} {"train_loss": -41.65704345703125, "global_step": 245180, "epoch": 2026} {"train_loss": -42.986629486083984, "global_step": 245181, "epoch": 2026} {"train_loss": -41.593746185302734, "global_step": 245182, "epoch": 2026} {"train_loss": -42.01749038696289, "global_step": 245183, "epoch": 2026} {"train_loss": -42.77916717529297, "global_step": 245184, "epoch": 2026} {"train_loss": -42.330726623535156, "global_step": 245185, "epoch": 2026} {"train_loss": -42.25703048706055, "global_step": 245186, "epoch": 2026} {"train_loss": -42.519500732421875, "global_step": 245187, "epoch": 2026} {"train_loss": -42.07807540893555, "global_step": 245188, "epoch": 2026} {"train_loss": -40.5152702331543, "global_step": 245189, "epoch": 2026} {"train_loss": -39.327308654785156, "global_step": 245190, "epoch": 2026} {"train_loss": -39.16876220703125, "global_step": 245191, "epoch": 2026} {"train_loss": -40.59510040283203, "global_step": 245192, "epoch": 2026} {"train_loss": -41.229793548583984, "global_step": 245193, "epoch": 2026} {"train_loss": -42.56513595581055, "global_step": 245194, "epoch": 2026} {"train_loss": -40.5260124206543, "global_step": 245195, "epoch": 2026} {"train_loss": -40.99379348754883, "global_step": 245196, "epoch": 2026} {"train_loss": -41.58872604370117, "global_step": 245197, "epoch": 2026} {"train_loss": -40.45518112182617, "global_step": 245198, "epoch": 2026} {"train_loss": -41.3499870300293, "global_step": 245199, "epoch": 2026} {"train_loss": -41.78789520263672, "global_step": 245200, "epoch": 2026} {"train_loss": -40.36014938354492, "global_step": 245201, "epoch": 2026} {"train_loss": -41.47817611694336, "global_step": 245202, "epoch": 2026} {"train_loss": -40.21308517456055, "global_step": 245203, "epoch": 2026} {"train_loss": -42.0876579284668, "global_step": 245204, "epoch": 2026} {"train_loss": -42.53358459472656, "global_step": 245205, "epoch": 2026} {"train_loss": -41.20123291015625, "global_step": 245206, "epoch": 2026} {"train_loss": -42.81429672241211, "global_step": 245207, "epoch": 2026} {"train_loss": -42.455257415771484, "global_step": 245208, "epoch": 2026} {"train_loss": -42.009220123291016, "global_step": 245209, "epoch": 2026} {"train_loss": -42.92267990112305, "global_step": 245210, "epoch": 2026} {"train_loss": -42.32581329345703, "global_step": 245211, "epoch": 2026} {"train_loss": -42.20778274536133, "global_step": 245212, "epoch": 2026} {"train_loss": -42.69637680053711, "global_step": 245213, "epoch": 2026} {"train_loss": -42.85609817504883, "global_step": 245214, "epoch": 2026} {"train_loss": -42.9111213684082, "global_step": 245215, "epoch": 2026} {"train_loss": -42.58953094482422, "global_step": 245216, "epoch": 2026} {"train_loss": -42.33647537231445, "global_step": 245217, "epoch": 2026} {"train_loss": -42.838539123535156, "global_step": 245218, "epoch": 2026} {"train_loss": -42.56394577026367, "global_step": 245219, "epoch": 2026} {"train_loss": -42.802303314208984, "global_step": 245220, "epoch": 2026} {"train_loss": -43.04221725463867, "global_step": 245221, "epoch": 2026} {"train_loss": -42.42069625854492, "global_step": 245222, "epoch": 2026} {"train_loss": -42.27457809448242, "global_step": 245223, "epoch": 2026} {"train_loss": -42.38433074951172, "global_step": 245224, "epoch": 2026} {"train_loss": -43.1495246887207, "global_step": 245225, "epoch": 2026} {"train_loss": -43.17496871948242, "global_step": 245226, "epoch": 2026} {"train_loss": -42.89748764038086, "global_step": 245227, "epoch": 2026} {"train_loss": -43.006744384765625, "global_step": 245228, "epoch": 2026} {"train_loss": -43.21088409423828, "global_step": 245229, "epoch": 2026} {"train_loss": -42.85357666015625, "global_step": 245230, "epoch": 2026} {"train_loss": -42.949581146240234, "global_step": 245231, "epoch": 2026} {"train_loss": -42.976951599121094, "global_step": 245232, "epoch": 2026} {"train_loss": -42.4521484375, "global_step": 245233, "epoch": 2026} {"train_loss": -43.65080642700195, "global_step": 245234, "epoch": 2026} {"train_loss": -42.83523178100586, "global_step": 245235, "epoch": 2026} {"train_loss": -43.06614303588867, "global_step": 245236, "epoch": 2026} {"train_loss": -42.520015716552734, "global_step": 245237, "epoch": 2026} {"train_loss": -42.58803939819336, "global_step": 245238, "epoch": 2026} {"train_loss": -43.43367004394531, "global_step": 245239, "epoch": 2026} {"train_loss": -43.24131393432617, "global_step": 245240, "epoch": 2026} {"train_loss": -43.282318115234375, "global_step": 245241, "epoch": 2026} {"train_loss": -42.50884246826172, "global_step": 245242, "epoch": 2026} {"train_loss": -43.34892654418945, "global_step": 245243, "epoch": 2026} {"train_loss": -42.48574447631836, "global_step": 245244, "epoch": 2026} {"train_loss": -42.612728118896484, "global_step": 245245, "epoch": 2026} {"train_loss": -41.763702392578125, "global_step": 245246, "epoch": 2026} {"train_loss": -41.42412567138672, "global_step": 245247, "epoch": 2026} {"train_loss": -42.35451126098633, "global_step": 245248, "epoch": 2026} {"train_loss": -42.7196044921875, "global_step": 245249, "epoch": 2026} {"train_loss": -43.04572296142578, "global_step": 245250, "epoch": 2026} {"train_loss": -42.611019134521484, "global_step": 245251, "epoch": 2026} {"train_loss": -42.2420654296875, "global_step": 245252, "epoch": 2026} {"train_loss": -43.338279724121094, "global_step": 245253, "epoch": 2026} {"train_loss": -43.33308029174805, "global_step": 245254, "epoch": 2026} {"train_loss": -42.885467529296875, "global_step": 245255, "epoch": 2026} {"train_loss": -42.84536361694336, "global_step": 245256, "epoch": 2026} {"train_loss": -43.196720123291016, "global_step": 245257, "epoch": 2026} {"train_loss": -42.908687591552734, "global_step": 245258, "epoch": 2026} {"train_loss": -41.48963928222656, "global_step": 245259, "epoch": 2026} {"train_loss": -42.06421661376953, "global_step": 245260, "epoch": 2026} {"train_loss": -42.630340576171875, "global_step": 245261, "epoch": 2026} {"train_loss": -43.09220504760742, "global_step": 245262, "epoch": 2026} {"train_loss": -42.11915969848633, "global_step": 245263, "epoch": 2026} {"train_loss": -42.78206253051758, "global_step": 245264, "epoch": 2026} {"train_loss": -42.267208099365234, "global_step": 245265, "epoch": 2026} {"train_loss": -42.21940291223447, "global_step": 245266, "epoch": 2026, "val_loss": 2565213.75} {"train_loss": -42.35341262817383, "global_step": 245267, "epoch": 2027} {"train_loss": -41.604217529296875, "global_step": 245268, "epoch": 2027} {"train_loss": -41.70164108276367, "global_step": 245269, "epoch": 2027} {"train_loss": -40.844722747802734, "global_step": 245270, "epoch": 2027} {"train_loss": -41.97037887573242, "global_step": 245271, "epoch": 2027} {"train_loss": -41.789493560791016, "global_step": 245272, "epoch": 2027} {"train_loss": -42.46788787841797, "global_step": 245273, "epoch": 2027} {"train_loss": -41.27585983276367, "global_step": 245274, "epoch": 2027} {"train_loss": -38.913658142089844, "global_step": 245275, "epoch": 2027} {"train_loss": -38.69892120361328, "global_step": 245276, "epoch": 2027} {"train_loss": -40.451080322265625, "global_step": 245277, "epoch": 2027} {"train_loss": -42.13496017456055, "global_step": 245278, "epoch": 2027} {"train_loss": -40.60063934326172, "global_step": 245279, "epoch": 2027} {"train_loss": -40.20023727416992, "global_step": 245280, "epoch": 2027} {"train_loss": -40.12287139892578, "global_step": 245281, "epoch": 2027} {"train_loss": -42.50699996948242, "global_step": 245282, "epoch": 2027} {"train_loss": -41.631282806396484, "global_step": 245283, "epoch": 2027} {"train_loss": -40.9263916015625, "global_step": 245284, "epoch": 2027} {"train_loss": -40.64935302734375, "global_step": 245285, "epoch": 2027} {"train_loss": -39.35929489135742, "global_step": 245286, "epoch": 2027} {"train_loss": -40.14936447143555, "global_step": 245287, "epoch": 2027} {"train_loss": -40.4886360168457, "global_step": 245288, "epoch": 2027} {"train_loss": -39.90388107299805, "global_step": 245289, "epoch": 2027} {"train_loss": -38.65003967285156, "global_step": 245290, "epoch": 2027} {"train_loss": -40.750328063964844, "global_step": 245291, "epoch": 2027} {"train_loss": -41.7653694152832, "global_step": 245292, "epoch": 2027} {"train_loss": -41.23101806640625, "global_step": 245293, "epoch": 2027} {"train_loss": -41.01698303222656, "global_step": 245294, "epoch": 2027} {"train_loss": -41.67133331298828, "global_step": 245295, "epoch": 2027} {"train_loss": -42.38700485229492, "global_step": 245296, "epoch": 2027} {"train_loss": -41.91082763671875, "global_step": 245297, "epoch": 2027} {"train_loss": -42.908260345458984, "global_step": 245298, "epoch": 2027} {"train_loss": -42.81576156616211, "global_step": 245299, "epoch": 2027} {"train_loss": -42.82121658325195, "global_step": 245300, "epoch": 2027} {"train_loss": -42.927608489990234, "global_step": 245301, "epoch": 2027} {"train_loss": -42.25178146362305, "global_step": 245302, "epoch": 2027} {"train_loss": -41.76426696777344, "global_step": 245303, "epoch": 2027} {"train_loss": -42.61158752441406, "global_step": 245304, "epoch": 2027} {"train_loss": -42.26738357543945, "global_step": 245305, "epoch": 2027} {"train_loss": -41.29740905761719, "global_step": 245306, "epoch": 2027} {"train_loss": -42.59475326538086, "global_step": 245307, "epoch": 2027} {"train_loss": -41.803802490234375, "global_step": 245308, "epoch": 2027} {"train_loss": -41.41340255737305, "global_step": 245309, "epoch": 2027} {"train_loss": -42.62554931640625, "global_step": 245310, "epoch": 2027} {"train_loss": -42.05662155151367, "global_step": 245311, "epoch": 2027} {"train_loss": -41.91274642944336, "global_step": 245312, "epoch": 2027} {"train_loss": -42.49626541137695, "global_step": 245313, "epoch": 2027} {"train_loss": -40.62963104248047, "global_step": 245314, "epoch": 2027} {"train_loss": -41.9513053894043, "global_step": 245315, "epoch": 2027} {"train_loss": -41.25550079345703, "global_step": 245316, "epoch": 2027} {"train_loss": -40.7443733215332, "global_step": 245317, "epoch": 2027} {"train_loss": -41.73830032348633, "global_step": 245318, "epoch": 2027} {"train_loss": -41.31935501098633, "global_step": 245319, "epoch": 2027} {"train_loss": -42.1944694519043, "global_step": 245320, "epoch": 2027} {"train_loss": -42.00913619995117, "global_step": 245321, "epoch": 2027} {"train_loss": -41.3610725402832, "global_step": 245322, "epoch": 2027} {"train_loss": -42.608314514160156, "global_step": 245323, "epoch": 2027} {"train_loss": -41.961280822753906, "global_step": 245324, "epoch": 2027} {"train_loss": -42.0539436340332, "global_step": 245325, "epoch": 2027} {"train_loss": -42.55436325073242, "global_step": 245326, "epoch": 2027} {"train_loss": -41.76667022705078, "global_step": 245327, "epoch": 2027} {"train_loss": -42.651851654052734, "global_step": 245328, "epoch": 2027} {"train_loss": -41.25355529785156, "global_step": 245329, "epoch": 2027} {"train_loss": -42.67063903808594, "global_step": 245330, "epoch": 2027} {"train_loss": -42.81193161010742, "global_step": 245331, "epoch": 2027} {"train_loss": -42.59156036376953, "global_step": 245332, "epoch": 2027} {"train_loss": -42.530372619628906, "global_step": 245333, "epoch": 2027} {"train_loss": -42.945858001708984, "global_step": 245334, "epoch": 2027} {"train_loss": -42.768287658691406, "global_step": 245335, "epoch": 2027} {"train_loss": -42.6722297668457, "global_step": 245336, "epoch": 2027} {"train_loss": -42.63479232788086, "global_step": 245337, "epoch": 2027} {"train_loss": -42.72884750366211, "global_step": 245338, "epoch": 2027} {"train_loss": -43.20327377319336, "global_step": 245339, "epoch": 2027} {"train_loss": -42.94908142089844, "global_step": 245340, "epoch": 2027} {"train_loss": -42.85244369506836, "global_step": 245341, "epoch": 2027} {"train_loss": -42.80929183959961, "global_step": 245342, "epoch": 2027} {"train_loss": -42.92493438720703, "global_step": 245343, "epoch": 2027} {"train_loss": -43.27863311767578, "global_step": 245344, "epoch": 2027} {"train_loss": -42.239532470703125, "global_step": 245345, "epoch": 2027} {"train_loss": -43.22909927368164, "global_step": 245346, "epoch": 2027} {"train_loss": -43.33253860473633, "global_step": 245347, "epoch": 2027} {"train_loss": -42.40568542480469, "global_step": 245348, "epoch": 2027} {"train_loss": -42.253379821777344, "global_step": 245349, "epoch": 2027} {"train_loss": -41.13703155517578, "global_step": 245350, "epoch": 2027} {"train_loss": -43.074459075927734, "global_step": 245351, "epoch": 2027} {"train_loss": -40.250160217285156, "global_step": 245352, "epoch": 2027} {"train_loss": -42.75960922241211, "global_step": 245353, "epoch": 2027} {"train_loss": -42.8823356628418, "global_step": 245354, "epoch": 2027} {"train_loss": -43.40316390991211, "global_step": 245355, "epoch": 2027} {"train_loss": -43.21845626831055, "global_step": 245356, "epoch": 2027} {"train_loss": -42.83858871459961, "global_step": 245357, "epoch": 2027} {"train_loss": -42.9835205078125, "global_step": 245358, "epoch": 2027} {"train_loss": -42.7228889465332, "global_step": 245359, "epoch": 2027} {"train_loss": -43.329254150390625, "global_step": 245360, "epoch": 2027} {"train_loss": -43.3427734375, "global_step": 245361, "epoch": 2027} {"train_loss": -43.38899612426758, "global_step": 245362, "epoch": 2027} {"train_loss": -43.18963623046875, "global_step": 245363, "epoch": 2027} {"train_loss": -42.64809799194336, "global_step": 245364, "epoch": 2027} {"train_loss": -39.93220520019531, "global_step": 245365, "epoch": 2027} {"train_loss": -42.61098861694336, "global_step": 245366, "epoch": 2027} {"train_loss": -42.945960998535156, "global_step": 245367, "epoch": 2027} {"train_loss": -42.467628479003906, "global_step": 245368, "epoch": 2027} {"train_loss": -42.45316696166992, "global_step": 245369, "epoch": 2027} {"train_loss": -40.984249114990234, "global_step": 245370, "epoch": 2027} {"train_loss": -38.11288070678711, "global_step": 245371, "epoch": 2027} {"train_loss": -35.32072830200195, "global_step": 245372, "epoch": 2027} {"train_loss": -30.79178810119629, "global_step": 245373, "epoch": 2027} {"train_loss": -36.74443435668945, "global_step": 245374, "epoch": 2027} {"train_loss": -41.099647521972656, "global_step": 245375, "epoch": 2027} {"train_loss": -40.75666427612305, "global_step": 245376, "epoch": 2027} {"train_loss": -39.33417510986328, "global_step": 245377, "epoch": 2027} {"train_loss": -40.66944122314453, "global_step": 245378, "epoch": 2027} {"train_loss": -41.608089447021484, "global_step": 245379, "epoch": 2027} {"train_loss": -38.4870719909668, "global_step": 245380, "epoch": 2027} {"train_loss": -40.07930374145508, "global_step": 245381, "epoch": 2027} {"train_loss": -41.43414306640625, "global_step": 245382, "epoch": 2027} {"train_loss": -40.32646942138672, "global_step": 245383, "epoch": 2027} {"train_loss": -42.32986068725586, "global_step": 245384, "epoch": 2027} {"train_loss": -41.20094680786133, "global_step": 245385, "epoch": 2027} {"train_loss": -40.76346206665039, "global_step": 245386, "epoch": 2027} {"train_loss": -41.59672491215477, "global_step": 245387, "epoch": 2027, "val_loss": 2525303.5} {"train_loss": -40.474788665771484, "global_step": 245388, "epoch": 2028} {"train_loss": -41.43027877807617, "global_step": 245389, "epoch": 2028} {"train_loss": -40.61638641357422, "global_step": 245390, "epoch": 2028} {"train_loss": -42.08171081542969, "global_step": 245391, "epoch": 2028} {"train_loss": -39.88212203979492, "global_step": 245392, "epoch": 2028} {"train_loss": -42.26682662963867, "global_step": 245393, "epoch": 2028} {"train_loss": -41.84786605834961, "global_step": 245394, "epoch": 2028} {"train_loss": -41.52535629272461, "global_step": 245395, "epoch": 2028} {"train_loss": -41.845943450927734, "global_step": 245396, "epoch": 2028} {"train_loss": -40.615421295166016, "global_step": 245397, "epoch": 2028} {"train_loss": -39.66053771972656, "global_step": 245398, "epoch": 2028} {"train_loss": -40.20229721069336, "global_step": 245399, "epoch": 2028} {"train_loss": -42.293941497802734, "global_step": 245400, "epoch": 2028} {"train_loss": -39.45695114135742, "global_step": 245401, "epoch": 2028} {"train_loss": -40.72520065307617, "global_step": 245402, "epoch": 2028} {"train_loss": -41.1639404296875, "global_step": 245403, "epoch": 2028} {"train_loss": -32.32023239135742, "global_step": 245404, "epoch": 2028} {"train_loss": -41.45144271850586, "global_step": 245405, "epoch": 2028} {"train_loss": -37.88065719604492, "global_step": 245406, "epoch": 2028} {"train_loss": -34.28691482543945, "global_step": 245407, "epoch": 2028} {"train_loss": -38.77291488647461, "global_step": 245408, "epoch": 2028} {"train_loss": -37.22062301635742, "global_step": 245409, "epoch": 2028} {"train_loss": -36.325618743896484, "global_step": 245410, "epoch": 2028} {"train_loss": -37.76957321166992, "global_step": 245411, "epoch": 2028} {"train_loss": -37.81110763549805, "global_step": 245412, "epoch": 2028} {"train_loss": -32.17008590698242, "global_step": 245413, "epoch": 2028} {"train_loss": -29.88953971862793, "global_step": 245414, "epoch": 2028} {"train_loss": -38.2870979309082, "global_step": 245415, "epoch": 2028} {"train_loss": -36.03190231323242, "global_step": 245416, "epoch": 2028} {"train_loss": -34.73552322387695, "global_step": 245417, "epoch": 2028} {"train_loss": -36.23818588256836, "global_step": 245418, "epoch": 2028} {"train_loss": -37.77888870239258, "global_step": 245419, "epoch": 2028} {"train_loss": -36.399452209472656, "global_step": 245420, "epoch": 2028} {"train_loss": -38.205528259277344, "global_step": 245421, "epoch": 2028} {"train_loss": -36.628173828125, "global_step": 245422, "epoch": 2028} {"train_loss": -38.113094329833984, "global_step": 245423, "epoch": 2028} {"train_loss": -37.76835250854492, "global_step": 245424, "epoch": 2028} {"train_loss": -40.00480270385742, "global_step": 245425, "epoch": 2028} {"train_loss": -39.28935241699219, "global_step": 245426, "epoch": 2028} {"train_loss": -38.84757614135742, "global_step": 245427, "epoch": 2028} {"train_loss": -37.648799896240234, "global_step": 245428, "epoch": 2028} {"train_loss": -39.05690383911133, "global_step": 245429, "epoch": 2028} {"train_loss": -38.71882247924805, "global_step": 245430, "epoch": 2028} {"train_loss": -39.92522048950195, "global_step": 245431, "epoch": 2028} {"train_loss": -40.0806884765625, "global_step": 245432, "epoch": 2028} {"train_loss": -37.312744140625, "global_step": 245433, "epoch": 2028} {"train_loss": -40.22841262817383, "global_step": 245434, "epoch": 2028} {"train_loss": -40.30520248413086, "global_step": 245435, "epoch": 2028} {"train_loss": -37.636505126953125, "global_step": 245436, "epoch": 2028} {"train_loss": -38.7394905090332, "global_step": 245437, "epoch": 2028} {"train_loss": -40.714969635009766, "global_step": 245438, "epoch": 2028} {"train_loss": -40.7547721862793, "global_step": 245439, "epoch": 2028} {"train_loss": -39.93770217895508, "global_step": 245440, "epoch": 2028} {"train_loss": -40.13008117675781, "global_step": 245441, "epoch": 2028} {"train_loss": -40.468040466308594, "global_step": 245442, "epoch": 2028} {"train_loss": -40.962520599365234, "global_step": 245443, "epoch": 2028} {"train_loss": -40.64085388183594, "global_step": 245444, "epoch": 2028} {"train_loss": -40.11454772949219, "global_step": 245445, "epoch": 2028} {"train_loss": -41.04291534423828, "global_step": 245446, "epoch": 2028} {"train_loss": -41.91917037963867, "global_step": 245447, "epoch": 2028} {"train_loss": -38.848209381103516, "global_step": 245448, "epoch": 2028} {"train_loss": -40.10852813720703, "global_step": 245449, "epoch": 2028} {"train_loss": -39.997989654541016, "global_step": 245450, "epoch": 2028} {"train_loss": -41.58351516723633, "global_step": 245451, "epoch": 2028} {"train_loss": -41.19136428833008, "global_step": 245452, "epoch": 2028} {"train_loss": -40.727996826171875, "global_step": 245453, "epoch": 2028} {"train_loss": -41.09295654296875, "global_step": 245454, "epoch": 2028} {"train_loss": -41.58197021484375, "global_step": 245455, "epoch": 2028} {"train_loss": -40.4218635559082, "global_step": 245456, "epoch": 2028} {"train_loss": -41.169151306152344, "global_step": 245457, "epoch": 2028} {"train_loss": -41.18413162231445, "global_step": 245458, "epoch": 2028} {"train_loss": -41.93667984008789, "global_step": 245459, "epoch": 2028} {"train_loss": -41.618831634521484, "global_step": 245460, "epoch": 2028} {"train_loss": -41.410499572753906, "global_step": 245461, "epoch": 2028} {"train_loss": -41.08750534057617, "global_step": 245462, "epoch": 2028} {"train_loss": -40.86210632324219, "global_step": 245463, "epoch": 2028} {"train_loss": -41.696128845214844, "global_step": 245464, "epoch": 2028} {"train_loss": -41.78693771362305, "global_step": 245465, "epoch": 2028} {"train_loss": -41.66206359863281, "global_step": 245466, "epoch": 2028} {"train_loss": -41.108367919921875, "global_step": 245467, "epoch": 2028} {"train_loss": -41.40312576293945, "global_step": 245468, "epoch": 2028} {"train_loss": -41.37398910522461, "global_step": 245469, "epoch": 2028} {"train_loss": -41.14789962768555, "global_step": 245470, "epoch": 2028} {"train_loss": -42.068084716796875, "global_step": 245471, "epoch": 2028} {"train_loss": -41.841949462890625, "global_step": 245472, "epoch": 2028} {"train_loss": -42.4322624206543, "global_step": 245473, "epoch": 2028} {"train_loss": -41.98611068725586, "global_step": 245474, "epoch": 2028} {"train_loss": -42.04159927368164, "global_step": 245475, "epoch": 2028} {"train_loss": -42.132076263427734, "global_step": 245476, "epoch": 2028} {"train_loss": -41.70547103881836, "global_step": 245477, "epoch": 2028} {"train_loss": -41.98876953125, "global_step": 245478, "epoch": 2028} {"train_loss": -41.72007751464844, "global_step": 245479, "epoch": 2028} {"train_loss": -42.317745208740234, "global_step": 245480, "epoch": 2028} {"train_loss": -42.1100959777832, "global_step": 245481, "epoch": 2028} {"train_loss": -41.96753692626953, "global_step": 245482, "epoch": 2028} {"train_loss": -41.27043533325195, "global_step": 245483, "epoch": 2028} {"train_loss": -41.47675323486328, "global_step": 245484, "epoch": 2028} {"train_loss": -41.56433868408203, "global_step": 245485, "epoch": 2028} {"train_loss": -39.78889846801758, "global_step": 245486, "epoch": 2028} {"train_loss": -41.872283935546875, "global_step": 245487, "epoch": 2028} {"train_loss": -42.50847244262695, "global_step": 245488, "epoch": 2028} {"train_loss": -41.6268424987793, "global_step": 245489, "epoch": 2028} {"train_loss": -42.90598678588867, "global_step": 245490, "epoch": 2028} {"train_loss": -42.75324630737305, "global_step": 245491, "epoch": 2028} {"train_loss": -41.992034912109375, "global_step": 245492, "epoch": 2028} {"train_loss": -42.13161849975586, "global_step": 245493, "epoch": 2028} {"train_loss": -42.398380279541016, "global_step": 245494, "epoch": 2028} {"train_loss": -42.330806732177734, "global_step": 245495, "epoch": 2028} {"train_loss": -42.33527755737305, "global_step": 245496, "epoch": 2028} {"train_loss": -41.262943267822266, "global_step": 245497, "epoch": 2028} {"train_loss": -42.206382751464844, "global_step": 245498, "epoch": 2028} {"train_loss": -41.576839447021484, "global_step": 245499, "epoch": 2028} {"train_loss": -41.993255615234375, "global_step": 245500, "epoch": 2028} {"train_loss": -40.0922737121582, "global_step": 245501, "epoch": 2028} {"train_loss": -42.84357452392578, "global_step": 245502, "epoch": 2028} {"train_loss": -41.905860900878906, "global_step": 245503, "epoch": 2028} {"train_loss": -42.639892578125, "global_step": 245504, "epoch": 2028} {"train_loss": -42.304115295410156, "global_step": 245505, "epoch": 2028} {"train_loss": -41.36581039428711, "global_step": 245506, "epoch": 2028} {"train_loss": -42.62836456298828, "global_step": 245507, "epoch": 2028} {"train_loss": -40.301324024673335, "global_step": 245508, "epoch": 2028, "val_loss": 2654601.0} {"train_loss": -42.13892364501953, "global_step": 245509, "epoch": 2029} {"train_loss": -42.435428619384766, "global_step": 245510, "epoch": 2029} {"train_loss": -42.04643630981445, "global_step": 245511, "epoch": 2029} {"train_loss": -43.115013122558594, "global_step": 245512, "epoch": 2029} {"train_loss": -42.81130599975586, "global_step": 245513, "epoch": 2029} {"train_loss": -41.443885803222656, "global_step": 245514, "epoch": 2029} {"train_loss": -42.60431671142578, "global_step": 245515, "epoch": 2029} {"train_loss": -43.10683822631836, "global_step": 245516, "epoch": 2029} {"train_loss": -42.76839828491211, "global_step": 245517, "epoch": 2029} {"train_loss": -42.549861907958984, "global_step": 245518, "epoch": 2029} {"train_loss": -42.59831237792969, "global_step": 245519, "epoch": 2029} {"train_loss": -42.4914665222168, "global_step": 245520, "epoch": 2029} {"train_loss": -42.62454605102539, "global_step": 245521, "epoch": 2029} {"train_loss": -42.377098083496094, "global_step": 245522, "epoch": 2029} {"train_loss": -42.35020446777344, "global_step": 245523, "epoch": 2029} {"train_loss": -42.873046875, "global_step": 245524, "epoch": 2029} {"train_loss": -42.88094711303711, "global_step": 245525, "epoch": 2029} {"train_loss": -42.558589935302734, "global_step": 245526, "epoch": 2029} {"train_loss": -42.9000358581543, "global_step": 245527, "epoch": 2029} {"train_loss": -42.88143539428711, "global_step": 245528, "epoch": 2029} {"train_loss": -42.794776916503906, "global_step": 245529, "epoch": 2029} {"train_loss": -43.1485595703125, "global_step": 245530, "epoch": 2029} {"train_loss": -43.45850372314453, "global_step": 245531, "epoch": 2029} {"train_loss": -41.8045539855957, "global_step": 245532, "epoch": 2029} {"train_loss": -42.720619201660156, "global_step": 245533, "epoch": 2029} {"train_loss": -39.825679779052734, "global_step": 245534, "epoch": 2029} {"train_loss": -40.66252899169922, "global_step": 245535, "epoch": 2029} {"train_loss": -42.006263732910156, "global_step": 245536, "epoch": 2029} {"train_loss": -38.7075080871582, "global_step": 245537, "epoch": 2029} {"train_loss": -40.332252502441406, "global_step": 245538, "epoch": 2029} {"train_loss": -37.2660026550293, "global_step": 245539, "epoch": 2029} {"train_loss": -42.19919967651367, "global_step": 245540, "epoch": 2029} {"train_loss": -42.618202209472656, "global_step": 245541, "epoch": 2029} {"train_loss": -38.69559860229492, "global_step": 245542, "epoch": 2029} {"train_loss": -39.71567916870117, "global_step": 245543, "epoch": 2029} {"train_loss": -40.59672546386719, "global_step": 245544, "epoch": 2029} {"train_loss": -41.066009521484375, "global_step": 245545, "epoch": 2029} {"train_loss": -41.977386474609375, "global_step": 245546, "epoch": 2029} {"train_loss": -39.64802932739258, "global_step": 245547, "epoch": 2029} {"train_loss": -41.2479362487793, "global_step": 245548, "epoch": 2029} {"train_loss": -42.45636749267578, "global_step": 245549, "epoch": 2029} {"train_loss": -40.04648208618164, "global_step": 245550, "epoch": 2029} {"train_loss": -40.007896423339844, "global_step": 245551, "epoch": 2029} {"train_loss": -39.669490814208984, "global_step": 245552, "epoch": 2029} {"train_loss": -42.2729606628418, "global_step": 245553, "epoch": 2029} {"train_loss": -39.86423873901367, "global_step": 245554, "epoch": 2029} {"train_loss": -38.47099685668945, "global_step": 245555, "epoch": 2029} {"train_loss": -39.88216018676758, "global_step": 245556, "epoch": 2029} {"train_loss": -41.23111343383789, "global_step": 245557, "epoch": 2029} {"train_loss": -41.06218338012695, "global_step": 245558, "epoch": 2029} {"train_loss": -38.02974319458008, "global_step": 245559, "epoch": 2029} {"train_loss": -39.62628936767578, "global_step": 245560, "epoch": 2029} {"train_loss": -38.2100944519043, "global_step": 245561, "epoch": 2029} {"train_loss": -36.23249435424805, "global_step": 245562, "epoch": 2029} {"train_loss": -38.86345291137695, "global_step": 245563, "epoch": 2029} {"train_loss": -38.22874069213867, "global_step": 245564, "epoch": 2029} {"train_loss": -40.83548355102539, "global_step": 245565, "epoch": 2029} {"train_loss": -39.162227630615234, "global_step": 245566, "epoch": 2029} {"train_loss": -38.94104766845703, "global_step": 245567, "epoch": 2029} {"train_loss": -39.27073669433594, "global_step": 245568, "epoch": 2029} {"train_loss": -37.15095901489258, "global_step": 245569, "epoch": 2029} {"train_loss": -39.96561813354492, "global_step": 245570, "epoch": 2029} {"train_loss": -38.58613586425781, "global_step": 245571, "epoch": 2029} {"train_loss": -38.95547103881836, "global_step": 245572, "epoch": 2029} {"train_loss": -38.75716781616211, "global_step": 245573, "epoch": 2029} {"train_loss": -37.220123291015625, "global_step": 245574, "epoch": 2029} {"train_loss": -39.3718376159668, "global_step": 245575, "epoch": 2029} {"train_loss": -40.893348693847656, "global_step": 245576, "epoch": 2029} {"train_loss": -39.23661422729492, "global_step": 245577, "epoch": 2029} {"train_loss": -41.491554260253906, "global_step": 245578, "epoch": 2029} {"train_loss": -40.14155960083008, "global_step": 245579, "epoch": 2029} {"train_loss": -39.424312591552734, "global_step": 245580, "epoch": 2029} {"train_loss": -40.264461517333984, "global_step": 245581, "epoch": 2029} {"train_loss": -39.89768600463867, "global_step": 245582, "epoch": 2029} {"train_loss": -41.61150360107422, "global_step": 245583, "epoch": 2029} {"train_loss": -38.493648529052734, "global_step": 245584, "epoch": 2029} {"train_loss": -40.986244201660156, "global_step": 245585, "epoch": 2029} {"train_loss": -40.272037506103516, "global_step": 245586, "epoch": 2029} {"train_loss": -40.58897018432617, "global_step": 245587, "epoch": 2029} {"train_loss": -41.06999969482422, "global_step": 245588, "epoch": 2029} {"train_loss": -40.62401580810547, "global_step": 245589, "epoch": 2029} {"train_loss": -41.46305847167969, "global_step": 245590, "epoch": 2029} {"train_loss": -41.3245735168457, "global_step": 245591, "epoch": 2029} {"train_loss": -40.130672454833984, "global_step": 245592, "epoch": 2029} {"train_loss": -40.63330841064453, "global_step": 245593, "epoch": 2029} {"train_loss": -41.455074310302734, "global_step": 245594, "epoch": 2029} {"train_loss": -41.29955291748047, "global_step": 245595, "epoch": 2029} {"train_loss": -41.91073989868164, "global_step": 245596, "epoch": 2029} {"train_loss": -41.77016067504883, "global_step": 245597, "epoch": 2029} {"train_loss": -41.4145622253418, "global_step": 245598, "epoch": 2029} {"train_loss": -41.90347671508789, "global_step": 245599, "epoch": 2029} {"train_loss": -41.32780075073242, "global_step": 245600, "epoch": 2029} {"train_loss": -41.25571823120117, "global_step": 245601, "epoch": 2029} {"train_loss": -40.926666259765625, "global_step": 245602, "epoch": 2029} {"train_loss": -41.969383239746094, "global_step": 245603, "epoch": 2029} {"train_loss": -41.35123062133789, "global_step": 245604, "epoch": 2029} {"train_loss": -41.6975212097168, "global_step": 245605, "epoch": 2029} {"train_loss": -41.50031280517578, "global_step": 245606, "epoch": 2029} {"train_loss": -41.89201736450195, "global_step": 245607, "epoch": 2029} {"train_loss": -41.74233627319336, "global_step": 245608, "epoch": 2029} {"train_loss": -41.31061553955078, "global_step": 245609, "epoch": 2029} {"train_loss": -42.138240814208984, "global_step": 245610, "epoch": 2029} {"train_loss": -41.82014083862305, "global_step": 245611, "epoch": 2029} {"train_loss": -41.79201889038086, "global_step": 245612, "epoch": 2029} {"train_loss": -41.88322830200195, "global_step": 245613, "epoch": 2029} {"train_loss": -42.35005569458008, "global_step": 245614, "epoch": 2029} {"train_loss": -42.341102600097656, "global_step": 245615, "epoch": 2029} {"train_loss": -40.69582748413086, "global_step": 245616, "epoch": 2029} {"train_loss": -41.482383728027344, "global_step": 245617, "epoch": 2029} {"train_loss": -41.215728759765625, "global_step": 245618, "epoch": 2029} {"train_loss": -42.528053283691406, "global_step": 245619, "epoch": 2029} {"train_loss": -42.508785247802734, "global_step": 245620, "epoch": 2029} {"train_loss": -41.837406158447266, "global_step": 245621, "epoch": 2029} {"train_loss": -42.168800354003906, "global_step": 245622, "epoch": 2029} {"train_loss": -42.78290939331055, "global_step": 245623, "epoch": 2029} {"train_loss": -40.89013671875, "global_step": 245624, "epoch": 2029} {"train_loss": -42.07723617553711, "global_step": 245625, "epoch": 2029} {"train_loss": -41.43450164794922, "global_step": 245626, "epoch": 2029} {"train_loss": -42.580970764160156, "global_step": 245627, "epoch": 2029} {"train_loss": -42.543209075927734, "global_step": 245628, "epoch": 2029} {"train_loss": -41.049777227984976, "global_step": 245629, "epoch": 2029, "val_loss": 2572266.0} {"train_loss": -42.50395584106445, "global_step": 245630, "epoch": 2030} {"train_loss": -42.14514923095703, "global_step": 245631, "epoch": 2030} {"train_loss": -42.08684539794922, "global_step": 245632, "epoch": 2030} {"train_loss": -42.962615966796875, "global_step": 245633, "epoch": 2030} {"train_loss": -41.84130859375, "global_step": 245634, "epoch": 2030} {"train_loss": -41.885169982910156, "global_step": 245635, "epoch": 2030} {"train_loss": -42.87831497192383, "global_step": 245636, "epoch": 2030} {"train_loss": -41.68310546875, "global_step": 245637, "epoch": 2030} {"train_loss": -41.32328414916992, "global_step": 245638, "epoch": 2030} {"train_loss": -42.808509826660156, "global_step": 245639, "epoch": 2030} {"train_loss": -42.20703125, "global_step": 245640, "epoch": 2030} {"train_loss": -42.95148849487305, "global_step": 245641, "epoch": 2030} {"train_loss": -43.110084533691406, "global_step": 245642, "epoch": 2030} {"train_loss": -42.85095977783203, "global_step": 245643, "epoch": 2030} {"train_loss": -42.19364929199219, "global_step": 245644, "epoch": 2030} {"train_loss": -42.8317756652832, "global_step": 245645, "epoch": 2030} {"train_loss": -42.76987838745117, "global_step": 245646, "epoch": 2030} {"train_loss": -41.7802619934082, "global_step": 245647, "epoch": 2030} {"train_loss": -42.47710037231445, "global_step": 245648, "epoch": 2030} {"train_loss": -41.53959274291992, "global_step": 245649, "epoch": 2030} {"train_loss": -41.6826286315918, "global_step": 245650, "epoch": 2030} {"train_loss": -42.606658935546875, "global_step": 245651, "epoch": 2030} {"train_loss": -42.739315032958984, "global_step": 245652, "epoch": 2030} {"train_loss": -42.2598876953125, "global_step": 245653, "epoch": 2030} {"train_loss": -42.658931732177734, "global_step": 245654, "epoch": 2030} {"train_loss": -39.57277297973633, "global_step": 245655, "epoch": 2030} {"train_loss": -42.35163497924805, "global_step": 245656, "epoch": 2030} {"train_loss": -41.048179626464844, "global_step": 245657, "epoch": 2030} {"train_loss": -43.04887390136719, "global_step": 245658, "epoch": 2030} {"train_loss": -42.48041915893555, "global_step": 245659, "epoch": 2030} {"train_loss": -42.001190185546875, "global_step": 245660, "epoch": 2030} {"train_loss": -41.78989791870117, "global_step": 245661, "epoch": 2030} {"train_loss": -41.65415573120117, "global_step": 245662, "epoch": 2030} {"train_loss": -41.62614822387695, "global_step": 245663, "epoch": 2030} {"train_loss": -40.75096130371094, "global_step": 245664, "epoch": 2030} {"train_loss": -40.953060150146484, "global_step": 245665, "epoch": 2030} {"train_loss": -41.6351318359375, "global_step": 245666, "epoch": 2030} {"train_loss": -41.388832092285156, "global_step": 245667, "epoch": 2030} {"train_loss": -41.46047592163086, "global_step": 245668, "epoch": 2030} {"train_loss": -40.99189758300781, "global_step": 245669, "epoch": 2030} {"train_loss": -42.72290802001953, "global_step": 245670, "epoch": 2030} {"train_loss": -41.915645599365234, "global_step": 245671, "epoch": 2030} {"train_loss": -41.22616195678711, "global_step": 245672, "epoch": 2030} {"train_loss": -42.44237518310547, "global_step": 245673, "epoch": 2030} {"train_loss": -41.70937728881836, "global_step": 245674, "epoch": 2030} {"train_loss": -42.36532211303711, "global_step": 245675, "epoch": 2030} {"train_loss": -42.59600830078125, "global_step": 245676, "epoch": 2030} {"train_loss": -42.576290130615234, "global_step": 245677, "epoch": 2030} {"train_loss": -42.202674865722656, "global_step": 245678, "epoch": 2030} {"train_loss": -42.47941207885742, "global_step": 245679, "epoch": 2030} {"train_loss": -41.61429214477539, "global_step": 245680, "epoch": 2030} {"train_loss": -38.54066848754883, "global_step": 245681, "epoch": 2030} {"train_loss": -36.09703063964844, "global_step": 245682, "epoch": 2030} {"train_loss": -42.43450164794922, "global_step": 245683, "epoch": 2030} {"train_loss": -41.960914611816406, "global_step": 245684, "epoch": 2030} {"train_loss": -42.30086135864258, "global_step": 245685, "epoch": 2030} {"train_loss": -41.07471466064453, "global_step": 245686, "epoch": 2030} {"train_loss": -42.647132873535156, "global_step": 245687, "epoch": 2030} {"train_loss": -42.406951904296875, "global_step": 245688, "epoch": 2030} {"train_loss": -41.58015060424805, "global_step": 245689, "epoch": 2030} {"train_loss": -42.471622467041016, "global_step": 245690, "epoch": 2030} {"train_loss": -42.1219482421875, "global_step": 245691, "epoch": 2030} {"train_loss": -41.993404388427734, "global_step": 245692, "epoch": 2030} {"train_loss": -42.537532806396484, "global_step": 245693, "epoch": 2030} {"train_loss": -41.89419174194336, "global_step": 245694, "epoch": 2030} {"train_loss": -41.03129196166992, "global_step": 245695, "epoch": 2030} {"train_loss": -42.3221435546875, "global_step": 245696, "epoch": 2030} {"train_loss": -41.377525329589844, "global_step": 245697, "epoch": 2030} {"train_loss": -42.55072021484375, "global_step": 245698, "epoch": 2030} {"train_loss": -42.75320816040039, "global_step": 245699, "epoch": 2030} {"train_loss": -42.520267486572266, "global_step": 245700, "epoch": 2030} {"train_loss": -41.40741729736328, "global_step": 245701, "epoch": 2030} {"train_loss": -40.59394073486328, "global_step": 245702, "epoch": 2030} {"train_loss": -41.75832748413086, "global_step": 245703, "epoch": 2030} {"train_loss": -41.6666374206543, "global_step": 245704, "epoch": 2030} {"train_loss": -41.39484405517578, "global_step": 245705, "epoch": 2030} {"train_loss": -41.31317901611328, "global_step": 245706, "epoch": 2030} {"train_loss": -41.876434326171875, "global_step": 245707, "epoch": 2030} {"train_loss": -41.88661575317383, "global_step": 245708, "epoch": 2030} {"train_loss": -42.4323616027832, "global_step": 245709, "epoch": 2030} {"train_loss": -41.581417083740234, "global_step": 245710, "epoch": 2030} {"train_loss": -41.28815460205078, "global_step": 245711, "epoch": 2030} {"train_loss": -42.81315231323242, "global_step": 245712, "epoch": 2030} {"train_loss": -40.79951858520508, "global_step": 245713, "epoch": 2030} {"train_loss": -42.110111236572266, "global_step": 245714, "epoch": 2030} {"train_loss": -41.94015884399414, "global_step": 245715, "epoch": 2030} {"train_loss": -41.4273567199707, "global_step": 245716, "epoch": 2030} {"train_loss": -42.337100982666016, "global_step": 245717, "epoch": 2030} {"train_loss": -39.86767578125, "global_step": 245718, "epoch": 2030} {"train_loss": -42.66549301147461, "global_step": 245719, "epoch": 2030} {"train_loss": -42.16987228393555, "global_step": 245720, "epoch": 2030} {"train_loss": -42.487361907958984, "global_step": 245721, "epoch": 2030} {"train_loss": -42.046566009521484, "global_step": 245722, "epoch": 2030} {"train_loss": -41.42148971557617, "global_step": 245723, "epoch": 2030} {"train_loss": -42.77081298828125, "global_step": 245724, "epoch": 2030} {"train_loss": -42.30813217163086, "global_step": 245725, "epoch": 2030} {"train_loss": -42.5767822265625, "global_step": 245726, "epoch": 2030} {"train_loss": -41.73519515991211, "global_step": 245727, "epoch": 2030} {"train_loss": -41.781272888183594, "global_step": 245728, "epoch": 2030} {"train_loss": -42.86056900024414, "global_step": 245729, "epoch": 2030} {"train_loss": -42.113460540771484, "global_step": 245730, "epoch": 2030} {"train_loss": -42.268009185791016, "global_step": 245731, "epoch": 2030} {"train_loss": -41.61269760131836, "global_step": 245732, "epoch": 2030} {"train_loss": -43.0717887878418, "global_step": 245733, "epoch": 2030} {"train_loss": -41.855491638183594, "global_step": 245734, "epoch": 2030} {"train_loss": -42.85334396362305, "global_step": 245735, "epoch": 2030} {"train_loss": -42.52413558959961, "global_step": 245736, "epoch": 2030} {"train_loss": -40.89234161376953, "global_step": 245737, "epoch": 2030} {"train_loss": -37.92139434814453, "global_step": 245738, "epoch": 2030} {"train_loss": -42.32969284057617, "global_step": 245739, "epoch": 2030} {"train_loss": -42.07910919189453, "global_step": 245740, "epoch": 2030} {"train_loss": -41.86220169067383, "global_step": 245741, "epoch": 2030} {"train_loss": -41.451534271240234, "global_step": 245742, "epoch": 2030} {"train_loss": -41.8825798034668, "global_step": 245743, "epoch": 2030} {"train_loss": -41.87812042236328, "global_step": 245744, "epoch": 2030} {"train_loss": -41.487701416015625, "global_step": 245745, "epoch": 2030} {"train_loss": -42.671077728271484, "global_step": 245746, "epoch": 2030} {"train_loss": -42.28081512451172, "global_step": 245747, "epoch": 2030} {"train_loss": -41.9793701171875, "global_step": 245748, "epoch": 2030} {"train_loss": -41.871925354003906, "global_step": 245749, "epoch": 2030} {"train_loss": -41.89626394224561, "global_step": 245750, "epoch": 2030, "val_loss": 2613222.75} {"train_loss": -40.868953704833984, "global_step": 245751, "epoch": 2031} {"train_loss": -39.6737174987793, "global_step": 245752, "epoch": 2031} {"train_loss": -42.689064025878906, "global_step": 245753, "epoch": 2031} {"train_loss": -41.95722198486328, "global_step": 245754, "epoch": 2031} {"train_loss": -41.206947326660156, "global_step": 245755, "epoch": 2031} {"train_loss": -38.37269973754883, "global_step": 245756, "epoch": 2031} {"train_loss": -35.43029022216797, "global_step": 245757, "epoch": 2031} {"train_loss": -41.888912200927734, "global_step": 245758, "epoch": 2031} {"train_loss": -42.49884033203125, "global_step": 245759, "epoch": 2031} {"train_loss": -40.3300666809082, "global_step": 245760, "epoch": 2031} {"train_loss": -42.37553405761719, "global_step": 245761, "epoch": 2031} {"train_loss": -41.48210906982422, "global_step": 245762, "epoch": 2031} {"train_loss": -41.678504943847656, "global_step": 245763, "epoch": 2031} {"train_loss": -40.94016647338867, "global_step": 245764, "epoch": 2031} {"train_loss": -39.5481071472168, "global_step": 245765, "epoch": 2031} {"train_loss": -40.95835494995117, "global_step": 245766, "epoch": 2031} {"train_loss": -42.19391632080078, "global_step": 245767, "epoch": 2031} {"train_loss": -42.146484375, "global_step": 245768, "epoch": 2031} {"train_loss": -38.996734619140625, "global_step": 245769, "epoch": 2031} {"train_loss": -39.00509262084961, "global_step": 245770, "epoch": 2031} {"train_loss": -42.38853073120117, "global_step": 245771, "epoch": 2031} {"train_loss": -42.14640426635742, "global_step": 245772, "epoch": 2031} {"train_loss": -38.78547668457031, "global_step": 245773, "epoch": 2031} {"train_loss": -41.225433349609375, "global_step": 245774, "epoch": 2031} {"train_loss": -41.763458251953125, "global_step": 245775, "epoch": 2031} {"train_loss": -41.7829704284668, "global_step": 245776, "epoch": 2031} {"train_loss": -38.46577835083008, "global_step": 245777, "epoch": 2031} {"train_loss": -41.21442794799805, "global_step": 245778, "epoch": 2031} {"train_loss": -40.8810920715332, "global_step": 245779, "epoch": 2031} {"train_loss": -42.102725982666016, "global_step": 245780, "epoch": 2031} {"train_loss": -42.725433349609375, "global_step": 245781, "epoch": 2031} {"train_loss": -41.262630462646484, "global_step": 245782, "epoch": 2031} {"train_loss": -34.5362548828125, "global_step": 245783, "epoch": 2031} {"train_loss": -41.42329025268555, "global_step": 245784, "epoch": 2031} {"train_loss": -41.519805908203125, "global_step": 245785, "epoch": 2031} {"train_loss": -38.5677604675293, "global_step": 245786, "epoch": 2031} {"train_loss": -41.77350997924805, "global_step": 245787, "epoch": 2031} {"train_loss": -40.59518051147461, "global_step": 245788, "epoch": 2031} {"train_loss": -40.20280075073242, "global_step": 245789, "epoch": 2031} {"train_loss": -40.38308334350586, "global_step": 245790, "epoch": 2031} {"train_loss": -41.9365234375, "global_step": 245791, "epoch": 2031} {"train_loss": -41.64491653442383, "global_step": 245792, "epoch": 2031} {"train_loss": -42.526153564453125, "global_step": 245793, "epoch": 2031} {"train_loss": -41.30419921875, "global_step": 245794, "epoch": 2031} {"train_loss": -39.19063186645508, "global_step": 245795, "epoch": 2031} {"train_loss": -39.7492561340332, "global_step": 245796, "epoch": 2031} {"train_loss": -41.20545196533203, "global_step": 245797, "epoch": 2031} {"train_loss": -38.543209075927734, "global_step": 245798, "epoch": 2031} {"train_loss": -36.53693389892578, "global_step": 245799, "epoch": 2031} {"train_loss": -30.461530685424805, "global_step": 245800, "epoch": 2031} {"train_loss": -39.900672912597656, "global_step": 245801, "epoch": 2031} {"train_loss": -39.27735900878906, "global_step": 245802, "epoch": 2031} {"train_loss": -40.79212188720703, "global_step": 245803, "epoch": 2031} {"train_loss": -40.719581604003906, "global_step": 245804, "epoch": 2031} {"train_loss": -38.44155502319336, "global_step": 245805, "epoch": 2031} {"train_loss": -34.78107452392578, "global_step": 245806, "epoch": 2031} {"train_loss": -34.894649505615234, "global_step": 245807, "epoch": 2031} {"train_loss": -40.55322265625, "global_step": 245808, "epoch": 2031} {"train_loss": -40.499244689941406, "global_step": 245809, "epoch": 2031} {"train_loss": -40.4133186340332, "global_step": 245810, "epoch": 2031} {"train_loss": -41.22749710083008, "global_step": 245811, "epoch": 2031} {"train_loss": -38.07554244995117, "global_step": 245812, "epoch": 2031} {"train_loss": -38.398521423339844, "global_step": 245813, "epoch": 2031} {"train_loss": -39.36104202270508, "global_step": 245814, "epoch": 2031} {"train_loss": -38.89943313598633, "global_step": 245815, "epoch": 2031} {"train_loss": -41.07249069213867, "global_step": 245816, "epoch": 2031} {"train_loss": -39.98079299926758, "global_step": 245817, "epoch": 2031} {"train_loss": -36.269935607910156, "global_step": 245818, "epoch": 2031} {"train_loss": -41.28940200805664, "global_step": 245819, "epoch": 2031} {"train_loss": -39.33137893676758, "global_step": 245820, "epoch": 2031} {"train_loss": -41.30636978149414, "global_step": 245821, "epoch": 2031} {"train_loss": -40.60372543334961, "global_step": 245822, "epoch": 2031} {"train_loss": -39.334346771240234, "global_step": 245823, "epoch": 2031} {"train_loss": -37.76366424560547, "global_step": 245824, "epoch": 2031} {"train_loss": -40.39384841918945, "global_step": 245825, "epoch": 2031} {"train_loss": -35.807804107666016, "global_step": 245826, "epoch": 2031} {"train_loss": -39.49568176269531, "global_step": 245827, "epoch": 2031} {"train_loss": -40.2930908203125, "global_step": 245828, "epoch": 2031} {"train_loss": -37.943634033203125, "global_step": 245829, "epoch": 2031} {"train_loss": -36.73054885864258, "global_step": 245830, "epoch": 2031} {"train_loss": -41.144447326660156, "global_step": 245831, "epoch": 2031} {"train_loss": -40.16940689086914, "global_step": 245832, "epoch": 2031} {"train_loss": -37.37861251831055, "global_step": 245833, "epoch": 2031} {"train_loss": -40.50532913208008, "global_step": 245834, "epoch": 2031} {"train_loss": -39.41826248168945, "global_step": 245835, "epoch": 2031} {"train_loss": -25.139135360717773, "global_step": 245836, "epoch": 2031} {"train_loss": -40.245391845703125, "global_step": 245837, "epoch": 2031} {"train_loss": -39.995384216308594, "global_step": 245838, "epoch": 2031} {"train_loss": -28.162750244140625, "global_step": 245839, "epoch": 2031} {"train_loss": 10.030596733093262, "global_step": 245840, "epoch": 2031} {"train_loss": -32.638057708740234, "global_step": 245841, "epoch": 2031} {"train_loss": -36.2771110534668, "global_step": 245842, "epoch": 2031} {"train_loss": -22.285133361816406, "global_step": 245843, "epoch": 2031} {"train_loss": 52.63148880004883, "global_step": 245844, "epoch": 2031} {"train_loss": -29.54150390625, "global_step": 245845, "epoch": 2031} {"train_loss": -24.984596252441406, "global_step": 245846, "epoch": 2031} {"train_loss": -34.71077346801758, "global_step": 245847, "epoch": 2031} {"train_loss": -34.292686462402344, "global_step": 245848, "epoch": 2031} {"train_loss": -26.759748458862305, "global_step": 245849, "epoch": 2031} {"train_loss": -23.641733169555664, "global_step": 245850, "epoch": 2031} {"train_loss": -20.91667938232422, "global_step": 245851, "epoch": 2031} {"train_loss": -17.94563865661621, "global_step": 245852, "epoch": 2031} {"train_loss": -28.055622100830078, "global_step": 245853, "epoch": 2031} {"train_loss": -31.08576011657715, "global_step": 245854, "epoch": 2031} {"train_loss": -29.3870906829834, "global_step": 245855, "epoch": 2031} {"train_loss": -25.272626876831055, "global_step": 245856, "epoch": 2031} {"train_loss": -33.1263542175293, "global_step": 245857, "epoch": 2031} {"train_loss": -29.90105628967285, "global_step": 245858, "epoch": 2031} {"train_loss": -33.24808883666992, "global_step": 245859, "epoch": 2031} {"train_loss": -30.998571395874023, "global_step": 245860, "epoch": 2031} {"train_loss": -32.72282791137695, "global_step": 245861, "epoch": 2031} {"train_loss": -33.757415771484375, "global_step": 245862, "epoch": 2031} {"train_loss": -34.3034782409668, "global_step": 245863, "epoch": 2031} {"train_loss": -34.8437385559082, "global_step": 245864, "epoch": 2031} {"train_loss": -33.26200485229492, "global_step": 245865, "epoch": 2031} {"train_loss": -34.603572845458984, "global_step": 245866, "epoch": 2031} {"train_loss": -34.661224365234375, "global_step": 245867, "epoch": 2031} {"train_loss": -33.60454177856445, "global_step": 245868, "epoch": 2031} {"train_loss": -34.8631706237793, "global_step": 245869, "epoch": 2031} {"train_loss": -35.213130950927734, "global_step": 245870, "epoch": 2031} {"train_loss": -36.2428930377172, "global_step": 245871, "epoch": 2031, "val_loss": 2533025.0} {"train_loss": -34.914791107177734, "global_step": 245872, "epoch": 2032} {"train_loss": -34.123531341552734, "global_step": 245873, "epoch": 2032} {"train_loss": -35.31622314453125, "global_step": 245874, "epoch": 2032} {"train_loss": -35.00111770629883, "global_step": 245875, "epoch": 2032} {"train_loss": -35.79343795776367, "global_step": 245876, "epoch": 2032} {"train_loss": -34.837677001953125, "global_step": 245877, "epoch": 2032} {"train_loss": -34.65533447265625, "global_step": 245878, "epoch": 2032} {"train_loss": -35.41415023803711, "global_step": 245879, "epoch": 2032} {"train_loss": -34.55451202392578, "global_step": 245880, "epoch": 2032} {"train_loss": -35.01906967163086, "global_step": 245881, "epoch": 2032} {"train_loss": -36.13154220581055, "global_step": 245882, "epoch": 2032} {"train_loss": -35.54825973510742, "global_step": 245883, "epoch": 2032} {"train_loss": -35.781803131103516, "global_step": 245884, "epoch": 2032} {"train_loss": -35.76228332519531, "global_step": 245885, "epoch": 2032} {"train_loss": -35.694618225097656, "global_step": 245886, "epoch": 2032} {"train_loss": -35.947689056396484, "global_step": 245887, "epoch": 2032} {"train_loss": -36.6026611328125, "global_step": 245888, "epoch": 2032} {"train_loss": -36.06302261352539, "global_step": 245889, "epoch": 2032} {"train_loss": -35.639312744140625, "global_step": 245890, "epoch": 2032} {"train_loss": -35.636451721191406, "global_step": 245891, "epoch": 2032} {"train_loss": -36.445926666259766, "global_step": 245892, "epoch": 2032} {"train_loss": -36.114253997802734, "global_step": 245893, "epoch": 2032} {"train_loss": -36.2841911315918, "global_step": 245894, "epoch": 2032} {"train_loss": -36.48053741455078, "global_step": 245895, "epoch": 2032} {"train_loss": -36.93673324584961, "global_step": 245896, "epoch": 2032} {"train_loss": -35.585418701171875, "global_step": 245897, "epoch": 2032} {"train_loss": -36.4578971862793, "global_step": 245898, "epoch": 2032} {"train_loss": -36.6712646484375, "global_step": 245899, "epoch": 2032} {"train_loss": -36.88221740722656, "global_step": 245900, "epoch": 2032} {"train_loss": -37.111114501953125, "global_step": 245901, "epoch": 2032} {"train_loss": -37.29964065551758, "global_step": 245902, "epoch": 2032} {"train_loss": -35.97348403930664, "global_step": 245903, "epoch": 2032} {"train_loss": -36.0251579284668, "global_step": 245904, "epoch": 2032} {"train_loss": -35.032005310058594, "global_step": 245905, "epoch": 2032} {"train_loss": -36.87178421020508, "global_step": 245906, "epoch": 2032} {"train_loss": -37.199703216552734, "global_step": 245907, "epoch": 2032} {"train_loss": -37.38520431518555, "global_step": 245908, "epoch": 2032} {"train_loss": -37.568603515625, "global_step": 245909, "epoch": 2032} {"train_loss": -37.66370391845703, "global_step": 245910, "epoch": 2032} {"train_loss": -37.24200439453125, "global_step": 245911, "epoch": 2032} {"train_loss": -36.480995178222656, "global_step": 245912, "epoch": 2032} {"train_loss": -37.67603302001953, "global_step": 245913, "epoch": 2032} {"train_loss": -37.4144401550293, "global_step": 245914, "epoch": 2032} {"train_loss": -38.391761779785156, "global_step": 245915, "epoch": 2032} {"train_loss": -37.414405822753906, "global_step": 245916, "epoch": 2032} {"train_loss": -37.188323974609375, "global_step": 245917, "epoch": 2032} {"train_loss": -37.26804733276367, "global_step": 245918, "epoch": 2032} {"train_loss": -38.11973190307617, "global_step": 245919, "epoch": 2032} {"train_loss": -37.24739074707031, "global_step": 245920, "epoch": 2032} {"train_loss": -37.36638259887695, "global_step": 245921, "epoch": 2032} {"train_loss": -38.71343231201172, "global_step": 245922, "epoch": 2032} {"train_loss": -37.39178466796875, "global_step": 245923, "epoch": 2032} {"train_loss": -37.234779357910156, "global_step": 245924, "epoch": 2032} {"train_loss": -37.928138732910156, "global_step": 245925, "epoch": 2032} {"train_loss": -37.300193786621094, "global_step": 245926, "epoch": 2032} {"train_loss": -38.46079635620117, "global_step": 245927, "epoch": 2032} {"train_loss": -37.49896240234375, "global_step": 245928, "epoch": 2032} {"train_loss": -38.19648361206055, "global_step": 245929, "epoch": 2032} {"train_loss": -38.58808517456055, "global_step": 245930, "epoch": 2032} {"train_loss": -37.82746124267578, "global_step": 245931, "epoch": 2032} {"train_loss": -37.84776306152344, "global_step": 245932, "epoch": 2032} {"train_loss": -38.74644088745117, "global_step": 245933, "epoch": 2032} {"train_loss": -38.7842903137207, "global_step": 245934, "epoch": 2032} {"train_loss": -38.53144454956055, "global_step": 245935, "epoch": 2032} {"train_loss": -39.17543029785156, "global_step": 245936, "epoch": 2032} {"train_loss": -37.417945861816406, "global_step": 245937, "epoch": 2032} {"train_loss": -38.3940544128418, "global_step": 245938, "epoch": 2032} {"train_loss": -38.0621223449707, "global_step": 245939, "epoch": 2032} {"train_loss": -38.66609573364258, "global_step": 245940, "epoch": 2032} {"train_loss": -37.91970443725586, "global_step": 245941, "epoch": 2032} {"train_loss": -38.80210494995117, "global_step": 245942, "epoch": 2032} {"train_loss": -37.77964401245117, "global_step": 245943, "epoch": 2032} {"train_loss": -38.37647247314453, "global_step": 245944, "epoch": 2032} {"train_loss": -40.1118278503418, "global_step": 245945, "epoch": 2032} {"train_loss": -38.75543212890625, "global_step": 245946, "epoch": 2032} {"train_loss": -38.08308792114258, "global_step": 245947, "epoch": 2032} {"train_loss": -38.628822326660156, "global_step": 245948, "epoch": 2032} {"train_loss": -39.30999755859375, "global_step": 245949, "epoch": 2032} {"train_loss": -39.250240325927734, "global_step": 245950, "epoch": 2032} {"train_loss": -39.248146057128906, "global_step": 245951, "epoch": 2032} {"train_loss": -37.2904052734375, "global_step": 245952, "epoch": 2032} {"train_loss": -38.63129806518555, "global_step": 245953, "epoch": 2032} {"train_loss": -40.205448150634766, "global_step": 245954, "epoch": 2032} {"train_loss": -39.49636459350586, "global_step": 245955, "epoch": 2032} {"train_loss": -38.98517990112305, "global_step": 245956, "epoch": 2032} {"train_loss": -38.810447692871094, "global_step": 245957, "epoch": 2032} {"train_loss": -39.25181198120117, "global_step": 245958, "epoch": 2032} {"train_loss": -38.42012405395508, "global_step": 245959, "epoch": 2032} {"train_loss": -38.66310119628906, "global_step": 245960, "epoch": 2032} {"train_loss": -40.030120849609375, "global_step": 245961, "epoch": 2032} {"train_loss": -37.95156478881836, "global_step": 245962, "epoch": 2032} {"train_loss": -40.266536712646484, "global_step": 245963, "epoch": 2032} {"train_loss": -39.4168701171875, "global_step": 245964, "epoch": 2032} {"train_loss": -39.2084846496582, "global_step": 245965, "epoch": 2032} {"train_loss": -39.53801727294922, "global_step": 245966, "epoch": 2032} {"train_loss": -39.037532806396484, "global_step": 245967, "epoch": 2032} {"train_loss": -39.039581298828125, "global_step": 245968, "epoch": 2032} {"train_loss": -40.464149475097656, "global_step": 245969, "epoch": 2032} {"train_loss": -40.259952545166016, "global_step": 245970, "epoch": 2032} {"train_loss": -39.36127853393555, "global_step": 245971, "epoch": 2032} {"train_loss": -39.19108581542969, "global_step": 245972, "epoch": 2032} {"train_loss": -38.33706283569336, "global_step": 245973, "epoch": 2032} {"train_loss": -39.75274658203125, "global_step": 245974, "epoch": 2032} {"train_loss": -39.66617965698242, "global_step": 245975, "epoch": 2032} {"train_loss": -40.339229583740234, "global_step": 245976, "epoch": 2032} {"train_loss": -38.7418327331543, "global_step": 245977, "epoch": 2032} {"train_loss": -39.41752243041992, "global_step": 245978, "epoch": 2032} {"train_loss": -40.0082893371582, "global_step": 245979, "epoch": 2032} {"train_loss": -39.46997833251953, "global_step": 245980, "epoch": 2032} {"train_loss": -39.17762756347656, "global_step": 245981, "epoch": 2032} {"train_loss": -39.80817794799805, "global_step": 245982, "epoch": 2032} {"train_loss": -39.56146240234375, "global_step": 245983, "epoch": 2032} {"train_loss": -39.61627960205078, "global_step": 245984, "epoch": 2032} {"train_loss": -40.03504180908203, "global_step": 245985, "epoch": 2032} {"train_loss": -40.482215881347656, "global_step": 245986, "epoch": 2032} {"train_loss": -39.53828048706055, "global_step": 245987, "epoch": 2032} {"train_loss": -39.629127502441406, "global_step": 245988, "epoch": 2032} {"train_loss": -41.41335678100586, "global_step": 245989, "epoch": 2032} {"train_loss": -40.672481536865234, "global_step": 245990, "epoch": 2032} {"train_loss": -39.960227966308594, "global_step": 245991, "epoch": 2032} {"train_loss": -37.90693100227797, "global_step": 245992, "epoch": 2032, "val_loss": 2572775.0} {"train_loss": -39.49953842163086, "global_step": 245993, "epoch": 2033} {"train_loss": -39.86075973510742, "global_step": 245994, "epoch": 2033} {"train_loss": -40.29551315307617, "global_step": 245995, "epoch": 2033} {"train_loss": -40.15517807006836, "global_step": 245996, "epoch": 2033} {"train_loss": -40.354122161865234, "global_step": 245997, "epoch": 2033} {"train_loss": -40.61903762817383, "global_step": 245998, "epoch": 2033} {"train_loss": -39.64362716674805, "global_step": 245999, "epoch": 2033} {"train_loss": -40.66838455200195, "global_step": 246000, "epoch": 2033} {"train_loss": -40.67080307006836, "global_step": 246001, "epoch": 2033} {"train_loss": -40.60129928588867, "global_step": 246002, "epoch": 2033} {"train_loss": -40.338375091552734, "global_step": 246003, "epoch": 2033} {"train_loss": -41.26945114135742, "global_step": 246004, "epoch": 2033} {"train_loss": -41.04308319091797, "global_step": 246005, "epoch": 2033} {"train_loss": -40.25203323364258, "global_step": 246006, "epoch": 2033} {"train_loss": -39.577728271484375, "global_step": 246007, "epoch": 2033} {"train_loss": -40.88704299926758, "global_step": 246008, "epoch": 2033} {"train_loss": -39.23557662963867, "global_step": 246009, "epoch": 2033} {"train_loss": -40.08919906616211, "global_step": 246010, "epoch": 2033} {"train_loss": -39.66756057739258, "global_step": 246011, "epoch": 2033} {"train_loss": -40.91851043701172, "global_step": 246012, "epoch": 2033} {"train_loss": -41.05181884765625, "global_step": 246013, "epoch": 2033} {"train_loss": -41.12401580810547, "global_step": 246014, "epoch": 2033} {"train_loss": -41.02529525756836, "global_step": 246015, "epoch": 2033} {"train_loss": -39.83146286010742, "global_step": 246016, "epoch": 2033} {"train_loss": -41.28512191772461, "global_step": 246017, "epoch": 2033} {"train_loss": -40.06962203979492, "global_step": 246018, "epoch": 2033} {"train_loss": -40.54603576660156, "global_step": 246019, "epoch": 2033} {"train_loss": -39.58021926879883, "global_step": 246020, "epoch": 2033} {"train_loss": -40.67171096801758, "global_step": 246021, "epoch": 2033} {"train_loss": -41.744606018066406, "global_step": 246022, "epoch": 2033} {"train_loss": -41.473323822021484, "global_step": 246023, "epoch": 2033} {"train_loss": -41.247127532958984, "global_step": 246024, "epoch": 2033} {"train_loss": -41.102577209472656, "global_step": 246025, "epoch": 2033} {"train_loss": -41.89997100830078, "global_step": 246026, "epoch": 2033} {"train_loss": -41.079715728759766, "global_step": 246027, "epoch": 2033} {"train_loss": -41.66178512573242, "global_step": 246028, "epoch": 2033} {"train_loss": -41.25193786621094, "global_step": 246029, "epoch": 2033} {"train_loss": -40.4398307800293, "global_step": 246030, "epoch": 2033} {"train_loss": -41.02907180786133, "global_step": 246031, "epoch": 2033} {"train_loss": -41.60160446166992, "global_step": 246032, "epoch": 2033} {"train_loss": -41.20204162597656, "global_step": 246033, "epoch": 2033} {"train_loss": -41.37885284423828, "global_step": 246034, "epoch": 2033} {"train_loss": -40.99538803100586, "global_step": 246035, "epoch": 2033} {"train_loss": -42.054420471191406, "global_step": 246036, "epoch": 2033} {"train_loss": -42.118896484375, "global_step": 246037, "epoch": 2033} {"train_loss": -40.94911575317383, "global_step": 246038, "epoch": 2033} {"train_loss": -41.59955978393555, "global_step": 246039, "epoch": 2033} {"train_loss": -40.29726791381836, "global_step": 246040, "epoch": 2033} {"train_loss": -41.19843673706055, "global_step": 246041, "epoch": 2033} {"train_loss": -40.9012451171875, "global_step": 246042, "epoch": 2033} {"train_loss": -41.70811462402344, "global_step": 246043, "epoch": 2033} {"train_loss": -40.92192077636719, "global_step": 246044, "epoch": 2033} {"train_loss": -41.44711685180664, "global_step": 246045, "epoch": 2033} {"train_loss": -41.98105239868164, "global_step": 246046, "epoch": 2033} {"train_loss": -41.06355667114258, "global_step": 246047, "epoch": 2033} {"train_loss": -40.761226654052734, "global_step": 246048, "epoch": 2033} {"train_loss": -40.40325164794922, "global_step": 246049, "epoch": 2033} {"train_loss": -41.33567428588867, "global_step": 246050, "epoch": 2033} {"train_loss": -40.971031188964844, "global_step": 246051, "epoch": 2033} {"train_loss": -41.51519775390625, "global_step": 246052, "epoch": 2033} {"train_loss": -40.743831634521484, "global_step": 246053, "epoch": 2033} {"train_loss": -41.39362716674805, "global_step": 246054, "epoch": 2033} {"train_loss": -42.113380432128906, "global_step": 246055, "epoch": 2033} {"train_loss": -40.62187194824219, "global_step": 246056, "epoch": 2033} {"train_loss": -40.676490783691406, "global_step": 246057, "epoch": 2033} {"train_loss": -41.383392333984375, "global_step": 246058, "epoch": 2033} {"train_loss": -41.24274826049805, "global_step": 246059, "epoch": 2033} {"train_loss": -40.692928314208984, "global_step": 246060, "epoch": 2033} {"train_loss": -42.125518798828125, "global_step": 246061, "epoch": 2033} {"train_loss": -41.13491439819336, "global_step": 246062, "epoch": 2033} {"train_loss": -40.72861099243164, "global_step": 246063, "epoch": 2033} {"train_loss": -41.26409912109375, "global_step": 246064, "epoch": 2033} {"train_loss": -41.02313995361328, "global_step": 246065, "epoch": 2033} {"train_loss": -37.80806350708008, "global_step": 246066, "epoch": 2033} {"train_loss": -40.9256706237793, "global_step": 246067, "epoch": 2033} {"train_loss": -41.38961410522461, "global_step": 246068, "epoch": 2033} {"train_loss": -40.06966781616211, "global_step": 246069, "epoch": 2033} {"train_loss": -35.80644226074219, "global_step": 246070, "epoch": 2033} {"train_loss": -26.433734893798828, "global_step": 246071, "epoch": 2033} {"train_loss": -7.31100606918335, "global_step": 246072, "epoch": 2033} {"train_loss": -21.33518409729004, "global_step": 246073, "epoch": 2033} {"train_loss": -39.36699295043945, "global_step": 246074, "epoch": 2033} {"train_loss": -35.022247314453125, "global_step": 246075, "epoch": 2033} {"train_loss": -35.7772216796875, "global_step": 246076, "epoch": 2033} {"train_loss": -39.227455139160156, "global_step": 246077, "epoch": 2033} {"train_loss": -33.45612716674805, "global_step": 246078, "epoch": 2033} {"train_loss": -38.98350143432617, "global_step": 246079, "epoch": 2033} {"train_loss": -32.90634536743164, "global_step": 246080, "epoch": 2033} {"train_loss": -41.22447204589844, "global_step": 246081, "epoch": 2033} {"train_loss": -36.91069030761719, "global_step": 246082, "epoch": 2033} {"train_loss": -40.087738037109375, "global_step": 246083, "epoch": 2033} {"train_loss": -35.847869873046875, "global_step": 246084, "epoch": 2033} {"train_loss": -39.25527572631836, "global_step": 246085, "epoch": 2033} {"train_loss": -38.314178466796875, "global_step": 246086, "epoch": 2033} {"train_loss": -39.313838958740234, "global_step": 246087, "epoch": 2033} {"train_loss": -38.332786560058594, "global_step": 246088, "epoch": 2033} {"train_loss": -39.201541900634766, "global_step": 246089, "epoch": 2033} {"train_loss": -39.208740234375, "global_step": 246090, "epoch": 2033} {"train_loss": -38.91929244995117, "global_step": 246091, "epoch": 2033} {"train_loss": -39.085636138916016, "global_step": 246092, "epoch": 2033} {"train_loss": -38.41994857788086, "global_step": 246093, "epoch": 2033} {"train_loss": -38.940269470214844, "global_step": 246094, "epoch": 2033} {"train_loss": -40.11172103881836, "global_step": 246095, "epoch": 2033} {"train_loss": -38.81916046142578, "global_step": 246096, "epoch": 2033} {"train_loss": -40.23855972290039, "global_step": 246097, "epoch": 2033} {"train_loss": -38.36761474609375, "global_step": 246098, "epoch": 2033} {"train_loss": -39.599609375, "global_step": 246099, "epoch": 2033} {"train_loss": -39.85834503173828, "global_step": 246100, "epoch": 2033} {"train_loss": -38.66691589355469, "global_step": 246101, "epoch": 2033} {"train_loss": -39.94075393676758, "global_step": 246102, "epoch": 2033} {"train_loss": -40.033119201660156, "global_step": 246103, "epoch": 2033} {"train_loss": -40.08805465698242, "global_step": 246104, "epoch": 2033} {"train_loss": -41.340694427490234, "global_step": 246105, "epoch": 2033} {"train_loss": -40.256710052490234, "global_step": 246106, "epoch": 2033} {"train_loss": -40.80503463745117, "global_step": 246107, "epoch": 2033} {"train_loss": -40.867408752441406, "global_step": 246108, "epoch": 2033} {"train_loss": -40.54701614379883, "global_step": 246109, "epoch": 2033} {"train_loss": -40.4288444519043, "global_step": 246110, "epoch": 2033} {"train_loss": -40.233558654785156, "global_step": 246111, "epoch": 2033} {"train_loss": -39.22951126098633, "global_step": 246112, "epoch": 2033} {"train_loss": -39.62418402916144, "global_step": 246113, "epoch": 2033, "val_loss": 2561279.5} {"train_loss": -40.510414123535156, "global_step": 246114, "epoch": 2034} {"train_loss": -41.08205795288086, "global_step": 246115, "epoch": 2034} {"train_loss": -40.228187561035156, "global_step": 246116, "epoch": 2034} {"train_loss": -40.694881439208984, "global_step": 246117, "epoch": 2034} {"train_loss": -40.375328063964844, "global_step": 246118, "epoch": 2034} {"train_loss": -41.718101501464844, "global_step": 246119, "epoch": 2034} {"train_loss": -41.29458236694336, "global_step": 246120, "epoch": 2034} {"train_loss": -40.817230224609375, "global_step": 246121, "epoch": 2034} {"train_loss": -40.99162673950195, "global_step": 246122, "epoch": 2034} {"train_loss": -40.99536895751953, "global_step": 246123, "epoch": 2034} {"train_loss": -41.807926177978516, "global_step": 246124, "epoch": 2034} {"train_loss": -41.15332794189453, "global_step": 246125, "epoch": 2034} {"train_loss": -41.445899963378906, "global_step": 246126, "epoch": 2034} {"train_loss": -40.61294174194336, "global_step": 246127, "epoch": 2034} {"train_loss": -40.77040100097656, "global_step": 246128, "epoch": 2034} {"train_loss": -41.018524169921875, "global_step": 246129, "epoch": 2034} {"train_loss": -41.001461029052734, "global_step": 246130, "epoch": 2034} {"train_loss": -41.480743408203125, "global_step": 246131, "epoch": 2034} {"train_loss": -41.77094268798828, "global_step": 246132, "epoch": 2034} {"train_loss": -41.54172897338867, "global_step": 246133, "epoch": 2034} {"train_loss": -41.23026657104492, "global_step": 246134, "epoch": 2034} {"train_loss": -40.605262756347656, "global_step": 246135, "epoch": 2034} {"train_loss": -41.097808837890625, "global_step": 246136, "epoch": 2034} {"train_loss": -40.598445892333984, "global_step": 246137, "epoch": 2034} {"train_loss": -41.338096618652344, "global_step": 246138, "epoch": 2034} {"train_loss": -42.079254150390625, "global_step": 246139, "epoch": 2034} {"train_loss": -41.32957077026367, "global_step": 246140, "epoch": 2034} {"train_loss": -41.51513671875, "global_step": 246141, "epoch": 2034} {"train_loss": -41.02785110473633, "global_step": 246142, "epoch": 2034} {"train_loss": -40.2550163269043, "global_step": 246143, "epoch": 2034} {"train_loss": -41.39837646484375, "global_step": 246144, "epoch": 2034} {"train_loss": -41.101070404052734, "global_step": 246145, "epoch": 2034} {"train_loss": -41.68939971923828, "global_step": 246146, "epoch": 2034} {"train_loss": -40.998165130615234, "global_step": 246147, "epoch": 2034} {"train_loss": -41.9513053894043, "global_step": 246148, "epoch": 2034} {"train_loss": -41.45096969604492, "global_step": 246149, "epoch": 2034} {"train_loss": -41.55582809448242, "global_step": 246150, "epoch": 2034} {"train_loss": -41.620235443115234, "global_step": 246151, "epoch": 2034} {"train_loss": -41.33776092529297, "global_step": 246152, "epoch": 2034} {"train_loss": -41.28163528442383, "global_step": 246153, "epoch": 2034} {"train_loss": -41.33956527709961, "global_step": 246154, "epoch": 2034} {"train_loss": -42.28202438354492, "global_step": 246155, "epoch": 2034} {"train_loss": -41.74636459350586, "global_step": 246156, "epoch": 2034} {"train_loss": -39.851654052734375, "global_step": 246157, "epoch": 2034} {"train_loss": -41.01782989501953, "global_step": 246158, "epoch": 2034} {"train_loss": -41.43877029418945, "global_step": 246159, "epoch": 2034} {"train_loss": -41.25996398925781, "global_step": 246160, "epoch": 2034} {"train_loss": -41.51099395751953, "global_step": 246161, "epoch": 2034} {"train_loss": -40.86355209350586, "global_step": 246162, "epoch": 2034} {"train_loss": -40.94166564941406, "global_step": 246163, "epoch": 2034} {"train_loss": -41.578643798828125, "global_step": 246164, "epoch": 2034} {"train_loss": -42.151607513427734, "global_step": 246165, "epoch": 2034} {"train_loss": -41.29231262207031, "global_step": 246166, "epoch": 2034} {"train_loss": -41.33603286743164, "global_step": 246167, "epoch": 2034} {"train_loss": -39.63893127441406, "global_step": 246168, "epoch": 2034} {"train_loss": -41.09037399291992, "global_step": 246169, "epoch": 2034} {"train_loss": -41.975624084472656, "global_step": 246170, "epoch": 2034} {"train_loss": -41.287635803222656, "global_step": 246171, "epoch": 2034} {"train_loss": -40.7655143737793, "global_step": 246172, "epoch": 2034} {"train_loss": -41.92903518676758, "global_step": 246173, "epoch": 2034} {"train_loss": -40.816097259521484, "global_step": 246174, "epoch": 2034} {"train_loss": -41.10951232910156, "global_step": 246175, "epoch": 2034} {"train_loss": -39.9027214050293, "global_step": 246176, "epoch": 2034} {"train_loss": -40.94118881225586, "global_step": 246177, "epoch": 2034} {"train_loss": -40.2985725402832, "global_step": 246178, "epoch": 2034} {"train_loss": -39.74766159057617, "global_step": 246179, "epoch": 2034} {"train_loss": -40.97579574584961, "global_step": 246180, "epoch": 2034} {"train_loss": -39.817230224609375, "global_step": 246181, "epoch": 2034} {"train_loss": -40.073604583740234, "global_step": 246182, "epoch": 2034} {"train_loss": -40.24102783203125, "global_step": 246183, "epoch": 2034} {"train_loss": -39.59074020385742, "global_step": 246184, "epoch": 2034} {"train_loss": -40.741004943847656, "global_step": 246185, "epoch": 2034} {"train_loss": -40.20280075073242, "global_step": 246186, "epoch": 2034} {"train_loss": -39.674530029296875, "global_step": 246187, "epoch": 2034} {"train_loss": -41.353267669677734, "global_step": 246188, "epoch": 2034} {"train_loss": -40.57499694824219, "global_step": 246189, "epoch": 2034} {"train_loss": -41.503814697265625, "global_step": 246190, "epoch": 2034} {"train_loss": -39.89316940307617, "global_step": 246191, "epoch": 2034} {"train_loss": -39.3480224609375, "global_step": 246192, "epoch": 2034} {"train_loss": -41.15571975708008, "global_step": 246193, "epoch": 2034} {"train_loss": -39.294654846191406, "global_step": 246194, "epoch": 2034} {"train_loss": -34.13422393798828, "global_step": 246195, "epoch": 2034} {"train_loss": -34.98887252807617, "global_step": 246196, "epoch": 2034} {"train_loss": -39.36307907104492, "global_step": 246197, "epoch": 2034} {"train_loss": -39.73592758178711, "global_step": 246198, "epoch": 2034} {"train_loss": -40.1205940246582, "global_step": 246199, "epoch": 2034} {"train_loss": -39.9927864074707, "global_step": 246200, "epoch": 2034} {"train_loss": -40.34253692626953, "global_step": 246201, "epoch": 2034} {"train_loss": -40.9362907409668, "global_step": 246202, "epoch": 2034} {"train_loss": -39.343406677246094, "global_step": 246203, "epoch": 2034} {"train_loss": -40.986507415771484, "global_step": 246204, "epoch": 2034} {"train_loss": -39.598182678222656, "global_step": 246205, "epoch": 2034} {"train_loss": -40.18046188354492, "global_step": 246206, "epoch": 2034} {"train_loss": -40.62376022338867, "global_step": 246207, "epoch": 2034} {"train_loss": -40.444087982177734, "global_step": 246208, "epoch": 2034} {"train_loss": -40.859127044677734, "global_step": 246209, "epoch": 2034} {"train_loss": -42.16176986694336, "global_step": 246210, "epoch": 2034} {"train_loss": -41.7899284362793, "global_step": 246211, "epoch": 2034} {"train_loss": -40.27197265625, "global_step": 246212, "epoch": 2034} {"train_loss": -41.11301803588867, "global_step": 246213, "epoch": 2034} {"train_loss": -39.848854064941406, "global_step": 246214, "epoch": 2034} {"train_loss": -41.655635833740234, "global_step": 246215, "epoch": 2034} {"train_loss": -39.90224838256836, "global_step": 246216, "epoch": 2034} {"train_loss": -41.107330322265625, "global_step": 246217, "epoch": 2034} {"train_loss": -40.50897216796875, "global_step": 246218, "epoch": 2034} {"train_loss": -40.966800689697266, "global_step": 246219, "epoch": 2034} {"train_loss": -39.971351623535156, "global_step": 246220, "epoch": 2034} {"train_loss": -40.67252731323242, "global_step": 246221, "epoch": 2034} {"train_loss": -40.50112533569336, "global_step": 246222, "epoch": 2034} {"train_loss": -40.244964599609375, "global_step": 246223, "epoch": 2034} {"train_loss": -40.14667510986328, "global_step": 246224, "epoch": 2034} {"train_loss": -39.91193771362305, "global_step": 246225, "epoch": 2034} {"train_loss": -41.15049743652344, "global_step": 246226, "epoch": 2034} {"train_loss": -40.56462097167969, "global_step": 246227, "epoch": 2034} {"train_loss": -39.78001022338867, "global_step": 246228, "epoch": 2034} {"train_loss": -40.9296989440918, "global_step": 246229, "epoch": 2034} {"train_loss": -40.56962203979492, "global_step": 246230, "epoch": 2034} {"train_loss": -41.98801040649414, "global_step": 246231, "epoch": 2034} {"train_loss": -39.31694030761719, "global_step": 246232, "epoch": 2034} {"train_loss": -41.14933395385742, "global_step": 246233, "epoch": 2034} {"train_loss": -40.721365810425816, "global_step": 246234, "epoch": 2034, "val_loss": 2571805.25} {"train_loss": -40.167842864990234, "global_step": 246235, "epoch": 2035} {"train_loss": -41.66044235229492, "global_step": 246236, "epoch": 2035} {"train_loss": -39.7993278503418, "global_step": 246237, "epoch": 2035} {"train_loss": -41.491249084472656, "global_step": 246238, "epoch": 2035} {"train_loss": -40.661502838134766, "global_step": 246239, "epoch": 2035} {"train_loss": -40.7003288269043, "global_step": 246240, "epoch": 2035} {"train_loss": -40.903865814208984, "global_step": 246241, "epoch": 2035} {"train_loss": -40.627803802490234, "global_step": 246242, "epoch": 2035} {"train_loss": -41.39143371582031, "global_step": 246243, "epoch": 2035} {"train_loss": -40.58751678466797, "global_step": 246244, "epoch": 2035} {"train_loss": -41.43461990356445, "global_step": 246245, "epoch": 2035} {"train_loss": -41.1755485534668, "global_step": 246246, "epoch": 2035} {"train_loss": -41.03597640991211, "global_step": 246247, "epoch": 2035} {"train_loss": -41.412715911865234, "global_step": 246248, "epoch": 2035} {"train_loss": -41.468074798583984, "global_step": 246249, "epoch": 2035} {"train_loss": -41.349342346191406, "global_step": 246250, "epoch": 2035} {"train_loss": -41.41517639160156, "global_step": 246251, "epoch": 2035} {"train_loss": -41.76860427856445, "global_step": 246252, "epoch": 2035} {"train_loss": -41.43549728393555, "global_step": 246253, "epoch": 2035} {"train_loss": -42.015174865722656, "global_step": 246254, "epoch": 2035} {"train_loss": -41.1309700012207, "global_step": 246255, "epoch": 2035} {"train_loss": -41.832420349121094, "global_step": 246256, "epoch": 2035} {"train_loss": -41.57699203491211, "global_step": 246257, "epoch": 2035} {"train_loss": -41.581485748291016, "global_step": 246258, "epoch": 2035} {"train_loss": -41.32992172241211, "global_step": 246259, "epoch": 2035} {"train_loss": -41.69758605957031, "global_step": 246260, "epoch": 2035} {"train_loss": -41.76319122314453, "global_step": 246261, "epoch": 2035} {"train_loss": -41.97370529174805, "global_step": 246262, "epoch": 2035} {"train_loss": -42.329345703125, "global_step": 246263, "epoch": 2035} {"train_loss": -42.298072814941406, "global_step": 246264, "epoch": 2035} {"train_loss": -41.58576583862305, "global_step": 246265, "epoch": 2035} {"train_loss": -42.22865676879883, "global_step": 246266, "epoch": 2035} {"train_loss": -42.17216491699219, "global_step": 246267, "epoch": 2035} {"train_loss": -42.16047286987305, "global_step": 246268, "epoch": 2035} {"train_loss": -42.09801483154297, "global_step": 246269, "epoch": 2035} {"train_loss": -41.7700309753418, "global_step": 246270, "epoch": 2035} {"train_loss": -42.74744415283203, "global_step": 246271, "epoch": 2035} {"train_loss": -42.40411376953125, "global_step": 246272, "epoch": 2035} {"train_loss": -42.12221908569336, "global_step": 246273, "epoch": 2035} {"train_loss": -42.89630889892578, "global_step": 246274, "epoch": 2035} {"train_loss": -42.934757232666016, "global_step": 246275, "epoch": 2035} {"train_loss": -42.953277587890625, "global_step": 246276, "epoch": 2035} {"train_loss": -42.87542724609375, "global_step": 246277, "epoch": 2035} {"train_loss": -42.186424255371094, "global_step": 246278, "epoch": 2035} {"train_loss": -42.72771072387695, "global_step": 246279, "epoch": 2035} {"train_loss": -42.98185348510742, "global_step": 246280, "epoch": 2035} {"train_loss": -42.605709075927734, "global_step": 246281, "epoch": 2035} {"train_loss": -42.41066360473633, "global_step": 246282, "epoch": 2035} {"train_loss": -42.67766189575195, "global_step": 246283, "epoch": 2035} {"train_loss": -43.135555267333984, "global_step": 246284, "epoch": 2035} {"train_loss": -42.429420471191406, "global_step": 246285, "epoch": 2035} {"train_loss": -41.78302764892578, "global_step": 246286, "epoch": 2035} {"train_loss": -42.92063522338867, "global_step": 246287, "epoch": 2035} {"train_loss": -42.97196578979492, "global_step": 246288, "epoch": 2035} {"train_loss": -41.980960845947266, "global_step": 246289, "epoch": 2035} {"train_loss": -42.021728515625, "global_step": 246290, "epoch": 2035} {"train_loss": -42.5947151184082, "global_step": 246291, "epoch": 2035} {"train_loss": -42.33875274658203, "global_step": 246292, "epoch": 2035} {"train_loss": -43.112525939941406, "global_step": 246293, "epoch": 2035} {"train_loss": -42.19444274902344, "global_step": 246294, "epoch": 2035} {"train_loss": -42.982200622558594, "global_step": 246295, "epoch": 2035} {"train_loss": -41.34711837768555, "global_step": 246296, "epoch": 2035} {"train_loss": -41.651241302490234, "global_step": 246297, "epoch": 2035} {"train_loss": -41.94965744018555, "global_step": 246298, "epoch": 2035} {"train_loss": -41.12557601928711, "global_step": 246299, "epoch": 2035} {"train_loss": -41.987850189208984, "global_step": 246300, "epoch": 2035} {"train_loss": -40.90050506591797, "global_step": 246301, "epoch": 2035} {"train_loss": -42.049278259277344, "global_step": 246302, "epoch": 2035} {"train_loss": -42.532649993896484, "global_step": 246303, "epoch": 2035} {"train_loss": -41.497737884521484, "global_step": 246304, "epoch": 2035} {"train_loss": -41.59914016723633, "global_step": 246305, "epoch": 2035} {"train_loss": -41.42348098754883, "global_step": 246306, "epoch": 2035} {"train_loss": -41.98055648803711, "global_step": 246307, "epoch": 2035} {"train_loss": -42.737892150878906, "global_step": 246308, "epoch": 2035} {"train_loss": -41.673336029052734, "global_step": 246309, "epoch": 2035} {"train_loss": -42.57931900024414, "global_step": 246310, "epoch": 2035} {"train_loss": -41.53049087524414, "global_step": 246311, "epoch": 2035} {"train_loss": -42.802066802978516, "global_step": 246312, "epoch": 2035} {"train_loss": -42.16312789916992, "global_step": 246313, "epoch": 2035} {"train_loss": -42.613712310791016, "global_step": 246314, "epoch": 2035} {"train_loss": -42.55733871459961, "global_step": 246315, "epoch": 2035} {"train_loss": -42.26358413696289, "global_step": 246316, "epoch": 2035} {"train_loss": -42.14602279663086, "global_step": 246317, "epoch": 2035} {"train_loss": -42.66341018676758, "global_step": 246318, "epoch": 2035} {"train_loss": -42.2450065612793, "global_step": 246319, "epoch": 2035} {"train_loss": -42.30019760131836, "global_step": 246320, "epoch": 2035} {"train_loss": -42.40184020996094, "global_step": 246321, "epoch": 2035} {"train_loss": -42.24766159057617, "global_step": 246322, "epoch": 2035} {"train_loss": -41.50324630737305, "global_step": 246323, "epoch": 2035} {"train_loss": -42.629974365234375, "global_step": 246324, "epoch": 2035} {"train_loss": -42.090816497802734, "global_step": 246325, "epoch": 2035} {"train_loss": -40.7490119934082, "global_step": 246326, "epoch": 2035} {"train_loss": -40.52368927001953, "global_step": 246327, "epoch": 2035} {"train_loss": -42.20347213745117, "global_step": 246328, "epoch": 2035} {"train_loss": -39.5279541015625, "global_step": 246329, "epoch": 2035} {"train_loss": -40.044960021972656, "global_step": 246330, "epoch": 2035} {"train_loss": -41.497039794921875, "global_step": 246331, "epoch": 2035} {"train_loss": -41.25138473510742, "global_step": 246332, "epoch": 2035} {"train_loss": -42.46120071411133, "global_step": 246333, "epoch": 2035} {"train_loss": -41.70396423339844, "global_step": 246334, "epoch": 2035} {"train_loss": -41.7182502746582, "global_step": 246335, "epoch": 2035} {"train_loss": -41.48583984375, "global_step": 246336, "epoch": 2035} {"train_loss": -40.392269134521484, "global_step": 246337, "epoch": 2035} {"train_loss": -38.179683685302734, "global_step": 246338, "epoch": 2035} {"train_loss": -38.899169921875, "global_step": 246339, "epoch": 2035} {"train_loss": -40.95510482788086, "global_step": 246340, "epoch": 2035} {"train_loss": -40.693851470947266, "global_step": 246341, "epoch": 2035} {"train_loss": -42.064796447753906, "global_step": 246342, "epoch": 2035} {"train_loss": -41.5471305847168, "global_step": 246343, "epoch": 2035} {"train_loss": -41.36393356323242, "global_step": 246344, "epoch": 2035} {"train_loss": -42.20066452026367, "global_step": 246345, "epoch": 2035} {"train_loss": -42.46406173706055, "global_step": 246346, "epoch": 2035} {"train_loss": -41.65919876098633, "global_step": 246347, "epoch": 2035} {"train_loss": -42.32976531982422, "global_step": 246348, "epoch": 2035} {"train_loss": -42.06747817993164, "global_step": 246349, "epoch": 2035} {"train_loss": -41.9764518737793, "global_step": 246350, "epoch": 2035} {"train_loss": -42.56660079956055, "global_step": 246351, "epoch": 2035} {"train_loss": -41.619873046875, "global_step": 246352, "epoch": 2035} {"train_loss": -41.38875961303711, "global_step": 246353, "epoch": 2035} {"train_loss": -42.337013244628906, "global_step": 246354, "epoch": 2035} {"train_loss": -41.80302299940882, "global_step": 246355, "epoch": 2035, "val_loss": 2548410.75} {"train_loss": -42.075748443603516, "global_step": 246356, "epoch": 2036} {"train_loss": -42.107696533203125, "global_step": 246357, "epoch": 2036} {"train_loss": -41.77936553955078, "global_step": 246358, "epoch": 2036} {"train_loss": -42.182289123535156, "global_step": 246359, "epoch": 2036} {"train_loss": -41.867122650146484, "global_step": 246360, "epoch": 2036} {"train_loss": -42.19959259033203, "global_step": 246361, "epoch": 2036} {"train_loss": -41.0992431640625, "global_step": 246362, "epoch": 2036} {"train_loss": -42.748268127441406, "global_step": 246363, "epoch": 2036} {"train_loss": -41.206783294677734, "global_step": 246364, "epoch": 2036} {"train_loss": -41.882259368896484, "global_step": 246365, "epoch": 2036} {"train_loss": -43.0745964050293, "global_step": 246366, "epoch": 2036} {"train_loss": -41.39555740356445, "global_step": 246367, "epoch": 2036} {"train_loss": -41.80924987792969, "global_step": 246368, "epoch": 2036} {"train_loss": -42.890926361083984, "global_step": 246369, "epoch": 2036} {"train_loss": -41.94693374633789, "global_step": 246370, "epoch": 2036} {"train_loss": -42.497737884521484, "global_step": 246371, "epoch": 2036} {"train_loss": -42.77647018432617, "global_step": 246372, "epoch": 2036} {"train_loss": -42.47719192504883, "global_step": 246373, "epoch": 2036} {"train_loss": -42.53049850463867, "global_step": 246374, "epoch": 2036} {"train_loss": -41.7234001159668, "global_step": 246375, "epoch": 2036} {"train_loss": -42.74212646484375, "global_step": 246376, "epoch": 2036} {"train_loss": -40.895782470703125, "global_step": 246377, "epoch": 2036} {"train_loss": -40.45457077026367, "global_step": 246378, "epoch": 2036} {"train_loss": -41.4107666015625, "global_step": 246379, "epoch": 2036} {"train_loss": -41.49597930908203, "global_step": 246380, "epoch": 2036} {"train_loss": -41.124168395996094, "global_step": 246381, "epoch": 2036} {"train_loss": -42.13431930541992, "global_step": 246382, "epoch": 2036} {"train_loss": -40.916168212890625, "global_step": 246383, "epoch": 2036} {"train_loss": -42.972469329833984, "global_step": 246384, "epoch": 2036} {"train_loss": -40.75678634643555, "global_step": 246385, "epoch": 2036} {"train_loss": -41.84465026855469, "global_step": 246386, "epoch": 2036} {"train_loss": -41.28598403930664, "global_step": 246387, "epoch": 2036} {"train_loss": -40.375144958496094, "global_step": 246388, "epoch": 2036} {"train_loss": -42.02580261230469, "global_step": 246389, "epoch": 2036} {"train_loss": -40.74277877807617, "global_step": 246390, "epoch": 2036} {"train_loss": -41.42240524291992, "global_step": 246391, "epoch": 2036} {"train_loss": -40.5732307434082, "global_step": 246392, "epoch": 2036} {"train_loss": -41.13723373413086, "global_step": 246393, "epoch": 2036} {"train_loss": -40.90288162231445, "global_step": 246394, "epoch": 2036} {"train_loss": -40.79132080078125, "global_step": 246395, "epoch": 2036} {"train_loss": -42.20130157470703, "global_step": 246396, "epoch": 2036} {"train_loss": -39.338741302490234, "global_step": 246397, "epoch": 2036} {"train_loss": -42.04452133178711, "global_step": 246398, "epoch": 2036} {"train_loss": -39.806175231933594, "global_step": 246399, "epoch": 2036} {"train_loss": -39.785552978515625, "global_step": 246400, "epoch": 2036} {"train_loss": -41.3260383605957, "global_step": 246401, "epoch": 2036} {"train_loss": -39.78315353393555, "global_step": 246402, "epoch": 2036} {"train_loss": -40.240291595458984, "global_step": 246403, "epoch": 2036} {"train_loss": -41.15824890136719, "global_step": 246404, "epoch": 2036} {"train_loss": -40.425270080566406, "global_step": 246405, "epoch": 2036} {"train_loss": -42.596168518066406, "global_step": 246406, "epoch": 2036} {"train_loss": -40.57349395751953, "global_step": 246407, "epoch": 2036} {"train_loss": -42.002685546875, "global_step": 246408, "epoch": 2036} {"train_loss": -40.93254852294922, "global_step": 246409, "epoch": 2036} {"train_loss": -42.00117111206055, "global_step": 246410, "epoch": 2036} {"train_loss": -41.173553466796875, "global_step": 246411, "epoch": 2036} {"train_loss": -41.08958053588867, "global_step": 246412, "epoch": 2036} {"train_loss": -39.97992706298828, "global_step": 246413, "epoch": 2036} {"train_loss": -40.2755241394043, "global_step": 246414, "epoch": 2036} {"train_loss": -41.776615142822266, "global_step": 246415, "epoch": 2036} {"train_loss": -41.160911560058594, "global_step": 246416, "epoch": 2036} {"train_loss": -41.69277572631836, "global_step": 246417, "epoch": 2036} {"train_loss": -41.449798583984375, "global_step": 246418, "epoch": 2036} {"train_loss": -42.5278434753418, "global_step": 246419, "epoch": 2036} {"train_loss": -41.423316955566406, "global_step": 246420, "epoch": 2036} {"train_loss": -42.440284729003906, "global_step": 246421, "epoch": 2036} {"train_loss": -41.52690887451172, "global_step": 246422, "epoch": 2036} {"train_loss": -42.1085205078125, "global_step": 246423, "epoch": 2036} {"train_loss": -42.160030364990234, "global_step": 246424, "epoch": 2036} {"train_loss": -41.71261215209961, "global_step": 246425, "epoch": 2036} {"train_loss": -42.070457458496094, "global_step": 246426, "epoch": 2036} {"train_loss": -41.14988327026367, "global_step": 246427, "epoch": 2036} {"train_loss": -41.76799011230469, "global_step": 246428, "epoch": 2036} {"train_loss": -42.26356887817383, "global_step": 246429, "epoch": 2036} {"train_loss": -41.6925048828125, "global_step": 246430, "epoch": 2036} {"train_loss": -39.97917175292969, "global_step": 246431, "epoch": 2036} {"train_loss": -40.119667053222656, "global_step": 246432, "epoch": 2036} {"train_loss": -41.84370803833008, "global_step": 246433, "epoch": 2036} {"train_loss": -42.32070541381836, "global_step": 246434, "epoch": 2036} {"train_loss": -41.82899475097656, "global_step": 246435, "epoch": 2036} {"train_loss": -41.8931884765625, "global_step": 246436, "epoch": 2036} {"train_loss": -42.88190841674805, "global_step": 246437, "epoch": 2036} {"train_loss": -41.6164665222168, "global_step": 246438, "epoch": 2036} {"train_loss": -41.0799560546875, "global_step": 246439, "epoch": 2036} {"train_loss": -41.56706619262695, "global_step": 246440, "epoch": 2036} {"train_loss": -42.070621490478516, "global_step": 246441, "epoch": 2036} {"train_loss": -38.741947174072266, "global_step": 246442, "epoch": 2036} {"train_loss": -33.26850509643555, "global_step": 246443, "epoch": 2036} {"train_loss": -36.17046356201172, "global_step": 246444, "epoch": 2036} {"train_loss": -41.40922164916992, "global_step": 246445, "epoch": 2036} {"train_loss": -39.177040100097656, "global_step": 246446, "epoch": 2036} {"train_loss": -37.70161819458008, "global_step": 246447, "epoch": 2036} {"train_loss": -41.44329071044922, "global_step": 246448, "epoch": 2036} {"train_loss": -40.53882598876953, "global_step": 246449, "epoch": 2036} {"train_loss": -40.18160629272461, "global_step": 246450, "epoch": 2036} {"train_loss": -42.316444396972656, "global_step": 246451, "epoch": 2036} {"train_loss": -41.01566696166992, "global_step": 246452, "epoch": 2036} {"train_loss": -42.54990768432617, "global_step": 246453, "epoch": 2036} {"train_loss": -41.199249267578125, "global_step": 246454, "epoch": 2036} {"train_loss": -41.156158447265625, "global_step": 246455, "epoch": 2036} {"train_loss": -41.681392669677734, "global_step": 246456, "epoch": 2036} {"train_loss": -41.955177307128906, "global_step": 246457, "epoch": 2036} {"train_loss": -42.16767501831055, "global_step": 246458, "epoch": 2036} {"train_loss": -41.04157257080078, "global_step": 246459, "epoch": 2036} {"train_loss": -42.49061965942383, "global_step": 246460, "epoch": 2036} {"train_loss": -41.222198486328125, "global_step": 246461, "epoch": 2036} {"train_loss": -42.0273323059082, "global_step": 246462, "epoch": 2036} {"train_loss": -42.45354461669922, "global_step": 246463, "epoch": 2036} {"train_loss": -41.41301345825195, "global_step": 246464, "epoch": 2036} {"train_loss": -41.46644592285156, "global_step": 246465, "epoch": 2036} {"train_loss": -41.646583557128906, "global_step": 246466, "epoch": 2036} {"train_loss": -42.57502365112305, "global_step": 246467, "epoch": 2036} {"train_loss": -42.24137878417969, "global_step": 246468, "epoch": 2036} {"train_loss": -42.41362380981445, "global_step": 246469, "epoch": 2036} {"train_loss": -42.33456039428711, "global_step": 246470, "epoch": 2036} {"train_loss": -42.51433181762695, "global_step": 246471, "epoch": 2036} {"train_loss": -42.10783767700195, "global_step": 246472, "epoch": 2036} {"train_loss": -42.7419548034668, "global_step": 246473, "epoch": 2036} {"train_loss": -42.94529342651367, "global_step": 246474, "epoch": 2036} {"train_loss": -41.98614501953125, "global_step": 246475, "epoch": 2036} {"train_loss": -41.4208165633777, "global_step": 246476, "epoch": 2036, "val_loss": 2519889.25} {"train_loss": -42.71711349487305, "global_step": 246477, "epoch": 2037} {"train_loss": -42.44869613647461, "global_step": 246478, "epoch": 2037} {"train_loss": -40.85232162475586, "global_step": 246479, "epoch": 2037} {"train_loss": -41.80865478515625, "global_step": 246480, "epoch": 2037} {"train_loss": -43.275390625, "global_step": 246481, "epoch": 2037} {"train_loss": -42.66856002807617, "global_step": 246482, "epoch": 2037} {"train_loss": -41.59718704223633, "global_step": 246483, "epoch": 2037} {"train_loss": -42.333587646484375, "global_step": 246484, "epoch": 2037} {"train_loss": -42.260398864746094, "global_step": 246485, "epoch": 2037} {"train_loss": -41.569942474365234, "global_step": 246486, "epoch": 2037} {"train_loss": -41.75643539428711, "global_step": 246487, "epoch": 2037} {"train_loss": -42.65016555786133, "global_step": 246488, "epoch": 2037} {"train_loss": -41.304237365722656, "global_step": 246489, "epoch": 2037} {"train_loss": -42.15979766845703, "global_step": 246490, "epoch": 2037} {"train_loss": -40.03678512573242, "global_step": 246491, "epoch": 2037} {"train_loss": -42.185272216796875, "global_step": 246492, "epoch": 2037} {"train_loss": -41.11691665649414, "global_step": 246493, "epoch": 2037} {"train_loss": -42.052162170410156, "global_step": 246494, "epoch": 2037} {"train_loss": -41.46072006225586, "global_step": 246495, "epoch": 2037} {"train_loss": -41.134029388427734, "global_step": 246496, "epoch": 2037} {"train_loss": -41.452701568603516, "global_step": 246497, "epoch": 2037} {"train_loss": -41.050777435302734, "global_step": 246498, "epoch": 2037} {"train_loss": -42.13972473144531, "global_step": 246499, "epoch": 2037} {"train_loss": -41.348846435546875, "global_step": 246500, "epoch": 2037} {"train_loss": -42.08600997924805, "global_step": 246501, "epoch": 2037} {"train_loss": -42.09945297241211, "global_step": 246502, "epoch": 2037} {"train_loss": -42.27947998046875, "global_step": 246503, "epoch": 2037} {"train_loss": -43.00360870361328, "global_step": 246504, "epoch": 2037} {"train_loss": -41.59678268432617, "global_step": 246505, "epoch": 2037} {"train_loss": -42.62751007080078, "global_step": 246506, "epoch": 2037} {"train_loss": -42.9517707824707, "global_step": 246507, "epoch": 2037} {"train_loss": -42.14805603027344, "global_step": 246508, "epoch": 2037} {"train_loss": -42.394874572753906, "global_step": 246509, "epoch": 2037} {"train_loss": -42.89644241333008, "global_step": 246510, "epoch": 2037} {"train_loss": -42.73298263549805, "global_step": 246511, "epoch": 2037} {"train_loss": -42.22060012817383, "global_step": 246512, "epoch": 2037} {"train_loss": -43.01206970214844, "global_step": 246513, "epoch": 2037} {"train_loss": -42.67656326293945, "global_step": 246514, "epoch": 2037} {"train_loss": -42.782135009765625, "global_step": 246515, "epoch": 2037} {"train_loss": -42.33571243286133, "global_step": 246516, "epoch": 2037} {"train_loss": -42.08867263793945, "global_step": 246517, "epoch": 2037} {"train_loss": -41.22528076171875, "global_step": 246518, "epoch": 2037} {"train_loss": -41.807674407958984, "global_step": 246519, "epoch": 2037} {"train_loss": -42.64924240112305, "global_step": 246520, "epoch": 2037} {"train_loss": -42.80207061767578, "global_step": 246521, "epoch": 2037} {"train_loss": -42.040279388427734, "global_step": 246522, "epoch": 2037} {"train_loss": -41.88015365600586, "global_step": 246523, "epoch": 2037} {"train_loss": -41.768943786621094, "global_step": 246524, "epoch": 2037} {"train_loss": -43.0355224609375, "global_step": 246525, "epoch": 2037} {"train_loss": -41.8075065612793, "global_step": 246526, "epoch": 2037} {"train_loss": -41.35389709472656, "global_step": 246527, "epoch": 2037} {"train_loss": -41.093196868896484, "global_step": 246528, "epoch": 2037} {"train_loss": -42.59633255004883, "global_step": 246529, "epoch": 2037} {"train_loss": -42.76650619506836, "global_step": 246530, "epoch": 2037} {"train_loss": -42.13998031616211, "global_step": 246531, "epoch": 2037} {"train_loss": -42.552127838134766, "global_step": 246532, "epoch": 2037} {"train_loss": -42.396888732910156, "global_step": 246533, "epoch": 2037} {"train_loss": -42.520626068115234, "global_step": 246534, "epoch": 2037} {"train_loss": -42.29666519165039, "global_step": 246535, "epoch": 2037} {"train_loss": -42.230316162109375, "global_step": 246536, "epoch": 2037} {"train_loss": -42.59979248046875, "global_step": 246537, "epoch": 2037} {"train_loss": -42.87184524536133, "global_step": 246538, "epoch": 2037} {"train_loss": -41.7366828918457, "global_step": 246539, "epoch": 2037} {"train_loss": -41.54240798950195, "global_step": 246540, "epoch": 2037} {"train_loss": -40.78652572631836, "global_step": 246541, "epoch": 2037} {"train_loss": -42.00872039794922, "global_step": 246542, "epoch": 2037} {"train_loss": -41.889522552490234, "global_step": 246543, "epoch": 2037} {"train_loss": -42.409542083740234, "global_step": 246544, "epoch": 2037} {"train_loss": -42.403106689453125, "global_step": 246545, "epoch": 2037} {"train_loss": -41.902496337890625, "global_step": 246546, "epoch": 2037} {"train_loss": -39.891883850097656, "global_step": 246547, "epoch": 2037} {"train_loss": -36.92106246948242, "global_step": 246548, "epoch": 2037} {"train_loss": -38.58095169067383, "global_step": 246549, "epoch": 2037} {"train_loss": -42.88649368286133, "global_step": 246550, "epoch": 2037} {"train_loss": -40.878173828125, "global_step": 246551, "epoch": 2037} {"train_loss": -40.682655334472656, "global_step": 246552, "epoch": 2037} {"train_loss": -41.579925537109375, "global_step": 246553, "epoch": 2037} {"train_loss": -40.65128707885742, "global_step": 246554, "epoch": 2037} {"train_loss": -41.446014404296875, "global_step": 246555, "epoch": 2037} {"train_loss": -42.10616683959961, "global_step": 246556, "epoch": 2037} {"train_loss": -41.54030990600586, "global_step": 246557, "epoch": 2037} {"train_loss": -41.77146530151367, "global_step": 246558, "epoch": 2037} {"train_loss": -40.678707122802734, "global_step": 246559, "epoch": 2037} {"train_loss": -40.48041915893555, "global_step": 246560, "epoch": 2037} {"train_loss": -40.6590690612793, "global_step": 246561, "epoch": 2037} {"train_loss": -41.67131805419922, "global_step": 246562, "epoch": 2037} {"train_loss": -36.668357849121094, "global_step": 246563, "epoch": 2037} {"train_loss": -42.04686737060547, "global_step": 246564, "epoch": 2037} {"train_loss": -41.241546630859375, "global_step": 246565, "epoch": 2037} {"train_loss": -39.98268508911133, "global_step": 246566, "epoch": 2037} {"train_loss": -41.0256462097168, "global_step": 246567, "epoch": 2037} {"train_loss": -40.86648178100586, "global_step": 246568, "epoch": 2037} {"train_loss": -40.30620193481445, "global_step": 246569, "epoch": 2037} {"train_loss": -41.26040267944336, "global_step": 246570, "epoch": 2037} {"train_loss": -42.17649459838867, "global_step": 246571, "epoch": 2037} {"train_loss": -41.77756118774414, "global_step": 246572, "epoch": 2037} {"train_loss": -41.3065299987793, "global_step": 246573, "epoch": 2037} {"train_loss": -42.23334884643555, "global_step": 246574, "epoch": 2037} {"train_loss": -40.86966323852539, "global_step": 246575, "epoch": 2037} {"train_loss": -41.54734802246094, "global_step": 246576, "epoch": 2037} {"train_loss": -40.98912811279297, "global_step": 246577, "epoch": 2037} {"train_loss": -43.00022506713867, "global_step": 246578, "epoch": 2037} {"train_loss": -41.78350830078125, "global_step": 246579, "epoch": 2037} {"train_loss": -42.206146240234375, "global_step": 246580, "epoch": 2037} {"train_loss": -41.98563003540039, "global_step": 246581, "epoch": 2037} {"train_loss": -42.559913635253906, "global_step": 246582, "epoch": 2037} {"train_loss": -42.4926643371582, "global_step": 246583, "epoch": 2037} {"train_loss": -42.8144645690918, "global_step": 246584, "epoch": 2037} {"train_loss": -42.27840805053711, "global_step": 246585, "epoch": 2037} {"train_loss": -42.59004592895508, "global_step": 246586, "epoch": 2037} {"train_loss": -41.35498809814453, "global_step": 246587, "epoch": 2037} {"train_loss": -42.739376068115234, "global_step": 246588, "epoch": 2037} {"train_loss": -41.437347412109375, "global_step": 246589, "epoch": 2037} {"train_loss": -42.739105224609375, "global_step": 246590, "epoch": 2037} {"train_loss": -41.842559814453125, "global_step": 246591, "epoch": 2037} {"train_loss": -41.49966812133789, "global_step": 246592, "epoch": 2037} {"train_loss": -42.950069427490234, "global_step": 246593, "epoch": 2037} {"train_loss": -42.13666534423828, "global_step": 246594, "epoch": 2037} {"train_loss": -43.038330078125, "global_step": 246595, "epoch": 2037} {"train_loss": -42.452789306640625, "global_step": 246596, "epoch": 2037} {"train_loss": -41.8158275824933, "global_step": 246597, "epoch": 2037, "val_loss": 2545283.75} {"train_loss": -42.8040771484375, "global_step": 246598, "epoch": 2038} {"train_loss": -38.780555725097656, "global_step": 246599, "epoch": 2038} {"train_loss": -42.441322326660156, "global_step": 246600, "epoch": 2038} {"train_loss": -42.591705322265625, "global_step": 246601, "epoch": 2038} {"train_loss": -42.84635543823242, "global_step": 246602, "epoch": 2038} {"train_loss": -42.397701263427734, "global_step": 246603, "epoch": 2038} {"train_loss": -42.07991409301758, "global_step": 246604, "epoch": 2038} {"train_loss": -43.05562973022461, "global_step": 246605, "epoch": 2038} {"train_loss": -42.215850830078125, "global_step": 246606, "epoch": 2038} {"train_loss": -42.089866638183594, "global_step": 246607, "epoch": 2038} {"train_loss": -42.464115142822266, "global_step": 246608, "epoch": 2038} {"train_loss": -41.48673629760742, "global_step": 246609, "epoch": 2038} {"train_loss": -41.355712890625, "global_step": 246610, "epoch": 2038} {"train_loss": -42.896392822265625, "global_step": 246611, "epoch": 2038} {"train_loss": -43.056556701660156, "global_step": 246612, "epoch": 2038} {"train_loss": -42.981868743896484, "global_step": 246613, "epoch": 2038} {"train_loss": -42.97211456298828, "global_step": 246614, "epoch": 2038} {"train_loss": -42.53487777709961, "global_step": 246615, "epoch": 2038} {"train_loss": -42.62665939331055, "global_step": 246616, "epoch": 2038} {"train_loss": -42.83513641357422, "global_step": 246617, "epoch": 2038} {"train_loss": -43.02289962768555, "global_step": 246618, "epoch": 2038} {"train_loss": -41.0234489440918, "global_step": 246619, "epoch": 2038} {"train_loss": -42.73146438598633, "global_step": 246620, "epoch": 2038} {"train_loss": -41.955230712890625, "global_step": 246621, "epoch": 2038} {"train_loss": -42.167144775390625, "global_step": 246622, "epoch": 2038} {"train_loss": -42.50224685668945, "global_step": 246623, "epoch": 2038} {"train_loss": -42.13603210449219, "global_step": 246624, "epoch": 2038} {"train_loss": -40.15458679199219, "global_step": 246625, "epoch": 2038} {"train_loss": -42.70615768432617, "global_step": 246626, "epoch": 2038} {"train_loss": -41.95780944824219, "global_step": 246627, "epoch": 2038} {"train_loss": -41.95520782470703, "global_step": 246628, "epoch": 2038} {"train_loss": -40.4483757019043, "global_step": 246629, "epoch": 2038} {"train_loss": -42.64667510986328, "global_step": 246630, "epoch": 2038} {"train_loss": -35.77769470214844, "global_step": 246631, "epoch": 2038} {"train_loss": -42.01105880737305, "global_step": 246632, "epoch": 2038} {"train_loss": -36.47829818725586, "global_step": 246633, "epoch": 2038} {"train_loss": -41.83452224731445, "global_step": 246634, "epoch": 2038} {"train_loss": -39.27816390991211, "global_step": 246635, "epoch": 2038} {"train_loss": -42.90764236450195, "global_step": 246636, "epoch": 2038} {"train_loss": -40.54079055786133, "global_step": 246637, "epoch": 2038} {"train_loss": -39.4000358581543, "global_step": 246638, "epoch": 2038} {"train_loss": -32.552757263183594, "global_step": 246639, "epoch": 2038} {"train_loss": -40.58824157714844, "global_step": 246640, "epoch": 2038} {"train_loss": -41.5831184387207, "global_step": 246641, "epoch": 2038} {"train_loss": -39.84425354003906, "global_step": 246642, "epoch": 2038} {"train_loss": -30.15199089050293, "global_step": 246643, "epoch": 2038} {"train_loss": -36.80574417114258, "global_step": 246644, "epoch": 2038} {"train_loss": -40.69074630737305, "global_step": 246645, "epoch": 2038} {"train_loss": -39.492210388183594, "global_step": 246646, "epoch": 2038} {"train_loss": -38.44997787475586, "global_step": 246647, "epoch": 2038} {"train_loss": -35.51729965209961, "global_step": 246648, "epoch": 2038} {"train_loss": -39.48847579956055, "global_step": 246649, "epoch": 2038} {"train_loss": -33.23011016845703, "global_step": 246650, "epoch": 2038} {"train_loss": -34.796016693115234, "global_step": 246651, "epoch": 2038} {"train_loss": -39.14778518676758, "global_step": 246652, "epoch": 2038} {"train_loss": -40.45160675048828, "global_step": 246653, "epoch": 2038} {"train_loss": -38.222537994384766, "global_step": 246654, "epoch": 2038} {"train_loss": -32.918975830078125, "global_step": 246655, "epoch": 2038} {"train_loss": -40.60750198364258, "global_step": 246656, "epoch": 2038} {"train_loss": -40.588722229003906, "global_step": 246657, "epoch": 2038} {"train_loss": -39.26374053955078, "global_step": 246658, "epoch": 2038} {"train_loss": -38.77057647705078, "global_step": 246659, "epoch": 2038} {"train_loss": -37.790321350097656, "global_step": 246660, "epoch": 2038} {"train_loss": -40.995113372802734, "global_step": 246661, "epoch": 2038} {"train_loss": -39.08372116088867, "global_step": 246662, "epoch": 2038} {"train_loss": -40.73952865600586, "global_step": 246663, "epoch": 2038} {"train_loss": -39.034305572509766, "global_step": 246664, "epoch": 2038} {"train_loss": -39.192359924316406, "global_step": 246665, "epoch": 2038} {"train_loss": -40.34775161743164, "global_step": 246666, "epoch": 2038} {"train_loss": -36.6834716796875, "global_step": 246667, "epoch": 2038} {"train_loss": -39.959999084472656, "global_step": 246668, "epoch": 2038} {"train_loss": -39.85826110839844, "global_step": 246669, "epoch": 2038} {"train_loss": -39.87737274169922, "global_step": 246670, "epoch": 2038} {"train_loss": -40.953495025634766, "global_step": 246671, "epoch": 2038} {"train_loss": -41.011478424072266, "global_step": 246672, "epoch": 2038} {"train_loss": -41.32999038696289, "global_step": 246673, "epoch": 2038} {"train_loss": -38.277034759521484, "global_step": 246674, "epoch": 2038} {"train_loss": -41.70012283325195, "global_step": 246675, "epoch": 2038} {"train_loss": -40.97353744506836, "global_step": 246676, "epoch": 2038} {"train_loss": -40.761817932128906, "global_step": 246677, "epoch": 2038} {"train_loss": -40.61397171020508, "global_step": 246678, "epoch": 2038} {"train_loss": -40.84048080444336, "global_step": 246679, "epoch": 2038} {"train_loss": -40.62989044189453, "global_step": 246680, "epoch": 2038} {"train_loss": -41.46771240234375, "global_step": 246681, "epoch": 2038} {"train_loss": -41.613433837890625, "global_step": 246682, "epoch": 2038} {"train_loss": -40.30866241455078, "global_step": 246683, "epoch": 2038} {"train_loss": -41.36471176147461, "global_step": 246684, "epoch": 2038} {"train_loss": -41.53574752807617, "global_step": 246685, "epoch": 2038} {"train_loss": -41.3033447265625, "global_step": 246686, "epoch": 2038} {"train_loss": -41.803157806396484, "global_step": 246687, "epoch": 2038} {"train_loss": -41.58902359008789, "global_step": 246688, "epoch": 2038} {"train_loss": -41.25897216796875, "global_step": 246689, "epoch": 2038} {"train_loss": -40.335941314697266, "global_step": 246690, "epoch": 2038} {"train_loss": -41.6546630859375, "global_step": 246691, "epoch": 2038} {"train_loss": -41.423213958740234, "global_step": 246692, "epoch": 2038} {"train_loss": -41.077999114990234, "global_step": 246693, "epoch": 2038} {"train_loss": -42.10239791870117, "global_step": 246694, "epoch": 2038} {"train_loss": -41.02219772338867, "global_step": 246695, "epoch": 2038} {"train_loss": -38.86536407470703, "global_step": 246696, "epoch": 2038} {"train_loss": -41.769569396972656, "global_step": 246697, "epoch": 2038} {"train_loss": -41.781776428222656, "global_step": 246698, "epoch": 2038} {"train_loss": -42.50300216674805, "global_step": 246699, "epoch": 2038} {"train_loss": -42.663509368896484, "global_step": 246700, "epoch": 2038} {"train_loss": -41.949527740478516, "global_step": 246701, "epoch": 2038} {"train_loss": -42.15305709838867, "global_step": 246702, "epoch": 2038} {"train_loss": -41.70233917236328, "global_step": 246703, "epoch": 2038} {"train_loss": -42.8993034362793, "global_step": 246704, "epoch": 2038} {"train_loss": -40.84733200073242, "global_step": 246705, "epoch": 2038} {"train_loss": -43.020050048828125, "global_step": 246706, "epoch": 2038} {"train_loss": -42.06429672241211, "global_step": 246707, "epoch": 2038} {"train_loss": -41.190731048583984, "global_step": 246708, "epoch": 2038} {"train_loss": -42.63499069213867, "global_step": 246709, "epoch": 2038} {"train_loss": -42.039695739746094, "global_step": 246710, "epoch": 2038} {"train_loss": -42.91636276245117, "global_step": 246711, "epoch": 2038} {"train_loss": -42.04897689819336, "global_step": 246712, "epoch": 2038} {"train_loss": -42.4636116027832, "global_step": 246713, "epoch": 2038} {"train_loss": -42.17866897583008, "global_step": 246714, "epoch": 2038} {"train_loss": -42.632625579833984, "global_step": 246715, "epoch": 2038} {"train_loss": -42.5413818359375, "global_step": 246716, "epoch": 2038} {"train_loss": -42.081146240234375, "global_step": 246717, "epoch": 2038} {"train_loss": -40.75842340327492, "global_step": 246718, "epoch": 2038, "val_loss": 2557877.0} {"train_loss": -42.0869026184082, "global_step": 246719, "epoch": 2039} {"train_loss": -42.42460632324219, "global_step": 246720, "epoch": 2039} {"train_loss": -42.86587142944336, "global_step": 246721, "epoch": 2039} {"train_loss": -42.46293640136719, "global_step": 246722, "epoch": 2039} {"train_loss": -42.522212982177734, "global_step": 246723, "epoch": 2039} {"train_loss": -41.91917037963867, "global_step": 246724, "epoch": 2039} {"train_loss": -42.93226623535156, "global_step": 246725, "epoch": 2039} {"train_loss": -42.1851806640625, "global_step": 246726, "epoch": 2039} {"train_loss": -42.864898681640625, "global_step": 246727, "epoch": 2039} {"train_loss": -43.01751708984375, "global_step": 246728, "epoch": 2039} {"train_loss": -42.35551071166992, "global_step": 246729, "epoch": 2039} {"train_loss": -43.474609375, "global_step": 246730, "epoch": 2039} {"train_loss": -42.77851486206055, "global_step": 246731, "epoch": 2039} {"train_loss": -42.808753967285156, "global_step": 246732, "epoch": 2039} {"train_loss": -42.4395866394043, "global_step": 246733, "epoch": 2039} {"train_loss": -42.146602630615234, "global_step": 246734, "epoch": 2039} {"train_loss": -41.52393341064453, "global_step": 246735, "epoch": 2039} {"train_loss": -43.207637786865234, "global_step": 246736, "epoch": 2039} {"train_loss": -43.41015625, "global_step": 246737, "epoch": 2039} {"train_loss": -42.60989761352539, "global_step": 246738, "epoch": 2039} {"train_loss": -42.94272994995117, "global_step": 246739, "epoch": 2039} {"train_loss": -43.06510925292969, "global_step": 246740, "epoch": 2039} {"train_loss": -43.4197998046875, "global_step": 246741, "epoch": 2039} {"train_loss": -43.04415512084961, "global_step": 246742, "epoch": 2039} {"train_loss": -42.57651901245117, "global_step": 246743, "epoch": 2039} {"train_loss": -43.03548049926758, "global_step": 246744, "epoch": 2039} {"train_loss": -42.38502502441406, "global_step": 246745, "epoch": 2039} {"train_loss": -42.06781768798828, "global_step": 246746, "epoch": 2039} {"train_loss": -43.08208084106445, "global_step": 246747, "epoch": 2039} {"train_loss": -42.90486145019531, "global_step": 246748, "epoch": 2039} {"train_loss": -41.33327865600586, "global_step": 246749, "epoch": 2039} {"train_loss": -42.49782943725586, "global_step": 246750, "epoch": 2039} {"train_loss": -41.7722282409668, "global_step": 246751, "epoch": 2039} {"train_loss": -42.22760009765625, "global_step": 246752, "epoch": 2039} {"train_loss": -40.24221420288086, "global_step": 246753, "epoch": 2039} {"train_loss": -40.99658203125, "global_step": 246754, "epoch": 2039} {"train_loss": -37.51045608520508, "global_step": 246755, "epoch": 2039} {"train_loss": -33.988853454589844, "global_step": 246756, "epoch": 2039} {"train_loss": -24.796327590942383, "global_step": 246757, "epoch": 2039} {"train_loss": -26.84364891052246, "global_step": 246758, "epoch": 2039} {"train_loss": -37.67303466796875, "global_step": 246759, "epoch": 2039} {"train_loss": -38.78466796875, "global_step": 246760, "epoch": 2039} {"train_loss": -35.14813995361328, "global_step": 246761, "epoch": 2039} {"train_loss": -33.4397087097168, "global_step": 246762, "epoch": 2039} {"train_loss": -34.9738883972168, "global_step": 246763, "epoch": 2039} {"train_loss": -31.989953994750977, "global_step": 246764, "epoch": 2039} {"train_loss": -37.18397903442383, "global_step": 246765, "epoch": 2039} {"train_loss": -33.59572982788086, "global_step": 246766, "epoch": 2039} {"train_loss": -35.103267669677734, "global_step": 246767, "epoch": 2039} {"train_loss": -37.9704704284668, "global_step": 246768, "epoch": 2039} {"train_loss": -31.745502471923828, "global_step": 246769, "epoch": 2039} {"train_loss": -40.0467414855957, "global_step": 246770, "epoch": 2039} {"train_loss": -33.921142578125, "global_step": 246771, "epoch": 2039} {"train_loss": -38.680145263671875, "global_step": 246772, "epoch": 2039} {"train_loss": -36.227657318115234, "global_step": 246773, "epoch": 2039} {"train_loss": -39.91974639892578, "global_step": 246774, "epoch": 2039} {"train_loss": -37.20067596435547, "global_step": 246775, "epoch": 2039} {"train_loss": -39.818763732910156, "global_step": 246776, "epoch": 2039} {"train_loss": -38.205501556396484, "global_step": 246777, "epoch": 2039} {"train_loss": -40.15948486328125, "global_step": 246778, "epoch": 2039} {"train_loss": -38.34914779663086, "global_step": 246779, "epoch": 2039} {"train_loss": -41.3556022644043, "global_step": 246780, "epoch": 2039} {"train_loss": -39.07839584350586, "global_step": 246781, "epoch": 2039} {"train_loss": -39.95363235473633, "global_step": 246782, "epoch": 2039} {"train_loss": -39.85871505737305, "global_step": 246783, "epoch": 2039} {"train_loss": -40.05380630493164, "global_step": 246784, "epoch": 2039} {"train_loss": -40.46502685546875, "global_step": 246785, "epoch": 2039} {"train_loss": -40.16572189331055, "global_step": 246786, "epoch": 2039} {"train_loss": -41.039581298828125, "global_step": 246787, "epoch": 2039} {"train_loss": -39.5292854309082, "global_step": 246788, "epoch": 2039} {"train_loss": -40.71267318725586, "global_step": 246789, "epoch": 2039} {"train_loss": -41.22939682006836, "global_step": 246790, "epoch": 2039} {"train_loss": -41.17014694213867, "global_step": 246791, "epoch": 2039} {"train_loss": -41.611881256103516, "global_step": 246792, "epoch": 2039} {"train_loss": -40.494388580322266, "global_step": 246793, "epoch": 2039} {"train_loss": -40.95575714111328, "global_step": 246794, "epoch": 2039} {"train_loss": -41.69645690917969, "global_step": 246795, "epoch": 2039} {"train_loss": -41.42254638671875, "global_step": 246796, "epoch": 2039} {"train_loss": -40.38491439819336, "global_step": 246797, "epoch": 2039} {"train_loss": -41.15867614746094, "global_step": 246798, "epoch": 2039} {"train_loss": -41.5804443359375, "global_step": 246799, "epoch": 2039} {"train_loss": -41.335540771484375, "global_step": 246800, "epoch": 2039} {"train_loss": -41.695533752441406, "global_step": 246801, "epoch": 2039} {"train_loss": -41.84261703491211, "global_step": 246802, "epoch": 2039} {"train_loss": -41.917415618896484, "global_step": 246803, "epoch": 2039} {"train_loss": -41.751197814941406, "global_step": 246804, "epoch": 2039} {"train_loss": -42.47965621948242, "global_step": 246805, "epoch": 2039} {"train_loss": -41.06238555908203, "global_step": 246806, "epoch": 2039} {"train_loss": -41.47956848144531, "global_step": 246807, "epoch": 2039} {"train_loss": -41.94447708129883, "global_step": 246808, "epoch": 2039} {"train_loss": -41.93040084838867, "global_step": 246809, "epoch": 2039} {"train_loss": -42.584285736083984, "global_step": 246810, "epoch": 2039} {"train_loss": -41.3973274230957, "global_step": 246811, "epoch": 2039} {"train_loss": -41.75467300415039, "global_step": 246812, "epoch": 2039} {"train_loss": -42.64100646972656, "global_step": 246813, "epoch": 2039} {"train_loss": -41.998207092285156, "global_step": 246814, "epoch": 2039} {"train_loss": -42.5833625793457, "global_step": 246815, "epoch": 2039} {"train_loss": -42.522377014160156, "global_step": 246816, "epoch": 2039} {"train_loss": -41.86713790893555, "global_step": 246817, "epoch": 2039} {"train_loss": -42.2908935546875, "global_step": 246818, "epoch": 2039} {"train_loss": -41.8541145324707, "global_step": 246819, "epoch": 2039} {"train_loss": -42.7978515625, "global_step": 246820, "epoch": 2039} {"train_loss": -41.868160247802734, "global_step": 246821, "epoch": 2039} {"train_loss": -42.46586227416992, "global_step": 246822, "epoch": 2039} {"train_loss": -42.20663070678711, "global_step": 246823, "epoch": 2039} {"train_loss": -42.055633544921875, "global_step": 246824, "epoch": 2039} {"train_loss": -43.058773040771484, "global_step": 246825, "epoch": 2039} {"train_loss": -42.50178527832031, "global_step": 246826, "epoch": 2039} {"train_loss": -42.611549377441406, "global_step": 246827, "epoch": 2039} {"train_loss": -42.47593307495117, "global_step": 246828, "epoch": 2039} {"train_loss": -42.97825241088867, "global_step": 246829, "epoch": 2039} {"train_loss": -42.586605072021484, "global_step": 246830, "epoch": 2039} {"train_loss": -42.341548919677734, "global_step": 246831, "epoch": 2039} {"train_loss": -42.764495849609375, "global_step": 246832, "epoch": 2039} {"train_loss": -42.782039642333984, "global_step": 246833, "epoch": 2039} {"train_loss": -43.01813507080078, "global_step": 246834, "epoch": 2039} {"train_loss": -42.871952056884766, "global_step": 246835, "epoch": 2039} {"train_loss": -42.533103942871094, "global_step": 246836, "epoch": 2039} {"train_loss": -42.326236724853516, "global_step": 246837, "epoch": 2039} {"train_loss": -42.72392654418945, "global_step": 246838, "epoch": 2039} {"train_loss": -40.7238905252504, "global_step": 246839, "epoch": 2039, "val_loss": 2537429.0} {"train_loss": -42.799163818359375, "global_step": 246840, "epoch": 2040} {"train_loss": -42.551856994628906, "global_step": 246841, "epoch": 2040} {"train_loss": -42.746395111083984, "global_step": 246842, "epoch": 2040} {"train_loss": -43.08372497558594, "global_step": 246843, "epoch": 2040} {"train_loss": -42.547142028808594, "global_step": 246844, "epoch": 2040} {"train_loss": -42.962623596191406, "global_step": 246845, "epoch": 2040} {"train_loss": -43.0412712097168, "global_step": 246846, "epoch": 2040} {"train_loss": -43.34636688232422, "global_step": 246847, "epoch": 2040} {"train_loss": -42.99177169799805, "global_step": 246848, "epoch": 2040} {"train_loss": -42.72840118408203, "global_step": 246849, "epoch": 2040} {"train_loss": -41.636409759521484, "global_step": 246850, "epoch": 2040} {"train_loss": -43.20331954956055, "global_step": 246851, "epoch": 2040} {"train_loss": -43.420654296875, "global_step": 246852, "epoch": 2040} {"train_loss": -42.61491775512695, "global_step": 246853, "epoch": 2040} {"train_loss": -43.03654861450195, "global_step": 246854, "epoch": 2040} {"train_loss": -43.02195739746094, "global_step": 246855, "epoch": 2040} {"train_loss": -42.08526611328125, "global_step": 246856, "epoch": 2040} {"train_loss": -42.716670989990234, "global_step": 246857, "epoch": 2040} {"train_loss": -41.99613952636719, "global_step": 246858, "epoch": 2040} {"train_loss": -43.737823486328125, "global_step": 246859, "epoch": 2040} {"train_loss": -43.356746673583984, "global_step": 246860, "epoch": 2040} {"train_loss": -42.751522064208984, "global_step": 246861, "epoch": 2040} {"train_loss": -43.26874923706055, "global_step": 246862, "epoch": 2040} {"train_loss": -43.62397766113281, "global_step": 246863, "epoch": 2040} {"train_loss": -43.08384323120117, "global_step": 246864, "epoch": 2040} {"train_loss": -42.67045974731445, "global_step": 246865, "epoch": 2040} {"train_loss": -42.706512451171875, "global_step": 246866, "epoch": 2040} {"train_loss": -43.07014083862305, "global_step": 246867, "epoch": 2040} {"train_loss": -43.56669998168945, "global_step": 246868, "epoch": 2040} {"train_loss": -42.73896408081055, "global_step": 246869, "epoch": 2040} {"train_loss": -42.90528869628906, "global_step": 246870, "epoch": 2040} {"train_loss": -42.9766731262207, "global_step": 246871, "epoch": 2040} {"train_loss": -42.55876541137695, "global_step": 246872, "epoch": 2040} {"train_loss": -43.170654296875, "global_step": 246873, "epoch": 2040} {"train_loss": -42.38336944580078, "global_step": 246874, "epoch": 2040} {"train_loss": -43.56824493408203, "global_step": 246875, "epoch": 2040} {"train_loss": -42.62240982055664, "global_step": 246876, "epoch": 2040} {"train_loss": -41.93902587890625, "global_step": 246877, "epoch": 2040} {"train_loss": -40.89012145996094, "global_step": 246878, "epoch": 2040} {"train_loss": -41.06937026977539, "global_step": 246879, "epoch": 2040} {"train_loss": -42.989952087402344, "global_step": 246880, "epoch": 2040} {"train_loss": -41.98810577392578, "global_step": 246881, "epoch": 2040} {"train_loss": -41.355472564697266, "global_step": 246882, "epoch": 2040} {"train_loss": -40.58879089355469, "global_step": 246883, "epoch": 2040} {"train_loss": -39.881317138671875, "global_step": 246884, "epoch": 2040} {"train_loss": -37.81520080566406, "global_step": 246885, "epoch": 2040} {"train_loss": -38.076961517333984, "global_step": 246886, "epoch": 2040} {"train_loss": -39.502010345458984, "global_step": 246887, "epoch": 2040} {"train_loss": -41.68441390991211, "global_step": 246888, "epoch": 2040} {"train_loss": -40.60663986206055, "global_step": 246889, "epoch": 2040} {"train_loss": -37.49351119995117, "global_step": 246890, "epoch": 2040} {"train_loss": -40.680965423583984, "global_step": 246891, "epoch": 2040} {"train_loss": -40.52163314819336, "global_step": 246892, "epoch": 2040} {"train_loss": -38.572811126708984, "global_step": 246893, "epoch": 2040} {"train_loss": -38.176265716552734, "global_step": 246894, "epoch": 2040} {"train_loss": -42.055633544921875, "global_step": 246895, "epoch": 2040} {"train_loss": -39.98405075073242, "global_step": 246896, "epoch": 2040} {"train_loss": -36.69003677368164, "global_step": 246897, "epoch": 2040} {"train_loss": -40.000946044921875, "global_step": 246898, "epoch": 2040} {"train_loss": -40.07421875, "global_step": 246899, "epoch": 2040} {"train_loss": -37.55759811401367, "global_step": 246900, "epoch": 2040} {"train_loss": -39.25345993041992, "global_step": 246901, "epoch": 2040} {"train_loss": -35.16318893432617, "global_step": 246902, "epoch": 2040} {"train_loss": -37.0641975402832, "global_step": 246903, "epoch": 2040} {"train_loss": -39.07057571411133, "global_step": 246904, "epoch": 2040} {"train_loss": -38.771236419677734, "global_step": 246905, "epoch": 2040} {"train_loss": -37.90631103515625, "global_step": 246906, "epoch": 2040} {"train_loss": -39.24848175048828, "global_step": 246907, "epoch": 2040} {"train_loss": -39.99850082397461, "global_step": 246908, "epoch": 2040} {"train_loss": -39.61555862426758, "global_step": 246909, "epoch": 2040} {"train_loss": -36.100257873535156, "global_step": 246910, "epoch": 2040} {"train_loss": -40.880943298339844, "global_step": 246911, "epoch": 2040} {"train_loss": -39.39345932006836, "global_step": 246912, "epoch": 2040} {"train_loss": -39.27001953125, "global_step": 246913, "epoch": 2040} {"train_loss": -39.563018798828125, "global_step": 246914, "epoch": 2040} {"train_loss": -39.72146224975586, "global_step": 246915, "epoch": 2040} {"train_loss": -37.68190002441406, "global_step": 246916, "epoch": 2040} {"train_loss": -40.913665771484375, "global_step": 246917, "epoch": 2040} {"train_loss": -39.74889373779297, "global_step": 246918, "epoch": 2040} {"train_loss": -40.52851867675781, "global_step": 246919, "epoch": 2040} {"train_loss": -40.29621505737305, "global_step": 246920, "epoch": 2040} {"train_loss": -40.28994369506836, "global_step": 246921, "epoch": 2040} {"train_loss": -40.682762145996094, "global_step": 246922, "epoch": 2040} {"train_loss": -39.49478530883789, "global_step": 246923, "epoch": 2040} {"train_loss": -41.04408645629883, "global_step": 246924, "epoch": 2040} {"train_loss": -38.781349182128906, "global_step": 246925, "epoch": 2040} {"train_loss": -40.866920471191406, "global_step": 246926, "epoch": 2040} {"train_loss": -39.37590408325195, "global_step": 246927, "epoch": 2040} {"train_loss": -39.809139251708984, "global_step": 246928, "epoch": 2040} {"train_loss": -31.560108184814453, "global_step": 246929, "epoch": 2040} {"train_loss": -41.06879806518555, "global_step": 246930, "epoch": 2040} {"train_loss": -37.73108673095703, "global_step": 246931, "epoch": 2040} {"train_loss": -41.04912567138672, "global_step": 246932, "epoch": 2040} {"train_loss": -39.934059143066406, "global_step": 246933, "epoch": 2040} {"train_loss": -36.5234489440918, "global_step": 246934, "epoch": 2040} {"train_loss": -39.06991195678711, "global_step": 246935, "epoch": 2040} {"train_loss": -39.89971160888672, "global_step": 246936, "epoch": 2040} {"train_loss": -39.94575119018555, "global_step": 246937, "epoch": 2040} {"train_loss": -38.776248931884766, "global_step": 246938, "epoch": 2040} {"train_loss": -39.0623893737793, "global_step": 246939, "epoch": 2040} {"train_loss": -37.433528900146484, "global_step": 246940, "epoch": 2040} {"train_loss": -39.46857833862305, "global_step": 246941, "epoch": 2040} {"train_loss": -40.5609016418457, "global_step": 246942, "epoch": 2040} {"train_loss": -41.09383773803711, "global_step": 246943, "epoch": 2040} {"train_loss": -39.61123275756836, "global_step": 246944, "epoch": 2040} {"train_loss": -40.11323928833008, "global_step": 246945, "epoch": 2040} {"train_loss": -39.73929977416992, "global_step": 246946, "epoch": 2040} {"train_loss": -40.529296875, "global_step": 246947, "epoch": 2040} {"train_loss": -38.585819244384766, "global_step": 246948, "epoch": 2040} {"train_loss": -38.3011360168457, "global_step": 246949, "epoch": 2040} {"train_loss": -40.93549728393555, "global_step": 246950, "epoch": 2040} {"train_loss": -39.92171096801758, "global_step": 246951, "epoch": 2040} {"train_loss": -40.47235107421875, "global_step": 246952, "epoch": 2040} {"train_loss": -41.02387237548828, "global_step": 246953, "epoch": 2040} {"train_loss": -40.64748764038086, "global_step": 246954, "epoch": 2040} {"train_loss": -40.592525482177734, "global_step": 246955, "epoch": 2040} {"train_loss": -39.12485885620117, "global_step": 246956, "epoch": 2040} {"train_loss": -40.08192825317383, "global_step": 246957, "epoch": 2040} {"train_loss": -40.66048049926758, "global_step": 246958, "epoch": 2040} {"train_loss": -40.745845794677734, "global_step": 246959, "epoch": 2040} {"train_loss": -40.600874309697424, "global_step": 246960, "epoch": 2040, "val_loss": 2464123.75} {"train_loss": -39.09038543701172, "global_step": 246961, "epoch": 2041} {"train_loss": -40.206600189208984, "global_step": 246962, "epoch": 2041} {"train_loss": -41.808013916015625, "global_step": 246963, "epoch": 2041} {"train_loss": -41.319427490234375, "global_step": 246964, "epoch": 2041} {"train_loss": -41.11448287963867, "global_step": 246965, "epoch": 2041} {"train_loss": -41.072731018066406, "global_step": 246966, "epoch": 2041} {"train_loss": -39.301422119140625, "global_step": 246967, "epoch": 2041} {"train_loss": -41.39978790283203, "global_step": 246968, "epoch": 2041} {"train_loss": -41.26438522338867, "global_step": 246969, "epoch": 2041} {"train_loss": -41.08817672729492, "global_step": 246970, "epoch": 2041} {"train_loss": -41.276344299316406, "global_step": 246971, "epoch": 2041} {"train_loss": -40.73006820678711, "global_step": 246972, "epoch": 2041} {"train_loss": -41.35190963745117, "global_step": 246973, "epoch": 2041} {"train_loss": -40.2777099609375, "global_step": 246974, "epoch": 2041} {"train_loss": -40.288291931152344, "global_step": 246975, "epoch": 2041} {"train_loss": -42.05335998535156, "global_step": 246976, "epoch": 2041} {"train_loss": -39.9653205871582, "global_step": 246977, "epoch": 2041} {"train_loss": -42.307979583740234, "global_step": 246978, "epoch": 2041} {"train_loss": -40.47115707397461, "global_step": 246979, "epoch": 2041} {"train_loss": -41.0026969909668, "global_step": 246980, "epoch": 2041} {"train_loss": -39.05363464355469, "global_step": 246981, "epoch": 2041} {"train_loss": -41.277217864990234, "global_step": 246982, "epoch": 2041} {"train_loss": -39.78558349609375, "global_step": 246983, "epoch": 2041} {"train_loss": -41.29629135131836, "global_step": 246984, "epoch": 2041} {"train_loss": -41.59884262084961, "global_step": 246985, "epoch": 2041} {"train_loss": -41.533626556396484, "global_step": 246986, "epoch": 2041} {"train_loss": -40.90433883666992, "global_step": 246987, "epoch": 2041} {"train_loss": -38.32107162475586, "global_step": 246988, "epoch": 2041} {"train_loss": -41.31792449951172, "global_step": 246989, "epoch": 2041} {"train_loss": -40.31132507324219, "global_step": 246990, "epoch": 2041} {"train_loss": -41.84969711303711, "global_step": 246991, "epoch": 2041} {"train_loss": -41.098514556884766, "global_step": 246992, "epoch": 2041} {"train_loss": -42.06535720825195, "global_step": 246993, "epoch": 2041} {"train_loss": -41.002174377441406, "global_step": 246994, "epoch": 2041} {"train_loss": -41.929561614990234, "global_step": 246995, "epoch": 2041} {"train_loss": -41.559627532958984, "global_step": 246996, "epoch": 2041} {"train_loss": -41.40456771850586, "global_step": 246997, "epoch": 2041} {"train_loss": -41.28779602050781, "global_step": 246998, "epoch": 2041} {"train_loss": -41.87805938720703, "global_step": 246999, "epoch": 2041} {"train_loss": -41.96320724487305, "global_step": 247000, "epoch": 2041} {"train_loss": -40.98447799682617, "global_step": 247001, "epoch": 2041} {"train_loss": -41.67299270629883, "global_step": 247002, "epoch": 2041} {"train_loss": -41.897682189941406, "global_step": 247003, "epoch": 2041} {"train_loss": -41.899776458740234, "global_step": 247004, "epoch": 2041} {"train_loss": -41.335670471191406, "global_step": 247005, "epoch": 2041} {"train_loss": -41.92521667480469, "global_step": 247006, "epoch": 2041} {"train_loss": -42.322025299072266, "global_step": 247007, "epoch": 2041} {"train_loss": -41.13199234008789, "global_step": 247008, "epoch": 2041} {"train_loss": -42.29401779174805, "global_step": 247009, "epoch": 2041} {"train_loss": -41.61235427856445, "global_step": 247010, "epoch": 2041} {"train_loss": -41.878578186035156, "global_step": 247011, "epoch": 2041} {"train_loss": -41.6672248840332, "global_step": 247012, "epoch": 2041} {"train_loss": -42.06752014160156, "global_step": 247013, "epoch": 2041} {"train_loss": -41.862056732177734, "global_step": 247014, "epoch": 2041} {"train_loss": -41.67287826538086, "global_step": 247015, "epoch": 2041} {"train_loss": -42.38102722167969, "global_step": 247016, "epoch": 2041} {"train_loss": -41.53169631958008, "global_step": 247017, "epoch": 2041} {"train_loss": -42.57483673095703, "global_step": 247018, "epoch": 2041} {"train_loss": -41.7718391418457, "global_step": 247019, "epoch": 2041} {"train_loss": -42.6939582824707, "global_step": 247020, "epoch": 2041} {"train_loss": -41.99542999267578, "global_step": 247021, "epoch": 2041} {"train_loss": -42.491363525390625, "global_step": 247022, "epoch": 2041} {"train_loss": -42.00300979614258, "global_step": 247023, "epoch": 2041} {"train_loss": -42.22258758544922, "global_step": 247024, "epoch": 2041} {"train_loss": -42.36111068725586, "global_step": 247025, "epoch": 2041} {"train_loss": -42.04071807861328, "global_step": 247026, "epoch": 2041} {"train_loss": -42.5140495300293, "global_step": 247027, "epoch": 2041} {"train_loss": -42.11849594116211, "global_step": 247028, "epoch": 2041} {"train_loss": -42.349945068359375, "global_step": 247029, "epoch": 2041} {"train_loss": -42.46198272705078, "global_step": 247030, "epoch": 2041} {"train_loss": -42.28894805908203, "global_step": 247031, "epoch": 2041} {"train_loss": -42.54035186767578, "global_step": 247032, "epoch": 2041} {"train_loss": -41.89801025390625, "global_step": 247033, "epoch": 2041} {"train_loss": -41.3304443359375, "global_step": 247034, "epoch": 2041} {"train_loss": -42.60752487182617, "global_step": 247035, "epoch": 2041} {"train_loss": -42.8789176940918, "global_step": 247036, "epoch": 2041} {"train_loss": -38.19340515136719, "global_step": 247037, "epoch": 2041} {"train_loss": -42.26666259765625, "global_step": 247038, "epoch": 2041} {"train_loss": -42.810333251953125, "global_step": 247039, "epoch": 2041} {"train_loss": -41.89310836791992, "global_step": 247040, "epoch": 2041} {"train_loss": -42.669898986816406, "global_step": 247041, "epoch": 2041} {"train_loss": -43.02436447143555, "global_step": 247042, "epoch": 2041} {"train_loss": -42.01334762573242, "global_step": 247043, "epoch": 2041} {"train_loss": -42.7346305847168, "global_step": 247044, "epoch": 2041} {"train_loss": -42.542667388916016, "global_step": 247045, "epoch": 2041} {"train_loss": -42.45819091796875, "global_step": 247046, "epoch": 2041} {"train_loss": -39.74242401123047, "global_step": 247047, "epoch": 2041} {"train_loss": -42.43801498413086, "global_step": 247048, "epoch": 2041} {"train_loss": -42.24402618408203, "global_step": 247049, "epoch": 2041} {"train_loss": -42.93354415893555, "global_step": 247050, "epoch": 2041} {"train_loss": -42.930416107177734, "global_step": 247051, "epoch": 2041} {"train_loss": -42.254669189453125, "global_step": 247052, "epoch": 2041} {"train_loss": -42.80338668823242, "global_step": 247053, "epoch": 2041} {"train_loss": -42.68331527709961, "global_step": 247054, "epoch": 2041} {"train_loss": -42.73093795776367, "global_step": 247055, "epoch": 2041} {"train_loss": -42.812294006347656, "global_step": 247056, "epoch": 2041} {"train_loss": -43.05705261230469, "global_step": 247057, "epoch": 2041} {"train_loss": -41.435848236083984, "global_step": 247058, "epoch": 2041} {"train_loss": -42.52790069580078, "global_step": 247059, "epoch": 2041} {"train_loss": -42.28915023803711, "global_step": 247060, "epoch": 2041} {"train_loss": -42.30652618408203, "global_step": 247061, "epoch": 2041} {"train_loss": -42.103797912597656, "global_step": 247062, "epoch": 2041} {"train_loss": -43.294063568115234, "global_step": 247063, "epoch": 2041} {"train_loss": -42.1654052734375, "global_step": 247064, "epoch": 2041} {"train_loss": -42.13755416870117, "global_step": 247065, "epoch": 2041} {"train_loss": -42.64765167236328, "global_step": 247066, "epoch": 2041} {"train_loss": -42.873260498046875, "global_step": 247067, "epoch": 2041} {"train_loss": -42.58689498901367, "global_step": 247068, "epoch": 2041} {"train_loss": -42.49160385131836, "global_step": 247069, "epoch": 2041} {"train_loss": -42.906394958496094, "global_step": 247070, "epoch": 2041} {"train_loss": -42.25525665283203, "global_step": 247071, "epoch": 2041} {"train_loss": -41.77632522583008, "global_step": 247072, "epoch": 2041} {"train_loss": -42.62215042114258, "global_step": 247073, "epoch": 2041} {"train_loss": -41.59267044067383, "global_step": 247074, "epoch": 2041} {"train_loss": -42.644954681396484, "global_step": 247075, "epoch": 2041} {"train_loss": -42.96560287475586, "global_step": 247076, "epoch": 2041} {"train_loss": -42.67912292480469, "global_step": 247077, "epoch": 2041} {"train_loss": -42.96949005126953, "global_step": 247078, "epoch": 2041} {"train_loss": -41.6701545715332, "global_step": 247079, "epoch": 2041} {"train_loss": -42.973480224609375, "global_step": 247080, "epoch": 2041} {"train_loss": -41.79982990863895, "global_step": 247081, "epoch": 2041, "val_loss": 2514542.25} {"train_loss": -42.48796463012695, "global_step": 247082, "epoch": 2042} {"train_loss": -42.32404708862305, "global_step": 247083, "epoch": 2042} {"train_loss": -42.539703369140625, "global_step": 247084, "epoch": 2042} {"train_loss": -43.2076416015625, "global_step": 247085, "epoch": 2042} {"train_loss": -42.268699645996094, "global_step": 247086, "epoch": 2042} {"train_loss": -41.17030715942383, "global_step": 247087, "epoch": 2042} {"train_loss": -42.22673034667969, "global_step": 247088, "epoch": 2042} {"train_loss": -42.8075065612793, "global_step": 247089, "epoch": 2042} {"train_loss": -41.65317916870117, "global_step": 247090, "epoch": 2042} {"train_loss": -43.104610443115234, "global_step": 247091, "epoch": 2042} {"train_loss": -42.72127151489258, "global_step": 247092, "epoch": 2042} {"train_loss": -40.97324752807617, "global_step": 247093, "epoch": 2042} {"train_loss": -43.269020080566406, "global_step": 247094, "epoch": 2042} {"train_loss": -41.054500579833984, "global_step": 247095, "epoch": 2042} {"train_loss": -42.0560417175293, "global_step": 247096, "epoch": 2042} {"train_loss": -41.93569564819336, "global_step": 247097, "epoch": 2042} {"train_loss": -41.09221267700195, "global_step": 247098, "epoch": 2042} {"train_loss": -40.193668365478516, "global_step": 247099, "epoch": 2042} {"train_loss": -42.42409133911133, "global_step": 247100, "epoch": 2042} {"train_loss": -42.177825927734375, "global_step": 247101, "epoch": 2042} {"train_loss": -41.539302825927734, "global_step": 247102, "epoch": 2042} {"train_loss": -41.90768051147461, "global_step": 247103, "epoch": 2042} {"train_loss": -40.5785026550293, "global_step": 247104, "epoch": 2042} {"train_loss": -42.232879638671875, "global_step": 247105, "epoch": 2042} {"train_loss": -41.106475830078125, "global_step": 247106, "epoch": 2042} {"train_loss": -40.349082946777344, "global_step": 247107, "epoch": 2042} {"train_loss": -40.857173919677734, "global_step": 247108, "epoch": 2042} {"train_loss": -42.05644607543945, "global_step": 247109, "epoch": 2042} {"train_loss": -42.05375289916992, "global_step": 247110, "epoch": 2042} {"train_loss": -41.64701461791992, "global_step": 247111, "epoch": 2042} {"train_loss": -40.39950180053711, "global_step": 247112, "epoch": 2042} {"train_loss": -38.70821762084961, "global_step": 247113, "epoch": 2042} {"train_loss": -39.6667594909668, "global_step": 247114, "epoch": 2042} {"train_loss": -40.27898406982422, "global_step": 247115, "epoch": 2042} {"train_loss": -41.621517181396484, "global_step": 247116, "epoch": 2042} {"train_loss": -41.241058349609375, "global_step": 247117, "epoch": 2042} {"train_loss": -41.08861541748047, "global_step": 247118, "epoch": 2042} {"train_loss": -41.42096710205078, "global_step": 247119, "epoch": 2042} {"train_loss": -42.733680725097656, "global_step": 247120, "epoch": 2042} {"train_loss": -41.47948455810547, "global_step": 247121, "epoch": 2042} {"train_loss": -41.776710510253906, "global_step": 247122, "epoch": 2042} {"train_loss": -42.71977615356445, "global_step": 247123, "epoch": 2042} {"train_loss": -41.29653549194336, "global_step": 247124, "epoch": 2042} {"train_loss": -40.79776382446289, "global_step": 247125, "epoch": 2042} {"train_loss": -41.78971481323242, "global_step": 247126, "epoch": 2042} {"train_loss": -42.92009353637695, "global_step": 247127, "epoch": 2042} {"train_loss": -41.477630615234375, "global_step": 247128, "epoch": 2042} {"train_loss": -41.86132049560547, "global_step": 247129, "epoch": 2042} {"train_loss": -42.38159942626953, "global_step": 247130, "epoch": 2042} {"train_loss": -40.90106964111328, "global_step": 247131, "epoch": 2042} {"train_loss": -38.26242446899414, "global_step": 247132, "epoch": 2042} {"train_loss": -40.11791229248047, "global_step": 247133, "epoch": 2042} {"train_loss": -41.68368148803711, "global_step": 247134, "epoch": 2042} {"train_loss": -40.900390625, "global_step": 247135, "epoch": 2042} {"train_loss": -40.54500961303711, "global_step": 247136, "epoch": 2042} {"train_loss": -41.9911003112793, "global_step": 247137, "epoch": 2042} {"train_loss": -40.51160430908203, "global_step": 247138, "epoch": 2042} {"train_loss": -40.82035446166992, "global_step": 247139, "epoch": 2042} {"train_loss": -40.673858642578125, "global_step": 247140, "epoch": 2042} {"train_loss": -40.32374954223633, "global_step": 247141, "epoch": 2042} {"train_loss": -40.35008239746094, "global_step": 247142, "epoch": 2042} {"train_loss": -40.83528518676758, "global_step": 247143, "epoch": 2042} {"train_loss": -40.80778503417969, "global_step": 247144, "epoch": 2042} {"train_loss": -40.925472259521484, "global_step": 247145, "epoch": 2042} {"train_loss": -41.68873977661133, "global_step": 247146, "epoch": 2042} {"train_loss": -41.28573226928711, "global_step": 247147, "epoch": 2042} {"train_loss": -42.07771682739258, "global_step": 247148, "epoch": 2042} {"train_loss": -40.90447998046875, "global_step": 247149, "epoch": 2042} {"train_loss": -42.270145416259766, "global_step": 247150, "epoch": 2042} {"train_loss": -40.98390197753906, "global_step": 247151, "epoch": 2042} {"train_loss": -41.77010726928711, "global_step": 247152, "epoch": 2042} {"train_loss": -41.64229965209961, "global_step": 247153, "epoch": 2042} {"train_loss": -41.17835235595703, "global_step": 247154, "epoch": 2042} {"train_loss": -42.1376953125, "global_step": 247155, "epoch": 2042} {"train_loss": -41.83481979370117, "global_step": 247156, "epoch": 2042} {"train_loss": -41.87583541870117, "global_step": 247157, "epoch": 2042} {"train_loss": -42.46090316772461, "global_step": 247158, "epoch": 2042} {"train_loss": -41.483001708984375, "global_step": 247159, "epoch": 2042} {"train_loss": -40.843990325927734, "global_step": 247160, "epoch": 2042} {"train_loss": -42.39033889770508, "global_step": 247161, "epoch": 2042} {"train_loss": -41.24745178222656, "global_step": 247162, "epoch": 2042} {"train_loss": -42.816104888916016, "global_step": 247163, "epoch": 2042} {"train_loss": -41.97334671020508, "global_step": 247164, "epoch": 2042} {"train_loss": -41.80447769165039, "global_step": 247165, "epoch": 2042} {"train_loss": -41.39109420776367, "global_step": 247166, "epoch": 2042} {"train_loss": -42.16785430908203, "global_step": 247167, "epoch": 2042} {"train_loss": -42.57404708862305, "global_step": 247168, "epoch": 2042} {"train_loss": -41.913326263427734, "global_step": 247169, "epoch": 2042} {"train_loss": -42.5596923828125, "global_step": 247170, "epoch": 2042} {"train_loss": -42.578407287597656, "global_step": 247171, "epoch": 2042} {"train_loss": -41.58142852783203, "global_step": 247172, "epoch": 2042} {"train_loss": -42.11326217651367, "global_step": 247173, "epoch": 2042} {"train_loss": -42.34920120239258, "global_step": 247174, "epoch": 2042} {"train_loss": -41.742652893066406, "global_step": 247175, "epoch": 2042} {"train_loss": -42.723934173583984, "global_step": 247176, "epoch": 2042} {"train_loss": -42.88838195800781, "global_step": 247177, "epoch": 2042} {"train_loss": -41.95599365234375, "global_step": 247178, "epoch": 2042} {"train_loss": -43.050323486328125, "global_step": 247179, "epoch": 2042} {"train_loss": -42.477970123291016, "global_step": 247180, "epoch": 2042} {"train_loss": -43.02103805541992, "global_step": 247181, "epoch": 2042} {"train_loss": -42.36549758911133, "global_step": 247182, "epoch": 2042} {"train_loss": -43.06267166137695, "global_step": 247183, "epoch": 2042} {"train_loss": -42.68562698364258, "global_step": 247184, "epoch": 2042} {"train_loss": -42.441741943359375, "global_step": 247185, "epoch": 2042} {"train_loss": -42.220497131347656, "global_step": 247186, "epoch": 2042} {"train_loss": -43.28359603881836, "global_step": 247187, "epoch": 2042} {"train_loss": -43.06035614013672, "global_step": 247188, "epoch": 2042} {"train_loss": -42.768455505371094, "global_step": 247189, "epoch": 2042} {"train_loss": -42.989131927490234, "global_step": 247190, "epoch": 2042} {"train_loss": -42.611324310302734, "global_step": 247191, "epoch": 2042} {"train_loss": -42.51191329956055, "global_step": 247192, "epoch": 2042} {"train_loss": -42.35932159423828, "global_step": 247193, "epoch": 2042} {"train_loss": -42.931419372558594, "global_step": 247194, "epoch": 2042} {"train_loss": -42.96240234375, "global_step": 247195, "epoch": 2042} {"train_loss": -42.89760208129883, "global_step": 247196, "epoch": 2042} {"train_loss": -43.02983093261719, "global_step": 247197, "epoch": 2042} {"train_loss": -41.950042724609375, "global_step": 247198, "epoch": 2042} {"train_loss": -43.50728988647461, "global_step": 247199, "epoch": 2042} {"train_loss": -41.35324478149414, "global_step": 247200, "epoch": 2042} {"train_loss": -42.91062545776367, "global_step": 247201, "epoch": 2042} {"train_loss": -41.818423436692925, "global_step": 247202, "epoch": 2042, "val_loss": 2525656.75} {"train_loss": -42.670589447021484, "global_step": 247203, "epoch": 2043} {"train_loss": -42.950313568115234, "global_step": 247204, "epoch": 2043} {"train_loss": -42.457664489746094, "global_step": 247205, "epoch": 2043} {"train_loss": -40.512855529785156, "global_step": 247206, "epoch": 2043} {"train_loss": -43.20882797241211, "global_step": 247207, "epoch": 2043} {"train_loss": -42.66709518432617, "global_step": 247208, "epoch": 2043} {"train_loss": -42.306976318359375, "global_step": 247209, "epoch": 2043} {"train_loss": -43.08842086791992, "global_step": 247210, "epoch": 2043} {"train_loss": -42.57932662963867, "global_step": 247211, "epoch": 2043} {"train_loss": -42.08429718017578, "global_step": 247212, "epoch": 2043} {"train_loss": -42.55719757080078, "global_step": 247213, "epoch": 2043} {"train_loss": -42.95033645629883, "global_step": 247214, "epoch": 2043} {"train_loss": -43.28879165649414, "global_step": 247215, "epoch": 2043} {"train_loss": -42.791603088378906, "global_step": 247216, "epoch": 2043} {"train_loss": -42.19098663330078, "global_step": 247217, "epoch": 2043} {"train_loss": -39.14934539794922, "global_step": 247218, "epoch": 2043} {"train_loss": -42.477752685546875, "global_step": 247219, "epoch": 2043} {"train_loss": -41.96399688720703, "global_step": 247220, "epoch": 2043} {"train_loss": -41.53220748901367, "global_step": 247221, "epoch": 2043} {"train_loss": -41.21905517578125, "global_step": 247222, "epoch": 2043} {"train_loss": -41.82273483276367, "global_step": 247223, "epoch": 2043} {"train_loss": -41.2285041809082, "global_step": 247224, "epoch": 2043} {"train_loss": -42.43004608154297, "global_step": 247225, "epoch": 2043} {"train_loss": -43.01324462890625, "global_step": 247226, "epoch": 2043} {"train_loss": -42.06245040893555, "global_step": 247227, "epoch": 2043} {"train_loss": -41.37581253051758, "global_step": 247228, "epoch": 2043} {"train_loss": -41.86574172973633, "global_step": 247229, "epoch": 2043} {"train_loss": -42.76997756958008, "global_step": 247230, "epoch": 2043} {"train_loss": -43.09632110595703, "global_step": 247231, "epoch": 2043} {"train_loss": -42.16834259033203, "global_step": 247232, "epoch": 2043} {"train_loss": -42.48295211791992, "global_step": 247233, "epoch": 2043} {"train_loss": -41.91169357299805, "global_step": 247234, "epoch": 2043} {"train_loss": -42.00239944458008, "global_step": 247235, "epoch": 2043} {"train_loss": -42.4425163269043, "global_step": 247236, "epoch": 2043} {"train_loss": -42.245845794677734, "global_step": 247237, "epoch": 2043} {"train_loss": -41.56662368774414, "global_step": 247238, "epoch": 2043} {"train_loss": -41.01768112182617, "global_step": 247239, "epoch": 2043} {"train_loss": -42.4302864074707, "global_step": 247240, "epoch": 2043} {"train_loss": -41.71472930908203, "global_step": 247241, "epoch": 2043} {"train_loss": -39.680885314941406, "global_step": 247242, "epoch": 2043} {"train_loss": -40.537261962890625, "global_step": 247243, "epoch": 2043} {"train_loss": -39.7038688659668, "global_step": 247244, "epoch": 2043} {"train_loss": -40.09565353393555, "global_step": 247245, "epoch": 2043} {"train_loss": -41.93943405151367, "global_step": 247246, "epoch": 2043} {"train_loss": -40.69273376464844, "global_step": 247247, "epoch": 2043} {"train_loss": -40.61945724487305, "global_step": 247248, "epoch": 2043} {"train_loss": -41.469276428222656, "global_step": 247249, "epoch": 2043} {"train_loss": -42.48145294189453, "global_step": 247250, "epoch": 2043} {"train_loss": -42.3143310546875, "global_step": 247251, "epoch": 2043} {"train_loss": -40.2672233581543, "global_step": 247252, "epoch": 2043} {"train_loss": -42.260250091552734, "global_step": 247253, "epoch": 2043} {"train_loss": -42.54972457885742, "global_step": 247254, "epoch": 2043} {"train_loss": -41.17607879638672, "global_step": 247255, "epoch": 2043} {"train_loss": -40.36610794067383, "global_step": 247256, "epoch": 2043} {"train_loss": -41.55979537963867, "global_step": 247257, "epoch": 2043} {"train_loss": -41.900611877441406, "global_step": 247258, "epoch": 2043} {"train_loss": -41.15036392211914, "global_step": 247259, "epoch": 2043} {"train_loss": -42.39387130737305, "global_step": 247260, "epoch": 2043} {"train_loss": -41.992088317871094, "global_step": 247261, "epoch": 2043} {"train_loss": -42.33170700073242, "global_step": 247262, "epoch": 2043} {"train_loss": -41.7003288269043, "global_step": 247263, "epoch": 2043} {"train_loss": -41.06276321411133, "global_step": 247264, "epoch": 2043} {"train_loss": -42.12900161743164, "global_step": 247265, "epoch": 2043} {"train_loss": -40.238014221191406, "global_step": 247266, "epoch": 2043} {"train_loss": -41.91176223754883, "global_step": 247267, "epoch": 2043} {"train_loss": -42.25260543823242, "global_step": 247268, "epoch": 2043} {"train_loss": -42.5843505859375, "global_step": 247269, "epoch": 2043} {"train_loss": -42.697296142578125, "global_step": 247270, "epoch": 2043} {"train_loss": -42.93511962890625, "global_step": 247271, "epoch": 2043} {"train_loss": -42.7050666809082, "global_step": 247272, "epoch": 2043} {"train_loss": -42.264461517333984, "global_step": 247273, "epoch": 2043} {"train_loss": -42.23385238647461, "global_step": 247274, "epoch": 2043} {"train_loss": -41.33286666870117, "global_step": 247275, "epoch": 2043} {"train_loss": -42.69965744018555, "global_step": 247276, "epoch": 2043} {"train_loss": -42.11252975463867, "global_step": 247277, "epoch": 2043} {"train_loss": -42.09986877441406, "global_step": 247278, "epoch": 2043} {"train_loss": -42.87949752807617, "global_step": 247279, "epoch": 2043} {"train_loss": -42.433753967285156, "global_step": 247280, "epoch": 2043} {"train_loss": -43.19926071166992, "global_step": 247281, "epoch": 2043} {"train_loss": -43.254920959472656, "global_step": 247282, "epoch": 2043} {"train_loss": -43.14522933959961, "global_step": 247283, "epoch": 2043} {"train_loss": -42.89265441894531, "global_step": 247284, "epoch": 2043} {"train_loss": -42.633724212646484, "global_step": 247285, "epoch": 2043} {"train_loss": -41.97036361694336, "global_step": 247286, "epoch": 2043} {"train_loss": -43.32968521118164, "global_step": 247287, "epoch": 2043} {"train_loss": -42.77296829223633, "global_step": 247288, "epoch": 2043} {"train_loss": -42.24479293823242, "global_step": 247289, "epoch": 2043} {"train_loss": -42.60427474975586, "global_step": 247290, "epoch": 2043} {"train_loss": -43.43171310424805, "global_step": 247291, "epoch": 2043} {"train_loss": -42.423072814941406, "global_step": 247292, "epoch": 2043} {"train_loss": -42.98869705200195, "global_step": 247293, "epoch": 2043} {"train_loss": -42.955810546875, "global_step": 247294, "epoch": 2043} {"train_loss": -42.592933654785156, "global_step": 247295, "epoch": 2043} {"train_loss": -43.09225845336914, "global_step": 247296, "epoch": 2043} {"train_loss": -42.89471435546875, "global_step": 247297, "epoch": 2043} {"train_loss": -42.558319091796875, "global_step": 247298, "epoch": 2043} {"train_loss": -43.0841064453125, "global_step": 247299, "epoch": 2043} {"train_loss": -42.621402740478516, "global_step": 247300, "epoch": 2043} {"train_loss": -42.04921340942383, "global_step": 247301, "epoch": 2043} {"train_loss": -42.83515167236328, "global_step": 247302, "epoch": 2043} {"train_loss": -43.21706771850586, "global_step": 247303, "epoch": 2043} {"train_loss": -41.710533142089844, "global_step": 247304, "epoch": 2043} {"train_loss": -39.943965911865234, "global_step": 247305, "epoch": 2043} {"train_loss": -43.04927444458008, "global_step": 247306, "epoch": 2043} {"train_loss": -41.919158935546875, "global_step": 247307, "epoch": 2043} {"train_loss": -40.51424789428711, "global_step": 247308, "epoch": 2043} {"train_loss": -43.66017532348633, "global_step": 247309, "epoch": 2043} {"train_loss": -43.18788146972656, "global_step": 247310, "epoch": 2043} {"train_loss": -41.772212982177734, "global_step": 247311, "epoch": 2043} {"train_loss": -43.308692932128906, "global_step": 247312, "epoch": 2043} {"train_loss": -42.7398681640625, "global_step": 247313, "epoch": 2043} {"train_loss": -39.99043655395508, "global_step": 247314, "epoch": 2043} {"train_loss": -41.59354782104492, "global_step": 247315, "epoch": 2043} {"train_loss": -41.269500732421875, "global_step": 247316, "epoch": 2043} {"train_loss": -41.326171875, "global_step": 247317, "epoch": 2043} {"train_loss": -42.95716094970703, "global_step": 247318, "epoch": 2043} {"train_loss": -43.30632400512695, "global_step": 247319, "epoch": 2043} {"train_loss": -42.13652038574219, "global_step": 247320, "epoch": 2043} {"train_loss": -43.0704231262207, "global_step": 247321, "epoch": 2043} {"train_loss": -42.83195114135742, "global_step": 247322, "epoch": 2043} {"train_loss": -42.13230703684909, "global_step": 247323, "epoch": 2043, "val_loss": 2531542.75} {"train_loss": -42.869441986083984, "global_step": 247324, "epoch": 2044} {"train_loss": -42.76020050048828, "global_step": 247325, "epoch": 2044} {"train_loss": -42.20913314819336, "global_step": 247326, "epoch": 2044} {"train_loss": -42.667091369628906, "global_step": 247327, "epoch": 2044} {"train_loss": -42.58942794799805, "global_step": 247328, "epoch": 2044} {"train_loss": -43.020050048828125, "global_step": 247329, "epoch": 2044} {"train_loss": -43.476871490478516, "global_step": 247330, "epoch": 2044} {"train_loss": -42.20745849609375, "global_step": 247331, "epoch": 2044} {"train_loss": -41.6175422668457, "global_step": 247332, "epoch": 2044} {"train_loss": -42.9842529296875, "global_step": 247333, "epoch": 2044} {"train_loss": -42.44021224975586, "global_step": 247334, "epoch": 2044} {"train_loss": -42.072608947753906, "global_step": 247335, "epoch": 2044} {"train_loss": -42.59621810913086, "global_step": 247336, "epoch": 2044} {"train_loss": -42.49955368041992, "global_step": 247337, "epoch": 2044} {"train_loss": -41.75986099243164, "global_step": 247338, "epoch": 2044} {"train_loss": -42.442378997802734, "global_step": 247339, "epoch": 2044} {"train_loss": -41.87300491333008, "global_step": 247340, "epoch": 2044} {"train_loss": -41.877193450927734, "global_step": 247341, "epoch": 2044} {"train_loss": -42.56266403198242, "global_step": 247342, "epoch": 2044} {"train_loss": -42.89625930786133, "global_step": 247343, "epoch": 2044} {"train_loss": -42.24945068359375, "global_step": 247344, "epoch": 2044} {"train_loss": -40.68131637573242, "global_step": 247345, "epoch": 2044} {"train_loss": -41.54063415527344, "global_step": 247346, "epoch": 2044} {"train_loss": -41.283843994140625, "global_step": 247347, "epoch": 2044} {"train_loss": -40.01100540161133, "global_step": 247348, "epoch": 2044} {"train_loss": -39.698665618896484, "global_step": 247349, "epoch": 2044} {"train_loss": -42.56608200073242, "global_step": 247350, "epoch": 2044} {"train_loss": -42.26765060424805, "global_step": 247351, "epoch": 2044} {"train_loss": -38.25397491455078, "global_step": 247352, "epoch": 2044} {"train_loss": -37.088619232177734, "global_step": 247353, "epoch": 2044} {"train_loss": -40.614662170410156, "global_step": 247354, "epoch": 2044} {"train_loss": -42.566070556640625, "global_step": 247355, "epoch": 2044} {"train_loss": -39.503997802734375, "global_step": 247356, "epoch": 2044} {"train_loss": -39.62327194213867, "global_step": 247357, "epoch": 2044} {"train_loss": -38.10501480102539, "global_step": 247358, "epoch": 2044} {"train_loss": -40.466064453125, "global_step": 247359, "epoch": 2044} {"train_loss": -39.61106491088867, "global_step": 247360, "epoch": 2044} {"train_loss": -36.47003173828125, "global_step": 247361, "epoch": 2044} {"train_loss": -38.70111083984375, "global_step": 247362, "epoch": 2044} {"train_loss": -35.634822845458984, "global_step": 247363, "epoch": 2044} {"train_loss": -41.092220306396484, "global_step": 247364, "epoch": 2044} {"train_loss": -39.945045471191406, "global_step": 247365, "epoch": 2044} {"train_loss": -35.440460205078125, "global_step": 247366, "epoch": 2044} {"train_loss": -41.8035888671875, "global_step": 247367, "epoch": 2044} {"train_loss": -38.76137924194336, "global_step": 247368, "epoch": 2044} {"train_loss": -41.3518180847168, "global_step": 247369, "epoch": 2044} {"train_loss": -40.1445426940918, "global_step": 247370, "epoch": 2044} {"train_loss": -41.46743392944336, "global_step": 247371, "epoch": 2044} {"train_loss": -40.59836959838867, "global_step": 247372, "epoch": 2044} {"train_loss": -37.78772735595703, "global_step": 247373, "epoch": 2044} {"train_loss": -37.87456130981445, "global_step": 247374, "epoch": 2044} {"train_loss": -37.50191116333008, "global_step": 247375, "epoch": 2044} {"train_loss": -40.3161506652832, "global_step": 247376, "epoch": 2044} {"train_loss": -41.3172492980957, "global_step": 247377, "epoch": 2044} {"train_loss": -40.294891357421875, "global_step": 247378, "epoch": 2044} {"train_loss": -40.57612609863281, "global_step": 247379, "epoch": 2044} {"train_loss": -38.494842529296875, "global_step": 247380, "epoch": 2044} {"train_loss": -41.27525329589844, "global_step": 247381, "epoch": 2044} {"train_loss": -41.1096076965332, "global_step": 247382, "epoch": 2044} {"train_loss": -41.63163757324219, "global_step": 247383, "epoch": 2044} {"train_loss": -41.65321731567383, "global_step": 247384, "epoch": 2044} {"train_loss": -40.251468658447266, "global_step": 247385, "epoch": 2044} {"train_loss": -41.74180221557617, "global_step": 247386, "epoch": 2044} {"train_loss": -40.811737060546875, "global_step": 247387, "epoch": 2044} {"train_loss": -42.03066635131836, "global_step": 247388, "epoch": 2044} {"train_loss": -42.02130126953125, "global_step": 247389, "epoch": 2044} {"train_loss": -41.551666259765625, "global_step": 247390, "epoch": 2044} {"train_loss": -41.75246810913086, "global_step": 247391, "epoch": 2044} {"train_loss": -42.35050582885742, "global_step": 247392, "epoch": 2044} {"train_loss": -42.00310516357422, "global_step": 247393, "epoch": 2044} {"train_loss": -41.19807815551758, "global_step": 247394, "epoch": 2044} {"train_loss": -38.74932861328125, "global_step": 247395, "epoch": 2044} {"train_loss": -41.828582763671875, "global_step": 247396, "epoch": 2044} {"train_loss": -42.81410598754883, "global_step": 247397, "epoch": 2044} {"train_loss": -42.12201690673828, "global_step": 247398, "epoch": 2044} {"train_loss": -41.20623779296875, "global_step": 247399, "epoch": 2044} {"train_loss": -42.09674072265625, "global_step": 247400, "epoch": 2044} {"train_loss": -41.63835906982422, "global_step": 247401, "epoch": 2044} {"train_loss": -42.443546295166016, "global_step": 247402, "epoch": 2044} {"train_loss": -39.419219970703125, "global_step": 247403, "epoch": 2044} {"train_loss": -41.68205642700195, "global_step": 247404, "epoch": 2044} {"train_loss": -42.73881149291992, "global_step": 247405, "epoch": 2044} {"train_loss": -42.00057601928711, "global_step": 247406, "epoch": 2044} {"train_loss": -42.03168869018555, "global_step": 247407, "epoch": 2044} {"train_loss": -42.70766830444336, "global_step": 247408, "epoch": 2044} {"train_loss": -41.21285629272461, "global_step": 247409, "epoch": 2044} {"train_loss": -42.17824935913086, "global_step": 247410, "epoch": 2044} {"train_loss": -41.94664764404297, "global_step": 247411, "epoch": 2044} {"train_loss": -42.06901168823242, "global_step": 247412, "epoch": 2044} {"train_loss": -42.73940658569336, "global_step": 247413, "epoch": 2044} {"train_loss": -42.25394821166992, "global_step": 247414, "epoch": 2044} {"train_loss": -41.85066604614258, "global_step": 247415, "epoch": 2044} {"train_loss": -43.02070236206055, "global_step": 247416, "epoch": 2044} {"train_loss": -42.04810333251953, "global_step": 247417, "epoch": 2044} {"train_loss": -42.36880111694336, "global_step": 247418, "epoch": 2044} {"train_loss": -43.266693115234375, "global_step": 247419, "epoch": 2044} {"train_loss": -42.62138366699219, "global_step": 247420, "epoch": 2044} {"train_loss": -43.353477478027344, "global_step": 247421, "epoch": 2044} {"train_loss": -42.31722640991211, "global_step": 247422, "epoch": 2044} {"train_loss": -42.27177810668945, "global_step": 247423, "epoch": 2044} {"train_loss": -43.11945724487305, "global_step": 247424, "epoch": 2044} {"train_loss": -42.186397552490234, "global_step": 247425, "epoch": 2044} {"train_loss": -42.67802047729492, "global_step": 247426, "epoch": 2044} {"train_loss": -42.75590133666992, "global_step": 247427, "epoch": 2044} {"train_loss": -42.958465576171875, "global_step": 247428, "epoch": 2044} {"train_loss": -41.37331771850586, "global_step": 247429, "epoch": 2044} {"train_loss": -43.144012451171875, "global_step": 247430, "epoch": 2044} {"train_loss": -42.74713134765625, "global_step": 247431, "epoch": 2044} {"train_loss": -43.206085205078125, "global_step": 247432, "epoch": 2044} {"train_loss": -43.377418518066406, "global_step": 247433, "epoch": 2044} {"train_loss": -42.75858688354492, "global_step": 247434, "epoch": 2044} {"train_loss": -43.19525909423828, "global_step": 247435, "epoch": 2044} {"train_loss": -42.645538330078125, "global_step": 247436, "epoch": 2044} {"train_loss": -43.49372100830078, "global_step": 247437, "epoch": 2044} {"train_loss": -43.4457893371582, "global_step": 247438, "epoch": 2044} {"train_loss": -43.368099212646484, "global_step": 247439, "epoch": 2044} {"train_loss": -42.85102081298828, "global_step": 247440, "epoch": 2044} {"train_loss": -42.403133392333984, "global_step": 247441, "epoch": 2044} {"train_loss": -42.827880859375, "global_step": 247442, "epoch": 2044} {"train_loss": -42.51481628417969, "global_step": 247443, "epoch": 2044} {"train_loss": -41.49767700699735, "global_step": 247444, "epoch": 2044, "val_loss": 2576932.75} {"train_loss": -43.587825775146484, "global_step": 247445, "epoch": 2045} {"train_loss": -43.48090362548828, "global_step": 247446, "epoch": 2045} {"train_loss": -43.030548095703125, "global_step": 247447, "epoch": 2045} {"train_loss": -42.992103576660156, "global_step": 247448, "epoch": 2045} {"train_loss": -43.77587127685547, "global_step": 247449, "epoch": 2045} {"train_loss": -42.67694854736328, "global_step": 247450, "epoch": 2045} {"train_loss": -41.89984893798828, "global_step": 247451, "epoch": 2045} {"train_loss": -42.74744415283203, "global_step": 247452, "epoch": 2045} {"train_loss": -43.26274871826172, "global_step": 247453, "epoch": 2045} {"train_loss": -42.384037017822266, "global_step": 247454, "epoch": 2045} {"train_loss": -42.377437591552734, "global_step": 247455, "epoch": 2045} {"train_loss": -42.77183151245117, "global_step": 247456, "epoch": 2045} {"train_loss": -42.870025634765625, "global_step": 247457, "epoch": 2045} {"train_loss": -43.206260681152344, "global_step": 247458, "epoch": 2045} {"train_loss": -42.374977111816406, "global_step": 247459, "epoch": 2045} {"train_loss": -41.9560432434082, "global_step": 247460, "epoch": 2045} {"train_loss": -42.08270263671875, "global_step": 247461, "epoch": 2045} {"train_loss": -41.72477340698242, "global_step": 247462, "epoch": 2045} {"train_loss": -42.16004180908203, "global_step": 247463, "epoch": 2045} {"train_loss": -42.997737884521484, "global_step": 247464, "epoch": 2045} {"train_loss": -42.16884994506836, "global_step": 247465, "epoch": 2045} {"train_loss": -41.45550537109375, "global_step": 247466, "epoch": 2045} {"train_loss": -42.5389518737793, "global_step": 247467, "epoch": 2045} {"train_loss": -40.87199020385742, "global_step": 247468, "epoch": 2045} {"train_loss": -39.63436508178711, "global_step": 247469, "epoch": 2045} {"train_loss": -41.30904769897461, "global_step": 247470, "epoch": 2045} {"train_loss": -39.883201599121094, "global_step": 247471, "epoch": 2045} {"train_loss": -37.80299377441406, "global_step": 247472, "epoch": 2045} {"train_loss": -41.315185546875, "global_step": 247473, "epoch": 2045} {"train_loss": -40.12611389160156, "global_step": 247474, "epoch": 2045} {"train_loss": -38.211029052734375, "global_step": 247475, "epoch": 2045} {"train_loss": -41.775970458984375, "global_step": 247476, "epoch": 2045} {"train_loss": -40.19045639038086, "global_step": 247477, "epoch": 2045} {"train_loss": -39.70534133911133, "global_step": 247478, "epoch": 2045} {"train_loss": -41.553184509277344, "global_step": 247479, "epoch": 2045} {"train_loss": -41.214115142822266, "global_step": 247480, "epoch": 2045} {"train_loss": -41.12675476074219, "global_step": 247481, "epoch": 2045} {"train_loss": -40.24208068847656, "global_step": 247482, "epoch": 2045} {"train_loss": -40.558746337890625, "global_step": 247483, "epoch": 2045} {"train_loss": -40.354427337646484, "global_step": 247484, "epoch": 2045} {"train_loss": -41.845733642578125, "global_step": 247485, "epoch": 2045} {"train_loss": -41.112648010253906, "global_step": 247486, "epoch": 2045} {"train_loss": -41.74384689331055, "global_step": 247487, "epoch": 2045} {"train_loss": -42.218231201171875, "global_step": 247488, "epoch": 2045} {"train_loss": -41.69479751586914, "global_step": 247489, "epoch": 2045} {"train_loss": -42.242305755615234, "global_step": 247490, "epoch": 2045} {"train_loss": -42.49732208251953, "global_step": 247491, "epoch": 2045} {"train_loss": -42.646278381347656, "global_step": 247492, "epoch": 2045} {"train_loss": -42.408363342285156, "global_step": 247493, "epoch": 2045} {"train_loss": -42.18781661987305, "global_step": 247494, "epoch": 2045} {"train_loss": -43.07684326171875, "global_step": 247495, "epoch": 2045} {"train_loss": -42.10784912109375, "global_step": 247496, "epoch": 2045} {"train_loss": -42.70276641845703, "global_step": 247497, "epoch": 2045} {"train_loss": -41.3517951965332, "global_step": 247498, "epoch": 2045} {"train_loss": -43.13496780395508, "global_step": 247499, "epoch": 2045} {"train_loss": -42.289154052734375, "global_step": 247500, "epoch": 2045} {"train_loss": -43.182865142822266, "global_step": 247501, "epoch": 2045} {"train_loss": -43.322357177734375, "global_step": 247502, "epoch": 2045} {"train_loss": -42.46438217163086, "global_step": 247503, "epoch": 2045} {"train_loss": -42.7841682434082, "global_step": 247504, "epoch": 2045} {"train_loss": -43.42878341674805, "global_step": 247505, "epoch": 2045} {"train_loss": -43.31059646606445, "global_step": 247506, "epoch": 2045} {"train_loss": -43.00294876098633, "global_step": 247507, "epoch": 2045} {"train_loss": -42.559051513671875, "global_step": 247508, "epoch": 2045} {"train_loss": -43.36213684082031, "global_step": 247509, "epoch": 2045} {"train_loss": -42.838260650634766, "global_step": 247510, "epoch": 2045} {"train_loss": -42.77244567871094, "global_step": 247511, "epoch": 2045} {"train_loss": -42.794189453125, "global_step": 247512, "epoch": 2045} {"train_loss": -43.33951950073242, "global_step": 247513, "epoch": 2045} {"train_loss": -42.747013092041016, "global_step": 247514, "epoch": 2045} {"train_loss": -43.0252685546875, "global_step": 247515, "epoch": 2045} {"train_loss": -43.167083740234375, "global_step": 247516, "epoch": 2045} {"train_loss": -43.17097091674805, "global_step": 247517, "epoch": 2045} {"train_loss": -42.98542022705078, "global_step": 247518, "epoch": 2045} {"train_loss": -43.401607513427734, "global_step": 247519, "epoch": 2045} {"train_loss": -43.23305130004883, "global_step": 247520, "epoch": 2045} {"train_loss": -42.72080612182617, "global_step": 247521, "epoch": 2045} {"train_loss": -43.55803298950195, "global_step": 247522, "epoch": 2045} {"train_loss": -42.90141677856445, "global_step": 247523, "epoch": 2045} {"train_loss": -42.7985954284668, "global_step": 247524, "epoch": 2045} {"train_loss": -43.582275390625, "global_step": 247525, "epoch": 2045} {"train_loss": -42.35537338256836, "global_step": 247526, "epoch": 2045} {"train_loss": -42.720001220703125, "global_step": 247527, "epoch": 2045} {"train_loss": -42.588863372802734, "global_step": 247528, "epoch": 2045} {"train_loss": -42.61995315551758, "global_step": 247529, "epoch": 2045} {"train_loss": -43.00912094116211, "global_step": 247530, "epoch": 2045} {"train_loss": -41.93966293334961, "global_step": 247531, "epoch": 2045} {"train_loss": -38.4974250793457, "global_step": 247532, "epoch": 2045} {"train_loss": -39.497703552246094, "global_step": 247533, "epoch": 2045} {"train_loss": -42.585540771484375, "global_step": 247534, "epoch": 2045} {"train_loss": -41.9593505859375, "global_step": 247535, "epoch": 2045} {"train_loss": -38.38385009765625, "global_step": 247536, "epoch": 2045} {"train_loss": -36.642879486083984, "global_step": 247537, "epoch": 2045} {"train_loss": -41.39146041870117, "global_step": 247538, "epoch": 2045} {"train_loss": -42.12775802612305, "global_step": 247539, "epoch": 2045} {"train_loss": -33.94468307495117, "global_step": 247540, "epoch": 2045} {"train_loss": -35.80559539794922, "global_step": 247541, "epoch": 2045} {"train_loss": -41.419429779052734, "global_step": 247542, "epoch": 2045} {"train_loss": -37.13630294799805, "global_step": 247543, "epoch": 2045} {"train_loss": -37.488136291503906, "global_step": 247544, "epoch": 2045} {"train_loss": -41.8994140625, "global_step": 247545, "epoch": 2045} {"train_loss": -40.32025146484375, "global_step": 247546, "epoch": 2045} {"train_loss": -41.943748474121094, "global_step": 247547, "epoch": 2045} {"train_loss": -41.782569885253906, "global_step": 247548, "epoch": 2045} {"train_loss": -41.322105407714844, "global_step": 247549, "epoch": 2045} {"train_loss": -42.77212142944336, "global_step": 247550, "epoch": 2045} {"train_loss": -42.40087890625, "global_step": 247551, "epoch": 2045} {"train_loss": -42.104373931884766, "global_step": 247552, "epoch": 2045} {"train_loss": -42.54964065551758, "global_step": 247553, "epoch": 2045} {"train_loss": -42.65141677856445, "global_step": 247554, "epoch": 2045} {"train_loss": -42.052425384521484, "global_step": 247555, "epoch": 2045} {"train_loss": -42.85577392578125, "global_step": 247556, "epoch": 2045} {"train_loss": -42.46798324584961, "global_step": 247557, "epoch": 2045} {"train_loss": -41.04248046875, "global_step": 247558, "epoch": 2045} {"train_loss": -42.33108901977539, "global_step": 247559, "epoch": 2045} {"train_loss": -42.8223876953125, "global_step": 247560, "epoch": 2045} {"train_loss": -42.79593276977539, "global_step": 247561, "epoch": 2045} {"train_loss": -42.74871063232422, "global_step": 247562, "epoch": 2045} {"train_loss": -42.97441101074219, "global_step": 247563, "epoch": 2045} {"train_loss": -43.1158561706543, "global_step": 247564, "epoch": 2045} {"train_loss": -41.88981366748652, "global_step": 247565, "epoch": 2045, "val_loss": 2583191.75} {"train_loss": -42.42537307739258, "global_step": 247566, "epoch": 2046} {"train_loss": -42.53131103515625, "global_step": 247567, "epoch": 2046} {"train_loss": -42.011756896972656, "global_step": 247568, "epoch": 2046} {"train_loss": -39.88589096069336, "global_step": 247569, "epoch": 2046} {"train_loss": -42.28821563720703, "global_step": 247570, "epoch": 2046} {"train_loss": -40.80913162231445, "global_step": 247571, "epoch": 2046} {"train_loss": -42.249488830566406, "global_step": 247572, "epoch": 2046} {"train_loss": -41.0802116394043, "global_step": 247573, "epoch": 2046} {"train_loss": -43.240814208984375, "global_step": 247574, "epoch": 2046} {"train_loss": -41.08321762084961, "global_step": 247575, "epoch": 2046} {"train_loss": -41.97098922729492, "global_step": 247576, "epoch": 2046} {"train_loss": -39.327877044677734, "global_step": 247577, "epoch": 2046} {"train_loss": -41.498191833496094, "global_step": 247578, "epoch": 2046} {"train_loss": -42.81850051879883, "global_step": 247579, "epoch": 2046} {"train_loss": -41.47721862792969, "global_step": 247580, "epoch": 2046} {"train_loss": -41.88737106323242, "global_step": 247581, "epoch": 2046} {"train_loss": -41.80365753173828, "global_step": 247582, "epoch": 2046} {"train_loss": -42.080230712890625, "global_step": 247583, "epoch": 2046} {"train_loss": -41.56605911254883, "global_step": 247584, "epoch": 2046} {"train_loss": -43.05474853515625, "global_step": 247585, "epoch": 2046} {"train_loss": -41.483604431152344, "global_step": 247586, "epoch": 2046} {"train_loss": -41.151580810546875, "global_step": 247587, "epoch": 2046} {"train_loss": -42.719722747802734, "global_step": 247588, "epoch": 2046} {"train_loss": -41.10624313354492, "global_step": 247589, "epoch": 2046} {"train_loss": -41.67062759399414, "global_step": 247590, "epoch": 2046} {"train_loss": -42.36610794067383, "global_step": 247591, "epoch": 2046} {"train_loss": -42.45064163208008, "global_step": 247592, "epoch": 2046} {"train_loss": -42.24177551269531, "global_step": 247593, "epoch": 2046} {"train_loss": -42.25686264038086, "global_step": 247594, "epoch": 2046} {"train_loss": -42.69819259643555, "global_step": 247595, "epoch": 2046} {"train_loss": -42.23919677734375, "global_step": 247596, "epoch": 2046} {"train_loss": -41.819149017333984, "global_step": 247597, "epoch": 2046} {"train_loss": -42.61179733276367, "global_step": 247598, "epoch": 2046} {"train_loss": -42.07343673706055, "global_step": 247599, "epoch": 2046} {"train_loss": -42.57932662963867, "global_step": 247600, "epoch": 2046} {"train_loss": -42.71672058105469, "global_step": 247601, "epoch": 2046} {"train_loss": -43.17546844482422, "global_step": 247602, "epoch": 2046} {"train_loss": -42.64790725708008, "global_step": 247603, "epoch": 2046} {"train_loss": -42.87741470336914, "global_step": 247604, "epoch": 2046} {"train_loss": -43.1888542175293, "global_step": 247605, "epoch": 2046} {"train_loss": -42.59208297729492, "global_step": 247606, "epoch": 2046} {"train_loss": -43.39752960205078, "global_step": 247607, "epoch": 2046} {"train_loss": -43.413387298583984, "global_step": 247608, "epoch": 2046} {"train_loss": -43.22774887084961, "global_step": 247609, "epoch": 2046} {"train_loss": -43.34202194213867, "global_step": 247610, "epoch": 2046} {"train_loss": -42.88755416870117, "global_step": 247611, "epoch": 2046} {"train_loss": -43.1732177734375, "global_step": 247612, "epoch": 2046} {"train_loss": -43.21199417114258, "global_step": 247613, "epoch": 2046} {"train_loss": -42.97780990600586, "global_step": 247614, "epoch": 2046} {"train_loss": -42.1772575378418, "global_step": 247615, "epoch": 2046} {"train_loss": -42.0692024230957, "global_step": 247616, "epoch": 2046} {"train_loss": -42.699066162109375, "global_step": 247617, "epoch": 2046} {"train_loss": -42.93669509887695, "global_step": 247618, "epoch": 2046} {"train_loss": -43.11061477661133, "global_step": 247619, "epoch": 2046} {"train_loss": -42.463523864746094, "global_step": 247620, "epoch": 2046} {"train_loss": -42.5643424987793, "global_step": 247621, "epoch": 2046} {"train_loss": -43.204566955566406, "global_step": 247622, "epoch": 2046} {"train_loss": -42.06103515625, "global_step": 247623, "epoch": 2046} {"train_loss": -41.899696350097656, "global_step": 247624, "epoch": 2046} {"train_loss": -42.03278732299805, "global_step": 247625, "epoch": 2046} {"train_loss": -42.56891632080078, "global_step": 247626, "epoch": 2046} {"train_loss": -41.918983459472656, "global_step": 247627, "epoch": 2046} {"train_loss": -42.2287712097168, "global_step": 247628, "epoch": 2046} {"train_loss": -43.02751922607422, "global_step": 247629, "epoch": 2046} {"train_loss": -43.39754867553711, "global_step": 247630, "epoch": 2046} {"train_loss": -43.0013313293457, "global_step": 247631, "epoch": 2046} {"train_loss": -41.80548095703125, "global_step": 247632, "epoch": 2046} {"train_loss": -43.009857177734375, "global_step": 247633, "epoch": 2046} {"train_loss": -42.539119720458984, "global_step": 247634, "epoch": 2046} {"train_loss": -41.93368148803711, "global_step": 247635, "epoch": 2046} {"train_loss": -42.85097885131836, "global_step": 247636, "epoch": 2046} {"train_loss": -42.83427047729492, "global_step": 247637, "epoch": 2046} {"train_loss": -40.80778884887695, "global_step": 247638, "epoch": 2046} {"train_loss": -40.601436614990234, "global_step": 247639, "epoch": 2046} {"train_loss": -42.91693878173828, "global_step": 247640, "epoch": 2046} {"train_loss": -40.58199691772461, "global_step": 247641, "epoch": 2046} {"train_loss": -40.16031265258789, "global_step": 247642, "epoch": 2046} {"train_loss": -42.50484085083008, "global_step": 247643, "epoch": 2046} {"train_loss": -42.75703811645508, "global_step": 247644, "epoch": 2046} {"train_loss": -39.25643539428711, "global_step": 247645, "epoch": 2046} {"train_loss": -39.323692321777344, "global_step": 247646, "epoch": 2046} {"train_loss": -40.21857452392578, "global_step": 247647, "epoch": 2046} {"train_loss": -40.33918380737305, "global_step": 247648, "epoch": 2046} {"train_loss": -41.51865005493164, "global_step": 247649, "epoch": 2046} {"train_loss": -42.055335998535156, "global_step": 247650, "epoch": 2046} {"train_loss": -39.07502365112305, "global_step": 247651, "epoch": 2046} {"train_loss": -39.11082077026367, "global_step": 247652, "epoch": 2046} {"train_loss": -41.058631896972656, "global_step": 247653, "epoch": 2046} {"train_loss": -40.89247131347656, "global_step": 247654, "epoch": 2046} {"train_loss": -40.90959167480469, "global_step": 247655, "epoch": 2046} {"train_loss": -38.964839935302734, "global_step": 247656, "epoch": 2046} {"train_loss": -41.847408294677734, "global_step": 247657, "epoch": 2046} {"train_loss": -37.0072135925293, "global_step": 247658, "epoch": 2046} {"train_loss": -40.357818603515625, "global_step": 247659, "epoch": 2046} {"train_loss": -39.79076385498047, "global_step": 247660, "epoch": 2046} {"train_loss": -39.755615234375, "global_step": 247661, "epoch": 2046} {"train_loss": -40.198272705078125, "global_step": 247662, "epoch": 2046} {"train_loss": -40.99176025390625, "global_step": 247663, "epoch": 2046} {"train_loss": -38.228816986083984, "global_step": 247664, "epoch": 2046} {"train_loss": -40.7646369934082, "global_step": 247665, "epoch": 2046} {"train_loss": -37.74105453491211, "global_step": 247666, "epoch": 2046} {"train_loss": -35.75442123413086, "global_step": 247667, "epoch": 2046} {"train_loss": -41.03364944458008, "global_step": 247668, "epoch": 2046} {"train_loss": -36.86983871459961, "global_step": 247669, "epoch": 2046} {"train_loss": -39.788936614990234, "global_step": 247670, "epoch": 2046} {"train_loss": -37.5606575012207, "global_step": 247671, "epoch": 2046} {"train_loss": -34.37192916870117, "global_step": 247672, "epoch": 2046} {"train_loss": -41.44991683959961, "global_step": 247673, "epoch": 2046} {"train_loss": -36.663551330566406, "global_step": 247674, "epoch": 2046} {"train_loss": -40.3954963684082, "global_step": 247675, "epoch": 2046} {"train_loss": -38.870018005371094, "global_step": 247676, "epoch": 2046} {"train_loss": -41.113494873046875, "global_step": 247677, "epoch": 2046} {"train_loss": -39.245689392089844, "global_step": 247678, "epoch": 2046} {"train_loss": -40.92678451538086, "global_step": 247679, "epoch": 2046} {"train_loss": -39.41010665893555, "global_step": 247680, "epoch": 2046} {"train_loss": -41.22563552856445, "global_step": 247681, "epoch": 2046} {"train_loss": -40.99506378173828, "global_step": 247682, "epoch": 2046} {"train_loss": -41.126808166503906, "global_step": 247683, "epoch": 2046} {"train_loss": -40.62610626220703, "global_step": 247684, "epoch": 2046} {"train_loss": -41.368282318115234, "global_step": 247685, "epoch": 2046} {"train_loss": -41.37451282217483, "global_step": 247686, "epoch": 2046, "val_loss": 2609677.0} {"train_loss": -41.99813461303711, "global_step": 247687, "epoch": 2047} {"train_loss": -40.44381332397461, "global_step": 247688, "epoch": 2047} {"train_loss": -41.68638229370117, "global_step": 247689, "epoch": 2047} {"train_loss": -40.96531295776367, "global_step": 247690, "epoch": 2047} {"train_loss": -40.7363166809082, "global_step": 247691, "epoch": 2047} {"train_loss": -41.13570785522461, "global_step": 247692, "epoch": 2047} {"train_loss": -40.850311279296875, "global_step": 247693, "epoch": 2047} {"train_loss": -40.80910110473633, "global_step": 247694, "epoch": 2047} {"train_loss": -40.57487106323242, "global_step": 247695, "epoch": 2047} {"train_loss": -42.01445770263672, "global_step": 247696, "epoch": 2047} {"train_loss": -40.471492767333984, "global_step": 247697, "epoch": 2047} {"train_loss": -42.58250045776367, "global_step": 247698, "epoch": 2047} {"train_loss": -40.71360397338867, "global_step": 247699, "epoch": 2047} {"train_loss": -42.48249435424805, "global_step": 247700, "epoch": 2047} {"train_loss": -41.37107467651367, "global_step": 247701, "epoch": 2047} {"train_loss": -42.23832321166992, "global_step": 247702, "epoch": 2047} {"train_loss": -42.41781234741211, "global_step": 247703, "epoch": 2047} {"train_loss": -42.79866409301758, "global_step": 247704, "epoch": 2047} {"train_loss": -42.77197265625, "global_step": 247705, "epoch": 2047} {"train_loss": -42.353023529052734, "global_step": 247706, "epoch": 2047} {"train_loss": -42.82617950439453, "global_step": 247707, "epoch": 2047} {"train_loss": -42.31599807739258, "global_step": 247708, "epoch": 2047} {"train_loss": -42.70093536376953, "global_step": 247709, "epoch": 2047} {"train_loss": -42.512290954589844, "global_step": 247710, "epoch": 2047} {"train_loss": -42.851688385009766, "global_step": 247711, "epoch": 2047} {"train_loss": -42.94343185424805, "global_step": 247712, "epoch": 2047} {"train_loss": -42.74905014038086, "global_step": 247713, "epoch": 2047} {"train_loss": -42.533843994140625, "global_step": 247714, "epoch": 2047} {"train_loss": -43.249427795410156, "global_step": 247715, "epoch": 2047} {"train_loss": -42.86371612548828, "global_step": 247716, "epoch": 2047} {"train_loss": -43.075801849365234, "global_step": 247717, "epoch": 2047} {"train_loss": -42.78840255737305, "global_step": 247718, "epoch": 2047} {"train_loss": -43.09702682495117, "global_step": 247719, "epoch": 2047} {"train_loss": -42.99018096923828, "global_step": 247720, "epoch": 2047} {"train_loss": -43.32965850830078, "global_step": 247721, "epoch": 2047} {"train_loss": -42.91558074951172, "global_step": 247722, "epoch": 2047} {"train_loss": -43.06580352783203, "global_step": 247723, "epoch": 2047} {"train_loss": -43.050819396972656, "global_step": 247724, "epoch": 2047} {"train_loss": -43.16542434692383, "global_step": 247725, "epoch": 2047} {"train_loss": -43.416786193847656, "global_step": 247726, "epoch": 2047} {"train_loss": -43.48325729370117, "global_step": 247727, "epoch": 2047} {"train_loss": -43.26398849487305, "global_step": 247728, "epoch": 2047} {"train_loss": -43.68286895751953, "global_step": 247729, "epoch": 2047} {"train_loss": -43.462554931640625, "global_step": 247730, "epoch": 2047} {"train_loss": -42.71159744262695, "global_step": 247731, "epoch": 2047} {"train_loss": -43.33195114135742, "global_step": 247732, "epoch": 2047} {"train_loss": -43.89310073852539, "global_step": 247733, "epoch": 2047} {"train_loss": -43.117645263671875, "global_step": 247734, "epoch": 2047} {"train_loss": -43.645301818847656, "global_step": 247735, "epoch": 2047} {"train_loss": -43.4025993347168, "global_step": 247736, "epoch": 2047} {"train_loss": -43.80867385864258, "global_step": 247737, "epoch": 2047} {"train_loss": -43.583377838134766, "global_step": 247738, "epoch": 2047} {"train_loss": -43.5431022644043, "global_step": 247739, "epoch": 2047} {"train_loss": -43.52717208862305, "global_step": 247740, "epoch": 2047} {"train_loss": -43.44710922241211, "global_step": 247741, "epoch": 2047} {"train_loss": -43.31021499633789, "global_step": 247742, "epoch": 2047} {"train_loss": -43.766353607177734, "global_step": 247743, "epoch": 2047} {"train_loss": -43.82487869262695, "global_step": 247744, "epoch": 2047} {"train_loss": -43.618743896484375, "global_step": 247745, "epoch": 2047} {"train_loss": -43.72096633911133, "global_step": 247746, "epoch": 2047} {"train_loss": -43.97097396850586, "global_step": 247747, "epoch": 2047} {"train_loss": -43.82247543334961, "global_step": 247748, "epoch": 2047} {"train_loss": -44.22593307495117, "global_step": 247749, "epoch": 2047} {"train_loss": -43.212623596191406, "global_step": 247750, "epoch": 2047} {"train_loss": -43.83897018432617, "global_step": 247751, "epoch": 2047} {"train_loss": -43.05204772949219, "global_step": 247752, "epoch": 2047} {"train_loss": -43.8829231262207, "global_step": 247753, "epoch": 2047} {"train_loss": -43.90402603149414, "global_step": 247754, "epoch": 2047} {"train_loss": -43.52457809448242, "global_step": 247755, "epoch": 2047} {"train_loss": -43.47092056274414, "global_step": 247756, "epoch": 2047} {"train_loss": -44.204750061035156, "global_step": 247757, "epoch": 2047} {"train_loss": -43.93467712402344, "global_step": 247758, "epoch": 2047} {"train_loss": -44.06321334838867, "global_step": 247759, "epoch": 2047} {"train_loss": -43.64970016479492, "global_step": 247760, "epoch": 2047} {"train_loss": -44.02728271484375, "global_step": 247761, "epoch": 2047} {"train_loss": -44.042842864990234, "global_step": 247762, "epoch": 2047} {"train_loss": -43.93955612182617, "global_step": 247763, "epoch": 2047} {"train_loss": -44.252647399902344, "global_step": 247764, "epoch": 2047} {"train_loss": -43.87721633911133, "global_step": 247765, "epoch": 2047} {"train_loss": -43.51072311401367, "global_step": 247766, "epoch": 2047} {"train_loss": -42.35877227783203, "global_step": 247767, "epoch": 2047} {"train_loss": -41.57369613647461, "global_step": 247768, "epoch": 2047} {"train_loss": -41.068641662597656, "global_step": 247769, "epoch": 2047} {"train_loss": -41.306331634521484, "global_step": 247770, "epoch": 2047} {"train_loss": -42.2721061706543, "global_step": 247771, "epoch": 2047} {"train_loss": -43.44376754760742, "global_step": 247772, "epoch": 2047} {"train_loss": -43.63108444213867, "global_step": 247773, "epoch": 2047} {"train_loss": -43.53001022338867, "global_step": 247774, "epoch": 2047} {"train_loss": -43.07888412475586, "global_step": 247775, "epoch": 2047} {"train_loss": -40.820716857910156, "global_step": 247776, "epoch": 2047} {"train_loss": -40.89149856567383, "global_step": 247777, "epoch": 2047} {"train_loss": -41.12226104736328, "global_step": 247778, "epoch": 2047} {"train_loss": -38.38543701171875, "global_step": 247779, "epoch": 2047} {"train_loss": -40.32155990600586, "global_step": 247780, "epoch": 2047} {"train_loss": -42.718505859375, "global_step": 247781, "epoch": 2047} {"train_loss": -42.7451057434082, "global_step": 247782, "epoch": 2047} {"train_loss": -40.66785430908203, "global_step": 247783, "epoch": 2047} {"train_loss": -38.79420852661133, "global_step": 247784, "epoch": 2047} {"train_loss": -41.06235885620117, "global_step": 247785, "epoch": 2047} {"train_loss": -42.80428695678711, "global_step": 247786, "epoch": 2047} {"train_loss": -42.173404693603516, "global_step": 247787, "epoch": 2047} {"train_loss": -41.13065719604492, "global_step": 247788, "epoch": 2047} {"train_loss": -42.40165328979492, "global_step": 247789, "epoch": 2047} {"train_loss": -42.05256271362305, "global_step": 247790, "epoch": 2047} {"train_loss": -41.864315032958984, "global_step": 247791, "epoch": 2047} {"train_loss": -41.360015869140625, "global_step": 247792, "epoch": 2047} {"train_loss": -43.00835037231445, "global_step": 247793, "epoch": 2047} {"train_loss": -42.605228424072266, "global_step": 247794, "epoch": 2047} {"train_loss": -40.973628997802734, "global_step": 247795, "epoch": 2047} {"train_loss": -41.980308532714844, "global_step": 247796, "epoch": 2047} {"train_loss": -40.8805046081543, "global_step": 247797, "epoch": 2047} {"train_loss": -41.018348693847656, "global_step": 247798, "epoch": 2047} {"train_loss": -41.331520080566406, "global_step": 247799, "epoch": 2047} {"train_loss": -41.74884796142578, "global_step": 247800, "epoch": 2047} {"train_loss": -41.210296630859375, "global_step": 247801, "epoch": 2047} {"train_loss": -41.66390609741211, "global_step": 247802, "epoch": 2047} {"train_loss": -41.77022933959961, "global_step": 247803, "epoch": 2047} {"train_loss": -42.33465576171875, "global_step": 247804, "epoch": 2047} {"train_loss": -41.52634811401367, "global_step": 247805, "epoch": 2047} {"train_loss": -41.14854049682617, "global_step": 247806, "epoch": 2047} {"train_loss": -42.52428020130504, "global_step": 247807, "epoch": 2047, "val_loss": 2583504.75} {"train_loss": -40.85719680786133, "global_step": 247808, "epoch": 2048} {"train_loss": -41.28894805908203, "global_step": 247809, "epoch": 2048} {"train_loss": -41.33173370361328, "global_step": 247810, "epoch": 2048} {"train_loss": -41.99897384643555, "global_step": 247811, "epoch": 2048} {"train_loss": -41.16055679321289, "global_step": 247812, "epoch": 2048} {"train_loss": -41.589717864990234, "global_step": 247813, "epoch": 2048} {"train_loss": -41.549415588378906, "global_step": 247814, "epoch": 2048} {"train_loss": -42.342933654785156, "global_step": 247815, "epoch": 2048} {"train_loss": -42.34440612792969, "global_step": 247816, "epoch": 2048} {"train_loss": -41.8565559387207, "global_step": 247817, "epoch": 2048} {"train_loss": -41.573604583740234, "global_step": 247818, "epoch": 2048} {"train_loss": -42.28764724731445, "global_step": 247819, "epoch": 2048} {"train_loss": -42.2129020690918, "global_step": 247820, "epoch": 2048} {"train_loss": -42.3853645324707, "global_step": 247821, "epoch": 2048} {"train_loss": -43.12451934814453, "global_step": 247822, "epoch": 2048} {"train_loss": -42.2928581237793, "global_step": 247823, "epoch": 2048} {"train_loss": -42.706058502197266, "global_step": 247824, "epoch": 2048} {"train_loss": -42.59210205078125, "global_step": 247825, "epoch": 2048} {"train_loss": -42.763885498046875, "global_step": 247826, "epoch": 2048} {"train_loss": -42.98249435424805, "global_step": 247827, "epoch": 2048} {"train_loss": -42.783111572265625, "global_step": 247828, "epoch": 2048} {"train_loss": -42.58114242553711, "global_step": 247829, "epoch": 2048} {"train_loss": -42.685855865478516, "global_step": 247830, "epoch": 2048} {"train_loss": -43.263587951660156, "global_step": 247831, "epoch": 2048} {"train_loss": -42.63911056518555, "global_step": 247832, "epoch": 2048} {"train_loss": -42.88100051879883, "global_step": 247833, "epoch": 2048} {"train_loss": -43.33544158935547, "global_step": 247834, "epoch": 2048} {"train_loss": -43.45802688598633, "global_step": 247835, "epoch": 2048} {"train_loss": -43.333492279052734, "global_step": 247836, "epoch": 2048} {"train_loss": -43.546199798583984, "global_step": 247837, "epoch": 2048} {"train_loss": -43.41118240356445, "global_step": 247838, "epoch": 2048} {"train_loss": -43.30568313598633, "global_step": 247839, "epoch": 2048} {"train_loss": -43.639095306396484, "global_step": 247840, "epoch": 2048} {"train_loss": -43.02982711791992, "global_step": 247841, "epoch": 2048} {"train_loss": -43.60769271850586, "global_step": 247842, "epoch": 2048} {"train_loss": -42.61967849731445, "global_step": 247843, "epoch": 2048} {"train_loss": -43.49054718017578, "global_step": 247844, "epoch": 2048} {"train_loss": -43.57658386230469, "global_step": 247845, "epoch": 2048} {"train_loss": -43.09331130981445, "global_step": 247846, "epoch": 2048} {"train_loss": -43.10982131958008, "global_step": 247847, "epoch": 2048} {"train_loss": -43.462318420410156, "global_step": 247848, "epoch": 2048} {"train_loss": -43.8026008605957, "global_step": 247849, "epoch": 2048} {"train_loss": -42.7723388671875, "global_step": 247850, "epoch": 2048} {"train_loss": -42.77924728393555, "global_step": 247851, "epoch": 2048} {"train_loss": -43.69553756713867, "global_step": 247852, "epoch": 2048} {"train_loss": -43.8761100769043, "global_step": 247853, "epoch": 2048} {"train_loss": -43.302947998046875, "global_step": 247854, "epoch": 2048} {"train_loss": -42.626888275146484, "global_step": 247855, "epoch": 2048} {"train_loss": -43.22840118408203, "global_step": 247856, "epoch": 2048} {"train_loss": -44.06648635864258, "global_step": 247857, "epoch": 2048} {"train_loss": -43.75102233886719, "global_step": 247858, "epoch": 2048} {"train_loss": -43.2685661315918, "global_step": 247859, "epoch": 2048} {"train_loss": -43.53074264526367, "global_step": 247860, "epoch": 2048} {"train_loss": -42.93714141845703, "global_step": 247861, "epoch": 2048} {"train_loss": -42.818172454833984, "global_step": 247862, "epoch": 2048} {"train_loss": -43.411922454833984, "global_step": 247863, "epoch": 2048} {"train_loss": -43.27678298950195, "global_step": 247864, "epoch": 2048} {"train_loss": -43.9468879699707, "global_step": 247865, "epoch": 2048} {"train_loss": -43.33060073852539, "global_step": 247866, "epoch": 2048} {"train_loss": -43.527706146240234, "global_step": 247867, "epoch": 2048} {"train_loss": -43.517494201660156, "global_step": 247868, "epoch": 2048} {"train_loss": -43.77729034423828, "global_step": 247869, "epoch": 2048} {"train_loss": -43.441097259521484, "global_step": 247870, "epoch": 2048} {"train_loss": -43.1662712097168, "global_step": 247871, "epoch": 2048} {"train_loss": -43.12744140625, "global_step": 247872, "epoch": 2048} {"train_loss": -42.761104583740234, "global_step": 247873, "epoch": 2048} {"train_loss": -42.07313919067383, "global_step": 247874, "epoch": 2048} {"train_loss": -41.58663558959961, "global_step": 247875, "epoch": 2048} {"train_loss": -41.78489303588867, "global_step": 247876, "epoch": 2048} {"train_loss": -40.9596061706543, "global_step": 247877, "epoch": 2048} {"train_loss": -41.411556243896484, "global_step": 247878, "epoch": 2048} {"train_loss": -41.38668441772461, "global_step": 247879, "epoch": 2048} {"train_loss": -42.276763916015625, "global_step": 247880, "epoch": 2048} {"train_loss": -43.22267532348633, "global_step": 247881, "epoch": 2048} {"train_loss": -42.78195571899414, "global_step": 247882, "epoch": 2048} {"train_loss": -42.03096389770508, "global_step": 247883, "epoch": 2048} {"train_loss": -42.34990310668945, "global_step": 247884, "epoch": 2048} {"train_loss": -42.8825569152832, "global_step": 247885, "epoch": 2048} {"train_loss": -42.88177490234375, "global_step": 247886, "epoch": 2048} {"train_loss": -41.828304290771484, "global_step": 247887, "epoch": 2048} {"train_loss": -40.97039794921875, "global_step": 247888, "epoch": 2048} {"train_loss": -42.195068359375, "global_step": 247889, "epoch": 2048} {"train_loss": -43.284236907958984, "global_step": 247890, "epoch": 2048} {"train_loss": -41.4595947265625, "global_step": 247891, "epoch": 2048} {"train_loss": -38.531646728515625, "global_step": 247892, "epoch": 2048} {"train_loss": -39.732177734375, "global_step": 247893, "epoch": 2048} {"train_loss": -41.09029769897461, "global_step": 247894, "epoch": 2048} {"train_loss": -42.323238372802734, "global_step": 247895, "epoch": 2048} {"train_loss": -40.535972595214844, "global_step": 247896, "epoch": 2048} {"train_loss": -39.56765365600586, "global_step": 247897, "epoch": 2048} {"train_loss": -39.191993713378906, "global_step": 247898, "epoch": 2048} {"train_loss": -42.77383041381836, "global_step": 247899, "epoch": 2048} {"train_loss": -40.729427337646484, "global_step": 247900, "epoch": 2048} {"train_loss": -39.41126251220703, "global_step": 247901, "epoch": 2048} {"train_loss": -42.04157257080078, "global_step": 247902, "epoch": 2048} {"train_loss": -42.07477951049805, "global_step": 247903, "epoch": 2048} {"train_loss": -38.278053283691406, "global_step": 247904, "epoch": 2048} {"train_loss": -40.971839904785156, "global_step": 247905, "epoch": 2048} {"train_loss": -42.368526458740234, "global_step": 247906, "epoch": 2048} {"train_loss": -40.27403259277344, "global_step": 247907, "epoch": 2048} {"train_loss": -42.28678512573242, "global_step": 247908, "epoch": 2048} {"train_loss": -40.979122161865234, "global_step": 247909, "epoch": 2048} {"train_loss": -40.79235076904297, "global_step": 247910, "epoch": 2048} {"train_loss": -41.17842483520508, "global_step": 247911, "epoch": 2048} {"train_loss": -42.30135726928711, "global_step": 247912, "epoch": 2048} {"train_loss": -41.696044921875, "global_step": 247913, "epoch": 2048} {"train_loss": -39.185821533203125, "global_step": 247914, "epoch": 2048} {"train_loss": -42.74283981323242, "global_step": 247915, "epoch": 2048} {"train_loss": -41.88006591796875, "global_step": 247916, "epoch": 2048} {"train_loss": -40.17499923706055, "global_step": 247917, "epoch": 2048} {"train_loss": -43.10858154296875, "global_step": 247918, "epoch": 2048} {"train_loss": -40.5379753112793, "global_step": 247919, "epoch": 2048} {"train_loss": -40.07855224609375, "global_step": 247920, "epoch": 2048} {"train_loss": -42.9631462097168, "global_step": 247921, "epoch": 2048} {"train_loss": -41.21263122558594, "global_step": 247922, "epoch": 2048} {"train_loss": -42.90654754638672, "global_step": 247923, "epoch": 2048} {"train_loss": -41.672115325927734, "global_step": 247924, "epoch": 2048} {"train_loss": -42.357032775878906, "global_step": 247925, "epoch": 2048} {"train_loss": -42.37569808959961, "global_step": 247926, "epoch": 2048} {"train_loss": -41.25615310668945, "global_step": 247927, "epoch": 2048} {"train_loss": -42.26063291691551, "global_step": 247928, "epoch": 2048, "val_loss": 2556426.75} {"train_loss": -41.84872055053711, "global_step": 247929, "epoch": 2049} {"train_loss": -43.01047897338867, "global_step": 247930, "epoch": 2049} {"train_loss": -42.51191711425781, "global_step": 247931, "epoch": 2049} {"train_loss": -42.903541564941406, "global_step": 247932, "epoch": 2049} {"train_loss": -42.48694610595703, "global_step": 247933, "epoch": 2049} {"train_loss": -42.2024040222168, "global_step": 247934, "epoch": 2049} {"train_loss": -42.75638961791992, "global_step": 247935, "epoch": 2049} {"train_loss": -42.71552276611328, "global_step": 247936, "epoch": 2049} {"train_loss": -42.59489059448242, "global_step": 247937, "epoch": 2049} {"train_loss": -43.12996292114258, "global_step": 247938, "epoch": 2049} {"train_loss": -42.6356315612793, "global_step": 247939, "epoch": 2049} {"train_loss": -43.09526824951172, "global_step": 247940, "epoch": 2049} {"train_loss": -42.24555206298828, "global_step": 247941, "epoch": 2049} {"train_loss": -43.04977035522461, "global_step": 247942, "epoch": 2049} {"train_loss": -43.30335235595703, "global_step": 247943, "epoch": 2049} {"train_loss": -42.73515701293945, "global_step": 247944, "epoch": 2049} {"train_loss": -43.59101486206055, "global_step": 247945, "epoch": 2049} {"train_loss": -42.4649772644043, "global_step": 247946, "epoch": 2049} {"train_loss": -43.01445388793945, "global_step": 247947, "epoch": 2049} {"train_loss": -42.872222900390625, "global_step": 247948, "epoch": 2049} {"train_loss": -43.63557052612305, "global_step": 247949, "epoch": 2049} {"train_loss": -43.295082092285156, "global_step": 247950, "epoch": 2049} {"train_loss": -42.518829345703125, "global_step": 247951, "epoch": 2049} {"train_loss": -43.46702194213867, "global_step": 247952, "epoch": 2049} {"train_loss": -43.193023681640625, "global_step": 247953, "epoch": 2049} {"train_loss": -43.42853546142578, "global_step": 247954, "epoch": 2049} {"train_loss": -43.38560104370117, "global_step": 247955, "epoch": 2049} {"train_loss": -43.69404220581055, "global_step": 247956, "epoch": 2049} {"train_loss": -43.548500061035156, "global_step": 247957, "epoch": 2049} {"train_loss": -43.30131149291992, "global_step": 247958, "epoch": 2049} {"train_loss": -43.619808197021484, "global_step": 247959, "epoch": 2049} {"train_loss": -43.84250259399414, "global_step": 247960, "epoch": 2049} {"train_loss": -43.391883850097656, "global_step": 247961, "epoch": 2049} {"train_loss": -43.70249557495117, "global_step": 247962, "epoch": 2049} {"train_loss": -44.12311935424805, "global_step": 247963, "epoch": 2049} {"train_loss": -42.60472869873047, "global_step": 247964, "epoch": 2049} {"train_loss": -43.95787048339844, "global_step": 247965, "epoch": 2049} {"train_loss": -43.78656768798828, "global_step": 247966, "epoch": 2049} {"train_loss": -43.768802642822266, "global_step": 247967, "epoch": 2049} {"train_loss": -43.7237663269043, "global_step": 247968, "epoch": 2049} {"train_loss": -44.21623992919922, "global_step": 247969, "epoch": 2049} {"train_loss": -43.042606353759766, "global_step": 247970, "epoch": 2049} {"train_loss": -43.609554290771484, "global_step": 247971, "epoch": 2049} {"train_loss": -43.78365707397461, "global_step": 247972, "epoch": 2049} {"train_loss": -43.4427490234375, "global_step": 247973, "epoch": 2049} {"train_loss": -43.27286148071289, "global_step": 247974, "epoch": 2049} {"train_loss": -43.0703010559082, "global_step": 247975, "epoch": 2049} {"train_loss": -43.23958969116211, "global_step": 247976, "epoch": 2049} {"train_loss": -43.735572814941406, "global_step": 247977, "epoch": 2049} {"train_loss": -43.842342376708984, "global_step": 247978, "epoch": 2049} {"train_loss": -42.40665817260742, "global_step": 247979, "epoch": 2049} {"train_loss": -43.62580108642578, "global_step": 247980, "epoch": 2049} {"train_loss": -43.83940124511719, "global_step": 247981, "epoch": 2049} {"train_loss": -43.077388763427734, "global_step": 247982, "epoch": 2049} {"train_loss": -43.2304573059082, "global_step": 247983, "epoch": 2049} {"train_loss": -43.708595275878906, "global_step": 247984, "epoch": 2049} {"train_loss": -43.376129150390625, "global_step": 247985, "epoch": 2049} {"train_loss": -43.3815803527832, "global_step": 247986, "epoch": 2049} {"train_loss": -44.37574005126953, "global_step": 247987, "epoch": 2049} {"train_loss": -44.09624481201172, "global_step": 247988, "epoch": 2049} {"train_loss": -40.8320198059082, "global_step": 247989, "epoch": 2049} {"train_loss": -43.954124450683594, "global_step": 247990, "epoch": 2049} {"train_loss": -43.71045684814453, "global_step": 247991, "epoch": 2049} {"train_loss": -44.05918502807617, "global_step": 247992, "epoch": 2049} {"train_loss": -43.90834426879883, "global_step": 247993, "epoch": 2049} {"train_loss": -43.18500518798828, "global_step": 247994, "epoch": 2049} {"train_loss": -41.694480895996094, "global_step": 247995, "epoch": 2049} {"train_loss": -42.12636947631836, "global_step": 247996, "epoch": 2049} {"train_loss": -42.116146087646484, "global_step": 247997, "epoch": 2049} {"train_loss": -42.798744201660156, "global_step": 247998, "epoch": 2049} {"train_loss": -42.72861862182617, "global_step": 247999, "epoch": 2049} {"train_loss": -42.05314254760742, "global_step": 248000, "epoch": 2049} {"train_loss": -40.29466247558594, "global_step": 248001, "epoch": 2049} {"train_loss": -41.49102783203125, "global_step": 248002, "epoch": 2049} {"train_loss": -43.35400390625, "global_step": 248003, "epoch": 2049} {"train_loss": -41.491241455078125, "global_step": 248004, "epoch": 2049} {"train_loss": -41.956295013427734, "global_step": 248005, "epoch": 2049} {"train_loss": -39.716373443603516, "global_step": 248006, "epoch": 2049} {"train_loss": -42.22956466674805, "global_step": 248007, "epoch": 2049} {"train_loss": -41.991973876953125, "global_step": 248008, "epoch": 2049} {"train_loss": -41.473941802978516, "global_step": 248009, "epoch": 2049} {"train_loss": -41.53608322143555, "global_step": 248010, "epoch": 2049} {"train_loss": -40.844478607177734, "global_step": 248011, "epoch": 2049} {"train_loss": -42.97636032104492, "global_step": 248012, "epoch": 2049} {"train_loss": -41.976356506347656, "global_step": 248013, "epoch": 2049} {"train_loss": -40.63969802856445, "global_step": 248014, "epoch": 2049} {"train_loss": -42.67137908935547, "global_step": 248015, "epoch": 2049} {"train_loss": -41.66478729248047, "global_step": 248016, "epoch": 2049} {"train_loss": -42.177425384521484, "global_step": 248017, "epoch": 2049} {"train_loss": -41.423274993896484, "global_step": 248018, "epoch": 2049} {"train_loss": -42.10877227783203, "global_step": 248019, "epoch": 2049} {"train_loss": -41.24675369262695, "global_step": 248020, "epoch": 2049} {"train_loss": -41.621246337890625, "global_step": 248021, "epoch": 2049} {"train_loss": -41.76902389526367, "global_step": 248022, "epoch": 2049} {"train_loss": -41.374122619628906, "global_step": 248023, "epoch": 2049} {"train_loss": -39.89632797241211, "global_step": 248024, "epoch": 2049} {"train_loss": -40.684505462646484, "global_step": 248025, "epoch": 2049} {"train_loss": -41.80413055419922, "global_step": 248026, "epoch": 2049} {"train_loss": -41.6291389465332, "global_step": 248027, "epoch": 2049} {"train_loss": -42.996761322021484, "global_step": 248028, "epoch": 2049} {"train_loss": -42.24360275268555, "global_step": 248029, "epoch": 2049} {"train_loss": -42.618404388427734, "global_step": 248030, "epoch": 2049} {"train_loss": -37.62250518798828, "global_step": 248031, "epoch": 2049} {"train_loss": -42.31153869628906, "global_step": 248032, "epoch": 2049} {"train_loss": -42.47917175292969, "global_step": 248033, "epoch": 2049} {"train_loss": -41.83256912231445, "global_step": 248034, "epoch": 2049} {"train_loss": -42.814002990722656, "global_step": 248035, "epoch": 2049} {"train_loss": -41.632198333740234, "global_step": 248036, "epoch": 2049} {"train_loss": -42.42924880981445, "global_step": 248037, "epoch": 2049} {"train_loss": -41.970149993896484, "global_step": 248038, "epoch": 2049} {"train_loss": -38.633949279785156, "global_step": 248039, "epoch": 2049} {"train_loss": -41.93316650390625, "global_step": 248040, "epoch": 2049} {"train_loss": -42.574241638183594, "global_step": 248041, "epoch": 2049} {"train_loss": -42.11357498168945, "global_step": 248042, "epoch": 2049} {"train_loss": -41.59260940551758, "global_step": 248043, "epoch": 2049} {"train_loss": -42.80865478515625, "global_step": 248044, "epoch": 2049} {"train_loss": -42.174285888671875, "global_step": 248045, "epoch": 2049} {"train_loss": -40.00484085083008, "global_step": 248046, "epoch": 2049} {"train_loss": -41.77461624145508, "global_step": 248047, "epoch": 2049} {"train_loss": -42.56690979003906, "global_step": 248048, "epoch": 2049} {"train_loss": -42.56522826517909, "global_step": 248049, "epoch": 2049, "val_loss": 2643363.0} {"train_loss": -42.501731872558594, "global_step": 248050, "epoch": 2050} {"train_loss": -41.61609649658203, "global_step": 248051, "epoch": 2050} {"train_loss": -42.580650329589844, "global_step": 248052, "epoch": 2050} {"train_loss": -43.1015739440918, "global_step": 248053, "epoch": 2050} {"train_loss": -43.15769577026367, "global_step": 248054, "epoch": 2050} {"train_loss": -39.4639778137207, "global_step": 248055, "epoch": 2050} {"train_loss": -42.15755844116211, "global_step": 248056, "epoch": 2050} {"train_loss": -43.03962326049805, "global_step": 248057, "epoch": 2050} {"train_loss": -41.64424514770508, "global_step": 248058, "epoch": 2050} {"train_loss": -42.724952697753906, "global_step": 248059, "epoch": 2050} {"train_loss": -42.9692497253418, "global_step": 248060, "epoch": 2050} {"train_loss": -41.98599624633789, "global_step": 248061, "epoch": 2050} {"train_loss": -40.75984573364258, "global_step": 248062, "epoch": 2050} {"train_loss": -39.35776901245117, "global_step": 248063, "epoch": 2050} {"train_loss": -42.81879425048828, "global_step": 248064, "epoch": 2050} {"train_loss": -42.163856506347656, "global_step": 248065, "epoch": 2050} {"train_loss": -42.25294876098633, "global_step": 248066, "epoch": 2050} {"train_loss": -41.994930267333984, "global_step": 248067, "epoch": 2050} {"train_loss": -40.920928955078125, "global_step": 248068, "epoch": 2050} {"train_loss": -41.12744903564453, "global_step": 248069, "epoch": 2050} {"train_loss": -41.79874038696289, "global_step": 248070, "epoch": 2050} {"train_loss": -36.562007904052734, "global_step": 248071, "epoch": 2050} {"train_loss": -41.62291717529297, "global_step": 248072, "epoch": 2050} {"train_loss": -41.39132308959961, "global_step": 248073, "epoch": 2050} {"train_loss": -40.19334030151367, "global_step": 248074, "epoch": 2050} {"train_loss": -41.53890609741211, "global_step": 248075, "epoch": 2050} {"train_loss": -42.680023193359375, "global_step": 248076, "epoch": 2050} {"train_loss": -42.79293441772461, "global_step": 248077, "epoch": 2050} {"train_loss": -38.479164123535156, "global_step": 248078, "epoch": 2050} {"train_loss": -41.4415397644043, "global_step": 248079, "epoch": 2050} {"train_loss": -41.81462478637695, "global_step": 248080, "epoch": 2050} {"train_loss": -41.79414367675781, "global_step": 248081, "epoch": 2050} {"train_loss": -42.12370681762695, "global_step": 248082, "epoch": 2050} {"train_loss": -40.4978141784668, "global_step": 248083, "epoch": 2050} {"train_loss": -42.138771057128906, "global_step": 248084, "epoch": 2050} {"train_loss": -36.459571838378906, "global_step": 248085, "epoch": 2050} {"train_loss": -40.22726058959961, "global_step": 248086, "epoch": 2050} {"train_loss": -40.681121826171875, "global_step": 248087, "epoch": 2050} {"train_loss": -42.119285583496094, "global_step": 248088, "epoch": 2050} {"train_loss": -41.30677795410156, "global_step": 248089, "epoch": 2050} {"train_loss": -33.03568649291992, "global_step": 248090, "epoch": 2050} {"train_loss": -39.95136642456055, "global_step": 248091, "epoch": 2050} {"train_loss": -38.33815383911133, "global_step": 248092, "epoch": 2050} {"train_loss": -36.87510299682617, "global_step": 248093, "epoch": 2050} {"train_loss": -41.31258010864258, "global_step": 248094, "epoch": 2050} {"train_loss": -40.29378890991211, "global_step": 248095, "epoch": 2050} {"train_loss": -40.74679183959961, "global_step": 248096, "epoch": 2050} {"train_loss": -37.4567756652832, "global_step": 248097, "epoch": 2050} {"train_loss": -41.23435592651367, "global_step": 248098, "epoch": 2050} {"train_loss": -37.942256927490234, "global_step": 248099, "epoch": 2050} {"train_loss": -41.02214431762695, "global_step": 248100, "epoch": 2050} {"train_loss": -40.16819381713867, "global_step": 248101, "epoch": 2050} {"train_loss": -40.13865661621094, "global_step": 248102, "epoch": 2050} {"train_loss": -36.592735290527344, "global_step": 248103, "epoch": 2050} {"train_loss": -42.446075439453125, "global_step": 248104, "epoch": 2050} {"train_loss": -40.98456954956055, "global_step": 248105, "epoch": 2050} {"train_loss": -38.76327133178711, "global_step": 248106, "epoch": 2050} {"train_loss": -32.476104736328125, "global_step": 248107, "epoch": 2050} {"train_loss": -39.11124801635742, "global_step": 248108, "epoch": 2050} {"train_loss": -17.27644157409668, "global_step": 248109, "epoch": 2050} {"train_loss": -38.1418571472168, "global_step": 248110, "epoch": 2050} {"train_loss": -37.950374603271484, "global_step": 248111, "epoch": 2050} {"train_loss": -37.74789047241211, "global_step": 248112, "epoch": 2050} {"train_loss": -35.53157043457031, "global_step": 248113, "epoch": 2050} {"train_loss": -40.19301223754883, "global_step": 248114, "epoch": 2050} {"train_loss": -35.16310501098633, "global_step": 248115, "epoch": 2050} {"train_loss": -37.141395568847656, "global_step": 248116, "epoch": 2050} {"train_loss": -35.18280792236328, "global_step": 248117, "epoch": 2050} {"train_loss": -36.11471176147461, "global_step": 248118, "epoch": 2050} {"train_loss": -37.875244140625, "global_step": 248119, "epoch": 2050} {"train_loss": -36.30596923828125, "global_step": 248120, "epoch": 2050} {"train_loss": -36.793819427490234, "global_step": 248121, "epoch": 2050} {"train_loss": -38.07464599609375, "global_step": 248122, "epoch": 2050} {"train_loss": -40.58191680908203, "global_step": 248123, "epoch": 2050} {"train_loss": -40.44613265991211, "global_step": 248124, "epoch": 2050} {"train_loss": -40.937923431396484, "global_step": 248125, "epoch": 2050} {"train_loss": -39.70585250854492, "global_step": 248126, "epoch": 2050} {"train_loss": -37.50215148925781, "global_step": 248127, "epoch": 2050} {"train_loss": -37.359554290771484, "global_step": 248128, "epoch": 2050} {"train_loss": -37.94465637207031, "global_step": 248129, "epoch": 2050} {"train_loss": -40.17840576171875, "global_step": 248130, "epoch": 2050} {"train_loss": -37.94468307495117, "global_step": 248131, "epoch": 2050} {"train_loss": -39.46418380737305, "global_step": 248132, "epoch": 2050} {"train_loss": -40.47453689575195, "global_step": 248133, "epoch": 2050} {"train_loss": -40.61418533325195, "global_step": 248134, "epoch": 2050} {"train_loss": -38.02041244506836, "global_step": 248135, "epoch": 2050} {"train_loss": -40.17147445678711, "global_step": 248136, "epoch": 2050} {"train_loss": -40.1244010925293, "global_step": 248137, "epoch": 2050} {"train_loss": -39.541175842285156, "global_step": 248138, "epoch": 2050} {"train_loss": -40.94956588745117, "global_step": 248139, "epoch": 2050} {"train_loss": -36.24741744995117, "global_step": 248140, "epoch": 2050} {"train_loss": -40.443939208984375, "global_step": 248141, "epoch": 2050} {"train_loss": -39.56462478637695, "global_step": 248142, "epoch": 2050} {"train_loss": -40.40133285522461, "global_step": 248143, "epoch": 2050} {"train_loss": -41.18973159790039, "global_step": 248144, "epoch": 2050} {"train_loss": -41.0811882019043, "global_step": 248145, "epoch": 2050} {"train_loss": -40.93412399291992, "global_step": 248146, "epoch": 2050} {"train_loss": -40.5042839050293, "global_step": 248147, "epoch": 2050} {"train_loss": -40.53221893310547, "global_step": 248148, "epoch": 2050} {"train_loss": -40.49001693725586, "global_step": 248149, "epoch": 2050} {"train_loss": -39.7029914855957, "global_step": 248150, "epoch": 2050} {"train_loss": -41.360958099365234, "global_step": 248151, "epoch": 2050} {"train_loss": -40.81138229370117, "global_step": 248152, "epoch": 2050} {"train_loss": -40.50042724609375, "global_step": 248153, "epoch": 2050} {"train_loss": -40.52298355102539, "global_step": 248154, "epoch": 2050} {"train_loss": -41.68939971923828, "global_step": 248155, "epoch": 2050} {"train_loss": -39.466121673583984, "global_step": 248156, "epoch": 2050} {"train_loss": -41.22898483276367, "global_step": 248157, "epoch": 2050} {"train_loss": -40.187984466552734, "global_step": 248158, "epoch": 2050} {"train_loss": -40.46065902709961, "global_step": 248159, "epoch": 2050} {"train_loss": -40.047691345214844, "global_step": 248160, "epoch": 2050} {"train_loss": -41.54316329956055, "global_step": 248161, "epoch": 2050} {"train_loss": -40.609718322753906, "global_step": 248162, "epoch": 2050} {"train_loss": -40.77995300292969, "global_step": 248163, "epoch": 2050} {"train_loss": -41.19475173950195, "global_step": 248164, "epoch": 2050} {"train_loss": -41.0459098815918, "global_step": 248165, "epoch": 2050} {"train_loss": -41.72761154174805, "global_step": 248166, "epoch": 2050} {"train_loss": -41.9568977355957, "global_step": 248167, "epoch": 2050} {"train_loss": -41.27393341064453, "global_step": 248168, "epoch": 2050} {"train_loss": -41.84882354736328, "global_step": 248169, "epoch": 2050} {"train_loss": -39.89582173686382, "global_step": 248170, "epoch": 2050, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2861503.0} {"train_loss": -42.191505432128906, "global_step": 248171, "epoch": 2051} {"train_loss": -41.88930130004883, "global_step": 248172, "epoch": 2051} {"train_loss": -41.74262237548828, "global_step": 248173, "epoch": 2051} {"train_loss": -40.72746658325195, "global_step": 248174, "epoch": 2051} {"train_loss": -41.735530853271484, "global_step": 248175, "epoch": 2051} {"train_loss": -41.19350051879883, "global_step": 248176, "epoch": 2051} {"train_loss": -41.76487350463867, "global_step": 248177, "epoch": 2051} {"train_loss": -41.0782585144043, "global_step": 248178, "epoch": 2051} {"train_loss": -41.38703918457031, "global_step": 248179, "epoch": 2051} {"train_loss": -41.92311096191406, "global_step": 248180, "epoch": 2051} {"train_loss": -42.35606002807617, "global_step": 248181, "epoch": 2051} {"train_loss": -41.89858627319336, "global_step": 248182, "epoch": 2051} {"train_loss": -41.83494186401367, "global_step": 248183, "epoch": 2051} {"train_loss": -42.4381217956543, "global_step": 248184, "epoch": 2051} {"train_loss": -41.40578842163086, "global_step": 248185, "epoch": 2051} {"train_loss": -42.8211784362793, "global_step": 248186, "epoch": 2051} {"train_loss": -42.44081497192383, "global_step": 248187, "epoch": 2051} {"train_loss": -42.754302978515625, "global_step": 248188, "epoch": 2051} {"train_loss": -42.12849044799805, "global_step": 248189, "epoch": 2051} {"train_loss": -42.29208755493164, "global_step": 248190, "epoch": 2051} {"train_loss": -42.535404205322266, "global_step": 248191, "epoch": 2051} {"train_loss": -42.70812225341797, "global_step": 248192, "epoch": 2051} {"train_loss": -42.59755325317383, "global_step": 248193, "epoch": 2051} {"train_loss": -41.62530517578125, "global_step": 248194, "epoch": 2051} {"train_loss": -41.38666534423828, "global_step": 248195, "epoch": 2051} {"train_loss": -40.53215408325195, "global_step": 248196, "epoch": 2051} {"train_loss": -41.328102111816406, "global_step": 248197, "epoch": 2051} {"train_loss": -42.43235397338867, "global_step": 248198, "epoch": 2051} {"train_loss": -42.355072021484375, "global_step": 248199, "epoch": 2051} {"train_loss": -42.59317398071289, "global_step": 248200, "epoch": 2051} {"train_loss": -42.76300811767578, "global_step": 248201, "epoch": 2051} {"train_loss": -42.27682113647461, "global_step": 248202, "epoch": 2051} {"train_loss": -42.337982177734375, "global_step": 248203, "epoch": 2051} {"train_loss": -42.140281677246094, "global_step": 248204, "epoch": 2051} {"train_loss": -41.593536376953125, "global_step": 248205, "epoch": 2051} {"train_loss": -42.91701126098633, "global_step": 248206, "epoch": 2051} {"train_loss": -42.84415817260742, "global_step": 248207, "epoch": 2051} {"train_loss": -42.625694274902344, "global_step": 248208, "epoch": 2051} {"train_loss": -42.64558029174805, "global_step": 248209, "epoch": 2051} {"train_loss": -42.74198913574219, "global_step": 248210, "epoch": 2051} {"train_loss": -43.129737854003906, "global_step": 248211, "epoch": 2051} {"train_loss": -40.658451080322266, "global_step": 248212, "epoch": 2051} {"train_loss": -42.650516510009766, "global_step": 248213, "epoch": 2051} {"train_loss": -42.561492919921875, "global_step": 248214, "epoch": 2051} {"train_loss": -42.5754280090332, "global_step": 248215, "epoch": 2051} {"train_loss": -43.1269416809082, "global_step": 248216, "epoch": 2051} {"train_loss": -42.50469970703125, "global_step": 248217, "epoch": 2051} {"train_loss": -42.240333557128906, "global_step": 248218, "epoch": 2051} {"train_loss": -42.782405853271484, "global_step": 248219, "epoch": 2051} {"train_loss": -42.293155670166016, "global_step": 248220, "epoch": 2051} {"train_loss": -42.532711029052734, "global_step": 248221, "epoch": 2051} {"train_loss": -41.3282470703125, "global_step": 248222, "epoch": 2051} {"train_loss": -42.43208694458008, "global_step": 248223, "epoch": 2051} {"train_loss": -42.560298919677734, "global_step": 248224, "epoch": 2051} {"train_loss": -41.91492462158203, "global_step": 248225, "epoch": 2051} {"train_loss": -40.43410110473633, "global_step": 248226, "epoch": 2051} {"train_loss": -42.532222747802734, "global_step": 248227, "epoch": 2051} {"train_loss": -41.50163650512695, "global_step": 248228, "epoch": 2051} {"train_loss": -42.8287467956543, "global_step": 248229, "epoch": 2051} {"train_loss": -42.47376251220703, "global_step": 248230, "epoch": 2051} {"train_loss": -42.37408447265625, "global_step": 248231, "epoch": 2051} {"train_loss": -40.4804573059082, "global_step": 248232, "epoch": 2051} {"train_loss": -42.119327545166016, "global_step": 248233, "epoch": 2051} {"train_loss": -40.748085021972656, "global_step": 248234, "epoch": 2051} {"train_loss": -42.09421920776367, "global_step": 248235, "epoch": 2051} {"train_loss": -39.53178024291992, "global_step": 248236, "epoch": 2051} {"train_loss": -41.45663070678711, "global_step": 248237, "epoch": 2051} {"train_loss": -41.25672149658203, "global_step": 248238, "epoch": 2051} {"train_loss": -40.99821090698242, "global_step": 248239, "epoch": 2051} {"train_loss": -42.49985885620117, "global_step": 248240, "epoch": 2051} {"train_loss": -41.469661712646484, "global_step": 248241, "epoch": 2051} {"train_loss": -41.31759262084961, "global_step": 248242, "epoch": 2051} {"train_loss": -41.436336517333984, "global_step": 248243, "epoch": 2051} {"train_loss": -41.79583740234375, "global_step": 248244, "epoch": 2051} {"train_loss": -41.4100341796875, "global_step": 248245, "epoch": 2051} {"train_loss": -41.19589614868164, "global_step": 248246, "epoch": 2051} {"train_loss": -43.358062744140625, "global_step": 248247, "epoch": 2051} {"train_loss": -41.706050872802734, "global_step": 248248, "epoch": 2051} {"train_loss": -39.52951431274414, "global_step": 248249, "epoch": 2051} {"train_loss": -34.4726676940918, "global_step": 248250, "epoch": 2051} {"train_loss": -40.47756576538086, "global_step": 248251, "epoch": 2051} {"train_loss": -33.2169189453125, "global_step": 248252, "epoch": 2051} {"train_loss": -30.461505889892578, "global_step": 248253, "epoch": 2051} {"train_loss": -35.6232795715332, "global_step": 248254, "epoch": 2051} {"train_loss": -41.07088088989258, "global_step": 248255, "epoch": 2051} {"train_loss": -32.74009323120117, "global_step": 248256, "epoch": 2051} {"train_loss": -36.32015609741211, "global_step": 248257, "epoch": 2051} {"train_loss": -39.7346305847168, "global_step": 248258, "epoch": 2051} {"train_loss": -36.32952880859375, "global_step": 248259, "epoch": 2051} {"train_loss": -38.643104553222656, "global_step": 248260, "epoch": 2051} {"train_loss": -40.62905502319336, "global_step": 248261, "epoch": 2051} {"train_loss": -39.69719314575195, "global_step": 248262, "epoch": 2051} {"train_loss": -40.00498580932617, "global_step": 248263, "epoch": 2051} {"train_loss": -38.92646026611328, "global_step": 248264, "epoch": 2051} {"train_loss": -41.13132858276367, "global_step": 248265, "epoch": 2051} {"train_loss": -40.5597038269043, "global_step": 248266, "epoch": 2051} {"train_loss": -39.957603454589844, "global_step": 248267, "epoch": 2051} {"train_loss": -41.197383880615234, "global_step": 248268, "epoch": 2051} {"train_loss": -40.592979431152344, "global_step": 248269, "epoch": 2051} {"train_loss": -39.935707092285156, "global_step": 248270, "epoch": 2051} {"train_loss": -41.16603469848633, "global_step": 248271, "epoch": 2051} {"train_loss": -41.12797164916992, "global_step": 248272, "epoch": 2051} {"train_loss": -41.060577392578125, "global_step": 248273, "epoch": 2051} {"train_loss": -40.677066802978516, "global_step": 248274, "epoch": 2051} {"train_loss": -41.547210693359375, "global_step": 248275, "epoch": 2051} {"train_loss": -41.34451675415039, "global_step": 248276, "epoch": 2051} {"train_loss": -41.07169723510742, "global_step": 248277, "epoch": 2051} {"train_loss": -40.71009063720703, "global_step": 248278, "epoch": 2051} {"train_loss": -41.631568908691406, "global_step": 248279, "epoch": 2051} {"train_loss": -41.29024887084961, "global_step": 248280, "epoch": 2051} {"train_loss": -42.07835006713867, "global_step": 248281, "epoch": 2051} {"train_loss": -42.12104415893555, "global_step": 248282, "epoch": 2051} {"train_loss": -41.98259735107422, "global_step": 248283, "epoch": 2051} {"train_loss": -41.13558578491211, "global_step": 248284, "epoch": 2051} {"train_loss": -41.19769287109375, "global_step": 248285, "epoch": 2051} {"train_loss": -41.11605453491211, "global_step": 248286, "epoch": 2051} {"train_loss": -40.81604766845703, "global_step": 248287, "epoch": 2051} {"train_loss": -41.639076232910156, "global_step": 248288, "epoch": 2051} {"train_loss": -41.52827072143555, "global_step": 248289, "epoch": 2051} {"train_loss": -41.94845199584961, "global_step": 248290, "epoch": 2051} {"train_loss": -41.18470089494689, "global_step": 248291, "epoch": 2051, "val_loss": 2576960.75} {"train_loss": -41.844993591308594, "global_step": 248292, "epoch": 2052} {"train_loss": -41.03584671020508, "global_step": 248293, "epoch": 2052} {"train_loss": -42.41994857788086, "global_step": 248294, "epoch": 2052} {"train_loss": -42.46533203125, "global_step": 248295, "epoch": 2052} {"train_loss": -42.25773239135742, "global_step": 248296, "epoch": 2052} {"train_loss": -42.80309295654297, "global_step": 248297, "epoch": 2052} {"train_loss": -40.16998291015625, "global_step": 248298, "epoch": 2052} {"train_loss": -42.46023178100586, "global_step": 248299, "epoch": 2052} {"train_loss": -42.82408905029297, "global_step": 248300, "epoch": 2052} {"train_loss": -42.88076400756836, "global_step": 248301, "epoch": 2052} {"train_loss": -42.934505462646484, "global_step": 248302, "epoch": 2052} {"train_loss": -42.13574981689453, "global_step": 248303, "epoch": 2052} {"train_loss": -43.0937614440918, "global_step": 248304, "epoch": 2052} {"train_loss": -42.922508239746094, "global_step": 248305, "epoch": 2052} {"train_loss": -42.163177490234375, "global_step": 248306, "epoch": 2052} {"train_loss": -42.35174560546875, "global_step": 248307, "epoch": 2052} {"train_loss": -42.94467544555664, "global_step": 248308, "epoch": 2052} {"train_loss": -42.38623809814453, "global_step": 248309, "epoch": 2052} {"train_loss": -42.57880783081055, "global_step": 248310, "epoch": 2052} {"train_loss": -42.909664154052734, "global_step": 248311, "epoch": 2052} {"train_loss": -42.351070404052734, "global_step": 248312, "epoch": 2052} {"train_loss": -40.55631637573242, "global_step": 248313, "epoch": 2052} {"train_loss": -42.24357223510742, "global_step": 248314, "epoch": 2052} {"train_loss": -42.672882080078125, "global_step": 248315, "epoch": 2052} {"train_loss": -42.007286071777344, "global_step": 248316, "epoch": 2052} {"train_loss": -38.92653274536133, "global_step": 248317, "epoch": 2052} {"train_loss": -42.087642669677734, "global_step": 248318, "epoch": 2052} {"train_loss": -42.6749267578125, "global_step": 248319, "epoch": 2052} {"train_loss": -41.5870361328125, "global_step": 248320, "epoch": 2052} {"train_loss": -42.82534408569336, "global_step": 248321, "epoch": 2052} {"train_loss": -42.62405014038086, "global_step": 248322, "epoch": 2052} {"train_loss": -42.49068832397461, "global_step": 248323, "epoch": 2052} {"train_loss": -43.30060958862305, "global_step": 248324, "epoch": 2052} {"train_loss": -42.75259017944336, "global_step": 248325, "epoch": 2052} {"train_loss": -40.84916687011719, "global_step": 248326, "epoch": 2052} {"train_loss": -42.69973373413086, "global_step": 248327, "epoch": 2052} {"train_loss": -42.588172912597656, "global_step": 248328, "epoch": 2052} {"train_loss": -42.85343551635742, "global_step": 248329, "epoch": 2052} {"train_loss": -36.729400634765625, "global_step": 248330, "epoch": 2052} {"train_loss": -40.19154739379883, "global_step": 248331, "epoch": 2052} {"train_loss": -42.33378601074219, "global_step": 248332, "epoch": 2052} {"train_loss": -41.508907318115234, "global_step": 248333, "epoch": 2052} {"train_loss": -42.356971740722656, "global_step": 248334, "epoch": 2052} {"train_loss": -40.58407211303711, "global_step": 248335, "epoch": 2052} {"train_loss": -40.922725677490234, "global_step": 248336, "epoch": 2052} {"train_loss": -41.31051254272461, "global_step": 248337, "epoch": 2052} {"train_loss": -40.78268051147461, "global_step": 248338, "epoch": 2052} {"train_loss": -39.78057861328125, "global_step": 248339, "epoch": 2052} {"train_loss": -39.8581428527832, "global_step": 248340, "epoch": 2052} {"train_loss": -41.789100646972656, "global_step": 248341, "epoch": 2052} {"train_loss": -41.200653076171875, "global_step": 248342, "epoch": 2052} {"train_loss": -41.85444641113281, "global_step": 248343, "epoch": 2052} {"train_loss": -41.944271087646484, "global_step": 248344, "epoch": 2052} {"train_loss": -42.060333251953125, "global_step": 248345, "epoch": 2052} {"train_loss": -42.863136291503906, "global_step": 248346, "epoch": 2052} {"train_loss": -42.354976654052734, "global_step": 248347, "epoch": 2052} {"train_loss": -40.60430908203125, "global_step": 248348, "epoch": 2052} {"train_loss": -40.70844650268555, "global_step": 248349, "epoch": 2052} {"train_loss": -42.00265121459961, "global_step": 248350, "epoch": 2052} {"train_loss": -40.26418685913086, "global_step": 248351, "epoch": 2052} {"train_loss": -41.57062530517578, "global_step": 248352, "epoch": 2052} {"train_loss": -36.59150314331055, "global_step": 248353, "epoch": 2052} {"train_loss": -39.614192962646484, "global_step": 248354, "epoch": 2052} {"train_loss": -40.6629524230957, "global_step": 248355, "epoch": 2052} {"train_loss": -42.580413818359375, "global_step": 248356, "epoch": 2052} {"train_loss": -41.016510009765625, "global_step": 248357, "epoch": 2052} {"train_loss": -41.86247634887695, "global_step": 248358, "epoch": 2052} {"train_loss": -41.831695556640625, "global_step": 248359, "epoch": 2052} {"train_loss": -41.91993713378906, "global_step": 248360, "epoch": 2052} {"train_loss": -39.65312576293945, "global_step": 248361, "epoch": 2052} {"train_loss": -41.352027893066406, "global_step": 248362, "epoch": 2052} {"train_loss": -40.4384765625, "global_step": 248363, "epoch": 2052} {"train_loss": -40.50678253173828, "global_step": 248364, "epoch": 2052} {"train_loss": -41.38908767700195, "global_step": 248365, "epoch": 2052} {"train_loss": -37.32466506958008, "global_step": 248366, "epoch": 2052} {"train_loss": -41.70680618286133, "global_step": 248367, "epoch": 2052} {"train_loss": -41.14892578125, "global_step": 248368, "epoch": 2052} {"train_loss": -42.550758361816406, "global_step": 248369, "epoch": 2052} {"train_loss": -41.4499626159668, "global_step": 248370, "epoch": 2052} {"train_loss": -42.58443069458008, "global_step": 248371, "epoch": 2052} {"train_loss": -41.86284255981445, "global_step": 248372, "epoch": 2052} {"train_loss": -41.67623519897461, "global_step": 248373, "epoch": 2052} {"train_loss": -41.60006332397461, "global_step": 248374, "epoch": 2052} {"train_loss": -41.72610092163086, "global_step": 248375, "epoch": 2052} {"train_loss": -39.62057113647461, "global_step": 248376, "epoch": 2052} {"train_loss": -40.03666687011719, "global_step": 248377, "epoch": 2052} {"train_loss": -41.212284088134766, "global_step": 248378, "epoch": 2052} {"train_loss": -42.66392135620117, "global_step": 248379, "epoch": 2052} {"train_loss": -39.987361907958984, "global_step": 248380, "epoch": 2052} {"train_loss": -40.51174545288086, "global_step": 248381, "epoch": 2052} {"train_loss": -37.586360931396484, "global_step": 248382, "epoch": 2052} {"train_loss": -39.202754974365234, "global_step": 248383, "epoch": 2052} {"train_loss": -39.020362854003906, "global_step": 248384, "epoch": 2052} {"train_loss": -41.72876739501953, "global_step": 248385, "epoch": 2052} {"train_loss": -41.916358947753906, "global_step": 248386, "epoch": 2052} {"train_loss": -36.792842864990234, "global_step": 248387, "epoch": 2052} {"train_loss": -36.375709533691406, "global_step": 248388, "epoch": 2052} {"train_loss": -36.647247314453125, "global_step": 248389, "epoch": 2052} {"train_loss": -40.736297607421875, "global_step": 248390, "epoch": 2052} {"train_loss": -40.54536056518555, "global_step": 248391, "epoch": 2052} {"train_loss": -41.333126068115234, "global_step": 248392, "epoch": 2052} {"train_loss": -41.02216720581055, "global_step": 248393, "epoch": 2052} {"train_loss": -41.31013107299805, "global_step": 248394, "epoch": 2052} {"train_loss": -41.3598747253418, "global_step": 248395, "epoch": 2052} {"train_loss": -41.53862380981445, "global_step": 248396, "epoch": 2052} {"train_loss": -37.63340377807617, "global_step": 248397, "epoch": 2052} {"train_loss": -36.28631591796875, "global_step": 248398, "epoch": 2052} {"train_loss": -38.962833404541016, "global_step": 248399, "epoch": 2052} {"train_loss": -36.25110626220703, "global_step": 248400, "epoch": 2052} {"train_loss": -40.766475677490234, "global_step": 248401, "epoch": 2052} {"train_loss": -40.70394515991211, "global_step": 248402, "epoch": 2052} {"train_loss": -39.37946701049805, "global_step": 248403, "epoch": 2052} {"train_loss": -39.53284454345703, "global_step": 248404, "epoch": 2052} {"train_loss": -40.81563949584961, "global_step": 248405, "epoch": 2052} {"train_loss": -41.78053665161133, "global_step": 248406, "epoch": 2052} {"train_loss": -39.356719970703125, "global_step": 248407, "epoch": 2052} {"train_loss": -36.088722229003906, "global_step": 248408, "epoch": 2052} {"train_loss": -37.23905563354492, "global_step": 248409, "epoch": 2052} {"train_loss": -39.361019134521484, "global_step": 248410, "epoch": 2052} {"train_loss": -40.48051834106445, "global_step": 248411, "epoch": 2052} {"train_loss": -40.99386215209961, "global_step": 248412, "epoch": 2052, "val_loss": 2657635.25} {"train_loss": -40.65449905395508, "global_step": 248413, "epoch": 2053} {"train_loss": -41.48162841796875, "global_step": 248414, "epoch": 2053} {"train_loss": -40.90523910522461, "global_step": 248415, "epoch": 2053} {"train_loss": -39.84664535522461, "global_step": 248416, "epoch": 2053} {"train_loss": -40.54722213745117, "global_step": 248417, "epoch": 2053} {"train_loss": -41.02922439575195, "global_step": 248418, "epoch": 2053} {"train_loss": -40.46841049194336, "global_step": 248419, "epoch": 2053} {"train_loss": -40.830936431884766, "global_step": 248420, "epoch": 2053} {"train_loss": -41.62272262573242, "global_step": 248421, "epoch": 2053} {"train_loss": -40.97323226928711, "global_step": 248422, "epoch": 2053} {"train_loss": -39.470863342285156, "global_step": 248423, "epoch": 2053} {"train_loss": -40.998565673828125, "global_step": 248424, "epoch": 2053} {"train_loss": -39.266807556152344, "global_step": 248425, "epoch": 2053} {"train_loss": -40.474185943603516, "global_step": 248426, "epoch": 2053} {"train_loss": -40.99254608154297, "global_step": 248427, "epoch": 2053} {"train_loss": -40.310340881347656, "global_step": 248428, "epoch": 2053} {"train_loss": -40.667030334472656, "global_step": 248429, "epoch": 2053} {"train_loss": -40.89711380004883, "global_step": 248430, "epoch": 2053} {"train_loss": -40.64748764038086, "global_step": 248431, "epoch": 2053} {"train_loss": -38.92286682128906, "global_step": 248432, "epoch": 2053} {"train_loss": -41.26272201538086, "global_step": 248433, "epoch": 2053} {"train_loss": -40.816810607910156, "global_step": 248434, "epoch": 2053} {"train_loss": -39.894466400146484, "global_step": 248435, "epoch": 2053} {"train_loss": -41.29205322265625, "global_step": 248436, "epoch": 2053} {"train_loss": -41.87432861328125, "global_step": 248437, "epoch": 2053} {"train_loss": -41.76456832885742, "global_step": 248438, "epoch": 2053} {"train_loss": -42.00171661376953, "global_step": 248439, "epoch": 2053} {"train_loss": -39.06032943725586, "global_step": 248440, "epoch": 2053} {"train_loss": -41.80869674682617, "global_step": 248441, "epoch": 2053} {"train_loss": -41.00082015991211, "global_step": 248442, "epoch": 2053} {"train_loss": -40.67407989501953, "global_step": 248443, "epoch": 2053} {"train_loss": -41.9196891784668, "global_step": 248444, "epoch": 2053} {"train_loss": -41.737422943115234, "global_step": 248445, "epoch": 2053} {"train_loss": -42.08558654785156, "global_step": 248446, "epoch": 2053} {"train_loss": -38.82867431640625, "global_step": 248447, "epoch": 2053} {"train_loss": -40.93896484375, "global_step": 248448, "epoch": 2053} {"train_loss": -40.79771041870117, "global_step": 248449, "epoch": 2053} {"train_loss": -38.982486724853516, "global_step": 248450, "epoch": 2053} {"train_loss": -41.9432373046875, "global_step": 248451, "epoch": 2053} {"train_loss": -42.14199447631836, "global_step": 248452, "epoch": 2053} {"train_loss": -41.8149299621582, "global_step": 248453, "epoch": 2053} {"train_loss": -42.25346755981445, "global_step": 248454, "epoch": 2053} {"train_loss": -42.15016555786133, "global_step": 248455, "epoch": 2053} {"train_loss": -42.08937454223633, "global_step": 248456, "epoch": 2053} {"train_loss": -42.30825424194336, "global_step": 248457, "epoch": 2053} {"train_loss": -41.83870315551758, "global_step": 248458, "epoch": 2053} {"train_loss": -40.50556182861328, "global_step": 248459, "epoch": 2053} {"train_loss": -42.58173751831055, "global_step": 248460, "epoch": 2053} {"train_loss": -42.35319137573242, "global_step": 248461, "epoch": 2053} {"train_loss": -42.08745193481445, "global_step": 248462, "epoch": 2053} {"train_loss": -42.06815719604492, "global_step": 248463, "epoch": 2053} {"train_loss": -40.43783187866211, "global_step": 248464, "epoch": 2053} {"train_loss": -42.19633865356445, "global_step": 248465, "epoch": 2053} {"train_loss": -40.95998001098633, "global_step": 248466, "epoch": 2053} {"train_loss": -42.343406677246094, "global_step": 248467, "epoch": 2053} {"train_loss": -42.724037170410156, "global_step": 248468, "epoch": 2053} {"train_loss": -40.1876335144043, "global_step": 248469, "epoch": 2053} {"train_loss": -42.36237716674805, "global_step": 248470, "epoch": 2053} {"train_loss": -41.99435806274414, "global_step": 248471, "epoch": 2053} {"train_loss": -41.69120788574219, "global_step": 248472, "epoch": 2053} {"train_loss": -42.60306930541992, "global_step": 248473, "epoch": 2053} {"train_loss": -42.27944564819336, "global_step": 248474, "epoch": 2053} {"train_loss": -42.43375778198242, "global_step": 248475, "epoch": 2053} {"train_loss": -42.54390335083008, "global_step": 248476, "epoch": 2053} {"train_loss": -42.28693771362305, "global_step": 248477, "epoch": 2053} {"train_loss": -42.016685485839844, "global_step": 248478, "epoch": 2053} {"train_loss": -40.796443939208984, "global_step": 248479, "epoch": 2053} {"train_loss": -42.18115234375, "global_step": 248480, "epoch": 2053} {"train_loss": -43.10565948486328, "global_step": 248481, "epoch": 2053} {"train_loss": -42.69643020629883, "global_step": 248482, "epoch": 2053} {"train_loss": -41.51951217651367, "global_step": 248483, "epoch": 2053} {"train_loss": -40.92389678955078, "global_step": 248484, "epoch": 2053} {"train_loss": -41.9205322265625, "global_step": 248485, "epoch": 2053} {"train_loss": -41.868507385253906, "global_step": 248486, "epoch": 2053} {"train_loss": -40.34797286987305, "global_step": 248487, "epoch": 2053} {"train_loss": -41.494483947753906, "global_step": 248488, "epoch": 2053} {"train_loss": -42.035179138183594, "global_step": 248489, "epoch": 2053} {"train_loss": -42.18363952636719, "global_step": 248490, "epoch": 2053} {"train_loss": -42.1153564453125, "global_step": 248491, "epoch": 2053} {"train_loss": -42.40497589111328, "global_step": 248492, "epoch": 2053} {"train_loss": -42.824337005615234, "global_step": 248493, "epoch": 2053} {"train_loss": -41.342620849609375, "global_step": 248494, "epoch": 2053} {"train_loss": -41.55984115600586, "global_step": 248495, "epoch": 2053} {"train_loss": -38.938751220703125, "global_step": 248496, "epoch": 2053} {"train_loss": -38.45082473754883, "global_step": 248497, "epoch": 2053} {"train_loss": -38.417049407958984, "global_step": 248498, "epoch": 2053} {"train_loss": -40.205623626708984, "global_step": 248499, "epoch": 2053} {"train_loss": -42.49538040161133, "global_step": 248500, "epoch": 2053} {"train_loss": -42.04119873046875, "global_step": 248501, "epoch": 2053} {"train_loss": -41.59027862548828, "global_step": 248502, "epoch": 2053} {"train_loss": -42.37769317626953, "global_step": 248503, "epoch": 2053} {"train_loss": -41.97042465209961, "global_step": 248504, "epoch": 2053} {"train_loss": -41.83393478393555, "global_step": 248505, "epoch": 2053} {"train_loss": -42.17466354370117, "global_step": 248506, "epoch": 2053} {"train_loss": -41.43318557739258, "global_step": 248507, "epoch": 2053} {"train_loss": -40.849815368652344, "global_step": 248508, "epoch": 2053} {"train_loss": -42.450294494628906, "global_step": 248509, "epoch": 2053} {"train_loss": -41.71708297729492, "global_step": 248510, "epoch": 2053} {"train_loss": -39.44608688354492, "global_step": 248511, "epoch": 2053} {"train_loss": -41.162349700927734, "global_step": 248512, "epoch": 2053} {"train_loss": -42.27399444580078, "global_step": 248513, "epoch": 2053} {"train_loss": -39.75188446044922, "global_step": 248514, "epoch": 2053} {"train_loss": -41.073055267333984, "global_step": 248515, "epoch": 2053} {"train_loss": -41.56884765625, "global_step": 248516, "epoch": 2053} {"train_loss": -41.42156219482422, "global_step": 248517, "epoch": 2053} {"train_loss": -41.670284271240234, "global_step": 248518, "epoch": 2053} {"train_loss": -42.09418487548828, "global_step": 248519, "epoch": 2053} {"train_loss": -40.37215805053711, "global_step": 248520, "epoch": 2053} {"train_loss": -42.45058822631836, "global_step": 248521, "epoch": 2053} {"train_loss": -40.6176872253418, "global_step": 248522, "epoch": 2053} {"train_loss": -40.9940185546875, "global_step": 248523, "epoch": 2053} {"train_loss": -42.155948638916016, "global_step": 248524, "epoch": 2053} {"train_loss": -41.1389274597168, "global_step": 248525, "epoch": 2053} {"train_loss": -41.967323303222656, "global_step": 248526, "epoch": 2053} {"train_loss": -40.23954391479492, "global_step": 248527, "epoch": 2053} {"train_loss": -41.36056137084961, "global_step": 248528, "epoch": 2053} {"train_loss": -42.16593551635742, "global_step": 248529, "epoch": 2053} {"train_loss": -41.9267692565918, "global_step": 248530, "epoch": 2053} {"train_loss": -42.53715133666992, "global_step": 248531, "epoch": 2053} {"train_loss": -41.129940032958984, "global_step": 248532, "epoch": 2053} {"train_loss": -41.34743474534721, "global_step": 248533, "epoch": 2053, "val_loss": 2507918.0} {"train_loss": -42.00909423828125, "global_step": 248534, "epoch": 2054} {"train_loss": -42.544715881347656, "global_step": 248535, "epoch": 2054} {"train_loss": -41.95897674560547, "global_step": 248536, "epoch": 2054} {"train_loss": -42.76869201660156, "global_step": 248537, "epoch": 2054} {"train_loss": -41.316707611083984, "global_step": 248538, "epoch": 2054} {"train_loss": -42.61039352416992, "global_step": 248539, "epoch": 2054} {"train_loss": -42.34585952758789, "global_step": 248540, "epoch": 2054} {"train_loss": -42.68077850341797, "global_step": 248541, "epoch": 2054} {"train_loss": -42.5547981262207, "global_step": 248542, "epoch": 2054} {"train_loss": -41.5916862487793, "global_step": 248543, "epoch": 2054} {"train_loss": -42.33893966674805, "global_step": 248544, "epoch": 2054} {"train_loss": -42.73976516723633, "global_step": 248545, "epoch": 2054} {"train_loss": -43.20351791381836, "global_step": 248546, "epoch": 2054} {"train_loss": -42.9449577331543, "global_step": 248547, "epoch": 2054} {"train_loss": -42.47506332397461, "global_step": 248548, "epoch": 2054} {"train_loss": -42.481544494628906, "global_step": 248549, "epoch": 2054} {"train_loss": -42.027950286865234, "global_step": 248550, "epoch": 2054} {"train_loss": -42.834835052490234, "global_step": 248551, "epoch": 2054} {"train_loss": -42.95316696166992, "global_step": 248552, "epoch": 2054} {"train_loss": -42.015106201171875, "global_step": 248553, "epoch": 2054} {"train_loss": -41.007381439208984, "global_step": 248554, "epoch": 2054} {"train_loss": -42.50218200683594, "global_step": 248555, "epoch": 2054} {"train_loss": -42.791107177734375, "global_step": 248556, "epoch": 2054} {"train_loss": -42.531375885009766, "global_step": 248557, "epoch": 2054} {"train_loss": -42.6019401550293, "global_step": 248558, "epoch": 2054} {"train_loss": -43.09086227416992, "global_step": 248559, "epoch": 2054} {"train_loss": -42.21247482299805, "global_step": 248560, "epoch": 2054} {"train_loss": -43.094058990478516, "global_step": 248561, "epoch": 2054} {"train_loss": -42.300418853759766, "global_step": 248562, "epoch": 2054} {"train_loss": -41.99909591674805, "global_step": 248563, "epoch": 2054} {"train_loss": -42.55526351928711, "global_step": 248564, "epoch": 2054} {"train_loss": -40.32366180419922, "global_step": 248565, "epoch": 2054} {"train_loss": -42.1474609375, "global_step": 248566, "epoch": 2054} {"train_loss": -42.4272346496582, "global_step": 248567, "epoch": 2054} {"train_loss": -41.05498504638672, "global_step": 248568, "epoch": 2054} {"train_loss": -41.449623107910156, "global_step": 248569, "epoch": 2054} {"train_loss": -42.45365524291992, "global_step": 248570, "epoch": 2054} {"train_loss": -42.9465446472168, "global_step": 248571, "epoch": 2054} {"train_loss": -42.14189529418945, "global_step": 248572, "epoch": 2054} {"train_loss": -39.52766036987305, "global_step": 248573, "epoch": 2054} {"train_loss": -40.1688232421875, "global_step": 248574, "epoch": 2054} {"train_loss": -41.642364501953125, "global_step": 248575, "epoch": 2054} {"train_loss": -37.954689025878906, "global_step": 248576, "epoch": 2054} {"train_loss": -36.189453125, "global_step": 248577, "epoch": 2054} {"train_loss": -41.12931442260742, "global_step": 248578, "epoch": 2054} {"train_loss": -42.49313735961914, "global_step": 248579, "epoch": 2054} {"train_loss": -37.37302780151367, "global_step": 248580, "epoch": 2054} {"train_loss": -36.855411529541016, "global_step": 248581, "epoch": 2054} {"train_loss": -40.9764518737793, "global_step": 248582, "epoch": 2054} {"train_loss": -40.02454376220703, "global_step": 248583, "epoch": 2054} {"train_loss": -37.847354888916016, "global_step": 248584, "epoch": 2054} {"train_loss": -40.192718505859375, "global_step": 248585, "epoch": 2054} {"train_loss": -38.753318786621094, "global_step": 248586, "epoch": 2054} {"train_loss": -40.6142692565918, "global_step": 248587, "epoch": 2054} {"train_loss": -40.73384475708008, "global_step": 248588, "epoch": 2054} {"train_loss": -36.85791015625, "global_step": 248589, "epoch": 2054} {"train_loss": -39.10884475708008, "global_step": 248590, "epoch": 2054} {"train_loss": -40.09968566894531, "global_step": 248591, "epoch": 2054} {"train_loss": -38.22908020019531, "global_step": 248592, "epoch": 2054} {"train_loss": -40.212215423583984, "global_step": 248593, "epoch": 2054} {"train_loss": -38.08524703979492, "global_step": 248594, "epoch": 2054} {"train_loss": -41.290069580078125, "global_step": 248595, "epoch": 2054} {"train_loss": -40.241432189941406, "global_step": 248596, "epoch": 2054} {"train_loss": -40.70408630371094, "global_step": 248597, "epoch": 2054} {"train_loss": -38.805397033691406, "global_step": 248598, "epoch": 2054} {"train_loss": -39.7065544128418, "global_step": 248599, "epoch": 2054} {"train_loss": -41.91374969482422, "global_step": 248600, "epoch": 2054} {"train_loss": -38.99144744873047, "global_step": 248601, "epoch": 2054} {"train_loss": -41.87749099731445, "global_step": 248602, "epoch": 2054} {"train_loss": -40.49854278564453, "global_step": 248603, "epoch": 2054} {"train_loss": -28.62066650390625, "global_step": 248604, "epoch": 2054} {"train_loss": -41.30735397338867, "global_step": 248605, "epoch": 2054} {"train_loss": -40.171722412109375, "global_step": 248606, "epoch": 2054} {"train_loss": -40.31499099731445, "global_step": 248607, "epoch": 2054} {"train_loss": -38.35990524291992, "global_step": 248608, "epoch": 2054} {"train_loss": -39.25404739379883, "global_step": 248609, "epoch": 2054} {"train_loss": -39.757442474365234, "global_step": 248610, "epoch": 2054} {"train_loss": -38.619171142578125, "global_step": 248611, "epoch": 2054} {"train_loss": -41.128658294677734, "global_step": 248612, "epoch": 2054} {"train_loss": -38.795108795166016, "global_step": 248613, "epoch": 2054} {"train_loss": -40.187564849853516, "global_step": 248614, "epoch": 2054} {"train_loss": -40.77621841430664, "global_step": 248615, "epoch": 2054} {"train_loss": -37.116554260253906, "global_step": 248616, "epoch": 2054} {"train_loss": -41.16917037963867, "global_step": 248617, "epoch": 2054} {"train_loss": -38.78392028808594, "global_step": 248618, "epoch": 2054} {"train_loss": -38.09623336791992, "global_step": 248619, "epoch": 2054} {"train_loss": -40.17351150512695, "global_step": 248620, "epoch": 2054} {"train_loss": -41.091732025146484, "global_step": 248621, "epoch": 2054} {"train_loss": -38.548439025878906, "global_step": 248622, "epoch": 2054} {"train_loss": -40.66266632080078, "global_step": 248623, "epoch": 2054} {"train_loss": -40.45712661743164, "global_step": 248624, "epoch": 2054} {"train_loss": -40.45549011230469, "global_step": 248625, "epoch": 2054} {"train_loss": -35.55160140991211, "global_step": 248626, "epoch": 2054} {"train_loss": -36.49546432495117, "global_step": 248627, "epoch": 2054} {"train_loss": -39.539913177490234, "global_step": 248628, "epoch": 2054} {"train_loss": -36.747230529785156, "global_step": 248629, "epoch": 2054} {"train_loss": -38.6595344543457, "global_step": 248630, "epoch": 2054} {"train_loss": -37.45173263549805, "global_step": 248631, "epoch": 2054} {"train_loss": -38.03731918334961, "global_step": 248632, "epoch": 2054} {"train_loss": -36.022613525390625, "global_step": 248633, "epoch": 2054} {"train_loss": -32.66375732421875, "global_step": 248634, "epoch": 2054} {"train_loss": -39.897281646728516, "global_step": 248635, "epoch": 2054} {"train_loss": -39.74200439453125, "global_step": 248636, "epoch": 2054} {"train_loss": -39.01896667480469, "global_step": 248637, "epoch": 2054} {"train_loss": -40.19304656982422, "global_step": 248638, "epoch": 2054} {"train_loss": -40.71247482299805, "global_step": 248639, "epoch": 2054} {"train_loss": -37.79785919189453, "global_step": 248640, "epoch": 2054} {"train_loss": -38.95772171020508, "global_step": 248641, "epoch": 2054} {"train_loss": -39.75081253051758, "global_step": 248642, "epoch": 2054} {"train_loss": -40.981727600097656, "global_step": 248643, "epoch": 2054} {"train_loss": -39.75212478637695, "global_step": 248644, "epoch": 2054} {"train_loss": -38.40664291381836, "global_step": 248645, "epoch": 2054} {"train_loss": -38.73167037963867, "global_step": 248646, "epoch": 2054} {"train_loss": -40.00703048706055, "global_step": 248647, "epoch": 2054} {"train_loss": -39.54890060424805, "global_step": 248648, "epoch": 2054} {"train_loss": -39.373416900634766, "global_step": 248649, "epoch": 2054} {"train_loss": -39.11865997314453, "global_step": 248650, "epoch": 2054} {"train_loss": -38.6804084777832, "global_step": 248651, "epoch": 2054} {"train_loss": -40.67340087890625, "global_step": 248652, "epoch": 2054} {"train_loss": -40.77109909057617, "global_step": 248653, "epoch": 2054} {"train_loss": -40.2219082540717, "global_step": 248654, "epoch": 2054, "val_loss": 2568846.25} {"train_loss": -40.54526138305664, "global_step": 248655, "epoch": 2055} {"train_loss": -39.28298568725586, "global_step": 248656, "epoch": 2055} {"train_loss": -40.66022872924805, "global_step": 248657, "epoch": 2055} {"train_loss": -41.3210563659668, "global_step": 248658, "epoch": 2055} {"train_loss": -41.303497314453125, "global_step": 248659, "epoch": 2055} {"train_loss": -41.029380798339844, "global_step": 248660, "epoch": 2055} {"train_loss": -40.01538848876953, "global_step": 248661, "epoch": 2055} {"train_loss": -38.64076614379883, "global_step": 248662, "epoch": 2055} {"train_loss": -40.93553161621094, "global_step": 248663, "epoch": 2055} {"train_loss": -37.3342399597168, "global_step": 248664, "epoch": 2055} {"train_loss": -41.133060455322266, "global_step": 248665, "epoch": 2055} {"train_loss": -41.78057861328125, "global_step": 248666, "epoch": 2055} {"train_loss": -40.81864929199219, "global_step": 248667, "epoch": 2055} {"train_loss": -38.72148132324219, "global_step": 248668, "epoch": 2055} {"train_loss": -40.22755432128906, "global_step": 248669, "epoch": 2055} {"train_loss": -40.24678039550781, "global_step": 248670, "epoch": 2055} {"train_loss": -41.01162338256836, "global_step": 248671, "epoch": 2055} {"train_loss": -38.578651428222656, "global_step": 248672, "epoch": 2055} {"train_loss": -40.68217086791992, "global_step": 248673, "epoch": 2055} {"train_loss": -40.79943084716797, "global_step": 248674, "epoch": 2055} {"train_loss": -40.90892028808594, "global_step": 248675, "epoch": 2055} {"train_loss": -40.5479736328125, "global_step": 248676, "epoch": 2055} {"train_loss": -39.09348678588867, "global_step": 248677, "epoch": 2055} {"train_loss": -39.084625244140625, "global_step": 248678, "epoch": 2055} {"train_loss": -41.79291534423828, "global_step": 248679, "epoch": 2055} {"train_loss": -41.25972366333008, "global_step": 248680, "epoch": 2055} {"train_loss": -40.898345947265625, "global_step": 248681, "epoch": 2055} {"train_loss": -41.059017181396484, "global_step": 248682, "epoch": 2055} {"train_loss": -39.592708587646484, "global_step": 248683, "epoch": 2055} {"train_loss": -41.37934112548828, "global_step": 248684, "epoch": 2055} {"train_loss": -41.26902389526367, "global_step": 248685, "epoch": 2055} {"train_loss": -41.20840835571289, "global_step": 248686, "epoch": 2055} {"train_loss": -42.23676300048828, "global_step": 248687, "epoch": 2055} {"train_loss": -41.05069351196289, "global_step": 248688, "epoch": 2055} {"train_loss": -41.60908889770508, "global_step": 248689, "epoch": 2055} {"train_loss": -41.67336654663086, "global_step": 248690, "epoch": 2055} {"train_loss": -41.63584518432617, "global_step": 248691, "epoch": 2055} {"train_loss": -41.699485778808594, "global_step": 248692, "epoch": 2055} {"train_loss": -41.25848388671875, "global_step": 248693, "epoch": 2055} {"train_loss": -41.11454391479492, "global_step": 248694, "epoch": 2055} {"train_loss": -39.6912841796875, "global_step": 248695, "epoch": 2055} {"train_loss": -41.525386810302734, "global_step": 248696, "epoch": 2055} {"train_loss": -42.002872467041016, "global_step": 248697, "epoch": 2055} {"train_loss": -41.73328399658203, "global_step": 248698, "epoch": 2055} {"train_loss": -41.817665100097656, "global_step": 248699, "epoch": 2055} {"train_loss": -41.39918899536133, "global_step": 248700, "epoch": 2055} {"train_loss": -42.259769439697266, "global_step": 248701, "epoch": 2055} {"train_loss": -42.25514602661133, "global_step": 248702, "epoch": 2055} {"train_loss": -41.91021728515625, "global_step": 248703, "epoch": 2055} {"train_loss": -40.99324417114258, "global_step": 248704, "epoch": 2055} {"train_loss": -41.535736083984375, "global_step": 248705, "epoch": 2055} {"train_loss": -42.426448822021484, "global_step": 248706, "epoch": 2055} {"train_loss": -41.3865852355957, "global_step": 248707, "epoch": 2055} {"train_loss": -41.0500373840332, "global_step": 248708, "epoch": 2055} {"train_loss": -41.788482666015625, "global_step": 248709, "epoch": 2055} {"train_loss": -41.62446975708008, "global_step": 248710, "epoch": 2055} {"train_loss": -42.33211898803711, "global_step": 248711, "epoch": 2055} {"train_loss": -41.39779281616211, "global_step": 248712, "epoch": 2055} {"train_loss": -42.09035873413086, "global_step": 248713, "epoch": 2055} {"train_loss": -42.28390884399414, "global_step": 248714, "epoch": 2055} {"train_loss": -34.49293518066406, "global_step": 248715, "epoch": 2055} {"train_loss": -42.147579193115234, "global_step": 248716, "epoch": 2055} {"train_loss": -39.8853645324707, "global_step": 248717, "epoch": 2055} {"train_loss": -41.717864990234375, "global_step": 248718, "epoch": 2055} {"train_loss": -42.01511764526367, "global_step": 248719, "epoch": 2055} {"train_loss": -41.54300308227539, "global_step": 248720, "epoch": 2055} {"train_loss": -41.47323226928711, "global_step": 248721, "epoch": 2055} {"train_loss": -41.91178512573242, "global_step": 248722, "epoch": 2055} {"train_loss": -41.23563766479492, "global_step": 248723, "epoch": 2055} {"train_loss": -40.60149002075195, "global_step": 248724, "epoch": 2055} {"train_loss": -42.1876335144043, "global_step": 248725, "epoch": 2055} {"train_loss": -41.95568084716797, "global_step": 248726, "epoch": 2055} {"train_loss": -42.0036506652832, "global_step": 248727, "epoch": 2055} {"train_loss": -41.52709197998047, "global_step": 248728, "epoch": 2055} {"train_loss": -40.503414154052734, "global_step": 248729, "epoch": 2055} {"train_loss": -41.779842376708984, "global_step": 248730, "epoch": 2055} {"train_loss": -42.26223373413086, "global_step": 248731, "epoch": 2055} {"train_loss": -40.99262237548828, "global_step": 248732, "epoch": 2055} {"train_loss": -41.979591369628906, "global_step": 248733, "epoch": 2055} {"train_loss": -42.18897247314453, "global_step": 248734, "epoch": 2055} {"train_loss": -42.42810821533203, "global_step": 248735, "epoch": 2055} {"train_loss": -42.15719223022461, "global_step": 248736, "epoch": 2055} {"train_loss": -41.94639587402344, "global_step": 248737, "epoch": 2055} {"train_loss": -41.937381744384766, "global_step": 248738, "epoch": 2055} {"train_loss": -41.69770431518555, "global_step": 248739, "epoch": 2055} {"train_loss": -42.268310546875, "global_step": 248740, "epoch": 2055} {"train_loss": -41.63727569580078, "global_step": 248741, "epoch": 2055} {"train_loss": -39.64777755737305, "global_step": 248742, "epoch": 2055} {"train_loss": -41.83330154418945, "global_step": 248743, "epoch": 2055} {"train_loss": -42.56754684448242, "global_step": 248744, "epoch": 2055} {"train_loss": -37.97260665893555, "global_step": 248745, "epoch": 2055} {"train_loss": -41.98084259033203, "global_step": 248746, "epoch": 2055} {"train_loss": -41.27556228637695, "global_step": 248747, "epoch": 2055} {"train_loss": -41.14006805419922, "global_step": 248748, "epoch": 2055} {"train_loss": -41.542354583740234, "global_step": 248749, "epoch": 2055} {"train_loss": -40.650936126708984, "global_step": 248750, "epoch": 2055} {"train_loss": -41.9140510559082, "global_step": 248751, "epoch": 2055} {"train_loss": -41.02961349487305, "global_step": 248752, "epoch": 2055} {"train_loss": -42.85464096069336, "global_step": 248753, "epoch": 2055} {"train_loss": -40.883087158203125, "global_step": 248754, "epoch": 2055} {"train_loss": -42.37263488769531, "global_step": 248755, "epoch": 2055} {"train_loss": -41.85811996459961, "global_step": 248756, "epoch": 2055} {"train_loss": -41.46918869018555, "global_step": 248757, "epoch": 2055} {"train_loss": -40.1114616394043, "global_step": 248758, "epoch": 2055} {"train_loss": -39.3718376159668, "global_step": 248759, "epoch": 2055} {"train_loss": -41.48652648925781, "global_step": 248760, "epoch": 2055} {"train_loss": -42.34939193725586, "global_step": 248761, "epoch": 2055} {"train_loss": -42.072967529296875, "global_step": 248762, "epoch": 2055} {"train_loss": -41.50101852416992, "global_step": 248763, "epoch": 2055} {"train_loss": -42.25565719604492, "global_step": 248764, "epoch": 2055} {"train_loss": -42.61124801635742, "global_step": 248765, "epoch": 2055} {"train_loss": -41.91888427734375, "global_step": 248766, "epoch": 2055} {"train_loss": -42.06695556640625, "global_step": 248767, "epoch": 2055} {"train_loss": -42.727317810058594, "global_step": 248768, "epoch": 2055} {"train_loss": -41.91355514526367, "global_step": 248769, "epoch": 2055} {"train_loss": -42.0335578918457, "global_step": 248770, "epoch": 2055} {"train_loss": -41.81032943725586, "global_step": 248771, "epoch": 2055} {"train_loss": -41.98884201049805, "global_step": 248772, "epoch": 2055} {"train_loss": -40.8754997253418, "global_step": 248773, "epoch": 2055} {"train_loss": -41.65833282470703, "global_step": 248774, "epoch": 2055} {"train_loss": -41.233389168731435, "global_step": 248775, "epoch": 2055, "val_loss": 2591753.75} {"train_loss": -41.68907928466797, "global_step": 248776, "epoch": 2056} {"train_loss": -41.86003875732422, "global_step": 248777, "epoch": 2056} {"train_loss": -41.38779830932617, "global_step": 248778, "epoch": 2056} {"train_loss": -42.18726348876953, "global_step": 248779, "epoch": 2056} {"train_loss": -41.93947982788086, "global_step": 248780, "epoch": 2056} {"train_loss": -41.664833068847656, "global_step": 248781, "epoch": 2056} {"train_loss": -41.71379470825195, "global_step": 248782, "epoch": 2056} {"train_loss": -41.95943832397461, "global_step": 248783, "epoch": 2056} {"train_loss": -41.59302520751953, "global_step": 248784, "epoch": 2056} {"train_loss": -42.125640869140625, "global_step": 248785, "epoch": 2056} {"train_loss": -42.3813591003418, "global_step": 248786, "epoch": 2056} {"train_loss": -42.098724365234375, "global_step": 248787, "epoch": 2056} {"train_loss": -41.91953659057617, "global_step": 248788, "epoch": 2056} {"train_loss": -41.728755950927734, "global_step": 248789, "epoch": 2056} {"train_loss": -41.594364166259766, "global_step": 248790, "epoch": 2056} {"train_loss": -40.713645935058594, "global_step": 248791, "epoch": 2056} {"train_loss": -42.50474548339844, "global_step": 248792, "epoch": 2056} {"train_loss": -40.16203689575195, "global_step": 248793, "epoch": 2056} {"train_loss": -40.56785202026367, "global_step": 248794, "epoch": 2056} {"train_loss": -40.577720642089844, "global_step": 248795, "epoch": 2056} {"train_loss": -42.04118347167969, "global_step": 248796, "epoch": 2056} {"train_loss": -40.59737777709961, "global_step": 248797, "epoch": 2056} {"train_loss": -38.30017852783203, "global_step": 248798, "epoch": 2056} {"train_loss": -38.973960876464844, "global_step": 248799, "epoch": 2056} {"train_loss": -36.0965576171875, "global_step": 248800, "epoch": 2056} {"train_loss": -38.802032470703125, "global_step": 248801, "epoch": 2056} {"train_loss": -40.07990264892578, "global_step": 248802, "epoch": 2056} {"train_loss": -37.62604522705078, "global_step": 248803, "epoch": 2056} {"train_loss": -33.08176803588867, "global_step": 248804, "epoch": 2056} {"train_loss": -33.4577751159668, "global_step": 248805, "epoch": 2056} {"train_loss": -40.31714630126953, "global_step": 248806, "epoch": 2056} {"train_loss": -40.117103576660156, "global_step": 248807, "epoch": 2056} {"train_loss": -38.647377014160156, "global_step": 248808, "epoch": 2056} {"train_loss": -41.107666015625, "global_step": 248809, "epoch": 2056} {"train_loss": -40.77922439575195, "global_step": 248810, "epoch": 2056} {"train_loss": -40.93561935424805, "global_step": 248811, "epoch": 2056} {"train_loss": -40.33695602416992, "global_step": 248812, "epoch": 2056} {"train_loss": -41.09794998168945, "global_step": 248813, "epoch": 2056} {"train_loss": -40.15161895751953, "global_step": 248814, "epoch": 2056} {"train_loss": -40.9127197265625, "global_step": 248815, "epoch": 2056} {"train_loss": -40.70680618286133, "global_step": 248816, "epoch": 2056} {"train_loss": -41.44884490966797, "global_step": 248817, "epoch": 2056} {"train_loss": -41.66200637817383, "global_step": 248818, "epoch": 2056} {"train_loss": -40.57353973388672, "global_step": 248819, "epoch": 2056} {"train_loss": -42.071041107177734, "global_step": 248820, "epoch": 2056} {"train_loss": -41.43296432495117, "global_step": 248821, "epoch": 2056} {"train_loss": -41.49557113647461, "global_step": 248822, "epoch": 2056} {"train_loss": -40.48092269897461, "global_step": 248823, "epoch": 2056} {"train_loss": -39.59749984741211, "global_step": 248824, "epoch": 2056} {"train_loss": -41.451904296875, "global_step": 248825, "epoch": 2056} {"train_loss": -41.511653900146484, "global_step": 248826, "epoch": 2056} {"train_loss": -41.598873138427734, "global_step": 248827, "epoch": 2056} {"train_loss": -40.60353469848633, "global_step": 248828, "epoch": 2056} {"train_loss": -41.370399475097656, "global_step": 248829, "epoch": 2056} {"train_loss": -41.153255462646484, "global_step": 248830, "epoch": 2056} {"train_loss": -42.505882263183594, "global_step": 248831, "epoch": 2056} {"train_loss": -41.68095397949219, "global_step": 248832, "epoch": 2056} {"train_loss": -42.23409652709961, "global_step": 248833, "epoch": 2056} {"train_loss": -42.31315231323242, "global_step": 248834, "epoch": 2056} {"train_loss": -42.3904914855957, "global_step": 248835, "epoch": 2056} {"train_loss": -42.615596771240234, "global_step": 248836, "epoch": 2056} {"train_loss": -42.243408203125, "global_step": 248837, "epoch": 2056} {"train_loss": -42.20961380004883, "global_step": 248838, "epoch": 2056} {"train_loss": -42.168941497802734, "global_step": 248839, "epoch": 2056} {"train_loss": -41.72607421875, "global_step": 248840, "epoch": 2056} {"train_loss": -42.06173324584961, "global_step": 248841, "epoch": 2056} {"train_loss": -42.56608200073242, "global_step": 248842, "epoch": 2056} {"train_loss": -42.419708251953125, "global_step": 248843, "epoch": 2056} {"train_loss": -42.3734130859375, "global_step": 248844, "epoch": 2056} {"train_loss": -41.66870880126953, "global_step": 248845, "epoch": 2056} {"train_loss": -40.74298095703125, "global_step": 248846, "epoch": 2056} {"train_loss": -42.46611404418945, "global_step": 248847, "epoch": 2056} {"train_loss": -42.39504623413086, "global_step": 248848, "epoch": 2056} {"train_loss": -40.21297073364258, "global_step": 248849, "epoch": 2056} {"train_loss": -42.18123245239258, "global_step": 248850, "epoch": 2056} {"train_loss": -42.644866943359375, "global_step": 248851, "epoch": 2056} {"train_loss": -42.76004409790039, "global_step": 248852, "epoch": 2056} {"train_loss": -42.76248550415039, "global_step": 248853, "epoch": 2056} {"train_loss": -42.173370361328125, "global_step": 248854, "epoch": 2056} {"train_loss": -42.403438568115234, "global_step": 248855, "epoch": 2056} {"train_loss": -42.35866928100586, "global_step": 248856, "epoch": 2056} {"train_loss": -41.706939697265625, "global_step": 248857, "epoch": 2056} {"train_loss": -41.422725677490234, "global_step": 248858, "epoch": 2056} {"train_loss": -41.39148712158203, "global_step": 248859, "epoch": 2056} {"train_loss": -40.69074249267578, "global_step": 248860, "epoch": 2056} {"train_loss": -42.83510971069336, "global_step": 248861, "epoch": 2056} {"train_loss": -41.97652053833008, "global_step": 248862, "epoch": 2056} {"train_loss": -42.460235595703125, "global_step": 248863, "epoch": 2056} {"train_loss": -41.36552429199219, "global_step": 248864, "epoch": 2056} {"train_loss": -42.268611907958984, "global_step": 248865, "epoch": 2056} {"train_loss": -41.225303649902344, "global_step": 248866, "epoch": 2056} {"train_loss": -42.645408630371094, "global_step": 248867, "epoch": 2056} {"train_loss": -41.431922912597656, "global_step": 248868, "epoch": 2056} {"train_loss": -42.93535232543945, "global_step": 248869, "epoch": 2056} {"train_loss": -42.383384704589844, "global_step": 248870, "epoch": 2056} {"train_loss": -42.91518020629883, "global_step": 248871, "epoch": 2056} {"train_loss": -42.734962463378906, "global_step": 248872, "epoch": 2056} {"train_loss": -42.463558197021484, "global_step": 248873, "epoch": 2056} {"train_loss": -42.5737419128418, "global_step": 248874, "epoch": 2056} {"train_loss": -42.136932373046875, "global_step": 248875, "epoch": 2056} {"train_loss": -42.29246139526367, "global_step": 248876, "epoch": 2056} {"train_loss": -41.911128997802734, "global_step": 248877, "epoch": 2056} {"train_loss": -42.68798065185547, "global_step": 248878, "epoch": 2056} {"train_loss": -41.2542610168457, "global_step": 248879, "epoch": 2056} {"train_loss": -42.01292037963867, "global_step": 248880, "epoch": 2056} {"train_loss": -41.486026763916016, "global_step": 248881, "epoch": 2056} {"train_loss": -42.54641342163086, "global_step": 248882, "epoch": 2056} {"train_loss": -41.77534866333008, "global_step": 248883, "epoch": 2056} {"train_loss": -42.56254959106445, "global_step": 248884, "epoch": 2056} {"train_loss": -42.358787536621094, "global_step": 248885, "epoch": 2056} {"train_loss": -41.515743255615234, "global_step": 248886, "epoch": 2056} {"train_loss": -42.730377197265625, "global_step": 248887, "epoch": 2056} {"train_loss": -42.4434814453125, "global_step": 248888, "epoch": 2056} {"train_loss": -42.26116943359375, "global_step": 248889, "epoch": 2056} {"train_loss": -42.96695327758789, "global_step": 248890, "epoch": 2056} {"train_loss": -42.270545959472656, "global_step": 248891, "epoch": 2056} {"train_loss": -41.59148025512695, "global_step": 248892, "epoch": 2056} {"train_loss": -41.98324203491211, "global_step": 248893, "epoch": 2056} {"train_loss": -42.407283782958984, "global_step": 248894, "epoch": 2056} {"train_loss": -42.697383880615234, "global_step": 248895, "epoch": 2056} {"train_loss": -41.38833097978072, "global_step": 248896, "epoch": 2056, "val_loss": 2537188.0} {"train_loss": -41.80642318725586, "global_step": 248897, "epoch": 2057} {"train_loss": -42.17517852783203, "global_step": 248898, "epoch": 2057} {"train_loss": -42.10995101928711, "global_step": 248899, "epoch": 2057} {"train_loss": -42.35109329223633, "global_step": 248900, "epoch": 2057} {"train_loss": -39.95806121826172, "global_step": 248901, "epoch": 2057} {"train_loss": -41.73783493041992, "global_step": 248902, "epoch": 2057} {"train_loss": -41.96909713745117, "global_step": 248903, "epoch": 2057} {"train_loss": -41.07392120361328, "global_step": 248904, "epoch": 2057} {"train_loss": -40.91193389892578, "global_step": 248905, "epoch": 2057} {"train_loss": -42.101951599121094, "global_step": 248906, "epoch": 2057} {"train_loss": -41.1178092956543, "global_step": 248907, "epoch": 2057} {"train_loss": -42.377864837646484, "global_step": 248908, "epoch": 2057} {"train_loss": -42.97028732299805, "global_step": 248909, "epoch": 2057} {"train_loss": -42.65705108642578, "global_step": 248910, "epoch": 2057} {"train_loss": -42.397186279296875, "global_step": 248911, "epoch": 2057} {"train_loss": -41.7575569152832, "global_step": 248912, "epoch": 2057} {"train_loss": -42.19684982299805, "global_step": 248913, "epoch": 2057} {"train_loss": -42.19108963012695, "global_step": 248914, "epoch": 2057} {"train_loss": -42.502925872802734, "global_step": 248915, "epoch": 2057} {"train_loss": -42.521175384521484, "global_step": 248916, "epoch": 2057} {"train_loss": -42.42095947265625, "global_step": 248917, "epoch": 2057} {"train_loss": -42.18695068359375, "global_step": 248918, "epoch": 2057} {"train_loss": -42.61574172973633, "global_step": 248919, "epoch": 2057} {"train_loss": -42.89908981323242, "global_step": 248920, "epoch": 2057} {"train_loss": -41.63909912109375, "global_step": 248921, "epoch": 2057} {"train_loss": -42.17353057861328, "global_step": 248922, "epoch": 2057} {"train_loss": -41.227691650390625, "global_step": 248923, "epoch": 2057} {"train_loss": -41.620452880859375, "global_step": 248924, "epoch": 2057} {"train_loss": -42.1411247253418, "global_step": 248925, "epoch": 2057} {"train_loss": -41.7614860534668, "global_step": 248926, "epoch": 2057} {"train_loss": -34.09026336669922, "global_step": 248927, "epoch": 2057} {"train_loss": -37.616737365722656, "global_step": 248928, "epoch": 2057} {"train_loss": -41.501800537109375, "global_step": 248929, "epoch": 2057} {"train_loss": -39.194305419921875, "global_step": 248930, "epoch": 2057} {"train_loss": -39.646942138671875, "global_step": 248931, "epoch": 2057} {"train_loss": -39.27998733520508, "global_step": 248932, "epoch": 2057} {"train_loss": -39.955135345458984, "global_step": 248933, "epoch": 2057} {"train_loss": -40.663604736328125, "global_step": 248934, "epoch": 2057} {"train_loss": -40.331783294677734, "global_step": 248935, "epoch": 2057} {"train_loss": -41.90888595581055, "global_step": 248936, "epoch": 2057} {"train_loss": -39.52983093261719, "global_step": 248937, "epoch": 2057} {"train_loss": -40.510005950927734, "global_step": 248938, "epoch": 2057} {"train_loss": -40.71406173706055, "global_step": 248939, "epoch": 2057} {"train_loss": -37.96139907836914, "global_step": 248940, "epoch": 2057} {"train_loss": -39.46293258666992, "global_step": 248941, "epoch": 2057} {"train_loss": -37.865272521972656, "global_step": 248942, "epoch": 2057} {"train_loss": -41.16266632080078, "global_step": 248943, "epoch": 2057} {"train_loss": -41.006351470947266, "global_step": 248944, "epoch": 2057} {"train_loss": -40.91384506225586, "global_step": 248945, "epoch": 2057} {"train_loss": -37.46466827392578, "global_step": 248946, "epoch": 2057} {"train_loss": -41.17679977416992, "global_step": 248947, "epoch": 2057} {"train_loss": -41.31010055541992, "global_step": 248948, "epoch": 2057} {"train_loss": -40.05662536621094, "global_step": 248949, "epoch": 2057} {"train_loss": -41.73436737060547, "global_step": 248950, "epoch": 2057} {"train_loss": -40.96558380126953, "global_step": 248951, "epoch": 2057} {"train_loss": -41.95220947265625, "global_step": 248952, "epoch": 2057} {"train_loss": -41.9344596862793, "global_step": 248953, "epoch": 2057} {"train_loss": -40.925777435302734, "global_step": 248954, "epoch": 2057} {"train_loss": -39.831661224365234, "global_step": 248955, "epoch": 2057} {"train_loss": -40.578704833984375, "global_step": 248956, "epoch": 2057} {"train_loss": -41.57145309448242, "global_step": 248957, "epoch": 2057} {"train_loss": -40.5210075378418, "global_step": 248958, "epoch": 2057} {"train_loss": -41.69424057006836, "global_step": 248959, "epoch": 2057} {"train_loss": -41.0389404296875, "global_step": 248960, "epoch": 2057} {"train_loss": -40.81022262573242, "global_step": 248961, "epoch": 2057} {"train_loss": -39.079708099365234, "global_step": 248962, "epoch": 2057} {"train_loss": -40.5211181640625, "global_step": 248963, "epoch": 2057} {"train_loss": -41.6455192565918, "global_step": 248964, "epoch": 2057} {"train_loss": -40.360836029052734, "global_step": 248965, "epoch": 2057} {"train_loss": -39.95037841796875, "global_step": 248966, "epoch": 2057} {"train_loss": -41.55086135864258, "global_step": 248967, "epoch": 2057} {"train_loss": -40.482513427734375, "global_step": 248968, "epoch": 2057} {"train_loss": -41.64626693725586, "global_step": 248969, "epoch": 2057} {"train_loss": -40.167823791503906, "global_step": 248970, "epoch": 2057} {"train_loss": -42.03536605834961, "global_step": 248971, "epoch": 2057} {"train_loss": -41.0418815612793, "global_step": 248972, "epoch": 2057} {"train_loss": -34.49195098876953, "global_step": 248973, "epoch": 2057} {"train_loss": -40.58742141723633, "global_step": 248974, "epoch": 2057} {"train_loss": -41.7088737487793, "global_step": 248975, "epoch": 2057} {"train_loss": -39.445308685302734, "global_step": 248976, "epoch": 2057} {"train_loss": -39.21598434448242, "global_step": 248977, "epoch": 2057} {"train_loss": -39.45989990234375, "global_step": 248978, "epoch": 2057} {"train_loss": -37.19390869140625, "global_step": 248979, "epoch": 2057} {"train_loss": -40.51922607421875, "global_step": 248980, "epoch": 2057} {"train_loss": -39.6437873840332, "global_step": 248981, "epoch": 2057} {"train_loss": -39.87260818481445, "global_step": 248982, "epoch": 2057} {"train_loss": -36.27863311767578, "global_step": 248983, "epoch": 2057} {"train_loss": -39.65790939331055, "global_step": 248984, "epoch": 2057} {"train_loss": -40.58476638793945, "global_step": 248985, "epoch": 2057} {"train_loss": -39.74397659301758, "global_step": 248986, "epoch": 2057} {"train_loss": -40.62112045288086, "global_step": 248987, "epoch": 2057} {"train_loss": -40.79743194580078, "global_step": 248988, "epoch": 2057} {"train_loss": -38.99400329589844, "global_step": 248989, "epoch": 2057} {"train_loss": -40.9296989440918, "global_step": 248990, "epoch": 2057} {"train_loss": -40.43875503540039, "global_step": 248991, "epoch": 2057} {"train_loss": -39.435089111328125, "global_step": 248992, "epoch": 2057} {"train_loss": -41.220951080322266, "global_step": 248993, "epoch": 2057} {"train_loss": -40.286556243896484, "global_step": 248994, "epoch": 2057} {"train_loss": -39.769622802734375, "global_step": 248995, "epoch": 2057} {"train_loss": -41.2949333190918, "global_step": 248996, "epoch": 2057} {"train_loss": -40.23463821411133, "global_step": 248997, "epoch": 2057} {"train_loss": -41.45441818237305, "global_step": 248998, "epoch": 2057} {"train_loss": -40.92457580566406, "global_step": 248999, "epoch": 2057} {"train_loss": -40.43898391723633, "global_step": 249000, "epoch": 2057} {"train_loss": -41.77802276611328, "global_step": 249001, "epoch": 2057} {"train_loss": -41.01441192626953, "global_step": 249002, "epoch": 2057} {"train_loss": -41.56056594848633, "global_step": 249003, "epoch": 2057} {"train_loss": -41.43067169189453, "global_step": 249004, "epoch": 2057} {"train_loss": -40.348018646240234, "global_step": 249005, "epoch": 2057} {"train_loss": -40.91265869140625, "global_step": 249006, "epoch": 2057} {"train_loss": -41.14677810668945, "global_step": 249007, "epoch": 2057} {"train_loss": -42.075016021728516, "global_step": 249008, "epoch": 2057} {"train_loss": -42.029903411865234, "global_step": 249009, "epoch": 2057} {"train_loss": -41.25162887573242, "global_step": 249010, "epoch": 2057} {"train_loss": -41.36321258544922, "global_step": 249011, "epoch": 2057} {"train_loss": -41.217281341552734, "global_step": 249012, "epoch": 2057} {"train_loss": -41.49915313720703, "global_step": 249013, "epoch": 2057} {"train_loss": -41.64252853393555, "global_step": 249014, "epoch": 2057} {"train_loss": -41.9989128112793, "global_step": 249015, "epoch": 2057} {"train_loss": -41.834407806396484, "global_step": 249016, "epoch": 2057} {"train_loss": -40.78327803178267, "global_step": 249017, "epoch": 2057, "val_loss": 2538255.75} {"train_loss": -42.10042953491211, "global_step": 249018, "epoch": 2058} {"train_loss": -41.14350128173828, "global_step": 249019, "epoch": 2058} {"train_loss": -42.475765228271484, "global_step": 249020, "epoch": 2058} {"train_loss": -42.24664306640625, "global_step": 249021, "epoch": 2058} {"train_loss": -42.316123962402344, "global_step": 249022, "epoch": 2058} {"train_loss": -42.20241165161133, "global_step": 249023, "epoch": 2058} {"train_loss": -41.845638275146484, "global_step": 249024, "epoch": 2058} {"train_loss": -41.697540283203125, "global_step": 249025, "epoch": 2058} {"train_loss": -42.287506103515625, "global_step": 249026, "epoch": 2058} {"train_loss": -41.753910064697266, "global_step": 249027, "epoch": 2058} {"train_loss": -42.34694290161133, "global_step": 249028, "epoch": 2058} {"train_loss": -41.961761474609375, "global_step": 249029, "epoch": 2058} {"train_loss": -41.496620178222656, "global_step": 249030, "epoch": 2058} {"train_loss": -42.49734115600586, "global_step": 249031, "epoch": 2058} {"train_loss": -42.1738395690918, "global_step": 249032, "epoch": 2058} {"train_loss": -41.91538619995117, "global_step": 249033, "epoch": 2058} {"train_loss": -41.29543685913086, "global_step": 249034, "epoch": 2058} {"train_loss": -42.3050422668457, "global_step": 249035, "epoch": 2058} {"train_loss": -42.580745697021484, "global_step": 249036, "epoch": 2058} {"train_loss": -42.127628326416016, "global_step": 249037, "epoch": 2058} {"train_loss": -42.76131820678711, "global_step": 249038, "epoch": 2058} {"train_loss": -41.63677978515625, "global_step": 249039, "epoch": 2058} {"train_loss": -42.52939987182617, "global_step": 249040, "epoch": 2058} {"train_loss": -41.667171478271484, "global_step": 249041, "epoch": 2058} {"train_loss": -42.621986389160156, "global_step": 249042, "epoch": 2058} {"train_loss": -42.750125885009766, "global_step": 249043, "epoch": 2058} {"train_loss": -42.99596405029297, "global_step": 249044, "epoch": 2058} {"train_loss": -42.933189392089844, "global_step": 249045, "epoch": 2058} {"train_loss": -42.45855712890625, "global_step": 249046, "epoch": 2058} {"train_loss": -43.07907485961914, "global_step": 249047, "epoch": 2058} {"train_loss": -42.60880661010742, "global_step": 249048, "epoch": 2058} {"train_loss": -42.94793701171875, "global_step": 249049, "epoch": 2058} {"train_loss": -42.67072677612305, "global_step": 249050, "epoch": 2058} {"train_loss": -42.59504699707031, "global_step": 249051, "epoch": 2058} {"train_loss": -42.71926498413086, "global_step": 249052, "epoch": 2058} {"train_loss": -42.34244918823242, "global_step": 249053, "epoch": 2058} {"train_loss": -41.97489547729492, "global_step": 249054, "epoch": 2058} {"train_loss": -42.912593841552734, "global_step": 249055, "epoch": 2058} {"train_loss": -41.962825775146484, "global_step": 249056, "epoch": 2058} {"train_loss": -41.61909866333008, "global_step": 249057, "epoch": 2058} {"train_loss": -42.60649490356445, "global_step": 249058, "epoch": 2058} {"train_loss": -43.30035400390625, "global_step": 249059, "epoch": 2058} {"train_loss": -42.556880950927734, "global_step": 249060, "epoch": 2058} {"train_loss": -43.021881103515625, "global_step": 249061, "epoch": 2058} {"train_loss": -42.81007766723633, "global_step": 249062, "epoch": 2058} {"train_loss": -42.5223388671875, "global_step": 249063, "epoch": 2058} {"train_loss": -43.0565185546875, "global_step": 249064, "epoch": 2058} {"train_loss": -43.46590042114258, "global_step": 249065, "epoch": 2058} {"train_loss": -42.70254135131836, "global_step": 249066, "epoch": 2058} {"train_loss": -43.32044219970703, "global_step": 249067, "epoch": 2058} {"train_loss": -43.54251480102539, "global_step": 249068, "epoch": 2058} {"train_loss": -42.7572135925293, "global_step": 249069, "epoch": 2058} {"train_loss": -42.08310317993164, "global_step": 249070, "epoch": 2058} {"train_loss": -42.21555709838867, "global_step": 249071, "epoch": 2058} {"train_loss": -42.41911697387695, "global_step": 249072, "epoch": 2058} {"train_loss": -42.80038070678711, "global_step": 249073, "epoch": 2058} {"train_loss": -40.776790618896484, "global_step": 249074, "epoch": 2058} {"train_loss": -41.74837875366211, "global_step": 249075, "epoch": 2058} {"train_loss": -43.01424789428711, "global_step": 249076, "epoch": 2058} {"train_loss": -43.052005767822266, "global_step": 249077, "epoch": 2058} {"train_loss": -42.00704574584961, "global_step": 249078, "epoch": 2058} {"train_loss": -40.28718566894531, "global_step": 249079, "epoch": 2058} {"train_loss": -42.12349319458008, "global_step": 249080, "epoch": 2058} {"train_loss": -41.357826232910156, "global_step": 249081, "epoch": 2058} {"train_loss": -39.20418930053711, "global_step": 249082, "epoch": 2058} {"train_loss": -38.40137481689453, "global_step": 249083, "epoch": 2058} {"train_loss": -41.699378967285156, "global_step": 249084, "epoch": 2058} {"train_loss": -42.536460876464844, "global_step": 249085, "epoch": 2058} {"train_loss": -41.133880615234375, "global_step": 249086, "epoch": 2058} {"train_loss": -40.58490753173828, "global_step": 249087, "epoch": 2058} {"train_loss": -41.128021240234375, "global_step": 249088, "epoch": 2058} {"train_loss": -41.743804931640625, "global_step": 249089, "epoch": 2058} {"train_loss": -41.60702133178711, "global_step": 249090, "epoch": 2058} {"train_loss": -42.04579162597656, "global_step": 249091, "epoch": 2058} {"train_loss": -41.3828010559082, "global_step": 249092, "epoch": 2058} {"train_loss": -40.562801361083984, "global_step": 249093, "epoch": 2058} {"train_loss": -42.055782318115234, "global_step": 249094, "epoch": 2058} {"train_loss": -42.38930892944336, "global_step": 249095, "epoch": 2058} {"train_loss": -40.61882019042969, "global_step": 249096, "epoch": 2058} {"train_loss": -40.5277099609375, "global_step": 249097, "epoch": 2058} {"train_loss": -42.175758361816406, "global_step": 249098, "epoch": 2058} {"train_loss": -41.94586181640625, "global_step": 249099, "epoch": 2058} {"train_loss": -42.73952865600586, "global_step": 249100, "epoch": 2058} {"train_loss": -42.54133224487305, "global_step": 249101, "epoch": 2058} {"train_loss": -42.54282760620117, "global_step": 249102, "epoch": 2058} {"train_loss": -42.764564514160156, "global_step": 249103, "epoch": 2058} {"train_loss": -43.04596710205078, "global_step": 249104, "epoch": 2058} {"train_loss": -42.2285270690918, "global_step": 249105, "epoch": 2058} {"train_loss": -42.23652267456055, "global_step": 249106, "epoch": 2058} {"train_loss": -43.481998443603516, "global_step": 249107, "epoch": 2058} {"train_loss": -42.27152633666992, "global_step": 249108, "epoch": 2058} {"train_loss": -42.47654724121094, "global_step": 249109, "epoch": 2058} {"train_loss": -42.36846923828125, "global_step": 249110, "epoch": 2058} {"train_loss": -41.40932846069336, "global_step": 249111, "epoch": 2058} {"train_loss": -42.56732177734375, "global_step": 249112, "epoch": 2058} {"train_loss": -43.013465881347656, "global_step": 249113, "epoch": 2058} {"train_loss": -42.61927032470703, "global_step": 249114, "epoch": 2058} {"train_loss": -42.3427619934082, "global_step": 249115, "epoch": 2058} {"train_loss": -39.709938049316406, "global_step": 249116, "epoch": 2058} {"train_loss": -43.24120330810547, "global_step": 249117, "epoch": 2058} {"train_loss": -42.79177474975586, "global_step": 249118, "epoch": 2058} {"train_loss": -38.9538688659668, "global_step": 249119, "epoch": 2058} {"train_loss": -42.6888427734375, "global_step": 249120, "epoch": 2058} {"train_loss": -43.2452278137207, "global_step": 249121, "epoch": 2058} {"train_loss": -42.97010040283203, "global_step": 249122, "epoch": 2058} {"train_loss": -41.476409912109375, "global_step": 249123, "epoch": 2058} {"train_loss": -40.460845947265625, "global_step": 249124, "epoch": 2058} {"train_loss": -42.90478515625, "global_step": 249125, "epoch": 2058} {"train_loss": -42.45091247558594, "global_step": 249126, "epoch": 2058} {"train_loss": -42.0488166809082, "global_step": 249127, "epoch": 2058} {"train_loss": -40.670494079589844, "global_step": 249128, "epoch": 2058} {"train_loss": -42.68378829956055, "global_step": 249129, "epoch": 2058} {"train_loss": -40.4853630065918, "global_step": 249130, "epoch": 2058} {"train_loss": -38.86058044433594, "global_step": 249131, "epoch": 2058} {"train_loss": -41.04372787475586, "global_step": 249132, "epoch": 2058} {"train_loss": -40.88629913330078, "global_step": 249133, "epoch": 2058} {"train_loss": -39.09632110595703, "global_step": 249134, "epoch": 2058} {"train_loss": -38.04323959350586, "global_step": 249135, "epoch": 2058} {"train_loss": -42.60335922241211, "global_step": 249136, "epoch": 2058} {"train_loss": -41.64071273803711, "global_step": 249137, "epoch": 2058} {"train_loss": -42.010296845239054, "global_step": 249138, "epoch": 2058, "val_loss": 3076336.25} {"train_loss": -41.5400390625, "global_step": 249139, "epoch": 2059} {"train_loss": -41.450321197509766, "global_step": 249140, "epoch": 2059} {"train_loss": -42.60274887084961, "global_step": 249141, "epoch": 2059} {"train_loss": -42.5224494934082, "global_step": 249142, "epoch": 2059} {"train_loss": -40.204097747802734, "global_step": 249143, "epoch": 2059} {"train_loss": -41.92153549194336, "global_step": 249144, "epoch": 2059} {"train_loss": -42.45490264892578, "global_step": 249145, "epoch": 2059} {"train_loss": -42.11492919921875, "global_step": 249146, "epoch": 2059} {"train_loss": -41.68775177001953, "global_step": 249147, "epoch": 2059} {"train_loss": -41.87213134765625, "global_step": 249148, "epoch": 2059} {"train_loss": -41.18072509765625, "global_step": 249149, "epoch": 2059} {"train_loss": -41.270748138427734, "global_step": 249150, "epoch": 2059} {"train_loss": -39.4747200012207, "global_step": 249151, "epoch": 2059} {"train_loss": -41.84596252441406, "global_step": 249152, "epoch": 2059} {"train_loss": -39.98857879638672, "global_step": 249153, "epoch": 2059} {"train_loss": -40.19053268432617, "global_step": 249154, "epoch": 2059} {"train_loss": -41.03626251220703, "global_step": 249155, "epoch": 2059} {"train_loss": -41.522457122802734, "global_step": 249156, "epoch": 2059} {"train_loss": -40.1148796081543, "global_step": 249157, "epoch": 2059} {"train_loss": -40.10791015625, "global_step": 249158, "epoch": 2059} {"train_loss": -40.087093353271484, "global_step": 249159, "epoch": 2059} {"train_loss": -39.731170654296875, "global_step": 249160, "epoch": 2059} {"train_loss": -40.272579193115234, "global_step": 249161, "epoch": 2059} {"train_loss": -42.442562103271484, "global_step": 249162, "epoch": 2059} {"train_loss": -39.272216796875, "global_step": 249163, "epoch": 2059} {"train_loss": -40.878822326660156, "global_step": 249164, "epoch": 2059} {"train_loss": -42.02207565307617, "global_step": 249165, "epoch": 2059} {"train_loss": -40.87158203125, "global_step": 249166, "epoch": 2059} {"train_loss": -35.42512130737305, "global_step": 249167, "epoch": 2059} {"train_loss": -40.39944076538086, "global_step": 249168, "epoch": 2059} {"train_loss": -41.10610580444336, "global_step": 249169, "epoch": 2059} {"train_loss": -38.47414779663086, "global_step": 249170, "epoch": 2059} {"train_loss": -38.67049026489258, "global_step": 249171, "epoch": 2059} {"train_loss": -40.75081253051758, "global_step": 249172, "epoch": 2059} {"train_loss": -41.300025939941406, "global_step": 249173, "epoch": 2059} {"train_loss": -38.383480072021484, "global_step": 249174, "epoch": 2059} {"train_loss": -39.31726837158203, "global_step": 249175, "epoch": 2059} {"train_loss": -41.3675651550293, "global_step": 249176, "epoch": 2059} {"train_loss": -38.944576263427734, "global_step": 249177, "epoch": 2059} {"train_loss": -40.94342803955078, "global_step": 249178, "epoch": 2059} {"train_loss": -40.825927734375, "global_step": 249179, "epoch": 2059} {"train_loss": -40.79483413696289, "global_step": 249180, "epoch": 2059} {"train_loss": -39.16424560546875, "global_step": 249181, "epoch": 2059} {"train_loss": -40.4597282409668, "global_step": 249182, "epoch": 2059} {"train_loss": -41.238956451416016, "global_step": 249183, "epoch": 2059} {"train_loss": -41.29328536987305, "global_step": 249184, "epoch": 2059} {"train_loss": -41.80482482910156, "global_step": 249185, "epoch": 2059} {"train_loss": -41.468074798583984, "global_step": 249186, "epoch": 2059} {"train_loss": -41.27386474609375, "global_step": 249187, "epoch": 2059} {"train_loss": -40.4608154296875, "global_step": 249188, "epoch": 2059} {"train_loss": -41.45515060424805, "global_step": 249189, "epoch": 2059} {"train_loss": -42.043724060058594, "global_step": 249190, "epoch": 2059} {"train_loss": -41.3105354309082, "global_step": 249191, "epoch": 2059} {"train_loss": -41.67072677612305, "global_step": 249192, "epoch": 2059} {"train_loss": -40.5610466003418, "global_step": 249193, "epoch": 2059} {"train_loss": -36.89509963989258, "global_step": 249194, "epoch": 2059} {"train_loss": -40.068824768066406, "global_step": 249195, "epoch": 2059} {"train_loss": -42.63615798950195, "global_step": 249196, "epoch": 2059} {"train_loss": -41.660709381103516, "global_step": 249197, "epoch": 2059} {"train_loss": -40.993064880371094, "global_step": 249198, "epoch": 2059} {"train_loss": -41.93202590942383, "global_step": 249199, "epoch": 2059} {"train_loss": -42.208412170410156, "global_step": 249200, "epoch": 2059} {"train_loss": -41.51698684692383, "global_step": 249201, "epoch": 2059} {"train_loss": -40.42142868041992, "global_step": 249202, "epoch": 2059} {"train_loss": -40.691749572753906, "global_step": 249203, "epoch": 2059} {"train_loss": -41.45547103881836, "global_step": 249204, "epoch": 2059} {"train_loss": -41.29519271850586, "global_step": 249205, "epoch": 2059} {"train_loss": -41.55504608154297, "global_step": 249206, "epoch": 2059} {"train_loss": -42.284908294677734, "global_step": 249207, "epoch": 2059} {"train_loss": -42.302040100097656, "global_step": 249208, "epoch": 2059} {"train_loss": -39.32831954956055, "global_step": 249209, "epoch": 2059} {"train_loss": -42.121124267578125, "global_step": 249210, "epoch": 2059} {"train_loss": -41.37716293334961, "global_step": 249211, "epoch": 2059} {"train_loss": -42.07011032104492, "global_step": 249212, "epoch": 2059} {"train_loss": -40.61444091796875, "global_step": 249213, "epoch": 2059} {"train_loss": -41.626426696777344, "global_step": 249214, "epoch": 2059} {"train_loss": -40.53236770629883, "global_step": 249215, "epoch": 2059} {"train_loss": -42.56501007080078, "global_step": 249216, "epoch": 2059} {"train_loss": -41.963680267333984, "global_step": 249217, "epoch": 2059} {"train_loss": -41.58181381225586, "global_step": 249218, "epoch": 2059} {"train_loss": -41.814361572265625, "global_step": 249219, "epoch": 2059} {"train_loss": -41.09060287475586, "global_step": 249220, "epoch": 2059} {"train_loss": -40.859859466552734, "global_step": 249221, "epoch": 2059} {"train_loss": -42.75739669799805, "global_step": 249222, "epoch": 2059} {"train_loss": -42.674957275390625, "global_step": 249223, "epoch": 2059} {"train_loss": -42.08974838256836, "global_step": 249224, "epoch": 2059} {"train_loss": -40.84314727783203, "global_step": 249225, "epoch": 2059} {"train_loss": -40.38357162475586, "global_step": 249226, "epoch": 2059} {"train_loss": -41.03278732299805, "global_step": 249227, "epoch": 2059} {"train_loss": -41.80029296875, "global_step": 249228, "epoch": 2059} {"train_loss": -41.635520935058594, "global_step": 249229, "epoch": 2059} {"train_loss": -41.771392822265625, "global_step": 249230, "epoch": 2059} {"train_loss": -42.67009353637695, "global_step": 249231, "epoch": 2059} {"train_loss": -42.0894889831543, "global_step": 249232, "epoch": 2059} {"train_loss": -41.476951599121094, "global_step": 249233, "epoch": 2059} {"train_loss": -42.11989974975586, "global_step": 249234, "epoch": 2059} {"train_loss": -42.22456741333008, "global_step": 249235, "epoch": 2059} {"train_loss": -42.287689208984375, "global_step": 249236, "epoch": 2059} {"train_loss": -41.9781608581543, "global_step": 249237, "epoch": 2059} {"train_loss": -41.19780349731445, "global_step": 249238, "epoch": 2059} {"train_loss": -42.12392807006836, "global_step": 249239, "epoch": 2059} {"train_loss": -41.40559768676758, "global_step": 249240, "epoch": 2059} {"train_loss": -42.41958236694336, "global_step": 249241, "epoch": 2059} {"train_loss": -42.08837890625, "global_step": 249242, "epoch": 2059} {"train_loss": -42.45820617675781, "global_step": 249243, "epoch": 2059} {"train_loss": -42.23040771484375, "global_step": 249244, "epoch": 2059} {"train_loss": -42.305992126464844, "global_step": 249245, "epoch": 2059} {"train_loss": -42.83161544799805, "global_step": 249246, "epoch": 2059} {"train_loss": -42.488216400146484, "global_step": 249247, "epoch": 2059} {"train_loss": -42.05553436279297, "global_step": 249248, "epoch": 2059} {"train_loss": -42.718772888183594, "global_step": 249249, "epoch": 2059} {"train_loss": -42.3350944519043, "global_step": 249250, "epoch": 2059} {"train_loss": -42.901588439941406, "global_step": 249251, "epoch": 2059} {"train_loss": -42.74711990356445, "global_step": 249252, "epoch": 2059} {"train_loss": -42.683406829833984, "global_step": 249253, "epoch": 2059} {"train_loss": -43.46653366088867, "global_step": 249254, "epoch": 2059} {"train_loss": -43.026275634765625, "global_step": 249255, "epoch": 2059} {"train_loss": -42.06252670288086, "global_step": 249256, "epoch": 2059} {"train_loss": -43.07146453857422, "global_step": 249257, "epoch": 2059} {"train_loss": -43.57426071166992, "global_step": 249258, "epoch": 2059} {"train_loss": -41.340271563569374, "global_step": 249259, "epoch": 2059, "val_loss": 2514226.25} {"train_loss": -41.35394287109375, "global_step": 249260, "epoch": 2060} {"train_loss": -42.64498519897461, "global_step": 249261, "epoch": 2060} {"train_loss": -43.29378128051758, "global_step": 249262, "epoch": 2060} {"train_loss": -42.579200744628906, "global_step": 249263, "epoch": 2060} {"train_loss": -42.457218170166016, "global_step": 249264, "epoch": 2060} {"train_loss": -43.31345748901367, "global_step": 249265, "epoch": 2060} {"train_loss": -42.4267692565918, "global_step": 249266, "epoch": 2060} {"train_loss": -41.723262786865234, "global_step": 249267, "epoch": 2060} {"train_loss": -40.28374099731445, "global_step": 249268, "epoch": 2060} {"train_loss": -40.16845703125, "global_step": 249269, "epoch": 2060} {"train_loss": -39.018707275390625, "global_step": 249270, "epoch": 2060} {"train_loss": -37.385066986083984, "global_step": 249271, "epoch": 2060} {"train_loss": -37.7241325378418, "global_step": 249272, "epoch": 2060} {"train_loss": -39.5991325378418, "global_step": 249273, "epoch": 2060} {"train_loss": -40.87648391723633, "global_step": 249274, "epoch": 2060} {"train_loss": -36.71236038208008, "global_step": 249275, "epoch": 2060} {"train_loss": -36.62474822998047, "global_step": 249276, "epoch": 2060} {"train_loss": -41.7138786315918, "global_step": 249277, "epoch": 2060} {"train_loss": -40.0996208190918, "global_step": 249278, "epoch": 2060} {"train_loss": -33.58537673950195, "global_step": 249279, "epoch": 2060} {"train_loss": -38.59622573852539, "global_step": 249280, "epoch": 2060} {"train_loss": -39.67909240722656, "global_step": 249281, "epoch": 2060} {"train_loss": -38.84367752075195, "global_step": 249282, "epoch": 2060} {"train_loss": -40.24170684814453, "global_step": 249283, "epoch": 2060} {"train_loss": -40.409210205078125, "global_step": 249284, "epoch": 2060} {"train_loss": -38.37455749511719, "global_step": 249285, "epoch": 2060} {"train_loss": -39.96549987792969, "global_step": 249286, "epoch": 2060} {"train_loss": -40.44027328491211, "global_step": 249287, "epoch": 2060} {"train_loss": -40.2294807434082, "global_step": 249288, "epoch": 2060} {"train_loss": -40.090267181396484, "global_step": 249289, "epoch": 2060} {"train_loss": -40.8062629699707, "global_step": 249290, "epoch": 2060} {"train_loss": -39.34111404418945, "global_step": 249291, "epoch": 2060} {"train_loss": -40.35407638549805, "global_step": 249292, "epoch": 2060} {"train_loss": -39.456600189208984, "global_step": 249293, "epoch": 2060} {"train_loss": -40.70835494995117, "global_step": 249294, "epoch": 2060} {"train_loss": -41.257102966308594, "global_step": 249295, "epoch": 2060} {"train_loss": -40.56795120239258, "global_step": 249296, "epoch": 2060} {"train_loss": -40.54206085205078, "global_step": 249297, "epoch": 2060} {"train_loss": -40.92763137817383, "global_step": 249298, "epoch": 2060} {"train_loss": -40.92856979370117, "global_step": 249299, "epoch": 2060} {"train_loss": -40.19528579711914, "global_step": 249300, "epoch": 2060} {"train_loss": -41.78036117553711, "global_step": 249301, "epoch": 2060} {"train_loss": -41.20882797241211, "global_step": 249302, "epoch": 2060} {"train_loss": -41.572021484375, "global_step": 249303, "epoch": 2060} {"train_loss": -41.06974792480469, "global_step": 249304, "epoch": 2060} {"train_loss": -41.96358108520508, "global_step": 249305, "epoch": 2060} {"train_loss": -41.544219970703125, "global_step": 249306, "epoch": 2060} {"train_loss": -41.824764251708984, "global_step": 249307, "epoch": 2060} {"train_loss": -41.972408294677734, "global_step": 249308, "epoch": 2060} {"train_loss": -42.145145416259766, "global_step": 249309, "epoch": 2060} {"train_loss": -42.056941986083984, "global_step": 249310, "epoch": 2060} {"train_loss": -42.03329086303711, "global_step": 249311, "epoch": 2060} {"train_loss": -42.132137298583984, "global_step": 249312, "epoch": 2060} {"train_loss": -42.09154510498047, "global_step": 249313, "epoch": 2060} {"train_loss": -41.66326904296875, "global_step": 249314, "epoch": 2060} {"train_loss": -42.488426208496094, "global_step": 249315, "epoch": 2060} {"train_loss": -42.140499114990234, "global_step": 249316, "epoch": 2060} {"train_loss": -42.469234466552734, "global_step": 249317, "epoch": 2060} {"train_loss": -42.34331130981445, "global_step": 249318, "epoch": 2060} {"train_loss": -42.690425872802734, "global_step": 249319, "epoch": 2060} {"train_loss": -42.52509689331055, "global_step": 249320, "epoch": 2060} {"train_loss": -42.24934768676758, "global_step": 249321, "epoch": 2060} {"train_loss": -42.5203971862793, "global_step": 249322, "epoch": 2060} {"train_loss": -42.68447494506836, "global_step": 249323, "epoch": 2060} {"train_loss": -41.635616302490234, "global_step": 249324, "epoch": 2060} {"train_loss": -42.68612289428711, "global_step": 249325, "epoch": 2060} {"train_loss": -41.13935852050781, "global_step": 249326, "epoch": 2060} {"train_loss": -42.295772552490234, "global_step": 249327, "epoch": 2060} {"train_loss": -42.76192855834961, "global_step": 249328, "epoch": 2060} {"train_loss": -42.37879943847656, "global_step": 249329, "epoch": 2060} {"train_loss": -41.66201400756836, "global_step": 249330, "epoch": 2060} {"train_loss": -41.7297477722168, "global_step": 249331, "epoch": 2060} {"train_loss": -42.35818099975586, "global_step": 249332, "epoch": 2060} {"train_loss": -43.02080154418945, "global_step": 249333, "epoch": 2060} {"train_loss": -42.6383056640625, "global_step": 249334, "epoch": 2060} {"train_loss": -43.30921936035156, "global_step": 249335, "epoch": 2060} {"train_loss": -42.18032455444336, "global_step": 249336, "epoch": 2060} {"train_loss": -42.27061080932617, "global_step": 249337, "epoch": 2060} {"train_loss": -42.115421295166016, "global_step": 249338, "epoch": 2060} {"train_loss": -42.633846282958984, "global_step": 249339, "epoch": 2060} {"train_loss": -43.0157585144043, "global_step": 249340, "epoch": 2060} {"train_loss": -42.723323822021484, "global_step": 249341, "epoch": 2060} {"train_loss": -43.14510726928711, "global_step": 249342, "epoch": 2060} {"train_loss": -43.04984664916992, "global_step": 249343, "epoch": 2060} {"train_loss": -42.97086715698242, "global_step": 249344, "epoch": 2060} {"train_loss": -43.59524154663086, "global_step": 249345, "epoch": 2060} {"train_loss": -43.2009162902832, "global_step": 249346, "epoch": 2060} {"train_loss": -43.5352668762207, "global_step": 249347, "epoch": 2060} {"train_loss": -42.867088317871094, "global_step": 249348, "epoch": 2060} {"train_loss": -42.03654098510742, "global_step": 249349, "epoch": 2060} {"train_loss": -41.11421585083008, "global_step": 249350, "epoch": 2060} {"train_loss": -39.006404876708984, "global_step": 249351, "epoch": 2060} {"train_loss": -37.6937370300293, "global_step": 249352, "epoch": 2060} {"train_loss": -36.97107696533203, "global_step": 249353, "epoch": 2060} {"train_loss": -41.20209884643555, "global_step": 249354, "epoch": 2060} {"train_loss": -42.04966735839844, "global_step": 249355, "epoch": 2060} {"train_loss": -33.5621337890625, "global_step": 249356, "epoch": 2060} {"train_loss": -24.275842666625977, "global_step": 249357, "epoch": 2060} {"train_loss": -32.475433349609375, "global_step": 249358, "epoch": 2060} {"train_loss": -40.86383819580078, "global_step": 249359, "epoch": 2060} {"train_loss": -20.722110748291016, "global_step": 249360, "epoch": 2060} {"train_loss": -27.59037208557129, "global_step": 249361, "epoch": 2060} {"train_loss": -38.60380172729492, "global_step": 249362, "epoch": 2060} {"train_loss": -28.282236099243164, "global_step": 249363, "epoch": 2060} {"train_loss": -41.0574951171875, "global_step": 249364, "epoch": 2060} {"train_loss": -33.08729934692383, "global_step": 249365, "epoch": 2060} {"train_loss": -41.64253616333008, "global_step": 249366, "epoch": 2060} {"train_loss": -34.625404357910156, "global_step": 249367, "epoch": 2060} {"train_loss": -40.90121078491211, "global_step": 249368, "epoch": 2060} {"train_loss": -37.836238861083984, "global_step": 249369, "epoch": 2060} {"train_loss": -39.96272659301758, "global_step": 249370, "epoch": 2060} {"train_loss": -40.295291900634766, "global_step": 249371, "epoch": 2060} {"train_loss": -36.53257369995117, "global_step": 249372, "epoch": 2060} {"train_loss": -38.20914840698242, "global_step": 249373, "epoch": 2060} {"train_loss": -37.75332260131836, "global_step": 249374, "epoch": 2060} {"train_loss": -40.44480514526367, "global_step": 249375, "epoch": 2060} {"train_loss": -39.8324089050293, "global_step": 249376, "epoch": 2060} {"train_loss": -40.029396057128906, "global_step": 249377, "epoch": 2060} {"train_loss": -41.748451232910156, "global_step": 249378, "epoch": 2060} {"train_loss": -40.55821990966797, "global_step": 249379, "epoch": 2060} {"train_loss": -40.24567033436673, "global_step": 249380, "epoch": 2060, "val_loss": 2598364.0} {"train_loss": -41.35569381713867, "global_step": 249381, "epoch": 2061} {"train_loss": -40.699241638183594, "global_step": 249382, "epoch": 2061} {"train_loss": -40.96260070800781, "global_step": 249383, "epoch": 2061} {"train_loss": -40.9296989440918, "global_step": 249384, "epoch": 2061} {"train_loss": -40.800254821777344, "global_step": 249385, "epoch": 2061} {"train_loss": -40.692909240722656, "global_step": 249386, "epoch": 2061} {"train_loss": -40.5262451171875, "global_step": 249387, "epoch": 2061} {"train_loss": -41.20586013793945, "global_step": 249388, "epoch": 2061} {"train_loss": -41.2298583984375, "global_step": 249389, "epoch": 2061} {"train_loss": -41.4847297668457, "global_step": 249390, "epoch": 2061} {"train_loss": -41.99575424194336, "global_step": 249391, "epoch": 2061} {"train_loss": -41.88923263549805, "global_step": 249392, "epoch": 2061} {"train_loss": -41.41654586791992, "global_step": 249393, "epoch": 2061} {"train_loss": -42.23713302612305, "global_step": 249394, "epoch": 2061} {"train_loss": -42.090145111083984, "global_step": 249395, "epoch": 2061} {"train_loss": -42.06694030761719, "global_step": 249396, "epoch": 2061} {"train_loss": -41.933895111083984, "global_step": 249397, "epoch": 2061} {"train_loss": -41.961605072021484, "global_step": 249398, "epoch": 2061} {"train_loss": -41.776241302490234, "global_step": 249399, "epoch": 2061} {"train_loss": -42.3641471862793, "global_step": 249400, "epoch": 2061} {"train_loss": -42.32807540893555, "global_step": 249401, "epoch": 2061} {"train_loss": -42.14539337158203, "global_step": 249402, "epoch": 2061} {"train_loss": -42.4368896484375, "global_step": 249403, "epoch": 2061} {"train_loss": -42.550113677978516, "global_step": 249404, "epoch": 2061} {"train_loss": -42.45316696166992, "global_step": 249405, "epoch": 2061} {"train_loss": -43.01481246948242, "global_step": 249406, "epoch": 2061} {"train_loss": -42.708038330078125, "global_step": 249407, "epoch": 2061} {"train_loss": -43.040016174316406, "global_step": 249408, "epoch": 2061} {"train_loss": -42.61649703979492, "global_step": 249409, "epoch": 2061} {"train_loss": -42.8046989440918, "global_step": 249410, "epoch": 2061} {"train_loss": -42.965335845947266, "global_step": 249411, "epoch": 2061} {"train_loss": -42.86989974975586, "global_step": 249412, "epoch": 2061} {"train_loss": -42.66651153564453, "global_step": 249413, "epoch": 2061} {"train_loss": -41.2952995300293, "global_step": 249414, "epoch": 2061} {"train_loss": -42.928829193115234, "global_step": 249415, "epoch": 2061} {"train_loss": -42.561519622802734, "global_step": 249416, "epoch": 2061} {"train_loss": -42.96124267578125, "global_step": 249417, "epoch": 2061} {"train_loss": -42.61697006225586, "global_step": 249418, "epoch": 2061} {"train_loss": -43.06232833862305, "global_step": 249419, "epoch": 2061} {"train_loss": -42.903076171875, "global_step": 249420, "epoch": 2061} {"train_loss": -42.3635139465332, "global_step": 249421, "epoch": 2061} {"train_loss": -43.20254898071289, "global_step": 249422, "epoch": 2061} {"train_loss": -42.54868698120117, "global_step": 249423, "epoch": 2061} {"train_loss": -42.72163009643555, "global_step": 249424, "epoch": 2061} {"train_loss": -43.05060958862305, "global_step": 249425, "epoch": 2061} {"train_loss": -43.185203552246094, "global_step": 249426, "epoch": 2061} {"train_loss": -43.29378128051758, "global_step": 249427, "epoch": 2061} {"train_loss": -43.37874984741211, "global_step": 249428, "epoch": 2061} {"train_loss": -42.903202056884766, "global_step": 249429, "epoch": 2061} {"train_loss": -41.20120620727539, "global_step": 249430, "epoch": 2061} {"train_loss": -42.67930221557617, "global_step": 249431, "epoch": 2061} {"train_loss": -42.810482025146484, "global_step": 249432, "epoch": 2061} {"train_loss": -42.6387825012207, "global_step": 249433, "epoch": 2061} {"train_loss": -42.62354278564453, "global_step": 249434, "epoch": 2061} {"train_loss": -43.65624237060547, "global_step": 249435, "epoch": 2061} {"train_loss": -42.77159118652344, "global_step": 249436, "epoch": 2061} {"train_loss": -43.03057098388672, "global_step": 249437, "epoch": 2061} {"train_loss": -42.92109680175781, "global_step": 249438, "epoch": 2061} {"train_loss": -43.5733757019043, "global_step": 249439, "epoch": 2061} {"train_loss": -43.684532165527344, "global_step": 249440, "epoch": 2061} {"train_loss": -43.48588943481445, "global_step": 249441, "epoch": 2061} {"train_loss": -43.794776916503906, "global_step": 249442, "epoch": 2061} {"train_loss": -43.148719787597656, "global_step": 249443, "epoch": 2061} {"train_loss": -43.62138366699219, "global_step": 249444, "epoch": 2061} {"train_loss": -42.161983489990234, "global_step": 249445, "epoch": 2061} {"train_loss": -43.575618743896484, "global_step": 249446, "epoch": 2061} {"train_loss": -43.45981216430664, "global_step": 249447, "epoch": 2061} {"train_loss": -42.39243698120117, "global_step": 249448, "epoch": 2061} {"train_loss": -42.879295349121094, "global_step": 249449, "epoch": 2061} {"train_loss": -42.3989143371582, "global_step": 249450, "epoch": 2061} {"train_loss": -43.12928771972656, "global_step": 249451, "epoch": 2061} {"train_loss": -41.19865036010742, "global_step": 249452, "epoch": 2061} {"train_loss": -41.53226852416992, "global_step": 249453, "epoch": 2061} {"train_loss": -40.938262939453125, "global_step": 249454, "epoch": 2061} {"train_loss": -42.2650146484375, "global_step": 249455, "epoch": 2061} {"train_loss": -42.737728118896484, "global_step": 249456, "epoch": 2061} {"train_loss": -42.51085662841797, "global_step": 249457, "epoch": 2061} {"train_loss": -41.002349853515625, "global_step": 249458, "epoch": 2061} {"train_loss": -39.254974365234375, "global_step": 249459, "epoch": 2061} {"train_loss": -42.23582458496094, "global_step": 249460, "epoch": 2061} {"train_loss": -42.794654846191406, "global_step": 249461, "epoch": 2061} {"train_loss": -41.297515869140625, "global_step": 249462, "epoch": 2061} {"train_loss": -41.76151657104492, "global_step": 249463, "epoch": 2061} {"train_loss": -41.89009475708008, "global_step": 249464, "epoch": 2061} {"train_loss": -42.24984359741211, "global_step": 249465, "epoch": 2061} {"train_loss": -42.22914505004883, "global_step": 249466, "epoch": 2061} {"train_loss": -41.62333297729492, "global_step": 249467, "epoch": 2061} {"train_loss": -41.388790130615234, "global_step": 249468, "epoch": 2061} {"train_loss": -42.581295013427734, "global_step": 249469, "epoch": 2061} {"train_loss": -41.594451904296875, "global_step": 249470, "epoch": 2061} {"train_loss": -42.039669036865234, "global_step": 249471, "epoch": 2061} {"train_loss": -42.41279220581055, "global_step": 249472, "epoch": 2061} {"train_loss": -42.05219268798828, "global_step": 249473, "epoch": 2061} {"train_loss": -42.55609130859375, "global_step": 249474, "epoch": 2061} {"train_loss": -42.50020217895508, "global_step": 249475, "epoch": 2061} {"train_loss": -42.3090705871582, "global_step": 249476, "epoch": 2061} {"train_loss": -42.868682861328125, "global_step": 249477, "epoch": 2061} {"train_loss": -42.08123779296875, "global_step": 249478, "epoch": 2061} {"train_loss": -42.81382369995117, "global_step": 249479, "epoch": 2061} {"train_loss": -43.061065673828125, "global_step": 249480, "epoch": 2061} {"train_loss": -42.57360076904297, "global_step": 249481, "epoch": 2061} {"train_loss": -42.898895263671875, "global_step": 249482, "epoch": 2061} {"train_loss": -42.59803009033203, "global_step": 249483, "epoch": 2061} {"train_loss": -43.19350814819336, "global_step": 249484, "epoch": 2061} {"train_loss": -43.07124710083008, "global_step": 249485, "epoch": 2061} {"train_loss": -42.75777816772461, "global_step": 249486, "epoch": 2061} {"train_loss": -43.110172271728516, "global_step": 249487, "epoch": 2061} {"train_loss": -42.52231979370117, "global_step": 249488, "epoch": 2061} {"train_loss": -42.793453216552734, "global_step": 249489, "epoch": 2061} {"train_loss": -42.3227424621582, "global_step": 249490, "epoch": 2061} {"train_loss": -43.28350830078125, "global_step": 249491, "epoch": 2061} {"train_loss": -43.10994338989258, "global_step": 249492, "epoch": 2061} {"train_loss": -43.00432586669922, "global_step": 249493, "epoch": 2061} {"train_loss": -42.116424560546875, "global_step": 249494, "epoch": 2061} {"train_loss": -42.55666732788086, "global_step": 249495, "epoch": 2061} {"train_loss": -42.148109436035156, "global_step": 249496, "epoch": 2061} {"train_loss": -42.323097229003906, "global_step": 249497, "epoch": 2061} {"train_loss": -41.36116409301758, "global_step": 249498, "epoch": 2061} {"train_loss": -42.7812385559082, "global_step": 249499, "epoch": 2061} {"train_loss": -40.942378997802734, "global_step": 249500, "epoch": 2061} {"train_loss": -42.34494787799425, "global_step": 249501, "epoch": 2061, "val_loss": 2504445.0} {"train_loss": -40.72898483276367, "global_step": 249502, "epoch": 2062} {"train_loss": -41.66689682006836, "global_step": 249503, "epoch": 2062} {"train_loss": -39.26664733886719, "global_step": 249504, "epoch": 2062} {"train_loss": -40.235713958740234, "global_step": 249505, "epoch": 2062} {"train_loss": -41.099342346191406, "global_step": 249506, "epoch": 2062} {"train_loss": -39.059200286865234, "global_step": 249507, "epoch": 2062} {"train_loss": -34.2046012878418, "global_step": 249508, "epoch": 2062} {"train_loss": -38.253944396972656, "global_step": 249509, "epoch": 2062} {"train_loss": -37.14104080200195, "global_step": 249510, "epoch": 2062} {"train_loss": -39.316688537597656, "global_step": 249511, "epoch": 2062} {"train_loss": -41.012813568115234, "global_step": 249512, "epoch": 2062} {"train_loss": -34.09955978393555, "global_step": 249513, "epoch": 2062} {"train_loss": -37.75849533081055, "global_step": 249514, "epoch": 2062} {"train_loss": -41.79053497314453, "global_step": 249515, "epoch": 2062} {"train_loss": -39.54875183105469, "global_step": 249516, "epoch": 2062} {"train_loss": -38.4599494934082, "global_step": 249517, "epoch": 2062} {"train_loss": -39.59028244018555, "global_step": 249518, "epoch": 2062} {"train_loss": -40.63044357299805, "global_step": 249519, "epoch": 2062} {"train_loss": -38.92560577392578, "global_step": 249520, "epoch": 2062} {"train_loss": -38.286949157714844, "global_step": 249521, "epoch": 2062} {"train_loss": -40.23373031616211, "global_step": 249522, "epoch": 2062} {"train_loss": -38.10439682006836, "global_step": 249523, "epoch": 2062} {"train_loss": -38.824764251708984, "global_step": 249524, "epoch": 2062} {"train_loss": -41.949859619140625, "global_step": 249525, "epoch": 2062} {"train_loss": -41.32122802734375, "global_step": 249526, "epoch": 2062} {"train_loss": -40.850135803222656, "global_step": 249527, "epoch": 2062} {"train_loss": -39.999507904052734, "global_step": 249528, "epoch": 2062} {"train_loss": -41.209651947021484, "global_step": 249529, "epoch": 2062} {"train_loss": -39.8355712890625, "global_step": 249530, "epoch": 2062} {"train_loss": -39.2868766784668, "global_step": 249531, "epoch": 2062} {"train_loss": -38.00167465209961, "global_step": 249532, "epoch": 2062} {"train_loss": -40.20655059814453, "global_step": 249533, "epoch": 2062} {"train_loss": -41.00973892211914, "global_step": 249534, "epoch": 2062} {"train_loss": -41.585208892822266, "global_step": 249535, "epoch": 2062} {"train_loss": -39.98613357543945, "global_step": 249536, "epoch": 2062} {"train_loss": -39.86178970336914, "global_step": 249537, "epoch": 2062} {"train_loss": -40.9195671081543, "global_step": 249538, "epoch": 2062} {"train_loss": -39.91469192504883, "global_step": 249539, "epoch": 2062} {"train_loss": -39.7971305847168, "global_step": 249540, "epoch": 2062} {"train_loss": -40.82735061645508, "global_step": 249541, "epoch": 2062} {"train_loss": -39.047245025634766, "global_step": 249542, "epoch": 2062} {"train_loss": -40.57200241088867, "global_step": 249543, "epoch": 2062} {"train_loss": -40.3073616027832, "global_step": 249544, "epoch": 2062} {"train_loss": -40.757991790771484, "global_step": 249545, "epoch": 2062} {"train_loss": -41.18772506713867, "global_step": 249546, "epoch": 2062} {"train_loss": -40.14360046386719, "global_step": 249547, "epoch": 2062} {"train_loss": -41.9661979675293, "global_step": 249548, "epoch": 2062} {"train_loss": -41.471858978271484, "global_step": 249549, "epoch": 2062} {"train_loss": -40.76306915283203, "global_step": 249550, "epoch": 2062} {"train_loss": -40.60589599609375, "global_step": 249551, "epoch": 2062} {"train_loss": -41.08601760864258, "global_step": 249552, "epoch": 2062} {"train_loss": -39.73747634887695, "global_step": 249553, "epoch": 2062} {"train_loss": -41.655059814453125, "global_step": 249554, "epoch": 2062} {"train_loss": -41.413021087646484, "global_step": 249555, "epoch": 2062} {"train_loss": -40.79265213012695, "global_step": 249556, "epoch": 2062} {"train_loss": -39.876033782958984, "global_step": 249557, "epoch": 2062} {"train_loss": -41.702232360839844, "global_step": 249558, "epoch": 2062} {"train_loss": -42.12563705444336, "global_step": 249559, "epoch": 2062} {"train_loss": -39.87885284423828, "global_step": 249560, "epoch": 2062} {"train_loss": -42.56621170043945, "global_step": 249561, "epoch": 2062} {"train_loss": -41.894344329833984, "global_step": 249562, "epoch": 2062} {"train_loss": -42.364192962646484, "global_step": 249563, "epoch": 2062} {"train_loss": -40.09670639038086, "global_step": 249564, "epoch": 2062} {"train_loss": -40.95991897583008, "global_step": 249565, "epoch": 2062} {"train_loss": -41.51092529296875, "global_step": 249566, "epoch": 2062} {"train_loss": -41.50008773803711, "global_step": 249567, "epoch": 2062} {"train_loss": -42.35444259643555, "global_step": 249568, "epoch": 2062} {"train_loss": -42.24188232421875, "global_step": 249569, "epoch": 2062} {"train_loss": -41.60303497314453, "global_step": 249570, "epoch": 2062} {"train_loss": -40.85589599609375, "global_step": 249571, "epoch": 2062} {"train_loss": -42.54579544067383, "global_step": 249572, "epoch": 2062} {"train_loss": -42.773681640625, "global_step": 249573, "epoch": 2062} {"train_loss": -41.79329299926758, "global_step": 249574, "epoch": 2062} {"train_loss": -41.31800079345703, "global_step": 249575, "epoch": 2062} {"train_loss": -41.48440170288086, "global_step": 249576, "epoch": 2062} {"train_loss": -42.763694763183594, "global_step": 249577, "epoch": 2062} {"train_loss": -42.584774017333984, "global_step": 249578, "epoch": 2062} {"train_loss": -42.973304748535156, "global_step": 249579, "epoch": 2062} {"train_loss": -42.04075241088867, "global_step": 249580, "epoch": 2062} {"train_loss": -42.3940315246582, "global_step": 249581, "epoch": 2062} {"train_loss": -43.070716857910156, "global_step": 249582, "epoch": 2062} {"train_loss": -42.30811309814453, "global_step": 249583, "epoch": 2062} {"train_loss": -43.07985305786133, "global_step": 249584, "epoch": 2062} {"train_loss": -42.55706024169922, "global_step": 249585, "epoch": 2062} {"train_loss": -42.90597152709961, "global_step": 249586, "epoch": 2062} {"train_loss": -42.60652542114258, "global_step": 249587, "epoch": 2062} {"train_loss": -40.70035934448242, "global_step": 249588, "epoch": 2062} {"train_loss": -42.41339874267578, "global_step": 249589, "epoch": 2062} {"train_loss": -41.260528564453125, "global_step": 249590, "epoch": 2062} {"train_loss": -42.32307052612305, "global_step": 249591, "epoch": 2062} {"train_loss": -42.284610748291016, "global_step": 249592, "epoch": 2062} {"train_loss": -42.64325714111328, "global_step": 249593, "epoch": 2062} {"train_loss": -42.93803024291992, "global_step": 249594, "epoch": 2062} {"train_loss": -42.82620620727539, "global_step": 249595, "epoch": 2062} {"train_loss": -43.08888626098633, "global_step": 249596, "epoch": 2062} {"train_loss": -43.139583587646484, "global_step": 249597, "epoch": 2062} {"train_loss": -40.80646514892578, "global_step": 249598, "epoch": 2062} {"train_loss": -42.745182037353516, "global_step": 249599, "epoch": 2062} {"train_loss": -43.431358337402344, "global_step": 249600, "epoch": 2062} {"train_loss": -40.99737548828125, "global_step": 249601, "epoch": 2062} {"train_loss": -43.19855880737305, "global_step": 249602, "epoch": 2062} {"train_loss": -42.30941390991211, "global_step": 249603, "epoch": 2062} {"train_loss": -42.7587890625, "global_step": 249604, "epoch": 2062} {"train_loss": -40.057594299316406, "global_step": 249605, "epoch": 2062} {"train_loss": -42.63751983642578, "global_step": 249606, "epoch": 2062} {"train_loss": -42.46875762939453, "global_step": 249607, "epoch": 2062} {"train_loss": -42.42235565185547, "global_step": 249608, "epoch": 2062} {"train_loss": -42.43535614013672, "global_step": 249609, "epoch": 2062} {"train_loss": -42.67743682861328, "global_step": 249610, "epoch": 2062} {"train_loss": -43.37892150878906, "global_step": 249611, "epoch": 2062} {"train_loss": -41.082923889160156, "global_step": 249612, "epoch": 2062} {"train_loss": -43.02641677856445, "global_step": 249613, "epoch": 2062} {"train_loss": -42.356563568115234, "global_step": 249614, "epoch": 2062} {"train_loss": -42.91476821899414, "global_step": 249615, "epoch": 2062} {"train_loss": -41.913612365722656, "global_step": 249616, "epoch": 2062} {"train_loss": -43.014259338378906, "global_step": 249617, "epoch": 2062} {"train_loss": -42.26776123046875, "global_step": 249618, "epoch": 2062} {"train_loss": -41.9947624206543, "global_step": 249619, "epoch": 2062} {"train_loss": -42.965728759765625, "global_step": 249620, "epoch": 2062} {"train_loss": -42.205013275146484, "global_step": 249621, "epoch": 2062} {"train_loss": -41.15186215235182, "global_step": 249622, "epoch": 2062, "val_loss": 2529013.25} {"train_loss": -42.50373077392578, "global_step": 249623, "epoch": 2063} {"train_loss": -42.578773498535156, "global_step": 249624, "epoch": 2063} {"train_loss": -42.956417083740234, "global_step": 249625, "epoch": 2063} {"train_loss": -42.71287155151367, "global_step": 249626, "epoch": 2063} {"train_loss": -42.884552001953125, "global_step": 249627, "epoch": 2063} {"train_loss": -43.24210739135742, "global_step": 249628, "epoch": 2063} {"train_loss": -41.941192626953125, "global_step": 249629, "epoch": 2063} {"train_loss": -42.771766662597656, "global_step": 249630, "epoch": 2063} {"train_loss": -43.28812789916992, "global_step": 249631, "epoch": 2063} {"train_loss": -43.05779266357422, "global_step": 249632, "epoch": 2063} {"train_loss": -42.86646270751953, "global_step": 249633, "epoch": 2063} {"train_loss": -43.03202438354492, "global_step": 249634, "epoch": 2063} {"train_loss": -42.31534957885742, "global_step": 249635, "epoch": 2063} {"train_loss": -42.6345329284668, "global_step": 249636, "epoch": 2063} {"train_loss": -43.13836669921875, "global_step": 249637, "epoch": 2063} {"train_loss": -41.50947952270508, "global_step": 249638, "epoch": 2063} {"train_loss": -42.592647552490234, "global_step": 249639, "epoch": 2063} {"train_loss": -43.161136627197266, "global_step": 249640, "epoch": 2063} {"train_loss": -42.21653366088867, "global_step": 249641, "epoch": 2063} {"train_loss": -41.81321334838867, "global_step": 249642, "epoch": 2063} {"train_loss": -42.99979782104492, "global_step": 249643, "epoch": 2063} {"train_loss": -43.46635818481445, "global_step": 249644, "epoch": 2063} {"train_loss": -42.792259216308594, "global_step": 249645, "epoch": 2063} {"train_loss": -42.817726135253906, "global_step": 249646, "epoch": 2063} {"train_loss": -43.043212890625, "global_step": 249647, "epoch": 2063} {"train_loss": -42.206695556640625, "global_step": 249648, "epoch": 2063} {"train_loss": -42.649688720703125, "global_step": 249649, "epoch": 2063} {"train_loss": -43.022125244140625, "global_step": 249650, "epoch": 2063} {"train_loss": -42.739498138427734, "global_step": 249651, "epoch": 2063} {"train_loss": -42.97351837158203, "global_step": 249652, "epoch": 2063} {"train_loss": -42.90066146850586, "global_step": 249653, "epoch": 2063} {"train_loss": -42.61374282836914, "global_step": 249654, "epoch": 2063} {"train_loss": -42.14140701293945, "global_step": 249655, "epoch": 2063} {"train_loss": -42.290225982666016, "global_step": 249656, "epoch": 2063} {"train_loss": -43.06283187866211, "global_step": 249657, "epoch": 2063} {"train_loss": -42.67656707763672, "global_step": 249658, "epoch": 2063} {"train_loss": -43.14361572265625, "global_step": 249659, "epoch": 2063} {"train_loss": -43.036991119384766, "global_step": 249660, "epoch": 2063} {"train_loss": -41.72370529174805, "global_step": 249661, "epoch": 2063} {"train_loss": -42.559417724609375, "global_step": 249662, "epoch": 2063} {"train_loss": -42.48366928100586, "global_step": 249663, "epoch": 2063} {"train_loss": -43.05622482299805, "global_step": 249664, "epoch": 2063} {"train_loss": -43.47391891479492, "global_step": 249665, "epoch": 2063} {"train_loss": -42.237911224365234, "global_step": 249666, "epoch": 2063} {"train_loss": -42.895660400390625, "global_step": 249667, "epoch": 2063} {"train_loss": -42.67560577392578, "global_step": 249668, "epoch": 2063} {"train_loss": -42.99420166015625, "global_step": 249669, "epoch": 2063} {"train_loss": -43.44277572631836, "global_step": 249670, "epoch": 2063} {"train_loss": -43.454891204833984, "global_step": 249671, "epoch": 2063} {"train_loss": -43.04201889038086, "global_step": 249672, "epoch": 2063} {"train_loss": -42.77610397338867, "global_step": 249673, "epoch": 2063} {"train_loss": -42.849525451660156, "global_step": 249674, "epoch": 2063} {"train_loss": -42.96784591674805, "global_step": 249675, "epoch": 2063} {"train_loss": -41.260494232177734, "global_step": 249676, "epoch": 2063} {"train_loss": -41.546321868896484, "global_step": 249677, "epoch": 2063} {"train_loss": -41.717315673828125, "global_step": 249678, "epoch": 2063} {"train_loss": -41.163875579833984, "global_step": 249679, "epoch": 2063} {"train_loss": -42.93255615234375, "global_step": 249680, "epoch": 2063} {"train_loss": -42.687801361083984, "global_step": 249681, "epoch": 2063} {"train_loss": -42.750152587890625, "global_step": 249682, "epoch": 2063} {"train_loss": -41.348934173583984, "global_step": 249683, "epoch": 2063} {"train_loss": -39.590702056884766, "global_step": 249684, "epoch": 2063} {"train_loss": -36.52564239501953, "global_step": 249685, "epoch": 2063} {"train_loss": -37.34699630737305, "global_step": 249686, "epoch": 2063} {"train_loss": -40.502803802490234, "global_step": 249687, "epoch": 2063} {"train_loss": -39.571266174316406, "global_step": 249688, "epoch": 2063} {"train_loss": -32.8591194152832, "global_step": 249689, "epoch": 2063} {"train_loss": -37.19634246826172, "global_step": 249690, "epoch": 2063} {"train_loss": -40.060768127441406, "global_step": 249691, "epoch": 2063} {"train_loss": -38.003414154052734, "global_step": 249692, "epoch": 2063} {"train_loss": -39.32769775390625, "global_step": 249693, "epoch": 2063} {"train_loss": -40.715450286865234, "global_step": 249694, "epoch": 2063} {"train_loss": -41.00593185424805, "global_step": 249695, "epoch": 2063} {"train_loss": -41.452266693115234, "global_step": 249696, "epoch": 2063} {"train_loss": -40.60765838623047, "global_step": 249697, "epoch": 2063} {"train_loss": -39.61075210571289, "global_step": 249698, "epoch": 2063} {"train_loss": -41.519996643066406, "global_step": 249699, "epoch": 2063} {"train_loss": -40.34330368041992, "global_step": 249700, "epoch": 2063} {"train_loss": -41.763526916503906, "global_step": 249701, "epoch": 2063} {"train_loss": -41.72761917114258, "global_step": 249702, "epoch": 2063} {"train_loss": -42.033695220947266, "global_step": 249703, "epoch": 2063} {"train_loss": -41.571128845214844, "global_step": 249704, "epoch": 2063} {"train_loss": -41.952789306640625, "global_step": 249705, "epoch": 2063} {"train_loss": -41.81173324584961, "global_step": 249706, "epoch": 2063} {"train_loss": -42.112754821777344, "global_step": 249707, "epoch": 2063} {"train_loss": -41.3387565612793, "global_step": 249708, "epoch": 2063} {"train_loss": -41.48102569580078, "global_step": 249709, "epoch": 2063} {"train_loss": -41.87326431274414, "global_step": 249710, "epoch": 2063} {"train_loss": -41.25222396850586, "global_step": 249711, "epoch": 2063} {"train_loss": -42.26033020019531, "global_step": 249712, "epoch": 2063} {"train_loss": -42.561092376708984, "global_step": 249713, "epoch": 2063} {"train_loss": -42.35665512084961, "global_step": 249714, "epoch": 2063} {"train_loss": -42.348628997802734, "global_step": 249715, "epoch": 2063} {"train_loss": -41.88912582397461, "global_step": 249716, "epoch": 2063} {"train_loss": -41.940494537353516, "global_step": 249717, "epoch": 2063} {"train_loss": -42.49283981323242, "global_step": 249718, "epoch": 2063} {"train_loss": -42.193145751953125, "global_step": 249719, "epoch": 2063} {"train_loss": -42.636234283447266, "global_step": 249720, "epoch": 2063} {"train_loss": -42.000343322753906, "global_step": 249721, "epoch": 2063} {"train_loss": -42.057125091552734, "global_step": 249722, "epoch": 2063} {"train_loss": -42.629554748535156, "global_step": 249723, "epoch": 2063} {"train_loss": -42.33048629760742, "global_step": 249724, "epoch": 2063} {"train_loss": -42.75349807739258, "global_step": 249725, "epoch": 2063} {"train_loss": -42.386226654052734, "global_step": 249726, "epoch": 2063} {"train_loss": -42.566978454589844, "global_step": 249727, "epoch": 2063} {"train_loss": -42.33510208129883, "global_step": 249728, "epoch": 2063} {"train_loss": -42.77693176269531, "global_step": 249729, "epoch": 2063} {"train_loss": -42.177467346191406, "global_step": 249730, "epoch": 2063} {"train_loss": -42.53052520751953, "global_step": 249731, "epoch": 2063} {"train_loss": -42.377071380615234, "global_step": 249732, "epoch": 2063} {"train_loss": -42.765777587890625, "global_step": 249733, "epoch": 2063} {"train_loss": -42.44514465332031, "global_step": 249734, "epoch": 2063} {"train_loss": -42.596309661865234, "global_step": 249735, "epoch": 2063} {"train_loss": -42.433563232421875, "global_step": 249736, "epoch": 2063} {"train_loss": -42.458892822265625, "global_step": 249737, "epoch": 2063} {"train_loss": -42.32251739501953, "global_step": 249738, "epoch": 2063} {"train_loss": -42.96199035644531, "global_step": 249739, "epoch": 2063} {"train_loss": -42.52232360839844, "global_step": 249740, "epoch": 2063} {"train_loss": -42.19221878051758, "global_step": 249741, "epoch": 2063} {"train_loss": -43.21283721923828, "global_step": 249742, "epoch": 2063} {"train_loss": -42.02332466692964, "global_step": 249743, "epoch": 2063, "val_loss": 2537782.25} {"train_loss": -42.74303436279297, "global_step": 249744, "epoch": 2064} {"train_loss": -42.88251495361328, "global_step": 249745, "epoch": 2064} {"train_loss": -43.026851654052734, "global_step": 249746, "epoch": 2064} {"train_loss": -43.42729568481445, "global_step": 249747, "epoch": 2064} {"train_loss": -42.3336181640625, "global_step": 249748, "epoch": 2064} {"train_loss": -43.40328598022461, "global_step": 249749, "epoch": 2064} {"train_loss": -43.03992462158203, "global_step": 249750, "epoch": 2064} {"train_loss": -43.00604248046875, "global_step": 249751, "epoch": 2064} {"train_loss": -43.272918701171875, "global_step": 249752, "epoch": 2064} {"train_loss": -43.052120208740234, "global_step": 249753, "epoch": 2064} {"train_loss": -43.3765983581543, "global_step": 249754, "epoch": 2064} {"train_loss": -42.79863357543945, "global_step": 249755, "epoch": 2064} {"train_loss": -42.97125244140625, "global_step": 249756, "epoch": 2064} {"train_loss": -42.53804016113281, "global_step": 249757, "epoch": 2064} {"train_loss": -43.1818962097168, "global_step": 249758, "epoch": 2064} {"train_loss": -42.6146354675293, "global_step": 249759, "epoch": 2064} {"train_loss": -42.10490798950195, "global_step": 249760, "epoch": 2064} {"train_loss": -42.89980697631836, "global_step": 249761, "epoch": 2064} {"train_loss": -43.09902572631836, "global_step": 249762, "epoch": 2064} {"train_loss": -43.6390495300293, "global_step": 249763, "epoch": 2064} {"train_loss": -43.616817474365234, "global_step": 249764, "epoch": 2064} {"train_loss": -42.90044021606445, "global_step": 249765, "epoch": 2064} {"train_loss": -43.141605377197266, "global_step": 249766, "epoch": 2064} {"train_loss": -43.47434997558594, "global_step": 249767, "epoch": 2064} {"train_loss": -42.86720657348633, "global_step": 249768, "epoch": 2064} {"train_loss": -42.5305061340332, "global_step": 249769, "epoch": 2064} {"train_loss": -42.52176284790039, "global_step": 249770, "epoch": 2064} {"train_loss": -43.41853713989258, "global_step": 249771, "epoch": 2064} {"train_loss": -42.79482650756836, "global_step": 249772, "epoch": 2064} {"train_loss": -43.595611572265625, "global_step": 249773, "epoch": 2064} {"train_loss": -42.172119140625, "global_step": 249774, "epoch": 2064} {"train_loss": -42.69044494628906, "global_step": 249775, "epoch": 2064} {"train_loss": -43.6693229675293, "global_step": 249776, "epoch": 2064} {"train_loss": -43.150054931640625, "global_step": 249777, "epoch": 2064} {"train_loss": -43.5175666809082, "global_step": 249778, "epoch": 2064} {"train_loss": -43.01976776123047, "global_step": 249779, "epoch": 2064} {"train_loss": -43.4068603515625, "global_step": 249780, "epoch": 2064} {"train_loss": -43.2724494934082, "global_step": 249781, "epoch": 2064} {"train_loss": -41.71323776245117, "global_step": 249782, "epoch": 2064} {"train_loss": -37.74849319458008, "global_step": 249783, "epoch": 2064} {"train_loss": -31.731130599975586, "global_step": 249784, "epoch": 2064} {"train_loss": -27.77978515625, "global_step": 249785, "epoch": 2064} {"train_loss": -37.528316497802734, "global_step": 249786, "epoch": 2064} {"train_loss": -41.693294525146484, "global_step": 249787, "epoch": 2064} {"train_loss": -32.37063980102539, "global_step": 249788, "epoch": 2064} {"train_loss": -29.1387882232666, "global_step": 249789, "epoch": 2064} {"train_loss": -41.46669387817383, "global_step": 249790, "epoch": 2064} {"train_loss": -37.18035888671875, "global_step": 249791, "epoch": 2064} {"train_loss": -39.1424446105957, "global_step": 249792, "epoch": 2064} {"train_loss": -40.587764739990234, "global_step": 249793, "epoch": 2064} {"train_loss": -34.970054626464844, "global_step": 249794, "epoch": 2064} {"train_loss": -41.188663482666016, "global_step": 249795, "epoch": 2064} {"train_loss": -37.62763595581055, "global_step": 249796, "epoch": 2064} {"train_loss": -41.525020599365234, "global_step": 249797, "epoch": 2064} {"train_loss": -38.14890670776367, "global_step": 249798, "epoch": 2064} {"train_loss": -41.70267868041992, "global_step": 249799, "epoch": 2064} {"train_loss": -39.22328567504883, "global_step": 249800, "epoch": 2064} {"train_loss": -40.835113525390625, "global_step": 249801, "epoch": 2064} {"train_loss": -40.855098724365234, "global_step": 249802, "epoch": 2064} {"train_loss": -41.77158737182617, "global_step": 249803, "epoch": 2064} {"train_loss": -40.9543571472168, "global_step": 249804, "epoch": 2064} {"train_loss": -42.5438232421875, "global_step": 249805, "epoch": 2064} {"train_loss": -41.92551803588867, "global_step": 249806, "epoch": 2064} {"train_loss": -42.15653610229492, "global_step": 249807, "epoch": 2064} {"train_loss": -41.1834831237793, "global_step": 249808, "epoch": 2064} {"train_loss": -42.74773025512695, "global_step": 249809, "epoch": 2064} {"train_loss": -42.40684127807617, "global_step": 249810, "epoch": 2064} {"train_loss": -42.5926399230957, "global_step": 249811, "epoch": 2064} {"train_loss": -42.58992385864258, "global_step": 249812, "epoch": 2064} {"train_loss": -42.35114669799805, "global_step": 249813, "epoch": 2064} {"train_loss": -42.67140579223633, "global_step": 249814, "epoch": 2064} {"train_loss": -42.486263275146484, "global_step": 249815, "epoch": 2064} {"train_loss": -43.01958084106445, "global_step": 249816, "epoch": 2064} {"train_loss": -42.42091751098633, "global_step": 249817, "epoch": 2064} {"train_loss": -42.98397445678711, "global_step": 249818, "epoch": 2064} {"train_loss": -42.50904083251953, "global_step": 249819, "epoch": 2064} {"train_loss": -43.08235549926758, "global_step": 249820, "epoch": 2064} {"train_loss": -42.7634391784668, "global_step": 249821, "epoch": 2064} {"train_loss": -42.62278366088867, "global_step": 249822, "epoch": 2064} {"train_loss": -43.054229736328125, "global_step": 249823, "epoch": 2064} {"train_loss": -43.02175521850586, "global_step": 249824, "epoch": 2064} {"train_loss": -43.102294921875, "global_step": 249825, "epoch": 2064} {"train_loss": -43.3111457824707, "global_step": 249826, "epoch": 2064} {"train_loss": -42.82902908325195, "global_step": 249827, "epoch": 2064} {"train_loss": -43.08546447753906, "global_step": 249828, "epoch": 2064} {"train_loss": -42.563690185546875, "global_step": 249829, "epoch": 2064} {"train_loss": -43.04823303222656, "global_step": 249830, "epoch": 2064} {"train_loss": -42.84212875366211, "global_step": 249831, "epoch": 2064} {"train_loss": -43.176780700683594, "global_step": 249832, "epoch": 2064} {"train_loss": -42.9444580078125, "global_step": 249833, "epoch": 2064} {"train_loss": -43.19503402709961, "global_step": 249834, "epoch": 2064} {"train_loss": -43.02185821533203, "global_step": 249835, "epoch": 2064} {"train_loss": -43.27312469482422, "global_step": 249836, "epoch": 2064} {"train_loss": -43.27030563354492, "global_step": 249837, "epoch": 2064} {"train_loss": -43.2504997253418, "global_step": 249838, "epoch": 2064} {"train_loss": -42.98983383178711, "global_step": 249839, "epoch": 2064} {"train_loss": -43.609928131103516, "global_step": 249840, "epoch": 2064} {"train_loss": -43.22496795654297, "global_step": 249841, "epoch": 2064} {"train_loss": -43.717411041259766, "global_step": 249842, "epoch": 2064} {"train_loss": -43.5438346862793, "global_step": 249843, "epoch": 2064} {"train_loss": -43.146827697753906, "global_step": 249844, "epoch": 2064} {"train_loss": -43.127113342285156, "global_step": 249845, "epoch": 2064} {"train_loss": -43.53107452392578, "global_step": 249846, "epoch": 2064} {"train_loss": -43.59968185424805, "global_step": 249847, "epoch": 2064} {"train_loss": -44.10589599609375, "global_step": 249848, "epoch": 2064} {"train_loss": -43.54834747314453, "global_step": 249849, "epoch": 2064} {"train_loss": -43.75434494018555, "global_step": 249850, "epoch": 2064} {"train_loss": -43.549747467041016, "global_step": 249851, "epoch": 2064} {"train_loss": -44.05263900756836, "global_step": 249852, "epoch": 2064} {"train_loss": -43.0268669128418, "global_step": 249853, "epoch": 2064} {"train_loss": -43.7667350769043, "global_step": 249854, "epoch": 2064} {"train_loss": -43.68517303466797, "global_step": 249855, "epoch": 2064} {"train_loss": -43.765377044677734, "global_step": 249856, "epoch": 2064} {"train_loss": -43.62520980834961, "global_step": 249857, "epoch": 2064} {"train_loss": -43.118221282958984, "global_step": 249858, "epoch": 2064} {"train_loss": -43.7690544128418, "global_step": 249859, "epoch": 2064} {"train_loss": -43.50334548950195, "global_step": 249860, "epoch": 2064} {"train_loss": -43.690528869628906, "global_step": 249861, "epoch": 2064} {"train_loss": -43.85285568237305, "global_step": 249862, "epoch": 2064} {"train_loss": -43.31728744506836, "global_step": 249863, "epoch": 2064} {"train_loss": -42.133511314707356, "global_step": 249864, "epoch": 2064, "val_loss": 2569334.0} {"train_loss": -43.01161193847656, "global_step": 249865, "epoch": 2065} {"train_loss": -43.67226028442383, "global_step": 249866, "epoch": 2065} {"train_loss": -43.65653610229492, "global_step": 249867, "epoch": 2065} {"train_loss": -43.70427322387695, "global_step": 249868, "epoch": 2065} {"train_loss": -43.59642791748047, "global_step": 249869, "epoch": 2065} {"train_loss": -43.89962387084961, "global_step": 249870, "epoch": 2065} {"train_loss": -43.96734619140625, "global_step": 249871, "epoch": 2065} {"train_loss": -43.143550872802734, "global_step": 249872, "epoch": 2065} {"train_loss": -42.90993881225586, "global_step": 249873, "epoch": 2065} {"train_loss": -42.9195556640625, "global_step": 249874, "epoch": 2065} {"train_loss": -43.437110900878906, "global_step": 249875, "epoch": 2065} {"train_loss": -43.37387466430664, "global_step": 249876, "epoch": 2065} {"train_loss": -43.42755126953125, "global_step": 249877, "epoch": 2065} {"train_loss": -43.218833923339844, "global_step": 249878, "epoch": 2065} {"train_loss": -42.44709014892578, "global_step": 249879, "epoch": 2065} {"train_loss": -42.43947219848633, "global_step": 249880, "epoch": 2065} {"train_loss": -42.7144889831543, "global_step": 249881, "epoch": 2065} {"train_loss": -41.89799118041992, "global_step": 249882, "epoch": 2065} {"train_loss": -40.48341751098633, "global_step": 249883, "epoch": 2065} {"train_loss": -37.07300567626953, "global_step": 249884, "epoch": 2065} {"train_loss": -40.256927490234375, "global_step": 249885, "epoch": 2065} {"train_loss": -39.35960006713867, "global_step": 249886, "epoch": 2065} {"train_loss": -40.22407913208008, "global_step": 249887, "epoch": 2065} {"train_loss": -41.743595123291016, "global_step": 249888, "epoch": 2065} {"train_loss": -40.356666564941406, "global_step": 249889, "epoch": 2065} {"train_loss": -41.12002182006836, "global_step": 249890, "epoch": 2065} {"train_loss": -41.260372161865234, "global_step": 249891, "epoch": 2065} {"train_loss": -41.617916107177734, "global_step": 249892, "epoch": 2065} {"train_loss": -41.15446090698242, "global_step": 249893, "epoch": 2065} {"train_loss": -41.316986083984375, "global_step": 249894, "epoch": 2065} {"train_loss": -41.05366897583008, "global_step": 249895, "epoch": 2065} {"train_loss": -41.439056396484375, "global_step": 249896, "epoch": 2065} {"train_loss": -41.30934143066406, "global_step": 249897, "epoch": 2065} {"train_loss": -39.69816207885742, "global_step": 249898, "epoch": 2065} {"train_loss": -37.821800231933594, "global_step": 249899, "epoch": 2065} {"train_loss": -41.3631706237793, "global_step": 249900, "epoch": 2065} {"train_loss": -42.47809600830078, "global_step": 249901, "epoch": 2065} {"train_loss": -38.01081085205078, "global_step": 249902, "epoch": 2065} {"train_loss": -38.97126007080078, "global_step": 249903, "epoch": 2065} {"train_loss": -41.80691909790039, "global_step": 249904, "epoch": 2065} {"train_loss": -37.74225997924805, "global_step": 249905, "epoch": 2065} {"train_loss": -41.470252990722656, "global_step": 249906, "epoch": 2065} {"train_loss": -39.67230987548828, "global_step": 249907, "epoch": 2065} {"train_loss": -39.32453536987305, "global_step": 249908, "epoch": 2065} {"train_loss": -41.23339080810547, "global_step": 249909, "epoch": 2065} {"train_loss": -40.677391052246094, "global_step": 249910, "epoch": 2065} {"train_loss": -41.15537643432617, "global_step": 249911, "epoch": 2065} {"train_loss": -39.348751068115234, "global_step": 249912, "epoch": 2065} {"train_loss": -42.444923400878906, "global_step": 249913, "epoch": 2065} {"train_loss": -40.07038879394531, "global_step": 249914, "epoch": 2065} {"train_loss": -42.12030792236328, "global_step": 249915, "epoch": 2065} {"train_loss": -41.60258102416992, "global_step": 249916, "epoch": 2065} {"train_loss": -42.323280334472656, "global_step": 249917, "epoch": 2065} {"train_loss": -41.62253952026367, "global_step": 249918, "epoch": 2065} {"train_loss": -41.81193542480469, "global_step": 249919, "epoch": 2065} {"train_loss": -42.24098587036133, "global_step": 249920, "epoch": 2065} {"train_loss": -41.91105270385742, "global_step": 249921, "epoch": 2065} {"train_loss": -41.98902130126953, "global_step": 249922, "epoch": 2065} {"train_loss": -40.952125549316406, "global_step": 249923, "epoch": 2065} {"train_loss": -42.055233001708984, "global_step": 249924, "epoch": 2065} {"train_loss": -41.87360382080078, "global_step": 249925, "epoch": 2065} {"train_loss": -41.994258880615234, "global_step": 249926, "epoch": 2065} {"train_loss": -41.8723258972168, "global_step": 249927, "epoch": 2065} {"train_loss": -42.500640869140625, "global_step": 249928, "epoch": 2065} {"train_loss": -42.16892623901367, "global_step": 249929, "epoch": 2065} {"train_loss": -42.69484329223633, "global_step": 249930, "epoch": 2065} {"train_loss": -42.940093994140625, "global_step": 249931, "epoch": 2065} {"train_loss": -43.0928840637207, "global_step": 249932, "epoch": 2065} {"train_loss": -42.52288055419922, "global_step": 249933, "epoch": 2065} {"train_loss": -42.726966857910156, "global_step": 249934, "epoch": 2065} {"train_loss": -42.50336456298828, "global_step": 249935, "epoch": 2065} {"train_loss": -42.718421936035156, "global_step": 249936, "epoch": 2065} {"train_loss": -42.92068099975586, "global_step": 249937, "epoch": 2065} {"train_loss": -42.93489074707031, "global_step": 249938, "epoch": 2065} {"train_loss": -42.78126907348633, "global_step": 249939, "epoch": 2065} {"train_loss": -42.896419525146484, "global_step": 249940, "epoch": 2065} {"train_loss": -42.533329010009766, "global_step": 249941, "epoch": 2065} {"train_loss": -43.25225830078125, "global_step": 249942, "epoch": 2065} {"train_loss": -42.968597412109375, "global_step": 249943, "epoch": 2065} {"train_loss": -43.00973129272461, "global_step": 249944, "epoch": 2065} {"train_loss": -42.59841537475586, "global_step": 249945, "epoch": 2065} {"train_loss": -43.220245361328125, "global_step": 249946, "epoch": 2065} {"train_loss": -42.9943733215332, "global_step": 249947, "epoch": 2065} {"train_loss": -43.10190963745117, "global_step": 249948, "epoch": 2065} {"train_loss": -42.814144134521484, "global_step": 249949, "epoch": 2065} {"train_loss": -43.25592803955078, "global_step": 249950, "epoch": 2065} {"train_loss": -43.12491989135742, "global_step": 249951, "epoch": 2065} {"train_loss": -43.09202194213867, "global_step": 249952, "epoch": 2065} {"train_loss": -43.38765335083008, "global_step": 249953, "epoch": 2065} {"train_loss": -43.44203567504883, "global_step": 249954, "epoch": 2065} {"train_loss": -43.29846954345703, "global_step": 249955, "epoch": 2065} {"train_loss": -43.67279815673828, "global_step": 249956, "epoch": 2065} {"train_loss": -43.14450454711914, "global_step": 249957, "epoch": 2065} {"train_loss": -43.34754180908203, "global_step": 249958, "epoch": 2065} {"train_loss": -43.550140380859375, "global_step": 249959, "epoch": 2065} {"train_loss": -42.61608123779297, "global_step": 249960, "epoch": 2065} {"train_loss": -43.01581954956055, "global_step": 249961, "epoch": 2065} {"train_loss": -43.6547966003418, "global_step": 249962, "epoch": 2065} {"train_loss": -43.139732360839844, "global_step": 249963, "epoch": 2065} {"train_loss": -43.285552978515625, "global_step": 249964, "epoch": 2065} {"train_loss": -43.50936508178711, "global_step": 249965, "epoch": 2065} {"train_loss": -43.146240234375, "global_step": 249966, "epoch": 2065} {"train_loss": -42.81171798706055, "global_step": 249967, "epoch": 2065} {"train_loss": -42.587703704833984, "global_step": 249968, "epoch": 2065} {"train_loss": -42.888648986816406, "global_step": 249969, "epoch": 2065} {"train_loss": -43.45426559448242, "global_step": 249970, "epoch": 2065} {"train_loss": -43.2961540222168, "global_step": 249971, "epoch": 2065} {"train_loss": -42.88582992553711, "global_step": 249972, "epoch": 2065} {"train_loss": -41.93149948120117, "global_step": 249973, "epoch": 2065} {"train_loss": -40.93195724487305, "global_step": 249974, "epoch": 2065} {"train_loss": -41.62908935546875, "global_step": 249975, "epoch": 2065} {"train_loss": -42.655189514160156, "global_step": 249976, "epoch": 2065} {"train_loss": -40.88747024536133, "global_step": 249977, "epoch": 2065} {"train_loss": -41.274452209472656, "global_step": 249978, "epoch": 2065} {"train_loss": -41.2524528503418, "global_step": 249979, "epoch": 2065} {"train_loss": -40.85000228881836, "global_step": 249980, "epoch": 2065} {"train_loss": -41.84236145019531, "global_step": 249981, "epoch": 2065} {"train_loss": -42.48151779174805, "global_step": 249982, "epoch": 2065} {"train_loss": -40.91545486450195, "global_step": 249983, "epoch": 2065} {"train_loss": -40.24020004272461, "global_step": 249984, "epoch": 2065} {"train_loss": -42.06369150965667, "global_step": 249985, "epoch": 2065, "val_loss": 2541905.0} {"train_loss": -43.42079162597656, "global_step": 249986, "epoch": 2066} {"train_loss": -42.54098892211914, "global_step": 249987, "epoch": 2066} {"train_loss": -41.94486618041992, "global_step": 249988, "epoch": 2066} {"train_loss": -42.06165313720703, "global_step": 249989, "epoch": 2066} {"train_loss": -42.765621185302734, "global_step": 249990, "epoch": 2066} {"train_loss": -42.27456283569336, "global_step": 249991, "epoch": 2066} {"train_loss": -41.854591369628906, "global_step": 249992, "epoch": 2066} {"train_loss": -42.965694427490234, "global_step": 249993, "epoch": 2066} {"train_loss": -42.5161018371582, "global_step": 249994, "epoch": 2066} {"train_loss": -42.8463249206543, "global_step": 249995, "epoch": 2066} {"train_loss": -42.939735412597656, "global_step": 249996, "epoch": 2066} {"train_loss": -42.52751159667969, "global_step": 249997, "epoch": 2066} {"train_loss": -42.8483772277832, "global_step": 249998, "epoch": 2066} {"train_loss": -42.649322509765625, "global_step": 249999, "epoch": 2066} {"train_loss": -42.377342224121094, "global_step": 250000, "epoch": 2066} {"train_loss": -41.853302001953125, "global_step": 250001, "epoch": 2066} {"train_loss": -42.86139678955078, "global_step": 250002, "epoch": 2066} {"train_loss": -39.84279251098633, "global_step": 250003, "epoch": 2066} {"train_loss": -43.430477142333984, "global_step": 250004, "epoch": 2066} {"train_loss": -42.07550811767578, "global_step": 250005, "epoch": 2066} {"train_loss": -42.703548431396484, "global_step": 250006, "epoch": 2066} {"train_loss": -43.231136322021484, "global_step": 250007, "epoch": 2066} {"train_loss": -43.04877471923828, "global_step": 250008, "epoch": 2066} {"train_loss": -42.73423385620117, "global_step": 250009, "epoch": 2066} {"train_loss": -43.19768524169922, "global_step": 250010, "epoch": 2066} {"train_loss": -43.090023040771484, "global_step": 250011, "epoch": 2066} {"train_loss": -43.2823486328125, "global_step": 250012, "epoch": 2066} {"train_loss": -42.67403030395508, "global_step": 250013, "epoch": 2066} {"train_loss": -41.74509811401367, "global_step": 250014, "epoch": 2066} {"train_loss": -43.66795349121094, "global_step": 250015, "epoch": 2066} {"train_loss": -42.87165451049805, "global_step": 250016, "epoch": 2066} {"train_loss": -42.21601486206055, "global_step": 250017, "epoch": 2066} {"train_loss": -43.067665100097656, "global_step": 250018, "epoch": 2066} {"train_loss": -43.44118881225586, "global_step": 250019, "epoch": 2066} {"train_loss": -42.6623649597168, "global_step": 250020, "epoch": 2066} {"train_loss": -43.206424713134766, "global_step": 250021, "epoch": 2066} {"train_loss": -43.48894500732422, "global_step": 250022, "epoch": 2066} {"train_loss": -43.46556091308594, "global_step": 250023, "epoch": 2066} {"train_loss": -43.63667297363281, "global_step": 250024, "epoch": 2066} {"train_loss": -43.353797912597656, "global_step": 250025, "epoch": 2066} {"train_loss": -43.617591857910156, "global_step": 250026, "epoch": 2066} {"train_loss": -43.536373138427734, "global_step": 250027, "epoch": 2066} {"train_loss": -43.045135498046875, "global_step": 250028, "epoch": 2066} {"train_loss": -43.54948806762695, "global_step": 250029, "epoch": 2066} {"train_loss": -42.986236572265625, "global_step": 250030, "epoch": 2066} {"train_loss": -43.380950927734375, "global_step": 250031, "epoch": 2066} {"train_loss": -42.97761917114258, "global_step": 250032, "epoch": 2066} {"train_loss": -42.92083740234375, "global_step": 250033, "epoch": 2066} {"train_loss": -41.75539016723633, "global_step": 250034, "epoch": 2066} {"train_loss": -42.45832061767578, "global_step": 250035, "epoch": 2066} {"train_loss": -42.898521423339844, "global_step": 250036, "epoch": 2066} {"train_loss": -42.7763557434082, "global_step": 250037, "epoch": 2066} {"train_loss": -43.8159065246582, "global_step": 250038, "epoch": 2066} {"train_loss": -43.55910110473633, "global_step": 250039, "epoch": 2066} {"train_loss": -43.547603607177734, "global_step": 250040, "epoch": 2066} {"train_loss": -43.536258697509766, "global_step": 250041, "epoch": 2066} {"train_loss": -43.53253173828125, "global_step": 250042, "epoch": 2066} {"train_loss": -41.305416107177734, "global_step": 250043, "epoch": 2066} {"train_loss": -42.7215461730957, "global_step": 250044, "epoch": 2066} {"train_loss": -44.043495178222656, "global_step": 250045, "epoch": 2066} {"train_loss": -43.66475296020508, "global_step": 250046, "epoch": 2066} {"train_loss": -35.03753662109375, "global_step": 250047, "epoch": 2066} {"train_loss": -42.05830001831055, "global_step": 250048, "epoch": 2066} {"train_loss": -37.51599884033203, "global_step": 250049, "epoch": 2066} {"train_loss": -42.65542984008789, "global_step": 250050, "epoch": 2066} {"train_loss": -39.44666290283203, "global_step": 250051, "epoch": 2066} {"train_loss": -27.09700584411621, "global_step": 250052, "epoch": 2066} {"train_loss": -30.031858444213867, "global_step": 250053, "epoch": 2066} {"train_loss": -30.58262062072754, "global_step": 250054, "epoch": 2066} {"train_loss": -37.87758255004883, "global_step": 250055, "epoch": 2066} {"train_loss": -39.251251220703125, "global_step": 250056, "epoch": 2066} {"train_loss": -34.89313507080078, "global_step": 250057, "epoch": 2066} {"train_loss": -20.31240463256836, "global_step": 250058, "epoch": 2066} {"train_loss": -37.27667999267578, "global_step": 250059, "epoch": 2066} {"train_loss": -33.45941162109375, "global_step": 250060, "epoch": 2066} {"train_loss": -12.275142669677734, "global_step": 250061, "epoch": 2066} {"train_loss": -37.23415756225586, "global_step": 250062, "epoch": 2066} {"train_loss": -18.359432220458984, "global_step": 250063, "epoch": 2066} {"train_loss": -32.596641540527344, "global_step": 250064, "epoch": 2066} {"train_loss": -33.20801544189453, "global_step": 250065, "epoch": 2066} {"train_loss": -29.15250587463379, "global_step": 250066, "epoch": 2066} {"train_loss": -26.632770538330078, "global_step": 250067, "epoch": 2066} {"train_loss": -31.55866050720215, "global_step": 250068, "epoch": 2066} {"train_loss": -32.83561325073242, "global_step": 250069, "epoch": 2066} {"train_loss": -33.40169906616211, "global_step": 250070, "epoch": 2066} {"train_loss": -33.00262451171875, "global_step": 250071, "epoch": 2066} {"train_loss": -32.706260681152344, "global_step": 250072, "epoch": 2066} {"train_loss": -32.858253479003906, "global_step": 250073, "epoch": 2066} {"train_loss": -31.898761749267578, "global_step": 250074, "epoch": 2066} {"train_loss": -34.041744232177734, "global_step": 250075, "epoch": 2066} {"train_loss": -37.515602111816406, "global_step": 250076, "epoch": 2066} {"train_loss": -35.66429901123047, "global_step": 250077, "epoch": 2066} {"train_loss": -35.12736892700195, "global_step": 250078, "epoch": 2066} {"train_loss": -35.65964889526367, "global_step": 250079, "epoch": 2066} {"train_loss": -36.142398834228516, "global_step": 250080, "epoch": 2066} {"train_loss": -39.333152770996094, "global_step": 250081, "epoch": 2066} {"train_loss": -35.17611312866211, "global_step": 250082, "epoch": 2066} {"train_loss": -38.8648567199707, "global_step": 250083, "epoch": 2066} {"train_loss": -35.94022750854492, "global_step": 250084, "epoch": 2066} {"train_loss": -39.33708572387695, "global_step": 250085, "epoch": 2066} {"train_loss": -38.45109176635742, "global_step": 250086, "epoch": 2066} {"train_loss": -38.43935775756836, "global_step": 250087, "epoch": 2066} {"train_loss": -37.202083587646484, "global_step": 250088, "epoch": 2066} {"train_loss": -39.3804817199707, "global_step": 250089, "epoch": 2066} {"train_loss": -37.551631927490234, "global_step": 250090, "epoch": 2066} {"train_loss": -38.86933517456055, "global_step": 250091, "epoch": 2066} {"train_loss": -38.66352081298828, "global_step": 250092, "epoch": 2066} {"train_loss": -39.38624954223633, "global_step": 250093, "epoch": 2066} {"train_loss": -38.716636657714844, "global_step": 250094, "epoch": 2066} {"train_loss": -37.07040786743164, "global_step": 250095, "epoch": 2066} {"train_loss": -38.62596130371094, "global_step": 250096, "epoch": 2066} {"train_loss": -36.06300735473633, "global_step": 250097, "epoch": 2066} {"train_loss": -38.73330307006836, "global_step": 250098, "epoch": 2066} {"train_loss": -39.285072326660156, "global_step": 250099, "epoch": 2066} {"train_loss": -39.91807556152344, "global_step": 250100, "epoch": 2066} {"train_loss": -40.11692428588867, "global_step": 250101, "epoch": 2066} {"train_loss": -39.69607162475586, "global_step": 250102, "epoch": 2066} {"train_loss": -39.697906494140625, "global_step": 250103, "epoch": 2066} {"train_loss": -39.09632873535156, "global_step": 250104, "epoch": 2066} {"train_loss": -39.27535629272461, "global_step": 250105, "epoch": 2066} {"train_loss": -39.146506207048404, "global_step": 250106, "epoch": 2066, "val_loss": 2597508.75} {"train_loss": -39.035499572753906, "global_step": 250107, "epoch": 2067} {"train_loss": -39.694122314453125, "global_step": 250108, "epoch": 2067} {"train_loss": -39.33010482788086, "global_step": 250109, "epoch": 2067} {"train_loss": -40.408538818359375, "global_step": 250110, "epoch": 2067} {"train_loss": -40.425601959228516, "global_step": 250111, "epoch": 2067} {"train_loss": -39.05513381958008, "global_step": 250112, "epoch": 2067} {"train_loss": -39.15625762939453, "global_step": 250113, "epoch": 2067} {"train_loss": -39.61776351928711, "global_step": 250114, "epoch": 2067} {"train_loss": -39.2784423828125, "global_step": 250115, "epoch": 2067} {"train_loss": -40.046085357666016, "global_step": 250116, "epoch": 2067} {"train_loss": -40.62531661987305, "global_step": 250117, "epoch": 2067} {"train_loss": -40.447914123535156, "global_step": 250118, "epoch": 2067} {"train_loss": -40.2825927734375, "global_step": 250119, "epoch": 2067} {"train_loss": -40.2686767578125, "global_step": 250120, "epoch": 2067} {"train_loss": -40.14327621459961, "global_step": 250121, "epoch": 2067} {"train_loss": -40.89030838012695, "global_step": 250122, "epoch": 2067} {"train_loss": -40.28670120239258, "global_step": 250123, "epoch": 2067} {"train_loss": -40.67672348022461, "global_step": 250124, "epoch": 2067} {"train_loss": -40.68984603881836, "global_step": 250125, "epoch": 2067} {"train_loss": -40.80012893676758, "global_step": 250126, "epoch": 2067} {"train_loss": -40.85524368286133, "global_step": 250127, "epoch": 2067} {"train_loss": -41.16835021972656, "global_step": 250128, "epoch": 2067} {"train_loss": -41.03044891357422, "global_step": 250129, "epoch": 2067} {"train_loss": -41.32731628417969, "global_step": 250130, "epoch": 2067} {"train_loss": -40.648250579833984, "global_step": 250131, "epoch": 2067} {"train_loss": -40.205780029296875, "global_step": 250132, "epoch": 2067} {"train_loss": -41.3096809387207, "global_step": 250133, "epoch": 2067} {"train_loss": -41.2567138671875, "global_step": 250134, "epoch": 2067} {"train_loss": -41.1208610534668, "global_step": 250135, "epoch": 2067} {"train_loss": -41.24219512939453, "global_step": 250136, "epoch": 2067} {"train_loss": -41.36627960205078, "global_step": 250137, "epoch": 2067} {"train_loss": -41.40962219238281, "global_step": 250138, "epoch": 2067} {"train_loss": -41.248939514160156, "global_step": 250139, "epoch": 2067} {"train_loss": -41.6451301574707, "global_step": 250140, "epoch": 2067} {"train_loss": -41.24619674682617, "global_step": 250141, "epoch": 2067} {"train_loss": -40.916236877441406, "global_step": 250142, "epoch": 2067} {"train_loss": -41.5890998840332, "global_step": 250143, "epoch": 2067} {"train_loss": -40.6395263671875, "global_step": 250144, "epoch": 2067} {"train_loss": -42.010990142822266, "global_step": 250145, "epoch": 2067} {"train_loss": -41.05196762084961, "global_step": 250146, "epoch": 2067} {"train_loss": -40.74723434448242, "global_step": 250147, "epoch": 2067} {"train_loss": -41.285499572753906, "global_step": 250148, "epoch": 2067} {"train_loss": -41.270484924316406, "global_step": 250149, "epoch": 2067} {"train_loss": -41.15301513671875, "global_step": 250150, "epoch": 2067} {"train_loss": -41.67478561401367, "global_step": 250151, "epoch": 2067} {"train_loss": -41.910335540771484, "global_step": 250152, "epoch": 2067} {"train_loss": -41.84525680541992, "global_step": 250153, "epoch": 2067} {"train_loss": -40.66465759277344, "global_step": 250154, "epoch": 2067} {"train_loss": -41.97341537475586, "global_step": 250155, "epoch": 2067} {"train_loss": -41.38967514038086, "global_step": 250156, "epoch": 2067} {"train_loss": -42.43769454956055, "global_step": 250157, "epoch": 2067} {"train_loss": -42.13459396362305, "global_step": 250158, "epoch": 2067} {"train_loss": -41.46649932861328, "global_step": 250159, "epoch": 2067} {"train_loss": -41.29989242553711, "global_step": 250160, "epoch": 2067} {"train_loss": -41.1533088684082, "global_step": 250161, "epoch": 2067} {"train_loss": -41.75748825073242, "global_step": 250162, "epoch": 2067} {"train_loss": -42.965919494628906, "global_step": 250163, "epoch": 2067} {"train_loss": -41.75386428833008, "global_step": 250164, "epoch": 2067} {"train_loss": -42.0275993347168, "global_step": 250165, "epoch": 2067} {"train_loss": -40.735530853271484, "global_step": 250166, "epoch": 2067} {"train_loss": -42.263187408447266, "global_step": 250167, "epoch": 2067} {"train_loss": -40.896114349365234, "global_step": 250168, "epoch": 2067} {"train_loss": -41.41310501098633, "global_step": 250169, "epoch": 2067} {"train_loss": -41.422080993652344, "global_step": 250170, "epoch": 2067} {"train_loss": -42.4084358215332, "global_step": 250171, "epoch": 2067} {"train_loss": -42.17367172241211, "global_step": 250172, "epoch": 2067} {"train_loss": -41.90278244018555, "global_step": 250173, "epoch": 2067} {"train_loss": -41.96635818481445, "global_step": 250174, "epoch": 2067} {"train_loss": -42.35266876220703, "global_step": 250175, "epoch": 2067} {"train_loss": -41.910743713378906, "global_step": 250176, "epoch": 2067} {"train_loss": -42.753841400146484, "global_step": 250177, "epoch": 2067} {"train_loss": -42.15755844116211, "global_step": 250178, "epoch": 2067} {"train_loss": -42.4001579284668, "global_step": 250179, "epoch": 2067} {"train_loss": -41.57694625854492, "global_step": 250180, "epoch": 2067} {"train_loss": -42.70382308959961, "global_step": 250181, "epoch": 2067} {"train_loss": -42.02431869506836, "global_step": 250182, "epoch": 2067} {"train_loss": -42.039466857910156, "global_step": 250183, "epoch": 2067} {"train_loss": -43.058712005615234, "global_step": 250184, "epoch": 2067} {"train_loss": -42.976409912109375, "global_step": 250185, "epoch": 2067} {"train_loss": -42.138370513916016, "global_step": 250186, "epoch": 2067} {"train_loss": -41.81193923950195, "global_step": 250187, "epoch": 2067} {"train_loss": -43.16556930541992, "global_step": 250188, "epoch": 2067} {"train_loss": -43.21318054199219, "global_step": 250189, "epoch": 2067} {"train_loss": -41.53001022338867, "global_step": 250190, "epoch": 2067} {"train_loss": -40.923770904541016, "global_step": 250191, "epoch": 2067} {"train_loss": -42.25570297241211, "global_step": 250192, "epoch": 2067} {"train_loss": -42.03248977661133, "global_step": 250193, "epoch": 2067} {"train_loss": -42.753482818603516, "global_step": 250194, "epoch": 2067} {"train_loss": -41.716583251953125, "global_step": 250195, "epoch": 2067} {"train_loss": -42.86252975463867, "global_step": 250196, "epoch": 2067} {"train_loss": -42.5000114440918, "global_step": 250197, "epoch": 2067} {"train_loss": -41.83900833129883, "global_step": 250198, "epoch": 2067} {"train_loss": -42.99856948852539, "global_step": 250199, "epoch": 2067} {"train_loss": -42.78339767456055, "global_step": 250200, "epoch": 2067} {"train_loss": -42.87258529663086, "global_step": 250201, "epoch": 2067} {"train_loss": -42.72065353393555, "global_step": 250202, "epoch": 2067} {"train_loss": -42.73305130004883, "global_step": 250203, "epoch": 2067} {"train_loss": -42.735382080078125, "global_step": 250204, "epoch": 2067} {"train_loss": -42.61600875854492, "global_step": 250205, "epoch": 2067} {"train_loss": -42.274478912353516, "global_step": 250206, "epoch": 2067} {"train_loss": -42.6798210144043, "global_step": 250207, "epoch": 2067} {"train_loss": -41.70171356201172, "global_step": 250208, "epoch": 2067} {"train_loss": -42.746883392333984, "global_step": 250209, "epoch": 2067} {"train_loss": -42.347023010253906, "global_step": 250210, "epoch": 2067} {"train_loss": -42.73154830932617, "global_step": 250211, "epoch": 2067} {"train_loss": -42.948787689208984, "global_step": 250212, "epoch": 2067} {"train_loss": -42.75521469116211, "global_step": 250213, "epoch": 2067} {"train_loss": -42.87083053588867, "global_step": 250214, "epoch": 2067} {"train_loss": -42.636287689208984, "global_step": 250215, "epoch": 2067} {"train_loss": -41.45620346069336, "global_step": 250216, "epoch": 2067} {"train_loss": -42.19139862060547, "global_step": 250217, "epoch": 2067} {"train_loss": -41.23067855834961, "global_step": 250218, "epoch": 2067} {"train_loss": -41.61373519897461, "global_step": 250219, "epoch": 2067} {"train_loss": -41.3655891418457, "global_step": 250220, "epoch": 2067} {"train_loss": -39.871402740478516, "global_step": 250221, "epoch": 2067} {"train_loss": -40.54598617553711, "global_step": 250222, "epoch": 2067} {"train_loss": -39.262939453125, "global_step": 250223, "epoch": 2067} {"train_loss": -40.1431999206543, "global_step": 250224, "epoch": 2067} {"train_loss": -38.5556755065918, "global_step": 250225, "epoch": 2067} {"train_loss": -40.56142807006836, "global_step": 250226, "epoch": 2067} {"train_loss": -41.45416943889019, "global_step": 250227, "epoch": 2067, "val_loss": 2660432.25} {"train_loss": -37.29960250854492, "global_step": 250228, "epoch": 2068} {"train_loss": -41.81365203857422, "global_step": 250229, "epoch": 2068} {"train_loss": -38.12565612792969, "global_step": 250230, "epoch": 2068} {"train_loss": -41.668540954589844, "global_step": 250231, "epoch": 2068} {"train_loss": -38.2235221862793, "global_step": 250232, "epoch": 2068} {"train_loss": -41.82392120361328, "global_step": 250233, "epoch": 2068} {"train_loss": -40.12347412109375, "global_step": 250234, "epoch": 2068} {"train_loss": -40.58051681518555, "global_step": 250235, "epoch": 2068} {"train_loss": -40.893672943115234, "global_step": 250236, "epoch": 2068} {"train_loss": -40.584754943847656, "global_step": 250237, "epoch": 2068} {"train_loss": -41.83253860473633, "global_step": 250238, "epoch": 2068} {"train_loss": -39.015132904052734, "global_step": 250239, "epoch": 2068} {"train_loss": -41.29541015625, "global_step": 250240, "epoch": 2068} {"train_loss": -41.11830139160156, "global_step": 250241, "epoch": 2068} {"train_loss": -39.768611907958984, "global_step": 250242, "epoch": 2068} {"train_loss": -41.55352783203125, "global_step": 250243, "epoch": 2068} {"train_loss": -39.18677520751953, "global_step": 250244, "epoch": 2068} {"train_loss": -40.32381820678711, "global_step": 250245, "epoch": 2068} {"train_loss": -40.300514221191406, "global_step": 250246, "epoch": 2068} {"train_loss": -39.926002502441406, "global_step": 250247, "epoch": 2068} {"train_loss": -41.4990234375, "global_step": 250248, "epoch": 2068} {"train_loss": -40.711517333984375, "global_step": 250249, "epoch": 2068} {"train_loss": -39.717830657958984, "global_step": 250250, "epoch": 2068} {"train_loss": -41.9465217590332, "global_step": 250251, "epoch": 2068} {"train_loss": -40.242061614990234, "global_step": 250252, "epoch": 2068} {"train_loss": -41.462215423583984, "global_step": 250253, "epoch": 2068} {"train_loss": -41.35744094848633, "global_step": 250254, "epoch": 2068} {"train_loss": -41.6439208984375, "global_step": 250255, "epoch": 2068} {"train_loss": -39.80630111694336, "global_step": 250256, "epoch": 2068} {"train_loss": -42.1919059753418, "global_step": 250257, "epoch": 2068} {"train_loss": -40.52416229248047, "global_step": 250258, "epoch": 2068} {"train_loss": -41.90313720703125, "global_step": 250259, "epoch": 2068} {"train_loss": -42.02073287963867, "global_step": 250260, "epoch": 2068} {"train_loss": -41.87443161010742, "global_step": 250261, "epoch": 2068} {"train_loss": -41.669525146484375, "global_step": 250262, "epoch": 2068} {"train_loss": -41.9878044128418, "global_step": 250263, "epoch": 2068} {"train_loss": -41.50885772705078, "global_step": 250264, "epoch": 2068} {"train_loss": -41.4282341003418, "global_step": 250265, "epoch": 2068} {"train_loss": -42.184932708740234, "global_step": 250266, "epoch": 2068} {"train_loss": -41.731502532958984, "global_step": 250267, "epoch": 2068} {"train_loss": -40.936607360839844, "global_step": 250268, "epoch": 2068} {"train_loss": -42.6054801940918, "global_step": 250269, "epoch": 2068} {"train_loss": -42.98794174194336, "global_step": 250270, "epoch": 2068} {"train_loss": -40.988773345947266, "global_step": 250271, "epoch": 2068} {"train_loss": -42.62506103515625, "global_step": 250272, "epoch": 2068} {"train_loss": -41.37320327758789, "global_step": 250273, "epoch": 2068} {"train_loss": -42.68732833862305, "global_step": 250274, "epoch": 2068} {"train_loss": -42.27030944824219, "global_step": 250275, "epoch": 2068} {"train_loss": -42.329681396484375, "global_step": 250276, "epoch": 2068} {"train_loss": -43.04638671875, "global_step": 250277, "epoch": 2068} {"train_loss": -42.41005325317383, "global_step": 250278, "epoch": 2068} {"train_loss": -42.23542022705078, "global_step": 250279, "epoch": 2068} {"train_loss": -42.62343215942383, "global_step": 250280, "epoch": 2068} {"train_loss": -43.15934371948242, "global_step": 250281, "epoch": 2068} {"train_loss": -42.1964111328125, "global_step": 250282, "epoch": 2068} {"train_loss": -42.82326889038086, "global_step": 250283, "epoch": 2068} {"train_loss": -42.64497375488281, "global_step": 250284, "epoch": 2068} {"train_loss": -42.5208625793457, "global_step": 250285, "epoch": 2068} {"train_loss": -43.004539489746094, "global_step": 250286, "epoch": 2068} {"train_loss": -42.95026397705078, "global_step": 250287, "epoch": 2068} {"train_loss": -42.678611755371094, "global_step": 250288, "epoch": 2068} {"train_loss": -42.61590576171875, "global_step": 250289, "epoch": 2068} {"train_loss": -42.171714782714844, "global_step": 250290, "epoch": 2068} {"train_loss": -43.04301071166992, "global_step": 250291, "epoch": 2068} {"train_loss": -43.16230010986328, "global_step": 250292, "epoch": 2068} {"train_loss": -43.37397384643555, "global_step": 250293, "epoch": 2068} {"train_loss": -42.82780456542969, "global_step": 250294, "epoch": 2068} {"train_loss": -42.937496185302734, "global_step": 250295, "epoch": 2068} {"train_loss": -42.613033294677734, "global_step": 250296, "epoch": 2068} {"train_loss": -42.77693176269531, "global_step": 250297, "epoch": 2068} {"train_loss": -43.0937614440918, "global_step": 250298, "epoch": 2068} {"train_loss": -42.31630325317383, "global_step": 250299, "epoch": 2068} {"train_loss": -41.825618743896484, "global_step": 250300, "epoch": 2068} {"train_loss": -41.878944396972656, "global_step": 250301, "epoch": 2068} {"train_loss": -40.64793014526367, "global_step": 250302, "epoch": 2068} {"train_loss": -40.335567474365234, "global_step": 250303, "epoch": 2068} {"train_loss": -41.52442169189453, "global_step": 250304, "epoch": 2068} {"train_loss": -42.54128646850586, "global_step": 250305, "epoch": 2068} {"train_loss": -41.4932861328125, "global_step": 250306, "epoch": 2068} {"train_loss": -40.110225677490234, "global_step": 250307, "epoch": 2068} {"train_loss": -39.47747802734375, "global_step": 250308, "epoch": 2068} {"train_loss": -40.008544921875, "global_step": 250309, "epoch": 2068} {"train_loss": -41.35313034057617, "global_step": 250310, "epoch": 2068} {"train_loss": -42.92113494873047, "global_step": 250311, "epoch": 2068} {"train_loss": -41.44626235961914, "global_step": 250312, "epoch": 2068} {"train_loss": -36.3658447265625, "global_step": 250313, "epoch": 2068} {"train_loss": -41.203548431396484, "global_step": 250314, "epoch": 2068} {"train_loss": -41.24439239501953, "global_step": 250315, "epoch": 2068} {"train_loss": -34.52057647705078, "global_step": 250316, "epoch": 2068} {"train_loss": -38.44437026977539, "global_step": 250317, "epoch": 2068} {"train_loss": -41.669471740722656, "global_step": 250318, "epoch": 2068} {"train_loss": -35.794952392578125, "global_step": 250319, "epoch": 2068} {"train_loss": -36.79846954345703, "global_step": 250320, "epoch": 2068} {"train_loss": -40.172218322753906, "global_step": 250321, "epoch": 2068} {"train_loss": -35.50914001464844, "global_step": 250322, "epoch": 2068} {"train_loss": -40.200443267822266, "global_step": 250323, "epoch": 2068} {"train_loss": -39.7838134765625, "global_step": 250324, "epoch": 2068} {"train_loss": -36.15614700317383, "global_step": 250325, "epoch": 2068} {"train_loss": -38.501258850097656, "global_step": 250326, "epoch": 2068} {"train_loss": -40.8585319519043, "global_step": 250327, "epoch": 2068} {"train_loss": -40.29884719848633, "global_step": 250328, "epoch": 2068} {"train_loss": -40.10411834716797, "global_step": 250329, "epoch": 2068} {"train_loss": -39.34306716918945, "global_step": 250330, "epoch": 2068} {"train_loss": -39.0450553894043, "global_step": 250331, "epoch": 2068} {"train_loss": -41.40333938598633, "global_step": 250332, "epoch": 2068} {"train_loss": -40.49032211303711, "global_step": 250333, "epoch": 2068} {"train_loss": -41.00794982910156, "global_step": 250334, "epoch": 2068} {"train_loss": -39.89126205444336, "global_step": 250335, "epoch": 2068} {"train_loss": -38.818904876708984, "global_step": 250336, "epoch": 2068} {"train_loss": -40.042083740234375, "global_step": 250337, "epoch": 2068} {"train_loss": -40.8636360168457, "global_step": 250338, "epoch": 2068} {"train_loss": -40.340328216552734, "global_step": 250339, "epoch": 2068} {"train_loss": -42.31229782104492, "global_step": 250340, "epoch": 2068} {"train_loss": -41.69464111328125, "global_step": 250341, "epoch": 2068} {"train_loss": -41.38517761230469, "global_step": 250342, "epoch": 2068} {"train_loss": -41.013179779052734, "global_step": 250343, "epoch": 2068} {"train_loss": -41.16487503051758, "global_step": 250344, "epoch": 2068} {"train_loss": -41.361568450927734, "global_step": 250345, "epoch": 2068} {"train_loss": -41.74799728393555, "global_step": 250346, "epoch": 2068} {"train_loss": -41.618743896484375, "global_step": 250347, "epoch": 2068} {"train_loss": -41.013627265110486, "global_step": 250348, "epoch": 2068, "val_loss": 2623201.75} {"train_loss": -42.070186614990234, "global_step": 250349, "epoch": 2069} {"train_loss": -42.00596237182617, "global_step": 250350, "epoch": 2069} {"train_loss": -41.70199203491211, "global_step": 250351, "epoch": 2069} {"train_loss": -42.310569763183594, "global_step": 250352, "epoch": 2069} {"train_loss": -42.15961837768555, "global_step": 250353, "epoch": 2069} {"train_loss": -42.1110725402832, "global_step": 250354, "epoch": 2069} {"train_loss": -42.08417892456055, "global_step": 250355, "epoch": 2069} {"train_loss": -42.41040802001953, "global_step": 250356, "epoch": 2069} {"train_loss": -42.647701263427734, "global_step": 250357, "epoch": 2069} {"train_loss": -42.025657653808594, "global_step": 250358, "epoch": 2069} {"train_loss": -42.514583587646484, "global_step": 250359, "epoch": 2069} {"train_loss": -42.24506759643555, "global_step": 250360, "epoch": 2069} {"train_loss": -42.80739974975586, "global_step": 250361, "epoch": 2069} {"train_loss": -42.3996696472168, "global_step": 250362, "epoch": 2069} {"train_loss": -42.69267272949219, "global_step": 250363, "epoch": 2069} {"train_loss": -42.778663635253906, "global_step": 250364, "epoch": 2069} {"train_loss": -42.34798812866211, "global_step": 250365, "epoch": 2069} {"train_loss": -42.47372055053711, "global_step": 250366, "epoch": 2069} {"train_loss": -42.36125564575195, "global_step": 250367, "epoch": 2069} {"train_loss": -42.300537109375, "global_step": 250368, "epoch": 2069} {"train_loss": -42.8714485168457, "global_step": 250369, "epoch": 2069} {"train_loss": -43.14034652709961, "global_step": 250370, "epoch": 2069} {"train_loss": -43.01519775390625, "global_step": 250371, "epoch": 2069} {"train_loss": -41.95695877075195, "global_step": 250372, "epoch": 2069} {"train_loss": -42.94688034057617, "global_step": 250373, "epoch": 2069} {"train_loss": -43.003997802734375, "global_step": 250374, "epoch": 2069} {"train_loss": -42.80295944213867, "global_step": 250375, "epoch": 2069} {"train_loss": -43.26799011230469, "global_step": 250376, "epoch": 2069} {"train_loss": -43.344825744628906, "global_step": 250377, "epoch": 2069} {"train_loss": -42.779239654541016, "global_step": 250378, "epoch": 2069} {"train_loss": -43.1014518737793, "global_step": 250379, "epoch": 2069} {"train_loss": -42.969146728515625, "global_step": 250380, "epoch": 2069} {"train_loss": -43.10279083251953, "global_step": 250381, "epoch": 2069} {"train_loss": -43.270381927490234, "global_step": 250382, "epoch": 2069} {"train_loss": -43.13819122314453, "global_step": 250383, "epoch": 2069} {"train_loss": -42.764278411865234, "global_step": 250384, "epoch": 2069} {"train_loss": -43.58420944213867, "global_step": 250385, "epoch": 2069} {"train_loss": -43.508602142333984, "global_step": 250386, "epoch": 2069} {"train_loss": -41.6847038269043, "global_step": 250387, "epoch": 2069} {"train_loss": -43.14026641845703, "global_step": 250388, "epoch": 2069} {"train_loss": -43.5072135925293, "global_step": 250389, "epoch": 2069} {"train_loss": -43.08694076538086, "global_step": 250390, "epoch": 2069} {"train_loss": -43.022613525390625, "global_step": 250391, "epoch": 2069} {"train_loss": -43.01597213745117, "global_step": 250392, "epoch": 2069} {"train_loss": -42.785072326660156, "global_step": 250393, "epoch": 2069} {"train_loss": -43.42676544189453, "global_step": 250394, "epoch": 2069} {"train_loss": -42.67837905883789, "global_step": 250395, "epoch": 2069} {"train_loss": -42.929439544677734, "global_step": 250396, "epoch": 2069} {"train_loss": -43.63431930541992, "global_step": 250397, "epoch": 2069} {"train_loss": -43.33244323730469, "global_step": 250398, "epoch": 2069} {"train_loss": -43.489967346191406, "global_step": 250399, "epoch": 2069} {"train_loss": -43.88536834716797, "global_step": 250400, "epoch": 2069} {"train_loss": -42.49418640136719, "global_step": 250401, "epoch": 2069} {"train_loss": -42.78253173828125, "global_step": 250402, "epoch": 2069} {"train_loss": -42.078887939453125, "global_step": 250403, "epoch": 2069} {"train_loss": -40.78596878051758, "global_step": 250404, "epoch": 2069} {"train_loss": -40.31026840209961, "global_step": 250405, "epoch": 2069} {"train_loss": -39.989742279052734, "global_step": 250406, "epoch": 2069} {"train_loss": -36.943878173828125, "global_step": 250407, "epoch": 2069} {"train_loss": -40.664764404296875, "global_step": 250408, "epoch": 2069} {"train_loss": -43.1850700378418, "global_step": 250409, "epoch": 2069} {"train_loss": -42.28071212768555, "global_step": 250410, "epoch": 2069} {"train_loss": -39.88614273071289, "global_step": 250411, "epoch": 2069} {"train_loss": -39.57695388793945, "global_step": 250412, "epoch": 2069} {"train_loss": -40.52768325805664, "global_step": 250413, "epoch": 2069} {"train_loss": -41.99850082397461, "global_step": 250414, "epoch": 2069} {"train_loss": -40.67741394042969, "global_step": 250415, "epoch": 2069} {"train_loss": -39.68927764892578, "global_step": 250416, "epoch": 2069} {"train_loss": -40.40494918823242, "global_step": 250417, "epoch": 2069} {"train_loss": -42.012969970703125, "global_step": 250418, "epoch": 2069} {"train_loss": -40.9526252746582, "global_step": 250419, "epoch": 2069} {"train_loss": -42.51381301879883, "global_step": 250420, "epoch": 2069} {"train_loss": -42.189205169677734, "global_step": 250421, "epoch": 2069} {"train_loss": -41.61394119262695, "global_step": 250422, "epoch": 2069} {"train_loss": -42.402687072753906, "global_step": 250423, "epoch": 2069} {"train_loss": -43.05215072631836, "global_step": 250424, "epoch": 2069} {"train_loss": -36.4832649230957, "global_step": 250425, "epoch": 2069} {"train_loss": -41.88517379760742, "global_step": 250426, "epoch": 2069} {"train_loss": -42.15053939819336, "global_step": 250427, "epoch": 2069} {"train_loss": -40.957027435302734, "global_step": 250428, "epoch": 2069} {"train_loss": -39.96323013305664, "global_step": 250429, "epoch": 2069} {"train_loss": -42.40748977661133, "global_step": 250430, "epoch": 2069} {"train_loss": -40.94965744018555, "global_step": 250431, "epoch": 2069} {"train_loss": -40.92755126953125, "global_step": 250432, "epoch": 2069} {"train_loss": -41.39155960083008, "global_step": 250433, "epoch": 2069} {"train_loss": -41.446449279785156, "global_step": 250434, "epoch": 2069} {"train_loss": -41.72975540161133, "global_step": 250435, "epoch": 2069} {"train_loss": -41.312835693359375, "global_step": 250436, "epoch": 2069} {"train_loss": -41.8208122253418, "global_step": 250437, "epoch": 2069} {"train_loss": -41.82075881958008, "global_step": 250438, "epoch": 2069} {"train_loss": -42.04642868041992, "global_step": 250439, "epoch": 2069} {"train_loss": -41.214569091796875, "global_step": 250440, "epoch": 2069} {"train_loss": -41.8351936340332, "global_step": 250441, "epoch": 2069} {"train_loss": -41.358741760253906, "global_step": 250442, "epoch": 2069} {"train_loss": -42.0274658203125, "global_step": 250443, "epoch": 2069} {"train_loss": -43.03226852416992, "global_step": 250444, "epoch": 2069} {"train_loss": -42.1869010925293, "global_step": 250445, "epoch": 2069} {"train_loss": -42.28680419921875, "global_step": 250446, "epoch": 2069} {"train_loss": -41.75532913208008, "global_step": 250447, "epoch": 2069} {"train_loss": -41.99148178100586, "global_step": 250448, "epoch": 2069} {"train_loss": -41.34067916870117, "global_step": 250449, "epoch": 2069} {"train_loss": -41.65069580078125, "global_step": 250450, "epoch": 2069} {"train_loss": -41.35728073120117, "global_step": 250451, "epoch": 2069} {"train_loss": -41.560760498046875, "global_step": 250452, "epoch": 2069} {"train_loss": -41.78585433959961, "global_step": 250453, "epoch": 2069} {"train_loss": -42.29939651489258, "global_step": 250454, "epoch": 2069} {"train_loss": -42.38747787475586, "global_step": 250455, "epoch": 2069} {"train_loss": -42.06888961791992, "global_step": 250456, "epoch": 2069} {"train_loss": -42.44672775268555, "global_step": 250457, "epoch": 2069} {"train_loss": -41.7213020324707, "global_step": 250458, "epoch": 2069} {"train_loss": -41.28680419921875, "global_step": 250459, "epoch": 2069} {"train_loss": -42.77682113647461, "global_step": 250460, "epoch": 2069} {"train_loss": -41.4411735534668, "global_step": 250461, "epoch": 2069} {"train_loss": -41.794490814208984, "global_step": 250462, "epoch": 2069} {"train_loss": -40.61857223510742, "global_step": 250463, "epoch": 2069} {"train_loss": -42.73814010620117, "global_step": 250464, "epoch": 2069} {"train_loss": -41.67864227294922, "global_step": 250465, "epoch": 2069} {"train_loss": -41.97550964355469, "global_step": 250466, "epoch": 2069} {"train_loss": -42.91337966918945, "global_step": 250467, "epoch": 2069} {"train_loss": -41.136993408203125, "global_step": 250468, "epoch": 2069} {"train_loss": -42.041804762911205, "global_step": 250469, "epoch": 2069, "val_loss": 2662818.0} {"train_loss": -42.08024215698242, "global_step": 250470, "epoch": 2070} {"train_loss": -40.84121322631836, "global_step": 250471, "epoch": 2070} {"train_loss": -40.707733154296875, "global_step": 250472, "epoch": 2070} {"train_loss": -42.28054428100586, "global_step": 250473, "epoch": 2070} {"train_loss": -39.145957946777344, "global_step": 250474, "epoch": 2070} {"train_loss": -40.10027313232422, "global_step": 250475, "epoch": 2070} {"train_loss": -42.24495315551758, "global_step": 250476, "epoch": 2070} {"train_loss": -40.925636291503906, "global_step": 250477, "epoch": 2070} {"train_loss": -42.070472717285156, "global_step": 250478, "epoch": 2070} {"train_loss": -41.99885177612305, "global_step": 250479, "epoch": 2070} {"train_loss": -40.89229202270508, "global_step": 250480, "epoch": 2070} {"train_loss": -42.348453521728516, "global_step": 250481, "epoch": 2070} {"train_loss": -41.75433349609375, "global_step": 250482, "epoch": 2070} {"train_loss": -41.419918060302734, "global_step": 250483, "epoch": 2070} {"train_loss": -42.49681854248047, "global_step": 250484, "epoch": 2070} {"train_loss": -42.24414825439453, "global_step": 250485, "epoch": 2070} {"train_loss": -42.60000228881836, "global_step": 250486, "epoch": 2070} {"train_loss": -42.371944427490234, "global_step": 250487, "epoch": 2070} {"train_loss": -42.77571105957031, "global_step": 250488, "epoch": 2070} {"train_loss": -42.893096923828125, "global_step": 250489, "epoch": 2070} {"train_loss": -42.4275016784668, "global_step": 250490, "epoch": 2070} {"train_loss": -43.046321868896484, "global_step": 250491, "epoch": 2070} {"train_loss": -42.8725700378418, "global_step": 250492, "epoch": 2070} {"train_loss": -43.180599212646484, "global_step": 250493, "epoch": 2070} {"train_loss": -43.39333724975586, "global_step": 250494, "epoch": 2070} {"train_loss": -43.25020217895508, "global_step": 250495, "epoch": 2070} {"train_loss": -42.93922805786133, "global_step": 250496, "epoch": 2070} {"train_loss": -42.991207122802734, "global_step": 250497, "epoch": 2070} {"train_loss": -43.00303268432617, "global_step": 250498, "epoch": 2070} {"train_loss": -43.40957260131836, "global_step": 250499, "epoch": 2070} {"train_loss": -43.31626510620117, "global_step": 250500, "epoch": 2070} {"train_loss": -43.08322525024414, "global_step": 250501, "epoch": 2070} {"train_loss": -42.794307708740234, "global_step": 250502, "epoch": 2070} {"train_loss": -43.37422561645508, "global_step": 250503, "epoch": 2070} {"train_loss": -43.03738021850586, "global_step": 250504, "epoch": 2070} {"train_loss": -43.59542465209961, "global_step": 250505, "epoch": 2070} {"train_loss": -43.5817756652832, "global_step": 250506, "epoch": 2070} {"train_loss": -42.975223541259766, "global_step": 250507, "epoch": 2070} {"train_loss": -43.193294525146484, "global_step": 250508, "epoch": 2070} {"train_loss": -42.4598503112793, "global_step": 250509, "epoch": 2070} {"train_loss": -42.95863723754883, "global_step": 250510, "epoch": 2070} {"train_loss": -43.26760482788086, "global_step": 250511, "epoch": 2070} {"train_loss": -43.01586151123047, "global_step": 250512, "epoch": 2070} {"train_loss": -43.05329132080078, "global_step": 250513, "epoch": 2070} {"train_loss": -42.833988189697266, "global_step": 250514, "epoch": 2070} {"train_loss": -43.458412170410156, "global_step": 250515, "epoch": 2070} {"train_loss": -42.40461349487305, "global_step": 250516, "epoch": 2070} {"train_loss": -43.65338897705078, "global_step": 250517, "epoch": 2070} {"train_loss": -43.39546203613281, "global_step": 250518, "epoch": 2070} {"train_loss": -42.871498107910156, "global_step": 250519, "epoch": 2070} {"train_loss": -42.6961555480957, "global_step": 250520, "epoch": 2070} {"train_loss": -43.49406051635742, "global_step": 250521, "epoch": 2070} {"train_loss": -42.71904373168945, "global_step": 250522, "epoch": 2070} {"train_loss": -42.72629165649414, "global_step": 250523, "epoch": 2070} {"train_loss": -40.99947738647461, "global_step": 250524, "epoch": 2070} {"train_loss": -43.38424301147461, "global_step": 250525, "epoch": 2070} {"train_loss": -41.50898361206055, "global_step": 250526, "epoch": 2070} {"train_loss": -42.92694854736328, "global_step": 250527, "epoch": 2070} {"train_loss": -43.37732696533203, "global_step": 250528, "epoch": 2070} {"train_loss": -42.4536018371582, "global_step": 250529, "epoch": 2070} {"train_loss": -42.54935836791992, "global_step": 250530, "epoch": 2070} {"train_loss": -42.131988525390625, "global_step": 250531, "epoch": 2070} {"train_loss": -42.57876205444336, "global_step": 250532, "epoch": 2070} {"train_loss": -42.80165481567383, "global_step": 250533, "epoch": 2070} {"train_loss": -40.374324798583984, "global_step": 250534, "epoch": 2070} {"train_loss": -40.54351806640625, "global_step": 250535, "epoch": 2070} {"train_loss": -43.293556213378906, "global_step": 250536, "epoch": 2070} {"train_loss": -40.14467239379883, "global_step": 250537, "epoch": 2070} {"train_loss": -42.4879264831543, "global_step": 250538, "epoch": 2070} {"train_loss": -43.5678596496582, "global_step": 250539, "epoch": 2070} {"train_loss": -42.76045227050781, "global_step": 250540, "epoch": 2070} {"train_loss": -43.05146408081055, "global_step": 250541, "epoch": 2070} {"train_loss": -43.64404296875, "global_step": 250542, "epoch": 2070} {"train_loss": -43.0997200012207, "global_step": 250543, "epoch": 2070} {"train_loss": -43.47039794921875, "global_step": 250544, "epoch": 2070} {"train_loss": -42.89000701904297, "global_step": 250545, "epoch": 2070} {"train_loss": -42.697235107421875, "global_step": 250546, "epoch": 2070} {"train_loss": -42.983299255371094, "global_step": 250547, "epoch": 2070} {"train_loss": -43.637855529785156, "global_step": 250548, "epoch": 2070} {"train_loss": -43.7298583984375, "global_step": 250549, "epoch": 2070} {"train_loss": -43.22257614135742, "global_step": 250550, "epoch": 2070} {"train_loss": -42.95705032348633, "global_step": 250551, "epoch": 2070} {"train_loss": -43.24315643310547, "global_step": 250552, "epoch": 2070} {"train_loss": -43.45737838745117, "global_step": 250553, "epoch": 2070} {"train_loss": -43.295265197753906, "global_step": 250554, "epoch": 2070} {"train_loss": -43.593257904052734, "global_step": 250555, "epoch": 2070} {"train_loss": -42.83349609375, "global_step": 250556, "epoch": 2070} {"train_loss": -42.923675537109375, "global_step": 250557, "epoch": 2070} {"train_loss": -42.950950622558594, "global_step": 250558, "epoch": 2070} {"train_loss": -42.5837516784668, "global_step": 250559, "epoch": 2070} {"train_loss": -43.546592712402344, "global_step": 250560, "epoch": 2070} {"train_loss": -43.00226593017578, "global_step": 250561, "epoch": 2070} {"train_loss": -43.3552360534668, "global_step": 250562, "epoch": 2070} {"train_loss": -43.004676818847656, "global_step": 250563, "epoch": 2070} {"train_loss": -43.810791015625, "global_step": 250564, "epoch": 2070} {"train_loss": -43.70371627807617, "global_step": 250565, "epoch": 2070} {"train_loss": -43.677730560302734, "global_step": 250566, "epoch": 2070} {"train_loss": -43.425106048583984, "global_step": 250567, "epoch": 2070} {"train_loss": -43.14248275756836, "global_step": 250568, "epoch": 2070} {"train_loss": -42.95066833496094, "global_step": 250569, "epoch": 2070} {"train_loss": -43.580711364746094, "global_step": 250570, "epoch": 2070} {"train_loss": -43.213470458984375, "global_step": 250571, "epoch": 2070} {"train_loss": -42.94717025756836, "global_step": 250572, "epoch": 2070} {"train_loss": -42.608978271484375, "global_step": 250573, "epoch": 2070} {"train_loss": -42.976539611816406, "global_step": 250574, "epoch": 2070} {"train_loss": -43.05388259887695, "global_step": 250575, "epoch": 2070} {"train_loss": -42.28542709350586, "global_step": 250576, "epoch": 2070} {"train_loss": -41.64168167114258, "global_step": 250577, "epoch": 2070} {"train_loss": -41.99062728881836, "global_step": 250578, "epoch": 2070} {"train_loss": -43.714454650878906, "global_step": 250579, "epoch": 2070} {"train_loss": -42.632869720458984, "global_step": 250580, "epoch": 2070} {"train_loss": -42.672454833984375, "global_step": 250581, "epoch": 2070} {"train_loss": -43.347225189208984, "global_step": 250582, "epoch": 2070} {"train_loss": -42.30733871459961, "global_step": 250583, "epoch": 2070} {"train_loss": -42.72392654418945, "global_step": 250584, "epoch": 2070} {"train_loss": -43.39528274536133, "global_step": 250585, "epoch": 2070} {"train_loss": -41.878997802734375, "global_step": 250586, "epoch": 2070} {"train_loss": -40.019954681396484, "global_step": 250587, "epoch": 2070} {"train_loss": -42.2976188659668, "global_step": 250588, "epoch": 2070} {"train_loss": -42.25783920288086, "global_step": 250589, "epoch": 2070} {"train_loss": -42.65220102987999, "global_step": 250590, "epoch": 2070, "val_loss": 2562740.75} {"train_loss": -39.54502487182617, "global_step": 250591, "epoch": 2071} {"train_loss": -42.2313232421875, "global_step": 250592, "epoch": 2071} {"train_loss": -41.839935302734375, "global_step": 250593, "epoch": 2071} {"train_loss": -41.3541374206543, "global_step": 250594, "epoch": 2071} {"train_loss": -42.27167892456055, "global_step": 250595, "epoch": 2071} {"train_loss": -42.00203323364258, "global_step": 250596, "epoch": 2071} {"train_loss": -40.895748138427734, "global_step": 250597, "epoch": 2071} {"train_loss": -41.19392013549805, "global_step": 250598, "epoch": 2071} {"train_loss": -42.87274169921875, "global_step": 250599, "epoch": 2071} {"train_loss": -41.52198028564453, "global_step": 250600, "epoch": 2071} {"train_loss": -40.760597229003906, "global_step": 250601, "epoch": 2071} {"train_loss": -41.880470275878906, "global_step": 250602, "epoch": 2071} {"train_loss": -42.01185607910156, "global_step": 250603, "epoch": 2071} {"train_loss": -40.699684143066406, "global_step": 250604, "epoch": 2071} {"train_loss": -41.32369613647461, "global_step": 250605, "epoch": 2071} {"train_loss": -42.17753982543945, "global_step": 250606, "epoch": 2071} {"train_loss": -41.487892150878906, "global_step": 250607, "epoch": 2071} {"train_loss": -41.72669219970703, "global_step": 250608, "epoch": 2071} {"train_loss": -43.0164909362793, "global_step": 250609, "epoch": 2071} {"train_loss": -40.85123825073242, "global_step": 250610, "epoch": 2071} {"train_loss": -41.7048454284668, "global_step": 250611, "epoch": 2071} {"train_loss": -42.260597229003906, "global_step": 250612, "epoch": 2071} {"train_loss": -39.486202239990234, "global_step": 250613, "epoch": 2071} {"train_loss": -40.95319747924805, "global_step": 250614, "epoch": 2071} {"train_loss": -42.085960388183594, "global_step": 250615, "epoch": 2071} {"train_loss": -39.6024284362793, "global_step": 250616, "epoch": 2071} {"train_loss": -41.80961227416992, "global_step": 250617, "epoch": 2071} {"train_loss": -40.934181213378906, "global_step": 250618, "epoch": 2071} {"train_loss": -40.88213348388672, "global_step": 250619, "epoch": 2071} {"train_loss": -40.73176193237305, "global_step": 250620, "epoch": 2071} {"train_loss": -40.8730354309082, "global_step": 250621, "epoch": 2071} {"train_loss": -39.71041488647461, "global_step": 250622, "epoch": 2071} {"train_loss": -30.475238800048828, "global_step": 250623, "epoch": 2071} {"train_loss": -36.82735824584961, "global_step": 250624, "epoch": 2071} {"train_loss": -36.99512481689453, "global_step": 250625, "epoch": 2071} {"train_loss": -40.12245559692383, "global_step": 250626, "epoch": 2071} {"train_loss": -36.07012176513672, "global_step": 250627, "epoch": 2071} {"train_loss": -41.08649826049805, "global_step": 250628, "epoch": 2071} {"train_loss": -34.79819869995117, "global_step": 250629, "epoch": 2071} {"train_loss": -37.43156814575195, "global_step": 250630, "epoch": 2071} {"train_loss": -39.47553634643555, "global_step": 250631, "epoch": 2071} {"train_loss": -38.198665618896484, "global_step": 250632, "epoch": 2071} {"train_loss": -41.17652130126953, "global_step": 250633, "epoch": 2071} {"train_loss": -38.04729080200195, "global_step": 250634, "epoch": 2071} {"train_loss": -40.71118927001953, "global_step": 250635, "epoch": 2071} {"train_loss": -40.26862335205078, "global_step": 250636, "epoch": 2071} {"train_loss": -40.747047424316406, "global_step": 250637, "epoch": 2071} {"train_loss": -40.383087158203125, "global_step": 250638, "epoch": 2071} {"train_loss": -41.50474166870117, "global_step": 250639, "epoch": 2071} {"train_loss": -40.675628662109375, "global_step": 250640, "epoch": 2071} {"train_loss": -41.08954620361328, "global_step": 250641, "epoch": 2071} {"train_loss": -41.642189025878906, "global_step": 250642, "epoch": 2071} {"train_loss": -40.694091796875, "global_step": 250643, "epoch": 2071} {"train_loss": -41.82802963256836, "global_step": 250644, "epoch": 2071} {"train_loss": -41.32033157348633, "global_step": 250645, "epoch": 2071} {"train_loss": -41.81832504272461, "global_step": 250646, "epoch": 2071} {"train_loss": -40.87571334838867, "global_step": 250647, "epoch": 2071} {"train_loss": -42.02909469604492, "global_step": 250648, "epoch": 2071} {"train_loss": -41.796142578125, "global_step": 250649, "epoch": 2071} {"train_loss": -41.74269485473633, "global_step": 250650, "epoch": 2071} {"train_loss": -42.04386901855469, "global_step": 250651, "epoch": 2071} {"train_loss": -42.14939498901367, "global_step": 250652, "epoch": 2071} {"train_loss": -42.32047653198242, "global_step": 250653, "epoch": 2071} {"train_loss": -42.169185638427734, "global_step": 250654, "epoch": 2071} {"train_loss": -42.71434020996094, "global_step": 250655, "epoch": 2071} {"train_loss": -42.704097747802734, "global_step": 250656, "epoch": 2071} {"train_loss": -42.81532287597656, "global_step": 250657, "epoch": 2071} {"train_loss": -42.549434661865234, "global_step": 250658, "epoch": 2071} {"train_loss": -42.77758026123047, "global_step": 250659, "epoch": 2071} {"train_loss": -42.87723922729492, "global_step": 250660, "epoch": 2071} {"train_loss": -42.34370040893555, "global_step": 250661, "epoch": 2071} {"train_loss": -42.57180404663086, "global_step": 250662, "epoch": 2071} {"train_loss": -42.398006439208984, "global_step": 250663, "epoch": 2071} {"train_loss": -42.89665603637695, "global_step": 250664, "epoch": 2071} {"train_loss": -42.77755355834961, "global_step": 250665, "epoch": 2071} {"train_loss": -43.195289611816406, "global_step": 250666, "epoch": 2071} {"train_loss": -43.099727630615234, "global_step": 250667, "epoch": 2071} {"train_loss": -42.84232711791992, "global_step": 250668, "epoch": 2071} {"train_loss": -43.01153564453125, "global_step": 250669, "epoch": 2071} {"train_loss": -43.027645111083984, "global_step": 250670, "epoch": 2071} {"train_loss": -43.2589225769043, "global_step": 250671, "epoch": 2071} {"train_loss": -43.08821487426758, "global_step": 250672, "epoch": 2071} {"train_loss": -43.495338439941406, "global_step": 250673, "epoch": 2071} {"train_loss": -43.2357292175293, "global_step": 250674, "epoch": 2071} {"train_loss": -43.334346771240234, "global_step": 250675, "epoch": 2071} {"train_loss": -43.28273391723633, "global_step": 250676, "epoch": 2071} {"train_loss": -43.544822692871094, "global_step": 250677, "epoch": 2071} {"train_loss": -43.3997688293457, "global_step": 250678, "epoch": 2071} {"train_loss": -43.09564208984375, "global_step": 250679, "epoch": 2071} {"train_loss": -43.67123031616211, "global_step": 250680, "epoch": 2071} {"train_loss": -43.66884231567383, "global_step": 250681, "epoch": 2071} {"train_loss": -43.430912017822266, "global_step": 250682, "epoch": 2071} {"train_loss": -43.7541618347168, "global_step": 250683, "epoch": 2071} {"train_loss": -43.25040054321289, "global_step": 250684, "epoch": 2071} {"train_loss": -43.552001953125, "global_step": 250685, "epoch": 2071} {"train_loss": -43.319068908691406, "global_step": 250686, "epoch": 2071} {"train_loss": -43.714195251464844, "global_step": 250687, "epoch": 2071} {"train_loss": -43.438758850097656, "global_step": 250688, "epoch": 2071} {"train_loss": -43.957550048828125, "global_step": 250689, "epoch": 2071} {"train_loss": -43.564239501953125, "global_step": 250690, "epoch": 2071} {"train_loss": -43.646629333496094, "global_step": 250691, "epoch": 2071} {"train_loss": -43.49420928955078, "global_step": 250692, "epoch": 2071} {"train_loss": -43.4032096862793, "global_step": 250693, "epoch": 2071} {"train_loss": -43.347713470458984, "global_step": 250694, "epoch": 2071} {"train_loss": -43.96503829956055, "global_step": 250695, "epoch": 2071} {"train_loss": -43.45160675048828, "global_step": 250696, "epoch": 2071} {"train_loss": -43.45672607421875, "global_step": 250697, "epoch": 2071} {"train_loss": -43.341949462890625, "global_step": 250698, "epoch": 2071} {"train_loss": -43.595977783203125, "global_step": 250699, "epoch": 2071} {"train_loss": -43.65415573120117, "global_step": 250700, "epoch": 2071} {"train_loss": -43.47987365722656, "global_step": 250701, "epoch": 2071} {"train_loss": -43.96577072143555, "global_step": 250702, "epoch": 2071} {"train_loss": -43.45612335205078, "global_step": 250703, "epoch": 2071} {"train_loss": -43.97647476196289, "global_step": 250704, "epoch": 2071} {"train_loss": -43.597267150878906, "global_step": 250705, "epoch": 2071} {"train_loss": -44.29201889038086, "global_step": 250706, "epoch": 2071} {"train_loss": -43.94362258911133, "global_step": 250707, "epoch": 2071} {"train_loss": -44.078155517578125, "global_step": 250708, "epoch": 2071} {"train_loss": -43.94353485107422, "global_step": 250709, "epoch": 2071} {"train_loss": -44.037933349609375, "global_step": 250710, "epoch": 2071} {"train_loss": -41.920165763413614, "global_step": 250711, "epoch": 2071, "val_loss": 2647727.25} {"train_loss": -43.733131408691406, "global_step": 250712, "epoch": 2072} {"train_loss": -43.70941925048828, "global_step": 250713, "epoch": 2072} {"train_loss": -43.846580505371094, "global_step": 250714, "epoch": 2072} {"train_loss": -44.01369857788086, "global_step": 250715, "epoch": 2072} {"train_loss": -44.428138732910156, "global_step": 250716, "epoch": 2072} {"train_loss": -43.890296936035156, "global_step": 250717, "epoch": 2072} {"train_loss": -43.68839645385742, "global_step": 250718, "epoch": 2072} {"train_loss": -43.66013717651367, "global_step": 250719, "epoch": 2072} {"train_loss": -43.795143127441406, "global_step": 250720, "epoch": 2072} {"train_loss": -43.9632682800293, "global_step": 250721, "epoch": 2072} {"train_loss": -44.0013313293457, "global_step": 250722, "epoch": 2072} {"train_loss": -43.758270263671875, "global_step": 250723, "epoch": 2072} {"train_loss": -43.88800048828125, "global_step": 250724, "epoch": 2072} {"train_loss": -42.45062255859375, "global_step": 250725, "epoch": 2072} {"train_loss": -43.4923095703125, "global_step": 250726, "epoch": 2072} {"train_loss": -43.692623138427734, "global_step": 250727, "epoch": 2072} {"train_loss": -43.80828857421875, "global_step": 250728, "epoch": 2072} {"train_loss": -43.28511428833008, "global_step": 250729, "epoch": 2072} {"train_loss": -42.530113220214844, "global_step": 250730, "epoch": 2072} {"train_loss": -40.705013275146484, "global_step": 250731, "epoch": 2072} {"train_loss": -37.02973556518555, "global_step": 250732, "epoch": 2072} {"train_loss": -32.766448974609375, "global_step": 250733, "epoch": 2072} {"train_loss": -25.679807662963867, "global_step": 250734, "epoch": 2072} {"train_loss": -31.20176124572754, "global_step": 250735, "epoch": 2072} {"train_loss": -39.4459228515625, "global_step": 250736, "epoch": 2072} {"train_loss": -33.14838790893555, "global_step": 250737, "epoch": 2072} {"train_loss": -33.399139404296875, "global_step": 250738, "epoch": 2072} {"train_loss": -38.970149993896484, "global_step": 250739, "epoch": 2072} {"train_loss": -39.677608489990234, "global_step": 250740, "epoch": 2072} {"train_loss": -39.6648063659668, "global_step": 250741, "epoch": 2072} {"train_loss": -39.19416046142578, "global_step": 250742, "epoch": 2072} {"train_loss": -40.23090744018555, "global_step": 250743, "epoch": 2072} {"train_loss": -40.6754035949707, "global_step": 250744, "epoch": 2072} {"train_loss": -40.37537384033203, "global_step": 250745, "epoch": 2072} {"train_loss": -41.1253776550293, "global_step": 250746, "epoch": 2072} {"train_loss": -41.03391647338867, "global_step": 250747, "epoch": 2072} {"train_loss": -41.112483978271484, "global_step": 250748, "epoch": 2072} {"train_loss": -41.50177001953125, "global_step": 250749, "epoch": 2072} {"train_loss": -42.16471481323242, "global_step": 250750, "epoch": 2072} {"train_loss": -41.713539123535156, "global_step": 250751, "epoch": 2072} {"train_loss": -42.15924072265625, "global_step": 250752, "epoch": 2072} {"train_loss": -42.25846862792969, "global_step": 250753, "epoch": 2072} {"train_loss": -42.3674430847168, "global_step": 250754, "epoch": 2072} {"train_loss": -42.506446838378906, "global_step": 250755, "epoch": 2072} {"train_loss": -42.264869689941406, "global_step": 250756, "epoch": 2072} {"train_loss": -41.7546501159668, "global_step": 250757, "epoch": 2072} {"train_loss": -41.96126937866211, "global_step": 250758, "epoch": 2072} {"train_loss": -42.41206741333008, "global_step": 250759, "epoch": 2072} {"train_loss": -42.59851837158203, "global_step": 250760, "epoch": 2072} {"train_loss": -41.94068145751953, "global_step": 250761, "epoch": 2072} {"train_loss": -41.79000473022461, "global_step": 250762, "epoch": 2072} {"train_loss": -42.76350402832031, "global_step": 250763, "epoch": 2072} {"train_loss": -41.98670959472656, "global_step": 250764, "epoch": 2072} {"train_loss": -42.84926986694336, "global_step": 250765, "epoch": 2072} {"train_loss": -42.209228515625, "global_step": 250766, "epoch": 2072} {"train_loss": -42.939186096191406, "global_step": 250767, "epoch": 2072} {"train_loss": -42.37510299682617, "global_step": 250768, "epoch": 2072} {"train_loss": -42.81719970703125, "global_step": 250769, "epoch": 2072} {"train_loss": -42.49856185913086, "global_step": 250770, "epoch": 2072} {"train_loss": -42.6847038269043, "global_step": 250771, "epoch": 2072} {"train_loss": -42.972862243652344, "global_step": 250772, "epoch": 2072} {"train_loss": -43.22578048706055, "global_step": 250773, "epoch": 2072} {"train_loss": -42.71303176879883, "global_step": 250774, "epoch": 2072} {"train_loss": -43.34992218017578, "global_step": 250775, "epoch": 2072} {"train_loss": -43.064056396484375, "global_step": 250776, "epoch": 2072} {"train_loss": -42.7142448425293, "global_step": 250777, "epoch": 2072} {"train_loss": -43.41456985473633, "global_step": 250778, "epoch": 2072} {"train_loss": -43.25342559814453, "global_step": 250779, "epoch": 2072} {"train_loss": -43.412593841552734, "global_step": 250780, "epoch": 2072} {"train_loss": -43.250328063964844, "global_step": 250781, "epoch": 2072} {"train_loss": -42.865631103515625, "global_step": 250782, "epoch": 2072} {"train_loss": -43.478553771972656, "global_step": 250783, "epoch": 2072} {"train_loss": -43.40479278564453, "global_step": 250784, "epoch": 2072} {"train_loss": -43.580848693847656, "global_step": 250785, "epoch": 2072} {"train_loss": -43.22111129760742, "global_step": 250786, "epoch": 2072} {"train_loss": -43.47900390625, "global_step": 250787, "epoch": 2072} {"train_loss": -43.588130950927734, "global_step": 250788, "epoch": 2072} {"train_loss": -43.48861312866211, "global_step": 250789, "epoch": 2072} {"train_loss": -43.42214584350586, "global_step": 250790, "epoch": 2072} {"train_loss": -43.727439880371094, "global_step": 250791, "epoch": 2072} {"train_loss": -43.455299377441406, "global_step": 250792, "epoch": 2072} {"train_loss": -43.69074630737305, "global_step": 250793, "epoch": 2072} {"train_loss": -43.25748825073242, "global_step": 250794, "epoch": 2072} {"train_loss": -43.52754211425781, "global_step": 250795, "epoch": 2072} {"train_loss": -43.17908477783203, "global_step": 250796, "epoch": 2072} {"train_loss": -39.517093658447266, "global_step": 250797, "epoch": 2072} {"train_loss": -43.18489074707031, "global_step": 250798, "epoch": 2072} {"train_loss": -40.589332580566406, "global_step": 250799, "epoch": 2072} {"train_loss": -43.7152214050293, "global_step": 250800, "epoch": 2072} {"train_loss": -39.516326904296875, "global_step": 250801, "epoch": 2072} {"train_loss": -17.866140365600586, "global_step": 250802, "epoch": 2072} {"train_loss": -42.18803024291992, "global_step": 250803, "epoch": 2072} {"train_loss": -20.9250545501709, "global_step": 250804, "epoch": 2072} {"train_loss": -34.16082763671875, "global_step": 250805, "epoch": 2072} {"train_loss": -35.03010177612305, "global_step": 250806, "epoch": 2072} {"train_loss": -28.390668869018555, "global_step": 250807, "epoch": 2072} {"train_loss": -16.470951080322266, "global_step": 250808, "epoch": 2072} {"train_loss": -27.425153732299805, "global_step": 250809, "epoch": 2072} {"train_loss": -7.7874040603637695, "global_step": 250810, "epoch": 2072} {"train_loss": -20.275436401367188, "global_step": 250811, "epoch": 2072} {"train_loss": -26.353139877319336, "global_step": 250812, "epoch": 2072} {"train_loss": -28.548086166381836, "global_step": 250813, "epoch": 2072} {"train_loss": -23.523300170898438, "global_step": 250814, "epoch": 2072} {"train_loss": -30.2507381439209, "global_step": 250815, "epoch": 2072} {"train_loss": -34.376277923583984, "global_step": 250816, "epoch": 2072} {"train_loss": -35.55345153808594, "global_step": 250817, "epoch": 2072} {"train_loss": -34.71303176879883, "global_step": 250818, "epoch": 2072} {"train_loss": -25.081117630004883, "global_step": 250819, "epoch": 2072} {"train_loss": -32.463802337646484, "global_step": 250820, "epoch": 2072} {"train_loss": -28.86234474182129, "global_step": 250821, "epoch": 2072} {"train_loss": -32.37109375, "global_step": 250822, "epoch": 2072} {"train_loss": -35.51915740966797, "global_step": 250823, "epoch": 2072} {"train_loss": -34.2581672668457, "global_step": 250824, "epoch": 2072} {"train_loss": -30.983488082885742, "global_step": 250825, "epoch": 2072} {"train_loss": -35.43918991088867, "global_step": 250826, "epoch": 2072} {"train_loss": -36.36858367919922, "global_step": 250827, "epoch": 2072} {"train_loss": -35.546749114990234, "global_step": 250828, "epoch": 2072} {"train_loss": -36.56576919555664, "global_step": 250829, "epoch": 2072} {"train_loss": -34.56272506713867, "global_step": 250830, "epoch": 2072} {"train_loss": -36.38422775268555, "global_step": 250831, "epoch": 2072} {"train_loss": -38.83314896418043, "global_step": 250832, "epoch": 2072, "val_loss": 2564923.75} {"train_loss": -36.999263763427734, "global_step": 250833, "epoch": 2073} {"train_loss": -37.69974899291992, "global_step": 250834, "epoch": 2073} {"train_loss": -36.958553314208984, "global_step": 250835, "epoch": 2073} {"train_loss": -37.28495407104492, "global_step": 250836, "epoch": 2073} {"train_loss": -38.11922073364258, "global_step": 250837, "epoch": 2073} {"train_loss": -38.52592849731445, "global_step": 250838, "epoch": 2073} {"train_loss": -38.43626403808594, "global_step": 250839, "epoch": 2073} {"train_loss": -37.59685134887695, "global_step": 250840, "epoch": 2073} {"train_loss": -37.759803771972656, "global_step": 250841, "epoch": 2073} {"train_loss": -38.0133171081543, "global_step": 250842, "epoch": 2073} {"train_loss": -37.14026641845703, "global_step": 250843, "epoch": 2073} {"train_loss": -38.28171920776367, "global_step": 250844, "epoch": 2073} {"train_loss": -37.6981086730957, "global_step": 250845, "epoch": 2073} {"train_loss": -37.02129364013672, "global_step": 250846, "epoch": 2073} {"train_loss": -38.34218978881836, "global_step": 250847, "epoch": 2073} {"train_loss": -38.17699432373047, "global_step": 250848, "epoch": 2073} {"train_loss": -37.82465744018555, "global_step": 250849, "epoch": 2073} {"train_loss": -38.7370719909668, "global_step": 250850, "epoch": 2073} {"train_loss": -39.52412414550781, "global_step": 250851, "epoch": 2073} {"train_loss": -37.688941955566406, "global_step": 250852, "epoch": 2073} {"train_loss": -37.80690383911133, "global_step": 250853, "epoch": 2073} {"train_loss": -38.92299270629883, "global_step": 250854, "epoch": 2073} {"train_loss": -38.789974212646484, "global_step": 250855, "epoch": 2073} {"train_loss": -38.2203254699707, "global_step": 250856, "epoch": 2073} {"train_loss": -38.38563919067383, "global_step": 250857, "epoch": 2073} {"train_loss": -37.839027404785156, "global_step": 250858, "epoch": 2073} {"train_loss": -39.3029670715332, "global_step": 250859, "epoch": 2073} {"train_loss": -38.528297424316406, "global_step": 250860, "epoch": 2073} {"train_loss": -40.04743576049805, "global_step": 250861, "epoch": 2073} {"train_loss": -39.66961669921875, "global_step": 250862, "epoch": 2073} {"train_loss": -38.63042068481445, "global_step": 250863, "epoch": 2073} {"train_loss": -39.666969299316406, "global_step": 250864, "epoch": 2073} {"train_loss": -39.572998046875, "global_step": 250865, "epoch": 2073} {"train_loss": -38.32447814941406, "global_step": 250866, "epoch": 2073} {"train_loss": -39.594451904296875, "global_step": 250867, "epoch": 2073} {"train_loss": -38.28837966918945, "global_step": 250868, "epoch": 2073} {"train_loss": -38.47793197631836, "global_step": 250869, "epoch": 2073} {"train_loss": -40.04781723022461, "global_step": 250870, "epoch": 2073} {"train_loss": -39.24241256713867, "global_step": 250871, "epoch": 2073} {"train_loss": -39.20632553100586, "global_step": 250872, "epoch": 2073} {"train_loss": -39.326942443847656, "global_step": 250873, "epoch": 2073} {"train_loss": -40.23257064819336, "global_step": 250874, "epoch": 2073} {"train_loss": -39.945899963378906, "global_step": 250875, "epoch": 2073} {"train_loss": -40.05785369873047, "global_step": 250876, "epoch": 2073} {"train_loss": -39.8037223815918, "global_step": 250877, "epoch": 2073} {"train_loss": -39.930198669433594, "global_step": 250878, "epoch": 2073} {"train_loss": -38.891441345214844, "global_step": 250879, "epoch": 2073} {"train_loss": -40.763763427734375, "global_step": 250880, "epoch": 2073} {"train_loss": -39.66372299194336, "global_step": 250881, "epoch": 2073} {"train_loss": -39.750755310058594, "global_step": 250882, "epoch": 2073} {"train_loss": -40.40829086303711, "global_step": 250883, "epoch": 2073} {"train_loss": -40.16539764404297, "global_step": 250884, "epoch": 2073} {"train_loss": -40.626949310302734, "global_step": 250885, "epoch": 2073} {"train_loss": -39.118587493896484, "global_step": 250886, "epoch": 2073} {"train_loss": -40.013824462890625, "global_step": 250887, "epoch": 2073} {"train_loss": -40.15999221801758, "global_step": 250888, "epoch": 2073} {"train_loss": -40.064239501953125, "global_step": 250889, "epoch": 2073} {"train_loss": -40.6481819152832, "global_step": 250890, "epoch": 2073} {"train_loss": -40.25625228881836, "global_step": 250891, "epoch": 2073} {"train_loss": -40.229270935058594, "global_step": 250892, "epoch": 2073} {"train_loss": -39.94314193725586, "global_step": 250893, "epoch": 2073} {"train_loss": -40.96099090576172, "global_step": 250894, "epoch": 2073} {"train_loss": -39.95530700683594, "global_step": 250895, "epoch": 2073} {"train_loss": -40.59220504760742, "global_step": 250896, "epoch": 2073} {"train_loss": -41.07860565185547, "global_step": 250897, "epoch": 2073} {"train_loss": -40.558448791503906, "global_step": 250898, "epoch": 2073} {"train_loss": -40.1732292175293, "global_step": 250899, "epoch": 2073} {"train_loss": -40.56324768066406, "global_step": 250900, "epoch": 2073} {"train_loss": -39.91545104980469, "global_step": 250901, "epoch": 2073} {"train_loss": -41.15704345703125, "global_step": 250902, "epoch": 2073} {"train_loss": -40.977535247802734, "global_step": 250903, "epoch": 2073} {"train_loss": -40.235050201416016, "global_step": 250904, "epoch": 2073} {"train_loss": -40.85287094116211, "global_step": 250905, "epoch": 2073} {"train_loss": -40.459468841552734, "global_step": 250906, "epoch": 2073} {"train_loss": -40.3624267578125, "global_step": 250907, "epoch": 2073} {"train_loss": -40.43804931640625, "global_step": 250908, "epoch": 2073} {"train_loss": -40.126373291015625, "global_step": 250909, "epoch": 2073} {"train_loss": -40.729087829589844, "global_step": 250910, "epoch": 2073} {"train_loss": -40.84820556640625, "global_step": 250911, "epoch": 2073} {"train_loss": -40.09440994262695, "global_step": 250912, "epoch": 2073} {"train_loss": -41.34320068359375, "global_step": 250913, "epoch": 2073} {"train_loss": -40.9449348449707, "global_step": 250914, "epoch": 2073} {"train_loss": -41.19291305541992, "global_step": 250915, "epoch": 2073} {"train_loss": -41.23646926879883, "global_step": 250916, "epoch": 2073} {"train_loss": -41.518768310546875, "global_step": 250917, "epoch": 2073} {"train_loss": -40.801944732666016, "global_step": 250918, "epoch": 2073} {"train_loss": -41.02177810668945, "global_step": 250919, "epoch": 2073} {"train_loss": -42.10114669799805, "global_step": 250920, "epoch": 2073} {"train_loss": -41.14684295654297, "global_step": 250921, "epoch": 2073} {"train_loss": -41.55547332763672, "global_step": 250922, "epoch": 2073} {"train_loss": -42.073036193847656, "global_step": 250923, "epoch": 2073} {"train_loss": -40.959266662597656, "global_step": 250924, "epoch": 2073} {"train_loss": -40.53424072265625, "global_step": 250925, "epoch": 2073} {"train_loss": -41.64306640625, "global_step": 250926, "epoch": 2073} {"train_loss": -40.71223068237305, "global_step": 250927, "epoch": 2073} {"train_loss": -40.24397659301758, "global_step": 250928, "epoch": 2073} {"train_loss": -40.94504928588867, "global_step": 250929, "epoch": 2073} {"train_loss": -41.12963104248047, "global_step": 250930, "epoch": 2073} {"train_loss": -41.58604049682617, "global_step": 250931, "epoch": 2073} {"train_loss": -41.735694885253906, "global_step": 250932, "epoch": 2073} {"train_loss": -42.47952651977539, "global_step": 250933, "epoch": 2073} {"train_loss": -41.064632415771484, "global_step": 250934, "epoch": 2073} {"train_loss": -41.68389892578125, "global_step": 250935, "epoch": 2073} {"train_loss": -41.577205657958984, "global_step": 250936, "epoch": 2073} {"train_loss": -40.83425521850586, "global_step": 250937, "epoch": 2073} {"train_loss": -42.09572219848633, "global_step": 250938, "epoch": 2073} {"train_loss": -42.36104965209961, "global_step": 250939, "epoch": 2073} {"train_loss": -42.17082977294922, "global_step": 250940, "epoch": 2073} {"train_loss": -41.73126983642578, "global_step": 250941, "epoch": 2073} {"train_loss": -41.4268913269043, "global_step": 250942, "epoch": 2073} {"train_loss": -41.97919845581055, "global_step": 250943, "epoch": 2073} {"train_loss": -41.42001724243164, "global_step": 250944, "epoch": 2073} {"train_loss": -41.81840896606445, "global_step": 250945, "epoch": 2073} {"train_loss": -41.60011672973633, "global_step": 250946, "epoch": 2073} {"train_loss": -41.39108657836914, "global_step": 250947, "epoch": 2073} {"train_loss": -42.60266876220703, "global_step": 250948, "epoch": 2073} {"train_loss": -41.98299789428711, "global_step": 250949, "epoch": 2073} {"train_loss": -41.75263977050781, "global_step": 250950, "epoch": 2073} {"train_loss": -42.10441589355469, "global_step": 250951, "epoch": 2073} {"train_loss": -42.187660217285156, "global_step": 250952, "epoch": 2073} {"train_loss": -40.070963394543355, "global_step": 250953, "epoch": 2073, "val_loss": 2643291.75} {"train_loss": -41.47268295288086, "global_step": 250954, "epoch": 2074} {"train_loss": -41.77858352661133, "global_step": 250955, "epoch": 2074} {"train_loss": -41.30878448486328, "global_step": 250956, "epoch": 2074} {"train_loss": -42.54248046875, "global_step": 250957, "epoch": 2074} {"train_loss": -41.9406623840332, "global_step": 250958, "epoch": 2074} {"train_loss": -41.38923263549805, "global_step": 250959, "epoch": 2074} {"train_loss": -42.357398986816406, "global_step": 250960, "epoch": 2074} {"train_loss": -41.75472640991211, "global_step": 250961, "epoch": 2074} {"train_loss": -42.1473274230957, "global_step": 250962, "epoch": 2074} {"train_loss": -42.385650634765625, "global_step": 250963, "epoch": 2074} {"train_loss": -42.136016845703125, "global_step": 250964, "epoch": 2074} {"train_loss": -41.70145797729492, "global_step": 250965, "epoch": 2074} {"train_loss": -42.46892547607422, "global_step": 250966, "epoch": 2074} {"train_loss": -42.432037353515625, "global_step": 250967, "epoch": 2074} {"train_loss": -41.67658233642578, "global_step": 250968, "epoch": 2074} {"train_loss": -42.16559982299805, "global_step": 250969, "epoch": 2074} {"train_loss": -42.426795959472656, "global_step": 250970, "epoch": 2074} {"train_loss": -41.94347381591797, "global_step": 250971, "epoch": 2074} {"train_loss": -42.224449157714844, "global_step": 250972, "epoch": 2074} {"train_loss": -42.786537170410156, "global_step": 250973, "epoch": 2074} {"train_loss": -42.545372009277344, "global_step": 250974, "epoch": 2074} {"train_loss": -41.71519088745117, "global_step": 250975, "epoch": 2074} {"train_loss": -42.3659782409668, "global_step": 250976, "epoch": 2074} {"train_loss": -41.4715690612793, "global_step": 250977, "epoch": 2074} {"train_loss": -40.22063446044922, "global_step": 250978, "epoch": 2074} {"train_loss": -41.41304397583008, "global_step": 250979, "epoch": 2074} {"train_loss": -41.92145919799805, "global_step": 250980, "epoch": 2074} {"train_loss": -41.696563720703125, "global_step": 250981, "epoch": 2074} {"train_loss": -40.91936492919922, "global_step": 250982, "epoch": 2074} {"train_loss": -42.39765548706055, "global_step": 250983, "epoch": 2074} {"train_loss": -41.5638542175293, "global_step": 250984, "epoch": 2074} {"train_loss": -40.539920806884766, "global_step": 250985, "epoch": 2074} {"train_loss": -41.63258743286133, "global_step": 250986, "epoch": 2074} {"train_loss": -42.23435592651367, "global_step": 250987, "epoch": 2074} {"train_loss": -41.9306526184082, "global_step": 250988, "epoch": 2074} {"train_loss": -41.78657913208008, "global_step": 250989, "epoch": 2074} {"train_loss": -40.97674560546875, "global_step": 250990, "epoch": 2074} {"train_loss": -41.685062408447266, "global_step": 250991, "epoch": 2074} {"train_loss": -41.542884826660156, "global_step": 250992, "epoch": 2074} {"train_loss": -41.7973747253418, "global_step": 250993, "epoch": 2074} {"train_loss": -42.21668243408203, "global_step": 250994, "epoch": 2074} {"train_loss": -42.166900634765625, "global_step": 250995, "epoch": 2074} {"train_loss": -41.36762619018555, "global_step": 250996, "epoch": 2074} {"train_loss": -42.39481735229492, "global_step": 250997, "epoch": 2074} {"train_loss": -41.93842697143555, "global_step": 250998, "epoch": 2074} {"train_loss": -41.470458984375, "global_step": 250999, "epoch": 2074} {"train_loss": -41.07441329956055, "global_step": 251000, "epoch": 2074} {"train_loss": -41.066017150878906, "global_step": 251001, "epoch": 2074} {"train_loss": -41.577606201171875, "global_step": 251002, "epoch": 2074} {"train_loss": -41.85721969604492, "global_step": 251003, "epoch": 2074} {"train_loss": -40.9273796081543, "global_step": 251004, "epoch": 2074} {"train_loss": -41.54238510131836, "global_step": 251005, "epoch": 2074} {"train_loss": -41.194515228271484, "global_step": 251006, "epoch": 2074} {"train_loss": -41.270057678222656, "global_step": 251007, "epoch": 2074} {"train_loss": -41.61094284057617, "global_step": 251008, "epoch": 2074} {"train_loss": -41.55149459838867, "global_step": 251009, "epoch": 2074} {"train_loss": -41.5550651550293, "global_step": 251010, "epoch": 2074} {"train_loss": -40.9847526550293, "global_step": 251011, "epoch": 2074} {"train_loss": -41.3067741394043, "global_step": 251012, "epoch": 2074} {"train_loss": -41.56838607788086, "global_step": 251013, "epoch": 2074} {"train_loss": -40.19637680053711, "global_step": 251014, "epoch": 2074} {"train_loss": -39.65643310546875, "global_step": 251015, "epoch": 2074} {"train_loss": -40.72021484375, "global_step": 251016, "epoch": 2074} {"train_loss": -40.7575569152832, "global_step": 251017, "epoch": 2074} {"train_loss": -41.52667236328125, "global_step": 251018, "epoch": 2074} {"train_loss": -41.218482971191406, "global_step": 251019, "epoch": 2074} {"train_loss": -41.6818733215332, "global_step": 251020, "epoch": 2074} {"train_loss": -41.383941650390625, "global_step": 251021, "epoch": 2074} {"train_loss": -42.117401123046875, "global_step": 251022, "epoch": 2074} {"train_loss": -40.99062728881836, "global_step": 251023, "epoch": 2074} {"train_loss": -42.13386154174805, "global_step": 251024, "epoch": 2074} {"train_loss": -41.607147216796875, "global_step": 251025, "epoch": 2074} {"train_loss": -40.918678283691406, "global_step": 251026, "epoch": 2074} {"train_loss": -41.721282958984375, "global_step": 251027, "epoch": 2074} {"train_loss": -40.98223114013672, "global_step": 251028, "epoch": 2074} {"train_loss": -41.715126037597656, "global_step": 251029, "epoch": 2074} {"train_loss": -42.09835433959961, "global_step": 251030, "epoch": 2074} {"train_loss": -41.04262161254883, "global_step": 251031, "epoch": 2074} {"train_loss": -41.72343826293945, "global_step": 251032, "epoch": 2074} {"train_loss": -41.672882080078125, "global_step": 251033, "epoch": 2074} {"train_loss": -41.831260681152344, "global_step": 251034, "epoch": 2074} {"train_loss": -42.223609924316406, "global_step": 251035, "epoch": 2074} {"train_loss": -42.07339096069336, "global_step": 251036, "epoch": 2074} {"train_loss": -42.198280334472656, "global_step": 251037, "epoch": 2074} {"train_loss": -42.199440002441406, "global_step": 251038, "epoch": 2074} {"train_loss": -41.33388137817383, "global_step": 251039, "epoch": 2074} {"train_loss": -41.388336181640625, "global_step": 251040, "epoch": 2074} {"train_loss": -40.97698974609375, "global_step": 251041, "epoch": 2074} {"train_loss": -41.32912826538086, "global_step": 251042, "epoch": 2074} {"train_loss": -41.77511978149414, "global_step": 251043, "epoch": 2074} {"train_loss": -41.365577697753906, "global_step": 251044, "epoch": 2074} {"train_loss": -41.51369857788086, "global_step": 251045, "epoch": 2074} {"train_loss": -42.46470642089844, "global_step": 251046, "epoch": 2074} {"train_loss": -41.43766403198242, "global_step": 251047, "epoch": 2074} {"train_loss": -41.8700065612793, "global_step": 251048, "epoch": 2074} {"train_loss": -41.73344802856445, "global_step": 251049, "epoch": 2074} {"train_loss": -38.49768829345703, "global_step": 251050, "epoch": 2074} {"train_loss": -41.38848114013672, "global_step": 251051, "epoch": 2074} {"train_loss": -41.1396484375, "global_step": 251052, "epoch": 2074} {"train_loss": -42.49298858642578, "global_step": 251053, "epoch": 2074} {"train_loss": -40.88499450683594, "global_step": 251054, "epoch": 2074} {"train_loss": -42.75327682495117, "global_step": 251055, "epoch": 2074} {"train_loss": -41.737892150878906, "global_step": 251056, "epoch": 2074} {"train_loss": -42.727081298828125, "global_step": 251057, "epoch": 2074} {"train_loss": -42.10531234741211, "global_step": 251058, "epoch": 2074} {"train_loss": -42.41769790649414, "global_step": 251059, "epoch": 2074} {"train_loss": -41.992225646972656, "global_step": 251060, "epoch": 2074} {"train_loss": -42.6110954284668, "global_step": 251061, "epoch": 2074} {"train_loss": -42.11897659301758, "global_step": 251062, "epoch": 2074} {"train_loss": -42.239620208740234, "global_step": 251063, "epoch": 2074} {"train_loss": -42.44486618041992, "global_step": 251064, "epoch": 2074} {"train_loss": -42.90266799926758, "global_step": 251065, "epoch": 2074} {"train_loss": -41.788265228271484, "global_step": 251066, "epoch": 2074} {"train_loss": -42.847564697265625, "global_step": 251067, "epoch": 2074} {"train_loss": -42.29331588745117, "global_step": 251068, "epoch": 2074} {"train_loss": -42.37080383300781, "global_step": 251069, "epoch": 2074} {"train_loss": -40.990970611572266, "global_step": 251070, "epoch": 2074} {"train_loss": -41.4945182800293, "global_step": 251071, "epoch": 2074} {"train_loss": -42.399715423583984, "global_step": 251072, "epoch": 2074} {"train_loss": -42.6931266784668, "global_step": 251073, "epoch": 2074} {"train_loss": -41.709776507921454, "global_step": 251074, "epoch": 2074, "val_loss": 2650368.75} {"train_loss": -40.798099517822266, "global_step": 251075, "epoch": 2075} {"train_loss": -38.02384567260742, "global_step": 251076, "epoch": 2075} {"train_loss": -30.736536026000977, "global_step": 251077, "epoch": 2075} {"train_loss": -35.803558349609375, "global_step": 251078, "epoch": 2075} {"train_loss": -41.58444595336914, "global_step": 251079, "epoch": 2075} {"train_loss": -36.05152130126953, "global_step": 251080, "epoch": 2075} {"train_loss": -35.0622673034668, "global_step": 251081, "epoch": 2075} {"train_loss": -41.42940902709961, "global_step": 251082, "epoch": 2075} {"train_loss": -35.495975494384766, "global_step": 251083, "epoch": 2075} {"train_loss": -40.89260482788086, "global_step": 251084, "epoch": 2075} {"train_loss": -37.83711624145508, "global_step": 251085, "epoch": 2075} {"train_loss": -37.4154167175293, "global_step": 251086, "epoch": 2075} {"train_loss": -41.70054244995117, "global_step": 251087, "epoch": 2075} {"train_loss": -37.62504959106445, "global_step": 251088, "epoch": 2075} {"train_loss": -39.81553268432617, "global_step": 251089, "epoch": 2075} {"train_loss": -38.0159797668457, "global_step": 251090, "epoch": 2075} {"train_loss": -40.1706657409668, "global_step": 251091, "epoch": 2075} {"train_loss": -40.08217239379883, "global_step": 251092, "epoch": 2075} {"train_loss": -40.823970794677734, "global_step": 251093, "epoch": 2075} {"train_loss": -40.600765228271484, "global_step": 251094, "epoch": 2075} {"train_loss": -41.756710052490234, "global_step": 251095, "epoch": 2075} {"train_loss": -39.89512252807617, "global_step": 251096, "epoch": 2075} {"train_loss": -41.36808776855469, "global_step": 251097, "epoch": 2075} {"train_loss": -40.512306213378906, "global_step": 251098, "epoch": 2075} {"train_loss": -41.35211944580078, "global_step": 251099, "epoch": 2075} {"train_loss": -42.04237747192383, "global_step": 251100, "epoch": 2075} {"train_loss": -41.92416000366211, "global_step": 251101, "epoch": 2075} {"train_loss": -41.55799102783203, "global_step": 251102, "epoch": 2075} {"train_loss": -41.168426513671875, "global_step": 251103, "epoch": 2075} {"train_loss": -41.44334030151367, "global_step": 251104, "epoch": 2075} {"train_loss": -40.532955169677734, "global_step": 251105, "epoch": 2075} {"train_loss": -41.52436065673828, "global_step": 251106, "epoch": 2075} {"train_loss": -41.289955139160156, "global_step": 251107, "epoch": 2075} {"train_loss": -41.85459518432617, "global_step": 251108, "epoch": 2075} {"train_loss": -41.59359359741211, "global_step": 251109, "epoch": 2075} {"train_loss": -41.58207321166992, "global_step": 251110, "epoch": 2075} {"train_loss": -41.1543083190918, "global_step": 251111, "epoch": 2075} {"train_loss": -42.4356803894043, "global_step": 251112, "epoch": 2075} {"train_loss": -41.37348556518555, "global_step": 251113, "epoch": 2075} {"train_loss": -41.475799560546875, "global_step": 251114, "epoch": 2075} {"train_loss": -41.46266555786133, "global_step": 251115, "epoch": 2075} {"train_loss": -42.24346923828125, "global_step": 251116, "epoch": 2075} {"train_loss": -42.48091506958008, "global_step": 251117, "epoch": 2075} {"train_loss": -42.16667938232422, "global_step": 251118, "epoch": 2075} {"train_loss": -42.28902816772461, "global_step": 251119, "epoch": 2075} {"train_loss": -42.28034591674805, "global_step": 251120, "epoch": 2075} {"train_loss": -42.100032806396484, "global_step": 251121, "epoch": 2075} {"train_loss": -42.51155090332031, "global_step": 251122, "epoch": 2075} {"train_loss": -42.72874069213867, "global_step": 251123, "epoch": 2075} {"train_loss": -42.1644287109375, "global_step": 251124, "epoch": 2075} {"train_loss": -42.79073715209961, "global_step": 251125, "epoch": 2075} {"train_loss": -42.525001525878906, "global_step": 251126, "epoch": 2075} {"train_loss": -42.147762298583984, "global_step": 251127, "epoch": 2075} {"train_loss": -42.45724868774414, "global_step": 251128, "epoch": 2075} {"train_loss": -42.35724639892578, "global_step": 251129, "epoch": 2075} {"train_loss": -42.89547348022461, "global_step": 251130, "epoch": 2075} {"train_loss": -42.37008285522461, "global_step": 251131, "epoch": 2075} {"train_loss": -42.70527267456055, "global_step": 251132, "epoch": 2075} {"train_loss": -42.024635314941406, "global_step": 251133, "epoch": 2075} {"train_loss": -42.66543197631836, "global_step": 251134, "epoch": 2075} {"train_loss": -42.02311325073242, "global_step": 251135, "epoch": 2075} {"train_loss": -42.82489776611328, "global_step": 251136, "epoch": 2075} {"train_loss": -43.17195510864258, "global_step": 251137, "epoch": 2075} {"train_loss": -43.6038818359375, "global_step": 251138, "epoch": 2075} {"train_loss": -42.67510986328125, "global_step": 251139, "epoch": 2075} {"train_loss": -42.92817306518555, "global_step": 251140, "epoch": 2075} {"train_loss": -42.18424987792969, "global_step": 251141, "epoch": 2075} {"train_loss": -43.184539794921875, "global_step": 251142, "epoch": 2075} {"train_loss": -43.2087287902832, "global_step": 251143, "epoch": 2075} {"train_loss": -42.727760314941406, "global_step": 251144, "epoch": 2075} {"train_loss": -43.413543701171875, "global_step": 251145, "epoch": 2075} {"train_loss": -42.76978302001953, "global_step": 251146, "epoch": 2075} {"train_loss": -42.14089584350586, "global_step": 251147, "epoch": 2075} {"train_loss": -42.592918395996094, "global_step": 251148, "epoch": 2075} {"train_loss": -43.346309661865234, "global_step": 251149, "epoch": 2075} {"train_loss": -43.212459564208984, "global_step": 251150, "epoch": 2075} {"train_loss": -42.4205322265625, "global_step": 251151, "epoch": 2075} {"train_loss": -42.651302337646484, "global_step": 251152, "epoch": 2075} {"train_loss": -43.00557327270508, "global_step": 251153, "epoch": 2075} {"train_loss": -43.071083068847656, "global_step": 251154, "epoch": 2075} {"train_loss": -42.509727478027344, "global_step": 251155, "epoch": 2075} {"train_loss": -42.814002990722656, "global_step": 251156, "epoch": 2075} {"train_loss": -43.56979751586914, "global_step": 251157, "epoch": 2075} {"train_loss": -43.3975830078125, "global_step": 251158, "epoch": 2075} {"train_loss": -42.43740463256836, "global_step": 251159, "epoch": 2075} {"train_loss": -42.89690017700195, "global_step": 251160, "epoch": 2075} {"train_loss": -42.9225959777832, "global_step": 251161, "epoch": 2075} {"train_loss": -42.738338470458984, "global_step": 251162, "epoch": 2075} {"train_loss": -43.15167999267578, "global_step": 251163, "epoch": 2075} {"train_loss": -43.28323745727539, "global_step": 251164, "epoch": 2075} {"train_loss": -42.73505783081055, "global_step": 251165, "epoch": 2075} {"train_loss": -43.41794967651367, "global_step": 251166, "epoch": 2075} {"train_loss": -42.304664611816406, "global_step": 251167, "epoch": 2075} {"train_loss": -43.32474899291992, "global_step": 251168, "epoch": 2075} {"train_loss": -43.644290924072266, "global_step": 251169, "epoch": 2075} {"train_loss": -41.27888107299805, "global_step": 251170, "epoch": 2075} {"train_loss": -39.40937042236328, "global_step": 251171, "epoch": 2075} {"train_loss": -42.29987716674805, "global_step": 251172, "epoch": 2075} {"train_loss": -42.51161575317383, "global_step": 251173, "epoch": 2075} {"train_loss": -41.79056167602539, "global_step": 251174, "epoch": 2075} {"train_loss": -42.7130126953125, "global_step": 251175, "epoch": 2075} {"train_loss": -42.073402404785156, "global_step": 251176, "epoch": 2075} {"train_loss": -42.982505798339844, "global_step": 251177, "epoch": 2075} {"train_loss": -41.306880950927734, "global_step": 251178, "epoch": 2075} {"train_loss": -41.647945404052734, "global_step": 251179, "epoch": 2075} {"train_loss": -41.565338134765625, "global_step": 251180, "epoch": 2075} {"train_loss": -42.625892639160156, "global_step": 251181, "epoch": 2075} {"train_loss": -42.63111877441406, "global_step": 251182, "epoch": 2075} {"train_loss": -41.5548210144043, "global_step": 251183, "epoch": 2075} {"train_loss": -41.28572082519531, "global_step": 251184, "epoch": 2075} {"train_loss": -42.06510543823242, "global_step": 251185, "epoch": 2075} {"train_loss": -41.76007080078125, "global_step": 251186, "epoch": 2075} {"train_loss": -41.78884506225586, "global_step": 251187, "epoch": 2075} {"train_loss": -42.76401901245117, "global_step": 251188, "epoch": 2075} {"train_loss": -42.728515625, "global_step": 251189, "epoch": 2075} {"train_loss": -41.87873077392578, "global_step": 251190, "epoch": 2075} {"train_loss": -40.119754791259766, "global_step": 251191, "epoch": 2075} {"train_loss": -41.4949836730957, "global_step": 251192, "epoch": 2075} {"train_loss": -41.25503158569336, "global_step": 251193, "epoch": 2075} {"train_loss": -39.24868392944336, "global_step": 251194, "epoch": 2075} {"train_loss": -41.58046424487406, "global_step": 251195, "epoch": 2075, "val_loss": 2643810.75} {"train_loss": -40.620670318603516, "global_step": 251196, "epoch": 2076} {"train_loss": -40.78683090209961, "global_step": 251197, "epoch": 2076} {"train_loss": -41.861785888671875, "global_step": 251198, "epoch": 2076} {"train_loss": -40.92354202270508, "global_step": 251199, "epoch": 2076} {"train_loss": -40.96371078491211, "global_step": 251200, "epoch": 2076} {"train_loss": -41.86003875732422, "global_step": 251201, "epoch": 2076} {"train_loss": -41.018104553222656, "global_step": 251202, "epoch": 2076} {"train_loss": -36.3031120300293, "global_step": 251203, "epoch": 2076} {"train_loss": -32.769142150878906, "global_step": 251204, "epoch": 2076} {"train_loss": -32.11759567260742, "global_step": 251205, "epoch": 2076} {"train_loss": -39.7475700378418, "global_step": 251206, "epoch": 2076} {"train_loss": -38.43511199951172, "global_step": 251207, "epoch": 2076} {"train_loss": -35.98237609863281, "global_step": 251208, "epoch": 2076} {"train_loss": -39.7927360534668, "global_step": 251209, "epoch": 2076} {"train_loss": -38.46247100830078, "global_step": 251210, "epoch": 2076} {"train_loss": -39.101844787597656, "global_step": 251211, "epoch": 2076} {"train_loss": -40.29449462890625, "global_step": 251212, "epoch": 2076} {"train_loss": -40.39905548095703, "global_step": 251213, "epoch": 2076} {"train_loss": -40.99937057495117, "global_step": 251214, "epoch": 2076} {"train_loss": -40.65675735473633, "global_step": 251215, "epoch": 2076} {"train_loss": -41.76569747924805, "global_step": 251216, "epoch": 2076} {"train_loss": -41.222572326660156, "global_step": 251217, "epoch": 2076} {"train_loss": -41.5918083190918, "global_step": 251218, "epoch": 2076} {"train_loss": -40.21761703491211, "global_step": 251219, "epoch": 2076} {"train_loss": -42.76423263549805, "global_step": 251220, "epoch": 2076} {"train_loss": -40.20469284057617, "global_step": 251221, "epoch": 2076} {"train_loss": -41.54095458984375, "global_step": 251222, "epoch": 2076} {"train_loss": -41.90665817260742, "global_step": 251223, "epoch": 2076} {"train_loss": -41.28257751464844, "global_step": 251224, "epoch": 2076} {"train_loss": -41.397789001464844, "global_step": 251225, "epoch": 2076} {"train_loss": -42.87282180786133, "global_step": 251226, "epoch": 2076} {"train_loss": -41.49276351928711, "global_step": 251227, "epoch": 2076} {"train_loss": -42.21405029296875, "global_step": 251228, "epoch": 2076} {"train_loss": -41.879920959472656, "global_step": 251229, "epoch": 2076} {"train_loss": -42.94671630859375, "global_step": 251230, "epoch": 2076} {"train_loss": -41.02147674560547, "global_step": 251231, "epoch": 2076} {"train_loss": -42.046993255615234, "global_step": 251232, "epoch": 2076} {"train_loss": -40.89175033569336, "global_step": 251233, "epoch": 2076} {"train_loss": -40.69829177856445, "global_step": 251234, "epoch": 2076} {"train_loss": -41.439998626708984, "global_step": 251235, "epoch": 2076} {"train_loss": -42.269893646240234, "global_step": 251236, "epoch": 2076} {"train_loss": -41.82888412475586, "global_step": 251237, "epoch": 2076} {"train_loss": -41.505096435546875, "global_step": 251238, "epoch": 2076} {"train_loss": -41.44854736328125, "global_step": 251239, "epoch": 2076} {"train_loss": -42.77785873413086, "global_step": 251240, "epoch": 2076} {"train_loss": -42.02116012573242, "global_step": 251241, "epoch": 2076} {"train_loss": -42.33160400390625, "global_step": 251242, "epoch": 2076} {"train_loss": -42.25891876220703, "global_step": 251243, "epoch": 2076} {"train_loss": -42.09931945800781, "global_step": 251244, "epoch": 2076} {"train_loss": -41.73971176147461, "global_step": 251245, "epoch": 2076} {"train_loss": -42.08435821533203, "global_step": 251246, "epoch": 2076} {"train_loss": -42.42701721191406, "global_step": 251247, "epoch": 2076} {"train_loss": -42.51327133178711, "global_step": 251248, "epoch": 2076} {"train_loss": -42.430728912353516, "global_step": 251249, "epoch": 2076} {"train_loss": -42.93717956542969, "global_step": 251250, "epoch": 2076} {"train_loss": -42.2978630065918, "global_step": 251251, "epoch": 2076} {"train_loss": -43.01001739501953, "global_step": 251252, "epoch": 2076} {"train_loss": -42.842689514160156, "global_step": 251253, "epoch": 2076} {"train_loss": -42.56411361694336, "global_step": 251254, "epoch": 2076} {"train_loss": -43.26792526245117, "global_step": 251255, "epoch": 2076} {"train_loss": -42.58106231689453, "global_step": 251256, "epoch": 2076} {"train_loss": -42.959232330322266, "global_step": 251257, "epoch": 2076} {"train_loss": -43.06683349609375, "global_step": 251258, "epoch": 2076} {"train_loss": -42.58940887451172, "global_step": 251259, "epoch": 2076} {"train_loss": -43.12467956542969, "global_step": 251260, "epoch": 2076} {"train_loss": -41.899986267089844, "global_step": 251261, "epoch": 2076} {"train_loss": -43.054473876953125, "global_step": 251262, "epoch": 2076} {"train_loss": -43.19272232055664, "global_step": 251263, "epoch": 2076} {"train_loss": -41.983154296875, "global_step": 251264, "epoch": 2076} {"train_loss": -42.65914535522461, "global_step": 251265, "epoch": 2076} {"train_loss": -43.220272064208984, "global_step": 251266, "epoch": 2076} {"train_loss": -43.19526290893555, "global_step": 251267, "epoch": 2076} {"train_loss": -43.4011344909668, "global_step": 251268, "epoch": 2076} {"train_loss": -43.0385856628418, "global_step": 251269, "epoch": 2076} {"train_loss": -43.21209716796875, "global_step": 251270, "epoch": 2076} {"train_loss": -43.328369140625, "global_step": 251271, "epoch": 2076} {"train_loss": -43.85997009277344, "global_step": 251272, "epoch": 2076} {"train_loss": -43.320899963378906, "global_step": 251273, "epoch": 2076} {"train_loss": -42.90400695800781, "global_step": 251274, "epoch": 2076} {"train_loss": -43.57349395751953, "global_step": 251275, "epoch": 2076} {"train_loss": -42.67045593261719, "global_step": 251276, "epoch": 2076} {"train_loss": -43.157833099365234, "global_step": 251277, "epoch": 2076} {"train_loss": -43.41646194458008, "global_step": 251278, "epoch": 2076} {"train_loss": -42.984596252441406, "global_step": 251279, "epoch": 2076} {"train_loss": -43.325992584228516, "global_step": 251280, "epoch": 2076} {"train_loss": -42.389549255371094, "global_step": 251281, "epoch": 2076} {"train_loss": -42.4925422668457, "global_step": 251282, "epoch": 2076} {"train_loss": -43.222312927246094, "global_step": 251283, "epoch": 2076} {"train_loss": -43.4599494934082, "global_step": 251284, "epoch": 2076} {"train_loss": -43.53640365600586, "global_step": 251285, "epoch": 2076} {"train_loss": -43.41303634643555, "global_step": 251286, "epoch": 2076} {"train_loss": -43.16217803955078, "global_step": 251287, "epoch": 2076} {"train_loss": -43.48214340209961, "global_step": 251288, "epoch": 2076} {"train_loss": -43.523406982421875, "global_step": 251289, "epoch": 2076} {"train_loss": -43.83945846557617, "global_step": 251290, "epoch": 2076} {"train_loss": -43.251678466796875, "global_step": 251291, "epoch": 2076} {"train_loss": -42.916908264160156, "global_step": 251292, "epoch": 2076} {"train_loss": -43.710693359375, "global_step": 251293, "epoch": 2076} {"train_loss": -43.139930725097656, "global_step": 251294, "epoch": 2076} {"train_loss": -43.57236862182617, "global_step": 251295, "epoch": 2076} {"train_loss": -42.956111907958984, "global_step": 251296, "epoch": 2076} {"train_loss": -43.82518768310547, "global_step": 251297, "epoch": 2076} {"train_loss": -40.55451583862305, "global_step": 251298, "epoch": 2076} {"train_loss": -43.018192291259766, "global_step": 251299, "epoch": 2076} {"train_loss": -43.07369613647461, "global_step": 251300, "epoch": 2076} {"train_loss": -43.43403625488281, "global_step": 251301, "epoch": 2076} {"train_loss": -43.717647552490234, "global_step": 251302, "epoch": 2076} {"train_loss": -43.676734924316406, "global_step": 251303, "epoch": 2076} {"train_loss": -43.19145584106445, "global_step": 251304, "epoch": 2076} {"train_loss": -43.23759078979492, "global_step": 251305, "epoch": 2076} {"train_loss": -43.179866790771484, "global_step": 251306, "epoch": 2076} {"train_loss": -42.398353576660156, "global_step": 251307, "epoch": 2076} {"train_loss": -43.81605529785156, "global_step": 251308, "epoch": 2076} {"train_loss": -42.62484359741211, "global_step": 251309, "epoch": 2076} {"train_loss": -42.3657341003418, "global_step": 251310, "epoch": 2076} {"train_loss": -42.842124938964844, "global_step": 251311, "epoch": 2076} {"train_loss": -42.733699798583984, "global_step": 251312, "epoch": 2076} {"train_loss": -43.41023635864258, "global_step": 251313, "epoch": 2076} {"train_loss": -42.76325988769531, "global_step": 251314, "epoch": 2076} {"train_loss": -43.19791030883789, "global_step": 251315, "epoch": 2076} {"train_loss": -42.049110412597656, "global_step": 251316, "epoch": 2076, "val_loss": 2660058.25} {"train_loss": -43.5794563293457, "global_step": 251317, "epoch": 2077} {"train_loss": -43.69804763793945, "global_step": 251318, "epoch": 2077} {"train_loss": -41.418697357177734, "global_step": 251319, "epoch": 2077} {"train_loss": -43.1400260925293, "global_step": 251320, "epoch": 2077} {"train_loss": -43.249794006347656, "global_step": 251321, "epoch": 2077} {"train_loss": -42.501220703125, "global_step": 251322, "epoch": 2077} {"train_loss": -42.41433334350586, "global_step": 251323, "epoch": 2077} {"train_loss": -43.4116096496582, "global_step": 251324, "epoch": 2077} {"train_loss": -39.353633880615234, "global_step": 251325, "epoch": 2077} {"train_loss": -42.760597229003906, "global_step": 251326, "epoch": 2077} {"train_loss": -41.3046875, "global_step": 251327, "epoch": 2077} {"train_loss": -41.08810806274414, "global_step": 251328, "epoch": 2077} {"train_loss": -42.74555587768555, "global_step": 251329, "epoch": 2077} {"train_loss": -37.42887496948242, "global_step": 251330, "epoch": 2077} {"train_loss": -42.87633514404297, "global_step": 251331, "epoch": 2077} {"train_loss": -40.64384078979492, "global_step": 251332, "epoch": 2077} {"train_loss": -41.06742858886719, "global_step": 251333, "epoch": 2077} {"train_loss": -43.03975296020508, "global_step": 251334, "epoch": 2077} {"train_loss": -41.40086364746094, "global_step": 251335, "epoch": 2077} {"train_loss": -42.20041275024414, "global_step": 251336, "epoch": 2077} {"train_loss": -42.521751403808594, "global_step": 251337, "epoch": 2077} {"train_loss": -41.78535079956055, "global_step": 251338, "epoch": 2077} {"train_loss": -41.713993072509766, "global_step": 251339, "epoch": 2077} {"train_loss": -41.98661422729492, "global_step": 251340, "epoch": 2077} {"train_loss": -41.59316635131836, "global_step": 251341, "epoch": 2077} {"train_loss": -42.05184555053711, "global_step": 251342, "epoch": 2077} {"train_loss": -40.639888763427734, "global_step": 251343, "epoch": 2077} {"train_loss": -41.63454055786133, "global_step": 251344, "epoch": 2077} {"train_loss": -41.50164794921875, "global_step": 251345, "epoch": 2077} {"train_loss": -42.239410400390625, "global_step": 251346, "epoch": 2077} {"train_loss": -42.64646911621094, "global_step": 251347, "epoch": 2077} {"train_loss": -41.13908004760742, "global_step": 251348, "epoch": 2077} {"train_loss": -41.459922790527344, "global_step": 251349, "epoch": 2077} {"train_loss": -40.94104766845703, "global_step": 251350, "epoch": 2077} {"train_loss": -42.03856658935547, "global_step": 251351, "epoch": 2077} {"train_loss": -41.25780487060547, "global_step": 251352, "epoch": 2077} {"train_loss": -41.929012298583984, "global_step": 251353, "epoch": 2077} {"train_loss": -37.46373748779297, "global_step": 251354, "epoch": 2077} {"train_loss": -31.178104400634766, "global_step": 251355, "epoch": 2077} {"train_loss": -38.78175735473633, "global_step": 251356, "epoch": 2077} {"train_loss": -41.51735305786133, "global_step": 251357, "epoch": 2077} {"train_loss": -41.45452880859375, "global_step": 251358, "epoch": 2077} {"train_loss": -40.46163558959961, "global_step": 251359, "epoch": 2077} {"train_loss": -40.557674407958984, "global_step": 251360, "epoch": 2077} {"train_loss": -40.18416213989258, "global_step": 251361, "epoch": 2077} {"train_loss": -40.433067321777344, "global_step": 251362, "epoch": 2077} {"train_loss": -38.54684066772461, "global_step": 251363, "epoch": 2077} {"train_loss": -41.299652099609375, "global_step": 251364, "epoch": 2077} {"train_loss": -39.56109619140625, "global_step": 251365, "epoch": 2077} {"train_loss": -41.456878662109375, "global_step": 251366, "epoch": 2077} {"train_loss": -41.1292839050293, "global_step": 251367, "epoch": 2077} {"train_loss": -41.749996185302734, "global_step": 251368, "epoch": 2077} {"train_loss": -40.4428825378418, "global_step": 251369, "epoch": 2077} {"train_loss": -40.70551681518555, "global_step": 251370, "epoch": 2077} {"train_loss": -39.77875900268555, "global_step": 251371, "epoch": 2077} {"train_loss": -39.852821350097656, "global_step": 251372, "epoch": 2077} {"train_loss": -40.71352005004883, "global_step": 251373, "epoch": 2077} {"train_loss": -42.03915023803711, "global_step": 251374, "epoch": 2077} {"train_loss": -37.42438507080078, "global_step": 251375, "epoch": 2077} {"train_loss": -38.945858001708984, "global_step": 251376, "epoch": 2077} {"train_loss": -41.878944396972656, "global_step": 251377, "epoch": 2077} {"train_loss": -41.58382797241211, "global_step": 251378, "epoch": 2077} {"train_loss": -41.8765869140625, "global_step": 251379, "epoch": 2077} {"train_loss": -40.58122253417969, "global_step": 251380, "epoch": 2077} {"train_loss": -39.857666015625, "global_step": 251381, "epoch": 2077} {"train_loss": -36.668514251708984, "global_step": 251382, "epoch": 2077} {"train_loss": -41.94584655761719, "global_step": 251383, "epoch": 2077} {"train_loss": -40.4929313659668, "global_step": 251384, "epoch": 2077} {"train_loss": -39.44470977783203, "global_step": 251385, "epoch": 2077} {"train_loss": -37.39493942260742, "global_step": 251386, "epoch": 2077} {"train_loss": -41.843055725097656, "global_step": 251387, "epoch": 2077} {"train_loss": -40.69907760620117, "global_step": 251388, "epoch": 2077} {"train_loss": -41.081356048583984, "global_step": 251389, "epoch": 2077} {"train_loss": -36.4710693359375, "global_step": 251390, "epoch": 2077} {"train_loss": -39.05754089355469, "global_step": 251391, "epoch": 2077} {"train_loss": -35.63484573364258, "global_step": 251392, "epoch": 2077} {"train_loss": -40.60492706298828, "global_step": 251393, "epoch": 2077} {"train_loss": -41.385955810546875, "global_step": 251394, "epoch": 2077} {"train_loss": -40.7556037902832, "global_step": 251395, "epoch": 2077} {"train_loss": -40.414520263671875, "global_step": 251396, "epoch": 2077} {"train_loss": -39.837589263916016, "global_step": 251397, "epoch": 2077} {"train_loss": -40.8211784362793, "global_step": 251398, "epoch": 2077} {"train_loss": -37.843929290771484, "global_step": 251399, "epoch": 2077} {"train_loss": -27.17399024963379, "global_step": 251400, "epoch": 2077} {"train_loss": -40.92496871948242, "global_step": 251401, "epoch": 2077} {"train_loss": -42.269752502441406, "global_step": 251402, "epoch": 2077} {"train_loss": -40.059993743896484, "global_step": 251403, "epoch": 2077} {"train_loss": -39.43634033203125, "global_step": 251404, "epoch": 2077} {"train_loss": -37.28825759887695, "global_step": 251405, "epoch": 2077} {"train_loss": -28.255481719970703, "global_step": 251406, "epoch": 2077} {"train_loss": -38.81797409057617, "global_step": 251407, "epoch": 2077} {"train_loss": -37.50897979736328, "global_step": 251408, "epoch": 2077} {"train_loss": -40.023311614990234, "global_step": 251409, "epoch": 2077} {"train_loss": -34.02103805541992, "global_step": 251410, "epoch": 2077} {"train_loss": -38.79370880126953, "global_step": 251411, "epoch": 2077} {"train_loss": -34.726287841796875, "global_step": 251412, "epoch": 2077} {"train_loss": -35.11042022705078, "global_step": 251413, "epoch": 2077} {"train_loss": -35.760498046875, "global_step": 251414, "epoch": 2077} {"train_loss": -34.7379035949707, "global_step": 251415, "epoch": 2077} {"train_loss": -35.60267639160156, "global_step": 251416, "epoch": 2077} {"train_loss": -38.213035583496094, "global_step": 251417, "epoch": 2077} {"train_loss": -38.443817138671875, "global_step": 251418, "epoch": 2077} {"train_loss": -38.24104690551758, "global_step": 251419, "epoch": 2077} {"train_loss": -36.2967643737793, "global_step": 251420, "epoch": 2077} {"train_loss": -36.653133392333984, "global_step": 251421, "epoch": 2077} {"train_loss": -40.98263168334961, "global_step": 251422, "epoch": 2077} {"train_loss": -38.468544006347656, "global_step": 251423, "epoch": 2077} {"train_loss": -39.46685791015625, "global_step": 251424, "epoch": 2077} {"train_loss": -36.50382614135742, "global_step": 251425, "epoch": 2077} {"train_loss": -36.69941329956055, "global_step": 251426, "epoch": 2077} {"train_loss": -36.77350997924805, "global_step": 251427, "epoch": 2077} {"train_loss": -37.387508392333984, "global_step": 251428, "epoch": 2077} {"train_loss": -40.278465270996094, "global_step": 251429, "epoch": 2077} {"train_loss": -36.927955627441406, "global_step": 251430, "epoch": 2077} {"train_loss": -39.913631439208984, "global_step": 251431, "epoch": 2077} {"train_loss": -38.76182556152344, "global_step": 251432, "epoch": 2077} {"train_loss": -37.6275749206543, "global_step": 251433, "epoch": 2077} {"train_loss": -39.09325408935547, "global_step": 251434, "epoch": 2077} {"train_loss": -36.87392044067383, "global_step": 251435, "epoch": 2077} {"train_loss": -40.68574905395508, "global_step": 251436, "epoch": 2077} {"train_loss": -39.713628422130235, "global_step": 251437, "epoch": 2077, "val_loss": 2468892.25} {"train_loss": -34.62314987182617, "global_step": 251438, "epoch": 2078} {"train_loss": -40.28005599975586, "global_step": 251439, "epoch": 2078} {"train_loss": -39.26813888549805, "global_step": 251440, "epoch": 2078} {"train_loss": -39.017662048339844, "global_step": 251441, "epoch": 2078} {"train_loss": -39.78643798828125, "global_step": 251442, "epoch": 2078} {"train_loss": -40.2450065612793, "global_step": 251443, "epoch": 2078} {"train_loss": -39.122840881347656, "global_step": 251444, "epoch": 2078} {"train_loss": -37.06218719482422, "global_step": 251445, "epoch": 2078} {"train_loss": -38.88704299926758, "global_step": 251446, "epoch": 2078} {"train_loss": -39.081459045410156, "global_step": 251447, "epoch": 2078} {"train_loss": -39.92353439331055, "global_step": 251448, "epoch": 2078} {"train_loss": -36.65610885620117, "global_step": 251449, "epoch": 2078} {"train_loss": -40.39891815185547, "global_step": 251450, "epoch": 2078} {"train_loss": -39.606483459472656, "global_step": 251451, "epoch": 2078} {"train_loss": -40.8349723815918, "global_step": 251452, "epoch": 2078} {"train_loss": -40.313812255859375, "global_step": 251453, "epoch": 2078} {"train_loss": -41.391265869140625, "global_step": 251454, "epoch": 2078} {"train_loss": -40.79550552368164, "global_step": 251455, "epoch": 2078} {"train_loss": -40.92690658569336, "global_step": 251456, "epoch": 2078} {"train_loss": -40.37730026245117, "global_step": 251457, "epoch": 2078} {"train_loss": -40.59907913208008, "global_step": 251458, "epoch": 2078} {"train_loss": -40.171504974365234, "global_step": 251459, "epoch": 2078} {"train_loss": -40.58494186401367, "global_step": 251460, "epoch": 2078} {"train_loss": -41.21065902709961, "global_step": 251461, "epoch": 2078} {"train_loss": -39.54446792602539, "global_step": 251462, "epoch": 2078} {"train_loss": -41.01418685913086, "global_step": 251463, "epoch": 2078} {"train_loss": -41.28163528442383, "global_step": 251464, "epoch": 2078} {"train_loss": -38.79336166381836, "global_step": 251465, "epoch": 2078} {"train_loss": -40.26231002807617, "global_step": 251466, "epoch": 2078} {"train_loss": -40.813087463378906, "global_step": 251467, "epoch": 2078} {"train_loss": -41.57759475708008, "global_step": 251468, "epoch": 2078} {"train_loss": -40.559600830078125, "global_step": 251469, "epoch": 2078} {"train_loss": -39.48905944824219, "global_step": 251470, "epoch": 2078} {"train_loss": -41.312381744384766, "global_step": 251471, "epoch": 2078} {"train_loss": -40.528629302978516, "global_step": 251472, "epoch": 2078} {"train_loss": -41.79391098022461, "global_step": 251473, "epoch": 2078} {"train_loss": -41.75703811645508, "global_step": 251474, "epoch": 2078} {"train_loss": -40.45915222167969, "global_step": 251475, "epoch": 2078} {"train_loss": -41.726295471191406, "global_step": 251476, "epoch": 2078} {"train_loss": -41.365238189697266, "global_step": 251477, "epoch": 2078} {"train_loss": -41.201515197753906, "global_step": 251478, "epoch": 2078} {"train_loss": -41.64813995361328, "global_step": 251479, "epoch": 2078} {"train_loss": -41.23661422729492, "global_step": 251480, "epoch": 2078} {"train_loss": -40.972450256347656, "global_step": 251481, "epoch": 2078} {"train_loss": -41.951961517333984, "global_step": 251482, "epoch": 2078} {"train_loss": -40.92765426635742, "global_step": 251483, "epoch": 2078} {"train_loss": -41.16105270385742, "global_step": 251484, "epoch": 2078} {"train_loss": -40.633419036865234, "global_step": 251485, "epoch": 2078} {"train_loss": -41.786251068115234, "global_step": 251486, "epoch": 2078} {"train_loss": -39.26227951049805, "global_step": 251487, "epoch": 2078} {"train_loss": -39.555843353271484, "global_step": 251488, "epoch": 2078} {"train_loss": -42.466346740722656, "global_step": 251489, "epoch": 2078} {"train_loss": -41.14466094970703, "global_step": 251490, "epoch": 2078} {"train_loss": -41.959686279296875, "global_step": 251491, "epoch": 2078} {"train_loss": -41.380550384521484, "global_step": 251492, "epoch": 2078} {"train_loss": -40.687782287597656, "global_step": 251493, "epoch": 2078} {"train_loss": -41.30862045288086, "global_step": 251494, "epoch": 2078} {"train_loss": -41.08877182006836, "global_step": 251495, "epoch": 2078} {"train_loss": -42.34526443481445, "global_step": 251496, "epoch": 2078} {"train_loss": -41.796722412109375, "global_step": 251497, "epoch": 2078} {"train_loss": -41.43345642089844, "global_step": 251498, "epoch": 2078} {"train_loss": -42.103607177734375, "global_step": 251499, "epoch": 2078} {"train_loss": -39.94904708862305, "global_step": 251500, "epoch": 2078} {"train_loss": -41.75019454956055, "global_step": 251501, "epoch": 2078} {"train_loss": -42.38381576538086, "global_step": 251502, "epoch": 2078} {"train_loss": -41.89303207397461, "global_step": 251503, "epoch": 2078} {"train_loss": -42.55988693237305, "global_step": 251504, "epoch": 2078} {"train_loss": -41.8177604675293, "global_step": 251505, "epoch": 2078} {"train_loss": -42.182281494140625, "global_step": 251506, "epoch": 2078} {"train_loss": -41.75880813598633, "global_step": 251507, "epoch": 2078} {"train_loss": -42.90618133544922, "global_step": 251508, "epoch": 2078} {"train_loss": -42.7362174987793, "global_step": 251509, "epoch": 2078} {"train_loss": -41.90938186645508, "global_step": 251510, "epoch": 2078} {"train_loss": -41.73290252685547, "global_step": 251511, "epoch": 2078} {"train_loss": -42.20259475708008, "global_step": 251512, "epoch": 2078} {"train_loss": -41.44196319580078, "global_step": 251513, "epoch": 2078} {"train_loss": -42.360164642333984, "global_step": 251514, "epoch": 2078} {"train_loss": -42.18159103393555, "global_step": 251515, "epoch": 2078} {"train_loss": -42.43330001831055, "global_step": 251516, "epoch": 2078} {"train_loss": -41.32551193237305, "global_step": 251517, "epoch": 2078} {"train_loss": -42.39629364013672, "global_step": 251518, "epoch": 2078} {"train_loss": -41.96358108520508, "global_step": 251519, "epoch": 2078} {"train_loss": -42.49898910522461, "global_step": 251520, "epoch": 2078} {"train_loss": -42.01643753051758, "global_step": 251521, "epoch": 2078} {"train_loss": -42.234676361083984, "global_step": 251522, "epoch": 2078} {"train_loss": -41.92692565917969, "global_step": 251523, "epoch": 2078} {"train_loss": -41.92756652832031, "global_step": 251524, "epoch": 2078} {"train_loss": -42.7912712097168, "global_step": 251525, "epoch": 2078} {"train_loss": -42.968162536621094, "global_step": 251526, "epoch": 2078} {"train_loss": -42.46989059448242, "global_step": 251527, "epoch": 2078} {"train_loss": -42.38374710083008, "global_step": 251528, "epoch": 2078} {"train_loss": -42.55790710449219, "global_step": 251529, "epoch": 2078} {"train_loss": -42.88743209838867, "global_step": 251530, "epoch": 2078} {"train_loss": -43.005287170410156, "global_step": 251531, "epoch": 2078} {"train_loss": -42.172725677490234, "global_step": 251532, "epoch": 2078} {"train_loss": -42.21110153198242, "global_step": 251533, "epoch": 2078} {"train_loss": -42.227394104003906, "global_step": 251534, "epoch": 2078} {"train_loss": -38.88964080810547, "global_step": 251535, "epoch": 2078} {"train_loss": -42.548828125, "global_step": 251536, "epoch": 2078} {"train_loss": -42.9370002746582, "global_step": 251537, "epoch": 2078} {"train_loss": -42.41980743408203, "global_step": 251538, "epoch": 2078} {"train_loss": -42.845916748046875, "global_step": 251539, "epoch": 2078} {"train_loss": -42.609466552734375, "global_step": 251540, "epoch": 2078} {"train_loss": -42.85328674316406, "global_step": 251541, "epoch": 2078} {"train_loss": -42.149349212646484, "global_step": 251542, "epoch": 2078} {"train_loss": -42.07202911376953, "global_step": 251543, "epoch": 2078} {"train_loss": -41.13269805908203, "global_step": 251544, "epoch": 2078} {"train_loss": -42.37724304199219, "global_step": 251545, "epoch": 2078} {"train_loss": -43.085384368896484, "global_step": 251546, "epoch": 2078} {"train_loss": -42.40391159057617, "global_step": 251547, "epoch": 2078} {"train_loss": -41.09590148925781, "global_step": 251548, "epoch": 2078} {"train_loss": -41.50043487548828, "global_step": 251549, "epoch": 2078} {"train_loss": -42.66816711425781, "global_step": 251550, "epoch": 2078} {"train_loss": -42.53428268432617, "global_step": 251551, "epoch": 2078} {"train_loss": -41.36749267578125, "global_step": 251552, "epoch": 2078} {"train_loss": -41.40797424316406, "global_step": 251553, "epoch": 2078} {"train_loss": -40.731422424316406, "global_step": 251554, "epoch": 2078} {"train_loss": -42.38474655151367, "global_step": 251555, "epoch": 2078} {"train_loss": -42.054298400878906, "global_step": 251556, "epoch": 2078} {"train_loss": -42.42286682128906, "global_step": 251557, "epoch": 2078} {"train_loss": -41.29252744312129, "global_step": 251558, "epoch": 2078, "val_loss": 2645881.75} {"train_loss": -42.14309310913086, "global_step": 251559, "epoch": 2079} {"train_loss": -42.112361907958984, "global_step": 251560, "epoch": 2079} {"train_loss": -41.903560638427734, "global_step": 251561, "epoch": 2079} {"train_loss": -42.54714584350586, "global_step": 251562, "epoch": 2079} {"train_loss": -41.921058654785156, "global_step": 251563, "epoch": 2079} {"train_loss": -40.0727424621582, "global_step": 251564, "epoch": 2079} {"train_loss": -42.93569564819336, "global_step": 251565, "epoch": 2079} {"train_loss": -40.03861999511719, "global_step": 251566, "epoch": 2079} {"train_loss": -42.424781799316406, "global_step": 251567, "epoch": 2079} {"train_loss": -42.72390365600586, "global_step": 251568, "epoch": 2079} {"train_loss": -42.64559555053711, "global_step": 251569, "epoch": 2079} {"train_loss": -42.914794921875, "global_step": 251570, "epoch": 2079} {"train_loss": -42.8680534362793, "global_step": 251571, "epoch": 2079} {"train_loss": -42.06149673461914, "global_step": 251572, "epoch": 2079} {"train_loss": -42.24991226196289, "global_step": 251573, "epoch": 2079} {"train_loss": -42.98249053955078, "global_step": 251574, "epoch": 2079} {"train_loss": -42.647491455078125, "global_step": 251575, "epoch": 2079} {"train_loss": -41.25993728637695, "global_step": 251576, "epoch": 2079} {"train_loss": -42.229591369628906, "global_step": 251577, "epoch": 2079} {"train_loss": -42.88407516479492, "global_step": 251578, "epoch": 2079} {"train_loss": -41.537620544433594, "global_step": 251579, "epoch": 2079} {"train_loss": -42.46294021606445, "global_step": 251580, "epoch": 2079} {"train_loss": -42.55747604370117, "global_step": 251581, "epoch": 2079} {"train_loss": -41.87733840942383, "global_step": 251582, "epoch": 2079} {"train_loss": -42.55401611328125, "global_step": 251583, "epoch": 2079} {"train_loss": -40.94973373413086, "global_step": 251584, "epoch": 2079} {"train_loss": -39.3520622253418, "global_step": 251585, "epoch": 2079} {"train_loss": -35.8430290222168, "global_step": 251586, "epoch": 2079} {"train_loss": -32.04594802856445, "global_step": 251587, "epoch": 2079} {"train_loss": -35.080657958984375, "global_step": 251588, "epoch": 2079} {"train_loss": -41.16468811035156, "global_step": 251589, "epoch": 2079} {"train_loss": -40.31979751586914, "global_step": 251590, "epoch": 2079} {"train_loss": -37.89381408691406, "global_step": 251591, "epoch": 2079} {"train_loss": -40.70465850830078, "global_step": 251592, "epoch": 2079} {"train_loss": -42.33736801147461, "global_step": 251593, "epoch": 2079} {"train_loss": -39.99774169921875, "global_step": 251594, "epoch": 2079} {"train_loss": -40.713138580322266, "global_step": 251595, "epoch": 2079} {"train_loss": -41.928070068359375, "global_step": 251596, "epoch": 2079} {"train_loss": -41.663394927978516, "global_step": 251597, "epoch": 2079} {"train_loss": -42.186485290527344, "global_step": 251598, "epoch": 2079} {"train_loss": -42.05513000488281, "global_step": 251599, "epoch": 2079} {"train_loss": -37.8117561340332, "global_step": 251600, "epoch": 2079} {"train_loss": -42.235084533691406, "global_step": 251601, "epoch": 2079} {"train_loss": -40.36526107788086, "global_step": 251602, "epoch": 2079} {"train_loss": -41.38344192504883, "global_step": 251603, "epoch": 2079} {"train_loss": -42.205169677734375, "global_step": 251604, "epoch": 2079} {"train_loss": -37.297481536865234, "global_step": 251605, "epoch": 2079} {"train_loss": -42.12412643432617, "global_step": 251606, "epoch": 2079} {"train_loss": -41.891231536865234, "global_step": 251607, "epoch": 2079} {"train_loss": -30.198551177978516, "global_step": 251608, "epoch": 2079} {"train_loss": -40.81637191772461, "global_step": 251609, "epoch": 2079} {"train_loss": -41.09642028808594, "global_step": 251610, "epoch": 2079} {"train_loss": -40.96230697631836, "global_step": 251611, "epoch": 2079} {"train_loss": -35.82562255859375, "global_step": 251612, "epoch": 2079} {"train_loss": -41.42584228515625, "global_step": 251613, "epoch": 2079} {"train_loss": -40.01896667480469, "global_step": 251614, "epoch": 2079} {"train_loss": -39.77824401855469, "global_step": 251615, "epoch": 2079} {"train_loss": -41.02427291870117, "global_step": 251616, "epoch": 2079} {"train_loss": -32.42839813232422, "global_step": 251617, "epoch": 2079} {"train_loss": -40.930904388427734, "global_step": 251618, "epoch": 2079} {"train_loss": -40.85136032104492, "global_step": 251619, "epoch": 2079} {"train_loss": -40.08696365356445, "global_step": 251620, "epoch": 2079} {"train_loss": -38.14794158935547, "global_step": 251621, "epoch": 2079} {"train_loss": -40.26131057739258, "global_step": 251622, "epoch": 2079} {"train_loss": -40.27141189575195, "global_step": 251623, "epoch": 2079} {"train_loss": -39.6995849609375, "global_step": 251624, "epoch": 2079} {"train_loss": -34.283447265625, "global_step": 251625, "epoch": 2079} {"train_loss": -38.66634750366211, "global_step": 251626, "epoch": 2079} {"train_loss": -40.88630294799805, "global_step": 251627, "epoch": 2079} {"train_loss": -40.61233139038086, "global_step": 251628, "epoch": 2079} {"train_loss": -40.31466293334961, "global_step": 251629, "epoch": 2079} {"train_loss": -39.46255111694336, "global_step": 251630, "epoch": 2079} {"train_loss": -38.045223236083984, "global_step": 251631, "epoch": 2079} {"train_loss": -39.297340393066406, "global_step": 251632, "epoch": 2079} {"train_loss": -40.98531723022461, "global_step": 251633, "epoch": 2079} {"train_loss": -39.55103302001953, "global_step": 251634, "epoch": 2079} {"train_loss": -41.28947067260742, "global_step": 251635, "epoch": 2079} {"train_loss": -40.72933578491211, "global_step": 251636, "epoch": 2079} {"train_loss": -40.261775970458984, "global_step": 251637, "epoch": 2079} {"train_loss": -38.93809127807617, "global_step": 251638, "epoch": 2079} {"train_loss": -38.57676315307617, "global_step": 251639, "epoch": 2079} {"train_loss": -40.433719635009766, "global_step": 251640, "epoch": 2079} {"train_loss": -41.0565299987793, "global_step": 251641, "epoch": 2079} {"train_loss": -35.22382354736328, "global_step": 251642, "epoch": 2079} {"train_loss": -39.42871856689453, "global_step": 251643, "epoch": 2079} {"train_loss": -37.525386810302734, "global_step": 251644, "epoch": 2079} {"train_loss": -40.118831634521484, "global_step": 251645, "epoch": 2079} {"train_loss": -40.87728500366211, "global_step": 251646, "epoch": 2079} {"train_loss": -40.6204719543457, "global_step": 251647, "epoch": 2079} {"train_loss": -41.25132369995117, "global_step": 251648, "epoch": 2079} {"train_loss": -37.32310104370117, "global_step": 251649, "epoch": 2079} {"train_loss": -34.45789337158203, "global_step": 251650, "epoch": 2079} {"train_loss": -39.174686431884766, "global_step": 251651, "epoch": 2079} {"train_loss": -38.10990524291992, "global_step": 251652, "epoch": 2079} {"train_loss": -39.672298431396484, "global_step": 251653, "epoch": 2079} {"train_loss": -39.330780029296875, "global_step": 251654, "epoch": 2079} {"train_loss": -40.634246826171875, "global_step": 251655, "epoch": 2079} {"train_loss": -39.961788177490234, "global_step": 251656, "epoch": 2079} {"train_loss": -40.656044006347656, "global_step": 251657, "epoch": 2079} {"train_loss": -40.77275848388672, "global_step": 251658, "epoch": 2079} {"train_loss": -41.143409729003906, "global_step": 251659, "epoch": 2079} {"train_loss": -40.31300735473633, "global_step": 251660, "epoch": 2079} {"train_loss": -40.98324203491211, "global_step": 251661, "epoch": 2079} {"train_loss": -40.30581283569336, "global_step": 251662, "epoch": 2079} {"train_loss": -36.30204391479492, "global_step": 251663, "epoch": 2079} {"train_loss": -40.80997848510742, "global_step": 251664, "epoch": 2079} {"train_loss": -40.534664154052734, "global_step": 251665, "epoch": 2079} {"train_loss": -40.829742431640625, "global_step": 251666, "epoch": 2079} {"train_loss": -41.48934555053711, "global_step": 251667, "epoch": 2079} {"train_loss": -42.027339935302734, "global_step": 251668, "epoch": 2079} {"train_loss": -41.599735260009766, "global_step": 251669, "epoch": 2079} {"train_loss": -40.659339904785156, "global_step": 251670, "epoch": 2079} {"train_loss": -37.73093032836914, "global_step": 251671, "epoch": 2079} {"train_loss": -40.34439468383789, "global_step": 251672, "epoch": 2079} {"train_loss": -41.397865295410156, "global_step": 251673, "epoch": 2079} {"train_loss": -41.591285705566406, "global_step": 251674, "epoch": 2079} {"train_loss": -41.32778549194336, "global_step": 251675, "epoch": 2079} {"train_loss": -41.55414581298828, "global_step": 251676, "epoch": 2079} {"train_loss": -42.06284713745117, "global_step": 251677, "epoch": 2079} {"train_loss": -41.13230895996094, "global_step": 251678, "epoch": 2079} {"train_loss": -40.25579266508749, "global_step": 251679, "epoch": 2079, "val_loss": 2657937.75} {"train_loss": -40.51765823364258, "global_step": 251680, "epoch": 2080} {"train_loss": -42.01039505004883, "global_step": 251681, "epoch": 2080} {"train_loss": -42.116058349609375, "global_step": 251682, "epoch": 2080} {"train_loss": -40.57707595825195, "global_step": 251683, "epoch": 2080} {"train_loss": -41.692787170410156, "global_step": 251684, "epoch": 2080} {"train_loss": -41.59587860107422, "global_step": 251685, "epoch": 2080} {"train_loss": -39.927215576171875, "global_step": 251686, "epoch": 2080} {"train_loss": -41.457550048828125, "global_step": 251687, "epoch": 2080} {"train_loss": -41.757118225097656, "global_step": 251688, "epoch": 2080} {"train_loss": -41.8911247253418, "global_step": 251689, "epoch": 2080} {"train_loss": -41.09563064575195, "global_step": 251690, "epoch": 2080} {"train_loss": -41.891902923583984, "global_step": 251691, "epoch": 2080} {"train_loss": -41.66129684448242, "global_step": 251692, "epoch": 2080} {"train_loss": -41.593894958496094, "global_step": 251693, "epoch": 2080} {"train_loss": -42.231300354003906, "global_step": 251694, "epoch": 2080} {"train_loss": -41.78031539916992, "global_step": 251695, "epoch": 2080} {"train_loss": -41.6268310546875, "global_step": 251696, "epoch": 2080} {"train_loss": -40.852386474609375, "global_step": 251697, "epoch": 2080} {"train_loss": -41.98299026489258, "global_step": 251698, "epoch": 2080} {"train_loss": -42.29575729370117, "global_step": 251699, "epoch": 2080} {"train_loss": -42.2041015625, "global_step": 251700, "epoch": 2080} {"train_loss": -42.1207160949707, "global_step": 251701, "epoch": 2080} {"train_loss": -42.305824279785156, "global_step": 251702, "epoch": 2080} {"train_loss": -40.996971130371094, "global_step": 251703, "epoch": 2080} {"train_loss": -38.69729232788086, "global_step": 251704, "epoch": 2080} {"train_loss": -41.376895904541016, "global_step": 251705, "epoch": 2080} {"train_loss": -42.50590133666992, "global_step": 251706, "epoch": 2080} {"train_loss": -42.23806381225586, "global_step": 251707, "epoch": 2080} {"train_loss": -42.40073776245117, "global_step": 251708, "epoch": 2080} {"train_loss": -42.49968338012695, "global_step": 251709, "epoch": 2080} {"train_loss": -42.510494232177734, "global_step": 251710, "epoch": 2080} {"train_loss": -42.38532638549805, "global_step": 251711, "epoch": 2080} {"train_loss": -41.028255462646484, "global_step": 251712, "epoch": 2080} {"train_loss": -42.806575775146484, "global_step": 251713, "epoch": 2080} {"train_loss": -41.58213424682617, "global_step": 251714, "epoch": 2080} {"train_loss": -42.16280746459961, "global_step": 251715, "epoch": 2080} {"train_loss": -42.88969802856445, "global_step": 251716, "epoch": 2080} {"train_loss": -40.634151458740234, "global_step": 251717, "epoch": 2080} {"train_loss": -41.44684982299805, "global_step": 251718, "epoch": 2080} {"train_loss": -41.91471481323242, "global_step": 251719, "epoch": 2080} {"train_loss": -42.84815216064453, "global_step": 251720, "epoch": 2080} {"train_loss": -41.73147201538086, "global_step": 251721, "epoch": 2080} {"train_loss": -42.65345764160156, "global_step": 251722, "epoch": 2080} {"train_loss": -42.53910827636719, "global_step": 251723, "epoch": 2080} {"train_loss": -42.49198532104492, "global_step": 251724, "epoch": 2080} {"train_loss": -42.93647003173828, "global_step": 251725, "epoch": 2080} {"train_loss": -42.09202194213867, "global_step": 251726, "epoch": 2080} {"train_loss": -42.43858337402344, "global_step": 251727, "epoch": 2080} {"train_loss": -42.8823356628418, "global_step": 251728, "epoch": 2080} {"train_loss": -42.65386962890625, "global_step": 251729, "epoch": 2080} {"train_loss": -42.31922912597656, "global_step": 251730, "epoch": 2080} {"train_loss": -43.13579177856445, "global_step": 251731, "epoch": 2080} {"train_loss": -42.654842376708984, "global_step": 251732, "epoch": 2080} {"train_loss": -42.274993896484375, "global_step": 251733, "epoch": 2080} {"train_loss": -43.02067184448242, "global_step": 251734, "epoch": 2080} {"train_loss": -42.18437576293945, "global_step": 251735, "epoch": 2080} {"train_loss": -42.925025939941406, "global_step": 251736, "epoch": 2080} {"train_loss": -41.868804931640625, "global_step": 251737, "epoch": 2080} {"train_loss": -42.50107955932617, "global_step": 251738, "epoch": 2080} {"train_loss": -42.80326461791992, "global_step": 251739, "epoch": 2080} {"train_loss": -42.249107360839844, "global_step": 251740, "epoch": 2080} {"train_loss": -43.067054748535156, "global_step": 251741, "epoch": 2080} {"train_loss": -42.782310485839844, "global_step": 251742, "epoch": 2080} {"train_loss": -42.088741302490234, "global_step": 251743, "epoch": 2080} {"train_loss": -42.9893913269043, "global_step": 251744, "epoch": 2080} {"train_loss": -42.766719818115234, "global_step": 251745, "epoch": 2080} {"train_loss": -43.21197509765625, "global_step": 251746, "epoch": 2080} {"train_loss": -41.1503791809082, "global_step": 251747, "epoch": 2080} {"train_loss": -43.13649368286133, "global_step": 251748, "epoch": 2080} {"train_loss": -42.77875900268555, "global_step": 251749, "epoch": 2080} {"train_loss": -41.24098587036133, "global_step": 251750, "epoch": 2080} {"train_loss": -42.2415885925293, "global_step": 251751, "epoch": 2080} {"train_loss": -42.77766799926758, "global_step": 251752, "epoch": 2080} {"train_loss": -42.37701416015625, "global_step": 251753, "epoch": 2080} {"train_loss": -43.072078704833984, "global_step": 251754, "epoch": 2080} {"train_loss": -42.482444763183594, "global_step": 251755, "epoch": 2080} {"train_loss": -42.86124801635742, "global_step": 251756, "epoch": 2080} {"train_loss": -42.24113082885742, "global_step": 251757, "epoch": 2080} {"train_loss": -42.061336517333984, "global_step": 251758, "epoch": 2080} {"train_loss": -42.98228073120117, "global_step": 251759, "epoch": 2080} {"train_loss": -42.59096908569336, "global_step": 251760, "epoch": 2080} {"train_loss": -42.23895263671875, "global_step": 251761, "epoch": 2080} {"train_loss": -42.682308197021484, "global_step": 251762, "epoch": 2080} {"train_loss": -41.489356994628906, "global_step": 251763, "epoch": 2080} {"train_loss": -42.19046401977539, "global_step": 251764, "epoch": 2080} {"train_loss": -42.73337936401367, "global_step": 251765, "epoch": 2080} {"train_loss": -42.68134689331055, "global_step": 251766, "epoch": 2080} {"train_loss": -42.17412567138672, "global_step": 251767, "epoch": 2080} {"train_loss": -40.533931732177734, "global_step": 251768, "epoch": 2080} {"train_loss": -35.93996047973633, "global_step": 251769, "epoch": 2080} {"train_loss": -31.205652236938477, "global_step": 251770, "epoch": 2080} {"train_loss": -32.84386444091797, "global_step": 251771, "epoch": 2080} {"train_loss": -35.33705520629883, "global_step": 251772, "epoch": 2080} {"train_loss": -41.01270294189453, "global_step": 251773, "epoch": 2080} {"train_loss": -41.71590042114258, "global_step": 251774, "epoch": 2080} {"train_loss": -37.48771667480469, "global_step": 251775, "epoch": 2080} {"train_loss": -36.583927154541016, "global_step": 251776, "epoch": 2080} {"train_loss": -40.6179313659668, "global_step": 251777, "epoch": 2080} {"train_loss": -40.33222579956055, "global_step": 251778, "epoch": 2080} {"train_loss": -41.81818771362305, "global_step": 251779, "epoch": 2080} {"train_loss": -40.18610382080078, "global_step": 251780, "epoch": 2080} {"train_loss": -40.758697509765625, "global_step": 251781, "epoch": 2080} {"train_loss": -41.84054183959961, "global_step": 251782, "epoch": 2080} {"train_loss": -40.190486907958984, "global_step": 251783, "epoch": 2080} {"train_loss": -41.4266357421875, "global_step": 251784, "epoch": 2080} {"train_loss": -39.72650146484375, "global_step": 251785, "epoch": 2080} {"train_loss": -40.14249801635742, "global_step": 251786, "epoch": 2080} {"train_loss": -38.409507751464844, "global_step": 251787, "epoch": 2080} {"train_loss": -40.50202941894531, "global_step": 251788, "epoch": 2080} {"train_loss": -38.83549880981445, "global_step": 251789, "epoch": 2080} {"train_loss": -40.91872024536133, "global_step": 251790, "epoch": 2080} {"train_loss": -40.13679122924805, "global_step": 251791, "epoch": 2080} {"train_loss": -40.82533264160156, "global_step": 251792, "epoch": 2080} {"train_loss": -40.9007682800293, "global_step": 251793, "epoch": 2080} {"train_loss": -41.59965133666992, "global_step": 251794, "epoch": 2080} {"train_loss": -41.381107330322266, "global_step": 251795, "epoch": 2080} {"train_loss": -41.55589294433594, "global_step": 251796, "epoch": 2080} {"train_loss": -41.28584671020508, "global_step": 251797, "epoch": 2080} {"train_loss": -42.2589111328125, "global_step": 251798, "epoch": 2080} {"train_loss": -40.2607536315918, "global_step": 251799, "epoch": 2080} {"train_loss": -41.47591398570163, "global_step": 251800, "epoch": 2080, "val_loss": 2668574.5} {"train_loss": -41.36042022705078, "global_step": 251801, "epoch": 2081} {"train_loss": -41.11909103393555, "global_step": 251802, "epoch": 2081} {"train_loss": -42.31611633300781, "global_step": 251803, "epoch": 2081} {"train_loss": -41.470672607421875, "global_step": 251804, "epoch": 2081} {"train_loss": -42.08749771118164, "global_step": 251805, "epoch": 2081} {"train_loss": -41.82770919799805, "global_step": 251806, "epoch": 2081} {"train_loss": -42.097755432128906, "global_step": 251807, "epoch": 2081} {"train_loss": -41.74509048461914, "global_step": 251808, "epoch": 2081} {"train_loss": -41.72867202758789, "global_step": 251809, "epoch": 2081} {"train_loss": -42.72021484375, "global_step": 251810, "epoch": 2081} {"train_loss": -41.511009216308594, "global_step": 251811, "epoch": 2081} {"train_loss": -41.89524459838867, "global_step": 251812, "epoch": 2081} {"train_loss": -42.30668258666992, "global_step": 251813, "epoch": 2081} {"train_loss": -41.94076156616211, "global_step": 251814, "epoch": 2081} {"train_loss": -41.748409271240234, "global_step": 251815, "epoch": 2081} {"train_loss": -41.83501052856445, "global_step": 251816, "epoch": 2081} {"train_loss": -42.2121696472168, "global_step": 251817, "epoch": 2081} {"train_loss": -42.604671478271484, "global_step": 251818, "epoch": 2081} {"train_loss": -42.17934799194336, "global_step": 251819, "epoch": 2081} {"train_loss": -41.51204299926758, "global_step": 251820, "epoch": 2081} {"train_loss": -42.90530776977539, "global_step": 251821, "epoch": 2081} {"train_loss": -41.71478271484375, "global_step": 251822, "epoch": 2081} {"train_loss": -42.0249137878418, "global_step": 251823, "epoch": 2081} {"train_loss": -42.393428802490234, "global_step": 251824, "epoch": 2081} {"train_loss": -41.81174850463867, "global_step": 251825, "epoch": 2081} {"train_loss": -42.206695556640625, "global_step": 251826, "epoch": 2081} {"train_loss": -41.9102897644043, "global_step": 251827, "epoch": 2081} {"train_loss": -41.7478141784668, "global_step": 251828, "epoch": 2081} {"train_loss": -42.853092193603516, "global_step": 251829, "epoch": 2081} {"train_loss": -42.0205192565918, "global_step": 251830, "epoch": 2081} {"train_loss": -41.48818588256836, "global_step": 251831, "epoch": 2081} {"train_loss": -42.73653030395508, "global_step": 251832, "epoch": 2081} {"train_loss": -41.84891891479492, "global_step": 251833, "epoch": 2081} {"train_loss": -42.79497146606445, "global_step": 251834, "epoch": 2081} {"train_loss": -42.24374008178711, "global_step": 251835, "epoch": 2081} {"train_loss": -42.1939811706543, "global_step": 251836, "epoch": 2081} {"train_loss": -42.47384262084961, "global_step": 251837, "epoch": 2081} {"train_loss": -42.96177291870117, "global_step": 251838, "epoch": 2081} {"train_loss": -42.498775482177734, "global_step": 251839, "epoch": 2081} {"train_loss": -42.59666061401367, "global_step": 251840, "epoch": 2081} {"train_loss": -42.3569221496582, "global_step": 251841, "epoch": 2081} {"train_loss": -42.92950439453125, "global_step": 251842, "epoch": 2081} {"train_loss": -42.74589538574219, "global_step": 251843, "epoch": 2081} {"train_loss": -41.38434982299805, "global_step": 251844, "epoch": 2081} {"train_loss": -43.1669807434082, "global_step": 251845, "epoch": 2081} {"train_loss": -43.1485595703125, "global_step": 251846, "epoch": 2081} {"train_loss": -43.067806243896484, "global_step": 251847, "epoch": 2081} {"train_loss": -43.17808151245117, "global_step": 251848, "epoch": 2081} {"train_loss": -43.66682052612305, "global_step": 251849, "epoch": 2081} {"train_loss": -42.620853424072266, "global_step": 251850, "epoch": 2081} {"train_loss": -42.46957015991211, "global_step": 251851, "epoch": 2081} {"train_loss": -43.54486083984375, "global_step": 251852, "epoch": 2081} {"train_loss": -42.650264739990234, "global_step": 251853, "epoch": 2081} {"train_loss": -43.260189056396484, "global_step": 251854, "epoch": 2081} {"train_loss": -43.1169548034668, "global_step": 251855, "epoch": 2081} {"train_loss": -43.41530227661133, "global_step": 251856, "epoch": 2081} {"train_loss": -42.53889083862305, "global_step": 251857, "epoch": 2081} {"train_loss": -42.097145080566406, "global_step": 251858, "epoch": 2081} {"train_loss": -42.794403076171875, "global_step": 251859, "epoch": 2081} {"train_loss": -42.79170227050781, "global_step": 251860, "epoch": 2081} {"train_loss": -42.99538040161133, "global_step": 251861, "epoch": 2081} {"train_loss": -42.80272674560547, "global_step": 251862, "epoch": 2081} {"train_loss": -43.159271240234375, "global_step": 251863, "epoch": 2081} {"train_loss": -43.067138671875, "global_step": 251864, "epoch": 2081} {"train_loss": -43.09264373779297, "global_step": 251865, "epoch": 2081} {"train_loss": -42.49076461791992, "global_step": 251866, "epoch": 2081} {"train_loss": -43.571685791015625, "global_step": 251867, "epoch": 2081} {"train_loss": -42.99821090698242, "global_step": 251868, "epoch": 2081} {"train_loss": -42.80951690673828, "global_step": 251869, "epoch": 2081} {"train_loss": -42.9549560546875, "global_step": 251870, "epoch": 2081} {"train_loss": -42.779266357421875, "global_step": 251871, "epoch": 2081} {"train_loss": -42.93528366088867, "global_step": 251872, "epoch": 2081} {"train_loss": -43.70891189575195, "global_step": 251873, "epoch": 2081} {"train_loss": -43.79134750366211, "global_step": 251874, "epoch": 2081} {"train_loss": -43.25344467163086, "global_step": 251875, "epoch": 2081} {"train_loss": -42.356292724609375, "global_step": 251876, "epoch": 2081} {"train_loss": -43.138729095458984, "global_step": 251877, "epoch": 2081} {"train_loss": -42.702640533447266, "global_step": 251878, "epoch": 2081} {"train_loss": -41.05531692504883, "global_step": 251879, "epoch": 2081} {"train_loss": -42.68600845336914, "global_step": 251880, "epoch": 2081} {"train_loss": -43.733028411865234, "global_step": 251881, "epoch": 2081} {"train_loss": -40.865509033203125, "global_step": 251882, "epoch": 2081} {"train_loss": -40.431175231933594, "global_step": 251883, "epoch": 2081} {"train_loss": -42.387691497802734, "global_step": 251884, "epoch": 2081} {"train_loss": -42.05906677246094, "global_step": 251885, "epoch": 2081} {"train_loss": -39.894203186035156, "global_step": 251886, "epoch": 2081} {"train_loss": -41.81635665893555, "global_step": 251887, "epoch": 2081} {"train_loss": -42.876853942871094, "global_step": 251888, "epoch": 2081} {"train_loss": -43.04667663574219, "global_step": 251889, "epoch": 2081} {"train_loss": -42.39828109741211, "global_step": 251890, "epoch": 2081} {"train_loss": -42.242069244384766, "global_step": 251891, "epoch": 2081} {"train_loss": -42.44478988647461, "global_step": 251892, "epoch": 2081} {"train_loss": -37.17362594604492, "global_step": 251893, "epoch": 2081} {"train_loss": -42.30702590942383, "global_step": 251894, "epoch": 2081} {"train_loss": -41.59540939331055, "global_step": 251895, "epoch": 2081} {"train_loss": -42.48619842529297, "global_step": 251896, "epoch": 2081} {"train_loss": -41.66318893432617, "global_step": 251897, "epoch": 2081} {"train_loss": -41.93798828125, "global_step": 251898, "epoch": 2081} {"train_loss": -39.501678466796875, "global_step": 251899, "epoch": 2081} {"train_loss": -42.61088943481445, "global_step": 251900, "epoch": 2081} {"train_loss": -42.795738220214844, "global_step": 251901, "epoch": 2081} {"train_loss": -42.67509841918945, "global_step": 251902, "epoch": 2081} {"train_loss": -42.19422149658203, "global_step": 251903, "epoch": 2081} {"train_loss": -41.85237503051758, "global_step": 251904, "epoch": 2081} {"train_loss": -40.41725158691406, "global_step": 251905, "epoch": 2081} {"train_loss": -36.07255172729492, "global_step": 251906, "epoch": 2081} {"train_loss": -36.90766525268555, "global_step": 251907, "epoch": 2081} {"train_loss": -41.539371490478516, "global_step": 251908, "epoch": 2081} {"train_loss": -42.53217315673828, "global_step": 251909, "epoch": 2081} {"train_loss": -41.42516326904297, "global_step": 251910, "epoch": 2081} {"train_loss": -39.91985321044922, "global_step": 251911, "epoch": 2081} {"train_loss": -40.78422546386719, "global_step": 251912, "epoch": 2081} {"train_loss": -34.896453857421875, "global_step": 251913, "epoch": 2081} {"train_loss": -37.49060821533203, "global_step": 251914, "epoch": 2081} {"train_loss": -40.10913848876953, "global_step": 251915, "epoch": 2081} {"train_loss": -40.66019821166992, "global_step": 251916, "epoch": 2081} {"train_loss": -39.97199630737305, "global_step": 251917, "epoch": 2081} {"train_loss": -42.18801498413086, "global_step": 251918, "epoch": 2081} {"train_loss": -38.176673889160156, "global_step": 251919, "epoch": 2081} {"train_loss": -36.83113479614258, "global_step": 251920, "epoch": 2081} {"train_loss": -41.83061377470158, "global_step": 251921, "epoch": 2081, "val_loss": 2665818.5} {"train_loss": -36.34711456298828, "global_step": 251922, "epoch": 2082} {"train_loss": -34.28048324584961, "global_step": 251923, "epoch": 2082} {"train_loss": -30.797779083251953, "global_step": 251924, "epoch": 2082} {"train_loss": -25.945104598999023, "global_step": 251925, "epoch": 2082} {"train_loss": -38.33139419555664, "global_step": 251926, "epoch": 2082} {"train_loss": -39.31515121459961, "global_step": 251927, "epoch": 2082} {"train_loss": -34.943824768066406, "global_step": 251928, "epoch": 2082} {"train_loss": -38.9539909362793, "global_step": 251929, "epoch": 2082} {"train_loss": -32.26340103149414, "global_step": 251930, "epoch": 2082} {"train_loss": -34.910030364990234, "global_step": 251931, "epoch": 2082} {"train_loss": -38.9975700378418, "global_step": 251932, "epoch": 2082} {"train_loss": -21.48527717590332, "global_step": 251933, "epoch": 2082} {"train_loss": -38.83182144165039, "global_step": 251934, "epoch": 2082} {"train_loss": -37.26997756958008, "global_step": 251935, "epoch": 2082} {"train_loss": -37.28761672973633, "global_step": 251936, "epoch": 2082} {"train_loss": -36.74200439453125, "global_step": 251937, "epoch": 2082} {"train_loss": -34.829742431640625, "global_step": 251938, "epoch": 2082} {"train_loss": -37.73886489868164, "global_step": 251939, "epoch": 2082} {"train_loss": -36.906227111816406, "global_step": 251940, "epoch": 2082} {"train_loss": -39.83424377441406, "global_step": 251941, "epoch": 2082} {"train_loss": -39.04873275756836, "global_step": 251942, "epoch": 2082} {"train_loss": -37.81482696533203, "global_step": 251943, "epoch": 2082} {"train_loss": -39.49697494506836, "global_step": 251944, "epoch": 2082} {"train_loss": -36.03776168823242, "global_step": 251945, "epoch": 2082} {"train_loss": -38.37955856323242, "global_step": 251946, "epoch": 2082} {"train_loss": -38.070980072021484, "global_step": 251947, "epoch": 2082} {"train_loss": -40.11594772338867, "global_step": 251948, "epoch": 2082} {"train_loss": -37.618839263916016, "global_step": 251949, "epoch": 2082} {"train_loss": -37.608272552490234, "global_step": 251950, "epoch": 2082} {"train_loss": -39.324195861816406, "global_step": 251951, "epoch": 2082} {"train_loss": -39.90853500366211, "global_step": 251952, "epoch": 2082} {"train_loss": -40.39986038208008, "global_step": 251953, "epoch": 2082} {"train_loss": -39.59619903564453, "global_step": 251954, "epoch": 2082} {"train_loss": -39.62403106689453, "global_step": 251955, "epoch": 2082} {"train_loss": -39.16329574584961, "global_step": 251956, "epoch": 2082} {"train_loss": -40.227027893066406, "global_step": 251957, "epoch": 2082} {"train_loss": -39.921485900878906, "global_step": 251958, "epoch": 2082} {"train_loss": -40.18231964111328, "global_step": 251959, "epoch": 2082} {"train_loss": -40.7675666809082, "global_step": 251960, "epoch": 2082} {"train_loss": -40.90370559692383, "global_step": 251961, "epoch": 2082} {"train_loss": -40.36492919921875, "global_step": 251962, "epoch": 2082} {"train_loss": -40.08916091918945, "global_step": 251963, "epoch": 2082} {"train_loss": -41.086273193359375, "global_step": 251964, "epoch": 2082} {"train_loss": -39.63372039794922, "global_step": 251965, "epoch": 2082} {"train_loss": -40.8819465637207, "global_step": 251966, "epoch": 2082} {"train_loss": -39.90145492553711, "global_step": 251967, "epoch": 2082} {"train_loss": -41.34550094604492, "global_step": 251968, "epoch": 2082} {"train_loss": -39.70768737792969, "global_step": 251969, "epoch": 2082} {"train_loss": -40.70447540283203, "global_step": 251970, "epoch": 2082} {"train_loss": -40.88563537597656, "global_step": 251971, "epoch": 2082} {"train_loss": -41.674522399902344, "global_step": 251972, "epoch": 2082} {"train_loss": -41.3525276184082, "global_step": 251973, "epoch": 2082} {"train_loss": -41.32979202270508, "global_step": 251974, "epoch": 2082} {"train_loss": -41.59632110595703, "global_step": 251975, "epoch": 2082} {"train_loss": -41.55506134033203, "global_step": 251976, "epoch": 2082} {"train_loss": -41.16972732543945, "global_step": 251977, "epoch": 2082} {"train_loss": -37.724525451660156, "global_step": 251978, "epoch": 2082} {"train_loss": -41.163299560546875, "global_step": 251979, "epoch": 2082} {"train_loss": -41.45180130004883, "global_step": 251980, "epoch": 2082} {"train_loss": -41.51253890991211, "global_step": 251981, "epoch": 2082} {"train_loss": -40.91207504272461, "global_step": 251982, "epoch": 2082} {"train_loss": -41.56258773803711, "global_step": 251983, "epoch": 2082} {"train_loss": -41.66567611694336, "global_step": 251984, "epoch": 2082} {"train_loss": -41.86933517456055, "global_step": 251985, "epoch": 2082} {"train_loss": -41.486061096191406, "global_step": 251986, "epoch": 2082} {"train_loss": -42.170101165771484, "global_step": 251987, "epoch": 2082} {"train_loss": -41.98567581176758, "global_step": 251988, "epoch": 2082} {"train_loss": -41.90708541870117, "global_step": 251989, "epoch": 2082} {"train_loss": -42.06070327758789, "global_step": 251990, "epoch": 2082} {"train_loss": -41.62174987792969, "global_step": 251991, "epoch": 2082} {"train_loss": -41.887577056884766, "global_step": 251992, "epoch": 2082} {"train_loss": -41.70538330078125, "global_step": 251993, "epoch": 2082} {"train_loss": -41.6021614074707, "global_step": 251994, "epoch": 2082} {"train_loss": -41.820552825927734, "global_step": 251995, "epoch": 2082} {"train_loss": -42.32646179199219, "global_step": 251996, "epoch": 2082} {"train_loss": -41.814273834228516, "global_step": 251997, "epoch": 2082} {"train_loss": -41.659751892089844, "global_step": 251998, "epoch": 2082} {"train_loss": -42.10481643676758, "global_step": 251999, "epoch": 2082} {"train_loss": -42.2733268737793, "global_step": 252000, "epoch": 2082} {"train_loss": -41.95331954956055, "global_step": 252001, "epoch": 2082} {"train_loss": -41.63129806518555, "global_step": 252002, "epoch": 2082} {"train_loss": -41.34279251098633, "global_step": 252003, "epoch": 2082} {"train_loss": -42.50626754760742, "global_step": 252004, "epoch": 2082} {"train_loss": -42.1635856628418, "global_step": 252005, "epoch": 2082} {"train_loss": -42.004573822021484, "global_step": 252006, "epoch": 2082} {"train_loss": -41.681922912597656, "global_step": 252007, "epoch": 2082} {"train_loss": -42.51802062988281, "global_step": 252008, "epoch": 2082} {"train_loss": -34.355587005615234, "global_step": 252009, "epoch": 2082} {"train_loss": -42.16063690185547, "global_step": 252010, "epoch": 2082} {"train_loss": -41.89981460571289, "global_step": 252011, "epoch": 2082} {"train_loss": -41.553375244140625, "global_step": 252012, "epoch": 2082} {"train_loss": -40.98347091674805, "global_step": 252013, "epoch": 2082} {"train_loss": -35.61955642700195, "global_step": 252014, "epoch": 2082} {"train_loss": -41.81203842163086, "global_step": 252015, "epoch": 2082} {"train_loss": -42.11310958862305, "global_step": 252016, "epoch": 2082} {"train_loss": -42.20071792602539, "global_step": 252017, "epoch": 2082} {"train_loss": -41.78882598876953, "global_step": 252018, "epoch": 2082} {"train_loss": -42.33332824707031, "global_step": 252019, "epoch": 2082} {"train_loss": -42.178382873535156, "global_step": 252020, "epoch": 2082} {"train_loss": -41.77932357788086, "global_step": 252021, "epoch": 2082} {"train_loss": -41.76955795288086, "global_step": 252022, "epoch": 2082} {"train_loss": -41.6683235168457, "global_step": 252023, "epoch": 2082} {"train_loss": -35.20725631713867, "global_step": 252024, "epoch": 2082} {"train_loss": -40.4177131652832, "global_step": 252025, "epoch": 2082} {"train_loss": -41.803810119628906, "global_step": 252026, "epoch": 2082} {"train_loss": -39.7408561706543, "global_step": 252027, "epoch": 2082} {"train_loss": -41.49030685424805, "global_step": 252028, "epoch": 2082} {"train_loss": -42.09859085083008, "global_step": 252029, "epoch": 2082} {"train_loss": -42.46525192260742, "global_step": 252030, "epoch": 2082} {"train_loss": -41.6735725402832, "global_step": 252031, "epoch": 2082} {"train_loss": -41.94826126098633, "global_step": 252032, "epoch": 2082} {"train_loss": -42.04706954956055, "global_step": 252033, "epoch": 2082} {"train_loss": -42.62266159057617, "global_step": 252034, "epoch": 2082} {"train_loss": -41.60441970825195, "global_step": 252035, "epoch": 2082} {"train_loss": -41.610382080078125, "global_step": 252036, "epoch": 2082} {"train_loss": -41.23234939575195, "global_step": 252037, "epoch": 2082} {"train_loss": -34.03110885620117, "global_step": 252038, "epoch": 2082} {"train_loss": -41.696678161621094, "global_step": 252039, "epoch": 2082} {"train_loss": -42.085968017578125, "global_step": 252040, "epoch": 2082} {"train_loss": -41.73555374145508, "global_step": 252041, "epoch": 2082} {"train_loss": -39.891024219103095, "global_step": 252042, "epoch": 2082, "val_loss": 2634474.0} {"train_loss": -41.685184478759766, "global_step": 252043, "epoch": 2083} {"train_loss": -40.8921012878418, "global_step": 252044, "epoch": 2083} {"train_loss": -41.360408782958984, "global_step": 252045, "epoch": 2083} {"train_loss": -41.37775802612305, "global_step": 252046, "epoch": 2083} {"train_loss": -41.84480667114258, "global_step": 252047, "epoch": 2083} {"train_loss": -40.96122360229492, "global_step": 252048, "epoch": 2083} {"train_loss": -42.6993522644043, "global_step": 252049, "epoch": 2083} {"train_loss": -42.3234977722168, "global_step": 252050, "epoch": 2083} {"train_loss": -41.200923919677734, "global_step": 252051, "epoch": 2083} {"train_loss": -41.5067024230957, "global_step": 252052, "epoch": 2083} {"train_loss": -42.03983688354492, "global_step": 252053, "epoch": 2083} {"train_loss": -41.80698776245117, "global_step": 252054, "epoch": 2083} {"train_loss": -41.811180114746094, "global_step": 252055, "epoch": 2083} {"train_loss": -42.082340240478516, "global_step": 252056, "epoch": 2083} {"train_loss": -41.918582916259766, "global_step": 252057, "epoch": 2083} {"train_loss": -42.505340576171875, "global_step": 252058, "epoch": 2083} {"train_loss": -40.60798645019531, "global_step": 252059, "epoch": 2083} {"train_loss": -41.50043869018555, "global_step": 252060, "epoch": 2083} {"train_loss": -42.42195510864258, "global_step": 252061, "epoch": 2083} {"train_loss": -42.33617401123047, "global_step": 252062, "epoch": 2083} {"train_loss": -41.91633224487305, "global_step": 252063, "epoch": 2083} {"train_loss": -41.989013671875, "global_step": 252064, "epoch": 2083} {"train_loss": -42.415836334228516, "global_step": 252065, "epoch": 2083} {"train_loss": -43.00016403198242, "global_step": 252066, "epoch": 2083} {"train_loss": -42.807525634765625, "global_step": 252067, "epoch": 2083} {"train_loss": -42.96578598022461, "global_step": 252068, "epoch": 2083} {"train_loss": -41.76627731323242, "global_step": 252069, "epoch": 2083} {"train_loss": -41.946773529052734, "global_step": 252070, "epoch": 2083} {"train_loss": -43.115291595458984, "global_step": 252071, "epoch": 2083} {"train_loss": -42.46642303466797, "global_step": 252072, "epoch": 2083} {"train_loss": -43.1569938659668, "global_step": 252073, "epoch": 2083} {"train_loss": -42.51436996459961, "global_step": 252074, "epoch": 2083} {"train_loss": -42.07949447631836, "global_step": 252075, "epoch": 2083} {"train_loss": -42.22930908203125, "global_step": 252076, "epoch": 2083} {"train_loss": -42.34089279174805, "global_step": 252077, "epoch": 2083} {"train_loss": -42.52619552612305, "global_step": 252078, "epoch": 2083} {"train_loss": -42.89837646484375, "global_step": 252079, "epoch": 2083} {"train_loss": -42.46953582763672, "global_step": 252080, "epoch": 2083} {"train_loss": -41.73413848876953, "global_step": 252081, "epoch": 2083} {"train_loss": -42.2605094909668, "global_step": 252082, "epoch": 2083} {"train_loss": -42.6915283203125, "global_step": 252083, "epoch": 2083} {"train_loss": -42.35501480102539, "global_step": 252084, "epoch": 2083} {"train_loss": -42.44916915893555, "global_step": 252085, "epoch": 2083} {"train_loss": -42.08028030395508, "global_step": 252086, "epoch": 2083} {"train_loss": -43.14759826660156, "global_step": 252087, "epoch": 2083} {"train_loss": -42.838043212890625, "global_step": 252088, "epoch": 2083} {"train_loss": -42.319854736328125, "global_step": 252089, "epoch": 2083} {"train_loss": -42.41965103149414, "global_step": 252090, "epoch": 2083} {"train_loss": -43.000579833984375, "global_step": 252091, "epoch": 2083} {"train_loss": -42.10886764526367, "global_step": 252092, "epoch": 2083} {"train_loss": -42.31996154785156, "global_step": 252093, "epoch": 2083} {"train_loss": -42.296932220458984, "global_step": 252094, "epoch": 2083} {"train_loss": -42.1376953125, "global_step": 252095, "epoch": 2083} {"train_loss": -42.016597747802734, "global_step": 252096, "epoch": 2083} {"train_loss": -40.9792594909668, "global_step": 252097, "epoch": 2083} {"train_loss": -40.82221603393555, "global_step": 252098, "epoch": 2083} {"train_loss": -40.86042022705078, "global_step": 252099, "epoch": 2083} {"train_loss": -41.885353088378906, "global_step": 252100, "epoch": 2083} {"train_loss": -42.59501266479492, "global_step": 252101, "epoch": 2083} {"train_loss": -42.4056282043457, "global_step": 252102, "epoch": 2083} {"train_loss": -42.10969161987305, "global_step": 252103, "epoch": 2083} {"train_loss": -42.223018646240234, "global_step": 252104, "epoch": 2083} {"train_loss": -42.365577697753906, "global_step": 252105, "epoch": 2083} {"train_loss": -42.252254486083984, "global_step": 252106, "epoch": 2083} {"train_loss": -40.86993408203125, "global_step": 252107, "epoch": 2083} {"train_loss": -42.07417297363281, "global_step": 252108, "epoch": 2083} {"train_loss": -41.19111251831055, "global_step": 252109, "epoch": 2083} {"train_loss": -42.52157211303711, "global_step": 252110, "epoch": 2083} {"train_loss": -41.34849166870117, "global_step": 252111, "epoch": 2083} {"train_loss": -40.7364501953125, "global_step": 252112, "epoch": 2083} {"train_loss": -40.50798416137695, "global_step": 252113, "epoch": 2083} {"train_loss": -39.869483947753906, "global_step": 252114, "epoch": 2083} {"train_loss": -40.80375289916992, "global_step": 252115, "epoch": 2083} {"train_loss": -41.41388702392578, "global_step": 252116, "epoch": 2083} {"train_loss": -40.7515983581543, "global_step": 252117, "epoch": 2083} {"train_loss": -38.31135177612305, "global_step": 252118, "epoch": 2083} {"train_loss": -39.58301544189453, "global_step": 252119, "epoch": 2083} {"train_loss": -41.35942077636719, "global_step": 252120, "epoch": 2083} {"train_loss": -41.853179931640625, "global_step": 252121, "epoch": 2083} {"train_loss": -41.542083740234375, "global_step": 252122, "epoch": 2083} {"train_loss": -41.04856491088867, "global_step": 252123, "epoch": 2083} {"train_loss": -42.38230514526367, "global_step": 252124, "epoch": 2083} {"train_loss": -41.389095306396484, "global_step": 252125, "epoch": 2083} {"train_loss": -40.06681442260742, "global_step": 252126, "epoch": 2083} {"train_loss": -41.324283599853516, "global_step": 252127, "epoch": 2083} {"train_loss": -42.28171920776367, "global_step": 252128, "epoch": 2083} {"train_loss": -41.9306755065918, "global_step": 252129, "epoch": 2083} {"train_loss": -42.20846176147461, "global_step": 252130, "epoch": 2083} {"train_loss": -42.48296356201172, "global_step": 252131, "epoch": 2083} {"train_loss": -42.15027618408203, "global_step": 252132, "epoch": 2083} {"train_loss": -42.014556884765625, "global_step": 252133, "epoch": 2083} {"train_loss": -41.013916015625, "global_step": 252134, "epoch": 2083} {"train_loss": -42.1406364440918, "global_step": 252135, "epoch": 2083} {"train_loss": -42.11661911010742, "global_step": 252136, "epoch": 2083} {"train_loss": -42.9207763671875, "global_step": 252137, "epoch": 2083} {"train_loss": -42.23712921142578, "global_step": 252138, "epoch": 2083} {"train_loss": -42.2530632019043, "global_step": 252139, "epoch": 2083} {"train_loss": -41.27692794799805, "global_step": 252140, "epoch": 2083} {"train_loss": -41.7902946472168, "global_step": 252141, "epoch": 2083} {"train_loss": -41.34712600708008, "global_step": 252142, "epoch": 2083} {"train_loss": -41.8565559387207, "global_step": 252143, "epoch": 2083} {"train_loss": -40.81441116333008, "global_step": 252144, "epoch": 2083} {"train_loss": -41.90787887573242, "global_step": 252145, "epoch": 2083} {"train_loss": -40.45711898803711, "global_step": 252146, "epoch": 2083} {"train_loss": -40.57993698120117, "global_step": 252147, "epoch": 2083} {"train_loss": -41.727603912353516, "global_step": 252148, "epoch": 2083} {"train_loss": -40.76520919799805, "global_step": 252149, "epoch": 2083} {"train_loss": -41.23598098754883, "global_step": 252150, "epoch": 2083} {"train_loss": -41.582427978515625, "global_step": 252151, "epoch": 2083} {"train_loss": -41.96804428100586, "global_step": 252152, "epoch": 2083} {"train_loss": -41.5746955871582, "global_step": 252153, "epoch": 2083} {"train_loss": -41.348236083984375, "global_step": 252154, "epoch": 2083} {"train_loss": -40.9947624206543, "global_step": 252155, "epoch": 2083} {"train_loss": -41.87648010253906, "global_step": 252156, "epoch": 2083} {"train_loss": -41.272945404052734, "global_step": 252157, "epoch": 2083} {"train_loss": -42.676361083984375, "global_step": 252158, "epoch": 2083} {"train_loss": -42.1820068359375, "global_step": 252159, "epoch": 2083} {"train_loss": -42.53188705444336, "global_step": 252160, "epoch": 2083} {"train_loss": -40.64582061767578, "global_step": 252161, "epoch": 2083} {"train_loss": -42.0054817199707, "global_step": 252162, "epoch": 2083} {"train_loss": -41.80832400991897, "global_step": 252163, "epoch": 2083, "val_loss": 2625285.0} {"train_loss": -42.82454299926758, "global_step": 252164, "epoch": 2084} {"train_loss": -41.396968841552734, "global_step": 252165, "epoch": 2084} {"train_loss": -41.92560577392578, "global_step": 252166, "epoch": 2084} {"train_loss": -41.17620849609375, "global_step": 252167, "epoch": 2084} {"train_loss": -42.05756759643555, "global_step": 252168, "epoch": 2084} {"train_loss": -42.49283218383789, "global_step": 252169, "epoch": 2084} {"train_loss": -41.939781188964844, "global_step": 252170, "epoch": 2084} {"train_loss": -41.73088455200195, "global_step": 252171, "epoch": 2084} {"train_loss": -42.3180046081543, "global_step": 252172, "epoch": 2084} {"train_loss": -42.1353874206543, "global_step": 252173, "epoch": 2084} {"train_loss": -42.85355758666992, "global_step": 252174, "epoch": 2084} {"train_loss": -42.00728988647461, "global_step": 252175, "epoch": 2084} {"train_loss": -42.70542907714844, "global_step": 252176, "epoch": 2084} {"train_loss": -42.59949493408203, "global_step": 252177, "epoch": 2084} {"train_loss": -42.42694091796875, "global_step": 252178, "epoch": 2084} {"train_loss": -42.86897659301758, "global_step": 252179, "epoch": 2084} {"train_loss": -42.87353515625, "global_step": 252180, "epoch": 2084} {"train_loss": -42.85224533081055, "global_step": 252181, "epoch": 2084} {"train_loss": -42.72185134887695, "global_step": 252182, "epoch": 2084} {"train_loss": -42.8769645690918, "global_step": 252183, "epoch": 2084} {"train_loss": -42.32059860229492, "global_step": 252184, "epoch": 2084} {"train_loss": -42.87153244018555, "global_step": 252185, "epoch": 2084} {"train_loss": -42.88871383666992, "global_step": 252186, "epoch": 2084} {"train_loss": -42.37977981567383, "global_step": 252187, "epoch": 2084} {"train_loss": -42.50762176513672, "global_step": 252188, "epoch": 2084} {"train_loss": -40.363441467285156, "global_step": 252189, "epoch": 2084} {"train_loss": -41.672828674316406, "global_step": 252190, "epoch": 2084} {"train_loss": -42.00674057006836, "global_step": 252191, "epoch": 2084} {"train_loss": -43.039100646972656, "global_step": 252192, "epoch": 2084} {"train_loss": -42.383140563964844, "global_step": 252193, "epoch": 2084} {"train_loss": -41.2672233581543, "global_step": 252194, "epoch": 2084} {"train_loss": -40.192630767822266, "global_step": 252195, "epoch": 2084} {"train_loss": -40.392486572265625, "global_step": 252196, "epoch": 2084} {"train_loss": -42.67144775390625, "global_step": 252197, "epoch": 2084} {"train_loss": -42.272857666015625, "global_step": 252198, "epoch": 2084} {"train_loss": -39.98482894897461, "global_step": 252199, "epoch": 2084} {"train_loss": -35.742191314697266, "global_step": 252200, "epoch": 2084} {"train_loss": -38.84466552734375, "global_step": 252201, "epoch": 2084} {"train_loss": -42.0605354309082, "global_step": 252202, "epoch": 2084} {"train_loss": -38.19340133666992, "global_step": 252203, "epoch": 2084} {"train_loss": -37.776912689208984, "global_step": 252204, "epoch": 2084} {"train_loss": -41.81245040893555, "global_step": 252205, "epoch": 2084} {"train_loss": -42.09589767456055, "global_step": 252206, "epoch": 2084} {"train_loss": -39.950965881347656, "global_step": 252207, "epoch": 2084} {"train_loss": -41.5245475769043, "global_step": 252208, "epoch": 2084} {"train_loss": -41.59405517578125, "global_step": 252209, "epoch": 2084} {"train_loss": -39.35940170288086, "global_step": 252210, "epoch": 2084} {"train_loss": -41.19451904296875, "global_step": 252211, "epoch": 2084} {"train_loss": -42.5141716003418, "global_step": 252212, "epoch": 2084} {"train_loss": -41.7797737121582, "global_step": 252213, "epoch": 2084} {"train_loss": -42.30751037597656, "global_step": 252214, "epoch": 2084} {"train_loss": -42.53387451171875, "global_step": 252215, "epoch": 2084} {"train_loss": -42.65827178955078, "global_step": 252216, "epoch": 2084} {"train_loss": -42.65940856933594, "global_step": 252217, "epoch": 2084} {"train_loss": -42.32152557373047, "global_step": 252218, "epoch": 2084} {"train_loss": -42.65631866455078, "global_step": 252219, "epoch": 2084} {"train_loss": -42.773399353027344, "global_step": 252220, "epoch": 2084} {"train_loss": -42.45697021484375, "global_step": 252221, "epoch": 2084} {"train_loss": -41.88410568237305, "global_step": 252222, "epoch": 2084} {"train_loss": -42.51350021362305, "global_step": 252223, "epoch": 2084} {"train_loss": -42.196144104003906, "global_step": 252224, "epoch": 2084} {"train_loss": -42.74824905395508, "global_step": 252225, "epoch": 2084} {"train_loss": -42.89656066894531, "global_step": 252226, "epoch": 2084} {"train_loss": -42.541744232177734, "global_step": 252227, "epoch": 2084} {"train_loss": -42.42672348022461, "global_step": 252228, "epoch": 2084} {"train_loss": -42.808040618896484, "global_step": 252229, "epoch": 2084} {"train_loss": -41.723751068115234, "global_step": 252230, "epoch": 2084} {"train_loss": -42.4932861328125, "global_step": 252231, "epoch": 2084} {"train_loss": -43.27553176879883, "global_step": 252232, "epoch": 2084} {"train_loss": -42.199703216552734, "global_step": 252233, "epoch": 2084} {"train_loss": -42.238983154296875, "global_step": 252234, "epoch": 2084} {"train_loss": -42.82245635986328, "global_step": 252235, "epoch": 2084} {"train_loss": -42.27051544189453, "global_step": 252236, "epoch": 2084} {"train_loss": -42.602943420410156, "global_step": 252237, "epoch": 2084} {"train_loss": -43.1248893737793, "global_step": 252238, "epoch": 2084} {"train_loss": -42.49050521850586, "global_step": 252239, "epoch": 2084} {"train_loss": -42.7938117980957, "global_step": 252240, "epoch": 2084} {"train_loss": -42.76241683959961, "global_step": 252241, "epoch": 2084} {"train_loss": -42.472042083740234, "global_step": 252242, "epoch": 2084} {"train_loss": -43.02749252319336, "global_step": 252243, "epoch": 2084} {"train_loss": -43.3404541015625, "global_step": 252244, "epoch": 2084} {"train_loss": -43.42594528198242, "global_step": 252245, "epoch": 2084} {"train_loss": -42.43480682373047, "global_step": 252246, "epoch": 2084} {"train_loss": -43.04484939575195, "global_step": 252247, "epoch": 2084} {"train_loss": -43.46186447143555, "global_step": 252248, "epoch": 2084} {"train_loss": -43.29037094116211, "global_step": 252249, "epoch": 2084} {"train_loss": -43.129356384277344, "global_step": 252250, "epoch": 2084} {"train_loss": -43.228755950927734, "global_step": 252251, "epoch": 2084} {"train_loss": -42.89073181152344, "global_step": 252252, "epoch": 2084} {"train_loss": -42.77033996582031, "global_step": 252253, "epoch": 2084} {"train_loss": -42.085601806640625, "global_step": 252254, "epoch": 2084} {"train_loss": -41.54189682006836, "global_step": 252255, "epoch": 2084} {"train_loss": -41.8322868347168, "global_step": 252256, "epoch": 2084} {"train_loss": -42.85675811767578, "global_step": 252257, "epoch": 2084} {"train_loss": -41.9901008605957, "global_step": 252258, "epoch": 2084} {"train_loss": -42.07405471801758, "global_step": 252259, "epoch": 2084} {"train_loss": -42.74692916870117, "global_step": 252260, "epoch": 2084} {"train_loss": -42.58112716674805, "global_step": 252261, "epoch": 2084} {"train_loss": -42.86086654663086, "global_step": 252262, "epoch": 2084} {"train_loss": -42.35820388793945, "global_step": 252263, "epoch": 2084} {"train_loss": -42.746822357177734, "global_step": 252264, "epoch": 2084} {"train_loss": -42.73158264160156, "global_step": 252265, "epoch": 2084} {"train_loss": -42.68392562866211, "global_step": 252266, "epoch": 2084} {"train_loss": -42.52073287963867, "global_step": 252267, "epoch": 2084} {"train_loss": -43.02328109741211, "global_step": 252268, "epoch": 2084} {"train_loss": -43.54554748535156, "global_step": 252269, "epoch": 2084} {"train_loss": -43.555660247802734, "global_step": 252270, "epoch": 2084} {"train_loss": -43.02923583984375, "global_step": 252271, "epoch": 2084} {"train_loss": -43.35494613647461, "global_step": 252272, "epoch": 2084} {"train_loss": -42.17844772338867, "global_step": 252273, "epoch": 2084} {"train_loss": -43.23170471191406, "global_step": 252274, "epoch": 2084} {"train_loss": -42.56589889526367, "global_step": 252275, "epoch": 2084} {"train_loss": -43.04890060424805, "global_step": 252276, "epoch": 2084} {"train_loss": -41.153282165527344, "global_step": 252277, "epoch": 2084} {"train_loss": -42.21363830566406, "global_step": 252278, "epoch": 2084} {"train_loss": -41.949920654296875, "global_step": 252279, "epoch": 2084} {"train_loss": -42.639549255371094, "global_step": 252280, "epoch": 2084} {"train_loss": -41.51284408569336, "global_step": 252281, "epoch": 2084} {"train_loss": -42.27007293701172, "global_step": 252282, "epoch": 2084} {"train_loss": -42.485382080078125, "global_step": 252283, "epoch": 2084} {"train_loss": -42.19982465633676, "global_step": 252284, "epoch": 2084, "val_loss": 2698948.0} {"train_loss": -42.669227600097656, "global_step": 252285, "epoch": 2085} {"train_loss": -42.90372848510742, "global_step": 252286, "epoch": 2085} {"train_loss": -43.09598922729492, "global_step": 252287, "epoch": 2085} {"train_loss": -42.46064758300781, "global_step": 252288, "epoch": 2085} {"train_loss": -42.88914108276367, "global_step": 252289, "epoch": 2085} {"train_loss": -42.948238372802734, "global_step": 252290, "epoch": 2085} {"train_loss": -42.733455657958984, "global_step": 252291, "epoch": 2085} {"train_loss": -42.884586334228516, "global_step": 252292, "epoch": 2085} {"train_loss": -42.906982421875, "global_step": 252293, "epoch": 2085} {"train_loss": -42.758506774902344, "global_step": 252294, "epoch": 2085} {"train_loss": -42.22142028808594, "global_step": 252295, "epoch": 2085} {"train_loss": -41.243099212646484, "global_step": 252296, "epoch": 2085} {"train_loss": -43.033756256103516, "global_step": 252297, "epoch": 2085} {"train_loss": -42.60769271850586, "global_step": 252298, "epoch": 2085} {"train_loss": -41.4958610534668, "global_step": 252299, "epoch": 2085} {"train_loss": -41.520591735839844, "global_step": 252300, "epoch": 2085} {"train_loss": -40.24852752685547, "global_step": 252301, "epoch": 2085} {"train_loss": -40.37293243408203, "global_step": 252302, "epoch": 2085} {"train_loss": -41.24562072753906, "global_step": 252303, "epoch": 2085} {"train_loss": -42.36625289916992, "global_step": 252304, "epoch": 2085} {"train_loss": -41.17002487182617, "global_step": 252305, "epoch": 2085} {"train_loss": -38.802425384521484, "global_step": 252306, "epoch": 2085} {"train_loss": -35.12649154663086, "global_step": 252307, "epoch": 2085} {"train_loss": -33.854305267333984, "global_step": 252308, "epoch": 2085} {"train_loss": -38.7270622253418, "global_step": 252309, "epoch": 2085} {"train_loss": -41.212135314941406, "global_step": 252310, "epoch": 2085} {"train_loss": -36.907779693603516, "global_step": 252311, "epoch": 2085} {"train_loss": -36.377254486083984, "global_step": 252312, "epoch": 2085} {"train_loss": -40.087154388427734, "global_step": 252313, "epoch": 2085} {"train_loss": -36.853031158447266, "global_step": 252314, "epoch": 2085} {"train_loss": -38.182777404785156, "global_step": 252315, "epoch": 2085} {"train_loss": -39.90755844116211, "global_step": 252316, "epoch": 2085} {"train_loss": -37.483062744140625, "global_step": 252317, "epoch": 2085} {"train_loss": -40.20412826538086, "global_step": 252318, "epoch": 2085} {"train_loss": -38.869049072265625, "global_step": 252319, "epoch": 2085} {"train_loss": -40.877838134765625, "global_step": 252320, "epoch": 2085} {"train_loss": -39.53922653198242, "global_step": 252321, "epoch": 2085} {"train_loss": -40.13955307006836, "global_step": 252322, "epoch": 2085} {"train_loss": -40.334205627441406, "global_step": 252323, "epoch": 2085} {"train_loss": -40.756309509277344, "global_step": 252324, "epoch": 2085} {"train_loss": -40.85100555419922, "global_step": 252325, "epoch": 2085} {"train_loss": -40.14847946166992, "global_step": 252326, "epoch": 2085} {"train_loss": -41.9718132019043, "global_step": 252327, "epoch": 2085} {"train_loss": -41.286949157714844, "global_step": 252328, "epoch": 2085} {"train_loss": -41.50238037109375, "global_step": 252329, "epoch": 2085} {"train_loss": -41.78485870361328, "global_step": 252330, "epoch": 2085} {"train_loss": -41.37592697143555, "global_step": 252331, "epoch": 2085} {"train_loss": -41.55636215209961, "global_step": 252332, "epoch": 2085} {"train_loss": -41.07447052001953, "global_step": 252333, "epoch": 2085} {"train_loss": -41.98445510864258, "global_step": 252334, "epoch": 2085} {"train_loss": -41.546607971191406, "global_step": 252335, "epoch": 2085} {"train_loss": -42.30294418334961, "global_step": 252336, "epoch": 2085} {"train_loss": -41.76803207397461, "global_step": 252337, "epoch": 2085} {"train_loss": -41.965293884277344, "global_step": 252338, "epoch": 2085} {"train_loss": -41.82524871826172, "global_step": 252339, "epoch": 2085} {"train_loss": -41.945926666259766, "global_step": 252340, "epoch": 2085} {"train_loss": -41.307533264160156, "global_step": 252341, "epoch": 2085} {"train_loss": -41.981964111328125, "global_step": 252342, "epoch": 2085} {"train_loss": -41.79108428955078, "global_step": 252343, "epoch": 2085} {"train_loss": -41.545166015625, "global_step": 252344, "epoch": 2085} {"train_loss": -42.173885345458984, "global_step": 252345, "epoch": 2085} {"train_loss": -41.93964767456055, "global_step": 252346, "epoch": 2085} {"train_loss": -42.67258834838867, "global_step": 252347, "epoch": 2085} {"train_loss": -41.92655944824219, "global_step": 252348, "epoch": 2085} {"train_loss": -42.453277587890625, "global_step": 252349, "epoch": 2085} {"train_loss": -42.07925033569336, "global_step": 252350, "epoch": 2085} {"train_loss": -41.58352279663086, "global_step": 252351, "epoch": 2085} {"train_loss": -42.05534744262695, "global_step": 252352, "epoch": 2085} {"train_loss": -42.127567291259766, "global_step": 252353, "epoch": 2085} {"train_loss": -42.21921920776367, "global_step": 252354, "epoch": 2085} {"train_loss": -43.017879486083984, "global_step": 252355, "epoch": 2085} {"train_loss": -42.314857482910156, "global_step": 252356, "epoch": 2085} {"train_loss": -42.62324142456055, "global_step": 252357, "epoch": 2085} {"train_loss": -42.726436614990234, "global_step": 252358, "epoch": 2085} {"train_loss": -42.86039352416992, "global_step": 252359, "epoch": 2085} {"train_loss": -42.4127082824707, "global_step": 252360, "epoch": 2085} {"train_loss": -42.98079299926758, "global_step": 252361, "epoch": 2085} {"train_loss": -42.64236831665039, "global_step": 252362, "epoch": 2085} {"train_loss": -42.596736907958984, "global_step": 252363, "epoch": 2085} {"train_loss": -42.839324951171875, "global_step": 252364, "epoch": 2085} {"train_loss": -43.07276153564453, "global_step": 252365, "epoch": 2085} {"train_loss": -42.753700256347656, "global_step": 252366, "epoch": 2085} {"train_loss": -42.85926818847656, "global_step": 252367, "epoch": 2085} {"train_loss": -42.81184005737305, "global_step": 252368, "epoch": 2085} {"train_loss": -43.683746337890625, "global_step": 252369, "epoch": 2085} {"train_loss": -42.708099365234375, "global_step": 252370, "epoch": 2085} {"train_loss": -42.70742416381836, "global_step": 252371, "epoch": 2085} {"train_loss": -42.37388610839844, "global_step": 252372, "epoch": 2085} {"train_loss": -43.19245529174805, "global_step": 252373, "epoch": 2085} {"train_loss": -43.241939544677734, "global_step": 252374, "epoch": 2085} {"train_loss": -43.248046875, "global_step": 252375, "epoch": 2085} {"train_loss": -42.986019134521484, "global_step": 252376, "epoch": 2085} {"train_loss": -43.32468795776367, "global_step": 252377, "epoch": 2085} {"train_loss": -43.36250686645508, "global_step": 252378, "epoch": 2085} {"train_loss": -43.38713836669922, "global_step": 252379, "epoch": 2085} {"train_loss": -43.69364547729492, "global_step": 252380, "epoch": 2085} {"train_loss": -43.49177169799805, "global_step": 252381, "epoch": 2085} {"train_loss": -43.28141403198242, "global_step": 252382, "epoch": 2085} {"train_loss": -43.079708099365234, "global_step": 252383, "epoch": 2085} {"train_loss": -43.83822250366211, "global_step": 252384, "epoch": 2085} {"train_loss": -42.80485153198242, "global_step": 252385, "epoch": 2085} {"train_loss": -43.56819534301758, "global_step": 252386, "epoch": 2085} {"train_loss": -43.49728012084961, "global_step": 252387, "epoch": 2085} {"train_loss": -43.47056579589844, "global_step": 252388, "epoch": 2085} {"train_loss": -43.22428512573242, "global_step": 252389, "epoch": 2085} {"train_loss": -43.413394927978516, "global_step": 252390, "epoch": 2085} {"train_loss": -43.6125602722168, "global_step": 252391, "epoch": 2085} {"train_loss": -43.48724365234375, "global_step": 252392, "epoch": 2085} {"train_loss": -43.296382904052734, "global_step": 252393, "epoch": 2085} {"train_loss": -43.23753356933594, "global_step": 252394, "epoch": 2085} {"train_loss": -43.5485725402832, "global_step": 252395, "epoch": 2085} {"train_loss": -43.738685607910156, "global_step": 252396, "epoch": 2085} {"train_loss": -42.95941925048828, "global_step": 252397, "epoch": 2085} {"train_loss": -40.2685661315918, "global_step": 252398, "epoch": 2085} {"train_loss": -43.739200592041016, "global_step": 252399, "epoch": 2085} {"train_loss": -41.7110710144043, "global_step": 252400, "epoch": 2085} {"train_loss": -43.327606201171875, "global_step": 252401, "epoch": 2085} {"train_loss": -42.51543426513672, "global_step": 252402, "epoch": 2085} {"train_loss": -43.65996170043945, "global_step": 252403, "epoch": 2085} {"train_loss": -41.97703170776367, "global_step": 252404, "epoch": 2085} {"train_loss": -41.880917289040305, "global_step": 252405, "epoch": 2085, "val_loss": 2695430.0} {"train_loss": -40.80710983276367, "global_step": 252406, "epoch": 2086} {"train_loss": -43.47704315185547, "global_step": 252407, "epoch": 2086} {"train_loss": -42.637474060058594, "global_step": 252408, "epoch": 2086} {"train_loss": -38.6274299621582, "global_step": 252409, "epoch": 2086} {"train_loss": -38.07992172241211, "global_step": 252410, "epoch": 2086} {"train_loss": -41.66550827026367, "global_step": 252411, "epoch": 2086} {"train_loss": -41.862545013427734, "global_step": 252412, "epoch": 2086} {"train_loss": -41.284603118896484, "global_step": 252413, "epoch": 2086} {"train_loss": -42.569149017333984, "global_step": 252414, "epoch": 2086} {"train_loss": -39.340450286865234, "global_step": 252415, "epoch": 2086} {"train_loss": -42.51618194580078, "global_step": 252416, "epoch": 2086} {"train_loss": -39.1225471496582, "global_step": 252417, "epoch": 2086} {"train_loss": -40.879329681396484, "global_step": 252418, "epoch": 2086} {"train_loss": -38.15647888183594, "global_step": 252419, "epoch": 2086} {"train_loss": -42.17196273803711, "global_step": 252420, "epoch": 2086} {"train_loss": -42.3586311340332, "global_step": 252421, "epoch": 2086} {"train_loss": -42.43009567260742, "global_step": 252422, "epoch": 2086} {"train_loss": -40.78840255737305, "global_step": 252423, "epoch": 2086} {"train_loss": -40.79621124267578, "global_step": 252424, "epoch": 2086} {"train_loss": -42.122154235839844, "global_step": 252425, "epoch": 2086} {"train_loss": -37.88057327270508, "global_step": 252426, "epoch": 2086} {"train_loss": -42.45748519897461, "global_step": 252427, "epoch": 2086} {"train_loss": -40.76957321166992, "global_step": 252428, "epoch": 2086} {"train_loss": -40.324790954589844, "global_step": 252429, "epoch": 2086} {"train_loss": -33.807708740234375, "global_step": 252430, "epoch": 2086} {"train_loss": -40.22486877441406, "global_step": 252431, "epoch": 2086} {"train_loss": -41.80387496948242, "global_step": 252432, "epoch": 2086} {"train_loss": -40.17879867553711, "global_step": 252433, "epoch": 2086} {"train_loss": -39.3128776550293, "global_step": 252434, "epoch": 2086} {"train_loss": -41.61497497558594, "global_step": 252435, "epoch": 2086} {"train_loss": -41.39823532104492, "global_step": 252436, "epoch": 2086} {"train_loss": -42.5252685546875, "global_step": 252437, "epoch": 2086} {"train_loss": -41.369041442871094, "global_step": 252438, "epoch": 2086} {"train_loss": -41.040401458740234, "global_step": 252439, "epoch": 2086} {"train_loss": -40.2414665222168, "global_step": 252440, "epoch": 2086} {"train_loss": -38.0988883972168, "global_step": 252441, "epoch": 2086} {"train_loss": -41.44432830810547, "global_step": 252442, "epoch": 2086} {"train_loss": -42.46426773071289, "global_step": 252443, "epoch": 2086} {"train_loss": -41.676513671875, "global_step": 252444, "epoch": 2086} {"train_loss": -40.83976745605469, "global_step": 252445, "epoch": 2086} {"train_loss": -39.94464111328125, "global_step": 252446, "epoch": 2086} {"train_loss": -39.99693298339844, "global_step": 252447, "epoch": 2086} {"train_loss": -40.00205612182617, "global_step": 252448, "epoch": 2086} {"train_loss": -42.20412826538086, "global_step": 252449, "epoch": 2086} {"train_loss": -42.29933547973633, "global_step": 252450, "epoch": 2086} {"train_loss": -43.033504486083984, "global_step": 252451, "epoch": 2086} {"train_loss": -41.941463470458984, "global_step": 252452, "epoch": 2086} {"train_loss": -42.9205322265625, "global_step": 252453, "epoch": 2086} {"train_loss": -42.297969818115234, "global_step": 252454, "epoch": 2086} {"train_loss": -42.61498260498047, "global_step": 252455, "epoch": 2086} {"train_loss": -42.484405517578125, "global_step": 252456, "epoch": 2086} {"train_loss": -40.731910705566406, "global_step": 252457, "epoch": 2086} {"train_loss": -42.45553970336914, "global_step": 252458, "epoch": 2086} {"train_loss": -41.80906295776367, "global_step": 252459, "epoch": 2086} {"train_loss": -40.87611389160156, "global_step": 252460, "epoch": 2086} {"train_loss": -42.58133316040039, "global_step": 252461, "epoch": 2086} {"train_loss": -40.90548324584961, "global_step": 252462, "epoch": 2086} {"train_loss": -41.899715423583984, "global_step": 252463, "epoch": 2086} {"train_loss": -42.51386642456055, "global_step": 252464, "epoch": 2086} {"train_loss": -41.62097930908203, "global_step": 252465, "epoch": 2086} {"train_loss": -42.661109924316406, "global_step": 252466, "epoch": 2086} {"train_loss": -41.81795120239258, "global_step": 252467, "epoch": 2086} {"train_loss": -41.610572814941406, "global_step": 252468, "epoch": 2086} {"train_loss": -40.91067123413086, "global_step": 252469, "epoch": 2086} {"train_loss": -42.2066764831543, "global_step": 252470, "epoch": 2086} {"train_loss": -40.93143844604492, "global_step": 252471, "epoch": 2086} {"train_loss": -42.18235778808594, "global_step": 252472, "epoch": 2086} {"train_loss": -40.87106704711914, "global_step": 252473, "epoch": 2086} {"train_loss": -41.83755111694336, "global_step": 252474, "epoch": 2086} {"train_loss": -41.36715316772461, "global_step": 252475, "epoch": 2086} {"train_loss": -41.722110748291016, "global_step": 252476, "epoch": 2086} {"train_loss": -41.55398178100586, "global_step": 252477, "epoch": 2086} {"train_loss": -42.66474533081055, "global_step": 252478, "epoch": 2086} {"train_loss": -41.98857498168945, "global_step": 252479, "epoch": 2086} {"train_loss": -41.72231674194336, "global_step": 252480, "epoch": 2086} {"train_loss": -42.88296127319336, "global_step": 252481, "epoch": 2086} {"train_loss": -42.04276657104492, "global_step": 252482, "epoch": 2086} {"train_loss": -41.711727142333984, "global_step": 252483, "epoch": 2086} {"train_loss": -42.816139221191406, "global_step": 252484, "epoch": 2086} {"train_loss": -41.64883804321289, "global_step": 252485, "epoch": 2086} {"train_loss": -42.2984504699707, "global_step": 252486, "epoch": 2086} {"train_loss": -42.26190185546875, "global_step": 252487, "epoch": 2086} {"train_loss": -41.94710922241211, "global_step": 252488, "epoch": 2086} {"train_loss": -43.086936950683594, "global_step": 252489, "epoch": 2086} {"train_loss": -42.2744140625, "global_step": 252490, "epoch": 2086} {"train_loss": -42.660736083984375, "global_step": 252491, "epoch": 2086} {"train_loss": -42.0506706237793, "global_step": 252492, "epoch": 2086} {"train_loss": -43.03577423095703, "global_step": 252493, "epoch": 2086} {"train_loss": -42.653289794921875, "global_step": 252494, "epoch": 2086} {"train_loss": -43.049835205078125, "global_step": 252495, "epoch": 2086} {"train_loss": -41.83857345581055, "global_step": 252496, "epoch": 2086} {"train_loss": -42.60636520385742, "global_step": 252497, "epoch": 2086} {"train_loss": -42.20928955078125, "global_step": 252498, "epoch": 2086} {"train_loss": -42.835609436035156, "global_step": 252499, "epoch": 2086} {"train_loss": -42.478519439697266, "global_step": 252500, "epoch": 2086} {"train_loss": -42.22322082519531, "global_step": 252501, "epoch": 2086} {"train_loss": -42.285552978515625, "global_step": 252502, "epoch": 2086} {"train_loss": -42.515201568603516, "global_step": 252503, "epoch": 2086} {"train_loss": -42.534053802490234, "global_step": 252504, "epoch": 2086} {"train_loss": -42.675628662109375, "global_step": 252505, "epoch": 2086} {"train_loss": -42.684993743896484, "global_step": 252506, "epoch": 2086} {"train_loss": -43.16252517700195, "global_step": 252507, "epoch": 2086} {"train_loss": -42.0038948059082, "global_step": 252508, "epoch": 2086} {"train_loss": -41.287498474121094, "global_step": 252509, "epoch": 2086} {"train_loss": -42.717559814453125, "global_step": 252510, "epoch": 2086} {"train_loss": -41.73994064331055, "global_step": 252511, "epoch": 2086} {"train_loss": -42.58075714111328, "global_step": 252512, "epoch": 2086} {"train_loss": -42.782527923583984, "global_step": 252513, "epoch": 2086} {"train_loss": -42.7739143371582, "global_step": 252514, "epoch": 2086} {"train_loss": -40.8260612487793, "global_step": 252515, "epoch": 2086} {"train_loss": -40.86747360229492, "global_step": 252516, "epoch": 2086} {"train_loss": -41.317691802978516, "global_step": 252517, "epoch": 2086} {"train_loss": -39.578765869140625, "global_step": 252518, "epoch": 2086} {"train_loss": -42.045997619628906, "global_step": 252519, "epoch": 2086} {"train_loss": -42.67021560668945, "global_step": 252520, "epoch": 2086} {"train_loss": -41.78367233276367, "global_step": 252521, "epoch": 2086} {"train_loss": -41.78353500366211, "global_step": 252522, "epoch": 2086} {"train_loss": -43.18903350830078, "global_step": 252523, "epoch": 2086} {"train_loss": -42.90610885620117, "global_step": 252524, "epoch": 2086} {"train_loss": -42.51736068725586, "global_step": 252525, "epoch": 2086} {"train_loss": -41.62592700296197, "global_step": 252526, "epoch": 2086, "val_loss": 2590357.0} {"train_loss": -42.70578384399414, "global_step": 252527, "epoch": 2087} {"train_loss": -42.50305938720703, "global_step": 252528, "epoch": 2087} {"train_loss": -42.023231506347656, "global_step": 252529, "epoch": 2087} {"train_loss": -42.13549041748047, "global_step": 252530, "epoch": 2087} {"train_loss": -41.79993438720703, "global_step": 252531, "epoch": 2087} {"train_loss": -41.89864730834961, "global_step": 252532, "epoch": 2087} {"train_loss": -43.022640228271484, "global_step": 252533, "epoch": 2087} {"train_loss": -42.49393844604492, "global_step": 252534, "epoch": 2087} {"train_loss": -41.007408142089844, "global_step": 252535, "epoch": 2087} {"train_loss": -40.88270568847656, "global_step": 252536, "epoch": 2087} {"train_loss": -41.91197204589844, "global_step": 252537, "epoch": 2087} {"train_loss": -42.77154541015625, "global_step": 252538, "epoch": 2087} {"train_loss": -42.13312530517578, "global_step": 252539, "epoch": 2087} {"train_loss": -41.115272521972656, "global_step": 252540, "epoch": 2087} {"train_loss": -42.64703369140625, "global_step": 252541, "epoch": 2087} {"train_loss": -43.10543441772461, "global_step": 252542, "epoch": 2087} {"train_loss": -42.69865798950195, "global_step": 252543, "epoch": 2087} {"train_loss": -41.84269332885742, "global_step": 252544, "epoch": 2087} {"train_loss": -40.84784698486328, "global_step": 252545, "epoch": 2087} {"train_loss": -42.18235397338867, "global_step": 252546, "epoch": 2087} {"train_loss": -41.607086181640625, "global_step": 252547, "epoch": 2087} {"train_loss": -42.459022521972656, "global_step": 252548, "epoch": 2087} {"train_loss": -41.983070373535156, "global_step": 252549, "epoch": 2087} {"train_loss": -41.8927001953125, "global_step": 252550, "epoch": 2087} {"train_loss": -42.79287338256836, "global_step": 252551, "epoch": 2087} {"train_loss": -42.87440490722656, "global_step": 252552, "epoch": 2087} {"train_loss": -42.41544723510742, "global_step": 252553, "epoch": 2087} {"train_loss": -42.52886962890625, "global_step": 252554, "epoch": 2087} {"train_loss": -41.746456146240234, "global_step": 252555, "epoch": 2087} {"train_loss": -42.09906005859375, "global_step": 252556, "epoch": 2087} {"train_loss": -41.699859619140625, "global_step": 252557, "epoch": 2087} {"train_loss": -36.76406478881836, "global_step": 252558, "epoch": 2087} {"train_loss": -41.94828414916992, "global_step": 252559, "epoch": 2087} {"train_loss": -41.896339416503906, "global_step": 252560, "epoch": 2087} {"train_loss": -39.324642181396484, "global_step": 252561, "epoch": 2087} {"train_loss": -40.62656784057617, "global_step": 252562, "epoch": 2087} {"train_loss": -42.06541061401367, "global_step": 252563, "epoch": 2087} {"train_loss": -41.66856002807617, "global_step": 252564, "epoch": 2087} {"train_loss": -41.23247528076172, "global_step": 252565, "epoch": 2087} {"train_loss": -40.15950393676758, "global_step": 252566, "epoch": 2087} {"train_loss": -29.72869300842285, "global_step": 252567, "epoch": 2087} {"train_loss": -34.951881408691406, "global_step": 252568, "epoch": 2087} {"train_loss": -40.197601318359375, "global_step": 252569, "epoch": 2087} {"train_loss": -36.9741096496582, "global_step": 252570, "epoch": 2087} {"train_loss": -38.873374938964844, "global_step": 252571, "epoch": 2087} {"train_loss": -40.82905197143555, "global_step": 252572, "epoch": 2087} {"train_loss": -37.8755989074707, "global_step": 252573, "epoch": 2087} {"train_loss": -39.47660827636719, "global_step": 252574, "epoch": 2087} {"train_loss": -39.281402587890625, "global_step": 252575, "epoch": 2087} {"train_loss": -39.17708206176758, "global_step": 252576, "epoch": 2087} {"train_loss": -39.55363082885742, "global_step": 252577, "epoch": 2087} {"train_loss": -41.43170928955078, "global_step": 252578, "epoch": 2087} {"train_loss": -39.45096969604492, "global_step": 252579, "epoch": 2087} {"train_loss": -39.654781341552734, "global_step": 252580, "epoch": 2087} {"train_loss": -40.9045295715332, "global_step": 252581, "epoch": 2087} {"train_loss": -37.83015441894531, "global_step": 252582, "epoch": 2087} {"train_loss": -40.516502380371094, "global_step": 252583, "epoch": 2087} {"train_loss": -40.2579460144043, "global_step": 252584, "epoch": 2087} {"train_loss": -37.793067932128906, "global_step": 252585, "epoch": 2087} {"train_loss": -36.97559356689453, "global_step": 252586, "epoch": 2087} {"train_loss": -38.52451705932617, "global_step": 252587, "epoch": 2087} {"train_loss": -26.61139488220215, "global_step": 252588, "epoch": 2087} {"train_loss": -35.927894592285156, "global_step": 252589, "epoch": 2087} {"train_loss": -35.26361083984375, "global_step": 252590, "epoch": 2087} {"train_loss": -38.583045959472656, "global_step": 252591, "epoch": 2087} {"train_loss": -39.10249710083008, "global_step": 252592, "epoch": 2087} {"train_loss": -33.0274543762207, "global_step": 252593, "epoch": 2087} {"train_loss": -37.96769714355469, "global_step": 252594, "epoch": 2087} {"train_loss": -36.01987075805664, "global_step": 252595, "epoch": 2087} {"train_loss": -38.86289596557617, "global_step": 252596, "epoch": 2087} {"train_loss": -33.1451530456543, "global_step": 252597, "epoch": 2087} {"train_loss": -34.35665512084961, "global_step": 252598, "epoch": 2087} {"train_loss": -38.08646774291992, "global_step": 252599, "epoch": 2087} {"train_loss": -38.33735275268555, "global_step": 252600, "epoch": 2087} {"train_loss": -36.08468246459961, "global_step": 252601, "epoch": 2087} {"train_loss": -39.177547454833984, "global_step": 252602, "epoch": 2087} {"train_loss": -37.55141830444336, "global_step": 252603, "epoch": 2087} {"train_loss": -38.74170684814453, "global_step": 252604, "epoch": 2087} {"train_loss": -39.27838897705078, "global_step": 252605, "epoch": 2087} {"train_loss": -38.58565139770508, "global_step": 252606, "epoch": 2087} {"train_loss": -39.229705810546875, "global_step": 252607, "epoch": 2087} {"train_loss": -38.20894241333008, "global_step": 252608, "epoch": 2087} {"train_loss": -36.90679168701172, "global_step": 252609, "epoch": 2087} {"train_loss": -39.59122848510742, "global_step": 252610, "epoch": 2087} {"train_loss": -39.88410568237305, "global_step": 252611, "epoch": 2087} {"train_loss": -37.96052169799805, "global_step": 252612, "epoch": 2087} {"train_loss": -38.829307556152344, "global_step": 252613, "epoch": 2087} {"train_loss": -39.68718338012695, "global_step": 252614, "epoch": 2087} {"train_loss": -39.829429626464844, "global_step": 252615, "epoch": 2087} {"train_loss": -39.2682991027832, "global_step": 252616, "epoch": 2087} {"train_loss": -38.82438278198242, "global_step": 252617, "epoch": 2087} {"train_loss": -40.06656265258789, "global_step": 252618, "epoch": 2087} {"train_loss": -38.9481201171875, "global_step": 252619, "epoch": 2087} {"train_loss": -40.17022705078125, "global_step": 252620, "epoch": 2087} {"train_loss": -40.25349044799805, "global_step": 252621, "epoch": 2087} {"train_loss": -39.486663818359375, "global_step": 252622, "epoch": 2087} {"train_loss": -40.70418930053711, "global_step": 252623, "epoch": 2087} {"train_loss": -40.456783294677734, "global_step": 252624, "epoch": 2087} {"train_loss": -40.20838165283203, "global_step": 252625, "epoch": 2087} {"train_loss": -41.262088775634766, "global_step": 252626, "epoch": 2087} {"train_loss": -39.585418701171875, "global_step": 252627, "epoch": 2087} {"train_loss": -41.09305953979492, "global_step": 252628, "epoch": 2087} {"train_loss": -40.46314239501953, "global_step": 252629, "epoch": 2087} {"train_loss": -41.0374870300293, "global_step": 252630, "epoch": 2087} {"train_loss": -41.55202865600586, "global_step": 252631, "epoch": 2087} {"train_loss": -39.790863037109375, "global_step": 252632, "epoch": 2087} {"train_loss": -41.27519607543945, "global_step": 252633, "epoch": 2087} {"train_loss": -41.72532653808594, "global_step": 252634, "epoch": 2087} {"train_loss": -40.854766845703125, "global_step": 252635, "epoch": 2087} {"train_loss": -40.62055206298828, "global_step": 252636, "epoch": 2087} {"train_loss": -40.90310287475586, "global_step": 252637, "epoch": 2087} {"train_loss": -40.82334518432617, "global_step": 252638, "epoch": 2087} {"train_loss": -41.59765625, "global_step": 252639, "epoch": 2087} {"train_loss": -41.294273376464844, "global_step": 252640, "epoch": 2087} {"train_loss": -41.301246643066406, "global_step": 252641, "epoch": 2087} {"train_loss": -40.822174072265625, "global_step": 252642, "epoch": 2087} {"train_loss": -41.0355224609375, "global_step": 252643, "epoch": 2087} {"train_loss": -40.149024963378906, "global_step": 252644, "epoch": 2087} {"train_loss": -41.31418991088867, "global_step": 252645, "epoch": 2087} {"train_loss": -41.98183822631836, "global_step": 252646, "epoch": 2087} {"train_loss": -39.89579073062613, "global_step": 252647, "epoch": 2087, "val_loss": 2642614.25} {"train_loss": -41.961368560791016, "global_step": 252648, "epoch": 2088} {"train_loss": -41.28823471069336, "global_step": 252649, "epoch": 2088} {"train_loss": -41.94392013549805, "global_step": 252650, "epoch": 2088} {"train_loss": -42.048580169677734, "global_step": 252651, "epoch": 2088} {"train_loss": -42.184627532958984, "global_step": 252652, "epoch": 2088} {"train_loss": -42.17145919799805, "global_step": 252653, "epoch": 2088} {"train_loss": -42.11122512817383, "global_step": 252654, "epoch": 2088} {"train_loss": -41.95608139038086, "global_step": 252655, "epoch": 2088} {"train_loss": -41.87163162231445, "global_step": 252656, "epoch": 2088} {"train_loss": -42.305965423583984, "global_step": 252657, "epoch": 2088} {"train_loss": -42.1453971862793, "global_step": 252658, "epoch": 2088} {"train_loss": -41.89056396484375, "global_step": 252659, "epoch": 2088} {"train_loss": -41.596065521240234, "global_step": 252660, "epoch": 2088} {"train_loss": -41.582977294921875, "global_step": 252661, "epoch": 2088} {"train_loss": -42.555301666259766, "global_step": 252662, "epoch": 2088} {"train_loss": -42.24238204956055, "global_step": 252663, "epoch": 2088} {"train_loss": -42.130775451660156, "global_step": 252664, "epoch": 2088} {"train_loss": -42.111873626708984, "global_step": 252665, "epoch": 2088} {"train_loss": -42.47251510620117, "global_step": 252666, "epoch": 2088} {"train_loss": -42.23158645629883, "global_step": 252667, "epoch": 2088} {"train_loss": -41.36504364013672, "global_step": 252668, "epoch": 2088} {"train_loss": -42.50896072387695, "global_step": 252669, "epoch": 2088} {"train_loss": -42.858154296875, "global_step": 252670, "epoch": 2088} {"train_loss": -42.43451690673828, "global_step": 252671, "epoch": 2088} {"train_loss": -42.88265609741211, "global_step": 252672, "epoch": 2088} {"train_loss": -39.89030075073242, "global_step": 252673, "epoch": 2088} {"train_loss": -42.29096221923828, "global_step": 252674, "epoch": 2088} {"train_loss": -41.27975082397461, "global_step": 252675, "epoch": 2088} {"train_loss": -42.646663665771484, "global_step": 252676, "epoch": 2088} {"train_loss": -42.47391891479492, "global_step": 252677, "epoch": 2088} {"train_loss": -42.27995681762695, "global_step": 252678, "epoch": 2088} {"train_loss": -42.76047897338867, "global_step": 252679, "epoch": 2088} {"train_loss": -42.126182556152344, "global_step": 252680, "epoch": 2088} {"train_loss": -40.50931930541992, "global_step": 252681, "epoch": 2088} {"train_loss": -42.49528884887695, "global_step": 252682, "epoch": 2088} {"train_loss": -42.675594329833984, "global_step": 252683, "epoch": 2088} {"train_loss": -42.09617614746094, "global_step": 252684, "epoch": 2088} {"train_loss": -42.941158294677734, "global_step": 252685, "epoch": 2088} {"train_loss": -42.59299850463867, "global_step": 252686, "epoch": 2088} {"train_loss": -42.27118682861328, "global_step": 252687, "epoch": 2088} {"train_loss": -42.65908432006836, "global_step": 252688, "epoch": 2088} {"train_loss": -42.497703552246094, "global_step": 252689, "epoch": 2088} {"train_loss": -42.824798583984375, "global_step": 252690, "epoch": 2088} {"train_loss": -42.36505126953125, "global_step": 252691, "epoch": 2088} {"train_loss": -40.80093002319336, "global_step": 252692, "epoch": 2088} {"train_loss": -42.91482925415039, "global_step": 252693, "epoch": 2088} {"train_loss": -42.396602630615234, "global_step": 252694, "epoch": 2088} {"train_loss": -42.96297836303711, "global_step": 252695, "epoch": 2088} {"train_loss": -41.3027458190918, "global_step": 252696, "epoch": 2088} {"train_loss": -42.36019515991211, "global_step": 252697, "epoch": 2088} {"train_loss": -42.48833084106445, "global_step": 252698, "epoch": 2088} {"train_loss": -42.47966384887695, "global_step": 252699, "epoch": 2088} {"train_loss": -39.6792106628418, "global_step": 252700, "epoch": 2088} {"train_loss": -42.0647087097168, "global_step": 252701, "epoch": 2088} {"train_loss": -41.74550247192383, "global_step": 252702, "epoch": 2088} {"train_loss": -41.40390396118164, "global_step": 252703, "epoch": 2088} {"train_loss": -41.86725616455078, "global_step": 252704, "epoch": 2088} {"train_loss": -41.5299186706543, "global_step": 252705, "epoch": 2088} {"train_loss": -42.002010345458984, "global_step": 252706, "epoch": 2088} {"train_loss": -41.46663284301758, "global_step": 252707, "epoch": 2088} {"train_loss": -40.3498649597168, "global_step": 252708, "epoch": 2088} {"train_loss": -40.47578048706055, "global_step": 252709, "epoch": 2088} {"train_loss": -41.589656829833984, "global_step": 252710, "epoch": 2088} {"train_loss": -41.312522888183594, "global_step": 252711, "epoch": 2088} {"train_loss": -40.80814743041992, "global_step": 252712, "epoch": 2088} {"train_loss": -42.467445373535156, "global_step": 252713, "epoch": 2088} {"train_loss": -41.69047164916992, "global_step": 252714, "epoch": 2088} {"train_loss": -39.96611404418945, "global_step": 252715, "epoch": 2088} {"train_loss": -37.286102294921875, "global_step": 252716, "epoch": 2088} {"train_loss": -40.444732666015625, "global_step": 252717, "epoch": 2088} {"train_loss": -41.4752082824707, "global_step": 252718, "epoch": 2088} {"train_loss": -38.933387756347656, "global_step": 252719, "epoch": 2088} {"train_loss": -41.17922592163086, "global_step": 252720, "epoch": 2088} {"train_loss": -41.821685791015625, "global_step": 252721, "epoch": 2088} {"train_loss": -41.91355514526367, "global_step": 252722, "epoch": 2088} {"train_loss": -41.585262298583984, "global_step": 252723, "epoch": 2088} {"train_loss": -41.978572845458984, "global_step": 252724, "epoch": 2088} {"train_loss": -40.57429122924805, "global_step": 252725, "epoch": 2088} {"train_loss": -41.71181869506836, "global_step": 252726, "epoch": 2088} {"train_loss": -41.76763153076172, "global_step": 252727, "epoch": 2088} {"train_loss": -41.34092330932617, "global_step": 252728, "epoch": 2088} {"train_loss": -41.67803955078125, "global_step": 252729, "epoch": 2088} {"train_loss": -42.10784149169922, "global_step": 252730, "epoch": 2088} {"train_loss": -41.45216751098633, "global_step": 252731, "epoch": 2088} {"train_loss": -42.266666412353516, "global_step": 252732, "epoch": 2088} {"train_loss": -41.805355072021484, "global_step": 252733, "epoch": 2088} {"train_loss": -40.46674728393555, "global_step": 252734, "epoch": 2088} {"train_loss": -42.35667037963867, "global_step": 252735, "epoch": 2088} {"train_loss": -40.50043487548828, "global_step": 252736, "epoch": 2088} {"train_loss": -42.58708953857422, "global_step": 252737, "epoch": 2088} {"train_loss": -41.0331916809082, "global_step": 252738, "epoch": 2088} {"train_loss": -41.63117599487305, "global_step": 252739, "epoch": 2088} {"train_loss": -42.06563949584961, "global_step": 252740, "epoch": 2088} {"train_loss": -41.6184196472168, "global_step": 252741, "epoch": 2088} {"train_loss": -42.519405364990234, "global_step": 252742, "epoch": 2088} {"train_loss": -41.839962005615234, "global_step": 252743, "epoch": 2088} {"train_loss": -41.39716720581055, "global_step": 252744, "epoch": 2088} {"train_loss": -41.77009963989258, "global_step": 252745, "epoch": 2088} {"train_loss": -42.59999465942383, "global_step": 252746, "epoch": 2088} {"train_loss": -42.45640182495117, "global_step": 252747, "epoch": 2088} {"train_loss": -41.590511322021484, "global_step": 252748, "epoch": 2088} {"train_loss": -42.4265022277832, "global_step": 252749, "epoch": 2088} {"train_loss": -42.3196907043457, "global_step": 252750, "epoch": 2088} {"train_loss": -42.1792106628418, "global_step": 252751, "epoch": 2088} {"train_loss": -42.573570251464844, "global_step": 252752, "epoch": 2088} {"train_loss": -41.23773956298828, "global_step": 252753, "epoch": 2088} {"train_loss": -41.16853332519531, "global_step": 252754, "epoch": 2088} {"train_loss": -41.2802619934082, "global_step": 252755, "epoch": 2088} {"train_loss": -42.19936752319336, "global_step": 252756, "epoch": 2088} {"train_loss": -41.81293869018555, "global_step": 252757, "epoch": 2088} {"train_loss": -42.50670623779297, "global_step": 252758, "epoch": 2088} {"train_loss": -42.888938903808594, "global_step": 252759, "epoch": 2088} {"train_loss": -42.15000534057617, "global_step": 252760, "epoch": 2088} {"train_loss": -42.41203689575195, "global_step": 252761, "epoch": 2088} {"train_loss": -42.686248779296875, "global_step": 252762, "epoch": 2088} {"train_loss": -40.29714584350586, "global_step": 252763, "epoch": 2088} {"train_loss": -41.994415283203125, "global_step": 252764, "epoch": 2088} {"train_loss": -42.1387939453125, "global_step": 252765, "epoch": 2088} {"train_loss": -42.32391357421875, "global_step": 252766, "epoch": 2088} {"train_loss": -42.75056457519531, "global_step": 252767, "epoch": 2088} {"train_loss": -41.827284347912496, "global_step": 252768, "epoch": 2088, "val_loss": 2616976.25} {"train_loss": -41.0357551574707, "global_step": 252769, "epoch": 2089} {"train_loss": -42.95234298706055, "global_step": 252770, "epoch": 2089} {"train_loss": -41.534996032714844, "global_step": 252771, "epoch": 2089} {"train_loss": -41.679054260253906, "global_step": 252772, "epoch": 2089} {"train_loss": -41.46028137207031, "global_step": 252773, "epoch": 2089} {"train_loss": -41.97222900390625, "global_step": 252774, "epoch": 2089} {"train_loss": -42.04195785522461, "global_step": 252775, "epoch": 2089} {"train_loss": -41.66875076293945, "global_step": 252776, "epoch": 2089} {"train_loss": -41.5327033996582, "global_step": 252777, "epoch": 2089} {"train_loss": -42.37089157104492, "global_step": 252778, "epoch": 2089} {"train_loss": -41.40340805053711, "global_step": 252779, "epoch": 2089} {"train_loss": -41.81930160522461, "global_step": 252780, "epoch": 2089} {"train_loss": -39.620967864990234, "global_step": 252781, "epoch": 2089} {"train_loss": -39.938819885253906, "global_step": 252782, "epoch": 2089} {"train_loss": -42.365779876708984, "global_step": 252783, "epoch": 2089} {"train_loss": -42.011451721191406, "global_step": 252784, "epoch": 2089} {"train_loss": -41.56931686401367, "global_step": 252785, "epoch": 2089} {"train_loss": -41.446285247802734, "global_step": 252786, "epoch": 2089} {"train_loss": -42.122676849365234, "global_step": 252787, "epoch": 2089} {"train_loss": -42.0117073059082, "global_step": 252788, "epoch": 2089} {"train_loss": -41.6123046875, "global_step": 252789, "epoch": 2089} {"train_loss": -42.15543746948242, "global_step": 252790, "epoch": 2089} {"train_loss": -42.124996185302734, "global_step": 252791, "epoch": 2089} {"train_loss": -41.62717819213867, "global_step": 252792, "epoch": 2089} {"train_loss": -43.06669235229492, "global_step": 252793, "epoch": 2089} {"train_loss": -42.418190002441406, "global_step": 252794, "epoch": 2089} {"train_loss": -42.25910568237305, "global_step": 252795, "epoch": 2089} {"train_loss": -42.111061096191406, "global_step": 252796, "epoch": 2089} {"train_loss": -42.80208969116211, "global_step": 252797, "epoch": 2089} {"train_loss": -42.53042984008789, "global_step": 252798, "epoch": 2089} {"train_loss": -42.40120315551758, "global_step": 252799, "epoch": 2089} {"train_loss": -42.634002685546875, "global_step": 252800, "epoch": 2089} {"train_loss": -41.91054916381836, "global_step": 252801, "epoch": 2089} {"train_loss": -42.14662551879883, "global_step": 252802, "epoch": 2089} {"train_loss": -43.17727279663086, "global_step": 252803, "epoch": 2089} {"train_loss": -41.988807678222656, "global_step": 252804, "epoch": 2089} {"train_loss": -40.7962760925293, "global_step": 252805, "epoch": 2089} {"train_loss": -42.9014892578125, "global_step": 252806, "epoch": 2089} {"train_loss": -42.72087860107422, "global_step": 252807, "epoch": 2089} {"train_loss": -42.2198486328125, "global_step": 252808, "epoch": 2089} {"train_loss": -42.69807815551758, "global_step": 252809, "epoch": 2089} {"train_loss": -42.65542221069336, "global_step": 252810, "epoch": 2089} {"train_loss": -43.140480041503906, "global_step": 252811, "epoch": 2089} {"train_loss": -42.756080627441406, "global_step": 252812, "epoch": 2089} {"train_loss": -42.552364349365234, "global_step": 252813, "epoch": 2089} {"train_loss": -42.45359420776367, "global_step": 252814, "epoch": 2089} {"train_loss": -41.81386947631836, "global_step": 252815, "epoch": 2089} {"train_loss": -42.50979232788086, "global_step": 252816, "epoch": 2089} {"train_loss": -43.16151809692383, "global_step": 252817, "epoch": 2089} {"train_loss": -42.558956146240234, "global_step": 252818, "epoch": 2089} {"train_loss": -42.536376953125, "global_step": 252819, "epoch": 2089} {"train_loss": -42.492042541503906, "global_step": 252820, "epoch": 2089} {"train_loss": -43.03333282470703, "global_step": 252821, "epoch": 2089} {"train_loss": -42.54296875, "global_step": 252822, "epoch": 2089} {"train_loss": -42.40920639038086, "global_step": 252823, "epoch": 2089} {"train_loss": -41.9835205078125, "global_step": 252824, "epoch": 2089} {"train_loss": -41.495880126953125, "global_step": 252825, "epoch": 2089} {"train_loss": -41.394073486328125, "global_step": 252826, "epoch": 2089} {"train_loss": -41.21037673950195, "global_step": 252827, "epoch": 2089} {"train_loss": -41.19970703125, "global_step": 252828, "epoch": 2089} {"train_loss": -42.233272552490234, "global_step": 252829, "epoch": 2089} {"train_loss": -42.73222732543945, "global_step": 252830, "epoch": 2089} {"train_loss": -41.938331604003906, "global_step": 252831, "epoch": 2089} {"train_loss": -41.200477600097656, "global_step": 252832, "epoch": 2089} {"train_loss": -39.44670486450195, "global_step": 252833, "epoch": 2089} {"train_loss": -39.4312858581543, "global_step": 252834, "epoch": 2089} {"train_loss": -35.788734436035156, "global_step": 252835, "epoch": 2089} {"train_loss": -39.0218505859375, "global_step": 252836, "epoch": 2089} {"train_loss": -42.447322845458984, "global_step": 252837, "epoch": 2089} {"train_loss": -42.445980072021484, "global_step": 252838, "epoch": 2089} {"train_loss": -40.791969299316406, "global_step": 252839, "epoch": 2089} {"train_loss": -42.48519515991211, "global_step": 252840, "epoch": 2089} {"train_loss": -42.82583999633789, "global_step": 252841, "epoch": 2089} {"train_loss": -41.82037353515625, "global_step": 252842, "epoch": 2089} {"train_loss": -40.92424392700195, "global_step": 252843, "epoch": 2089} {"train_loss": -41.69681167602539, "global_step": 252844, "epoch": 2089} {"train_loss": -42.34517288208008, "global_step": 252845, "epoch": 2089} {"train_loss": -42.78928756713867, "global_step": 252846, "epoch": 2089} {"train_loss": -42.41892623901367, "global_step": 252847, "epoch": 2089} {"train_loss": -41.955291748046875, "global_step": 252848, "epoch": 2089} {"train_loss": -42.53487777709961, "global_step": 252849, "epoch": 2089} {"train_loss": -41.92035675048828, "global_step": 252850, "epoch": 2089} {"train_loss": -42.119075775146484, "global_step": 252851, "epoch": 2089} {"train_loss": -39.62754821777344, "global_step": 252852, "epoch": 2089} {"train_loss": -41.51386642456055, "global_step": 252853, "epoch": 2089} {"train_loss": -41.1970329284668, "global_step": 252854, "epoch": 2089} {"train_loss": -40.56563186645508, "global_step": 252855, "epoch": 2089} {"train_loss": -40.58970260620117, "global_step": 252856, "epoch": 2089} {"train_loss": -43.092041015625, "global_step": 252857, "epoch": 2089} {"train_loss": -41.23088455200195, "global_step": 252858, "epoch": 2089} {"train_loss": -40.756629943847656, "global_step": 252859, "epoch": 2089} {"train_loss": -42.18709182739258, "global_step": 252860, "epoch": 2089} {"train_loss": -42.51583480834961, "global_step": 252861, "epoch": 2089} {"train_loss": -40.0867919921875, "global_step": 252862, "epoch": 2089} {"train_loss": -41.43384552001953, "global_step": 252863, "epoch": 2089} {"train_loss": -42.89924240112305, "global_step": 252864, "epoch": 2089} {"train_loss": -40.636295318603516, "global_step": 252865, "epoch": 2089} {"train_loss": -40.7724723815918, "global_step": 252866, "epoch": 2089} {"train_loss": -42.63235092163086, "global_step": 252867, "epoch": 2089} {"train_loss": -41.32305908203125, "global_step": 252868, "epoch": 2089} {"train_loss": -41.33262634277344, "global_step": 252869, "epoch": 2089} {"train_loss": -42.58777618408203, "global_step": 252870, "epoch": 2089} {"train_loss": -41.869258880615234, "global_step": 252871, "epoch": 2089} {"train_loss": -40.549320220947266, "global_step": 252872, "epoch": 2089} {"train_loss": -42.07587432861328, "global_step": 252873, "epoch": 2089} {"train_loss": -42.05097579956055, "global_step": 252874, "epoch": 2089} {"train_loss": -40.743927001953125, "global_step": 252875, "epoch": 2089} {"train_loss": -42.24293899536133, "global_step": 252876, "epoch": 2089} {"train_loss": -41.293121337890625, "global_step": 252877, "epoch": 2089} {"train_loss": -40.398807525634766, "global_step": 252878, "epoch": 2089} {"train_loss": -41.78083419799805, "global_step": 252879, "epoch": 2089} {"train_loss": -41.67527389526367, "global_step": 252880, "epoch": 2089} {"train_loss": -42.28291702270508, "global_step": 252881, "epoch": 2089} {"train_loss": -41.88496017456055, "global_step": 252882, "epoch": 2089} {"train_loss": -41.686641693115234, "global_step": 252883, "epoch": 2089} {"train_loss": -42.123836517333984, "global_step": 252884, "epoch": 2089} {"train_loss": -41.282405853271484, "global_step": 252885, "epoch": 2089} {"train_loss": -42.13419723510742, "global_step": 252886, "epoch": 2089} {"train_loss": -42.15852355957031, "global_step": 252887, "epoch": 2089} {"train_loss": -41.08369064331055, "global_step": 252888, "epoch": 2089} {"train_loss": -41.777503084545295, "global_step": 252889, "epoch": 2089, "val_loss": 2520027.0} {"train_loss": -42.4099006652832, "global_step": 252890, "epoch": 2090} {"train_loss": -34.882408142089844, "global_step": 252891, "epoch": 2090} {"train_loss": -41.8980827331543, "global_step": 252892, "epoch": 2090} {"train_loss": -41.174922943115234, "global_step": 252893, "epoch": 2090} {"train_loss": -40.2528190612793, "global_step": 252894, "epoch": 2090} {"train_loss": -41.3680534362793, "global_step": 252895, "epoch": 2090} {"train_loss": -40.20504379272461, "global_step": 252896, "epoch": 2090} {"train_loss": -42.306312561035156, "global_step": 252897, "epoch": 2090} {"train_loss": -39.842742919921875, "global_step": 252898, "epoch": 2090} {"train_loss": -37.955928802490234, "global_step": 252899, "epoch": 2090} {"train_loss": -42.03275680541992, "global_step": 252900, "epoch": 2090} {"train_loss": -40.59376907348633, "global_step": 252901, "epoch": 2090} {"train_loss": -41.78254699707031, "global_step": 252902, "epoch": 2090} {"train_loss": -41.6612548828125, "global_step": 252903, "epoch": 2090} {"train_loss": -40.80933380126953, "global_step": 252904, "epoch": 2090} {"train_loss": -41.51125717163086, "global_step": 252905, "epoch": 2090} {"train_loss": -40.33625411987305, "global_step": 252906, "epoch": 2090} {"train_loss": -40.16935348510742, "global_step": 252907, "epoch": 2090} {"train_loss": -41.82673263549805, "global_step": 252908, "epoch": 2090} {"train_loss": -41.13014602661133, "global_step": 252909, "epoch": 2090} {"train_loss": -35.98408508300781, "global_step": 252910, "epoch": 2090} {"train_loss": -41.37190628051758, "global_step": 252911, "epoch": 2090} {"train_loss": -40.723121643066406, "global_step": 252912, "epoch": 2090} {"train_loss": -41.38499450683594, "global_step": 252913, "epoch": 2090} {"train_loss": -41.38412857055664, "global_step": 252914, "epoch": 2090} {"train_loss": -41.856964111328125, "global_step": 252915, "epoch": 2090} {"train_loss": -40.565345764160156, "global_step": 252916, "epoch": 2090} {"train_loss": -41.8553466796875, "global_step": 252917, "epoch": 2090} {"train_loss": -41.8288688659668, "global_step": 252918, "epoch": 2090} {"train_loss": -40.070003509521484, "global_step": 252919, "epoch": 2090} {"train_loss": -41.64778518676758, "global_step": 252920, "epoch": 2090} {"train_loss": -42.17191696166992, "global_step": 252921, "epoch": 2090} {"train_loss": -41.27799606323242, "global_step": 252922, "epoch": 2090} {"train_loss": -42.758705139160156, "global_step": 252923, "epoch": 2090} {"train_loss": -39.911991119384766, "global_step": 252924, "epoch": 2090} {"train_loss": -40.67365646362305, "global_step": 252925, "epoch": 2090} {"train_loss": -41.55031967163086, "global_step": 252926, "epoch": 2090} {"train_loss": -39.640724182128906, "global_step": 252927, "epoch": 2090} {"train_loss": -39.09852981567383, "global_step": 252928, "epoch": 2090} {"train_loss": -42.446048736572266, "global_step": 252929, "epoch": 2090} {"train_loss": -41.329898834228516, "global_step": 252930, "epoch": 2090} {"train_loss": -42.22053909301758, "global_step": 252931, "epoch": 2090} {"train_loss": -40.969093322753906, "global_step": 252932, "epoch": 2090} {"train_loss": -41.84674835205078, "global_step": 252933, "epoch": 2090} {"train_loss": -42.057125091552734, "global_step": 252934, "epoch": 2090} {"train_loss": -41.0886116027832, "global_step": 252935, "epoch": 2090} {"train_loss": -41.76990509033203, "global_step": 252936, "epoch": 2090} {"train_loss": -40.948394775390625, "global_step": 252937, "epoch": 2090} {"train_loss": -42.24250030517578, "global_step": 252938, "epoch": 2090} {"train_loss": -41.28052520751953, "global_step": 252939, "epoch": 2090} {"train_loss": -40.20396041870117, "global_step": 252940, "epoch": 2090} {"train_loss": -40.25923538208008, "global_step": 252941, "epoch": 2090} {"train_loss": -40.829463958740234, "global_step": 252942, "epoch": 2090} {"train_loss": -42.3896484375, "global_step": 252943, "epoch": 2090} {"train_loss": -41.77788162231445, "global_step": 252944, "epoch": 2090} {"train_loss": -42.31307601928711, "global_step": 252945, "epoch": 2090} {"train_loss": -42.2297248840332, "global_step": 252946, "epoch": 2090} {"train_loss": -41.97323226928711, "global_step": 252947, "epoch": 2090} {"train_loss": -42.253536224365234, "global_step": 252948, "epoch": 2090} {"train_loss": -42.6460075378418, "global_step": 252949, "epoch": 2090} {"train_loss": -41.26508331298828, "global_step": 252950, "epoch": 2090} {"train_loss": -42.3952522277832, "global_step": 252951, "epoch": 2090} {"train_loss": -42.54051208496094, "global_step": 252952, "epoch": 2090} {"train_loss": -42.51652908325195, "global_step": 252953, "epoch": 2090} {"train_loss": -42.85503387451172, "global_step": 252954, "epoch": 2090} {"train_loss": -42.34682846069336, "global_step": 252955, "epoch": 2090} {"train_loss": -42.915496826171875, "global_step": 252956, "epoch": 2090} {"train_loss": -42.65681076049805, "global_step": 252957, "epoch": 2090} {"train_loss": -42.84102249145508, "global_step": 252958, "epoch": 2090} {"train_loss": -42.77511215209961, "global_step": 252959, "epoch": 2090} {"train_loss": -42.92893600463867, "global_step": 252960, "epoch": 2090} {"train_loss": -41.77113723754883, "global_step": 252961, "epoch": 2090} {"train_loss": -42.87144088745117, "global_step": 252962, "epoch": 2090} {"train_loss": -43.34904861450195, "global_step": 252963, "epoch": 2090} {"train_loss": -41.979156494140625, "global_step": 252964, "epoch": 2090} {"train_loss": -41.33870315551758, "global_step": 252965, "epoch": 2090} {"train_loss": -43.0570182800293, "global_step": 252966, "epoch": 2090} {"train_loss": -42.94940185546875, "global_step": 252967, "epoch": 2090} {"train_loss": -42.68561935424805, "global_step": 252968, "epoch": 2090} {"train_loss": -43.08241271972656, "global_step": 252969, "epoch": 2090} {"train_loss": -42.645713806152344, "global_step": 252970, "epoch": 2090} {"train_loss": -43.39239501953125, "global_step": 252971, "epoch": 2090} {"train_loss": -43.10579299926758, "global_step": 252972, "epoch": 2090} {"train_loss": -42.983245849609375, "global_step": 252973, "epoch": 2090} {"train_loss": -42.840736389160156, "global_step": 252974, "epoch": 2090} {"train_loss": -43.49284744262695, "global_step": 252975, "epoch": 2090} {"train_loss": -42.65903854370117, "global_step": 252976, "epoch": 2090} {"train_loss": -42.96330642700195, "global_step": 252977, "epoch": 2090} {"train_loss": -43.236778259277344, "global_step": 252978, "epoch": 2090} {"train_loss": -43.298458099365234, "global_step": 252979, "epoch": 2090} {"train_loss": -42.82773208618164, "global_step": 252980, "epoch": 2090} {"train_loss": -43.0900993347168, "global_step": 252981, "epoch": 2090} {"train_loss": -43.18276596069336, "global_step": 252982, "epoch": 2090} {"train_loss": -41.922550201416016, "global_step": 252983, "epoch": 2090} {"train_loss": -43.0058479309082, "global_step": 252984, "epoch": 2090} {"train_loss": -43.102142333984375, "global_step": 252985, "epoch": 2090} {"train_loss": -43.68452072143555, "global_step": 252986, "epoch": 2090} {"train_loss": -42.91197967529297, "global_step": 252987, "epoch": 2090} {"train_loss": -42.36318588256836, "global_step": 252988, "epoch": 2090} {"train_loss": -41.63416290283203, "global_step": 252989, "epoch": 2090} {"train_loss": -43.40517044067383, "global_step": 252990, "epoch": 2090} {"train_loss": -43.15367126464844, "global_step": 252991, "epoch": 2090} {"train_loss": -43.281246185302734, "global_step": 252992, "epoch": 2090} {"train_loss": -43.19096755981445, "global_step": 252993, "epoch": 2090} {"train_loss": -43.301937103271484, "global_step": 252994, "epoch": 2090} {"train_loss": -40.922515869140625, "global_step": 252995, "epoch": 2090} {"train_loss": -43.06708526611328, "global_step": 252996, "epoch": 2090} {"train_loss": -43.33518981933594, "global_step": 252997, "epoch": 2090} {"train_loss": -41.666175842285156, "global_step": 252998, "epoch": 2090} {"train_loss": -42.94636917114258, "global_step": 252999, "epoch": 2090} {"train_loss": -42.870643615722656, "global_step": 253000, "epoch": 2090} {"train_loss": -40.4102897644043, "global_step": 253001, "epoch": 2090} {"train_loss": -42.808677673339844, "global_step": 253002, "epoch": 2090} {"train_loss": -36.74143600463867, "global_step": 253003, "epoch": 2090} {"train_loss": -40.04914474487305, "global_step": 253004, "epoch": 2090} {"train_loss": -42.11561584472656, "global_step": 253005, "epoch": 2090} {"train_loss": -41.76140213012695, "global_step": 253006, "epoch": 2090} {"train_loss": -41.35140609741211, "global_step": 253007, "epoch": 2090} {"train_loss": -40.72517013549805, "global_step": 253008, "epoch": 2090} {"train_loss": -41.985130310058594, "global_step": 253009, "epoch": 2090} {"train_loss": -41.774600194505425, "global_step": 253010, "epoch": 2090, "val_loss": 2654495.25} {"train_loss": -41.176082611083984, "global_step": 253011, "epoch": 2091} {"train_loss": -38.13998794555664, "global_step": 253012, "epoch": 2091} {"train_loss": -39.77857208251953, "global_step": 253013, "epoch": 2091} {"train_loss": -41.879058837890625, "global_step": 253014, "epoch": 2091} {"train_loss": -25.272369384765625, "global_step": 253015, "epoch": 2091} {"train_loss": -38.15287780761719, "global_step": 253016, "epoch": 2091} {"train_loss": -36.93154525756836, "global_step": 253017, "epoch": 2091} {"train_loss": -38.28138732910156, "global_step": 253018, "epoch": 2091} {"train_loss": -36.90180206298828, "global_step": 253019, "epoch": 2091} {"train_loss": -35.601314544677734, "global_step": 253020, "epoch": 2091} {"train_loss": -39.54348373413086, "global_step": 253021, "epoch": 2091} {"train_loss": -37.966758728027344, "global_step": 253022, "epoch": 2091} {"train_loss": -38.75565719604492, "global_step": 253023, "epoch": 2091} {"train_loss": -38.98733901977539, "global_step": 253024, "epoch": 2091} {"train_loss": -39.02540969848633, "global_step": 253025, "epoch": 2091} {"train_loss": -31.865781784057617, "global_step": 253026, "epoch": 2091} {"train_loss": -40.64882278442383, "global_step": 253027, "epoch": 2091} {"train_loss": -38.83332443237305, "global_step": 253028, "epoch": 2091} {"train_loss": -37.59309005737305, "global_step": 253029, "epoch": 2091} {"train_loss": -39.53557586669922, "global_step": 253030, "epoch": 2091} {"train_loss": -38.057064056396484, "global_step": 253031, "epoch": 2091} {"train_loss": -33.66193389892578, "global_step": 253032, "epoch": 2091} {"train_loss": -38.12519454956055, "global_step": 253033, "epoch": 2091} {"train_loss": -40.22266387939453, "global_step": 253034, "epoch": 2091} {"train_loss": -37.47576904296875, "global_step": 253035, "epoch": 2091} {"train_loss": -40.09124755859375, "global_step": 253036, "epoch": 2091} {"train_loss": -39.80656814575195, "global_step": 253037, "epoch": 2091} {"train_loss": -38.87885284423828, "global_step": 253038, "epoch": 2091} {"train_loss": -39.05576705932617, "global_step": 253039, "epoch": 2091} {"train_loss": -39.16691970825195, "global_step": 253040, "epoch": 2091} {"train_loss": -39.85698318481445, "global_step": 253041, "epoch": 2091} {"train_loss": -35.61359405517578, "global_step": 253042, "epoch": 2091} {"train_loss": -39.71723175048828, "global_step": 253043, "epoch": 2091} {"train_loss": -39.84148025512695, "global_step": 253044, "epoch": 2091} {"train_loss": -40.025413513183594, "global_step": 253045, "epoch": 2091} {"train_loss": -37.81725311279297, "global_step": 253046, "epoch": 2091} {"train_loss": -39.327178955078125, "global_step": 253047, "epoch": 2091} {"train_loss": -40.22427749633789, "global_step": 253048, "epoch": 2091} {"train_loss": -39.24850082397461, "global_step": 253049, "epoch": 2091} {"train_loss": -39.79361343383789, "global_step": 253050, "epoch": 2091} {"train_loss": -40.693397521972656, "global_step": 253051, "epoch": 2091} {"train_loss": -41.1086311340332, "global_step": 253052, "epoch": 2091} {"train_loss": -39.83430862426758, "global_step": 253053, "epoch": 2091} {"train_loss": -40.78507614135742, "global_step": 253054, "epoch": 2091} {"train_loss": -41.31222152709961, "global_step": 253055, "epoch": 2091} {"train_loss": -40.06360626220703, "global_step": 253056, "epoch": 2091} {"train_loss": -41.38332748413086, "global_step": 253057, "epoch": 2091} {"train_loss": -40.608699798583984, "global_step": 253058, "epoch": 2091} {"train_loss": -41.1551513671875, "global_step": 253059, "epoch": 2091} {"train_loss": -40.684486389160156, "global_step": 253060, "epoch": 2091} {"train_loss": -40.91023254394531, "global_step": 253061, "epoch": 2091} {"train_loss": -39.763916015625, "global_step": 253062, "epoch": 2091} {"train_loss": -40.46590042114258, "global_step": 253063, "epoch": 2091} {"train_loss": -40.27968215942383, "global_step": 253064, "epoch": 2091} {"train_loss": -40.551734924316406, "global_step": 253065, "epoch": 2091} {"train_loss": -41.61529541015625, "global_step": 253066, "epoch": 2091} {"train_loss": -41.53479766845703, "global_step": 253067, "epoch": 2091} {"train_loss": -41.249691009521484, "global_step": 253068, "epoch": 2091} {"train_loss": -41.71204376220703, "global_step": 253069, "epoch": 2091} {"train_loss": -41.591835021972656, "global_step": 253070, "epoch": 2091} {"train_loss": -41.73602294921875, "global_step": 253071, "epoch": 2091} {"train_loss": -42.20631790161133, "global_step": 253072, "epoch": 2091} {"train_loss": -41.694557189941406, "global_step": 253073, "epoch": 2091} {"train_loss": -40.88661575317383, "global_step": 253074, "epoch": 2091} {"train_loss": -42.43199157714844, "global_step": 253075, "epoch": 2091} {"train_loss": -41.41241455078125, "global_step": 253076, "epoch": 2091} {"train_loss": -41.56299591064453, "global_step": 253077, "epoch": 2091} {"train_loss": -40.200531005859375, "global_step": 253078, "epoch": 2091} {"train_loss": -41.73921585083008, "global_step": 253079, "epoch": 2091} {"train_loss": -42.10014724731445, "global_step": 253080, "epoch": 2091} {"train_loss": -42.20267868041992, "global_step": 253081, "epoch": 2091} {"train_loss": -42.26483154296875, "global_step": 253082, "epoch": 2091} {"train_loss": -42.62507247924805, "global_step": 253083, "epoch": 2091} {"train_loss": -42.229007720947266, "global_step": 253084, "epoch": 2091} {"train_loss": -42.725074768066406, "global_step": 253085, "epoch": 2091} {"train_loss": -42.19037628173828, "global_step": 253086, "epoch": 2091} {"train_loss": -42.305938720703125, "global_step": 253087, "epoch": 2091} {"train_loss": -42.37190628051758, "global_step": 253088, "epoch": 2091} {"train_loss": -42.479759216308594, "global_step": 253089, "epoch": 2091} {"train_loss": -41.918209075927734, "global_step": 253090, "epoch": 2091} {"train_loss": -42.544471740722656, "global_step": 253091, "epoch": 2091} {"train_loss": -42.63248062133789, "global_step": 253092, "epoch": 2091} {"train_loss": -42.45286178588867, "global_step": 253093, "epoch": 2091} {"train_loss": -42.40327072143555, "global_step": 253094, "epoch": 2091} {"train_loss": -41.973087310791016, "global_step": 253095, "epoch": 2091} {"train_loss": -42.68955612182617, "global_step": 253096, "epoch": 2091} {"train_loss": -41.90715408325195, "global_step": 253097, "epoch": 2091} {"train_loss": -42.0297966003418, "global_step": 253098, "epoch": 2091} {"train_loss": -41.9375, "global_step": 253099, "epoch": 2091} {"train_loss": -42.55723190307617, "global_step": 253100, "epoch": 2091} {"train_loss": -42.3723258972168, "global_step": 253101, "epoch": 2091} {"train_loss": -41.320587158203125, "global_step": 253102, "epoch": 2091} {"train_loss": -41.56769943237305, "global_step": 253103, "epoch": 2091} {"train_loss": -42.8956184387207, "global_step": 253104, "epoch": 2091} {"train_loss": -42.11429977416992, "global_step": 253105, "epoch": 2091} {"train_loss": -42.416748046875, "global_step": 253106, "epoch": 2091} {"train_loss": -42.36760330200195, "global_step": 253107, "epoch": 2091} {"train_loss": -42.19509506225586, "global_step": 253108, "epoch": 2091} {"train_loss": -41.71871566772461, "global_step": 253109, "epoch": 2091} {"train_loss": -41.56800079345703, "global_step": 253110, "epoch": 2091} {"train_loss": -42.34825897216797, "global_step": 253111, "epoch": 2091} {"train_loss": -41.58381652832031, "global_step": 253112, "epoch": 2091} {"train_loss": -41.70945358276367, "global_step": 253113, "epoch": 2091} {"train_loss": -42.065853118896484, "global_step": 253114, "epoch": 2091} {"train_loss": -41.17713165283203, "global_step": 253115, "epoch": 2091} {"train_loss": -41.43130111694336, "global_step": 253116, "epoch": 2091} {"train_loss": -41.621925354003906, "global_step": 253117, "epoch": 2091} {"train_loss": -41.83205795288086, "global_step": 253118, "epoch": 2091} {"train_loss": -40.61368179321289, "global_step": 253119, "epoch": 2091} {"train_loss": -42.20756912231445, "global_step": 253120, "epoch": 2091} {"train_loss": -41.30757522583008, "global_step": 253121, "epoch": 2091} {"train_loss": -42.35696029663086, "global_step": 253122, "epoch": 2091} {"train_loss": -42.409481048583984, "global_step": 253123, "epoch": 2091} {"train_loss": -42.120357513427734, "global_step": 253124, "epoch": 2091} {"train_loss": -42.6191520690918, "global_step": 253125, "epoch": 2091} {"train_loss": -42.52445602416992, "global_step": 253126, "epoch": 2091} {"train_loss": -42.774356842041016, "global_step": 253127, "epoch": 2091} {"train_loss": -42.95134353637695, "global_step": 253128, "epoch": 2091} {"train_loss": -42.80573654174805, "global_step": 253129, "epoch": 2091} {"train_loss": -42.4195442199707, "global_step": 253130, "epoch": 2091} {"train_loss": -40.616567958485, "global_step": 253131, "epoch": 2091, "val_loss": 2589725.75} {"train_loss": -42.49900436401367, "global_step": 253132, "epoch": 2092} {"train_loss": -42.94957733154297, "global_step": 253133, "epoch": 2092} {"train_loss": -42.07772445678711, "global_step": 253134, "epoch": 2092} {"train_loss": -42.577735900878906, "global_step": 253135, "epoch": 2092} {"train_loss": -42.88152313232422, "global_step": 253136, "epoch": 2092} {"train_loss": -42.65529251098633, "global_step": 253137, "epoch": 2092} {"train_loss": -42.85422897338867, "global_step": 253138, "epoch": 2092} {"train_loss": -42.51973342895508, "global_step": 253139, "epoch": 2092} {"train_loss": -42.068180084228516, "global_step": 253140, "epoch": 2092} {"train_loss": -43.18301010131836, "global_step": 253141, "epoch": 2092} {"train_loss": -42.94532012939453, "global_step": 253142, "epoch": 2092} {"train_loss": -43.023738861083984, "global_step": 253143, "epoch": 2092} {"train_loss": -43.038658142089844, "global_step": 253144, "epoch": 2092} {"train_loss": -42.798683166503906, "global_step": 253145, "epoch": 2092} {"train_loss": -43.041961669921875, "global_step": 253146, "epoch": 2092} {"train_loss": -42.692138671875, "global_step": 253147, "epoch": 2092} {"train_loss": -42.581329345703125, "global_step": 253148, "epoch": 2092} {"train_loss": -43.075130462646484, "global_step": 253149, "epoch": 2092} {"train_loss": -42.9423942565918, "global_step": 253150, "epoch": 2092} {"train_loss": -42.92647933959961, "global_step": 253151, "epoch": 2092} {"train_loss": -42.399593353271484, "global_step": 253152, "epoch": 2092} {"train_loss": -41.12142562866211, "global_step": 253153, "epoch": 2092} {"train_loss": -39.866024017333984, "global_step": 253154, "epoch": 2092} {"train_loss": -36.74529266357422, "global_step": 253155, "epoch": 2092} {"train_loss": -33.13576889038086, "global_step": 253156, "epoch": 2092} {"train_loss": -33.768341064453125, "global_step": 253157, "epoch": 2092} {"train_loss": -36.58094787597656, "global_step": 253158, "epoch": 2092} {"train_loss": -40.31071090698242, "global_step": 253159, "epoch": 2092} {"train_loss": -31.965463638305664, "global_step": 253160, "epoch": 2092} {"train_loss": -35.08338928222656, "global_step": 253161, "epoch": 2092} {"train_loss": -40.2690315246582, "global_step": 253162, "epoch": 2092} {"train_loss": -37.69926071166992, "global_step": 253163, "epoch": 2092} {"train_loss": -38.52451705932617, "global_step": 253164, "epoch": 2092} {"train_loss": -37.36176300048828, "global_step": 253165, "epoch": 2092} {"train_loss": -39.17265701293945, "global_step": 253166, "epoch": 2092} {"train_loss": -38.75759506225586, "global_step": 253167, "epoch": 2092} {"train_loss": -38.09080123901367, "global_step": 253168, "epoch": 2092} {"train_loss": -40.9654426574707, "global_step": 253169, "epoch": 2092} {"train_loss": -39.33287811279297, "global_step": 253170, "epoch": 2092} {"train_loss": -41.492130279541016, "global_step": 253171, "epoch": 2092} {"train_loss": -38.78529739379883, "global_step": 253172, "epoch": 2092} {"train_loss": -39.64985656738281, "global_step": 253173, "epoch": 2092} {"train_loss": -40.89131546020508, "global_step": 253174, "epoch": 2092} {"train_loss": -39.002899169921875, "global_step": 253175, "epoch": 2092} {"train_loss": -40.89234161376953, "global_step": 253176, "epoch": 2092} {"train_loss": -40.37651062011719, "global_step": 253177, "epoch": 2092} {"train_loss": -40.84677505493164, "global_step": 253178, "epoch": 2092} {"train_loss": -40.5621223449707, "global_step": 253179, "epoch": 2092} {"train_loss": -41.64496994018555, "global_step": 253180, "epoch": 2092} {"train_loss": -40.66622543334961, "global_step": 253181, "epoch": 2092} {"train_loss": -41.997650146484375, "global_step": 253182, "epoch": 2092} {"train_loss": -41.310970306396484, "global_step": 253183, "epoch": 2092} {"train_loss": -41.25797653198242, "global_step": 253184, "epoch": 2092} {"train_loss": -41.23747634887695, "global_step": 253185, "epoch": 2092} {"train_loss": -41.8964729309082, "global_step": 253186, "epoch": 2092} {"train_loss": -40.80854797363281, "global_step": 253187, "epoch": 2092} {"train_loss": -41.51797103881836, "global_step": 253188, "epoch": 2092} {"train_loss": -41.36606979370117, "global_step": 253189, "epoch": 2092} {"train_loss": -41.49818801879883, "global_step": 253190, "epoch": 2092} {"train_loss": -41.911224365234375, "global_step": 253191, "epoch": 2092} {"train_loss": -41.835750579833984, "global_step": 253192, "epoch": 2092} {"train_loss": -41.714332580566406, "global_step": 253193, "epoch": 2092} {"train_loss": -41.743778228759766, "global_step": 253194, "epoch": 2092} {"train_loss": -42.0869255065918, "global_step": 253195, "epoch": 2092} {"train_loss": -42.036983489990234, "global_step": 253196, "epoch": 2092} {"train_loss": -41.85288619995117, "global_step": 253197, "epoch": 2092} {"train_loss": -42.36420822143555, "global_step": 253198, "epoch": 2092} {"train_loss": -42.2384147644043, "global_step": 253199, "epoch": 2092} {"train_loss": -42.40754318237305, "global_step": 253200, "epoch": 2092} {"train_loss": -42.241363525390625, "global_step": 253201, "epoch": 2092} {"train_loss": -42.485225677490234, "global_step": 253202, "epoch": 2092} {"train_loss": -42.3564567565918, "global_step": 253203, "epoch": 2092} {"train_loss": -42.40852737426758, "global_step": 253204, "epoch": 2092} {"train_loss": -42.13225173950195, "global_step": 253205, "epoch": 2092} {"train_loss": -42.692012786865234, "global_step": 253206, "epoch": 2092} {"train_loss": -41.80167770385742, "global_step": 253207, "epoch": 2092} {"train_loss": -42.3701057434082, "global_step": 253208, "epoch": 2092} {"train_loss": -42.03672409057617, "global_step": 253209, "epoch": 2092} {"train_loss": -42.22267532348633, "global_step": 253210, "epoch": 2092} {"train_loss": -42.80607223510742, "global_step": 253211, "epoch": 2092} {"train_loss": -41.91158676147461, "global_step": 253212, "epoch": 2092} {"train_loss": -42.47672653198242, "global_step": 253213, "epoch": 2092} {"train_loss": -42.243892669677734, "global_step": 253214, "epoch": 2092} {"train_loss": -42.52064895629883, "global_step": 253215, "epoch": 2092} {"train_loss": -42.4052848815918, "global_step": 253216, "epoch": 2092} {"train_loss": -42.588783264160156, "global_step": 253217, "epoch": 2092} {"train_loss": -42.40427780151367, "global_step": 253218, "epoch": 2092} {"train_loss": -42.44944381713867, "global_step": 253219, "epoch": 2092} {"train_loss": -42.724159240722656, "global_step": 253220, "epoch": 2092} {"train_loss": -42.50814437866211, "global_step": 253221, "epoch": 2092} {"train_loss": -42.31361389160156, "global_step": 253222, "epoch": 2092} {"train_loss": -42.61501693725586, "global_step": 253223, "epoch": 2092} {"train_loss": -43.01125717163086, "global_step": 253224, "epoch": 2092} {"train_loss": -43.332252502441406, "global_step": 253225, "epoch": 2092} {"train_loss": -42.61351013183594, "global_step": 253226, "epoch": 2092} {"train_loss": -42.711727142333984, "global_step": 253227, "epoch": 2092} {"train_loss": -43.03913879394531, "global_step": 253228, "epoch": 2092} {"train_loss": -43.26362228393555, "global_step": 253229, "epoch": 2092} {"train_loss": -42.62441635131836, "global_step": 253230, "epoch": 2092} {"train_loss": -42.44141387939453, "global_step": 253231, "epoch": 2092} {"train_loss": -43.04841232299805, "global_step": 253232, "epoch": 2092} {"train_loss": -42.79075241088867, "global_step": 253233, "epoch": 2092} {"train_loss": -42.42351150512695, "global_step": 253234, "epoch": 2092} {"train_loss": -42.90228271484375, "global_step": 253235, "epoch": 2092} {"train_loss": -43.37916946411133, "global_step": 253236, "epoch": 2092} {"train_loss": -41.87135696411133, "global_step": 253237, "epoch": 2092} {"train_loss": -42.50927734375, "global_step": 253238, "epoch": 2092} {"train_loss": -43.2736930847168, "global_step": 253239, "epoch": 2092} {"train_loss": -41.955562591552734, "global_step": 253240, "epoch": 2092} {"train_loss": -40.02265167236328, "global_step": 253241, "epoch": 2092} {"train_loss": -40.5324821472168, "global_step": 253242, "epoch": 2092} {"train_loss": -42.4556884765625, "global_step": 253243, "epoch": 2092} {"train_loss": -42.74898910522461, "global_step": 253244, "epoch": 2092} {"train_loss": -42.95314407348633, "global_step": 253245, "epoch": 2092} {"train_loss": -42.28736114501953, "global_step": 253246, "epoch": 2092} {"train_loss": -41.12807846069336, "global_step": 253247, "epoch": 2092} {"train_loss": -42.74696731567383, "global_step": 253248, "epoch": 2092} {"train_loss": -42.94919204711914, "global_step": 253249, "epoch": 2092} {"train_loss": -42.01599884033203, "global_step": 253250, "epoch": 2092} {"train_loss": -42.65829086303711, "global_step": 253251, "epoch": 2092} {"train_loss": -41.49862164899337, "global_step": 253252, "epoch": 2092, "val_loss": 2636233.25} {"train_loss": -43.10117721557617, "global_step": 253253, "epoch": 2093} {"train_loss": -42.27882766723633, "global_step": 253254, "epoch": 2093} {"train_loss": -42.18499755859375, "global_step": 253255, "epoch": 2093} {"train_loss": -42.76552963256836, "global_step": 253256, "epoch": 2093} {"train_loss": -42.73310470581055, "global_step": 253257, "epoch": 2093} {"train_loss": -40.399925231933594, "global_step": 253258, "epoch": 2093} {"train_loss": -42.305355072021484, "global_step": 253259, "epoch": 2093} {"train_loss": -42.5764045715332, "global_step": 253260, "epoch": 2093} {"train_loss": -41.298126220703125, "global_step": 253261, "epoch": 2093} {"train_loss": -40.46894073486328, "global_step": 253262, "epoch": 2093} {"train_loss": -41.86484909057617, "global_step": 253263, "epoch": 2093} {"train_loss": -43.133522033691406, "global_step": 253264, "epoch": 2093} {"train_loss": -40.7548942565918, "global_step": 253265, "epoch": 2093} {"train_loss": -41.460575103759766, "global_step": 253266, "epoch": 2093} {"train_loss": -41.70402526855469, "global_step": 253267, "epoch": 2093} {"train_loss": -38.99702072143555, "global_step": 253268, "epoch": 2093} {"train_loss": -41.147525787353516, "global_step": 253269, "epoch": 2093} {"train_loss": -41.74583435058594, "global_step": 253270, "epoch": 2093} {"train_loss": -39.48057174682617, "global_step": 253271, "epoch": 2093} {"train_loss": -40.3447265625, "global_step": 253272, "epoch": 2093} {"train_loss": -41.31830596923828, "global_step": 253273, "epoch": 2093} {"train_loss": -40.860252380371094, "global_step": 253274, "epoch": 2093} {"train_loss": -42.29096221923828, "global_step": 253275, "epoch": 2093} {"train_loss": -40.52842330932617, "global_step": 253276, "epoch": 2093} {"train_loss": -42.54842758178711, "global_step": 253277, "epoch": 2093} {"train_loss": -41.71323776245117, "global_step": 253278, "epoch": 2093} {"train_loss": -42.36315155029297, "global_step": 253279, "epoch": 2093} {"train_loss": -42.830970764160156, "global_step": 253280, "epoch": 2093} {"train_loss": -42.07373046875, "global_step": 253281, "epoch": 2093} {"train_loss": -42.91581344604492, "global_step": 253282, "epoch": 2093} {"train_loss": -41.765777587890625, "global_step": 253283, "epoch": 2093} {"train_loss": -42.73699188232422, "global_step": 253284, "epoch": 2093} {"train_loss": -42.57741165161133, "global_step": 253285, "epoch": 2093} {"train_loss": -42.224361419677734, "global_step": 253286, "epoch": 2093} {"train_loss": -42.26309585571289, "global_step": 253287, "epoch": 2093} {"train_loss": -42.656402587890625, "global_step": 253288, "epoch": 2093} {"train_loss": -42.44775390625, "global_step": 253289, "epoch": 2093} {"train_loss": -43.00382614135742, "global_step": 253290, "epoch": 2093} {"train_loss": -43.11202621459961, "global_step": 253291, "epoch": 2093} {"train_loss": -42.464263916015625, "global_step": 253292, "epoch": 2093} {"train_loss": -43.11289596557617, "global_step": 253293, "epoch": 2093} {"train_loss": -43.26701736450195, "global_step": 253294, "epoch": 2093} {"train_loss": -42.92829132080078, "global_step": 253295, "epoch": 2093} {"train_loss": -43.10075759887695, "global_step": 253296, "epoch": 2093} {"train_loss": -43.383056640625, "global_step": 253297, "epoch": 2093} {"train_loss": -43.446163177490234, "global_step": 253298, "epoch": 2093} {"train_loss": -42.1395378112793, "global_step": 253299, "epoch": 2093} {"train_loss": -43.25388717651367, "global_step": 253300, "epoch": 2093} {"train_loss": -42.94045639038086, "global_step": 253301, "epoch": 2093} {"train_loss": -43.464881896972656, "global_step": 253302, "epoch": 2093} {"train_loss": -42.18376159667969, "global_step": 253303, "epoch": 2093} {"train_loss": -43.21479415893555, "global_step": 253304, "epoch": 2093} {"train_loss": -43.15290069580078, "global_step": 253305, "epoch": 2093} {"train_loss": -43.1551399230957, "global_step": 253306, "epoch": 2093} {"train_loss": -43.255767822265625, "global_step": 253307, "epoch": 2093} {"train_loss": -43.417667388916016, "global_step": 253308, "epoch": 2093} {"train_loss": -43.05030059814453, "global_step": 253309, "epoch": 2093} {"train_loss": -43.01955795288086, "global_step": 253310, "epoch": 2093} {"train_loss": -43.80472946166992, "global_step": 253311, "epoch": 2093} {"train_loss": -43.40031814575195, "global_step": 253312, "epoch": 2093} {"train_loss": -43.447872161865234, "global_step": 253313, "epoch": 2093} {"train_loss": -42.51888656616211, "global_step": 253314, "epoch": 2093} {"train_loss": -43.362911224365234, "global_step": 253315, "epoch": 2093} {"train_loss": -43.13955307006836, "global_step": 253316, "epoch": 2093} {"train_loss": -43.23187255859375, "global_step": 253317, "epoch": 2093} {"train_loss": -43.193965911865234, "global_step": 253318, "epoch": 2093} {"train_loss": -43.28810119628906, "global_step": 253319, "epoch": 2093} {"train_loss": -43.06784439086914, "global_step": 253320, "epoch": 2093} {"train_loss": -43.450775146484375, "global_step": 253321, "epoch": 2093} {"train_loss": -42.74152755737305, "global_step": 253322, "epoch": 2093} {"train_loss": -43.2226676940918, "global_step": 253323, "epoch": 2093} {"train_loss": -42.332794189453125, "global_step": 253324, "epoch": 2093} {"train_loss": -42.291744232177734, "global_step": 253325, "epoch": 2093} {"train_loss": -42.69093704223633, "global_step": 253326, "epoch": 2093} {"train_loss": -42.22412872314453, "global_step": 253327, "epoch": 2093} {"train_loss": -41.850704193115234, "global_step": 253328, "epoch": 2093} {"train_loss": -43.46812057495117, "global_step": 253329, "epoch": 2093} {"train_loss": -43.637725830078125, "global_step": 253330, "epoch": 2093} {"train_loss": -43.43565368652344, "global_step": 253331, "epoch": 2093} {"train_loss": -42.74097442626953, "global_step": 253332, "epoch": 2093} {"train_loss": -43.01927185058594, "global_step": 253333, "epoch": 2093} {"train_loss": -42.962669372558594, "global_step": 253334, "epoch": 2093} {"train_loss": -42.869598388671875, "global_step": 253335, "epoch": 2093} {"train_loss": -42.48526382446289, "global_step": 253336, "epoch": 2093} {"train_loss": -42.69618606567383, "global_step": 253337, "epoch": 2093} {"train_loss": -42.2884407043457, "global_step": 253338, "epoch": 2093} {"train_loss": -42.19736862182617, "global_step": 253339, "epoch": 2093} {"train_loss": -42.84366989135742, "global_step": 253340, "epoch": 2093} {"train_loss": -41.849403381347656, "global_step": 253341, "epoch": 2093} {"train_loss": -38.56887435913086, "global_step": 253342, "epoch": 2093} {"train_loss": -40.291046142578125, "global_step": 253343, "epoch": 2093} {"train_loss": -42.028358459472656, "global_step": 253344, "epoch": 2093} {"train_loss": -42.141780853271484, "global_step": 253345, "epoch": 2093} {"train_loss": -42.279335021972656, "global_step": 253346, "epoch": 2093} {"train_loss": -42.46162033081055, "global_step": 253347, "epoch": 2093} {"train_loss": -42.1468620300293, "global_step": 253348, "epoch": 2093} {"train_loss": -41.242820739746094, "global_step": 253349, "epoch": 2093} {"train_loss": -42.23393630981445, "global_step": 253350, "epoch": 2093} {"train_loss": -43.02524948120117, "global_step": 253351, "epoch": 2093} {"train_loss": -40.26051712036133, "global_step": 253352, "epoch": 2093} {"train_loss": -41.2232551574707, "global_step": 253353, "epoch": 2093} {"train_loss": -41.14055633544922, "global_step": 253354, "epoch": 2093} {"train_loss": -42.448692321777344, "global_step": 253355, "epoch": 2093} {"train_loss": -40.471405029296875, "global_step": 253356, "epoch": 2093} {"train_loss": -40.31907653808594, "global_step": 253357, "epoch": 2093} {"train_loss": -41.91405487060547, "global_step": 253358, "epoch": 2093} {"train_loss": -40.74048614501953, "global_step": 253359, "epoch": 2093} {"train_loss": -42.28681564331055, "global_step": 253360, "epoch": 2093} {"train_loss": -42.064937591552734, "global_step": 253361, "epoch": 2093} {"train_loss": -41.12958526611328, "global_step": 253362, "epoch": 2093} {"train_loss": -42.78656005859375, "global_step": 253363, "epoch": 2093} {"train_loss": -41.82307434082031, "global_step": 253364, "epoch": 2093} {"train_loss": -41.135353088378906, "global_step": 253365, "epoch": 2093} {"train_loss": -42.28520584106445, "global_step": 253366, "epoch": 2093} {"train_loss": -40.905029296875, "global_step": 253367, "epoch": 2093} {"train_loss": -42.12864303588867, "global_step": 253368, "epoch": 2093} {"train_loss": -41.54948806762695, "global_step": 253369, "epoch": 2093} {"train_loss": -41.53094482421875, "global_step": 253370, "epoch": 2093} {"train_loss": -41.05056381225586, "global_step": 253371, "epoch": 2093} {"train_loss": -41.98817825317383, "global_step": 253372, "epoch": 2093} {"train_loss": -42.22948386452415, "global_step": 253373, "epoch": 2093, "val_loss": 2569198.5} {"train_loss": -42.94233322143555, "global_step": 253374, "epoch": 2094} {"train_loss": -42.4961051940918, "global_step": 253375, "epoch": 2094} {"train_loss": -40.22731399536133, "global_step": 253376, "epoch": 2094} {"train_loss": -42.17369842529297, "global_step": 253377, "epoch": 2094} {"train_loss": -42.44562911987305, "global_step": 253378, "epoch": 2094} {"train_loss": -40.53157424926758, "global_step": 253379, "epoch": 2094} {"train_loss": -42.497230529785156, "global_step": 253380, "epoch": 2094} {"train_loss": -42.857791900634766, "global_step": 253381, "epoch": 2094} {"train_loss": -42.610374450683594, "global_step": 253382, "epoch": 2094} {"train_loss": -43.05378341674805, "global_step": 253383, "epoch": 2094} {"train_loss": -42.57841491699219, "global_step": 253384, "epoch": 2094} {"train_loss": -42.00567626953125, "global_step": 253385, "epoch": 2094} {"train_loss": -42.43841552734375, "global_step": 253386, "epoch": 2094} {"train_loss": -42.578468322753906, "global_step": 253387, "epoch": 2094} {"train_loss": -42.65193557739258, "global_step": 253388, "epoch": 2094} {"train_loss": -40.7406120300293, "global_step": 253389, "epoch": 2094} {"train_loss": -42.60158920288086, "global_step": 253390, "epoch": 2094} {"train_loss": -42.52985382080078, "global_step": 253391, "epoch": 2094} {"train_loss": -42.1012077331543, "global_step": 253392, "epoch": 2094} {"train_loss": -41.82448959350586, "global_step": 253393, "epoch": 2094} {"train_loss": -41.64735794067383, "global_step": 253394, "epoch": 2094} {"train_loss": -42.639259338378906, "global_step": 253395, "epoch": 2094} {"train_loss": -42.78750228881836, "global_step": 253396, "epoch": 2094} {"train_loss": -41.787410736083984, "global_step": 253397, "epoch": 2094} {"train_loss": -42.947540283203125, "global_step": 253398, "epoch": 2094} {"train_loss": -42.8138542175293, "global_step": 253399, "epoch": 2094} {"train_loss": -43.123348236083984, "global_step": 253400, "epoch": 2094} {"train_loss": -42.4613151550293, "global_step": 253401, "epoch": 2094} {"train_loss": -43.1613655090332, "global_step": 253402, "epoch": 2094} {"train_loss": -42.94503402709961, "global_step": 253403, "epoch": 2094} {"train_loss": -42.68972396850586, "global_step": 253404, "epoch": 2094} {"train_loss": -41.9060173034668, "global_step": 253405, "epoch": 2094} {"train_loss": -43.06418991088867, "global_step": 253406, "epoch": 2094} {"train_loss": -41.896610260009766, "global_step": 253407, "epoch": 2094} {"train_loss": -42.86350631713867, "global_step": 253408, "epoch": 2094} {"train_loss": -43.172237396240234, "global_step": 253409, "epoch": 2094} {"train_loss": -42.81908416748047, "global_step": 253410, "epoch": 2094} {"train_loss": -42.967071533203125, "global_step": 253411, "epoch": 2094} {"train_loss": -42.691280364990234, "global_step": 253412, "epoch": 2094} {"train_loss": -42.58292770385742, "global_step": 253413, "epoch": 2094} {"train_loss": -43.500030517578125, "global_step": 253414, "epoch": 2094} {"train_loss": -43.48236846923828, "global_step": 253415, "epoch": 2094} {"train_loss": -42.62775802612305, "global_step": 253416, "epoch": 2094} {"train_loss": -43.298377990722656, "global_step": 253417, "epoch": 2094} {"train_loss": -42.532039642333984, "global_step": 253418, "epoch": 2094} {"train_loss": -43.608211517333984, "global_step": 253419, "epoch": 2094} {"train_loss": -43.476985931396484, "global_step": 253420, "epoch": 2094} {"train_loss": -41.94057083129883, "global_step": 253421, "epoch": 2094} {"train_loss": -42.971920013427734, "global_step": 253422, "epoch": 2094} {"train_loss": -43.4699592590332, "global_step": 253423, "epoch": 2094} {"train_loss": -42.78572463989258, "global_step": 253424, "epoch": 2094} {"train_loss": -42.96709442138672, "global_step": 253425, "epoch": 2094} {"train_loss": -43.569374084472656, "global_step": 253426, "epoch": 2094} {"train_loss": -43.39048767089844, "global_step": 253427, "epoch": 2094} {"train_loss": -43.18314743041992, "global_step": 253428, "epoch": 2094} {"train_loss": -43.63088607788086, "global_step": 253429, "epoch": 2094} {"train_loss": -41.48305892944336, "global_step": 253430, "epoch": 2094} {"train_loss": -42.9112663269043, "global_step": 253431, "epoch": 2094} {"train_loss": -41.970699310302734, "global_step": 253432, "epoch": 2094} {"train_loss": -42.972747802734375, "global_step": 253433, "epoch": 2094} {"train_loss": -43.663909912109375, "global_step": 253434, "epoch": 2094} {"train_loss": -42.79591369628906, "global_step": 253435, "epoch": 2094} {"train_loss": -43.035884857177734, "global_step": 253436, "epoch": 2094} {"train_loss": -43.716529846191406, "global_step": 253437, "epoch": 2094} {"train_loss": -43.86814498901367, "global_step": 253438, "epoch": 2094} {"train_loss": -43.50520706176758, "global_step": 253439, "epoch": 2094} {"train_loss": -43.033729553222656, "global_step": 253440, "epoch": 2094} {"train_loss": -42.277313232421875, "global_step": 253441, "epoch": 2094} {"train_loss": -43.509273529052734, "global_step": 253442, "epoch": 2094} {"train_loss": -43.06464767456055, "global_step": 253443, "epoch": 2094} {"train_loss": -43.355308532714844, "global_step": 253444, "epoch": 2094} {"train_loss": -43.894775390625, "global_step": 253445, "epoch": 2094} {"train_loss": -43.614803314208984, "global_step": 253446, "epoch": 2094} {"train_loss": -41.7986946105957, "global_step": 253447, "epoch": 2094} {"train_loss": -43.542781829833984, "global_step": 253448, "epoch": 2094} {"train_loss": -43.54636764526367, "global_step": 253449, "epoch": 2094} {"train_loss": -42.894805908203125, "global_step": 253450, "epoch": 2094} {"train_loss": -41.19187545776367, "global_step": 253451, "epoch": 2094} {"train_loss": -42.04581832885742, "global_step": 253452, "epoch": 2094} {"train_loss": -43.188838958740234, "global_step": 253453, "epoch": 2094} {"train_loss": -42.4349365234375, "global_step": 253454, "epoch": 2094} {"train_loss": -43.22488784790039, "global_step": 253455, "epoch": 2094} {"train_loss": -42.231719970703125, "global_step": 253456, "epoch": 2094} {"train_loss": -42.24691390991211, "global_step": 253457, "epoch": 2094} {"train_loss": -43.19808578491211, "global_step": 253458, "epoch": 2094} {"train_loss": -41.68463897705078, "global_step": 253459, "epoch": 2094} {"train_loss": -42.43745803833008, "global_step": 253460, "epoch": 2094} {"train_loss": -42.507904052734375, "global_step": 253461, "epoch": 2094} {"train_loss": -42.74665832519531, "global_step": 253462, "epoch": 2094} {"train_loss": -43.35316848754883, "global_step": 253463, "epoch": 2094} {"train_loss": -42.327064514160156, "global_step": 253464, "epoch": 2094} {"train_loss": -42.970272064208984, "global_step": 253465, "epoch": 2094} {"train_loss": -40.81814193725586, "global_step": 253466, "epoch": 2094} {"train_loss": -40.406551361083984, "global_step": 253467, "epoch": 2094} {"train_loss": -39.77214431762695, "global_step": 253468, "epoch": 2094} {"train_loss": -42.445411682128906, "global_step": 253469, "epoch": 2094} {"train_loss": -40.8317756652832, "global_step": 253470, "epoch": 2094} {"train_loss": -42.091583251953125, "global_step": 253471, "epoch": 2094} {"train_loss": -40.795806884765625, "global_step": 253472, "epoch": 2094} {"train_loss": -42.04706573486328, "global_step": 253473, "epoch": 2094} {"train_loss": -41.30683517456055, "global_step": 253474, "epoch": 2094} {"train_loss": -41.0112190246582, "global_step": 253475, "epoch": 2094} {"train_loss": -39.757484436035156, "global_step": 253476, "epoch": 2094} {"train_loss": -40.74799346923828, "global_step": 253477, "epoch": 2094} {"train_loss": -41.50835037231445, "global_step": 253478, "epoch": 2094} {"train_loss": -40.28938674926758, "global_step": 253479, "epoch": 2094} {"train_loss": -39.227962493896484, "global_step": 253480, "epoch": 2094} {"train_loss": -38.53257369995117, "global_step": 253481, "epoch": 2094} {"train_loss": -39.47298049926758, "global_step": 253482, "epoch": 2094} {"train_loss": -40.09125518798828, "global_step": 253483, "epoch": 2094} {"train_loss": -40.18741989135742, "global_step": 253484, "epoch": 2094} {"train_loss": -41.12449645996094, "global_step": 253485, "epoch": 2094} {"train_loss": -41.74171829223633, "global_step": 253486, "epoch": 2094} {"train_loss": -39.75788116455078, "global_step": 253487, "epoch": 2094} {"train_loss": -40.398746490478516, "global_step": 253488, "epoch": 2094} {"train_loss": -40.65995788574219, "global_step": 253489, "epoch": 2094} {"train_loss": -41.31930923461914, "global_step": 253490, "epoch": 2094} {"train_loss": -40.343055725097656, "global_step": 253491, "epoch": 2094} {"train_loss": -40.542842864990234, "global_step": 253492, "epoch": 2094} {"train_loss": -37.60718536376953, "global_step": 253493, "epoch": 2094} {"train_loss": -42.195243488658555, "global_step": 253494, "epoch": 2094, "val_loss": 3042351.25} {"train_loss": -37.20503234863281, "global_step": 253495, "epoch": 2095} {"train_loss": -39.97053146362305, "global_step": 253496, "epoch": 2095} {"train_loss": -39.74267578125, "global_step": 253497, "epoch": 2095} {"train_loss": -41.10258102416992, "global_step": 253498, "epoch": 2095} {"train_loss": -39.72003173828125, "global_step": 253499, "epoch": 2095} {"train_loss": -39.42030715942383, "global_step": 253500, "epoch": 2095} {"train_loss": -41.462772369384766, "global_step": 253501, "epoch": 2095} {"train_loss": -40.14944076538086, "global_step": 253502, "epoch": 2095} {"train_loss": -39.68648147583008, "global_step": 253503, "epoch": 2095} {"train_loss": -40.5013313293457, "global_step": 253504, "epoch": 2095} {"train_loss": -41.366065979003906, "global_step": 253505, "epoch": 2095} {"train_loss": -41.323997497558594, "global_step": 253506, "epoch": 2095} {"train_loss": -38.73374557495117, "global_step": 253507, "epoch": 2095} {"train_loss": -41.48604202270508, "global_step": 253508, "epoch": 2095} {"train_loss": -41.072181701660156, "global_step": 253509, "epoch": 2095} {"train_loss": -41.11476516723633, "global_step": 253510, "epoch": 2095} {"train_loss": -42.16536331176758, "global_step": 253511, "epoch": 2095} {"train_loss": -39.9859504699707, "global_step": 253512, "epoch": 2095} {"train_loss": -41.74308395385742, "global_step": 253513, "epoch": 2095} {"train_loss": -39.2575798034668, "global_step": 253514, "epoch": 2095} {"train_loss": -41.30811309814453, "global_step": 253515, "epoch": 2095} {"train_loss": -40.9704704284668, "global_step": 253516, "epoch": 2095} {"train_loss": -40.890323638916016, "global_step": 253517, "epoch": 2095} {"train_loss": -41.31555938720703, "global_step": 253518, "epoch": 2095} {"train_loss": -41.76028060913086, "global_step": 253519, "epoch": 2095} {"train_loss": -41.53003692626953, "global_step": 253520, "epoch": 2095} {"train_loss": -40.12150955200195, "global_step": 253521, "epoch": 2095} {"train_loss": -41.20683670043945, "global_step": 253522, "epoch": 2095} {"train_loss": -38.95183563232422, "global_step": 253523, "epoch": 2095} {"train_loss": -40.5193977355957, "global_step": 253524, "epoch": 2095} {"train_loss": -41.64863586425781, "global_step": 253525, "epoch": 2095} {"train_loss": -41.77376937866211, "global_step": 253526, "epoch": 2095} {"train_loss": -41.791683197021484, "global_step": 253527, "epoch": 2095} {"train_loss": -41.35832214355469, "global_step": 253528, "epoch": 2095} {"train_loss": -40.632781982421875, "global_step": 253529, "epoch": 2095} {"train_loss": -40.93793869018555, "global_step": 253530, "epoch": 2095} {"train_loss": -41.484779357910156, "global_step": 253531, "epoch": 2095} {"train_loss": -42.242984771728516, "global_step": 253532, "epoch": 2095} {"train_loss": -41.9552116394043, "global_step": 253533, "epoch": 2095} {"train_loss": -40.12941360473633, "global_step": 253534, "epoch": 2095} {"train_loss": -42.24093246459961, "global_step": 253535, "epoch": 2095} {"train_loss": -42.05552291870117, "global_step": 253536, "epoch": 2095} {"train_loss": -42.132633209228516, "global_step": 253537, "epoch": 2095} {"train_loss": -38.40161895751953, "global_step": 253538, "epoch": 2095} {"train_loss": -39.34956741333008, "global_step": 253539, "epoch": 2095} {"train_loss": -41.062957763671875, "global_step": 253540, "epoch": 2095} {"train_loss": -41.4069938659668, "global_step": 253541, "epoch": 2095} {"train_loss": -41.78466796875, "global_step": 253542, "epoch": 2095} {"train_loss": -42.047603607177734, "global_step": 253543, "epoch": 2095} {"train_loss": -41.60546875, "global_step": 253544, "epoch": 2095} {"train_loss": -38.91609573364258, "global_step": 253545, "epoch": 2095} {"train_loss": -41.89817428588867, "global_step": 253546, "epoch": 2095} {"train_loss": -41.72084426879883, "global_step": 253547, "epoch": 2095} {"train_loss": -37.915409088134766, "global_step": 253548, "epoch": 2095} {"train_loss": -40.524391174316406, "global_step": 253549, "epoch": 2095} {"train_loss": -36.93198776245117, "global_step": 253550, "epoch": 2095} {"train_loss": -41.64045333862305, "global_step": 253551, "epoch": 2095} {"train_loss": -41.4328498840332, "global_step": 253552, "epoch": 2095} {"train_loss": -41.81825256347656, "global_step": 253553, "epoch": 2095} {"train_loss": -39.390865325927734, "global_step": 253554, "epoch": 2095} {"train_loss": -39.639015197753906, "global_step": 253555, "epoch": 2095} {"train_loss": -41.5658073425293, "global_step": 253556, "epoch": 2095} {"train_loss": -41.670692443847656, "global_step": 253557, "epoch": 2095} {"train_loss": -41.47494125366211, "global_step": 253558, "epoch": 2095} {"train_loss": -40.833839416503906, "global_step": 253559, "epoch": 2095} {"train_loss": -41.2457160949707, "global_step": 253560, "epoch": 2095} {"train_loss": -41.509403228759766, "global_step": 253561, "epoch": 2095} {"train_loss": -42.3787956237793, "global_step": 253562, "epoch": 2095} {"train_loss": -40.724159240722656, "global_step": 253563, "epoch": 2095} {"train_loss": -41.19957733154297, "global_step": 253564, "epoch": 2095} {"train_loss": -39.60454559326172, "global_step": 253565, "epoch": 2095} {"train_loss": -40.1547737121582, "global_step": 253566, "epoch": 2095} {"train_loss": -41.14622116088867, "global_step": 253567, "epoch": 2095} {"train_loss": -42.12887191772461, "global_step": 253568, "epoch": 2095} {"train_loss": -39.60539627075195, "global_step": 253569, "epoch": 2095} {"train_loss": -42.60668182373047, "global_step": 253570, "epoch": 2095} {"train_loss": -40.663883209228516, "global_step": 253571, "epoch": 2095} {"train_loss": -40.24245071411133, "global_step": 253572, "epoch": 2095} {"train_loss": -41.864776611328125, "global_step": 253573, "epoch": 2095} {"train_loss": -41.86631393432617, "global_step": 253574, "epoch": 2095} {"train_loss": -42.13324737548828, "global_step": 253575, "epoch": 2095} {"train_loss": -40.40300750732422, "global_step": 253576, "epoch": 2095} {"train_loss": -40.54277801513672, "global_step": 253577, "epoch": 2095} {"train_loss": -42.041656494140625, "global_step": 253578, "epoch": 2095} {"train_loss": -40.26060485839844, "global_step": 253579, "epoch": 2095} {"train_loss": -41.17013168334961, "global_step": 253580, "epoch": 2095} {"train_loss": -42.17241287231445, "global_step": 253581, "epoch": 2095} {"train_loss": -39.819950103759766, "global_step": 253582, "epoch": 2095} {"train_loss": -41.94878387451172, "global_step": 253583, "epoch": 2095} {"train_loss": -41.48491287231445, "global_step": 253584, "epoch": 2095} {"train_loss": -42.634559631347656, "global_step": 253585, "epoch": 2095} {"train_loss": -42.679378509521484, "global_step": 253586, "epoch": 2095} {"train_loss": -42.05669021606445, "global_step": 253587, "epoch": 2095} {"train_loss": -41.36320877075195, "global_step": 253588, "epoch": 2095} {"train_loss": -42.18292236328125, "global_step": 253589, "epoch": 2095} {"train_loss": -42.2821159362793, "global_step": 253590, "epoch": 2095} {"train_loss": -40.26034164428711, "global_step": 253591, "epoch": 2095} {"train_loss": -42.4554328918457, "global_step": 253592, "epoch": 2095} {"train_loss": -41.114803314208984, "global_step": 253593, "epoch": 2095} {"train_loss": -41.63356399536133, "global_step": 253594, "epoch": 2095} {"train_loss": -42.447872161865234, "global_step": 253595, "epoch": 2095} {"train_loss": -42.367252349853516, "global_step": 253596, "epoch": 2095} {"train_loss": -42.94365310668945, "global_step": 253597, "epoch": 2095} {"train_loss": -42.88363265991211, "global_step": 253598, "epoch": 2095} {"train_loss": -42.522640228271484, "global_step": 253599, "epoch": 2095} {"train_loss": -42.26936340332031, "global_step": 253600, "epoch": 2095} {"train_loss": -42.37109375, "global_step": 253601, "epoch": 2095} {"train_loss": -42.55723190307617, "global_step": 253602, "epoch": 2095} {"train_loss": -42.73810577392578, "global_step": 253603, "epoch": 2095} {"train_loss": -43.34019470214844, "global_step": 253604, "epoch": 2095} {"train_loss": -42.21044158935547, "global_step": 253605, "epoch": 2095} {"train_loss": -42.817806243896484, "global_step": 253606, "epoch": 2095} {"train_loss": -43.37600326538086, "global_step": 253607, "epoch": 2095} {"train_loss": -42.53084182739258, "global_step": 253608, "epoch": 2095} {"train_loss": -42.48591232299805, "global_step": 253609, "epoch": 2095} {"train_loss": -42.70402526855469, "global_step": 253610, "epoch": 2095} {"train_loss": -42.60036849975586, "global_step": 253611, "epoch": 2095} {"train_loss": -43.418575286865234, "global_step": 253612, "epoch": 2095} {"train_loss": -43.365074157714844, "global_step": 253613, "epoch": 2095} {"train_loss": -42.787696838378906, "global_step": 253614, "epoch": 2095} {"train_loss": -41.28042577317924, "global_step": 253615, "epoch": 2095, "val_loss": 2648972.75} {"train_loss": -43.053802490234375, "global_step": 253616, "epoch": 2096} {"train_loss": -42.88729476928711, "global_step": 253617, "epoch": 2096} {"train_loss": -42.954994201660156, "global_step": 253618, "epoch": 2096} {"train_loss": -43.688411712646484, "global_step": 253619, "epoch": 2096} {"train_loss": -43.33687210083008, "global_step": 253620, "epoch": 2096} {"train_loss": -43.388954162597656, "global_step": 253621, "epoch": 2096} {"train_loss": -42.53985595703125, "global_step": 253622, "epoch": 2096} {"train_loss": -43.099605560302734, "global_step": 253623, "epoch": 2096} {"train_loss": -42.76215744018555, "global_step": 253624, "epoch": 2096} {"train_loss": -43.387664794921875, "global_step": 253625, "epoch": 2096} {"train_loss": -43.48147201538086, "global_step": 253626, "epoch": 2096} {"train_loss": -43.27935791015625, "global_step": 253627, "epoch": 2096} {"train_loss": -43.12548828125, "global_step": 253628, "epoch": 2096} {"train_loss": -41.53790283203125, "global_step": 253629, "epoch": 2096} {"train_loss": -43.203468322753906, "global_step": 253630, "epoch": 2096} {"train_loss": -42.35205841064453, "global_step": 253631, "epoch": 2096} {"train_loss": -42.26728057861328, "global_step": 253632, "epoch": 2096} {"train_loss": -43.476295471191406, "global_step": 253633, "epoch": 2096} {"train_loss": -42.1577262878418, "global_step": 253634, "epoch": 2096} {"train_loss": -40.900760650634766, "global_step": 253635, "epoch": 2096} {"train_loss": -39.26710891723633, "global_step": 253636, "epoch": 2096} {"train_loss": -37.63517379760742, "global_step": 253637, "epoch": 2096} {"train_loss": -40.1716194152832, "global_step": 253638, "epoch": 2096} {"train_loss": -41.18208312988281, "global_step": 253639, "epoch": 2096} {"train_loss": -41.58969497680664, "global_step": 253640, "epoch": 2096} {"train_loss": -42.563133239746094, "global_step": 253641, "epoch": 2096} {"train_loss": -43.187896728515625, "global_step": 253642, "epoch": 2096} {"train_loss": -42.189598083496094, "global_step": 253643, "epoch": 2096} {"train_loss": -42.01301956176758, "global_step": 253644, "epoch": 2096} {"train_loss": -41.5313835144043, "global_step": 253645, "epoch": 2096} {"train_loss": -42.59090042114258, "global_step": 253646, "epoch": 2096} {"train_loss": -43.15475082397461, "global_step": 253647, "epoch": 2096} {"train_loss": -42.40214920043945, "global_step": 253648, "epoch": 2096} {"train_loss": -42.105140686035156, "global_step": 253649, "epoch": 2096} {"train_loss": -43.226234436035156, "global_step": 253650, "epoch": 2096} {"train_loss": -41.4029426574707, "global_step": 253651, "epoch": 2096} {"train_loss": -42.16399002075195, "global_step": 253652, "epoch": 2096} {"train_loss": -42.63875198364258, "global_step": 253653, "epoch": 2096} {"train_loss": -41.766693115234375, "global_step": 253654, "epoch": 2096} {"train_loss": -39.23609161376953, "global_step": 253655, "epoch": 2096} {"train_loss": -41.69820785522461, "global_step": 253656, "epoch": 2096} {"train_loss": -42.122962951660156, "global_step": 253657, "epoch": 2096} {"train_loss": -41.993995666503906, "global_step": 253658, "epoch": 2096} {"train_loss": -41.88056182861328, "global_step": 253659, "epoch": 2096} {"train_loss": -42.22028350830078, "global_step": 253660, "epoch": 2096} {"train_loss": -42.32817077636719, "global_step": 253661, "epoch": 2096} {"train_loss": -42.31687545776367, "global_step": 253662, "epoch": 2096} {"train_loss": -42.195674896240234, "global_step": 253663, "epoch": 2096} {"train_loss": -42.120521545410156, "global_step": 253664, "epoch": 2096} {"train_loss": -42.606136322021484, "global_step": 253665, "epoch": 2096} {"train_loss": -42.95957946777344, "global_step": 253666, "epoch": 2096} {"train_loss": -42.46004104614258, "global_step": 253667, "epoch": 2096} {"train_loss": -42.39038848876953, "global_step": 253668, "epoch": 2096} {"train_loss": -43.8280029296875, "global_step": 253669, "epoch": 2096} {"train_loss": -42.69710922241211, "global_step": 253670, "epoch": 2096} {"train_loss": -41.974403381347656, "global_step": 253671, "epoch": 2096} {"train_loss": -42.2158203125, "global_step": 253672, "epoch": 2096} {"train_loss": -41.48237991333008, "global_step": 253673, "epoch": 2096} {"train_loss": -41.02836227416992, "global_step": 253674, "epoch": 2096} {"train_loss": -41.80938720703125, "global_step": 253675, "epoch": 2096} {"train_loss": -42.180721282958984, "global_step": 253676, "epoch": 2096} {"train_loss": -41.07316207885742, "global_step": 253677, "epoch": 2096} {"train_loss": -41.45731735229492, "global_step": 253678, "epoch": 2096} {"train_loss": -42.9564208984375, "global_step": 253679, "epoch": 2096} {"train_loss": -42.213134765625, "global_step": 253680, "epoch": 2096} {"train_loss": -41.92973709106445, "global_step": 253681, "epoch": 2096} {"train_loss": -41.88572692871094, "global_step": 253682, "epoch": 2096} {"train_loss": -43.537841796875, "global_step": 253683, "epoch": 2096} {"train_loss": -41.95975875854492, "global_step": 253684, "epoch": 2096} {"train_loss": -41.542701721191406, "global_step": 253685, "epoch": 2096} {"train_loss": -42.57081985473633, "global_step": 253686, "epoch": 2096} {"train_loss": -41.9046516418457, "global_step": 253687, "epoch": 2096} {"train_loss": -40.921165466308594, "global_step": 253688, "epoch": 2096} {"train_loss": -41.83903503417969, "global_step": 253689, "epoch": 2096} {"train_loss": -43.054443359375, "global_step": 253690, "epoch": 2096} {"train_loss": -42.38343048095703, "global_step": 253691, "epoch": 2096} {"train_loss": -41.55927658081055, "global_step": 253692, "epoch": 2096} {"train_loss": -42.96589279174805, "global_step": 253693, "epoch": 2096} {"train_loss": -42.440799713134766, "global_step": 253694, "epoch": 2096} {"train_loss": -42.64215087890625, "global_step": 253695, "epoch": 2096} {"train_loss": -42.50516128540039, "global_step": 253696, "epoch": 2096} {"train_loss": -42.76229476928711, "global_step": 253697, "epoch": 2096} {"train_loss": -42.70296859741211, "global_step": 253698, "epoch": 2096} {"train_loss": -43.14028549194336, "global_step": 253699, "epoch": 2096} {"train_loss": -42.654903411865234, "global_step": 253700, "epoch": 2096} {"train_loss": -42.4894905090332, "global_step": 253701, "epoch": 2096} {"train_loss": -43.1945915222168, "global_step": 253702, "epoch": 2096} {"train_loss": -43.27946853637695, "global_step": 253703, "epoch": 2096} {"train_loss": -43.07109451293945, "global_step": 253704, "epoch": 2096} {"train_loss": -42.52061080932617, "global_step": 253705, "epoch": 2096} {"train_loss": -43.28911209106445, "global_step": 253706, "epoch": 2096} {"train_loss": -43.32803726196289, "global_step": 253707, "epoch": 2096} {"train_loss": -42.515621185302734, "global_step": 253708, "epoch": 2096} {"train_loss": -42.98843002319336, "global_step": 253709, "epoch": 2096} {"train_loss": -43.005306243896484, "global_step": 253710, "epoch": 2096} {"train_loss": -43.58594512939453, "global_step": 253711, "epoch": 2096} {"train_loss": -42.86921310424805, "global_step": 253712, "epoch": 2096} {"train_loss": -42.69340896606445, "global_step": 253713, "epoch": 2096} {"train_loss": -43.07636642456055, "global_step": 253714, "epoch": 2096} {"train_loss": -42.57365036010742, "global_step": 253715, "epoch": 2096} {"train_loss": -42.90633773803711, "global_step": 253716, "epoch": 2096} {"train_loss": -43.19829177856445, "global_step": 253717, "epoch": 2096} {"train_loss": -42.91978073120117, "global_step": 253718, "epoch": 2096} {"train_loss": -42.285099029541016, "global_step": 253719, "epoch": 2096} {"train_loss": -43.1660270690918, "global_step": 253720, "epoch": 2096} {"train_loss": -41.995574951171875, "global_step": 253721, "epoch": 2096} {"train_loss": -41.47968673706055, "global_step": 253722, "epoch": 2096} {"train_loss": -42.55730056762695, "global_step": 253723, "epoch": 2096} {"train_loss": -43.29527282714844, "global_step": 253724, "epoch": 2096} {"train_loss": -42.17132568359375, "global_step": 253725, "epoch": 2096} {"train_loss": -41.19561767578125, "global_step": 253726, "epoch": 2096} {"train_loss": -40.16366958618164, "global_step": 253727, "epoch": 2096} {"train_loss": -42.03208541870117, "global_step": 253728, "epoch": 2096} {"train_loss": -42.16470718383789, "global_step": 253729, "epoch": 2096} {"train_loss": -41.54823684692383, "global_step": 253730, "epoch": 2096} {"train_loss": -41.724159240722656, "global_step": 253731, "epoch": 2096} {"train_loss": -42.55605697631836, "global_step": 253732, "epoch": 2096} {"train_loss": -42.90022659301758, "global_step": 253733, "epoch": 2096} {"train_loss": -42.81694030761719, "global_step": 253734, "epoch": 2096} {"train_loss": -43.346885681152344, "global_step": 253735, "epoch": 2096} {"train_loss": -42.34653589548158, "global_step": 253736, "epoch": 2096, "val_loss": 2700813.0} {"train_loss": -43.32712936401367, "global_step": 253737, "epoch": 2097} {"train_loss": -43.4180908203125, "global_step": 253738, "epoch": 2097} {"train_loss": -43.076107025146484, "global_step": 253739, "epoch": 2097} {"train_loss": -43.28868865966797, "global_step": 253740, "epoch": 2097} {"train_loss": -43.27216339111328, "global_step": 253741, "epoch": 2097} {"train_loss": -43.188568115234375, "global_step": 253742, "epoch": 2097} {"train_loss": -43.55353927612305, "global_step": 253743, "epoch": 2097} {"train_loss": -43.49993896484375, "global_step": 253744, "epoch": 2097} {"train_loss": -43.86513900756836, "global_step": 253745, "epoch": 2097} {"train_loss": -42.92292022705078, "global_step": 253746, "epoch": 2097} {"train_loss": -43.306941986083984, "global_step": 253747, "epoch": 2097} {"train_loss": -43.47855758666992, "global_step": 253748, "epoch": 2097} {"train_loss": -43.19832992553711, "global_step": 253749, "epoch": 2097} {"train_loss": -43.300106048583984, "global_step": 253750, "epoch": 2097} {"train_loss": -42.65633773803711, "global_step": 253751, "epoch": 2097} {"train_loss": -43.24406051635742, "global_step": 253752, "epoch": 2097} {"train_loss": -43.50150680541992, "global_step": 253753, "epoch": 2097} {"train_loss": -43.14542007446289, "global_step": 253754, "epoch": 2097} {"train_loss": -41.66672134399414, "global_step": 253755, "epoch": 2097} {"train_loss": -41.66230392456055, "global_step": 253756, "epoch": 2097} {"train_loss": -42.70905685424805, "global_step": 253757, "epoch": 2097} {"train_loss": -43.75117874145508, "global_step": 253758, "epoch": 2097} {"train_loss": -43.328182220458984, "global_step": 253759, "epoch": 2097} {"train_loss": -42.73942184448242, "global_step": 253760, "epoch": 2097} {"train_loss": -43.2285041809082, "global_step": 253761, "epoch": 2097} {"train_loss": -43.9055290222168, "global_step": 253762, "epoch": 2097} {"train_loss": -42.43128204345703, "global_step": 253763, "epoch": 2097} {"train_loss": -42.6245002746582, "global_step": 253764, "epoch": 2097} {"train_loss": -42.49691390991211, "global_step": 253765, "epoch": 2097} {"train_loss": -43.50202178955078, "global_step": 253766, "epoch": 2097} {"train_loss": -43.345252990722656, "global_step": 253767, "epoch": 2097} {"train_loss": -42.841064453125, "global_step": 253768, "epoch": 2097} {"train_loss": -42.42048263549805, "global_step": 253769, "epoch": 2097} {"train_loss": -42.358436584472656, "global_step": 253770, "epoch": 2097} {"train_loss": -42.734249114990234, "global_step": 253771, "epoch": 2097} {"train_loss": -42.55898666381836, "global_step": 253772, "epoch": 2097} {"train_loss": -42.474571228027344, "global_step": 253773, "epoch": 2097} {"train_loss": -42.25965118408203, "global_step": 253774, "epoch": 2097} {"train_loss": -41.13167190551758, "global_step": 253775, "epoch": 2097} {"train_loss": -42.3172607421875, "global_step": 253776, "epoch": 2097} {"train_loss": -43.586036682128906, "global_step": 253777, "epoch": 2097} {"train_loss": -41.48115921020508, "global_step": 253778, "epoch": 2097} {"train_loss": -41.98176193237305, "global_step": 253779, "epoch": 2097} {"train_loss": -43.11333465576172, "global_step": 253780, "epoch": 2097} {"train_loss": -42.5612907409668, "global_step": 253781, "epoch": 2097} {"train_loss": -40.34505081176758, "global_step": 253782, "epoch": 2097} {"train_loss": -41.17234802246094, "global_step": 253783, "epoch": 2097} {"train_loss": -41.36163330078125, "global_step": 253784, "epoch": 2097} {"train_loss": -42.32143020629883, "global_step": 253785, "epoch": 2097} {"train_loss": -38.926239013671875, "global_step": 253786, "epoch": 2097} {"train_loss": -41.90742111206055, "global_step": 253787, "epoch": 2097} {"train_loss": -38.43873977661133, "global_step": 253788, "epoch": 2097} {"train_loss": -39.903594970703125, "global_step": 253789, "epoch": 2097} {"train_loss": -39.494850158691406, "global_step": 253790, "epoch": 2097} {"train_loss": -41.123252868652344, "global_step": 253791, "epoch": 2097} {"train_loss": -40.10614776611328, "global_step": 253792, "epoch": 2097} {"train_loss": -38.946964263916016, "global_step": 253793, "epoch": 2097} {"train_loss": -41.4365234375, "global_step": 253794, "epoch": 2097} {"train_loss": -39.258941650390625, "global_step": 253795, "epoch": 2097} {"train_loss": -42.43857955932617, "global_step": 253796, "epoch": 2097} {"train_loss": -40.32061767578125, "global_step": 253797, "epoch": 2097} {"train_loss": -39.94013595581055, "global_step": 253798, "epoch": 2097} {"train_loss": -41.79764938354492, "global_step": 253799, "epoch": 2097} {"train_loss": -41.79921340942383, "global_step": 253800, "epoch": 2097} {"train_loss": -40.95318603515625, "global_step": 253801, "epoch": 2097} {"train_loss": -42.019596099853516, "global_step": 253802, "epoch": 2097} {"train_loss": -40.822723388671875, "global_step": 253803, "epoch": 2097} {"train_loss": -42.09907913208008, "global_step": 253804, "epoch": 2097} {"train_loss": -41.64972686767578, "global_step": 253805, "epoch": 2097} {"train_loss": -41.214290618896484, "global_step": 253806, "epoch": 2097} {"train_loss": -42.97670364379883, "global_step": 253807, "epoch": 2097} {"train_loss": -42.58901596069336, "global_step": 253808, "epoch": 2097} {"train_loss": -41.000972747802734, "global_step": 253809, "epoch": 2097} {"train_loss": -42.9175910949707, "global_step": 253810, "epoch": 2097} {"train_loss": -42.245697021484375, "global_step": 253811, "epoch": 2097} {"train_loss": -42.814598083496094, "global_step": 253812, "epoch": 2097} {"train_loss": -42.63418197631836, "global_step": 253813, "epoch": 2097} {"train_loss": -42.96226119995117, "global_step": 253814, "epoch": 2097} {"train_loss": -42.932220458984375, "global_step": 253815, "epoch": 2097} {"train_loss": -43.2303466796875, "global_step": 253816, "epoch": 2097} {"train_loss": -42.51864242553711, "global_step": 253817, "epoch": 2097} {"train_loss": -42.535884857177734, "global_step": 253818, "epoch": 2097} {"train_loss": -42.49079513549805, "global_step": 253819, "epoch": 2097} {"train_loss": -42.70833969116211, "global_step": 253820, "epoch": 2097} {"train_loss": -42.887046813964844, "global_step": 253821, "epoch": 2097} {"train_loss": -42.518306732177734, "global_step": 253822, "epoch": 2097} {"train_loss": -43.13369369506836, "global_step": 253823, "epoch": 2097} {"train_loss": -43.10319900512695, "global_step": 253824, "epoch": 2097} {"train_loss": -42.669857025146484, "global_step": 253825, "epoch": 2097} {"train_loss": -43.1016731262207, "global_step": 253826, "epoch": 2097} {"train_loss": -42.889034271240234, "global_step": 253827, "epoch": 2097} {"train_loss": -43.05424118041992, "global_step": 253828, "epoch": 2097} {"train_loss": -43.52383804321289, "global_step": 253829, "epoch": 2097} {"train_loss": -43.184417724609375, "global_step": 253830, "epoch": 2097} {"train_loss": -43.39893341064453, "global_step": 253831, "epoch": 2097} {"train_loss": -43.399261474609375, "global_step": 253832, "epoch": 2097} {"train_loss": -43.7148551940918, "global_step": 253833, "epoch": 2097} {"train_loss": -43.72509765625, "global_step": 253834, "epoch": 2097} {"train_loss": -43.53791046142578, "global_step": 253835, "epoch": 2097} {"train_loss": -43.312095642089844, "global_step": 253836, "epoch": 2097} {"train_loss": -43.37747573852539, "global_step": 253837, "epoch": 2097} {"train_loss": -43.41533279418945, "global_step": 253838, "epoch": 2097} {"train_loss": -43.80430603027344, "global_step": 253839, "epoch": 2097} {"train_loss": -43.86009216308594, "global_step": 253840, "epoch": 2097} {"train_loss": -43.0883903503418, "global_step": 253841, "epoch": 2097} {"train_loss": -43.13606643676758, "global_step": 253842, "epoch": 2097} {"train_loss": -43.979881286621094, "global_step": 253843, "epoch": 2097} {"train_loss": -43.54229736328125, "global_step": 253844, "epoch": 2097} {"train_loss": -42.89167022705078, "global_step": 253845, "epoch": 2097} {"train_loss": -43.00421142578125, "global_step": 253846, "epoch": 2097} {"train_loss": -42.49238967895508, "global_step": 253847, "epoch": 2097} {"train_loss": -42.850704193115234, "global_step": 253848, "epoch": 2097} {"train_loss": -43.616512298583984, "global_step": 253849, "epoch": 2097} {"train_loss": -42.217464447021484, "global_step": 253850, "epoch": 2097} {"train_loss": -41.444854736328125, "global_step": 253851, "epoch": 2097} {"train_loss": -39.978824615478516, "global_step": 253852, "epoch": 2097} {"train_loss": -40.046791076660156, "global_step": 253853, "epoch": 2097} {"train_loss": -40.438140869140625, "global_step": 253854, "epoch": 2097} {"train_loss": -39.85050582885742, "global_step": 253855, "epoch": 2097} {"train_loss": -41.31782913208008, "global_step": 253856, "epoch": 2097} {"train_loss": -42.3921299138345, "global_step": 253857, "epoch": 2097, "val_loss": 2728600.75} {"train_loss": -42.122161865234375, "global_step": 253858, "epoch": 2098} {"train_loss": -40.8809814453125, "global_step": 253859, "epoch": 2098} {"train_loss": -41.3996696472168, "global_step": 253860, "epoch": 2098} {"train_loss": -42.546566009521484, "global_step": 253861, "epoch": 2098} {"train_loss": -41.86814498901367, "global_step": 253862, "epoch": 2098} {"train_loss": -39.3004035949707, "global_step": 253863, "epoch": 2098} {"train_loss": -39.27898025512695, "global_step": 253864, "epoch": 2098} {"train_loss": -41.573585510253906, "global_step": 253865, "epoch": 2098} {"train_loss": -40.33823013305664, "global_step": 253866, "epoch": 2098} {"train_loss": -39.2365837097168, "global_step": 253867, "epoch": 2098} {"train_loss": -39.43076705932617, "global_step": 253868, "epoch": 2098} {"train_loss": -40.149658203125, "global_step": 253869, "epoch": 2098} {"train_loss": -38.72052764892578, "global_step": 253870, "epoch": 2098} {"train_loss": -39.627925872802734, "global_step": 253871, "epoch": 2098} {"train_loss": -40.07046127319336, "global_step": 253872, "epoch": 2098} {"train_loss": -42.703495025634766, "global_step": 253873, "epoch": 2098} {"train_loss": -38.6032600402832, "global_step": 253874, "epoch": 2098} {"train_loss": -41.74304962158203, "global_step": 253875, "epoch": 2098} {"train_loss": -40.49273681640625, "global_step": 253876, "epoch": 2098} {"train_loss": -41.59590530395508, "global_step": 253877, "epoch": 2098} {"train_loss": -39.60039138793945, "global_step": 253878, "epoch": 2098} {"train_loss": -41.19552230834961, "global_step": 253879, "epoch": 2098} {"train_loss": -40.259429931640625, "global_step": 253880, "epoch": 2098} {"train_loss": -41.25840377807617, "global_step": 253881, "epoch": 2098} {"train_loss": -41.847835540771484, "global_step": 253882, "epoch": 2098} {"train_loss": -39.36143112182617, "global_step": 253883, "epoch": 2098} {"train_loss": -41.40507125854492, "global_step": 253884, "epoch": 2098} {"train_loss": -41.641357421875, "global_step": 253885, "epoch": 2098} {"train_loss": -40.049659729003906, "global_step": 253886, "epoch": 2098} {"train_loss": -41.99959182739258, "global_step": 253887, "epoch": 2098} {"train_loss": -41.27009201049805, "global_step": 253888, "epoch": 2098} {"train_loss": -41.29437255859375, "global_step": 253889, "epoch": 2098} {"train_loss": -42.37195587158203, "global_step": 253890, "epoch": 2098} {"train_loss": -40.84261703491211, "global_step": 253891, "epoch": 2098} {"train_loss": -42.6740837097168, "global_step": 253892, "epoch": 2098} {"train_loss": -41.756080627441406, "global_step": 253893, "epoch": 2098} {"train_loss": -42.64277267456055, "global_step": 253894, "epoch": 2098} {"train_loss": -41.995601654052734, "global_step": 253895, "epoch": 2098} {"train_loss": -42.4119758605957, "global_step": 253896, "epoch": 2098} {"train_loss": -42.5532112121582, "global_step": 253897, "epoch": 2098} {"train_loss": -42.54194259643555, "global_step": 253898, "epoch": 2098} {"train_loss": -42.58725357055664, "global_step": 253899, "epoch": 2098} {"train_loss": -42.870845794677734, "global_step": 253900, "epoch": 2098} {"train_loss": -42.62477493286133, "global_step": 253901, "epoch": 2098} {"train_loss": -42.51399230957031, "global_step": 253902, "epoch": 2098} {"train_loss": -42.421531677246094, "global_step": 253903, "epoch": 2098} {"train_loss": -41.93412399291992, "global_step": 253904, "epoch": 2098} {"train_loss": -42.91111373901367, "global_step": 253905, "epoch": 2098} {"train_loss": -41.29196548461914, "global_step": 253906, "epoch": 2098} {"train_loss": -42.577632904052734, "global_step": 253907, "epoch": 2098} {"train_loss": -42.59624481201172, "global_step": 253908, "epoch": 2098} {"train_loss": -41.35765075683594, "global_step": 253909, "epoch": 2098} {"train_loss": -42.20667266845703, "global_step": 253910, "epoch": 2098} {"train_loss": -40.813018798828125, "global_step": 253911, "epoch": 2098} {"train_loss": -42.21995162963867, "global_step": 253912, "epoch": 2098} {"train_loss": -41.605159759521484, "global_step": 253913, "epoch": 2098} {"train_loss": -42.73716354370117, "global_step": 253914, "epoch": 2098} {"train_loss": -42.576637268066406, "global_step": 253915, "epoch": 2098} {"train_loss": -42.26953125, "global_step": 253916, "epoch": 2098} {"train_loss": -41.976932525634766, "global_step": 253917, "epoch": 2098} {"train_loss": -42.418819427490234, "global_step": 253918, "epoch": 2098} {"train_loss": -42.21040725708008, "global_step": 253919, "epoch": 2098} {"train_loss": -43.062530517578125, "global_step": 253920, "epoch": 2098} {"train_loss": -42.10634994506836, "global_step": 253921, "epoch": 2098} {"train_loss": -43.14491653442383, "global_step": 253922, "epoch": 2098} {"train_loss": -42.739646911621094, "global_step": 253923, "epoch": 2098} {"train_loss": -42.74254608154297, "global_step": 253924, "epoch": 2098} {"train_loss": -43.72428512573242, "global_step": 253925, "epoch": 2098} {"train_loss": -43.30045700073242, "global_step": 253926, "epoch": 2098} {"train_loss": -43.261051177978516, "global_step": 253927, "epoch": 2098} {"train_loss": -42.94035720825195, "global_step": 253928, "epoch": 2098} {"train_loss": -43.44989013671875, "global_step": 253929, "epoch": 2098} {"train_loss": -43.59064865112305, "global_step": 253930, "epoch": 2098} {"train_loss": -43.4854621887207, "global_step": 253931, "epoch": 2098} {"train_loss": -43.48883056640625, "global_step": 253932, "epoch": 2098} {"train_loss": -43.40357208251953, "global_step": 253933, "epoch": 2098} {"train_loss": -43.2138671875, "global_step": 253934, "epoch": 2098} {"train_loss": -43.55768585205078, "global_step": 253935, "epoch": 2098} {"train_loss": -43.58477783203125, "global_step": 253936, "epoch": 2098} {"train_loss": -43.97831344604492, "global_step": 253937, "epoch": 2098} {"train_loss": -43.84084701538086, "global_step": 253938, "epoch": 2098} {"train_loss": -43.20969772338867, "global_step": 253939, "epoch": 2098} {"train_loss": -43.993080139160156, "global_step": 253940, "epoch": 2098} {"train_loss": -43.381614685058594, "global_step": 253941, "epoch": 2098} {"train_loss": -43.54531478881836, "global_step": 253942, "epoch": 2098} {"train_loss": -43.6341438293457, "global_step": 253943, "epoch": 2098} {"train_loss": -43.32918167114258, "global_step": 253944, "epoch": 2098} {"train_loss": -43.650428771972656, "global_step": 253945, "epoch": 2098} {"train_loss": -43.1813850402832, "global_step": 253946, "epoch": 2098} {"train_loss": -43.6068000793457, "global_step": 253947, "epoch": 2098} {"train_loss": -43.411346435546875, "global_step": 253948, "epoch": 2098} {"train_loss": -44.10028076171875, "global_step": 253949, "epoch": 2098} {"train_loss": -43.18190383911133, "global_step": 253950, "epoch": 2098} {"train_loss": -43.55659103393555, "global_step": 253951, "epoch": 2098} {"train_loss": -44.33085250854492, "global_step": 253952, "epoch": 2098} {"train_loss": -43.75031661987305, "global_step": 253953, "epoch": 2098} {"train_loss": -43.79622268676758, "global_step": 253954, "epoch": 2098} {"train_loss": -44.1064453125, "global_step": 253955, "epoch": 2098} {"train_loss": -43.410247802734375, "global_step": 253956, "epoch": 2098} {"train_loss": -43.93251419067383, "global_step": 253957, "epoch": 2098} {"train_loss": -44.32102584838867, "global_step": 253958, "epoch": 2098} {"train_loss": -43.42112350463867, "global_step": 253959, "epoch": 2098} {"train_loss": -43.30324172973633, "global_step": 253960, "epoch": 2098} {"train_loss": -42.732017517089844, "global_step": 253961, "epoch": 2098} {"train_loss": -43.424373626708984, "global_step": 253962, "epoch": 2098} {"train_loss": -43.08696365356445, "global_step": 253963, "epoch": 2098} {"train_loss": -42.925262451171875, "global_step": 253964, "epoch": 2098} {"train_loss": -43.492034912109375, "global_step": 253965, "epoch": 2098} {"train_loss": -43.360137939453125, "global_step": 253966, "epoch": 2098} {"train_loss": -43.04807662963867, "global_step": 253967, "epoch": 2098} {"train_loss": -43.780487060546875, "global_step": 253968, "epoch": 2098} {"train_loss": -43.08066940307617, "global_step": 253969, "epoch": 2098} {"train_loss": -42.63352584838867, "global_step": 253970, "epoch": 2098} {"train_loss": -43.603973388671875, "global_step": 253971, "epoch": 2098} {"train_loss": -43.1128044128418, "global_step": 253972, "epoch": 2098} {"train_loss": -42.19929122924805, "global_step": 253973, "epoch": 2098} {"train_loss": -42.49274826049805, "global_step": 253974, "epoch": 2098} {"train_loss": -43.59855270385742, "global_step": 253975, "epoch": 2098} {"train_loss": -43.635616302490234, "global_step": 253976, "epoch": 2098} {"train_loss": -43.20077896118164, "global_step": 253977, "epoch": 2098} {"train_loss": -42.39048899500823, "global_step": 253978, "epoch": 2098, "val_loss": 2660676.75} {"train_loss": -43.86820983886719, "global_step": 253979, "epoch": 2099} {"train_loss": -43.183624267578125, "global_step": 253980, "epoch": 2099} {"train_loss": -43.32251739501953, "global_step": 253981, "epoch": 2099} {"train_loss": -42.491241455078125, "global_step": 253982, "epoch": 2099} {"train_loss": -41.62600326538086, "global_step": 253983, "epoch": 2099} {"train_loss": -40.945228576660156, "global_step": 253984, "epoch": 2099} {"train_loss": -41.506019592285156, "global_step": 253985, "epoch": 2099} {"train_loss": -42.25730514526367, "global_step": 253986, "epoch": 2099} {"train_loss": -43.48550033569336, "global_step": 253987, "epoch": 2099} {"train_loss": -42.744503021240234, "global_step": 253988, "epoch": 2099} {"train_loss": -41.66216278076172, "global_step": 253989, "epoch": 2099} {"train_loss": -40.95649337768555, "global_step": 253990, "epoch": 2099} {"train_loss": -42.975624084472656, "global_step": 253991, "epoch": 2099} {"train_loss": -43.642208099365234, "global_step": 253992, "epoch": 2099} {"train_loss": -40.55103302001953, "global_step": 253993, "epoch": 2099} {"train_loss": -40.69208908081055, "global_step": 253994, "epoch": 2099} {"train_loss": -42.72567367553711, "global_step": 253995, "epoch": 2099} {"train_loss": -42.0736198425293, "global_step": 253996, "epoch": 2099} {"train_loss": -41.233272552490234, "global_step": 253997, "epoch": 2099} {"train_loss": -41.84586715698242, "global_step": 253998, "epoch": 2099} {"train_loss": -43.465572357177734, "global_step": 253999, "epoch": 2099} {"train_loss": -42.217857360839844, "global_step": 254000, "epoch": 2099} {"train_loss": -43.122352600097656, "global_step": 254001, "epoch": 2099} {"train_loss": -42.12553405761719, "global_step": 254002, "epoch": 2099} {"train_loss": -40.629783630371094, "global_step": 254003, "epoch": 2099} {"train_loss": -41.44630813598633, "global_step": 254004, "epoch": 2099} {"train_loss": -42.6796989440918, "global_step": 254005, "epoch": 2099} {"train_loss": -40.33091735839844, "global_step": 254006, "epoch": 2099} {"train_loss": -41.12844467163086, "global_step": 254007, "epoch": 2099} {"train_loss": -41.46051025390625, "global_step": 254008, "epoch": 2099} {"train_loss": -40.72709274291992, "global_step": 254009, "epoch": 2099} {"train_loss": -42.41987609863281, "global_step": 254010, "epoch": 2099} {"train_loss": -40.8495979309082, "global_step": 254011, "epoch": 2099} {"train_loss": -43.30088424682617, "global_step": 254012, "epoch": 2099} {"train_loss": -41.63187789916992, "global_step": 254013, "epoch": 2099} {"train_loss": -41.18174362182617, "global_step": 254014, "epoch": 2099} {"train_loss": -43.30140686035156, "global_step": 254015, "epoch": 2099} {"train_loss": -41.754066467285156, "global_step": 254016, "epoch": 2099} {"train_loss": -42.022953033447266, "global_step": 254017, "epoch": 2099} {"train_loss": -42.0929069519043, "global_step": 254018, "epoch": 2099} {"train_loss": -43.20890426635742, "global_step": 254019, "epoch": 2099} {"train_loss": -42.76621627807617, "global_step": 254020, "epoch": 2099} {"train_loss": -42.92928695678711, "global_step": 254021, "epoch": 2099} {"train_loss": -41.48258590698242, "global_step": 254022, "epoch": 2099} {"train_loss": -42.67477035522461, "global_step": 254023, "epoch": 2099} {"train_loss": -43.10060119628906, "global_step": 254024, "epoch": 2099} {"train_loss": -42.7806510925293, "global_step": 254025, "epoch": 2099} {"train_loss": -42.93653106689453, "global_step": 254026, "epoch": 2099} {"train_loss": -43.07402038574219, "global_step": 254027, "epoch": 2099} {"train_loss": -43.298675537109375, "global_step": 254028, "epoch": 2099} {"train_loss": -42.95669174194336, "global_step": 254029, "epoch": 2099} {"train_loss": -43.10872268676758, "global_step": 254030, "epoch": 2099} {"train_loss": -43.31781768798828, "global_step": 254031, "epoch": 2099} {"train_loss": -43.38789749145508, "global_step": 254032, "epoch": 2099} {"train_loss": -42.92634963989258, "global_step": 254033, "epoch": 2099} {"train_loss": -43.55704879760742, "global_step": 254034, "epoch": 2099} {"train_loss": -43.57347869873047, "global_step": 254035, "epoch": 2099} {"train_loss": -43.38787841796875, "global_step": 254036, "epoch": 2099} {"train_loss": -43.93033981323242, "global_step": 254037, "epoch": 2099} {"train_loss": -43.582130432128906, "global_step": 254038, "epoch": 2099} {"train_loss": -42.938411712646484, "global_step": 254039, "epoch": 2099} {"train_loss": -43.55986785888672, "global_step": 254040, "epoch": 2099} {"train_loss": -43.6987190246582, "global_step": 254041, "epoch": 2099} {"train_loss": -44.096397399902344, "global_step": 254042, "epoch": 2099} {"train_loss": -44.08689880371094, "global_step": 254043, "epoch": 2099} {"train_loss": -43.17593002319336, "global_step": 254044, "epoch": 2099} {"train_loss": -42.45600128173828, "global_step": 254045, "epoch": 2099} {"train_loss": -41.634334564208984, "global_step": 254046, "epoch": 2099} {"train_loss": -42.889678955078125, "global_step": 254047, "epoch": 2099} {"train_loss": -43.83381271362305, "global_step": 254048, "epoch": 2099} {"train_loss": -43.07694625854492, "global_step": 254049, "epoch": 2099} {"train_loss": -42.666255950927734, "global_step": 254050, "epoch": 2099} {"train_loss": -42.72005844116211, "global_step": 254051, "epoch": 2099} {"train_loss": -42.53871536254883, "global_step": 254052, "epoch": 2099} {"train_loss": -43.53986358642578, "global_step": 254053, "epoch": 2099} {"train_loss": -43.296566009521484, "global_step": 254054, "epoch": 2099} {"train_loss": -42.900115966796875, "global_step": 254055, "epoch": 2099} {"train_loss": -42.574703216552734, "global_step": 254056, "epoch": 2099} {"train_loss": -43.106746673583984, "global_step": 254057, "epoch": 2099} {"train_loss": -43.288814544677734, "global_step": 254058, "epoch": 2099} {"train_loss": -43.53736877441406, "global_step": 254059, "epoch": 2099} {"train_loss": -43.736202239990234, "global_step": 254060, "epoch": 2099} {"train_loss": -42.890480041503906, "global_step": 254061, "epoch": 2099} {"train_loss": -41.103389739990234, "global_step": 254062, "epoch": 2099} {"train_loss": -38.88283920288086, "global_step": 254063, "epoch": 2099} {"train_loss": -40.925697326660156, "global_step": 254064, "epoch": 2099} {"train_loss": -42.210872650146484, "global_step": 254065, "epoch": 2099} {"train_loss": -41.24812698364258, "global_step": 254066, "epoch": 2099} {"train_loss": -41.2382698059082, "global_step": 254067, "epoch": 2099} {"train_loss": -41.86411666870117, "global_step": 254068, "epoch": 2099} {"train_loss": -41.164825439453125, "global_step": 254069, "epoch": 2099} {"train_loss": -42.63454055786133, "global_step": 254070, "epoch": 2099} {"train_loss": -42.75313949584961, "global_step": 254071, "epoch": 2099} {"train_loss": -41.75935363769531, "global_step": 254072, "epoch": 2099} {"train_loss": -41.272064208984375, "global_step": 254073, "epoch": 2099} {"train_loss": -42.02224349975586, "global_step": 254074, "epoch": 2099} {"train_loss": -42.42524337768555, "global_step": 254075, "epoch": 2099} {"train_loss": -42.4135856628418, "global_step": 254076, "epoch": 2099} {"train_loss": -42.705055236816406, "global_step": 254077, "epoch": 2099} {"train_loss": -42.66238021850586, "global_step": 254078, "epoch": 2099} {"train_loss": -43.03413009643555, "global_step": 254079, "epoch": 2099} {"train_loss": -42.85160827636719, "global_step": 254080, "epoch": 2099} {"train_loss": -43.063812255859375, "global_step": 254081, "epoch": 2099} {"train_loss": -43.162044525146484, "global_step": 254082, "epoch": 2099} {"train_loss": -42.688148498535156, "global_step": 254083, "epoch": 2099} {"train_loss": -43.0625, "global_step": 254084, "epoch": 2099} {"train_loss": -43.32993698120117, "global_step": 254085, "epoch": 2099} {"train_loss": -42.733123779296875, "global_step": 254086, "epoch": 2099} {"train_loss": -43.147117614746094, "global_step": 254087, "epoch": 2099} {"train_loss": -42.71689987182617, "global_step": 254088, "epoch": 2099} {"train_loss": -43.077362060546875, "global_step": 254089, "epoch": 2099} {"train_loss": -42.59883499145508, "global_step": 254090, "epoch": 2099} {"train_loss": -43.10307693481445, "global_step": 254091, "epoch": 2099} {"train_loss": -43.54575729370117, "global_step": 254092, "epoch": 2099} {"train_loss": -43.10667037963867, "global_step": 254093, "epoch": 2099} {"train_loss": -43.1346549987793, "global_step": 254094, "epoch": 2099} {"train_loss": -43.08083724975586, "global_step": 254095, "epoch": 2099} {"train_loss": -42.99502182006836, "global_step": 254096, "epoch": 2099} {"train_loss": -40.76776885986328, "global_step": 254097, "epoch": 2099} {"train_loss": -39.80610275268555, "global_step": 254098, "epoch": 2099} {"train_loss": -42.50404420963004, "global_step": 254099, "epoch": 2099, "val_loss": 2728193.25} {"train_loss": -42.65018844604492, "global_step": 254100, "epoch": 2100} {"train_loss": -40.17538070678711, "global_step": 254101, "epoch": 2100} {"train_loss": -42.8328742980957, "global_step": 254102, "epoch": 2100} {"train_loss": -42.54533004760742, "global_step": 254103, "epoch": 2100} {"train_loss": -40.85710144042969, "global_step": 254104, "epoch": 2100} {"train_loss": -42.954647064208984, "global_step": 254105, "epoch": 2100} {"train_loss": -42.462684631347656, "global_step": 254106, "epoch": 2100} {"train_loss": -42.70847702026367, "global_step": 254107, "epoch": 2100} {"train_loss": -43.660987854003906, "global_step": 254108, "epoch": 2100} {"train_loss": -43.2815055847168, "global_step": 254109, "epoch": 2100} {"train_loss": -43.56501007080078, "global_step": 254110, "epoch": 2100} {"train_loss": -43.00233459472656, "global_step": 254111, "epoch": 2100} {"train_loss": -42.521705627441406, "global_step": 254112, "epoch": 2100} {"train_loss": -43.379295349121094, "global_step": 254113, "epoch": 2100} {"train_loss": -43.10532760620117, "global_step": 254114, "epoch": 2100} {"train_loss": -42.673526763916016, "global_step": 254115, "epoch": 2100} {"train_loss": -43.39271926879883, "global_step": 254116, "epoch": 2100} {"train_loss": -43.259010314941406, "global_step": 254117, "epoch": 2100} {"train_loss": -43.349327087402344, "global_step": 254118, "epoch": 2100} {"train_loss": -42.85115432739258, "global_step": 254119, "epoch": 2100} {"train_loss": -41.764915466308594, "global_step": 254120, "epoch": 2100} {"train_loss": -43.657981872558594, "global_step": 254121, "epoch": 2100} {"train_loss": -42.90108871459961, "global_step": 254122, "epoch": 2100} {"train_loss": -43.1795539855957, "global_step": 254123, "epoch": 2100} {"train_loss": -42.440826416015625, "global_step": 254124, "epoch": 2100} {"train_loss": -42.65100860595703, "global_step": 254125, "epoch": 2100} {"train_loss": -43.44708251953125, "global_step": 254126, "epoch": 2100} {"train_loss": -41.59333419799805, "global_step": 254127, "epoch": 2100} {"train_loss": -43.237850189208984, "global_step": 254128, "epoch": 2100} {"train_loss": -43.4508171081543, "global_step": 254129, "epoch": 2100} {"train_loss": -41.62700653076172, "global_step": 254130, "epoch": 2100} {"train_loss": -42.59457778930664, "global_step": 254131, "epoch": 2100} {"train_loss": -43.11903762817383, "global_step": 254132, "epoch": 2100} {"train_loss": -41.61151123046875, "global_step": 254133, "epoch": 2100} {"train_loss": -43.26198959350586, "global_step": 254134, "epoch": 2100} {"train_loss": -42.906063079833984, "global_step": 254135, "epoch": 2100} {"train_loss": -42.149009704589844, "global_step": 254136, "epoch": 2100} {"train_loss": -42.540130615234375, "global_step": 254137, "epoch": 2100} {"train_loss": -41.346534729003906, "global_step": 254138, "epoch": 2100} {"train_loss": -41.913917541503906, "global_step": 254139, "epoch": 2100} {"train_loss": -42.622676849365234, "global_step": 254140, "epoch": 2100} {"train_loss": -41.66777038574219, "global_step": 254141, "epoch": 2100} {"train_loss": -43.509132385253906, "global_step": 254142, "epoch": 2100} {"train_loss": -42.827980041503906, "global_step": 254143, "epoch": 2100} {"train_loss": -42.13361358642578, "global_step": 254144, "epoch": 2100} {"train_loss": -42.12517166137695, "global_step": 254145, "epoch": 2100} {"train_loss": -42.385902404785156, "global_step": 254146, "epoch": 2100} {"train_loss": -42.4675178527832, "global_step": 254147, "epoch": 2100} {"train_loss": -43.06557846069336, "global_step": 254148, "epoch": 2100} {"train_loss": -43.39423370361328, "global_step": 254149, "epoch": 2100} {"train_loss": -41.860836029052734, "global_step": 254150, "epoch": 2100} {"train_loss": -42.67820358276367, "global_step": 254151, "epoch": 2100} {"train_loss": -42.55868148803711, "global_step": 254152, "epoch": 2100} {"train_loss": -43.03892517089844, "global_step": 254153, "epoch": 2100} {"train_loss": -42.48057174682617, "global_step": 254154, "epoch": 2100} {"train_loss": -42.69493865966797, "global_step": 254155, "epoch": 2100} {"train_loss": -43.40853500366211, "global_step": 254156, "epoch": 2100} {"train_loss": -42.95072555541992, "global_step": 254157, "epoch": 2100} {"train_loss": -43.49154281616211, "global_step": 254158, "epoch": 2100} {"train_loss": -43.42461013793945, "global_step": 254159, "epoch": 2100} {"train_loss": -43.1941032409668, "global_step": 254160, "epoch": 2100} {"train_loss": -43.35750198364258, "global_step": 254161, "epoch": 2100} {"train_loss": -42.62526321411133, "global_step": 254162, "epoch": 2100} {"train_loss": -41.07740020751953, "global_step": 254163, "epoch": 2100} {"train_loss": -41.57596969604492, "global_step": 254164, "epoch": 2100} {"train_loss": -43.649356842041016, "global_step": 254165, "epoch": 2100} {"train_loss": -42.435176849365234, "global_step": 254166, "epoch": 2100} {"train_loss": -40.29043197631836, "global_step": 254167, "epoch": 2100} {"train_loss": -38.536895751953125, "global_step": 254168, "epoch": 2100} {"train_loss": -41.601768493652344, "global_step": 254169, "epoch": 2100} {"train_loss": -34.889671325683594, "global_step": 254170, "epoch": 2100} {"train_loss": -38.23894119262695, "global_step": 254171, "epoch": 2100} {"train_loss": -42.51553726196289, "global_step": 254172, "epoch": 2100} {"train_loss": -40.61498260498047, "global_step": 254173, "epoch": 2100} {"train_loss": -37.53146743774414, "global_step": 254174, "epoch": 2100} {"train_loss": -38.97916793823242, "global_step": 254175, "epoch": 2100} {"train_loss": -42.13206100463867, "global_step": 254176, "epoch": 2100} {"train_loss": -42.00544357299805, "global_step": 254177, "epoch": 2100} {"train_loss": -41.65792465209961, "global_step": 254178, "epoch": 2100} {"train_loss": -42.17879867553711, "global_step": 254179, "epoch": 2100} {"train_loss": -41.9754638671875, "global_step": 254180, "epoch": 2100} {"train_loss": -42.678592681884766, "global_step": 254181, "epoch": 2100} {"train_loss": -41.939735412597656, "global_step": 254182, "epoch": 2100} {"train_loss": -42.26499557495117, "global_step": 254183, "epoch": 2100} {"train_loss": -41.90910720825195, "global_step": 254184, "epoch": 2100} {"train_loss": -42.481300354003906, "global_step": 254185, "epoch": 2100} {"train_loss": -42.7687873840332, "global_step": 254186, "epoch": 2100} {"train_loss": -42.9035758972168, "global_step": 254187, "epoch": 2100} {"train_loss": -43.03187561035156, "global_step": 254188, "epoch": 2100} {"train_loss": -43.239173889160156, "global_step": 254189, "epoch": 2100} {"train_loss": -42.68929672241211, "global_step": 254190, "epoch": 2100} {"train_loss": -43.2567138671875, "global_step": 254191, "epoch": 2100} {"train_loss": -42.91079330444336, "global_step": 254192, "epoch": 2100} {"train_loss": -43.494422912597656, "global_step": 254193, "epoch": 2100} {"train_loss": -43.56245803833008, "global_step": 254194, "epoch": 2100} {"train_loss": -42.430946350097656, "global_step": 254195, "epoch": 2100} {"train_loss": -43.62764358520508, "global_step": 254196, "epoch": 2100} {"train_loss": -43.26903533935547, "global_step": 254197, "epoch": 2100} {"train_loss": -43.534515380859375, "global_step": 254198, "epoch": 2100} {"train_loss": -43.233619689941406, "global_step": 254199, "epoch": 2100} {"train_loss": -43.32297134399414, "global_step": 254200, "epoch": 2100} {"train_loss": -43.308189392089844, "global_step": 254201, "epoch": 2100} {"train_loss": -43.807647705078125, "global_step": 254202, "epoch": 2100} {"train_loss": -43.58137512207031, "global_step": 254203, "epoch": 2100} {"train_loss": -43.649864196777344, "global_step": 254204, "epoch": 2100} {"train_loss": -43.60787582397461, "global_step": 254205, "epoch": 2100} {"train_loss": -43.64715576171875, "global_step": 254206, "epoch": 2100} {"train_loss": -44.0660285949707, "global_step": 254207, "epoch": 2100} {"train_loss": -43.87358856201172, "global_step": 254208, "epoch": 2100} {"train_loss": -43.8900032043457, "global_step": 254209, "epoch": 2100} {"train_loss": -43.68940734863281, "global_step": 254210, "epoch": 2100} {"train_loss": -43.52479553222656, "global_step": 254211, "epoch": 2100} {"train_loss": -43.67628860473633, "global_step": 254212, "epoch": 2100} {"train_loss": -43.87738800048828, "global_step": 254213, "epoch": 2100} {"train_loss": -44.04269027709961, "global_step": 254214, "epoch": 2100} {"train_loss": -43.865379333496094, "global_step": 254215, "epoch": 2100} {"train_loss": -44.50883865356445, "global_step": 254216, "epoch": 2100} {"train_loss": -43.641021728515625, "global_step": 254217, "epoch": 2100} {"train_loss": -44.29659652709961, "global_step": 254218, "epoch": 2100} {"train_loss": -44.340633392333984, "global_step": 254219, "epoch": 2100} {"train_loss": -42.632733368676554, "global_step": 254220, "epoch": 2100, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2667707.75} {"train_loss": -44.091365814208984, "global_step": 254221, "epoch": 2101} {"train_loss": -44.123985290527344, "global_step": 254222, "epoch": 2101} {"train_loss": -43.15690994262695, "global_step": 254223, "epoch": 2101} {"train_loss": -44.459320068359375, "global_step": 254224, "epoch": 2101} {"train_loss": -44.00693893432617, "global_step": 254225, "epoch": 2101} {"train_loss": -43.46268844604492, "global_step": 254226, "epoch": 2101} {"train_loss": -44.46953582763672, "global_step": 254227, "epoch": 2101} {"train_loss": -44.16523361206055, "global_step": 254228, "epoch": 2101} {"train_loss": -44.570281982421875, "global_step": 254229, "epoch": 2101} {"train_loss": -44.26519775390625, "global_step": 254230, "epoch": 2101} {"train_loss": -44.35976028442383, "global_step": 254231, "epoch": 2101} {"train_loss": -44.1373405456543, "global_step": 254232, "epoch": 2101} {"train_loss": -43.663848876953125, "global_step": 254233, "epoch": 2101} {"train_loss": -43.95618438720703, "global_step": 254234, "epoch": 2101} {"train_loss": -43.95258712768555, "global_step": 254235, "epoch": 2101} {"train_loss": -43.42744827270508, "global_step": 254236, "epoch": 2101} {"train_loss": -42.780059814453125, "global_step": 254237, "epoch": 2101} {"train_loss": -43.32807540893555, "global_step": 254238, "epoch": 2101} {"train_loss": -43.95014572143555, "global_step": 254239, "epoch": 2101} {"train_loss": -44.5150260925293, "global_step": 254240, "epoch": 2101} {"train_loss": -43.11074447631836, "global_step": 254241, "epoch": 2101} {"train_loss": -43.26642990112305, "global_step": 254242, "epoch": 2101} {"train_loss": -42.53424072265625, "global_step": 254243, "epoch": 2101} {"train_loss": -43.06572341918945, "global_step": 254244, "epoch": 2101} {"train_loss": -43.33472442626953, "global_step": 254245, "epoch": 2101} {"train_loss": -43.157161712646484, "global_step": 254246, "epoch": 2101} {"train_loss": -43.03252029418945, "global_step": 254247, "epoch": 2101} {"train_loss": -42.7072868347168, "global_step": 254248, "epoch": 2101} {"train_loss": -44.145973205566406, "global_step": 254249, "epoch": 2101} {"train_loss": -43.414634704589844, "global_step": 254250, "epoch": 2101} {"train_loss": -43.64298629760742, "global_step": 254251, "epoch": 2101} {"train_loss": -41.86635208129883, "global_step": 254252, "epoch": 2101} {"train_loss": -43.846229553222656, "global_step": 254253, "epoch": 2101} {"train_loss": -43.86842727661133, "global_step": 254254, "epoch": 2101} {"train_loss": -43.35685348510742, "global_step": 254255, "epoch": 2101} {"train_loss": -43.22095489501953, "global_step": 254256, "epoch": 2101} {"train_loss": -42.8809700012207, "global_step": 254257, "epoch": 2101} {"train_loss": -42.19501876831055, "global_step": 254258, "epoch": 2101} {"train_loss": -42.877166748046875, "global_step": 254259, "epoch": 2101} {"train_loss": -42.39814758300781, "global_step": 254260, "epoch": 2101} {"train_loss": -41.69300842285156, "global_step": 254261, "epoch": 2101} {"train_loss": -43.356719970703125, "global_step": 254262, "epoch": 2101} {"train_loss": -42.74404525756836, "global_step": 254263, "epoch": 2101} {"train_loss": -43.163299560546875, "global_step": 254264, "epoch": 2101} {"train_loss": -41.877593994140625, "global_step": 254265, "epoch": 2101} {"train_loss": -42.344181060791016, "global_step": 254266, "epoch": 2101} {"train_loss": -43.128501892089844, "global_step": 254267, "epoch": 2101} {"train_loss": -42.64995193481445, "global_step": 254268, "epoch": 2101} {"train_loss": -36.1197395324707, "global_step": 254269, "epoch": 2101} {"train_loss": -34.44575881958008, "global_step": 254270, "epoch": 2101} {"train_loss": -40.38611602783203, "global_step": 254271, "epoch": 2101} {"train_loss": -41.7026481628418, "global_step": 254272, "epoch": 2101} {"train_loss": -41.928070068359375, "global_step": 254273, "epoch": 2101} {"train_loss": -41.0141716003418, "global_step": 254274, "epoch": 2101} {"train_loss": -41.23622131347656, "global_step": 254275, "epoch": 2101} {"train_loss": -41.23215866088867, "global_step": 254276, "epoch": 2101} {"train_loss": -39.999000549316406, "global_step": 254277, "epoch": 2101} {"train_loss": -41.75689697265625, "global_step": 254278, "epoch": 2101} {"train_loss": -41.09092712402344, "global_step": 254279, "epoch": 2101} {"train_loss": -40.19882583618164, "global_step": 254280, "epoch": 2101} {"train_loss": -40.30819320678711, "global_step": 254281, "epoch": 2101} {"train_loss": -41.5986213684082, "global_step": 254282, "epoch": 2101} {"train_loss": -39.95847702026367, "global_step": 254283, "epoch": 2101} {"train_loss": -41.4881591796875, "global_step": 254284, "epoch": 2101} {"train_loss": -41.438289642333984, "global_step": 254285, "epoch": 2101} {"train_loss": -41.265621185302734, "global_step": 254286, "epoch": 2101} {"train_loss": -41.46498489379883, "global_step": 254287, "epoch": 2101} {"train_loss": -41.3255500793457, "global_step": 254288, "epoch": 2101} {"train_loss": -40.06453323364258, "global_step": 254289, "epoch": 2101} {"train_loss": -41.526187896728516, "global_step": 254290, "epoch": 2101} {"train_loss": -41.60102462768555, "global_step": 254291, "epoch": 2101} {"train_loss": -41.754913330078125, "global_step": 254292, "epoch": 2101} {"train_loss": -41.888816833496094, "global_step": 254293, "epoch": 2101} {"train_loss": -41.64259338378906, "global_step": 254294, "epoch": 2101} {"train_loss": -42.96379470825195, "global_step": 254295, "epoch": 2101} {"train_loss": -42.067691802978516, "global_step": 254296, "epoch": 2101} {"train_loss": -43.01749801635742, "global_step": 254297, "epoch": 2101} {"train_loss": -42.26288986206055, "global_step": 254298, "epoch": 2101} {"train_loss": -42.317840576171875, "global_step": 254299, "epoch": 2101} {"train_loss": -42.750099182128906, "global_step": 254300, "epoch": 2101} {"train_loss": -41.810874938964844, "global_step": 254301, "epoch": 2101} {"train_loss": -42.69930648803711, "global_step": 254302, "epoch": 2101} {"train_loss": -42.454017639160156, "global_step": 254303, "epoch": 2101} {"train_loss": -42.29465866088867, "global_step": 254304, "epoch": 2101} {"train_loss": -42.104949951171875, "global_step": 254305, "epoch": 2101} {"train_loss": -42.7337646484375, "global_step": 254306, "epoch": 2101} {"train_loss": -42.158321380615234, "global_step": 254307, "epoch": 2101} {"train_loss": -42.869873046875, "global_step": 254308, "epoch": 2101} {"train_loss": -42.908267974853516, "global_step": 254309, "epoch": 2101} {"train_loss": -42.71160125732422, "global_step": 254310, "epoch": 2101} {"train_loss": -43.43048858642578, "global_step": 254311, "epoch": 2101} {"train_loss": -43.25527572631836, "global_step": 254312, "epoch": 2101} {"train_loss": -43.13768768310547, "global_step": 254313, "epoch": 2101} {"train_loss": -43.16510009765625, "global_step": 254314, "epoch": 2101} {"train_loss": -43.157325744628906, "global_step": 254315, "epoch": 2101} {"train_loss": -42.90409851074219, "global_step": 254316, "epoch": 2101} {"train_loss": -43.70465850830078, "global_step": 254317, "epoch": 2101} {"train_loss": -43.10079574584961, "global_step": 254318, "epoch": 2101} {"train_loss": -42.87630081176758, "global_step": 254319, "epoch": 2101} {"train_loss": -43.25750732421875, "global_step": 254320, "epoch": 2101} {"train_loss": -42.76758575439453, "global_step": 254321, "epoch": 2101} {"train_loss": -43.652069091796875, "global_step": 254322, "epoch": 2101} {"train_loss": -42.79877853393555, "global_step": 254323, "epoch": 2101} {"train_loss": -43.30775833129883, "global_step": 254324, "epoch": 2101} {"train_loss": -43.07857131958008, "global_step": 254325, "epoch": 2101} {"train_loss": -43.51810836791992, "global_step": 254326, "epoch": 2101} {"train_loss": -44.02590560913086, "global_step": 254327, "epoch": 2101} {"train_loss": -43.8363151550293, "global_step": 254328, "epoch": 2101} {"train_loss": -43.64628219604492, "global_step": 254329, "epoch": 2101} {"train_loss": -43.494197845458984, "global_step": 254330, "epoch": 2101} {"train_loss": -43.53632736206055, "global_step": 254331, "epoch": 2101} {"train_loss": -43.87324142456055, "global_step": 254332, "epoch": 2101} {"train_loss": -44.2662239074707, "global_step": 254333, "epoch": 2101} {"train_loss": -43.91093826293945, "global_step": 254334, "epoch": 2101} {"train_loss": -43.4415397644043, "global_step": 254335, "epoch": 2101} {"train_loss": -43.84735870361328, "global_step": 254336, "epoch": 2101} {"train_loss": -44.17380905151367, "global_step": 254337, "epoch": 2101} {"train_loss": -44.14724349975586, "global_step": 254338, "epoch": 2101} {"train_loss": -43.595699310302734, "global_step": 254339, "epoch": 2101} {"train_loss": -43.76251220703125, "global_step": 254340, "epoch": 2101} {"train_loss": -42.71344438663199, "global_step": 254341, "epoch": 2101, "val_loss": 2672084.25} {"train_loss": -43.96379470825195, "global_step": 254342, "epoch": 2102} {"train_loss": -44.02689743041992, "global_step": 254343, "epoch": 2102} {"train_loss": -44.0166130065918, "global_step": 254344, "epoch": 2102} {"train_loss": -43.635047912597656, "global_step": 254345, "epoch": 2102} {"train_loss": -43.601680755615234, "global_step": 254346, "epoch": 2102} {"train_loss": -44.10621643066406, "global_step": 254347, "epoch": 2102} {"train_loss": -43.815738677978516, "global_step": 254348, "epoch": 2102} {"train_loss": -44.46004867553711, "global_step": 254349, "epoch": 2102} {"train_loss": -44.29054641723633, "global_step": 254350, "epoch": 2102} {"train_loss": -43.70304489135742, "global_step": 254351, "epoch": 2102} {"train_loss": -43.9532356262207, "global_step": 254352, "epoch": 2102} {"train_loss": -43.37141036987305, "global_step": 254353, "epoch": 2102} {"train_loss": -44.21626663208008, "global_step": 254354, "epoch": 2102} {"train_loss": -44.39480209350586, "global_step": 254355, "epoch": 2102} {"train_loss": -42.412071228027344, "global_step": 254356, "epoch": 2102} {"train_loss": -40.80367660522461, "global_step": 254357, "epoch": 2102} {"train_loss": -41.87504196166992, "global_step": 254358, "epoch": 2102} {"train_loss": -43.77044677734375, "global_step": 254359, "epoch": 2102} {"train_loss": -43.14121627807617, "global_step": 254360, "epoch": 2102} {"train_loss": -40.06303024291992, "global_step": 254361, "epoch": 2102} {"train_loss": -39.5687255859375, "global_step": 254362, "epoch": 2102} {"train_loss": -40.85995864868164, "global_step": 254363, "epoch": 2102} {"train_loss": -43.0988883972168, "global_step": 254364, "epoch": 2102} {"train_loss": -41.744136810302734, "global_step": 254365, "epoch": 2102} {"train_loss": -42.36732864379883, "global_step": 254366, "epoch": 2102} {"train_loss": -42.842891693115234, "global_step": 254367, "epoch": 2102} {"train_loss": -42.88258743286133, "global_step": 254368, "epoch": 2102} {"train_loss": -43.00757598876953, "global_step": 254369, "epoch": 2102} {"train_loss": -41.07176971435547, "global_step": 254370, "epoch": 2102} {"train_loss": -43.001556396484375, "global_step": 254371, "epoch": 2102} {"train_loss": -43.7866096496582, "global_step": 254372, "epoch": 2102} {"train_loss": -42.63896560668945, "global_step": 254373, "epoch": 2102} {"train_loss": -42.54547882080078, "global_step": 254374, "epoch": 2102} {"train_loss": -42.98519515991211, "global_step": 254375, "epoch": 2102} {"train_loss": -43.3279914855957, "global_step": 254376, "epoch": 2102} {"train_loss": -43.16398239135742, "global_step": 254377, "epoch": 2102} {"train_loss": -43.88320541381836, "global_step": 254378, "epoch": 2102} {"train_loss": -43.342472076416016, "global_step": 254379, "epoch": 2102} {"train_loss": -43.11599349975586, "global_step": 254380, "epoch": 2102} {"train_loss": -43.4606819152832, "global_step": 254381, "epoch": 2102} {"train_loss": -43.77912902832031, "global_step": 254382, "epoch": 2102} {"train_loss": -42.83234786987305, "global_step": 254383, "epoch": 2102} {"train_loss": -43.39854049682617, "global_step": 254384, "epoch": 2102} {"train_loss": -43.721717834472656, "global_step": 254385, "epoch": 2102} {"train_loss": -44.1026611328125, "global_step": 254386, "epoch": 2102} {"train_loss": -43.990787506103516, "global_step": 254387, "epoch": 2102} {"train_loss": -43.301368713378906, "global_step": 254388, "epoch": 2102} {"train_loss": -43.78926086425781, "global_step": 254389, "epoch": 2102} {"train_loss": -43.55778503417969, "global_step": 254390, "epoch": 2102} {"train_loss": -42.80677032470703, "global_step": 254391, "epoch": 2102} {"train_loss": -43.88505935668945, "global_step": 254392, "epoch": 2102} {"train_loss": -44.2074089050293, "global_step": 254393, "epoch": 2102} {"train_loss": -43.566219329833984, "global_step": 254394, "epoch": 2102} {"train_loss": -44.04319381713867, "global_step": 254395, "epoch": 2102} {"train_loss": -44.1147346496582, "global_step": 254396, "epoch": 2102} {"train_loss": -43.76019287109375, "global_step": 254397, "epoch": 2102} {"train_loss": -44.41542434692383, "global_step": 254398, "epoch": 2102} {"train_loss": -44.05697250366211, "global_step": 254399, "epoch": 2102} {"train_loss": -43.62160873413086, "global_step": 254400, "epoch": 2102} {"train_loss": -41.914913177490234, "global_step": 254401, "epoch": 2102} {"train_loss": -43.61945724487305, "global_step": 254402, "epoch": 2102} {"train_loss": -44.052818298339844, "global_step": 254403, "epoch": 2102} {"train_loss": -43.600074768066406, "global_step": 254404, "epoch": 2102} {"train_loss": -42.09339904785156, "global_step": 254405, "epoch": 2102} {"train_loss": -41.16390609741211, "global_step": 254406, "epoch": 2102} {"train_loss": -43.740089416503906, "global_step": 254407, "epoch": 2102} {"train_loss": -42.675350189208984, "global_step": 254408, "epoch": 2102} {"train_loss": -40.39268493652344, "global_step": 254409, "epoch": 2102} {"train_loss": -43.05617141723633, "global_step": 254410, "epoch": 2102} {"train_loss": -43.05448913574219, "global_step": 254411, "epoch": 2102} {"train_loss": -41.63674545288086, "global_step": 254412, "epoch": 2102} {"train_loss": -42.64180374145508, "global_step": 254413, "epoch": 2102} {"train_loss": -42.1049919128418, "global_step": 254414, "epoch": 2102} {"train_loss": -42.71586608886719, "global_step": 254415, "epoch": 2102} {"train_loss": -42.533058166503906, "global_step": 254416, "epoch": 2102} {"train_loss": -43.231746673583984, "global_step": 254417, "epoch": 2102} {"train_loss": -42.77225875854492, "global_step": 254418, "epoch": 2102} {"train_loss": -42.732574462890625, "global_step": 254419, "epoch": 2102} {"train_loss": -42.79266357421875, "global_step": 254420, "epoch": 2102} {"train_loss": -41.050594329833984, "global_step": 254421, "epoch": 2102} {"train_loss": -41.40199661254883, "global_step": 254422, "epoch": 2102} {"train_loss": -42.17017364501953, "global_step": 254423, "epoch": 2102} {"train_loss": -43.11179733276367, "global_step": 254424, "epoch": 2102} {"train_loss": -41.63339614868164, "global_step": 254425, "epoch": 2102} {"train_loss": -41.92240524291992, "global_step": 254426, "epoch": 2102} {"train_loss": -42.75205993652344, "global_step": 254427, "epoch": 2102} {"train_loss": -41.78188705444336, "global_step": 254428, "epoch": 2102} {"train_loss": -41.511932373046875, "global_step": 254429, "epoch": 2102} {"train_loss": -40.64150619506836, "global_step": 254430, "epoch": 2102} {"train_loss": -40.682960510253906, "global_step": 254431, "epoch": 2102} {"train_loss": -43.14873123168945, "global_step": 254432, "epoch": 2102} {"train_loss": -40.305667877197266, "global_step": 254433, "epoch": 2102} {"train_loss": -38.643436431884766, "global_step": 254434, "epoch": 2102} {"train_loss": -42.63865280151367, "global_step": 254435, "epoch": 2102} {"train_loss": -34.689659118652344, "global_step": 254436, "epoch": 2102} {"train_loss": -34.29171371459961, "global_step": 254437, "epoch": 2102} {"train_loss": -41.100006103515625, "global_step": 254438, "epoch": 2102} {"train_loss": -37.802398681640625, "global_step": 254439, "epoch": 2102} {"train_loss": -39.06492233276367, "global_step": 254440, "epoch": 2102} {"train_loss": -37.72389602661133, "global_step": 254441, "epoch": 2102} {"train_loss": -40.33915328979492, "global_step": 254442, "epoch": 2102} {"train_loss": -39.80419158935547, "global_step": 254443, "epoch": 2102} {"train_loss": -39.56895065307617, "global_step": 254444, "epoch": 2102} {"train_loss": -40.83633804321289, "global_step": 254445, "epoch": 2102} {"train_loss": -39.24201583862305, "global_step": 254446, "epoch": 2102} {"train_loss": -37.03750228881836, "global_step": 254447, "epoch": 2102} {"train_loss": -39.54098129272461, "global_step": 254448, "epoch": 2102} {"train_loss": -40.196197509765625, "global_step": 254449, "epoch": 2102} {"train_loss": -40.674072265625, "global_step": 254450, "epoch": 2102} {"train_loss": -40.52405548095703, "global_step": 254451, "epoch": 2102} {"train_loss": -39.56167221069336, "global_step": 254452, "epoch": 2102} {"train_loss": -41.51680374145508, "global_step": 254453, "epoch": 2102} {"train_loss": -39.491634368896484, "global_step": 254454, "epoch": 2102} {"train_loss": -41.69282913208008, "global_step": 254455, "epoch": 2102} {"train_loss": -39.66091537475586, "global_step": 254456, "epoch": 2102} {"train_loss": -41.20000076293945, "global_step": 254457, "epoch": 2102} {"train_loss": -39.71105194091797, "global_step": 254458, "epoch": 2102} {"train_loss": -41.62775802612305, "global_step": 254459, "epoch": 2102} {"train_loss": -39.97123336791992, "global_step": 254460, "epoch": 2102} {"train_loss": -41.406063079833984, "global_step": 254461, "epoch": 2102} {"train_loss": -42.12046069941245, "global_step": 254462, "epoch": 2102, "val_loss": 2575669.0} {"train_loss": -41.64541244506836, "global_step": 254463, "epoch": 2103} {"train_loss": -41.222206115722656, "global_step": 254464, "epoch": 2103} {"train_loss": -42.37849044799805, "global_step": 254465, "epoch": 2103} {"train_loss": -41.17782211303711, "global_step": 254466, "epoch": 2103} {"train_loss": -42.18484878540039, "global_step": 254467, "epoch": 2103} {"train_loss": -42.33285140991211, "global_step": 254468, "epoch": 2103} {"train_loss": -42.18185043334961, "global_step": 254469, "epoch": 2103} {"train_loss": -42.00938034057617, "global_step": 254470, "epoch": 2103} {"train_loss": -42.06059646606445, "global_step": 254471, "epoch": 2103} {"train_loss": -42.0091667175293, "global_step": 254472, "epoch": 2103} {"train_loss": -42.66814422607422, "global_step": 254473, "epoch": 2103} {"train_loss": -42.25301742553711, "global_step": 254474, "epoch": 2103} {"train_loss": -43.099761962890625, "global_step": 254475, "epoch": 2103} {"train_loss": -42.763912200927734, "global_step": 254476, "epoch": 2103} {"train_loss": -42.088478088378906, "global_step": 254477, "epoch": 2103} {"train_loss": -43.011287689208984, "global_step": 254478, "epoch": 2103} {"train_loss": -43.15224075317383, "global_step": 254479, "epoch": 2103} {"train_loss": -42.65774154663086, "global_step": 254480, "epoch": 2103} {"train_loss": -43.08437728881836, "global_step": 254481, "epoch": 2103} {"train_loss": -43.10064697265625, "global_step": 254482, "epoch": 2103} {"train_loss": -42.88340377807617, "global_step": 254483, "epoch": 2103} {"train_loss": -43.57640838623047, "global_step": 254484, "epoch": 2103} {"train_loss": -43.07941436767578, "global_step": 254485, "epoch": 2103} {"train_loss": -43.96455001831055, "global_step": 254486, "epoch": 2103} {"train_loss": -43.04437255859375, "global_step": 254487, "epoch": 2103} {"train_loss": -43.222328186035156, "global_step": 254488, "epoch": 2103} {"train_loss": -43.74142074584961, "global_step": 254489, "epoch": 2103} {"train_loss": -43.36906814575195, "global_step": 254490, "epoch": 2103} {"train_loss": -43.326053619384766, "global_step": 254491, "epoch": 2103} {"train_loss": -43.99105453491211, "global_step": 254492, "epoch": 2103} {"train_loss": -43.41109848022461, "global_step": 254493, "epoch": 2103} {"train_loss": -43.96002197265625, "global_step": 254494, "epoch": 2103} {"train_loss": -43.628509521484375, "global_step": 254495, "epoch": 2103} {"train_loss": -43.58953857421875, "global_step": 254496, "epoch": 2103} {"train_loss": -43.700496673583984, "global_step": 254497, "epoch": 2103} {"train_loss": -43.740875244140625, "global_step": 254498, "epoch": 2103} {"train_loss": -43.19071578979492, "global_step": 254499, "epoch": 2103} {"train_loss": -43.78959274291992, "global_step": 254500, "epoch": 2103} {"train_loss": -43.682640075683594, "global_step": 254501, "epoch": 2103} {"train_loss": -43.63356399536133, "global_step": 254502, "epoch": 2103} {"train_loss": -43.82426834106445, "global_step": 254503, "epoch": 2103} {"train_loss": -43.549129486083984, "global_step": 254504, "epoch": 2103} {"train_loss": -43.75094223022461, "global_step": 254505, "epoch": 2103} {"train_loss": -43.79647445678711, "global_step": 254506, "epoch": 2103} {"train_loss": -43.82548904418945, "global_step": 254507, "epoch": 2103} {"train_loss": -43.97166061401367, "global_step": 254508, "epoch": 2103} {"train_loss": -43.981197357177734, "global_step": 254509, "epoch": 2103} {"train_loss": -43.930572509765625, "global_step": 254510, "epoch": 2103} {"train_loss": -44.001625061035156, "global_step": 254511, "epoch": 2103} {"train_loss": -44.17190933227539, "global_step": 254512, "epoch": 2103} {"train_loss": -44.0273551940918, "global_step": 254513, "epoch": 2103} {"train_loss": -44.05543899536133, "global_step": 254514, "epoch": 2103} {"train_loss": -44.757686614990234, "global_step": 254515, "epoch": 2103} {"train_loss": -43.87126922607422, "global_step": 254516, "epoch": 2103} {"train_loss": -43.49543380737305, "global_step": 254517, "epoch": 2103} {"train_loss": -43.798377990722656, "global_step": 254518, "epoch": 2103} {"train_loss": -44.466339111328125, "global_step": 254519, "epoch": 2103} {"train_loss": -43.656246185302734, "global_step": 254520, "epoch": 2103} {"train_loss": -44.02373123168945, "global_step": 254521, "epoch": 2103} {"train_loss": -44.32632064819336, "global_step": 254522, "epoch": 2103} {"train_loss": -43.932838439941406, "global_step": 254523, "epoch": 2103} {"train_loss": -44.173397064208984, "global_step": 254524, "epoch": 2103} {"train_loss": -44.3010139465332, "global_step": 254525, "epoch": 2103} {"train_loss": -43.97883987426758, "global_step": 254526, "epoch": 2103} {"train_loss": -43.72654342651367, "global_step": 254527, "epoch": 2103} {"train_loss": -43.98777389526367, "global_step": 254528, "epoch": 2103} {"train_loss": -44.192665100097656, "global_step": 254529, "epoch": 2103} {"train_loss": -44.63774490356445, "global_step": 254530, "epoch": 2103} {"train_loss": -44.36863327026367, "global_step": 254531, "epoch": 2103} {"train_loss": -44.28133773803711, "global_step": 254532, "epoch": 2103} {"train_loss": -44.424068450927734, "global_step": 254533, "epoch": 2103} {"train_loss": -44.263187408447266, "global_step": 254534, "epoch": 2103} {"train_loss": -44.1894416809082, "global_step": 254535, "epoch": 2103} {"train_loss": -44.23810958862305, "global_step": 254536, "epoch": 2103} {"train_loss": -44.368934631347656, "global_step": 254537, "epoch": 2103} {"train_loss": -44.754310607910156, "global_step": 254538, "epoch": 2103} {"train_loss": -44.63900375366211, "global_step": 254539, "epoch": 2103} {"train_loss": -44.410499572753906, "global_step": 254540, "epoch": 2103} {"train_loss": -44.7204704284668, "global_step": 254541, "epoch": 2103} {"train_loss": -44.71460723876953, "global_step": 254542, "epoch": 2103} {"train_loss": -44.78833770751953, "global_step": 254543, "epoch": 2103} {"train_loss": -44.18550109863281, "global_step": 254544, "epoch": 2103} {"train_loss": -44.68572998046875, "global_step": 254545, "epoch": 2103} {"train_loss": -44.751277923583984, "global_step": 254546, "epoch": 2103} {"train_loss": -43.88832092285156, "global_step": 254547, "epoch": 2103} {"train_loss": -44.369537353515625, "global_step": 254548, "epoch": 2103} {"train_loss": -44.38350296020508, "global_step": 254549, "epoch": 2103} {"train_loss": -44.50025177001953, "global_step": 254550, "epoch": 2103} {"train_loss": -43.83541488647461, "global_step": 254551, "epoch": 2103} {"train_loss": -44.278076171875, "global_step": 254552, "epoch": 2103} {"train_loss": -44.13100814819336, "global_step": 254553, "epoch": 2103} {"train_loss": -43.46035385131836, "global_step": 254554, "epoch": 2103} {"train_loss": -43.782989501953125, "global_step": 254555, "epoch": 2103} {"train_loss": -43.72338104248047, "global_step": 254556, "epoch": 2103} {"train_loss": -43.463497161865234, "global_step": 254557, "epoch": 2103} {"train_loss": -42.71194076538086, "global_step": 254558, "epoch": 2103} {"train_loss": -40.602447509765625, "global_step": 254559, "epoch": 2103} {"train_loss": -38.55995178222656, "global_step": 254560, "epoch": 2103} {"train_loss": -40.856361389160156, "global_step": 254561, "epoch": 2103} {"train_loss": -42.6114387512207, "global_step": 254562, "epoch": 2103} {"train_loss": -42.82755661010742, "global_step": 254563, "epoch": 2103} {"train_loss": -42.106563568115234, "global_step": 254564, "epoch": 2103} {"train_loss": -43.60393524169922, "global_step": 254565, "epoch": 2103} {"train_loss": -43.23678970336914, "global_step": 254566, "epoch": 2103} {"train_loss": -42.3586311340332, "global_step": 254567, "epoch": 2103} {"train_loss": -38.80050277709961, "global_step": 254568, "epoch": 2103} {"train_loss": -35.66340255737305, "global_step": 254569, "epoch": 2103} {"train_loss": -39.08945083618164, "global_step": 254570, "epoch": 2103} {"train_loss": -42.74503707885742, "global_step": 254571, "epoch": 2103} {"train_loss": -38.440956115722656, "global_step": 254572, "epoch": 2103} {"train_loss": -42.33872604370117, "global_step": 254573, "epoch": 2103} {"train_loss": -37.56853485107422, "global_step": 254574, "epoch": 2103} {"train_loss": -37.58430480957031, "global_step": 254575, "epoch": 2103} {"train_loss": -41.90761184692383, "global_step": 254576, "epoch": 2103} {"train_loss": -36.87594223022461, "global_step": 254577, "epoch": 2103} {"train_loss": -38.3014030456543, "global_step": 254578, "epoch": 2103} {"train_loss": -42.6191520690918, "global_step": 254579, "epoch": 2103} {"train_loss": -38.966346740722656, "global_step": 254580, "epoch": 2103} {"train_loss": -40.61286163330078, "global_step": 254581, "epoch": 2103} {"train_loss": -41.6160888671875, "global_step": 254582, "epoch": 2103} {"train_loss": -42.943996366390515, "global_step": 254583, "epoch": 2103, "val_loss": 2597895.5} {"train_loss": -40.2676887512207, "global_step": 254584, "epoch": 2104} {"train_loss": -42.35589599609375, "global_step": 254585, "epoch": 2104} {"train_loss": -41.92774200439453, "global_step": 254586, "epoch": 2104} {"train_loss": -41.36961364746094, "global_step": 254587, "epoch": 2104} {"train_loss": -41.56003952026367, "global_step": 254588, "epoch": 2104} {"train_loss": -42.6534538269043, "global_step": 254589, "epoch": 2104} {"train_loss": -40.70438766479492, "global_step": 254590, "epoch": 2104} {"train_loss": -42.32453155517578, "global_step": 254591, "epoch": 2104} {"train_loss": -41.6331787109375, "global_step": 254592, "epoch": 2104} {"train_loss": -42.88790512084961, "global_step": 254593, "epoch": 2104} {"train_loss": -42.358551025390625, "global_step": 254594, "epoch": 2104} {"train_loss": -42.1910400390625, "global_step": 254595, "epoch": 2104} {"train_loss": -42.60828399658203, "global_step": 254596, "epoch": 2104} {"train_loss": -42.54096603393555, "global_step": 254597, "epoch": 2104} {"train_loss": -42.38724136352539, "global_step": 254598, "epoch": 2104} {"train_loss": -42.9244270324707, "global_step": 254599, "epoch": 2104} {"train_loss": -43.3140754699707, "global_step": 254600, "epoch": 2104} {"train_loss": -42.90410614013672, "global_step": 254601, "epoch": 2104} {"train_loss": -43.08187484741211, "global_step": 254602, "epoch": 2104} {"train_loss": -42.96662139892578, "global_step": 254603, "epoch": 2104} {"train_loss": -43.166748046875, "global_step": 254604, "epoch": 2104} {"train_loss": -43.55982208251953, "global_step": 254605, "epoch": 2104} {"train_loss": -42.94710922241211, "global_step": 254606, "epoch": 2104} {"train_loss": -43.3179931640625, "global_step": 254607, "epoch": 2104} {"train_loss": -42.97930908203125, "global_step": 254608, "epoch": 2104} {"train_loss": -43.315895080566406, "global_step": 254609, "epoch": 2104} {"train_loss": -43.25275421142578, "global_step": 254610, "epoch": 2104} {"train_loss": -43.30406951904297, "global_step": 254611, "epoch": 2104} {"train_loss": -42.83852767944336, "global_step": 254612, "epoch": 2104} {"train_loss": -43.34046173095703, "global_step": 254613, "epoch": 2104} {"train_loss": -43.3294792175293, "global_step": 254614, "epoch": 2104} {"train_loss": -43.01373291015625, "global_step": 254615, "epoch": 2104} {"train_loss": -42.9953727722168, "global_step": 254616, "epoch": 2104} {"train_loss": -43.43213653564453, "global_step": 254617, "epoch": 2104} {"train_loss": -43.6121940612793, "global_step": 254618, "epoch": 2104} {"train_loss": -43.776817321777344, "global_step": 254619, "epoch": 2104} {"train_loss": -43.53115463256836, "global_step": 254620, "epoch": 2104} {"train_loss": -44.1314811706543, "global_step": 254621, "epoch": 2104} {"train_loss": -43.627132415771484, "global_step": 254622, "epoch": 2104} {"train_loss": -43.990230560302734, "global_step": 254623, "epoch": 2104} {"train_loss": -44.0928840637207, "global_step": 254624, "epoch": 2104} {"train_loss": -43.726104736328125, "global_step": 254625, "epoch": 2104} {"train_loss": -43.37226867675781, "global_step": 254626, "epoch": 2104} {"train_loss": -43.75474548339844, "global_step": 254627, "epoch": 2104} {"train_loss": -43.88265609741211, "global_step": 254628, "epoch": 2104} {"train_loss": -43.5922966003418, "global_step": 254629, "epoch": 2104} {"train_loss": -44.1454963684082, "global_step": 254630, "epoch": 2104} {"train_loss": -44.09818649291992, "global_step": 254631, "epoch": 2104} {"train_loss": -43.62171173095703, "global_step": 254632, "epoch": 2104} {"train_loss": -44.06983184814453, "global_step": 254633, "epoch": 2104} {"train_loss": -44.2281494140625, "global_step": 254634, "epoch": 2104} {"train_loss": -43.564327239990234, "global_step": 254635, "epoch": 2104} {"train_loss": -43.85044860839844, "global_step": 254636, "epoch": 2104} {"train_loss": -44.2824592590332, "global_step": 254637, "epoch": 2104} {"train_loss": -43.86100387573242, "global_step": 254638, "epoch": 2104} {"train_loss": -44.02302932739258, "global_step": 254639, "epoch": 2104} {"train_loss": -44.52384567260742, "global_step": 254640, "epoch": 2104} {"train_loss": -44.187835693359375, "global_step": 254641, "epoch": 2104} {"train_loss": -44.09662628173828, "global_step": 254642, "epoch": 2104} {"train_loss": -44.229610443115234, "global_step": 254643, "epoch": 2104} {"train_loss": -44.382347106933594, "global_step": 254644, "epoch": 2104} {"train_loss": -43.469482421875, "global_step": 254645, "epoch": 2104} {"train_loss": -43.388851165771484, "global_step": 254646, "epoch": 2104} {"train_loss": -44.4107780456543, "global_step": 254647, "epoch": 2104} {"train_loss": -43.620758056640625, "global_step": 254648, "epoch": 2104} {"train_loss": -43.716609954833984, "global_step": 254649, "epoch": 2104} {"train_loss": -43.24602508544922, "global_step": 254650, "epoch": 2104} {"train_loss": -42.15242385864258, "global_step": 254651, "epoch": 2104} {"train_loss": -42.40224838256836, "global_step": 254652, "epoch": 2104} {"train_loss": -43.49589920043945, "global_step": 254653, "epoch": 2104} {"train_loss": -43.18471145629883, "global_step": 254654, "epoch": 2104} {"train_loss": -43.252296447753906, "global_step": 254655, "epoch": 2104} {"train_loss": -43.74822998046875, "global_step": 254656, "epoch": 2104} {"train_loss": -43.37917709350586, "global_step": 254657, "epoch": 2104} {"train_loss": -42.67013168334961, "global_step": 254658, "epoch": 2104} {"train_loss": -44.175594329833984, "global_step": 254659, "epoch": 2104} {"train_loss": -43.73106384277344, "global_step": 254660, "epoch": 2104} {"train_loss": -43.02877426147461, "global_step": 254661, "epoch": 2104} {"train_loss": -43.21842575073242, "global_step": 254662, "epoch": 2104} {"train_loss": -44.055850982666016, "global_step": 254663, "epoch": 2104} {"train_loss": -42.80507278442383, "global_step": 254664, "epoch": 2104} {"train_loss": -41.5674934387207, "global_step": 254665, "epoch": 2104} {"train_loss": -43.26424789428711, "global_step": 254666, "epoch": 2104} {"train_loss": -43.07697677612305, "global_step": 254667, "epoch": 2104} {"train_loss": -42.31386947631836, "global_step": 254668, "epoch": 2104} {"train_loss": -40.87092208862305, "global_step": 254669, "epoch": 2104} {"train_loss": -40.45772171020508, "global_step": 254670, "epoch": 2104} {"train_loss": -41.88296127319336, "global_step": 254671, "epoch": 2104} {"train_loss": -42.642276763916016, "global_step": 254672, "epoch": 2104} {"train_loss": -43.02400207519531, "global_step": 254673, "epoch": 2104} {"train_loss": -40.42192459106445, "global_step": 254674, "epoch": 2104} {"train_loss": -38.38136672973633, "global_step": 254675, "epoch": 2104} {"train_loss": -42.84080505371094, "global_step": 254676, "epoch": 2104} {"train_loss": -42.325862884521484, "global_step": 254677, "epoch": 2104} {"train_loss": -36.95935821533203, "global_step": 254678, "epoch": 2104} {"train_loss": -34.56381607055664, "global_step": 254679, "epoch": 2104} {"train_loss": -39.886322021484375, "global_step": 254680, "epoch": 2104} {"train_loss": -40.623199462890625, "global_step": 254681, "epoch": 2104} {"train_loss": -38.24296951293945, "global_step": 254682, "epoch": 2104} {"train_loss": -35.33042526245117, "global_step": 254683, "epoch": 2104} {"train_loss": -40.586509704589844, "global_step": 254684, "epoch": 2104} {"train_loss": -37.69468307495117, "global_step": 254685, "epoch": 2104} {"train_loss": -37.8992805480957, "global_step": 254686, "epoch": 2104} {"train_loss": -39.29512405395508, "global_step": 254687, "epoch": 2104} {"train_loss": -37.69953536987305, "global_step": 254688, "epoch": 2104} {"train_loss": -39.004920959472656, "global_step": 254689, "epoch": 2104} {"train_loss": -39.88816452026367, "global_step": 254690, "epoch": 2104} {"train_loss": -37.8797607421875, "global_step": 254691, "epoch": 2104} {"train_loss": -38.48613739013672, "global_step": 254692, "epoch": 2104} {"train_loss": -39.74052047729492, "global_step": 254693, "epoch": 2104} {"train_loss": -38.74361801147461, "global_step": 254694, "epoch": 2104} {"train_loss": -40.57857894897461, "global_step": 254695, "epoch": 2104} {"train_loss": -39.44260787963867, "global_step": 254696, "epoch": 2104} {"train_loss": -40.15869140625, "global_step": 254697, "epoch": 2104} {"train_loss": -40.1965217590332, "global_step": 254698, "epoch": 2104} {"train_loss": -40.218685150146484, "global_step": 254699, "epoch": 2104} {"train_loss": -40.63007736206055, "global_step": 254700, "epoch": 2104} {"train_loss": -40.64374542236328, "global_step": 254701, "epoch": 2104} {"train_loss": -40.939212799072266, "global_step": 254702, "epoch": 2104} {"train_loss": -42.0551872253418, "global_step": 254703, "epoch": 2104} {"train_loss": -42.18803910184498, "global_step": 254704, "epoch": 2104, "val_loss": 2616092.25} {"train_loss": -40.97233200073242, "global_step": 254705, "epoch": 2105} {"train_loss": -40.63492202758789, "global_step": 254706, "epoch": 2105} {"train_loss": -41.45522689819336, "global_step": 254707, "epoch": 2105} {"train_loss": -41.46401596069336, "global_step": 254708, "epoch": 2105} {"train_loss": -41.80399703979492, "global_step": 254709, "epoch": 2105} {"train_loss": -41.29052734375, "global_step": 254710, "epoch": 2105} {"train_loss": -42.00223922729492, "global_step": 254711, "epoch": 2105} {"train_loss": -41.37336349487305, "global_step": 254712, "epoch": 2105} {"train_loss": -42.41103744506836, "global_step": 254713, "epoch": 2105} {"train_loss": -42.16447067260742, "global_step": 254714, "epoch": 2105} {"train_loss": -42.280975341796875, "global_step": 254715, "epoch": 2105} {"train_loss": -42.12874984741211, "global_step": 254716, "epoch": 2105} {"train_loss": -42.564056396484375, "global_step": 254717, "epoch": 2105} {"train_loss": -42.68345260620117, "global_step": 254718, "epoch": 2105} {"train_loss": -42.75261306762695, "global_step": 254719, "epoch": 2105} {"train_loss": -42.86619186401367, "global_step": 254720, "epoch": 2105} {"train_loss": -42.52002716064453, "global_step": 254721, "epoch": 2105} {"train_loss": -43.193111419677734, "global_step": 254722, "epoch": 2105} {"train_loss": -42.589942932128906, "global_step": 254723, "epoch": 2105} {"train_loss": -42.833988189697266, "global_step": 254724, "epoch": 2105} {"train_loss": -43.11815643310547, "global_step": 254725, "epoch": 2105} {"train_loss": -42.64125442504883, "global_step": 254726, "epoch": 2105} {"train_loss": -42.99137878417969, "global_step": 254727, "epoch": 2105} {"train_loss": -43.30097961425781, "global_step": 254728, "epoch": 2105} {"train_loss": -43.39925765991211, "global_step": 254729, "epoch": 2105} {"train_loss": -43.151214599609375, "global_step": 254730, "epoch": 2105} {"train_loss": -42.946102142333984, "global_step": 254731, "epoch": 2105} {"train_loss": -43.50604248046875, "global_step": 254732, "epoch": 2105} {"train_loss": -42.903316497802734, "global_step": 254733, "epoch": 2105} {"train_loss": -43.551849365234375, "global_step": 254734, "epoch": 2105} {"train_loss": -43.57539749145508, "global_step": 254735, "epoch": 2105} {"train_loss": -43.595741271972656, "global_step": 254736, "epoch": 2105} {"train_loss": -43.50300979614258, "global_step": 254737, "epoch": 2105} {"train_loss": -43.702571868896484, "global_step": 254738, "epoch": 2105} {"train_loss": -43.6135139465332, "global_step": 254739, "epoch": 2105} {"train_loss": -43.37166976928711, "global_step": 254740, "epoch": 2105} {"train_loss": -43.990692138671875, "global_step": 254741, "epoch": 2105} {"train_loss": -43.87913513183594, "global_step": 254742, "epoch": 2105} {"train_loss": -43.76096725463867, "global_step": 254743, "epoch": 2105} {"train_loss": -44.05388259887695, "global_step": 254744, "epoch": 2105} {"train_loss": -43.91929626464844, "global_step": 254745, "epoch": 2105} {"train_loss": -44.135833740234375, "global_step": 254746, "epoch": 2105} {"train_loss": -43.61283493041992, "global_step": 254747, "epoch": 2105} {"train_loss": -43.95243453979492, "global_step": 254748, "epoch": 2105} {"train_loss": -44.0926628112793, "global_step": 254749, "epoch": 2105} {"train_loss": -43.94281005859375, "global_step": 254750, "epoch": 2105} {"train_loss": -43.57633972167969, "global_step": 254751, "epoch": 2105} {"train_loss": -43.83827590942383, "global_step": 254752, "epoch": 2105} {"train_loss": -43.922122955322266, "global_step": 254753, "epoch": 2105} {"train_loss": -43.936763763427734, "global_step": 254754, "epoch": 2105} {"train_loss": -44.09990310668945, "global_step": 254755, "epoch": 2105} {"train_loss": -44.05011749267578, "global_step": 254756, "epoch": 2105} {"train_loss": -44.128902435302734, "global_step": 254757, "epoch": 2105} {"train_loss": -44.46006393432617, "global_step": 254758, "epoch": 2105} {"train_loss": -43.77118682861328, "global_step": 254759, "epoch": 2105} {"train_loss": -43.96293258666992, "global_step": 254760, "epoch": 2105} {"train_loss": -43.97573471069336, "global_step": 254761, "epoch": 2105} {"train_loss": -44.4808464050293, "global_step": 254762, "epoch": 2105} {"train_loss": -44.393096923828125, "global_step": 254763, "epoch": 2105} {"train_loss": -44.22333526611328, "global_step": 254764, "epoch": 2105} {"train_loss": -44.22414779663086, "global_step": 254765, "epoch": 2105} {"train_loss": -44.34103775024414, "global_step": 254766, "epoch": 2105} {"train_loss": -44.474815368652344, "global_step": 254767, "epoch": 2105} {"train_loss": -44.2380256652832, "global_step": 254768, "epoch": 2105} {"train_loss": -43.8218879699707, "global_step": 254769, "epoch": 2105} {"train_loss": -43.834877014160156, "global_step": 254770, "epoch": 2105} {"train_loss": -44.62925338745117, "global_step": 254771, "epoch": 2105} {"train_loss": -44.285499572753906, "global_step": 254772, "epoch": 2105} {"train_loss": -44.52861785888672, "global_step": 254773, "epoch": 2105} {"train_loss": -44.33124923706055, "global_step": 254774, "epoch": 2105} {"train_loss": -44.464622497558594, "global_step": 254775, "epoch": 2105} {"train_loss": -44.4280891418457, "global_step": 254776, "epoch": 2105} {"train_loss": -44.5583381652832, "global_step": 254777, "epoch": 2105} {"train_loss": -44.321495056152344, "global_step": 254778, "epoch": 2105} {"train_loss": -44.52677536010742, "global_step": 254779, "epoch": 2105} {"train_loss": -44.824275970458984, "global_step": 254780, "epoch": 2105} {"train_loss": -44.3286018371582, "global_step": 254781, "epoch": 2105} {"train_loss": -44.56075668334961, "global_step": 254782, "epoch": 2105} {"train_loss": -44.38287353515625, "global_step": 254783, "epoch": 2105} {"train_loss": -44.4027214050293, "global_step": 254784, "epoch": 2105} {"train_loss": -44.56547927856445, "global_step": 254785, "epoch": 2105} {"train_loss": -44.605865478515625, "global_step": 254786, "epoch": 2105} {"train_loss": -44.12213897705078, "global_step": 254787, "epoch": 2105} {"train_loss": -44.24683380126953, "global_step": 254788, "epoch": 2105} {"train_loss": -43.678951263427734, "global_step": 254789, "epoch": 2105} {"train_loss": -42.68117904663086, "global_step": 254790, "epoch": 2105} {"train_loss": -41.97272491455078, "global_step": 254791, "epoch": 2105} {"train_loss": -42.83234405517578, "global_step": 254792, "epoch": 2105} {"train_loss": -43.34868240356445, "global_step": 254793, "epoch": 2105} {"train_loss": -41.63063049316406, "global_step": 254794, "epoch": 2105} {"train_loss": -38.8951530456543, "global_step": 254795, "epoch": 2105} {"train_loss": -38.03609848022461, "global_step": 254796, "epoch": 2105} {"train_loss": -42.35648727416992, "global_step": 254797, "epoch": 2105} {"train_loss": -32.441410064697266, "global_step": 254798, "epoch": 2105} {"train_loss": -33.77162551879883, "global_step": 254799, "epoch": 2105} {"train_loss": -19.515308380126953, "global_step": 254800, "epoch": 2105} {"train_loss": -15.712031364440918, "global_step": 254801, "epoch": 2105} {"train_loss": -24.348464965820312, "global_step": 254802, "epoch": 2105} {"train_loss": -17.2673397064209, "global_step": 254803, "epoch": 2105} {"train_loss": -28.74775505065918, "global_step": 254804, "epoch": 2105} {"train_loss": -27.483732223510742, "global_step": 254805, "epoch": 2105} {"train_loss": -21.63978385925293, "global_step": 254806, "epoch": 2105} {"train_loss": -27.476133346557617, "global_step": 254807, "epoch": 2105} {"train_loss": -32.62173843383789, "global_step": 254808, "epoch": 2105} {"train_loss": -25.95635986328125, "global_step": 254809, "epoch": 2105} {"train_loss": -27.755645751953125, "global_step": 254810, "epoch": 2105} {"train_loss": -33.122840881347656, "global_step": 254811, "epoch": 2105} {"train_loss": -32.14196014404297, "global_step": 254812, "epoch": 2105} {"train_loss": -31.355304718017578, "global_step": 254813, "epoch": 2105} {"train_loss": -31.23270034790039, "global_step": 254814, "epoch": 2105} {"train_loss": -33.64470291137695, "global_step": 254815, "epoch": 2105} {"train_loss": -33.90060043334961, "global_step": 254816, "epoch": 2105} {"train_loss": -33.08816146850586, "global_step": 254817, "epoch": 2105} {"train_loss": -34.12059783935547, "global_step": 254818, "epoch": 2105} {"train_loss": -33.87746810913086, "global_step": 254819, "epoch": 2105} {"train_loss": -35.733642578125, "global_step": 254820, "epoch": 2105} {"train_loss": -35.25934600830078, "global_step": 254821, "epoch": 2105} {"train_loss": -35.82755661010742, "global_step": 254822, "epoch": 2105} {"train_loss": -36.499656677246094, "global_step": 254823, "epoch": 2105} {"train_loss": -35.20232009887695, "global_step": 254824, "epoch": 2105} {"train_loss": -40.29883708638593, "global_step": 254825, "epoch": 2105, "val_loss": 2676126.5} {"train_loss": -37.96731185913086, "global_step": 254826, "epoch": 2106} {"train_loss": -37.040462493896484, "global_step": 254827, "epoch": 2106} {"train_loss": -37.9161376953125, "global_step": 254828, "epoch": 2106} {"train_loss": -37.56431198120117, "global_step": 254829, "epoch": 2106} {"train_loss": -37.81327438354492, "global_step": 254830, "epoch": 2106} {"train_loss": -38.2999382019043, "global_step": 254831, "epoch": 2106} {"train_loss": -37.01756286621094, "global_step": 254832, "epoch": 2106} {"train_loss": -37.63472366333008, "global_step": 254833, "epoch": 2106} {"train_loss": -38.34326934814453, "global_step": 254834, "epoch": 2106} {"train_loss": -38.84114456176758, "global_step": 254835, "epoch": 2106} {"train_loss": -37.47017288208008, "global_step": 254836, "epoch": 2106} {"train_loss": -39.408172607421875, "global_step": 254837, "epoch": 2106} {"train_loss": -39.34860610961914, "global_step": 254838, "epoch": 2106} {"train_loss": -38.8288688659668, "global_step": 254839, "epoch": 2106} {"train_loss": -38.88775634765625, "global_step": 254840, "epoch": 2106} {"train_loss": -39.52163314819336, "global_step": 254841, "epoch": 2106} {"train_loss": -39.15461730957031, "global_step": 254842, "epoch": 2106} {"train_loss": -39.6739501953125, "global_step": 254843, "epoch": 2106} {"train_loss": -40.26118087768555, "global_step": 254844, "epoch": 2106} {"train_loss": -40.60612869262695, "global_step": 254845, "epoch": 2106} {"train_loss": -39.91340255737305, "global_step": 254846, "epoch": 2106} {"train_loss": -40.157405853271484, "global_step": 254847, "epoch": 2106} {"train_loss": -40.93149185180664, "global_step": 254848, "epoch": 2106} {"train_loss": -40.569332122802734, "global_step": 254849, "epoch": 2106} {"train_loss": -40.678863525390625, "global_step": 254850, "epoch": 2106} {"train_loss": -41.30684280395508, "global_step": 254851, "epoch": 2106} {"train_loss": -41.160396575927734, "global_step": 254852, "epoch": 2106} {"train_loss": -41.222137451171875, "global_step": 254853, "epoch": 2106} {"train_loss": -41.05636978149414, "global_step": 254854, "epoch": 2106} {"train_loss": -42.16395950317383, "global_step": 254855, "epoch": 2106} {"train_loss": -42.21574783325195, "global_step": 254856, "epoch": 2106} {"train_loss": -41.7912712097168, "global_step": 254857, "epoch": 2106} {"train_loss": -41.54596710205078, "global_step": 254858, "epoch": 2106} {"train_loss": -42.11041259765625, "global_step": 254859, "epoch": 2106} {"train_loss": -42.00814437866211, "global_step": 254860, "epoch": 2106} {"train_loss": -42.4922981262207, "global_step": 254861, "epoch": 2106} {"train_loss": -41.77632522583008, "global_step": 254862, "epoch": 2106} {"train_loss": -42.309303283691406, "global_step": 254863, "epoch": 2106} {"train_loss": -42.64460372924805, "global_step": 254864, "epoch": 2106} {"train_loss": -42.94228744506836, "global_step": 254865, "epoch": 2106} {"train_loss": -42.91099166870117, "global_step": 254866, "epoch": 2106} {"train_loss": -42.86415481567383, "global_step": 254867, "epoch": 2106} {"train_loss": -42.930335998535156, "global_step": 254868, "epoch": 2106} {"train_loss": -43.27301025390625, "global_step": 254869, "epoch": 2106} {"train_loss": -43.102516174316406, "global_step": 254870, "epoch": 2106} {"train_loss": -43.01057052612305, "global_step": 254871, "epoch": 2106} {"train_loss": -43.52680587768555, "global_step": 254872, "epoch": 2106} {"train_loss": -43.27109909057617, "global_step": 254873, "epoch": 2106} {"train_loss": -43.54578399658203, "global_step": 254874, "epoch": 2106} {"train_loss": -43.46609878540039, "global_step": 254875, "epoch": 2106} {"train_loss": -43.328243255615234, "global_step": 254876, "epoch": 2106} {"train_loss": -43.23661422729492, "global_step": 254877, "epoch": 2106} {"train_loss": -43.54592514038086, "global_step": 254878, "epoch": 2106} {"train_loss": -43.79932403564453, "global_step": 254879, "epoch": 2106} {"train_loss": -43.697811126708984, "global_step": 254880, "epoch": 2106} {"train_loss": -43.792625427246094, "global_step": 254881, "epoch": 2106} {"train_loss": -43.62444305419922, "global_step": 254882, "epoch": 2106} {"train_loss": -44.192352294921875, "global_step": 254883, "epoch": 2106} {"train_loss": -43.85200119018555, "global_step": 254884, "epoch": 2106} {"train_loss": -43.86567306518555, "global_step": 254885, "epoch": 2106} {"train_loss": -43.89607238769531, "global_step": 254886, "epoch": 2106} {"train_loss": -43.872344970703125, "global_step": 254887, "epoch": 2106} {"train_loss": -43.75748062133789, "global_step": 254888, "epoch": 2106} {"train_loss": -43.87472152709961, "global_step": 254889, "epoch": 2106} {"train_loss": -44.0787467956543, "global_step": 254890, "epoch": 2106} {"train_loss": -43.66499328613281, "global_step": 254891, "epoch": 2106} {"train_loss": -44.11338424682617, "global_step": 254892, "epoch": 2106} {"train_loss": -44.28715896606445, "global_step": 254893, "epoch": 2106} {"train_loss": -44.04944610595703, "global_step": 254894, "epoch": 2106} {"train_loss": -44.19422149658203, "global_step": 254895, "epoch": 2106} {"train_loss": -43.96095275878906, "global_step": 254896, "epoch": 2106} {"train_loss": -43.74300765991211, "global_step": 254897, "epoch": 2106} {"train_loss": -44.576904296875, "global_step": 254898, "epoch": 2106} {"train_loss": -44.24892807006836, "global_step": 254899, "epoch": 2106} {"train_loss": -44.65494918823242, "global_step": 254900, "epoch": 2106} {"train_loss": -44.11420822143555, "global_step": 254901, "epoch": 2106} {"train_loss": -44.03043746948242, "global_step": 254902, "epoch": 2106} {"train_loss": -44.13740921020508, "global_step": 254903, "epoch": 2106} {"train_loss": -44.0695686340332, "global_step": 254904, "epoch": 2106} {"train_loss": -44.24059295654297, "global_step": 254905, "epoch": 2106} {"train_loss": -44.2918586730957, "global_step": 254906, "epoch": 2106} {"train_loss": -43.94550704956055, "global_step": 254907, "epoch": 2106} {"train_loss": -44.090293884277344, "global_step": 254908, "epoch": 2106} {"train_loss": -44.059818267822266, "global_step": 254909, "epoch": 2106} {"train_loss": -44.17197799682617, "global_step": 254910, "epoch": 2106} {"train_loss": -44.06891632080078, "global_step": 254911, "epoch": 2106} {"train_loss": -44.076786041259766, "global_step": 254912, "epoch": 2106} {"train_loss": -44.43048858642578, "global_step": 254913, "epoch": 2106} {"train_loss": -43.463600158691406, "global_step": 254914, "epoch": 2106} {"train_loss": -43.83736801147461, "global_step": 254915, "epoch": 2106} {"train_loss": -44.06587219238281, "global_step": 254916, "epoch": 2106} {"train_loss": -44.04194259643555, "global_step": 254917, "epoch": 2106} {"train_loss": -44.153194427490234, "global_step": 254918, "epoch": 2106} {"train_loss": -43.76032638549805, "global_step": 254919, "epoch": 2106} {"train_loss": -43.56089401245117, "global_step": 254920, "epoch": 2106} {"train_loss": -43.40458297729492, "global_step": 254921, "epoch": 2106} {"train_loss": -44.21337890625, "global_step": 254922, "epoch": 2106} {"train_loss": -42.74550247192383, "global_step": 254923, "epoch": 2106} {"train_loss": -41.85114288330078, "global_step": 254924, "epoch": 2106} {"train_loss": -43.73798751831055, "global_step": 254925, "epoch": 2106} {"train_loss": -43.37491989135742, "global_step": 254926, "epoch": 2106} {"train_loss": -42.562313079833984, "global_step": 254927, "epoch": 2106} {"train_loss": -43.276611328125, "global_step": 254928, "epoch": 2106} {"train_loss": -44.023502349853516, "global_step": 254929, "epoch": 2106} {"train_loss": -43.162391662597656, "global_step": 254930, "epoch": 2106} {"train_loss": -43.739688873291016, "global_step": 254931, "epoch": 2106} {"train_loss": -42.88167953491211, "global_step": 254932, "epoch": 2106} {"train_loss": -43.625038146972656, "global_step": 254933, "epoch": 2106} {"train_loss": -43.23031997680664, "global_step": 254934, "epoch": 2106} {"train_loss": -43.47677230834961, "global_step": 254935, "epoch": 2106} {"train_loss": -43.4853401184082, "global_step": 254936, "epoch": 2106} {"train_loss": -43.476314544677734, "global_step": 254937, "epoch": 2106} {"train_loss": -42.8813591003418, "global_step": 254938, "epoch": 2106} {"train_loss": -43.29231643676758, "global_step": 254939, "epoch": 2106} {"train_loss": -41.87730026245117, "global_step": 254940, "epoch": 2106} {"train_loss": -40.974971771240234, "global_step": 254941, "epoch": 2106} {"train_loss": -42.4537239074707, "global_step": 254942, "epoch": 2106} {"train_loss": -41.794124603271484, "global_step": 254943, "epoch": 2106} {"train_loss": -41.45717239379883, "global_step": 254944, "epoch": 2106} {"train_loss": -43.394622802734375, "global_step": 254945, "epoch": 2106} {"train_loss": -42.391924361552086, "global_step": 254946, "epoch": 2106, "val_loss": 2743772.75} {"train_loss": -39.440940856933594, "global_step": 254947, "epoch": 2107} {"train_loss": -41.677391052246094, "global_step": 254948, "epoch": 2107} {"train_loss": -40.09505844116211, "global_step": 254949, "epoch": 2107} {"train_loss": -42.6463737487793, "global_step": 254950, "epoch": 2107} {"train_loss": -42.57746124267578, "global_step": 254951, "epoch": 2107} {"train_loss": -41.524383544921875, "global_step": 254952, "epoch": 2107} {"train_loss": -40.404212951660156, "global_step": 254953, "epoch": 2107} {"train_loss": -40.61921310424805, "global_step": 254954, "epoch": 2107} {"train_loss": -42.33415603637695, "global_step": 254955, "epoch": 2107} {"train_loss": -40.9820556640625, "global_step": 254956, "epoch": 2107} {"train_loss": -42.3635139465332, "global_step": 254957, "epoch": 2107} {"train_loss": -42.08720016479492, "global_step": 254958, "epoch": 2107} {"train_loss": -42.84918975830078, "global_step": 254959, "epoch": 2107} {"train_loss": -42.05216979980469, "global_step": 254960, "epoch": 2107} {"train_loss": -42.33989334106445, "global_step": 254961, "epoch": 2107} {"train_loss": -41.986263275146484, "global_step": 254962, "epoch": 2107} {"train_loss": -42.64038848876953, "global_step": 254963, "epoch": 2107} {"train_loss": -41.59698486328125, "global_step": 254964, "epoch": 2107} {"train_loss": -42.030086517333984, "global_step": 254965, "epoch": 2107} {"train_loss": -42.01749038696289, "global_step": 254966, "epoch": 2107} {"train_loss": -41.46010208129883, "global_step": 254967, "epoch": 2107} {"train_loss": -42.86391830444336, "global_step": 254968, "epoch": 2107} {"train_loss": -41.79172897338867, "global_step": 254969, "epoch": 2107} {"train_loss": -43.76340103149414, "global_step": 254970, "epoch": 2107} {"train_loss": -40.9875373840332, "global_step": 254971, "epoch": 2107} {"train_loss": -42.5486946105957, "global_step": 254972, "epoch": 2107} {"train_loss": -42.24952697753906, "global_step": 254973, "epoch": 2107} {"train_loss": -41.55668640136719, "global_step": 254974, "epoch": 2107} {"train_loss": -39.35142517089844, "global_step": 254975, "epoch": 2107} {"train_loss": -41.70830154418945, "global_step": 254976, "epoch": 2107} {"train_loss": -41.2240104675293, "global_step": 254977, "epoch": 2107} {"train_loss": -41.35177230834961, "global_step": 254978, "epoch": 2107} {"train_loss": -39.889400482177734, "global_step": 254979, "epoch": 2107} {"train_loss": -41.93408966064453, "global_step": 254980, "epoch": 2107} {"train_loss": -42.5303840637207, "global_step": 254981, "epoch": 2107} {"train_loss": -40.79410934448242, "global_step": 254982, "epoch": 2107} {"train_loss": -42.37824249267578, "global_step": 254983, "epoch": 2107} {"train_loss": -42.11559295654297, "global_step": 254984, "epoch": 2107} {"train_loss": -41.696388244628906, "global_step": 254985, "epoch": 2107} {"train_loss": -43.21745681762695, "global_step": 254986, "epoch": 2107} {"train_loss": -41.387813568115234, "global_step": 254987, "epoch": 2107} {"train_loss": -42.47393798828125, "global_step": 254988, "epoch": 2107} {"train_loss": -42.329063415527344, "global_step": 254989, "epoch": 2107} {"train_loss": -43.31016159057617, "global_step": 254990, "epoch": 2107} {"train_loss": -42.70674514770508, "global_step": 254991, "epoch": 2107} {"train_loss": -43.18405532836914, "global_step": 254992, "epoch": 2107} {"train_loss": -43.07698440551758, "global_step": 254993, "epoch": 2107} {"train_loss": -42.66975021362305, "global_step": 254994, "epoch": 2107} {"train_loss": -43.77244186401367, "global_step": 254995, "epoch": 2107} {"train_loss": -43.05434036254883, "global_step": 254996, "epoch": 2107} {"train_loss": -43.47952651977539, "global_step": 254997, "epoch": 2107} {"train_loss": -43.53535079956055, "global_step": 254998, "epoch": 2107} {"train_loss": -43.251251220703125, "global_step": 254999, "epoch": 2107} {"train_loss": -43.69955062866211, "global_step": 255000, "epoch": 2107} {"train_loss": -43.10396957397461, "global_step": 255001, "epoch": 2107} {"train_loss": -43.712459564208984, "global_step": 255002, "epoch": 2107} {"train_loss": -43.4367561340332, "global_step": 255003, "epoch": 2107} {"train_loss": -44.046077728271484, "global_step": 255004, "epoch": 2107} {"train_loss": -43.87887191772461, "global_step": 255005, "epoch": 2107} {"train_loss": -43.81455612182617, "global_step": 255006, "epoch": 2107} {"train_loss": -43.89519500732422, "global_step": 255007, "epoch": 2107} {"train_loss": -43.97457504272461, "global_step": 255008, "epoch": 2107} {"train_loss": -44.178192138671875, "global_step": 255009, "epoch": 2107} {"train_loss": -44.18941879272461, "global_step": 255010, "epoch": 2107} {"train_loss": -44.099586486816406, "global_step": 255011, "epoch": 2107} {"train_loss": -44.07146072387695, "global_step": 255012, "epoch": 2107} {"train_loss": -43.971893310546875, "global_step": 255013, "epoch": 2107} {"train_loss": -44.14036560058594, "global_step": 255014, "epoch": 2107} {"train_loss": -44.52191162109375, "global_step": 255015, "epoch": 2107} {"train_loss": -44.0704460144043, "global_step": 255016, "epoch": 2107} {"train_loss": -44.22849655151367, "global_step": 255017, "epoch": 2107} {"train_loss": -43.82487106323242, "global_step": 255018, "epoch": 2107} {"train_loss": -44.2025260925293, "global_step": 255019, "epoch": 2107} {"train_loss": -44.23447799682617, "global_step": 255020, "epoch": 2107} {"train_loss": -44.43842697143555, "global_step": 255021, "epoch": 2107} {"train_loss": -44.18491744995117, "global_step": 255022, "epoch": 2107} {"train_loss": -44.0889892578125, "global_step": 255023, "epoch": 2107} {"train_loss": -44.2722053527832, "global_step": 255024, "epoch": 2107} {"train_loss": -44.27934646606445, "global_step": 255025, "epoch": 2107} {"train_loss": -43.65739822387695, "global_step": 255026, "epoch": 2107} {"train_loss": -43.98067092895508, "global_step": 255027, "epoch": 2107} {"train_loss": -44.4985466003418, "global_step": 255028, "epoch": 2107} {"train_loss": -44.480167388916016, "global_step": 255029, "epoch": 2107} {"train_loss": -44.099578857421875, "global_step": 255030, "epoch": 2107} {"train_loss": -44.54410934448242, "global_step": 255031, "epoch": 2107} {"train_loss": -43.7093391418457, "global_step": 255032, "epoch": 2107} {"train_loss": -44.614742279052734, "global_step": 255033, "epoch": 2107} {"train_loss": -43.363826751708984, "global_step": 255034, "epoch": 2107} {"train_loss": -42.859012603759766, "global_step": 255035, "epoch": 2107} {"train_loss": -42.35270309448242, "global_step": 255036, "epoch": 2107} {"train_loss": -44.00765609741211, "global_step": 255037, "epoch": 2107} {"train_loss": -43.94334030151367, "global_step": 255038, "epoch": 2107} {"train_loss": -42.78487014770508, "global_step": 255039, "epoch": 2107} {"train_loss": -42.72646713256836, "global_step": 255040, "epoch": 2107} {"train_loss": -43.05772018432617, "global_step": 255041, "epoch": 2107} {"train_loss": -42.23698806762695, "global_step": 255042, "epoch": 2107} {"train_loss": -43.57661056518555, "global_step": 255043, "epoch": 2107} {"train_loss": -43.24847412109375, "global_step": 255044, "epoch": 2107} {"train_loss": -42.92476272583008, "global_step": 255045, "epoch": 2107} {"train_loss": -43.39140701293945, "global_step": 255046, "epoch": 2107} {"train_loss": -43.87099075317383, "global_step": 255047, "epoch": 2107} {"train_loss": -42.35531234741211, "global_step": 255048, "epoch": 2107} {"train_loss": -43.24844741821289, "global_step": 255049, "epoch": 2107} {"train_loss": -44.09741973876953, "global_step": 255050, "epoch": 2107} {"train_loss": -43.248023986816406, "global_step": 255051, "epoch": 2107} {"train_loss": -41.85239791870117, "global_step": 255052, "epoch": 2107} {"train_loss": -42.04057693481445, "global_step": 255053, "epoch": 2107} {"train_loss": -43.269290924072266, "global_step": 255054, "epoch": 2107} {"train_loss": -41.994911193847656, "global_step": 255055, "epoch": 2107} {"train_loss": -39.867347717285156, "global_step": 255056, "epoch": 2107} {"train_loss": -42.903892517089844, "global_step": 255057, "epoch": 2107} {"train_loss": -39.926815032958984, "global_step": 255058, "epoch": 2107} {"train_loss": -40.83185577392578, "global_step": 255059, "epoch": 2107} {"train_loss": -42.54672622680664, "global_step": 255060, "epoch": 2107} {"train_loss": -37.35665512084961, "global_step": 255061, "epoch": 2107} {"train_loss": -38.48146438598633, "global_step": 255062, "epoch": 2107} {"train_loss": -39.74148941040039, "global_step": 255063, "epoch": 2107} {"train_loss": -39.57184600830078, "global_step": 255064, "epoch": 2107} {"train_loss": -41.687294006347656, "global_step": 255065, "epoch": 2107} {"train_loss": -40.62388229370117, "global_step": 255066, "epoch": 2107} {"train_loss": -42.631677769432386, "global_step": 255067, "epoch": 2107, "val_loss": 2626987.0} {"train_loss": -40.10819625854492, "global_step": 255068, "epoch": 2108} {"train_loss": -41.19457244873047, "global_step": 255069, "epoch": 2108} {"train_loss": -41.56659698486328, "global_step": 255070, "epoch": 2108} {"train_loss": -42.13946533203125, "global_step": 255071, "epoch": 2108} {"train_loss": -41.43316650390625, "global_step": 255072, "epoch": 2108} {"train_loss": -41.992366790771484, "global_step": 255073, "epoch": 2108} {"train_loss": -42.02381134033203, "global_step": 255074, "epoch": 2108} {"train_loss": -42.4453010559082, "global_step": 255075, "epoch": 2108} {"train_loss": -42.239234924316406, "global_step": 255076, "epoch": 2108} {"train_loss": -42.06753921508789, "global_step": 255077, "epoch": 2108} {"train_loss": -42.39252471923828, "global_step": 255078, "epoch": 2108} {"train_loss": -41.91286087036133, "global_step": 255079, "epoch": 2108} {"train_loss": -42.757667541503906, "global_step": 255080, "epoch": 2108} {"train_loss": -41.756439208984375, "global_step": 255081, "epoch": 2108} {"train_loss": -41.84858322143555, "global_step": 255082, "epoch": 2108} {"train_loss": -42.85628128051758, "global_step": 255083, "epoch": 2108} {"train_loss": -40.98584747314453, "global_step": 255084, "epoch": 2108} {"train_loss": -43.27214431762695, "global_step": 255085, "epoch": 2108} {"train_loss": -41.97467803955078, "global_step": 255086, "epoch": 2108} {"train_loss": -42.52018356323242, "global_step": 255087, "epoch": 2108} {"train_loss": -41.992366790771484, "global_step": 255088, "epoch": 2108} {"train_loss": -42.013671875, "global_step": 255089, "epoch": 2108} {"train_loss": -43.11723709106445, "global_step": 255090, "epoch": 2108} {"train_loss": -43.00997543334961, "global_step": 255091, "epoch": 2108} {"train_loss": -42.50886154174805, "global_step": 255092, "epoch": 2108} {"train_loss": -41.58271789550781, "global_step": 255093, "epoch": 2108} {"train_loss": -42.36760330200195, "global_step": 255094, "epoch": 2108} {"train_loss": -42.604793548583984, "global_step": 255095, "epoch": 2108} {"train_loss": -42.72121810913086, "global_step": 255096, "epoch": 2108} {"train_loss": -41.81300735473633, "global_step": 255097, "epoch": 2108} {"train_loss": -43.150508880615234, "global_step": 255098, "epoch": 2108} {"train_loss": -42.57207107543945, "global_step": 255099, "epoch": 2108} {"train_loss": -42.73684310913086, "global_step": 255100, "epoch": 2108} {"train_loss": -42.57139587402344, "global_step": 255101, "epoch": 2108} {"train_loss": -41.82111358642578, "global_step": 255102, "epoch": 2108} {"train_loss": -43.427364349365234, "global_step": 255103, "epoch": 2108} {"train_loss": -42.973602294921875, "global_step": 255104, "epoch": 2108} {"train_loss": -43.03322982788086, "global_step": 255105, "epoch": 2108} {"train_loss": -42.73759078979492, "global_step": 255106, "epoch": 2108} {"train_loss": -43.32692337036133, "global_step": 255107, "epoch": 2108} {"train_loss": -42.6151123046875, "global_step": 255108, "epoch": 2108} {"train_loss": -43.196048736572266, "global_step": 255109, "epoch": 2108} {"train_loss": -42.93223190307617, "global_step": 255110, "epoch": 2108} {"train_loss": -43.358394622802734, "global_step": 255111, "epoch": 2108} {"train_loss": -42.89651107788086, "global_step": 255112, "epoch": 2108} {"train_loss": -42.3453254699707, "global_step": 255113, "epoch": 2108} {"train_loss": -41.41227722167969, "global_step": 255114, "epoch": 2108} {"train_loss": -42.4450798034668, "global_step": 255115, "epoch": 2108} {"train_loss": -42.73552322387695, "global_step": 255116, "epoch": 2108} {"train_loss": -41.50697708129883, "global_step": 255117, "epoch": 2108} {"train_loss": -42.007568359375, "global_step": 255118, "epoch": 2108} {"train_loss": -42.68072509765625, "global_step": 255119, "epoch": 2108} {"train_loss": -42.23403549194336, "global_step": 255120, "epoch": 2108} {"train_loss": -42.83827590942383, "global_step": 255121, "epoch": 2108} {"train_loss": -42.81256866455078, "global_step": 255122, "epoch": 2108} {"train_loss": -43.05718994140625, "global_step": 255123, "epoch": 2108} {"train_loss": -43.017269134521484, "global_step": 255124, "epoch": 2108} {"train_loss": -43.248870849609375, "global_step": 255125, "epoch": 2108} {"train_loss": -43.77265548706055, "global_step": 255126, "epoch": 2108} {"train_loss": -43.25732421875, "global_step": 255127, "epoch": 2108} {"train_loss": -43.04268264770508, "global_step": 255128, "epoch": 2108} {"train_loss": -43.483062744140625, "global_step": 255129, "epoch": 2108} {"train_loss": -43.88814926147461, "global_step": 255130, "epoch": 2108} {"train_loss": -43.25762939453125, "global_step": 255131, "epoch": 2108} {"train_loss": -43.31698226928711, "global_step": 255132, "epoch": 2108} {"train_loss": -43.27122116088867, "global_step": 255133, "epoch": 2108} {"train_loss": -43.71796798706055, "global_step": 255134, "epoch": 2108} {"train_loss": -43.80884552001953, "global_step": 255135, "epoch": 2108} {"train_loss": -43.88489532470703, "global_step": 255136, "epoch": 2108} {"train_loss": -43.53761672973633, "global_step": 255137, "epoch": 2108} {"train_loss": -44.1652946472168, "global_step": 255138, "epoch": 2108} {"train_loss": -44.17156982421875, "global_step": 255139, "epoch": 2108} {"train_loss": -44.353946685791016, "global_step": 255140, "epoch": 2108} {"train_loss": -43.978607177734375, "global_step": 255141, "epoch": 2108} {"train_loss": -43.629180908203125, "global_step": 255142, "epoch": 2108} {"train_loss": -43.42299270629883, "global_step": 255143, "epoch": 2108} {"train_loss": -43.59006881713867, "global_step": 255144, "epoch": 2108} {"train_loss": -43.85652160644531, "global_step": 255145, "epoch": 2108} {"train_loss": -43.463130950927734, "global_step": 255146, "epoch": 2108} {"train_loss": -44.075355529785156, "global_step": 255147, "epoch": 2108} {"train_loss": -44.3593635559082, "global_step": 255148, "epoch": 2108} {"train_loss": -44.0869026184082, "global_step": 255149, "epoch": 2108} {"train_loss": -43.71001052856445, "global_step": 255150, "epoch": 2108} {"train_loss": -44.34198760986328, "global_step": 255151, "epoch": 2108} {"train_loss": -44.10566329956055, "global_step": 255152, "epoch": 2108} {"train_loss": -43.505130767822266, "global_step": 255153, "epoch": 2108} {"train_loss": -43.20557403564453, "global_step": 255154, "epoch": 2108} {"train_loss": -43.259559631347656, "global_step": 255155, "epoch": 2108} {"train_loss": -44.057308197021484, "global_step": 255156, "epoch": 2108} {"train_loss": -44.15790557861328, "global_step": 255157, "epoch": 2108} {"train_loss": -44.37678909301758, "global_step": 255158, "epoch": 2108} {"train_loss": -44.60084915161133, "global_step": 255159, "epoch": 2108} {"train_loss": -44.13261795043945, "global_step": 255160, "epoch": 2108} {"train_loss": -43.847900390625, "global_step": 255161, "epoch": 2108} {"train_loss": -43.24394989013672, "global_step": 255162, "epoch": 2108} {"train_loss": -43.94596481323242, "global_step": 255163, "epoch": 2108} {"train_loss": -44.2262077331543, "global_step": 255164, "epoch": 2108} {"train_loss": -44.269901275634766, "global_step": 255165, "epoch": 2108} {"train_loss": -43.956382751464844, "global_step": 255166, "epoch": 2108} {"train_loss": -43.56710433959961, "global_step": 255167, "epoch": 2108} {"train_loss": -42.54203414916992, "global_step": 255168, "epoch": 2108} {"train_loss": -41.09077072143555, "global_step": 255169, "epoch": 2108} {"train_loss": -42.646358489990234, "global_step": 255170, "epoch": 2108} {"train_loss": -44.14411163330078, "global_step": 255171, "epoch": 2108} {"train_loss": -43.72373580932617, "global_step": 255172, "epoch": 2108} {"train_loss": -43.8903694152832, "global_step": 255173, "epoch": 2108} {"train_loss": -43.97800064086914, "global_step": 255174, "epoch": 2108} {"train_loss": -43.42433547973633, "global_step": 255175, "epoch": 2108} {"train_loss": -43.26848220825195, "global_step": 255176, "epoch": 2108} {"train_loss": -43.71440505981445, "global_step": 255177, "epoch": 2108} {"train_loss": -42.83960723876953, "global_step": 255178, "epoch": 2108} {"train_loss": -41.73676681518555, "global_step": 255179, "epoch": 2108} {"train_loss": -43.32522201538086, "global_step": 255180, "epoch": 2108} {"train_loss": -41.986595153808594, "global_step": 255181, "epoch": 2108} {"train_loss": -40.146202087402344, "global_step": 255182, "epoch": 2108} {"train_loss": -41.5987434387207, "global_step": 255183, "epoch": 2108} {"train_loss": -43.46201705932617, "global_step": 255184, "epoch": 2108} {"train_loss": -41.45362854003906, "global_step": 255185, "epoch": 2108} {"train_loss": -40.60911178588867, "global_step": 255186, "epoch": 2108} {"train_loss": -41.46476364135742, "global_step": 255187, "epoch": 2108} {"train_loss": -42.90923983991639, "global_step": 255188, "epoch": 2108, "val_loss": 2669231.25} {"train_loss": -40.65869903564453, "global_step": 255189, "epoch": 2109} {"train_loss": -42.60546875, "global_step": 255190, "epoch": 2109} {"train_loss": -43.07398223876953, "global_step": 255191, "epoch": 2109} {"train_loss": -41.853187561035156, "global_step": 255192, "epoch": 2109} {"train_loss": -41.54641342163086, "global_step": 255193, "epoch": 2109} {"train_loss": -43.639259338378906, "global_step": 255194, "epoch": 2109} {"train_loss": -40.93037033081055, "global_step": 255195, "epoch": 2109} {"train_loss": -40.86262130737305, "global_step": 255196, "epoch": 2109} {"train_loss": -43.87670135498047, "global_step": 255197, "epoch": 2109} {"train_loss": -40.91919708251953, "global_step": 255198, "epoch": 2109} {"train_loss": -41.092891693115234, "global_step": 255199, "epoch": 2109} {"train_loss": -43.28435134887695, "global_step": 255200, "epoch": 2109} {"train_loss": -42.7161979675293, "global_step": 255201, "epoch": 2109} {"train_loss": -42.209266662597656, "global_step": 255202, "epoch": 2109} {"train_loss": -43.45863723754883, "global_step": 255203, "epoch": 2109} {"train_loss": -42.38722610473633, "global_step": 255204, "epoch": 2109} {"train_loss": -42.94780349731445, "global_step": 255205, "epoch": 2109} {"train_loss": -43.32672882080078, "global_step": 255206, "epoch": 2109} {"train_loss": -42.59846115112305, "global_step": 255207, "epoch": 2109} {"train_loss": -42.63116455078125, "global_step": 255208, "epoch": 2109} {"train_loss": -41.049720764160156, "global_step": 255209, "epoch": 2109} {"train_loss": -41.831756591796875, "global_step": 255210, "epoch": 2109} {"train_loss": -40.094825744628906, "global_step": 255211, "epoch": 2109} {"train_loss": -40.121273040771484, "global_step": 255212, "epoch": 2109} {"train_loss": -41.034690856933594, "global_step": 255213, "epoch": 2109} {"train_loss": -40.594032287597656, "global_step": 255214, "epoch": 2109} {"train_loss": -40.96231460571289, "global_step": 255215, "epoch": 2109} {"train_loss": -41.322845458984375, "global_step": 255216, "epoch": 2109} {"train_loss": -39.30321502685547, "global_step": 255217, "epoch": 2109} {"train_loss": -42.665321350097656, "global_step": 255218, "epoch": 2109} {"train_loss": -41.195533752441406, "global_step": 255219, "epoch": 2109} {"train_loss": -41.886749267578125, "global_step": 255220, "epoch": 2109} {"train_loss": -41.69852066040039, "global_step": 255221, "epoch": 2109} {"train_loss": -42.46095657348633, "global_step": 255222, "epoch": 2109} {"train_loss": -41.880611419677734, "global_step": 255223, "epoch": 2109} {"train_loss": -42.32431411743164, "global_step": 255224, "epoch": 2109} {"train_loss": -40.68319320678711, "global_step": 255225, "epoch": 2109} {"train_loss": -41.20307540893555, "global_step": 255226, "epoch": 2109} {"train_loss": -42.137264251708984, "global_step": 255227, "epoch": 2109} {"train_loss": -41.71607208251953, "global_step": 255228, "epoch": 2109} {"train_loss": -42.9826774597168, "global_step": 255229, "epoch": 2109} {"train_loss": -41.739471435546875, "global_step": 255230, "epoch": 2109} {"train_loss": -43.167205810546875, "global_step": 255231, "epoch": 2109} {"train_loss": -42.1507453918457, "global_step": 255232, "epoch": 2109} {"train_loss": -42.823150634765625, "global_step": 255233, "epoch": 2109} {"train_loss": -42.113746643066406, "global_step": 255234, "epoch": 2109} {"train_loss": -42.90839767456055, "global_step": 255235, "epoch": 2109} {"train_loss": -42.678985595703125, "global_step": 255236, "epoch": 2109} {"train_loss": -42.68132019042969, "global_step": 255237, "epoch": 2109} {"train_loss": -42.29312515258789, "global_step": 255238, "epoch": 2109} {"train_loss": -42.010772705078125, "global_step": 255239, "epoch": 2109} {"train_loss": -42.12588882446289, "global_step": 255240, "epoch": 2109} {"train_loss": -39.858123779296875, "global_step": 255241, "epoch": 2109} {"train_loss": -43.39915084838867, "global_step": 255242, "epoch": 2109} {"train_loss": -41.870296478271484, "global_step": 255243, "epoch": 2109} {"train_loss": -41.393653869628906, "global_step": 255244, "epoch": 2109} {"train_loss": -43.04497528076172, "global_step": 255245, "epoch": 2109} {"train_loss": -40.128143310546875, "global_step": 255246, "epoch": 2109} {"train_loss": -42.7206916809082, "global_step": 255247, "epoch": 2109} {"train_loss": -42.3787956237793, "global_step": 255248, "epoch": 2109} {"train_loss": -41.777957916259766, "global_step": 255249, "epoch": 2109} {"train_loss": -42.74414825439453, "global_step": 255250, "epoch": 2109} {"train_loss": -42.39133071899414, "global_step": 255251, "epoch": 2109} {"train_loss": -42.606502532958984, "global_step": 255252, "epoch": 2109} {"train_loss": -42.27103805541992, "global_step": 255253, "epoch": 2109} {"train_loss": -43.33338928222656, "global_step": 255254, "epoch": 2109} {"train_loss": -41.122596740722656, "global_step": 255255, "epoch": 2109} {"train_loss": -43.189083099365234, "global_step": 255256, "epoch": 2109} {"train_loss": -42.234432220458984, "global_step": 255257, "epoch": 2109} {"train_loss": -42.5441780090332, "global_step": 255258, "epoch": 2109} {"train_loss": -42.030975341796875, "global_step": 255259, "epoch": 2109} {"train_loss": -42.9561882019043, "global_step": 255260, "epoch": 2109} {"train_loss": -42.801719665527344, "global_step": 255261, "epoch": 2109} {"train_loss": -42.99274826049805, "global_step": 255262, "epoch": 2109} {"train_loss": -43.282100677490234, "global_step": 255263, "epoch": 2109} {"train_loss": -43.57354736328125, "global_step": 255264, "epoch": 2109} {"train_loss": -43.23800277709961, "global_step": 255265, "epoch": 2109} {"train_loss": -43.587467193603516, "global_step": 255266, "epoch": 2109} {"train_loss": -42.001827239990234, "global_step": 255267, "epoch": 2109} {"train_loss": -43.2607307434082, "global_step": 255268, "epoch": 2109} {"train_loss": -43.46826934814453, "global_step": 255269, "epoch": 2109} {"train_loss": -43.27543258666992, "global_step": 255270, "epoch": 2109} {"train_loss": -43.83978271484375, "global_step": 255271, "epoch": 2109} {"train_loss": -43.506649017333984, "global_step": 255272, "epoch": 2109} {"train_loss": -43.67342758178711, "global_step": 255273, "epoch": 2109} {"train_loss": -43.79179000854492, "global_step": 255274, "epoch": 2109} {"train_loss": -43.76058578491211, "global_step": 255275, "epoch": 2109} {"train_loss": -43.926239013671875, "global_step": 255276, "epoch": 2109} {"train_loss": -43.49414825439453, "global_step": 255277, "epoch": 2109} {"train_loss": -43.55674743652344, "global_step": 255278, "epoch": 2109} {"train_loss": -44.18787384033203, "global_step": 255279, "epoch": 2109} {"train_loss": -43.70702362060547, "global_step": 255280, "epoch": 2109} {"train_loss": -43.81190872192383, "global_step": 255281, "epoch": 2109} {"train_loss": -43.43235397338867, "global_step": 255282, "epoch": 2109} {"train_loss": -44.426021575927734, "global_step": 255283, "epoch": 2109} {"train_loss": -44.02486801147461, "global_step": 255284, "epoch": 2109} {"train_loss": -43.94961166381836, "global_step": 255285, "epoch": 2109} {"train_loss": -43.97321319580078, "global_step": 255286, "epoch": 2109} {"train_loss": -43.82625198364258, "global_step": 255287, "epoch": 2109} {"train_loss": -44.360347747802734, "global_step": 255288, "epoch": 2109} {"train_loss": -44.114349365234375, "global_step": 255289, "epoch": 2109} {"train_loss": -44.07015609741211, "global_step": 255290, "epoch": 2109} {"train_loss": -43.698543548583984, "global_step": 255291, "epoch": 2109} {"train_loss": -44.127349853515625, "global_step": 255292, "epoch": 2109} {"train_loss": -43.97209167480469, "global_step": 255293, "epoch": 2109} {"train_loss": -43.5648307800293, "global_step": 255294, "epoch": 2109} {"train_loss": -43.48260498046875, "global_step": 255295, "epoch": 2109} {"train_loss": -44.41741943359375, "global_step": 255296, "epoch": 2109} {"train_loss": -44.013370513916016, "global_step": 255297, "epoch": 2109} {"train_loss": -44.00574493408203, "global_step": 255298, "epoch": 2109} {"train_loss": -42.626827239990234, "global_step": 255299, "epoch": 2109} {"train_loss": -43.08687973022461, "global_step": 255300, "epoch": 2109} {"train_loss": -42.22773361206055, "global_step": 255301, "epoch": 2109} {"train_loss": -42.570709228515625, "global_step": 255302, "epoch": 2109} {"train_loss": -44.04534912109375, "global_step": 255303, "epoch": 2109} {"train_loss": -44.26149368286133, "global_step": 255304, "epoch": 2109} {"train_loss": -40.27565383911133, "global_step": 255305, "epoch": 2109} {"train_loss": -43.30295944213867, "global_step": 255306, "epoch": 2109} {"train_loss": -43.80007553100586, "global_step": 255307, "epoch": 2109} {"train_loss": -41.234554290771484, "global_step": 255308, "epoch": 2109} {"train_loss": -42.6001904385149, "global_step": 255309, "epoch": 2109, "val_loss": 2732706.0} {"train_loss": -42.536556243896484, "global_step": 255310, "epoch": 2110} {"train_loss": -40.135353088378906, "global_step": 255311, "epoch": 2110} {"train_loss": -41.28083801269531, "global_step": 255312, "epoch": 2110} {"train_loss": -40.90629196166992, "global_step": 255313, "epoch": 2110} {"train_loss": -39.186431884765625, "global_step": 255314, "epoch": 2110} {"train_loss": -39.47965621948242, "global_step": 255315, "epoch": 2110} {"train_loss": -41.955928802490234, "global_step": 255316, "epoch": 2110} {"train_loss": -40.00667190551758, "global_step": 255317, "epoch": 2110} {"train_loss": -40.91767501831055, "global_step": 255318, "epoch": 2110} {"train_loss": -41.02334213256836, "global_step": 255319, "epoch": 2110} {"train_loss": -40.446937561035156, "global_step": 255320, "epoch": 2110} {"train_loss": -41.560237884521484, "global_step": 255321, "epoch": 2110} {"train_loss": -41.33787155151367, "global_step": 255322, "epoch": 2110} {"train_loss": -40.26725769042969, "global_step": 255323, "epoch": 2110} {"train_loss": -42.337066650390625, "global_step": 255324, "epoch": 2110} {"train_loss": -39.546669006347656, "global_step": 255325, "epoch": 2110} {"train_loss": -42.49003219604492, "global_step": 255326, "epoch": 2110} {"train_loss": -40.099891662597656, "global_step": 255327, "epoch": 2110} {"train_loss": -40.63602066040039, "global_step": 255328, "epoch": 2110} {"train_loss": -41.47338104248047, "global_step": 255329, "epoch": 2110} {"train_loss": -40.936031341552734, "global_step": 255330, "epoch": 2110} {"train_loss": -41.38947677612305, "global_step": 255331, "epoch": 2110} {"train_loss": -41.48720932006836, "global_step": 255332, "epoch": 2110} {"train_loss": -39.86762619018555, "global_step": 255333, "epoch": 2110} {"train_loss": -42.414058685302734, "global_step": 255334, "epoch": 2110} {"train_loss": -41.78443145751953, "global_step": 255335, "epoch": 2110} {"train_loss": -41.38269805908203, "global_step": 255336, "epoch": 2110} {"train_loss": -41.4683837890625, "global_step": 255337, "epoch": 2110} {"train_loss": -42.43577194213867, "global_step": 255338, "epoch": 2110} {"train_loss": -43.448341369628906, "global_step": 255339, "epoch": 2110} {"train_loss": -41.112632751464844, "global_step": 255340, "epoch": 2110} {"train_loss": -42.24525833129883, "global_step": 255341, "epoch": 2110} {"train_loss": -41.88711166381836, "global_step": 255342, "epoch": 2110} {"train_loss": -43.08251953125, "global_step": 255343, "epoch": 2110} {"train_loss": -43.13333511352539, "global_step": 255344, "epoch": 2110} {"train_loss": -42.740943908691406, "global_step": 255345, "epoch": 2110} {"train_loss": -42.91511154174805, "global_step": 255346, "epoch": 2110} {"train_loss": -43.561988830566406, "global_step": 255347, "epoch": 2110} {"train_loss": -42.860347747802734, "global_step": 255348, "epoch": 2110} {"train_loss": -43.221466064453125, "global_step": 255349, "epoch": 2110} {"train_loss": -42.81940460205078, "global_step": 255350, "epoch": 2110} {"train_loss": -41.53782272338867, "global_step": 255351, "epoch": 2110} {"train_loss": -41.72726058959961, "global_step": 255352, "epoch": 2110} {"train_loss": -42.9641227722168, "global_step": 255353, "epoch": 2110} {"train_loss": -42.49585723876953, "global_step": 255354, "epoch": 2110} {"train_loss": -42.535865783691406, "global_step": 255355, "epoch": 2110} {"train_loss": -42.007080078125, "global_step": 255356, "epoch": 2110} {"train_loss": -41.72533416748047, "global_step": 255357, "epoch": 2110} {"train_loss": -43.2617301940918, "global_step": 255358, "epoch": 2110} {"train_loss": -42.366455078125, "global_step": 255359, "epoch": 2110} {"train_loss": -42.70328903198242, "global_step": 255360, "epoch": 2110} {"train_loss": -42.44432830810547, "global_step": 255361, "epoch": 2110} {"train_loss": -42.656524658203125, "global_step": 255362, "epoch": 2110} {"train_loss": -43.73637390136719, "global_step": 255363, "epoch": 2110} {"train_loss": -42.85675048828125, "global_step": 255364, "epoch": 2110} {"train_loss": -42.80813980102539, "global_step": 255365, "epoch": 2110} {"train_loss": -43.27665328979492, "global_step": 255366, "epoch": 2110} {"train_loss": -43.6082878112793, "global_step": 255367, "epoch": 2110} {"train_loss": -38.46953201293945, "global_step": 255368, "epoch": 2110} {"train_loss": -42.881858825683594, "global_step": 255369, "epoch": 2110} {"train_loss": -39.654212951660156, "global_step": 255370, "epoch": 2110} {"train_loss": -38.89057922363281, "global_step": 255371, "epoch": 2110} {"train_loss": -39.17112350463867, "global_step": 255372, "epoch": 2110} {"train_loss": -42.71672439575195, "global_step": 255373, "epoch": 2110} {"train_loss": -41.00849533081055, "global_step": 255374, "epoch": 2110} {"train_loss": -40.76594161987305, "global_step": 255375, "epoch": 2110} {"train_loss": -38.18519973754883, "global_step": 255376, "epoch": 2110} {"train_loss": -38.42007064819336, "global_step": 255377, "epoch": 2110} {"train_loss": -35.473445892333984, "global_step": 255378, "epoch": 2110} {"train_loss": -35.57080078125, "global_step": 255379, "epoch": 2110} {"train_loss": -31.726877212524414, "global_step": 255380, "epoch": 2110} {"train_loss": -27.87347412109375, "global_step": 255381, "epoch": 2110} {"train_loss": -38.634037017822266, "global_step": 255382, "epoch": 2110} {"train_loss": -27.24085807800293, "global_step": 255383, "epoch": 2110} {"train_loss": -31.21148109436035, "global_step": 255384, "epoch": 2110} {"train_loss": -34.473506927490234, "global_step": 255385, "epoch": 2110} {"train_loss": -34.178096771240234, "global_step": 255386, "epoch": 2110} {"train_loss": -36.66411590576172, "global_step": 255387, "epoch": 2110} {"train_loss": -38.84574508666992, "global_step": 255388, "epoch": 2110} {"train_loss": -36.1202278137207, "global_step": 255389, "epoch": 2110} {"train_loss": -37.3507194519043, "global_step": 255390, "epoch": 2110} {"train_loss": -33.919654846191406, "global_step": 255391, "epoch": 2110} {"train_loss": -34.021846771240234, "global_step": 255392, "epoch": 2110} {"train_loss": -36.27163314819336, "global_step": 255393, "epoch": 2110} {"train_loss": -36.09719467163086, "global_step": 255394, "epoch": 2110} {"train_loss": -36.66400146484375, "global_step": 255395, "epoch": 2110} {"train_loss": -35.656009674072266, "global_step": 255396, "epoch": 2110} {"train_loss": -39.88347244262695, "global_step": 255397, "epoch": 2110} {"train_loss": -38.256710052490234, "global_step": 255398, "epoch": 2110} {"train_loss": -37.30288314819336, "global_step": 255399, "epoch": 2110} {"train_loss": -37.45637130737305, "global_step": 255400, "epoch": 2110} {"train_loss": -38.9068603515625, "global_step": 255401, "epoch": 2110} {"train_loss": -40.5293083190918, "global_step": 255402, "epoch": 2110} {"train_loss": -38.90515899658203, "global_step": 255403, "epoch": 2110} {"train_loss": -38.1115608215332, "global_step": 255404, "epoch": 2110} {"train_loss": -39.12015914916992, "global_step": 255405, "epoch": 2110} {"train_loss": -38.692626953125, "global_step": 255406, "epoch": 2110} {"train_loss": -39.60504913330078, "global_step": 255407, "epoch": 2110} {"train_loss": -40.095550537109375, "global_step": 255408, "epoch": 2110} {"train_loss": -39.4708251953125, "global_step": 255409, "epoch": 2110} {"train_loss": -41.18199157714844, "global_step": 255410, "epoch": 2110} {"train_loss": -40.19484329223633, "global_step": 255411, "epoch": 2110} {"train_loss": -41.16306686401367, "global_step": 255412, "epoch": 2110} {"train_loss": -41.150184631347656, "global_step": 255413, "epoch": 2110} {"train_loss": -40.46703338623047, "global_step": 255414, "epoch": 2110} {"train_loss": -41.20401382446289, "global_step": 255415, "epoch": 2110} {"train_loss": -41.23927307128906, "global_step": 255416, "epoch": 2110} {"train_loss": -41.66852951049805, "global_step": 255417, "epoch": 2110} {"train_loss": -40.3232307434082, "global_step": 255418, "epoch": 2110} {"train_loss": -40.64391326904297, "global_step": 255419, "epoch": 2110} {"train_loss": -40.4503288269043, "global_step": 255420, "epoch": 2110} {"train_loss": -41.17304229736328, "global_step": 255421, "epoch": 2110} {"train_loss": -40.612586975097656, "global_step": 255422, "epoch": 2110} {"train_loss": -41.10268783569336, "global_step": 255423, "epoch": 2110} {"train_loss": -41.58805465698242, "global_step": 255424, "epoch": 2110} {"train_loss": -41.551231384277344, "global_step": 255425, "epoch": 2110} {"train_loss": -41.28766632080078, "global_step": 255426, "epoch": 2110} {"train_loss": -41.4065055847168, "global_step": 255427, "epoch": 2110} {"train_loss": -41.94477462768555, "global_step": 255428, "epoch": 2110} {"train_loss": -41.292518615722656, "global_step": 255429, "epoch": 2110} {"train_loss": -40.135223026118005, "global_step": 255430, "epoch": 2110, "val_loss": 2893781.25} {"train_loss": -41.68316650390625, "global_step": 255431, "epoch": 2111} {"train_loss": -42.16657257080078, "global_step": 255432, "epoch": 2111} {"train_loss": -41.689125061035156, "global_step": 255433, "epoch": 2111} {"train_loss": -41.280818939208984, "global_step": 255434, "epoch": 2111} {"train_loss": -41.088645935058594, "global_step": 255435, "epoch": 2111} {"train_loss": -41.8369026184082, "global_step": 255436, "epoch": 2111} {"train_loss": -41.052978515625, "global_step": 255437, "epoch": 2111} {"train_loss": -41.832088470458984, "global_step": 255438, "epoch": 2111} {"train_loss": -42.30562210083008, "global_step": 255439, "epoch": 2111} {"train_loss": -42.06346130371094, "global_step": 255440, "epoch": 2111} {"train_loss": -41.70998764038086, "global_step": 255441, "epoch": 2111} {"train_loss": -42.0866813659668, "global_step": 255442, "epoch": 2111} {"train_loss": -42.6701545715332, "global_step": 255443, "epoch": 2111} {"train_loss": -41.9099235534668, "global_step": 255444, "epoch": 2111} {"train_loss": -42.06643295288086, "global_step": 255445, "epoch": 2111} {"train_loss": -42.53657913208008, "global_step": 255446, "epoch": 2111} {"train_loss": -42.348907470703125, "global_step": 255447, "epoch": 2111} {"train_loss": -41.83177185058594, "global_step": 255448, "epoch": 2111} {"train_loss": -42.27923583984375, "global_step": 255449, "epoch": 2111} {"train_loss": -42.11896896362305, "global_step": 255450, "epoch": 2111} {"train_loss": -43.35645294189453, "global_step": 255451, "epoch": 2111} {"train_loss": -42.61051559448242, "global_step": 255452, "epoch": 2111} {"train_loss": -42.377838134765625, "global_step": 255453, "epoch": 2111} {"train_loss": -43.310821533203125, "global_step": 255454, "epoch": 2111} {"train_loss": -42.45000076293945, "global_step": 255455, "epoch": 2111} {"train_loss": -42.64400100708008, "global_step": 255456, "epoch": 2111} {"train_loss": -42.64495849609375, "global_step": 255457, "epoch": 2111} {"train_loss": -42.944053649902344, "global_step": 255458, "epoch": 2111} {"train_loss": -42.5097770690918, "global_step": 255459, "epoch": 2111} {"train_loss": -42.360111236572266, "global_step": 255460, "epoch": 2111} {"train_loss": -42.5841178894043, "global_step": 255461, "epoch": 2111} {"train_loss": -42.08468246459961, "global_step": 255462, "epoch": 2111} {"train_loss": -43.526397705078125, "global_step": 255463, "epoch": 2111} {"train_loss": -43.330841064453125, "global_step": 255464, "epoch": 2111} {"train_loss": -42.49410629272461, "global_step": 255465, "epoch": 2111} {"train_loss": -42.90779495239258, "global_step": 255466, "epoch": 2111} {"train_loss": -42.8072624206543, "global_step": 255467, "epoch": 2111} {"train_loss": -43.63029861450195, "global_step": 255468, "epoch": 2111} {"train_loss": -43.18587112426758, "global_step": 255469, "epoch": 2111} {"train_loss": -43.2515754699707, "global_step": 255470, "epoch": 2111} {"train_loss": -43.600093841552734, "global_step": 255471, "epoch": 2111} {"train_loss": -43.741641998291016, "global_step": 255472, "epoch": 2111} {"train_loss": -43.2412223815918, "global_step": 255473, "epoch": 2111} {"train_loss": -42.65419387817383, "global_step": 255474, "epoch": 2111} {"train_loss": -43.13209533691406, "global_step": 255475, "epoch": 2111} {"train_loss": -42.80556106567383, "global_step": 255476, "epoch": 2111} {"train_loss": -43.12950134277344, "global_step": 255477, "epoch": 2111} {"train_loss": -42.74996566772461, "global_step": 255478, "epoch": 2111} {"train_loss": -43.38962936401367, "global_step": 255479, "epoch": 2111} {"train_loss": -42.9482421875, "global_step": 255480, "epoch": 2111} {"train_loss": -42.967533111572266, "global_step": 255481, "epoch": 2111} {"train_loss": -43.1019401550293, "global_step": 255482, "epoch": 2111} {"train_loss": -42.439998626708984, "global_step": 255483, "epoch": 2111} {"train_loss": -42.705745697021484, "global_step": 255484, "epoch": 2111} {"train_loss": -43.27901077270508, "global_step": 255485, "epoch": 2111} {"train_loss": -42.482940673828125, "global_step": 255486, "epoch": 2111} {"train_loss": -41.358154296875, "global_step": 255487, "epoch": 2111} {"train_loss": -40.112972259521484, "global_step": 255488, "epoch": 2111} {"train_loss": -41.82954025268555, "global_step": 255489, "epoch": 2111} {"train_loss": -43.47575759887695, "global_step": 255490, "epoch": 2111} {"train_loss": -43.49446487426758, "global_step": 255491, "epoch": 2111} {"train_loss": -41.11900329589844, "global_step": 255492, "epoch": 2111} {"train_loss": -40.22330856323242, "global_step": 255493, "epoch": 2111} {"train_loss": -41.5821533203125, "global_step": 255494, "epoch": 2111} {"train_loss": -42.91025161743164, "global_step": 255495, "epoch": 2111} {"train_loss": -42.8367805480957, "global_step": 255496, "epoch": 2111} {"train_loss": -41.42873764038086, "global_step": 255497, "epoch": 2111} {"train_loss": -42.33675003051758, "global_step": 255498, "epoch": 2111} {"train_loss": -43.09285354614258, "global_step": 255499, "epoch": 2111} {"train_loss": -42.361427307128906, "global_step": 255500, "epoch": 2111} {"train_loss": -42.70728302001953, "global_step": 255501, "epoch": 2111} {"train_loss": -41.41633224487305, "global_step": 255502, "epoch": 2111} {"train_loss": -41.54779052734375, "global_step": 255503, "epoch": 2111} {"train_loss": -42.54055404663086, "global_step": 255504, "epoch": 2111} {"train_loss": -42.33045959472656, "global_step": 255505, "epoch": 2111} {"train_loss": -42.67108154296875, "global_step": 255506, "epoch": 2111} {"train_loss": -42.633296966552734, "global_step": 255507, "epoch": 2111} {"train_loss": -41.783321380615234, "global_step": 255508, "epoch": 2111} {"train_loss": -41.72980880737305, "global_step": 255509, "epoch": 2111} {"train_loss": -41.32517623901367, "global_step": 255510, "epoch": 2111} {"train_loss": -41.75187301635742, "global_step": 255511, "epoch": 2111} {"train_loss": -41.274200439453125, "global_step": 255512, "epoch": 2111} {"train_loss": -41.896339416503906, "global_step": 255513, "epoch": 2111} {"train_loss": -42.235511779785156, "global_step": 255514, "epoch": 2111} {"train_loss": -40.39595413208008, "global_step": 255515, "epoch": 2111} {"train_loss": -41.97457504272461, "global_step": 255516, "epoch": 2111} {"train_loss": -42.26406478881836, "global_step": 255517, "epoch": 2111} {"train_loss": -41.53031921386719, "global_step": 255518, "epoch": 2111} {"train_loss": -42.14730453491211, "global_step": 255519, "epoch": 2111} {"train_loss": -41.65327072143555, "global_step": 255520, "epoch": 2111} {"train_loss": -40.50257110595703, "global_step": 255521, "epoch": 2111} {"train_loss": -42.08088684082031, "global_step": 255522, "epoch": 2111} {"train_loss": -41.26662063598633, "global_step": 255523, "epoch": 2111} {"train_loss": -41.68351364135742, "global_step": 255524, "epoch": 2111} {"train_loss": -41.141883850097656, "global_step": 255525, "epoch": 2111} {"train_loss": -39.691505432128906, "global_step": 255526, "epoch": 2111} {"train_loss": -40.79505157470703, "global_step": 255527, "epoch": 2111} {"train_loss": -41.391788482666016, "global_step": 255528, "epoch": 2111} {"train_loss": -41.84785079956055, "global_step": 255529, "epoch": 2111} {"train_loss": -42.46314239501953, "global_step": 255530, "epoch": 2111} {"train_loss": -40.75223922729492, "global_step": 255531, "epoch": 2111} {"train_loss": -40.0174446105957, "global_step": 255532, "epoch": 2111} {"train_loss": -42.48917007446289, "global_step": 255533, "epoch": 2111} {"train_loss": -40.87788772583008, "global_step": 255534, "epoch": 2111} {"train_loss": -40.22275161743164, "global_step": 255535, "epoch": 2111} {"train_loss": -42.384952545166016, "global_step": 255536, "epoch": 2111} {"train_loss": -39.211029052734375, "global_step": 255537, "epoch": 2111} {"train_loss": -40.013492584228516, "global_step": 255538, "epoch": 2111} {"train_loss": -41.32810592651367, "global_step": 255539, "epoch": 2111} {"train_loss": -40.07356643676758, "global_step": 255540, "epoch": 2111} {"train_loss": -41.572750091552734, "global_step": 255541, "epoch": 2111} {"train_loss": -39.19547653198242, "global_step": 255542, "epoch": 2111} {"train_loss": -41.74042892456055, "global_step": 255543, "epoch": 2111} {"train_loss": -39.45722579956055, "global_step": 255544, "epoch": 2111} {"train_loss": -40.99300003051758, "global_step": 255545, "epoch": 2111} {"train_loss": -39.303123474121094, "global_step": 255546, "epoch": 2111} {"train_loss": -41.23177719116211, "global_step": 255547, "epoch": 2111} {"train_loss": -39.479637145996094, "global_step": 255548, "epoch": 2111} {"train_loss": -40.878482818603516, "global_step": 255549, "epoch": 2111} {"train_loss": -39.03825378417969, "global_step": 255550, "epoch": 2111} {"train_loss": -41.93627223495609, "global_step": 255551, "epoch": 2111, "val_loss": 2734720.25} {"train_loss": -38.01089096069336, "global_step": 255552, "epoch": 2112} {"train_loss": -41.62981414794922, "global_step": 255553, "epoch": 2112} {"train_loss": -38.93119430541992, "global_step": 255554, "epoch": 2112} {"train_loss": -40.15888595581055, "global_step": 255555, "epoch": 2112} {"train_loss": -39.98487091064453, "global_step": 255556, "epoch": 2112} {"train_loss": -37.550655364990234, "global_step": 255557, "epoch": 2112} {"train_loss": -41.621742248535156, "global_step": 255558, "epoch": 2112} {"train_loss": -39.051055908203125, "global_step": 255559, "epoch": 2112} {"train_loss": -40.852203369140625, "global_step": 255560, "epoch": 2112} {"train_loss": -40.0609245300293, "global_step": 255561, "epoch": 2112} {"train_loss": -39.339149475097656, "global_step": 255562, "epoch": 2112} {"train_loss": -42.390689849853516, "global_step": 255563, "epoch": 2112} {"train_loss": -39.91633987426758, "global_step": 255564, "epoch": 2112} {"train_loss": -43.03823471069336, "global_step": 255565, "epoch": 2112} {"train_loss": -41.30631637573242, "global_step": 255566, "epoch": 2112} {"train_loss": -41.74892044067383, "global_step": 255567, "epoch": 2112} {"train_loss": -42.25873565673828, "global_step": 255568, "epoch": 2112} {"train_loss": -41.86549758911133, "global_step": 255569, "epoch": 2112} {"train_loss": -42.23555374145508, "global_step": 255570, "epoch": 2112} {"train_loss": -42.628353118896484, "global_step": 255571, "epoch": 2112} {"train_loss": -42.47713851928711, "global_step": 255572, "epoch": 2112} {"train_loss": -41.94342041015625, "global_step": 255573, "epoch": 2112} {"train_loss": -41.524635314941406, "global_step": 255574, "epoch": 2112} {"train_loss": -42.55554962158203, "global_step": 255575, "epoch": 2112} {"train_loss": -42.1604118347168, "global_step": 255576, "epoch": 2112} {"train_loss": -42.03521728515625, "global_step": 255577, "epoch": 2112} {"train_loss": -42.215789794921875, "global_step": 255578, "epoch": 2112} {"train_loss": -42.13918685913086, "global_step": 255579, "epoch": 2112} {"train_loss": -43.01530838012695, "global_step": 255580, "epoch": 2112} {"train_loss": -42.732398986816406, "global_step": 255581, "epoch": 2112} {"train_loss": -42.57902145385742, "global_step": 255582, "epoch": 2112} {"train_loss": -42.20654296875, "global_step": 255583, "epoch": 2112} {"train_loss": -42.62876510620117, "global_step": 255584, "epoch": 2112} {"train_loss": -42.58509063720703, "global_step": 255585, "epoch": 2112} {"train_loss": -42.619747161865234, "global_step": 255586, "epoch": 2112} {"train_loss": -42.99628448486328, "global_step": 255587, "epoch": 2112} {"train_loss": -42.790679931640625, "global_step": 255588, "epoch": 2112} {"train_loss": -43.07727813720703, "global_step": 255589, "epoch": 2112} {"train_loss": -43.303157806396484, "global_step": 255590, "epoch": 2112} {"train_loss": -42.66233444213867, "global_step": 255591, "epoch": 2112} {"train_loss": -42.113582611083984, "global_step": 255592, "epoch": 2112} {"train_loss": -42.86490249633789, "global_step": 255593, "epoch": 2112} {"train_loss": -42.710079193115234, "global_step": 255594, "epoch": 2112} {"train_loss": -42.48330307006836, "global_step": 255595, "epoch": 2112} {"train_loss": -42.996307373046875, "global_step": 255596, "epoch": 2112} {"train_loss": -41.641963958740234, "global_step": 255597, "epoch": 2112} {"train_loss": -42.92218780517578, "global_step": 255598, "epoch": 2112} {"train_loss": -42.433284759521484, "global_step": 255599, "epoch": 2112} {"train_loss": -42.561439514160156, "global_step": 255600, "epoch": 2112} {"train_loss": -42.823211669921875, "global_step": 255601, "epoch": 2112} {"train_loss": -42.648372650146484, "global_step": 255602, "epoch": 2112} {"train_loss": -43.33246612548828, "global_step": 255603, "epoch": 2112} {"train_loss": -42.79330062866211, "global_step": 255604, "epoch": 2112} {"train_loss": -43.09893798828125, "global_step": 255605, "epoch": 2112} {"train_loss": -42.29859161376953, "global_step": 255606, "epoch": 2112} {"train_loss": -42.61040115356445, "global_step": 255607, "epoch": 2112} {"train_loss": -43.04864501953125, "global_step": 255608, "epoch": 2112} {"train_loss": -42.96799850463867, "global_step": 255609, "epoch": 2112} {"train_loss": -42.84235382080078, "global_step": 255610, "epoch": 2112} {"train_loss": -42.704410552978516, "global_step": 255611, "epoch": 2112} {"train_loss": -43.021484375, "global_step": 255612, "epoch": 2112} {"train_loss": -42.832801818847656, "global_step": 255613, "epoch": 2112} {"train_loss": -42.85408401489258, "global_step": 255614, "epoch": 2112} {"train_loss": -43.07281494140625, "global_step": 255615, "epoch": 2112} {"train_loss": -43.02492904663086, "global_step": 255616, "epoch": 2112} {"train_loss": -42.510597229003906, "global_step": 255617, "epoch": 2112} {"train_loss": -42.6427116394043, "global_step": 255618, "epoch": 2112} {"train_loss": -43.18458557128906, "global_step": 255619, "epoch": 2112} {"train_loss": -42.95009994506836, "global_step": 255620, "epoch": 2112} {"train_loss": -42.645851135253906, "global_step": 255621, "epoch": 2112} {"train_loss": -42.06487274169922, "global_step": 255622, "epoch": 2112} {"train_loss": -41.75132369995117, "global_step": 255623, "epoch": 2112} {"train_loss": -42.75092697143555, "global_step": 255624, "epoch": 2112} {"train_loss": -42.58700942993164, "global_step": 255625, "epoch": 2112} {"train_loss": -42.53036880493164, "global_step": 255626, "epoch": 2112} {"train_loss": -42.23737716674805, "global_step": 255627, "epoch": 2112} {"train_loss": -43.01176071166992, "global_step": 255628, "epoch": 2112} {"train_loss": -42.4445915222168, "global_step": 255629, "epoch": 2112} {"train_loss": -42.8829231262207, "global_step": 255630, "epoch": 2112} {"train_loss": -42.4783935546875, "global_step": 255631, "epoch": 2112} {"train_loss": -41.230552673339844, "global_step": 255632, "epoch": 2112} {"train_loss": -38.19527053833008, "global_step": 255633, "epoch": 2112} {"train_loss": -40.024837493896484, "global_step": 255634, "epoch": 2112} {"train_loss": -41.842708587646484, "global_step": 255635, "epoch": 2112} {"train_loss": -38.527225494384766, "global_step": 255636, "epoch": 2112} {"train_loss": -41.87254333496094, "global_step": 255637, "epoch": 2112} {"train_loss": -41.32815170288086, "global_step": 255638, "epoch": 2112} {"train_loss": -39.37699508666992, "global_step": 255639, "epoch": 2112} {"train_loss": -42.51351547241211, "global_step": 255640, "epoch": 2112} {"train_loss": -38.42287063598633, "global_step": 255641, "epoch": 2112} {"train_loss": -40.93362808227539, "global_step": 255642, "epoch": 2112} {"train_loss": -39.73679733276367, "global_step": 255643, "epoch": 2112} {"train_loss": -40.64155578613281, "global_step": 255644, "epoch": 2112} {"train_loss": -41.238136291503906, "global_step": 255645, "epoch": 2112} {"train_loss": -40.60047149658203, "global_step": 255646, "epoch": 2112} {"train_loss": -40.90475082397461, "global_step": 255647, "epoch": 2112} {"train_loss": -40.79619598388672, "global_step": 255648, "epoch": 2112} {"train_loss": -39.71664810180664, "global_step": 255649, "epoch": 2112} {"train_loss": -41.80976486206055, "global_step": 255650, "epoch": 2112} {"train_loss": -39.952091217041016, "global_step": 255651, "epoch": 2112} {"train_loss": -41.88691329956055, "global_step": 255652, "epoch": 2112} {"train_loss": -41.635833740234375, "global_step": 255653, "epoch": 2112} {"train_loss": -41.82545471191406, "global_step": 255654, "epoch": 2112} {"train_loss": -41.84870147705078, "global_step": 255655, "epoch": 2112} {"train_loss": -41.75106430053711, "global_step": 255656, "epoch": 2112} {"train_loss": -42.51548385620117, "global_step": 255657, "epoch": 2112} {"train_loss": -41.7442626953125, "global_step": 255658, "epoch": 2112} {"train_loss": -42.67723083496094, "global_step": 255659, "epoch": 2112} {"train_loss": -41.6388053894043, "global_step": 255660, "epoch": 2112} {"train_loss": -42.565467834472656, "global_step": 255661, "epoch": 2112} {"train_loss": -42.78973388671875, "global_step": 255662, "epoch": 2112} {"train_loss": -41.82124710083008, "global_step": 255663, "epoch": 2112} {"train_loss": -40.73991775512695, "global_step": 255664, "epoch": 2112} {"train_loss": -42.95396041870117, "global_step": 255665, "epoch": 2112} {"train_loss": -41.3447265625, "global_step": 255666, "epoch": 2112} {"train_loss": -40.9237174987793, "global_step": 255667, "epoch": 2112} {"train_loss": -42.2811279296875, "global_step": 255668, "epoch": 2112} {"train_loss": -42.982025146484375, "global_step": 255669, "epoch": 2112} {"train_loss": -41.50343704223633, "global_step": 255670, "epoch": 2112} {"train_loss": -42.372314453125, "global_step": 255671, "epoch": 2112} {"train_loss": -41.85556005052299, "global_step": 255672, "epoch": 2112, "val_loss": 2719066.75} {"train_loss": -42.228153228759766, "global_step": 255673, "epoch": 2113} {"train_loss": -42.11002731323242, "global_step": 255674, "epoch": 2113} {"train_loss": -43.32954406738281, "global_step": 255675, "epoch": 2113} {"train_loss": -43.09237289428711, "global_step": 255676, "epoch": 2113} {"train_loss": -42.869842529296875, "global_step": 255677, "epoch": 2113} {"train_loss": -43.342281341552734, "global_step": 255678, "epoch": 2113} {"train_loss": -42.42728805541992, "global_step": 255679, "epoch": 2113} {"train_loss": -42.73153305053711, "global_step": 255680, "epoch": 2113} {"train_loss": -43.01221466064453, "global_step": 255681, "epoch": 2113} {"train_loss": -42.123291015625, "global_step": 255682, "epoch": 2113} {"train_loss": -43.384464263916016, "global_step": 255683, "epoch": 2113} {"train_loss": -42.12051010131836, "global_step": 255684, "epoch": 2113} {"train_loss": -42.49321746826172, "global_step": 255685, "epoch": 2113} {"train_loss": -43.049591064453125, "global_step": 255686, "epoch": 2113} {"train_loss": -41.88204574584961, "global_step": 255687, "epoch": 2113} {"train_loss": -42.50002670288086, "global_step": 255688, "epoch": 2113} {"train_loss": -42.97977828979492, "global_step": 255689, "epoch": 2113} {"train_loss": -42.681243896484375, "global_step": 255690, "epoch": 2113} {"train_loss": -42.97721481323242, "global_step": 255691, "epoch": 2113} {"train_loss": -43.10124588012695, "global_step": 255692, "epoch": 2113} {"train_loss": -42.633480072021484, "global_step": 255693, "epoch": 2113} {"train_loss": -42.89701461791992, "global_step": 255694, "epoch": 2113} {"train_loss": -42.650691986083984, "global_step": 255695, "epoch": 2113} {"train_loss": -43.0421028137207, "global_step": 255696, "epoch": 2113} {"train_loss": -41.88855743408203, "global_step": 255697, "epoch": 2113} {"train_loss": -43.470977783203125, "global_step": 255698, "epoch": 2113} {"train_loss": -43.40129470825195, "global_step": 255699, "epoch": 2113} {"train_loss": -42.56150436401367, "global_step": 255700, "epoch": 2113} {"train_loss": -43.115325927734375, "global_step": 255701, "epoch": 2113} {"train_loss": -42.789390563964844, "global_step": 255702, "epoch": 2113} {"train_loss": -43.205108642578125, "global_step": 255703, "epoch": 2113} {"train_loss": -43.5335693359375, "global_step": 255704, "epoch": 2113} {"train_loss": -42.972896575927734, "global_step": 255705, "epoch": 2113} {"train_loss": -43.64815902709961, "global_step": 255706, "epoch": 2113} {"train_loss": -42.86187744140625, "global_step": 255707, "epoch": 2113} {"train_loss": -42.87018966674805, "global_step": 255708, "epoch": 2113} {"train_loss": -43.7835807800293, "global_step": 255709, "epoch": 2113} {"train_loss": -42.91267013549805, "global_step": 255710, "epoch": 2113} {"train_loss": -43.2950325012207, "global_step": 255711, "epoch": 2113} {"train_loss": -43.623592376708984, "global_step": 255712, "epoch": 2113} {"train_loss": -43.23305892944336, "global_step": 255713, "epoch": 2113} {"train_loss": -43.830230712890625, "global_step": 255714, "epoch": 2113} {"train_loss": -42.92327880859375, "global_step": 255715, "epoch": 2113} {"train_loss": -43.50011444091797, "global_step": 255716, "epoch": 2113} {"train_loss": -44.12825393676758, "global_step": 255717, "epoch": 2113} {"train_loss": -43.507686614990234, "global_step": 255718, "epoch": 2113} {"train_loss": -43.26234817504883, "global_step": 255719, "epoch": 2113} {"train_loss": -43.190547943115234, "global_step": 255720, "epoch": 2113} {"train_loss": -43.569026947021484, "global_step": 255721, "epoch": 2113} {"train_loss": -43.95612716674805, "global_step": 255722, "epoch": 2113} {"train_loss": -43.308170318603516, "global_step": 255723, "epoch": 2113} {"train_loss": -43.12811279296875, "global_step": 255724, "epoch": 2113} {"train_loss": -43.74208450317383, "global_step": 255725, "epoch": 2113} {"train_loss": -43.37534713745117, "global_step": 255726, "epoch": 2113} {"train_loss": -42.88617706298828, "global_step": 255727, "epoch": 2113} {"train_loss": -43.42427062988281, "global_step": 255728, "epoch": 2113} {"train_loss": -43.318206787109375, "global_step": 255729, "epoch": 2113} {"train_loss": -43.33127975463867, "global_step": 255730, "epoch": 2113} {"train_loss": -42.73812484741211, "global_step": 255731, "epoch": 2113} {"train_loss": -42.67660140991211, "global_step": 255732, "epoch": 2113} {"train_loss": -42.40599822998047, "global_step": 255733, "epoch": 2113} {"train_loss": -42.75669479370117, "global_step": 255734, "epoch": 2113} {"train_loss": -43.28437423706055, "global_step": 255735, "epoch": 2113} {"train_loss": -42.96316909790039, "global_step": 255736, "epoch": 2113} {"train_loss": -43.08158493041992, "global_step": 255737, "epoch": 2113} {"train_loss": -42.64474868774414, "global_step": 255738, "epoch": 2113} {"train_loss": -43.271949768066406, "global_step": 255739, "epoch": 2113} {"train_loss": -43.21577835083008, "global_step": 255740, "epoch": 2113} {"train_loss": -42.37740707397461, "global_step": 255741, "epoch": 2113} {"train_loss": -42.830543518066406, "global_step": 255742, "epoch": 2113} {"train_loss": -43.34440994262695, "global_step": 255743, "epoch": 2113} {"train_loss": -42.688045501708984, "global_step": 255744, "epoch": 2113} {"train_loss": -42.65761947631836, "global_step": 255745, "epoch": 2113} {"train_loss": -42.9726676940918, "global_step": 255746, "epoch": 2113} {"train_loss": -43.51859664916992, "global_step": 255747, "epoch": 2113} {"train_loss": -43.7401123046875, "global_step": 255748, "epoch": 2113} {"train_loss": -43.04848098754883, "global_step": 255749, "epoch": 2113} {"train_loss": -43.50223922729492, "global_step": 255750, "epoch": 2113} {"train_loss": -43.31242752075195, "global_step": 255751, "epoch": 2113} {"train_loss": -42.98046112060547, "global_step": 255752, "epoch": 2113} {"train_loss": -42.0457649230957, "global_step": 255753, "epoch": 2113} {"train_loss": -43.15751266479492, "global_step": 255754, "epoch": 2113} {"train_loss": -42.492897033691406, "global_step": 255755, "epoch": 2113} {"train_loss": -42.55510330200195, "global_step": 255756, "epoch": 2113} {"train_loss": -42.94567108154297, "global_step": 255757, "epoch": 2113} {"train_loss": -42.38077926635742, "global_step": 255758, "epoch": 2113} {"train_loss": -40.82794952392578, "global_step": 255759, "epoch": 2113} {"train_loss": -40.62906265258789, "global_step": 255760, "epoch": 2113} {"train_loss": -39.51685333251953, "global_step": 255761, "epoch": 2113} {"train_loss": -42.59973907470703, "global_step": 255762, "epoch": 2113} {"train_loss": -40.8165397644043, "global_step": 255763, "epoch": 2113} {"train_loss": -40.69426345825195, "global_step": 255764, "epoch": 2113} {"train_loss": -42.74283981323242, "global_step": 255765, "epoch": 2113} {"train_loss": -40.08784103393555, "global_step": 255766, "epoch": 2113} {"train_loss": -42.340824127197266, "global_step": 255767, "epoch": 2113} {"train_loss": -41.79100799560547, "global_step": 255768, "epoch": 2113} {"train_loss": -42.22123336791992, "global_step": 255769, "epoch": 2113} {"train_loss": -42.1427001953125, "global_step": 255770, "epoch": 2113} {"train_loss": -41.122642517089844, "global_step": 255771, "epoch": 2113} {"train_loss": -41.82430648803711, "global_step": 255772, "epoch": 2113} {"train_loss": -40.78740310668945, "global_step": 255773, "epoch": 2113} {"train_loss": -39.7786750793457, "global_step": 255774, "epoch": 2113} {"train_loss": -42.10039138793945, "global_step": 255775, "epoch": 2113} {"train_loss": -40.16704559326172, "global_step": 255776, "epoch": 2113} {"train_loss": -42.38214874267578, "global_step": 255777, "epoch": 2113} {"train_loss": -39.656898498535156, "global_step": 255778, "epoch": 2113} {"train_loss": -42.16675567626953, "global_step": 255779, "epoch": 2113} {"train_loss": -40.97941207885742, "global_step": 255780, "epoch": 2113} {"train_loss": -41.77510070800781, "global_step": 255781, "epoch": 2113} {"train_loss": -41.084266662597656, "global_step": 255782, "epoch": 2113} {"train_loss": -41.386474609375, "global_step": 255783, "epoch": 2113} {"train_loss": -41.798213958740234, "global_step": 255784, "epoch": 2113} {"train_loss": -42.52590560913086, "global_step": 255785, "epoch": 2113} {"train_loss": -42.453819274902344, "global_step": 255786, "epoch": 2113} {"train_loss": -41.316070556640625, "global_step": 255787, "epoch": 2113} {"train_loss": -43.15281295776367, "global_step": 255788, "epoch": 2113} {"train_loss": -42.10150146484375, "global_step": 255789, "epoch": 2113} {"train_loss": -42.71102523803711, "global_step": 255790, "epoch": 2113} {"train_loss": -43.09331130981445, "global_step": 255791, "epoch": 2113} {"train_loss": -42.269134521484375, "global_step": 255792, "epoch": 2113} {"train_loss": -42.594176111142495, "global_step": 255793, "epoch": 2113, "val_loss": 2682462.5} {"train_loss": -42.658992767333984, "global_step": 255794, "epoch": 2114} {"train_loss": -43.090511322021484, "global_step": 255795, "epoch": 2114} {"train_loss": -41.47517395019531, "global_step": 255796, "epoch": 2114} {"train_loss": -41.971588134765625, "global_step": 255797, "epoch": 2114} {"train_loss": -42.638267517089844, "global_step": 255798, "epoch": 2114} {"train_loss": -42.65247344970703, "global_step": 255799, "epoch": 2114} {"train_loss": -42.611629486083984, "global_step": 255800, "epoch": 2114} {"train_loss": -42.12907791137695, "global_step": 255801, "epoch": 2114} {"train_loss": -42.48637390136719, "global_step": 255802, "epoch": 2114} {"train_loss": -42.31714630126953, "global_step": 255803, "epoch": 2114} {"train_loss": -42.73784637451172, "global_step": 255804, "epoch": 2114} {"train_loss": -42.56563949584961, "global_step": 255805, "epoch": 2114} {"train_loss": -41.88037109375, "global_step": 255806, "epoch": 2114} {"train_loss": -41.7799072265625, "global_step": 255807, "epoch": 2114} {"train_loss": -42.36126708984375, "global_step": 255808, "epoch": 2114} {"train_loss": -41.9820556640625, "global_step": 255809, "epoch": 2114} {"train_loss": -42.431236267089844, "global_step": 255810, "epoch": 2114} {"train_loss": -41.398597717285156, "global_step": 255811, "epoch": 2114} {"train_loss": -42.650081634521484, "global_step": 255812, "epoch": 2114} {"train_loss": -42.65067672729492, "global_step": 255813, "epoch": 2114} {"train_loss": -42.402008056640625, "global_step": 255814, "epoch": 2114} {"train_loss": -41.97021484375, "global_step": 255815, "epoch": 2114} {"train_loss": -42.792030334472656, "global_step": 255816, "epoch": 2114} {"train_loss": -42.21379089355469, "global_step": 255817, "epoch": 2114} {"train_loss": -42.17094421386719, "global_step": 255818, "epoch": 2114} {"train_loss": -42.61100387573242, "global_step": 255819, "epoch": 2114} {"train_loss": -42.29252243041992, "global_step": 255820, "epoch": 2114} {"train_loss": -43.12184143066406, "global_step": 255821, "epoch": 2114} {"train_loss": -42.16408920288086, "global_step": 255822, "epoch": 2114} {"train_loss": -42.72726058959961, "global_step": 255823, "epoch": 2114} {"train_loss": -42.053279876708984, "global_step": 255824, "epoch": 2114} {"train_loss": -42.50973129272461, "global_step": 255825, "epoch": 2114} {"train_loss": -42.33399200439453, "global_step": 255826, "epoch": 2114} {"train_loss": -42.75859451293945, "global_step": 255827, "epoch": 2114} {"train_loss": -42.74066925048828, "global_step": 255828, "epoch": 2114} {"train_loss": -42.943145751953125, "global_step": 255829, "epoch": 2114} {"train_loss": -42.482234954833984, "global_step": 255830, "epoch": 2114} {"train_loss": -42.317928314208984, "global_step": 255831, "epoch": 2114} {"train_loss": -43.191410064697266, "global_step": 255832, "epoch": 2114} {"train_loss": -43.088966369628906, "global_step": 255833, "epoch": 2114} {"train_loss": -42.452308654785156, "global_step": 255834, "epoch": 2114} {"train_loss": -43.351200103759766, "global_step": 255835, "epoch": 2114} {"train_loss": -42.844276428222656, "global_step": 255836, "epoch": 2114} {"train_loss": -42.622657775878906, "global_step": 255837, "epoch": 2114} {"train_loss": -43.346553802490234, "global_step": 255838, "epoch": 2114} {"train_loss": -42.71329879760742, "global_step": 255839, "epoch": 2114} {"train_loss": -42.98511505126953, "global_step": 255840, "epoch": 2114} {"train_loss": -42.77383041381836, "global_step": 255841, "epoch": 2114} {"train_loss": -42.865352630615234, "global_step": 255842, "epoch": 2114} {"train_loss": -42.9729118347168, "global_step": 255843, "epoch": 2114} {"train_loss": -42.86111068725586, "global_step": 255844, "epoch": 2114} {"train_loss": -42.7895622253418, "global_step": 255845, "epoch": 2114} {"train_loss": -42.96333694458008, "global_step": 255846, "epoch": 2114} {"train_loss": -43.2779655456543, "global_step": 255847, "epoch": 2114} {"train_loss": -42.5416145324707, "global_step": 255848, "epoch": 2114} {"train_loss": -43.763851165771484, "global_step": 255849, "epoch": 2114} {"train_loss": -43.22933578491211, "global_step": 255850, "epoch": 2114} {"train_loss": -41.42402267456055, "global_step": 255851, "epoch": 2114} {"train_loss": -42.652069091796875, "global_step": 255852, "epoch": 2114} {"train_loss": -43.70762252807617, "global_step": 255853, "epoch": 2114} {"train_loss": -42.250545501708984, "global_step": 255854, "epoch": 2114} {"train_loss": -40.904571533203125, "global_step": 255855, "epoch": 2114} {"train_loss": -43.17705154418945, "global_step": 255856, "epoch": 2114} {"train_loss": -43.31416702270508, "global_step": 255857, "epoch": 2114} {"train_loss": -42.03397750854492, "global_step": 255858, "epoch": 2114} {"train_loss": -43.024658203125, "global_step": 255859, "epoch": 2114} {"train_loss": -43.531002044677734, "global_step": 255860, "epoch": 2114} {"train_loss": -41.37208938598633, "global_step": 255861, "epoch": 2114} {"train_loss": -43.249908447265625, "global_step": 255862, "epoch": 2114} {"train_loss": -41.55830001831055, "global_step": 255863, "epoch": 2114} {"train_loss": -38.70403289794922, "global_step": 255864, "epoch": 2114} {"train_loss": -42.788856506347656, "global_step": 255865, "epoch": 2114} {"train_loss": -41.329383850097656, "global_step": 255866, "epoch": 2114} {"train_loss": -40.93428421020508, "global_step": 255867, "epoch": 2114} {"train_loss": -42.9441032409668, "global_step": 255868, "epoch": 2114} {"train_loss": -41.16840362548828, "global_step": 255869, "epoch": 2114} {"train_loss": -41.711952209472656, "global_step": 255870, "epoch": 2114} {"train_loss": -41.899349212646484, "global_step": 255871, "epoch": 2114} {"train_loss": -42.76416015625, "global_step": 255872, "epoch": 2114} {"train_loss": -43.10578536987305, "global_step": 255873, "epoch": 2114} {"train_loss": -40.75716781616211, "global_step": 255874, "epoch": 2114} {"train_loss": -43.08057403564453, "global_step": 255875, "epoch": 2114} {"train_loss": -43.00775909423828, "global_step": 255876, "epoch": 2114} {"train_loss": -41.28533935546875, "global_step": 255877, "epoch": 2114} {"train_loss": -43.21887969970703, "global_step": 255878, "epoch": 2114} {"train_loss": -43.33243942260742, "global_step": 255879, "epoch": 2114} {"train_loss": -41.54298400878906, "global_step": 255880, "epoch": 2114} {"train_loss": -42.38557815551758, "global_step": 255881, "epoch": 2114} {"train_loss": -43.34433364868164, "global_step": 255882, "epoch": 2114} {"train_loss": -43.193115234375, "global_step": 255883, "epoch": 2114} {"train_loss": -43.06521224975586, "global_step": 255884, "epoch": 2114} {"train_loss": -43.15962219238281, "global_step": 255885, "epoch": 2114} {"train_loss": -42.71602249145508, "global_step": 255886, "epoch": 2114} {"train_loss": -43.09630584716797, "global_step": 255887, "epoch": 2114} {"train_loss": -43.7528190612793, "global_step": 255888, "epoch": 2114} {"train_loss": -43.461307525634766, "global_step": 255889, "epoch": 2114} {"train_loss": -43.439208984375, "global_step": 255890, "epoch": 2114} {"train_loss": -43.7331428527832, "global_step": 255891, "epoch": 2114} {"train_loss": -43.99504470825195, "global_step": 255892, "epoch": 2114} {"train_loss": -43.86265182495117, "global_step": 255893, "epoch": 2114} {"train_loss": -43.673912048339844, "global_step": 255894, "epoch": 2114} {"train_loss": -43.85210418701172, "global_step": 255895, "epoch": 2114} {"train_loss": -43.14132308959961, "global_step": 255896, "epoch": 2114} {"train_loss": -43.8166389465332, "global_step": 255897, "epoch": 2114} {"train_loss": -43.62553787231445, "global_step": 255898, "epoch": 2114} {"train_loss": -43.91361999511719, "global_step": 255899, "epoch": 2114} {"train_loss": -44.26435470581055, "global_step": 255900, "epoch": 2114} {"train_loss": -43.77307891845703, "global_step": 255901, "epoch": 2114} {"train_loss": -43.587913513183594, "global_step": 255902, "epoch": 2114} {"train_loss": -44.02817153930664, "global_step": 255903, "epoch": 2114} {"train_loss": -42.781654357910156, "global_step": 255904, "epoch": 2114} {"train_loss": -43.9852294921875, "global_step": 255905, "epoch": 2114} {"train_loss": -43.969661712646484, "global_step": 255906, "epoch": 2114} {"train_loss": -43.82408905029297, "global_step": 255907, "epoch": 2114} {"train_loss": -43.69698715209961, "global_step": 255908, "epoch": 2114} {"train_loss": -43.5440788269043, "global_step": 255909, "epoch": 2114} {"train_loss": -43.07567596435547, "global_step": 255910, "epoch": 2114} {"train_loss": -42.86788558959961, "global_step": 255911, "epoch": 2114} {"train_loss": -43.9584846496582, "global_step": 255912, "epoch": 2114} {"train_loss": -44.14216995239258, "global_step": 255913, "epoch": 2114} {"train_loss": -42.75592570659543, "global_step": 255914, "epoch": 2114, "val_loss": 2617990.25} {"train_loss": -43.93482208251953, "global_step": 255915, "epoch": 2115} {"train_loss": -42.48455810546875, "global_step": 255916, "epoch": 2115} {"train_loss": -43.79851150512695, "global_step": 255917, "epoch": 2115} {"train_loss": -43.19021224975586, "global_step": 255918, "epoch": 2115} {"train_loss": -43.45523452758789, "global_step": 255919, "epoch": 2115} {"train_loss": -44.06537628173828, "global_step": 255920, "epoch": 2115} {"train_loss": -42.499107360839844, "global_step": 255921, "epoch": 2115} {"train_loss": -43.002723693847656, "global_step": 255922, "epoch": 2115} {"train_loss": -43.59336471557617, "global_step": 255923, "epoch": 2115} {"train_loss": -43.674739837646484, "global_step": 255924, "epoch": 2115} {"train_loss": -42.5200080871582, "global_step": 255925, "epoch": 2115} {"train_loss": -41.33732223510742, "global_step": 255926, "epoch": 2115} {"train_loss": -42.751182556152344, "global_step": 255927, "epoch": 2115} {"train_loss": -43.94843292236328, "global_step": 255928, "epoch": 2115} {"train_loss": -43.85451126098633, "global_step": 255929, "epoch": 2115} {"train_loss": -44.172882080078125, "global_step": 255930, "epoch": 2115} {"train_loss": -43.9752197265625, "global_step": 255931, "epoch": 2115} {"train_loss": -43.594669342041016, "global_step": 255932, "epoch": 2115} {"train_loss": -43.77470016479492, "global_step": 255933, "epoch": 2115} {"train_loss": -43.837154388427734, "global_step": 255934, "epoch": 2115} {"train_loss": -43.89363479614258, "global_step": 255935, "epoch": 2115} {"train_loss": -43.19708251953125, "global_step": 255936, "epoch": 2115} {"train_loss": -43.107730865478516, "global_step": 255937, "epoch": 2115} {"train_loss": -43.466224670410156, "global_step": 255938, "epoch": 2115} {"train_loss": -43.55243682861328, "global_step": 255939, "epoch": 2115} {"train_loss": -42.99251174926758, "global_step": 255940, "epoch": 2115} {"train_loss": -43.72258377075195, "global_step": 255941, "epoch": 2115} {"train_loss": -43.70325469970703, "global_step": 255942, "epoch": 2115} {"train_loss": -42.288265228271484, "global_step": 255943, "epoch": 2115} {"train_loss": -42.836280822753906, "global_step": 255944, "epoch": 2115} {"train_loss": -42.29924392700195, "global_step": 255945, "epoch": 2115} {"train_loss": -41.32442855834961, "global_step": 255946, "epoch": 2115} {"train_loss": -42.319766998291016, "global_step": 255947, "epoch": 2115} {"train_loss": -41.65985107421875, "global_step": 255948, "epoch": 2115} {"train_loss": -42.870601654052734, "global_step": 255949, "epoch": 2115} {"train_loss": -41.62423324584961, "global_step": 255950, "epoch": 2115} {"train_loss": -41.507179260253906, "global_step": 255951, "epoch": 2115} {"train_loss": -42.82876205444336, "global_step": 255952, "epoch": 2115} {"train_loss": -41.587310791015625, "global_step": 255953, "epoch": 2115} {"train_loss": -42.730587005615234, "global_step": 255954, "epoch": 2115} {"train_loss": -43.193477630615234, "global_step": 255955, "epoch": 2115} {"train_loss": -40.613582611083984, "global_step": 255956, "epoch": 2115} {"train_loss": -41.8924446105957, "global_step": 255957, "epoch": 2115} {"train_loss": -42.53727722167969, "global_step": 255958, "epoch": 2115} {"train_loss": -42.04331588745117, "global_step": 255959, "epoch": 2115} {"train_loss": -42.5534782409668, "global_step": 255960, "epoch": 2115} {"train_loss": -43.278839111328125, "global_step": 255961, "epoch": 2115} {"train_loss": -42.887874603271484, "global_step": 255962, "epoch": 2115} {"train_loss": -42.78776550292969, "global_step": 255963, "epoch": 2115} {"train_loss": -43.26461410522461, "global_step": 255964, "epoch": 2115} {"train_loss": -42.49504470825195, "global_step": 255965, "epoch": 2115} {"train_loss": -42.54743576049805, "global_step": 255966, "epoch": 2115} {"train_loss": -43.24967956542969, "global_step": 255967, "epoch": 2115} {"train_loss": -42.55035400390625, "global_step": 255968, "epoch": 2115} {"train_loss": -42.6588249206543, "global_step": 255969, "epoch": 2115} {"train_loss": -42.76667404174805, "global_step": 255970, "epoch": 2115} {"train_loss": -42.78385543823242, "global_step": 255971, "epoch": 2115} {"train_loss": -44.08907699584961, "global_step": 255972, "epoch": 2115} {"train_loss": -43.42135238647461, "global_step": 255973, "epoch": 2115} {"train_loss": -43.64976119995117, "global_step": 255974, "epoch": 2115} {"train_loss": -42.37178039550781, "global_step": 255975, "epoch": 2115} {"train_loss": -42.3029670715332, "global_step": 255976, "epoch": 2115} {"train_loss": -43.080257415771484, "global_step": 255977, "epoch": 2115} {"train_loss": -42.581809997558594, "global_step": 255978, "epoch": 2115} {"train_loss": -42.51406478881836, "global_step": 255979, "epoch": 2115} {"train_loss": -41.24976348876953, "global_step": 255980, "epoch": 2115} {"train_loss": -41.640071868896484, "global_step": 255981, "epoch": 2115} {"train_loss": -42.07625961303711, "global_step": 255982, "epoch": 2115} {"train_loss": -43.079383850097656, "global_step": 255983, "epoch": 2115} {"train_loss": -42.70417022705078, "global_step": 255984, "epoch": 2115} {"train_loss": -40.9347038269043, "global_step": 255985, "epoch": 2115} {"train_loss": -40.94273376464844, "global_step": 255986, "epoch": 2115} {"train_loss": -43.541961669921875, "global_step": 255987, "epoch": 2115} {"train_loss": -41.99420928955078, "global_step": 255988, "epoch": 2115} {"train_loss": -40.92136764526367, "global_step": 255989, "epoch": 2115} {"train_loss": -42.458839416503906, "global_step": 255990, "epoch": 2115} {"train_loss": -42.69172286987305, "global_step": 255991, "epoch": 2115} {"train_loss": -43.19413375854492, "global_step": 255992, "epoch": 2115} {"train_loss": -41.98197555541992, "global_step": 255993, "epoch": 2115} {"train_loss": -42.661190032958984, "global_step": 255994, "epoch": 2115} {"train_loss": -42.68850326538086, "global_step": 255995, "epoch": 2115} {"train_loss": -42.27900695800781, "global_step": 255996, "epoch": 2115} {"train_loss": -41.54878616333008, "global_step": 255997, "epoch": 2115} {"train_loss": -43.02125549316406, "global_step": 255998, "epoch": 2115} {"train_loss": -42.6699333190918, "global_step": 255999, "epoch": 2115} {"train_loss": -42.0385856628418, "global_step": 256000, "epoch": 2115} {"train_loss": -43.217647552490234, "global_step": 256001, "epoch": 2115} {"train_loss": -40.245628356933594, "global_step": 256002, "epoch": 2115} {"train_loss": -41.607967376708984, "global_step": 256003, "epoch": 2115} {"train_loss": -41.61727523803711, "global_step": 256004, "epoch": 2115} {"train_loss": -41.436378479003906, "global_step": 256005, "epoch": 2115} {"train_loss": -42.70512771606445, "global_step": 256006, "epoch": 2115} {"train_loss": -41.708858489990234, "global_step": 256007, "epoch": 2115} {"train_loss": -40.446163177490234, "global_step": 256008, "epoch": 2115} {"train_loss": -42.62681198120117, "global_step": 256009, "epoch": 2115} {"train_loss": -40.08814239501953, "global_step": 256010, "epoch": 2115} {"train_loss": -42.61949157714844, "global_step": 256011, "epoch": 2115} {"train_loss": -40.57344055175781, "global_step": 256012, "epoch": 2115} {"train_loss": -42.18455505371094, "global_step": 256013, "epoch": 2115} {"train_loss": -41.847713470458984, "global_step": 256014, "epoch": 2115} {"train_loss": -42.81093978881836, "global_step": 256015, "epoch": 2115} {"train_loss": -41.347904205322266, "global_step": 256016, "epoch": 2115} {"train_loss": -42.237640380859375, "global_step": 256017, "epoch": 2115} {"train_loss": -42.704524993896484, "global_step": 256018, "epoch": 2115} {"train_loss": -42.88124465942383, "global_step": 256019, "epoch": 2115} {"train_loss": -42.7501220703125, "global_step": 256020, "epoch": 2115} {"train_loss": -42.98849105834961, "global_step": 256021, "epoch": 2115} {"train_loss": -42.30765914916992, "global_step": 256022, "epoch": 2115} {"train_loss": -42.609127044677734, "global_step": 256023, "epoch": 2115} {"train_loss": -42.79090118408203, "global_step": 256024, "epoch": 2115} {"train_loss": -42.81233215332031, "global_step": 256025, "epoch": 2115} {"train_loss": -43.08730697631836, "global_step": 256026, "epoch": 2115} {"train_loss": -42.78693771362305, "global_step": 256027, "epoch": 2115} {"train_loss": -42.288631439208984, "global_step": 256028, "epoch": 2115} {"train_loss": -42.18098831176758, "global_step": 256029, "epoch": 2115} {"train_loss": -43.1592903137207, "global_step": 256030, "epoch": 2115} {"train_loss": -43.37539291381836, "global_step": 256031, "epoch": 2115} {"train_loss": -43.215755462646484, "global_step": 256032, "epoch": 2115} {"train_loss": -42.972145080566406, "global_step": 256033, "epoch": 2115} {"train_loss": -42.936241149902344, "global_step": 256034, "epoch": 2115} {"train_loss": -42.611226641442165, "global_step": 256035, "epoch": 2115, "val_loss": 2707576.5} {"train_loss": -43.674495697021484, "global_step": 256036, "epoch": 2116} {"train_loss": -43.0785026550293, "global_step": 256037, "epoch": 2116} {"train_loss": -43.3621826171875, "global_step": 256038, "epoch": 2116} {"train_loss": -43.20111846923828, "global_step": 256039, "epoch": 2116} {"train_loss": -43.71602249145508, "global_step": 256040, "epoch": 2116} {"train_loss": -43.188568115234375, "global_step": 256041, "epoch": 2116} {"train_loss": -43.1103515625, "global_step": 256042, "epoch": 2116} {"train_loss": -43.20958709716797, "global_step": 256043, "epoch": 2116} {"train_loss": -43.81809997558594, "global_step": 256044, "epoch": 2116} {"train_loss": -43.15859603881836, "global_step": 256045, "epoch": 2116} {"train_loss": -43.831172943115234, "global_step": 256046, "epoch": 2116} {"train_loss": -43.223533630371094, "global_step": 256047, "epoch": 2116} {"train_loss": -42.913631439208984, "global_step": 256048, "epoch": 2116} {"train_loss": -43.46785354614258, "global_step": 256049, "epoch": 2116} {"train_loss": -43.38881301879883, "global_step": 256050, "epoch": 2116} {"train_loss": -42.6822395324707, "global_step": 256051, "epoch": 2116} {"train_loss": -42.0362434387207, "global_step": 256052, "epoch": 2116} {"train_loss": -43.164886474609375, "global_step": 256053, "epoch": 2116} {"train_loss": -42.382137298583984, "global_step": 256054, "epoch": 2116} {"train_loss": -43.837337493896484, "global_step": 256055, "epoch": 2116} {"train_loss": -41.5152702331543, "global_step": 256056, "epoch": 2116} {"train_loss": -42.40674591064453, "global_step": 256057, "epoch": 2116} {"train_loss": -43.31332778930664, "global_step": 256058, "epoch": 2116} {"train_loss": -43.822383880615234, "global_step": 256059, "epoch": 2116} {"train_loss": -42.60905075073242, "global_step": 256060, "epoch": 2116} {"train_loss": -43.17755889892578, "global_step": 256061, "epoch": 2116} {"train_loss": -43.678768157958984, "global_step": 256062, "epoch": 2116} {"train_loss": -43.73635482788086, "global_step": 256063, "epoch": 2116} {"train_loss": -44.02610778808594, "global_step": 256064, "epoch": 2116} {"train_loss": -43.88821029663086, "global_step": 256065, "epoch": 2116} {"train_loss": -44.1006965637207, "global_step": 256066, "epoch": 2116} {"train_loss": -43.881080627441406, "global_step": 256067, "epoch": 2116} {"train_loss": -43.661407470703125, "global_step": 256068, "epoch": 2116} {"train_loss": -43.966026306152344, "global_step": 256069, "epoch": 2116} {"train_loss": -43.5211067199707, "global_step": 256070, "epoch": 2116} {"train_loss": -43.37976837158203, "global_step": 256071, "epoch": 2116} {"train_loss": -43.607784271240234, "global_step": 256072, "epoch": 2116} {"train_loss": -44.0044059753418, "global_step": 256073, "epoch": 2116} {"train_loss": -43.57313537597656, "global_step": 256074, "epoch": 2116} {"train_loss": -44.36731719970703, "global_step": 256075, "epoch": 2116} {"train_loss": -42.922786712646484, "global_step": 256076, "epoch": 2116} {"train_loss": -42.97323989868164, "global_step": 256077, "epoch": 2116} {"train_loss": -41.654354095458984, "global_step": 256078, "epoch": 2116} {"train_loss": -37.9393310546875, "global_step": 256079, "epoch": 2116} {"train_loss": -41.687252044677734, "global_step": 256080, "epoch": 2116} {"train_loss": -37.214359283447266, "global_step": 256081, "epoch": 2116} {"train_loss": -36.362213134765625, "global_step": 256082, "epoch": 2116} {"train_loss": -35.49810028076172, "global_step": 256083, "epoch": 2116} {"train_loss": -36.42805099487305, "global_step": 256084, "epoch": 2116} {"train_loss": -35.47150421142578, "global_step": 256085, "epoch": 2116} {"train_loss": -35.87873458862305, "global_step": 256086, "epoch": 2116} {"train_loss": -35.925785064697266, "global_step": 256087, "epoch": 2116} {"train_loss": -35.57746505737305, "global_step": 256088, "epoch": 2116} {"train_loss": -35.81022262573242, "global_step": 256089, "epoch": 2116} {"train_loss": -36.238643646240234, "global_step": 256090, "epoch": 2116} {"train_loss": -36.2048225402832, "global_step": 256091, "epoch": 2116} {"train_loss": -36.672916412353516, "global_step": 256092, "epoch": 2116} {"train_loss": -37.15671920776367, "global_step": 256093, "epoch": 2116} {"train_loss": -36.614715576171875, "global_step": 256094, "epoch": 2116} {"train_loss": -37.22643280029297, "global_step": 256095, "epoch": 2116} {"train_loss": -36.71249008178711, "global_step": 256096, "epoch": 2116} {"train_loss": -36.49911117553711, "global_step": 256097, "epoch": 2116} {"train_loss": -37.530574798583984, "global_step": 256098, "epoch": 2116} {"train_loss": -37.01546859741211, "global_step": 256099, "epoch": 2116} {"train_loss": -37.20988845825195, "global_step": 256100, "epoch": 2116} {"train_loss": -37.63117980957031, "global_step": 256101, "epoch": 2116} {"train_loss": -37.89250183105469, "global_step": 256102, "epoch": 2116} {"train_loss": -37.551082611083984, "global_step": 256103, "epoch": 2116} {"train_loss": -37.270118713378906, "global_step": 256104, "epoch": 2116} {"train_loss": -37.102935791015625, "global_step": 256105, "epoch": 2116} {"train_loss": -36.71425247192383, "global_step": 256106, "epoch": 2116} {"train_loss": -37.842933654785156, "global_step": 256107, "epoch": 2116} {"train_loss": -37.215301513671875, "global_step": 256108, "epoch": 2116} {"train_loss": -38.7991943359375, "global_step": 256109, "epoch": 2116} {"train_loss": -37.442501068115234, "global_step": 256110, "epoch": 2116} {"train_loss": -37.197750091552734, "global_step": 256111, "epoch": 2116} {"train_loss": -38.226531982421875, "global_step": 256112, "epoch": 2116} {"train_loss": -37.163570404052734, "global_step": 256113, "epoch": 2116} {"train_loss": -38.58103561401367, "global_step": 256114, "epoch": 2116} {"train_loss": -36.77114486694336, "global_step": 256115, "epoch": 2116} {"train_loss": -37.546016693115234, "global_step": 256116, "epoch": 2116} {"train_loss": -36.7964973449707, "global_step": 256117, "epoch": 2116} {"train_loss": -38.58890151977539, "global_step": 256118, "epoch": 2116} {"train_loss": -37.733314514160156, "global_step": 256119, "epoch": 2116} {"train_loss": -37.57035827636719, "global_step": 256120, "epoch": 2116} {"train_loss": -38.50944137573242, "global_step": 256121, "epoch": 2116} {"train_loss": -37.96454620361328, "global_step": 256122, "epoch": 2116} {"train_loss": -38.246883392333984, "global_step": 256123, "epoch": 2116} {"train_loss": -38.25800704956055, "global_step": 256124, "epoch": 2116} {"train_loss": -38.3356819152832, "global_step": 256125, "epoch": 2116} {"train_loss": -37.788177490234375, "global_step": 256126, "epoch": 2116} {"train_loss": -38.16030502319336, "global_step": 256127, "epoch": 2116} {"train_loss": -38.47853469848633, "global_step": 256128, "epoch": 2116} {"train_loss": -39.07536697387695, "global_step": 256129, "epoch": 2116} {"train_loss": -39.1567268371582, "global_step": 256130, "epoch": 2116} {"train_loss": -38.571693420410156, "global_step": 256131, "epoch": 2116} {"train_loss": -39.22968673706055, "global_step": 256132, "epoch": 2116} {"train_loss": -39.265872955322266, "global_step": 256133, "epoch": 2116} {"train_loss": -39.47764587402344, "global_step": 256134, "epoch": 2116} {"train_loss": -38.533935546875, "global_step": 256135, "epoch": 2116} {"train_loss": -38.79165267944336, "global_step": 256136, "epoch": 2116} {"train_loss": -39.72780227661133, "global_step": 256137, "epoch": 2116} {"train_loss": -39.49203872680664, "global_step": 256138, "epoch": 2116} {"train_loss": -38.40095138549805, "global_step": 256139, "epoch": 2116} {"train_loss": -38.916290283203125, "global_step": 256140, "epoch": 2116} {"train_loss": -40.14263916015625, "global_step": 256141, "epoch": 2116} {"train_loss": -39.326271057128906, "global_step": 256142, "epoch": 2116} {"train_loss": -38.557884216308594, "global_step": 256143, "epoch": 2116} {"train_loss": -39.47500991821289, "global_step": 256144, "epoch": 2116} {"train_loss": -39.84796905517578, "global_step": 256145, "epoch": 2116} {"train_loss": -39.576568603515625, "global_step": 256146, "epoch": 2116} {"train_loss": -40.406036376953125, "global_step": 256147, "epoch": 2116} {"train_loss": -40.210365295410156, "global_step": 256148, "epoch": 2116} {"train_loss": -39.699867248535156, "global_step": 256149, "epoch": 2116} {"train_loss": -39.545936584472656, "global_step": 256150, "epoch": 2116} {"train_loss": -40.16728591918945, "global_step": 256151, "epoch": 2116} {"train_loss": -40.49080276489258, "global_step": 256152, "epoch": 2116} {"train_loss": -40.154762268066406, "global_step": 256153, "epoch": 2116} {"train_loss": -39.5368537902832, "global_step": 256154, "epoch": 2116} {"train_loss": -39.37852096557617, "global_step": 256155, "epoch": 2116} {"train_loss": -39.94321340765835, "global_step": 256156, "epoch": 2116, "val_loss": 2655229.25} {"train_loss": -39.968204498291016, "global_step": 256157, "epoch": 2117} {"train_loss": -40.654964447021484, "global_step": 256158, "epoch": 2117} {"train_loss": -40.45901870727539, "global_step": 256159, "epoch": 2117} {"train_loss": -40.72829818725586, "global_step": 256160, "epoch": 2117} {"train_loss": -40.42580032348633, "global_step": 256161, "epoch": 2117} {"train_loss": -40.8449821472168, "global_step": 256162, "epoch": 2117} {"train_loss": -40.44977569580078, "global_step": 256163, "epoch": 2117} {"train_loss": -40.86867904663086, "global_step": 256164, "epoch": 2117} {"train_loss": -40.57101058959961, "global_step": 256165, "epoch": 2117} {"train_loss": -40.746826171875, "global_step": 256166, "epoch": 2117} {"train_loss": -39.5009651184082, "global_step": 256167, "epoch": 2117} {"train_loss": -38.690147399902344, "global_step": 256168, "epoch": 2117} {"train_loss": -37.999794006347656, "global_step": 256169, "epoch": 2117} {"train_loss": -39.42324447631836, "global_step": 256170, "epoch": 2117} {"train_loss": -40.26273727416992, "global_step": 256171, "epoch": 2117} {"train_loss": -38.25477981567383, "global_step": 256172, "epoch": 2117} {"train_loss": -37.44221115112305, "global_step": 256173, "epoch": 2117} {"train_loss": -41.2356071472168, "global_step": 256174, "epoch": 2117} {"train_loss": -39.566585540771484, "global_step": 256175, "epoch": 2117} {"train_loss": -39.439815521240234, "global_step": 256176, "epoch": 2117} {"train_loss": -40.47245407104492, "global_step": 256177, "epoch": 2117} {"train_loss": -39.34342956542969, "global_step": 256178, "epoch": 2117} {"train_loss": -40.336055755615234, "global_step": 256179, "epoch": 2117} {"train_loss": -40.03409194946289, "global_step": 256180, "epoch": 2117} {"train_loss": -40.2169075012207, "global_step": 256181, "epoch": 2117} {"train_loss": -39.219696044921875, "global_step": 256182, "epoch": 2117} {"train_loss": -40.648677825927734, "global_step": 256183, "epoch": 2117} {"train_loss": -39.74064636230469, "global_step": 256184, "epoch": 2117} {"train_loss": -40.72087860107422, "global_step": 256185, "epoch": 2117} {"train_loss": -40.3366813659668, "global_step": 256186, "epoch": 2117} {"train_loss": -40.37351608276367, "global_step": 256187, "epoch": 2117} {"train_loss": -40.78363037109375, "global_step": 256188, "epoch": 2117} {"train_loss": -40.869625091552734, "global_step": 256189, "epoch": 2117} {"train_loss": -41.48640060424805, "global_step": 256190, "epoch": 2117} {"train_loss": -40.97869110107422, "global_step": 256191, "epoch": 2117} {"train_loss": -40.87134552001953, "global_step": 256192, "epoch": 2117} {"train_loss": -41.20029830932617, "global_step": 256193, "epoch": 2117} {"train_loss": -41.058197021484375, "global_step": 256194, "epoch": 2117} {"train_loss": -41.5643424987793, "global_step": 256195, "epoch": 2117} {"train_loss": -41.0194091796875, "global_step": 256196, "epoch": 2117} {"train_loss": -41.60532760620117, "global_step": 256197, "epoch": 2117} {"train_loss": -39.42348861694336, "global_step": 256198, "epoch": 2117} {"train_loss": -41.40442657470703, "global_step": 256199, "epoch": 2117} {"train_loss": -41.64460372924805, "global_step": 256200, "epoch": 2117} {"train_loss": -41.24153137207031, "global_step": 256201, "epoch": 2117} {"train_loss": -41.71431350708008, "global_step": 256202, "epoch": 2117} {"train_loss": -41.243648529052734, "global_step": 256203, "epoch": 2117} {"train_loss": -41.353031158447266, "global_step": 256204, "epoch": 2117} {"train_loss": -42.08258056640625, "global_step": 256205, "epoch": 2117} {"train_loss": -40.502559661865234, "global_step": 256206, "epoch": 2117} {"train_loss": -20.66712760925293, "global_step": 256207, "epoch": 2117} {"train_loss": -40.34833908081055, "global_step": 256208, "epoch": 2117} {"train_loss": -38.0343017578125, "global_step": 256209, "epoch": 2117} {"train_loss": -40.5356559753418, "global_step": 256210, "epoch": 2117} {"train_loss": -39.91067886352539, "global_step": 256211, "epoch": 2117} {"train_loss": -36.01096725463867, "global_step": 256212, "epoch": 2117} {"train_loss": -38.75471115112305, "global_step": 256213, "epoch": 2117} {"train_loss": -6.463009834289551, "global_step": 256214, "epoch": 2117} {"train_loss": -32.37013626098633, "global_step": 256215, "epoch": 2117} {"train_loss": -35.26462936401367, "global_step": 256216, "epoch": 2117} {"train_loss": -37.47377395629883, "global_step": 256217, "epoch": 2117} {"train_loss": -32.9593391418457, "global_step": 256218, "epoch": 2117} {"train_loss": -23.44428825378418, "global_step": 256219, "epoch": 2117} {"train_loss": -36.77150344848633, "global_step": 256220, "epoch": 2117} {"train_loss": -36.43264389038086, "global_step": 256221, "epoch": 2117} {"train_loss": -29.64569664001465, "global_step": 256222, "epoch": 2117} {"train_loss": -34.896419525146484, "global_step": 256223, "epoch": 2117} {"train_loss": -33.911766052246094, "global_step": 256224, "epoch": 2117} {"train_loss": -33.268104553222656, "global_step": 256225, "epoch": 2117} {"train_loss": -36.2678108215332, "global_step": 256226, "epoch": 2117} {"train_loss": -36.20428466796875, "global_step": 256227, "epoch": 2117} {"train_loss": -33.51613235473633, "global_step": 256228, "epoch": 2117} {"train_loss": -37.98685836791992, "global_step": 256229, "epoch": 2117} {"train_loss": -38.62491989135742, "global_step": 256230, "epoch": 2117} {"train_loss": -36.69419860839844, "global_step": 256231, "epoch": 2117} {"train_loss": -37.61857986450195, "global_step": 256232, "epoch": 2117} {"train_loss": -36.93862533569336, "global_step": 256233, "epoch": 2117} {"train_loss": -36.36305618286133, "global_step": 256234, "epoch": 2117} {"train_loss": -33.34458541870117, "global_step": 256235, "epoch": 2117} {"train_loss": -32.99650192260742, "global_step": 256236, "epoch": 2117} {"train_loss": -36.37253952026367, "global_step": 256237, "epoch": 2117} {"train_loss": -34.91655731201172, "global_step": 256238, "epoch": 2117} {"train_loss": -32.51910400390625, "global_step": 256239, "epoch": 2117} {"train_loss": -33.55698776245117, "global_step": 256240, "epoch": 2117} {"train_loss": -35.41189193725586, "global_step": 256241, "epoch": 2117} {"train_loss": -37.69392776489258, "global_step": 256242, "epoch": 2117} {"train_loss": -33.74198532104492, "global_step": 256243, "epoch": 2117} {"train_loss": -38.14300537109375, "global_step": 256244, "epoch": 2117} {"train_loss": -38.650917053222656, "global_step": 256245, "epoch": 2117} {"train_loss": -36.46140670776367, "global_step": 256246, "epoch": 2117} {"train_loss": -37.99472427368164, "global_step": 256247, "epoch": 2117} {"train_loss": -33.92277908325195, "global_step": 256248, "epoch": 2117} {"train_loss": -30.773807525634766, "global_step": 256249, "epoch": 2117} {"train_loss": -37.535457611083984, "global_step": 256250, "epoch": 2117} {"train_loss": -35.465877532958984, "global_step": 256251, "epoch": 2117} {"train_loss": -36.23724365234375, "global_step": 256252, "epoch": 2117} {"train_loss": -36.44047927856445, "global_step": 256253, "epoch": 2117} {"train_loss": -35.83675765991211, "global_step": 256254, "epoch": 2117} {"train_loss": -34.56415939331055, "global_step": 256255, "epoch": 2117} {"train_loss": -34.24959945678711, "global_step": 256256, "epoch": 2117} {"train_loss": -38.039852142333984, "global_step": 256257, "epoch": 2117} {"train_loss": -35.75959777832031, "global_step": 256258, "epoch": 2117} {"train_loss": -38.582435607910156, "global_step": 256259, "epoch": 2117} {"train_loss": -37.176025390625, "global_step": 256260, "epoch": 2117} {"train_loss": -38.4610481262207, "global_step": 256261, "epoch": 2117} {"train_loss": -36.85883712768555, "global_step": 256262, "epoch": 2117} {"train_loss": -37.14292907714844, "global_step": 256263, "epoch": 2117} {"train_loss": -37.0988655090332, "global_step": 256264, "epoch": 2117} {"train_loss": -36.91377258300781, "global_step": 256265, "epoch": 2117} {"train_loss": -37.157142639160156, "global_step": 256266, "epoch": 2117} {"train_loss": -37.79912567138672, "global_step": 256267, "epoch": 2117} {"train_loss": -37.14786911010742, "global_step": 256268, "epoch": 2117} {"train_loss": -37.140663146972656, "global_step": 256269, "epoch": 2117} {"train_loss": -37.65385055541992, "global_step": 256270, "epoch": 2117} {"train_loss": -37.877784729003906, "global_step": 256271, "epoch": 2117} {"train_loss": -38.34328079223633, "global_step": 256272, "epoch": 2117} {"train_loss": -36.7108154296875, "global_step": 256273, "epoch": 2117} {"train_loss": -38.6822395324707, "global_step": 256274, "epoch": 2117} {"train_loss": -38.4858283996582, "global_step": 256275, "epoch": 2117} {"train_loss": -38.389869689941406, "global_step": 256276, "epoch": 2117} {"train_loss": -37.56032564620341, "global_step": 256277, "epoch": 2117, "val_loss": 2684315.75} {"train_loss": -38.00954055786133, "global_step": 256278, "epoch": 2118} {"train_loss": -38.95954513549805, "global_step": 256279, "epoch": 2118} {"train_loss": -38.76448440551758, "global_step": 256280, "epoch": 2118} {"train_loss": -38.4050178527832, "global_step": 256281, "epoch": 2118} {"train_loss": -39.11591339111328, "global_step": 256282, "epoch": 2118} {"train_loss": -39.17684555053711, "global_step": 256283, "epoch": 2118} {"train_loss": -39.25371551513672, "global_step": 256284, "epoch": 2118} {"train_loss": -38.26752853393555, "global_step": 256285, "epoch": 2118} {"train_loss": -38.8557014465332, "global_step": 256286, "epoch": 2118} {"train_loss": -39.454952239990234, "global_step": 256287, "epoch": 2118} {"train_loss": -39.50555419921875, "global_step": 256288, "epoch": 2118} {"train_loss": -39.22053146362305, "global_step": 256289, "epoch": 2118} {"train_loss": -39.16195297241211, "global_step": 256290, "epoch": 2118} {"train_loss": -39.94749069213867, "global_step": 256291, "epoch": 2118} {"train_loss": -39.38323974609375, "global_step": 256292, "epoch": 2118} {"train_loss": -40.07514190673828, "global_step": 256293, "epoch": 2118} {"train_loss": -39.37209701538086, "global_step": 256294, "epoch": 2118} {"train_loss": -38.28148651123047, "global_step": 256295, "epoch": 2118} {"train_loss": -39.07783508300781, "global_step": 256296, "epoch": 2118} {"train_loss": -39.222312927246094, "global_step": 256297, "epoch": 2118} {"train_loss": -39.79484939575195, "global_step": 256298, "epoch": 2118} {"train_loss": -39.86817932128906, "global_step": 256299, "epoch": 2118} {"train_loss": -40.1320686340332, "global_step": 256300, "epoch": 2118} {"train_loss": -39.334869384765625, "global_step": 256301, "epoch": 2118} {"train_loss": -39.4465446472168, "global_step": 256302, "epoch": 2118} {"train_loss": -39.38359451293945, "global_step": 256303, "epoch": 2118} {"train_loss": -39.869972229003906, "global_step": 256304, "epoch": 2118} {"train_loss": -40.60111618041992, "global_step": 256305, "epoch": 2118} {"train_loss": -39.81103515625, "global_step": 256306, "epoch": 2118} {"train_loss": -39.98257064819336, "global_step": 256307, "epoch": 2118} {"train_loss": -40.13684844970703, "global_step": 256308, "epoch": 2118} {"train_loss": -40.069820404052734, "global_step": 256309, "epoch": 2118} {"train_loss": -40.33588790893555, "global_step": 256310, "epoch": 2118} {"train_loss": -39.857208251953125, "global_step": 256311, "epoch": 2118} {"train_loss": -39.04500198364258, "global_step": 256312, "epoch": 2118} {"train_loss": -40.77613067626953, "global_step": 256313, "epoch": 2118} {"train_loss": -40.440513610839844, "global_step": 256314, "epoch": 2118} {"train_loss": -40.247562408447266, "global_step": 256315, "epoch": 2118} {"train_loss": -38.62129592895508, "global_step": 256316, "epoch": 2118} {"train_loss": -35.33494567871094, "global_step": 256317, "epoch": 2118} {"train_loss": -35.04154586791992, "global_step": 256318, "epoch": 2118} {"train_loss": -39.68510055541992, "global_step": 256319, "epoch": 2118} {"train_loss": -36.732215881347656, "global_step": 256320, "epoch": 2118} {"train_loss": -34.49480056762695, "global_step": 256321, "epoch": 2118} {"train_loss": -36.81439971923828, "global_step": 256322, "epoch": 2118} {"train_loss": -38.46499252319336, "global_step": 256323, "epoch": 2118} {"train_loss": -36.027462005615234, "global_step": 256324, "epoch": 2118} {"train_loss": -40.26929473876953, "global_step": 256325, "epoch": 2118} {"train_loss": -36.47833251953125, "global_step": 256326, "epoch": 2118} {"train_loss": -38.53951644897461, "global_step": 256327, "epoch": 2118} {"train_loss": -36.42654037475586, "global_step": 256328, "epoch": 2118} {"train_loss": -39.066219329833984, "global_step": 256329, "epoch": 2118} {"train_loss": -37.08708953857422, "global_step": 256330, "epoch": 2118} {"train_loss": -39.604583740234375, "global_step": 256331, "epoch": 2118} {"train_loss": -36.274444580078125, "global_step": 256332, "epoch": 2118} {"train_loss": -39.53144073486328, "global_step": 256333, "epoch": 2118} {"train_loss": -37.87142562866211, "global_step": 256334, "epoch": 2118} {"train_loss": -40.52571487426758, "global_step": 256335, "epoch": 2118} {"train_loss": -39.9193000793457, "global_step": 256336, "epoch": 2118} {"train_loss": -39.136329650878906, "global_step": 256337, "epoch": 2118} {"train_loss": -38.7575798034668, "global_step": 256338, "epoch": 2118} {"train_loss": -38.95400619506836, "global_step": 256339, "epoch": 2118} {"train_loss": -40.29098129272461, "global_step": 256340, "epoch": 2118} {"train_loss": -39.94138717651367, "global_step": 256341, "epoch": 2118} {"train_loss": -39.7605094909668, "global_step": 256342, "epoch": 2118} {"train_loss": -39.451541900634766, "global_step": 256343, "epoch": 2118} {"train_loss": -40.5896110534668, "global_step": 256344, "epoch": 2118} {"train_loss": -39.999027252197266, "global_step": 256345, "epoch": 2118} {"train_loss": -40.517677307128906, "global_step": 256346, "epoch": 2118} {"train_loss": -40.35470199584961, "global_step": 256347, "epoch": 2118} {"train_loss": -39.87685012817383, "global_step": 256348, "epoch": 2118} {"train_loss": -41.068538665771484, "global_step": 256349, "epoch": 2118} {"train_loss": -40.64853286743164, "global_step": 256350, "epoch": 2118} {"train_loss": -39.78887176513672, "global_step": 256351, "epoch": 2118} {"train_loss": -40.45903396606445, "global_step": 256352, "epoch": 2118} {"train_loss": -39.80842971801758, "global_step": 256353, "epoch": 2118} {"train_loss": -40.939849853515625, "global_step": 256354, "epoch": 2118} {"train_loss": -40.941253662109375, "global_step": 256355, "epoch": 2118} {"train_loss": -40.91377639770508, "global_step": 256356, "epoch": 2118} {"train_loss": -41.08900833129883, "global_step": 256357, "epoch": 2118} {"train_loss": -40.5662841796875, "global_step": 256358, "epoch": 2118} {"train_loss": -40.889549255371094, "global_step": 256359, "epoch": 2118} {"train_loss": -40.76129913330078, "global_step": 256360, "epoch": 2118} {"train_loss": -40.777462005615234, "global_step": 256361, "epoch": 2118} {"train_loss": -41.40847396850586, "global_step": 256362, "epoch": 2118} {"train_loss": -41.114776611328125, "global_step": 256363, "epoch": 2118} {"train_loss": -41.11032485961914, "global_step": 256364, "epoch": 2118} {"train_loss": -41.2696418762207, "global_step": 256365, "epoch": 2118} {"train_loss": -40.968929290771484, "global_step": 256366, "epoch": 2118} {"train_loss": -40.29108810424805, "global_step": 256367, "epoch": 2118} {"train_loss": -40.831214904785156, "global_step": 256368, "epoch": 2118} {"train_loss": -40.0401496887207, "global_step": 256369, "epoch": 2118} {"train_loss": -40.73767852783203, "global_step": 256370, "epoch": 2118} {"train_loss": -41.240970611572266, "global_step": 256371, "epoch": 2118} {"train_loss": -40.384132385253906, "global_step": 256372, "epoch": 2118} {"train_loss": -39.035892486572266, "global_step": 256373, "epoch": 2118} {"train_loss": -39.29000473022461, "global_step": 256374, "epoch": 2118} {"train_loss": -41.47291564941406, "global_step": 256375, "epoch": 2118} {"train_loss": -40.94467544555664, "global_step": 256376, "epoch": 2118} {"train_loss": -39.272056579589844, "global_step": 256377, "epoch": 2118} {"train_loss": -40.68849182128906, "global_step": 256378, "epoch": 2118} {"train_loss": -41.156341552734375, "global_step": 256379, "epoch": 2118} {"train_loss": -38.9691162109375, "global_step": 256380, "epoch": 2118} {"train_loss": -41.04612350463867, "global_step": 256381, "epoch": 2118} {"train_loss": -41.056068420410156, "global_step": 256382, "epoch": 2118} {"train_loss": -41.47119140625, "global_step": 256383, "epoch": 2118} {"train_loss": -41.02089309692383, "global_step": 256384, "epoch": 2118} {"train_loss": -41.07255935668945, "global_step": 256385, "epoch": 2118} {"train_loss": -41.65864944458008, "global_step": 256386, "epoch": 2118} {"train_loss": -41.28218460083008, "global_step": 256387, "epoch": 2118} {"train_loss": -42.088348388671875, "global_step": 256388, "epoch": 2118} {"train_loss": -41.317115783691406, "global_step": 256389, "epoch": 2118} {"train_loss": -41.410160064697266, "global_step": 256390, "epoch": 2118} {"train_loss": -41.0523796081543, "global_step": 256391, "epoch": 2118} {"train_loss": -41.263301849365234, "global_step": 256392, "epoch": 2118} {"train_loss": -41.33727264404297, "global_step": 256393, "epoch": 2118} {"train_loss": -41.84931564331055, "global_step": 256394, "epoch": 2118} {"train_loss": -41.26020812988281, "global_step": 256395, "epoch": 2118} {"train_loss": -41.78617858886719, "global_step": 256396, "epoch": 2118} {"train_loss": -41.5026741027832, "global_step": 256397, "epoch": 2118} {"train_loss": -39.79687988659567, "global_step": 256398, "epoch": 2118, "val_loss": 2647996.75} {"train_loss": -41.73714828491211, "global_step": 256399, "epoch": 2119} {"train_loss": -41.8888053894043, "global_step": 256400, "epoch": 2119} {"train_loss": -41.347572326660156, "global_step": 256401, "epoch": 2119} {"train_loss": -42.053924560546875, "global_step": 256402, "epoch": 2119} {"train_loss": -40.724796295166016, "global_step": 256403, "epoch": 2119} {"train_loss": -41.39347839355469, "global_step": 256404, "epoch": 2119} {"train_loss": -39.72109603881836, "global_step": 256405, "epoch": 2119} {"train_loss": -40.88417434692383, "global_step": 256406, "epoch": 2119} {"train_loss": -42.472938537597656, "global_step": 256407, "epoch": 2119} {"train_loss": -42.03580856323242, "global_step": 256408, "epoch": 2119} {"train_loss": -42.06026840209961, "global_step": 256409, "epoch": 2119} {"train_loss": -40.70162582397461, "global_step": 256410, "epoch": 2119} {"train_loss": -39.43834686279297, "global_step": 256411, "epoch": 2119} {"train_loss": -42.241783142089844, "global_step": 256412, "epoch": 2119} {"train_loss": -41.42325973510742, "global_step": 256413, "epoch": 2119} {"train_loss": -41.681270599365234, "global_step": 256414, "epoch": 2119} {"train_loss": -42.486324310302734, "global_step": 256415, "epoch": 2119} {"train_loss": -41.0958366394043, "global_step": 256416, "epoch": 2119} {"train_loss": -41.982295989990234, "global_step": 256417, "epoch": 2119} {"train_loss": -41.10799026489258, "global_step": 256418, "epoch": 2119} {"train_loss": -42.05245590209961, "global_step": 256419, "epoch": 2119} {"train_loss": -42.4248046875, "global_step": 256420, "epoch": 2119} {"train_loss": -41.4443473815918, "global_step": 256421, "epoch": 2119} {"train_loss": -42.42280197143555, "global_step": 256422, "epoch": 2119} {"train_loss": -41.79219436645508, "global_step": 256423, "epoch": 2119} {"train_loss": -42.217506408691406, "global_step": 256424, "epoch": 2119} {"train_loss": -40.96689987182617, "global_step": 256425, "epoch": 2119} {"train_loss": -42.27561569213867, "global_step": 256426, "epoch": 2119} {"train_loss": -41.076087951660156, "global_step": 256427, "epoch": 2119} {"train_loss": -41.38838577270508, "global_step": 256428, "epoch": 2119} {"train_loss": -42.322166442871094, "global_step": 256429, "epoch": 2119} {"train_loss": -42.1330680847168, "global_step": 256430, "epoch": 2119} {"train_loss": -42.80146408081055, "global_step": 256431, "epoch": 2119} {"train_loss": -42.36353302001953, "global_step": 256432, "epoch": 2119} {"train_loss": -41.497894287109375, "global_step": 256433, "epoch": 2119} {"train_loss": -41.71543502807617, "global_step": 256434, "epoch": 2119} {"train_loss": -41.421180725097656, "global_step": 256435, "epoch": 2119} {"train_loss": -42.3268928527832, "global_step": 256436, "epoch": 2119} {"train_loss": -41.174072265625, "global_step": 256437, "epoch": 2119} {"train_loss": -40.176937103271484, "global_step": 256438, "epoch": 2119} {"train_loss": -40.82925033569336, "global_step": 256439, "epoch": 2119} {"train_loss": -40.70829391479492, "global_step": 256440, "epoch": 2119} {"train_loss": -39.08445739746094, "global_step": 256441, "epoch": 2119} {"train_loss": -40.237464904785156, "global_step": 256442, "epoch": 2119} {"train_loss": -42.55517578125, "global_step": 256443, "epoch": 2119} {"train_loss": -38.35578536987305, "global_step": 256444, "epoch": 2119} {"train_loss": -38.781150817871094, "global_step": 256445, "epoch": 2119} {"train_loss": -40.76930618286133, "global_step": 256446, "epoch": 2119} {"train_loss": -39.347625732421875, "global_step": 256447, "epoch": 2119} {"train_loss": -37.9400634765625, "global_step": 256448, "epoch": 2119} {"train_loss": -41.80561447143555, "global_step": 256449, "epoch": 2119} {"train_loss": -40.447425842285156, "global_step": 256450, "epoch": 2119} {"train_loss": -40.984352111816406, "global_step": 256451, "epoch": 2119} {"train_loss": -41.866268157958984, "global_step": 256452, "epoch": 2119} {"train_loss": -40.942420959472656, "global_step": 256453, "epoch": 2119} {"train_loss": -40.756893157958984, "global_step": 256454, "epoch": 2119} {"train_loss": -41.21772003173828, "global_step": 256455, "epoch": 2119} {"train_loss": -41.42011642456055, "global_step": 256456, "epoch": 2119} {"train_loss": -41.524349212646484, "global_step": 256457, "epoch": 2119} {"train_loss": -41.97346115112305, "global_step": 256458, "epoch": 2119} {"train_loss": -40.30595016479492, "global_step": 256459, "epoch": 2119} {"train_loss": -41.50606155395508, "global_step": 256460, "epoch": 2119} {"train_loss": -40.78815841674805, "global_step": 256461, "epoch": 2119} {"train_loss": -41.735965728759766, "global_step": 256462, "epoch": 2119} {"train_loss": -40.85895538330078, "global_step": 256463, "epoch": 2119} {"train_loss": -40.94614028930664, "global_step": 256464, "epoch": 2119} {"train_loss": -39.448143005371094, "global_step": 256465, "epoch": 2119} {"train_loss": -40.436744689941406, "global_step": 256466, "epoch": 2119} {"train_loss": -41.142852783203125, "global_step": 256467, "epoch": 2119} {"train_loss": -41.43623733520508, "global_step": 256468, "epoch": 2119} {"train_loss": -41.16162109375, "global_step": 256469, "epoch": 2119} {"train_loss": -41.86161422729492, "global_step": 256470, "epoch": 2119} {"train_loss": -40.682308197021484, "global_step": 256471, "epoch": 2119} {"train_loss": -41.86579513549805, "global_step": 256472, "epoch": 2119} {"train_loss": -38.406578063964844, "global_step": 256473, "epoch": 2119} {"train_loss": -40.72056198120117, "global_step": 256474, "epoch": 2119} {"train_loss": -40.57217025756836, "global_step": 256475, "epoch": 2119} {"train_loss": -41.8165397644043, "global_step": 256476, "epoch": 2119} {"train_loss": -41.98104476928711, "global_step": 256477, "epoch": 2119} {"train_loss": -39.72097396850586, "global_step": 256478, "epoch": 2119} {"train_loss": -41.79659652709961, "global_step": 256479, "epoch": 2119} {"train_loss": -41.26813507080078, "global_step": 256480, "epoch": 2119} {"train_loss": -41.168331146240234, "global_step": 256481, "epoch": 2119} {"train_loss": -40.68640899658203, "global_step": 256482, "epoch": 2119} {"train_loss": -41.11112976074219, "global_step": 256483, "epoch": 2119} {"train_loss": -38.950355529785156, "global_step": 256484, "epoch": 2119} {"train_loss": -41.21018981933594, "global_step": 256485, "epoch": 2119} {"train_loss": -40.79362106323242, "global_step": 256486, "epoch": 2119} {"train_loss": -39.1541748046875, "global_step": 256487, "epoch": 2119} {"train_loss": -38.98480224609375, "global_step": 256488, "epoch": 2119} {"train_loss": -40.81911087036133, "global_step": 256489, "epoch": 2119} {"train_loss": -37.91508483886719, "global_step": 256490, "epoch": 2119} {"train_loss": -39.98722457885742, "global_step": 256491, "epoch": 2119} {"train_loss": -36.77522659301758, "global_step": 256492, "epoch": 2119} {"train_loss": -38.64295959472656, "global_step": 256493, "epoch": 2119} {"train_loss": -38.78632736206055, "global_step": 256494, "epoch": 2119} {"train_loss": -38.79195785522461, "global_step": 256495, "epoch": 2119} {"train_loss": -40.271949768066406, "global_step": 256496, "epoch": 2119} {"train_loss": -39.61859130859375, "global_step": 256497, "epoch": 2119} {"train_loss": -39.42853546142578, "global_step": 256498, "epoch": 2119} {"train_loss": -37.894744873046875, "global_step": 256499, "epoch": 2119} {"train_loss": -41.08327102661133, "global_step": 256500, "epoch": 2119} {"train_loss": -36.208309173583984, "global_step": 256501, "epoch": 2119} {"train_loss": -40.005462646484375, "global_step": 256502, "epoch": 2119} {"train_loss": -37.09626388549805, "global_step": 256503, "epoch": 2119} {"train_loss": -36.92887496948242, "global_step": 256504, "epoch": 2119} {"train_loss": -31.477497100830078, "global_step": 256505, "epoch": 2119} {"train_loss": -37.961402893066406, "global_step": 256506, "epoch": 2119} {"train_loss": -34.266700744628906, "global_step": 256507, "epoch": 2119} {"train_loss": -35.7496223449707, "global_step": 256508, "epoch": 2119} {"train_loss": -29.846698760986328, "global_step": 256509, "epoch": 2119} {"train_loss": -36.165618896484375, "global_step": 256510, "epoch": 2119} {"train_loss": -33.6267204284668, "global_step": 256511, "epoch": 2119} {"train_loss": -34.344722747802734, "global_step": 256512, "epoch": 2119} {"train_loss": -32.055076599121094, "global_step": 256513, "epoch": 2119} {"train_loss": -31.879322052001953, "global_step": 256514, "epoch": 2119} {"train_loss": -34.3387451171875, "global_step": 256515, "epoch": 2119} {"train_loss": -34.96406173706055, "global_step": 256516, "epoch": 2119} {"train_loss": -31.75909996032715, "global_step": 256517, "epoch": 2119} {"train_loss": -30.320661544799805, "global_step": 256518, "epoch": 2119} {"train_loss": -39.79984787870045, "global_step": 256519, "epoch": 2119, "val_loss": 2478178.75} {"train_loss": -32.86245346069336, "global_step": 256520, "epoch": 2120} {"train_loss": -35.538543701171875, "global_step": 256521, "epoch": 2120} {"train_loss": -35.92608642578125, "global_step": 256522, "epoch": 2120} {"train_loss": -27.88483238220215, "global_step": 256523, "epoch": 2120} {"train_loss": -36.07571029663086, "global_step": 256524, "epoch": 2120} {"train_loss": -26.089298248291016, "global_step": 256525, "epoch": 2120} {"train_loss": -33.65571212768555, "global_step": 256526, "epoch": 2120} {"train_loss": -35.97652816772461, "global_step": 256527, "epoch": 2120} {"train_loss": -35.596885681152344, "global_step": 256528, "epoch": 2120} {"train_loss": -34.64698028564453, "global_step": 256529, "epoch": 2120} {"train_loss": -33.7720947265625, "global_step": 256530, "epoch": 2120} {"train_loss": -36.16804885864258, "global_step": 256531, "epoch": 2120} {"train_loss": -33.21186065673828, "global_step": 256532, "epoch": 2120} {"train_loss": -37.6086540222168, "global_step": 256533, "epoch": 2120} {"train_loss": -36.302894592285156, "global_step": 256534, "epoch": 2120} {"train_loss": -37.37166976928711, "global_step": 256535, "epoch": 2120} {"train_loss": -36.906185150146484, "global_step": 256536, "epoch": 2120} {"train_loss": -37.14736557006836, "global_step": 256537, "epoch": 2120} {"train_loss": -36.13030242919922, "global_step": 256538, "epoch": 2120} {"train_loss": -38.22837448120117, "global_step": 256539, "epoch": 2120} {"train_loss": -37.4538688659668, "global_step": 256540, "epoch": 2120} {"train_loss": -37.235713958740234, "global_step": 256541, "epoch": 2120} {"train_loss": -36.28053283691406, "global_step": 256542, "epoch": 2120} {"train_loss": -32.88991928100586, "global_step": 256543, "epoch": 2120} {"train_loss": -38.163944244384766, "global_step": 256544, "epoch": 2120} {"train_loss": -36.86137771606445, "global_step": 256545, "epoch": 2120} {"train_loss": -37.45918655395508, "global_step": 256546, "epoch": 2120} {"train_loss": -38.79386901855469, "global_step": 256547, "epoch": 2120} {"train_loss": -36.81489181518555, "global_step": 256548, "epoch": 2120} {"train_loss": -38.26359939575195, "global_step": 256549, "epoch": 2120} {"train_loss": -38.36967086791992, "global_step": 256550, "epoch": 2120} {"train_loss": -36.949432373046875, "global_step": 256551, "epoch": 2120} {"train_loss": -38.212310791015625, "global_step": 256552, "epoch": 2120} {"train_loss": -38.18121337890625, "global_step": 256553, "epoch": 2120} {"train_loss": -38.24089050292969, "global_step": 256554, "epoch": 2120} {"train_loss": -38.480812072753906, "global_step": 256555, "epoch": 2120} {"train_loss": -38.93776321411133, "global_step": 256556, "epoch": 2120} {"train_loss": -38.1817741394043, "global_step": 256557, "epoch": 2120} {"train_loss": -39.04268264770508, "global_step": 256558, "epoch": 2120} {"train_loss": -38.36753463745117, "global_step": 256559, "epoch": 2120} {"train_loss": -38.97209167480469, "global_step": 256560, "epoch": 2120} {"train_loss": -38.80961227416992, "global_step": 256561, "epoch": 2120} {"train_loss": -39.10845184326172, "global_step": 256562, "epoch": 2120} {"train_loss": -38.98948287963867, "global_step": 256563, "epoch": 2120} {"train_loss": -38.90311050415039, "global_step": 256564, "epoch": 2120} {"train_loss": -38.34112548828125, "global_step": 256565, "epoch": 2120} {"train_loss": -39.03440475463867, "global_step": 256566, "epoch": 2120} {"train_loss": -38.981353759765625, "global_step": 256567, "epoch": 2120} {"train_loss": -38.8822135925293, "global_step": 256568, "epoch": 2120} {"train_loss": -38.785919189453125, "global_step": 256569, "epoch": 2120} {"train_loss": -38.95343780517578, "global_step": 256570, "epoch": 2120} {"train_loss": -38.417701721191406, "global_step": 256571, "epoch": 2120} {"train_loss": -38.10763931274414, "global_step": 256572, "epoch": 2120} {"train_loss": -38.90529251098633, "global_step": 256573, "epoch": 2120} {"train_loss": -39.42927932739258, "global_step": 256574, "epoch": 2120} {"train_loss": -39.32270431518555, "global_step": 256575, "epoch": 2120} {"train_loss": -39.068660736083984, "global_step": 256576, "epoch": 2120} {"train_loss": -39.46208953857422, "global_step": 256577, "epoch": 2120} {"train_loss": -38.974761962890625, "global_step": 256578, "epoch": 2120} {"train_loss": -39.489906311035156, "global_step": 256579, "epoch": 2120} {"train_loss": -39.36997985839844, "global_step": 256580, "epoch": 2120} {"train_loss": -38.27340316772461, "global_step": 256581, "epoch": 2120} {"train_loss": -40.0294189453125, "global_step": 256582, "epoch": 2120} {"train_loss": -39.388641357421875, "global_step": 256583, "epoch": 2120} {"train_loss": -39.5971565246582, "global_step": 256584, "epoch": 2120} {"train_loss": -39.63063049316406, "global_step": 256585, "epoch": 2120} {"train_loss": -39.73151397705078, "global_step": 256586, "epoch": 2120} {"train_loss": -39.578853607177734, "global_step": 256587, "epoch": 2120} {"train_loss": -39.09265899658203, "global_step": 256588, "epoch": 2120} {"train_loss": -40.06181716918945, "global_step": 256589, "epoch": 2120} {"train_loss": -40.0080451965332, "global_step": 256590, "epoch": 2120} {"train_loss": -40.06380844116211, "global_step": 256591, "epoch": 2120} {"train_loss": -40.26028060913086, "global_step": 256592, "epoch": 2120} {"train_loss": -39.943843841552734, "global_step": 256593, "epoch": 2120} {"train_loss": -40.121551513671875, "global_step": 256594, "epoch": 2120} {"train_loss": -40.08366394042969, "global_step": 256595, "epoch": 2120} {"train_loss": -39.532135009765625, "global_step": 256596, "epoch": 2120} {"train_loss": -39.4871826171875, "global_step": 256597, "epoch": 2120} {"train_loss": -40.278812408447266, "global_step": 256598, "epoch": 2120} {"train_loss": -39.83991241455078, "global_step": 256599, "epoch": 2120} {"train_loss": -40.5141716003418, "global_step": 256600, "epoch": 2120} {"train_loss": -40.337257385253906, "global_step": 256601, "epoch": 2120} {"train_loss": -40.595314025878906, "global_step": 256602, "epoch": 2120} {"train_loss": -40.289222717285156, "global_step": 256603, "epoch": 2120} {"train_loss": -40.53432846069336, "global_step": 256604, "epoch": 2120} {"train_loss": -40.39468002319336, "global_step": 256605, "epoch": 2120} {"train_loss": -40.363582611083984, "global_step": 256606, "epoch": 2120} {"train_loss": -40.5522346496582, "global_step": 256607, "epoch": 2120} {"train_loss": -40.52906036376953, "global_step": 256608, "epoch": 2120} {"train_loss": -40.37178421020508, "global_step": 256609, "epoch": 2120} {"train_loss": -40.5681266784668, "global_step": 256610, "epoch": 2120} {"train_loss": -40.7138786315918, "global_step": 256611, "epoch": 2120} {"train_loss": -40.4040412902832, "global_step": 256612, "epoch": 2120} {"train_loss": -40.46356201171875, "global_step": 256613, "epoch": 2120} {"train_loss": -40.15495300292969, "global_step": 256614, "epoch": 2120} {"train_loss": -40.09443283081055, "global_step": 256615, "epoch": 2120} {"train_loss": -40.64712142944336, "global_step": 256616, "epoch": 2120} {"train_loss": -41.32271957397461, "global_step": 256617, "epoch": 2120} {"train_loss": -40.49357986450195, "global_step": 256618, "epoch": 2120} {"train_loss": -39.96644592285156, "global_step": 256619, "epoch": 2120} {"train_loss": -40.64483642578125, "global_step": 256620, "epoch": 2120} {"train_loss": -40.975772857666016, "global_step": 256621, "epoch": 2120} {"train_loss": -41.099952697753906, "global_step": 256622, "epoch": 2120} {"train_loss": -40.72537612915039, "global_step": 256623, "epoch": 2120} {"train_loss": -40.7689323425293, "global_step": 256624, "epoch": 2120} {"train_loss": -40.86314010620117, "global_step": 256625, "epoch": 2120} {"train_loss": -41.54165267944336, "global_step": 256626, "epoch": 2120} {"train_loss": -41.20344924926758, "global_step": 256627, "epoch": 2120} {"train_loss": -41.011356353759766, "global_step": 256628, "epoch": 2120} {"train_loss": -41.205684661865234, "global_step": 256629, "epoch": 2120} {"train_loss": -41.308837890625, "global_step": 256630, "epoch": 2120} {"train_loss": -41.007904052734375, "global_step": 256631, "epoch": 2120} {"train_loss": -41.0771484375, "global_step": 256632, "epoch": 2120} {"train_loss": -40.38706588745117, "global_step": 256633, "epoch": 2120} {"train_loss": -40.699134826660156, "global_step": 256634, "epoch": 2120} {"train_loss": -40.52431106567383, "global_step": 256635, "epoch": 2120} {"train_loss": -40.63593292236328, "global_step": 256636, "epoch": 2120} {"train_loss": -41.262672424316406, "global_step": 256637, "epoch": 2120} {"train_loss": -41.397727966308594, "global_step": 256638, "epoch": 2120} {"train_loss": -41.00941848754883, "global_step": 256639, "epoch": 2120} {"train_loss": -38.78333069667343, "global_step": 256640, "epoch": 2120, "val_loss": 2555230.0} {"train_loss": -40.2740478515625, "global_step": 256641, "epoch": 2121} {"train_loss": -41.118812561035156, "global_step": 256642, "epoch": 2121} {"train_loss": -41.17710494995117, "global_step": 256643, "epoch": 2121} {"train_loss": -41.03977584838867, "global_step": 256644, "epoch": 2121} {"train_loss": -38.53215026855469, "global_step": 256645, "epoch": 2121} {"train_loss": -34.90055465698242, "global_step": 256646, "epoch": 2121} {"train_loss": -37.42885971069336, "global_step": 256647, "epoch": 2121} {"train_loss": -41.32255935668945, "global_step": 256648, "epoch": 2121} {"train_loss": -38.07758712768555, "global_step": 256649, "epoch": 2121} {"train_loss": -37.622589111328125, "global_step": 256650, "epoch": 2121} {"train_loss": -40.905357360839844, "global_step": 256651, "epoch": 2121} {"train_loss": -36.47380447387695, "global_step": 256652, "epoch": 2121} {"train_loss": -37.91959762573242, "global_step": 256653, "epoch": 2121} {"train_loss": -40.97421646118164, "global_step": 256654, "epoch": 2121} {"train_loss": -39.01044845581055, "global_step": 256655, "epoch": 2121} {"train_loss": -40.19327926635742, "global_step": 256656, "epoch": 2121} {"train_loss": -39.566219329833984, "global_step": 256657, "epoch": 2121} {"train_loss": -41.1599006652832, "global_step": 256658, "epoch": 2121} {"train_loss": -38.947059631347656, "global_step": 256659, "epoch": 2121} {"train_loss": -40.68124771118164, "global_step": 256660, "epoch": 2121} {"train_loss": -40.588294982910156, "global_step": 256661, "epoch": 2121} {"train_loss": -41.599605560302734, "global_step": 256662, "epoch": 2121} {"train_loss": -41.23152542114258, "global_step": 256663, "epoch": 2121} {"train_loss": -41.513301849365234, "global_step": 256664, "epoch": 2121} {"train_loss": -41.31845474243164, "global_step": 256665, "epoch": 2121} {"train_loss": -41.14059066772461, "global_step": 256666, "epoch": 2121} {"train_loss": -41.08091354370117, "global_step": 256667, "epoch": 2121} {"train_loss": -41.3338737487793, "global_step": 256668, "epoch": 2121} {"train_loss": -41.67434310913086, "global_step": 256669, "epoch": 2121} {"train_loss": -41.62908935546875, "global_step": 256670, "epoch": 2121} {"train_loss": -40.63187789916992, "global_step": 256671, "epoch": 2121} {"train_loss": -41.92939376831055, "global_step": 256672, "epoch": 2121} {"train_loss": -41.319908142089844, "global_step": 256673, "epoch": 2121} {"train_loss": -41.893707275390625, "global_step": 256674, "epoch": 2121} {"train_loss": -41.34161376953125, "global_step": 256675, "epoch": 2121} {"train_loss": -41.53874588012695, "global_step": 256676, "epoch": 2121} {"train_loss": -41.00872802734375, "global_step": 256677, "epoch": 2121} {"train_loss": -41.458717346191406, "global_step": 256678, "epoch": 2121} {"train_loss": -41.20520782470703, "global_step": 256679, "epoch": 2121} {"train_loss": -41.43086624145508, "global_step": 256680, "epoch": 2121} {"train_loss": -41.770530700683594, "global_step": 256681, "epoch": 2121} {"train_loss": -41.72420883178711, "global_step": 256682, "epoch": 2121} {"train_loss": -39.467803955078125, "global_step": 256683, "epoch": 2121} {"train_loss": -41.82802963256836, "global_step": 256684, "epoch": 2121} {"train_loss": -41.224361419677734, "global_step": 256685, "epoch": 2121} {"train_loss": -41.36125564575195, "global_step": 256686, "epoch": 2121} {"train_loss": -41.5593376159668, "global_step": 256687, "epoch": 2121} {"train_loss": -41.84744644165039, "global_step": 256688, "epoch": 2121} {"train_loss": -41.5500373840332, "global_step": 256689, "epoch": 2121} {"train_loss": -39.97245407104492, "global_step": 256690, "epoch": 2121} {"train_loss": -41.378196716308594, "global_step": 256691, "epoch": 2121} {"train_loss": -41.426055908203125, "global_step": 256692, "epoch": 2121} {"train_loss": -41.36017990112305, "global_step": 256693, "epoch": 2121} {"train_loss": -41.3489990234375, "global_step": 256694, "epoch": 2121} {"train_loss": -41.45211410522461, "global_step": 256695, "epoch": 2121} {"train_loss": -41.67542266845703, "global_step": 256696, "epoch": 2121} {"train_loss": -41.025535583496094, "global_step": 256697, "epoch": 2121} {"train_loss": -41.39720153808594, "global_step": 256698, "epoch": 2121} {"train_loss": -41.54970932006836, "global_step": 256699, "epoch": 2121} {"train_loss": -41.53247833251953, "global_step": 256700, "epoch": 2121} {"train_loss": -41.52025604248047, "global_step": 256701, "epoch": 2121} {"train_loss": -40.63704299926758, "global_step": 256702, "epoch": 2121} {"train_loss": -41.05750274658203, "global_step": 256703, "epoch": 2121} {"train_loss": -40.71236801147461, "global_step": 256704, "epoch": 2121} {"train_loss": -41.85910415649414, "global_step": 256705, "epoch": 2121} {"train_loss": -39.354942321777344, "global_step": 256706, "epoch": 2121} {"train_loss": -39.92036437988281, "global_step": 256707, "epoch": 2121} {"train_loss": -40.54330062866211, "global_step": 256708, "epoch": 2121} {"train_loss": -41.56135177612305, "global_step": 256709, "epoch": 2121} {"train_loss": -41.69854736328125, "global_step": 256710, "epoch": 2121} {"train_loss": -40.48414993286133, "global_step": 256711, "epoch": 2121} {"train_loss": -40.39155197143555, "global_step": 256712, "epoch": 2121} {"train_loss": -42.119014739990234, "global_step": 256713, "epoch": 2121} {"train_loss": -42.032012939453125, "global_step": 256714, "epoch": 2121} {"train_loss": -41.88359451293945, "global_step": 256715, "epoch": 2121} {"train_loss": -41.89727783203125, "global_step": 256716, "epoch": 2121} {"train_loss": -41.487213134765625, "global_step": 256717, "epoch": 2121} {"train_loss": -41.39162063598633, "global_step": 256718, "epoch": 2121} {"train_loss": -41.02549743652344, "global_step": 256719, "epoch": 2121} {"train_loss": -41.9395866394043, "global_step": 256720, "epoch": 2121} {"train_loss": -42.00824737548828, "global_step": 256721, "epoch": 2121} {"train_loss": -41.294921875, "global_step": 256722, "epoch": 2121} {"train_loss": -41.65802764892578, "global_step": 256723, "epoch": 2121} {"train_loss": -41.61814498901367, "global_step": 256724, "epoch": 2121} {"train_loss": -41.42430877685547, "global_step": 256725, "epoch": 2121} {"train_loss": -39.957725524902344, "global_step": 256726, "epoch": 2121} {"train_loss": -38.81279754638672, "global_step": 256727, "epoch": 2121} {"train_loss": -37.753108978271484, "global_step": 256728, "epoch": 2121} {"train_loss": -33.797027587890625, "global_step": 256729, "epoch": 2121} {"train_loss": -33.058712005615234, "global_step": 256730, "epoch": 2121} {"train_loss": -37.258514404296875, "global_step": 256731, "epoch": 2121} {"train_loss": -42.063011169433594, "global_step": 256732, "epoch": 2121} {"train_loss": -40.091888427734375, "global_step": 256733, "epoch": 2121} {"train_loss": -40.11762619018555, "global_step": 256734, "epoch": 2121} {"train_loss": -41.658599853515625, "global_step": 256735, "epoch": 2121} {"train_loss": -40.51776123046875, "global_step": 256736, "epoch": 2121} {"train_loss": -40.91862106323242, "global_step": 256737, "epoch": 2121} {"train_loss": -41.44914245605469, "global_step": 256738, "epoch": 2121} {"train_loss": -41.178585052490234, "global_step": 256739, "epoch": 2121} {"train_loss": -41.63486862182617, "global_step": 256740, "epoch": 2121} {"train_loss": -41.365928649902344, "global_step": 256741, "epoch": 2121} {"train_loss": -41.53921890258789, "global_step": 256742, "epoch": 2121} {"train_loss": -41.74786376953125, "global_step": 256743, "epoch": 2121} {"train_loss": -41.86219024658203, "global_step": 256744, "epoch": 2121} {"train_loss": -41.52009963989258, "global_step": 256745, "epoch": 2121} {"train_loss": -41.90293884277344, "global_step": 256746, "epoch": 2121} {"train_loss": -41.900184631347656, "global_step": 256747, "epoch": 2121} {"train_loss": -41.91097640991211, "global_step": 256748, "epoch": 2121} {"train_loss": -41.351470947265625, "global_step": 256749, "epoch": 2121} {"train_loss": -41.7734375, "global_step": 256750, "epoch": 2121} {"train_loss": -41.81586837768555, "global_step": 256751, "epoch": 2121} {"train_loss": -42.566741943359375, "global_step": 256752, "epoch": 2121} {"train_loss": -42.42716598510742, "global_step": 256753, "epoch": 2121} {"train_loss": -41.73499298095703, "global_step": 256754, "epoch": 2121} {"train_loss": -42.1242790222168, "global_step": 256755, "epoch": 2121} {"train_loss": -42.07600402832031, "global_step": 256756, "epoch": 2121} {"train_loss": -42.36536407470703, "global_step": 256757, "epoch": 2121} {"train_loss": -42.06794357299805, "global_step": 256758, "epoch": 2121} {"train_loss": -41.688838958740234, "global_step": 256759, "epoch": 2121} {"train_loss": -42.21586608886719, "global_step": 256760, "epoch": 2121} {"train_loss": -40.8471272366106, "global_step": 256761, "epoch": 2121, "val_loss": 2614433.25} {"train_loss": -42.71061325073242, "global_step": 256762, "epoch": 2122} {"train_loss": -42.00302505493164, "global_step": 256763, "epoch": 2122} {"train_loss": -42.4593620300293, "global_step": 256764, "epoch": 2122} {"train_loss": -42.854949951171875, "global_step": 256765, "epoch": 2122} {"train_loss": -42.107872009277344, "global_step": 256766, "epoch": 2122} {"train_loss": -42.02273178100586, "global_step": 256767, "epoch": 2122} {"train_loss": -42.65219497680664, "global_step": 256768, "epoch": 2122} {"train_loss": -42.739620208740234, "global_step": 256769, "epoch": 2122} {"train_loss": -42.273929595947266, "global_step": 256770, "epoch": 2122} {"train_loss": -42.52290725708008, "global_step": 256771, "epoch": 2122} {"train_loss": -42.492366790771484, "global_step": 256772, "epoch": 2122} {"train_loss": -42.275238037109375, "global_step": 256773, "epoch": 2122} {"train_loss": -42.66471862792969, "global_step": 256774, "epoch": 2122} {"train_loss": -42.53927993774414, "global_step": 256775, "epoch": 2122} {"train_loss": -42.59915542602539, "global_step": 256776, "epoch": 2122} {"train_loss": -43.074302673339844, "global_step": 256777, "epoch": 2122} {"train_loss": -42.17283248901367, "global_step": 256778, "epoch": 2122} {"train_loss": -42.43342208862305, "global_step": 256779, "epoch": 2122} {"train_loss": -42.65131759643555, "global_step": 256780, "epoch": 2122} {"train_loss": -42.86487579345703, "global_step": 256781, "epoch": 2122} {"train_loss": -42.379913330078125, "global_step": 256782, "epoch": 2122} {"train_loss": -42.188228607177734, "global_step": 256783, "epoch": 2122} {"train_loss": -42.18296813964844, "global_step": 256784, "epoch": 2122} {"train_loss": -42.480037689208984, "global_step": 256785, "epoch": 2122} {"train_loss": -42.530818939208984, "global_step": 256786, "epoch": 2122} {"train_loss": -42.352012634277344, "global_step": 256787, "epoch": 2122} {"train_loss": -41.959537506103516, "global_step": 256788, "epoch": 2122} {"train_loss": -42.29856491088867, "global_step": 256789, "epoch": 2122} {"train_loss": -41.84992599487305, "global_step": 256790, "epoch": 2122} {"train_loss": -40.52506637573242, "global_step": 256791, "epoch": 2122} {"train_loss": -41.168975830078125, "global_step": 256792, "epoch": 2122} {"train_loss": -40.79450988769531, "global_step": 256793, "epoch": 2122} {"train_loss": -41.744930267333984, "global_step": 256794, "epoch": 2122} {"train_loss": -40.77300262451172, "global_step": 256795, "epoch": 2122} {"train_loss": -40.78133773803711, "global_step": 256796, "epoch": 2122} {"train_loss": -42.13025665283203, "global_step": 256797, "epoch": 2122} {"train_loss": -41.84275436401367, "global_step": 256798, "epoch": 2122} {"train_loss": -42.479217529296875, "global_step": 256799, "epoch": 2122} {"train_loss": -39.811859130859375, "global_step": 256800, "epoch": 2122} {"train_loss": -40.01510238647461, "global_step": 256801, "epoch": 2122} {"train_loss": -42.32743453979492, "global_step": 256802, "epoch": 2122} {"train_loss": -41.16129684448242, "global_step": 256803, "epoch": 2122} {"train_loss": -39.642581939697266, "global_step": 256804, "epoch": 2122} {"train_loss": -41.423675537109375, "global_step": 256805, "epoch": 2122} {"train_loss": -42.58848571777344, "global_step": 256806, "epoch": 2122} {"train_loss": -41.39011764526367, "global_step": 256807, "epoch": 2122} {"train_loss": -39.97945022583008, "global_step": 256808, "epoch": 2122} {"train_loss": -41.572723388671875, "global_step": 256809, "epoch": 2122} {"train_loss": -42.01143264770508, "global_step": 256810, "epoch": 2122} {"train_loss": -41.81315231323242, "global_step": 256811, "epoch": 2122} {"train_loss": -41.83110046386719, "global_step": 256812, "epoch": 2122} {"train_loss": -42.05535125732422, "global_step": 256813, "epoch": 2122} {"train_loss": -42.32126998901367, "global_step": 256814, "epoch": 2122} {"train_loss": -41.675079345703125, "global_step": 256815, "epoch": 2122} {"train_loss": -42.40869903564453, "global_step": 256816, "epoch": 2122} {"train_loss": -41.6746940612793, "global_step": 256817, "epoch": 2122} {"train_loss": -42.440696716308594, "global_step": 256818, "epoch": 2122} {"train_loss": -42.314083099365234, "global_step": 256819, "epoch": 2122} {"train_loss": -42.09864807128906, "global_step": 256820, "epoch": 2122} {"train_loss": -42.55686569213867, "global_step": 256821, "epoch": 2122} {"train_loss": -41.82387924194336, "global_step": 256822, "epoch": 2122} {"train_loss": -43.15806198120117, "global_step": 256823, "epoch": 2122} {"train_loss": -41.94614791870117, "global_step": 256824, "epoch": 2122} {"train_loss": -42.908199310302734, "global_step": 256825, "epoch": 2122} {"train_loss": -42.45310592651367, "global_step": 256826, "epoch": 2122} {"train_loss": -42.52688217163086, "global_step": 256827, "epoch": 2122} {"train_loss": -42.3898811340332, "global_step": 256828, "epoch": 2122} {"train_loss": -42.76568603515625, "global_step": 256829, "epoch": 2122} {"train_loss": -42.69110870361328, "global_step": 256830, "epoch": 2122} {"train_loss": -43.2015495300293, "global_step": 256831, "epoch": 2122} {"train_loss": -42.17308044433594, "global_step": 256832, "epoch": 2122} {"train_loss": -42.392398834228516, "global_step": 256833, "epoch": 2122} {"train_loss": -41.953208923339844, "global_step": 256834, "epoch": 2122} {"train_loss": -41.98683547973633, "global_step": 256835, "epoch": 2122} {"train_loss": -41.50960922241211, "global_step": 256836, "epoch": 2122} {"train_loss": -42.52067184448242, "global_step": 256837, "epoch": 2122} {"train_loss": -41.34328842163086, "global_step": 256838, "epoch": 2122} {"train_loss": -37.90110397338867, "global_step": 256839, "epoch": 2122} {"train_loss": -33.37601852416992, "global_step": 256840, "epoch": 2122} {"train_loss": -35.419593811035156, "global_step": 256841, "epoch": 2122} {"train_loss": -39.78599166870117, "global_step": 256842, "epoch": 2122} {"train_loss": -39.5238151550293, "global_step": 256843, "epoch": 2122} {"train_loss": -34.382076263427734, "global_step": 256844, "epoch": 2122} {"train_loss": -36.751956939697266, "global_step": 256845, "epoch": 2122} {"train_loss": -38.57867431640625, "global_step": 256846, "epoch": 2122} {"train_loss": -41.18113327026367, "global_step": 256847, "epoch": 2122} {"train_loss": -40.002586364746094, "global_step": 256848, "epoch": 2122} {"train_loss": -40.91805648803711, "global_step": 256849, "epoch": 2122} {"train_loss": -37.48877716064453, "global_step": 256850, "epoch": 2122} {"train_loss": -37.08265686035156, "global_step": 256851, "epoch": 2122} {"train_loss": -40.716094970703125, "global_step": 256852, "epoch": 2122} {"train_loss": -39.61188888549805, "global_step": 256853, "epoch": 2122} {"train_loss": -40.50285339355469, "global_step": 256854, "epoch": 2122} {"train_loss": -40.456417083740234, "global_step": 256855, "epoch": 2122} {"train_loss": -40.58955001831055, "global_step": 256856, "epoch": 2122} {"train_loss": -40.67363739013672, "global_step": 256857, "epoch": 2122} {"train_loss": -33.822139739990234, "global_step": 256858, "epoch": 2122} {"train_loss": -40.46636199951172, "global_step": 256859, "epoch": 2122} {"train_loss": -37.504371643066406, "global_step": 256860, "epoch": 2122} {"train_loss": -40.7011833190918, "global_step": 256861, "epoch": 2122} {"train_loss": -38.28791046142578, "global_step": 256862, "epoch": 2122} {"train_loss": -39.355712890625, "global_step": 256863, "epoch": 2122} {"train_loss": -40.596290588378906, "global_step": 256864, "epoch": 2122} {"train_loss": -41.6772575378418, "global_step": 256865, "epoch": 2122} {"train_loss": -40.18284225463867, "global_step": 256866, "epoch": 2122} {"train_loss": -41.46027755737305, "global_step": 256867, "epoch": 2122} {"train_loss": -41.20107650756836, "global_step": 256868, "epoch": 2122} {"train_loss": -39.729713439941406, "global_step": 256869, "epoch": 2122} {"train_loss": -41.32830810546875, "global_step": 256870, "epoch": 2122} {"train_loss": -39.48707962036133, "global_step": 256871, "epoch": 2122} {"train_loss": -40.020442962646484, "global_step": 256872, "epoch": 2122} {"train_loss": -41.20345687866211, "global_step": 256873, "epoch": 2122} {"train_loss": -37.79359817504883, "global_step": 256874, "epoch": 2122} {"train_loss": -39.63093185424805, "global_step": 256875, "epoch": 2122} {"train_loss": -40.97501754760742, "global_step": 256876, "epoch": 2122} {"train_loss": -39.460880279541016, "global_step": 256877, "epoch": 2122} {"train_loss": -40.751014709472656, "global_step": 256878, "epoch": 2122} {"train_loss": -40.841670989990234, "global_step": 256879, "epoch": 2122} {"train_loss": -41.415103912353516, "global_step": 256880, "epoch": 2122} {"train_loss": -40.90205764770508, "global_step": 256881, "epoch": 2122} {"train_loss": -41.09243850077479, "global_step": 256882, "epoch": 2122, "val_loss": 2612543.25} {"train_loss": -41.46794128417969, "global_step": 256883, "epoch": 2123} {"train_loss": -37.95733642578125, "global_step": 256884, "epoch": 2123} {"train_loss": -40.1291618347168, "global_step": 256885, "epoch": 2123} {"train_loss": -40.9510383605957, "global_step": 256886, "epoch": 2123} {"train_loss": -41.35585403442383, "global_step": 256887, "epoch": 2123} {"train_loss": -38.51005935668945, "global_step": 256888, "epoch": 2123} {"train_loss": -40.62992477416992, "global_step": 256889, "epoch": 2123} {"train_loss": -41.041778564453125, "global_step": 256890, "epoch": 2123} {"train_loss": -39.4437370300293, "global_step": 256891, "epoch": 2123} {"train_loss": -40.017738342285156, "global_step": 256892, "epoch": 2123} {"train_loss": -41.0539665222168, "global_step": 256893, "epoch": 2123} {"train_loss": -41.799957275390625, "global_step": 256894, "epoch": 2123} {"train_loss": -40.77549362182617, "global_step": 256895, "epoch": 2123} {"train_loss": -40.886653900146484, "global_step": 256896, "epoch": 2123} {"train_loss": -40.1042366027832, "global_step": 256897, "epoch": 2123} {"train_loss": -41.23260498046875, "global_step": 256898, "epoch": 2123} {"train_loss": -39.80222702026367, "global_step": 256899, "epoch": 2123} {"train_loss": -37.46364212036133, "global_step": 256900, "epoch": 2123} {"train_loss": -40.32598876953125, "global_step": 256901, "epoch": 2123} {"train_loss": -41.63222122192383, "global_step": 256902, "epoch": 2123} {"train_loss": -37.383060455322266, "global_step": 256903, "epoch": 2123} {"train_loss": -40.64558792114258, "global_step": 256904, "epoch": 2123} {"train_loss": -41.09042739868164, "global_step": 256905, "epoch": 2123} {"train_loss": -40.68024444580078, "global_step": 256906, "epoch": 2123} {"train_loss": -41.22526931762695, "global_step": 256907, "epoch": 2123} {"train_loss": -39.29480743408203, "global_step": 256908, "epoch": 2123} {"train_loss": -40.403358459472656, "global_step": 256909, "epoch": 2123} {"train_loss": -41.662742614746094, "global_step": 256910, "epoch": 2123} {"train_loss": -40.59942626953125, "global_step": 256911, "epoch": 2123} {"train_loss": -41.53110885620117, "global_step": 256912, "epoch": 2123} {"train_loss": -40.0891227722168, "global_step": 256913, "epoch": 2123} {"train_loss": -41.65089797973633, "global_step": 256914, "epoch": 2123} {"train_loss": -41.13301467895508, "global_step": 256915, "epoch": 2123} {"train_loss": -40.79792404174805, "global_step": 256916, "epoch": 2123} {"train_loss": -41.253334045410156, "global_step": 256917, "epoch": 2123} {"train_loss": -40.41090774536133, "global_step": 256918, "epoch": 2123} {"train_loss": -39.463924407958984, "global_step": 256919, "epoch": 2123} {"train_loss": -41.00614547729492, "global_step": 256920, "epoch": 2123} {"train_loss": -41.27005386352539, "global_step": 256921, "epoch": 2123} {"train_loss": -42.07673263549805, "global_step": 256922, "epoch": 2123} {"train_loss": -40.5880241394043, "global_step": 256923, "epoch": 2123} {"train_loss": -42.06977081298828, "global_step": 256924, "epoch": 2123} {"train_loss": -40.587135314941406, "global_step": 256925, "epoch": 2123} {"train_loss": -40.96059036254883, "global_step": 256926, "epoch": 2123} {"train_loss": -41.2126579284668, "global_step": 256927, "epoch": 2123} {"train_loss": -41.3674201965332, "global_step": 256928, "epoch": 2123} {"train_loss": -41.753936767578125, "global_step": 256929, "epoch": 2123} {"train_loss": -42.103816986083984, "global_step": 256930, "epoch": 2123} {"train_loss": -41.614295959472656, "global_step": 256931, "epoch": 2123} {"train_loss": -42.245758056640625, "global_step": 256932, "epoch": 2123} {"train_loss": -40.642921447753906, "global_step": 256933, "epoch": 2123} {"train_loss": -41.72694396972656, "global_step": 256934, "epoch": 2123} {"train_loss": -40.769256591796875, "global_step": 256935, "epoch": 2123} {"train_loss": -42.0279541015625, "global_step": 256936, "epoch": 2123} {"train_loss": -40.6533088684082, "global_step": 256937, "epoch": 2123} {"train_loss": -36.810970306396484, "global_step": 256938, "epoch": 2123} {"train_loss": -41.69302749633789, "global_step": 256939, "epoch": 2123} {"train_loss": -40.66767120361328, "global_step": 256940, "epoch": 2123} {"train_loss": -41.09457015991211, "global_step": 256941, "epoch": 2123} {"train_loss": -40.60640335083008, "global_step": 256942, "epoch": 2123} {"train_loss": -41.1636962890625, "global_step": 256943, "epoch": 2123} {"train_loss": -40.59077072143555, "global_step": 256944, "epoch": 2123} {"train_loss": -35.9172477722168, "global_step": 256945, "epoch": 2123} {"train_loss": -39.73296356201172, "global_step": 256946, "epoch": 2123} {"train_loss": -40.56211471557617, "global_step": 256947, "epoch": 2123} {"train_loss": -40.193241119384766, "global_step": 256948, "epoch": 2123} {"train_loss": -40.89341735839844, "global_step": 256949, "epoch": 2123} {"train_loss": -40.35829544067383, "global_step": 256950, "epoch": 2123} {"train_loss": -39.29199981689453, "global_step": 256951, "epoch": 2123} {"train_loss": -39.54176712036133, "global_step": 256952, "epoch": 2123} {"train_loss": -37.720611572265625, "global_step": 256953, "epoch": 2123} {"train_loss": -39.57194900512695, "global_step": 256954, "epoch": 2123} {"train_loss": -41.111263275146484, "global_step": 256955, "epoch": 2123} {"train_loss": -40.53970718383789, "global_step": 256956, "epoch": 2123} {"train_loss": -39.56092071533203, "global_step": 256957, "epoch": 2123} {"train_loss": -41.198360443115234, "global_step": 256958, "epoch": 2123} {"train_loss": -40.63824462890625, "global_step": 256959, "epoch": 2123} {"train_loss": -41.63421630859375, "global_step": 256960, "epoch": 2123} {"train_loss": -40.14575958251953, "global_step": 256961, "epoch": 2123} {"train_loss": -41.92513656616211, "global_step": 256962, "epoch": 2123} {"train_loss": -41.06958770751953, "global_step": 256963, "epoch": 2123} {"train_loss": -41.33396530151367, "global_step": 256964, "epoch": 2123} {"train_loss": -41.843299865722656, "global_step": 256965, "epoch": 2123} {"train_loss": -40.8149299621582, "global_step": 256966, "epoch": 2123} {"train_loss": -42.010257720947266, "global_step": 256967, "epoch": 2123} {"train_loss": -40.0621452331543, "global_step": 256968, "epoch": 2123} {"train_loss": -41.55088806152344, "global_step": 256969, "epoch": 2123} {"train_loss": -42.017940521240234, "global_step": 256970, "epoch": 2123} {"train_loss": -41.30424118041992, "global_step": 256971, "epoch": 2123} {"train_loss": -39.3768310546875, "global_step": 256972, "epoch": 2123} {"train_loss": -41.797061920166016, "global_step": 256973, "epoch": 2123} {"train_loss": -42.26253128051758, "global_step": 256974, "epoch": 2123} {"train_loss": -41.75740051269531, "global_step": 256975, "epoch": 2123} {"train_loss": -41.589080810546875, "global_step": 256976, "epoch": 2123} {"train_loss": -41.4342041015625, "global_step": 256977, "epoch": 2123} {"train_loss": -41.808902740478516, "global_step": 256978, "epoch": 2123} {"train_loss": -41.621795654296875, "global_step": 256979, "epoch": 2123} {"train_loss": -40.74983215332031, "global_step": 256980, "epoch": 2123} {"train_loss": -41.065826416015625, "global_step": 256981, "epoch": 2123} {"train_loss": -41.4387321472168, "global_step": 256982, "epoch": 2123} {"train_loss": -42.30125427246094, "global_step": 256983, "epoch": 2123} {"train_loss": -41.61799240112305, "global_step": 256984, "epoch": 2123} {"train_loss": -41.64759063720703, "global_step": 256985, "epoch": 2123} {"train_loss": -41.64944076538086, "global_step": 256986, "epoch": 2123} {"train_loss": -41.299171447753906, "global_step": 256987, "epoch": 2123} {"train_loss": -42.295562744140625, "global_step": 256988, "epoch": 2123} {"train_loss": -42.498477935791016, "global_step": 256989, "epoch": 2123} {"train_loss": -42.3155517578125, "global_step": 256990, "epoch": 2123} {"train_loss": -42.37358474731445, "global_step": 256991, "epoch": 2123} {"train_loss": -41.740478515625, "global_step": 256992, "epoch": 2123} {"train_loss": -42.036373138427734, "global_step": 256993, "epoch": 2123} {"train_loss": -41.721893310546875, "global_step": 256994, "epoch": 2123} {"train_loss": -42.550270080566406, "global_step": 256995, "epoch": 2123} {"train_loss": -43.049434661865234, "global_step": 256996, "epoch": 2123} {"train_loss": -42.51699447631836, "global_step": 256997, "epoch": 2123} {"train_loss": -42.50138473510742, "global_step": 256998, "epoch": 2123} {"train_loss": -42.12165069580078, "global_step": 256999, "epoch": 2123} {"train_loss": -42.058135986328125, "global_step": 257000, "epoch": 2123} {"train_loss": -41.855438232421875, "global_step": 257001, "epoch": 2123} {"train_loss": -42.44626235961914, "global_step": 257002, "epoch": 2123} {"train_loss": -40.954710274688466, "global_step": 257003, "epoch": 2123, "val_loss": 2557147.75} {"train_loss": -41.507911682128906, "global_step": 257004, "epoch": 2124} {"train_loss": -41.175086975097656, "global_step": 257005, "epoch": 2124} {"train_loss": -42.680355072021484, "global_step": 257006, "epoch": 2124} {"train_loss": -42.235172271728516, "global_step": 257007, "epoch": 2124} {"train_loss": -42.064231872558594, "global_step": 257008, "epoch": 2124} {"train_loss": -42.04864501953125, "global_step": 257009, "epoch": 2124} {"train_loss": -41.655338287353516, "global_step": 257010, "epoch": 2124} {"train_loss": -40.854591369628906, "global_step": 257011, "epoch": 2124} {"train_loss": -40.23503494262695, "global_step": 257012, "epoch": 2124} {"train_loss": -38.76582717895508, "global_step": 257013, "epoch": 2124} {"train_loss": -38.133811950683594, "global_step": 257014, "epoch": 2124} {"train_loss": -36.97954177856445, "global_step": 257015, "epoch": 2124} {"train_loss": -38.92200469970703, "global_step": 257016, "epoch": 2124} {"train_loss": -41.69771957397461, "global_step": 257017, "epoch": 2124} {"train_loss": -41.67306900024414, "global_step": 257018, "epoch": 2124} {"train_loss": -40.187862396240234, "global_step": 257019, "epoch": 2124} {"train_loss": -42.05502700805664, "global_step": 257020, "epoch": 2124} {"train_loss": -41.988826751708984, "global_step": 257021, "epoch": 2124} {"train_loss": -41.0495719909668, "global_step": 257022, "epoch": 2124} {"train_loss": -41.204803466796875, "global_step": 257023, "epoch": 2124} {"train_loss": -42.25666427612305, "global_step": 257024, "epoch": 2124} {"train_loss": -40.30241775512695, "global_step": 257025, "epoch": 2124} {"train_loss": -41.58822250366211, "global_step": 257026, "epoch": 2124} {"train_loss": -41.96208953857422, "global_step": 257027, "epoch": 2124} {"train_loss": -42.203121185302734, "global_step": 257028, "epoch": 2124} {"train_loss": -41.64295196533203, "global_step": 257029, "epoch": 2124} {"train_loss": -42.26310348510742, "global_step": 257030, "epoch": 2124} {"train_loss": -40.8668327331543, "global_step": 257031, "epoch": 2124} {"train_loss": -40.76807403564453, "global_step": 257032, "epoch": 2124} {"train_loss": -42.80082321166992, "global_step": 257033, "epoch": 2124} {"train_loss": -42.240657806396484, "global_step": 257034, "epoch": 2124} {"train_loss": -42.096126556396484, "global_step": 257035, "epoch": 2124} {"train_loss": -42.61904525756836, "global_step": 257036, "epoch": 2124} {"train_loss": -41.685546875, "global_step": 257037, "epoch": 2124} {"train_loss": -40.93457794189453, "global_step": 257038, "epoch": 2124} {"train_loss": -42.31707763671875, "global_step": 257039, "epoch": 2124} {"train_loss": -41.94704818725586, "global_step": 257040, "epoch": 2124} {"train_loss": -41.822608947753906, "global_step": 257041, "epoch": 2124} {"train_loss": -41.700740814208984, "global_step": 257042, "epoch": 2124} {"train_loss": -41.261234283447266, "global_step": 257043, "epoch": 2124} {"train_loss": -42.464412689208984, "global_step": 257044, "epoch": 2124} {"train_loss": -41.942264556884766, "global_step": 257045, "epoch": 2124} {"train_loss": -41.32145690917969, "global_step": 257046, "epoch": 2124} {"train_loss": -41.2855110168457, "global_step": 257047, "epoch": 2124} {"train_loss": -41.600887298583984, "global_step": 257048, "epoch": 2124} {"train_loss": -42.7929573059082, "global_step": 257049, "epoch": 2124} {"train_loss": -42.156715393066406, "global_step": 257050, "epoch": 2124} {"train_loss": -42.37340545654297, "global_step": 257051, "epoch": 2124} {"train_loss": -42.11376190185547, "global_step": 257052, "epoch": 2124} {"train_loss": -41.37375259399414, "global_step": 257053, "epoch": 2124} {"train_loss": -40.93815994262695, "global_step": 257054, "epoch": 2124} {"train_loss": -41.38774871826172, "global_step": 257055, "epoch": 2124} {"train_loss": -42.95396423339844, "global_step": 257056, "epoch": 2124} {"train_loss": -36.50445556640625, "global_step": 257057, "epoch": 2124} {"train_loss": -40.55476379394531, "global_step": 257058, "epoch": 2124} {"train_loss": -42.11491775512695, "global_step": 257059, "epoch": 2124} {"train_loss": -42.03948211669922, "global_step": 257060, "epoch": 2124} {"train_loss": -42.577999114990234, "global_step": 257061, "epoch": 2124} {"train_loss": -41.82456588745117, "global_step": 257062, "epoch": 2124} {"train_loss": -42.15671920776367, "global_step": 257063, "epoch": 2124} {"train_loss": -42.22529220581055, "global_step": 257064, "epoch": 2124} {"train_loss": -42.4982795715332, "global_step": 257065, "epoch": 2124} {"train_loss": -42.18259811401367, "global_step": 257066, "epoch": 2124} {"train_loss": -42.21466064453125, "global_step": 257067, "epoch": 2124} {"train_loss": -42.460655212402344, "global_step": 257068, "epoch": 2124} {"train_loss": -42.45985412597656, "global_step": 257069, "epoch": 2124} {"train_loss": -42.6236457824707, "global_step": 257070, "epoch": 2124} {"train_loss": -42.50931930541992, "global_step": 257071, "epoch": 2124} {"train_loss": -42.17751693725586, "global_step": 257072, "epoch": 2124} {"train_loss": -42.368404388427734, "global_step": 257073, "epoch": 2124} {"train_loss": -42.683719635009766, "global_step": 257074, "epoch": 2124} {"train_loss": -42.89469528198242, "global_step": 257075, "epoch": 2124} {"train_loss": -42.090492248535156, "global_step": 257076, "epoch": 2124} {"train_loss": -42.24261474609375, "global_step": 257077, "epoch": 2124} {"train_loss": -40.744564056396484, "global_step": 257078, "epoch": 2124} {"train_loss": -42.219608306884766, "global_step": 257079, "epoch": 2124} {"train_loss": -42.23114776611328, "global_step": 257080, "epoch": 2124} {"train_loss": -42.07906723022461, "global_step": 257081, "epoch": 2124} {"train_loss": -42.56964874267578, "global_step": 257082, "epoch": 2124} {"train_loss": -42.52471923828125, "global_step": 257083, "epoch": 2124} {"train_loss": -41.79629135131836, "global_step": 257084, "epoch": 2124} {"train_loss": -42.520870208740234, "global_step": 257085, "epoch": 2124} {"train_loss": -42.94259262084961, "global_step": 257086, "epoch": 2124} {"train_loss": -41.38151168823242, "global_step": 257087, "epoch": 2124} {"train_loss": -41.58448028564453, "global_step": 257088, "epoch": 2124} {"train_loss": -42.573760986328125, "global_step": 257089, "epoch": 2124} {"train_loss": -41.68599319458008, "global_step": 257090, "epoch": 2124} {"train_loss": -40.37478256225586, "global_step": 257091, "epoch": 2124} {"train_loss": -37.55249786376953, "global_step": 257092, "epoch": 2124} {"train_loss": -38.9397087097168, "global_step": 257093, "epoch": 2124} {"train_loss": -39.55275344848633, "global_step": 257094, "epoch": 2124} {"train_loss": -40.263179779052734, "global_step": 257095, "epoch": 2124} {"train_loss": -39.846858978271484, "global_step": 257096, "epoch": 2124} {"train_loss": -41.539268493652344, "global_step": 257097, "epoch": 2124} {"train_loss": -39.68922805786133, "global_step": 257098, "epoch": 2124} {"train_loss": -41.379756927490234, "global_step": 257099, "epoch": 2124} {"train_loss": -41.72657775878906, "global_step": 257100, "epoch": 2124} {"train_loss": -39.85424041748047, "global_step": 257101, "epoch": 2124} {"train_loss": -41.61334991455078, "global_step": 257102, "epoch": 2124} {"train_loss": -40.87256622314453, "global_step": 257103, "epoch": 2124} {"train_loss": -41.96485137939453, "global_step": 257104, "epoch": 2124} {"train_loss": -41.899593353271484, "global_step": 257105, "epoch": 2124} {"train_loss": -41.86605453491211, "global_step": 257106, "epoch": 2124} {"train_loss": -42.11234664916992, "global_step": 257107, "epoch": 2124} {"train_loss": -41.530330657958984, "global_step": 257108, "epoch": 2124} {"train_loss": -42.38058090209961, "global_step": 257109, "epoch": 2124} {"train_loss": -41.64427947998047, "global_step": 257110, "epoch": 2124} {"train_loss": -42.15360641479492, "global_step": 257111, "epoch": 2124} {"train_loss": -42.28375244140625, "global_step": 257112, "epoch": 2124} {"train_loss": -41.11909866333008, "global_step": 257113, "epoch": 2124} {"train_loss": -41.010772705078125, "global_step": 257114, "epoch": 2124} {"train_loss": -39.71604537963867, "global_step": 257115, "epoch": 2124} {"train_loss": -39.802860260009766, "global_step": 257116, "epoch": 2124} {"train_loss": -41.029415130615234, "global_step": 257117, "epoch": 2124} {"train_loss": -41.08098602294922, "global_step": 257118, "epoch": 2124} {"train_loss": -41.59734344482422, "global_step": 257119, "epoch": 2124} {"train_loss": -40.72724533081055, "global_step": 257120, "epoch": 2124} {"train_loss": -41.158058166503906, "global_step": 257121, "epoch": 2124} {"train_loss": -42.01755905151367, "global_step": 257122, "epoch": 2124} {"train_loss": -41.42129135131836, "global_step": 257123, "epoch": 2124} {"train_loss": -41.47599095746505, "global_step": 257124, "epoch": 2124, "val_loss": 2527880.25} {"train_loss": -41.657859802246094, "global_step": 257125, "epoch": 2125} {"train_loss": -41.905216217041016, "global_step": 257126, "epoch": 2125} {"train_loss": -42.190223693847656, "global_step": 257127, "epoch": 2125} {"train_loss": -42.512245178222656, "global_step": 257128, "epoch": 2125} {"train_loss": -41.92991256713867, "global_step": 257129, "epoch": 2125} {"train_loss": -42.53256607055664, "global_step": 257130, "epoch": 2125} {"train_loss": -42.54172134399414, "global_step": 257131, "epoch": 2125} {"train_loss": -42.65544128417969, "global_step": 257132, "epoch": 2125} {"train_loss": -42.04899215698242, "global_step": 257133, "epoch": 2125} {"train_loss": -42.27231979370117, "global_step": 257134, "epoch": 2125} {"train_loss": -42.713191986083984, "global_step": 257135, "epoch": 2125} {"train_loss": -43.03937911987305, "global_step": 257136, "epoch": 2125} {"train_loss": -42.61869430541992, "global_step": 257137, "epoch": 2125} {"train_loss": -42.307838439941406, "global_step": 257138, "epoch": 2125} {"train_loss": -42.5181770324707, "global_step": 257139, "epoch": 2125} {"train_loss": -42.559364318847656, "global_step": 257140, "epoch": 2125} {"train_loss": -42.21600341796875, "global_step": 257141, "epoch": 2125} {"train_loss": -42.678035736083984, "global_step": 257142, "epoch": 2125} {"train_loss": -42.319427490234375, "global_step": 257143, "epoch": 2125} {"train_loss": -41.443397521972656, "global_step": 257144, "epoch": 2125} {"train_loss": -41.5961799621582, "global_step": 257145, "epoch": 2125} {"train_loss": -42.534603118896484, "global_step": 257146, "epoch": 2125} {"train_loss": -42.78181838989258, "global_step": 257147, "epoch": 2125} {"train_loss": -41.343353271484375, "global_step": 257148, "epoch": 2125} {"train_loss": -42.83443069458008, "global_step": 257149, "epoch": 2125} {"train_loss": -42.729103088378906, "global_step": 257150, "epoch": 2125} {"train_loss": -42.16953659057617, "global_step": 257151, "epoch": 2125} {"train_loss": -42.304054260253906, "global_step": 257152, "epoch": 2125} {"train_loss": -42.666481018066406, "global_step": 257153, "epoch": 2125} {"train_loss": -40.850337982177734, "global_step": 257154, "epoch": 2125} {"train_loss": -41.96116256713867, "global_step": 257155, "epoch": 2125} {"train_loss": -42.62217330932617, "global_step": 257156, "epoch": 2125} {"train_loss": -41.50771713256836, "global_step": 257157, "epoch": 2125} {"train_loss": -41.95961380004883, "global_step": 257158, "epoch": 2125} {"train_loss": -42.05160903930664, "global_step": 257159, "epoch": 2125} {"train_loss": -42.7262077331543, "global_step": 257160, "epoch": 2125} {"train_loss": -42.41558837890625, "global_step": 257161, "epoch": 2125} {"train_loss": -41.94245910644531, "global_step": 257162, "epoch": 2125} {"train_loss": -41.50521469116211, "global_step": 257163, "epoch": 2125} {"train_loss": -42.74241256713867, "global_step": 257164, "epoch": 2125} {"train_loss": -40.95314407348633, "global_step": 257165, "epoch": 2125} {"train_loss": -40.96125411987305, "global_step": 257166, "epoch": 2125} {"train_loss": -42.09041976928711, "global_step": 257167, "epoch": 2125} {"train_loss": -42.29045486450195, "global_step": 257168, "epoch": 2125} {"train_loss": -41.3945198059082, "global_step": 257169, "epoch": 2125} {"train_loss": -41.38490676879883, "global_step": 257170, "epoch": 2125} {"train_loss": -41.91286849975586, "global_step": 257171, "epoch": 2125} {"train_loss": -42.634864807128906, "global_step": 257172, "epoch": 2125} {"train_loss": -42.266021728515625, "global_step": 257173, "epoch": 2125} {"train_loss": -41.77875900268555, "global_step": 257174, "epoch": 2125} {"train_loss": -40.885929107666016, "global_step": 257175, "epoch": 2125} {"train_loss": -42.03641891479492, "global_step": 257176, "epoch": 2125} {"train_loss": -42.674842834472656, "global_step": 257177, "epoch": 2125} {"train_loss": -40.64268112182617, "global_step": 257178, "epoch": 2125} {"train_loss": -43.14051055908203, "global_step": 257179, "epoch": 2125} {"train_loss": -42.7050666809082, "global_step": 257180, "epoch": 2125} {"train_loss": -42.3673210144043, "global_step": 257181, "epoch": 2125} {"train_loss": -42.55713653564453, "global_step": 257182, "epoch": 2125} {"train_loss": -43.11625671386719, "global_step": 257183, "epoch": 2125} {"train_loss": -42.72159194946289, "global_step": 257184, "epoch": 2125} {"train_loss": -42.69841003417969, "global_step": 257185, "epoch": 2125} {"train_loss": -43.31597137451172, "global_step": 257186, "epoch": 2125} {"train_loss": -42.714599609375, "global_step": 257187, "epoch": 2125} {"train_loss": -43.089656829833984, "global_step": 257188, "epoch": 2125} {"train_loss": -43.055885314941406, "global_step": 257189, "epoch": 2125} {"train_loss": -42.38363265991211, "global_step": 257190, "epoch": 2125} {"train_loss": -41.82209396362305, "global_step": 257191, "epoch": 2125} {"train_loss": -42.24055099487305, "global_step": 257192, "epoch": 2125} {"train_loss": -43.50153350830078, "global_step": 257193, "epoch": 2125} {"train_loss": -41.74470901489258, "global_step": 257194, "epoch": 2125} {"train_loss": -38.43202590942383, "global_step": 257195, "epoch": 2125} {"train_loss": -36.7517204284668, "global_step": 257196, "epoch": 2125} {"train_loss": -40.193668365478516, "global_step": 257197, "epoch": 2125} {"train_loss": -38.79301834106445, "global_step": 257198, "epoch": 2125} {"train_loss": -40.18437957763672, "global_step": 257199, "epoch": 2125} {"train_loss": -38.2337646484375, "global_step": 257200, "epoch": 2125} {"train_loss": -38.57895278930664, "global_step": 257201, "epoch": 2125} {"train_loss": -31.159595489501953, "global_step": 257202, "epoch": 2125} {"train_loss": -39.84708786010742, "global_step": 257203, "epoch": 2125} {"train_loss": -33.93531799316406, "global_step": 257204, "epoch": 2125} {"train_loss": -39.06964111328125, "global_step": 257205, "epoch": 2125} {"train_loss": -27.487884521484375, "global_step": 257206, "epoch": 2125} {"train_loss": -40.30173110961914, "global_step": 257207, "epoch": 2125} {"train_loss": -38.116512298583984, "global_step": 257208, "epoch": 2125} {"train_loss": -40.22455596923828, "global_step": 257209, "epoch": 2125} {"train_loss": -30.77311134338379, "global_step": 257210, "epoch": 2125} {"train_loss": -26.6246395111084, "global_step": 257211, "epoch": 2125} {"train_loss": -37.885406494140625, "global_step": 257212, "epoch": 2125} {"train_loss": -38.705169677734375, "global_step": 257213, "epoch": 2125} {"train_loss": -34.340572357177734, "global_step": 257214, "epoch": 2125} {"train_loss": -37.9545783996582, "global_step": 257215, "epoch": 2125} {"train_loss": -37.22401809692383, "global_step": 257216, "epoch": 2125} {"train_loss": -33.641963958740234, "global_step": 257217, "epoch": 2125} {"train_loss": -35.41071319580078, "global_step": 257218, "epoch": 2125} {"train_loss": -38.04827880859375, "global_step": 257219, "epoch": 2125} {"train_loss": -27.6949462890625, "global_step": 257220, "epoch": 2125} {"train_loss": -34.63917541503906, "global_step": 257221, "epoch": 2125} {"train_loss": -37.32682800292969, "global_step": 257222, "epoch": 2125} {"train_loss": -31.988224029541016, "global_step": 257223, "epoch": 2125} {"train_loss": -22.773717880249023, "global_step": 257224, "epoch": 2125} {"train_loss": -37.41187286376953, "global_step": 257225, "epoch": 2125} {"train_loss": -39.54536819458008, "global_step": 257226, "epoch": 2125} {"train_loss": -28.786773681640625, "global_step": 257227, "epoch": 2125} {"train_loss": -37.73929977416992, "global_step": 257228, "epoch": 2125} {"train_loss": -27.25843620300293, "global_step": 257229, "epoch": 2125} {"train_loss": -34.93379592895508, "global_step": 257230, "epoch": 2125} {"train_loss": -35.416786193847656, "global_step": 257231, "epoch": 2125} {"train_loss": -34.31382369995117, "global_step": 257232, "epoch": 2125} {"train_loss": -31.978321075439453, "global_step": 257233, "epoch": 2125} {"train_loss": -32.8284912109375, "global_step": 257234, "epoch": 2125} {"train_loss": -37.18873977661133, "global_step": 257235, "epoch": 2125} {"train_loss": -37.01127243041992, "global_step": 257236, "epoch": 2125} {"train_loss": -38.267486572265625, "global_step": 257237, "epoch": 2125} {"train_loss": -35.71571350097656, "global_step": 257238, "epoch": 2125} {"train_loss": -38.786922454833984, "global_step": 257239, "epoch": 2125} {"train_loss": -37.59727096557617, "global_step": 257240, "epoch": 2125} {"train_loss": -35.71919631958008, "global_step": 257241, "epoch": 2125} {"train_loss": -36.53377914428711, "global_step": 257242, "epoch": 2125} {"train_loss": -35.65361404418945, "global_step": 257243, "epoch": 2125} {"train_loss": -38.38860321044922, "global_step": 257244, "epoch": 2125} {"train_loss": -39.43894788253406, "global_step": 257245, "epoch": 2125, "val_loss": 3438324.75} {"train_loss": -37.47981643676758, "global_step": 257246, "epoch": 2126} {"train_loss": -37.450469970703125, "global_step": 257247, "epoch": 2126} {"train_loss": -36.0446891784668, "global_step": 257248, "epoch": 2126} {"train_loss": -36.56820297241211, "global_step": 257249, "epoch": 2126} {"train_loss": -38.649166107177734, "global_step": 257250, "epoch": 2126} {"train_loss": -37.95098876953125, "global_step": 257251, "epoch": 2126} {"train_loss": -38.479644775390625, "global_step": 257252, "epoch": 2126} {"train_loss": -38.50757598876953, "global_step": 257253, "epoch": 2126} {"train_loss": -37.43589401245117, "global_step": 257254, "epoch": 2126} {"train_loss": -38.94668197631836, "global_step": 257255, "epoch": 2126} {"train_loss": -39.28288650512695, "global_step": 257256, "epoch": 2126} {"train_loss": -38.528358459472656, "global_step": 257257, "epoch": 2126} {"train_loss": -39.10044860839844, "global_step": 257258, "epoch": 2126} {"train_loss": -37.71936798095703, "global_step": 257259, "epoch": 2126} {"train_loss": -39.13075637817383, "global_step": 257260, "epoch": 2126} {"train_loss": -38.52900314331055, "global_step": 257261, "epoch": 2126} {"train_loss": -39.40217590332031, "global_step": 257262, "epoch": 2126} {"train_loss": -39.879634857177734, "global_step": 257263, "epoch": 2126} {"train_loss": -38.82355499267578, "global_step": 257264, "epoch": 2126} {"train_loss": -39.605831146240234, "global_step": 257265, "epoch": 2126} {"train_loss": -39.68259811401367, "global_step": 257266, "epoch": 2126} {"train_loss": -39.827884674072266, "global_step": 257267, "epoch": 2126} {"train_loss": -40.048736572265625, "global_step": 257268, "epoch": 2126} {"train_loss": -40.17213439941406, "global_step": 257269, "epoch": 2126} {"train_loss": -39.78023910522461, "global_step": 257270, "epoch": 2126} {"train_loss": -39.74090576171875, "global_step": 257271, "epoch": 2126} {"train_loss": -40.20792770385742, "global_step": 257272, "epoch": 2126} {"train_loss": -40.167503356933594, "global_step": 257273, "epoch": 2126} {"train_loss": -40.06807327270508, "global_step": 257274, "epoch": 2126} {"train_loss": -40.19669723510742, "global_step": 257275, "epoch": 2126} {"train_loss": -40.13471221923828, "global_step": 257276, "epoch": 2126} {"train_loss": -39.912078857421875, "global_step": 257277, "epoch": 2126} {"train_loss": -39.425228118896484, "global_step": 257278, "epoch": 2126} {"train_loss": -39.458595275878906, "global_step": 257279, "epoch": 2126} {"train_loss": -40.733673095703125, "global_step": 257280, "epoch": 2126} {"train_loss": -39.526668548583984, "global_step": 257281, "epoch": 2126} {"train_loss": -39.23602294921875, "global_step": 257282, "epoch": 2126} {"train_loss": -40.75584030151367, "global_step": 257283, "epoch": 2126} {"train_loss": -40.47370529174805, "global_step": 257284, "epoch": 2126} {"train_loss": -40.439796447753906, "global_step": 257285, "epoch": 2126} {"train_loss": -40.66504669189453, "global_step": 257286, "epoch": 2126} {"train_loss": -40.58822250366211, "global_step": 257287, "epoch": 2126} {"train_loss": -40.9176025390625, "global_step": 257288, "epoch": 2126} {"train_loss": -40.942256927490234, "global_step": 257289, "epoch": 2126} {"train_loss": -41.16282272338867, "global_step": 257290, "epoch": 2126} {"train_loss": -40.647586822509766, "global_step": 257291, "epoch": 2126} {"train_loss": -40.828369140625, "global_step": 257292, "epoch": 2126} {"train_loss": -40.628902435302734, "global_step": 257293, "epoch": 2126} {"train_loss": -40.63835144042969, "global_step": 257294, "epoch": 2126} {"train_loss": -40.43753433227539, "global_step": 257295, "epoch": 2126} {"train_loss": -41.526493072509766, "global_step": 257296, "epoch": 2126} {"train_loss": -41.32977294921875, "global_step": 257297, "epoch": 2126} {"train_loss": -40.68110656738281, "global_step": 257298, "epoch": 2126} {"train_loss": -40.203712463378906, "global_step": 257299, "epoch": 2126} {"train_loss": -40.73728942871094, "global_step": 257300, "epoch": 2126} {"train_loss": -41.07966232299805, "global_step": 257301, "epoch": 2126} {"train_loss": -40.25630187988281, "global_step": 257302, "epoch": 2126} {"train_loss": -40.37717819213867, "global_step": 257303, "epoch": 2126} {"train_loss": -40.40617752075195, "global_step": 257304, "epoch": 2126} {"train_loss": -41.162227630615234, "global_step": 257305, "epoch": 2126} {"train_loss": -41.6026611328125, "global_step": 257306, "epoch": 2126} {"train_loss": -40.42320251464844, "global_step": 257307, "epoch": 2126} {"train_loss": -41.23698806762695, "global_step": 257308, "epoch": 2126} {"train_loss": -40.81563949584961, "global_step": 257309, "epoch": 2126} {"train_loss": -41.74065399169922, "global_step": 257310, "epoch": 2126} {"train_loss": -41.61574172973633, "global_step": 257311, "epoch": 2126} {"train_loss": -41.0233039855957, "global_step": 257312, "epoch": 2126} {"train_loss": -41.481201171875, "global_step": 257313, "epoch": 2126} {"train_loss": -41.44017791748047, "global_step": 257314, "epoch": 2126} {"train_loss": -41.14929962158203, "global_step": 257315, "epoch": 2126} {"train_loss": -41.408164978027344, "global_step": 257316, "epoch": 2126} {"train_loss": -41.02293014526367, "global_step": 257317, "epoch": 2126} {"train_loss": -41.634071350097656, "global_step": 257318, "epoch": 2126} {"train_loss": -41.44059371948242, "global_step": 257319, "epoch": 2126} {"train_loss": -42.03007888793945, "global_step": 257320, "epoch": 2126} {"train_loss": -41.226783752441406, "global_step": 257321, "epoch": 2126} {"train_loss": -41.08478927612305, "global_step": 257322, "epoch": 2126} {"train_loss": -41.21677780151367, "global_step": 257323, "epoch": 2126} {"train_loss": -41.3715934753418, "global_step": 257324, "epoch": 2126} {"train_loss": -41.94082260131836, "global_step": 257325, "epoch": 2126} {"train_loss": -41.075599670410156, "global_step": 257326, "epoch": 2126} {"train_loss": -41.559322357177734, "global_step": 257327, "epoch": 2126} {"train_loss": -42.184791564941406, "global_step": 257328, "epoch": 2126} {"train_loss": -41.60414505004883, "global_step": 257329, "epoch": 2126} {"train_loss": -41.00591278076172, "global_step": 257330, "epoch": 2126} {"train_loss": -41.50489044189453, "global_step": 257331, "epoch": 2126} {"train_loss": -41.8697509765625, "global_step": 257332, "epoch": 2126} {"train_loss": -41.45000457763672, "global_step": 257333, "epoch": 2126} {"train_loss": -42.076988220214844, "global_step": 257334, "epoch": 2126} {"train_loss": -42.040626525878906, "global_step": 257335, "epoch": 2126} {"train_loss": -41.856536865234375, "global_step": 257336, "epoch": 2126} {"train_loss": -42.2683219909668, "global_step": 257337, "epoch": 2126} {"train_loss": -41.60782241821289, "global_step": 257338, "epoch": 2126} {"train_loss": -39.67755126953125, "global_step": 257339, "epoch": 2126} {"train_loss": -41.92374801635742, "global_step": 257340, "epoch": 2126} {"train_loss": -41.385406494140625, "global_step": 257341, "epoch": 2126} {"train_loss": -41.65481185913086, "global_step": 257342, "epoch": 2126} {"train_loss": -41.953330993652344, "global_step": 257343, "epoch": 2126} {"train_loss": -41.37671661376953, "global_step": 257344, "epoch": 2126} {"train_loss": -42.58845138549805, "global_step": 257345, "epoch": 2126} {"train_loss": -42.08958053588867, "global_step": 257346, "epoch": 2126} {"train_loss": -41.704833984375, "global_step": 257347, "epoch": 2126} {"train_loss": -42.05726623535156, "global_step": 257348, "epoch": 2126} {"train_loss": -40.4088249206543, "global_step": 257349, "epoch": 2126} {"train_loss": -41.937252044677734, "global_step": 257350, "epoch": 2126} {"train_loss": -41.58353805541992, "global_step": 257351, "epoch": 2126} {"train_loss": -42.240787506103516, "global_step": 257352, "epoch": 2126} {"train_loss": -41.87811279296875, "global_step": 257353, "epoch": 2126} {"train_loss": -42.15327072143555, "global_step": 257354, "epoch": 2126} {"train_loss": -42.15532302856445, "global_step": 257355, "epoch": 2126} {"train_loss": -41.50821304321289, "global_step": 257356, "epoch": 2126} {"train_loss": -42.4171257019043, "global_step": 257357, "epoch": 2126} {"train_loss": -41.99079513549805, "global_step": 257358, "epoch": 2126} {"train_loss": -41.8133544921875, "global_step": 257359, "epoch": 2126} {"train_loss": -42.127140045166016, "global_step": 257360, "epoch": 2126} {"train_loss": -42.43414306640625, "global_step": 257361, "epoch": 2126} {"train_loss": -41.80991744995117, "global_step": 257362, "epoch": 2126} {"train_loss": -42.3864631652832, "global_step": 257363, "epoch": 2126} {"train_loss": -41.2564811706543, "global_step": 257364, "epoch": 2126} {"train_loss": -40.705562591552734, "global_step": 257365, "epoch": 2126} {"train_loss": -40.662356037738896, "global_step": 257366, "epoch": 2126, "val_loss": 2677732.0} {"train_loss": -42.38385009765625, "global_step": 257367, "epoch": 2127} {"train_loss": -42.22427749633789, "global_step": 257368, "epoch": 2127} {"train_loss": -42.285030364990234, "global_step": 257369, "epoch": 2127} {"train_loss": -41.13861083984375, "global_step": 257370, "epoch": 2127} {"train_loss": -42.34580612182617, "global_step": 257371, "epoch": 2127} {"train_loss": -41.876033782958984, "global_step": 257372, "epoch": 2127} {"train_loss": -42.693843841552734, "global_step": 257373, "epoch": 2127} {"train_loss": -40.740211486816406, "global_step": 257374, "epoch": 2127} {"train_loss": -41.59942626953125, "global_step": 257375, "epoch": 2127} {"train_loss": -38.87936019897461, "global_step": 257376, "epoch": 2127} {"train_loss": -32.67292404174805, "global_step": 257377, "epoch": 2127} {"train_loss": -28.942773818969727, "global_step": 257378, "epoch": 2127} {"train_loss": -37.20695495605469, "global_step": 257379, "epoch": 2127} {"train_loss": -41.92926788330078, "global_step": 257380, "epoch": 2127} {"train_loss": -35.17641830444336, "global_step": 257381, "epoch": 2127} {"train_loss": -32.316322326660156, "global_step": 257382, "epoch": 2127} {"train_loss": -40.509822845458984, "global_step": 257383, "epoch": 2127} {"train_loss": -40.843482971191406, "global_step": 257384, "epoch": 2127} {"train_loss": -39.074214935302734, "global_step": 257385, "epoch": 2127} {"train_loss": -41.61429977416992, "global_step": 257386, "epoch": 2127} {"train_loss": -36.871158599853516, "global_step": 257387, "epoch": 2127} {"train_loss": -41.4460563659668, "global_step": 257388, "epoch": 2127} {"train_loss": -40.601619720458984, "global_step": 257389, "epoch": 2127} {"train_loss": -41.41740036010742, "global_step": 257390, "epoch": 2127} {"train_loss": -40.6951904296875, "global_step": 257391, "epoch": 2127} {"train_loss": -40.254817962646484, "global_step": 257392, "epoch": 2127} {"train_loss": -41.2989616394043, "global_step": 257393, "epoch": 2127} {"train_loss": -40.849849700927734, "global_step": 257394, "epoch": 2127} {"train_loss": -41.84113693237305, "global_step": 257395, "epoch": 2127} {"train_loss": -38.09859085083008, "global_step": 257396, "epoch": 2127} {"train_loss": -41.606239318847656, "global_step": 257397, "epoch": 2127} {"train_loss": -40.37960433959961, "global_step": 257398, "epoch": 2127} {"train_loss": -39.143306732177734, "global_step": 257399, "epoch": 2127} {"train_loss": -41.00090789794922, "global_step": 257400, "epoch": 2127} {"train_loss": -41.609710693359375, "global_step": 257401, "epoch": 2127} {"train_loss": -40.38692092895508, "global_step": 257402, "epoch": 2127} {"train_loss": -41.506629943847656, "global_step": 257403, "epoch": 2127} {"train_loss": -41.23887252807617, "global_step": 257404, "epoch": 2127} {"train_loss": -41.203102111816406, "global_step": 257405, "epoch": 2127} {"train_loss": -41.57936096191406, "global_step": 257406, "epoch": 2127} {"train_loss": -39.88318634033203, "global_step": 257407, "epoch": 2127} {"train_loss": -40.84159851074219, "global_step": 257408, "epoch": 2127} {"train_loss": -41.751129150390625, "global_step": 257409, "epoch": 2127} {"train_loss": -41.60346603393555, "global_step": 257410, "epoch": 2127} {"train_loss": -41.2774658203125, "global_step": 257411, "epoch": 2127} {"train_loss": -41.5349235534668, "global_step": 257412, "epoch": 2127} {"train_loss": -41.706329345703125, "global_step": 257413, "epoch": 2127} {"train_loss": -42.18634796142578, "global_step": 257414, "epoch": 2127} {"train_loss": -40.131710052490234, "global_step": 257415, "epoch": 2127} {"train_loss": -42.00267791748047, "global_step": 257416, "epoch": 2127} {"train_loss": -41.65216064453125, "global_step": 257417, "epoch": 2127} {"train_loss": -41.68309020996094, "global_step": 257418, "epoch": 2127} {"train_loss": -42.53762435913086, "global_step": 257419, "epoch": 2127} {"train_loss": -41.786006927490234, "global_step": 257420, "epoch": 2127} {"train_loss": -42.15438461303711, "global_step": 257421, "epoch": 2127} {"train_loss": -41.903263092041016, "global_step": 257422, "epoch": 2127} {"train_loss": -42.0833740234375, "global_step": 257423, "epoch": 2127} {"train_loss": -42.551185607910156, "global_step": 257424, "epoch": 2127} {"train_loss": -40.767818450927734, "global_step": 257425, "epoch": 2127} {"train_loss": -41.63311767578125, "global_step": 257426, "epoch": 2127} {"train_loss": -41.794734954833984, "global_step": 257427, "epoch": 2127} {"train_loss": -40.66707229614258, "global_step": 257428, "epoch": 2127} {"train_loss": -41.450462341308594, "global_step": 257429, "epoch": 2127} {"train_loss": -41.87577438354492, "global_step": 257430, "epoch": 2127} {"train_loss": -41.79697799682617, "global_step": 257431, "epoch": 2127} {"train_loss": -42.51929473876953, "global_step": 257432, "epoch": 2127} {"train_loss": -41.007076263427734, "global_step": 257433, "epoch": 2127} {"train_loss": -41.87807083129883, "global_step": 257434, "epoch": 2127} {"train_loss": -42.1247444152832, "global_step": 257435, "epoch": 2127} {"train_loss": -42.339935302734375, "global_step": 257436, "epoch": 2127} {"train_loss": -42.50611877441406, "global_step": 257437, "epoch": 2127} {"train_loss": -41.931419372558594, "global_step": 257438, "epoch": 2127} {"train_loss": -41.69409942626953, "global_step": 257439, "epoch": 2127} {"train_loss": -42.44318389892578, "global_step": 257440, "epoch": 2127} {"train_loss": -41.404388427734375, "global_step": 257441, "epoch": 2127} {"train_loss": -41.62378692626953, "global_step": 257442, "epoch": 2127} {"train_loss": -42.24348449707031, "global_step": 257443, "epoch": 2127} {"train_loss": -41.87712860107422, "global_step": 257444, "epoch": 2127} {"train_loss": -42.6716423034668, "global_step": 257445, "epoch": 2127} {"train_loss": -42.021156311035156, "global_step": 257446, "epoch": 2127} {"train_loss": -41.65266036987305, "global_step": 257447, "epoch": 2127} {"train_loss": -41.560909271240234, "global_step": 257448, "epoch": 2127} {"train_loss": -42.21033477783203, "global_step": 257449, "epoch": 2127} {"train_loss": -41.380306243896484, "global_step": 257450, "epoch": 2127} {"train_loss": -42.05614471435547, "global_step": 257451, "epoch": 2127} {"train_loss": -42.21891403198242, "global_step": 257452, "epoch": 2127} {"train_loss": -40.54633331298828, "global_step": 257453, "epoch": 2127} {"train_loss": -40.4462890625, "global_step": 257454, "epoch": 2127} {"train_loss": -40.13943862915039, "global_step": 257455, "epoch": 2127} {"train_loss": -41.60529708862305, "global_step": 257456, "epoch": 2127} {"train_loss": -41.945003509521484, "global_step": 257457, "epoch": 2127} {"train_loss": -42.3471794128418, "global_step": 257458, "epoch": 2127} {"train_loss": -40.598785400390625, "global_step": 257459, "epoch": 2127} {"train_loss": -42.26731491088867, "global_step": 257460, "epoch": 2127} {"train_loss": -42.009220123291016, "global_step": 257461, "epoch": 2127} {"train_loss": -42.287593841552734, "global_step": 257462, "epoch": 2127} {"train_loss": -42.28165054321289, "global_step": 257463, "epoch": 2127} {"train_loss": -41.87324142456055, "global_step": 257464, "epoch": 2127} {"train_loss": -41.28591537475586, "global_step": 257465, "epoch": 2127} {"train_loss": -40.81289291381836, "global_step": 257466, "epoch": 2127} {"train_loss": -41.08612823486328, "global_step": 257467, "epoch": 2127} {"train_loss": -41.94788360595703, "global_step": 257468, "epoch": 2127} {"train_loss": -42.3776969909668, "global_step": 257469, "epoch": 2127} {"train_loss": -40.94277572631836, "global_step": 257470, "epoch": 2127} {"train_loss": -40.29719924926758, "global_step": 257471, "epoch": 2127} {"train_loss": -40.49867630004883, "global_step": 257472, "epoch": 2127} {"train_loss": -42.27419662475586, "global_step": 257473, "epoch": 2127} {"train_loss": -42.72963333129883, "global_step": 257474, "epoch": 2127} {"train_loss": -41.712921142578125, "global_step": 257475, "epoch": 2127} {"train_loss": -40.73490524291992, "global_step": 257476, "epoch": 2127} {"train_loss": -42.34212875366211, "global_step": 257477, "epoch": 2127} {"train_loss": -42.11160659790039, "global_step": 257478, "epoch": 2127} {"train_loss": -42.593345642089844, "global_step": 257479, "epoch": 2127} {"train_loss": -41.55998611450195, "global_step": 257480, "epoch": 2127} {"train_loss": -41.841793060302734, "global_step": 257481, "epoch": 2127} {"train_loss": -41.63824462890625, "global_step": 257482, "epoch": 2127} {"train_loss": -40.65138626098633, "global_step": 257483, "epoch": 2127} {"train_loss": -42.01443862915039, "global_step": 257484, "epoch": 2127} {"train_loss": -40.62944412231445, "global_step": 257485, "epoch": 2127} {"train_loss": -40.02513122558594, "global_step": 257486, "epoch": 2127} {"train_loss": -41.092710810259355, "global_step": 257487, "epoch": 2127, "val_loss": 2673656.75} {"train_loss": -41.7729377746582, "global_step": 257488, "epoch": 2128} {"train_loss": -42.42549514770508, "global_step": 257489, "epoch": 2128} {"train_loss": -42.077919006347656, "global_step": 257490, "epoch": 2128} {"train_loss": -41.23487091064453, "global_step": 257491, "epoch": 2128} {"train_loss": -41.638214111328125, "global_step": 257492, "epoch": 2128} {"train_loss": -41.56924057006836, "global_step": 257493, "epoch": 2128} {"train_loss": -42.91298294067383, "global_step": 257494, "epoch": 2128} {"train_loss": -42.05378341674805, "global_step": 257495, "epoch": 2128} {"train_loss": -41.29841232299805, "global_step": 257496, "epoch": 2128} {"train_loss": -42.49015808105469, "global_step": 257497, "epoch": 2128} {"train_loss": -42.121986389160156, "global_step": 257498, "epoch": 2128} {"train_loss": -42.26552963256836, "global_step": 257499, "epoch": 2128} {"train_loss": -41.454994201660156, "global_step": 257500, "epoch": 2128} {"train_loss": -42.76487731933594, "global_step": 257501, "epoch": 2128} {"train_loss": -42.463905334472656, "global_step": 257502, "epoch": 2128} {"train_loss": -41.45295333862305, "global_step": 257503, "epoch": 2128} {"train_loss": -41.96134948730469, "global_step": 257504, "epoch": 2128} {"train_loss": -42.3291015625, "global_step": 257505, "epoch": 2128} {"train_loss": -41.56729507446289, "global_step": 257506, "epoch": 2128} {"train_loss": -40.13813018798828, "global_step": 257507, "epoch": 2128} {"train_loss": -40.8680534362793, "global_step": 257508, "epoch": 2128} {"train_loss": -39.59602355957031, "global_step": 257509, "epoch": 2128} {"train_loss": -37.80916213989258, "global_step": 257510, "epoch": 2128} {"train_loss": -39.94248580932617, "global_step": 257511, "epoch": 2128} {"train_loss": -42.612735748291016, "global_step": 257512, "epoch": 2128} {"train_loss": -40.5820198059082, "global_step": 257513, "epoch": 2128} {"train_loss": -39.8797721862793, "global_step": 257514, "epoch": 2128} {"train_loss": -41.355709075927734, "global_step": 257515, "epoch": 2128} {"train_loss": -39.66353988647461, "global_step": 257516, "epoch": 2128} {"train_loss": -37.15143585205078, "global_step": 257517, "epoch": 2128} {"train_loss": -39.40858840942383, "global_step": 257518, "epoch": 2128} {"train_loss": -40.80308151245117, "global_step": 257519, "epoch": 2128} {"train_loss": -39.39544677734375, "global_step": 257520, "epoch": 2128} {"train_loss": -38.62128448486328, "global_step": 257521, "epoch": 2128} {"train_loss": -40.80373764038086, "global_step": 257522, "epoch": 2128} {"train_loss": -40.840694427490234, "global_step": 257523, "epoch": 2128} {"train_loss": -38.68105697631836, "global_step": 257524, "epoch": 2128} {"train_loss": -41.407249450683594, "global_step": 257525, "epoch": 2128} {"train_loss": -38.17997360229492, "global_step": 257526, "epoch": 2128} {"train_loss": -39.94987106323242, "global_step": 257527, "epoch": 2128} {"train_loss": -41.686275482177734, "global_step": 257528, "epoch": 2128} {"train_loss": -38.67569351196289, "global_step": 257529, "epoch": 2128} {"train_loss": -41.81428909301758, "global_step": 257530, "epoch": 2128} {"train_loss": -40.478675842285156, "global_step": 257531, "epoch": 2128} {"train_loss": -41.56327819824219, "global_step": 257532, "epoch": 2128} {"train_loss": -41.142478942871094, "global_step": 257533, "epoch": 2128} {"train_loss": -41.13154220581055, "global_step": 257534, "epoch": 2128} {"train_loss": -41.3509635925293, "global_step": 257535, "epoch": 2128} {"train_loss": -41.186767578125, "global_step": 257536, "epoch": 2128} {"train_loss": -41.57646179199219, "global_step": 257537, "epoch": 2128} {"train_loss": -41.67138671875, "global_step": 257538, "epoch": 2128} {"train_loss": -41.639827728271484, "global_step": 257539, "epoch": 2128} {"train_loss": -41.65776824951172, "global_step": 257540, "epoch": 2128} {"train_loss": -40.858821868896484, "global_step": 257541, "epoch": 2128} {"train_loss": -41.95254898071289, "global_step": 257542, "epoch": 2128} {"train_loss": -42.39274978637695, "global_step": 257543, "epoch": 2128} {"train_loss": -41.26167297363281, "global_step": 257544, "epoch": 2128} {"train_loss": -42.009918212890625, "global_step": 257545, "epoch": 2128} {"train_loss": -42.3039665222168, "global_step": 257546, "epoch": 2128} {"train_loss": -42.1738166809082, "global_step": 257547, "epoch": 2128} {"train_loss": -42.4853515625, "global_step": 257548, "epoch": 2128} {"train_loss": -42.4532356262207, "global_step": 257549, "epoch": 2128} {"train_loss": -42.22284698486328, "global_step": 257550, "epoch": 2128} {"train_loss": -42.0338134765625, "global_step": 257551, "epoch": 2128} {"train_loss": -42.316707611083984, "global_step": 257552, "epoch": 2128} {"train_loss": -42.784523010253906, "global_step": 257553, "epoch": 2128} {"train_loss": -42.074275970458984, "global_step": 257554, "epoch": 2128} {"train_loss": -42.48808670043945, "global_step": 257555, "epoch": 2128} {"train_loss": -42.157325744628906, "global_step": 257556, "epoch": 2128} {"train_loss": -42.184844970703125, "global_step": 257557, "epoch": 2128} {"train_loss": -42.858848571777344, "global_step": 257558, "epoch": 2128} {"train_loss": -42.643009185791016, "global_step": 257559, "epoch": 2128} {"train_loss": -42.452999114990234, "global_step": 257560, "epoch": 2128} {"train_loss": -42.629005432128906, "global_step": 257561, "epoch": 2128} {"train_loss": -42.423622131347656, "global_step": 257562, "epoch": 2128} {"train_loss": -42.83199691772461, "global_step": 257563, "epoch": 2128} {"train_loss": -41.4510612487793, "global_step": 257564, "epoch": 2128} {"train_loss": -42.72913360595703, "global_step": 257565, "epoch": 2128} {"train_loss": -42.01422882080078, "global_step": 257566, "epoch": 2128} {"train_loss": -42.331844329833984, "global_step": 257567, "epoch": 2128} {"train_loss": -43.03178024291992, "global_step": 257568, "epoch": 2128} {"train_loss": -42.9915657043457, "global_step": 257569, "epoch": 2128} {"train_loss": -43.245033264160156, "global_step": 257570, "epoch": 2128} {"train_loss": -42.71869659423828, "global_step": 257571, "epoch": 2128} {"train_loss": -42.29548645019531, "global_step": 257572, "epoch": 2128} {"train_loss": -42.52062225341797, "global_step": 257573, "epoch": 2128} {"train_loss": -42.5777702331543, "global_step": 257574, "epoch": 2128} {"train_loss": -42.42478561401367, "global_step": 257575, "epoch": 2128} {"train_loss": -41.857784271240234, "global_step": 257576, "epoch": 2128} {"train_loss": -42.9548225402832, "global_step": 257577, "epoch": 2128} {"train_loss": -40.726192474365234, "global_step": 257578, "epoch": 2128} {"train_loss": -42.5883903503418, "global_step": 257579, "epoch": 2128} {"train_loss": -42.560062408447266, "global_step": 257580, "epoch": 2128} {"train_loss": -42.63031005859375, "global_step": 257581, "epoch": 2128} {"train_loss": -41.73887634277344, "global_step": 257582, "epoch": 2128} {"train_loss": -42.967063903808594, "global_step": 257583, "epoch": 2128} {"train_loss": -42.88398361206055, "global_step": 257584, "epoch": 2128} {"train_loss": -41.278751373291016, "global_step": 257585, "epoch": 2128} {"train_loss": -42.4689826965332, "global_step": 257586, "epoch": 2128} {"train_loss": -42.28947448730469, "global_step": 257587, "epoch": 2128} {"train_loss": -42.40071105957031, "global_step": 257588, "epoch": 2128} {"train_loss": -42.72364044189453, "global_step": 257589, "epoch": 2128} {"train_loss": -43.19758987426758, "global_step": 257590, "epoch": 2128} {"train_loss": -42.79507064819336, "global_step": 257591, "epoch": 2128} {"train_loss": -41.73745346069336, "global_step": 257592, "epoch": 2128} {"train_loss": -43.186458587646484, "global_step": 257593, "epoch": 2128} {"train_loss": -41.42439651489258, "global_step": 257594, "epoch": 2128} {"train_loss": -42.424564361572266, "global_step": 257595, "epoch": 2128} {"train_loss": -43.07793426513672, "global_step": 257596, "epoch": 2128} {"train_loss": -43.1419792175293, "global_step": 257597, "epoch": 2128} {"train_loss": -42.65218734741211, "global_step": 257598, "epoch": 2128} {"train_loss": -42.566280364990234, "global_step": 257599, "epoch": 2128} {"train_loss": -43.2247314453125, "global_step": 257600, "epoch": 2128} {"train_loss": -42.18674087524414, "global_step": 257601, "epoch": 2128} {"train_loss": -41.131263732910156, "global_step": 257602, "epoch": 2128} {"train_loss": -42.0700569152832, "global_step": 257603, "epoch": 2128} {"train_loss": -42.969581604003906, "global_step": 257604, "epoch": 2128} {"train_loss": -42.51007843017578, "global_step": 257605, "epoch": 2128} {"train_loss": -42.8913688659668, "global_step": 257606, "epoch": 2128} {"train_loss": -43.269981384277344, "global_step": 257607, "epoch": 2128} {"train_loss": -41.77621803598956, "global_step": 257608, "epoch": 2128, "val_loss": 2618324.75} {"train_loss": -42.63722610473633, "global_step": 257609, "epoch": 2129} {"train_loss": -43.33639144897461, "global_step": 257610, "epoch": 2129} {"train_loss": -43.263694763183594, "global_step": 257611, "epoch": 2129} {"train_loss": -42.57558822631836, "global_step": 257612, "epoch": 2129} {"train_loss": -42.490509033203125, "global_step": 257613, "epoch": 2129} {"train_loss": -43.18714904785156, "global_step": 257614, "epoch": 2129} {"train_loss": -42.805809020996094, "global_step": 257615, "epoch": 2129} {"train_loss": -42.42052459716797, "global_step": 257616, "epoch": 2129} {"train_loss": -42.018917083740234, "global_step": 257617, "epoch": 2129} {"train_loss": -42.68743896484375, "global_step": 257618, "epoch": 2129} {"train_loss": -43.04637145996094, "global_step": 257619, "epoch": 2129} {"train_loss": -43.33678436279297, "global_step": 257620, "epoch": 2129} {"train_loss": -42.91384506225586, "global_step": 257621, "epoch": 2129} {"train_loss": -42.77557373046875, "global_step": 257622, "epoch": 2129} {"train_loss": -43.1278190612793, "global_step": 257623, "epoch": 2129} {"train_loss": -42.54306411743164, "global_step": 257624, "epoch": 2129} {"train_loss": -42.51706314086914, "global_step": 257625, "epoch": 2129} {"train_loss": -41.233551025390625, "global_step": 257626, "epoch": 2129} {"train_loss": -43.11311721801758, "global_step": 257627, "epoch": 2129} {"train_loss": -42.89576721191406, "global_step": 257628, "epoch": 2129} {"train_loss": -42.53797149658203, "global_step": 257629, "epoch": 2129} {"train_loss": -43.0474967956543, "global_step": 257630, "epoch": 2129} {"train_loss": -42.678871154785156, "global_step": 257631, "epoch": 2129} {"train_loss": -42.899169921875, "global_step": 257632, "epoch": 2129} {"train_loss": -39.3581657409668, "global_step": 257633, "epoch": 2129} {"train_loss": -41.982025146484375, "global_step": 257634, "epoch": 2129} {"train_loss": -41.94071960449219, "global_step": 257635, "epoch": 2129} {"train_loss": -41.6296272277832, "global_step": 257636, "epoch": 2129} {"train_loss": -39.267250061035156, "global_step": 257637, "epoch": 2129} {"train_loss": -38.531654357910156, "global_step": 257638, "epoch": 2129} {"train_loss": -37.77975082397461, "global_step": 257639, "epoch": 2129} {"train_loss": -38.44553756713867, "global_step": 257640, "epoch": 2129} {"train_loss": -39.953819274902344, "global_step": 257641, "epoch": 2129} {"train_loss": -37.43563461303711, "global_step": 257642, "epoch": 2129} {"train_loss": -39.18586349487305, "global_step": 257643, "epoch": 2129} {"train_loss": -37.098934173583984, "global_step": 257644, "epoch": 2129} {"train_loss": -41.478492736816406, "global_step": 257645, "epoch": 2129} {"train_loss": -37.0444450378418, "global_step": 257646, "epoch": 2129} {"train_loss": -39.891998291015625, "global_step": 257647, "epoch": 2129} {"train_loss": -40.55830764770508, "global_step": 257648, "epoch": 2129} {"train_loss": -40.594478607177734, "global_step": 257649, "epoch": 2129} {"train_loss": -40.187862396240234, "global_step": 257650, "epoch": 2129} {"train_loss": -40.75425338745117, "global_step": 257651, "epoch": 2129} {"train_loss": -35.95711898803711, "global_step": 257652, "epoch": 2129} {"train_loss": -40.20637130737305, "global_step": 257653, "epoch": 2129} {"train_loss": -38.12399673461914, "global_step": 257654, "epoch": 2129} {"train_loss": -37.99910354614258, "global_step": 257655, "epoch": 2129} {"train_loss": -39.879669189453125, "global_step": 257656, "epoch": 2129} {"train_loss": -38.89094161987305, "global_step": 257657, "epoch": 2129} {"train_loss": -39.6233024597168, "global_step": 257658, "epoch": 2129} {"train_loss": -39.43217849731445, "global_step": 257659, "epoch": 2129} {"train_loss": -39.250972747802734, "global_step": 257660, "epoch": 2129} {"train_loss": -40.8569221496582, "global_step": 257661, "epoch": 2129} {"train_loss": -39.522926330566406, "global_step": 257662, "epoch": 2129} {"train_loss": -38.735137939453125, "global_step": 257663, "epoch": 2129} {"train_loss": -39.833072662353516, "global_step": 257664, "epoch": 2129} {"train_loss": -37.7055778503418, "global_step": 257665, "epoch": 2129} {"train_loss": -39.57990646362305, "global_step": 257666, "epoch": 2129} {"train_loss": -41.692138671875, "global_step": 257667, "epoch": 2129} {"train_loss": -41.0243034362793, "global_step": 257668, "epoch": 2129} {"train_loss": -39.32394027709961, "global_step": 257669, "epoch": 2129} {"train_loss": -40.2719612121582, "global_step": 257670, "epoch": 2129} {"train_loss": -41.130306243896484, "global_step": 257671, "epoch": 2129} {"train_loss": -40.769840240478516, "global_step": 257672, "epoch": 2129} {"train_loss": -40.40974807739258, "global_step": 257673, "epoch": 2129} {"train_loss": -41.18849563598633, "global_step": 257674, "epoch": 2129} {"train_loss": -41.14561080932617, "global_step": 257675, "epoch": 2129} {"train_loss": -41.200469970703125, "global_step": 257676, "epoch": 2129} {"train_loss": -42.471229553222656, "global_step": 257677, "epoch": 2129} {"train_loss": -41.66865158081055, "global_step": 257678, "epoch": 2129} {"train_loss": -41.44697952270508, "global_step": 257679, "epoch": 2129} {"train_loss": -42.3393669128418, "global_step": 257680, "epoch": 2129} {"train_loss": -41.923702239990234, "global_step": 257681, "epoch": 2129} {"train_loss": -42.08480453491211, "global_step": 257682, "epoch": 2129} {"train_loss": -41.4348258972168, "global_step": 257683, "epoch": 2129} {"train_loss": -41.9354362487793, "global_step": 257684, "epoch": 2129} {"train_loss": -41.674198150634766, "global_step": 257685, "epoch": 2129} {"train_loss": -41.58154296875, "global_step": 257686, "epoch": 2129} {"train_loss": -42.46165466308594, "global_step": 257687, "epoch": 2129} {"train_loss": -42.28836441040039, "global_step": 257688, "epoch": 2129} {"train_loss": -42.17486572265625, "global_step": 257689, "epoch": 2129} {"train_loss": -42.38308334350586, "global_step": 257690, "epoch": 2129} {"train_loss": -41.04420471191406, "global_step": 257691, "epoch": 2129} {"train_loss": -42.22842025756836, "global_step": 257692, "epoch": 2129} {"train_loss": -42.31576156616211, "global_step": 257693, "epoch": 2129} {"train_loss": -42.03154373168945, "global_step": 257694, "epoch": 2129} {"train_loss": -42.3890380859375, "global_step": 257695, "epoch": 2129} {"train_loss": -42.15029525756836, "global_step": 257696, "epoch": 2129} {"train_loss": -41.77103805541992, "global_step": 257697, "epoch": 2129} {"train_loss": -42.88911819458008, "global_step": 257698, "epoch": 2129} {"train_loss": -42.460472106933594, "global_step": 257699, "epoch": 2129} {"train_loss": -42.57130813598633, "global_step": 257700, "epoch": 2129} {"train_loss": -42.95149612426758, "global_step": 257701, "epoch": 2129} {"train_loss": -42.24238967895508, "global_step": 257702, "epoch": 2129} {"train_loss": -42.64122009277344, "global_step": 257703, "epoch": 2129} {"train_loss": -42.446285247802734, "global_step": 257704, "epoch": 2129} {"train_loss": -42.95035934448242, "global_step": 257705, "epoch": 2129} {"train_loss": -42.76704025268555, "global_step": 257706, "epoch": 2129} {"train_loss": -43.04037094116211, "global_step": 257707, "epoch": 2129} {"train_loss": -41.93817138671875, "global_step": 257708, "epoch": 2129} {"train_loss": -42.5240478515625, "global_step": 257709, "epoch": 2129} {"train_loss": -43.262969970703125, "global_step": 257710, "epoch": 2129} {"train_loss": -42.873748779296875, "global_step": 257711, "epoch": 2129} {"train_loss": -43.37327194213867, "global_step": 257712, "epoch": 2129} {"train_loss": -42.8790397644043, "global_step": 257713, "epoch": 2129} {"train_loss": -42.092525482177734, "global_step": 257714, "epoch": 2129} {"train_loss": -43.4897575378418, "global_step": 257715, "epoch": 2129} {"train_loss": -41.18585968017578, "global_step": 257716, "epoch": 2129} {"train_loss": -42.63847732543945, "global_step": 257717, "epoch": 2129} {"train_loss": -43.03410720825195, "global_step": 257718, "epoch": 2129} {"train_loss": -43.16128921508789, "global_step": 257719, "epoch": 2129} {"train_loss": -41.97728729248047, "global_step": 257720, "epoch": 2129} {"train_loss": -38.22762680053711, "global_step": 257721, "epoch": 2129} {"train_loss": -39.93058776855469, "global_step": 257722, "epoch": 2129} {"train_loss": -43.0552978515625, "global_step": 257723, "epoch": 2129} {"train_loss": -41.13330078125, "global_step": 257724, "epoch": 2129} {"train_loss": -41.9769172668457, "global_step": 257725, "epoch": 2129} {"train_loss": -43.12864303588867, "global_step": 257726, "epoch": 2129} {"train_loss": -42.41371536254883, "global_step": 257727, "epoch": 2129} {"train_loss": -41.85427474975586, "global_step": 257728, "epoch": 2129} {"train_loss": -41.41041577551976, "global_step": 257729, "epoch": 2129, "val_loss": 2592430.25} {"train_loss": -42.35116195678711, "global_step": 257730, "epoch": 2130} {"train_loss": -42.82271957397461, "global_step": 257731, "epoch": 2130} {"train_loss": -41.43757247924805, "global_step": 257732, "epoch": 2130} {"train_loss": -42.95729446411133, "global_step": 257733, "epoch": 2130} {"train_loss": -42.65697479248047, "global_step": 257734, "epoch": 2130} {"train_loss": -42.68404769897461, "global_step": 257735, "epoch": 2130} {"train_loss": -41.72410202026367, "global_step": 257736, "epoch": 2130} {"train_loss": -42.17958068847656, "global_step": 257737, "epoch": 2130} {"train_loss": -42.802040100097656, "global_step": 257738, "epoch": 2130} {"train_loss": -25.192333221435547, "global_step": 257739, "epoch": 2130} {"train_loss": -39.20497512817383, "global_step": 257740, "epoch": 2130} {"train_loss": -41.28363800048828, "global_step": 257741, "epoch": 2130} {"train_loss": -42.16984176635742, "global_step": 257742, "epoch": 2130} {"train_loss": -41.273719787597656, "global_step": 257743, "epoch": 2130} {"train_loss": -39.174983978271484, "global_step": 257744, "epoch": 2130} {"train_loss": -40.7952880859375, "global_step": 257745, "epoch": 2130} {"train_loss": -31.657522201538086, "global_step": 257746, "epoch": 2130} {"train_loss": -40.29684066772461, "global_step": 257747, "epoch": 2130} {"train_loss": -41.801448822021484, "global_step": 257748, "epoch": 2130} {"train_loss": -40.96295166015625, "global_step": 257749, "epoch": 2130} {"train_loss": -42.04228591918945, "global_step": 257750, "epoch": 2130} {"train_loss": -30.03818702697754, "global_step": 257751, "epoch": 2130} {"train_loss": -41.19697189331055, "global_step": 257752, "epoch": 2130} {"train_loss": -39.558013916015625, "global_step": 257753, "epoch": 2130} {"train_loss": -41.50533676147461, "global_step": 257754, "epoch": 2130} {"train_loss": -40.085750579833984, "global_step": 257755, "epoch": 2130} {"train_loss": -37.26592254638672, "global_step": 257756, "epoch": 2130} {"train_loss": -39.85457229614258, "global_step": 257757, "epoch": 2130} {"train_loss": -40.78867721557617, "global_step": 257758, "epoch": 2130} {"train_loss": -41.00197982788086, "global_step": 257759, "epoch": 2130} {"train_loss": -40.68842697143555, "global_step": 257760, "epoch": 2130} {"train_loss": -36.07196044921875, "global_step": 257761, "epoch": 2130} {"train_loss": -40.00791549682617, "global_step": 257762, "epoch": 2130} {"train_loss": -40.88182067871094, "global_step": 257763, "epoch": 2130} {"train_loss": -40.133216857910156, "global_step": 257764, "epoch": 2130} {"train_loss": -38.342872619628906, "global_step": 257765, "epoch": 2130} {"train_loss": -41.55245590209961, "global_step": 257766, "epoch": 2130} {"train_loss": -41.16660690307617, "global_step": 257767, "epoch": 2130} {"train_loss": -37.499168395996094, "global_step": 257768, "epoch": 2130} {"train_loss": -40.07363510131836, "global_step": 257769, "epoch": 2130} {"train_loss": -32.98798370361328, "global_step": 257770, "epoch": 2130} {"train_loss": -41.66704177856445, "global_step": 257771, "epoch": 2130} {"train_loss": -41.22661209106445, "global_step": 257772, "epoch": 2130} {"train_loss": -39.579437255859375, "global_step": 257773, "epoch": 2130} {"train_loss": -39.47652053833008, "global_step": 257774, "epoch": 2130} {"train_loss": -41.323753356933594, "global_step": 257775, "epoch": 2130} {"train_loss": -41.28199768066406, "global_step": 257776, "epoch": 2130} {"train_loss": -40.776527404785156, "global_step": 257777, "epoch": 2130} {"train_loss": -39.60029220581055, "global_step": 257778, "epoch": 2130} {"train_loss": -40.35760498046875, "global_step": 257779, "epoch": 2130} {"train_loss": -39.95159912109375, "global_step": 257780, "epoch": 2130} {"train_loss": -40.846771240234375, "global_step": 257781, "epoch": 2130} {"train_loss": -41.309410095214844, "global_step": 257782, "epoch": 2130} {"train_loss": -40.444332122802734, "global_step": 257783, "epoch": 2130} {"train_loss": -41.136810302734375, "global_step": 257784, "epoch": 2130} {"train_loss": -41.57375717163086, "global_step": 257785, "epoch": 2130} {"train_loss": -40.44069290161133, "global_step": 257786, "epoch": 2130} {"train_loss": -40.437408447265625, "global_step": 257787, "epoch": 2130} {"train_loss": -41.572998046875, "global_step": 257788, "epoch": 2130} {"train_loss": -40.94266891479492, "global_step": 257789, "epoch": 2130} {"train_loss": -40.8115234375, "global_step": 257790, "epoch": 2130} {"train_loss": -38.468971252441406, "global_step": 257791, "epoch": 2130} {"train_loss": -41.18728256225586, "global_step": 257792, "epoch": 2130} {"train_loss": -40.74033737182617, "global_step": 257793, "epoch": 2130} {"train_loss": -40.324127197265625, "global_step": 257794, "epoch": 2130} {"train_loss": -40.44883346557617, "global_step": 257795, "epoch": 2130} {"train_loss": -39.51473617553711, "global_step": 257796, "epoch": 2130} {"train_loss": -40.32259750366211, "global_step": 257797, "epoch": 2130} {"train_loss": -41.19744873046875, "global_step": 257798, "epoch": 2130} {"train_loss": -41.67376708984375, "global_step": 257799, "epoch": 2130} {"train_loss": -41.60112380981445, "global_step": 257800, "epoch": 2130} {"train_loss": -41.68253707885742, "global_step": 257801, "epoch": 2130} {"train_loss": -41.416988372802734, "global_step": 257802, "epoch": 2130} {"train_loss": -41.971187591552734, "global_step": 257803, "epoch": 2130} {"train_loss": -41.35578536987305, "global_step": 257804, "epoch": 2130} {"train_loss": -41.42047119140625, "global_step": 257805, "epoch": 2130} {"train_loss": -41.91864013671875, "global_step": 257806, "epoch": 2130} {"train_loss": -41.93917465209961, "global_step": 257807, "epoch": 2130} {"train_loss": -40.8944206237793, "global_step": 257808, "epoch": 2130} {"train_loss": -41.72174072265625, "global_step": 257809, "epoch": 2130} {"train_loss": -41.860923767089844, "global_step": 257810, "epoch": 2130} {"train_loss": -41.424720764160156, "global_step": 257811, "epoch": 2130} {"train_loss": -42.09001922607422, "global_step": 257812, "epoch": 2130} {"train_loss": -41.784950256347656, "global_step": 257813, "epoch": 2130} {"train_loss": -39.984336853027344, "global_step": 257814, "epoch": 2130} {"train_loss": -42.03933334350586, "global_step": 257815, "epoch": 2130} {"train_loss": -42.08015060424805, "global_step": 257816, "epoch": 2130} {"train_loss": -41.68415832519531, "global_step": 257817, "epoch": 2130} {"train_loss": -41.66794967651367, "global_step": 257818, "epoch": 2130} {"train_loss": -41.64432907104492, "global_step": 257819, "epoch": 2130} {"train_loss": -42.00571060180664, "global_step": 257820, "epoch": 2130} {"train_loss": -41.95984649658203, "global_step": 257821, "epoch": 2130} {"train_loss": -42.5748291015625, "global_step": 257822, "epoch": 2130} {"train_loss": -42.647544860839844, "global_step": 257823, "epoch": 2130} {"train_loss": -43.0634651184082, "global_step": 257824, "epoch": 2130} {"train_loss": -42.67611312866211, "global_step": 257825, "epoch": 2130} {"train_loss": -41.71920394897461, "global_step": 257826, "epoch": 2130} {"train_loss": -41.7437629699707, "global_step": 257827, "epoch": 2130} {"train_loss": -40.469234466552734, "global_step": 257828, "epoch": 2130} {"train_loss": -42.17678451538086, "global_step": 257829, "epoch": 2130} {"train_loss": -41.16260528564453, "global_step": 257830, "epoch": 2130} {"train_loss": -42.335445404052734, "global_step": 257831, "epoch": 2130} {"train_loss": -42.50029754638672, "global_step": 257832, "epoch": 2130} {"train_loss": -42.01729965209961, "global_step": 257833, "epoch": 2130} {"train_loss": -42.014339447021484, "global_step": 257834, "epoch": 2130} {"train_loss": -40.87364196777344, "global_step": 257835, "epoch": 2130} {"train_loss": -42.65156173706055, "global_step": 257836, "epoch": 2130} {"train_loss": -42.49416732788086, "global_step": 257837, "epoch": 2130} {"train_loss": -42.58946990966797, "global_step": 257838, "epoch": 2130} {"train_loss": -42.67385482788086, "global_step": 257839, "epoch": 2130} {"train_loss": -41.443843841552734, "global_step": 257840, "epoch": 2130} {"train_loss": -42.08447265625, "global_step": 257841, "epoch": 2130} {"train_loss": -40.8963737487793, "global_step": 257842, "epoch": 2130} {"train_loss": -38.97773361206055, "global_step": 257843, "epoch": 2130} {"train_loss": -40.847190856933594, "global_step": 257844, "epoch": 2130} {"train_loss": -42.38740921020508, "global_step": 257845, "epoch": 2130} {"train_loss": -42.01789474487305, "global_step": 257846, "epoch": 2130} {"train_loss": -41.06206130981445, "global_step": 257847, "epoch": 2130} {"train_loss": -41.97945022583008, "global_step": 257848, "epoch": 2130} {"train_loss": -40.958065032958984, "global_step": 257849, "epoch": 2130} {"train_loss": -40.769637178783576, "global_step": 257850, "epoch": 2130, "val_loss": 2593906.5} {"train_loss": -40.64263153076172, "global_step": 257851, "epoch": 2131} {"train_loss": -42.151580810546875, "global_step": 257852, "epoch": 2131} {"train_loss": -40.17144775390625, "global_step": 257853, "epoch": 2131} {"train_loss": -42.030765533447266, "global_step": 257854, "epoch": 2131} {"train_loss": -42.26700210571289, "global_step": 257855, "epoch": 2131} {"train_loss": -40.94964599609375, "global_step": 257856, "epoch": 2131} {"train_loss": -42.47673416137695, "global_step": 257857, "epoch": 2131} {"train_loss": -41.49210739135742, "global_step": 257858, "epoch": 2131} {"train_loss": -41.86721420288086, "global_step": 257859, "epoch": 2131} {"train_loss": -41.932350158691406, "global_step": 257860, "epoch": 2131} {"train_loss": -41.2319450378418, "global_step": 257861, "epoch": 2131} {"train_loss": -39.75875473022461, "global_step": 257862, "epoch": 2131} {"train_loss": -38.0018424987793, "global_step": 257863, "epoch": 2131} {"train_loss": -37.45149612426758, "global_step": 257864, "epoch": 2131} {"train_loss": -40.94704055786133, "global_step": 257865, "epoch": 2131} {"train_loss": -41.316558837890625, "global_step": 257866, "epoch": 2131} {"train_loss": -35.79578399658203, "global_step": 257867, "epoch": 2131} {"train_loss": -33.72705841064453, "global_step": 257868, "epoch": 2131} {"train_loss": -42.17561721801758, "global_step": 257869, "epoch": 2131} {"train_loss": -36.91727828979492, "global_step": 257870, "epoch": 2131} {"train_loss": -38.96834182739258, "global_step": 257871, "epoch": 2131} {"train_loss": -41.30154037475586, "global_step": 257872, "epoch": 2131} {"train_loss": -38.66608428955078, "global_step": 257873, "epoch": 2131} {"train_loss": -41.72975540161133, "global_step": 257874, "epoch": 2131} {"train_loss": -40.02376174926758, "global_step": 257875, "epoch": 2131} {"train_loss": -40.15530014038086, "global_step": 257876, "epoch": 2131} {"train_loss": -41.47124099731445, "global_step": 257877, "epoch": 2131} {"train_loss": -40.903358459472656, "global_step": 257878, "epoch": 2131} {"train_loss": -42.05507278442383, "global_step": 257879, "epoch": 2131} {"train_loss": -40.53007125854492, "global_step": 257880, "epoch": 2131} {"train_loss": -41.98759460449219, "global_step": 257881, "epoch": 2131} {"train_loss": -41.542625427246094, "global_step": 257882, "epoch": 2131} {"train_loss": -42.115570068359375, "global_step": 257883, "epoch": 2131} {"train_loss": -41.13155746459961, "global_step": 257884, "epoch": 2131} {"train_loss": -42.33320236206055, "global_step": 257885, "epoch": 2131} {"train_loss": -41.78181076049805, "global_step": 257886, "epoch": 2131} {"train_loss": -42.178585052490234, "global_step": 257887, "epoch": 2131} {"train_loss": -39.92341232299805, "global_step": 257888, "epoch": 2131} {"train_loss": -41.98574447631836, "global_step": 257889, "epoch": 2131} {"train_loss": -42.46646499633789, "global_step": 257890, "epoch": 2131} {"train_loss": -41.99435806274414, "global_step": 257891, "epoch": 2131} {"train_loss": -42.26096725463867, "global_step": 257892, "epoch": 2131} {"train_loss": -42.312198638916016, "global_step": 257893, "epoch": 2131} {"train_loss": -41.81788635253906, "global_step": 257894, "epoch": 2131} {"train_loss": -41.97431182861328, "global_step": 257895, "epoch": 2131} {"train_loss": -42.24264144897461, "global_step": 257896, "epoch": 2131} {"train_loss": -42.336090087890625, "global_step": 257897, "epoch": 2131} {"train_loss": -41.848690032958984, "global_step": 257898, "epoch": 2131} {"train_loss": -37.90546798706055, "global_step": 257899, "epoch": 2131} {"train_loss": -42.44990158081055, "global_step": 257900, "epoch": 2131} {"train_loss": -42.12073516845703, "global_step": 257901, "epoch": 2131} {"train_loss": -42.1334228515625, "global_step": 257902, "epoch": 2131} {"train_loss": -42.454044342041016, "global_step": 257903, "epoch": 2131} {"train_loss": -42.04079818725586, "global_step": 257904, "epoch": 2131} {"train_loss": -42.51668167114258, "global_step": 257905, "epoch": 2131} {"train_loss": -42.3681526184082, "global_step": 257906, "epoch": 2131} {"train_loss": -41.63947296142578, "global_step": 257907, "epoch": 2131} {"train_loss": -42.47822570800781, "global_step": 257908, "epoch": 2131} {"train_loss": -42.423805236816406, "global_step": 257909, "epoch": 2131} {"train_loss": -42.964942932128906, "global_step": 257910, "epoch": 2131} {"train_loss": -42.3155517578125, "global_step": 257911, "epoch": 2131} {"train_loss": -42.2982292175293, "global_step": 257912, "epoch": 2131} {"train_loss": -42.506465911865234, "global_step": 257913, "epoch": 2131} {"train_loss": -41.64286422729492, "global_step": 257914, "epoch": 2131} {"train_loss": -42.635536193847656, "global_step": 257915, "epoch": 2131} {"train_loss": -42.06049346923828, "global_step": 257916, "epoch": 2131} {"train_loss": -42.26393508911133, "global_step": 257917, "epoch": 2131} {"train_loss": -42.52202606201172, "global_step": 257918, "epoch": 2131} {"train_loss": -42.58964920043945, "global_step": 257919, "epoch": 2131} {"train_loss": -42.75178527832031, "global_step": 257920, "epoch": 2131} {"train_loss": -42.510536193847656, "global_step": 257921, "epoch": 2131} {"train_loss": -42.71198272705078, "global_step": 257922, "epoch": 2131} {"train_loss": -42.75570297241211, "global_step": 257923, "epoch": 2131} {"train_loss": -42.10219955444336, "global_step": 257924, "epoch": 2131} {"train_loss": -42.53865432739258, "global_step": 257925, "epoch": 2131} {"train_loss": -42.48701858520508, "global_step": 257926, "epoch": 2131} {"train_loss": -42.151222229003906, "global_step": 257927, "epoch": 2131} {"train_loss": -42.571834564208984, "global_step": 257928, "epoch": 2131} {"train_loss": -39.91097640991211, "global_step": 257929, "epoch": 2131} {"train_loss": -40.7028923034668, "global_step": 257930, "epoch": 2131} {"train_loss": -42.18888473510742, "global_step": 257931, "epoch": 2131} {"train_loss": -43.27391815185547, "global_step": 257932, "epoch": 2131} {"train_loss": -41.677528381347656, "global_step": 257933, "epoch": 2131} {"train_loss": -39.35887908935547, "global_step": 257934, "epoch": 2131} {"train_loss": -41.10808181762695, "global_step": 257935, "epoch": 2131} {"train_loss": -42.657928466796875, "global_step": 257936, "epoch": 2131} {"train_loss": -40.8283805847168, "global_step": 257937, "epoch": 2131} {"train_loss": -39.008419036865234, "global_step": 257938, "epoch": 2131} {"train_loss": -41.716163635253906, "global_step": 257939, "epoch": 2131} {"train_loss": -42.00746536254883, "global_step": 257940, "epoch": 2131} {"train_loss": -41.91770935058594, "global_step": 257941, "epoch": 2131} {"train_loss": -41.56719970703125, "global_step": 257942, "epoch": 2131} {"train_loss": -42.1074104309082, "global_step": 257943, "epoch": 2131} {"train_loss": -41.909507751464844, "global_step": 257944, "epoch": 2131} {"train_loss": -41.92568588256836, "global_step": 257945, "epoch": 2131} {"train_loss": -41.69057846069336, "global_step": 257946, "epoch": 2131} {"train_loss": -42.740089416503906, "global_step": 257947, "epoch": 2131} {"train_loss": -41.82355880737305, "global_step": 257948, "epoch": 2131} {"train_loss": -40.97181701660156, "global_step": 257949, "epoch": 2131} {"train_loss": -41.954341888427734, "global_step": 257950, "epoch": 2131} {"train_loss": -41.632625579833984, "global_step": 257951, "epoch": 2131} {"train_loss": -42.03798294067383, "global_step": 257952, "epoch": 2131} {"train_loss": -41.413082122802734, "global_step": 257953, "epoch": 2131} {"train_loss": -41.94266891479492, "global_step": 257954, "epoch": 2131} {"train_loss": -41.851009368896484, "global_step": 257955, "epoch": 2131} {"train_loss": -39.76315689086914, "global_step": 257956, "epoch": 2131} {"train_loss": -40.57294845581055, "global_step": 257957, "epoch": 2131} {"train_loss": -41.72461700439453, "global_step": 257958, "epoch": 2131} {"train_loss": -42.62565994262695, "global_step": 257959, "epoch": 2131} {"train_loss": -40.586544036865234, "global_step": 257960, "epoch": 2131} {"train_loss": -42.305992126464844, "global_step": 257961, "epoch": 2131} {"train_loss": -42.760345458984375, "global_step": 257962, "epoch": 2131} {"train_loss": -41.15948486328125, "global_step": 257963, "epoch": 2131} {"train_loss": -41.536373138427734, "global_step": 257964, "epoch": 2131} {"train_loss": -40.91154861450195, "global_step": 257965, "epoch": 2131} {"train_loss": -41.243282318115234, "global_step": 257966, "epoch": 2131} {"train_loss": -42.20448684692383, "global_step": 257967, "epoch": 2131} {"train_loss": -41.829158782958984, "global_step": 257968, "epoch": 2131} {"train_loss": -38.009925842285156, "global_step": 257969, "epoch": 2131} {"train_loss": -42.63800811767578, "global_step": 257970, "epoch": 2131} {"train_loss": -41.439635599940274, "global_step": 257971, "epoch": 2131, "val_loss": 2566355.25} {"train_loss": -42.09490203857422, "global_step": 257972, "epoch": 2132} {"train_loss": -39.88473129272461, "global_step": 257973, "epoch": 2132} {"train_loss": -40.77572250366211, "global_step": 257974, "epoch": 2132} {"train_loss": -33.189762115478516, "global_step": 257975, "epoch": 2132} {"train_loss": -39.76301193237305, "global_step": 257976, "epoch": 2132} {"train_loss": -39.30814743041992, "global_step": 257977, "epoch": 2132} {"train_loss": -41.75095748901367, "global_step": 257978, "epoch": 2132} {"train_loss": -39.13350296020508, "global_step": 257979, "epoch": 2132} {"train_loss": -40.27671432495117, "global_step": 257980, "epoch": 2132} {"train_loss": -40.916194915771484, "global_step": 257981, "epoch": 2132} {"train_loss": -33.646949768066406, "global_step": 257982, "epoch": 2132} {"train_loss": -41.25478744506836, "global_step": 257983, "epoch": 2132} {"train_loss": -39.416473388671875, "global_step": 257984, "epoch": 2132} {"train_loss": -37.949974060058594, "global_step": 257985, "epoch": 2132} {"train_loss": -40.53471755981445, "global_step": 257986, "epoch": 2132} {"train_loss": -40.578712463378906, "global_step": 257987, "epoch": 2132} {"train_loss": -40.86227035522461, "global_step": 257988, "epoch": 2132} {"train_loss": -41.42652893066406, "global_step": 257989, "epoch": 2132} {"train_loss": -41.26249313354492, "global_step": 257990, "epoch": 2132} {"train_loss": -40.59896469116211, "global_step": 257991, "epoch": 2132} {"train_loss": -39.384246826171875, "global_step": 257992, "epoch": 2132} {"train_loss": -36.536190032958984, "global_step": 257993, "epoch": 2132} {"train_loss": -39.6334228515625, "global_step": 257994, "epoch": 2132} {"train_loss": -39.83778762817383, "global_step": 257995, "epoch": 2132} {"train_loss": -36.3042106628418, "global_step": 257996, "epoch": 2132} {"train_loss": -40.84493637084961, "global_step": 257997, "epoch": 2132} {"train_loss": -39.06830978393555, "global_step": 257998, "epoch": 2132} {"train_loss": -40.82735824584961, "global_step": 257999, "epoch": 2132} {"train_loss": -40.431026458740234, "global_step": 258000, "epoch": 2132} {"train_loss": -38.90997314453125, "global_step": 258001, "epoch": 2132} {"train_loss": -38.799373626708984, "global_step": 258002, "epoch": 2132} {"train_loss": -39.29452896118164, "global_step": 258003, "epoch": 2132} {"train_loss": -41.24909591674805, "global_step": 258004, "epoch": 2132} {"train_loss": -39.213905334472656, "global_step": 258005, "epoch": 2132} {"train_loss": -41.17106246948242, "global_step": 258006, "epoch": 2132} {"train_loss": -40.73420333862305, "global_step": 258007, "epoch": 2132} {"train_loss": -39.696624755859375, "global_step": 258008, "epoch": 2132} {"train_loss": -39.32155227661133, "global_step": 258009, "epoch": 2132} {"train_loss": -41.73374938964844, "global_step": 258010, "epoch": 2132} {"train_loss": -37.22391891479492, "global_step": 258011, "epoch": 2132} {"train_loss": -40.918827056884766, "global_step": 258012, "epoch": 2132} {"train_loss": -41.238521575927734, "global_step": 258013, "epoch": 2132} {"train_loss": -39.96818161010742, "global_step": 258014, "epoch": 2132} {"train_loss": -41.794654846191406, "global_step": 258015, "epoch": 2132} {"train_loss": -40.252079010009766, "global_step": 258016, "epoch": 2132} {"train_loss": -41.270870208740234, "global_step": 258017, "epoch": 2132} {"train_loss": -40.86463165283203, "global_step": 258018, "epoch": 2132} {"train_loss": -40.512550354003906, "global_step": 258019, "epoch": 2132} {"train_loss": -41.755165100097656, "global_step": 258020, "epoch": 2132} {"train_loss": -40.476436614990234, "global_step": 258021, "epoch": 2132} {"train_loss": -41.3038215637207, "global_step": 258022, "epoch": 2132} {"train_loss": -41.98488998413086, "global_step": 258023, "epoch": 2132} {"train_loss": -39.04090118408203, "global_step": 258024, "epoch": 2132} {"train_loss": -41.798885345458984, "global_step": 258025, "epoch": 2132} {"train_loss": -41.87181854248047, "global_step": 258026, "epoch": 2132} {"train_loss": -41.92245864868164, "global_step": 258027, "epoch": 2132} {"train_loss": -41.401947021484375, "global_step": 258028, "epoch": 2132} {"train_loss": -41.92557907104492, "global_step": 258029, "epoch": 2132} {"train_loss": -41.103511810302734, "global_step": 258030, "epoch": 2132} {"train_loss": -41.478271484375, "global_step": 258031, "epoch": 2132} {"train_loss": -41.411495208740234, "global_step": 258032, "epoch": 2132} {"train_loss": -41.83638381958008, "global_step": 258033, "epoch": 2132} {"train_loss": -41.73896408081055, "global_step": 258034, "epoch": 2132} {"train_loss": -40.2085075378418, "global_step": 258035, "epoch": 2132} {"train_loss": -42.00981521606445, "global_step": 258036, "epoch": 2132} {"train_loss": -41.55310821533203, "global_step": 258037, "epoch": 2132} {"train_loss": -41.8824577331543, "global_step": 258038, "epoch": 2132} {"train_loss": -41.22792434692383, "global_step": 258039, "epoch": 2132} {"train_loss": -41.44620132446289, "global_step": 258040, "epoch": 2132} {"train_loss": -41.08635330200195, "global_step": 258041, "epoch": 2132} {"train_loss": -42.058406829833984, "global_step": 258042, "epoch": 2132} {"train_loss": -42.13934326171875, "global_step": 258043, "epoch": 2132} {"train_loss": -42.324825286865234, "global_step": 258044, "epoch": 2132} {"train_loss": -42.69870376586914, "global_step": 258045, "epoch": 2132} {"train_loss": -42.69858932495117, "global_step": 258046, "epoch": 2132} {"train_loss": -41.922210693359375, "global_step": 258047, "epoch": 2132} {"train_loss": -41.7125129699707, "global_step": 258048, "epoch": 2132} {"train_loss": -41.6019401550293, "global_step": 258049, "epoch": 2132} {"train_loss": -42.73836898803711, "global_step": 258050, "epoch": 2132} {"train_loss": -42.92222213745117, "global_step": 258051, "epoch": 2132} {"train_loss": -42.76316452026367, "global_step": 258052, "epoch": 2132} {"train_loss": -41.92306900024414, "global_step": 258053, "epoch": 2132} {"train_loss": -41.94805908203125, "global_step": 258054, "epoch": 2132} {"train_loss": -42.68703842163086, "global_step": 258055, "epoch": 2132} {"train_loss": -42.872108459472656, "global_step": 258056, "epoch": 2132} {"train_loss": -42.10663986206055, "global_step": 258057, "epoch": 2132} {"train_loss": -42.823394775390625, "global_step": 258058, "epoch": 2132} {"train_loss": -42.641944885253906, "global_step": 258059, "epoch": 2132} {"train_loss": -40.779701232910156, "global_step": 258060, "epoch": 2132} {"train_loss": -42.95840072631836, "global_step": 258061, "epoch": 2132} {"train_loss": -42.588069915771484, "global_step": 258062, "epoch": 2132} {"train_loss": -41.588382720947266, "global_step": 258063, "epoch": 2132} {"train_loss": -42.293331146240234, "global_step": 258064, "epoch": 2132} {"train_loss": -42.1699333190918, "global_step": 258065, "epoch": 2132} {"train_loss": -42.634429931640625, "global_step": 258066, "epoch": 2132} {"train_loss": -41.39483642578125, "global_step": 258067, "epoch": 2132} {"train_loss": -42.895660400390625, "global_step": 258068, "epoch": 2132} {"train_loss": -42.27682113647461, "global_step": 258069, "epoch": 2132} {"train_loss": -41.100215911865234, "global_step": 258070, "epoch": 2132} {"train_loss": -39.884559631347656, "global_step": 258071, "epoch": 2132} {"train_loss": -41.56612777709961, "global_step": 258072, "epoch": 2132} {"train_loss": -42.60454177856445, "global_step": 258073, "epoch": 2132} {"train_loss": -41.859886169433594, "global_step": 258074, "epoch": 2132} {"train_loss": -42.89229965209961, "global_step": 258075, "epoch": 2132} {"train_loss": -42.240447998046875, "global_step": 258076, "epoch": 2132} {"train_loss": -41.32328414916992, "global_step": 258077, "epoch": 2132} {"train_loss": -42.21452713012695, "global_step": 258078, "epoch": 2132} {"train_loss": -43.04841232299805, "global_step": 258079, "epoch": 2132} {"train_loss": -42.601470947265625, "global_step": 258080, "epoch": 2132} {"train_loss": -42.8221321105957, "global_step": 258081, "epoch": 2132} {"train_loss": -43.255455017089844, "global_step": 258082, "epoch": 2132} {"train_loss": -42.865455627441406, "global_step": 258083, "epoch": 2132} {"train_loss": -42.26694869995117, "global_step": 258084, "epoch": 2132} {"train_loss": -43.1424446105957, "global_step": 258085, "epoch": 2132} {"train_loss": -41.57234573364258, "global_step": 258086, "epoch": 2132} {"train_loss": -41.881126403808594, "global_step": 258087, "epoch": 2132} {"train_loss": -42.08077621459961, "global_step": 258088, "epoch": 2132} {"train_loss": -42.390647888183594, "global_step": 258089, "epoch": 2132} {"train_loss": -41.50826644897461, "global_step": 258090, "epoch": 2132} {"train_loss": -43.12942123413086, "global_step": 258091, "epoch": 2132} {"train_loss": -41.13712118479831, "global_step": 258092, "epoch": 2132, "val_loss": 2772191.0} {"train_loss": -42.6333122253418, "global_step": 258093, "epoch": 2133} {"train_loss": -42.97700119018555, "global_step": 258094, "epoch": 2133} {"train_loss": -43.0811767578125, "global_step": 258095, "epoch": 2133} {"train_loss": -42.199825286865234, "global_step": 258096, "epoch": 2133} {"train_loss": -42.4128532409668, "global_step": 258097, "epoch": 2133} {"train_loss": -38.890907287597656, "global_step": 258098, "epoch": 2133} {"train_loss": -42.41400909423828, "global_step": 258099, "epoch": 2133} {"train_loss": -43.25932312011719, "global_step": 258100, "epoch": 2133} {"train_loss": -42.55473709106445, "global_step": 258101, "epoch": 2133} {"train_loss": -42.93264389038086, "global_step": 258102, "epoch": 2133} {"train_loss": -42.926204681396484, "global_step": 258103, "epoch": 2133} {"train_loss": -41.85848617553711, "global_step": 258104, "epoch": 2133} {"train_loss": -41.926509857177734, "global_step": 258105, "epoch": 2133} {"train_loss": -43.019588470458984, "global_step": 258106, "epoch": 2133} {"train_loss": -42.90032196044922, "global_step": 258107, "epoch": 2133} {"train_loss": -43.059566497802734, "global_step": 258108, "epoch": 2133} {"train_loss": -42.809661865234375, "global_step": 258109, "epoch": 2133} {"train_loss": -43.24201583862305, "global_step": 258110, "epoch": 2133} {"train_loss": -43.03965759277344, "global_step": 258111, "epoch": 2133} {"train_loss": -42.50630187988281, "global_step": 258112, "epoch": 2133} {"train_loss": -42.557151794433594, "global_step": 258113, "epoch": 2133} {"train_loss": -42.922542572021484, "global_step": 258114, "epoch": 2133} {"train_loss": -43.46291732788086, "global_step": 258115, "epoch": 2133} {"train_loss": -42.93275833129883, "global_step": 258116, "epoch": 2133} {"train_loss": -42.96515655517578, "global_step": 258117, "epoch": 2133} {"train_loss": -43.05906295776367, "global_step": 258118, "epoch": 2133} {"train_loss": -42.680335998535156, "global_step": 258119, "epoch": 2133} {"train_loss": -42.993019104003906, "global_step": 258120, "epoch": 2133} {"train_loss": -41.40713119506836, "global_step": 258121, "epoch": 2133} {"train_loss": -42.8485221862793, "global_step": 258122, "epoch": 2133} {"train_loss": -42.782325744628906, "global_step": 258123, "epoch": 2133} {"train_loss": -42.542198181152344, "global_step": 258124, "epoch": 2133} {"train_loss": -42.6602897644043, "global_step": 258125, "epoch": 2133} {"train_loss": -41.654197692871094, "global_step": 258126, "epoch": 2133} {"train_loss": -42.59513473510742, "global_step": 258127, "epoch": 2133} {"train_loss": -43.432716369628906, "global_step": 258128, "epoch": 2133} {"train_loss": -42.12035369873047, "global_step": 258129, "epoch": 2133} {"train_loss": -42.956844329833984, "global_step": 258130, "epoch": 2133} {"train_loss": -41.8620491027832, "global_step": 258131, "epoch": 2133} {"train_loss": -43.24126052856445, "global_step": 258132, "epoch": 2133} {"train_loss": -43.25642013549805, "global_step": 258133, "epoch": 2133} {"train_loss": -40.983192443847656, "global_step": 258134, "epoch": 2133} {"train_loss": -41.3187370300293, "global_step": 258135, "epoch": 2133} {"train_loss": -40.342132568359375, "global_step": 258136, "epoch": 2133} {"train_loss": -38.95228958129883, "global_step": 258137, "epoch": 2133} {"train_loss": -34.35853576660156, "global_step": 258138, "epoch": 2133} {"train_loss": -31.263504028320312, "global_step": 258139, "epoch": 2133} {"train_loss": -34.67633056640625, "global_step": 258140, "epoch": 2133} {"train_loss": -36.97053527832031, "global_step": 258141, "epoch": 2133} {"train_loss": -39.768985748291016, "global_step": 258142, "epoch": 2133} {"train_loss": -40.96479415893555, "global_step": 258143, "epoch": 2133} {"train_loss": -42.03446578979492, "global_step": 258144, "epoch": 2133} {"train_loss": -40.414669036865234, "global_step": 258145, "epoch": 2133} {"train_loss": -38.79552459716797, "global_step": 258146, "epoch": 2133} {"train_loss": -40.25682067871094, "global_step": 258147, "epoch": 2133} {"train_loss": -39.850929260253906, "global_step": 258148, "epoch": 2133} {"train_loss": -39.029754638671875, "global_step": 258149, "epoch": 2133} {"train_loss": -37.08779525756836, "global_step": 258150, "epoch": 2133} {"train_loss": -39.947811126708984, "global_step": 258151, "epoch": 2133} {"train_loss": -40.337730407714844, "global_step": 258152, "epoch": 2133} {"train_loss": -37.995357513427734, "global_step": 258153, "epoch": 2133} {"train_loss": -38.98263168334961, "global_step": 258154, "epoch": 2133} {"train_loss": -37.52975082397461, "global_step": 258155, "epoch": 2133} {"train_loss": -39.374874114990234, "global_step": 258156, "epoch": 2133} {"train_loss": -40.66405487060547, "global_step": 258157, "epoch": 2133} {"train_loss": -41.14429473876953, "global_step": 258158, "epoch": 2133} {"train_loss": -37.383541107177734, "global_step": 258159, "epoch": 2133} {"train_loss": -41.830413818359375, "global_step": 258160, "epoch": 2133} {"train_loss": -38.58534240722656, "global_step": 258161, "epoch": 2133} {"train_loss": -39.33659744262695, "global_step": 258162, "epoch": 2133} {"train_loss": -41.36473083496094, "global_step": 258163, "epoch": 2133} {"train_loss": -40.32638168334961, "global_step": 258164, "epoch": 2133} {"train_loss": -41.95781326293945, "global_step": 258165, "epoch": 2133} {"train_loss": -40.69812774658203, "global_step": 258166, "epoch": 2133} {"train_loss": -41.34968185424805, "global_step": 258167, "epoch": 2133} {"train_loss": -41.18819046020508, "global_step": 258168, "epoch": 2133} {"train_loss": -41.6838493347168, "global_step": 258169, "epoch": 2133} {"train_loss": -41.27130126953125, "global_step": 258170, "epoch": 2133} {"train_loss": -41.69526290893555, "global_step": 258171, "epoch": 2133} {"train_loss": -41.823524475097656, "global_step": 258172, "epoch": 2133} {"train_loss": -40.79859161376953, "global_step": 258173, "epoch": 2133} {"train_loss": -40.19569778442383, "global_step": 258174, "epoch": 2133} {"train_loss": -41.77521896362305, "global_step": 258175, "epoch": 2133} {"train_loss": -40.29889678955078, "global_step": 258176, "epoch": 2133} {"train_loss": -42.20539474487305, "global_step": 258177, "epoch": 2133} {"train_loss": -40.2845344543457, "global_step": 258178, "epoch": 2133} {"train_loss": -41.72910690307617, "global_step": 258179, "epoch": 2133} {"train_loss": -41.29753875732422, "global_step": 258180, "epoch": 2133} {"train_loss": -41.6119499206543, "global_step": 258181, "epoch": 2133} {"train_loss": -40.869606018066406, "global_step": 258182, "epoch": 2133} {"train_loss": -42.0913200378418, "global_step": 258183, "epoch": 2133} {"train_loss": -42.47801971435547, "global_step": 258184, "epoch": 2133} {"train_loss": -41.708465576171875, "global_step": 258185, "epoch": 2133} {"train_loss": -40.65803146362305, "global_step": 258186, "epoch": 2133} {"train_loss": -41.67261505126953, "global_step": 258187, "epoch": 2133} {"train_loss": -41.348453521728516, "global_step": 258188, "epoch": 2133} {"train_loss": -42.03618240356445, "global_step": 258189, "epoch": 2133} {"train_loss": -41.78309631347656, "global_step": 258190, "epoch": 2133} {"train_loss": -42.06241989135742, "global_step": 258191, "epoch": 2133} {"train_loss": -42.072505950927734, "global_step": 258192, "epoch": 2133} {"train_loss": -41.72864532470703, "global_step": 258193, "epoch": 2133} {"train_loss": -41.93110275268555, "global_step": 258194, "epoch": 2133} {"train_loss": -41.68410873413086, "global_step": 258195, "epoch": 2133} {"train_loss": -41.84503173828125, "global_step": 258196, "epoch": 2133} {"train_loss": -42.04838180541992, "global_step": 258197, "epoch": 2133} {"train_loss": -41.69076156616211, "global_step": 258198, "epoch": 2133} {"train_loss": -42.60856246948242, "global_step": 258199, "epoch": 2133} {"train_loss": -42.62409973144531, "global_step": 258200, "epoch": 2133} {"train_loss": -42.43185043334961, "global_step": 258201, "epoch": 2133} {"train_loss": -42.65185546875, "global_step": 258202, "epoch": 2133} {"train_loss": -42.90279006958008, "global_step": 258203, "epoch": 2133} {"train_loss": -42.885414123535156, "global_step": 258204, "epoch": 2133} {"train_loss": -42.51164627075195, "global_step": 258205, "epoch": 2133} {"train_loss": -42.78678512573242, "global_step": 258206, "epoch": 2133} {"train_loss": -42.080177307128906, "global_step": 258207, "epoch": 2133} {"train_loss": -42.76746368408203, "global_step": 258208, "epoch": 2133} {"train_loss": -42.55000686645508, "global_step": 258209, "epoch": 2133} {"train_loss": -43.078067779541016, "global_step": 258210, "epoch": 2133} {"train_loss": -43.156246185302734, "global_step": 258211, "epoch": 2133} {"train_loss": -42.91933822631836, "global_step": 258212, "epoch": 2133} {"train_loss": -41.391229550700544, "global_step": 258213, "epoch": 2133, "val_loss": 2748742.75} {"train_loss": -42.526119232177734, "global_step": 258214, "epoch": 2134} {"train_loss": -42.4528923034668, "global_step": 258215, "epoch": 2134} {"train_loss": -42.76119613647461, "global_step": 258216, "epoch": 2134} {"train_loss": -37.24532699584961, "global_step": 258217, "epoch": 2134} {"train_loss": -42.282264709472656, "global_step": 258218, "epoch": 2134} {"train_loss": -40.97529983520508, "global_step": 258219, "epoch": 2134} {"train_loss": -43.03239059448242, "global_step": 258220, "epoch": 2134} {"train_loss": -40.40718078613281, "global_step": 258221, "epoch": 2134} {"train_loss": -40.060150146484375, "global_step": 258222, "epoch": 2134} {"train_loss": -42.18840026855469, "global_step": 258223, "epoch": 2134} {"train_loss": -40.78615188598633, "global_step": 258224, "epoch": 2134} {"train_loss": -40.508968353271484, "global_step": 258225, "epoch": 2134} {"train_loss": -19.03067970275879, "global_step": 258226, "epoch": 2134} {"train_loss": -33.134033203125, "global_step": 258227, "epoch": 2134} {"train_loss": -36.171348571777344, "global_step": 258228, "epoch": 2134} {"train_loss": -39.04098129272461, "global_step": 258229, "epoch": 2134} {"train_loss": -36.50620651245117, "global_step": 258230, "epoch": 2134} {"train_loss": -39.04635238647461, "global_step": 258231, "epoch": 2134} {"train_loss": -36.07967758178711, "global_step": 258232, "epoch": 2134} {"train_loss": -39.129066467285156, "global_step": 258233, "epoch": 2134} {"train_loss": -38.4869270324707, "global_step": 258234, "epoch": 2134} {"train_loss": -37.09873580932617, "global_step": 258235, "epoch": 2134} {"train_loss": -37.98525619506836, "global_step": 258236, "epoch": 2134} {"train_loss": -37.2691535949707, "global_step": 258237, "epoch": 2134} {"train_loss": -34.78638458251953, "global_step": 258238, "epoch": 2134} {"train_loss": -36.6329460144043, "global_step": 258239, "epoch": 2134} {"train_loss": -38.67985153198242, "global_step": 258240, "epoch": 2134} {"train_loss": -35.67829132080078, "global_step": 258241, "epoch": 2134} {"train_loss": -39.21550750732422, "global_step": 258242, "epoch": 2134} {"train_loss": -39.674556732177734, "global_step": 258243, "epoch": 2134} {"train_loss": -36.929595947265625, "global_step": 258244, "epoch": 2134} {"train_loss": -36.37760543823242, "global_step": 258245, "epoch": 2134} {"train_loss": -37.479305267333984, "global_step": 258246, "epoch": 2134} {"train_loss": -37.98043441772461, "global_step": 258247, "epoch": 2134} {"train_loss": -31.815296173095703, "global_step": 258248, "epoch": 2134} {"train_loss": -37.74456787109375, "global_step": 258249, "epoch": 2134} {"train_loss": -37.81098937988281, "global_step": 258250, "epoch": 2134} {"train_loss": -39.85942459106445, "global_step": 258251, "epoch": 2134} {"train_loss": -36.89599609375, "global_step": 258252, "epoch": 2134} {"train_loss": -38.432437896728516, "global_step": 258253, "epoch": 2134} {"train_loss": -38.44916915893555, "global_step": 258254, "epoch": 2134} {"train_loss": -38.98212814331055, "global_step": 258255, "epoch": 2134} {"train_loss": -37.403175354003906, "global_step": 258256, "epoch": 2134} {"train_loss": -38.01217269897461, "global_step": 258257, "epoch": 2134} {"train_loss": -39.03506088256836, "global_step": 258258, "epoch": 2134} {"train_loss": -39.077144622802734, "global_step": 258259, "epoch": 2134} {"train_loss": -39.904178619384766, "global_step": 258260, "epoch": 2134} {"train_loss": -40.11040115356445, "global_step": 258261, "epoch": 2134} {"train_loss": -39.49056625366211, "global_step": 258262, "epoch": 2134} {"train_loss": -39.99711990356445, "global_step": 258263, "epoch": 2134} {"train_loss": -39.54148483276367, "global_step": 258264, "epoch": 2134} {"train_loss": -40.20894241333008, "global_step": 258265, "epoch": 2134} {"train_loss": -38.742427825927734, "global_step": 258266, "epoch": 2134} {"train_loss": -40.899532318115234, "global_step": 258267, "epoch": 2134} {"train_loss": -39.56387710571289, "global_step": 258268, "epoch": 2134} {"train_loss": -40.20836639404297, "global_step": 258269, "epoch": 2134} {"train_loss": -38.982765197753906, "global_step": 258270, "epoch": 2134} {"train_loss": -40.05100631713867, "global_step": 258271, "epoch": 2134} {"train_loss": -39.799800872802734, "global_step": 258272, "epoch": 2134} {"train_loss": -39.53164291381836, "global_step": 258273, "epoch": 2134} {"train_loss": -40.1700553894043, "global_step": 258274, "epoch": 2134} {"train_loss": -41.00801467895508, "global_step": 258275, "epoch": 2134} {"train_loss": -40.86085891723633, "global_step": 258276, "epoch": 2134} {"train_loss": -40.19627380371094, "global_step": 258277, "epoch": 2134} {"train_loss": -40.843017578125, "global_step": 258278, "epoch": 2134} {"train_loss": -40.730812072753906, "global_step": 258279, "epoch": 2134} {"train_loss": -40.90358352661133, "global_step": 258280, "epoch": 2134} {"train_loss": -41.429569244384766, "global_step": 258281, "epoch": 2134} {"train_loss": -39.99262237548828, "global_step": 258282, "epoch": 2134} {"train_loss": -41.49468994140625, "global_step": 258283, "epoch": 2134} {"train_loss": -41.87459945678711, "global_step": 258284, "epoch": 2134} {"train_loss": -41.290409088134766, "global_step": 258285, "epoch": 2134} {"train_loss": -41.33882141113281, "global_step": 258286, "epoch": 2134} {"train_loss": -41.154178619384766, "global_step": 258287, "epoch": 2134} {"train_loss": -41.311378479003906, "global_step": 258288, "epoch": 2134} {"train_loss": -41.27448272705078, "global_step": 258289, "epoch": 2134} {"train_loss": -41.50770950317383, "global_step": 258290, "epoch": 2134} {"train_loss": -41.92455291748047, "global_step": 258291, "epoch": 2134} {"train_loss": -41.12450408935547, "global_step": 258292, "epoch": 2134} {"train_loss": -40.68650436401367, "global_step": 258293, "epoch": 2134} {"train_loss": -42.0792121887207, "global_step": 258294, "epoch": 2134} {"train_loss": -41.55707550048828, "global_step": 258295, "epoch": 2134} {"train_loss": -40.14260482788086, "global_step": 258296, "epoch": 2134} {"train_loss": -40.743431091308594, "global_step": 258297, "epoch": 2134} {"train_loss": -40.9935417175293, "global_step": 258298, "epoch": 2134} {"train_loss": -41.95566940307617, "global_step": 258299, "epoch": 2134} {"train_loss": -41.97768783569336, "global_step": 258300, "epoch": 2134} {"train_loss": -41.36840057373047, "global_step": 258301, "epoch": 2134} {"train_loss": -42.39976119995117, "global_step": 258302, "epoch": 2134} {"train_loss": -42.08192443847656, "global_step": 258303, "epoch": 2134} {"train_loss": -41.55775833129883, "global_step": 258304, "epoch": 2134} {"train_loss": -41.987037658691406, "global_step": 258305, "epoch": 2134} {"train_loss": -41.14303970336914, "global_step": 258306, "epoch": 2134} {"train_loss": -41.71149444580078, "global_step": 258307, "epoch": 2134} {"train_loss": -42.46099853515625, "global_step": 258308, "epoch": 2134} {"train_loss": -41.97123336791992, "global_step": 258309, "epoch": 2134} {"train_loss": -41.85647201538086, "global_step": 258310, "epoch": 2134} {"train_loss": -42.637516021728516, "global_step": 258311, "epoch": 2134} {"train_loss": -42.58063888549805, "global_step": 258312, "epoch": 2134} {"train_loss": -41.71512222290039, "global_step": 258313, "epoch": 2134} {"train_loss": -42.357295989990234, "global_step": 258314, "epoch": 2134} {"train_loss": -42.140594482421875, "global_step": 258315, "epoch": 2134} {"train_loss": -41.807647705078125, "global_step": 258316, "epoch": 2134} {"train_loss": -42.563899993896484, "global_step": 258317, "epoch": 2134} {"train_loss": -42.40702438354492, "global_step": 258318, "epoch": 2134} {"train_loss": -42.31740951538086, "global_step": 258319, "epoch": 2134} {"train_loss": -41.235145568847656, "global_step": 258320, "epoch": 2134} {"train_loss": -42.941585540771484, "global_step": 258321, "epoch": 2134} {"train_loss": -42.47062683105469, "global_step": 258322, "epoch": 2134} {"train_loss": -42.22726058959961, "global_step": 258323, "epoch": 2134} {"train_loss": -43.0532341003418, "global_step": 258324, "epoch": 2134} {"train_loss": -42.7574577331543, "global_step": 258325, "epoch": 2134} {"train_loss": -42.01247787475586, "global_step": 258326, "epoch": 2134} {"train_loss": -42.80759811401367, "global_step": 258327, "epoch": 2134} {"train_loss": -41.62776565551758, "global_step": 258328, "epoch": 2134} {"train_loss": -42.12938690185547, "global_step": 258329, "epoch": 2134} {"train_loss": -41.990211486816406, "global_step": 258330, "epoch": 2134} {"train_loss": -41.29273223876953, "global_step": 258331, "epoch": 2134} {"train_loss": -42.42233657836914, "global_step": 258332, "epoch": 2134} {"train_loss": -42.636322021484375, "global_step": 258333, "epoch": 2134} {"train_loss": -40.092603809577376, "global_step": 258334, "epoch": 2134, "val_loss": 2578095.25} {"train_loss": -42.43550109863281, "global_step": 258335, "epoch": 2135} {"train_loss": -41.81623077392578, "global_step": 258336, "epoch": 2135} {"train_loss": -42.96576690673828, "global_step": 258337, "epoch": 2135} {"train_loss": -41.718101501464844, "global_step": 258338, "epoch": 2135} {"train_loss": -41.609375, "global_step": 258339, "epoch": 2135} {"train_loss": -42.2274169921875, "global_step": 258340, "epoch": 2135} {"train_loss": -41.96733474731445, "global_step": 258341, "epoch": 2135} {"train_loss": -41.08486557006836, "global_step": 258342, "epoch": 2135} {"train_loss": -40.40568923950195, "global_step": 258343, "epoch": 2135} {"train_loss": -40.061031341552734, "global_step": 258344, "epoch": 2135} {"train_loss": -42.47921371459961, "global_step": 258345, "epoch": 2135} {"train_loss": -38.807716369628906, "global_step": 258346, "epoch": 2135} {"train_loss": -40.01528549194336, "global_step": 258347, "epoch": 2135} {"train_loss": -39.21753692626953, "global_step": 258348, "epoch": 2135} {"train_loss": -40.581512451171875, "global_step": 258349, "epoch": 2135} {"train_loss": -38.2764778137207, "global_step": 258350, "epoch": 2135} {"train_loss": -39.68123245239258, "global_step": 258351, "epoch": 2135} {"train_loss": -36.37928009033203, "global_step": 258352, "epoch": 2135} {"train_loss": -38.21296310424805, "global_step": 258353, "epoch": 2135} {"train_loss": -39.23604965209961, "global_step": 258354, "epoch": 2135} {"train_loss": -38.84272384643555, "global_step": 258355, "epoch": 2135} {"train_loss": -39.78092575073242, "global_step": 258356, "epoch": 2135} {"train_loss": -40.003387451171875, "global_step": 258357, "epoch": 2135} {"train_loss": -39.99165725708008, "global_step": 258358, "epoch": 2135} {"train_loss": -37.49633026123047, "global_step": 258359, "epoch": 2135} {"train_loss": -40.67605209350586, "global_step": 258360, "epoch": 2135} {"train_loss": -36.28093338012695, "global_step": 258361, "epoch": 2135} {"train_loss": -38.63979721069336, "global_step": 258362, "epoch": 2135} {"train_loss": -35.909297943115234, "global_step": 258363, "epoch": 2135} {"train_loss": -37.910125732421875, "global_step": 258364, "epoch": 2135} {"train_loss": -38.6437873840332, "global_step": 258365, "epoch": 2135} {"train_loss": -38.30220413208008, "global_step": 258366, "epoch": 2135} {"train_loss": -38.220882415771484, "global_step": 258367, "epoch": 2135} {"train_loss": -40.103397369384766, "global_step": 258368, "epoch": 2135} {"train_loss": -36.10856628417969, "global_step": 258369, "epoch": 2135} {"train_loss": -40.552547454833984, "global_step": 258370, "epoch": 2135} {"train_loss": -37.67770767211914, "global_step": 258371, "epoch": 2135} {"train_loss": -38.30573654174805, "global_step": 258372, "epoch": 2135} {"train_loss": -39.862525939941406, "global_step": 258373, "epoch": 2135} {"train_loss": -40.161720275878906, "global_step": 258374, "epoch": 2135} {"train_loss": -39.610618591308594, "global_step": 258375, "epoch": 2135} {"train_loss": -39.78995895385742, "global_step": 258376, "epoch": 2135} {"train_loss": -40.19646072387695, "global_step": 258377, "epoch": 2135} {"train_loss": -40.47086715698242, "global_step": 258378, "epoch": 2135} {"train_loss": -40.48478317260742, "global_step": 258379, "epoch": 2135} {"train_loss": -41.2368049621582, "global_step": 258380, "epoch": 2135} {"train_loss": -39.98470687866211, "global_step": 258381, "epoch": 2135} {"train_loss": -40.535030364990234, "global_step": 258382, "epoch": 2135} {"train_loss": -40.472389221191406, "global_step": 258383, "epoch": 2135} {"train_loss": -41.54581832885742, "global_step": 258384, "epoch": 2135} {"train_loss": -40.19319534301758, "global_step": 258385, "epoch": 2135} {"train_loss": -41.114498138427734, "global_step": 258386, "epoch": 2135} {"train_loss": -41.41477584838867, "global_step": 258387, "epoch": 2135} {"train_loss": -41.75482940673828, "global_step": 258388, "epoch": 2135} {"train_loss": -40.99235153198242, "global_step": 258389, "epoch": 2135} {"train_loss": -41.699222564697266, "global_step": 258390, "epoch": 2135} {"train_loss": -42.168182373046875, "global_step": 258391, "epoch": 2135} {"train_loss": -41.32966995239258, "global_step": 258392, "epoch": 2135} {"train_loss": -41.65114974975586, "global_step": 258393, "epoch": 2135} {"train_loss": -41.9110107421875, "global_step": 258394, "epoch": 2135} {"train_loss": -42.00339889526367, "global_step": 258395, "epoch": 2135} {"train_loss": -41.63378143310547, "global_step": 258396, "epoch": 2135} {"train_loss": -42.078887939453125, "global_step": 258397, "epoch": 2135} {"train_loss": -42.275543212890625, "global_step": 258398, "epoch": 2135} {"train_loss": -42.53858184814453, "global_step": 258399, "epoch": 2135} {"train_loss": -41.88625717163086, "global_step": 258400, "epoch": 2135} {"train_loss": -42.27254867553711, "global_step": 258401, "epoch": 2135} {"train_loss": -42.385459899902344, "global_step": 258402, "epoch": 2135} {"train_loss": -42.30495071411133, "global_step": 258403, "epoch": 2135} {"train_loss": -41.41974639892578, "global_step": 258404, "epoch": 2135} {"train_loss": -41.717010498046875, "global_step": 258405, "epoch": 2135} {"train_loss": -41.69758224487305, "global_step": 258406, "epoch": 2135} {"train_loss": -42.93050765991211, "global_step": 258407, "epoch": 2135} {"train_loss": -41.957611083984375, "global_step": 258408, "epoch": 2135} {"train_loss": -42.53593063354492, "global_step": 258409, "epoch": 2135} {"train_loss": -42.39929962158203, "global_step": 258410, "epoch": 2135} {"train_loss": -42.39131164550781, "global_step": 258411, "epoch": 2135} {"train_loss": -42.78876495361328, "global_step": 258412, "epoch": 2135} {"train_loss": -42.57706832885742, "global_step": 258413, "epoch": 2135} {"train_loss": -43.253231048583984, "global_step": 258414, "epoch": 2135} {"train_loss": -42.29169845581055, "global_step": 258415, "epoch": 2135} {"train_loss": -42.67218780517578, "global_step": 258416, "epoch": 2135} {"train_loss": -42.100852966308594, "global_step": 258417, "epoch": 2135} {"train_loss": -42.77158737182617, "global_step": 258418, "epoch": 2135} {"train_loss": -42.72455596923828, "global_step": 258419, "epoch": 2135} {"train_loss": -43.183631896972656, "global_step": 258420, "epoch": 2135} {"train_loss": -42.71634292602539, "global_step": 258421, "epoch": 2135} {"train_loss": -43.158172607421875, "global_step": 258422, "epoch": 2135} {"train_loss": -42.86580276489258, "global_step": 258423, "epoch": 2135} {"train_loss": -42.738887786865234, "global_step": 258424, "epoch": 2135} {"train_loss": -43.3465576171875, "global_step": 258425, "epoch": 2135} {"train_loss": -42.77290725708008, "global_step": 258426, "epoch": 2135} {"train_loss": -42.71263885498047, "global_step": 258427, "epoch": 2135} {"train_loss": -43.2633056640625, "global_step": 258428, "epoch": 2135} {"train_loss": -42.59135818481445, "global_step": 258429, "epoch": 2135} {"train_loss": -43.17475509643555, "global_step": 258430, "epoch": 2135} {"train_loss": -42.911190032958984, "global_step": 258431, "epoch": 2135} {"train_loss": -43.4770393371582, "global_step": 258432, "epoch": 2135} {"train_loss": -43.2268180847168, "global_step": 258433, "epoch": 2135} {"train_loss": -42.47743606567383, "global_step": 258434, "epoch": 2135} {"train_loss": -43.62288284301758, "global_step": 258435, "epoch": 2135} {"train_loss": -43.536434173583984, "global_step": 258436, "epoch": 2135} {"train_loss": -42.832515716552734, "global_step": 258437, "epoch": 2135} {"train_loss": -42.85478591918945, "global_step": 258438, "epoch": 2135} {"train_loss": -43.215423583984375, "global_step": 258439, "epoch": 2135} {"train_loss": -42.4030876159668, "global_step": 258440, "epoch": 2135} {"train_loss": -43.722347259521484, "global_step": 258441, "epoch": 2135} {"train_loss": -43.13690948486328, "global_step": 258442, "epoch": 2135} {"train_loss": -43.20649337768555, "global_step": 258443, "epoch": 2135} {"train_loss": -43.13019943237305, "global_step": 258444, "epoch": 2135} {"train_loss": -41.73109817504883, "global_step": 258445, "epoch": 2135} {"train_loss": -42.3265266418457, "global_step": 258446, "epoch": 2135} {"train_loss": -43.08378219604492, "global_step": 258447, "epoch": 2135} {"train_loss": -42.94380187988281, "global_step": 258448, "epoch": 2135} {"train_loss": -43.225738525390625, "global_step": 258449, "epoch": 2135} {"train_loss": -43.632137298583984, "global_step": 258450, "epoch": 2135} {"train_loss": -43.2695426940918, "global_step": 258451, "epoch": 2135} {"train_loss": -43.511226654052734, "global_step": 258452, "epoch": 2135} {"train_loss": -43.037044525146484, "global_step": 258453, "epoch": 2135} {"train_loss": -43.196075439453125, "global_step": 258454, "epoch": 2135} {"train_loss": -41.385711764501146, "global_step": 258455, "epoch": 2135, "val_loss": 2576316.25} {"train_loss": -43.048736572265625, "global_step": 258456, "epoch": 2136} {"train_loss": -43.2779541015625, "global_step": 258457, "epoch": 2136} {"train_loss": -43.11854934692383, "global_step": 258458, "epoch": 2136} {"train_loss": -42.89583206176758, "global_step": 258459, "epoch": 2136} {"train_loss": -43.66796875, "global_step": 258460, "epoch": 2136} {"train_loss": -43.0263786315918, "global_step": 258461, "epoch": 2136} {"train_loss": -42.907310485839844, "global_step": 258462, "epoch": 2136} {"train_loss": -43.071266174316406, "global_step": 258463, "epoch": 2136} {"train_loss": -42.2332649230957, "global_step": 258464, "epoch": 2136} {"train_loss": -42.92246627807617, "global_step": 258465, "epoch": 2136} {"train_loss": -42.32282638549805, "global_step": 258466, "epoch": 2136} {"train_loss": -42.30585861206055, "global_step": 258467, "epoch": 2136} {"train_loss": -42.28567123413086, "global_step": 258468, "epoch": 2136} {"train_loss": -42.07063674926758, "global_step": 258469, "epoch": 2136} {"train_loss": -41.313602447509766, "global_step": 258470, "epoch": 2136} {"train_loss": -41.34963607788086, "global_step": 258471, "epoch": 2136} {"train_loss": -37.455047607421875, "global_step": 258472, "epoch": 2136} {"train_loss": -28.790821075439453, "global_step": 258473, "epoch": 2136} {"train_loss": -10.75458812713623, "global_step": 258474, "epoch": 2136} {"train_loss": -5.293290138244629, "global_step": 258475, "epoch": 2136} {"train_loss": -34.00338363647461, "global_step": 258476, "epoch": 2136} {"train_loss": -33.43246078491211, "global_step": 258477, "epoch": 2136} {"train_loss": -31.1009521484375, "global_step": 258478, "epoch": 2136} {"train_loss": -34.33231735229492, "global_step": 258479, "epoch": 2136} {"train_loss": -22.451379776000977, "global_step": 258480, "epoch": 2136} {"train_loss": -36.58392333984375, "global_step": 258481, "epoch": 2136} {"train_loss": -30.949417114257812, "global_step": 258482, "epoch": 2136} {"train_loss": -39.486419677734375, "global_step": 258483, "epoch": 2136} {"train_loss": -32.26650619506836, "global_step": 258484, "epoch": 2136} {"train_loss": -37.88883590698242, "global_step": 258485, "epoch": 2136} {"train_loss": -35.59765625, "global_step": 258486, "epoch": 2136} {"train_loss": -39.34944534301758, "global_step": 258487, "epoch": 2136} {"train_loss": -37.48793029785156, "global_step": 258488, "epoch": 2136} {"train_loss": -36.55131149291992, "global_step": 258489, "epoch": 2136} {"train_loss": -38.253536224365234, "global_step": 258490, "epoch": 2136} {"train_loss": -36.1894645690918, "global_step": 258491, "epoch": 2136} {"train_loss": -39.13773727416992, "global_step": 258492, "epoch": 2136} {"train_loss": -36.42920684814453, "global_step": 258493, "epoch": 2136} {"train_loss": -39.35380172729492, "global_step": 258494, "epoch": 2136} {"train_loss": -37.90346908569336, "global_step": 258495, "epoch": 2136} {"train_loss": -37.00159454345703, "global_step": 258496, "epoch": 2136} {"train_loss": -40.307342529296875, "global_step": 258497, "epoch": 2136} {"train_loss": -38.87018966674805, "global_step": 258498, "epoch": 2136} {"train_loss": -39.059383392333984, "global_step": 258499, "epoch": 2136} {"train_loss": -40.30124282836914, "global_step": 258500, "epoch": 2136} {"train_loss": -39.284786224365234, "global_step": 258501, "epoch": 2136} {"train_loss": -39.91630172729492, "global_step": 258502, "epoch": 2136} {"train_loss": -40.4984130859375, "global_step": 258503, "epoch": 2136} {"train_loss": -39.87422561645508, "global_step": 258504, "epoch": 2136} {"train_loss": -40.5754280090332, "global_step": 258505, "epoch": 2136} {"train_loss": -40.27511215209961, "global_step": 258506, "epoch": 2136} {"train_loss": -39.5300178527832, "global_step": 258507, "epoch": 2136} {"train_loss": -40.5740852355957, "global_step": 258508, "epoch": 2136} {"train_loss": -40.01296615600586, "global_step": 258509, "epoch": 2136} {"train_loss": -40.491756439208984, "global_step": 258510, "epoch": 2136} {"train_loss": -40.7400016784668, "global_step": 258511, "epoch": 2136} {"train_loss": -40.25387191772461, "global_step": 258512, "epoch": 2136} {"train_loss": -40.58742141723633, "global_step": 258513, "epoch": 2136} {"train_loss": -40.981746673583984, "global_step": 258514, "epoch": 2136} {"train_loss": -40.87111282348633, "global_step": 258515, "epoch": 2136} {"train_loss": -41.482669830322266, "global_step": 258516, "epoch": 2136} {"train_loss": -41.09476852416992, "global_step": 258517, "epoch": 2136} {"train_loss": -41.00596237182617, "global_step": 258518, "epoch": 2136} {"train_loss": -41.68177032470703, "global_step": 258519, "epoch": 2136} {"train_loss": -40.94099807739258, "global_step": 258520, "epoch": 2136} {"train_loss": -40.85110092163086, "global_step": 258521, "epoch": 2136} {"train_loss": -41.8879280090332, "global_step": 258522, "epoch": 2136} {"train_loss": -41.11965560913086, "global_step": 258523, "epoch": 2136} {"train_loss": -41.468780517578125, "global_step": 258524, "epoch": 2136} {"train_loss": -41.88995361328125, "global_step": 258525, "epoch": 2136} {"train_loss": -41.82062911987305, "global_step": 258526, "epoch": 2136} {"train_loss": -41.73533248901367, "global_step": 258527, "epoch": 2136} {"train_loss": -41.67057418823242, "global_step": 258528, "epoch": 2136} {"train_loss": -41.37049102783203, "global_step": 258529, "epoch": 2136} {"train_loss": -41.696144104003906, "global_step": 258530, "epoch": 2136} {"train_loss": -41.92912673950195, "global_step": 258531, "epoch": 2136} {"train_loss": -42.02170944213867, "global_step": 258532, "epoch": 2136} {"train_loss": -40.8002815246582, "global_step": 258533, "epoch": 2136} {"train_loss": -42.01665115356445, "global_step": 258534, "epoch": 2136} {"train_loss": -41.94215774536133, "global_step": 258535, "epoch": 2136} {"train_loss": -42.3615837097168, "global_step": 258536, "epoch": 2136} {"train_loss": -42.02108383178711, "global_step": 258537, "epoch": 2136} {"train_loss": -42.18373107910156, "global_step": 258538, "epoch": 2136} {"train_loss": -42.206966400146484, "global_step": 258539, "epoch": 2136} {"train_loss": -42.04099655151367, "global_step": 258540, "epoch": 2136} {"train_loss": -36.65156936645508, "global_step": 258541, "epoch": 2136} {"train_loss": -42.04548263549805, "global_step": 258542, "epoch": 2136} {"train_loss": -42.58091354370117, "global_step": 258543, "epoch": 2136} {"train_loss": -42.39130783081055, "global_step": 258544, "epoch": 2136} {"train_loss": -42.556514739990234, "global_step": 258545, "epoch": 2136} {"train_loss": -42.46148681640625, "global_step": 258546, "epoch": 2136} {"train_loss": -42.58047103881836, "global_step": 258547, "epoch": 2136} {"train_loss": -42.50264358520508, "global_step": 258548, "epoch": 2136} {"train_loss": -42.555686950683594, "global_step": 258549, "epoch": 2136} {"train_loss": -42.50783920288086, "global_step": 258550, "epoch": 2136} {"train_loss": -42.47898483276367, "global_step": 258551, "epoch": 2136} {"train_loss": -42.43866729736328, "global_step": 258552, "epoch": 2136} {"train_loss": -41.92782211303711, "global_step": 258553, "epoch": 2136} {"train_loss": -41.26993942260742, "global_step": 258554, "epoch": 2136} {"train_loss": -40.89410400390625, "global_step": 258555, "epoch": 2136} {"train_loss": -42.5615234375, "global_step": 258556, "epoch": 2136} {"train_loss": -42.86469650268555, "global_step": 258557, "epoch": 2136} {"train_loss": -42.570831298828125, "global_step": 258558, "epoch": 2136} {"train_loss": -42.618038177490234, "global_step": 258559, "epoch": 2136} {"train_loss": -42.3436279296875, "global_step": 258560, "epoch": 2136} {"train_loss": -42.65568161010742, "global_step": 258561, "epoch": 2136} {"train_loss": -42.20746994018555, "global_step": 258562, "epoch": 2136} {"train_loss": -42.23995590209961, "global_step": 258563, "epoch": 2136} {"train_loss": -42.47787857055664, "global_step": 258564, "epoch": 2136} {"train_loss": -42.51728439331055, "global_step": 258565, "epoch": 2136} {"train_loss": -42.82006072998047, "global_step": 258566, "epoch": 2136} {"train_loss": -43.020748138427734, "global_step": 258567, "epoch": 2136} {"train_loss": -43.61775207519531, "global_step": 258568, "epoch": 2136} {"train_loss": -42.5532341003418, "global_step": 258569, "epoch": 2136} {"train_loss": -42.620582580566406, "global_step": 258570, "epoch": 2136} {"train_loss": -42.62815475463867, "global_step": 258571, "epoch": 2136} {"train_loss": -42.341434478759766, "global_step": 258572, "epoch": 2136} {"train_loss": -42.909053802490234, "global_step": 258573, "epoch": 2136} {"train_loss": -42.89360046386719, "global_step": 258574, "epoch": 2136} {"train_loss": -42.54082107543945, "global_step": 258575, "epoch": 2136} {"train_loss": -39.98223159726986, "global_step": 258576, "epoch": 2136, "val_loss": 2657026.75} {"train_loss": -43.275917053222656, "global_step": 258577, "epoch": 2137} {"train_loss": -43.37025451660156, "global_step": 258578, "epoch": 2137} {"train_loss": -43.42036437988281, "global_step": 258579, "epoch": 2137} {"train_loss": -42.2584342956543, "global_step": 258580, "epoch": 2137} {"train_loss": -42.97512435913086, "global_step": 258581, "epoch": 2137} {"train_loss": -42.80903625488281, "global_step": 258582, "epoch": 2137} {"train_loss": -42.695945739746094, "global_step": 258583, "epoch": 2137} {"train_loss": -42.7645378112793, "global_step": 258584, "epoch": 2137} {"train_loss": -34.82387924194336, "global_step": 258585, "epoch": 2137} {"train_loss": -43.12068557739258, "global_step": 258586, "epoch": 2137} {"train_loss": -42.68057632446289, "global_step": 258587, "epoch": 2137} {"train_loss": -42.254512786865234, "global_step": 258588, "epoch": 2137} {"train_loss": -42.82432174682617, "global_step": 258589, "epoch": 2137} {"train_loss": -43.42799758911133, "global_step": 258590, "epoch": 2137} {"train_loss": -43.18418502807617, "global_step": 258591, "epoch": 2137} {"train_loss": -42.784271240234375, "global_step": 258592, "epoch": 2137} {"train_loss": -42.023521423339844, "global_step": 258593, "epoch": 2137} {"train_loss": -41.483863830566406, "global_step": 258594, "epoch": 2137} {"train_loss": -40.89806365966797, "global_step": 258595, "epoch": 2137} {"train_loss": -43.23445510864258, "global_step": 258596, "epoch": 2137} {"train_loss": -42.627357482910156, "global_step": 258597, "epoch": 2137} {"train_loss": -41.54537582397461, "global_step": 258598, "epoch": 2137} {"train_loss": -40.65093231201172, "global_step": 258599, "epoch": 2137} {"train_loss": -41.3013916015625, "global_step": 258600, "epoch": 2137} {"train_loss": -43.01039505004883, "global_step": 258601, "epoch": 2137} {"train_loss": -42.313072204589844, "global_step": 258602, "epoch": 2137} {"train_loss": -40.56046676635742, "global_step": 258603, "epoch": 2137} {"train_loss": -42.25031280517578, "global_step": 258604, "epoch": 2137} {"train_loss": -43.20662307739258, "global_step": 258605, "epoch": 2137} {"train_loss": -41.76740646362305, "global_step": 258606, "epoch": 2137} {"train_loss": -42.1966438293457, "global_step": 258607, "epoch": 2137} {"train_loss": -42.516624450683594, "global_step": 258608, "epoch": 2137} {"train_loss": -42.78255081176758, "global_step": 258609, "epoch": 2137} {"train_loss": -43.336341857910156, "global_step": 258610, "epoch": 2137} {"train_loss": -36.71376037597656, "global_step": 258611, "epoch": 2137} {"train_loss": -42.90291213989258, "global_step": 258612, "epoch": 2137} {"train_loss": -41.96009063720703, "global_step": 258613, "epoch": 2137} {"train_loss": -41.88494110107422, "global_step": 258614, "epoch": 2137} {"train_loss": -41.886207580566406, "global_step": 258615, "epoch": 2137} {"train_loss": -42.728370666503906, "global_step": 258616, "epoch": 2137} {"train_loss": -42.367305755615234, "global_step": 258617, "epoch": 2137} {"train_loss": -41.655433654785156, "global_step": 258618, "epoch": 2137} {"train_loss": -41.386844635009766, "global_step": 258619, "epoch": 2137} {"train_loss": -42.426307678222656, "global_step": 258620, "epoch": 2137} {"train_loss": -42.534515380859375, "global_step": 258621, "epoch": 2137} {"train_loss": -41.89968490600586, "global_step": 258622, "epoch": 2137} {"train_loss": -39.80220413208008, "global_step": 258623, "epoch": 2137} {"train_loss": -41.15876770019531, "global_step": 258624, "epoch": 2137} {"train_loss": -41.87202835083008, "global_step": 258625, "epoch": 2137} {"train_loss": -41.97494125366211, "global_step": 258626, "epoch": 2137} {"train_loss": -41.46938705444336, "global_step": 258627, "epoch": 2137} {"train_loss": -40.79350662231445, "global_step": 258628, "epoch": 2137} {"train_loss": -42.55577850341797, "global_step": 258629, "epoch": 2137} {"train_loss": -35.245113372802734, "global_step": 258630, "epoch": 2137} {"train_loss": -40.67466354370117, "global_step": 258631, "epoch": 2137} {"train_loss": -35.48588943481445, "global_step": 258632, "epoch": 2137} {"train_loss": -39.5743293762207, "global_step": 258633, "epoch": 2137} {"train_loss": -41.89089584350586, "global_step": 258634, "epoch": 2137} {"train_loss": -40.058372497558594, "global_step": 258635, "epoch": 2137} {"train_loss": -39.5649528503418, "global_step": 258636, "epoch": 2137} {"train_loss": -40.47306823730469, "global_step": 258637, "epoch": 2137} {"train_loss": -39.085323333740234, "global_step": 258638, "epoch": 2137} {"train_loss": -40.27269744873047, "global_step": 258639, "epoch": 2137} {"train_loss": -40.845638275146484, "global_step": 258640, "epoch": 2137} {"train_loss": -36.64602279663086, "global_step": 258641, "epoch": 2137} {"train_loss": -40.138946533203125, "global_step": 258642, "epoch": 2137} {"train_loss": -38.2231559753418, "global_step": 258643, "epoch": 2137} {"train_loss": -40.02048873901367, "global_step": 258644, "epoch": 2137} {"train_loss": -38.061397552490234, "global_step": 258645, "epoch": 2137} {"train_loss": -36.00117111206055, "global_step": 258646, "epoch": 2137} {"train_loss": -38.69379425048828, "global_step": 258647, "epoch": 2137} {"train_loss": -32.59959030151367, "global_step": 258648, "epoch": 2137} {"train_loss": -36.57912826538086, "global_step": 258649, "epoch": 2137} {"train_loss": -33.757564544677734, "global_step": 258650, "epoch": 2137} {"train_loss": -39.89030075073242, "global_step": 258651, "epoch": 2137} {"train_loss": -38.467620849609375, "global_step": 258652, "epoch": 2137} {"train_loss": -39.90522003173828, "global_step": 258653, "epoch": 2137} {"train_loss": -36.13035583496094, "global_step": 258654, "epoch": 2137} {"train_loss": -39.156978607177734, "global_step": 258655, "epoch": 2137} {"train_loss": -40.350643157958984, "global_step": 258656, "epoch": 2137} {"train_loss": -40.60533905029297, "global_step": 258657, "epoch": 2137} {"train_loss": -37.792030334472656, "global_step": 258658, "epoch": 2137} {"train_loss": -39.174652099609375, "global_step": 258659, "epoch": 2137} {"train_loss": -40.12711715698242, "global_step": 258660, "epoch": 2137} {"train_loss": -37.82525634765625, "global_step": 258661, "epoch": 2137} {"train_loss": -37.94525146484375, "global_step": 258662, "epoch": 2137} {"train_loss": -40.442138671875, "global_step": 258663, "epoch": 2137} {"train_loss": -37.06486892700195, "global_step": 258664, "epoch": 2137} {"train_loss": -39.55381393432617, "global_step": 258665, "epoch": 2137} {"train_loss": -39.7349853515625, "global_step": 258666, "epoch": 2137} {"train_loss": -36.1843376159668, "global_step": 258667, "epoch": 2137} {"train_loss": -37.37641525268555, "global_step": 258668, "epoch": 2137} {"train_loss": -38.99039077758789, "global_step": 258669, "epoch": 2137} {"train_loss": -39.6463508605957, "global_step": 258670, "epoch": 2137} {"train_loss": -38.75593185424805, "global_step": 258671, "epoch": 2137} {"train_loss": -40.15370178222656, "global_step": 258672, "epoch": 2137} {"train_loss": -38.71598434448242, "global_step": 258673, "epoch": 2137} {"train_loss": -38.00102233886719, "global_step": 258674, "epoch": 2137} {"train_loss": -38.52594757080078, "global_step": 258675, "epoch": 2137} {"train_loss": -39.25639724731445, "global_step": 258676, "epoch": 2137} {"train_loss": -39.329254150390625, "global_step": 258677, "epoch": 2137} {"train_loss": -36.24959945678711, "global_step": 258678, "epoch": 2137} {"train_loss": -40.88115310668945, "global_step": 258679, "epoch": 2137} {"train_loss": -36.71602249145508, "global_step": 258680, "epoch": 2137} {"train_loss": -39.160247802734375, "global_step": 258681, "epoch": 2137} {"train_loss": -39.90324020385742, "global_step": 258682, "epoch": 2137} {"train_loss": -39.3375244140625, "global_step": 258683, "epoch": 2137} {"train_loss": -40.103485107421875, "global_step": 258684, "epoch": 2137} {"train_loss": -40.80930709838867, "global_step": 258685, "epoch": 2137} {"train_loss": -39.9570426940918, "global_step": 258686, "epoch": 2137} {"train_loss": -40.359954833984375, "global_step": 258687, "epoch": 2137} {"train_loss": -40.37052536010742, "global_step": 258688, "epoch": 2137} {"train_loss": -40.75979232788086, "global_step": 258689, "epoch": 2137} {"train_loss": -39.68885040283203, "global_step": 258690, "epoch": 2137} {"train_loss": -40.848243713378906, "global_step": 258691, "epoch": 2137} {"train_loss": -40.376121520996094, "global_step": 258692, "epoch": 2137} {"train_loss": -41.51531982421875, "global_step": 258693, "epoch": 2137} {"train_loss": -40.720088958740234, "global_step": 258694, "epoch": 2137} {"train_loss": -41.078521728515625, "global_step": 258695, "epoch": 2137} {"train_loss": -39.30481719970703, "global_step": 258696, "epoch": 2137} {"train_loss": -40.3110058682024, "global_step": 258697, "epoch": 2137, "val_loss": 2590104.0} {"train_loss": -40.776023864746094, "global_step": 258698, "epoch": 2138} {"train_loss": -41.35463333129883, "global_step": 258699, "epoch": 2138} {"train_loss": -40.81930923461914, "global_step": 258700, "epoch": 2138} {"train_loss": -40.98173141479492, "global_step": 258701, "epoch": 2138} {"train_loss": -41.53071212768555, "global_step": 258702, "epoch": 2138} {"train_loss": -40.74772262573242, "global_step": 258703, "epoch": 2138} {"train_loss": -40.939414978027344, "global_step": 258704, "epoch": 2138} {"train_loss": -40.93729019165039, "global_step": 258705, "epoch": 2138} {"train_loss": -40.42029571533203, "global_step": 258706, "epoch": 2138} {"train_loss": -41.27616500854492, "global_step": 258707, "epoch": 2138} {"train_loss": -41.46137619018555, "global_step": 258708, "epoch": 2138} {"train_loss": -41.51814651489258, "global_step": 258709, "epoch": 2138} {"train_loss": -41.801475524902344, "global_step": 258710, "epoch": 2138} {"train_loss": -41.45354080200195, "global_step": 258711, "epoch": 2138} {"train_loss": -41.50007247924805, "global_step": 258712, "epoch": 2138} {"train_loss": -40.5935173034668, "global_step": 258713, "epoch": 2138} {"train_loss": -40.47410202026367, "global_step": 258714, "epoch": 2138} {"train_loss": -41.37543869018555, "global_step": 258715, "epoch": 2138} {"train_loss": -41.828792572021484, "global_step": 258716, "epoch": 2138} {"train_loss": -41.96623611450195, "global_step": 258717, "epoch": 2138} {"train_loss": -40.84626007080078, "global_step": 258718, "epoch": 2138} {"train_loss": -41.885650634765625, "global_step": 258719, "epoch": 2138} {"train_loss": -41.8396110534668, "global_step": 258720, "epoch": 2138} {"train_loss": -42.09353256225586, "global_step": 258721, "epoch": 2138} {"train_loss": -38.908607482910156, "global_step": 258722, "epoch": 2138} {"train_loss": -41.56720733642578, "global_step": 258723, "epoch": 2138} {"train_loss": -40.57386016845703, "global_step": 258724, "epoch": 2138} {"train_loss": -41.212806701660156, "global_step": 258725, "epoch": 2138} {"train_loss": -41.55860137939453, "global_step": 258726, "epoch": 2138} {"train_loss": -41.904876708984375, "global_step": 258727, "epoch": 2138} {"train_loss": -41.81562042236328, "global_step": 258728, "epoch": 2138} {"train_loss": -42.08375549316406, "global_step": 258729, "epoch": 2138} {"train_loss": -41.40704345703125, "global_step": 258730, "epoch": 2138} {"train_loss": -42.04034423828125, "global_step": 258731, "epoch": 2138} {"train_loss": -40.97317123413086, "global_step": 258732, "epoch": 2138} {"train_loss": -41.82510757446289, "global_step": 258733, "epoch": 2138} {"train_loss": -42.10586929321289, "global_step": 258734, "epoch": 2138} {"train_loss": -42.07267379760742, "global_step": 258735, "epoch": 2138} {"train_loss": -41.0916862487793, "global_step": 258736, "epoch": 2138} {"train_loss": -41.02482223510742, "global_step": 258737, "epoch": 2138} {"train_loss": -41.879695892333984, "global_step": 258738, "epoch": 2138} {"train_loss": -40.942535400390625, "global_step": 258739, "epoch": 2138} {"train_loss": -41.255340576171875, "global_step": 258740, "epoch": 2138} {"train_loss": -41.69977569580078, "global_step": 258741, "epoch": 2138} {"train_loss": -42.16122055053711, "global_step": 258742, "epoch": 2138} {"train_loss": -41.92280960083008, "global_step": 258743, "epoch": 2138} {"train_loss": -41.75803756713867, "global_step": 258744, "epoch": 2138} {"train_loss": -41.93024826049805, "global_step": 258745, "epoch": 2138} {"train_loss": -41.7796516418457, "global_step": 258746, "epoch": 2138} {"train_loss": -40.71383285522461, "global_step": 258747, "epoch": 2138} {"train_loss": -41.983272552490234, "global_step": 258748, "epoch": 2138} {"train_loss": -41.59367370605469, "global_step": 258749, "epoch": 2138} {"train_loss": -42.2872314453125, "global_step": 258750, "epoch": 2138} {"train_loss": -41.98261260986328, "global_step": 258751, "epoch": 2138} {"train_loss": -41.28901672363281, "global_step": 258752, "epoch": 2138} {"train_loss": -42.26852035522461, "global_step": 258753, "epoch": 2138} {"train_loss": -40.9338493347168, "global_step": 258754, "epoch": 2138} {"train_loss": -42.267730712890625, "global_step": 258755, "epoch": 2138} {"train_loss": -42.47005081176758, "global_step": 258756, "epoch": 2138} {"train_loss": -40.96821212768555, "global_step": 258757, "epoch": 2138} {"train_loss": -42.45530700683594, "global_step": 258758, "epoch": 2138} {"train_loss": -41.93195724487305, "global_step": 258759, "epoch": 2138} {"train_loss": -42.04072189331055, "global_step": 258760, "epoch": 2138} {"train_loss": -42.39479446411133, "global_step": 258761, "epoch": 2138} {"train_loss": -42.08734130859375, "global_step": 258762, "epoch": 2138} {"train_loss": -41.49717330932617, "global_step": 258763, "epoch": 2138} {"train_loss": -41.802486419677734, "global_step": 258764, "epoch": 2138} {"train_loss": -42.45295333862305, "global_step": 258765, "epoch": 2138} {"train_loss": -41.42986297607422, "global_step": 258766, "epoch": 2138} {"train_loss": -42.384918212890625, "global_step": 258767, "epoch": 2138} {"train_loss": -41.779296875, "global_step": 258768, "epoch": 2138} {"train_loss": -41.974422454833984, "global_step": 258769, "epoch": 2138} {"train_loss": -41.94553756713867, "global_step": 258770, "epoch": 2138} {"train_loss": -42.8505973815918, "global_step": 258771, "epoch": 2138} {"train_loss": -42.149959564208984, "global_step": 258772, "epoch": 2138} {"train_loss": -37.94492721557617, "global_step": 258773, "epoch": 2138} {"train_loss": -42.39932632446289, "global_step": 258774, "epoch": 2138} {"train_loss": -41.929317474365234, "global_step": 258775, "epoch": 2138} {"train_loss": -41.71223068237305, "global_step": 258776, "epoch": 2138} {"train_loss": -38.946929931640625, "global_step": 258777, "epoch": 2138} {"train_loss": -40.36085891723633, "global_step": 258778, "epoch": 2138} {"train_loss": -39.16792678833008, "global_step": 258779, "epoch": 2138} {"train_loss": -38.83340835571289, "global_step": 258780, "epoch": 2138} {"train_loss": -41.5661506652832, "global_step": 258781, "epoch": 2138} {"train_loss": -38.98090362548828, "global_step": 258782, "epoch": 2138} {"train_loss": -40.04061508178711, "global_step": 258783, "epoch": 2138} {"train_loss": -39.38966751098633, "global_step": 258784, "epoch": 2138} {"train_loss": -40.83769607543945, "global_step": 258785, "epoch": 2138} {"train_loss": -40.15975570678711, "global_step": 258786, "epoch": 2138} {"train_loss": -37.24250411987305, "global_step": 258787, "epoch": 2138} {"train_loss": -41.874847412109375, "global_step": 258788, "epoch": 2138} {"train_loss": -41.37611770629883, "global_step": 258789, "epoch": 2138} {"train_loss": -40.729347229003906, "global_step": 258790, "epoch": 2138} {"train_loss": -40.56885528564453, "global_step": 258791, "epoch": 2138} {"train_loss": -40.62642288208008, "global_step": 258792, "epoch": 2138} {"train_loss": -40.1878662109375, "global_step": 258793, "epoch": 2138} {"train_loss": -40.42365264892578, "global_step": 258794, "epoch": 2138} {"train_loss": -41.22926330566406, "global_step": 258795, "epoch": 2138} {"train_loss": -40.65161895751953, "global_step": 258796, "epoch": 2138} {"train_loss": -40.75187301635742, "global_step": 258797, "epoch": 2138} {"train_loss": -39.968475341796875, "global_step": 258798, "epoch": 2138} {"train_loss": -39.52620315551758, "global_step": 258799, "epoch": 2138} {"train_loss": -39.686378479003906, "global_step": 258800, "epoch": 2138} {"train_loss": -40.18975830078125, "global_step": 258801, "epoch": 2138} {"train_loss": -40.59992599487305, "global_step": 258802, "epoch": 2138} {"train_loss": -40.855796813964844, "global_step": 258803, "epoch": 2138} {"train_loss": -41.83356857299805, "global_step": 258804, "epoch": 2138} {"train_loss": -39.96509552001953, "global_step": 258805, "epoch": 2138} {"train_loss": -40.90105056762695, "global_step": 258806, "epoch": 2138} {"train_loss": -41.783538818359375, "global_step": 258807, "epoch": 2138} {"train_loss": -39.8682861328125, "global_step": 258808, "epoch": 2138} {"train_loss": -40.74921798706055, "global_step": 258809, "epoch": 2138} {"train_loss": -39.22998809814453, "global_step": 258810, "epoch": 2138} {"train_loss": -41.34474563598633, "global_step": 258811, "epoch": 2138} {"train_loss": -40.97972869873047, "global_step": 258812, "epoch": 2138} {"train_loss": -41.470184326171875, "global_step": 258813, "epoch": 2138} {"train_loss": -41.31231689453125, "global_step": 258814, "epoch": 2138} {"train_loss": -41.625404357910156, "global_step": 258815, "epoch": 2138} {"train_loss": -36.92702102661133, "global_step": 258816, "epoch": 2138} {"train_loss": -41.11373519897461, "global_step": 258817, "epoch": 2138} {"train_loss": -41.136625494838746, "global_step": 258818, "epoch": 2138, "val_loss": 2603065.5} {"train_loss": -41.582759857177734, "global_step": 258819, "epoch": 2139} {"train_loss": -41.168861389160156, "global_step": 258820, "epoch": 2139} {"train_loss": -41.00871658325195, "global_step": 258821, "epoch": 2139} {"train_loss": -41.97248458862305, "global_step": 258822, "epoch": 2139} {"train_loss": -41.43730545043945, "global_step": 258823, "epoch": 2139} {"train_loss": -40.965003967285156, "global_step": 258824, "epoch": 2139} {"train_loss": -41.525054931640625, "global_step": 258825, "epoch": 2139} {"train_loss": -41.7989387512207, "global_step": 258826, "epoch": 2139} {"train_loss": -42.217811584472656, "global_step": 258827, "epoch": 2139} {"train_loss": -41.83854293823242, "global_step": 258828, "epoch": 2139} {"train_loss": -41.309967041015625, "global_step": 258829, "epoch": 2139} {"train_loss": -41.849151611328125, "global_step": 258830, "epoch": 2139} {"train_loss": -41.46684646606445, "global_step": 258831, "epoch": 2139} {"train_loss": -42.11631393432617, "global_step": 258832, "epoch": 2139} {"train_loss": -40.98445510864258, "global_step": 258833, "epoch": 2139} {"train_loss": -42.198978424072266, "global_step": 258834, "epoch": 2139} {"train_loss": -41.471099853515625, "global_step": 258835, "epoch": 2139} {"train_loss": -41.23623275756836, "global_step": 258836, "epoch": 2139} {"train_loss": -41.47303009033203, "global_step": 258837, "epoch": 2139} {"train_loss": -41.30647659301758, "global_step": 258838, "epoch": 2139} {"train_loss": -41.1017951965332, "global_step": 258839, "epoch": 2139} {"train_loss": -41.9265022277832, "global_step": 258840, "epoch": 2139} {"train_loss": -41.022274017333984, "global_step": 258841, "epoch": 2139} {"train_loss": -42.190181732177734, "global_step": 258842, "epoch": 2139} {"train_loss": -42.228641510009766, "global_step": 258843, "epoch": 2139} {"train_loss": -41.49309158325195, "global_step": 258844, "epoch": 2139} {"train_loss": -39.23125457763672, "global_step": 258845, "epoch": 2139} {"train_loss": -39.283756256103516, "global_step": 258846, "epoch": 2139} {"train_loss": -42.268646240234375, "global_step": 258847, "epoch": 2139} {"train_loss": -39.8223876953125, "global_step": 258848, "epoch": 2139} {"train_loss": -37.48737335205078, "global_step": 258849, "epoch": 2139} {"train_loss": -40.5012321472168, "global_step": 258850, "epoch": 2139} {"train_loss": -40.99421691894531, "global_step": 258851, "epoch": 2139} {"train_loss": -38.1376953125, "global_step": 258852, "epoch": 2139} {"train_loss": -41.35968780517578, "global_step": 258853, "epoch": 2139} {"train_loss": -39.93707275390625, "global_step": 258854, "epoch": 2139} {"train_loss": -39.1799430847168, "global_step": 258855, "epoch": 2139} {"train_loss": -39.888832092285156, "global_step": 258856, "epoch": 2139} {"train_loss": -38.44601058959961, "global_step": 258857, "epoch": 2139} {"train_loss": -40.563232421875, "global_step": 258858, "epoch": 2139} {"train_loss": -40.53567123413086, "global_step": 258859, "epoch": 2139} {"train_loss": -40.18046951293945, "global_step": 258860, "epoch": 2139} {"train_loss": -40.520904541015625, "global_step": 258861, "epoch": 2139} {"train_loss": -40.45225524902344, "global_step": 258862, "epoch": 2139} {"train_loss": -41.24753952026367, "global_step": 258863, "epoch": 2139} {"train_loss": -40.66924285888672, "global_step": 258864, "epoch": 2139} {"train_loss": -41.12801742553711, "global_step": 258865, "epoch": 2139} {"train_loss": -40.454776763916016, "global_step": 258866, "epoch": 2139} {"train_loss": -41.08358383178711, "global_step": 258867, "epoch": 2139} {"train_loss": -41.07862091064453, "global_step": 258868, "epoch": 2139} {"train_loss": -41.17085647583008, "global_step": 258869, "epoch": 2139} {"train_loss": -41.7834587097168, "global_step": 258870, "epoch": 2139} {"train_loss": -37.9471549987793, "global_step": 258871, "epoch": 2139} {"train_loss": -40.87075424194336, "global_step": 258872, "epoch": 2139} {"train_loss": -41.29825973510742, "global_step": 258873, "epoch": 2139} {"train_loss": -41.3209114074707, "global_step": 258874, "epoch": 2139} {"train_loss": -41.84794235229492, "global_step": 258875, "epoch": 2139} {"train_loss": -39.92531967163086, "global_step": 258876, "epoch": 2139} {"train_loss": -41.6789665222168, "global_step": 258877, "epoch": 2139} {"train_loss": -41.371891021728516, "global_step": 258878, "epoch": 2139} {"train_loss": -41.05863952636719, "global_step": 258879, "epoch": 2139} {"train_loss": -42.406124114990234, "global_step": 258880, "epoch": 2139} {"train_loss": -41.108394622802734, "global_step": 258881, "epoch": 2139} {"train_loss": -42.525726318359375, "global_step": 258882, "epoch": 2139} {"train_loss": -41.332305908203125, "global_step": 258883, "epoch": 2139} {"train_loss": -42.408164978027344, "global_step": 258884, "epoch": 2139} {"train_loss": -42.09520721435547, "global_step": 258885, "epoch": 2139} {"train_loss": -41.90279006958008, "global_step": 258886, "epoch": 2139} {"train_loss": -41.13216018676758, "global_step": 258887, "epoch": 2139} {"train_loss": -42.235416412353516, "global_step": 258888, "epoch": 2139} {"train_loss": -41.928585052490234, "global_step": 258889, "epoch": 2139} {"train_loss": -41.0223274230957, "global_step": 258890, "epoch": 2139} {"train_loss": -42.37302017211914, "global_step": 258891, "epoch": 2139} {"train_loss": -42.0160026550293, "global_step": 258892, "epoch": 2139} {"train_loss": -42.50948715209961, "global_step": 258893, "epoch": 2139} {"train_loss": -42.57432174682617, "global_step": 258894, "epoch": 2139} {"train_loss": -42.78651809692383, "global_step": 258895, "epoch": 2139} {"train_loss": -42.07381820678711, "global_step": 258896, "epoch": 2139} {"train_loss": -42.64854049682617, "global_step": 258897, "epoch": 2139} {"train_loss": -42.561546325683594, "global_step": 258898, "epoch": 2139} {"train_loss": -43.15348815917969, "global_step": 258899, "epoch": 2139} {"train_loss": -42.593658447265625, "global_step": 258900, "epoch": 2139} {"train_loss": -41.89191436767578, "global_step": 258901, "epoch": 2139} {"train_loss": -42.24538040161133, "global_step": 258902, "epoch": 2139} {"train_loss": -42.44350814819336, "global_step": 258903, "epoch": 2139} {"train_loss": -42.581485748291016, "global_step": 258904, "epoch": 2139} {"train_loss": -42.980079650878906, "global_step": 258905, "epoch": 2139} {"train_loss": -42.3847541809082, "global_step": 258906, "epoch": 2139} {"train_loss": -42.56110382080078, "global_step": 258907, "epoch": 2139} {"train_loss": -42.673858642578125, "global_step": 258908, "epoch": 2139} {"train_loss": -43.04317092895508, "global_step": 258909, "epoch": 2139} {"train_loss": -42.631309509277344, "global_step": 258910, "epoch": 2139} {"train_loss": -43.160396575927734, "global_step": 258911, "epoch": 2139} {"train_loss": -42.60236740112305, "global_step": 258912, "epoch": 2139} {"train_loss": -42.27230453491211, "global_step": 258913, "epoch": 2139} {"train_loss": -43.21034622192383, "global_step": 258914, "epoch": 2139} {"train_loss": -43.09052658081055, "global_step": 258915, "epoch": 2139} {"train_loss": -42.53602981567383, "global_step": 258916, "epoch": 2139} {"train_loss": -42.651153564453125, "global_step": 258917, "epoch": 2139} {"train_loss": -42.586761474609375, "global_step": 258918, "epoch": 2139} {"train_loss": -42.14963912963867, "global_step": 258919, "epoch": 2139} {"train_loss": -42.523048400878906, "global_step": 258920, "epoch": 2139} {"train_loss": -43.115238189697266, "global_step": 258921, "epoch": 2139} {"train_loss": -42.663482666015625, "global_step": 258922, "epoch": 2139} {"train_loss": -42.10302734375, "global_step": 258923, "epoch": 2139} {"train_loss": -41.79692840576172, "global_step": 258924, "epoch": 2139} {"train_loss": -42.61233901977539, "global_step": 258925, "epoch": 2139} {"train_loss": -43.41714096069336, "global_step": 258926, "epoch": 2139} {"train_loss": -42.8616828918457, "global_step": 258927, "epoch": 2139} {"train_loss": -42.447364807128906, "global_step": 258928, "epoch": 2139} {"train_loss": -43.24457550048828, "global_step": 258929, "epoch": 2139} {"train_loss": -42.722862243652344, "global_step": 258930, "epoch": 2139} {"train_loss": -43.380496978759766, "global_step": 258931, "epoch": 2139} {"train_loss": -42.97300720214844, "global_step": 258932, "epoch": 2139} {"train_loss": -43.051849365234375, "global_step": 258933, "epoch": 2139} {"train_loss": -42.28242111206055, "global_step": 258934, "epoch": 2139} {"train_loss": -42.51189422607422, "global_step": 258935, "epoch": 2139} {"train_loss": -43.08164596557617, "global_step": 258936, "epoch": 2139} {"train_loss": -42.55176544189453, "global_step": 258937, "epoch": 2139} {"train_loss": -43.0755729675293, "global_step": 258938, "epoch": 2139} {"train_loss": -41.70441231845824, "global_step": 258939, "epoch": 2139, "val_loss": 2814057.75} {"train_loss": -41.79480743408203, "global_step": 258940, "epoch": 2140} {"train_loss": -42.13254928588867, "global_step": 258941, "epoch": 2140} {"train_loss": -41.95762634277344, "global_step": 258942, "epoch": 2140} {"train_loss": -42.5401725769043, "global_step": 258943, "epoch": 2140} {"train_loss": -42.940589904785156, "global_step": 258944, "epoch": 2140} {"train_loss": -43.07338333129883, "global_step": 258945, "epoch": 2140} {"train_loss": -43.140113830566406, "global_step": 258946, "epoch": 2140} {"train_loss": -43.20820999145508, "global_step": 258947, "epoch": 2140} {"train_loss": -42.89215850830078, "global_step": 258948, "epoch": 2140} {"train_loss": -40.795772552490234, "global_step": 258949, "epoch": 2140} {"train_loss": -42.7048454284668, "global_step": 258950, "epoch": 2140} {"train_loss": -43.216121673583984, "global_step": 258951, "epoch": 2140} {"train_loss": -43.25407028198242, "global_step": 258952, "epoch": 2140} {"train_loss": -42.8631706237793, "global_step": 258953, "epoch": 2140} {"train_loss": -42.91901779174805, "global_step": 258954, "epoch": 2140} {"train_loss": -43.016448974609375, "global_step": 258955, "epoch": 2140} {"train_loss": -43.2891960144043, "global_step": 258956, "epoch": 2140} {"train_loss": -42.72998809814453, "global_step": 258957, "epoch": 2140} {"train_loss": -43.26041793823242, "global_step": 258958, "epoch": 2140} {"train_loss": -42.23299026489258, "global_step": 258959, "epoch": 2140} {"train_loss": -42.03675079345703, "global_step": 258960, "epoch": 2140} {"train_loss": -41.95809555053711, "global_step": 258961, "epoch": 2140} {"train_loss": -43.30448532104492, "global_step": 258962, "epoch": 2140} {"train_loss": -42.777095794677734, "global_step": 258963, "epoch": 2140} {"train_loss": -42.463985443115234, "global_step": 258964, "epoch": 2140} {"train_loss": -42.574440002441406, "global_step": 258965, "epoch": 2140} {"train_loss": -41.78456115722656, "global_step": 258966, "epoch": 2140} {"train_loss": -42.664066314697266, "global_step": 258967, "epoch": 2140} {"train_loss": -42.48136901855469, "global_step": 258968, "epoch": 2140} {"train_loss": -43.374202728271484, "global_step": 258969, "epoch": 2140} {"train_loss": -42.373046875, "global_step": 258970, "epoch": 2140} {"train_loss": -42.3425407409668, "global_step": 258971, "epoch": 2140} {"train_loss": -43.03071594238281, "global_step": 258972, "epoch": 2140} {"train_loss": -42.491966247558594, "global_step": 258973, "epoch": 2140} {"train_loss": -42.44481658935547, "global_step": 258974, "epoch": 2140} {"train_loss": -42.636199951171875, "global_step": 258975, "epoch": 2140} {"train_loss": -42.44751739501953, "global_step": 258976, "epoch": 2140} {"train_loss": -43.18830490112305, "global_step": 258977, "epoch": 2140} {"train_loss": -42.15149688720703, "global_step": 258978, "epoch": 2140} {"train_loss": -43.293495178222656, "global_step": 258979, "epoch": 2140} {"train_loss": -41.945762634277344, "global_step": 258980, "epoch": 2140} {"train_loss": -40.944576263427734, "global_step": 258981, "epoch": 2140} {"train_loss": -42.21419143676758, "global_step": 258982, "epoch": 2140} {"train_loss": -42.29302978515625, "global_step": 258983, "epoch": 2140} {"train_loss": -41.16250991821289, "global_step": 258984, "epoch": 2140} {"train_loss": -40.5905876159668, "global_step": 258985, "epoch": 2140} {"train_loss": -39.621280670166016, "global_step": 258986, "epoch": 2140} {"train_loss": -35.36003494262695, "global_step": 258987, "epoch": 2140} {"train_loss": -32.18791580200195, "global_step": 258988, "epoch": 2140} {"train_loss": -34.67354202270508, "global_step": 258989, "epoch": 2140} {"train_loss": -39.69635009765625, "global_step": 258990, "epoch": 2140} {"train_loss": -41.129310607910156, "global_step": 258991, "epoch": 2140} {"train_loss": -38.91506576538086, "global_step": 258992, "epoch": 2140} {"train_loss": -41.31499099731445, "global_step": 258993, "epoch": 2140} {"train_loss": -41.75973129272461, "global_step": 258994, "epoch": 2140} {"train_loss": -39.47860336303711, "global_step": 258995, "epoch": 2140} {"train_loss": -40.650054931640625, "global_step": 258996, "epoch": 2140} {"train_loss": -41.58269119262695, "global_step": 258997, "epoch": 2140} {"train_loss": -38.31360626220703, "global_step": 258998, "epoch": 2140} {"train_loss": -41.4731330871582, "global_step": 258999, "epoch": 2140} {"train_loss": -40.98708724975586, "global_step": 259000, "epoch": 2140} {"train_loss": -40.91779327392578, "global_step": 259001, "epoch": 2140} {"train_loss": -41.64243698120117, "global_step": 259002, "epoch": 2140} {"train_loss": -41.41068649291992, "global_step": 259003, "epoch": 2140} {"train_loss": -41.844703674316406, "global_step": 259004, "epoch": 2140} {"train_loss": -41.21214294433594, "global_step": 259005, "epoch": 2140} {"train_loss": -41.9332160949707, "global_step": 259006, "epoch": 2140} {"train_loss": -42.2193489074707, "global_step": 259007, "epoch": 2140} {"train_loss": -42.537811279296875, "global_step": 259008, "epoch": 2140} {"train_loss": -42.4093017578125, "global_step": 259009, "epoch": 2140} {"train_loss": -42.48554229736328, "global_step": 259010, "epoch": 2140} {"train_loss": -42.420284271240234, "global_step": 259011, "epoch": 2140} {"train_loss": -42.375850677490234, "global_step": 259012, "epoch": 2140} {"train_loss": -42.69211959838867, "global_step": 259013, "epoch": 2140} {"train_loss": -42.90911865234375, "global_step": 259014, "epoch": 2140} {"train_loss": -42.20095443725586, "global_step": 259015, "epoch": 2140} {"train_loss": -42.78276443481445, "global_step": 259016, "epoch": 2140} {"train_loss": -43.0313835144043, "global_step": 259017, "epoch": 2140} {"train_loss": -42.800872802734375, "global_step": 259018, "epoch": 2140} {"train_loss": -42.94694900512695, "global_step": 259019, "epoch": 2140} {"train_loss": -42.39351272583008, "global_step": 259020, "epoch": 2140} {"train_loss": -43.1885986328125, "global_step": 259021, "epoch": 2140} {"train_loss": -42.83137512207031, "global_step": 259022, "epoch": 2140} {"train_loss": -42.83283996582031, "global_step": 259023, "epoch": 2140} {"train_loss": -42.462562561035156, "global_step": 259024, "epoch": 2140} {"train_loss": -42.8365364074707, "global_step": 259025, "epoch": 2140} {"train_loss": -42.796875, "global_step": 259026, "epoch": 2140} {"train_loss": -43.043331146240234, "global_step": 259027, "epoch": 2140} {"train_loss": -42.83793258666992, "global_step": 259028, "epoch": 2140} {"train_loss": -43.19575119018555, "global_step": 259029, "epoch": 2140} {"train_loss": -43.027896881103516, "global_step": 259030, "epoch": 2140} {"train_loss": -42.311973571777344, "global_step": 259031, "epoch": 2140} {"train_loss": -42.4585075378418, "global_step": 259032, "epoch": 2140} {"train_loss": -42.43329620361328, "global_step": 259033, "epoch": 2140} {"train_loss": -42.78496170043945, "global_step": 259034, "epoch": 2140} {"train_loss": -41.58427047729492, "global_step": 259035, "epoch": 2140} {"train_loss": -42.13261032104492, "global_step": 259036, "epoch": 2140} {"train_loss": -43.24567794799805, "global_step": 259037, "epoch": 2140} {"train_loss": -42.1207389831543, "global_step": 259038, "epoch": 2140} {"train_loss": -41.59706115722656, "global_step": 259039, "epoch": 2140} {"train_loss": -43.17060089111328, "global_step": 259040, "epoch": 2140} {"train_loss": -42.19913864135742, "global_step": 259041, "epoch": 2140} {"train_loss": -41.957435607910156, "global_step": 259042, "epoch": 2140} {"train_loss": -42.781124114990234, "global_step": 259043, "epoch": 2140} {"train_loss": -43.08626937866211, "global_step": 259044, "epoch": 2140} {"train_loss": -42.238338470458984, "global_step": 259045, "epoch": 2140} {"train_loss": -41.70149612426758, "global_step": 259046, "epoch": 2140} {"train_loss": -43.19947052001953, "global_step": 259047, "epoch": 2140} {"train_loss": -42.28770065307617, "global_step": 259048, "epoch": 2140} {"train_loss": -42.17403793334961, "global_step": 259049, "epoch": 2140} {"train_loss": -42.77738571166992, "global_step": 259050, "epoch": 2140} {"train_loss": -42.42461395263672, "global_step": 259051, "epoch": 2140} {"train_loss": -42.189613342285156, "global_step": 259052, "epoch": 2140} {"train_loss": -43.04368591308594, "global_step": 259053, "epoch": 2140} {"train_loss": -42.39207077026367, "global_step": 259054, "epoch": 2140} {"train_loss": -41.9656867980957, "global_step": 259055, "epoch": 2140} {"train_loss": -42.7321662902832, "global_step": 259056, "epoch": 2140} {"train_loss": -41.938232421875, "global_step": 259057, "epoch": 2140} {"train_loss": -40.50855255126953, "global_step": 259058, "epoch": 2140} {"train_loss": -42.12689208984375, "global_step": 259059, "epoch": 2140} {"train_loss": -42.02605993097479, "global_step": 259060, "epoch": 2140, "val_loss": 2748904.75} {"train_loss": -41.64863967895508, "global_step": 259061, "epoch": 2141} {"train_loss": -40.661006927490234, "global_step": 259062, "epoch": 2141} {"train_loss": -41.99502182006836, "global_step": 259063, "epoch": 2141} {"train_loss": -42.12671661376953, "global_step": 259064, "epoch": 2141} {"train_loss": -41.70638656616211, "global_step": 259065, "epoch": 2141} {"train_loss": -41.84395217895508, "global_step": 259066, "epoch": 2141} {"train_loss": -41.782630920410156, "global_step": 259067, "epoch": 2141} {"train_loss": -42.6308708190918, "global_step": 259068, "epoch": 2141} {"train_loss": -41.49063491821289, "global_step": 259069, "epoch": 2141} {"train_loss": -40.54108428955078, "global_step": 259070, "epoch": 2141} {"train_loss": -41.9798469543457, "global_step": 259071, "epoch": 2141} {"train_loss": -41.7299919128418, "global_step": 259072, "epoch": 2141} {"train_loss": -41.19652557373047, "global_step": 259073, "epoch": 2141} {"train_loss": -41.169288635253906, "global_step": 259074, "epoch": 2141} {"train_loss": -42.04143142700195, "global_step": 259075, "epoch": 2141} {"train_loss": -41.285335540771484, "global_step": 259076, "epoch": 2141} {"train_loss": -42.61968994140625, "global_step": 259077, "epoch": 2141} {"train_loss": -42.65106201171875, "global_step": 259078, "epoch": 2141} {"train_loss": -42.40614700317383, "global_step": 259079, "epoch": 2141} {"train_loss": -42.69184112548828, "global_step": 259080, "epoch": 2141} {"train_loss": -42.93317413330078, "global_step": 259081, "epoch": 2141} {"train_loss": -42.894439697265625, "global_step": 259082, "epoch": 2141} {"train_loss": -42.94148635864258, "global_step": 259083, "epoch": 2141} {"train_loss": -42.5850944519043, "global_step": 259084, "epoch": 2141} {"train_loss": -42.33846664428711, "global_step": 259085, "epoch": 2141} {"train_loss": -42.49578857421875, "global_step": 259086, "epoch": 2141} {"train_loss": -43.32328414916992, "global_step": 259087, "epoch": 2141} {"train_loss": -42.527408599853516, "global_step": 259088, "epoch": 2141} {"train_loss": -42.31876754760742, "global_step": 259089, "epoch": 2141} {"train_loss": -43.24714279174805, "global_step": 259090, "epoch": 2141} {"train_loss": -42.38187789916992, "global_step": 259091, "epoch": 2141} {"train_loss": -42.526893615722656, "global_step": 259092, "epoch": 2141} {"train_loss": -43.137451171875, "global_step": 259093, "epoch": 2141} {"train_loss": -42.16286849975586, "global_step": 259094, "epoch": 2141} {"train_loss": -43.594024658203125, "global_step": 259095, "epoch": 2141} {"train_loss": -43.37722396850586, "global_step": 259096, "epoch": 2141} {"train_loss": -43.51577377319336, "global_step": 259097, "epoch": 2141} {"train_loss": -42.60219955444336, "global_step": 259098, "epoch": 2141} {"train_loss": -42.84690475463867, "global_step": 259099, "epoch": 2141} {"train_loss": -43.43282699584961, "global_step": 259100, "epoch": 2141} {"train_loss": -42.63444900512695, "global_step": 259101, "epoch": 2141} {"train_loss": -42.53104782104492, "global_step": 259102, "epoch": 2141} {"train_loss": -42.564735412597656, "global_step": 259103, "epoch": 2141} {"train_loss": -42.8442268371582, "global_step": 259104, "epoch": 2141} {"train_loss": -42.694801330566406, "global_step": 259105, "epoch": 2141} {"train_loss": -42.323631286621094, "global_step": 259106, "epoch": 2141} {"train_loss": -42.75222396850586, "global_step": 259107, "epoch": 2141} {"train_loss": -42.99771499633789, "global_step": 259108, "epoch": 2141} {"train_loss": -42.372718811035156, "global_step": 259109, "epoch": 2141} {"train_loss": -41.726497650146484, "global_step": 259110, "epoch": 2141} {"train_loss": -41.84418869018555, "global_step": 259111, "epoch": 2141} {"train_loss": -43.14616012573242, "global_step": 259112, "epoch": 2141} {"train_loss": -41.566837310791016, "global_step": 259113, "epoch": 2141} {"train_loss": -41.3403434753418, "global_step": 259114, "epoch": 2141} {"train_loss": -42.009456634521484, "global_step": 259115, "epoch": 2141} {"train_loss": -41.81389617919922, "global_step": 259116, "epoch": 2141} {"train_loss": -41.52202224731445, "global_step": 259117, "epoch": 2141} {"train_loss": -41.73804473876953, "global_step": 259118, "epoch": 2141} {"train_loss": -41.41779708862305, "global_step": 259119, "epoch": 2141} {"train_loss": -42.248897552490234, "global_step": 259120, "epoch": 2141} {"train_loss": -42.464412689208984, "global_step": 259121, "epoch": 2141} {"train_loss": -40.22113037109375, "global_step": 259122, "epoch": 2141} {"train_loss": -40.5866584777832, "global_step": 259123, "epoch": 2141} {"train_loss": -41.918556213378906, "global_step": 259124, "epoch": 2141} {"train_loss": -40.71511459350586, "global_step": 259125, "epoch": 2141} {"train_loss": -41.712154388427734, "global_step": 259126, "epoch": 2141} {"train_loss": -41.71303939819336, "global_step": 259127, "epoch": 2141} {"train_loss": -42.26516342163086, "global_step": 259128, "epoch": 2141} {"train_loss": -41.57920455932617, "global_step": 259129, "epoch": 2141} {"train_loss": -41.85512924194336, "global_step": 259130, "epoch": 2141} {"train_loss": -41.9567756652832, "global_step": 259131, "epoch": 2141} {"train_loss": -42.50571823120117, "global_step": 259132, "epoch": 2141} {"train_loss": -41.5054931640625, "global_step": 259133, "epoch": 2141} {"train_loss": -42.181819915771484, "global_step": 259134, "epoch": 2141} {"train_loss": -42.66694259643555, "global_step": 259135, "epoch": 2141} {"train_loss": -41.879486083984375, "global_step": 259136, "epoch": 2141} {"train_loss": -42.4686393737793, "global_step": 259137, "epoch": 2141} {"train_loss": -42.083980560302734, "global_step": 259138, "epoch": 2141} {"train_loss": -42.19191360473633, "global_step": 259139, "epoch": 2141} {"train_loss": -42.667823791503906, "global_step": 259140, "epoch": 2141} {"train_loss": -41.230831146240234, "global_step": 259141, "epoch": 2141} {"train_loss": -41.94730758666992, "global_step": 259142, "epoch": 2141} {"train_loss": -41.67155075073242, "global_step": 259143, "epoch": 2141} {"train_loss": -41.65934371948242, "global_step": 259144, "epoch": 2141} {"train_loss": -43.012657165527344, "global_step": 259145, "epoch": 2141} {"train_loss": -42.883113861083984, "global_step": 259146, "epoch": 2141} {"train_loss": -42.83461380004883, "global_step": 259147, "epoch": 2141} {"train_loss": -42.84498596191406, "global_step": 259148, "epoch": 2141} {"train_loss": -42.23794174194336, "global_step": 259149, "epoch": 2141} {"train_loss": -42.80078125, "global_step": 259150, "epoch": 2141} {"train_loss": -42.84431076049805, "global_step": 259151, "epoch": 2141} {"train_loss": -42.237548828125, "global_step": 259152, "epoch": 2141} {"train_loss": -42.58498001098633, "global_step": 259153, "epoch": 2141} {"train_loss": -41.87066650390625, "global_step": 259154, "epoch": 2141} {"train_loss": -42.21916198730469, "global_step": 259155, "epoch": 2141} {"train_loss": -42.675743103027344, "global_step": 259156, "epoch": 2141} {"train_loss": -42.37055587768555, "global_step": 259157, "epoch": 2141} {"train_loss": -42.72346496582031, "global_step": 259158, "epoch": 2141} {"train_loss": -42.039302825927734, "global_step": 259159, "epoch": 2141} {"train_loss": -43.03321838378906, "global_step": 259160, "epoch": 2141} {"train_loss": -42.9833984375, "global_step": 259161, "epoch": 2141} {"train_loss": -42.42021560668945, "global_step": 259162, "epoch": 2141} {"train_loss": -43.25951385498047, "global_step": 259163, "epoch": 2141} {"train_loss": -43.00288009643555, "global_step": 259164, "epoch": 2141} {"train_loss": -43.6714973449707, "global_step": 259165, "epoch": 2141} {"train_loss": -42.869178771972656, "global_step": 259166, "epoch": 2141} {"train_loss": -43.673980712890625, "global_step": 259167, "epoch": 2141} {"train_loss": -43.30204391479492, "global_step": 259168, "epoch": 2141} {"train_loss": -43.43441390991211, "global_step": 259169, "epoch": 2141} {"train_loss": -43.25578308105469, "global_step": 259170, "epoch": 2141} {"train_loss": -43.526161193847656, "global_step": 259171, "epoch": 2141} {"train_loss": -43.381866455078125, "global_step": 259172, "epoch": 2141} {"train_loss": -43.43830108642578, "global_step": 259173, "epoch": 2141} {"train_loss": -43.304988861083984, "global_step": 259174, "epoch": 2141} {"train_loss": -43.536964416503906, "global_step": 259175, "epoch": 2141} {"train_loss": -42.636775970458984, "global_step": 259176, "epoch": 2141} {"train_loss": -43.33219528198242, "global_step": 259177, "epoch": 2141} {"train_loss": -42.272579193115234, "global_step": 259178, "epoch": 2141} {"train_loss": -42.604942321777344, "global_step": 259179, "epoch": 2141} {"train_loss": -42.593971252441406, "global_step": 259180, "epoch": 2141} {"train_loss": -42.37318700995327, "global_step": 259181, "epoch": 2141, "val_loss": 2682301.25} {"train_loss": -43.2253532409668, "global_step": 259182, "epoch": 2142} {"train_loss": -43.48981475830078, "global_step": 259183, "epoch": 2142} {"train_loss": -43.13140869140625, "global_step": 259184, "epoch": 2142} {"train_loss": -42.91056442260742, "global_step": 259185, "epoch": 2142} {"train_loss": -42.26023483276367, "global_step": 259186, "epoch": 2142} {"train_loss": -41.837039947509766, "global_step": 259187, "epoch": 2142} {"train_loss": -41.87491989135742, "global_step": 259188, "epoch": 2142} {"train_loss": -42.86167907714844, "global_step": 259189, "epoch": 2142} {"train_loss": -41.05545425415039, "global_step": 259190, "epoch": 2142} {"train_loss": -39.340118408203125, "global_step": 259191, "epoch": 2142} {"train_loss": -38.50563430786133, "global_step": 259192, "epoch": 2142} {"train_loss": -39.911495208740234, "global_step": 259193, "epoch": 2142} {"train_loss": -42.59758758544922, "global_step": 259194, "epoch": 2142} {"train_loss": -41.56648254394531, "global_step": 259195, "epoch": 2142} {"train_loss": -40.813018798828125, "global_step": 259196, "epoch": 2142} {"train_loss": -42.70429611206055, "global_step": 259197, "epoch": 2142} {"train_loss": -41.933197021484375, "global_step": 259198, "epoch": 2142} {"train_loss": -40.316871643066406, "global_step": 259199, "epoch": 2142} {"train_loss": -41.056549072265625, "global_step": 259200, "epoch": 2142} {"train_loss": -42.2125129699707, "global_step": 259201, "epoch": 2142} {"train_loss": -42.272029876708984, "global_step": 259202, "epoch": 2142} {"train_loss": -41.32611846923828, "global_step": 259203, "epoch": 2142} {"train_loss": -40.900020599365234, "global_step": 259204, "epoch": 2142} {"train_loss": -41.902095794677734, "global_step": 259205, "epoch": 2142} {"train_loss": -40.9993782043457, "global_step": 259206, "epoch": 2142} {"train_loss": -42.191139221191406, "global_step": 259207, "epoch": 2142} {"train_loss": -42.24885177612305, "global_step": 259208, "epoch": 2142} {"train_loss": -41.26188278198242, "global_step": 259209, "epoch": 2142} {"train_loss": -41.50020217895508, "global_step": 259210, "epoch": 2142} {"train_loss": -42.38346862792969, "global_step": 259211, "epoch": 2142} {"train_loss": -40.706424713134766, "global_step": 259212, "epoch": 2142} {"train_loss": -40.68827438354492, "global_step": 259213, "epoch": 2142} {"train_loss": -38.70318603515625, "global_step": 259214, "epoch": 2142} {"train_loss": -42.64703369140625, "global_step": 259215, "epoch": 2142} {"train_loss": -39.76662826538086, "global_step": 259216, "epoch": 2142} {"train_loss": -41.43963623046875, "global_step": 259217, "epoch": 2142} {"train_loss": -41.26894760131836, "global_step": 259218, "epoch": 2142} {"train_loss": -40.75126266479492, "global_step": 259219, "epoch": 2142} {"train_loss": -38.359466552734375, "global_step": 259220, "epoch": 2142} {"train_loss": -42.63985824584961, "global_step": 259221, "epoch": 2142} {"train_loss": -41.4248046875, "global_step": 259222, "epoch": 2142} {"train_loss": -42.37491989135742, "global_step": 259223, "epoch": 2142} {"train_loss": -41.672298431396484, "global_step": 259224, "epoch": 2142} {"train_loss": -42.29008483886719, "global_step": 259225, "epoch": 2142} {"train_loss": -41.45906448364258, "global_step": 259226, "epoch": 2142} {"train_loss": -41.16358184814453, "global_step": 259227, "epoch": 2142} {"train_loss": -42.705013275146484, "global_step": 259228, "epoch": 2142} {"train_loss": -41.73539733886719, "global_step": 259229, "epoch": 2142} {"train_loss": -37.987220764160156, "global_step": 259230, "epoch": 2142} {"train_loss": -42.5203857421875, "global_step": 259231, "epoch": 2142} {"train_loss": -42.193504333496094, "global_step": 259232, "epoch": 2142} {"train_loss": -42.35780715942383, "global_step": 259233, "epoch": 2142} {"train_loss": -41.81769943237305, "global_step": 259234, "epoch": 2142} {"train_loss": -29.834918975830078, "global_step": 259235, "epoch": 2142} {"train_loss": -41.159053802490234, "global_step": 259236, "epoch": 2142} {"train_loss": -41.76377487182617, "global_step": 259237, "epoch": 2142} {"train_loss": -40.15786361694336, "global_step": 259238, "epoch": 2142} {"train_loss": -39.225460052490234, "global_step": 259239, "epoch": 2142} {"train_loss": -33.014373779296875, "global_step": 259240, "epoch": 2142} {"train_loss": -39.9085578918457, "global_step": 259241, "epoch": 2142} {"train_loss": -39.626705169677734, "global_step": 259242, "epoch": 2142} {"train_loss": -25.404518127441406, "global_step": 259243, "epoch": 2142} {"train_loss": -35.84929275512695, "global_step": 259244, "epoch": 2142} {"train_loss": -37.85169219970703, "global_step": 259245, "epoch": 2142} {"train_loss": -29.252912521362305, "global_step": 259246, "epoch": 2142} {"train_loss": -32.41286087036133, "global_step": 259247, "epoch": 2142} {"train_loss": -40.14979553222656, "global_step": 259248, "epoch": 2142} {"train_loss": -38.16705322265625, "global_step": 259249, "epoch": 2142} {"train_loss": -34.4456787109375, "global_step": 259250, "epoch": 2142} {"train_loss": -30.775543212890625, "global_step": 259251, "epoch": 2142} {"train_loss": -38.863609313964844, "global_step": 259252, "epoch": 2142} {"train_loss": -32.25489044189453, "global_step": 259253, "epoch": 2142} {"train_loss": -40.27175521850586, "global_step": 259254, "epoch": 2142} {"train_loss": -38.0909309387207, "global_step": 259255, "epoch": 2142} {"train_loss": -28.577972412109375, "global_step": 259256, "epoch": 2142} {"train_loss": -35.3397331237793, "global_step": 259257, "epoch": 2142} {"train_loss": -36.831600189208984, "global_step": 259258, "epoch": 2142} {"train_loss": -38.30597686767578, "global_step": 259259, "epoch": 2142} {"train_loss": -39.88017654418945, "global_step": 259260, "epoch": 2142} {"train_loss": -38.58247756958008, "global_step": 259261, "epoch": 2142} {"train_loss": -34.595088958740234, "global_step": 259262, "epoch": 2142} {"train_loss": -34.580806732177734, "global_step": 259263, "epoch": 2142} {"train_loss": -34.01350021362305, "global_step": 259264, "epoch": 2142} {"train_loss": -37.8938102722168, "global_step": 259265, "epoch": 2142} {"train_loss": -39.54133987426758, "global_step": 259266, "epoch": 2142} {"train_loss": -35.98786544799805, "global_step": 259267, "epoch": 2142} {"train_loss": -39.19676208496094, "global_step": 259268, "epoch": 2142} {"train_loss": -38.75006103515625, "global_step": 259269, "epoch": 2142} {"train_loss": -38.66605758666992, "global_step": 259270, "epoch": 2142} {"train_loss": -39.82087326049805, "global_step": 259271, "epoch": 2142} {"train_loss": -36.52627182006836, "global_step": 259272, "epoch": 2142} {"train_loss": -37.275146484375, "global_step": 259273, "epoch": 2142} {"train_loss": -38.52198028564453, "global_step": 259274, "epoch": 2142} {"train_loss": -40.46171569824219, "global_step": 259275, "epoch": 2142} {"train_loss": -39.78118133544922, "global_step": 259276, "epoch": 2142} {"train_loss": -40.558406829833984, "global_step": 259277, "epoch": 2142} {"train_loss": -39.65605163574219, "global_step": 259278, "epoch": 2142} {"train_loss": -40.19949722290039, "global_step": 259279, "epoch": 2142} {"train_loss": -40.435089111328125, "global_step": 259280, "epoch": 2142} {"train_loss": -39.77239227294922, "global_step": 259281, "epoch": 2142} {"train_loss": -40.080413818359375, "global_step": 259282, "epoch": 2142} {"train_loss": -38.93571090698242, "global_step": 259283, "epoch": 2142} {"train_loss": -40.333641052246094, "global_step": 259284, "epoch": 2142} {"train_loss": -39.902565002441406, "global_step": 259285, "epoch": 2142} {"train_loss": -40.16876220703125, "global_step": 259286, "epoch": 2142} {"train_loss": -38.94032669067383, "global_step": 259287, "epoch": 2142} {"train_loss": -40.764339447021484, "global_step": 259288, "epoch": 2142} {"train_loss": -39.71839141845703, "global_step": 259289, "epoch": 2142} {"train_loss": -39.72700119018555, "global_step": 259290, "epoch": 2142} {"train_loss": -40.545875549316406, "global_step": 259291, "epoch": 2142} {"train_loss": -40.6263313293457, "global_step": 259292, "epoch": 2142} {"train_loss": -41.13374710083008, "global_step": 259293, "epoch": 2142} {"train_loss": -40.552120208740234, "global_step": 259294, "epoch": 2142} {"train_loss": -40.7478141784668, "global_step": 259295, "epoch": 2142} {"train_loss": -40.13024139404297, "global_step": 259296, "epoch": 2142} {"train_loss": -40.54689407348633, "global_step": 259297, "epoch": 2142} {"train_loss": -40.8657341003418, "global_step": 259298, "epoch": 2142} {"train_loss": -40.77022933959961, "global_step": 259299, "epoch": 2142} {"train_loss": -41.71331024169922, "global_step": 259300, "epoch": 2142} {"train_loss": -41.34540557861328, "global_step": 259301, "epoch": 2142} {"train_loss": -39.59161214592043, "global_step": 259302, "epoch": 2142, "val_loss": 2637763.0} {"train_loss": -40.809349060058594, "global_step": 259303, "epoch": 2143} {"train_loss": -41.510982513427734, "global_step": 259304, "epoch": 2143} {"train_loss": -41.74921798706055, "global_step": 259305, "epoch": 2143} {"train_loss": -41.40269470214844, "global_step": 259306, "epoch": 2143} {"train_loss": -41.85860061645508, "global_step": 259307, "epoch": 2143} {"train_loss": -41.2235221862793, "global_step": 259308, "epoch": 2143} {"train_loss": -40.906307220458984, "global_step": 259309, "epoch": 2143} {"train_loss": -41.66511917114258, "global_step": 259310, "epoch": 2143} {"train_loss": -41.36235427856445, "global_step": 259311, "epoch": 2143} {"train_loss": -41.71427536010742, "global_step": 259312, "epoch": 2143} {"train_loss": -41.30885696411133, "global_step": 259313, "epoch": 2143} {"train_loss": -41.23972702026367, "global_step": 259314, "epoch": 2143} {"train_loss": -41.862831115722656, "global_step": 259315, "epoch": 2143} {"train_loss": -42.280616760253906, "global_step": 259316, "epoch": 2143} {"train_loss": -42.285369873046875, "global_step": 259317, "epoch": 2143} {"train_loss": -42.385032653808594, "global_step": 259318, "epoch": 2143} {"train_loss": -42.2476806640625, "global_step": 259319, "epoch": 2143} {"train_loss": -42.34591293334961, "global_step": 259320, "epoch": 2143} {"train_loss": -40.89340591430664, "global_step": 259321, "epoch": 2143} {"train_loss": -41.92426681518555, "global_step": 259322, "epoch": 2143} {"train_loss": -42.35780715942383, "global_step": 259323, "epoch": 2143} {"train_loss": -42.034698486328125, "global_step": 259324, "epoch": 2143} {"train_loss": -42.032230377197266, "global_step": 259325, "epoch": 2143} {"train_loss": -42.00251388549805, "global_step": 259326, "epoch": 2143} {"train_loss": -42.227596282958984, "global_step": 259327, "epoch": 2143} {"train_loss": -42.10106658935547, "global_step": 259328, "epoch": 2143} {"train_loss": -42.26969528198242, "global_step": 259329, "epoch": 2143} {"train_loss": -42.282894134521484, "global_step": 259330, "epoch": 2143} {"train_loss": -42.40373611450195, "global_step": 259331, "epoch": 2143} {"train_loss": -40.883785247802734, "global_step": 259332, "epoch": 2143} {"train_loss": -41.899112701416016, "global_step": 259333, "epoch": 2143} {"train_loss": -41.939918518066406, "global_step": 259334, "epoch": 2143} {"train_loss": -41.47820281982422, "global_step": 259335, "epoch": 2143} {"train_loss": -41.5713996887207, "global_step": 259336, "epoch": 2143} {"train_loss": -42.19731903076172, "global_step": 259337, "epoch": 2143} {"train_loss": -42.67060089111328, "global_step": 259338, "epoch": 2143} {"train_loss": -42.5599479675293, "global_step": 259339, "epoch": 2143} {"train_loss": -42.612667083740234, "global_step": 259340, "epoch": 2143} {"train_loss": -42.33498001098633, "global_step": 259341, "epoch": 2143} {"train_loss": -40.97782516479492, "global_step": 259342, "epoch": 2143} {"train_loss": -42.440711975097656, "global_step": 259343, "epoch": 2143} {"train_loss": -42.7397346496582, "global_step": 259344, "epoch": 2143} {"train_loss": -42.86956787109375, "global_step": 259345, "epoch": 2143} {"train_loss": -42.733558654785156, "global_step": 259346, "epoch": 2143} {"train_loss": -42.61770248413086, "global_step": 259347, "epoch": 2143} {"train_loss": -42.85715103149414, "global_step": 259348, "epoch": 2143} {"train_loss": -42.73495101928711, "global_step": 259349, "epoch": 2143} {"train_loss": -42.99513626098633, "global_step": 259350, "epoch": 2143} {"train_loss": -42.79499816894531, "global_step": 259351, "epoch": 2143} {"train_loss": -42.95000076293945, "global_step": 259352, "epoch": 2143} {"train_loss": -42.92733383178711, "global_step": 259353, "epoch": 2143} {"train_loss": -42.75796890258789, "global_step": 259354, "epoch": 2143} {"train_loss": -42.92858123779297, "global_step": 259355, "epoch": 2143} {"train_loss": -42.59366989135742, "global_step": 259356, "epoch": 2143} {"train_loss": -41.35845947265625, "global_step": 259357, "epoch": 2143} {"train_loss": -41.7472038269043, "global_step": 259358, "epoch": 2143} {"train_loss": -42.63931655883789, "global_step": 259359, "epoch": 2143} {"train_loss": -42.24977493286133, "global_step": 259360, "epoch": 2143} {"train_loss": -42.819942474365234, "global_step": 259361, "epoch": 2143} {"train_loss": -42.44361114501953, "global_step": 259362, "epoch": 2143} {"train_loss": -42.59658432006836, "global_step": 259363, "epoch": 2143} {"train_loss": -42.62540817260742, "global_step": 259364, "epoch": 2143} {"train_loss": -42.2916259765625, "global_step": 259365, "epoch": 2143} {"train_loss": -42.4344596862793, "global_step": 259366, "epoch": 2143} {"train_loss": -42.933815002441406, "global_step": 259367, "epoch": 2143} {"train_loss": -42.58403396606445, "global_step": 259368, "epoch": 2143} {"train_loss": -43.070377349853516, "global_step": 259369, "epoch": 2143} {"train_loss": -42.078128814697266, "global_step": 259370, "epoch": 2143} {"train_loss": -42.8677978515625, "global_step": 259371, "epoch": 2143} {"train_loss": -42.04692459106445, "global_step": 259372, "epoch": 2143} {"train_loss": -42.425716400146484, "global_step": 259373, "epoch": 2143} {"train_loss": -42.5392951965332, "global_step": 259374, "epoch": 2143} {"train_loss": -42.231422424316406, "global_step": 259375, "epoch": 2143} {"train_loss": -42.441768646240234, "global_step": 259376, "epoch": 2143} {"train_loss": -41.9678955078125, "global_step": 259377, "epoch": 2143} {"train_loss": -42.917076110839844, "global_step": 259378, "epoch": 2143} {"train_loss": -42.010711669921875, "global_step": 259379, "epoch": 2143} {"train_loss": -41.02743148803711, "global_step": 259380, "epoch": 2143} {"train_loss": -39.638648986816406, "global_step": 259381, "epoch": 2143} {"train_loss": -42.093318939208984, "global_step": 259382, "epoch": 2143} {"train_loss": -41.677284240722656, "global_step": 259383, "epoch": 2143} {"train_loss": -42.34812545776367, "global_step": 259384, "epoch": 2143} {"train_loss": -41.03608322143555, "global_step": 259385, "epoch": 2143} {"train_loss": -42.535675048828125, "global_step": 259386, "epoch": 2143} {"train_loss": -42.10164260864258, "global_step": 259387, "epoch": 2143} {"train_loss": -42.1441535949707, "global_step": 259388, "epoch": 2143} {"train_loss": -41.553035736083984, "global_step": 259389, "epoch": 2143} {"train_loss": -42.77825927734375, "global_step": 259390, "epoch": 2143} {"train_loss": -42.87036895751953, "global_step": 259391, "epoch": 2143} {"train_loss": -42.71364974975586, "global_step": 259392, "epoch": 2143} {"train_loss": -42.80323791503906, "global_step": 259393, "epoch": 2143} {"train_loss": -42.81439208984375, "global_step": 259394, "epoch": 2143} {"train_loss": -42.739376068115234, "global_step": 259395, "epoch": 2143} {"train_loss": -42.52197265625, "global_step": 259396, "epoch": 2143} {"train_loss": -39.28450012207031, "global_step": 259397, "epoch": 2143} {"train_loss": -42.4300651550293, "global_step": 259398, "epoch": 2143} {"train_loss": -42.100669860839844, "global_step": 259399, "epoch": 2143} {"train_loss": -41.6053466796875, "global_step": 259400, "epoch": 2143} {"train_loss": -41.623016357421875, "global_step": 259401, "epoch": 2143} {"train_loss": -42.41874313354492, "global_step": 259402, "epoch": 2143} {"train_loss": -42.74961471557617, "global_step": 259403, "epoch": 2143} {"train_loss": -42.64431381225586, "global_step": 259404, "epoch": 2143} {"train_loss": -42.99740219116211, "global_step": 259405, "epoch": 2143} {"train_loss": -42.44804000854492, "global_step": 259406, "epoch": 2143} {"train_loss": -41.97705841064453, "global_step": 259407, "epoch": 2143} {"train_loss": -42.93408203125, "global_step": 259408, "epoch": 2143} {"train_loss": -42.65610885620117, "global_step": 259409, "epoch": 2143} {"train_loss": -42.36993408203125, "global_step": 259410, "epoch": 2143} {"train_loss": -42.495849609375, "global_step": 259411, "epoch": 2143} {"train_loss": -38.037235260009766, "global_step": 259412, "epoch": 2143} {"train_loss": -41.59765625, "global_step": 259413, "epoch": 2143} {"train_loss": -41.9260139465332, "global_step": 259414, "epoch": 2143} {"train_loss": -42.095436096191406, "global_step": 259415, "epoch": 2143} {"train_loss": -41.216156005859375, "global_step": 259416, "epoch": 2143} {"train_loss": -40.09681701660156, "global_step": 259417, "epoch": 2143} {"train_loss": -41.538841247558594, "global_step": 259418, "epoch": 2143} {"train_loss": -37.22251510620117, "global_step": 259419, "epoch": 2143} {"train_loss": -40.07869338989258, "global_step": 259420, "epoch": 2143} {"train_loss": -39.5721435546875, "global_step": 259421, "epoch": 2143} {"train_loss": -41.823299407958984, "global_step": 259422, "epoch": 2143} {"train_loss": -41.9814525005246, "global_step": 259423, "epoch": 2143, "val_loss": 2690989.5} {"train_loss": -38.125587463378906, "global_step": 259424, "epoch": 2144} {"train_loss": -40.86145782470703, "global_step": 259425, "epoch": 2144} {"train_loss": -37.4001579284668, "global_step": 259426, "epoch": 2144} {"train_loss": -41.70071029663086, "global_step": 259427, "epoch": 2144} {"train_loss": -38.90288543701172, "global_step": 259428, "epoch": 2144} {"train_loss": -41.48221206665039, "global_step": 259429, "epoch": 2144} {"train_loss": -40.63925552368164, "global_step": 259430, "epoch": 2144} {"train_loss": -40.46854782104492, "global_step": 259431, "epoch": 2144} {"train_loss": -41.40843200683594, "global_step": 259432, "epoch": 2144} {"train_loss": -40.333404541015625, "global_step": 259433, "epoch": 2144} {"train_loss": -42.08808135986328, "global_step": 259434, "epoch": 2144} {"train_loss": -41.4182243347168, "global_step": 259435, "epoch": 2144} {"train_loss": -41.40323257446289, "global_step": 259436, "epoch": 2144} {"train_loss": -41.219600677490234, "global_step": 259437, "epoch": 2144} {"train_loss": -41.3839225769043, "global_step": 259438, "epoch": 2144} {"train_loss": -41.42190170288086, "global_step": 259439, "epoch": 2144} {"train_loss": -41.224815368652344, "global_step": 259440, "epoch": 2144} {"train_loss": -42.06055450439453, "global_step": 259441, "epoch": 2144} {"train_loss": -41.784969329833984, "global_step": 259442, "epoch": 2144} {"train_loss": -42.25358200073242, "global_step": 259443, "epoch": 2144} {"train_loss": -42.40821838378906, "global_step": 259444, "epoch": 2144} {"train_loss": -42.217742919921875, "global_step": 259445, "epoch": 2144} {"train_loss": -42.56583023071289, "global_step": 259446, "epoch": 2144} {"train_loss": -42.416656494140625, "global_step": 259447, "epoch": 2144} {"train_loss": -42.3015251159668, "global_step": 259448, "epoch": 2144} {"train_loss": -42.48298263549805, "global_step": 259449, "epoch": 2144} {"train_loss": -40.58004379272461, "global_step": 259450, "epoch": 2144} {"train_loss": -42.08695602416992, "global_step": 259451, "epoch": 2144} {"train_loss": -42.950286865234375, "global_step": 259452, "epoch": 2144} {"train_loss": -41.48752212524414, "global_step": 259453, "epoch": 2144} {"train_loss": -42.743934631347656, "global_step": 259454, "epoch": 2144} {"train_loss": -42.885009765625, "global_step": 259455, "epoch": 2144} {"train_loss": -42.78813552856445, "global_step": 259456, "epoch": 2144} {"train_loss": -43.37528610229492, "global_step": 259457, "epoch": 2144} {"train_loss": -40.68092346191406, "global_step": 259458, "epoch": 2144} {"train_loss": -42.66433334350586, "global_step": 259459, "epoch": 2144} {"train_loss": -42.734249114990234, "global_step": 259460, "epoch": 2144} {"train_loss": -42.7143440246582, "global_step": 259461, "epoch": 2144} {"train_loss": -42.92823028564453, "global_step": 259462, "epoch": 2144} {"train_loss": -42.644981384277344, "global_step": 259463, "epoch": 2144} {"train_loss": -43.06510543823242, "global_step": 259464, "epoch": 2144} {"train_loss": -42.41997146606445, "global_step": 259465, "epoch": 2144} {"train_loss": -42.89546203613281, "global_step": 259466, "epoch": 2144} {"train_loss": -42.95392990112305, "global_step": 259467, "epoch": 2144} {"train_loss": -43.136474609375, "global_step": 259468, "epoch": 2144} {"train_loss": -42.93782424926758, "global_step": 259469, "epoch": 2144} {"train_loss": -43.04633712768555, "global_step": 259470, "epoch": 2144} {"train_loss": -43.18154525756836, "global_step": 259471, "epoch": 2144} {"train_loss": -43.17942428588867, "global_step": 259472, "epoch": 2144} {"train_loss": -43.04121017456055, "global_step": 259473, "epoch": 2144} {"train_loss": -42.9202880859375, "global_step": 259474, "epoch": 2144} {"train_loss": -43.272422790527344, "global_step": 259475, "epoch": 2144} {"train_loss": -43.32047653198242, "global_step": 259476, "epoch": 2144} {"train_loss": -43.018836975097656, "global_step": 259477, "epoch": 2144} {"train_loss": -43.285030364990234, "global_step": 259478, "epoch": 2144} {"train_loss": -43.3676872253418, "global_step": 259479, "epoch": 2144} {"train_loss": -43.28268051147461, "global_step": 259480, "epoch": 2144} {"train_loss": -43.14166259765625, "global_step": 259481, "epoch": 2144} {"train_loss": -43.51301574707031, "global_step": 259482, "epoch": 2144} {"train_loss": -43.20205307006836, "global_step": 259483, "epoch": 2144} {"train_loss": -43.06722640991211, "global_step": 259484, "epoch": 2144} {"train_loss": -43.05876541137695, "global_step": 259485, "epoch": 2144} {"train_loss": -43.714599609375, "global_step": 259486, "epoch": 2144} {"train_loss": -41.8348388671875, "global_step": 259487, "epoch": 2144} {"train_loss": -41.95766067504883, "global_step": 259488, "epoch": 2144} {"train_loss": -42.5050163269043, "global_step": 259489, "epoch": 2144} {"train_loss": -43.533653259277344, "global_step": 259490, "epoch": 2144} {"train_loss": -43.135597229003906, "global_step": 259491, "epoch": 2144} {"train_loss": -42.21367263793945, "global_step": 259492, "epoch": 2144} {"train_loss": -41.62563705444336, "global_step": 259493, "epoch": 2144} {"train_loss": -42.54340744018555, "global_step": 259494, "epoch": 2144} {"train_loss": -43.338565826416016, "global_step": 259495, "epoch": 2144} {"train_loss": -42.36821365356445, "global_step": 259496, "epoch": 2144} {"train_loss": -42.4295539855957, "global_step": 259497, "epoch": 2144} {"train_loss": -42.97285842895508, "global_step": 259498, "epoch": 2144} {"train_loss": -41.28694152832031, "global_step": 259499, "epoch": 2144} {"train_loss": -43.4594612121582, "global_step": 259500, "epoch": 2144} {"train_loss": -43.33720779418945, "global_step": 259501, "epoch": 2144} {"train_loss": -41.9426155090332, "global_step": 259502, "epoch": 2144} {"train_loss": -38.2911376953125, "global_step": 259503, "epoch": 2144} {"train_loss": -37.946266174316406, "global_step": 259504, "epoch": 2144} {"train_loss": -40.887264251708984, "global_step": 259505, "epoch": 2144} {"train_loss": -40.94490051269531, "global_step": 259506, "epoch": 2144} {"train_loss": -37.10111618041992, "global_step": 259507, "epoch": 2144} {"train_loss": -35.693180084228516, "global_step": 259508, "epoch": 2144} {"train_loss": -33.12540054321289, "global_step": 259509, "epoch": 2144} {"train_loss": -37.645263671875, "global_step": 259510, "epoch": 2144} {"train_loss": -37.7288932800293, "global_step": 259511, "epoch": 2144} {"train_loss": -37.5788459777832, "global_step": 259512, "epoch": 2144} {"train_loss": -37.60459518432617, "global_step": 259513, "epoch": 2144} {"train_loss": -35.531349182128906, "global_step": 259514, "epoch": 2144} {"train_loss": -35.62220001220703, "global_step": 259515, "epoch": 2144} {"train_loss": -37.295711517333984, "global_step": 259516, "epoch": 2144} {"train_loss": -38.826255798339844, "global_step": 259517, "epoch": 2144} {"train_loss": -32.28872299194336, "global_step": 259518, "epoch": 2144} {"train_loss": -33.618900299072266, "global_step": 259519, "epoch": 2144} {"train_loss": -36.63993453979492, "global_step": 259520, "epoch": 2144} {"train_loss": -35.001163482666016, "global_step": 259521, "epoch": 2144} {"train_loss": -38.58921432495117, "global_step": 259522, "epoch": 2144} {"train_loss": -37.495018005371094, "global_step": 259523, "epoch": 2144} {"train_loss": -36.87618637084961, "global_step": 259524, "epoch": 2144} {"train_loss": -39.51893997192383, "global_step": 259525, "epoch": 2144} {"train_loss": -37.61245346069336, "global_step": 259526, "epoch": 2144} {"train_loss": -38.08888244628906, "global_step": 259527, "epoch": 2144} {"train_loss": -36.68699264526367, "global_step": 259528, "epoch": 2144} {"train_loss": -37.84027099609375, "global_step": 259529, "epoch": 2144} {"train_loss": -39.51275634765625, "global_step": 259530, "epoch": 2144} {"train_loss": -34.13237762451172, "global_step": 259531, "epoch": 2144} {"train_loss": -39.10680389404297, "global_step": 259532, "epoch": 2144} {"train_loss": -37.72719192504883, "global_step": 259533, "epoch": 2144} {"train_loss": -32.88166427612305, "global_step": 259534, "epoch": 2144} {"train_loss": -37.24372482299805, "global_step": 259535, "epoch": 2144} {"train_loss": -37.3940544128418, "global_step": 259536, "epoch": 2144} {"train_loss": -37.16911697387695, "global_step": 259537, "epoch": 2144} {"train_loss": -40.3913688659668, "global_step": 259538, "epoch": 2144} {"train_loss": -38.05440902709961, "global_step": 259539, "epoch": 2144} {"train_loss": -40.02344512939453, "global_step": 259540, "epoch": 2144} {"train_loss": -37.87841796875, "global_step": 259541, "epoch": 2144} {"train_loss": -40.083370208740234, "global_step": 259542, "epoch": 2144} {"train_loss": -40.0798454284668, "global_step": 259543, "epoch": 2144} {"train_loss": -40.59183051369407, "global_step": 259544, "epoch": 2144, "val_loss": 2602142.0} {"train_loss": -40.179134368896484, "global_step": 259545, "epoch": 2145} {"train_loss": -39.89107894897461, "global_step": 259546, "epoch": 2145} {"train_loss": -40.46670150756836, "global_step": 259547, "epoch": 2145} {"train_loss": -40.562835693359375, "global_step": 259548, "epoch": 2145} {"train_loss": -40.58907699584961, "global_step": 259549, "epoch": 2145} {"train_loss": -40.16189193725586, "global_step": 259550, "epoch": 2145} {"train_loss": -40.90760040283203, "global_step": 259551, "epoch": 2145} {"train_loss": -40.95428466796875, "global_step": 259552, "epoch": 2145} {"train_loss": -40.75350570678711, "global_step": 259553, "epoch": 2145} {"train_loss": -40.2548942565918, "global_step": 259554, "epoch": 2145} {"train_loss": -41.4922981262207, "global_step": 259555, "epoch": 2145} {"train_loss": -40.897682189941406, "global_step": 259556, "epoch": 2145} {"train_loss": -40.951324462890625, "global_step": 259557, "epoch": 2145} {"train_loss": -40.448055267333984, "global_step": 259558, "epoch": 2145} {"train_loss": -40.646697998046875, "global_step": 259559, "epoch": 2145} {"train_loss": -40.86421203613281, "global_step": 259560, "epoch": 2145} {"train_loss": -41.10976791381836, "global_step": 259561, "epoch": 2145} {"train_loss": -42.01128005981445, "global_step": 259562, "epoch": 2145} {"train_loss": -41.53786087036133, "global_step": 259563, "epoch": 2145} {"train_loss": -41.524024963378906, "global_step": 259564, "epoch": 2145} {"train_loss": -40.8757209777832, "global_step": 259565, "epoch": 2145} {"train_loss": -40.386619567871094, "global_step": 259566, "epoch": 2145} {"train_loss": -41.08940505981445, "global_step": 259567, "epoch": 2145} {"train_loss": -41.694557189941406, "global_step": 259568, "epoch": 2145} {"train_loss": -41.6506462097168, "global_step": 259569, "epoch": 2145} {"train_loss": -41.39238739013672, "global_step": 259570, "epoch": 2145} {"train_loss": -41.79345703125, "global_step": 259571, "epoch": 2145} {"train_loss": -41.475624084472656, "global_step": 259572, "epoch": 2145} {"train_loss": -41.79023742675781, "global_step": 259573, "epoch": 2145} {"train_loss": -41.59183883666992, "global_step": 259574, "epoch": 2145} {"train_loss": -41.5977783203125, "global_step": 259575, "epoch": 2145} {"train_loss": -41.98210906982422, "global_step": 259576, "epoch": 2145} {"train_loss": -41.83921432495117, "global_step": 259577, "epoch": 2145} {"train_loss": -42.317474365234375, "global_step": 259578, "epoch": 2145} {"train_loss": -42.368438720703125, "global_step": 259579, "epoch": 2145} {"train_loss": -42.302581787109375, "global_step": 259580, "epoch": 2145} {"train_loss": -42.19324493408203, "global_step": 259581, "epoch": 2145} {"train_loss": -41.53432083129883, "global_step": 259582, "epoch": 2145} {"train_loss": -41.89620590209961, "global_step": 259583, "epoch": 2145} {"train_loss": -42.27145767211914, "global_step": 259584, "epoch": 2145} {"train_loss": -42.1102409362793, "global_step": 259585, "epoch": 2145} {"train_loss": -42.35017013549805, "global_step": 259586, "epoch": 2145} {"train_loss": -40.95820236206055, "global_step": 259587, "epoch": 2145} {"train_loss": -42.25922775268555, "global_step": 259588, "epoch": 2145} {"train_loss": -42.0092658996582, "global_step": 259589, "epoch": 2145} {"train_loss": -42.32933044433594, "global_step": 259590, "epoch": 2145} {"train_loss": -41.7620849609375, "global_step": 259591, "epoch": 2145} {"train_loss": -42.462860107421875, "global_step": 259592, "epoch": 2145} {"train_loss": -42.02281188964844, "global_step": 259593, "epoch": 2145} {"train_loss": -42.169429779052734, "global_step": 259594, "epoch": 2145} {"train_loss": -42.044288635253906, "global_step": 259595, "epoch": 2145} {"train_loss": -42.8486328125, "global_step": 259596, "epoch": 2145} {"train_loss": -42.64826583862305, "global_step": 259597, "epoch": 2145} {"train_loss": -42.40018844604492, "global_step": 259598, "epoch": 2145} {"train_loss": -42.69784164428711, "global_step": 259599, "epoch": 2145} {"train_loss": -42.43512725830078, "global_step": 259600, "epoch": 2145} {"train_loss": -42.705074310302734, "global_step": 259601, "epoch": 2145} {"train_loss": -42.46664047241211, "global_step": 259602, "epoch": 2145} {"train_loss": -42.505760192871094, "global_step": 259603, "epoch": 2145} {"train_loss": -42.74966049194336, "global_step": 259604, "epoch": 2145} {"train_loss": -42.541866302490234, "global_step": 259605, "epoch": 2145} {"train_loss": -42.59397888183594, "global_step": 259606, "epoch": 2145} {"train_loss": -43.01664352416992, "global_step": 259607, "epoch": 2145} {"train_loss": -42.431034088134766, "global_step": 259608, "epoch": 2145} {"train_loss": -42.854217529296875, "global_step": 259609, "epoch": 2145} {"train_loss": -43.0431022644043, "global_step": 259610, "epoch": 2145} {"train_loss": -42.43467330932617, "global_step": 259611, "epoch": 2145} {"train_loss": -42.948974609375, "global_step": 259612, "epoch": 2145} {"train_loss": -42.53620529174805, "global_step": 259613, "epoch": 2145} {"train_loss": -42.55025863647461, "global_step": 259614, "epoch": 2145} {"train_loss": -42.684547424316406, "global_step": 259615, "epoch": 2145} {"train_loss": -42.537879943847656, "global_step": 259616, "epoch": 2145} {"train_loss": -40.72046661376953, "global_step": 259617, "epoch": 2145} {"train_loss": -43.33833694458008, "global_step": 259618, "epoch": 2145} {"train_loss": -43.10167694091797, "global_step": 259619, "epoch": 2145} {"train_loss": -43.0560417175293, "global_step": 259620, "epoch": 2145} {"train_loss": -43.154144287109375, "global_step": 259621, "epoch": 2145} {"train_loss": -42.84312057495117, "global_step": 259622, "epoch": 2145} {"train_loss": -41.79667282104492, "global_step": 259623, "epoch": 2145} {"train_loss": -41.88972854614258, "global_step": 259624, "epoch": 2145} {"train_loss": -42.907596588134766, "global_step": 259625, "epoch": 2145} {"train_loss": -42.348567962646484, "global_step": 259626, "epoch": 2145} {"train_loss": -42.779693603515625, "global_step": 259627, "epoch": 2145} {"train_loss": -43.12616729736328, "global_step": 259628, "epoch": 2145} {"train_loss": -42.84442138671875, "global_step": 259629, "epoch": 2145} {"train_loss": -43.1588134765625, "global_step": 259630, "epoch": 2145} {"train_loss": -42.466915130615234, "global_step": 259631, "epoch": 2145} {"train_loss": -42.859500885009766, "global_step": 259632, "epoch": 2145} {"train_loss": -43.04120635986328, "global_step": 259633, "epoch": 2145} {"train_loss": -43.1015625, "global_step": 259634, "epoch": 2145} {"train_loss": -41.983463287353516, "global_step": 259635, "epoch": 2145} {"train_loss": -42.761558532714844, "global_step": 259636, "epoch": 2145} {"train_loss": -42.82881546020508, "global_step": 259637, "epoch": 2145} {"train_loss": -42.79632568359375, "global_step": 259638, "epoch": 2145} {"train_loss": -42.86405563354492, "global_step": 259639, "epoch": 2145} {"train_loss": -43.160579681396484, "global_step": 259640, "epoch": 2145} {"train_loss": -42.84243392944336, "global_step": 259641, "epoch": 2145} {"train_loss": -42.47852325439453, "global_step": 259642, "epoch": 2145} {"train_loss": -42.56785202026367, "global_step": 259643, "epoch": 2145} {"train_loss": -42.15645217895508, "global_step": 259644, "epoch": 2145} {"train_loss": -42.18020248413086, "global_step": 259645, "epoch": 2145} {"train_loss": -42.10353469848633, "global_step": 259646, "epoch": 2145} {"train_loss": -42.1539192199707, "global_step": 259647, "epoch": 2145} {"train_loss": -40.097042083740234, "global_step": 259648, "epoch": 2145} {"train_loss": -36.8907585144043, "global_step": 259649, "epoch": 2145} {"train_loss": -34.775054931640625, "global_step": 259650, "epoch": 2145} {"train_loss": -34.197479248046875, "global_step": 259651, "epoch": 2145} {"train_loss": -37.58295440673828, "global_step": 259652, "epoch": 2145} {"train_loss": -39.90461349487305, "global_step": 259653, "epoch": 2145} {"train_loss": -39.28116226196289, "global_step": 259654, "epoch": 2145} {"train_loss": -39.4005126953125, "global_step": 259655, "epoch": 2145} {"train_loss": -40.79625701904297, "global_step": 259656, "epoch": 2145} {"train_loss": -40.51607131958008, "global_step": 259657, "epoch": 2145} {"train_loss": -41.58866500854492, "global_step": 259658, "epoch": 2145} {"train_loss": -41.82656478881836, "global_step": 259659, "epoch": 2145} {"train_loss": -41.871700286865234, "global_step": 259660, "epoch": 2145} {"train_loss": -41.54619216918945, "global_step": 259661, "epoch": 2145} {"train_loss": -40.597904205322266, "global_step": 259662, "epoch": 2145} {"train_loss": -41.699676513671875, "global_step": 259663, "epoch": 2145} {"train_loss": -40.9167366027832, "global_step": 259664, "epoch": 2145} {"train_loss": -41.687099582892806, "global_step": 259665, "epoch": 2145, "val_loss": 2748009.75} {"train_loss": -41.510467529296875, "global_step": 259666, "epoch": 2146} {"train_loss": -41.65742111206055, "global_step": 259667, "epoch": 2146} {"train_loss": -41.6986198425293, "global_step": 259668, "epoch": 2146} {"train_loss": -41.845069885253906, "global_step": 259669, "epoch": 2146} {"train_loss": -41.45357894897461, "global_step": 259670, "epoch": 2146} {"train_loss": -42.46633529663086, "global_step": 259671, "epoch": 2146} {"train_loss": -41.52650833129883, "global_step": 259672, "epoch": 2146} {"train_loss": -42.04528045654297, "global_step": 259673, "epoch": 2146} {"train_loss": -41.62409973144531, "global_step": 259674, "epoch": 2146} {"train_loss": -41.39088821411133, "global_step": 259675, "epoch": 2146} {"train_loss": -41.43861389160156, "global_step": 259676, "epoch": 2146} {"train_loss": -40.48588943481445, "global_step": 259677, "epoch": 2146} {"train_loss": -40.10641860961914, "global_step": 259678, "epoch": 2146} {"train_loss": -39.42947006225586, "global_step": 259679, "epoch": 2146} {"train_loss": -41.39026641845703, "global_step": 259680, "epoch": 2146} {"train_loss": -39.26361083984375, "global_step": 259681, "epoch": 2146} {"train_loss": -40.97538375854492, "global_step": 259682, "epoch": 2146} {"train_loss": -39.79403305053711, "global_step": 259683, "epoch": 2146} {"train_loss": -40.41469955444336, "global_step": 259684, "epoch": 2146} {"train_loss": -40.446083068847656, "global_step": 259685, "epoch": 2146} {"train_loss": -40.8233757019043, "global_step": 259686, "epoch": 2146} {"train_loss": -40.8543815612793, "global_step": 259687, "epoch": 2146} {"train_loss": -40.86251449584961, "global_step": 259688, "epoch": 2146} {"train_loss": -41.65616989135742, "global_step": 259689, "epoch": 2146} {"train_loss": -41.02330017089844, "global_step": 259690, "epoch": 2146} {"train_loss": -41.27710723876953, "global_step": 259691, "epoch": 2146} {"train_loss": -42.0228271484375, "global_step": 259692, "epoch": 2146} {"train_loss": -41.041831970214844, "global_step": 259693, "epoch": 2146} {"train_loss": -41.795982360839844, "global_step": 259694, "epoch": 2146} {"train_loss": -42.06582260131836, "global_step": 259695, "epoch": 2146} {"train_loss": -41.674049377441406, "global_step": 259696, "epoch": 2146} {"train_loss": -41.12571334838867, "global_step": 259697, "epoch": 2146} {"train_loss": -41.93619918823242, "global_step": 259698, "epoch": 2146} {"train_loss": -41.875083923339844, "global_step": 259699, "epoch": 2146} {"train_loss": -41.78800582885742, "global_step": 259700, "epoch": 2146} {"train_loss": -42.466468811035156, "global_step": 259701, "epoch": 2146} {"train_loss": -42.090267181396484, "global_step": 259702, "epoch": 2146} {"train_loss": -42.020748138427734, "global_step": 259703, "epoch": 2146} {"train_loss": -42.29903793334961, "global_step": 259704, "epoch": 2146} {"train_loss": -42.2946891784668, "global_step": 259705, "epoch": 2146} {"train_loss": -42.2580680847168, "global_step": 259706, "epoch": 2146} {"train_loss": -42.08058547973633, "global_step": 259707, "epoch": 2146} {"train_loss": -42.136749267578125, "global_step": 259708, "epoch": 2146} {"train_loss": -42.211483001708984, "global_step": 259709, "epoch": 2146} {"train_loss": -42.404541015625, "global_step": 259710, "epoch": 2146} {"train_loss": -41.70316696166992, "global_step": 259711, "epoch": 2146} {"train_loss": -42.25495910644531, "global_step": 259712, "epoch": 2146} {"train_loss": -41.329627990722656, "global_step": 259713, "epoch": 2146} {"train_loss": -42.228023529052734, "global_step": 259714, "epoch": 2146} {"train_loss": -41.05580520629883, "global_step": 259715, "epoch": 2146} {"train_loss": -42.85523223876953, "global_step": 259716, "epoch": 2146} {"train_loss": -41.86530303955078, "global_step": 259717, "epoch": 2146} {"train_loss": -42.76630783081055, "global_step": 259718, "epoch": 2146} {"train_loss": -41.7744255065918, "global_step": 259719, "epoch": 2146} {"train_loss": -42.22251892089844, "global_step": 259720, "epoch": 2146} {"train_loss": -42.9073600769043, "global_step": 259721, "epoch": 2146} {"train_loss": -42.0411491394043, "global_step": 259722, "epoch": 2146} {"train_loss": -43.13729476928711, "global_step": 259723, "epoch": 2146} {"train_loss": -41.89500045776367, "global_step": 259724, "epoch": 2146} {"train_loss": -41.89051818847656, "global_step": 259725, "epoch": 2146} {"train_loss": -42.48649978637695, "global_step": 259726, "epoch": 2146} {"train_loss": -42.95273971557617, "global_step": 259727, "epoch": 2146} {"train_loss": -42.46051788330078, "global_step": 259728, "epoch": 2146} {"train_loss": -42.162452697753906, "global_step": 259729, "epoch": 2146} {"train_loss": -43.13226318359375, "global_step": 259730, "epoch": 2146} {"train_loss": -42.08921432495117, "global_step": 259731, "epoch": 2146} {"train_loss": -42.8089714050293, "global_step": 259732, "epoch": 2146} {"train_loss": -42.65748977661133, "global_step": 259733, "epoch": 2146} {"train_loss": -42.83211135864258, "global_step": 259734, "epoch": 2146} {"train_loss": -43.08366012573242, "global_step": 259735, "epoch": 2146} {"train_loss": -42.8505744934082, "global_step": 259736, "epoch": 2146} {"train_loss": -43.48261260986328, "global_step": 259737, "epoch": 2146} {"train_loss": -43.067440032958984, "global_step": 259738, "epoch": 2146} {"train_loss": -42.499053955078125, "global_step": 259739, "epoch": 2146} {"train_loss": -42.560585021972656, "global_step": 259740, "epoch": 2146} {"train_loss": -43.076141357421875, "global_step": 259741, "epoch": 2146} {"train_loss": -43.553890228271484, "global_step": 259742, "epoch": 2146} {"train_loss": -42.285972595214844, "global_step": 259743, "epoch": 2146} {"train_loss": -42.42502975463867, "global_step": 259744, "epoch": 2146} {"train_loss": -43.256919860839844, "global_step": 259745, "epoch": 2146} {"train_loss": -42.86350631713867, "global_step": 259746, "epoch": 2146} {"train_loss": -43.48834228515625, "global_step": 259747, "epoch": 2146} {"train_loss": -43.09079360961914, "global_step": 259748, "epoch": 2146} {"train_loss": -42.866024017333984, "global_step": 259749, "epoch": 2146} {"train_loss": -43.0014533996582, "global_step": 259750, "epoch": 2146} {"train_loss": -42.441898345947266, "global_step": 259751, "epoch": 2146} {"train_loss": -42.29176330566406, "global_step": 259752, "epoch": 2146} {"train_loss": -42.7851448059082, "global_step": 259753, "epoch": 2146} {"train_loss": -43.1068229675293, "global_step": 259754, "epoch": 2146} {"train_loss": -43.33353042602539, "global_step": 259755, "epoch": 2146} {"train_loss": -43.20280075073242, "global_step": 259756, "epoch": 2146} {"train_loss": -43.25440216064453, "global_step": 259757, "epoch": 2146} {"train_loss": -43.1647834777832, "global_step": 259758, "epoch": 2146} {"train_loss": -42.845088958740234, "global_step": 259759, "epoch": 2146} {"train_loss": -42.975189208984375, "global_step": 259760, "epoch": 2146} {"train_loss": -42.58589553833008, "global_step": 259761, "epoch": 2146} {"train_loss": -43.47761535644531, "global_step": 259762, "epoch": 2146} {"train_loss": -43.20903396606445, "global_step": 259763, "epoch": 2146} {"train_loss": -43.0009651184082, "global_step": 259764, "epoch": 2146} {"train_loss": -42.64650344848633, "global_step": 259765, "epoch": 2146} {"train_loss": -40.64078140258789, "global_step": 259766, "epoch": 2146} {"train_loss": -39.24466323852539, "global_step": 259767, "epoch": 2146} {"train_loss": -41.27135467529297, "global_step": 259768, "epoch": 2146} {"train_loss": -42.39717483520508, "global_step": 259769, "epoch": 2146} {"train_loss": -42.82304763793945, "global_step": 259770, "epoch": 2146} {"train_loss": -43.255062103271484, "global_step": 259771, "epoch": 2146} {"train_loss": -42.64423370361328, "global_step": 259772, "epoch": 2146} {"train_loss": -42.24357223510742, "global_step": 259773, "epoch": 2146} {"train_loss": -41.93981170654297, "global_step": 259774, "epoch": 2146} {"train_loss": -42.817115783691406, "global_step": 259775, "epoch": 2146} {"train_loss": -42.48619842529297, "global_step": 259776, "epoch": 2146} {"train_loss": -40.155582427978516, "global_step": 259777, "epoch": 2146} {"train_loss": -40.48337936401367, "global_step": 259778, "epoch": 2146} {"train_loss": -40.32217025756836, "global_step": 259779, "epoch": 2146} {"train_loss": -42.07880401611328, "global_step": 259780, "epoch": 2146} {"train_loss": -42.606754302978516, "global_step": 259781, "epoch": 2146} {"train_loss": -41.092079162597656, "global_step": 259782, "epoch": 2146} {"train_loss": -40.411705017089844, "global_step": 259783, "epoch": 2146} {"train_loss": -40.64702224731445, "global_step": 259784, "epoch": 2146} {"train_loss": -41.74359893798828, "global_step": 259785, "epoch": 2146} {"train_loss": -42.036542057005825, "global_step": 259786, "epoch": 2146, "val_loss": 2611224.75} {"train_loss": -41.56650161743164, "global_step": 259787, "epoch": 2147} {"train_loss": -42.134796142578125, "global_step": 259788, "epoch": 2147} {"train_loss": -43.02096176147461, "global_step": 259789, "epoch": 2147} {"train_loss": -42.06900405883789, "global_step": 259790, "epoch": 2147} {"train_loss": -40.81502151489258, "global_step": 259791, "epoch": 2147} {"train_loss": -42.11043167114258, "global_step": 259792, "epoch": 2147} {"train_loss": -42.72101593017578, "global_step": 259793, "epoch": 2147} {"train_loss": -41.699066162109375, "global_step": 259794, "epoch": 2147} {"train_loss": -42.3626823425293, "global_step": 259795, "epoch": 2147} {"train_loss": -42.516761779785156, "global_step": 259796, "epoch": 2147} {"train_loss": -41.06093215942383, "global_step": 259797, "epoch": 2147} {"train_loss": -41.221675872802734, "global_step": 259798, "epoch": 2147} {"train_loss": -41.1759033203125, "global_step": 259799, "epoch": 2147} {"train_loss": -42.22163009643555, "global_step": 259800, "epoch": 2147} {"train_loss": -42.064029693603516, "global_step": 259801, "epoch": 2147} {"train_loss": -41.19453048706055, "global_step": 259802, "epoch": 2147} {"train_loss": -39.8614501953125, "global_step": 259803, "epoch": 2147} {"train_loss": -41.826690673828125, "global_step": 259804, "epoch": 2147} {"train_loss": -41.2444953918457, "global_step": 259805, "epoch": 2147} {"train_loss": -39.82645797729492, "global_step": 259806, "epoch": 2147} {"train_loss": -37.752254486083984, "global_step": 259807, "epoch": 2147} {"train_loss": -38.54670333862305, "global_step": 259808, "epoch": 2147} {"train_loss": -41.506649017333984, "global_step": 259809, "epoch": 2147} {"train_loss": -35.518829345703125, "global_step": 259810, "epoch": 2147} {"train_loss": -31.828134536743164, "global_step": 259811, "epoch": 2147} {"train_loss": -37.5703239440918, "global_step": 259812, "epoch": 2147} {"train_loss": -39.622127532958984, "global_step": 259813, "epoch": 2147} {"train_loss": -37.282623291015625, "global_step": 259814, "epoch": 2147} {"train_loss": -37.924495697021484, "global_step": 259815, "epoch": 2147} {"train_loss": -40.929931640625, "global_step": 259816, "epoch": 2147} {"train_loss": -37.69362258911133, "global_step": 259817, "epoch": 2147} {"train_loss": -41.271610260009766, "global_step": 259818, "epoch": 2147} {"train_loss": -40.183067321777344, "global_step": 259819, "epoch": 2147} {"train_loss": -40.14787292480469, "global_step": 259820, "epoch": 2147} {"train_loss": -41.0460205078125, "global_step": 259821, "epoch": 2147} {"train_loss": -39.751461029052734, "global_step": 259822, "epoch": 2147} {"train_loss": -40.70463180541992, "global_step": 259823, "epoch": 2147} {"train_loss": -39.99449920654297, "global_step": 259824, "epoch": 2147} {"train_loss": -41.99849319458008, "global_step": 259825, "epoch": 2147} {"train_loss": -40.542964935302734, "global_step": 259826, "epoch": 2147} {"train_loss": -41.89775466918945, "global_step": 259827, "epoch": 2147} {"train_loss": -40.98165512084961, "global_step": 259828, "epoch": 2147} {"train_loss": -41.71840286254883, "global_step": 259829, "epoch": 2147} {"train_loss": -41.7355842590332, "global_step": 259830, "epoch": 2147} {"train_loss": -41.77061080932617, "global_step": 259831, "epoch": 2147} {"train_loss": -42.1400032043457, "global_step": 259832, "epoch": 2147} {"train_loss": -41.65668869018555, "global_step": 259833, "epoch": 2147} {"train_loss": -42.27582931518555, "global_step": 259834, "epoch": 2147} {"train_loss": -42.14830017089844, "global_step": 259835, "epoch": 2147} {"train_loss": -42.13066864013672, "global_step": 259836, "epoch": 2147} {"train_loss": -42.15708541870117, "global_step": 259837, "epoch": 2147} {"train_loss": -42.19466781616211, "global_step": 259838, "epoch": 2147} {"train_loss": -42.196983337402344, "global_step": 259839, "epoch": 2147} {"train_loss": -42.398468017578125, "global_step": 259840, "epoch": 2147} {"train_loss": -42.2910041809082, "global_step": 259841, "epoch": 2147} {"train_loss": -42.4080924987793, "global_step": 259842, "epoch": 2147} {"train_loss": -42.43790817260742, "global_step": 259843, "epoch": 2147} {"train_loss": -42.222084045410156, "global_step": 259844, "epoch": 2147} {"train_loss": -42.783016204833984, "global_step": 259845, "epoch": 2147} {"train_loss": -42.57126998901367, "global_step": 259846, "epoch": 2147} {"train_loss": -42.611392974853516, "global_step": 259847, "epoch": 2147} {"train_loss": -42.1346549987793, "global_step": 259848, "epoch": 2147} {"train_loss": -42.958072662353516, "global_step": 259849, "epoch": 2147} {"train_loss": -42.99189376831055, "global_step": 259850, "epoch": 2147} {"train_loss": -42.992916107177734, "global_step": 259851, "epoch": 2147} {"train_loss": -42.88236618041992, "global_step": 259852, "epoch": 2147} {"train_loss": -42.69712448120117, "global_step": 259853, "epoch": 2147} {"train_loss": -42.73638153076172, "global_step": 259854, "epoch": 2147} {"train_loss": -36.5950927734375, "global_step": 259855, "epoch": 2147} {"train_loss": -42.804744720458984, "global_step": 259856, "epoch": 2147} {"train_loss": -42.99384307861328, "global_step": 259857, "epoch": 2147} {"train_loss": -42.40272521972656, "global_step": 259858, "epoch": 2147} {"train_loss": -42.76295852661133, "global_step": 259859, "epoch": 2147} {"train_loss": -41.33345413208008, "global_step": 259860, "epoch": 2147} {"train_loss": -43.233680725097656, "global_step": 259861, "epoch": 2147} {"train_loss": -42.330745697021484, "global_step": 259862, "epoch": 2147} {"train_loss": -42.88794708251953, "global_step": 259863, "epoch": 2147} {"train_loss": -42.6994514465332, "global_step": 259864, "epoch": 2147} {"train_loss": -41.9134407043457, "global_step": 259865, "epoch": 2147} {"train_loss": -42.57892608642578, "global_step": 259866, "epoch": 2147} {"train_loss": -42.9484748840332, "global_step": 259867, "epoch": 2147} {"train_loss": -40.70359802246094, "global_step": 259868, "epoch": 2147} {"train_loss": -43.00178146362305, "global_step": 259869, "epoch": 2147} {"train_loss": -43.02324295043945, "global_step": 259870, "epoch": 2147} {"train_loss": -43.352108001708984, "global_step": 259871, "epoch": 2147} {"train_loss": -41.061744689941406, "global_step": 259872, "epoch": 2147} {"train_loss": -43.06538391113281, "global_step": 259873, "epoch": 2147} {"train_loss": -42.052276611328125, "global_step": 259874, "epoch": 2147} {"train_loss": -43.35430908203125, "global_step": 259875, "epoch": 2147} {"train_loss": -43.2223014831543, "global_step": 259876, "epoch": 2147} {"train_loss": -42.481727600097656, "global_step": 259877, "epoch": 2147} {"train_loss": -42.938865661621094, "global_step": 259878, "epoch": 2147} {"train_loss": -42.156429290771484, "global_step": 259879, "epoch": 2147} {"train_loss": -43.251670837402344, "global_step": 259880, "epoch": 2147} {"train_loss": -43.22038650512695, "global_step": 259881, "epoch": 2147} {"train_loss": -42.7388916015625, "global_step": 259882, "epoch": 2147} {"train_loss": -43.1545524597168, "global_step": 259883, "epoch": 2147} {"train_loss": -43.64351272583008, "global_step": 259884, "epoch": 2147} {"train_loss": -42.351661682128906, "global_step": 259885, "epoch": 2147} {"train_loss": -43.30233383178711, "global_step": 259886, "epoch": 2147} {"train_loss": -43.337074279785156, "global_step": 259887, "epoch": 2147} {"train_loss": -43.192359924316406, "global_step": 259888, "epoch": 2147} {"train_loss": -43.50330352783203, "global_step": 259889, "epoch": 2147} {"train_loss": -43.20290756225586, "global_step": 259890, "epoch": 2147} {"train_loss": -43.54462814331055, "global_step": 259891, "epoch": 2147} {"train_loss": -43.2959098815918, "global_step": 259892, "epoch": 2147} {"train_loss": -43.63112258911133, "global_step": 259893, "epoch": 2147} {"train_loss": -43.067256927490234, "global_step": 259894, "epoch": 2147} {"train_loss": -42.8807373046875, "global_step": 259895, "epoch": 2147} {"train_loss": -43.50061798095703, "global_step": 259896, "epoch": 2147} {"train_loss": -43.81991195678711, "global_step": 259897, "epoch": 2147} {"train_loss": -43.68779373168945, "global_step": 259898, "epoch": 2147} {"train_loss": -43.771018981933594, "global_step": 259899, "epoch": 2147} {"train_loss": -43.24761962890625, "global_step": 259900, "epoch": 2147} {"train_loss": -43.91170883178711, "global_step": 259901, "epoch": 2147} {"train_loss": -43.706626892089844, "global_step": 259902, "epoch": 2147} {"train_loss": -43.667720794677734, "global_step": 259903, "epoch": 2147} {"train_loss": -43.5467643737793, "global_step": 259904, "epoch": 2147} {"train_loss": -43.57500457763672, "global_step": 259905, "epoch": 2147} {"train_loss": -44.00020980834961, "global_step": 259906, "epoch": 2147} {"train_loss": -41.90993763001497, "global_step": 259907, "epoch": 2147, "val_loss": 2675339.75} {"train_loss": -43.63547897338867, "global_step": 259908, "epoch": 2148} {"train_loss": -43.065242767333984, "global_step": 259909, "epoch": 2148} {"train_loss": -42.60721206665039, "global_step": 259910, "epoch": 2148} {"train_loss": -42.781314849853516, "global_step": 259911, "epoch": 2148} {"train_loss": -43.4912223815918, "global_step": 259912, "epoch": 2148} {"train_loss": -42.63693618774414, "global_step": 259913, "epoch": 2148} {"train_loss": -40.07358932495117, "global_step": 259914, "epoch": 2148} {"train_loss": -38.74468994140625, "global_step": 259915, "epoch": 2148} {"train_loss": -42.13650131225586, "global_step": 259916, "epoch": 2148} {"train_loss": -41.5748291015625, "global_step": 259917, "epoch": 2148} {"train_loss": -41.29727554321289, "global_step": 259918, "epoch": 2148} {"train_loss": -37.93886947631836, "global_step": 259919, "epoch": 2148} {"train_loss": -37.341670989990234, "global_step": 259920, "epoch": 2148} {"train_loss": -40.55517578125, "global_step": 259921, "epoch": 2148} {"train_loss": -42.92822265625, "global_step": 259922, "epoch": 2148} {"train_loss": -42.249603271484375, "global_step": 259923, "epoch": 2148} {"train_loss": -41.53501510620117, "global_step": 259924, "epoch": 2148} {"train_loss": -43.11014938354492, "global_step": 259925, "epoch": 2148} {"train_loss": -41.48733901977539, "global_step": 259926, "epoch": 2148} {"train_loss": -41.63581466674805, "global_step": 259927, "epoch": 2148} {"train_loss": -43.30080795288086, "global_step": 259928, "epoch": 2148} {"train_loss": -42.07564163208008, "global_step": 259929, "epoch": 2148} {"train_loss": -42.76926040649414, "global_step": 259930, "epoch": 2148} {"train_loss": -42.927764892578125, "global_step": 259931, "epoch": 2148} {"train_loss": -42.02117919921875, "global_step": 259932, "epoch": 2148} {"train_loss": -43.363643646240234, "global_step": 259933, "epoch": 2148} {"train_loss": -41.58530807495117, "global_step": 259934, "epoch": 2148} {"train_loss": -42.87172317504883, "global_step": 259935, "epoch": 2148} {"train_loss": -42.05210494995117, "global_step": 259936, "epoch": 2148} {"train_loss": -43.18388748168945, "global_step": 259937, "epoch": 2148} {"train_loss": -42.77949905395508, "global_step": 259938, "epoch": 2148} {"train_loss": -42.490108489990234, "global_step": 259939, "epoch": 2148} {"train_loss": -43.363712310791016, "global_step": 259940, "epoch": 2148} {"train_loss": -43.091060638427734, "global_step": 259941, "epoch": 2148} {"train_loss": -42.903079986572266, "global_step": 259942, "epoch": 2148} {"train_loss": -42.76404571533203, "global_step": 259943, "epoch": 2148} {"train_loss": -43.484432220458984, "global_step": 259944, "epoch": 2148} {"train_loss": -43.20812225341797, "global_step": 259945, "epoch": 2148} {"train_loss": -42.695491790771484, "global_step": 259946, "epoch": 2148} {"train_loss": -43.442787170410156, "global_step": 259947, "epoch": 2148} {"train_loss": -43.39336395263672, "global_step": 259948, "epoch": 2148} {"train_loss": -43.56385803222656, "global_step": 259949, "epoch": 2148} {"train_loss": -43.16659164428711, "global_step": 259950, "epoch": 2148} {"train_loss": -43.78141403198242, "global_step": 259951, "epoch": 2148} {"train_loss": -43.117252349853516, "global_step": 259952, "epoch": 2148} {"train_loss": -43.28350067138672, "global_step": 259953, "epoch": 2148} {"train_loss": -42.83559036254883, "global_step": 259954, "epoch": 2148} {"train_loss": -43.387882232666016, "global_step": 259955, "epoch": 2148} {"train_loss": -43.17572784423828, "global_step": 259956, "epoch": 2148} {"train_loss": -42.85883712768555, "global_step": 259957, "epoch": 2148} {"train_loss": -42.682613372802734, "global_step": 259958, "epoch": 2148} {"train_loss": -42.85374069213867, "global_step": 259959, "epoch": 2148} {"train_loss": -43.48676681518555, "global_step": 259960, "epoch": 2148} {"train_loss": -42.95575714111328, "global_step": 259961, "epoch": 2148} {"train_loss": -42.45261001586914, "global_step": 259962, "epoch": 2148} {"train_loss": -42.445091247558594, "global_step": 259963, "epoch": 2148} {"train_loss": -43.89479446411133, "global_step": 259964, "epoch": 2148} {"train_loss": -41.665401458740234, "global_step": 259965, "epoch": 2148} {"train_loss": -41.20194625854492, "global_step": 259966, "epoch": 2148} {"train_loss": -42.710845947265625, "global_step": 259967, "epoch": 2148} {"train_loss": -43.42851638793945, "global_step": 259968, "epoch": 2148} {"train_loss": -42.442840576171875, "global_step": 259969, "epoch": 2148} {"train_loss": -42.18780517578125, "global_step": 259970, "epoch": 2148} {"train_loss": -43.02598190307617, "global_step": 259971, "epoch": 2148} {"train_loss": -43.69734573364258, "global_step": 259972, "epoch": 2148} {"train_loss": -42.86994552612305, "global_step": 259973, "epoch": 2148} {"train_loss": -43.25844192504883, "global_step": 259974, "epoch": 2148} {"train_loss": -42.59817123413086, "global_step": 259975, "epoch": 2148} {"train_loss": -43.05153274536133, "global_step": 259976, "epoch": 2148} {"train_loss": -43.03514862060547, "global_step": 259977, "epoch": 2148} {"train_loss": -42.913570404052734, "global_step": 259978, "epoch": 2148} {"train_loss": -42.220123291015625, "global_step": 259979, "epoch": 2148} {"train_loss": -41.92671585083008, "global_step": 259980, "epoch": 2148} {"train_loss": -41.5203857421875, "global_step": 259981, "epoch": 2148} {"train_loss": -41.70803451538086, "global_step": 259982, "epoch": 2148} {"train_loss": -42.63720703125, "global_step": 259983, "epoch": 2148} {"train_loss": -43.065425872802734, "global_step": 259984, "epoch": 2148} {"train_loss": -41.45942306518555, "global_step": 259985, "epoch": 2148} {"train_loss": -42.0578727722168, "global_step": 259986, "epoch": 2148} {"train_loss": -42.74385452270508, "global_step": 259987, "epoch": 2148} {"train_loss": -41.14068603515625, "global_step": 259988, "epoch": 2148} {"train_loss": -42.28371047973633, "global_step": 259989, "epoch": 2148} {"train_loss": -42.7103271484375, "global_step": 259990, "epoch": 2148} {"train_loss": -43.601715087890625, "global_step": 259991, "epoch": 2148} {"train_loss": -42.2469482421875, "global_step": 259992, "epoch": 2148} {"train_loss": -42.40229034423828, "global_step": 259993, "epoch": 2148} {"train_loss": -42.421146392822266, "global_step": 259994, "epoch": 2148} {"train_loss": -42.73147201538086, "global_step": 259995, "epoch": 2148} {"train_loss": -42.238346099853516, "global_step": 259996, "epoch": 2148} {"train_loss": -42.68512725830078, "global_step": 259997, "epoch": 2148} {"train_loss": -42.167598724365234, "global_step": 259998, "epoch": 2148} {"train_loss": -41.95051956176758, "global_step": 259999, "epoch": 2148} {"train_loss": -42.68307876586914, "global_step": 260000, "epoch": 2148} {"train_loss": -42.285980224609375, "global_step": 260001, "epoch": 2148} {"train_loss": -42.86997604370117, "global_step": 260002, "epoch": 2148} {"train_loss": -42.446746826171875, "global_step": 260003, "epoch": 2148} {"train_loss": -42.232662200927734, "global_step": 260004, "epoch": 2148} {"train_loss": -43.29679870605469, "global_step": 260005, "epoch": 2148} {"train_loss": -42.50642776489258, "global_step": 260006, "epoch": 2148} {"train_loss": -42.68077087402344, "global_step": 260007, "epoch": 2148} {"train_loss": -42.850337982177734, "global_step": 260008, "epoch": 2148} {"train_loss": -43.44662094116211, "global_step": 260009, "epoch": 2148} {"train_loss": -42.379085540771484, "global_step": 260010, "epoch": 2148} {"train_loss": -41.604713439941406, "global_step": 260011, "epoch": 2148} {"train_loss": -42.997108459472656, "global_step": 260012, "epoch": 2148} {"train_loss": -43.06610107421875, "global_step": 260013, "epoch": 2148} {"train_loss": -42.69807815551758, "global_step": 260014, "epoch": 2148} {"train_loss": -42.362239837646484, "global_step": 260015, "epoch": 2148} {"train_loss": -41.662837982177734, "global_step": 260016, "epoch": 2148} {"train_loss": -40.691650390625, "global_step": 260017, "epoch": 2148} {"train_loss": -41.86202621459961, "global_step": 260018, "epoch": 2148} {"train_loss": -42.2449836730957, "global_step": 260019, "epoch": 2148} {"train_loss": -42.35114669799805, "global_step": 260020, "epoch": 2148} {"train_loss": -41.812705993652344, "global_step": 260021, "epoch": 2148} {"train_loss": -42.722259521484375, "global_step": 260022, "epoch": 2148} {"train_loss": -42.562198638916016, "global_step": 260023, "epoch": 2148} {"train_loss": -41.834877014160156, "global_step": 260024, "epoch": 2148} {"train_loss": -42.85659408569336, "global_step": 260025, "epoch": 2148} {"train_loss": -41.729454040527344, "global_step": 260026, "epoch": 2148} {"train_loss": -41.668582916259766, "global_step": 260027, "epoch": 2148} {"train_loss": -42.44002261831741, "global_step": 260028, "epoch": 2148, "val_loss": 2703321.75} {"train_loss": -41.98154830932617, "global_step": 260029, "epoch": 2149} {"train_loss": -42.49424743652344, "global_step": 260030, "epoch": 2149} {"train_loss": -43.33501052856445, "global_step": 260031, "epoch": 2149} {"train_loss": -43.00931930541992, "global_step": 260032, "epoch": 2149} {"train_loss": -42.57546615600586, "global_step": 260033, "epoch": 2149} {"train_loss": -42.45941162109375, "global_step": 260034, "epoch": 2149} {"train_loss": -43.25655746459961, "global_step": 260035, "epoch": 2149} {"train_loss": -42.90544891357422, "global_step": 260036, "epoch": 2149} {"train_loss": -42.74245071411133, "global_step": 260037, "epoch": 2149} {"train_loss": -42.633758544921875, "global_step": 260038, "epoch": 2149} {"train_loss": -43.12891387939453, "global_step": 260039, "epoch": 2149} {"train_loss": -43.158138275146484, "global_step": 260040, "epoch": 2149} {"train_loss": -43.126365661621094, "global_step": 260041, "epoch": 2149} {"train_loss": -40.76985549926758, "global_step": 260042, "epoch": 2149} {"train_loss": -41.206817626953125, "global_step": 260043, "epoch": 2149} {"train_loss": -42.9103889465332, "global_step": 260044, "epoch": 2149} {"train_loss": -42.35219955444336, "global_step": 260045, "epoch": 2149} {"train_loss": -43.03011703491211, "global_step": 260046, "epoch": 2149} {"train_loss": -42.64680099487305, "global_step": 260047, "epoch": 2149} {"train_loss": -43.077903747558594, "global_step": 260048, "epoch": 2149} {"train_loss": -42.81815719604492, "global_step": 260049, "epoch": 2149} {"train_loss": -42.94926834106445, "global_step": 260050, "epoch": 2149} {"train_loss": -42.42365646362305, "global_step": 260051, "epoch": 2149} {"train_loss": -42.954627990722656, "global_step": 260052, "epoch": 2149} {"train_loss": -42.08736038208008, "global_step": 260053, "epoch": 2149} {"train_loss": -43.361427307128906, "global_step": 260054, "epoch": 2149} {"train_loss": -42.15620422363281, "global_step": 260055, "epoch": 2149} {"train_loss": -42.535762786865234, "global_step": 260056, "epoch": 2149} {"train_loss": -43.3021125793457, "global_step": 260057, "epoch": 2149} {"train_loss": -42.94411849975586, "global_step": 260058, "epoch": 2149} {"train_loss": -42.858211517333984, "global_step": 260059, "epoch": 2149} {"train_loss": -43.296661376953125, "global_step": 260060, "epoch": 2149} {"train_loss": -42.762733459472656, "global_step": 260061, "epoch": 2149} {"train_loss": -43.34648895263672, "global_step": 260062, "epoch": 2149} {"train_loss": -42.988094329833984, "global_step": 260063, "epoch": 2149} {"train_loss": -43.5023193359375, "global_step": 260064, "epoch": 2149} {"train_loss": -43.5837516784668, "global_step": 260065, "epoch": 2149} {"train_loss": -43.50791549682617, "global_step": 260066, "epoch": 2149} {"train_loss": -43.493438720703125, "global_step": 260067, "epoch": 2149} {"train_loss": -43.27712631225586, "global_step": 260068, "epoch": 2149} {"train_loss": -43.39923095703125, "global_step": 260069, "epoch": 2149} {"train_loss": -43.4100227355957, "global_step": 260070, "epoch": 2149} {"train_loss": -43.375423431396484, "global_step": 260071, "epoch": 2149} {"train_loss": -43.32932662963867, "global_step": 260072, "epoch": 2149} {"train_loss": -42.929500579833984, "global_step": 260073, "epoch": 2149} {"train_loss": -43.35136413574219, "global_step": 260074, "epoch": 2149} {"train_loss": -42.75143051147461, "global_step": 260075, "epoch": 2149} {"train_loss": -42.86275863647461, "global_step": 260076, "epoch": 2149} {"train_loss": -42.68967819213867, "global_step": 260077, "epoch": 2149} {"train_loss": -42.960628509521484, "global_step": 260078, "epoch": 2149} {"train_loss": -42.57977294921875, "global_step": 260079, "epoch": 2149} {"train_loss": -43.64348220825195, "global_step": 260080, "epoch": 2149} {"train_loss": -43.97802734375, "global_step": 260081, "epoch": 2149} {"train_loss": -42.55958938598633, "global_step": 260082, "epoch": 2149} {"train_loss": -43.41094970703125, "global_step": 260083, "epoch": 2149} {"train_loss": -43.42277145385742, "global_step": 260084, "epoch": 2149} {"train_loss": -42.439876556396484, "global_step": 260085, "epoch": 2149} {"train_loss": -42.550209045410156, "global_step": 260086, "epoch": 2149} {"train_loss": -43.61320114135742, "global_step": 260087, "epoch": 2149} {"train_loss": -42.09523391723633, "global_step": 260088, "epoch": 2149} {"train_loss": -40.30485916137695, "global_step": 260089, "epoch": 2149} {"train_loss": -42.1576042175293, "global_step": 260090, "epoch": 2149} {"train_loss": -43.215003967285156, "global_step": 260091, "epoch": 2149} {"train_loss": -42.57119369506836, "global_step": 260092, "epoch": 2149} {"train_loss": -41.85588455200195, "global_step": 260093, "epoch": 2149} {"train_loss": -40.53364181518555, "global_step": 260094, "epoch": 2149} {"train_loss": -40.29027557373047, "global_step": 260095, "epoch": 2149} {"train_loss": -42.21369552612305, "global_step": 260096, "epoch": 2149} {"train_loss": -42.24039840698242, "global_step": 260097, "epoch": 2149} {"train_loss": -41.99365234375, "global_step": 260098, "epoch": 2149} {"train_loss": -40.78966522216797, "global_step": 260099, "epoch": 2149} {"train_loss": -41.62557601928711, "global_step": 260100, "epoch": 2149} {"train_loss": -43.18164825439453, "global_step": 260101, "epoch": 2149} {"train_loss": -36.043785095214844, "global_step": 260102, "epoch": 2149} {"train_loss": -41.894439697265625, "global_step": 260103, "epoch": 2149} {"train_loss": -38.473777770996094, "global_step": 260104, "epoch": 2149} {"train_loss": -42.9004020690918, "global_step": 260105, "epoch": 2149} {"train_loss": -41.7623176574707, "global_step": 260106, "epoch": 2149} {"train_loss": -37.084354400634766, "global_step": 260107, "epoch": 2149} {"train_loss": -38.550880432128906, "global_step": 260108, "epoch": 2149} {"train_loss": -40.906063079833984, "global_step": 260109, "epoch": 2149} {"train_loss": -39.41538619995117, "global_step": 260110, "epoch": 2149} {"train_loss": -34.80290985107422, "global_step": 260111, "epoch": 2149} {"train_loss": -30.35249900817871, "global_step": 260112, "epoch": 2149} {"train_loss": -27.8046817779541, "global_step": 260113, "epoch": 2149} {"train_loss": -40.11484909057617, "global_step": 260114, "epoch": 2149} {"train_loss": -40.19149398803711, "global_step": 260115, "epoch": 2149} {"train_loss": -38.94236373901367, "global_step": 260116, "epoch": 2149} {"train_loss": -39.452369689941406, "global_step": 260117, "epoch": 2149} {"train_loss": -38.87716293334961, "global_step": 260118, "epoch": 2149} {"train_loss": -27.67111587524414, "global_step": 260119, "epoch": 2149} {"train_loss": -37.8334846496582, "global_step": 260120, "epoch": 2149} {"train_loss": -38.398929595947266, "global_step": 260121, "epoch": 2149} {"train_loss": 15.549160957336426, "global_step": 260122, "epoch": 2149} {"train_loss": -34.415672302246094, "global_step": 260123, "epoch": 2149} {"train_loss": -28.125, "global_step": 260124, "epoch": 2149} {"train_loss": -26.321353912353516, "global_step": 260125, "epoch": 2149} {"train_loss": -34.36261749267578, "global_step": 260126, "epoch": 2149} {"train_loss": -19.344242095947266, "global_step": 260127, "epoch": 2149} {"train_loss": -33.92951965332031, "global_step": 260128, "epoch": 2149} {"train_loss": -34.76561737060547, "global_step": 260129, "epoch": 2149} {"train_loss": -33.76850509643555, "global_step": 260130, "epoch": 2149} {"train_loss": -13.750642776489258, "global_step": 260131, "epoch": 2149} {"train_loss": -15.386151313781738, "global_step": 260132, "epoch": 2149} {"train_loss": -23.054765701293945, "global_step": 260133, "epoch": 2149} {"train_loss": -30.311365127563477, "global_step": 260134, "epoch": 2149} {"train_loss": -34.26627731323242, "global_step": 260135, "epoch": 2149} {"train_loss": -29.122882843017578, "global_step": 260136, "epoch": 2149} {"train_loss": -28.438648223876953, "global_step": 260137, "epoch": 2149} {"train_loss": -34.4893913269043, "global_step": 260138, "epoch": 2149} {"train_loss": -32.5737190246582, "global_step": 260139, "epoch": 2149} {"train_loss": -32.72101974487305, "global_step": 260140, "epoch": 2149} {"train_loss": -33.43740463256836, "global_step": 260141, "epoch": 2149} {"train_loss": -33.3460807800293, "global_step": 260142, "epoch": 2149} {"train_loss": -35.114166259765625, "global_step": 260143, "epoch": 2149} {"train_loss": -34.381099700927734, "global_step": 260144, "epoch": 2149} {"train_loss": -36.80146789550781, "global_step": 260145, "epoch": 2149} {"train_loss": -33.70923614501953, "global_step": 260146, "epoch": 2149} {"train_loss": -37.24372482299805, "global_step": 260147, "epoch": 2149} {"train_loss": -34.68953323364258, "global_step": 260148, "epoch": 2149} {"train_loss": -38.74035280401056, "global_step": 260149, "epoch": 2149, "val_loss": 2685795.25} {"train_loss": -36.235450744628906, "global_step": 260150, "epoch": 2150} {"train_loss": -36.147674560546875, "global_step": 260151, "epoch": 2150} {"train_loss": -36.48403549194336, "global_step": 260152, "epoch": 2150} {"train_loss": -36.86564254760742, "global_step": 260153, "epoch": 2150} {"train_loss": -35.48382568359375, "global_step": 260154, "epoch": 2150} {"train_loss": -37.073917388916016, "global_step": 260155, "epoch": 2150} {"train_loss": -37.81600570678711, "global_step": 260156, "epoch": 2150} {"train_loss": -36.22673797607422, "global_step": 260157, "epoch": 2150} {"train_loss": -37.08684539794922, "global_step": 260158, "epoch": 2150} {"train_loss": -36.774932861328125, "global_step": 260159, "epoch": 2150} {"train_loss": -37.0476188659668, "global_step": 260160, "epoch": 2150} {"train_loss": -36.90481185913086, "global_step": 260161, "epoch": 2150} {"train_loss": -36.304649353027344, "global_step": 260162, "epoch": 2150} {"train_loss": -36.940731048583984, "global_step": 260163, "epoch": 2150} {"train_loss": -37.012630462646484, "global_step": 260164, "epoch": 2150} {"train_loss": -37.38688278198242, "global_step": 260165, "epoch": 2150} {"train_loss": -37.45033264160156, "global_step": 260166, "epoch": 2150} {"train_loss": -37.66719436645508, "global_step": 260167, "epoch": 2150} {"train_loss": -37.33797073364258, "global_step": 260168, "epoch": 2150} {"train_loss": -37.69865036010742, "global_step": 260169, "epoch": 2150} {"train_loss": -37.278709411621094, "global_step": 260170, "epoch": 2150} {"train_loss": -38.09139633178711, "global_step": 260171, "epoch": 2150} {"train_loss": -38.37392807006836, "global_step": 260172, "epoch": 2150} {"train_loss": -38.40015411376953, "global_step": 260173, "epoch": 2150} {"train_loss": -37.605987548828125, "global_step": 260174, "epoch": 2150} {"train_loss": -38.54911804199219, "global_step": 260175, "epoch": 2150} {"train_loss": -38.24626541137695, "global_step": 260176, "epoch": 2150} {"train_loss": -38.4660758972168, "global_step": 260177, "epoch": 2150} {"train_loss": -38.614418029785156, "global_step": 260178, "epoch": 2150} {"train_loss": -37.6240348815918, "global_step": 260179, "epoch": 2150} {"train_loss": -38.447410583496094, "global_step": 260180, "epoch": 2150} {"train_loss": -39.2689323425293, "global_step": 260181, "epoch": 2150} {"train_loss": -38.29249954223633, "global_step": 260182, "epoch": 2150} {"train_loss": -38.38731384277344, "global_step": 260183, "epoch": 2150} {"train_loss": -38.86916732788086, "global_step": 260184, "epoch": 2150} {"train_loss": -38.989376068115234, "global_step": 260185, "epoch": 2150} {"train_loss": -39.173805236816406, "global_step": 260186, "epoch": 2150} {"train_loss": -38.61482620239258, "global_step": 260187, "epoch": 2150} {"train_loss": -39.0142822265625, "global_step": 260188, "epoch": 2150} {"train_loss": -39.42666244506836, "global_step": 260189, "epoch": 2150} {"train_loss": -39.43907928466797, "global_step": 260190, "epoch": 2150} {"train_loss": -38.601619720458984, "global_step": 260191, "epoch": 2150} {"train_loss": -37.94696807861328, "global_step": 260192, "epoch": 2150} {"train_loss": -38.97199249267578, "global_step": 260193, "epoch": 2150} {"train_loss": -38.968196868896484, "global_step": 260194, "epoch": 2150} {"train_loss": -39.19776153564453, "global_step": 260195, "epoch": 2150} {"train_loss": -39.14716339111328, "global_step": 260196, "epoch": 2150} {"train_loss": -39.689971923828125, "global_step": 260197, "epoch": 2150} {"train_loss": -38.451393127441406, "global_step": 260198, "epoch": 2150} {"train_loss": -39.66913986206055, "global_step": 260199, "epoch": 2150} {"train_loss": -39.13925552368164, "global_step": 260200, "epoch": 2150} {"train_loss": -40.10472106933594, "global_step": 260201, "epoch": 2150} {"train_loss": -39.15775680541992, "global_step": 260202, "epoch": 2150} {"train_loss": -39.44898223876953, "global_step": 260203, "epoch": 2150} {"train_loss": -39.98566818237305, "global_step": 260204, "epoch": 2150} {"train_loss": -39.5857048034668, "global_step": 260205, "epoch": 2150} {"train_loss": -39.865596771240234, "global_step": 260206, "epoch": 2150} {"train_loss": -40.10327911376953, "global_step": 260207, "epoch": 2150} {"train_loss": -40.19733810424805, "global_step": 260208, "epoch": 2150} {"train_loss": -38.503021240234375, "global_step": 260209, "epoch": 2150} {"train_loss": -40.17657470703125, "global_step": 260210, "epoch": 2150} {"train_loss": -38.9882698059082, "global_step": 260211, "epoch": 2150} {"train_loss": -39.66565704345703, "global_step": 260212, "epoch": 2150} {"train_loss": -40.242671966552734, "global_step": 260213, "epoch": 2150} {"train_loss": -40.14912796020508, "global_step": 260214, "epoch": 2150} {"train_loss": -39.88642883300781, "global_step": 260215, "epoch": 2150} {"train_loss": -39.910579681396484, "global_step": 260216, "epoch": 2150} {"train_loss": -39.68006134033203, "global_step": 260217, "epoch": 2150} {"train_loss": -40.12188720703125, "global_step": 260218, "epoch": 2150} {"train_loss": -40.49969482421875, "global_step": 260219, "epoch": 2150} {"train_loss": -40.27393341064453, "global_step": 260220, "epoch": 2150} {"train_loss": -40.232757568359375, "global_step": 260221, "epoch": 2150} {"train_loss": -40.616416931152344, "global_step": 260222, "epoch": 2150} {"train_loss": -39.484676361083984, "global_step": 260223, "epoch": 2150} {"train_loss": -40.21464157104492, "global_step": 260224, "epoch": 2150} {"train_loss": -40.454219818115234, "global_step": 260225, "epoch": 2150} {"train_loss": -40.277259826660156, "global_step": 260226, "epoch": 2150} {"train_loss": -40.57017135620117, "global_step": 260227, "epoch": 2150} {"train_loss": -40.77949142456055, "global_step": 260228, "epoch": 2150} {"train_loss": -40.6795539855957, "global_step": 260229, "epoch": 2150} {"train_loss": -40.70758056640625, "global_step": 260230, "epoch": 2150} {"train_loss": -40.881221771240234, "global_step": 260231, "epoch": 2150} {"train_loss": -40.05615997314453, "global_step": 260232, "epoch": 2150} {"train_loss": -40.76486587524414, "global_step": 260233, "epoch": 2150} {"train_loss": -41.0626106262207, "global_step": 260234, "epoch": 2150} {"train_loss": -40.8775749206543, "global_step": 260235, "epoch": 2150} {"train_loss": -40.9012565612793, "global_step": 260236, "epoch": 2150} {"train_loss": -41.228485107421875, "global_step": 260237, "epoch": 2150} {"train_loss": -40.6052360534668, "global_step": 260238, "epoch": 2150} {"train_loss": -41.12112808227539, "global_step": 260239, "epoch": 2150} {"train_loss": -40.946014404296875, "global_step": 260240, "epoch": 2150} {"train_loss": -41.20508575439453, "global_step": 260241, "epoch": 2150} {"train_loss": -40.8667106628418, "global_step": 260242, "epoch": 2150} {"train_loss": -40.65185546875, "global_step": 260243, "epoch": 2150} {"train_loss": -40.19633865356445, "global_step": 260244, "epoch": 2150} {"train_loss": -41.142452239990234, "global_step": 260245, "epoch": 2150} {"train_loss": -41.143253326416016, "global_step": 260246, "epoch": 2150} {"train_loss": -41.16859436035156, "global_step": 260247, "epoch": 2150} {"train_loss": -40.2394905090332, "global_step": 260248, "epoch": 2150} {"train_loss": -41.142433166503906, "global_step": 260249, "epoch": 2150} {"train_loss": -41.379180908203125, "global_step": 260250, "epoch": 2150} {"train_loss": -41.37500762939453, "global_step": 260251, "epoch": 2150} {"train_loss": -41.63370132446289, "global_step": 260252, "epoch": 2150} {"train_loss": -41.82600021362305, "global_step": 260253, "epoch": 2150} {"train_loss": -40.42812728881836, "global_step": 260254, "epoch": 2150} {"train_loss": -41.08942413330078, "global_step": 260255, "epoch": 2150} {"train_loss": -41.21206283569336, "global_step": 260256, "epoch": 2150} {"train_loss": -41.516082763671875, "global_step": 260257, "epoch": 2150} {"train_loss": -41.54709243774414, "global_step": 260258, "epoch": 2150} {"train_loss": -41.30901336669922, "global_step": 260259, "epoch": 2150} {"train_loss": -40.85329818725586, "global_step": 260260, "epoch": 2150} {"train_loss": -40.8118896484375, "global_step": 260261, "epoch": 2150} {"train_loss": -41.5462760925293, "global_step": 260262, "epoch": 2150} {"train_loss": -41.46183395385742, "global_step": 260263, "epoch": 2150} {"train_loss": -41.8238639831543, "global_step": 260264, "epoch": 2150} {"train_loss": -40.95393371582031, "global_step": 260265, "epoch": 2150} {"train_loss": -41.53419876098633, "global_step": 260266, "epoch": 2150} {"train_loss": -41.63368225097656, "global_step": 260267, "epoch": 2150} {"train_loss": -42.04868698120117, "global_step": 260268, "epoch": 2150} {"train_loss": -42.015037536621094, "global_step": 260269, "epoch": 2150} {"train_loss": -39.52909384483148, "global_step": 260270, "epoch": 2150, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2643657.25} {"train_loss": -41.27418899536133, "global_step": 260271, "epoch": 2151} {"train_loss": -41.86817169189453, "global_step": 260272, "epoch": 2151} {"train_loss": -42.002498626708984, "global_step": 260273, "epoch": 2151} {"train_loss": -41.44984817504883, "global_step": 260274, "epoch": 2151} {"train_loss": -42.18027114868164, "global_step": 260275, "epoch": 2151} {"train_loss": -41.79110336303711, "global_step": 260276, "epoch": 2151} {"train_loss": -41.185970306396484, "global_step": 260277, "epoch": 2151} {"train_loss": -41.528778076171875, "global_step": 260278, "epoch": 2151} {"train_loss": -41.78240966796875, "global_step": 260279, "epoch": 2151} {"train_loss": -42.4805908203125, "global_step": 260280, "epoch": 2151} {"train_loss": -41.981441497802734, "global_step": 260281, "epoch": 2151} {"train_loss": -42.178707122802734, "global_step": 260282, "epoch": 2151} {"train_loss": -42.205841064453125, "global_step": 260283, "epoch": 2151} {"train_loss": -42.549259185791016, "global_step": 260284, "epoch": 2151} {"train_loss": -39.23938751220703, "global_step": 260285, "epoch": 2151} {"train_loss": -41.77305221557617, "global_step": 260286, "epoch": 2151} {"train_loss": -42.37600326538086, "global_step": 260287, "epoch": 2151} {"train_loss": -41.222557067871094, "global_step": 260288, "epoch": 2151} {"train_loss": -42.05935287475586, "global_step": 260289, "epoch": 2151} {"train_loss": -42.404380798339844, "global_step": 260290, "epoch": 2151} {"train_loss": -42.448299407958984, "global_step": 260291, "epoch": 2151} {"train_loss": -41.84732437133789, "global_step": 260292, "epoch": 2151} {"train_loss": -42.57028579711914, "global_step": 260293, "epoch": 2151} {"train_loss": -42.54045486450195, "global_step": 260294, "epoch": 2151} {"train_loss": -42.116756439208984, "global_step": 260295, "epoch": 2151} {"train_loss": -42.05619430541992, "global_step": 260296, "epoch": 2151} {"train_loss": -40.741817474365234, "global_step": 260297, "epoch": 2151} {"train_loss": -42.34005355834961, "global_step": 260298, "epoch": 2151} {"train_loss": -41.57322692871094, "global_step": 260299, "epoch": 2151} {"train_loss": -42.3303108215332, "global_step": 260300, "epoch": 2151} {"train_loss": -42.15616989135742, "global_step": 260301, "epoch": 2151} {"train_loss": -42.05586624145508, "global_step": 260302, "epoch": 2151} {"train_loss": -42.098323822021484, "global_step": 260303, "epoch": 2151} {"train_loss": -42.47917556762695, "global_step": 260304, "epoch": 2151} {"train_loss": -42.58855056762695, "global_step": 260305, "epoch": 2151} {"train_loss": -42.064788818359375, "global_step": 260306, "epoch": 2151} {"train_loss": -42.13594055175781, "global_step": 260307, "epoch": 2151} {"train_loss": -40.51438903808594, "global_step": 260308, "epoch": 2151} {"train_loss": -42.286861419677734, "global_step": 260309, "epoch": 2151} {"train_loss": -41.101078033447266, "global_step": 260310, "epoch": 2151} {"train_loss": -41.79401397705078, "global_step": 260311, "epoch": 2151} {"train_loss": -42.2631721496582, "global_step": 260312, "epoch": 2151} {"train_loss": -42.148380279541016, "global_step": 260313, "epoch": 2151} {"train_loss": -42.12174606323242, "global_step": 260314, "epoch": 2151} {"train_loss": -42.8383674621582, "global_step": 260315, "epoch": 2151} {"train_loss": -41.6378059387207, "global_step": 260316, "epoch": 2151} {"train_loss": -41.58380889892578, "global_step": 260317, "epoch": 2151} {"train_loss": -42.31547927856445, "global_step": 260318, "epoch": 2151} {"train_loss": -42.37115478515625, "global_step": 260319, "epoch": 2151} {"train_loss": -42.430843353271484, "global_step": 260320, "epoch": 2151} {"train_loss": -42.117095947265625, "global_step": 260321, "epoch": 2151} {"train_loss": -42.49874496459961, "global_step": 260322, "epoch": 2151} {"train_loss": -42.463958740234375, "global_step": 260323, "epoch": 2151} {"train_loss": -41.525760650634766, "global_step": 260324, "epoch": 2151} {"train_loss": -42.5909538269043, "global_step": 260325, "epoch": 2151} {"train_loss": -41.94567108154297, "global_step": 260326, "epoch": 2151} {"train_loss": -42.00682067871094, "global_step": 260327, "epoch": 2151} {"train_loss": -41.629764556884766, "global_step": 260328, "epoch": 2151} {"train_loss": -41.46833038330078, "global_step": 260329, "epoch": 2151} {"train_loss": -41.569183349609375, "global_step": 260330, "epoch": 2151} {"train_loss": -40.385379791259766, "global_step": 260331, "epoch": 2151} {"train_loss": -41.1435432434082, "global_step": 260332, "epoch": 2151} {"train_loss": -41.05229568481445, "global_step": 260333, "epoch": 2151} {"train_loss": -41.58364486694336, "global_step": 260334, "epoch": 2151} {"train_loss": -41.61153793334961, "global_step": 260335, "epoch": 2151} {"train_loss": -41.44962692260742, "global_step": 260336, "epoch": 2151} {"train_loss": -42.50870895385742, "global_step": 260337, "epoch": 2151} {"train_loss": -41.71366882324219, "global_step": 260338, "epoch": 2151} {"train_loss": -41.712684631347656, "global_step": 260339, "epoch": 2151} {"train_loss": -42.343788146972656, "global_step": 260340, "epoch": 2151} {"train_loss": -42.121620178222656, "global_step": 260341, "epoch": 2151} {"train_loss": -41.377113342285156, "global_step": 260342, "epoch": 2151} {"train_loss": -42.056610107421875, "global_step": 260343, "epoch": 2151} {"train_loss": -41.27790069580078, "global_step": 260344, "epoch": 2151} {"train_loss": -42.30694580078125, "global_step": 260345, "epoch": 2151} {"train_loss": -42.38454818725586, "global_step": 260346, "epoch": 2151} {"train_loss": -40.02626419067383, "global_step": 260347, "epoch": 2151} {"train_loss": -40.55221176147461, "global_step": 260348, "epoch": 2151} {"train_loss": -41.77467346191406, "global_step": 260349, "epoch": 2151} {"train_loss": -41.30901336669922, "global_step": 260350, "epoch": 2151} {"train_loss": -40.48331832885742, "global_step": 260351, "epoch": 2151} {"train_loss": -41.224910736083984, "global_step": 260352, "epoch": 2151} {"train_loss": -41.04849624633789, "global_step": 260353, "epoch": 2151} {"train_loss": -42.50071334838867, "global_step": 260354, "epoch": 2151} {"train_loss": -41.887290954589844, "global_step": 260355, "epoch": 2151} {"train_loss": -41.96242141723633, "global_step": 260356, "epoch": 2151} {"train_loss": -42.821468353271484, "global_step": 260357, "epoch": 2151} {"train_loss": -42.29118728637695, "global_step": 260358, "epoch": 2151} {"train_loss": -41.943904876708984, "global_step": 260359, "epoch": 2151} {"train_loss": -42.309486389160156, "global_step": 260360, "epoch": 2151} {"train_loss": -42.90704345703125, "global_step": 260361, "epoch": 2151} {"train_loss": -42.04213333129883, "global_step": 260362, "epoch": 2151} {"train_loss": -41.52137756347656, "global_step": 260363, "epoch": 2151} {"train_loss": -42.550472259521484, "global_step": 260364, "epoch": 2151} {"train_loss": -41.9656867980957, "global_step": 260365, "epoch": 2151} {"train_loss": -41.339054107666016, "global_step": 260366, "epoch": 2151} {"train_loss": -41.99277877807617, "global_step": 260367, "epoch": 2151} {"train_loss": -42.23786544799805, "global_step": 260368, "epoch": 2151} {"train_loss": -42.09192657470703, "global_step": 260369, "epoch": 2151} {"train_loss": -42.242103576660156, "global_step": 260370, "epoch": 2151} {"train_loss": -42.804866790771484, "global_step": 260371, "epoch": 2151} {"train_loss": -41.14607620239258, "global_step": 260372, "epoch": 2151} {"train_loss": -40.562042236328125, "global_step": 260373, "epoch": 2151} {"train_loss": -41.69416046142578, "global_step": 260374, "epoch": 2151} {"train_loss": -41.81684112548828, "global_step": 260375, "epoch": 2151} {"train_loss": -39.66706085205078, "global_step": 260376, "epoch": 2151} {"train_loss": -39.3133430480957, "global_step": 260377, "epoch": 2151} {"train_loss": -41.506919860839844, "global_step": 260378, "epoch": 2151} {"train_loss": -41.25338363647461, "global_step": 260379, "epoch": 2151} {"train_loss": -40.16267013549805, "global_step": 260380, "epoch": 2151} {"train_loss": -42.28409957885742, "global_step": 260381, "epoch": 2151} {"train_loss": -41.019405364990234, "global_step": 260382, "epoch": 2151} {"train_loss": -40.035621643066406, "global_step": 260383, "epoch": 2151} {"train_loss": -42.02936935424805, "global_step": 260384, "epoch": 2151} {"train_loss": -40.927364349365234, "global_step": 260385, "epoch": 2151} {"train_loss": -41.39156723022461, "global_step": 260386, "epoch": 2151} {"train_loss": -40.769737243652344, "global_step": 260387, "epoch": 2151} {"train_loss": -37.660858154296875, "global_step": 260388, "epoch": 2151} {"train_loss": -39.35007858276367, "global_step": 260389, "epoch": 2151} {"train_loss": -41.73062515258789, "global_step": 260390, "epoch": 2151} {"train_loss": -41.66655592484908, "global_step": 260391, "epoch": 2151, "val_loss": 2673164.0} {"train_loss": -39.772151947021484, "global_step": 260392, "epoch": 2152} {"train_loss": -41.20366287231445, "global_step": 260393, "epoch": 2152} {"train_loss": -39.89528274536133, "global_step": 260394, "epoch": 2152} {"train_loss": -41.19834518432617, "global_step": 260395, "epoch": 2152} {"train_loss": -38.37392807006836, "global_step": 260396, "epoch": 2152} {"train_loss": -40.49741744995117, "global_step": 260397, "epoch": 2152} {"train_loss": -39.423587799072266, "global_step": 260398, "epoch": 2152} {"train_loss": -40.32664108276367, "global_step": 260399, "epoch": 2152} {"train_loss": -40.604034423828125, "global_step": 260400, "epoch": 2152} {"train_loss": -40.39359664916992, "global_step": 260401, "epoch": 2152} {"train_loss": -41.29781723022461, "global_step": 260402, "epoch": 2152} {"train_loss": -40.03634262084961, "global_step": 260403, "epoch": 2152} {"train_loss": -39.82870101928711, "global_step": 260404, "epoch": 2152} {"train_loss": -40.62519073486328, "global_step": 260405, "epoch": 2152} {"train_loss": -40.79106521606445, "global_step": 260406, "epoch": 2152} {"train_loss": -41.19513702392578, "global_step": 260407, "epoch": 2152} {"train_loss": -41.494422912597656, "global_step": 260408, "epoch": 2152} {"train_loss": -41.02069091796875, "global_step": 260409, "epoch": 2152} {"train_loss": -41.31525421142578, "global_step": 260410, "epoch": 2152} {"train_loss": -41.63747024536133, "global_step": 260411, "epoch": 2152} {"train_loss": -41.41927719116211, "global_step": 260412, "epoch": 2152} {"train_loss": -41.08393096923828, "global_step": 260413, "epoch": 2152} {"train_loss": -41.256591796875, "global_step": 260414, "epoch": 2152} {"train_loss": -40.976436614990234, "global_step": 260415, "epoch": 2152} {"train_loss": -40.62517547607422, "global_step": 260416, "epoch": 2152} {"train_loss": -41.69683837890625, "global_step": 260417, "epoch": 2152} {"train_loss": -41.559669494628906, "global_step": 260418, "epoch": 2152} {"train_loss": -41.58090591430664, "global_step": 260419, "epoch": 2152} {"train_loss": -41.87510299682617, "global_step": 260420, "epoch": 2152} {"train_loss": -41.792354583740234, "global_step": 260421, "epoch": 2152} {"train_loss": -41.3929557800293, "global_step": 260422, "epoch": 2152} {"train_loss": -41.88880920410156, "global_step": 260423, "epoch": 2152} {"train_loss": -42.10414505004883, "global_step": 260424, "epoch": 2152} {"train_loss": -41.5667839050293, "global_step": 260425, "epoch": 2152} {"train_loss": -41.84291076660156, "global_step": 260426, "epoch": 2152} {"train_loss": -42.357479095458984, "global_step": 260427, "epoch": 2152} {"train_loss": -41.73543167114258, "global_step": 260428, "epoch": 2152} {"train_loss": -41.6553955078125, "global_step": 260429, "epoch": 2152} {"train_loss": -42.76710891723633, "global_step": 260430, "epoch": 2152} {"train_loss": -41.88792037963867, "global_step": 260431, "epoch": 2152} {"train_loss": -42.16849899291992, "global_step": 260432, "epoch": 2152} {"train_loss": -42.81220245361328, "global_step": 260433, "epoch": 2152} {"train_loss": -41.4153938293457, "global_step": 260434, "epoch": 2152} {"train_loss": -42.3839111328125, "global_step": 260435, "epoch": 2152} {"train_loss": -41.85272216796875, "global_step": 260436, "epoch": 2152} {"train_loss": -42.188419342041016, "global_step": 260437, "epoch": 2152} {"train_loss": -42.48014450073242, "global_step": 260438, "epoch": 2152} {"train_loss": -39.0191650390625, "global_step": 260439, "epoch": 2152} {"train_loss": -41.82912063598633, "global_step": 260440, "epoch": 2152} {"train_loss": -41.78908157348633, "global_step": 260441, "epoch": 2152} {"train_loss": -42.29026412963867, "global_step": 260442, "epoch": 2152} {"train_loss": -42.12782669067383, "global_step": 260443, "epoch": 2152} {"train_loss": -41.98585891723633, "global_step": 260444, "epoch": 2152} {"train_loss": -39.04653549194336, "global_step": 260445, "epoch": 2152} {"train_loss": -42.97140121459961, "global_step": 260446, "epoch": 2152} {"train_loss": -41.98600387573242, "global_step": 260447, "epoch": 2152} {"train_loss": -42.495635986328125, "global_step": 260448, "epoch": 2152} {"train_loss": -41.80758285522461, "global_step": 260449, "epoch": 2152} {"train_loss": -42.02705764770508, "global_step": 260450, "epoch": 2152} {"train_loss": -41.97126007080078, "global_step": 260451, "epoch": 2152} {"train_loss": -41.69757843017578, "global_step": 260452, "epoch": 2152} {"train_loss": -41.21999740600586, "global_step": 260453, "epoch": 2152} {"train_loss": -41.91591262817383, "global_step": 260454, "epoch": 2152} {"train_loss": -40.91909408569336, "global_step": 260455, "epoch": 2152} {"train_loss": -41.2773551940918, "global_step": 260456, "epoch": 2152} {"train_loss": -41.522884368896484, "global_step": 260457, "epoch": 2152} {"train_loss": -41.31080627441406, "global_step": 260458, "epoch": 2152} {"train_loss": -41.336151123046875, "global_step": 260459, "epoch": 2152} {"train_loss": -42.33201217651367, "global_step": 260460, "epoch": 2152} {"train_loss": -40.852806091308594, "global_step": 260461, "epoch": 2152} {"train_loss": -42.25040817260742, "global_step": 260462, "epoch": 2152} {"train_loss": -42.41555404663086, "global_step": 260463, "epoch": 2152} {"train_loss": -40.01342010498047, "global_step": 260464, "epoch": 2152} {"train_loss": -41.4269905090332, "global_step": 260465, "epoch": 2152} {"train_loss": -42.54268264770508, "global_step": 260466, "epoch": 2152} {"train_loss": -42.0595817565918, "global_step": 260467, "epoch": 2152} {"train_loss": -40.80051803588867, "global_step": 260468, "epoch": 2152} {"train_loss": -42.536556243896484, "global_step": 260469, "epoch": 2152} {"train_loss": -41.83072280883789, "global_step": 260470, "epoch": 2152} {"train_loss": -39.767356872558594, "global_step": 260471, "epoch": 2152} {"train_loss": -41.57686996459961, "global_step": 260472, "epoch": 2152} {"train_loss": -42.26603317260742, "global_step": 260473, "epoch": 2152} {"train_loss": -41.84237289428711, "global_step": 260474, "epoch": 2152} {"train_loss": -42.4920768737793, "global_step": 260475, "epoch": 2152} {"train_loss": -41.8997802734375, "global_step": 260476, "epoch": 2152} {"train_loss": -41.15798568725586, "global_step": 260477, "epoch": 2152} {"train_loss": -41.86375045776367, "global_step": 260478, "epoch": 2152} {"train_loss": -39.622798919677734, "global_step": 260479, "epoch": 2152} {"train_loss": -41.17318344116211, "global_step": 260480, "epoch": 2152} {"train_loss": -42.265350341796875, "global_step": 260481, "epoch": 2152} {"train_loss": -41.63224792480469, "global_step": 260482, "epoch": 2152} {"train_loss": -41.293060302734375, "global_step": 260483, "epoch": 2152} {"train_loss": -40.995365142822266, "global_step": 260484, "epoch": 2152} {"train_loss": -40.1961784362793, "global_step": 260485, "epoch": 2152} {"train_loss": -40.44126510620117, "global_step": 260486, "epoch": 2152} {"train_loss": -40.78548812866211, "global_step": 260487, "epoch": 2152} {"train_loss": -42.199729919433594, "global_step": 260488, "epoch": 2152} {"train_loss": -42.48855972290039, "global_step": 260489, "epoch": 2152} {"train_loss": -41.04023361206055, "global_step": 260490, "epoch": 2152} {"train_loss": -40.98460006713867, "global_step": 260491, "epoch": 2152} {"train_loss": -41.98261642456055, "global_step": 260492, "epoch": 2152} {"train_loss": -39.5073356628418, "global_step": 260493, "epoch": 2152} {"train_loss": -39.5946159362793, "global_step": 260494, "epoch": 2152} {"train_loss": -39.92208480834961, "global_step": 260495, "epoch": 2152} {"train_loss": -42.1856689453125, "global_step": 260496, "epoch": 2152} {"train_loss": -39.80854415893555, "global_step": 260497, "epoch": 2152} {"train_loss": -42.2154655456543, "global_step": 260498, "epoch": 2152} {"train_loss": -40.36990737915039, "global_step": 260499, "epoch": 2152} {"train_loss": -41.05475997924805, "global_step": 260500, "epoch": 2152} {"train_loss": -40.36305236816406, "global_step": 260501, "epoch": 2152} {"train_loss": -40.366268157958984, "global_step": 260502, "epoch": 2152} {"train_loss": -39.279293060302734, "global_step": 260503, "epoch": 2152} {"train_loss": -40.833580017089844, "global_step": 260504, "epoch": 2152} {"train_loss": -41.59153747558594, "global_step": 260505, "epoch": 2152} {"train_loss": -38.94429397583008, "global_step": 260506, "epoch": 2152} {"train_loss": -40.55701446533203, "global_step": 260507, "epoch": 2152} {"train_loss": -41.35061264038086, "global_step": 260508, "epoch": 2152} {"train_loss": -40.20267868041992, "global_step": 260509, "epoch": 2152} {"train_loss": -41.57699203491211, "global_step": 260510, "epoch": 2152} {"train_loss": -41.13099670410156, "global_step": 260511, "epoch": 2152} {"train_loss": -41.25407229967354, "global_step": 260512, "epoch": 2152, "val_loss": 2664190.75} {"train_loss": -42.105560302734375, "global_step": 260513, "epoch": 2153} {"train_loss": -41.31296157836914, "global_step": 260514, "epoch": 2153} {"train_loss": -41.69441223144531, "global_step": 260515, "epoch": 2153} {"train_loss": -40.911590576171875, "global_step": 260516, "epoch": 2153} {"train_loss": -39.89970016479492, "global_step": 260517, "epoch": 2153} {"train_loss": -42.000465393066406, "global_step": 260518, "epoch": 2153} {"train_loss": -40.11277389526367, "global_step": 260519, "epoch": 2153} {"train_loss": -42.3524284362793, "global_step": 260520, "epoch": 2153} {"train_loss": -40.20064926147461, "global_step": 260521, "epoch": 2153} {"train_loss": -41.45734786987305, "global_step": 260522, "epoch": 2153} {"train_loss": -42.30399703979492, "global_step": 260523, "epoch": 2153} {"train_loss": -41.414791107177734, "global_step": 260524, "epoch": 2153} {"train_loss": -40.96510314941406, "global_step": 260525, "epoch": 2153} {"train_loss": -41.89658737182617, "global_step": 260526, "epoch": 2153} {"train_loss": -42.39547348022461, "global_step": 260527, "epoch": 2153} {"train_loss": -39.82359313964844, "global_step": 260528, "epoch": 2153} {"train_loss": -41.608985900878906, "global_step": 260529, "epoch": 2153} {"train_loss": -41.459869384765625, "global_step": 260530, "epoch": 2153} {"train_loss": -42.78767776489258, "global_step": 260531, "epoch": 2153} {"train_loss": -42.09922409057617, "global_step": 260532, "epoch": 2153} {"train_loss": -42.31924057006836, "global_step": 260533, "epoch": 2153} {"train_loss": -39.64333724975586, "global_step": 260534, "epoch": 2153} {"train_loss": -41.941139221191406, "global_step": 260535, "epoch": 2153} {"train_loss": -42.2635612487793, "global_step": 260536, "epoch": 2153} {"train_loss": -42.711910247802734, "global_step": 260537, "epoch": 2153} {"train_loss": -39.877655029296875, "global_step": 260538, "epoch": 2153} {"train_loss": -42.53910827636719, "global_step": 260539, "epoch": 2153} {"train_loss": -42.39009475708008, "global_step": 260540, "epoch": 2153} {"train_loss": -41.64640426635742, "global_step": 260541, "epoch": 2153} {"train_loss": -42.18518829345703, "global_step": 260542, "epoch": 2153} {"train_loss": -42.54553985595703, "global_step": 260543, "epoch": 2153} {"train_loss": -41.05990219116211, "global_step": 260544, "epoch": 2153} {"train_loss": -42.790321350097656, "global_step": 260545, "epoch": 2153} {"train_loss": -42.432796478271484, "global_step": 260546, "epoch": 2153} {"train_loss": -42.37372970581055, "global_step": 260547, "epoch": 2153} {"train_loss": -42.21125411987305, "global_step": 260548, "epoch": 2153} {"train_loss": -42.40573501586914, "global_step": 260549, "epoch": 2153} {"train_loss": -42.47589874267578, "global_step": 260550, "epoch": 2153} {"train_loss": -41.73210144042969, "global_step": 260551, "epoch": 2153} {"train_loss": -41.530391693115234, "global_step": 260552, "epoch": 2153} {"train_loss": -42.74845504760742, "global_step": 260553, "epoch": 2153} {"train_loss": -41.81173324584961, "global_step": 260554, "epoch": 2153} {"train_loss": -42.5914306640625, "global_step": 260555, "epoch": 2153} {"train_loss": -41.654476165771484, "global_step": 260556, "epoch": 2153} {"train_loss": -42.5939826965332, "global_step": 260557, "epoch": 2153} {"train_loss": -43.1779899597168, "global_step": 260558, "epoch": 2153} {"train_loss": -42.63745880126953, "global_step": 260559, "epoch": 2153} {"train_loss": -42.56319046020508, "global_step": 260560, "epoch": 2153} {"train_loss": -42.600460052490234, "global_step": 260561, "epoch": 2153} {"train_loss": -42.41376876831055, "global_step": 260562, "epoch": 2153} {"train_loss": -42.296287536621094, "global_step": 260563, "epoch": 2153} {"train_loss": -43.12773513793945, "global_step": 260564, "epoch": 2153} {"train_loss": -42.477020263671875, "global_step": 260565, "epoch": 2153} {"train_loss": -42.597145080566406, "global_step": 260566, "epoch": 2153} {"train_loss": -41.64664840698242, "global_step": 260567, "epoch": 2153} {"train_loss": -42.8233528137207, "global_step": 260568, "epoch": 2153} {"train_loss": -42.694000244140625, "global_step": 260569, "epoch": 2153} {"train_loss": -41.44497299194336, "global_step": 260570, "epoch": 2153} {"train_loss": -42.71234893798828, "global_step": 260571, "epoch": 2153} {"train_loss": -42.63700485229492, "global_step": 260572, "epoch": 2153} {"train_loss": -42.23513412475586, "global_step": 260573, "epoch": 2153} {"train_loss": -42.42616271972656, "global_step": 260574, "epoch": 2153} {"train_loss": -42.67338180541992, "global_step": 260575, "epoch": 2153} {"train_loss": -42.750335693359375, "global_step": 260576, "epoch": 2153} {"train_loss": -42.66716384887695, "global_step": 260577, "epoch": 2153} {"train_loss": -37.562313079833984, "global_step": 260578, "epoch": 2153} {"train_loss": -42.49239730834961, "global_step": 260579, "epoch": 2153} {"train_loss": -43.391998291015625, "global_step": 260580, "epoch": 2153} {"train_loss": -42.71164321899414, "global_step": 260581, "epoch": 2153} {"train_loss": -42.39716720581055, "global_step": 260582, "epoch": 2153} {"train_loss": -42.625640869140625, "global_step": 260583, "epoch": 2153} {"train_loss": -42.51554489135742, "global_step": 260584, "epoch": 2153} {"train_loss": -42.85061264038086, "global_step": 260585, "epoch": 2153} {"train_loss": -38.94936752319336, "global_step": 260586, "epoch": 2153} {"train_loss": -42.348793029785156, "global_step": 260587, "epoch": 2153} {"train_loss": -42.06690216064453, "global_step": 260588, "epoch": 2153} {"train_loss": -42.51909255981445, "global_step": 260589, "epoch": 2153} {"train_loss": -42.395809173583984, "global_step": 260590, "epoch": 2153} {"train_loss": -42.58452224731445, "global_step": 260591, "epoch": 2153} {"train_loss": -42.765846252441406, "global_step": 260592, "epoch": 2153} {"train_loss": -41.78561019897461, "global_step": 260593, "epoch": 2153} {"train_loss": -42.96480941772461, "global_step": 260594, "epoch": 2153} {"train_loss": -42.968570709228516, "global_step": 260595, "epoch": 2153} {"train_loss": -42.67426681518555, "global_step": 260596, "epoch": 2153} {"train_loss": -41.525753021240234, "global_step": 260597, "epoch": 2153} {"train_loss": -42.20442199707031, "global_step": 260598, "epoch": 2153} {"train_loss": -42.37696838378906, "global_step": 260599, "epoch": 2153} {"train_loss": -42.416507720947266, "global_step": 260600, "epoch": 2153} {"train_loss": -42.39625930786133, "global_step": 260601, "epoch": 2153} {"train_loss": -42.750911712646484, "global_step": 260602, "epoch": 2153} {"train_loss": -42.1770133972168, "global_step": 260603, "epoch": 2153} {"train_loss": -42.51640701293945, "global_step": 260604, "epoch": 2153} {"train_loss": -42.313148498535156, "global_step": 260605, "epoch": 2153} {"train_loss": -43.23691177368164, "global_step": 260606, "epoch": 2153} {"train_loss": -42.10048294067383, "global_step": 260607, "epoch": 2153} {"train_loss": -42.45671081542969, "global_step": 260608, "epoch": 2153} {"train_loss": -41.1193962097168, "global_step": 260609, "epoch": 2153} {"train_loss": -42.063201904296875, "global_step": 260610, "epoch": 2153} {"train_loss": -42.162471771240234, "global_step": 260611, "epoch": 2153} {"train_loss": -41.460330963134766, "global_step": 260612, "epoch": 2153} {"train_loss": -42.58479690551758, "global_step": 260613, "epoch": 2153} {"train_loss": -42.302547454833984, "global_step": 260614, "epoch": 2153} {"train_loss": -42.739105224609375, "global_step": 260615, "epoch": 2153} {"train_loss": -42.91018295288086, "global_step": 260616, "epoch": 2153} {"train_loss": -41.65627670288086, "global_step": 260617, "epoch": 2153} {"train_loss": -43.17843246459961, "global_step": 260618, "epoch": 2153} {"train_loss": -42.00050735473633, "global_step": 260619, "epoch": 2153} {"train_loss": -42.61587142944336, "global_step": 260620, "epoch": 2153} {"train_loss": -42.812164306640625, "global_step": 260621, "epoch": 2153} {"train_loss": -42.04214096069336, "global_step": 260622, "epoch": 2153} {"train_loss": -41.41144561767578, "global_step": 260623, "epoch": 2153} {"train_loss": -42.7734489440918, "global_step": 260624, "epoch": 2153} {"train_loss": -42.9043083190918, "global_step": 260625, "epoch": 2153} {"train_loss": -42.81217575073242, "global_step": 260626, "epoch": 2153} {"train_loss": -41.6597900390625, "global_step": 260627, "epoch": 2153} {"train_loss": -42.573089599609375, "global_step": 260628, "epoch": 2153} {"train_loss": -42.3272819519043, "global_step": 260629, "epoch": 2153} {"train_loss": -42.655731201171875, "global_step": 260630, "epoch": 2153} {"train_loss": -41.428592681884766, "global_step": 260631, "epoch": 2153} {"train_loss": -40.293243408203125, "global_step": 260632, "epoch": 2153} {"train_loss": -42.08137874760904, "global_step": 260633, "epoch": 2153, "val_loss": 2627646.0} {"train_loss": -42.93947982788086, "global_step": 260634, "epoch": 2154} {"train_loss": -42.9277458190918, "global_step": 260635, "epoch": 2154} {"train_loss": -42.14248275756836, "global_step": 260636, "epoch": 2154} {"train_loss": -41.0950927734375, "global_step": 260637, "epoch": 2154} {"train_loss": -43.16337585449219, "global_step": 260638, "epoch": 2154} {"train_loss": -43.205787658691406, "global_step": 260639, "epoch": 2154} {"train_loss": -42.28586959838867, "global_step": 260640, "epoch": 2154} {"train_loss": -43.102012634277344, "global_step": 260641, "epoch": 2154} {"train_loss": -43.057472229003906, "global_step": 260642, "epoch": 2154} {"train_loss": -42.07045364379883, "global_step": 260643, "epoch": 2154} {"train_loss": -40.1270866394043, "global_step": 260644, "epoch": 2154} {"train_loss": -42.226863861083984, "global_step": 260645, "epoch": 2154} {"train_loss": -42.523006439208984, "global_step": 260646, "epoch": 2154} {"train_loss": -42.03107452392578, "global_step": 260647, "epoch": 2154} {"train_loss": -41.6192626953125, "global_step": 260648, "epoch": 2154} {"train_loss": -41.78763961791992, "global_step": 260649, "epoch": 2154} {"train_loss": -40.985103607177734, "global_step": 260650, "epoch": 2154} {"train_loss": -41.78328323364258, "global_step": 260651, "epoch": 2154} {"train_loss": -41.906944274902344, "global_step": 260652, "epoch": 2154} {"train_loss": -42.196258544921875, "global_step": 260653, "epoch": 2154} {"train_loss": -42.265567779541016, "global_step": 260654, "epoch": 2154} {"train_loss": -40.94198226928711, "global_step": 260655, "epoch": 2154} {"train_loss": -42.443756103515625, "global_step": 260656, "epoch": 2154} {"train_loss": -40.75581741333008, "global_step": 260657, "epoch": 2154} {"train_loss": -41.430728912353516, "global_step": 260658, "epoch": 2154} {"train_loss": -42.13070297241211, "global_step": 260659, "epoch": 2154} {"train_loss": -41.95372772216797, "global_step": 260660, "epoch": 2154} {"train_loss": -40.766883850097656, "global_step": 260661, "epoch": 2154} {"train_loss": -41.43816375732422, "global_step": 260662, "epoch": 2154} {"train_loss": -41.20431137084961, "global_step": 260663, "epoch": 2154} {"train_loss": -42.286434173583984, "global_step": 260664, "epoch": 2154} {"train_loss": -40.480220794677734, "global_step": 260665, "epoch": 2154} {"train_loss": -40.9484748840332, "global_step": 260666, "epoch": 2154} {"train_loss": -43.454490661621094, "global_step": 260667, "epoch": 2154} {"train_loss": -41.21611404418945, "global_step": 260668, "epoch": 2154} {"train_loss": -43.22515869140625, "global_step": 260669, "epoch": 2154} {"train_loss": -42.603912353515625, "global_step": 260670, "epoch": 2154} {"train_loss": -42.167022705078125, "global_step": 260671, "epoch": 2154} {"train_loss": -42.6912956237793, "global_step": 260672, "epoch": 2154} {"train_loss": -42.73661422729492, "global_step": 260673, "epoch": 2154} {"train_loss": -42.09434509277344, "global_step": 260674, "epoch": 2154} {"train_loss": -41.70882034301758, "global_step": 260675, "epoch": 2154} {"train_loss": -42.16841506958008, "global_step": 260676, "epoch": 2154} {"train_loss": -42.860015869140625, "global_step": 260677, "epoch": 2154} {"train_loss": -41.77122116088867, "global_step": 260678, "epoch": 2154} {"train_loss": -40.764556884765625, "global_step": 260679, "epoch": 2154} {"train_loss": -42.094173431396484, "global_step": 260680, "epoch": 2154} {"train_loss": -41.66660690307617, "global_step": 260681, "epoch": 2154} {"train_loss": -42.25141525268555, "global_step": 260682, "epoch": 2154} {"train_loss": -41.07941436767578, "global_step": 260683, "epoch": 2154} {"train_loss": -43.29032897949219, "global_step": 260684, "epoch": 2154} {"train_loss": -41.71403121948242, "global_step": 260685, "epoch": 2154} {"train_loss": -42.6744499206543, "global_step": 260686, "epoch": 2154} {"train_loss": -42.9242057800293, "global_step": 260687, "epoch": 2154} {"train_loss": -42.2861442565918, "global_step": 260688, "epoch": 2154} {"train_loss": -42.14907455444336, "global_step": 260689, "epoch": 2154} {"train_loss": -41.17367172241211, "global_step": 260690, "epoch": 2154} {"train_loss": -42.986061096191406, "global_step": 260691, "epoch": 2154} {"train_loss": -38.0140495300293, "global_step": 260692, "epoch": 2154} {"train_loss": -42.4948844909668, "global_step": 260693, "epoch": 2154} {"train_loss": -43.12736129760742, "global_step": 260694, "epoch": 2154} {"train_loss": -42.4603271484375, "global_step": 260695, "epoch": 2154} {"train_loss": -43.040992736816406, "global_step": 260696, "epoch": 2154} {"train_loss": -43.22025680541992, "global_step": 260697, "epoch": 2154} {"train_loss": -42.29819869995117, "global_step": 260698, "epoch": 2154} {"train_loss": -41.58600997924805, "global_step": 260699, "epoch": 2154} {"train_loss": -42.79246139526367, "global_step": 260700, "epoch": 2154} {"train_loss": -43.456207275390625, "global_step": 260701, "epoch": 2154} {"train_loss": -42.35193634033203, "global_step": 260702, "epoch": 2154} {"train_loss": -40.16575241088867, "global_step": 260703, "epoch": 2154} {"train_loss": -42.708595275878906, "global_step": 260704, "epoch": 2154} {"train_loss": -42.99699020385742, "global_step": 260705, "epoch": 2154} {"train_loss": -42.38971710205078, "global_step": 260706, "epoch": 2154} {"train_loss": -43.20132827758789, "global_step": 260707, "epoch": 2154} {"train_loss": -43.01227569580078, "global_step": 260708, "epoch": 2154} {"train_loss": -42.96064376831055, "global_step": 260709, "epoch": 2154} {"train_loss": -42.79189682006836, "global_step": 260710, "epoch": 2154} {"train_loss": -42.86372375488281, "global_step": 260711, "epoch": 2154} {"train_loss": -43.02244186401367, "global_step": 260712, "epoch": 2154} {"train_loss": -42.49767303466797, "global_step": 260713, "epoch": 2154} {"train_loss": -42.812496185302734, "global_step": 260714, "epoch": 2154} {"train_loss": -42.12905502319336, "global_step": 260715, "epoch": 2154} {"train_loss": -42.93327713012695, "global_step": 260716, "epoch": 2154} {"train_loss": -43.29021072387695, "global_step": 260717, "epoch": 2154} {"train_loss": -43.511390686035156, "global_step": 260718, "epoch": 2154} {"train_loss": -43.341766357421875, "global_step": 260719, "epoch": 2154} {"train_loss": -42.748382568359375, "global_step": 260720, "epoch": 2154} {"train_loss": -43.352481842041016, "global_step": 260721, "epoch": 2154} {"train_loss": -42.75252914428711, "global_step": 260722, "epoch": 2154} {"train_loss": -42.5098876953125, "global_step": 260723, "epoch": 2154} {"train_loss": -42.76978302001953, "global_step": 260724, "epoch": 2154} {"train_loss": -43.0587043762207, "global_step": 260725, "epoch": 2154} {"train_loss": -43.09943771362305, "global_step": 260726, "epoch": 2154} {"train_loss": -41.41805648803711, "global_step": 260727, "epoch": 2154} {"train_loss": -39.80906295776367, "global_step": 260728, "epoch": 2154} {"train_loss": -39.4163932800293, "global_step": 260729, "epoch": 2154} {"train_loss": -42.604949951171875, "global_step": 260730, "epoch": 2154} {"train_loss": -40.36865997314453, "global_step": 260731, "epoch": 2154} {"train_loss": -42.489559173583984, "global_step": 260732, "epoch": 2154} {"train_loss": -40.149959564208984, "global_step": 260733, "epoch": 2154} {"train_loss": -40.870967864990234, "global_step": 260734, "epoch": 2154} {"train_loss": -41.31869888305664, "global_step": 260735, "epoch": 2154} {"train_loss": -41.6561279296875, "global_step": 260736, "epoch": 2154} {"train_loss": -40.491363525390625, "global_step": 260737, "epoch": 2154} {"train_loss": -37.972511291503906, "global_step": 260738, "epoch": 2154} {"train_loss": -40.60390853881836, "global_step": 260739, "epoch": 2154} {"train_loss": -42.239803314208984, "global_step": 260740, "epoch": 2154} {"train_loss": -38.061279296875, "global_step": 260741, "epoch": 2154} {"train_loss": -30.565216064453125, "global_step": 260742, "epoch": 2154} {"train_loss": -28.276575088500977, "global_step": 260743, "epoch": 2154} {"train_loss": -34.871376037597656, "global_step": 260744, "epoch": 2154} {"train_loss": -36.325199127197266, "global_step": 260745, "epoch": 2154} {"train_loss": -37.0152473449707, "global_step": 260746, "epoch": 2154} {"train_loss": -34.0694580078125, "global_step": 260747, "epoch": 2154} {"train_loss": -38.44556427001953, "global_step": 260748, "epoch": 2154} {"train_loss": -37.15974044799805, "global_step": 260749, "epoch": 2154} {"train_loss": -39.63617706298828, "global_step": 260750, "epoch": 2154} {"train_loss": -40.551082611083984, "global_step": 260751, "epoch": 2154} {"train_loss": -37.675174713134766, "global_step": 260752, "epoch": 2154} {"train_loss": -39.49776077270508, "global_step": 260753, "epoch": 2154} {"train_loss": -41.432133461818225, "global_step": 260754, "epoch": 2154, "val_loss": 2638670.25} {"train_loss": -40.19080352783203, "global_step": 260755, "epoch": 2155} {"train_loss": -40.730018615722656, "global_step": 260756, "epoch": 2155} {"train_loss": -40.468563079833984, "global_step": 260757, "epoch": 2155} {"train_loss": -40.65845489501953, "global_step": 260758, "epoch": 2155} {"train_loss": -39.81293869018555, "global_step": 260759, "epoch": 2155} {"train_loss": -40.72618103027344, "global_step": 260760, "epoch": 2155} {"train_loss": -40.80845260620117, "global_step": 260761, "epoch": 2155} {"train_loss": -40.41878890991211, "global_step": 260762, "epoch": 2155} {"train_loss": -40.21080017089844, "global_step": 260763, "epoch": 2155} {"train_loss": -40.502037048339844, "global_step": 260764, "epoch": 2155} {"train_loss": -41.8604621887207, "global_step": 260765, "epoch": 2155} {"train_loss": -39.63505172729492, "global_step": 260766, "epoch": 2155} {"train_loss": -41.4577522277832, "global_step": 260767, "epoch": 2155} {"train_loss": -39.29386520385742, "global_step": 260768, "epoch": 2155} {"train_loss": -40.871158599853516, "global_step": 260769, "epoch": 2155} {"train_loss": -41.61216354370117, "global_step": 260770, "epoch": 2155} {"train_loss": -40.373165130615234, "global_step": 260771, "epoch": 2155} {"train_loss": -41.094024658203125, "global_step": 260772, "epoch": 2155} {"train_loss": -41.45874786376953, "global_step": 260773, "epoch": 2155} {"train_loss": -40.8965950012207, "global_step": 260774, "epoch": 2155} {"train_loss": -42.197364807128906, "global_step": 260775, "epoch": 2155} {"train_loss": -41.675716400146484, "global_step": 260776, "epoch": 2155} {"train_loss": -41.724185943603516, "global_step": 260777, "epoch": 2155} {"train_loss": -42.11642074584961, "global_step": 260778, "epoch": 2155} {"train_loss": -42.15239334106445, "global_step": 260779, "epoch": 2155} {"train_loss": -42.00410842895508, "global_step": 260780, "epoch": 2155} {"train_loss": -41.97158432006836, "global_step": 260781, "epoch": 2155} {"train_loss": -42.1186637878418, "global_step": 260782, "epoch": 2155} {"train_loss": -40.98689270019531, "global_step": 260783, "epoch": 2155} {"train_loss": -41.92344284057617, "global_step": 260784, "epoch": 2155} {"train_loss": -41.64923095703125, "global_step": 260785, "epoch": 2155} {"train_loss": -42.169960021972656, "global_step": 260786, "epoch": 2155} {"train_loss": -40.55057907104492, "global_step": 260787, "epoch": 2155} {"train_loss": -41.53876495361328, "global_step": 260788, "epoch": 2155} {"train_loss": -42.10909652709961, "global_step": 260789, "epoch": 2155} {"train_loss": -42.17478561401367, "global_step": 260790, "epoch": 2155} {"train_loss": -42.22233200073242, "global_step": 260791, "epoch": 2155} {"train_loss": -42.453643798828125, "global_step": 260792, "epoch": 2155} {"train_loss": -41.85986328125, "global_step": 260793, "epoch": 2155} {"train_loss": -42.690223693847656, "global_step": 260794, "epoch": 2155} {"train_loss": -42.05903625488281, "global_step": 260795, "epoch": 2155} {"train_loss": -41.504119873046875, "global_step": 260796, "epoch": 2155} {"train_loss": -42.29513168334961, "global_step": 260797, "epoch": 2155} {"train_loss": -42.541168212890625, "global_step": 260798, "epoch": 2155} {"train_loss": -42.390869140625, "global_step": 260799, "epoch": 2155} {"train_loss": -43.18932342529297, "global_step": 260800, "epoch": 2155} {"train_loss": -42.9244384765625, "global_step": 260801, "epoch": 2155} {"train_loss": -42.546424865722656, "global_step": 260802, "epoch": 2155} {"train_loss": -42.13322830200195, "global_step": 260803, "epoch": 2155} {"train_loss": -42.97864532470703, "global_step": 260804, "epoch": 2155} {"train_loss": -43.02764129638672, "global_step": 260805, "epoch": 2155} {"train_loss": -42.729248046875, "global_step": 260806, "epoch": 2155} {"train_loss": -43.082374572753906, "global_step": 260807, "epoch": 2155} {"train_loss": -43.368003845214844, "global_step": 260808, "epoch": 2155} {"train_loss": -42.52229690551758, "global_step": 260809, "epoch": 2155} {"train_loss": -43.108489990234375, "global_step": 260810, "epoch": 2155} {"train_loss": -42.36459732055664, "global_step": 260811, "epoch": 2155} {"train_loss": -43.277122497558594, "global_step": 260812, "epoch": 2155} {"train_loss": -42.90017318725586, "global_step": 260813, "epoch": 2155} {"train_loss": -43.11143112182617, "global_step": 260814, "epoch": 2155} {"train_loss": -41.80250549316406, "global_step": 260815, "epoch": 2155} {"train_loss": -43.07050323486328, "global_step": 260816, "epoch": 2155} {"train_loss": -42.89333724975586, "global_step": 260817, "epoch": 2155} {"train_loss": -42.8570442199707, "global_step": 260818, "epoch": 2155} {"train_loss": -43.48385238647461, "global_step": 260819, "epoch": 2155} {"train_loss": -43.27775955200195, "global_step": 260820, "epoch": 2155} {"train_loss": -43.520809173583984, "global_step": 260821, "epoch": 2155} {"train_loss": -43.551788330078125, "global_step": 260822, "epoch": 2155} {"train_loss": -43.56843185424805, "global_step": 260823, "epoch": 2155} {"train_loss": -42.38505935668945, "global_step": 260824, "epoch": 2155} {"train_loss": -43.025245666503906, "global_step": 260825, "epoch": 2155} {"train_loss": -42.20258712768555, "global_step": 260826, "epoch": 2155} {"train_loss": -43.39834213256836, "global_step": 260827, "epoch": 2155} {"train_loss": -43.402950286865234, "global_step": 260828, "epoch": 2155} {"train_loss": -43.59438705444336, "global_step": 260829, "epoch": 2155} {"train_loss": -43.5935173034668, "global_step": 260830, "epoch": 2155} {"train_loss": -43.05266189575195, "global_step": 260831, "epoch": 2155} {"train_loss": -43.51434326171875, "global_step": 260832, "epoch": 2155} {"train_loss": -43.597652435302734, "global_step": 260833, "epoch": 2155} {"train_loss": -43.835243225097656, "global_step": 260834, "epoch": 2155} {"train_loss": -41.443721771240234, "global_step": 260835, "epoch": 2155} {"train_loss": -43.82255554199219, "global_step": 260836, "epoch": 2155} {"train_loss": -43.5246696472168, "global_step": 260837, "epoch": 2155} {"train_loss": -43.82707595825195, "global_step": 260838, "epoch": 2155} {"train_loss": -43.58794021606445, "global_step": 260839, "epoch": 2155} {"train_loss": -42.22025680541992, "global_step": 260840, "epoch": 2155} {"train_loss": -41.61024475097656, "global_step": 260841, "epoch": 2155} {"train_loss": -42.99631881713867, "global_step": 260842, "epoch": 2155} {"train_loss": -43.10227966308594, "global_step": 260843, "epoch": 2155} {"train_loss": -42.66666793823242, "global_step": 260844, "epoch": 2155} {"train_loss": -42.65895462036133, "global_step": 260845, "epoch": 2155} {"train_loss": -42.889530181884766, "global_step": 260846, "epoch": 2155} {"train_loss": -41.86863327026367, "global_step": 260847, "epoch": 2155} {"train_loss": -43.61125564575195, "global_step": 260848, "epoch": 2155} {"train_loss": -42.33952331542969, "global_step": 260849, "epoch": 2155} {"train_loss": -43.7188835144043, "global_step": 260850, "epoch": 2155} {"train_loss": -42.56496810913086, "global_step": 260851, "epoch": 2155} {"train_loss": -43.00965118408203, "global_step": 260852, "epoch": 2155} {"train_loss": -42.320899963378906, "global_step": 260853, "epoch": 2155} {"train_loss": -40.00635528564453, "global_step": 260854, "epoch": 2155} {"train_loss": -42.0745964050293, "global_step": 260855, "epoch": 2155} {"train_loss": -41.54974365234375, "global_step": 260856, "epoch": 2155} {"train_loss": -41.45844650268555, "global_step": 260857, "epoch": 2155} {"train_loss": -42.38703536987305, "global_step": 260858, "epoch": 2155} {"train_loss": -43.035465240478516, "global_step": 260859, "epoch": 2155} {"train_loss": -42.129085540771484, "global_step": 260860, "epoch": 2155} {"train_loss": -43.130340576171875, "global_step": 260861, "epoch": 2155} {"train_loss": -42.0428352355957, "global_step": 260862, "epoch": 2155} {"train_loss": -42.52000045776367, "global_step": 260863, "epoch": 2155} {"train_loss": -42.314788818359375, "global_step": 260864, "epoch": 2155} {"train_loss": -42.95042037963867, "global_step": 260865, "epoch": 2155} {"train_loss": -42.7763671875, "global_step": 260866, "epoch": 2155} {"train_loss": -42.853363037109375, "global_step": 260867, "epoch": 2155} {"train_loss": -42.380916595458984, "global_step": 260868, "epoch": 2155} {"train_loss": -43.619991302490234, "global_step": 260869, "epoch": 2155} {"train_loss": -41.91279983520508, "global_step": 260870, "epoch": 2155} {"train_loss": -43.125457763671875, "global_step": 260871, "epoch": 2155} {"train_loss": -43.297607421875, "global_step": 260872, "epoch": 2155} {"train_loss": -43.49651336669922, "global_step": 260873, "epoch": 2155} {"train_loss": -42.90157699584961, "global_step": 260874, "epoch": 2155} {"train_loss": -42.29318275136396, "global_step": 260875, "epoch": 2155, "val_loss": 2691412.25} {"train_loss": -42.37028503417969, "global_step": 260876, "epoch": 2156} {"train_loss": -43.07735824584961, "global_step": 260877, "epoch": 2156} {"train_loss": -41.277156829833984, "global_step": 260878, "epoch": 2156} {"train_loss": -40.831207275390625, "global_step": 260879, "epoch": 2156} {"train_loss": -39.234718322753906, "global_step": 260880, "epoch": 2156} {"train_loss": -37.40900802612305, "global_step": 260881, "epoch": 2156} {"train_loss": -34.876895904541016, "global_step": 260882, "epoch": 2156} {"train_loss": -35.998939514160156, "global_step": 260883, "epoch": 2156} {"train_loss": -40.111263275146484, "global_step": 260884, "epoch": 2156} {"train_loss": -39.5673713684082, "global_step": 260885, "epoch": 2156} {"train_loss": -31.18528175354004, "global_step": 260886, "epoch": 2156} {"train_loss": -38.219818115234375, "global_step": 260887, "epoch": 2156} {"train_loss": -41.176876068115234, "global_step": 260888, "epoch": 2156} {"train_loss": -36.665733337402344, "global_step": 260889, "epoch": 2156} {"train_loss": -39.31354904174805, "global_step": 260890, "epoch": 2156} {"train_loss": -40.58577346801758, "global_step": 260891, "epoch": 2156} {"train_loss": -38.7641716003418, "global_step": 260892, "epoch": 2156} {"train_loss": -41.34135437011719, "global_step": 260893, "epoch": 2156} {"train_loss": -39.83304977416992, "global_step": 260894, "epoch": 2156} {"train_loss": -40.032630920410156, "global_step": 260895, "epoch": 2156} {"train_loss": -40.976463317871094, "global_step": 260896, "epoch": 2156} {"train_loss": -39.486228942871094, "global_step": 260897, "epoch": 2156} {"train_loss": -40.878936767578125, "global_step": 260898, "epoch": 2156} {"train_loss": -41.41937255859375, "global_step": 260899, "epoch": 2156} {"train_loss": -41.01465606689453, "global_step": 260900, "epoch": 2156} {"train_loss": -41.736061096191406, "global_step": 260901, "epoch": 2156} {"train_loss": -39.59312057495117, "global_step": 260902, "epoch": 2156} {"train_loss": -42.0256233215332, "global_step": 260903, "epoch": 2156} {"train_loss": -41.737300872802734, "global_step": 260904, "epoch": 2156} {"train_loss": -42.203392028808594, "global_step": 260905, "epoch": 2156} {"train_loss": -42.07316970825195, "global_step": 260906, "epoch": 2156} {"train_loss": -41.55584716796875, "global_step": 260907, "epoch": 2156} {"train_loss": -41.951820373535156, "global_step": 260908, "epoch": 2156} {"train_loss": -42.37665939331055, "global_step": 260909, "epoch": 2156} {"train_loss": -42.43409729003906, "global_step": 260910, "epoch": 2156} {"train_loss": -41.85440444946289, "global_step": 260911, "epoch": 2156} {"train_loss": -42.88489532470703, "global_step": 260912, "epoch": 2156} {"train_loss": -42.357120513916016, "global_step": 260913, "epoch": 2156} {"train_loss": -41.83647155761719, "global_step": 260914, "epoch": 2156} {"train_loss": -43.451560974121094, "global_step": 260915, "epoch": 2156} {"train_loss": -42.40895462036133, "global_step": 260916, "epoch": 2156} {"train_loss": -43.01163101196289, "global_step": 260917, "epoch": 2156} {"train_loss": -42.891944885253906, "global_step": 260918, "epoch": 2156} {"train_loss": -42.75604248046875, "global_step": 260919, "epoch": 2156} {"train_loss": -42.49592971801758, "global_step": 260920, "epoch": 2156} {"train_loss": -42.96220779418945, "global_step": 260921, "epoch": 2156} {"train_loss": -42.827945709228516, "global_step": 260922, "epoch": 2156} {"train_loss": -43.2528076171875, "global_step": 260923, "epoch": 2156} {"train_loss": -42.68861770629883, "global_step": 260924, "epoch": 2156} {"train_loss": -42.438629150390625, "global_step": 260925, "epoch": 2156} {"train_loss": -42.8043098449707, "global_step": 260926, "epoch": 2156} {"train_loss": -43.035953521728516, "global_step": 260927, "epoch": 2156} {"train_loss": -42.731624603271484, "global_step": 260928, "epoch": 2156} {"train_loss": -43.36960983276367, "global_step": 260929, "epoch": 2156} {"train_loss": -43.41102981567383, "global_step": 260930, "epoch": 2156} {"train_loss": -43.5766716003418, "global_step": 260931, "epoch": 2156} {"train_loss": -42.91454315185547, "global_step": 260932, "epoch": 2156} {"train_loss": -43.79852294921875, "global_step": 260933, "epoch": 2156} {"train_loss": -43.182308197021484, "global_step": 260934, "epoch": 2156} {"train_loss": -43.20056915283203, "global_step": 260935, "epoch": 2156} {"train_loss": -43.3956298828125, "global_step": 260936, "epoch": 2156} {"train_loss": -42.389251708984375, "global_step": 260937, "epoch": 2156} {"train_loss": -43.739585876464844, "global_step": 260938, "epoch": 2156} {"train_loss": -43.01229476928711, "global_step": 260939, "epoch": 2156} {"train_loss": -43.67441940307617, "global_step": 260940, "epoch": 2156} {"train_loss": -43.30841827392578, "global_step": 260941, "epoch": 2156} {"train_loss": -43.21632385253906, "global_step": 260942, "epoch": 2156} {"train_loss": -42.57175827026367, "global_step": 260943, "epoch": 2156} {"train_loss": -43.84617233276367, "global_step": 260944, "epoch": 2156} {"train_loss": -43.74862289428711, "global_step": 260945, "epoch": 2156} {"train_loss": -43.45643997192383, "global_step": 260946, "epoch": 2156} {"train_loss": -43.201412200927734, "global_step": 260947, "epoch": 2156} {"train_loss": -43.518043518066406, "global_step": 260948, "epoch": 2156} {"train_loss": -43.56956100463867, "global_step": 260949, "epoch": 2156} {"train_loss": -43.65385437011719, "global_step": 260950, "epoch": 2156} {"train_loss": -43.08534622192383, "global_step": 260951, "epoch": 2156} {"train_loss": -43.59247970581055, "global_step": 260952, "epoch": 2156} {"train_loss": -43.3472785949707, "global_step": 260953, "epoch": 2156} {"train_loss": -43.841243743896484, "global_step": 260954, "epoch": 2156} {"train_loss": -42.96567916870117, "global_step": 260955, "epoch": 2156} {"train_loss": -42.85858917236328, "global_step": 260956, "epoch": 2156} {"train_loss": -43.50051498413086, "global_step": 260957, "epoch": 2156} {"train_loss": -42.165489196777344, "global_step": 260958, "epoch": 2156} {"train_loss": -42.30891799926758, "global_step": 260959, "epoch": 2156} {"train_loss": -43.919227600097656, "global_step": 260960, "epoch": 2156} {"train_loss": -43.372291564941406, "global_step": 260961, "epoch": 2156} {"train_loss": -41.67850875854492, "global_step": 260962, "epoch": 2156} {"train_loss": -43.16151809692383, "global_step": 260963, "epoch": 2156} {"train_loss": -43.501258850097656, "global_step": 260964, "epoch": 2156} {"train_loss": -43.362735748291016, "global_step": 260965, "epoch": 2156} {"train_loss": -43.514312744140625, "global_step": 260966, "epoch": 2156} {"train_loss": -40.1098518371582, "global_step": 260967, "epoch": 2156} {"train_loss": -42.43319320678711, "global_step": 260968, "epoch": 2156} {"train_loss": -39.93290710449219, "global_step": 260969, "epoch": 2156} {"train_loss": -41.98240280151367, "global_step": 260970, "epoch": 2156} {"train_loss": -42.5548210144043, "global_step": 260971, "epoch": 2156} {"train_loss": -42.90944290161133, "global_step": 260972, "epoch": 2156} {"train_loss": -42.3674201965332, "global_step": 260973, "epoch": 2156} {"train_loss": -41.853939056396484, "global_step": 260974, "epoch": 2156} {"train_loss": -42.54232406616211, "global_step": 260975, "epoch": 2156} {"train_loss": -40.392478942871094, "global_step": 260976, "epoch": 2156} {"train_loss": -41.85898971557617, "global_step": 260977, "epoch": 2156} {"train_loss": -38.36481857299805, "global_step": 260978, "epoch": 2156} {"train_loss": -39.98026657104492, "global_step": 260979, "epoch": 2156} {"train_loss": -40.018348693847656, "global_step": 260980, "epoch": 2156} {"train_loss": -42.477516174316406, "global_step": 260981, "epoch": 2156} {"train_loss": -41.8695182800293, "global_step": 260982, "epoch": 2156} {"train_loss": -42.08477783203125, "global_step": 260983, "epoch": 2156} {"train_loss": -41.98122024536133, "global_step": 260984, "epoch": 2156} {"train_loss": -41.60850143432617, "global_step": 260985, "epoch": 2156} {"train_loss": -41.55891799926758, "global_step": 260986, "epoch": 2156} {"train_loss": -37.1657829284668, "global_step": 260987, "epoch": 2156} {"train_loss": -40.14939498901367, "global_step": 260988, "epoch": 2156} {"train_loss": -40.458858489990234, "global_step": 260989, "epoch": 2156} {"train_loss": -41.251319885253906, "global_step": 260990, "epoch": 2156} {"train_loss": -42.71589279174805, "global_step": 260991, "epoch": 2156} {"train_loss": -40.406890869140625, "global_step": 260992, "epoch": 2156} {"train_loss": -39.450782775878906, "global_step": 260993, "epoch": 2156} {"train_loss": -39.48591995239258, "global_step": 260994, "epoch": 2156} {"train_loss": -40.0624885559082, "global_step": 260995, "epoch": 2156} {"train_loss": -41.71369204245323, "global_step": 260996, "epoch": 2156, "val_loss": 2637953.75} {"train_loss": -36.900909423828125, "global_step": 260997, "epoch": 2157} {"train_loss": -35.61370849609375, "global_step": 260998, "epoch": 2157} {"train_loss": -38.90058517456055, "global_step": 260999, "epoch": 2157} {"train_loss": -31.519834518432617, "global_step": 261000, "epoch": 2157} {"train_loss": -36.680152893066406, "global_step": 261001, "epoch": 2157} {"train_loss": -41.977752685546875, "global_step": 261002, "epoch": 2157} {"train_loss": -40.78518295288086, "global_step": 261003, "epoch": 2157} {"train_loss": -39.28206253051758, "global_step": 261004, "epoch": 2157} {"train_loss": -41.08107376098633, "global_step": 261005, "epoch": 2157} {"train_loss": -37.84967803955078, "global_step": 261006, "epoch": 2157} {"train_loss": -39.25087356567383, "global_step": 261007, "epoch": 2157} {"train_loss": -39.69059371948242, "global_step": 261008, "epoch": 2157} {"train_loss": -38.02901077270508, "global_step": 261009, "epoch": 2157} {"train_loss": -39.45606231689453, "global_step": 261010, "epoch": 2157} {"train_loss": -42.188655853271484, "global_step": 261011, "epoch": 2157} {"train_loss": -37.45842361450195, "global_step": 261012, "epoch": 2157} {"train_loss": -36.87043380737305, "global_step": 261013, "epoch": 2157} {"train_loss": -26.123214721679688, "global_step": 261014, "epoch": 2157} {"train_loss": -40.938358306884766, "global_step": 261015, "epoch": 2157} {"train_loss": -37.79423904418945, "global_step": 261016, "epoch": 2157} {"train_loss": -37.832000732421875, "global_step": 261017, "epoch": 2157} {"train_loss": -40.06976318359375, "global_step": 261018, "epoch": 2157} {"train_loss": -36.02544403076172, "global_step": 261019, "epoch": 2157} {"train_loss": -40.50642776489258, "global_step": 261020, "epoch": 2157} {"train_loss": -39.72066879272461, "global_step": 261021, "epoch": 2157} {"train_loss": -39.49440383911133, "global_step": 261022, "epoch": 2157} {"train_loss": -38.98430633544922, "global_step": 261023, "epoch": 2157} {"train_loss": -41.38911056518555, "global_step": 261024, "epoch": 2157} {"train_loss": -37.65132141113281, "global_step": 261025, "epoch": 2157} {"train_loss": -37.8238639831543, "global_step": 261026, "epoch": 2157} {"train_loss": -38.96156692504883, "global_step": 261027, "epoch": 2157} {"train_loss": -32.89667892456055, "global_step": 261028, "epoch": 2157} {"train_loss": -37.71771240234375, "global_step": 261029, "epoch": 2157} {"train_loss": -39.849098205566406, "global_step": 261030, "epoch": 2157} {"train_loss": -39.50774002075195, "global_step": 261031, "epoch": 2157} {"train_loss": -40.942325592041016, "global_step": 261032, "epoch": 2157} {"train_loss": -38.08781051635742, "global_step": 261033, "epoch": 2157} {"train_loss": -41.099395751953125, "global_step": 261034, "epoch": 2157} {"train_loss": -34.50785827636719, "global_step": 261035, "epoch": 2157} {"train_loss": -40.8149299621582, "global_step": 261036, "epoch": 2157} {"train_loss": -41.061553955078125, "global_step": 261037, "epoch": 2157} {"train_loss": -39.1248893737793, "global_step": 261038, "epoch": 2157} {"train_loss": -40.83108139038086, "global_step": 261039, "epoch": 2157} {"train_loss": -40.031150817871094, "global_step": 261040, "epoch": 2157} {"train_loss": -40.149715423583984, "global_step": 261041, "epoch": 2157} {"train_loss": -38.823848724365234, "global_step": 261042, "epoch": 2157} {"train_loss": -40.46088409423828, "global_step": 261043, "epoch": 2157} {"train_loss": -39.55631637573242, "global_step": 261044, "epoch": 2157} {"train_loss": -36.979183197021484, "global_step": 261045, "epoch": 2157} {"train_loss": -39.170406341552734, "global_step": 261046, "epoch": 2157} {"train_loss": -38.75910568237305, "global_step": 261047, "epoch": 2157} {"train_loss": -41.317501068115234, "global_step": 261048, "epoch": 2157} {"train_loss": -40.896907806396484, "global_step": 261049, "epoch": 2157} {"train_loss": -39.490543365478516, "global_step": 261050, "epoch": 2157} {"train_loss": -38.638607025146484, "global_step": 261051, "epoch": 2157} {"train_loss": -35.77729797363281, "global_step": 261052, "epoch": 2157} {"train_loss": -40.87715530395508, "global_step": 261053, "epoch": 2157} {"train_loss": -39.94602584838867, "global_step": 261054, "epoch": 2157} {"train_loss": -40.0828857421875, "global_step": 261055, "epoch": 2157} {"train_loss": -40.82389450073242, "global_step": 261056, "epoch": 2157} {"train_loss": -39.64056396484375, "global_step": 261057, "epoch": 2157} {"train_loss": -40.910621643066406, "global_step": 261058, "epoch": 2157} {"train_loss": -40.362918853759766, "global_step": 261059, "epoch": 2157} {"train_loss": -40.53310012817383, "global_step": 261060, "epoch": 2157} {"train_loss": -40.209537506103516, "global_step": 261061, "epoch": 2157} {"train_loss": -41.208858489990234, "global_step": 261062, "epoch": 2157} {"train_loss": -40.460872650146484, "global_step": 261063, "epoch": 2157} {"train_loss": -41.155250549316406, "global_step": 261064, "epoch": 2157} {"train_loss": -40.955745697021484, "global_step": 261065, "epoch": 2157} {"train_loss": -40.2931022644043, "global_step": 261066, "epoch": 2157} {"train_loss": -40.93714141845703, "global_step": 261067, "epoch": 2157} {"train_loss": -40.99176788330078, "global_step": 261068, "epoch": 2157} {"train_loss": -41.740386962890625, "global_step": 261069, "epoch": 2157} {"train_loss": -40.8476448059082, "global_step": 261070, "epoch": 2157} {"train_loss": -41.5445671081543, "global_step": 261071, "epoch": 2157} {"train_loss": -41.063514709472656, "global_step": 261072, "epoch": 2157} {"train_loss": -41.62263870239258, "global_step": 261073, "epoch": 2157} {"train_loss": -41.919158935546875, "global_step": 261074, "epoch": 2157} {"train_loss": -40.935665130615234, "global_step": 261075, "epoch": 2157} {"train_loss": -41.48427963256836, "global_step": 261076, "epoch": 2157} {"train_loss": -41.400230407714844, "global_step": 261077, "epoch": 2157} {"train_loss": -41.60042190551758, "global_step": 261078, "epoch": 2157} {"train_loss": -41.566104888916016, "global_step": 261079, "epoch": 2157} {"train_loss": -41.45281219482422, "global_step": 261080, "epoch": 2157} {"train_loss": -42.03725051879883, "global_step": 261081, "epoch": 2157} {"train_loss": -42.2014045715332, "global_step": 261082, "epoch": 2157} {"train_loss": -42.03330612182617, "global_step": 261083, "epoch": 2157} {"train_loss": -42.27815628051758, "global_step": 261084, "epoch": 2157} {"train_loss": -41.97307586669922, "global_step": 261085, "epoch": 2157} {"train_loss": -42.395469665527344, "global_step": 261086, "epoch": 2157} {"train_loss": -41.88306427001953, "global_step": 261087, "epoch": 2157} {"train_loss": -42.2952995300293, "global_step": 261088, "epoch": 2157} {"train_loss": -42.18239974975586, "global_step": 261089, "epoch": 2157} {"train_loss": -40.80643844604492, "global_step": 261090, "epoch": 2157} {"train_loss": -42.580848693847656, "global_step": 261091, "epoch": 2157} {"train_loss": -42.17601776123047, "global_step": 261092, "epoch": 2157} {"train_loss": -41.51747512817383, "global_step": 261093, "epoch": 2157} {"train_loss": -42.48444747924805, "global_step": 261094, "epoch": 2157} {"train_loss": -41.870853424072266, "global_step": 261095, "epoch": 2157} {"train_loss": -41.69893264770508, "global_step": 261096, "epoch": 2157} {"train_loss": -42.601600646972656, "global_step": 261097, "epoch": 2157} {"train_loss": -41.89811325073242, "global_step": 261098, "epoch": 2157} {"train_loss": -42.18019485473633, "global_step": 261099, "epoch": 2157} {"train_loss": -42.4925537109375, "global_step": 261100, "epoch": 2157} {"train_loss": -42.23916244506836, "global_step": 261101, "epoch": 2157} {"train_loss": -42.696632385253906, "global_step": 261102, "epoch": 2157} {"train_loss": -42.45376205444336, "global_step": 261103, "epoch": 2157} {"train_loss": -42.66740417480469, "global_step": 261104, "epoch": 2157} {"train_loss": -42.84475326538086, "global_step": 261105, "epoch": 2157} {"train_loss": -42.75147247314453, "global_step": 261106, "epoch": 2157} {"train_loss": -42.99833679199219, "global_step": 261107, "epoch": 2157} {"train_loss": -41.87221908569336, "global_step": 261108, "epoch": 2157} {"train_loss": -42.178741455078125, "global_step": 261109, "epoch": 2157} {"train_loss": -42.83783721923828, "global_step": 261110, "epoch": 2157} {"train_loss": -42.80985641479492, "global_step": 261111, "epoch": 2157} {"train_loss": -41.28447341918945, "global_step": 261112, "epoch": 2157} {"train_loss": -43.129573822021484, "global_step": 261113, "epoch": 2157} {"train_loss": -43.024078369140625, "global_step": 261114, "epoch": 2157} {"train_loss": -42.76185989379883, "global_step": 261115, "epoch": 2157} {"train_loss": -42.8220100402832, "global_step": 261116, "epoch": 2157} {"train_loss": -40.29628944396973, "global_step": 261117, "epoch": 2157, "val_loss": 2592809.75} {"train_loss": -42.99917221069336, "global_step": 261118, "epoch": 2158} {"train_loss": -43.00204086303711, "global_step": 261119, "epoch": 2158} {"train_loss": -43.0865592956543, "global_step": 261120, "epoch": 2158} {"train_loss": -43.172401428222656, "global_step": 261121, "epoch": 2158} {"train_loss": -43.29291534423828, "global_step": 261122, "epoch": 2158} {"train_loss": -43.03656768798828, "global_step": 261123, "epoch": 2158} {"train_loss": -43.150814056396484, "global_step": 261124, "epoch": 2158} {"train_loss": -43.43421173095703, "global_step": 261125, "epoch": 2158} {"train_loss": -42.60850143432617, "global_step": 261126, "epoch": 2158} {"train_loss": -42.02937698364258, "global_step": 261127, "epoch": 2158} {"train_loss": -43.280181884765625, "global_step": 261128, "epoch": 2158} {"train_loss": -43.707767486572266, "global_step": 261129, "epoch": 2158} {"train_loss": -43.11951446533203, "global_step": 261130, "epoch": 2158} {"train_loss": -43.716278076171875, "global_step": 261131, "epoch": 2158} {"train_loss": -43.32234191894531, "global_step": 261132, "epoch": 2158} {"train_loss": -43.250282287597656, "global_step": 261133, "epoch": 2158} {"train_loss": -42.7534065246582, "global_step": 261134, "epoch": 2158} {"train_loss": -42.92429733276367, "global_step": 261135, "epoch": 2158} {"train_loss": -43.6385612487793, "global_step": 261136, "epoch": 2158} {"train_loss": -43.53860855102539, "global_step": 261137, "epoch": 2158} {"train_loss": -42.45583724975586, "global_step": 261138, "epoch": 2158} {"train_loss": -43.06355667114258, "global_step": 261139, "epoch": 2158} {"train_loss": -43.36725616455078, "global_step": 261140, "epoch": 2158} {"train_loss": -42.638153076171875, "global_step": 261141, "epoch": 2158} {"train_loss": -43.464908599853516, "global_step": 261142, "epoch": 2158} {"train_loss": -43.4897346496582, "global_step": 261143, "epoch": 2158} {"train_loss": -42.8646240234375, "global_step": 261144, "epoch": 2158} {"train_loss": -42.081912994384766, "global_step": 261145, "epoch": 2158} {"train_loss": -40.45278549194336, "global_step": 261146, "epoch": 2158} {"train_loss": -40.16868209838867, "global_step": 261147, "epoch": 2158} {"train_loss": -37.62527084350586, "global_step": 261148, "epoch": 2158} {"train_loss": -38.06867599487305, "global_step": 261149, "epoch": 2158} {"train_loss": -40.262699127197266, "global_step": 261150, "epoch": 2158} {"train_loss": -41.27729415893555, "global_step": 261151, "epoch": 2158} {"train_loss": -37.15781784057617, "global_step": 261152, "epoch": 2158} {"train_loss": -39.45986557006836, "global_step": 261153, "epoch": 2158} {"train_loss": -40.92857360839844, "global_step": 261154, "epoch": 2158} {"train_loss": -39.381195068359375, "global_step": 261155, "epoch": 2158} {"train_loss": -41.132408142089844, "global_step": 261156, "epoch": 2158} {"train_loss": -39.85820388793945, "global_step": 261157, "epoch": 2158} {"train_loss": -41.27558517456055, "global_step": 261158, "epoch": 2158} {"train_loss": -42.160057067871094, "global_step": 261159, "epoch": 2158} {"train_loss": -39.75443649291992, "global_step": 261160, "epoch": 2158} {"train_loss": -40.98564147949219, "global_step": 261161, "epoch": 2158} {"train_loss": -41.55487823486328, "global_step": 261162, "epoch": 2158} {"train_loss": -41.927040100097656, "global_step": 261163, "epoch": 2158} {"train_loss": -41.840919494628906, "global_step": 261164, "epoch": 2158} {"train_loss": -41.1748161315918, "global_step": 261165, "epoch": 2158} {"train_loss": -40.27301025390625, "global_step": 261166, "epoch": 2158} {"train_loss": -42.761077880859375, "global_step": 261167, "epoch": 2158} {"train_loss": -42.24101638793945, "global_step": 261168, "epoch": 2158} {"train_loss": -41.41168212890625, "global_step": 261169, "epoch": 2158} {"train_loss": -41.25002670288086, "global_step": 261170, "epoch": 2158} {"train_loss": -42.20644760131836, "global_step": 261171, "epoch": 2158} {"train_loss": -42.66009521484375, "global_step": 261172, "epoch": 2158} {"train_loss": -42.28025817871094, "global_step": 261173, "epoch": 2158} {"train_loss": -42.25395584106445, "global_step": 261174, "epoch": 2158} {"train_loss": -41.59305191040039, "global_step": 261175, "epoch": 2158} {"train_loss": -41.70737838745117, "global_step": 261176, "epoch": 2158} {"train_loss": -42.265716552734375, "global_step": 261177, "epoch": 2158} {"train_loss": -42.01276397705078, "global_step": 261178, "epoch": 2158} {"train_loss": -41.6898078918457, "global_step": 261179, "epoch": 2158} {"train_loss": -42.2431640625, "global_step": 261180, "epoch": 2158} {"train_loss": -42.68073272705078, "global_step": 261181, "epoch": 2158} {"train_loss": -42.54155349731445, "global_step": 261182, "epoch": 2158} {"train_loss": -42.526268005371094, "global_step": 261183, "epoch": 2158} {"train_loss": -42.73896408081055, "global_step": 261184, "epoch": 2158} {"train_loss": -42.490848541259766, "global_step": 261185, "epoch": 2158} {"train_loss": -42.3356819152832, "global_step": 261186, "epoch": 2158} {"train_loss": -41.76444625854492, "global_step": 261187, "epoch": 2158} {"train_loss": -41.1820068359375, "global_step": 261188, "epoch": 2158} {"train_loss": -41.330257415771484, "global_step": 261189, "epoch": 2158} {"train_loss": -43.10336685180664, "global_step": 261190, "epoch": 2158} {"train_loss": -41.49677658081055, "global_step": 261191, "epoch": 2158} {"train_loss": -42.2961540222168, "global_step": 261192, "epoch": 2158} {"train_loss": -42.84165954589844, "global_step": 261193, "epoch": 2158} {"train_loss": -41.44509506225586, "global_step": 261194, "epoch": 2158} {"train_loss": -41.69660186767578, "global_step": 261195, "epoch": 2158} {"train_loss": -41.95130157470703, "global_step": 261196, "epoch": 2158} {"train_loss": -42.10084915161133, "global_step": 261197, "epoch": 2158} {"train_loss": -42.569087982177734, "global_step": 261198, "epoch": 2158} {"train_loss": -42.4630126953125, "global_step": 261199, "epoch": 2158} {"train_loss": -42.6722526550293, "global_step": 261200, "epoch": 2158} {"train_loss": -42.41040802001953, "global_step": 261201, "epoch": 2158} {"train_loss": -42.9402961730957, "global_step": 261202, "epoch": 2158} {"train_loss": -42.58871078491211, "global_step": 261203, "epoch": 2158} {"train_loss": -42.166343688964844, "global_step": 261204, "epoch": 2158} {"train_loss": -43.11924362182617, "global_step": 261205, "epoch": 2158} {"train_loss": -42.19579315185547, "global_step": 261206, "epoch": 2158} {"train_loss": -43.20009994506836, "global_step": 261207, "epoch": 2158} {"train_loss": -42.45945358276367, "global_step": 261208, "epoch": 2158} {"train_loss": -42.91449737548828, "global_step": 261209, "epoch": 2158} {"train_loss": -43.43058395385742, "global_step": 261210, "epoch": 2158} {"train_loss": -41.940673828125, "global_step": 261211, "epoch": 2158} {"train_loss": -43.00536346435547, "global_step": 261212, "epoch": 2158} {"train_loss": -43.66225814819336, "global_step": 261213, "epoch": 2158} {"train_loss": -42.85504150390625, "global_step": 261214, "epoch": 2158} {"train_loss": -42.88368606567383, "global_step": 261215, "epoch": 2158} {"train_loss": -43.32027816772461, "global_step": 261216, "epoch": 2158} {"train_loss": -42.890602111816406, "global_step": 261217, "epoch": 2158} {"train_loss": -42.47846984863281, "global_step": 261218, "epoch": 2158} {"train_loss": -43.07517623901367, "global_step": 261219, "epoch": 2158} {"train_loss": -43.13922882080078, "global_step": 261220, "epoch": 2158} {"train_loss": -42.83134841918945, "global_step": 261221, "epoch": 2158} {"train_loss": -42.8887825012207, "global_step": 261222, "epoch": 2158} {"train_loss": -41.341434478759766, "global_step": 261223, "epoch": 2158} {"train_loss": -42.792171478271484, "global_step": 261224, "epoch": 2158} {"train_loss": -43.50753402709961, "global_step": 261225, "epoch": 2158} {"train_loss": -42.8929328918457, "global_step": 261226, "epoch": 2158} {"train_loss": -43.244686126708984, "global_step": 261227, "epoch": 2158} {"train_loss": -42.46711349487305, "global_step": 261228, "epoch": 2158} {"train_loss": -43.3642692565918, "global_step": 261229, "epoch": 2158} {"train_loss": -42.82346725463867, "global_step": 261230, "epoch": 2158} {"train_loss": -42.477664947509766, "global_step": 261231, "epoch": 2158} {"train_loss": -42.89237594604492, "global_step": 261232, "epoch": 2158} {"train_loss": -41.84077835083008, "global_step": 261233, "epoch": 2158} {"train_loss": -42.53535079956055, "global_step": 261234, "epoch": 2158} {"train_loss": -42.219093322753906, "global_step": 261235, "epoch": 2158} {"train_loss": -43.042415618896484, "global_step": 261236, "epoch": 2158} {"train_loss": -42.48417282104492, "global_step": 261237, "epoch": 2158} {"train_loss": -42.22060082175515, "global_step": 261238, "epoch": 2158, "val_loss": 2676058.75} {"train_loss": -40.67073440551758, "global_step": 261239, "epoch": 2159} {"train_loss": -41.056339263916016, "global_step": 261240, "epoch": 2159} {"train_loss": -38.17421340942383, "global_step": 261241, "epoch": 2159} {"train_loss": -35.36665725708008, "global_step": 261242, "epoch": 2159} {"train_loss": -31.36952018737793, "global_step": 261243, "epoch": 2159} {"train_loss": -35.35260772705078, "global_step": 261244, "epoch": 2159} {"train_loss": -41.08549118041992, "global_step": 261245, "epoch": 2159} {"train_loss": -40.32234573364258, "global_step": 261246, "epoch": 2159} {"train_loss": -39.38262939453125, "global_step": 261247, "epoch": 2159} {"train_loss": -40.57291793823242, "global_step": 261248, "epoch": 2159} {"train_loss": -41.63710403442383, "global_step": 261249, "epoch": 2159} {"train_loss": -41.30426025390625, "global_step": 261250, "epoch": 2159} {"train_loss": -40.98289108276367, "global_step": 261251, "epoch": 2159} {"train_loss": -41.145851135253906, "global_step": 261252, "epoch": 2159} {"train_loss": -40.36600875854492, "global_step": 261253, "epoch": 2159} {"train_loss": -41.28812789916992, "global_step": 261254, "epoch": 2159} {"train_loss": -40.90061569213867, "global_step": 261255, "epoch": 2159} {"train_loss": -41.231014251708984, "global_step": 261256, "epoch": 2159} {"train_loss": -39.15666961669922, "global_step": 261257, "epoch": 2159} {"train_loss": -41.2244873046875, "global_step": 261258, "epoch": 2159} {"train_loss": -41.623138427734375, "global_step": 261259, "epoch": 2159} {"train_loss": -41.38901901245117, "global_step": 261260, "epoch": 2159} {"train_loss": -41.22383499145508, "global_step": 261261, "epoch": 2159} {"train_loss": -41.2591667175293, "global_step": 261262, "epoch": 2159} {"train_loss": -41.96995162963867, "global_step": 261263, "epoch": 2159} {"train_loss": -40.204803466796875, "global_step": 261264, "epoch": 2159} {"train_loss": -42.058387756347656, "global_step": 261265, "epoch": 2159} {"train_loss": -41.93389892578125, "global_step": 261266, "epoch": 2159} {"train_loss": -41.297332763671875, "global_step": 261267, "epoch": 2159} {"train_loss": -42.40935134887695, "global_step": 261268, "epoch": 2159} {"train_loss": -41.6090087890625, "global_step": 261269, "epoch": 2159} {"train_loss": -41.69172286987305, "global_step": 261270, "epoch": 2159} {"train_loss": -42.03179931640625, "global_step": 261271, "epoch": 2159} {"train_loss": -42.46834945678711, "global_step": 261272, "epoch": 2159} {"train_loss": -42.17738723754883, "global_step": 261273, "epoch": 2159} {"train_loss": -41.891178131103516, "global_step": 261274, "epoch": 2159} {"train_loss": -41.55689239501953, "global_step": 261275, "epoch": 2159} {"train_loss": -42.20193099975586, "global_step": 261276, "epoch": 2159} {"train_loss": -42.84975814819336, "global_step": 261277, "epoch": 2159} {"train_loss": -42.97855758666992, "global_step": 261278, "epoch": 2159} {"train_loss": -42.59413528442383, "global_step": 261279, "epoch": 2159} {"train_loss": -43.045448303222656, "global_step": 261280, "epoch": 2159} {"train_loss": -42.53593063354492, "global_step": 261281, "epoch": 2159} {"train_loss": -42.491214752197266, "global_step": 261282, "epoch": 2159} {"train_loss": -42.9361572265625, "global_step": 261283, "epoch": 2159} {"train_loss": -42.37437057495117, "global_step": 261284, "epoch": 2159} {"train_loss": -42.37702178955078, "global_step": 261285, "epoch": 2159} {"train_loss": -42.91244125366211, "global_step": 261286, "epoch": 2159} {"train_loss": -42.85087585449219, "global_step": 261287, "epoch": 2159} {"train_loss": -43.1900634765625, "global_step": 261288, "epoch": 2159} {"train_loss": -42.267086029052734, "global_step": 261289, "epoch": 2159} {"train_loss": -42.713626861572266, "global_step": 261290, "epoch": 2159} {"train_loss": -43.22393798828125, "global_step": 261291, "epoch": 2159} {"train_loss": -42.87433624267578, "global_step": 261292, "epoch": 2159} {"train_loss": -42.8448600769043, "global_step": 261293, "epoch": 2159} {"train_loss": -42.40507507324219, "global_step": 261294, "epoch": 2159} {"train_loss": -43.2476921081543, "global_step": 261295, "epoch": 2159} {"train_loss": -43.47026443481445, "global_step": 261296, "epoch": 2159} {"train_loss": -43.60697555541992, "global_step": 261297, "epoch": 2159} {"train_loss": -43.419193267822266, "global_step": 261298, "epoch": 2159} {"train_loss": -43.365821838378906, "global_step": 261299, "epoch": 2159} {"train_loss": -43.83832550048828, "global_step": 261300, "epoch": 2159} {"train_loss": -43.60526657104492, "global_step": 261301, "epoch": 2159} {"train_loss": -42.16427230834961, "global_step": 261302, "epoch": 2159} {"train_loss": -43.597965240478516, "global_step": 261303, "epoch": 2159} {"train_loss": -43.299922943115234, "global_step": 261304, "epoch": 2159} {"train_loss": -43.79916000366211, "global_step": 261305, "epoch": 2159} {"train_loss": -43.73994064331055, "global_step": 261306, "epoch": 2159} {"train_loss": -43.58011245727539, "global_step": 261307, "epoch": 2159} {"train_loss": -43.692989349365234, "global_step": 261308, "epoch": 2159} {"train_loss": -43.819862365722656, "global_step": 261309, "epoch": 2159} {"train_loss": -43.08359146118164, "global_step": 261310, "epoch": 2159} {"train_loss": -43.38999938964844, "global_step": 261311, "epoch": 2159} {"train_loss": -43.46928405761719, "global_step": 261312, "epoch": 2159} {"train_loss": -43.79201889038086, "global_step": 261313, "epoch": 2159} {"train_loss": -43.59366989135742, "global_step": 261314, "epoch": 2159} {"train_loss": -43.90435791015625, "global_step": 261315, "epoch": 2159} {"train_loss": -43.71969223022461, "global_step": 261316, "epoch": 2159} {"train_loss": -42.461124420166016, "global_step": 261317, "epoch": 2159} {"train_loss": -43.005428314208984, "global_step": 261318, "epoch": 2159} {"train_loss": -42.722957611083984, "global_step": 261319, "epoch": 2159} {"train_loss": -44.019832611083984, "global_step": 261320, "epoch": 2159} {"train_loss": -44.105995178222656, "global_step": 261321, "epoch": 2159} {"train_loss": -43.46961212158203, "global_step": 261322, "epoch": 2159} {"train_loss": -42.09495162963867, "global_step": 261323, "epoch": 2159} {"train_loss": -42.56306457519531, "global_step": 261324, "epoch": 2159} {"train_loss": -38.80870056152344, "global_step": 261325, "epoch": 2159} {"train_loss": -35.751068115234375, "global_step": 261326, "epoch": 2159} {"train_loss": -24.31742286682129, "global_step": 261327, "epoch": 2159} {"train_loss": -16.47272300720215, "global_step": 261328, "epoch": 2159} {"train_loss": -29.832849502563477, "global_step": 261329, "epoch": 2159} {"train_loss": -41.11708450317383, "global_step": 261330, "epoch": 2159} {"train_loss": -28.60190200805664, "global_step": 261331, "epoch": 2159} {"train_loss": -36.97390365600586, "global_step": 261332, "epoch": 2159} {"train_loss": -40.008792877197266, "global_step": 261333, "epoch": 2159} {"train_loss": -36.2844352722168, "global_step": 261334, "epoch": 2159} {"train_loss": -41.250335693359375, "global_step": 261335, "epoch": 2159} {"train_loss": -39.530494689941406, "global_step": 261336, "epoch": 2159} {"train_loss": -42.03894805908203, "global_step": 261337, "epoch": 2159} {"train_loss": -40.65656661987305, "global_step": 261338, "epoch": 2159} {"train_loss": -41.408016204833984, "global_step": 261339, "epoch": 2159} {"train_loss": -40.097564697265625, "global_step": 261340, "epoch": 2159} {"train_loss": -41.855831146240234, "global_step": 261341, "epoch": 2159} {"train_loss": -40.49646759033203, "global_step": 261342, "epoch": 2159} {"train_loss": -40.8387565612793, "global_step": 261343, "epoch": 2159} {"train_loss": -40.98799514770508, "global_step": 261344, "epoch": 2159} {"train_loss": -41.20819091796875, "global_step": 261345, "epoch": 2159} {"train_loss": -40.80873489379883, "global_step": 261346, "epoch": 2159} {"train_loss": -41.44489288330078, "global_step": 261347, "epoch": 2159} {"train_loss": -41.966346740722656, "global_step": 261348, "epoch": 2159} {"train_loss": -40.97085189819336, "global_step": 261349, "epoch": 2159} {"train_loss": -42.646728515625, "global_step": 261350, "epoch": 2159} {"train_loss": -41.84892654418945, "global_step": 261351, "epoch": 2159} {"train_loss": -42.69526290893555, "global_step": 261352, "epoch": 2159} {"train_loss": -42.1995964050293, "global_step": 261353, "epoch": 2159} {"train_loss": -42.163368225097656, "global_step": 261354, "epoch": 2159} {"train_loss": -42.38057327270508, "global_step": 261355, "epoch": 2159} {"train_loss": -41.4525146484375, "global_step": 261356, "epoch": 2159} {"train_loss": -42.413848876953125, "global_step": 261357, "epoch": 2159} {"train_loss": -41.92154312133789, "global_step": 261358, "epoch": 2159} {"train_loss": -41.16147282497942, "global_step": 261359, "epoch": 2159, "val_loss": 2636255.75} {"train_loss": -42.297157287597656, "global_step": 261360, "epoch": 2160} {"train_loss": -42.42257308959961, "global_step": 261361, "epoch": 2160} {"train_loss": -42.44096374511719, "global_step": 261362, "epoch": 2160} {"train_loss": -42.408260345458984, "global_step": 261363, "epoch": 2160} {"train_loss": -42.538692474365234, "global_step": 261364, "epoch": 2160} {"train_loss": -43.16390609741211, "global_step": 261365, "epoch": 2160} {"train_loss": -42.59049606323242, "global_step": 261366, "epoch": 2160} {"train_loss": -42.667945861816406, "global_step": 261367, "epoch": 2160} {"train_loss": -42.77581787109375, "global_step": 261368, "epoch": 2160} {"train_loss": -42.722694396972656, "global_step": 261369, "epoch": 2160} {"train_loss": -42.750152587890625, "global_step": 261370, "epoch": 2160} {"train_loss": -42.88822937011719, "global_step": 261371, "epoch": 2160} {"train_loss": -43.07447052001953, "global_step": 261372, "epoch": 2160} {"train_loss": -43.18217849731445, "global_step": 261373, "epoch": 2160} {"train_loss": -43.188453674316406, "global_step": 261374, "epoch": 2160} {"train_loss": -42.57300567626953, "global_step": 261375, "epoch": 2160} {"train_loss": -43.17945098876953, "global_step": 261376, "epoch": 2160} {"train_loss": -43.673240661621094, "global_step": 261377, "epoch": 2160} {"train_loss": -43.23043441772461, "global_step": 261378, "epoch": 2160} {"train_loss": -43.18791580200195, "global_step": 261379, "epoch": 2160} {"train_loss": -43.6912841796875, "global_step": 261380, "epoch": 2160} {"train_loss": -43.348506927490234, "global_step": 261381, "epoch": 2160} {"train_loss": -43.391780853271484, "global_step": 261382, "epoch": 2160} {"train_loss": -43.397762298583984, "global_step": 261383, "epoch": 2160} {"train_loss": -43.5964469909668, "global_step": 261384, "epoch": 2160} {"train_loss": -42.934791564941406, "global_step": 261385, "epoch": 2160} {"train_loss": -43.03202438354492, "global_step": 261386, "epoch": 2160} {"train_loss": -43.41579055786133, "global_step": 261387, "epoch": 2160} {"train_loss": -43.5620002746582, "global_step": 261388, "epoch": 2160} {"train_loss": -43.81522750854492, "global_step": 261389, "epoch": 2160} {"train_loss": -43.81642532348633, "global_step": 261390, "epoch": 2160} {"train_loss": -43.81922149658203, "global_step": 261391, "epoch": 2160} {"train_loss": -43.78956985473633, "global_step": 261392, "epoch": 2160} {"train_loss": -43.452857971191406, "global_step": 261393, "epoch": 2160} {"train_loss": -43.5938835144043, "global_step": 261394, "epoch": 2160} {"train_loss": -43.79450607299805, "global_step": 261395, "epoch": 2160} {"train_loss": -43.7608642578125, "global_step": 261396, "epoch": 2160} {"train_loss": -43.81772232055664, "global_step": 261397, "epoch": 2160} {"train_loss": -43.572383880615234, "global_step": 261398, "epoch": 2160} {"train_loss": -43.52606201171875, "global_step": 261399, "epoch": 2160} {"train_loss": -43.731502532958984, "global_step": 261400, "epoch": 2160} {"train_loss": -43.678443908691406, "global_step": 261401, "epoch": 2160} {"train_loss": -43.76205062866211, "global_step": 261402, "epoch": 2160} {"train_loss": -43.81993865966797, "global_step": 261403, "epoch": 2160} {"train_loss": -43.745323181152344, "global_step": 261404, "epoch": 2160} {"train_loss": -43.64423751831055, "global_step": 261405, "epoch": 2160} {"train_loss": -43.690799713134766, "global_step": 261406, "epoch": 2160} {"train_loss": -44.13294219970703, "global_step": 261407, "epoch": 2160} {"train_loss": -43.78731918334961, "global_step": 261408, "epoch": 2160} {"train_loss": -43.77075958251953, "global_step": 261409, "epoch": 2160} {"train_loss": -43.7491569519043, "global_step": 261410, "epoch": 2160} {"train_loss": -42.93674087524414, "global_step": 261411, "epoch": 2160} {"train_loss": -42.76325988769531, "global_step": 261412, "epoch": 2160} {"train_loss": -42.79931640625, "global_step": 261413, "epoch": 2160} {"train_loss": -43.266178131103516, "global_step": 261414, "epoch": 2160} {"train_loss": -43.21792221069336, "global_step": 261415, "epoch": 2160} {"train_loss": -43.91897201538086, "global_step": 261416, "epoch": 2160} {"train_loss": -42.775177001953125, "global_step": 261417, "epoch": 2160} {"train_loss": -42.232906341552734, "global_step": 261418, "epoch": 2160} {"train_loss": -42.47493362426758, "global_step": 261419, "epoch": 2160} {"train_loss": -42.937477111816406, "global_step": 261420, "epoch": 2160} {"train_loss": -42.53266525268555, "global_step": 261421, "epoch": 2160} {"train_loss": -41.98140335083008, "global_step": 261422, "epoch": 2160} {"train_loss": -41.81663131713867, "global_step": 261423, "epoch": 2160} {"train_loss": -43.623260498046875, "global_step": 261424, "epoch": 2160} {"train_loss": -43.20286560058594, "global_step": 261425, "epoch": 2160} {"train_loss": -42.0100212097168, "global_step": 261426, "epoch": 2160} {"train_loss": -43.21029281616211, "global_step": 261427, "epoch": 2160} {"train_loss": -43.585994720458984, "global_step": 261428, "epoch": 2160} {"train_loss": -40.81178665161133, "global_step": 261429, "epoch": 2160} {"train_loss": -41.01136779785156, "global_step": 261430, "epoch": 2160} {"train_loss": -41.90313720703125, "global_step": 261431, "epoch": 2160} {"train_loss": -42.429683685302734, "global_step": 261432, "epoch": 2160} {"train_loss": -40.684471130371094, "global_step": 261433, "epoch": 2160} {"train_loss": -42.47652816772461, "global_step": 261434, "epoch": 2160} {"train_loss": -41.73833084106445, "global_step": 261435, "epoch": 2160} {"train_loss": -41.48287582397461, "global_step": 261436, "epoch": 2160} {"train_loss": -43.191951751708984, "global_step": 261437, "epoch": 2160} {"train_loss": -41.280025482177734, "global_step": 261438, "epoch": 2160} {"train_loss": -42.07172775268555, "global_step": 261439, "epoch": 2160} {"train_loss": -40.96610641479492, "global_step": 261440, "epoch": 2160} {"train_loss": -41.33734893798828, "global_step": 261441, "epoch": 2160} {"train_loss": -41.469181060791016, "global_step": 261442, "epoch": 2160} {"train_loss": -41.397769927978516, "global_step": 261443, "epoch": 2160} {"train_loss": -42.32944869995117, "global_step": 261444, "epoch": 2160} {"train_loss": -41.6685905456543, "global_step": 261445, "epoch": 2160} {"train_loss": -41.7684326171875, "global_step": 261446, "epoch": 2160} {"train_loss": -39.64039993286133, "global_step": 261447, "epoch": 2160} {"train_loss": -41.94020462036133, "global_step": 261448, "epoch": 2160} {"train_loss": -41.91022872924805, "global_step": 261449, "epoch": 2160} {"train_loss": -42.43723678588867, "global_step": 261450, "epoch": 2160} {"train_loss": -41.71703338623047, "global_step": 261451, "epoch": 2160} {"train_loss": -42.0897331237793, "global_step": 261452, "epoch": 2160} {"train_loss": -41.647865295410156, "global_step": 261453, "epoch": 2160} {"train_loss": -41.232444763183594, "global_step": 261454, "epoch": 2160} {"train_loss": -41.43291091918945, "global_step": 261455, "epoch": 2160} {"train_loss": -40.33618927001953, "global_step": 261456, "epoch": 2160} {"train_loss": -41.73825454711914, "global_step": 261457, "epoch": 2160} {"train_loss": -42.914791107177734, "global_step": 261458, "epoch": 2160} {"train_loss": -42.30323028564453, "global_step": 261459, "epoch": 2160} {"train_loss": -42.23971939086914, "global_step": 261460, "epoch": 2160} {"train_loss": -42.19702911376953, "global_step": 261461, "epoch": 2160} {"train_loss": -42.83210372924805, "global_step": 261462, "epoch": 2160} {"train_loss": -41.9099235534668, "global_step": 261463, "epoch": 2160} {"train_loss": -41.8523063659668, "global_step": 261464, "epoch": 2160} {"train_loss": -41.53553009033203, "global_step": 261465, "epoch": 2160} {"train_loss": -42.53927230834961, "global_step": 261466, "epoch": 2160} {"train_loss": -41.3769416809082, "global_step": 261467, "epoch": 2160} {"train_loss": -41.17725372314453, "global_step": 261468, "epoch": 2160} {"train_loss": -40.931480407714844, "global_step": 261469, "epoch": 2160} {"train_loss": -42.670352935791016, "global_step": 261470, "epoch": 2160} {"train_loss": -42.06825256347656, "global_step": 261471, "epoch": 2160} {"train_loss": -42.07689666748047, "global_step": 261472, "epoch": 2160} {"train_loss": -42.297637939453125, "global_step": 261473, "epoch": 2160} {"train_loss": -41.49282455444336, "global_step": 261474, "epoch": 2160} {"train_loss": -41.9890022277832, "global_step": 261475, "epoch": 2160} {"train_loss": -42.899166107177734, "global_step": 261476, "epoch": 2160} {"train_loss": -42.495601654052734, "global_step": 261477, "epoch": 2160} {"train_loss": -42.82398223876953, "global_step": 261478, "epoch": 2160} {"train_loss": -43.4676399230957, "global_step": 261479, "epoch": 2160} {"train_loss": -42.63012354827124, "global_step": 261480, "epoch": 2160, "val_loss": 2752148.75} {"train_loss": -42.422157287597656, "global_step": 261481, "epoch": 2161} {"train_loss": -42.922454833984375, "global_step": 261482, "epoch": 2161} {"train_loss": -41.652244567871094, "global_step": 261483, "epoch": 2161} {"train_loss": -42.209381103515625, "global_step": 261484, "epoch": 2161} {"train_loss": -43.10497283935547, "global_step": 261485, "epoch": 2161} {"train_loss": -42.60512161254883, "global_step": 261486, "epoch": 2161} {"train_loss": -42.9216194152832, "global_step": 261487, "epoch": 2161} {"train_loss": -42.13578796386719, "global_step": 261488, "epoch": 2161} {"train_loss": -40.27992630004883, "global_step": 261489, "epoch": 2161} {"train_loss": -42.421630859375, "global_step": 261490, "epoch": 2161} {"train_loss": -41.9099235534668, "global_step": 261491, "epoch": 2161} {"train_loss": -41.941688537597656, "global_step": 261492, "epoch": 2161} {"train_loss": -41.75423049926758, "global_step": 261493, "epoch": 2161} {"train_loss": -43.03809356689453, "global_step": 261494, "epoch": 2161} {"train_loss": -42.6942024230957, "global_step": 261495, "epoch": 2161} {"train_loss": -42.4490852355957, "global_step": 261496, "epoch": 2161} {"train_loss": -43.153709411621094, "global_step": 261497, "epoch": 2161} {"train_loss": -42.317562103271484, "global_step": 261498, "epoch": 2161} {"train_loss": -42.771705627441406, "global_step": 261499, "epoch": 2161} {"train_loss": -42.91117477416992, "global_step": 261500, "epoch": 2161} {"train_loss": -40.169795989990234, "global_step": 261501, "epoch": 2161} {"train_loss": -42.433197021484375, "global_step": 261502, "epoch": 2161} {"train_loss": -38.396697998046875, "global_step": 261503, "epoch": 2161} {"train_loss": -42.2191162109375, "global_step": 261504, "epoch": 2161} {"train_loss": -42.93408203125, "global_step": 261505, "epoch": 2161} {"train_loss": -43.12350082397461, "global_step": 261506, "epoch": 2161} {"train_loss": -43.26662063598633, "global_step": 261507, "epoch": 2161} {"train_loss": -42.857627868652344, "global_step": 261508, "epoch": 2161} {"train_loss": -43.38413619995117, "global_step": 261509, "epoch": 2161} {"train_loss": -42.57380676269531, "global_step": 261510, "epoch": 2161} {"train_loss": -42.47320556640625, "global_step": 261511, "epoch": 2161} {"train_loss": -42.858097076416016, "global_step": 261512, "epoch": 2161} {"train_loss": -40.61098861694336, "global_step": 261513, "epoch": 2161} {"train_loss": -42.57630157470703, "global_step": 261514, "epoch": 2161} {"train_loss": -37.0189094543457, "global_step": 261515, "epoch": 2161} {"train_loss": -42.38890075683594, "global_step": 261516, "epoch": 2161} {"train_loss": -42.449684143066406, "global_step": 261517, "epoch": 2161} {"train_loss": -32.79282760620117, "global_step": 261518, "epoch": 2161} {"train_loss": -40.70283126831055, "global_step": 261519, "epoch": 2161} {"train_loss": -35.408119201660156, "global_step": 261520, "epoch": 2161} {"train_loss": -41.78438949584961, "global_step": 261521, "epoch": 2161} {"train_loss": -41.76792907714844, "global_step": 261522, "epoch": 2161} {"train_loss": -41.200191497802734, "global_step": 261523, "epoch": 2161} {"train_loss": -39.38108825683594, "global_step": 261524, "epoch": 2161} {"train_loss": -36.59724807739258, "global_step": 261525, "epoch": 2161} {"train_loss": -41.88480758666992, "global_step": 261526, "epoch": 2161} {"train_loss": -42.36477279663086, "global_step": 261527, "epoch": 2161} {"train_loss": -41.1958122253418, "global_step": 261528, "epoch": 2161} {"train_loss": -42.42216110229492, "global_step": 261529, "epoch": 2161} {"train_loss": -42.4517822265625, "global_step": 261530, "epoch": 2161} {"train_loss": -40.760902404785156, "global_step": 261531, "epoch": 2161} {"train_loss": -41.785072326660156, "global_step": 261532, "epoch": 2161} {"train_loss": -41.79741668701172, "global_step": 261533, "epoch": 2161} {"train_loss": -42.20240020751953, "global_step": 261534, "epoch": 2161} {"train_loss": -41.77680587768555, "global_step": 261535, "epoch": 2161} {"train_loss": -42.1937141418457, "global_step": 261536, "epoch": 2161} {"train_loss": -42.01487350463867, "global_step": 261537, "epoch": 2161} {"train_loss": -40.43967819213867, "global_step": 261538, "epoch": 2161} {"train_loss": -39.74019241333008, "global_step": 261539, "epoch": 2161} {"train_loss": -42.234920501708984, "global_step": 261540, "epoch": 2161} {"train_loss": -42.94066619873047, "global_step": 261541, "epoch": 2161} {"train_loss": -41.06156921386719, "global_step": 261542, "epoch": 2161} {"train_loss": -41.03718566894531, "global_step": 261543, "epoch": 2161} {"train_loss": -39.28164291381836, "global_step": 261544, "epoch": 2161} {"train_loss": -42.71533966064453, "global_step": 261545, "epoch": 2161} {"train_loss": -42.71072006225586, "global_step": 261546, "epoch": 2161} {"train_loss": -41.75017166137695, "global_step": 261547, "epoch": 2161} {"train_loss": -41.84415817260742, "global_step": 261548, "epoch": 2161} {"train_loss": -40.592742919921875, "global_step": 261549, "epoch": 2161} {"train_loss": -41.52976608276367, "global_step": 261550, "epoch": 2161} {"train_loss": -42.12923812866211, "global_step": 261551, "epoch": 2161} {"train_loss": -42.879737854003906, "global_step": 261552, "epoch": 2161} {"train_loss": -41.76865768432617, "global_step": 261553, "epoch": 2161} {"train_loss": -42.516170501708984, "global_step": 261554, "epoch": 2161} {"train_loss": -42.178321838378906, "global_step": 261555, "epoch": 2161} {"train_loss": -42.04887008666992, "global_step": 261556, "epoch": 2161} {"train_loss": -42.005226135253906, "global_step": 261557, "epoch": 2161} {"train_loss": -41.27417755126953, "global_step": 261558, "epoch": 2161} {"train_loss": -42.9041748046875, "global_step": 261559, "epoch": 2161} {"train_loss": -41.889705657958984, "global_step": 261560, "epoch": 2161} {"train_loss": -42.361480712890625, "global_step": 261561, "epoch": 2161} {"train_loss": -42.4504280090332, "global_step": 261562, "epoch": 2161} {"train_loss": -39.71044921875, "global_step": 261563, "epoch": 2161} {"train_loss": -43.04610061645508, "global_step": 261564, "epoch": 2161} {"train_loss": -43.175811767578125, "global_step": 261565, "epoch": 2161} {"train_loss": -42.05903625488281, "global_step": 261566, "epoch": 2161} {"train_loss": -42.76447677612305, "global_step": 261567, "epoch": 2161} {"train_loss": -42.993194580078125, "global_step": 261568, "epoch": 2161} {"train_loss": -42.8146858215332, "global_step": 261569, "epoch": 2161} {"train_loss": -43.10716247558594, "global_step": 261570, "epoch": 2161} {"train_loss": -43.162715911865234, "global_step": 261571, "epoch": 2161} {"train_loss": -42.563209533691406, "global_step": 261572, "epoch": 2161} {"train_loss": -42.981868743896484, "global_step": 261573, "epoch": 2161} {"train_loss": -42.5341682434082, "global_step": 261574, "epoch": 2161} {"train_loss": -42.20876693725586, "global_step": 261575, "epoch": 2161} {"train_loss": -41.5374641418457, "global_step": 261576, "epoch": 2161} {"train_loss": -42.964027404785156, "global_step": 261577, "epoch": 2161} {"train_loss": -43.012176513671875, "global_step": 261578, "epoch": 2161} {"train_loss": -43.349021911621094, "global_step": 261579, "epoch": 2161} {"train_loss": -42.56456756591797, "global_step": 261580, "epoch": 2161} {"train_loss": -42.92939376831055, "global_step": 261581, "epoch": 2161} {"train_loss": -42.81946563720703, "global_step": 261582, "epoch": 2161} {"train_loss": -41.53078079223633, "global_step": 261583, "epoch": 2161} {"train_loss": -43.00118637084961, "global_step": 261584, "epoch": 2161} {"train_loss": -42.54115676879883, "global_step": 261585, "epoch": 2161} {"train_loss": -42.8922119140625, "global_step": 261586, "epoch": 2161} {"train_loss": -42.96291732788086, "global_step": 261587, "epoch": 2161} {"train_loss": -43.44778060913086, "global_step": 261588, "epoch": 2161} {"train_loss": -43.10182571411133, "global_step": 261589, "epoch": 2161} {"train_loss": -43.190975189208984, "global_step": 261590, "epoch": 2161} {"train_loss": -42.349700927734375, "global_step": 261591, "epoch": 2161} {"train_loss": -43.50502395629883, "global_step": 261592, "epoch": 2161} {"train_loss": -42.893409729003906, "global_step": 261593, "epoch": 2161} {"train_loss": -43.257633209228516, "global_step": 261594, "epoch": 2161} {"train_loss": -43.572853088378906, "global_step": 261595, "epoch": 2161} {"train_loss": -43.11512756347656, "global_step": 261596, "epoch": 2161} {"train_loss": -42.657047271728516, "global_step": 261597, "epoch": 2161} {"train_loss": -42.04344940185547, "global_step": 261598, "epoch": 2161} {"train_loss": -42.90363693237305, "global_step": 261599, "epoch": 2161} {"train_loss": -42.731483459472656, "global_step": 261600, "epoch": 2161} {"train_loss": -42.008057775576255, "global_step": 261601, "epoch": 2161, "val_loss": 2734633.25} {"train_loss": -42.92745590209961, "global_step": 261602, "epoch": 2162} {"train_loss": -44.025604248046875, "global_step": 261603, "epoch": 2162} {"train_loss": -43.404090881347656, "global_step": 261604, "epoch": 2162} {"train_loss": -40.984920501708984, "global_step": 261605, "epoch": 2162} {"train_loss": -43.174991607666016, "global_step": 261606, "epoch": 2162} {"train_loss": -42.6779899597168, "global_step": 261607, "epoch": 2162} {"train_loss": -43.457820892333984, "global_step": 261608, "epoch": 2162} {"train_loss": -43.458797454833984, "global_step": 261609, "epoch": 2162} {"train_loss": -43.903892517089844, "global_step": 261610, "epoch": 2162} {"train_loss": -43.313419342041016, "global_step": 261611, "epoch": 2162} {"train_loss": -43.838504791259766, "global_step": 261612, "epoch": 2162} {"train_loss": -42.79203414916992, "global_step": 261613, "epoch": 2162} {"train_loss": -42.95461654663086, "global_step": 261614, "epoch": 2162} {"train_loss": -43.17687225341797, "global_step": 261615, "epoch": 2162} {"train_loss": -43.53895950317383, "global_step": 261616, "epoch": 2162} {"train_loss": -43.45570755004883, "global_step": 261617, "epoch": 2162} {"train_loss": -43.922203063964844, "global_step": 261618, "epoch": 2162} {"train_loss": -43.57648849487305, "global_step": 261619, "epoch": 2162} {"train_loss": -43.002044677734375, "global_step": 261620, "epoch": 2162} {"train_loss": -43.51222610473633, "global_step": 261621, "epoch": 2162} {"train_loss": -42.85721969604492, "global_step": 261622, "epoch": 2162} {"train_loss": -43.3675422668457, "global_step": 261623, "epoch": 2162} {"train_loss": -43.01801300048828, "global_step": 261624, "epoch": 2162} {"train_loss": -43.121273040771484, "global_step": 261625, "epoch": 2162} {"train_loss": -43.13529586791992, "global_step": 261626, "epoch": 2162} {"train_loss": -42.39183807373047, "global_step": 261627, "epoch": 2162} {"train_loss": -42.222328186035156, "global_step": 261628, "epoch": 2162} {"train_loss": -42.68632888793945, "global_step": 261629, "epoch": 2162} {"train_loss": -42.971866607666016, "global_step": 261630, "epoch": 2162} {"train_loss": -43.60160446166992, "global_step": 261631, "epoch": 2162} {"train_loss": -41.955604553222656, "global_step": 261632, "epoch": 2162} {"train_loss": -39.43928146362305, "global_step": 261633, "epoch": 2162} {"train_loss": -41.8465461730957, "global_step": 261634, "epoch": 2162} {"train_loss": -40.40018081665039, "global_step": 261635, "epoch": 2162} {"train_loss": -40.536102294921875, "global_step": 261636, "epoch": 2162} {"train_loss": -41.187782287597656, "global_step": 261637, "epoch": 2162} {"train_loss": -42.02305603027344, "global_step": 261638, "epoch": 2162} {"train_loss": -37.5838737487793, "global_step": 261639, "epoch": 2162} {"train_loss": -41.19764709472656, "global_step": 261640, "epoch": 2162} {"train_loss": -41.96597671508789, "global_step": 261641, "epoch": 2162} {"train_loss": -41.87557601928711, "global_step": 261642, "epoch": 2162} {"train_loss": -39.715877532958984, "global_step": 261643, "epoch": 2162} {"train_loss": -38.87339401245117, "global_step": 261644, "epoch": 2162} {"train_loss": -38.43266677856445, "global_step": 261645, "epoch": 2162} {"train_loss": -38.84778594970703, "global_step": 261646, "epoch": 2162} {"train_loss": -41.740535736083984, "global_step": 261647, "epoch": 2162} {"train_loss": -41.26162338256836, "global_step": 261648, "epoch": 2162} {"train_loss": -40.58329391479492, "global_step": 261649, "epoch": 2162} {"train_loss": -40.56882095336914, "global_step": 261650, "epoch": 2162} {"train_loss": -40.68636703491211, "global_step": 261651, "epoch": 2162} {"train_loss": -41.056095123291016, "global_step": 261652, "epoch": 2162} {"train_loss": -42.26033401489258, "global_step": 261653, "epoch": 2162} {"train_loss": -39.778743743896484, "global_step": 261654, "epoch": 2162} {"train_loss": -42.207672119140625, "global_step": 261655, "epoch": 2162} {"train_loss": -40.97515869140625, "global_step": 261656, "epoch": 2162} {"train_loss": -40.945274353027344, "global_step": 261657, "epoch": 2162} {"train_loss": -39.48563766479492, "global_step": 261658, "epoch": 2162} {"train_loss": -41.7365608215332, "global_step": 261659, "epoch": 2162} {"train_loss": -41.89137649536133, "global_step": 261660, "epoch": 2162} {"train_loss": -42.467281341552734, "global_step": 261661, "epoch": 2162} {"train_loss": -41.89738845825195, "global_step": 261662, "epoch": 2162} {"train_loss": -42.18472671508789, "global_step": 261663, "epoch": 2162} {"train_loss": -42.488067626953125, "global_step": 261664, "epoch": 2162} {"train_loss": -38.229949951171875, "global_step": 261665, "epoch": 2162} {"train_loss": -42.83945846557617, "global_step": 261666, "epoch": 2162} {"train_loss": -42.25928497314453, "global_step": 261667, "epoch": 2162} {"train_loss": -40.25735092163086, "global_step": 261668, "epoch": 2162} {"train_loss": -38.5123291015625, "global_step": 261669, "epoch": 2162} {"train_loss": -41.23757553100586, "global_step": 261670, "epoch": 2162} {"train_loss": -42.50688171386719, "global_step": 261671, "epoch": 2162} {"train_loss": -40.96668243408203, "global_step": 261672, "epoch": 2162} {"train_loss": -42.67450714111328, "global_step": 261673, "epoch": 2162} {"train_loss": -41.89063262939453, "global_step": 261674, "epoch": 2162} {"train_loss": -40.838375091552734, "global_step": 261675, "epoch": 2162} {"train_loss": -38.53457260131836, "global_step": 261676, "epoch": 2162} {"train_loss": -41.781646728515625, "global_step": 261677, "epoch": 2162} {"train_loss": -42.709251403808594, "global_step": 261678, "epoch": 2162} {"train_loss": -39.64441680908203, "global_step": 261679, "epoch": 2162} {"train_loss": -41.13074493408203, "global_step": 261680, "epoch": 2162} {"train_loss": -42.16105270385742, "global_step": 261681, "epoch": 2162} {"train_loss": -42.88041305541992, "global_step": 261682, "epoch": 2162} {"train_loss": -42.29741287231445, "global_step": 261683, "epoch": 2162} {"train_loss": -37.51030349731445, "global_step": 261684, "epoch": 2162} {"train_loss": -42.99346160888672, "global_step": 261685, "epoch": 2162} {"train_loss": -41.235877990722656, "global_step": 261686, "epoch": 2162} {"train_loss": -41.5334587097168, "global_step": 261687, "epoch": 2162} {"train_loss": -40.9192008972168, "global_step": 261688, "epoch": 2162} {"train_loss": -41.628631591796875, "global_step": 261689, "epoch": 2162} {"train_loss": -39.84043502807617, "global_step": 261690, "epoch": 2162} {"train_loss": -40.42892837524414, "global_step": 261691, "epoch": 2162} {"train_loss": -42.8839225769043, "global_step": 261692, "epoch": 2162} {"train_loss": -40.502864837646484, "global_step": 261693, "epoch": 2162} {"train_loss": -38.83402633666992, "global_step": 261694, "epoch": 2162} {"train_loss": -40.07419967651367, "global_step": 261695, "epoch": 2162} {"train_loss": -41.287784576416016, "global_step": 261696, "epoch": 2162} {"train_loss": -41.3154182434082, "global_step": 261697, "epoch": 2162} {"train_loss": -38.13530349731445, "global_step": 261698, "epoch": 2162} {"train_loss": -41.505794525146484, "global_step": 261699, "epoch": 2162} {"train_loss": -40.60919189453125, "global_step": 261700, "epoch": 2162} {"train_loss": -41.965755462646484, "global_step": 261701, "epoch": 2162} {"train_loss": -41.83999252319336, "global_step": 261702, "epoch": 2162} {"train_loss": -35.19100570678711, "global_step": 261703, "epoch": 2162} {"train_loss": -41.19959259033203, "global_step": 261704, "epoch": 2162} {"train_loss": -40.36865997314453, "global_step": 261705, "epoch": 2162} {"train_loss": -39.264808654785156, "global_step": 261706, "epoch": 2162} {"train_loss": -42.08362579345703, "global_step": 261707, "epoch": 2162} {"train_loss": -39.72013854980469, "global_step": 261708, "epoch": 2162} {"train_loss": -41.05128860473633, "global_step": 261709, "epoch": 2162} {"train_loss": -41.446754455566406, "global_step": 261710, "epoch": 2162} {"train_loss": -40.9616813659668, "global_step": 261711, "epoch": 2162} {"train_loss": -41.42713165283203, "global_step": 261712, "epoch": 2162} {"train_loss": -40.700130462646484, "global_step": 261713, "epoch": 2162} {"train_loss": -41.016483306884766, "global_step": 261714, "epoch": 2162} {"train_loss": -41.78495407104492, "global_step": 261715, "epoch": 2162} {"train_loss": -39.35288619995117, "global_step": 261716, "epoch": 2162} {"train_loss": -41.07386016845703, "global_step": 261717, "epoch": 2162} {"train_loss": -41.326881408691406, "global_step": 261718, "epoch": 2162} {"train_loss": -41.181800842285156, "global_step": 261719, "epoch": 2162} {"train_loss": -40.96651077270508, "global_step": 261720, "epoch": 2162} {"train_loss": -42.148860931396484, "global_step": 261721, "epoch": 2162} {"train_loss": -41.47092592223617, "global_step": 261722, "epoch": 2162, "val_loss": 2666837.75} {"train_loss": -42.091915130615234, "global_step": 261723, "epoch": 2163} {"train_loss": -42.363521575927734, "global_step": 261724, "epoch": 2163} {"train_loss": -41.236488342285156, "global_step": 261725, "epoch": 2163} {"train_loss": -41.54612350463867, "global_step": 261726, "epoch": 2163} {"train_loss": -42.25177001953125, "global_step": 261727, "epoch": 2163} {"train_loss": -41.795875549316406, "global_step": 261728, "epoch": 2163} {"train_loss": -42.62728500366211, "global_step": 261729, "epoch": 2163} {"train_loss": -42.35302734375, "global_step": 261730, "epoch": 2163} {"train_loss": -42.77326965332031, "global_step": 261731, "epoch": 2163} {"train_loss": -41.915531158447266, "global_step": 261732, "epoch": 2163} {"train_loss": -41.96694564819336, "global_step": 261733, "epoch": 2163} {"train_loss": -42.48311996459961, "global_step": 261734, "epoch": 2163} {"train_loss": -41.345577239990234, "global_step": 261735, "epoch": 2163} {"train_loss": -42.06681442260742, "global_step": 261736, "epoch": 2163} {"train_loss": -42.48348617553711, "global_step": 261737, "epoch": 2163} {"train_loss": -42.407386779785156, "global_step": 261738, "epoch": 2163} {"train_loss": -42.68978500366211, "global_step": 261739, "epoch": 2163} {"train_loss": -42.34383773803711, "global_step": 261740, "epoch": 2163} {"train_loss": -43.03560256958008, "global_step": 261741, "epoch": 2163} {"train_loss": -42.67912673950195, "global_step": 261742, "epoch": 2163} {"train_loss": -43.10343551635742, "global_step": 261743, "epoch": 2163} {"train_loss": -42.55469512939453, "global_step": 261744, "epoch": 2163} {"train_loss": -42.509368896484375, "global_step": 261745, "epoch": 2163} {"train_loss": -42.168006896972656, "global_step": 261746, "epoch": 2163} {"train_loss": -42.526371002197266, "global_step": 261747, "epoch": 2163} {"train_loss": -42.88119888305664, "global_step": 261748, "epoch": 2163} {"train_loss": -42.77487564086914, "global_step": 261749, "epoch": 2163} {"train_loss": -42.23382568359375, "global_step": 261750, "epoch": 2163} {"train_loss": -41.10366439819336, "global_step": 261751, "epoch": 2163} {"train_loss": -42.69294357299805, "global_step": 261752, "epoch": 2163} {"train_loss": -42.84223937988281, "global_step": 261753, "epoch": 2163} {"train_loss": -43.272071838378906, "global_step": 261754, "epoch": 2163} {"train_loss": -43.06536102294922, "global_step": 261755, "epoch": 2163} {"train_loss": -43.10972213745117, "global_step": 261756, "epoch": 2163} {"train_loss": -42.830318450927734, "global_step": 261757, "epoch": 2163} {"train_loss": -42.829376220703125, "global_step": 261758, "epoch": 2163} {"train_loss": -43.28349685668945, "global_step": 261759, "epoch": 2163} {"train_loss": -43.31343460083008, "global_step": 261760, "epoch": 2163} {"train_loss": -42.557472229003906, "global_step": 261761, "epoch": 2163} {"train_loss": -43.351539611816406, "global_step": 261762, "epoch": 2163} {"train_loss": -42.944393157958984, "global_step": 261763, "epoch": 2163} {"train_loss": -41.96236801147461, "global_step": 261764, "epoch": 2163} {"train_loss": -43.377071380615234, "global_step": 261765, "epoch": 2163} {"train_loss": -42.862789154052734, "global_step": 261766, "epoch": 2163} {"train_loss": -43.2569465637207, "global_step": 261767, "epoch": 2163} {"train_loss": -43.27982711791992, "global_step": 261768, "epoch": 2163} {"train_loss": -43.0753173828125, "global_step": 261769, "epoch": 2163} {"train_loss": -43.63520050048828, "global_step": 261770, "epoch": 2163} {"train_loss": -42.9269905090332, "global_step": 261771, "epoch": 2163} {"train_loss": -42.87921142578125, "global_step": 261772, "epoch": 2163} {"train_loss": -43.227264404296875, "global_step": 261773, "epoch": 2163} {"train_loss": -43.12211608886719, "global_step": 261774, "epoch": 2163} {"train_loss": -43.149471282958984, "global_step": 261775, "epoch": 2163} {"train_loss": -43.486297607421875, "global_step": 261776, "epoch": 2163} {"train_loss": -43.353389739990234, "global_step": 261777, "epoch": 2163} {"train_loss": -43.3828125, "global_step": 261778, "epoch": 2163} {"train_loss": -43.21444320678711, "global_step": 261779, "epoch": 2163} {"train_loss": -43.28593826293945, "global_step": 261780, "epoch": 2163} {"train_loss": -43.86153793334961, "global_step": 261781, "epoch": 2163} {"train_loss": -43.53839111328125, "global_step": 261782, "epoch": 2163} {"train_loss": -43.30587387084961, "global_step": 261783, "epoch": 2163} {"train_loss": -43.9668083190918, "global_step": 261784, "epoch": 2163} {"train_loss": -43.8587760925293, "global_step": 261785, "epoch": 2163} {"train_loss": -43.91058349609375, "global_step": 261786, "epoch": 2163} {"train_loss": -43.731868743896484, "global_step": 261787, "epoch": 2163} {"train_loss": -44.134918212890625, "global_step": 261788, "epoch": 2163} {"train_loss": -43.1982536315918, "global_step": 261789, "epoch": 2163} {"train_loss": -43.96474075317383, "global_step": 261790, "epoch": 2163} {"train_loss": -43.11910629272461, "global_step": 261791, "epoch": 2163} {"train_loss": -42.680389404296875, "global_step": 261792, "epoch": 2163} {"train_loss": -43.79743576049805, "global_step": 261793, "epoch": 2163} {"train_loss": -44.120540618896484, "global_step": 261794, "epoch": 2163} {"train_loss": -43.36558151245117, "global_step": 261795, "epoch": 2163} {"train_loss": -42.9129638671875, "global_step": 261796, "epoch": 2163} {"train_loss": -40.62693405151367, "global_step": 261797, "epoch": 2163} {"train_loss": -38.75190353393555, "global_step": 261798, "epoch": 2163} {"train_loss": -38.70951461791992, "global_step": 261799, "epoch": 2163} {"train_loss": -36.597774505615234, "global_step": 261800, "epoch": 2163} {"train_loss": -34.66384506225586, "global_step": 261801, "epoch": 2163} {"train_loss": -40.24367141723633, "global_step": 261802, "epoch": 2163} {"train_loss": -41.87150192260742, "global_step": 261803, "epoch": 2163} {"train_loss": -40.00128173828125, "global_step": 261804, "epoch": 2163} {"train_loss": -39.29903030395508, "global_step": 261805, "epoch": 2163} {"train_loss": -41.08638381958008, "global_step": 261806, "epoch": 2163} {"train_loss": -42.819091796875, "global_step": 261807, "epoch": 2163} {"train_loss": -37.68879318237305, "global_step": 261808, "epoch": 2163} {"train_loss": -40.21281814575195, "global_step": 261809, "epoch": 2163} {"train_loss": -42.84953689575195, "global_step": 261810, "epoch": 2163} {"train_loss": -39.997920989990234, "global_step": 261811, "epoch": 2163} {"train_loss": -41.03427505493164, "global_step": 261812, "epoch": 2163} {"train_loss": -42.234962463378906, "global_step": 261813, "epoch": 2163} {"train_loss": -42.09764862060547, "global_step": 261814, "epoch": 2163} {"train_loss": -41.92210006713867, "global_step": 261815, "epoch": 2163} {"train_loss": -42.409481048583984, "global_step": 261816, "epoch": 2163} {"train_loss": -42.26114273071289, "global_step": 261817, "epoch": 2163} {"train_loss": -42.024925231933594, "global_step": 261818, "epoch": 2163} {"train_loss": -39.22172164916992, "global_step": 261819, "epoch": 2163} {"train_loss": -42.78696823120117, "global_step": 261820, "epoch": 2163} {"train_loss": -41.34164047241211, "global_step": 261821, "epoch": 2163} {"train_loss": -32.96400833129883, "global_step": 261822, "epoch": 2163} {"train_loss": -38.56496810913086, "global_step": 261823, "epoch": 2163} {"train_loss": -41.30910873413086, "global_step": 261824, "epoch": 2163} {"train_loss": -41.297245025634766, "global_step": 261825, "epoch": 2163} {"train_loss": -40.041500091552734, "global_step": 261826, "epoch": 2163} {"train_loss": -41.827117919921875, "global_step": 261827, "epoch": 2163} {"train_loss": -37.04332733154297, "global_step": 261828, "epoch": 2163} {"train_loss": -39.59992599487305, "global_step": 261829, "epoch": 2163} {"train_loss": -40.78752517700195, "global_step": 261830, "epoch": 2163} {"train_loss": -38.47567367553711, "global_step": 261831, "epoch": 2163} {"train_loss": -40.875343322753906, "global_step": 261832, "epoch": 2163} {"train_loss": -41.21773910522461, "global_step": 261833, "epoch": 2163} {"train_loss": -41.159523010253906, "global_step": 261834, "epoch": 2163} {"train_loss": -40.5216178894043, "global_step": 261835, "epoch": 2163} {"train_loss": -41.71501541137695, "global_step": 261836, "epoch": 2163} {"train_loss": -41.132080078125, "global_step": 261837, "epoch": 2163} {"train_loss": -41.692501068115234, "global_step": 261838, "epoch": 2163} {"train_loss": -40.79549789428711, "global_step": 261839, "epoch": 2163} {"train_loss": -40.62910079956055, "global_step": 261840, "epoch": 2163} {"train_loss": -41.36445236206055, "global_step": 261841, "epoch": 2163} {"train_loss": -41.0966682434082, "global_step": 261842, "epoch": 2163} {"train_loss": -41.90925043279474, "global_step": 261843, "epoch": 2163, "val_loss": 2698243.75} {"train_loss": -41.85418701171875, "global_step": 261844, "epoch": 2164} {"train_loss": -41.71061706542969, "global_step": 261845, "epoch": 2164} {"train_loss": -41.94367218017578, "global_step": 261846, "epoch": 2164} {"train_loss": -42.24520492553711, "global_step": 261847, "epoch": 2164} {"train_loss": -42.504661560058594, "global_step": 261848, "epoch": 2164} {"train_loss": -42.62876510620117, "global_step": 261849, "epoch": 2164} {"train_loss": -42.68081283569336, "global_step": 261850, "epoch": 2164} {"train_loss": -42.46489334106445, "global_step": 261851, "epoch": 2164} {"train_loss": -42.383724212646484, "global_step": 261852, "epoch": 2164} {"train_loss": -42.7384147644043, "global_step": 261853, "epoch": 2164} {"train_loss": -42.170040130615234, "global_step": 261854, "epoch": 2164} {"train_loss": -42.22378921508789, "global_step": 261855, "epoch": 2164} {"train_loss": -43.238983154296875, "global_step": 261856, "epoch": 2164} {"train_loss": -41.4698600769043, "global_step": 261857, "epoch": 2164} {"train_loss": -41.83587646484375, "global_step": 261858, "epoch": 2164} {"train_loss": -43.236793518066406, "global_step": 261859, "epoch": 2164} {"train_loss": -39.84902572631836, "global_step": 261860, "epoch": 2164} {"train_loss": -43.82367706298828, "global_step": 261861, "epoch": 2164} {"train_loss": -42.49589920043945, "global_step": 261862, "epoch": 2164} {"train_loss": -43.05759811401367, "global_step": 261863, "epoch": 2164} {"train_loss": -41.16691970825195, "global_step": 261864, "epoch": 2164} {"train_loss": -42.58730697631836, "global_step": 261865, "epoch": 2164} {"train_loss": -42.63676071166992, "global_step": 261866, "epoch": 2164} {"train_loss": -42.2259407043457, "global_step": 261867, "epoch": 2164} {"train_loss": -43.453617095947266, "global_step": 261868, "epoch": 2164} {"train_loss": -42.95414352416992, "global_step": 261869, "epoch": 2164} {"train_loss": -38.436614990234375, "global_step": 261870, "epoch": 2164} {"train_loss": -43.24686813354492, "global_step": 261871, "epoch": 2164} {"train_loss": -42.89687728881836, "global_step": 261872, "epoch": 2164} {"train_loss": -42.92080307006836, "global_step": 261873, "epoch": 2164} {"train_loss": -42.86585235595703, "global_step": 261874, "epoch": 2164} {"train_loss": -42.54339599609375, "global_step": 261875, "epoch": 2164} {"train_loss": -42.49215316772461, "global_step": 261876, "epoch": 2164} {"train_loss": -42.583702087402344, "global_step": 261877, "epoch": 2164} {"train_loss": -42.47138595581055, "global_step": 261878, "epoch": 2164} {"train_loss": -43.26200485229492, "global_step": 261879, "epoch": 2164} {"train_loss": -42.45347213745117, "global_step": 261880, "epoch": 2164} {"train_loss": -42.097015380859375, "global_step": 261881, "epoch": 2164} {"train_loss": -42.47910690307617, "global_step": 261882, "epoch": 2164} {"train_loss": -42.54964065551758, "global_step": 261883, "epoch": 2164} {"train_loss": -42.85981369018555, "global_step": 261884, "epoch": 2164} {"train_loss": -42.773983001708984, "global_step": 261885, "epoch": 2164} {"train_loss": -42.32139205932617, "global_step": 261886, "epoch": 2164} {"train_loss": -42.41337203979492, "global_step": 261887, "epoch": 2164} {"train_loss": -41.484283447265625, "global_step": 261888, "epoch": 2164} {"train_loss": -42.29494094848633, "global_step": 261889, "epoch": 2164} {"train_loss": -39.56734848022461, "global_step": 261890, "epoch": 2164} {"train_loss": -42.321022033691406, "global_step": 261891, "epoch": 2164} {"train_loss": -42.252498626708984, "global_step": 261892, "epoch": 2164} {"train_loss": -41.91059875488281, "global_step": 261893, "epoch": 2164} {"train_loss": -41.72541427612305, "global_step": 261894, "epoch": 2164} {"train_loss": -42.88980484008789, "global_step": 261895, "epoch": 2164} {"train_loss": -42.933170318603516, "global_step": 261896, "epoch": 2164} {"train_loss": -42.25141525268555, "global_step": 261897, "epoch": 2164} {"train_loss": -42.85984420776367, "global_step": 261898, "epoch": 2164} {"train_loss": -42.99294662475586, "global_step": 261899, "epoch": 2164} {"train_loss": -42.94765853881836, "global_step": 261900, "epoch": 2164} {"train_loss": -42.455787658691406, "global_step": 261901, "epoch": 2164} {"train_loss": -42.52702331542969, "global_step": 261902, "epoch": 2164} {"train_loss": -42.822933197021484, "global_step": 261903, "epoch": 2164} {"train_loss": -42.95321273803711, "global_step": 261904, "epoch": 2164} {"train_loss": -43.727996826171875, "global_step": 261905, "epoch": 2164} {"train_loss": -43.3344612121582, "global_step": 261906, "epoch": 2164} {"train_loss": -43.304290771484375, "global_step": 261907, "epoch": 2164} {"train_loss": -43.217769622802734, "global_step": 261908, "epoch": 2164} {"train_loss": -42.7450065612793, "global_step": 261909, "epoch": 2164} {"train_loss": -42.6318473815918, "global_step": 261910, "epoch": 2164} {"train_loss": -43.735286712646484, "global_step": 261911, "epoch": 2164} {"train_loss": -41.75846481323242, "global_step": 261912, "epoch": 2164} {"train_loss": -42.58076477050781, "global_step": 261913, "epoch": 2164} {"train_loss": -43.23308181762695, "global_step": 261914, "epoch": 2164} {"train_loss": -40.69425582885742, "global_step": 261915, "epoch": 2164} {"train_loss": -43.07939529418945, "global_step": 261916, "epoch": 2164} {"train_loss": -42.61176300048828, "global_step": 261917, "epoch": 2164} {"train_loss": -42.97854232788086, "global_step": 261918, "epoch": 2164} {"train_loss": -43.06879425048828, "global_step": 261919, "epoch": 2164} {"train_loss": -42.20570755004883, "global_step": 261920, "epoch": 2164} {"train_loss": -42.30302047729492, "global_step": 261921, "epoch": 2164} {"train_loss": -42.71668243408203, "global_step": 261922, "epoch": 2164} {"train_loss": -42.3273811340332, "global_step": 261923, "epoch": 2164} {"train_loss": -41.18632125854492, "global_step": 261924, "epoch": 2164} {"train_loss": -42.90742874145508, "global_step": 261925, "epoch": 2164} {"train_loss": -43.145782470703125, "global_step": 261926, "epoch": 2164} {"train_loss": -42.911277770996094, "global_step": 261927, "epoch": 2164} {"train_loss": -42.388282775878906, "global_step": 261928, "epoch": 2164} {"train_loss": -38.59607696533203, "global_step": 261929, "epoch": 2164} {"train_loss": -43.13985824584961, "global_step": 261930, "epoch": 2164} {"train_loss": -42.71860885620117, "global_step": 261931, "epoch": 2164} {"train_loss": -42.941436767578125, "global_step": 261932, "epoch": 2164} {"train_loss": -41.76126480102539, "global_step": 261933, "epoch": 2164} {"train_loss": -42.18049621582031, "global_step": 261934, "epoch": 2164} {"train_loss": -43.015174865722656, "global_step": 261935, "epoch": 2164} {"train_loss": -43.00307846069336, "global_step": 261936, "epoch": 2164} {"train_loss": -40.69746780395508, "global_step": 261937, "epoch": 2164} {"train_loss": -40.737548828125, "global_step": 261938, "epoch": 2164} {"train_loss": -39.93087387084961, "global_step": 261939, "epoch": 2164} {"train_loss": -42.5501594543457, "global_step": 261940, "epoch": 2164} {"train_loss": -40.02801513671875, "global_step": 261941, "epoch": 2164} {"train_loss": -43.28007888793945, "global_step": 261942, "epoch": 2164} {"train_loss": -41.951904296875, "global_step": 261943, "epoch": 2164} {"train_loss": -41.58987808227539, "global_step": 261944, "epoch": 2164} {"train_loss": -37.352535247802734, "global_step": 261945, "epoch": 2164} {"train_loss": -37.26191329956055, "global_step": 261946, "epoch": 2164} {"train_loss": -41.080604553222656, "global_step": 261947, "epoch": 2164} {"train_loss": -41.198875427246094, "global_step": 261948, "epoch": 2164} {"train_loss": -41.48351287841797, "global_step": 261949, "epoch": 2164} {"train_loss": -42.75042724609375, "global_step": 261950, "epoch": 2164} {"train_loss": -41.8368034362793, "global_step": 261951, "epoch": 2164} {"train_loss": -41.20248031616211, "global_step": 261952, "epoch": 2164} {"train_loss": -41.5428581237793, "global_step": 261953, "epoch": 2164} {"train_loss": -41.05376052856445, "global_step": 261954, "epoch": 2164} {"train_loss": -35.35348892211914, "global_step": 261955, "epoch": 2164} {"train_loss": -35.5291862487793, "global_step": 261956, "epoch": 2164} {"train_loss": -40.5478630065918, "global_step": 261957, "epoch": 2164} {"train_loss": -42.49644470214844, "global_step": 261958, "epoch": 2164} {"train_loss": -40.336029052734375, "global_step": 261959, "epoch": 2164} {"train_loss": -42.98740768432617, "global_step": 261960, "epoch": 2164} {"train_loss": -37.69404983520508, "global_step": 261961, "epoch": 2164} {"train_loss": -42.96767044067383, "global_step": 261962, "epoch": 2164} {"train_loss": -41.8264045715332, "global_step": 261963, "epoch": 2164} {"train_loss": -42.02867949304502, "global_step": 261964, "epoch": 2164, "val_loss": 2853978.25} {"train_loss": -42.370662689208984, "global_step": 261965, "epoch": 2165} {"train_loss": -42.00807571411133, "global_step": 261966, "epoch": 2165} {"train_loss": -41.50917053222656, "global_step": 261967, "epoch": 2165} {"train_loss": -41.25726318359375, "global_step": 261968, "epoch": 2165} {"train_loss": -40.018409729003906, "global_step": 261969, "epoch": 2165} {"train_loss": -42.51578903198242, "global_step": 261970, "epoch": 2165} {"train_loss": -42.44038772583008, "global_step": 261971, "epoch": 2165} {"train_loss": -39.64204025268555, "global_step": 261972, "epoch": 2165} {"train_loss": -40.928138732910156, "global_step": 261973, "epoch": 2165} {"train_loss": -42.54052734375, "global_step": 261974, "epoch": 2165} {"train_loss": -41.914974212646484, "global_step": 261975, "epoch": 2165} {"train_loss": -43.1898307800293, "global_step": 261976, "epoch": 2165} {"train_loss": -41.74779510498047, "global_step": 261977, "epoch": 2165} {"train_loss": -42.09714889526367, "global_step": 261978, "epoch": 2165} {"train_loss": -42.61237716674805, "global_step": 261979, "epoch": 2165} {"train_loss": -41.01308059692383, "global_step": 261980, "epoch": 2165} {"train_loss": -42.38227462768555, "global_step": 261981, "epoch": 2165} {"train_loss": -40.981929779052734, "global_step": 261982, "epoch": 2165} {"train_loss": -41.01023483276367, "global_step": 261983, "epoch": 2165} {"train_loss": -42.376678466796875, "global_step": 261984, "epoch": 2165} {"train_loss": -41.863502502441406, "global_step": 261985, "epoch": 2165} {"train_loss": -41.450103759765625, "global_step": 261986, "epoch": 2165} {"train_loss": -42.57813262939453, "global_step": 261987, "epoch": 2165} {"train_loss": -42.309539794921875, "global_step": 261988, "epoch": 2165} {"train_loss": -42.912166595458984, "global_step": 261989, "epoch": 2165} {"train_loss": -42.82302474975586, "global_step": 261990, "epoch": 2165} {"train_loss": -42.95608139038086, "global_step": 261991, "epoch": 2165} {"train_loss": -42.24027633666992, "global_step": 261992, "epoch": 2165} {"train_loss": -42.11869812011719, "global_step": 261993, "epoch": 2165} {"train_loss": -43.010799407958984, "global_step": 261994, "epoch": 2165} {"train_loss": -42.948402404785156, "global_step": 261995, "epoch": 2165} {"train_loss": -42.97331619262695, "global_step": 261996, "epoch": 2165} {"train_loss": -42.55358123779297, "global_step": 261997, "epoch": 2165} {"train_loss": -42.51338577270508, "global_step": 261998, "epoch": 2165} {"train_loss": -42.70262908935547, "global_step": 261999, "epoch": 2165} {"train_loss": -41.140254974365234, "global_step": 262000, "epoch": 2165} {"train_loss": -42.8929328918457, "global_step": 262001, "epoch": 2165} {"train_loss": -42.839447021484375, "global_step": 262002, "epoch": 2165} {"train_loss": -38.11912155151367, "global_step": 262003, "epoch": 2165} {"train_loss": -42.20793151855469, "global_step": 262004, "epoch": 2165} {"train_loss": -42.77444076538086, "global_step": 262005, "epoch": 2165} {"train_loss": -41.82802200317383, "global_step": 262006, "epoch": 2165} {"train_loss": -43.000526428222656, "global_step": 262007, "epoch": 2165} {"train_loss": -42.6701774597168, "global_step": 262008, "epoch": 2165} {"train_loss": -42.68264389038086, "global_step": 262009, "epoch": 2165} {"train_loss": -42.54813766479492, "global_step": 262010, "epoch": 2165} {"train_loss": -42.044551849365234, "global_step": 262011, "epoch": 2165} {"train_loss": -43.04731369018555, "global_step": 262012, "epoch": 2165} {"train_loss": -42.912200927734375, "global_step": 262013, "epoch": 2165} {"train_loss": -43.31815719604492, "global_step": 262014, "epoch": 2165} {"train_loss": -42.827857971191406, "global_step": 262015, "epoch": 2165} {"train_loss": -42.398529052734375, "global_step": 262016, "epoch": 2165} {"train_loss": -43.2894401550293, "global_step": 262017, "epoch": 2165} {"train_loss": -43.2396240234375, "global_step": 262018, "epoch": 2165} {"train_loss": -42.6043586730957, "global_step": 262019, "epoch": 2165} {"train_loss": -42.63433837890625, "global_step": 262020, "epoch": 2165} {"train_loss": -42.607723236083984, "global_step": 262021, "epoch": 2165} {"train_loss": -43.20372009277344, "global_step": 262022, "epoch": 2165} {"train_loss": -41.19205856323242, "global_step": 262023, "epoch": 2165} {"train_loss": -38.51234436035156, "global_step": 262024, "epoch": 2165} {"train_loss": -41.76777267456055, "global_step": 262025, "epoch": 2165} {"train_loss": -42.939430236816406, "global_step": 262026, "epoch": 2165} {"train_loss": -42.62984848022461, "global_step": 262027, "epoch": 2165} {"train_loss": -43.03315734863281, "global_step": 262028, "epoch": 2165} {"train_loss": -43.01627731323242, "global_step": 262029, "epoch": 2165} {"train_loss": -38.90822219848633, "global_step": 262030, "epoch": 2165} {"train_loss": -41.92873001098633, "global_step": 262031, "epoch": 2165} {"train_loss": -38.19781494140625, "global_step": 262032, "epoch": 2165} {"train_loss": -40.86385726928711, "global_step": 262033, "epoch": 2165} {"train_loss": -39.7596549987793, "global_step": 262034, "epoch": 2165} {"train_loss": -39.17678451538086, "global_step": 262035, "epoch": 2165} {"train_loss": -38.510223388671875, "global_step": 262036, "epoch": 2165} {"train_loss": -37.10345458984375, "global_step": 262037, "epoch": 2165} {"train_loss": -37.42597198486328, "global_step": 262038, "epoch": 2165} {"train_loss": -40.237117767333984, "global_step": 262039, "epoch": 2165} {"train_loss": -41.22825241088867, "global_step": 262040, "epoch": 2165} {"train_loss": -39.8365478515625, "global_step": 262041, "epoch": 2165} {"train_loss": -40.01826858520508, "global_step": 262042, "epoch": 2165} {"train_loss": -42.39548110961914, "global_step": 262043, "epoch": 2165} {"train_loss": -40.5481071472168, "global_step": 262044, "epoch": 2165} {"train_loss": -40.622650146484375, "global_step": 262045, "epoch": 2165} {"train_loss": -37.89058303833008, "global_step": 262046, "epoch": 2165} {"train_loss": -39.777767181396484, "global_step": 262047, "epoch": 2165} {"train_loss": -40.27726745605469, "global_step": 262048, "epoch": 2165} {"train_loss": -40.6395263671875, "global_step": 262049, "epoch": 2165} {"train_loss": -41.09497833251953, "global_step": 262050, "epoch": 2165} {"train_loss": -40.83881759643555, "global_step": 262051, "epoch": 2165} {"train_loss": -40.355464935302734, "global_step": 262052, "epoch": 2165} {"train_loss": -39.61299133300781, "global_step": 262053, "epoch": 2165} {"train_loss": -38.64299392700195, "global_step": 262054, "epoch": 2165} {"train_loss": -40.259765625, "global_step": 262055, "epoch": 2165} {"train_loss": -37.19739532470703, "global_step": 262056, "epoch": 2165} {"train_loss": -27.69930076599121, "global_step": 262057, "epoch": 2165} {"train_loss": -40.19704818725586, "global_step": 262058, "epoch": 2165} {"train_loss": -40.697776794433594, "global_step": 262059, "epoch": 2165} {"train_loss": -40.59622573852539, "global_step": 262060, "epoch": 2165} {"train_loss": -40.6363525390625, "global_step": 262061, "epoch": 2165} {"train_loss": -40.8531494140625, "global_step": 262062, "epoch": 2165} {"train_loss": -39.7614860534668, "global_step": 262063, "epoch": 2165} {"train_loss": -39.174068450927734, "global_step": 262064, "epoch": 2165} {"train_loss": -41.491798400878906, "global_step": 262065, "epoch": 2165} {"train_loss": -37.75967788696289, "global_step": 262066, "epoch": 2165} {"train_loss": -41.18220138549805, "global_step": 262067, "epoch": 2165} {"train_loss": -40.059242248535156, "global_step": 262068, "epoch": 2165} {"train_loss": -39.753631591796875, "global_step": 262069, "epoch": 2165} {"train_loss": -41.340084075927734, "global_step": 262070, "epoch": 2165} {"train_loss": -40.581356048583984, "global_step": 262071, "epoch": 2165} {"train_loss": -40.8783073425293, "global_step": 262072, "epoch": 2165} {"train_loss": -42.11145782470703, "global_step": 262073, "epoch": 2165} {"train_loss": -41.815067291259766, "global_step": 262074, "epoch": 2165} {"train_loss": -38.7171745300293, "global_step": 262075, "epoch": 2165} {"train_loss": -36.39901351928711, "global_step": 262076, "epoch": 2165} {"train_loss": -40.68747329711914, "global_step": 262077, "epoch": 2165} {"train_loss": -41.1150016784668, "global_step": 262078, "epoch": 2165} {"train_loss": -40.568687438964844, "global_step": 262079, "epoch": 2165} {"train_loss": -40.816932678222656, "global_step": 262080, "epoch": 2165} {"train_loss": -42.17107391357422, "global_step": 262081, "epoch": 2165} {"train_loss": -42.02878952026367, "global_step": 262082, "epoch": 2165} {"train_loss": -41.95966720581055, "global_step": 262083, "epoch": 2165} {"train_loss": -41.63971710205078, "global_step": 262084, "epoch": 2165} {"train_loss": -41.16282756269471, "global_step": 262085, "epoch": 2165, "val_loss": 3336880.0} {"train_loss": -42.11216354370117, "global_step": 262086, "epoch": 2166} {"train_loss": -42.48221969604492, "global_step": 262087, "epoch": 2166} {"train_loss": -42.546512603759766, "global_step": 262088, "epoch": 2166} {"train_loss": -42.28789138793945, "global_step": 262089, "epoch": 2166} {"train_loss": -41.680599212646484, "global_step": 262090, "epoch": 2166} {"train_loss": -41.537330627441406, "global_step": 262091, "epoch": 2166} {"train_loss": -41.37535095214844, "global_step": 262092, "epoch": 2166} {"train_loss": -42.712318420410156, "global_step": 262093, "epoch": 2166} {"train_loss": -41.624935150146484, "global_step": 262094, "epoch": 2166} {"train_loss": -42.172210693359375, "global_step": 262095, "epoch": 2166} {"train_loss": -40.29471206665039, "global_step": 262096, "epoch": 2166} {"train_loss": -42.08209228515625, "global_step": 262097, "epoch": 2166} {"train_loss": -42.00929260253906, "global_step": 262098, "epoch": 2166} {"train_loss": -42.63874053955078, "global_step": 262099, "epoch": 2166} {"train_loss": -42.695430755615234, "global_step": 262100, "epoch": 2166} {"train_loss": -41.76106262207031, "global_step": 262101, "epoch": 2166} {"train_loss": -41.949031829833984, "global_step": 262102, "epoch": 2166} {"train_loss": -43.1647834777832, "global_step": 262103, "epoch": 2166} {"train_loss": -42.374671936035156, "global_step": 262104, "epoch": 2166} {"train_loss": -41.79290771484375, "global_step": 262105, "epoch": 2166} {"train_loss": -42.99504470825195, "global_step": 262106, "epoch": 2166} {"train_loss": -42.21461486816406, "global_step": 262107, "epoch": 2166} {"train_loss": -42.36049270629883, "global_step": 262108, "epoch": 2166} {"train_loss": -42.13917541503906, "global_step": 262109, "epoch": 2166} {"train_loss": -42.2396354675293, "global_step": 262110, "epoch": 2166} {"train_loss": -42.59022903442383, "global_step": 262111, "epoch": 2166} {"train_loss": -42.65346908569336, "global_step": 262112, "epoch": 2166} {"train_loss": -42.9467887878418, "global_step": 262113, "epoch": 2166} {"train_loss": -42.72050476074219, "global_step": 262114, "epoch": 2166} {"train_loss": -40.44294357299805, "global_step": 262115, "epoch": 2166} {"train_loss": -42.54273223876953, "global_step": 262116, "epoch": 2166} {"train_loss": -42.464195251464844, "global_step": 262117, "epoch": 2166} {"train_loss": -42.560821533203125, "global_step": 262118, "epoch": 2166} {"train_loss": -43.263607025146484, "global_step": 262119, "epoch": 2166} {"train_loss": -42.819305419921875, "global_step": 262120, "epoch": 2166} {"train_loss": -42.92289352416992, "global_step": 262121, "epoch": 2166} {"train_loss": -43.321990966796875, "global_step": 262122, "epoch": 2166} {"train_loss": -42.82772445678711, "global_step": 262123, "epoch": 2166} {"train_loss": -42.2703742980957, "global_step": 262124, "epoch": 2166} {"train_loss": -42.69721603393555, "global_step": 262125, "epoch": 2166} {"train_loss": -43.25865173339844, "global_step": 262126, "epoch": 2166} {"train_loss": -41.7620849609375, "global_step": 262127, "epoch": 2166} {"train_loss": -43.45412826538086, "global_step": 262128, "epoch": 2166} {"train_loss": -43.550209045410156, "global_step": 262129, "epoch": 2166} {"train_loss": -41.37437057495117, "global_step": 262130, "epoch": 2166} {"train_loss": -42.49160385131836, "global_step": 262131, "epoch": 2166} {"train_loss": -43.3509407043457, "global_step": 262132, "epoch": 2166} {"train_loss": -42.5008430480957, "global_step": 262133, "epoch": 2166} {"train_loss": -42.752655029296875, "global_step": 262134, "epoch": 2166} {"train_loss": -42.76405715942383, "global_step": 262135, "epoch": 2166} {"train_loss": -42.03628921508789, "global_step": 262136, "epoch": 2166} {"train_loss": -43.55439758300781, "global_step": 262137, "epoch": 2166} {"train_loss": -42.461273193359375, "global_step": 262138, "epoch": 2166} {"train_loss": -42.49949264526367, "global_step": 262139, "epoch": 2166} {"train_loss": -43.22803497314453, "global_step": 262140, "epoch": 2166} {"train_loss": -43.053993225097656, "global_step": 262141, "epoch": 2166} {"train_loss": -42.1511344909668, "global_step": 262142, "epoch": 2166} {"train_loss": -42.26602554321289, "global_step": 262143, "epoch": 2166} {"train_loss": -43.30611038208008, "global_step": 262144, "epoch": 2166} {"train_loss": -42.5926399230957, "global_step": 262145, "epoch": 2166} {"train_loss": -43.286781311035156, "global_step": 262146, "epoch": 2166} {"train_loss": -42.97774887084961, "global_step": 262147, "epoch": 2166} {"train_loss": -43.14237594604492, "global_step": 262148, "epoch": 2166} {"train_loss": -42.83355712890625, "global_step": 262149, "epoch": 2166} {"train_loss": -42.97957992553711, "global_step": 262150, "epoch": 2166} {"train_loss": -42.58611297607422, "global_step": 262151, "epoch": 2166} {"train_loss": -43.10799789428711, "global_step": 262152, "epoch": 2166} {"train_loss": -43.18988800048828, "global_step": 262153, "epoch": 2166} {"train_loss": -42.979854583740234, "global_step": 262154, "epoch": 2166} {"train_loss": -43.56582260131836, "global_step": 262155, "epoch": 2166} {"train_loss": -43.066650390625, "global_step": 262156, "epoch": 2166} {"train_loss": -42.947784423828125, "global_step": 262157, "epoch": 2166} {"train_loss": -42.32558059692383, "global_step": 262158, "epoch": 2166} {"train_loss": -42.416786193847656, "global_step": 262159, "epoch": 2166} {"train_loss": -42.59755325317383, "global_step": 262160, "epoch": 2166} {"train_loss": -42.34558868408203, "global_step": 262161, "epoch": 2166} {"train_loss": -42.46892547607422, "global_step": 262162, "epoch": 2166} {"train_loss": -43.42939376831055, "global_step": 262163, "epoch": 2166} {"train_loss": -43.565731048583984, "global_step": 262164, "epoch": 2166} {"train_loss": -42.83615493774414, "global_step": 262165, "epoch": 2166} {"train_loss": -42.882991790771484, "global_step": 262166, "epoch": 2166} {"train_loss": -42.64887237548828, "global_step": 262167, "epoch": 2166} {"train_loss": -43.43034362792969, "global_step": 262168, "epoch": 2166} {"train_loss": -42.458526611328125, "global_step": 262169, "epoch": 2166} {"train_loss": -42.258060455322266, "global_step": 262170, "epoch": 2166} {"train_loss": -42.62512969970703, "global_step": 262171, "epoch": 2166} {"train_loss": -42.4015998840332, "global_step": 262172, "epoch": 2166} {"train_loss": -41.93739700317383, "global_step": 262173, "epoch": 2166} {"train_loss": -41.85750961303711, "global_step": 262174, "epoch": 2166} {"train_loss": -42.50737380981445, "global_step": 262175, "epoch": 2166} {"train_loss": -42.922935485839844, "global_step": 262176, "epoch": 2166} {"train_loss": -41.39705276489258, "global_step": 262177, "epoch": 2166} {"train_loss": -42.8322868347168, "global_step": 262178, "epoch": 2166} {"train_loss": -43.60708236694336, "global_step": 262179, "epoch": 2166} {"train_loss": -41.70840072631836, "global_step": 262180, "epoch": 2166} {"train_loss": -41.305301666259766, "global_step": 262181, "epoch": 2166} {"train_loss": -41.913211822509766, "global_step": 262182, "epoch": 2166} {"train_loss": -43.148475646972656, "global_step": 262183, "epoch": 2166} {"train_loss": -43.18046188354492, "global_step": 262184, "epoch": 2166} {"train_loss": -42.50029373168945, "global_step": 262185, "epoch": 2166} {"train_loss": -42.95432662963867, "global_step": 262186, "epoch": 2166} {"train_loss": -43.28435134887695, "global_step": 262187, "epoch": 2166} {"train_loss": -42.2701530456543, "global_step": 262188, "epoch": 2166} {"train_loss": -41.695987701416016, "global_step": 262189, "epoch": 2166} {"train_loss": -41.73811721801758, "global_step": 262190, "epoch": 2166} {"train_loss": -42.59932327270508, "global_step": 262191, "epoch": 2166} {"train_loss": -42.26093292236328, "global_step": 262192, "epoch": 2166} {"train_loss": -41.90439224243164, "global_step": 262193, "epoch": 2166} {"train_loss": -43.26255416870117, "global_step": 262194, "epoch": 2166} {"train_loss": -42.66144943237305, "global_step": 262195, "epoch": 2166} {"train_loss": -41.70296859741211, "global_step": 262196, "epoch": 2166} {"train_loss": -42.750484466552734, "global_step": 262197, "epoch": 2166} {"train_loss": -42.464080810546875, "global_step": 262198, "epoch": 2166} {"train_loss": -41.88640213012695, "global_step": 262199, "epoch": 2166} {"train_loss": -42.205440521240234, "global_step": 262200, "epoch": 2166} {"train_loss": -42.61048889160156, "global_step": 262201, "epoch": 2166} {"train_loss": -40.79911422729492, "global_step": 262202, "epoch": 2166} {"train_loss": -41.11912155151367, "global_step": 262203, "epoch": 2166} {"train_loss": -43.13838577270508, "global_step": 262204, "epoch": 2166} {"train_loss": -43.1865234375, "global_step": 262205, "epoch": 2166} {"train_loss": -42.50828810762768, "global_step": 262206, "epoch": 2166, "val_loss": 2649932.25} {"train_loss": -43.0236930847168, "global_step": 262207, "epoch": 2167} {"train_loss": -41.6694450378418, "global_step": 262208, "epoch": 2167} {"train_loss": -42.48469924926758, "global_step": 262209, "epoch": 2167} {"train_loss": -42.47319412231445, "global_step": 262210, "epoch": 2167} {"train_loss": -41.97080612182617, "global_step": 262211, "epoch": 2167} {"train_loss": -41.966758728027344, "global_step": 262212, "epoch": 2167} {"train_loss": -41.283302307128906, "global_step": 262213, "epoch": 2167} {"train_loss": -41.996700286865234, "global_step": 262214, "epoch": 2167} {"train_loss": -42.34725570678711, "global_step": 262215, "epoch": 2167} {"train_loss": -42.77231216430664, "global_step": 262216, "epoch": 2167} {"train_loss": -41.74183654785156, "global_step": 262217, "epoch": 2167} {"train_loss": -41.653865814208984, "global_step": 262218, "epoch": 2167} {"train_loss": -42.76992416381836, "global_step": 262219, "epoch": 2167} {"train_loss": -43.216976165771484, "global_step": 262220, "epoch": 2167} {"train_loss": -42.5220832824707, "global_step": 262221, "epoch": 2167} {"train_loss": -42.60883331298828, "global_step": 262222, "epoch": 2167} {"train_loss": -42.79276657104492, "global_step": 262223, "epoch": 2167} {"train_loss": -42.62053680419922, "global_step": 262224, "epoch": 2167} {"train_loss": -42.79961013793945, "global_step": 262225, "epoch": 2167} {"train_loss": -43.334163665771484, "global_step": 262226, "epoch": 2167} {"train_loss": -43.23060607910156, "global_step": 262227, "epoch": 2167} {"train_loss": -43.16376876831055, "global_step": 262228, "epoch": 2167} {"train_loss": -42.787269592285156, "global_step": 262229, "epoch": 2167} {"train_loss": -43.351036071777344, "global_step": 262230, "epoch": 2167} {"train_loss": -43.94899368286133, "global_step": 262231, "epoch": 2167} {"train_loss": -43.299259185791016, "global_step": 262232, "epoch": 2167} {"train_loss": -42.533565521240234, "global_step": 262233, "epoch": 2167} {"train_loss": -42.413021087646484, "global_step": 262234, "epoch": 2167} {"train_loss": -43.879581451416016, "global_step": 262235, "epoch": 2167} {"train_loss": -43.10493087768555, "global_step": 262236, "epoch": 2167} {"train_loss": -41.85393524169922, "global_step": 262237, "epoch": 2167} {"train_loss": -42.410579681396484, "global_step": 262238, "epoch": 2167} {"train_loss": -42.89946746826172, "global_step": 262239, "epoch": 2167} {"train_loss": -42.74842834472656, "global_step": 262240, "epoch": 2167} {"train_loss": -42.73099136352539, "global_step": 262241, "epoch": 2167} {"train_loss": -43.176513671875, "global_step": 262242, "epoch": 2167} {"train_loss": -42.00197982788086, "global_step": 262243, "epoch": 2167} {"train_loss": -41.2587776184082, "global_step": 262244, "epoch": 2167} {"train_loss": -42.326995849609375, "global_step": 262245, "epoch": 2167} {"train_loss": -42.267494201660156, "global_step": 262246, "epoch": 2167} {"train_loss": -41.854496002197266, "global_step": 262247, "epoch": 2167} {"train_loss": -41.76082992553711, "global_step": 262248, "epoch": 2167} {"train_loss": -42.72811508178711, "global_step": 262249, "epoch": 2167} {"train_loss": -42.896942138671875, "global_step": 262250, "epoch": 2167} {"train_loss": -42.412227630615234, "global_step": 262251, "epoch": 2167} {"train_loss": -42.499603271484375, "global_step": 262252, "epoch": 2167} {"train_loss": -43.67217254638672, "global_step": 262253, "epoch": 2167} {"train_loss": -43.446205139160156, "global_step": 262254, "epoch": 2167} {"train_loss": -42.18918991088867, "global_step": 262255, "epoch": 2167} {"train_loss": -43.51422119140625, "global_step": 262256, "epoch": 2167} {"train_loss": -43.24612808227539, "global_step": 262257, "epoch": 2167} {"train_loss": -42.73329544067383, "global_step": 262258, "epoch": 2167} {"train_loss": -43.02022933959961, "global_step": 262259, "epoch": 2167} {"train_loss": -42.73609161376953, "global_step": 262260, "epoch": 2167} {"train_loss": -43.18309020996094, "global_step": 262261, "epoch": 2167} {"train_loss": -43.23786163330078, "global_step": 262262, "epoch": 2167} {"train_loss": -42.55116653442383, "global_step": 262263, "epoch": 2167} {"train_loss": -43.402801513671875, "global_step": 262264, "epoch": 2167} {"train_loss": -42.81748962402344, "global_step": 262265, "epoch": 2167} {"train_loss": -43.180660247802734, "global_step": 262266, "epoch": 2167} {"train_loss": -42.88204574584961, "global_step": 262267, "epoch": 2167} {"train_loss": -42.53557205200195, "global_step": 262268, "epoch": 2167} {"train_loss": -43.14966583251953, "global_step": 262269, "epoch": 2167} {"train_loss": -43.04508590698242, "global_step": 262270, "epoch": 2167} {"train_loss": -41.3283576965332, "global_step": 262271, "epoch": 2167} {"train_loss": -42.20781326293945, "global_step": 262272, "epoch": 2167} {"train_loss": -41.891117095947266, "global_step": 262273, "epoch": 2167} {"train_loss": -42.3451042175293, "global_step": 262274, "epoch": 2167} {"train_loss": -43.50407791137695, "global_step": 262275, "epoch": 2167} {"train_loss": -41.87409973144531, "global_step": 262276, "epoch": 2167} {"train_loss": -42.494197845458984, "global_step": 262277, "epoch": 2167} {"train_loss": -42.54132080078125, "global_step": 262278, "epoch": 2167} {"train_loss": -42.65353012084961, "global_step": 262279, "epoch": 2167} {"train_loss": -42.40279006958008, "global_step": 262280, "epoch": 2167} {"train_loss": -40.736297607421875, "global_step": 262281, "epoch": 2167} {"train_loss": -39.86774826049805, "global_step": 262282, "epoch": 2167} {"train_loss": -40.20269775390625, "global_step": 262283, "epoch": 2167} {"train_loss": -42.77736282348633, "global_step": 262284, "epoch": 2167} {"train_loss": -41.080806732177734, "global_step": 262285, "epoch": 2167} {"train_loss": -35.44370651245117, "global_step": 262286, "epoch": 2167} {"train_loss": -36.76298141479492, "global_step": 262287, "epoch": 2167} {"train_loss": -39.260353088378906, "global_step": 262288, "epoch": 2167} {"train_loss": -41.98309326171875, "global_step": 262289, "epoch": 2167} {"train_loss": -39.979705810546875, "global_step": 262290, "epoch": 2167} {"train_loss": -39.97993087768555, "global_step": 262291, "epoch": 2167} {"train_loss": -42.10413360595703, "global_step": 262292, "epoch": 2167} {"train_loss": -40.49229431152344, "global_step": 262293, "epoch": 2167} {"train_loss": -39.60086441040039, "global_step": 262294, "epoch": 2167} {"train_loss": -41.80837631225586, "global_step": 262295, "epoch": 2167} {"train_loss": -39.42634582519531, "global_step": 262296, "epoch": 2167} {"train_loss": -40.66943359375, "global_step": 262297, "epoch": 2167} {"train_loss": -40.48027038574219, "global_step": 262298, "epoch": 2167} {"train_loss": -40.69732666015625, "global_step": 262299, "epoch": 2167} {"train_loss": -40.949459075927734, "global_step": 262300, "epoch": 2167} {"train_loss": -40.37632369995117, "global_step": 262301, "epoch": 2167} {"train_loss": -41.15902328491211, "global_step": 262302, "epoch": 2167} {"train_loss": -40.9359245300293, "global_step": 262303, "epoch": 2167} {"train_loss": -41.358341217041016, "global_step": 262304, "epoch": 2167} {"train_loss": -41.449241638183594, "global_step": 262305, "epoch": 2167} {"train_loss": -41.74141311645508, "global_step": 262306, "epoch": 2167} {"train_loss": -41.393043518066406, "global_step": 262307, "epoch": 2167} {"train_loss": -42.28157424926758, "global_step": 262308, "epoch": 2167} {"train_loss": -42.04081344604492, "global_step": 262309, "epoch": 2167} {"train_loss": -42.115779876708984, "global_step": 262310, "epoch": 2167} {"train_loss": -42.83155822753906, "global_step": 262311, "epoch": 2167} {"train_loss": -42.15403366088867, "global_step": 262312, "epoch": 2167} {"train_loss": -42.738807678222656, "global_step": 262313, "epoch": 2167} {"train_loss": -42.88261032104492, "global_step": 262314, "epoch": 2167} {"train_loss": -42.810970306396484, "global_step": 262315, "epoch": 2167} {"train_loss": -42.94963073730469, "global_step": 262316, "epoch": 2167} {"train_loss": -42.633846282958984, "global_step": 262317, "epoch": 2167} {"train_loss": -42.1462516784668, "global_step": 262318, "epoch": 2167} {"train_loss": -42.923675537109375, "global_step": 262319, "epoch": 2167} {"train_loss": -43.28877639770508, "global_step": 262320, "epoch": 2167} {"train_loss": -42.29734802246094, "global_step": 262321, "epoch": 2167} {"train_loss": -43.17099380493164, "global_step": 262322, "epoch": 2167} {"train_loss": -43.304786682128906, "global_step": 262323, "epoch": 2167} {"train_loss": -43.3382453918457, "global_step": 262324, "epoch": 2167} {"train_loss": -43.148494720458984, "global_step": 262325, "epoch": 2167} {"train_loss": -43.28947830200195, "global_step": 262326, "epoch": 2167} {"train_loss": -42.177457226209405, "global_step": 262327, "epoch": 2167, "val_loss": 2606698.75} {"train_loss": -42.70357894897461, "global_step": 262328, "epoch": 2168} {"train_loss": -43.05379867553711, "global_step": 262329, "epoch": 2168} {"train_loss": -43.13521957397461, "global_step": 262330, "epoch": 2168} {"train_loss": -43.05314254760742, "global_step": 262331, "epoch": 2168} {"train_loss": -43.01191329956055, "global_step": 262332, "epoch": 2168} {"train_loss": -43.03046798706055, "global_step": 262333, "epoch": 2168} {"train_loss": -43.4112548828125, "global_step": 262334, "epoch": 2168} {"train_loss": -43.49394226074219, "global_step": 262335, "epoch": 2168} {"train_loss": -43.756099700927734, "global_step": 262336, "epoch": 2168} {"train_loss": -43.1616325378418, "global_step": 262337, "epoch": 2168} {"train_loss": -42.87777328491211, "global_step": 262338, "epoch": 2168} {"train_loss": -43.902957916259766, "global_step": 262339, "epoch": 2168} {"train_loss": -43.631526947021484, "global_step": 262340, "epoch": 2168} {"train_loss": -43.519081115722656, "global_step": 262341, "epoch": 2168} {"train_loss": -43.336429595947266, "global_step": 262342, "epoch": 2168} {"train_loss": -43.411720275878906, "global_step": 262343, "epoch": 2168} {"train_loss": -43.272945404052734, "global_step": 262344, "epoch": 2168} {"train_loss": -43.48501205444336, "global_step": 262345, "epoch": 2168} {"train_loss": -43.549102783203125, "global_step": 262346, "epoch": 2168} {"train_loss": -43.582054138183594, "global_step": 262347, "epoch": 2168} {"train_loss": -43.26859664916992, "global_step": 262348, "epoch": 2168} {"train_loss": -43.28190231323242, "global_step": 262349, "epoch": 2168} {"train_loss": -43.36773681640625, "global_step": 262350, "epoch": 2168} {"train_loss": -43.608985900878906, "global_step": 262351, "epoch": 2168} {"train_loss": -43.71376037597656, "global_step": 262352, "epoch": 2168} {"train_loss": -44.311397552490234, "global_step": 262353, "epoch": 2168} {"train_loss": -43.80457305908203, "global_step": 262354, "epoch": 2168} {"train_loss": -43.517757415771484, "global_step": 262355, "epoch": 2168} {"train_loss": -43.87841796875, "global_step": 262356, "epoch": 2168} {"train_loss": -43.812469482421875, "global_step": 262357, "epoch": 2168} {"train_loss": -43.790889739990234, "global_step": 262358, "epoch": 2168} {"train_loss": -43.475738525390625, "global_step": 262359, "epoch": 2168} {"train_loss": -43.69175338745117, "global_step": 262360, "epoch": 2168} {"train_loss": -43.523475646972656, "global_step": 262361, "epoch": 2168} {"train_loss": -43.73246383666992, "global_step": 262362, "epoch": 2168} {"train_loss": -43.45756149291992, "global_step": 262363, "epoch": 2168} {"train_loss": -42.525718688964844, "global_step": 262364, "epoch": 2168} {"train_loss": -43.51295852661133, "global_step": 262365, "epoch": 2168} {"train_loss": -43.86530685424805, "global_step": 262366, "epoch": 2168} {"train_loss": -43.03212356567383, "global_step": 262367, "epoch": 2168} {"train_loss": -43.253108978271484, "global_step": 262368, "epoch": 2168} {"train_loss": -43.57062911987305, "global_step": 262369, "epoch": 2168} {"train_loss": -41.28713607788086, "global_step": 262370, "epoch": 2168} {"train_loss": -41.63257598876953, "global_step": 262371, "epoch": 2168} {"train_loss": -43.73643112182617, "global_step": 262372, "epoch": 2168} {"train_loss": -43.370399475097656, "global_step": 262373, "epoch": 2168} {"train_loss": -40.11552047729492, "global_step": 262374, "epoch": 2168} {"train_loss": -42.07998275756836, "global_step": 262375, "epoch": 2168} {"train_loss": -42.85885238647461, "global_step": 262376, "epoch": 2168} {"train_loss": -42.150970458984375, "global_step": 262377, "epoch": 2168} {"train_loss": -40.582332611083984, "global_step": 262378, "epoch": 2168} {"train_loss": -42.33095169067383, "global_step": 262379, "epoch": 2168} {"train_loss": -42.4640007019043, "global_step": 262380, "epoch": 2168} {"train_loss": -42.36236572265625, "global_step": 262381, "epoch": 2168} {"train_loss": -39.681922912597656, "global_step": 262382, "epoch": 2168} {"train_loss": -39.6055793762207, "global_step": 262383, "epoch": 2168} {"train_loss": -41.29785919189453, "global_step": 262384, "epoch": 2168} {"train_loss": -41.76231002807617, "global_step": 262385, "epoch": 2168} {"train_loss": -39.638755798339844, "global_step": 262386, "epoch": 2168} {"train_loss": -42.1907958984375, "global_step": 262387, "epoch": 2168} {"train_loss": -42.18061828613281, "global_step": 262388, "epoch": 2168} {"train_loss": -41.135528564453125, "global_step": 262389, "epoch": 2168} {"train_loss": -41.974735260009766, "global_step": 262390, "epoch": 2168} {"train_loss": -42.638641357421875, "global_step": 262391, "epoch": 2168} {"train_loss": -42.4150276184082, "global_step": 262392, "epoch": 2168} {"train_loss": -42.122802734375, "global_step": 262393, "epoch": 2168} {"train_loss": -41.1531982421875, "global_step": 262394, "epoch": 2168} {"train_loss": -42.264583587646484, "global_step": 262395, "epoch": 2168} {"train_loss": -40.95965576171875, "global_step": 262396, "epoch": 2168} {"train_loss": -42.45219039916992, "global_step": 262397, "epoch": 2168} {"train_loss": -41.70249557495117, "global_step": 262398, "epoch": 2168} {"train_loss": -42.49519729614258, "global_step": 262399, "epoch": 2168} {"train_loss": -41.6693000793457, "global_step": 262400, "epoch": 2168} {"train_loss": -41.23136520385742, "global_step": 262401, "epoch": 2168} {"train_loss": -41.41170120239258, "global_step": 262402, "epoch": 2168} {"train_loss": -40.16013717651367, "global_step": 262403, "epoch": 2168} {"train_loss": -40.844539642333984, "global_step": 262404, "epoch": 2168} {"train_loss": -42.068641662597656, "global_step": 262405, "epoch": 2168} {"train_loss": -41.992122650146484, "global_step": 262406, "epoch": 2168} {"train_loss": -41.55060577392578, "global_step": 262407, "epoch": 2168} {"train_loss": -40.68650436401367, "global_step": 262408, "epoch": 2168} {"train_loss": -40.02537155151367, "global_step": 262409, "epoch": 2168} {"train_loss": -39.58005905151367, "global_step": 262410, "epoch": 2168} {"train_loss": -39.9389533996582, "global_step": 262411, "epoch": 2168} {"train_loss": -36.225730895996094, "global_step": 262412, "epoch": 2168} {"train_loss": -39.70226287841797, "global_step": 262413, "epoch": 2168} {"train_loss": -42.554847717285156, "global_step": 262414, "epoch": 2168} {"train_loss": -42.38440704345703, "global_step": 262415, "epoch": 2168} {"train_loss": -41.74454879760742, "global_step": 262416, "epoch": 2168} {"train_loss": -40.62258529663086, "global_step": 262417, "epoch": 2168} {"train_loss": -32.13137435913086, "global_step": 262418, "epoch": 2168} {"train_loss": -42.229164123535156, "global_step": 262419, "epoch": 2168} {"train_loss": -42.509132385253906, "global_step": 262420, "epoch": 2168} {"train_loss": -42.04490280151367, "global_step": 262421, "epoch": 2168} {"train_loss": -42.07737350463867, "global_step": 262422, "epoch": 2168} {"train_loss": -42.207122802734375, "global_step": 262423, "epoch": 2168} {"train_loss": -42.646514892578125, "global_step": 262424, "epoch": 2168} {"train_loss": -42.3277702331543, "global_step": 262425, "epoch": 2168} {"train_loss": -33.853126525878906, "global_step": 262426, "epoch": 2168} {"train_loss": -35.670799255371094, "global_step": 262427, "epoch": 2168} {"train_loss": -41.9610710144043, "global_step": 262428, "epoch": 2168} {"train_loss": -41.231300354003906, "global_step": 262429, "epoch": 2168} {"train_loss": -42.106719970703125, "global_step": 262430, "epoch": 2168} {"train_loss": -40.584205627441406, "global_step": 262431, "epoch": 2168} {"train_loss": -41.73696517944336, "global_step": 262432, "epoch": 2168} {"train_loss": -42.25578689575195, "global_step": 262433, "epoch": 2168} {"train_loss": -41.73652648925781, "global_step": 262434, "epoch": 2168} {"train_loss": -41.78629684448242, "global_step": 262435, "epoch": 2168} {"train_loss": -41.74147415161133, "global_step": 262436, "epoch": 2168} {"train_loss": -41.54513168334961, "global_step": 262437, "epoch": 2168} {"train_loss": -42.3729133605957, "global_step": 262438, "epoch": 2168} {"train_loss": -42.112274169921875, "global_step": 262439, "epoch": 2168} {"train_loss": -41.065059661865234, "global_step": 262440, "epoch": 2168} {"train_loss": -42.40399169921875, "global_step": 262441, "epoch": 2168} {"train_loss": -39.54745864868164, "global_step": 262442, "epoch": 2168} {"train_loss": -42.017459869384766, "global_step": 262443, "epoch": 2168} {"train_loss": -38.791324615478516, "global_step": 262444, "epoch": 2168} {"train_loss": -39.9850959777832, "global_step": 262445, "epoch": 2168} {"train_loss": -42.65102005004883, "global_step": 262446, "epoch": 2168} {"train_loss": -42.1611442565918, "global_step": 262447, "epoch": 2168} {"train_loss": -41.9861605305317, "global_step": 262448, "epoch": 2168, "val_loss": 2673580.75} {"train_loss": -42.76819610595703, "global_step": 262449, "epoch": 2169} {"train_loss": -42.491329193115234, "global_step": 262450, "epoch": 2169} {"train_loss": -42.966941833496094, "global_step": 262451, "epoch": 2169} {"train_loss": -42.422203063964844, "global_step": 262452, "epoch": 2169} {"train_loss": -40.27640914916992, "global_step": 262453, "epoch": 2169} {"train_loss": -41.297306060791016, "global_step": 262454, "epoch": 2169} {"train_loss": -42.21981430053711, "global_step": 262455, "epoch": 2169} {"train_loss": -43.236026763916016, "global_step": 262456, "epoch": 2169} {"train_loss": -42.63179016113281, "global_step": 262457, "epoch": 2169} {"train_loss": -41.85061264038086, "global_step": 262458, "epoch": 2169} {"train_loss": -42.77473831176758, "global_step": 262459, "epoch": 2169} {"train_loss": -42.69256591796875, "global_step": 262460, "epoch": 2169} {"train_loss": -42.365386962890625, "global_step": 262461, "epoch": 2169} {"train_loss": -33.049320220947266, "global_step": 262462, "epoch": 2169} {"train_loss": -41.55861282348633, "global_step": 262463, "epoch": 2169} {"train_loss": -42.324462890625, "global_step": 262464, "epoch": 2169} {"train_loss": -37.654788970947266, "global_step": 262465, "epoch": 2169} {"train_loss": -42.18154525756836, "global_step": 262466, "epoch": 2169} {"train_loss": -37.59884262084961, "global_step": 262467, "epoch": 2169} {"train_loss": -40.04936599731445, "global_step": 262468, "epoch": 2169} {"train_loss": -41.28730392456055, "global_step": 262469, "epoch": 2169} {"train_loss": -40.70383834838867, "global_step": 262470, "epoch": 2169} {"train_loss": -42.2185173034668, "global_step": 262471, "epoch": 2169} {"train_loss": -41.1638298034668, "global_step": 262472, "epoch": 2169} {"train_loss": -41.618709564208984, "global_step": 262473, "epoch": 2169} {"train_loss": -42.14683151245117, "global_step": 262474, "epoch": 2169} {"train_loss": -41.317684173583984, "global_step": 262475, "epoch": 2169} {"train_loss": -42.71318435668945, "global_step": 262476, "epoch": 2169} {"train_loss": -42.48768997192383, "global_step": 262477, "epoch": 2169} {"train_loss": -42.33533477783203, "global_step": 262478, "epoch": 2169} {"train_loss": -38.949859619140625, "global_step": 262479, "epoch": 2169} {"train_loss": -41.97119140625, "global_step": 262480, "epoch": 2169} {"train_loss": -41.24904251098633, "global_step": 262481, "epoch": 2169} {"train_loss": -40.07375717163086, "global_step": 262482, "epoch": 2169} {"train_loss": -41.709686279296875, "global_step": 262483, "epoch": 2169} {"train_loss": -42.48929214477539, "global_step": 262484, "epoch": 2169} {"train_loss": -42.39622116088867, "global_step": 262485, "epoch": 2169} {"train_loss": -43.230567932128906, "global_step": 262486, "epoch": 2169} {"train_loss": -39.405338287353516, "global_step": 262487, "epoch": 2169} {"train_loss": -43.23575973510742, "global_step": 262488, "epoch": 2169} {"train_loss": -40.768829345703125, "global_step": 262489, "epoch": 2169} {"train_loss": -41.17151641845703, "global_step": 262490, "epoch": 2169} {"train_loss": -39.404117584228516, "global_step": 262491, "epoch": 2169} {"train_loss": -43.064666748046875, "global_step": 262492, "epoch": 2169} {"train_loss": -38.96702194213867, "global_step": 262493, "epoch": 2169} {"train_loss": -36.90224075317383, "global_step": 262494, "epoch": 2169} {"train_loss": -40.3785285949707, "global_step": 262495, "epoch": 2169} {"train_loss": -42.997596740722656, "global_step": 262496, "epoch": 2169} {"train_loss": -41.10878372192383, "global_step": 262497, "epoch": 2169} {"train_loss": -39.646846771240234, "global_step": 262498, "epoch": 2169} {"train_loss": -42.820228576660156, "global_step": 262499, "epoch": 2169} {"train_loss": -42.79067611694336, "global_step": 262500, "epoch": 2169} {"train_loss": -40.92997360229492, "global_step": 262501, "epoch": 2169} {"train_loss": -41.70542526245117, "global_step": 262502, "epoch": 2169} {"train_loss": -37.500953674316406, "global_step": 262503, "epoch": 2169} {"train_loss": -38.51047897338867, "global_step": 262504, "epoch": 2169} {"train_loss": -41.061500549316406, "global_step": 262505, "epoch": 2169} {"train_loss": -41.18147659301758, "global_step": 262506, "epoch": 2169} {"train_loss": -37.11867141723633, "global_step": 262507, "epoch": 2169} {"train_loss": -40.817108154296875, "global_step": 262508, "epoch": 2169} {"train_loss": -40.5811882019043, "global_step": 262509, "epoch": 2169} {"train_loss": -41.0775032043457, "global_step": 262510, "epoch": 2169} {"train_loss": -38.052059173583984, "global_step": 262511, "epoch": 2169} {"train_loss": -38.998878479003906, "global_step": 262512, "epoch": 2169} {"train_loss": -40.37734603881836, "global_step": 262513, "epoch": 2169} {"train_loss": -40.838680267333984, "global_step": 262514, "epoch": 2169} {"train_loss": -41.72275924682617, "global_step": 262515, "epoch": 2169} {"train_loss": -39.8825798034668, "global_step": 262516, "epoch": 2169} {"train_loss": -39.396827697753906, "global_step": 262517, "epoch": 2169} {"train_loss": -42.08012008666992, "global_step": 262518, "epoch": 2169} {"train_loss": -41.727813720703125, "global_step": 262519, "epoch": 2169} {"train_loss": -39.761474609375, "global_step": 262520, "epoch": 2169} {"train_loss": -37.43044662475586, "global_step": 262521, "epoch": 2169} {"train_loss": -40.808162689208984, "global_step": 262522, "epoch": 2169} {"train_loss": -39.001583099365234, "global_step": 262523, "epoch": 2169} {"train_loss": -40.582794189453125, "global_step": 262524, "epoch": 2169} {"train_loss": -40.640830993652344, "global_step": 262525, "epoch": 2169} {"train_loss": -41.03944778442383, "global_step": 262526, "epoch": 2169} {"train_loss": -41.68925857543945, "global_step": 262527, "epoch": 2169} {"train_loss": -40.07343673706055, "global_step": 262528, "epoch": 2169} {"train_loss": -41.64658737182617, "global_step": 262529, "epoch": 2169} {"train_loss": -41.85977554321289, "global_step": 262530, "epoch": 2169} {"train_loss": -41.0875358581543, "global_step": 262531, "epoch": 2169} {"train_loss": -42.27595138549805, "global_step": 262532, "epoch": 2169} {"train_loss": -41.22941589355469, "global_step": 262533, "epoch": 2169} {"train_loss": -41.633480072021484, "global_step": 262534, "epoch": 2169} {"train_loss": -42.26215362548828, "global_step": 262535, "epoch": 2169} {"train_loss": -39.7423210144043, "global_step": 262536, "epoch": 2169} {"train_loss": -41.910858154296875, "global_step": 262537, "epoch": 2169} {"train_loss": -38.480224609375, "global_step": 262538, "epoch": 2169} {"train_loss": -39.383399963378906, "global_step": 262539, "epoch": 2169} {"train_loss": -40.33430480957031, "global_step": 262540, "epoch": 2169} {"train_loss": -41.62050247192383, "global_step": 262541, "epoch": 2169} {"train_loss": -41.62765884399414, "global_step": 262542, "epoch": 2169} {"train_loss": -41.293212890625, "global_step": 262543, "epoch": 2169} {"train_loss": -42.22929000854492, "global_step": 262544, "epoch": 2169} {"train_loss": -41.75984191894531, "global_step": 262545, "epoch": 2169} {"train_loss": -41.83761215209961, "global_step": 262546, "epoch": 2169} {"train_loss": -41.924922943115234, "global_step": 262547, "epoch": 2169} {"train_loss": -42.25782012939453, "global_step": 262548, "epoch": 2169} {"train_loss": -42.0050163269043, "global_step": 262549, "epoch": 2169} {"train_loss": -42.7776985168457, "global_step": 262550, "epoch": 2169} {"train_loss": -43.05483627319336, "global_step": 262551, "epoch": 2169} {"train_loss": -42.34120559692383, "global_step": 262552, "epoch": 2169} {"train_loss": -40.27531433105469, "global_step": 262553, "epoch": 2169} {"train_loss": -41.79568099975586, "global_step": 262554, "epoch": 2169} {"train_loss": -41.8489875793457, "global_step": 262555, "epoch": 2169} {"train_loss": -42.74978256225586, "global_step": 262556, "epoch": 2169} {"train_loss": -42.321044921875, "global_step": 262557, "epoch": 2169} {"train_loss": -42.838218688964844, "global_step": 262558, "epoch": 2169} {"train_loss": -42.79494094848633, "global_step": 262559, "epoch": 2169} {"train_loss": -42.545074462890625, "global_step": 262560, "epoch": 2169} {"train_loss": -41.831539154052734, "global_step": 262561, "epoch": 2169} {"train_loss": -42.19464874267578, "global_step": 262562, "epoch": 2169} {"train_loss": -42.34455871582031, "global_step": 262563, "epoch": 2169} {"train_loss": -41.798187255859375, "global_step": 262564, "epoch": 2169} {"train_loss": -42.777339935302734, "global_step": 262565, "epoch": 2169} {"train_loss": -40.76445388793945, "global_step": 262566, "epoch": 2169} {"train_loss": -42.08376693725586, "global_step": 262567, "epoch": 2169} {"train_loss": -42.8173942565918, "global_step": 262568, "epoch": 2169} {"train_loss": -41.19872908158736, "global_step": 262569, "epoch": 2169, "val_loss": 2609361.25} {"train_loss": -42.94062423706055, "global_step": 262570, "epoch": 2170} {"train_loss": -41.838134765625, "global_step": 262571, "epoch": 2170} {"train_loss": -42.766178131103516, "global_step": 262572, "epoch": 2170} {"train_loss": -42.37112045288086, "global_step": 262573, "epoch": 2170} {"train_loss": -41.26990509033203, "global_step": 262574, "epoch": 2170} {"train_loss": -43.11214065551758, "global_step": 262575, "epoch": 2170} {"train_loss": -42.37895965576172, "global_step": 262576, "epoch": 2170} {"train_loss": -42.237937927246094, "global_step": 262577, "epoch": 2170} {"train_loss": -42.8991813659668, "global_step": 262578, "epoch": 2170} {"train_loss": -42.96676254272461, "global_step": 262579, "epoch": 2170} {"train_loss": -42.985107421875, "global_step": 262580, "epoch": 2170} {"train_loss": -40.713069915771484, "global_step": 262581, "epoch": 2170} {"train_loss": -42.56830596923828, "global_step": 262582, "epoch": 2170} {"train_loss": -42.69450759887695, "global_step": 262583, "epoch": 2170} {"train_loss": -42.68912887573242, "global_step": 262584, "epoch": 2170} {"train_loss": -42.57859420776367, "global_step": 262585, "epoch": 2170} {"train_loss": -42.8285026550293, "global_step": 262586, "epoch": 2170} {"train_loss": -41.659423828125, "global_step": 262587, "epoch": 2170} {"train_loss": -42.947364807128906, "global_step": 262588, "epoch": 2170} {"train_loss": -43.228668212890625, "global_step": 262589, "epoch": 2170} {"train_loss": -42.95173263549805, "global_step": 262590, "epoch": 2170} {"train_loss": -41.919403076171875, "global_step": 262591, "epoch": 2170} {"train_loss": -43.29864501953125, "global_step": 262592, "epoch": 2170} {"train_loss": -42.5915412902832, "global_step": 262593, "epoch": 2170} {"train_loss": -42.61398696899414, "global_step": 262594, "epoch": 2170} {"train_loss": -42.584869384765625, "global_step": 262595, "epoch": 2170} {"train_loss": -42.80132293701172, "global_step": 262596, "epoch": 2170} {"train_loss": -43.099666595458984, "global_step": 262597, "epoch": 2170} {"train_loss": -42.67962646484375, "global_step": 262598, "epoch": 2170} {"train_loss": -42.25183868408203, "global_step": 262599, "epoch": 2170} {"train_loss": -42.34049987792969, "global_step": 262600, "epoch": 2170} {"train_loss": -42.41020965576172, "global_step": 262601, "epoch": 2170} {"train_loss": -43.34439468383789, "global_step": 262602, "epoch": 2170} {"train_loss": -42.461002349853516, "global_step": 262603, "epoch": 2170} {"train_loss": -42.044254302978516, "global_step": 262604, "epoch": 2170} {"train_loss": -42.6532096862793, "global_step": 262605, "epoch": 2170} {"train_loss": -42.428367614746094, "global_step": 262606, "epoch": 2170} {"train_loss": -41.99435043334961, "global_step": 262607, "epoch": 2170} {"train_loss": -39.19106674194336, "global_step": 262608, "epoch": 2170} {"train_loss": -40.9337158203125, "global_step": 262609, "epoch": 2170} {"train_loss": -40.562782287597656, "global_step": 262610, "epoch": 2170} {"train_loss": -40.294403076171875, "global_step": 262611, "epoch": 2170} {"train_loss": -42.242095947265625, "global_step": 262612, "epoch": 2170} {"train_loss": -42.549530029296875, "global_step": 262613, "epoch": 2170} {"train_loss": -41.2677116394043, "global_step": 262614, "epoch": 2170} {"train_loss": -40.97161865234375, "global_step": 262615, "epoch": 2170} {"train_loss": -39.8251838684082, "global_step": 262616, "epoch": 2170} {"train_loss": -41.29046630859375, "global_step": 262617, "epoch": 2170} {"train_loss": -42.01958084106445, "global_step": 262618, "epoch": 2170} {"train_loss": -42.184234619140625, "global_step": 262619, "epoch": 2170} {"train_loss": -41.265167236328125, "global_step": 262620, "epoch": 2170} {"train_loss": -40.12452697753906, "global_step": 262621, "epoch": 2170} {"train_loss": -40.503143310546875, "global_step": 262622, "epoch": 2170} {"train_loss": -39.69538497924805, "global_step": 262623, "epoch": 2170} {"train_loss": -41.32893753051758, "global_step": 262624, "epoch": 2170} {"train_loss": -39.99089431762695, "global_step": 262625, "epoch": 2170} {"train_loss": -38.137306213378906, "global_step": 262626, "epoch": 2170} {"train_loss": -39.03260040283203, "global_step": 262627, "epoch": 2170} {"train_loss": -41.87791061401367, "global_step": 262628, "epoch": 2170} {"train_loss": -40.04901885986328, "global_step": 262629, "epoch": 2170} {"train_loss": -38.666542053222656, "global_step": 262630, "epoch": 2170} {"train_loss": -41.083126068115234, "global_step": 262631, "epoch": 2170} {"train_loss": -37.4777717590332, "global_step": 262632, "epoch": 2170} {"train_loss": -40.267337799072266, "global_step": 262633, "epoch": 2170} {"train_loss": -40.2127685546875, "global_step": 262634, "epoch": 2170} {"train_loss": -40.35663986206055, "global_step": 262635, "epoch": 2170} {"train_loss": -41.88694381713867, "global_step": 262636, "epoch": 2170} {"train_loss": -41.1644401550293, "global_step": 262637, "epoch": 2170} {"train_loss": -40.84239959716797, "global_step": 262638, "epoch": 2170} {"train_loss": -41.76982879638672, "global_step": 262639, "epoch": 2170} {"train_loss": -40.68421173095703, "global_step": 262640, "epoch": 2170} {"train_loss": -42.25053024291992, "global_step": 262641, "epoch": 2170} {"train_loss": -41.473419189453125, "global_step": 262642, "epoch": 2170} {"train_loss": -41.47591781616211, "global_step": 262643, "epoch": 2170} {"train_loss": -40.075069427490234, "global_step": 262644, "epoch": 2170} {"train_loss": -40.73829650878906, "global_step": 262645, "epoch": 2170} {"train_loss": -42.09102249145508, "global_step": 262646, "epoch": 2170} {"train_loss": -41.51475143432617, "global_step": 262647, "epoch": 2170} {"train_loss": -40.2548828125, "global_step": 262648, "epoch": 2170} {"train_loss": -41.98286056518555, "global_step": 262649, "epoch": 2170} {"train_loss": -41.43950271606445, "global_step": 262650, "epoch": 2170} {"train_loss": -41.06716537475586, "global_step": 262651, "epoch": 2170} {"train_loss": -42.01209259033203, "global_step": 262652, "epoch": 2170} {"train_loss": -41.59723663330078, "global_step": 262653, "epoch": 2170} {"train_loss": -41.7963981628418, "global_step": 262654, "epoch": 2170} {"train_loss": -39.014835357666016, "global_step": 262655, "epoch": 2170} {"train_loss": -42.11037826538086, "global_step": 262656, "epoch": 2170} {"train_loss": -41.65605163574219, "global_step": 262657, "epoch": 2170} {"train_loss": -42.24325180053711, "global_step": 262658, "epoch": 2170} {"train_loss": -41.8897590637207, "global_step": 262659, "epoch": 2170} {"train_loss": -41.76369857788086, "global_step": 262660, "epoch": 2170} {"train_loss": -42.259376525878906, "global_step": 262661, "epoch": 2170} {"train_loss": -42.61587142944336, "global_step": 262662, "epoch": 2170} {"train_loss": -41.6781120300293, "global_step": 262663, "epoch": 2170} {"train_loss": -42.058528900146484, "global_step": 262664, "epoch": 2170} {"train_loss": -42.18766403198242, "global_step": 262665, "epoch": 2170} {"train_loss": -42.469547271728516, "global_step": 262666, "epoch": 2170} {"train_loss": -42.38222122192383, "global_step": 262667, "epoch": 2170} {"train_loss": -39.39359664916992, "global_step": 262668, "epoch": 2170} {"train_loss": -42.542850494384766, "global_step": 262669, "epoch": 2170} {"train_loss": -36.34267807006836, "global_step": 262670, "epoch": 2170} {"train_loss": -32.87411117553711, "global_step": 262671, "epoch": 2170} {"train_loss": -39.065673828125, "global_step": 262672, "epoch": 2170} {"train_loss": -38.44124221801758, "global_step": 262673, "epoch": 2170} {"train_loss": -31.373544692993164, "global_step": 262674, "epoch": 2170} {"train_loss": -24.488794326782227, "global_step": 262675, "epoch": 2170} {"train_loss": -34.43473434448242, "global_step": 262676, "epoch": 2170} {"train_loss": -32.73683547973633, "global_step": 262677, "epoch": 2170} {"train_loss": -38.50629425048828, "global_step": 262678, "epoch": 2170} {"train_loss": -31.902969360351562, "global_step": 262679, "epoch": 2170} {"train_loss": -33.641971588134766, "global_step": 262680, "epoch": 2170} {"train_loss": -36.625789642333984, "global_step": 262681, "epoch": 2170} {"train_loss": -34.765411376953125, "global_step": 262682, "epoch": 2170} {"train_loss": -36.26919174194336, "global_step": 262683, "epoch": 2170} {"train_loss": -37.17863082885742, "global_step": 262684, "epoch": 2170} {"train_loss": -36.395721435546875, "global_step": 262685, "epoch": 2170} {"train_loss": -34.309783935546875, "global_step": 262686, "epoch": 2170} {"train_loss": -38.50751876831055, "global_step": 262687, "epoch": 2170} {"train_loss": -36.627845764160156, "global_step": 262688, "epoch": 2170} {"train_loss": -36.582054138183594, "global_step": 262689, "epoch": 2170} {"train_loss": -40.50569707697088, "global_step": 262690, "epoch": 2170, "val_loss": 2511823.5} {"train_loss": -38.288429260253906, "global_step": 262691, "epoch": 2171} {"train_loss": -37.734004974365234, "global_step": 262692, "epoch": 2171} {"train_loss": -37.78348922729492, "global_step": 262693, "epoch": 2171} {"train_loss": -39.10689926147461, "global_step": 262694, "epoch": 2171} {"train_loss": -36.5483512878418, "global_step": 262695, "epoch": 2171} {"train_loss": -38.609039306640625, "global_step": 262696, "epoch": 2171} {"train_loss": -39.02688217163086, "global_step": 262697, "epoch": 2171} {"train_loss": -36.86408615112305, "global_step": 262698, "epoch": 2171} {"train_loss": -38.62077331542969, "global_step": 262699, "epoch": 2171} {"train_loss": -39.515724182128906, "global_step": 262700, "epoch": 2171} {"train_loss": -38.58258819580078, "global_step": 262701, "epoch": 2171} {"train_loss": -39.81451416015625, "global_step": 262702, "epoch": 2171} {"train_loss": -37.2985954284668, "global_step": 262703, "epoch": 2171} {"train_loss": -40.12287521362305, "global_step": 262704, "epoch": 2171} {"train_loss": -39.565826416015625, "global_step": 262705, "epoch": 2171} {"train_loss": -40.2353401184082, "global_step": 262706, "epoch": 2171} {"train_loss": -40.10443878173828, "global_step": 262707, "epoch": 2171} {"train_loss": -39.93327713012695, "global_step": 262708, "epoch": 2171} {"train_loss": -39.64022445678711, "global_step": 262709, "epoch": 2171} {"train_loss": -39.705596923828125, "global_step": 262710, "epoch": 2171} {"train_loss": -39.442508697509766, "global_step": 262711, "epoch": 2171} {"train_loss": -40.010040283203125, "global_step": 262712, "epoch": 2171} {"train_loss": -40.063533782958984, "global_step": 262713, "epoch": 2171} {"train_loss": -38.90555953979492, "global_step": 262714, "epoch": 2171} {"train_loss": -40.88740158081055, "global_step": 262715, "epoch": 2171} {"train_loss": -40.671749114990234, "global_step": 262716, "epoch": 2171} {"train_loss": -40.45024490356445, "global_step": 262717, "epoch": 2171} {"train_loss": -40.77134323120117, "global_step": 262718, "epoch": 2171} {"train_loss": -39.428043365478516, "global_step": 262719, "epoch": 2171} {"train_loss": -40.57871627807617, "global_step": 262720, "epoch": 2171} {"train_loss": -41.12468338012695, "global_step": 262721, "epoch": 2171} {"train_loss": -35.76631546020508, "global_step": 262722, "epoch": 2171} {"train_loss": -41.10708236694336, "global_step": 262723, "epoch": 2171} {"train_loss": -37.27543640136719, "global_step": 262724, "epoch": 2171} {"train_loss": -40.52849578857422, "global_step": 262725, "epoch": 2171} {"train_loss": -40.63286590576172, "global_step": 262726, "epoch": 2171} {"train_loss": -41.12278366088867, "global_step": 262727, "epoch": 2171} {"train_loss": -40.41352844238281, "global_step": 262728, "epoch": 2171} {"train_loss": -41.35517120361328, "global_step": 262729, "epoch": 2171} {"train_loss": -41.224082946777344, "global_step": 262730, "epoch": 2171} {"train_loss": -41.076045989990234, "global_step": 262731, "epoch": 2171} {"train_loss": -40.018821716308594, "global_step": 262732, "epoch": 2171} {"train_loss": -40.79558181762695, "global_step": 262733, "epoch": 2171} {"train_loss": -41.52817153930664, "global_step": 262734, "epoch": 2171} {"train_loss": -41.10774612426758, "global_step": 262735, "epoch": 2171} {"train_loss": -40.25019454956055, "global_step": 262736, "epoch": 2171} {"train_loss": -41.5146369934082, "global_step": 262737, "epoch": 2171} {"train_loss": -41.479515075683594, "global_step": 262738, "epoch": 2171} {"train_loss": -40.50043487548828, "global_step": 262739, "epoch": 2171} {"train_loss": -40.455528259277344, "global_step": 262740, "epoch": 2171} {"train_loss": -41.0579719543457, "global_step": 262741, "epoch": 2171} {"train_loss": -41.44905471801758, "global_step": 262742, "epoch": 2171} {"train_loss": -41.55778121948242, "global_step": 262743, "epoch": 2171} {"train_loss": -41.58999252319336, "global_step": 262744, "epoch": 2171} {"train_loss": -41.05671310424805, "global_step": 262745, "epoch": 2171} {"train_loss": -41.74384307861328, "global_step": 262746, "epoch": 2171} {"train_loss": -40.979671478271484, "global_step": 262747, "epoch": 2171} {"train_loss": -40.90495681762695, "global_step": 262748, "epoch": 2171} {"train_loss": -41.2380256652832, "global_step": 262749, "epoch": 2171} {"train_loss": -41.308685302734375, "global_step": 262750, "epoch": 2171} {"train_loss": -41.606605529785156, "global_step": 262751, "epoch": 2171} {"train_loss": -41.602535247802734, "global_step": 262752, "epoch": 2171} {"train_loss": -41.484230041503906, "global_step": 262753, "epoch": 2171} {"train_loss": -41.51534652709961, "global_step": 262754, "epoch": 2171} {"train_loss": -41.98869705200195, "global_step": 262755, "epoch": 2171} {"train_loss": -42.07233810424805, "global_step": 262756, "epoch": 2171} {"train_loss": -41.74238967895508, "global_step": 262757, "epoch": 2171} {"train_loss": -42.04453659057617, "global_step": 262758, "epoch": 2171} {"train_loss": -41.898101806640625, "global_step": 262759, "epoch": 2171} {"train_loss": -41.8325080871582, "global_step": 262760, "epoch": 2171} {"train_loss": -41.680397033691406, "global_step": 262761, "epoch": 2171} {"train_loss": -42.07495880126953, "global_step": 262762, "epoch": 2171} {"train_loss": -42.52872848510742, "global_step": 262763, "epoch": 2171} {"train_loss": -42.114505767822266, "global_step": 262764, "epoch": 2171} {"train_loss": -41.910037994384766, "global_step": 262765, "epoch": 2171} {"train_loss": -42.357967376708984, "global_step": 262766, "epoch": 2171} {"train_loss": -42.00226593017578, "global_step": 262767, "epoch": 2171} {"train_loss": -42.15810775756836, "global_step": 262768, "epoch": 2171} {"train_loss": -42.14179611206055, "global_step": 262769, "epoch": 2171} {"train_loss": -41.86442184448242, "global_step": 262770, "epoch": 2171} {"train_loss": -42.56465148925781, "global_step": 262771, "epoch": 2171} {"train_loss": -42.57606887817383, "global_step": 262772, "epoch": 2171} {"train_loss": -42.15472412109375, "global_step": 262773, "epoch": 2171} {"train_loss": -42.33247756958008, "global_step": 262774, "epoch": 2171} {"train_loss": -42.473941802978516, "global_step": 262775, "epoch": 2171} {"train_loss": -42.430423736572266, "global_step": 262776, "epoch": 2171} {"train_loss": -42.36989974975586, "global_step": 262777, "epoch": 2171} {"train_loss": -42.50210189819336, "global_step": 262778, "epoch": 2171} {"train_loss": -41.88508224487305, "global_step": 262779, "epoch": 2171} {"train_loss": -42.45122528076172, "global_step": 262780, "epoch": 2171} {"train_loss": -42.38678741455078, "global_step": 262781, "epoch": 2171} {"train_loss": -41.55983352661133, "global_step": 262782, "epoch": 2171} {"train_loss": -42.3267936706543, "global_step": 262783, "epoch": 2171} {"train_loss": -42.1231689453125, "global_step": 262784, "epoch": 2171} {"train_loss": -42.65520095825195, "global_step": 262785, "epoch": 2171} {"train_loss": -41.99251174926758, "global_step": 262786, "epoch": 2171} {"train_loss": -42.30527877807617, "global_step": 262787, "epoch": 2171} {"train_loss": -42.60195541381836, "global_step": 262788, "epoch": 2171} {"train_loss": -42.783935546875, "global_step": 262789, "epoch": 2171} {"train_loss": -42.40016555786133, "global_step": 262790, "epoch": 2171} {"train_loss": -42.26349639892578, "global_step": 262791, "epoch": 2171} {"train_loss": -42.30842590332031, "global_step": 262792, "epoch": 2171} {"train_loss": -41.69379425048828, "global_step": 262793, "epoch": 2171} {"train_loss": -42.77177810668945, "global_step": 262794, "epoch": 2171} {"train_loss": -42.4019889831543, "global_step": 262795, "epoch": 2171} {"train_loss": -42.79684829711914, "global_step": 262796, "epoch": 2171} {"train_loss": -42.20158004760742, "global_step": 262797, "epoch": 2171} {"train_loss": -42.67990493774414, "global_step": 262798, "epoch": 2171} {"train_loss": -42.282222747802734, "global_step": 262799, "epoch": 2171} {"train_loss": -41.920860290527344, "global_step": 262800, "epoch": 2171} {"train_loss": -42.787750244140625, "global_step": 262801, "epoch": 2171} {"train_loss": -43.38759994506836, "global_step": 262802, "epoch": 2171} {"train_loss": -42.548397064208984, "global_step": 262803, "epoch": 2171} {"train_loss": -42.634090423583984, "global_step": 262804, "epoch": 2171} {"train_loss": -42.56693649291992, "global_step": 262805, "epoch": 2171} {"train_loss": -42.845855712890625, "global_step": 262806, "epoch": 2171} {"train_loss": -42.03667068481445, "global_step": 262807, "epoch": 2171} {"train_loss": -42.55422592163086, "global_step": 262808, "epoch": 2171} {"train_loss": -43.114295959472656, "global_step": 262809, "epoch": 2171} {"train_loss": -42.431427001953125, "global_step": 262810, "epoch": 2171} {"train_loss": -41.14881048911859, "global_step": 262811, "epoch": 2171, "val_loss": 2628585.75} {"train_loss": -42.755279541015625, "global_step": 262812, "epoch": 2172} {"train_loss": -43.25849151611328, "global_step": 262813, "epoch": 2172} {"train_loss": -43.18937301635742, "global_step": 262814, "epoch": 2172} {"train_loss": -43.114654541015625, "global_step": 262815, "epoch": 2172} {"train_loss": -43.40776443481445, "global_step": 262816, "epoch": 2172} {"train_loss": -43.24674606323242, "global_step": 262817, "epoch": 2172} {"train_loss": -42.68584060668945, "global_step": 262818, "epoch": 2172} {"train_loss": -43.2010498046875, "global_step": 262819, "epoch": 2172} {"train_loss": -42.823577880859375, "global_step": 262820, "epoch": 2172} {"train_loss": -43.561988830566406, "global_step": 262821, "epoch": 2172} {"train_loss": -42.03288650512695, "global_step": 262822, "epoch": 2172} {"train_loss": -42.95305252075195, "global_step": 262823, "epoch": 2172} {"train_loss": -43.15855026245117, "global_step": 262824, "epoch": 2172} {"train_loss": -42.529510498046875, "global_step": 262825, "epoch": 2172} {"train_loss": -43.149566650390625, "global_step": 262826, "epoch": 2172} {"train_loss": -43.241600036621094, "global_step": 262827, "epoch": 2172} {"train_loss": -42.867767333984375, "global_step": 262828, "epoch": 2172} {"train_loss": -42.70191192626953, "global_step": 262829, "epoch": 2172} {"train_loss": -42.864810943603516, "global_step": 262830, "epoch": 2172} {"train_loss": -43.166236877441406, "global_step": 262831, "epoch": 2172} {"train_loss": -43.396942138671875, "global_step": 262832, "epoch": 2172} {"train_loss": -42.872005462646484, "global_step": 262833, "epoch": 2172} {"train_loss": -42.221397399902344, "global_step": 262834, "epoch": 2172} {"train_loss": -42.32111358642578, "global_step": 262835, "epoch": 2172} {"train_loss": -42.15130615234375, "global_step": 262836, "epoch": 2172} {"train_loss": -41.582069396972656, "global_step": 262837, "epoch": 2172} {"train_loss": -41.264644622802734, "global_step": 262838, "epoch": 2172} {"train_loss": -40.884700775146484, "global_step": 262839, "epoch": 2172} {"train_loss": -41.65005111694336, "global_step": 262840, "epoch": 2172} {"train_loss": -42.05400466918945, "global_step": 262841, "epoch": 2172} {"train_loss": -42.00056076049805, "global_step": 262842, "epoch": 2172} {"train_loss": -42.405277252197266, "global_step": 262843, "epoch": 2172} {"train_loss": -41.044227600097656, "global_step": 262844, "epoch": 2172} {"train_loss": -39.80803680419922, "global_step": 262845, "epoch": 2172} {"train_loss": -41.0969123840332, "global_step": 262846, "epoch": 2172} {"train_loss": -42.24452590942383, "global_step": 262847, "epoch": 2172} {"train_loss": -41.472496032714844, "global_step": 262848, "epoch": 2172} {"train_loss": -40.149227142333984, "global_step": 262849, "epoch": 2172} {"train_loss": -40.8809700012207, "global_step": 262850, "epoch": 2172} {"train_loss": -41.45864486694336, "global_step": 262851, "epoch": 2172} {"train_loss": -42.61141586303711, "global_step": 262852, "epoch": 2172} {"train_loss": -40.42340850830078, "global_step": 262853, "epoch": 2172} {"train_loss": -40.8183479309082, "global_step": 262854, "epoch": 2172} {"train_loss": -41.92342758178711, "global_step": 262855, "epoch": 2172} {"train_loss": -41.5732307434082, "global_step": 262856, "epoch": 2172} {"train_loss": -41.0574836730957, "global_step": 262857, "epoch": 2172} {"train_loss": -39.372650146484375, "global_step": 262858, "epoch": 2172} {"train_loss": -39.93094253540039, "global_step": 262859, "epoch": 2172} {"train_loss": -41.152645111083984, "global_step": 262860, "epoch": 2172} {"train_loss": -40.72411346435547, "global_step": 262861, "epoch": 2172} {"train_loss": -41.07026672363281, "global_step": 262862, "epoch": 2172} {"train_loss": -39.991580963134766, "global_step": 262863, "epoch": 2172} {"train_loss": -40.83787155151367, "global_step": 262864, "epoch": 2172} {"train_loss": -42.13582229614258, "global_step": 262865, "epoch": 2172} {"train_loss": -40.528438568115234, "global_step": 262866, "epoch": 2172} {"train_loss": -42.39835739135742, "global_step": 262867, "epoch": 2172} {"train_loss": -41.89093780517578, "global_step": 262868, "epoch": 2172} {"train_loss": -41.2078742980957, "global_step": 262869, "epoch": 2172} {"train_loss": -41.77307891845703, "global_step": 262870, "epoch": 2172} {"train_loss": -41.342830657958984, "global_step": 262871, "epoch": 2172} {"train_loss": -40.94657516479492, "global_step": 262872, "epoch": 2172} {"train_loss": -42.30827713012695, "global_step": 262873, "epoch": 2172} {"train_loss": -42.31390380859375, "global_step": 262874, "epoch": 2172} {"train_loss": -41.82615280151367, "global_step": 262875, "epoch": 2172} {"train_loss": -41.719322204589844, "global_step": 262876, "epoch": 2172} {"train_loss": -42.19988250732422, "global_step": 262877, "epoch": 2172} {"train_loss": -42.26247787475586, "global_step": 262878, "epoch": 2172} {"train_loss": -41.0435905456543, "global_step": 262879, "epoch": 2172} {"train_loss": -41.598602294921875, "global_step": 262880, "epoch": 2172} {"train_loss": -40.9759521484375, "global_step": 262881, "epoch": 2172} {"train_loss": -42.81025314331055, "global_step": 262882, "epoch": 2172} {"train_loss": -42.22909164428711, "global_step": 262883, "epoch": 2172} {"train_loss": -40.753639221191406, "global_step": 262884, "epoch": 2172} {"train_loss": -41.827701568603516, "global_step": 262885, "epoch": 2172} {"train_loss": -41.90761947631836, "global_step": 262886, "epoch": 2172} {"train_loss": -40.51129913330078, "global_step": 262887, "epoch": 2172} {"train_loss": -42.24079513549805, "global_step": 262888, "epoch": 2172} {"train_loss": -42.155250549316406, "global_step": 262889, "epoch": 2172} {"train_loss": -42.135345458984375, "global_step": 262890, "epoch": 2172} {"train_loss": -42.217132568359375, "global_step": 262891, "epoch": 2172} {"train_loss": -41.78166580200195, "global_step": 262892, "epoch": 2172} {"train_loss": -42.441619873046875, "global_step": 262893, "epoch": 2172} {"train_loss": -42.251338958740234, "global_step": 262894, "epoch": 2172} {"train_loss": -41.96143341064453, "global_step": 262895, "epoch": 2172} {"train_loss": -42.7638053894043, "global_step": 262896, "epoch": 2172} {"train_loss": -41.922847747802734, "global_step": 262897, "epoch": 2172} {"train_loss": -42.267940521240234, "global_step": 262898, "epoch": 2172} {"train_loss": -43.35323715209961, "global_step": 262899, "epoch": 2172} {"train_loss": -41.559043884277344, "global_step": 262900, "epoch": 2172} {"train_loss": -42.602935791015625, "global_step": 262901, "epoch": 2172} {"train_loss": -42.57295608520508, "global_step": 262902, "epoch": 2172} {"train_loss": -42.1049690246582, "global_step": 262903, "epoch": 2172} {"train_loss": -42.238624572753906, "global_step": 262904, "epoch": 2172} {"train_loss": -42.331111907958984, "global_step": 262905, "epoch": 2172} {"train_loss": -42.69283676147461, "global_step": 262906, "epoch": 2172} {"train_loss": -42.76824188232422, "global_step": 262907, "epoch": 2172} {"train_loss": -41.79514694213867, "global_step": 262908, "epoch": 2172} {"train_loss": -42.462127685546875, "global_step": 262909, "epoch": 2172} {"train_loss": -42.985992431640625, "global_step": 262910, "epoch": 2172} {"train_loss": -42.33362579345703, "global_step": 262911, "epoch": 2172} {"train_loss": -41.943626403808594, "global_step": 262912, "epoch": 2172} {"train_loss": -41.98460006713867, "global_step": 262913, "epoch": 2172} {"train_loss": -42.6429443359375, "global_step": 262914, "epoch": 2172} {"train_loss": -42.78190231323242, "global_step": 262915, "epoch": 2172} {"train_loss": -42.28725051879883, "global_step": 262916, "epoch": 2172} {"train_loss": -42.80007553100586, "global_step": 262917, "epoch": 2172} {"train_loss": -42.67464065551758, "global_step": 262918, "epoch": 2172} {"train_loss": -43.107818603515625, "global_step": 262919, "epoch": 2172} {"train_loss": -43.3759651184082, "global_step": 262920, "epoch": 2172} {"train_loss": -42.892391204833984, "global_step": 262921, "epoch": 2172} {"train_loss": -43.60258102416992, "global_step": 262922, "epoch": 2172} {"train_loss": -42.59397506713867, "global_step": 262923, "epoch": 2172} {"train_loss": -43.1325798034668, "global_step": 262924, "epoch": 2172} {"train_loss": -43.69527053833008, "global_step": 262925, "epoch": 2172} {"train_loss": -43.0544319152832, "global_step": 262926, "epoch": 2172} {"train_loss": -42.88823318481445, "global_step": 262927, "epoch": 2172} {"train_loss": -43.159400939941406, "global_step": 262928, "epoch": 2172} {"train_loss": -42.81095886230469, "global_step": 262929, "epoch": 2172} {"train_loss": -42.98818588256836, "global_step": 262930, "epoch": 2172} {"train_loss": -43.07997131347656, "global_step": 262931, "epoch": 2172} {"train_loss": -42.14334938742898, "global_step": 262932, "epoch": 2172, "val_loss": 2648828.75} {"train_loss": -43.0047607421875, "global_step": 262933, "epoch": 2173} {"train_loss": -42.33732223510742, "global_step": 262934, "epoch": 2173} {"train_loss": -41.38213348388672, "global_step": 262935, "epoch": 2173} {"train_loss": -41.9984245300293, "global_step": 262936, "epoch": 2173} {"train_loss": -42.26304626464844, "global_step": 262937, "epoch": 2173} {"train_loss": -42.80306625366211, "global_step": 262938, "epoch": 2173} {"train_loss": -43.87275695800781, "global_step": 262939, "epoch": 2173} {"train_loss": -42.8595085144043, "global_step": 262940, "epoch": 2173} {"train_loss": -42.681884765625, "global_step": 262941, "epoch": 2173} {"train_loss": -42.34951400756836, "global_step": 262942, "epoch": 2173} {"train_loss": -42.70493698120117, "global_step": 262943, "epoch": 2173} {"train_loss": -42.808719635009766, "global_step": 262944, "epoch": 2173} {"train_loss": -41.27204513549805, "global_step": 262945, "epoch": 2173} {"train_loss": -40.045448303222656, "global_step": 262946, "epoch": 2173} {"train_loss": -40.10154724121094, "global_step": 262947, "epoch": 2173} {"train_loss": -42.1757698059082, "global_step": 262948, "epoch": 2173} {"train_loss": -42.90711212158203, "global_step": 262949, "epoch": 2173} {"train_loss": -41.423583984375, "global_step": 262950, "epoch": 2173} {"train_loss": -40.354270935058594, "global_step": 262951, "epoch": 2173} {"train_loss": -40.301597595214844, "global_step": 262952, "epoch": 2173} {"train_loss": -41.48794174194336, "global_step": 262953, "epoch": 2173} {"train_loss": -42.9764289855957, "global_step": 262954, "epoch": 2173} {"train_loss": -41.49763107299805, "global_step": 262955, "epoch": 2173} {"train_loss": -40.561519622802734, "global_step": 262956, "epoch": 2173} {"train_loss": -42.37240219116211, "global_step": 262957, "epoch": 2173} {"train_loss": -42.86051940917969, "global_step": 262958, "epoch": 2173} {"train_loss": -41.5528564453125, "global_step": 262959, "epoch": 2173} {"train_loss": -39.3164176940918, "global_step": 262960, "epoch": 2173} {"train_loss": -40.25578308105469, "global_step": 262961, "epoch": 2173} {"train_loss": -42.49378967285156, "global_step": 262962, "epoch": 2173} {"train_loss": -41.679141998291016, "global_step": 262963, "epoch": 2173} {"train_loss": -41.71349334716797, "global_step": 262964, "epoch": 2173} {"train_loss": -41.34510803222656, "global_step": 262965, "epoch": 2173} {"train_loss": -42.096981048583984, "global_step": 262966, "epoch": 2173} {"train_loss": -40.97376251220703, "global_step": 262967, "epoch": 2173} {"train_loss": -40.19231414794922, "global_step": 262968, "epoch": 2173} {"train_loss": -41.27678680419922, "global_step": 262969, "epoch": 2173} {"train_loss": -41.91828918457031, "global_step": 262970, "epoch": 2173} {"train_loss": -40.35918045043945, "global_step": 262971, "epoch": 2173} {"train_loss": -40.62777328491211, "global_step": 262972, "epoch": 2173} {"train_loss": -41.85295104980469, "global_step": 262973, "epoch": 2173} {"train_loss": -40.56319046020508, "global_step": 262974, "epoch": 2173} {"train_loss": -41.84670639038086, "global_step": 262975, "epoch": 2173} {"train_loss": -41.91279983520508, "global_step": 262976, "epoch": 2173} {"train_loss": -42.269466400146484, "global_step": 262977, "epoch": 2173} {"train_loss": -41.63387680053711, "global_step": 262978, "epoch": 2173} {"train_loss": -42.23991775512695, "global_step": 262979, "epoch": 2173} {"train_loss": -42.60788345336914, "global_step": 262980, "epoch": 2173} {"train_loss": -42.29085159301758, "global_step": 262981, "epoch": 2173} {"train_loss": -42.533538818359375, "global_step": 262982, "epoch": 2173} {"train_loss": -42.35700607299805, "global_step": 262983, "epoch": 2173} {"train_loss": -41.86710739135742, "global_step": 262984, "epoch": 2173} {"train_loss": -42.1956787109375, "global_step": 262985, "epoch": 2173} {"train_loss": -42.36127471923828, "global_step": 262986, "epoch": 2173} {"train_loss": -42.51325607299805, "global_step": 262987, "epoch": 2173} {"train_loss": -43.10761642456055, "global_step": 262988, "epoch": 2173} {"train_loss": -42.32038116455078, "global_step": 262989, "epoch": 2173} {"train_loss": -42.913787841796875, "global_step": 262990, "epoch": 2173} {"train_loss": -42.576416015625, "global_step": 262991, "epoch": 2173} {"train_loss": -43.40296173095703, "global_step": 262992, "epoch": 2173} {"train_loss": -42.56919479370117, "global_step": 262993, "epoch": 2173} {"train_loss": -42.787635803222656, "global_step": 262994, "epoch": 2173} {"train_loss": -43.215301513671875, "global_step": 262995, "epoch": 2173} {"train_loss": -42.60352325439453, "global_step": 262996, "epoch": 2173} {"train_loss": -42.84762954711914, "global_step": 262997, "epoch": 2173} {"train_loss": -43.39242172241211, "global_step": 262998, "epoch": 2173} {"train_loss": -42.75074768066406, "global_step": 262999, "epoch": 2173} {"train_loss": -42.804988861083984, "global_step": 263000, "epoch": 2173} {"train_loss": -43.6293830871582, "global_step": 263001, "epoch": 2173} {"train_loss": -42.65849685668945, "global_step": 263002, "epoch": 2173} {"train_loss": -43.11350631713867, "global_step": 263003, "epoch": 2173} {"train_loss": -42.926021575927734, "global_step": 263004, "epoch": 2173} {"train_loss": -42.96120834350586, "global_step": 263005, "epoch": 2173} {"train_loss": -42.988990783691406, "global_step": 263006, "epoch": 2173} {"train_loss": -43.245887756347656, "global_step": 263007, "epoch": 2173} {"train_loss": -43.60955810546875, "global_step": 263008, "epoch": 2173} {"train_loss": -42.68540573120117, "global_step": 263009, "epoch": 2173} {"train_loss": -42.6095085144043, "global_step": 263010, "epoch": 2173} {"train_loss": -43.42429733276367, "global_step": 263011, "epoch": 2173} {"train_loss": -43.14851760864258, "global_step": 263012, "epoch": 2173} {"train_loss": -43.48026657104492, "global_step": 263013, "epoch": 2173} {"train_loss": -43.38465118408203, "global_step": 263014, "epoch": 2173} {"train_loss": -43.68470764160156, "global_step": 263015, "epoch": 2173} {"train_loss": -43.41230392456055, "global_step": 263016, "epoch": 2173} {"train_loss": -43.58798599243164, "global_step": 263017, "epoch": 2173} {"train_loss": -43.27949142456055, "global_step": 263018, "epoch": 2173} {"train_loss": -43.86026382446289, "global_step": 263019, "epoch": 2173} {"train_loss": -43.47099685668945, "global_step": 263020, "epoch": 2173} {"train_loss": -43.870445251464844, "global_step": 263021, "epoch": 2173} {"train_loss": -44.00822067260742, "global_step": 263022, "epoch": 2173} {"train_loss": -43.195491790771484, "global_step": 263023, "epoch": 2173} {"train_loss": -43.9266471862793, "global_step": 263024, "epoch": 2173} {"train_loss": -44.2346076965332, "global_step": 263025, "epoch": 2173} {"train_loss": -43.330142974853516, "global_step": 263026, "epoch": 2173} {"train_loss": -43.85056686401367, "global_step": 263027, "epoch": 2173} {"train_loss": -43.634132385253906, "global_step": 263028, "epoch": 2173} {"train_loss": -43.79212188720703, "global_step": 263029, "epoch": 2173} {"train_loss": -43.54336929321289, "global_step": 263030, "epoch": 2173} {"train_loss": -43.924312591552734, "global_step": 263031, "epoch": 2173} {"train_loss": -43.58132553100586, "global_step": 263032, "epoch": 2173} {"train_loss": -44.274898529052734, "global_step": 263033, "epoch": 2173} {"train_loss": -43.80732345581055, "global_step": 263034, "epoch": 2173} {"train_loss": -43.56604766845703, "global_step": 263035, "epoch": 2173} {"train_loss": -44.030277252197266, "global_step": 263036, "epoch": 2173} {"train_loss": -43.695980072021484, "global_step": 263037, "epoch": 2173} {"train_loss": -42.931556701660156, "global_step": 263038, "epoch": 2173} {"train_loss": -43.062538146972656, "global_step": 263039, "epoch": 2173} {"train_loss": -42.46062088012695, "global_step": 263040, "epoch": 2173} {"train_loss": -41.55508041381836, "global_step": 263041, "epoch": 2173} {"train_loss": -43.27252197265625, "global_step": 263042, "epoch": 2173} {"train_loss": -42.630130767822266, "global_step": 263043, "epoch": 2173} {"train_loss": -38.710426330566406, "global_step": 263044, "epoch": 2173} {"train_loss": -32.787471771240234, "global_step": 263045, "epoch": 2173} {"train_loss": -36.2841682434082, "global_step": 263046, "epoch": 2173} {"train_loss": -40.331268310546875, "global_step": 263047, "epoch": 2173} {"train_loss": -33.39052200317383, "global_step": 263048, "epoch": 2173} {"train_loss": -28.0168514251709, "global_step": 263049, "epoch": 2173} {"train_loss": -40.00272750854492, "global_step": 263050, "epoch": 2173} {"train_loss": -37.0941047668457, "global_step": 263051, "epoch": 2173} {"train_loss": -35.78215408325195, "global_step": 263052, "epoch": 2173} {"train_loss": -42.00723892401073, "global_step": 263053, "epoch": 2173, "val_loss": 2585838.75} {"train_loss": -36.6169548034668, "global_step": 263054, "epoch": 2174} {"train_loss": -37.128841400146484, "global_step": 263055, "epoch": 2174} {"train_loss": -39.27995300292969, "global_step": 263056, "epoch": 2174} {"train_loss": -33.70235061645508, "global_step": 263057, "epoch": 2174} {"train_loss": -39.234676361083984, "global_step": 263058, "epoch": 2174} {"train_loss": -35.33245849609375, "global_step": 263059, "epoch": 2174} {"train_loss": -39.177459716796875, "global_step": 263060, "epoch": 2174} {"train_loss": -38.4173583984375, "global_step": 263061, "epoch": 2174} {"train_loss": -40.6783332824707, "global_step": 263062, "epoch": 2174} {"train_loss": -37.28243637084961, "global_step": 263063, "epoch": 2174} {"train_loss": -39.6784782409668, "global_step": 263064, "epoch": 2174} {"train_loss": -36.18890380859375, "global_step": 263065, "epoch": 2174} {"train_loss": -39.86394500732422, "global_step": 263066, "epoch": 2174} {"train_loss": -39.31879806518555, "global_step": 263067, "epoch": 2174} {"train_loss": -39.17903518676758, "global_step": 263068, "epoch": 2174} {"train_loss": -39.73295211791992, "global_step": 263069, "epoch": 2174} {"train_loss": -38.77724075317383, "global_step": 263070, "epoch": 2174} {"train_loss": -41.601863861083984, "global_step": 263071, "epoch": 2174} {"train_loss": -39.77653503417969, "global_step": 263072, "epoch": 2174} {"train_loss": -40.674537658691406, "global_step": 263073, "epoch": 2174} {"train_loss": -41.911991119384766, "global_step": 263074, "epoch": 2174} {"train_loss": -40.12617111206055, "global_step": 263075, "epoch": 2174} {"train_loss": -41.37150955200195, "global_step": 263076, "epoch": 2174} {"train_loss": -40.721435546875, "global_step": 263077, "epoch": 2174} {"train_loss": -41.74930191040039, "global_step": 263078, "epoch": 2174} {"train_loss": -41.3552360534668, "global_step": 263079, "epoch": 2174} {"train_loss": -41.281986236572266, "global_step": 263080, "epoch": 2174} {"train_loss": -42.27898025512695, "global_step": 263081, "epoch": 2174} {"train_loss": -41.64421463012695, "global_step": 263082, "epoch": 2174} {"train_loss": -41.63383483886719, "global_step": 263083, "epoch": 2174} {"train_loss": -42.04674530029297, "global_step": 263084, "epoch": 2174} {"train_loss": -41.37197494506836, "global_step": 263085, "epoch": 2174} {"train_loss": -42.016761779785156, "global_step": 263086, "epoch": 2174} {"train_loss": -41.72465133666992, "global_step": 263087, "epoch": 2174} {"train_loss": -41.89850616455078, "global_step": 263088, "epoch": 2174} {"train_loss": -42.380367279052734, "global_step": 263089, "epoch": 2174} {"train_loss": -41.974483489990234, "global_step": 263090, "epoch": 2174} {"train_loss": -42.07136154174805, "global_step": 263091, "epoch": 2174} {"train_loss": -41.81834030151367, "global_step": 263092, "epoch": 2174} {"train_loss": -42.25390625, "global_step": 263093, "epoch": 2174} {"train_loss": -42.0028190612793, "global_step": 263094, "epoch": 2174} {"train_loss": -42.441898345947266, "global_step": 263095, "epoch": 2174} {"train_loss": -41.64336013793945, "global_step": 263096, "epoch": 2174} {"train_loss": -42.46089553833008, "global_step": 263097, "epoch": 2174} {"train_loss": -42.44968795776367, "global_step": 263098, "epoch": 2174} {"train_loss": -42.06023406982422, "global_step": 263099, "epoch": 2174} {"train_loss": -42.83746337890625, "global_step": 263100, "epoch": 2174} {"train_loss": -42.94807052612305, "global_step": 263101, "epoch": 2174} {"train_loss": -42.70862579345703, "global_step": 263102, "epoch": 2174} {"train_loss": -42.62915802001953, "global_step": 263103, "epoch": 2174} {"train_loss": -42.97614669799805, "global_step": 263104, "epoch": 2174} {"train_loss": -42.80967330932617, "global_step": 263105, "epoch": 2174} {"train_loss": -42.62510681152344, "global_step": 263106, "epoch": 2174} {"train_loss": -42.565345764160156, "global_step": 263107, "epoch": 2174} {"train_loss": -42.714927673339844, "global_step": 263108, "epoch": 2174} {"train_loss": -42.96522903442383, "global_step": 263109, "epoch": 2174} {"train_loss": -43.05472946166992, "global_step": 263110, "epoch": 2174} {"train_loss": -42.81943130493164, "global_step": 263111, "epoch": 2174} {"train_loss": -43.02631759643555, "global_step": 263112, "epoch": 2174} {"train_loss": -42.69965744018555, "global_step": 263113, "epoch": 2174} {"train_loss": -42.875465393066406, "global_step": 263114, "epoch": 2174} {"train_loss": -43.17562484741211, "global_step": 263115, "epoch": 2174} {"train_loss": -42.85515213012695, "global_step": 263116, "epoch": 2174} {"train_loss": -42.83677291870117, "global_step": 263117, "epoch": 2174} {"train_loss": -42.990203857421875, "global_step": 263118, "epoch": 2174} {"train_loss": -43.208248138427734, "global_step": 263119, "epoch": 2174} {"train_loss": -43.432247161865234, "global_step": 263120, "epoch": 2174} {"train_loss": -42.80949020385742, "global_step": 263121, "epoch": 2174} {"train_loss": -43.4481315612793, "global_step": 263122, "epoch": 2174} {"train_loss": -42.84550094604492, "global_step": 263123, "epoch": 2174} {"train_loss": -43.159603118896484, "global_step": 263124, "epoch": 2174} {"train_loss": -43.023128509521484, "global_step": 263125, "epoch": 2174} {"train_loss": -43.369144439697266, "global_step": 263126, "epoch": 2174} {"train_loss": -43.0309944152832, "global_step": 263127, "epoch": 2174} {"train_loss": -43.35942459106445, "global_step": 263128, "epoch": 2174} {"train_loss": -43.28337860107422, "global_step": 263129, "epoch": 2174} {"train_loss": -43.86745071411133, "global_step": 263130, "epoch": 2174} {"train_loss": -43.45064163208008, "global_step": 263131, "epoch": 2174} {"train_loss": -43.61616516113281, "global_step": 263132, "epoch": 2174} {"train_loss": -43.3382682800293, "global_step": 263133, "epoch": 2174} {"train_loss": -42.705501556396484, "global_step": 263134, "epoch": 2174} {"train_loss": -43.3392219543457, "global_step": 263135, "epoch": 2174} {"train_loss": -43.27382278442383, "global_step": 263136, "epoch": 2174} {"train_loss": -43.55888748168945, "global_step": 263137, "epoch": 2174} {"train_loss": -43.21926498413086, "global_step": 263138, "epoch": 2174} {"train_loss": -43.25200653076172, "global_step": 263139, "epoch": 2174} {"train_loss": -43.782222747802734, "global_step": 263140, "epoch": 2174} {"train_loss": -43.55064010620117, "global_step": 263141, "epoch": 2174} {"train_loss": -43.133522033691406, "global_step": 263142, "epoch": 2174} {"train_loss": -43.6390495300293, "global_step": 263143, "epoch": 2174} {"train_loss": -43.29200744628906, "global_step": 263144, "epoch": 2174} {"train_loss": -43.4482307434082, "global_step": 263145, "epoch": 2174} {"train_loss": -43.62980270385742, "global_step": 263146, "epoch": 2174} {"train_loss": -43.35149002075195, "global_step": 263147, "epoch": 2174} {"train_loss": -43.538307189941406, "global_step": 263148, "epoch": 2174} {"train_loss": -43.15247344970703, "global_step": 263149, "epoch": 2174} {"train_loss": -44.100067138671875, "global_step": 263150, "epoch": 2174} {"train_loss": -43.183807373046875, "global_step": 263151, "epoch": 2174} {"train_loss": -42.023921966552734, "global_step": 263152, "epoch": 2174} {"train_loss": -42.17539596557617, "global_step": 263153, "epoch": 2174} {"train_loss": -43.302589416503906, "global_step": 263154, "epoch": 2174} {"train_loss": -42.79034423828125, "global_step": 263155, "epoch": 2174} {"train_loss": -42.40204620361328, "global_step": 263156, "epoch": 2174} {"train_loss": -42.842018127441406, "global_step": 263157, "epoch": 2174} {"train_loss": -43.444793701171875, "global_step": 263158, "epoch": 2174} {"train_loss": -43.31694793701172, "global_step": 263159, "epoch": 2174} {"train_loss": -43.34402084350586, "global_step": 263160, "epoch": 2174} {"train_loss": -44.124549865722656, "global_step": 263161, "epoch": 2174} {"train_loss": -43.6252555847168, "global_step": 263162, "epoch": 2174} {"train_loss": -43.451656341552734, "global_step": 263163, "epoch": 2174} {"train_loss": -43.604454040527344, "global_step": 263164, "epoch": 2174} {"train_loss": -43.258968353271484, "global_step": 263165, "epoch": 2174} {"train_loss": -43.19021224975586, "global_step": 263166, "epoch": 2174} {"train_loss": -43.10226821899414, "global_step": 263167, "epoch": 2174} {"train_loss": -42.918216705322266, "global_step": 263168, "epoch": 2174} {"train_loss": -42.996070861816406, "global_step": 263169, "epoch": 2174} {"train_loss": -43.21226119995117, "global_step": 263170, "epoch": 2174} {"train_loss": -42.66257858276367, "global_step": 263171, "epoch": 2174} {"train_loss": -41.777435302734375, "global_step": 263172, "epoch": 2174} {"train_loss": -39.93655014038086, "global_step": 263173, "epoch": 2174} {"train_loss": -42.04661588432375, "global_step": 263174, "epoch": 2174, "val_loss": 2727742.25} {"train_loss": -42.47797393798828, "global_step": 263175, "epoch": 2175} {"train_loss": -42.31797409057617, "global_step": 263176, "epoch": 2175} {"train_loss": -37.004730224609375, "global_step": 263177, "epoch": 2175} {"train_loss": -29.93338394165039, "global_step": 263178, "epoch": 2175} {"train_loss": -32.22831344604492, "global_step": 263179, "epoch": 2175} {"train_loss": -39.06553268432617, "global_step": 263180, "epoch": 2175} {"train_loss": -38.01393508911133, "global_step": 263181, "epoch": 2175} {"train_loss": -35.828399658203125, "global_step": 263182, "epoch": 2175} {"train_loss": -39.11586380004883, "global_step": 263183, "epoch": 2175} {"train_loss": -37.54338455200195, "global_step": 263184, "epoch": 2175} {"train_loss": -36.46970748901367, "global_step": 263185, "epoch": 2175} {"train_loss": -40.526123046875, "global_step": 263186, "epoch": 2175} {"train_loss": -40.02870559692383, "global_step": 263187, "epoch": 2175} {"train_loss": -38.90224075317383, "global_step": 263188, "epoch": 2175} {"train_loss": -37.1979866027832, "global_step": 263189, "epoch": 2175} {"train_loss": -39.72397232055664, "global_step": 263190, "epoch": 2175} {"train_loss": -41.38922882080078, "global_step": 263191, "epoch": 2175} {"train_loss": -37.70009231567383, "global_step": 263192, "epoch": 2175} {"train_loss": -41.08551788330078, "global_step": 263193, "epoch": 2175} {"train_loss": -38.64236068725586, "global_step": 263194, "epoch": 2175} {"train_loss": -38.999603271484375, "global_step": 263195, "epoch": 2175} {"train_loss": -41.27210998535156, "global_step": 263196, "epoch": 2175} {"train_loss": -39.71649169921875, "global_step": 263197, "epoch": 2175} {"train_loss": -40.24042892456055, "global_step": 263198, "epoch": 2175} {"train_loss": -41.242431640625, "global_step": 263199, "epoch": 2175} {"train_loss": -38.9998779296875, "global_step": 263200, "epoch": 2175} {"train_loss": -41.904701232910156, "global_step": 263201, "epoch": 2175} {"train_loss": -39.00602340698242, "global_step": 263202, "epoch": 2175} {"train_loss": -41.5518798828125, "global_step": 263203, "epoch": 2175} {"train_loss": -40.029876708984375, "global_step": 263204, "epoch": 2175} {"train_loss": -40.4452018737793, "global_step": 263205, "epoch": 2175} {"train_loss": -41.456199645996094, "global_step": 263206, "epoch": 2175} {"train_loss": -41.07877731323242, "global_step": 263207, "epoch": 2175} {"train_loss": -41.6013069152832, "global_step": 263208, "epoch": 2175} {"train_loss": -40.55588912963867, "global_step": 263209, "epoch": 2175} {"train_loss": -41.86906814575195, "global_step": 263210, "epoch": 2175} {"train_loss": -40.81028747558594, "global_step": 263211, "epoch": 2175} {"train_loss": -42.063392639160156, "global_step": 263212, "epoch": 2175} {"train_loss": -40.981178283691406, "global_step": 263213, "epoch": 2175} {"train_loss": -42.184303283691406, "global_step": 263214, "epoch": 2175} {"train_loss": -41.080787658691406, "global_step": 263215, "epoch": 2175} {"train_loss": -42.19578552246094, "global_step": 263216, "epoch": 2175} {"train_loss": -41.7346076965332, "global_step": 263217, "epoch": 2175} {"train_loss": -42.284244537353516, "global_step": 263218, "epoch": 2175} {"train_loss": -42.1751708984375, "global_step": 263219, "epoch": 2175} {"train_loss": -42.10213851928711, "global_step": 263220, "epoch": 2175} {"train_loss": -42.151824951171875, "global_step": 263221, "epoch": 2175} {"train_loss": -42.485652923583984, "global_step": 263222, "epoch": 2175} {"train_loss": -42.53701400756836, "global_step": 263223, "epoch": 2175} {"train_loss": -42.014259338378906, "global_step": 263224, "epoch": 2175} {"train_loss": -42.621822357177734, "global_step": 263225, "epoch": 2175} {"train_loss": -43.215431213378906, "global_step": 263226, "epoch": 2175} {"train_loss": -42.46739959716797, "global_step": 263227, "epoch": 2175} {"train_loss": -42.759681701660156, "global_step": 263228, "epoch": 2175} {"train_loss": -42.93836212158203, "global_step": 263229, "epoch": 2175} {"train_loss": -43.36495590209961, "global_step": 263230, "epoch": 2175} {"train_loss": -42.97234344482422, "global_step": 263231, "epoch": 2175} {"train_loss": -43.373870849609375, "global_step": 263232, "epoch": 2175} {"train_loss": -43.46564865112305, "global_step": 263233, "epoch": 2175} {"train_loss": -43.11872100830078, "global_step": 263234, "epoch": 2175} {"train_loss": -42.838050842285156, "global_step": 263235, "epoch": 2175} {"train_loss": -43.1273078918457, "global_step": 263236, "epoch": 2175} {"train_loss": -43.1576042175293, "global_step": 263237, "epoch": 2175} {"train_loss": -43.05500411987305, "global_step": 263238, "epoch": 2175} {"train_loss": -43.23435974121094, "global_step": 263239, "epoch": 2175} {"train_loss": -43.05022048950195, "global_step": 263240, "epoch": 2175} {"train_loss": -43.23393249511719, "global_step": 263241, "epoch": 2175} {"train_loss": -43.22237014770508, "global_step": 263242, "epoch": 2175} {"train_loss": -43.35720443725586, "global_step": 263243, "epoch": 2175} {"train_loss": -43.10979461669922, "global_step": 263244, "epoch": 2175} {"train_loss": -43.45426559448242, "global_step": 263245, "epoch": 2175} {"train_loss": -43.168212890625, "global_step": 263246, "epoch": 2175} {"train_loss": -43.496524810791016, "global_step": 263247, "epoch": 2175} {"train_loss": -43.311275482177734, "global_step": 263248, "epoch": 2175} {"train_loss": -43.705665588378906, "global_step": 263249, "epoch": 2175} {"train_loss": -43.6096305847168, "global_step": 263250, "epoch": 2175} {"train_loss": -43.23299789428711, "global_step": 263251, "epoch": 2175} {"train_loss": -43.68391036987305, "global_step": 263252, "epoch": 2175} {"train_loss": -42.998905181884766, "global_step": 263253, "epoch": 2175} {"train_loss": -43.72013473510742, "global_step": 263254, "epoch": 2175} {"train_loss": -43.56425476074219, "global_step": 263255, "epoch": 2175} {"train_loss": -43.54141616821289, "global_step": 263256, "epoch": 2175} {"train_loss": -44.01017379760742, "global_step": 263257, "epoch": 2175} {"train_loss": -43.6041259765625, "global_step": 263258, "epoch": 2175} {"train_loss": -43.72666549682617, "global_step": 263259, "epoch": 2175} {"train_loss": -43.54116439819336, "global_step": 263260, "epoch": 2175} {"train_loss": -43.99679183959961, "global_step": 263261, "epoch": 2175} {"train_loss": -43.43778991699219, "global_step": 263262, "epoch": 2175} {"train_loss": -43.94552230834961, "global_step": 263263, "epoch": 2175} {"train_loss": -43.83125686645508, "global_step": 263264, "epoch": 2175} {"train_loss": -43.66630172729492, "global_step": 263265, "epoch": 2175} {"train_loss": -44.30039596557617, "global_step": 263266, "epoch": 2175} {"train_loss": -44.23029327392578, "global_step": 263267, "epoch": 2175} {"train_loss": -44.13679885864258, "global_step": 263268, "epoch": 2175} {"train_loss": -44.01163864135742, "global_step": 263269, "epoch": 2175} {"train_loss": -43.914222717285156, "global_step": 263270, "epoch": 2175} {"train_loss": -44.41156005859375, "global_step": 263271, "epoch": 2175} {"train_loss": -44.31011962890625, "global_step": 263272, "epoch": 2175} {"train_loss": -44.07575225830078, "global_step": 263273, "epoch": 2175} {"train_loss": -44.50657272338867, "global_step": 263274, "epoch": 2175} {"train_loss": -43.4056510925293, "global_step": 263275, "epoch": 2175} {"train_loss": -44.05447006225586, "global_step": 263276, "epoch": 2175} {"train_loss": -44.07866668701172, "global_step": 263277, "epoch": 2175} {"train_loss": -44.16127395629883, "global_step": 263278, "epoch": 2175} {"train_loss": -44.56707763671875, "global_step": 263279, "epoch": 2175} {"train_loss": -44.21482467651367, "global_step": 263280, "epoch": 2175} {"train_loss": -44.1508903503418, "global_step": 263281, "epoch": 2175} {"train_loss": -42.89383316040039, "global_step": 263282, "epoch": 2175} {"train_loss": -42.22240447998047, "global_step": 263283, "epoch": 2175} {"train_loss": -43.3682861328125, "global_step": 263284, "epoch": 2175} {"train_loss": -43.45209503173828, "global_step": 263285, "epoch": 2175} {"train_loss": -43.96693801879883, "global_step": 263286, "epoch": 2175} {"train_loss": -43.69096755981445, "global_step": 263287, "epoch": 2175} {"train_loss": -43.236568450927734, "global_step": 263288, "epoch": 2175} {"train_loss": -43.139137268066406, "global_step": 263289, "epoch": 2175} {"train_loss": -43.676048278808594, "global_step": 263290, "epoch": 2175} {"train_loss": -43.997135162353516, "global_step": 263291, "epoch": 2175} {"train_loss": -43.77580642700195, "global_step": 263292, "epoch": 2175} {"train_loss": -43.96845626831055, "global_step": 263293, "epoch": 2175} {"train_loss": -43.77126693725586, "global_step": 263294, "epoch": 2175} {"train_loss": -42.09524819870626, "global_step": 263295, "epoch": 2175, "val_loss": 2711204.75} {"train_loss": -43.3569221496582, "global_step": 263296, "epoch": 2176} {"train_loss": -42.8117561340332, "global_step": 263297, "epoch": 2176} {"train_loss": -42.585384368896484, "global_step": 263298, "epoch": 2176} {"train_loss": -41.25193786621094, "global_step": 263299, "epoch": 2176} {"train_loss": -39.39345169067383, "global_step": 263300, "epoch": 2176} {"train_loss": -40.250099182128906, "global_step": 263301, "epoch": 2176} {"train_loss": -41.63621520996094, "global_step": 263302, "epoch": 2176} {"train_loss": -43.17951202392578, "global_step": 263303, "epoch": 2176} {"train_loss": -43.23089599609375, "global_step": 263304, "epoch": 2176} {"train_loss": -42.920223236083984, "global_step": 263305, "epoch": 2176} {"train_loss": -41.886348724365234, "global_step": 263306, "epoch": 2176} {"train_loss": -42.09583282470703, "global_step": 263307, "epoch": 2176} {"train_loss": -42.197139739990234, "global_step": 263308, "epoch": 2176} {"train_loss": -43.26119613647461, "global_step": 263309, "epoch": 2176} {"train_loss": -42.93635177612305, "global_step": 263310, "epoch": 2176} {"train_loss": -41.48874282836914, "global_step": 263311, "epoch": 2176} {"train_loss": -42.29437255859375, "global_step": 263312, "epoch": 2176} {"train_loss": -43.41376876831055, "global_step": 263313, "epoch": 2176} {"train_loss": -41.04975509643555, "global_step": 263314, "epoch": 2176} {"train_loss": -40.525089263916016, "global_step": 263315, "epoch": 2176} {"train_loss": -42.42598342895508, "global_step": 263316, "epoch": 2176} {"train_loss": -42.187965393066406, "global_step": 263317, "epoch": 2176} {"train_loss": -41.10395050048828, "global_step": 263318, "epoch": 2176} {"train_loss": -42.9911994934082, "global_step": 263319, "epoch": 2176} {"train_loss": -41.91684341430664, "global_step": 263320, "epoch": 2176} {"train_loss": -41.47520065307617, "global_step": 263321, "epoch": 2176} {"train_loss": -43.086273193359375, "global_step": 263322, "epoch": 2176} {"train_loss": -40.300899505615234, "global_step": 263323, "epoch": 2176} {"train_loss": -41.87845993041992, "global_step": 263324, "epoch": 2176} {"train_loss": -42.854248046875, "global_step": 263325, "epoch": 2176} {"train_loss": -40.596004486083984, "global_step": 263326, "epoch": 2176} {"train_loss": -43.29319381713867, "global_step": 263327, "epoch": 2176} {"train_loss": -42.10972213745117, "global_step": 263328, "epoch": 2176} {"train_loss": -41.33724594116211, "global_step": 263329, "epoch": 2176} {"train_loss": -43.252891540527344, "global_step": 263330, "epoch": 2176} {"train_loss": -42.23543167114258, "global_step": 263331, "epoch": 2176} {"train_loss": -42.150787353515625, "global_step": 263332, "epoch": 2176} {"train_loss": -42.7882194519043, "global_step": 263333, "epoch": 2176} {"train_loss": -41.79157638549805, "global_step": 263334, "epoch": 2176} {"train_loss": -42.5295524597168, "global_step": 263335, "epoch": 2176} {"train_loss": -43.440006256103516, "global_step": 263336, "epoch": 2176} {"train_loss": -43.10891342163086, "global_step": 263337, "epoch": 2176} {"train_loss": -43.138092041015625, "global_step": 263338, "epoch": 2176} {"train_loss": -42.34969711303711, "global_step": 263339, "epoch": 2176} {"train_loss": -42.03356170654297, "global_step": 263340, "epoch": 2176} {"train_loss": -42.449317932128906, "global_step": 263341, "epoch": 2176} {"train_loss": -42.216732025146484, "global_step": 263342, "epoch": 2176} {"train_loss": -42.306575775146484, "global_step": 263343, "epoch": 2176} {"train_loss": -41.77317810058594, "global_step": 263344, "epoch": 2176} {"train_loss": -41.72783279418945, "global_step": 263345, "epoch": 2176} {"train_loss": -42.460243225097656, "global_step": 263346, "epoch": 2176} {"train_loss": -42.32257843017578, "global_step": 263347, "epoch": 2176} {"train_loss": -42.69329833984375, "global_step": 263348, "epoch": 2176} {"train_loss": -42.867164611816406, "global_step": 263349, "epoch": 2176} {"train_loss": -43.12590408325195, "global_step": 263350, "epoch": 2176} {"train_loss": -42.458900451660156, "global_step": 263351, "epoch": 2176} {"train_loss": -43.129756927490234, "global_step": 263352, "epoch": 2176} {"train_loss": -42.83185958862305, "global_step": 263353, "epoch": 2176} {"train_loss": -43.18581771850586, "global_step": 263354, "epoch": 2176} {"train_loss": -42.98432159423828, "global_step": 263355, "epoch": 2176} {"train_loss": -41.997379302978516, "global_step": 263356, "epoch": 2176} {"train_loss": -42.9410514831543, "global_step": 263357, "epoch": 2176} {"train_loss": -42.508323669433594, "global_step": 263358, "epoch": 2176} {"train_loss": -41.699249267578125, "global_step": 263359, "epoch": 2176} {"train_loss": -42.752174377441406, "global_step": 263360, "epoch": 2176} {"train_loss": -42.44990158081055, "global_step": 263361, "epoch": 2176} {"train_loss": -42.006622314453125, "global_step": 263362, "epoch": 2176} {"train_loss": -42.318721771240234, "global_step": 263363, "epoch": 2176} {"train_loss": -42.11635971069336, "global_step": 263364, "epoch": 2176} {"train_loss": -42.350189208984375, "global_step": 263365, "epoch": 2176} {"train_loss": -41.042144775390625, "global_step": 263366, "epoch": 2176} {"train_loss": -43.098270416259766, "global_step": 263367, "epoch": 2176} {"train_loss": -41.626678466796875, "global_step": 263368, "epoch": 2176} {"train_loss": -41.293514251708984, "global_step": 263369, "epoch": 2176} {"train_loss": -41.349300384521484, "global_step": 263370, "epoch": 2176} {"train_loss": -42.570106506347656, "global_step": 263371, "epoch": 2176} {"train_loss": -43.317020416259766, "global_step": 263372, "epoch": 2176} {"train_loss": -42.9117317199707, "global_step": 263373, "epoch": 2176} {"train_loss": -42.905296325683594, "global_step": 263374, "epoch": 2176} {"train_loss": -42.889495849609375, "global_step": 263375, "epoch": 2176} {"train_loss": -42.176509857177734, "global_step": 263376, "epoch": 2176} {"train_loss": -43.09502410888672, "global_step": 263377, "epoch": 2176} {"train_loss": -43.35177230834961, "global_step": 263378, "epoch": 2176} {"train_loss": -42.413848876953125, "global_step": 263379, "epoch": 2176} {"train_loss": -43.736106872558594, "global_step": 263380, "epoch": 2176} {"train_loss": -42.820735931396484, "global_step": 263381, "epoch": 2176} {"train_loss": -43.20108413696289, "global_step": 263382, "epoch": 2176} {"train_loss": -42.54519271850586, "global_step": 263383, "epoch": 2176} {"train_loss": -43.292701721191406, "global_step": 263384, "epoch": 2176} {"train_loss": -43.327144622802734, "global_step": 263385, "epoch": 2176} {"train_loss": -43.304542541503906, "global_step": 263386, "epoch": 2176} {"train_loss": -43.48563766479492, "global_step": 263387, "epoch": 2176} {"train_loss": -43.22283935546875, "global_step": 263388, "epoch": 2176} {"train_loss": -43.47776412963867, "global_step": 263389, "epoch": 2176} {"train_loss": -43.29807662963867, "global_step": 263390, "epoch": 2176} {"train_loss": -43.06242752075195, "global_step": 263391, "epoch": 2176} {"train_loss": -43.11998748779297, "global_step": 263392, "epoch": 2176} {"train_loss": -43.4570198059082, "global_step": 263393, "epoch": 2176} {"train_loss": -43.3806266784668, "global_step": 263394, "epoch": 2176} {"train_loss": -43.173213958740234, "global_step": 263395, "epoch": 2176} {"train_loss": -43.7544059753418, "global_step": 263396, "epoch": 2176} {"train_loss": -43.388145446777344, "global_step": 263397, "epoch": 2176} {"train_loss": -43.12370300292969, "global_step": 263398, "epoch": 2176} {"train_loss": -43.53372573852539, "global_step": 263399, "epoch": 2176} {"train_loss": -43.036312103271484, "global_step": 263400, "epoch": 2176} {"train_loss": -43.06515121459961, "global_step": 263401, "epoch": 2176} {"train_loss": -41.73812484741211, "global_step": 263402, "epoch": 2176} {"train_loss": -42.12229919433594, "global_step": 263403, "epoch": 2176} {"train_loss": -42.93601608276367, "global_step": 263404, "epoch": 2176} {"train_loss": -43.332698822021484, "global_step": 263405, "epoch": 2176} {"train_loss": -40.69219970703125, "global_step": 263406, "epoch": 2176} {"train_loss": -40.3830451965332, "global_step": 263407, "epoch": 2176} {"train_loss": -42.945919036865234, "global_step": 263408, "epoch": 2176} {"train_loss": -40.663936614990234, "global_step": 263409, "epoch": 2176} {"train_loss": -42.753578186035156, "global_step": 263410, "epoch": 2176} {"train_loss": -41.638092041015625, "global_step": 263411, "epoch": 2176} {"train_loss": -42.737274169921875, "global_step": 263412, "epoch": 2176} {"train_loss": -41.53702926635742, "global_step": 263413, "epoch": 2176} {"train_loss": -41.420379638671875, "global_step": 263414, "epoch": 2176} {"train_loss": -42.170711517333984, "global_step": 263415, "epoch": 2176} {"train_loss": -42.430663431971524, "global_step": 263416, "epoch": 2176, "val_loss": 2644791.0} {"train_loss": -43.062686920166016, "global_step": 263417, "epoch": 2177} {"train_loss": -41.577144622802734, "global_step": 263418, "epoch": 2177} {"train_loss": -43.2740592956543, "global_step": 263419, "epoch": 2177} {"train_loss": -42.89473342895508, "global_step": 263420, "epoch": 2177} {"train_loss": -42.54448318481445, "global_step": 263421, "epoch": 2177} {"train_loss": -43.19518280029297, "global_step": 263422, "epoch": 2177} {"train_loss": -42.387447357177734, "global_step": 263423, "epoch": 2177} {"train_loss": -42.6601676940918, "global_step": 263424, "epoch": 2177} {"train_loss": -43.08222579956055, "global_step": 263425, "epoch": 2177} {"train_loss": -42.49514389038086, "global_step": 263426, "epoch": 2177} {"train_loss": -42.367462158203125, "global_step": 263427, "epoch": 2177} {"train_loss": -43.36054611206055, "global_step": 263428, "epoch": 2177} {"train_loss": -43.152679443359375, "global_step": 263429, "epoch": 2177} {"train_loss": -42.574005126953125, "global_step": 263430, "epoch": 2177} {"train_loss": -41.516944885253906, "global_step": 263431, "epoch": 2177} {"train_loss": -43.435272216796875, "global_step": 263432, "epoch": 2177} {"train_loss": -42.12339401245117, "global_step": 263433, "epoch": 2177} {"train_loss": -42.91706466674805, "global_step": 263434, "epoch": 2177} {"train_loss": -42.15605926513672, "global_step": 263435, "epoch": 2177} {"train_loss": -42.57801818847656, "global_step": 263436, "epoch": 2177} {"train_loss": -42.30160140991211, "global_step": 263437, "epoch": 2177} {"train_loss": -42.34444046020508, "global_step": 263438, "epoch": 2177} {"train_loss": -43.10371017456055, "global_step": 263439, "epoch": 2177} {"train_loss": -42.463111877441406, "global_step": 263440, "epoch": 2177} {"train_loss": -42.380714416503906, "global_step": 263441, "epoch": 2177} {"train_loss": -42.68373489379883, "global_step": 263442, "epoch": 2177} {"train_loss": -43.09226989746094, "global_step": 263443, "epoch": 2177} {"train_loss": -42.76383590698242, "global_step": 263444, "epoch": 2177} {"train_loss": -42.05986785888672, "global_step": 263445, "epoch": 2177} {"train_loss": -42.7504768371582, "global_step": 263446, "epoch": 2177} {"train_loss": -42.99869918823242, "global_step": 263447, "epoch": 2177} {"train_loss": -42.18532943725586, "global_step": 263448, "epoch": 2177} {"train_loss": -41.78248596191406, "global_step": 263449, "epoch": 2177} {"train_loss": -42.35493850708008, "global_step": 263450, "epoch": 2177} {"train_loss": -43.134910583496094, "global_step": 263451, "epoch": 2177} {"train_loss": -42.0973014831543, "global_step": 263452, "epoch": 2177} {"train_loss": -42.464908599853516, "global_step": 263453, "epoch": 2177} {"train_loss": -42.64728927612305, "global_step": 263454, "epoch": 2177} {"train_loss": -42.3222770690918, "global_step": 263455, "epoch": 2177} {"train_loss": -42.409332275390625, "global_step": 263456, "epoch": 2177} {"train_loss": -43.8686408996582, "global_step": 263457, "epoch": 2177} {"train_loss": -42.19314193725586, "global_step": 263458, "epoch": 2177} {"train_loss": -39.38089370727539, "global_step": 263459, "epoch": 2177} {"train_loss": -40.07938766479492, "global_step": 263460, "epoch": 2177} {"train_loss": -43.247798919677734, "global_step": 263461, "epoch": 2177} {"train_loss": -38.7539176940918, "global_step": 263462, "epoch": 2177} {"train_loss": -36.97176742553711, "global_step": 263463, "epoch": 2177} {"train_loss": -40.42451095581055, "global_step": 263464, "epoch": 2177} {"train_loss": -27.50409507751465, "global_step": 263465, "epoch": 2177} {"train_loss": -33.391029357910156, "global_step": 263466, "epoch": 2177} {"train_loss": -41.30754470825195, "global_step": 263467, "epoch": 2177} {"train_loss": -26.940351486206055, "global_step": 263468, "epoch": 2177} {"train_loss": -38.409603118896484, "global_step": 263469, "epoch": 2177} {"train_loss": -33.052337646484375, "global_step": 263470, "epoch": 2177} {"train_loss": -29.2327938079834, "global_step": 263471, "epoch": 2177} {"train_loss": -41.64068603515625, "global_step": 263472, "epoch": 2177} {"train_loss": -33.00244903564453, "global_step": 263473, "epoch": 2177} {"train_loss": -41.0775260925293, "global_step": 263474, "epoch": 2177} {"train_loss": -35.641849517822266, "global_step": 263475, "epoch": 2177} {"train_loss": -39.891326904296875, "global_step": 263476, "epoch": 2177} {"train_loss": -35.8377685546875, "global_step": 263477, "epoch": 2177} {"train_loss": -41.49637985229492, "global_step": 263478, "epoch": 2177} {"train_loss": -36.8515739440918, "global_step": 263479, "epoch": 2177} {"train_loss": -41.052711486816406, "global_step": 263480, "epoch": 2177} {"train_loss": -38.294002532958984, "global_step": 263481, "epoch": 2177} {"train_loss": -41.3257942199707, "global_step": 263482, "epoch": 2177} {"train_loss": -40.0655632019043, "global_step": 263483, "epoch": 2177} {"train_loss": -41.40244674682617, "global_step": 263484, "epoch": 2177} {"train_loss": -40.74512481689453, "global_step": 263485, "epoch": 2177} {"train_loss": -41.78287887573242, "global_step": 263486, "epoch": 2177} {"train_loss": -40.86804962158203, "global_step": 263487, "epoch": 2177} {"train_loss": -41.43513107299805, "global_step": 263488, "epoch": 2177} {"train_loss": -42.01096725463867, "global_step": 263489, "epoch": 2177} {"train_loss": -41.73746109008789, "global_step": 263490, "epoch": 2177} {"train_loss": -41.99333190917969, "global_step": 263491, "epoch": 2177} {"train_loss": -41.77490997314453, "global_step": 263492, "epoch": 2177} {"train_loss": -42.45414352416992, "global_step": 263493, "epoch": 2177} {"train_loss": -42.02473449707031, "global_step": 263494, "epoch": 2177} {"train_loss": -42.326839447021484, "global_step": 263495, "epoch": 2177} {"train_loss": -42.400047302246094, "global_step": 263496, "epoch": 2177} {"train_loss": -42.03730392456055, "global_step": 263497, "epoch": 2177} {"train_loss": -42.63788986206055, "global_step": 263498, "epoch": 2177} {"train_loss": -42.26790237426758, "global_step": 263499, "epoch": 2177} {"train_loss": -42.65054702758789, "global_step": 263500, "epoch": 2177} {"train_loss": -42.644134521484375, "global_step": 263501, "epoch": 2177} {"train_loss": -42.72823715209961, "global_step": 263502, "epoch": 2177} {"train_loss": -42.868934631347656, "global_step": 263503, "epoch": 2177} {"train_loss": -42.854740142822266, "global_step": 263504, "epoch": 2177} {"train_loss": -42.4477653503418, "global_step": 263505, "epoch": 2177} {"train_loss": -42.51567077636719, "global_step": 263506, "epoch": 2177} {"train_loss": -43.2410888671875, "global_step": 263507, "epoch": 2177} {"train_loss": -43.13320541381836, "global_step": 263508, "epoch": 2177} {"train_loss": -43.1721305847168, "global_step": 263509, "epoch": 2177} {"train_loss": -43.674095153808594, "global_step": 263510, "epoch": 2177} {"train_loss": -42.61722183227539, "global_step": 263511, "epoch": 2177} {"train_loss": -42.961395263671875, "global_step": 263512, "epoch": 2177} {"train_loss": -43.291053771972656, "global_step": 263513, "epoch": 2177} {"train_loss": -43.10691452026367, "global_step": 263514, "epoch": 2177} {"train_loss": -42.81129837036133, "global_step": 263515, "epoch": 2177} {"train_loss": -43.34864044189453, "global_step": 263516, "epoch": 2177} {"train_loss": -43.19094467163086, "global_step": 263517, "epoch": 2177} {"train_loss": -43.0802116394043, "global_step": 263518, "epoch": 2177} {"train_loss": -43.3148078918457, "global_step": 263519, "epoch": 2177} {"train_loss": -43.4321403503418, "global_step": 263520, "epoch": 2177} {"train_loss": -43.3017463684082, "global_step": 263521, "epoch": 2177} {"train_loss": -43.71293258666992, "global_step": 263522, "epoch": 2177} {"train_loss": -43.5449104309082, "global_step": 263523, "epoch": 2177} {"train_loss": -43.44698715209961, "global_step": 263524, "epoch": 2177} {"train_loss": -43.6496696472168, "global_step": 263525, "epoch": 2177} {"train_loss": -43.293212890625, "global_step": 263526, "epoch": 2177} {"train_loss": -43.68407440185547, "global_step": 263527, "epoch": 2177} {"train_loss": -43.26408767700195, "global_step": 263528, "epoch": 2177} {"train_loss": -43.38434600830078, "global_step": 263529, "epoch": 2177} {"train_loss": -43.19068908691406, "global_step": 263530, "epoch": 2177} {"train_loss": -43.55434036254883, "global_step": 263531, "epoch": 2177} {"train_loss": -43.70540237426758, "global_step": 263532, "epoch": 2177} {"train_loss": -43.65847396850586, "global_step": 263533, "epoch": 2177} {"train_loss": -43.335365295410156, "global_step": 263534, "epoch": 2177} {"train_loss": -43.64494705200195, "global_step": 263535, "epoch": 2177} {"train_loss": -43.38756561279297, "global_step": 263536, "epoch": 2177} {"train_loss": -41.630394439066734, "global_step": 263537, "epoch": 2177, "val_loss": 2695976.25} {"train_loss": -43.7974967956543, "global_step": 263538, "epoch": 2178} {"train_loss": -43.367279052734375, "global_step": 263539, "epoch": 2178} {"train_loss": -43.484371185302734, "global_step": 263540, "epoch": 2178} {"train_loss": -43.72018051147461, "global_step": 263541, "epoch": 2178} {"train_loss": -43.83439254760742, "global_step": 263542, "epoch": 2178} {"train_loss": -43.40584945678711, "global_step": 263543, "epoch": 2178} {"train_loss": -43.750728607177734, "global_step": 263544, "epoch": 2178} {"train_loss": -43.7111701965332, "global_step": 263545, "epoch": 2178} {"train_loss": -43.81873321533203, "global_step": 263546, "epoch": 2178} {"train_loss": -44.10346603393555, "global_step": 263547, "epoch": 2178} {"train_loss": -44.26443099975586, "global_step": 263548, "epoch": 2178} {"train_loss": -44.03995895385742, "global_step": 263549, "epoch": 2178} {"train_loss": -44.115413665771484, "global_step": 263550, "epoch": 2178} {"train_loss": -43.84642791748047, "global_step": 263551, "epoch": 2178} {"train_loss": -43.36411666870117, "global_step": 263552, "epoch": 2178} {"train_loss": -43.983985900878906, "global_step": 263553, "epoch": 2178} {"train_loss": -43.60380172729492, "global_step": 263554, "epoch": 2178} {"train_loss": -43.832515716552734, "global_step": 263555, "epoch": 2178} {"train_loss": -44.2084846496582, "global_step": 263556, "epoch": 2178} {"train_loss": -43.78629684448242, "global_step": 263557, "epoch": 2178} {"train_loss": -44.02866744995117, "global_step": 263558, "epoch": 2178} {"train_loss": -43.76149368286133, "global_step": 263559, "epoch": 2178} {"train_loss": -43.82271957397461, "global_step": 263560, "epoch": 2178} {"train_loss": -43.507083892822266, "global_step": 263561, "epoch": 2178} {"train_loss": -43.072608947753906, "global_step": 263562, "epoch": 2178} {"train_loss": -41.858524322509766, "global_step": 263563, "epoch": 2178} {"train_loss": -43.24968338012695, "global_step": 263564, "epoch": 2178} {"train_loss": -42.81356430053711, "global_step": 263565, "epoch": 2178} {"train_loss": -43.40266036987305, "global_step": 263566, "epoch": 2178} {"train_loss": -43.4300651550293, "global_step": 263567, "epoch": 2178} {"train_loss": -44.20911407470703, "global_step": 263568, "epoch": 2178} {"train_loss": -42.930477142333984, "global_step": 263569, "epoch": 2178} {"train_loss": -43.1671257019043, "global_step": 263570, "epoch": 2178} {"train_loss": -43.340450286865234, "global_step": 263571, "epoch": 2178} {"train_loss": -42.866573333740234, "global_step": 263572, "epoch": 2178} {"train_loss": -43.76396560668945, "global_step": 263573, "epoch": 2178} {"train_loss": -43.28763961791992, "global_step": 263574, "epoch": 2178} {"train_loss": -43.9453239440918, "global_step": 263575, "epoch": 2178} {"train_loss": -43.75236129760742, "global_step": 263576, "epoch": 2178} {"train_loss": -43.728389739990234, "global_step": 263577, "epoch": 2178} {"train_loss": -43.714046478271484, "global_step": 263578, "epoch": 2178} {"train_loss": -43.242740631103516, "global_step": 263579, "epoch": 2178} {"train_loss": -43.40073776245117, "global_step": 263580, "epoch": 2178} {"train_loss": -43.128536224365234, "global_step": 263581, "epoch": 2178} {"train_loss": -44.28412628173828, "global_step": 263582, "epoch": 2178} {"train_loss": -43.1279296875, "global_step": 263583, "epoch": 2178} {"train_loss": -43.73867416381836, "global_step": 263584, "epoch": 2178} {"train_loss": -41.50630569458008, "global_step": 263585, "epoch": 2178} {"train_loss": -40.77620315551758, "global_step": 263586, "epoch": 2178} {"train_loss": -38.8568229675293, "global_step": 263587, "epoch": 2178} {"train_loss": -40.83369064331055, "global_step": 263588, "epoch": 2178} {"train_loss": -41.104087829589844, "global_step": 263589, "epoch": 2178} {"train_loss": -39.13741683959961, "global_step": 263590, "epoch": 2178} {"train_loss": -40.16133499145508, "global_step": 263591, "epoch": 2178} {"train_loss": -42.40645980834961, "global_step": 263592, "epoch": 2178} {"train_loss": -43.403194427490234, "global_step": 263593, "epoch": 2178} {"train_loss": -39.74824142456055, "global_step": 263594, "epoch": 2178} {"train_loss": -36.25273513793945, "global_step": 263595, "epoch": 2178} {"train_loss": -40.93061447143555, "global_step": 263596, "epoch": 2178} {"train_loss": -41.13932418823242, "global_step": 263597, "epoch": 2178} {"train_loss": -37.663936614990234, "global_step": 263598, "epoch": 2178} {"train_loss": -39.154293060302734, "global_step": 263599, "epoch": 2178} {"train_loss": -42.1571159362793, "global_step": 263600, "epoch": 2178} {"train_loss": -40.73926544189453, "global_step": 263601, "epoch": 2178} {"train_loss": -39.582252502441406, "global_step": 263602, "epoch": 2178} {"train_loss": -41.75726318359375, "global_step": 263603, "epoch": 2178} {"train_loss": -38.93870162963867, "global_step": 263604, "epoch": 2178} {"train_loss": -41.61639404296875, "global_step": 263605, "epoch": 2178} {"train_loss": -41.70284652709961, "global_step": 263606, "epoch": 2178} {"train_loss": -38.65708541870117, "global_step": 263607, "epoch": 2178} {"train_loss": -39.5008430480957, "global_step": 263608, "epoch": 2178} {"train_loss": -38.678462982177734, "global_step": 263609, "epoch": 2178} {"train_loss": -42.001373291015625, "global_step": 263610, "epoch": 2178} {"train_loss": -40.95075225830078, "global_step": 263611, "epoch": 2178} {"train_loss": -41.17354202270508, "global_step": 263612, "epoch": 2178} {"train_loss": -41.200599670410156, "global_step": 263613, "epoch": 2178} {"train_loss": -41.44791793823242, "global_step": 263614, "epoch": 2178} {"train_loss": -41.33747482299805, "global_step": 263615, "epoch": 2178} {"train_loss": -41.5309944152832, "global_step": 263616, "epoch": 2178} {"train_loss": -42.12406539916992, "global_step": 263617, "epoch": 2178} {"train_loss": -40.796207427978516, "global_step": 263618, "epoch": 2178} {"train_loss": -42.70753860473633, "global_step": 263619, "epoch": 2178} {"train_loss": -41.81993103027344, "global_step": 263620, "epoch": 2178} {"train_loss": -42.304054260253906, "global_step": 263621, "epoch": 2178} {"train_loss": -42.4110221862793, "global_step": 263622, "epoch": 2178} {"train_loss": -41.506744384765625, "global_step": 263623, "epoch": 2178} {"train_loss": -40.47700119018555, "global_step": 263624, "epoch": 2178} {"train_loss": -42.5737419128418, "global_step": 263625, "epoch": 2178} {"train_loss": -42.60279083251953, "global_step": 263626, "epoch": 2178} {"train_loss": -42.94296646118164, "global_step": 263627, "epoch": 2178} {"train_loss": -42.40630340576172, "global_step": 263628, "epoch": 2178} {"train_loss": -42.83806228637695, "global_step": 263629, "epoch": 2178} {"train_loss": -43.07822036743164, "global_step": 263630, "epoch": 2178} {"train_loss": -42.846988677978516, "global_step": 263631, "epoch": 2178} {"train_loss": -42.96873092651367, "global_step": 263632, "epoch": 2178} {"train_loss": -42.87945556640625, "global_step": 263633, "epoch": 2178} {"train_loss": -43.08590316772461, "global_step": 263634, "epoch": 2178} {"train_loss": -42.84151077270508, "global_step": 263635, "epoch": 2178} {"train_loss": -43.28865051269531, "global_step": 263636, "epoch": 2178} {"train_loss": -43.49799346923828, "global_step": 263637, "epoch": 2178} {"train_loss": -42.86962890625, "global_step": 263638, "epoch": 2178} {"train_loss": -43.22781753540039, "global_step": 263639, "epoch": 2178} {"train_loss": -43.411128997802734, "global_step": 263640, "epoch": 2178} {"train_loss": -43.0594367980957, "global_step": 263641, "epoch": 2178} {"train_loss": -41.8111686706543, "global_step": 263642, "epoch": 2178} {"train_loss": -43.83504867553711, "global_step": 263643, "epoch": 2178} {"train_loss": -43.088600158691406, "global_step": 263644, "epoch": 2178} {"train_loss": -41.42879104614258, "global_step": 263645, "epoch": 2178} {"train_loss": -41.81722640991211, "global_step": 263646, "epoch": 2178} {"train_loss": -43.407405853271484, "global_step": 263647, "epoch": 2178} {"train_loss": -39.96866226196289, "global_step": 263648, "epoch": 2178} {"train_loss": -43.56745910644531, "global_step": 263649, "epoch": 2178} {"train_loss": -42.87761688232422, "global_step": 263650, "epoch": 2178} {"train_loss": -42.57697677612305, "global_step": 263651, "epoch": 2178} {"train_loss": -41.5366325378418, "global_step": 263652, "epoch": 2178} {"train_loss": -33.572906494140625, "global_step": 263653, "epoch": 2178} {"train_loss": -41.639461517333984, "global_step": 263654, "epoch": 2178} {"train_loss": -39.36865997314453, "global_step": 263655, "epoch": 2178} {"train_loss": -37.557640075683594, "global_step": 263656, "epoch": 2178} {"train_loss": -42.840492248535156, "global_step": 263657, "epoch": 2178} {"train_loss": -42.24320406953165, "global_step": 263658, "epoch": 2178, "val_loss": 2594741.25} {"train_loss": -39.54938888549805, "global_step": 263659, "epoch": 2179} {"train_loss": -33.05093765258789, "global_step": 263660, "epoch": 2179} {"train_loss": -34.44001388549805, "global_step": 263661, "epoch": 2179} {"train_loss": -40.36249923706055, "global_step": 263662, "epoch": 2179} {"train_loss": -38.29392623901367, "global_step": 263663, "epoch": 2179} {"train_loss": -38.27882766723633, "global_step": 263664, "epoch": 2179} {"train_loss": -41.82448196411133, "global_step": 263665, "epoch": 2179} {"train_loss": -42.27531051635742, "global_step": 263666, "epoch": 2179} {"train_loss": -36.33667755126953, "global_step": 263667, "epoch": 2179} {"train_loss": -42.16371536254883, "global_step": 263668, "epoch": 2179} {"train_loss": -39.456546783447266, "global_step": 263669, "epoch": 2179} {"train_loss": -35.31456756591797, "global_step": 263670, "epoch": 2179} {"train_loss": -41.63307571411133, "global_step": 263671, "epoch": 2179} {"train_loss": -39.69140625, "global_step": 263672, "epoch": 2179} {"train_loss": -41.44975662231445, "global_step": 263673, "epoch": 2179} {"train_loss": -40.144744873046875, "global_step": 263674, "epoch": 2179} {"train_loss": -40.14225387573242, "global_step": 263675, "epoch": 2179} {"train_loss": -40.88045883178711, "global_step": 263676, "epoch": 2179} {"train_loss": -39.95232009887695, "global_step": 263677, "epoch": 2179} {"train_loss": -41.464599609375, "global_step": 263678, "epoch": 2179} {"train_loss": -41.704036712646484, "global_step": 263679, "epoch": 2179} {"train_loss": -42.113670349121094, "global_step": 263680, "epoch": 2179} {"train_loss": -41.50014877319336, "global_step": 263681, "epoch": 2179} {"train_loss": -42.375213623046875, "global_step": 263682, "epoch": 2179} {"train_loss": -40.301025390625, "global_step": 263683, "epoch": 2179} {"train_loss": -40.3094596862793, "global_step": 263684, "epoch": 2179} {"train_loss": -41.125057220458984, "global_step": 263685, "epoch": 2179} {"train_loss": -41.93546676635742, "global_step": 263686, "epoch": 2179} {"train_loss": -42.22174835205078, "global_step": 263687, "epoch": 2179} {"train_loss": -39.20396423339844, "global_step": 263688, "epoch": 2179} {"train_loss": -40.8746452331543, "global_step": 263689, "epoch": 2179} {"train_loss": -42.23488235473633, "global_step": 263690, "epoch": 2179} {"train_loss": -41.62202072143555, "global_step": 263691, "epoch": 2179} {"train_loss": -42.11640167236328, "global_step": 263692, "epoch": 2179} {"train_loss": -42.22492599487305, "global_step": 263693, "epoch": 2179} {"train_loss": -42.42733383178711, "global_step": 263694, "epoch": 2179} {"train_loss": -42.304508209228516, "global_step": 263695, "epoch": 2179} {"train_loss": -41.966922760009766, "global_step": 263696, "epoch": 2179} {"train_loss": -42.84147644042969, "global_step": 263697, "epoch": 2179} {"train_loss": -41.88412094116211, "global_step": 263698, "epoch": 2179} {"train_loss": -42.84133529663086, "global_step": 263699, "epoch": 2179} {"train_loss": -42.11005401611328, "global_step": 263700, "epoch": 2179} {"train_loss": -42.32532501220703, "global_step": 263701, "epoch": 2179} {"train_loss": -41.91761016845703, "global_step": 263702, "epoch": 2179} {"train_loss": -40.39109420776367, "global_step": 263703, "epoch": 2179} {"train_loss": -42.026329040527344, "global_step": 263704, "epoch": 2179} {"train_loss": -42.835418701171875, "global_step": 263705, "epoch": 2179} {"train_loss": -42.43318176269531, "global_step": 263706, "epoch": 2179} {"train_loss": -42.81531524658203, "global_step": 263707, "epoch": 2179} {"train_loss": -42.51885223388672, "global_step": 263708, "epoch": 2179} {"train_loss": -42.63526916503906, "global_step": 263709, "epoch": 2179} {"train_loss": -42.7825927734375, "global_step": 263710, "epoch": 2179} {"train_loss": -43.065128326416016, "global_step": 263711, "epoch": 2179} {"train_loss": -42.615779876708984, "global_step": 263712, "epoch": 2179} {"train_loss": -43.07440948486328, "global_step": 263713, "epoch": 2179} {"train_loss": -42.351417541503906, "global_step": 263714, "epoch": 2179} {"train_loss": -42.85948181152344, "global_step": 263715, "epoch": 2179} {"train_loss": -43.101436614990234, "global_step": 263716, "epoch": 2179} {"train_loss": -43.42814636230469, "global_step": 263717, "epoch": 2179} {"train_loss": -41.74564743041992, "global_step": 263718, "epoch": 2179} {"train_loss": -42.72690963745117, "global_step": 263719, "epoch": 2179} {"train_loss": -41.80962371826172, "global_step": 263720, "epoch": 2179} {"train_loss": -43.63581848144531, "global_step": 263721, "epoch": 2179} {"train_loss": -43.11989974975586, "global_step": 263722, "epoch": 2179} {"train_loss": -43.46464920043945, "global_step": 263723, "epoch": 2179} {"train_loss": -43.26648712158203, "global_step": 263724, "epoch": 2179} {"train_loss": -43.37446975708008, "global_step": 263725, "epoch": 2179} {"train_loss": -43.61549758911133, "global_step": 263726, "epoch": 2179} {"train_loss": -42.927711486816406, "global_step": 263727, "epoch": 2179} {"train_loss": -42.84292221069336, "global_step": 263728, "epoch": 2179} {"train_loss": -43.63481521606445, "global_step": 263729, "epoch": 2179} {"train_loss": -43.52705764770508, "global_step": 263730, "epoch": 2179} {"train_loss": -42.90771484375, "global_step": 263731, "epoch": 2179} {"train_loss": -43.62081527709961, "global_step": 263732, "epoch": 2179} {"train_loss": -42.90896224975586, "global_step": 263733, "epoch": 2179} {"train_loss": -44.139801025390625, "global_step": 263734, "epoch": 2179} {"train_loss": -43.21177291870117, "global_step": 263735, "epoch": 2179} {"train_loss": -43.256839752197266, "global_step": 263736, "epoch": 2179} {"train_loss": -43.55953598022461, "global_step": 263737, "epoch": 2179} {"train_loss": -42.565670013427734, "global_step": 263738, "epoch": 2179} {"train_loss": -43.6390495300293, "global_step": 263739, "epoch": 2179} {"train_loss": -43.29298782348633, "global_step": 263740, "epoch": 2179} {"train_loss": -43.50989532470703, "global_step": 263741, "epoch": 2179} {"train_loss": -43.57234573364258, "global_step": 263742, "epoch": 2179} {"train_loss": -43.98402786254883, "global_step": 263743, "epoch": 2179} {"train_loss": -43.61003494262695, "global_step": 263744, "epoch": 2179} {"train_loss": -42.90328598022461, "global_step": 263745, "epoch": 2179} {"train_loss": -43.91724395751953, "global_step": 263746, "epoch": 2179} {"train_loss": -42.86764907836914, "global_step": 263747, "epoch": 2179} {"train_loss": -42.08602523803711, "global_step": 263748, "epoch": 2179} {"train_loss": -43.465187072753906, "global_step": 263749, "epoch": 2179} {"train_loss": -43.03530502319336, "global_step": 263750, "epoch": 2179} {"train_loss": -42.221370697021484, "global_step": 263751, "epoch": 2179} {"train_loss": -43.270572662353516, "global_step": 263752, "epoch": 2179} {"train_loss": -42.380882263183594, "global_step": 263753, "epoch": 2179} {"train_loss": -43.06553649902344, "global_step": 263754, "epoch": 2179} {"train_loss": -42.488033294677734, "global_step": 263755, "epoch": 2179} {"train_loss": -42.27253341674805, "global_step": 263756, "epoch": 2179} {"train_loss": -43.76539993286133, "global_step": 263757, "epoch": 2179} {"train_loss": -43.62970733642578, "global_step": 263758, "epoch": 2179} {"train_loss": -43.43351745605469, "global_step": 263759, "epoch": 2179} {"train_loss": -43.83252716064453, "global_step": 263760, "epoch": 2179} {"train_loss": -42.864009857177734, "global_step": 263761, "epoch": 2179} {"train_loss": -43.23968505859375, "global_step": 263762, "epoch": 2179} {"train_loss": -43.47140121459961, "global_step": 263763, "epoch": 2179} {"train_loss": -42.97113037109375, "global_step": 263764, "epoch": 2179} {"train_loss": -42.798885345458984, "global_step": 263765, "epoch": 2179} {"train_loss": -43.634002685546875, "global_step": 263766, "epoch": 2179} {"train_loss": -43.108219146728516, "global_step": 263767, "epoch": 2179} {"train_loss": -43.679630279541016, "global_step": 263768, "epoch": 2179} {"train_loss": -43.22331619262695, "global_step": 263769, "epoch": 2179} {"train_loss": -42.055908203125, "global_step": 263770, "epoch": 2179} {"train_loss": -43.00520706176758, "global_step": 263771, "epoch": 2179} {"train_loss": -42.68059158325195, "global_step": 263772, "epoch": 2179} {"train_loss": -41.95649337768555, "global_step": 263773, "epoch": 2179} {"train_loss": -43.40436553955078, "global_step": 263774, "epoch": 2179} {"train_loss": -42.43172836303711, "global_step": 263775, "epoch": 2179} {"train_loss": -40.44298553466797, "global_step": 263776, "epoch": 2179} {"train_loss": -40.23013687133789, "global_step": 263777, "epoch": 2179} {"train_loss": -42.18684768676758, "global_step": 263778, "epoch": 2179} {"train_loss": -42.07685634518458, "global_step": 263779, "epoch": 2179, "val_loss": 2711314.25} {"train_loss": -41.12479782104492, "global_step": 263780, "epoch": 2180} {"train_loss": -42.25246047973633, "global_step": 263781, "epoch": 2180} {"train_loss": -41.09846496582031, "global_step": 263782, "epoch": 2180} {"train_loss": -42.016544342041016, "global_step": 263783, "epoch": 2180} {"train_loss": -42.02931594848633, "global_step": 263784, "epoch": 2180} {"train_loss": -41.058082580566406, "global_step": 263785, "epoch": 2180} {"train_loss": -40.97092056274414, "global_step": 263786, "epoch": 2180} {"train_loss": -42.2329216003418, "global_step": 263787, "epoch": 2180} {"train_loss": -42.99517822265625, "global_step": 263788, "epoch": 2180} {"train_loss": -42.982173919677734, "global_step": 263789, "epoch": 2180} {"train_loss": -42.28771209716797, "global_step": 263790, "epoch": 2180} {"train_loss": -42.15571212768555, "global_step": 263791, "epoch": 2180} {"train_loss": -42.9506721496582, "global_step": 263792, "epoch": 2180} {"train_loss": -42.33469772338867, "global_step": 263793, "epoch": 2180} {"train_loss": -40.52317428588867, "global_step": 263794, "epoch": 2180} {"train_loss": -42.812225341796875, "global_step": 263795, "epoch": 2180} {"train_loss": -42.391441345214844, "global_step": 263796, "epoch": 2180} {"train_loss": -42.45486068725586, "global_step": 263797, "epoch": 2180} {"train_loss": -42.21171188354492, "global_step": 263798, "epoch": 2180} {"train_loss": -43.33154296875, "global_step": 263799, "epoch": 2180} {"train_loss": -41.669219970703125, "global_step": 263800, "epoch": 2180} {"train_loss": -42.800384521484375, "global_step": 263801, "epoch": 2180} {"train_loss": -42.744300842285156, "global_step": 263802, "epoch": 2180} {"train_loss": -41.350101470947266, "global_step": 263803, "epoch": 2180} {"train_loss": -42.17024612426758, "global_step": 263804, "epoch": 2180} {"train_loss": -42.011260986328125, "global_step": 263805, "epoch": 2180} {"train_loss": -41.39931869506836, "global_step": 263806, "epoch": 2180} {"train_loss": -42.89986801147461, "global_step": 263807, "epoch": 2180} {"train_loss": -41.414207458496094, "global_step": 263808, "epoch": 2180} {"train_loss": -42.224605560302734, "global_step": 263809, "epoch": 2180} {"train_loss": -42.459007263183594, "global_step": 263810, "epoch": 2180} {"train_loss": -43.05526351928711, "global_step": 263811, "epoch": 2180} {"train_loss": -42.450801849365234, "global_step": 263812, "epoch": 2180} {"train_loss": -43.07796859741211, "global_step": 263813, "epoch": 2180} {"train_loss": -42.61778259277344, "global_step": 263814, "epoch": 2180} {"train_loss": -43.0210075378418, "global_step": 263815, "epoch": 2180} {"train_loss": -43.2331657409668, "global_step": 263816, "epoch": 2180} {"train_loss": -43.03249740600586, "global_step": 263817, "epoch": 2180} {"train_loss": -43.306819915771484, "global_step": 263818, "epoch": 2180} {"train_loss": -42.12575912475586, "global_step": 263819, "epoch": 2180} {"train_loss": -43.005001068115234, "global_step": 263820, "epoch": 2180} {"train_loss": -42.93891525268555, "global_step": 263821, "epoch": 2180} {"train_loss": -43.053466796875, "global_step": 263822, "epoch": 2180} {"train_loss": -42.94528579711914, "global_step": 263823, "epoch": 2180} {"train_loss": -42.48326110839844, "global_step": 263824, "epoch": 2180} {"train_loss": -43.6381950378418, "global_step": 263825, "epoch": 2180} {"train_loss": -42.915870666503906, "global_step": 263826, "epoch": 2180} {"train_loss": -42.20782470703125, "global_step": 263827, "epoch": 2180} {"train_loss": -42.801265716552734, "global_step": 263828, "epoch": 2180} {"train_loss": -43.15633773803711, "global_step": 263829, "epoch": 2180} {"train_loss": -43.612709045410156, "global_step": 263830, "epoch": 2180} {"train_loss": -42.8397331237793, "global_step": 263831, "epoch": 2180} {"train_loss": -43.10892868041992, "global_step": 263832, "epoch": 2180} {"train_loss": -42.97688293457031, "global_step": 263833, "epoch": 2180} {"train_loss": -42.738792419433594, "global_step": 263834, "epoch": 2180} {"train_loss": -43.7066764831543, "global_step": 263835, "epoch": 2180} {"train_loss": -43.65517807006836, "global_step": 263836, "epoch": 2180} {"train_loss": -43.19869613647461, "global_step": 263837, "epoch": 2180} {"train_loss": -43.854339599609375, "global_step": 263838, "epoch": 2180} {"train_loss": -43.27698516845703, "global_step": 263839, "epoch": 2180} {"train_loss": -42.707820892333984, "global_step": 263840, "epoch": 2180} {"train_loss": -43.20687484741211, "global_step": 263841, "epoch": 2180} {"train_loss": -42.80127716064453, "global_step": 263842, "epoch": 2180} {"train_loss": -43.27778244018555, "global_step": 263843, "epoch": 2180} {"train_loss": -43.553436279296875, "global_step": 263844, "epoch": 2180} {"train_loss": -43.47460174560547, "global_step": 263845, "epoch": 2180} {"train_loss": -43.5434455871582, "global_step": 263846, "epoch": 2180} {"train_loss": -43.69386672973633, "global_step": 263847, "epoch": 2180} {"train_loss": -42.261749267578125, "global_step": 263848, "epoch": 2180} {"train_loss": -40.81594467163086, "global_step": 263849, "epoch": 2180} {"train_loss": -42.875, "global_step": 263850, "epoch": 2180} {"train_loss": -41.076446533203125, "global_step": 263851, "epoch": 2180} {"train_loss": -39.19611358642578, "global_step": 263852, "epoch": 2180} {"train_loss": -43.08878707885742, "global_step": 263853, "epoch": 2180} {"train_loss": -40.41750717163086, "global_step": 263854, "epoch": 2180} {"train_loss": -37.46873092651367, "global_step": 263855, "epoch": 2180} {"train_loss": -40.64836120605469, "global_step": 263856, "epoch": 2180} {"train_loss": -38.368019104003906, "global_step": 263857, "epoch": 2180} {"train_loss": -35.95327377319336, "global_step": 263858, "epoch": 2180} {"train_loss": -35.9028205871582, "global_step": 263859, "epoch": 2180} {"train_loss": -37.85651779174805, "global_step": 263860, "epoch": 2180} {"train_loss": -37.183414459228516, "global_step": 263861, "epoch": 2180} {"train_loss": -28.688434600830078, "global_step": 263862, "epoch": 2180} {"train_loss": -36.78672409057617, "global_step": 263863, "epoch": 2180} {"train_loss": -37.320125579833984, "global_step": 263864, "epoch": 2180} {"train_loss": -35.02464294433594, "global_step": 263865, "epoch": 2180} {"train_loss": -38.98712921142578, "global_step": 263866, "epoch": 2180} {"train_loss": -40.925025939941406, "global_step": 263867, "epoch": 2180} {"train_loss": -38.24247360229492, "global_step": 263868, "epoch": 2180} {"train_loss": -38.64183807373047, "global_step": 263869, "epoch": 2180} {"train_loss": -39.284828186035156, "global_step": 263870, "epoch": 2180} {"train_loss": -40.56039047241211, "global_step": 263871, "epoch": 2180} {"train_loss": -40.17367172241211, "global_step": 263872, "epoch": 2180} {"train_loss": -42.0416145324707, "global_step": 263873, "epoch": 2180} {"train_loss": -40.963172912597656, "global_step": 263874, "epoch": 2180} {"train_loss": -42.2503547668457, "global_step": 263875, "epoch": 2180} {"train_loss": -40.45172119140625, "global_step": 263876, "epoch": 2180} {"train_loss": -41.034725189208984, "global_step": 263877, "epoch": 2180} {"train_loss": -40.973838806152344, "global_step": 263878, "epoch": 2180} {"train_loss": -41.132957458496094, "global_step": 263879, "epoch": 2180} {"train_loss": -42.02975845336914, "global_step": 263880, "epoch": 2180} {"train_loss": -42.020992279052734, "global_step": 263881, "epoch": 2180} {"train_loss": -41.81357192993164, "global_step": 263882, "epoch": 2180} {"train_loss": -42.013065338134766, "global_step": 263883, "epoch": 2180} {"train_loss": -42.30317306518555, "global_step": 263884, "epoch": 2180} {"train_loss": -42.943511962890625, "global_step": 263885, "epoch": 2180} {"train_loss": -42.53156661987305, "global_step": 263886, "epoch": 2180} {"train_loss": -42.482460021972656, "global_step": 263887, "epoch": 2180} {"train_loss": -41.856178283691406, "global_step": 263888, "epoch": 2180} {"train_loss": -42.997718811035156, "global_step": 263889, "epoch": 2180} {"train_loss": -42.35686111450195, "global_step": 263890, "epoch": 2180} {"train_loss": -42.89226531982422, "global_step": 263891, "epoch": 2180} {"train_loss": -42.7364387512207, "global_step": 263892, "epoch": 2180} {"train_loss": -43.25428771972656, "global_step": 263893, "epoch": 2180} {"train_loss": -42.398311614990234, "global_step": 263894, "epoch": 2180} {"train_loss": -43.20387649536133, "global_step": 263895, "epoch": 2180} {"train_loss": -42.36930465698242, "global_step": 263896, "epoch": 2180} {"train_loss": -43.134273529052734, "global_step": 263897, "epoch": 2180} {"train_loss": -42.8902587890625, "global_step": 263898, "epoch": 2180} {"train_loss": -42.62109375, "global_step": 263899, "epoch": 2180} {"train_loss": -41.73852690389334, "global_step": 263900, "epoch": 2180, "val_loss": 2626056.75} {"train_loss": -42.172847747802734, "global_step": 263901, "epoch": 2181} {"train_loss": -43.16191864013672, "global_step": 263902, "epoch": 2181} {"train_loss": -42.794925689697266, "global_step": 263903, "epoch": 2181} {"train_loss": -43.47632598876953, "global_step": 263904, "epoch": 2181} {"train_loss": -42.241111755371094, "global_step": 263905, "epoch": 2181} {"train_loss": -43.465816497802734, "global_step": 263906, "epoch": 2181} {"train_loss": -42.514896392822266, "global_step": 263907, "epoch": 2181} {"train_loss": -43.41630935668945, "global_step": 263908, "epoch": 2181} {"train_loss": -42.8647346496582, "global_step": 263909, "epoch": 2181} {"train_loss": -43.43583297729492, "global_step": 263910, "epoch": 2181} {"train_loss": -42.769508361816406, "global_step": 263911, "epoch": 2181} {"train_loss": -43.728355407714844, "global_step": 263912, "epoch": 2181} {"train_loss": -42.549163818359375, "global_step": 263913, "epoch": 2181} {"train_loss": -43.06964111328125, "global_step": 263914, "epoch": 2181} {"train_loss": -42.32247543334961, "global_step": 263915, "epoch": 2181} {"train_loss": -43.32221221923828, "global_step": 263916, "epoch": 2181} {"train_loss": -41.41477584838867, "global_step": 263917, "epoch": 2181} {"train_loss": -43.51753234863281, "global_step": 263918, "epoch": 2181} {"train_loss": -42.188148498535156, "global_step": 263919, "epoch": 2181} {"train_loss": -43.38933181762695, "global_step": 263920, "epoch": 2181} {"train_loss": -42.03006362915039, "global_step": 263921, "epoch": 2181} {"train_loss": -43.28607177734375, "global_step": 263922, "epoch": 2181} {"train_loss": -42.577579498291016, "global_step": 263923, "epoch": 2181} {"train_loss": -42.6639404296875, "global_step": 263924, "epoch": 2181} {"train_loss": -42.556636810302734, "global_step": 263925, "epoch": 2181} {"train_loss": -43.00742721557617, "global_step": 263926, "epoch": 2181} {"train_loss": -42.75602340698242, "global_step": 263927, "epoch": 2181} {"train_loss": -42.90151596069336, "global_step": 263928, "epoch": 2181} {"train_loss": -42.78739547729492, "global_step": 263929, "epoch": 2181} {"train_loss": -42.88916778564453, "global_step": 263930, "epoch": 2181} {"train_loss": -42.34151077270508, "global_step": 263931, "epoch": 2181} {"train_loss": -43.40047073364258, "global_step": 263932, "epoch": 2181} {"train_loss": -43.7578010559082, "global_step": 263933, "epoch": 2181} {"train_loss": -43.4102783203125, "global_step": 263934, "epoch": 2181} {"train_loss": -42.817901611328125, "global_step": 263935, "epoch": 2181} {"train_loss": -42.75804901123047, "global_step": 263936, "epoch": 2181} {"train_loss": -42.930931091308594, "global_step": 263937, "epoch": 2181} {"train_loss": -43.381141662597656, "global_step": 263938, "epoch": 2181} {"train_loss": -42.8740348815918, "global_step": 263939, "epoch": 2181} {"train_loss": -42.16353988647461, "global_step": 263940, "epoch": 2181} {"train_loss": -41.76188659667969, "global_step": 263941, "epoch": 2181} {"train_loss": -41.39948654174805, "global_step": 263942, "epoch": 2181} {"train_loss": -41.5206413269043, "global_step": 263943, "epoch": 2181} {"train_loss": -42.33970260620117, "global_step": 263944, "epoch": 2181} {"train_loss": -42.761592864990234, "global_step": 263945, "epoch": 2181} {"train_loss": -42.00165557861328, "global_step": 263946, "epoch": 2181} {"train_loss": -42.598854064941406, "global_step": 263947, "epoch": 2181} {"train_loss": -43.08830642700195, "global_step": 263948, "epoch": 2181} {"train_loss": -43.0215950012207, "global_step": 263949, "epoch": 2181} {"train_loss": -42.91770553588867, "global_step": 263950, "epoch": 2181} {"train_loss": -43.450496673583984, "global_step": 263951, "epoch": 2181} {"train_loss": -43.5673713684082, "global_step": 263952, "epoch": 2181} {"train_loss": -42.950660705566406, "global_step": 263953, "epoch": 2181} {"train_loss": -43.020538330078125, "global_step": 263954, "epoch": 2181} {"train_loss": -43.73262405395508, "global_step": 263955, "epoch": 2181} {"train_loss": -42.9388313293457, "global_step": 263956, "epoch": 2181} {"train_loss": -43.4609260559082, "global_step": 263957, "epoch": 2181} {"train_loss": -43.62761306762695, "global_step": 263958, "epoch": 2181} {"train_loss": -43.059513092041016, "global_step": 263959, "epoch": 2181} {"train_loss": -43.146976470947266, "global_step": 263960, "epoch": 2181} {"train_loss": -42.42670822143555, "global_step": 263961, "epoch": 2181} {"train_loss": -42.67589569091797, "global_step": 263962, "epoch": 2181} {"train_loss": -43.47956466674805, "global_step": 263963, "epoch": 2181} {"train_loss": -43.54411697387695, "global_step": 263964, "epoch": 2181} {"train_loss": -42.84872055053711, "global_step": 263965, "epoch": 2181} {"train_loss": -43.06059646606445, "global_step": 263966, "epoch": 2181} {"train_loss": -43.58598709106445, "global_step": 263967, "epoch": 2181} {"train_loss": -43.064002990722656, "global_step": 263968, "epoch": 2181} {"train_loss": -43.172203063964844, "global_step": 263969, "epoch": 2181} {"train_loss": -43.350189208984375, "global_step": 263970, "epoch": 2181} {"train_loss": -43.696163177490234, "global_step": 263971, "epoch": 2181} {"train_loss": -43.26179885864258, "global_step": 263972, "epoch": 2181} {"train_loss": -43.448970794677734, "global_step": 263973, "epoch": 2181} {"train_loss": -43.76570510864258, "global_step": 263974, "epoch": 2181} {"train_loss": -43.814815521240234, "global_step": 263975, "epoch": 2181} {"train_loss": -43.35496139526367, "global_step": 263976, "epoch": 2181} {"train_loss": -43.3895149230957, "global_step": 263977, "epoch": 2181} {"train_loss": -44.27687454223633, "global_step": 263978, "epoch": 2181} {"train_loss": -42.81022262573242, "global_step": 263979, "epoch": 2181} {"train_loss": -43.01844787597656, "global_step": 263980, "epoch": 2181} {"train_loss": -43.660888671875, "global_step": 263981, "epoch": 2181} {"train_loss": -43.15476608276367, "global_step": 263982, "epoch": 2181} {"train_loss": -42.187843322753906, "global_step": 263983, "epoch": 2181} {"train_loss": -43.55202865600586, "global_step": 263984, "epoch": 2181} {"train_loss": -42.82184600830078, "global_step": 263985, "epoch": 2181} {"train_loss": -42.38080596923828, "global_step": 263986, "epoch": 2181} {"train_loss": -42.49299240112305, "global_step": 263987, "epoch": 2181} {"train_loss": -43.50773239135742, "global_step": 263988, "epoch": 2181} {"train_loss": -43.83807373046875, "global_step": 263989, "epoch": 2181} {"train_loss": -42.84516906738281, "global_step": 263990, "epoch": 2181} {"train_loss": -43.60185623168945, "global_step": 263991, "epoch": 2181} {"train_loss": -43.896419525146484, "global_step": 263992, "epoch": 2181} {"train_loss": -42.66297912597656, "global_step": 263993, "epoch": 2181} {"train_loss": -43.357574462890625, "global_step": 263994, "epoch": 2181} {"train_loss": -44.19338607788086, "global_step": 263995, "epoch": 2181} {"train_loss": -42.31501007080078, "global_step": 263996, "epoch": 2181} {"train_loss": -40.528541564941406, "global_step": 263997, "epoch": 2181} {"train_loss": -42.827022552490234, "global_step": 263998, "epoch": 2181} {"train_loss": -42.49700927734375, "global_step": 263999, "epoch": 2181} {"train_loss": -40.65890121459961, "global_step": 264000, "epoch": 2181} {"train_loss": -43.39771270751953, "global_step": 264001, "epoch": 2181} {"train_loss": -41.606929779052734, "global_step": 264002, "epoch": 2181} {"train_loss": -39.42414474487305, "global_step": 264003, "epoch": 2181} {"train_loss": -39.17036056518555, "global_step": 264004, "epoch": 2181} {"train_loss": -42.68860626220703, "global_step": 264005, "epoch": 2181} {"train_loss": -42.30564880371094, "global_step": 264006, "epoch": 2181} {"train_loss": -42.73116683959961, "global_step": 264007, "epoch": 2181} {"train_loss": -41.04841995239258, "global_step": 264008, "epoch": 2181} {"train_loss": -41.295772552490234, "global_step": 264009, "epoch": 2181} {"train_loss": -42.510711669921875, "global_step": 264010, "epoch": 2181} {"train_loss": -42.30807113647461, "global_step": 264011, "epoch": 2181} {"train_loss": -42.004756927490234, "global_step": 264012, "epoch": 2181} {"train_loss": -42.0751953125, "global_step": 264013, "epoch": 2181} {"train_loss": -41.422119140625, "global_step": 264014, "epoch": 2181} {"train_loss": -42.6910285949707, "global_step": 264015, "epoch": 2181} {"train_loss": -42.28982162475586, "global_step": 264016, "epoch": 2181} {"train_loss": -43.52437973022461, "global_step": 264017, "epoch": 2181} {"train_loss": -42.28874588012695, "global_step": 264018, "epoch": 2181} {"train_loss": -42.59003829956055, "global_step": 264019, "epoch": 2181} {"train_loss": -43.19004440307617, "global_step": 264020, "epoch": 2181} {"train_loss": -42.788468857442055, "global_step": 264021, "epoch": 2181, "val_loss": 2571357.5} {"train_loss": -42.65228271484375, "global_step": 264022, "epoch": 2182} {"train_loss": -42.004215240478516, "global_step": 264023, "epoch": 2182} {"train_loss": -41.897682189941406, "global_step": 264024, "epoch": 2182} {"train_loss": -43.700103759765625, "global_step": 264025, "epoch": 2182} {"train_loss": -42.71287155151367, "global_step": 264026, "epoch": 2182} {"train_loss": -43.110572814941406, "global_step": 264027, "epoch": 2182} {"train_loss": -42.806922912597656, "global_step": 264028, "epoch": 2182} {"train_loss": -42.860347747802734, "global_step": 264029, "epoch": 2182} {"train_loss": -43.00126266479492, "global_step": 264030, "epoch": 2182} {"train_loss": -42.20689010620117, "global_step": 264031, "epoch": 2182} {"train_loss": -42.45500564575195, "global_step": 264032, "epoch": 2182} {"train_loss": -42.80902099609375, "global_step": 264033, "epoch": 2182} {"train_loss": -43.46937942504883, "global_step": 264034, "epoch": 2182} {"train_loss": -43.588924407958984, "global_step": 264035, "epoch": 2182} {"train_loss": -43.192047119140625, "global_step": 264036, "epoch": 2182} {"train_loss": -42.6766471862793, "global_step": 264037, "epoch": 2182} {"train_loss": -42.53672790527344, "global_step": 264038, "epoch": 2182} {"train_loss": -42.865230560302734, "global_step": 264039, "epoch": 2182} {"train_loss": -42.08864974975586, "global_step": 264040, "epoch": 2182} {"train_loss": -42.996429443359375, "global_step": 264041, "epoch": 2182} {"train_loss": -42.818397521972656, "global_step": 264042, "epoch": 2182} {"train_loss": -42.85535430908203, "global_step": 264043, "epoch": 2182} {"train_loss": -43.16548156738281, "global_step": 264044, "epoch": 2182} {"train_loss": -42.723419189453125, "global_step": 264045, "epoch": 2182} {"train_loss": -43.61787796020508, "global_step": 264046, "epoch": 2182} {"train_loss": -42.01012420654297, "global_step": 264047, "epoch": 2182} {"train_loss": -42.88185501098633, "global_step": 264048, "epoch": 2182} {"train_loss": -42.9654655456543, "global_step": 264049, "epoch": 2182} {"train_loss": -43.28335189819336, "global_step": 264050, "epoch": 2182} {"train_loss": -42.65822219848633, "global_step": 264051, "epoch": 2182} {"train_loss": -42.41929244995117, "global_step": 264052, "epoch": 2182} {"train_loss": -42.7122917175293, "global_step": 264053, "epoch": 2182} {"train_loss": -43.52628707885742, "global_step": 264054, "epoch": 2182} {"train_loss": -42.392486572265625, "global_step": 264055, "epoch": 2182} {"train_loss": -42.280513763427734, "global_step": 264056, "epoch": 2182} {"train_loss": -43.5335693359375, "global_step": 264057, "epoch": 2182} {"train_loss": -43.27666091918945, "global_step": 264058, "epoch": 2182} {"train_loss": -42.899471282958984, "global_step": 264059, "epoch": 2182} {"train_loss": -43.2689208984375, "global_step": 264060, "epoch": 2182} {"train_loss": -43.35453414916992, "global_step": 264061, "epoch": 2182} {"train_loss": -43.236610412597656, "global_step": 264062, "epoch": 2182} {"train_loss": -43.097755432128906, "global_step": 264063, "epoch": 2182} {"train_loss": -43.066627502441406, "global_step": 264064, "epoch": 2182} {"train_loss": -43.653892517089844, "global_step": 264065, "epoch": 2182} {"train_loss": -43.142189025878906, "global_step": 264066, "epoch": 2182} {"train_loss": -43.213497161865234, "global_step": 264067, "epoch": 2182} {"train_loss": -41.0625, "global_step": 264068, "epoch": 2182} {"train_loss": -39.99280548095703, "global_step": 264069, "epoch": 2182} {"train_loss": -42.213924407958984, "global_step": 264070, "epoch": 2182} {"train_loss": -42.9429817199707, "global_step": 264071, "epoch": 2182} {"train_loss": -40.866554260253906, "global_step": 264072, "epoch": 2182} {"train_loss": -43.2093505859375, "global_step": 264073, "epoch": 2182} {"train_loss": -42.313819885253906, "global_step": 264074, "epoch": 2182} {"train_loss": -40.49375534057617, "global_step": 264075, "epoch": 2182} {"train_loss": -43.06146240234375, "global_step": 264076, "epoch": 2182} {"train_loss": -43.14996337890625, "global_step": 264077, "epoch": 2182} {"train_loss": -41.73188018798828, "global_step": 264078, "epoch": 2182} {"train_loss": -42.37964630126953, "global_step": 264079, "epoch": 2182} {"train_loss": -43.80867385864258, "global_step": 264080, "epoch": 2182} {"train_loss": -43.04365539550781, "global_step": 264081, "epoch": 2182} {"train_loss": -42.67855453491211, "global_step": 264082, "epoch": 2182} {"train_loss": -43.627593994140625, "global_step": 264083, "epoch": 2182} {"train_loss": -42.721038818359375, "global_step": 264084, "epoch": 2182} {"train_loss": -42.28596496582031, "global_step": 264085, "epoch": 2182} {"train_loss": -43.179561614990234, "global_step": 264086, "epoch": 2182} {"train_loss": -43.660362243652344, "global_step": 264087, "epoch": 2182} {"train_loss": -43.26756286621094, "global_step": 264088, "epoch": 2182} {"train_loss": -43.6615104675293, "global_step": 264089, "epoch": 2182} {"train_loss": -43.64889907836914, "global_step": 264090, "epoch": 2182} {"train_loss": -43.33024215698242, "global_step": 264091, "epoch": 2182} {"train_loss": -43.69891357421875, "global_step": 264092, "epoch": 2182} {"train_loss": -43.980655670166016, "global_step": 264093, "epoch": 2182} {"train_loss": -43.02521514892578, "global_step": 264094, "epoch": 2182} {"train_loss": -43.704017639160156, "global_step": 264095, "epoch": 2182} {"train_loss": -43.48210906982422, "global_step": 264096, "epoch": 2182} {"train_loss": -43.2341423034668, "global_step": 264097, "epoch": 2182} {"train_loss": -43.669456481933594, "global_step": 264098, "epoch": 2182} {"train_loss": -43.43160629272461, "global_step": 264099, "epoch": 2182} {"train_loss": -43.762691497802734, "global_step": 264100, "epoch": 2182} {"train_loss": -43.06483840942383, "global_step": 264101, "epoch": 2182} {"train_loss": -42.46305465698242, "global_step": 264102, "epoch": 2182} {"train_loss": -42.40737533569336, "global_step": 264103, "epoch": 2182} {"train_loss": -43.38483810424805, "global_step": 264104, "epoch": 2182} {"train_loss": -43.82004928588867, "global_step": 264105, "epoch": 2182} {"train_loss": -43.57450485229492, "global_step": 264106, "epoch": 2182} {"train_loss": -43.08878707885742, "global_step": 264107, "epoch": 2182} {"train_loss": -43.237091064453125, "global_step": 264108, "epoch": 2182} {"train_loss": -43.785274505615234, "global_step": 264109, "epoch": 2182} {"train_loss": -43.65317916870117, "global_step": 264110, "epoch": 2182} {"train_loss": -43.953182220458984, "global_step": 264111, "epoch": 2182} {"train_loss": -44.06876754760742, "global_step": 264112, "epoch": 2182} {"train_loss": -44.016300201416016, "global_step": 264113, "epoch": 2182} {"train_loss": -44.16226577758789, "global_step": 264114, "epoch": 2182} {"train_loss": -43.90168380737305, "global_step": 264115, "epoch": 2182} {"train_loss": -43.63300704956055, "global_step": 264116, "epoch": 2182} {"train_loss": -43.13917922973633, "global_step": 264117, "epoch": 2182} {"train_loss": -43.98396682739258, "global_step": 264118, "epoch": 2182} {"train_loss": -44.1823844909668, "global_step": 264119, "epoch": 2182} {"train_loss": -43.63969039916992, "global_step": 264120, "epoch": 2182} {"train_loss": -44.1786003112793, "global_step": 264121, "epoch": 2182} {"train_loss": -44.03411865234375, "global_step": 264122, "epoch": 2182} {"train_loss": -43.4753532409668, "global_step": 264123, "epoch": 2182} {"train_loss": -43.18930435180664, "global_step": 264124, "epoch": 2182} {"train_loss": -43.25033187866211, "global_step": 264125, "epoch": 2182} {"train_loss": -43.632755279541016, "global_step": 264126, "epoch": 2182} {"train_loss": -44.18841552734375, "global_step": 264127, "epoch": 2182} {"train_loss": -43.18671798706055, "global_step": 264128, "epoch": 2182} {"train_loss": -43.16868209838867, "global_step": 264129, "epoch": 2182} {"train_loss": -42.36225509643555, "global_step": 264130, "epoch": 2182} {"train_loss": -43.66457748413086, "global_step": 264131, "epoch": 2182} {"train_loss": -43.133827209472656, "global_step": 264132, "epoch": 2182} {"train_loss": -42.19384002685547, "global_step": 264133, "epoch": 2182} {"train_loss": -42.621803283691406, "global_step": 264134, "epoch": 2182} {"train_loss": -43.29875946044922, "global_step": 264135, "epoch": 2182} {"train_loss": -42.444374084472656, "global_step": 264136, "epoch": 2182} {"train_loss": -42.14939498901367, "global_step": 264137, "epoch": 2182} {"train_loss": -43.236907958984375, "global_step": 264138, "epoch": 2182} {"train_loss": -43.20431900024414, "global_step": 264139, "epoch": 2182} {"train_loss": -43.027523040771484, "global_step": 264140, "epoch": 2182} {"train_loss": -42.99275588989258, "global_step": 264141, "epoch": 2182} {"train_loss": -43.04759396009209, "global_step": 264142, "epoch": 2182, "val_loss": 2622875.75} {"train_loss": -42.02297592163086, "global_step": 264143, "epoch": 2183} {"train_loss": -42.68632125854492, "global_step": 264144, "epoch": 2183} {"train_loss": -43.117122650146484, "global_step": 264145, "epoch": 2183} {"train_loss": -43.67855453491211, "global_step": 264146, "epoch": 2183} {"train_loss": -42.47004318237305, "global_step": 264147, "epoch": 2183} {"train_loss": -42.839927673339844, "global_step": 264148, "epoch": 2183} {"train_loss": -43.132991790771484, "global_step": 264149, "epoch": 2183} {"train_loss": -43.45016860961914, "global_step": 264150, "epoch": 2183} {"train_loss": -42.88386917114258, "global_step": 264151, "epoch": 2183} {"train_loss": -42.21234130859375, "global_step": 264152, "epoch": 2183} {"train_loss": -42.48651885986328, "global_step": 264153, "epoch": 2183} {"train_loss": -43.361629486083984, "global_step": 264154, "epoch": 2183} {"train_loss": -43.19784164428711, "global_step": 264155, "epoch": 2183} {"train_loss": -42.31536865234375, "global_step": 264156, "epoch": 2183} {"train_loss": -42.596961975097656, "global_step": 264157, "epoch": 2183} {"train_loss": -43.10055923461914, "global_step": 264158, "epoch": 2183} {"train_loss": -42.76142120361328, "global_step": 264159, "epoch": 2183} {"train_loss": -42.65822982788086, "global_step": 264160, "epoch": 2183} {"train_loss": -42.674530029296875, "global_step": 264161, "epoch": 2183} {"train_loss": -42.34824752807617, "global_step": 264162, "epoch": 2183} {"train_loss": -42.90080642700195, "global_step": 264163, "epoch": 2183} {"train_loss": -41.584869384765625, "global_step": 264164, "epoch": 2183} {"train_loss": -39.93183517456055, "global_step": 264165, "epoch": 2183} {"train_loss": -42.60550308227539, "global_step": 264166, "epoch": 2183} {"train_loss": -43.44832229614258, "global_step": 264167, "epoch": 2183} {"train_loss": -42.02714538574219, "global_step": 264168, "epoch": 2183} {"train_loss": -41.46826171875, "global_step": 264169, "epoch": 2183} {"train_loss": -42.78825378417969, "global_step": 264170, "epoch": 2183} {"train_loss": -42.92259979248047, "global_step": 264171, "epoch": 2183} {"train_loss": -42.72834396362305, "global_step": 264172, "epoch": 2183} {"train_loss": -42.830322265625, "global_step": 264173, "epoch": 2183} {"train_loss": -43.70650863647461, "global_step": 264174, "epoch": 2183} {"train_loss": -42.411903381347656, "global_step": 264175, "epoch": 2183} {"train_loss": -41.88271713256836, "global_step": 264176, "epoch": 2183} {"train_loss": -43.13167953491211, "global_step": 264177, "epoch": 2183} {"train_loss": -40.514320373535156, "global_step": 264178, "epoch": 2183} {"train_loss": -42.84535598754883, "global_step": 264179, "epoch": 2183} {"train_loss": -42.33771514892578, "global_step": 264180, "epoch": 2183} {"train_loss": -42.51809310913086, "global_step": 264181, "epoch": 2183} {"train_loss": -42.76214599609375, "global_step": 264182, "epoch": 2183} {"train_loss": -42.078826904296875, "global_step": 264183, "epoch": 2183} {"train_loss": -42.6853141784668, "global_step": 264184, "epoch": 2183} {"train_loss": -42.54094314575195, "global_step": 264185, "epoch": 2183} {"train_loss": -41.7428092956543, "global_step": 264186, "epoch": 2183} {"train_loss": -43.19791793823242, "global_step": 264187, "epoch": 2183} {"train_loss": -43.06682205200195, "global_step": 264188, "epoch": 2183} {"train_loss": -42.42678451538086, "global_step": 264189, "epoch": 2183} {"train_loss": -43.65976333618164, "global_step": 264190, "epoch": 2183} {"train_loss": -43.40901565551758, "global_step": 264191, "epoch": 2183} {"train_loss": -42.79042434692383, "global_step": 264192, "epoch": 2183} {"train_loss": -41.95722579956055, "global_step": 264193, "epoch": 2183} {"train_loss": -39.87602615356445, "global_step": 264194, "epoch": 2183} {"train_loss": -42.208927154541016, "global_step": 264195, "epoch": 2183} {"train_loss": -43.16240310668945, "global_step": 264196, "epoch": 2183} {"train_loss": -43.486663818359375, "global_step": 264197, "epoch": 2183} {"train_loss": -43.2926025390625, "global_step": 264198, "epoch": 2183} {"train_loss": -42.72674560546875, "global_step": 264199, "epoch": 2183} {"train_loss": -43.53849792480469, "global_step": 264200, "epoch": 2183} {"train_loss": -43.77281188964844, "global_step": 264201, "epoch": 2183} {"train_loss": -43.08485794067383, "global_step": 264202, "epoch": 2183} {"train_loss": -43.30070114135742, "global_step": 264203, "epoch": 2183} {"train_loss": -43.432289123535156, "global_step": 264204, "epoch": 2183} {"train_loss": -43.576114654541016, "global_step": 264205, "epoch": 2183} {"train_loss": -43.370967864990234, "global_step": 264206, "epoch": 2183} {"train_loss": -43.01594924926758, "global_step": 264207, "epoch": 2183} {"train_loss": -43.74050521850586, "global_step": 264208, "epoch": 2183} {"train_loss": -43.8961296081543, "global_step": 264209, "epoch": 2183} {"train_loss": -43.84981918334961, "global_step": 264210, "epoch": 2183} {"train_loss": -43.908203125, "global_step": 264211, "epoch": 2183} {"train_loss": -43.338958740234375, "global_step": 264212, "epoch": 2183} {"train_loss": -44.193023681640625, "global_step": 264213, "epoch": 2183} {"train_loss": -43.57790756225586, "global_step": 264214, "epoch": 2183} {"train_loss": -43.11910629272461, "global_step": 264215, "epoch": 2183} {"train_loss": -43.780643463134766, "global_step": 264216, "epoch": 2183} {"train_loss": -43.6839714050293, "global_step": 264217, "epoch": 2183} {"train_loss": -43.11878967285156, "global_step": 264218, "epoch": 2183} {"train_loss": -43.47330856323242, "global_step": 264219, "epoch": 2183} {"train_loss": -42.535396575927734, "global_step": 264220, "epoch": 2183} {"train_loss": -42.15206527709961, "global_step": 264221, "epoch": 2183} {"train_loss": -42.97582244873047, "global_step": 264222, "epoch": 2183} {"train_loss": -43.5998649597168, "global_step": 264223, "epoch": 2183} {"train_loss": -42.11139678955078, "global_step": 264224, "epoch": 2183} {"train_loss": -42.14358901977539, "global_step": 264225, "epoch": 2183} {"train_loss": -41.90875244140625, "global_step": 264226, "epoch": 2183} {"train_loss": -42.46872329711914, "global_step": 264227, "epoch": 2183} {"train_loss": -42.73686218261719, "global_step": 264228, "epoch": 2183} {"train_loss": -43.397186279296875, "global_step": 264229, "epoch": 2183} {"train_loss": -42.78032302856445, "global_step": 264230, "epoch": 2183} {"train_loss": -42.60935592651367, "global_step": 264231, "epoch": 2183} {"train_loss": -41.40836715698242, "global_step": 264232, "epoch": 2183} {"train_loss": -42.47147750854492, "global_step": 264233, "epoch": 2183} {"train_loss": -43.233375549316406, "global_step": 264234, "epoch": 2183} {"train_loss": -41.72404861450195, "global_step": 264235, "epoch": 2183} {"train_loss": -41.87659454345703, "global_step": 264236, "epoch": 2183} {"train_loss": -41.43645095825195, "global_step": 264237, "epoch": 2183} {"train_loss": -42.12699890136719, "global_step": 264238, "epoch": 2183} {"train_loss": -42.66971969604492, "global_step": 264239, "epoch": 2183} {"train_loss": -41.6076774597168, "global_step": 264240, "epoch": 2183} {"train_loss": -41.974761962890625, "global_step": 264241, "epoch": 2183} {"train_loss": -41.85513687133789, "global_step": 264242, "epoch": 2183} {"train_loss": -42.33794021606445, "global_step": 264243, "epoch": 2183} {"train_loss": -42.739356994628906, "global_step": 264244, "epoch": 2183} {"train_loss": -42.16396713256836, "global_step": 264245, "epoch": 2183} {"train_loss": -42.98017501831055, "global_step": 264246, "epoch": 2183} {"train_loss": -41.028202056884766, "global_step": 264247, "epoch": 2183} {"train_loss": -42.47816848754883, "global_step": 264248, "epoch": 2183} {"train_loss": -42.31026840209961, "global_step": 264249, "epoch": 2183} {"train_loss": -41.60892868041992, "global_step": 264250, "epoch": 2183} {"train_loss": -42.61079406738281, "global_step": 264251, "epoch": 2183} {"train_loss": -42.626338958740234, "global_step": 264252, "epoch": 2183} {"train_loss": -41.674102783203125, "global_step": 264253, "epoch": 2183} {"train_loss": -42.72173309326172, "global_step": 264254, "epoch": 2183} {"train_loss": -42.94759750366211, "global_step": 264255, "epoch": 2183} {"train_loss": -42.3269157409668, "global_step": 264256, "epoch": 2183} {"train_loss": -42.21955490112305, "global_step": 264257, "epoch": 2183} {"train_loss": -43.372962951660156, "global_step": 264258, "epoch": 2183} {"train_loss": -42.5080680847168, "global_step": 264259, "epoch": 2183} {"train_loss": -43.173099517822266, "global_step": 264260, "epoch": 2183} {"train_loss": -42.46771240234375, "global_step": 264261, "epoch": 2183} {"train_loss": -43.08306884765625, "global_step": 264262, "epoch": 2183} {"train_loss": -42.684748405267385, "global_step": 264263, "epoch": 2183, "val_loss": 2679181.5} {"train_loss": -42.8153190612793, "global_step": 264264, "epoch": 2184} {"train_loss": -42.989315032958984, "global_step": 264265, "epoch": 2184} {"train_loss": -43.193355560302734, "global_step": 264266, "epoch": 2184} {"train_loss": -41.95199966430664, "global_step": 264267, "epoch": 2184} {"train_loss": -43.08366012573242, "global_step": 264268, "epoch": 2184} {"train_loss": -42.355751037597656, "global_step": 264269, "epoch": 2184} {"train_loss": -43.145137786865234, "global_step": 264270, "epoch": 2184} {"train_loss": -43.04384231567383, "global_step": 264271, "epoch": 2184} {"train_loss": -42.989078521728516, "global_step": 264272, "epoch": 2184} {"train_loss": -43.51583480834961, "global_step": 264273, "epoch": 2184} {"train_loss": -43.4654655456543, "global_step": 264274, "epoch": 2184} {"train_loss": -42.41587448120117, "global_step": 264275, "epoch": 2184} {"train_loss": -41.59145736694336, "global_step": 264276, "epoch": 2184} {"train_loss": -41.73365783691406, "global_step": 264277, "epoch": 2184} {"train_loss": -43.3531494140625, "global_step": 264278, "epoch": 2184} {"train_loss": -43.5431022644043, "global_step": 264279, "epoch": 2184} {"train_loss": -42.76597595214844, "global_step": 264280, "epoch": 2184} {"train_loss": -43.187374114990234, "global_step": 264281, "epoch": 2184} {"train_loss": -43.319969177246094, "global_step": 264282, "epoch": 2184} {"train_loss": -42.91975021362305, "global_step": 264283, "epoch": 2184} {"train_loss": -43.89753341674805, "global_step": 264284, "epoch": 2184} {"train_loss": -43.677852630615234, "global_step": 264285, "epoch": 2184} {"train_loss": -43.283199310302734, "global_step": 264286, "epoch": 2184} {"train_loss": -44.142906188964844, "global_step": 264287, "epoch": 2184} {"train_loss": -43.77340316772461, "global_step": 264288, "epoch": 2184} {"train_loss": -43.635475158691406, "global_step": 264289, "epoch": 2184} {"train_loss": -43.264522552490234, "global_step": 264290, "epoch": 2184} {"train_loss": -43.410457611083984, "global_step": 264291, "epoch": 2184} {"train_loss": -42.5827751159668, "global_step": 264292, "epoch": 2184} {"train_loss": -41.1779899597168, "global_step": 264293, "epoch": 2184} {"train_loss": -40.72321701049805, "global_step": 264294, "epoch": 2184} {"train_loss": -43.1209831237793, "global_step": 264295, "epoch": 2184} {"train_loss": -43.621826171875, "global_step": 264296, "epoch": 2184} {"train_loss": -42.199005126953125, "global_step": 264297, "epoch": 2184} {"train_loss": -42.67426300048828, "global_step": 264298, "epoch": 2184} {"train_loss": -43.19597625732422, "global_step": 264299, "epoch": 2184} {"train_loss": -43.926578521728516, "global_step": 264300, "epoch": 2184} {"train_loss": -43.856483459472656, "global_step": 264301, "epoch": 2184} {"train_loss": -42.62910842895508, "global_step": 264302, "epoch": 2184} {"train_loss": -42.709957122802734, "global_step": 264303, "epoch": 2184} {"train_loss": -43.5320930480957, "global_step": 264304, "epoch": 2184} {"train_loss": -44.0731086730957, "global_step": 264305, "epoch": 2184} {"train_loss": -43.38124465942383, "global_step": 264306, "epoch": 2184} {"train_loss": -43.09901809692383, "global_step": 264307, "epoch": 2184} {"train_loss": -42.25069046020508, "global_step": 264308, "epoch": 2184} {"train_loss": -42.83079147338867, "global_step": 264309, "epoch": 2184} {"train_loss": -43.75295639038086, "global_step": 264310, "epoch": 2184} {"train_loss": -41.905975341796875, "global_step": 264311, "epoch": 2184} {"train_loss": -42.68561553955078, "global_step": 264312, "epoch": 2184} {"train_loss": -43.615291595458984, "global_step": 264313, "epoch": 2184} {"train_loss": -43.46616744995117, "global_step": 264314, "epoch": 2184} {"train_loss": -43.18304443359375, "global_step": 264315, "epoch": 2184} {"train_loss": -42.790794372558594, "global_step": 264316, "epoch": 2184} {"train_loss": -43.53793716430664, "global_step": 264317, "epoch": 2184} {"train_loss": -44.40932846069336, "global_step": 264318, "epoch": 2184} {"train_loss": -42.900604248046875, "global_step": 264319, "epoch": 2184} {"train_loss": -43.47444534301758, "global_step": 264320, "epoch": 2184} {"train_loss": -43.940338134765625, "global_step": 264321, "epoch": 2184} {"train_loss": -44.03243637084961, "global_step": 264322, "epoch": 2184} {"train_loss": -44.22951889038086, "global_step": 264323, "epoch": 2184} {"train_loss": -43.856239318847656, "global_step": 264324, "epoch": 2184} {"train_loss": -43.884986877441406, "global_step": 264325, "epoch": 2184} {"train_loss": -44.27564239501953, "global_step": 264326, "epoch": 2184} {"train_loss": -43.76676559448242, "global_step": 264327, "epoch": 2184} {"train_loss": -44.38609313964844, "global_step": 264328, "epoch": 2184} {"train_loss": -44.2049446105957, "global_step": 264329, "epoch": 2184} {"train_loss": -43.231754302978516, "global_step": 264330, "epoch": 2184} {"train_loss": -44.29343032836914, "global_step": 264331, "epoch": 2184} {"train_loss": -43.29292297363281, "global_step": 264332, "epoch": 2184} {"train_loss": -44.353492736816406, "global_step": 264333, "epoch": 2184} {"train_loss": -44.17744064331055, "global_step": 264334, "epoch": 2184} {"train_loss": -43.74201202392578, "global_step": 264335, "epoch": 2184} {"train_loss": -44.084842681884766, "global_step": 264336, "epoch": 2184} {"train_loss": -43.090484619140625, "global_step": 264337, "epoch": 2184} {"train_loss": -43.519813537597656, "global_step": 264338, "epoch": 2184} {"train_loss": -42.97333908081055, "global_step": 264339, "epoch": 2184} {"train_loss": -42.59775924682617, "global_step": 264340, "epoch": 2184} {"train_loss": -42.885318756103516, "global_step": 264341, "epoch": 2184} {"train_loss": -43.99662780761719, "global_step": 264342, "epoch": 2184} {"train_loss": -42.7856330871582, "global_step": 264343, "epoch": 2184} {"train_loss": -43.89997482299805, "global_step": 264344, "epoch": 2184} {"train_loss": -43.10577392578125, "global_step": 264345, "epoch": 2184} {"train_loss": -43.371055603027344, "global_step": 264346, "epoch": 2184} {"train_loss": -43.86813735961914, "global_step": 264347, "epoch": 2184} {"train_loss": -43.96238708496094, "global_step": 264348, "epoch": 2184} {"train_loss": -43.3902702331543, "global_step": 264349, "epoch": 2184} {"train_loss": -42.8593864440918, "global_step": 264350, "epoch": 2184} {"train_loss": -42.74622344970703, "global_step": 264351, "epoch": 2184} {"train_loss": -43.059112548828125, "global_step": 264352, "epoch": 2184} {"train_loss": -42.72739791870117, "global_step": 264353, "epoch": 2184} {"train_loss": -41.86125564575195, "global_step": 264354, "epoch": 2184} {"train_loss": -40.08088302612305, "global_step": 264355, "epoch": 2184} {"train_loss": -35.426876068115234, "global_step": 264356, "epoch": 2184} {"train_loss": -39.793907165527344, "global_step": 264357, "epoch": 2184} {"train_loss": -41.304813385009766, "global_step": 264358, "epoch": 2184} {"train_loss": -41.982276916503906, "global_step": 264359, "epoch": 2184} {"train_loss": -40.104248046875, "global_step": 264360, "epoch": 2184} {"train_loss": -41.54691696166992, "global_step": 264361, "epoch": 2184} {"train_loss": -41.923152923583984, "global_step": 264362, "epoch": 2184} {"train_loss": -41.22005081176758, "global_step": 264363, "epoch": 2184} {"train_loss": -40.47300338745117, "global_step": 264364, "epoch": 2184} {"train_loss": -42.194801330566406, "global_step": 264365, "epoch": 2184} {"train_loss": -42.4796257019043, "global_step": 264366, "epoch": 2184} {"train_loss": -42.533042907714844, "global_step": 264367, "epoch": 2184} {"train_loss": -42.008201599121094, "global_step": 264368, "epoch": 2184} {"train_loss": -43.39548110961914, "global_step": 264369, "epoch": 2184} {"train_loss": -42.89273452758789, "global_step": 264370, "epoch": 2184} {"train_loss": -42.46405029296875, "global_step": 264371, "epoch": 2184} {"train_loss": -42.23971176147461, "global_step": 264372, "epoch": 2184} {"train_loss": -42.74763107299805, "global_step": 264373, "epoch": 2184} {"train_loss": -40.456336975097656, "global_step": 264374, "epoch": 2184} {"train_loss": -42.169677734375, "global_step": 264375, "epoch": 2184} {"train_loss": -42.220638275146484, "global_step": 264376, "epoch": 2184} {"train_loss": -39.24728012084961, "global_step": 264377, "epoch": 2184} {"train_loss": -43.104278564453125, "global_step": 264378, "epoch": 2184} {"train_loss": -42.51798629760742, "global_step": 264379, "epoch": 2184} {"train_loss": -42.632301330566406, "global_step": 264380, "epoch": 2184} {"train_loss": -42.912899017333984, "global_step": 264381, "epoch": 2184} {"train_loss": -43.065406799316406, "global_step": 264382, "epoch": 2184} {"train_loss": -41.71713638305664, "global_step": 264383, "epoch": 2184} {"train_loss": -42.834246517212925, "global_step": 264384, "epoch": 2184, "val_loss": 2621196.0} {"train_loss": -41.738853454589844, "global_step": 264385, "epoch": 2185} {"train_loss": -42.20209884643555, "global_step": 264386, "epoch": 2185} {"train_loss": -39.87837600708008, "global_step": 264387, "epoch": 2185} {"train_loss": -42.86714553833008, "global_step": 264388, "epoch": 2185} {"train_loss": -42.3436393737793, "global_step": 264389, "epoch": 2185} {"train_loss": -41.47107696533203, "global_step": 264390, "epoch": 2185} {"train_loss": -43.07170867919922, "global_step": 264391, "epoch": 2185} {"train_loss": -42.65135192871094, "global_step": 264392, "epoch": 2185} {"train_loss": -42.1212043762207, "global_step": 264393, "epoch": 2185} {"train_loss": -43.22262191772461, "global_step": 264394, "epoch": 2185} {"train_loss": -42.84675979614258, "global_step": 264395, "epoch": 2185} {"train_loss": -43.16071701049805, "global_step": 264396, "epoch": 2185} {"train_loss": -42.501304626464844, "global_step": 264397, "epoch": 2185} {"train_loss": -42.90399169921875, "global_step": 264398, "epoch": 2185} {"train_loss": -38.12908935546875, "global_step": 264399, "epoch": 2185} {"train_loss": -41.756446838378906, "global_step": 264400, "epoch": 2185} {"train_loss": -43.52370834350586, "global_step": 264401, "epoch": 2185} {"train_loss": -42.341182708740234, "global_step": 264402, "epoch": 2185} {"train_loss": -38.816558837890625, "global_step": 264403, "epoch": 2185} {"train_loss": -42.32632827758789, "global_step": 264404, "epoch": 2185} {"train_loss": -43.03325271606445, "global_step": 264405, "epoch": 2185} {"train_loss": -43.01387023925781, "global_step": 264406, "epoch": 2185} {"train_loss": -42.23666000366211, "global_step": 264407, "epoch": 2185} {"train_loss": -43.67765426635742, "global_step": 264408, "epoch": 2185} {"train_loss": -42.57285690307617, "global_step": 264409, "epoch": 2185} {"train_loss": -41.1710090637207, "global_step": 264410, "epoch": 2185} {"train_loss": -41.274051666259766, "global_step": 264411, "epoch": 2185} {"train_loss": -40.70872116088867, "global_step": 264412, "epoch": 2185} {"train_loss": -41.44321823120117, "global_step": 264413, "epoch": 2185} {"train_loss": -42.54814147949219, "global_step": 264414, "epoch": 2185} {"train_loss": -40.61172103881836, "global_step": 264415, "epoch": 2185} {"train_loss": -41.574520111083984, "global_step": 264416, "epoch": 2185} {"train_loss": -42.24497604370117, "global_step": 264417, "epoch": 2185} {"train_loss": -40.945533752441406, "global_step": 264418, "epoch": 2185} {"train_loss": -40.91610336303711, "global_step": 264419, "epoch": 2185} {"train_loss": -42.611934661865234, "global_step": 264420, "epoch": 2185} {"train_loss": -42.28054428100586, "global_step": 264421, "epoch": 2185} {"train_loss": -40.47694778442383, "global_step": 264422, "epoch": 2185} {"train_loss": -42.697933197021484, "global_step": 264423, "epoch": 2185} {"train_loss": -43.331329345703125, "global_step": 264424, "epoch": 2185} {"train_loss": -41.60691452026367, "global_step": 264425, "epoch": 2185} {"train_loss": -42.67164993286133, "global_step": 264426, "epoch": 2185} {"train_loss": -41.88214874267578, "global_step": 264427, "epoch": 2185} {"train_loss": -42.17258834838867, "global_step": 264428, "epoch": 2185} {"train_loss": -42.8553581237793, "global_step": 264429, "epoch": 2185} {"train_loss": -42.72590255737305, "global_step": 264430, "epoch": 2185} {"train_loss": -41.27739715576172, "global_step": 264431, "epoch": 2185} {"train_loss": -42.53921127319336, "global_step": 264432, "epoch": 2185} {"train_loss": -43.30862045288086, "global_step": 264433, "epoch": 2185} {"train_loss": -43.380950927734375, "global_step": 264434, "epoch": 2185} {"train_loss": -42.52141189575195, "global_step": 264435, "epoch": 2185} {"train_loss": -42.53676223754883, "global_step": 264436, "epoch": 2185} {"train_loss": -43.08213424682617, "global_step": 264437, "epoch": 2185} {"train_loss": -42.878273010253906, "global_step": 264438, "epoch": 2185} {"train_loss": -42.81769943237305, "global_step": 264439, "epoch": 2185} {"train_loss": -43.404541015625, "global_step": 264440, "epoch": 2185} {"train_loss": -41.17660140991211, "global_step": 264441, "epoch": 2185} {"train_loss": -43.032691955566406, "global_step": 264442, "epoch": 2185} {"train_loss": -43.494171142578125, "global_step": 264443, "epoch": 2185} {"train_loss": -43.07258987426758, "global_step": 264444, "epoch": 2185} {"train_loss": -42.45186996459961, "global_step": 264445, "epoch": 2185} {"train_loss": -43.56370544433594, "global_step": 264446, "epoch": 2185} {"train_loss": -42.150665283203125, "global_step": 264447, "epoch": 2185} {"train_loss": -42.99114990234375, "global_step": 264448, "epoch": 2185} {"train_loss": -43.72159957885742, "global_step": 264449, "epoch": 2185} {"train_loss": -43.15800094604492, "global_step": 264450, "epoch": 2185} {"train_loss": -42.692012786865234, "global_step": 264451, "epoch": 2185} {"train_loss": -43.69826889038086, "global_step": 264452, "epoch": 2185} {"train_loss": -42.64543533325195, "global_step": 264453, "epoch": 2185} {"train_loss": -43.114295959472656, "global_step": 264454, "epoch": 2185} {"train_loss": -42.82719802856445, "global_step": 264455, "epoch": 2185} {"train_loss": -43.41572952270508, "global_step": 264456, "epoch": 2185} {"train_loss": -43.911922454833984, "global_step": 264457, "epoch": 2185} {"train_loss": -42.062252044677734, "global_step": 264458, "epoch": 2185} {"train_loss": -42.70294952392578, "global_step": 264459, "epoch": 2185} {"train_loss": -43.242671966552734, "global_step": 264460, "epoch": 2185} {"train_loss": -43.829193115234375, "global_step": 264461, "epoch": 2185} {"train_loss": -43.111000061035156, "global_step": 264462, "epoch": 2185} {"train_loss": -42.2169303894043, "global_step": 264463, "epoch": 2185} {"train_loss": -43.913692474365234, "global_step": 264464, "epoch": 2185} {"train_loss": -43.949745178222656, "global_step": 264465, "epoch": 2185} {"train_loss": -43.52863693237305, "global_step": 264466, "epoch": 2185} {"train_loss": -42.74168014526367, "global_step": 264467, "epoch": 2185} {"train_loss": -43.94165802001953, "global_step": 264468, "epoch": 2185} {"train_loss": -43.57278060913086, "global_step": 264469, "epoch": 2185} {"train_loss": -43.36714172363281, "global_step": 264470, "epoch": 2185} {"train_loss": -42.5513916015625, "global_step": 264471, "epoch": 2185} {"train_loss": -43.00220489501953, "global_step": 264472, "epoch": 2185} {"train_loss": -43.737361907958984, "global_step": 264473, "epoch": 2185} {"train_loss": -43.961883544921875, "global_step": 264474, "epoch": 2185} {"train_loss": -43.25801467895508, "global_step": 264475, "epoch": 2185} {"train_loss": -42.784915924072266, "global_step": 264476, "epoch": 2185} {"train_loss": -42.57837677001953, "global_step": 264477, "epoch": 2185} {"train_loss": -43.00136947631836, "global_step": 264478, "epoch": 2185} {"train_loss": -43.50119400024414, "global_step": 264479, "epoch": 2185} {"train_loss": -43.43186569213867, "global_step": 264480, "epoch": 2185} {"train_loss": -42.62479782104492, "global_step": 264481, "epoch": 2185} {"train_loss": -42.977943420410156, "global_step": 264482, "epoch": 2185} {"train_loss": -43.594600677490234, "global_step": 264483, "epoch": 2185} {"train_loss": -42.18171310424805, "global_step": 264484, "epoch": 2185} {"train_loss": -42.91439437866211, "global_step": 264485, "epoch": 2185} {"train_loss": -42.61445999145508, "global_step": 264486, "epoch": 2185} {"train_loss": -42.74921417236328, "global_step": 264487, "epoch": 2185} {"train_loss": -43.125831604003906, "global_step": 264488, "epoch": 2185} {"train_loss": -41.6982421875, "global_step": 264489, "epoch": 2185} {"train_loss": -43.49794006347656, "global_step": 264490, "epoch": 2185} {"train_loss": -44.004241943359375, "global_step": 264491, "epoch": 2185} {"train_loss": -43.1060905456543, "global_step": 264492, "epoch": 2185} {"train_loss": -42.590362548828125, "global_step": 264493, "epoch": 2185} {"train_loss": -43.885013580322266, "global_step": 264494, "epoch": 2185} {"train_loss": -42.83078384399414, "global_step": 264495, "epoch": 2185} {"train_loss": -41.21757888793945, "global_step": 264496, "epoch": 2185} {"train_loss": -40.23423385620117, "global_step": 264497, "epoch": 2185} {"train_loss": -42.429107666015625, "global_step": 264498, "epoch": 2185} {"train_loss": -42.824920654296875, "global_step": 264499, "epoch": 2185} {"train_loss": -39.232173919677734, "global_step": 264500, "epoch": 2185} {"train_loss": -41.90406036376953, "global_step": 264501, "epoch": 2185} {"train_loss": -41.022029876708984, "global_step": 264502, "epoch": 2185} {"train_loss": -37.646392822265625, "global_step": 264503, "epoch": 2185} {"train_loss": -39.73818588256836, "global_step": 264504, "epoch": 2185} {"train_loss": -42.44834464837697, "global_step": 264505, "epoch": 2185, "val_loss": 2570659.25} {"train_loss": -37.62439727783203, "global_step": 264506, "epoch": 2186} {"train_loss": -36.13512420654297, "global_step": 264507, "epoch": 2186} {"train_loss": -36.793331146240234, "global_step": 264508, "epoch": 2186} {"train_loss": -35.48371505737305, "global_step": 264509, "epoch": 2186} {"train_loss": -36.91331100463867, "global_step": 264510, "epoch": 2186} {"train_loss": -38.50666427612305, "global_step": 264511, "epoch": 2186} {"train_loss": -37.112213134765625, "global_step": 264512, "epoch": 2186} {"train_loss": -38.32734680175781, "global_step": 264513, "epoch": 2186} {"train_loss": -38.052215576171875, "global_step": 264514, "epoch": 2186} {"train_loss": -39.189876556396484, "global_step": 264515, "epoch": 2186} {"train_loss": -40.50081253051758, "global_step": 264516, "epoch": 2186} {"train_loss": -39.89460372924805, "global_step": 264517, "epoch": 2186} {"train_loss": -39.78866195678711, "global_step": 264518, "epoch": 2186} {"train_loss": -39.872127532958984, "global_step": 264519, "epoch": 2186} {"train_loss": -39.270198822021484, "global_step": 264520, "epoch": 2186} {"train_loss": -41.802642822265625, "global_step": 264521, "epoch": 2186} {"train_loss": -41.741302490234375, "global_step": 264522, "epoch": 2186} {"train_loss": -41.54566192626953, "global_step": 264523, "epoch": 2186} {"train_loss": -41.88766860961914, "global_step": 264524, "epoch": 2186} {"train_loss": -41.8681640625, "global_step": 264525, "epoch": 2186} {"train_loss": -41.99845504760742, "global_step": 264526, "epoch": 2186} {"train_loss": -41.78125, "global_step": 264527, "epoch": 2186} {"train_loss": -42.5056266784668, "global_step": 264528, "epoch": 2186} {"train_loss": -42.31596374511719, "global_step": 264529, "epoch": 2186} {"train_loss": -42.04946517944336, "global_step": 264530, "epoch": 2186} {"train_loss": -42.79480743408203, "global_step": 264531, "epoch": 2186} {"train_loss": -41.86485290527344, "global_step": 264532, "epoch": 2186} {"train_loss": -42.72306442260742, "global_step": 264533, "epoch": 2186} {"train_loss": -41.86104965209961, "global_step": 264534, "epoch": 2186} {"train_loss": -42.75623321533203, "global_step": 264535, "epoch": 2186} {"train_loss": -43.18010330200195, "global_step": 264536, "epoch": 2186} {"train_loss": -42.89961242675781, "global_step": 264537, "epoch": 2186} {"train_loss": -42.914276123046875, "global_step": 264538, "epoch": 2186} {"train_loss": -42.8150520324707, "global_step": 264539, "epoch": 2186} {"train_loss": -43.532283782958984, "global_step": 264540, "epoch": 2186} {"train_loss": -42.73646926879883, "global_step": 264541, "epoch": 2186} {"train_loss": -42.65446090698242, "global_step": 264542, "epoch": 2186} {"train_loss": -42.909950256347656, "global_step": 264543, "epoch": 2186} {"train_loss": -42.22386169433594, "global_step": 264544, "epoch": 2186} {"train_loss": -43.268035888671875, "global_step": 264545, "epoch": 2186} {"train_loss": -42.59231185913086, "global_step": 264546, "epoch": 2186} {"train_loss": -42.542476654052734, "global_step": 264547, "epoch": 2186} {"train_loss": -42.44413375854492, "global_step": 264548, "epoch": 2186} {"train_loss": -41.93258285522461, "global_step": 264549, "epoch": 2186} {"train_loss": -43.398494720458984, "global_step": 264550, "epoch": 2186} {"train_loss": -43.01375198364258, "global_step": 264551, "epoch": 2186} {"train_loss": -42.68636703491211, "global_step": 264552, "epoch": 2186} {"train_loss": -43.570045471191406, "global_step": 264553, "epoch": 2186} {"train_loss": -43.11349105834961, "global_step": 264554, "epoch": 2186} {"train_loss": -43.18085861206055, "global_step": 264555, "epoch": 2186} {"train_loss": -43.77783966064453, "global_step": 264556, "epoch": 2186} {"train_loss": -43.60012435913086, "global_step": 264557, "epoch": 2186} {"train_loss": -43.55785369873047, "global_step": 264558, "epoch": 2186} {"train_loss": -43.48051834106445, "global_step": 264559, "epoch": 2186} {"train_loss": -43.63639450073242, "global_step": 264560, "epoch": 2186} {"train_loss": -43.020931243896484, "global_step": 264561, "epoch": 2186} {"train_loss": -43.591609954833984, "global_step": 264562, "epoch": 2186} {"train_loss": -43.25107192993164, "global_step": 264563, "epoch": 2186} {"train_loss": -44.07474136352539, "global_step": 264564, "epoch": 2186} {"train_loss": -43.75754928588867, "global_step": 264565, "epoch": 2186} {"train_loss": -43.819190979003906, "global_step": 264566, "epoch": 2186} {"train_loss": -43.32363510131836, "global_step": 264567, "epoch": 2186} {"train_loss": -44.219276428222656, "global_step": 264568, "epoch": 2186} {"train_loss": -44.0373649597168, "global_step": 264569, "epoch": 2186} {"train_loss": -44.094154357910156, "global_step": 264570, "epoch": 2186} {"train_loss": -44.03570556640625, "global_step": 264571, "epoch": 2186} {"train_loss": -43.876800537109375, "global_step": 264572, "epoch": 2186} {"train_loss": -43.238338470458984, "global_step": 264573, "epoch": 2186} {"train_loss": -44.28029251098633, "global_step": 264574, "epoch": 2186} {"train_loss": -43.64803695678711, "global_step": 264575, "epoch": 2186} {"train_loss": -43.631439208984375, "global_step": 264576, "epoch": 2186} {"train_loss": -44.43360137939453, "global_step": 264577, "epoch": 2186} {"train_loss": -43.95805740356445, "global_step": 264578, "epoch": 2186} {"train_loss": -42.92171859741211, "global_step": 264579, "epoch": 2186} {"train_loss": -44.055538177490234, "global_step": 264580, "epoch": 2186} {"train_loss": -43.8685417175293, "global_step": 264581, "epoch": 2186} {"train_loss": -43.94240951538086, "global_step": 264582, "epoch": 2186} {"train_loss": -42.81869125366211, "global_step": 264583, "epoch": 2186} {"train_loss": -44.109466552734375, "global_step": 264584, "epoch": 2186} {"train_loss": -43.97926712036133, "global_step": 264585, "epoch": 2186} {"train_loss": -44.24968338012695, "global_step": 264586, "epoch": 2186} {"train_loss": -43.16086959838867, "global_step": 264587, "epoch": 2186} {"train_loss": -42.25069046020508, "global_step": 264588, "epoch": 2186} {"train_loss": -42.24130630493164, "global_step": 264589, "epoch": 2186} {"train_loss": -42.08503723144531, "global_step": 264590, "epoch": 2186} {"train_loss": -43.17683792114258, "global_step": 264591, "epoch": 2186} {"train_loss": -44.10720443725586, "global_step": 264592, "epoch": 2186} {"train_loss": -43.19294357299805, "global_step": 264593, "epoch": 2186} {"train_loss": -40.81465530395508, "global_step": 264594, "epoch": 2186} {"train_loss": -42.588375091552734, "global_step": 264595, "epoch": 2186} {"train_loss": -43.00895690917969, "global_step": 264596, "epoch": 2186} {"train_loss": -43.03349685668945, "global_step": 264597, "epoch": 2186} {"train_loss": -42.718570709228516, "global_step": 264598, "epoch": 2186} {"train_loss": -43.03828048706055, "global_step": 264599, "epoch": 2186} {"train_loss": -43.27385711669922, "global_step": 264600, "epoch": 2186} {"train_loss": -43.824947357177734, "global_step": 264601, "epoch": 2186} {"train_loss": -43.34214782714844, "global_step": 264602, "epoch": 2186} {"train_loss": -42.83350372314453, "global_step": 264603, "epoch": 2186} {"train_loss": -42.7656364440918, "global_step": 264604, "epoch": 2186} {"train_loss": -42.605892181396484, "global_step": 264605, "epoch": 2186} {"train_loss": -42.08075714111328, "global_step": 264606, "epoch": 2186} {"train_loss": -42.089576721191406, "global_step": 264607, "epoch": 2186} {"train_loss": -42.99007034301758, "global_step": 264608, "epoch": 2186} {"train_loss": -43.12802505493164, "global_step": 264609, "epoch": 2186} {"train_loss": -43.30783462524414, "global_step": 264610, "epoch": 2186} {"train_loss": -42.591670989990234, "global_step": 264611, "epoch": 2186} {"train_loss": -41.268043518066406, "global_step": 264612, "epoch": 2186} {"train_loss": -44.01715850830078, "global_step": 264613, "epoch": 2186} {"train_loss": -41.772151947021484, "global_step": 264614, "epoch": 2186} {"train_loss": -41.93882751464844, "global_step": 264615, "epoch": 2186} {"train_loss": -42.252933502197266, "global_step": 264616, "epoch": 2186} {"train_loss": -43.21732711791992, "global_step": 264617, "epoch": 2186} {"train_loss": -42.53243637084961, "global_step": 264618, "epoch": 2186} {"train_loss": -42.816261291503906, "global_step": 264619, "epoch": 2186} {"train_loss": -42.74933624267578, "global_step": 264620, "epoch": 2186} {"train_loss": -43.043365478515625, "global_step": 264621, "epoch": 2186} {"train_loss": -43.16056823730469, "global_step": 264622, "epoch": 2186} {"train_loss": -43.5185661315918, "global_step": 264623, "epoch": 2186} {"train_loss": -42.84946823120117, "global_step": 264624, "epoch": 2186} {"train_loss": -44.01038360595703, "global_step": 264625, "epoch": 2186} {"train_loss": -42.40538024902344, "global_step": 264626, "epoch": 2186, "val_loss": 2635074.75} {"train_loss": -43.38622283935547, "global_step": 264627, "epoch": 2187} {"train_loss": -41.68886947631836, "global_step": 264628, "epoch": 2187} {"train_loss": -42.85140609741211, "global_step": 264629, "epoch": 2187} {"train_loss": -43.35714340209961, "global_step": 264630, "epoch": 2187} {"train_loss": -41.67623519897461, "global_step": 264631, "epoch": 2187} {"train_loss": -41.03622817993164, "global_step": 264632, "epoch": 2187} {"train_loss": -42.51994705200195, "global_step": 264633, "epoch": 2187} {"train_loss": -42.91762161254883, "global_step": 264634, "epoch": 2187} {"train_loss": -41.827877044677734, "global_step": 264635, "epoch": 2187} {"train_loss": -41.45612335205078, "global_step": 264636, "epoch": 2187} {"train_loss": -42.37470626831055, "global_step": 264637, "epoch": 2187} {"train_loss": -43.175777435302734, "global_step": 264638, "epoch": 2187} {"train_loss": -41.35358810424805, "global_step": 264639, "epoch": 2187} {"train_loss": -41.81474685668945, "global_step": 264640, "epoch": 2187} {"train_loss": -43.35250473022461, "global_step": 264641, "epoch": 2187} {"train_loss": -40.93693542480469, "global_step": 264642, "epoch": 2187} {"train_loss": -42.30717086791992, "global_step": 264643, "epoch": 2187} {"train_loss": -43.288551330566406, "global_step": 264644, "epoch": 2187} {"train_loss": -42.004417419433594, "global_step": 264645, "epoch": 2187} {"train_loss": -40.59809112548828, "global_step": 264646, "epoch": 2187} {"train_loss": -43.298526763916016, "global_step": 264647, "epoch": 2187} {"train_loss": -43.09040069580078, "global_step": 264648, "epoch": 2187} {"train_loss": -42.94111633300781, "global_step": 264649, "epoch": 2187} {"train_loss": -43.3003044128418, "global_step": 264650, "epoch": 2187} {"train_loss": -43.09886169433594, "global_step": 264651, "epoch": 2187} {"train_loss": -42.829437255859375, "global_step": 264652, "epoch": 2187} {"train_loss": -43.49725341796875, "global_step": 264653, "epoch": 2187} {"train_loss": -43.15574264526367, "global_step": 264654, "epoch": 2187} {"train_loss": -43.69765853881836, "global_step": 264655, "epoch": 2187} {"train_loss": -43.28836441040039, "global_step": 264656, "epoch": 2187} {"train_loss": -43.26333999633789, "global_step": 264657, "epoch": 2187} {"train_loss": -43.75275802612305, "global_step": 264658, "epoch": 2187} {"train_loss": -43.63065719604492, "global_step": 264659, "epoch": 2187} {"train_loss": -43.7780876159668, "global_step": 264660, "epoch": 2187} {"train_loss": -43.84322738647461, "global_step": 264661, "epoch": 2187} {"train_loss": -43.80902099609375, "global_step": 264662, "epoch": 2187} {"train_loss": -43.27438735961914, "global_step": 264663, "epoch": 2187} {"train_loss": -43.9630012512207, "global_step": 264664, "epoch": 2187} {"train_loss": -43.975765228271484, "global_step": 264665, "epoch": 2187} {"train_loss": -43.43318557739258, "global_step": 264666, "epoch": 2187} {"train_loss": -44.1572380065918, "global_step": 264667, "epoch": 2187} {"train_loss": -43.64541244506836, "global_step": 264668, "epoch": 2187} {"train_loss": -43.8836669921875, "global_step": 264669, "epoch": 2187} {"train_loss": -43.803253173828125, "global_step": 264670, "epoch": 2187} {"train_loss": -41.9676628112793, "global_step": 264671, "epoch": 2187} {"train_loss": -43.34564971923828, "global_step": 264672, "epoch": 2187} {"train_loss": -42.352420806884766, "global_step": 264673, "epoch": 2187} {"train_loss": -43.577980041503906, "global_step": 264674, "epoch": 2187} {"train_loss": -43.94309616088867, "global_step": 264675, "epoch": 2187} {"train_loss": -43.26411056518555, "global_step": 264676, "epoch": 2187} {"train_loss": -43.7403678894043, "global_step": 264677, "epoch": 2187} {"train_loss": -43.56532669067383, "global_step": 264678, "epoch": 2187} {"train_loss": -43.33106231689453, "global_step": 264679, "epoch": 2187} {"train_loss": -43.5644645690918, "global_step": 264680, "epoch": 2187} {"train_loss": -43.448699951171875, "global_step": 264681, "epoch": 2187} {"train_loss": -42.1768798828125, "global_step": 264682, "epoch": 2187} {"train_loss": -43.80155563354492, "global_step": 264683, "epoch": 2187} {"train_loss": -43.816802978515625, "global_step": 264684, "epoch": 2187} {"train_loss": -43.65679168701172, "global_step": 264685, "epoch": 2187} {"train_loss": -43.483646392822266, "global_step": 264686, "epoch": 2187} {"train_loss": -43.38691329956055, "global_step": 264687, "epoch": 2187} {"train_loss": -43.61659622192383, "global_step": 264688, "epoch": 2187} {"train_loss": -43.68148422241211, "global_step": 264689, "epoch": 2187} {"train_loss": -42.63325881958008, "global_step": 264690, "epoch": 2187} {"train_loss": -40.80841827392578, "global_step": 264691, "epoch": 2187} {"train_loss": -43.9697265625, "global_step": 264692, "epoch": 2187} {"train_loss": -43.623626708984375, "global_step": 264693, "epoch": 2187} {"train_loss": -41.15818786621094, "global_step": 264694, "epoch": 2187} {"train_loss": -42.6693000793457, "global_step": 264695, "epoch": 2187} {"train_loss": -42.48271179199219, "global_step": 264696, "epoch": 2187} {"train_loss": -40.54757308959961, "global_step": 264697, "epoch": 2187} {"train_loss": -43.07965850830078, "global_step": 264698, "epoch": 2187} {"train_loss": -42.45559310913086, "global_step": 264699, "epoch": 2187} {"train_loss": -40.69568634033203, "global_step": 264700, "epoch": 2187} {"train_loss": -42.60372543334961, "global_step": 264701, "epoch": 2187} {"train_loss": -42.24131393432617, "global_step": 264702, "epoch": 2187} {"train_loss": -41.18772506713867, "global_step": 264703, "epoch": 2187} {"train_loss": -41.66389083862305, "global_step": 264704, "epoch": 2187} {"train_loss": -41.12615966796875, "global_step": 264705, "epoch": 2187} {"train_loss": -41.53644561767578, "global_step": 264706, "epoch": 2187} {"train_loss": -39.44984817504883, "global_step": 264707, "epoch": 2187} {"train_loss": -42.2279052734375, "global_step": 264708, "epoch": 2187} {"train_loss": -38.30609893798828, "global_step": 264709, "epoch": 2187} {"train_loss": -41.37388610839844, "global_step": 264710, "epoch": 2187} {"train_loss": -36.52206039428711, "global_step": 264711, "epoch": 2187} {"train_loss": -36.28696823120117, "global_step": 264712, "epoch": 2187} {"train_loss": -41.753021240234375, "global_step": 264713, "epoch": 2187} {"train_loss": -35.5024528503418, "global_step": 264714, "epoch": 2187} {"train_loss": -39.349246978759766, "global_step": 264715, "epoch": 2187} {"train_loss": -37.65279006958008, "global_step": 264716, "epoch": 2187} {"train_loss": -38.69789505004883, "global_step": 264717, "epoch": 2187} {"train_loss": -40.107112884521484, "global_step": 264718, "epoch": 2187} {"train_loss": -36.95745849609375, "global_step": 264719, "epoch": 2187} {"train_loss": -41.751312255859375, "global_step": 264720, "epoch": 2187} {"train_loss": -38.591487884521484, "global_step": 264721, "epoch": 2187} {"train_loss": -41.74351119995117, "global_step": 264722, "epoch": 2187} {"train_loss": -38.63373565673828, "global_step": 264723, "epoch": 2187} {"train_loss": -41.93242263793945, "global_step": 264724, "epoch": 2187} {"train_loss": -39.92922592163086, "global_step": 264725, "epoch": 2187} {"train_loss": -41.66917419433594, "global_step": 264726, "epoch": 2187} {"train_loss": -41.43537139892578, "global_step": 264727, "epoch": 2187} {"train_loss": -41.6937370300293, "global_step": 264728, "epoch": 2187} {"train_loss": -40.16147994995117, "global_step": 264729, "epoch": 2187} {"train_loss": -40.903194427490234, "global_step": 264730, "epoch": 2187} {"train_loss": -42.79282760620117, "global_step": 264731, "epoch": 2187} {"train_loss": -40.82240676879883, "global_step": 264732, "epoch": 2187} {"train_loss": -42.05058670043945, "global_step": 264733, "epoch": 2187} {"train_loss": -42.01400375366211, "global_step": 264734, "epoch": 2187} {"train_loss": -41.30259704589844, "global_step": 264735, "epoch": 2187} {"train_loss": -41.48978805541992, "global_step": 264736, "epoch": 2187} {"train_loss": -42.34547805786133, "global_step": 264737, "epoch": 2187} {"train_loss": -41.953792572021484, "global_step": 264738, "epoch": 2187} {"train_loss": -42.445343017578125, "global_step": 264739, "epoch": 2187} {"train_loss": -42.726619720458984, "global_step": 264740, "epoch": 2187} {"train_loss": -42.70652770996094, "global_step": 264741, "epoch": 2187} {"train_loss": -42.865386962890625, "global_step": 264742, "epoch": 2187} {"train_loss": -41.854042053222656, "global_step": 264743, "epoch": 2187} {"train_loss": -42.894805908203125, "global_step": 264744, "epoch": 2187} {"train_loss": -42.704620361328125, "global_step": 264745, "epoch": 2187} {"train_loss": -43.148719787597656, "global_step": 264746, "epoch": 2187} {"train_loss": -42.1385587266654, "global_step": 264747, "epoch": 2187, "val_loss": 2574443.0} {"train_loss": -42.22732162475586, "global_step": 264748, "epoch": 2188} {"train_loss": -43.138797760009766, "global_step": 264749, "epoch": 2188} {"train_loss": -41.94071960449219, "global_step": 264750, "epoch": 2188} {"train_loss": -43.54449462890625, "global_step": 264751, "epoch": 2188} {"train_loss": -42.62226867675781, "global_step": 264752, "epoch": 2188} {"train_loss": -42.45050811767578, "global_step": 264753, "epoch": 2188} {"train_loss": -42.80067825317383, "global_step": 264754, "epoch": 2188} {"train_loss": -43.41193389892578, "global_step": 264755, "epoch": 2188} {"train_loss": -43.160133361816406, "global_step": 264756, "epoch": 2188} {"train_loss": -43.591896057128906, "global_step": 264757, "epoch": 2188} {"train_loss": -43.477195739746094, "global_step": 264758, "epoch": 2188} {"train_loss": -43.785152435302734, "global_step": 264759, "epoch": 2188} {"train_loss": -43.68193435668945, "global_step": 264760, "epoch": 2188} {"train_loss": -43.44062423706055, "global_step": 264761, "epoch": 2188} {"train_loss": -43.470802307128906, "global_step": 264762, "epoch": 2188} {"train_loss": -43.474525451660156, "global_step": 264763, "epoch": 2188} {"train_loss": -43.82455062866211, "global_step": 264764, "epoch": 2188} {"train_loss": -43.63596725463867, "global_step": 264765, "epoch": 2188} {"train_loss": -43.32291030883789, "global_step": 264766, "epoch": 2188} {"train_loss": -43.7120475769043, "global_step": 264767, "epoch": 2188} {"train_loss": -43.51109313964844, "global_step": 264768, "epoch": 2188} {"train_loss": -43.83382797241211, "global_step": 264769, "epoch": 2188} {"train_loss": -43.81901168823242, "global_step": 264770, "epoch": 2188} {"train_loss": -43.80860137939453, "global_step": 264771, "epoch": 2188} {"train_loss": -44.242218017578125, "global_step": 264772, "epoch": 2188} {"train_loss": -43.7525520324707, "global_step": 264773, "epoch": 2188} {"train_loss": -43.82545852661133, "global_step": 264774, "epoch": 2188} {"train_loss": -43.830047607421875, "global_step": 264775, "epoch": 2188} {"train_loss": -43.86945343017578, "global_step": 264776, "epoch": 2188} {"train_loss": -44.09170150756836, "global_step": 264777, "epoch": 2188} {"train_loss": -44.63204574584961, "global_step": 264778, "epoch": 2188} {"train_loss": -43.962158203125, "global_step": 264779, "epoch": 2188} {"train_loss": -43.93697738647461, "global_step": 264780, "epoch": 2188} {"train_loss": -44.305824279785156, "global_step": 264781, "epoch": 2188} {"train_loss": -43.784523010253906, "global_step": 264782, "epoch": 2188} {"train_loss": -44.434539794921875, "global_step": 264783, "epoch": 2188} {"train_loss": -44.027427673339844, "global_step": 264784, "epoch": 2188} {"train_loss": -44.26359939575195, "global_step": 264785, "epoch": 2188} {"train_loss": -44.4151496887207, "global_step": 264786, "epoch": 2188} {"train_loss": -44.01076889038086, "global_step": 264787, "epoch": 2188} {"train_loss": -44.11812210083008, "global_step": 264788, "epoch": 2188} {"train_loss": -44.472076416015625, "global_step": 264789, "epoch": 2188} {"train_loss": -44.35376739501953, "global_step": 264790, "epoch": 2188} {"train_loss": -44.492652893066406, "global_step": 264791, "epoch": 2188} {"train_loss": -44.31535720825195, "global_step": 264792, "epoch": 2188} {"train_loss": -43.89667510986328, "global_step": 264793, "epoch": 2188} {"train_loss": -43.86796569824219, "global_step": 264794, "epoch": 2188} {"train_loss": -43.24821090698242, "global_step": 264795, "epoch": 2188} {"train_loss": -44.315040588378906, "global_step": 264796, "epoch": 2188} {"train_loss": -44.28899383544922, "global_step": 264797, "epoch": 2188} {"train_loss": -44.3878059387207, "global_step": 264798, "epoch": 2188} {"train_loss": -44.33819580078125, "global_step": 264799, "epoch": 2188} {"train_loss": -44.50440979003906, "global_step": 264800, "epoch": 2188} {"train_loss": -44.59050369262695, "global_step": 264801, "epoch": 2188} {"train_loss": -44.539703369140625, "global_step": 264802, "epoch": 2188} {"train_loss": -43.2313117980957, "global_step": 264803, "epoch": 2188} {"train_loss": -41.007083892822266, "global_step": 264804, "epoch": 2188} {"train_loss": -41.52688217163086, "global_step": 264805, "epoch": 2188} {"train_loss": -44.17375564575195, "global_step": 264806, "epoch": 2188} {"train_loss": -43.89936447143555, "global_step": 264807, "epoch": 2188} {"train_loss": -41.069374084472656, "global_step": 264808, "epoch": 2188} {"train_loss": -40.64814758300781, "global_step": 264809, "epoch": 2188} {"train_loss": -43.29450988769531, "global_step": 264810, "epoch": 2188} {"train_loss": -40.083648681640625, "global_step": 264811, "epoch": 2188} {"train_loss": -39.570556640625, "global_step": 264812, "epoch": 2188} {"train_loss": -40.13679122924805, "global_step": 264813, "epoch": 2188} {"train_loss": -37.524532318115234, "global_step": 264814, "epoch": 2188} {"train_loss": -36.47016143798828, "global_step": 264815, "epoch": 2188} {"train_loss": -38.74188232421875, "global_step": 264816, "epoch": 2188} {"train_loss": -36.47705841064453, "global_step": 264817, "epoch": 2188} {"train_loss": -37.576026916503906, "global_step": 264818, "epoch": 2188} {"train_loss": -38.91884231567383, "global_step": 264819, "epoch": 2188} {"train_loss": -39.79283905029297, "global_step": 264820, "epoch": 2188} {"train_loss": -36.58185577392578, "global_step": 264821, "epoch": 2188} {"train_loss": -39.18605041503906, "global_step": 264822, "epoch": 2188} {"train_loss": -37.24947738647461, "global_step": 264823, "epoch": 2188} {"train_loss": -38.132381439208984, "global_step": 264824, "epoch": 2188} {"train_loss": -40.6453857421875, "global_step": 264825, "epoch": 2188} {"train_loss": -38.62615966796875, "global_step": 264826, "epoch": 2188} {"train_loss": -38.981849670410156, "global_step": 264827, "epoch": 2188} {"train_loss": -40.06140899658203, "global_step": 264828, "epoch": 2188} {"train_loss": -39.41017532348633, "global_step": 264829, "epoch": 2188} {"train_loss": -39.86147689819336, "global_step": 264830, "epoch": 2188} {"train_loss": -41.24673080444336, "global_step": 264831, "epoch": 2188} {"train_loss": -39.789005279541016, "global_step": 264832, "epoch": 2188} {"train_loss": -42.55323028564453, "global_step": 264833, "epoch": 2188} {"train_loss": -39.318172454833984, "global_step": 264834, "epoch": 2188} {"train_loss": -40.5245475769043, "global_step": 264835, "epoch": 2188} {"train_loss": -40.9788703918457, "global_step": 264836, "epoch": 2188} {"train_loss": -41.14897537231445, "global_step": 264837, "epoch": 2188} {"train_loss": -40.3569221496582, "global_step": 264838, "epoch": 2188} {"train_loss": -40.142147064208984, "global_step": 264839, "epoch": 2188} {"train_loss": -40.6695671081543, "global_step": 264840, "epoch": 2188} {"train_loss": -42.39271545410156, "global_step": 264841, "epoch": 2188} {"train_loss": -39.98025131225586, "global_step": 264842, "epoch": 2188} {"train_loss": -41.8458251953125, "global_step": 264843, "epoch": 2188} {"train_loss": -42.95917892456055, "global_step": 264844, "epoch": 2188} {"train_loss": -42.068565368652344, "global_step": 264845, "epoch": 2188} {"train_loss": -42.049659729003906, "global_step": 264846, "epoch": 2188} {"train_loss": -43.06622314453125, "global_step": 264847, "epoch": 2188} {"train_loss": -42.64576721191406, "global_step": 264848, "epoch": 2188} {"train_loss": -42.5677375793457, "global_step": 264849, "epoch": 2188} {"train_loss": -43.137203216552734, "global_step": 264850, "epoch": 2188} {"train_loss": -42.54166030883789, "global_step": 264851, "epoch": 2188} {"train_loss": -42.91679763793945, "global_step": 264852, "epoch": 2188} {"train_loss": -42.87073516845703, "global_step": 264853, "epoch": 2188} {"train_loss": -42.923484802246094, "global_step": 264854, "epoch": 2188} {"train_loss": -42.54726028442383, "global_step": 264855, "epoch": 2188} {"train_loss": -42.95941162109375, "global_step": 264856, "epoch": 2188} {"train_loss": -42.59339904785156, "global_step": 264857, "epoch": 2188} {"train_loss": -43.022090911865234, "global_step": 264858, "epoch": 2188} {"train_loss": -43.13045120239258, "global_step": 264859, "epoch": 2188} {"train_loss": -43.27203369140625, "global_step": 264860, "epoch": 2188} {"train_loss": -42.96611022949219, "global_step": 264861, "epoch": 2188} {"train_loss": -43.2209587097168, "global_step": 264862, "epoch": 2188} {"train_loss": -42.84648132324219, "global_step": 264863, "epoch": 2188} {"train_loss": -43.19573974609375, "global_step": 264864, "epoch": 2188} {"train_loss": -43.16081619262695, "global_step": 264865, "epoch": 2188} {"train_loss": -43.023765563964844, "global_step": 264866, "epoch": 2188} {"train_loss": -43.0196533203125, "global_step": 264867, "epoch": 2188} {"train_loss": -42.351412371170426, "global_step": 264868, "epoch": 2188, "val_loss": 2586743.25} {"train_loss": -43.54268264770508, "global_step": 264869, "epoch": 2189} {"train_loss": -43.324615478515625, "global_step": 264870, "epoch": 2189} {"train_loss": -43.07902908325195, "global_step": 264871, "epoch": 2189} {"train_loss": -43.577598571777344, "global_step": 264872, "epoch": 2189} {"train_loss": -43.68059539794922, "global_step": 264873, "epoch": 2189} {"train_loss": -43.80918502807617, "global_step": 264874, "epoch": 2189} {"train_loss": -43.10992431640625, "global_step": 264875, "epoch": 2189} {"train_loss": -43.44761657714844, "global_step": 264876, "epoch": 2189} {"train_loss": -43.19993209838867, "global_step": 264877, "epoch": 2189} {"train_loss": -43.67521286010742, "global_step": 264878, "epoch": 2189} {"train_loss": -43.427406311035156, "global_step": 264879, "epoch": 2189} {"train_loss": -44.28456497192383, "global_step": 264880, "epoch": 2189} {"train_loss": -43.741451263427734, "global_step": 264881, "epoch": 2189} {"train_loss": -43.92974853515625, "global_step": 264882, "epoch": 2189} {"train_loss": -43.449501037597656, "global_step": 264883, "epoch": 2189} {"train_loss": -42.9754753112793, "global_step": 264884, "epoch": 2189} {"train_loss": -43.65778732299805, "global_step": 264885, "epoch": 2189} {"train_loss": -43.350799560546875, "global_step": 264886, "epoch": 2189} {"train_loss": -42.89433670043945, "global_step": 264887, "epoch": 2189} {"train_loss": -42.934017181396484, "global_step": 264888, "epoch": 2189} {"train_loss": -43.6569938659668, "global_step": 264889, "epoch": 2189} {"train_loss": -43.0890998840332, "global_step": 264890, "epoch": 2189} {"train_loss": -43.82278823852539, "global_step": 264891, "epoch": 2189} {"train_loss": -42.944061279296875, "global_step": 264892, "epoch": 2189} {"train_loss": -43.793373107910156, "global_step": 264893, "epoch": 2189} {"train_loss": -43.888668060302734, "global_step": 264894, "epoch": 2189} {"train_loss": -43.8603515625, "global_step": 264895, "epoch": 2189} {"train_loss": -43.50466537475586, "global_step": 264896, "epoch": 2189} {"train_loss": -43.57094955444336, "global_step": 264897, "epoch": 2189} {"train_loss": -44.47528839111328, "global_step": 264898, "epoch": 2189} {"train_loss": -43.33949661254883, "global_step": 264899, "epoch": 2189} {"train_loss": -42.4404296875, "global_step": 264900, "epoch": 2189} {"train_loss": -43.94108963012695, "global_step": 264901, "epoch": 2189} {"train_loss": -43.64051055908203, "global_step": 264902, "epoch": 2189} {"train_loss": -43.360931396484375, "global_step": 264903, "epoch": 2189} {"train_loss": -43.89728546142578, "global_step": 264904, "epoch": 2189} {"train_loss": -43.62531280517578, "global_step": 264905, "epoch": 2189} {"train_loss": -42.84360885620117, "global_step": 264906, "epoch": 2189} {"train_loss": -43.75788497924805, "global_step": 264907, "epoch": 2189} {"train_loss": -43.5492057800293, "global_step": 264908, "epoch": 2189} {"train_loss": -42.57351303100586, "global_step": 264909, "epoch": 2189} {"train_loss": -43.74477005004883, "global_step": 264910, "epoch": 2189} {"train_loss": -43.79345703125, "global_step": 264911, "epoch": 2189} {"train_loss": -42.995758056640625, "global_step": 264912, "epoch": 2189} {"train_loss": -42.79270553588867, "global_step": 264913, "epoch": 2189} {"train_loss": -43.73945999145508, "global_step": 264914, "epoch": 2189} {"train_loss": -43.835567474365234, "global_step": 264915, "epoch": 2189} {"train_loss": -43.40571212768555, "global_step": 264916, "epoch": 2189} {"train_loss": -43.8260383605957, "global_step": 264917, "epoch": 2189} {"train_loss": -42.978031158447266, "global_step": 264918, "epoch": 2189} {"train_loss": -43.84981918334961, "global_step": 264919, "epoch": 2189} {"train_loss": -43.11018371582031, "global_step": 264920, "epoch": 2189} {"train_loss": -43.05605697631836, "global_step": 264921, "epoch": 2189} {"train_loss": -43.26993942260742, "global_step": 264922, "epoch": 2189} {"train_loss": -43.997596740722656, "global_step": 264923, "epoch": 2189} {"train_loss": -43.586280822753906, "global_step": 264924, "epoch": 2189} {"train_loss": -43.467857360839844, "global_step": 264925, "epoch": 2189} {"train_loss": -43.45985794067383, "global_step": 264926, "epoch": 2189} {"train_loss": -43.09299850463867, "global_step": 264927, "epoch": 2189} {"train_loss": -43.35083770751953, "global_step": 264928, "epoch": 2189} {"train_loss": -43.86997604370117, "global_step": 264929, "epoch": 2189} {"train_loss": -43.45794677734375, "global_step": 264930, "epoch": 2189} {"train_loss": -42.83928680419922, "global_step": 264931, "epoch": 2189} {"train_loss": -42.644554138183594, "global_step": 264932, "epoch": 2189} {"train_loss": -41.47787094116211, "global_step": 264933, "epoch": 2189} {"train_loss": -41.90774917602539, "global_step": 264934, "epoch": 2189} {"train_loss": -43.94474411010742, "global_step": 264935, "epoch": 2189} {"train_loss": -43.872764587402344, "global_step": 264936, "epoch": 2189} {"train_loss": -43.0052604675293, "global_step": 264937, "epoch": 2189} {"train_loss": -42.78471755981445, "global_step": 264938, "epoch": 2189} {"train_loss": -42.39902877807617, "global_step": 264939, "epoch": 2189} {"train_loss": -43.47962188720703, "global_step": 264940, "epoch": 2189} {"train_loss": -43.9980583190918, "global_step": 264941, "epoch": 2189} {"train_loss": -43.41048812866211, "global_step": 264942, "epoch": 2189} {"train_loss": -42.72383499145508, "global_step": 264943, "epoch": 2189} {"train_loss": -44.5999870300293, "global_step": 264944, "epoch": 2189} {"train_loss": -42.6358528137207, "global_step": 264945, "epoch": 2189} {"train_loss": -39.84133529663086, "global_step": 264946, "epoch": 2189} {"train_loss": -44.04466247558594, "global_step": 264947, "epoch": 2189} {"train_loss": -40.27349090576172, "global_step": 264948, "epoch": 2189} {"train_loss": -39.317291259765625, "global_step": 264949, "epoch": 2189} {"train_loss": -43.5026741027832, "global_step": 264950, "epoch": 2189} {"train_loss": -39.46149444580078, "global_step": 264951, "epoch": 2189} {"train_loss": -43.47282791137695, "global_step": 264952, "epoch": 2189} {"train_loss": -41.029541015625, "global_step": 264953, "epoch": 2189} {"train_loss": -42.48270797729492, "global_step": 264954, "epoch": 2189} {"train_loss": -42.001129150390625, "global_step": 264955, "epoch": 2189} {"train_loss": -40.80462646484375, "global_step": 264956, "epoch": 2189} {"train_loss": -42.29657745361328, "global_step": 264957, "epoch": 2189} {"train_loss": -42.797054290771484, "global_step": 264958, "epoch": 2189} {"train_loss": -42.827850341796875, "global_step": 264959, "epoch": 2189} {"train_loss": -42.78781509399414, "global_step": 264960, "epoch": 2189} {"train_loss": -42.66453170776367, "global_step": 264961, "epoch": 2189} {"train_loss": -42.99808883666992, "global_step": 264962, "epoch": 2189} {"train_loss": -42.22087860107422, "global_step": 264963, "epoch": 2189} {"train_loss": -42.90097427368164, "global_step": 264964, "epoch": 2189} {"train_loss": -42.5417594909668, "global_step": 264965, "epoch": 2189} {"train_loss": -40.694522857666016, "global_step": 264966, "epoch": 2189} {"train_loss": -43.11494064331055, "global_step": 264967, "epoch": 2189} {"train_loss": -41.434288024902344, "global_step": 264968, "epoch": 2189} {"train_loss": -39.529388427734375, "global_step": 264969, "epoch": 2189} {"train_loss": -42.67881393432617, "global_step": 264970, "epoch": 2189} {"train_loss": -41.62610626220703, "global_step": 264971, "epoch": 2189} {"train_loss": -43.67753219604492, "global_step": 264972, "epoch": 2189} {"train_loss": -41.48446273803711, "global_step": 264973, "epoch": 2189} {"train_loss": -41.983123779296875, "global_step": 264974, "epoch": 2189} {"train_loss": -42.08588409423828, "global_step": 264975, "epoch": 2189} {"train_loss": -43.2922477722168, "global_step": 264976, "epoch": 2189} {"train_loss": -42.070335388183594, "global_step": 264977, "epoch": 2189} {"train_loss": -42.43721389770508, "global_step": 264978, "epoch": 2189} {"train_loss": -40.1600456237793, "global_step": 264979, "epoch": 2189} {"train_loss": -42.883155822753906, "global_step": 264980, "epoch": 2189} {"train_loss": -42.913352966308594, "global_step": 264981, "epoch": 2189} {"train_loss": -40.5454216003418, "global_step": 264982, "epoch": 2189} {"train_loss": -42.52600860595703, "global_step": 264983, "epoch": 2189} {"train_loss": -42.21944808959961, "global_step": 264984, "epoch": 2189} {"train_loss": -43.04191970825195, "global_step": 264985, "epoch": 2189} {"train_loss": -43.91166305541992, "global_step": 264986, "epoch": 2189} {"train_loss": -42.615692138671875, "global_step": 264987, "epoch": 2189} {"train_loss": -41.40793991088867, "global_step": 264988, "epoch": 2189} {"train_loss": -42.91456061749419, "global_step": 264989, "epoch": 2189, "val_loss": 2765006.0} {"train_loss": -40.1144905090332, "global_step": 264990, "epoch": 2190} {"train_loss": -43.40065383911133, "global_step": 264991, "epoch": 2190} {"train_loss": -43.239349365234375, "global_step": 264992, "epoch": 2190} {"train_loss": -42.21418380737305, "global_step": 264993, "epoch": 2190} {"train_loss": -41.2201042175293, "global_step": 264994, "epoch": 2190} {"train_loss": -42.84402084350586, "global_step": 264995, "epoch": 2190} {"train_loss": -38.2054443359375, "global_step": 264996, "epoch": 2190} {"train_loss": -41.53586196899414, "global_step": 264997, "epoch": 2190} {"train_loss": -42.314720153808594, "global_step": 264998, "epoch": 2190} {"train_loss": -43.22441864013672, "global_step": 264999, "epoch": 2190} {"train_loss": -41.00637435913086, "global_step": 265000, "epoch": 2190} {"train_loss": -42.36249923706055, "global_step": 265001, "epoch": 2190} {"train_loss": -41.04560470581055, "global_step": 265002, "epoch": 2190} {"train_loss": -42.06814193725586, "global_step": 265003, "epoch": 2190} {"train_loss": -42.12229537963867, "global_step": 265004, "epoch": 2190} {"train_loss": -42.354740142822266, "global_step": 265005, "epoch": 2190} {"train_loss": -43.07210922241211, "global_step": 265006, "epoch": 2190} {"train_loss": -42.56637191772461, "global_step": 265007, "epoch": 2190} {"train_loss": -42.392513275146484, "global_step": 265008, "epoch": 2190} {"train_loss": -43.2682991027832, "global_step": 265009, "epoch": 2190} {"train_loss": -42.06403732299805, "global_step": 265010, "epoch": 2190} {"train_loss": -43.290584564208984, "global_step": 265011, "epoch": 2190} {"train_loss": -41.92580032348633, "global_step": 265012, "epoch": 2190} {"train_loss": -43.88239288330078, "global_step": 265013, "epoch": 2190} {"train_loss": -42.435298919677734, "global_step": 265014, "epoch": 2190} {"train_loss": -42.78753662109375, "global_step": 265015, "epoch": 2190} {"train_loss": -37.227989196777344, "global_step": 265016, "epoch": 2190} {"train_loss": -42.04209518432617, "global_step": 265017, "epoch": 2190} {"train_loss": -44.162628173828125, "global_step": 265018, "epoch": 2190} {"train_loss": -43.309234619140625, "global_step": 265019, "epoch": 2190} {"train_loss": -42.80885696411133, "global_step": 265020, "epoch": 2190} {"train_loss": -43.34741973876953, "global_step": 265021, "epoch": 2190} {"train_loss": -43.208003997802734, "global_step": 265022, "epoch": 2190} {"train_loss": -43.145599365234375, "global_step": 265023, "epoch": 2190} {"train_loss": -42.3047981262207, "global_step": 265024, "epoch": 2190} {"train_loss": -43.316158294677734, "global_step": 265025, "epoch": 2190} {"train_loss": -42.85858917236328, "global_step": 265026, "epoch": 2190} {"train_loss": -43.665367126464844, "global_step": 265027, "epoch": 2190} {"train_loss": -43.249359130859375, "global_step": 265028, "epoch": 2190} {"train_loss": -43.594032287597656, "global_step": 265029, "epoch": 2190} {"train_loss": -43.206417083740234, "global_step": 265030, "epoch": 2190} {"train_loss": -43.007545471191406, "global_step": 265031, "epoch": 2190} {"train_loss": -43.363616943359375, "global_step": 265032, "epoch": 2190} {"train_loss": -43.5303840637207, "global_step": 265033, "epoch": 2190} {"train_loss": -41.60407257080078, "global_step": 265034, "epoch": 2190} {"train_loss": -42.379249572753906, "global_step": 265035, "epoch": 2190} {"train_loss": -42.9859733581543, "global_step": 265036, "epoch": 2190} {"train_loss": -43.03955078125, "global_step": 265037, "epoch": 2190} {"train_loss": -43.46262741088867, "global_step": 265038, "epoch": 2190} {"train_loss": -39.00482177734375, "global_step": 265039, "epoch": 2190} {"train_loss": -42.82384490966797, "global_step": 265040, "epoch": 2190} {"train_loss": -43.51713562011719, "global_step": 265041, "epoch": 2190} {"train_loss": -43.12369918823242, "global_step": 265042, "epoch": 2190} {"train_loss": -43.45493698120117, "global_step": 265043, "epoch": 2190} {"train_loss": -42.616600036621094, "global_step": 265044, "epoch": 2190} {"train_loss": -43.57798385620117, "global_step": 265045, "epoch": 2190} {"train_loss": -42.13897705078125, "global_step": 265046, "epoch": 2190} {"train_loss": -43.01247787475586, "global_step": 265047, "epoch": 2190} {"train_loss": -42.94898223876953, "global_step": 265048, "epoch": 2190} {"train_loss": -43.64207077026367, "global_step": 265049, "epoch": 2190} {"train_loss": -43.03201675415039, "global_step": 265050, "epoch": 2190} {"train_loss": -43.57638168334961, "global_step": 265051, "epoch": 2190} {"train_loss": -43.587459564208984, "global_step": 265052, "epoch": 2190} {"train_loss": -44.11122131347656, "global_step": 265053, "epoch": 2190} {"train_loss": -42.959232330322266, "global_step": 265054, "epoch": 2190} {"train_loss": -40.99127960205078, "global_step": 265055, "epoch": 2190} {"train_loss": -40.70930862426758, "global_step": 265056, "epoch": 2190} {"train_loss": -43.70815658569336, "global_step": 265057, "epoch": 2190} {"train_loss": -43.00847625732422, "global_step": 265058, "epoch": 2190} {"train_loss": -42.1889762878418, "global_step": 265059, "epoch": 2190} {"train_loss": -42.06012725830078, "global_step": 265060, "epoch": 2190} {"train_loss": -43.38837814331055, "global_step": 265061, "epoch": 2190} {"train_loss": -42.837440490722656, "global_step": 265062, "epoch": 2190} {"train_loss": -41.527339935302734, "global_step": 265063, "epoch": 2190} {"train_loss": -41.32672119140625, "global_step": 265064, "epoch": 2190} {"train_loss": -39.58448791503906, "global_step": 265065, "epoch": 2190} {"train_loss": -39.28544616699219, "global_step": 265066, "epoch": 2190} {"train_loss": -41.699214935302734, "global_step": 265067, "epoch": 2190} {"train_loss": -40.68467712402344, "global_step": 265068, "epoch": 2190} {"train_loss": -38.957611083984375, "global_step": 265069, "epoch": 2190} {"train_loss": -42.116973876953125, "global_step": 265070, "epoch": 2190} {"train_loss": -40.90778732299805, "global_step": 265071, "epoch": 2190} {"train_loss": -42.077606201171875, "global_step": 265072, "epoch": 2190} {"train_loss": -41.45598220825195, "global_step": 265073, "epoch": 2190} {"train_loss": -41.1260871887207, "global_step": 265074, "epoch": 2190} {"train_loss": -41.00375747680664, "global_step": 265075, "epoch": 2190} {"train_loss": -42.515350341796875, "global_step": 265076, "epoch": 2190} {"train_loss": -42.8632698059082, "global_step": 265077, "epoch": 2190} {"train_loss": -42.77800369262695, "global_step": 265078, "epoch": 2190} {"train_loss": -42.93864059448242, "global_step": 265079, "epoch": 2190} {"train_loss": -42.84440612792969, "global_step": 265080, "epoch": 2190} {"train_loss": -41.867042541503906, "global_step": 265081, "epoch": 2190} {"train_loss": -42.590614318847656, "global_step": 265082, "epoch": 2190} {"train_loss": -42.774051666259766, "global_step": 265083, "epoch": 2190} {"train_loss": -43.016448974609375, "global_step": 265084, "epoch": 2190} {"train_loss": -41.506591796875, "global_step": 265085, "epoch": 2190} {"train_loss": -39.326969146728516, "global_step": 265086, "epoch": 2190} {"train_loss": -41.15174102783203, "global_step": 265087, "epoch": 2190} {"train_loss": -42.81855392456055, "global_step": 265088, "epoch": 2190} {"train_loss": -42.48904037475586, "global_step": 265089, "epoch": 2190} {"train_loss": -41.57009506225586, "global_step": 265090, "epoch": 2190} {"train_loss": -42.76274108886719, "global_step": 265091, "epoch": 2190} {"train_loss": -42.48128128051758, "global_step": 265092, "epoch": 2190} {"train_loss": -38.30220413208008, "global_step": 265093, "epoch": 2190} {"train_loss": -42.29338455200195, "global_step": 265094, "epoch": 2190} {"train_loss": -43.20511245727539, "global_step": 265095, "epoch": 2190} {"train_loss": -40.47095489501953, "global_step": 265096, "epoch": 2190} {"train_loss": -42.142391204833984, "global_step": 265097, "epoch": 2190} {"train_loss": -43.190673828125, "global_step": 265098, "epoch": 2190} {"train_loss": -43.19010543823242, "global_step": 265099, "epoch": 2190} {"train_loss": -43.047149658203125, "global_step": 265100, "epoch": 2190} {"train_loss": -42.45221710205078, "global_step": 265101, "epoch": 2190} {"train_loss": -43.18246078491211, "global_step": 265102, "epoch": 2190} {"train_loss": -43.009521484375, "global_step": 265103, "epoch": 2190} {"train_loss": -42.10964584350586, "global_step": 265104, "epoch": 2190} {"train_loss": -43.17566680908203, "global_step": 265105, "epoch": 2190} {"train_loss": -43.1995964050293, "global_step": 265106, "epoch": 2190} {"train_loss": -43.562191009521484, "global_step": 265107, "epoch": 2190} {"train_loss": -43.425140380859375, "global_step": 265108, "epoch": 2190} {"train_loss": -42.523860931396484, "global_step": 265109, "epoch": 2190} {"train_loss": -42.34612939377462, "global_step": 265110, "epoch": 2190, "val_loss": 2684846.25} {"train_loss": -42.5404167175293, "global_step": 265111, "epoch": 2191} {"train_loss": -41.90578079223633, "global_step": 265112, "epoch": 2191} {"train_loss": -42.07992172241211, "global_step": 265113, "epoch": 2191} {"train_loss": -39.89101028442383, "global_step": 265114, "epoch": 2191} {"train_loss": -42.65270233154297, "global_step": 265115, "epoch": 2191} {"train_loss": -43.511531829833984, "global_step": 265116, "epoch": 2191} {"train_loss": -43.17308807373047, "global_step": 265117, "epoch": 2191} {"train_loss": -41.83820343017578, "global_step": 265118, "epoch": 2191} {"train_loss": -43.14506912231445, "global_step": 265119, "epoch": 2191} {"train_loss": -41.96519088745117, "global_step": 265120, "epoch": 2191} {"train_loss": -40.74924850463867, "global_step": 265121, "epoch": 2191} {"train_loss": -41.93388748168945, "global_step": 265122, "epoch": 2191} {"train_loss": -39.92658615112305, "global_step": 265123, "epoch": 2191} {"train_loss": -43.12527847290039, "global_step": 265124, "epoch": 2191} {"train_loss": -39.425106048583984, "global_step": 265125, "epoch": 2191} {"train_loss": -42.2923469543457, "global_step": 265126, "epoch": 2191} {"train_loss": -37.926544189453125, "global_step": 265127, "epoch": 2191} {"train_loss": -42.48060989379883, "global_step": 265128, "epoch": 2191} {"train_loss": -38.0352897644043, "global_step": 265129, "epoch": 2191} {"train_loss": -43.239524841308594, "global_step": 265130, "epoch": 2191} {"train_loss": -41.179744720458984, "global_step": 265131, "epoch": 2191} {"train_loss": -41.73200225830078, "global_step": 265132, "epoch": 2191} {"train_loss": -40.62884521484375, "global_step": 265133, "epoch": 2191} {"train_loss": -42.33928298950195, "global_step": 265134, "epoch": 2191} {"train_loss": -40.85715103149414, "global_step": 265135, "epoch": 2191} {"train_loss": -42.005043029785156, "global_step": 265136, "epoch": 2191} {"train_loss": -40.44002914428711, "global_step": 265137, "epoch": 2191} {"train_loss": -40.82159423828125, "global_step": 265138, "epoch": 2191} {"train_loss": -40.952857971191406, "global_step": 265139, "epoch": 2191} {"train_loss": -43.4193115234375, "global_step": 265140, "epoch": 2191} {"train_loss": -40.77876281738281, "global_step": 265141, "epoch": 2191} {"train_loss": -41.91682815551758, "global_step": 265142, "epoch": 2191} {"train_loss": -41.38282012939453, "global_step": 265143, "epoch": 2191} {"train_loss": -42.39262008666992, "global_step": 265144, "epoch": 2191} {"train_loss": -41.3041877746582, "global_step": 265145, "epoch": 2191} {"train_loss": -40.317604064941406, "global_step": 265146, "epoch": 2191} {"train_loss": -42.10853958129883, "global_step": 265147, "epoch": 2191} {"train_loss": -42.77913284301758, "global_step": 265148, "epoch": 2191} {"train_loss": -41.60835266113281, "global_step": 265149, "epoch": 2191} {"train_loss": -42.615657806396484, "global_step": 265150, "epoch": 2191} {"train_loss": -43.16604232788086, "global_step": 265151, "epoch": 2191} {"train_loss": -40.03361892700195, "global_step": 265152, "epoch": 2191} {"train_loss": -41.96723556518555, "global_step": 265153, "epoch": 2191} {"train_loss": -42.798336029052734, "global_step": 265154, "epoch": 2191} {"train_loss": -42.04935836791992, "global_step": 265155, "epoch": 2191} {"train_loss": -42.215484619140625, "global_step": 265156, "epoch": 2191} {"train_loss": -43.0223274230957, "global_step": 265157, "epoch": 2191} {"train_loss": -41.91396713256836, "global_step": 265158, "epoch": 2191} {"train_loss": -42.02717590332031, "global_step": 265159, "epoch": 2191} {"train_loss": -41.329345703125, "global_step": 265160, "epoch": 2191} {"train_loss": -43.16585159301758, "global_step": 265161, "epoch": 2191} {"train_loss": -41.55498123168945, "global_step": 265162, "epoch": 2191} {"train_loss": -42.897579193115234, "global_step": 265163, "epoch": 2191} {"train_loss": -42.504981994628906, "global_step": 265164, "epoch": 2191} {"train_loss": -42.50609588623047, "global_step": 265165, "epoch": 2191} {"train_loss": -43.4463005065918, "global_step": 265166, "epoch": 2191} {"train_loss": -42.43025207519531, "global_step": 265167, "epoch": 2191} {"train_loss": -42.64018630981445, "global_step": 265168, "epoch": 2191} {"train_loss": -42.7470703125, "global_step": 265169, "epoch": 2191} {"train_loss": -41.5462532043457, "global_step": 265170, "epoch": 2191} {"train_loss": -42.939849853515625, "global_step": 265171, "epoch": 2191} {"train_loss": -42.33309555053711, "global_step": 265172, "epoch": 2191} {"train_loss": -42.87031555175781, "global_step": 265173, "epoch": 2191} {"train_loss": -43.42502212524414, "global_step": 265174, "epoch": 2191} {"train_loss": -42.71957015991211, "global_step": 265175, "epoch": 2191} {"train_loss": -42.5578498840332, "global_step": 265176, "epoch": 2191} {"train_loss": -43.955223083496094, "global_step": 265177, "epoch": 2191} {"train_loss": -42.31467819213867, "global_step": 265178, "epoch": 2191} {"train_loss": -42.62934494018555, "global_step": 265179, "epoch": 2191} {"train_loss": -43.224220275878906, "global_step": 265180, "epoch": 2191} {"train_loss": -43.25545883178711, "global_step": 265181, "epoch": 2191} {"train_loss": -42.75101852416992, "global_step": 265182, "epoch": 2191} {"train_loss": -43.630184173583984, "global_step": 265183, "epoch": 2191} {"train_loss": -42.87321090698242, "global_step": 265184, "epoch": 2191} {"train_loss": -42.676490783691406, "global_step": 265185, "epoch": 2191} {"train_loss": -43.48515701293945, "global_step": 265186, "epoch": 2191} {"train_loss": -43.02745819091797, "global_step": 265187, "epoch": 2191} {"train_loss": -43.34675216674805, "global_step": 265188, "epoch": 2191} {"train_loss": -43.13840866088867, "global_step": 265189, "epoch": 2191} {"train_loss": -43.056095123291016, "global_step": 265190, "epoch": 2191} {"train_loss": -43.46759796142578, "global_step": 265191, "epoch": 2191} {"train_loss": -42.98956298828125, "global_step": 265192, "epoch": 2191} {"train_loss": -43.3415641784668, "global_step": 265193, "epoch": 2191} {"train_loss": -43.58350372314453, "global_step": 265194, "epoch": 2191} {"train_loss": -44.01812744140625, "global_step": 265195, "epoch": 2191} {"train_loss": -42.7067756652832, "global_step": 265196, "epoch": 2191} {"train_loss": -43.44399642944336, "global_step": 265197, "epoch": 2191} {"train_loss": -44.15343475341797, "global_step": 265198, "epoch": 2191} {"train_loss": -43.05743408203125, "global_step": 265199, "epoch": 2191} {"train_loss": -43.33490753173828, "global_step": 265200, "epoch": 2191} {"train_loss": -43.711517333984375, "global_step": 265201, "epoch": 2191} {"train_loss": -43.51047897338867, "global_step": 265202, "epoch": 2191} {"train_loss": -43.1904411315918, "global_step": 265203, "epoch": 2191} {"train_loss": -43.428993225097656, "global_step": 265204, "epoch": 2191} {"train_loss": -43.479583740234375, "global_step": 265205, "epoch": 2191} {"train_loss": -43.202064514160156, "global_step": 265206, "epoch": 2191} {"train_loss": -43.45588302612305, "global_step": 265207, "epoch": 2191} {"train_loss": -43.9526252746582, "global_step": 265208, "epoch": 2191} {"train_loss": -44.05050277709961, "global_step": 265209, "epoch": 2191} {"train_loss": -43.93564987182617, "global_step": 265210, "epoch": 2191} {"train_loss": -43.66685104370117, "global_step": 265211, "epoch": 2191} {"train_loss": -43.316184997558594, "global_step": 265212, "epoch": 2191} {"train_loss": -42.43339157104492, "global_step": 265213, "epoch": 2191} {"train_loss": -42.61347579956055, "global_step": 265214, "epoch": 2191} {"train_loss": -43.56820297241211, "global_step": 265215, "epoch": 2191} {"train_loss": -43.647377014160156, "global_step": 265216, "epoch": 2191} {"train_loss": -41.93696212768555, "global_step": 265217, "epoch": 2191} {"train_loss": -41.838008880615234, "global_step": 265218, "epoch": 2191} {"train_loss": -43.504554748535156, "global_step": 265219, "epoch": 2191} {"train_loss": -44.00833511352539, "global_step": 265220, "epoch": 2191} {"train_loss": -42.364986419677734, "global_step": 265221, "epoch": 2191} {"train_loss": -42.871150970458984, "global_step": 265222, "epoch": 2191} {"train_loss": -43.40938949584961, "global_step": 265223, "epoch": 2191} {"train_loss": -43.47135543823242, "global_step": 265224, "epoch": 2191} {"train_loss": -43.20649337768555, "global_step": 265225, "epoch": 2191} {"train_loss": -42.91057205200195, "global_step": 265226, "epoch": 2191} {"train_loss": -43.57320022583008, "global_step": 265227, "epoch": 2191} {"train_loss": -43.52055740356445, "global_step": 265228, "epoch": 2191} {"train_loss": -43.009185791015625, "global_step": 265229, "epoch": 2191} {"train_loss": -43.401092529296875, "global_step": 265230, "epoch": 2191} {"train_loss": -42.52282065399422, "global_step": 265231, "epoch": 2191, "val_loss": 2677452.0} {"train_loss": -42.6505241394043, "global_step": 265232, "epoch": 2192} {"train_loss": -42.397125244140625, "global_step": 265233, "epoch": 2192} {"train_loss": -42.63401412963867, "global_step": 265234, "epoch": 2192} {"train_loss": -43.912532806396484, "global_step": 265235, "epoch": 2192} {"train_loss": -42.73943328857422, "global_step": 265236, "epoch": 2192} {"train_loss": -43.795345306396484, "global_step": 265237, "epoch": 2192} {"train_loss": -43.51604080200195, "global_step": 265238, "epoch": 2192} {"train_loss": -42.74066162109375, "global_step": 265239, "epoch": 2192} {"train_loss": -42.499088287353516, "global_step": 265240, "epoch": 2192} {"train_loss": -41.70830154418945, "global_step": 265241, "epoch": 2192} {"train_loss": -42.27156448364258, "global_step": 265242, "epoch": 2192} {"train_loss": -43.097999572753906, "global_step": 265243, "epoch": 2192} {"train_loss": -40.806095123291016, "global_step": 265244, "epoch": 2192} {"train_loss": -41.51603317260742, "global_step": 265245, "epoch": 2192} {"train_loss": -41.000606536865234, "global_step": 265246, "epoch": 2192} {"train_loss": -40.9935417175293, "global_step": 265247, "epoch": 2192} {"train_loss": -40.894203186035156, "global_step": 265248, "epoch": 2192} {"train_loss": -42.217403411865234, "global_step": 265249, "epoch": 2192} {"train_loss": -41.5547981262207, "global_step": 265250, "epoch": 2192} {"train_loss": -42.21257781982422, "global_step": 265251, "epoch": 2192} {"train_loss": -40.33211898803711, "global_step": 265252, "epoch": 2192} {"train_loss": -41.74866485595703, "global_step": 265253, "epoch": 2192} {"train_loss": -40.0594596862793, "global_step": 265254, "epoch": 2192} {"train_loss": -41.49771499633789, "global_step": 265255, "epoch": 2192} {"train_loss": -41.14814758300781, "global_step": 265256, "epoch": 2192} {"train_loss": -39.984649658203125, "global_step": 265257, "epoch": 2192} {"train_loss": -42.18484115600586, "global_step": 265258, "epoch": 2192} {"train_loss": -41.450897216796875, "global_step": 265259, "epoch": 2192} {"train_loss": -42.50750732421875, "global_step": 265260, "epoch": 2192} {"train_loss": -41.74650192260742, "global_step": 265261, "epoch": 2192} {"train_loss": -41.827510833740234, "global_step": 265262, "epoch": 2192} {"train_loss": -42.55023956298828, "global_step": 265263, "epoch": 2192} {"train_loss": -41.179134368896484, "global_step": 265264, "epoch": 2192} {"train_loss": -41.5218620300293, "global_step": 265265, "epoch": 2192} {"train_loss": -42.010467529296875, "global_step": 265266, "epoch": 2192} {"train_loss": -40.96078872680664, "global_step": 265267, "epoch": 2192} {"train_loss": -42.39097213745117, "global_step": 265268, "epoch": 2192} {"train_loss": -41.406036376953125, "global_step": 265269, "epoch": 2192} {"train_loss": -42.17979431152344, "global_step": 265270, "epoch": 2192} {"train_loss": -40.15444564819336, "global_step": 265271, "epoch": 2192} {"train_loss": -42.56953811645508, "global_step": 265272, "epoch": 2192} {"train_loss": -39.33944320678711, "global_step": 265273, "epoch": 2192} {"train_loss": -42.24635314941406, "global_step": 265274, "epoch": 2192} {"train_loss": -40.50177001953125, "global_step": 265275, "epoch": 2192} {"train_loss": -39.70332717895508, "global_step": 265276, "epoch": 2192} {"train_loss": -42.07638168334961, "global_step": 265277, "epoch": 2192} {"train_loss": -38.110206604003906, "global_step": 265278, "epoch": 2192} {"train_loss": -41.781375885009766, "global_step": 265279, "epoch": 2192} {"train_loss": -38.35803985595703, "global_step": 265280, "epoch": 2192} {"train_loss": -40.0392951965332, "global_step": 265281, "epoch": 2192} {"train_loss": -38.95988082885742, "global_step": 265282, "epoch": 2192} {"train_loss": -37.84690475463867, "global_step": 265283, "epoch": 2192} {"train_loss": -40.72693634033203, "global_step": 265284, "epoch": 2192} {"train_loss": -37.83712387084961, "global_step": 265285, "epoch": 2192} {"train_loss": -41.98298263549805, "global_step": 265286, "epoch": 2192} {"train_loss": -39.07685470581055, "global_step": 265287, "epoch": 2192} {"train_loss": -40.65413284301758, "global_step": 265288, "epoch": 2192} {"train_loss": -39.0708122253418, "global_step": 265289, "epoch": 2192} {"train_loss": -41.314979553222656, "global_step": 265290, "epoch": 2192} {"train_loss": -39.415618896484375, "global_step": 265291, "epoch": 2192} {"train_loss": -40.22037124633789, "global_step": 265292, "epoch": 2192} {"train_loss": -40.60393142700195, "global_step": 265293, "epoch": 2192} {"train_loss": -40.505592346191406, "global_step": 265294, "epoch": 2192} {"train_loss": -41.704742431640625, "global_step": 265295, "epoch": 2192} {"train_loss": -41.20526885986328, "global_step": 265296, "epoch": 2192} {"train_loss": -41.071048736572266, "global_step": 265297, "epoch": 2192} {"train_loss": -41.365413665771484, "global_step": 265298, "epoch": 2192} {"train_loss": -41.08818435668945, "global_step": 265299, "epoch": 2192} {"train_loss": -41.32578659057617, "global_step": 265300, "epoch": 2192} {"train_loss": -42.60490036010742, "global_step": 265301, "epoch": 2192} {"train_loss": -41.08234786987305, "global_step": 265302, "epoch": 2192} {"train_loss": -42.757484436035156, "global_step": 265303, "epoch": 2192} {"train_loss": -40.59334945678711, "global_step": 265304, "epoch": 2192} {"train_loss": -42.93624496459961, "global_step": 265305, "epoch": 2192} {"train_loss": -41.03255844116211, "global_step": 265306, "epoch": 2192} {"train_loss": -42.37639236450195, "global_step": 265307, "epoch": 2192} {"train_loss": -42.141475677490234, "global_step": 265308, "epoch": 2192} {"train_loss": -41.77633285522461, "global_step": 265309, "epoch": 2192} {"train_loss": -42.89985656738281, "global_step": 265310, "epoch": 2192} {"train_loss": -42.58383560180664, "global_step": 265311, "epoch": 2192} {"train_loss": -42.238990783691406, "global_step": 265312, "epoch": 2192} {"train_loss": -42.319087982177734, "global_step": 265313, "epoch": 2192} {"train_loss": -41.285858154296875, "global_step": 265314, "epoch": 2192} {"train_loss": -42.26438522338867, "global_step": 265315, "epoch": 2192} {"train_loss": -42.48965835571289, "global_step": 265316, "epoch": 2192} {"train_loss": -42.09856033325195, "global_step": 265317, "epoch": 2192} {"train_loss": -43.35222244262695, "global_step": 265318, "epoch": 2192} {"train_loss": -42.172237396240234, "global_step": 265319, "epoch": 2192} {"train_loss": -43.116859436035156, "global_step": 265320, "epoch": 2192} {"train_loss": -43.047637939453125, "global_step": 265321, "epoch": 2192} {"train_loss": -42.60929489135742, "global_step": 265322, "epoch": 2192} {"train_loss": -43.4005241394043, "global_step": 265323, "epoch": 2192} {"train_loss": -42.68842697143555, "global_step": 265324, "epoch": 2192} {"train_loss": -42.740394592285156, "global_step": 265325, "epoch": 2192} {"train_loss": -43.3112678527832, "global_step": 265326, "epoch": 2192} {"train_loss": -43.13129806518555, "global_step": 265327, "epoch": 2192} {"train_loss": -43.640228271484375, "global_step": 265328, "epoch": 2192} {"train_loss": -42.60001754760742, "global_step": 265329, "epoch": 2192} {"train_loss": -43.24860763549805, "global_step": 265330, "epoch": 2192} {"train_loss": -43.468990325927734, "global_step": 265331, "epoch": 2192} {"train_loss": -43.111141204833984, "global_step": 265332, "epoch": 2192} {"train_loss": -43.72673797607422, "global_step": 265333, "epoch": 2192} {"train_loss": -43.65104293823242, "global_step": 265334, "epoch": 2192} {"train_loss": -43.53444290161133, "global_step": 265335, "epoch": 2192} {"train_loss": -43.80360794067383, "global_step": 265336, "epoch": 2192} {"train_loss": -43.541961669921875, "global_step": 265337, "epoch": 2192} {"train_loss": -43.833370208740234, "global_step": 265338, "epoch": 2192} {"train_loss": -43.44065475463867, "global_step": 265339, "epoch": 2192} {"train_loss": -43.782066345214844, "global_step": 265340, "epoch": 2192} {"train_loss": -43.587318420410156, "global_step": 265341, "epoch": 2192} {"train_loss": -43.791954040527344, "global_step": 265342, "epoch": 2192} {"train_loss": -43.414794921875, "global_step": 265343, "epoch": 2192} {"train_loss": -43.621578216552734, "global_step": 265344, "epoch": 2192} {"train_loss": -43.65191650390625, "global_step": 265345, "epoch": 2192} {"train_loss": -43.5391845703125, "global_step": 265346, "epoch": 2192} {"train_loss": -43.85084915161133, "global_step": 265347, "epoch": 2192} {"train_loss": -43.877593994140625, "global_step": 265348, "epoch": 2192} {"train_loss": -43.48894119262695, "global_step": 265349, "epoch": 2192} {"train_loss": -43.82415771484375, "global_step": 265350, "epoch": 2192} {"train_loss": -43.601661682128906, "global_step": 265351, "epoch": 2192} {"train_loss": -41.97492744508854, "global_step": 265352, "epoch": 2192, "val_loss": 2668422.25} {"train_loss": -43.899574279785156, "global_step": 265353, "epoch": 2193} {"train_loss": -44.15147018432617, "global_step": 265354, "epoch": 2193} {"train_loss": -44.143672943115234, "global_step": 265355, "epoch": 2193} {"train_loss": -44.4674072265625, "global_step": 265356, "epoch": 2193} {"train_loss": -44.20850372314453, "global_step": 265357, "epoch": 2193} {"train_loss": -44.21662521362305, "global_step": 265358, "epoch": 2193} {"train_loss": -44.27040481567383, "global_step": 265359, "epoch": 2193} {"train_loss": -43.80361557006836, "global_step": 265360, "epoch": 2193} {"train_loss": -43.87919235229492, "global_step": 265361, "epoch": 2193} {"train_loss": -44.39036560058594, "global_step": 265362, "epoch": 2193} {"train_loss": -43.68363952636719, "global_step": 265363, "epoch": 2193} {"train_loss": -44.33030700683594, "global_step": 265364, "epoch": 2193} {"train_loss": -44.250038146972656, "global_step": 265365, "epoch": 2193} {"train_loss": -43.4283447265625, "global_step": 265366, "epoch": 2193} {"train_loss": -44.154842376708984, "global_step": 265367, "epoch": 2193} {"train_loss": -43.25577926635742, "global_step": 265368, "epoch": 2193} {"train_loss": -43.79240036010742, "global_step": 265369, "epoch": 2193} {"train_loss": -44.24506378173828, "global_step": 265370, "epoch": 2193} {"train_loss": -43.2239990234375, "global_step": 265371, "epoch": 2193} {"train_loss": -43.4799919128418, "global_step": 265372, "epoch": 2193} {"train_loss": -43.7779541015625, "global_step": 265373, "epoch": 2193} {"train_loss": -43.85320281982422, "global_step": 265374, "epoch": 2193} {"train_loss": -43.13505554199219, "global_step": 265375, "epoch": 2193} {"train_loss": -44.255531311035156, "global_step": 265376, "epoch": 2193} {"train_loss": -43.767234802246094, "global_step": 265377, "epoch": 2193} {"train_loss": -43.607032775878906, "global_step": 265378, "epoch": 2193} {"train_loss": -43.62213897705078, "global_step": 265379, "epoch": 2193} {"train_loss": -43.849796295166016, "global_step": 265380, "epoch": 2193} {"train_loss": -42.8615837097168, "global_step": 265381, "epoch": 2193} {"train_loss": -44.412925720214844, "global_step": 265382, "epoch": 2193} {"train_loss": -43.877262115478516, "global_step": 265383, "epoch": 2193} {"train_loss": -44.12611770629883, "global_step": 265384, "epoch": 2193} {"train_loss": -43.8651237487793, "global_step": 265385, "epoch": 2193} {"train_loss": -43.61262893676758, "global_step": 265386, "epoch": 2193} {"train_loss": -43.9456672668457, "global_step": 265387, "epoch": 2193} {"train_loss": -44.355194091796875, "global_step": 265388, "epoch": 2193} {"train_loss": -44.1328239440918, "global_step": 265389, "epoch": 2193} {"train_loss": -44.587215423583984, "global_step": 265390, "epoch": 2193} {"train_loss": -44.01296615600586, "global_step": 265391, "epoch": 2193} {"train_loss": -43.803077697753906, "global_step": 265392, "epoch": 2193} {"train_loss": -44.392852783203125, "global_step": 265393, "epoch": 2193} {"train_loss": -44.690425872802734, "global_step": 265394, "epoch": 2193} {"train_loss": -44.126949310302734, "global_step": 265395, "epoch": 2193} {"train_loss": -44.11366653442383, "global_step": 265396, "epoch": 2193} {"train_loss": -44.168331146240234, "global_step": 265397, "epoch": 2193} {"train_loss": -43.900264739990234, "global_step": 265398, "epoch": 2193} {"train_loss": -43.017696380615234, "global_step": 265399, "epoch": 2193} {"train_loss": -43.22200393676758, "global_step": 265400, "epoch": 2193} {"train_loss": -43.3448371887207, "global_step": 265401, "epoch": 2193} {"train_loss": -43.63608932495117, "global_step": 265402, "epoch": 2193} {"train_loss": -43.2459831237793, "global_step": 265403, "epoch": 2193} {"train_loss": -41.53425216674805, "global_step": 265404, "epoch": 2193} {"train_loss": -42.90855026245117, "global_step": 265405, "epoch": 2193} {"train_loss": -42.15332794189453, "global_step": 265406, "epoch": 2193} {"train_loss": -41.593170166015625, "global_step": 265407, "epoch": 2193} {"train_loss": -42.371307373046875, "global_step": 265408, "epoch": 2193} {"train_loss": -43.19722366333008, "global_step": 265409, "epoch": 2193} {"train_loss": -43.5314826965332, "global_step": 265410, "epoch": 2193} {"train_loss": -42.45254135131836, "global_step": 265411, "epoch": 2193} {"train_loss": -42.6320915222168, "global_step": 265412, "epoch": 2193} {"train_loss": -43.177852630615234, "global_step": 265413, "epoch": 2193} {"train_loss": -42.201045989990234, "global_step": 265414, "epoch": 2193} {"train_loss": -42.192264556884766, "global_step": 265415, "epoch": 2193} {"train_loss": -41.58845901489258, "global_step": 265416, "epoch": 2193} {"train_loss": -39.94289779663086, "global_step": 265417, "epoch": 2193} {"train_loss": -42.528438568115234, "global_step": 265418, "epoch": 2193} {"train_loss": -42.18046188354492, "global_step": 265419, "epoch": 2193} {"train_loss": -40.931461334228516, "global_step": 265420, "epoch": 2193} {"train_loss": -40.97856140136719, "global_step": 265421, "epoch": 2193} {"train_loss": -41.52751541137695, "global_step": 265422, "epoch": 2193} {"train_loss": -42.44318389892578, "global_step": 265423, "epoch": 2193} {"train_loss": -43.24520492553711, "global_step": 265424, "epoch": 2193} {"train_loss": -43.25080108642578, "global_step": 265425, "epoch": 2193} {"train_loss": -42.63025665283203, "global_step": 265426, "epoch": 2193} {"train_loss": -42.402732849121094, "global_step": 265427, "epoch": 2193} {"train_loss": -43.339759826660156, "global_step": 265428, "epoch": 2193} {"train_loss": -42.9676513671875, "global_step": 265429, "epoch": 2193} {"train_loss": -42.373634338378906, "global_step": 265430, "epoch": 2193} {"train_loss": -41.94185256958008, "global_step": 265431, "epoch": 2193} {"train_loss": -42.37632751464844, "global_step": 265432, "epoch": 2193} {"train_loss": -42.89519119262695, "global_step": 265433, "epoch": 2193} {"train_loss": -42.95664596557617, "global_step": 265434, "epoch": 2193} {"train_loss": -42.0366325378418, "global_step": 265435, "epoch": 2193} {"train_loss": -42.779212951660156, "global_step": 265436, "epoch": 2193} {"train_loss": -43.460243225097656, "global_step": 265437, "epoch": 2193} {"train_loss": -42.764381408691406, "global_step": 265438, "epoch": 2193} {"train_loss": -42.91896057128906, "global_step": 265439, "epoch": 2193} {"train_loss": -43.78692626953125, "global_step": 265440, "epoch": 2193} {"train_loss": -43.108642578125, "global_step": 265441, "epoch": 2193} {"train_loss": -41.71340560913086, "global_step": 265442, "epoch": 2193} {"train_loss": -42.80341720581055, "global_step": 265443, "epoch": 2193} {"train_loss": -43.82110595703125, "global_step": 265444, "epoch": 2193} {"train_loss": -43.01792526245117, "global_step": 265445, "epoch": 2193} {"train_loss": -43.31574630737305, "global_step": 265446, "epoch": 2193} {"train_loss": -43.06034469604492, "global_step": 265447, "epoch": 2193} {"train_loss": -42.62632369995117, "global_step": 265448, "epoch": 2193} {"train_loss": -42.66887664794922, "global_step": 265449, "epoch": 2193} {"train_loss": -43.85056686401367, "global_step": 265450, "epoch": 2193} {"train_loss": -43.566925048828125, "global_step": 265451, "epoch": 2193} {"train_loss": -42.87343978881836, "global_step": 265452, "epoch": 2193} {"train_loss": -43.535560607910156, "global_step": 265453, "epoch": 2193} {"train_loss": -43.6638298034668, "global_step": 265454, "epoch": 2193} {"train_loss": -43.61140060424805, "global_step": 265455, "epoch": 2193} {"train_loss": -42.50681686401367, "global_step": 265456, "epoch": 2193} {"train_loss": -43.64138412475586, "global_step": 265457, "epoch": 2193} {"train_loss": -43.82142639160156, "global_step": 265458, "epoch": 2193} {"train_loss": -42.26206970214844, "global_step": 265459, "epoch": 2193} {"train_loss": -42.307186126708984, "global_step": 265460, "epoch": 2193} {"train_loss": -43.017818450927734, "global_step": 265461, "epoch": 2193} {"train_loss": -43.88045120239258, "global_step": 265462, "epoch": 2193} {"train_loss": -42.87626266479492, "global_step": 265463, "epoch": 2193} {"train_loss": -43.48817825317383, "global_step": 265464, "epoch": 2193} {"train_loss": -43.65243148803711, "global_step": 265465, "epoch": 2193} {"train_loss": -43.79994583129883, "global_step": 265466, "epoch": 2193} {"train_loss": -42.44916534423828, "global_step": 265467, "epoch": 2193} {"train_loss": -42.702083587646484, "global_step": 265468, "epoch": 2193} {"train_loss": -43.400306701660156, "global_step": 265469, "epoch": 2193} {"train_loss": -42.141178131103516, "global_step": 265470, "epoch": 2193} {"train_loss": -40.76149368286133, "global_step": 265471, "epoch": 2193} {"train_loss": -42.4139404296875, "global_step": 265472, "epoch": 2193} {"train_loss": -43.21132423463932, "global_step": 265473, "epoch": 2193, "val_loss": 2706088.75} {"train_loss": -42.2242317199707, "global_step": 265474, "epoch": 2194} {"train_loss": -42.87446212768555, "global_step": 265475, "epoch": 2194} {"train_loss": -42.07155227661133, "global_step": 265476, "epoch": 2194} {"train_loss": -42.009971618652344, "global_step": 265477, "epoch": 2194} {"train_loss": -43.21645736694336, "global_step": 265478, "epoch": 2194} {"train_loss": -42.403045654296875, "global_step": 265479, "epoch": 2194} {"train_loss": -42.43433380126953, "global_step": 265480, "epoch": 2194} {"train_loss": -43.86500930786133, "global_step": 265481, "epoch": 2194} {"train_loss": -40.79154586791992, "global_step": 265482, "epoch": 2194} {"train_loss": -42.58698654174805, "global_step": 265483, "epoch": 2194} {"train_loss": -42.562801361083984, "global_step": 265484, "epoch": 2194} {"train_loss": -41.889076232910156, "global_step": 265485, "epoch": 2194} {"train_loss": -43.150386810302734, "global_step": 265486, "epoch": 2194} {"train_loss": -43.35122299194336, "global_step": 265487, "epoch": 2194} {"train_loss": -42.76856231689453, "global_step": 265488, "epoch": 2194} {"train_loss": -43.35417938232422, "global_step": 265489, "epoch": 2194} {"train_loss": -42.84633255004883, "global_step": 265490, "epoch": 2194} {"train_loss": -41.72336959838867, "global_step": 265491, "epoch": 2194} {"train_loss": -43.74080276489258, "global_step": 265492, "epoch": 2194} {"train_loss": -42.148681640625, "global_step": 265493, "epoch": 2194} {"train_loss": -42.40232849121094, "global_step": 265494, "epoch": 2194} {"train_loss": -43.56015396118164, "global_step": 265495, "epoch": 2194} {"train_loss": -42.54304885864258, "global_step": 265496, "epoch": 2194} {"train_loss": -42.81929397583008, "global_step": 265497, "epoch": 2194} {"train_loss": -42.952972412109375, "global_step": 265498, "epoch": 2194} {"train_loss": -42.17051315307617, "global_step": 265499, "epoch": 2194} {"train_loss": -41.879600524902344, "global_step": 265500, "epoch": 2194} {"train_loss": -42.8701286315918, "global_step": 265501, "epoch": 2194} {"train_loss": -43.52313232421875, "global_step": 265502, "epoch": 2194} {"train_loss": -42.18173599243164, "global_step": 265503, "epoch": 2194} {"train_loss": -42.25685501098633, "global_step": 265504, "epoch": 2194} {"train_loss": -42.76914596557617, "global_step": 265505, "epoch": 2194} {"train_loss": -42.63459396362305, "global_step": 265506, "epoch": 2194} {"train_loss": -43.40961456298828, "global_step": 265507, "epoch": 2194} {"train_loss": -42.977474212646484, "global_step": 265508, "epoch": 2194} {"train_loss": -43.73112869262695, "global_step": 265509, "epoch": 2194} {"train_loss": -43.64651107788086, "global_step": 265510, "epoch": 2194} {"train_loss": -43.555057525634766, "global_step": 265511, "epoch": 2194} {"train_loss": -43.913387298583984, "global_step": 265512, "epoch": 2194} {"train_loss": -44.020965576171875, "global_step": 265513, "epoch": 2194} {"train_loss": -43.8258171081543, "global_step": 265514, "epoch": 2194} {"train_loss": -43.84428024291992, "global_step": 265515, "epoch": 2194} {"train_loss": -43.99036407470703, "global_step": 265516, "epoch": 2194} {"train_loss": -43.72186279296875, "global_step": 265517, "epoch": 2194} {"train_loss": -43.15156173706055, "global_step": 265518, "epoch": 2194} {"train_loss": -44.13383865356445, "global_step": 265519, "epoch": 2194} {"train_loss": -43.70730209350586, "global_step": 265520, "epoch": 2194} {"train_loss": -43.60289001464844, "global_step": 265521, "epoch": 2194} {"train_loss": -44.092689514160156, "global_step": 265522, "epoch": 2194} {"train_loss": -43.8333740234375, "global_step": 265523, "epoch": 2194} {"train_loss": -43.41288375854492, "global_step": 265524, "epoch": 2194} {"train_loss": -43.902706146240234, "global_step": 265525, "epoch": 2194} {"train_loss": -43.28171920776367, "global_step": 265526, "epoch": 2194} {"train_loss": -43.54356384277344, "global_step": 265527, "epoch": 2194} {"train_loss": -43.57045364379883, "global_step": 265528, "epoch": 2194} {"train_loss": -42.492122650146484, "global_step": 265529, "epoch": 2194} {"train_loss": -42.20327377319336, "global_step": 265530, "epoch": 2194} {"train_loss": -43.88698196411133, "global_step": 265531, "epoch": 2194} {"train_loss": -43.734920501708984, "global_step": 265532, "epoch": 2194} {"train_loss": -43.41350555419922, "global_step": 265533, "epoch": 2194} {"train_loss": -43.29464340209961, "global_step": 265534, "epoch": 2194} {"train_loss": -43.7269172668457, "global_step": 265535, "epoch": 2194} {"train_loss": -43.71733856201172, "global_step": 265536, "epoch": 2194} {"train_loss": -42.86770248413086, "global_step": 265537, "epoch": 2194} {"train_loss": -41.90351104736328, "global_step": 265538, "epoch": 2194} {"train_loss": -42.7158088684082, "global_step": 265539, "epoch": 2194} {"train_loss": -44.08171463012695, "global_step": 265540, "epoch": 2194} {"train_loss": -43.27207565307617, "global_step": 265541, "epoch": 2194} {"train_loss": -43.22626876831055, "global_step": 265542, "epoch": 2194} {"train_loss": -43.85207748413086, "global_step": 265543, "epoch": 2194} {"train_loss": -43.741722106933594, "global_step": 265544, "epoch": 2194} {"train_loss": -43.897274017333984, "global_step": 265545, "epoch": 2194} {"train_loss": -43.82857894897461, "global_step": 265546, "epoch": 2194} {"train_loss": -43.65871047973633, "global_step": 265547, "epoch": 2194} {"train_loss": -43.7477912902832, "global_step": 265548, "epoch": 2194} {"train_loss": -43.76830291748047, "global_step": 265549, "epoch": 2194} {"train_loss": -43.51560974121094, "global_step": 265550, "epoch": 2194} {"train_loss": -43.33189010620117, "global_step": 265551, "epoch": 2194} {"train_loss": -43.872535705566406, "global_step": 265552, "epoch": 2194} {"train_loss": -43.90400314331055, "global_step": 265553, "epoch": 2194} {"train_loss": -43.793270111083984, "global_step": 265554, "epoch": 2194} {"train_loss": -43.836822509765625, "global_step": 265555, "epoch": 2194} {"train_loss": -43.25516128540039, "global_step": 265556, "epoch": 2194} {"train_loss": -43.751708984375, "global_step": 265557, "epoch": 2194} {"train_loss": -43.9432373046875, "global_step": 265558, "epoch": 2194} {"train_loss": -43.45100021362305, "global_step": 265559, "epoch": 2194} {"train_loss": -43.86639404296875, "global_step": 265560, "epoch": 2194} {"train_loss": -42.89520263671875, "global_step": 265561, "epoch": 2194} {"train_loss": -41.922027587890625, "global_step": 265562, "epoch": 2194} {"train_loss": -42.1342887878418, "global_step": 265563, "epoch": 2194} {"train_loss": -44.15989303588867, "global_step": 265564, "epoch": 2194} {"train_loss": -40.7095947265625, "global_step": 265565, "epoch": 2194} {"train_loss": -43.699493408203125, "global_step": 265566, "epoch": 2194} {"train_loss": -42.92644119262695, "global_step": 265567, "epoch": 2194} {"train_loss": -40.75541305541992, "global_step": 265568, "epoch": 2194} {"train_loss": -43.28768539428711, "global_step": 265569, "epoch": 2194} {"train_loss": -41.931549072265625, "global_step": 265570, "epoch": 2194} {"train_loss": -40.389495849609375, "global_step": 265571, "epoch": 2194} {"train_loss": -43.07136154174805, "global_step": 265572, "epoch": 2194} {"train_loss": -39.121315002441406, "global_step": 265573, "epoch": 2194} {"train_loss": -42.86715316772461, "global_step": 265574, "epoch": 2194} {"train_loss": -40.98942947387695, "global_step": 265575, "epoch": 2194} {"train_loss": -41.59070587158203, "global_step": 265576, "epoch": 2194} {"train_loss": -41.333919525146484, "global_step": 265577, "epoch": 2194} {"train_loss": -40.3916130065918, "global_step": 265578, "epoch": 2194} {"train_loss": -40.939178466796875, "global_step": 265579, "epoch": 2194} {"train_loss": -42.221351623535156, "global_step": 265580, "epoch": 2194} {"train_loss": -42.318660736083984, "global_step": 265581, "epoch": 2194} {"train_loss": -41.966346740722656, "global_step": 265582, "epoch": 2194} {"train_loss": -41.960811614990234, "global_step": 265583, "epoch": 2194} {"train_loss": -41.42779541015625, "global_step": 265584, "epoch": 2194} {"train_loss": -42.089900970458984, "global_step": 265585, "epoch": 2194} {"train_loss": -41.873291015625, "global_step": 265586, "epoch": 2194} {"train_loss": -42.4351921081543, "global_step": 265587, "epoch": 2194} {"train_loss": -42.92251205444336, "global_step": 265588, "epoch": 2194} {"train_loss": -41.97475814819336, "global_step": 265589, "epoch": 2194} {"train_loss": -42.38014221191406, "global_step": 265590, "epoch": 2194} {"train_loss": -41.88570022583008, "global_step": 265591, "epoch": 2194} {"train_loss": -42.42803192138672, "global_step": 265592, "epoch": 2194} {"train_loss": -42.08811569213867, "global_step": 265593, "epoch": 2194} {"train_loss": -42.8657435582689, "global_step": 265594, "epoch": 2194, "val_loss": 2638607.0} {"train_loss": -41.94157791137695, "global_step": 265595, "epoch": 2195} {"train_loss": -43.03133010864258, "global_step": 265596, "epoch": 2195} {"train_loss": -41.39451217651367, "global_step": 265597, "epoch": 2195} {"train_loss": -43.22683334350586, "global_step": 265598, "epoch": 2195} {"train_loss": -42.07805252075195, "global_step": 265599, "epoch": 2195} {"train_loss": -42.640113830566406, "global_step": 265600, "epoch": 2195} {"train_loss": -42.569366455078125, "global_step": 265601, "epoch": 2195} {"train_loss": -42.58970260620117, "global_step": 265602, "epoch": 2195} {"train_loss": -42.574642181396484, "global_step": 265603, "epoch": 2195} {"train_loss": -42.35895538330078, "global_step": 265604, "epoch": 2195} {"train_loss": -42.95486068725586, "global_step": 265605, "epoch": 2195} {"train_loss": -41.95658493041992, "global_step": 265606, "epoch": 2195} {"train_loss": -43.46173858642578, "global_step": 265607, "epoch": 2195} {"train_loss": -41.9390754699707, "global_step": 265608, "epoch": 2195} {"train_loss": -43.641029357910156, "global_step": 265609, "epoch": 2195} {"train_loss": -42.018821716308594, "global_step": 265610, "epoch": 2195} {"train_loss": -42.97391891479492, "global_step": 265611, "epoch": 2195} {"train_loss": -42.44902420043945, "global_step": 265612, "epoch": 2195} {"train_loss": -42.7637825012207, "global_step": 265613, "epoch": 2195} {"train_loss": -42.96328353881836, "global_step": 265614, "epoch": 2195} {"train_loss": -42.82133102416992, "global_step": 265615, "epoch": 2195} {"train_loss": -42.79423141479492, "global_step": 265616, "epoch": 2195} {"train_loss": -43.145599365234375, "global_step": 265617, "epoch": 2195} {"train_loss": -43.097164154052734, "global_step": 265618, "epoch": 2195} {"train_loss": -42.770668029785156, "global_step": 265619, "epoch": 2195} {"train_loss": -43.20846176147461, "global_step": 265620, "epoch": 2195} {"train_loss": -43.76546859741211, "global_step": 265621, "epoch": 2195} {"train_loss": -43.71478271484375, "global_step": 265622, "epoch": 2195} {"train_loss": -43.1229248046875, "global_step": 265623, "epoch": 2195} {"train_loss": -43.48565673828125, "global_step": 265624, "epoch": 2195} {"train_loss": -43.571754455566406, "global_step": 265625, "epoch": 2195} {"train_loss": -41.770381927490234, "global_step": 265626, "epoch": 2195} {"train_loss": -41.9107551574707, "global_step": 265627, "epoch": 2195} {"train_loss": -42.46090316772461, "global_step": 265628, "epoch": 2195} {"train_loss": -44.04903030395508, "global_step": 265629, "epoch": 2195} {"train_loss": -42.8327522277832, "global_step": 265630, "epoch": 2195} {"train_loss": -43.1991081237793, "global_step": 265631, "epoch": 2195} {"train_loss": -43.80213165283203, "global_step": 265632, "epoch": 2195} {"train_loss": -42.925716400146484, "global_step": 265633, "epoch": 2195} {"train_loss": -42.619789123535156, "global_step": 265634, "epoch": 2195} {"train_loss": -43.28569412231445, "global_step": 265635, "epoch": 2195} {"train_loss": -43.353084564208984, "global_step": 265636, "epoch": 2195} {"train_loss": -43.565765380859375, "global_step": 265637, "epoch": 2195} {"train_loss": -43.821258544921875, "global_step": 265638, "epoch": 2195} {"train_loss": -43.872257232666016, "global_step": 265639, "epoch": 2195} {"train_loss": -44.17010498046875, "global_step": 265640, "epoch": 2195} {"train_loss": -44.305267333984375, "global_step": 265641, "epoch": 2195} {"train_loss": -43.6256217956543, "global_step": 265642, "epoch": 2195} {"train_loss": -43.82342529296875, "global_step": 265643, "epoch": 2195} {"train_loss": -44.270599365234375, "global_step": 265644, "epoch": 2195} {"train_loss": -44.52130126953125, "global_step": 265645, "epoch": 2195} {"train_loss": -43.384830474853516, "global_step": 265646, "epoch": 2195} {"train_loss": -43.496429443359375, "global_step": 265647, "epoch": 2195} {"train_loss": -44.2274055480957, "global_step": 265648, "epoch": 2195} {"train_loss": -44.200557708740234, "global_step": 265649, "epoch": 2195} {"train_loss": -44.32151794433594, "global_step": 265650, "epoch": 2195} {"train_loss": -44.517024993896484, "global_step": 265651, "epoch": 2195} {"train_loss": -43.891231536865234, "global_step": 265652, "epoch": 2195} {"train_loss": -43.96828842163086, "global_step": 265653, "epoch": 2195} {"train_loss": -44.83074188232422, "global_step": 265654, "epoch": 2195} {"train_loss": -43.1599006652832, "global_step": 265655, "epoch": 2195} {"train_loss": -44.24920654296875, "global_step": 265656, "epoch": 2195} {"train_loss": -43.945411682128906, "global_step": 265657, "epoch": 2195} {"train_loss": -43.13499069213867, "global_step": 265658, "epoch": 2195} {"train_loss": -43.878631591796875, "global_step": 265659, "epoch": 2195} {"train_loss": -43.74695587158203, "global_step": 265660, "epoch": 2195} {"train_loss": -43.77997970581055, "global_step": 265661, "epoch": 2195} {"train_loss": -44.13288116455078, "global_step": 265662, "epoch": 2195} {"train_loss": -43.67922592163086, "global_step": 265663, "epoch": 2195} {"train_loss": -44.169830322265625, "global_step": 265664, "epoch": 2195} {"train_loss": -43.93317794799805, "global_step": 265665, "epoch": 2195} {"train_loss": -43.890541076660156, "global_step": 265666, "epoch": 2195} {"train_loss": -44.3358154296875, "global_step": 265667, "epoch": 2195} {"train_loss": -44.4463996887207, "global_step": 265668, "epoch": 2195} {"train_loss": -43.83320617675781, "global_step": 265669, "epoch": 2195} {"train_loss": -44.41816711425781, "global_step": 265670, "epoch": 2195} {"train_loss": -44.069129943847656, "global_step": 265671, "epoch": 2195} {"train_loss": -44.13741683959961, "global_step": 265672, "epoch": 2195} {"train_loss": -43.46969223022461, "global_step": 265673, "epoch": 2195} {"train_loss": -43.8466682434082, "global_step": 265674, "epoch": 2195} {"train_loss": -43.8538703918457, "global_step": 265675, "epoch": 2195} {"train_loss": -43.679840087890625, "global_step": 265676, "epoch": 2195} {"train_loss": -42.790584564208984, "global_step": 265677, "epoch": 2195} {"train_loss": -43.251277923583984, "global_step": 265678, "epoch": 2195} {"train_loss": -43.94023895263672, "global_step": 265679, "epoch": 2195} {"train_loss": -43.77341842651367, "global_step": 265680, "epoch": 2195} {"train_loss": -44.26611328125, "global_step": 265681, "epoch": 2195} {"train_loss": -43.9159049987793, "global_step": 265682, "epoch": 2195} {"train_loss": -44.29616165161133, "global_step": 265683, "epoch": 2195} {"train_loss": -43.696468353271484, "global_step": 265684, "epoch": 2195} {"train_loss": -43.30329132080078, "global_step": 265685, "epoch": 2195} {"train_loss": -43.171871185302734, "global_step": 265686, "epoch": 2195} {"train_loss": -43.90483474731445, "global_step": 265687, "epoch": 2195} {"train_loss": -42.35871505737305, "global_step": 265688, "epoch": 2195} {"train_loss": -43.094661712646484, "global_step": 265689, "epoch": 2195} {"train_loss": -42.098533630371094, "global_step": 265690, "epoch": 2195} {"train_loss": -42.01921463012695, "global_step": 265691, "epoch": 2195} {"train_loss": -44.03335189819336, "global_step": 265692, "epoch": 2195} {"train_loss": -43.45798873901367, "global_step": 265693, "epoch": 2195} {"train_loss": -43.110233306884766, "global_step": 265694, "epoch": 2195} {"train_loss": -41.32670974731445, "global_step": 265695, "epoch": 2195} {"train_loss": -41.19417190551758, "global_step": 265696, "epoch": 2195} {"train_loss": -42.35969543457031, "global_step": 265697, "epoch": 2195} {"train_loss": -42.7507438659668, "global_step": 265698, "epoch": 2195} {"train_loss": -42.99335479736328, "global_step": 265699, "epoch": 2195} {"train_loss": -42.75050735473633, "global_step": 265700, "epoch": 2195} {"train_loss": -42.58381271362305, "global_step": 265701, "epoch": 2195} {"train_loss": -40.86297607421875, "global_step": 265702, "epoch": 2195} {"train_loss": -41.4683952331543, "global_step": 265703, "epoch": 2195} {"train_loss": -42.379024505615234, "global_step": 265704, "epoch": 2195} {"train_loss": -43.60061264038086, "global_step": 265705, "epoch": 2195} {"train_loss": -43.35649490356445, "global_step": 265706, "epoch": 2195} {"train_loss": -43.45703125, "global_step": 265707, "epoch": 2195} {"train_loss": -43.18395233154297, "global_step": 265708, "epoch": 2195} {"train_loss": -41.30558395385742, "global_step": 265709, "epoch": 2195} {"train_loss": -43.23922348022461, "global_step": 265710, "epoch": 2195} {"train_loss": -42.9028205871582, "global_step": 265711, "epoch": 2195} {"train_loss": -42.49135971069336, "global_step": 265712, "epoch": 2195} {"train_loss": -41.333168029785156, "global_step": 265713, "epoch": 2195} {"train_loss": -42.735267639160156, "global_step": 265714, "epoch": 2195} {"train_loss": -43.220871696787434, "global_step": 265715, "epoch": 2195, "val_loss": 2625972.75} {"train_loss": -42.36051559448242, "global_step": 265716, "epoch": 2196} {"train_loss": -41.331966400146484, "global_step": 265717, "epoch": 2196} {"train_loss": -43.18746566772461, "global_step": 265718, "epoch": 2196} {"train_loss": -41.551822662353516, "global_step": 265719, "epoch": 2196} {"train_loss": -42.6337776184082, "global_step": 265720, "epoch": 2196} {"train_loss": -42.91239929199219, "global_step": 265721, "epoch": 2196} {"train_loss": -42.4217414855957, "global_step": 265722, "epoch": 2196} {"train_loss": -40.65141677856445, "global_step": 265723, "epoch": 2196} {"train_loss": -42.53841781616211, "global_step": 265724, "epoch": 2196} {"train_loss": -42.1923942565918, "global_step": 265725, "epoch": 2196} {"train_loss": -41.957454681396484, "global_step": 265726, "epoch": 2196} {"train_loss": -43.15130615234375, "global_step": 265727, "epoch": 2196} {"train_loss": -39.87504577636719, "global_step": 265728, "epoch": 2196} {"train_loss": -41.492340087890625, "global_step": 265729, "epoch": 2196} {"train_loss": -42.978431701660156, "global_step": 265730, "epoch": 2196} {"train_loss": -42.01873779296875, "global_step": 265731, "epoch": 2196} {"train_loss": -42.86554718017578, "global_step": 265732, "epoch": 2196} {"train_loss": -43.51434326171875, "global_step": 265733, "epoch": 2196} {"train_loss": -43.04763412475586, "global_step": 265734, "epoch": 2196} {"train_loss": -43.14545440673828, "global_step": 265735, "epoch": 2196} {"train_loss": -43.572975158691406, "global_step": 265736, "epoch": 2196} {"train_loss": -43.2924690246582, "global_step": 265737, "epoch": 2196} {"train_loss": -43.185237884521484, "global_step": 265738, "epoch": 2196} {"train_loss": -43.880958557128906, "global_step": 265739, "epoch": 2196} {"train_loss": -42.824214935302734, "global_step": 265740, "epoch": 2196} {"train_loss": -43.2719841003418, "global_step": 265741, "epoch": 2196} {"train_loss": -43.218502044677734, "global_step": 265742, "epoch": 2196} {"train_loss": -42.030738830566406, "global_step": 265743, "epoch": 2196} {"train_loss": -43.43574142456055, "global_step": 265744, "epoch": 2196} {"train_loss": -42.583675384521484, "global_step": 265745, "epoch": 2196} {"train_loss": -42.810279846191406, "global_step": 265746, "epoch": 2196} {"train_loss": -42.9721565246582, "global_step": 265747, "epoch": 2196} {"train_loss": -43.410221099853516, "global_step": 265748, "epoch": 2196} {"train_loss": -43.3117790222168, "global_step": 265749, "epoch": 2196} {"train_loss": -43.462196350097656, "global_step": 265750, "epoch": 2196} {"train_loss": -43.28950119018555, "global_step": 265751, "epoch": 2196} {"train_loss": -43.0594367980957, "global_step": 265752, "epoch": 2196} {"train_loss": -43.51612091064453, "global_step": 265753, "epoch": 2196} {"train_loss": -42.70636749267578, "global_step": 265754, "epoch": 2196} {"train_loss": -43.66457748413086, "global_step": 265755, "epoch": 2196} {"train_loss": -43.343570709228516, "global_step": 265756, "epoch": 2196} {"train_loss": -43.037044525146484, "global_step": 265757, "epoch": 2196} {"train_loss": -42.841087341308594, "global_step": 265758, "epoch": 2196} {"train_loss": -43.11614990234375, "global_step": 265759, "epoch": 2196} {"train_loss": -43.59554672241211, "global_step": 265760, "epoch": 2196} {"train_loss": -42.96379470825195, "global_step": 265761, "epoch": 2196} {"train_loss": -43.270530700683594, "global_step": 265762, "epoch": 2196} {"train_loss": -43.28921127319336, "global_step": 265763, "epoch": 2196} {"train_loss": -43.12119674682617, "global_step": 265764, "epoch": 2196} {"train_loss": -43.6711540222168, "global_step": 265765, "epoch": 2196} {"train_loss": -42.863704681396484, "global_step": 265766, "epoch": 2196} {"train_loss": -42.829498291015625, "global_step": 265767, "epoch": 2196} {"train_loss": -43.5682258605957, "global_step": 265768, "epoch": 2196} {"train_loss": -43.757930755615234, "global_step": 265769, "epoch": 2196} {"train_loss": -43.986263275146484, "global_step": 265770, "epoch": 2196} {"train_loss": -43.9058837890625, "global_step": 265771, "epoch": 2196} {"train_loss": -43.74868392944336, "global_step": 265772, "epoch": 2196} {"train_loss": -43.94423294067383, "global_step": 265773, "epoch": 2196} {"train_loss": -43.291481018066406, "global_step": 265774, "epoch": 2196} {"train_loss": -43.82998275756836, "global_step": 265775, "epoch": 2196} {"train_loss": -43.31520080566406, "global_step": 265776, "epoch": 2196} {"train_loss": -43.69876480102539, "global_step": 265777, "epoch": 2196} {"train_loss": -43.82715606689453, "global_step": 265778, "epoch": 2196} {"train_loss": -44.013282775878906, "global_step": 265779, "epoch": 2196} {"train_loss": -43.84000778198242, "global_step": 265780, "epoch": 2196} {"train_loss": -43.48311233520508, "global_step": 265781, "epoch": 2196} {"train_loss": -42.40460968017578, "global_step": 265782, "epoch": 2196} {"train_loss": -43.111690521240234, "global_step": 265783, "epoch": 2196} {"train_loss": -43.65096664428711, "global_step": 265784, "epoch": 2196} {"train_loss": -43.97919464111328, "global_step": 265785, "epoch": 2196} {"train_loss": -44.20943069458008, "global_step": 265786, "epoch": 2196} {"train_loss": -43.950862884521484, "global_step": 265787, "epoch": 2196} {"train_loss": -44.081573486328125, "global_step": 265788, "epoch": 2196} {"train_loss": -43.886051177978516, "global_step": 265789, "epoch": 2196} {"train_loss": -43.20382308959961, "global_step": 265790, "epoch": 2196} {"train_loss": -43.9415397644043, "global_step": 265791, "epoch": 2196} {"train_loss": -43.508731842041016, "global_step": 265792, "epoch": 2196} {"train_loss": -43.19203567504883, "global_step": 265793, "epoch": 2196} {"train_loss": -43.367977142333984, "global_step": 265794, "epoch": 2196} {"train_loss": -44.4232177734375, "global_step": 265795, "epoch": 2196} {"train_loss": -43.440223693847656, "global_step": 265796, "epoch": 2196} {"train_loss": -42.536231994628906, "global_step": 265797, "epoch": 2196} {"train_loss": -42.20390701293945, "global_step": 265798, "epoch": 2196} {"train_loss": -42.80166244506836, "global_step": 265799, "epoch": 2196} {"train_loss": -43.80095291137695, "global_step": 265800, "epoch": 2196} {"train_loss": -42.49152374267578, "global_step": 265801, "epoch": 2196} {"train_loss": -42.82748031616211, "global_step": 265802, "epoch": 2196} {"train_loss": -43.80005645751953, "global_step": 265803, "epoch": 2196} {"train_loss": -43.70082473754883, "global_step": 265804, "epoch": 2196} {"train_loss": -43.3799934387207, "global_step": 265805, "epoch": 2196} {"train_loss": -43.78023147583008, "global_step": 265806, "epoch": 2196} {"train_loss": -43.37266540527344, "global_step": 265807, "epoch": 2196} {"train_loss": -43.397396087646484, "global_step": 265808, "epoch": 2196} {"train_loss": -43.16606140136719, "global_step": 265809, "epoch": 2196} {"train_loss": -42.07319641113281, "global_step": 265810, "epoch": 2196} {"train_loss": -41.635101318359375, "global_step": 265811, "epoch": 2196} {"train_loss": -43.36553955078125, "global_step": 265812, "epoch": 2196} {"train_loss": -42.95154571533203, "global_step": 265813, "epoch": 2196} {"train_loss": -41.6185302734375, "global_step": 265814, "epoch": 2196} {"train_loss": -43.20833206176758, "global_step": 265815, "epoch": 2196} {"train_loss": -42.96302032470703, "global_step": 265816, "epoch": 2196} {"train_loss": -44.092498779296875, "global_step": 265817, "epoch": 2196} {"train_loss": -42.88349533081055, "global_step": 265818, "epoch": 2196} {"train_loss": -41.1904411315918, "global_step": 265819, "epoch": 2196} {"train_loss": -42.000545501708984, "global_step": 265820, "epoch": 2196} {"train_loss": -42.38750076293945, "global_step": 265821, "epoch": 2196} {"train_loss": -42.45220947265625, "global_step": 265822, "epoch": 2196} {"train_loss": -43.30531692504883, "global_step": 265823, "epoch": 2196} {"train_loss": -43.3751106262207, "global_step": 265824, "epoch": 2196} {"train_loss": -42.72978591918945, "global_step": 265825, "epoch": 2196} {"train_loss": -42.445159912109375, "global_step": 265826, "epoch": 2196} {"train_loss": -42.48242950439453, "global_step": 265827, "epoch": 2196} {"train_loss": -43.054962158203125, "global_step": 265828, "epoch": 2196} {"train_loss": -43.166351318359375, "global_step": 265829, "epoch": 2196} {"train_loss": -40.78789520263672, "global_step": 265830, "epoch": 2196} {"train_loss": -41.68260955810547, "global_step": 265831, "epoch": 2196} {"train_loss": -42.504364013671875, "global_step": 265832, "epoch": 2196} {"train_loss": -43.35258865356445, "global_step": 265833, "epoch": 2196} {"train_loss": -41.891883850097656, "global_step": 265834, "epoch": 2196} {"train_loss": -43.812740325927734, "global_step": 265835, "epoch": 2196} {"train_loss": -43.01732304470598, "global_step": 265836, "epoch": 2196, "val_loss": 2683944.25} {"train_loss": -41.79830551147461, "global_step": 265837, "epoch": 2197} {"train_loss": -43.721717834472656, "global_step": 265838, "epoch": 2197} {"train_loss": -41.704139709472656, "global_step": 265839, "epoch": 2197} {"train_loss": -42.528419494628906, "global_step": 265840, "epoch": 2197} {"train_loss": -43.571231842041016, "global_step": 265841, "epoch": 2197} {"train_loss": -43.09095001220703, "global_step": 265842, "epoch": 2197} {"train_loss": -42.03473663330078, "global_step": 265843, "epoch": 2197} {"train_loss": -42.936431884765625, "global_step": 265844, "epoch": 2197} {"train_loss": -43.059017181396484, "global_step": 265845, "epoch": 2197} {"train_loss": -43.29744338989258, "global_step": 265846, "epoch": 2197} {"train_loss": -42.984375, "global_step": 265847, "epoch": 2197} {"train_loss": -41.40433883666992, "global_step": 265848, "epoch": 2197} {"train_loss": -41.198482513427734, "global_step": 265849, "epoch": 2197} {"train_loss": -42.30628204345703, "global_step": 265850, "epoch": 2197} {"train_loss": -42.20097351074219, "global_step": 265851, "epoch": 2197} {"train_loss": -40.47066116333008, "global_step": 265852, "epoch": 2197} {"train_loss": -42.16919708251953, "global_step": 265853, "epoch": 2197} {"train_loss": -41.736148834228516, "global_step": 265854, "epoch": 2197} {"train_loss": -41.746246337890625, "global_step": 265855, "epoch": 2197} {"train_loss": -39.45412063598633, "global_step": 265856, "epoch": 2197} {"train_loss": -41.72090148925781, "global_step": 265857, "epoch": 2197} {"train_loss": -41.841976165771484, "global_step": 265858, "epoch": 2197} {"train_loss": -38.71118927001953, "global_step": 265859, "epoch": 2197} {"train_loss": -42.57400131225586, "global_step": 265860, "epoch": 2197} {"train_loss": -38.35857009887695, "global_step": 265861, "epoch": 2197} {"train_loss": -42.54035568237305, "global_step": 265862, "epoch": 2197} {"train_loss": -38.00465393066406, "global_step": 265863, "epoch": 2197} {"train_loss": -40.407318115234375, "global_step": 265864, "epoch": 2197} {"train_loss": -39.89707565307617, "global_step": 265865, "epoch": 2197} {"train_loss": -40.94736862182617, "global_step": 265866, "epoch": 2197} {"train_loss": -40.27100372314453, "global_step": 265867, "epoch": 2197} {"train_loss": -39.11619567871094, "global_step": 265868, "epoch": 2197} {"train_loss": -41.92914581298828, "global_step": 265869, "epoch": 2197} {"train_loss": -38.32788848876953, "global_step": 265870, "epoch": 2197} {"train_loss": -41.88857650756836, "global_step": 265871, "epoch": 2197} {"train_loss": -37.63554763793945, "global_step": 265872, "epoch": 2197} {"train_loss": -42.540191650390625, "global_step": 265873, "epoch": 2197} {"train_loss": -40.05740737915039, "global_step": 265874, "epoch": 2197} {"train_loss": -40.742733001708984, "global_step": 265875, "epoch": 2197} {"train_loss": -40.573909759521484, "global_step": 265876, "epoch": 2197} {"train_loss": -39.326656341552734, "global_step": 265877, "epoch": 2197} {"train_loss": -41.66674041748047, "global_step": 265878, "epoch": 2197} {"train_loss": -40.890419006347656, "global_step": 265879, "epoch": 2197} {"train_loss": -40.592201232910156, "global_step": 265880, "epoch": 2197} {"train_loss": -40.2671012878418, "global_step": 265881, "epoch": 2197} {"train_loss": -40.34868240356445, "global_step": 265882, "epoch": 2197} {"train_loss": -41.280086517333984, "global_step": 265883, "epoch": 2197} {"train_loss": -39.95256805419922, "global_step": 265884, "epoch": 2197} {"train_loss": -41.94107437133789, "global_step": 265885, "epoch": 2197} {"train_loss": -41.421730041503906, "global_step": 265886, "epoch": 2197} {"train_loss": -42.20943832397461, "global_step": 265887, "epoch": 2197} {"train_loss": -41.88102722167969, "global_step": 265888, "epoch": 2197} {"train_loss": -41.55411911010742, "global_step": 265889, "epoch": 2197} {"train_loss": -42.13638687133789, "global_step": 265890, "epoch": 2197} {"train_loss": -42.70768356323242, "global_step": 265891, "epoch": 2197} {"train_loss": -42.07870101928711, "global_step": 265892, "epoch": 2197} {"train_loss": -41.3256721496582, "global_step": 265893, "epoch": 2197} {"train_loss": -42.677913665771484, "global_step": 265894, "epoch": 2197} {"train_loss": -42.84821319580078, "global_step": 265895, "epoch": 2197} {"train_loss": -43.2291145324707, "global_step": 265896, "epoch": 2197} {"train_loss": -43.3509635925293, "global_step": 265897, "epoch": 2197} {"train_loss": -42.54197311401367, "global_step": 265898, "epoch": 2197} {"train_loss": -43.21903991699219, "global_step": 265899, "epoch": 2197} {"train_loss": -42.96462631225586, "global_step": 265900, "epoch": 2197} {"train_loss": -43.49363327026367, "global_step": 265901, "epoch": 2197} {"train_loss": -42.37276077270508, "global_step": 265902, "epoch": 2197} {"train_loss": -43.1547737121582, "global_step": 265903, "epoch": 2197} {"train_loss": -43.27141571044922, "global_step": 265904, "epoch": 2197} {"train_loss": -42.97178268432617, "global_step": 265905, "epoch": 2197} {"train_loss": -43.58285140991211, "global_step": 265906, "epoch": 2197} {"train_loss": -43.2942008972168, "global_step": 265907, "epoch": 2197} {"train_loss": -43.7688102722168, "global_step": 265908, "epoch": 2197} {"train_loss": -43.7262077331543, "global_step": 265909, "epoch": 2197} {"train_loss": -43.46516799926758, "global_step": 265910, "epoch": 2197} {"train_loss": -43.115928649902344, "global_step": 265911, "epoch": 2197} {"train_loss": -43.453697204589844, "global_step": 265912, "epoch": 2197} {"train_loss": -43.68119812011719, "global_step": 265913, "epoch": 2197} {"train_loss": -43.71842575073242, "global_step": 265914, "epoch": 2197} {"train_loss": -43.542999267578125, "global_step": 265915, "epoch": 2197} {"train_loss": -43.402503967285156, "global_step": 265916, "epoch": 2197} {"train_loss": -43.73821258544922, "global_step": 265917, "epoch": 2197} {"train_loss": -43.45512771606445, "global_step": 265918, "epoch": 2197} {"train_loss": -43.60288619995117, "global_step": 265919, "epoch": 2197} {"train_loss": -44.02547836303711, "global_step": 265920, "epoch": 2197} {"train_loss": -42.37227249145508, "global_step": 265921, "epoch": 2197} {"train_loss": -44.024173736572266, "global_step": 265922, "epoch": 2197} {"train_loss": -43.6922492980957, "global_step": 265923, "epoch": 2197} {"train_loss": -44.002376556396484, "global_step": 265924, "epoch": 2197} {"train_loss": -43.80902099609375, "global_step": 265925, "epoch": 2197} {"train_loss": -44.46669387817383, "global_step": 265926, "epoch": 2197} {"train_loss": -44.43451690673828, "global_step": 265927, "epoch": 2197} {"train_loss": -44.21836471557617, "global_step": 265928, "epoch": 2197} {"train_loss": -43.94965744018555, "global_step": 265929, "epoch": 2197} {"train_loss": -43.927818298339844, "global_step": 265930, "epoch": 2197} {"train_loss": -44.26585006713867, "global_step": 265931, "epoch": 2197} {"train_loss": -44.44929122924805, "global_step": 265932, "epoch": 2197} {"train_loss": -44.411312103271484, "global_step": 265933, "epoch": 2197} {"train_loss": -44.3907356262207, "global_step": 265934, "epoch": 2197} {"train_loss": -44.42204666137695, "global_step": 265935, "epoch": 2197} {"train_loss": -43.92292022705078, "global_step": 265936, "epoch": 2197} {"train_loss": -44.65664291381836, "global_step": 265937, "epoch": 2197} {"train_loss": -43.62911605834961, "global_step": 265938, "epoch": 2197} {"train_loss": -44.39445114135742, "global_step": 265939, "epoch": 2197} {"train_loss": -44.42855453491211, "global_step": 265940, "epoch": 2197} {"train_loss": -44.64856719970703, "global_step": 265941, "epoch": 2197} {"train_loss": -44.624446868896484, "global_step": 265942, "epoch": 2197} {"train_loss": -44.22521209716797, "global_step": 265943, "epoch": 2197} {"train_loss": -44.114070892333984, "global_step": 265944, "epoch": 2197} {"train_loss": -44.640037536621094, "global_step": 265945, "epoch": 2197} {"train_loss": -44.774593353271484, "global_step": 265946, "epoch": 2197} {"train_loss": -42.90397262573242, "global_step": 265947, "epoch": 2197} {"train_loss": -44.489707946777344, "global_step": 265948, "epoch": 2197} {"train_loss": -44.39453887939453, "global_step": 265949, "epoch": 2197} {"train_loss": -42.46833801269531, "global_step": 265950, "epoch": 2197} {"train_loss": -37.19968795776367, "global_step": 265951, "epoch": 2197} {"train_loss": -42.25956344604492, "global_step": 265952, "epoch": 2197} {"train_loss": -44.4079475402832, "global_step": 265953, "epoch": 2197} {"train_loss": -41.442806243896484, "global_step": 265954, "epoch": 2197} {"train_loss": -42.86149215698242, "global_step": 265955, "epoch": 2197} {"train_loss": -41.960018157958984, "global_step": 265956, "epoch": 2197} {"train_loss": -42.45430821820724, "global_step": 265957, "epoch": 2197, "val_loss": 2802407.75} {"train_loss": -44.089935302734375, "global_step": 265958, "epoch": 2198} {"train_loss": -43.645992279052734, "global_step": 265959, "epoch": 2198} {"train_loss": -40.42453384399414, "global_step": 265960, "epoch": 2198} {"train_loss": -37.0050163269043, "global_step": 265961, "epoch": 2198} {"train_loss": -42.1216926574707, "global_step": 265962, "epoch": 2198} {"train_loss": -39.379329681396484, "global_step": 265963, "epoch": 2198} {"train_loss": -41.91355514526367, "global_step": 265964, "epoch": 2198} {"train_loss": -41.34307098388672, "global_step": 265965, "epoch": 2198} {"train_loss": -40.36539077758789, "global_step": 265966, "epoch": 2198} {"train_loss": -41.630531311035156, "global_step": 265967, "epoch": 2198} {"train_loss": -42.812191009521484, "global_step": 265968, "epoch": 2198} {"train_loss": -40.79389572143555, "global_step": 265969, "epoch": 2198} {"train_loss": -40.3411750793457, "global_step": 265970, "epoch": 2198} {"train_loss": -41.487186431884766, "global_step": 265971, "epoch": 2198} {"train_loss": -42.2023811340332, "global_step": 265972, "epoch": 2198} {"train_loss": -40.91592025756836, "global_step": 265973, "epoch": 2198} {"train_loss": -42.4937744140625, "global_step": 265974, "epoch": 2198} {"train_loss": -41.45728302001953, "global_step": 265975, "epoch": 2198} {"train_loss": -39.67733383178711, "global_step": 265976, "epoch": 2198} {"train_loss": -42.306121826171875, "global_step": 265977, "epoch": 2198} {"train_loss": -36.477272033691406, "global_step": 265978, "epoch": 2198} {"train_loss": -32.78279495239258, "global_step": 265979, "epoch": 2198} {"train_loss": -34.63416290283203, "global_step": 265980, "epoch": 2198} {"train_loss": -40.25065994262695, "global_step": 265981, "epoch": 2198} {"train_loss": -29.325855255126953, "global_step": 265982, "epoch": 2198} {"train_loss": -38.35836410522461, "global_step": 265983, "epoch": 2198} {"train_loss": -38.999053955078125, "global_step": 265984, "epoch": 2198} {"train_loss": -32.03572463989258, "global_step": 265985, "epoch": 2198} {"train_loss": -38.10825729370117, "global_step": 265986, "epoch": 2198} {"train_loss": -35.70091247558594, "global_step": 265987, "epoch": 2198} {"train_loss": -37.322235107421875, "global_step": 265988, "epoch": 2198} {"train_loss": -38.10373306274414, "global_step": 265989, "epoch": 2198} {"train_loss": -40.284725189208984, "global_step": 265990, "epoch": 2198} {"train_loss": -38.418766021728516, "global_step": 265991, "epoch": 2198} {"train_loss": -41.524375915527344, "global_step": 265992, "epoch": 2198} {"train_loss": -38.70509719848633, "global_step": 265993, "epoch": 2198} {"train_loss": -40.63259506225586, "global_step": 265994, "epoch": 2198} {"train_loss": -39.47303009033203, "global_step": 265995, "epoch": 2198} {"train_loss": -40.28860092163086, "global_step": 265996, "epoch": 2198} {"train_loss": -41.565608978271484, "global_step": 265997, "epoch": 2198} {"train_loss": -39.93159866333008, "global_step": 265998, "epoch": 2198} {"train_loss": -41.126556396484375, "global_step": 265999, "epoch": 2198} {"train_loss": -41.437923431396484, "global_step": 266000, "epoch": 2198} {"train_loss": -39.67835998535156, "global_step": 266001, "epoch": 2198} {"train_loss": -40.91584396362305, "global_step": 266002, "epoch": 2198} {"train_loss": -41.15669631958008, "global_step": 266003, "epoch": 2198} {"train_loss": -41.40195846557617, "global_step": 266004, "epoch": 2198} {"train_loss": -40.62138748168945, "global_step": 266005, "epoch": 2198} {"train_loss": -41.16368103027344, "global_step": 266006, "epoch": 2198} {"train_loss": -41.8240852355957, "global_step": 266007, "epoch": 2198} {"train_loss": -41.94721984863281, "global_step": 266008, "epoch": 2198} {"train_loss": -39.07129669189453, "global_step": 266009, "epoch": 2198} {"train_loss": -42.00910186767578, "global_step": 266010, "epoch": 2198} {"train_loss": -41.48512649536133, "global_step": 266011, "epoch": 2198} {"train_loss": -42.44381332397461, "global_step": 266012, "epoch": 2198} {"train_loss": -42.01751708984375, "global_step": 266013, "epoch": 2198} {"train_loss": -41.931575775146484, "global_step": 266014, "epoch": 2198} {"train_loss": -42.051021575927734, "global_step": 266015, "epoch": 2198} {"train_loss": -42.4934196472168, "global_step": 266016, "epoch": 2198} {"train_loss": -42.68280029296875, "global_step": 266017, "epoch": 2198} {"train_loss": -42.170318603515625, "global_step": 266018, "epoch": 2198} {"train_loss": -42.18830490112305, "global_step": 266019, "epoch": 2198} {"train_loss": -42.50358963012695, "global_step": 266020, "epoch": 2198} {"train_loss": -43.03974533081055, "global_step": 266021, "epoch": 2198} {"train_loss": -43.3675651550293, "global_step": 266022, "epoch": 2198} {"train_loss": -42.79909133911133, "global_step": 266023, "epoch": 2198} {"train_loss": -43.0617561340332, "global_step": 266024, "epoch": 2198} {"train_loss": -43.24549102783203, "global_step": 266025, "epoch": 2198} {"train_loss": -42.01844787597656, "global_step": 266026, "epoch": 2198} {"train_loss": -42.75052261352539, "global_step": 266027, "epoch": 2198} {"train_loss": -43.00391387939453, "global_step": 266028, "epoch": 2198} {"train_loss": -42.8205680847168, "global_step": 266029, "epoch": 2198} {"train_loss": -43.256141662597656, "global_step": 266030, "epoch": 2198} {"train_loss": -42.647823333740234, "global_step": 266031, "epoch": 2198} {"train_loss": -43.315162658691406, "global_step": 266032, "epoch": 2198} {"train_loss": -41.989532470703125, "global_step": 266033, "epoch": 2198} {"train_loss": -42.056312561035156, "global_step": 266034, "epoch": 2198} {"train_loss": -41.5574836730957, "global_step": 266035, "epoch": 2198} {"train_loss": -43.347694396972656, "global_step": 266036, "epoch": 2198} {"train_loss": -43.20600128173828, "global_step": 266037, "epoch": 2198} {"train_loss": -43.554901123046875, "global_step": 266038, "epoch": 2198} {"train_loss": -42.40656661987305, "global_step": 266039, "epoch": 2198} {"train_loss": -43.40083694458008, "global_step": 266040, "epoch": 2198} {"train_loss": -43.30251693725586, "global_step": 266041, "epoch": 2198} {"train_loss": -43.3801155090332, "global_step": 266042, "epoch": 2198} {"train_loss": -43.021610260009766, "global_step": 266043, "epoch": 2198} {"train_loss": -43.4895133972168, "global_step": 266044, "epoch": 2198} {"train_loss": -42.5648307800293, "global_step": 266045, "epoch": 2198} {"train_loss": -43.35245895385742, "global_step": 266046, "epoch": 2198} {"train_loss": -43.12942886352539, "global_step": 266047, "epoch": 2198} {"train_loss": -43.35639953613281, "global_step": 266048, "epoch": 2198} {"train_loss": -44.01803970336914, "global_step": 266049, "epoch": 2198} {"train_loss": -43.87285614013672, "global_step": 266050, "epoch": 2198} {"train_loss": -43.079715728759766, "global_step": 266051, "epoch": 2198} {"train_loss": -43.91498947143555, "global_step": 266052, "epoch": 2198} {"train_loss": -42.32330322265625, "global_step": 266053, "epoch": 2198} {"train_loss": -43.66347885131836, "global_step": 266054, "epoch": 2198} {"train_loss": -43.56046676635742, "global_step": 266055, "epoch": 2198} {"train_loss": -42.60396957397461, "global_step": 266056, "epoch": 2198} {"train_loss": -41.72706985473633, "global_step": 266057, "epoch": 2198} {"train_loss": -43.103851318359375, "global_step": 266058, "epoch": 2198} {"train_loss": -43.67851638793945, "global_step": 266059, "epoch": 2198} {"train_loss": -43.352996826171875, "global_step": 266060, "epoch": 2198} {"train_loss": -43.31489181518555, "global_step": 266061, "epoch": 2198} {"train_loss": -43.66203689575195, "global_step": 266062, "epoch": 2198} {"train_loss": -43.727813720703125, "global_step": 266063, "epoch": 2198} {"train_loss": -42.76606369018555, "global_step": 266064, "epoch": 2198} {"train_loss": -43.34615707397461, "global_step": 266065, "epoch": 2198} {"train_loss": -43.801673889160156, "global_step": 266066, "epoch": 2198} {"train_loss": -43.72127914428711, "global_step": 266067, "epoch": 2198} {"train_loss": -43.93291091918945, "global_step": 266068, "epoch": 2198} {"train_loss": -43.111568450927734, "global_step": 266069, "epoch": 2198} {"train_loss": -42.16483688354492, "global_step": 266070, "epoch": 2198} {"train_loss": -42.6174430847168, "global_step": 266071, "epoch": 2198} {"train_loss": -42.635135650634766, "global_step": 266072, "epoch": 2198} {"train_loss": -42.798824310302734, "global_step": 266073, "epoch": 2198} {"train_loss": -41.19034957885742, "global_step": 266074, "epoch": 2198} {"train_loss": -42.913143157958984, "global_step": 266075, "epoch": 2198} {"train_loss": -42.79502487182617, "global_step": 266076, "epoch": 2198} {"train_loss": -43.27992630004883, "global_step": 266077, "epoch": 2198} {"train_loss": -41.5668633831434, "global_step": 266078, "epoch": 2198, "val_loss": 2659893.25} {"train_loss": -42.67393112182617, "global_step": 266079, "epoch": 2199} {"train_loss": -43.48311996459961, "global_step": 266080, "epoch": 2199} {"train_loss": -42.11181640625, "global_step": 266081, "epoch": 2199} {"train_loss": -39.305023193359375, "global_step": 266082, "epoch": 2199} {"train_loss": -43.11655807495117, "global_step": 266083, "epoch": 2199} {"train_loss": -42.115997314453125, "global_step": 266084, "epoch": 2199} {"train_loss": -38.688209533691406, "global_step": 266085, "epoch": 2199} {"train_loss": -43.78309631347656, "global_step": 266086, "epoch": 2199} {"train_loss": -38.77107238769531, "global_step": 266087, "epoch": 2199} {"train_loss": -41.19306182861328, "global_step": 266088, "epoch": 2199} {"train_loss": -43.20784378051758, "global_step": 266089, "epoch": 2199} {"train_loss": -40.178672790527344, "global_step": 266090, "epoch": 2199} {"train_loss": -43.16722106933594, "global_step": 266091, "epoch": 2199} {"train_loss": -41.82996368408203, "global_step": 266092, "epoch": 2199} {"train_loss": -41.191062927246094, "global_step": 266093, "epoch": 2199} {"train_loss": -42.98440933227539, "global_step": 266094, "epoch": 2199} {"train_loss": -41.42905807495117, "global_step": 266095, "epoch": 2199} {"train_loss": -41.528568267822266, "global_step": 266096, "epoch": 2199} {"train_loss": -43.98798751831055, "global_step": 266097, "epoch": 2199} {"train_loss": -41.12839889526367, "global_step": 266098, "epoch": 2199} {"train_loss": -43.203529357910156, "global_step": 266099, "epoch": 2199} {"train_loss": -41.7043571472168, "global_step": 266100, "epoch": 2199} {"train_loss": -42.03656005859375, "global_step": 266101, "epoch": 2199} {"train_loss": -43.764129638671875, "global_step": 266102, "epoch": 2199} {"train_loss": -41.99794006347656, "global_step": 266103, "epoch": 2199} {"train_loss": -42.63728713989258, "global_step": 266104, "epoch": 2199} {"train_loss": -42.4593505859375, "global_step": 266105, "epoch": 2199} {"train_loss": -42.12897491455078, "global_step": 266106, "epoch": 2199} {"train_loss": -43.01420974731445, "global_step": 266107, "epoch": 2199} {"train_loss": -41.86455535888672, "global_step": 266108, "epoch": 2199} {"train_loss": -43.56586837768555, "global_step": 266109, "epoch": 2199} {"train_loss": -42.53132247924805, "global_step": 266110, "epoch": 2199} {"train_loss": -43.17120361328125, "global_step": 266111, "epoch": 2199} {"train_loss": -43.40365219116211, "global_step": 266112, "epoch": 2199} {"train_loss": -44.01384353637695, "global_step": 266113, "epoch": 2199} {"train_loss": -43.17814636230469, "global_step": 266114, "epoch": 2199} {"train_loss": -43.248046875, "global_step": 266115, "epoch": 2199} {"train_loss": -43.34080123901367, "global_step": 266116, "epoch": 2199} {"train_loss": -43.73269271850586, "global_step": 266117, "epoch": 2199} {"train_loss": -44.0482292175293, "global_step": 266118, "epoch": 2199} {"train_loss": -43.216915130615234, "global_step": 266119, "epoch": 2199} {"train_loss": -43.9162712097168, "global_step": 266120, "epoch": 2199} {"train_loss": -44.06409454345703, "global_step": 266121, "epoch": 2199} {"train_loss": -43.80249786376953, "global_step": 266122, "epoch": 2199} {"train_loss": -43.97868728637695, "global_step": 266123, "epoch": 2199} {"train_loss": -44.13565444946289, "global_step": 266124, "epoch": 2199} {"train_loss": -43.725677490234375, "global_step": 266125, "epoch": 2199} {"train_loss": -44.14082336425781, "global_step": 266126, "epoch": 2199} {"train_loss": -38.97346115112305, "global_step": 266127, "epoch": 2199} {"train_loss": -44.043243408203125, "global_step": 266128, "epoch": 2199} {"train_loss": -43.35401153564453, "global_step": 266129, "epoch": 2199} {"train_loss": -43.50273132324219, "global_step": 266130, "epoch": 2199} {"train_loss": -43.78098678588867, "global_step": 266131, "epoch": 2199} {"train_loss": -43.582340240478516, "global_step": 266132, "epoch": 2199} {"train_loss": -42.78727340698242, "global_step": 266133, "epoch": 2199} {"train_loss": -42.03594970703125, "global_step": 266134, "epoch": 2199} {"train_loss": -43.142391204833984, "global_step": 266135, "epoch": 2199} {"train_loss": -44.29340744018555, "global_step": 266136, "epoch": 2199} {"train_loss": -44.26039505004883, "global_step": 266137, "epoch": 2199} {"train_loss": -42.55447006225586, "global_step": 266138, "epoch": 2199} {"train_loss": -42.603023529052734, "global_step": 266139, "epoch": 2199} {"train_loss": -43.21131896972656, "global_step": 266140, "epoch": 2199} {"train_loss": -43.28109359741211, "global_step": 266141, "epoch": 2199} {"train_loss": -41.88773727416992, "global_step": 266142, "epoch": 2199} {"train_loss": -43.936763763427734, "global_step": 266143, "epoch": 2199} {"train_loss": -42.541786193847656, "global_step": 266144, "epoch": 2199} {"train_loss": -37.98960494995117, "global_step": 266145, "epoch": 2199} {"train_loss": -42.35061264038086, "global_step": 266146, "epoch": 2199} {"train_loss": -40.57954025268555, "global_step": 266147, "epoch": 2199} {"train_loss": -37.3659553527832, "global_step": 266148, "epoch": 2199} {"train_loss": -39.346553802490234, "global_step": 266149, "epoch": 2199} {"train_loss": -38.16509246826172, "global_step": 266150, "epoch": 2199} {"train_loss": -36.72957229614258, "global_step": 266151, "epoch": 2199} {"train_loss": -38.38863754272461, "global_step": 266152, "epoch": 2199} {"train_loss": -38.99943161010742, "global_step": 266153, "epoch": 2199} {"train_loss": -37.75143814086914, "global_step": 266154, "epoch": 2199} {"train_loss": -37.95769500732422, "global_step": 266155, "epoch": 2199} {"train_loss": -38.43777084350586, "global_step": 266156, "epoch": 2199} {"train_loss": -41.7066764831543, "global_step": 266157, "epoch": 2199} {"train_loss": -41.17903137207031, "global_step": 266158, "epoch": 2199} {"train_loss": -40.89508056640625, "global_step": 266159, "epoch": 2199} {"train_loss": -40.543514251708984, "global_step": 266160, "epoch": 2199} {"train_loss": -41.6859130859375, "global_step": 266161, "epoch": 2199} {"train_loss": -40.831642150878906, "global_step": 266162, "epoch": 2199} {"train_loss": -41.569454193115234, "global_step": 266163, "epoch": 2199} {"train_loss": -41.42683792114258, "global_step": 266164, "epoch": 2199} {"train_loss": -40.55733871459961, "global_step": 266165, "epoch": 2199} {"train_loss": -41.3607177734375, "global_step": 266166, "epoch": 2199} {"train_loss": -40.51032638549805, "global_step": 266167, "epoch": 2199} {"train_loss": -41.55146408081055, "global_step": 266168, "epoch": 2199} {"train_loss": -41.757930755615234, "global_step": 266169, "epoch": 2199} {"train_loss": -41.37488555908203, "global_step": 266170, "epoch": 2199} {"train_loss": -42.207923889160156, "global_step": 266171, "epoch": 2199} {"train_loss": -41.723602294921875, "global_step": 266172, "epoch": 2199} {"train_loss": -41.856468200683594, "global_step": 266173, "epoch": 2199} {"train_loss": -42.38385009765625, "global_step": 266174, "epoch": 2199} {"train_loss": -41.439903259277344, "global_step": 266175, "epoch": 2199} {"train_loss": -40.810462951660156, "global_step": 266176, "epoch": 2199} {"train_loss": -41.53950500488281, "global_step": 266177, "epoch": 2199} {"train_loss": -42.04264450073242, "global_step": 266178, "epoch": 2199} {"train_loss": -42.22834396362305, "global_step": 266179, "epoch": 2199} {"train_loss": -41.9097900390625, "global_step": 266180, "epoch": 2199} {"train_loss": -42.340633392333984, "global_step": 266181, "epoch": 2199} {"train_loss": -42.084922790527344, "global_step": 266182, "epoch": 2199} {"train_loss": -42.38439178466797, "global_step": 266183, "epoch": 2199} {"train_loss": -42.62344741821289, "global_step": 266184, "epoch": 2199} {"train_loss": -42.91044998168945, "global_step": 266185, "epoch": 2199} {"train_loss": -42.806739807128906, "global_step": 266186, "epoch": 2199} {"train_loss": -42.31740188598633, "global_step": 266187, "epoch": 2199} {"train_loss": -42.99149703979492, "global_step": 266188, "epoch": 2199} {"train_loss": -43.14520263671875, "global_step": 266189, "epoch": 2199} {"train_loss": -43.500450134277344, "global_step": 266190, "epoch": 2199} {"train_loss": -42.9226188659668, "global_step": 266191, "epoch": 2199} {"train_loss": -43.728389739990234, "global_step": 266192, "epoch": 2199} {"train_loss": -43.35163879394531, "global_step": 266193, "epoch": 2199} {"train_loss": -43.29016876220703, "global_step": 266194, "epoch": 2199} {"train_loss": -43.6576042175293, "global_step": 266195, "epoch": 2199} {"train_loss": -43.388587951660156, "global_step": 266196, "epoch": 2199} {"train_loss": -43.8346061706543, "global_step": 266197, "epoch": 2199} {"train_loss": -43.36698532104492, "global_step": 266198, "epoch": 2199} {"train_loss": -42.125121628942566, "global_step": 266199, "epoch": 2199, "val_loss": 2737556.0} {"train_loss": -44.068565368652344, "global_step": 266200, "epoch": 2200} {"train_loss": -43.0067024230957, "global_step": 266201, "epoch": 2200} {"train_loss": -43.565216064453125, "global_step": 266202, "epoch": 2200} {"train_loss": -43.85811996459961, "global_step": 266203, "epoch": 2200} {"train_loss": -43.94138717651367, "global_step": 266204, "epoch": 2200} {"train_loss": -44.18889236450195, "global_step": 266205, "epoch": 2200} {"train_loss": -43.80519485473633, "global_step": 266206, "epoch": 2200} {"train_loss": -43.99736785888672, "global_step": 266207, "epoch": 2200} {"train_loss": -43.94533157348633, "global_step": 266208, "epoch": 2200} {"train_loss": -44.0994987487793, "global_step": 266209, "epoch": 2200} {"train_loss": -43.7426872253418, "global_step": 266210, "epoch": 2200} {"train_loss": -44.37702941894531, "global_step": 266211, "epoch": 2200} {"train_loss": -44.0677490234375, "global_step": 266212, "epoch": 2200} {"train_loss": -44.25897979736328, "global_step": 266213, "epoch": 2200} {"train_loss": -43.77238845825195, "global_step": 266214, "epoch": 2200} {"train_loss": -43.9898796081543, "global_step": 266215, "epoch": 2200} {"train_loss": -44.18876266479492, "global_step": 266216, "epoch": 2200} {"train_loss": -44.09409713745117, "global_step": 266217, "epoch": 2200} {"train_loss": -44.13927459716797, "global_step": 266218, "epoch": 2200} {"train_loss": -43.945945739746094, "global_step": 266219, "epoch": 2200} {"train_loss": -43.95701217651367, "global_step": 266220, "epoch": 2200} {"train_loss": -44.20854568481445, "global_step": 266221, "epoch": 2200} {"train_loss": -43.90125274658203, "global_step": 266222, "epoch": 2200} {"train_loss": -43.309593200683594, "global_step": 266223, "epoch": 2200} {"train_loss": -44.38169860839844, "global_step": 266224, "epoch": 2200} {"train_loss": -44.48001480102539, "global_step": 266225, "epoch": 2200} {"train_loss": -43.688446044921875, "global_step": 266226, "epoch": 2200} {"train_loss": -44.40178298950195, "global_step": 266227, "epoch": 2200} {"train_loss": -43.87687301635742, "global_step": 266228, "epoch": 2200} {"train_loss": -42.77920150756836, "global_step": 266229, "epoch": 2200} {"train_loss": -43.720726013183594, "global_step": 266230, "epoch": 2200} {"train_loss": -43.98760223388672, "global_step": 266231, "epoch": 2200} {"train_loss": -43.38420486450195, "global_step": 266232, "epoch": 2200} {"train_loss": -42.45665740966797, "global_step": 266233, "epoch": 2200} {"train_loss": -42.5893669128418, "global_step": 266234, "epoch": 2200} {"train_loss": -42.4924201965332, "global_step": 266235, "epoch": 2200} {"train_loss": -41.95337677001953, "global_step": 266236, "epoch": 2200} {"train_loss": -43.20391082763672, "global_step": 266237, "epoch": 2200} {"train_loss": -44.22917938232422, "global_step": 266238, "epoch": 2200} {"train_loss": -43.00950622558594, "global_step": 266239, "epoch": 2200} {"train_loss": -43.55673599243164, "global_step": 266240, "epoch": 2200} {"train_loss": -43.047035217285156, "global_step": 266241, "epoch": 2200} {"train_loss": -43.09804916381836, "global_step": 266242, "epoch": 2200} {"train_loss": -43.45481491088867, "global_step": 266243, "epoch": 2200} {"train_loss": -41.94529342651367, "global_step": 266244, "epoch": 2200} {"train_loss": -43.42240524291992, "global_step": 266245, "epoch": 2200} {"train_loss": -42.88664627075195, "global_step": 266246, "epoch": 2200} {"train_loss": -41.88480758666992, "global_step": 266247, "epoch": 2200} {"train_loss": -43.99098205566406, "global_step": 266248, "epoch": 2200} {"train_loss": -42.581111907958984, "global_step": 266249, "epoch": 2200} {"train_loss": -41.9990119934082, "global_step": 266250, "epoch": 2200} {"train_loss": -43.59357833862305, "global_step": 266251, "epoch": 2200} {"train_loss": -42.33806228637695, "global_step": 266252, "epoch": 2200} {"train_loss": -41.98994064331055, "global_step": 266253, "epoch": 2200} {"train_loss": -43.30355453491211, "global_step": 266254, "epoch": 2200} {"train_loss": -40.97237777709961, "global_step": 266255, "epoch": 2200} {"train_loss": -42.82709884643555, "global_step": 266256, "epoch": 2200} {"train_loss": -41.70632553100586, "global_step": 266257, "epoch": 2200} {"train_loss": -43.08787155151367, "global_step": 266258, "epoch": 2200} {"train_loss": -40.812896728515625, "global_step": 266259, "epoch": 2200} {"train_loss": -43.39435577392578, "global_step": 266260, "epoch": 2200} {"train_loss": -42.81435775756836, "global_step": 266261, "epoch": 2200} {"train_loss": -42.61911392211914, "global_step": 266262, "epoch": 2200} {"train_loss": -43.02265548706055, "global_step": 266263, "epoch": 2200} {"train_loss": -43.17103958129883, "global_step": 266264, "epoch": 2200} {"train_loss": -42.76449203491211, "global_step": 266265, "epoch": 2200} {"train_loss": -42.22188186645508, "global_step": 266266, "epoch": 2200} {"train_loss": -43.661598205566406, "global_step": 266267, "epoch": 2200} {"train_loss": -42.349525451660156, "global_step": 266268, "epoch": 2200} {"train_loss": -43.629119873046875, "global_step": 266269, "epoch": 2200} {"train_loss": -43.12113571166992, "global_step": 266270, "epoch": 2200} {"train_loss": -42.751461029052734, "global_step": 266271, "epoch": 2200} {"train_loss": -42.14909744262695, "global_step": 266272, "epoch": 2200} {"train_loss": -41.37717819213867, "global_step": 266273, "epoch": 2200} {"train_loss": -41.409828186035156, "global_step": 266274, "epoch": 2200} {"train_loss": -42.789329528808594, "global_step": 266275, "epoch": 2200} {"train_loss": -42.42446517944336, "global_step": 266276, "epoch": 2200} {"train_loss": -42.485870361328125, "global_step": 266277, "epoch": 2200} {"train_loss": -43.22776412963867, "global_step": 266278, "epoch": 2200} {"train_loss": -43.34016799926758, "global_step": 266279, "epoch": 2200} {"train_loss": -41.13685989379883, "global_step": 266280, "epoch": 2200} {"train_loss": -39.116966247558594, "global_step": 266281, "epoch": 2200} {"train_loss": -42.808712005615234, "global_step": 266282, "epoch": 2200} {"train_loss": -40.40615463256836, "global_step": 266283, "epoch": 2200} {"train_loss": -41.582244873046875, "global_step": 266284, "epoch": 2200} {"train_loss": -42.515098571777344, "global_step": 266285, "epoch": 2200} {"train_loss": -43.54664993286133, "global_step": 266286, "epoch": 2200} {"train_loss": -42.50264358520508, "global_step": 266287, "epoch": 2200} {"train_loss": -43.39601516723633, "global_step": 266288, "epoch": 2200} {"train_loss": -43.13057327270508, "global_step": 266289, "epoch": 2200} {"train_loss": -42.96583938598633, "global_step": 266290, "epoch": 2200} {"train_loss": -42.75490951538086, "global_step": 266291, "epoch": 2200} {"train_loss": -41.8630485534668, "global_step": 266292, "epoch": 2200} {"train_loss": -42.41576385498047, "global_step": 266293, "epoch": 2200} {"train_loss": -43.355194091796875, "global_step": 266294, "epoch": 2200} {"train_loss": -43.15144729614258, "global_step": 266295, "epoch": 2200} {"train_loss": -43.02443313598633, "global_step": 266296, "epoch": 2200} {"train_loss": -43.309627532958984, "global_step": 266297, "epoch": 2200} {"train_loss": -42.27296447753906, "global_step": 266298, "epoch": 2200} {"train_loss": -40.4322509765625, "global_step": 266299, "epoch": 2200} {"train_loss": -43.206295013427734, "global_step": 266300, "epoch": 2200} {"train_loss": -41.51534652709961, "global_step": 266301, "epoch": 2200} {"train_loss": -42.268890380859375, "global_step": 266302, "epoch": 2200} {"train_loss": -42.47620391845703, "global_step": 266303, "epoch": 2200} {"train_loss": -42.07624053955078, "global_step": 266304, "epoch": 2200} {"train_loss": -42.36812973022461, "global_step": 266305, "epoch": 2200} {"train_loss": -42.24897003173828, "global_step": 266306, "epoch": 2200} {"train_loss": -43.12750244140625, "global_step": 266307, "epoch": 2200} {"train_loss": -42.50889587402344, "global_step": 266308, "epoch": 2200} {"train_loss": -41.78801345825195, "global_step": 266309, "epoch": 2200} {"train_loss": -43.26810836791992, "global_step": 266310, "epoch": 2200} {"train_loss": -42.20526123046875, "global_step": 266311, "epoch": 2200} {"train_loss": -42.383113861083984, "global_step": 266312, "epoch": 2200} {"train_loss": -42.23987579345703, "global_step": 266313, "epoch": 2200} {"train_loss": -41.99275207519531, "global_step": 266314, "epoch": 2200} {"train_loss": -43.730751037597656, "global_step": 266315, "epoch": 2200} {"train_loss": -41.12805938720703, "global_step": 266316, "epoch": 2200} {"train_loss": -43.04924392700195, "global_step": 266317, "epoch": 2200} {"train_loss": -42.620216369628906, "global_step": 266318, "epoch": 2200} {"train_loss": -43.2269172668457, "global_step": 266319, "epoch": 2200} {"train_loss": -42.92910060409672, "global_step": 266320, "epoch": 2200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 0.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 2815991.0} {"train_loss": -43.15321731567383, "global_step": 266321, "epoch": 2201} {"train_loss": -43.67329025268555, "global_step": 266322, "epoch": 2201} {"train_loss": -42.131065368652344, "global_step": 266323, "epoch": 2201} {"train_loss": -43.24665451049805, "global_step": 266324, "epoch": 2201} {"train_loss": -42.84574508666992, "global_step": 266325, "epoch": 2201} {"train_loss": -43.50210189819336, "global_step": 266326, "epoch": 2201} {"train_loss": -42.62255096435547, "global_step": 266327, "epoch": 2201} {"train_loss": -43.662574768066406, "global_step": 266328, "epoch": 2201} {"train_loss": -43.338253021240234, "global_step": 266329, "epoch": 2201} {"train_loss": -43.639827728271484, "global_step": 266330, "epoch": 2201} {"train_loss": -43.314395904541016, "global_step": 266331, "epoch": 2201} {"train_loss": -43.0609245300293, "global_step": 266332, "epoch": 2201} {"train_loss": -44.43217086791992, "global_step": 266333, "epoch": 2201} {"train_loss": -43.50653839111328, "global_step": 266334, "epoch": 2201} {"train_loss": -43.76152038574219, "global_step": 266335, "epoch": 2201} {"train_loss": -43.396942138671875, "global_step": 266336, "epoch": 2201} {"train_loss": -44.085479736328125, "global_step": 266337, "epoch": 2201} {"train_loss": -43.578060150146484, "global_step": 266338, "epoch": 2201} {"train_loss": -43.864498138427734, "global_step": 266339, "epoch": 2201} {"train_loss": -43.70283126831055, "global_step": 266340, "epoch": 2201} {"train_loss": -43.590545654296875, "global_step": 266341, "epoch": 2201} {"train_loss": -43.840362548828125, "global_step": 266342, "epoch": 2201} {"train_loss": -44.22463607788086, "global_step": 266343, "epoch": 2201} {"train_loss": -42.86723709106445, "global_step": 266344, "epoch": 2201} {"train_loss": -42.76900863647461, "global_step": 266345, "epoch": 2201} {"train_loss": -43.7076301574707, "global_step": 266346, "epoch": 2201} {"train_loss": -42.24397659301758, "global_step": 266347, "epoch": 2201} {"train_loss": -41.240211486816406, "global_step": 266348, "epoch": 2201} {"train_loss": -43.421119689941406, "global_step": 266349, "epoch": 2201} {"train_loss": -40.59519577026367, "global_step": 266350, "epoch": 2201} {"train_loss": -42.65055465698242, "global_step": 266351, "epoch": 2201} {"train_loss": -42.33146286010742, "global_step": 266352, "epoch": 2201} {"train_loss": -41.19880294799805, "global_step": 266353, "epoch": 2201} {"train_loss": -39.97945022583008, "global_step": 266354, "epoch": 2201} {"train_loss": -39.116249084472656, "global_step": 266355, "epoch": 2201} {"train_loss": -43.605712890625, "global_step": 266356, "epoch": 2201} {"train_loss": -40.4128532409668, "global_step": 266357, "epoch": 2201} {"train_loss": -41.88623046875, "global_step": 266358, "epoch": 2201} {"train_loss": -41.9027214050293, "global_step": 266359, "epoch": 2201} {"train_loss": -42.12050247192383, "global_step": 266360, "epoch": 2201} {"train_loss": -41.81613540649414, "global_step": 266361, "epoch": 2201} {"train_loss": -37.35673141479492, "global_step": 266362, "epoch": 2201} {"train_loss": -43.039581298828125, "global_step": 266363, "epoch": 2201} {"train_loss": -41.094417572021484, "global_step": 266364, "epoch": 2201} {"train_loss": -39.62714767456055, "global_step": 266365, "epoch": 2201} {"train_loss": -41.083309173583984, "global_step": 266366, "epoch": 2201} {"train_loss": -41.61345291137695, "global_step": 266367, "epoch": 2201} {"train_loss": -41.7843017578125, "global_step": 266368, "epoch": 2201} {"train_loss": -39.14266586303711, "global_step": 266369, "epoch": 2201} {"train_loss": -42.30796432495117, "global_step": 266370, "epoch": 2201} {"train_loss": -39.1953125, "global_step": 266371, "epoch": 2201} {"train_loss": -40.909576416015625, "global_step": 266372, "epoch": 2201} {"train_loss": -40.38094711303711, "global_step": 266373, "epoch": 2201} {"train_loss": -40.2414436340332, "global_step": 266374, "epoch": 2201} {"train_loss": -41.099361419677734, "global_step": 266375, "epoch": 2201} {"train_loss": -41.956600189208984, "global_step": 266376, "epoch": 2201} {"train_loss": -39.54066848754883, "global_step": 266377, "epoch": 2201} {"train_loss": -42.45990753173828, "global_step": 266378, "epoch": 2201} {"train_loss": -37.320987701416016, "global_step": 266379, "epoch": 2201} {"train_loss": -40.82577133178711, "global_step": 266380, "epoch": 2201} {"train_loss": -37.27368927001953, "global_step": 266381, "epoch": 2201} {"train_loss": -39.375038146972656, "global_step": 266382, "epoch": 2201} {"train_loss": -40.46871566772461, "global_step": 266383, "epoch": 2201} {"train_loss": -38.278076171875, "global_step": 266384, "epoch": 2201} {"train_loss": -42.171688079833984, "global_step": 266385, "epoch": 2201} {"train_loss": -38.0249137878418, "global_step": 266386, "epoch": 2201} {"train_loss": -39.77877426147461, "global_step": 266387, "epoch": 2201} {"train_loss": -40.08766555786133, "global_step": 266388, "epoch": 2201} {"train_loss": -38.8473014831543, "global_step": 266389, "epoch": 2201} {"train_loss": -42.13640213012695, "global_step": 266390, "epoch": 2201} {"train_loss": -39.97751998901367, "global_step": 266391, "epoch": 2201} {"train_loss": -42.2712287902832, "global_step": 266392, "epoch": 2201} {"train_loss": -39.205108642578125, "global_step": 266393, "epoch": 2201} {"train_loss": -42.58314895629883, "global_step": 266394, "epoch": 2201} {"train_loss": -39.97663497924805, "global_step": 266395, "epoch": 2201} {"train_loss": -42.74429702758789, "global_step": 266396, "epoch": 2201} {"train_loss": -40.12364959716797, "global_step": 266397, "epoch": 2201} {"train_loss": -42.397335052490234, "global_step": 266398, "epoch": 2201} {"train_loss": -39.36057662963867, "global_step": 266399, "epoch": 2201} {"train_loss": -42.361915588378906, "global_step": 266400, "epoch": 2201} {"train_loss": -41.191532135009766, "global_step": 266401, "epoch": 2201} {"train_loss": -42.10579299926758, "global_step": 266402, "epoch": 2201} {"train_loss": -41.418792724609375, "global_step": 266403, "epoch": 2201} {"train_loss": -42.33665466308594, "global_step": 266404, "epoch": 2201} {"train_loss": -42.016841888427734, "global_step": 266405, "epoch": 2201} {"train_loss": -42.59653854370117, "global_step": 266406, "epoch": 2201} {"train_loss": -42.413185119628906, "global_step": 266407, "epoch": 2201} {"train_loss": -42.77106857299805, "global_step": 266408, "epoch": 2201} {"train_loss": -42.605098724365234, "global_step": 266409, "epoch": 2201} {"train_loss": -42.80452346801758, "global_step": 266410, "epoch": 2201} {"train_loss": -42.66926193237305, "global_step": 266411, "epoch": 2201} {"train_loss": -42.61371994018555, "global_step": 266412, "epoch": 2201} {"train_loss": -43.3897590637207, "global_step": 266413, "epoch": 2201} {"train_loss": -42.803009033203125, "global_step": 266414, "epoch": 2201} {"train_loss": -43.778656005859375, "global_step": 266415, "epoch": 2201} {"train_loss": -43.040863037109375, "global_step": 266416, "epoch": 2201} {"train_loss": -42.97151184082031, "global_step": 266417, "epoch": 2201} {"train_loss": -41.142784118652344, "global_step": 266418, "epoch": 2201} {"train_loss": -43.20082473754883, "global_step": 266419, "epoch": 2201} {"train_loss": -42.990867614746094, "global_step": 266420, "epoch": 2201} {"train_loss": -43.39931106567383, "global_step": 266421, "epoch": 2201} {"train_loss": -42.582374572753906, "global_step": 266422, "epoch": 2201} {"train_loss": -43.71190643310547, "global_step": 266423, "epoch": 2201} {"train_loss": -43.35060119628906, "global_step": 266424, "epoch": 2201} {"train_loss": -42.500160217285156, "global_step": 266425, "epoch": 2201} {"train_loss": -42.77533721923828, "global_step": 266426, "epoch": 2201} {"train_loss": -43.521240234375, "global_step": 266427, "epoch": 2201} {"train_loss": -35.68679428100586, "global_step": 266428, "epoch": 2201} {"train_loss": -43.540443420410156, "global_step": 266429, "epoch": 2201} {"train_loss": -42.95215606689453, "global_step": 266430, "epoch": 2201} {"train_loss": -43.76247787475586, "global_step": 266431, "epoch": 2201} {"train_loss": -42.24424743652344, "global_step": 266432, "epoch": 2201} {"train_loss": -43.55513381958008, "global_step": 266433, "epoch": 2201} {"train_loss": -43.68444061279297, "global_step": 266434, "epoch": 2201} {"train_loss": -43.711448669433594, "global_step": 266435, "epoch": 2201} {"train_loss": -43.393829345703125, "global_step": 266436, "epoch": 2201} {"train_loss": -43.6936149597168, "global_step": 266437, "epoch": 2201} {"train_loss": -43.88192367553711, "global_step": 266438, "epoch": 2201} {"train_loss": -43.599674224853516, "global_step": 266439, "epoch": 2201} {"train_loss": -43.937255859375, "global_step": 266440, "epoch": 2201} {"train_loss": -42.038986426739655, "global_step": 266441, "epoch": 2201, "val_loss": 2604002.0} {"train_loss": -43.631813049316406, "global_step": 266442, "epoch": 2202} {"train_loss": -43.89461135864258, "global_step": 266443, "epoch": 2202} {"train_loss": -38.64799880981445, "global_step": 266444, "epoch": 2202} {"train_loss": -43.810142517089844, "global_step": 266445, "epoch": 2202} {"train_loss": -42.96223068237305, "global_step": 266446, "epoch": 2202} {"train_loss": -44.04389190673828, "global_step": 266447, "epoch": 2202} {"train_loss": -43.12397384643555, "global_step": 266448, "epoch": 2202} {"train_loss": -43.91160202026367, "global_step": 266449, "epoch": 2202} {"train_loss": -34.814186096191406, "global_step": 266450, "epoch": 2202} {"train_loss": -43.59290313720703, "global_step": 266451, "epoch": 2202} {"train_loss": -43.082672119140625, "global_step": 266452, "epoch": 2202} {"train_loss": -12.52946662902832, "global_step": 266453, "epoch": 2202} {"train_loss": -42.0495719909668, "global_step": 266454, "epoch": 2202} {"train_loss": -42.532833099365234, "global_step": 266455, "epoch": 2202} {"train_loss": -42.693233489990234, "global_step": 266456, "epoch": 2202} {"train_loss": -42.56493377685547, "global_step": 266457, "epoch": 2202} {"train_loss": -42.00454330444336, "global_step": 266458, "epoch": 2202} {"train_loss": -42.528724670410156, "global_step": 266459, "epoch": 2202} {"train_loss": -41.7585563659668, "global_step": 266460, "epoch": 2202} {"train_loss": -43.38630676269531, "global_step": 266461, "epoch": 2202} {"train_loss": -42.35740280151367, "global_step": 266462, "epoch": 2202} {"train_loss": -43.006507873535156, "global_step": 266463, "epoch": 2202} {"train_loss": -42.4410514831543, "global_step": 266464, "epoch": 2202} {"train_loss": -41.61613845825195, "global_step": 266465, "epoch": 2202} {"train_loss": -42.73141098022461, "global_step": 266466, "epoch": 2202} {"train_loss": -41.37971115112305, "global_step": 266467, "epoch": 2202} {"train_loss": -42.5820198059082, "global_step": 266468, "epoch": 2202} {"train_loss": -43.046661376953125, "global_step": 266469, "epoch": 2202} {"train_loss": -39.65134048461914, "global_step": 266470, "epoch": 2202} {"train_loss": -42.73526382446289, "global_step": 266471, "epoch": 2202} {"train_loss": -33.59699249267578, "global_step": 266472, "epoch": 2202} {"train_loss": -41.565330505371094, "global_step": 266473, "epoch": 2202} {"train_loss": -42.36956787109375, "global_step": 266474, "epoch": 2202} {"train_loss": -41.74605178833008, "global_step": 266475, "epoch": 2202} {"train_loss": -39.72530746459961, "global_step": 266476, "epoch": 2202} {"train_loss": -42.110328674316406, "global_step": 266477, "epoch": 2202} {"train_loss": -40.842681884765625, "global_step": 266478, "epoch": 2202} {"train_loss": -38.63358688354492, "global_step": 266479, "epoch": 2202} {"train_loss": -41.871707916259766, "global_step": 266480, "epoch": 2202} {"train_loss": -42.78034591674805, "global_step": 266481, "epoch": 2202} {"train_loss": -41.99262237548828, "global_step": 266482, "epoch": 2202} {"train_loss": -41.134490966796875, "global_step": 266483, "epoch": 2202} {"train_loss": -41.967872619628906, "global_step": 266484, "epoch": 2202} {"train_loss": -42.78561019897461, "global_step": 266485, "epoch": 2202} {"train_loss": -39.53547286987305, "global_step": 266486, "epoch": 2202} {"train_loss": -42.79199981689453, "global_step": 266487, "epoch": 2202} {"train_loss": -41.38337326049805, "global_step": 266488, "epoch": 2202} {"train_loss": -42.690982818603516, "global_step": 266489, "epoch": 2202} {"train_loss": -42.823760986328125, "global_step": 266490, "epoch": 2202} {"train_loss": -40.59534454345703, "global_step": 266491, "epoch": 2202} {"train_loss": -42.74882507324219, "global_step": 266492, "epoch": 2202} {"train_loss": -42.55849838256836, "global_step": 266493, "epoch": 2202} {"train_loss": -42.68846130371094, "global_step": 266494, "epoch": 2202} {"train_loss": -43.04759216308594, "global_step": 266495, "epoch": 2202} {"train_loss": -42.16948318481445, "global_step": 266496, "epoch": 2202} {"train_loss": -42.50368118286133, "global_step": 266497, "epoch": 2202} {"train_loss": -41.604915618896484, "global_step": 266498, "epoch": 2202} {"train_loss": -41.537261962890625, "global_step": 266499, "epoch": 2202} {"train_loss": -42.03973388671875, "global_step": 266500, "epoch": 2202} {"train_loss": -42.49555587768555, "global_step": 266501, "epoch": 2202} {"train_loss": -41.454158782958984, "global_step": 266502, "epoch": 2202} {"train_loss": -43.04779052734375, "global_step": 266503, "epoch": 2202} {"train_loss": -42.413368225097656, "global_step": 266504, "epoch": 2202} {"train_loss": -41.9449348449707, "global_step": 266505, "epoch": 2202} {"train_loss": -38.35390853881836, "global_step": 266506, "epoch": 2202} {"train_loss": -42.636409759521484, "global_step": 266507, "epoch": 2202} {"train_loss": -42.4049186706543, "global_step": 266508, "epoch": 2202} {"train_loss": -42.30601119995117, "global_step": 266509, "epoch": 2202} {"train_loss": -43.018707275390625, "global_step": 266510, "epoch": 2202} {"train_loss": -42.61692428588867, "global_step": 266511, "epoch": 2202} {"train_loss": -42.495086669921875, "global_step": 266512, "epoch": 2202} {"train_loss": -42.2786750793457, "global_step": 266513, "epoch": 2202} {"train_loss": -42.96405792236328, "global_step": 266514, "epoch": 2202} {"train_loss": -43.379329681396484, "global_step": 266515, "epoch": 2202} {"train_loss": -42.391136169433594, "global_step": 266516, "epoch": 2202} {"train_loss": -43.32908248901367, "global_step": 266517, "epoch": 2202} {"train_loss": -43.133235931396484, "global_step": 266518, "epoch": 2202} {"train_loss": -42.79248046875, "global_step": 266519, "epoch": 2202} {"train_loss": -43.00225830078125, "global_step": 266520, "epoch": 2202} {"train_loss": -42.56758117675781, "global_step": 266521, "epoch": 2202} {"train_loss": -43.38624954223633, "global_step": 266522, "epoch": 2202} {"train_loss": -43.21586990356445, "global_step": 266523, "epoch": 2202} {"train_loss": -42.795005798339844, "global_step": 266524, "epoch": 2202} {"train_loss": -43.23125076293945, "global_step": 266525, "epoch": 2202} {"train_loss": -42.025150299072266, "global_step": 266526, "epoch": 2202} {"train_loss": -43.63661575317383, "global_step": 266527, "epoch": 2202} {"train_loss": -40.9278564453125, "global_step": 266528, "epoch": 2202} {"train_loss": -43.638668060302734, "global_step": 266529, "epoch": 2202} {"train_loss": -43.44865798950195, "global_step": 266530, "epoch": 2202} {"train_loss": -42.949459075927734, "global_step": 266531, "epoch": 2202} {"train_loss": -43.382080078125, "global_step": 266532, "epoch": 2202} {"train_loss": -43.64905548095703, "global_step": 266533, "epoch": 2202} {"train_loss": -43.658695220947266, "global_step": 266534, "epoch": 2202} {"train_loss": -43.84471130371094, "global_step": 266535, "epoch": 2202} {"train_loss": -43.48666000366211, "global_step": 266536, "epoch": 2202} {"train_loss": -44.052223205566406, "global_step": 266537, "epoch": 2202} {"train_loss": -43.163047790527344, "global_step": 266538, "epoch": 2202} {"train_loss": -43.57582092285156, "global_step": 266539, "epoch": 2202} {"train_loss": -43.90663528442383, "global_step": 266540, "epoch": 2202} {"train_loss": -43.73849105834961, "global_step": 266541, "epoch": 2202} {"train_loss": -43.78496170043945, "global_step": 266542, "epoch": 2202} {"train_loss": -43.493812561035156, "global_step": 266543, "epoch": 2202} {"train_loss": -43.940704345703125, "global_step": 266544, "epoch": 2202} {"train_loss": -43.597938537597656, "global_step": 266545, "epoch": 2202} {"train_loss": -43.66798400878906, "global_step": 266546, "epoch": 2202} {"train_loss": -43.5778694152832, "global_step": 266547, "epoch": 2202} {"train_loss": -43.67084884643555, "global_step": 266548, "epoch": 2202} {"train_loss": -43.63056182861328, "global_step": 266549, "epoch": 2202} {"train_loss": -41.7130012512207, "global_step": 266550, "epoch": 2202} {"train_loss": -41.77582550048828, "global_step": 266551, "epoch": 2202} {"train_loss": -42.30082321166992, "global_step": 266552, "epoch": 2202} {"train_loss": -43.035579681396484, "global_step": 266553, "epoch": 2202} {"train_loss": -43.36911392211914, "global_step": 266554, "epoch": 2202} {"train_loss": -43.42646408081055, "global_step": 266555, "epoch": 2202} {"train_loss": -43.2213020324707, "global_step": 266556, "epoch": 2202} {"train_loss": -42.59170150756836, "global_step": 266557, "epoch": 2202} {"train_loss": -42.262638092041016, "global_step": 266558, "epoch": 2202} {"train_loss": -41.85506820678711, "global_step": 266559, "epoch": 2202} {"train_loss": -43.46833038330078, "global_step": 266560, "epoch": 2202} {"train_loss": -42.754302978515625, "global_step": 266561, "epoch": 2202} {"train_loss": -42.18052198867167, "global_step": 266562, "epoch": 2202, "val_loss": 2658670.75} {"train_loss": -43.287025451660156, "global_step": 266563, "epoch": 2203} {"train_loss": -43.43212890625, "global_step": 266564, "epoch": 2203} {"train_loss": -43.3121223449707, "global_step": 266565, "epoch": 2203} {"train_loss": -43.84632110595703, "global_step": 266566, "epoch": 2203} {"train_loss": -43.12773513793945, "global_step": 266567, "epoch": 2203} {"train_loss": -41.68818283081055, "global_step": 266568, "epoch": 2203} {"train_loss": -41.41973876953125, "global_step": 266569, "epoch": 2203} {"train_loss": -41.653526306152344, "global_step": 266570, "epoch": 2203} {"train_loss": -42.42653274536133, "global_step": 266571, "epoch": 2203} {"train_loss": -43.134857177734375, "global_step": 266572, "epoch": 2203} {"train_loss": -41.80576705932617, "global_step": 266573, "epoch": 2203} {"train_loss": -42.134090423583984, "global_step": 266574, "epoch": 2203} {"train_loss": -42.61650848388672, "global_step": 266575, "epoch": 2203} {"train_loss": -41.996063232421875, "global_step": 266576, "epoch": 2203} {"train_loss": -42.81095504760742, "global_step": 266577, "epoch": 2203} {"train_loss": -42.068634033203125, "global_step": 266578, "epoch": 2203} {"train_loss": -40.86872863769531, "global_step": 266579, "epoch": 2203} {"train_loss": -42.515201568603516, "global_step": 266580, "epoch": 2203} {"train_loss": -42.74021911621094, "global_step": 266581, "epoch": 2203} {"train_loss": -41.69652557373047, "global_step": 266582, "epoch": 2203} {"train_loss": -38.14434051513672, "global_step": 266583, "epoch": 2203} {"train_loss": -39.3458366394043, "global_step": 266584, "epoch": 2203} {"train_loss": -39.842952728271484, "global_step": 266585, "epoch": 2203} {"train_loss": -40.76933288574219, "global_step": 266586, "epoch": 2203} {"train_loss": -41.73397445678711, "global_step": 266587, "epoch": 2203} {"train_loss": -39.76131820678711, "global_step": 266588, "epoch": 2203} {"train_loss": -41.904815673828125, "global_step": 266589, "epoch": 2203} {"train_loss": -41.31822967529297, "global_step": 266590, "epoch": 2203} {"train_loss": -40.93684005737305, "global_step": 266591, "epoch": 2203} {"train_loss": -40.48097610473633, "global_step": 266592, "epoch": 2203} {"train_loss": -40.417720794677734, "global_step": 266593, "epoch": 2203} {"train_loss": -41.57338333129883, "global_step": 266594, "epoch": 2203} {"train_loss": -41.750370025634766, "global_step": 266595, "epoch": 2203} {"train_loss": -41.48381423950195, "global_step": 266596, "epoch": 2203} {"train_loss": -41.281105041503906, "global_step": 266597, "epoch": 2203} {"train_loss": -40.85639572143555, "global_step": 266598, "epoch": 2203} {"train_loss": -41.882720947265625, "global_step": 266599, "epoch": 2203} {"train_loss": -40.41841125488281, "global_step": 266600, "epoch": 2203} {"train_loss": -42.90623092651367, "global_step": 266601, "epoch": 2203} {"train_loss": -38.72093200683594, "global_step": 266602, "epoch": 2203} {"train_loss": -42.173736572265625, "global_step": 266603, "epoch": 2203} {"train_loss": -39.91508102416992, "global_step": 266604, "epoch": 2203} {"train_loss": -41.30746078491211, "global_step": 266605, "epoch": 2203} {"train_loss": -41.594017028808594, "global_step": 266606, "epoch": 2203} {"train_loss": -40.87058639526367, "global_step": 266607, "epoch": 2203} {"train_loss": -41.945369720458984, "global_step": 266608, "epoch": 2203} {"train_loss": -40.05144119262695, "global_step": 266609, "epoch": 2203} {"train_loss": -41.76176834106445, "global_step": 266610, "epoch": 2203} {"train_loss": -40.35512161254883, "global_step": 266611, "epoch": 2203} {"train_loss": -40.93136215209961, "global_step": 266612, "epoch": 2203} {"train_loss": -38.4136848449707, "global_step": 266613, "epoch": 2203} {"train_loss": -40.538848876953125, "global_step": 266614, "epoch": 2203} {"train_loss": -39.8291130065918, "global_step": 266615, "epoch": 2203} {"train_loss": -40.04308319091797, "global_step": 266616, "epoch": 2203} {"train_loss": -41.14645004272461, "global_step": 266617, "epoch": 2203} {"train_loss": -40.851070404052734, "global_step": 266618, "epoch": 2203} {"train_loss": -42.5075569152832, "global_step": 266619, "epoch": 2203} {"train_loss": -40.529335021972656, "global_step": 266620, "epoch": 2203} {"train_loss": -42.71841049194336, "global_step": 266621, "epoch": 2203} {"train_loss": -41.69036865234375, "global_step": 266622, "epoch": 2203} {"train_loss": -42.62627029418945, "global_step": 266623, "epoch": 2203} {"train_loss": -41.95266342163086, "global_step": 266624, "epoch": 2203} {"train_loss": -42.34531784057617, "global_step": 266625, "epoch": 2203} {"train_loss": -43.33689880371094, "global_step": 266626, "epoch": 2203} {"train_loss": -42.62551498413086, "global_step": 266627, "epoch": 2203} {"train_loss": -42.88874053955078, "global_step": 266628, "epoch": 2203} {"train_loss": -41.98489761352539, "global_step": 266629, "epoch": 2203} {"train_loss": -43.20706558227539, "global_step": 266630, "epoch": 2203} {"train_loss": -42.225616455078125, "global_step": 266631, "epoch": 2203} {"train_loss": -43.112152099609375, "global_step": 266632, "epoch": 2203} {"train_loss": -43.17438507080078, "global_step": 266633, "epoch": 2203} {"train_loss": -42.86684036254883, "global_step": 266634, "epoch": 2203} {"train_loss": -43.596221923828125, "global_step": 266635, "epoch": 2203} {"train_loss": -42.5098762512207, "global_step": 266636, "epoch": 2203} {"train_loss": -43.450469970703125, "global_step": 266637, "epoch": 2203} {"train_loss": -43.103431701660156, "global_step": 266638, "epoch": 2203} {"train_loss": -42.59983444213867, "global_step": 266639, "epoch": 2203} {"train_loss": -43.59917068481445, "global_step": 266640, "epoch": 2203} {"train_loss": -43.488643646240234, "global_step": 266641, "epoch": 2203} {"train_loss": -43.276458740234375, "global_step": 266642, "epoch": 2203} {"train_loss": -43.763729095458984, "global_step": 266643, "epoch": 2203} {"train_loss": -43.50882339477539, "global_step": 266644, "epoch": 2203} {"train_loss": -43.81797409057617, "global_step": 266645, "epoch": 2203} {"train_loss": -43.49406051635742, "global_step": 266646, "epoch": 2203} {"train_loss": -42.97768783569336, "global_step": 266647, "epoch": 2203} {"train_loss": -43.57439041137695, "global_step": 266648, "epoch": 2203} {"train_loss": -43.728973388671875, "global_step": 266649, "epoch": 2203} {"train_loss": -43.62736129760742, "global_step": 266650, "epoch": 2203} {"train_loss": -43.48408889770508, "global_step": 266651, "epoch": 2203} {"train_loss": -44.20893478393555, "global_step": 266652, "epoch": 2203} {"train_loss": -43.08546829223633, "global_step": 266653, "epoch": 2203} {"train_loss": -43.935211181640625, "global_step": 266654, "epoch": 2203} {"train_loss": -43.937740325927734, "global_step": 266655, "epoch": 2203} {"train_loss": -44.03212356567383, "global_step": 266656, "epoch": 2203} {"train_loss": -44.10860061645508, "global_step": 266657, "epoch": 2203} {"train_loss": -43.588924407958984, "global_step": 266658, "epoch": 2203} {"train_loss": -44.118682861328125, "global_step": 266659, "epoch": 2203} {"train_loss": -43.931495666503906, "global_step": 266660, "epoch": 2203} {"train_loss": -44.03857421875, "global_step": 266661, "epoch": 2203} {"train_loss": -44.23042678833008, "global_step": 266662, "epoch": 2203} {"train_loss": -44.08395004272461, "global_step": 266663, "epoch": 2203} {"train_loss": -44.13648223876953, "global_step": 266664, "epoch": 2203} {"train_loss": -43.063072204589844, "global_step": 266665, "epoch": 2203} {"train_loss": -43.95322036743164, "global_step": 266666, "epoch": 2203} {"train_loss": -44.07047653198242, "global_step": 266667, "epoch": 2203} {"train_loss": -44.50758743286133, "global_step": 266668, "epoch": 2203} {"train_loss": -43.702457427978516, "global_step": 266669, "epoch": 2203} {"train_loss": -44.340755462646484, "global_step": 266670, "epoch": 2203} {"train_loss": -44.092586517333984, "global_step": 266671, "epoch": 2203} {"train_loss": -44.490089416503906, "global_step": 266672, "epoch": 2203} {"train_loss": -44.40482711791992, "global_step": 266673, "epoch": 2203} {"train_loss": -43.555908203125, "global_step": 266674, "epoch": 2203} {"train_loss": -44.529293060302734, "global_step": 266675, "epoch": 2203} {"train_loss": -44.31730651855469, "global_step": 266676, "epoch": 2203} {"train_loss": -44.41520309448242, "global_step": 266677, "epoch": 2203} {"train_loss": -44.30074691772461, "global_step": 266678, "epoch": 2203} {"train_loss": -44.01750564575195, "global_step": 266679, "epoch": 2203} {"train_loss": -44.391387939453125, "global_step": 266680, "epoch": 2203} {"train_loss": -44.2735595703125, "global_step": 266681, "epoch": 2203} {"train_loss": -44.163631439208984, "global_step": 266682, "epoch": 2203} {"train_loss": -42.506408722932676, "global_step": 266683, "epoch": 2203, "val_loss": 2654780.25} {"train_loss": -43.986629486083984, "global_step": 266684, "epoch": 2204} {"train_loss": -43.673484802246094, "global_step": 266685, "epoch": 2204} {"train_loss": -44.070796966552734, "global_step": 266686, "epoch": 2204} {"train_loss": -44.397457122802734, "global_step": 266687, "epoch": 2204} {"train_loss": -44.32718276977539, "global_step": 266688, "epoch": 2204} {"train_loss": -44.295101165771484, "global_step": 266689, "epoch": 2204} {"train_loss": -44.352012634277344, "global_step": 266690, "epoch": 2204} {"train_loss": -43.689979553222656, "global_step": 266691, "epoch": 2204} {"train_loss": -44.00486373901367, "global_step": 266692, "epoch": 2204} {"train_loss": -44.57817459106445, "global_step": 266693, "epoch": 2204} {"train_loss": -43.18233108520508, "global_step": 266694, "epoch": 2204} {"train_loss": -41.7368049621582, "global_step": 266695, "epoch": 2204} {"train_loss": -41.009395599365234, "global_step": 266696, "epoch": 2204} {"train_loss": -41.870582580566406, "global_step": 266697, "epoch": 2204} {"train_loss": -40.64552307128906, "global_step": 266698, "epoch": 2204} {"train_loss": -41.15131759643555, "global_step": 266699, "epoch": 2204} {"train_loss": -43.2575569152832, "global_step": 266700, "epoch": 2204} {"train_loss": -41.4783821105957, "global_step": 266701, "epoch": 2204} {"train_loss": -38.6530647277832, "global_step": 266702, "epoch": 2204} {"train_loss": -42.56466293334961, "global_step": 266703, "epoch": 2204} {"train_loss": -34.3538932800293, "global_step": 266704, "epoch": 2204} {"train_loss": -22.345991134643555, "global_step": 266705, "epoch": 2204} {"train_loss": -7.250907897949219, "global_step": 266706, "epoch": 2204} {"train_loss": -24.20356559753418, "global_step": 266707, "epoch": 2204} {"train_loss": -16.017044067382812, "global_step": 266708, "epoch": 2204} {"train_loss": -31.290258407592773, "global_step": 266709, "epoch": 2204} {"train_loss": -21.861618041992188, "global_step": 266710, "epoch": 2204} {"train_loss": -25.60700798034668, "global_step": 266711, "epoch": 2204} {"train_loss": -32.689998626708984, "global_step": 266712, "epoch": 2204} {"train_loss": -27.36847496032715, "global_step": 266713, "epoch": 2204} {"train_loss": -28.8866024017334, "global_step": 266714, "epoch": 2204} {"train_loss": -33.61061477661133, "global_step": 266715, "epoch": 2204} {"train_loss": -31.11146354675293, "global_step": 266716, "epoch": 2204} {"train_loss": -29.10352897644043, "global_step": 266717, "epoch": 2204} {"train_loss": -33.76466751098633, "global_step": 266718, "epoch": 2204} {"train_loss": -33.77741622924805, "global_step": 266719, "epoch": 2204} {"train_loss": -32.24821090698242, "global_step": 266720, "epoch": 2204} {"train_loss": -32.90924072265625, "global_step": 266721, "epoch": 2204} {"train_loss": -34.124820709228516, "global_step": 266722, "epoch": 2204} {"train_loss": -34.43410873413086, "global_step": 266723, "epoch": 2204} {"train_loss": -33.87743377685547, "global_step": 266724, "epoch": 2204} {"train_loss": -34.337894439697266, "global_step": 266725, "epoch": 2204} {"train_loss": -35.378421783447266, "global_step": 266726, "epoch": 2204} {"train_loss": -36.134864807128906, "global_step": 266727, "epoch": 2204} {"train_loss": -35.462371826171875, "global_step": 266728, "epoch": 2204} {"train_loss": -35.547584533691406, "global_step": 266729, "epoch": 2204} {"train_loss": -35.92938232421875, "global_step": 266730, "epoch": 2204} {"train_loss": -36.231971740722656, "global_step": 266731, "epoch": 2204} {"train_loss": -36.50394821166992, "global_step": 266732, "epoch": 2204} {"train_loss": -36.58716583251953, "global_step": 266733, "epoch": 2204} {"train_loss": -36.24211120605469, "global_step": 266734, "epoch": 2204} {"train_loss": -37.3702278137207, "global_step": 266735, "epoch": 2204} {"train_loss": -37.577857971191406, "global_step": 266736, "epoch": 2204} {"train_loss": -36.71739959716797, "global_step": 266737, "epoch": 2204} {"train_loss": -36.50553894042969, "global_step": 266738, "epoch": 2204} {"train_loss": -36.94214630126953, "global_step": 266739, "epoch": 2204} {"train_loss": -37.462459564208984, "global_step": 266740, "epoch": 2204} {"train_loss": -37.3187370300293, "global_step": 266741, "epoch": 2204} {"train_loss": -36.925689697265625, "global_step": 266742, "epoch": 2204} {"train_loss": -37.62468338012695, "global_step": 266743, "epoch": 2204} {"train_loss": -37.62685012817383, "global_step": 266744, "epoch": 2204} {"train_loss": -38.05624008178711, "global_step": 266745, "epoch": 2204} {"train_loss": -37.40362548828125, "global_step": 266746, "epoch": 2204} {"train_loss": -37.67992401123047, "global_step": 266747, "epoch": 2204} {"train_loss": -38.48179244995117, "global_step": 266748, "epoch": 2204} {"train_loss": -38.38196563720703, "global_step": 266749, "epoch": 2204} {"train_loss": -38.367984771728516, "global_step": 266750, "epoch": 2204} {"train_loss": -37.971065521240234, "global_step": 266751, "epoch": 2204} {"train_loss": -38.399505615234375, "global_step": 266752, "epoch": 2204} {"train_loss": -38.311744689941406, "global_step": 266753, "epoch": 2204} {"train_loss": -37.91288757324219, "global_step": 266754, "epoch": 2204} {"train_loss": -38.70435333251953, "global_step": 266755, "epoch": 2204} {"train_loss": -38.97465133666992, "global_step": 266756, "epoch": 2204} {"train_loss": -38.42903518676758, "global_step": 266757, "epoch": 2204} {"train_loss": -39.16109848022461, "global_step": 266758, "epoch": 2204} {"train_loss": -38.67087173461914, "global_step": 266759, "epoch": 2204} {"train_loss": -38.26002502441406, "global_step": 266760, "epoch": 2204} {"train_loss": -38.42107009887695, "global_step": 266761, "epoch": 2204} {"train_loss": -38.68505096435547, "global_step": 266762, "epoch": 2204} {"train_loss": -39.05078125, "global_step": 266763, "epoch": 2204} {"train_loss": -38.89503479003906, "global_step": 266764, "epoch": 2204} {"train_loss": -38.700225830078125, "global_step": 266765, "epoch": 2204} {"train_loss": -38.80827713012695, "global_step": 266766, "epoch": 2204} {"train_loss": -39.079036712646484, "global_step": 266767, "epoch": 2204} {"train_loss": -39.294673919677734, "global_step": 266768, "epoch": 2204} {"train_loss": -39.074520111083984, "global_step": 266769, "epoch": 2204} {"train_loss": -39.4909782409668, "global_step": 266770, "epoch": 2204} {"train_loss": -39.239784240722656, "global_step": 266771, "epoch": 2204} {"train_loss": -39.38508605957031, "global_step": 266772, "epoch": 2204} {"train_loss": -39.77549362182617, "global_step": 266773, "epoch": 2204} {"train_loss": -39.71763229370117, "global_step": 266774, "epoch": 2204} {"train_loss": -39.51853561401367, "global_step": 266775, "epoch": 2204} {"train_loss": -39.316646575927734, "global_step": 266776, "epoch": 2204} {"train_loss": -37.656978607177734, "global_step": 266777, "epoch": 2204} {"train_loss": -39.14430618286133, "global_step": 266778, "epoch": 2204} {"train_loss": -39.11083984375, "global_step": 266779, "epoch": 2204} {"train_loss": -39.052894592285156, "global_step": 266780, "epoch": 2204} {"train_loss": -39.88328170776367, "global_step": 266781, "epoch": 2204} {"train_loss": -40.23809814453125, "global_step": 266782, "epoch": 2204} {"train_loss": -39.8431396484375, "global_step": 266783, "epoch": 2204} {"train_loss": -40.218955993652344, "global_step": 266784, "epoch": 2204} {"train_loss": -40.47503662109375, "global_step": 266785, "epoch": 2204} {"train_loss": -39.245784759521484, "global_step": 266786, "epoch": 2204} {"train_loss": -39.05481719970703, "global_step": 266787, "epoch": 2204} {"train_loss": -40.49175262451172, "global_step": 266788, "epoch": 2204} {"train_loss": -38.289119720458984, "global_step": 266789, "epoch": 2204} {"train_loss": -39.876949310302734, "global_step": 266790, "epoch": 2204} {"train_loss": -40.521480560302734, "global_step": 266791, "epoch": 2204} {"train_loss": -40.55707931518555, "global_step": 266792, "epoch": 2204} {"train_loss": -39.79072952270508, "global_step": 266793, "epoch": 2204} {"train_loss": -40.69710922241211, "global_step": 266794, "epoch": 2204} {"train_loss": -40.204471588134766, "global_step": 266795, "epoch": 2204} {"train_loss": -40.289398193359375, "global_step": 266796, "epoch": 2204} {"train_loss": -40.79629135131836, "global_step": 266797, "epoch": 2204} {"train_loss": -40.67229080200195, "global_step": 266798, "epoch": 2204} {"train_loss": -39.057186126708984, "global_step": 266799, "epoch": 2204} {"train_loss": -40.57749938964844, "global_step": 266800, "epoch": 2204} {"train_loss": -40.92258834838867, "global_step": 266801, "epoch": 2204} {"train_loss": -40.62420654296875, "global_step": 266802, "epoch": 2204} {"train_loss": -40.63920211791992, "global_step": 266803, "epoch": 2204} {"train_loss": -37.569632033671226, "global_step": 266804, "epoch": 2204, "val_loss": 2557926.0} {"train_loss": -40.38581466674805, "global_step": 266805, "epoch": 2205} {"train_loss": -40.782283782958984, "global_step": 266806, "epoch": 2205} {"train_loss": -41.10166549682617, "global_step": 266807, "epoch": 2205} {"train_loss": -40.51987075805664, "global_step": 266808, "epoch": 2205} {"train_loss": -40.78998565673828, "global_step": 266809, "epoch": 2205} {"train_loss": -41.12411117553711, "global_step": 266810, "epoch": 2205} {"train_loss": -41.041500091552734, "global_step": 266811, "epoch": 2205} {"train_loss": -41.126060485839844, "global_step": 266812, "epoch": 2205} {"train_loss": -40.87706756591797, "global_step": 266813, "epoch": 2205} {"train_loss": -41.08967208862305, "global_step": 266814, "epoch": 2205} {"train_loss": -41.139854431152344, "global_step": 266815, "epoch": 2205} {"train_loss": -41.199127197265625, "global_step": 266816, "epoch": 2205} {"train_loss": -40.8941650390625, "global_step": 266817, "epoch": 2205} {"train_loss": -41.43058776855469, "global_step": 266818, "epoch": 2205} {"train_loss": -40.65974426269531, "global_step": 266819, "epoch": 2205} {"train_loss": -39.98878860473633, "global_step": 266820, "epoch": 2205} {"train_loss": -40.00244140625, "global_step": 266821, "epoch": 2205} {"train_loss": -40.593910217285156, "global_step": 266822, "epoch": 2205} {"train_loss": -41.32100296020508, "global_step": 266823, "epoch": 2205} {"train_loss": -40.08939743041992, "global_step": 266824, "epoch": 2205} {"train_loss": -39.371253967285156, "global_step": 266825, "epoch": 2205} {"train_loss": -40.609798431396484, "global_step": 266826, "epoch": 2205} {"train_loss": -40.1121711730957, "global_step": 266827, "epoch": 2205} {"train_loss": -40.397216796875, "global_step": 266828, "epoch": 2205} {"train_loss": -40.6941032409668, "global_step": 266829, "epoch": 2205} {"train_loss": -40.45515060424805, "global_step": 266830, "epoch": 2205} {"train_loss": -40.26387405395508, "global_step": 266831, "epoch": 2205} {"train_loss": -40.29648971557617, "global_step": 266832, "epoch": 2205} {"train_loss": -41.71938705444336, "global_step": 266833, "epoch": 2205} {"train_loss": -41.634521484375, "global_step": 266834, "epoch": 2205} {"train_loss": -40.290931701660156, "global_step": 266835, "epoch": 2205} {"train_loss": -40.61513137817383, "global_step": 266836, "epoch": 2205} {"train_loss": -40.857688903808594, "global_step": 266837, "epoch": 2205} {"train_loss": -39.378753662109375, "global_step": 266838, "epoch": 2205} {"train_loss": -40.24599838256836, "global_step": 266839, "epoch": 2205} {"train_loss": -40.53359603881836, "global_step": 266840, "epoch": 2205} {"train_loss": -41.1313591003418, "global_step": 266841, "epoch": 2205} {"train_loss": -41.22241973876953, "global_step": 266842, "epoch": 2205} {"train_loss": -40.9766845703125, "global_step": 266843, "epoch": 2205} {"train_loss": -41.313507080078125, "global_step": 266844, "epoch": 2205} {"train_loss": -41.51131820678711, "global_step": 266845, "epoch": 2205} {"train_loss": -40.0009880065918, "global_step": 266846, "epoch": 2205} {"train_loss": -41.642513275146484, "global_step": 266847, "epoch": 2205} {"train_loss": -40.14624786376953, "global_step": 266848, "epoch": 2205} {"train_loss": -40.25598907470703, "global_step": 266849, "epoch": 2205} {"train_loss": -40.46300506591797, "global_step": 266850, "epoch": 2205} {"train_loss": -40.07399368286133, "global_step": 266851, "epoch": 2205} {"train_loss": -41.57733154296875, "global_step": 266852, "epoch": 2205} {"train_loss": -40.98979568481445, "global_step": 266853, "epoch": 2205} {"train_loss": -41.10860824584961, "global_step": 266854, "epoch": 2205} {"train_loss": -39.4522819519043, "global_step": 266855, "epoch": 2205} {"train_loss": -35.53020095825195, "global_step": 266856, "epoch": 2205} {"train_loss": -36.25253677368164, "global_step": 266857, "epoch": 2205} {"train_loss": -40.94915771484375, "global_step": 266858, "epoch": 2205} {"train_loss": -40.05641174316406, "global_step": 266859, "epoch": 2205} {"train_loss": -39.73322677612305, "global_step": 266860, "epoch": 2205} {"train_loss": -31.3790283203125, "global_step": 266861, "epoch": 2205} {"train_loss": -40.20414733886719, "global_step": 266862, "epoch": 2205} {"train_loss": -41.46940231323242, "global_step": 266863, "epoch": 2205} {"train_loss": -38.12513732910156, "global_step": 266864, "epoch": 2205} {"train_loss": -35.584564208984375, "global_step": 266865, "epoch": 2205} {"train_loss": -34.21552658081055, "global_step": 266866, "epoch": 2205} {"train_loss": -32.20705795288086, "global_step": 266867, "epoch": 2205} {"train_loss": -38.87429428100586, "global_step": 266868, "epoch": 2205} {"train_loss": -37.14432907104492, "global_step": 266869, "epoch": 2205} {"train_loss": -36.425201416015625, "global_step": 266870, "epoch": 2205} {"train_loss": -31.521848678588867, "global_step": 266871, "epoch": 2205} {"train_loss": -37.47004318237305, "global_step": 266872, "epoch": 2205} {"train_loss": -39.52456283569336, "global_step": 266873, "epoch": 2205} {"train_loss": -34.125118255615234, "global_step": 266874, "epoch": 2205} {"train_loss": -37.742218017578125, "global_step": 266875, "epoch": 2205} {"train_loss": -31.76177406311035, "global_step": 266876, "epoch": 2205} {"train_loss": -30.80388832092285, "global_step": 266877, "epoch": 2205} {"train_loss": -37.043922424316406, "global_step": 266878, "epoch": 2205} {"train_loss": -38.431610107421875, "global_step": 266879, "epoch": 2205} {"train_loss": -36.86542892456055, "global_step": 266880, "epoch": 2205} {"train_loss": -34.34031677246094, "global_step": 266881, "epoch": 2205} {"train_loss": -36.9305534362793, "global_step": 266882, "epoch": 2205} {"train_loss": -37.547027587890625, "global_step": 266883, "epoch": 2205} {"train_loss": -36.857177734375, "global_step": 266884, "epoch": 2205} {"train_loss": -37.00197982788086, "global_step": 266885, "epoch": 2205} {"train_loss": -34.82686996459961, "global_step": 266886, "epoch": 2205} {"train_loss": -34.929718017578125, "global_step": 266887, "epoch": 2205} {"train_loss": -36.69636917114258, "global_step": 266888, "epoch": 2205} {"train_loss": -38.46358871459961, "global_step": 266889, "epoch": 2205} {"train_loss": -38.09061813354492, "global_step": 266890, "epoch": 2205} {"train_loss": -38.15263748168945, "global_step": 266891, "epoch": 2205} {"train_loss": -39.64094924926758, "global_step": 266892, "epoch": 2205} {"train_loss": -37.72795486450195, "global_step": 266893, "epoch": 2205} {"train_loss": -37.35024642944336, "global_step": 266894, "epoch": 2205} {"train_loss": -39.41152572631836, "global_step": 266895, "epoch": 2205} {"train_loss": -37.739044189453125, "global_step": 266896, "epoch": 2205} {"train_loss": -38.305763244628906, "global_step": 266897, "epoch": 2205} {"train_loss": -39.87446212768555, "global_step": 266898, "epoch": 2205} {"train_loss": -37.04862594604492, "global_step": 266899, "epoch": 2205} {"train_loss": -39.153202056884766, "global_step": 266900, "epoch": 2205} {"train_loss": -39.11367416381836, "global_step": 266901, "epoch": 2205} {"train_loss": -38.04057693481445, "global_step": 266902, "epoch": 2205} {"train_loss": -38.42776107788086, "global_step": 266903, "epoch": 2205} {"train_loss": -39.7626953125, "global_step": 266904, "epoch": 2205} {"train_loss": -39.07851791381836, "global_step": 266905, "epoch": 2205} {"train_loss": -39.512359619140625, "global_step": 266906, "epoch": 2205} {"train_loss": -39.15676498413086, "global_step": 266907, "epoch": 2205} {"train_loss": -40.414588928222656, "global_step": 266908, "epoch": 2205} {"train_loss": -37.49326705932617, "global_step": 266909, "epoch": 2205} {"train_loss": -38.816009521484375, "global_step": 266910, "epoch": 2205} {"train_loss": -39.45530319213867, "global_step": 266911, "epoch": 2205} {"train_loss": -39.81559371948242, "global_step": 266912, "epoch": 2205} {"train_loss": -39.4788703918457, "global_step": 266913, "epoch": 2205} {"train_loss": -39.67238998413086, "global_step": 266914, "epoch": 2205} {"train_loss": -39.92548370361328, "global_step": 266915, "epoch": 2205} {"train_loss": -40.00192642211914, "global_step": 266916, "epoch": 2205} {"train_loss": -40.60260772705078, "global_step": 266917, "epoch": 2205} {"train_loss": -39.26102828979492, "global_step": 266918, "epoch": 2205} {"train_loss": -40.2262077331543, "global_step": 266919, "epoch": 2205} {"train_loss": -40.23502731323242, "global_step": 266920, "epoch": 2205} {"train_loss": -39.30908203125, "global_step": 266921, "epoch": 2205} {"train_loss": -40.027015686035156, "global_step": 266922, "epoch": 2205} {"train_loss": -40.25309371948242, "global_step": 266923, "epoch": 2205} {"train_loss": -40.201324462890625, "global_step": 266924, "epoch": 2205} {"train_loss": -39.06774844019866, "global_step": 266925, "epoch": 2205, "val_loss": 2739981.75} {"train_loss": -40.27288818359375, "global_step": 266926, "epoch": 2206} {"train_loss": -40.527801513671875, "global_step": 266927, "epoch": 2206} {"train_loss": -41.37881088256836, "global_step": 266928, "epoch": 2206} {"train_loss": -40.47569274902344, "global_step": 266929, "epoch": 2206} {"train_loss": -41.16801834106445, "global_step": 266930, "epoch": 2206} {"train_loss": -40.7558708190918, "global_step": 266931, "epoch": 2206} {"train_loss": -40.03151321411133, "global_step": 266932, "epoch": 2206} {"train_loss": -41.15321731567383, "global_step": 266933, "epoch": 2206} {"train_loss": -40.81380844116211, "global_step": 266934, "epoch": 2206} {"train_loss": -41.7032585144043, "global_step": 266935, "epoch": 2206} {"train_loss": -40.274593353271484, "global_step": 266936, "epoch": 2206} {"train_loss": -41.94861602783203, "global_step": 266937, "epoch": 2206} {"train_loss": -41.105552673339844, "global_step": 266938, "epoch": 2206} {"train_loss": -41.86397933959961, "global_step": 266939, "epoch": 2206} {"train_loss": -41.88762283325195, "global_step": 266940, "epoch": 2206} {"train_loss": -41.55807876586914, "global_step": 266941, "epoch": 2206} {"train_loss": -41.923683166503906, "global_step": 266942, "epoch": 2206} {"train_loss": -42.93445587158203, "global_step": 266943, "epoch": 2206} {"train_loss": -42.28446578979492, "global_step": 266944, "epoch": 2206} {"train_loss": -41.937129974365234, "global_step": 266945, "epoch": 2206} {"train_loss": -41.84939193725586, "global_step": 266946, "epoch": 2206} {"train_loss": -42.58158493041992, "global_step": 266947, "epoch": 2206} {"train_loss": -42.1394157409668, "global_step": 266948, "epoch": 2206} {"train_loss": -42.05967330932617, "global_step": 266949, "epoch": 2206} {"train_loss": -42.24793243408203, "global_step": 266950, "epoch": 2206} {"train_loss": -41.763484954833984, "global_step": 266951, "epoch": 2206} {"train_loss": -42.21516418457031, "global_step": 266952, "epoch": 2206} {"train_loss": -42.70856857299805, "global_step": 266953, "epoch": 2206} {"train_loss": -41.71122360229492, "global_step": 266954, "epoch": 2206} {"train_loss": -42.077308654785156, "global_step": 266955, "epoch": 2206} {"train_loss": -42.78767776489258, "global_step": 266956, "epoch": 2206} {"train_loss": -41.11776351928711, "global_step": 266957, "epoch": 2206} {"train_loss": -42.01002883911133, "global_step": 266958, "epoch": 2206} {"train_loss": -41.10791015625, "global_step": 266959, "epoch": 2206} {"train_loss": -41.20540237426758, "global_step": 266960, "epoch": 2206} {"train_loss": -41.649898529052734, "global_step": 266961, "epoch": 2206} {"train_loss": -41.26343536376953, "global_step": 266962, "epoch": 2206} {"train_loss": -42.29729461669922, "global_step": 266963, "epoch": 2206} {"train_loss": -41.254905700683594, "global_step": 266964, "epoch": 2206} {"train_loss": -41.726318359375, "global_step": 266965, "epoch": 2206} {"train_loss": -41.637081146240234, "global_step": 266966, "epoch": 2206} {"train_loss": -41.79082107543945, "global_step": 266967, "epoch": 2206} {"train_loss": -40.718379974365234, "global_step": 266968, "epoch": 2206} {"train_loss": -41.760555267333984, "global_step": 266969, "epoch": 2206} {"train_loss": -41.3647346496582, "global_step": 266970, "epoch": 2206} {"train_loss": -40.71821975708008, "global_step": 266971, "epoch": 2206} {"train_loss": -42.45186233520508, "global_step": 266972, "epoch": 2206} {"train_loss": -41.26295852661133, "global_step": 266973, "epoch": 2206} {"train_loss": -41.357173919677734, "global_step": 266974, "epoch": 2206} {"train_loss": -42.314369201660156, "global_step": 266975, "epoch": 2206} {"train_loss": -41.423946380615234, "global_step": 266976, "epoch": 2206} {"train_loss": -42.299530029296875, "global_step": 266977, "epoch": 2206} {"train_loss": -40.91083526611328, "global_step": 266978, "epoch": 2206} {"train_loss": -42.298030853271484, "global_step": 266979, "epoch": 2206} {"train_loss": -41.66279220581055, "global_step": 266980, "epoch": 2206} {"train_loss": -41.077415466308594, "global_step": 266981, "epoch": 2206} {"train_loss": -42.51313018798828, "global_step": 266982, "epoch": 2206} {"train_loss": -41.758602142333984, "global_step": 266983, "epoch": 2206} {"train_loss": -41.73981857299805, "global_step": 266984, "epoch": 2206} {"train_loss": -41.98097610473633, "global_step": 266985, "epoch": 2206} {"train_loss": -42.179290771484375, "global_step": 266986, "epoch": 2206} {"train_loss": -42.607574462890625, "global_step": 266987, "epoch": 2206} {"train_loss": -42.08761215209961, "global_step": 266988, "epoch": 2206} {"train_loss": -42.35553741455078, "global_step": 266989, "epoch": 2206} {"train_loss": -42.68305587768555, "global_step": 266990, "epoch": 2206} {"train_loss": -41.305511474609375, "global_step": 266991, "epoch": 2206} {"train_loss": -42.39160919189453, "global_step": 266992, "epoch": 2206} {"train_loss": -41.881656646728516, "global_step": 266993, "epoch": 2206} {"train_loss": -42.75110626220703, "global_step": 266994, "epoch": 2206} {"train_loss": -41.69485092163086, "global_step": 266995, "epoch": 2206} {"train_loss": -42.55912399291992, "global_step": 266996, "epoch": 2206} {"train_loss": -43.125213623046875, "global_step": 266997, "epoch": 2206} {"train_loss": -42.303627014160156, "global_step": 266998, "epoch": 2206} {"train_loss": -42.54644775390625, "global_step": 266999, "epoch": 2206} {"train_loss": -42.76887512207031, "global_step": 267000, "epoch": 2206} {"train_loss": -42.2508659362793, "global_step": 267001, "epoch": 2206} {"train_loss": -42.33559036254883, "global_step": 267002, "epoch": 2206} {"train_loss": -42.21742248535156, "global_step": 267003, "epoch": 2206} {"train_loss": -43.31333541870117, "global_step": 267004, "epoch": 2206} {"train_loss": -42.501861572265625, "global_step": 267005, "epoch": 2206} {"train_loss": -42.81132888793945, "global_step": 267006, "epoch": 2206} {"train_loss": -43.22377014160156, "global_step": 267007, "epoch": 2206} {"train_loss": -42.958648681640625, "global_step": 267008, "epoch": 2206} {"train_loss": -42.72842025756836, "global_step": 267009, "epoch": 2206} {"train_loss": -42.73380661010742, "global_step": 267010, "epoch": 2206} {"train_loss": -43.15162658691406, "global_step": 267011, "epoch": 2206} {"train_loss": -42.416046142578125, "global_step": 267012, "epoch": 2206} {"train_loss": -41.693450927734375, "global_step": 267013, "epoch": 2206} {"train_loss": -42.304019927978516, "global_step": 267014, "epoch": 2206} {"train_loss": -43.51758575439453, "global_step": 267015, "epoch": 2206} {"train_loss": -42.99624252319336, "global_step": 267016, "epoch": 2206} {"train_loss": -43.08102798461914, "global_step": 267017, "epoch": 2206} {"train_loss": -42.85531234741211, "global_step": 267018, "epoch": 2206} {"train_loss": -42.83396911621094, "global_step": 267019, "epoch": 2206} {"train_loss": -43.19218063354492, "global_step": 267020, "epoch": 2206} {"train_loss": -42.297821044921875, "global_step": 267021, "epoch": 2206} {"train_loss": -42.609596252441406, "global_step": 267022, "epoch": 2206} {"train_loss": -42.979000091552734, "global_step": 267023, "epoch": 2206} {"train_loss": -43.648189544677734, "global_step": 267024, "epoch": 2206} {"train_loss": -43.545475006103516, "global_step": 267025, "epoch": 2206} {"train_loss": -43.40376281738281, "global_step": 267026, "epoch": 2206} {"train_loss": -42.03739547729492, "global_step": 267027, "epoch": 2206} {"train_loss": -42.718238830566406, "global_step": 267028, "epoch": 2206} {"train_loss": -42.017913818359375, "global_step": 267029, "epoch": 2206} {"train_loss": -42.529930114746094, "global_step": 267030, "epoch": 2206} {"train_loss": -42.53408432006836, "global_step": 267031, "epoch": 2206} {"train_loss": -41.6646842956543, "global_step": 267032, "epoch": 2206} {"train_loss": -41.871402740478516, "global_step": 267033, "epoch": 2206} {"train_loss": -43.01560592651367, "global_step": 267034, "epoch": 2206} {"train_loss": -41.411231994628906, "global_step": 267035, "epoch": 2206} {"train_loss": -41.68851089477539, "global_step": 267036, "epoch": 2206} {"train_loss": -41.6711540222168, "global_step": 267037, "epoch": 2206} {"train_loss": -41.358211517333984, "global_step": 267038, "epoch": 2206} {"train_loss": -41.811180114746094, "global_step": 267039, "epoch": 2206} {"train_loss": -41.35890579223633, "global_step": 267040, "epoch": 2206} {"train_loss": -42.06818771362305, "global_step": 267041, "epoch": 2206} {"train_loss": -41.39254379272461, "global_step": 267042, "epoch": 2206} {"train_loss": -42.760498046875, "global_step": 267043, "epoch": 2206} {"train_loss": -42.03092575073242, "global_step": 267044, "epoch": 2206} {"train_loss": -41.32259750366211, "global_step": 267045, "epoch": 2206} {"train_loss": -42.02473446554389, "global_step": 267046, "epoch": 2206, "val_loss": 2792175.75} {"train_loss": -41.3078727722168, "global_step": 267047, "epoch": 2207} {"train_loss": -41.50728225708008, "global_step": 267048, "epoch": 2207} {"train_loss": -41.3807373046875, "global_step": 267049, "epoch": 2207} {"train_loss": -41.090919494628906, "global_step": 267050, "epoch": 2207} {"train_loss": -39.988502502441406, "global_step": 267051, "epoch": 2207} {"train_loss": -42.1707878112793, "global_step": 267052, "epoch": 2207} {"train_loss": -39.18316650390625, "global_step": 267053, "epoch": 2207} {"train_loss": -41.830753326416016, "global_step": 267054, "epoch": 2207} {"train_loss": -40.19900131225586, "global_step": 267055, "epoch": 2207} {"train_loss": -40.08491897583008, "global_step": 267056, "epoch": 2207} {"train_loss": -40.750732421875, "global_step": 267057, "epoch": 2207} {"train_loss": -40.66083908081055, "global_step": 267058, "epoch": 2207} {"train_loss": -41.70499038696289, "global_step": 267059, "epoch": 2207} {"train_loss": -40.24408721923828, "global_step": 267060, "epoch": 2207} {"train_loss": -41.203678131103516, "global_step": 267061, "epoch": 2207} {"train_loss": -41.85612869262695, "global_step": 267062, "epoch": 2207} {"train_loss": -41.2115592956543, "global_step": 267063, "epoch": 2207} {"train_loss": -41.608341217041016, "global_step": 267064, "epoch": 2207} {"train_loss": -41.81386947631836, "global_step": 267065, "epoch": 2207} {"train_loss": -41.130531311035156, "global_step": 267066, "epoch": 2207} {"train_loss": -42.365692138671875, "global_step": 267067, "epoch": 2207} {"train_loss": -41.37377166748047, "global_step": 267068, "epoch": 2207} {"train_loss": -42.417659759521484, "global_step": 267069, "epoch": 2207} {"train_loss": -41.77169418334961, "global_step": 267070, "epoch": 2207} {"train_loss": -42.40176010131836, "global_step": 267071, "epoch": 2207} {"train_loss": -41.80873489379883, "global_step": 267072, "epoch": 2207} {"train_loss": -42.02528762817383, "global_step": 267073, "epoch": 2207} {"train_loss": -41.468929290771484, "global_step": 267074, "epoch": 2207} {"train_loss": -42.45815658569336, "global_step": 267075, "epoch": 2207} {"train_loss": -42.14688491821289, "global_step": 267076, "epoch": 2207} {"train_loss": -41.94337463378906, "global_step": 267077, "epoch": 2207} {"train_loss": -41.860198974609375, "global_step": 267078, "epoch": 2207} {"train_loss": -42.49512481689453, "global_step": 267079, "epoch": 2207} {"train_loss": -41.04326629638672, "global_step": 267080, "epoch": 2207} {"train_loss": -41.81075668334961, "global_step": 267081, "epoch": 2207} {"train_loss": -42.30638885498047, "global_step": 267082, "epoch": 2207} {"train_loss": -42.15285873413086, "global_step": 267083, "epoch": 2207} {"train_loss": -42.3942985534668, "global_step": 267084, "epoch": 2207} {"train_loss": -42.678775787353516, "global_step": 267085, "epoch": 2207} {"train_loss": -42.92888259887695, "global_step": 267086, "epoch": 2207} {"train_loss": -42.319969177246094, "global_step": 267087, "epoch": 2207} {"train_loss": -42.211273193359375, "global_step": 267088, "epoch": 2207} {"train_loss": -43.090782165527344, "global_step": 267089, "epoch": 2207} {"train_loss": -41.9714469909668, "global_step": 267090, "epoch": 2207} {"train_loss": -42.48697280883789, "global_step": 267091, "epoch": 2207} {"train_loss": -42.409889221191406, "global_step": 267092, "epoch": 2207} {"train_loss": -42.60793685913086, "global_step": 267093, "epoch": 2207} {"train_loss": -43.30896759033203, "global_step": 267094, "epoch": 2207} {"train_loss": -41.69024658203125, "global_step": 267095, "epoch": 2207} {"train_loss": -43.291114807128906, "global_step": 267096, "epoch": 2207} {"train_loss": -41.87237548828125, "global_step": 267097, "epoch": 2207} {"train_loss": -42.4172248840332, "global_step": 267098, "epoch": 2207} {"train_loss": -42.824493408203125, "global_step": 267099, "epoch": 2207} {"train_loss": -41.5290641784668, "global_step": 267100, "epoch": 2207} {"train_loss": -42.99882888793945, "global_step": 267101, "epoch": 2207} {"train_loss": -40.580013275146484, "global_step": 267102, "epoch": 2207} {"train_loss": -42.91997146606445, "global_step": 267103, "epoch": 2207} {"train_loss": -40.99774169921875, "global_step": 267104, "epoch": 2207} {"train_loss": -40.03622817993164, "global_step": 267105, "epoch": 2207} {"train_loss": -41.69572067260742, "global_step": 267106, "epoch": 2207} {"train_loss": -41.01863098144531, "global_step": 267107, "epoch": 2207} {"train_loss": -40.7229118347168, "global_step": 267108, "epoch": 2207} {"train_loss": -41.556114196777344, "global_step": 267109, "epoch": 2207} {"train_loss": -40.740901947021484, "global_step": 267110, "epoch": 2207} {"train_loss": -42.538429260253906, "global_step": 267111, "epoch": 2207} {"train_loss": -39.756282806396484, "global_step": 267112, "epoch": 2207} {"train_loss": -42.27185821533203, "global_step": 267113, "epoch": 2207} {"train_loss": -40.198726654052734, "global_step": 267114, "epoch": 2207} {"train_loss": -40.41946029663086, "global_step": 267115, "epoch": 2207} {"train_loss": -42.05641174316406, "global_step": 267116, "epoch": 2207} {"train_loss": -39.26674270629883, "global_step": 267117, "epoch": 2207} {"train_loss": -40.91645431518555, "global_step": 267118, "epoch": 2207} {"train_loss": -40.60261917114258, "global_step": 267119, "epoch": 2207} {"train_loss": -41.214439392089844, "global_step": 267120, "epoch": 2207} {"train_loss": -41.36237716674805, "global_step": 267121, "epoch": 2207} {"train_loss": -41.06364059448242, "global_step": 267122, "epoch": 2207} {"train_loss": -42.3221435546875, "global_step": 267123, "epoch": 2207} {"train_loss": -41.09408187866211, "global_step": 267124, "epoch": 2207} {"train_loss": -42.3942985534668, "global_step": 267125, "epoch": 2207} {"train_loss": -40.90328598022461, "global_step": 267126, "epoch": 2207} {"train_loss": -42.291587829589844, "global_step": 267127, "epoch": 2207} {"train_loss": -41.2763786315918, "global_step": 267128, "epoch": 2207} {"train_loss": -42.44757080078125, "global_step": 267129, "epoch": 2207} {"train_loss": -41.80249786376953, "global_step": 267130, "epoch": 2207} {"train_loss": -43.3642578125, "global_step": 267131, "epoch": 2207} {"train_loss": -41.6810188293457, "global_step": 267132, "epoch": 2207} {"train_loss": -42.64668655395508, "global_step": 267133, "epoch": 2207} {"train_loss": -40.91168975830078, "global_step": 267134, "epoch": 2207} {"train_loss": -41.66135787963867, "global_step": 267135, "epoch": 2207} {"train_loss": -41.4912109375, "global_step": 267136, "epoch": 2207} {"train_loss": -41.31120681762695, "global_step": 267137, "epoch": 2207} {"train_loss": -42.743099212646484, "global_step": 267138, "epoch": 2207} {"train_loss": -40.480281829833984, "global_step": 267139, "epoch": 2207} {"train_loss": -41.47880172729492, "global_step": 267140, "epoch": 2207} {"train_loss": -40.24502182006836, "global_step": 267141, "epoch": 2207} {"train_loss": -40.23688507080078, "global_step": 267142, "epoch": 2207} {"train_loss": -40.71750259399414, "global_step": 267143, "epoch": 2207} {"train_loss": -41.435707092285156, "global_step": 267144, "epoch": 2207} {"train_loss": -39.51538848876953, "global_step": 267145, "epoch": 2207} {"train_loss": -41.203094482421875, "global_step": 267146, "epoch": 2207} {"train_loss": -41.296485900878906, "global_step": 267147, "epoch": 2207} {"train_loss": -40.4036979675293, "global_step": 267148, "epoch": 2207} {"train_loss": -42.30460739135742, "global_step": 267149, "epoch": 2207} {"train_loss": -40.843299865722656, "global_step": 267150, "epoch": 2207} {"train_loss": -42.26542282104492, "global_step": 267151, "epoch": 2207} {"train_loss": -41.5952262878418, "global_step": 267152, "epoch": 2207} {"train_loss": -41.06336212158203, "global_step": 267153, "epoch": 2207} {"train_loss": -41.64680099487305, "global_step": 267154, "epoch": 2207} {"train_loss": -42.94080352783203, "global_step": 267155, "epoch": 2207} {"train_loss": -42.019073486328125, "global_step": 267156, "epoch": 2207} {"train_loss": -41.658973693847656, "global_step": 267157, "epoch": 2207} {"train_loss": -39.893402099609375, "global_step": 267158, "epoch": 2207} {"train_loss": -42.54987335205078, "global_step": 267159, "epoch": 2207} {"train_loss": -40.823482513427734, "global_step": 267160, "epoch": 2207} {"train_loss": -41.2191276550293, "global_step": 267161, "epoch": 2207} {"train_loss": -41.60859680175781, "global_step": 267162, "epoch": 2207} {"train_loss": -40.42612838745117, "global_step": 267163, "epoch": 2207} {"train_loss": -41.954105377197266, "global_step": 267164, "epoch": 2207} {"train_loss": -40.95634078979492, "global_step": 267165, "epoch": 2207} {"train_loss": -42.25608444213867, "global_step": 267166, "epoch": 2207} {"train_loss": -41.550395650311934, "global_step": 267167, "epoch": 2207, "val_loss": 2756886.0} {"train_loss": -41.9248046875, "global_step": 267168, "epoch": 2208} {"train_loss": -41.92155838012695, "global_step": 267169, "epoch": 2208} {"train_loss": -42.12451934814453, "global_step": 267170, "epoch": 2208} {"train_loss": -41.756587982177734, "global_step": 267171, "epoch": 2208} {"train_loss": -42.43726348876953, "global_step": 267172, "epoch": 2208} {"train_loss": -42.28269577026367, "global_step": 267173, "epoch": 2208} {"train_loss": -41.84524154663086, "global_step": 267174, "epoch": 2208} {"train_loss": -42.7638053894043, "global_step": 267175, "epoch": 2208} {"train_loss": -42.02649688720703, "global_step": 267176, "epoch": 2208} {"train_loss": -41.39262008666992, "global_step": 267177, "epoch": 2208} {"train_loss": -42.68528366088867, "global_step": 267178, "epoch": 2208} {"train_loss": -41.84664535522461, "global_step": 267179, "epoch": 2208} {"train_loss": -42.38627624511719, "global_step": 267180, "epoch": 2208} {"train_loss": -41.86346435546875, "global_step": 267181, "epoch": 2208} {"train_loss": -42.97309494018555, "global_step": 267182, "epoch": 2208} {"train_loss": -41.79313659667969, "global_step": 267183, "epoch": 2208} {"train_loss": -41.58777618408203, "global_step": 267184, "epoch": 2208} {"train_loss": -42.50568389892578, "global_step": 267185, "epoch": 2208} {"train_loss": -43.201107025146484, "global_step": 267186, "epoch": 2208} {"train_loss": -43.27971267700195, "global_step": 267187, "epoch": 2208} {"train_loss": -42.2413444519043, "global_step": 267188, "epoch": 2208} {"train_loss": -42.281307220458984, "global_step": 267189, "epoch": 2208} {"train_loss": -42.849300384521484, "global_step": 267190, "epoch": 2208} {"train_loss": -43.29047775268555, "global_step": 267191, "epoch": 2208} {"train_loss": -42.978939056396484, "global_step": 267192, "epoch": 2208} {"train_loss": -43.225379943847656, "global_step": 267193, "epoch": 2208} {"train_loss": -43.05270767211914, "global_step": 267194, "epoch": 2208} {"train_loss": -43.57350540161133, "global_step": 267195, "epoch": 2208} {"train_loss": -43.259273529052734, "global_step": 267196, "epoch": 2208} {"train_loss": -42.99956130981445, "global_step": 267197, "epoch": 2208} {"train_loss": -43.300201416015625, "global_step": 267198, "epoch": 2208} {"train_loss": -43.56187057495117, "global_step": 267199, "epoch": 2208} {"train_loss": -43.3186149597168, "global_step": 267200, "epoch": 2208} {"train_loss": -43.27377700805664, "global_step": 267201, "epoch": 2208} {"train_loss": -43.63528060913086, "global_step": 267202, "epoch": 2208} {"train_loss": -43.764652252197266, "global_step": 267203, "epoch": 2208} {"train_loss": -43.56404495239258, "global_step": 267204, "epoch": 2208} {"train_loss": -43.85691452026367, "global_step": 267205, "epoch": 2208} {"train_loss": -43.84104537963867, "global_step": 267206, "epoch": 2208} {"train_loss": -43.07338333129883, "global_step": 267207, "epoch": 2208} {"train_loss": -44.424156188964844, "global_step": 267208, "epoch": 2208} {"train_loss": -43.332420349121094, "global_step": 267209, "epoch": 2208} {"train_loss": -43.614227294921875, "global_step": 267210, "epoch": 2208} {"train_loss": -43.70780563354492, "global_step": 267211, "epoch": 2208} {"train_loss": -43.70930099487305, "global_step": 267212, "epoch": 2208} {"train_loss": -43.26119613647461, "global_step": 267213, "epoch": 2208} {"train_loss": -43.97421646118164, "global_step": 267214, "epoch": 2208} {"train_loss": -44.13607406616211, "global_step": 267215, "epoch": 2208} {"train_loss": -43.9488525390625, "global_step": 267216, "epoch": 2208} {"train_loss": -44.11583709716797, "global_step": 267217, "epoch": 2208} {"train_loss": -43.65480422973633, "global_step": 267218, "epoch": 2208} {"train_loss": -44.02088165283203, "global_step": 267219, "epoch": 2208} {"train_loss": -43.97550582885742, "global_step": 267220, "epoch": 2208} {"train_loss": -43.442108154296875, "global_step": 267221, "epoch": 2208} {"train_loss": -43.924407958984375, "global_step": 267222, "epoch": 2208} {"train_loss": -43.409420013427734, "global_step": 267223, "epoch": 2208} {"train_loss": -44.18647766113281, "global_step": 267224, "epoch": 2208} {"train_loss": -43.65761184692383, "global_step": 267225, "epoch": 2208} {"train_loss": -44.05137252807617, "global_step": 267226, "epoch": 2208} {"train_loss": -44.181129455566406, "global_step": 267227, "epoch": 2208} {"train_loss": -44.01945877075195, "global_step": 267228, "epoch": 2208} {"train_loss": -42.77432632446289, "global_step": 267229, "epoch": 2208} {"train_loss": -43.43320846557617, "global_step": 267230, "epoch": 2208} {"train_loss": -43.673675537109375, "global_step": 267231, "epoch": 2208} {"train_loss": -42.741912841796875, "global_step": 267232, "epoch": 2208} {"train_loss": -43.20853805541992, "global_step": 267233, "epoch": 2208} {"train_loss": -43.09307861328125, "global_step": 267234, "epoch": 2208} {"train_loss": -42.446075439453125, "global_step": 267235, "epoch": 2208} {"train_loss": -42.113525390625, "global_step": 267236, "epoch": 2208} {"train_loss": -43.05569076538086, "global_step": 267237, "epoch": 2208} {"train_loss": -42.53690719604492, "global_step": 267238, "epoch": 2208} {"train_loss": -42.207881927490234, "global_step": 267239, "epoch": 2208} {"train_loss": -42.884883880615234, "global_step": 267240, "epoch": 2208} {"train_loss": -42.29616165161133, "global_step": 267241, "epoch": 2208} {"train_loss": -42.70987319946289, "global_step": 267242, "epoch": 2208} {"train_loss": -43.25634765625, "global_step": 267243, "epoch": 2208} {"train_loss": -42.529083251953125, "global_step": 267244, "epoch": 2208} {"train_loss": -43.137935638427734, "global_step": 267245, "epoch": 2208} {"train_loss": -42.84624099731445, "global_step": 267246, "epoch": 2208} {"train_loss": -42.901302337646484, "global_step": 267247, "epoch": 2208} {"train_loss": -43.38436508178711, "global_step": 267248, "epoch": 2208} {"train_loss": -42.33481216430664, "global_step": 267249, "epoch": 2208} {"train_loss": -43.449676513671875, "global_step": 267250, "epoch": 2208} {"train_loss": -42.08940887451172, "global_step": 267251, "epoch": 2208} {"train_loss": -42.41627883911133, "global_step": 267252, "epoch": 2208} {"train_loss": -42.49723434448242, "global_step": 267253, "epoch": 2208} {"train_loss": -43.366004943847656, "global_step": 267254, "epoch": 2208} {"train_loss": -43.03153991699219, "global_step": 267255, "epoch": 2208} {"train_loss": -43.348121643066406, "global_step": 267256, "epoch": 2208} {"train_loss": -42.76539611816406, "global_step": 267257, "epoch": 2208} {"train_loss": -42.47774887084961, "global_step": 267258, "epoch": 2208} {"train_loss": -42.32251739501953, "global_step": 267259, "epoch": 2208} {"train_loss": -42.96358871459961, "global_step": 267260, "epoch": 2208} {"train_loss": -42.50651550292969, "global_step": 267261, "epoch": 2208} {"train_loss": -43.50239181518555, "global_step": 267262, "epoch": 2208} {"train_loss": -42.89284133911133, "global_step": 267263, "epoch": 2208} {"train_loss": -42.28421401977539, "global_step": 267264, "epoch": 2208} {"train_loss": -42.726654052734375, "global_step": 267265, "epoch": 2208} {"train_loss": -41.18107223510742, "global_step": 267266, "epoch": 2208} {"train_loss": -43.208648681640625, "global_step": 267267, "epoch": 2208} {"train_loss": -40.64581298828125, "global_step": 267268, "epoch": 2208} {"train_loss": -42.68233871459961, "global_step": 267269, "epoch": 2208} {"train_loss": -39.374141693115234, "global_step": 267270, "epoch": 2208} {"train_loss": -41.53341293334961, "global_step": 267271, "epoch": 2208} {"train_loss": -41.06612014770508, "global_step": 267272, "epoch": 2208} {"train_loss": -39.85456848144531, "global_step": 267273, "epoch": 2208} {"train_loss": -40.19268798828125, "global_step": 267274, "epoch": 2208} {"train_loss": -41.47720718383789, "global_step": 267275, "epoch": 2208} {"train_loss": -39.25054931640625, "global_step": 267276, "epoch": 2208} {"train_loss": -39.701812744140625, "global_step": 267277, "epoch": 2208} {"train_loss": -41.562171936035156, "global_step": 267278, "epoch": 2208} {"train_loss": -39.94248580932617, "global_step": 267279, "epoch": 2208} {"train_loss": -43.34915542602539, "global_step": 267280, "epoch": 2208} {"train_loss": -39.64425277709961, "global_step": 267281, "epoch": 2208} {"train_loss": -42.33512496948242, "global_step": 267282, "epoch": 2208} {"train_loss": -42.320335388183594, "global_step": 267283, "epoch": 2208} {"train_loss": -40.661685943603516, "global_step": 267284, "epoch": 2208} {"train_loss": -41.73960494995117, "global_step": 267285, "epoch": 2208} {"train_loss": -41.0014533996582, "global_step": 267286, "epoch": 2208} {"train_loss": -42.42527389526367, "global_step": 267287, "epoch": 2208} {"train_loss": -42.66167560293655, "global_step": 267288, "epoch": 2208, "val_loss": 2699112.25} {"train_loss": -42.526588439941406, "global_step": 267289, "epoch": 2209} {"train_loss": -42.1953010559082, "global_step": 267290, "epoch": 2209} {"train_loss": -42.95500946044922, "global_step": 267291, "epoch": 2209} {"train_loss": -41.764122009277344, "global_step": 267292, "epoch": 2209} {"train_loss": -41.55442428588867, "global_step": 267293, "epoch": 2209} {"train_loss": -41.3099365234375, "global_step": 267294, "epoch": 2209} {"train_loss": -42.01228713989258, "global_step": 267295, "epoch": 2209} {"train_loss": -43.151119232177734, "global_step": 267296, "epoch": 2209} {"train_loss": -41.97602844238281, "global_step": 267297, "epoch": 2209} {"train_loss": -42.83651351928711, "global_step": 267298, "epoch": 2209} {"train_loss": -42.96621322631836, "global_step": 267299, "epoch": 2209} {"train_loss": -42.073795318603516, "global_step": 267300, "epoch": 2209} {"train_loss": -42.28041458129883, "global_step": 267301, "epoch": 2209} {"train_loss": -41.22488021850586, "global_step": 267302, "epoch": 2209} {"train_loss": -42.23226547241211, "global_step": 267303, "epoch": 2209} {"train_loss": -41.899471282958984, "global_step": 267304, "epoch": 2209} {"train_loss": -42.69009017944336, "global_step": 267305, "epoch": 2209} {"train_loss": -41.556270599365234, "global_step": 267306, "epoch": 2209} {"train_loss": -42.17719268798828, "global_step": 267307, "epoch": 2209} {"train_loss": -41.69118118286133, "global_step": 267308, "epoch": 2209} {"train_loss": -41.17490768432617, "global_step": 267309, "epoch": 2209} {"train_loss": -42.77906036376953, "global_step": 267310, "epoch": 2209} {"train_loss": -40.40715408325195, "global_step": 267311, "epoch": 2209} {"train_loss": -41.42777633666992, "global_step": 267312, "epoch": 2209} {"train_loss": -40.64980697631836, "global_step": 267313, "epoch": 2209} {"train_loss": -41.36045455932617, "global_step": 267314, "epoch": 2209} {"train_loss": -42.02046585083008, "global_step": 267315, "epoch": 2209} {"train_loss": -40.51703643798828, "global_step": 267316, "epoch": 2209} {"train_loss": -42.02694320678711, "global_step": 267317, "epoch": 2209} {"train_loss": -41.7109489440918, "global_step": 267318, "epoch": 2209} {"train_loss": -42.3820915222168, "global_step": 267319, "epoch": 2209} {"train_loss": -43.005123138427734, "global_step": 267320, "epoch": 2209} {"train_loss": -41.8018798828125, "global_step": 267321, "epoch": 2209} {"train_loss": -42.5803337097168, "global_step": 267322, "epoch": 2209} {"train_loss": -42.794857025146484, "global_step": 267323, "epoch": 2209} {"train_loss": -42.188777923583984, "global_step": 267324, "epoch": 2209} {"train_loss": -42.835357666015625, "global_step": 267325, "epoch": 2209} {"train_loss": -42.640228271484375, "global_step": 267326, "epoch": 2209} {"train_loss": -42.02375411987305, "global_step": 267327, "epoch": 2209} {"train_loss": -42.32403564453125, "global_step": 267328, "epoch": 2209} {"train_loss": -42.6077766418457, "global_step": 267329, "epoch": 2209} {"train_loss": -41.54086685180664, "global_step": 267330, "epoch": 2209} {"train_loss": -42.50092315673828, "global_step": 267331, "epoch": 2209} {"train_loss": -42.073638916015625, "global_step": 267332, "epoch": 2209} {"train_loss": -42.3519401550293, "global_step": 267333, "epoch": 2209} {"train_loss": -43.204280853271484, "global_step": 267334, "epoch": 2209} {"train_loss": -41.94391632080078, "global_step": 267335, "epoch": 2209} {"train_loss": -41.23442840576172, "global_step": 267336, "epoch": 2209} {"train_loss": -43.076087951660156, "global_step": 267337, "epoch": 2209} {"train_loss": -41.22335433959961, "global_step": 267338, "epoch": 2209} {"train_loss": -42.87481689453125, "global_step": 267339, "epoch": 2209} {"train_loss": -41.68082046508789, "global_step": 267340, "epoch": 2209} {"train_loss": -41.97986602783203, "global_step": 267341, "epoch": 2209} {"train_loss": -42.04637908935547, "global_step": 267342, "epoch": 2209} {"train_loss": -40.581085205078125, "global_step": 267343, "epoch": 2209} {"train_loss": -42.62760543823242, "global_step": 267344, "epoch": 2209} {"train_loss": -38.565582275390625, "global_step": 267345, "epoch": 2209} {"train_loss": -39.33588790893555, "global_step": 267346, "epoch": 2209} {"train_loss": -38.270198822021484, "global_step": 267347, "epoch": 2209} {"train_loss": -39.163211822509766, "global_step": 267348, "epoch": 2209} {"train_loss": -39.83516311645508, "global_step": 267349, "epoch": 2209} {"train_loss": -40.02976608276367, "global_step": 267350, "epoch": 2209} {"train_loss": -39.48966979980469, "global_step": 267351, "epoch": 2209} {"train_loss": -39.91958236694336, "global_step": 267352, "epoch": 2209} {"train_loss": -40.655677795410156, "global_step": 267353, "epoch": 2209} {"train_loss": -40.76252365112305, "global_step": 267354, "epoch": 2209} {"train_loss": -41.567657470703125, "global_step": 267355, "epoch": 2209} {"train_loss": -41.363101959228516, "global_step": 267356, "epoch": 2209} {"train_loss": -40.42461013793945, "global_step": 267357, "epoch": 2209} {"train_loss": -41.4433708190918, "global_step": 267358, "epoch": 2209} {"train_loss": -41.67316818237305, "global_step": 267359, "epoch": 2209} {"train_loss": -41.76709747314453, "global_step": 267360, "epoch": 2209} {"train_loss": -42.889808654785156, "global_step": 267361, "epoch": 2209} {"train_loss": -42.47700119018555, "global_step": 267362, "epoch": 2209} {"train_loss": -42.674598693847656, "global_step": 267363, "epoch": 2209} {"train_loss": -42.40235137939453, "global_step": 267364, "epoch": 2209} {"train_loss": -42.92243576049805, "global_step": 267365, "epoch": 2209} {"train_loss": -42.70415115356445, "global_step": 267366, "epoch": 2209} {"train_loss": -42.89889144897461, "global_step": 267367, "epoch": 2209} {"train_loss": -42.81084060668945, "global_step": 267368, "epoch": 2209} {"train_loss": -42.48527145385742, "global_step": 267369, "epoch": 2209} {"train_loss": -42.686492919921875, "global_step": 267370, "epoch": 2209} {"train_loss": -42.340084075927734, "global_step": 267371, "epoch": 2209} {"train_loss": -41.82654571533203, "global_step": 267372, "epoch": 2209} {"train_loss": -40.90989303588867, "global_step": 267373, "epoch": 2209} {"train_loss": -40.01862716674805, "global_step": 267374, "epoch": 2209} {"train_loss": -42.123043060302734, "global_step": 267375, "epoch": 2209} {"train_loss": -42.570125579833984, "global_step": 267376, "epoch": 2209} {"train_loss": -43.63824462890625, "global_step": 267377, "epoch": 2209} {"train_loss": -43.01807403564453, "global_step": 267378, "epoch": 2209} {"train_loss": -42.862388610839844, "global_step": 267379, "epoch": 2209} {"train_loss": -41.6991081237793, "global_step": 267380, "epoch": 2209} {"train_loss": -41.89105224609375, "global_step": 267381, "epoch": 2209} {"train_loss": -43.05106735229492, "global_step": 267382, "epoch": 2209} {"train_loss": -40.67209243774414, "global_step": 267383, "epoch": 2209} {"train_loss": -43.353450775146484, "global_step": 267384, "epoch": 2209} {"train_loss": -42.978084564208984, "global_step": 267385, "epoch": 2209} {"train_loss": -41.62420654296875, "global_step": 267386, "epoch": 2209} {"train_loss": -43.13702392578125, "global_step": 267387, "epoch": 2209} {"train_loss": -42.13090896606445, "global_step": 267388, "epoch": 2209} {"train_loss": -42.64705276489258, "global_step": 267389, "epoch": 2209} {"train_loss": -42.125526428222656, "global_step": 267390, "epoch": 2209} {"train_loss": -42.795101165771484, "global_step": 267391, "epoch": 2209} {"train_loss": -41.370201110839844, "global_step": 267392, "epoch": 2209} {"train_loss": -42.58687210083008, "global_step": 267393, "epoch": 2209} {"train_loss": -42.736270904541016, "global_step": 267394, "epoch": 2209} {"train_loss": -41.263851165771484, "global_step": 267395, "epoch": 2209} {"train_loss": -43.395790100097656, "global_step": 267396, "epoch": 2209} {"train_loss": -42.35304641723633, "global_step": 267397, "epoch": 2209} {"train_loss": -43.12137985229492, "global_step": 267398, "epoch": 2209} {"train_loss": -42.5155143737793, "global_step": 267399, "epoch": 2209} {"train_loss": -43.32823181152344, "global_step": 267400, "epoch": 2209} {"train_loss": -42.551998138427734, "global_step": 267401, "epoch": 2209} {"train_loss": -43.54258346557617, "global_step": 267402, "epoch": 2209} {"train_loss": -42.880775451660156, "global_step": 267403, "epoch": 2209} {"train_loss": -43.008392333984375, "global_step": 267404, "epoch": 2209} {"train_loss": -43.3333740234375, "global_step": 267405, "epoch": 2209} {"train_loss": -43.35626983642578, "global_step": 267406, "epoch": 2209} {"train_loss": -43.45103073120117, "global_step": 267407, "epoch": 2209} {"train_loss": -43.26516342163086, "global_step": 267408, "epoch": 2209} {"train_loss": -42.02908416621941, "global_step": 267409, "epoch": 2209, "val_loss": 2751383.75} {"train_loss": -43.64265823364258, "global_step": 267410, "epoch": 2210} {"train_loss": -43.660701751708984, "global_step": 267411, "epoch": 2210} {"train_loss": -43.17106246948242, "global_step": 267412, "epoch": 2210} {"train_loss": -43.683616638183594, "global_step": 267413, "epoch": 2210} {"train_loss": -43.1521110534668, "global_step": 267414, "epoch": 2210} {"train_loss": -43.54018783569336, "global_step": 267415, "epoch": 2210} {"train_loss": -43.55947494506836, "global_step": 267416, "epoch": 2210} {"train_loss": -43.8731689453125, "global_step": 267417, "epoch": 2210} {"train_loss": -43.75457000732422, "global_step": 267418, "epoch": 2210} {"train_loss": -44.03878402709961, "global_step": 267419, "epoch": 2210} {"train_loss": -43.080440521240234, "global_step": 267420, "epoch": 2210} {"train_loss": -44.14011764526367, "global_step": 267421, "epoch": 2210} {"train_loss": -43.157588958740234, "global_step": 267422, "epoch": 2210} {"train_loss": -43.51546859741211, "global_step": 267423, "epoch": 2210} {"train_loss": -43.05908966064453, "global_step": 267424, "epoch": 2210} {"train_loss": -44.280723571777344, "global_step": 267425, "epoch": 2210} {"train_loss": -43.7364616394043, "global_step": 267426, "epoch": 2210} {"train_loss": -43.600494384765625, "global_step": 267427, "epoch": 2210} {"train_loss": -42.8162727355957, "global_step": 267428, "epoch": 2210} {"train_loss": -44.12075424194336, "global_step": 267429, "epoch": 2210} {"train_loss": -44.339881896972656, "global_step": 267430, "epoch": 2210} {"train_loss": -43.32617950439453, "global_step": 267431, "epoch": 2210} {"train_loss": -42.88853073120117, "global_step": 267432, "epoch": 2210} {"train_loss": -43.81211853027344, "global_step": 267433, "epoch": 2210} {"train_loss": -44.22759246826172, "global_step": 267434, "epoch": 2210} {"train_loss": -43.404327392578125, "global_step": 267435, "epoch": 2210} {"train_loss": -43.9549446105957, "global_step": 267436, "epoch": 2210} {"train_loss": -43.84382247924805, "global_step": 267437, "epoch": 2210} {"train_loss": -43.9893798828125, "global_step": 267438, "epoch": 2210} {"train_loss": -43.79636764526367, "global_step": 267439, "epoch": 2210} {"train_loss": -43.999080657958984, "global_step": 267440, "epoch": 2210} {"train_loss": -43.636695861816406, "global_step": 267441, "epoch": 2210} {"train_loss": -43.43278121948242, "global_step": 267442, "epoch": 2210} {"train_loss": -43.239593505859375, "global_step": 267443, "epoch": 2210} {"train_loss": -43.923301696777344, "global_step": 267444, "epoch": 2210} {"train_loss": -43.50920486450195, "global_step": 267445, "epoch": 2210} {"train_loss": -44.0987663269043, "global_step": 267446, "epoch": 2210} {"train_loss": -43.43796157836914, "global_step": 267447, "epoch": 2210} {"train_loss": -44.02155685424805, "global_step": 267448, "epoch": 2210} {"train_loss": -44.2010383605957, "global_step": 267449, "epoch": 2210} {"train_loss": -43.79975128173828, "global_step": 267450, "epoch": 2210} {"train_loss": -43.18250274658203, "global_step": 267451, "epoch": 2210} {"train_loss": -43.23542022705078, "global_step": 267452, "epoch": 2210} {"train_loss": -42.67789840698242, "global_step": 267453, "epoch": 2210} {"train_loss": -43.80277633666992, "global_step": 267454, "epoch": 2210} {"train_loss": -43.015296936035156, "global_step": 267455, "epoch": 2210} {"train_loss": -43.03019332885742, "global_step": 267456, "epoch": 2210} {"train_loss": -43.55840301513672, "global_step": 267457, "epoch": 2210} {"train_loss": -42.24906539916992, "global_step": 267458, "epoch": 2210} {"train_loss": -43.704402923583984, "global_step": 267459, "epoch": 2210} {"train_loss": -41.94423294067383, "global_step": 267460, "epoch": 2210} {"train_loss": -42.65093994140625, "global_step": 267461, "epoch": 2210} {"train_loss": -43.93170166015625, "global_step": 267462, "epoch": 2210} {"train_loss": -43.7100830078125, "global_step": 267463, "epoch": 2210} {"train_loss": -42.15241622924805, "global_step": 267464, "epoch": 2210} {"train_loss": -43.94112014770508, "global_step": 267465, "epoch": 2210} {"train_loss": -43.181819915771484, "global_step": 267466, "epoch": 2210} {"train_loss": -42.09424591064453, "global_step": 267467, "epoch": 2210} {"train_loss": -43.35664367675781, "global_step": 267468, "epoch": 2210} {"train_loss": -42.36916732788086, "global_step": 267469, "epoch": 2210} {"train_loss": -41.68722152709961, "global_step": 267470, "epoch": 2210} {"train_loss": -42.60561752319336, "global_step": 267471, "epoch": 2210} {"train_loss": -41.68683624267578, "global_step": 267472, "epoch": 2210} {"train_loss": -43.06098937988281, "global_step": 267473, "epoch": 2210} {"train_loss": -42.434486389160156, "global_step": 267474, "epoch": 2210} {"train_loss": -41.5272102355957, "global_step": 267475, "epoch": 2210} {"train_loss": -42.23495101928711, "global_step": 267476, "epoch": 2210} {"train_loss": -42.190032958984375, "global_step": 267477, "epoch": 2210} {"train_loss": -41.73451614379883, "global_step": 267478, "epoch": 2210} {"train_loss": -41.28346252441406, "global_step": 267479, "epoch": 2210} {"train_loss": -42.881439208984375, "global_step": 267480, "epoch": 2210} {"train_loss": -41.25690841674805, "global_step": 267481, "epoch": 2210} {"train_loss": -41.03104782104492, "global_step": 267482, "epoch": 2210} {"train_loss": -41.61124801635742, "global_step": 267483, "epoch": 2210} {"train_loss": -41.21820068359375, "global_step": 267484, "epoch": 2210} {"train_loss": -40.85481262207031, "global_step": 267485, "epoch": 2210} {"train_loss": -41.95418167114258, "global_step": 267486, "epoch": 2210} {"train_loss": -41.2400016784668, "global_step": 267487, "epoch": 2210} {"train_loss": -43.15884780883789, "global_step": 267488, "epoch": 2210} {"train_loss": -42.26267623901367, "global_step": 267489, "epoch": 2210} {"train_loss": -41.396297454833984, "global_step": 267490, "epoch": 2210} {"train_loss": -41.3514404296875, "global_step": 267491, "epoch": 2210} {"train_loss": -42.328678131103516, "global_step": 267492, "epoch": 2210} {"train_loss": -41.72111129760742, "global_step": 267493, "epoch": 2210} {"train_loss": -41.111549377441406, "global_step": 267494, "epoch": 2210} {"train_loss": -43.154754638671875, "global_step": 267495, "epoch": 2210} {"train_loss": -40.64592742919922, "global_step": 267496, "epoch": 2210} {"train_loss": -41.75049591064453, "global_step": 267497, "epoch": 2210} {"train_loss": -42.82662582397461, "global_step": 267498, "epoch": 2210} {"train_loss": -42.534454345703125, "global_step": 267499, "epoch": 2210} {"train_loss": -42.54994201660156, "global_step": 267500, "epoch": 2210} {"train_loss": -41.912418365478516, "global_step": 267501, "epoch": 2210} {"train_loss": -42.53237533569336, "global_step": 267502, "epoch": 2210} {"train_loss": -42.00857925415039, "global_step": 267503, "epoch": 2210} {"train_loss": -42.59757995605469, "global_step": 267504, "epoch": 2210} {"train_loss": -41.6922492980957, "global_step": 267505, "epoch": 2210} {"train_loss": -42.954689025878906, "global_step": 267506, "epoch": 2210} {"train_loss": -43.246124267578125, "global_step": 267507, "epoch": 2210} {"train_loss": -42.78346252441406, "global_step": 267508, "epoch": 2210} {"train_loss": -43.32194137573242, "global_step": 267509, "epoch": 2210} {"train_loss": -42.523006439208984, "global_step": 267510, "epoch": 2210} {"train_loss": -42.8240966796875, "global_step": 267511, "epoch": 2210} {"train_loss": -42.10685729980469, "global_step": 267512, "epoch": 2210} {"train_loss": -43.25038528442383, "global_step": 267513, "epoch": 2210} {"train_loss": -43.36767578125, "global_step": 267514, "epoch": 2210} {"train_loss": -43.461769104003906, "global_step": 267515, "epoch": 2210} {"train_loss": -43.69957733154297, "global_step": 267516, "epoch": 2210} {"train_loss": -42.63834762573242, "global_step": 267517, "epoch": 2210} {"train_loss": -43.31159973144531, "global_step": 267518, "epoch": 2210} {"train_loss": -43.21906661987305, "global_step": 267519, "epoch": 2210} {"train_loss": -43.48317337036133, "global_step": 267520, "epoch": 2210} {"train_loss": -43.445343017578125, "global_step": 267521, "epoch": 2210} {"train_loss": -43.69160842895508, "global_step": 267522, "epoch": 2210} {"train_loss": -43.481285095214844, "global_step": 267523, "epoch": 2210} {"train_loss": -43.21512985229492, "global_step": 267524, "epoch": 2210} {"train_loss": -43.14963912963867, "global_step": 267525, "epoch": 2210} {"train_loss": -42.53432846069336, "global_step": 267526, "epoch": 2210} {"train_loss": -43.1507568359375, "global_step": 267527, "epoch": 2210} {"train_loss": -43.10403823852539, "global_step": 267528, "epoch": 2210} {"train_loss": -43.81325149536133, "global_step": 267529, "epoch": 2210} {"train_loss": -42.95179918777844, "global_step": 267530, "epoch": 2210, "val_loss": 2742316.25} {"train_loss": -42.7128791809082, "global_step": 267531, "epoch": 2211} {"train_loss": -43.61317825317383, "global_step": 267532, "epoch": 2211} {"train_loss": -42.78622055053711, "global_step": 267533, "epoch": 2211} {"train_loss": -44.34589385986328, "global_step": 267534, "epoch": 2211} {"train_loss": -43.74964904785156, "global_step": 267535, "epoch": 2211} {"train_loss": -43.32786178588867, "global_step": 267536, "epoch": 2211} {"train_loss": -42.6937141418457, "global_step": 267537, "epoch": 2211} {"train_loss": -42.97306442260742, "global_step": 267538, "epoch": 2211} {"train_loss": -43.36754608154297, "global_step": 267539, "epoch": 2211} {"train_loss": -43.8747444152832, "global_step": 267540, "epoch": 2211} {"train_loss": -43.32387924194336, "global_step": 267541, "epoch": 2211} {"train_loss": -41.93500518798828, "global_step": 267542, "epoch": 2211} {"train_loss": -43.5354118347168, "global_step": 267543, "epoch": 2211} {"train_loss": -43.96419143676758, "global_step": 267544, "epoch": 2211} {"train_loss": -43.4897346496582, "global_step": 267545, "epoch": 2211} {"train_loss": -42.64737319946289, "global_step": 267546, "epoch": 2211} {"train_loss": -43.85103225708008, "global_step": 267547, "epoch": 2211} {"train_loss": -42.98442459106445, "global_step": 267548, "epoch": 2211} {"train_loss": -43.1778564453125, "global_step": 267549, "epoch": 2211} {"train_loss": -43.147438049316406, "global_step": 267550, "epoch": 2211} {"train_loss": -43.956546783447266, "global_step": 267551, "epoch": 2211} {"train_loss": -42.49404525756836, "global_step": 267552, "epoch": 2211} {"train_loss": -42.354103088378906, "global_step": 267553, "epoch": 2211} {"train_loss": -43.42257308959961, "global_step": 267554, "epoch": 2211} {"train_loss": -40.562320709228516, "global_step": 267555, "epoch": 2211} {"train_loss": -41.918304443359375, "global_step": 267556, "epoch": 2211} {"train_loss": -40.27290725708008, "global_step": 267557, "epoch": 2211} {"train_loss": -42.32866287231445, "global_step": 267558, "epoch": 2211} {"train_loss": -41.32120895385742, "global_step": 267559, "epoch": 2211} {"train_loss": -41.50349044799805, "global_step": 267560, "epoch": 2211} {"train_loss": -42.2805290222168, "global_step": 267561, "epoch": 2211} {"train_loss": -40.34263610839844, "global_step": 267562, "epoch": 2211} {"train_loss": -43.09981918334961, "global_step": 267563, "epoch": 2211} {"train_loss": -40.28774642944336, "global_step": 267564, "epoch": 2211} {"train_loss": -43.001834869384766, "global_step": 267565, "epoch": 2211} {"train_loss": -40.66114807128906, "global_step": 267566, "epoch": 2211} {"train_loss": -41.1391487121582, "global_step": 267567, "epoch": 2211} {"train_loss": -41.86741638183594, "global_step": 267568, "epoch": 2211} {"train_loss": -40.501312255859375, "global_step": 267569, "epoch": 2211} {"train_loss": -41.94171905517578, "global_step": 267570, "epoch": 2211} {"train_loss": -42.40339279174805, "global_step": 267571, "epoch": 2211} {"train_loss": -42.96290969848633, "global_step": 267572, "epoch": 2211} {"train_loss": -42.09735870361328, "global_step": 267573, "epoch": 2211} {"train_loss": -41.96337127685547, "global_step": 267574, "epoch": 2211} {"train_loss": -41.966060638427734, "global_step": 267575, "epoch": 2211} {"train_loss": -41.15858459472656, "global_step": 267576, "epoch": 2211} {"train_loss": -42.868560791015625, "global_step": 267577, "epoch": 2211} {"train_loss": -41.10053634643555, "global_step": 267578, "epoch": 2211} {"train_loss": -40.841712951660156, "global_step": 267579, "epoch": 2211} {"train_loss": -42.61537551879883, "global_step": 267580, "epoch": 2211} {"train_loss": -40.583553314208984, "global_step": 267581, "epoch": 2211} {"train_loss": -43.13296890258789, "global_step": 267582, "epoch": 2211} {"train_loss": -40.235504150390625, "global_step": 267583, "epoch": 2211} {"train_loss": -43.242698669433594, "global_step": 267584, "epoch": 2211} {"train_loss": -41.20212173461914, "global_step": 267585, "epoch": 2211} {"train_loss": -42.51523971557617, "global_step": 267586, "epoch": 2211} {"train_loss": -42.0939826965332, "global_step": 267587, "epoch": 2211} {"train_loss": -42.640262603759766, "global_step": 267588, "epoch": 2211} {"train_loss": -41.62022018432617, "global_step": 267589, "epoch": 2211} {"train_loss": -41.92652130126953, "global_step": 267590, "epoch": 2211} {"train_loss": -42.342689514160156, "global_step": 267591, "epoch": 2211} {"train_loss": -40.73600769042969, "global_step": 267592, "epoch": 2211} {"train_loss": -42.61306381225586, "global_step": 267593, "epoch": 2211} {"train_loss": -42.171363830566406, "global_step": 267594, "epoch": 2211} {"train_loss": -40.763179779052734, "global_step": 267595, "epoch": 2211} {"train_loss": -42.731903076171875, "global_step": 267596, "epoch": 2211} {"train_loss": -42.88766860961914, "global_step": 267597, "epoch": 2211} {"train_loss": -40.82819366455078, "global_step": 267598, "epoch": 2211} {"train_loss": -41.69813537597656, "global_step": 267599, "epoch": 2211} {"train_loss": -41.71181869506836, "global_step": 267600, "epoch": 2211} {"train_loss": -43.062286376953125, "global_step": 267601, "epoch": 2211} {"train_loss": -43.064231872558594, "global_step": 267602, "epoch": 2211} {"train_loss": -43.31258773803711, "global_step": 267603, "epoch": 2211} {"train_loss": -41.95219039916992, "global_step": 267604, "epoch": 2211} {"train_loss": -42.09486770629883, "global_step": 267605, "epoch": 2211} {"train_loss": -43.26263427734375, "global_step": 267606, "epoch": 2211} {"train_loss": -43.18982696533203, "global_step": 267607, "epoch": 2211} {"train_loss": -42.382381439208984, "global_step": 267608, "epoch": 2211} {"train_loss": -42.7728385925293, "global_step": 267609, "epoch": 2211} {"train_loss": -42.92546463012695, "global_step": 267610, "epoch": 2211} {"train_loss": -43.4766960144043, "global_step": 267611, "epoch": 2211} {"train_loss": -42.07474136352539, "global_step": 267612, "epoch": 2211} {"train_loss": -42.50185775756836, "global_step": 267613, "epoch": 2211} {"train_loss": -44.036293029785156, "global_step": 267614, "epoch": 2211} {"train_loss": -42.91050338745117, "global_step": 267615, "epoch": 2211} {"train_loss": -42.538272857666016, "global_step": 267616, "epoch": 2211} {"train_loss": -42.52006912231445, "global_step": 267617, "epoch": 2211} {"train_loss": -42.929466247558594, "global_step": 267618, "epoch": 2211} {"train_loss": -43.3243522644043, "global_step": 267619, "epoch": 2211} {"train_loss": -43.44816970825195, "global_step": 267620, "epoch": 2211} {"train_loss": -42.59322738647461, "global_step": 267621, "epoch": 2211} {"train_loss": -43.70473861694336, "global_step": 267622, "epoch": 2211} {"train_loss": -43.8423957824707, "global_step": 267623, "epoch": 2211} {"train_loss": -43.1939582824707, "global_step": 267624, "epoch": 2211} {"train_loss": -43.9210205078125, "global_step": 267625, "epoch": 2211} {"train_loss": -44.068599700927734, "global_step": 267626, "epoch": 2211} {"train_loss": -43.34666061401367, "global_step": 267627, "epoch": 2211} {"train_loss": -43.80501937866211, "global_step": 267628, "epoch": 2211} {"train_loss": -43.81227493286133, "global_step": 267629, "epoch": 2211} {"train_loss": -43.2476921081543, "global_step": 267630, "epoch": 2211} {"train_loss": -43.85581588745117, "global_step": 267631, "epoch": 2211} {"train_loss": -44.0070915222168, "global_step": 267632, "epoch": 2211} {"train_loss": -43.61479187011719, "global_step": 267633, "epoch": 2211} {"train_loss": -43.86859893798828, "global_step": 267634, "epoch": 2211} {"train_loss": -43.91704559326172, "global_step": 267635, "epoch": 2211} {"train_loss": -44.2233772277832, "global_step": 267636, "epoch": 2211} {"train_loss": -43.5188102722168, "global_step": 267637, "epoch": 2211} {"train_loss": -43.7099609375, "global_step": 267638, "epoch": 2211} {"train_loss": -44.207252502441406, "global_step": 267639, "epoch": 2211} {"train_loss": -43.4904899597168, "global_step": 267640, "epoch": 2211} {"train_loss": -43.60374069213867, "global_step": 267641, "epoch": 2211} {"train_loss": -44.127498626708984, "global_step": 267642, "epoch": 2211} {"train_loss": -42.812557220458984, "global_step": 267643, "epoch": 2211} {"train_loss": -43.15052032470703, "global_step": 267644, "epoch": 2211} {"train_loss": -43.04304504394531, "global_step": 267645, "epoch": 2211} {"train_loss": -43.361534118652344, "global_step": 267646, "epoch": 2211} {"train_loss": -43.74544906616211, "global_step": 267647, "epoch": 2211} {"train_loss": -43.12184143066406, "global_step": 267648, "epoch": 2211} {"train_loss": -43.38239669799805, "global_step": 267649, "epoch": 2211} {"train_loss": -44.07097244262695, "global_step": 267650, "epoch": 2211} {"train_loss": -42.70861611484496, "global_step": 267651, "epoch": 2211, "val_loss": 2755475.25} {"train_loss": -42.764583587646484, "global_step": 267652, "epoch": 2212} {"train_loss": -43.729923248291016, "global_step": 267653, "epoch": 2212} {"train_loss": -43.446353912353516, "global_step": 267654, "epoch": 2212} {"train_loss": -42.165645599365234, "global_step": 267655, "epoch": 2212} {"train_loss": -42.22828674316406, "global_step": 267656, "epoch": 2212} {"train_loss": -42.75567626953125, "global_step": 267657, "epoch": 2212} {"train_loss": -43.375831604003906, "global_step": 267658, "epoch": 2212} {"train_loss": -43.284420013427734, "global_step": 267659, "epoch": 2212} {"train_loss": -42.05459976196289, "global_step": 267660, "epoch": 2212} {"train_loss": -43.4166145324707, "global_step": 267661, "epoch": 2212} {"train_loss": -43.286434173583984, "global_step": 267662, "epoch": 2212} {"train_loss": -43.09725570678711, "global_step": 267663, "epoch": 2212} {"train_loss": -43.99243927001953, "global_step": 267664, "epoch": 2212} {"train_loss": -43.54487609863281, "global_step": 267665, "epoch": 2212} {"train_loss": -43.546043395996094, "global_step": 267666, "epoch": 2212} {"train_loss": -43.779659271240234, "global_step": 267667, "epoch": 2212} {"train_loss": -43.929073333740234, "global_step": 267668, "epoch": 2212} {"train_loss": -43.041358947753906, "global_step": 267669, "epoch": 2212} {"train_loss": -42.89208984375, "global_step": 267670, "epoch": 2212} {"train_loss": -44.03658676147461, "global_step": 267671, "epoch": 2212} {"train_loss": -44.002235412597656, "global_step": 267672, "epoch": 2212} {"train_loss": -43.843929290771484, "global_step": 267673, "epoch": 2212} {"train_loss": -44.085182189941406, "global_step": 267674, "epoch": 2212} {"train_loss": -43.28438949584961, "global_step": 267675, "epoch": 2212} {"train_loss": -44.05134582519531, "global_step": 267676, "epoch": 2212} {"train_loss": -44.39668273925781, "global_step": 267677, "epoch": 2212} {"train_loss": -43.99152755737305, "global_step": 267678, "epoch": 2212} {"train_loss": -43.93351364135742, "global_step": 267679, "epoch": 2212} {"train_loss": -43.38079071044922, "global_step": 267680, "epoch": 2212} {"train_loss": -43.69917297363281, "global_step": 267681, "epoch": 2212} {"train_loss": -43.83376693725586, "global_step": 267682, "epoch": 2212} {"train_loss": -43.846736907958984, "global_step": 267683, "epoch": 2212} {"train_loss": -43.653255462646484, "global_step": 267684, "epoch": 2212} {"train_loss": -43.73786163330078, "global_step": 267685, "epoch": 2212} {"train_loss": -43.32183837890625, "global_step": 267686, "epoch": 2212} {"train_loss": -40.71645736694336, "global_step": 267687, "epoch": 2212} {"train_loss": -41.7794303894043, "global_step": 267688, "epoch": 2212} {"train_loss": -42.12925338745117, "global_step": 267689, "epoch": 2212} {"train_loss": -42.72719192504883, "global_step": 267690, "epoch": 2212} {"train_loss": -42.660396575927734, "global_step": 267691, "epoch": 2212} {"train_loss": -42.77071762084961, "global_step": 267692, "epoch": 2212} {"train_loss": -43.09579849243164, "global_step": 267693, "epoch": 2212} {"train_loss": -43.32500076293945, "global_step": 267694, "epoch": 2212} {"train_loss": -43.42222213745117, "global_step": 267695, "epoch": 2212} {"train_loss": -43.210914611816406, "global_step": 267696, "epoch": 2212} {"train_loss": -43.12083435058594, "global_step": 267697, "epoch": 2212} {"train_loss": -43.294246673583984, "global_step": 267698, "epoch": 2212} {"train_loss": -42.987728118896484, "global_step": 267699, "epoch": 2212} {"train_loss": -43.770263671875, "global_step": 267700, "epoch": 2212} {"train_loss": -42.72319030761719, "global_step": 267701, "epoch": 2212} {"train_loss": -43.47282409667969, "global_step": 267702, "epoch": 2212} {"train_loss": -43.99415969848633, "global_step": 267703, "epoch": 2212} {"train_loss": -42.494503021240234, "global_step": 267704, "epoch": 2212} {"train_loss": -43.5055046081543, "global_step": 267705, "epoch": 2212} {"train_loss": -43.9365348815918, "global_step": 267706, "epoch": 2212} {"train_loss": -42.669898986816406, "global_step": 267707, "epoch": 2212} {"train_loss": -42.863338470458984, "global_step": 267708, "epoch": 2212} {"train_loss": -43.781463623046875, "global_step": 267709, "epoch": 2212} {"train_loss": -43.12960433959961, "global_step": 267710, "epoch": 2212} {"train_loss": -43.712196350097656, "global_step": 267711, "epoch": 2212} {"train_loss": -44.11492919921875, "global_step": 267712, "epoch": 2212} {"train_loss": -43.17824935913086, "global_step": 267713, "epoch": 2212} {"train_loss": -42.84284210205078, "global_step": 267714, "epoch": 2212} {"train_loss": -43.73179244995117, "global_step": 267715, "epoch": 2212} {"train_loss": -44.22538375854492, "global_step": 267716, "epoch": 2212} {"train_loss": -43.56385803222656, "global_step": 267717, "epoch": 2212} {"train_loss": -43.29029083251953, "global_step": 267718, "epoch": 2212} {"train_loss": -43.23380661010742, "global_step": 267719, "epoch": 2212} {"train_loss": -42.88383102416992, "global_step": 267720, "epoch": 2212} {"train_loss": -44.074066162109375, "global_step": 267721, "epoch": 2212} {"train_loss": -43.578060150146484, "global_step": 267722, "epoch": 2212} {"train_loss": -42.92394256591797, "global_step": 267723, "epoch": 2212} {"train_loss": -43.926727294921875, "global_step": 267724, "epoch": 2212} {"train_loss": -43.80794906616211, "global_step": 267725, "epoch": 2212} {"train_loss": -42.334449768066406, "global_step": 267726, "epoch": 2212} {"train_loss": -43.2260856628418, "global_step": 267727, "epoch": 2212} {"train_loss": -41.65376663208008, "global_step": 267728, "epoch": 2212} {"train_loss": -41.74816131591797, "global_step": 267729, "epoch": 2212} {"train_loss": -43.0550422668457, "global_step": 267730, "epoch": 2212} {"train_loss": -40.10692596435547, "global_step": 267731, "epoch": 2212} {"train_loss": -42.14339065551758, "global_step": 267732, "epoch": 2212} {"train_loss": -39.19607162475586, "global_step": 267733, "epoch": 2212} {"train_loss": -43.42633056640625, "global_step": 267734, "epoch": 2212} {"train_loss": -39.97276306152344, "global_step": 267735, "epoch": 2212} {"train_loss": -39.76483917236328, "global_step": 267736, "epoch": 2212} {"train_loss": -39.75284957885742, "global_step": 267737, "epoch": 2212} {"train_loss": -39.39643478393555, "global_step": 267738, "epoch": 2212} {"train_loss": -39.954505920410156, "global_step": 267739, "epoch": 2212} {"train_loss": -39.53581237792969, "global_step": 267740, "epoch": 2212} {"train_loss": -40.6861457824707, "global_step": 267741, "epoch": 2212} {"train_loss": -39.56733703613281, "global_step": 267742, "epoch": 2212} {"train_loss": -39.54876708984375, "global_step": 267743, "epoch": 2212} {"train_loss": -40.50361633300781, "global_step": 267744, "epoch": 2212} {"train_loss": -40.473426818847656, "global_step": 267745, "epoch": 2212} {"train_loss": -39.53738021850586, "global_step": 267746, "epoch": 2212} {"train_loss": -40.723873138427734, "global_step": 267747, "epoch": 2212} {"train_loss": -40.825782775878906, "global_step": 267748, "epoch": 2212} {"train_loss": -40.805599212646484, "global_step": 267749, "epoch": 2212} {"train_loss": -41.5126838684082, "global_step": 267750, "epoch": 2212} {"train_loss": -42.95546340942383, "global_step": 267751, "epoch": 2212} {"train_loss": -41.362728118896484, "global_step": 267752, "epoch": 2212} {"train_loss": -42.996315002441406, "global_step": 267753, "epoch": 2212} {"train_loss": -42.344573974609375, "global_step": 267754, "epoch": 2212} {"train_loss": -40.701148986816406, "global_step": 267755, "epoch": 2212} {"train_loss": -41.440956115722656, "global_step": 267756, "epoch": 2212} {"train_loss": -41.35030746459961, "global_step": 267757, "epoch": 2212} {"train_loss": -41.8217887878418, "global_step": 267758, "epoch": 2212} {"train_loss": -42.61552810668945, "global_step": 267759, "epoch": 2212} {"train_loss": -41.62091064453125, "global_step": 267760, "epoch": 2212} {"train_loss": -42.61857223510742, "global_step": 267761, "epoch": 2212} {"train_loss": -42.381404876708984, "global_step": 267762, "epoch": 2212} {"train_loss": -42.84617233276367, "global_step": 267763, "epoch": 2212} {"train_loss": -42.56876754760742, "global_step": 267764, "epoch": 2212} {"train_loss": -42.10357666015625, "global_step": 267765, "epoch": 2212} {"train_loss": -42.80311965942383, "global_step": 267766, "epoch": 2212} {"train_loss": -42.749324798583984, "global_step": 267767, "epoch": 2212} {"train_loss": -43.06657409667969, "global_step": 267768, "epoch": 2212} {"train_loss": -42.997493743896484, "global_step": 267769, "epoch": 2212} {"train_loss": -42.17176055908203, "global_step": 267770, "epoch": 2212} {"train_loss": -42.42793655395508, "global_step": 267771, "epoch": 2212} {"train_loss": -42.61239062853096, "global_step": 267772, "epoch": 2212, "val_loss": 2734232.0} {"train_loss": -41.07000732421875, "global_step": 267773, "epoch": 2213} {"train_loss": -42.28879928588867, "global_step": 267774, "epoch": 2213} {"train_loss": -43.1434326171875, "global_step": 267775, "epoch": 2213} {"train_loss": -42.22024154663086, "global_step": 267776, "epoch": 2213} {"train_loss": -43.48805618286133, "global_step": 267777, "epoch": 2213} {"train_loss": -42.53922653198242, "global_step": 267778, "epoch": 2213} {"train_loss": -42.88457107543945, "global_step": 267779, "epoch": 2213} {"train_loss": -42.659423828125, "global_step": 267780, "epoch": 2213} {"train_loss": -42.996498107910156, "global_step": 267781, "epoch": 2213} {"train_loss": -42.652523040771484, "global_step": 267782, "epoch": 2213} {"train_loss": -42.87910842895508, "global_step": 267783, "epoch": 2213} {"train_loss": -43.461647033691406, "global_step": 267784, "epoch": 2213} {"train_loss": -43.136688232421875, "global_step": 267785, "epoch": 2213} {"train_loss": -43.635955810546875, "global_step": 267786, "epoch": 2213} {"train_loss": -42.91834259033203, "global_step": 267787, "epoch": 2213} {"train_loss": -43.95401382446289, "global_step": 267788, "epoch": 2213} {"train_loss": -43.65102767944336, "global_step": 267789, "epoch": 2213} {"train_loss": -43.38703155517578, "global_step": 267790, "epoch": 2213} {"train_loss": -43.381507873535156, "global_step": 267791, "epoch": 2213} {"train_loss": -43.795536041259766, "global_step": 267792, "epoch": 2213} {"train_loss": -43.655853271484375, "global_step": 267793, "epoch": 2213} {"train_loss": -43.85296630859375, "global_step": 267794, "epoch": 2213} {"train_loss": -43.89986801147461, "global_step": 267795, "epoch": 2213} {"train_loss": -44.127784729003906, "global_step": 267796, "epoch": 2213} {"train_loss": -43.60276794433594, "global_step": 267797, "epoch": 2213} {"train_loss": -43.65981674194336, "global_step": 267798, "epoch": 2213} {"train_loss": -43.8332633972168, "global_step": 267799, "epoch": 2213} {"train_loss": -43.52234649658203, "global_step": 267800, "epoch": 2213} {"train_loss": -43.25688552856445, "global_step": 267801, "epoch": 2213} {"train_loss": -43.46397018432617, "global_step": 267802, "epoch": 2213} {"train_loss": -42.203529357910156, "global_step": 267803, "epoch": 2213} {"train_loss": -42.39661407470703, "global_step": 267804, "epoch": 2213} {"train_loss": -42.85663604736328, "global_step": 267805, "epoch": 2213} {"train_loss": -43.44136047363281, "global_step": 267806, "epoch": 2213} {"train_loss": -43.22739028930664, "global_step": 267807, "epoch": 2213} {"train_loss": -41.338924407958984, "global_step": 267808, "epoch": 2213} {"train_loss": -43.403804779052734, "global_step": 267809, "epoch": 2213} {"train_loss": -42.771514892578125, "global_step": 267810, "epoch": 2213} {"train_loss": -42.89844512939453, "global_step": 267811, "epoch": 2213} {"train_loss": -42.6804084777832, "global_step": 267812, "epoch": 2213} {"train_loss": -43.48979568481445, "global_step": 267813, "epoch": 2213} {"train_loss": -43.1963996887207, "global_step": 267814, "epoch": 2213} {"train_loss": -41.76743698120117, "global_step": 267815, "epoch": 2213} {"train_loss": -43.5540657043457, "global_step": 267816, "epoch": 2213} {"train_loss": -41.894989013671875, "global_step": 267817, "epoch": 2213} {"train_loss": -41.63589096069336, "global_step": 267818, "epoch": 2213} {"train_loss": -41.50766372680664, "global_step": 267819, "epoch": 2213} {"train_loss": -42.656982421875, "global_step": 267820, "epoch": 2213} {"train_loss": -41.392913818359375, "global_step": 267821, "epoch": 2213} {"train_loss": -42.33375930786133, "global_step": 267822, "epoch": 2213} {"train_loss": -41.6353759765625, "global_step": 267823, "epoch": 2213} {"train_loss": -42.7661247253418, "global_step": 267824, "epoch": 2213} {"train_loss": -42.6307487487793, "global_step": 267825, "epoch": 2213} {"train_loss": -41.920799255371094, "global_step": 267826, "epoch": 2213} {"train_loss": -42.615447998046875, "global_step": 267827, "epoch": 2213} {"train_loss": -43.212066650390625, "global_step": 267828, "epoch": 2213} {"train_loss": -42.17446517944336, "global_step": 267829, "epoch": 2213} {"train_loss": -42.31911087036133, "global_step": 267830, "epoch": 2213} {"train_loss": -42.711021423339844, "global_step": 267831, "epoch": 2213} {"train_loss": -41.66845703125, "global_step": 267832, "epoch": 2213} {"train_loss": -43.07133865356445, "global_step": 267833, "epoch": 2213} {"train_loss": -41.294612884521484, "global_step": 267834, "epoch": 2213} {"train_loss": -43.1177864074707, "global_step": 267835, "epoch": 2213} {"train_loss": -41.17241668701172, "global_step": 267836, "epoch": 2213} {"train_loss": -43.58480453491211, "global_step": 267837, "epoch": 2213} {"train_loss": -40.46930694580078, "global_step": 267838, "epoch": 2213} {"train_loss": -42.18171691894531, "global_step": 267839, "epoch": 2213} {"train_loss": -38.25237274169922, "global_step": 267840, "epoch": 2213} {"train_loss": -41.597389221191406, "global_step": 267841, "epoch": 2213} {"train_loss": -40.800987243652344, "global_step": 267842, "epoch": 2213} {"train_loss": -41.7036247253418, "global_step": 267843, "epoch": 2213} {"train_loss": -40.833709716796875, "global_step": 267844, "epoch": 2213} {"train_loss": -40.22902297973633, "global_step": 267845, "epoch": 2213} {"train_loss": -38.99052810668945, "global_step": 267846, "epoch": 2213} {"train_loss": -39.519927978515625, "global_step": 267847, "epoch": 2213} {"train_loss": -41.9264030456543, "global_step": 267848, "epoch": 2213} {"train_loss": -40.42291259765625, "global_step": 267849, "epoch": 2213} {"train_loss": -41.9924430847168, "global_step": 267850, "epoch": 2213} {"train_loss": -41.67901611328125, "global_step": 267851, "epoch": 2213} {"train_loss": -42.26409912109375, "global_step": 267852, "epoch": 2213} {"train_loss": -41.048343658447266, "global_step": 267853, "epoch": 2213} {"train_loss": -42.6550407409668, "global_step": 267854, "epoch": 2213} {"train_loss": -40.925697326660156, "global_step": 267855, "epoch": 2213} {"train_loss": -41.62948989868164, "global_step": 267856, "epoch": 2213} {"train_loss": -42.25632858276367, "global_step": 267857, "epoch": 2213} {"train_loss": -41.15029525756836, "global_step": 267858, "epoch": 2213} {"train_loss": -40.71010208129883, "global_step": 267859, "epoch": 2213} {"train_loss": -42.016387939453125, "global_step": 267860, "epoch": 2213} {"train_loss": -40.542842864990234, "global_step": 267861, "epoch": 2213} {"train_loss": -40.93397903442383, "global_step": 267862, "epoch": 2213} {"train_loss": -41.71305465698242, "global_step": 267863, "epoch": 2213} {"train_loss": -37.2318229675293, "global_step": 267864, "epoch": 2213} {"train_loss": -40.47098159790039, "global_step": 267865, "epoch": 2213} {"train_loss": -39.91618728637695, "global_step": 267866, "epoch": 2213} {"train_loss": -42.779239654541016, "global_step": 267867, "epoch": 2213} {"train_loss": -41.48576736450195, "global_step": 267868, "epoch": 2213} {"train_loss": -41.50927734375, "global_step": 267869, "epoch": 2213} {"train_loss": -41.3122673034668, "global_step": 267870, "epoch": 2213} {"train_loss": -37.29311752319336, "global_step": 267871, "epoch": 2213} {"train_loss": -41.65633010864258, "global_step": 267872, "epoch": 2213} {"train_loss": -42.82407760620117, "global_step": 267873, "epoch": 2213} {"train_loss": -41.03071212768555, "global_step": 267874, "epoch": 2213} {"train_loss": -40.680023193359375, "global_step": 267875, "epoch": 2213} {"train_loss": -42.52337646484375, "global_step": 267876, "epoch": 2213} {"train_loss": -38.75728988647461, "global_step": 267877, "epoch": 2213} {"train_loss": -37.913814544677734, "global_step": 267878, "epoch": 2213} {"train_loss": -42.79903030395508, "global_step": 267879, "epoch": 2213} {"train_loss": -40.22211456298828, "global_step": 267880, "epoch": 2213} {"train_loss": -37.4761848449707, "global_step": 267881, "epoch": 2213} {"train_loss": -32.95720672607422, "global_step": 267882, "epoch": 2213} {"train_loss": -40.43121337890625, "global_step": 267883, "epoch": 2213} {"train_loss": -38.99410629272461, "global_step": 267884, "epoch": 2213} {"train_loss": -33.9613037109375, "global_step": 267885, "epoch": 2213} {"train_loss": -40.637393951416016, "global_step": 267886, "epoch": 2213} {"train_loss": -34.35206985473633, "global_step": 267887, "epoch": 2213} {"train_loss": -37.15829086303711, "global_step": 267888, "epoch": 2213} {"train_loss": -37.05942916870117, "global_step": 267889, "epoch": 2213} {"train_loss": -37.056640625, "global_step": 267890, "epoch": 2213} {"train_loss": -37.02936553955078, "global_step": 267891, "epoch": 2213} {"train_loss": -38.82973861694336, "global_step": 267892, "epoch": 2213} {"train_loss": -41.552384999172745, "global_step": 267893, "epoch": 2213, "val_loss": 2991725.25} {"train_loss": -38.410823822021484, "global_step": 267894, "epoch": 2214} {"train_loss": -35.072608947753906, "global_step": 267895, "epoch": 2214} {"train_loss": -40.44575119018555, "global_step": 267896, "epoch": 2214} {"train_loss": -37.490657806396484, "global_step": 267897, "epoch": 2214} {"train_loss": -37.51985549926758, "global_step": 267898, "epoch": 2214} {"train_loss": -40.51142501831055, "global_step": 267899, "epoch": 2214} {"train_loss": -37.58535385131836, "global_step": 267900, "epoch": 2214} {"train_loss": -39.909461975097656, "global_step": 267901, "epoch": 2214} {"train_loss": -37.8740348815918, "global_step": 267902, "epoch": 2214} {"train_loss": -38.74027633666992, "global_step": 267903, "epoch": 2214} {"train_loss": -40.21662521362305, "global_step": 267904, "epoch": 2214} {"train_loss": -39.735233306884766, "global_step": 267905, "epoch": 2214} {"train_loss": -40.32430648803711, "global_step": 267906, "epoch": 2214} {"train_loss": -41.01325607299805, "global_step": 267907, "epoch": 2214} {"train_loss": -38.848812103271484, "global_step": 267908, "epoch": 2214} {"train_loss": -39.95936965942383, "global_step": 267909, "epoch": 2214} {"train_loss": -40.9388542175293, "global_step": 267910, "epoch": 2214} {"train_loss": -41.13352584838867, "global_step": 267911, "epoch": 2214} {"train_loss": -40.87728500366211, "global_step": 267912, "epoch": 2214} {"train_loss": -40.6373405456543, "global_step": 267913, "epoch": 2214} {"train_loss": -40.725921630859375, "global_step": 267914, "epoch": 2214} {"train_loss": -37.85939407348633, "global_step": 267915, "epoch": 2214} {"train_loss": -40.905006408691406, "global_step": 267916, "epoch": 2214} {"train_loss": -40.255821228027344, "global_step": 267917, "epoch": 2214} {"train_loss": -40.785640716552734, "global_step": 267918, "epoch": 2214} {"train_loss": -40.79536819458008, "global_step": 267919, "epoch": 2214} {"train_loss": -40.11252975463867, "global_step": 267920, "epoch": 2214} {"train_loss": -41.203330993652344, "global_step": 267921, "epoch": 2214} {"train_loss": -41.46622848510742, "global_step": 267922, "epoch": 2214} {"train_loss": -41.94139862060547, "global_step": 267923, "epoch": 2214} {"train_loss": -41.76156234741211, "global_step": 267924, "epoch": 2214} {"train_loss": -41.45722579956055, "global_step": 267925, "epoch": 2214} {"train_loss": -42.60396957397461, "global_step": 267926, "epoch": 2214} {"train_loss": -41.97829818725586, "global_step": 267927, "epoch": 2214} {"train_loss": -40.965511322021484, "global_step": 267928, "epoch": 2214} {"train_loss": -41.7208251953125, "global_step": 267929, "epoch": 2214} {"train_loss": -41.87059783935547, "global_step": 267930, "epoch": 2214} {"train_loss": -41.37980270385742, "global_step": 267931, "epoch": 2214} {"train_loss": -42.30598068237305, "global_step": 267932, "epoch": 2214} {"train_loss": -40.832550048828125, "global_step": 267933, "epoch": 2214} {"train_loss": -42.06425476074219, "global_step": 267934, "epoch": 2214} {"train_loss": -41.746826171875, "global_step": 267935, "epoch": 2214} {"train_loss": -42.45979690551758, "global_step": 267936, "epoch": 2214} {"train_loss": -43.07514572143555, "global_step": 267937, "epoch": 2214} {"train_loss": -42.7696647644043, "global_step": 267938, "epoch": 2214} {"train_loss": -42.438106536865234, "global_step": 267939, "epoch": 2214} {"train_loss": -42.746307373046875, "global_step": 267940, "epoch": 2214} {"train_loss": -41.94729995727539, "global_step": 267941, "epoch": 2214} {"train_loss": -42.062461853027344, "global_step": 267942, "epoch": 2214} {"train_loss": -42.14238357543945, "global_step": 267943, "epoch": 2214} {"train_loss": -42.53945541381836, "global_step": 267944, "epoch": 2214} {"train_loss": -42.51752471923828, "global_step": 267945, "epoch": 2214} {"train_loss": -42.68465805053711, "global_step": 267946, "epoch": 2214} {"train_loss": -43.40138626098633, "global_step": 267947, "epoch": 2214} {"train_loss": -42.61785125732422, "global_step": 267948, "epoch": 2214} {"train_loss": -42.37995529174805, "global_step": 267949, "epoch": 2214} {"train_loss": -42.97944259643555, "global_step": 267950, "epoch": 2214} {"train_loss": -42.05070114135742, "global_step": 267951, "epoch": 2214} {"train_loss": -41.8546142578125, "global_step": 267952, "epoch": 2214} {"train_loss": -43.09850311279297, "global_step": 267953, "epoch": 2214} {"train_loss": -41.94378662109375, "global_step": 267954, "epoch": 2214} {"train_loss": -42.92831039428711, "global_step": 267955, "epoch": 2214} {"train_loss": -43.375152587890625, "global_step": 267956, "epoch": 2214} {"train_loss": -42.60369873046875, "global_step": 267957, "epoch": 2214} {"train_loss": -42.53760528564453, "global_step": 267958, "epoch": 2214} {"train_loss": -43.263057708740234, "global_step": 267959, "epoch": 2214} {"train_loss": -42.75178909301758, "global_step": 267960, "epoch": 2214} {"train_loss": -43.24736785888672, "global_step": 267961, "epoch": 2214} {"train_loss": -42.82247543334961, "global_step": 267962, "epoch": 2214} {"train_loss": -43.12092971801758, "global_step": 267963, "epoch": 2214} {"train_loss": -42.81612777709961, "global_step": 267964, "epoch": 2214} {"train_loss": -42.592830657958984, "global_step": 267965, "epoch": 2214} {"train_loss": -43.67629623413086, "global_step": 267966, "epoch": 2214} {"train_loss": -41.879695892333984, "global_step": 267967, "epoch": 2214} {"train_loss": -42.924659729003906, "global_step": 267968, "epoch": 2214} {"train_loss": -42.8484001159668, "global_step": 267969, "epoch": 2214} {"train_loss": -42.90055465698242, "global_step": 267970, "epoch": 2214} {"train_loss": -43.595367431640625, "global_step": 267971, "epoch": 2214} {"train_loss": -42.743629455566406, "global_step": 267972, "epoch": 2214} {"train_loss": -43.691566467285156, "global_step": 267973, "epoch": 2214} {"train_loss": -43.300270080566406, "global_step": 267974, "epoch": 2214} {"train_loss": -42.9344596862793, "global_step": 267975, "epoch": 2214} {"train_loss": -41.69121551513672, "global_step": 267976, "epoch": 2214} {"train_loss": -43.03135299682617, "global_step": 267977, "epoch": 2214} {"train_loss": -43.29362106323242, "global_step": 267978, "epoch": 2214} {"train_loss": -43.0533447265625, "global_step": 267979, "epoch": 2214} {"train_loss": -41.777217864990234, "global_step": 267980, "epoch": 2214} {"train_loss": -41.81269073486328, "global_step": 267981, "epoch": 2214} {"train_loss": -43.26787185668945, "global_step": 267982, "epoch": 2214} {"train_loss": -43.34209442138672, "global_step": 267983, "epoch": 2214} {"train_loss": -42.8663444519043, "global_step": 267984, "epoch": 2214} {"train_loss": -42.57400131225586, "global_step": 267985, "epoch": 2214} {"train_loss": -43.305477142333984, "global_step": 267986, "epoch": 2214} {"train_loss": -42.95235824584961, "global_step": 267987, "epoch": 2214} {"train_loss": -42.50150680541992, "global_step": 267988, "epoch": 2214} {"train_loss": -43.464141845703125, "global_step": 267989, "epoch": 2214} {"train_loss": -43.34393310546875, "global_step": 267990, "epoch": 2214} {"train_loss": -40.73299789428711, "global_step": 267991, "epoch": 2214} {"train_loss": -41.5098762512207, "global_step": 267992, "epoch": 2214} {"train_loss": -43.873138427734375, "global_step": 267993, "epoch": 2214} {"train_loss": -41.88838195800781, "global_step": 267994, "epoch": 2214} {"train_loss": -41.25112533569336, "global_step": 267995, "epoch": 2214} {"train_loss": -43.32645034790039, "global_step": 267996, "epoch": 2214} {"train_loss": -41.24496078491211, "global_step": 267997, "epoch": 2214} {"train_loss": -41.19276809692383, "global_step": 267998, "epoch": 2214} {"train_loss": -42.30788803100586, "global_step": 267999, "epoch": 2214} {"train_loss": -38.18933868408203, "global_step": 268000, "epoch": 2214} {"train_loss": -38.27720642089844, "global_step": 268001, "epoch": 2214} {"train_loss": -38.669647216796875, "global_step": 268002, "epoch": 2214} {"train_loss": -38.65876388549805, "global_step": 268003, "epoch": 2214} {"train_loss": -39.975440979003906, "global_step": 268004, "epoch": 2214} {"train_loss": -39.810176849365234, "global_step": 268005, "epoch": 2214} {"train_loss": -39.9119873046875, "global_step": 268006, "epoch": 2214} {"train_loss": -41.1065673828125, "global_step": 268007, "epoch": 2214} {"train_loss": -41.05820846557617, "global_step": 268008, "epoch": 2214} {"train_loss": -41.13103103637695, "global_step": 268009, "epoch": 2214} {"train_loss": -40.86086654663086, "global_step": 268010, "epoch": 2214} {"train_loss": -41.79140090942383, "global_step": 268011, "epoch": 2214} {"train_loss": -42.20380783081055, "global_step": 268012, "epoch": 2214} {"train_loss": -40.7718505859375, "global_step": 268013, "epoch": 2214} {"train_loss": -41.553563898259945, "global_step": 268014, "epoch": 2214, "val_loss": 2734789.0} {"train_loss": -42.12398910522461, "global_step": 268015, "epoch": 2215} {"train_loss": -41.711204528808594, "global_step": 268016, "epoch": 2215} {"train_loss": -40.68351745605469, "global_step": 268017, "epoch": 2215} {"train_loss": -40.64015197753906, "global_step": 268018, "epoch": 2215} {"train_loss": -41.58177185058594, "global_step": 268019, "epoch": 2215} {"train_loss": -42.60663986206055, "global_step": 268020, "epoch": 2215} {"train_loss": -41.58549499511719, "global_step": 268021, "epoch": 2215} {"train_loss": -41.895023345947266, "global_step": 268022, "epoch": 2215} {"train_loss": -41.34760665893555, "global_step": 268023, "epoch": 2215} {"train_loss": -42.21672439575195, "global_step": 268024, "epoch": 2215} {"train_loss": -42.3209342956543, "global_step": 268025, "epoch": 2215} {"train_loss": -41.72685623168945, "global_step": 268026, "epoch": 2215} {"train_loss": -42.626258850097656, "global_step": 268027, "epoch": 2215} {"train_loss": -42.406822204589844, "global_step": 268028, "epoch": 2215} {"train_loss": -41.23903274536133, "global_step": 268029, "epoch": 2215} {"train_loss": -42.69578552246094, "global_step": 268030, "epoch": 2215} {"train_loss": -42.709468841552734, "global_step": 268031, "epoch": 2215} {"train_loss": -42.279720306396484, "global_step": 268032, "epoch": 2215} {"train_loss": -42.612796783447266, "global_step": 268033, "epoch": 2215} {"train_loss": -42.56315994262695, "global_step": 268034, "epoch": 2215} {"train_loss": -42.74268341064453, "global_step": 268035, "epoch": 2215} {"train_loss": -42.21193313598633, "global_step": 268036, "epoch": 2215} {"train_loss": -43.082332611083984, "global_step": 268037, "epoch": 2215} {"train_loss": -42.51137924194336, "global_step": 268038, "epoch": 2215} {"train_loss": -43.12139892578125, "global_step": 268039, "epoch": 2215} {"train_loss": -43.055667877197266, "global_step": 268040, "epoch": 2215} {"train_loss": -42.407867431640625, "global_step": 268041, "epoch": 2215} {"train_loss": -42.753902435302734, "global_step": 268042, "epoch": 2215} {"train_loss": -42.431800842285156, "global_step": 268043, "epoch": 2215} {"train_loss": -43.368011474609375, "global_step": 268044, "epoch": 2215} {"train_loss": -42.5297966003418, "global_step": 268045, "epoch": 2215} {"train_loss": -42.89406967163086, "global_step": 268046, "epoch": 2215} {"train_loss": -42.19355010986328, "global_step": 268047, "epoch": 2215} {"train_loss": -43.27985382080078, "global_step": 268048, "epoch": 2215} {"train_loss": -43.027400970458984, "global_step": 268049, "epoch": 2215} {"train_loss": -43.209678649902344, "global_step": 268050, "epoch": 2215} {"train_loss": -41.87596130371094, "global_step": 268051, "epoch": 2215} {"train_loss": -43.640037536621094, "global_step": 268052, "epoch": 2215} {"train_loss": -43.7715950012207, "global_step": 268053, "epoch": 2215} {"train_loss": -43.55030059814453, "global_step": 268054, "epoch": 2215} {"train_loss": -43.496646881103516, "global_step": 268055, "epoch": 2215} {"train_loss": -43.20463943481445, "global_step": 268056, "epoch": 2215} {"train_loss": -43.5673828125, "global_step": 268057, "epoch": 2215} {"train_loss": -43.22874069213867, "global_step": 268058, "epoch": 2215} {"train_loss": -43.52975082397461, "global_step": 268059, "epoch": 2215} {"train_loss": -43.48618698120117, "global_step": 268060, "epoch": 2215} {"train_loss": -43.621307373046875, "global_step": 268061, "epoch": 2215} {"train_loss": -43.788021087646484, "global_step": 268062, "epoch": 2215} {"train_loss": -43.570709228515625, "global_step": 268063, "epoch": 2215} {"train_loss": -44.206661224365234, "global_step": 268064, "epoch": 2215} {"train_loss": -42.88245391845703, "global_step": 268065, "epoch": 2215} {"train_loss": -42.00242233276367, "global_step": 268066, "epoch": 2215} {"train_loss": -43.95650863647461, "global_step": 268067, "epoch": 2215} {"train_loss": -43.69855499267578, "global_step": 268068, "epoch": 2215} {"train_loss": -41.6195068359375, "global_step": 268069, "epoch": 2215} {"train_loss": -42.96662521362305, "global_step": 268070, "epoch": 2215} {"train_loss": -43.55045700073242, "global_step": 268071, "epoch": 2215} {"train_loss": -42.490028381347656, "global_step": 268072, "epoch": 2215} {"train_loss": -42.939048767089844, "global_step": 268073, "epoch": 2215} {"train_loss": -43.1995735168457, "global_step": 268074, "epoch": 2215} {"train_loss": -43.24258041381836, "global_step": 268075, "epoch": 2215} {"train_loss": -43.12327194213867, "global_step": 268076, "epoch": 2215} {"train_loss": -43.795005798339844, "global_step": 268077, "epoch": 2215} {"train_loss": -43.263309478759766, "global_step": 268078, "epoch": 2215} {"train_loss": -42.693756103515625, "global_step": 268079, "epoch": 2215} {"train_loss": -43.817378997802734, "global_step": 268080, "epoch": 2215} {"train_loss": -41.9841194152832, "global_step": 268081, "epoch": 2215} {"train_loss": -43.06061935424805, "global_step": 268082, "epoch": 2215} {"train_loss": -41.67633056640625, "global_step": 268083, "epoch": 2215} {"train_loss": -40.72459030151367, "global_step": 268084, "epoch": 2215} {"train_loss": -42.936676025390625, "global_step": 268085, "epoch": 2215} {"train_loss": -39.88901901245117, "global_step": 268086, "epoch": 2215} {"train_loss": -43.556522369384766, "global_step": 268087, "epoch": 2215} {"train_loss": -37.68598175048828, "global_step": 268088, "epoch": 2215} {"train_loss": -39.245826721191406, "global_step": 268089, "epoch": 2215} {"train_loss": -42.07798385620117, "global_step": 268090, "epoch": 2215} {"train_loss": -38.46816635131836, "global_step": 268091, "epoch": 2215} {"train_loss": -41.232418060302734, "global_step": 268092, "epoch": 2215} {"train_loss": -39.465484619140625, "global_step": 268093, "epoch": 2215} {"train_loss": -40.38721466064453, "global_step": 268094, "epoch": 2215} {"train_loss": -42.24589157104492, "global_step": 268095, "epoch": 2215} {"train_loss": -40.181976318359375, "global_step": 268096, "epoch": 2215} {"train_loss": -40.51314163208008, "global_step": 268097, "epoch": 2215} {"train_loss": -39.89332962036133, "global_step": 268098, "epoch": 2215} {"train_loss": -40.7951545715332, "global_step": 268099, "epoch": 2215} {"train_loss": -41.03120803833008, "global_step": 268100, "epoch": 2215} {"train_loss": -40.6294059753418, "global_step": 268101, "epoch": 2215} {"train_loss": -40.7502555847168, "global_step": 268102, "epoch": 2215} {"train_loss": -40.91303253173828, "global_step": 268103, "epoch": 2215} {"train_loss": -41.14802169799805, "global_step": 268104, "epoch": 2215} {"train_loss": -41.903629302978516, "global_step": 268105, "epoch": 2215} {"train_loss": -42.085113525390625, "global_step": 268106, "epoch": 2215} {"train_loss": -41.415462493896484, "global_step": 268107, "epoch": 2215} {"train_loss": -41.5949592590332, "global_step": 268108, "epoch": 2215} {"train_loss": -42.16378402709961, "global_step": 268109, "epoch": 2215} {"train_loss": -41.661766052246094, "global_step": 268110, "epoch": 2215} {"train_loss": -39.220638275146484, "global_step": 268111, "epoch": 2215} {"train_loss": -41.54010772705078, "global_step": 268112, "epoch": 2215} {"train_loss": -42.95864486694336, "global_step": 268113, "epoch": 2215} {"train_loss": -41.03975296020508, "global_step": 268114, "epoch": 2215} {"train_loss": -42.21584701538086, "global_step": 268115, "epoch": 2215} {"train_loss": -42.603248596191406, "global_step": 268116, "epoch": 2215} {"train_loss": -42.15639114379883, "global_step": 268117, "epoch": 2215} {"train_loss": -42.42112350463867, "global_step": 268118, "epoch": 2215} {"train_loss": -42.22434997558594, "global_step": 268119, "epoch": 2215} {"train_loss": -43.190128326416016, "global_step": 268120, "epoch": 2215} {"train_loss": -42.38677215576172, "global_step": 268121, "epoch": 2215} {"train_loss": -42.504642486572266, "global_step": 268122, "epoch": 2215} {"train_loss": -43.363311767578125, "global_step": 268123, "epoch": 2215} {"train_loss": -42.2613410949707, "global_step": 268124, "epoch": 2215} {"train_loss": -43.1803092956543, "global_step": 268125, "epoch": 2215} {"train_loss": -42.610836029052734, "global_step": 268126, "epoch": 2215} {"train_loss": -43.03656768798828, "global_step": 268127, "epoch": 2215} {"train_loss": -42.58721160888672, "global_step": 268128, "epoch": 2215} {"train_loss": -42.95998001098633, "global_step": 268129, "epoch": 2215} {"train_loss": -43.5799446105957, "global_step": 268130, "epoch": 2215} {"train_loss": -43.01864242553711, "global_step": 268131, "epoch": 2215} {"train_loss": -43.1124382019043, "global_step": 268132, "epoch": 2215} {"train_loss": -43.21516418457031, "global_step": 268133, "epoch": 2215} {"train_loss": -42.605220794677734, "global_step": 268134, "epoch": 2215} {"train_loss": -42.293726834383875, "global_step": 268135, "epoch": 2215, "val_loss": 2741039.25} {"train_loss": -42.984230041503906, "global_step": 268136, "epoch": 2216} {"train_loss": -42.794979095458984, "global_step": 268137, "epoch": 2216} {"train_loss": -43.59614181518555, "global_step": 268138, "epoch": 2216} {"train_loss": -43.121192932128906, "global_step": 268139, "epoch": 2216} {"train_loss": -43.96636199951172, "global_step": 268140, "epoch": 2216} {"train_loss": -42.515357971191406, "global_step": 268141, "epoch": 2216} {"train_loss": -43.81889724731445, "global_step": 268142, "epoch": 2216} {"train_loss": -43.53422546386719, "global_step": 268143, "epoch": 2216} {"train_loss": -43.68532943725586, "global_step": 268144, "epoch": 2216} {"train_loss": -43.802520751953125, "global_step": 268145, "epoch": 2216} {"train_loss": -43.44102096557617, "global_step": 268146, "epoch": 2216} {"train_loss": -43.29402542114258, "global_step": 268147, "epoch": 2216} {"train_loss": -43.69400405883789, "global_step": 268148, "epoch": 2216} {"train_loss": -43.59372329711914, "global_step": 268149, "epoch": 2216} {"train_loss": -43.56883239746094, "global_step": 268150, "epoch": 2216} {"train_loss": -43.169586181640625, "global_step": 268151, "epoch": 2216} {"train_loss": -43.984519958496094, "global_step": 268152, "epoch": 2216} {"train_loss": -43.70356750488281, "global_step": 268153, "epoch": 2216} {"train_loss": -43.962642669677734, "global_step": 268154, "epoch": 2216} {"train_loss": -43.831443786621094, "global_step": 268155, "epoch": 2216} {"train_loss": -42.83827209472656, "global_step": 268156, "epoch": 2216} {"train_loss": -43.62617111206055, "global_step": 268157, "epoch": 2216} {"train_loss": -44.179161071777344, "global_step": 268158, "epoch": 2216} {"train_loss": -43.869869232177734, "global_step": 268159, "epoch": 2216} {"train_loss": -43.394771575927734, "global_step": 268160, "epoch": 2216} {"train_loss": -43.12612533569336, "global_step": 268161, "epoch": 2216} {"train_loss": -44.08763122558594, "global_step": 268162, "epoch": 2216} {"train_loss": -42.550331115722656, "global_step": 268163, "epoch": 2216} {"train_loss": -41.99198532104492, "global_step": 268164, "epoch": 2216} {"train_loss": -42.91291809082031, "global_step": 268165, "epoch": 2216} {"train_loss": -43.3200569152832, "global_step": 268166, "epoch": 2216} {"train_loss": -42.243228912353516, "global_step": 268167, "epoch": 2216} {"train_loss": -41.347286224365234, "global_step": 268168, "epoch": 2216} {"train_loss": -43.84603500366211, "global_step": 268169, "epoch": 2216} {"train_loss": -40.45043182373047, "global_step": 268170, "epoch": 2216} {"train_loss": -43.33341598510742, "global_step": 268171, "epoch": 2216} {"train_loss": -43.82747268676758, "global_step": 268172, "epoch": 2216} {"train_loss": -41.54102325439453, "global_step": 268173, "epoch": 2216} {"train_loss": -43.13376998901367, "global_step": 268174, "epoch": 2216} {"train_loss": -41.93331527709961, "global_step": 268175, "epoch": 2216} {"train_loss": -42.197509765625, "global_step": 268176, "epoch": 2216} {"train_loss": -43.07892608642578, "global_step": 268177, "epoch": 2216} {"train_loss": -41.19581985473633, "global_step": 268178, "epoch": 2216} {"train_loss": -42.37282943725586, "global_step": 268179, "epoch": 2216} {"train_loss": -41.6385498046875, "global_step": 268180, "epoch": 2216} {"train_loss": -42.981868743896484, "global_step": 268181, "epoch": 2216} {"train_loss": -42.240516662597656, "global_step": 268182, "epoch": 2216} {"train_loss": -42.381771087646484, "global_step": 268183, "epoch": 2216} {"train_loss": -43.43886947631836, "global_step": 268184, "epoch": 2216} {"train_loss": -40.89182662963867, "global_step": 268185, "epoch": 2216} {"train_loss": -42.38874435424805, "global_step": 268186, "epoch": 2216} {"train_loss": -42.05842971801758, "global_step": 268187, "epoch": 2216} {"train_loss": -34.43935775756836, "global_step": 268188, "epoch": 2216} {"train_loss": -42.92152786254883, "global_step": 268189, "epoch": 2216} {"train_loss": -42.83539962768555, "global_step": 268190, "epoch": 2216} {"train_loss": -42.42039489746094, "global_step": 268191, "epoch": 2216} {"train_loss": -43.05745315551758, "global_step": 268192, "epoch": 2216} {"train_loss": -40.78193283081055, "global_step": 268193, "epoch": 2216} {"train_loss": -36.580718994140625, "global_step": 268194, "epoch": 2216} {"train_loss": -41.64352035522461, "global_step": 268195, "epoch": 2216} {"train_loss": -41.41890335083008, "global_step": 268196, "epoch": 2216} {"train_loss": -39.9124641418457, "global_step": 268197, "epoch": 2216} {"train_loss": -42.22145462036133, "global_step": 268198, "epoch": 2216} {"train_loss": -42.77559280395508, "global_step": 268199, "epoch": 2216} {"train_loss": -41.40323257446289, "global_step": 268200, "epoch": 2216} {"train_loss": -41.62517547607422, "global_step": 268201, "epoch": 2216} {"train_loss": -41.047454833984375, "global_step": 268202, "epoch": 2216} {"train_loss": -41.15188980102539, "global_step": 268203, "epoch": 2216} {"train_loss": -41.01576614379883, "global_step": 268204, "epoch": 2216} {"train_loss": -40.826107025146484, "global_step": 268205, "epoch": 2216} {"train_loss": -41.6676139831543, "global_step": 268206, "epoch": 2216} {"train_loss": -41.81171798706055, "global_step": 268207, "epoch": 2216} {"train_loss": -39.64701461791992, "global_step": 268208, "epoch": 2216} {"train_loss": -39.68625259399414, "global_step": 268209, "epoch": 2216} {"train_loss": -41.3886833190918, "global_step": 268210, "epoch": 2216} {"train_loss": -39.002716064453125, "global_step": 268211, "epoch": 2216} {"train_loss": -41.488739013671875, "global_step": 268212, "epoch": 2216} {"train_loss": -35.41957473754883, "global_step": 268213, "epoch": 2216} {"train_loss": -40.521724700927734, "global_step": 268214, "epoch": 2216} {"train_loss": -40.199642181396484, "global_step": 268215, "epoch": 2216} {"train_loss": -40.366798400878906, "global_step": 268216, "epoch": 2216} {"train_loss": -42.03034591674805, "global_step": 268217, "epoch": 2216} {"train_loss": -39.81682205200195, "global_step": 268218, "epoch": 2216} {"train_loss": -41.17675018310547, "global_step": 268219, "epoch": 2216} {"train_loss": -41.73183822631836, "global_step": 268220, "epoch": 2216} {"train_loss": -42.08625411987305, "global_step": 268221, "epoch": 2216} {"train_loss": -41.29449462890625, "global_step": 268222, "epoch": 2216} {"train_loss": -42.45808792114258, "global_step": 268223, "epoch": 2216} {"train_loss": -42.0338134765625, "global_step": 268224, "epoch": 2216} {"train_loss": -40.381256103515625, "global_step": 268225, "epoch": 2216} {"train_loss": -42.46894836425781, "global_step": 268226, "epoch": 2216} {"train_loss": -41.163936614990234, "global_step": 268227, "epoch": 2216} {"train_loss": -40.821041107177734, "global_step": 268228, "epoch": 2216} {"train_loss": -41.62990951538086, "global_step": 268229, "epoch": 2216} {"train_loss": -41.470184326171875, "global_step": 268230, "epoch": 2216} {"train_loss": -42.283138275146484, "global_step": 268231, "epoch": 2216} {"train_loss": -41.90444564819336, "global_step": 268232, "epoch": 2216} {"train_loss": -42.87977981567383, "global_step": 268233, "epoch": 2216} {"train_loss": -42.74087142944336, "global_step": 268234, "epoch": 2216} {"train_loss": -41.96705627441406, "global_step": 268235, "epoch": 2216} {"train_loss": -42.10499954223633, "global_step": 268236, "epoch": 2216} {"train_loss": -41.39333724975586, "global_step": 268237, "epoch": 2216} {"train_loss": -41.56667709350586, "global_step": 268238, "epoch": 2216} {"train_loss": -41.104286193847656, "global_step": 268239, "epoch": 2216} {"train_loss": -42.2887077331543, "global_step": 268240, "epoch": 2216} {"train_loss": -42.56170654296875, "global_step": 268241, "epoch": 2216} {"train_loss": -42.49620819091797, "global_step": 268242, "epoch": 2216} {"train_loss": -42.74325180053711, "global_step": 268243, "epoch": 2216} {"train_loss": -41.71466064453125, "global_step": 268244, "epoch": 2216} {"train_loss": -42.31663513183594, "global_step": 268245, "epoch": 2216} {"train_loss": -41.55842590332031, "global_step": 268246, "epoch": 2216} {"train_loss": -42.054931640625, "global_step": 268247, "epoch": 2216} {"train_loss": -41.614253997802734, "global_step": 268248, "epoch": 2216} {"train_loss": -43.52299118041992, "global_step": 268249, "epoch": 2216} {"train_loss": -42.16754913330078, "global_step": 268250, "epoch": 2216} {"train_loss": -42.827205657958984, "global_step": 268251, "epoch": 2216} {"train_loss": -42.90070343017578, "global_step": 268252, "epoch": 2216} {"train_loss": -43.2137565612793, "global_step": 268253, "epoch": 2216} {"train_loss": -43.16944122314453, "global_step": 268254, "epoch": 2216} {"train_loss": -42.301734924316406, "global_step": 268255, "epoch": 2216} {"train_loss": -42.10114527930898, "global_step": 268256, "epoch": 2216, "val_loss": 3597751.75} {"train_loss": -43.389686584472656, "global_step": 268257, "epoch": 2217} {"train_loss": -42.72089385986328, "global_step": 268258, "epoch": 2217} {"train_loss": -43.49086380004883, "global_step": 268259, "epoch": 2217} {"train_loss": -43.576969146728516, "global_step": 268260, "epoch": 2217} {"train_loss": -42.594940185546875, "global_step": 268261, "epoch": 2217} {"train_loss": -43.16766357421875, "global_step": 268262, "epoch": 2217} {"train_loss": -43.4085693359375, "global_step": 268263, "epoch": 2217} {"train_loss": -42.97355270385742, "global_step": 268264, "epoch": 2217} {"train_loss": -41.615962982177734, "global_step": 268265, "epoch": 2217} {"train_loss": -40.96364212036133, "global_step": 268266, "epoch": 2217} {"train_loss": -41.58100509643555, "global_step": 268267, "epoch": 2217} {"train_loss": -42.39466094970703, "global_step": 268268, "epoch": 2217} {"train_loss": -40.34150314331055, "global_step": 268269, "epoch": 2217} {"train_loss": -41.668724060058594, "global_step": 268270, "epoch": 2217} {"train_loss": -42.9512939453125, "global_step": 268271, "epoch": 2217} {"train_loss": -42.82532501220703, "global_step": 268272, "epoch": 2217} {"train_loss": -41.13616180419922, "global_step": 268273, "epoch": 2217} {"train_loss": -42.40867233276367, "global_step": 268274, "epoch": 2217} {"train_loss": -42.425472259521484, "global_step": 268275, "epoch": 2217} {"train_loss": -41.40397262573242, "global_step": 268276, "epoch": 2217} {"train_loss": -43.02972412109375, "global_step": 268277, "epoch": 2217} {"train_loss": -42.07212448120117, "global_step": 268278, "epoch": 2217} {"train_loss": -41.333797454833984, "global_step": 268279, "epoch": 2217} {"train_loss": -43.475894927978516, "global_step": 268280, "epoch": 2217} {"train_loss": -42.1843376159668, "global_step": 268281, "epoch": 2217} {"train_loss": -41.281917572021484, "global_step": 268282, "epoch": 2217} {"train_loss": -42.98008346557617, "global_step": 268283, "epoch": 2217} {"train_loss": -41.911590576171875, "global_step": 268284, "epoch": 2217} {"train_loss": -41.58002471923828, "global_step": 268285, "epoch": 2217} {"train_loss": -42.5674934387207, "global_step": 268286, "epoch": 2217} {"train_loss": -38.9604606628418, "global_step": 268287, "epoch": 2217} {"train_loss": -43.200599670410156, "global_step": 268288, "epoch": 2217} {"train_loss": -41.22452926635742, "global_step": 268289, "epoch": 2217} {"train_loss": -40.40183639526367, "global_step": 268290, "epoch": 2217} {"train_loss": -42.290645599365234, "global_step": 268291, "epoch": 2217} {"train_loss": -40.71360778808594, "global_step": 268292, "epoch": 2217} {"train_loss": -41.9132080078125, "global_step": 268293, "epoch": 2217} {"train_loss": -41.3426399230957, "global_step": 268294, "epoch": 2217} {"train_loss": -42.538143157958984, "global_step": 268295, "epoch": 2217} {"train_loss": -42.048614501953125, "global_step": 268296, "epoch": 2217} {"train_loss": -42.13084030151367, "global_step": 268297, "epoch": 2217} {"train_loss": -42.499847412109375, "global_step": 268298, "epoch": 2217} {"train_loss": -43.07624053955078, "global_step": 268299, "epoch": 2217} {"train_loss": -41.30186080932617, "global_step": 268300, "epoch": 2217} {"train_loss": -40.795005798339844, "global_step": 268301, "epoch": 2217} {"train_loss": -43.3801383972168, "global_step": 268302, "epoch": 2217} {"train_loss": -41.236488342285156, "global_step": 268303, "epoch": 2217} {"train_loss": -42.54888916015625, "global_step": 268304, "epoch": 2217} {"train_loss": -42.60238265991211, "global_step": 268305, "epoch": 2217} {"train_loss": -39.81931686401367, "global_step": 268306, "epoch": 2217} {"train_loss": -41.58901596069336, "global_step": 268307, "epoch": 2217} {"train_loss": -40.07697296142578, "global_step": 268308, "epoch": 2217} {"train_loss": -41.838836669921875, "global_step": 268309, "epoch": 2217} {"train_loss": -39.21600341796875, "global_step": 268310, "epoch": 2217} {"train_loss": -38.37012481689453, "global_step": 268311, "epoch": 2217} {"train_loss": -39.89628219604492, "global_step": 268312, "epoch": 2217} {"train_loss": -42.50053024291992, "global_step": 268313, "epoch": 2217} {"train_loss": -38.85022735595703, "global_step": 268314, "epoch": 2217} {"train_loss": -42.415706634521484, "global_step": 268315, "epoch": 2217} {"train_loss": -41.55501937866211, "global_step": 268316, "epoch": 2217} {"train_loss": -42.8168830871582, "global_step": 268317, "epoch": 2217} {"train_loss": -40.58669662475586, "global_step": 268318, "epoch": 2217} {"train_loss": -42.09414291381836, "global_step": 268319, "epoch": 2217} {"train_loss": -42.2302360534668, "global_step": 268320, "epoch": 2217} {"train_loss": -42.498043060302734, "global_step": 268321, "epoch": 2217} {"train_loss": -41.377315521240234, "global_step": 268322, "epoch": 2217} {"train_loss": -42.00606918334961, "global_step": 268323, "epoch": 2217} {"train_loss": -41.9537239074707, "global_step": 268324, "epoch": 2217} {"train_loss": -42.04001235961914, "global_step": 268325, "epoch": 2217} {"train_loss": -41.65370559692383, "global_step": 268326, "epoch": 2217} {"train_loss": -40.51681137084961, "global_step": 268327, "epoch": 2217} {"train_loss": -41.007808685302734, "global_step": 268328, "epoch": 2217} {"train_loss": -41.714778900146484, "global_step": 268329, "epoch": 2217} {"train_loss": -41.979095458984375, "global_step": 268330, "epoch": 2217} {"train_loss": -40.568973541259766, "global_step": 268331, "epoch": 2217} {"train_loss": -42.48925018310547, "global_step": 268332, "epoch": 2217} {"train_loss": -39.4581413269043, "global_step": 268333, "epoch": 2217} {"train_loss": -42.44464874267578, "global_step": 268334, "epoch": 2217} {"train_loss": -41.068214416503906, "global_step": 268335, "epoch": 2217} {"train_loss": -38.89103698730469, "global_step": 268336, "epoch": 2217} {"train_loss": -42.729766845703125, "global_step": 268337, "epoch": 2217} {"train_loss": -38.763587951660156, "global_step": 268338, "epoch": 2217} {"train_loss": -37.24269485473633, "global_step": 268339, "epoch": 2217} {"train_loss": -39.085426330566406, "global_step": 268340, "epoch": 2217} {"train_loss": -38.59928512573242, "global_step": 268341, "epoch": 2217} {"train_loss": -40.469512939453125, "global_step": 268342, "epoch": 2217} {"train_loss": -40.444984436035156, "global_step": 268343, "epoch": 2217} {"train_loss": -39.26803970336914, "global_step": 268344, "epoch": 2217} {"train_loss": -40.93669509887695, "global_step": 268345, "epoch": 2217} {"train_loss": -41.26762008666992, "global_step": 268346, "epoch": 2217} {"train_loss": -41.17198944091797, "global_step": 268347, "epoch": 2217} {"train_loss": -42.1246452331543, "global_step": 268348, "epoch": 2217} {"train_loss": -40.50385665893555, "global_step": 268349, "epoch": 2217} {"train_loss": -41.460609436035156, "global_step": 268350, "epoch": 2217} {"train_loss": -41.837440490722656, "global_step": 268351, "epoch": 2217} {"train_loss": -40.03678894042969, "global_step": 268352, "epoch": 2217} {"train_loss": -41.451576232910156, "global_step": 268353, "epoch": 2217} {"train_loss": -41.035892486572266, "global_step": 268354, "epoch": 2217} {"train_loss": -41.425323486328125, "global_step": 268355, "epoch": 2217} {"train_loss": -40.620059967041016, "global_step": 268356, "epoch": 2217} {"train_loss": -41.886199951171875, "global_step": 268357, "epoch": 2217} {"train_loss": -42.42605209350586, "global_step": 268358, "epoch": 2217} {"train_loss": -41.90031051635742, "global_step": 268359, "epoch": 2217} {"train_loss": -42.63525390625, "global_step": 268360, "epoch": 2217} {"train_loss": -43.13396072387695, "global_step": 268361, "epoch": 2217} {"train_loss": -42.576255798339844, "global_step": 268362, "epoch": 2217} {"train_loss": -42.05066680908203, "global_step": 268363, "epoch": 2217} {"train_loss": -42.5345458984375, "global_step": 268364, "epoch": 2217} {"train_loss": -42.13604736328125, "global_step": 268365, "epoch": 2217} {"train_loss": -43.0043830871582, "global_step": 268366, "epoch": 2217} {"train_loss": -42.66315841674805, "global_step": 268367, "epoch": 2217} {"train_loss": -42.6451530456543, "global_step": 268368, "epoch": 2217} {"train_loss": -42.51184844970703, "global_step": 268369, "epoch": 2217} {"train_loss": -42.0000114440918, "global_step": 268370, "epoch": 2217} {"train_loss": -42.62160110473633, "global_step": 268371, "epoch": 2217} {"train_loss": -42.09762191772461, "global_step": 268372, "epoch": 2217} {"train_loss": -42.40297317504883, "global_step": 268373, "epoch": 2217} {"train_loss": -41.93337631225586, "global_step": 268374, "epoch": 2217} {"train_loss": -41.06109619140625, "global_step": 268375, "epoch": 2217} {"train_loss": -38.19871139526367, "global_step": 268376, "epoch": 2217} {"train_loss": -41.574723834833826, "global_step": 268377, "epoch": 2217, "val_loss": 2778279.25} {"train_loss": -38.89319610595703, "global_step": 268378, "epoch": 2218} {"train_loss": -41.633750915527344, "global_step": 268379, "epoch": 2218} {"train_loss": -39.50234603881836, "global_step": 268380, "epoch": 2218} {"train_loss": -41.71537399291992, "global_step": 268381, "epoch": 2218} {"train_loss": -41.1569709777832, "global_step": 268382, "epoch": 2218} {"train_loss": -42.09101486206055, "global_step": 268383, "epoch": 2218} {"train_loss": -41.55562973022461, "global_step": 268384, "epoch": 2218} {"train_loss": -41.36397933959961, "global_step": 268385, "epoch": 2218} {"train_loss": -41.8069953918457, "global_step": 268386, "epoch": 2218} {"train_loss": -40.46411895751953, "global_step": 268387, "epoch": 2218} {"train_loss": -42.907039642333984, "global_step": 268388, "epoch": 2218} {"train_loss": -41.20894241333008, "global_step": 268389, "epoch": 2218} {"train_loss": -42.63901138305664, "global_step": 268390, "epoch": 2218} {"train_loss": -41.5822868347168, "global_step": 268391, "epoch": 2218} {"train_loss": -42.204708099365234, "global_step": 268392, "epoch": 2218} {"train_loss": -42.51371383666992, "global_step": 268393, "epoch": 2218} {"train_loss": -42.0684928894043, "global_step": 268394, "epoch": 2218} {"train_loss": -42.56624984741211, "global_step": 268395, "epoch": 2218} {"train_loss": -41.58101272583008, "global_step": 268396, "epoch": 2218} {"train_loss": -41.98419952392578, "global_step": 268397, "epoch": 2218} {"train_loss": -42.114688873291016, "global_step": 268398, "epoch": 2218} {"train_loss": -42.75944137573242, "global_step": 268399, "epoch": 2218} {"train_loss": -42.151737213134766, "global_step": 268400, "epoch": 2218} {"train_loss": -43.12019729614258, "global_step": 268401, "epoch": 2218} {"train_loss": -42.72113037109375, "global_step": 268402, "epoch": 2218} {"train_loss": -43.11652755737305, "global_step": 268403, "epoch": 2218} {"train_loss": -42.863136291503906, "global_step": 268404, "epoch": 2218} {"train_loss": -42.7056999206543, "global_step": 268405, "epoch": 2218} {"train_loss": -43.2087516784668, "global_step": 268406, "epoch": 2218} {"train_loss": -43.02199172973633, "global_step": 268407, "epoch": 2218} {"train_loss": -42.83552169799805, "global_step": 268408, "epoch": 2218} {"train_loss": -43.456398010253906, "global_step": 268409, "epoch": 2218} {"train_loss": -43.2640266418457, "global_step": 268410, "epoch": 2218} {"train_loss": -42.627662658691406, "global_step": 268411, "epoch": 2218} {"train_loss": -42.54304504394531, "global_step": 268412, "epoch": 2218} {"train_loss": -43.25285720825195, "global_step": 268413, "epoch": 2218} {"train_loss": -42.62222671508789, "global_step": 268414, "epoch": 2218} {"train_loss": -42.765010833740234, "global_step": 268415, "epoch": 2218} {"train_loss": -43.56925582885742, "global_step": 268416, "epoch": 2218} {"train_loss": -43.196407318115234, "global_step": 268417, "epoch": 2218} {"train_loss": -43.29369354248047, "global_step": 268418, "epoch": 2218} {"train_loss": -43.22892379760742, "global_step": 268419, "epoch": 2218} {"train_loss": -43.374568939208984, "global_step": 268420, "epoch": 2218} {"train_loss": -43.657936096191406, "global_step": 268421, "epoch": 2218} {"train_loss": -43.3751335144043, "global_step": 268422, "epoch": 2218} {"train_loss": -43.43223190307617, "global_step": 268423, "epoch": 2218} {"train_loss": -43.76136779785156, "global_step": 268424, "epoch": 2218} {"train_loss": -43.0577507019043, "global_step": 268425, "epoch": 2218} {"train_loss": -43.695106506347656, "global_step": 268426, "epoch": 2218} {"train_loss": -43.337867736816406, "global_step": 268427, "epoch": 2218} {"train_loss": -43.97811508178711, "global_step": 268428, "epoch": 2218} {"train_loss": -43.69047546386719, "global_step": 268429, "epoch": 2218} {"train_loss": -43.558284759521484, "global_step": 268430, "epoch": 2218} {"train_loss": -43.86385726928711, "global_step": 268431, "epoch": 2218} {"train_loss": -43.777740478515625, "global_step": 268432, "epoch": 2218} {"train_loss": -44.278297424316406, "global_step": 268433, "epoch": 2218} {"train_loss": -44.028907775878906, "global_step": 268434, "epoch": 2218} {"train_loss": -44.15986251831055, "global_step": 268435, "epoch": 2218} {"train_loss": -44.11962890625, "global_step": 268436, "epoch": 2218} {"train_loss": -44.06622314453125, "global_step": 268437, "epoch": 2218} {"train_loss": -44.23347091674805, "global_step": 268438, "epoch": 2218} {"train_loss": -43.9586296081543, "global_step": 268439, "epoch": 2218} {"train_loss": -44.07143020629883, "global_step": 268440, "epoch": 2218} {"train_loss": -44.3558464050293, "global_step": 268441, "epoch": 2218} {"train_loss": -44.249229431152344, "global_step": 268442, "epoch": 2218} {"train_loss": -44.166603088378906, "global_step": 268443, "epoch": 2218} {"train_loss": -44.77079391479492, "global_step": 268444, "epoch": 2218} {"train_loss": -44.128868103027344, "global_step": 268445, "epoch": 2218} {"train_loss": -44.24054718017578, "global_step": 268446, "epoch": 2218} {"train_loss": -43.86408615112305, "global_step": 268447, "epoch": 2218} {"train_loss": -44.220184326171875, "global_step": 268448, "epoch": 2218} {"train_loss": -43.945106506347656, "global_step": 268449, "epoch": 2218} {"train_loss": -44.73426055908203, "global_step": 268450, "epoch": 2218} {"train_loss": -44.20841598510742, "global_step": 268451, "epoch": 2218} {"train_loss": -44.350677490234375, "global_step": 268452, "epoch": 2218} {"train_loss": -44.40705490112305, "global_step": 268453, "epoch": 2218} {"train_loss": -44.899112701416016, "global_step": 268454, "epoch": 2218} {"train_loss": -44.270809173583984, "global_step": 268455, "epoch": 2218} {"train_loss": -44.54124069213867, "global_step": 268456, "epoch": 2218} {"train_loss": -44.19157791137695, "global_step": 268457, "epoch": 2218} {"train_loss": -44.843223571777344, "global_step": 268458, "epoch": 2218} {"train_loss": -44.1867561340332, "global_step": 268459, "epoch": 2218} {"train_loss": -42.40091323852539, "global_step": 268460, "epoch": 2218} {"train_loss": -40.4207763671875, "global_step": 268461, "epoch": 2218} {"train_loss": -41.96274185180664, "global_step": 268462, "epoch": 2218} {"train_loss": -42.67878723144531, "global_step": 268463, "epoch": 2218} {"train_loss": -41.46876907348633, "global_step": 268464, "epoch": 2218} {"train_loss": -42.02581024169922, "global_step": 268465, "epoch": 2218} {"train_loss": -40.5449333190918, "global_step": 268466, "epoch": 2218} {"train_loss": -42.732452392578125, "global_step": 268467, "epoch": 2218} {"train_loss": -42.40397262573242, "global_step": 268468, "epoch": 2218} {"train_loss": -40.82660675048828, "global_step": 268469, "epoch": 2218} {"train_loss": -43.31235885620117, "global_step": 268470, "epoch": 2218} {"train_loss": -42.259742736816406, "global_step": 268471, "epoch": 2218} {"train_loss": -40.85182189941406, "global_step": 268472, "epoch": 2218} {"train_loss": -41.2218017578125, "global_step": 268473, "epoch": 2218} {"train_loss": -41.285091400146484, "global_step": 268474, "epoch": 2218} {"train_loss": -41.80402374267578, "global_step": 268475, "epoch": 2218} {"train_loss": -43.00565719604492, "global_step": 268476, "epoch": 2218} {"train_loss": -43.17463302612305, "global_step": 268477, "epoch": 2218} {"train_loss": -42.66489028930664, "global_step": 268478, "epoch": 2218} {"train_loss": -42.557769775390625, "global_step": 268479, "epoch": 2218} {"train_loss": -43.0998420715332, "global_step": 268480, "epoch": 2218} {"train_loss": -42.554351806640625, "global_step": 268481, "epoch": 2218} {"train_loss": -43.198570251464844, "global_step": 268482, "epoch": 2218} {"train_loss": -43.36818313598633, "global_step": 268483, "epoch": 2218} {"train_loss": -42.68630599975586, "global_step": 268484, "epoch": 2218} {"train_loss": -43.3311882019043, "global_step": 268485, "epoch": 2218} {"train_loss": -43.648475646972656, "global_step": 268486, "epoch": 2218} {"train_loss": -43.835548400878906, "global_step": 268487, "epoch": 2218} {"train_loss": -43.686187744140625, "global_step": 268488, "epoch": 2218} {"train_loss": -42.62881088256836, "global_step": 268489, "epoch": 2218} {"train_loss": -41.63180160522461, "global_step": 268490, "epoch": 2218} {"train_loss": -43.31180191040039, "global_step": 268491, "epoch": 2218} {"train_loss": -42.778682708740234, "global_step": 268492, "epoch": 2218} {"train_loss": -42.51312255859375, "global_step": 268493, "epoch": 2218} {"train_loss": -43.240875244140625, "global_step": 268494, "epoch": 2218} {"train_loss": -42.59165573120117, "global_step": 268495, "epoch": 2218} {"train_loss": -42.99486541748047, "global_step": 268496, "epoch": 2218} {"train_loss": -43.299461364746094, "global_step": 268497, "epoch": 2218} {"train_loss": -42.9344451841244, "global_step": 268498, "epoch": 2218, "val_loss": 2790575.0} {"train_loss": -43.49177551269531, "global_step": 268499, "epoch": 2219} {"train_loss": -43.07722091674805, "global_step": 268500, "epoch": 2219} {"train_loss": -42.75852584838867, "global_step": 268501, "epoch": 2219} {"train_loss": -42.92438507080078, "global_step": 268502, "epoch": 2219} {"train_loss": -43.90871047973633, "global_step": 268503, "epoch": 2219} {"train_loss": -43.51430130004883, "global_step": 268504, "epoch": 2219} {"train_loss": -44.11275863647461, "global_step": 268505, "epoch": 2219} {"train_loss": -44.14527893066406, "global_step": 268506, "epoch": 2219} {"train_loss": -43.567054748535156, "global_step": 268507, "epoch": 2219} {"train_loss": -44.1408805847168, "global_step": 268508, "epoch": 2219} {"train_loss": -43.858158111572266, "global_step": 268509, "epoch": 2219} {"train_loss": -43.527767181396484, "global_step": 268510, "epoch": 2219} {"train_loss": -42.63347244262695, "global_step": 268511, "epoch": 2219} {"train_loss": -43.90061569213867, "global_step": 268512, "epoch": 2219} {"train_loss": -42.893184661865234, "global_step": 268513, "epoch": 2219} {"train_loss": -41.91937255859375, "global_step": 268514, "epoch": 2219} {"train_loss": -44.04490280151367, "global_step": 268515, "epoch": 2219} {"train_loss": -41.96388626098633, "global_step": 268516, "epoch": 2219} {"train_loss": -42.78863525390625, "global_step": 268517, "epoch": 2219} {"train_loss": -43.16935348510742, "global_step": 268518, "epoch": 2219} {"train_loss": -41.37965774536133, "global_step": 268519, "epoch": 2219} {"train_loss": -43.827392578125, "global_step": 268520, "epoch": 2219} {"train_loss": -42.204166412353516, "global_step": 268521, "epoch": 2219} {"train_loss": -41.759544372558594, "global_step": 268522, "epoch": 2219} {"train_loss": -43.138851165771484, "global_step": 268523, "epoch": 2219} {"train_loss": -41.80580520629883, "global_step": 268524, "epoch": 2219} {"train_loss": -43.1544075012207, "global_step": 268525, "epoch": 2219} {"train_loss": -40.62264633178711, "global_step": 268526, "epoch": 2219} {"train_loss": -43.478126525878906, "global_step": 268527, "epoch": 2219} {"train_loss": -41.11257553100586, "global_step": 268528, "epoch": 2219} {"train_loss": -41.85251998901367, "global_step": 268529, "epoch": 2219} {"train_loss": -42.67500686645508, "global_step": 268530, "epoch": 2219} {"train_loss": -41.50925064086914, "global_step": 268531, "epoch": 2219} {"train_loss": -42.12726974487305, "global_step": 268532, "epoch": 2219} {"train_loss": -41.59695053100586, "global_step": 268533, "epoch": 2219} {"train_loss": -41.91157150268555, "global_step": 268534, "epoch": 2219} {"train_loss": -42.29909896850586, "global_step": 268535, "epoch": 2219} {"train_loss": -40.130191802978516, "global_step": 268536, "epoch": 2219} {"train_loss": -41.959869384765625, "global_step": 268537, "epoch": 2219} {"train_loss": -38.88190460205078, "global_step": 268538, "epoch": 2219} {"train_loss": -38.27494430541992, "global_step": 268539, "epoch": 2219} {"train_loss": -39.21980285644531, "global_step": 268540, "epoch": 2219} {"train_loss": -38.59654998779297, "global_step": 268541, "epoch": 2219} {"train_loss": -39.10030746459961, "global_step": 268542, "epoch": 2219} {"train_loss": -38.639774322509766, "global_step": 268543, "epoch": 2219} {"train_loss": -38.59548568725586, "global_step": 268544, "epoch": 2219} {"train_loss": -39.917293548583984, "global_step": 268545, "epoch": 2219} {"train_loss": -41.09621810913086, "global_step": 268546, "epoch": 2219} {"train_loss": -40.34835433959961, "global_step": 268547, "epoch": 2219} {"train_loss": -39.919090270996094, "global_step": 268548, "epoch": 2219} {"train_loss": -41.11815643310547, "global_step": 268549, "epoch": 2219} {"train_loss": -40.57908248901367, "global_step": 268550, "epoch": 2219} {"train_loss": -41.436553955078125, "global_step": 268551, "epoch": 2219} {"train_loss": -40.34133529663086, "global_step": 268552, "epoch": 2219} {"train_loss": -42.105953216552734, "global_step": 268553, "epoch": 2219} {"train_loss": -42.12249755859375, "global_step": 268554, "epoch": 2219} {"train_loss": -42.170326232910156, "global_step": 268555, "epoch": 2219} {"train_loss": -42.13698196411133, "global_step": 268556, "epoch": 2219} {"train_loss": -41.634864807128906, "global_step": 268557, "epoch": 2219} {"train_loss": -42.35056686401367, "global_step": 268558, "epoch": 2219} {"train_loss": -42.45130920410156, "global_step": 268559, "epoch": 2219} {"train_loss": -42.469112396240234, "global_step": 268560, "epoch": 2219} {"train_loss": -42.9940299987793, "global_step": 268561, "epoch": 2219} {"train_loss": -42.506954193115234, "global_step": 268562, "epoch": 2219} {"train_loss": -42.91072082519531, "global_step": 268563, "epoch": 2219} {"train_loss": -42.51458740234375, "global_step": 268564, "epoch": 2219} {"train_loss": -43.09583282470703, "global_step": 268565, "epoch": 2219} {"train_loss": -42.52588653564453, "global_step": 268566, "epoch": 2219} {"train_loss": -42.0105094909668, "global_step": 268567, "epoch": 2219} {"train_loss": -42.78384017944336, "global_step": 268568, "epoch": 2219} {"train_loss": -42.339046478271484, "global_step": 268569, "epoch": 2219} {"train_loss": -41.79311752319336, "global_step": 268570, "epoch": 2219} {"train_loss": -42.58412551879883, "global_step": 268571, "epoch": 2219} {"train_loss": -43.43721008300781, "global_step": 268572, "epoch": 2219} {"train_loss": -42.89149475097656, "global_step": 268573, "epoch": 2219} {"train_loss": -43.05985641479492, "global_step": 268574, "epoch": 2219} {"train_loss": -42.29392623901367, "global_step": 268575, "epoch": 2219} {"train_loss": -42.853553771972656, "global_step": 268576, "epoch": 2219} {"train_loss": -43.108272552490234, "global_step": 268577, "epoch": 2219} {"train_loss": -43.588558197021484, "global_step": 268578, "epoch": 2219} {"train_loss": -43.2028923034668, "global_step": 268579, "epoch": 2219} {"train_loss": -43.563438415527344, "global_step": 268580, "epoch": 2219} {"train_loss": -43.38261795043945, "global_step": 268581, "epoch": 2219} {"train_loss": -43.790767669677734, "global_step": 268582, "epoch": 2219} {"train_loss": -43.220741271972656, "global_step": 268583, "epoch": 2219} {"train_loss": -43.13694381713867, "global_step": 268584, "epoch": 2219} {"train_loss": -43.42942810058594, "global_step": 268585, "epoch": 2219} {"train_loss": -44.018348693847656, "global_step": 268586, "epoch": 2219} {"train_loss": -43.65085983276367, "global_step": 268587, "epoch": 2219} {"train_loss": -43.83596420288086, "global_step": 268588, "epoch": 2219} {"train_loss": -43.16880416870117, "global_step": 268589, "epoch": 2219} {"train_loss": -43.478515625, "global_step": 268590, "epoch": 2219} {"train_loss": -43.71338653564453, "global_step": 268591, "epoch": 2219} {"train_loss": -44.68722152709961, "global_step": 268592, "epoch": 2219} {"train_loss": -43.95695114135742, "global_step": 268593, "epoch": 2219} {"train_loss": -43.439476013183594, "global_step": 268594, "epoch": 2219} {"train_loss": -43.28757858276367, "global_step": 268595, "epoch": 2219} {"train_loss": -44.01814270019531, "global_step": 268596, "epoch": 2219} {"train_loss": -43.974884033203125, "global_step": 268597, "epoch": 2219} {"train_loss": -43.59302520751953, "global_step": 268598, "epoch": 2219} {"train_loss": -43.50413131713867, "global_step": 268599, "epoch": 2219} {"train_loss": -44.097103118896484, "global_step": 268600, "epoch": 2219} {"train_loss": -43.37960433959961, "global_step": 268601, "epoch": 2219} {"train_loss": -42.78073501586914, "global_step": 268602, "epoch": 2219} {"train_loss": -42.0970458984375, "global_step": 268603, "epoch": 2219} {"train_loss": -43.241920471191406, "global_step": 268604, "epoch": 2219} {"train_loss": -44.0601806640625, "global_step": 268605, "epoch": 2219} {"train_loss": -43.78926467895508, "global_step": 268606, "epoch": 2219} {"train_loss": -43.793983459472656, "global_step": 268607, "epoch": 2219} {"train_loss": -43.86151885986328, "global_step": 268608, "epoch": 2219} {"train_loss": -44.095821380615234, "global_step": 268609, "epoch": 2219} {"train_loss": -43.324363708496094, "global_step": 268610, "epoch": 2219} {"train_loss": -44.65414047241211, "global_step": 268611, "epoch": 2219} {"train_loss": -43.7955436706543, "global_step": 268612, "epoch": 2219} {"train_loss": -42.592445373535156, "global_step": 268613, "epoch": 2219} {"train_loss": -42.595272064208984, "global_step": 268614, "epoch": 2219} {"train_loss": -43.0418815612793, "global_step": 268615, "epoch": 2219} {"train_loss": -43.80685043334961, "global_step": 268616, "epoch": 2219} {"train_loss": -43.563819885253906, "global_step": 268617, "epoch": 2219} {"train_loss": -42.69560241699219, "global_step": 268618, "epoch": 2219} {"train_loss": -42.57895988275197, "global_step": 268619, "epoch": 2219, "val_loss": 2734810.25} {"train_loss": -42.70344924926758, "global_step": 268620, "epoch": 2220} {"train_loss": -43.26540756225586, "global_step": 268621, "epoch": 2220} {"train_loss": -41.91510009765625, "global_step": 268622, "epoch": 2220} {"train_loss": -43.74309158325195, "global_step": 268623, "epoch": 2220} {"train_loss": -42.46841049194336, "global_step": 268624, "epoch": 2220} {"train_loss": -41.44016647338867, "global_step": 268625, "epoch": 2220} {"train_loss": -41.755943298339844, "global_step": 268626, "epoch": 2220} {"train_loss": -40.23064041137695, "global_step": 268627, "epoch": 2220} {"train_loss": -41.11161422729492, "global_step": 268628, "epoch": 2220} {"train_loss": -42.973854064941406, "global_step": 268629, "epoch": 2220} {"train_loss": -40.333553314208984, "global_step": 268630, "epoch": 2220} {"train_loss": -40.84391403198242, "global_step": 268631, "epoch": 2220} {"train_loss": -41.2163200378418, "global_step": 268632, "epoch": 2220} {"train_loss": -41.93365478515625, "global_step": 268633, "epoch": 2220} {"train_loss": -41.244327545166016, "global_step": 268634, "epoch": 2220} {"train_loss": -43.32125473022461, "global_step": 268635, "epoch": 2220} {"train_loss": -39.462791442871094, "global_step": 268636, "epoch": 2220} {"train_loss": -42.70230484008789, "global_step": 268637, "epoch": 2220} {"train_loss": -40.97366714477539, "global_step": 268638, "epoch": 2220} {"train_loss": -42.61287307739258, "global_step": 268639, "epoch": 2220} {"train_loss": -41.98484420776367, "global_step": 268640, "epoch": 2220} {"train_loss": -40.94670867919922, "global_step": 268641, "epoch": 2220} {"train_loss": -41.2923583984375, "global_step": 268642, "epoch": 2220} {"train_loss": -41.51919174194336, "global_step": 268643, "epoch": 2220} {"train_loss": -42.53407669067383, "global_step": 268644, "epoch": 2220} {"train_loss": -40.88851547241211, "global_step": 268645, "epoch": 2220} {"train_loss": -42.71673583984375, "global_step": 268646, "epoch": 2220} {"train_loss": -40.43702697753906, "global_step": 268647, "epoch": 2220} {"train_loss": -43.011436462402344, "global_step": 268648, "epoch": 2220} {"train_loss": -41.42328643798828, "global_step": 268649, "epoch": 2220} {"train_loss": -42.98831558227539, "global_step": 268650, "epoch": 2220} {"train_loss": -40.41463851928711, "global_step": 268651, "epoch": 2220} {"train_loss": -42.298194885253906, "global_step": 268652, "epoch": 2220} {"train_loss": -41.14226150512695, "global_step": 268653, "epoch": 2220} {"train_loss": -41.75122833251953, "global_step": 268654, "epoch": 2220} {"train_loss": -42.320865631103516, "global_step": 268655, "epoch": 2220} {"train_loss": -41.58388137817383, "global_step": 268656, "epoch": 2220} {"train_loss": -43.1478385925293, "global_step": 268657, "epoch": 2220} {"train_loss": -42.65566635131836, "global_step": 268658, "epoch": 2220} {"train_loss": -42.63539505004883, "global_step": 268659, "epoch": 2220} {"train_loss": -41.692169189453125, "global_step": 268660, "epoch": 2220} {"train_loss": -43.075340270996094, "global_step": 268661, "epoch": 2220} {"train_loss": -42.261470794677734, "global_step": 268662, "epoch": 2220} {"train_loss": -43.301025390625, "global_step": 268663, "epoch": 2220} {"train_loss": -43.55217742919922, "global_step": 268664, "epoch": 2220} {"train_loss": -43.09906768798828, "global_step": 268665, "epoch": 2220} {"train_loss": -43.285030364990234, "global_step": 268666, "epoch": 2220} {"train_loss": -43.4513053894043, "global_step": 268667, "epoch": 2220} {"train_loss": -43.04704666137695, "global_step": 268668, "epoch": 2220} {"train_loss": -43.1077766418457, "global_step": 268669, "epoch": 2220} {"train_loss": -43.37995529174805, "global_step": 268670, "epoch": 2220} {"train_loss": -43.1645393371582, "global_step": 268671, "epoch": 2220} {"train_loss": -42.275272369384766, "global_step": 268672, "epoch": 2220} {"train_loss": -43.58054733276367, "global_step": 268673, "epoch": 2220} {"train_loss": -43.618167877197266, "global_step": 268674, "epoch": 2220} {"train_loss": -41.705135345458984, "global_step": 268675, "epoch": 2220} {"train_loss": -42.31852340698242, "global_step": 268676, "epoch": 2220} {"train_loss": -43.23972702026367, "global_step": 268677, "epoch": 2220} {"train_loss": -42.736629486083984, "global_step": 268678, "epoch": 2220} {"train_loss": -43.45570755004883, "global_step": 268679, "epoch": 2220} {"train_loss": -43.44883346557617, "global_step": 268680, "epoch": 2220} {"train_loss": -43.357662200927734, "global_step": 268681, "epoch": 2220} {"train_loss": -42.64912033081055, "global_step": 268682, "epoch": 2220} {"train_loss": -43.8012809753418, "global_step": 268683, "epoch": 2220} {"train_loss": -43.29226303100586, "global_step": 268684, "epoch": 2220} {"train_loss": -41.056095123291016, "global_step": 268685, "epoch": 2220} {"train_loss": -41.91994094848633, "global_step": 268686, "epoch": 2220} {"train_loss": -43.661865234375, "global_step": 268687, "epoch": 2220} {"train_loss": -42.8387565612793, "global_step": 268688, "epoch": 2220} {"train_loss": -41.872962951660156, "global_step": 268689, "epoch": 2220} {"train_loss": -43.35350036621094, "global_step": 268690, "epoch": 2220} {"train_loss": -43.38279342651367, "global_step": 268691, "epoch": 2220} {"train_loss": -42.646766662597656, "global_step": 268692, "epoch": 2220} {"train_loss": -43.4272346496582, "global_step": 268693, "epoch": 2220} {"train_loss": -43.976470947265625, "global_step": 268694, "epoch": 2220} {"train_loss": -43.50291442871094, "global_step": 268695, "epoch": 2220} {"train_loss": -43.60847854614258, "global_step": 268696, "epoch": 2220} {"train_loss": -43.19134521484375, "global_step": 268697, "epoch": 2220} {"train_loss": -42.44294357299805, "global_step": 268698, "epoch": 2220} {"train_loss": -43.76447677612305, "global_step": 268699, "epoch": 2220} {"train_loss": -43.247962951660156, "global_step": 268700, "epoch": 2220} {"train_loss": -43.22286605834961, "global_step": 268701, "epoch": 2220} {"train_loss": -44.00058364868164, "global_step": 268702, "epoch": 2220} {"train_loss": -43.533565521240234, "global_step": 268703, "epoch": 2220} {"train_loss": -42.98783493041992, "global_step": 268704, "epoch": 2220} {"train_loss": -42.450904846191406, "global_step": 268705, "epoch": 2220} {"train_loss": -43.3664436340332, "global_step": 268706, "epoch": 2220} {"train_loss": -43.02946090698242, "global_step": 268707, "epoch": 2220} {"train_loss": -43.15724563598633, "global_step": 268708, "epoch": 2220} {"train_loss": -43.4368896484375, "global_step": 268709, "epoch": 2220} {"train_loss": -44.03464889526367, "global_step": 268710, "epoch": 2220} {"train_loss": -43.770179748535156, "global_step": 268711, "epoch": 2220} {"train_loss": -43.19183349609375, "global_step": 268712, "epoch": 2220} {"train_loss": -43.664737701416016, "global_step": 268713, "epoch": 2220} {"train_loss": -44.362789154052734, "global_step": 268714, "epoch": 2220} {"train_loss": -43.140724182128906, "global_step": 268715, "epoch": 2220} {"train_loss": -43.81389236450195, "global_step": 268716, "epoch": 2220} {"train_loss": -43.290584564208984, "global_step": 268717, "epoch": 2220} {"train_loss": -43.33829879760742, "global_step": 268718, "epoch": 2220} {"train_loss": -43.03384780883789, "global_step": 268719, "epoch": 2220} {"train_loss": -44.02479934692383, "global_step": 268720, "epoch": 2220} {"train_loss": -44.4053840637207, "global_step": 268721, "epoch": 2220} {"train_loss": -43.77651596069336, "global_step": 268722, "epoch": 2220} {"train_loss": -42.7630500793457, "global_step": 268723, "epoch": 2220} {"train_loss": -43.55960464477539, "global_step": 268724, "epoch": 2220} {"train_loss": -43.75048828125, "global_step": 268725, "epoch": 2220} {"train_loss": -43.71427536010742, "global_step": 268726, "epoch": 2220} {"train_loss": -43.255367279052734, "global_step": 268727, "epoch": 2220} {"train_loss": -42.710296630859375, "global_step": 268728, "epoch": 2220} {"train_loss": -43.168025970458984, "global_step": 268729, "epoch": 2220} {"train_loss": -43.379459381103516, "global_step": 268730, "epoch": 2220} {"train_loss": -43.301475524902344, "global_step": 268731, "epoch": 2220} {"train_loss": -43.60444259643555, "global_step": 268732, "epoch": 2220} {"train_loss": -43.57583236694336, "global_step": 268733, "epoch": 2220} {"train_loss": -43.71220779418945, "global_step": 268734, "epoch": 2220} {"train_loss": -42.8697509765625, "global_step": 268735, "epoch": 2220} {"train_loss": -43.70743179321289, "global_step": 268736, "epoch": 2220} {"train_loss": -43.36295700073242, "global_step": 268737, "epoch": 2220} {"train_loss": -43.84830856323242, "global_step": 268738, "epoch": 2220} {"train_loss": -43.37622833251953, "global_step": 268739, "epoch": 2220} {"train_loss": -42.77374532400084, "global_step": 268740, "epoch": 2220, "val_loss": 2737595.75} {"train_loss": -42.032196044921875, "global_step": 268741, "epoch": 2221} {"train_loss": -42.241634368896484, "global_step": 268742, "epoch": 2221} {"train_loss": -43.11924362182617, "global_step": 268743, "epoch": 2221} {"train_loss": -43.179683685302734, "global_step": 268744, "epoch": 2221} {"train_loss": -40.6585807800293, "global_step": 268745, "epoch": 2221} {"train_loss": -40.656673431396484, "global_step": 268746, "epoch": 2221} {"train_loss": -39.14805603027344, "global_step": 268747, "epoch": 2221} {"train_loss": -37.82129669189453, "global_step": 268748, "epoch": 2221} {"train_loss": -41.978641510009766, "global_step": 268749, "epoch": 2221} {"train_loss": -37.44565963745117, "global_step": 268750, "epoch": 2221} {"train_loss": -40.32606887817383, "global_step": 268751, "epoch": 2221} {"train_loss": -40.9022331237793, "global_step": 268752, "epoch": 2221} {"train_loss": -42.61207580566406, "global_step": 268753, "epoch": 2221} {"train_loss": -39.227596282958984, "global_step": 268754, "epoch": 2221} {"train_loss": -42.38471984863281, "global_step": 268755, "epoch": 2221} {"train_loss": -41.04890441894531, "global_step": 268756, "epoch": 2221} {"train_loss": -40.42085266113281, "global_step": 268757, "epoch": 2221} {"train_loss": -41.56407165527344, "global_step": 268758, "epoch": 2221} {"train_loss": -43.01979446411133, "global_step": 268759, "epoch": 2221} {"train_loss": -42.005043029785156, "global_step": 268760, "epoch": 2221} {"train_loss": -42.21882247924805, "global_step": 268761, "epoch": 2221} {"train_loss": -42.501502990722656, "global_step": 268762, "epoch": 2221} {"train_loss": -42.17509460449219, "global_step": 268763, "epoch": 2221} {"train_loss": -42.24671173095703, "global_step": 268764, "epoch": 2221} {"train_loss": -42.661373138427734, "global_step": 268765, "epoch": 2221} {"train_loss": -42.27894592285156, "global_step": 268766, "epoch": 2221} {"train_loss": -42.87004852294922, "global_step": 268767, "epoch": 2221} {"train_loss": -42.601348876953125, "global_step": 268768, "epoch": 2221} {"train_loss": -42.031280517578125, "global_step": 268769, "epoch": 2221} {"train_loss": -42.49826431274414, "global_step": 268770, "epoch": 2221} {"train_loss": -43.48136520385742, "global_step": 268771, "epoch": 2221} {"train_loss": -41.923885345458984, "global_step": 268772, "epoch": 2221} {"train_loss": -41.39723205566406, "global_step": 268773, "epoch": 2221} {"train_loss": -43.21523666381836, "global_step": 268774, "epoch": 2221} {"train_loss": -42.51796340942383, "global_step": 268775, "epoch": 2221} {"train_loss": -40.82399368286133, "global_step": 268776, "epoch": 2221} {"train_loss": -42.1995964050293, "global_step": 268777, "epoch": 2221} {"train_loss": -43.041133880615234, "global_step": 268778, "epoch": 2221} {"train_loss": -40.15267562866211, "global_step": 268779, "epoch": 2221} {"train_loss": -42.903968811035156, "global_step": 268780, "epoch": 2221} {"train_loss": -42.856529235839844, "global_step": 268781, "epoch": 2221} {"train_loss": -41.32662582397461, "global_step": 268782, "epoch": 2221} {"train_loss": -43.51353073120117, "global_step": 268783, "epoch": 2221} {"train_loss": -42.42249298095703, "global_step": 268784, "epoch": 2221} {"train_loss": -42.613826751708984, "global_step": 268785, "epoch": 2221} {"train_loss": -43.113502502441406, "global_step": 268786, "epoch": 2221} {"train_loss": -43.44774627685547, "global_step": 268787, "epoch": 2221} {"train_loss": -43.76887893676758, "global_step": 268788, "epoch": 2221} {"train_loss": -43.38084030151367, "global_step": 268789, "epoch": 2221} {"train_loss": -43.030826568603516, "global_step": 268790, "epoch": 2221} {"train_loss": -43.229549407958984, "global_step": 268791, "epoch": 2221} {"train_loss": -43.83189010620117, "global_step": 268792, "epoch": 2221} {"train_loss": -43.10106658935547, "global_step": 268793, "epoch": 2221} {"train_loss": -43.228023529052734, "global_step": 268794, "epoch": 2221} {"train_loss": -43.46260452270508, "global_step": 268795, "epoch": 2221} {"train_loss": -43.73418045043945, "global_step": 268796, "epoch": 2221} {"train_loss": -43.24831771850586, "global_step": 268797, "epoch": 2221} {"train_loss": -43.262332916259766, "global_step": 268798, "epoch": 2221} {"train_loss": -43.57177734375, "global_step": 268799, "epoch": 2221} {"train_loss": -43.356201171875, "global_step": 268800, "epoch": 2221} {"train_loss": -43.36588668823242, "global_step": 268801, "epoch": 2221} {"train_loss": -43.94422912597656, "global_step": 268802, "epoch": 2221} {"train_loss": -43.752681732177734, "global_step": 268803, "epoch": 2221} {"train_loss": -44.107330322265625, "global_step": 268804, "epoch": 2221} {"train_loss": -44.633113861083984, "global_step": 268805, "epoch": 2221} {"train_loss": -43.99781036376953, "global_step": 268806, "epoch": 2221} {"train_loss": -44.02840805053711, "global_step": 268807, "epoch": 2221} {"train_loss": -44.28855514526367, "global_step": 268808, "epoch": 2221} {"train_loss": -43.9591064453125, "global_step": 268809, "epoch": 2221} {"train_loss": -44.37550735473633, "global_step": 268810, "epoch": 2221} {"train_loss": -44.7696418762207, "global_step": 268811, "epoch": 2221} {"train_loss": -44.30139923095703, "global_step": 268812, "epoch": 2221} {"train_loss": -43.975948333740234, "global_step": 268813, "epoch": 2221} {"train_loss": -43.79463577270508, "global_step": 268814, "epoch": 2221} {"train_loss": -44.11554718017578, "global_step": 268815, "epoch": 2221} {"train_loss": -44.45136260986328, "global_step": 268816, "epoch": 2221} {"train_loss": -44.39911651611328, "global_step": 268817, "epoch": 2221} {"train_loss": -44.684452056884766, "global_step": 268818, "epoch": 2221} {"train_loss": -44.1723747253418, "global_step": 268819, "epoch": 2221} {"train_loss": -44.55564498901367, "global_step": 268820, "epoch": 2221} {"train_loss": -44.39854049682617, "global_step": 268821, "epoch": 2221} {"train_loss": -44.42387390136719, "global_step": 268822, "epoch": 2221} {"train_loss": -44.467140197753906, "global_step": 268823, "epoch": 2221} {"train_loss": -44.20343780517578, "global_step": 268824, "epoch": 2221} {"train_loss": -44.21310043334961, "global_step": 268825, "epoch": 2221} {"train_loss": -44.894630432128906, "global_step": 268826, "epoch": 2221} {"train_loss": -43.97758102416992, "global_step": 268827, "epoch": 2221} {"train_loss": -43.66067123413086, "global_step": 268828, "epoch": 2221} {"train_loss": -44.17219543457031, "global_step": 268829, "epoch": 2221} {"train_loss": -44.486183166503906, "global_step": 268830, "epoch": 2221} {"train_loss": -44.73912811279297, "global_step": 268831, "epoch": 2221} {"train_loss": -43.424015045166016, "global_step": 268832, "epoch": 2221} {"train_loss": -44.80353546142578, "global_step": 268833, "epoch": 2221} {"train_loss": -45.14895248413086, "global_step": 268834, "epoch": 2221} {"train_loss": -44.5052604675293, "global_step": 268835, "epoch": 2221} {"train_loss": -43.61550521850586, "global_step": 268836, "epoch": 2221} {"train_loss": -43.58696746826172, "global_step": 268837, "epoch": 2221} {"train_loss": -43.15288162231445, "global_step": 268838, "epoch": 2221} {"train_loss": -43.45789337158203, "global_step": 268839, "epoch": 2221} {"train_loss": -44.212730407714844, "global_step": 268840, "epoch": 2221} {"train_loss": -43.8077507019043, "global_step": 268841, "epoch": 2221} {"train_loss": -42.692501068115234, "global_step": 268842, "epoch": 2221} {"train_loss": -43.04348373413086, "global_step": 268843, "epoch": 2221} {"train_loss": -43.945411682128906, "global_step": 268844, "epoch": 2221} {"train_loss": -43.6031379699707, "global_step": 268845, "epoch": 2221} {"train_loss": -42.91129684448242, "global_step": 268846, "epoch": 2221} {"train_loss": -42.037567138671875, "global_step": 268847, "epoch": 2221} {"train_loss": -43.494903564453125, "global_step": 268848, "epoch": 2221} {"train_loss": -43.78532791137695, "global_step": 268849, "epoch": 2221} {"train_loss": -43.36714553833008, "global_step": 268850, "epoch": 2221} {"train_loss": -43.0020866394043, "global_step": 268851, "epoch": 2221} {"train_loss": -42.0301628112793, "global_step": 268852, "epoch": 2221} {"train_loss": -42.55874252319336, "global_step": 268853, "epoch": 2221} {"train_loss": -42.941314697265625, "global_step": 268854, "epoch": 2221} {"train_loss": -42.34272003173828, "global_step": 268855, "epoch": 2221} {"train_loss": -43.74032211303711, "global_step": 268856, "epoch": 2221} {"train_loss": -43.23591613769531, "global_step": 268857, "epoch": 2221} {"train_loss": -42.70438003540039, "global_step": 268858, "epoch": 2221} {"train_loss": -43.2765007019043, "global_step": 268859, "epoch": 2221} {"train_loss": -43.03822708129883, "global_step": 268860, "epoch": 2221} {"train_loss": -43.00175044162214, "global_step": 268861, "epoch": 2221, "val_loss": 2697658.75} {"train_loss": -43.394020080566406, "global_step": 268862, "epoch": 2222} {"train_loss": -43.31108474731445, "global_step": 268863, "epoch": 2222} {"train_loss": -42.22762680053711, "global_step": 268864, "epoch": 2222} {"train_loss": -43.72096633911133, "global_step": 268865, "epoch": 2222} {"train_loss": -42.64591598510742, "global_step": 268866, "epoch": 2222} {"train_loss": -42.192989349365234, "global_step": 268867, "epoch": 2222} {"train_loss": -43.848060607910156, "global_step": 268868, "epoch": 2222} {"train_loss": -42.18646240234375, "global_step": 268869, "epoch": 2222} {"train_loss": -42.17938232421875, "global_step": 268870, "epoch": 2222} {"train_loss": -43.84171676635742, "global_step": 268871, "epoch": 2222} {"train_loss": -42.88754653930664, "global_step": 268872, "epoch": 2222} {"train_loss": -42.899871826171875, "global_step": 268873, "epoch": 2222} {"train_loss": -42.76532745361328, "global_step": 268874, "epoch": 2222} {"train_loss": -42.863460540771484, "global_step": 268875, "epoch": 2222} {"train_loss": -42.974891662597656, "global_step": 268876, "epoch": 2222} {"train_loss": -43.133033752441406, "global_step": 268877, "epoch": 2222} {"train_loss": -42.61415100097656, "global_step": 268878, "epoch": 2222} {"train_loss": -41.84965133666992, "global_step": 268879, "epoch": 2222} {"train_loss": -41.974430084228516, "global_step": 268880, "epoch": 2222} {"train_loss": -41.16786575317383, "global_step": 268881, "epoch": 2222} {"train_loss": -42.53672790527344, "global_step": 268882, "epoch": 2222} {"train_loss": -41.2721061706543, "global_step": 268883, "epoch": 2222} {"train_loss": -42.35329055786133, "global_step": 268884, "epoch": 2222} {"train_loss": -39.3415641784668, "global_step": 268885, "epoch": 2222} {"train_loss": -41.6629753112793, "global_step": 268886, "epoch": 2222} {"train_loss": -35.58614730834961, "global_step": 268887, "epoch": 2222} {"train_loss": -36.17156219482422, "global_step": 268888, "epoch": 2222} {"train_loss": -29.19630241394043, "global_step": 268889, "epoch": 2222} {"train_loss": -35.679683685302734, "global_step": 268890, "epoch": 2222} {"train_loss": -37.42104721069336, "global_step": 268891, "epoch": 2222} {"train_loss": -35.609500885009766, "global_step": 268892, "epoch": 2222} {"train_loss": -39.85874557495117, "global_step": 268893, "epoch": 2222} {"train_loss": -36.69340133666992, "global_step": 268894, "epoch": 2222} {"train_loss": -40.83079147338867, "global_step": 268895, "epoch": 2222} {"train_loss": -38.82857131958008, "global_step": 268896, "epoch": 2222} {"train_loss": -37.2620964050293, "global_step": 268897, "epoch": 2222} {"train_loss": -35.73707962036133, "global_step": 268898, "epoch": 2222} {"train_loss": -40.478248596191406, "global_step": 268899, "epoch": 2222} {"train_loss": -35.59940719604492, "global_step": 268900, "epoch": 2222} {"train_loss": -39.68543243408203, "global_step": 268901, "epoch": 2222} {"train_loss": -36.75081253051758, "global_step": 268902, "epoch": 2222} {"train_loss": -38.738929748535156, "global_step": 268903, "epoch": 2222} {"train_loss": -39.797760009765625, "global_step": 268904, "epoch": 2222} {"train_loss": -39.01541519165039, "global_step": 268905, "epoch": 2222} {"train_loss": -40.1187744140625, "global_step": 268906, "epoch": 2222} {"train_loss": -39.66830062866211, "global_step": 268907, "epoch": 2222} {"train_loss": -40.699729919433594, "global_step": 268908, "epoch": 2222} {"train_loss": -40.11698532104492, "global_step": 268909, "epoch": 2222} {"train_loss": -41.14228439331055, "global_step": 268910, "epoch": 2222} {"train_loss": -41.14608383178711, "global_step": 268911, "epoch": 2222} {"train_loss": -41.045772552490234, "global_step": 268912, "epoch": 2222} {"train_loss": -40.85337829589844, "global_step": 268913, "epoch": 2222} {"train_loss": -41.795780181884766, "global_step": 268914, "epoch": 2222} {"train_loss": -41.67611312866211, "global_step": 268915, "epoch": 2222} {"train_loss": -41.717987060546875, "global_step": 268916, "epoch": 2222} {"train_loss": -42.86967849731445, "global_step": 268917, "epoch": 2222} {"train_loss": -42.05192184448242, "global_step": 268918, "epoch": 2222} {"train_loss": -42.5438346862793, "global_step": 268919, "epoch": 2222} {"train_loss": -42.473121643066406, "global_step": 268920, "epoch": 2222} {"train_loss": -42.67385482788086, "global_step": 268921, "epoch": 2222} {"train_loss": -42.4820671081543, "global_step": 268922, "epoch": 2222} {"train_loss": -42.847023010253906, "global_step": 268923, "epoch": 2222} {"train_loss": -42.649932861328125, "global_step": 268924, "epoch": 2222} {"train_loss": -42.596466064453125, "global_step": 268925, "epoch": 2222} {"train_loss": -43.422576904296875, "global_step": 268926, "epoch": 2222} {"train_loss": -42.698116302490234, "global_step": 268927, "epoch": 2222} {"train_loss": -42.498226165771484, "global_step": 268928, "epoch": 2222} {"train_loss": -43.09528350830078, "global_step": 268929, "epoch": 2222} {"train_loss": -42.78105926513672, "global_step": 268930, "epoch": 2222} {"train_loss": -42.66255569458008, "global_step": 268931, "epoch": 2222} {"train_loss": -42.93116760253906, "global_step": 268932, "epoch": 2222} {"train_loss": -43.086753845214844, "global_step": 268933, "epoch": 2222} {"train_loss": -42.61625289916992, "global_step": 268934, "epoch": 2222} {"train_loss": -43.39278793334961, "global_step": 268935, "epoch": 2222} {"train_loss": -42.955318450927734, "global_step": 268936, "epoch": 2222} {"train_loss": -42.992305755615234, "global_step": 268937, "epoch": 2222} {"train_loss": -43.24319076538086, "global_step": 268938, "epoch": 2222} {"train_loss": -43.17560958862305, "global_step": 268939, "epoch": 2222} {"train_loss": -43.40031051635742, "global_step": 268940, "epoch": 2222} {"train_loss": -43.10457229614258, "global_step": 268941, "epoch": 2222} {"train_loss": -43.40487289428711, "global_step": 268942, "epoch": 2222} {"train_loss": -43.26351547241211, "global_step": 268943, "epoch": 2222} {"train_loss": -43.172767639160156, "global_step": 268944, "epoch": 2222} {"train_loss": -43.40116500854492, "global_step": 268945, "epoch": 2222} {"train_loss": -43.49525833129883, "global_step": 268946, "epoch": 2222} {"train_loss": -43.53119659423828, "global_step": 268947, "epoch": 2222} {"train_loss": -42.74849319458008, "global_step": 268948, "epoch": 2222} {"train_loss": -43.88090133666992, "global_step": 268949, "epoch": 2222} {"train_loss": -43.308387756347656, "global_step": 268950, "epoch": 2222} {"train_loss": -43.66168975830078, "global_step": 268951, "epoch": 2222} {"train_loss": -43.55632781982422, "global_step": 268952, "epoch": 2222} {"train_loss": -43.50800704956055, "global_step": 268953, "epoch": 2222} {"train_loss": -43.78205490112305, "global_step": 268954, "epoch": 2222} {"train_loss": -43.8267822265625, "global_step": 268955, "epoch": 2222} {"train_loss": -43.79356002807617, "global_step": 268956, "epoch": 2222} {"train_loss": -44.197166442871094, "global_step": 268957, "epoch": 2222} {"train_loss": -43.718204498291016, "global_step": 268958, "epoch": 2222} {"train_loss": -44.36953353881836, "global_step": 268959, "epoch": 2222} {"train_loss": -44.258846282958984, "global_step": 268960, "epoch": 2222} {"train_loss": -43.964080810546875, "global_step": 268961, "epoch": 2222} {"train_loss": -43.9642448425293, "global_step": 268962, "epoch": 2222} {"train_loss": -43.837398529052734, "global_step": 268963, "epoch": 2222} {"train_loss": -44.40471267700195, "global_step": 268964, "epoch": 2222} {"train_loss": -43.98421859741211, "global_step": 268965, "epoch": 2222} {"train_loss": -44.1437873840332, "global_step": 268966, "epoch": 2222} {"train_loss": -43.321929931640625, "global_step": 268967, "epoch": 2222} {"train_loss": -44.14216995239258, "global_step": 268968, "epoch": 2222} {"train_loss": -44.51276779174805, "global_step": 268969, "epoch": 2222} {"train_loss": -44.30719757080078, "global_step": 268970, "epoch": 2222} {"train_loss": -44.23133087158203, "global_step": 268971, "epoch": 2222} {"train_loss": -44.310646057128906, "global_step": 268972, "epoch": 2222} {"train_loss": -44.4761962890625, "global_step": 268973, "epoch": 2222} {"train_loss": -44.603519439697266, "global_step": 268974, "epoch": 2222} {"train_loss": -44.35462188720703, "global_step": 268975, "epoch": 2222} {"train_loss": -44.06593704223633, "global_step": 268976, "epoch": 2222} {"train_loss": -43.71418380737305, "global_step": 268977, "epoch": 2222} {"train_loss": -44.080135345458984, "global_step": 268978, "epoch": 2222} {"train_loss": -44.54197311401367, "global_step": 268979, "epoch": 2222} {"train_loss": -44.55892562866211, "global_step": 268980, "epoch": 2222} {"train_loss": -44.307621002197266, "global_step": 268981, "epoch": 2222} {"train_loss": -42.087975005472984, "global_step": 268982, "epoch": 2222, "val_loss": 2718625.75} {"train_loss": -44.57073211669922, "global_step": 268983, "epoch": 2223} {"train_loss": -44.674415588378906, "global_step": 268984, "epoch": 2223} {"train_loss": -44.0898323059082, "global_step": 268985, "epoch": 2223} {"train_loss": -43.528438568115234, "global_step": 268986, "epoch": 2223} {"train_loss": -43.394439697265625, "global_step": 268987, "epoch": 2223} {"train_loss": -44.061309814453125, "global_step": 268988, "epoch": 2223} {"train_loss": -44.31037139892578, "global_step": 268989, "epoch": 2223} {"train_loss": -44.4171257019043, "global_step": 268990, "epoch": 2223} {"train_loss": -41.34113693237305, "global_step": 268991, "epoch": 2223} {"train_loss": -37.61749267578125, "global_step": 268992, "epoch": 2223} {"train_loss": -31.333744049072266, "global_step": 268993, "epoch": 2223} {"train_loss": -36.0008544921875, "global_step": 268994, "epoch": 2223} {"train_loss": -41.874385833740234, "global_step": 268995, "epoch": 2223} {"train_loss": -38.43277359008789, "global_step": 268996, "epoch": 2223} {"train_loss": -37.65519332885742, "global_step": 268997, "epoch": 2223} {"train_loss": -41.087493896484375, "global_step": 268998, "epoch": 2223} {"train_loss": -41.71335983276367, "global_step": 268999, "epoch": 2223} {"train_loss": -40.43514633178711, "global_step": 269000, "epoch": 2223} {"train_loss": -41.045814514160156, "global_step": 269001, "epoch": 2223} {"train_loss": -40.34200668334961, "global_step": 269002, "epoch": 2223} {"train_loss": -40.31882095336914, "global_step": 269003, "epoch": 2223} {"train_loss": -32.60398483276367, "global_step": 269004, "epoch": 2223} {"train_loss": -37.96962356567383, "global_step": 269005, "epoch": 2223} {"train_loss": -40.15363693237305, "global_step": 269006, "epoch": 2223} {"train_loss": -38.11342239379883, "global_step": 269007, "epoch": 2223} {"train_loss": -38.726436614990234, "global_step": 269008, "epoch": 2223} {"train_loss": -40.369384765625, "global_step": 269009, "epoch": 2223} {"train_loss": -41.36774444580078, "global_step": 269010, "epoch": 2223} {"train_loss": -39.69114303588867, "global_step": 269011, "epoch": 2223} {"train_loss": -40.446876525878906, "global_step": 269012, "epoch": 2223} {"train_loss": -39.90370178222656, "global_step": 269013, "epoch": 2223} {"train_loss": -40.069488525390625, "global_step": 269014, "epoch": 2223} {"train_loss": -34.211055755615234, "global_step": 269015, "epoch": 2223} {"train_loss": -39.497127532958984, "global_step": 269016, "epoch": 2223} {"train_loss": -39.27926254272461, "global_step": 269017, "epoch": 2223} {"train_loss": -39.99951934814453, "global_step": 269018, "epoch": 2223} {"train_loss": -38.96795654296875, "global_step": 269019, "epoch": 2223} {"train_loss": -41.19284439086914, "global_step": 269020, "epoch": 2223} {"train_loss": -39.4193000793457, "global_step": 269021, "epoch": 2223} {"train_loss": -41.221256256103516, "global_step": 269022, "epoch": 2223} {"train_loss": -39.38853073120117, "global_step": 269023, "epoch": 2223} {"train_loss": -39.89077377319336, "global_step": 269024, "epoch": 2223} {"train_loss": -39.596309661865234, "global_step": 269025, "epoch": 2223} {"train_loss": -40.45597457885742, "global_step": 269026, "epoch": 2223} {"train_loss": -41.2591438293457, "global_step": 269027, "epoch": 2223} {"train_loss": -41.19990158081055, "global_step": 269028, "epoch": 2223} {"train_loss": -40.659358978271484, "global_step": 269029, "epoch": 2223} {"train_loss": -42.7364501953125, "global_step": 269030, "epoch": 2223} {"train_loss": -40.325103759765625, "global_step": 269031, "epoch": 2223} {"train_loss": -41.80011749267578, "global_step": 269032, "epoch": 2223} {"train_loss": -41.027706146240234, "global_step": 269033, "epoch": 2223} {"train_loss": -42.230987548828125, "global_step": 269034, "epoch": 2223} {"train_loss": -41.9511604309082, "global_step": 269035, "epoch": 2223} {"train_loss": -41.448970794677734, "global_step": 269036, "epoch": 2223} {"train_loss": -41.6718864440918, "global_step": 269037, "epoch": 2223} {"train_loss": -40.72549057006836, "global_step": 269038, "epoch": 2223} {"train_loss": -41.83495330810547, "global_step": 269039, "epoch": 2223} {"train_loss": -42.472957611083984, "global_step": 269040, "epoch": 2223} {"train_loss": -42.059749603271484, "global_step": 269041, "epoch": 2223} {"train_loss": -43.03153610229492, "global_step": 269042, "epoch": 2223} {"train_loss": -42.57965087890625, "global_step": 269043, "epoch": 2223} {"train_loss": -42.636993408203125, "global_step": 269044, "epoch": 2223} {"train_loss": -42.8603401184082, "global_step": 269045, "epoch": 2223} {"train_loss": -42.172340393066406, "global_step": 269046, "epoch": 2223} {"train_loss": -42.262081146240234, "global_step": 269047, "epoch": 2223} {"train_loss": -42.37274932861328, "global_step": 269048, "epoch": 2223} {"train_loss": -42.745887756347656, "global_step": 269049, "epoch": 2223} {"train_loss": -43.04920196533203, "global_step": 269050, "epoch": 2223} {"train_loss": -42.894805908203125, "global_step": 269051, "epoch": 2223} {"train_loss": -43.129554748535156, "global_step": 269052, "epoch": 2223} {"train_loss": -43.36513137817383, "global_step": 269053, "epoch": 2223} {"train_loss": -43.3953857421875, "global_step": 269054, "epoch": 2223} {"train_loss": -43.055397033691406, "global_step": 269055, "epoch": 2223} {"train_loss": -42.810115814208984, "global_step": 269056, "epoch": 2223} {"train_loss": -42.590450286865234, "global_step": 269057, "epoch": 2223} {"train_loss": -43.118717193603516, "global_step": 269058, "epoch": 2223} {"train_loss": -43.327735900878906, "global_step": 269059, "epoch": 2223} {"train_loss": -43.68913650512695, "global_step": 269060, "epoch": 2223} {"train_loss": -43.17889404296875, "global_step": 269061, "epoch": 2223} {"train_loss": -43.22962188720703, "global_step": 269062, "epoch": 2223} {"train_loss": -43.61953353881836, "global_step": 269063, "epoch": 2223} {"train_loss": -43.6209716796875, "global_step": 269064, "epoch": 2223} {"train_loss": -43.73360824584961, "global_step": 269065, "epoch": 2223} {"train_loss": -43.24058151245117, "global_step": 269066, "epoch": 2223} {"train_loss": -43.52322769165039, "global_step": 269067, "epoch": 2223} {"train_loss": -43.32258224487305, "global_step": 269068, "epoch": 2223} {"train_loss": -43.7434196472168, "global_step": 269069, "epoch": 2223} {"train_loss": -43.23582458496094, "global_step": 269070, "epoch": 2223} {"train_loss": -44.03386306762695, "global_step": 269071, "epoch": 2223} {"train_loss": -43.24827194213867, "global_step": 269072, "epoch": 2223} {"train_loss": -43.809600830078125, "global_step": 269073, "epoch": 2223} {"train_loss": -43.4830436706543, "global_step": 269074, "epoch": 2223} {"train_loss": -43.75077438354492, "global_step": 269075, "epoch": 2223} {"train_loss": -43.71699523925781, "global_step": 269076, "epoch": 2223} {"train_loss": -43.6915283203125, "global_step": 269077, "epoch": 2223} {"train_loss": -43.672969818115234, "global_step": 269078, "epoch": 2223} {"train_loss": -44.115516662597656, "global_step": 269079, "epoch": 2223} {"train_loss": -43.09033203125, "global_step": 269080, "epoch": 2223} {"train_loss": -44.11767578125, "global_step": 269081, "epoch": 2223} {"train_loss": -43.98408889770508, "global_step": 269082, "epoch": 2223} {"train_loss": -43.42724609375, "global_step": 269083, "epoch": 2223} {"train_loss": -44.34098434448242, "global_step": 269084, "epoch": 2223} {"train_loss": -44.148624420166016, "global_step": 269085, "epoch": 2223} {"train_loss": -43.64567184448242, "global_step": 269086, "epoch": 2223} {"train_loss": -43.88691329956055, "global_step": 269087, "epoch": 2223} {"train_loss": -43.8876838684082, "global_step": 269088, "epoch": 2223} {"train_loss": -44.2224235534668, "global_step": 269089, "epoch": 2223} {"train_loss": -44.18326950073242, "global_step": 269090, "epoch": 2223} {"train_loss": -43.68178939819336, "global_step": 269091, "epoch": 2223} {"train_loss": -43.720516204833984, "global_step": 269092, "epoch": 2223} {"train_loss": -43.73905944824219, "global_step": 269093, "epoch": 2223} {"train_loss": -44.051841735839844, "global_step": 269094, "epoch": 2223} {"train_loss": -42.37131881713867, "global_step": 269095, "epoch": 2223} {"train_loss": -43.70338821411133, "global_step": 269096, "epoch": 2223} {"train_loss": -44.51308059692383, "global_step": 269097, "epoch": 2223} {"train_loss": -44.272823333740234, "global_step": 269098, "epoch": 2223} {"train_loss": -44.05637741088867, "global_step": 269099, "epoch": 2223} {"train_loss": -42.29819869995117, "global_step": 269100, "epoch": 2223} {"train_loss": -21.142080307006836, "global_step": 269101, "epoch": 2223} {"train_loss": -40.89156723022461, "global_step": 269102, "epoch": 2223} {"train_loss": -41.720731703703066, "global_step": 269103, "epoch": 2223, "val_loss": 2788971.75} {"train_loss": -38.89701461791992, "global_step": 269104, "epoch": 2224} {"train_loss": -36.34123611450195, "global_step": 269105, "epoch": 2224} {"train_loss": -25.3291015625, "global_step": 269106, "epoch": 2224} {"train_loss": -34.63245391845703, "global_step": 269107, "epoch": 2224} {"train_loss": -31.110822677612305, "global_step": 269108, "epoch": 2224} {"train_loss": -27.282886505126953, "global_step": 269109, "epoch": 2224} {"train_loss": -35.14558029174805, "global_step": 269110, "epoch": 2224} {"train_loss": -37.91299057006836, "global_step": 269111, "epoch": 2224} {"train_loss": -34.75349044799805, "global_step": 269112, "epoch": 2224} {"train_loss": -36.44647979736328, "global_step": 269113, "epoch": 2224} {"train_loss": -34.01838302612305, "global_step": 269114, "epoch": 2224} {"train_loss": -28.292118072509766, "global_step": 269115, "epoch": 2224} {"train_loss": -38.79368209838867, "global_step": 269116, "epoch": 2224} {"train_loss": -35.2402458190918, "global_step": 269117, "epoch": 2224} {"train_loss": -38.456756591796875, "global_step": 269118, "epoch": 2224} {"train_loss": -38.28235626220703, "global_step": 269119, "epoch": 2224} {"train_loss": -37.82008743286133, "global_step": 269120, "epoch": 2224} {"train_loss": -37.3134765625, "global_step": 269121, "epoch": 2224} {"train_loss": -33.89020538330078, "global_step": 269122, "epoch": 2224} {"train_loss": -35.04724884033203, "global_step": 269123, "epoch": 2224} {"train_loss": -38.461952209472656, "global_step": 269124, "epoch": 2224} {"train_loss": -39.04052734375, "global_step": 269125, "epoch": 2224} {"train_loss": -40.8619384765625, "global_step": 269126, "epoch": 2224} {"train_loss": -37.860626220703125, "global_step": 269127, "epoch": 2224} {"train_loss": -39.43205642700195, "global_step": 269128, "epoch": 2224} {"train_loss": -40.54523468017578, "global_step": 269129, "epoch": 2224} {"train_loss": -40.38477325439453, "global_step": 269130, "epoch": 2224} {"train_loss": -41.10978317260742, "global_step": 269131, "epoch": 2224} {"train_loss": -40.8233757019043, "global_step": 269132, "epoch": 2224} {"train_loss": -40.323055267333984, "global_step": 269133, "epoch": 2224} {"train_loss": -40.45903778076172, "global_step": 269134, "epoch": 2224} {"train_loss": -41.01229476928711, "global_step": 269135, "epoch": 2224} {"train_loss": -41.08346176147461, "global_step": 269136, "epoch": 2224} {"train_loss": -40.7440299987793, "global_step": 269137, "epoch": 2224} {"train_loss": -40.83305740356445, "global_step": 269138, "epoch": 2224} {"train_loss": -40.82861328125, "global_step": 269139, "epoch": 2224} {"train_loss": -41.57709884643555, "global_step": 269140, "epoch": 2224} {"train_loss": -41.18449783325195, "global_step": 269141, "epoch": 2224} {"train_loss": -41.00065612792969, "global_step": 269142, "epoch": 2224} {"train_loss": -41.33360290527344, "global_step": 269143, "epoch": 2224} {"train_loss": -41.62654495239258, "global_step": 269144, "epoch": 2224} {"train_loss": -42.171417236328125, "global_step": 269145, "epoch": 2224} {"train_loss": -40.92715835571289, "global_step": 269146, "epoch": 2224} {"train_loss": -40.94753646850586, "global_step": 269147, "epoch": 2224} {"train_loss": -41.1895637512207, "global_step": 269148, "epoch": 2224} {"train_loss": -40.63889694213867, "global_step": 269149, "epoch": 2224} {"train_loss": -41.45759582519531, "global_step": 269150, "epoch": 2224} {"train_loss": -42.0789909362793, "global_step": 269151, "epoch": 2224} {"train_loss": -42.14888000488281, "global_step": 269152, "epoch": 2224} {"train_loss": -41.3872184753418, "global_step": 269153, "epoch": 2224} {"train_loss": -42.0267219543457, "global_step": 269154, "epoch": 2224} {"train_loss": -41.72862243652344, "global_step": 269155, "epoch": 2224} {"train_loss": -41.89787292480469, "global_step": 269156, "epoch": 2224} {"train_loss": -41.62435531616211, "global_step": 269157, "epoch": 2224} {"train_loss": -42.211585998535156, "global_step": 269158, "epoch": 2224} {"train_loss": -41.9542121887207, "global_step": 269159, "epoch": 2224} {"train_loss": -42.14439392089844, "global_step": 269160, "epoch": 2224} {"train_loss": -42.16634750366211, "global_step": 269161, "epoch": 2224} {"train_loss": -42.148677825927734, "global_step": 269162, "epoch": 2224} {"train_loss": -42.55980682373047, "global_step": 269163, "epoch": 2224} {"train_loss": -42.99306106567383, "global_step": 269164, "epoch": 2224} {"train_loss": -41.682403564453125, "global_step": 269165, "epoch": 2224} {"train_loss": -42.9049072265625, "global_step": 269166, "epoch": 2224} {"train_loss": -42.518978118896484, "global_step": 269167, "epoch": 2224} {"train_loss": -42.064361572265625, "global_step": 269168, "epoch": 2224} {"train_loss": -43.20032501220703, "global_step": 269169, "epoch": 2224} {"train_loss": -42.16496276855469, "global_step": 269170, "epoch": 2224} {"train_loss": -42.664833068847656, "global_step": 269171, "epoch": 2224} {"train_loss": -43.07766342163086, "global_step": 269172, "epoch": 2224} {"train_loss": -42.578914642333984, "global_step": 269173, "epoch": 2224} {"train_loss": -42.9071159362793, "global_step": 269174, "epoch": 2224} {"train_loss": -42.561187744140625, "global_step": 269175, "epoch": 2224} {"train_loss": -43.247222900390625, "global_step": 269176, "epoch": 2224} {"train_loss": -43.10962677001953, "global_step": 269177, "epoch": 2224} {"train_loss": -42.16489791870117, "global_step": 269178, "epoch": 2224} {"train_loss": -42.83524703979492, "global_step": 269179, "epoch": 2224} {"train_loss": -42.645782470703125, "global_step": 269180, "epoch": 2224} {"train_loss": -42.636085510253906, "global_step": 269181, "epoch": 2224} {"train_loss": -43.0223503112793, "global_step": 269182, "epoch": 2224} {"train_loss": -43.327938079833984, "global_step": 269183, "epoch": 2224} {"train_loss": -42.79462432861328, "global_step": 269184, "epoch": 2224} {"train_loss": -43.12370681762695, "global_step": 269185, "epoch": 2224} {"train_loss": -43.17082595825195, "global_step": 269186, "epoch": 2224} {"train_loss": -43.024208068847656, "global_step": 269187, "epoch": 2224} {"train_loss": -43.27134323120117, "global_step": 269188, "epoch": 2224} {"train_loss": -42.92067337036133, "global_step": 269189, "epoch": 2224} {"train_loss": -42.67392349243164, "global_step": 269190, "epoch": 2224} {"train_loss": -43.405452728271484, "global_step": 269191, "epoch": 2224} {"train_loss": -43.42109298706055, "global_step": 269192, "epoch": 2224} {"train_loss": -43.56319046020508, "global_step": 269193, "epoch": 2224} {"train_loss": -43.4329833984375, "global_step": 269194, "epoch": 2224} {"train_loss": -42.80027389526367, "global_step": 269195, "epoch": 2224} {"train_loss": -43.31276321411133, "global_step": 269196, "epoch": 2224} {"train_loss": -43.969207763671875, "global_step": 269197, "epoch": 2224} {"train_loss": -42.824066162109375, "global_step": 269198, "epoch": 2224} {"train_loss": -42.52338409423828, "global_step": 269199, "epoch": 2224} {"train_loss": -43.05461883544922, "global_step": 269200, "epoch": 2224} {"train_loss": -43.40987014770508, "global_step": 269201, "epoch": 2224} {"train_loss": -43.950801849365234, "global_step": 269202, "epoch": 2224} {"train_loss": -43.53298568725586, "global_step": 269203, "epoch": 2224} {"train_loss": -43.42243576049805, "global_step": 269204, "epoch": 2224} {"train_loss": -44.01411056518555, "global_step": 269205, "epoch": 2224} {"train_loss": -43.26791763305664, "global_step": 269206, "epoch": 2224} {"train_loss": -43.02531814575195, "global_step": 269207, "epoch": 2224} {"train_loss": -43.55662155151367, "global_step": 269208, "epoch": 2224} {"train_loss": -44.164363861083984, "global_step": 269209, "epoch": 2224} {"train_loss": -43.82151412963867, "global_step": 269210, "epoch": 2224} {"train_loss": -43.48917007446289, "global_step": 269211, "epoch": 2224} {"train_loss": -43.18857192993164, "global_step": 269212, "epoch": 2224} {"train_loss": -43.84618377685547, "global_step": 269213, "epoch": 2224} {"train_loss": -43.564056396484375, "global_step": 269214, "epoch": 2224} {"train_loss": -43.67778015136719, "global_step": 269215, "epoch": 2224} {"train_loss": -42.00542449951172, "global_step": 269216, "epoch": 2224} {"train_loss": -39.87117004394531, "global_step": 269217, "epoch": 2224} {"train_loss": -43.03204345703125, "global_step": 269218, "epoch": 2224} {"train_loss": -42.8038330078125, "global_step": 269219, "epoch": 2224} {"train_loss": -42.62177276611328, "global_step": 269220, "epoch": 2224} {"train_loss": -42.88767623901367, "global_step": 269221, "epoch": 2224} {"train_loss": -42.836891174316406, "global_step": 269222, "epoch": 2224} {"train_loss": -42.15791320800781, "global_step": 269223, "epoch": 2224} {"train_loss": -40.98821903260286, "global_step": 269224, "epoch": 2224, "val_loss": 2662600.75} {"train_loss": -43.059810638427734, "global_step": 269225, "epoch": 2225} {"train_loss": -41.37928009033203, "global_step": 269226, "epoch": 2225} {"train_loss": -39.978904724121094, "global_step": 269227, "epoch": 2225} {"train_loss": -42.64266586303711, "global_step": 269228, "epoch": 2225} {"train_loss": -39.021602630615234, "global_step": 269229, "epoch": 2225} {"train_loss": -42.891082763671875, "global_step": 269230, "epoch": 2225} {"train_loss": -42.662715911865234, "global_step": 269231, "epoch": 2225} {"train_loss": -39.017555236816406, "global_step": 269232, "epoch": 2225} {"train_loss": -38.63821792602539, "global_step": 269233, "epoch": 2225} {"train_loss": -39.33816146850586, "global_step": 269234, "epoch": 2225} {"train_loss": -40.13117980957031, "global_step": 269235, "epoch": 2225} {"train_loss": -40.49042892456055, "global_step": 269236, "epoch": 2225} {"train_loss": -41.855308532714844, "global_step": 269237, "epoch": 2225} {"train_loss": -41.52450180053711, "global_step": 269238, "epoch": 2225} {"train_loss": -39.73719787597656, "global_step": 269239, "epoch": 2225} {"train_loss": -39.73328399658203, "global_step": 269240, "epoch": 2225} {"train_loss": -42.26430130004883, "global_step": 269241, "epoch": 2225} {"train_loss": -42.15632629394531, "global_step": 269242, "epoch": 2225} {"train_loss": -41.46108627319336, "global_step": 269243, "epoch": 2225} {"train_loss": -42.63056182861328, "global_step": 269244, "epoch": 2225} {"train_loss": -43.0218620300293, "global_step": 269245, "epoch": 2225} {"train_loss": -42.65617370605469, "global_step": 269246, "epoch": 2225} {"train_loss": -41.117225646972656, "global_step": 269247, "epoch": 2225} {"train_loss": -41.297969818115234, "global_step": 269248, "epoch": 2225} {"train_loss": -40.980709075927734, "global_step": 269249, "epoch": 2225} {"train_loss": -40.966583251953125, "global_step": 269250, "epoch": 2225} {"train_loss": -41.85332107543945, "global_step": 269251, "epoch": 2225} {"train_loss": -41.029762268066406, "global_step": 269252, "epoch": 2225} {"train_loss": -41.89652633666992, "global_step": 269253, "epoch": 2225} {"train_loss": -41.6927604675293, "global_step": 269254, "epoch": 2225} {"train_loss": -41.475128173828125, "global_step": 269255, "epoch": 2225} {"train_loss": -41.830055236816406, "global_step": 269256, "epoch": 2225} {"train_loss": -39.923744201660156, "global_step": 269257, "epoch": 2225} {"train_loss": -40.759395599365234, "global_step": 269258, "epoch": 2225} {"train_loss": -39.56117630004883, "global_step": 269259, "epoch": 2225} {"train_loss": -38.917110443115234, "global_step": 269260, "epoch": 2225} {"train_loss": -38.7718620300293, "global_step": 269261, "epoch": 2225} {"train_loss": -41.3929557800293, "global_step": 269262, "epoch": 2225} {"train_loss": -39.93379211425781, "global_step": 269263, "epoch": 2225} {"train_loss": -41.09333038330078, "global_step": 269264, "epoch": 2225} {"train_loss": -41.35891342163086, "global_step": 269265, "epoch": 2225} {"train_loss": -42.008758544921875, "global_step": 269266, "epoch": 2225} {"train_loss": -41.239234924316406, "global_step": 269267, "epoch": 2225} {"train_loss": -41.88088607788086, "global_step": 269268, "epoch": 2225} {"train_loss": -41.83071517944336, "global_step": 269269, "epoch": 2225} {"train_loss": -42.80369567871094, "global_step": 269270, "epoch": 2225} {"train_loss": -40.98545837402344, "global_step": 269271, "epoch": 2225} {"train_loss": -42.318172454833984, "global_step": 269272, "epoch": 2225} {"train_loss": -41.81513977050781, "global_step": 269273, "epoch": 2225} {"train_loss": -40.81679153442383, "global_step": 269274, "epoch": 2225} {"train_loss": -42.63035202026367, "global_step": 269275, "epoch": 2225} {"train_loss": -41.65256881713867, "global_step": 269276, "epoch": 2225} {"train_loss": -41.92903518676758, "global_step": 269277, "epoch": 2225} {"train_loss": -42.32611846923828, "global_step": 269278, "epoch": 2225} {"train_loss": -42.34426498413086, "global_step": 269279, "epoch": 2225} {"train_loss": -42.13404083251953, "global_step": 269280, "epoch": 2225} {"train_loss": -42.45655822753906, "global_step": 269281, "epoch": 2225} {"train_loss": -41.95164108276367, "global_step": 269282, "epoch": 2225} {"train_loss": -42.96156692504883, "global_step": 269283, "epoch": 2225} {"train_loss": -41.1895866394043, "global_step": 269284, "epoch": 2225} {"train_loss": -40.68060302734375, "global_step": 269285, "epoch": 2225} {"train_loss": -42.62754821777344, "global_step": 269286, "epoch": 2225} {"train_loss": -42.3760871887207, "global_step": 269287, "epoch": 2225} {"train_loss": -41.871944427490234, "global_step": 269288, "epoch": 2225} {"train_loss": -42.68993377685547, "global_step": 269289, "epoch": 2225} {"train_loss": -42.60256576538086, "global_step": 269290, "epoch": 2225} {"train_loss": -42.84220504760742, "global_step": 269291, "epoch": 2225} {"train_loss": -42.72017288208008, "global_step": 269292, "epoch": 2225} {"train_loss": -42.59541702270508, "global_step": 269293, "epoch": 2225} {"train_loss": -42.1525764465332, "global_step": 269294, "epoch": 2225} {"train_loss": -43.41960525512695, "global_step": 269295, "epoch": 2225} {"train_loss": -42.77724838256836, "global_step": 269296, "epoch": 2225} {"train_loss": -42.01301574707031, "global_step": 269297, "epoch": 2225} {"train_loss": -42.64878463745117, "global_step": 269298, "epoch": 2225} {"train_loss": -42.14260482788086, "global_step": 269299, "epoch": 2225} {"train_loss": -42.40709686279297, "global_step": 269300, "epoch": 2225} {"train_loss": -43.03948974609375, "global_step": 269301, "epoch": 2225} {"train_loss": -42.566864013671875, "global_step": 269302, "epoch": 2225} {"train_loss": -42.98811340332031, "global_step": 269303, "epoch": 2225} {"train_loss": -43.42924118041992, "global_step": 269304, "epoch": 2225} {"train_loss": -42.6917724609375, "global_step": 269305, "epoch": 2225} {"train_loss": -42.947120666503906, "global_step": 269306, "epoch": 2225} {"train_loss": -42.903846740722656, "global_step": 269307, "epoch": 2225} {"train_loss": -43.510345458984375, "global_step": 269308, "epoch": 2225} {"train_loss": -43.203365325927734, "global_step": 269309, "epoch": 2225} {"train_loss": -43.404991149902344, "global_step": 269310, "epoch": 2225} {"train_loss": -43.352500915527344, "global_step": 269311, "epoch": 2225} {"train_loss": -43.65298080444336, "global_step": 269312, "epoch": 2225} {"train_loss": -43.85595703125, "global_step": 269313, "epoch": 2225} {"train_loss": -43.014686584472656, "global_step": 269314, "epoch": 2225} {"train_loss": -43.629451751708984, "global_step": 269315, "epoch": 2225} {"train_loss": -44.247772216796875, "global_step": 269316, "epoch": 2225} {"train_loss": -42.62086868286133, "global_step": 269317, "epoch": 2225} {"train_loss": -43.65635299682617, "global_step": 269318, "epoch": 2225} {"train_loss": -44.303245544433594, "global_step": 269319, "epoch": 2225} {"train_loss": -43.506221771240234, "global_step": 269320, "epoch": 2225} {"train_loss": -43.91548538208008, "global_step": 269321, "epoch": 2225} {"train_loss": -43.89357376098633, "global_step": 269322, "epoch": 2225} {"train_loss": -44.163997650146484, "global_step": 269323, "epoch": 2225} {"train_loss": -43.796852111816406, "global_step": 269324, "epoch": 2225} {"train_loss": -43.43022918701172, "global_step": 269325, "epoch": 2225} {"train_loss": -44.188533782958984, "global_step": 269326, "epoch": 2225} {"train_loss": -43.371883392333984, "global_step": 269327, "epoch": 2225} {"train_loss": -43.16201400756836, "global_step": 269328, "epoch": 2225} {"train_loss": -44.11448287963867, "global_step": 269329, "epoch": 2225} {"train_loss": -42.80305862426758, "global_step": 269330, "epoch": 2225} {"train_loss": -42.316226959228516, "global_step": 269331, "epoch": 2225} {"train_loss": -43.74465560913086, "global_step": 269332, "epoch": 2225} {"train_loss": -42.89207077026367, "global_step": 269333, "epoch": 2225} {"train_loss": -41.18793869018555, "global_step": 269334, "epoch": 2225} {"train_loss": -43.7859992980957, "global_step": 269335, "epoch": 2225} {"train_loss": -41.97243118286133, "global_step": 269336, "epoch": 2225} {"train_loss": -43.0262565612793, "global_step": 269337, "epoch": 2225} {"train_loss": -43.78984832763672, "global_step": 269338, "epoch": 2225} {"train_loss": -43.148681640625, "global_step": 269339, "epoch": 2225} {"train_loss": -43.396484375, "global_step": 269340, "epoch": 2225} {"train_loss": -43.64280319213867, "global_step": 269341, "epoch": 2225} {"train_loss": -43.41375732421875, "global_step": 269342, "epoch": 2225} {"train_loss": -43.75924301147461, "global_step": 269343, "epoch": 2225} {"train_loss": -43.77360153198242, "global_step": 269344, "epoch": 2225} {"train_loss": -42.22085117308561, "global_step": 269345, "epoch": 2225, "val_loss": 2679032.75} {"train_loss": -43.6641731262207, "global_step": 269346, "epoch": 2226} {"train_loss": -42.3504524230957, "global_step": 269347, "epoch": 2226} {"train_loss": -42.637821197509766, "global_step": 269348, "epoch": 2226} {"train_loss": -43.49769973754883, "global_step": 269349, "epoch": 2226} {"train_loss": -42.8389778137207, "global_step": 269350, "epoch": 2226} {"train_loss": -43.38652038574219, "global_step": 269351, "epoch": 2226} {"train_loss": -43.62128829956055, "global_step": 269352, "epoch": 2226} {"train_loss": -42.690269470214844, "global_step": 269353, "epoch": 2226} {"train_loss": -42.39692306518555, "global_step": 269354, "epoch": 2226} {"train_loss": -43.5946159362793, "global_step": 269355, "epoch": 2226} {"train_loss": -43.889076232910156, "global_step": 269356, "epoch": 2226} {"train_loss": -42.648311614990234, "global_step": 269357, "epoch": 2226} {"train_loss": -42.97443771362305, "global_step": 269358, "epoch": 2226} {"train_loss": -43.21558380126953, "global_step": 269359, "epoch": 2226} {"train_loss": -43.07587432861328, "global_step": 269360, "epoch": 2226} {"train_loss": -40.91168212890625, "global_step": 269361, "epoch": 2226} {"train_loss": -43.143531799316406, "global_step": 269362, "epoch": 2226} {"train_loss": -42.9232063293457, "global_step": 269363, "epoch": 2226} {"train_loss": -42.69322204589844, "global_step": 269364, "epoch": 2226} {"train_loss": -42.78634262084961, "global_step": 269365, "epoch": 2226} {"train_loss": -43.7530403137207, "global_step": 269366, "epoch": 2226} {"train_loss": -41.630958557128906, "global_step": 269367, "epoch": 2226} {"train_loss": -41.1835823059082, "global_step": 269368, "epoch": 2226} {"train_loss": -43.543663024902344, "global_step": 269369, "epoch": 2226} {"train_loss": -42.07646179199219, "global_step": 269370, "epoch": 2226} {"train_loss": -42.38973617553711, "global_step": 269371, "epoch": 2226} {"train_loss": -43.29218673706055, "global_step": 269372, "epoch": 2226} {"train_loss": -43.2547721862793, "global_step": 269373, "epoch": 2226} {"train_loss": -43.40877914428711, "global_step": 269374, "epoch": 2226} {"train_loss": -43.34017562866211, "global_step": 269375, "epoch": 2226} {"train_loss": -42.91217803955078, "global_step": 269376, "epoch": 2226} {"train_loss": -41.95133590698242, "global_step": 269377, "epoch": 2226} {"train_loss": -42.622432708740234, "global_step": 269378, "epoch": 2226} {"train_loss": -43.581661224365234, "global_step": 269379, "epoch": 2226} {"train_loss": -42.370460510253906, "global_step": 269380, "epoch": 2226} {"train_loss": -42.99129867553711, "global_step": 269381, "epoch": 2226} {"train_loss": -43.4775505065918, "global_step": 269382, "epoch": 2226} {"train_loss": -43.20735549926758, "global_step": 269383, "epoch": 2226} {"train_loss": -43.218528747558594, "global_step": 269384, "epoch": 2226} {"train_loss": -43.45920944213867, "global_step": 269385, "epoch": 2226} {"train_loss": -42.46674728393555, "global_step": 269386, "epoch": 2226} {"train_loss": -42.994171142578125, "global_step": 269387, "epoch": 2226} {"train_loss": -43.51478958129883, "global_step": 269388, "epoch": 2226} {"train_loss": -42.693214416503906, "global_step": 269389, "epoch": 2226} {"train_loss": -42.8555793762207, "global_step": 269390, "epoch": 2226} {"train_loss": -43.84186935424805, "global_step": 269391, "epoch": 2226} {"train_loss": -43.732322692871094, "global_step": 269392, "epoch": 2226} {"train_loss": -43.62498092651367, "global_step": 269393, "epoch": 2226} {"train_loss": -43.5252685546875, "global_step": 269394, "epoch": 2226} {"train_loss": -43.03972244262695, "global_step": 269395, "epoch": 2226} {"train_loss": -43.562713623046875, "global_step": 269396, "epoch": 2226} {"train_loss": -43.42599105834961, "global_step": 269397, "epoch": 2226} {"train_loss": -43.18257522583008, "global_step": 269398, "epoch": 2226} {"train_loss": -42.890235900878906, "global_step": 269399, "epoch": 2226} {"train_loss": -43.69810104370117, "global_step": 269400, "epoch": 2226} {"train_loss": -42.778141021728516, "global_step": 269401, "epoch": 2226} {"train_loss": -43.69085693359375, "global_step": 269402, "epoch": 2226} {"train_loss": -43.54286575317383, "global_step": 269403, "epoch": 2226} {"train_loss": -43.921409606933594, "global_step": 269404, "epoch": 2226} {"train_loss": -43.588958740234375, "global_step": 269405, "epoch": 2226} {"train_loss": -43.86248779296875, "global_step": 269406, "epoch": 2226} {"train_loss": -43.63203811645508, "global_step": 269407, "epoch": 2226} {"train_loss": -43.75263595581055, "global_step": 269408, "epoch": 2226} {"train_loss": -43.7421760559082, "global_step": 269409, "epoch": 2226} {"train_loss": -43.98777770996094, "global_step": 269410, "epoch": 2226} {"train_loss": -43.81718444824219, "global_step": 269411, "epoch": 2226} {"train_loss": -43.74107360839844, "global_step": 269412, "epoch": 2226} {"train_loss": -44.21134948730469, "global_step": 269413, "epoch": 2226} {"train_loss": -43.62334060668945, "global_step": 269414, "epoch": 2226} {"train_loss": -43.415435791015625, "global_step": 269415, "epoch": 2226} {"train_loss": -44.11488723754883, "global_step": 269416, "epoch": 2226} {"train_loss": -43.99881362915039, "global_step": 269417, "epoch": 2226} {"train_loss": -44.50635528564453, "global_step": 269418, "epoch": 2226} {"train_loss": -44.46802520751953, "global_step": 269419, "epoch": 2226} {"train_loss": -44.156002044677734, "global_step": 269420, "epoch": 2226} {"train_loss": -44.3316650390625, "global_step": 269421, "epoch": 2226} {"train_loss": -44.39727020263672, "global_step": 269422, "epoch": 2226} {"train_loss": -44.405548095703125, "global_step": 269423, "epoch": 2226} {"train_loss": -44.50066375732422, "global_step": 269424, "epoch": 2226} {"train_loss": -44.399139404296875, "global_step": 269425, "epoch": 2226} {"train_loss": -44.274776458740234, "global_step": 269426, "epoch": 2226} {"train_loss": -44.109527587890625, "global_step": 269427, "epoch": 2226} {"train_loss": -44.14815902709961, "global_step": 269428, "epoch": 2226} {"train_loss": -43.78768539428711, "global_step": 269429, "epoch": 2226} {"train_loss": -44.12832260131836, "global_step": 269430, "epoch": 2226} {"train_loss": -44.004638671875, "global_step": 269431, "epoch": 2226} {"train_loss": -44.58857345581055, "global_step": 269432, "epoch": 2226} {"train_loss": -44.20380783081055, "global_step": 269433, "epoch": 2226} {"train_loss": -43.17459487915039, "global_step": 269434, "epoch": 2226} {"train_loss": -42.03400802612305, "global_step": 269435, "epoch": 2226} {"train_loss": -43.44424819946289, "global_step": 269436, "epoch": 2226} {"train_loss": -43.4589958190918, "global_step": 269437, "epoch": 2226} {"train_loss": -42.84849166870117, "global_step": 269438, "epoch": 2226} {"train_loss": -43.35500717163086, "global_step": 269439, "epoch": 2226} {"train_loss": -41.731021881103516, "global_step": 269440, "epoch": 2226} {"train_loss": -43.01471710205078, "global_step": 269441, "epoch": 2226} {"train_loss": -43.18315505981445, "global_step": 269442, "epoch": 2226} {"train_loss": -43.7016716003418, "global_step": 269443, "epoch": 2226} {"train_loss": -42.816619873046875, "global_step": 269444, "epoch": 2226} {"train_loss": -42.033058166503906, "global_step": 269445, "epoch": 2226} {"train_loss": -42.03376007080078, "global_step": 269446, "epoch": 2226} {"train_loss": -42.183006286621094, "global_step": 269447, "epoch": 2226} {"train_loss": -42.63700485229492, "global_step": 269448, "epoch": 2226} {"train_loss": -41.38457489013672, "global_step": 269449, "epoch": 2226} {"train_loss": -42.09128189086914, "global_step": 269450, "epoch": 2226} {"train_loss": -42.54983901977539, "global_step": 269451, "epoch": 2226} {"train_loss": -41.63589096069336, "global_step": 269452, "epoch": 2226} {"train_loss": -41.48167037963867, "global_step": 269453, "epoch": 2226} {"train_loss": -42.266845703125, "global_step": 269454, "epoch": 2226} {"train_loss": -42.59027099609375, "global_step": 269455, "epoch": 2226} {"train_loss": -41.86186599731445, "global_step": 269456, "epoch": 2226} {"train_loss": -40.905250549316406, "global_step": 269457, "epoch": 2226} {"train_loss": -42.82469177246094, "global_step": 269458, "epoch": 2226} {"train_loss": -41.855194091796875, "global_step": 269459, "epoch": 2226} {"train_loss": -40.32697677612305, "global_step": 269460, "epoch": 2226} {"train_loss": -42.94469451904297, "global_step": 269461, "epoch": 2226} {"train_loss": -38.967559814453125, "global_step": 269462, "epoch": 2226} {"train_loss": -42.4978141784668, "global_step": 269463, "epoch": 2226} {"train_loss": -35.67271041870117, "global_step": 269464, "epoch": 2226} {"train_loss": -41.61595153808594, "global_step": 269465, "epoch": 2226} {"train_loss": -42.927988052368164, "global_step": 269466, "epoch": 2226, "val_loss": 2772251.25} {"train_loss": -34.074684143066406, "global_step": 269467, "epoch": 2227} {"train_loss": -38.6008415222168, "global_step": 269468, "epoch": 2227} {"train_loss": -32.11392593383789, "global_step": 269469, "epoch": 2227} {"train_loss": -37.49799728393555, "global_step": 269470, "epoch": 2227} {"train_loss": -31.373096466064453, "global_step": 269471, "epoch": 2227} {"train_loss": -38.21976852416992, "global_step": 269472, "epoch": 2227} {"train_loss": -34.52741622924805, "global_step": 269473, "epoch": 2227} {"train_loss": -39.632083892822266, "global_step": 269474, "epoch": 2227} {"train_loss": -34.338619232177734, "global_step": 269475, "epoch": 2227} {"train_loss": -39.58272933959961, "global_step": 269476, "epoch": 2227} {"train_loss": -37.66661834716797, "global_step": 269477, "epoch": 2227} {"train_loss": -38.99922180175781, "global_step": 269478, "epoch": 2227} {"train_loss": -39.830013275146484, "global_step": 269479, "epoch": 2227} {"train_loss": -39.209625244140625, "global_step": 269480, "epoch": 2227} {"train_loss": -39.305145263671875, "global_step": 269481, "epoch": 2227} {"train_loss": -39.33254623413086, "global_step": 269482, "epoch": 2227} {"train_loss": -40.40809631347656, "global_step": 269483, "epoch": 2227} {"train_loss": -41.01430892944336, "global_step": 269484, "epoch": 2227} {"train_loss": -40.073509216308594, "global_step": 269485, "epoch": 2227} {"train_loss": -41.0675163269043, "global_step": 269486, "epoch": 2227} {"train_loss": -41.518638610839844, "global_step": 269487, "epoch": 2227} {"train_loss": -40.92398452758789, "global_step": 269488, "epoch": 2227} {"train_loss": -41.56439971923828, "global_step": 269489, "epoch": 2227} {"train_loss": -40.65823745727539, "global_step": 269490, "epoch": 2227} {"train_loss": -41.180519104003906, "global_step": 269491, "epoch": 2227} {"train_loss": -41.0040283203125, "global_step": 269492, "epoch": 2227} {"train_loss": -41.72382354736328, "global_step": 269493, "epoch": 2227} {"train_loss": -41.836429595947266, "global_step": 269494, "epoch": 2227} {"train_loss": -41.51835632324219, "global_step": 269495, "epoch": 2227} {"train_loss": -42.492950439453125, "global_step": 269496, "epoch": 2227} {"train_loss": -41.92909622192383, "global_step": 269497, "epoch": 2227} {"train_loss": -42.3454704284668, "global_step": 269498, "epoch": 2227} {"train_loss": -42.252742767333984, "global_step": 269499, "epoch": 2227} {"train_loss": -42.626617431640625, "global_step": 269500, "epoch": 2227} {"train_loss": -42.31578826904297, "global_step": 269501, "epoch": 2227} {"train_loss": -42.12295913696289, "global_step": 269502, "epoch": 2227} {"train_loss": -42.59601593017578, "global_step": 269503, "epoch": 2227} {"train_loss": -42.34623718261719, "global_step": 269504, "epoch": 2227} {"train_loss": -42.13457107543945, "global_step": 269505, "epoch": 2227} {"train_loss": -42.73500442504883, "global_step": 269506, "epoch": 2227} {"train_loss": -42.57712936401367, "global_step": 269507, "epoch": 2227} {"train_loss": -42.75095748901367, "global_step": 269508, "epoch": 2227} {"train_loss": -42.77517318725586, "global_step": 269509, "epoch": 2227} {"train_loss": -42.89829635620117, "global_step": 269510, "epoch": 2227} {"train_loss": -43.024166107177734, "global_step": 269511, "epoch": 2227} {"train_loss": -43.128639221191406, "global_step": 269512, "epoch": 2227} {"train_loss": -43.155086517333984, "global_step": 269513, "epoch": 2227} {"train_loss": -43.21934127807617, "global_step": 269514, "epoch": 2227} {"train_loss": -43.3614501953125, "global_step": 269515, "epoch": 2227} {"train_loss": -43.399070739746094, "global_step": 269516, "epoch": 2227} {"train_loss": -43.69033432006836, "global_step": 269517, "epoch": 2227} {"train_loss": -43.17292404174805, "global_step": 269518, "epoch": 2227} {"train_loss": -43.391719818115234, "global_step": 269519, "epoch": 2227} {"train_loss": -43.59944534301758, "global_step": 269520, "epoch": 2227} {"train_loss": -43.522735595703125, "global_step": 269521, "epoch": 2227} {"train_loss": -43.274959564208984, "global_step": 269522, "epoch": 2227} {"train_loss": -43.43208694458008, "global_step": 269523, "epoch": 2227} {"train_loss": -43.66097640991211, "global_step": 269524, "epoch": 2227} {"train_loss": -43.374202728271484, "global_step": 269525, "epoch": 2227} {"train_loss": -43.68569564819336, "global_step": 269526, "epoch": 2227} {"train_loss": -43.4136848449707, "global_step": 269527, "epoch": 2227} {"train_loss": -43.46908187866211, "global_step": 269528, "epoch": 2227} {"train_loss": -44.17892837524414, "global_step": 269529, "epoch": 2227} {"train_loss": -43.14006423950195, "global_step": 269530, "epoch": 2227} {"train_loss": -43.28407669067383, "global_step": 269531, "epoch": 2227} {"train_loss": -43.8388786315918, "global_step": 269532, "epoch": 2227} {"train_loss": -43.62091827392578, "global_step": 269533, "epoch": 2227} {"train_loss": -44.04627227783203, "global_step": 269534, "epoch": 2227} {"train_loss": -43.64921188354492, "global_step": 269535, "epoch": 2227} {"train_loss": -43.754920959472656, "global_step": 269536, "epoch": 2227} {"train_loss": -43.8619270324707, "global_step": 269537, "epoch": 2227} {"train_loss": -44.329036712646484, "global_step": 269538, "epoch": 2227} {"train_loss": -43.89809799194336, "global_step": 269539, "epoch": 2227} {"train_loss": -43.61252975463867, "global_step": 269540, "epoch": 2227} {"train_loss": -44.02568435668945, "global_step": 269541, "epoch": 2227} {"train_loss": -43.85287094116211, "global_step": 269542, "epoch": 2227} {"train_loss": -44.17330551147461, "global_step": 269543, "epoch": 2227} {"train_loss": -44.302486419677734, "global_step": 269544, "epoch": 2227} {"train_loss": -43.824615478515625, "global_step": 269545, "epoch": 2227} {"train_loss": -44.21489715576172, "global_step": 269546, "epoch": 2227} {"train_loss": -44.26301956176758, "global_step": 269547, "epoch": 2227} {"train_loss": -44.28016662597656, "global_step": 269548, "epoch": 2227} {"train_loss": -44.493682861328125, "global_step": 269549, "epoch": 2227} {"train_loss": -43.95846176147461, "global_step": 269550, "epoch": 2227} {"train_loss": -44.23838424682617, "global_step": 269551, "epoch": 2227} {"train_loss": -43.50963592529297, "global_step": 269552, "epoch": 2227} {"train_loss": -44.550907135009766, "global_step": 269553, "epoch": 2227} {"train_loss": -43.98289108276367, "global_step": 269554, "epoch": 2227} {"train_loss": -44.42857360839844, "global_step": 269555, "epoch": 2227} {"train_loss": -44.49855422973633, "global_step": 269556, "epoch": 2227} {"train_loss": -44.05991744995117, "global_step": 269557, "epoch": 2227} {"train_loss": -44.2791748046875, "global_step": 269558, "epoch": 2227} {"train_loss": -43.618831634521484, "global_step": 269559, "epoch": 2227} {"train_loss": -44.49493408203125, "global_step": 269560, "epoch": 2227} {"train_loss": -43.756507873535156, "global_step": 269561, "epoch": 2227} {"train_loss": -44.32589340209961, "global_step": 269562, "epoch": 2227} {"train_loss": -44.67092514038086, "global_step": 269563, "epoch": 2227} {"train_loss": -43.26459503173828, "global_step": 269564, "epoch": 2227} {"train_loss": -43.14309310913086, "global_step": 269565, "epoch": 2227} {"train_loss": -43.16898727416992, "global_step": 269566, "epoch": 2227} {"train_loss": -42.92139434814453, "global_step": 269567, "epoch": 2227} {"train_loss": -42.53253173828125, "global_step": 269568, "epoch": 2227} {"train_loss": -41.91060256958008, "global_step": 269569, "epoch": 2227} {"train_loss": -41.697357177734375, "global_step": 269570, "epoch": 2227} {"train_loss": -42.69123458862305, "global_step": 269571, "epoch": 2227} {"train_loss": -43.206504821777344, "global_step": 269572, "epoch": 2227} {"train_loss": -44.02871322631836, "global_step": 269573, "epoch": 2227} {"train_loss": -43.72032928466797, "global_step": 269574, "epoch": 2227} {"train_loss": -43.75603103637695, "global_step": 269575, "epoch": 2227} {"train_loss": -43.18416976928711, "global_step": 269576, "epoch": 2227} {"train_loss": -44.192108154296875, "global_step": 269577, "epoch": 2227} {"train_loss": -41.410701751708984, "global_step": 269578, "epoch": 2227} {"train_loss": -40.1255989074707, "global_step": 269579, "epoch": 2227} {"train_loss": -42.29960250854492, "global_step": 269580, "epoch": 2227} {"train_loss": -43.524139404296875, "global_step": 269581, "epoch": 2227} {"train_loss": -43.102352142333984, "global_step": 269582, "epoch": 2227} {"train_loss": -42.412593841552734, "global_step": 269583, "epoch": 2227} {"train_loss": -43.572967529296875, "global_step": 269584, "epoch": 2227} {"train_loss": -42.8416748046875, "global_step": 269585, "epoch": 2227} {"train_loss": -42.59232711791992, "global_step": 269586, "epoch": 2227} {"train_loss": -42.24392161093468, "global_step": 269587, "epoch": 2227, "val_loss": 2638336.25} {"train_loss": -43.73808670043945, "global_step": 269588, "epoch": 2228} {"train_loss": -43.43948745727539, "global_step": 269589, "epoch": 2228} {"train_loss": -43.758079528808594, "global_step": 269590, "epoch": 2228} {"train_loss": -43.74873733520508, "global_step": 269591, "epoch": 2228} {"train_loss": -41.906288146972656, "global_step": 269592, "epoch": 2228} {"train_loss": -43.43426513671875, "global_step": 269593, "epoch": 2228} {"train_loss": -43.9923095703125, "global_step": 269594, "epoch": 2228} {"train_loss": -42.71256637573242, "global_step": 269595, "epoch": 2228} {"train_loss": -43.57236862182617, "global_step": 269596, "epoch": 2228} {"train_loss": -43.79640197753906, "global_step": 269597, "epoch": 2228} {"train_loss": -43.65228271484375, "global_step": 269598, "epoch": 2228} {"train_loss": -44.05580520629883, "global_step": 269599, "epoch": 2228} {"train_loss": -43.71284103393555, "global_step": 269600, "epoch": 2228} {"train_loss": -43.65823745727539, "global_step": 269601, "epoch": 2228} {"train_loss": -43.79104232788086, "global_step": 269602, "epoch": 2228} {"train_loss": -43.342464447021484, "global_step": 269603, "epoch": 2228} {"train_loss": -43.73487091064453, "global_step": 269604, "epoch": 2228} {"train_loss": -43.33200454711914, "global_step": 269605, "epoch": 2228} {"train_loss": -44.208900451660156, "global_step": 269606, "epoch": 2228} {"train_loss": -42.5803337097168, "global_step": 269607, "epoch": 2228} {"train_loss": -41.56590270996094, "global_step": 269608, "epoch": 2228} {"train_loss": -43.89780807495117, "global_step": 269609, "epoch": 2228} {"train_loss": -41.71674728393555, "global_step": 269610, "epoch": 2228} {"train_loss": -42.257652282714844, "global_step": 269611, "epoch": 2228} {"train_loss": -43.08602523803711, "global_step": 269612, "epoch": 2228} {"train_loss": -41.546913146972656, "global_step": 269613, "epoch": 2228} {"train_loss": -42.79122543334961, "global_step": 269614, "epoch": 2228} {"train_loss": -40.832923889160156, "global_step": 269615, "epoch": 2228} {"train_loss": -43.168941497802734, "global_step": 269616, "epoch": 2228} {"train_loss": -43.22754669189453, "global_step": 269617, "epoch": 2228} {"train_loss": -41.14776611328125, "global_step": 269618, "epoch": 2228} {"train_loss": -42.82686996459961, "global_step": 269619, "epoch": 2228} {"train_loss": -43.10708999633789, "global_step": 269620, "epoch": 2228} {"train_loss": -40.00324630737305, "global_step": 269621, "epoch": 2228} {"train_loss": -38.5763053894043, "global_step": 269622, "epoch": 2228} {"train_loss": -41.217262268066406, "global_step": 269623, "epoch": 2228} {"train_loss": -36.981101989746094, "global_step": 269624, "epoch": 2228} {"train_loss": -38.7154655456543, "global_step": 269625, "epoch": 2228} {"train_loss": -35.46770095825195, "global_step": 269626, "epoch": 2228} {"train_loss": -39.54302978515625, "global_step": 269627, "epoch": 2228} {"train_loss": -34.292110443115234, "global_step": 269628, "epoch": 2228} {"train_loss": -37.38550567626953, "global_step": 269629, "epoch": 2228} {"train_loss": -38.809478759765625, "global_step": 269630, "epoch": 2228} {"train_loss": -37.24178695678711, "global_step": 269631, "epoch": 2228} {"train_loss": -37.98039627075195, "global_step": 269632, "epoch": 2228} {"train_loss": -38.08001708984375, "global_step": 269633, "epoch": 2228} {"train_loss": -38.62484359741211, "global_step": 269634, "epoch": 2228} {"train_loss": -40.54560089111328, "global_step": 269635, "epoch": 2228} {"train_loss": -40.453125, "global_step": 269636, "epoch": 2228} {"train_loss": -41.27177810668945, "global_step": 269637, "epoch": 2228} {"train_loss": -41.37981033325195, "global_step": 269638, "epoch": 2228} {"train_loss": -41.239471435546875, "global_step": 269639, "epoch": 2228} {"train_loss": -41.25630569458008, "global_step": 269640, "epoch": 2228} {"train_loss": -40.52191162109375, "global_step": 269641, "epoch": 2228} {"train_loss": -40.82532501220703, "global_step": 269642, "epoch": 2228} {"train_loss": -41.7816276550293, "global_step": 269643, "epoch": 2228} {"train_loss": -40.46963119506836, "global_step": 269644, "epoch": 2228} {"train_loss": -42.64392852783203, "global_step": 269645, "epoch": 2228} {"train_loss": -40.36697006225586, "global_step": 269646, "epoch": 2228} {"train_loss": -41.93512725830078, "global_step": 269647, "epoch": 2228} {"train_loss": -41.11942672729492, "global_step": 269648, "epoch": 2228} {"train_loss": -43.157814025878906, "global_step": 269649, "epoch": 2228} {"train_loss": -40.82078170776367, "global_step": 269650, "epoch": 2228} {"train_loss": -42.62954330444336, "global_step": 269651, "epoch": 2228} {"train_loss": -41.919654846191406, "global_step": 269652, "epoch": 2228} {"train_loss": -42.55992889404297, "global_step": 269653, "epoch": 2228} {"train_loss": -41.822509765625, "global_step": 269654, "epoch": 2228} {"train_loss": -42.89082336425781, "global_step": 269655, "epoch": 2228} {"train_loss": -42.939056396484375, "global_step": 269656, "epoch": 2228} {"train_loss": -43.17673873901367, "global_step": 269657, "epoch": 2228} {"train_loss": -42.6209716796875, "global_step": 269658, "epoch": 2228} {"train_loss": -42.99528884887695, "global_step": 269659, "epoch": 2228} {"train_loss": -43.31321334838867, "global_step": 269660, "epoch": 2228} {"train_loss": -41.9002571105957, "global_step": 269661, "epoch": 2228} {"train_loss": -42.85920333862305, "global_step": 269662, "epoch": 2228} {"train_loss": -41.97370529174805, "global_step": 269663, "epoch": 2228} {"train_loss": -43.25959014892578, "global_step": 269664, "epoch": 2228} {"train_loss": -43.19270706176758, "global_step": 269665, "epoch": 2228} {"train_loss": -43.09253692626953, "global_step": 269666, "epoch": 2228} {"train_loss": -41.33481979370117, "global_step": 269667, "epoch": 2228} {"train_loss": -43.06572723388672, "global_step": 269668, "epoch": 2228} {"train_loss": -43.32589340209961, "global_step": 269669, "epoch": 2228} {"train_loss": -43.28391647338867, "global_step": 269670, "epoch": 2228} {"train_loss": -43.252410888671875, "global_step": 269671, "epoch": 2228} {"train_loss": -42.05523681640625, "global_step": 269672, "epoch": 2228} {"train_loss": -40.44630432128906, "global_step": 269673, "epoch": 2228} {"train_loss": -42.22710037231445, "global_step": 269674, "epoch": 2228} {"train_loss": -40.701595306396484, "global_step": 269675, "epoch": 2228} {"train_loss": -40.86140060424805, "global_step": 269676, "epoch": 2228} {"train_loss": -41.46455001831055, "global_step": 269677, "epoch": 2228} {"train_loss": -42.73208236694336, "global_step": 269678, "epoch": 2228} {"train_loss": -35.506011962890625, "global_step": 269679, "epoch": 2228} {"train_loss": -39.229164123535156, "global_step": 269680, "epoch": 2228} {"train_loss": -42.3415412902832, "global_step": 269681, "epoch": 2228} {"train_loss": -42.40006637573242, "global_step": 269682, "epoch": 2228} {"train_loss": -38.20158767700195, "global_step": 269683, "epoch": 2228} {"train_loss": -40.7224235534668, "global_step": 269684, "epoch": 2228} {"train_loss": -42.6193962097168, "global_step": 269685, "epoch": 2228} {"train_loss": -42.31716537475586, "global_step": 269686, "epoch": 2228} {"train_loss": -39.602840423583984, "global_step": 269687, "epoch": 2228} {"train_loss": -42.25936508178711, "global_step": 269688, "epoch": 2228} {"train_loss": -41.6411247253418, "global_step": 269689, "epoch": 2228} {"train_loss": -42.91660690307617, "global_step": 269690, "epoch": 2228} {"train_loss": -37.670772552490234, "global_step": 269691, "epoch": 2228} {"train_loss": -42.708106994628906, "global_step": 269692, "epoch": 2228} {"train_loss": -42.031898498535156, "global_step": 269693, "epoch": 2228} {"train_loss": -42.25128936767578, "global_step": 269694, "epoch": 2228} {"train_loss": -41.58362579345703, "global_step": 269695, "epoch": 2228} {"train_loss": -40.44021224975586, "global_step": 269696, "epoch": 2228} {"train_loss": -39.38724136352539, "global_step": 269697, "epoch": 2228} {"train_loss": -42.819122314453125, "global_step": 269698, "epoch": 2228} {"train_loss": -41.12350082397461, "global_step": 269699, "epoch": 2228} {"train_loss": -39.810951232910156, "global_step": 269700, "epoch": 2228} {"train_loss": -38.04877853393555, "global_step": 269701, "epoch": 2228} {"train_loss": -42.613365173339844, "global_step": 269702, "epoch": 2228} {"train_loss": -41.53343200683594, "global_step": 269703, "epoch": 2228} {"train_loss": -42.6147346496582, "global_step": 269704, "epoch": 2228} {"train_loss": -42.778297424316406, "global_step": 269705, "epoch": 2228} {"train_loss": -41.258296966552734, "global_step": 269706, "epoch": 2228} {"train_loss": -40.36649703979492, "global_step": 269707, "epoch": 2228} {"train_loss": -41.59629096669599, "global_step": 269708, "epoch": 2228, "val_loss": 2565530.0} {"train_loss": -42.409297943115234, "global_step": 269709, "epoch": 2229} {"train_loss": -42.97287368774414, "global_step": 269710, "epoch": 2229} {"train_loss": -41.30073928833008, "global_step": 269711, "epoch": 2229} {"train_loss": -43.088905334472656, "global_step": 269712, "epoch": 2229} {"train_loss": -42.79902267456055, "global_step": 269713, "epoch": 2229} {"train_loss": -42.89357376098633, "global_step": 269714, "epoch": 2229} {"train_loss": -42.356536865234375, "global_step": 269715, "epoch": 2229} {"train_loss": -42.50119400024414, "global_step": 269716, "epoch": 2229} {"train_loss": -41.11869430541992, "global_step": 269717, "epoch": 2229} {"train_loss": -39.76759338378906, "global_step": 269718, "epoch": 2229} {"train_loss": -42.03890609741211, "global_step": 269719, "epoch": 2229} {"train_loss": -42.08584213256836, "global_step": 269720, "epoch": 2229} {"train_loss": -43.32630157470703, "global_step": 269721, "epoch": 2229} {"train_loss": -42.276222229003906, "global_step": 269722, "epoch": 2229} {"train_loss": -43.08835220336914, "global_step": 269723, "epoch": 2229} {"train_loss": -42.415931701660156, "global_step": 269724, "epoch": 2229} {"train_loss": -43.4249153137207, "global_step": 269725, "epoch": 2229} {"train_loss": -40.55807113647461, "global_step": 269726, "epoch": 2229} {"train_loss": -42.754127502441406, "global_step": 269727, "epoch": 2229} {"train_loss": -42.856868743896484, "global_step": 269728, "epoch": 2229} {"train_loss": -42.57308578491211, "global_step": 269729, "epoch": 2229} {"train_loss": -42.95432662963867, "global_step": 269730, "epoch": 2229} {"train_loss": -41.74248504638672, "global_step": 269731, "epoch": 2229} {"train_loss": -42.40200424194336, "global_step": 269732, "epoch": 2229} {"train_loss": -42.35178756713867, "global_step": 269733, "epoch": 2229} {"train_loss": -42.10302734375, "global_step": 269734, "epoch": 2229} {"train_loss": -41.0283317565918, "global_step": 269735, "epoch": 2229} {"train_loss": -41.8183708190918, "global_step": 269736, "epoch": 2229} {"train_loss": -42.495487213134766, "global_step": 269737, "epoch": 2229} {"train_loss": -43.26139450073242, "global_step": 269738, "epoch": 2229} {"train_loss": -42.74496078491211, "global_step": 269739, "epoch": 2229} {"train_loss": -43.59588623046875, "global_step": 269740, "epoch": 2229} {"train_loss": -42.017333984375, "global_step": 269741, "epoch": 2229} {"train_loss": -42.899818420410156, "global_step": 269742, "epoch": 2229} {"train_loss": -42.454097747802734, "global_step": 269743, "epoch": 2229} {"train_loss": -43.66473388671875, "global_step": 269744, "epoch": 2229} {"train_loss": -43.13744354248047, "global_step": 269745, "epoch": 2229} {"train_loss": -43.12247085571289, "global_step": 269746, "epoch": 2229} {"train_loss": -42.98763656616211, "global_step": 269747, "epoch": 2229} {"train_loss": -43.370643615722656, "global_step": 269748, "epoch": 2229} {"train_loss": -42.17032241821289, "global_step": 269749, "epoch": 2229} {"train_loss": -43.52626419067383, "global_step": 269750, "epoch": 2229} {"train_loss": -43.95048141479492, "global_step": 269751, "epoch": 2229} {"train_loss": -43.06452560424805, "global_step": 269752, "epoch": 2229} {"train_loss": -41.89801788330078, "global_step": 269753, "epoch": 2229} {"train_loss": -43.378414154052734, "global_step": 269754, "epoch": 2229} {"train_loss": -42.83278274536133, "global_step": 269755, "epoch": 2229} {"train_loss": -43.03712463378906, "global_step": 269756, "epoch": 2229} {"train_loss": -43.22465133666992, "global_step": 269757, "epoch": 2229} {"train_loss": -43.41232681274414, "global_step": 269758, "epoch": 2229} {"train_loss": -43.72538375854492, "global_step": 269759, "epoch": 2229} {"train_loss": -43.245208740234375, "global_step": 269760, "epoch": 2229} {"train_loss": -43.308223724365234, "global_step": 269761, "epoch": 2229} {"train_loss": -42.89280319213867, "global_step": 269762, "epoch": 2229} {"train_loss": -42.68107223510742, "global_step": 269763, "epoch": 2229} {"train_loss": -42.77406692504883, "global_step": 269764, "epoch": 2229} {"train_loss": -43.26633071899414, "global_step": 269765, "epoch": 2229} {"train_loss": -42.87637710571289, "global_step": 269766, "epoch": 2229} {"train_loss": -43.118621826171875, "global_step": 269767, "epoch": 2229} {"train_loss": -41.56307601928711, "global_step": 269768, "epoch": 2229} {"train_loss": -40.30461883544922, "global_step": 269769, "epoch": 2229} {"train_loss": -42.097835540771484, "global_step": 269770, "epoch": 2229} {"train_loss": -42.535945892333984, "global_step": 269771, "epoch": 2229} {"train_loss": -43.0581169128418, "global_step": 269772, "epoch": 2229} {"train_loss": -43.06707000732422, "global_step": 269773, "epoch": 2229} {"train_loss": -41.65659713745117, "global_step": 269774, "epoch": 2229} {"train_loss": -43.78879928588867, "global_step": 269775, "epoch": 2229} {"train_loss": -41.96878433227539, "global_step": 269776, "epoch": 2229} {"train_loss": -42.73818588256836, "global_step": 269777, "epoch": 2229} {"train_loss": -42.3940544128418, "global_step": 269778, "epoch": 2229} {"train_loss": -43.46023178100586, "global_step": 269779, "epoch": 2229} {"train_loss": -43.23147201538086, "global_step": 269780, "epoch": 2229} {"train_loss": -42.59394454956055, "global_step": 269781, "epoch": 2229} {"train_loss": -43.20368194580078, "global_step": 269782, "epoch": 2229} {"train_loss": -42.336238861083984, "global_step": 269783, "epoch": 2229} {"train_loss": -41.95985794067383, "global_step": 269784, "epoch": 2229} {"train_loss": -43.52224349975586, "global_step": 269785, "epoch": 2229} {"train_loss": -43.430885314941406, "global_step": 269786, "epoch": 2229} {"train_loss": -42.57102584838867, "global_step": 269787, "epoch": 2229} {"train_loss": -43.75594711303711, "global_step": 269788, "epoch": 2229} {"train_loss": -41.616329193115234, "global_step": 269789, "epoch": 2229} {"train_loss": -41.786163330078125, "global_step": 269790, "epoch": 2229} {"train_loss": -42.96519088745117, "global_step": 269791, "epoch": 2229} {"train_loss": -43.15482711791992, "global_step": 269792, "epoch": 2229} {"train_loss": -42.58301544189453, "global_step": 269793, "epoch": 2229} {"train_loss": -43.73257064819336, "global_step": 269794, "epoch": 2229} {"train_loss": -42.956478118896484, "global_step": 269795, "epoch": 2229} {"train_loss": -42.60749435424805, "global_step": 269796, "epoch": 2229} {"train_loss": -43.111446380615234, "global_step": 269797, "epoch": 2229} {"train_loss": -43.263763427734375, "global_step": 269798, "epoch": 2229} {"train_loss": -40.9277229309082, "global_step": 269799, "epoch": 2229} {"train_loss": -43.48870849609375, "global_step": 269800, "epoch": 2229} {"train_loss": -42.43489456176758, "global_step": 269801, "epoch": 2229} {"train_loss": -40.79691696166992, "global_step": 269802, "epoch": 2229} {"train_loss": -42.669921875, "global_step": 269803, "epoch": 2229} {"train_loss": -41.70084762573242, "global_step": 269804, "epoch": 2229} {"train_loss": -40.52153015136719, "global_step": 269805, "epoch": 2229} {"train_loss": -43.22157287597656, "global_step": 269806, "epoch": 2229} {"train_loss": -38.74839401245117, "global_step": 269807, "epoch": 2229} {"train_loss": -40.379215240478516, "global_step": 269808, "epoch": 2229} {"train_loss": -40.06888961791992, "global_step": 269809, "epoch": 2229} {"train_loss": -41.92910385131836, "global_step": 269810, "epoch": 2229} {"train_loss": -40.77166748046875, "global_step": 269811, "epoch": 2229} {"train_loss": -40.28314971923828, "global_step": 269812, "epoch": 2229} {"train_loss": -41.78803634643555, "global_step": 269813, "epoch": 2229} {"train_loss": -38.92085647583008, "global_step": 269814, "epoch": 2229} {"train_loss": -39.88644027709961, "global_step": 269815, "epoch": 2229} {"train_loss": -37.65804672241211, "global_step": 269816, "epoch": 2229} {"train_loss": -36.5908317565918, "global_step": 269817, "epoch": 2229} {"train_loss": -38.23661422729492, "global_step": 269818, "epoch": 2229} {"train_loss": -39.88482666015625, "global_step": 269819, "epoch": 2229} {"train_loss": -38.05691146850586, "global_step": 269820, "epoch": 2229} {"train_loss": -37.61751937866211, "global_step": 269821, "epoch": 2229} {"train_loss": -39.401058197021484, "global_step": 269822, "epoch": 2229} {"train_loss": -40.322296142578125, "global_step": 269823, "epoch": 2229} {"train_loss": -41.83475875854492, "global_step": 269824, "epoch": 2229} {"train_loss": -40.44745635986328, "global_step": 269825, "epoch": 2229} {"train_loss": -41.97480773925781, "global_step": 269826, "epoch": 2229} {"train_loss": -41.45876693725586, "global_step": 269827, "epoch": 2229} {"train_loss": -42.48771667480469, "global_step": 269828, "epoch": 2229} {"train_loss": -42.115993152965196, "global_step": 269829, "epoch": 2229, "val_loss": 2658537.0} {"train_loss": -42.6451416015625, "global_step": 269830, "epoch": 2230} {"train_loss": -41.62714767456055, "global_step": 269831, "epoch": 2230} {"train_loss": -42.6267204284668, "global_step": 269832, "epoch": 2230} {"train_loss": -42.48916244506836, "global_step": 269833, "epoch": 2230} {"train_loss": -42.39656448364258, "global_step": 269834, "epoch": 2230} {"train_loss": -42.643680572509766, "global_step": 269835, "epoch": 2230} {"train_loss": -42.62834548950195, "global_step": 269836, "epoch": 2230} {"train_loss": -42.69044494628906, "global_step": 269837, "epoch": 2230} {"train_loss": -42.08333206176758, "global_step": 269838, "epoch": 2230} {"train_loss": -43.496395111083984, "global_step": 269839, "epoch": 2230} {"train_loss": -42.14439010620117, "global_step": 269840, "epoch": 2230} {"train_loss": -42.50641632080078, "global_step": 269841, "epoch": 2230} {"train_loss": -42.8070182800293, "global_step": 269842, "epoch": 2230} {"train_loss": -43.40370559692383, "global_step": 269843, "epoch": 2230} {"train_loss": -42.89016342163086, "global_step": 269844, "epoch": 2230} {"train_loss": -42.63079071044922, "global_step": 269845, "epoch": 2230} {"train_loss": -43.0167350769043, "global_step": 269846, "epoch": 2230} {"train_loss": -42.61750411987305, "global_step": 269847, "epoch": 2230} {"train_loss": -43.4498176574707, "global_step": 269848, "epoch": 2230} {"train_loss": -43.25541305541992, "global_step": 269849, "epoch": 2230} {"train_loss": -43.259029388427734, "global_step": 269850, "epoch": 2230} {"train_loss": -43.59244155883789, "global_step": 269851, "epoch": 2230} {"train_loss": -43.5340576171875, "global_step": 269852, "epoch": 2230} {"train_loss": -43.33985137939453, "global_step": 269853, "epoch": 2230} {"train_loss": -42.95517349243164, "global_step": 269854, "epoch": 2230} {"train_loss": -43.71052169799805, "global_step": 269855, "epoch": 2230} {"train_loss": -42.64315414428711, "global_step": 269856, "epoch": 2230} {"train_loss": -42.0872802734375, "global_step": 269857, "epoch": 2230} {"train_loss": -41.03651809692383, "global_step": 269858, "epoch": 2230} {"train_loss": -42.240081787109375, "global_step": 269859, "epoch": 2230} {"train_loss": -43.50919723510742, "global_step": 269860, "epoch": 2230} {"train_loss": -39.81637191772461, "global_step": 269861, "epoch": 2230} {"train_loss": -37.855995178222656, "global_step": 269862, "epoch": 2230} {"train_loss": -41.167537689208984, "global_step": 269863, "epoch": 2230} {"train_loss": -35.004695892333984, "global_step": 269864, "epoch": 2230} {"train_loss": -35.22733688354492, "global_step": 269865, "epoch": 2230} {"train_loss": -34.04654312133789, "global_step": 269866, "epoch": 2230} {"train_loss": -37.292701721191406, "global_step": 269867, "epoch": 2230} {"train_loss": -36.14875411987305, "global_step": 269868, "epoch": 2230} {"train_loss": -36.7539176940918, "global_step": 269869, "epoch": 2230} {"train_loss": -36.7264404296875, "global_step": 269870, "epoch": 2230} {"train_loss": -36.788063049316406, "global_step": 269871, "epoch": 2230} {"train_loss": -37.6280632019043, "global_step": 269872, "epoch": 2230} {"train_loss": -35.86833190917969, "global_step": 269873, "epoch": 2230} {"train_loss": -36.68892288208008, "global_step": 269874, "epoch": 2230} {"train_loss": -36.02852249145508, "global_step": 269875, "epoch": 2230} {"train_loss": -36.7669792175293, "global_step": 269876, "epoch": 2230} {"train_loss": -37.21798324584961, "global_step": 269877, "epoch": 2230} {"train_loss": -37.06419372558594, "global_step": 269878, "epoch": 2230} {"train_loss": -37.61407470703125, "global_step": 269879, "epoch": 2230} {"train_loss": -37.85505294799805, "global_step": 269880, "epoch": 2230} {"train_loss": -37.700565338134766, "global_step": 269881, "epoch": 2230} {"train_loss": -37.581233978271484, "global_step": 269882, "epoch": 2230} {"train_loss": -37.696285247802734, "global_step": 269883, "epoch": 2230} {"train_loss": -37.563514709472656, "global_step": 269884, "epoch": 2230} {"train_loss": -37.00447463989258, "global_step": 269885, "epoch": 2230} {"train_loss": -38.48722457885742, "global_step": 269886, "epoch": 2230} {"train_loss": -38.443580627441406, "global_step": 269887, "epoch": 2230} {"train_loss": -37.997772216796875, "global_step": 269888, "epoch": 2230} {"train_loss": -38.0743522644043, "global_step": 269889, "epoch": 2230} {"train_loss": -37.57699966430664, "global_step": 269890, "epoch": 2230} {"train_loss": -38.32146453857422, "global_step": 269891, "epoch": 2230} {"train_loss": -38.302852630615234, "global_step": 269892, "epoch": 2230} {"train_loss": -38.777225494384766, "global_step": 269893, "epoch": 2230} {"train_loss": -38.69503402709961, "global_step": 269894, "epoch": 2230} {"train_loss": -39.50846481323242, "global_step": 269895, "epoch": 2230} {"train_loss": -38.893123626708984, "global_step": 269896, "epoch": 2230} {"train_loss": -39.22697067260742, "global_step": 269897, "epoch": 2230} {"train_loss": -39.43658447265625, "global_step": 269898, "epoch": 2230} {"train_loss": -39.38645553588867, "global_step": 269899, "epoch": 2230} {"train_loss": -38.57430648803711, "global_step": 269900, "epoch": 2230} {"train_loss": -38.690650939941406, "global_step": 269901, "epoch": 2230} {"train_loss": -38.89731979370117, "global_step": 269902, "epoch": 2230} {"train_loss": -38.785823822021484, "global_step": 269903, "epoch": 2230} {"train_loss": -39.52948760986328, "global_step": 269904, "epoch": 2230} {"train_loss": -39.49616622924805, "global_step": 269905, "epoch": 2230} {"train_loss": -39.42818069458008, "global_step": 269906, "epoch": 2230} {"train_loss": -39.54219436645508, "global_step": 269907, "epoch": 2230} {"train_loss": -39.0699577331543, "global_step": 269908, "epoch": 2230} {"train_loss": -39.34132385253906, "global_step": 269909, "epoch": 2230} {"train_loss": -40.354759216308594, "global_step": 269910, "epoch": 2230} {"train_loss": -40.21869659423828, "global_step": 269911, "epoch": 2230} {"train_loss": -39.709991455078125, "global_step": 269912, "epoch": 2230} {"train_loss": -40.20135498046875, "global_step": 269913, "epoch": 2230} {"train_loss": -39.599952697753906, "global_step": 269914, "epoch": 2230} {"train_loss": -39.8486328125, "global_step": 269915, "epoch": 2230} {"train_loss": -39.8090705871582, "global_step": 269916, "epoch": 2230} {"train_loss": -39.62327194213867, "global_step": 269917, "epoch": 2230} {"train_loss": -39.25126266479492, "global_step": 269918, "epoch": 2230} {"train_loss": -40.0361442565918, "global_step": 269919, "epoch": 2230} {"train_loss": -39.636775970458984, "global_step": 269920, "epoch": 2230} {"train_loss": -40.2275390625, "global_step": 269921, "epoch": 2230} {"train_loss": -39.95235061645508, "global_step": 269922, "epoch": 2230} {"train_loss": -40.57294464111328, "global_step": 269923, "epoch": 2230} {"train_loss": -40.437862396240234, "global_step": 269924, "epoch": 2230} {"train_loss": -39.9283561706543, "global_step": 269925, "epoch": 2230} {"train_loss": -40.16795349121094, "global_step": 269926, "epoch": 2230} {"train_loss": -40.785926818847656, "global_step": 269927, "epoch": 2230} {"train_loss": -40.14228057861328, "global_step": 269928, "epoch": 2230} {"train_loss": -40.10483932495117, "global_step": 269929, "epoch": 2230} {"train_loss": -38.99692916870117, "global_step": 269930, "epoch": 2230} {"train_loss": -39.1670036315918, "global_step": 269931, "epoch": 2230} {"train_loss": -40.24009323120117, "global_step": 269932, "epoch": 2230} {"train_loss": -40.939998626708984, "global_step": 269933, "epoch": 2230} {"train_loss": -39.74760818481445, "global_step": 269934, "epoch": 2230} {"train_loss": -40.436885833740234, "global_step": 269935, "epoch": 2230} {"train_loss": -40.603084564208984, "global_step": 269936, "epoch": 2230} {"train_loss": -40.61581039428711, "global_step": 269937, "epoch": 2230} {"train_loss": -41.02394104003906, "global_step": 269938, "epoch": 2230} {"train_loss": -40.34665298461914, "global_step": 269939, "epoch": 2230} {"train_loss": -39.470855712890625, "global_step": 269940, "epoch": 2230} {"train_loss": -39.37843322753906, "global_step": 269941, "epoch": 2230} {"train_loss": -39.54289627075195, "global_step": 269942, "epoch": 2230} {"train_loss": -40.0535774230957, "global_step": 269943, "epoch": 2230} {"train_loss": -39.76552963256836, "global_step": 269944, "epoch": 2230} {"train_loss": -40.473628997802734, "global_step": 269945, "epoch": 2230} {"train_loss": -39.87156295776367, "global_step": 269946, "epoch": 2230} {"train_loss": -38.96102523803711, "global_step": 269947, "epoch": 2230} {"train_loss": -40.386627197265625, "global_step": 269948, "epoch": 2230} {"train_loss": -40.74576950073242, "global_step": 269949, "epoch": 2230} {"train_loss": -39.88581305890044, "global_step": 269950, "epoch": 2230, "val_loss": 2671901.75} {"train_loss": -39.87842559814453, "global_step": 269951, "epoch": 2231} {"train_loss": -40.151466369628906, "global_step": 269952, "epoch": 2231} {"train_loss": -39.93800354003906, "global_step": 269953, "epoch": 2231} {"train_loss": -40.75641632080078, "global_step": 269954, "epoch": 2231} {"train_loss": -41.10387420654297, "global_step": 269955, "epoch": 2231} {"train_loss": -41.17435836791992, "global_step": 269956, "epoch": 2231} {"train_loss": -40.88932418823242, "global_step": 269957, "epoch": 2231} {"train_loss": -40.10687255859375, "global_step": 269958, "epoch": 2231} {"train_loss": -39.91539001464844, "global_step": 269959, "epoch": 2231} {"train_loss": -38.232486724853516, "global_step": 269960, "epoch": 2231} {"train_loss": -39.52165603637695, "global_step": 269961, "epoch": 2231} {"train_loss": -41.452178955078125, "global_step": 269962, "epoch": 2231} {"train_loss": -39.92168426513672, "global_step": 269963, "epoch": 2231} {"train_loss": -40.854366302490234, "global_step": 269964, "epoch": 2231} {"train_loss": -40.617576599121094, "global_step": 269965, "epoch": 2231} {"train_loss": -39.96546173095703, "global_step": 269966, "epoch": 2231} {"train_loss": -39.92454147338867, "global_step": 269967, "epoch": 2231} {"train_loss": -41.13978576660156, "global_step": 269968, "epoch": 2231} {"train_loss": -40.46735763549805, "global_step": 269969, "epoch": 2231} {"train_loss": -40.719783782958984, "global_step": 269970, "epoch": 2231} {"train_loss": -41.2676887512207, "global_step": 269971, "epoch": 2231} {"train_loss": -41.25858688354492, "global_step": 269972, "epoch": 2231} {"train_loss": -41.347984313964844, "global_step": 269973, "epoch": 2231} {"train_loss": -40.5391960144043, "global_step": 269974, "epoch": 2231} {"train_loss": -40.85982131958008, "global_step": 269975, "epoch": 2231} {"train_loss": -41.06635284423828, "global_step": 269976, "epoch": 2231} {"train_loss": -40.66609573364258, "global_step": 269977, "epoch": 2231} {"train_loss": -40.187015533447266, "global_step": 269978, "epoch": 2231} {"train_loss": -41.38651657104492, "global_step": 269979, "epoch": 2231} {"train_loss": -40.00197982788086, "global_step": 269980, "epoch": 2231} {"train_loss": -41.06170654296875, "global_step": 269981, "epoch": 2231} {"train_loss": -39.55543899536133, "global_step": 269982, "epoch": 2231} {"train_loss": -40.709259033203125, "global_step": 269983, "epoch": 2231} {"train_loss": -41.88133239746094, "global_step": 269984, "epoch": 2231} {"train_loss": -40.63373565673828, "global_step": 269985, "epoch": 2231} {"train_loss": -41.40696334838867, "global_step": 269986, "epoch": 2231} {"train_loss": -40.77642822265625, "global_step": 269987, "epoch": 2231} {"train_loss": -41.54511260986328, "global_step": 269988, "epoch": 2231} {"train_loss": -40.847076416015625, "global_step": 269989, "epoch": 2231} {"train_loss": -41.30338668823242, "global_step": 269990, "epoch": 2231} {"train_loss": -40.5124397277832, "global_step": 269991, "epoch": 2231} {"train_loss": -41.790443420410156, "global_step": 269992, "epoch": 2231} {"train_loss": -41.53764724731445, "global_step": 269993, "epoch": 2231} {"train_loss": -40.92765426635742, "global_step": 269994, "epoch": 2231} {"train_loss": -41.59109115600586, "global_step": 269995, "epoch": 2231} {"train_loss": -40.697444915771484, "global_step": 269996, "epoch": 2231} {"train_loss": -40.88568878173828, "global_step": 269997, "epoch": 2231} {"train_loss": -39.30588912963867, "global_step": 269998, "epoch": 2231} {"train_loss": -40.96879959106445, "global_step": 269999, "epoch": 2231} {"train_loss": -40.01160430908203, "global_step": 270000, "epoch": 2231} {"train_loss": -41.937416076660156, "global_step": 270001, "epoch": 2231} {"train_loss": -40.10708236694336, "global_step": 270002, "epoch": 2231} {"train_loss": -40.842403411865234, "global_step": 270003, "epoch": 2231} {"train_loss": -41.211788177490234, "global_step": 270004, "epoch": 2231} {"train_loss": -40.85640335083008, "global_step": 270005, "epoch": 2231} {"train_loss": -41.050418853759766, "global_step": 270006, "epoch": 2231} {"train_loss": -41.121944427490234, "global_step": 270007, "epoch": 2231} {"train_loss": -41.15797424316406, "global_step": 270008, "epoch": 2231} {"train_loss": -42.35309982299805, "global_step": 270009, "epoch": 2231} {"train_loss": -41.08746337890625, "global_step": 270010, "epoch": 2231} {"train_loss": -39.790523529052734, "global_step": 270011, "epoch": 2231} {"train_loss": -41.09975051879883, "global_step": 270012, "epoch": 2231} {"train_loss": -36.07209396362305, "global_step": 270013, "epoch": 2231} {"train_loss": -41.100502014160156, "global_step": 270014, "epoch": 2231} {"train_loss": -35.306251525878906, "global_step": 270015, "epoch": 2231} {"train_loss": -38.26582717895508, "global_step": 270016, "epoch": 2231} {"train_loss": -35.507568359375, "global_step": 270017, "epoch": 2231} {"train_loss": -37.763671875, "global_step": 270018, "epoch": 2231} {"train_loss": -36.172550201416016, "global_step": 270019, "epoch": 2231} {"train_loss": -33.474369049072266, "global_step": 270020, "epoch": 2231} {"train_loss": -40.22197341918945, "global_step": 270021, "epoch": 2231} {"train_loss": -30.367664337158203, "global_step": 270022, "epoch": 2231} {"train_loss": -33.07161331176758, "global_step": 270023, "epoch": 2231} {"train_loss": -34.71150207519531, "global_step": 270024, "epoch": 2231} {"train_loss": -34.9866828918457, "global_step": 270025, "epoch": 2231} {"train_loss": -34.456626892089844, "global_step": 270026, "epoch": 2231} {"train_loss": -37.1914176940918, "global_step": 270027, "epoch": 2231} {"train_loss": -22.262338638305664, "global_step": 270028, "epoch": 2231} {"train_loss": -33.226890563964844, "global_step": 270029, "epoch": 2231} {"train_loss": -37.56351852416992, "global_step": 270030, "epoch": 2231} {"train_loss": -33.62592315673828, "global_step": 270031, "epoch": 2231} {"train_loss": -37.299407958984375, "global_step": 270032, "epoch": 2231} {"train_loss": -36.56231689453125, "global_step": 270033, "epoch": 2231} {"train_loss": -33.6646728515625, "global_step": 270034, "epoch": 2231} {"train_loss": -32.626155853271484, "global_step": 270035, "epoch": 2231} {"train_loss": -29.95686149597168, "global_step": 270036, "epoch": 2231} {"train_loss": -34.95204544067383, "global_step": 270037, "epoch": 2231} {"train_loss": -33.67552185058594, "global_step": 270038, "epoch": 2231} {"train_loss": -39.49770736694336, "global_step": 270039, "epoch": 2231} {"train_loss": -33.29777145385742, "global_step": 270040, "epoch": 2231} {"train_loss": -33.14054489135742, "global_step": 270041, "epoch": 2231} {"train_loss": -37.71852493286133, "global_step": 270042, "epoch": 2231} {"train_loss": -35.9487419128418, "global_step": 270043, "epoch": 2231} {"train_loss": -36.74187469482422, "global_step": 270044, "epoch": 2231} {"train_loss": -33.01020050048828, "global_step": 270045, "epoch": 2231} {"train_loss": -32.65007400512695, "global_step": 270046, "epoch": 2231} {"train_loss": -36.762874603271484, "global_step": 270047, "epoch": 2231} {"train_loss": -35.09726333618164, "global_step": 270048, "epoch": 2231} {"train_loss": -35.42776107788086, "global_step": 270049, "epoch": 2231} {"train_loss": -37.04673385620117, "global_step": 270050, "epoch": 2231} {"train_loss": -36.63850784301758, "global_step": 270051, "epoch": 2231} {"train_loss": -37.3469352722168, "global_step": 270052, "epoch": 2231} {"train_loss": -34.1760139465332, "global_step": 270053, "epoch": 2231} {"train_loss": -26.87106704711914, "global_step": 270054, "epoch": 2231} {"train_loss": -30.518661499023438, "global_step": 270055, "epoch": 2231} {"train_loss": -34.9935302734375, "global_step": 270056, "epoch": 2231} {"train_loss": -36.13277053833008, "global_step": 270057, "epoch": 2231} {"train_loss": -36.667110443115234, "global_step": 270058, "epoch": 2231} {"train_loss": -36.05056381225586, "global_step": 270059, "epoch": 2231} {"train_loss": -38.173091888427734, "global_step": 270060, "epoch": 2231} {"train_loss": -37.8157844543457, "global_step": 270061, "epoch": 2231} {"train_loss": -36.588985443115234, "global_step": 270062, "epoch": 2231} {"train_loss": -37.4039306640625, "global_step": 270063, "epoch": 2231} {"train_loss": -37.58727264404297, "global_step": 270064, "epoch": 2231} {"train_loss": -37.4900016784668, "global_step": 270065, "epoch": 2231} {"train_loss": -38.33061981201172, "global_step": 270066, "epoch": 2231} {"train_loss": -37.355560302734375, "global_step": 270067, "epoch": 2231} {"train_loss": -37.72396469116211, "global_step": 270068, "epoch": 2231} {"train_loss": -37.554351806640625, "global_step": 270069, "epoch": 2231} {"train_loss": -38.71877670288086, "global_step": 270070, "epoch": 2231} {"train_loss": -38.162568336675974, "global_step": 270071, "epoch": 2231, "val_loss": 2645936.25} {"train_loss": -37.99375534057617, "global_step": 270072, "epoch": 2232} {"train_loss": -38.760433197021484, "global_step": 270073, "epoch": 2232} {"train_loss": -38.20576477050781, "global_step": 270074, "epoch": 2232} {"train_loss": -37.97370529174805, "global_step": 270075, "epoch": 2232} {"train_loss": -36.874786376953125, "global_step": 270076, "epoch": 2232} {"train_loss": -37.30289840698242, "global_step": 270077, "epoch": 2232} {"train_loss": -38.361507415771484, "global_step": 270078, "epoch": 2232} {"train_loss": -38.94916915893555, "global_step": 270079, "epoch": 2232} {"train_loss": -36.580928802490234, "global_step": 270080, "epoch": 2232} {"train_loss": -38.28049850463867, "global_step": 270081, "epoch": 2232} {"train_loss": -38.654537200927734, "global_step": 270082, "epoch": 2232} {"train_loss": -39.4132194519043, "global_step": 270083, "epoch": 2232} {"train_loss": -38.73109817504883, "global_step": 270084, "epoch": 2232} {"train_loss": -39.067440032958984, "global_step": 270085, "epoch": 2232} {"train_loss": -38.44282150268555, "global_step": 270086, "epoch": 2232} {"train_loss": -39.0655632019043, "global_step": 270087, "epoch": 2232} {"train_loss": -39.600887298583984, "global_step": 270088, "epoch": 2232} {"train_loss": -39.261878967285156, "global_step": 270089, "epoch": 2232} {"train_loss": -39.29677200317383, "global_step": 270090, "epoch": 2232} {"train_loss": -39.849456787109375, "global_step": 270091, "epoch": 2232} {"train_loss": -39.29399490356445, "global_step": 270092, "epoch": 2232} {"train_loss": -39.08242416381836, "global_step": 270093, "epoch": 2232} {"train_loss": -39.7263298034668, "global_step": 270094, "epoch": 2232} {"train_loss": -40.15603256225586, "global_step": 270095, "epoch": 2232} {"train_loss": -40.00962448120117, "global_step": 270096, "epoch": 2232} {"train_loss": -38.99760055541992, "global_step": 270097, "epoch": 2232} {"train_loss": -37.97089767456055, "global_step": 270098, "epoch": 2232} {"train_loss": -39.973934173583984, "global_step": 270099, "epoch": 2232} {"train_loss": -35.38930892944336, "global_step": 270100, "epoch": 2232} {"train_loss": -39.65362548828125, "global_step": 270101, "epoch": 2232} {"train_loss": -38.351158142089844, "global_step": 270102, "epoch": 2232} {"train_loss": -39.9238395690918, "global_step": 270103, "epoch": 2232} {"train_loss": -39.75482177734375, "global_step": 270104, "epoch": 2232} {"train_loss": -40.39980697631836, "global_step": 270105, "epoch": 2232} {"train_loss": -40.07725143432617, "global_step": 270106, "epoch": 2232} {"train_loss": -40.164215087890625, "global_step": 270107, "epoch": 2232} {"train_loss": -39.742835998535156, "global_step": 270108, "epoch": 2232} {"train_loss": -40.147377014160156, "global_step": 270109, "epoch": 2232} {"train_loss": -40.20615768432617, "global_step": 270110, "epoch": 2232} {"train_loss": -39.81769943237305, "global_step": 270111, "epoch": 2232} {"train_loss": -40.048736572265625, "global_step": 270112, "epoch": 2232} {"train_loss": -40.008724212646484, "global_step": 270113, "epoch": 2232} {"train_loss": -40.043880462646484, "global_step": 270114, "epoch": 2232} {"train_loss": -39.25864791870117, "global_step": 270115, "epoch": 2232} {"train_loss": -38.174415588378906, "global_step": 270116, "epoch": 2232} {"train_loss": -39.81350326538086, "global_step": 270117, "epoch": 2232} {"train_loss": -38.88105010986328, "global_step": 270118, "epoch": 2232} {"train_loss": -40.215110778808594, "global_step": 270119, "epoch": 2232} {"train_loss": -38.87355422973633, "global_step": 270120, "epoch": 2232} {"train_loss": -39.47585678100586, "global_step": 270121, "epoch": 2232} {"train_loss": -39.872833251953125, "global_step": 270122, "epoch": 2232} {"train_loss": -40.668582916259766, "global_step": 270123, "epoch": 2232} {"train_loss": -39.94856643676758, "global_step": 270124, "epoch": 2232} {"train_loss": -36.93256759643555, "global_step": 270125, "epoch": 2232} {"train_loss": -40.311134338378906, "global_step": 270126, "epoch": 2232} {"train_loss": -39.90607452392578, "global_step": 270127, "epoch": 2232} {"train_loss": -40.78230667114258, "global_step": 270128, "epoch": 2232} {"train_loss": -39.61387252807617, "global_step": 270129, "epoch": 2232} {"train_loss": -39.83517074584961, "global_step": 270130, "epoch": 2232} {"train_loss": -40.039127349853516, "global_step": 270131, "epoch": 2232} {"train_loss": -40.69861602783203, "global_step": 270132, "epoch": 2232} {"train_loss": -40.88275909423828, "global_step": 270133, "epoch": 2232} {"train_loss": -40.13627243041992, "global_step": 270134, "epoch": 2232} {"train_loss": -40.61484909057617, "global_step": 270135, "epoch": 2232} {"train_loss": -40.53489303588867, "global_step": 270136, "epoch": 2232} {"train_loss": -40.053489685058594, "global_step": 270137, "epoch": 2232} {"train_loss": -40.48139572143555, "global_step": 270138, "epoch": 2232} {"train_loss": -40.93149948120117, "global_step": 270139, "epoch": 2232} {"train_loss": -39.696746826171875, "global_step": 270140, "epoch": 2232} {"train_loss": -40.6507682800293, "global_step": 270141, "epoch": 2232} {"train_loss": -40.33024978637695, "global_step": 270142, "epoch": 2232} {"train_loss": -40.277950286865234, "global_step": 270143, "epoch": 2232} {"train_loss": -41.33827590942383, "global_step": 270144, "epoch": 2232} {"train_loss": -40.868648529052734, "global_step": 270145, "epoch": 2232} {"train_loss": -40.45195388793945, "global_step": 270146, "epoch": 2232} {"train_loss": -40.63340759277344, "global_step": 270147, "epoch": 2232} {"train_loss": -40.27134323120117, "global_step": 270148, "epoch": 2232} {"train_loss": -39.606048583984375, "global_step": 270149, "epoch": 2232} {"train_loss": -39.205753326416016, "global_step": 270150, "epoch": 2232} {"train_loss": -39.74417495727539, "global_step": 270151, "epoch": 2232} {"train_loss": -40.91444396972656, "global_step": 270152, "epoch": 2232} {"train_loss": -40.49345779418945, "global_step": 270153, "epoch": 2232} {"train_loss": -40.234649658203125, "global_step": 270154, "epoch": 2232} {"train_loss": -40.39500045776367, "global_step": 270155, "epoch": 2232} {"train_loss": -41.22332763671875, "global_step": 270156, "epoch": 2232} {"train_loss": -41.360206604003906, "global_step": 270157, "epoch": 2232} {"train_loss": -40.50580596923828, "global_step": 270158, "epoch": 2232} {"train_loss": -41.015403747558594, "global_step": 270159, "epoch": 2232} {"train_loss": -40.371341705322266, "global_step": 270160, "epoch": 2232} {"train_loss": -39.51548385620117, "global_step": 270161, "epoch": 2232} {"train_loss": -39.82981491088867, "global_step": 270162, "epoch": 2232} {"train_loss": -40.729835510253906, "global_step": 270163, "epoch": 2232} {"train_loss": -39.171295166015625, "global_step": 270164, "epoch": 2232} {"train_loss": -36.00515365600586, "global_step": 270165, "epoch": 2232} {"train_loss": -34.169403076171875, "global_step": 270166, "epoch": 2232} {"train_loss": -36.56376266479492, "global_step": 270167, "epoch": 2232} {"train_loss": -38.96783447265625, "global_step": 270168, "epoch": 2232} {"train_loss": -37.72971725463867, "global_step": 270169, "epoch": 2232} {"train_loss": -38.171905517578125, "global_step": 270170, "epoch": 2232} {"train_loss": -40.26721954345703, "global_step": 270171, "epoch": 2232} {"train_loss": -36.771751403808594, "global_step": 270172, "epoch": 2232} {"train_loss": -36.19740676879883, "global_step": 270173, "epoch": 2232} {"train_loss": -40.175636291503906, "global_step": 270174, "epoch": 2232} {"train_loss": -37.74174118041992, "global_step": 270175, "epoch": 2232} {"train_loss": -40.039791107177734, "global_step": 270176, "epoch": 2232} {"train_loss": -38.08462142944336, "global_step": 270177, "epoch": 2232} {"train_loss": -39.50605392456055, "global_step": 270178, "epoch": 2232} {"train_loss": -39.9193229675293, "global_step": 270179, "epoch": 2232} {"train_loss": -39.367713928222656, "global_step": 270180, "epoch": 2232} {"train_loss": -40.499656677246094, "global_step": 270181, "epoch": 2232} {"train_loss": -39.64683532714844, "global_step": 270182, "epoch": 2232} {"train_loss": -40.38992691040039, "global_step": 270183, "epoch": 2232} {"train_loss": -39.62714767456055, "global_step": 270184, "epoch": 2232} {"train_loss": -40.82155990600586, "global_step": 270185, "epoch": 2232} {"train_loss": -39.865806579589844, "global_step": 270186, "epoch": 2232} {"train_loss": -39.06876754760742, "global_step": 270187, "epoch": 2232} {"train_loss": -40.33547592163086, "global_step": 270188, "epoch": 2232} {"train_loss": -40.672210693359375, "global_step": 270189, "epoch": 2232} {"train_loss": -40.98893356323242, "global_step": 270190, "epoch": 2232} {"train_loss": -40.51995849609375, "global_step": 270191, "epoch": 2232} {"train_loss": -39.47542042377567, "global_step": 270192, "epoch": 2232, "val_loss": 2535738.75} {"train_loss": -40.45368576049805, "global_step": 270193, "epoch": 2233} {"train_loss": -40.4059944152832, "global_step": 270194, "epoch": 2233} {"train_loss": -40.95307540893555, "global_step": 270195, "epoch": 2233} {"train_loss": -41.485687255859375, "global_step": 270196, "epoch": 2233} {"train_loss": -40.44906997680664, "global_step": 270197, "epoch": 2233} {"train_loss": -40.75849151611328, "global_step": 270198, "epoch": 2233} {"train_loss": -40.56135940551758, "global_step": 270199, "epoch": 2233} {"train_loss": -39.57210159301758, "global_step": 270200, "epoch": 2233} {"train_loss": -40.517391204833984, "global_step": 270201, "epoch": 2233} {"train_loss": -41.1082763671875, "global_step": 270202, "epoch": 2233} {"train_loss": -41.31999969482422, "global_step": 270203, "epoch": 2233} {"train_loss": -41.23929977416992, "global_step": 270204, "epoch": 2233} {"train_loss": -41.72359085083008, "global_step": 270205, "epoch": 2233} {"train_loss": -41.19883346557617, "global_step": 270206, "epoch": 2233} {"train_loss": -41.55705642700195, "global_step": 270207, "epoch": 2233} {"train_loss": -40.6590461730957, "global_step": 270208, "epoch": 2233} {"train_loss": -41.45119857788086, "global_step": 270209, "epoch": 2233} {"train_loss": -40.347476959228516, "global_step": 270210, "epoch": 2233} {"train_loss": -41.34823226928711, "global_step": 270211, "epoch": 2233} {"train_loss": -41.54859161376953, "global_step": 270212, "epoch": 2233} {"train_loss": -41.40580368041992, "global_step": 270213, "epoch": 2233} {"train_loss": -41.316688537597656, "global_step": 270214, "epoch": 2233} {"train_loss": -41.1373176574707, "global_step": 270215, "epoch": 2233} {"train_loss": -40.73269271850586, "global_step": 270216, "epoch": 2233} {"train_loss": -40.70903015136719, "global_step": 270217, "epoch": 2233} {"train_loss": -40.36621856689453, "global_step": 270218, "epoch": 2233} {"train_loss": -41.42129135131836, "global_step": 270219, "epoch": 2233} {"train_loss": -41.303585052490234, "global_step": 270220, "epoch": 2233} {"train_loss": -40.67041778564453, "global_step": 270221, "epoch": 2233} {"train_loss": -40.20938491821289, "global_step": 270222, "epoch": 2233} {"train_loss": -40.69892120361328, "global_step": 270223, "epoch": 2233} {"train_loss": -41.87921905517578, "global_step": 270224, "epoch": 2233} {"train_loss": -41.4634895324707, "global_step": 270225, "epoch": 2233} {"train_loss": -41.968109130859375, "global_step": 270226, "epoch": 2233} {"train_loss": -41.811885833740234, "global_step": 270227, "epoch": 2233} {"train_loss": -41.73088073730469, "global_step": 270228, "epoch": 2233} {"train_loss": -41.38691711425781, "global_step": 270229, "epoch": 2233} {"train_loss": -41.93577194213867, "global_step": 270230, "epoch": 2233} {"train_loss": -41.538665771484375, "global_step": 270231, "epoch": 2233} {"train_loss": -41.37624740600586, "global_step": 270232, "epoch": 2233} {"train_loss": -41.565101623535156, "global_step": 270233, "epoch": 2233} {"train_loss": -42.068355560302734, "global_step": 270234, "epoch": 2233} {"train_loss": -41.16569137573242, "global_step": 270235, "epoch": 2233} {"train_loss": -40.840572357177734, "global_step": 270236, "epoch": 2233} {"train_loss": -41.017234802246094, "global_step": 270237, "epoch": 2233} {"train_loss": -41.66586685180664, "global_step": 270238, "epoch": 2233} {"train_loss": -40.663089752197266, "global_step": 270239, "epoch": 2233} {"train_loss": -41.418087005615234, "global_step": 270240, "epoch": 2233} {"train_loss": -40.98199462890625, "global_step": 270241, "epoch": 2233} {"train_loss": -41.258724212646484, "global_step": 270242, "epoch": 2233} {"train_loss": -41.167152404785156, "global_step": 270243, "epoch": 2233} {"train_loss": -41.4385986328125, "global_step": 270244, "epoch": 2233} {"train_loss": -40.81748580932617, "global_step": 270245, "epoch": 2233} {"train_loss": -42.157691955566406, "global_step": 270246, "epoch": 2233} {"train_loss": -41.55535888671875, "global_step": 270247, "epoch": 2233} {"train_loss": -40.180580139160156, "global_step": 270248, "epoch": 2233} {"train_loss": -40.54769515991211, "global_step": 270249, "epoch": 2233} {"train_loss": -42.534881591796875, "global_step": 270250, "epoch": 2233} {"train_loss": -41.05100631713867, "global_step": 270251, "epoch": 2233} {"train_loss": -41.24111557006836, "global_step": 270252, "epoch": 2233} {"train_loss": -41.113128662109375, "global_step": 270253, "epoch": 2233} {"train_loss": -41.60956573486328, "global_step": 270254, "epoch": 2233} {"train_loss": -38.82008743286133, "global_step": 270255, "epoch": 2233} {"train_loss": -41.980098724365234, "global_step": 270256, "epoch": 2233} {"train_loss": -42.2647819519043, "global_step": 270257, "epoch": 2233} {"train_loss": -41.030391693115234, "global_step": 270258, "epoch": 2233} {"train_loss": -40.66983413696289, "global_step": 270259, "epoch": 2233} {"train_loss": -42.12601089477539, "global_step": 270260, "epoch": 2233} {"train_loss": -41.736289978027344, "global_step": 270261, "epoch": 2233} {"train_loss": -41.59550476074219, "global_step": 270262, "epoch": 2233} {"train_loss": -41.65416717529297, "global_step": 270263, "epoch": 2233} {"train_loss": -42.28505325317383, "global_step": 270264, "epoch": 2233} {"train_loss": -41.21770095825195, "global_step": 270265, "epoch": 2233} {"train_loss": -42.15632629394531, "global_step": 270266, "epoch": 2233} {"train_loss": -42.448970794677734, "global_step": 270267, "epoch": 2233} {"train_loss": -41.823734283447266, "global_step": 270268, "epoch": 2233} {"train_loss": -41.95698928833008, "global_step": 270269, "epoch": 2233} {"train_loss": -42.293697357177734, "global_step": 270270, "epoch": 2233} {"train_loss": -41.871124267578125, "global_step": 270271, "epoch": 2233} {"train_loss": -42.31563949584961, "global_step": 270272, "epoch": 2233} {"train_loss": -42.44137191772461, "global_step": 270273, "epoch": 2233} {"train_loss": -42.324073791503906, "global_step": 270274, "epoch": 2233} {"train_loss": -41.801334381103516, "global_step": 270275, "epoch": 2233} {"train_loss": -42.16901779174805, "global_step": 270276, "epoch": 2233} {"train_loss": -42.35311508178711, "global_step": 270277, "epoch": 2233} {"train_loss": -42.528377532958984, "global_step": 270278, "epoch": 2233} {"train_loss": -42.34778594970703, "global_step": 270279, "epoch": 2233} {"train_loss": -42.691036224365234, "global_step": 270280, "epoch": 2233} {"train_loss": -42.38591384887695, "global_step": 270281, "epoch": 2233} {"train_loss": -42.375152587890625, "global_step": 270282, "epoch": 2233} {"train_loss": -41.84117126464844, "global_step": 270283, "epoch": 2233} {"train_loss": -41.680419921875, "global_step": 270284, "epoch": 2233} {"train_loss": -42.01796340942383, "global_step": 270285, "epoch": 2233} {"train_loss": -42.04541015625, "global_step": 270286, "epoch": 2233} {"train_loss": -42.46739959716797, "global_step": 270287, "epoch": 2233} {"train_loss": -41.64103317260742, "global_step": 270288, "epoch": 2233} {"train_loss": -42.736515045166016, "global_step": 270289, "epoch": 2233} {"train_loss": -41.449668884277344, "global_step": 270290, "epoch": 2233} {"train_loss": -41.802947998046875, "global_step": 270291, "epoch": 2233} {"train_loss": -40.99032211303711, "global_step": 270292, "epoch": 2233} {"train_loss": -40.94672393798828, "global_step": 270293, "epoch": 2233} {"train_loss": -40.787837982177734, "global_step": 270294, "epoch": 2233} {"train_loss": -41.95139694213867, "global_step": 270295, "epoch": 2233} {"train_loss": -41.74677276611328, "global_step": 270296, "epoch": 2233} {"train_loss": -40.148223876953125, "global_step": 270297, "epoch": 2233} {"train_loss": -41.36473083496094, "global_step": 270298, "epoch": 2233} {"train_loss": -40.418548583984375, "global_step": 270299, "epoch": 2233} {"train_loss": -41.480934143066406, "global_step": 270300, "epoch": 2233} {"train_loss": -40.69948959350586, "global_step": 270301, "epoch": 2233} {"train_loss": -42.490882873535156, "global_step": 270302, "epoch": 2233} {"train_loss": -41.49343490600586, "global_step": 270303, "epoch": 2233} {"train_loss": -41.13499450683594, "global_step": 270304, "epoch": 2233} {"train_loss": -41.659637451171875, "global_step": 270305, "epoch": 2233} {"train_loss": -42.4677734375, "global_step": 270306, "epoch": 2233} {"train_loss": -41.552391052246094, "global_step": 270307, "epoch": 2233} {"train_loss": -41.674835205078125, "global_step": 270308, "epoch": 2233} {"train_loss": -40.43844223022461, "global_step": 270309, "epoch": 2233} {"train_loss": -40.5714225769043, "global_step": 270310, "epoch": 2233} {"train_loss": -42.02067184448242, "global_step": 270311, "epoch": 2233} {"train_loss": -41.94664764404297, "global_step": 270312, "epoch": 2233} {"train_loss": -41.42246022500282, "global_step": 270313, "epoch": 2233, "val_loss": 2741253.25} {"train_loss": -40.91328430175781, "global_step": 270314, "epoch": 2234} {"train_loss": -41.19717788696289, "global_step": 270315, "epoch": 2234} {"train_loss": -40.51816940307617, "global_step": 270316, "epoch": 2234} {"train_loss": -40.0463752746582, "global_step": 270317, "epoch": 2234} {"train_loss": -40.9189338684082, "global_step": 270318, "epoch": 2234} {"train_loss": -40.90464401245117, "global_step": 270319, "epoch": 2234} {"train_loss": -40.170570373535156, "global_step": 270320, "epoch": 2234} {"train_loss": -37.40300369262695, "global_step": 270321, "epoch": 2234} {"train_loss": -41.25971984863281, "global_step": 270322, "epoch": 2234} {"train_loss": -40.96908950805664, "global_step": 270323, "epoch": 2234} {"train_loss": -41.73106002807617, "global_step": 270324, "epoch": 2234} {"train_loss": -37.786354064941406, "global_step": 270325, "epoch": 2234} {"train_loss": -39.47443771362305, "global_step": 270326, "epoch": 2234} {"train_loss": -39.96677780151367, "global_step": 270327, "epoch": 2234} {"train_loss": -41.53878402709961, "global_step": 270328, "epoch": 2234} {"train_loss": -41.16264724731445, "global_step": 270329, "epoch": 2234} {"train_loss": -40.96356964111328, "global_step": 270330, "epoch": 2234} {"train_loss": -41.41278076171875, "global_step": 270331, "epoch": 2234} {"train_loss": -41.67354965209961, "global_step": 270332, "epoch": 2234} {"train_loss": -41.48163986206055, "global_step": 270333, "epoch": 2234} {"train_loss": -41.452327728271484, "global_step": 270334, "epoch": 2234} {"train_loss": -40.22058868408203, "global_step": 270335, "epoch": 2234} {"train_loss": -40.42130661010742, "global_step": 270336, "epoch": 2234} {"train_loss": -41.09511184692383, "global_step": 270337, "epoch": 2234} {"train_loss": -41.163509368896484, "global_step": 270338, "epoch": 2234} {"train_loss": -36.94023895263672, "global_step": 270339, "epoch": 2234} {"train_loss": -40.340267181396484, "global_step": 270340, "epoch": 2234} {"train_loss": -37.35332107543945, "global_step": 270341, "epoch": 2234} {"train_loss": -40.4309196472168, "global_step": 270342, "epoch": 2234} {"train_loss": -40.930389404296875, "global_step": 270343, "epoch": 2234} {"train_loss": -39.417816162109375, "global_step": 270344, "epoch": 2234} {"train_loss": -38.1461067199707, "global_step": 270345, "epoch": 2234} {"train_loss": -29.8924617767334, "global_step": 270346, "epoch": 2234} {"train_loss": -37.75600814819336, "global_step": 270347, "epoch": 2234} {"train_loss": -38.29741287231445, "global_step": 270348, "epoch": 2234} {"train_loss": -40.50828552246094, "global_step": 270349, "epoch": 2234} {"train_loss": -38.8848876953125, "global_step": 270350, "epoch": 2234} {"train_loss": -39.25146484375, "global_step": 270351, "epoch": 2234} {"train_loss": -39.0364990234375, "global_step": 270352, "epoch": 2234} {"train_loss": -40.174896240234375, "global_step": 270353, "epoch": 2234} {"train_loss": -39.784423828125, "global_step": 270354, "epoch": 2234} {"train_loss": -38.991363525390625, "global_step": 270355, "epoch": 2234} {"train_loss": -40.49266815185547, "global_step": 270356, "epoch": 2234} {"train_loss": -40.42913055419922, "global_step": 270357, "epoch": 2234} {"train_loss": -38.37819290161133, "global_step": 270358, "epoch": 2234} {"train_loss": -40.40865707397461, "global_step": 270359, "epoch": 2234} {"train_loss": -40.2045783996582, "global_step": 270360, "epoch": 2234} {"train_loss": -40.22305679321289, "global_step": 270361, "epoch": 2234} {"train_loss": -38.693443298339844, "global_step": 270362, "epoch": 2234} {"train_loss": -41.03933334350586, "global_step": 270363, "epoch": 2234} {"train_loss": -38.72499465942383, "global_step": 270364, "epoch": 2234} {"train_loss": -40.46906661987305, "global_step": 270365, "epoch": 2234} {"train_loss": -40.81372833251953, "global_step": 270366, "epoch": 2234} {"train_loss": -40.77463912963867, "global_step": 270367, "epoch": 2234} {"train_loss": -40.27230453491211, "global_step": 270368, "epoch": 2234} {"train_loss": -40.7093505859375, "global_step": 270369, "epoch": 2234} {"train_loss": -40.78636932373047, "global_step": 270370, "epoch": 2234} {"train_loss": -41.37410354614258, "global_step": 270371, "epoch": 2234} {"train_loss": -40.041168212890625, "global_step": 270372, "epoch": 2234} {"train_loss": -40.557342529296875, "global_step": 270373, "epoch": 2234} {"train_loss": -41.28644561767578, "global_step": 270374, "epoch": 2234} {"train_loss": -41.09713363647461, "global_step": 270375, "epoch": 2234} {"train_loss": -41.633304595947266, "global_step": 270376, "epoch": 2234} {"train_loss": -39.24994659423828, "global_step": 270377, "epoch": 2234} {"train_loss": -39.43260192871094, "global_step": 270378, "epoch": 2234} {"train_loss": -41.67389678955078, "global_step": 270379, "epoch": 2234} {"train_loss": -40.777381896972656, "global_step": 270380, "epoch": 2234} {"train_loss": -40.19933319091797, "global_step": 270381, "epoch": 2234} {"train_loss": -41.844791412353516, "global_step": 270382, "epoch": 2234} {"train_loss": -41.21813201904297, "global_step": 270383, "epoch": 2234} {"train_loss": -41.1259880065918, "global_step": 270384, "epoch": 2234} {"train_loss": -38.99982833862305, "global_step": 270385, "epoch": 2234} {"train_loss": -41.3951301574707, "global_step": 270386, "epoch": 2234} {"train_loss": -41.387908935546875, "global_step": 270387, "epoch": 2234} {"train_loss": -41.08837890625, "global_step": 270388, "epoch": 2234} {"train_loss": -41.94790267944336, "global_step": 270389, "epoch": 2234} {"train_loss": -41.55125045776367, "global_step": 270390, "epoch": 2234} {"train_loss": -40.702091217041016, "global_step": 270391, "epoch": 2234} {"train_loss": -41.594608306884766, "global_step": 270392, "epoch": 2234} {"train_loss": -41.24416732788086, "global_step": 270393, "epoch": 2234} {"train_loss": -41.53902816772461, "global_step": 270394, "epoch": 2234} {"train_loss": -41.22712326049805, "global_step": 270395, "epoch": 2234} {"train_loss": -39.406471252441406, "global_step": 270396, "epoch": 2234} {"train_loss": -41.815731048583984, "global_step": 270397, "epoch": 2234} {"train_loss": -42.02659606933594, "global_step": 270398, "epoch": 2234} {"train_loss": -39.90647506713867, "global_step": 270399, "epoch": 2234} {"train_loss": -42.17920684814453, "global_step": 270400, "epoch": 2234} {"train_loss": -41.34782791137695, "global_step": 270401, "epoch": 2234} {"train_loss": -41.59322738647461, "global_step": 270402, "epoch": 2234} {"train_loss": -41.088802337646484, "global_step": 270403, "epoch": 2234} {"train_loss": -40.13800811767578, "global_step": 270404, "epoch": 2234} {"train_loss": -41.9991569519043, "global_step": 270405, "epoch": 2234} {"train_loss": -39.57611083984375, "global_step": 270406, "epoch": 2234} {"train_loss": -38.412010192871094, "global_step": 270407, "epoch": 2234} {"train_loss": -40.45023727416992, "global_step": 270408, "epoch": 2234} {"train_loss": -41.64500045776367, "global_step": 270409, "epoch": 2234} {"train_loss": -41.44929504394531, "global_step": 270410, "epoch": 2234} {"train_loss": -41.617828369140625, "global_step": 270411, "epoch": 2234} {"train_loss": -39.68256759643555, "global_step": 270412, "epoch": 2234} {"train_loss": -41.88126754760742, "global_step": 270413, "epoch": 2234} {"train_loss": -41.58687973022461, "global_step": 270414, "epoch": 2234} {"train_loss": -41.16168212890625, "global_step": 270415, "epoch": 2234} {"train_loss": -40.020259857177734, "global_step": 270416, "epoch": 2234} {"train_loss": -39.668617248535156, "global_step": 270417, "epoch": 2234} {"train_loss": -38.62477493286133, "global_step": 270418, "epoch": 2234} {"train_loss": -40.146278381347656, "global_step": 270419, "epoch": 2234} {"train_loss": -40.783870697021484, "global_step": 270420, "epoch": 2234} {"train_loss": -41.0897102355957, "global_step": 270421, "epoch": 2234} {"train_loss": -38.106502532958984, "global_step": 270422, "epoch": 2234} {"train_loss": -38.586219787597656, "global_step": 270423, "epoch": 2234} {"train_loss": -38.618927001953125, "global_step": 270424, "epoch": 2234} {"train_loss": -39.54232406616211, "global_step": 270425, "epoch": 2234} {"train_loss": -36.9270133972168, "global_step": 270426, "epoch": 2234} {"train_loss": -39.9587287902832, "global_step": 270427, "epoch": 2234} {"train_loss": -36.453468322753906, "global_step": 270428, "epoch": 2234} {"train_loss": -37.75688552856445, "global_step": 270429, "epoch": 2234} {"train_loss": -40.537513732910156, "global_step": 270430, "epoch": 2234} {"train_loss": -39.29148483276367, "global_step": 270431, "epoch": 2234} {"train_loss": -38.85675811767578, "global_step": 270432, "epoch": 2234} {"train_loss": -40.13019561767578, "global_step": 270433, "epoch": 2234} {"train_loss": -40.180245754147364, "global_step": 270434, "epoch": 2234, "val_loss": 2561806.75} {"train_loss": -41.30277633666992, "global_step": 270435, "epoch": 2235} {"train_loss": -40.521907806396484, "global_step": 270436, "epoch": 2235} {"train_loss": -40.424888610839844, "global_step": 270437, "epoch": 2235} {"train_loss": -40.8466682434082, "global_step": 270438, "epoch": 2235} {"train_loss": -40.71550369262695, "global_step": 270439, "epoch": 2235} {"train_loss": -40.64414596557617, "global_step": 270440, "epoch": 2235} {"train_loss": -39.08856201171875, "global_step": 270441, "epoch": 2235} {"train_loss": -39.81769561767578, "global_step": 270442, "epoch": 2235} {"train_loss": -41.39824295043945, "global_step": 270443, "epoch": 2235} {"train_loss": -40.89680862426758, "global_step": 270444, "epoch": 2235} {"train_loss": -41.029415130615234, "global_step": 270445, "epoch": 2235} {"train_loss": -41.521114349365234, "global_step": 270446, "epoch": 2235} {"train_loss": -39.56184005737305, "global_step": 270447, "epoch": 2235} {"train_loss": -41.785430908203125, "global_step": 270448, "epoch": 2235} {"train_loss": -41.64078903198242, "global_step": 270449, "epoch": 2235} {"train_loss": -41.6544189453125, "global_step": 270450, "epoch": 2235} {"train_loss": -41.39408493041992, "global_step": 270451, "epoch": 2235} {"train_loss": -40.935791015625, "global_step": 270452, "epoch": 2235} {"train_loss": -40.65627670288086, "global_step": 270453, "epoch": 2235} {"train_loss": -41.4079475402832, "global_step": 270454, "epoch": 2235} {"train_loss": -40.572715759277344, "global_step": 270455, "epoch": 2235} {"train_loss": -40.65456008911133, "global_step": 270456, "epoch": 2235} {"train_loss": -41.44294357299805, "global_step": 270457, "epoch": 2235} {"train_loss": -42.23469161987305, "global_step": 270458, "epoch": 2235} {"train_loss": -40.7692985534668, "global_step": 270459, "epoch": 2235} {"train_loss": -41.80305862426758, "global_step": 270460, "epoch": 2235} {"train_loss": -41.97819900512695, "global_step": 270461, "epoch": 2235} {"train_loss": -40.77400207519531, "global_step": 270462, "epoch": 2235} {"train_loss": -40.58641815185547, "global_step": 270463, "epoch": 2235} {"train_loss": -41.43798828125, "global_step": 270464, "epoch": 2235} {"train_loss": -41.234588623046875, "global_step": 270465, "epoch": 2235} {"train_loss": -42.0400276184082, "global_step": 270466, "epoch": 2235} {"train_loss": -41.57244110107422, "global_step": 270467, "epoch": 2235} {"train_loss": -40.54567337036133, "global_step": 270468, "epoch": 2235} {"train_loss": -41.442352294921875, "global_step": 270469, "epoch": 2235} {"train_loss": -42.06293487548828, "global_step": 270470, "epoch": 2235} {"train_loss": -41.94207763671875, "global_step": 270471, "epoch": 2235} {"train_loss": -41.817230224609375, "global_step": 270472, "epoch": 2235} {"train_loss": -40.95437240600586, "global_step": 270473, "epoch": 2235} {"train_loss": -40.885169982910156, "global_step": 270474, "epoch": 2235} {"train_loss": -39.204036712646484, "global_step": 270475, "epoch": 2235} {"train_loss": -41.508888244628906, "global_step": 270476, "epoch": 2235} {"train_loss": -40.75297927856445, "global_step": 270477, "epoch": 2235} {"train_loss": -41.23987579345703, "global_step": 270478, "epoch": 2235} {"train_loss": -40.488033294677734, "global_step": 270479, "epoch": 2235} {"train_loss": -41.61855697631836, "global_step": 270480, "epoch": 2235} {"train_loss": -40.22057342529297, "global_step": 270481, "epoch": 2235} {"train_loss": -40.74599838256836, "global_step": 270482, "epoch": 2235} {"train_loss": -40.19580841064453, "global_step": 270483, "epoch": 2235} {"train_loss": -41.673858642578125, "global_step": 270484, "epoch": 2235} {"train_loss": -41.23246383666992, "global_step": 270485, "epoch": 2235} {"train_loss": -41.740966796875, "global_step": 270486, "epoch": 2235} {"train_loss": -41.864471435546875, "global_step": 270487, "epoch": 2235} {"train_loss": -40.610931396484375, "global_step": 270488, "epoch": 2235} {"train_loss": -42.251014709472656, "global_step": 270489, "epoch": 2235} {"train_loss": -41.23397445678711, "global_step": 270490, "epoch": 2235} {"train_loss": -41.72817611694336, "global_step": 270491, "epoch": 2235} {"train_loss": -40.98865509033203, "global_step": 270492, "epoch": 2235} {"train_loss": -40.87144088745117, "global_step": 270493, "epoch": 2235} {"train_loss": -41.77599334716797, "global_step": 270494, "epoch": 2235} {"train_loss": -41.017494201660156, "global_step": 270495, "epoch": 2235} {"train_loss": -40.5886116027832, "global_step": 270496, "epoch": 2235} {"train_loss": -41.980464935302734, "global_step": 270497, "epoch": 2235} {"train_loss": -41.87004852294922, "global_step": 270498, "epoch": 2235} {"train_loss": -41.84572982788086, "global_step": 270499, "epoch": 2235} {"train_loss": -41.856109619140625, "global_step": 270500, "epoch": 2235} {"train_loss": -41.608131408691406, "global_step": 270501, "epoch": 2235} {"train_loss": -41.26371383666992, "global_step": 270502, "epoch": 2235} {"train_loss": -41.016014099121094, "global_step": 270503, "epoch": 2235} {"train_loss": -40.8806037902832, "global_step": 270504, "epoch": 2235} {"train_loss": -41.798397064208984, "global_step": 270505, "epoch": 2235} {"train_loss": -41.115447998046875, "global_step": 270506, "epoch": 2235} {"train_loss": -40.98091506958008, "global_step": 270507, "epoch": 2235} {"train_loss": -41.473907470703125, "global_step": 270508, "epoch": 2235} {"train_loss": -41.342586517333984, "global_step": 270509, "epoch": 2235} {"train_loss": -40.93952178955078, "global_step": 270510, "epoch": 2235} {"train_loss": -41.57158279418945, "global_step": 270511, "epoch": 2235} {"train_loss": -40.17554473876953, "global_step": 270512, "epoch": 2235} {"train_loss": -41.50082015991211, "global_step": 270513, "epoch": 2235} {"train_loss": -41.15729904174805, "global_step": 270514, "epoch": 2235} {"train_loss": -40.8006706237793, "global_step": 270515, "epoch": 2235} {"train_loss": -40.72856521606445, "global_step": 270516, "epoch": 2235} {"train_loss": -41.94124984741211, "global_step": 270517, "epoch": 2235} {"train_loss": -42.03627395629883, "global_step": 270518, "epoch": 2235} {"train_loss": -42.227378845214844, "global_step": 270519, "epoch": 2235} {"train_loss": -41.756771087646484, "global_step": 270520, "epoch": 2235} {"train_loss": -41.70051193237305, "global_step": 270521, "epoch": 2235} {"train_loss": -41.14915084838867, "global_step": 270522, "epoch": 2235} {"train_loss": -41.75693893432617, "global_step": 270523, "epoch": 2235} {"train_loss": -40.39548110961914, "global_step": 270524, "epoch": 2235} {"train_loss": -39.35353469848633, "global_step": 270525, "epoch": 2235} {"train_loss": -39.2708854675293, "global_step": 270526, "epoch": 2235} {"train_loss": -40.3577880859375, "global_step": 270527, "epoch": 2235} {"train_loss": -41.6025390625, "global_step": 270528, "epoch": 2235} {"train_loss": -41.48674392700195, "global_step": 270529, "epoch": 2235} {"train_loss": -41.752166748046875, "global_step": 270530, "epoch": 2235} {"train_loss": -41.654457092285156, "global_step": 270531, "epoch": 2235} {"train_loss": -41.971309661865234, "global_step": 270532, "epoch": 2235} {"train_loss": -42.472389221191406, "global_step": 270533, "epoch": 2235} {"train_loss": -41.657012939453125, "global_step": 270534, "epoch": 2235} {"train_loss": -41.674072265625, "global_step": 270535, "epoch": 2235} {"train_loss": -42.16865158081055, "global_step": 270536, "epoch": 2235} {"train_loss": -42.211891174316406, "global_step": 270537, "epoch": 2235} {"train_loss": -42.541194915771484, "global_step": 270538, "epoch": 2235} {"train_loss": -41.43996047973633, "global_step": 270539, "epoch": 2235} {"train_loss": -42.11338806152344, "global_step": 270540, "epoch": 2235} {"train_loss": -42.42198944091797, "global_step": 270541, "epoch": 2235} {"train_loss": -42.48285675048828, "global_step": 270542, "epoch": 2235} {"train_loss": -41.238826751708984, "global_step": 270543, "epoch": 2235} {"train_loss": -41.74679183959961, "global_step": 270544, "epoch": 2235} {"train_loss": -42.29523468017578, "global_step": 270545, "epoch": 2235} {"train_loss": -41.676231384277344, "global_step": 270546, "epoch": 2235} {"train_loss": -42.49562072753906, "global_step": 270547, "epoch": 2235} {"train_loss": -42.04328155517578, "global_step": 270548, "epoch": 2235} {"train_loss": -42.30675506591797, "global_step": 270549, "epoch": 2235} {"train_loss": -41.32502365112305, "global_step": 270550, "epoch": 2235} {"train_loss": -41.4751091003418, "global_step": 270551, "epoch": 2235} {"train_loss": -42.38441848754883, "global_step": 270552, "epoch": 2235} {"train_loss": -41.99232482910156, "global_step": 270553, "epoch": 2235} {"train_loss": -41.24163818359375, "global_step": 270554, "epoch": 2235} {"train_loss": -41.28172160377187, "global_step": 270555, "epoch": 2235, "val_loss": 2576000.75} {"train_loss": -33.968910217285156, "global_step": 270556, "epoch": 2236} {"train_loss": -39.99346160888672, "global_step": 270557, "epoch": 2236} {"train_loss": -42.118160247802734, "global_step": 270558, "epoch": 2236} {"train_loss": -38.77632522583008, "global_step": 270559, "epoch": 2236} {"train_loss": -39.73051071166992, "global_step": 270560, "epoch": 2236} {"train_loss": -42.483245849609375, "global_step": 270561, "epoch": 2236} {"train_loss": -40.87299346923828, "global_step": 270562, "epoch": 2236} {"train_loss": -39.7921028137207, "global_step": 270563, "epoch": 2236} {"train_loss": -41.554988861083984, "global_step": 270564, "epoch": 2236} {"train_loss": -41.9539680480957, "global_step": 270565, "epoch": 2236} {"train_loss": -41.19664001464844, "global_step": 270566, "epoch": 2236} {"train_loss": -41.42368698120117, "global_step": 270567, "epoch": 2236} {"train_loss": -42.04055404663086, "global_step": 270568, "epoch": 2236} {"train_loss": -40.87100601196289, "global_step": 270569, "epoch": 2236} {"train_loss": -42.0528450012207, "global_step": 270570, "epoch": 2236} {"train_loss": -40.93393325805664, "global_step": 270571, "epoch": 2236} {"train_loss": -41.935054779052734, "global_step": 270572, "epoch": 2236} {"train_loss": -42.08408737182617, "global_step": 270573, "epoch": 2236} {"train_loss": -41.69853210449219, "global_step": 270574, "epoch": 2236} {"train_loss": -42.13690948486328, "global_step": 270575, "epoch": 2236} {"train_loss": -42.00416946411133, "global_step": 270576, "epoch": 2236} {"train_loss": -41.850921630859375, "global_step": 270577, "epoch": 2236} {"train_loss": -41.74517059326172, "global_step": 270578, "epoch": 2236} {"train_loss": -41.53768539428711, "global_step": 270579, "epoch": 2236} {"train_loss": -42.026817321777344, "global_step": 270580, "epoch": 2236} {"train_loss": -42.610042572021484, "global_step": 270581, "epoch": 2236} {"train_loss": -42.28300857543945, "global_step": 270582, "epoch": 2236} {"train_loss": -42.2614860534668, "global_step": 270583, "epoch": 2236} {"train_loss": -42.07285690307617, "global_step": 270584, "epoch": 2236} {"train_loss": -42.294246673583984, "global_step": 270585, "epoch": 2236} {"train_loss": -42.03594207763672, "global_step": 270586, "epoch": 2236} {"train_loss": -42.84944152832031, "global_step": 270587, "epoch": 2236} {"train_loss": -42.84174346923828, "global_step": 270588, "epoch": 2236} {"train_loss": -43.160396575927734, "global_step": 270589, "epoch": 2236} {"train_loss": -42.63631820678711, "global_step": 270590, "epoch": 2236} {"train_loss": -42.65839767456055, "global_step": 270591, "epoch": 2236} {"train_loss": -43.3852653503418, "global_step": 270592, "epoch": 2236} {"train_loss": -42.938148498535156, "global_step": 270593, "epoch": 2236} {"train_loss": -42.76664352416992, "global_step": 270594, "epoch": 2236} {"train_loss": -42.3880615234375, "global_step": 270595, "epoch": 2236} {"train_loss": -42.700138092041016, "global_step": 270596, "epoch": 2236} {"train_loss": -42.7819938659668, "global_step": 270597, "epoch": 2236} {"train_loss": -42.548851013183594, "global_step": 270598, "epoch": 2236} {"train_loss": -42.808349609375, "global_step": 270599, "epoch": 2236} {"train_loss": -42.6839485168457, "global_step": 270600, "epoch": 2236} {"train_loss": -42.92106628417969, "global_step": 270601, "epoch": 2236} {"train_loss": -42.76246643066406, "global_step": 270602, "epoch": 2236} {"train_loss": -42.341793060302734, "global_step": 270603, "epoch": 2236} {"train_loss": -42.32573318481445, "global_step": 270604, "epoch": 2236} {"train_loss": -42.76237106323242, "global_step": 270605, "epoch": 2236} {"train_loss": -42.97711944580078, "global_step": 270606, "epoch": 2236} {"train_loss": -43.22629928588867, "global_step": 270607, "epoch": 2236} {"train_loss": -42.2158317565918, "global_step": 270608, "epoch": 2236} {"train_loss": -43.12270736694336, "global_step": 270609, "epoch": 2236} {"train_loss": -42.919551849365234, "global_step": 270610, "epoch": 2236} {"train_loss": -42.68182373046875, "global_step": 270611, "epoch": 2236} {"train_loss": -42.04463577270508, "global_step": 270612, "epoch": 2236} {"train_loss": -40.63808822631836, "global_step": 270613, "epoch": 2236} {"train_loss": -38.9058952331543, "global_step": 270614, "epoch": 2236} {"train_loss": -35.51055908203125, "global_step": 270615, "epoch": 2236} {"train_loss": -38.48931884765625, "global_step": 270616, "epoch": 2236} {"train_loss": -41.23762130737305, "global_step": 270617, "epoch": 2236} {"train_loss": -40.9107551574707, "global_step": 270618, "epoch": 2236} {"train_loss": -40.5654182434082, "global_step": 270619, "epoch": 2236} {"train_loss": -41.48506546020508, "global_step": 270620, "epoch": 2236} {"train_loss": -40.55060577392578, "global_step": 270621, "epoch": 2236} {"train_loss": -39.24470520019531, "global_step": 270622, "epoch": 2236} {"train_loss": -39.68699264526367, "global_step": 270623, "epoch": 2236} {"train_loss": -41.66115188598633, "global_step": 270624, "epoch": 2236} {"train_loss": -42.14631271362305, "global_step": 270625, "epoch": 2236} {"train_loss": -42.288063049316406, "global_step": 270626, "epoch": 2236} {"train_loss": -41.38039779663086, "global_step": 270627, "epoch": 2236} {"train_loss": -41.852108001708984, "global_step": 270628, "epoch": 2236} {"train_loss": -42.28910446166992, "global_step": 270629, "epoch": 2236} {"train_loss": -42.87282943725586, "global_step": 270630, "epoch": 2236} {"train_loss": -42.21042251586914, "global_step": 270631, "epoch": 2236} {"train_loss": -42.23868942260742, "global_step": 270632, "epoch": 2236} {"train_loss": -41.22721481323242, "global_step": 270633, "epoch": 2236} {"train_loss": -41.4481086730957, "global_step": 270634, "epoch": 2236} {"train_loss": -42.1528434753418, "global_step": 270635, "epoch": 2236} {"train_loss": -42.001304626464844, "global_step": 270636, "epoch": 2236} {"train_loss": -42.15250778198242, "global_step": 270637, "epoch": 2236} {"train_loss": -42.56952667236328, "global_step": 270638, "epoch": 2236} {"train_loss": -41.498878479003906, "global_step": 270639, "epoch": 2236} {"train_loss": -42.470149993896484, "global_step": 270640, "epoch": 2236} {"train_loss": -41.18939971923828, "global_step": 270641, "epoch": 2236} {"train_loss": -42.390357971191406, "global_step": 270642, "epoch": 2236} {"train_loss": -40.56574249267578, "global_step": 270643, "epoch": 2236} {"train_loss": -41.59208297729492, "global_step": 270644, "epoch": 2236} {"train_loss": -42.004486083984375, "global_step": 270645, "epoch": 2236} {"train_loss": -42.11210250854492, "global_step": 270646, "epoch": 2236} {"train_loss": -42.250732421875, "global_step": 270647, "epoch": 2236} {"train_loss": -41.67267990112305, "global_step": 270648, "epoch": 2236} {"train_loss": -42.28365707397461, "global_step": 270649, "epoch": 2236} {"train_loss": -41.559600830078125, "global_step": 270650, "epoch": 2236} {"train_loss": -39.96472930908203, "global_step": 270651, "epoch": 2236} {"train_loss": -42.026466369628906, "global_step": 270652, "epoch": 2236} {"train_loss": -42.249542236328125, "global_step": 270653, "epoch": 2236} {"train_loss": -42.983028411865234, "global_step": 270654, "epoch": 2236} {"train_loss": -40.2672119140625, "global_step": 270655, "epoch": 2236} {"train_loss": -42.15181350708008, "global_step": 270656, "epoch": 2236} {"train_loss": -41.968666076660156, "global_step": 270657, "epoch": 2236} {"train_loss": -37.66520309448242, "global_step": 270658, "epoch": 2236} {"train_loss": -39.14908981323242, "global_step": 270659, "epoch": 2236} {"train_loss": -40.23727035522461, "global_step": 270660, "epoch": 2236} {"train_loss": -39.530818939208984, "global_step": 270661, "epoch": 2236} {"train_loss": -37.9216194152832, "global_step": 270662, "epoch": 2236} {"train_loss": -36.53239059448242, "global_step": 270663, "epoch": 2236} {"train_loss": -38.51747131347656, "global_step": 270664, "epoch": 2236} {"train_loss": -39.82534408569336, "global_step": 270665, "epoch": 2236} {"train_loss": -39.53496551513672, "global_step": 270666, "epoch": 2236} {"train_loss": -39.160621643066406, "global_step": 270667, "epoch": 2236} {"train_loss": -37.57017135620117, "global_step": 270668, "epoch": 2236} {"train_loss": -35.855037689208984, "global_step": 270669, "epoch": 2236} {"train_loss": -41.01876449584961, "global_step": 270670, "epoch": 2236} {"train_loss": -39.63245391845703, "global_step": 270671, "epoch": 2236} {"train_loss": -35.28402328491211, "global_step": 270672, "epoch": 2236} {"train_loss": -38.049949645996094, "global_step": 270673, "epoch": 2236} {"train_loss": -38.3676643371582, "global_step": 270674, "epoch": 2236} {"train_loss": -39.62922668457031, "global_step": 270675, "epoch": 2236} {"train_loss": -41.20890332056471, "global_step": 270676, "epoch": 2236, "val_loss": 2496900.75} {"train_loss": -39.6511116027832, "global_step": 270677, "epoch": 2237} {"train_loss": -39.68653869628906, "global_step": 270678, "epoch": 2237} {"train_loss": -39.3620491027832, "global_step": 270679, "epoch": 2237} {"train_loss": -39.50310134887695, "global_step": 270680, "epoch": 2237} {"train_loss": -38.49943161010742, "global_step": 270681, "epoch": 2237} {"train_loss": -40.94536209106445, "global_step": 270682, "epoch": 2237} {"train_loss": -38.69205856323242, "global_step": 270683, "epoch": 2237} {"train_loss": -38.82221221923828, "global_step": 270684, "epoch": 2237} {"train_loss": -39.386383056640625, "global_step": 270685, "epoch": 2237} {"train_loss": -40.576595306396484, "global_step": 270686, "epoch": 2237} {"train_loss": -39.65764617919922, "global_step": 270687, "epoch": 2237} {"train_loss": -39.503963470458984, "global_step": 270688, "epoch": 2237} {"train_loss": -39.36433792114258, "global_step": 270689, "epoch": 2237} {"train_loss": -39.06475067138672, "global_step": 270690, "epoch": 2237} {"train_loss": -40.45867156982422, "global_step": 270691, "epoch": 2237} {"train_loss": -40.73731231689453, "global_step": 270692, "epoch": 2237} {"train_loss": -40.53713607788086, "global_step": 270693, "epoch": 2237} {"train_loss": -40.75829315185547, "global_step": 270694, "epoch": 2237} {"train_loss": -41.617374420166016, "global_step": 270695, "epoch": 2237} {"train_loss": -41.42893600463867, "global_step": 270696, "epoch": 2237} {"train_loss": -40.61260986328125, "global_step": 270697, "epoch": 2237} {"train_loss": -40.5123176574707, "global_step": 270698, "epoch": 2237} {"train_loss": -41.34560012817383, "global_step": 270699, "epoch": 2237} {"train_loss": -40.899539947509766, "global_step": 270700, "epoch": 2237} {"train_loss": -40.914955139160156, "global_step": 270701, "epoch": 2237} {"train_loss": -41.1108283996582, "global_step": 270702, "epoch": 2237} {"train_loss": -40.341400146484375, "global_step": 270703, "epoch": 2237} {"train_loss": -41.63650131225586, "global_step": 270704, "epoch": 2237} {"train_loss": -41.055965423583984, "global_step": 270705, "epoch": 2237} {"train_loss": -41.46625900268555, "global_step": 270706, "epoch": 2237} {"train_loss": -41.88410186767578, "global_step": 270707, "epoch": 2237} {"train_loss": -40.808231353759766, "global_step": 270708, "epoch": 2237} {"train_loss": -42.02360153198242, "global_step": 270709, "epoch": 2237} {"train_loss": -41.083316802978516, "global_step": 270710, "epoch": 2237} {"train_loss": -41.222232818603516, "global_step": 270711, "epoch": 2237} {"train_loss": -41.24355697631836, "global_step": 270712, "epoch": 2237} {"train_loss": -40.28645324707031, "global_step": 270713, "epoch": 2237} {"train_loss": -42.185333251953125, "global_step": 270714, "epoch": 2237} {"train_loss": -41.7530632019043, "global_step": 270715, "epoch": 2237} {"train_loss": -41.724483489990234, "global_step": 270716, "epoch": 2237} {"train_loss": -40.89951705932617, "global_step": 270717, "epoch": 2237} {"train_loss": -41.98311996459961, "global_step": 270718, "epoch": 2237} {"train_loss": -40.682220458984375, "global_step": 270719, "epoch": 2237} {"train_loss": -41.32477951049805, "global_step": 270720, "epoch": 2237} {"train_loss": -41.87968063354492, "global_step": 270721, "epoch": 2237} {"train_loss": -41.34341049194336, "global_step": 270722, "epoch": 2237} {"train_loss": -41.29344177246094, "global_step": 270723, "epoch": 2237} {"train_loss": -41.415157318115234, "global_step": 270724, "epoch": 2237} {"train_loss": -41.751060485839844, "global_step": 270725, "epoch": 2237} {"train_loss": -41.50776290893555, "global_step": 270726, "epoch": 2237} {"train_loss": -41.63656234741211, "global_step": 270727, "epoch": 2237} {"train_loss": -42.09028625488281, "global_step": 270728, "epoch": 2237} {"train_loss": -41.8975944519043, "global_step": 270729, "epoch": 2237} {"train_loss": -41.8984489440918, "global_step": 270730, "epoch": 2237} {"train_loss": -41.71567153930664, "global_step": 270731, "epoch": 2237} {"train_loss": -42.7363166809082, "global_step": 270732, "epoch": 2237} {"train_loss": -41.34139633178711, "global_step": 270733, "epoch": 2237} {"train_loss": -41.69785690307617, "global_step": 270734, "epoch": 2237} {"train_loss": -42.047088623046875, "global_step": 270735, "epoch": 2237} {"train_loss": -41.60394287109375, "global_step": 270736, "epoch": 2237} {"train_loss": -41.50480651855469, "global_step": 270737, "epoch": 2237} {"train_loss": -40.62385559082031, "global_step": 270738, "epoch": 2237} {"train_loss": -42.22560501098633, "global_step": 270739, "epoch": 2237} {"train_loss": -40.544010162353516, "global_step": 270740, "epoch": 2237} {"train_loss": -40.583553314208984, "global_step": 270741, "epoch": 2237} {"train_loss": -40.955013275146484, "global_step": 270742, "epoch": 2237} {"train_loss": -41.559810638427734, "global_step": 270743, "epoch": 2237} {"train_loss": -41.368446350097656, "global_step": 270744, "epoch": 2237} {"train_loss": -39.465370178222656, "global_step": 270745, "epoch": 2237} {"train_loss": -42.827754974365234, "global_step": 270746, "epoch": 2237} {"train_loss": -39.95794677734375, "global_step": 270747, "epoch": 2237} {"train_loss": -40.92940139770508, "global_step": 270748, "epoch": 2237} {"train_loss": -41.1727180480957, "global_step": 270749, "epoch": 2237} {"train_loss": -42.068992614746094, "global_step": 270750, "epoch": 2237} {"train_loss": -41.406002044677734, "global_step": 270751, "epoch": 2237} {"train_loss": -40.960994720458984, "global_step": 270752, "epoch": 2237} {"train_loss": -41.432247161865234, "global_step": 270753, "epoch": 2237} {"train_loss": -41.81254959106445, "global_step": 270754, "epoch": 2237} {"train_loss": -41.479122161865234, "global_step": 270755, "epoch": 2237} {"train_loss": -42.258907318115234, "global_step": 270756, "epoch": 2237} {"train_loss": -41.91083526611328, "global_step": 270757, "epoch": 2237} {"train_loss": -41.18124008178711, "global_step": 270758, "epoch": 2237} {"train_loss": -41.8814811706543, "global_step": 270759, "epoch": 2237} {"train_loss": -42.21845245361328, "global_step": 270760, "epoch": 2237} {"train_loss": -41.787784576416016, "global_step": 270761, "epoch": 2237} {"train_loss": -42.10910415649414, "global_step": 270762, "epoch": 2237} {"train_loss": -41.48624038696289, "global_step": 270763, "epoch": 2237} {"train_loss": -39.25580596923828, "global_step": 270764, "epoch": 2237} {"train_loss": -34.47852325439453, "global_step": 270765, "epoch": 2237} {"train_loss": -33.831966400146484, "global_step": 270766, "epoch": 2237} {"train_loss": -38.998878479003906, "global_step": 270767, "epoch": 2237} {"train_loss": -39.839778900146484, "global_step": 270768, "epoch": 2237} {"train_loss": -38.9068603515625, "global_step": 270769, "epoch": 2237} {"train_loss": -39.55215072631836, "global_step": 270770, "epoch": 2237} {"train_loss": -37.58226776123047, "global_step": 270771, "epoch": 2237} {"train_loss": -39.78102111816406, "global_step": 270772, "epoch": 2237} {"train_loss": -40.14794921875, "global_step": 270773, "epoch": 2237} {"train_loss": -41.263702392578125, "global_step": 270774, "epoch": 2237} {"train_loss": -38.97233200073242, "global_step": 270775, "epoch": 2237} {"train_loss": -41.75096130371094, "global_step": 270776, "epoch": 2237} {"train_loss": -40.17115020751953, "global_step": 270777, "epoch": 2237} {"train_loss": -39.16903305053711, "global_step": 270778, "epoch": 2237} {"train_loss": -41.18490219116211, "global_step": 270779, "epoch": 2237} {"train_loss": -40.288082122802734, "global_step": 270780, "epoch": 2237} {"train_loss": -41.21350860595703, "global_step": 270781, "epoch": 2237} {"train_loss": -41.197998046875, "global_step": 270782, "epoch": 2237} {"train_loss": -39.56461715698242, "global_step": 270783, "epoch": 2237} {"train_loss": -40.58491134643555, "global_step": 270784, "epoch": 2237} {"train_loss": -40.75533676147461, "global_step": 270785, "epoch": 2237} {"train_loss": -41.624305725097656, "global_step": 270786, "epoch": 2237} {"train_loss": -41.4471321105957, "global_step": 270787, "epoch": 2237} {"train_loss": -40.70695877075195, "global_step": 270788, "epoch": 2237} {"train_loss": -40.949371337890625, "global_step": 270789, "epoch": 2237} {"train_loss": -40.5157356262207, "global_step": 270790, "epoch": 2237} {"train_loss": -42.508304595947266, "global_step": 270791, "epoch": 2237} {"train_loss": -42.028663635253906, "global_step": 270792, "epoch": 2237} {"train_loss": -41.84413528442383, "global_step": 270793, "epoch": 2237} {"train_loss": -41.207374572753906, "global_step": 270794, "epoch": 2237} {"train_loss": -42.18131637573242, "global_step": 270795, "epoch": 2237} {"train_loss": -42.02202606201172, "global_step": 270796, "epoch": 2237} {"train_loss": -40.82898327535834, "global_step": 270797, "epoch": 2237, "val_loss": 2724058.25} {"train_loss": -41.93021011352539, "global_step": 270798, "epoch": 2238} {"train_loss": -41.894405364990234, "global_step": 270799, "epoch": 2238} {"train_loss": -42.433956146240234, "global_step": 270800, "epoch": 2238} {"train_loss": -42.2462043762207, "global_step": 270801, "epoch": 2238} {"train_loss": -41.261268615722656, "global_step": 270802, "epoch": 2238} {"train_loss": -41.31879806518555, "global_step": 270803, "epoch": 2238} {"train_loss": -42.07489013671875, "global_step": 270804, "epoch": 2238} {"train_loss": -42.02370071411133, "global_step": 270805, "epoch": 2238} {"train_loss": -41.460018157958984, "global_step": 270806, "epoch": 2238} {"train_loss": -41.61790466308594, "global_step": 270807, "epoch": 2238} {"train_loss": -42.7066764831543, "global_step": 270808, "epoch": 2238} {"train_loss": -41.57288360595703, "global_step": 270809, "epoch": 2238} {"train_loss": -42.067623138427734, "global_step": 270810, "epoch": 2238} {"train_loss": -42.06576156616211, "global_step": 270811, "epoch": 2238} {"train_loss": -41.897377014160156, "global_step": 270812, "epoch": 2238} {"train_loss": -42.02412414550781, "global_step": 270813, "epoch": 2238} {"train_loss": -38.93619155883789, "global_step": 270814, "epoch": 2238} {"train_loss": -40.63138961791992, "global_step": 270815, "epoch": 2238} {"train_loss": -38.237239837646484, "global_step": 270816, "epoch": 2238} {"train_loss": -39.509735107421875, "global_step": 270817, "epoch": 2238} {"train_loss": -42.222740173339844, "global_step": 270818, "epoch": 2238} {"train_loss": -41.35758590698242, "global_step": 270819, "epoch": 2238} {"train_loss": -38.13539505004883, "global_step": 270820, "epoch": 2238} {"train_loss": -34.505714416503906, "global_step": 270821, "epoch": 2238} {"train_loss": -40.9826545715332, "global_step": 270822, "epoch": 2238} {"train_loss": -38.522911071777344, "global_step": 270823, "epoch": 2238} {"train_loss": -40.616127014160156, "global_step": 270824, "epoch": 2238} {"train_loss": -40.9482536315918, "global_step": 270825, "epoch": 2238} {"train_loss": -36.92564392089844, "global_step": 270826, "epoch": 2238} {"train_loss": -35.81260299682617, "global_step": 270827, "epoch": 2238} {"train_loss": -40.659358978271484, "global_step": 270828, "epoch": 2238} {"train_loss": -41.32706832885742, "global_step": 270829, "epoch": 2238} {"train_loss": -41.314632415771484, "global_step": 270830, "epoch": 2238} {"train_loss": -40.58360290527344, "global_step": 270831, "epoch": 2238} {"train_loss": -40.90279769897461, "global_step": 270832, "epoch": 2238} {"train_loss": -41.247962951660156, "global_step": 270833, "epoch": 2238} {"train_loss": -40.2987174987793, "global_step": 270834, "epoch": 2238} {"train_loss": -36.618953704833984, "global_step": 270835, "epoch": 2238} {"train_loss": -41.25374984741211, "global_step": 270836, "epoch": 2238} {"train_loss": -40.58175277709961, "global_step": 270837, "epoch": 2238} {"train_loss": -40.93671798706055, "global_step": 270838, "epoch": 2238} {"train_loss": -41.01309585571289, "global_step": 270839, "epoch": 2238} {"train_loss": -41.76732635498047, "global_step": 270840, "epoch": 2238} {"train_loss": -42.205482482910156, "global_step": 270841, "epoch": 2238} {"train_loss": -40.33758544921875, "global_step": 270842, "epoch": 2238} {"train_loss": -39.69578170776367, "global_step": 270843, "epoch": 2238} {"train_loss": -40.75434494018555, "global_step": 270844, "epoch": 2238} {"train_loss": -41.770538330078125, "global_step": 270845, "epoch": 2238} {"train_loss": -40.87382125854492, "global_step": 270846, "epoch": 2238} {"train_loss": -41.560909271240234, "global_step": 270847, "epoch": 2238} {"train_loss": -39.9780387878418, "global_step": 270848, "epoch": 2238} {"train_loss": -40.62933349609375, "global_step": 270849, "epoch": 2238} {"train_loss": -41.36103057861328, "global_step": 270850, "epoch": 2238} {"train_loss": -41.599212646484375, "global_step": 270851, "epoch": 2238} {"train_loss": -41.18434143066406, "global_step": 270852, "epoch": 2238} {"train_loss": -41.47517776489258, "global_step": 270853, "epoch": 2238} {"train_loss": -41.22041702270508, "global_step": 270854, "epoch": 2238} {"train_loss": -40.53019332885742, "global_step": 270855, "epoch": 2238} {"train_loss": -40.91180419921875, "global_step": 270856, "epoch": 2238} {"train_loss": -41.70024490356445, "global_step": 270857, "epoch": 2238} {"train_loss": -42.05706024169922, "global_step": 270858, "epoch": 2238} {"train_loss": -42.07551574707031, "global_step": 270859, "epoch": 2238} {"train_loss": -39.79274368286133, "global_step": 270860, "epoch": 2238} {"train_loss": -40.599666595458984, "global_step": 270861, "epoch": 2238} {"train_loss": -41.7967529296875, "global_step": 270862, "epoch": 2238} {"train_loss": -42.380916595458984, "global_step": 270863, "epoch": 2238} {"train_loss": -42.229103088378906, "global_step": 270864, "epoch": 2238} {"train_loss": -42.00667953491211, "global_step": 270865, "epoch": 2238} {"train_loss": -42.14626693725586, "global_step": 270866, "epoch": 2238} {"train_loss": -41.964569091796875, "global_step": 270867, "epoch": 2238} {"train_loss": -42.3923454284668, "global_step": 270868, "epoch": 2238} {"train_loss": -42.71205139160156, "global_step": 270869, "epoch": 2238} {"train_loss": -42.508541107177734, "global_step": 270870, "epoch": 2238} {"train_loss": -42.116973876953125, "global_step": 270871, "epoch": 2238} {"train_loss": -42.10453414916992, "global_step": 270872, "epoch": 2238} {"train_loss": -42.7253303527832, "global_step": 270873, "epoch": 2238} {"train_loss": -43.02197265625, "global_step": 270874, "epoch": 2238} {"train_loss": -42.86739730834961, "global_step": 270875, "epoch": 2238} {"train_loss": -42.13713073730469, "global_step": 270876, "epoch": 2238} {"train_loss": -42.222572326660156, "global_step": 270877, "epoch": 2238} {"train_loss": -42.58797073364258, "global_step": 270878, "epoch": 2238} {"train_loss": -42.001155853271484, "global_step": 270879, "epoch": 2238} {"train_loss": -42.509986877441406, "global_step": 270880, "epoch": 2238} {"train_loss": -41.73127365112305, "global_step": 270881, "epoch": 2238} {"train_loss": -42.34547424316406, "global_step": 270882, "epoch": 2238} {"train_loss": -41.652931213378906, "global_step": 270883, "epoch": 2238} {"train_loss": -41.72187805175781, "global_step": 270884, "epoch": 2238} {"train_loss": -41.350257873535156, "global_step": 270885, "epoch": 2238} {"train_loss": -42.31850814819336, "global_step": 270886, "epoch": 2238} {"train_loss": -41.82974624633789, "global_step": 270887, "epoch": 2238} {"train_loss": -42.523773193359375, "global_step": 270888, "epoch": 2238} {"train_loss": -42.640533447265625, "global_step": 270889, "epoch": 2238} {"train_loss": -42.048095703125, "global_step": 270890, "epoch": 2238} {"train_loss": -42.24203109741211, "global_step": 270891, "epoch": 2238} {"train_loss": -42.53036880493164, "global_step": 270892, "epoch": 2238} {"train_loss": -39.89436721801758, "global_step": 270893, "epoch": 2238} {"train_loss": -41.198455810546875, "global_step": 270894, "epoch": 2238} {"train_loss": -41.38618469238281, "global_step": 270895, "epoch": 2238} {"train_loss": -40.062313079833984, "global_step": 270896, "epoch": 2238} {"train_loss": -41.14955520629883, "global_step": 270897, "epoch": 2238} {"train_loss": -41.3001594543457, "global_step": 270898, "epoch": 2238} {"train_loss": -42.04167556762695, "global_step": 270899, "epoch": 2238} {"train_loss": -40.66167068481445, "global_step": 270900, "epoch": 2238} {"train_loss": -40.055355072021484, "global_step": 270901, "epoch": 2238} {"train_loss": -41.7489013671875, "global_step": 270902, "epoch": 2238} {"train_loss": -42.148765563964844, "global_step": 270903, "epoch": 2238} {"train_loss": -39.35637283325195, "global_step": 270904, "epoch": 2238} {"train_loss": -42.20589828491211, "global_step": 270905, "epoch": 2238} {"train_loss": -42.40034866333008, "global_step": 270906, "epoch": 2238} {"train_loss": -41.635677337646484, "global_step": 270907, "epoch": 2238} {"train_loss": -41.94919967651367, "global_step": 270908, "epoch": 2238} {"train_loss": -41.6829948425293, "global_step": 270909, "epoch": 2238} {"train_loss": -41.883480072021484, "global_step": 270910, "epoch": 2238} {"train_loss": -41.64870834350586, "global_step": 270911, "epoch": 2238} {"train_loss": -41.556697845458984, "global_step": 270912, "epoch": 2238} {"train_loss": -40.51930618286133, "global_step": 270913, "epoch": 2238} {"train_loss": -39.89397048950195, "global_step": 270914, "epoch": 2238} {"train_loss": -42.30025100708008, "global_step": 270915, "epoch": 2238} {"train_loss": -41.5466194152832, "global_step": 270916, "epoch": 2238} {"train_loss": -39.58232116699219, "global_step": 270917, "epoch": 2238} {"train_loss": -41.25059931731421, "global_step": 270918, "epoch": 2238, "val_loss": 3193090.75} {"train_loss": -42.4511604309082, "global_step": 270919, "epoch": 2239} {"train_loss": -42.3175163269043, "global_step": 270920, "epoch": 2239} {"train_loss": -41.71529006958008, "global_step": 270921, "epoch": 2239} {"train_loss": -40.49074935913086, "global_step": 270922, "epoch": 2239} {"train_loss": -40.25185012817383, "global_step": 270923, "epoch": 2239} {"train_loss": -40.676185607910156, "global_step": 270924, "epoch": 2239} {"train_loss": -40.722991943359375, "global_step": 270925, "epoch": 2239} {"train_loss": -40.513423919677734, "global_step": 270926, "epoch": 2239} {"train_loss": -41.94450759887695, "global_step": 270927, "epoch": 2239} {"train_loss": -41.798728942871094, "global_step": 270928, "epoch": 2239} {"train_loss": -39.006103515625, "global_step": 270929, "epoch": 2239} {"train_loss": -41.028289794921875, "global_step": 270930, "epoch": 2239} {"train_loss": -37.7967529296875, "global_step": 270931, "epoch": 2239} {"train_loss": -37.92454147338867, "global_step": 270932, "epoch": 2239} {"train_loss": -37.52114486694336, "global_step": 270933, "epoch": 2239} {"train_loss": -36.719276428222656, "global_step": 270934, "epoch": 2239} {"train_loss": -37.16636276245117, "global_step": 270935, "epoch": 2239} {"train_loss": -37.077327728271484, "global_step": 270936, "epoch": 2239} {"train_loss": -25.645044326782227, "global_step": 270937, "epoch": 2239} {"train_loss": -38.658424377441406, "global_step": 270938, "epoch": 2239} {"train_loss": -39.945213317871094, "global_step": 270939, "epoch": 2239} {"train_loss": -13.098625183105469, "global_step": 270940, "epoch": 2239} {"train_loss": -37.85308074951172, "global_step": 270941, "epoch": 2239} {"train_loss": -39.64018630981445, "global_step": 270942, "epoch": 2239} {"train_loss": -38.253456115722656, "global_step": 270943, "epoch": 2239} {"train_loss": -37.944087982177734, "global_step": 270944, "epoch": 2239} {"train_loss": -25.45310401916504, "global_step": 270945, "epoch": 2239} {"train_loss": -23.813230514526367, "global_step": 270946, "epoch": 2239} {"train_loss": -37.3428840637207, "global_step": 270947, "epoch": 2239} {"train_loss": -39.06538391113281, "global_step": 270948, "epoch": 2239} {"train_loss": -38.204402923583984, "global_step": 270949, "epoch": 2239} {"train_loss": -38.205810546875, "global_step": 270950, "epoch": 2239} {"train_loss": -29.423913955688477, "global_step": 270951, "epoch": 2239} {"train_loss": -36.96151351928711, "global_step": 270952, "epoch": 2239} {"train_loss": -36.50107955932617, "global_step": 270953, "epoch": 2239} {"train_loss": -37.962120056152344, "global_step": 270954, "epoch": 2239} {"train_loss": -37.24835968017578, "global_step": 270955, "epoch": 2239} {"train_loss": -37.461883544921875, "global_step": 270956, "epoch": 2239} {"train_loss": -37.885231018066406, "global_step": 270957, "epoch": 2239} {"train_loss": -38.660926818847656, "global_step": 270958, "epoch": 2239} {"train_loss": -36.283111572265625, "global_step": 270959, "epoch": 2239} {"train_loss": -33.82832717895508, "global_step": 270960, "epoch": 2239} {"train_loss": -33.45199966430664, "global_step": 270961, "epoch": 2239} {"train_loss": -36.67049789428711, "global_step": 270962, "epoch": 2239} {"train_loss": -39.73206329345703, "global_step": 270963, "epoch": 2239} {"train_loss": -38.568031311035156, "global_step": 270964, "epoch": 2239} {"train_loss": -39.21749496459961, "global_step": 270965, "epoch": 2239} {"train_loss": -38.524208068847656, "global_step": 270966, "epoch": 2239} {"train_loss": -39.62001037597656, "global_step": 270967, "epoch": 2239} {"train_loss": -39.916561126708984, "global_step": 270968, "epoch": 2239} {"train_loss": -38.405174255371094, "global_step": 270969, "epoch": 2239} {"train_loss": -39.50918197631836, "global_step": 270970, "epoch": 2239} {"train_loss": -38.5615119934082, "global_step": 270971, "epoch": 2239} {"train_loss": -39.6155891418457, "global_step": 270972, "epoch": 2239} {"train_loss": -39.9559326171875, "global_step": 270973, "epoch": 2239} {"train_loss": -39.00801467895508, "global_step": 270974, "epoch": 2239} {"train_loss": -39.32609558105469, "global_step": 270975, "epoch": 2239} {"train_loss": -39.7237663269043, "global_step": 270976, "epoch": 2239} {"train_loss": -38.42716979980469, "global_step": 270977, "epoch": 2239} {"train_loss": -39.712127685546875, "global_step": 270978, "epoch": 2239} {"train_loss": -39.727474212646484, "global_step": 270979, "epoch": 2239} {"train_loss": -40.71743392944336, "global_step": 270980, "epoch": 2239} {"train_loss": -40.364479064941406, "global_step": 270981, "epoch": 2239} {"train_loss": -39.67170715332031, "global_step": 270982, "epoch": 2239} {"train_loss": -40.169246673583984, "global_step": 270983, "epoch": 2239} {"train_loss": -40.0727424621582, "global_step": 270984, "epoch": 2239} {"train_loss": -40.29914093017578, "global_step": 270985, "epoch": 2239} {"train_loss": -40.1635856628418, "global_step": 270986, "epoch": 2239} {"train_loss": -41.07310104370117, "global_step": 270987, "epoch": 2239} {"train_loss": -40.75870895385742, "global_step": 270988, "epoch": 2239} {"train_loss": -40.62636184692383, "global_step": 270989, "epoch": 2239} {"train_loss": -40.63957595825195, "global_step": 270990, "epoch": 2239} {"train_loss": -41.241878509521484, "global_step": 270991, "epoch": 2239} {"train_loss": -41.3704719543457, "global_step": 270992, "epoch": 2239} {"train_loss": -40.17939376831055, "global_step": 270993, "epoch": 2239} {"train_loss": -40.919490814208984, "global_step": 270994, "epoch": 2239} {"train_loss": -40.848812103271484, "global_step": 270995, "epoch": 2239} {"train_loss": -40.81751251220703, "global_step": 270996, "epoch": 2239} {"train_loss": -40.335750579833984, "global_step": 270997, "epoch": 2239} {"train_loss": -40.36220932006836, "global_step": 270998, "epoch": 2239} {"train_loss": -40.518550872802734, "global_step": 270999, "epoch": 2239} {"train_loss": -41.089229583740234, "global_step": 271000, "epoch": 2239} {"train_loss": -41.14308547973633, "global_step": 271001, "epoch": 2239} {"train_loss": -41.41195297241211, "global_step": 271002, "epoch": 2239} {"train_loss": -41.35405349731445, "global_step": 271003, "epoch": 2239} {"train_loss": -40.64727020263672, "global_step": 271004, "epoch": 2239} {"train_loss": -41.331817626953125, "global_step": 271005, "epoch": 2239} {"train_loss": -41.49053955078125, "global_step": 271006, "epoch": 2239} {"train_loss": -41.63094711303711, "global_step": 271007, "epoch": 2239} {"train_loss": -41.57320022583008, "global_step": 271008, "epoch": 2239} {"train_loss": -41.328033447265625, "global_step": 271009, "epoch": 2239} {"train_loss": -41.41408157348633, "global_step": 271010, "epoch": 2239} {"train_loss": -41.70952224731445, "global_step": 271011, "epoch": 2239} {"train_loss": -41.27265167236328, "global_step": 271012, "epoch": 2239} {"train_loss": -41.768890380859375, "global_step": 271013, "epoch": 2239} {"train_loss": -41.24216842651367, "global_step": 271014, "epoch": 2239} {"train_loss": -40.668941497802734, "global_step": 271015, "epoch": 2239} {"train_loss": -41.50269317626953, "global_step": 271016, "epoch": 2239} {"train_loss": -41.75980758666992, "global_step": 271017, "epoch": 2239} {"train_loss": -41.896724700927734, "global_step": 271018, "epoch": 2239} {"train_loss": -40.935386657714844, "global_step": 271019, "epoch": 2239} {"train_loss": -41.68861389160156, "global_step": 271020, "epoch": 2239} {"train_loss": -42.49443817138672, "global_step": 271021, "epoch": 2239} {"train_loss": -41.061614990234375, "global_step": 271022, "epoch": 2239} {"train_loss": -41.92643356323242, "global_step": 271023, "epoch": 2239} {"train_loss": -42.13717269897461, "global_step": 271024, "epoch": 2239} {"train_loss": -41.68777847290039, "global_step": 271025, "epoch": 2239} {"train_loss": -41.946319580078125, "global_step": 271026, "epoch": 2239} {"train_loss": -41.924400329589844, "global_step": 271027, "epoch": 2239} {"train_loss": -42.0942497253418, "global_step": 271028, "epoch": 2239} {"train_loss": -42.24159240722656, "global_step": 271029, "epoch": 2239} {"train_loss": -42.05607223510742, "global_step": 271030, "epoch": 2239} {"train_loss": -42.10228729248047, "global_step": 271031, "epoch": 2239} {"train_loss": -42.32017135620117, "global_step": 271032, "epoch": 2239} {"train_loss": -41.92395782470703, "global_step": 271033, "epoch": 2239} {"train_loss": -42.29948043823242, "global_step": 271034, "epoch": 2239} {"train_loss": -42.136619567871094, "global_step": 271035, "epoch": 2239} {"train_loss": -41.70416259765625, "global_step": 271036, "epoch": 2239} {"train_loss": -42.2188606262207, "global_step": 271037, "epoch": 2239} {"train_loss": -42.01716232299805, "global_step": 271038, "epoch": 2239} {"train_loss": -39.40932291204279, "global_step": 271039, "epoch": 2239, "val_loss": 2760134.5} {"train_loss": -42.450130462646484, "global_step": 271040, "epoch": 2240} {"train_loss": -42.4257926940918, "global_step": 271041, "epoch": 2240} {"train_loss": -42.27437973022461, "global_step": 271042, "epoch": 2240} {"train_loss": -42.17377853393555, "global_step": 271043, "epoch": 2240} {"train_loss": -42.76841354370117, "global_step": 271044, "epoch": 2240} {"train_loss": -42.654579162597656, "global_step": 271045, "epoch": 2240} {"train_loss": -42.68062210083008, "global_step": 271046, "epoch": 2240} {"train_loss": -42.77360153198242, "global_step": 271047, "epoch": 2240} {"train_loss": -41.88161849975586, "global_step": 271048, "epoch": 2240} {"train_loss": -42.554508209228516, "global_step": 271049, "epoch": 2240} {"train_loss": -42.73283004760742, "global_step": 271050, "epoch": 2240} {"train_loss": -42.78693389892578, "global_step": 271051, "epoch": 2240} {"train_loss": -41.3658332824707, "global_step": 271052, "epoch": 2240} {"train_loss": -42.721229553222656, "global_step": 271053, "epoch": 2240} {"train_loss": -42.82265853881836, "global_step": 271054, "epoch": 2240} {"train_loss": -42.272422790527344, "global_step": 271055, "epoch": 2240} {"train_loss": -41.219146728515625, "global_step": 271056, "epoch": 2240} {"train_loss": -42.65488815307617, "global_step": 271057, "epoch": 2240} {"train_loss": -42.93661117553711, "global_step": 271058, "epoch": 2240} {"train_loss": -42.168922424316406, "global_step": 271059, "epoch": 2240} {"train_loss": -41.27216339111328, "global_step": 271060, "epoch": 2240} {"train_loss": -40.362648010253906, "global_step": 271061, "epoch": 2240} {"train_loss": -36.23655319213867, "global_step": 271062, "epoch": 2240} {"train_loss": -30.425155639648438, "global_step": 271063, "epoch": 2240} {"train_loss": -17.543670654296875, "global_step": 271064, "epoch": 2240} {"train_loss": -15.743060111999512, "global_step": 271065, "epoch": 2240} {"train_loss": -38.70988845825195, "global_step": 271066, "epoch": 2240} {"train_loss": -26.141874313354492, "global_step": 271067, "epoch": 2240} {"train_loss": -15.307289123535156, "global_step": 271068, "epoch": 2240} {"train_loss": -37.96622085571289, "global_step": 271069, "epoch": 2240} {"train_loss": -24.49783706665039, "global_step": 271070, "epoch": 2240} {"train_loss": -34.874359130859375, "global_step": 271071, "epoch": 2240} {"train_loss": -21.980857849121094, "global_step": 271072, "epoch": 2240} {"train_loss": -37.83275604248047, "global_step": 271073, "epoch": 2240} {"train_loss": -20.273462295532227, "global_step": 271074, "epoch": 2240} {"train_loss": -36.82124710083008, "global_step": 271075, "epoch": 2240} {"train_loss": -28.566089630126953, "global_step": 271076, "epoch": 2240} {"train_loss": -29.249786376953125, "global_step": 271077, "epoch": 2240} {"train_loss": -38.661163330078125, "global_step": 271078, "epoch": 2240} {"train_loss": -28.37494468688965, "global_step": 271079, "epoch": 2240} {"train_loss": -30.504648208618164, "global_step": 271080, "epoch": 2240} {"train_loss": -38.5123176574707, "global_step": 271081, "epoch": 2240} {"train_loss": -37.552982330322266, "global_step": 271082, "epoch": 2240} {"train_loss": -32.95503234863281, "global_step": 271083, "epoch": 2240} {"train_loss": -34.63886642456055, "global_step": 271084, "epoch": 2240} {"train_loss": -37.8792839050293, "global_step": 271085, "epoch": 2240} {"train_loss": -37.482215881347656, "global_step": 271086, "epoch": 2240} {"train_loss": -37.59999465942383, "global_step": 271087, "epoch": 2240} {"train_loss": -36.71592330932617, "global_step": 271088, "epoch": 2240} {"train_loss": -36.09223175048828, "global_step": 271089, "epoch": 2240} {"train_loss": -38.34980392456055, "global_step": 271090, "epoch": 2240} {"train_loss": -39.65408706665039, "global_step": 271091, "epoch": 2240} {"train_loss": -38.00941848754883, "global_step": 271092, "epoch": 2240} {"train_loss": -37.447914123535156, "global_step": 271093, "epoch": 2240} {"train_loss": -38.656982421875, "global_step": 271094, "epoch": 2240} {"train_loss": -39.162376403808594, "global_step": 271095, "epoch": 2240} {"train_loss": -38.9441032409668, "global_step": 271096, "epoch": 2240} {"train_loss": -39.01801681518555, "global_step": 271097, "epoch": 2240} {"train_loss": -39.39797592163086, "global_step": 271098, "epoch": 2240} {"train_loss": -38.77365493774414, "global_step": 271099, "epoch": 2240} {"train_loss": -39.18276596069336, "global_step": 271100, "epoch": 2240} {"train_loss": -39.203983306884766, "global_step": 271101, "epoch": 2240} {"train_loss": -39.48453903198242, "global_step": 271102, "epoch": 2240} {"train_loss": -39.07575225830078, "global_step": 271103, "epoch": 2240} {"train_loss": -39.66777420043945, "global_step": 271104, "epoch": 2240} {"train_loss": -40.23916244506836, "global_step": 271105, "epoch": 2240} {"train_loss": -39.81185531616211, "global_step": 271106, "epoch": 2240} {"train_loss": -39.95929718017578, "global_step": 271107, "epoch": 2240} {"train_loss": -39.91642379760742, "global_step": 271108, "epoch": 2240} {"train_loss": -40.30160140991211, "global_step": 271109, "epoch": 2240} {"train_loss": -40.08030319213867, "global_step": 271110, "epoch": 2240} {"train_loss": -40.131591796875, "global_step": 271111, "epoch": 2240} {"train_loss": -40.15755844116211, "global_step": 271112, "epoch": 2240} {"train_loss": -40.658973693847656, "global_step": 271113, "epoch": 2240} {"train_loss": -40.154701232910156, "global_step": 271114, "epoch": 2240} {"train_loss": -40.34893035888672, "global_step": 271115, "epoch": 2240} {"train_loss": -39.964454650878906, "global_step": 271116, "epoch": 2240} {"train_loss": -40.551429748535156, "global_step": 271117, "epoch": 2240} {"train_loss": -40.19858932495117, "global_step": 271118, "epoch": 2240} {"train_loss": -40.883941650390625, "global_step": 271119, "epoch": 2240} {"train_loss": -40.58843994140625, "global_step": 271120, "epoch": 2240} {"train_loss": -40.71718215942383, "global_step": 271121, "epoch": 2240} {"train_loss": -40.690895080566406, "global_step": 271122, "epoch": 2240} {"train_loss": -41.03151321411133, "global_step": 271123, "epoch": 2240} {"train_loss": -40.794227600097656, "global_step": 271124, "epoch": 2240} {"train_loss": -40.94163131713867, "global_step": 271125, "epoch": 2240} {"train_loss": -41.1475944519043, "global_step": 271126, "epoch": 2240} {"train_loss": -40.71602249145508, "global_step": 271127, "epoch": 2240} {"train_loss": -40.91288375854492, "global_step": 271128, "epoch": 2240} {"train_loss": -41.35293197631836, "global_step": 271129, "epoch": 2240} {"train_loss": -41.24614334106445, "global_step": 271130, "epoch": 2240} {"train_loss": -40.88749313354492, "global_step": 271131, "epoch": 2240} {"train_loss": -40.73950958251953, "global_step": 271132, "epoch": 2240} {"train_loss": -41.5025634765625, "global_step": 271133, "epoch": 2240} {"train_loss": -41.576507568359375, "global_step": 271134, "epoch": 2240} {"train_loss": -41.11135482788086, "global_step": 271135, "epoch": 2240} {"train_loss": -41.250728607177734, "global_step": 271136, "epoch": 2240} {"train_loss": -41.42155075073242, "global_step": 271137, "epoch": 2240} {"train_loss": -41.644874572753906, "global_step": 271138, "epoch": 2240} {"train_loss": -41.087528228759766, "global_step": 271139, "epoch": 2240} {"train_loss": -41.27861404418945, "global_step": 271140, "epoch": 2240} {"train_loss": -41.495235443115234, "global_step": 271141, "epoch": 2240} {"train_loss": -41.68109893798828, "global_step": 271142, "epoch": 2240} {"train_loss": -41.80082321166992, "global_step": 271143, "epoch": 2240} {"train_loss": -41.754913330078125, "global_step": 271144, "epoch": 2240} {"train_loss": -41.11896514892578, "global_step": 271145, "epoch": 2240} {"train_loss": -41.94297409057617, "global_step": 271146, "epoch": 2240} {"train_loss": -42.17771530151367, "global_step": 271147, "epoch": 2240} {"train_loss": -41.60456848144531, "global_step": 271148, "epoch": 2240} {"train_loss": -41.74135208129883, "global_step": 271149, "epoch": 2240} {"train_loss": -42.10348129272461, "global_step": 271150, "epoch": 2240} {"train_loss": -42.21732711791992, "global_step": 271151, "epoch": 2240} {"train_loss": -42.29348373413086, "global_step": 271152, "epoch": 2240} {"train_loss": -40.76809310913086, "global_step": 271153, "epoch": 2240} {"train_loss": -41.92460250854492, "global_step": 271154, "epoch": 2240} {"train_loss": -42.1066780090332, "global_step": 271155, "epoch": 2240} {"train_loss": -42.24263381958008, "global_step": 271156, "epoch": 2240} {"train_loss": -41.78709030151367, "global_step": 271157, "epoch": 2240} {"train_loss": -42.358028411865234, "global_step": 271158, "epoch": 2240} {"train_loss": -42.109710693359375, "global_step": 271159, "epoch": 2240} {"train_loss": -38.812136492453334, "global_step": 271160, "epoch": 2240, "val_loss": 2603431.25} {"train_loss": -42.38266372680664, "global_step": 271161, "epoch": 2241} {"train_loss": -41.92641830444336, "global_step": 271162, "epoch": 2241} {"train_loss": -42.153804779052734, "global_step": 271163, "epoch": 2241} {"train_loss": -42.11872482299805, "global_step": 271164, "epoch": 2241} {"train_loss": -41.82423782348633, "global_step": 271165, "epoch": 2241} {"train_loss": -42.70328140258789, "global_step": 271166, "epoch": 2241} {"train_loss": -42.08102035522461, "global_step": 271167, "epoch": 2241} {"train_loss": -41.681949615478516, "global_step": 271168, "epoch": 2241} {"train_loss": -42.453887939453125, "global_step": 271169, "epoch": 2241} {"train_loss": -42.76990509033203, "global_step": 271170, "epoch": 2241} {"train_loss": -42.64246368408203, "global_step": 271171, "epoch": 2241} {"train_loss": -43.0069580078125, "global_step": 271172, "epoch": 2241} {"train_loss": -42.35798263549805, "global_step": 271173, "epoch": 2241} {"train_loss": -42.47443389892578, "global_step": 271174, "epoch": 2241} {"train_loss": -43.032371520996094, "global_step": 271175, "epoch": 2241} {"train_loss": -42.568084716796875, "global_step": 271176, "epoch": 2241} {"train_loss": -41.17913055419922, "global_step": 271177, "epoch": 2241} {"train_loss": -42.56189727783203, "global_step": 271178, "epoch": 2241} {"train_loss": -43.13325119018555, "global_step": 271179, "epoch": 2241} {"train_loss": -42.99143600463867, "global_step": 271180, "epoch": 2241} {"train_loss": -42.89447784423828, "global_step": 271181, "epoch": 2241} {"train_loss": -42.6389045715332, "global_step": 271182, "epoch": 2241} {"train_loss": -41.90362548828125, "global_step": 271183, "epoch": 2241} {"train_loss": -42.65175247192383, "global_step": 271184, "epoch": 2241} {"train_loss": -42.95302963256836, "global_step": 271185, "epoch": 2241} {"train_loss": -43.20387649536133, "global_step": 271186, "epoch": 2241} {"train_loss": -43.27371597290039, "global_step": 271187, "epoch": 2241} {"train_loss": -43.16001892089844, "global_step": 271188, "epoch": 2241} {"train_loss": -42.57435607910156, "global_step": 271189, "epoch": 2241} {"train_loss": -42.71999740600586, "global_step": 271190, "epoch": 2241} {"train_loss": -42.86500930786133, "global_step": 271191, "epoch": 2241} {"train_loss": -43.17845916748047, "global_step": 271192, "epoch": 2241} {"train_loss": -42.87498092651367, "global_step": 271193, "epoch": 2241} {"train_loss": -43.140960693359375, "global_step": 271194, "epoch": 2241} {"train_loss": -43.49468231201172, "global_step": 271195, "epoch": 2241} {"train_loss": -43.11444854736328, "global_step": 271196, "epoch": 2241} {"train_loss": -43.480224609375, "global_step": 271197, "epoch": 2241} {"train_loss": -43.316749572753906, "global_step": 271198, "epoch": 2241} {"train_loss": -43.4242057800293, "global_step": 271199, "epoch": 2241} {"train_loss": -43.35549545288086, "global_step": 271200, "epoch": 2241} {"train_loss": -43.04418182373047, "global_step": 271201, "epoch": 2241} {"train_loss": -43.14642333984375, "global_step": 271202, "epoch": 2241} {"train_loss": -43.230499267578125, "global_step": 271203, "epoch": 2241} {"train_loss": -43.53066635131836, "global_step": 271204, "epoch": 2241} {"train_loss": -42.097755432128906, "global_step": 271205, "epoch": 2241} {"train_loss": -41.92241287231445, "global_step": 271206, "epoch": 2241} {"train_loss": -34.82754135131836, "global_step": 271207, "epoch": 2241} {"train_loss": -19.618024826049805, "global_step": 271208, "epoch": 2241} {"train_loss": -6.931037902832031, "global_step": 271209, "epoch": 2241} {"train_loss": -16.455936431884766, "global_step": 271210, "epoch": 2241} {"train_loss": -31.341949462890625, "global_step": 271211, "epoch": 2241} {"train_loss": -34.064796447753906, "global_step": 271212, "epoch": 2241} {"train_loss": -35.60990524291992, "global_step": 271213, "epoch": 2241} {"train_loss": -33.45759963989258, "global_step": 271214, "epoch": 2241} {"train_loss": -34.639827728271484, "global_step": 271215, "epoch": 2241} {"train_loss": -38.75733184814453, "global_step": 271216, "epoch": 2241} {"train_loss": -35.38386154174805, "global_step": 271217, "epoch": 2241} {"train_loss": -40.0765495300293, "global_step": 271218, "epoch": 2241} {"train_loss": -37.54011154174805, "global_step": 271219, "epoch": 2241} {"train_loss": -39.17160415649414, "global_step": 271220, "epoch": 2241} {"train_loss": -39.700042724609375, "global_step": 271221, "epoch": 2241} {"train_loss": -39.680084228515625, "global_step": 271222, "epoch": 2241} {"train_loss": -40.74989700317383, "global_step": 271223, "epoch": 2241} {"train_loss": -40.684486389160156, "global_step": 271224, "epoch": 2241} {"train_loss": -40.23635482788086, "global_step": 271225, "epoch": 2241} {"train_loss": -40.46908187866211, "global_step": 271226, "epoch": 2241} {"train_loss": -40.56461715698242, "global_step": 271227, "epoch": 2241} {"train_loss": -41.15802764892578, "global_step": 271228, "epoch": 2241} {"train_loss": -40.6082878112793, "global_step": 271229, "epoch": 2241} {"train_loss": -40.30571365356445, "global_step": 271230, "epoch": 2241} {"train_loss": -41.28097915649414, "global_step": 271231, "epoch": 2241} {"train_loss": -40.136505126953125, "global_step": 271232, "epoch": 2241} {"train_loss": -41.101749420166016, "global_step": 271233, "epoch": 2241} {"train_loss": -40.83826446533203, "global_step": 271234, "epoch": 2241} {"train_loss": -41.11983108520508, "global_step": 271235, "epoch": 2241} {"train_loss": -40.84897994995117, "global_step": 271236, "epoch": 2241} {"train_loss": -40.77586364746094, "global_step": 271237, "epoch": 2241} {"train_loss": -41.477725982666016, "global_step": 271238, "epoch": 2241} {"train_loss": -40.86099624633789, "global_step": 271239, "epoch": 2241} {"train_loss": -41.86971664428711, "global_step": 271240, "epoch": 2241} {"train_loss": -41.590248107910156, "global_step": 271241, "epoch": 2241} {"train_loss": -41.4342155456543, "global_step": 271242, "epoch": 2241} {"train_loss": -41.84088134765625, "global_step": 271243, "epoch": 2241} {"train_loss": -41.60294723510742, "global_step": 271244, "epoch": 2241} {"train_loss": -41.844661712646484, "global_step": 271245, "epoch": 2241} {"train_loss": -41.8846321105957, "global_step": 271246, "epoch": 2241} {"train_loss": -41.84770202636719, "global_step": 271247, "epoch": 2241} {"train_loss": -42.03400421142578, "global_step": 271248, "epoch": 2241} {"train_loss": -42.2337760925293, "global_step": 271249, "epoch": 2241} {"train_loss": -42.06162643432617, "global_step": 271250, "epoch": 2241} {"train_loss": -42.0050048828125, "global_step": 271251, "epoch": 2241} {"train_loss": -42.061195373535156, "global_step": 271252, "epoch": 2241} {"train_loss": -42.01679992675781, "global_step": 271253, "epoch": 2241} {"train_loss": -42.17885971069336, "global_step": 271254, "epoch": 2241} {"train_loss": -42.200653076171875, "global_step": 271255, "epoch": 2241} {"train_loss": -42.126930236816406, "global_step": 271256, "epoch": 2241} {"train_loss": -42.02730941772461, "global_step": 271257, "epoch": 2241} {"train_loss": -42.30171585083008, "global_step": 271258, "epoch": 2241} {"train_loss": -41.919612884521484, "global_step": 271259, "epoch": 2241} {"train_loss": -42.46393585205078, "global_step": 271260, "epoch": 2241} {"train_loss": -41.99679183959961, "global_step": 271261, "epoch": 2241} {"train_loss": -42.811676025390625, "global_step": 271262, "epoch": 2241} {"train_loss": -42.4296989440918, "global_step": 271263, "epoch": 2241} {"train_loss": -42.8565559387207, "global_step": 271264, "epoch": 2241} {"train_loss": -42.163238525390625, "global_step": 271265, "epoch": 2241} {"train_loss": -42.420528411865234, "global_step": 271266, "epoch": 2241} {"train_loss": -42.111427307128906, "global_step": 271267, "epoch": 2241} {"train_loss": -42.476318359375, "global_step": 271268, "epoch": 2241} {"train_loss": -42.5045280456543, "global_step": 271269, "epoch": 2241} {"train_loss": -42.786651611328125, "global_step": 271270, "epoch": 2241} {"train_loss": -43.03110885620117, "global_step": 271271, "epoch": 2241} {"train_loss": -42.92302703857422, "global_step": 271272, "epoch": 2241} {"train_loss": -42.809696197509766, "global_step": 271273, "epoch": 2241} {"train_loss": -43.06073760986328, "global_step": 271274, "epoch": 2241} {"train_loss": -42.76530075073242, "global_step": 271275, "epoch": 2241} {"train_loss": -42.635841369628906, "global_step": 271276, "epoch": 2241} {"train_loss": -42.978431701660156, "global_step": 271277, "epoch": 2241} {"train_loss": -42.85173416137695, "global_step": 271278, "epoch": 2241} {"train_loss": -42.78243637084961, "global_step": 271279, "epoch": 2241} {"train_loss": -41.99008560180664, "global_step": 271280, "epoch": 2241} {"train_loss": -40.93058557746824, "global_step": 271281, "epoch": 2241, "val_loss": 2539502.0} {"train_loss": -43.11094284057617, "global_step": 271282, "epoch": 2242} {"train_loss": -43.08370590209961, "global_step": 271283, "epoch": 2242} {"train_loss": -42.955657958984375, "global_step": 271284, "epoch": 2242} {"train_loss": -42.985538482666016, "global_step": 271285, "epoch": 2242} {"train_loss": -43.25886154174805, "global_step": 271286, "epoch": 2242} {"train_loss": -42.73746871948242, "global_step": 271287, "epoch": 2242} {"train_loss": -43.12112808227539, "global_step": 271288, "epoch": 2242} {"train_loss": -42.47172164916992, "global_step": 271289, "epoch": 2242} {"train_loss": -43.26903533935547, "global_step": 271290, "epoch": 2242} {"train_loss": -43.142391204833984, "global_step": 271291, "epoch": 2242} {"train_loss": -42.88859939575195, "global_step": 271292, "epoch": 2242} {"train_loss": -43.253944396972656, "global_step": 271293, "epoch": 2242} {"train_loss": -43.110939025878906, "global_step": 271294, "epoch": 2242} {"train_loss": -43.339149475097656, "global_step": 271295, "epoch": 2242} {"train_loss": -43.43708801269531, "global_step": 271296, "epoch": 2242} {"train_loss": -43.31473922729492, "global_step": 271297, "epoch": 2242} {"train_loss": -43.42313003540039, "global_step": 271298, "epoch": 2242} {"train_loss": -43.42717742919922, "global_step": 271299, "epoch": 2242} {"train_loss": -43.17359924316406, "global_step": 271300, "epoch": 2242} {"train_loss": -43.11304473876953, "global_step": 271301, "epoch": 2242} {"train_loss": -42.8541259765625, "global_step": 271302, "epoch": 2242} {"train_loss": -43.16851806640625, "global_step": 271303, "epoch": 2242} {"train_loss": -43.27095413208008, "global_step": 271304, "epoch": 2242} {"train_loss": -43.19059753417969, "global_step": 271305, "epoch": 2242} {"train_loss": -43.683204650878906, "global_step": 271306, "epoch": 2242} {"train_loss": -43.50698471069336, "global_step": 271307, "epoch": 2242} {"train_loss": -43.438968658447266, "global_step": 271308, "epoch": 2242} {"train_loss": -43.36614990234375, "global_step": 271309, "epoch": 2242} {"train_loss": -43.365901947021484, "global_step": 271310, "epoch": 2242} {"train_loss": -43.90989303588867, "global_step": 271311, "epoch": 2242} {"train_loss": -42.9752311706543, "global_step": 271312, "epoch": 2242} {"train_loss": -43.69968032836914, "global_step": 271313, "epoch": 2242} {"train_loss": -43.699275970458984, "global_step": 271314, "epoch": 2242} {"train_loss": -43.46855163574219, "global_step": 271315, "epoch": 2242} {"train_loss": -43.24900436401367, "global_step": 271316, "epoch": 2242} {"train_loss": -43.3389778137207, "global_step": 271317, "epoch": 2242} {"train_loss": -43.34810256958008, "global_step": 271318, "epoch": 2242} {"train_loss": -43.5526237487793, "global_step": 271319, "epoch": 2242} {"train_loss": -43.407344818115234, "global_step": 271320, "epoch": 2242} {"train_loss": -43.59444808959961, "global_step": 271321, "epoch": 2242} {"train_loss": -42.297767639160156, "global_step": 271322, "epoch": 2242} {"train_loss": -43.280548095703125, "global_step": 271323, "epoch": 2242} {"train_loss": -43.368988037109375, "global_step": 271324, "epoch": 2242} {"train_loss": -43.26812744140625, "global_step": 271325, "epoch": 2242} {"train_loss": -43.18738555908203, "global_step": 271326, "epoch": 2242} {"train_loss": -42.93156051635742, "global_step": 271327, "epoch": 2242} {"train_loss": -42.992488861083984, "global_step": 271328, "epoch": 2242} {"train_loss": -43.301815032958984, "global_step": 271329, "epoch": 2242} {"train_loss": -42.494140625, "global_step": 271330, "epoch": 2242} {"train_loss": -41.73161315917969, "global_step": 271331, "epoch": 2242} {"train_loss": -41.59992218017578, "global_step": 271332, "epoch": 2242} {"train_loss": -41.10544204711914, "global_step": 271333, "epoch": 2242} {"train_loss": -41.19076156616211, "global_step": 271334, "epoch": 2242} {"train_loss": -41.71332931518555, "global_step": 271335, "epoch": 2242} {"train_loss": -39.186553955078125, "global_step": 271336, "epoch": 2242} {"train_loss": -41.09894943237305, "global_step": 271337, "epoch": 2242} {"train_loss": -40.770721435546875, "global_step": 271338, "epoch": 2242} {"train_loss": -40.91506576538086, "global_step": 271339, "epoch": 2242} {"train_loss": -41.64373779296875, "global_step": 271340, "epoch": 2242} {"train_loss": -40.206539154052734, "global_step": 271341, "epoch": 2242} {"train_loss": -40.77769470214844, "global_step": 271342, "epoch": 2242} {"train_loss": -41.32829666137695, "global_step": 271343, "epoch": 2242} {"train_loss": -41.886756896972656, "global_step": 271344, "epoch": 2242} {"train_loss": -41.4143180847168, "global_step": 271345, "epoch": 2242} {"train_loss": -40.75916290283203, "global_step": 271346, "epoch": 2242} {"train_loss": -42.36713790893555, "global_step": 271347, "epoch": 2242} {"train_loss": -40.94855880737305, "global_step": 271348, "epoch": 2242} {"train_loss": -41.40226745605469, "global_step": 271349, "epoch": 2242} {"train_loss": -39.659053802490234, "global_step": 271350, "epoch": 2242} {"train_loss": -41.508811950683594, "global_step": 271351, "epoch": 2242} {"train_loss": -35.93266677856445, "global_step": 271352, "epoch": 2242} {"train_loss": -40.491268157958984, "global_step": 271353, "epoch": 2242} {"train_loss": -38.260108947753906, "global_step": 271354, "epoch": 2242} {"train_loss": -40.6778564453125, "global_step": 271355, "epoch": 2242} {"train_loss": -40.29820251464844, "global_step": 271356, "epoch": 2242} {"train_loss": -39.63359832763672, "global_step": 271357, "epoch": 2242} {"train_loss": -41.24477767944336, "global_step": 271358, "epoch": 2242} {"train_loss": -39.60531234741211, "global_step": 271359, "epoch": 2242} {"train_loss": -39.80253219604492, "global_step": 271360, "epoch": 2242} {"train_loss": -41.23305130004883, "global_step": 271361, "epoch": 2242} {"train_loss": -40.444801330566406, "global_step": 271362, "epoch": 2242} {"train_loss": -41.57937240600586, "global_step": 271363, "epoch": 2242} {"train_loss": -39.93523025512695, "global_step": 271364, "epoch": 2242} {"train_loss": -41.12276840209961, "global_step": 271365, "epoch": 2242} {"train_loss": -41.10090255737305, "global_step": 271366, "epoch": 2242} {"train_loss": -39.84291458129883, "global_step": 271367, "epoch": 2242} {"train_loss": -42.07260513305664, "global_step": 271368, "epoch": 2242} {"train_loss": -40.44100570678711, "global_step": 271369, "epoch": 2242} {"train_loss": -41.56622314453125, "global_step": 271370, "epoch": 2242} {"train_loss": -42.172664642333984, "global_step": 271371, "epoch": 2242} {"train_loss": -41.65968704223633, "global_step": 271372, "epoch": 2242} {"train_loss": -41.70585250854492, "global_step": 271373, "epoch": 2242} {"train_loss": -41.297569274902344, "global_step": 271374, "epoch": 2242} {"train_loss": -41.50015640258789, "global_step": 271375, "epoch": 2242} {"train_loss": -40.360015869140625, "global_step": 271376, "epoch": 2242} {"train_loss": -42.015411376953125, "global_step": 271377, "epoch": 2242} {"train_loss": -42.0262565612793, "global_step": 271378, "epoch": 2242} {"train_loss": -42.54856872558594, "global_step": 271379, "epoch": 2242} {"train_loss": -42.277137756347656, "global_step": 271380, "epoch": 2242} {"train_loss": -41.3532829284668, "global_step": 271381, "epoch": 2242} {"train_loss": -42.53739547729492, "global_step": 271382, "epoch": 2242} {"train_loss": -41.47208786010742, "global_step": 271383, "epoch": 2242} {"train_loss": -41.791603088378906, "global_step": 271384, "epoch": 2242} {"train_loss": -42.51922607421875, "global_step": 271385, "epoch": 2242} {"train_loss": -42.48944091796875, "global_step": 271386, "epoch": 2242} {"train_loss": -42.085330963134766, "global_step": 271387, "epoch": 2242} {"train_loss": -42.17243194580078, "global_step": 271388, "epoch": 2242} {"train_loss": -41.678070068359375, "global_step": 271389, "epoch": 2242} {"train_loss": -42.000450134277344, "global_step": 271390, "epoch": 2242} {"train_loss": -42.3165397644043, "global_step": 271391, "epoch": 2242} {"train_loss": -42.770896911621094, "global_step": 271392, "epoch": 2242} {"train_loss": -42.41796875, "global_step": 271393, "epoch": 2242} {"train_loss": -42.533260345458984, "global_step": 271394, "epoch": 2242} {"train_loss": -42.578041076660156, "global_step": 271395, "epoch": 2242} {"train_loss": -42.479610443115234, "global_step": 271396, "epoch": 2242} {"train_loss": -42.66426467895508, "global_step": 271397, "epoch": 2242} {"train_loss": -42.56370162963867, "global_step": 271398, "epoch": 2242} {"train_loss": -43.0709342956543, "global_step": 271399, "epoch": 2242} {"train_loss": -43.557533264160156, "global_step": 271400, "epoch": 2242} {"train_loss": -42.6186637878418, "global_step": 271401, "epoch": 2242} {"train_loss": -42.120433523635235, "global_step": 271402, "epoch": 2242, "val_loss": 2653250.0} {"train_loss": -43.17195129394531, "global_step": 271403, "epoch": 2243} {"train_loss": -43.5672607421875, "global_step": 271404, "epoch": 2243} {"train_loss": -43.0172004699707, "global_step": 271405, "epoch": 2243} {"train_loss": -43.03855895996094, "global_step": 271406, "epoch": 2243} {"train_loss": -42.60140609741211, "global_step": 271407, "epoch": 2243} {"train_loss": -42.97532272338867, "global_step": 271408, "epoch": 2243} {"train_loss": -42.63420486450195, "global_step": 271409, "epoch": 2243} {"train_loss": -43.295772552490234, "global_step": 271410, "epoch": 2243} {"train_loss": -43.2816276550293, "global_step": 271411, "epoch": 2243} {"train_loss": -43.729705810546875, "global_step": 271412, "epoch": 2243} {"train_loss": -43.093421936035156, "global_step": 271413, "epoch": 2243} {"train_loss": -43.3133430480957, "global_step": 271414, "epoch": 2243} {"train_loss": -43.2016487121582, "global_step": 271415, "epoch": 2243} {"train_loss": -43.5019645690918, "global_step": 271416, "epoch": 2243} {"train_loss": -43.16231918334961, "global_step": 271417, "epoch": 2243} {"train_loss": -43.22269058227539, "global_step": 271418, "epoch": 2243} {"train_loss": -43.37470626831055, "global_step": 271419, "epoch": 2243} {"train_loss": -43.34745788574219, "global_step": 271420, "epoch": 2243} {"train_loss": -43.552547454833984, "global_step": 271421, "epoch": 2243} {"train_loss": -43.09805679321289, "global_step": 271422, "epoch": 2243} {"train_loss": -42.558990478515625, "global_step": 271423, "epoch": 2243} {"train_loss": -42.59558868408203, "global_step": 271424, "epoch": 2243} {"train_loss": -43.28358840942383, "global_step": 271425, "epoch": 2243} {"train_loss": -43.01313018798828, "global_step": 271426, "epoch": 2243} {"train_loss": -43.20060348510742, "global_step": 271427, "epoch": 2243} {"train_loss": -43.319129943847656, "global_step": 271428, "epoch": 2243} {"train_loss": -42.3225212097168, "global_step": 271429, "epoch": 2243} {"train_loss": -42.81223678588867, "global_step": 271430, "epoch": 2243} {"train_loss": -43.14402770996094, "global_step": 271431, "epoch": 2243} {"train_loss": -42.75106430053711, "global_step": 271432, "epoch": 2243} {"train_loss": -41.32558822631836, "global_step": 271433, "epoch": 2243} {"train_loss": -41.936767578125, "global_step": 271434, "epoch": 2243} {"train_loss": -43.58354187011719, "global_step": 271435, "epoch": 2243} {"train_loss": -42.28643798828125, "global_step": 271436, "epoch": 2243} {"train_loss": -41.523353576660156, "global_step": 271437, "epoch": 2243} {"train_loss": -41.406341552734375, "global_step": 271438, "epoch": 2243} {"train_loss": -42.24293518066406, "global_step": 271439, "epoch": 2243} {"train_loss": -43.286216735839844, "global_step": 271440, "epoch": 2243} {"train_loss": -41.5439567565918, "global_step": 271441, "epoch": 2243} {"train_loss": -40.2686882019043, "global_step": 271442, "epoch": 2243} {"train_loss": -42.47758865356445, "global_step": 271443, "epoch": 2243} {"train_loss": -42.635643005371094, "global_step": 271444, "epoch": 2243} {"train_loss": -42.55585479736328, "global_step": 271445, "epoch": 2243} {"train_loss": -41.800533294677734, "global_step": 271446, "epoch": 2243} {"train_loss": -42.6878776550293, "global_step": 271447, "epoch": 2243} {"train_loss": -43.166812896728516, "global_step": 271448, "epoch": 2243} {"train_loss": -42.78009796142578, "global_step": 271449, "epoch": 2243} {"train_loss": -42.94914627075195, "global_step": 271450, "epoch": 2243} {"train_loss": -42.96443557739258, "global_step": 271451, "epoch": 2243} {"train_loss": -42.41328048706055, "global_step": 271452, "epoch": 2243} {"train_loss": -43.521488189697266, "global_step": 271453, "epoch": 2243} {"train_loss": -43.292091369628906, "global_step": 271454, "epoch": 2243} {"train_loss": -43.260040283203125, "global_step": 271455, "epoch": 2243} {"train_loss": -43.662391662597656, "global_step": 271456, "epoch": 2243} {"train_loss": -43.02397918701172, "global_step": 271457, "epoch": 2243} {"train_loss": -43.425071716308594, "global_step": 271458, "epoch": 2243} {"train_loss": -42.80217361450195, "global_step": 271459, "epoch": 2243} {"train_loss": -43.349788665771484, "global_step": 271460, "epoch": 2243} {"train_loss": -43.397090911865234, "global_step": 271461, "epoch": 2243} {"train_loss": -43.12386703491211, "global_step": 271462, "epoch": 2243} {"train_loss": -43.98988342285156, "global_step": 271463, "epoch": 2243} {"train_loss": -43.42121887207031, "global_step": 271464, "epoch": 2243} {"train_loss": -43.38163375854492, "global_step": 271465, "epoch": 2243} {"train_loss": -43.317527770996094, "global_step": 271466, "epoch": 2243} {"train_loss": -43.0377197265625, "global_step": 271467, "epoch": 2243} {"train_loss": -43.79185104370117, "global_step": 271468, "epoch": 2243} {"train_loss": -43.42686080932617, "global_step": 271469, "epoch": 2243} {"train_loss": -43.349365234375, "global_step": 271470, "epoch": 2243} {"train_loss": -43.83889389038086, "global_step": 271471, "epoch": 2243} {"train_loss": -43.34442138671875, "global_step": 271472, "epoch": 2243} {"train_loss": -43.5318603515625, "global_step": 271473, "epoch": 2243} {"train_loss": -43.585731506347656, "global_step": 271474, "epoch": 2243} {"train_loss": -43.31702423095703, "global_step": 271475, "epoch": 2243} {"train_loss": -43.64590072631836, "global_step": 271476, "epoch": 2243} {"train_loss": -44.01531982421875, "global_step": 271477, "epoch": 2243} {"train_loss": -42.28669357299805, "global_step": 271478, "epoch": 2243} {"train_loss": -43.5975456237793, "global_step": 271479, "epoch": 2243} {"train_loss": -43.134918212890625, "global_step": 271480, "epoch": 2243} {"train_loss": -43.25790023803711, "global_step": 271481, "epoch": 2243} {"train_loss": -40.054283142089844, "global_step": 271482, "epoch": 2243} {"train_loss": -40.368019104003906, "global_step": 271483, "epoch": 2243} {"train_loss": -43.06797790527344, "global_step": 271484, "epoch": 2243} {"train_loss": -42.567047119140625, "global_step": 271485, "epoch": 2243} {"train_loss": -42.05900192260742, "global_step": 271486, "epoch": 2243} {"train_loss": -42.01375198364258, "global_step": 271487, "epoch": 2243} {"train_loss": -42.060333251953125, "global_step": 271488, "epoch": 2243} {"train_loss": -39.611183166503906, "global_step": 271489, "epoch": 2243} {"train_loss": -29.185800552368164, "global_step": 271490, "epoch": 2243} {"train_loss": -24.258512496948242, "global_step": 271491, "epoch": 2243} {"train_loss": -41.338233947753906, "global_step": 271492, "epoch": 2243} {"train_loss": -39.810081481933594, "global_step": 271493, "epoch": 2243} {"train_loss": -41.20402145385742, "global_step": 271494, "epoch": 2243} {"train_loss": -36.90312576293945, "global_step": 271495, "epoch": 2243} {"train_loss": -35.033992767333984, "global_step": 271496, "epoch": 2243} {"train_loss": -38.896827697753906, "global_step": 271497, "epoch": 2243} {"train_loss": -39.76773452758789, "global_step": 271498, "epoch": 2243} {"train_loss": -37.96021270751953, "global_step": 271499, "epoch": 2243} {"train_loss": -38.331172943115234, "global_step": 271500, "epoch": 2243} {"train_loss": -37.925682067871094, "global_step": 271501, "epoch": 2243} {"train_loss": -30.25166130065918, "global_step": 271502, "epoch": 2243} {"train_loss": -26.0439453125, "global_step": 271503, "epoch": 2243} {"train_loss": -39.4758415222168, "global_step": 271504, "epoch": 2243} {"train_loss": -24.778120040893555, "global_step": 271505, "epoch": 2243} {"train_loss": -36.4080696105957, "global_step": 271506, "epoch": 2243} {"train_loss": -37.0853271484375, "global_step": 271507, "epoch": 2243} {"train_loss": -39.786598205566406, "global_step": 271508, "epoch": 2243} {"train_loss": -33.55691146850586, "global_step": 271509, "epoch": 2243} {"train_loss": -36.72455596923828, "global_step": 271510, "epoch": 2243} {"train_loss": -37.12458038330078, "global_step": 271511, "epoch": 2243} {"train_loss": -39.996315002441406, "global_step": 271512, "epoch": 2243} {"train_loss": -36.74745559692383, "global_step": 271513, "epoch": 2243} {"train_loss": -35.219234466552734, "global_step": 271514, "epoch": 2243} {"train_loss": -38.068153381347656, "global_step": 271515, "epoch": 2243} {"train_loss": -39.64552307128906, "global_step": 271516, "epoch": 2243} {"train_loss": -35.58097457885742, "global_step": 271517, "epoch": 2243} {"train_loss": -31.963428497314453, "global_step": 271518, "epoch": 2243} {"train_loss": -39.16865158081055, "global_step": 271519, "epoch": 2243} {"train_loss": -39.173824310302734, "global_step": 271520, "epoch": 2243} {"train_loss": -36.62459945678711, "global_step": 271521, "epoch": 2243} {"train_loss": -35.879425048828125, "global_step": 271522, "epoch": 2243} {"train_loss": -40.96220520902271, "global_step": 271523, "epoch": 2243, "val_loss": 2822119.0} {"train_loss": -38.97895431518555, "global_step": 271524, "epoch": 2244} {"train_loss": -35.022682189941406, "global_step": 271525, "epoch": 2244} {"train_loss": -37.06881332397461, "global_step": 271526, "epoch": 2244} {"train_loss": -38.790096282958984, "global_step": 271527, "epoch": 2244} {"train_loss": -36.93058395385742, "global_step": 271528, "epoch": 2244} {"train_loss": -36.38779830932617, "global_step": 271529, "epoch": 2244} {"train_loss": -39.46572494506836, "global_step": 271530, "epoch": 2244} {"train_loss": -40.11236572265625, "global_step": 271531, "epoch": 2244} {"train_loss": -39.61854934692383, "global_step": 271532, "epoch": 2244} {"train_loss": -37.86553955078125, "global_step": 271533, "epoch": 2244} {"train_loss": -39.181575775146484, "global_step": 271534, "epoch": 2244} {"train_loss": -39.889007568359375, "global_step": 271535, "epoch": 2244} {"train_loss": -39.18781280517578, "global_step": 271536, "epoch": 2244} {"train_loss": -40.40116882324219, "global_step": 271537, "epoch": 2244} {"train_loss": -40.56415939331055, "global_step": 271538, "epoch": 2244} {"train_loss": -40.458797454833984, "global_step": 271539, "epoch": 2244} {"train_loss": -40.177398681640625, "global_step": 271540, "epoch": 2244} {"train_loss": -39.63628005981445, "global_step": 271541, "epoch": 2244} {"train_loss": -40.540687561035156, "global_step": 271542, "epoch": 2244} {"train_loss": -40.88420486450195, "global_step": 271543, "epoch": 2244} {"train_loss": -40.715206146240234, "global_step": 271544, "epoch": 2244} {"train_loss": -39.94892120361328, "global_step": 271545, "epoch": 2244} {"train_loss": -40.484893798828125, "global_step": 271546, "epoch": 2244} {"train_loss": -39.635379791259766, "global_step": 271547, "epoch": 2244} {"train_loss": -40.596168518066406, "global_step": 271548, "epoch": 2244} {"train_loss": -40.498905181884766, "global_step": 271549, "epoch": 2244} {"train_loss": -39.543853759765625, "global_step": 271550, "epoch": 2244} {"train_loss": -41.137847900390625, "global_step": 271551, "epoch": 2244} {"train_loss": -40.230682373046875, "global_step": 271552, "epoch": 2244} {"train_loss": -39.50468063354492, "global_step": 271553, "epoch": 2244} {"train_loss": -40.5361328125, "global_step": 271554, "epoch": 2244} {"train_loss": -39.563018798828125, "global_step": 271555, "epoch": 2244} {"train_loss": -39.390625, "global_step": 271556, "epoch": 2244} {"train_loss": -41.453956604003906, "global_step": 271557, "epoch": 2244} {"train_loss": -40.95976638793945, "global_step": 271558, "epoch": 2244} {"train_loss": -35.599395751953125, "global_step": 271559, "epoch": 2244} {"train_loss": -41.12583541870117, "global_step": 271560, "epoch": 2244} {"train_loss": -40.6505241394043, "global_step": 271561, "epoch": 2244} {"train_loss": -41.35975646972656, "global_step": 271562, "epoch": 2244} {"train_loss": -40.70695114135742, "global_step": 271563, "epoch": 2244} {"train_loss": -38.41794967651367, "global_step": 271564, "epoch": 2244} {"train_loss": -41.10965347290039, "global_step": 271565, "epoch": 2244} {"train_loss": -41.40849685668945, "global_step": 271566, "epoch": 2244} {"train_loss": -41.3316764831543, "global_step": 271567, "epoch": 2244} {"train_loss": -32.715087890625, "global_step": 271568, "epoch": 2244} {"train_loss": -39.79842758178711, "global_step": 271569, "epoch": 2244} {"train_loss": -37.1286506652832, "global_step": 271570, "epoch": 2244} {"train_loss": -25.040508270263672, "global_step": 271571, "epoch": 2244} {"train_loss": -36.82657241821289, "global_step": 271572, "epoch": 2244} {"train_loss": -36.697628021240234, "global_step": 271573, "epoch": 2244} {"train_loss": -36.28933334350586, "global_step": 271574, "epoch": 2244} {"train_loss": -32.13703536987305, "global_step": 271575, "epoch": 2244} {"train_loss": -39.2627067565918, "global_step": 271576, "epoch": 2244} {"train_loss": -34.93815231323242, "global_step": 271577, "epoch": 2244} {"train_loss": -37.793880462646484, "global_step": 271578, "epoch": 2244} {"train_loss": -32.248207092285156, "global_step": 271579, "epoch": 2244} {"train_loss": -34.964813232421875, "global_step": 271580, "epoch": 2244} {"train_loss": -37.82733154296875, "global_step": 271581, "epoch": 2244} {"train_loss": -39.535858154296875, "global_step": 271582, "epoch": 2244} {"train_loss": -37.59480285644531, "global_step": 271583, "epoch": 2244} {"train_loss": -39.763587951660156, "global_step": 271584, "epoch": 2244} {"train_loss": -37.91990280151367, "global_step": 271585, "epoch": 2244} {"train_loss": -38.94893264770508, "global_step": 271586, "epoch": 2244} {"train_loss": -34.83391189575195, "global_step": 271587, "epoch": 2244} {"train_loss": -36.45760726928711, "global_step": 271588, "epoch": 2244} {"train_loss": -38.364990234375, "global_step": 271589, "epoch": 2244} {"train_loss": -38.065521240234375, "global_step": 271590, "epoch": 2244} {"train_loss": -37.332672119140625, "global_step": 271591, "epoch": 2244} {"train_loss": -38.07931900024414, "global_step": 271592, "epoch": 2244} {"train_loss": -39.13487243652344, "global_step": 271593, "epoch": 2244} {"train_loss": -39.078407287597656, "global_step": 271594, "epoch": 2244} {"train_loss": -39.08668899536133, "global_step": 271595, "epoch": 2244} {"train_loss": -38.519561767578125, "global_step": 271596, "epoch": 2244} {"train_loss": -40.09855270385742, "global_step": 271597, "epoch": 2244} {"train_loss": -40.23541259765625, "global_step": 271598, "epoch": 2244} {"train_loss": -38.248592376708984, "global_step": 271599, "epoch": 2244} {"train_loss": -39.292720794677734, "global_step": 271600, "epoch": 2244} {"train_loss": -39.283294677734375, "global_step": 271601, "epoch": 2244} {"train_loss": -40.339111328125, "global_step": 271602, "epoch": 2244} {"train_loss": -40.26310348510742, "global_step": 271603, "epoch": 2244} {"train_loss": -40.46755599975586, "global_step": 271604, "epoch": 2244} {"train_loss": -40.47736740112305, "global_step": 271605, "epoch": 2244} {"train_loss": -38.94083786010742, "global_step": 271606, "epoch": 2244} {"train_loss": -40.221622467041016, "global_step": 271607, "epoch": 2244} {"train_loss": -40.301116943359375, "global_step": 271608, "epoch": 2244} {"train_loss": -40.017330169677734, "global_step": 271609, "epoch": 2244} {"train_loss": -40.60762405395508, "global_step": 271610, "epoch": 2244} {"train_loss": -40.17537307739258, "global_step": 271611, "epoch": 2244} {"train_loss": -40.993770599365234, "global_step": 271612, "epoch": 2244} {"train_loss": -40.88713073730469, "global_step": 271613, "epoch": 2244} {"train_loss": -40.566864013671875, "global_step": 271614, "epoch": 2244} {"train_loss": -40.615447998046875, "global_step": 271615, "epoch": 2244} {"train_loss": -40.433406829833984, "global_step": 271616, "epoch": 2244} {"train_loss": -41.06581115722656, "global_step": 271617, "epoch": 2244} {"train_loss": -41.04428482055664, "global_step": 271618, "epoch": 2244} {"train_loss": -41.30385971069336, "global_step": 271619, "epoch": 2244} {"train_loss": -41.44621276855469, "global_step": 271620, "epoch": 2244} {"train_loss": -41.69074249267578, "global_step": 271621, "epoch": 2244} {"train_loss": -40.54915237426758, "global_step": 271622, "epoch": 2244} {"train_loss": -40.81746292114258, "global_step": 271623, "epoch": 2244} {"train_loss": -41.319366455078125, "global_step": 271624, "epoch": 2244} {"train_loss": -40.286312103271484, "global_step": 271625, "epoch": 2244} {"train_loss": -41.226253509521484, "global_step": 271626, "epoch": 2244} {"train_loss": -41.1364860534668, "global_step": 271627, "epoch": 2244} {"train_loss": -41.724727630615234, "global_step": 271628, "epoch": 2244} {"train_loss": -41.4755973815918, "global_step": 271629, "epoch": 2244} {"train_loss": -41.1890983581543, "global_step": 271630, "epoch": 2244} {"train_loss": -41.302093505859375, "global_step": 271631, "epoch": 2244} {"train_loss": -42.12334060668945, "global_step": 271632, "epoch": 2244} {"train_loss": -41.26130294799805, "global_step": 271633, "epoch": 2244} {"train_loss": -41.50254440307617, "global_step": 271634, "epoch": 2244} {"train_loss": -41.709468841552734, "global_step": 271635, "epoch": 2244} {"train_loss": -41.435543060302734, "global_step": 271636, "epoch": 2244} {"train_loss": -41.8306770324707, "global_step": 271637, "epoch": 2244} {"train_loss": -42.213645935058594, "global_step": 271638, "epoch": 2244} {"train_loss": -39.35647964477539, "global_step": 271639, "epoch": 2244} {"train_loss": -41.91642379760742, "global_step": 271640, "epoch": 2244} {"train_loss": -41.133113861083984, "global_step": 271641, "epoch": 2244} {"train_loss": -41.86590576171875, "global_step": 271642, "epoch": 2244} {"train_loss": -41.96875, "global_step": 271643, "epoch": 2244} {"train_loss": -39.43982261468556, "global_step": 271644, "epoch": 2244, "val_loss": 2601144.25} {"train_loss": -41.65629196166992, "global_step": 271645, "epoch": 2245} {"train_loss": -42.01764678955078, "global_step": 271646, "epoch": 2245} {"train_loss": -42.078948974609375, "global_step": 271647, "epoch": 2245} {"train_loss": -41.508602142333984, "global_step": 271648, "epoch": 2245} {"train_loss": -41.308929443359375, "global_step": 271649, "epoch": 2245} {"train_loss": -42.019161224365234, "global_step": 271650, "epoch": 2245} {"train_loss": -41.63253402709961, "global_step": 271651, "epoch": 2245} {"train_loss": -41.95280838012695, "global_step": 271652, "epoch": 2245} {"train_loss": -41.79054641723633, "global_step": 271653, "epoch": 2245} {"train_loss": -41.9505500793457, "global_step": 271654, "epoch": 2245} {"train_loss": -41.93782043457031, "global_step": 271655, "epoch": 2245} {"train_loss": -41.4331169128418, "global_step": 271656, "epoch": 2245} {"train_loss": -41.423866271972656, "global_step": 271657, "epoch": 2245} {"train_loss": -42.160945892333984, "global_step": 271658, "epoch": 2245} {"train_loss": -42.2683219909668, "global_step": 271659, "epoch": 2245} {"train_loss": -42.207008361816406, "global_step": 271660, "epoch": 2245} {"train_loss": -42.089271545410156, "global_step": 271661, "epoch": 2245} {"train_loss": -42.16154098510742, "global_step": 271662, "epoch": 2245} {"train_loss": -42.39311599731445, "global_step": 271663, "epoch": 2245} {"train_loss": -42.66054916381836, "global_step": 271664, "epoch": 2245} {"train_loss": -42.387630462646484, "global_step": 271665, "epoch": 2245} {"train_loss": -42.57217025756836, "global_step": 271666, "epoch": 2245} {"train_loss": -42.51752853393555, "global_step": 271667, "epoch": 2245} {"train_loss": -42.60786819458008, "global_step": 271668, "epoch": 2245} {"train_loss": -42.44826889038086, "global_step": 271669, "epoch": 2245} {"train_loss": -42.51969528198242, "global_step": 271670, "epoch": 2245} {"train_loss": -40.777503967285156, "global_step": 271671, "epoch": 2245} {"train_loss": -42.22285842895508, "global_step": 271672, "epoch": 2245} {"train_loss": -42.5394172668457, "global_step": 271673, "epoch": 2245} {"train_loss": -42.12467956542969, "global_step": 271674, "epoch": 2245} {"train_loss": -42.41890335083008, "global_step": 271675, "epoch": 2245} {"train_loss": -42.49644088745117, "global_step": 271676, "epoch": 2245} {"train_loss": -42.32722091674805, "global_step": 271677, "epoch": 2245} {"train_loss": -42.1196174621582, "global_step": 271678, "epoch": 2245} {"train_loss": -42.397212982177734, "global_step": 271679, "epoch": 2245} {"train_loss": -42.102088928222656, "global_step": 271680, "epoch": 2245} {"train_loss": -42.7645378112793, "global_step": 271681, "epoch": 2245} {"train_loss": -42.543067932128906, "global_step": 271682, "epoch": 2245} {"train_loss": -42.23154830932617, "global_step": 271683, "epoch": 2245} {"train_loss": -42.396785736083984, "global_step": 271684, "epoch": 2245} {"train_loss": -42.24668502807617, "global_step": 271685, "epoch": 2245} {"train_loss": -42.604671478271484, "global_step": 271686, "epoch": 2245} {"train_loss": -42.5610466003418, "global_step": 271687, "epoch": 2245} {"train_loss": -42.74093246459961, "global_step": 271688, "epoch": 2245} {"train_loss": -42.740413665771484, "global_step": 271689, "epoch": 2245} {"train_loss": -42.67746353149414, "global_step": 271690, "epoch": 2245} {"train_loss": -42.53206253051758, "global_step": 271691, "epoch": 2245} {"train_loss": -41.74654769897461, "global_step": 271692, "epoch": 2245} {"train_loss": -41.58717727661133, "global_step": 271693, "epoch": 2245} {"train_loss": -42.31870651245117, "global_step": 271694, "epoch": 2245} {"train_loss": -41.9677734375, "global_step": 271695, "epoch": 2245} {"train_loss": -41.51842498779297, "global_step": 271696, "epoch": 2245} {"train_loss": -41.237606048583984, "global_step": 271697, "epoch": 2245} {"train_loss": -42.560935974121094, "global_step": 271698, "epoch": 2245} {"train_loss": -42.080535888671875, "global_step": 271699, "epoch": 2245} {"train_loss": -40.97506332397461, "global_step": 271700, "epoch": 2245} {"train_loss": -42.3455810546875, "global_step": 271701, "epoch": 2245} {"train_loss": -42.771400451660156, "global_step": 271702, "epoch": 2245} {"train_loss": -42.79647445678711, "global_step": 271703, "epoch": 2245} {"train_loss": -42.75399398803711, "global_step": 271704, "epoch": 2245} {"train_loss": -42.5936279296875, "global_step": 271705, "epoch": 2245} {"train_loss": -42.85453414916992, "global_step": 271706, "epoch": 2245} {"train_loss": -41.868316650390625, "global_step": 271707, "epoch": 2245} {"train_loss": -42.62796401977539, "global_step": 271708, "epoch": 2245} {"train_loss": -41.81658935546875, "global_step": 271709, "epoch": 2245} {"train_loss": -42.60594940185547, "global_step": 271710, "epoch": 2245} {"train_loss": -42.332454681396484, "global_step": 271711, "epoch": 2245} {"train_loss": -42.560516357421875, "global_step": 271712, "epoch": 2245} {"train_loss": -42.93532943725586, "global_step": 271713, "epoch": 2245} {"train_loss": -42.330169677734375, "global_step": 271714, "epoch": 2245} {"train_loss": -41.968780517578125, "global_step": 271715, "epoch": 2245} {"train_loss": -42.26787567138672, "global_step": 271716, "epoch": 2245} {"train_loss": -41.93016815185547, "global_step": 271717, "epoch": 2245} {"train_loss": -41.900753021240234, "global_step": 271718, "epoch": 2245} {"train_loss": -42.01729965209961, "global_step": 271719, "epoch": 2245} {"train_loss": -42.03452682495117, "global_step": 271720, "epoch": 2245} {"train_loss": -42.14187240600586, "global_step": 271721, "epoch": 2245} {"train_loss": -42.77744674682617, "global_step": 271722, "epoch": 2245} {"train_loss": -42.18206787109375, "global_step": 271723, "epoch": 2245} {"train_loss": -42.57638168334961, "global_step": 271724, "epoch": 2245} {"train_loss": -42.057525634765625, "global_step": 271725, "epoch": 2245} {"train_loss": -41.70518493652344, "global_step": 271726, "epoch": 2245} {"train_loss": -43.370201110839844, "global_step": 271727, "epoch": 2245} {"train_loss": -43.00608444213867, "global_step": 271728, "epoch": 2245} {"train_loss": -42.714412689208984, "global_step": 271729, "epoch": 2245} {"train_loss": -43.057857513427734, "global_step": 271730, "epoch": 2245} {"train_loss": -42.6307258605957, "global_step": 271731, "epoch": 2245} {"train_loss": -42.85264587402344, "global_step": 271732, "epoch": 2245} {"train_loss": -42.090171813964844, "global_step": 271733, "epoch": 2245} {"train_loss": -42.2839469909668, "global_step": 271734, "epoch": 2245} {"train_loss": -42.01289749145508, "global_step": 271735, "epoch": 2245} {"train_loss": -42.66367721557617, "global_step": 271736, "epoch": 2245} {"train_loss": -41.6485710144043, "global_step": 271737, "epoch": 2245} {"train_loss": -41.07769012451172, "global_step": 271738, "epoch": 2245} {"train_loss": -40.19978713989258, "global_step": 271739, "epoch": 2245} {"train_loss": -41.651466369628906, "global_step": 271740, "epoch": 2245} {"train_loss": -41.660865783691406, "global_step": 271741, "epoch": 2245} {"train_loss": -42.356842041015625, "global_step": 271742, "epoch": 2245} {"train_loss": -41.98537063598633, "global_step": 271743, "epoch": 2245} {"train_loss": -40.899147033691406, "global_step": 271744, "epoch": 2245} {"train_loss": -42.34040832519531, "global_step": 271745, "epoch": 2245} {"train_loss": -42.567195892333984, "global_step": 271746, "epoch": 2245} {"train_loss": -42.49947738647461, "global_step": 271747, "epoch": 2245} {"train_loss": -40.645111083984375, "global_step": 271748, "epoch": 2245} {"train_loss": -41.48209762573242, "global_step": 271749, "epoch": 2245} {"train_loss": -41.880977630615234, "global_step": 271750, "epoch": 2245} {"train_loss": -42.05279541015625, "global_step": 271751, "epoch": 2245} {"train_loss": -40.664527893066406, "global_step": 271752, "epoch": 2245} {"train_loss": -40.36128616333008, "global_step": 271753, "epoch": 2245} {"train_loss": -39.9689826965332, "global_step": 271754, "epoch": 2245} {"train_loss": -41.45309066772461, "global_step": 271755, "epoch": 2245} {"train_loss": -42.659759521484375, "global_step": 271756, "epoch": 2245} {"train_loss": -42.03487014770508, "global_step": 271757, "epoch": 2245} {"train_loss": -41.615570068359375, "global_step": 271758, "epoch": 2245} {"train_loss": -40.4532356262207, "global_step": 271759, "epoch": 2245} {"train_loss": -41.38797378540039, "global_step": 271760, "epoch": 2245} {"train_loss": -42.13669967651367, "global_step": 271761, "epoch": 2245} {"train_loss": -40.68098831176758, "global_step": 271762, "epoch": 2245} {"train_loss": -40.89748764038086, "global_step": 271763, "epoch": 2245} {"train_loss": -40.212921142578125, "global_step": 271764, "epoch": 2245} {"train_loss": -42.04260761481671, "global_step": 271765, "epoch": 2245, "val_loss": 2588057.75} {"train_loss": -39.22365188598633, "global_step": 271766, "epoch": 2246} {"train_loss": -42.98435974121094, "global_step": 271767, "epoch": 2246} {"train_loss": -40.640201568603516, "global_step": 271768, "epoch": 2246} {"train_loss": -42.08637237548828, "global_step": 271769, "epoch": 2246} {"train_loss": -42.31697082519531, "global_step": 271770, "epoch": 2246} {"train_loss": -42.23273849487305, "global_step": 271771, "epoch": 2246} {"train_loss": -42.1668701171875, "global_step": 271772, "epoch": 2246} {"train_loss": -42.37668991088867, "global_step": 271773, "epoch": 2246} {"train_loss": -42.904659271240234, "global_step": 271774, "epoch": 2246} {"train_loss": -42.97806930541992, "global_step": 271775, "epoch": 2246} {"train_loss": -42.207275390625, "global_step": 271776, "epoch": 2246} {"train_loss": -42.4283561706543, "global_step": 271777, "epoch": 2246} {"train_loss": -43.0103645324707, "global_step": 271778, "epoch": 2246} {"train_loss": -42.54812240600586, "global_step": 271779, "epoch": 2246} {"train_loss": -41.879127502441406, "global_step": 271780, "epoch": 2246} {"train_loss": -42.58999252319336, "global_step": 271781, "epoch": 2246} {"train_loss": -42.99020004272461, "global_step": 271782, "epoch": 2246} {"train_loss": -42.07170486450195, "global_step": 271783, "epoch": 2246} {"train_loss": -42.243995666503906, "global_step": 271784, "epoch": 2246} {"train_loss": -42.568511962890625, "global_step": 271785, "epoch": 2246} {"train_loss": -42.80236053466797, "global_step": 271786, "epoch": 2246} {"train_loss": -42.18347930908203, "global_step": 271787, "epoch": 2246} {"train_loss": -42.15350341796875, "global_step": 271788, "epoch": 2246} {"train_loss": -42.95861053466797, "global_step": 271789, "epoch": 2246} {"train_loss": -42.09212875366211, "global_step": 271790, "epoch": 2246} {"train_loss": -42.46712875366211, "global_step": 271791, "epoch": 2246} {"train_loss": -42.63814926147461, "global_step": 271792, "epoch": 2246} {"train_loss": -41.72101974487305, "global_step": 271793, "epoch": 2246} {"train_loss": -41.83441925048828, "global_step": 271794, "epoch": 2246} {"train_loss": -42.621395111083984, "global_step": 271795, "epoch": 2246} {"train_loss": -42.07026672363281, "global_step": 271796, "epoch": 2246} {"train_loss": -41.685577392578125, "global_step": 271797, "epoch": 2246} {"train_loss": -42.16242599487305, "global_step": 271798, "epoch": 2246} {"train_loss": -42.003536224365234, "global_step": 271799, "epoch": 2246} {"train_loss": -42.639381408691406, "global_step": 271800, "epoch": 2246} {"train_loss": -41.83098220825195, "global_step": 271801, "epoch": 2246} {"train_loss": -42.3029670715332, "global_step": 271802, "epoch": 2246} {"train_loss": -42.18478012084961, "global_step": 271803, "epoch": 2246} {"train_loss": -42.76795196533203, "global_step": 271804, "epoch": 2246} {"train_loss": -41.721099853515625, "global_step": 271805, "epoch": 2246} {"train_loss": -41.789276123046875, "global_step": 271806, "epoch": 2246} {"train_loss": -40.25041580200195, "global_step": 271807, "epoch": 2246} {"train_loss": -39.75251388549805, "global_step": 271808, "epoch": 2246} {"train_loss": -41.78899002075195, "global_step": 271809, "epoch": 2246} {"train_loss": -42.41654586791992, "global_step": 271810, "epoch": 2246} {"train_loss": -40.06818771362305, "global_step": 271811, "epoch": 2246} {"train_loss": -39.85945129394531, "global_step": 271812, "epoch": 2246} {"train_loss": -42.928035736083984, "global_step": 271813, "epoch": 2246} {"train_loss": -41.98849868774414, "global_step": 271814, "epoch": 2246} {"train_loss": -41.001625061035156, "global_step": 271815, "epoch": 2246} {"train_loss": -42.555477142333984, "global_step": 271816, "epoch": 2246} {"train_loss": -43.45296859741211, "global_step": 271817, "epoch": 2246} {"train_loss": -42.48796463012695, "global_step": 271818, "epoch": 2246} {"train_loss": -43.12144088745117, "global_step": 271819, "epoch": 2246} {"train_loss": -42.586429595947266, "global_step": 271820, "epoch": 2246} {"train_loss": -42.61220169067383, "global_step": 271821, "epoch": 2246} {"train_loss": -42.479469299316406, "global_step": 271822, "epoch": 2246} {"train_loss": -43.06767272949219, "global_step": 271823, "epoch": 2246} {"train_loss": -42.79267120361328, "global_step": 271824, "epoch": 2246} {"train_loss": -42.80448532104492, "global_step": 271825, "epoch": 2246} {"train_loss": -42.86985397338867, "global_step": 271826, "epoch": 2246} {"train_loss": -43.06718063354492, "global_step": 271827, "epoch": 2246} {"train_loss": -42.736541748046875, "global_step": 271828, "epoch": 2246} {"train_loss": -42.66439437866211, "global_step": 271829, "epoch": 2246} {"train_loss": -42.545711517333984, "global_step": 271830, "epoch": 2246} {"train_loss": -41.98972702026367, "global_step": 271831, "epoch": 2246} {"train_loss": -42.4904670715332, "global_step": 271832, "epoch": 2246} {"train_loss": -43.32781982421875, "global_step": 271833, "epoch": 2246} {"train_loss": -42.45552444458008, "global_step": 271834, "epoch": 2246} {"train_loss": -42.9095344543457, "global_step": 271835, "epoch": 2246} {"train_loss": -42.455711364746094, "global_step": 271836, "epoch": 2246} {"train_loss": -41.5938835144043, "global_step": 271837, "epoch": 2246} {"train_loss": -41.65645217895508, "global_step": 271838, "epoch": 2246} {"train_loss": -42.77098846435547, "global_step": 271839, "epoch": 2246} {"train_loss": -43.09975814819336, "global_step": 271840, "epoch": 2246} {"train_loss": -41.100807189941406, "global_step": 271841, "epoch": 2246} {"train_loss": -40.33341598510742, "global_step": 271842, "epoch": 2246} {"train_loss": -40.560420989990234, "global_step": 271843, "epoch": 2246} {"train_loss": -41.28156661987305, "global_step": 271844, "epoch": 2246} {"train_loss": -42.191490173339844, "global_step": 271845, "epoch": 2246} {"train_loss": -42.2060546875, "global_step": 271846, "epoch": 2246} {"train_loss": -41.33753204345703, "global_step": 271847, "epoch": 2246} {"train_loss": -40.118831634521484, "global_step": 271848, "epoch": 2246} {"train_loss": -40.56239700317383, "global_step": 271849, "epoch": 2246} {"train_loss": -41.551551818847656, "global_step": 271850, "epoch": 2246} {"train_loss": -42.58905029296875, "global_step": 271851, "epoch": 2246} {"train_loss": -37.653446197509766, "global_step": 271852, "epoch": 2246} {"train_loss": -33.61912536621094, "global_step": 271853, "epoch": 2246} {"train_loss": -32.54872131347656, "global_step": 271854, "epoch": 2246} {"train_loss": -38.34980392456055, "global_step": 271855, "epoch": 2246} {"train_loss": -41.93827819824219, "global_step": 271856, "epoch": 2246} {"train_loss": -36.25046920776367, "global_step": 271857, "epoch": 2246} {"train_loss": -38.85891342163086, "global_step": 271858, "epoch": 2246} {"train_loss": -42.2774543762207, "global_step": 271859, "epoch": 2246} {"train_loss": -38.54372024536133, "global_step": 271860, "epoch": 2246} {"train_loss": -42.3200798034668, "global_step": 271861, "epoch": 2246} {"train_loss": -39.04481887817383, "global_step": 271862, "epoch": 2246} {"train_loss": -35.670448303222656, "global_step": 271863, "epoch": 2246} {"train_loss": -42.59408187866211, "global_step": 271864, "epoch": 2246} {"train_loss": -38.64387130737305, "global_step": 271865, "epoch": 2246} {"train_loss": -40.91387939453125, "global_step": 271866, "epoch": 2246} {"train_loss": -41.493099212646484, "global_step": 271867, "epoch": 2246} {"train_loss": -40.440185546875, "global_step": 271868, "epoch": 2246} {"train_loss": -42.36197280883789, "global_step": 271869, "epoch": 2246} {"train_loss": -40.66450881958008, "global_step": 271870, "epoch": 2246} {"train_loss": -42.261104583740234, "global_step": 271871, "epoch": 2246} {"train_loss": -41.01899337768555, "global_step": 271872, "epoch": 2246} {"train_loss": -42.2614860534668, "global_step": 271873, "epoch": 2246} {"train_loss": -41.61085891723633, "global_step": 271874, "epoch": 2246} {"train_loss": -42.183631896972656, "global_step": 271875, "epoch": 2246} {"train_loss": -42.27853775024414, "global_step": 271876, "epoch": 2246} {"train_loss": -42.08900451660156, "global_step": 271877, "epoch": 2246} {"train_loss": -42.562355041503906, "global_step": 271878, "epoch": 2246} {"train_loss": -41.4112434387207, "global_step": 271879, "epoch": 2246} {"train_loss": -42.460662841796875, "global_step": 271880, "epoch": 2246} {"train_loss": -41.88115310668945, "global_step": 271881, "epoch": 2246} {"train_loss": -42.49626159667969, "global_step": 271882, "epoch": 2246} {"train_loss": -42.05161666870117, "global_step": 271883, "epoch": 2246} {"train_loss": -42.39426803588867, "global_step": 271884, "epoch": 2246} {"train_loss": -42.82606887817383, "global_step": 271885, "epoch": 2246} {"train_loss": -41.65280356288942, "global_step": 271886, "epoch": 2246, "val_loss": 2617778.25} {"train_loss": -42.701576232910156, "global_step": 271887, "epoch": 2247} {"train_loss": -42.772823333740234, "global_step": 271888, "epoch": 2247} {"train_loss": -42.46560287475586, "global_step": 271889, "epoch": 2247} {"train_loss": -42.3315544128418, "global_step": 271890, "epoch": 2247} {"train_loss": -43.051246643066406, "global_step": 271891, "epoch": 2247} {"train_loss": -42.838314056396484, "global_step": 271892, "epoch": 2247} {"train_loss": -43.10163497924805, "global_step": 271893, "epoch": 2247} {"train_loss": -43.41303253173828, "global_step": 271894, "epoch": 2247} {"train_loss": -43.10483932495117, "global_step": 271895, "epoch": 2247} {"train_loss": -43.390811920166016, "global_step": 271896, "epoch": 2247} {"train_loss": -42.98504638671875, "global_step": 271897, "epoch": 2247} {"train_loss": -42.957427978515625, "global_step": 271898, "epoch": 2247} {"train_loss": -43.49178695678711, "global_step": 271899, "epoch": 2247} {"train_loss": -43.633514404296875, "global_step": 271900, "epoch": 2247} {"train_loss": -43.219078063964844, "global_step": 271901, "epoch": 2247} {"train_loss": -43.36701202392578, "global_step": 271902, "epoch": 2247} {"train_loss": -43.64951705932617, "global_step": 271903, "epoch": 2247} {"train_loss": -43.759761810302734, "global_step": 271904, "epoch": 2247} {"train_loss": -43.812740325927734, "global_step": 271905, "epoch": 2247} {"train_loss": -43.39554977416992, "global_step": 271906, "epoch": 2247} {"train_loss": -43.56523895263672, "global_step": 271907, "epoch": 2247} {"train_loss": -43.83099365234375, "global_step": 271908, "epoch": 2247} {"train_loss": -43.6782341003418, "global_step": 271909, "epoch": 2247} {"train_loss": -43.77796173095703, "global_step": 271910, "epoch": 2247} {"train_loss": -43.711204528808594, "global_step": 271911, "epoch": 2247} {"train_loss": -43.74595260620117, "global_step": 271912, "epoch": 2247} {"train_loss": -43.82365036010742, "global_step": 271913, "epoch": 2247} {"train_loss": -43.63835906982422, "global_step": 271914, "epoch": 2247} {"train_loss": -43.80866622924805, "global_step": 271915, "epoch": 2247} {"train_loss": -44.12419891357422, "global_step": 271916, "epoch": 2247} {"train_loss": -43.52671432495117, "global_step": 271917, "epoch": 2247} {"train_loss": -43.3728141784668, "global_step": 271918, "epoch": 2247} {"train_loss": -43.20805740356445, "global_step": 271919, "epoch": 2247} {"train_loss": -43.47029495239258, "global_step": 271920, "epoch": 2247} {"train_loss": -43.326011657714844, "global_step": 271921, "epoch": 2247} {"train_loss": -43.00905990600586, "global_step": 271922, "epoch": 2247} {"train_loss": -43.716636657714844, "global_step": 271923, "epoch": 2247} {"train_loss": -42.44546127319336, "global_step": 271924, "epoch": 2247} {"train_loss": -41.78560256958008, "global_step": 271925, "epoch": 2247} {"train_loss": -41.431312561035156, "global_step": 271926, "epoch": 2247} {"train_loss": -41.898902893066406, "global_step": 271927, "epoch": 2247} {"train_loss": -41.0610466003418, "global_step": 271928, "epoch": 2247} {"train_loss": -40.57917404174805, "global_step": 271929, "epoch": 2247} {"train_loss": -42.57556915283203, "global_step": 271930, "epoch": 2247} {"train_loss": -42.72208786010742, "global_step": 271931, "epoch": 2247} {"train_loss": -42.48674392700195, "global_step": 271932, "epoch": 2247} {"train_loss": -42.57295608520508, "global_step": 271933, "epoch": 2247} {"train_loss": -42.85882568359375, "global_step": 271934, "epoch": 2247} {"train_loss": -43.071746826171875, "global_step": 271935, "epoch": 2247} {"train_loss": -41.90674591064453, "global_step": 271936, "epoch": 2247} {"train_loss": -42.35689926147461, "global_step": 271937, "epoch": 2247} {"train_loss": -41.45588302612305, "global_step": 271938, "epoch": 2247} {"train_loss": -42.40651321411133, "global_step": 271939, "epoch": 2247} {"train_loss": -42.88571548461914, "global_step": 271940, "epoch": 2247} {"train_loss": -42.96169662475586, "global_step": 271941, "epoch": 2247} {"train_loss": -41.989498138427734, "global_step": 271942, "epoch": 2247} {"train_loss": -42.74378204345703, "global_step": 271943, "epoch": 2247} {"train_loss": -41.51308822631836, "global_step": 271944, "epoch": 2247} {"train_loss": -42.35624694824219, "global_step": 271945, "epoch": 2247} {"train_loss": -42.2770881652832, "global_step": 271946, "epoch": 2247} {"train_loss": -40.8136100769043, "global_step": 271947, "epoch": 2247} {"train_loss": -41.97947311401367, "global_step": 271948, "epoch": 2247} {"train_loss": -40.92658615112305, "global_step": 271949, "epoch": 2247} {"train_loss": -42.440303802490234, "global_step": 271950, "epoch": 2247} {"train_loss": -42.47347640991211, "global_step": 271951, "epoch": 2247} {"train_loss": -41.73933029174805, "global_step": 271952, "epoch": 2247} {"train_loss": -42.49978256225586, "global_step": 271953, "epoch": 2247} {"train_loss": -42.7197151184082, "global_step": 271954, "epoch": 2247} {"train_loss": -40.842018127441406, "global_step": 271955, "epoch": 2247} {"train_loss": -42.98432540893555, "global_step": 271956, "epoch": 2247} {"train_loss": -42.124961853027344, "global_step": 271957, "epoch": 2247} {"train_loss": -41.213680267333984, "global_step": 271958, "epoch": 2247} {"train_loss": -41.41078567504883, "global_step": 271959, "epoch": 2247} {"train_loss": -42.904293060302734, "global_step": 271960, "epoch": 2247} {"train_loss": -42.4707145690918, "global_step": 271961, "epoch": 2247} {"train_loss": -42.53377914428711, "global_step": 271962, "epoch": 2247} {"train_loss": -42.893287658691406, "global_step": 271963, "epoch": 2247} {"train_loss": -42.50461959838867, "global_step": 271964, "epoch": 2247} {"train_loss": -42.90424346923828, "global_step": 271965, "epoch": 2247} {"train_loss": -42.4858512878418, "global_step": 271966, "epoch": 2247} {"train_loss": -42.55543899536133, "global_step": 271967, "epoch": 2247} {"train_loss": -43.191219329833984, "global_step": 271968, "epoch": 2247} {"train_loss": -41.84505081176758, "global_step": 271969, "epoch": 2247} {"train_loss": -43.31498336791992, "global_step": 271970, "epoch": 2247} {"train_loss": -43.53300857543945, "global_step": 271971, "epoch": 2247} {"train_loss": -42.93208694458008, "global_step": 271972, "epoch": 2247} {"train_loss": -42.92861557006836, "global_step": 271973, "epoch": 2247} {"train_loss": -42.365718841552734, "global_step": 271974, "epoch": 2247} {"train_loss": -41.738067626953125, "global_step": 271975, "epoch": 2247} {"train_loss": -43.519073486328125, "global_step": 271976, "epoch": 2247} {"train_loss": -42.993507385253906, "global_step": 271977, "epoch": 2247} {"train_loss": -43.403076171875, "global_step": 271978, "epoch": 2247} {"train_loss": -42.962066650390625, "global_step": 271979, "epoch": 2247} {"train_loss": -42.82497024536133, "global_step": 271980, "epoch": 2247} {"train_loss": -41.3851318359375, "global_step": 271981, "epoch": 2247} {"train_loss": -42.3249626159668, "global_step": 271982, "epoch": 2247} {"train_loss": -42.88444137573242, "global_step": 271983, "epoch": 2247} {"train_loss": -42.907752990722656, "global_step": 271984, "epoch": 2247} {"train_loss": -42.9825325012207, "global_step": 271985, "epoch": 2247} {"train_loss": -43.15894317626953, "global_step": 271986, "epoch": 2247} {"train_loss": -41.78887939453125, "global_step": 271987, "epoch": 2247} {"train_loss": -41.905948638916016, "global_step": 271988, "epoch": 2247} {"train_loss": -43.2285270690918, "global_step": 271989, "epoch": 2247} {"train_loss": -42.6074104309082, "global_step": 271990, "epoch": 2247} {"train_loss": -39.288726806640625, "global_step": 271991, "epoch": 2247} {"train_loss": -43.0061149597168, "global_step": 271992, "epoch": 2247} {"train_loss": -42.74415969848633, "global_step": 271993, "epoch": 2247} {"train_loss": -42.73727798461914, "global_step": 271994, "epoch": 2247} {"train_loss": -42.49770736694336, "global_step": 271995, "epoch": 2247} {"train_loss": -39.8101806640625, "global_step": 271996, "epoch": 2247} {"train_loss": -40.812904357910156, "global_step": 271997, "epoch": 2247} {"train_loss": -38.52888870239258, "global_step": 271998, "epoch": 2247} {"train_loss": -39.04671096801758, "global_step": 271999, "epoch": 2247} {"train_loss": -41.12027359008789, "global_step": 272000, "epoch": 2247} {"train_loss": -41.19214630126953, "global_step": 272001, "epoch": 2247} {"train_loss": -30.964630126953125, "global_step": 272002, "epoch": 2247} {"train_loss": -35.37447738647461, "global_step": 272003, "epoch": 2247} {"train_loss": -40.91509246826172, "global_step": 272004, "epoch": 2247} {"train_loss": -35.93170928955078, "global_step": 272005, "epoch": 2247} {"train_loss": -28.890094757080078, "global_step": 272006, "epoch": 2247} {"train_loss": -42.18612803309417, "global_step": 272007, "epoch": 2247, "val_loss": 2956606.25} {"train_loss": -37.72587203979492, "global_step": 272008, "epoch": 2248} {"train_loss": -40.11114501953125, "global_step": 272009, "epoch": 2248} {"train_loss": -39.974365234375, "global_step": 272010, "epoch": 2248} {"train_loss": -35.43740463256836, "global_step": 272011, "epoch": 2248} {"train_loss": -29.302677154541016, "global_step": 272012, "epoch": 2248} {"train_loss": -38.264923095703125, "global_step": 272013, "epoch": 2248} {"train_loss": -39.65424346923828, "global_step": 272014, "epoch": 2248} {"train_loss": -40.527767181396484, "global_step": 272015, "epoch": 2248} {"train_loss": -40.17582321166992, "global_step": 272016, "epoch": 2248} {"train_loss": -36.79176330566406, "global_step": 272017, "epoch": 2248} {"train_loss": -37.0375862121582, "global_step": 272018, "epoch": 2248} {"train_loss": -40.73348617553711, "global_step": 272019, "epoch": 2248} {"train_loss": -39.60032272338867, "global_step": 272020, "epoch": 2248} {"train_loss": -33.48991012573242, "global_step": 272021, "epoch": 2248} {"train_loss": -38.31852340698242, "global_step": 272022, "epoch": 2248} {"train_loss": -41.017147064208984, "global_step": 272023, "epoch": 2248} {"train_loss": -40.07526397705078, "global_step": 272024, "epoch": 2248} {"train_loss": -40.33300018310547, "global_step": 272025, "epoch": 2248} {"train_loss": -40.300228118896484, "global_step": 272026, "epoch": 2248} {"train_loss": -40.355587005615234, "global_step": 272027, "epoch": 2248} {"train_loss": -40.05667495727539, "global_step": 272028, "epoch": 2248} {"train_loss": -39.8122444152832, "global_step": 272029, "epoch": 2248} {"train_loss": -40.66202163696289, "global_step": 272030, "epoch": 2248} {"train_loss": -36.09865188598633, "global_step": 272031, "epoch": 2248} {"train_loss": -38.84845733642578, "global_step": 272032, "epoch": 2248} {"train_loss": -39.517765045166016, "global_step": 272033, "epoch": 2248} {"train_loss": -36.7014274597168, "global_step": 272034, "epoch": 2248} {"train_loss": -41.4390754699707, "global_step": 272035, "epoch": 2248} {"train_loss": -39.5405387878418, "global_step": 272036, "epoch": 2248} {"train_loss": -40.738914489746094, "global_step": 272037, "epoch": 2248} {"train_loss": -41.95476150512695, "global_step": 272038, "epoch": 2248} {"train_loss": -40.9144401550293, "global_step": 272039, "epoch": 2248} {"train_loss": -41.35649108886719, "global_step": 272040, "epoch": 2248} {"train_loss": -40.55559158325195, "global_step": 272041, "epoch": 2248} {"train_loss": -41.32966613769531, "global_step": 272042, "epoch": 2248} {"train_loss": -40.76914596557617, "global_step": 272043, "epoch": 2248} {"train_loss": -41.553009033203125, "global_step": 272044, "epoch": 2248} {"train_loss": -41.5893440246582, "global_step": 272045, "epoch": 2248} {"train_loss": -39.84663009643555, "global_step": 272046, "epoch": 2248} {"train_loss": -39.73820114135742, "global_step": 272047, "epoch": 2248} {"train_loss": -42.23600387573242, "global_step": 272048, "epoch": 2248} {"train_loss": -41.88485336303711, "global_step": 272049, "epoch": 2248} {"train_loss": -41.627723693847656, "global_step": 272050, "epoch": 2248} {"train_loss": -41.51355743408203, "global_step": 272051, "epoch": 2248} {"train_loss": -41.80733871459961, "global_step": 272052, "epoch": 2248} {"train_loss": -41.2550048828125, "global_step": 272053, "epoch": 2248} {"train_loss": -41.67269515991211, "global_step": 272054, "epoch": 2248} {"train_loss": -41.09596252441406, "global_step": 272055, "epoch": 2248} {"train_loss": -41.568599700927734, "global_step": 272056, "epoch": 2248} {"train_loss": -42.068634033203125, "global_step": 272057, "epoch": 2248} {"train_loss": -41.49065017700195, "global_step": 272058, "epoch": 2248} {"train_loss": -41.60382080078125, "global_step": 272059, "epoch": 2248} {"train_loss": -42.331600189208984, "global_step": 272060, "epoch": 2248} {"train_loss": -41.99129867553711, "global_step": 272061, "epoch": 2248} {"train_loss": -42.54426193237305, "global_step": 272062, "epoch": 2248} {"train_loss": -42.2591552734375, "global_step": 272063, "epoch": 2248} {"train_loss": -42.36134719848633, "global_step": 272064, "epoch": 2248} {"train_loss": -42.30034637451172, "global_step": 272065, "epoch": 2248} {"train_loss": -41.8134765625, "global_step": 272066, "epoch": 2248} {"train_loss": -42.013641357421875, "global_step": 272067, "epoch": 2248} {"train_loss": -42.224430084228516, "global_step": 272068, "epoch": 2248} {"train_loss": -42.488136291503906, "global_step": 272069, "epoch": 2248} {"train_loss": -41.84708786010742, "global_step": 272070, "epoch": 2248} {"train_loss": -41.29315948486328, "global_step": 272071, "epoch": 2248} {"train_loss": -42.08015441894531, "global_step": 272072, "epoch": 2248} {"train_loss": -42.2513542175293, "global_step": 272073, "epoch": 2248} {"train_loss": -42.74409103393555, "global_step": 272074, "epoch": 2248} {"train_loss": -42.49386978149414, "global_step": 272075, "epoch": 2248} {"train_loss": -42.221923828125, "global_step": 272076, "epoch": 2248} {"train_loss": -41.70344924926758, "global_step": 272077, "epoch": 2248} {"train_loss": -42.678138732910156, "global_step": 272078, "epoch": 2248} {"train_loss": -42.150569915771484, "global_step": 272079, "epoch": 2248} {"train_loss": -42.51682662963867, "global_step": 272080, "epoch": 2248} {"train_loss": -41.3803596496582, "global_step": 272081, "epoch": 2248} {"train_loss": -41.53152084350586, "global_step": 272082, "epoch": 2248} {"train_loss": -42.5374641418457, "global_step": 272083, "epoch": 2248} {"train_loss": -42.706417083740234, "global_step": 272084, "epoch": 2248} {"train_loss": -42.99801254272461, "global_step": 272085, "epoch": 2248} {"train_loss": -42.596336364746094, "global_step": 272086, "epoch": 2248} {"train_loss": -42.85078430175781, "global_step": 272087, "epoch": 2248} {"train_loss": -42.596778869628906, "global_step": 272088, "epoch": 2248} {"train_loss": -43.04966354370117, "global_step": 272089, "epoch": 2248} {"train_loss": -42.38542175292969, "global_step": 272090, "epoch": 2248} {"train_loss": -42.621124267578125, "global_step": 272091, "epoch": 2248} {"train_loss": -42.98184585571289, "global_step": 272092, "epoch": 2248} {"train_loss": -41.59943389892578, "global_step": 272093, "epoch": 2248} {"train_loss": -42.25944137573242, "global_step": 272094, "epoch": 2248} {"train_loss": -41.86621856689453, "global_step": 272095, "epoch": 2248} {"train_loss": -43.01385498046875, "global_step": 272096, "epoch": 2248} {"train_loss": -42.67527389526367, "global_step": 272097, "epoch": 2248} {"train_loss": -42.7039794921875, "global_step": 272098, "epoch": 2248} {"train_loss": -42.91188430786133, "global_step": 272099, "epoch": 2248} {"train_loss": -41.74464416503906, "global_step": 272100, "epoch": 2248} {"train_loss": -42.92857360839844, "global_step": 272101, "epoch": 2248} {"train_loss": -43.43649673461914, "global_step": 272102, "epoch": 2248} {"train_loss": -43.01088333129883, "global_step": 272103, "epoch": 2248} {"train_loss": -42.660438537597656, "global_step": 272104, "epoch": 2248} {"train_loss": -42.207576751708984, "global_step": 272105, "epoch": 2248} {"train_loss": -42.46168899536133, "global_step": 272106, "epoch": 2248} {"train_loss": -42.92523193359375, "global_step": 272107, "epoch": 2248} {"train_loss": -42.82606887817383, "global_step": 272108, "epoch": 2248} {"train_loss": -43.28537368774414, "global_step": 272109, "epoch": 2248} {"train_loss": -43.24646759033203, "global_step": 272110, "epoch": 2248} {"train_loss": -41.6876106262207, "global_step": 272111, "epoch": 2248} {"train_loss": -42.46548080444336, "global_step": 272112, "epoch": 2248} {"train_loss": -43.001312255859375, "global_step": 272113, "epoch": 2248} {"train_loss": -42.084800720214844, "global_step": 272114, "epoch": 2248} {"train_loss": -41.592891693115234, "global_step": 272115, "epoch": 2248} {"train_loss": -43.498592376708984, "global_step": 272116, "epoch": 2248} {"train_loss": -43.34558868408203, "global_step": 272117, "epoch": 2248} {"train_loss": -43.26980209350586, "global_step": 272118, "epoch": 2248} {"train_loss": -43.571990966796875, "global_step": 272119, "epoch": 2248} {"train_loss": -43.1347541809082, "global_step": 272120, "epoch": 2248} {"train_loss": -43.28606033325195, "global_step": 272121, "epoch": 2248} {"train_loss": -43.45895004272461, "global_step": 272122, "epoch": 2248} {"train_loss": -42.66313934326172, "global_step": 272123, "epoch": 2248} {"train_loss": -42.934505462646484, "global_step": 272124, "epoch": 2248} {"train_loss": -42.20283126831055, "global_step": 272125, "epoch": 2248} {"train_loss": -42.193294525146484, "global_step": 272126, "epoch": 2248} {"train_loss": -43.13873291015625, "global_step": 272127, "epoch": 2248} {"train_loss": -41.37997780161456, "global_step": 272128, "epoch": 2248, "val_loss": 2756774.75} {"train_loss": -43.120113372802734, "global_step": 272129, "epoch": 2249} {"train_loss": -43.387596130371094, "global_step": 272130, "epoch": 2249} {"train_loss": -42.567874908447266, "global_step": 272131, "epoch": 2249} {"train_loss": -41.63669204711914, "global_step": 272132, "epoch": 2249} {"train_loss": -43.68916320800781, "global_step": 272133, "epoch": 2249} {"train_loss": -43.519981384277344, "global_step": 272134, "epoch": 2249} {"train_loss": -42.975704193115234, "global_step": 272135, "epoch": 2249} {"train_loss": -43.102691650390625, "global_step": 272136, "epoch": 2249} {"train_loss": -43.078590393066406, "global_step": 272137, "epoch": 2249} {"train_loss": -43.055747985839844, "global_step": 272138, "epoch": 2249} {"train_loss": -42.94173812866211, "global_step": 272139, "epoch": 2249} {"train_loss": -42.37917709350586, "global_step": 272140, "epoch": 2249} {"train_loss": -42.043067932128906, "global_step": 272141, "epoch": 2249} {"train_loss": -43.1973991394043, "global_step": 272142, "epoch": 2249} {"train_loss": -43.235816955566406, "global_step": 272143, "epoch": 2249} {"train_loss": -42.61884689331055, "global_step": 272144, "epoch": 2249} {"train_loss": -42.41939926147461, "global_step": 272145, "epoch": 2249} {"train_loss": -42.99728012084961, "global_step": 272146, "epoch": 2249} {"train_loss": -43.10275650024414, "global_step": 272147, "epoch": 2249} {"train_loss": -42.83250427246094, "global_step": 272148, "epoch": 2249} {"train_loss": -42.5092658996582, "global_step": 272149, "epoch": 2249} {"train_loss": -43.104549407958984, "global_step": 272150, "epoch": 2249} {"train_loss": -43.1922721862793, "global_step": 272151, "epoch": 2249} {"train_loss": -43.39854049682617, "global_step": 272152, "epoch": 2249} {"train_loss": -42.7591438293457, "global_step": 272153, "epoch": 2249} {"train_loss": -43.20546340942383, "global_step": 272154, "epoch": 2249} {"train_loss": -43.287322998046875, "global_step": 272155, "epoch": 2249} {"train_loss": -43.2752685546875, "global_step": 272156, "epoch": 2249} {"train_loss": -40.53493118286133, "global_step": 272157, "epoch": 2249} {"train_loss": -43.28802490234375, "global_step": 272158, "epoch": 2249} {"train_loss": -42.64423751831055, "global_step": 272159, "epoch": 2249} {"train_loss": -42.910743713378906, "global_step": 272160, "epoch": 2249} {"train_loss": -42.76897430419922, "global_step": 272161, "epoch": 2249} {"train_loss": -41.68339920043945, "global_step": 272162, "epoch": 2249} {"train_loss": -37.83158493041992, "global_step": 272163, "epoch": 2249} {"train_loss": -38.90861129760742, "global_step": 272164, "epoch": 2249} {"train_loss": -39.4477424621582, "global_step": 272165, "epoch": 2249} {"train_loss": -42.02936553955078, "global_step": 272166, "epoch": 2249} {"train_loss": -42.59184646606445, "global_step": 272167, "epoch": 2249} {"train_loss": -40.22529602050781, "global_step": 272168, "epoch": 2249} {"train_loss": -39.85919952392578, "global_step": 272169, "epoch": 2249} {"train_loss": -40.30366134643555, "global_step": 272170, "epoch": 2249} {"train_loss": -40.94721603393555, "global_step": 272171, "epoch": 2249} {"train_loss": -37.76284408569336, "global_step": 272172, "epoch": 2249} {"train_loss": -39.332557678222656, "global_step": 272173, "epoch": 2249} {"train_loss": -41.493404388427734, "global_step": 272174, "epoch": 2249} {"train_loss": -40.3268928527832, "global_step": 272175, "epoch": 2249} {"train_loss": -41.893333435058594, "global_step": 272176, "epoch": 2249} {"train_loss": -41.54104995727539, "global_step": 272177, "epoch": 2249} {"train_loss": -38.09095764160156, "global_step": 272178, "epoch": 2249} {"train_loss": -41.316654205322266, "global_step": 272179, "epoch": 2249} {"train_loss": -39.78076171875, "global_step": 272180, "epoch": 2249} {"train_loss": -39.09943389892578, "global_step": 272181, "epoch": 2249} {"train_loss": -41.4778938293457, "global_step": 272182, "epoch": 2249} {"train_loss": -40.20840072631836, "global_step": 272183, "epoch": 2249} {"train_loss": -41.18032455444336, "global_step": 272184, "epoch": 2249} {"train_loss": -40.46355056762695, "global_step": 272185, "epoch": 2249} {"train_loss": -40.54179000854492, "global_step": 272186, "epoch": 2249} {"train_loss": -41.71633529663086, "global_step": 272187, "epoch": 2249} {"train_loss": -40.60132598876953, "global_step": 272188, "epoch": 2249} {"train_loss": -42.297611236572266, "global_step": 272189, "epoch": 2249} {"train_loss": -40.825965881347656, "global_step": 272190, "epoch": 2249} {"train_loss": -42.420860290527344, "global_step": 272191, "epoch": 2249} {"train_loss": -41.63886642456055, "global_step": 272192, "epoch": 2249} {"train_loss": -41.60970687866211, "global_step": 272193, "epoch": 2249} {"train_loss": -39.76118469238281, "global_step": 272194, "epoch": 2249} {"train_loss": -41.85852813720703, "global_step": 272195, "epoch": 2249} {"train_loss": -41.74236297607422, "global_step": 272196, "epoch": 2249} {"train_loss": -41.93135452270508, "global_step": 272197, "epoch": 2249} {"train_loss": -41.58257293701172, "global_step": 272198, "epoch": 2249} {"train_loss": -42.84186935424805, "global_step": 272199, "epoch": 2249} {"train_loss": -42.40338134765625, "global_step": 272200, "epoch": 2249} {"train_loss": -42.725826263427734, "global_step": 272201, "epoch": 2249} {"train_loss": -42.26328659057617, "global_step": 272202, "epoch": 2249} {"train_loss": -42.32634353637695, "global_step": 272203, "epoch": 2249} {"train_loss": -42.13275146484375, "global_step": 272204, "epoch": 2249} {"train_loss": -42.88782501220703, "global_step": 272205, "epoch": 2249} {"train_loss": -42.81410217285156, "global_step": 272206, "epoch": 2249} {"train_loss": -42.26771545410156, "global_step": 272207, "epoch": 2249} {"train_loss": -41.75517272949219, "global_step": 272208, "epoch": 2249} {"train_loss": -43.016815185546875, "global_step": 272209, "epoch": 2249} {"train_loss": -42.42416763305664, "global_step": 272210, "epoch": 2249} {"train_loss": -42.90540313720703, "global_step": 272211, "epoch": 2249} {"train_loss": -42.90189743041992, "global_step": 272212, "epoch": 2249} {"train_loss": -42.58408737182617, "global_step": 272213, "epoch": 2249} {"train_loss": -42.950191497802734, "global_step": 272214, "epoch": 2249} {"train_loss": -43.03620529174805, "global_step": 272215, "epoch": 2249} {"train_loss": -43.12696075439453, "global_step": 272216, "epoch": 2249} {"train_loss": -42.99634552001953, "global_step": 272217, "epoch": 2249} {"train_loss": -42.80091857910156, "global_step": 272218, "epoch": 2249} {"train_loss": -42.3993034362793, "global_step": 272219, "epoch": 2249} {"train_loss": -42.50334548950195, "global_step": 272220, "epoch": 2249} {"train_loss": -42.67123031616211, "global_step": 272221, "epoch": 2249} {"train_loss": -42.77170181274414, "global_step": 272222, "epoch": 2249} {"train_loss": -42.7998046875, "global_step": 272223, "epoch": 2249} {"train_loss": -41.07866287231445, "global_step": 272224, "epoch": 2249} {"train_loss": -42.92795944213867, "global_step": 272225, "epoch": 2249} {"train_loss": -43.13616180419922, "global_step": 272226, "epoch": 2249} {"train_loss": -42.254180908203125, "global_step": 272227, "epoch": 2249} {"train_loss": -42.57404708862305, "global_step": 272228, "epoch": 2249} {"train_loss": -43.17514419555664, "global_step": 272229, "epoch": 2249} {"train_loss": -42.25241470336914, "global_step": 272230, "epoch": 2249} {"train_loss": -39.65552520751953, "global_step": 272231, "epoch": 2249} {"train_loss": -42.1693229675293, "global_step": 272232, "epoch": 2249} {"train_loss": -42.801673889160156, "global_step": 272233, "epoch": 2249} {"train_loss": -42.3199577331543, "global_step": 272234, "epoch": 2249} {"train_loss": -40.33883285522461, "global_step": 272235, "epoch": 2249} {"train_loss": -43.24933624267578, "global_step": 272236, "epoch": 2249} {"train_loss": -43.485504150390625, "global_step": 272237, "epoch": 2249} {"train_loss": -42.86513900756836, "global_step": 272238, "epoch": 2249} {"train_loss": -43.14140701293945, "global_step": 272239, "epoch": 2249} {"train_loss": -43.44366455078125, "global_step": 272240, "epoch": 2249} {"train_loss": -43.208065032958984, "global_step": 272241, "epoch": 2249} {"train_loss": -40.96797180175781, "global_step": 272242, "epoch": 2249} {"train_loss": -43.0903434753418, "global_step": 272243, "epoch": 2249} {"train_loss": -42.894126892089844, "global_step": 272244, "epoch": 2249} {"train_loss": -41.50272750854492, "global_step": 272245, "epoch": 2249} {"train_loss": -41.93696212768555, "global_step": 272246, "epoch": 2249} {"train_loss": -42.40348434448242, "global_step": 272247, "epoch": 2249} {"train_loss": -43.45249557495117, "global_step": 272248, "epoch": 2249} {"train_loss": -42.07177945602039, "global_step": 272249, "epoch": 2249, "val_loss": 2671344.0} {"train_loss": -41.88494110107422, "global_step": 272250, "epoch": 2250} {"train_loss": -42.98529052734375, "global_step": 272251, "epoch": 2250} {"train_loss": -42.90060043334961, "global_step": 272252, "epoch": 2250} {"train_loss": -42.96168899536133, "global_step": 272253, "epoch": 2250} {"train_loss": -41.9815788269043, "global_step": 272254, "epoch": 2250} {"train_loss": -43.109920501708984, "global_step": 272255, "epoch": 2250} {"train_loss": -42.92705535888672, "global_step": 272256, "epoch": 2250} {"train_loss": -42.56496047973633, "global_step": 272257, "epoch": 2250} {"train_loss": -43.38868713378906, "global_step": 272258, "epoch": 2250} {"train_loss": -43.0245246887207, "global_step": 272259, "epoch": 2250} {"train_loss": -42.53596878051758, "global_step": 272260, "epoch": 2250} {"train_loss": -43.65987014770508, "global_step": 272261, "epoch": 2250} {"train_loss": -43.58297348022461, "global_step": 272262, "epoch": 2250} {"train_loss": -43.32462692260742, "global_step": 272263, "epoch": 2250} {"train_loss": -43.2387809753418, "global_step": 272264, "epoch": 2250} {"train_loss": -43.101295471191406, "global_step": 272265, "epoch": 2250} {"train_loss": -43.72754669189453, "global_step": 272266, "epoch": 2250} {"train_loss": -42.87043380737305, "global_step": 272267, "epoch": 2250} {"train_loss": -42.34540557861328, "global_step": 272268, "epoch": 2250} {"train_loss": -43.5528564453125, "global_step": 272269, "epoch": 2250} {"train_loss": -42.739620208740234, "global_step": 272270, "epoch": 2250} {"train_loss": -42.586605072021484, "global_step": 272271, "epoch": 2250} {"train_loss": -43.37001419067383, "global_step": 272272, "epoch": 2250} {"train_loss": -41.8498649597168, "global_step": 272273, "epoch": 2250} {"train_loss": -42.161705017089844, "global_step": 272274, "epoch": 2250} {"train_loss": -43.16680145263672, "global_step": 272275, "epoch": 2250} {"train_loss": -43.39411163330078, "global_step": 272276, "epoch": 2250} {"train_loss": -42.38595962524414, "global_step": 272277, "epoch": 2250} {"train_loss": -42.21079635620117, "global_step": 272278, "epoch": 2250} {"train_loss": -41.43620681762695, "global_step": 272279, "epoch": 2250} {"train_loss": -42.0258903503418, "global_step": 272280, "epoch": 2250} {"train_loss": -42.551631927490234, "global_step": 272281, "epoch": 2250} {"train_loss": -42.178871154785156, "global_step": 272282, "epoch": 2250} {"train_loss": -41.3873405456543, "global_step": 272283, "epoch": 2250} {"train_loss": -42.15147018432617, "global_step": 272284, "epoch": 2250} {"train_loss": -40.94206619262695, "global_step": 272285, "epoch": 2250} {"train_loss": -42.165687561035156, "global_step": 272286, "epoch": 2250} {"train_loss": -41.84360885620117, "global_step": 272287, "epoch": 2250} {"train_loss": -41.78493118286133, "global_step": 272288, "epoch": 2250} {"train_loss": -41.4288330078125, "global_step": 272289, "epoch": 2250} {"train_loss": -42.17036819458008, "global_step": 272290, "epoch": 2250} {"train_loss": -41.5892333984375, "global_step": 272291, "epoch": 2250} {"train_loss": -41.91265869140625, "global_step": 272292, "epoch": 2250} {"train_loss": -40.956722259521484, "global_step": 272293, "epoch": 2250} {"train_loss": -42.720699310302734, "global_step": 272294, "epoch": 2250} {"train_loss": -41.35938262939453, "global_step": 272295, "epoch": 2250} {"train_loss": -42.203033447265625, "global_step": 272296, "epoch": 2250} {"train_loss": -42.20351028442383, "global_step": 272297, "epoch": 2250} {"train_loss": -42.578914642333984, "global_step": 272298, "epoch": 2250} {"train_loss": -39.866004943847656, "global_step": 272299, "epoch": 2250} {"train_loss": -40.168609619140625, "global_step": 272300, "epoch": 2250} {"train_loss": -41.824893951416016, "global_step": 272301, "epoch": 2250} {"train_loss": -41.69692611694336, "global_step": 272302, "epoch": 2250} {"train_loss": -40.97401809692383, "global_step": 272303, "epoch": 2250} {"train_loss": -41.41421127319336, "global_step": 272304, "epoch": 2250} {"train_loss": -42.81064987182617, "global_step": 272305, "epoch": 2250} {"train_loss": -41.31422805786133, "global_step": 272306, "epoch": 2250} {"train_loss": -41.765380859375, "global_step": 272307, "epoch": 2250} {"train_loss": -41.90475082397461, "global_step": 272308, "epoch": 2250} {"train_loss": -42.262603759765625, "global_step": 272309, "epoch": 2250} {"train_loss": -40.95637893676758, "global_step": 272310, "epoch": 2250} {"train_loss": -43.13591766357422, "global_step": 272311, "epoch": 2250} {"train_loss": -41.90428924560547, "global_step": 272312, "epoch": 2250} {"train_loss": -42.703460693359375, "global_step": 272313, "epoch": 2250} {"train_loss": -42.171424865722656, "global_step": 272314, "epoch": 2250} {"train_loss": -42.01640701293945, "global_step": 272315, "epoch": 2250} {"train_loss": -43.01686477661133, "global_step": 272316, "epoch": 2250} {"train_loss": -42.664981842041016, "global_step": 272317, "epoch": 2250} {"train_loss": -42.42770767211914, "global_step": 272318, "epoch": 2250} {"train_loss": -42.332176208496094, "global_step": 272319, "epoch": 2250} {"train_loss": -42.36713790893555, "global_step": 272320, "epoch": 2250} {"train_loss": -42.41440963745117, "global_step": 272321, "epoch": 2250} {"train_loss": -42.21596145629883, "global_step": 272322, "epoch": 2250} {"train_loss": -43.1419677734375, "global_step": 272323, "epoch": 2250} {"train_loss": -42.56128692626953, "global_step": 272324, "epoch": 2250} {"train_loss": -42.43470764160156, "global_step": 272325, "epoch": 2250} {"train_loss": -41.6282844543457, "global_step": 272326, "epoch": 2250} {"train_loss": -42.375553131103516, "global_step": 272327, "epoch": 2250} {"train_loss": -41.2148551940918, "global_step": 272328, "epoch": 2250} {"train_loss": -39.530845642089844, "global_step": 272329, "epoch": 2250} {"train_loss": -43.0886344909668, "global_step": 272330, "epoch": 2250} {"train_loss": -42.641876220703125, "global_step": 272331, "epoch": 2250} {"train_loss": -40.47869873046875, "global_step": 272332, "epoch": 2250} {"train_loss": -40.07075119018555, "global_step": 272333, "epoch": 2250} {"train_loss": -43.41331481933594, "global_step": 272334, "epoch": 2250} {"train_loss": -42.36188888549805, "global_step": 272335, "epoch": 2250} {"train_loss": -41.6798095703125, "global_step": 272336, "epoch": 2250} {"train_loss": -42.45234298706055, "global_step": 272337, "epoch": 2250} {"train_loss": -42.10750961303711, "global_step": 272338, "epoch": 2250} {"train_loss": -40.973548889160156, "global_step": 272339, "epoch": 2250} {"train_loss": -42.18185043334961, "global_step": 272340, "epoch": 2250} {"train_loss": -43.03091049194336, "global_step": 272341, "epoch": 2250} {"train_loss": -41.45180892944336, "global_step": 272342, "epoch": 2250} {"train_loss": -41.495601654052734, "global_step": 272343, "epoch": 2250} {"train_loss": -43.40571212768555, "global_step": 272344, "epoch": 2250} {"train_loss": -41.785213470458984, "global_step": 272345, "epoch": 2250} {"train_loss": -39.4220085144043, "global_step": 272346, "epoch": 2250} {"train_loss": -43.12777328491211, "global_step": 272347, "epoch": 2250} {"train_loss": -42.13976287841797, "global_step": 272348, "epoch": 2250} {"train_loss": -40.53162384033203, "global_step": 272349, "epoch": 2250} {"train_loss": -42.1601676940918, "global_step": 272350, "epoch": 2250} {"train_loss": -42.409027099609375, "global_step": 272351, "epoch": 2250} {"train_loss": -40.24557113647461, "global_step": 272352, "epoch": 2250} {"train_loss": -42.448543548583984, "global_step": 272353, "epoch": 2250} {"train_loss": -42.06622314453125, "global_step": 272354, "epoch": 2250} {"train_loss": -42.5592155456543, "global_step": 272355, "epoch": 2250} {"train_loss": -42.724849700927734, "global_step": 272356, "epoch": 2250} {"train_loss": -41.33583068847656, "global_step": 272357, "epoch": 2250} {"train_loss": -42.6248779296875, "global_step": 272358, "epoch": 2250} {"train_loss": -43.370460510253906, "global_step": 272359, "epoch": 2250} {"train_loss": -42.282527923583984, "global_step": 272360, "epoch": 2250} {"train_loss": -43.38119125366211, "global_step": 272361, "epoch": 2250} {"train_loss": -41.71709060668945, "global_step": 272362, "epoch": 2250} {"train_loss": -42.50370407104492, "global_step": 272363, "epoch": 2250} {"train_loss": -43.44588088989258, "global_step": 272364, "epoch": 2250} {"train_loss": -42.29618453979492, "global_step": 272365, "epoch": 2250} {"train_loss": -43.23945236206055, "global_step": 272366, "epoch": 2250} {"train_loss": -43.15740966796875, "global_step": 272367, "epoch": 2250} {"train_loss": -43.09487533569336, "global_step": 272368, "epoch": 2250} {"train_loss": -43.03317642211914, "global_step": 272369, "epoch": 2250} {"train_loss": -42.23594905128164, "global_step": 272370, "epoch": 2250, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9090909090909091, "val_loss": 2679095.25} {"train_loss": -42.407470703125, "global_step": 272371, "epoch": 2251} {"train_loss": -42.71923828125, "global_step": 272372, "epoch": 2251} {"train_loss": -43.24637985229492, "global_step": 272373, "epoch": 2251} {"train_loss": -41.9859619140625, "global_step": 272374, "epoch": 2251} {"train_loss": -43.055599212646484, "global_step": 272375, "epoch": 2251} {"train_loss": -43.58102798461914, "global_step": 272376, "epoch": 2251} {"train_loss": -43.63485336303711, "global_step": 272377, "epoch": 2251} {"train_loss": -42.203643798828125, "global_step": 272378, "epoch": 2251} {"train_loss": -42.79969787597656, "global_step": 272379, "epoch": 2251} {"train_loss": -42.259769439697266, "global_step": 272380, "epoch": 2251} {"train_loss": -43.3614616394043, "global_step": 272381, "epoch": 2251} {"train_loss": -42.287567138671875, "global_step": 272382, "epoch": 2251} {"train_loss": -41.396026611328125, "global_step": 272383, "epoch": 2251} {"train_loss": -43.09421157836914, "global_step": 272384, "epoch": 2251} {"train_loss": -41.317527770996094, "global_step": 272385, "epoch": 2251} {"train_loss": -42.27421188354492, "global_step": 272386, "epoch": 2251} {"train_loss": -43.19376754760742, "global_step": 272387, "epoch": 2251} {"train_loss": -40.13786315917969, "global_step": 272388, "epoch": 2251} {"train_loss": -42.51336669921875, "global_step": 272389, "epoch": 2251} {"train_loss": -42.475555419921875, "global_step": 272390, "epoch": 2251} {"train_loss": -40.17196273803711, "global_step": 272391, "epoch": 2251} {"train_loss": -42.419673919677734, "global_step": 272392, "epoch": 2251} {"train_loss": -40.78015899658203, "global_step": 272393, "epoch": 2251} {"train_loss": -40.48529052734375, "global_step": 272394, "epoch": 2251} {"train_loss": -41.890560150146484, "global_step": 272395, "epoch": 2251} {"train_loss": -41.60730743408203, "global_step": 272396, "epoch": 2251} {"train_loss": -41.724430084228516, "global_step": 272397, "epoch": 2251} {"train_loss": -41.94647216796875, "global_step": 272398, "epoch": 2251} {"train_loss": -41.4567756652832, "global_step": 272399, "epoch": 2251} {"train_loss": -42.32685470581055, "global_step": 272400, "epoch": 2251} {"train_loss": -41.58845901489258, "global_step": 272401, "epoch": 2251} {"train_loss": -41.669185638427734, "global_step": 272402, "epoch": 2251} {"train_loss": -43.07664108276367, "global_step": 272403, "epoch": 2251} {"train_loss": -41.102622985839844, "global_step": 272404, "epoch": 2251} {"train_loss": -41.906063079833984, "global_step": 272405, "epoch": 2251} {"train_loss": -41.98684310913086, "global_step": 272406, "epoch": 2251} {"train_loss": -42.6463737487793, "global_step": 272407, "epoch": 2251} {"train_loss": -42.42922592163086, "global_step": 272408, "epoch": 2251} {"train_loss": -42.33723068237305, "global_step": 272409, "epoch": 2251} {"train_loss": -42.2298469543457, "global_step": 272410, "epoch": 2251} {"train_loss": -42.70113754272461, "global_step": 272411, "epoch": 2251} {"train_loss": -42.221221923828125, "global_step": 272412, "epoch": 2251} {"train_loss": -42.748531341552734, "global_step": 272413, "epoch": 2251} {"train_loss": -42.32695770263672, "global_step": 272414, "epoch": 2251} {"train_loss": -42.0494384765625, "global_step": 272415, "epoch": 2251} {"train_loss": -42.95441436767578, "global_step": 272416, "epoch": 2251} {"train_loss": -42.55091094970703, "global_step": 272417, "epoch": 2251} {"train_loss": -42.83889389038086, "global_step": 272418, "epoch": 2251} {"train_loss": -42.90189743041992, "global_step": 272419, "epoch": 2251} {"train_loss": -42.93080520629883, "global_step": 272420, "epoch": 2251} {"train_loss": -42.71588134765625, "global_step": 272421, "epoch": 2251} {"train_loss": -43.06116485595703, "global_step": 272422, "epoch": 2251} {"train_loss": -42.97092056274414, "global_step": 272423, "epoch": 2251} {"train_loss": -43.18008041381836, "global_step": 272424, "epoch": 2251} {"train_loss": -42.822689056396484, "global_step": 272425, "epoch": 2251} {"train_loss": -42.73284912109375, "global_step": 272426, "epoch": 2251} {"train_loss": -42.96550750732422, "global_step": 272427, "epoch": 2251} {"train_loss": -42.96033477783203, "global_step": 272428, "epoch": 2251} {"train_loss": -42.45162582397461, "global_step": 272429, "epoch": 2251} {"train_loss": -43.20731735229492, "global_step": 272430, "epoch": 2251} {"train_loss": -42.71145248413086, "global_step": 272431, "epoch": 2251} {"train_loss": -41.58782196044922, "global_step": 272432, "epoch": 2251} {"train_loss": -42.892677307128906, "global_step": 272433, "epoch": 2251} {"train_loss": -43.00596237182617, "global_step": 272434, "epoch": 2251} {"train_loss": -41.688507080078125, "global_step": 272435, "epoch": 2251} {"train_loss": -42.848392486572266, "global_step": 272436, "epoch": 2251} {"train_loss": -42.65031051635742, "global_step": 272437, "epoch": 2251} {"train_loss": -42.24396514892578, "global_step": 272438, "epoch": 2251} {"train_loss": -42.52339553833008, "global_step": 272439, "epoch": 2251} {"train_loss": -42.32669448852539, "global_step": 272440, "epoch": 2251} {"train_loss": -42.03953170776367, "global_step": 272441, "epoch": 2251} {"train_loss": -42.84463882446289, "global_step": 272442, "epoch": 2251} {"train_loss": -41.44812774658203, "global_step": 272443, "epoch": 2251} {"train_loss": -39.37948226928711, "global_step": 272444, "epoch": 2251} {"train_loss": -40.20878982543945, "global_step": 272445, "epoch": 2251} {"train_loss": -42.84597396850586, "global_step": 272446, "epoch": 2251} {"train_loss": -41.198299407958984, "global_step": 272447, "epoch": 2251} {"train_loss": -41.48737716674805, "global_step": 272448, "epoch": 2251} {"train_loss": -43.34177780151367, "global_step": 272449, "epoch": 2251} {"train_loss": -41.96116256713867, "global_step": 272450, "epoch": 2251} {"train_loss": -42.863983154296875, "global_step": 272451, "epoch": 2251} {"train_loss": -42.51889419555664, "global_step": 272452, "epoch": 2251} {"train_loss": -42.1817741394043, "global_step": 272453, "epoch": 2251} {"train_loss": -41.77555847167969, "global_step": 272454, "epoch": 2251} {"train_loss": -42.42438507080078, "global_step": 272455, "epoch": 2251} {"train_loss": -42.8026123046875, "global_step": 272456, "epoch": 2251} {"train_loss": -42.12467575073242, "global_step": 272457, "epoch": 2251} {"train_loss": -40.66712188720703, "global_step": 272458, "epoch": 2251} {"train_loss": -42.19550704956055, "global_step": 272459, "epoch": 2251} {"train_loss": -42.8403205871582, "global_step": 272460, "epoch": 2251} {"train_loss": -41.68629837036133, "global_step": 272461, "epoch": 2251} {"train_loss": -42.41827392578125, "global_step": 272462, "epoch": 2251} {"train_loss": -43.173954010009766, "global_step": 272463, "epoch": 2251} {"train_loss": -42.1290397644043, "global_step": 272464, "epoch": 2251} {"train_loss": -42.81705093383789, "global_step": 272465, "epoch": 2251} {"train_loss": -43.22105407714844, "global_step": 272466, "epoch": 2251} {"train_loss": -43.06925582885742, "global_step": 272467, "epoch": 2251} {"train_loss": -42.47103500366211, "global_step": 272468, "epoch": 2251} {"train_loss": -43.14913558959961, "global_step": 272469, "epoch": 2251} {"train_loss": -43.204586029052734, "global_step": 272470, "epoch": 2251} {"train_loss": -43.23506164550781, "global_step": 272471, "epoch": 2251} {"train_loss": -42.90211868286133, "global_step": 272472, "epoch": 2251} {"train_loss": -43.43115997314453, "global_step": 272473, "epoch": 2251} {"train_loss": -42.91522979736328, "global_step": 272474, "epoch": 2251} {"train_loss": -43.2104377746582, "global_step": 272475, "epoch": 2251} {"train_loss": -43.218143463134766, "global_step": 272476, "epoch": 2251} {"train_loss": -42.9285888671875, "global_step": 272477, "epoch": 2251} {"train_loss": -43.131752014160156, "global_step": 272478, "epoch": 2251} {"train_loss": -42.87043380737305, "global_step": 272479, "epoch": 2251} {"train_loss": -43.32277297973633, "global_step": 272480, "epoch": 2251} {"train_loss": -43.616634368896484, "global_step": 272481, "epoch": 2251} {"train_loss": -43.2458381652832, "global_step": 272482, "epoch": 2251} {"train_loss": -43.60763931274414, "global_step": 272483, "epoch": 2251} {"train_loss": -43.4715690612793, "global_step": 272484, "epoch": 2251} {"train_loss": -43.14544677734375, "global_step": 272485, "epoch": 2251} {"train_loss": -43.80357360839844, "global_step": 272486, "epoch": 2251} {"train_loss": -43.976661682128906, "global_step": 272487, "epoch": 2251} {"train_loss": -43.94242477416992, "global_step": 272488, "epoch": 2251} {"train_loss": -42.847267150878906, "global_step": 272489, "epoch": 2251} {"train_loss": -43.77691650390625, "global_step": 272490, "epoch": 2251} {"train_loss": -42.499030909262416, "global_step": 272491, "epoch": 2251, "val_loss": 2648563.75} {"train_loss": -43.47414016723633, "global_step": 272492, "epoch": 2252} {"train_loss": -43.45317840576172, "global_step": 272493, "epoch": 2252} {"train_loss": -43.64022445678711, "global_step": 272494, "epoch": 2252} {"train_loss": -43.68617630004883, "global_step": 272495, "epoch": 2252} {"train_loss": -43.97335433959961, "global_step": 272496, "epoch": 2252} {"train_loss": -42.931148529052734, "global_step": 272497, "epoch": 2252} {"train_loss": -42.18191146850586, "global_step": 272498, "epoch": 2252} {"train_loss": -43.470924377441406, "global_step": 272499, "epoch": 2252} {"train_loss": -42.68520736694336, "global_step": 272500, "epoch": 2252} {"train_loss": -42.666656494140625, "global_step": 272501, "epoch": 2252} {"train_loss": -43.18721389770508, "global_step": 272502, "epoch": 2252} {"train_loss": -42.4701042175293, "global_step": 272503, "epoch": 2252} {"train_loss": -43.281856536865234, "global_step": 272504, "epoch": 2252} {"train_loss": -43.08015823364258, "global_step": 272505, "epoch": 2252} {"train_loss": -43.71147155761719, "global_step": 272506, "epoch": 2252} {"train_loss": -43.54414367675781, "global_step": 272507, "epoch": 2252} {"train_loss": -41.687530517578125, "global_step": 272508, "epoch": 2252} {"train_loss": -41.92277145385742, "global_step": 272509, "epoch": 2252} {"train_loss": -41.69419479370117, "global_step": 272510, "epoch": 2252} {"train_loss": -42.806949615478516, "global_step": 272511, "epoch": 2252} {"train_loss": -41.32752990722656, "global_step": 272512, "epoch": 2252} {"train_loss": -42.32826232910156, "global_step": 272513, "epoch": 2252} {"train_loss": -40.967098236083984, "global_step": 272514, "epoch": 2252} {"train_loss": -39.72567367553711, "global_step": 272515, "epoch": 2252} {"train_loss": -40.58271408081055, "global_step": 272516, "epoch": 2252} {"train_loss": -41.83205795288086, "global_step": 272517, "epoch": 2252} {"train_loss": -41.978572845458984, "global_step": 272518, "epoch": 2252} {"train_loss": -41.44000244140625, "global_step": 272519, "epoch": 2252} {"train_loss": -42.204708099365234, "global_step": 272520, "epoch": 2252} {"train_loss": -40.174293518066406, "global_step": 272521, "epoch": 2252} {"train_loss": -41.09843444824219, "global_step": 272522, "epoch": 2252} {"train_loss": -37.68119812011719, "global_step": 272523, "epoch": 2252} {"train_loss": -41.59272003173828, "global_step": 272524, "epoch": 2252} {"train_loss": -42.60920333862305, "global_step": 272525, "epoch": 2252} {"train_loss": -41.23773193359375, "global_step": 272526, "epoch": 2252} {"train_loss": -42.900386810302734, "global_step": 272527, "epoch": 2252} {"train_loss": -39.37900924682617, "global_step": 272528, "epoch": 2252} {"train_loss": -42.51381301879883, "global_step": 272529, "epoch": 2252} {"train_loss": -42.272640228271484, "global_step": 272530, "epoch": 2252} {"train_loss": -43.034027099609375, "global_step": 272531, "epoch": 2252} {"train_loss": -42.489131927490234, "global_step": 272532, "epoch": 2252} {"train_loss": -42.25869369506836, "global_step": 272533, "epoch": 2252} {"train_loss": -42.9945182800293, "global_step": 272534, "epoch": 2252} {"train_loss": -42.0545539855957, "global_step": 272535, "epoch": 2252} {"train_loss": -42.063411712646484, "global_step": 272536, "epoch": 2252} {"train_loss": -41.74440383911133, "global_step": 272537, "epoch": 2252} {"train_loss": -43.03078079223633, "global_step": 272538, "epoch": 2252} {"train_loss": -41.601318359375, "global_step": 272539, "epoch": 2252} {"train_loss": -43.29634094238281, "global_step": 272540, "epoch": 2252} {"train_loss": -42.77390670776367, "global_step": 272541, "epoch": 2252} {"train_loss": -43.6445426940918, "global_step": 272542, "epoch": 2252} {"train_loss": -42.76595687866211, "global_step": 272543, "epoch": 2252} {"train_loss": -43.115020751953125, "global_step": 272544, "epoch": 2252} {"train_loss": -43.45027542114258, "global_step": 272545, "epoch": 2252} {"train_loss": -42.890602111816406, "global_step": 272546, "epoch": 2252} {"train_loss": -41.75931167602539, "global_step": 272547, "epoch": 2252} {"train_loss": -43.244407653808594, "global_step": 272548, "epoch": 2252} {"train_loss": -42.23685836791992, "global_step": 272549, "epoch": 2252} {"train_loss": -43.1453971862793, "global_step": 272550, "epoch": 2252} {"train_loss": -43.22999572753906, "global_step": 272551, "epoch": 2252} {"train_loss": -41.95281219482422, "global_step": 272552, "epoch": 2252} {"train_loss": -43.43668746948242, "global_step": 272553, "epoch": 2252} {"train_loss": -42.913482666015625, "global_step": 272554, "epoch": 2252} {"train_loss": -43.113243103027344, "global_step": 272555, "epoch": 2252} {"train_loss": -43.301883697509766, "global_step": 272556, "epoch": 2252} {"train_loss": -42.91252517700195, "global_step": 272557, "epoch": 2252} {"train_loss": -41.987098693847656, "global_step": 272558, "epoch": 2252} {"train_loss": -42.30055236816406, "global_step": 272559, "epoch": 2252} {"train_loss": -43.5926399230957, "global_step": 272560, "epoch": 2252} {"train_loss": -41.43021011352539, "global_step": 272561, "epoch": 2252} {"train_loss": -41.91872787475586, "global_step": 272562, "epoch": 2252} {"train_loss": -43.029747009277344, "global_step": 272563, "epoch": 2252} {"train_loss": -40.41849899291992, "global_step": 272564, "epoch": 2252} {"train_loss": -42.42641830444336, "global_step": 272565, "epoch": 2252} {"train_loss": -43.5897331237793, "global_step": 272566, "epoch": 2252} {"train_loss": -41.08804702758789, "global_step": 272567, "epoch": 2252} {"train_loss": -42.38992691040039, "global_step": 272568, "epoch": 2252} {"train_loss": -43.24210739135742, "global_step": 272569, "epoch": 2252} {"train_loss": -43.03470993041992, "global_step": 272570, "epoch": 2252} {"train_loss": -42.594879150390625, "global_step": 272571, "epoch": 2252} {"train_loss": -42.81595230102539, "global_step": 272572, "epoch": 2252} {"train_loss": -42.39036560058594, "global_step": 272573, "epoch": 2252} {"train_loss": -42.101051330566406, "global_step": 272574, "epoch": 2252} {"train_loss": -42.52722930908203, "global_step": 272575, "epoch": 2252} {"train_loss": -43.01559066772461, "global_step": 272576, "epoch": 2252} {"train_loss": -42.3434944152832, "global_step": 272577, "epoch": 2252} {"train_loss": -42.95920944213867, "global_step": 272578, "epoch": 2252} {"train_loss": -42.48466873168945, "global_step": 272579, "epoch": 2252} {"train_loss": -42.537933349609375, "global_step": 272580, "epoch": 2252} {"train_loss": -42.887939453125, "global_step": 272581, "epoch": 2252} {"train_loss": -42.371307373046875, "global_step": 272582, "epoch": 2252} {"train_loss": -42.641502380371094, "global_step": 272583, "epoch": 2252} {"train_loss": -42.40549850463867, "global_step": 272584, "epoch": 2252} {"train_loss": -40.881324768066406, "global_step": 272585, "epoch": 2252} {"train_loss": -42.14451217651367, "global_step": 272586, "epoch": 2252} {"train_loss": -37.89207458496094, "global_step": 272587, "epoch": 2252} {"train_loss": -41.742340087890625, "global_step": 272588, "epoch": 2252} {"train_loss": -41.834571838378906, "global_step": 272589, "epoch": 2252} {"train_loss": -42.39820098876953, "global_step": 272590, "epoch": 2252} {"train_loss": -42.7801513671875, "global_step": 272591, "epoch": 2252} {"train_loss": -42.818660736083984, "global_step": 272592, "epoch": 2252} {"train_loss": -42.572540283203125, "global_step": 272593, "epoch": 2252} {"train_loss": -43.318511962890625, "global_step": 272594, "epoch": 2252} {"train_loss": -42.46299362182617, "global_step": 272595, "epoch": 2252} {"train_loss": -42.1955680847168, "global_step": 272596, "epoch": 2252} {"train_loss": -42.84941864013672, "global_step": 272597, "epoch": 2252} {"train_loss": -43.060585021972656, "global_step": 272598, "epoch": 2252} {"train_loss": -43.00513458251953, "global_step": 272599, "epoch": 2252} {"train_loss": -43.272518157958984, "global_step": 272600, "epoch": 2252} {"train_loss": -43.194305419921875, "global_step": 272601, "epoch": 2252} {"train_loss": -43.6088981628418, "global_step": 272602, "epoch": 2252} {"train_loss": -43.066158294677734, "global_step": 272603, "epoch": 2252} {"train_loss": -43.57923126220703, "global_step": 272604, "epoch": 2252} {"train_loss": -43.72727584838867, "global_step": 272605, "epoch": 2252} {"train_loss": -42.10183334350586, "global_step": 272606, "epoch": 2252} {"train_loss": -43.49570846557617, "global_step": 272607, "epoch": 2252} {"train_loss": -43.724849700927734, "global_step": 272608, "epoch": 2252} {"train_loss": -43.66007614135742, "global_step": 272609, "epoch": 2252} {"train_loss": -43.31673812866211, "global_step": 272610, "epoch": 2252} {"train_loss": -43.631813049316406, "global_step": 272611, "epoch": 2252} {"train_loss": -42.48322854160277, "global_step": 272612, "epoch": 2252, "val_loss": 2742297.0} {"train_loss": -43.50251007080078, "global_step": 272613, "epoch": 2253} {"train_loss": -43.487525939941406, "global_step": 272614, "epoch": 2253} {"train_loss": -43.70326614379883, "global_step": 272615, "epoch": 2253} {"train_loss": -43.67275619506836, "global_step": 272616, "epoch": 2253} {"train_loss": -43.3687744140625, "global_step": 272617, "epoch": 2253} {"train_loss": -42.54777145385742, "global_step": 272618, "epoch": 2253} {"train_loss": -43.078182220458984, "global_step": 272619, "epoch": 2253} {"train_loss": -42.789493560791016, "global_step": 272620, "epoch": 2253} {"train_loss": -42.36949920654297, "global_step": 272621, "epoch": 2253} {"train_loss": -42.3893928527832, "global_step": 272622, "epoch": 2253} {"train_loss": -43.16044998168945, "global_step": 272623, "epoch": 2253} {"train_loss": -42.451881408691406, "global_step": 272624, "epoch": 2253} {"train_loss": -43.38899230957031, "global_step": 272625, "epoch": 2253} {"train_loss": -40.44856643676758, "global_step": 272626, "epoch": 2253} {"train_loss": -43.21596145629883, "global_step": 272627, "epoch": 2253} {"train_loss": -43.064510345458984, "global_step": 272628, "epoch": 2253} {"train_loss": -42.3602294921875, "global_step": 272629, "epoch": 2253} {"train_loss": -41.860450744628906, "global_step": 272630, "epoch": 2253} {"train_loss": -41.90102767944336, "global_step": 272631, "epoch": 2253} {"train_loss": -43.3508186340332, "global_step": 272632, "epoch": 2253} {"train_loss": -41.44028854370117, "global_step": 272633, "epoch": 2253} {"train_loss": -38.94129180908203, "global_step": 272634, "epoch": 2253} {"train_loss": -41.79962158203125, "global_step": 272635, "epoch": 2253} {"train_loss": -42.29631423950195, "global_step": 272636, "epoch": 2253} {"train_loss": -41.2360954284668, "global_step": 272637, "epoch": 2253} {"train_loss": -39.16239929199219, "global_step": 272638, "epoch": 2253} {"train_loss": -42.86167907714844, "global_step": 272639, "epoch": 2253} {"train_loss": -41.871891021728516, "global_step": 272640, "epoch": 2253} {"train_loss": -41.38904571533203, "global_step": 272641, "epoch": 2253} {"train_loss": -43.12278366088867, "global_step": 272642, "epoch": 2253} {"train_loss": -42.2689323425293, "global_step": 272643, "epoch": 2253} {"train_loss": -42.65861129760742, "global_step": 272644, "epoch": 2253} {"train_loss": -42.375675201416016, "global_step": 272645, "epoch": 2253} {"train_loss": -43.18955612182617, "global_step": 272646, "epoch": 2253} {"train_loss": -41.702423095703125, "global_step": 272647, "epoch": 2253} {"train_loss": -41.135311126708984, "global_step": 272648, "epoch": 2253} {"train_loss": -42.54359817504883, "global_step": 272649, "epoch": 2253} {"train_loss": -41.307456970214844, "global_step": 272650, "epoch": 2253} {"train_loss": -42.413875579833984, "global_step": 272651, "epoch": 2253} {"train_loss": -42.05225372314453, "global_step": 272652, "epoch": 2253} {"train_loss": -41.89617919921875, "global_step": 272653, "epoch": 2253} {"train_loss": -42.92302322387695, "global_step": 272654, "epoch": 2253} {"train_loss": -42.71553039550781, "global_step": 272655, "epoch": 2253} {"train_loss": -42.50516891479492, "global_step": 272656, "epoch": 2253} {"train_loss": -42.45228576660156, "global_step": 272657, "epoch": 2253} {"train_loss": -42.38935470581055, "global_step": 272658, "epoch": 2253} {"train_loss": -41.436920166015625, "global_step": 272659, "epoch": 2253} {"train_loss": -42.6279296875, "global_step": 272660, "epoch": 2253} {"train_loss": -42.53907775878906, "global_step": 272661, "epoch": 2253} {"train_loss": -39.81917953491211, "global_step": 272662, "epoch": 2253} {"train_loss": -41.93805694580078, "global_step": 272663, "epoch": 2253} {"train_loss": -39.83384704589844, "global_step": 272664, "epoch": 2253} {"train_loss": -42.191200256347656, "global_step": 272665, "epoch": 2253} {"train_loss": -40.76913833618164, "global_step": 272666, "epoch": 2253} {"train_loss": -42.482112884521484, "global_step": 272667, "epoch": 2253} {"train_loss": -42.526187896728516, "global_step": 272668, "epoch": 2253} {"train_loss": -40.778255462646484, "global_step": 272669, "epoch": 2253} {"train_loss": -41.552669525146484, "global_step": 272670, "epoch": 2253} {"train_loss": -40.8331413269043, "global_step": 272671, "epoch": 2253} {"train_loss": -40.65884017944336, "global_step": 272672, "epoch": 2253} {"train_loss": -39.9286003112793, "global_step": 272673, "epoch": 2253} {"train_loss": -40.28401565551758, "global_step": 272674, "epoch": 2253} {"train_loss": -41.8082389831543, "global_step": 272675, "epoch": 2253} {"train_loss": -42.824134826660156, "global_step": 272676, "epoch": 2253} {"train_loss": -40.6524543762207, "global_step": 272677, "epoch": 2253} {"train_loss": -42.12202835083008, "global_step": 272678, "epoch": 2253} {"train_loss": -43.16012191772461, "global_step": 272679, "epoch": 2253} {"train_loss": -42.15644454956055, "global_step": 272680, "epoch": 2253} {"train_loss": -42.845924377441406, "global_step": 272681, "epoch": 2253} {"train_loss": -42.72107696533203, "global_step": 272682, "epoch": 2253} {"train_loss": -41.886287689208984, "global_step": 272683, "epoch": 2253} {"train_loss": -42.851844787597656, "global_step": 272684, "epoch": 2253} {"train_loss": -42.438621520996094, "global_step": 272685, "epoch": 2253} {"train_loss": -42.16681671142578, "global_step": 272686, "epoch": 2253} {"train_loss": -42.509849548339844, "global_step": 272687, "epoch": 2253} {"train_loss": -42.477020263671875, "global_step": 272688, "epoch": 2253} {"train_loss": -42.46322250366211, "global_step": 272689, "epoch": 2253} {"train_loss": -43.26169967651367, "global_step": 272690, "epoch": 2253} {"train_loss": -41.86793518066406, "global_step": 272691, "epoch": 2253} {"train_loss": -43.63042449951172, "global_step": 272692, "epoch": 2253} {"train_loss": -43.044429779052734, "global_step": 272693, "epoch": 2253} {"train_loss": -42.55997848510742, "global_step": 272694, "epoch": 2253} {"train_loss": -43.0665397644043, "global_step": 272695, "epoch": 2253} {"train_loss": -43.1059455871582, "global_step": 272696, "epoch": 2253} {"train_loss": -43.221275329589844, "global_step": 272697, "epoch": 2253} {"train_loss": -43.58693313598633, "global_step": 272698, "epoch": 2253} {"train_loss": -42.98334884643555, "global_step": 272699, "epoch": 2253} {"train_loss": -43.678138732910156, "global_step": 272700, "epoch": 2253} {"train_loss": -43.59553909301758, "global_step": 272701, "epoch": 2253} {"train_loss": -43.59598922729492, "global_step": 272702, "epoch": 2253} {"train_loss": -44.177852630615234, "global_step": 272703, "epoch": 2253} {"train_loss": -43.54213333129883, "global_step": 272704, "epoch": 2253} {"train_loss": -43.340057373046875, "global_step": 272705, "epoch": 2253} {"train_loss": -43.52772903442383, "global_step": 272706, "epoch": 2253} {"train_loss": -43.31178665161133, "global_step": 272707, "epoch": 2253} {"train_loss": -43.668819427490234, "global_step": 272708, "epoch": 2253} {"train_loss": -43.26462173461914, "global_step": 272709, "epoch": 2253} {"train_loss": -43.303443908691406, "global_step": 272710, "epoch": 2253} {"train_loss": -43.769500732421875, "global_step": 272711, "epoch": 2253} {"train_loss": -43.80601119995117, "global_step": 272712, "epoch": 2253} {"train_loss": -43.18360900878906, "global_step": 272713, "epoch": 2253} {"train_loss": -43.4090690612793, "global_step": 272714, "epoch": 2253} {"train_loss": -43.672237396240234, "global_step": 272715, "epoch": 2253} {"train_loss": -43.04224395751953, "global_step": 272716, "epoch": 2253} {"train_loss": -43.491939544677734, "global_step": 272717, "epoch": 2253} {"train_loss": -43.54482650756836, "global_step": 272718, "epoch": 2253} {"train_loss": -43.53413009643555, "global_step": 272719, "epoch": 2253} {"train_loss": -43.437374114990234, "global_step": 272720, "epoch": 2253} {"train_loss": -42.98748779296875, "global_step": 272721, "epoch": 2253} {"train_loss": -42.15360641479492, "global_step": 272722, "epoch": 2253} {"train_loss": -42.138851165771484, "global_step": 272723, "epoch": 2253} {"train_loss": -43.768836975097656, "global_step": 272724, "epoch": 2253} {"train_loss": -43.425811767578125, "global_step": 272725, "epoch": 2253} {"train_loss": -42.974159240722656, "global_step": 272726, "epoch": 2253} {"train_loss": -43.2972526550293, "global_step": 272727, "epoch": 2253} {"train_loss": -43.22578048706055, "global_step": 272728, "epoch": 2253} {"train_loss": -43.469329833984375, "global_step": 272729, "epoch": 2253} {"train_loss": -43.856781005859375, "global_step": 272730, "epoch": 2253} {"train_loss": -43.64398956298828, "global_step": 272731, "epoch": 2253} {"train_loss": -42.97129440307617, "global_step": 272732, "epoch": 2253} {"train_loss": -42.54064663973722, "global_step": 272733, "epoch": 2253, "val_loss": 2639181.75} {"train_loss": -43.16597366333008, "global_step": 272734, "epoch": 2254} {"train_loss": -43.21780014038086, "global_step": 272735, "epoch": 2254} {"train_loss": -43.554996490478516, "global_step": 272736, "epoch": 2254} {"train_loss": -42.94454574584961, "global_step": 272737, "epoch": 2254} {"train_loss": -43.16001510620117, "global_step": 272738, "epoch": 2254} {"train_loss": -43.22252655029297, "global_step": 272739, "epoch": 2254} {"train_loss": -42.489234924316406, "global_step": 272740, "epoch": 2254} {"train_loss": -43.19255447387695, "global_step": 272741, "epoch": 2254} {"train_loss": -42.042213439941406, "global_step": 272742, "epoch": 2254} {"train_loss": -42.54729080200195, "global_step": 272743, "epoch": 2254} {"train_loss": -43.717994689941406, "global_step": 272744, "epoch": 2254} {"train_loss": -43.313411712646484, "global_step": 272745, "epoch": 2254} {"train_loss": -41.849769592285156, "global_step": 272746, "epoch": 2254} {"train_loss": -42.86756134033203, "global_step": 272747, "epoch": 2254} {"train_loss": -42.81865310668945, "global_step": 272748, "epoch": 2254} {"train_loss": -42.185462951660156, "global_step": 272749, "epoch": 2254} {"train_loss": -42.72213363647461, "global_step": 272750, "epoch": 2254} {"train_loss": -43.37876892089844, "global_step": 272751, "epoch": 2254} {"train_loss": -42.864418029785156, "global_step": 272752, "epoch": 2254} {"train_loss": -43.502769470214844, "global_step": 272753, "epoch": 2254} {"train_loss": -43.009490966796875, "global_step": 272754, "epoch": 2254} {"train_loss": -43.223594665527344, "global_step": 272755, "epoch": 2254} {"train_loss": -43.634395599365234, "global_step": 272756, "epoch": 2254} {"train_loss": -43.397457122802734, "global_step": 272757, "epoch": 2254} {"train_loss": -40.10842514038086, "global_step": 272758, "epoch": 2254} {"train_loss": -41.12770462036133, "global_step": 272759, "epoch": 2254} {"train_loss": -42.44997024536133, "global_step": 272760, "epoch": 2254} {"train_loss": -41.119361877441406, "global_step": 272761, "epoch": 2254} {"train_loss": -40.81501770019531, "global_step": 272762, "epoch": 2254} {"train_loss": -42.70041275024414, "global_step": 272763, "epoch": 2254} {"train_loss": -42.15826416015625, "global_step": 272764, "epoch": 2254} {"train_loss": -40.84938430786133, "global_step": 272765, "epoch": 2254} {"train_loss": -43.21857452392578, "global_step": 272766, "epoch": 2254} {"train_loss": -37.947235107421875, "global_step": 272767, "epoch": 2254} {"train_loss": -33.23392868041992, "global_step": 272768, "epoch": 2254} {"train_loss": -42.446311950683594, "global_step": 272769, "epoch": 2254} {"train_loss": -30.649173736572266, "global_step": 272770, "epoch": 2254} {"train_loss": -38.249977111816406, "global_step": 272771, "epoch": 2254} {"train_loss": -38.03815841674805, "global_step": 272772, "epoch": 2254} {"train_loss": -37.85991287231445, "global_step": 272773, "epoch": 2254} {"train_loss": -27.16778564453125, "global_step": 272774, "epoch": 2254} {"train_loss": -14.537118911743164, "global_step": 272775, "epoch": 2254} {"train_loss": -28.727996826171875, "global_step": 272776, "epoch": 2254} {"train_loss": -31.079788208007812, "global_step": 272777, "epoch": 2254} {"train_loss": -34.56633377075195, "global_step": 272778, "epoch": 2254} {"train_loss": -30.3528995513916, "global_step": 272779, "epoch": 2254} {"train_loss": -27.59113121032715, "global_step": 272780, "epoch": 2254} {"train_loss": -28.660999298095703, "global_step": 272781, "epoch": 2254} {"train_loss": -31.05274772644043, "global_step": 272782, "epoch": 2254} {"train_loss": -34.16618728637695, "global_step": 272783, "epoch": 2254} {"train_loss": -31.01942253112793, "global_step": 272784, "epoch": 2254} {"train_loss": -34.988548278808594, "global_step": 272785, "epoch": 2254} {"train_loss": -26.653858184814453, "global_step": 272786, "epoch": 2254} {"train_loss": -28.008176803588867, "global_step": 272787, "epoch": 2254} {"train_loss": -34.50946807861328, "global_step": 272788, "epoch": 2254} {"train_loss": -29.795785903930664, "global_step": 272789, "epoch": 2254} {"train_loss": -33.228919982910156, "global_step": 272790, "epoch": 2254} {"train_loss": -18.33827781677246, "global_step": 272791, "epoch": 2254} {"train_loss": -35.10268020629883, "global_step": 272792, "epoch": 2254} {"train_loss": -34.68825149536133, "global_step": 272793, "epoch": 2254} {"train_loss": -34.08390426635742, "global_step": 272794, "epoch": 2254} {"train_loss": -36.202816009521484, "global_step": 272795, "epoch": 2254} {"train_loss": -33.109901428222656, "global_step": 272796, "epoch": 2254} {"train_loss": -35.93539047241211, "global_step": 272797, "epoch": 2254} {"train_loss": -33.039581298828125, "global_step": 272798, "epoch": 2254} {"train_loss": -35.4334831237793, "global_step": 272799, "epoch": 2254} {"train_loss": -37.05514144897461, "global_step": 272800, "epoch": 2254} {"train_loss": -35.643985748291016, "global_step": 272801, "epoch": 2254} {"train_loss": -36.11262512207031, "global_step": 272802, "epoch": 2254} {"train_loss": -36.8286247253418, "global_step": 272803, "epoch": 2254} {"train_loss": -36.54896926879883, "global_step": 272804, "epoch": 2254} {"train_loss": -37.02975845336914, "global_step": 272805, "epoch": 2254} {"train_loss": -36.09141159057617, "global_step": 272806, "epoch": 2254} {"train_loss": -37.70903778076172, "global_step": 272807, "epoch": 2254} {"train_loss": -38.37003707885742, "global_step": 272808, "epoch": 2254} {"train_loss": -37.85267639160156, "global_step": 272809, "epoch": 2254} {"train_loss": -37.512794494628906, "global_step": 272810, "epoch": 2254} {"train_loss": -38.531307220458984, "global_step": 272811, "epoch": 2254} {"train_loss": -36.79829788208008, "global_step": 272812, "epoch": 2254} {"train_loss": -37.36725997924805, "global_step": 272813, "epoch": 2254} {"train_loss": -38.521522521972656, "global_step": 272814, "epoch": 2254} {"train_loss": -37.846858978271484, "global_step": 272815, "epoch": 2254} {"train_loss": -39.06522750854492, "global_step": 272816, "epoch": 2254} {"train_loss": -38.58993148803711, "global_step": 272817, "epoch": 2254} {"train_loss": -38.69586181640625, "global_step": 272818, "epoch": 2254} {"train_loss": -39.031307220458984, "global_step": 272819, "epoch": 2254} {"train_loss": -37.94551086425781, "global_step": 272820, "epoch": 2254} {"train_loss": -38.33234786987305, "global_step": 272821, "epoch": 2254} {"train_loss": -38.1880989074707, "global_step": 272822, "epoch": 2254} {"train_loss": -38.56229782104492, "global_step": 272823, "epoch": 2254} {"train_loss": -38.841514587402344, "global_step": 272824, "epoch": 2254} {"train_loss": -39.28667068481445, "global_step": 272825, "epoch": 2254} {"train_loss": -37.754268646240234, "global_step": 272826, "epoch": 2254} {"train_loss": -38.79395294189453, "global_step": 272827, "epoch": 2254} {"train_loss": -39.04826736450195, "global_step": 272828, "epoch": 2254} {"train_loss": -39.379432678222656, "global_step": 272829, "epoch": 2254} {"train_loss": -38.246517181396484, "global_step": 272830, "epoch": 2254} {"train_loss": -39.263824462890625, "global_step": 272831, "epoch": 2254} {"train_loss": -38.63184356689453, "global_step": 272832, "epoch": 2254} {"train_loss": -40.303340911865234, "global_step": 272833, "epoch": 2254} {"train_loss": -39.68244171142578, "global_step": 272834, "epoch": 2254} {"train_loss": -40.01881790161133, "global_step": 272835, "epoch": 2254} {"train_loss": -38.76264190673828, "global_step": 272836, "epoch": 2254} {"train_loss": -38.824317932128906, "global_step": 272837, "epoch": 2254} {"train_loss": -39.99640655517578, "global_step": 272838, "epoch": 2254} {"train_loss": -39.536582946777344, "global_step": 272839, "epoch": 2254} {"train_loss": -39.08317184448242, "global_step": 272840, "epoch": 2254} {"train_loss": -39.489315032958984, "global_step": 272841, "epoch": 2254} {"train_loss": -40.13777542114258, "global_step": 272842, "epoch": 2254} {"train_loss": -39.41317367553711, "global_step": 272843, "epoch": 2254} {"train_loss": -39.58290481567383, "global_step": 272844, "epoch": 2254} {"train_loss": -39.6015739440918, "global_step": 272845, "epoch": 2254} {"train_loss": -40.53636932373047, "global_step": 272846, "epoch": 2254} {"train_loss": -40.65164566040039, "global_step": 272847, "epoch": 2254} {"train_loss": -40.220943450927734, "global_step": 272848, "epoch": 2254} {"train_loss": -40.23461151123047, "global_step": 272849, "epoch": 2254} {"train_loss": -40.38974380493164, "global_step": 272850, "epoch": 2254} {"train_loss": -41.30958938598633, "global_step": 272851, "epoch": 2254} {"train_loss": -39.59282684326172, "global_step": 272852, "epoch": 2254} {"train_loss": -40.969234466552734, "global_step": 272853, "epoch": 2254} {"train_loss": -38.00313640626009, "global_step": 272854, "epoch": 2254, "val_loss": 2703771.75} {"train_loss": -40.425872802734375, "global_step": 272855, "epoch": 2255} {"train_loss": -40.192623138427734, "global_step": 272856, "epoch": 2255} {"train_loss": -39.74567794799805, "global_step": 272857, "epoch": 2255} {"train_loss": -40.38090133666992, "global_step": 272858, "epoch": 2255} {"train_loss": -39.725379943847656, "global_step": 272859, "epoch": 2255} {"train_loss": -40.37228012084961, "global_step": 272860, "epoch": 2255} {"train_loss": -40.980281829833984, "global_step": 272861, "epoch": 2255} {"train_loss": -40.84017562866211, "global_step": 272862, "epoch": 2255} {"train_loss": -41.01943588256836, "global_step": 272863, "epoch": 2255} {"train_loss": -40.91755294799805, "global_step": 272864, "epoch": 2255} {"train_loss": -41.00447463989258, "global_step": 272865, "epoch": 2255} {"train_loss": -40.64509201049805, "global_step": 272866, "epoch": 2255} {"train_loss": -41.161861419677734, "global_step": 272867, "epoch": 2255} {"train_loss": -41.247108459472656, "global_step": 272868, "epoch": 2255} {"train_loss": -40.492401123046875, "global_step": 272869, "epoch": 2255} {"train_loss": -41.000694274902344, "global_step": 272870, "epoch": 2255} {"train_loss": -40.56870651245117, "global_step": 272871, "epoch": 2255} {"train_loss": -40.89755630493164, "global_step": 272872, "epoch": 2255} {"train_loss": -41.87363815307617, "global_step": 272873, "epoch": 2255} {"train_loss": -40.45777130126953, "global_step": 272874, "epoch": 2255} {"train_loss": -41.062744140625, "global_step": 272875, "epoch": 2255} {"train_loss": -40.820960998535156, "global_step": 272876, "epoch": 2255} {"train_loss": -41.24308395385742, "global_step": 272877, "epoch": 2255} {"train_loss": -41.0973014831543, "global_step": 272878, "epoch": 2255} {"train_loss": -41.3547248840332, "global_step": 272879, "epoch": 2255} {"train_loss": -41.1580924987793, "global_step": 272880, "epoch": 2255} {"train_loss": -41.909210205078125, "global_step": 272881, "epoch": 2255} {"train_loss": -41.70166015625, "global_step": 272882, "epoch": 2255} {"train_loss": -42.02558898925781, "global_step": 272883, "epoch": 2255} {"train_loss": -41.882442474365234, "global_step": 272884, "epoch": 2255} {"train_loss": -41.28396224975586, "global_step": 272885, "epoch": 2255} {"train_loss": -41.352352142333984, "global_step": 272886, "epoch": 2255} {"train_loss": -41.80012130737305, "global_step": 272887, "epoch": 2255} {"train_loss": -41.65077209472656, "global_step": 272888, "epoch": 2255} {"train_loss": -41.64948272705078, "global_step": 272889, "epoch": 2255} {"train_loss": -41.26929473876953, "global_step": 272890, "epoch": 2255} {"train_loss": -40.6989860534668, "global_step": 272891, "epoch": 2255} {"train_loss": -41.84573745727539, "global_step": 272892, "epoch": 2255} {"train_loss": -42.27933883666992, "global_step": 272893, "epoch": 2255} {"train_loss": -41.99935531616211, "global_step": 272894, "epoch": 2255} {"train_loss": -41.62311553955078, "global_step": 272895, "epoch": 2255} {"train_loss": -41.94589614868164, "global_step": 272896, "epoch": 2255} {"train_loss": -41.15435791015625, "global_step": 272897, "epoch": 2255} {"train_loss": -41.79581832885742, "global_step": 272898, "epoch": 2255} {"train_loss": -41.900604248046875, "global_step": 272899, "epoch": 2255} {"train_loss": -41.97214889526367, "global_step": 272900, "epoch": 2255} {"train_loss": -41.98988723754883, "global_step": 272901, "epoch": 2255} {"train_loss": -41.82234573364258, "global_step": 272902, "epoch": 2255} {"train_loss": -42.72331237792969, "global_step": 272903, "epoch": 2255} {"train_loss": -42.6423454284668, "global_step": 272904, "epoch": 2255} {"train_loss": -41.265438079833984, "global_step": 272905, "epoch": 2255} {"train_loss": -41.4166145324707, "global_step": 272906, "epoch": 2255} {"train_loss": -41.602455139160156, "global_step": 272907, "epoch": 2255} {"train_loss": -42.14497756958008, "global_step": 272908, "epoch": 2255} {"train_loss": -42.41950225830078, "global_step": 272909, "epoch": 2255} {"train_loss": -42.78468704223633, "global_step": 272910, "epoch": 2255} {"train_loss": -42.38539123535156, "global_step": 272911, "epoch": 2255} {"train_loss": -41.48103332519531, "global_step": 272912, "epoch": 2255} {"train_loss": -42.47188949584961, "global_step": 272913, "epoch": 2255} {"train_loss": -42.295772552490234, "global_step": 272914, "epoch": 2255} {"train_loss": -42.14689254760742, "global_step": 272915, "epoch": 2255} {"train_loss": -42.153785705566406, "global_step": 272916, "epoch": 2255} {"train_loss": -42.924556732177734, "global_step": 272917, "epoch": 2255} {"train_loss": -42.7582893371582, "global_step": 272918, "epoch": 2255} {"train_loss": -42.97243881225586, "global_step": 272919, "epoch": 2255} {"train_loss": -42.58264923095703, "global_step": 272920, "epoch": 2255} {"train_loss": -42.4571647644043, "global_step": 272921, "epoch": 2255} {"train_loss": -42.47832107543945, "global_step": 272922, "epoch": 2255} {"train_loss": -42.2703742980957, "global_step": 272923, "epoch": 2255} {"train_loss": -42.50123977661133, "global_step": 272924, "epoch": 2255} {"train_loss": -42.916419982910156, "global_step": 272925, "epoch": 2255} {"train_loss": -42.32877731323242, "global_step": 272926, "epoch": 2255} {"train_loss": -42.66950225830078, "global_step": 272927, "epoch": 2255} {"train_loss": -42.42405319213867, "global_step": 272928, "epoch": 2255} {"train_loss": -42.109371185302734, "global_step": 272929, "epoch": 2255} {"train_loss": -42.49177169799805, "global_step": 272930, "epoch": 2255} {"train_loss": -42.838253021240234, "global_step": 272931, "epoch": 2255} {"train_loss": -42.75006866455078, "global_step": 272932, "epoch": 2255} {"train_loss": -42.0809440612793, "global_step": 272933, "epoch": 2255} {"train_loss": -42.282623291015625, "global_step": 272934, "epoch": 2255} {"train_loss": -42.23899841308594, "global_step": 272935, "epoch": 2255} {"train_loss": -42.07808303833008, "global_step": 272936, "epoch": 2255} {"train_loss": -42.8778190612793, "global_step": 272937, "epoch": 2255} {"train_loss": -42.52875518798828, "global_step": 272938, "epoch": 2255} {"train_loss": -42.12630081176758, "global_step": 272939, "epoch": 2255} {"train_loss": -42.77363204956055, "global_step": 272940, "epoch": 2255} {"train_loss": -42.41036605834961, "global_step": 272941, "epoch": 2255} {"train_loss": -42.84716796875, "global_step": 272942, "epoch": 2255} {"train_loss": -42.08195114135742, "global_step": 272943, "epoch": 2255} {"train_loss": -42.633419036865234, "global_step": 272944, "epoch": 2255} {"train_loss": -42.856475830078125, "global_step": 272945, "epoch": 2255} {"train_loss": -42.52957534790039, "global_step": 272946, "epoch": 2255} {"train_loss": -42.55451583862305, "global_step": 272947, "epoch": 2255} {"train_loss": -42.6499137878418, "global_step": 272948, "epoch": 2255} {"train_loss": -43.30537033081055, "global_step": 272949, "epoch": 2255} {"train_loss": -43.4216194152832, "global_step": 272950, "epoch": 2255} {"train_loss": -43.12935256958008, "global_step": 272951, "epoch": 2255} {"train_loss": -42.834285736083984, "global_step": 272952, "epoch": 2255} {"train_loss": -43.37028121948242, "global_step": 272953, "epoch": 2255} {"train_loss": -43.30739212036133, "global_step": 272954, "epoch": 2255} {"train_loss": -42.419063568115234, "global_step": 272955, "epoch": 2255} {"train_loss": -42.202640533447266, "global_step": 272956, "epoch": 2255} {"train_loss": -42.484046936035156, "global_step": 272957, "epoch": 2255} {"train_loss": -42.72167205810547, "global_step": 272958, "epoch": 2255} {"train_loss": -43.16563034057617, "global_step": 272959, "epoch": 2255} {"train_loss": -42.395263671875, "global_step": 272960, "epoch": 2255} {"train_loss": -43.20164108276367, "global_step": 272961, "epoch": 2255} {"train_loss": -42.32444381713867, "global_step": 272962, "epoch": 2255} {"train_loss": -42.7458610534668, "global_step": 272963, "epoch": 2255} {"train_loss": -43.653194427490234, "global_step": 272964, "epoch": 2255} {"train_loss": -41.57902908325195, "global_step": 272965, "epoch": 2255} {"train_loss": -41.96158218383789, "global_step": 272966, "epoch": 2255} {"train_loss": -41.943058013916016, "global_step": 272967, "epoch": 2255} {"train_loss": -42.398345947265625, "global_step": 272968, "epoch": 2255} {"train_loss": -41.44245529174805, "global_step": 272969, "epoch": 2255} {"train_loss": -39.6457633972168, "global_step": 272970, "epoch": 2255} {"train_loss": -41.83549118041992, "global_step": 272971, "epoch": 2255} {"train_loss": -42.230098724365234, "global_step": 272972, "epoch": 2255} {"train_loss": -41.75088882446289, "global_step": 272973, "epoch": 2255} {"train_loss": -41.329627990722656, "global_step": 272974, "epoch": 2255} {"train_loss": -41.93150323284559, "global_step": 272975, "epoch": 2255, "val_loss": 2755545.0} {"train_loss": -40.52277755737305, "global_step": 272976, "epoch": 2256} {"train_loss": -41.1856803894043, "global_step": 272977, "epoch": 2256} {"train_loss": -41.05904769897461, "global_step": 272978, "epoch": 2256} {"train_loss": -40.77511215209961, "global_step": 272979, "epoch": 2256} {"train_loss": -40.67660140991211, "global_step": 272980, "epoch": 2256} {"train_loss": -40.70435333251953, "global_step": 272981, "epoch": 2256} {"train_loss": -42.3779411315918, "global_step": 272982, "epoch": 2256} {"train_loss": -41.39151382446289, "global_step": 272983, "epoch": 2256} {"train_loss": -41.96055221557617, "global_step": 272984, "epoch": 2256} {"train_loss": -42.010833740234375, "global_step": 272985, "epoch": 2256} {"train_loss": -42.264339447021484, "global_step": 272986, "epoch": 2256} {"train_loss": -41.227115631103516, "global_step": 272987, "epoch": 2256} {"train_loss": -42.09112548828125, "global_step": 272988, "epoch": 2256} {"train_loss": -39.21051788330078, "global_step": 272989, "epoch": 2256} {"train_loss": -41.41941452026367, "global_step": 272990, "epoch": 2256} {"train_loss": -40.675785064697266, "global_step": 272991, "epoch": 2256} {"train_loss": -41.468231201171875, "global_step": 272992, "epoch": 2256} {"train_loss": -41.381202697753906, "global_step": 272993, "epoch": 2256} {"train_loss": -41.95478439331055, "global_step": 272994, "epoch": 2256} {"train_loss": -40.77610397338867, "global_step": 272995, "epoch": 2256} {"train_loss": -41.68121337890625, "global_step": 272996, "epoch": 2256} {"train_loss": -40.99422073364258, "global_step": 272997, "epoch": 2256} {"train_loss": -41.11429977416992, "global_step": 272998, "epoch": 2256} {"train_loss": -41.19940185546875, "global_step": 272999, "epoch": 2256} {"train_loss": -41.4698486328125, "global_step": 273000, "epoch": 2256} {"train_loss": -40.97117233276367, "global_step": 273001, "epoch": 2256} {"train_loss": -42.932220458984375, "global_step": 273002, "epoch": 2256} {"train_loss": -41.799503326416016, "global_step": 273003, "epoch": 2256} {"train_loss": -39.31665802001953, "global_step": 273004, "epoch": 2256} {"train_loss": -42.54652786254883, "global_step": 273005, "epoch": 2256} {"train_loss": -40.6625862121582, "global_step": 273006, "epoch": 2256} {"train_loss": -40.769081115722656, "global_step": 273007, "epoch": 2256} {"train_loss": -40.82561111450195, "global_step": 273008, "epoch": 2256} {"train_loss": -41.362483978271484, "global_step": 273009, "epoch": 2256} {"train_loss": -40.96189498901367, "global_step": 273010, "epoch": 2256} {"train_loss": -40.7204704284668, "global_step": 273011, "epoch": 2256} {"train_loss": -41.223602294921875, "global_step": 273012, "epoch": 2256} {"train_loss": -41.469398498535156, "global_step": 273013, "epoch": 2256} {"train_loss": -41.51496124267578, "global_step": 273014, "epoch": 2256} {"train_loss": -41.85775375366211, "global_step": 273015, "epoch": 2256} {"train_loss": -41.51662826538086, "global_step": 273016, "epoch": 2256} {"train_loss": -40.4882698059082, "global_step": 273017, "epoch": 2256} {"train_loss": -41.59092712402344, "global_step": 273018, "epoch": 2256} {"train_loss": -41.71870040893555, "global_step": 273019, "epoch": 2256} {"train_loss": -41.723690032958984, "global_step": 273020, "epoch": 2256} {"train_loss": -41.819740295410156, "global_step": 273021, "epoch": 2256} {"train_loss": -41.348663330078125, "global_step": 273022, "epoch": 2256} {"train_loss": -42.254547119140625, "global_step": 273023, "epoch": 2256} {"train_loss": -42.417030334472656, "global_step": 273024, "epoch": 2256} {"train_loss": -42.17380905151367, "global_step": 273025, "epoch": 2256} {"train_loss": -42.920982360839844, "global_step": 273026, "epoch": 2256} {"train_loss": -42.34322738647461, "global_step": 273027, "epoch": 2256} {"train_loss": -42.78440475463867, "global_step": 273028, "epoch": 2256} {"train_loss": -42.60951614379883, "global_step": 273029, "epoch": 2256} {"train_loss": -42.28017044067383, "global_step": 273030, "epoch": 2256} {"train_loss": -42.512813568115234, "global_step": 273031, "epoch": 2256} {"train_loss": -41.650665283203125, "global_step": 273032, "epoch": 2256} {"train_loss": -42.66041564941406, "global_step": 273033, "epoch": 2256} {"train_loss": -42.70158767700195, "global_step": 273034, "epoch": 2256} {"train_loss": -42.67450714111328, "global_step": 273035, "epoch": 2256} {"train_loss": -42.8425407409668, "global_step": 273036, "epoch": 2256} {"train_loss": -42.82122039794922, "global_step": 273037, "epoch": 2256} {"train_loss": -42.34033966064453, "global_step": 273038, "epoch": 2256} {"train_loss": -42.71281051635742, "global_step": 273039, "epoch": 2256} {"train_loss": -42.29597854614258, "global_step": 273040, "epoch": 2256} {"train_loss": -42.673057556152344, "global_step": 273041, "epoch": 2256} {"train_loss": -41.425079345703125, "global_step": 273042, "epoch": 2256} {"train_loss": -42.11480712890625, "global_step": 273043, "epoch": 2256} {"train_loss": -42.12342071533203, "global_step": 273044, "epoch": 2256} {"train_loss": -42.71358871459961, "global_step": 273045, "epoch": 2256} {"train_loss": -42.24822235107422, "global_step": 273046, "epoch": 2256} {"train_loss": -41.69670867919922, "global_step": 273047, "epoch": 2256} {"train_loss": -42.56380081176758, "global_step": 273048, "epoch": 2256} {"train_loss": -42.86088943481445, "global_step": 273049, "epoch": 2256} {"train_loss": -42.447044372558594, "global_step": 273050, "epoch": 2256} {"train_loss": -42.80517578125, "global_step": 273051, "epoch": 2256} {"train_loss": -41.552490234375, "global_step": 273052, "epoch": 2256} {"train_loss": -40.4715690612793, "global_step": 273053, "epoch": 2256} {"train_loss": -41.61359405517578, "global_step": 273054, "epoch": 2256} {"train_loss": -43.02346420288086, "global_step": 273055, "epoch": 2256} {"train_loss": -41.30549621582031, "global_step": 273056, "epoch": 2256} {"train_loss": -41.549415588378906, "global_step": 273057, "epoch": 2256} {"train_loss": -42.645103454589844, "global_step": 273058, "epoch": 2256} {"train_loss": -43.171504974365234, "global_step": 273059, "epoch": 2256} {"train_loss": -41.50259780883789, "global_step": 273060, "epoch": 2256} {"train_loss": -41.32696533203125, "global_step": 273061, "epoch": 2256} {"train_loss": -42.870052337646484, "global_step": 273062, "epoch": 2256} {"train_loss": -42.005340576171875, "global_step": 273063, "epoch": 2256} {"train_loss": -42.598140716552734, "global_step": 273064, "epoch": 2256} {"train_loss": -42.889244079589844, "global_step": 273065, "epoch": 2256} {"train_loss": -41.94578170776367, "global_step": 273066, "epoch": 2256} {"train_loss": -41.95066833496094, "global_step": 273067, "epoch": 2256} {"train_loss": -42.694942474365234, "global_step": 273068, "epoch": 2256} {"train_loss": -42.42338180541992, "global_step": 273069, "epoch": 2256} {"train_loss": -42.56814193725586, "global_step": 273070, "epoch": 2256} {"train_loss": -42.53192901611328, "global_step": 273071, "epoch": 2256} {"train_loss": -43.00632858276367, "global_step": 273072, "epoch": 2256} {"train_loss": -42.77740478515625, "global_step": 273073, "epoch": 2256} {"train_loss": -42.827392578125, "global_step": 273074, "epoch": 2256} {"train_loss": -43.247737884521484, "global_step": 273075, "epoch": 2256} {"train_loss": -42.79905700683594, "global_step": 273076, "epoch": 2256} {"train_loss": -42.443660736083984, "global_step": 273077, "epoch": 2256} {"train_loss": -42.8864860534668, "global_step": 273078, "epoch": 2256} {"train_loss": -42.21356964111328, "global_step": 273079, "epoch": 2256} {"train_loss": -42.27289581298828, "global_step": 273080, "epoch": 2256} {"train_loss": -42.52372360229492, "global_step": 273081, "epoch": 2256} {"train_loss": -43.361751556396484, "global_step": 273082, "epoch": 2256} {"train_loss": -43.328853607177734, "global_step": 273083, "epoch": 2256} {"train_loss": -43.09023666381836, "global_step": 273084, "epoch": 2256} {"train_loss": -43.68679428100586, "global_step": 273085, "epoch": 2256} {"train_loss": -42.990779876708984, "global_step": 273086, "epoch": 2256} {"train_loss": -42.699954986572266, "global_step": 273087, "epoch": 2256} {"train_loss": -42.97537612915039, "global_step": 273088, "epoch": 2256} {"train_loss": -43.5177001953125, "global_step": 273089, "epoch": 2256} {"train_loss": -42.93921661376953, "global_step": 273090, "epoch": 2256} {"train_loss": -43.67578125, "global_step": 273091, "epoch": 2256} {"train_loss": -43.32625198364258, "global_step": 273092, "epoch": 2256} {"train_loss": -42.590187072753906, "global_step": 273093, "epoch": 2256} {"train_loss": -42.666683197021484, "global_step": 273094, "epoch": 2256} {"train_loss": -43.23563766479492, "global_step": 273095, "epoch": 2256} {"train_loss": -42.05031308260831, "global_step": 273096, "epoch": 2256, "val_loss": 2742140.0} {"train_loss": -43.52128982543945, "global_step": 273097, "epoch": 2257} {"train_loss": -43.223995208740234, "global_step": 273098, "epoch": 2257} {"train_loss": -42.86811447143555, "global_step": 273099, "epoch": 2257} {"train_loss": -43.237213134765625, "global_step": 273100, "epoch": 2257} {"train_loss": -43.772884368896484, "global_step": 273101, "epoch": 2257} {"train_loss": -43.411373138427734, "global_step": 273102, "epoch": 2257} {"train_loss": -42.908447265625, "global_step": 273103, "epoch": 2257} {"train_loss": -41.96289825439453, "global_step": 273104, "epoch": 2257} {"train_loss": -42.96747589111328, "global_step": 273105, "epoch": 2257} {"train_loss": -42.78943634033203, "global_step": 273106, "epoch": 2257} {"train_loss": -43.26841354370117, "global_step": 273107, "epoch": 2257} {"train_loss": -44.0576286315918, "global_step": 273108, "epoch": 2257} {"train_loss": -42.996795654296875, "global_step": 273109, "epoch": 2257} {"train_loss": -42.0045051574707, "global_step": 273110, "epoch": 2257} {"train_loss": -42.2945671081543, "global_step": 273111, "epoch": 2257} {"train_loss": -41.16640853881836, "global_step": 273112, "epoch": 2257} {"train_loss": -38.60316848754883, "global_step": 273113, "epoch": 2257} {"train_loss": -36.425270080566406, "global_step": 273114, "epoch": 2257} {"train_loss": -36.021995544433594, "global_step": 273115, "epoch": 2257} {"train_loss": -38.214717864990234, "global_step": 273116, "epoch": 2257} {"train_loss": -41.34971237182617, "global_step": 273117, "epoch": 2257} {"train_loss": -39.4448356628418, "global_step": 273118, "epoch": 2257} {"train_loss": -39.77262496948242, "global_step": 273119, "epoch": 2257} {"train_loss": -41.27633285522461, "global_step": 273120, "epoch": 2257} {"train_loss": -39.10590744018555, "global_step": 273121, "epoch": 2257} {"train_loss": -40.02932357788086, "global_step": 273122, "epoch": 2257} {"train_loss": -42.32085418701172, "global_step": 273123, "epoch": 2257} {"train_loss": -40.44588851928711, "global_step": 273124, "epoch": 2257} {"train_loss": -41.976924896240234, "global_step": 273125, "epoch": 2257} {"train_loss": -39.90087890625, "global_step": 273126, "epoch": 2257} {"train_loss": -41.551025390625, "global_step": 273127, "epoch": 2257} {"train_loss": -42.09811019897461, "global_step": 273128, "epoch": 2257} {"train_loss": -40.848777770996094, "global_step": 273129, "epoch": 2257} {"train_loss": -41.42051315307617, "global_step": 273130, "epoch": 2257} {"train_loss": -40.766212463378906, "global_step": 273131, "epoch": 2257} {"train_loss": -39.98517608642578, "global_step": 273132, "epoch": 2257} {"train_loss": -39.99402618408203, "global_step": 273133, "epoch": 2257} {"train_loss": -41.4665412902832, "global_step": 273134, "epoch": 2257} {"train_loss": -42.1329345703125, "global_step": 273135, "epoch": 2257} {"train_loss": -41.155853271484375, "global_step": 273136, "epoch": 2257} {"train_loss": -42.06538391113281, "global_step": 273137, "epoch": 2257} {"train_loss": -41.956336975097656, "global_step": 273138, "epoch": 2257} {"train_loss": -42.2205924987793, "global_step": 273139, "epoch": 2257} {"train_loss": -42.29282760620117, "global_step": 273140, "epoch": 2257} {"train_loss": -42.41086959838867, "global_step": 273141, "epoch": 2257} {"train_loss": -40.6077995300293, "global_step": 273142, "epoch": 2257} {"train_loss": -42.703365325927734, "global_step": 273143, "epoch": 2257} {"train_loss": -41.421417236328125, "global_step": 273144, "epoch": 2257} {"train_loss": -41.4443244934082, "global_step": 273145, "epoch": 2257} {"train_loss": -42.286590576171875, "global_step": 273146, "epoch": 2257} {"train_loss": -41.80118942260742, "global_step": 273147, "epoch": 2257} {"train_loss": -41.87471389770508, "global_step": 273148, "epoch": 2257} {"train_loss": -42.51233673095703, "global_step": 273149, "epoch": 2257} {"train_loss": -41.886688232421875, "global_step": 273150, "epoch": 2257} {"train_loss": -41.7991943359375, "global_step": 273151, "epoch": 2257} {"train_loss": -41.86668014526367, "global_step": 273152, "epoch": 2257} {"train_loss": -42.29080581665039, "global_step": 273153, "epoch": 2257} {"train_loss": -42.4994010925293, "global_step": 273154, "epoch": 2257} {"train_loss": -42.70371627807617, "global_step": 273155, "epoch": 2257} {"train_loss": -42.54463577270508, "global_step": 273156, "epoch": 2257} {"train_loss": -43.083980560302734, "global_step": 273157, "epoch": 2257} {"train_loss": -42.57120895385742, "global_step": 273158, "epoch": 2257} {"train_loss": -42.562255859375, "global_step": 273159, "epoch": 2257} {"train_loss": -43.01707077026367, "global_step": 273160, "epoch": 2257} {"train_loss": -42.29861068725586, "global_step": 273161, "epoch": 2257} {"train_loss": -43.40195083618164, "global_step": 273162, "epoch": 2257} {"train_loss": -43.13161849975586, "global_step": 273163, "epoch": 2257} {"train_loss": -42.96145248413086, "global_step": 273164, "epoch": 2257} {"train_loss": -43.34514236450195, "global_step": 273165, "epoch": 2257} {"train_loss": -43.523048400878906, "global_step": 273166, "epoch": 2257} {"train_loss": -42.29075622558594, "global_step": 273167, "epoch": 2257} {"train_loss": -43.61415481567383, "global_step": 273168, "epoch": 2257} {"train_loss": -42.83643341064453, "global_step": 273169, "epoch": 2257} {"train_loss": -43.29950714111328, "global_step": 273170, "epoch": 2257} {"train_loss": -43.288551330566406, "global_step": 273171, "epoch": 2257} {"train_loss": -42.90249252319336, "global_step": 273172, "epoch": 2257} {"train_loss": -43.338008880615234, "global_step": 273173, "epoch": 2257} {"train_loss": -43.457515716552734, "global_step": 273174, "epoch": 2257} {"train_loss": -43.670589447021484, "global_step": 273175, "epoch": 2257} {"train_loss": -44.0343132019043, "global_step": 273176, "epoch": 2257} {"train_loss": -43.03963851928711, "global_step": 273177, "epoch": 2257} {"train_loss": -43.31039047241211, "global_step": 273178, "epoch": 2257} {"train_loss": -43.341426849365234, "global_step": 273179, "epoch": 2257} {"train_loss": -43.62138366699219, "global_step": 273180, "epoch": 2257} {"train_loss": -43.57551193237305, "global_step": 273181, "epoch": 2257} {"train_loss": -43.42647171020508, "global_step": 273182, "epoch": 2257} {"train_loss": -43.600948333740234, "global_step": 273183, "epoch": 2257} {"train_loss": -43.85095977783203, "global_step": 273184, "epoch": 2257} {"train_loss": -43.42346954345703, "global_step": 273185, "epoch": 2257} {"train_loss": -43.17496871948242, "global_step": 273186, "epoch": 2257} {"train_loss": -43.7203369140625, "global_step": 273187, "epoch": 2257} {"train_loss": -43.67892837524414, "global_step": 273188, "epoch": 2257} {"train_loss": -43.86618423461914, "global_step": 273189, "epoch": 2257} {"train_loss": -43.20111846923828, "global_step": 273190, "epoch": 2257} {"train_loss": -43.7494010925293, "global_step": 273191, "epoch": 2257} {"train_loss": -43.8507080078125, "global_step": 273192, "epoch": 2257} {"train_loss": -42.944618225097656, "global_step": 273193, "epoch": 2257} {"train_loss": -43.108882904052734, "global_step": 273194, "epoch": 2257} {"train_loss": -42.349239349365234, "global_step": 273195, "epoch": 2257} {"train_loss": -40.164390563964844, "global_step": 273196, "epoch": 2257} {"train_loss": -39.61067199707031, "global_step": 273197, "epoch": 2257} {"train_loss": -34.21013259887695, "global_step": 273198, "epoch": 2257} {"train_loss": -27.97296142578125, "global_step": 273199, "epoch": 2257} {"train_loss": -36.61965560913086, "global_step": 273200, "epoch": 2257} {"train_loss": -41.490333557128906, "global_step": 273201, "epoch": 2257} {"train_loss": -32.62202072143555, "global_step": 273202, "epoch": 2257} {"train_loss": -34.876365661621094, "global_step": 273203, "epoch": 2257} {"train_loss": -41.61213302612305, "global_step": 273204, "epoch": 2257} {"train_loss": -37.125457763671875, "global_step": 273205, "epoch": 2257} {"train_loss": -39.93391799926758, "global_step": 273206, "epoch": 2257} {"train_loss": -39.29106140136719, "global_step": 273207, "epoch": 2257} {"train_loss": -38.364253997802734, "global_step": 273208, "epoch": 2257} {"train_loss": -38.3794059753418, "global_step": 273209, "epoch": 2257} {"train_loss": -37.60237503051758, "global_step": 273210, "epoch": 2257} {"train_loss": -35.490394592285156, "global_step": 273211, "epoch": 2257} {"train_loss": -37.59675979614258, "global_step": 273212, "epoch": 2257} {"train_loss": -41.36924362182617, "global_step": 273213, "epoch": 2257} {"train_loss": -38.802730560302734, "global_step": 273214, "epoch": 2257} {"train_loss": -41.683223724365234, "global_step": 273215, "epoch": 2257} {"train_loss": -38.868404388427734, "global_step": 273216, "epoch": 2257} {"train_loss": -41.31419066752284, "global_step": 273217, "epoch": 2257, "val_loss": 2673259.25} {"train_loss": -39.558349609375, "global_step": 273218, "epoch": 2258} {"train_loss": -40.19134521484375, "global_step": 273219, "epoch": 2258} {"train_loss": -40.25686264038086, "global_step": 273220, "epoch": 2258} {"train_loss": -40.572025299072266, "global_step": 273221, "epoch": 2258} {"train_loss": -38.0567626953125, "global_step": 273222, "epoch": 2258} {"train_loss": -39.34339141845703, "global_step": 273223, "epoch": 2258} {"train_loss": -17.354175567626953, "global_step": 273224, "epoch": 2258} {"train_loss": -38.51932907104492, "global_step": 273225, "epoch": 2258} {"train_loss": -36.91694259643555, "global_step": 273226, "epoch": 2258} {"train_loss": -39.59189987182617, "global_step": 273227, "epoch": 2258} {"train_loss": -39.376094818115234, "global_step": 273228, "epoch": 2258} {"train_loss": -39.493682861328125, "global_step": 273229, "epoch": 2258} {"train_loss": -38.7159538269043, "global_step": 273230, "epoch": 2258} {"train_loss": -37.086997985839844, "global_step": 273231, "epoch": 2258} {"train_loss": -40.43790817260742, "global_step": 273232, "epoch": 2258} {"train_loss": -35.27764129638672, "global_step": 273233, "epoch": 2258} {"train_loss": -38.94762420654297, "global_step": 273234, "epoch": 2258} {"train_loss": -35.35524368286133, "global_step": 273235, "epoch": 2258} {"train_loss": -39.60074234008789, "global_step": 273236, "epoch": 2258} {"train_loss": -40.13995361328125, "global_step": 273237, "epoch": 2258} {"train_loss": -27.585851669311523, "global_step": 273238, "epoch": 2258} {"train_loss": -32.63872146606445, "global_step": 273239, "epoch": 2258} {"train_loss": -32.623199462890625, "global_step": 273240, "epoch": 2258} {"train_loss": -37.613765716552734, "global_step": 273241, "epoch": 2258} {"train_loss": -36.452022552490234, "global_step": 273242, "epoch": 2258} {"train_loss": -35.8935432434082, "global_step": 273243, "epoch": 2258} {"train_loss": -39.829689025878906, "global_step": 273244, "epoch": 2258} {"train_loss": -39.76409912109375, "global_step": 273245, "epoch": 2258} {"train_loss": -36.16375732421875, "global_step": 273246, "epoch": 2258} {"train_loss": -37.84385299682617, "global_step": 273247, "epoch": 2258} {"train_loss": -32.763301849365234, "global_step": 273248, "epoch": 2258} {"train_loss": -34.99903869628906, "global_step": 273249, "epoch": 2258} {"train_loss": -38.10939407348633, "global_step": 273250, "epoch": 2258} {"train_loss": -36.84070587158203, "global_step": 273251, "epoch": 2258} {"train_loss": -35.790489196777344, "global_step": 273252, "epoch": 2258} {"train_loss": -36.12794494628906, "global_step": 273253, "epoch": 2258} {"train_loss": -37.96543502807617, "global_step": 273254, "epoch": 2258} {"train_loss": -37.50764083862305, "global_step": 273255, "epoch": 2258} {"train_loss": -39.21228790283203, "global_step": 273256, "epoch": 2258} {"train_loss": -38.78533935546875, "global_step": 273257, "epoch": 2258} {"train_loss": -40.232818603515625, "global_step": 273258, "epoch": 2258} {"train_loss": -40.26961898803711, "global_step": 273259, "epoch": 2258} {"train_loss": -38.216102600097656, "global_step": 273260, "epoch": 2258} {"train_loss": -38.50517654418945, "global_step": 273261, "epoch": 2258} {"train_loss": -39.82813262939453, "global_step": 273262, "epoch": 2258} {"train_loss": -39.67966079711914, "global_step": 273263, "epoch": 2258} {"train_loss": -39.76057052612305, "global_step": 273264, "epoch": 2258} {"train_loss": -40.34291076660156, "global_step": 273265, "epoch": 2258} {"train_loss": -38.85114288330078, "global_step": 273266, "epoch": 2258} {"train_loss": -38.835819244384766, "global_step": 273267, "epoch": 2258} {"train_loss": -40.91697311401367, "global_step": 273268, "epoch": 2258} {"train_loss": -39.0471305847168, "global_step": 273269, "epoch": 2258} {"train_loss": -40.522003173828125, "global_step": 273270, "epoch": 2258} {"train_loss": -38.18592071533203, "global_step": 273271, "epoch": 2258} {"train_loss": -39.08329391479492, "global_step": 273272, "epoch": 2258} {"train_loss": -40.367713928222656, "global_step": 273273, "epoch": 2258} {"train_loss": -38.23956298828125, "global_step": 273274, "epoch": 2258} {"train_loss": -38.09760284423828, "global_step": 273275, "epoch": 2258} {"train_loss": -39.32987594604492, "global_step": 273276, "epoch": 2258} {"train_loss": -40.313777923583984, "global_step": 273277, "epoch": 2258} {"train_loss": -38.88374710083008, "global_step": 273278, "epoch": 2258} {"train_loss": -37.594970703125, "global_step": 273279, "epoch": 2258} {"train_loss": -39.770484924316406, "global_step": 273280, "epoch": 2258} {"train_loss": -40.75638961791992, "global_step": 273281, "epoch": 2258} {"train_loss": -41.3781852722168, "global_step": 273282, "epoch": 2258} {"train_loss": -40.58338928222656, "global_step": 273283, "epoch": 2258} {"train_loss": -40.32529830932617, "global_step": 273284, "epoch": 2258} {"train_loss": -40.88870620727539, "global_step": 273285, "epoch": 2258} {"train_loss": -40.43829345703125, "global_step": 273286, "epoch": 2258} {"train_loss": -40.80861282348633, "global_step": 273287, "epoch": 2258} {"train_loss": -41.5073127746582, "global_step": 273288, "epoch": 2258} {"train_loss": -40.40659713745117, "global_step": 273289, "epoch": 2258} {"train_loss": -40.68655014038086, "global_step": 273290, "epoch": 2258} {"train_loss": -41.27696228027344, "global_step": 273291, "epoch": 2258} {"train_loss": -41.24613952636719, "global_step": 273292, "epoch": 2258} {"train_loss": -41.43259811401367, "global_step": 273293, "epoch": 2258} {"train_loss": -41.97093963623047, "global_step": 273294, "epoch": 2258} {"train_loss": -41.771358489990234, "global_step": 273295, "epoch": 2258} {"train_loss": -41.016658782958984, "global_step": 273296, "epoch": 2258} {"train_loss": -41.126747131347656, "global_step": 273297, "epoch": 2258} {"train_loss": -40.5921630859375, "global_step": 273298, "epoch": 2258} {"train_loss": -41.478065490722656, "global_step": 273299, "epoch": 2258} {"train_loss": -40.8643684387207, "global_step": 273300, "epoch": 2258} {"train_loss": -41.13418197631836, "global_step": 273301, "epoch": 2258} {"train_loss": -41.15242385864258, "global_step": 273302, "epoch": 2258} {"train_loss": -41.64281463623047, "global_step": 273303, "epoch": 2258} {"train_loss": -41.138336181640625, "global_step": 273304, "epoch": 2258} {"train_loss": -41.31917190551758, "global_step": 273305, "epoch": 2258} {"train_loss": -40.20914840698242, "global_step": 273306, "epoch": 2258} {"train_loss": -42.0450553894043, "global_step": 273307, "epoch": 2258} {"train_loss": -41.787349700927734, "global_step": 273308, "epoch": 2258} {"train_loss": -42.020442962646484, "global_step": 273309, "epoch": 2258} {"train_loss": -41.69563674926758, "global_step": 273310, "epoch": 2258} {"train_loss": -41.195960998535156, "global_step": 273311, "epoch": 2258} {"train_loss": -41.54292678833008, "global_step": 273312, "epoch": 2258} {"train_loss": -41.617584228515625, "global_step": 273313, "epoch": 2258} {"train_loss": -41.983638763427734, "global_step": 273314, "epoch": 2258} {"train_loss": -42.053592681884766, "global_step": 273315, "epoch": 2258} {"train_loss": -42.079750061035156, "global_step": 273316, "epoch": 2258} {"train_loss": -42.19292068481445, "global_step": 273317, "epoch": 2258} {"train_loss": -42.26154708862305, "global_step": 273318, "epoch": 2258} {"train_loss": -42.20381164550781, "global_step": 273319, "epoch": 2258} {"train_loss": -42.90930938720703, "global_step": 273320, "epoch": 2258} {"train_loss": -41.670597076416016, "global_step": 273321, "epoch": 2258} {"train_loss": -41.70023727416992, "global_step": 273322, "epoch": 2258} {"train_loss": -42.70149230957031, "global_step": 273323, "epoch": 2258} {"train_loss": -41.81719207763672, "global_step": 273324, "epoch": 2258} {"train_loss": -42.3213996887207, "global_step": 273325, "epoch": 2258} {"train_loss": -42.20532989501953, "global_step": 273326, "epoch": 2258} {"train_loss": -42.57046127319336, "global_step": 273327, "epoch": 2258} {"train_loss": -41.41886520385742, "global_step": 273328, "epoch": 2258} {"train_loss": -42.650978088378906, "global_step": 273329, "epoch": 2258} {"train_loss": -41.9578742980957, "global_step": 273330, "epoch": 2258} {"train_loss": -42.73986053466797, "global_step": 273331, "epoch": 2258} {"train_loss": -42.5459098815918, "global_step": 273332, "epoch": 2258} {"train_loss": -42.8984489440918, "global_step": 273333, "epoch": 2258} {"train_loss": -42.76887893676758, "global_step": 273334, "epoch": 2258} {"train_loss": -42.615962982177734, "global_step": 273335, "epoch": 2258} {"train_loss": -41.604122161865234, "global_step": 273336, "epoch": 2258} {"train_loss": -42.02554702758789, "global_step": 273337, "epoch": 2258} {"train_loss": -39.66939164784329, "global_step": 273338, "epoch": 2258, "val_loss": 2703508.5} {"train_loss": -42.23282241821289, "global_step": 273339, "epoch": 2259} {"train_loss": -42.96762466430664, "global_step": 273340, "epoch": 2259} {"train_loss": -42.06367111206055, "global_step": 273341, "epoch": 2259} {"train_loss": -42.57024002075195, "global_step": 273342, "epoch": 2259} {"train_loss": -43.080135345458984, "global_step": 273343, "epoch": 2259} {"train_loss": -42.8426513671875, "global_step": 273344, "epoch": 2259} {"train_loss": -42.76144027709961, "global_step": 273345, "epoch": 2259} {"train_loss": -42.89287185668945, "global_step": 273346, "epoch": 2259} {"train_loss": -42.33194351196289, "global_step": 273347, "epoch": 2259} {"train_loss": -42.930362701416016, "global_step": 273348, "epoch": 2259} {"train_loss": -42.343116760253906, "global_step": 273349, "epoch": 2259} {"train_loss": -42.14255905151367, "global_step": 273350, "epoch": 2259} {"train_loss": -41.68669128417969, "global_step": 273351, "epoch": 2259} {"train_loss": -42.791046142578125, "global_step": 273352, "epoch": 2259} {"train_loss": -42.535152435302734, "global_step": 273353, "epoch": 2259} {"train_loss": -42.580116271972656, "global_step": 273354, "epoch": 2259} {"train_loss": -42.805458068847656, "global_step": 273355, "epoch": 2259} {"train_loss": -42.44447708129883, "global_step": 273356, "epoch": 2259} {"train_loss": -41.5238037109375, "global_step": 273357, "epoch": 2259} {"train_loss": -43.3099365234375, "global_step": 273358, "epoch": 2259} {"train_loss": -42.247737884521484, "global_step": 273359, "epoch": 2259} {"train_loss": -42.356693267822266, "global_step": 273360, "epoch": 2259} {"train_loss": -42.70650100708008, "global_step": 273361, "epoch": 2259} {"train_loss": -42.53178024291992, "global_step": 273362, "epoch": 2259} {"train_loss": -43.6834831237793, "global_step": 273363, "epoch": 2259} {"train_loss": -42.913246154785156, "global_step": 273364, "epoch": 2259} {"train_loss": -43.42125701904297, "global_step": 273365, "epoch": 2259} {"train_loss": -43.257362365722656, "global_step": 273366, "epoch": 2259} {"train_loss": -43.019901275634766, "global_step": 273367, "epoch": 2259} {"train_loss": -43.034461975097656, "global_step": 273368, "epoch": 2259} {"train_loss": -43.1235466003418, "global_step": 273369, "epoch": 2259} {"train_loss": -43.045833587646484, "global_step": 273370, "epoch": 2259} {"train_loss": -41.27272415161133, "global_step": 273371, "epoch": 2259} {"train_loss": -43.26820755004883, "global_step": 273372, "epoch": 2259} {"train_loss": -42.77226638793945, "global_step": 273373, "epoch": 2259} {"train_loss": -41.562835693359375, "global_step": 273374, "epoch": 2259} {"train_loss": -42.549686431884766, "global_step": 273375, "epoch": 2259} {"train_loss": -42.585060119628906, "global_step": 273376, "epoch": 2259} {"train_loss": -40.70577621459961, "global_step": 273377, "epoch": 2259} {"train_loss": -43.2188835144043, "global_step": 273378, "epoch": 2259} {"train_loss": -42.99813461303711, "global_step": 273379, "epoch": 2259} {"train_loss": -41.53597640991211, "global_step": 273380, "epoch": 2259} {"train_loss": -42.26292037963867, "global_step": 273381, "epoch": 2259} {"train_loss": -42.2646598815918, "global_step": 273382, "epoch": 2259} {"train_loss": -40.73137664794922, "global_step": 273383, "epoch": 2259} {"train_loss": -42.0554084777832, "global_step": 273384, "epoch": 2259} {"train_loss": -40.943359375, "global_step": 273385, "epoch": 2259} {"train_loss": -41.029781341552734, "global_step": 273386, "epoch": 2259} {"train_loss": -37.93465042114258, "global_step": 273387, "epoch": 2259} {"train_loss": -37.6348762512207, "global_step": 273388, "epoch": 2259} {"train_loss": -39.569332122802734, "global_step": 273389, "epoch": 2259} {"train_loss": -42.01982879638672, "global_step": 273390, "epoch": 2259} {"train_loss": -39.9258918762207, "global_step": 273391, "epoch": 2259} {"train_loss": -41.403194427490234, "global_step": 273392, "epoch": 2259} {"train_loss": -38.0352783203125, "global_step": 273393, "epoch": 2259} {"train_loss": -36.6638298034668, "global_step": 273394, "epoch": 2259} {"train_loss": -34.46238327026367, "global_step": 273395, "epoch": 2259} {"train_loss": -42.807281494140625, "global_step": 273396, "epoch": 2259} {"train_loss": -38.707557678222656, "global_step": 273397, "epoch": 2259} {"train_loss": -41.188751220703125, "global_step": 273398, "epoch": 2259} {"train_loss": -39.32080841064453, "global_step": 273399, "epoch": 2259} {"train_loss": -41.39643478393555, "global_step": 273400, "epoch": 2259} {"train_loss": -38.19683837890625, "global_step": 273401, "epoch": 2259} {"train_loss": -40.66874313354492, "global_step": 273402, "epoch": 2259} {"train_loss": -39.65425491333008, "global_step": 273403, "epoch": 2259} {"train_loss": -38.89984893798828, "global_step": 273404, "epoch": 2259} {"train_loss": -36.04863357543945, "global_step": 273405, "epoch": 2259} {"train_loss": -39.46039581298828, "global_step": 273406, "epoch": 2259} {"train_loss": -38.2840690612793, "global_step": 273407, "epoch": 2259} {"train_loss": -40.01752853393555, "global_step": 273408, "epoch": 2259} {"train_loss": -40.32866668701172, "global_step": 273409, "epoch": 2259} {"train_loss": -40.84182357788086, "global_step": 273410, "epoch": 2259} {"train_loss": -40.18891143798828, "global_step": 273411, "epoch": 2259} {"train_loss": -39.32872009277344, "global_step": 273412, "epoch": 2259} {"train_loss": -39.515663146972656, "global_step": 273413, "epoch": 2259} {"train_loss": -41.405426025390625, "global_step": 273414, "epoch": 2259} {"train_loss": -40.34641647338867, "global_step": 273415, "epoch": 2259} {"train_loss": -41.461029052734375, "global_step": 273416, "epoch": 2259} {"train_loss": -41.6158332824707, "global_step": 273417, "epoch": 2259} {"train_loss": -39.19622802734375, "global_step": 273418, "epoch": 2259} {"train_loss": -39.662105560302734, "global_step": 273419, "epoch": 2259} {"train_loss": -39.24257278442383, "global_step": 273420, "epoch": 2259} {"train_loss": -40.70698928833008, "global_step": 273421, "epoch": 2259} {"train_loss": -41.40534210205078, "global_step": 273422, "epoch": 2259} {"train_loss": -41.135780334472656, "global_step": 273423, "epoch": 2259} {"train_loss": -40.43120193481445, "global_step": 273424, "epoch": 2259} {"train_loss": -41.7719612121582, "global_step": 273425, "epoch": 2259} {"train_loss": -40.76102828979492, "global_step": 273426, "epoch": 2259} {"train_loss": -41.84615707397461, "global_step": 273427, "epoch": 2259} {"train_loss": -40.4961051940918, "global_step": 273428, "epoch": 2259} {"train_loss": -42.1873893737793, "global_step": 273429, "epoch": 2259} {"train_loss": -41.80747604370117, "global_step": 273430, "epoch": 2259} {"train_loss": -40.96559143066406, "global_step": 273431, "epoch": 2259} {"train_loss": -42.59850311279297, "global_step": 273432, "epoch": 2259} {"train_loss": -42.617488861083984, "global_step": 273433, "epoch": 2259} {"train_loss": -42.00673294067383, "global_step": 273434, "epoch": 2259} {"train_loss": -41.19965744018555, "global_step": 273435, "epoch": 2259} {"train_loss": -42.55782699584961, "global_step": 273436, "epoch": 2259} {"train_loss": -42.25662612915039, "global_step": 273437, "epoch": 2259} {"train_loss": -42.62792205810547, "global_step": 273438, "epoch": 2259} {"train_loss": -42.401954650878906, "global_step": 273439, "epoch": 2259} {"train_loss": -42.081153869628906, "global_step": 273440, "epoch": 2259} {"train_loss": -41.83237075805664, "global_step": 273441, "epoch": 2259} {"train_loss": -41.70397186279297, "global_step": 273442, "epoch": 2259} {"train_loss": -42.36793518066406, "global_step": 273443, "epoch": 2259} {"train_loss": -40.530250549316406, "global_step": 273444, "epoch": 2259} {"train_loss": -40.31111526489258, "global_step": 273445, "epoch": 2259} {"train_loss": -41.70882034301758, "global_step": 273446, "epoch": 2259} {"train_loss": -42.18326950073242, "global_step": 273447, "epoch": 2259} {"train_loss": -40.93998336791992, "global_step": 273448, "epoch": 2259} {"train_loss": -41.591121673583984, "global_step": 273449, "epoch": 2259} {"train_loss": -42.50053024291992, "global_step": 273450, "epoch": 2259} {"train_loss": -41.82265853881836, "global_step": 273451, "epoch": 2259} {"train_loss": -41.74330520629883, "global_step": 273452, "epoch": 2259} {"train_loss": -42.56367874145508, "global_step": 273453, "epoch": 2259} {"train_loss": -41.98529052734375, "global_step": 273454, "epoch": 2259} {"train_loss": -42.11472702026367, "global_step": 273455, "epoch": 2259} {"train_loss": -41.39518356323242, "global_step": 273456, "epoch": 2259} {"train_loss": -41.54012680053711, "global_step": 273457, "epoch": 2259} {"train_loss": -42.70583724975586, "global_step": 273458, "epoch": 2259} {"train_loss": -41.40939703066487, "global_step": 273459, "epoch": 2259, "val_loss": 2623940.75} {"train_loss": -40.948421478271484, "global_step": 273460, "epoch": 2260} {"train_loss": -41.28444290161133, "global_step": 273461, "epoch": 2260} {"train_loss": -42.70439147949219, "global_step": 273462, "epoch": 2260} {"train_loss": -40.16287612915039, "global_step": 273463, "epoch": 2260} {"train_loss": -40.5216178894043, "global_step": 273464, "epoch": 2260} {"train_loss": -41.17630386352539, "global_step": 273465, "epoch": 2260} {"train_loss": -42.005035400390625, "global_step": 273466, "epoch": 2260} {"train_loss": -41.195430755615234, "global_step": 273467, "epoch": 2260} {"train_loss": -39.941070556640625, "global_step": 273468, "epoch": 2260} {"train_loss": -42.860591888427734, "global_step": 273469, "epoch": 2260} {"train_loss": -42.14207077026367, "global_step": 273470, "epoch": 2260} {"train_loss": -40.39506912231445, "global_step": 273471, "epoch": 2260} {"train_loss": -41.13874816894531, "global_step": 273472, "epoch": 2260} {"train_loss": -42.53408432006836, "global_step": 273473, "epoch": 2260} {"train_loss": -41.91721725463867, "global_step": 273474, "epoch": 2260} {"train_loss": -40.98917770385742, "global_step": 273475, "epoch": 2260} {"train_loss": -42.40259552001953, "global_step": 273476, "epoch": 2260} {"train_loss": -42.47114562988281, "global_step": 273477, "epoch": 2260} {"train_loss": -41.29804229736328, "global_step": 273478, "epoch": 2260} {"train_loss": -41.30221176147461, "global_step": 273479, "epoch": 2260} {"train_loss": -41.18040466308594, "global_step": 273480, "epoch": 2260} {"train_loss": -42.76456832885742, "global_step": 273481, "epoch": 2260} {"train_loss": -42.49863815307617, "global_step": 273482, "epoch": 2260} {"train_loss": -41.961055755615234, "global_step": 273483, "epoch": 2260} {"train_loss": -42.0744514465332, "global_step": 273484, "epoch": 2260} {"train_loss": -42.844093322753906, "global_step": 273485, "epoch": 2260} {"train_loss": -43.06814193725586, "global_step": 273486, "epoch": 2260} {"train_loss": -42.42445373535156, "global_step": 273487, "epoch": 2260} {"train_loss": -42.896461486816406, "global_step": 273488, "epoch": 2260} {"train_loss": -43.07786178588867, "global_step": 273489, "epoch": 2260} {"train_loss": -42.57331466674805, "global_step": 273490, "epoch": 2260} {"train_loss": -42.77864456176758, "global_step": 273491, "epoch": 2260} {"train_loss": -42.61421585083008, "global_step": 273492, "epoch": 2260} {"train_loss": -42.895198822021484, "global_step": 273493, "epoch": 2260} {"train_loss": -41.834716796875, "global_step": 273494, "epoch": 2260} {"train_loss": -42.616294860839844, "global_step": 273495, "epoch": 2260} {"train_loss": -42.87778854370117, "global_step": 273496, "epoch": 2260} {"train_loss": -41.22942352294922, "global_step": 273497, "epoch": 2260} {"train_loss": -42.61906814575195, "global_step": 273498, "epoch": 2260} {"train_loss": -42.72536087036133, "global_step": 273499, "epoch": 2260} {"train_loss": -42.86260986328125, "global_step": 273500, "epoch": 2260} {"train_loss": -42.43037796020508, "global_step": 273501, "epoch": 2260} {"train_loss": -41.2123908996582, "global_step": 273502, "epoch": 2260} {"train_loss": -42.37089538574219, "global_step": 273503, "epoch": 2260} {"train_loss": -42.73759078979492, "global_step": 273504, "epoch": 2260} {"train_loss": -41.649742126464844, "global_step": 273505, "epoch": 2260} {"train_loss": -42.0363883972168, "global_step": 273506, "epoch": 2260} {"train_loss": -42.1446418762207, "global_step": 273507, "epoch": 2260} {"train_loss": -42.881202697753906, "global_step": 273508, "epoch": 2260} {"train_loss": -40.31794357299805, "global_step": 273509, "epoch": 2260} {"train_loss": -42.296817779541016, "global_step": 273510, "epoch": 2260} {"train_loss": -42.32107162475586, "global_step": 273511, "epoch": 2260} {"train_loss": -42.8753547668457, "global_step": 273512, "epoch": 2260} {"train_loss": -42.95590591430664, "global_step": 273513, "epoch": 2260} {"train_loss": -42.49067306518555, "global_step": 273514, "epoch": 2260} {"train_loss": -42.78953170776367, "global_step": 273515, "epoch": 2260} {"train_loss": -42.67948913574219, "global_step": 273516, "epoch": 2260} {"train_loss": -43.3518180847168, "global_step": 273517, "epoch": 2260} {"train_loss": -42.58230209350586, "global_step": 273518, "epoch": 2260} {"train_loss": -42.45318603515625, "global_step": 273519, "epoch": 2260} {"train_loss": -42.461280822753906, "global_step": 273520, "epoch": 2260} {"train_loss": -43.03595733642578, "global_step": 273521, "epoch": 2260} {"train_loss": -42.89838409423828, "global_step": 273522, "epoch": 2260} {"train_loss": -42.688785552978516, "global_step": 273523, "epoch": 2260} {"train_loss": -43.10041046142578, "global_step": 273524, "epoch": 2260} {"train_loss": -43.06952667236328, "global_step": 273525, "epoch": 2260} {"train_loss": -42.97844696044922, "global_step": 273526, "epoch": 2260} {"train_loss": -42.8856086730957, "global_step": 273527, "epoch": 2260} {"train_loss": -43.16419219970703, "global_step": 273528, "epoch": 2260} {"train_loss": -41.84735107421875, "global_step": 273529, "epoch": 2260} {"train_loss": -42.336421966552734, "global_step": 273530, "epoch": 2260} {"train_loss": -41.7183723449707, "global_step": 273531, "epoch": 2260} {"train_loss": -42.582515716552734, "global_step": 273532, "epoch": 2260} {"train_loss": -41.258907318115234, "global_step": 273533, "epoch": 2260} {"train_loss": -42.22047424316406, "global_step": 273534, "epoch": 2260} {"train_loss": -42.1449089050293, "global_step": 273535, "epoch": 2260} {"train_loss": -42.534732818603516, "global_step": 273536, "epoch": 2260} {"train_loss": -42.23036575317383, "global_step": 273537, "epoch": 2260} {"train_loss": -41.461360931396484, "global_step": 273538, "epoch": 2260} {"train_loss": -41.00682067871094, "global_step": 273539, "epoch": 2260} {"train_loss": -41.141510009765625, "global_step": 273540, "epoch": 2260} {"train_loss": -42.0297737121582, "global_step": 273541, "epoch": 2260} {"train_loss": -41.797874450683594, "global_step": 273542, "epoch": 2260} {"train_loss": -41.3997688293457, "global_step": 273543, "epoch": 2260} {"train_loss": -41.7520866394043, "global_step": 273544, "epoch": 2260} {"train_loss": -41.15182113647461, "global_step": 273545, "epoch": 2260} {"train_loss": -41.58808517456055, "global_step": 273546, "epoch": 2260} {"train_loss": -42.333221435546875, "global_step": 273547, "epoch": 2260} {"train_loss": -41.50358963012695, "global_step": 273548, "epoch": 2260} {"train_loss": -42.100364685058594, "global_step": 273549, "epoch": 2260} {"train_loss": -41.92018508911133, "global_step": 273550, "epoch": 2260} {"train_loss": -43.174591064453125, "global_step": 273551, "epoch": 2260} {"train_loss": -41.75086212158203, "global_step": 273552, "epoch": 2260} {"train_loss": -41.29586410522461, "global_step": 273553, "epoch": 2260} {"train_loss": -42.50696563720703, "global_step": 273554, "epoch": 2260} {"train_loss": -42.611751556396484, "global_step": 273555, "epoch": 2260} {"train_loss": -40.559322357177734, "global_step": 273556, "epoch": 2260} {"train_loss": -41.971256256103516, "global_step": 273557, "epoch": 2260} {"train_loss": -42.311851501464844, "global_step": 273558, "epoch": 2260} {"train_loss": -41.94660186767578, "global_step": 273559, "epoch": 2260} {"train_loss": -41.697296142578125, "global_step": 273560, "epoch": 2260} {"train_loss": -41.624786376953125, "global_step": 273561, "epoch": 2260} {"train_loss": -42.60853958129883, "global_step": 273562, "epoch": 2260} {"train_loss": -41.78571701049805, "global_step": 273563, "epoch": 2260} {"train_loss": -42.0774040222168, "global_step": 273564, "epoch": 2260} {"train_loss": -42.8563117980957, "global_step": 273565, "epoch": 2260} {"train_loss": -41.887203216552734, "global_step": 273566, "epoch": 2260} {"train_loss": -42.09294891357422, "global_step": 273567, "epoch": 2260} {"train_loss": -42.10991287231445, "global_step": 273568, "epoch": 2260} {"train_loss": -42.7544059753418, "global_step": 273569, "epoch": 2260} {"train_loss": -42.746700286865234, "global_step": 273570, "epoch": 2260} {"train_loss": -40.283294677734375, "global_step": 273571, "epoch": 2260} {"train_loss": -42.31843948364258, "global_step": 273572, "epoch": 2260} {"train_loss": -42.5397834777832, "global_step": 273573, "epoch": 2260} {"train_loss": -42.55721664428711, "global_step": 273574, "epoch": 2260} {"train_loss": -42.7713508605957, "global_step": 273575, "epoch": 2260} {"train_loss": -42.584632873535156, "global_step": 273576, "epoch": 2260} {"train_loss": -42.41584396362305, "global_step": 273577, "epoch": 2260} {"train_loss": -42.621150970458984, "global_step": 273578, "epoch": 2260} {"train_loss": -43.20759201049805, "global_step": 273579, "epoch": 2260} {"train_loss": -42.14261759608245, "global_step": 273580, "epoch": 2260, "val_loss": 2728137.75} {"train_loss": -42.27311706542969, "global_step": 273581, "epoch": 2261} {"train_loss": -43.21921157836914, "global_step": 273582, "epoch": 2261} {"train_loss": -43.1757698059082, "global_step": 273583, "epoch": 2261} {"train_loss": -43.155113220214844, "global_step": 273584, "epoch": 2261} {"train_loss": -43.10139846801758, "global_step": 273585, "epoch": 2261} {"train_loss": -43.1259651184082, "global_step": 273586, "epoch": 2261} {"train_loss": -43.12310028076172, "global_step": 273587, "epoch": 2261} {"train_loss": -43.659942626953125, "global_step": 273588, "epoch": 2261} {"train_loss": -43.30606460571289, "global_step": 273589, "epoch": 2261} {"train_loss": -41.43647003173828, "global_step": 273590, "epoch": 2261} {"train_loss": -41.037750244140625, "global_step": 273591, "epoch": 2261} {"train_loss": -42.87042236328125, "global_step": 273592, "epoch": 2261} {"train_loss": -41.4039192199707, "global_step": 273593, "epoch": 2261} {"train_loss": -42.738067626953125, "global_step": 273594, "epoch": 2261} {"train_loss": -42.488162994384766, "global_step": 273595, "epoch": 2261} {"train_loss": -38.89643478393555, "global_step": 273596, "epoch": 2261} {"train_loss": -42.98280715942383, "global_step": 273597, "epoch": 2261} {"train_loss": -42.03103256225586, "global_step": 273598, "epoch": 2261} {"train_loss": -42.5704231262207, "global_step": 273599, "epoch": 2261} {"train_loss": -43.07991027832031, "global_step": 273600, "epoch": 2261} {"train_loss": -41.892303466796875, "global_step": 273601, "epoch": 2261} {"train_loss": -42.555084228515625, "global_step": 273602, "epoch": 2261} {"train_loss": -42.51752853393555, "global_step": 273603, "epoch": 2261} {"train_loss": -42.71821212768555, "global_step": 273604, "epoch": 2261} {"train_loss": -40.744998931884766, "global_step": 273605, "epoch": 2261} {"train_loss": -42.89702224731445, "global_step": 273606, "epoch": 2261} {"train_loss": -42.76703643798828, "global_step": 273607, "epoch": 2261} {"train_loss": -40.20193099975586, "global_step": 273608, "epoch": 2261} {"train_loss": -33.89445877075195, "global_step": 273609, "epoch": 2261} {"train_loss": -42.76523971557617, "global_step": 273610, "epoch": 2261} {"train_loss": -40.935543060302734, "global_step": 273611, "epoch": 2261} {"train_loss": -38.219234466552734, "global_step": 273612, "epoch": 2261} {"train_loss": -38.81685256958008, "global_step": 273613, "epoch": 2261} {"train_loss": -40.783241271972656, "global_step": 273614, "epoch": 2261} {"train_loss": -39.672393798828125, "global_step": 273615, "epoch": 2261} {"train_loss": -40.86802291870117, "global_step": 273616, "epoch": 2261} {"train_loss": -38.006195068359375, "global_step": 273617, "epoch": 2261} {"train_loss": -39.81612777709961, "global_step": 273618, "epoch": 2261} {"train_loss": -40.70537185668945, "global_step": 273619, "epoch": 2261} {"train_loss": -41.23151779174805, "global_step": 273620, "epoch": 2261} {"train_loss": -41.727787017822266, "global_step": 273621, "epoch": 2261} {"train_loss": -41.85261917114258, "global_step": 273622, "epoch": 2261} {"train_loss": -40.94539260864258, "global_step": 273623, "epoch": 2261} {"train_loss": -40.768951416015625, "global_step": 273624, "epoch": 2261} {"train_loss": -42.06582260131836, "global_step": 273625, "epoch": 2261} {"train_loss": -40.59603500366211, "global_step": 273626, "epoch": 2261} {"train_loss": -38.16015625, "global_step": 273627, "epoch": 2261} {"train_loss": -38.6513786315918, "global_step": 273628, "epoch": 2261} {"train_loss": -41.52842330932617, "global_step": 273629, "epoch": 2261} {"train_loss": -42.483699798583984, "global_step": 273630, "epoch": 2261} {"train_loss": -38.40153121948242, "global_step": 273631, "epoch": 2261} {"train_loss": -39.39447784423828, "global_step": 273632, "epoch": 2261} {"train_loss": -39.330013275146484, "global_step": 273633, "epoch": 2261} {"train_loss": -40.688167572021484, "global_step": 273634, "epoch": 2261} {"train_loss": -40.639461517333984, "global_step": 273635, "epoch": 2261} {"train_loss": -41.24414825439453, "global_step": 273636, "epoch": 2261} {"train_loss": -41.30659866333008, "global_step": 273637, "epoch": 2261} {"train_loss": -41.09053421020508, "global_step": 273638, "epoch": 2261} {"train_loss": -41.042572021484375, "global_step": 273639, "epoch": 2261} {"train_loss": -40.41616439819336, "global_step": 273640, "epoch": 2261} {"train_loss": -39.14731979370117, "global_step": 273641, "epoch": 2261} {"train_loss": -40.26766586303711, "global_step": 273642, "epoch": 2261} {"train_loss": -34.939266204833984, "global_step": 273643, "epoch": 2261} {"train_loss": -40.61507034301758, "global_step": 273644, "epoch": 2261} {"train_loss": -40.102569580078125, "global_step": 273645, "epoch": 2261} {"train_loss": -39.96857833862305, "global_step": 273646, "epoch": 2261} {"train_loss": -39.46456527709961, "global_step": 273647, "epoch": 2261} {"train_loss": -39.08172607421875, "global_step": 273648, "epoch": 2261} {"train_loss": -36.56903839111328, "global_step": 273649, "epoch": 2261} {"train_loss": -39.5033073425293, "global_step": 273650, "epoch": 2261} {"train_loss": -38.94600296020508, "global_step": 273651, "epoch": 2261} {"train_loss": -39.567840576171875, "global_step": 273652, "epoch": 2261} {"train_loss": -38.80106735229492, "global_step": 273653, "epoch": 2261} {"train_loss": -39.36383819580078, "global_step": 273654, "epoch": 2261} {"train_loss": -40.6770133972168, "global_step": 273655, "epoch": 2261} {"train_loss": -39.57925033569336, "global_step": 273656, "epoch": 2261} {"train_loss": -29.012659072875977, "global_step": 273657, "epoch": 2261} {"train_loss": -38.401485443115234, "global_step": 273658, "epoch": 2261} {"train_loss": -40.215023040771484, "global_step": 273659, "epoch": 2261} {"train_loss": -39.19377899169922, "global_step": 273660, "epoch": 2261} {"train_loss": -39.96824264526367, "global_step": 273661, "epoch": 2261} {"train_loss": -39.51725769042969, "global_step": 273662, "epoch": 2261} {"train_loss": -25.146209716796875, "global_step": 273663, "epoch": 2261} {"train_loss": -38.65443420410156, "global_step": 273664, "epoch": 2261} {"train_loss": -40.15211868286133, "global_step": 273665, "epoch": 2261} {"train_loss": -39.97890853881836, "global_step": 273666, "epoch": 2261} {"train_loss": -37.96363067626953, "global_step": 273667, "epoch": 2261} {"train_loss": -41.32386016845703, "global_step": 273668, "epoch": 2261} {"train_loss": -37.85896682739258, "global_step": 273669, "epoch": 2261} {"train_loss": -41.12520980834961, "global_step": 273670, "epoch": 2261} {"train_loss": -40.333126068115234, "global_step": 273671, "epoch": 2261} {"train_loss": -40.79058837890625, "global_step": 273672, "epoch": 2261} {"train_loss": -39.97031784057617, "global_step": 273673, "epoch": 2261} {"train_loss": -28.8021297454834, "global_step": 273674, "epoch": 2261} {"train_loss": -28.638019561767578, "global_step": 273675, "epoch": 2261} {"train_loss": -37.56901168823242, "global_step": 273676, "epoch": 2261} {"train_loss": -39.692012786865234, "global_step": 273677, "epoch": 2261} {"train_loss": -40.855316162109375, "global_step": 273678, "epoch": 2261} {"train_loss": -39.17452621459961, "global_step": 273679, "epoch": 2261} {"train_loss": -27.366836547851562, "global_step": 273680, "epoch": 2261} {"train_loss": -39.42008590698242, "global_step": 273681, "epoch": 2261} {"train_loss": -35.241111755371094, "global_step": 273682, "epoch": 2261} {"train_loss": -36.7979621887207, "global_step": 273683, "epoch": 2261} {"train_loss": -40.709869384765625, "global_step": 273684, "epoch": 2261} {"train_loss": -39.18955612182617, "global_step": 273685, "epoch": 2261} {"train_loss": -39.6639518737793, "global_step": 273686, "epoch": 2261} {"train_loss": -40.345367431640625, "global_step": 273687, "epoch": 2261} {"train_loss": -40.544647216796875, "global_step": 273688, "epoch": 2261} {"train_loss": -40.471248626708984, "global_step": 273689, "epoch": 2261} {"train_loss": -40.88291931152344, "global_step": 273690, "epoch": 2261} {"train_loss": -39.26505661010742, "global_step": 273691, "epoch": 2261} {"train_loss": -38.8593635559082, "global_step": 273692, "epoch": 2261} {"train_loss": -38.8610725402832, "global_step": 273693, "epoch": 2261} {"train_loss": -38.9516716003418, "global_step": 273694, "epoch": 2261} {"train_loss": -40.46216583251953, "global_step": 273695, "epoch": 2261} {"train_loss": -39.47018051147461, "global_step": 273696, "epoch": 2261} {"train_loss": -41.272796630859375, "global_step": 273697, "epoch": 2261} {"train_loss": -40.20176696777344, "global_step": 273698, "epoch": 2261} {"train_loss": -39.294002532958984, "global_step": 273699, "epoch": 2261} {"train_loss": -40.95090866088867, "global_step": 273700, "epoch": 2261} {"train_loss": -39.87012191646355, "global_step": 273701, "epoch": 2261, "val_loss": 2650045.75} {"train_loss": -38.75457763671875, "global_step": 273702, "epoch": 2262} {"train_loss": -40.76361846923828, "global_step": 273703, "epoch": 2262} {"train_loss": -40.74459457397461, "global_step": 273704, "epoch": 2262} {"train_loss": -41.395599365234375, "global_step": 273705, "epoch": 2262} {"train_loss": -40.634857177734375, "global_step": 273706, "epoch": 2262} {"train_loss": -41.26700210571289, "global_step": 273707, "epoch": 2262} {"train_loss": -39.128822326660156, "global_step": 273708, "epoch": 2262} {"train_loss": -41.02653884887695, "global_step": 273709, "epoch": 2262} {"train_loss": -39.60139083862305, "global_step": 273710, "epoch": 2262} {"train_loss": -41.091670989990234, "global_step": 273711, "epoch": 2262} {"train_loss": -40.95634078979492, "global_step": 273712, "epoch": 2262} {"train_loss": -41.40473175048828, "global_step": 273713, "epoch": 2262} {"train_loss": -41.597171783447266, "global_step": 273714, "epoch": 2262} {"train_loss": -41.49857711791992, "global_step": 273715, "epoch": 2262} {"train_loss": -41.83664321899414, "global_step": 273716, "epoch": 2262} {"train_loss": -41.2884407043457, "global_step": 273717, "epoch": 2262} {"train_loss": -40.84090042114258, "global_step": 273718, "epoch": 2262} {"train_loss": -41.4909553527832, "global_step": 273719, "epoch": 2262} {"train_loss": -41.661617279052734, "global_step": 273720, "epoch": 2262} {"train_loss": -41.97007369995117, "global_step": 273721, "epoch": 2262} {"train_loss": -41.7234992980957, "global_step": 273722, "epoch": 2262} {"train_loss": -42.06431579589844, "global_step": 273723, "epoch": 2262} {"train_loss": -41.126441955566406, "global_step": 273724, "epoch": 2262} {"train_loss": -41.94086837768555, "global_step": 273725, "epoch": 2262} {"train_loss": -42.37205505371094, "global_step": 273726, "epoch": 2262} {"train_loss": -41.84708023071289, "global_step": 273727, "epoch": 2262} {"train_loss": -42.14274978637695, "global_step": 273728, "epoch": 2262} {"train_loss": -40.860076904296875, "global_step": 273729, "epoch": 2262} {"train_loss": -42.2838134765625, "global_step": 273730, "epoch": 2262} {"train_loss": -41.59621810913086, "global_step": 273731, "epoch": 2262} {"train_loss": -42.332122802734375, "global_step": 273732, "epoch": 2262} {"train_loss": -42.340023040771484, "global_step": 273733, "epoch": 2262} {"train_loss": -42.32863235473633, "global_step": 273734, "epoch": 2262} {"train_loss": -42.40913772583008, "global_step": 273735, "epoch": 2262} {"train_loss": -42.57307052612305, "global_step": 273736, "epoch": 2262} {"train_loss": -42.620243072509766, "global_step": 273737, "epoch": 2262} {"train_loss": -42.67666244506836, "global_step": 273738, "epoch": 2262} {"train_loss": -42.191253662109375, "global_step": 273739, "epoch": 2262} {"train_loss": -41.435646057128906, "global_step": 273740, "epoch": 2262} {"train_loss": -42.453060150146484, "global_step": 273741, "epoch": 2262} {"train_loss": -40.24337387084961, "global_step": 273742, "epoch": 2262} {"train_loss": -41.95954513549805, "global_step": 273743, "epoch": 2262} {"train_loss": -42.255088806152344, "global_step": 273744, "epoch": 2262} {"train_loss": -41.57902145385742, "global_step": 273745, "epoch": 2262} {"train_loss": -42.663917541503906, "global_step": 273746, "epoch": 2262} {"train_loss": -42.77714157104492, "global_step": 273747, "epoch": 2262} {"train_loss": -42.53654098510742, "global_step": 273748, "epoch": 2262} {"train_loss": -42.50896072387695, "global_step": 273749, "epoch": 2262} {"train_loss": -42.673580169677734, "global_step": 273750, "epoch": 2262} {"train_loss": -42.88267135620117, "global_step": 273751, "epoch": 2262} {"train_loss": -42.905433654785156, "global_step": 273752, "epoch": 2262} {"train_loss": -42.0596809387207, "global_step": 273753, "epoch": 2262} {"train_loss": -42.8783073425293, "global_step": 273754, "epoch": 2262} {"train_loss": -41.753597259521484, "global_step": 273755, "epoch": 2262} {"train_loss": -42.802120208740234, "global_step": 273756, "epoch": 2262} {"train_loss": -42.78478240966797, "global_step": 273757, "epoch": 2262} {"train_loss": -42.36057662963867, "global_step": 273758, "epoch": 2262} {"train_loss": -42.355770111083984, "global_step": 273759, "epoch": 2262} {"train_loss": -42.691951751708984, "global_step": 273760, "epoch": 2262} {"train_loss": -42.50663375854492, "global_step": 273761, "epoch": 2262} {"train_loss": -42.977752685546875, "global_step": 273762, "epoch": 2262} {"train_loss": -43.09287643432617, "global_step": 273763, "epoch": 2262} {"train_loss": -43.1961784362793, "global_step": 273764, "epoch": 2262} {"train_loss": -42.02799987792969, "global_step": 273765, "epoch": 2262} {"train_loss": -42.98971176147461, "global_step": 273766, "epoch": 2262} {"train_loss": -43.048980712890625, "global_step": 273767, "epoch": 2262} {"train_loss": -42.92049789428711, "global_step": 273768, "epoch": 2262} {"train_loss": -42.96281051635742, "global_step": 273769, "epoch": 2262} {"train_loss": -42.80744552612305, "global_step": 273770, "epoch": 2262} {"train_loss": -42.779327392578125, "global_step": 273771, "epoch": 2262} {"train_loss": -42.731292724609375, "global_step": 273772, "epoch": 2262} {"train_loss": -43.16318893432617, "global_step": 273773, "epoch": 2262} {"train_loss": -42.699127197265625, "global_step": 273774, "epoch": 2262} {"train_loss": -42.67716598510742, "global_step": 273775, "epoch": 2262} {"train_loss": -42.567230224609375, "global_step": 273776, "epoch": 2262} {"train_loss": -42.8613395690918, "global_step": 273777, "epoch": 2262} {"train_loss": -42.58181381225586, "global_step": 273778, "epoch": 2262} {"train_loss": -42.24309158325195, "global_step": 273779, "epoch": 2262} {"train_loss": -41.421104431152344, "global_step": 273780, "epoch": 2262} {"train_loss": -41.64564895629883, "global_step": 273781, "epoch": 2262} {"train_loss": -42.505271911621094, "global_step": 273782, "epoch": 2262} {"train_loss": -42.72382736206055, "global_step": 273783, "epoch": 2262} {"train_loss": -43.365928649902344, "global_step": 273784, "epoch": 2262} {"train_loss": -42.87690353393555, "global_step": 273785, "epoch": 2262} {"train_loss": -42.24076461791992, "global_step": 273786, "epoch": 2262} {"train_loss": -41.03425216674805, "global_step": 273787, "epoch": 2262} {"train_loss": -40.87845993041992, "global_step": 273788, "epoch": 2262} {"train_loss": -41.572750091552734, "global_step": 273789, "epoch": 2262} {"train_loss": -43.415191650390625, "global_step": 273790, "epoch": 2262} {"train_loss": -41.66695785522461, "global_step": 273791, "epoch": 2262} {"train_loss": -39.96839141845703, "global_step": 273792, "epoch": 2262} {"train_loss": -39.47914505004883, "global_step": 273793, "epoch": 2262} {"train_loss": -37.8755989074707, "global_step": 273794, "epoch": 2262} {"train_loss": -39.51419448852539, "global_step": 273795, "epoch": 2262} {"train_loss": -42.55152893066406, "global_step": 273796, "epoch": 2262} {"train_loss": -41.71043395996094, "global_step": 273797, "epoch": 2262} {"train_loss": -41.83552932739258, "global_step": 273798, "epoch": 2262} {"train_loss": -42.658599853515625, "global_step": 273799, "epoch": 2262} {"train_loss": -40.1001091003418, "global_step": 273800, "epoch": 2262} {"train_loss": -38.64366912841797, "global_step": 273801, "epoch": 2262} {"train_loss": -40.55039596557617, "global_step": 273802, "epoch": 2262} {"train_loss": -42.47410202026367, "global_step": 273803, "epoch": 2262} {"train_loss": -40.511451721191406, "global_step": 273804, "epoch": 2262} {"train_loss": -41.355281829833984, "global_step": 273805, "epoch": 2262} {"train_loss": -41.77896499633789, "global_step": 273806, "epoch": 2262} {"train_loss": -37.79862594604492, "global_step": 273807, "epoch": 2262} {"train_loss": -41.57831573486328, "global_step": 273808, "epoch": 2262} {"train_loss": -41.54243850708008, "global_step": 273809, "epoch": 2262} {"train_loss": -39.78367233276367, "global_step": 273810, "epoch": 2262} {"train_loss": -42.34739303588867, "global_step": 273811, "epoch": 2262} {"train_loss": -38.99413299560547, "global_step": 273812, "epoch": 2262} {"train_loss": -42.89352035522461, "global_step": 273813, "epoch": 2262} {"train_loss": -39.435768127441406, "global_step": 273814, "epoch": 2262} {"train_loss": -41.15855026245117, "global_step": 273815, "epoch": 2262} {"train_loss": -41.050140380859375, "global_step": 273816, "epoch": 2262} {"train_loss": -41.205116271972656, "global_step": 273817, "epoch": 2262} {"train_loss": -42.025875091552734, "global_step": 273818, "epoch": 2262} {"train_loss": -41.234718322753906, "global_step": 273819, "epoch": 2262} {"train_loss": -42.8360710144043, "global_step": 273820, "epoch": 2262} {"train_loss": -41.85142517089844, "global_step": 273821, "epoch": 2262} {"train_loss": -41.753652619921475, "global_step": 273822, "epoch": 2262, "val_loss": 2698721.5} {"train_loss": -41.9108772277832, "global_step": 273823, "epoch": 2263} {"train_loss": -42.27920150756836, "global_step": 273824, "epoch": 2263} {"train_loss": -41.9627571105957, "global_step": 273825, "epoch": 2263} {"train_loss": -42.40475082397461, "global_step": 273826, "epoch": 2263} {"train_loss": -42.75767135620117, "global_step": 273827, "epoch": 2263} {"train_loss": -42.5427360534668, "global_step": 273828, "epoch": 2263} {"train_loss": -43.02531051635742, "global_step": 273829, "epoch": 2263} {"train_loss": -42.6827507019043, "global_step": 273830, "epoch": 2263} {"train_loss": -42.627296447753906, "global_step": 273831, "epoch": 2263} {"train_loss": -43.0502815246582, "global_step": 273832, "epoch": 2263} {"train_loss": -42.18206787109375, "global_step": 273833, "epoch": 2263} {"train_loss": -43.0513916015625, "global_step": 273834, "epoch": 2263} {"train_loss": -42.86371612548828, "global_step": 273835, "epoch": 2263} {"train_loss": -42.267860412597656, "global_step": 273836, "epoch": 2263} {"train_loss": -42.971229553222656, "global_step": 273837, "epoch": 2263} {"train_loss": -42.851173400878906, "global_step": 273838, "epoch": 2263} {"train_loss": -43.29096221923828, "global_step": 273839, "epoch": 2263} {"train_loss": -42.75059509277344, "global_step": 273840, "epoch": 2263} {"train_loss": -43.083412170410156, "global_step": 273841, "epoch": 2263} {"train_loss": -42.85673141479492, "global_step": 273842, "epoch": 2263} {"train_loss": -43.387657165527344, "global_step": 273843, "epoch": 2263} {"train_loss": -42.92622756958008, "global_step": 273844, "epoch": 2263} {"train_loss": -43.06490707397461, "global_step": 273845, "epoch": 2263} {"train_loss": -42.990840911865234, "global_step": 273846, "epoch": 2263} {"train_loss": -43.04417419433594, "global_step": 273847, "epoch": 2263} {"train_loss": -43.673500061035156, "global_step": 273848, "epoch": 2263} {"train_loss": -42.9152717590332, "global_step": 273849, "epoch": 2263} {"train_loss": -43.52981185913086, "global_step": 273850, "epoch": 2263} {"train_loss": -43.327919006347656, "global_step": 273851, "epoch": 2263} {"train_loss": -42.24306106567383, "global_step": 273852, "epoch": 2263} {"train_loss": -43.059608459472656, "global_step": 273853, "epoch": 2263} {"train_loss": -43.594261169433594, "global_step": 273854, "epoch": 2263} {"train_loss": -42.953338623046875, "global_step": 273855, "epoch": 2263} {"train_loss": -43.47117233276367, "global_step": 273856, "epoch": 2263} {"train_loss": -43.536376953125, "global_step": 273857, "epoch": 2263} {"train_loss": -43.329158782958984, "global_step": 273858, "epoch": 2263} {"train_loss": -43.1552848815918, "global_step": 273859, "epoch": 2263} {"train_loss": -43.04380416870117, "global_step": 273860, "epoch": 2263} {"train_loss": -43.07963943481445, "global_step": 273861, "epoch": 2263} {"train_loss": -43.25870895385742, "global_step": 273862, "epoch": 2263} {"train_loss": -43.59334182739258, "global_step": 273863, "epoch": 2263} {"train_loss": -43.28060531616211, "global_step": 273864, "epoch": 2263} {"train_loss": -43.333072662353516, "global_step": 273865, "epoch": 2263} {"train_loss": -43.64924240112305, "global_step": 273866, "epoch": 2263} {"train_loss": -42.897003173828125, "global_step": 273867, "epoch": 2263} {"train_loss": -43.24733352661133, "global_step": 273868, "epoch": 2263} {"train_loss": -43.06260299682617, "global_step": 273869, "epoch": 2263} {"train_loss": -43.1851921081543, "global_step": 273870, "epoch": 2263} {"train_loss": -43.54506301879883, "global_step": 273871, "epoch": 2263} {"train_loss": -43.52561569213867, "global_step": 273872, "epoch": 2263} {"train_loss": -43.32024002075195, "global_step": 273873, "epoch": 2263} {"train_loss": -43.61538314819336, "global_step": 273874, "epoch": 2263} {"train_loss": -43.953975677490234, "global_step": 273875, "epoch": 2263} {"train_loss": -43.993228912353516, "global_step": 273876, "epoch": 2263} {"train_loss": -43.505428314208984, "global_step": 273877, "epoch": 2263} {"train_loss": -43.37929916381836, "global_step": 273878, "epoch": 2263} {"train_loss": -43.1711540222168, "global_step": 273879, "epoch": 2263} {"train_loss": -43.56637954711914, "global_step": 273880, "epoch": 2263} {"train_loss": -43.722999572753906, "global_step": 273881, "epoch": 2263} {"train_loss": -43.486026763916016, "global_step": 273882, "epoch": 2263} {"train_loss": -42.97486114501953, "global_step": 273883, "epoch": 2263} {"train_loss": -42.2025260925293, "global_step": 273884, "epoch": 2263} {"train_loss": -42.20672607421875, "global_step": 273885, "epoch": 2263} {"train_loss": -42.842567443847656, "global_step": 273886, "epoch": 2263} {"train_loss": -43.119022369384766, "global_step": 273887, "epoch": 2263} {"train_loss": -41.55440902709961, "global_step": 273888, "epoch": 2263} {"train_loss": -42.04343795776367, "global_step": 273889, "epoch": 2263} {"train_loss": -40.94025421142578, "global_step": 273890, "epoch": 2263} {"train_loss": -41.87819290161133, "global_step": 273891, "epoch": 2263} {"train_loss": -41.813411712646484, "global_step": 273892, "epoch": 2263} {"train_loss": -42.992103576660156, "global_step": 273893, "epoch": 2263} {"train_loss": -42.421363830566406, "global_step": 273894, "epoch": 2263} {"train_loss": -43.162784576416016, "global_step": 273895, "epoch": 2263} {"train_loss": -42.5079231262207, "global_step": 273896, "epoch": 2263} {"train_loss": -41.63258743286133, "global_step": 273897, "epoch": 2263} {"train_loss": -42.435096740722656, "global_step": 273898, "epoch": 2263} {"train_loss": -42.91461944580078, "global_step": 273899, "epoch": 2263} {"train_loss": -43.369354248046875, "global_step": 273900, "epoch": 2263} {"train_loss": -42.62924575805664, "global_step": 273901, "epoch": 2263} {"train_loss": -42.70429611206055, "global_step": 273902, "epoch": 2263} {"train_loss": -42.43767166137695, "global_step": 273903, "epoch": 2263} {"train_loss": -42.15458297729492, "global_step": 273904, "epoch": 2263} {"train_loss": -42.90838623046875, "global_step": 273905, "epoch": 2263} {"train_loss": -42.77680206298828, "global_step": 273906, "epoch": 2263} {"train_loss": -42.44179153442383, "global_step": 273907, "epoch": 2263} {"train_loss": -42.807491302490234, "global_step": 273908, "epoch": 2263} {"train_loss": -42.0365104675293, "global_step": 273909, "epoch": 2263} {"train_loss": -41.08822250366211, "global_step": 273910, "epoch": 2263} {"train_loss": -42.780906677246094, "global_step": 273911, "epoch": 2263} {"train_loss": -43.203182220458984, "global_step": 273912, "epoch": 2263} {"train_loss": -42.8007926940918, "global_step": 273913, "epoch": 2263} {"train_loss": -42.35198974609375, "global_step": 273914, "epoch": 2263} {"train_loss": -43.05470657348633, "global_step": 273915, "epoch": 2263} {"train_loss": -42.82757568359375, "global_step": 273916, "epoch": 2263} {"train_loss": -42.21243667602539, "global_step": 273917, "epoch": 2263} {"train_loss": -41.59471893310547, "global_step": 273918, "epoch": 2263} {"train_loss": -40.742061614990234, "global_step": 273919, "epoch": 2263} {"train_loss": -42.17827224731445, "global_step": 273920, "epoch": 2263} {"train_loss": -40.324615478515625, "global_step": 273921, "epoch": 2263} {"train_loss": -41.606876373291016, "global_step": 273922, "epoch": 2263} {"train_loss": -39.77309036254883, "global_step": 273923, "epoch": 2263} {"train_loss": -41.73781204223633, "global_step": 273924, "epoch": 2263} {"train_loss": -40.84095764160156, "global_step": 273925, "epoch": 2263} {"train_loss": -39.43596649169922, "global_step": 273926, "epoch": 2263} {"train_loss": -42.176719665527344, "global_step": 273927, "epoch": 2263} {"train_loss": -40.07948303222656, "global_step": 273928, "epoch": 2263} {"train_loss": -39.8134880065918, "global_step": 273929, "epoch": 2263} {"train_loss": -41.890193939208984, "global_step": 273930, "epoch": 2263} {"train_loss": -40.42295455932617, "global_step": 273931, "epoch": 2263} {"train_loss": -39.947975158691406, "global_step": 273932, "epoch": 2263} {"train_loss": -41.8920783996582, "global_step": 273933, "epoch": 2263} {"train_loss": -39.317481994628906, "global_step": 273934, "epoch": 2263} {"train_loss": -40.5427360534668, "global_step": 273935, "epoch": 2263} {"train_loss": -41.36566925048828, "global_step": 273936, "epoch": 2263} {"train_loss": -41.06764602661133, "global_step": 273937, "epoch": 2263} {"train_loss": -40.40190124511719, "global_step": 273938, "epoch": 2263} {"train_loss": -41.58127975463867, "global_step": 273939, "epoch": 2263} {"train_loss": -41.462581634521484, "global_step": 273940, "epoch": 2263} {"train_loss": -40.9582633972168, "global_step": 273941, "epoch": 2263} {"train_loss": -42.40313720703125, "global_step": 273942, "epoch": 2263} {"train_loss": -42.458260843576475, "global_step": 273943, "epoch": 2263, "val_loss": 2735318.75} {"train_loss": -41.25168991088867, "global_step": 273944, "epoch": 2264} {"train_loss": -42.55306625366211, "global_step": 273945, "epoch": 2264} {"train_loss": -41.18711853027344, "global_step": 273946, "epoch": 2264} {"train_loss": -42.48763656616211, "global_step": 273947, "epoch": 2264} {"train_loss": -41.74021530151367, "global_step": 273948, "epoch": 2264} {"train_loss": -42.31568145751953, "global_step": 273949, "epoch": 2264} {"train_loss": -43.135494232177734, "global_step": 273950, "epoch": 2264} {"train_loss": -42.55142593383789, "global_step": 273951, "epoch": 2264} {"train_loss": -43.045082092285156, "global_step": 273952, "epoch": 2264} {"train_loss": -42.39215850830078, "global_step": 273953, "epoch": 2264} {"train_loss": -42.391510009765625, "global_step": 273954, "epoch": 2264} {"train_loss": -42.54896926879883, "global_step": 273955, "epoch": 2264} {"train_loss": -42.880760192871094, "global_step": 273956, "epoch": 2264} {"train_loss": -42.85515213012695, "global_step": 273957, "epoch": 2264} {"train_loss": -42.9386100769043, "global_step": 273958, "epoch": 2264} {"train_loss": -43.36533737182617, "global_step": 273959, "epoch": 2264} {"train_loss": -42.903316497802734, "global_step": 273960, "epoch": 2264} {"train_loss": -43.320777893066406, "global_step": 273961, "epoch": 2264} {"train_loss": -43.20347213745117, "global_step": 273962, "epoch": 2264} {"train_loss": -42.5482177734375, "global_step": 273963, "epoch": 2264} {"train_loss": -43.0865364074707, "global_step": 273964, "epoch": 2264} {"train_loss": -42.9464225769043, "global_step": 273965, "epoch": 2264} {"train_loss": -43.109378814697266, "global_step": 273966, "epoch": 2264} {"train_loss": -42.8475456237793, "global_step": 273967, "epoch": 2264} {"train_loss": -42.61335372924805, "global_step": 273968, "epoch": 2264} {"train_loss": -43.6312141418457, "global_step": 273969, "epoch": 2264} {"train_loss": -42.67095947265625, "global_step": 273970, "epoch": 2264} {"train_loss": -42.74707794189453, "global_step": 273971, "epoch": 2264} {"train_loss": -42.52280807495117, "global_step": 273972, "epoch": 2264} {"train_loss": -42.8039436340332, "global_step": 273973, "epoch": 2264} {"train_loss": -43.466705322265625, "global_step": 273974, "epoch": 2264} {"train_loss": -42.629791259765625, "global_step": 273975, "epoch": 2264} {"train_loss": -42.778656005859375, "global_step": 273976, "epoch": 2264} {"train_loss": -42.65305709838867, "global_step": 273977, "epoch": 2264} {"train_loss": -43.687294006347656, "global_step": 273978, "epoch": 2264} {"train_loss": -43.312889099121094, "global_step": 273979, "epoch": 2264} {"train_loss": -42.668190002441406, "global_step": 273980, "epoch": 2264} {"train_loss": -43.42612838745117, "global_step": 273981, "epoch": 2264} {"train_loss": -43.26408004760742, "global_step": 273982, "epoch": 2264} {"train_loss": -42.907508850097656, "global_step": 273983, "epoch": 2264} {"train_loss": -43.58314895629883, "global_step": 273984, "epoch": 2264} {"train_loss": -43.06782913208008, "global_step": 273985, "epoch": 2264} {"train_loss": -43.18170166015625, "global_step": 273986, "epoch": 2264} {"train_loss": -42.98484420776367, "global_step": 273987, "epoch": 2264} {"train_loss": -43.63218307495117, "global_step": 273988, "epoch": 2264} {"train_loss": -43.745201110839844, "global_step": 273989, "epoch": 2264} {"train_loss": -43.31718063354492, "global_step": 273990, "epoch": 2264} {"train_loss": -42.2967643737793, "global_step": 273991, "epoch": 2264} {"train_loss": -43.153053283691406, "global_step": 273992, "epoch": 2264} {"train_loss": -42.54323196411133, "global_step": 273993, "epoch": 2264} {"train_loss": -43.318702697753906, "global_step": 273994, "epoch": 2264} {"train_loss": -42.99220657348633, "global_step": 273995, "epoch": 2264} {"train_loss": -42.653541564941406, "global_step": 273996, "epoch": 2264} {"train_loss": -42.204158782958984, "global_step": 273997, "epoch": 2264} {"train_loss": -43.13008499145508, "global_step": 273998, "epoch": 2264} {"train_loss": -43.327327728271484, "global_step": 273999, "epoch": 2264} {"train_loss": -42.4509391784668, "global_step": 274000, "epoch": 2264} {"train_loss": -42.03949737548828, "global_step": 274001, "epoch": 2264} {"train_loss": -41.56951141357422, "global_step": 274002, "epoch": 2264} {"train_loss": -43.94363021850586, "global_step": 274003, "epoch": 2264} {"train_loss": -42.85988998413086, "global_step": 274004, "epoch": 2264} {"train_loss": -42.0923957824707, "global_step": 274005, "epoch": 2264} {"train_loss": -42.5712890625, "global_step": 274006, "epoch": 2264} {"train_loss": -43.120399475097656, "global_step": 274007, "epoch": 2264} {"train_loss": -43.52631378173828, "global_step": 274008, "epoch": 2264} {"train_loss": -43.119869232177734, "global_step": 274009, "epoch": 2264} {"train_loss": -42.42866134643555, "global_step": 274010, "epoch": 2264} {"train_loss": -42.38032150268555, "global_step": 274011, "epoch": 2264} {"train_loss": -43.72251892089844, "global_step": 274012, "epoch": 2264} {"train_loss": -43.47844696044922, "global_step": 274013, "epoch": 2264} {"train_loss": -42.513282775878906, "global_step": 274014, "epoch": 2264} {"train_loss": -43.68910598754883, "global_step": 274015, "epoch": 2264} {"train_loss": -42.25739288330078, "global_step": 274016, "epoch": 2264} {"train_loss": -43.096099853515625, "global_step": 274017, "epoch": 2264} {"train_loss": -42.50187301635742, "global_step": 274018, "epoch": 2264} {"train_loss": -43.11555099487305, "global_step": 274019, "epoch": 2264} {"train_loss": -42.811100006103516, "global_step": 274020, "epoch": 2264} {"train_loss": -43.392967224121094, "global_step": 274021, "epoch": 2264} {"train_loss": -42.95054626464844, "global_step": 274022, "epoch": 2264} {"train_loss": -43.777042388916016, "global_step": 274023, "epoch": 2264} {"train_loss": -43.01213455200195, "global_step": 274024, "epoch": 2264} {"train_loss": -42.71057891845703, "global_step": 274025, "epoch": 2264} {"train_loss": -42.94911575317383, "global_step": 274026, "epoch": 2264} {"train_loss": -42.712520599365234, "global_step": 274027, "epoch": 2264} {"train_loss": -43.13462448120117, "global_step": 274028, "epoch": 2264} {"train_loss": -43.249488830566406, "global_step": 274029, "epoch": 2264} {"train_loss": -42.27334213256836, "global_step": 274030, "epoch": 2264} {"train_loss": -42.31095886230469, "global_step": 274031, "epoch": 2264} {"train_loss": -42.90377426147461, "global_step": 274032, "epoch": 2264} {"train_loss": -40.6402702331543, "global_step": 274033, "epoch": 2264} {"train_loss": -42.67156219482422, "global_step": 274034, "epoch": 2264} {"train_loss": -42.8327751159668, "global_step": 274035, "epoch": 2264} {"train_loss": -43.39604187011719, "global_step": 274036, "epoch": 2264} {"train_loss": -43.68024826049805, "global_step": 274037, "epoch": 2264} {"train_loss": -43.3828239440918, "global_step": 274038, "epoch": 2264} {"train_loss": -43.020809173583984, "global_step": 274039, "epoch": 2264} {"train_loss": -41.561279296875, "global_step": 274040, "epoch": 2264} {"train_loss": -41.95600509643555, "global_step": 274041, "epoch": 2264} {"train_loss": -43.31533432006836, "global_step": 274042, "epoch": 2264} {"train_loss": -43.17850875854492, "global_step": 274043, "epoch": 2264} {"train_loss": -42.06693649291992, "global_step": 274044, "epoch": 2264} {"train_loss": -43.674110412597656, "global_step": 274045, "epoch": 2264} {"train_loss": -43.066097259521484, "global_step": 274046, "epoch": 2264} {"train_loss": -43.64811325073242, "global_step": 274047, "epoch": 2264} {"train_loss": -43.274654388427734, "global_step": 274048, "epoch": 2264} {"train_loss": -39.65536117553711, "global_step": 274049, "epoch": 2264} {"train_loss": -42.934940338134766, "global_step": 274050, "epoch": 2264} {"train_loss": -43.251155853271484, "global_step": 274051, "epoch": 2264} {"train_loss": -42.77244186401367, "global_step": 274052, "epoch": 2264} {"train_loss": -43.18244552612305, "global_step": 274053, "epoch": 2264} {"train_loss": -43.1524543762207, "global_step": 274054, "epoch": 2264} {"train_loss": -43.31910705566406, "global_step": 274055, "epoch": 2264} {"train_loss": -42.79604721069336, "global_step": 274056, "epoch": 2264} {"train_loss": -41.612831115722656, "global_step": 274057, "epoch": 2264} {"train_loss": -40.78143310546875, "global_step": 274058, "epoch": 2264} {"train_loss": -42.65271759033203, "global_step": 274059, "epoch": 2264} {"train_loss": -42.197792053222656, "global_step": 274060, "epoch": 2264} {"train_loss": -39.175628662109375, "global_step": 274061, "epoch": 2264} {"train_loss": -40.917884826660156, "global_step": 274062, "epoch": 2264} {"train_loss": -41.79050827026367, "global_step": 274063, "epoch": 2264} {"train_loss": -42.74797798976425, "global_step": 274064, "epoch": 2264, "val_loss": 2728757.75} {"train_loss": -43.02183151245117, "global_step": 274065, "epoch": 2265} {"train_loss": -39.63069152832031, "global_step": 274066, "epoch": 2265} {"train_loss": -36.43801498413086, "global_step": 274067, "epoch": 2265} {"train_loss": -40.314327239990234, "global_step": 274068, "epoch": 2265} {"train_loss": -35.88274383544922, "global_step": 274069, "epoch": 2265} {"train_loss": -36.49199295043945, "global_step": 274070, "epoch": 2265} {"train_loss": -40.00916290283203, "global_step": 274071, "epoch": 2265} {"train_loss": -40.57856369018555, "global_step": 274072, "epoch": 2265} {"train_loss": -35.41469955444336, "global_step": 274073, "epoch": 2265} {"train_loss": -39.00545120239258, "global_step": 274074, "epoch": 2265} {"train_loss": -42.407676696777344, "global_step": 274075, "epoch": 2265} {"train_loss": -38.30378341674805, "global_step": 274076, "epoch": 2265} {"train_loss": -40.375823974609375, "global_step": 274077, "epoch": 2265} {"train_loss": -41.59882354736328, "global_step": 274078, "epoch": 2265} {"train_loss": -41.415374755859375, "global_step": 274079, "epoch": 2265} {"train_loss": -42.208675384521484, "global_step": 274080, "epoch": 2265} {"train_loss": -38.25874710083008, "global_step": 274081, "epoch": 2265} {"train_loss": -39.12238693237305, "global_step": 274082, "epoch": 2265} {"train_loss": -40.72840881347656, "global_step": 274083, "epoch": 2265} {"train_loss": -42.048377990722656, "global_step": 274084, "epoch": 2265} {"train_loss": -40.98408126831055, "global_step": 274085, "epoch": 2265} {"train_loss": -41.393951416015625, "global_step": 274086, "epoch": 2265} {"train_loss": -40.697776794433594, "global_step": 274087, "epoch": 2265} {"train_loss": -40.98125076293945, "global_step": 274088, "epoch": 2265} {"train_loss": -40.49110794067383, "global_step": 274089, "epoch": 2265} {"train_loss": -41.425350189208984, "global_step": 274090, "epoch": 2265} {"train_loss": -40.8502311706543, "global_step": 274091, "epoch": 2265} {"train_loss": -42.10274887084961, "global_step": 274092, "epoch": 2265} {"train_loss": -41.28742599487305, "global_step": 274093, "epoch": 2265} {"train_loss": -40.480953216552734, "global_step": 274094, "epoch": 2265} {"train_loss": -38.54133987426758, "global_step": 274095, "epoch": 2265} {"train_loss": -41.54543685913086, "global_step": 274096, "epoch": 2265} {"train_loss": -41.54106521606445, "global_step": 274097, "epoch": 2265} {"train_loss": -41.601985931396484, "global_step": 274098, "epoch": 2265} {"train_loss": -39.8383674621582, "global_step": 274099, "epoch": 2265} {"train_loss": -42.0350456237793, "global_step": 274100, "epoch": 2265} {"train_loss": -41.88069534301758, "global_step": 274101, "epoch": 2265} {"train_loss": -38.23170852661133, "global_step": 274102, "epoch": 2265} {"train_loss": -40.91582107543945, "global_step": 274103, "epoch": 2265} {"train_loss": -39.10978317260742, "global_step": 274104, "epoch": 2265} {"train_loss": -40.44358444213867, "global_step": 274105, "epoch": 2265} {"train_loss": -41.790618896484375, "global_step": 274106, "epoch": 2265} {"train_loss": -41.5184440612793, "global_step": 274107, "epoch": 2265} {"train_loss": -41.763423919677734, "global_step": 274108, "epoch": 2265} {"train_loss": -40.9662971496582, "global_step": 274109, "epoch": 2265} {"train_loss": -41.21533966064453, "global_step": 274110, "epoch": 2265} {"train_loss": -39.150081634521484, "global_step": 274111, "epoch": 2265} {"train_loss": -42.18095397949219, "global_step": 274112, "epoch": 2265} {"train_loss": -41.03217697143555, "global_step": 274113, "epoch": 2265} {"train_loss": -40.72333908081055, "global_step": 274114, "epoch": 2265} {"train_loss": -42.35993957519531, "global_step": 274115, "epoch": 2265} {"train_loss": -41.652442932128906, "global_step": 274116, "epoch": 2265} {"train_loss": -42.13924026489258, "global_step": 274117, "epoch": 2265} {"train_loss": -40.748207092285156, "global_step": 274118, "epoch": 2265} {"train_loss": -41.982540130615234, "global_step": 274119, "epoch": 2265} {"train_loss": -40.04566955566406, "global_step": 274120, "epoch": 2265} {"train_loss": -42.68935775756836, "global_step": 274121, "epoch": 2265} {"train_loss": -41.19138717651367, "global_step": 274122, "epoch": 2265} {"train_loss": -42.76312255859375, "global_step": 274123, "epoch": 2265} {"train_loss": -40.18270492553711, "global_step": 274124, "epoch": 2265} {"train_loss": -37.28129196166992, "global_step": 274125, "epoch": 2265} {"train_loss": -39.91256332397461, "global_step": 274126, "epoch": 2265} {"train_loss": -41.116371154785156, "global_step": 274127, "epoch": 2265} {"train_loss": -42.175899505615234, "global_step": 274128, "epoch": 2265} {"train_loss": -41.28737258911133, "global_step": 274129, "epoch": 2265} {"train_loss": -39.7656364440918, "global_step": 274130, "epoch": 2265} {"train_loss": -42.585147857666016, "global_step": 274131, "epoch": 2265} {"train_loss": -42.49540328979492, "global_step": 274132, "epoch": 2265} {"train_loss": -42.897674560546875, "global_step": 274133, "epoch": 2265} {"train_loss": -41.06790542602539, "global_step": 274134, "epoch": 2265} {"train_loss": -42.700050354003906, "global_step": 274135, "epoch": 2265} {"train_loss": -42.10652542114258, "global_step": 274136, "epoch": 2265} {"train_loss": -41.04736328125, "global_step": 274137, "epoch": 2265} {"train_loss": -42.19437789916992, "global_step": 274138, "epoch": 2265} {"train_loss": -40.803646087646484, "global_step": 274139, "epoch": 2265} {"train_loss": -42.41511917114258, "global_step": 274140, "epoch": 2265} {"train_loss": -40.1121940612793, "global_step": 274141, "epoch": 2265} {"train_loss": -41.49557876586914, "global_step": 274142, "epoch": 2265} {"train_loss": -40.721920013427734, "global_step": 274143, "epoch": 2265} {"train_loss": -42.52846145629883, "global_step": 274144, "epoch": 2265} {"train_loss": -42.2700309753418, "global_step": 274145, "epoch": 2265} {"train_loss": -42.01054382324219, "global_step": 274146, "epoch": 2265} {"train_loss": -41.90761184692383, "global_step": 274147, "epoch": 2265} {"train_loss": -42.58066940307617, "global_step": 274148, "epoch": 2265} {"train_loss": -41.92385482788086, "global_step": 274149, "epoch": 2265} {"train_loss": -41.521881103515625, "global_step": 274150, "epoch": 2265} {"train_loss": -42.59969711303711, "global_step": 274151, "epoch": 2265} {"train_loss": -42.53178405761719, "global_step": 274152, "epoch": 2265} {"train_loss": -43.49968338012695, "global_step": 274153, "epoch": 2265} {"train_loss": -42.73958969116211, "global_step": 274154, "epoch": 2265} {"train_loss": -42.587642669677734, "global_step": 274155, "epoch": 2265} {"train_loss": -43.06412887573242, "global_step": 274156, "epoch": 2265} {"train_loss": -42.99125289916992, "global_step": 274157, "epoch": 2265} {"train_loss": -42.591976165771484, "global_step": 274158, "epoch": 2265} {"train_loss": -43.15401077270508, "global_step": 274159, "epoch": 2265} {"train_loss": -43.104305267333984, "global_step": 274160, "epoch": 2265} {"train_loss": -43.09712219238281, "global_step": 274161, "epoch": 2265} {"train_loss": -42.76764678955078, "global_step": 274162, "epoch": 2265} {"train_loss": -41.074378967285156, "global_step": 274163, "epoch": 2265} {"train_loss": -42.31899642944336, "global_step": 274164, "epoch": 2265} {"train_loss": -42.87995147705078, "global_step": 274165, "epoch": 2265} {"train_loss": -42.880043029785156, "global_step": 274166, "epoch": 2265} {"train_loss": -43.17700958251953, "global_step": 274167, "epoch": 2265} {"train_loss": -42.32062911987305, "global_step": 274168, "epoch": 2265} {"train_loss": -42.460693359375, "global_step": 274169, "epoch": 2265} {"train_loss": -41.05202102661133, "global_step": 274170, "epoch": 2265} {"train_loss": -40.434967041015625, "global_step": 274171, "epoch": 2265} {"train_loss": -43.60091781616211, "global_step": 274172, "epoch": 2265} {"train_loss": -41.302757263183594, "global_step": 274173, "epoch": 2265} {"train_loss": -41.89509201049805, "global_step": 274174, "epoch": 2265} {"train_loss": -43.25236511230469, "global_step": 274175, "epoch": 2265} {"train_loss": -37.49332046508789, "global_step": 274176, "epoch": 2265} {"train_loss": -42.04763412475586, "global_step": 274177, "epoch": 2265} {"train_loss": -43.29535675048828, "global_step": 274178, "epoch": 2265} {"train_loss": -42.2001838684082, "global_step": 274179, "epoch": 2265} {"train_loss": -37.689979553222656, "global_step": 274180, "epoch": 2265} {"train_loss": -42.440086364746094, "global_step": 274181, "epoch": 2265} {"train_loss": -41.41169357299805, "global_step": 274182, "epoch": 2265} {"train_loss": -41.13496017456055, "global_step": 274183, "epoch": 2265} {"train_loss": -42.64458084106445, "global_step": 274184, "epoch": 2265} {"train_loss": -41.2272105256388, "global_step": 274185, "epoch": 2265, "val_loss": 3353977.25} {"train_loss": -41.710182189941406, "global_step": 274186, "epoch": 2266} {"train_loss": -42.14137649536133, "global_step": 274187, "epoch": 2266} {"train_loss": -41.12504959106445, "global_step": 274188, "epoch": 2266} {"train_loss": -42.7232780456543, "global_step": 274189, "epoch": 2266} {"train_loss": -41.94455337524414, "global_step": 274190, "epoch": 2266} {"train_loss": -43.376644134521484, "global_step": 274191, "epoch": 2266} {"train_loss": -41.22913360595703, "global_step": 274192, "epoch": 2266} {"train_loss": -42.939300537109375, "global_step": 274193, "epoch": 2266} {"train_loss": -42.95383071899414, "global_step": 274194, "epoch": 2266} {"train_loss": -42.944557189941406, "global_step": 274195, "epoch": 2266} {"train_loss": -42.66437911987305, "global_step": 274196, "epoch": 2266} {"train_loss": -43.105777740478516, "global_step": 274197, "epoch": 2266} {"train_loss": -42.69405746459961, "global_step": 274198, "epoch": 2266} {"train_loss": -42.615753173828125, "global_step": 274199, "epoch": 2266} {"train_loss": -41.14158248901367, "global_step": 274200, "epoch": 2266} {"train_loss": -43.056495666503906, "global_step": 274201, "epoch": 2266} {"train_loss": -42.848182678222656, "global_step": 274202, "epoch": 2266} {"train_loss": -43.21796798706055, "global_step": 274203, "epoch": 2266} {"train_loss": -43.09367752075195, "global_step": 274204, "epoch": 2266} {"train_loss": -42.34602737426758, "global_step": 274205, "epoch": 2266} {"train_loss": -43.64771270751953, "global_step": 274206, "epoch": 2266} {"train_loss": -42.31151580810547, "global_step": 274207, "epoch": 2266} {"train_loss": -42.20821762084961, "global_step": 274208, "epoch": 2266} {"train_loss": -42.42277145385742, "global_step": 274209, "epoch": 2266} {"train_loss": -42.19631576538086, "global_step": 274210, "epoch": 2266} {"train_loss": -43.06914520263672, "global_step": 274211, "epoch": 2266} {"train_loss": -43.5728759765625, "global_step": 274212, "epoch": 2266} {"train_loss": -43.70740509033203, "global_step": 274213, "epoch": 2266} {"train_loss": -43.22193145751953, "global_step": 274214, "epoch": 2266} {"train_loss": -43.2618522644043, "global_step": 274215, "epoch": 2266} {"train_loss": -42.40715789794922, "global_step": 274216, "epoch": 2266} {"train_loss": -42.516414642333984, "global_step": 274217, "epoch": 2266} {"train_loss": -43.1385498046875, "global_step": 274218, "epoch": 2266} {"train_loss": -43.3342399597168, "global_step": 274219, "epoch": 2266} {"train_loss": -43.647727966308594, "global_step": 274220, "epoch": 2266} {"train_loss": -41.823055267333984, "global_step": 274221, "epoch": 2266} {"train_loss": -43.210811614990234, "global_step": 274222, "epoch": 2266} {"train_loss": -41.83393096923828, "global_step": 274223, "epoch": 2266} {"train_loss": -42.668697357177734, "global_step": 274224, "epoch": 2266} {"train_loss": -43.12278366088867, "global_step": 274225, "epoch": 2266} {"train_loss": -43.051979064941406, "global_step": 274226, "epoch": 2266} {"train_loss": -42.626590728759766, "global_step": 274227, "epoch": 2266} {"train_loss": -43.803558349609375, "global_step": 274228, "epoch": 2266} {"train_loss": -42.14923858642578, "global_step": 274229, "epoch": 2266} {"train_loss": -42.78875732421875, "global_step": 274230, "epoch": 2266} {"train_loss": -40.44964599609375, "global_step": 274231, "epoch": 2266} {"train_loss": -41.657264709472656, "global_step": 274232, "epoch": 2266} {"train_loss": -43.611019134521484, "global_step": 274233, "epoch": 2266} {"train_loss": -40.23533630371094, "global_step": 274234, "epoch": 2266} {"train_loss": -41.00335693359375, "global_step": 274235, "epoch": 2266} {"train_loss": -40.51861572265625, "global_step": 274236, "epoch": 2266} {"train_loss": -40.98026657104492, "global_step": 274237, "epoch": 2266} {"train_loss": -38.1884765625, "global_step": 274238, "epoch": 2266} {"train_loss": -41.87244415283203, "global_step": 274239, "epoch": 2266} {"train_loss": -40.50322341918945, "global_step": 274240, "epoch": 2266} {"train_loss": -41.29575729370117, "global_step": 274241, "epoch": 2266} {"train_loss": -40.26983642578125, "global_step": 274242, "epoch": 2266} {"train_loss": -38.64886474609375, "global_step": 274243, "epoch": 2266} {"train_loss": -33.347469329833984, "global_step": 274244, "epoch": 2266} {"train_loss": -38.54771041870117, "global_step": 274245, "epoch": 2266} {"train_loss": -40.32075119018555, "global_step": 274246, "epoch": 2266} {"train_loss": -39.25654602050781, "global_step": 274247, "epoch": 2266} {"train_loss": -39.3188591003418, "global_step": 274248, "epoch": 2266} {"train_loss": -41.15688705444336, "global_step": 274249, "epoch": 2266} {"train_loss": -39.538509368896484, "global_step": 274250, "epoch": 2266} {"train_loss": -37.820159912109375, "global_step": 274251, "epoch": 2266} {"train_loss": -38.6871452331543, "global_step": 274252, "epoch": 2266} {"train_loss": -35.17776107788086, "global_step": 274253, "epoch": 2266} {"train_loss": -41.654937744140625, "global_step": 274254, "epoch": 2266} {"train_loss": -39.736114501953125, "global_step": 274255, "epoch": 2266} {"train_loss": -39.150238037109375, "global_step": 274256, "epoch": 2266} {"train_loss": -39.520259857177734, "global_step": 274257, "epoch": 2266} {"train_loss": -41.61548614501953, "global_step": 274258, "epoch": 2266} {"train_loss": -37.151607513427734, "global_step": 274259, "epoch": 2266} {"train_loss": -39.50877380371094, "global_step": 274260, "epoch": 2266} {"train_loss": -40.35298156738281, "global_step": 274261, "epoch": 2266} {"train_loss": -40.392486572265625, "global_step": 274262, "epoch": 2266} {"train_loss": -39.306392669677734, "global_step": 274263, "epoch": 2266} {"train_loss": -41.05888748168945, "global_step": 274264, "epoch": 2266} {"train_loss": -42.20266342163086, "global_step": 274265, "epoch": 2266} {"train_loss": -40.838279724121094, "global_step": 274266, "epoch": 2266} {"train_loss": -39.98870849609375, "global_step": 274267, "epoch": 2266} {"train_loss": -41.39348220825195, "global_step": 274268, "epoch": 2266} {"train_loss": -40.19628143310547, "global_step": 274269, "epoch": 2266} {"train_loss": -41.28207778930664, "global_step": 274270, "epoch": 2266} {"train_loss": -41.309295654296875, "global_step": 274271, "epoch": 2266} {"train_loss": -41.774810791015625, "global_step": 274272, "epoch": 2266} {"train_loss": -41.3498649597168, "global_step": 274273, "epoch": 2266} {"train_loss": -41.41289520263672, "global_step": 274274, "epoch": 2266} {"train_loss": -41.91400146484375, "global_step": 274275, "epoch": 2266} {"train_loss": -41.969276428222656, "global_step": 274276, "epoch": 2266} {"train_loss": -42.2441291809082, "global_step": 274277, "epoch": 2266} {"train_loss": -41.587886810302734, "global_step": 274278, "epoch": 2266} {"train_loss": -41.53471755981445, "global_step": 274279, "epoch": 2266} {"train_loss": -42.49784469604492, "global_step": 274280, "epoch": 2266} {"train_loss": -41.68357467651367, "global_step": 274281, "epoch": 2266} {"train_loss": -41.098121643066406, "global_step": 274282, "epoch": 2266} {"train_loss": -41.65361404418945, "global_step": 274283, "epoch": 2266} {"train_loss": -42.04806137084961, "global_step": 274284, "epoch": 2266} {"train_loss": -42.26020431518555, "global_step": 274285, "epoch": 2266} {"train_loss": -42.14091110229492, "global_step": 274286, "epoch": 2266} {"train_loss": -42.0852165222168, "global_step": 274287, "epoch": 2266} {"train_loss": -42.50210189819336, "global_step": 274288, "epoch": 2266} {"train_loss": -42.50389862060547, "global_step": 274289, "epoch": 2266} {"train_loss": -42.533390045166016, "global_step": 274290, "epoch": 2266} {"train_loss": -41.6046142578125, "global_step": 274291, "epoch": 2266} {"train_loss": -42.64240264892578, "global_step": 274292, "epoch": 2266} {"train_loss": -42.69354248046875, "global_step": 274293, "epoch": 2266} {"train_loss": -42.7814826965332, "global_step": 274294, "epoch": 2266} {"train_loss": -43.05593490600586, "global_step": 274295, "epoch": 2266} {"train_loss": -42.9495964050293, "global_step": 274296, "epoch": 2266} {"train_loss": -42.991817474365234, "global_step": 274297, "epoch": 2266} {"train_loss": -43.08673858642578, "global_step": 274298, "epoch": 2266} {"train_loss": -43.1120491027832, "global_step": 274299, "epoch": 2266} {"train_loss": -42.91714096069336, "global_step": 274300, "epoch": 2266} {"train_loss": -42.69731903076172, "global_step": 274301, "epoch": 2266} {"train_loss": -42.32528305053711, "global_step": 274302, "epoch": 2266} {"train_loss": -42.94701385498047, "global_step": 274303, "epoch": 2266} {"train_loss": -42.56631088256836, "global_step": 274304, "epoch": 2266} {"train_loss": -42.95186233520508, "global_step": 274305, "epoch": 2266} {"train_loss": -41.658786017047476, "global_step": 274306, "epoch": 2266, "val_loss": 2709346.25} {"train_loss": -43.16913986206055, "global_step": 274307, "epoch": 2267} {"train_loss": -42.2235221862793, "global_step": 274308, "epoch": 2267} {"train_loss": -42.0803108215332, "global_step": 274309, "epoch": 2267} {"train_loss": -42.69070053100586, "global_step": 274310, "epoch": 2267} {"train_loss": -42.74198532104492, "global_step": 274311, "epoch": 2267} {"train_loss": -42.17958068847656, "global_step": 274312, "epoch": 2267} {"train_loss": -43.08706283569336, "global_step": 274313, "epoch": 2267} {"train_loss": -42.81413650512695, "global_step": 274314, "epoch": 2267} {"train_loss": -43.54545211791992, "global_step": 274315, "epoch": 2267} {"train_loss": -43.609371185302734, "global_step": 274316, "epoch": 2267} {"train_loss": -43.2195930480957, "global_step": 274317, "epoch": 2267} {"train_loss": -42.87295150756836, "global_step": 274318, "epoch": 2267} {"train_loss": -43.35114288330078, "global_step": 274319, "epoch": 2267} {"train_loss": -43.7144775390625, "global_step": 274320, "epoch": 2267} {"train_loss": -42.699764251708984, "global_step": 274321, "epoch": 2267} {"train_loss": -43.007057189941406, "global_step": 274322, "epoch": 2267} {"train_loss": -42.91891860961914, "global_step": 274323, "epoch": 2267} {"train_loss": -42.68038558959961, "global_step": 274324, "epoch": 2267} {"train_loss": -42.08409118652344, "global_step": 274325, "epoch": 2267} {"train_loss": -43.00441360473633, "global_step": 274326, "epoch": 2267} {"train_loss": -40.90931701660156, "global_step": 274327, "epoch": 2267} {"train_loss": -40.22385787963867, "global_step": 274328, "epoch": 2267} {"train_loss": -39.60870361328125, "global_step": 274329, "epoch": 2267} {"train_loss": -41.63494873046875, "global_step": 274330, "epoch": 2267} {"train_loss": -42.61794662475586, "global_step": 274331, "epoch": 2267} {"train_loss": -42.780433654785156, "global_step": 274332, "epoch": 2267} {"train_loss": -43.135494232177734, "global_step": 274333, "epoch": 2267} {"train_loss": -42.604610443115234, "global_step": 274334, "epoch": 2267} {"train_loss": -43.341976165771484, "global_step": 274335, "epoch": 2267} {"train_loss": -41.773807525634766, "global_step": 274336, "epoch": 2267} {"train_loss": -43.12000274658203, "global_step": 274337, "epoch": 2267} {"train_loss": -42.69365692138672, "global_step": 274338, "epoch": 2267} {"train_loss": -43.008697509765625, "global_step": 274339, "epoch": 2267} {"train_loss": -43.501853942871094, "global_step": 274340, "epoch": 2267} {"train_loss": -42.71021270751953, "global_step": 274341, "epoch": 2267} {"train_loss": -42.54412841796875, "global_step": 274342, "epoch": 2267} {"train_loss": -42.60671615600586, "global_step": 274343, "epoch": 2267} {"train_loss": -43.48482894897461, "global_step": 274344, "epoch": 2267} {"train_loss": -43.17290115356445, "global_step": 274345, "epoch": 2267} {"train_loss": -43.3831672668457, "global_step": 274346, "epoch": 2267} {"train_loss": -41.37921905517578, "global_step": 274347, "epoch": 2267} {"train_loss": -43.16699981689453, "global_step": 274348, "epoch": 2267} {"train_loss": -41.48969268798828, "global_step": 274349, "epoch": 2267} {"train_loss": -40.37336349487305, "global_step": 274350, "epoch": 2267} {"train_loss": -42.32951736450195, "global_step": 274351, "epoch": 2267} {"train_loss": -42.13911819458008, "global_step": 274352, "epoch": 2267} {"train_loss": -41.9521598815918, "global_step": 274353, "epoch": 2267} {"train_loss": -42.1485710144043, "global_step": 274354, "epoch": 2267} {"train_loss": -41.972991943359375, "global_step": 274355, "epoch": 2267} {"train_loss": -43.24819564819336, "global_step": 274356, "epoch": 2267} {"train_loss": -42.14240264892578, "global_step": 274357, "epoch": 2267} {"train_loss": -42.674346923828125, "global_step": 274358, "epoch": 2267} {"train_loss": -43.029754638671875, "global_step": 274359, "epoch": 2267} {"train_loss": -42.9662971496582, "global_step": 274360, "epoch": 2267} {"train_loss": -41.953460693359375, "global_step": 274361, "epoch": 2267} {"train_loss": -42.82120895385742, "global_step": 274362, "epoch": 2267} {"train_loss": -42.47710037231445, "global_step": 274363, "epoch": 2267} {"train_loss": -42.108943939208984, "global_step": 274364, "epoch": 2267} {"train_loss": -42.891441345214844, "global_step": 274365, "epoch": 2267} {"train_loss": -42.60795974731445, "global_step": 274366, "epoch": 2267} {"train_loss": -43.50173568725586, "global_step": 274367, "epoch": 2267} {"train_loss": -41.89910888671875, "global_step": 274368, "epoch": 2267} {"train_loss": -43.068031311035156, "global_step": 274369, "epoch": 2267} {"train_loss": -43.233314514160156, "global_step": 274370, "epoch": 2267} {"train_loss": -43.403804779052734, "global_step": 274371, "epoch": 2267} {"train_loss": -42.507476806640625, "global_step": 274372, "epoch": 2267} {"train_loss": -43.864158630371094, "global_step": 274373, "epoch": 2267} {"train_loss": -43.58673858642578, "global_step": 274374, "epoch": 2267} {"train_loss": -43.161224365234375, "global_step": 274375, "epoch": 2267} {"train_loss": -43.374977111816406, "global_step": 274376, "epoch": 2267} {"train_loss": -42.922786712646484, "global_step": 274377, "epoch": 2267} {"train_loss": -43.23149490356445, "global_step": 274378, "epoch": 2267} {"train_loss": -43.766273498535156, "global_step": 274379, "epoch": 2267} {"train_loss": -43.212711334228516, "global_step": 274380, "epoch": 2267} {"train_loss": -43.012481689453125, "global_step": 274381, "epoch": 2267} {"train_loss": -43.70835494995117, "global_step": 274382, "epoch": 2267} {"train_loss": -42.949134826660156, "global_step": 274383, "epoch": 2267} {"train_loss": -43.6586799621582, "global_step": 274384, "epoch": 2267} {"train_loss": -43.18156051635742, "global_step": 274385, "epoch": 2267} {"train_loss": -43.3281364440918, "global_step": 274386, "epoch": 2267} {"train_loss": -43.459259033203125, "global_step": 274387, "epoch": 2267} {"train_loss": -43.84074401855469, "global_step": 274388, "epoch": 2267} {"train_loss": -43.09159851074219, "global_step": 274389, "epoch": 2267} {"train_loss": -41.52488327026367, "global_step": 274390, "epoch": 2267} {"train_loss": -40.84713363647461, "global_step": 274391, "epoch": 2267} {"train_loss": -40.290077209472656, "global_step": 274392, "epoch": 2267} {"train_loss": -40.76493453979492, "global_step": 274393, "epoch": 2267} {"train_loss": -42.03429412841797, "global_step": 274394, "epoch": 2267} {"train_loss": -42.972755432128906, "global_step": 274395, "epoch": 2267} {"train_loss": -41.55047607421875, "global_step": 274396, "epoch": 2267} {"train_loss": -40.717403411865234, "global_step": 274397, "epoch": 2267} {"train_loss": -40.5776481628418, "global_step": 274398, "epoch": 2267} {"train_loss": -42.88603973388672, "global_step": 274399, "epoch": 2267} {"train_loss": -43.2824821472168, "global_step": 274400, "epoch": 2267} {"train_loss": -42.27213668823242, "global_step": 274401, "epoch": 2267} {"train_loss": -42.77781677246094, "global_step": 274402, "epoch": 2267} {"train_loss": -42.588096618652344, "global_step": 274403, "epoch": 2267} {"train_loss": -41.766902923583984, "global_step": 274404, "epoch": 2267} {"train_loss": -43.08346176147461, "global_step": 274405, "epoch": 2267} {"train_loss": -42.34483337402344, "global_step": 274406, "epoch": 2267} {"train_loss": -41.910614013671875, "global_step": 274407, "epoch": 2267} {"train_loss": -43.43687057495117, "global_step": 274408, "epoch": 2267} {"train_loss": -42.03315353393555, "global_step": 274409, "epoch": 2267} {"train_loss": -42.39755630493164, "global_step": 274410, "epoch": 2267} {"train_loss": -42.11962127685547, "global_step": 274411, "epoch": 2267} {"train_loss": -41.84759521484375, "global_step": 274412, "epoch": 2267} {"train_loss": -42.95148849487305, "global_step": 274413, "epoch": 2267} {"train_loss": -42.09320068359375, "global_step": 274414, "epoch": 2267} {"train_loss": -41.821311950683594, "global_step": 274415, "epoch": 2267} {"train_loss": -42.4096565246582, "global_step": 274416, "epoch": 2267} {"train_loss": -42.596832275390625, "global_step": 274417, "epoch": 2267} {"train_loss": -42.49044418334961, "global_step": 274418, "epoch": 2267} {"train_loss": -42.70468521118164, "global_step": 274419, "epoch": 2267} {"train_loss": -42.60127639770508, "global_step": 274420, "epoch": 2267} {"train_loss": -42.81618118286133, "global_step": 274421, "epoch": 2267} {"train_loss": -42.371273040771484, "global_step": 274422, "epoch": 2267} {"train_loss": -43.242855072021484, "global_step": 274423, "epoch": 2267} {"train_loss": -43.17985916137695, "global_step": 274424, "epoch": 2267} {"train_loss": -42.77751541137695, "global_step": 274425, "epoch": 2267} {"train_loss": -43.0633659362793, "global_step": 274426, "epoch": 2267} {"train_loss": -42.58846651818141, "global_step": 274427, "epoch": 2267, "val_loss": 2673606.5} {"train_loss": -43.24060821533203, "global_step": 274428, "epoch": 2268} {"train_loss": -42.5257568359375, "global_step": 274429, "epoch": 2268} {"train_loss": -43.32149124145508, "global_step": 274430, "epoch": 2268} {"train_loss": -43.20362854003906, "global_step": 274431, "epoch": 2268} {"train_loss": -43.56959915161133, "global_step": 274432, "epoch": 2268} {"train_loss": -43.44451904296875, "global_step": 274433, "epoch": 2268} {"train_loss": -43.282318115234375, "global_step": 274434, "epoch": 2268} {"train_loss": -41.49082565307617, "global_step": 274435, "epoch": 2268} {"train_loss": -42.559059143066406, "global_step": 274436, "epoch": 2268} {"train_loss": -42.978485107421875, "global_step": 274437, "epoch": 2268} {"train_loss": -42.52251052856445, "global_step": 274438, "epoch": 2268} {"train_loss": -43.362342834472656, "global_step": 274439, "epoch": 2268} {"train_loss": -43.4029426574707, "global_step": 274440, "epoch": 2268} {"train_loss": -42.315120697021484, "global_step": 274441, "epoch": 2268} {"train_loss": -41.38735580444336, "global_step": 274442, "epoch": 2268} {"train_loss": -43.17974853515625, "global_step": 274443, "epoch": 2268} {"train_loss": -43.03776168823242, "global_step": 274444, "epoch": 2268} {"train_loss": -42.63957977294922, "global_step": 274445, "epoch": 2268} {"train_loss": -43.7371940612793, "global_step": 274446, "epoch": 2268} {"train_loss": -43.53818893432617, "global_step": 274447, "epoch": 2268} {"train_loss": -42.96833419799805, "global_step": 274448, "epoch": 2268} {"train_loss": -42.83945846557617, "global_step": 274449, "epoch": 2268} {"train_loss": -41.70878219604492, "global_step": 274450, "epoch": 2268} {"train_loss": -42.90420150756836, "global_step": 274451, "epoch": 2268} {"train_loss": -42.86636734008789, "global_step": 274452, "epoch": 2268} {"train_loss": -42.38482666015625, "global_step": 274453, "epoch": 2268} {"train_loss": -41.83859634399414, "global_step": 274454, "epoch": 2268} {"train_loss": -41.27448654174805, "global_step": 274455, "epoch": 2268} {"train_loss": -42.921199798583984, "global_step": 274456, "epoch": 2268} {"train_loss": -43.333229064941406, "global_step": 274457, "epoch": 2268} {"train_loss": -42.58986282348633, "global_step": 274458, "epoch": 2268} {"train_loss": -42.41046142578125, "global_step": 274459, "epoch": 2268} {"train_loss": -42.757938385009766, "global_step": 274460, "epoch": 2268} {"train_loss": -43.741573333740234, "global_step": 274461, "epoch": 2268} {"train_loss": -43.11909103393555, "global_step": 274462, "epoch": 2268} {"train_loss": -42.28426742553711, "global_step": 274463, "epoch": 2268} {"train_loss": -43.33234405517578, "global_step": 274464, "epoch": 2268} {"train_loss": -42.49727249145508, "global_step": 274465, "epoch": 2268} {"train_loss": -42.07863998413086, "global_step": 274466, "epoch": 2268} {"train_loss": -43.6702880859375, "global_step": 274467, "epoch": 2268} {"train_loss": -42.496192932128906, "global_step": 274468, "epoch": 2268} {"train_loss": -42.36219787597656, "global_step": 274469, "epoch": 2268} {"train_loss": -42.857303619384766, "global_step": 274470, "epoch": 2268} {"train_loss": -43.6769905090332, "global_step": 274471, "epoch": 2268} {"train_loss": -42.60111618041992, "global_step": 274472, "epoch": 2268} {"train_loss": -43.42494201660156, "global_step": 274473, "epoch": 2268} {"train_loss": -42.81763458251953, "global_step": 274474, "epoch": 2268} {"train_loss": -41.2878532409668, "global_step": 274475, "epoch": 2268} {"train_loss": -42.177425384521484, "global_step": 274476, "epoch": 2268} {"train_loss": -42.72138977050781, "global_step": 274477, "epoch": 2268} {"train_loss": -41.31298828125, "global_step": 274478, "epoch": 2268} {"train_loss": -42.960243225097656, "global_step": 274479, "epoch": 2268} {"train_loss": -41.76432418823242, "global_step": 274480, "epoch": 2268} {"train_loss": -38.829437255859375, "global_step": 274481, "epoch": 2268} {"train_loss": -36.18940353393555, "global_step": 274482, "epoch": 2268} {"train_loss": -40.264076232910156, "global_step": 274483, "epoch": 2268} {"train_loss": -41.49079513549805, "global_step": 274484, "epoch": 2268} {"train_loss": -40.231056213378906, "global_step": 274485, "epoch": 2268} {"train_loss": -41.276790618896484, "global_step": 274486, "epoch": 2268} {"train_loss": -40.028682708740234, "global_step": 274487, "epoch": 2268} {"train_loss": -38.29618453979492, "global_step": 274488, "epoch": 2268} {"train_loss": -41.87339401245117, "global_step": 274489, "epoch": 2268} {"train_loss": -42.0721549987793, "global_step": 274490, "epoch": 2268} {"train_loss": -40.70173263549805, "global_step": 274491, "epoch": 2268} {"train_loss": -42.07771682739258, "global_step": 274492, "epoch": 2268} {"train_loss": -40.13276290893555, "global_step": 274493, "epoch": 2268} {"train_loss": -42.531253814697266, "global_step": 274494, "epoch": 2268} {"train_loss": -40.330230712890625, "global_step": 274495, "epoch": 2268} {"train_loss": -41.36265563964844, "global_step": 274496, "epoch": 2268} {"train_loss": -41.201904296875, "global_step": 274497, "epoch": 2268} {"train_loss": -41.06827926635742, "global_step": 274498, "epoch": 2268} {"train_loss": -42.2511100769043, "global_step": 274499, "epoch": 2268} {"train_loss": -40.87251663208008, "global_step": 274500, "epoch": 2268} {"train_loss": -41.89520263671875, "global_step": 274501, "epoch": 2268} {"train_loss": -41.00638198852539, "global_step": 274502, "epoch": 2268} {"train_loss": -41.35493087768555, "global_step": 274503, "epoch": 2268} {"train_loss": -41.59754180908203, "global_step": 274504, "epoch": 2268} {"train_loss": -42.192073822021484, "global_step": 274505, "epoch": 2268} {"train_loss": -41.55046463012695, "global_step": 274506, "epoch": 2268} {"train_loss": -42.47333526611328, "global_step": 274507, "epoch": 2268} {"train_loss": -42.731178283691406, "global_step": 274508, "epoch": 2268} {"train_loss": -41.6566162109375, "global_step": 274509, "epoch": 2268} {"train_loss": -42.34199905395508, "global_step": 274510, "epoch": 2268} {"train_loss": -41.954002380371094, "global_step": 274511, "epoch": 2268} {"train_loss": -42.62299728393555, "global_step": 274512, "epoch": 2268} {"train_loss": -42.41387176513672, "global_step": 274513, "epoch": 2268} {"train_loss": -41.83219528198242, "global_step": 274514, "epoch": 2268} {"train_loss": -42.94559860229492, "global_step": 274515, "epoch": 2268} {"train_loss": -42.6390495300293, "global_step": 274516, "epoch": 2268} {"train_loss": -43.22031784057617, "global_step": 274517, "epoch": 2268} {"train_loss": -42.809913635253906, "global_step": 274518, "epoch": 2268} {"train_loss": -42.82399368286133, "global_step": 274519, "epoch": 2268} {"train_loss": -42.26496505737305, "global_step": 274520, "epoch": 2268} {"train_loss": -43.370338439941406, "global_step": 274521, "epoch": 2268} {"train_loss": -42.54301452636719, "global_step": 274522, "epoch": 2268} {"train_loss": -42.902530670166016, "global_step": 274523, "epoch": 2268} {"train_loss": -42.56562042236328, "global_step": 274524, "epoch": 2268} {"train_loss": -42.374855041503906, "global_step": 274525, "epoch": 2268} {"train_loss": -42.54660415649414, "global_step": 274526, "epoch": 2268} {"train_loss": -42.572425842285156, "global_step": 274527, "epoch": 2268} {"train_loss": -42.95840072631836, "global_step": 274528, "epoch": 2268} {"train_loss": -42.80123519897461, "global_step": 274529, "epoch": 2268} {"train_loss": -41.741729736328125, "global_step": 274530, "epoch": 2268} {"train_loss": -43.26657485961914, "global_step": 274531, "epoch": 2268} {"train_loss": -42.44588851928711, "global_step": 274532, "epoch": 2268} {"train_loss": -42.78656768798828, "global_step": 274533, "epoch": 2268} {"train_loss": -43.03358459472656, "global_step": 274534, "epoch": 2268} {"train_loss": -42.72257614135742, "global_step": 274535, "epoch": 2268} {"train_loss": -43.02932357788086, "global_step": 274536, "epoch": 2268} {"train_loss": -43.011077880859375, "global_step": 274537, "epoch": 2268} {"train_loss": -43.41630172729492, "global_step": 274538, "epoch": 2268} {"train_loss": -43.413516998291016, "global_step": 274539, "epoch": 2268} {"train_loss": -42.82194900512695, "global_step": 274540, "epoch": 2268} {"train_loss": -42.862953186035156, "global_step": 274541, "epoch": 2268} {"train_loss": -43.5711555480957, "global_step": 274542, "epoch": 2268} {"train_loss": -43.56666946411133, "global_step": 274543, "epoch": 2268} {"train_loss": -43.400474548339844, "global_step": 274544, "epoch": 2268} {"train_loss": -43.183040618896484, "global_step": 274545, "epoch": 2268} {"train_loss": -43.56021499633789, "global_step": 274546, "epoch": 2268} {"train_loss": -43.31365966796875, "global_step": 274547, "epoch": 2268} {"train_loss": -42.35558605982252, "global_step": 274548, "epoch": 2268, "val_loss": 2671681.25} {"train_loss": -43.85616683959961, "global_step": 274549, "epoch": 2269} {"train_loss": -42.95235824584961, "global_step": 274550, "epoch": 2269} {"train_loss": -42.62884521484375, "global_step": 274551, "epoch": 2269} {"train_loss": -43.27827072143555, "global_step": 274552, "epoch": 2269} {"train_loss": -43.48723220825195, "global_step": 274553, "epoch": 2269} {"train_loss": -42.489479064941406, "global_step": 274554, "epoch": 2269} {"train_loss": -42.42273712158203, "global_step": 274555, "epoch": 2269} {"train_loss": -43.053131103515625, "global_step": 274556, "epoch": 2269} {"train_loss": -43.8674201965332, "global_step": 274557, "epoch": 2269} {"train_loss": -42.737945556640625, "global_step": 274558, "epoch": 2269} {"train_loss": -42.84961700439453, "global_step": 274559, "epoch": 2269} {"train_loss": -43.13186264038086, "global_step": 274560, "epoch": 2269} {"train_loss": -43.89016342163086, "global_step": 274561, "epoch": 2269} {"train_loss": -43.451934814453125, "global_step": 274562, "epoch": 2269} {"train_loss": -42.91027069091797, "global_step": 274563, "epoch": 2269} {"train_loss": -43.614776611328125, "global_step": 274564, "epoch": 2269} {"train_loss": -43.686195373535156, "global_step": 274565, "epoch": 2269} {"train_loss": -43.11741256713867, "global_step": 274566, "epoch": 2269} {"train_loss": -43.14768600463867, "global_step": 274567, "epoch": 2269} {"train_loss": -44.14425277709961, "global_step": 274568, "epoch": 2269} {"train_loss": -43.41653060913086, "global_step": 274569, "epoch": 2269} {"train_loss": -43.97083282470703, "global_step": 274570, "epoch": 2269} {"train_loss": -42.96931838989258, "global_step": 274571, "epoch": 2269} {"train_loss": -43.522953033447266, "global_step": 274572, "epoch": 2269} {"train_loss": -43.632171630859375, "global_step": 274573, "epoch": 2269} {"train_loss": -43.90177917480469, "global_step": 274574, "epoch": 2269} {"train_loss": -43.555110931396484, "global_step": 274575, "epoch": 2269} {"train_loss": -42.55271530151367, "global_step": 274576, "epoch": 2269} {"train_loss": -43.3840446472168, "global_step": 274577, "epoch": 2269} {"train_loss": -43.07835388183594, "global_step": 274578, "epoch": 2269} {"train_loss": -43.820858001708984, "global_step": 274579, "epoch": 2269} {"train_loss": -42.334083557128906, "global_step": 274580, "epoch": 2269} {"train_loss": -43.29655838012695, "global_step": 274581, "epoch": 2269} {"train_loss": -42.300907135009766, "global_step": 274582, "epoch": 2269} {"train_loss": -41.20072555541992, "global_step": 274583, "epoch": 2269} {"train_loss": -41.64615249633789, "global_step": 274584, "epoch": 2269} {"train_loss": -41.239749908447266, "global_step": 274585, "epoch": 2269} {"train_loss": -41.890350341796875, "global_step": 274586, "epoch": 2269} {"train_loss": -42.948909759521484, "global_step": 274587, "epoch": 2269} {"train_loss": -41.72886276245117, "global_step": 274588, "epoch": 2269} {"train_loss": -43.08193588256836, "global_step": 274589, "epoch": 2269} {"train_loss": -42.29566192626953, "global_step": 274590, "epoch": 2269} {"train_loss": -42.74729919433594, "global_step": 274591, "epoch": 2269} {"train_loss": -43.42669677734375, "global_step": 274592, "epoch": 2269} {"train_loss": -42.57296371459961, "global_step": 274593, "epoch": 2269} {"train_loss": -41.43563461303711, "global_step": 274594, "epoch": 2269} {"train_loss": -42.682037353515625, "global_step": 274595, "epoch": 2269} {"train_loss": -41.316402435302734, "global_step": 274596, "epoch": 2269} {"train_loss": -43.08964157104492, "global_step": 274597, "epoch": 2269} {"train_loss": -41.68690872192383, "global_step": 274598, "epoch": 2269} {"train_loss": -41.68308639526367, "global_step": 274599, "epoch": 2269} {"train_loss": -42.601253509521484, "global_step": 274600, "epoch": 2269} {"train_loss": -43.15180206298828, "global_step": 274601, "epoch": 2269} {"train_loss": -41.40171432495117, "global_step": 274602, "epoch": 2269} {"train_loss": -42.877437591552734, "global_step": 274603, "epoch": 2269} {"train_loss": -42.615299224853516, "global_step": 274604, "epoch": 2269} {"train_loss": -42.59984588623047, "global_step": 274605, "epoch": 2269} {"train_loss": -42.95709228515625, "global_step": 274606, "epoch": 2269} {"train_loss": -42.492156982421875, "global_step": 274607, "epoch": 2269} {"train_loss": -40.199737548828125, "global_step": 274608, "epoch": 2269} {"train_loss": -42.40316390991211, "global_step": 274609, "epoch": 2269} {"train_loss": -42.84754180908203, "global_step": 274610, "epoch": 2269} {"train_loss": -42.94291687011719, "global_step": 274611, "epoch": 2269} {"train_loss": -42.34812545776367, "global_step": 274612, "epoch": 2269} {"train_loss": -43.143768310546875, "global_step": 274613, "epoch": 2269} {"train_loss": -42.7360954284668, "global_step": 274614, "epoch": 2269} {"train_loss": -42.91238021850586, "global_step": 274615, "epoch": 2269} {"train_loss": -43.37537384033203, "global_step": 274616, "epoch": 2269} {"train_loss": -42.913509368896484, "global_step": 274617, "epoch": 2269} {"train_loss": -42.647926330566406, "global_step": 274618, "epoch": 2269} {"train_loss": -42.321659088134766, "global_step": 274619, "epoch": 2269} {"train_loss": -41.732425689697266, "global_step": 274620, "epoch": 2269} {"train_loss": -42.61020278930664, "global_step": 274621, "epoch": 2269} {"train_loss": -42.365447998046875, "global_step": 274622, "epoch": 2269} {"train_loss": -42.96512985229492, "global_step": 274623, "epoch": 2269} {"train_loss": -43.36234664916992, "global_step": 274624, "epoch": 2269} {"train_loss": -42.66493606567383, "global_step": 274625, "epoch": 2269} {"train_loss": -42.704219818115234, "global_step": 274626, "epoch": 2269} {"train_loss": -42.71279525756836, "global_step": 274627, "epoch": 2269} {"train_loss": -42.70082473754883, "global_step": 274628, "epoch": 2269} {"train_loss": -43.65126037597656, "global_step": 274629, "epoch": 2269} {"train_loss": -43.13096618652344, "global_step": 274630, "epoch": 2269} {"train_loss": -43.30040740966797, "global_step": 274631, "epoch": 2269} {"train_loss": -43.200077056884766, "global_step": 274632, "epoch": 2269} {"train_loss": -43.204219818115234, "global_step": 274633, "epoch": 2269} {"train_loss": -43.13083267211914, "global_step": 274634, "epoch": 2269} {"train_loss": -43.26121139526367, "global_step": 274635, "epoch": 2269} {"train_loss": -43.42783737182617, "global_step": 274636, "epoch": 2269} {"train_loss": -43.33932113647461, "global_step": 274637, "epoch": 2269} {"train_loss": -43.25631332397461, "global_step": 274638, "epoch": 2269} {"train_loss": -43.704044342041016, "global_step": 274639, "epoch": 2269} {"train_loss": -43.921504974365234, "global_step": 274640, "epoch": 2269} {"train_loss": -43.00382614135742, "global_step": 274641, "epoch": 2269} {"train_loss": -44.20563888549805, "global_step": 274642, "epoch": 2269} {"train_loss": -43.95664596557617, "global_step": 274643, "epoch": 2269} {"train_loss": -43.39118576049805, "global_step": 274644, "epoch": 2269} {"train_loss": -43.87488555908203, "global_step": 274645, "epoch": 2269} {"train_loss": -43.41643524169922, "global_step": 274646, "epoch": 2269} {"train_loss": -43.99923324584961, "global_step": 274647, "epoch": 2269} {"train_loss": -43.16157150268555, "global_step": 274648, "epoch": 2269} {"train_loss": -43.26872634887695, "global_step": 274649, "epoch": 2269} {"train_loss": -43.77549743652344, "global_step": 274650, "epoch": 2269} {"train_loss": -43.59125900268555, "global_step": 274651, "epoch": 2269} {"train_loss": -43.37095260620117, "global_step": 274652, "epoch": 2269} {"train_loss": -42.72311019897461, "global_step": 274653, "epoch": 2269} {"train_loss": -42.9915771484375, "global_step": 274654, "epoch": 2269} {"train_loss": -43.6959228515625, "global_step": 274655, "epoch": 2269} {"train_loss": -42.92143630981445, "global_step": 274656, "epoch": 2269} {"train_loss": -43.050106048583984, "global_step": 274657, "epoch": 2269} {"train_loss": -42.727134704589844, "global_step": 274658, "epoch": 2269} {"train_loss": -43.83161163330078, "global_step": 274659, "epoch": 2269} {"train_loss": -43.86550521850586, "global_step": 274660, "epoch": 2269} {"train_loss": -43.82439422607422, "global_step": 274661, "epoch": 2269} {"train_loss": -42.87053298950195, "global_step": 274662, "epoch": 2269} {"train_loss": -43.03803634643555, "global_step": 274663, "epoch": 2269} {"train_loss": -43.67727279663086, "global_step": 274664, "epoch": 2269} {"train_loss": -43.66899490356445, "global_step": 274665, "epoch": 2269} {"train_loss": -42.63116455078125, "global_step": 274666, "epoch": 2269} {"train_loss": -42.30350875854492, "global_step": 274667, "epoch": 2269} {"train_loss": -42.71256637573242, "global_step": 274668, "epoch": 2269} {"train_loss": -42.95450081312952, "global_step": 274669, "epoch": 2269, "val_loss": 2692415.25} {"train_loss": -39.88873291015625, "global_step": 274670, "epoch": 2270} {"train_loss": -42.46467208862305, "global_step": 274671, "epoch": 2270} {"train_loss": -43.047340393066406, "global_step": 274672, "epoch": 2270} {"train_loss": -40.80648422241211, "global_step": 274673, "epoch": 2270} {"train_loss": -40.91791915893555, "global_step": 274674, "epoch": 2270} {"train_loss": -41.13648223876953, "global_step": 274675, "epoch": 2270} {"train_loss": -40.94649887084961, "global_step": 274676, "epoch": 2270} {"train_loss": -42.11692810058594, "global_step": 274677, "epoch": 2270} {"train_loss": -42.048561096191406, "global_step": 274678, "epoch": 2270} {"train_loss": -39.59562301635742, "global_step": 274679, "epoch": 2270} {"train_loss": -35.521339416503906, "global_step": 274680, "epoch": 2270} {"train_loss": -39.578704833984375, "global_step": 274681, "epoch": 2270} {"train_loss": -41.54841232299805, "global_step": 274682, "epoch": 2270} {"train_loss": -35.85487747192383, "global_step": 274683, "epoch": 2270} {"train_loss": -35.258846282958984, "global_step": 274684, "epoch": 2270} {"train_loss": -41.057376861572266, "global_step": 274685, "epoch": 2270} {"train_loss": -39.678401947021484, "global_step": 274686, "epoch": 2270} {"train_loss": -38.29753494262695, "global_step": 274687, "epoch": 2270} {"train_loss": -42.401615142822266, "global_step": 274688, "epoch": 2270} {"train_loss": -39.80451202392578, "global_step": 274689, "epoch": 2270} {"train_loss": -41.85627365112305, "global_step": 274690, "epoch": 2270} {"train_loss": -39.88792037963867, "global_step": 274691, "epoch": 2270} {"train_loss": -42.659515380859375, "global_step": 274692, "epoch": 2270} {"train_loss": -38.89545822143555, "global_step": 274693, "epoch": 2270} {"train_loss": -41.94012451171875, "global_step": 274694, "epoch": 2270} {"train_loss": -41.469356536865234, "global_step": 274695, "epoch": 2270} {"train_loss": -40.716705322265625, "global_step": 274696, "epoch": 2270} {"train_loss": -42.22261428833008, "global_step": 274697, "epoch": 2270} {"train_loss": -41.289283752441406, "global_step": 274698, "epoch": 2270} {"train_loss": -42.63645553588867, "global_step": 274699, "epoch": 2270} {"train_loss": -41.37420654296875, "global_step": 274700, "epoch": 2270} {"train_loss": -42.98320388793945, "global_step": 274701, "epoch": 2270} {"train_loss": -41.09938430786133, "global_step": 274702, "epoch": 2270} {"train_loss": -43.10504150390625, "global_step": 274703, "epoch": 2270} {"train_loss": -41.838233947753906, "global_step": 274704, "epoch": 2270} {"train_loss": -42.77472686767578, "global_step": 274705, "epoch": 2270} {"train_loss": -41.4454345703125, "global_step": 274706, "epoch": 2270} {"train_loss": -42.598995208740234, "global_step": 274707, "epoch": 2270} {"train_loss": -41.8330078125, "global_step": 274708, "epoch": 2270} {"train_loss": -43.04610824584961, "global_step": 274709, "epoch": 2270} {"train_loss": -41.72732162475586, "global_step": 274710, "epoch": 2270} {"train_loss": -43.164573669433594, "global_step": 274711, "epoch": 2270} {"train_loss": -41.89284133911133, "global_step": 274712, "epoch": 2270} {"train_loss": -42.762332916259766, "global_step": 274713, "epoch": 2270} {"train_loss": -42.32164764404297, "global_step": 274714, "epoch": 2270} {"train_loss": -43.03570556640625, "global_step": 274715, "epoch": 2270} {"train_loss": -43.02417755126953, "global_step": 274716, "epoch": 2270} {"train_loss": -42.65734100341797, "global_step": 274717, "epoch": 2270} {"train_loss": -43.190303802490234, "global_step": 274718, "epoch": 2270} {"train_loss": -43.003883361816406, "global_step": 274719, "epoch": 2270} {"train_loss": -43.124107360839844, "global_step": 274720, "epoch": 2270} {"train_loss": -42.82596206665039, "global_step": 274721, "epoch": 2270} {"train_loss": -42.90085220336914, "global_step": 274722, "epoch": 2270} {"train_loss": -42.907066345214844, "global_step": 274723, "epoch": 2270} {"train_loss": -43.14544677734375, "global_step": 274724, "epoch": 2270} {"train_loss": -42.9020881652832, "global_step": 274725, "epoch": 2270} {"train_loss": -42.98480224609375, "global_step": 274726, "epoch": 2270} {"train_loss": -43.660335540771484, "global_step": 274727, "epoch": 2270} {"train_loss": -43.38454055786133, "global_step": 274728, "epoch": 2270} {"train_loss": -43.68307876586914, "global_step": 274729, "epoch": 2270} {"train_loss": -43.518798828125, "global_step": 274730, "epoch": 2270} {"train_loss": -43.551204681396484, "global_step": 274731, "epoch": 2270} {"train_loss": -43.46126174926758, "global_step": 274732, "epoch": 2270} {"train_loss": -43.29322052001953, "global_step": 274733, "epoch": 2270} {"train_loss": -44.02187728881836, "global_step": 274734, "epoch": 2270} {"train_loss": -43.7960205078125, "global_step": 274735, "epoch": 2270} {"train_loss": -43.48835372924805, "global_step": 274736, "epoch": 2270} {"train_loss": -43.89567947387695, "global_step": 274737, "epoch": 2270} {"train_loss": -43.530303955078125, "global_step": 274738, "epoch": 2270} {"train_loss": -44.409481048583984, "global_step": 274739, "epoch": 2270} {"train_loss": -43.62453079223633, "global_step": 274740, "epoch": 2270} {"train_loss": -43.960166931152344, "global_step": 274741, "epoch": 2270} {"train_loss": -44.4679069519043, "global_step": 274742, "epoch": 2270} {"train_loss": -43.92900466918945, "global_step": 274743, "epoch": 2270} {"train_loss": -44.05167007446289, "global_step": 274744, "epoch": 2270} {"train_loss": -44.057621002197266, "global_step": 274745, "epoch": 2270} {"train_loss": -44.17109298706055, "global_step": 274746, "epoch": 2270} {"train_loss": -43.67484664916992, "global_step": 274747, "epoch": 2270} {"train_loss": -44.42704772949219, "global_step": 274748, "epoch": 2270} {"train_loss": -44.379676818847656, "global_step": 274749, "epoch": 2270} {"train_loss": -43.16715621948242, "global_step": 274750, "epoch": 2270} {"train_loss": -44.377777099609375, "global_step": 274751, "epoch": 2270} {"train_loss": -43.92213821411133, "global_step": 274752, "epoch": 2270} {"train_loss": -43.20044708251953, "global_step": 274753, "epoch": 2270} {"train_loss": -44.340450286865234, "global_step": 274754, "epoch": 2270} {"train_loss": -43.189693450927734, "global_step": 274755, "epoch": 2270} {"train_loss": -43.35615158081055, "global_step": 274756, "epoch": 2270} {"train_loss": -44.2515983581543, "global_step": 274757, "epoch": 2270} {"train_loss": -44.44849395751953, "global_step": 274758, "epoch": 2270} {"train_loss": -42.7224235534668, "global_step": 274759, "epoch": 2270} {"train_loss": -43.396888732910156, "global_step": 274760, "epoch": 2270} {"train_loss": -44.24169921875, "global_step": 274761, "epoch": 2270} {"train_loss": -43.09627151489258, "global_step": 274762, "epoch": 2270} {"train_loss": -42.593360900878906, "global_step": 274763, "epoch": 2270} {"train_loss": -43.51189041137695, "global_step": 274764, "epoch": 2270} {"train_loss": -44.05344009399414, "global_step": 274765, "epoch": 2270} {"train_loss": -43.733924865722656, "global_step": 274766, "epoch": 2270} {"train_loss": -43.740516662597656, "global_step": 274767, "epoch": 2270} {"train_loss": -44.3991584777832, "global_step": 274768, "epoch": 2270} {"train_loss": -43.6845588684082, "global_step": 274769, "epoch": 2270} {"train_loss": -43.96719741821289, "global_step": 274770, "epoch": 2270} {"train_loss": -43.655391693115234, "global_step": 274771, "epoch": 2270} {"train_loss": -43.59246826171875, "global_step": 274772, "epoch": 2270} {"train_loss": -43.21271514892578, "global_step": 274773, "epoch": 2270} {"train_loss": -43.9050178527832, "global_step": 274774, "epoch": 2270} {"train_loss": -43.52006149291992, "global_step": 274775, "epoch": 2270} {"train_loss": -44.16939926147461, "global_step": 274776, "epoch": 2270} {"train_loss": -43.54059600830078, "global_step": 274777, "epoch": 2270} {"train_loss": -42.855403900146484, "global_step": 274778, "epoch": 2270} {"train_loss": -40.54790115356445, "global_step": 274779, "epoch": 2270} {"train_loss": -36.557254791259766, "global_step": 274780, "epoch": 2270} {"train_loss": -32.952850341796875, "global_step": 274781, "epoch": 2270} {"train_loss": -31.208454132080078, "global_step": 274782, "epoch": 2270} {"train_loss": -33.1029167175293, "global_step": 274783, "epoch": 2270} {"train_loss": -41.15907669067383, "global_step": 274784, "epoch": 2270} {"train_loss": -42.37954330444336, "global_step": 274785, "epoch": 2270} {"train_loss": -37.69814682006836, "global_step": 274786, "epoch": 2270} {"train_loss": -35.392173767089844, "global_step": 274787, "epoch": 2270} {"train_loss": -40.92525863647461, "global_step": 274788, "epoch": 2270} {"train_loss": -42.26517868041992, "global_step": 274789, "epoch": 2270} {"train_loss": -42.0986137705401, "global_step": 274790, "epoch": 2270, "val_loss": 2743390.0} {"train_loss": -40.94783401489258, "global_step": 274791, "epoch": 2271} {"train_loss": -41.887306213378906, "global_step": 274792, "epoch": 2271} {"train_loss": -41.28998565673828, "global_step": 274793, "epoch": 2271} {"train_loss": -42.29349899291992, "global_step": 274794, "epoch": 2271} {"train_loss": -42.47999572753906, "global_step": 274795, "epoch": 2271} {"train_loss": -42.014862060546875, "global_step": 274796, "epoch": 2271} {"train_loss": -42.89423751831055, "global_step": 274797, "epoch": 2271} {"train_loss": -41.83584976196289, "global_step": 274798, "epoch": 2271} {"train_loss": -42.77924728393555, "global_step": 274799, "epoch": 2271} {"train_loss": -43.03093338012695, "global_step": 274800, "epoch": 2271} {"train_loss": -42.606605529785156, "global_step": 274801, "epoch": 2271} {"train_loss": -42.95753479003906, "global_step": 274802, "epoch": 2271} {"train_loss": -42.86215591430664, "global_step": 274803, "epoch": 2271} {"train_loss": -43.08045196533203, "global_step": 274804, "epoch": 2271} {"train_loss": -43.421634674072266, "global_step": 274805, "epoch": 2271} {"train_loss": -43.2863883972168, "global_step": 274806, "epoch": 2271} {"train_loss": -43.03240966796875, "global_step": 274807, "epoch": 2271} {"train_loss": -43.341304779052734, "global_step": 274808, "epoch": 2271} {"train_loss": -42.23454284667969, "global_step": 274809, "epoch": 2271} {"train_loss": -43.29851150512695, "global_step": 274810, "epoch": 2271} {"train_loss": -42.21757125854492, "global_step": 274811, "epoch": 2271} {"train_loss": -43.11906051635742, "global_step": 274812, "epoch": 2271} {"train_loss": -42.243690490722656, "global_step": 274813, "epoch": 2271} {"train_loss": -43.28190231323242, "global_step": 274814, "epoch": 2271} {"train_loss": -41.563594818115234, "global_step": 274815, "epoch": 2271} {"train_loss": -43.784881591796875, "global_step": 274816, "epoch": 2271} {"train_loss": -42.356685638427734, "global_step": 274817, "epoch": 2271} {"train_loss": -43.337581634521484, "global_step": 274818, "epoch": 2271} {"train_loss": -43.055641174316406, "global_step": 274819, "epoch": 2271} {"train_loss": -43.54630661010742, "global_step": 274820, "epoch": 2271} {"train_loss": -43.06467056274414, "global_step": 274821, "epoch": 2271} {"train_loss": -43.35381317138672, "global_step": 274822, "epoch": 2271} {"train_loss": -42.72842788696289, "global_step": 274823, "epoch": 2271} {"train_loss": -43.54601287841797, "global_step": 274824, "epoch": 2271} {"train_loss": -43.1390266418457, "global_step": 274825, "epoch": 2271} {"train_loss": -43.75571060180664, "global_step": 274826, "epoch": 2271} {"train_loss": -43.37248611450195, "global_step": 274827, "epoch": 2271} {"train_loss": -43.45002365112305, "global_step": 274828, "epoch": 2271} {"train_loss": -43.21957015991211, "global_step": 274829, "epoch": 2271} {"train_loss": -43.482051849365234, "global_step": 274830, "epoch": 2271} {"train_loss": -43.48159408569336, "global_step": 274831, "epoch": 2271} {"train_loss": -43.895416259765625, "global_step": 274832, "epoch": 2271} {"train_loss": -43.737037658691406, "global_step": 274833, "epoch": 2271} {"train_loss": -43.82029724121094, "global_step": 274834, "epoch": 2271} {"train_loss": -43.261512756347656, "global_step": 274835, "epoch": 2271} {"train_loss": -43.3294677734375, "global_step": 274836, "epoch": 2271} {"train_loss": -43.43174362182617, "global_step": 274837, "epoch": 2271} {"train_loss": -43.59736251831055, "global_step": 274838, "epoch": 2271} {"train_loss": -43.32442855834961, "global_step": 274839, "epoch": 2271} {"train_loss": -43.38187789916992, "global_step": 274840, "epoch": 2271} {"train_loss": -44.07734298706055, "global_step": 274841, "epoch": 2271} {"train_loss": -44.2276611328125, "global_step": 274842, "epoch": 2271} {"train_loss": -44.569007873535156, "global_step": 274843, "epoch": 2271} {"train_loss": -43.93117141723633, "global_step": 274844, "epoch": 2271} {"train_loss": -43.1997184753418, "global_step": 274845, "epoch": 2271} {"train_loss": -44.33107376098633, "global_step": 274846, "epoch": 2271} {"train_loss": -43.7854118347168, "global_step": 274847, "epoch": 2271} {"train_loss": -43.942604064941406, "global_step": 274848, "epoch": 2271} {"train_loss": -43.36433029174805, "global_step": 274849, "epoch": 2271} {"train_loss": -43.797996520996094, "global_step": 274850, "epoch": 2271} {"train_loss": -43.3212776184082, "global_step": 274851, "epoch": 2271} {"train_loss": -43.92524719238281, "global_step": 274852, "epoch": 2271} {"train_loss": -44.19743347167969, "global_step": 274853, "epoch": 2271} {"train_loss": -43.74668502807617, "global_step": 274854, "epoch": 2271} {"train_loss": -43.75472640991211, "global_step": 274855, "epoch": 2271} {"train_loss": -44.55922317504883, "global_step": 274856, "epoch": 2271} {"train_loss": -43.67927932739258, "global_step": 274857, "epoch": 2271} {"train_loss": -44.1035270690918, "global_step": 274858, "epoch": 2271} {"train_loss": -44.241668701171875, "global_step": 274859, "epoch": 2271} {"train_loss": -43.799068450927734, "global_step": 274860, "epoch": 2271} {"train_loss": -43.09279251098633, "global_step": 274861, "epoch": 2271} {"train_loss": -43.39570236206055, "global_step": 274862, "epoch": 2271} {"train_loss": -43.649295806884766, "global_step": 274863, "epoch": 2271} {"train_loss": -43.85620880126953, "global_step": 274864, "epoch": 2271} {"train_loss": -44.421627044677734, "global_step": 274865, "epoch": 2271} {"train_loss": -44.058143615722656, "global_step": 274866, "epoch": 2271} {"train_loss": -43.941890716552734, "global_step": 274867, "epoch": 2271} {"train_loss": -42.502925872802734, "global_step": 274868, "epoch": 2271} {"train_loss": -42.95198440551758, "global_step": 274869, "epoch": 2271} {"train_loss": -42.324703216552734, "global_step": 274870, "epoch": 2271} {"train_loss": -42.24796676635742, "global_step": 274871, "epoch": 2271} {"train_loss": -41.15224838256836, "global_step": 274872, "epoch": 2271} {"train_loss": -42.71897506713867, "global_step": 274873, "epoch": 2271} {"train_loss": -42.40396499633789, "global_step": 274874, "epoch": 2271} {"train_loss": -42.631526947021484, "global_step": 274875, "epoch": 2271} {"train_loss": -43.323970794677734, "global_step": 274876, "epoch": 2271} {"train_loss": -43.26587677001953, "global_step": 274877, "epoch": 2271} {"train_loss": -42.04159927368164, "global_step": 274878, "epoch": 2271} {"train_loss": -41.9738883972168, "global_step": 274879, "epoch": 2271} {"train_loss": -42.279014587402344, "global_step": 274880, "epoch": 2271} {"train_loss": -42.93036651611328, "global_step": 274881, "epoch": 2271} {"train_loss": -42.48664855957031, "global_step": 274882, "epoch": 2271} {"train_loss": -41.739105224609375, "global_step": 274883, "epoch": 2271} {"train_loss": -40.38324737548828, "global_step": 274884, "epoch": 2271} {"train_loss": -39.48055648803711, "global_step": 274885, "epoch": 2271} {"train_loss": -41.58534622192383, "global_step": 274886, "epoch": 2271} {"train_loss": -42.854469299316406, "global_step": 274887, "epoch": 2271} {"train_loss": -40.10773849487305, "global_step": 274888, "epoch": 2271} {"train_loss": -41.92033767700195, "global_step": 274889, "epoch": 2271} {"train_loss": -41.881771087646484, "global_step": 274890, "epoch": 2271} {"train_loss": -38.827980041503906, "global_step": 274891, "epoch": 2271} {"train_loss": -39.80144119262695, "global_step": 274892, "epoch": 2271} {"train_loss": -43.33367919921875, "global_step": 274893, "epoch": 2271} {"train_loss": -40.14833068847656, "global_step": 274894, "epoch": 2271} {"train_loss": -40.434959411621094, "global_step": 274895, "epoch": 2271} {"train_loss": -43.258724212646484, "global_step": 274896, "epoch": 2271} {"train_loss": -41.965431213378906, "global_step": 274897, "epoch": 2271} {"train_loss": -42.74427795410156, "global_step": 274898, "epoch": 2271} {"train_loss": -42.2235221862793, "global_step": 274899, "epoch": 2271} {"train_loss": -42.31315231323242, "global_step": 274900, "epoch": 2271} {"train_loss": -43.317623138427734, "global_step": 274901, "epoch": 2271} {"train_loss": -42.8309440612793, "global_step": 274902, "epoch": 2271} {"train_loss": -43.05547332763672, "global_step": 274903, "epoch": 2271} {"train_loss": -42.93937301635742, "global_step": 274904, "epoch": 2271} {"train_loss": -43.592220306396484, "global_step": 274905, "epoch": 2271} {"train_loss": -42.287841796875, "global_step": 274906, "epoch": 2271} {"train_loss": -42.40987777709961, "global_step": 274907, "epoch": 2271} {"train_loss": -42.48525619506836, "global_step": 274908, "epoch": 2271} {"train_loss": -43.23594665527344, "global_step": 274909, "epoch": 2271} {"train_loss": -42.944271087646484, "global_step": 274910, "epoch": 2271} {"train_loss": -42.872287498032755, "global_step": 274911, "epoch": 2271, "val_loss": 2614668.25} {"train_loss": -43.738800048828125, "global_step": 274912, "epoch": 2272} {"train_loss": -43.066036224365234, "global_step": 274913, "epoch": 2272} {"train_loss": -43.980255126953125, "global_step": 274914, "epoch": 2272} {"train_loss": -43.30548095703125, "global_step": 274915, "epoch": 2272} {"train_loss": -43.614864349365234, "global_step": 274916, "epoch": 2272} {"train_loss": -43.72115707397461, "global_step": 274917, "epoch": 2272} {"train_loss": -43.54256820678711, "global_step": 274918, "epoch": 2272} {"train_loss": -44.02976608276367, "global_step": 274919, "epoch": 2272} {"train_loss": -43.729793548583984, "global_step": 274920, "epoch": 2272} {"train_loss": -43.54671859741211, "global_step": 274921, "epoch": 2272} {"train_loss": -43.843231201171875, "global_step": 274922, "epoch": 2272} {"train_loss": -43.755374908447266, "global_step": 274923, "epoch": 2272} {"train_loss": -43.610225677490234, "global_step": 274924, "epoch": 2272} {"train_loss": -43.66767120361328, "global_step": 274925, "epoch": 2272} {"train_loss": -43.86333084106445, "global_step": 274926, "epoch": 2272} {"train_loss": -43.14783477783203, "global_step": 274927, "epoch": 2272} {"train_loss": -43.539913177490234, "global_step": 274928, "epoch": 2272} {"train_loss": -43.2484245300293, "global_step": 274929, "epoch": 2272} {"train_loss": -43.29853057861328, "global_step": 274930, "epoch": 2272} {"train_loss": -43.50331497192383, "global_step": 274931, "epoch": 2272} {"train_loss": -43.95150375366211, "global_step": 274932, "epoch": 2272} {"train_loss": -43.67768096923828, "global_step": 274933, "epoch": 2272} {"train_loss": -43.51789855957031, "global_step": 274934, "epoch": 2272} {"train_loss": -43.1532096862793, "global_step": 274935, "epoch": 2272} {"train_loss": -43.65750503540039, "global_step": 274936, "epoch": 2272} {"train_loss": -43.681209564208984, "global_step": 274937, "epoch": 2272} {"train_loss": -43.64896011352539, "global_step": 274938, "epoch": 2272} {"train_loss": -41.9350700378418, "global_step": 274939, "epoch": 2272} {"train_loss": -42.34107208251953, "global_step": 274940, "epoch": 2272} {"train_loss": -42.07477951049805, "global_step": 274941, "epoch": 2272} {"train_loss": -43.00107192993164, "global_step": 274942, "epoch": 2272} {"train_loss": -42.26202392578125, "global_step": 274943, "epoch": 2272} {"train_loss": -42.594913482666016, "global_step": 274944, "epoch": 2272} {"train_loss": -43.154842376708984, "global_step": 274945, "epoch": 2272} {"train_loss": -42.52486038208008, "global_step": 274946, "epoch": 2272} {"train_loss": -43.43631362915039, "global_step": 274947, "epoch": 2272} {"train_loss": -41.774139404296875, "global_step": 274948, "epoch": 2272} {"train_loss": -42.89111328125, "global_step": 274949, "epoch": 2272} {"train_loss": -43.64728927612305, "global_step": 274950, "epoch": 2272} {"train_loss": -41.74222946166992, "global_step": 274951, "epoch": 2272} {"train_loss": -42.735877990722656, "global_step": 274952, "epoch": 2272} {"train_loss": -43.499263763427734, "global_step": 274953, "epoch": 2272} {"train_loss": -42.2799186706543, "global_step": 274954, "epoch": 2272} {"train_loss": -43.035186767578125, "global_step": 274955, "epoch": 2272} {"train_loss": -43.23851013183594, "global_step": 274956, "epoch": 2272} {"train_loss": -42.30957794189453, "global_step": 274957, "epoch": 2272} {"train_loss": -43.01487350463867, "global_step": 274958, "epoch": 2272} {"train_loss": -43.14365005493164, "global_step": 274959, "epoch": 2272} {"train_loss": -42.84141159057617, "global_step": 274960, "epoch": 2272} {"train_loss": -42.82435989379883, "global_step": 274961, "epoch": 2272} {"train_loss": -42.94066619873047, "global_step": 274962, "epoch": 2272} {"train_loss": -42.70077133178711, "global_step": 274963, "epoch": 2272} {"train_loss": -42.25132369995117, "global_step": 274964, "epoch": 2272} {"train_loss": -43.463863372802734, "global_step": 274965, "epoch": 2272} {"train_loss": -43.075111389160156, "global_step": 274966, "epoch": 2272} {"train_loss": -41.404232025146484, "global_step": 274967, "epoch": 2272} {"train_loss": -43.09037399291992, "global_step": 274968, "epoch": 2272} {"train_loss": -43.22628402709961, "global_step": 274969, "epoch": 2272} {"train_loss": -43.327266693115234, "global_step": 274970, "epoch": 2272} {"train_loss": -43.181678771972656, "global_step": 274971, "epoch": 2272} {"train_loss": -42.046756744384766, "global_step": 274972, "epoch": 2272} {"train_loss": -41.857086181640625, "global_step": 274973, "epoch": 2272} {"train_loss": -42.732154846191406, "global_step": 274974, "epoch": 2272} {"train_loss": -42.732357025146484, "global_step": 274975, "epoch": 2272} {"train_loss": -42.465816497802734, "global_step": 274976, "epoch": 2272} {"train_loss": -43.02787780761719, "global_step": 274977, "epoch": 2272} {"train_loss": -43.06597900390625, "global_step": 274978, "epoch": 2272} {"train_loss": -42.090816497802734, "global_step": 274979, "epoch": 2272} {"train_loss": -43.861541748046875, "global_step": 274980, "epoch": 2272} {"train_loss": -41.72827911376953, "global_step": 274981, "epoch": 2272} {"train_loss": -42.366912841796875, "global_step": 274982, "epoch": 2272} {"train_loss": -42.980010986328125, "global_step": 274983, "epoch": 2272} {"train_loss": -42.48280715942383, "global_step": 274984, "epoch": 2272} {"train_loss": -43.296913146972656, "global_step": 274985, "epoch": 2272} {"train_loss": -43.24676513671875, "global_step": 274986, "epoch": 2272} {"train_loss": -43.3764762878418, "global_step": 274987, "epoch": 2272} {"train_loss": -43.474613189697266, "global_step": 274988, "epoch": 2272} {"train_loss": -43.61361312866211, "global_step": 274989, "epoch": 2272} {"train_loss": -43.89836120605469, "global_step": 274990, "epoch": 2272} {"train_loss": -43.64829635620117, "global_step": 274991, "epoch": 2272} {"train_loss": -43.49580001831055, "global_step": 274992, "epoch": 2272} {"train_loss": -44.2253532409668, "global_step": 274993, "epoch": 2272} {"train_loss": -43.99775314331055, "global_step": 274994, "epoch": 2272} {"train_loss": -43.7866096496582, "global_step": 274995, "epoch": 2272} {"train_loss": -43.439510345458984, "global_step": 274996, "epoch": 2272} {"train_loss": -43.739620208740234, "global_step": 274997, "epoch": 2272} {"train_loss": -43.918739318847656, "global_step": 274998, "epoch": 2272} {"train_loss": -43.176692962646484, "global_step": 274999, "epoch": 2272} {"train_loss": -43.90692901611328, "global_step": 275000, "epoch": 2272} {"train_loss": -44.1815299987793, "global_step": 275001, "epoch": 2272} {"train_loss": -43.13063430786133, "global_step": 275002, "epoch": 2272} {"train_loss": -41.87335968017578, "global_step": 275003, "epoch": 2272} {"train_loss": -44.094722747802734, "global_step": 275004, "epoch": 2272} {"train_loss": -42.872772216796875, "global_step": 275005, "epoch": 2272} {"train_loss": -41.456329345703125, "global_step": 275006, "epoch": 2272} {"train_loss": -42.1331672668457, "global_step": 275007, "epoch": 2272} {"train_loss": -42.29904556274414, "global_step": 275008, "epoch": 2272} {"train_loss": -43.41714096069336, "global_step": 275009, "epoch": 2272} {"train_loss": -43.0723876953125, "global_step": 275010, "epoch": 2272} {"train_loss": -43.08967208862305, "global_step": 275011, "epoch": 2272} {"train_loss": -43.765071868896484, "global_step": 275012, "epoch": 2272} {"train_loss": -43.14106750488281, "global_step": 275013, "epoch": 2272} {"train_loss": -43.82257843017578, "global_step": 275014, "epoch": 2272} {"train_loss": -43.20779037475586, "global_step": 275015, "epoch": 2272} {"train_loss": -44.16278076171875, "global_step": 275016, "epoch": 2272} {"train_loss": -44.02440643310547, "global_step": 275017, "epoch": 2272} {"train_loss": -42.87704086303711, "global_step": 275018, "epoch": 2272} {"train_loss": -42.777099609375, "global_step": 275019, "epoch": 2272} {"train_loss": -44.07468032836914, "global_step": 275020, "epoch": 2272} {"train_loss": -43.49675750732422, "global_step": 275021, "epoch": 2272} {"train_loss": -43.1982536315918, "global_step": 275022, "epoch": 2272} {"train_loss": -43.822059631347656, "global_step": 275023, "epoch": 2272} {"train_loss": -44.02101516723633, "global_step": 275024, "epoch": 2272} {"train_loss": -43.735206604003906, "global_step": 275025, "epoch": 2272} {"train_loss": -43.489498138427734, "global_step": 275026, "epoch": 2272} {"train_loss": -43.942176818847656, "global_step": 275027, "epoch": 2272} {"train_loss": -43.358924865722656, "global_step": 275028, "epoch": 2272} {"train_loss": -43.303749084472656, "global_step": 275029, "epoch": 2272} {"train_loss": -43.76055908203125, "global_step": 275030, "epoch": 2272} {"train_loss": -43.6655387878418, "global_step": 275031, "epoch": 2272} {"train_loss": -43.19647147438743, "global_step": 275032, "epoch": 2272, "val_loss": 2755478.25} {"train_loss": -43.494014739990234, "global_step": 275033, "epoch": 2273} {"train_loss": -44.03200149536133, "global_step": 275034, "epoch": 2273} {"train_loss": -43.77665710449219, "global_step": 275035, "epoch": 2273} {"train_loss": -44.002986907958984, "global_step": 275036, "epoch": 2273} {"train_loss": -43.986785888671875, "global_step": 275037, "epoch": 2273} {"train_loss": -33.34466552734375, "global_step": 275038, "epoch": 2273} {"train_loss": -42.52081298828125, "global_step": 275039, "epoch": 2273} {"train_loss": -43.90975570678711, "global_step": 275040, "epoch": 2273} {"train_loss": -43.603981018066406, "global_step": 275041, "epoch": 2273} {"train_loss": -41.81708908081055, "global_step": 275042, "epoch": 2273} {"train_loss": -34.12186813354492, "global_step": 275043, "epoch": 2273} {"train_loss": -41.811737060546875, "global_step": 275044, "epoch": 2273} {"train_loss": -39.19152069091797, "global_step": 275045, "epoch": 2273} {"train_loss": -41.952552795410156, "global_step": 275046, "epoch": 2273} {"train_loss": -41.5422248840332, "global_step": 275047, "epoch": 2273} {"train_loss": -39.720542907714844, "global_step": 275048, "epoch": 2273} {"train_loss": -41.834991455078125, "global_step": 275049, "epoch": 2273} {"train_loss": -38.7260627746582, "global_step": 275050, "epoch": 2273} {"train_loss": -41.02791976928711, "global_step": 275051, "epoch": 2273} {"train_loss": -38.608333587646484, "global_step": 275052, "epoch": 2273} {"train_loss": -38.71745681762695, "global_step": 275053, "epoch": 2273} {"train_loss": -35.712928771972656, "global_step": 275054, "epoch": 2273} {"train_loss": -37.059967041015625, "global_step": 275055, "epoch": 2273} {"train_loss": -29.109012603759766, "global_step": 275056, "epoch": 2273} {"train_loss": -39.721370697021484, "global_step": 275057, "epoch": 2273} {"train_loss": -32.8910026550293, "global_step": 275058, "epoch": 2273} {"train_loss": -32.98667526245117, "global_step": 275059, "epoch": 2273} {"train_loss": -21.621706008911133, "global_step": 275060, "epoch": 2273} {"train_loss": -36.47021484375, "global_step": 275061, "epoch": 2273} {"train_loss": -36.276275634765625, "global_step": 275062, "epoch": 2273} {"train_loss": -32.9764404296875, "global_step": 275063, "epoch": 2273} {"train_loss": -23.39412498474121, "global_step": 275064, "epoch": 2273} {"train_loss": -17.830881118774414, "global_step": 275065, "epoch": 2273} {"train_loss": -34.024879455566406, "global_step": 275066, "epoch": 2273} {"train_loss": -26.077533721923828, "global_step": 275067, "epoch": 2273} {"train_loss": -37.622535705566406, "global_step": 275068, "epoch": 2273} {"train_loss": -36.23442459106445, "global_step": 275069, "epoch": 2273} {"train_loss": -10.662147521972656, "global_step": 275070, "epoch": 2273} {"train_loss": -29.569599151611328, "global_step": 275071, "epoch": 2273} {"train_loss": -2.437948703765869, "global_step": 275072, "epoch": 2273} {"train_loss": -32.603973388671875, "global_step": 275073, "epoch": 2273} {"train_loss": -33.579586029052734, "global_step": 275074, "epoch": 2273} {"train_loss": -27.430418014526367, "global_step": 275075, "epoch": 2273} {"train_loss": -34.862701416015625, "global_step": 275076, "epoch": 2273} {"train_loss": -33.88794708251953, "global_step": 275077, "epoch": 2273} {"train_loss": -29.978662490844727, "global_step": 275078, "epoch": 2273} {"train_loss": -34.66111755371094, "global_step": 275079, "epoch": 2273} {"train_loss": -35.964839935302734, "global_step": 275080, "epoch": 2273} {"train_loss": -35.49821853637695, "global_step": 275081, "epoch": 2273} {"train_loss": -34.79618835449219, "global_step": 275082, "epoch": 2273} {"train_loss": -35.38892364501953, "global_step": 275083, "epoch": 2273} {"train_loss": -38.07672119140625, "global_step": 275084, "epoch": 2273} {"train_loss": -37.40587615966797, "global_step": 275085, "epoch": 2273} {"train_loss": -35.9052848815918, "global_step": 275086, "epoch": 2273} {"train_loss": -37.26871871948242, "global_step": 275087, "epoch": 2273} {"train_loss": -38.595211029052734, "global_step": 275088, "epoch": 2273} {"train_loss": -37.45261764526367, "global_step": 275089, "epoch": 2273} {"train_loss": -37.29532241821289, "global_step": 275090, "epoch": 2273} {"train_loss": -37.086883544921875, "global_step": 275091, "epoch": 2273} {"train_loss": -37.67543411254883, "global_step": 275092, "epoch": 2273} {"train_loss": -37.78834533691406, "global_step": 275093, "epoch": 2273} {"train_loss": -37.932125091552734, "global_step": 275094, "epoch": 2273} {"train_loss": -36.83551788330078, "global_step": 275095, "epoch": 2273} {"train_loss": -37.74956130981445, "global_step": 275096, "epoch": 2273} {"train_loss": -38.38637161254883, "global_step": 275097, "epoch": 2273} {"train_loss": -38.38139724731445, "global_step": 275098, "epoch": 2273} {"train_loss": -37.769752502441406, "global_step": 275099, "epoch": 2273} {"train_loss": -37.976863861083984, "global_step": 275100, "epoch": 2273} {"train_loss": -38.82650375366211, "global_step": 275101, "epoch": 2273} {"train_loss": -37.888526916503906, "global_step": 275102, "epoch": 2273} {"train_loss": -38.215824127197266, "global_step": 275103, "epoch": 2273} {"train_loss": -40.15205764770508, "global_step": 275104, "epoch": 2273} {"train_loss": -39.465633392333984, "global_step": 275105, "epoch": 2273} {"train_loss": -38.81212615966797, "global_step": 275106, "epoch": 2273} {"train_loss": -38.724273681640625, "global_step": 275107, "epoch": 2273} {"train_loss": -38.82114791870117, "global_step": 275108, "epoch": 2273} {"train_loss": -40.12308883666992, "global_step": 275109, "epoch": 2273} {"train_loss": -39.6185417175293, "global_step": 275110, "epoch": 2273} {"train_loss": -39.112098693847656, "global_step": 275111, "epoch": 2273} {"train_loss": -38.702415466308594, "global_step": 275112, "epoch": 2273} {"train_loss": -39.7762565612793, "global_step": 275113, "epoch": 2273} {"train_loss": -39.90781784057617, "global_step": 275114, "epoch": 2273} {"train_loss": -39.637935638427734, "global_step": 275115, "epoch": 2273} {"train_loss": -39.97795104980469, "global_step": 275116, "epoch": 2273} {"train_loss": -39.26023483276367, "global_step": 275117, "epoch": 2273} {"train_loss": -39.94371032714844, "global_step": 275118, "epoch": 2273} {"train_loss": -39.86423873901367, "global_step": 275119, "epoch": 2273} {"train_loss": -40.04258346557617, "global_step": 275120, "epoch": 2273} {"train_loss": -39.86314010620117, "global_step": 275121, "epoch": 2273} {"train_loss": -39.851436614990234, "global_step": 275122, "epoch": 2273} {"train_loss": -39.94492721557617, "global_step": 275123, "epoch": 2273} {"train_loss": -39.23493194580078, "global_step": 275124, "epoch": 2273} {"train_loss": -39.6871452331543, "global_step": 275125, "epoch": 2273} {"train_loss": -39.55283737182617, "global_step": 275126, "epoch": 2273} {"train_loss": -39.75540542602539, "global_step": 275127, "epoch": 2273} {"train_loss": -40.43898391723633, "global_step": 275128, "epoch": 2273} {"train_loss": -40.429718017578125, "global_step": 275129, "epoch": 2273} {"train_loss": -40.601409912109375, "global_step": 275130, "epoch": 2273} {"train_loss": -39.98297119140625, "global_step": 275131, "epoch": 2273} {"train_loss": -40.50881576538086, "global_step": 275132, "epoch": 2273} {"train_loss": -40.18613815307617, "global_step": 275133, "epoch": 2273} {"train_loss": -40.45172882080078, "global_step": 275134, "epoch": 2273} {"train_loss": -39.75503921508789, "global_step": 275135, "epoch": 2273} {"train_loss": -40.91496658325195, "global_step": 275136, "epoch": 2273} {"train_loss": -40.85393142700195, "global_step": 275137, "epoch": 2273} {"train_loss": -40.4664421081543, "global_step": 275138, "epoch": 2273} {"train_loss": -40.11707305908203, "global_step": 275139, "epoch": 2273} {"train_loss": -39.94831848144531, "global_step": 275140, "epoch": 2273} {"train_loss": -40.83759689331055, "global_step": 275141, "epoch": 2273} {"train_loss": -41.440338134765625, "global_step": 275142, "epoch": 2273} {"train_loss": -40.190223693847656, "global_step": 275143, "epoch": 2273} {"train_loss": -41.46714401245117, "global_step": 275144, "epoch": 2273} {"train_loss": -40.3315544128418, "global_step": 275145, "epoch": 2273} {"train_loss": -40.49619674682617, "global_step": 275146, "epoch": 2273} {"train_loss": -41.291011810302734, "global_step": 275147, "epoch": 2273} {"train_loss": -40.98530197143555, "global_step": 275148, "epoch": 2273} {"train_loss": -40.95686340332031, "global_step": 275149, "epoch": 2273} {"train_loss": -41.17643356323242, "global_step": 275150, "epoch": 2273} {"train_loss": -40.244808197021484, "global_step": 275151, "epoch": 2273} {"train_loss": -40.95657730102539, "global_step": 275152, "epoch": 2273} {"train_loss": -37.5470894466747, "global_step": 275153, "epoch": 2273, "val_loss": 2689944.25} {"train_loss": -41.660728454589844, "global_step": 275154, "epoch": 2274} {"train_loss": -41.492610931396484, "global_step": 275155, "epoch": 2274} {"train_loss": -40.45266342163086, "global_step": 275156, "epoch": 2274} {"train_loss": -40.94068145751953, "global_step": 275157, "epoch": 2274} {"train_loss": -40.381465911865234, "global_step": 275158, "epoch": 2274} {"train_loss": -41.48087692260742, "global_step": 275159, "epoch": 2274} {"train_loss": -41.040706634521484, "global_step": 275160, "epoch": 2274} {"train_loss": -41.71535873413086, "global_step": 275161, "epoch": 2274} {"train_loss": -41.77252197265625, "global_step": 275162, "epoch": 2274} {"train_loss": -42.06942367553711, "global_step": 275163, "epoch": 2274} {"train_loss": -41.635650634765625, "global_step": 275164, "epoch": 2274} {"train_loss": -40.99435043334961, "global_step": 275165, "epoch": 2274} {"train_loss": -41.931129455566406, "global_step": 275166, "epoch": 2274} {"train_loss": -41.590538024902344, "global_step": 275167, "epoch": 2274} {"train_loss": -41.35820007324219, "global_step": 275168, "epoch": 2274} {"train_loss": -41.37248229980469, "global_step": 275169, "epoch": 2274} {"train_loss": -42.48418426513672, "global_step": 275170, "epoch": 2274} {"train_loss": -41.9151611328125, "global_step": 275171, "epoch": 2274} {"train_loss": -42.30048370361328, "global_step": 275172, "epoch": 2274} {"train_loss": -41.65365219116211, "global_step": 275173, "epoch": 2274} {"train_loss": -41.91825485229492, "global_step": 275174, "epoch": 2274} {"train_loss": -42.110164642333984, "global_step": 275175, "epoch": 2274} {"train_loss": -41.569889068603516, "global_step": 275176, "epoch": 2274} {"train_loss": -42.0997314453125, "global_step": 275177, "epoch": 2274} {"train_loss": -41.33232498168945, "global_step": 275178, "epoch": 2274} {"train_loss": -42.358428955078125, "global_step": 275179, "epoch": 2274} {"train_loss": -42.51852035522461, "global_step": 275180, "epoch": 2274} {"train_loss": -41.793636322021484, "global_step": 275181, "epoch": 2274} {"train_loss": -41.94844436645508, "global_step": 275182, "epoch": 2274} {"train_loss": -42.13870620727539, "global_step": 275183, "epoch": 2274} {"train_loss": -42.415401458740234, "global_step": 275184, "epoch": 2274} {"train_loss": -42.00623321533203, "global_step": 275185, "epoch": 2274} {"train_loss": -42.02996063232422, "global_step": 275186, "epoch": 2274} {"train_loss": -41.69722366333008, "global_step": 275187, "epoch": 2274} {"train_loss": -42.216426849365234, "global_step": 275188, "epoch": 2274} {"train_loss": -41.80880355834961, "global_step": 275189, "epoch": 2274} {"train_loss": -42.4976692199707, "global_step": 275190, "epoch": 2274} {"train_loss": -41.5770149230957, "global_step": 275191, "epoch": 2274} {"train_loss": -41.436824798583984, "global_step": 275192, "epoch": 2274} {"train_loss": -42.289527893066406, "global_step": 275193, "epoch": 2274} {"train_loss": -41.93251419067383, "global_step": 275194, "epoch": 2274} {"train_loss": -42.160152435302734, "global_step": 275195, "epoch": 2274} {"train_loss": -42.57683181762695, "global_step": 275196, "epoch": 2274} {"train_loss": -41.51005554199219, "global_step": 275197, "epoch": 2274} {"train_loss": -42.596412658691406, "global_step": 275198, "epoch": 2274} {"train_loss": -42.453697204589844, "global_step": 275199, "epoch": 2274} {"train_loss": -42.47305679321289, "global_step": 275200, "epoch": 2274} {"train_loss": -42.5842170715332, "global_step": 275201, "epoch": 2274} {"train_loss": -43.08348083496094, "global_step": 275202, "epoch": 2274} {"train_loss": -41.92170333862305, "global_step": 275203, "epoch": 2274} {"train_loss": -42.056312561035156, "global_step": 275204, "epoch": 2274} {"train_loss": -42.63136672973633, "global_step": 275205, "epoch": 2274} {"train_loss": -42.85114288330078, "global_step": 275206, "epoch": 2274} {"train_loss": -42.453060150146484, "global_step": 275207, "epoch": 2274} {"train_loss": -40.918453216552734, "global_step": 275208, "epoch": 2274} {"train_loss": -42.54694747924805, "global_step": 275209, "epoch": 2274} {"train_loss": -43.119720458984375, "global_step": 275210, "epoch": 2274} {"train_loss": -42.314571380615234, "global_step": 275211, "epoch": 2274} {"train_loss": -42.64203643798828, "global_step": 275212, "epoch": 2274} {"train_loss": -42.92649459838867, "global_step": 275213, "epoch": 2274} {"train_loss": -43.092838287353516, "global_step": 275214, "epoch": 2274} {"train_loss": -42.36715316772461, "global_step": 275215, "epoch": 2274} {"train_loss": -42.828678131103516, "global_step": 275216, "epoch": 2274} {"train_loss": -42.68992233276367, "global_step": 275217, "epoch": 2274} {"train_loss": -43.37622833251953, "global_step": 275218, "epoch": 2274} {"train_loss": -42.27518844604492, "global_step": 275219, "epoch": 2274} {"train_loss": -42.3121337890625, "global_step": 275220, "epoch": 2274} {"train_loss": -42.992855072021484, "global_step": 275221, "epoch": 2274} {"train_loss": -42.00923538208008, "global_step": 275222, "epoch": 2274} {"train_loss": -43.50880432128906, "global_step": 275223, "epoch": 2274} {"train_loss": -42.70115661621094, "global_step": 275224, "epoch": 2274} {"train_loss": -43.09743881225586, "global_step": 275225, "epoch": 2274} {"train_loss": -43.319671630859375, "global_step": 275226, "epoch": 2274} {"train_loss": -42.61930465698242, "global_step": 275227, "epoch": 2274} {"train_loss": -41.79978942871094, "global_step": 275228, "epoch": 2274} {"train_loss": -42.661983489990234, "global_step": 275229, "epoch": 2274} {"train_loss": -42.95106887817383, "global_step": 275230, "epoch": 2274} {"train_loss": -43.01333236694336, "global_step": 275231, "epoch": 2274} {"train_loss": -42.49171829223633, "global_step": 275232, "epoch": 2274} {"train_loss": -42.648887634277344, "global_step": 275233, "epoch": 2274} {"train_loss": -42.42325973510742, "global_step": 275234, "epoch": 2274} {"train_loss": -42.17206954956055, "global_step": 275235, "epoch": 2274} {"train_loss": -42.67802810668945, "global_step": 275236, "epoch": 2274} {"train_loss": -42.536651611328125, "global_step": 275237, "epoch": 2274} {"train_loss": -43.02022933959961, "global_step": 275238, "epoch": 2274} {"train_loss": -40.695556640625, "global_step": 275239, "epoch": 2274} {"train_loss": -43.02204895019531, "global_step": 275240, "epoch": 2274} {"train_loss": -42.878578186035156, "global_step": 275241, "epoch": 2274} {"train_loss": -43.18585968017578, "global_step": 275242, "epoch": 2274} {"train_loss": -43.1824951171875, "global_step": 275243, "epoch": 2274} {"train_loss": -43.00879669189453, "global_step": 275244, "epoch": 2274} {"train_loss": -42.8858528137207, "global_step": 275245, "epoch": 2274} {"train_loss": -42.935699462890625, "global_step": 275246, "epoch": 2274} {"train_loss": -42.801631927490234, "global_step": 275247, "epoch": 2274} {"train_loss": -42.03484344482422, "global_step": 275248, "epoch": 2274} {"train_loss": -42.33231735229492, "global_step": 275249, "epoch": 2274} {"train_loss": -42.8206901550293, "global_step": 275250, "epoch": 2274} {"train_loss": -41.577606201171875, "global_step": 275251, "epoch": 2274} {"train_loss": -42.817726135253906, "global_step": 275252, "epoch": 2274} {"train_loss": -42.007808685302734, "global_step": 275253, "epoch": 2274} {"train_loss": -41.1662712097168, "global_step": 275254, "epoch": 2274} {"train_loss": -42.71986389160156, "global_step": 275255, "epoch": 2274} {"train_loss": -42.131160736083984, "global_step": 275256, "epoch": 2274} {"train_loss": -41.68526840209961, "global_step": 275257, "epoch": 2274} {"train_loss": -42.90816879272461, "global_step": 275258, "epoch": 2274} {"train_loss": -43.21448516845703, "global_step": 275259, "epoch": 2274} {"train_loss": -42.275047302246094, "global_step": 275260, "epoch": 2274} {"train_loss": -42.96752166748047, "global_step": 275261, "epoch": 2274} {"train_loss": -42.86870574951172, "global_step": 275262, "epoch": 2274} {"train_loss": -42.670345306396484, "global_step": 275263, "epoch": 2274} {"train_loss": -42.80337142944336, "global_step": 275264, "epoch": 2274} {"train_loss": -42.65603256225586, "global_step": 275265, "epoch": 2274} {"train_loss": -42.28657150268555, "global_step": 275266, "epoch": 2274} {"train_loss": -42.33436965942383, "global_step": 275267, "epoch": 2274} {"train_loss": -41.68754196166992, "global_step": 275268, "epoch": 2274} {"train_loss": -41.60920333862305, "global_step": 275269, "epoch": 2274} {"train_loss": -43.02992630004883, "global_step": 275270, "epoch": 2274} {"train_loss": -42.48733901977539, "global_step": 275271, "epoch": 2274} {"train_loss": -40.71091842651367, "global_step": 275272, "epoch": 2274} {"train_loss": -41.798255920410156, "global_step": 275273, "epoch": 2274} {"train_loss": -42.23409791426225, "global_step": 275274, "epoch": 2274, "val_loss": 2718817.75} {"train_loss": -39.79038619995117, "global_step": 275275, "epoch": 2275} {"train_loss": -41.65601348876953, "global_step": 275276, "epoch": 2275} {"train_loss": -40.703224182128906, "global_step": 275277, "epoch": 2275} {"train_loss": -41.89226150512695, "global_step": 275278, "epoch": 2275} {"train_loss": -39.3326530456543, "global_step": 275279, "epoch": 2275} {"train_loss": -40.303707122802734, "global_step": 275280, "epoch": 2275} {"train_loss": -41.34955978393555, "global_step": 275281, "epoch": 2275} {"train_loss": -41.277530670166016, "global_step": 275282, "epoch": 2275} {"train_loss": -40.0538444519043, "global_step": 275283, "epoch": 2275} {"train_loss": -41.725013732910156, "global_step": 275284, "epoch": 2275} {"train_loss": -38.99862289428711, "global_step": 275285, "epoch": 2275} {"train_loss": -41.50950241088867, "global_step": 275286, "epoch": 2275} {"train_loss": -40.015987396240234, "global_step": 275287, "epoch": 2275} {"train_loss": -38.51876449584961, "global_step": 275288, "epoch": 2275} {"train_loss": -40.8513069152832, "global_step": 275289, "epoch": 2275} {"train_loss": -39.56850051879883, "global_step": 275290, "epoch": 2275} {"train_loss": -37.825103759765625, "global_step": 275291, "epoch": 2275} {"train_loss": -41.84831237792969, "global_step": 275292, "epoch": 2275} {"train_loss": -40.03740310668945, "global_step": 275293, "epoch": 2275} {"train_loss": -38.76972198486328, "global_step": 275294, "epoch": 2275} {"train_loss": -39.65871047973633, "global_step": 275295, "epoch": 2275} {"train_loss": -40.894466400146484, "global_step": 275296, "epoch": 2275} {"train_loss": -41.270381927490234, "global_step": 275297, "epoch": 2275} {"train_loss": -41.33082962036133, "global_step": 275298, "epoch": 2275} {"train_loss": -40.92475891113281, "global_step": 275299, "epoch": 2275} {"train_loss": -41.60822677612305, "global_step": 275300, "epoch": 2275} {"train_loss": -41.956485748291016, "global_step": 275301, "epoch": 2275} {"train_loss": -41.14836502075195, "global_step": 275302, "epoch": 2275} {"train_loss": -41.631404876708984, "global_step": 275303, "epoch": 2275} {"train_loss": -41.53932189941406, "global_step": 275304, "epoch": 2275} {"train_loss": -41.887542724609375, "global_step": 275305, "epoch": 2275} {"train_loss": -41.741371154785156, "global_step": 275306, "epoch": 2275} {"train_loss": -40.86088180541992, "global_step": 275307, "epoch": 2275} {"train_loss": -42.13155746459961, "global_step": 275308, "epoch": 2275} {"train_loss": -41.730525970458984, "global_step": 275309, "epoch": 2275} {"train_loss": -42.2763671875, "global_step": 275310, "epoch": 2275} {"train_loss": -41.834442138671875, "global_step": 275311, "epoch": 2275} {"train_loss": -41.84361267089844, "global_step": 275312, "epoch": 2275} {"train_loss": -41.704647064208984, "global_step": 275313, "epoch": 2275} {"train_loss": -42.09748458862305, "global_step": 275314, "epoch": 2275} {"train_loss": -42.33296585083008, "global_step": 275315, "epoch": 2275} {"train_loss": -41.208805084228516, "global_step": 275316, "epoch": 2275} {"train_loss": -42.56607437133789, "global_step": 275317, "epoch": 2275} {"train_loss": -42.42434310913086, "global_step": 275318, "epoch": 2275} {"train_loss": -41.88276290893555, "global_step": 275319, "epoch": 2275} {"train_loss": -42.44033432006836, "global_step": 275320, "epoch": 2275} {"train_loss": -42.24726104736328, "global_step": 275321, "epoch": 2275} {"train_loss": -42.162052154541016, "global_step": 275322, "epoch": 2275} {"train_loss": -42.15852737426758, "global_step": 275323, "epoch": 2275} {"train_loss": -42.02177429199219, "global_step": 275324, "epoch": 2275} {"train_loss": -41.81083297729492, "global_step": 275325, "epoch": 2275} {"train_loss": -42.09328842163086, "global_step": 275326, "epoch": 2275} {"train_loss": -42.314064025878906, "global_step": 275327, "epoch": 2275} {"train_loss": -41.81551742553711, "global_step": 275328, "epoch": 2275} {"train_loss": -41.50010299682617, "global_step": 275329, "epoch": 2275} {"train_loss": -41.84993362426758, "global_step": 275330, "epoch": 2275} {"train_loss": -42.7042350769043, "global_step": 275331, "epoch": 2275} {"train_loss": -43.024330139160156, "global_step": 275332, "epoch": 2275} {"train_loss": -42.31196594238281, "global_step": 275333, "epoch": 2275} {"train_loss": -42.17948532104492, "global_step": 275334, "epoch": 2275} {"train_loss": -42.46062088012695, "global_step": 275335, "epoch": 2275} {"train_loss": -42.38357162475586, "global_step": 275336, "epoch": 2275} {"train_loss": -42.52618408203125, "global_step": 275337, "epoch": 2275} {"train_loss": -42.715660095214844, "global_step": 275338, "epoch": 2275} {"train_loss": -43.175655364990234, "global_step": 275339, "epoch": 2275} {"train_loss": -42.75188064575195, "global_step": 275340, "epoch": 2275} {"train_loss": -43.22278594970703, "global_step": 275341, "epoch": 2275} {"train_loss": -42.856719970703125, "global_step": 275342, "epoch": 2275} {"train_loss": -42.878326416015625, "global_step": 275343, "epoch": 2275} {"train_loss": -42.58363723754883, "global_step": 275344, "epoch": 2275} {"train_loss": -43.030731201171875, "global_step": 275345, "epoch": 2275} {"train_loss": -42.68033218383789, "global_step": 275346, "epoch": 2275} {"train_loss": -42.36412048339844, "global_step": 275347, "epoch": 2275} {"train_loss": -42.5623893737793, "global_step": 275348, "epoch": 2275} {"train_loss": -43.17558670043945, "global_step": 275349, "epoch": 2275} {"train_loss": -43.246456146240234, "global_step": 275350, "epoch": 2275} {"train_loss": -43.38651657104492, "global_step": 275351, "epoch": 2275} {"train_loss": -42.8922233581543, "global_step": 275352, "epoch": 2275} {"train_loss": -43.15069580078125, "global_step": 275353, "epoch": 2275} {"train_loss": -43.08121871948242, "global_step": 275354, "epoch": 2275} {"train_loss": -43.04729080200195, "global_step": 275355, "epoch": 2275} {"train_loss": -42.75435256958008, "global_step": 275356, "epoch": 2275} {"train_loss": -43.654396057128906, "global_step": 275357, "epoch": 2275} {"train_loss": -43.18325424194336, "global_step": 275358, "epoch": 2275} {"train_loss": -43.72336959838867, "global_step": 275359, "epoch": 2275} {"train_loss": -43.8690185546875, "global_step": 275360, "epoch": 2275} {"train_loss": -43.500850677490234, "global_step": 275361, "epoch": 2275} {"train_loss": -43.3862419128418, "global_step": 275362, "epoch": 2275} {"train_loss": -43.25013732910156, "global_step": 275363, "epoch": 2275} {"train_loss": -43.77213668823242, "global_step": 275364, "epoch": 2275} {"train_loss": -43.394996643066406, "global_step": 275365, "epoch": 2275} {"train_loss": -42.83478927612305, "global_step": 275366, "epoch": 2275} {"train_loss": -43.702091217041016, "global_step": 275367, "epoch": 2275} {"train_loss": -43.27397918701172, "global_step": 275368, "epoch": 2275} {"train_loss": -43.71390914916992, "global_step": 275369, "epoch": 2275} {"train_loss": -43.752418518066406, "global_step": 275370, "epoch": 2275} {"train_loss": -43.510066986083984, "global_step": 275371, "epoch": 2275} {"train_loss": -43.4304313659668, "global_step": 275372, "epoch": 2275} {"train_loss": -43.04365921020508, "global_step": 275373, "epoch": 2275} {"train_loss": -43.24142837524414, "global_step": 275374, "epoch": 2275} {"train_loss": -42.921966552734375, "global_step": 275375, "epoch": 2275} {"train_loss": -43.665130615234375, "global_step": 275376, "epoch": 2275} {"train_loss": -43.143218994140625, "global_step": 275377, "epoch": 2275} {"train_loss": -43.335330963134766, "global_step": 275378, "epoch": 2275} {"train_loss": -43.47304153442383, "global_step": 275379, "epoch": 2275} {"train_loss": -42.87936782836914, "global_step": 275380, "epoch": 2275} {"train_loss": -43.854671478271484, "global_step": 275381, "epoch": 2275} {"train_loss": -43.24251937866211, "global_step": 275382, "epoch": 2275} {"train_loss": -42.37485885620117, "global_step": 275383, "epoch": 2275} {"train_loss": -42.23563766479492, "global_step": 275384, "epoch": 2275} {"train_loss": -41.26980209350586, "global_step": 275385, "epoch": 2275} {"train_loss": -42.31135177612305, "global_step": 275386, "epoch": 2275} {"train_loss": -42.72774124145508, "global_step": 275387, "epoch": 2275} {"train_loss": -43.07016372680664, "global_step": 275388, "epoch": 2275} {"train_loss": -42.95162582397461, "global_step": 275389, "epoch": 2275} {"train_loss": -42.62300109863281, "global_step": 275390, "epoch": 2275} {"train_loss": -39.463191986083984, "global_step": 275391, "epoch": 2275} {"train_loss": -28.264205932617188, "global_step": 275392, "epoch": 2275} {"train_loss": -9.040328025817871, "global_step": 275393, "epoch": 2275} {"train_loss": -4.221446514129639, "global_step": 275394, "epoch": 2275} {"train_loss": -41.39538358656828, "global_step": 275395, "epoch": 2275, "val_loss": 2729669.75} {"train_loss": -30.506494522094727, "global_step": 275396, "epoch": 2276} {"train_loss": -25.365081787109375, "global_step": 275397, "epoch": 2276} {"train_loss": -41.0241584777832, "global_step": 275398, "epoch": 2276} {"train_loss": -27.818634033203125, "global_step": 275399, "epoch": 2276} {"train_loss": -39.59143829345703, "global_step": 275400, "epoch": 2276} {"train_loss": -30.659048080444336, "global_step": 275401, "epoch": 2276} {"train_loss": -39.51173400878906, "global_step": 275402, "epoch": 2276} {"train_loss": -35.10869598388672, "global_step": 275403, "epoch": 2276} {"train_loss": -39.70618438720703, "global_step": 275404, "epoch": 2276} {"train_loss": -32.88524627685547, "global_step": 275405, "epoch": 2276} {"train_loss": -40.874122619628906, "global_step": 275406, "epoch": 2276} {"train_loss": -36.297847747802734, "global_step": 275407, "epoch": 2276} {"train_loss": -41.48231887817383, "global_step": 275408, "epoch": 2276} {"train_loss": -37.007720947265625, "global_step": 275409, "epoch": 2276} {"train_loss": -39.55220413208008, "global_step": 275410, "epoch": 2276} {"train_loss": -39.594818115234375, "global_step": 275411, "epoch": 2276} {"train_loss": -37.43893051147461, "global_step": 275412, "epoch": 2276} {"train_loss": -40.44070053100586, "global_step": 275413, "epoch": 2276} {"train_loss": -37.91081619262695, "global_step": 275414, "epoch": 2276} {"train_loss": -40.74908447265625, "global_step": 275415, "epoch": 2276} {"train_loss": -40.38330078125, "global_step": 275416, "epoch": 2276} {"train_loss": -38.671443939208984, "global_step": 275417, "epoch": 2276} {"train_loss": -40.0270881652832, "global_step": 275418, "epoch": 2276} {"train_loss": -40.084205627441406, "global_step": 275419, "epoch": 2276} {"train_loss": -40.4092903137207, "global_step": 275420, "epoch": 2276} {"train_loss": -41.26507568359375, "global_step": 275421, "epoch": 2276} {"train_loss": -40.321773529052734, "global_step": 275422, "epoch": 2276} {"train_loss": -40.08657455444336, "global_step": 275423, "epoch": 2276} {"train_loss": -41.515865325927734, "global_step": 275424, "epoch": 2276} {"train_loss": -41.08089828491211, "global_step": 275425, "epoch": 2276} {"train_loss": -40.658103942871094, "global_step": 275426, "epoch": 2276} {"train_loss": -40.86491775512695, "global_step": 275427, "epoch": 2276} {"train_loss": -41.19123458862305, "global_step": 275428, "epoch": 2276} {"train_loss": -41.25327682495117, "global_step": 275429, "epoch": 2276} {"train_loss": -41.247314453125, "global_step": 275430, "epoch": 2276} {"train_loss": -41.77410888671875, "global_step": 275431, "epoch": 2276} {"train_loss": -41.04940414428711, "global_step": 275432, "epoch": 2276} {"train_loss": -40.445831298828125, "global_step": 275433, "epoch": 2276} {"train_loss": -41.69401168823242, "global_step": 275434, "epoch": 2276} {"train_loss": -41.557918548583984, "global_step": 275435, "epoch": 2276} {"train_loss": -41.6168098449707, "global_step": 275436, "epoch": 2276} {"train_loss": -42.1483268737793, "global_step": 275437, "epoch": 2276} {"train_loss": -41.61924362182617, "global_step": 275438, "epoch": 2276} {"train_loss": -42.530738830566406, "global_step": 275439, "epoch": 2276} {"train_loss": -42.58254623413086, "global_step": 275440, "epoch": 2276} {"train_loss": -41.2611198425293, "global_step": 275441, "epoch": 2276} {"train_loss": -42.41624069213867, "global_step": 275442, "epoch": 2276} {"train_loss": -42.40805435180664, "global_step": 275443, "epoch": 2276} {"train_loss": -42.57524490356445, "global_step": 275444, "epoch": 2276} {"train_loss": -42.3255615234375, "global_step": 275445, "epoch": 2276} {"train_loss": -42.54859161376953, "global_step": 275446, "epoch": 2276} {"train_loss": -42.413002014160156, "global_step": 275447, "epoch": 2276} {"train_loss": -42.58950424194336, "global_step": 275448, "epoch": 2276} {"train_loss": -42.5046272277832, "global_step": 275449, "epoch": 2276} {"train_loss": -42.39792251586914, "global_step": 275450, "epoch": 2276} {"train_loss": -41.9241828918457, "global_step": 275451, "epoch": 2276} {"train_loss": -42.79338836669922, "global_step": 275452, "epoch": 2276} {"train_loss": -42.94016647338867, "global_step": 275453, "epoch": 2276} {"train_loss": -42.499122619628906, "global_step": 275454, "epoch": 2276} {"train_loss": -42.415287017822266, "global_step": 275455, "epoch": 2276} {"train_loss": -42.22919845581055, "global_step": 275456, "epoch": 2276} {"train_loss": -42.617332458496094, "global_step": 275457, "epoch": 2276} {"train_loss": -42.287227630615234, "global_step": 275458, "epoch": 2276} {"train_loss": -42.4644889831543, "global_step": 275459, "epoch": 2276} {"train_loss": -42.501197814941406, "global_step": 275460, "epoch": 2276} {"train_loss": -43.0625114440918, "global_step": 275461, "epoch": 2276} {"train_loss": -42.26008987426758, "global_step": 275462, "epoch": 2276} {"train_loss": -42.1024284362793, "global_step": 275463, "epoch": 2276} {"train_loss": -43.04539108276367, "global_step": 275464, "epoch": 2276} {"train_loss": -42.87372589111328, "global_step": 275465, "epoch": 2276} {"train_loss": -42.616573333740234, "global_step": 275466, "epoch": 2276} {"train_loss": -42.54753494262695, "global_step": 275467, "epoch": 2276} {"train_loss": -43.39829635620117, "global_step": 275468, "epoch": 2276} {"train_loss": -43.187381744384766, "global_step": 275469, "epoch": 2276} {"train_loss": -42.911495208740234, "global_step": 275470, "epoch": 2276} {"train_loss": -43.21715545654297, "global_step": 275471, "epoch": 2276} {"train_loss": -43.056396484375, "global_step": 275472, "epoch": 2276} {"train_loss": -43.392127990722656, "global_step": 275473, "epoch": 2276} {"train_loss": -42.37794876098633, "global_step": 275474, "epoch": 2276} {"train_loss": -43.28704833984375, "global_step": 275475, "epoch": 2276} {"train_loss": -43.47378158569336, "global_step": 275476, "epoch": 2276} {"train_loss": -42.98545455932617, "global_step": 275477, "epoch": 2276} {"train_loss": -43.2861328125, "global_step": 275478, "epoch": 2276} {"train_loss": -43.0330924987793, "global_step": 275479, "epoch": 2276} {"train_loss": -42.96102523803711, "global_step": 275480, "epoch": 2276} {"train_loss": -42.956146240234375, "global_step": 275481, "epoch": 2276} {"train_loss": -43.61994552612305, "global_step": 275482, "epoch": 2276} {"train_loss": -43.08729553222656, "global_step": 275483, "epoch": 2276} {"train_loss": -43.5535774230957, "global_step": 275484, "epoch": 2276} {"train_loss": -43.40298080444336, "global_step": 275485, "epoch": 2276} {"train_loss": -43.098995208740234, "global_step": 275486, "epoch": 2276} {"train_loss": -43.521820068359375, "global_step": 275487, "epoch": 2276} {"train_loss": -43.13816452026367, "global_step": 275488, "epoch": 2276} {"train_loss": -43.266780853271484, "global_step": 275489, "epoch": 2276} {"train_loss": -43.74365997314453, "global_step": 275490, "epoch": 2276} {"train_loss": -43.17095947265625, "global_step": 275491, "epoch": 2276} {"train_loss": -43.669593811035156, "global_step": 275492, "epoch": 2276} {"train_loss": -43.85005569458008, "global_step": 275493, "epoch": 2276} {"train_loss": -43.81661605834961, "global_step": 275494, "epoch": 2276} {"train_loss": -43.796661376953125, "global_step": 275495, "epoch": 2276} {"train_loss": -43.23789596557617, "global_step": 275496, "epoch": 2276} {"train_loss": -43.51460647583008, "global_step": 275497, "epoch": 2276} {"train_loss": -43.810482025146484, "global_step": 275498, "epoch": 2276} {"train_loss": -43.65099334716797, "global_step": 275499, "epoch": 2276} {"train_loss": -44.05843734741211, "global_step": 275500, "epoch": 2276} {"train_loss": -44.064144134521484, "global_step": 275501, "epoch": 2276} {"train_loss": -43.62360763549805, "global_step": 275502, "epoch": 2276} {"train_loss": -43.70643615722656, "global_step": 275503, "epoch": 2276} {"train_loss": -43.561912536621094, "global_step": 275504, "epoch": 2276} {"train_loss": -43.83456039428711, "global_step": 275505, "epoch": 2276} {"train_loss": -43.63962936401367, "global_step": 275506, "epoch": 2276} {"train_loss": -44.16453552246094, "global_step": 275507, "epoch": 2276} {"train_loss": -43.26091003417969, "global_step": 275508, "epoch": 2276} {"train_loss": -43.35587692260742, "global_step": 275509, "epoch": 2276} {"train_loss": -43.86525344848633, "global_step": 275510, "epoch": 2276} {"train_loss": -42.96645736694336, "global_step": 275511, "epoch": 2276} {"train_loss": -43.7270622253418, "global_step": 275512, "epoch": 2276} {"train_loss": -43.38016128540039, "global_step": 275513, "epoch": 2276} {"train_loss": -44.31852340698242, "global_step": 275514, "epoch": 2276} {"train_loss": -40.4434928894043, "global_step": 275515, "epoch": 2276} {"train_loss": -41.56273124631771, "global_step": 275516, "epoch": 2276, "val_loss": 2639716.75} {"train_loss": -42.49579620361328, "global_step": 275517, "epoch": 2277} {"train_loss": -41.31740188598633, "global_step": 275518, "epoch": 2277} {"train_loss": -37.882965087890625, "global_step": 275519, "epoch": 2277} {"train_loss": -42.41535186767578, "global_step": 275520, "epoch": 2277} {"train_loss": -42.098663330078125, "global_step": 275521, "epoch": 2277} {"train_loss": -42.78818893432617, "global_step": 275522, "epoch": 2277} {"train_loss": -43.1278190612793, "global_step": 275523, "epoch": 2277} {"train_loss": -42.271461486816406, "global_step": 275524, "epoch": 2277} {"train_loss": -42.770015716552734, "global_step": 275525, "epoch": 2277} {"train_loss": -36.271034240722656, "global_step": 275526, "epoch": 2277} {"train_loss": -41.09273910522461, "global_step": 275527, "epoch": 2277} {"train_loss": -40.540496826171875, "global_step": 275528, "epoch": 2277} {"train_loss": -37.948692321777344, "global_step": 275529, "epoch": 2277} {"train_loss": -38.713478088378906, "global_step": 275530, "epoch": 2277} {"train_loss": -40.94855880737305, "global_step": 275531, "epoch": 2277} {"train_loss": -41.344200134277344, "global_step": 275532, "epoch": 2277} {"train_loss": -41.71018600463867, "global_step": 275533, "epoch": 2277} {"train_loss": -37.47806930541992, "global_step": 275534, "epoch": 2277} {"train_loss": -38.904815673828125, "global_step": 275535, "epoch": 2277} {"train_loss": -39.85837936401367, "global_step": 275536, "epoch": 2277} {"train_loss": -41.26418685913086, "global_step": 275537, "epoch": 2277} {"train_loss": -42.223697662353516, "global_step": 275538, "epoch": 2277} {"train_loss": -42.309356689453125, "global_step": 275539, "epoch": 2277} {"train_loss": -27.87544059753418, "global_step": 275540, "epoch": 2277} {"train_loss": -33.74667739868164, "global_step": 275541, "epoch": 2277} {"train_loss": -39.849422454833984, "global_step": 275542, "epoch": 2277} {"train_loss": -39.29657745361328, "global_step": 275543, "epoch": 2277} {"train_loss": -39.88106155395508, "global_step": 275544, "epoch": 2277} {"train_loss": -37.988136291503906, "global_step": 275545, "epoch": 2277} {"train_loss": -36.86374282836914, "global_step": 275546, "epoch": 2277} {"train_loss": -41.24121856689453, "global_step": 275547, "epoch": 2277} {"train_loss": -40.4567985534668, "global_step": 275548, "epoch": 2277} {"train_loss": -40.130611419677734, "global_step": 275549, "epoch": 2277} {"train_loss": -40.21419906616211, "global_step": 275550, "epoch": 2277} {"train_loss": -40.97366714477539, "global_step": 275551, "epoch": 2277} {"train_loss": -40.5418701171875, "global_step": 275552, "epoch": 2277} {"train_loss": -40.95208740234375, "global_step": 275553, "epoch": 2277} {"train_loss": -37.44340133666992, "global_step": 275554, "epoch": 2277} {"train_loss": -38.52241516113281, "global_step": 275555, "epoch": 2277} {"train_loss": -37.400123596191406, "global_step": 275556, "epoch": 2277} {"train_loss": -36.89167404174805, "global_step": 275557, "epoch": 2277} {"train_loss": -41.843048095703125, "global_step": 275558, "epoch": 2277} {"train_loss": -41.36898422241211, "global_step": 275559, "epoch": 2277} {"train_loss": -40.86277389526367, "global_step": 275560, "epoch": 2277} {"train_loss": -40.91170120239258, "global_step": 275561, "epoch": 2277} {"train_loss": -39.5197868347168, "global_step": 275562, "epoch": 2277} {"train_loss": -39.33738327026367, "global_step": 275563, "epoch": 2277} {"train_loss": -39.906517028808594, "global_step": 275564, "epoch": 2277} {"train_loss": -41.01615905761719, "global_step": 275565, "epoch": 2277} {"train_loss": -41.35050582885742, "global_step": 275566, "epoch": 2277} {"train_loss": -41.59958267211914, "global_step": 275567, "epoch": 2277} {"train_loss": -41.265533447265625, "global_step": 275568, "epoch": 2277} {"train_loss": -40.27827453613281, "global_step": 275569, "epoch": 2277} {"train_loss": -40.57640075683594, "global_step": 275570, "epoch": 2277} {"train_loss": -40.20709228515625, "global_step": 275571, "epoch": 2277} {"train_loss": -40.0611457824707, "global_step": 275572, "epoch": 2277} {"train_loss": -41.533084869384766, "global_step": 275573, "epoch": 2277} {"train_loss": -42.15410232543945, "global_step": 275574, "epoch": 2277} {"train_loss": -41.06526565551758, "global_step": 275575, "epoch": 2277} {"train_loss": -41.1729621887207, "global_step": 275576, "epoch": 2277} {"train_loss": -41.606910705566406, "global_step": 275577, "epoch": 2277} {"train_loss": -38.808258056640625, "global_step": 275578, "epoch": 2277} {"train_loss": -41.72015380859375, "global_step": 275579, "epoch": 2277} {"train_loss": -42.054805755615234, "global_step": 275580, "epoch": 2277} {"train_loss": -40.50661849975586, "global_step": 275581, "epoch": 2277} {"train_loss": -41.49019241333008, "global_step": 275582, "epoch": 2277} {"train_loss": -42.2522087097168, "global_step": 275583, "epoch": 2277} {"train_loss": -42.664363861083984, "global_step": 275584, "epoch": 2277} {"train_loss": -41.83430862426758, "global_step": 275585, "epoch": 2277} {"train_loss": -41.88331985473633, "global_step": 275586, "epoch": 2277} {"train_loss": -40.694820404052734, "global_step": 275587, "epoch": 2277} {"train_loss": -42.027931213378906, "global_step": 275588, "epoch": 2277} {"train_loss": -42.626678466796875, "global_step": 275589, "epoch": 2277} {"train_loss": -42.30684280395508, "global_step": 275590, "epoch": 2277} {"train_loss": -40.501739501953125, "global_step": 275591, "epoch": 2277} {"train_loss": -40.37543487548828, "global_step": 275592, "epoch": 2277} {"train_loss": -41.05989074707031, "global_step": 275593, "epoch": 2277} {"train_loss": -42.495635986328125, "global_step": 275594, "epoch": 2277} {"train_loss": -42.607261657714844, "global_step": 275595, "epoch": 2277} {"train_loss": -40.87681198120117, "global_step": 275596, "epoch": 2277} {"train_loss": -42.49675750732422, "global_step": 275597, "epoch": 2277} {"train_loss": -42.417449951171875, "global_step": 275598, "epoch": 2277} {"train_loss": -42.40775680541992, "global_step": 275599, "epoch": 2277} {"train_loss": -42.833736419677734, "global_step": 275600, "epoch": 2277} {"train_loss": -40.39963150024414, "global_step": 275601, "epoch": 2277} {"train_loss": -40.87176513671875, "global_step": 275602, "epoch": 2277} {"train_loss": -42.55058670043945, "global_step": 275603, "epoch": 2277} {"train_loss": -40.67140579223633, "global_step": 275604, "epoch": 2277} {"train_loss": -41.920589447021484, "global_step": 275605, "epoch": 2277} {"train_loss": -40.42091369628906, "global_step": 275606, "epoch": 2277} {"train_loss": -40.837703704833984, "global_step": 275607, "epoch": 2277} {"train_loss": -42.7203483581543, "global_step": 275608, "epoch": 2277} {"train_loss": -42.9155158996582, "global_step": 275609, "epoch": 2277} {"train_loss": -41.68587875366211, "global_step": 275610, "epoch": 2277} {"train_loss": -42.999080657958984, "global_step": 275611, "epoch": 2277} {"train_loss": -42.56447982788086, "global_step": 275612, "epoch": 2277} {"train_loss": -41.29280090332031, "global_step": 275613, "epoch": 2277} {"train_loss": -41.36866760253906, "global_step": 275614, "epoch": 2277} {"train_loss": -42.63969802856445, "global_step": 275615, "epoch": 2277} {"train_loss": -41.810237884521484, "global_step": 275616, "epoch": 2277} {"train_loss": -42.00465774536133, "global_step": 275617, "epoch": 2277} {"train_loss": -42.36738204956055, "global_step": 275618, "epoch": 2277} {"train_loss": -42.830936431884766, "global_step": 275619, "epoch": 2277} {"train_loss": -42.1328010559082, "global_step": 275620, "epoch": 2277} {"train_loss": -43.15919876098633, "global_step": 275621, "epoch": 2277} {"train_loss": -42.72903060913086, "global_step": 275622, "epoch": 2277} {"train_loss": -42.347023010253906, "global_step": 275623, "epoch": 2277} {"train_loss": -42.74445343017578, "global_step": 275624, "epoch": 2277} {"train_loss": -42.86229705810547, "global_step": 275625, "epoch": 2277} {"train_loss": -42.541297912597656, "global_step": 275626, "epoch": 2277} {"train_loss": -42.91642379760742, "global_step": 275627, "epoch": 2277} {"train_loss": -42.147396087646484, "global_step": 275628, "epoch": 2277} {"train_loss": -42.49159622192383, "global_step": 275629, "epoch": 2277} {"train_loss": -42.9691047668457, "global_step": 275630, "epoch": 2277} {"train_loss": -43.06817626953125, "global_step": 275631, "epoch": 2277} {"train_loss": -42.56146240234375, "global_step": 275632, "epoch": 2277} {"train_loss": -42.183753967285156, "global_step": 275633, "epoch": 2277} {"train_loss": -41.63149642944336, "global_step": 275634, "epoch": 2277} {"train_loss": -42.24528884887695, "global_step": 275635, "epoch": 2277} {"train_loss": -43.07041549682617, "global_step": 275636, "epoch": 2277} {"train_loss": -41.03080196222983, "global_step": 275637, "epoch": 2277, "val_loss": 2713914.25} {"train_loss": -41.27277755737305, "global_step": 275638, "epoch": 2278} {"train_loss": -43.2023811340332, "global_step": 275639, "epoch": 2278} {"train_loss": -42.96628952026367, "global_step": 275640, "epoch": 2278} {"train_loss": -42.90919494628906, "global_step": 275641, "epoch": 2278} {"train_loss": -40.772125244140625, "global_step": 275642, "epoch": 2278} {"train_loss": -41.961036682128906, "global_step": 275643, "epoch": 2278} {"train_loss": -43.157135009765625, "global_step": 275644, "epoch": 2278} {"train_loss": -43.475830078125, "global_step": 275645, "epoch": 2278} {"train_loss": -42.6978645324707, "global_step": 275646, "epoch": 2278} {"train_loss": -43.42490768432617, "global_step": 275647, "epoch": 2278} {"train_loss": -43.13771057128906, "global_step": 275648, "epoch": 2278} {"train_loss": -43.11077117919922, "global_step": 275649, "epoch": 2278} {"train_loss": -42.3465576171875, "global_step": 275650, "epoch": 2278} {"train_loss": -43.51707077026367, "global_step": 275651, "epoch": 2278} {"train_loss": -42.77371597290039, "global_step": 275652, "epoch": 2278} {"train_loss": -42.716854095458984, "global_step": 275653, "epoch": 2278} {"train_loss": -42.606842041015625, "global_step": 275654, "epoch": 2278} {"train_loss": -43.09470748901367, "global_step": 275655, "epoch": 2278} {"train_loss": -42.72380065917969, "global_step": 275656, "epoch": 2278} {"train_loss": -42.991676330566406, "global_step": 275657, "epoch": 2278} {"train_loss": -42.93490219116211, "global_step": 275658, "epoch": 2278} {"train_loss": -43.082427978515625, "global_step": 275659, "epoch": 2278} {"train_loss": -42.88819122314453, "global_step": 275660, "epoch": 2278} {"train_loss": -43.15678787231445, "global_step": 275661, "epoch": 2278} {"train_loss": -42.12119674682617, "global_step": 275662, "epoch": 2278} {"train_loss": -42.90523910522461, "global_step": 275663, "epoch": 2278} {"train_loss": -42.64023208618164, "global_step": 275664, "epoch": 2278} {"train_loss": -42.516212463378906, "global_step": 275665, "epoch": 2278} {"train_loss": -43.35574722290039, "global_step": 275666, "epoch": 2278} {"train_loss": -43.60576248168945, "global_step": 275667, "epoch": 2278} {"train_loss": -43.54003143310547, "global_step": 275668, "epoch": 2278} {"train_loss": -42.77983474731445, "global_step": 275669, "epoch": 2278} {"train_loss": -43.1581916809082, "global_step": 275670, "epoch": 2278} {"train_loss": -43.70076370239258, "global_step": 275671, "epoch": 2278} {"train_loss": -43.210350036621094, "global_step": 275672, "epoch": 2278} {"train_loss": -43.23640060424805, "global_step": 275673, "epoch": 2278} {"train_loss": -43.291690826416016, "global_step": 275674, "epoch": 2278} {"train_loss": -43.52995681762695, "global_step": 275675, "epoch": 2278} {"train_loss": -43.7608528137207, "global_step": 275676, "epoch": 2278} {"train_loss": -43.5181770324707, "global_step": 275677, "epoch": 2278} {"train_loss": -42.665374755859375, "global_step": 275678, "epoch": 2278} {"train_loss": -42.28871154785156, "global_step": 275679, "epoch": 2278} {"train_loss": -42.299007415771484, "global_step": 275680, "epoch": 2278} {"train_loss": -41.93447494506836, "global_step": 275681, "epoch": 2278} {"train_loss": -43.22172546386719, "global_step": 275682, "epoch": 2278} {"train_loss": -43.19681167602539, "global_step": 275683, "epoch": 2278} {"train_loss": -42.55741500854492, "global_step": 275684, "epoch": 2278} {"train_loss": -41.920284271240234, "global_step": 275685, "epoch": 2278} {"train_loss": -42.34514236450195, "global_step": 275686, "epoch": 2278} {"train_loss": -43.230262756347656, "global_step": 275687, "epoch": 2278} {"train_loss": -41.9074592590332, "global_step": 275688, "epoch": 2278} {"train_loss": -41.7085075378418, "global_step": 275689, "epoch": 2278} {"train_loss": -41.229976654052734, "global_step": 275690, "epoch": 2278} {"train_loss": -41.72126770019531, "global_step": 275691, "epoch": 2278} {"train_loss": -41.85283279418945, "global_step": 275692, "epoch": 2278} {"train_loss": -42.475311279296875, "global_step": 275693, "epoch": 2278} {"train_loss": -41.82416534423828, "global_step": 275694, "epoch": 2278} {"train_loss": -42.77827453613281, "global_step": 275695, "epoch": 2278} {"train_loss": -42.64063262939453, "global_step": 275696, "epoch": 2278} {"train_loss": -43.16537094116211, "global_step": 275697, "epoch": 2278} {"train_loss": -39.98487091064453, "global_step": 275698, "epoch": 2278} {"train_loss": -42.62191390991211, "global_step": 275699, "epoch": 2278} {"train_loss": -42.586997985839844, "global_step": 275700, "epoch": 2278} {"train_loss": -43.660064697265625, "global_step": 275701, "epoch": 2278} {"train_loss": -42.814483642578125, "global_step": 275702, "epoch": 2278} {"train_loss": -42.3818359375, "global_step": 275703, "epoch": 2278} {"train_loss": -42.57297134399414, "global_step": 275704, "epoch": 2278} {"train_loss": -41.083370208740234, "global_step": 275705, "epoch": 2278} {"train_loss": -41.831966400146484, "global_step": 275706, "epoch": 2278} {"train_loss": -43.0774040222168, "global_step": 275707, "epoch": 2278} {"train_loss": -42.85146713256836, "global_step": 275708, "epoch": 2278} {"train_loss": -40.08748245239258, "global_step": 275709, "epoch": 2278} {"train_loss": -38.510719299316406, "global_step": 275710, "epoch": 2278} {"train_loss": -42.42963790893555, "global_step": 275711, "epoch": 2278} {"train_loss": -43.04843521118164, "global_step": 275712, "epoch": 2278} {"train_loss": -42.40913772583008, "global_step": 275713, "epoch": 2278} {"train_loss": -41.410465240478516, "global_step": 275714, "epoch": 2278} {"train_loss": -41.18776321411133, "global_step": 275715, "epoch": 2278} {"train_loss": -42.76752471923828, "global_step": 275716, "epoch": 2278} {"train_loss": -42.74789047241211, "global_step": 275717, "epoch": 2278} {"train_loss": -42.86344528198242, "global_step": 275718, "epoch": 2278} {"train_loss": -42.28169631958008, "global_step": 275719, "epoch": 2278} {"train_loss": -42.70774459838867, "global_step": 275720, "epoch": 2278} {"train_loss": -43.188663482666016, "global_step": 275721, "epoch": 2278} {"train_loss": -41.87029266357422, "global_step": 275722, "epoch": 2278} {"train_loss": -42.934410095214844, "global_step": 275723, "epoch": 2278} {"train_loss": -43.22127914428711, "global_step": 275724, "epoch": 2278} {"train_loss": -42.914337158203125, "global_step": 275725, "epoch": 2278} {"train_loss": -43.261226654052734, "global_step": 275726, "epoch": 2278} {"train_loss": -32.84014129638672, "global_step": 275727, "epoch": 2278} {"train_loss": -42.7019157409668, "global_step": 275728, "epoch": 2278} {"train_loss": -42.828365325927734, "global_step": 275729, "epoch": 2278} {"train_loss": -42.6772575378418, "global_step": 275730, "epoch": 2278} {"train_loss": -42.242469787597656, "global_step": 275731, "epoch": 2278} {"train_loss": -42.997314453125, "global_step": 275732, "epoch": 2278} {"train_loss": -36.32997512817383, "global_step": 275733, "epoch": 2278} {"train_loss": -39.920406341552734, "global_step": 275734, "epoch": 2278} {"train_loss": -42.76707077026367, "global_step": 275735, "epoch": 2278} {"train_loss": -40.8667106628418, "global_step": 275736, "epoch": 2278} {"train_loss": -39.95414352416992, "global_step": 275737, "epoch": 2278} {"train_loss": -42.6380729675293, "global_step": 275738, "epoch": 2278} {"train_loss": -41.40644073486328, "global_step": 275739, "epoch": 2278} {"train_loss": -42.29987716674805, "global_step": 275740, "epoch": 2278} {"train_loss": -42.1683235168457, "global_step": 275741, "epoch": 2278} {"train_loss": -41.43253707885742, "global_step": 275742, "epoch": 2278} {"train_loss": -42.91801071166992, "global_step": 275743, "epoch": 2278} {"train_loss": -41.92383575439453, "global_step": 275744, "epoch": 2278} {"train_loss": -42.845985412597656, "global_step": 275745, "epoch": 2278} {"train_loss": -42.4403190612793, "global_step": 275746, "epoch": 2278} {"train_loss": -41.53020095825195, "global_step": 275747, "epoch": 2278} {"train_loss": -41.51293182373047, "global_step": 275748, "epoch": 2278} {"train_loss": -42.57204055786133, "global_step": 275749, "epoch": 2278} {"train_loss": -42.59560012817383, "global_step": 275750, "epoch": 2278} {"train_loss": -41.93534469604492, "global_step": 275751, "epoch": 2278} {"train_loss": -42.7967643737793, "global_step": 275752, "epoch": 2278} {"train_loss": -42.47278594970703, "global_step": 275753, "epoch": 2278} {"train_loss": -42.1636962890625, "global_step": 275754, "epoch": 2278} {"train_loss": -23.08050537109375, "global_step": 275755, "epoch": 2278} {"train_loss": -41.89681625366211, "global_step": 275756, "epoch": 2278} {"train_loss": -36.9313850402832, "global_step": 275757, "epoch": 2278} {"train_loss": -42.13442904890076, "global_step": 275758, "epoch": 2278, "val_loss": 2612843.0} {"train_loss": -42.800537109375, "global_step": 275759, "epoch": 2279} {"train_loss": -42.449256896972656, "global_step": 275760, "epoch": 2279} {"train_loss": -41.977420806884766, "global_step": 275761, "epoch": 2279} {"train_loss": -41.521419525146484, "global_step": 275762, "epoch": 2279} {"train_loss": -40.05215072631836, "global_step": 275763, "epoch": 2279} {"train_loss": -35.667808532714844, "global_step": 275764, "epoch": 2279} {"train_loss": -33.96382522583008, "global_step": 275765, "epoch": 2279} {"train_loss": -34.726531982421875, "global_step": 275766, "epoch": 2279} {"train_loss": -41.84263229370117, "global_step": 275767, "epoch": 2279} {"train_loss": -40.10920333862305, "global_step": 275768, "epoch": 2279} {"train_loss": -41.86876678466797, "global_step": 275769, "epoch": 2279} {"train_loss": -40.537540435791016, "global_step": 275770, "epoch": 2279} {"train_loss": -41.016204833984375, "global_step": 275771, "epoch": 2279} {"train_loss": -42.146427154541016, "global_step": 275772, "epoch": 2279} {"train_loss": -38.19303512573242, "global_step": 275773, "epoch": 2279} {"train_loss": -41.79197311401367, "global_step": 275774, "epoch": 2279} {"train_loss": -41.554012298583984, "global_step": 275775, "epoch": 2279} {"train_loss": -40.37672805786133, "global_step": 275776, "epoch": 2279} {"train_loss": -40.219970703125, "global_step": 275777, "epoch": 2279} {"train_loss": -40.61277389526367, "global_step": 275778, "epoch": 2279} {"train_loss": -38.61777114868164, "global_step": 275779, "epoch": 2279} {"train_loss": -42.38639450073242, "global_step": 275780, "epoch": 2279} {"train_loss": -41.7307243347168, "global_step": 275781, "epoch": 2279} {"train_loss": -39.628448486328125, "global_step": 275782, "epoch": 2279} {"train_loss": -41.148067474365234, "global_step": 275783, "epoch": 2279} {"train_loss": -41.5952262878418, "global_step": 275784, "epoch": 2279} {"train_loss": -41.79714584350586, "global_step": 275785, "epoch": 2279} {"train_loss": -42.1544303894043, "global_step": 275786, "epoch": 2279} {"train_loss": -42.044918060302734, "global_step": 275787, "epoch": 2279} {"train_loss": -42.68895721435547, "global_step": 275788, "epoch": 2279} {"train_loss": -41.806129455566406, "global_step": 275789, "epoch": 2279} {"train_loss": -41.74445724487305, "global_step": 275790, "epoch": 2279} {"train_loss": -42.51477813720703, "global_step": 275791, "epoch": 2279} {"train_loss": -42.57419204711914, "global_step": 275792, "epoch": 2279} {"train_loss": -36.410335540771484, "global_step": 275793, "epoch": 2279} {"train_loss": -42.13813400268555, "global_step": 275794, "epoch": 2279} {"train_loss": -41.00111770629883, "global_step": 275795, "epoch": 2279} {"train_loss": -40.600502014160156, "global_step": 275796, "epoch": 2279} {"train_loss": -41.715248107910156, "global_step": 275797, "epoch": 2279} {"train_loss": -42.520015716552734, "global_step": 275798, "epoch": 2279} {"train_loss": -41.32065963745117, "global_step": 275799, "epoch": 2279} {"train_loss": -42.31057357788086, "global_step": 275800, "epoch": 2279} {"train_loss": -42.50373458862305, "global_step": 275801, "epoch": 2279} {"train_loss": -42.61942672729492, "global_step": 275802, "epoch": 2279} {"train_loss": -42.989505767822266, "global_step": 275803, "epoch": 2279} {"train_loss": -42.71436309814453, "global_step": 275804, "epoch": 2279} {"train_loss": -41.44185256958008, "global_step": 275805, "epoch": 2279} {"train_loss": -41.967681884765625, "global_step": 275806, "epoch": 2279} {"train_loss": -42.69124984741211, "global_step": 275807, "epoch": 2279} {"train_loss": -41.87784957885742, "global_step": 275808, "epoch": 2279} {"train_loss": -42.814720153808594, "global_step": 275809, "epoch": 2279} {"train_loss": -42.84077072143555, "global_step": 275810, "epoch": 2279} {"train_loss": -42.88015365600586, "global_step": 275811, "epoch": 2279} {"train_loss": -42.848567962646484, "global_step": 275812, "epoch": 2279} {"train_loss": -42.473690032958984, "global_step": 275813, "epoch": 2279} {"train_loss": -43.06476974487305, "global_step": 275814, "epoch": 2279} {"train_loss": -43.0942268371582, "global_step": 275815, "epoch": 2279} {"train_loss": -42.63855743408203, "global_step": 275816, "epoch": 2279} {"train_loss": -42.534088134765625, "global_step": 275817, "epoch": 2279} {"train_loss": -42.856380462646484, "global_step": 275818, "epoch": 2279} {"train_loss": -42.82464599609375, "global_step": 275819, "epoch": 2279} {"train_loss": -43.41048049926758, "global_step": 275820, "epoch": 2279} {"train_loss": -42.2314567565918, "global_step": 275821, "epoch": 2279} {"train_loss": -43.39021301269531, "global_step": 275822, "epoch": 2279} {"train_loss": -42.62395095825195, "global_step": 275823, "epoch": 2279} {"train_loss": -43.39260482788086, "global_step": 275824, "epoch": 2279} {"train_loss": -42.90455627441406, "global_step": 275825, "epoch": 2279} {"train_loss": -42.05027770996094, "global_step": 275826, "epoch": 2279} {"train_loss": -43.602596282958984, "global_step": 275827, "epoch": 2279} {"train_loss": -42.346248626708984, "global_step": 275828, "epoch": 2279} {"train_loss": -42.93809509277344, "global_step": 275829, "epoch": 2279} {"train_loss": -42.7939453125, "global_step": 275830, "epoch": 2279} {"train_loss": -43.04789352416992, "global_step": 275831, "epoch": 2279} {"train_loss": -43.23324203491211, "global_step": 275832, "epoch": 2279} {"train_loss": -43.418487548828125, "global_step": 275833, "epoch": 2279} {"train_loss": -42.6920280456543, "global_step": 275834, "epoch": 2279} {"train_loss": -42.89271926879883, "global_step": 275835, "epoch": 2279} {"train_loss": -42.94162368774414, "global_step": 275836, "epoch": 2279} {"train_loss": -40.604583740234375, "global_step": 275837, "epoch": 2279} {"train_loss": -40.832000732421875, "global_step": 275838, "epoch": 2279} {"train_loss": -43.50651550292969, "global_step": 275839, "epoch": 2279} {"train_loss": -43.28642272949219, "global_step": 275840, "epoch": 2279} {"train_loss": -43.45561599731445, "global_step": 275841, "epoch": 2279} {"train_loss": -43.01951217651367, "global_step": 275842, "epoch": 2279} {"train_loss": -43.34634017944336, "global_step": 275843, "epoch": 2279} {"train_loss": -43.62849044799805, "global_step": 275844, "epoch": 2279} {"train_loss": -41.85837936401367, "global_step": 275845, "epoch": 2279} {"train_loss": -42.885005950927734, "global_step": 275846, "epoch": 2279} {"train_loss": -43.080780029296875, "global_step": 275847, "epoch": 2279} {"train_loss": -43.380592346191406, "global_step": 275848, "epoch": 2279} {"train_loss": -43.11611557006836, "global_step": 275849, "epoch": 2279} {"train_loss": -41.68494415283203, "global_step": 275850, "epoch": 2279} {"train_loss": -43.34363555908203, "global_step": 275851, "epoch": 2279} {"train_loss": -43.08180618286133, "global_step": 275852, "epoch": 2279} {"train_loss": -42.346534729003906, "global_step": 275853, "epoch": 2279} {"train_loss": -43.74912643432617, "global_step": 275854, "epoch": 2279} {"train_loss": -43.088619232177734, "global_step": 275855, "epoch": 2279} {"train_loss": -42.626220703125, "global_step": 275856, "epoch": 2279} {"train_loss": -43.28688049316406, "global_step": 275857, "epoch": 2279} {"train_loss": -41.93463897705078, "global_step": 275858, "epoch": 2279} {"train_loss": -42.95325469970703, "global_step": 275859, "epoch": 2279} {"train_loss": -42.529815673828125, "global_step": 275860, "epoch": 2279} {"train_loss": -39.95470428466797, "global_step": 275861, "epoch": 2279} {"train_loss": -40.39443588256836, "global_step": 275862, "epoch": 2279} {"train_loss": -42.830970764160156, "global_step": 275863, "epoch": 2279} {"train_loss": -42.22306442260742, "global_step": 275864, "epoch": 2279} {"train_loss": -43.099342346191406, "global_step": 275865, "epoch": 2279} {"train_loss": -42.71219253540039, "global_step": 275866, "epoch": 2279} {"train_loss": -42.06747055053711, "global_step": 275867, "epoch": 2279} {"train_loss": -42.99492263793945, "global_step": 275868, "epoch": 2279} {"train_loss": -43.01274871826172, "global_step": 275869, "epoch": 2279} {"train_loss": -42.37765121459961, "global_step": 275870, "epoch": 2279} {"train_loss": -42.6072998046875, "global_step": 275871, "epoch": 2279} {"train_loss": -41.871429443359375, "global_step": 275872, "epoch": 2279} {"train_loss": -42.21824264526367, "global_step": 275873, "epoch": 2279} {"train_loss": -42.41535186767578, "global_step": 275874, "epoch": 2279} {"train_loss": -42.59292221069336, "global_step": 275875, "epoch": 2279} {"train_loss": -40.760982513427734, "global_step": 275876, "epoch": 2279} {"train_loss": -40.31855392456055, "global_step": 275877, "epoch": 2279} {"train_loss": -43.076534271240234, "global_step": 275878, "epoch": 2279} {"train_loss": -41.983734225438646, "global_step": 275879, "epoch": 2279, "val_loss": 2546682.25} {"train_loss": -41.79800033569336, "global_step": 275880, "epoch": 2280} {"train_loss": -41.48491287231445, "global_step": 275881, "epoch": 2280} {"train_loss": -42.686283111572266, "global_step": 275882, "epoch": 2280} {"train_loss": -41.36890411376953, "global_step": 275883, "epoch": 2280} {"train_loss": -40.50564193725586, "global_step": 275884, "epoch": 2280} {"train_loss": -41.179779052734375, "global_step": 275885, "epoch": 2280} {"train_loss": -41.28082275390625, "global_step": 275886, "epoch": 2280} {"train_loss": -41.14691162109375, "global_step": 275887, "epoch": 2280} {"train_loss": -39.7262077331543, "global_step": 275888, "epoch": 2280} {"train_loss": -40.79490280151367, "global_step": 275889, "epoch": 2280} {"train_loss": -42.96165084838867, "global_step": 275890, "epoch": 2280} {"train_loss": -40.043212890625, "global_step": 275891, "epoch": 2280} {"train_loss": -42.005348205566406, "global_step": 275892, "epoch": 2280} {"train_loss": -41.34565353393555, "global_step": 275893, "epoch": 2280} {"train_loss": -41.055763244628906, "global_step": 275894, "epoch": 2280} {"train_loss": -42.23175811767578, "global_step": 275895, "epoch": 2280} {"train_loss": -42.12660598754883, "global_step": 275896, "epoch": 2280} {"train_loss": -41.10270309448242, "global_step": 275897, "epoch": 2280} {"train_loss": -42.956268310546875, "global_step": 275898, "epoch": 2280} {"train_loss": -41.22832489013672, "global_step": 275899, "epoch": 2280} {"train_loss": -42.31092071533203, "global_step": 275900, "epoch": 2280} {"train_loss": -41.97092819213867, "global_step": 275901, "epoch": 2280} {"train_loss": -42.757503509521484, "global_step": 275902, "epoch": 2280} {"train_loss": -41.97001647949219, "global_step": 275903, "epoch": 2280} {"train_loss": -42.60628890991211, "global_step": 275904, "epoch": 2280} {"train_loss": -41.87757873535156, "global_step": 275905, "epoch": 2280} {"train_loss": -42.424102783203125, "global_step": 275906, "epoch": 2280} {"train_loss": -42.37211990356445, "global_step": 275907, "epoch": 2280} {"train_loss": -41.748260498046875, "global_step": 275908, "epoch": 2280} {"train_loss": -42.7104377746582, "global_step": 275909, "epoch": 2280} {"train_loss": -42.18931198120117, "global_step": 275910, "epoch": 2280} {"train_loss": -42.29582214355469, "global_step": 275911, "epoch": 2280} {"train_loss": -42.66667556762695, "global_step": 275912, "epoch": 2280} {"train_loss": -43.12527084350586, "global_step": 275913, "epoch": 2280} {"train_loss": -42.41081619262695, "global_step": 275914, "epoch": 2280} {"train_loss": -42.80604934692383, "global_step": 275915, "epoch": 2280} {"train_loss": -42.5766716003418, "global_step": 275916, "epoch": 2280} {"train_loss": -43.003929138183594, "global_step": 275917, "epoch": 2280} {"train_loss": -42.400856018066406, "global_step": 275918, "epoch": 2280} {"train_loss": -43.04249954223633, "global_step": 275919, "epoch": 2280} {"train_loss": -43.10758590698242, "global_step": 275920, "epoch": 2280} {"train_loss": -42.87733840942383, "global_step": 275921, "epoch": 2280} {"train_loss": -43.09197998046875, "global_step": 275922, "epoch": 2280} {"train_loss": -43.13336181640625, "global_step": 275923, "epoch": 2280} {"train_loss": -43.7647590637207, "global_step": 275924, "epoch": 2280} {"train_loss": -43.70262145996094, "global_step": 275925, "epoch": 2280} {"train_loss": -43.13522720336914, "global_step": 275926, "epoch": 2280} {"train_loss": -43.5936279296875, "global_step": 275927, "epoch": 2280} {"train_loss": -43.28261947631836, "global_step": 275928, "epoch": 2280} {"train_loss": -43.17320251464844, "global_step": 275929, "epoch": 2280} {"train_loss": -43.921382904052734, "global_step": 275930, "epoch": 2280} {"train_loss": -42.95711898803711, "global_step": 275931, "epoch": 2280} {"train_loss": -42.770259857177734, "global_step": 275932, "epoch": 2280} {"train_loss": -43.44344711303711, "global_step": 275933, "epoch": 2280} {"train_loss": -43.32817077636719, "global_step": 275934, "epoch": 2280} {"train_loss": -42.33448028564453, "global_step": 275935, "epoch": 2280} {"train_loss": -43.52033233642578, "global_step": 275936, "epoch": 2280} {"train_loss": -42.81370162963867, "global_step": 275937, "epoch": 2280} {"train_loss": -42.89739227294922, "global_step": 275938, "epoch": 2280} {"train_loss": -43.54049301147461, "global_step": 275939, "epoch": 2280} {"train_loss": -43.151119232177734, "global_step": 275940, "epoch": 2280} {"train_loss": -43.58340072631836, "global_step": 275941, "epoch": 2280} {"train_loss": -43.78107452392578, "global_step": 275942, "epoch": 2280} {"train_loss": -43.67808151245117, "global_step": 275943, "epoch": 2280} {"train_loss": -43.47080612182617, "global_step": 275944, "epoch": 2280} {"train_loss": -43.169036865234375, "global_step": 275945, "epoch": 2280} {"train_loss": -42.1390495300293, "global_step": 275946, "epoch": 2280} {"train_loss": -43.27395248413086, "global_step": 275947, "epoch": 2280} {"train_loss": -43.43429183959961, "global_step": 275948, "epoch": 2280} {"train_loss": -42.82054138183594, "global_step": 275949, "epoch": 2280} {"train_loss": -42.103267669677734, "global_step": 275950, "epoch": 2280} {"train_loss": -43.98031997680664, "global_step": 275951, "epoch": 2280} {"train_loss": -43.53443908691406, "global_step": 275952, "epoch": 2280} {"train_loss": -42.82489013671875, "global_step": 275953, "epoch": 2280} {"train_loss": -43.68568801879883, "global_step": 275954, "epoch": 2280} {"train_loss": -43.754425048828125, "global_step": 275955, "epoch": 2280} {"train_loss": -43.46405792236328, "global_step": 275956, "epoch": 2280} {"train_loss": -43.82916259765625, "global_step": 275957, "epoch": 2280} {"train_loss": -43.54059600830078, "global_step": 275958, "epoch": 2280} {"train_loss": -41.84774398803711, "global_step": 275959, "epoch": 2280} {"train_loss": -43.7370491027832, "global_step": 275960, "epoch": 2280} {"train_loss": -42.984962463378906, "global_step": 275961, "epoch": 2280} {"train_loss": -42.43707275390625, "global_step": 275962, "epoch": 2280} {"train_loss": -43.34368133544922, "global_step": 275963, "epoch": 2280} {"train_loss": -43.529598236083984, "global_step": 275964, "epoch": 2280} {"train_loss": -42.263919830322266, "global_step": 275965, "epoch": 2280} {"train_loss": -42.66021728515625, "global_step": 275966, "epoch": 2280} {"train_loss": -43.46647262573242, "global_step": 275967, "epoch": 2280} {"train_loss": -42.502235412597656, "global_step": 275968, "epoch": 2280} {"train_loss": -43.391170501708984, "global_step": 275969, "epoch": 2280} {"train_loss": -42.82542037963867, "global_step": 275970, "epoch": 2280} {"train_loss": -43.265316009521484, "global_step": 275971, "epoch": 2280} {"train_loss": -43.54166793823242, "global_step": 275972, "epoch": 2280} {"train_loss": -43.352256774902344, "global_step": 275973, "epoch": 2280} {"train_loss": -42.31000518798828, "global_step": 275974, "epoch": 2280} {"train_loss": -43.37852478027344, "global_step": 275975, "epoch": 2280} {"train_loss": -42.594783782958984, "global_step": 275976, "epoch": 2280} {"train_loss": -42.63785934448242, "global_step": 275977, "epoch": 2280} {"train_loss": -42.42926788330078, "global_step": 275978, "epoch": 2280} {"train_loss": -41.15862274169922, "global_step": 275979, "epoch": 2280} {"train_loss": -40.160125732421875, "global_step": 275980, "epoch": 2280} {"train_loss": -41.690452575683594, "global_step": 275981, "epoch": 2280} {"train_loss": -42.84376525878906, "global_step": 275982, "epoch": 2280} {"train_loss": -43.08340072631836, "global_step": 275983, "epoch": 2280} {"train_loss": -42.15377426147461, "global_step": 275984, "epoch": 2280} {"train_loss": -40.843692779541016, "global_step": 275985, "epoch": 2280} {"train_loss": -42.1780891418457, "global_step": 275986, "epoch": 2280} {"train_loss": -43.36939239501953, "global_step": 275987, "epoch": 2280} {"train_loss": -41.55949401855469, "global_step": 275988, "epoch": 2280} {"train_loss": -41.804561614990234, "global_step": 275989, "epoch": 2280} {"train_loss": -41.468994140625, "global_step": 275990, "epoch": 2280} {"train_loss": -42.01920700073242, "global_step": 275991, "epoch": 2280} {"train_loss": -41.80588912963867, "global_step": 275992, "epoch": 2280} {"train_loss": -42.757476806640625, "global_step": 275993, "epoch": 2280} {"train_loss": -42.10940170288086, "global_step": 275994, "epoch": 2280} {"train_loss": -42.23093032836914, "global_step": 275995, "epoch": 2280} {"train_loss": -42.25954818725586, "global_step": 275996, "epoch": 2280} {"train_loss": -43.16984176635742, "global_step": 275997, "epoch": 2280} {"train_loss": -41.96857833862305, "global_step": 275998, "epoch": 2280} {"train_loss": -41.52202606201172, "global_step": 275999, "epoch": 2280} {"train_loss": -42.55735403644152, "global_step": 276000, "epoch": 2280, "val_loss": 2586617.75} {"train_loss": -42.97675704956055, "global_step": 276001, "epoch": 2281} {"train_loss": -42.67616271972656, "global_step": 276002, "epoch": 2281} {"train_loss": -43.1294059753418, "global_step": 276003, "epoch": 2281} {"train_loss": -41.98026657104492, "global_step": 276004, "epoch": 2281} {"train_loss": -43.31985092163086, "global_step": 276005, "epoch": 2281} {"train_loss": -43.0418701171875, "global_step": 276006, "epoch": 2281} {"train_loss": -42.85376739501953, "global_step": 276007, "epoch": 2281} {"train_loss": -43.34147262573242, "global_step": 276008, "epoch": 2281} {"train_loss": -42.57380676269531, "global_step": 276009, "epoch": 2281} {"train_loss": -38.561885833740234, "global_step": 276010, "epoch": 2281} {"train_loss": -41.95351791381836, "global_step": 276011, "epoch": 2281} {"train_loss": -41.596981048583984, "global_step": 276012, "epoch": 2281} {"train_loss": -40.16305160522461, "global_step": 276013, "epoch": 2281} {"train_loss": -36.95283889770508, "global_step": 276014, "epoch": 2281} {"train_loss": -41.89207458496094, "global_step": 276015, "epoch": 2281} {"train_loss": -33.72983932495117, "global_step": 276016, "epoch": 2281} {"train_loss": -39.70670700073242, "global_step": 276017, "epoch": 2281} {"train_loss": -38.17737579345703, "global_step": 276018, "epoch": 2281} {"train_loss": -42.549922943115234, "global_step": 276019, "epoch": 2281} {"train_loss": -34.44895935058594, "global_step": 276020, "epoch": 2281} {"train_loss": -30.710758209228516, "global_step": 276021, "epoch": 2281} {"train_loss": -34.25384521484375, "global_step": 276022, "epoch": 2281} {"train_loss": -39.09474563598633, "global_step": 276023, "epoch": 2281} {"train_loss": -33.32452392578125, "global_step": 276024, "epoch": 2281} {"train_loss": -25.32676124572754, "global_step": 276025, "epoch": 2281} {"train_loss": -37.7382698059082, "global_step": 276026, "epoch": 2281} {"train_loss": -23.3183536529541, "global_step": 276027, "epoch": 2281} {"train_loss": -12.772323608398438, "global_step": 276028, "epoch": 2281} {"train_loss": -32.351654052734375, "global_step": 276029, "epoch": 2281} {"train_loss": -37.4306755065918, "global_step": 276030, "epoch": 2281} {"train_loss": -35.238155364990234, "global_step": 276031, "epoch": 2281} {"train_loss": -24.333494186401367, "global_step": 276032, "epoch": 2281} {"train_loss": -25.883726119995117, "global_step": 276033, "epoch": 2281} {"train_loss": -33.23220443725586, "global_step": 276034, "epoch": 2281} {"train_loss": -36.34027099609375, "global_step": 276035, "epoch": 2281} {"train_loss": -35.857200622558594, "global_step": 276036, "epoch": 2281} {"train_loss": -31.18121910095215, "global_step": 276037, "epoch": 2281} {"train_loss": -36.594459533691406, "global_step": 276038, "epoch": 2281} {"train_loss": -34.804176330566406, "global_step": 276039, "epoch": 2281} {"train_loss": -35.49192810058594, "global_step": 276040, "epoch": 2281} {"train_loss": -34.81339645385742, "global_step": 276041, "epoch": 2281} {"train_loss": -32.75642013549805, "global_step": 276042, "epoch": 2281} {"train_loss": -33.08953094482422, "global_step": 276043, "epoch": 2281} {"train_loss": -36.59727096557617, "global_step": 276044, "epoch": 2281} {"train_loss": -35.919769287109375, "global_step": 276045, "epoch": 2281} {"train_loss": -36.0966911315918, "global_step": 276046, "epoch": 2281} {"train_loss": -36.835411071777344, "global_step": 276047, "epoch": 2281} {"train_loss": -37.07755661010742, "global_step": 276048, "epoch": 2281} {"train_loss": -38.36902618408203, "global_step": 276049, "epoch": 2281} {"train_loss": -37.39897537231445, "global_step": 276050, "epoch": 2281} {"train_loss": -36.1793327331543, "global_step": 276051, "epoch": 2281} {"train_loss": -38.49002456665039, "global_step": 276052, "epoch": 2281} {"train_loss": -36.47895050048828, "global_step": 276053, "epoch": 2281} {"train_loss": -38.34016418457031, "global_step": 276054, "epoch": 2281} {"train_loss": -36.8303108215332, "global_step": 276055, "epoch": 2281} {"train_loss": -37.176204681396484, "global_step": 276056, "epoch": 2281} {"train_loss": -39.15481948852539, "global_step": 276057, "epoch": 2281} {"train_loss": -39.00368881225586, "global_step": 276058, "epoch": 2281} {"train_loss": -38.8473014831543, "global_step": 276059, "epoch": 2281} {"train_loss": -37.736305236816406, "global_step": 276060, "epoch": 2281} {"train_loss": -38.7912483215332, "global_step": 276061, "epoch": 2281} {"train_loss": -37.76764678955078, "global_step": 276062, "epoch": 2281} {"train_loss": -37.416961669921875, "global_step": 276063, "epoch": 2281} {"train_loss": -38.6710205078125, "global_step": 276064, "epoch": 2281} {"train_loss": -38.485713958740234, "global_step": 276065, "epoch": 2281} {"train_loss": -39.05746078491211, "global_step": 276066, "epoch": 2281} {"train_loss": -39.49637985229492, "global_step": 276067, "epoch": 2281} {"train_loss": -38.58649826049805, "global_step": 276068, "epoch": 2281} {"train_loss": -39.55449676513672, "global_step": 276069, "epoch": 2281} {"train_loss": -39.561767578125, "global_step": 276070, "epoch": 2281} {"train_loss": -38.5482292175293, "global_step": 276071, "epoch": 2281} {"train_loss": -39.436004638671875, "global_step": 276072, "epoch": 2281} {"train_loss": -40.14679718017578, "global_step": 276073, "epoch": 2281} {"train_loss": -39.8489875793457, "global_step": 276074, "epoch": 2281} {"train_loss": -39.512046813964844, "global_step": 276075, "epoch": 2281} {"train_loss": -39.3921012878418, "global_step": 276076, "epoch": 2281} {"train_loss": -40.0065803527832, "global_step": 276077, "epoch": 2281} {"train_loss": -39.4189453125, "global_step": 276078, "epoch": 2281} {"train_loss": -40.86113357543945, "global_step": 276079, "epoch": 2281} {"train_loss": -38.3108024597168, "global_step": 276080, "epoch": 2281} {"train_loss": -40.22916030883789, "global_step": 276081, "epoch": 2281} {"train_loss": -39.58564376831055, "global_step": 276082, "epoch": 2281} {"train_loss": -39.55146408081055, "global_step": 276083, "epoch": 2281} {"train_loss": -39.39101791381836, "global_step": 276084, "epoch": 2281} {"train_loss": -38.804073333740234, "global_step": 276085, "epoch": 2281} {"train_loss": -39.83833312988281, "global_step": 276086, "epoch": 2281} {"train_loss": -39.76545333862305, "global_step": 276087, "epoch": 2281} {"train_loss": -40.154640197753906, "global_step": 276088, "epoch": 2281} {"train_loss": -40.32971954345703, "global_step": 276089, "epoch": 2281} {"train_loss": -40.6718864440918, "global_step": 276090, "epoch": 2281} {"train_loss": -39.91079330444336, "global_step": 276091, "epoch": 2281} {"train_loss": -40.45685577392578, "global_step": 276092, "epoch": 2281} {"train_loss": -39.36389923095703, "global_step": 276093, "epoch": 2281} {"train_loss": -39.73610305786133, "global_step": 276094, "epoch": 2281} {"train_loss": -39.65290069580078, "global_step": 276095, "epoch": 2281} {"train_loss": -40.14871597290039, "global_step": 276096, "epoch": 2281} {"train_loss": -40.334625244140625, "global_step": 276097, "epoch": 2281} {"train_loss": -39.9735107421875, "global_step": 276098, "epoch": 2281} {"train_loss": -40.18586349487305, "global_step": 276099, "epoch": 2281} {"train_loss": -41.03252029418945, "global_step": 276100, "epoch": 2281} {"train_loss": -40.54161834716797, "global_step": 276101, "epoch": 2281} {"train_loss": -40.711238861083984, "global_step": 276102, "epoch": 2281} {"train_loss": -40.58650588989258, "global_step": 276103, "epoch": 2281} {"train_loss": -40.412654876708984, "global_step": 276104, "epoch": 2281} {"train_loss": -41.2251091003418, "global_step": 276105, "epoch": 2281} {"train_loss": -40.72877502441406, "global_step": 276106, "epoch": 2281} {"train_loss": -40.51963806152344, "global_step": 276107, "epoch": 2281} {"train_loss": -40.658050537109375, "global_step": 276108, "epoch": 2281} {"train_loss": -39.5156364440918, "global_step": 276109, "epoch": 2281} {"train_loss": -40.391029357910156, "global_step": 276110, "epoch": 2281} {"train_loss": -41.15359115600586, "global_step": 276111, "epoch": 2281} {"train_loss": -41.32500457763672, "global_step": 276112, "epoch": 2281} {"train_loss": -41.10053253173828, "global_step": 276113, "epoch": 2281} {"train_loss": -42.25698471069336, "global_step": 276114, "epoch": 2281} {"train_loss": -41.31001663208008, "global_step": 276115, "epoch": 2281} {"train_loss": -41.105648040771484, "global_step": 276116, "epoch": 2281} {"train_loss": -41.557796478271484, "global_step": 276117, "epoch": 2281} {"train_loss": -41.069549560546875, "global_step": 276118, "epoch": 2281} {"train_loss": -41.843414306640625, "global_step": 276119, "epoch": 2281} {"train_loss": -41.4328727722168, "global_step": 276120, "epoch": 2281} {"train_loss": -38.27543266548598, "global_step": 276121, "epoch": 2281, "val_loss": 2522319.75} {"train_loss": -40.92110061645508, "global_step": 276122, "epoch": 2282} {"train_loss": -41.11829376220703, "global_step": 276123, "epoch": 2282} {"train_loss": -42.17021560668945, "global_step": 276124, "epoch": 2282} {"train_loss": -42.00681686401367, "global_step": 276125, "epoch": 2282} {"train_loss": -41.75778579711914, "global_step": 276126, "epoch": 2282} {"train_loss": -42.3156623840332, "global_step": 276127, "epoch": 2282} {"train_loss": -41.462432861328125, "global_step": 276128, "epoch": 2282} {"train_loss": -41.626304626464844, "global_step": 276129, "epoch": 2282} {"train_loss": -41.559539794921875, "global_step": 276130, "epoch": 2282} {"train_loss": -41.976280212402344, "global_step": 276131, "epoch": 2282} {"train_loss": -40.97297668457031, "global_step": 276132, "epoch": 2282} {"train_loss": -41.177581787109375, "global_step": 276133, "epoch": 2282} {"train_loss": -41.829776763916016, "global_step": 276134, "epoch": 2282} {"train_loss": -41.266719818115234, "global_step": 276135, "epoch": 2282} {"train_loss": -41.32645797729492, "global_step": 276136, "epoch": 2282} {"train_loss": -41.4506950378418, "global_step": 276137, "epoch": 2282} {"train_loss": -41.73579025268555, "global_step": 276138, "epoch": 2282} {"train_loss": -42.20176315307617, "global_step": 276139, "epoch": 2282} {"train_loss": -41.86214065551758, "global_step": 276140, "epoch": 2282} {"train_loss": -42.48385238647461, "global_step": 276141, "epoch": 2282} {"train_loss": -42.09773635864258, "global_step": 276142, "epoch": 2282} {"train_loss": -42.240875244140625, "global_step": 276143, "epoch": 2282} {"train_loss": -41.5643196105957, "global_step": 276144, "epoch": 2282} {"train_loss": -41.74272537231445, "global_step": 276145, "epoch": 2282} {"train_loss": -41.68962478637695, "global_step": 276146, "epoch": 2282} {"train_loss": -42.382816314697266, "global_step": 276147, "epoch": 2282} {"train_loss": -42.100223541259766, "global_step": 276148, "epoch": 2282} {"train_loss": -42.706878662109375, "global_step": 276149, "epoch": 2282} {"train_loss": -42.157981872558594, "global_step": 276150, "epoch": 2282} {"train_loss": -41.923946380615234, "global_step": 276151, "epoch": 2282} {"train_loss": -42.74896240234375, "global_step": 276152, "epoch": 2282} {"train_loss": -42.06174087524414, "global_step": 276153, "epoch": 2282} {"train_loss": -42.2320671081543, "global_step": 276154, "epoch": 2282} {"train_loss": -42.74092102050781, "global_step": 276155, "epoch": 2282} {"train_loss": -42.33911895751953, "global_step": 276156, "epoch": 2282} {"train_loss": -42.3879508972168, "global_step": 276157, "epoch": 2282} {"train_loss": -42.913394927978516, "global_step": 276158, "epoch": 2282} {"train_loss": -42.118534088134766, "global_step": 276159, "epoch": 2282} {"train_loss": -41.50666046142578, "global_step": 276160, "epoch": 2282} {"train_loss": -42.476600646972656, "global_step": 276161, "epoch": 2282} {"train_loss": -42.182186126708984, "global_step": 276162, "epoch": 2282} {"train_loss": -42.25035858154297, "global_step": 276163, "epoch": 2282} {"train_loss": -42.691993713378906, "global_step": 276164, "epoch": 2282} {"train_loss": -41.98749923706055, "global_step": 276165, "epoch": 2282} {"train_loss": -42.286659240722656, "global_step": 276166, "epoch": 2282} {"train_loss": -42.5047721862793, "global_step": 276167, "epoch": 2282} {"train_loss": -42.10211944580078, "global_step": 276168, "epoch": 2282} {"train_loss": -42.02100372314453, "global_step": 276169, "epoch": 2282} {"train_loss": -42.23484420776367, "global_step": 276170, "epoch": 2282} {"train_loss": -42.02628707885742, "global_step": 276171, "epoch": 2282} {"train_loss": -42.425724029541016, "global_step": 276172, "epoch": 2282} {"train_loss": -42.874412536621094, "global_step": 276173, "epoch": 2282} {"train_loss": -42.55207443237305, "global_step": 276174, "epoch": 2282} {"train_loss": -42.013851165771484, "global_step": 276175, "epoch": 2282} {"train_loss": -42.519840240478516, "global_step": 276176, "epoch": 2282} {"train_loss": -43.206661224365234, "global_step": 276177, "epoch": 2282} {"train_loss": -41.72515869140625, "global_step": 276178, "epoch": 2282} {"train_loss": -41.71660232543945, "global_step": 276179, "epoch": 2282} {"train_loss": -42.66853332519531, "global_step": 276180, "epoch": 2282} {"train_loss": -41.88264465332031, "global_step": 276181, "epoch": 2282} {"train_loss": -42.873695373535156, "global_step": 276182, "epoch": 2282} {"train_loss": -42.566802978515625, "global_step": 276183, "epoch": 2282} {"train_loss": -42.13480758666992, "global_step": 276184, "epoch": 2282} {"train_loss": -41.810699462890625, "global_step": 276185, "epoch": 2282} {"train_loss": -42.34193420410156, "global_step": 276186, "epoch": 2282} {"train_loss": -42.34081268310547, "global_step": 276187, "epoch": 2282} {"train_loss": -42.402950286865234, "global_step": 276188, "epoch": 2282} {"train_loss": -41.365657806396484, "global_step": 276189, "epoch": 2282} {"train_loss": -42.651981353759766, "global_step": 276190, "epoch": 2282} {"train_loss": -42.724891662597656, "global_step": 276191, "epoch": 2282} {"train_loss": -41.3763427734375, "global_step": 276192, "epoch": 2282} {"train_loss": -42.4919319152832, "global_step": 276193, "epoch": 2282} {"train_loss": -41.96120834350586, "global_step": 276194, "epoch": 2282} {"train_loss": -42.243865966796875, "global_step": 276195, "epoch": 2282} {"train_loss": -42.910823822021484, "global_step": 276196, "epoch": 2282} {"train_loss": -42.645660400390625, "global_step": 276197, "epoch": 2282} {"train_loss": -42.201656341552734, "global_step": 276198, "epoch": 2282} {"train_loss": -41.77967071533203, "global_step": 276199, "epoch": 2282} {"train_loss": -43.00759506225586, "global_step": 276200, "epoch": 2282} {"train_loss": -42.19139099121094, "global_step": 276201, "epoch": 2282} {"train_loss": -40.97904586791992, "global_step": 276202, "epoch": 2282} {"train_loss": -42.390724182128906, "global_step": 276203, "epoch": 2282} {"train_loss": -42.59858703613281, "global_step": 276204, "epoch": 2282} {"train_loss": -42.67976379394531, "global_step": 276205, "epoch": 2282} {"train_loss": -43.23934555053711, "global_step": 276206, "epoch": 2282} {"train_loss": -42.903289794921875, "global_step": 276207, "epoch": 2282} {"train_loss": -42.02736282348633, "global_step": 276208, "epoch": 2282} {"train_loss": -41.13369369506836, "global_step": 276209, "epoch": 2282} {"train_loss": -39.88532257080078, "global_step": 276210, "epoch": 2282} {"train_loss": -39.17842483520508, "global_step": 276211, "epoch": 2282} {"train_loss": -39.7092399597168, "global_step": 276212, "epoch": 2282} {"train_loss": -40.6017951965332, "global_step": 276213, "epoch": 2282} {"train_loss": -41.37532424926758, "global_step": 276214, "epoch": 2282} {"train_loss": -40.75513458251953, "global_step": 276215, "epoch": 2282} {"train_loss": -42.397945404052734, "global_step": 276216, "epoch": 2282} {"train_loss": -41.19622802734375, "global_step": 276217, "epoch": 2282} {"train_loss": -41.848575592041016, "global_step": 276218, "epoch": 2282} {"train_loss": -42.02474594116211, "global_step": 276219, "epoch": 2282} {"train_loss": -41.21710205078125, "global_step": 276220, "epoch": 2282} {"train_loss": -41.84992218017578, "global_step": 276221, "epoch": 2282} {"train_loss": -40.25153732299805, "global_step": 276222, "epoch": 2282} {"train_loss": -42.16876983642578, "global_step": 276223, "epoch": 2282} {"train_loss": -40.25908279418945, "global_step": 276224, "epoch": 2282} {"train_loss": -40.8194694519043, "global_step": 276225, "epoch": 2282} {"train_loss": -41.27192687988281, "global_step": 276226, "epoch": 2282} {"train_loss": -39.74050521850586, "global_step": 276227, "epoch": 2282} {"train_loss": -41.65554428100586, "global_step": 276228, "epoch": 2282} {"train_loss": -38.453033447265625, "global_step": 276229, "epoch": 2282} {"train_loss": -41.48286819458008, "global_step": 276230, "epoch": 2282} {"train_loss": -39.379615783691406, "global_step": 276231, "epoch": 2282} {"train_loss": -39.64065170288086, "global_step": 276232, "epoch": 2282} {"train_loss": -38.45645523071289, "global_step": 276233, "epoch": 2282} {"train_loss": -40.76035690307617, "global_step": 276234, "epoch": 2282} {"train_loss": -39.29864501953125, "global_step": 276235, "epoch": 2282} {"train_loss": -33.54154586791992, "global_step": 276236, "epoch": 2282} {"train_loss": -36.013404846191406, "global_step": 276237, "epoch": 2282} {"train_loss": -37.02384567260742, "global_step": 276238, "epoch": 2282} {"train_loss": -38.215171813964844, "global_step": 276239, "epoch": 2282} {"train_loss": -32.94279098510742, "global_step": 276240, "epoch": 2282} {"train_loss": -39.23391342163086, "global_step": 276241, "epoch": 2282} {"train_loss": -41.40962804053441, "global_step": 276242, "epoch": 2282, "val_loss": 2679539.5} {"train_loss": -39.68949508666992, "global_step": 276243, "epoch": 2283} {"train_loss": -30.4532527923584, "global_step": 276244, "epoch": 2283} {"train_loss": -40.3974609375, "global_step": 276245, "epoch": 2283} {"train_loss": -34.5053596496582, "global_step": 276246, "epoch": 2283} {"train_loss": -35.32991027832031, "global_step": 276247, "epoch": 2283} {"train_loss": -40.13473129272461, "global_step": 276248, "epoch": 2283} {"train_loss": -38.298675537109375, "global_step": 276249, "epoch": 2283} {"train_loss": -38.67766571044922, "global_step": 276250, "epoch": 2283} {"train_loss": -40.54978561401367, "global_step": 276251, "epoch": 2283} {"train_loss": -39.286659240722656, "global_step": 276252, "epoch": 2283} {"train_loss": -40.257381439208984, "global_step": 276253, "epoch": 2283} {"train_loss": -40.582611083984375, "global_step": 276254, "epoch": 2283} {"train_loss": -39.271461486816406, "global_step": 276255, "epoch": 2283} {"train_loss": -40.314083099365234, "global_step": 276256, "epoch": 2283} {"train_loss": -40.20821762084961, "global_step": 276257, "epoch": 2283} {"train_loss": -41.055850982666016, "global_step": 276258, "epoch": 2283} {"train_loss": -41.056793212890625, "global_step": 276259, "epoch": 2283} {"train_loss": -41.077728271484375, "global_step": 276260, "epoch": 2283} {"train_loss": -40.311946868896484, "global_step": 276261, "epoch": 2283} {"train_loss": -41.197288513183594, "global_step": 276262, "epoch": 2283} {"train_loss": -40.89296340942383, "global_step": 276263, "epoch": 2283} {"train_loss": -41.63544845581055, "global_step": 276264, "epoch": 2283} {"train_loss": -40.61284255981445, "global_step": 276265, "epoch": 2283} {"train_loss": -41.4820671081543, "global_step": 276266, "epoch": 2283} {"train_loss": -41.26879119873047, "global_step": 276267, "epoch": 2283} {"train_loss": -41.168453216552734, "global_step": 276268, "epoch": 2283} {"train_loss": -41.4548454284668, "global_step": 276269, "epoch": 2283} {"train_loss": -42.5560302734375, "global_step": 276270, "epoch": 2283} {"train_loss": -42.02042770385742, "global_step": 276271, "epoch": 2283} {"train_loss": -41.8486442565918, "global_step": 276272, "epoch": 2283} {"train_loss": -41.09368896484375, "global_step": 276273, "epoch": 2283} {"train_loss": -42.31416702270508, "global_step": 276274, "epoch": 2283} {"train_loss": -41.42042922973633, "global_step": 276275, "epoch": 2283} {"train_loss": -41.78205490112305, "global_step": 276276, "epoch": 2283} {"train_loss": -42.01616668701172, "global_step": 276277, "epoch": 2283} {"train_loss": -42.37245559692383, "global_step": 276278, "epoch": 2283} {"train_loss": -42.390628814697266, "global_step": 276279, "epoch": 2283} {"train_loss": -41.61244583129883, "global_step": 276280, "epoch": 2283} {"train_loss": -42.132110595703125, "global_step": 276281, "epoch": 2283} {"train_loss": -42.21854782104492, "global_step": 276282, "epoch": 2283} {"train_loss": -42.421939849853516, "global_step": 276283, "epoch": 2283} {"train_loss": -42.45507049560547, "global_step": 276284, "epoch": 2283} {"train_loss": -42.21804428100586, "global_step": 276285, "epoch": 2283} {"train_loss": -41.9207878112793, "global_step": 276286, "epoch": 2283} {"train_loss": -42.33896255493164, "global_step": 276287, "epoch": 2283} {"train_loss": -42.68239974975586, "global_step": 276288, "epoch": 2283} {"train_loss": -42.591339111328125, "global_step": 276289, "epoch": 2283} {"train_loss": -42.83344650268555, "global_step": 276290, "epoch": 2283} {"train_loss": -42.49043655395508, "global_step": 276291, "epoch": 2283} {"train_loss": -42.454811096191406, "global_step": 276292, "epoch": 2283} {"train_loss": -42.941776275634766, "global_step": 276293, "epoch": 2283} {"train_loss": -42.975379943847656, "global_step": 276294, "epoch": 2283} {"train_loss": -42.64237594604492, "global_step": 276295, "epoch": 2283} {"train_loss": -42.943031311035156, "global_step": 276296, "epoch": 2283} {"train_loss": -42.583213806152344, "global_step": 276297, "epoch": 2283} {"train_loss": -42.416778564453125, "global_step": 276298, "epoch": 2283} {"train_loss": -43.0954704284668, "global_step": 276299, "epoch": 2283} {"train_loss": -42.91733169555664, "global_step": 276300, "epoch": 2283} {"train_loss": -42.77242660522461, "global_step": 276301, "epoch": 2283} {"train_loss": -43.14480972290039, "global_step": 276302, "epoch": 2283} {"train_loss": -42.95859146118164, "global_step": 276303, "epoch": 2283} {"train_loss": -43.3175048828125, "global_step": 276304, "epoch": 2283} {"train_loss": -43.436920166015625, "global_step": 276305, "epoch": 2283} {"train_loss": -43.08704376220703, "global_step": 276306, "epoch": 2283} {"train_loss": -43.02374267578125, "global_step": 276307, "epoch": 2283} {"train_loss": -42.74186325073242, "global_step": 276308, "epoch": 2283} {"train_loss": -43.113128662109375, "global_step": 276309, "epoch": 2283} {"train_loss": -43.3910026550293, "global_step": 276310, "epoch": 2283} {"train_loss": -42.680965423583984, "global_step": 276311, "epoch": 2283} {"train_loss": -43.27989959716797, "global_step": 276312, "epoch": 2283} {"train_loss": -42.77748489379883, "global_step": 276313, "epoch": 2283} {"train_loss": -43.430355072021484, "global_step": 276314, "epoch": 2283} {"train_loss": -43.01042556762695, "global_step": 276315, "epoch": 2283} {"train_loss": -42.78330612182617, "global_step": 276316, "epoch": 2283} {"train_loss": -42.86783981323242, "global_step": 276317, "epoch": 2283} {"train_loss": -43.53495788574219, "global_step": 276318, "epoch": 2283} {"train_loss": -42.74587631225586, "global_step": 276319, "epoch": 2283} {"train_loss": -43.08861541748047, "global_step": 276320, "epoch": 2283} {"train_loss": -43.492427825927734, "global_step": 276321, "epoch": 2283} {"train_loss": -43.231781005859375, "global_step": 276322, "epoch": 2283} {"train_loss": -42.677093505859375, "global_step": 276323, "epoch": 2283} {"train_loss": -44.05844497680664, "global_step": 276324, "epoch": 2283} {"train_loss": -43.261962890625, "global_step": 276325, "epoch": 2283} {"train_loss": -43.14876174926758, "global_step": 276326, "epoch": 2283} {"train_loss": -42.19937515258789, "global_step": 276327, "epoch": 2283} {"train_loss": -43.274566650390625, "global_step": 276328, "epoch": 2283} {"train_loss": -43.83995056152344, "global_step": 276329, "epoch": 2283} {"train_loss": -42.46193313598633, "global_step": 276330, "epoch": 2283} {"train_loss": -41.41437530517578, "global_step": 276331, "epoch": 2283} {"train_loss": -43.44062042236328, "global_step": 276332, "epoch": 2283} {"train_loss": -42.921180725097656, "global_step": 276333, "epoch": 2283} {"train_loss": -42.911537170410156, "global_step": 276334, "epoch": 2283} {"train_loss": -41.900020599365234, "global_step": 276335, "epoch": 2283} {"train_loss": -42.75053024291992, "global_step": 276336, "epoch": 2283} {"train_loss": -43.14076614379883, "global_step": 276337, "epoch": 2283} {"train_loss": -42.13611602783203, "global_step": 276338, "epoch": 2283} {"train_loss": -41.596675872802734, "global_step": 276339, "epoch": 2283} {"train_loss": -39.284454345703125, "global_step": 276340, "epoch": 2283} {"train_loss": -37.430999755859375, "global_step": 276341, "epoch": 2283} {"train_loss": -37.008155822753906, "global_step": 276342, "epoch": 2283} {"train_loss": -37.49800491333008, "global_step": 276343, "epoch": 2283} {"train_loss": -38.61323165893555, "global_step": 276344, "epoch": 2283} {"train_loss": -41.20785140991211, "global_step": 276345, "epoch": 2283} {"train_loss": -42.30180358886719, "global_step": 276346, "epoch": 2283} {"train_loss": -39.9261360168457, "global_step": 276347, "epoch": 2283} {"train_loss": -41.42384719848633, "global_step": 276348, "epoch": 2283} {"train_loss": -40.1268310546875, "global_step": 276349, "epoch": 2283} {"train_loss": -40.15981674194336, "global_step": 276350, "epoch": 2283} {"train_loss": -41.91162872314453, "global_step": 276351, "epoch": 2283} {"train_loss": -41.51811218261719, "global_step": 276352, "epoch": 2283} {"train_loss": -41.22865295410156, "global_step": 276353, "epoch": 2283} {"train_loss": -40.99921417236328, "global_step": 276354, "epoch": 2283} {"train_loss": -40.973060607910156, "global_step": 276355, "epoch": 2283} {"train_loss": -41.88978958129883, "global_step": 276356, "epoch": 2283} {"train_loss": -41.28799819946289, "global_step": 276357, "epoch": 2283} {"train_loss": -41.568355560302734, "global_step": 276358, "epoch": 2283} {"train_loss": -40.88067626953125, "global_step": 276359, "epoch": 2283} {"train_loss": -40.9030647277832, "global_step": 276360, "epoch": 2283} {"train_loss": -39.372676849365234, "global_step": 276361, "epoch": 2283} {"train_loss": -42.04812240600586, "global_step": 276362, "epoch": 2283} {"train_loss": -41.56445001964727, "global_step": 276363, "epoch": 2283, "val_loss": 2575962.75} {"train_loss": -40.88043975830078, "global_step": 276364, "epoch": 2284} {"train_loss": -40.85907745361328, "global_step": 276365, "epoch": 2284} {"train_loss": -41.48033142089844, "global_step": 276366, "epoch": 2284} {"train_loss": -41.21095275878906, "global_step": 276367, "epoch": 2284} {"train_loss": -41.5138053894043, "global_step": 276368, "epoch": 2284} {"train_loss": -40.58285903930664, "global_step": 276369, "epoch": 2284} {"train_loss": -42.47367477416992, "global_step": 276370, "epoch": 2284} {"train_loss": -41.6217041015625, "global_step": 276371, "epoch": 2284} {"train_loss": -41.52946472167969, "global_step": 276372, "epoch": 2284} {"train_loss": -41.891883850097656, "global_step": 276373, "epoch": 2284} {"train_loss": -40.73863220214844, "global_step": 276374, "epoch": 2284} {"train_loss": -41.271148681640625, "global_step": 276375, "epoch": 2284} {"train_loss": -41.349571228027344, "global_step": 276376, "epoch": 2284} {"train_loss": -40.97844314575195, "global_step": 276377, "epoch": 2284} {"train_loss": -41.51091384887695, "global_step": 276378, "epoch": 2284} {"train_loss": -41.312347412109375, "global_step": 276379, "epoch": 2284} {"train_loss": -41.54243087768555, "global_step": 276380, "epoch": 2284} {"train_loss": -42.05341339111328, "global_step": 276381, "epoch": 2284} {"train_loss": -41.222747802734375, "global_step": 276382, "epoch": 2284} {"train_loss": -40.980106353759766, "global_step": 276383, "epoch": 2284} {"train_loss": -40.7149658203125, "global_step": 276384, "epoch": 2284} {"train_loss": -41.254329681396484, "global_step": 276385, "epoch": 2284} {"train_loss": -41.044281005859375, "global_step": 276386, "epoch": 2284} {"train_loss": -41.59088134765625, "global_step": 276387, "epoch": 2284} {"train_loss": -41.10162353515625, "global_step": 276388, "epoch": 2284} {"train_loss": -41.73590087890625, "global_step": 276389, "epoch": 2284} {"train_loss": -42.30414581298828, "global_step": 276390, "epoch": 2284} {"train_loss": -41.26901626586914, "global_step": 276391, "epoch": 2284} {"train_loss": -42.798274993896484, "global_step": 276392, "epoch": 2284} {"train_loss": -37.685157775878906, "global_step": 276393, "epoch": 2284} {"train_loss": -42.359031677246094, "global_step": 276394, "epoch": 2284} {"train_loss": -40.93426513671875, "global_step": 276395, "epoch": 2284} {"train_loss": -41.4602165222168, "global_step": 276396, "epoch": 2284} {"train_loss": -40.701171875, "global_step": 276397, "epoch": 2284} {"train_loss": -39.58909225463867, "global_step": 276398, "epoch": 2284} {"train_loss": -39.460357666015625, "global_step": 276399, "epoch": 2284} {"train_loss": -40.23529052734375, "global_step": 276400, "epoch": 2284} {"train_loss": -39.55360412597656, "global_step": 276401, "epoch": 2284} {"train_loss": -25.744916915893555, "global_step": 276402, "epoch": 2284} {"train_loss": -37.65714645385742, "global_step": 276403, "epoch": 2284} {"train_loss": -39.04206466674805, "global_step": 276404, "epoch": 2284} {"train_loss": -38.2090950012207, "global_step": 276405, "epoch": 2284} {"train_loss": -38.53041458129883, "global_step": 276406, "epoch": 2284} {"train_loss": -37.02897262573242, "global_step": 276407, "epoch": 2284} {"train_loss": -39.550106048583984, "global_step": 276408, "epoch": 2284} {"train_loss": -37.301513671875, "global_step": 276409, "epoch": 2284} {"train_loss": -40.92133712768555, "global_step": 276410, "epoch": 2284} {"train_loss": -39.2664680480957, "global_step": 276411, "epoch": 2284} {"train_loss": -40.81943893432617, "global_step": 276412, "epoch": 2284} {"train_loss": -40.83112716674805, "global_step": 276413, "epoch": 2284} {"train_loss": -40.31117630004883, "global_step": 276414, "epoch": 2284} {"train_loss": -40.422645568847656, "global_step": 276415, "epoch": 2284} {"train_loss": -39.45634841918945, "global_step": 276416, "epoch": 2284} {"train_loss": -38.75145721435547, "global_step": 276417, "epoch": 2284} {"train_loss": -38.13299560546875, "global_step": 276418, "epoch": 2284} {"train_loss": -40.24410629272461, "global_step": 276419, "epoch": 2284} {"train_loss": -40.78017044067383, "global_step": 276420, "epoch": 2284} {"train_loss": -40.38479232788086, "global_step": 276421, "epoch": 2284} {"train_loss": -39.13529586791992, "global_step": 276422, "epoch": 2284} {"train_loss": -39.05155563354492, "global_step": 276423, "epoch": 2284} {"train_loss": -38.841346740722656, "global_step": 276424, "epoch": 2284} {"train_loss": -40.574951171875, "global_step": 276425, "epoch": 2284} {"train_loss": -40.471595764160156, "global_step": 276426, "epoch": 2284} {"train_loss": -33.52279281616211, "global_step": 276427, "epoch": 2284} {"train_loss": -41.10957717895508, "global_step": 276428, "epoch": 2284} {"train_loss": -35.42061233520508, "global_step": 276429, "epoch": 2284} {"train_loss": -40.380035400390625, "global_step": 276430, "epoch": 2284} {"train_loss": -40.28017044067383, "global_step": 276431, "epoch": 2284} {"train_loss": -39.61643600463867, "global_step": 276432, "epoch": 2284} {"train_loss": -39.27413558959961, "global_step": 276433, "epoch": 2284} {"train_loss": -40.063209533691406, "global_step": 276434, "epoch": 2284} {"train_loss": -41.22645950317383, "global_step": 276435, "epoch": 2284} {"train_loss": -41.14595031738281, "global_step": 276436, "epoch": 2284} {"train_loss": -38.52969741821289, "global_step": 276437, "epoch": 2284} {"train_loss": -40.3624267578125, "global_step": 276438, "epoch": 2284} {"train_loss": -39.53190231323242, "global_step": 276439, "epoch": 2284} {"train_loss": -40.391571044921875, "global_step": 276440, "epoch": 2284} {"train_loss": -38.11137008666992, "global_step": 276441, "epoch": 2284} {"train_loss": -39.825531005859375, "global_step": 276442, "epoch": 2284} {"train_loss": -39.25572967529297, "global_step": 276443, "epoch": 2284} {"train_loss": -39.154842376708984, "global_step": 276444, "epoch": 2284} {"train_loss": -38.08500671386719, "global_step": 276445, "epoch": 2284} {"train_loss": -38.15083694458008, "global_step": 276446, "epoch": 2284} {"train_loss": -40.410579681396484, "global_step": 276447, "epoch": 2284} {"train_loss": -38.15070343017578, "global_step": 276448, "epoch": 2284} {"train_loss": -38.0142707824707, "global_step": 276449, "epoch": 2284} {"train_loss": -40.24093246459961, "global_step": 276450, "epoch": 2284} {"train_loss": -39.567955017089844, "global_step": 276451, "epoch": 2284} {"train_loss": -40.5935173034668, "global_step": 276452, "epoch": 2284} {"train_loss": -41.783416748046875, "global_step": 276453, "epoch": 2284} {"train_loss": -39.50958251953125, "global_step": 276454, "epoch": 2284} {"train_loss": -40.10288619995117, "global_step": 276455, "epoch": 2284} {"train_loss": -39.32598876953125, "global_step": 276456, "epoch": 2284} {"train_loss": -40.451045989990234, "global_step": 276457, "epoch": 2284} {"train_loss": -39.91807174682617, "global_step": 276458, "epoch": 2284} {"train_loss": -40.79911422729492, "global_step": 276459, "epoch": 2284} {"train_loss": -41.291412353515625, "global_step": 276460, "epoch": 2284} {"train_loss": -41.59333419799805, "global_step": 276461, "epoch": 2284} {"train_loss": -41.391578674316406, "global_step": 276462, "epoch": 2284} {"train_loss": -41.368927001953125, "global_step": 276463, "epoch": 2284} {"train_loss": -41.72450256347656, "global_step": 276464, "epoch": 2284} {"train_loss": -40.72593307495117, "global_step": 276465, "epoch": 2284} {"train_loss": -41.5443115234375, "global_step": 276466, "epoch": 2284} {"train_loss": -40.59112548828125, "global_step": 276467, "epoch": 2284} {"train_loss": -41.562255859375, "global_step": 276468, "epoch": 2284} {"train_loss": -41.72768783569336, "global_step": 276469, "epoch": 2284} {"train_loss": -41.48284912109375, "global_step": 276470, "epoch": 2284} {"train_loss": -41.65556335449219, "global_step": 276471, "epoch": 2284} {"train_loss": -41.2511100769043, "global_step": 276472, "epoch": 2284} {"train_loss": -41.76819610595703, "global_step": 276473, "epoch": 2284} {"train_loss": -41.05410385131836, "global_step": 276474, "epoch": 2284} {"train_loss": -41.27415084838867, "global_step": 276475, "epoch": 2284} {"train_loss": -42.02634048461914, "global_step": 276476, "epoch": 2284} {"train_loss": -41.27911376953125, "global_step": 276477, "epoch": 2284} {"train_loss": -41.97368240356445, "global_step": 276478, "epoch": 2284} {"train_loss": -41.76990509033203, "global_step": 276479, "epoch": 2284} {"train_loss": -42.10820388793945, "global_step": 276480, "epoch": 2284} {"train_loss": -41.926429748535156, "global_step": 276481, "epoch": 2284} {"train_loss": -42.483978271484375, "global_step": 276482, "epoch": 2284} {"train_loss": -41.28776931762695, "global_step": 276483, "epoch": 2284} {"train_loss": -40.28913836833859, "global_step": 276484, "epoch": 2284, "val_loss": 2470151.5} {"train_loss": -41.74125289916992, "global_step": 276485, "epoch": 2285} {"train_loss": -41.534034729003906, "global_step": 276486, "epoch": 2285} {"train_loss": -42.42573165893555, "global_step": 276487, "epoch": 2285} {"train_loss": -41.93831253051758, "global_step": 276488, "epoch": 2285} {"train_loss": -42.04868698120117, "global_step": 276489, "epoch": 2285} {"train_loss": -42.18438720703125, "global_step": 276490, "epoch": 2285} {"train_loss": -42.54074478149414, "global_step": 276491, "epoch": 2285} {"train_loss": -42.00798416137695, "global_step": 276492, "epoch": 2285} {"train_loss": -42.482418060302734, "global_step": 276493, "epoch": 2285} {"train_loss": -42.60661697387695, "global_step": 276494, "epoch": 2285} {"train_loss": -42.346893310546875, "global_step": 276495, "epoch": 2285} {"train_loss": -42.90234375, "global_step": 276496, "epoch": 2285} {"train_loss": -42.3299560546875, "global_step": 276497, "epoch": 2285} {"train_loss": -41.80664825439453, "global_step": 276498, "epoch": 2285} {"train_loss": -41.42839431762695, "global_step": 276499, "epoch": 2285} {"train_loss": -42.31234359741211, "global_step": 276500, "epoch": 2285} {"train_loss": -42.540924072265625, "global_step": 276501, "epoch": 2285} {"train_loss": -42.90117263793945, "global_step": 276502, "epoch": 2285} {"train_loss": -42.49871063232422, "global_step": 276503, "epoch": 2285} {"train_loss": -42.77909469604492, "global_step": 276504, "epoch": 2285} {"train_loss": -43.028133392333984, "global_step": 276505, "epoch": 2285} {"train_loss": -42.291664123535156, "global_step": 276506, "epoch": 2285} {"train_loss": -42.65326690673828, "global_step": 276507, "epoch": 2285} {"train_loss": -43.080570220947266, "global_step": 276508, "epoch": 2285} {"train_loss": -42.963844299316406, "global_step": 276509, "epoch": 2285} {"train_loss": -43.1788444519043, "global_step": 276510, "epoch": 2285} {"train_loss": -42.82472610473633, "global_step": 276511, "epoch": 2285} {"train_loss": -42.47428512573242, "global_step": 276512, "epoch": 2285} {"train_loss": -42.66692352294922, "global_step": 276513, "epoch": 2285} {"train_loss": -42.72809982299805, "global_step": 276514, "epoch": 2285} {"train_loss": -41.956417083740234, "global_step": 276515, "epoch": 2285} {"train_loss": -42.93101119995117, "global_step": 276516, "epoch": 2285} {"train_loss": -42.8416862487793, "global_step": 276517, "epoch": 2285} {"train_loss": -42.66849136352539, "global_step": 276518, "epoch": 2285} {"train_loss": -42.602943420410156, "global_step": 276519, "epoch": 2285} {"train_loss": -43.37783432006836, "global_step": 276520, "epoch": 2285} {"train_loss": -43.006187438964844, "global_step": 276521, "epoch": 2285} {"train_loss": -42.27545928955078, "global_step": 276522, "epoch": 2285} {"train_loss": -42.173301696777344, "global_step": 276523, "epoch": 2285} {"train_loss": -42.85056686401367, "global_step": 276524, "epoch": 2285} {"train_loss": -42.02894592285156, "global_step": 276525, "epoch": 2285} {"train_loss": -42.82487869262695, "global_step": 276526, "epoch": 2285} {"train_loss": -42.54632568359375, "global_step": 276527, "epoch": 2285} {"train_loss": -42.40576171875, "global_step": 276528, "epoch": 2285} {"train_loss": -42.519290924072266, "global_step": 276529, "epoch": 2285} {"train_loss": -42.78927993774414, "global_step": 276530, "epoch": 2285} {"train_loss": -42.53836441040039, "global_step": 276531, "epoch": 2285} {"train_loss": -42.2054328918457, "global_step": 276532, "epoch": 2285} {"train_loss": -41.93557357788086, "global_step": 276533, "epoch": 2285} {"train_loss": -42.82186508178711, "global_step": 276534, "epoch": 2285} {"train_loss": -42.901222229003906, "global_step": 276535, "epoch": 2285} {"train_loss": -42.734107971191406, "global_step": 276536, "epoch": 2285} {"train_loss": -41.55450439453125, "global_step": 276537, "epoch": 2285} {"train_loss": -42.794734954833984, "global_step": 276538, "epoch": 2285} {"train_loss": -42.84076690673828, "global_step": 276539, "epoch": 2285} {"train_loss": -42.59044647216797, "global_step": 276540, "epoch": 2285} {"train_loss": -41.9280891418457, "global_step": 276541, "epoch": 2285} {"train_loss": -42.70626449584961, "global_step": 276542, "epoch": 2285} {"train_loss": -43.39505386352539, "global_step": 276543, "epoch": 2285} {"train_loss": -41.58082962036133, "global_step": 276544, "epoch": 2285} {"train_loss": -41.76398468017578, "global_step": 276545, "epoch": 2285} {"train_loss": -41.548484802246094, "global_step": 276546, "epoch": 2285} {"train_loss": -42.99505615234375, "global_step": 276547, "epoch": 2285} {"train_loss": -42.51392364501953, "global_step": 276548, "epoch": 2285} {"train_loss": -41.88447189331055, "global_step": 276549, "epoch": 2285} {"train_loss": -42.542869567871094, "global_step": 276550, "epoch": 2285} {"train_loss": -42.945987701416016, "global_step": 276551, "epoch": 2285} {"train_loss": -43.138240814208984, "global_step": 276552, "epoch": 2285} {"train_loss": -42.05876922607422, "global_step": 276553, "epoch": 2285} {"train_loss": -41.84882354736328, "global_step": 276554, "epoch": 2285} {"train_loss": -42.788238525390625, "global_step": 276555, "epoch": 2285} {"train_loss": -43.510589599609375, "global_step": 276556, "epoch": 2285} {"train_loss": -43.16141128540039, "global_step": 276557, "epoch": 2285} {"train_loss": -43.13426208496094, "global_step": 276558, "epoch": 2285} {"train_loss": -41.37835693359375, "global_step": 276559, "epoch": 2285} {"train_loss": -41.96464920043945, "global_step": 276560, "epoch": 2285} {"train_loss": -42.23350143432617, "global_step": 276561, "epoch": 2285} {"train_loss": -43.511871337890625, "global_step": 276562, "epoch": 2285} {"train_loss": -43.225276947021484, "global_step": 276563, "epoch": 2285} {"train_loss": -43.379676818847656, "global_step": 276564, "epoch": 2285} {"train_loss": -43.18054962158203, "global_step": 276565, "epoch": 2285} {"train_loss": -43.35076904296875, "global_step": 276566, "epoch": 2285} {"train_loss": -42.770687103271484, "global_step": 276567, "epoch": 2285} {"train_loss": -42.82494354248047, "global_step": 276568, "epoch": 2285} {"train_loss": -43.10135269165039, "global_step": 276569, "epoch": 2285} {"train_loss": -43.183387756347656, "global_step": 276570, "epoch": 2285} {"train_loss": -42.632362365722656, "global_step": 276571, "epoch": 2285} {"train_loss": -43.45620346069336, "global_step": 276572, "epoch": 2285} {"train_loss": -42.839046478271484, "global_step": 276573, "epoch": 2285} {"train_loss": -41.70938491821289, "global_step": 276574, "epoch": 2285} {"train_loss": -43.29896926879883, "global_step": 276575, "epoch": 2285} {"train_loss": -42.851341247558594, "global_step": 276576, "epoch": 2285} {"train_loss": -42.97355270385742, "global_step": 276577, "epoch": 2285} {"train_loss": -43.19501876831055, "global_step": 276578, "epoch": 2285} {"train_loss": -41.45372772216797, "global_step": 276579, "epoch": 2285} {"train_loss": -43.346107482910156, "global_step": 276580, "epoch": 2285} {"train_loss": -42.337127685546875, "global_step": 276581, "epoch": 2285} {"train_loss": -42.443397521972656, "global_step": 276582, "epoch": 2285} {"train_loss": -43.109989166259766, "global_step": 276583, "epoch": 2285} {"train_loss": -42.23905944824219, "global_step": 276584, "epoch": 2285} {"train_loss": -41.88636016845703, "global_step": 276585, "epoch": 2285} {"train_loss": -41.39411544799805, "global_step": 276586, "epoch": 2285} {"train_loss": -40.72358322143555, "global_step": 276587, "epoch": 2285} {"train_loss": -40.70437240600586, "global_step": 276588, "epoch": 2285} {"train_loss": -41.05247116088867, "global_step": 276589, "epoch": 2285} {"train_loss": -42.537410736083984, "global_step": 276590, "epoch": 2285} {"train_loss": -42.105140686035156, "global_step": 276591, "epoch": 2285} {"train_loss": -42.654388427734375, "global_step": 276592, "epoch": 2285} {"train_loss": -42.72384262084961, "global_step": 276593, "epoch": 2285} {"train_loss": -42.72365188598633, "global_step": 276594, "epoch": 2285} {"train_loss": -40.14162063598633, "global_step": 276595, "epoch": 2285} {"train_loss": -37.419700622558594, "global_step": 276596, "epoch": 2285} {"train_loss": -34.7984504699707, "global_step": 276597, "epoch": 2285} {"train_loss": -28.792190551757812, "global_step": 276598, "epoch": 2285} {"train_loss": -40.059200286865234, "global_step": 276599, "epoch": 2285} {"train_loss": -39.04978561401367, "global_step": 276600, "epoch": 2285} {"train_loss": -38.480567932128906, "global_step": 276601, "epoch": 2285} {"train_loss": -40.7065544128418, "global_step": 276602, "epoch": 2285} {"train_loss": -37.39597702026367, "global_step": 276603, "epoch": 2285} {"train_loss": -33.12136459350586, "global_step": 276604, "epoch": 2285} {"train_loss": -42.03774504228072, "global_step": 276605, "epoch": 2285, "val_loss": 2573709.0} {"train_loss": -36.509979248046875, "global_step": 276606, "epoch": 2286} {"train_loss": -38.97665023803711, "global_step": 276607, "epoch": 2286} {"train_loss": -38.98329544067383, "global_step": 276608, "epoch": 2286} {"train_loss": -34.60049819946289, "global_step": 276609, "epoch": 2286} {"train_loss": -41.57051086425781, "global_step": 276610, "epoch": 2286} {"train_loss": -37.63454055786133, "global_step": 276611, "epoch": 2286} {"train_loss": -40.97261047363281, "global_step": 276612, "epoch": 2286} {"train_loss": -38.244384765625, "global_step": 276613, "epoch": 2286} {"train_loss": -40.12158966064453, "global_step": 276614, "epoch": 2286} {"train_loss": -39.03725814819336, "global_step": 276615, "epoch": 2286} {"train_loss": -41.084712982177734, "global_step": 276616, "epoch": 2286} {"train_loss": -39.60992431640625, "global_step": 276617, "epoch": 2286} {"train_loss": -41.29484939575195, "global_step": 276618, "epoch": 2286} {"train_loss": -40.624107360839844, "global_step": 276619, "epoch": 2286} {"train_loss": -41.86470413208008, "global_step": 276620, "epoch": 2286} {"train_loss": -40.65001678466797, "global_step": 276621, "epoch": 2286} {"train_loss": -40.813743591308594, "global_step": 276622, "epoch": 2286} {"train_loss": -41.89099884033203, "global_step": 276623, "epoch": 2286} {"train_loss": -41.89093780517578, "global_step": 276624, "epoch": 2286} {"train_loss": -39.493385314941406, "global_step": 276625, "epoch": 2286} {"train_loss": -39.93076705932617, "global_step": 276626, "epoch": 2286} {"train_loss": -41.89344024658203, "global_step": 276627, "epoch": 2286} {"train_loss": -40.9059944152832, "global_step": 276628, "epoch": 2286} {"train_loss": -41.027652740478516, "global_step": 276629, "epoch": 2286} {"train_loss": -39.67195129394531, "global_step": 276630, "epoch": 2286} {"train_loss": -41.311763763427734, "global_step": 276631, "epoch": 2286} {"train_loss": -41.6812858581543, "global_step": 276632, "epoch": 2286} {"train_loss": -41.4702033996582, "global_step": 276633, "epoch": 2286} {"train_loss": -41.52845001220703, "global_step": 276634, "epoch": 2286} {"train_loss": -42.17141342163086, "global_step": 276635, "epoch": 2286} {"train_loss": -41.723392486572266, "global_step": 276636, "epoch": 2286} {"train_loss": -42.35130310058594, "global_step": 276637, "epoch": 2286} {"train_loss": -41.43400955200195, "global_step": 276638, "epoch": 2286} {"train_loss": -42.582427978515625, "global_step": 276639, "epoch": 2286} {"train_loss": -41.35532760620117, "global_step": 276640, "epoch": 2286} {"train_loss": -42.33177185058594, "global_step": 276641, "epoch": 2286} {"train_loss": -41.42881393432617, "global_step": 276642, "epoch": 2286} {"train_loss": -42.10761260986328, "global_step": 276643, "epoch": 2286} {"train_loss": -42.14748001098633, "global_step": 276644, "epoch": 2286} {"train_loss": -41.87685775756836, "global_step": 276645, "epoch": 2286} {"train_loss": -42.1534538269043, "global_step": 276646, "epoch": 2286} {"train_loss": -41.92454147338867, "global_step": 276647, "epoch": 2286} {"train_loss": -42.731201171875, "global_step": 276648, "epoch": 2286} {"train_loss": -42.13883590698242, "global_step": 276649, "epoch": 2286} {"train_loss": -42.38364791870117, "global_step": 276650, "epoch": 2286} {"train_loss": -41.88450241088867, "global_step": 276651, "epoch": 2286} {"train_loss": -42.839447021484375, "global_step": 276652, "epoch": 2286} {"train_loss": -42.497501373291016, "global_step": 276653, "epoch": 2286} {"train_loss": -42.89631271362305, "global_step": 276654, "epoch": 2286} {"train_loss": -42.44879913330078, "global_step": 276655, "epoch": 2286} {"train_loss": -42.47284698486328, "global_step": 276656, "epoch": 2286} {"train_loss": -42.862342834472656, "global_step": 276657, "epoch": 2286} {"train_loss": -42.584144592285156, "global_step": 276658, "epoch": 2286} {"train_loss": -42.858577728271484, "global_step": 276659, "epoch": 2286} {"train_loss": -42.875789642333984, "global_step": 276660, "epoch": 2286} {"train_loss": -42.829410552978516, "global_step": 276661, "epoch": 2286} {"train_loss": -42.90436553955078, "global_step": 276662, "epoch": 2286} {"train_loss": -42.983985900878906, "global_step": 276663, "epoch": 2286} {"train_loss": -43.020442962646484, "global_step": 276664, "epoch": 2286} {"train_loss": -42.59031295776367, "global_step": 276665, "epoch": 2286} {"train_loss": -42.98543167114258, "global_step": 276666, "epoch": 2286} {"train_loss": -43.293479919433594, "global_step": 276667, "epoch": 2286} {"train_loss": -42.786598205566406, "global_step": 276668, "epoch": 2286} {"train_loss": -43.27531051635742, "global_step": 276669, "epoch": 2286} {"train_loss": -42.372432708740234, "global_step": 276670, "epoch": 2286} {"train_loss": -43.06890869140625, "global_step": 276671, "epoch": 2286} {"train_loss": -43.74300765991211, "global_step": 276672, "epoch": 2286} {"train_loss": -42.947486877441406, "global_step": 276673, "epoch": 2286} {"train_loss": -42.78871536254883, "global_step": 276674, "epoch": 2286} {"train_loss": -43.12922286987305, "global_step": 276675, "epoch": 2286} {"train_loss": -43.37996292114258, "global_step": 276676, "epoch": 2286} {"train_loss": -43.123043060302734, "global_step": 276677, "epoch": 2286} {"train_loss": -42.75638961791992, "global_step": 276678, "epoch": 2286} {"train_loss": -42.98952102661133, "global_step": 276679, "epoch": 2286} {"train_loss": -43.51484298706055, "global_step": 276680, "epoch": 2286} {"train_loss": -43.18199920654297, "global_step": 276681, "epoch": 2286} {"train_loss": -42.765254974365234, "global_step": 276682, "epoch": 2286} {"train_loss": -43.23552322387695, "global_step": 276683, "epoch": 2286} {"train_loss": -43.112213134765625, "global_step": 276684, "epoch": 2286} {"train_loss": -42.849639892578125, "global_step": 276685, "epoch": 2286} {"train_loss": -43.224891662597656, "global_step": 276686, "epoch": 2286} {"train_loss": -43.27161407470703, "global_step": 276687, "epoch": 2286} {"train_loss": -43.28491973876953, "global_step": 276688, "epoch": 2286} {"train_loss": -41.209510803222656, "global_step": 276689, "epoch": 2286} {"train_loss": -39.882076263427734, "global_step": 276690, "epoch": 2286} {"train_loss": -40.24068069458008, "global_step": 276691, "epoch": 2286} {"train_loss": -43.068878173828125, "global_step": 276692, "epoch": 2286} {"train_loss": -42.30221176147461, "global_step": 276693, "epoch": 2286} {"train_loss": -39.27348327636719, "global_step": 276694, "epoch": 2286} {"train_loss": -39.144073486328125, "global_step": 276695, "epoch": 2286} {"train_loss": -42.418731689453125, "global_step": 276696, "epoch": 2286} {"train_loss": -40.20075607299805, "global_step": 276697, "epoch": 2286} {"train_loss": -40.061134338378906, "global_step": 276698, "epoch": 2286} {"train_loss": -42.780364990234375, "global_step": 276699, "epoch": 2286} {"train_loss": -41.507938385009766, "global_step": 276700, "epoch": 2286} {"train_loss": -41.73765563964844, "global_step": 276701, "epoch": 2286} {"train_loss": -42.94655990600586, "global_step": 276702, "epoch": 2286} {"train_loss": -41.488616943359375, "global_step": 276703, "epoch": 2286} {"train_loss": -41.70466232299805, "global_step": 276704, "epoch": 2286} {"train_loss": -40.776214599609375, "global_step": 276705, "epoch": 2286} {"train_loss": -40.693634033203125, "global_step": 276706, "epoch": 2286} {"train_loss": -42.106475830078125, "global_step": 276707, "epoch": 2286} {"train_loss": -39.58661651611328, "global_step": 276708, "epoch": 2286} {"train_loss": -41.77687454223633, "global_step": 276709, "epoch": 2286} {"train_loss": -40.82408142089844, "global_step": 276710, "epoch": 2286} {"train_loss": -40.92923355102539, "global_step": 276711, "epoch": 2286} {"train_loss": -42.49808883666992, "global_step": 276712, "epoch": 2286} {"train_loss": -41.434112548828125, "global_step": 276713, "epoch": 2286} {"train_loss": -42.07693099975586, "global_step": 276714, "epoch": 2286} {"train_loss": -41.095489501953125, "global_step": 276715, "epoch": 2286} {"train_loss": -41.332271575927734, "global_step": 276716, "epoch": 2286} {"train_loss": -41.74564743041992, "global_step": 276717, "epoch": 2286} {"train_loss": -42.09138870239258, "global_step": 276718, "epoch": 2286} {"train_loss": -41.99302291870117, "global_step": 276719, "epoch": 2286} {"train_loss": -42.80589294433594, "global_step": 276720, "epoch": 2286} {"train_loss": -41.9098014831543, "global_step": 276721, "epoch": 2286} {"train_loss": -42.131954193115234, "global_step": 276722, "epoch": 2286} {"train_loss": -42.69729232788086, "global_step": 276723, "epoch": 2286} {"train_loss": -42.46207046508789, "global_step": 276724, "epoch": 2286} {"train_loss": -42.71464538574219, "global_step": 276725, "epoch": 2286} {"train_loss": -41.71638482464247, "global_step": 276726, "epoch": 2286, "val_loss": 2514876.25} {"train_loss": -42.420204162597656, "global_step": 276727, "epoch": 2287} {"train_loss": -42.69088363647461, "global_step": 276728, "epoch": 2287} {"train_loss": -43.02900314331055, "global_step": 276729, "epoch": 2287} {"train_loss": -42.00864791870117, "global_step": 276730, "epoch": 2287} {"train_loss": -42.32003402709961, "global_step": 276731, "epoch": 2287} {"train_loss": -42.55255126953125, "global_step": 276732, "epoch": 2287} {"train_loss": -41.80464172363281, "global_step": 276733, "epoch": 2287} {"train_loss": -42.581085205078125, "global_step": 276734, "epoch": 2287} {"train_loss": -41.363155364990234, "global_step": 276735, "epoch": 2287} {"train_loss": -42.5820426940918, "global_step": 276736, "epoch": 2287} {"train_loss": -42.6251106262207, "global_step": 276737, "epoch": 2287} {"train_loss": -41.80754089355469, "global_step": 276738, "epoch": 2287} {"train_loss": -41.985679626464844, "global_step": 276739, "epoch": 2287} {"train_loss": -41.63523483276367, "global_step": 276740, "epoch": 2287} {"train_loss": -42.093936920166016, "global_step": 276741, "epoch": 2287} {"train_loss": -42.73513412475586, "global_step": 276742, "epoch": 2287} {"train_loss": -42.00749588012695, "global_step": 276743, "epoch": 2287} {"train_loss": -42.310455322265625, "global_step": 276744, "epoch": 2287} {"train_loss": -42.29276657104492, "global_step": 276745, "epoch": 2287} {"train_loss": -42.8482780456543, "global_step": 276746, "epoch": 2287} {"train_loss": -41.79161071777344, "global_step": 276747, "epoch": 2287} {"train_loss": -41.01430892944336, "global_step": 276748, "epoch": 2287} {"train_loss": -41.960731506347656, "global_step": 276749, "epoch": 2287} {"train_loss": -43.12197494506836, "global_step": 276750, "epoch": 2287} {"train_loss": -42.119407653808594, "global_step": 276751, "epoch": 2287} {"train_loss": -40.18996810913086, "global_step": 276752, "epoch": 2287} {"train_loss": -42.96163558959961, "global_step": 276753, "epoch": 2287} {"train_loss": -41.2613639831543, "global_step": 276754, "epoch": 2287} {"train_loss": -40.28338623046875, "global_step": 276755, "epoch": 2287} {"train_loss": -39.44118118286133, "global_step": 276756, "epoch": 2287} {"train_loss": -42.647613525390625, "global_step": 276757, "epoch": 2287} {"train_loss": -41.24505615234375, "global_step": 276758, "epoch": 2287} {"train_loss": -36.389678955078125, "global_step": 276759, "epoch": 2287} {"train_loss": -42.6898307800293, "global_step": 276760, "epoch": 2287} {"train_loss": -42.46790313720703, "global_step": 276761, "epoch": 2287} {"train_loss": -40.81886672973633, "global_step": 276762, "epoch": 2287} {"train_loss": -40.8147087097168, "global_step": 276763, "epoch": 2287} {"train_loss": -41.55306625366211, "global_step": 276764, "epoch": 2287} {"train_loss": -41.479373931884766, "global_step": 276765, "epoch": 2287} {"train_loss": -41.27520751953125, "global_step": 276766, "epoch": 2287} {"train_loss": -42.35011291503906, "global_step": 276767, "epoch": 2287} {"train_loss": -41.195030212402344, "global_step": 276768, "epoch": 2287} {"train_loss": -37.69636154174805, "global_step": 276769, "epoch": 2287} {"train_loss": -42.36859130859375, "global_step": 276770, "epoch": 2287} {"train_loss": -40.711631774902344, "global_step": 276771, "epoch": 2287} {"train_loss": -42.49481201171875, "global_step": 276772, "epoch": 2287} {"train_loss": -42.13395309448242, "global_step": 276773, "epoch": 2287} {"train_loss": -42.2537956237793, "global_step": 276774, "epoch": 2287} {"train_loss": -42.79926681518555, "global_step": 276775, "epoch": 2287} {"train_loss": -42.6672248840332, "global_step": 276776, "epoch": 2287} {"train_loss": -43.199527740478516, "global_step": 276777, "epoch": 2287} {"train_loss": -42.6987190246582, "global_step": 276778, "epoch": 2287} {"train_loss": -39.357810974121094, "global_step": 276779, "epoch": 2287} {"train_loss": -40.764808654785156, "global_step": 276780, "epoch": 2287} {"train_loss": -40.34239959716797, "global_step": 276781, "epoch": 2287} {"train_loss": -41.643672943115234, "global_step": 276782, "epoch": 2287} {"train_loss": -41.75761795043945, "global_step": 276783, "epoch": 2287} {"train_loss": -41.67440414428711, "global_step": 276784, "epoch": 2287} {"train_loss": -41.712703704833984, "global_step": 276785, "epoch": 2287} {"train_loss": -42.200843811035156, "global_step": 276786, "epoch": 2287} {"train_loss": -42.208465576171875, "global_step": 276787, "epoch": 2287} {"train_loss": -37.020851135253906, "global_step": 276788, "epoch": 2287} {"train_loss": -42.780025482177734, "global_step": 276789, "epoch": 2287} {"train_loss": -40.559696197509766, "global_step": 276790, "epoch": 2287} {"train_loss": -41.21256637573242, "global_step": 276791, "epoch": 2287} {"train_loss": -42.490962982177734, "global_step": 276792, "epoch": 2287} {"train_loss": -42.86907196044922, "global_step": 276793, "epoch": 2287} {"train_loss": -43.138710021972656, "global_step": 276794, "epoch": 2287} {"train_loss": -42.741390228271484, "global_step": 276795, "epoch": 2287} {"train_loss": -42.346527099609375, "global_step": 276796, "epoch": 2287} {"train_loss": -43.202762603759766, "global_step": 276797, "epoch": 2287} {"train_loss": -42.37797927856445, "global_step": 276798, "epoch": 2287} {"train_loss": -43.06142044067383, "global_step": 276799, "epoch": 2287} {"train_loss": -42.90032958984375, "global_step": 276800, "epoch": 2287} {"train_loss": -42.466583251953125, "global_step": 276801, "epoch": 2287} {"train_loss": -42.93471908569336, "global_step": 276802, "epoch": 2287} {"train_loss": -42.67582321166992, "global_step": 276803, "epoch": 2287} {"train_loss": -43.08730697631836, "global_step": 276804, "epoch": 2287} {"train_loss": -43.0064697265625, "global_step": 276805, "epoch": 2287} {"train_loss": -42.9714469909668, "global_step": 276806, "epoch": 2287} {"train_loss": -43.3784294128418, "global_step": 276807, "epoch": 2287} {"train_loss": -43.037872314453125, "global_step": 276808, "epoch": 2287} {"train_loss": -41.05299758911133, "global_step": 276809, "epoch": 2287} {"train_loss": -42.12839889526367, "global_step": 276810, "epoch": 2287} {"train_loss": -43.38369369506836, "global_step": 276811, "epoch": 2287} {"train_loss": -42.88178634643555, "global_step": 276812, "epoch": 2287} {"train_loss": -43.041927337646484, "global_step": 276813, "epoch": 2287} {"train_loss": -37.18613815307617, "global_step": 276814, "epoch": 2287} {"train_loss": -43.12881851196289, "global_step": 276815, "epoch": 2287} {"train_loss": -42.74396896362305, "global_step": 276816, "epoch": 2287} {"train_loss": -43.10569381713867, "global_step": 276817, "epoch": 2287} {"train_loss": -40.86428451538086, "global_step": 276818, "epoch": 2287} {"train_loss": -43.051475524902344, "global_step": 276819, "epoch": 2287} {"train_loss": -43.56659698486328, "global_step": 276820, "epoch": 2287} {"train_loss": -40.48162078857422, "global_step": 276821, "epoch": 2287} {"train_loss": -42.123939514160156, "global_step": 276822, "epoch": 2287} {"train_loss": -43.595558166503906, "global_step": 276823, "epoch": 2287} {"train_loss": -43.058895111083984, "global_step": 276824, "epoch": 2287} {"train_loss": -43.29756546020508, "global_step": 276825, "epoch": 2287} {"train_loss": -42.07929229736328, "global_step": 276826, "epoch": 2287} {"train_loss": -42.54404830932617, "global_step": 276827, "epoch": 2287} {"train_loss": -43.15202713012695, "global_step": 276828, "epoch": 2287} {"train_loss": -42.78178787231445, "global_step": 276829, "epoch": 2287} {"train_loss": -42.2613639831543, "global_step": 276830, "epoch": 2287} {"train_loss": -42.051143646240234, "global_step": 276831, "epoch": 2287} {"train_loss": -42.85500717163086, "global_step": 276832, "epoch": 2287} {"train_loss": -42.38828659057617, "global_step": 276833, "epoch": 2287} {"train_loss": -43.373023986816406, "global_step": 276834, "epoch": 2287} {"train_loss": -41.35837173461914, "global_step": 276835, "epoch": 2287} {"train_loss": -43.4187126159668, "global_step": 276836, "epoch": 2287} {"train_loss": -43.5539436340332, "global_step": 276837, "epoch": 2287} {"train_loss": -42.60564041137695, "global_step": 276838, "epoch": 2287} {"train_loss": -43.302825927734375, "global_step": 276839, "epoch": 2287} {"train_loss": -42.11453628540039, "global_step": 276840, "epoch": 2287} {"train_loss": -43.6264533996582, "global_step": 276841, "epoch": 2287} {"train_loss": -42.71688461303711, "global_step": 276842, "epoch": 2287} {"train_loss": -43.68796157836914, "global_step": 276843, "epoch": 2287} {"train_loss": -43.032535552978516, "global_step": 276844, "epoch": 2287} {"train_loss": -42.27349853515625, "global_step": 276845, "epoch": 2287} {"train_loss": -43.30013656616211, "global_step": 276846, "epoch": 2287} {"train_loss": -42.10264366717378, "global_step": 276847, "epoch": 2287, "val_loss": 2502850.75} {"train_loss": -42.704612731933594, "global_step": 276848, "epoch": 2288} {"train_loss": -43.339080810546875, "global_step": 276849, "epoch": 2288} {"train_loss": -43.49273681640625, "global_step": 276850, "epoch": 2288} {"train_loss": -43.214900970458984, "global_step": 276851, "epoch": 2288} {"train_loss": -43.07479476928711, "global_step": 276852, "epoch": 2288} {"train_loss": -40.72820281982422, "global_step": 276853, "epoch": 2288} {"train_loss": -42.77140426635742, "global_step": 276854, "epoch": 2288} {"train_loss": -42.47451400756836, "global_step": 276855, "epoch": 2288} {"train_loss": -42.47015380859375, "global_step": 276856, "epoch": 2288} {"train_loss": -39.90333938598633, "global_step": 276857, "epoch": 2288} {"train_loss": -42.25200271606445, "global_step": 276858, "epoch": 2288} {"train_loss": -43.16189193725586, "global_step": 276859, "epoch": 2288} {"train_loss": -43.07844161987305, "global_step": 276860, "epoch": 2288} {"train_loss": -42.46114730834961, "global_step": 276861, "epoch": 2288} {"train_loss": -42.991825103759766, "global_step": 276862, "epoch": 2288} {"train_loss": -43.14048385620117, "global_step": 276863, "epoch": 2288} {"train_loss": -42.598506927490234, "global_step": 276864, "epoch": 2288} {"train_loss": -41.12822341918945, "global_step": 276865, "epoch": 2288} {"train_loss": -42.21158981323242, "global_step": 276866, "epoch": 2288} {"train_loss": -40.49032211303711, "global_step": 276867, "epoch": 2288} {"train_loss": -42.48484420776367, "global_step": 276868, "epoch": 2288} {"train_loss": -43.31550216674805, "global_step": 276869, "epoch": 2288} {"train_loss": -43.032188415527344, "global_step": 276870, "epoch": 2288} {"train_loss": -41.91621017456055, "global_step": 276871, "epoch": 2288} {"train_loss": -41.56705856323242, "global_step": 276872, "epoch": 2288} {"train_loss": -42.912715911865234, "global_step": 276873, "epoch": 2288} {"train_loss": -43.27530288696289, "global_step": 276874, "epoch": 2288} {"train_loss": -42.07855987548828, "global_step": 276875, "epoch": 2288} {"train_loss": -41.70246124267578, "global_step": 276876, "epoch": 2288} {"train_loss": -41.583126068115234, "global_step": 276877, "epoch": 2288} {"train_loss": -42.82851028442383, "global_step": 276878, "epoch": 2288} {"train_loss": -42.05669021606445, "global_step": 276879, "epoch": 2288} {"train_loss": -42.30965042114258, "global_step": 276880, "epoch": 2288} {"train_loss": -40.835079193115234, "global_step": 276881, "epoch": 2288} {"train_loss": -40.4997673034668, "global_step": 276882, "epoch": 2288} {"train_loss": -42.11635208129883, "global_step": 276883, "epoch": 2288} {"train_loss": -41.395938873291016, "global_step": 276884, "epoch": 2288} {"train_loss": -41.16192626953125, "global_step": 276885, "epoch": 2288} {"train_loss": -41.76488494873047, "global_step": 276886, "epoch": 2288} {"train_loss": -41.38479232788086, "global_step": 276887, "epoch": 2288} {"train_loss": -40.908966064453125, "global_step": 276888, "epoch": 2288} {"train_loss": -41.560585021972656, "global_step": 276889, "epoch": 2288} {"train_loss": -42.384639739990234, "global_step": 276890, "epoch": 2288} {"train_loss": -42.49440383911133, "global_step": 276891, "epoch": 2288} {"train_loss": -42.5232048034668, "global_step": 276892, "epoch": 2288} {"train_loss": -41.10421371459961, "global_step": 276893, "epoch": 2288} {"train_loss": -38.00605010986328, "global_step": 276894, "epoch": 2288} {"train_loss": -42.2086296081543, "global_step": 276895, "epoch": 2288} {"train_loss": -41.83650207519531, "global_step": 276896, "epoch": 2288} {"train_loss": -42.8867073059082, "global_step": 276897, "epoch": 2288} {"train_loss": -42.75400924682617, "global_step": 276898, "epoch": 2288} {"train_loss": -39.857582092285156, "global_step": 276899, "epoch": 2288} {"train_loss": -40.23588180541992, "global_step": 276900, "epoch": 2288} {"train_loss": -42.173458099365234, "global_step": 276901, "epoch": 2288} {"train_loss": -40.875450134277344, "global_step": 276902, "epoch": 2288} {"train_loss": -43.053192138671875, "global_step": 276903, "epoch": 2288} {"train_loss": -42.16321563720703, "global_step": 276904, "epoch": 2288} {"train_loss": -39.66547393798828, "global_step": 276905, "epoch": 2288} {"train_loss": -41.60663604736328, "global_step": 276906, "epoch": 2288} {"train_loss": -41.96485137939453, "global_step": 276907, "epoch": 2288} {"train_loss": -41.35312271118164, "global_step": 276908, "epoch": 2288} {"train_loss": -37.560707092285156, "global_step": 276909, "epoch": 2288} {"train_loss": -40.92489242553711, "global_step": 276910, "epoch": 2288} {"train_loss": -39.28693771362305, "global_step": 276911, "epoch": 2288} {"train_loss": -39.830596923828125, "global_step": 276912, "epoch": 2288} {"train_loss": -40.92686462402344, "global_step": 276913, "epoch": 2288} {"train_loss": -40.34707260131836, "global_step": 276914, "epoch": 2288} {"train_loss": -41.93769073486328, "global_step": 276915, "epoch": 2288} {"train_loss": -42.53194808959961, "global_step": 276916, "epoch": 2288} {"train_loss": -42.686492919921875, "global_step": 276917, "epoch": 2288} {"train_loss": -41.687862396240234, "global_step": 276918, "epoch": 2288} {"train_loss": -42.33755874633789, "global_step": 276919, "epoch": 2288} {"train_loss": -40.54425048828125, "global_step": 276920, "epoch": 2288} {"train_loss": -41.0052604675293, "global_step": 276921, "epoch": 2288} {"train_loss": -41.97868728637695, "global_step": 276922, "epoch": 2288} {"train_loss": -39.1171989440918, "global_step": 276923, "epoch": 2288} {"train_loss": -42.461647033691406, "global_step": 276924, "epoch": 2288} {"train_loss": -41.19453811645508, "global_step": 276925, "epoch": 2288} {"train_loss": -42.15835189819336, "global_step": 276926, "epoch": 2288} {"train_loss": -42.588470458984375, "global_step": 276927, "epoch": 2288} {"train_loss": -40.857421875, "global_step": 276928, "epoch": 2288} {"train_loss": -41.300506591796875, "global_step": 276929, "epoch": 2288} {"train_loss": -40.33675765991211, "global_step": 276930, "epoch": 2288} {"train_loss": -40.3886833190918, "global_step": 276931, "epoch": 2288} {"train_loss": -40.875423431396484, "global_step": 276932, "epoch": 2288} {"train_loss": -41.91536331176758, "global_step": 276933, "epoch": 2288} {"train_loss": -40.55958557128906, "global_step": 276934, "epoch": 2288} {"train_loss": -41.71346664428711, "global_step": 276935, "epoch": 2288} {"train_loss": -41.50212097167969, "global_step": 276936, "epoch": 2288} {"train_loss": -42.17170333862305, "global_step": 276937, "epoch": 2288} {"train_loss": -35.544979095458984, "global_step": 276938, "epoch": 2288} {"train_loss": -42.80570602416992, "global_step": 276939, "epoch": 2288} {"train_loss": -41.83875274658203, "global_step": 276940, "epoch": 2288} {"train_loss": -42.00130081176758, "global_step": 276941, "epoch": 2288} {"train_loss": -42.502384185791016, "global_step": 276942, "epoch": 2288} {"train_loss": -40.804203033447266, "global_step": 276943, "epoch": 2288} {"train_loss": -41.984375, "global_step": 276944, "epoch": 2288} {"train_loss": -41.77924728393555, "global_step": 276945, "epoch": 2288} {"train_loss": -42.929691314697266, "global_step": 276946, "epoch": 2288} {"train_loss": -42.19324493408203, "global_step": 276947, "epoch": 2288} {"train_loss": -41.75014877319336, "global_step": 276948, "epoch": 2288} {"train_loss": -41.200469970703125, "global_step": 276949, "epoch": 2288} {"train_loss": -42.81499481201172, "global_step": 276950, "epoch": 2288} {"train_loss": -42.266822814941406, "global_step": 276951, "epoch": 2288} {"train_loss": -43.07137680053711, "global_step": 276952, "epoch": 2288} {"train_loss": -42.575782775878906, "global_step": 276953, "epoch": 2288} {"train_loss": -38.305355072021484, "global_step": 276954, "epoch": 2288} {"train_loss": -39.89775466918945, "global_step": 276955, "epoch": 2288} {"train_loss": -42.659725189208984, "global_step": 276956, "epoch": 2288} {"train_loss": -42.17137908935547, "global_step": 276957, "epoch": 2288} {"train_loss": -39.23451232910156, "global_step": 276958, "epoch": 2288} {"train_loss": -39.9720573425293, "global_step": 276959, "epoch": 2288} {"train_loss": -41.77293395996094, "global_step": 276960, "epoch": 2288} {"train_loss": -41.8724479675293, "global_step": 276961, "epoch": 2288} {"train_loss": -39.47213363647461, "global_step": 276962, "epoch": 2288} {"train_loss": -39.30806350708008, "global_step": 276963, "epoch": 2288} {"train_loss": -42.67792510986328, "global_step": 276964, "epoch": 2288} {"train_loss": -41.09363555908203, "global_step": 276965, "epoch": 2288} {"train_loss": -39.37624740600586, "global_step": 276966, "epoch": 2288} {"train_loss": -42.632450103759766, "global_step": 276967, "epoch": 2288} {"train_loss": -41.549344464767074, "global_step": 276968, "epoch": 2288, "val_loss": 2714428.75} {"train_loss": -37.30985641479492, "global_step": 276969, "epoch": 2289} {"train_loss": -41.57709884643555, "global_step": 276970, "epoch": 2289} {"train_loss": -35.761287689208984, "global_step": 276971, "epoch": 2289} {"train_loss": -40.416568756103516, "global_step": 276972, "epoch": 2289} {"train_loss": -39.27075958251953, "global_step": 276973, "epoch": 2289} {"train_loss": -32.378639221191406, "global_step": 276974, "epoch": 2289} {"train_loss": -38.43799591064453, "global_step": 276975, "epoch": 2289} {"train_loss": -12.054805755615234, "global_step": 276976, "epoch": 2289} {"train_loss": -28.71893310546875, "global_step": 276977, "epoch": 2289} {"train_loss": -30.871809005737305, "global_step": 276978, "epoch": 2289} {"train_loss": -16.920738220214844, "global_step": 276979, "epoch": 2289} {"train_loss": 56.22809982299805, "global_step": 276980, "epoch": 2289} {"train_loss": -30.943017959594727, "global_step": 276981, "epoch": 2289} {"train_loss": -4.174267768859863, "global_step": 276982, "epoch": 2289} {"train_loss": -31.314544677734375, "global_step": 276983, "epoch": 2289} {"train_loss": -30.064197540283203, "global_step": 276984, "epoch": 2289} {"train_loss": -27.692102432250977, "global_step": 276985, "epoch": 2289} {"train_loss": -22.21757698059082, "global_step": 276986, "epoch": 2289} {"train_loss": -12.433798789978027, "global_step": 276987, "epoch": 2289} {"train_loss": -27.821889877319336, "global_step": 276988, "epoch": 2289} {"train_loss": -33.62177276611328, "global_step": 276989, "epoch": 2289} {"train_loss": -31.333967208862305, "global_step": 276990, "epoch": 2289} {"train_loss": -33.780574798583984, "global_step": 276991, "epoch": 2289} {"train_loss": -32.4482421875, "global_step": 276992, "epoch": 2289} {"train_loss": -32.1359977722168, "global_step": 276993, "epoch": 2289} {"train_loss": -34.24055099487305, "global_step": 276994, "epoch": 2289} {"train_loss": -33.62160873413086, "global_step": 276995, "epoch": 2289} {"train_loss": -28.445409774780273, "global_step": 276996, "epoch": 2289} {"train_loss": -35.36659622192383, "global_step": 276997, "epoch": 2289} {"train_loss": -35.53562545776367, "global_step": 276998, "epoch": 2289} {"train_loss": -35.1932373046875, "global_step": 276999, "epoch": 2289} {"train_loss": -35.26085662841797, "global_step": 277000, "epoch": 2289} {"train_loss": -34.96465301513672, "global_step": 277001, "epoch": 2289} {"train_loss": -36.0395622253418, "global_step": 277002, "epoch": 2289} {"train_loss": -36.52412033081055, "global_step": 277003, "epoch": 2289} {"train_loss": -36.225982666015625, "global_step": 277004, "epoch": 2289} {"train_loss": -36.89373016357422, "global_step": 277005, "epoch": 2289} {"train_loss": -37.320404052734375, "global_step": 277006, "epoch": 2289} {"train_loss": -35.686622619628906, "global_step": 277007, "epoch": 2289} {"train_loss": -36.7192268371582, "global_step": 277008, "epoch": 2289} {"train_loss": -36.27056884765625, "global_step": 277009, "epoch": 2289} {"train_loss": -36.792640686035156, "global_step": 277010, "epoch": 2289} {"train_loss": -35.55255889892578, "global_step": 277011, "epoch": 2289} {"train_loss": -36.46333694458008, "global_step": 277012, "epoch": 2289} {"train_loss": -37.336605072021484, "global_step": 277013, "epoch": 2289} {"train_loss": -37.602230072021484, "global_step": 277014, "epoch": 2289} {"train_loss": -37.1867790222168, "global_step": 277015, "epoch": 2289} {"train_loss": -37.26033401489258, "global_step": 277016, "epoch": 2289} {"train_loss": -37.07890701293945, "global_step": 277017, "epoch": 2289} {"train_loss": -37.4010009765625, "global_step": 277018, "epoch": 2289} {"train_loss": -37.764339447021484, "global_step": 277019, "epoch": 2289} {"train_loss": -37.380855560302734, "global_step": 277020, "epoch": 2289} {"train_loss": -38.417415618896484, "global_step": 277021, "epoch": 2289} {"train_loss": -36.931846618652344, "global_step": 277022, "epoch": 2289} {"train_loss": -37.811729431152344, "global_step": 277023, "epoch": 2289} {"train_loss": -36.41230773925781, "global_step": 277024, "epoch": 2289} {"train_loss": -37.21605682373047, "global_step": 277025, "epoch": 2289} {"train_loss": -37.69136428833008, "global_step": 277026, "epoch": 2289} {"train_loss": -37.15010452270508, "global_step": 277027, "epoch": 2289} {"train_loss": -37.7451057434082, "global_step": 277028, "epoch": 2289} {"train_loss": -37.952903747558594, "global_step": 277029, "epoch": 2289} {"train_loss": -37.85898971557617, "global_step": 277030, "epoch": 2289} {"train_loss": -37.91433334350586, "global_step": 277031, "epoch": 2289} {"train_loss": -38.64577865600586, "global_step": 277032, "epoch": 2289} {"train_loss": -38.597713470458984, "global_step": 277033, "epoch": 2289} {"train_loss": -38.37252426147461, "global_step": 277034, "epoch": 2289} {"train_loss": -38.18490982055664, "global_step": 277035, "epoch": 2289} {"train_loss": -37.83202362060547, "global_step": 277036, "epoch": 2289} {"train_loss": -38.5529899597168, "global_step": 277037, "epoch": 2289} {"train_loss": -38.20318603515625, "global_step": 277038, "epoch": 2289} {"train_loss": -38.521846771240234, "global_step": 277039, "epoch": 2289} {"train_loss": -38.05405807495117, "global_step": 277040, "epoch": 2289} {"train_loss": -38.08042526245117, "global_step": 277041, "epoch": 2289} {"train_loss": -38.72614669799805, "global_step": 277042, "epoch": 2289} {"train_loss": -38.85520553588867, "global_step": 277043, "epoch": 2289} {"train_loss": -38.047115325927734, "global_step": 277044, "epoch": 2289} {"train_loss": -38.50992202758789, "global_step": 277045, "epoch": 2289} {"train_loss": -39.158241271972656, "global_step": 277046, "epoch": 2289} {"train_loss": -38.31569290161133, "global_step": 277047, "epoch": 2289} {"train_loss": -39.415000915527344, "global_step": 277048, "epoch": 2289} {"train_loss": -39.48531723022461, "global_step": 277049, "epoch": 2289} {"train_loss": -39.38368606567383, "global_step": 277050, "epoch": 2289} {"train_loss": -39.64248275756836, "global_step": 277051, "epoch": 2289} {"train_loss": -38.637725830078125, "global_step": 277052, "epoch": 2289} {"train_loss": -39.475921630859375, "global_step": 277053, "epoch": 2289} {"train_loss": -38.20769119262695, "global_step": 277054, "epoch": 2289} {"train_loss": -38.81669235229492, "global_step": 277055, "epoch": 2289} {"train_loss": -39.92412567138672, "global_step": 277056, "epoch": 2289} {"train_loss": -40.23354721069336, "global_step": 277057, "epoch": 2289} {"train_loss": -39.25347900390625, "global_step": 277058, "epoch": 2289} {"train_loss": -38.51568603515625, "global_step": 277059, "epoch": 2289} {"train_loss": -39.33985900878906, "global_step": 277060, "epoch": 2289} {"train_loss": -39.13722610473633, "global_step": 277061, "epoch": 2289} {"train_loss": -39.49100875854492, "global_step": 277062, "epoch": 2289} {"train_loss": -39.03562927246094, "global_step": 277063, "epoch": 2289} {"train_loss": -39.50433349609375, "global_step": 277064, "epoch": 2289} {"train_loss": -39.60502624511719, "global_step": 277065, "epoch": 2289} {"train_loss": -39.28960037231445, "global_step": 277066, "epoch": 2289} {"train_loss": -39.16105270385742, "global_step": 277067, "epoch": 2289} {"train_loss": -38.686614990234375, "global_step": 277068, "epoch": 2289} {"train_loss": -38.984283447265625, "global_step": 277069, "epoch": 2289} {"train_loss": -40.05587387084961, "global_step": 277070, "epoch": 2289} {"train_loss": -39.097267150878906, "global_step": 277071, "epoch": 2289} {"train_loss": -39.33086013793945, "global_step": 277072, "epoch": 2289} {"train_loss": -40.260066986083984, "global_step": 277073, "epoch": 2289} {"train_loss": -40.15833282470703, "global_step": 277074, "epoch": 2289} {"train_loss": -40.388153076171875, "global_step": 277075, "epoch": 2289} {"train_loss": -39.29957962036133, "global_step": 277076, "epoch": 2289} {"train_loss": -39.72797775268555, "global_step": 277077, "epoch": 2289} {"train_loss": -40.07650375366211, "global_step": 277078, "epoch": 2289} {"train_loss": -40.45408248901367, "global_step": 277079, "epoch": 2289} {"train_loss": -40.55984115600586, "global_step": 277080, "epoch": 2289} {"train_loss": -40.42818069458008, "global_step": 277081, "epoch": 2289} {"train_loss": -39.62725830078125, "global_step": 277082, "epoch": 2289} {"train_loss": -39.8681526184082, "global_step": 277083, "epoch": 2289} {"train_loss": -40.03778076171875, "global_step": 277084, "epoch": 2289} {"train_loss": -40.775970458984375, "global_step": 277085, "epoch": 2289} {"train_loss": -39.64821243286133, "global_step": 277086, "epoch": 2289} {"train_loss": -40.0613899230957, "global_step": 277087, "epoch": 2289} {"train_loss": -40.89078903198242, "global_step": 277088, "epoch": 2289} {"train_loss": -35.63341706646376, "global_step": 277089, "epoch": 2289, "val_loss": 2485669.5} {"train_loss": -39.62712478637695, "global_step": 277090, "epoch": 2290} {"train_loss": -40.45283126831055, "global_step": 277091, "epoch": 2290} {"train_loss": -40.72266387939453, "global_step": 277092, "epoch": 2290} {"train_loss": -40.58160400390625, "global_step": 277093, "epoch": 2290} {"train_loss": -39.320518493652344, "global_step": 277094, "epoch": 2290} {"train_loss": -40.8863639831543, "global_step": 277095, "epoch": 2290} {"train_loss": -41.1779899597168, "global_step": 277096, "epoch": 2290} {"train_loss": -40.77988815307617, "global_step": 277097, "epoch": 2290} {"train_loss": -40.62744140625, "global_step": 277098, "epoch": 2290} {"train_loss": -40.68703842163086, "global_step": 277099, "epoch": 2290} {"train_loss": -40.282752990722656, "global_step": 277100, "epoch": 2290} {"train_loss": -40.493385314941406, "global_step": 277101, "epoch": 2290} {"train_loss": -40.76203536987305, "global_step": 277102, "epoch": 2290} {"train_loss": -40.757991790771484, "global_step": 277103, "epoch": 2290} {"train_loss": -41.302032470703125, "global_step": 277104, "epoch": 2290} {"train_loss": -41.58596420288086, "global_step": 277105, "epoch": 2290} {"train_loss": -41.16669464111328, "global_step": 277106, "epoch": 2290} {"train_loss": -40.65199279785156, "global_step": 277107, "epoch": 2290} {"train_loss": -41.15639114379883, "global_step": 277108, "epoch": 2290} {"train_loss": -39.74318313598633, "global_step": 277109, "epoch": 2290} {"train_loss": -41.55186080932617, "global_step": 277110, "epoch": 2290} {"train_loss": -41.33036804199219, "global_step": 277111, "epoch": 2290} {"train_loss": -40.5192985534668, "global_step": 277112, "epoch": 2290} {"train_loss": -40.368553161621094, "global_step": 277113, "epoch": 2290} {"train_loss": -40.736812591552734, "global_step": 277114, "epoch": 2290} {"train_loss": -40.97895050048828, "global_step": 277115, "epoch": 2290} {"train_loss": -40.954219818115234, "global_step": 277116, "epoch": 2290} {"train_loss": -41.48402786254883, "global_step": 277117, "epoch": 2290} {"train_loss": -40.420143127441406, "global_step": 277118, "epoch": 2290} {"train_loss": -40.89464569091797, "global_step": 277119, "epoch": 2290} {"train_loss": -40.67658233642578, "global_step": 277120, "epoch": 2290} {"train_loss": -40.63471984863281, "global_step": 277121, "epoch": 2290} {"train_loss": -41.417625427246094, "global_step": 277122, "epoch": 2290} {"train_loss": -41.69816207885742, "global_step": 277123, "epoch": 2290} {"train_loss": -41.36489486694336, "global_step": 277124, "epoch": 2290} {"train_loss": -41.50661849975586, "global_step": 277125, "epoch": 2290} {"train_loss": -41.099998474121094, "global_step": 277126, "epoch": 2290} {"train_loss": -41.323097229003906, "global_step": 277127, "epoch": 2290} {"train_loss": -41.248626708984375, "global_step": 277128, "epoch": 2290} {"train_loss": -40.30898666381836, "global_step": 277129, "epoch": 2290} {"train_loss": -41.1679573059082, "global_step": 277130, "epoch": 2290} {"train_loss": -41.85908126831055, "global_step": 277131, "epoch": 2290} {"train_loss": -41.513118743896484, "global_step": 277132, "epoch": 2290} {"train_loss": -42.10279083251953, "global_step": 277133, "epoch": 2290} {"train_loss": -40.366878509521484, "global_step": 277134, "epoch": 2290} {"train_loss": -40.70449447631836, "global_step": 277135, "epoch": 2290} {"train_loss": -41.223384857177734, "global_step": 277136, "epoch": 2290} {"train_loss": -41.41215133666992, "global_step": 277137, "epoch": 2290} {"train_loss": -40.85653305053711, "global_step": 277138, "epoch": 2290} {"train_loss": -41.153663635253906, "global_step": 277139, "epoch": 2290} {"train_loss": -42.2703971862793, "global_step": 277140, "epoch": 2290} {"train_loss": -41.52048873901367, "global_step": 277141, "epoch": 2290} {"train_loss": -40.602882385253906, "global_step": 277142, "epoch": 2290} {"train_loss": -41.354957580566406, "global_step": 277143, "epoch": 2290} {"train_loss": -42.18462371826172, "global_step": 277144, "epoch": 2290} {"train_loss": -41.68197250366211, "global_step": 277145, "epoch": 2290} {"train_loss": -41.161067962646484, "global_step": 277146, "epoch": 2290} {"train_loss": -41.914058685302734, "global_step": 277147, "epoch": 2290} {"train_loss": -41.446937561035156, "global_step": 277148, "epoch": 2290} {"train_loss": -41.37687301635742, "global_step": 277149, "epoch": 2290} {"train_loss": -42.08721160888672, "global_step": 277150, "epoch": 2290} {"train_loss": -41.68452835083008, "global_step": 277151, "epoch": 2290} {"train_loss": -41.009883880615234, "global_step": 277152, "epoch": 2290} {"train_loss": -41.7978401184082, "global_step": 277153, "epoch": 2290} {"train_loss": -41.3316764831543, "global_step": 277154, "epoch": 2290} {"train_loss": -41.340843200683594, "global_step": 277155, "epoch": 2290} {"train_loss": -42.355770111083984, "global_step": 277156, "epoch": 2290} {"train_loss": -42.09841537475586, "global_step": 277157, "epoch": 2290} {"train_loss": -42.097137451171875, "global_step": 277158, "epoch": 2290} {"train_loss": -41.99721145629883, "global_step": 277159, "epoch": 2290} {"train_loss": -41.66175079345703, "global_step": 277160, "epoch": 2290} {"train_loss": -42.42507553100586, "global_step": 277161, "epoch": 2290} {"train_loss": -41.9210205078125, "global_step": 277162, "epoch": 2290} {"train_loss": -41.58606719970703, "global_step": 277163, "epoch": 2290} {"train_loss": -41.36979293823242, "global_step": 277164, "epoch": 2290} {"train_loss": -41.33075714111328, "global_step": 277165, "epoch": 2290} {"train_loss": -40.72766876220703, "global_step": 277166, "epoch": 2290} {"train_loss": -41.37502670288086, "global_step": 277167, "epoch": 2290} {"train_loss": -41.07070541381836, "global_step": 277168, "epoch": 2290} {"train_loss": -41.06930160522461, "global_step": 277169, "epoch": 2290} {"train_loss": -41.52762985229492, "global_step": 277170, "epoch": 2290} {"train_loss": -41.613037109375, "global_step": 277171, "epoch": 2290} {"train_loss": -41.64966583251953, "global_step": 277172, "epoch": 2290} {"train_loss": -42.06826400756836, "global_step": 277173, "epoch": 2290} {"train_loss": -41.419918060302734, "global_step": 277174, "epoch": 2290} {"train_loss": -41.33700180053711, "global_step": 277175, "epoch": 2290} {"train_loss": -42.084163665771484, "global_step": 277176, "epoch": 2290} {"train_loss": -41.94234848022461, "global_step": 277177, "epoch": 2290} {"train_loss": -41.99675750732422, "global_step": 277178, "epoch": 2290} {"train_loss": -41.568878173828125, "global_step": 277179, "epoch": 2290} {"train_loss": -42.21114730834961, "global_step": 277180, "epoch": 2290} {"train_loss": -41.257057189941406, "global_step": 277181, "epoch": 2290} {"train_loss": -41.46244430541992, "global_step": 277182, "epoch": 2290} {"train_loss": -42.28131103515625, "global_step": 277183, "epoch": 2290} {"train_loss": -40.81103515625, "global_step": 277184, "epoch": 2290} {"train_loss": -41.78509521484375, "global_step": 277185, "epoch": 2290} {"train_loss": -41.08687973022461, "global_step": 277186, "epoch": 2290} {"train_loss": -41.949745178222656, "global_step": 277187, "epoch": 2290} {"train_loss": -41.128395080566406, "global_step": 277188, "epoch": 2290} {"train_loss": -41.29616165161133, "global_step": 277189, "epoch": 2290} {"train_loss": -41.726837158203125, "global_step": 277190, "epoch": 2290} {"train_loss": -41.98005294799805, "global_step": 277191, "epoch": 2290} {"train_loss": -40.552669525146484, "global_step": 277192, "epoch": 2290} {"train_loss": -41.62480545043945, "global_step": 277193, "epoch": 2290} {"train_loss": -41.481258392333984, "global_step": 277194, "epoch": 2290} {"train_loss": -41.69392395019531, "global_step": 277195, "epoch": 2290} {"train_loss": -40.778114318847656, "global_step": 277196, "epoch": 2290} {"train_loss": -40.96242141723633, "global_step": 277197, "epoch": 2290} {"train_loss": -41.6683349609375, "global_step": 277198, "epoch": 2290} {"train_loss": -40.78868865966797, "global_step": 277199, "epoch": 2290} {"train_loss": -41.60619354248047, "global_step": 277200, "epoch": 2290} {"train_loss": -41.499656677246094, "global_step": 277201, "epoch": 2290} {"train_loss": -41.09162521362305, "global_step": 277202, "epoch": 2290} {"train_loss": -39.31315994262695, "global_step": 277203, "epoch": 2290} {"train_loss": -41.65756607055664, "global_step": 277204, "epoch": 2290} {"train_loss": -40.47308349609375, "global_step": 277205, "epoch": 2290} {"train_loss": -39.834808349609375, "global_step": 277206, "epoch": 2290} {"train_loss": -40.83155059814453, "global_step": 277207, "epoch": 2290} {"train_loss": -41.36619567871094, "global_step": 277208, "epoch": 2290} {"train_loss": -39.96409225463867, "global_step": 277209, "epoch": 2290} {"train_loss": -41.22352625318795, "global_step": 277210, "epoch": 2290, "val_loss": 2510791.0} {"train_loss": -41.52798080444336, "global_step": 277211, "epoch": 2291} {"train_loss": -40.020320892333984, "global_step": 277212, "epoch": 2291} {"train_loss": -41.51551055908203, "global_step": 277213, "epoch": 2291} {"train_loss": -41.2664680480957, "global_step": 277214, "epoch": 2291} {"train_loss": -41.92328643798828, "global_step": 277215, "epoch": 2291} {"train_loss": -41.81879806518555, "global_step": 277216, "epoch": 2291} {"train_loss": -41.715938568115234, "global_step": 277217, "epoch": 2291} {"train_loss": -41.172645568847656, "global_step": 277218, "epoch": 2291} {"train_loss": -41.98625564575195, "global_step": 277219, "epoch": 2291} {"train_loss": -40.59775924682617, "global_step": 277220, "epoch": 2291} {"train_loss": -42.25565719604492, "global_step": 277221, "epoch": 2291} {"train_loss": -41.79570388793945, "global_step": 277222, "epoch": 2291} {"train_loss": -40.49061965942383, "global_step": 277223, "epoch": 2291} {"train_loss": -41.5750846862793, "global_step": 277224, "epoch": 2291} {"train_loss": -41.88918685913086, "global_step": 277225, "epoch": 2291} {"train_loss": -39.996822357177734, "global_step": 277226, "epoch": 2291} {"train_loss": -41.5275764465332, "global_step": 277227, "epoch": 2291} {"train_loss": -41.32627868652344, "global_step": 277228, "epoch": 2291} {"train_loss": -40.795623779296875, "global_step": 277229, "epoch": 2291} {"train_loss": -41.06697082519531, "global_step": 277230, "epoch": 2291} {"train_loss": -41.098976135253906, "global_step": 277231, "epoch": 2291} {"train_loss": -40.940914154052734, "global_step": 277232, "epoch": 2291} {"train_loss": -41.84637451171875, "global_step": 277233, "epoch": 2291} {"train_loss": -40.1661491394043, "global_step": 277234, "epoch": 2291} {"train_loss": -39.57046127319336, "global_step": 277235, "epoch": 2291} {"train_loss": -42.566341400146484, "global_step": 277236, "epoch": 2291} {"train_loss": -39.095157623291016, "global_step": 277237, "epoch": 2291} {"train_loss": -38.40625, "global_step": 277238, "epoch": 2291} {"train_loss": -41.378082275390625, "global_step": 277239, "epoch": 2291} {"train_loss": -40.08701705932617, "global_step": 277240, "epoch": 2291} {"train_loss": -40.905731201171875, "global_step": 277241, "epoch": 2291} {"train_loss": -41.420528411865234, "global_step": 277242, "epoch": 2291} {"train_loss": -39.879940032958984, "global_step": 277243, "epoch": 2291} {"train_loss": -40.74878692626953, "global_step": 277244, "epoch": 2291} {"train_loss": -39.916988372802734, "global_step": 277245, "epoch": 2291} {"train_loss": -40.719444274902344, "global_step": 277246, "epoch": 2291} {"train_loss": -41.0496826171875, "global_step": 277247, "epoch": 2291} {"train_loss": -39.63826370239258, "global_step": 277248, "epoch": 2291} {"train_loss": -42.09023666381836, "global_step": 277249, "epoch": 2291} {"train_loss": -40.33818817138672, "global_step": 277250, "epoch": 2291} {"train_loss": -40.62320327758789, "global_step": 277251, "epoch": 2291} {"train_loss": -40.65555953979492, "global_step": 277252, "epoch": 2291} {"train_loss": -40.460697174072266, "global_step": 277253, "epoch": 2291} {"train_loss": -42.35707473754883, "global_step": 277254, "epoch": 2291} {"train_loss": -40.02067184448242, "global_step": 277255, "epoch": 2291} {"train_loss": -41.291648864746094, "global_step": 277256, "epoch": 2291} {"train_loss": -41.420753479003906, "global_step": 277257, "epoch": 2291} {"train_loss": -41.98065948486328, "global_step": 277258, "epoch": 2291} {"train_loss": -42.017635345458984, "global_step": 277259, "epoch": 2291} {"train_loss": -41.745304107666016, "global_step": 277260, "epoch": 2291} {"train_loss": -41.42500305175781, "global_step": 277261, "epoch": 2291} {"train_loss": -41.309478759765625, "global_step": 277262, "epoch": 2291} {"train_loss": -42.097320556640625, "global_step": 277263, "epoch": 2291} {"train_loss": -41.221614837646484, "global_step": 277264, "epoch": 2291} {"train_loss": -42.092796325683594, "global_step": 277265, "epoch": 2291} {"train_loss": -41.03534698486328, "global_step": 277266, "epoch": 2291} {"train_loss": -41.92488479614258, "global_step": 277267, "epoch": 2291} {"train_loss": -42.08554458618164, "global_step": 277268, "epoch": 2291} {"train_loss": -42.29182052612305, "global_step": 277269, "epoch": 2291} {"train_loss": -41.974361419677734, "global_step": 277270, "epoch": 2291} {"train_loss": -42.22068405151367, "global_step": 277271, "epoch": 2291} {"train_loss": -42.48752975463867, "global_step": 277272, "epoch": 2291} {"train_loss": -42.147064208984375, "global_step": 277273, "epoch": 2291} {"train_loss": -42.292724609375, "global_step": 277274, "epoch": 2291} {"train_loss": -41.778411865234375, "global_step": 277275, "epoch": 2291} {"train_loss": -42.35984802246094, "global_step": 277276, "epoch": 2291} {"train_loss": -41.41143798828125, "global_step": 277277, "epoch": 2291} {"train_loss": -42.00818634033203, "global_step": 277278, "epoch": 2291} {"train_loss": -42.0621452331543, "global_step": 277279, "epoch": 2291} {"train_loss": -41.96407699584961, "global_step": 277280, "epoch": 2291} {"train_loss": -40.97722244262695, "global_step": 277281, "epoch": 2291} {"train_loss": -40.790069580078125, "global_step": 277282, "epoch": 2291} {"train_loss": -40.58307647705078, "global_step": 277283, "epoch": 2291} {"train_loss": -39.927223205566406, "global_step": 277284, "epoch": 2291} {"train_loss": -41.10898971557617, "global_step": 277285, "epoch": 2291} {"train_loss": -40.714481353759766, "global_step": 277286, "epoch": 2291} {"train_loss": -41.43311309814453, "global_step": 277287, "epoch": 2291} {"train_loss": -39.61931228637695, "global_step": 277288, "epoch": 2291} {"train_loss": -40.51327133178711, "global_step": 277289, "epoch": 2291} {"train_loss": -41.35028076171875, "global_step": 277290, "epoch": 2291} {"train_loss": -40.26496505737305, "global_step": 277291, "epoch": 2291} {"train_loss": -39.39455795288086, "global_step": 277292, "epoch": 2291} {"train_loss": -39.7570686340332, "global_step": 277293, "epoch": 2291} {"train_loss": -41.3414306640625, "global_step": 277294, "epoch": 2291} {"train_loss": -40.38420486450195, "global_step": 277295, "epoch": 2291} {"train_loss": -41.06425094604492, "global_step": 277296, "epoch": 2291} {"train_loss": -41.24198913574219, "global_step": 277297, "epoch": 2291} {"train_loss": -40.77878189086914, "global_step": 277298, "epoch": 2291} {"train_loss": -41.27244186401367, "global_step": 277299, "epoch": 2291} {"train_loss": -40.50001525878906, "global_step": 277300, "epoch": 2291} {"train_loss": -42.11980056762695, "global_step": 277301, "epoch": 2291} {"train_loss": -41.99595260620117, "global_step": 277302, "epoch": 2291} {"train_loss": -41.107872009277344, "global_step": 277303, "epoch": 2291} {"train_loss": -41.69491958618164, "global_step": 277304, "epoch": 2291} {"train_loss": -40.95632553100586, "global_step": 277305, "epoch": 2291} {"train_loss": -42.29568862915039, "global_step": 277306, "epoch": 2291} {"train_loss": -41.60639190673828, "global_step": 277307, "epoch": 2291} {"train_loss": -40.857791900634766, "global_step": 277308, "epoch": 2291} {"train_loss": -40.21685028076172, "global_step": 277309, "epoch": 2291} {"train_loss": -40.04267120361328, "global_step": 277310, "epoch": 2291} {"train_loss": -40.95216751098633, "global_step": 277311, "epoch": 2291} {"train_loss": -39.97488784790039, "global_step": 277312, "epoch": 2291} {"train_loss": -41.78461456298828, "global_step": 277313, "epoch": 2291} {"train_loss": -38.42123794555664, "global_step": 277314, "epoch": 2291} {"train_loss": -41.215213775634766, "global_step": 277315, "epoch": 2291} {"train_loss": -40.09476089477539, "global_step": 277316, "epoch": 2291} {"train_loss": -41.24971389770508, "global_step": 277317, "epoch": 2291} {"train_loss": -41.043514251708984, "global_step": 277318, "epoch": 2291} {"train_loss": -41.391822814941406, "global_step": 277319, "epoch": 2291} {"train_loss": -41.3493766784668, "global_step": 277320, "epoch": 2291} {"train_loss": -42.03953552246094, "global_step": 277321, "epoch": 2291} {"train_loss": -40.8848991394043, "global_step": 277322, "epoch": 2291} {"train_loss": -41.89802551269531, "global_step": 277323, "epoch": 2291} {"train_loss": -42.23106002807617, "global_step": 277324, "epoch": 2291} {"train_loss": -41.854000091552734, "global_step": 277325, "epoch": 2291} {"train_loss": -41.40903091430664, "global_step": 277326, "epoch": 2291} {"train_loss": -42.54534149169922, "global_step": 277327, "epoch": 2291} {"train_loss": -41.48611068725586, "global_step": 277328, "epoch": 2291} {"train_loss": -41.87338638305664, "global_step": 277329, "epoch": 2291} {"train_loss": -41.43120574951172, "global_step": 277330, "epoch": 2291} {"train_loss": -41.16524370051613, "global_step": 277331, "epoch": 2291, "val_loss": 2487274.75} {"train_loss": -41.07855224609375, "global_step": 277332, "epoch": 2292} {"train_loss": -41.54120635986328, "global_step": 277333, "epoch": 2292} {"train_loss": -41.92325973510742, "global_step": 277334, "epoch": 2292} {"train_loss": -42.418277740478516, "global_step": 277335, "epoch": 2292} {"train_loss": -42.272621154785156, "global_step": 277336, "epoch": 2292} {"train_loss": -42.10227584838867, "global_step": 277337, "epoch": 2292} {"train_loss": -42.64082717895508, "global_step": 277338, "epoch": 2292} {"train_loss": -42.272579193115234, "global_step": 277339, "epoch": 2292} {"train_loss": -42.52849197387695, "global_step": 277340, "epoch": 2292} {"train_loss": -42.18153762817383, "global_step": 277341, "epoch": 2292} {"train_loss": -42.20431900024414, "global_step": 277342, "epoch": 2292} {"train_loss": -42.30704879760742, "global_step": 277343, "epoch": 2292} {"train_loss": -42.6839599609375, "global_step": 277344, "epoch": 2292} {"train_loss": -42.248531341552734, "global_step": 277345, "epoch": 2292} {"train_loss": -42.534481048583984, "global_step": 277346, "epoch": 2292} {"train_loss": -42.0830192565918, "global_step": 277347, "epoch": 2292} {"train_loss": -42.74043655395508, "global_step": 277348, "epoch": 2292} {"train_loss": -42.65951156616211, "global_step": 277349, "epoch": 2292} {"train_loss": -41.88090133666992, "global_step": 277350, "epoch": 2292} {"train_loss": -41.31293869018555, "global_step": 277351, "epoch": 2292} {"train_loss": -41.17972946166992, "global_step": 277352, "epoch": 2292} {"train_loss": -42.57081604003906, "global_step": 277353, "epoch": 2292} {"train_loss": -42.865352630615234, "global_step": 277354, "epoch": 2292} {"train_loss": -42.34498977661133, "global_step": 277355, "epoch": 2292} {"train_loss": -42.45357894897461, "global_step": 277356, "epoch": 2292} {"train_loss": -42.727779388427734, "global_step": 277357, "epoch": 2292} {"train_loss": -41.91743087768555, "global_step": 277358, "epoch": 2292} {"train_loss": -41.73820877075195, "global_step": 277359, "epoch": 2292} {"train_loss": -41.5267448425293, "global_step": 277360, "epoch": 2292} {"train_loss": -42.3724250793457, "global_step": 277361, "epoch": 2292} {"train_loss": -42.939491271972656, "global_step": 277362, "epoch": 2292} {"train_loss": -42.6594352722168, "global_step": 277363, "epoch": 2292} {"train_loss": -42.789974212646484, "global_step": 277364, "epoch": 2292} {"train_loss": -42.74881362915039, "global_step": 277365, "epoch": 2292} {"train_loss": -42.95957565307617, "global_step": 277366, "epoch": 2292} {"train_loss": -42.56391525268555, "global_step": 277367, "epoch": 2292} {"train_loss": -42.620750427246094, "global_step": 277368, "epoch": 2292} {"train_loss": -43.48545455932617, "global_step": 277369, "epoch": 2292} {"train_loss": -42.96624755859375, "global_step": 277370, "epoch": 2292} {"train_loss": -43.28687286376953, "global_step": 277371, "epoch": 2292} {"train_loss": -42.68137741088867, "global_step": 277372, "epoch": 2292} {"train_loss": -42.90742111206055, "global_step": 277373, "epoch": 2292} {"train_loss": -43.17501449584961, "global_step": 277374, "epoch": 2292} {"train_loss": -42.828956604003906, "global_step": 277375, "epoch": 2292} {"train_loss": -42.997066497802734, "global_step": 277376, "epoch": 2292} {"train_loss": -42.93788528442383, "global_step": 277377, "epoch": 2292} {"train_loss": -43.03901290893555, "global_step": 277378, "epoch": 2292} {"train_loss": -43.20713424682617, "global_step": 277379, "epoch": 2292} {"train_loss": -42.35785675048828, "global_step": 277380, "epoch": 2292} {"train_loss": -43.013607025146484, "global_step": 277381, "epoch": 2292} {"train_loss": -43.21221160888672, "global_step": 277382, "epoch": 2292} {"train_loss": -42.78011703491211, "global_step": 277383, "epoch": 2292} {"train_loss": -43.30100631713867, "global_step": 277384, "epoch": 2292} {"train_loss": -43.1408576965332, "global_step": 277385, "epoch": 2292} {"train_loss": -43.39285659790039, "global_step": 277386, "epoch": 2292} {"train_loss": -42.40434265136719, "global_step": 277387, "epoch": 2292} {"train_loss": -42.57619857788086, "global_step": 277388, "epoch": 2292} {"train_loss": -41.840484619140625, "global_step": 277389, "epoch": 2292} {"train_loss": -42.45743179321289, "global_step": 277390, "epoch": 2292} {"train_loss": -42.504981994628906, "global_step": 277391, "epoch": 2292} {"train_loss": -42.14005661010742, "global_step": 277392, "epoch": 2292} {"train_loss": -42.07448959350586, "global_step": 277393, "epoch": 2292} {"train_loss": -42.718666076660156, "global_step": 277394, "epoch": 2292} {"train_loss": -41.47819900512695, "global_step": 277395, "epoch": 2292} {"train_loss": -42.613014221191406, "global_step": 277396, "epoch": 2292} {"train_loss": -42.1810188293457, "global_step": 277397, "epoch": 2292} {"train_loss": -42.703617095947266, "global_step": 277398, "epoch": 2292} {"train_loss": -41.87114334106445, "global_step": 277399, "epoch": 2292} {"train_loss": -42.4676628112793, "global_step": 277400, "epoch": 2292} {"train_loss": -41.65755844116211, "global_step": 277401, "epoch": 2292} {"train_loss": -41.59650802612305, "global_step": 277402, "epoch": 2292} {"train_loss": -42.4248161315918, "global_step": 277403, "epoch": 2292} {"train_loss": -41.619049072265625, "global_step": 277404, "epoch": 2292} {"train_loss": -42.024017333984375, "global_step": 277405, "epoch": 2292} {"train_loss": -42.10801315307617, "global_step": 277406, "epoch": 2292} {"train_loss": -42.94701385498047, "global_step": 277407, "epoch": 2292} {"train_loss": -42.0787467956543, "global_step": 277408, "epoch": 2292} {"train_loss": -42.52077102661133, "global_step": 277409, "epoch": 2292} {"train_loss": -42.20499801635742, "global_step": 277410, "epoch": 2292} {"train_loss": -42.51023864746094, "global_step": 277411, "epoch": 2292} {"train_loss": -41.61100387573242, "global_step": 277412, "epoch": 2292} {"train_loss": -41.43940734863281, "global_step": 277413, "epoch": 2292} {"train_loss": -42.01717758178711, "global_step": 277414, "epoch": 2292} {"train_loss": -42.41779327392578, "global_step": 277415, "epoch": 2292} {"train_loss": -41.44178771972656, "global_step": 277416, "epoch": 2292} {"train_loss": -42.21436309814453, "global_step": 277417, "epoch": 2292} {"train_loss": -41.353271484375, "global_step": 277418, "epoch": 2292} {"train_loss": -42.07100296020508, "global_step": 277419, "epoch": 2292} {"train_loss": -41.09082794189453, "global_step": 277420, "epoch": 2292} {"train_loss": -42.544368743896484, "global_step": 277421, "epoch": 2292} {"train_loss": -42.15085983276367, "global_step": 277422, "epoch": 2292} {"train_loss": -42.34480285644531, "global_step": 277423, "epoch": 2292} {"train_loss": -41.59200668334961, "global_step": 277424, "epoch": 2292} {"train_loss": -42.65362548828125, "global_step": 277425, "epoch": 2292} {"train_loss": -42.10381317138672, "global_step": 277426, "epoch": 2292} {"train_loss": -42.46027755737305, "global_step": 277427, "epoch": 2292} {"train_loss": -41.82047653198242, "global_step": 277428, "epoch": 2292} {"train_loss": -42.484222412109375, "global_step": 277429, "epoch": 2292} {"train_loss": -42.000572204589844, "global_step": 277430, "epoch": 2292} {"train_loss": -42.14396286010742, "global_step": 277431, "epoch": 2292} {"train_loss": -41.61701583862305, "global_step": 277432, "epoch": 2292} {"train_loss": -41.74675369262695, "global_step": 277433, "epoch": 2292} {"train_loss": -41.65346145629883, "global_step": 277434, "epoch": 2292} {"train_loss": -42.3979377746582, "global_step": 277435, "epoch": 2292} {"train_loss": -41.80777359008789, "global_step": 277436, "epoch": 2292} {"train_loss": -41.985626220703125, "global_step": 277437, "epoch": 2292} {"train_loss": -41.31815719604492, "global_step": 277438, "epoch": 2292} {"train_loss": -42.75864791870117, "global_step": 277439, "epoch": 2292} {"train_loss": -42.500213623046875, "global_step": 277440, "epoch": 2292} {"train_loss": -41.408103942871094, "global_step": 277441, "epoch": 2292} {"train_loss": -38.977745056152344, "global_step": 277442, "epoch": 2292} {"train_loss": -38.088600158691406, "global_step": 277443, "epoch": 2292} {"train_loss": -40.61958312988281, "global_step": 277444, "epoch": 2292} {"train_loss": -41.824886322021484, "global_step": 277445, "epoch": 2292} {"train_loss": -42.098487854003906, "global_step": 277446, "epoch": 2292} {"train_loss": -40.62590026855469, "global_step": 277447, "epoch": 2292} {"train_loss": -40.38253402709961, "global_step": 277448, "epoch": 2292} {"train_loss": -42.35238265991211, "global_step": 277449, "epoch": 2292} {"train_loss": -42.19648361206055, "global_step": 277450, "epoch": 2292} {"train_loss": -41.274085998535156, "global_step": 277451, "epoch": 2292} {"train_loss": -42.19059788097035, "global_step": 277452, "epoch": 2292, "val_loss": 2528781.75} {"train_loss": -41.098175048828125, "global_step": 277453, "epoch": 2293} {"train_loss": -40.70408248901367, "global_step": 277454, "epoch": 2293} {"train_loss": -41.95976638793945, "global_step": 277455, "epoch": 2293} {"train_loss": -41.93124008178711, "global_step": 277456, "epoch": 2293} {"train_loss": -41.98878860473633, "global_step": 277457, "epoch": 2293} {"train_loss": -39.822383880615234, "global_step": 277458, "epoch": 2293} {"train_loss": -41.906410217285156, "global_step": 277459, "epoch": 2293} {"train_loss": -40.529579162597656, "global_step": 277460, "epoch": 2293} {"train_loss": -41.29417419433594, "global_step": 277461, "epoch": 2293} {"train_loss": -42.40168380737305, "global_step": 277462, "epoch": 2293} {"train_loss": -40.93988800048828, "global_step": 277463, "epoch": 2293} {"train_loss": -41.52919387817383, "global_step": 277464, "epoch": 2293} {"train_loss": -42.02543640136719, "global_step": 277465, "epoch": 2293} {"train_loss": -40.54757308959961, "global_step": 277466, "epoch": 2293} {"train_loss": -41.66799545288086, "global_step": 277467, "epoch": 2293} {"train_loss": -41.73220443725586, "global_step": 277468, "epoch": 2293} {"train_loss": -41.61735153198242, "global_step": 277469, "epoch": 2293} {"train_loss": -42.21887969970703, "global_step": 277470, "epoch": 2293} {"train_loss": -42.75592041015625, "global_step": 277471, "epoch": 2293} {"train_loss": -42.33976745605469, "global_step": 277472, "epoch": 2293} {"train_loss": -41.8393440246582, "global_step": 277473, "epoch": 2293} {"train_loss": -42.83808898925781, "global_step": 277474, "epoch": 2293} {"train_loss": -42.167362213134766, "global_step": 277475, "epoch": 2293} {"train_loss": -41.5607795715332, "global_step": 277476, "epoch": 2293} {"train_loss": -42.434017181396484, "global_step": 277477, "epoch": 2293} {"train_loss": -42.74490737915039, "global_step": 277478, "epoch": 2293} {"train_loss": -41.519222259521484, "global_step": 277479, "epoch": 2293} {"train_loss": -42.588680267333984, "global_step": 277480, "epoch": 2293} {"train_loss": -42.7595100402832, "global_step": 277481, "epoch": 2293} {"train_loss": -42.58201217651367, "global_step": 277482, "epoch": 2293} {"train_loss": -43.16408920288086, "global_step": 277483, "epoch": 2293} {"train_loss": -41.674808502197266, "global_step": 277484, "epoch": 2293} {"train_loss": -42.93047332763672, "global_step": 277485, "epoch": 2293} {"train_loss": -42.98994827270508, "global_step": 277486, "epoch": 2293} {"train_loss": -42.66950988769531, "global_step": 277487, "epoch": 2293} {"train_loss": -42.735321044921875, "global_step": 277488, "epoch": 2293} {"train_loss": -42.72412109375, "global_step": 277489, "epoch": 2293} {"train_loss": -43.190670013427734, "global_step": 277490, "epoch": 2293} {"train_loss": -42.89612579345703, "global_step": 277491, "epoch": 2293} {"train_loss": -42.777313232421875, "global_step": 277492, "epoch": 2293} {"train_loss": -42.5020637512207, "global_step": 277493, "epoch": 2293} {"train_loss": -43.40679168701172, "global_step": 277494, "epoch": 2293} {"train_loss": -42.362545013427734, "global_step": 277495, "epoch": 2293} {"train_loss": -43.11684799194336, "global_step": 277496, "epoch": 2293} {"train_loss": -42.953670501708984, "global_step": 277497, "epoch": 2293} {"train_loss": -42.54652786254883, "global_step": 277498, "epoch": 2293} {"train_loss": -42.94889450073242, "global_step": 277499, "epoch": 2293} {"train_loss": -42.97053146362305, "global_step": 277500, "epoch": 2293} {"train_loss": -43.14950180053711, "global_step": 277501, "epoch": 2293} {"train_loss": -42.30692672729492, "global_step": 277502, "epoch": 2293} {"train_loss": -43.129703521728516, "global_step": 277503, "epoch": 2293} {"train_loss": -42.68643569946289, "global_step": 277504, "epoch": 2293} {"train_loss": -42.79962158203125, "global_step": 277505, "epoch": 2293} {"train_loss": -42.350425720214844, "global_step": 277506, "epoch": 2293} {"train_loss": -42.535282135009766, "global_step": 277507, "epoch": 2293} {"train_loss": -42.12556838989258, "global_step": 277508, "epoch": 2293} {"train_loss": -43.40676498413086, "global_step": 277509, "epoch": 2293} {"train_loss": -42.76772689819336, "global_step": 277510, "epoch": 2293} {"train_loss": -42.30065155029297, "global_step": 277511, "epoch": 2293} {"train_loss": -42.89611053466797, "global_step": 277512, "epoch": 2293} {"train_loss": -42.88033676147461, "global_step": 277513, "epoch": 2293} {"train_loss": -42.87355422973633, "global_step": 277514, "epoch": 2293} {"train_loss": -43.134033203125, "global_step": 277515, "epoch": 2293} {"train_loss": -40.8188362121582, "global_step": 277516, "epoch": 2293} {"train_loss": -41.114173889160156, "global_step": 277517, "epoch": 2293} {"train_loss": -42.95095443725586, "global_step": 277518, "epoch": 2293} {"train_loss": -42.4819221496582, "global_step": 277519, "epoch": 2293} {"train_loss": -39.11392593383789, "global_step": 277520, "epoch": 2293} {"train_loss": -39.82513427734375, "global_step": 277521, "epoch": 2293} {"train_loss": -41.730770111083984, "global_step": 277522, "epoch": 2293} {"train_loss": -42.7081413269043, "global_step": 277523, "epoch": 2293} {"train_loss": -40.258113861083984, "global_step": 277524, "epoch": 2293} {"train_loss": -31.721302032470703, "global_step": 277525, "epoch": 2293} {"train_loss": -41.18647384643555, "global_step": 277526, "epoch": 2293} {"train_loss": -36.08296585083008, "global_step": 277527, "epoch": 2293} {"train_loss": -41.43709182739258, "global_step": 277528, "epoch": 2293} {"train_loss": -39.260318756103516, "global_step": 277529, "epoch": 2293} {"train_loss": -38.59185791015625, "global_step": 277530, "epoch": 2293} {"train_loss": -40.18023681640625, "global_step": 277531, "epoch": 2293} {"train_loss": -40.93796157836914, "global_step": 277532, "epoch": 2293} {"train_loss": -39.550960540771484, "global_step": 277533, "epoch": 2293} {"train_loss": -40.431678771972656, "global_step": 277534, "epoch": 2293} {"train_loss": -33.03120040893555, "global_step": 277535, "epoch": 2293} {"train_loss": -39.0390625, "global_step": 277536, "epoch": 2293} {"train_loss": -40.191162109375, "global_step": 277537, "epoch": 2293} {"train_loss": -40.55949783325195, "global_step": 277538, "epoch": 2293} {"train_loss": -38.74601364135742, "global_step": 277539, "epoch": 2293} {"train_loss": -39.49063491821289, "global_step": 277540, "epoch": 2293} {"train_loss": -37.03382110595703, "global_step": 277541, "epoch": 2293} {"train_loss": -35.13250732421875, "global_step": 277542, "epoch": 2293} {"train_loss": -36.67971420288086, "global_step": 277543, "epoch": 2293} {"train_loss": -37.73752975463867, "global_step": 277544, "epoch": 2293} {"train_loss": -37.008907318115234, "global_step": 277545, "epoch": 2293} {"train_loss": -32.65529251098633, "global_step": 277546, "epoch": 2293} {"train_loss": -37.899940490722656, "global_step": 277547, "epoch": 2293} {"train_loss": -39.59962844848633, "global_step": 277548, "epoch": 2293} {"train_loss": -39.981624603271484, "global_step": 277549, "epoch": 2293} {"train_loss": -39.75856018066406, "global_step": 277550, "epoch": 2293} {"train_loss": -40.09255599975586, "global_step": 277551, "epoch": 2293} {"train_loss": -35.89334487915039, "global_step": 277552, "epoch": 2293} {"train_loss": -36.004844665527344, "global_step": 277553, "epoch": 2293} {"train_loss": -37.37958908081055, "global_step": 277554, "epoch": 2293} {"train_loss": -39.38005447387695, "global_step": 277555, "epoch": 2293} {"train_loss": -38.392860412597656, "global_step": 277556, "epoch": 2293} {"train_loss": -39.95188903808594, "global_step": 277557, "epoch": 2293} {"train_loss": -39.79374313354492, "global_step": 277558, "epoch": 2293} {"train_loss": -40.32863998413086, "global_step": 277559, "epoch": 2293} {"train_loss": -37.03428268432617, "global_step": 277560, "epoch": 2293} {"train_loss": -40.060585021972656, "global_step": 277561, "epoch": 2293} {"train_loss": -39.35854721069336, "global_step": 277562, "epoch": 2293} {"train_loss": -40.46543884277344, "global_step": 277563, "epoch": 2293} {"train_loss": -40.05411911010742, "global_step": 277564, "epoch": 2293} {"train_loss": -38.896209716796875, "global_step": 277565, "epoch": 2293} {"train_loss": -40.56726837158203, "global_step": 277566, "epoch": 2293} {"train_loss": -40.144466400146484, "global_step": 277567, "epoch": 2293} {"train_loss": -40.75370788574219, "global_step": 277568, "epoch": 2293} {"train_loss": -40.3530158996582, "global_step": 277569, "epoch": 2293} {"train_loss": -40.76032638549805, "global_step": 277570, "epoch": 2293} {"train_loss": -39.445960998535156, "global_step": 277571, "epoch": 2293} {"train_loss": -40.3260498046875, "global_step": 277572, "epoch": 2293} {"train_loss": -40.79034023442544, "global_step": 277573, "epoch": 2293, "val_loss": 2513606.75} {"train_loss": -40.256256103515625, "global_step": 277574, "epoch": 2294} {"train_loss": -41.00116729736328, "global_step": 277575, "epoch": 2294} {"train_loss": -41.00751876831055, "global_step": 277576, "epoch": 2294} {"train_loss": -40.5716552734375, "global_step": 277577, "epoch": 2294} {"train_loss": -41.32637405395508, "global_step": 277578, "epoch": 2294} {"train_loss": -41.168975830078125, "global_step": 277579, "epoch": 2294} {"train_loss": -41.2214469909668, "global_step": 277580, "epoch": 2294} {"train_loss": -40.34714889526367, "global_step": 277581, "epoch": 2294} {"train_loss": -40.60090255737305, "global_step": 277582, "epoch": 2294} {"train_loss": -41.468509674072266, "global_step": 277583, "epoch": 2294} {"train_loss": -39.51427459716797, "global_step": 277584, "epoch": 2294} {"train_loss": -41.24952697753906, "global_step": 277585, "epoch": 2294} {"train_loss": -41.144187927246094, "global_step": 277586, "epoch": 2294} {"train_loss": -41.72151565551758, "global_step": 277587, "epoch": 2294} {"train_loss": -41.15953826904297, "global_step": 277588, "epoch": 2294} {"train_loss": -41.63970947265625, "global_step": 277589, "epoch": 2294} {"train_loss": -41.4007682800293, "global_step": 277590, "epoch": 2294} {"train_loss": -41.9586296081543, "global_step": 277591, "epoch": 2294} {"train_loss": -40.84347152709961, "global_step": 277592, "epoch": 2294} {"train_loss": -41.4099006652832, "global_step": 277593, "epoch": 2294} {"train_loss": -41.877197265625, "global_step": 277594, "epoch": 2294} {"train_loss": -42.638458251953125, "global_step": 277595, "epoch": 2294} {"train_loss": -42.49043273925781, "global_step": 277596, "epoch": 2294} {"train_loss": -42.28483200073242, "global_step": 277597, "epoch": 2294} {"train_loss": -41.79764938354492, "global_step": 277598, "epoch": 2294} {"train_loss": -41.81100082397461, "global_step": 277599, "epoch": 2294} {"train_loss": -42.571102142333984, "global_step": 277600, "epoch": 2294} {"train_loss": -42.503177642822266, "global_step": 277601, "epoch": 2294} {"train_loss": -42.45024490356445, "global_step": 277602, "epoch": 2294} {"train_loss": -41.451412200927734, "global_step": 277603, "epoch": 2294} {"train_loss": -42.64966583251953, "global_step": 277604, "epoch": 2294} {"train_loss": -41.866268157958984, "global_step": 277605, "epoch": 2294} {"train_loss": -42.33720779418945, "global_step": 277606, "epoch": 2294} {"train_loss": -42.4030876159668, "global_step": 277607, "epoch": 2294} {"train_loss": -42.312835693359375, "global_step": 277608, "epoch": 2294} {"train_loss": -42.54740524291992, "global_step": 277609, "epoch": 2294} {"train_loss": -42.112281799316406, "global_step": 277610, "epoch": 2294} {"train_loss": -42.52729797363281, "global_step": 277611, "epoch": 2294} {"train_loss": -42.038387298583984, "global_step": 277612, "epoch": 2294} {"train_loss": -42.437679290771484, "global_step": 277613, "epoch": 2294} {"train_loss": -42.218963623046875, "global_step": 277614, "epoch": 2294} {"train_loss": -42.821895599365234, "global_step": 277615, "epoch": 2294} {"train_loss": -43.06386184692383, "global_step": 277616, "epoch": 2294} {"train_loss": -41.58366012573242, "global_step": 277617, "epoch": 2294} {"train_loss": -42.720367431640625, "global_step": 277618, "epoch": 2294} {"train_loss": -42.84062576293945, "global_step": 277619, "epoch": 2294} {"train_loss": -42.18806838989258, "global_step": 277620, "epoch": 2294} {"train_loss": -42.984771728515625, "global_step": 277621, "epoch": 2294} {"train_loss": -42.59001159667969, "global_step": 277622, "epoch": 2294} {"train_loss": -41.82416534423828, "global_step": 277623, "epoch": 2294} {"train_loss": -42.16128158569336, "global_step": 277624, "epoch": 2294} {"train_loss": -42.739410400390625, "global_step": 277625, "epoch": 2294} {"train_loss": -41.85544204711914, "global_step": 277626, "epoch": 2294} {"train_loss": -42.916603088378906, "global_step": 277627, "epoch": 2294} {"train_loss": -43.186309814453125, "global_step": 277628, "epoch": 2294} {"train_loss": -42.91608810424805, "global_step": 277629, "epoch": 2294} {"train_loss": -42.707828521728516, "global_step": 277630, "epoch": 2294} {"train_loss": -42.94028854370117, "global_step": 277631, "epoch": 2294} {"train_loss": -43.25698471069336, "global_step": 277632, "epoch": 2294} {"train_loss": -42.997432708740234, "global_step": 277633, "epoch": 2294} {"train_loss": -43.258941650390625, "global_step": 277634, "epoch": 2294} {"train_loss": -42.67356491088867, "global_step": 277635, "epoch": 2294} {"train_loss": -42.68231964111328, "global_step": 277636, "epoch": 2294} {"train_loss": -43.22574996948242, "global_step": 277637, "epoch": 2294} {"train_loss": -42.82058334350586, "global_step": 277638, "epoch": 2294} {"train_loss": -42.9263916015625, "global_step": 277639, "epoch": 2294} {"train_loss": -42.8915901184082, "global_step": 277640, "epoch": 2294} {"train_loss": -41.90533447265625, "global_step": 277641, "epoch": 2294} {"train_loss": -43.255531311035156, "global_step": 277642, "epoch": 2294} {"train_loss": -42.3931770324707, "global_step": 277643, "epoch": 2294} {"train_loss": -43.00635528564453, "global_step": 277644, "epoch": 2294} {"train_loss": -42.9854736328125, "global_step": 277645, "epoch": 2294} {"train_loss": -43.09395980834961, "global_step": 277646, "epoch": 2294} {"train_loss": -43.55477523803711, "global_step": 277647, "epoch": 2294} {"train_loss": -43.16422653198242, "global_step": 277648, "epoch": 2294} {"train_loss": -43.41012191772461, "global_step": 277649, "epoch": 2294} {"train_loss": -43.11001205444336, "global_step": 277650, "epoch": 2294} {"train_loss": -43.2808952331543, "global_step": 277651, "epoch": 2294} {"train_loss": -43.09970474243164, "global_step": 277652, "epoch": 2294} {"train_loss": -42.58832550048828, "global_step": 277653, "epoch": 2294} {"train_loss": -42.481239318847656, "global_step": 277654, "epoch": 2294} {"train_loss": -43.90464401245117, "global_step": 277655, "epoch": 2294} {"train_loss": -42.9462776184082, "global_step": 277656, "epoch": 2294} {"train_loss": -38.67136764526367, "global_step": 277657, "epoch": 2294} {"train_loss": -37.1776237487793, "global_step": 277658, "epoch": 2294} {"train_loss": -40.84116744995117, "global_step": 277659, "epoch": 2294} {"train_loss": -39.22688674926758, "global_step": 277660, "epoch": 2294} {"train_loss": -42.022071838378906, "global_step": 277661, "epoch": 2294} {"train_loss": -41.29572677612305, "global_step": 277662, "epoch": 2294} {"train_loss": -42.25515365600586, "global_step": 277663, "epoch": 2294} {"train_loss": -41.043846130371094, "global_step": 277664, "epoch": 2294} {"train_loss": -41.310733795166016, "global_step": 277665, "epoch": 2294} {"train_loss": -42.36952590942383, "global_step": 277666, "epoch": 2294} {"train_loss": -36.457916259765625, "global_step": 277667, "epoch": 2294} {"train_loss": -41.0472526550293, "global_step": 277668, "epoch": 2294} {"train_loss": -40.5093994140625, "global_step": 277669, "epoch": 2294} {"train_loss": -40.2785530090332, "global_step": 277670, "epoch": 2294} {"train_loss": -42.044612884521484, "global_step": 277671, "epoch": 2294} {"train_loss": -39.17269515991211, "global_step": 277672, "epoch": 2294} {"train_loss": -40.434661865234375, "global_step": 277673, "epoch": 2294} {"train_loss": -40.58075714111328, "global_step": 277674, "epoch": 2294} {"train_loss": -39.546836853027344, "global_step": 277675, "epoch": 2294} {"train_loss": -38.89588928222656, "global_step": 277676, "epoch": 2294} {"train_loss": -39.514278411865234, "global_step": 277677, "epoch": 2294} {"train_loss": -36.99628829956055, "global_step": 277678, "epoch": 2294} {"train_loss": -39.06854248046875, "global_step": 277679, "epoch": 2294} {"train_loss": -39.650543212890625, "global_step": 277680, "epoch": 2294} {"train_loss": -38.39002990722656, "global_step": 277681, "epoch": 2294} {"train_loss": -38.82459259033203, "global_step": 277682, "epoch": 2294} {"train_loss": -40.86113357543945, "global_step": 277683, "epoch": 2294} {"train_loss": -39.59353256225586, "global_step": 277684, "epoch": 2294} {"train_loss": -37.90464401245117, "global_step": 277685, "epoch": 2294} {"train_loss": -39.237281799316406, "global_step": 277686, "epoch": 2294} {"train_loss": -39.363162994384766, "global_step": 277687, "epoch": 2294} {"train_loss": -38.202796936035156, "global_step": 277688, "epoch": 2294} {"train_loss": -40.81156921386719, "global_step": 277689, "epoch": 2294} {"train_loss": -39.51566696166992, "global_step": 277690, "epoch": 2294} {"train_loss": -40.039161682128906, "global_step": 277691, "epoch": 2294} {"train_loss": -38.31832504272461, "global_step": 277692, "epoch": 2294} {"train_loss": -40.88197708129883, "global_step": 277693, "epoch": 2294} {"train_loss": -41.49169502573565, "global_step": 277694, "epoch": 2294, "val_loss": 2407351.75} {"train_loss": -40.318267822265625, "global_step": 277695, "epoch": 2295} {"train_loss": -40.946205139160156, "global_step": 277696, "epoch": 2295} {"train_loss": -41.16496658325195, "global_step": 277697, "epoch": 2295} {"train_loss": -41.20957565307617, "global_step": 277698, "epoch": 2295} {"train_loss": -41.0588264465332, "global_step": 277699, "epoch": 2295} {"train_loss": -41.067928314208984, "global_step": 277700, "epoch": 2295} {"train_loss": -41.08090591430664, "global_step": 277701, "epoch": 2295} {"train_loss": -41.53023910522461, "global_step": 277702, "epoch": 2295} {"train_loss": -40.62113571166992, "global_step": 277703, "epoch": 2295} {"train_loss": -41.59455108642578, "global_step": 277704, "epoch": 2295} {"train_loss": -37.48270034790039, "global_step": 277705, "epoch": 2295} {"train_loss": -40.49604034423828, "global_step": 277706, "epoch": 2295} {"train_loss": -38.84292221069336, "global_step": 277707, "epoch": 2295} {"train_loss": -41.92649459838867, "global_step": 277708, "epoch": 2295} {"train_loss": -41.650840759277344, "global_step": 277709, "epoch": 2295} {"train_loss": -36.697235107421875, "global_step": 277710, "epoch": 2295} {"train_loss": -39.98906707763672, "global_step": 277711, "epoch": 2295} {"train_loss": -41.33124923706055, "global_step": 277712, "epoch": 2295} {"train_loss": -41.04893112182617, "global_step": 277713, "epoch": 2295} {"train_loss": -38.13854217529297, "global_step": 277714, "epoch": 2295} {"train_loss": -38.31133270263672, "global_step": 277715, "epoch": 2295} {"train_loss": -41.448917388916016, "global_step": 277716, "epoch": 2295} {"train_loss": -41.32241439819336, "global_step": 277717, "epoch": 2295} {"train_loss": -41.456565856933594, "global_step": 277718, "epoch": 2295} {"train_loss": -41.62682342529297, "global_step": 277719, "epoch": 2295} {"train_loss": -41.057373046875, "global_step": 277720, "epoch": 2295} {"train_loss": -42.20981979370117, "global_step": 277721, "epoch": 2295} {"train_loss": -41.58663558959961, "global_step": 277722, "epoch": 2295} {"train_loss": -41.70603561401367, "global_step": 277723, "epoch": 2295} {"train_loss": -41.69346237182617, "global_step": 277724, "epoch": 2295} {"train_loss": -41.04071044921875, "global_step": 277725, "epoch": 2295} {"train_loss": -41.58467483520508, "global_step": 277726, "epoch": 2295} {"train_loss": -42.139015197753906, "global_step": 277727, "epoch": 2295} {"train_loss": -41.4908561706543, "global_step": 277728, "epoch": 2295} {"train_loss": -41.587791442871094, "global_step": 277729, "epoch": 2295} {"train_loss": -41.46994400024414, "global_step": 277730, "epoch": 2295} {"train_loss": -41.94431686401367, "global_step": 277731, "epoch": 2295} {"train_loss": -41.667625427246094, "global_step": 277732, "epoch": 2295} {"train_loss": -40.46749496459961, "global_step": 277733, "epoch": 2295} {"train_loss": -41.827022552490234, "global_step": 277734, "epoch": 2295} {"train_loss": -40.87490463256836, "global_step": 277735, "epoch": 2295} {"train_loss": -41.61305618286133, "global_step": 277736, "epoch": 2295} {"train_loss": -42.324615478515625, "global_step": 277737, "epoch": 2295} {"train_loss": -41.76879119873047, "global_step": 277738, "epoch": 2295} {"train_loss": -41.70463180541992, "global_step": 277739, "epoch": 2295} {"train_loss": -41.816349029541016, "global_step": 277740, "epoch": 2295} {"train_loss": -42.127174377441406, "global_step": 277741, "epoch": 2295} {"train_loss": -42.20374298095703, "global_step": 277742, "epoch": 2295} {"train_loss": -41.9416389465332, "global_step": 277743, "epoch": 2295} {"train_loss": -42.255126953125, "global_step": 277744, "epoch": 2295} {"train_loss": -41.7239990234375, "global_step": 277745, "epoch": 2295} {"train_loss": -42.509971618652344, "global_step": 277746, "epoch": 2295} {"train_loss": -41.51601028442383, "global_step": 277747, "epoch": 2295} {"train_loss": -42.726375579833984, "global_step": 277748, "epoch": 2295} {"train_loss": -41.914344787597656, "global_step": 277749, "epoch": 2295} {"train_loss": -41.68233871459961, "global_step": 277750, "epoch": 2295} {"train_loss": -42.5007438659668, "global_step": 277751, "epoch": 2295} {"train_loss": -42.55952835083008, "global_step": 277752, "epoch": 2295} {"train_loss": -42.239158630371094, "global_step": 277753, "epoch": 2295} {"train_loss": -41.82353591918945, "global_step": 277754, "epoch": 2295} {"train_loss": -41.965980529785156, "global_step": 277755, "epoch": 2295} {"train_loss": -42.95087814331055, "global_step": 277756, "epoch": 2295} {"train_loss": -42.77247619628906, "global_step": 277757, "epoch": 2295} {"train_loss": -42.66044235229492, "global_step": 277758, "epoch": 2295} {"train_loss": -43.08333206176758, "global_step": 277759, "epoch": 2295} {"train_loss": -42.666927337646484, "global_step": 277760, "epoch": 2295} {"train_loss": -43.093963623046875, "global_step": 277761, "epoch": 2295} {"train_loss": -43.09648132324219, "global_step": 277762, "epoch": 2295} {"train_loss": -42.87153625488281, "global_step": 277763, "epoch": 2295} {"train_loss": -42.75054931640625, "global_step": 277764, "epoch": 2295} {"train_loss": -42.59994125366211, "global_step": 277765, "epoch": 2295} {"train_loss": -42.94089126586914, "global_step": 277766, "epoch": 2295} {"train_loss": -42.88469314575195, "global_step": 277767, "epoch": 2295} {"train_loss": -43.57128143310547, "global_step": 277768, "epoch": 2295} {"train_loss": -43.25667953491211, "global_step": 277769, "epoch": 2295} {"train_loss": -43.13106918334961, "global_step": 277770, "epoch": 2295} {"train_loss": -43.161537170410156, "global_step": 277771, "epoch": 2295} {"train_loss": -42.54975891113281, "global_step": 277772, "epoch": 2295} {"train_loss": -42.95612716674805, "global_step": 277773, "epoch": 2295} {"train_loss": -43.080291748046875, "global_step": 277774, "epoch": 2295} {"train_loss": -42.377777099609375, "global_step": 277775, "epoch": 2295} {"train_loss": -43.39691162109375, "global_step": 277776, "epoch": 2295} {"train_loss": -42.48628616333008, "global_step": 277777, "epoch": 2295} {"train_loss": -42.212677001953125, "global_step": 277778, "epoch": 2295} {"train_loss": -43.19312286376953, "global_step": 277779, "epoch": 2295} {"train_loss": -42.909786224365234, "global_step": 277780, "epoch": 2295} {"train_loss": -41.36208724975586, "global_step": 277781, "epoch": 2295} {"train_loss": -39.399574279785156, "global_step": 277782, "epoch": 2295} {"train_loss": -42.92008590698242, "global_step": 277783, "epoch": 2295} {"train_loss": -42.13568878173828, "global_step": 277784, "epoch": 2295} {"train_loss": -41.83620834350586, "global_step": 277785, "epoch": 2295} {"train_loss": -41.26432418823242, "global_step": 277786, "epoch": 2295} {"train_loss": -42.81221389770508, "global_step": 277787, "epoch": 2295} {"train_loss": -42.555599212646484, "global_step": 277788, "epoch": 2295} {"train_loss": -40.5842399597168, "global_step": 277789, "epoch": 2295} {"train_loss": -41.529598236083984, "global_step": 277790, "epoch": 2295} {"train_loss": -42.082252502441406, "global_step": 277791, "epoch": 2295} {"train_loss": -42.4691162109375, "global_step": 277792, "epoch": 2295} {"train_loss": -41.62406539916992, "global_step": 277793, "epoch": 2295} {"train_loss": -41.53025817871094, "global_step": 277794, "epoch": 2295} {"train_loss": -41.961910247802734, "global_step": 277795, "epoch": 2295} {"train_loss": -41.07218933105469, "global_step": 277796, "epoch": 2295} {"train_loss": -41.876434326171875, "global_step": 277797, "epoch": 2295} {"train_loss": -42.032958984375, "global_step": 277798, "epoch": 2295} {"train_loss": -41.95510482788086, "global_step": 277799, "epoch": 2295} {"train_loss": -41.626033782958984, "global_step": 277800, "epoch": 2295} {"train_loss": -41.35763931274414, "global_step": 277801, "epoch": 2295} {"train_loss": -41.955989837646484, "global_step": 277802, "epoch": 2295} {"train_loss": -41.148468017578125, "global_step": 277803, "epoch": 2295} {"train_loss": -41.98014450073242, "global_step": 277804, "epoch": 2295} {"train_loss": -41.54902267456055, "global_step": 277805, "epoch": 2295} {"train_loss": -42.15501022338867, "global_step": 277806, "epoch": 2295} {"train_loss": -41.96659469604492, "global_step": 277807, "epoch": 2295} {"train_loss": -42.72854995727539, "global_step": 277808, "epoch": 2295} {"train_loss": -42.22164535522461, "global_step": 277809, "epoch": 2295} {"train_loss": -42.47700881958008, "global_step": 277810, "epoch": 2295} {"train_loss": -40.89698791503906, "global_step": 277811, "epoch": 2295} {"train_loss": -42.891624450683594, "global_step": 277812, "epoch": 2295} {"train_loss": -42.8106689453125, "global_step": 277813, "epoch": 2295} {"train_loss": -42.27190399169922, "global_step": 277814, "epoch": 2295} {"train_loss": -41.78180445521331, "global_step": 277815, "epoch": 2295, "val_loss": 2450157.75} {"train_loss": -43.44403076171875, "global_step": 277816, "epoch": 2296} {"train_loss": -42.858612060546875, "global_step": 277817, "epoch": 2296} {"train_loss": -41.5687255859375, "global_step": 277818, "epoch": 2296} {"train_loss": -41.23773956298828, "global_step": 277819, "epoch": 2296} {"train_loss": -42.772789001464844, "global_step": 277820, "epoch": 2296} {"train_loss": -42.108333587646484, "global_step": 277821, "epoch": 2296} {"train_loss": -42.5343132019043, "global_step": 277822, "epoch": 2296} {"train_loss": -42.505950927734375, "global_step": 277823, "epoch": 2296} {"train_loss": -42.34077072143555, "global_step": 277824, "epoch": 2296} {"train_loss": -42.10075759887695, "global_step": 277825, "epoch": 2296} {"train_loss": -42.61609649658203, "global_step": 277826, "epoch": 2296} {"train_loss": -43.101226806640625, "global_step": 277827, "epoch": 2296} {"train_loss": -42.00715255737305, "global_step": 277828, "epoch": 2296} {"train_loss": -42.264400482177734, "global_step": 277829, "epoch": 2296} {"train_loss": -43.1152458190918, "global_step": 277830, "epoch": 2296} {"train_loss": -42.77408981323242, "global_step": 277831, "epoch": 2296} {"train_loss": -41.22926330566406, "global_step": 277832, "epoch": 2296} {"train_loss": -42.353790283203125, "global_step": 277833, "epoch": 2296} {"train_loss": -43.243282318115234, "global_step": 277834, "epoch": 2296} {"train_loss": -41.91240310668945, "global_step": 277835, "epoch": 2296} {"train_loss": -41.27350616455078, "global_step": 277836, "epoch": 2296} {"train_loss": -42.062713623046875, "global_step": 277837, "epoch": 2296} {"train_loss": -43.0130615234375, "global_step": 277838, "epoch": 2296} {"train_loss": -41.69510269165039, "global_step": 277839, "epoch": 2296} {"train_loss": -42.87060546875, "global_step": 277840, "epoch": 2296} {"train_loss": -42.44660186767578, "global_step": 277841, "epoch": 2296} {"train_loss": -42.4284782409668, "global_step": 277842, "epoch": 2296} {"train_loss": -41.85161209106445, "global_step": 277843, "epoch": 2296} {"train_loss": -42.64201354980469, "global_step": 277844, "epoch": 2296} {"train_loss": -43.24220657348633, "global_step": 277845, "epoch": 2296} {"train_loss": -42.74190139770508, "global_step": 277846, "epoch": 2296} {"train_loss": -42.512733459472656, "global_step": 277847, "epoch": 2296} {"train_loss": -42.16987228393555, "global_step": 277848, "epoch": 2296} {"train_loss": -41.54108810424805, "global_step": 277849, "epoch": 2296} {"train_loss": -42.54114532470703, "global_step": 277850, "epoch": 2296} {"train_loss": -42.25542449951172, "global_step": 277851, "epoch": 2296} {"train_loss": -43.02549743652344, "global_step": 277852, "epoch": 2296} {"train_loss": -42.618621826171875, "global_step": 277853, "epoch": 2296} {"train_loss": -42.76101303100586, "global_step": 277854, "epoch": 2296} {"train_loss": -43.2412223815918, "global_step": 277855, "epoch": 2296} {"train_loss": -42.46599578857422, "global_step": 277856, "epoch": 2296} {"train_loss": -42.96567916870117, "global_step": 277857, "epoch": 2296} {"train_loss": -42.83858871459961, "global_step": 277858, "epoch": 2296} {"train_loss": -42.98442077636719, "global_step": 277859, "epoch": 2296} {"train_loss": -43.072078704833984, "global_step": 277860, "epoch": 2296} {"train_loss": -42.787620544433594, "global_step": 277861, "epoch": 2296} {"train_loss": -41.641178131103516, "global_step": 277862, "epoch": 2296} {"train_loss": -42.3701286315918, "global_step": 277863, "epoch": 2296} {"train_loss": -43.05941390991211, "global_step": 277864, "epoch": 2296} {"train_loss": -42.234649658203125, "global_step": 277865, "epoch": 2296} {"train_loss": -41.69060134887695, "global_step": 277866, "epoch": 2296} {"train_loss": -41.589412689208984, "global_step": 277867, "epoch": 2296} {"train_loss": -39.95706558227539, "global_step": 277868, "epoch": 2296} {"train_loss": -42.03876876831055, "global_step": 277869, "epoch": 2296} {"train_loss": -42.2202262878418, "global_step": 277870, "epoch": 2296} {"train_loss": -41.51055908203125, "global_step": 277871, "epoch": 2296} {"train_loss": -41.63252258300781, "global_step": 277872, "epoch": 2296} {"train_loss": -41.7993049621582, "global_step": 277873, "epoch": 2296} {"train_loss": -43.46963119506836, "global_step": 277874, "epoch": 2296} {"train_loss": -41.08369445800781, "global_step": 277875, "epoch": 2296} {"train_loss": -39.92026901245117, "global_step": 277876, "epoch": 2296} {"train_loss": -39.85411834716797, "global_step": 277877, "epoch": 2296} {"train_loss": -39.35821533203125, "global_step": 277878, "epoch": 2296} {"train_loss": -40.655799865722656, "global_step": 277879, "epoch": 2296} {"train_loss": -40.88700485229492, "global_step": 277880, "epoch": 2296} {"train_loss": -40.49824142456055, "global_step": 277881, "epoch": 2296} {"train_loss": -41.34376907348633, "global_step": 277882, "epoch": 2296} {"train_loss": -41.649356842041016, "global_step": 277883, "epoch": 2296} {"train_loss": -38.52588653564453, "global_step": 277884, "epoch": 2296} {"train_loss": -41.62405014038086, "global_step": 277885, "epoch": 2296} {"train_loss": -42.50716018676758, "global_step": 277886, "epoch": 2296} {"train_loss": -39.08476638793945, "global_step": 277887, "epoch": 2296} {"train_loss": -41.66498947143555, "global_step": 277888, "epoch": 2296} {"train_loss": -42.1098747253418, "global_step": 277889, "epoch": 2296} {"train_loss": -42.062477111816406, "global_step": 277890, "epoch": 2296} {"train_loss": -42.09342575073242, "global_step": 277891, "epoch": 2296} {"train_loss": -40.458412170410156, "global_step": 277892, "epoch": 2296} {"train_loss": -41.67924118041992, "global_step": 277893, "epoch": 2296} {"train_loss": -41.39382553100586, "global_step": 277894, "epoch": 2296} {"train_loss": -37.8426628112793, "global_step": 277895, "epoch": 2296} {"train_loss": -41.27439498901367, "global_step": 277896, "epoch": 2296} {"train_loss": -41.63544845581055, "global_step": 277897, "epoch": 2296} {"train_loss": -32.3594970703125, "global_step": 277898, "epoch": 2296} {"train_loss": -39.725765228271484, "global_step": 277899, "epoch": 2296} {"train_loss": -39.23404312133789, "global_step": 277900, "epoch": 2296} {"train_loss": -19.0535945892334, "global_step": 277901, "epoch": 2296} {"train_loss": -27.30393409729004, "global_step": 277902, "epoch": 2296} {"train_loss": -39.331546783447266, "global_step": 277903, "epoch": 2296} {"train_loss": -37.84186935424805, "global_step": 277904, "epoch": 2296} {"train_loss": -39.58803176879883, "global_step": 277905, "epoch": 2296} {"train_loss": -35.80788803100586, "global_step": 277906, "epoch": 2296} {"train_loss": -33.385372161865234, "global_step": 277907, "epoch": 2296} {"train_loss": -25.09649085998535, "global_step": 277908, "epoch": 2296} {"train_loss": -26.709625244140625, "global_step": 277909, "epoch": 2296} {"train_loss": -35.044349670410156, "global_step": 277910, "epoch": 2296} {"train_loss": -35.78786849975586, "global_step": 277911, "epoch": 2296} {"train_loss": -32.000144958496094, "global_step": 277912, "epoch": 2296} {"train_loss": -34.30221176147461, "global_step": 277913, "epoch": 2296} {"train_loss": -33.64773178100586, "global_step": 277914, "epoch": 2296} {"train_loss": -37.039764404296875, "global_step": 277915, "epoch": 2296} {"train_loss": -34.65211486816406, "global_step": 277916, "epoch": 2296} {"train_loss": -36.0010871887207, "global_step": 277917, "epoch": 2296} {"train_loss": -36.037864685058594, "global_step": 277918, "epoch": 2296} {"train_loss": -33.70424270629883, "global_step": 277919, "epoch": 2296} {"train_loss": -37.25253677368164, "global_step": 277920, "epoch": 2296} {"train_loss": -34.70564651489258, "global_step": 277921, "epoch": 2296} {"train_loss": -37.142974853515625, "global_step": 277922, "epoch": 2296} {"train_loss": -35.177490234375, "global_step": 277923, "epoch": 2296} {"train_loss": -35.05710983276367, "global_step": 277924, "epoch": 2296} {"train_loss": -37.21674346923828, "global_step": 277925, "epoch": 2296} {"train_loss": -37.10149002075195, "global_step": 277926, "epoch": 2296} {"train_loss": -37.07151412963867, "global_step": 277927, "epoch": 2296} {"train_loss": -37.849029541015625, "global_step": 277928, "epoch": 2296} {"train_loss": -39.34147644042969, "global_step": 277929, "epoch": 2296} {"train_loss": -38.603511810302734, "global_step": 277930, "epoch": 2296} {"train_loss": -38.94526290893555, "global_step": 277931, "epoch": 2296} {"train_loss": -37.11959457397461, "global_step": 277932, "epoch": 2296} {"train_loss": -39.67664337158203, "global_step": 277933, "epoch": 2296} {"train_loss": -38.947628021240234, "global_step": 277934, "epoch": 2296} {"train_loss": -39.95777130126953, "global_step": 277935, "epoch": 2296} {"train_loss": -39.85282559040164, "global_step": 277936, "epoch": 2296, "val_loss": 2524066.25} {"train_loss": -38.570030212402344, "global_step": 277937, "epoch": 2297} {"train_loss": -39.57536697387695, "global_step": 277938, "epoch": 2297} {"train_loss": -39.91603469848633, "global_step": 277939, "epoch": 2297} {"train_loss": -38.7763786315918, "global_step": 277940, "epoch": 2297} {"train_loss": -39.80008316040039, "global_step": 277941, "epoch": 2297} {"train_loss": -37.29825973510742, "global_step": 277942, "epoch": 2297} {"train_loss": -39.005706787109375, "global_step": 277943, "epoch": 2297} {"train_loss": -39.10622787475586, "global_step": 277944, "epoch": 2297} {"train_loss": -39.75910949707031, "global_step": 277945, "epoch": 2297} {"train_loss": -39.9594841003418, "global_step": 277946, "epoch": 2297} {"train_loss": -40.2878532409668, "global_step": 277947, "epoch": 2297} {"train_loss": -38.453975677490234, "global_step": 277948, "epoch": 2297} {"train_loss": -40.10554504394531, "global_step": 277949, "epoch": 2297} {"train_loss": -40.518165588378906, "global_step": 277950, "epoch": 2297} {"train_loss": -40.45402908325195, "global_step": 277951, "epoch": 2297} {"train_loss": -39.08037185668945, "global_step": 277952, "epoch": 2297} {"train_loss": -40.798152923583984, "global_step": 277953, "epoch": 2297} {"train_loss": -40.668514251708984, "global_step": 277954, "epoch": 2297} {"train_loss": -40.461631774902344, "global_step": 277955, "epoch": 2297} {"train_loss": -40.454471588134766, "global_step": 277956, "epoch": 2297} {"train_loss": -40.724769592285156, "global_step": 277957, "epoch": 2297} {"train_loss": -40.2368278503418, "global_step": 277958, "epoch": 2297} {"train_loss": -40.450172424316406, "global_step": 277959, "epoch": 2297} {"train_loss": -40.64986038208008, "global_step": 277960, "epoch": 2297} {"train_loss": -41.390987396240234, "global_step": 277961, "epoch": 2297} {"train_loss": -40.738258361816406, "global_step": 277962, "epoch": 2297} {"train_loss": -40.8314094543457, "global_step": 277963, "epoch": 2297} {"train_loss": -40.764739990234375, "global_step": 277964, "epoch": 2297} {"train_loss": -39.98268508911133, "global_step": 277965, "epoch": 2297} {"train_loss": -40.9552001953125, "global_step": 277966, "epoch": 2297} {"train_loss": -40.72247314453125, "global_step": 277967, "epoch": 2297} {"train_loss": -41.58823776245117, "global_step": 277968, "epoch": 2297} {"train_loss": -39.815467834472656, "global_step": 277969, "epoch": 2297} {"train_loss": -40.530704498291016, "global_step": 277970, "epoch": 2297} {"train_loss": -41.05424118041992, "global_step": 277971, "epoch": 2297} {"train_loss": -40.74362564086914, "global_step": 277972, "epoch": 2297} {"train_loss": -41.2465934753418, "global_step": 277973, "epoch": 2297} {"train_loss": -41.72671127319336, "global_step": 277974, "epoch": 2297} {"train_loss": -41.03396224975586, "global_step": 277975, "epoch": 2297} {"train_loss": -41.20333480834961, "global_step": 277976, "epoch": 2297} {"train_loss": -40.57572937011719, "global_step": 277977, "epoch": 2297} {"train_loss": -41.55025100708008, "global_step": 277978, "epoch": 2297} {"train_loss": -41.91770935058594, "global_step": 277979, "epoch": 2297} {"train_loss": -41.16067123413086, "global_step": 277980, "epoch": 2297} {"train_loss": -41.67982864379883, "global_step": 277981, "epoch": 2297} {"train_loss": -41.111053466796875, "global_step": 277982, "epoch": 2297} {"train_loss": -41.58132553100586, "global_step": 277983, "epoch": 2297} {"train_loss": -41.46939468383789, "global_step": 277984, "epoch": 2297} {"train_loss": -40.30479431152344, "global_step": 277985, "epoch": 2297} {"train_loss": -41.43827438354492, "global_step": 277986, "epoch": 2297} {"train_loss": -41.871150970458984, "global_step": 277987, "epoch": 2297} {"train_loss": -41.05854415893555, "global_step": 277988, "epoch": 2297} {"train_loss": -42.28889465332031, "global_step": 277989, "epoch": 2297} {"train_loss": -41.96680450439453, "global_step": 277990, "epoch": 2297} {"train_loss": -40.67744064331055, "global_step": 277991, "epoch": 2297} {"train_loss": -41.213863372802734, "global_step": 277992, "epoch": 2297} {"train_loss": -41.816650390625, "global_step": 277993, "epoch": 2297} {"train_loss": -40.7325553894043, "global_step": 277994, "epoch": 2297} {"train_loss": -41.98383712768555, "global_step": 277995, "epoch": 2297} {"train_loss": -40.412837982177734, "global_step": 277996, "epoch": 2297} {"train_loss": -42.35568618774414, "global_step": 277997, "epoch": 2297} {"train_loss": -42.420448303222656, "global_step": 277998, "epoch": 2297} {"train_loss": -42.234554290771484, "global_step": 277999, "epoch": 2297} {"train_loss": -41.73585891723633, "global_step": 278000, "epoch": 2297} {"train_loss": -42.38151168823242, "global_step": 278001, "epoch": 2297} {"train_loss": -41.964317321777344, "global_step": 278002, "epoch": 2297} {"train_loss": -42.233760833740234, "global_step": 278003, "epoch": 2297} {"train_loss": -42.56794357299805, "global_step": 278004, "epoch": 2297} {"train_loss": -41.90499496459961, "global_step": 278005, "epoch": 2297} {"train_loss": -42.37925338745117, "global_step": 278006, "epoch": 2297} {"train_loss": -42.3780517578125, "global_step": 278007, "epoch": 2297} {"train_loss": -42.078369140625, "global_step": 278008, "epoch": 2297} {"train_loss": -42.44118881225586, "global_step": 278009, "epoch": 2297} {"train_loss": -42.4041862487793, "global_step": 278010, "epoch": 2297} {"train_loss": -41.635780334472656, "global_step": 278011, "epoch": 2297} {"train_loss": -42.508399963378906, "global_step": 278012, "epoch": 2297} {"train_loss": -42.23781967163086, "global_step": 278013, "epoch": 2297} {"train_loss": -42.395606994628906, "global_step": 278014, "epoch": 2297} {"train_loss": -42.500335693359375, "global_step": 278015, "epoch": 2297} {"train_loss": -42.40388107299805, "global_step": 278016, "epoch": 2297} {"train_loss": -42.40089797973633, "global_step": 278017, "epoch": 2297} {"train_loss": -42.53017044067383, "global_step": 278018, "epoch": 2297} {"train_loss": -42.338233947753906, "global_step": 278019, "epoch": 2297} {"train_loss": -42.38663101196289, "global_step": 278020, "epoch": 2297} {"train_loss": -42.630611419677734, "global_step": 278021, "epoch": 2297} {"train_loss": -42.95940017700195, "global_step": 278022, "epoch": 2297} {"train_loss": -42.80453872680664, "global_step": 278023, "epoch": 2297} {"train_loss": -42.09820556640625, "global_step": 278024, "epoch": 2297} {"train_loss": -43.05268478393555, "global_step": 278025, "epoch": 2297} {"train_loss": -42.362117767333984, "global_step": 278026, "epoch": 2297} {"train_loss": -42.79704666137695, "global_step": 278027, "epoch": 2297} {"train_loss": -42.956478118896484, "global_step": 278028, "epoch": 2297} {"train_loss": -42.857269287109375, "global_step": 278029, "epoch": 2297} {"train_loss": -42.834747314453125, "global_step": 278030, "epoch": 2297} {"train_loss": -42.30500030517578, "global_step": 278031, "epoch": 2297} {"train_loss": -42.54107666015625, "global_step": 278032, "epoch": 2297} {"train_loss": -43.04616165161133, "global_step": 278033, "epoch": 2297} {"train_loss": -43.05732727050781, "global_step": 278034, "epoch": 2297} {"train_loss": -42.965267181396484, "global_step": 278035, "epoch": 2297} {"train_loss": -43.1898307800293, "global_step": 278036, "epoch": 2297} {"train_loss": -42.57444381713867, "global_step": 278037, "epoch": 2297} {"train_loss": -42.3520622253418, "global_step": 278038, "epoch": 2297} {"train_loss": -43.002925872802734, "global_step": 278039, "epoch": 2297} {"train_loss": -42.86674880981445, "global_step": 278040, "epoch": 2297} {"train_loss": -43.38239669799805, "global_step": 278041, "epoch": 2297} {"train_loss": -42.85811996459961, "global_step": 278042, "epoch": 2297} {"train_loss": -42.60907745361328, "global_step": 278043, "epoch": 2297} {"train_loss": -43.067501068115234, "global_step": 278044, "epoch": 2297} {"train_loss": -42.00975036621094, "global_step": 278045, "epoch": 2297} {"train_loss": -43.1191520690918, "global_step": 278046, "epoch": 2297} {"train_loss": -42.88863754272461, "global_step": 278047, "epoch": 2297} {"train_loss": -42.78377914428711, "global_step": 278048, "epoch": 2297} {"train_loss": -43.135311126708984, "global_step": 278049, "epoch": 2297} {"train_loss": -43.5601806640625, "global_step": 278050, "epoch": 2297} {"train_loss": -43.358943939208984, "global_step": 278051, "epoch": 2297} {"train_loss": -43.18327713012695, "global_step": 278052, "epoch": 2297} {"train_loss": -43.17464828491211, "global_step": 278053, "epoch": 2297} {"train_loss": -43.04254913330078, "global_step": 278054, "epoch": 2297} {"train_loss": -43.226417541503906, "global_step": 278055, "epoch": 2297} {"train_loss": -43.1107292175293, "global_step": 278056, "epoch": 2297} {"train_loss": -41.632044106475576, "global_step": 278057, "epoch": 2297, "val_loss": 2472334.75} {"train_loss": -43.616634368896484, "global_step": 278058, "epoch": 2298} {"train_loss": -43.01121139526367, "global_step": 278059, "epoch": 2298} {"train_loss": -43.468666076660156, "global_step": 278060, "epoch": 2298} {"train_loss": -43.20515823364258, "global_step": 278061, "epoch": 2298} {"train_loss": -43.89011764526367, "global_step": 278062, "epoch": 2298} {"train_loss": -43.23341751098633, "global_step": 278063, "epoch": 2298} {"train_loss": -43.29200744628906, "global_step": 278064, "epoch": 2298} {"train_loss": -43.27637481689453, "global_step": 278065, "epoch": 2298} {"train_loss": -43.16686248779297, "global_step": 278066, "epoch": 2298} {"train_loss": -42.6765022277832, "global_step": 278067, "epoch": 2298} {"train_loss": -42.95899200439453, "global_step": 278068, "epoch": 2298} {"train_loss": -42.9074821472168, "global_step": 278069, "epoch": 2298} {"train_loss": -41.893829345703125, "global_step": 278070, "epoch": 2298} {"train_loss": -42.846099853515625, "global_step": 278071, "epoch": 2298} {"train_loss": -42.69236373901367, "global_step": 278072, "epoch": 2298} {"train_loss": -42.56103515625, "global_step": 278073, "epoch": 2298} {"train_loss": -41.650203704833984, "global_step": 278074, "epoch": 2298} {"train_loss": -41.133968353271484, "global_step": 278075, "epoch": 2298} {"train_loss": -41.04842758178711, "global_step": 278076, "epoch": 2298} {"train_loss": -40.2315788269043, "global_step": 278077, "epoch": 2298} {"train_loss": -37.486000061035156, "global_step": 278078, "epoch": 2298} {"train_loss": -35.07023239135742, "global_step": 278079, "epoch": 2298} {"train_loss": -38.10722351074219, "global_step": 278080, "epoch": 2298} {"train_loss": -42.292991638183594, "global_step": 278081, "epoch": 2298} {"train_loss": -41.42732238769531, "global_step": 278082, "epoch": 2298} {"train_loss": -37.24987030029297, "global_step": 278083, "epoch": 2298} {"train_loss": -34.22710037231445, "global_step": 278084, "epoch": 2298} {"train_loss": -42.26747512817383, "global_step": 278085, "epoch": 2298} {"train_loss": -37.246944427490234, "global_step": 278086, "epoch": 2298} {"train_loss": -36.757789611816406, "global_step": 278087, "epoch": 2298} {"train_loss": -39.016719818115234, "global_step": 278088, "epoch": 2298} {"train_loss": -37.46895980834961, "global_step": 278089, "epoch": 2298} {"train_loss": -37.301143646240234, "global_step": 278090, "epoch": 2298} {"train_loss": -41.75370407104492, "global_step": 278091, "epoch": 2298} {"train_loss": -37.14009475708008, "global_step": 278092, "epoch": 2298} {"train_loss": -38.89099884033203, "global_step": 278093, "epoch": 2298} {"train_loss": -38.6687126159668, "global_step": 278094, "epoch": 2298} {"train_loss": -37.36360549926758, "global_step": 278095, "epoch": 2298} {"train_loss": -39.238285064697266, "global_step": 278096, "epoch": 2298} {"train_loss": -39.85628128051758, "global_step": 278097, "epoch": 2298} {"train_loss": -39.66147994995117, "global_step": 278098, "epoch": 2298} {"train_loss": -40.05710983276367, "global_step": 278099, "epoch": 2298} {"train_loss": -41.599117279052734, "global_step": 278100, "epoch": 2298} {"train_loss": -40.17727279663086, "global_step": 278101, "epoch": 2298} {"train_loss": -41.211116790771484, "global_step": 278102, "epoch": 2298} {"train_loss": -40.88126754760742, "global_step": 278103, "epoch": 2298} {"train_loss": -41.305816650390625, "global_step": 278104, "epoch": 2298} {"train_loss": -40.49708557128906, "global_step": 278105, "epoch": 2298} {"train_loss": -41.051124572753906, "global_step": 278106, "epoch": 2298} {"train_loss": -40.660579681396484, "global_step": 278107, "epoch": 2298} {"train_loss": -41.39054489135742, "global_step": 278108, "epoch": 2298} {"train_loss": -41.68569564819336, "global_step": 278109, "epoch": 2298} {"train_loss": -40.71784210205078, "global_step": 278110, "epoch": 2298} {"train_loss": -41.28196334838867, "global_step": 278111, "epoch": 2298} {"train_loss": -41.55907440185547, "global_step": 278112, "epoch": 2298} {"train_loss": -40.272254943847656, "global_step": 278113, "epoch": 2298} {"train_loss": -42.001373291015625, "global_step": 278114, "epoch": 2298} {"train_loss": -40.724853515625, "global_step": 278115, "epoch": 2298} {"train_loss": -40.6722526550293, "global_step": 278116, "epoch": 2298} {"train_loss": -41.58858108520508, "global_step": 278117, "epoch": 2298} {"train_loss": -41.632667541503906, "global_step": 278118, "epoch": 2298} {"train_loss": -41.60018539428711, "global_step": 278119, "epoch": 2298} {"train_loss": -41.6955451965332, "global_step": 278120, "epoch": 2298} {"train_loss": -39.72946548461914, "global_step": 278121, "epoch": 2298} {"train_loss": -41.82174301147461, "global_step": 278122, "epoch": 2298} {"train_loss": -41.97328567504883, "global_step": 278123, "epoch": 2298} {"train_loss": -41.32301712036133, "global_step": 278124, "epoch": 2298} {"train_loss": -41.961273193359375, "global_step": 278125, "epoch": 2298} {"train_loss": -41.931270599365234, "global_step": 278126, "epoch": 2298} {"train_loss": -41.246192932128906, "global_step": 278127, "epoch": 2298} {"train_loss": -42.351585388183594, "global_step": 278128, "epoch": 2298} {"train_loss": -42.082393646240234, "global_step": 278129, "epoch": 2298} {"train_loss": -42.249385833740234, "global_step": 278130, "epoch": 2298} {"train_loss": -42.36381149291992, "global_step": 278131, "epoch": 2298} {"train_loss": -42.617374420166016, "global_step": 278132, "epoch": 2298} {"train_loss": -42.265804290771484, "global_step": 278133, "epoch": 2298} {"train_loss": -42.676025390625, "global_step": 278134, "epoch": 2298} {"train_loss": -42.48820877075195, "global_step": 278135, "epoch": 2298} {"train_loss": -42.59829330444336, "global_step": 278136, "epoch": 2298} {"train_loss": -42.113685607910156, "global_step": 278137, "epoch": 2298} {"train_loss": -43.160762786865234, "global_step": 278138, "epoch": 2298} {"train_loss": -42.548152923583984, "global_step": 278139, "epoch": 2298} {"train_loss": -42.70453643798828, "global_step": 278140, "epoch": 2298} {"train_loss": -41.608116149902344, "global_step": 278141, "epoch": 2298} {"train_loss": -42.052589416503906, "global_step": 278142, "epoch": 2298} {"train_loss": -42.555843353271484, "global_step": 278143, "epoch": 2298} {"train_loss": -42.56911849975586, "global_step": 278144, "epoch": 2298} {"train_loss": -43.057796478271484, "global_step": 278145, "epoch": 2298} {"train_loss": -42.362159729003906, "global_step": 278146, "epoch": 2298} {"train_loss": -42.84648132324219, "global_step": 278147, "epoch": 2298} {"train_loss": -42.817626953125, "global_step": 278148, "epoch": 2298} {"train_loss": -42.431575775146484, "global_step": 278149, "epoch": 2298} {"train_loss": -43.22801208496094, "global_step": 278150, "epoch": 2298} {"train_loss": -42.89263916015625, "global_step": 278151, "epoch": 2298} {"train_loss": -42.787410736083984, "global_step": 278152, "epoch": 2298} {"train_loss": -42.86306381225586, "global_step": 278153, "epoch": 2298} {"train_loss": -43.15036392211914, "global_step": 278154, "epoch": 2298} {"train_loss": -43.25368881225586, "global_step": 278155, "epoch": 2298} {"train_loss": -43.1536750793457, "global_step": 278156, "epoch": 2298} {"train_loss": -43.01935577392578, "global_step": 278157, "epoch": 2298} {"train_loss": -42.96083450317383, "global_step": 278158, "epoch": 2298} {"train_loss": -43.2327995300293, "global_step": 278159, "epoch": 2298} {"train_loss": -42.98116683959961, "global_step": 278160, "epoch": 2298} {"train_loss": -43.49274826049805, "global_step": 278161, "epoch": 2298} {"train_loss": -42.910213470458984, "global_step": 278162, "epoch": 2298} {"train_loss": -43.18582534790039, "global_step": 278163, "epoch": 2298} {"train_loss": -43.18928909301758, "global_step": 278164, "epoch": 2298} {"train_loss": -43.09811019897461, "global_step": 278165, "epoch": 2298} {"train_loss": -43.335052490234375, "global_step": 278166, "epoch": 2298} {"train_loss": -43.47349166870117, "global_step": 278167, "epoch": 2298} {"train_loss": -42.425010681152344, "global_step": 278168, "epoch": 2298} {"train_loss": -43.00748825073242, "global_step": 278169, "epoch": 2298} {"train_loss": -42.9283447265625, "global_step": 278170, "epoch": 2298} {"train_loss": -43.50862503051758, "global_step": 278171, "epoch": 2298} {"train_loss": -42.9646110534668, "global_step": 278172, "epoch": 2298} {"train_loss": -42.563228607177734, "global_step": 278173, "epoch": 2298} {"train_loss": -42.875633239746094, "global_step": 278174, "epoch": 2298} {"train_loss": -42.84077835083008, "global_step": 278175, "epoch": 2298} {"train_loss": -42.74185562133789, "global_step": 278176, "epoch": 2298} {"train_loss": -43.552974700927734, "global_step": 278177, "epoch": 2298} {"train_loss": -41.64008432183384, "global_step": 278178, "epoch": 2298, "val_loss": 2471545.25} {"train_loss": -43.522186279296875, "global_step": 278179, "epoch": 2299} {"train_loss": -43.08350372314453, "global_step": 278180, "epoch": 2299} {"train_loss": -43.256282806396484, "global_step": 278181, "epoch": 2299} {"train_loss": -42.95309066772461, "global_step": 278182, "epoch": 2299} {"train_loss": -43.454307556152344, "global_step": 278183, "epoch": 2299} {"train_loss": -43.006038665771484, "global_step": 278184, "epoch": 2299} {"train_loss": -43.33855056762695, "global_step": 278185, "epoch": 2299} {"train_loss": -42.922603607177734, "global_step": 278186, "epoch": 2299} {"train_loss": -43.622962951660156, "global_step": 278187, "epoch": 2299} {"train_loss": -43.49163818359375, "global_step": 278188, "epoch": 2299} {"train_loss": -43.35601806640625, "global_step": 278189, "epoch": 2299} {"train_loss": -43.32221984863281, "global_step": 278190, "epoch": 2299} {"train_loss": -42.90554428100586, "global_step": 278191, "epoch": 2299} {"train_loss": -41.38179397583008, "global_step": 278192, "epoch": 2299} {"train_loss": -41.92628479003906, "global_step": 278193, "epoch": 2299} {"train_loss": -40.93362045288086, "global_step": 278194, "epoch": 2299} {"train_loss": -41.151039123535156, "global_step": 278195, "epoch": 2299} {"train_loss": -42.1237907409668, "global_step": 278196, "epoch": 2299} {"train_loss": -42.91004180908203, "global_step": 278197, "epoch": 2299} {"train_loss": -42.94402313232422, "global_step": 278198, "epoch": 2299} {"train_loss": -42.1793098449707, "global_step": 278199, "epoch": 2299} {"train_loss": -37.34048080444336, "global_step": 278200, "epoch": 2299} {"train_loss": -32.8318977355957, "global_step": 278201, "epoch": 2299} {"train_loss": -33.6428337097168, "global_step": 278202, "epoch": 2299} {"train_loss": -38.8580436706543, "global_step": 278203, "epoch": 2299} {"train_loss": -42.41131591796875, "global_step": 278204, "epoch": 2299} {"train_loss": -41.71940231323242, "global_step": 278205, "epoch": 2299} {"train_loss": -41.624210357666016, "global_step": 278206, "epoch": 2299} {"train_loss": -42.10523223876953, "global_step": 278207, "epoch": 2299} {"train_loss": -42.27572250366211, "global_step": 278208, "epoch": 2299} {"train_loss": -42.25856399536133, "global_step": 278209, "epoch": 2299} {"train_loss": -41.6976432800293, "global_step": 278210, "epoch": 2299} {"train_loss": -41.23828125, "global_step": 278211, "epoch": 2299} {"train_loss": -41.926631927490234, "global_step": 278212, "epoch": 2299} {"train_loss": -41.24343490600586, "global_step": 278213, "epoch": 2299} {"train_loss": -42.482337951660156, "global_step": 278214, "epoch": 2299} {"train_loss": -42.55812454223633, "global_step": 278215, "epoch": 2299} {"train_loss": -41.34806442260742, "global_step": 278216, "epoch": 2299} {"train_loss": -42.46561050415039, "global_step": 278217, "epoch": 2299} {"train_loss": -42.38723373413086, "global_step": 278218, "epoch": 2299} {"train_loss": -42.228572845458984, "global_step": 278219, "epoch": 2299} {"train_loss": -42.32987594604492, "global_step": 278220, "epoch": 2299} {"train_loss": -42.3475456237793, "global_step": 278221, "epoch": 2299} {"train_loss": -41.94086837768555, "global_step": 278222, "epoch": 2299} {"train_loss": -43.10474395751953, "global_step": 278223, "epoch": 2299} {"train_loss": -42.16575241088867, "global_step": 278224, "epoch": 2299} {"train_loss": -42.11814498901367, "global_step": 278225, "epoch": 2299} {"train_loss": -42.76255416870117, "global_step": 278226, "epoch": 2299} {"train_loss": -42.59430694580078, "global_step": 278227, "epoch": 2299} {"train_loss": -42.8508415222168, "global_step": 278228, "epoch": 2299} {"train_loss": -41.61323165893555, "global_step": 278229, "epoch": 2299} {"train_loss": -42.12296676635742, "global_step": 278230, "epoch": 2299} {"train_loss": -42.783607482910156, "global_step": 278231, "epoch": 2299} {"train_loss": -42.846736907958984, "global_step": 278232, "epoch": 2299} {"train_loss": -43.17286682128906, "global_step": 278233, "epoch": 2299} {"train_loss": -43.485225677490234, "global_step": 278234, "epoch": 2299} {"train_loss": -43.402740478515625, "global_step": 278235, "epoch": 2299} {"train_loss": -43.169918060302734, "global_step": 278236, "epoch": 2299} {"train_loss": -43.45090866088867, "global_step": 278237, "epoch": 2299} {"train_loss": -43.48145294189453, "global_step": 278238, "epoch": 2299} {"train_loss": -43.044647216796875, "global_step": 278239, "epoch": 2299} {"train_loss": -42.98417282104492, "global_step": 278240, "epoch": 2299} {"train_loss": -43.09782791137695, "global_step": 278241, "epoch": 2299} {"train_loss": -43.13847732543945, "global_step": 278242, "epoch": 2299} {"train_loss": -43.21934509277344, "global_step": 278243, "epoch": 2299} {"train_loss": -43.0310173034668, "global_step": 278244, "epoch": 2299} {"train_loss": -43.527801513671875, "global_step": 278245, "epoch": 2299} {"train_loss": -43.13494873046875, "global_step": 278246, "epoch": 2299} {"train_loss": -43.264686584472656, "global_step": 278247, "epoch": 2299} {"train_loss": -43.54848861694336, "global_step": 278248, "epoch": 2299} {"train_loss": -43.7749137878418, "global_step": 278249, "epoch": 2299} {"train_loss": -43.14253234863281, "global_step": 278250, "epoch": 2299} {"train_loss": -43.49387741088867, "global_step": 278251, "epoch": 2299} {"train_loss": -43.175209045410156, "global_step": 278252, "epoch": 2299} {"train_loss": -43.26129913330078, "global_step": 278253, "epoch": 2299} {"train_loss": -43.36084747314453, "global_step": 278254, "epoch": 2299} {"train_loss": -43.60871887207031, "global_step": 278255, "epoch": 2299} {"train_loss": -43.45800018310547, "global_step": 278256, "epoch": 2299} {"train_loss": -42.849422454833984, "global_step": 278257, "epoch": 2299} {"train_loss": -42.93465042114258, "global_step": 278258, "epoch": 2299} {"train_loss": -43.45637512207031, "global_step": 278259, "epoch": 2299} {"train_loss": -43.54807662963867, "global_step": 278260, "epoch": 2299} {"train_loss": -43.96186447143555, "global_step": 278261, "epoch": 2299} {"train_loss": -43.8355712890625, "global_step": 278262, "epoch": 2299} {"train_loss": -43.65319061279297, "global_step": 278263, "epoch": 2299} {"train_loss": -43.50348663330078, "global_step": 278264, "epoch": 2299} {"train_loss": -43.69321823120117, "global_step": 278265, "epoch": 2299} {"train_loss": -42.569541931152344, "global_step": 278266, "epoch": 2299} {"train_loss": -43.17058563232422, "global_step": 278267, "epoch": 2299} {"train_loss": -43.0809211730957, "global_step": 278268, "epoch": 2299} {"train_loss": -43.68839645385742, "global_step": 278269, "epoch": 2299} {"train_loss": -43.25936508178711, "global_step": 278270, "epoch": 2299} {"train_loss": -43.16652297973633, "global_step": 278271, "epoch": 2299} {"train_loss": -43.35801315307617, "global_step": 278272, "epoch": 2299} {"train_loss": -43.513648986816406, "global_step": 278273, "epoch": 2299} {"train_loss": -43.10710525512695, "global_step": 278274, "epoch": 2299} {"train_loss": -43.372554779052734, "global_step": 278275, "epoch": 2299} {"train_loss": -42.66170883178711, "global_step": 278276, "epoch": 2299} {"train_loss": -43.157283782958984, "global_step": 278277, "epoch": 2299} {"train_loss": -42.40412521362305, "global_step": 278278, "epoch": 2299} {"train_loss": -40.78715133666992, "global_step": 278279, "epoch": 2299} {"train_loss": -40.04133224487305, "global_step": 278280, "epoch": 2299} {"train_loss": -39.82106399536133, "global_step": 278281, "epoch": 2299} {"train_loss": -42.27511215209961, "global_step": 278282, "epoch": 2299} {"train_loss": -41.82418441772461, "global_step": 278283, "epoch": 2299} {"train_loss": -39.99711990356445, "global_step": 278284, "epoch": 2299} {"train_loss": -39.4602165222168, "global_step": 278285, "epoch": 2299} {"train_loss": -41.149837493896484, "global_step": 278286, "epoch": 2299} {"train_loss": -40.90591812133789, "global_step": 278287, "epoch": 2299} {"train_loss": -37.8725700378418, "global_step": 278288, "epoch": 2299} {"train_loss": -34.33487319946289, "global_step": 278289, "epoch": 2299} {"train_loss": -36.918548583984375, "global_step": 278290, "epoch": 2299} {"train_loss": -39.78996276855469, "global_step": 278291, "epoch": 2299} {"train_loss": -39.62078857421875, "global_step": 278292, "epoch": 2299} {"train_loss": -37.997596740722656, "global_step": 278293, "epoch": 2299} {"train_loss": -40.587928771972656, "global_step": 278294, "epoch": 2299} {"train_loss": -39.36240768432617, "global_step": 278295, "epoch": 2299} {"train_loss": -38.80546951293945, "global_step": 278296, "epoch": 2299} {"train_loss": -41.77425003051758, "global_step": 278297, "epoch": 2299} {"train_loss": -38.95354080200195, "global_step": 278298, "epoch": 2299} {"train_loss": -42.06189299023841, "global_step": 278299, "epoch": 2299, "val_loss": 2467777.25} {"train_loss": -40.07511520385742, "global_step": 278300, "epoch": 2300} {"train_loss": -41.8157958984375, "global_step": 278301, "epoch": 2300} {"train_loss": -40.418243408203125, "global_step": 278302, "epoch": 2300} {"train_loss": -41.30718231201172, "global_step": 278303, "epoch": 2300} {"train_loss": -41.5187873840332, "global_step": 278304, "epoch": 2300} {"train_loss": -41.205101013183594, "global_step": 278305, "epoch": 2300} {"train_loss": -41.56489944458008, "global_step": 278306, "epoch": 2300} {"train_loss": -41.05011749267578, "global_step": 278307, "epoch": 2300} {"train_loss": -39.97802734375, "global_step": 278308, "epoch": 2300} {"train_loss": -41.04282760620117, "global_step": 278309, "epoch": 2300} {"train_loss": -41.90177536010742, "global_step": 278310, "epoch": 2300} {"train_loss": -41.37553024291992, "global_step": 278311, "epoch": 2300} {"train_loss": -41.136146545410156, "global_step": 278312, "epoch": 2300} {"train_loss": -41.0089225769043, "global_step": 278313, "epoch": 2300} {"train_loss": -41.98886489868164, "global_step": 278314, "epoch": 2300} {"train_loss": -42.175899505615234, "global_step": 278315, "epoch": 2300} {"train_loss": -42.07415008544922, "global_step": 278316, "epoch": 2300} {"train_loss": -41.56627655029297, "global_step": 278317, "epoch": 2300} {"train_loss": -42.61304473876953, "global_step": 278318, "epoch": 2300} {"train_loss": -41.9858283996582, "global_step": 278319, "epoch": 2300} {"train_loss": -43.08823776245117, "global_step": 278320, "epoch": 2300} {"train_loss": -42.06026840209961, "global_step": 278321, "epoch": 2300} {"train_loss": -43.21794128417969, "global_step": 278322, "epoch": 2300} {"train_loss": -42.561702728271484, "global_step": 278323, "epoch": 2300} {"train_loss": -42.69147491455078, "global_step": 278324, "epoch": 2300} {"train_loss": -42.66475296020508, "global_step": 278325, "epoch": 2300} {"train_loss": -42.95188903808594, "global_step": 278326, "epoch": 2300} {"train_loss": -43.149539947509766, "global_step": 278327, "epoch": 2300} {"train_loss": -42.57269287109375, "global_step": 278328, "epoch": 2300} {"train_loss": -43.119384765625, "global_step": 278329, "epoch": 2300} {"train_loss": -42.69358825683594, "global_step": 278330, "epoch": 2300} {"train_loss": -42.20396423339844, "global_step": 278331, "epoch": 2300} {"train_loss": -43.26669692993164, "global_step": 278332, "epoch": 2300} {"train_loss": -43.08842086791992, "global_step": 278333, "epoch": 2300} {"train_loss": -43.21564483642578, "global_step": 278334, "epoch": 2300} {"train_loss": -42.79478454589844, "global_step": 278335, "epoch": 2300} {"train_loss": -43.237239837646484, "global_step": 278336, "epoch": 2300} {"train_loss": -43.16851806640625, "global_step": 278337, "epoch": 2300} {"train_loss": -43.217628479003906, "global_step": 278338, "epoch": 2300} {"train_loss": -43.17469787597656, "global_step": 278339, "epoch": 2300} {"train_loss": -43.27895736694336, "global_step": 278340, "epoch": 2300} {"train_loss": -43.47274398803711, "global_step": 278341, "epoch": 2300} {"train_loss": -43.48415756225586, "global_step": 278342, "epoch": 2300} {"train_loss": -43.146148681640625, "global_step": 278343, "epoch": 2300} {"train_loss": -43.313411712646484, "global_step": 278344, "epoch": 2300} {"train_loss": -42.40316390991211, "global_step": 278345, "epoch": 2300} {"train_loss": -43.46416473388672, "global_step": 278346, "epoch": 2300} {"train_loss": -43.40549850463867, "global_step": 278347, "epoch": 2300} {"train_loss": -42.8812255859375, "global_step": 278348, "epoch": 2300} {"train_loss": -43.67243576049805, "global_step": 278349, "epoch": 2300} {"train_loss": -43.75652313232422, "global_step": 278350, "epoch": 2300} {"train_loss": -43.63741683959961, "global_step": 278351, "epoch": 2300} {"train_loss": -43.88027572631836, "global_step": 278352, "epoch": 2300} {"train_loss": -43.44353103637695, "global_step": 278353, "epoch": 2300} {"train_loss": -42.99794387817383, "global_step": 278354, "epoch": 2300} {"train_loss": -43.547115325927734, "global_step": 278355, "epoch": 2300} {"train_loss": -42.4581413269043, "global_step": 278356, "epoch": 2300} {"train_loss": -43.30238723754883, "global_step": 278357, "epoch": 2300} {"train_loss": -43.872406005859375, "global_step": 278358, "epoch": 2300} {"train_loss": -43.40314483642578, "global_step": 278359, "epoch": 2300} {"train_loss": -43.152347564697266, "global_step": 278360, "epoch": 2300} {"train_loss": -43.06722640991211, "global_step": 278361, "epoch": 2300} {"train_loss": -43.531795501708984, "global_step": 278362, "epoch": 2300} {"train_loss": -42.0687370300293, "global_step": 278363, "epoch": 2300} {"train_loss": -43.31869125366211, "global_step": 278364, "epoch": 2300} {"train_loss": -44.305660247802734, "global_step": 278365, "epoch": 2300} {"train_loss": -43.469886779785156, "global_step": 278366, "epoch": 2300} {"train_loss": -40.150516510009766, "global_step": 278367, "epoch": 2300} {"train_loss": -42.587162017822266, "global_step": 278368, "epoch": 2300} {"train_loss": -43.384761810302734, "global_step": 278369, "epoch": 2300} {"train_loss": -41.726009368896484, "global_step": 278370, "epoch": 2300} {"train_loss": -42.853004455566406, "global_step": 278371, "epoch": 2300} {"train_loss": -42.89472961425781, "global_step": 278372, "epoch": 2300} {"train_loss": -42.77682113647461, "global_step": 278373, "epoch": 2300} {"train_loss": -42.549312591552734, "global_step": 278374, "epoch": 2300} {"train_loss": -42.751338958740234, "global_step": 278375, "epoch": 2300} {"train_loss": -42.53235626220703, "global_step": 278376, "epoch": 2300} {"train_loss": -43.18940353393555, "global_step": 278377, "epoch": 2300} {"train_loss": -42.488372802734375, "global_step": 278378, "epoch": 2300} {"train_loss": -42.3354606628418, "global_step": 278379, "epoch": 2300} {"train_loss": -41.82322311401367, "global_step": 278380, "epoch": 2300} {"train_loss": -41.87055206298828, "global_step": 278381, "epoch": 2300} {"train_loss": -42.084259033203125, "global_step": 278382, "epoch": 2300} {"train_loss": -39.16577911376953, "global_step": 278383, "epoch": 2300} {"train_loss": -41.62786865234375, "global_step": 278384, "epoch": 2300} {"train_loss": -36.21467590332031, "global_step": 278385, "epoch": 2300} {"train_loss": -42.57450485229492, "global_step": 278386, "epoch": 2300} {"train_loss": -41.38591384887695, "global_step": 278387, "epoch": 2300} {"train_loss": -42.16669845581055, "global_step": 278388, "epoch": 2300} {"train_loss": -42.05266571044922, "global_step": 278389, "epoch": 2300} {"train_loss": -42.103919982910156, "global_step": 278390, "epoch": 2300} {"train_loss": -41.26669692993164, "global_step": 278391, "epoch": 2300} {"train_loss": -41.296993255615234, "global_step": 278392, "epoch": 2300} {"train_loss": -42.90914535522461, "global_step": 278393, "epoch": 2300} {"train_loss": -38.164730072021484, "global_step": 278394, "epoch": 2300} {"train_loss": -38.78488540649414, "global_step": 278395, "epoch": 2300} {"train_loss": -42.67885971069336, "global_step": 278396, "epoch": 2300} {"train_loss": -41.68255615234375, "global_step": 278397, "epoch": 2300} {"train_loss": -41.59365463256836, "global_step": 278398, "epoch": 2300} {"train_loss": -41.74424743652344, "global_step": 278399, "epoch": 2300} {"train_loss": -39.93229293823242, "global_step": 278400, "epoch": 2300} {"train_loss": -42.30890655517578, "global_step": 278401, "epoch": 2300} {"train_loss": -42.37323760986328, "global_step": 278402, "epoch": 2300} {"train_loss": -40.710906982421875, "global_step": 278403, "epoch": 2300} {"train_loss": -40.95486068725586, "global_step": 278404, "epoch": 2300} {"train_loss": -39.23865509033203, "global_step": 278405, "epoch": 2300} {"train_loss": -40.582027435302734, "global_step": 278406, "epoch": 2300} {"train_loss": -41.817073822021484, "global_step": 278407, "epoch": 2300} {"train_loss": -40.93238067626953, "global_step": 278408, "epoch": 2300} {"train_loss": -41.0233154296875, "global_step": 278409, "epoch": 2300} {"train_loss": -41.64252853393555, "global_step": 278410, "epoch": 2300} {"train_loss": -41.70339584350586, "global_step": 278411, "epoch": 2300} {"train_loss": -40.43764877319336, "global_step": 278412, "epoch": 2300} {"train_loss": -40.22612762451172, "global_step": 278413, "epoch": 2300} {"train_loss": -32.5576057434082, "global_step": 278414, "epoch": 2300} {"train_loss": -40.276023864746094, "global_step": 278415, "epoch": 2300} {"train_loss": -39.6017951965332, "global_step": 278416, "epoch": 2300} {"train_loss": -39.447086334228516, "global_step": 278417, "epoch": 2300} {"train_loss": -41.854766845703125, "global_step": 278418, "epoch": 2300} {"train_loss": -39.72027587890625, "global_step": 278419, "epoch": 2300} {"train_loss": -41.97801779124362, "global_step": 278420, "epoch": 2300, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 0.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 2449942.75} {"train_loss": -37.457733154296875, "global_step": 278421, "epoch": 2301} {"train_loss": -41.61952590942383, "global_step": 278422, "epoch": 2301} {"train_loss": -37.995506286621094, "global_step": 278423, "epoch": 2301} {"train_loss": -38.90170669555664, "global_step": 278424, "epoch": 2301} {"train_loss": -40.58859634399414, "global_step": 278425, "epoch": 2301} {"train_loss": -37.230743408203125, "global_step": 278426, "epoch": 2301} {"train_loss": -39.51885223388672, "global_step": 278427, "epoch": 2301} {"train_loss": -39.840232849121094, "global_step": 278428, "epoch": 2301} {"train_loss": -39.84537887573242, "global_step": 278429, "epoch": 2301} {"train_loss": -41.50923156738281, "global_step": 278430, "epoch": 2301} {"train_loss": -41.89008712768555, "global_step": 278431, "epoch": 2301} {"train_loss": -41.20722198486328, "global_step": 278432, "epoch": 2301} {"train_loss": -40.3661003112793, "global_step": 278433, "epoch": 2301} {"train_loss": -40.93342971801758, "global_step": 278434, "epoch": 2301} {"train_loss": -41.70504379272461, "global_step": 278435, "epoch": 2301} {"train_loss": -41.2500114440918, "global_step": 278436, "epoch": 2301} {"train_loss": -37.5864372253418, "global_step": 278437, "epoch": 2301} {"train_loss": -41.81126403808594, "global_step": 278438, "epoch": 2301} {"train_loss": -41.1475830078125, "global_step": 278439, "epoch": 2301} {"train_loss": -41.82487106323242, "global_step": 278440, "epoch": 2301} {"train_loss": -41.4113883972168, "global_step": 278441, "epoch": 2301} {"train_loss": -36.848365783691406, "global_step": 278442, "epoch": 2301} {"train_loss": -40.42375564575195, "global_step": 278443, "epoch": 2301} {"train_loss": -40.773311614990234, "global_step": 278444, "epoch": 2301} {"train_loss": -40.09702682495117, "global_step": 278445, "epoch": 2301} {"train_loss": -41.563743591308594, "global_step": 278446, "epoch": 2301} {"train_loss": -39.53593444824219, "global_step": 278447, "epoch": 2301} {"train_loss": -40.233558654785156, "global_step": 278448, "epoch": 2301} {"train_loss": -39.8853874206543, "global_step": 278449, "epoch": 2301} {"train_loss": -39.62942886352539, "global_step": 278450, "epoch": 2301} {"train_loss": -41.44852828979492, "global_step": 278451, "epoch": 2301} {"train_loss": -39.316078186035156, "global_step": 278452, "epoch": 2301} {"train_loss": -41.67450714111328, "global_step": 278453, "epoch": 2301} {"train_loss": -41.272483825683594, "global_step": 278454, "epoch": 2301} {"train_loss": -40.6173210144043, "global_step": 278455, "epoch": 2301} {"train_loss": -42.14638137817383, "global_step": 278456, "epoch": 2301} {"train_loss": -40.76738357543945, "global_step": 278457, "epoch": 2301} {"train_loss": -38.14723205566406, "global_step": 278458, "epoch": 2301} {"train_loss": -39.99189758300781, "global_step": 278459, "epoch": 2301} {"train_loss": -40.6848030090332, "global_step": 278460, "epoch": 2301} {"train_loss": -40.922607421875, "global_step": 278461, "epoch": 2301} {"train_loss": -42.064117431640625, "global_step": 278462, "epoch": 2301} {"train_loss": -39.47003173828125, "global_step": 278463, "epoch": 2301} {"train_loss": -42.2976188659668, "global_step": 278464, "epoch": 2301} {"train_loss": -41.634639739990234, "global_step": 278465, "epoch": 2301} {"train_loss": -41.69940185546875, "global_step": 278466, "epoch": 2301} {"train_loss": -41.94476318359375, "global_step": 278467, "epoch": 2301} {"train_loss": -42.61880111694336, "global_step": 278468, "epoch": 2301} {"train_loss": -41.671382904052734, "global_step": 278469, "epoch": 2301} {"train_loss": -41.732078552246094, "global_step": 278470, "epoch": 2301} {"train_loss": -39.47757339477539, "global_step": 278471, "epoch": 2301} {"train_loss": -41.92129135131836, "global_step": 278472, "epoch": 2301} {"train_loss": -41.023311614990234, "global_step": 278473, "epoch": 2301} {"train_loss": -41.11674118041992, "global_step": 278474, "epoch": 2301} {"train_loss": -41.32365036010742, "global_step": 278475, "epoch": 2301} {"train_loss": -38.90193557739258, "global_step": 278476, "epoch": 2301} {"train_loss": -41.32486343383789, "global_step": 278477, "epoch": 2301} {"train_loss": -42.269161224365234, "global_step": 278478, "epoch": 2301} {"train_loss": -42.179656982421875, "global_step": 278479, "epoch": 2301} {"train_loss": -42.220367431640625, "global_step": 278480, "epoch": 2301} {"train_loss": -42.39179611206055, "global_step": 278481, "epoch": 2301} {"train_loss": -39.593502044677734, "global_step": 278482, "epoch": 2301} {"train_loss": -39.666255950927734, "global_step": 278483, "epoch": 2301} {"train_loss": -41.07763671875, "global_step": 278484, "epoch": 2301} {"train_loss": -42.4686164855957, "global_step": 278485, "epoch": 2301} {"train_loss": -41.95134353637695, "global_step": 278486, "epoch": 2301} {"train_loss": -40.594566345214844, "global_step": 278487, "epoch": 2301} {"train_loss": -41.502017974853516, "global_step": 278488, "epoch": 2301} {"train_loss": -42.04607009887695, "global_step": 278489, "epoch": 2301} {"train_loss": -42.55038070678711, "global_step": 278490, "epoch": 2301} {"train_loss": -40.720394134521484, "global_step": 278491, "epoch": 2301} {"train_loss": -42.0807991027832, "global_step": 278492, "epoch": 2301} {"train_loss": -40.611778259277344, "global_step": 278493, "epoch": 2301} {"train_loss": -41.96926498413086, "global_step": 278494, "epoch": 2301} {"train_loss": -40.51841354370117, "global_step": 278495, "epoch": 2301} {"train_loss": -42.589866638183594, "global_step": 278496, "epoch": 2301} {"train_loss": -40.01979446411133, "global_step": 278497, "epoch": 2301} {"train_loss": -41.28582763671875, "global_step": 278498, "epoch": 2301} {"train_loss": -41.48446273803711, "global_step": 278499, "epoch": 2301} {"train_loss": -41.72269821166992, "global_step": 278500, "epoch": 2301} {"train_loss": -42.474945068359375, "global_step": 278501, "epoch": 2301} {"train_loss": -41.78506088256836, "global_step": 278502, "epoch": 2301} {"train_loss": -42.46204376220703, "global_step": 278503, "epoch": 2301} {"train_loss": -42.615386962890625, "global_step": 278504, "epoch": 2301} {"train_loss": -42.548255920410156, "global_step": 278505, "epoch": 2301} {"train_loss": -42.340091705322266, "global_step": 278506, "epoch": 2301} {"train_loss": -38.689083099365234, "global_step": 278507, "epoch": 2301} {"train_loss": -42.549983978271484, "global_step": 278508, "epoch": 2301} {"train_loss": -42.68293762207031, "global_step": 278509, "epoch": 2301} {"train_loss": -41.76420211791992, "global_step": 278510, "epoch": 2301} {"train_loss": -40.383419036865234, "global_step": 278511, "epoch": 2301} {"train_loss": -40.120357513427734, "global_step": 278512, "epoch": 2301} {"train_loss": -41.306922912597656, "global_step": 278513, "epoch": 2301} {"train_loss": -42.753700256347656, "global_step": 278514, "epoch": 2301} {"train_loss": -42.2038459777832, "global_step": 278515, "epoch": 2301} {"train_loss": -42.76273727416992, "global_step": 278516, "epoch": 2301} {"train_loss": -42.616207122802734, "global_step": 278517, "epoch": 2301} {"train_loss": -42.11228942871094, "global_step": 278518, "epoch": 2301} {"train_loss": -40.69426345825195, "global_step": 278519, "epoch": 2301} {"train_loss": -39.91415023803711, "global_step": 278520, "epoch": 2301} {"train_loss": -41.876705169677734, "global_step": 278521, "epoch": 2301} {"train_loss": -40.49834060668945, "global_step": 278522, "epoch": 2301} {"train_loss": -42.432621002197266, "global_step": 278523, "epoch": 2301} {"train_loss": -41.626380920410156, "global_step": 278524, "epoch": 2301} {"train_loss": -42.63908767700195, "global_step": 278525, "epoch": 2301} {"train_loss": -41.65855026245117, "global_step": 278526, "epoch": 2301} {"train_loss": -42.75057601928711, "global_step": 278527, "epoch": 2301} {"train_loss": -42.863685607910156, "global_step": 278528, "epoch": 2301} {"train_loss": -41.66401672363281, "global_step": 278529, "epoch": 2301} {"train_loss": -42.79167556762695, "global_step": 278530, "epoch": 2301} {"train_loss": -41.96452713012695, "global_step": 278531, "epoch": 2301} {"train_loss": -43.070472717285156, "global_step": 278532, "epoch": 2301} {"train_loss": -41.8909912109375, "global_step": 278533, "epoch": 2301} {"train_loss": -42.96864700317383, "global_step": 278534, "epoch": 2301} {"train_loss": -42.544795989990234, "global_step": 278535, "epoch": 2301} {"train_loss": -42.8223991394043, "global_step": 278536, "epoch": 2301} {"train_loss": -43.11796188354492, "global_step": 278537, "epoch": 2301} {"train_loss": -42.41536331176758, "global_step": 278538, "epoch": 2301} {"train_loss": -41.875057220458984, "global_step": 278539, "epoch": 2301} {"train_loss": -43.273746490478516, "global_step": 278540, "epoch": 2301} {"train_loss": -41.243690900566165, "global_step": 278541, "epoch": 2301, "val_loss": 2606044.75} {"train_loss": -42.23432540893555, "global_step": 278542, "epoch": 2302} {"train_loss": -43.21148681640625, "global_step": 278543, "epoch": 2302} {"train_loss": -42.88322830200195, "global_step": 278544, "epoch": 2302} {"train_loss": -43.164955139160156, "global_step": 278545, "epoch": 2302} {"train_loss": -42.617305755615234, "global_step": 278546, "epoch": 2302} {"train_loss": -42.85969924926758, "global_step": 278547, "epoch": 2302} {"train_loss": -42.4155387878418, "global_step": 278548, "epoch": 2302} {"train_loss": -42.68603515625, "global_step": 278549, "epoch": 2302} {"train_loss": -43.72064971923828, "global_step": 278550, "epoch": 2302} {"train_loss": -42.6021614074707, "global_step": 278551, "epoch": 2302} {"train_loss": -43.33433532714844, "global_step": 278552, "epoch": 2302} {"train_loss": -42.77976608276367, "global_step": 278553, "epoch": 2302} {"train_loss": -42.38204574584961, "global_step": 278554, "epoch": 2302} {"train_loss": -42.64561080932617, "global_step": 278555, "epoch": 2302} {"train_loss": -42.350399017333984, "global_step": 278556, "epoch": 2302} {"train_loss": -42.35036849975586, "global_step": 278557, "epoch": 2302} {"train_loss": -42.34021759033203, "global_step": 278558, "epoch": 2302} {"train_loss": -43.17582321166992, "global_step": 278559, "epoch": 2302} {"train_loss": -42.56364059448242, "global_step": 278560, "epoch": 2302} {"train_loss": -42.4047966003418, "global_step": 278561, "epoch": 2302} {"train_loss": -42.37075424194336, "global_step": 278562, "epoch": 2302} {"train_loss": -42.19879913330078, "global_step": 278563, "epoch": 2302} {"train_loss": -42.135414123535156, "global_step": 278564, "epoch": 2302} {"train_loss": -41.62765121459961, "global_step": 278565, "epoch": 2302} {"train_loss": -41.83037185668945, "global_step": 278566, "epoch": 2302} {"train_loss": -42.556697845458984, "global_step": 278567, "epoch": 2302} {"train_loss": -41.99287033081055, "global_step": 278568, "epoch": 2302} {"train_loss": -43.55662155151367, "global_step": 278569, "epoch": 2302} {"train_loss": -43.10295486450195, "global_step": 278570, "epoch": 2302} {"train_loss": -42.73999786376953, "global_step": 278571, "epoch": 2302} {"train_loss": -43.20097732543945, "global_step": 278572, "epoch": 2302} {"train_loss": -42.80593490600586, "global_step": 278573, "epoch": 2302} {"train_loss": -41.99472427368164, "global_step": 278574, "epoch": 2302} {"train_loss": -42.9130973815918, "global_step": 278575, "epoch": 2302} {"train_loss": -42.37592315673828, "global_step": 278576, "epoch": 2302} {"train_loss": -40.88339614868164, "global_step": 278577, "epoch": 2302} {"train_loss": -41.759822845458984, "global_step": 278578, "epoch": 2302} {"train_loss": -41.99726486206055, "global_step": 278579, "epoch": 2302} {"train_loss": -42.34804153442383, "global_step": 278580, "epoch": 2302} {"train_loss": -42.152931213378906, "global_step": 278581, "epoch": 2302} {"train_loss": -42.049720764160156, "global_step": 278582, "epoch": 2302} {"train_loss": -42.50725173950195, "global_step": 278583, "epoch": 2302} {"train_loss": -42.696983337402344, "global_step": 278584, "epoch": 2302} {"train_loss": -43.452388763427734, "global_step": 278585, "epoch": 2302} {"train_loss": -41.4417839050293, "global_step": 278586, "epoch": 2302} {"train_loss": -42.74518585205078, "global_step": 278587, "epoch": 2302} {"train_loss": -43.252803802490234, "global_step": 278588, "epoch": 2302} {"train_loss": -42.119319915771484, "global_step": 278589, "epoch": 2302} {"train_loss": -42.463592529296875, "global_step": 278590, "epoch": 2302} {"train_loss": -41.57218933105469, "global_step": 278591, "epoch": 2302} {"train_loss": -41.541751861572266, "global_step": 278592, "epoch": 2302} {"train_loss": -42.00864791870117, "global_step": 278593, "epoch": 2302} {"train_loss": -41.57825469970703, "global_step": 278594, "epoch": 2302} {"train_loss": -41.99882507324219, "global_step": 278595, "epoch": 2302} {"train_loss": -40.003414154052734, "global_step": 278596, "epoch": 2302} {"train_loss": -35.71049118041992, "global_step": 278597, "epoch": 2302} {"train_loss": -27.361066818237305, "global_step": 278598, "epoch": 2302} {"train_loss": -26.40986442565918, "global_step": 278599, "epoch": 2302} {"train_loss": -37.12127685546875, "global_step": 278600, "epoch": 2302} {"train_loss": -38.53151321411133, "global_step": 278601, "epoch": 2302} {"train_loss": -35.742530822753906, "global_step": 278602, "epoch": 2302} {"train_loss": -39.36347579956055, "global_step": 278603, "epoch": 2302} {"train_loss": -36.4979362487793, "global_step": 278604, "epoch": 2302} {"train_loss": -27.634382247924805, "global_step": 278605, "epoch": 2302} {"train_loss": -35.22364044189453, "global_step": 278606, "epoch": 2302} {"train_loss": -26.505746841430664, "global_step": 278607, "epoch": 2302} {"train_loss": -35.26385498046875, "global_step": 278608, "epoch": 2302} {"train_loss": -36.24261474609375, "global_step": 278609, "epoch": 2302} {"train_loss": -32.21267318725586, "global_step": 278610, "epoch": 2302} {"train_loss": -39.1312370300293, "global_step": 278611, "epoch": 2302} {"train_loss": -32.890045166015625, "global_step": 278612, "epoch": 2302} {"train_loss": -38.86626052856445, "global_step": 278613, "epoch": 2302} {"train_loss": -36.799312591552734, "global_step": 278614, "epoch": 2302} {"train_loss": -38.22410583496094, "global_step": 278615, "epoch": 2302} {"train_loss": -32.8399658203125, "global_step": 278616, "epoch": 2302} {"train_loss": -39.6032600402832, "global_step": 278617, "epoch": 2302} {"train_loss": -37.58955764770508, "global_step": 278618, "epoch": 2302} {"train_loss": -36.92445373535156, "global_step": 278619, "epoch": 2302} {"train_loss": -39.823177337646484, "global_step": 278620, "epoch": 2302} {"train_loss": -39.752071380615234, "global_step": 278621, "epoch": 2302} {"train_loss": -38.99549102783203, "global_step": 278622, "epoch": 2302} {"train_loss": -38.56112289428711, "global_step": 278623, "epoch": 2302} {"train_loss": -39.64289855957031, "global_step": 278624, "epoch": 2302} {"train_loss": -40.77215576171875, "global_step": 278625, "epoch": 2302} {"train_loss": -40.71815872192383, "global_step": 278626, "epoch": 2302} {"train_loss": -39.894744873046875, "global_step": 278627, "epoch": 2302} {"train_loss": -39.67253494262695, "global_step": 278628, "epoch": 2302} {"train_loss": -40.81893539428711, "global_step": 278629, "epoch": 2302} {"train_loss": -40.97397994995117, "global_step": 278630, "epoch": 2302} {"train_loss": -40.666168212890625, "global_step": 278631, "epoch": 2302} {"train_loss": -41.044532775878906, "global_step": 278632, "epoch": 2302} {"train_loss": -40.57851791381836, "global_step": 278633, "epoch": 2302} {"train_loss": -41.36797332763672, "global_step": 278634, "epoch": 2302} {"train_loss": -41.07415771484375, "global_step": 278635, "epoch": 2302} {"train_loss": -41.08922576904297, "global_step": 278636, "epoch": 2302} {"train_loss": -41.1751594543457, "global_step": 278637, "epoch": 2302} {"train_loss": -41.694210052490234, "global_step": 278638, "epoch": 2302} {"train_loss": -41.65956497192383, "global_step": 278639, "epoch": 2302} {"train_loss": -41.381591796875, "global_step": 278640, "epoch": 2302} {"train_loss": -41.70409393310547, "global_step": 278641, "epoch": 2302} {"train_loss": -41.5676383972168, "global_step": 278642, "epoch": 2302} {"train_loss": -42.025672912597656, "global_step": 278643, "epoch": 2302} {"train_loss": -42.18699264526367, "global_step": 278644, "epoch": 2302} {"train_loss": -41.64299011230469, "global_step": 278645, "epoch": 2302} {"train_loss": -41.88535690307617, "global_step": 278646, "epoch": 2302} {"train_loss": -42.30399703979492, "global_step": 278647, "epoch": 2302} {"train_loss": -40.57133865356445, "global_step": 278648, "epoch": 2302} {"train_loss": -41.846038818359375, "global_step": 278649, "epoch": 2302} {"train_loss": -41.97519302368164, "global_step": 278650, "epoch": 2302} {"train_loss": -42.034847259521484, "global_step": 278651, "epoch": 2302} {"train_loss": -42.26939010620117, "global_step": 278652, "epoch": 2302} {"train_loss": -42.40481185913086, "global_step": 278653, "epoch": 2302} {"train_loss": -42.33884048461914, "global_step": 278654, "epoch": 2302} {"train_loss": -42.15629577636719, "global_step": 278655, "epoch": 2302} {"train_loss": -42.29462814331055, "global_step": 278656, "epoch": 2302} {"train_loss": -42.02707290649414, "global_step": 278657, "epoch": 2302} {"train_loss": -42.433963775634766, "global_step": 278658, "epoch": 2302} {"train_loss": -42.16111373901367, "global_step": 278659, "epoch": 2302} {"train_loss": -42.432395935058594, "global_step": 278660, "epoch": 2302} {"train_loss": -42.174224853515625, "global_step": 278661, "epoch": 2302} {"train_loss": -40.591412567895304, "global_step": 278662, "epoch": 2302, "val_loss": 2445341.0} {"train_loss": -42.551692962646484, "global_step": 278663, "epoch": 2303} {"train_loss": -42.423011779785156, "global_step": 278664, "epoch": 2303} {"train_loss": -42.76521682739258, "global_step": 278665, "epoch": 2303} {"train_loss": -42.42136764526367, "global_step": 278666, "epoch": 2303} {"train_loss": -42.6992073059082, "global_step": 278667, "epoch": 2303} {"train_loss": -42.49166488647461, "global_step": 278668, "epoch": 2303} {"train_loss": -42.66396713256836, "global_step": 278669, "epoch": 2303} {"train_loss": -42.85218048095703, "global_step": 278670, "epoch": 2303} {"train_loss": -42.7578125, "global_step": 278671, "epoch": 2303} {"train_loss": -43.150447845458984, "global_step": 278672, "epoch": 2303} {"train_loss": -43.002479553222656, "global_step": 278673, "epoch": 2303} {"train_loss": -42.99406051635742, "global_step": 278674, "epoch": 2303} {"train_loss": -42.965614318847656, "global_step": 278675, "epoch": 2303} {"train_loss": -43.12143325805664, "global_step": 278676, "epoch": 2303} {"train_loss": -42.97288513183594, "global_step": 278677, "epoch": 2303} {"train_loss": -43.15930938720703, "global_step": 278678, "epoch": 2303} {"train_loss": -42.81417465209961, "global_step": 278679, "epoch": 2303} {"train_loss": -42.95840072631836, "global_step": 278680, "epoch": 2303} {"train_loss": -43.62005615234375, "global_step": 278681, "epoch": 2303} {"train_loss": -42.66999816894531, "global_step": 278682, "epoch": 2303} {"train_loss": -43.446197509765625, "global_step": 278683, "epoch": 2303} {"train_loss": -43.60279083251953, "global_step": 278684, "epoch": 2303} {"train_loss": -43.44789505004883, "global_step": 278685, "epoch": 2303} {"train_loss": -43.035911560058594, "global_step": 278686, "epoch": 2303} {"train_loss": -43.41581344604492, "global_step": 278687, "epoch": 2303} {"train_loss": -43.1190071105957, "global_step": 278688, "epoch": 2303} {"train_loss": -43.57920837402344, "global_step": 278689, "epoch": 2303} {"train_loss": -43.135372161865234, "global_step": 278690, "epoch": 2303} {"train_loss": -43.63569641113281, "global_step": 278691, "epoch": 2303} {"train_loss": -42.14759826660156, "global_step": 278692, "epoch": 2303} {"train_loss": -43.56721115112305, "global_step": 278693, "epoch": 2303} {"train_loss": -43.5844612121582, "global_step": 278694, "epoch": 2303} {"train_loss": -43.36115646362305, "global_step": 278695, "epoch": 2303} {"train_loss": -43.356536865234375, "global_step": 278696, "epoch": 2303} {"train_loss": -43.52058029174805, "global_step": 278697, "epoch": 2303} {"train_loss": -43.826942443847656, "global_step": 278698, "epoch": 2303} {"train_loss": -43.27165603637695, "global_step": 278699, "epoch": 2303} {"train_loss": -43.65812683105469, "global_step": 278700, "epoch": 2303} {"train_loss": -42.75727462768555, "global_step": 278701, "epoch": 2303} {"train_loss": -43.650001525878906, "global_step": 278702, "epoch": 2303} {"train_loss": -43.984230041503906, "global_step": 278703, "epoch": 2303} {"train_loss": -43.766761779785156, "global_step": 278704, "epoch": 2303} {"train_loss": -43.834651947021484, "global_step": 278705, "epoch": 2303} {"train_loss": -43.803977966308594, "global_step": 278706, "epoch": 2303} {"train_loss": -43.78436279296875, "global_step": 278707, "epoch": 2303} {"train_loss": -42.81258010864258, "global_step": 278708, "epoch": 2303} {"train_loss": -43.709320068359375, "global_step": 278709, "epoch": 2303} {"train_loss": -43.72046661376953, "global_step": 278710, "epoch": 2303} {"train_loss": -43.69550323486328, "global_step": 278711, "epoch": 2303} {"train_loss": -43.72314453125, "global_step": 278712, "epoch": 2303} {"train_loss": -43.78118133544922, "global_step": 278713, "epoch": 2303} {"train_loss": -43.64973068237305, "global_step": 278714, "epoch": 2303} {"train_loss": -43.79084014892578, "global_step": 278715, "epoch": 2303} {"train_loss": -43.95662307739258, "global_step": 278716, "epoch": 2303} {"train_loss": -42.71515655517578, "global_step": 278717, "epoch": 2303} {"train_loss": -43.787391662597656, "global_step": 278718, "epoch": 2303} {"train_loss": -44.03052520751953, "global_step": 278719, "epoch": 2303} {"train_loss": -43.53388214111328, "global_step": 278720, "epoch": 2303} {"train_loss": -43.81037902832031, "global_step": 278721, "epoch": 2303} {"train_loss": -42.934242248535156, "global_step": 278722, "epoch": 2303} {"train_loss": -43.20363998413086, "global_step": 278723, "epoch": 2303} {"train_loss": -43.859619140625, "global_step": 278724, "epoch": 2303} {"train_loss": -43.9122200012207, "global_step": 278725, "epoch": 2303} {"train_loss": -43.844791412353516, "global_step": 278726, "epoch": 2303} {"train_loss": -43.617855072021484, "global_step": 278727, "epoch": 2303} {"train_loss": -43.928802490234375, "global_step": 278728, "epoch": 2303} {"train_loss": -44.0692253112793, "global_step": 278729, "epoch": 2303} {"train_loss": -43.54802703857422, "global_step": 278730, "epoch": 2303} {"train_loss": -43.699825286865234, "global_step": 278731, "epoch": 2303} {"train_loss": -40.807708740234375, "global_step": 278732, "epoch": 2303} {"train_loss": -44.10771179199219, "global_step": 278733, "epoch": 2303} {"train_loss": -42.74654769897461, "global_step": 278734, "epoch": 2303} {"train_loss": -43.53668212890625, "global_step": 278735, "epoch": 2303} {"train_loss": -43.574317932128906, "global_step": 278736, "epoch": 2303} {"train_loss": -41.45893859863281, "global_step": 278737, "epoch": 2303} {"train_loss": -40.4167594909668, "global_step": 278738, "epoch": 2303} {"train_loss": -38.51728057861328, "global_step": 278739, "epoch": 2303} {"train_loss": -36.9314079284668, "global_step": 278740, "epoch": 2303} {"train_loss": -32.80537796020508, "global_step": 278741, "epoch": 2303} {"train_loss": -27.974267959594727, "global_step": 278742, "epoch": 2303} {"train_loss": -30.076169967651367, "global_step": 278743, "epoch": 2303} {"train_loss": -42.173458099365234, "global_step": 278744, "epoch": 2303} {"train_loss": -37.05061721801758, "global_step": 278745, "epoch": 2303} {"train_loss": -36.893306732177734, "global_step": 278746, "epoch": 2303} {"train_loss": -41.3038330078125, "global_step": 278747, "epoch": 2303} {"train_loss": -39.5621452331543, "global_step": 278748, "epoch": 2303} {"train_loss": -41.005775451660156, "global_step": 278749, "epoch": 2303} {"train_loss": -42.012725830078125, "global_step": 278750, "epoch": 2303} {"train_loss": -40.851558685302734, "global_step": 278751, "epoch": 2303} {"train_loss": -41.98385238647461, "global_step": 278752, "epoch": 2303} {"train_loss": -41.36861038208008, "global_step": 278753, "epoch": 2303} {"train_loss": -42.00008010864258, "global_step": 278754, "epoch": 2303} {"train_loss": -42.07830810546875, "global_step": 278755, "epoch": 2303} {"train_loss": -41.77317428588867, "global_step": 278756, "epoch": 2303} {"train_loss": -42.06966781616211, "global_step": 278757, "epoch": 2303} {"train_loss": -41.945587158203125, "global_step": 278758, "epoch": 2303} {"train_loss": -42.1022834777832, "global_step": 278759, "epoch": 2303} {"train_loss": -42.23214340209961, "global_step": 278760, "epoch": 2303} {"train_loss": -42.041378021240234, "global_step": 278761, "epoch": 2303} {"train_loss": -41.940162658691406, "global_step": 278762, "epoch": 2303} {"train_loss": -42.223663330078125, "global_step": 278763, "epoch": 2303} {"train_loss": -39.578121185302734, "global_step": 278764, "epoch": 2303} {"train_loss": -43.04015350341797, "global_step": 278765, "epoch": 2303} {"train_loss": -41.6210823059082, "global_step": 278766, "epoch": 2303} {"train_loss": -43.182472229003906, "global_step": 278767, "epoch": 2303} {"train_loss": -42.553707122802734, "global_step": 278768, "epoch": 2303} {"train_loss": -41.572540283203125, "global_step": 278769, "epoch": 2303} {"train_loss": -42.88606262207031, "global_step": 278770, "epoch": 2303} {"train_loss": -42.93818283081055, "global_step": 278771, "epoch": 2303} {"train_loss": -42.25162887573242, "global_step": 278772, "epoch": 2303} {"train_loss": -42.128326416015625, "global_step": 278773, "epoch": 2303} {"train_loss": -42.7990837097168, "global_step": 278774, "epoch": 2303} {"train_loss": -42.96122360229492, "global_step": 278775, "epoch": 2303} {"train_loss": -43.223121643066406, "global_step": 278776, "epoch": 2303} {"train_loss": -42.34181594848633, "global_step": 278777, "epoch": 2303} {"train_loss": -43.2809944152832, "global_step": 278778, "epoch": 2303} {"train_loss": -42.936946868896484, "global_step": 278779, "epoch": 2303} {"train_loss": -42.52510452270508, "global_step": 278780, "epoch": 2303} {"train_loss": -42.7934455871582, "global_step": 278781, "epoch": 2303} {"train_loss": -42.7950439453125, "global_step": 278782, "epoch": 2303} {"train_loss": -42.38728269466684, "global_step": 278783, "epoch": 2303, "val_loss": 2457276.0} {"train_loss": -42.93731689453125, "global_step": 278784, "epoch": 2304} {"train_loss": -42.9680290222168, "global_step": 278785, "epoch": 2304} {"train_loss": -42.57327651977539, "global_step": 278786, "epoch": 2304} {"train_loss": -43.43843460083008, "global_step": 278787, "epoch": 2304} {"train_loss": -43.21294021606445, "global_step": 278788, "epoch": 2304} {"train_loss": -43.40277862548828, "global_step": 278789, "epoch": 2304} {"train_loss": -43.07587432861328, "global_step": 278790, "epoch": 2304} {"train_loss": -42.826026916503906, "global_step": 278791, "epoch": 2304} {"train_loss": -43.3390007019043, "global_step": 278792, "epoch": 2304} {"train_loss": -43.04502487182617, "global_step": 278793, "epoch": 2304} {"train_loss": -43.33237838745117, "global_step": 278794, "epoch": 2304} {"train_loss": -42.5134391784668, "global_step": 278795, "epoch": 2304} {"train_loss": -43.5711555480957, "global_step": 278796, "epoch": 2304} {"train_loss": -43.063209533691406, "global_step": 278797, "epoch": 2304} {"train_loss": -43.434967041015625, "global_step": 278798, "epoch": 2304} {"train_loss": -43.51585006713867, "global_step": 278799, "epoch": 2304} {"train_loss": -43.637176513671875, "global_step": 278800, "epoch": 2304} {"train_loss": -43.04951858520508, "global_step": 278801, "epoch": 2304} {"train_loss": -43.79179000854492, "global_step": 278802, "epoch": 2304} {"train_loss": -43.4278564453125, "global_step": 278803, "epoch": 2304} {"train_loss": -43.649627685546875, "global_step": 278804, "epoch": 2304} {"train_loss": -42.80988311767578, "global_step": 278805, "epoch": 2304} {"train_loss": -43.32411193847656, "global_step": 278806, "epoch": 2304} {"train_loss": -43.79940414428711, "global_step": 278807, "epoch": 2304} {"train_loss": -43.61111068725586, "global_step": 278808, "epoch": 2304} {"train_loss": -43.13259506225586, "global_step": 278809, "epoch": 2304} {"train_loss": -43.199466705322266, "global_step": 278810, "epoch": 2304} {"train_loss": -43.457122802734375, "global_step": 278811, "epoch": 2304} {"train_loss": -43.71030807495117, "global_step": 278812, "epoch": 2304} {"train_loss": -43.65181350708008, "global_step": 278813, "epoch": 2304} {"train_loss": -43.72361373901367, "global_step": 278814, "epoch": 2304} {"train_loss": -43.59479522705078, "global_step": 278815, "epoch": 2304} {"train_loss": -43.890045166015625, "global_step": 278816, "epoch": 2304} {"train_loss": -43.672969818115234, "global_step": 278817, "epoch": 2304} {"train_loss": -42.83401870727539, "global_step": 278818, "epoch": 2304} {"train_loss": -44.2569694519043, "global_step": 278819, "epoch": 2304} {"train_loss": -43.82963562011719, "global_step": 278820, "epoch": 2304} {"train_loss": -43.77088165283203, "global_step": 278821, "epoch": 2304} {"train_loss": -43.2266960144043, "global_step": 278822, "epoch": 2304} {"train_loss": -42.626468658447266, "global_step": 278823, "epoch": 2304} {"train_loss": -41.800689697265625, "global_step": 278824, "epoch": 2304} {"train_loss": -42.12441635131836, "global_step": 278825, "epoch": 2304} {"train_loss": -43.5861701965332, "global_step": 278826, "epoch": 2304} {"train_loss": -44.0427131652832, "global_step": 278827, "epoch": 2304} {"train_loss": -42.27275848388672, "global_step": 278828, "epoch": 2304} {"train_loss": -38.6634407043457, "global_step": 278829, "epoch": 2304} {"train_loss": -25.993078231811523, "global_step": 278830, "epoch": 2304} {"train_loss": -13.265049934387207, "global_step": 278831, "epoch": 2304} {"train_loss": -19.830968856811523, "global_step": 278832, "epoch": 2304} {"train_loss": -40.58976364135742, "global_step": 278833, "epoch": 2304} {"train_loss": -21.913244247436523, "global_step": 278834, "epoch": 2304} {"train_loss": -25.777469635009766, "global_step": 278835, "epoch": 2304} {"train_loss": -35.09859848022461, "global_step": 278836, "epoch": 2304} {"train_loss": -28.072406768798828, "global_step": 278837, "epoch": 2304} {"train_loss": -35.766845703125, "global_step": 278838, "epoch": 2304} {"train_loss": -29.28449058532715, "global_step": 278839, "epoch": 2304} {"train_loss": -35.463558197021484, "global_step": 278840, "epoch": 2304} {"train_loss": -34.365257263183594, "global_step": 278841, "epoch": 2304} {"train_loss": -35.635990142822266, "global_step": 278842, "epoch": 2304} {"train_loss": -33.9163932800293, "global_step": 278843, "epoch": 2304} {"train_loss": -36.70245361328125, "global_step": 278844, "epoch": 2304} {"train_loss": -38.01129913330078, "global_step": 278845, "epoch": 2304} {"train_loss": -37.19148635864258, "global_step": 278846, "epoch": 2304} {"train_loss": -38.246917724609375, "global_step": 278847, "epoch": 2304} {"train_loss": -38.689796447753906, "global_step": 278848, "epoch": 2304} {"train_loss": -37.304080963134766, "global_step": 278849, "epoch": 2304} {"train_loss": -40.0601921081543, "global_step": 278850, "epoch": 2304} {"train_loss": -39.51509475708008, "global_step": 278851, "epoch": 2304} {"train_loss": -38.15403366088867, "global_step": 278852, "epoch": 2304} {"train_loss": -41.348140716552734, "global_step": 278853, "epoch": 2304} {"train_loss": -38.718746185302734, "global_step": 278854, "epoch": 2304} {"train_loss": -40.09257125854492, "global_step": 278855, "epoch": 2304} {"train_loss": -40.43137741088867, "global_step": 278856, "epoch": 2304} {"train_loss": -39.41127395629883, "global_step": 278857, "epoch": 2304} {"train_loss": -40.03561019897461, "global_step": 278858, "epoch": 2304} {"train_loss": -40.8489875793457, "global_step": 278859, "epoch": 2304} {"train_loss": -40.4940299987793, "global_step": 278860, "epoch": 2304} {"train_loss": -40.171119689941406, "global_step": 278861, "epoch": 2304} {"train_loss": -40.99907302856445, "global_step": 278862, "epoch": 2304} {"train_loss": -40.61811065673828, "global_step": 278863, "epoch": 2304} {"train_loss": -40.901817321777344, "global_step": 278864, "epoch": 2304} {"train_loss": -40.70244216918945, "global_step": 278865, "epoch": 2304} {"train_loss": -41.2960090637207, "global_step": 278866, "epoch": 2304} {"train_loss": -40.58415222167969, "global_step": 278867, "epoch": 2304} {"train_loss": -40.628963470458984, "global_step": 278868, "epoch": 2304} {"train_loss": -41.66766357421875, "global_step": 278869, "epoch": 2304} {"train_loss": -40.758358001708984, "global_step": 278870, "epoch": 2304} {"train_loss": -40.983917236328125, "global_step": 278871, "epoch": 2304} {"train_loss": -41.8685417175293, "global_step": 278872, "epoch": 2304} {"train_loss": -41.21118927001953, "global_step": 278873, "epoch": 2304} {"train_loss": -41.48406982421875, "global_step": 278874, "epoch": 2304} {"train_loss": -41.77238845825195, "global_step": 278875, "epoch": 2304} {"train_loss": -41.551597595214844, "global_step": 278876, "epoch": 2304} {"train_loss": -41.9058837890625, "global_step": 278877, "epoch": 2304} {"train_loss": -41.9405403137207, "global_step": 278878, "epoch": 2304} {"train_loss": -41.83463668823242, "global_step": 278879, "epoch": 2304} {"train_loss": -41.583251953125, "global_step": 278880, "epoch": 2304} {"train_loss": -42.26972198486328, "global_step": 278881, "epoch": 2304} {"train_loss": -42.000667572021484, "global_step": 278882, "epoch": 2304} {"train_loss": -42.128135681152344, "global_step": 278883, "epoch": 2304} {"train_loss": -42.08637237548828, "global_step": 278884, "epoch": 2304} {"train_loss": -42.0648307800293, "global_step": 278885, "epoch": 2304} {"train_loss": -42.05324172973633, "global_step": 278886, "epoch": 2304} {"train_loss": -42.25307846069336, "global_step": 278887, "epoch": 2304} {"train_loss": -42.26064682006836, "global_step": 278888, "epoch": 2304} {"train_loss": -42.674285888671875, "global_step": 278889, "epoch": 2304} {"train_loss": -42.6735725402832, "global_step": 278890, "epoch": 2304} {"train_loss": -42.578548431396484, "global_step": 278891, "epoch": 2304} {"train_loss": -42.55316925048828, "global_step": 278892, "epoch": 2304} {"train_loss": -42.53312301635742, "global_step": 278893, "epoch": 2304} {"train_loss": -42.968505859375, "global_step": 278894, "epoch": 2304} {"train_loss": -42.87971496582031, "global_step": 278895, "epoch": 2304} {"train_loss": -42.31000900268555, "global_step": 278896, "epoch": 2304} {"train_loss": -42.42770767211914, "global_step": 278897, "epoch": 2304} {"train_loss": -42.887939453125, "global_step": 278898, "epoch": 2304} {"train_loss": -42.7619743347168, "global_step": 278899, "epoch": 2304} {"train_loss": -43.204559326171875, "global_step": 278900, "epoch": 2304} {"train_loss": -42.9931640625, "global_step": 278901, "epoch": 2304} {"train_loss": -43.18925094604492, "global_step": 278902, "epoch": 2304} {"train_loss": -42.956573486328125, "global_step": 278903, "epoch": 2304} {"train_loss": -40.603642085367, "global_step": 278904, "epoch": 2304, "val_loss": 2451164.75} {"train_loss": -43.16936111450195, "global_step": 278905, "epoch": 2305} {"train_loss": -43.17837142944336, "global_step": 278906, "epoch": 2305} {"train_loss": -43.19784164428711, "global_step": 278907, "epoch": 2305} {"train_loss": -43.43788528442383, "global_step": 278908, "epoch": 2305} {"train_loss": -42.995452880859375, "global_step": 278909, "epoch": 2305} {"train_loss": -43.36042022705078, "global_step": 278910, "epoch": 2305} {"train_loss": -43.43021774291992, "global_step": 278911, "epoch": 2305} {"train_loss": -43.280548095703125, "global_step": 278912, "epoch": 2305} {"train_loss": -43.426963806152344, "global_step": 278913, "epoch": 2305} {"train_loss": -43.698787689208984, "global_step": 278914, "epoch": 2305} {"train_loss": -43.30015563964844, "global_step": 278915, "epoch": 2305} {"train_loss": -43.70695495605469, "global_step": 278916, "epoch": 2305} {"train_loss": -43.05277633666992, "global_step": 278917, "epoch": 2305} {"train_loss": -43.38776397705078, "global_step": 278918, "epoch": 2305} {"train_loss": -44.0342903137207, "global_step": 278919, "epoch": 2305} {"train_loss": -43.77173614501953, "global_step": 278920, "epoch": 2305} {"train_loss": -43.83728790283203, "global_step": 278921, "epoch": 2305} {"train_loss": -43.489593505859375, "global_step": 278922, "epoch": 2305} {"train_loss": -43.536861419677734, "global_step": 278923, "epoch": 2305} {"train_loss": -43.9613037109375, "global_step": 278924, "epoch": 2305} {"train_loss": -43.51691818237305, "global_step": 278925, "epoch": 2305} {"train_loss": -43.599666595458984, "global_step": 278926, "epoch": 2305} {"train_loss": -43.71894073486328, "global_step": 278927, "epoch": 2305} {"train_loss": -43.71034622192383, "global_step": 278928, "epoch": 2305} {"train_loss": -43.260231018066406, "global_step": 278929, "epoch": 2305} {"train_loss": -44.01199722290039, "global_step": 278930, "epoch": 2305} {"train_loss": -43.49300003051758, "global_step": 278931, "epoch": 2305} {"train_loss": -43.58795166015625, "global_step": 278932, "epoch": 2305} {"train_loss": -44.114437103271484, "global_step": 278933, "epoch": 2305} {"train_loss": -43.52554702758789, "global_step": 278934, "epoch": 2305} {"train_loss": -44.18391799926758, "global_step": 278935, "epoch": 2305} {"train_loss": -44.075843811035156, "global_step": 278936, "epoch": 2305} {"train_loss": -43.944610595703125, "global_step": 278937, "epoch": 2305} {"train_loss": -43.54057693481445, "global_step": 278938, "epoch": 2305} {"train_loss": -43.62653732299805, "global_step": 278939, "epoch": 2305} {"train_loss": -43.91475296020508, "global_step": 278940, "epoch": 2305} {"train_loss": -44.02100372314453, "global_step": 278941, "epoch": 2305} {"train_loss": -43.487972259521484, "global_step": 278942, "epoch": 2305} {"train_loss": -44.16802215576172, "global_step": 278943, "epoch": 2305} {"train_loss": -44.054290771484375, "global_step": 278944, "epoch": 2305} {"train_loss": -43.450260162353516, "global_step": 278945, "epoch": 2305} {"train_loss": -43.850929260253906, "global_step": 278946, "epoch": 2305} {"train_loss": -43.2337760925293, "global_step": 278947, "epoch": 2305} {"train_loss": -43.80113220214844, "global_step": 278948, "epoch": 2305} {"train_loss": -43.913909912109375, "global_step": 278949, "epoch": 2305} {"train_loss": -43.84934616088867, "global_step": 278950, "epoch": 2305} {"train_loss": -43.897621154785156, "global_step": 278951, "epoch": 2305} {"train_loss": -43.47434616088867, "global_step": 278952, "epoch": 2305} {"train_loss": -43.30337142944336, "global_step": 278953, "epoch": 2305} {"train_loss": -43.583431243896484, "global_step": 278954, "epoch": 2305} {"train_loss": -43.6039924621582, "global_step": 278955, "epoch": 2305} {"train_loss": -44.036258697509766, "global_step": 278956, "epoch": 2305} {"train_loss": -42.90979766845703, "global_step": 278957, "epoch": 2305} {"train_loss": -43.83274459838867, "global_step": 278958, "epoch": 2305} {"train_loss": -43.619136810302734, "global_step": 278959, "epoch": 2305} {"train_loss": -43.68491744995117, "global_step": 278960, "epoch": 2305} {"train_loss": -43.97071075439453, "global_step": 278961, "epoch": 2305} {"train_loss": -42.56031036376953, "global_step": 278962, "epoch": 2305} {"train_loss": -42.580322265625, "global_step": 278963, "epoch": 2305} {"train_loss": -41.01207733154297, "global_step": 278964, "epoch": 2305} {"train_loss": -40.35730743408203, "global_step": 278965, "epoch": 2305} {"train_loss": -42.43165969848633, "global_step": 278966, "epoch": 2305} {"train_loss": -43.20705795288086, "global_step": 278967, "epoch": 2305} {"train_loss": -43.47774887084961, "global_step": 278968, "epoch": 2305} {"train_loss": -43.06836700439453, "global_step": 278969, "epoch": 2305} {"train_loss": -41.54084396362305, "global_step": 278970, "epoch": 2305} {"train_loss": -42.354366302490234, "global_step": 278971, "epoch": 2305} {"train_loss": -42.276954650878906, "global_step": 278972, "epoch": 2305} {"train_loss": -43.015193939208984, "global_step": 278973, "epoch": 2305} {"train_loss": -42.18214797973633, "global_step": 278974, "epoch": 2305} {"train_loss": -41.68745422363281, "global_step": 278975, "epoch": 2305} {"train_loss": -41.902130126953125, "global_step": 278976, "epoch": 2305} {"train_loss": -41.78034591674805, "global_step": 278977, "epoch": 2305} {"train_loss": -40.756446838378906, "global_step": 278978, "epoch": 2305} {"train_loss": -40.433650970458984, "global_step": 278979, "epoch": 2305} {"train_loss": -41.20517349243164, "global_step": 278980, "epoch": 2305} {"train_loss": -41.7630729675293, "global_step": 278981, "epoch": 2305} {"train_loss": -40.78740310668945, "global_step": 278982, "epoch": 2305} {"train_loss": -42.18684768676758, "global_step": 278983, "epoch": 2305} {"train_loss": -41.6515998840332, "global_step": 278984, "epoch": 2305} {"train_loss": -40.85437774658203, "global_step": 278985, "epoch": 2305} {"train_loss": -43.046669006347656, "global_step": 278986, "epoch": 2305} {"train_loss": -40.542999267578125, "global_step": 278987, "epoch": 2305} {"train_loss": -41.8926887512207, "global_step": 278988, "epoch": 2305} {"train_loss": -42.26997756958008, "global_step": 278989, "epoch": 2305} {"train_loss": -41.65571212768555, "global_step": 278990, "epoch": 2305} {"train_loss": -43.272090911865234, "global_step": 278991, "epoch": 2305} {"train_loss": -40.1163215637207, "global_step": 278992, "epoch": 2305} {"train_loss": -40.79975509643555, "global_step": 278993, "epoch": 2305} {"train_loss": -42.373870849609375, "global_step": 278994, "epoch": 2305} {"train_loss": -40.15630340576172, "global_step": 278995, "epoch": 2305} {"train_loss": -41.79183578491211, "global_step": 278996, "epoch": 2305} {"train_loss": -41.60920333862305, "global_step": 278997, "epoch": 2305} {"train_loss": -41.06535339355469, "global_step": 278998, "epoch": 2305} {"train_loss": -42.38197326660156, "global_step": 278999, "epoch": 2305} {"train_loss": -41.9956169128418, "global_step": 279000, "epoch": 2305} {"train_loss": -41.78006362915039, "global_step": 279001, "epoch": 2305} {"train_loss": -41.489803314208984, "global_step": 279002, "epoch": 2305} {"train_loss": -42.2568244934082, "global_step": 279003, "epoch": 2305} {"train_loss": -41.6787223815918, "global_step": 279004, "epoch": 2305} {"train_loss": -42.059059143066406, "global_step": 279005, "epoch": 2305} {"train_loss": -41.89813995361328, "global_step": 279006, "epoch": 2305} {"train_loss": -42.23264694213867, "global_step": 279007, "epoch": 2305} {"train_loss": -41.83757400512695, "global_step": 279008, "epoch": 2305} {"train_loss": -43.14617156982422, "global_step": 279009, "epoch": 2305} {"train_loss": -41.63982009887695, "global_step": 279010, "epoch": 2305} {"train_loss": -43.164737701416016, "global_step": 279011, "epoch": 2305} {"train_loss": -42.417293548583984, "global_step": 279012, "epoch": 2305} {"train_loss": -43.423702239990234, "global_step": 279013, "epoch": 2305} {"train_loss": -42.889198303222656, "global_step": 279014, "epoch": 2305} {"train_loss": -42.97506332397461, "global_step": 279015, "epoch": 2305} {"train_loss": -43.049835205078125, "global_step": 279016, "epoch": 2305} {"train_loss": -43.09455108642578, "global_step": 279017, "epoch": 2305} {"train_loss": -43.05788803100586, "global_step": 279018, "epoch": 2305} {"train_loss": -42.99750900268555, "global_step": 279019, "epoch": 2305} {"train_loss": -43.59288024902344, "global_step": 279020, "epoch": 2305} {"train_loss": -43.06561279296875, "global_step": 279021, "epoch": 2305} {"train_loss": -43.44962692260742, "global_step": 279022, "epoch": 2305} {"train_loss": -43.140621185302734, "global_step": 279023, "epoch": 2305} {"train_loss": -43.79281234741211, "global_step": 279024, "epoch": 2305} {"train_loss": -42.84625887279668, "global_step": 279025, "epoch": 2305, "val_loss": 2468305.75} {"train_loss": -43.13315963745117, "global_step": 279026, "epoch": 2306} {"train_loss": -43.209251403808594, "global_step": 279027, "epoch": 2306} {"train_loss": -43.63348388671875, "global_step": 279028, "epoch": 2306} {"train_loss": -43.0771598815918, "global_step": 279029, "epoch": 2306} {"train_loss": -43.59571075439453, "global_step": 279030, "epoch": 2306} {"train_loss": -43.08152389526367, "global_step": 279031, "epoch": 2306} {"train_loss": -43.49856185913086, "global_step": 279032, "epoch": 2306} {"train_loss": -42.254676818847656, "global_step": 279033, "epoch": 2306} {"train_loss": -43.030147552490234, "global_step": 279034, "epoch": 2306} {"train_loss": -43.20880889892578, "global_step": 279035, "epoch": 2306} {"train_loss": -43.24262619018555, "global_step": 279036, "epoch": 2306} {"train_loss": -42.890724182128906, "global_step": 279037, "epoch": 2306} {"train_loss": -43.533992767333984, "global_step": 279038, "epoch": 2306} {"train_loss": -43.31527328491211, "global_step": 279039, "epoch": 2306} {"train_loss": -42.50425338745117, "global_step": 279040, "epoch": 2306} {"train_loss": -42.984649658203125, "global_step": 279041, "epoch": 2306} {"train_loss": -42.868587493896484, "global_step": 279042, "epoch": 2306} {"train_loss": -43.213802337646484, "global_step": 279043, "epoch": 2306} {"train_loss": -43.569271087646484, "global_step": 279044, "epoch": 2306} {"train_loss": -43.099205017089844, "global_step": 279045, "epoch": 2306} {"train_loss": -42.1657829284668, "global_step": 279046, "epoch": 2306} {"train_loss": -38.51357650756836, "global_step": 279047, "epoch": 2306} {"train_loss": -38.08906936645508, "global_step": 279048, "epoch": 2306} {"train_loss": -38.609718322753906, "global_step": 279049, "epoch": 2306} {"train_loss": -39.09639358520508, "global_step": 279050, "epoch": 2306} {"train_loss": -41.97699737548828, "global_step": 279051, "epoch": 2306} {"train_loss": -43.312435150146484, "global_step": 279052, "epoch": 2306} {"train_loss": -41.068580627441406, "global_step": 279053, "epoch": 2306} {"train_loss": -41.92165756225586, "global_step": 279054, "epoch": 2306} {"train_loss": -41.48246383666992, "global_step": 279055, "epoch": 2306} {"train_loss": -38.05805587768555, "global_step": 279056, "epoch": 2306} {"train_loss": -37.0751953125, "global_step": 279057, "epoch": 2306} {"train_loss": -34.9292106628418, "global_step": 279058, "epoch": 2306} {"train_loss": -37.743675231933594, "global_step": 279059, "epoch": 2306} {"train_loss": -38.30339431762695, "global_step": 279060, "epoch": 2306} {"train_loss": -39.00642013549805, "global_step": 279061, "epoch": 2306} {"train_loss": -38.69430160522461, "global_step": 279062, "epoch": 2306} {"train_loss": -36.968658447265625, "global_step": 279063, "epoch": 2306} {"train_loss": -36.68569564819336, "global_step": 279064, "epoch": 2306} {"train_loss": -31.880847930908203, "global_step": 279065, "epoch": 2306} {"train_loss": -37.5361213684082, "global_step": 279066, "epoch": 2306} {"train_loss": -40.552215576171875, "global_step": 279067, "epoch": 2306} {"train_loss": -36.90968704223633, "global_step": 279068, "epoch": 2306} {"train_loss": -39.31782150268555, "global_step": 279069, "epoch": 2306} {"train_loss": -34.60603713989258, "global_step": 279070, "epoch": 2306} {"train_loss": -38.01947784423828, "global_step": 279071, "epoch": 2306} {"train_loss": -38.01557540893555, "global_step": 279072, "epoch": 2306} {"train_loss": -37.27906036376953, "global_step": 279073, "epoch": 2306} {"train_loss": -36.97809982299805, "global_step": 279074, "epoch": 2306} {"train_loss": -39.035552978515625, "global_step": 279075, "epoch": 2306} {"train_loss": -38.11499786376953, "global_step": 279076, "epoch": 2306} {"train_loss": -35.31623840332031, "global_step": 279077, "epoch": 2306} {"train_loss": -40.61332702636719, "global_step": 279078, "epoch": 2306} {"train_loss": -34.33161926269531, "global_step": 279079, "epoch": 2306} {"train_loss": -37.99557876586914, "global_step": 279080, "epoch": 2306} {"train_loss": -40.29161071777344, "global_step": 279081, "epoch": 2306} {"train_loss": -39.64341354370117, "global_step": 279082, "epoch": 2306} {"train_loss": -37.43539047241211, "global_step": 279083, "epoch": 2306} {"train_loss": -39.69800567626953, "global_step": 279084, "epoch": 2306} {"train_loss": -39.966670989990234, "global_step": 279085, "epoch": 2306} {"train_loss": -39.824012756347656, "global_step": 279086, "epoch": 2306} {"train_loss": -39.33720779418945, "global_step": 279087, "epoch": 2306} {"train_loss": -35.621070861816406, "global_step": 279088, "epoch": 2306} {"train_loss": -38.7097282409668, "global_step": 279089, "epoch": 2306} {"train_loss": -41.0125846862793, "global_step": 279090, "epoch": 2306} {"train_loss": -39.39386749267578, "global_step": 279091, "epoch": 2306} {"train_loss": -37.214717864990234, "global_step": 279092, "epoch": 2306} {"train_loss": -40.40473556518555, "global_step": 279093, "epoch": 2306} {"train_loss": -37.15727615356445, "global_step": 279094, "epoch": 2306} {"train_loss": -35.83148956298828, "global_step": 279095, "epoch": 2306} {"train_loss": -40.56061935424805, "global_step": 279096, "epoch": 2306} {"train_loss": -41.51563262939453, "global_step": 279097, "epoch": 2306} {"train_loss": -41.457275390625, "global_step": 279098, "epoch": 2306} {"train_loss": -38.27022171020508, "global_step": 279099, "epoch": 2306} {"train_loss": -40.091705322265625, "global_step": 279100, "epoch": 2306} {"train_loss": -40.37623977661133, "global_step": 279101, "epoch": 2306} {"train_loss": -40.631378173828125, "global_step": 279102, "epoch": 2306} {"train_loss": -41.146480560302734, "global_step": 279103, "epoch": 2306} {"train_loss": -41.444515228271484, "global_step": 279104, "epoch": 2306} {"train_loss": -40.22968673706055, "global_step": 279105, "epoch": 2306} {"train_loss": -41.07296371459961, "global_step": 279106, "epoch": 2306} {"train_loss": -40.67158508300781, "global_step": 279107, "epoch": 2306} {"train_loss": -39.103694915771484, "global_step": 279108, "epoch": 2306} {"train_loss": -41.83372116088867, "global_step": 279109, "epoch": 2306} {"train_loss": -41.58230209350586, "global_step": 279110, "epoch": 2306} {"train_loss": -40.128814697265625, "global_step": 279111, "epoch": 2306} {"train_loss": -41.82022476196289, "global_step": 279112, "epoch": 2306} {"train_loss": -41.50312423706055, "global_step": 279113, "epoch": 2306} {"train_loss": -42.01472854614258, "global_step": 279114, "epoch": 2306} {"train_loss": -42.210262298583984, "global_step": 279115, "epoch": 2306} {"train_loss": -39.725799560546875, "global_step": 279116, "epoch": 2306} {"train_loss": -41.30643844604492, "global_step": 279117, "epoch": 2306} {"train_loss": -42.293006896972656, "global_step": 279118, "epoch": 2306} {"train_loss": -42.31142044067383, "global_step": 279119, "epoch": 2306} {"train_loss": -42.176177978515625, "global_step": 279120, "epoch": 2306} {"train_loss": -41.7128791809082, "global_step": 279121, "epoch": 2306} {"train_loss": -39.7470817565918, "global_step": 279122, "epoch": 2306} {"train_loss": -42.1807746887207, "global_step": 279123, "epoch": 2306} {"train_loss": -42.15665817260742, "global_step": 279124, "epoch": 2306} {"train_loss": -41.311946868896484, "global_step": 279125, "epoch": 2306} {"train_loss": -42.03776931762695, "global_step": 279126, "epoch": 2306} {"train_loss": -41.901668548583984, "global_step": 279127, "epoch": 2306} {"train_loss": -42.009464263916016, "global_step": 279128, "epoch": 2306} {"train_loss": -42.36309814453125, "global_step": 279129, "epoch": 2306} {"train_loss": -41.357810974121094, "global_step": 279130, "epoch": 2306} {"train_loss": -41.65396499633789, "global_step": 279131, "epoch": 2306} {"train_loss": -41.93555450439453, "global_step": 279132, "epoch": 2306} {"train_loss": -41.4152717590332, "global_step": 279133, "epoch": 2306} {"train_loss": -41.571834564208984, "global_step": 279134, "epoch": 2306} {"train_loss": -42.43751907348633, "global_step": 279135, "epoch": 2306} {"train_loss": -41.9762077331543, "global_step": 279136, "epoch": 2306} {"train_loss": -42.12749099731445, "global_step": 279137, "epoch": 2306} {"train_loss": -42.32108688354492, "global_step": 279138, "epoch": 2306} {"train_loss": -42.249244689941406, "global_step": 279139, "epoch": 2306} {"train_loss": -41.316680908203125, "global_step": 279140, "epoch": 2306} {"train_loss": -42.48494338989258, "global_step": 279141, "epoch": 2306} {"train_loss": -42.57334518432617, "global_step": 279142, "epoch": 2306} {"train_loss": -42.34709548950195, "global_step": 279143, "epoch": 2306} {"train_loss": -42.6479606628418, "global_step": 279144, "epoch": 2306} {"train_loss": -43.1561279296875, "global_step": 279145, "epoch": 2306} {"train_loss": -40.51473507211228, "global_step": 279146, "epoch": 2306, "val_loss": 2499306.25} {"train_loss": -42.061256408691406, "global_step": 279147, "epoch": 2307} {"train_loss": -41.883052825927734, "global_step": 279148, "epoch": 2307} {"train_loss": -42.498043060302734, "global_step": 279149, "epoch": 2307} {"train_loss": -42.125022888183594, "global_step": 279150, "epoch": 2307} {"train_loss": -41.90621566772461, "global_step": 279151, "epoch": 2307} {"train_loss": -43.2070426940918, "global_step": 279152, "epoch": 2307} {"train_loss": -43.0721549987793, "global_step": 279153, "epoch": 2307} {"train_loss": -42.86623764038086, "global_step": 279154, "epoch": 2307} {"train_loss": -42.11195755004883, "global_step": 279155, "epoch": 2307} {"train_loss": -42.659725189208984, "global_step": 279156, "epoch": 2307} {"train_loss": -42.73299789428711, "global_step": 279157, "epoch": 2307} {"train_loss": -43.470741271972656, "global_step": 279158, "epoch": 2307} {"train_loss": -42.850032806396484, "global_step": 279159, "epoch": 2307} {"train_loss": -43.14936447143555, "global_step": 279160, "epoch": 2307} {"train_loss": -43.49705123901367, "global_step": 279161, "epoch": 2307} {"train_loss": -43.26507568359375, "global_step": 279162, "epoch": 2307} {"train_loss": -43.46675491333008, "global_step": 279163, "epoch": 2307} {"train_loss": -43.47719192504883, "global_step": 279164, "epoch": 2307} {"train_loss": -43.140541076660156, "global_step": 279165, "epoch": 2307} {"train_loss": -43.19181442260742, "global_step": 279166, "epoch": 2307} {"train_loss": -43.04463577270508, "global_step": 279167, "epoch": 2307} {"train_loss": -43.288909912109375, "global_step": 279168, "epoch": 2307} {"train_loss": -42.32060241699219, "global_step": 279169, "epoch": 2307} {"train_loss": -43.34649658203125, "global_step": 279170, "epoch": 2307} {"train_loss": -43.35433578491211, "global_step": 279171, "epoch": 2307} {"train_loss": -43.12881088256836, "global_step": 279172, "epoch": 2307} {"train_loss": -43.02727508544922, "global_step": 279173, "epoch": 2307} {"train_loss": -43.22576904296875, "global_step": 279174, "epoch": 2307} {"train_loss": -42.8717041015625, "global_step": 279175, "epoch": 2307} {"train_loss": -43.25100326538086, "global_step": 279176, "epoch": 2307} {"train_loss": -43.34285354614258, "global_step": 279177, "epoch": 2307} {"train_loss": -43.17356491088867, "global_step": 279178, "epoch": 2307} {"train_loss": -43.46757888793945, "global_step": 279179, "epoch": 2307} {"train_loss": -43.5072021484375, "global_step": 279180, "epoch": 2307} {"train_loss": -42.49201583862305, "global_step": 279181, "epoch": 2307} {"train_loss": -43.25897979736328, "global_step": 279182, "epoch": 2307} {"train_loss": -43.42151641845703, "global_step": 279183, "epoch": 2307} {"train_loss": -43.5103645324707, "global_step": 279184, "epoch": 2307} {"train_loss": -43.0574836730957, "global_step": 279185, "epoch": 2307} {"train_loss": -43.256805419921875, "global_step": 279186, "epoch": 2307} {"train_loss": -43.45076370239258, "global_step": 279187, "epoch": 2307} {"train_loss": -43.395565032958984, "global_step": 279188, "epoch": 2307} {"train_loss": -43.460636138916016, "global_step": 279189, "epoch": 2307} {"train_loss": -43.1221809387207, "global_step": 279190, "epoch": 2307} {"train_loss": -42.44253158569336, "global_step": 279191, "epoch": 2307} {"train_loss": -42.349609375, "global_step": 279192, "epoch": 2307} {"train_loss": -42.7888069152832, "global_step": 279193, "epoch": 2307} {"train_loss": -42.319488525390625, "global_step": 279194, "epoch": 2307} {"train_loss": -42.85493850708008, "global_step": 279195, "epoch": 2307} {"train_loss": -42.918983459472656, "global_step": 279196, "epoch": 2307} {"train_loss": -43.546730041503906, "global_step": 279197, "epoch": 2307} {"train_loss": -43.10493850708008, "global_step": 279198, "epoch": 2307} {"train_loss": -42.12311935424805, "global_step": 279199, "epoch": 2307} {"train_loss": -42.825130462646484, "global_step": 279200, "epoch": 2307} {"train_loss": -43.2503776550293, "global_step": 279201, "epoch": 2307} {"train_loss": -43.430023193359375, "global_step": 279202, "epoch": 2307} {"train_loss": -42.95741653442383, "global_step": 279203, "epoch": 2307} {"train_loss": -43.24515914916992, "global_step": 279204, "epoch": 2307} {"train_loss": -43.44016647338867, "global_step": 279205, "epoch": 2307} {"train_loss": -42.779502868652344, "global_step": 279206, "epoch": 2307} {"train_loss": -43.3956413269043, "global_step": 279207, "epoch": 2307} {"train_loss": -43.42094802856445, "global_step": 279208, "epoch": 2307} {"train_loss": -43.40045928955078, "global_step": 279209, "epoch": 2307} {"train_loss": -43.6300163269043, "global_step": 279210, "epoch": 2307} {"train_loss": -43.248138427734375, "global_step": 279211, "epoch": 2307} {"train_loss": -43.314727783203125, "global_step": 279212, "epoch": 2307} {"train_loss": -41.99457550048828, "global_step": 279213, "epoch": 2307} {"train_loss": -42.1323356628418, "global_step": 279214, "epoch": 2307} {"train_loss": -43.640262603759766, "global_step": 279215, "epoch": 2307} {"train_loss": -43.697608947753906, "global_step": 279216, "epoch": 2307} {"train_loss": -43.19364929199219, "global_step": 279217, "epoch": 2307} {"train_loss": -42.9921760559082, "global_step": 279218, "epoch": 2307} {"train_loss": -43.36085891723633, "global_step": 279219, "epoch": 2307} {"train_loss": -42.1208381652832, "global_step": 279220, "epoch": 2307} {"train_loss": -43.394039154052734, "global_step": 279221, "epoch": 2307} {"train_loss": -42.86571502685547, "global_step": 279222, "epoch": 2307} {"train_loss": -41.24939727783203, "global_step": 279223, "epoch": 2307} {"train_loss": -43.525630950927734, "global_step": 279224, "epoch": 2307} {"train_loss": -42.25101852416992, "global_step": 279225, "epoch": 2307} {"train_loss": -42.56843185424805, "global_step": 279226, "epoch": 2307} {"train_loss": -42.581146240234375, "global_step": 279227, "epoch": 2307} {"train_loss": -42.40236282348633, "global_step": 279228, "epoch": 2307} {"train_loss": -42.0946044921875, "global_step": 279229, "epoch": 2307} {"train_loss": -41.81071853637695, "global_step": 279230, "epoch": 2307} {"train_loss": -43.0897102355957, "global_step": 279231, "epoch": 2307} {"train_loss": -43.2498779296875, "global_step": 279232, "epoch": 2307} {"train_loss": -43.45911407470703, "global_step": 279233, "epoch": 2307} {"train_loss": -42.8095817565918, "global_step": 279234, "epoch": 2307} {"train_loss": -42.3460807800293, "global_step": 279235, "epoch": 2307} {"train_loss": -42.518733978271484, "global_step": 279236, "epoch": 2307} {"train_loss": -42.88447952270508, "global_step": 279237, "epoch": 2307} {"train_loss": -41.181068420410156, "global_step": 279238, "epoch": 2307} {"train_loss": -42.80694580078125, "global_step": 279239, "epoch": 2307} {"train_loss": -41.4072151184082, "global_step": 279240, "epoch": 2307} {"train_loss": -40.938987731933594, "global_step": 279241, "epoch": 2307} {"train_loss": -42.002437591552734, "global_step": 279242, "epoch": 2307} {"train_loss": -42.73933029174805, "global_step": 279243, "epoch": 2307} {"train_loss": -41.0442008972168, "global_step": 279244, "epoch": 2307} {"train_loss": -40.75797653198242, "global_step": 279245, "epoch": 2307} {"train_loss": -42.35578536987305, "global_step": 279246, "epoch": 2307} {"train_loss": -42.331817626953125, "global_step": 279247, "epoch": 2307} {"train_loss": -40.006439208984375, "global_step": 279248, "epoch": 2307} {"train_loss": -41.51609420776367, "global_step": 279249, "epoch": 2307} {"train_loss": -42.30552291870117, "global_step": 279250, "epoch": 2307} {"train_loss": -42.19635009765625, "global_step": 279251, "epoch": 2307} {"train_loss": -40.616329193115234, "global_step": 279252, "epoch": 2307} {"train_loss": -41.2368049621582, "global_step": 279253, "epoch": 2307} {"train_loss": -42.39967346191406, "global_step": 279254, "epoch": 2307} {"train_loss": -42.35013961791992, "global_step": 279255, "epoch": 2307} {"train_loss": -41.86368942260742, "global_step": 279256, "epoch": 2307} {"train_loss": -42.51761245727539, "global_step": 279257, "epoch": 2307} {"train_loss": -42.436767578125, "global_step": 279258, "epoch": 2307} {"train_loss": -42.1512565612793, "global_step": 279259, "epoch": 2307} {"train_loss": -40.97856140136719, "global_step": 279260, "epoch": 2307} {"train_loss": -42.7550048828125, "global_step": 279261, "epoch": 2307} {"train_loss": -42.32331085205078, "global_step": 279262, "epoch": 2307} {"train_loss": -42.20243453979492, "global_step": 279263, "epoch": 2307} {"train_loss": -42.49720001220703, "global_step": 279264, "epoch": 2307} {"train_loss": -42.75582504272461, "global_step": 279265, "epoch": 2307} {"train_loss": -42.36067581176758, "global_step": 279266, "epoch": 2307} {"train_loss": -42.692132461169535, "global_step": 279267, "epoch": 2307, "val_loss": 2478721.0} {"train_loss": -43.21146774291992, "global_step": 279268, "epoch": 2308} {"train_loss": -42.98162078857422, "global_step": 279269, "epoch": 2308} {"train_loss": -42.83687973022461, "global_step": 279270, "epoch": 2308} {"train_loss": -42.995155334472656, "global_step": 279271, "epoch": 2308} {"train_loss": -43.31024932861328, "global_step": 279272, "epoch": 2308} {"train_loss": -43.33842086791992, "global_step": 279273, "epoch": 2308} {"train_loss": -43.15853500366211, "global_step": 279274, "epoch": 2308} {"train_loss": -43.046844482421875, "global_step": 279275, "epoch": 2308} {"train_loss": -43.43197250366211, "global_step": 279276, "epoch": 2308} {"train_loss": -43.2125358581543, "global_step": 279277, "epoch": 2308} {"train_loss": -42.80203628540039, "global_step": 279278, "epoch": 2308} {"train_loss": -42.969146728515625, "global_step": 279279, "epoch": 2308} {"train_loss": -43.24729537963867, "global_step": 279280, "epoch": 2308} {"train_loss": -43.12094497680664, "global_step": 279281, "epoch": 2308} {"train_loss": -43.04469680786133, "global_step": 279282, "epoch": 2308} {"train_loss": -43.331275939941406, "global_step": 279283, "epoch": 2308} {"train_loss": -42.81075668334961, "global_step": 279284, "epoch": 2308} {"train_loss": -42.66719436645508, "global_step": 279285, "epoch": 2308} {"train_loss": -43.470703125, "global_step": 279286, "epoch": 2308} {"train_loss": -43.0111083984375, "global_step": 279287, "epoch": 2308} {"train_loss": -42.24995803833008, "global_step": 279288, "epoch": 2308} {"train_loss": -42.918922424316406, "global_step": 279289, "epoch": 2308} {"train_loss": -43.49978256225586, "global_step": 279290, "epoch": 2308} {"train_loss": -43.20191192626953, "global_step": 279291, "epoch": 2308} {"train_loss": -41.967132568359375, "global_step": 279292, "epoch": 2308} {"train_loss": -43.46424102783203, "global_step": 279293, "epoch": 2308} {"train_loss": -43.136653900146484, "global_step": 279294, "epoch": 2308} {"train_loss": -42.56220626831055, "global_step": 279295, "epoch": 2308} {"train_loss": -42.5086669921875, "global_step": 279296, "epoch": 2308} {"train_loss": -42.771034240722656, "global_step": 279297, "epoch": 2308} {"train_loss": -42.99186325073242, "global_step": 279298, "epoch": 2308} {"train_loss": -43.531612396240234, "global_step": 279299, "epoch": 2308} {"train_loss": -43.2276496887207, "global_step": 279300, "epoch": 2308} {"train_loss": -43.26850891113281, "global_step": 279301, "epoch": 2308} {"train_loss": -42.567413330078125, "global_step": 279302, "epoch": 2308} {"train_loss": -43.981300354003906, "global_step": 279303, "epoch": 2308} {"train_loss": -42.40996170043945, "global_step": 279304, "epoch": 2308} {"train_loss": -42.91688919067383, "global_step": 279305, "epoch": 2308} {"train_loss": -42.06327438354492, "global_step": 279306, "epoch": 2308} {"train_loss": -41.72077178955078, "global_step": 279307, "epoch": 2308} {"train_loss": -40.454898834228516, "global_step": 279308, "epoch": 2308} {"train_loss": -41.85942077636719, "global_step": 279309, "epoch": 2308} {"train_loss": -43.30552291870117, "global_step": 279310, "epoch": 2308} {"train_loss": -43.03691482543945, "global_step": 279311, "epoch": 2308} {"train_loss": -41.923065185546875, "global_step": 279312, "epoch": 2308} {"train_loss": -42.11787033081055, "global_step": 279313, "epoch": 2308} {"train_loss": -42.80665969848633, "global_step": 279314, "epoch": 2308} {"train_loss": -43.475990295410156, "global_step": 279315, "epoch": 2308} {"train_loss": -43.857276916503906, "global_step": 279316, "epoch": 2308} {"train_loss": -43.124000549316406, "global_step": 279317, "epoch": 2308} {"train_loss": -43.12455368041992, "global_step": 279318, "epoch": 2308} {"train_loss": -43.269569396972656, "global_step": 279319, "epoch": 2308} {"train_loss": -43.613033294677734, "global_step": 279320, "epoch": 2308} {"train_loss": -42.16935348510742, "global_step": 279321, "epoch": 2308} {"train_loss": -41.07577133178711, "global_step": 279322, "epoch": 2308} {"train_loss": -42.6528434753418, "global_step": 279323, "epoch": 2308} {"train_loss": -43.41190719604492, "global_step": 279324, "epoch": 2308} {"train_loss": -41.546363830566406, "global_step": 279325, "epoch": 2308} {"train_loss": -41.587738037109375, "global_step": 279326, "epoch": 2308} {"train_loss": -43.61973190307617, "global_step": 279327, "epoch": 2308} {"train_loss": -42.35196304321289, "global_step": 279328, "epoch": 2308} {"train_loss": -42.30179214477539, "global_step": 279329, "epoch": 2308} {"train_loss": -43.44032669067383, "global_step": 279330, "epoch": 2308} {"train_loss": -42.26983642578125, "global_step": 279331, "epoch": 2308} {"train_loss": -41.186161041259766, "global_step": 279332, "epoch": 2308} {"train_loss": -43.391151428222656, "global_step": 279333, "epoch": 2308} {"train_loss": -42.34086990356445, "global_step": 279334, "epoch": 2308} {"train_loss": -42.40906524658203, "global_step": 279335, "epoch": 2308} {"train_loss": -43.0735969543457, "global_step": 279336, "epoch": 2308} {"train_loss": -42.51987838745117, "global_step": 279337, "epoch": 2308} {"train_loss": -42.87520980834961, "global_step": 279338, "epoch": 2308} {"train_loss": -43.01776123046875, "global_step": 279339, "epoch": 2308} {"train_loss": -42.86423110961914, "global_step": 279340, "epoch": 2308} {"train_loss": -41.073883056640625, "global_step": 279341, "epoch": 2308} {"train_loss": -43.40822982788086, "global_step": 279342, "epoch": 2308} {"train_loss": -41.858821868896484, "global_step": 279343, "epoch": 2308} {"train_loss": -40.76958084106445, "global_step": 279344, "epoch": 2308} {"train_loss": -42.571224212646484, "global_step": 279345, "epoch": 2308} {"train_loss": -42.2015380859375, "global_step": 279346, "epoch": 2308} {"train_loss": -42.7718620300293, "global_step": 279347, "epoch": 2308} {"train_loss": -41.99599075317383, "global_step": 279348, "epoch": 2308} {"train_loss": -41.86043167114258, "global_step": 279349, "epoch": 2308} {"train_loss": -43.158058166503906, "global_step": 279350, "epoch": 2308} {"train_loss": -41.740577697753906, "global_step": 279351, "epoch": 2308} {"train_loss": -42.4558219909668, "global_step": 279352, "epoch": 2308} {"train_loss": -42.431697845458984, "global_step": 279353, "epoch": 2308} {"train_loss": -42.09591293334961, "global_step": 279354, "epoch": 2308} {"train_loss": -41.87309265136719, "global_step": 279355, "epoch": 2308} {"train_loss": -42.06304931640625, "global_step": 279356, "epoch": 2308} {"train_loss": -42.42219161987305, "global_step": 279357, "epoch": 2308} {"train_loss": -42.82746887207031, "global_step": 279358, "epoch": 2308} {"train_loss": -42.152565002441406, "global_step": 279359, "epoch": 2308} {"train_loss": -42.3451042175293, "global_step": 279360, "epoch": 2308} {"train_loss": -42.6448860168457, "global_step": 279361, "epoch": 2308} {"train_loss": -43.90916061401367, "global_step": 279362, "epoch": 2308} {"train_loss": -41.8643798828125, "global_step": 279363, "epoch": 2308} {"train_loss": -42.842891693115234, "global_step": 279364, "epoch": 2308} {"train_loss": -42.924068450927734, "global_step": 279365, "epoch": 2308} {"train_loss": -43.20856857299805, "global_step": 279366, "epoch": 2308} {"train_loss": -43.51897048950195, "global_step": 279367, "epoch": 2308} {"train_loss": -43.51675033569336, "global_step": 279368, "epoch": 2308} {"train_loss": -43.37441635131836, "global_step": 279369, "epoch": 2308} {"train_loss": -43.69489669799805, "global_step": 279370, "epoch": 2308} {"train_loss": -43.49784851074219, "global_step": 279371, "epoch": 2308} {"train_loss": -43.7120361328125, "global_step": 279372, "epoch": 2308} {"train_loss": -42.77708053588867, "global_step": 279373, "epoch": 2308} {"train_loss": -43.79410171508789, "global_step": 279374, "epoch": 2308} {"train_loss": -43.33445358276367, "global_step": 279375, "epoch": 2308} {"train_loss": -42.83613967895508, "global_step": 279376, "epoch": 2308} {"train_loss": -43.43365478515625, "global_step": 279377, "epoch": 2308} {"train_loss": -42.02584457397461, "global_step": 279378, "epoch": 2308} {"train_loss": -42.70234298706055, "global_step": 279379, "epoch": 2308} {"train_loss": -42.329750061035156, "global_step": 279380, "epoch": 2308} {"train_loss": -43.785526275634766, "global_step": 279381, "epoch": 2308} {"train_loss": -42.46466827392578, "global_step": 279382, "epoch": 2308} {"train_loss": -43.209495544433594, "global_step": 279383, "epoch": 2308} {"train_loss": -43.05978012084961, "global_step": 279384, "epoch": 2308} {"train_loss": -42.54293441772461, "global_step": 279385, "epoch": 2308} {"train_loss": -42.75565719604492, "global_step": 279386, "epoch": 2308} {"train_loss": -43.0703239440918, "global_step": 279387, "epoch": 2308} {"train_loss": -42.765247029706465, "global_step": 279388, "epoch": 2308, "val_loss": 2441405.0} {"train_loss": -43.08208084106445, "global_step": 279389, "epoch": 2309} {"train_loss": -43.40684127807617, "global_step": 279390, "epoch": 2309} {"train_loss": -42.82856369018555, "global_step": 279391, "epoch": 2309} {"train_loss": -41.36666488647461, "global_step": 279392, "epoch": 2309} {"train_loss": -42.964603424072266, "global_step": 279393, "epoch": 2309} {"train_loss": -42.45539474487305, "global_step": 279394, "epoch": 2309} {"train_loss": -43.13724899291992, "global_step": 279395, "epoch": 2309} {"train_loss": -42.35845947265625, "global_step": 279396, "epoch": 2309} {"train_loss": -42.32209396362305, "global_step": 279397, "epoch": 2309} {"train_loss": -42.4097785949707, "global_step": 279398, "epoch": 2309} {"train_loss": -43.177833557128906, "global_step": 279399, "epoch": 2309} {"train_loss": -43.38111114501953, "global_step": 279400, "epoch": 2309} {"train_loss": -43.05059051513672, "global_step": 279401, "epoch": 2309} {"train_loss": -42.96723556518555, "global_step": 279402, "epoch": 2309} {"train_loss": -43.598304748535156, "global_step": 279403, "epoch": 2309} {"train_loss": -43.31853103637695, "global_step": 279404, "epoch": 2309} {"train_loss": -43.11272048950195, "global_step": 279405, "epoch": 2309} {"train_loss": -43.670143127441406, "global_step": 279406, "epoch": 2309} {"train_loss": -43.100852966308594, "global_step": 279407, "epoch": 2309} {"train_loss": -43.21757888793945, "global_step": 279408, "epoch": 2309} {"train_loss": -43.3039436340332, "global_step": 279409, "epoch": 2309} {"train_loss": -43.48307418823242, "global_step": 279410, "epoch": 2309} {"train_loss": -42.654991149902344, "global_step": 279411, "epoch": 2309} {"train_loss": -41.4759407043457, "global_step": 279412, "epoch": 2309} {"train_loss": -42.828426361083984, "global_step": 279413, "epoch": 2309} {"train_loss": -43.019039154052734, "global_step": 279414, "epoch": 2309} {"train_loss": -43.42367172241211, "global_step": 279415, "epoch": 2309} {"train_loss": -42.70780563354492, "global_step": 279416, "epoch": 2309} {"train_loss": -43.0467643737793, "global_step": 279417, "epoch": 2309} {"train_loss": -42.7590217590332, "global_step": 279418, "epoch": 2309} {"train_loss": -42.73814392089844, "global_step": 279419, "epoch": 2309} {"train_loss": -43.337867736816406, "global_step": 279420, "epoch": 2309} {"train_loss": -42.070823669433594, "global_step": 279421, "epoch": 2309} {"train_loss": -42.75443649291992, "global_step": 279422, "epoch": 2309} {"train_loss": -43.444515228271484, "global_step": 279423, "epoch": 2309} {"train_loss": -42.379058837890625, "global_step": 279424, "epoch": 2309} {"train_loss": -43.145259857177734, "global_step": 279425, "epoch": 2309} {"train_loss": -43.77530288696289, "global_step": 279426, "epoch": 2309} {"train_loss": -42.756526947021484, "global_step": 279427, "epoch": 2309} {"train_loss": -43.22663497924805, "global_step": 279428, "epoch": 2309} {"train_loss": -43.56399154663086, "global_step": 279429, "epoch": 2309} {"train_loss": -42.15985870361328, "global_step": 279430, "epoch": 2309} {"train_loss": -43.0952262878418, "global_step": 279431, "epoch": 2309} {"train_loss": -43.320552825927734, "global_step": 279432, "epoch": 2309} {"train_loss": -43.40266799926758, "global_step": 279433, "epoch": 2309} {"train_loss": -43.76591110229492, "global_step": 279434, "epoch": 2309} {"train_loss": -43.15024948120117, "global_step": 279435, "epoch": 2309} {"train_loss": -41.813507080078125, "global_step": 279436, "epoch": 2309} {"train_loss": -41.79580307006836, "global_step": 279437, "epoch": 2309} {"train_loss": -42.06331253051758, "global_step": 279438, "epoch": 2309} {"train_loss": -41.440277099609375, "global_step": 279439, "epoch": 2309} {"train_loss": -42.71029281616211, "global_step": 279440, "epoch": 2309} {"train_loss": -42.89329147338867, "global_step": 279441, "epoch": 2309} {"train_loss": -43.13446044921875, "global_step": 279442, "epoch": 2309} {"train_loss": -43.501007080078125, "global_step": 279443, "epoch": 2309} {"train_loss": -43.202816009521484, "global_step": 279444, "epoch": 2309} {"train_loss": -43.11136245727539, "global_step": 279445, "epoch": 2309} {"train_loss": -43.045204162597656, "global_step": 279446, "epoch": 2309} {"train_loss": -43.45574188232422, "global_step": 279447, "epoch": 2309} {"train_loss": -43.57046127319336, "global_step": 279448, "epoch": 2309} {"train_loss": -43.49590301513672, "global_step": 279449, "epoch": 2309} {"train_loss": -43.86794662475586, "global_step": 279450, "epoch": 2309} {"train_loss": -43.48988342285156, "global_step": 279451, "epoch": 2309} {"train_loss": -43.69257736206055, "global_step": 279452, "epoch": 2309} {"train_loss": -42.942867279052734, "global_step": 279453, "epoch": 2309} {"train_loss": -39.38086700439453, "global_step": 279454, "epoch": 2309} {"train_loss": -41.09723663330078, "global_step": 279455, "epoch": 2309} {"train_loss": -43.571388244628906, "global_step": 279456, "epoch": 2309} {"train_loss": -43.54612350463867, "global_step": 279457, "epoch": 2309} {"train_loss": -43.34259796142578, "global_step": 279458, "epoch": 2309} {"train_loss": -42.636505126953125, "global_step": 279459, "epoch": 2309} {"train_loss": -43.74979782104492, "global_step": 279460, "epoch": 2309} {"train_loss": -42.46786117553711, "global_step": 279461, "epoch": 2309} {"train_loss": -43.045711517333984, "global_step": 279462, "epoch": 2309} {"train_loss": -42.726654052734375, "global_step": 279463, "epoch": 2309} {"train_loss": -42.790374755859375, "global_step": 279464, "epoch": 2309} {"train_loss": -43.65903854370117, "global_step": 279465, "epoch": 2309} {"train_loss": -43.942440032958984, "global_step": 279466, "epoch": 2309} {"train_loss": -43.164794921875, "global_step": 279467, "epoch": 2309} {"train_loss": -44.389442443847656, "global_step": 279468, "epoch": 2309} {"train_loss": -43.16934585571289, "global_step": 279469, "epoch": 2309} {"train_loss": -43.76187515258789, "global_step": 279470, "epoch": 2309} {"train_loss": -43.6351432800293, "global_step": 279471, "epoch": 2309} {"train_loss": -42.32033920288086, "global_step": 279472, "epoch": 2309} {"train_loss": -43.34299850463867, "global_step": 279473, "epoch": 2309} {"train_loss": -43.694190979003906, "global_step": 279474, "epoch": 2309} {"train_loss": -39.60157775878906, "global_step": 279475, "epoch": 2309} {"train_loss": -43.30152130126953, "global_step": 279476, "epoch": 2309} {"train_loss": -43.823360443115234, "global_step": 279477, "epoch": 2309} {"train_loss": -41.00874328613281, "global_step": 279478, "epoch": 2309} {"train_loss": -42.88726806640625, "global_step": 279479, "epoch": 2309} {"train_loss": -40.2779541015625, "global_step": 279480, "epoch": 2309} {"train_loss": -42.93272018432617, "global_step": 279481, "epoch": 2309} {"train_loss": -41.92403793334961, "global_step": 279482, "epoch": 2309} {"train_loss": -38.57907485961914, "global_step": 279483, "epoch": 2309} {"train_loss": -42.217159271240234, "global_step": 279484, "epoch": 2309} {"train_loss": -41.158138275146484, "global_step": 279485, "epoch": 2309} {"train_loss": -41.963172912597656, "global_step": 279486, "epoch": 2309} {"train_loss": -35.431453704833984, "global_step": 279487, "epoch": 2309} {"train_loss": -38.269691467285156, "global_step": 279488, "epoch": 2309} {"train_loss": -38.881866455078125, "global_step": 279489, "epoch": 2309} {"train_loss": -39.05723190307617, "global_step": 279490, "epoch": 2309} {"train_loss": -38.11410140991211, "global_step": 279491, "epoch": 2309} {"train_loss": -38.90472412109375, "global_step": 279492, "epoch": 2309} {"train_loss": -40.80544662475586, "global_step": 279493, "epoch": 2309} {"train_loss": -41.37980651855469, "global_step": 279494, "epoch": 2309} {"train_loss": -42.47883987426758, "global_step": 279495, "epoch": 2309} {"train_loss": -41.08057403564453, "global_step": 279496, "epoch": 2309} {"train_loss": -40.410926818847656, "global_step": 279497, "epoch": 2309} {"train_loss": -42.14980697631836, "global_step": 279498, "epoch": 2309} {"train_loss": -39.3788948059082, "global_step": 279499, "epoch": 2309} {"train_loss": -39.832298278808594, "global_step": 279500, "epoch": 2309} {"train_loss": -38.24210739135742, "global_step": 279501, "epoch": 2309} {"train_loss": -40.084144592285156, "global_step": 279502, "epoch": 2309} {"train_loss": -39.973140716552734, "global_step": 279503, "epoch": 2309} {"train_loss": -41.55828857421875, "global_step": 279504, "epoch": 2309} {"train_loss": -36.73424530029297, "global_step": 279505, "epoch": 2309} {"train_loss": -39.185829162597656, "global_step": 279506, "epoch": 2309} {"train_loss": -36.59560012817383, "global_step": 279507, "epoch": 2309} {"train_loss": -39.21064376831055, "global_step": 279508, "epoch": 2309} {"train_loss": -42.14402856117438, "global_step": 279509, "epoch": 2309, "val_loss": 2601088.25} {"train_loss": -33.11518859863281, "global_step": 279510, "epoch": 2310} {"train_loss": -37.30625534057617, "global_step": 279511, "epoch": 2310} {"train_loss": -36.43182373046875, "global_step": 279512, "epoch": 2310} {"train_loss": -40.49994659423828, "global_step": 279513, "epoch": 2310} {"train_loss": -35.157466888427734, "global_step": 279514, "epoch": 2310} {"train_loss": -38.88004684448242, "global_step": 279515, "epoch": 2310} {"train_loss": -40.67609786987305, "global_step": 279516, "epoch": 2310} {"train_loss": -36.91228103637695, "global_step": 279517, "epoch": 2310} {"train_loss": -40.928260803222656, "global_step": 279518, "epoch": 2310} {"train_loss": -38.902164459228516, "global_step": 279519, "epoch": 2310} {"train_loss": -37.93529510498047, "global_step": 279520, "epoch": 2310} {"train_loss": -41.645790100097656, "global_step": 279521, "epoch": 2310} {"train_loss": -40.67367172241211, "global_step": 279522, "epoch": 2310} {"train_loss": -40.2730712890625, "global_step": 279523, "epoch": 2310} {"train_loss": -40.92542266845703, "global_step": 279524, "epoch": 2310} {"train_loss": -40.894710540771484, "global_step": 279525, "epoch": 2310} {"train_loss": -40.148651123046875, "global_step": 279526, "epoch": 2310} {"train_loss": -41.7616081237793, "global_step": 279527, "epoch": 2310} {"train_loss": -41.44558334350586, "global_step": 279528, "epoch": 2310} {"train_loss": -40.792877197265625, "global_step": 279529, "epoch": 2310} {"train_loss": -42.459144592285156, "global_step": 279530, "epoch": 2310} {"train_loss": -41.85017776489258, "global_step": 279531, "epoch": 2310} {"train_loss": -40.523738861083984, "global_step": 279532, "epoch": 2310} {"train_loss": -42.016719818115234, "global_step": 279533, "epoch": 2310} {"train_loss": -40.87575912475586, "global_step": 279534, "epoch": 2310} {"train_loss": -40.90450668334961, "global_step": 279535, "epoch": 2310} {"train_loss": -40.33534622192383, "global_step": 279536, "epoch": 2310} {"train_loss": -42.210601806640625, "global_step": 279537, "epoch": 2310} {"train_loss": -42.01508712768555, "global_step": 279538, "epoch": 2310} {"train_loss": -41.59049987792969, "global_step": 279539, "epoch": 2310} {"train_loss": -42.820716857910156, "global_step": 279540, "epoch": 2310} {"train_loss": -42.3699951171875, "global_step": 279541, "epoch": 2310} {"train_loss": -41.64725875854492, "global_step": 279542, "epoch": 2310} {"train_loss": -42.107913970947266, "global_step": 279543, "epoch": 2310} {"train_loss": -41.447505950927734, "global_step": 279544, "epoch": 2310} {"train_loss": -42.37977981567383, "global_step": 279545, "epoch": 2310} {"train_loss": -41.98371124267578, "global_step": 279546, "epoch": 2310} {"train_loss": -41.64704132080078, "global_step": 279547, "epoch": 2310} {"train_loss": -42.4647216796875, "global_step": 279548, "epoch": 2310} {"train_loss": -42.3812141418457, "global_step": 279549, "epoch": 2310} {"train_loss": -42.12324905395508, "global_step": 279550, "epoch": 2310} {"train_loss": -42.567195892333984, "global_step": 279551, "epoch": 2310} {"train_loss": -42.560646057128906, "global_step": 279552, "epoch": 2310} {"train_loss": -40.80695724487305, "global_step": 279553, "epoch": 2310} {"train_loss": -41.2900276184082, "global_step": 279554, "epoch": 2310} {"train_loss": -41.91402053833008, "global_step": 279555, "epoch": 2310} {"train_loss": -42.88121032714844, "global_step": 279556, "epoch": 2310} {"train_loss": -42.24055099487305, "global_step": 279557, "epoch": 2310} {"train_loss": -42.71409225463867, "global_step": 279558, "epoch": 2310} {"train_loss": -42.10733413696289, "global_step": 279559, "epoch": 2310} {"train_loss": -42.45966720581055, "global_step": 279560, "epoch": 2310} {"train_loss": -43.06060791015625, "global_step": 279561, "epoch": 2310} {"train_loss": -41.5091438293457, "global_step": 279562, "epoch": 2310} {"train_loss": -13.508918762207031, "global_step": 279563, "epoch": 2310} {"train_loss": -28.616575241088867, "global_step": 279564, "epoch": 2310} {"train_loss": -35.8817024230957, "global_step": 279565, "epoch": 2310} {"train_loss": -41.815643310546875, "global_step": 279566, "epoch": 2310} {"train_loss": -39.490169525146484, "global_step": 279567, "epoch": 2310} {"train_loss": -32.15065383911133, "global_step": 279568, "epoch": 2310} {"train_loss": -34.178646087646484, "global_step": 279569, "epoch": 2310} {"train_loss": -40.21154022216797, "global_step": 279570, "epoch": 2310} {"train_loss": -39.26609420776367, "global_step": 279571, "epoch": 2310} {"train_loss": -19.61371421813965, "global_step": 279572, "epoch": 2310} {"train_loss": -32.98130416870117, "global_step": 279573, "epoch": 2310} {"train_loss": -38.84226608276367, "global_step": 279574, "epoch": 2310} {"train_loss": -35.60968017578125, "global_step": 279575, "epoch": 2310} {"train_loss": -39.423614501953125, "global_step": 279576, "epoch": 2310} {"train_loss": -36.96839141845703, "global_step": 279577, "epoch": 2310} {"train_loss": -34.850563049316406, "global_step": 279578, "epoch": 2310} {"train_loss": -35.770118713378906, "global_step": 279579, "epoch": 2310} {"train_loss": -28.606103897094727, "global_step": 279580, "epoch": 2310} {"train_loss": -39.185733795166016, "global_step": 279581, "epoch": 2310} {"train_loss": -38.541847229003906, "global_step": 279582, "epoch": 2310} {"train_loss": -38.69227981567383, "global_step": 279583, "epoch": 2310} {"train_loss": -32.5827751159668, "global_step": 279584, "epoch": 2310} {"train_loss": -36.85056686401367, "global_step": 279585, "epoch": 2310} {"train_loss": -39.061763763427734, "global_step": 279586, "epoch": 2310} {"train_loss": -38.783870697021484, "global_step": 279587, "epoch": 2310} {"train_loss": -38.47226333618164, "global_step": 279588, "epoch": 2310} {"train_loss": -38.224639892578125, "global_step": 279589, "epoch": 2310} {"train_loss": -39.338497161865234, "global_step": 279590, "epoch": 2310} {"train_loss": -38.82146072387695, "global_step": 279591, "epoch": 2310} {"train_loss": -38.593231201171875, "global_step": 279592, "epoch": 2310} {"train_loss": -39.54163360595703, "global_step": 279593, "epoch": 2310} {"train_loss": -39.45479965209961, "global_step": 279594, "epoch": 2310} {"train_loss": -39.23057556152344, "global_step": 279595, "epoch": 2310} {"train_loss": -38.4966926574707, "global_step": 279596, "epoch": 2310} {"train_loss": -39.64017105102539, "global_step": 279597, "epoch": 2310} {"train_loss": -40.43961715698242, "global_step": 279598, "epoch": 2310} {"train_loss": -39.15401840209961, "global_step": 279599, "epoch": 2310} {"train_loss": -38.92024612426758, "global_step": 279600, "epoch": 2310} {"train_loss": -40.50112533569336, "global_step": 279601, "epoch": 2310} {"train_loss": -39.67427444458008, "global_step": 279602, "epoch": 2310} {"train_loss": -39.48596954345703, "global_step": 279603, "epoch": 2310} {"train_loss": -39.61323165893555, "global_step": 279604, "epoch": 2310} {"train_loss": -40.60775375366211, "global_step": 279605, "epoch": 2310} {"train_loss": -40.736263275146484, "global_step": 279606, "epoch": 2310} {"train_loss": -39.83160400390625, "global_step": 279607, "epoch": 2310} {"train_loss": -39.83748245239258, "global_step": 279608, "epoch": 2310} {"train_loss": -40.55010986328125, "global_step": 279609, "epoch": 2310} {"train_loss": -40.392330169677734, "global_step": 279610, "epoch": 2310} {"train_loss": -40.71512985229492, "global_step": 279611, "epoch": 2310} {"train_loss": -40.19409942626953, "global_step": 279612, "epoch": 2310} {"train_loss": -39.283077239990234, "global_step": 279613, "epoch": 2310} {"train_loss": -40.015987396240234, "global_step": 279614, "epoch": 2310} {"train_loss": -39.732418060302734, "global_step": 279615, "epoch": 2310} {"train_loss": -41.127899169921875, "global_step": 279616, "epoch": 2310} {"train_loss": -41.46413803100586, "global_step": 279617, "epoch": 2310} {"train_loss": -40.62562942504883, "global_step": 279618, "epoch": 2310} {"train_loss": -39.80152130126953, "global_step": 279619, "epoch": 2310} {"train_loss": -41.099090576171875, "global_step": 279620, "epoch": 2310} {"train_loss": -41.484771728515625, "global_step": 279621, "epoch": 2310} {"train_loss": -40.5477409362793, "global_step": 279622, "epoch": 2310} {"train_loss": -41.04848861694336, "global_step": 279623, "epoch": 2310} {"train_loss": -40.70980453491211, "global_step": 279624, "epoch": 2310} {"train_loss": -40.81003952026367, "global_step": 279625, "epoch": 2310} {"train_loss": -41.395301818847656, "global_step": 279626, "epoch": 2310} {"train_loss": -41.59933090209961, "global_step": 279627, "epoch": 2310} {"train_loss": -40.69440460205078, "global_step": 279628, "epoch": 2310} {"train_loss": -40.37708282470703, "global_step": 279629, "epoch": 2310} {"train_loss": -39.38103540278664, "global_step": 279630, "epoch": 2310, "val_loss": 2473899.75} {"train_loss": -40.78703689575195, "global_step": 279631, "epoch": 2311} {"train_loss": -41.65639877319336, "global_step": 279632, "epoch": 2311} {"train_loss": -41.424800872802734, "global_step": 279633, "epoch": 2311} {"train_loss": -41.782257080078125, "global_step": 279634, "epoch": 2311} {"train_loss": -40.67615509033203, "global_step": 279635, "epoch": 2311} {"train_loss": -40.81056213378906, "global_step": 279636, "epoch": 2311} {"train_loss": -41.2879753112793, "global_step": 279637, "epoch": 2311} {"train_loss": -41.084781646728516, "global_step": 279638, "epoch": 2311} {"train_loss": -40.83882522583008, "global_step": 279639, "epoch": 2311} {"train_loss": -42.13544845581055, "global_step": 279640, "epoch": 2311} {"train_loss": -41.972660064697266, "global_step": 279641, "epoch": 2311} {"train_loss": -42.03181838989258, "global_step": 279642, "epoch": 2311} {"train_loss": -41.72597885131836, "global_step": 279643, "epoch": 2311} {"train_loss": -42.05739974975586, "global_step": 279644, "epoch": 2311} {"train_loss": -41.8047981262207, "global_step": 279645, "epoch": 2311} {"train_loss": -41.22956085205078, "global_step": 279646, "epoch": 2311} {"train_loss": -42.26829147338867, "global_step": 279647, "epoch": 2311} {"train_loss": -41.7662353515625, "global_step": 279648, "epoch": 2311} {"train_loss": -41.90818786621094, "global_step": 279649, "epoch": 2311} {"train_loss": -42.08992385864258, "global_step": 279650, "epoch": 2311} {"train_loss": -42.4348258972168, "global_step": 279651, "epoch": 2311} {"train_loss": -41.479835510253906, "global_step": 279652, "epoch": 2311} {"train_loss": -41.36898422241211, "global_step": 279653, "epoch": 2311} {"train_loss": -41.89896774291992, "global_step": 279654, "epoch": 2311} {"train_loss": -42.476966857910156, "global_step": 279655, "epoch": 2311} {"train_loss": -43.1368522644043, "global_step": 279656, "epoch": 2311} {"train_loss": -41.635894775390625, "global_step": 279657, "epoch": 2311} {"train_loss": -41.72926330566406, "global_step": 279658, "epoch": 2311} {"train_loss": -40.7857666015625, "global_step": 279659, "epoch": 2311} {"train_loss": -42.44108963012695, "global_step": 279660, "epoch": 2311} {"train_loss": -42.0319709777832, "global_step": 279661, "epoch": 2311} {"train_loss": -41.14802169799805, "global_step": 279662, "epoch": 2311} {"train_loss": -42.940731048583984, "global_step": 279663, "epoch": 2311} {"train_loss": -41.68366622924805, "global_step": 279664, "epoch": 2311} {"train_loss": -41.50651168823242, "global_step": 279665, "epoch": 2311} {"train_loss": -42.382266998291016, "global_step": 279666, "epoch": 2311} {"train_loss": -42.07888412475586, "global_step": 279667, "epoch": 2311} {"train_loss": -42.325111389160156, "global_step": 279668, "epoch": 2311} {"train_loss": -42.873661041259766, "global_step": 279669, "epoch": 2311} {"train_loss": -42.95427322387695, "global_step": 279670, "epoch": 2311} {"train_loss": -42.42887878417969, "global_step": 279671, "epoch": 2311} {"train_loss": -41.60087203979492, "global_step": 279672, "epoch": 2311} {"train_loss": -42.862178802490234, "global_step": 279673, "epoch": 2311} {"train_loss": -42.87244415283203, "global_step": 279674, "epoch": 2311} {"train_loss": -42.60872268676758, "global_step": 279675, "epoch": 2311} {"train_loss": -42.585601806640625, "global_step": 279676, "epoch": 2311} {"train_loss": -41.877685546875, "global_step": 279677, "epoch": 2311} {"train_loss": -42.768123626708984, "global_step": 279678, "epoch": 2311} {"train_loss": -42.23031997680664, "global_step": 279679, "epoch": 2311} {"train_loss": -42.26456832885742, "global_step": 279680, "epoch": 2311} {"train_loss": -42.337371826171875, "global_step": 279681, "epoch": 2311} {"train_loss": -42.6064567565918, "global_step": 279682, "epoch": 2311} {"train_loss": -42.459991455078125, "global_step": 279683, "epoch": 2311} {"train_loss": -42.51634979248047, "global_step": 279684, "epoch": 2311} {"train_loss": -42.9925537109375, "global_step": 279685, "epoch": 2311} {"train_loss": -42.50539016723633, "global_step": 279686, "epoch": 2311} {"train_loss": -42.10520935058594, "global_step": 279687, "epoch": 2311} {"train_loss": -43.07434844970703, "global_step": 279688, "epoch": 2311} {"train_loss": -41.69655227661133, "global_step": 279689, "epoch": 2311} {"train_loss": -41.545692443847656, "global_step": 279690, "epoch": 2311} {"train_loss": -42.705684661865234, "global_step": 279691, "epoch": 2311} {"train_loss": -43.051448822021484, "global_step": 279692, "epoch": 2311} {"train_loss": -42.159366607666016, "global_step": 279693, "epoch": 2311} {"train_loss": -43.21731185913086, "global_step": 279694, "epoch": 2311} {"train_loss": -43.1292839050293, "global_step": 279695, "epoch": 2311} {"train_loss": -42.953182220458984, "global_step": 279696, "epoch": 2311} {"train_loss": -43.23408126831055, "global_step": 279697, "epoch": 2311} {"train_loss": -42.805362701416016, "global_step": 279698, "epoch": 2311} {"train_loss": -43.065086364746094, "global_step": 279699, "epoch": 2311} {"train_loss": -42.419551849365234, "global_step": 279700, "epoch": 2311} {"train_loss": -43.103851318359375, "global_step": 279701, "epoch": 2311} {"train_loss": -40.881324768066406, "global_step": 279702, "epoch": 2311} {"train_loss": -42.87746810913086, "global_step": 279703, "epoch": 2311} {"train_loss": -42.868858337402344, "global_step": 279704, "epoch": 2311} {"train_loss": -41.63682174682617, "global_step": 279705, "epoch": 2311} {"train_loss": -42.550777435302734, "global_step": 279706, "epoch": 2311} {"train_loss": -43.29193878173828, "global_step": 279707, "epoch": 2311} {"train_loss": -42.46885299682617, "global_step": 279708, "epoch": 2311} {"train_loss": -43.08658981323242, "global_step": 279709, "epoch": 2311} {"train_loss": -43.19792556762695, "global_step": 279710, "epoch": 2311} {"train_loss": -42.219573974609375, "global_step": 279711, "epoch": 2311} {"train_loss": -43.40510940551758, "global_step": 279712, "epoch": 2311} {"train_loss": -42.4423828125, "global_step": 279713, "epoch": 2311} {"train_loss": -41.861934661865234, "global_step": 279714, "epoch": 2311} {"train_loss": -42.57868957519531, "global_step": 279715, "epoch": 2311} {"train_loss": -42.31809997558594, "global_step": 279716, "epoch": 2311} {"train_loss": -41.93394088745117, "global_step": 279717, "epoch": 2311} {"train_loss": -42.800838470458984, "global_step": 279718, "epoch": 2311} {"train_loss": -43.07432174682617, "global_step": 279719, "epoch": 2311} {"train_loss": -42.454776763916016, "global_step": 279720, "epoch": 2311} {"train_loss": -42.87313461303711, "global_step": 279721, "epoch": 2311} {"train_loss": -43.38628387451172, "global_step": 279722, "epoch": 2311} {"train_loss": -42.81435012817383, "global_step": 279723, "epoch": 2311} {"train_loss": -43.469390869140625, "global_step": 279724, "epoch": 2311} {"train_loss": -42.46377182006836, "global_step": 279725, "epoch": 2311} {"train_loss": -42.983036041259766, "global_step": 279726, "epoch": 2311} {"train_loss": -43.13990020751953, "global_step": 279727, "epoch": 2311} {"train_loss": -40.98179244995117, "global_step": 279728, "epoch": 2311} {"train_loss": -42.46308898925781, "global_step": 279729, "epoch": 2311} {"train_loss": -40.4850959777832, "global_step": 279730, "epoch": 2311} {"train_loss": -42.26805114746094, "global_step": 279731, "epoch": 2311} {"train_loss": -42.59662628173828, "global_step": 279732, "epoch": 2311} {"train_loss": -42.61181640625, "global_step": 279733, "epoch": 2311} {"train_loss": -43.00682830810547, "global_step": 279734, "epoch": 2311} {"train_loss": -42.54278564453125, "global_step": 279735, "epoch": 2311} {"train_loss": -41.69918441772461, "global_step": 279736, "epoch": 2311} {"train_loss": -42.99614715576172, "global_step": 279737, "epoch": 2311} {"train_loss": -42.40037536621094, "global_step": 279738, "epoch": 2311} {"train_loss": -42.82074737548828, "global_step": 279739, "epoch": 2311} {"train_loss": -42.15149688720703, "global_step": 279740, "epoch": 2311} {"train_loss": -43.126373291015625, "global_step": 279741, "epoch": 2311} {"train_loss": -41.969970703125, "global_step": 279742, "epoch": 2311} {"train_loss": -42.964900970458984, "global_step": 279743, "epoch": 2311} {"train_loss": -42.963924407958984, "global_step": 279744, "epoch": 2311} {"train_loss": -43.38625717163086, "global_step": 279745, "epoch": 2311} {"train_loss": -42.65143585205078, "global_step": 279746, "epoch": 2311} {"train_loss": -42.658390045166016, "global_step": 279747, "epoch": 2311} {"train_loss": -42.35493087768555, "global_step": 279748, "epoch": 2311} {"train_loss": -41.844512939453125, "global_step": 279749, "epoch": 2311} {"train_loss": -42.20616149902344, "global_step": 279750, "epoch": 2311} {"train_loss": -42.308089768591, "global_step": 279751, "epoch": 2311, "val_loss": 2426757.25} {"train_loss": -42.59062576293945, "global_step": 279752, "epoch": 2312} {"train_loss": -42.9606819152832, "global_step": 279753, "epoch": 2312} {"train_loss": -42.87579345703125, "global_step": 279754, "epoch": 2312} {"train_loss": -41.96738052368164, "global_step": 279755, "epoch": 2312} {"train_loss": -42.36259078979492, "global_step": 279756, "epoch": 2312} {"train_loss": -41.07963562011719, "global_step": 279757, "epoch": 2312} {"train_loss": -42.52021408081055, "global_step": 279758, "epoch": 2312} {"train_loss": -41.1760368347168, "global_step": 279759, "epoch": 2312} {"train_loss": -41.20491409301758, "global_step": 279760, "epoch": 2312} {"train_loss": -42.72355270385742, "global_step": 279761, "epoch": 2312} {"train_loss": -42.4874267578125, "global_step": 279762, "epoch": 2312} {"train_loss": -42.97821044921875, "global_step": 279763, "epoch": 2312} {"train_loss": -43.12489318847656, "global_step": 279764, "epoch": 2312} {"train_loss": -42.92688751220703, "global_step": 279765, "epoch": 2312} {"train_loss": -42.39896774291992, "global_step": 279766, "epoch": 2312} {"train_loss": -41.845245361328125, "global_step": 279767, "epoch": 2312} {"train_loss": -42.2967643737793, "global_step": 279768, "epoch": 2312} {"train_loss": -42.95835494995117, "global_step": 279769, "epoch": 2312} {"train_loss": -42.56031036376953, "global_step": 279770, "epoch": 2312} {"train_loss": -42.76579666137695, "global_step": 279771, "epoch": 2312} {"train_loss": -42.5645866394043, "global_step": 279772, "epoch": 2312} {"train_loss": -42.751953125, "global_step": 279773, "epoch": 2312} {"train_loss": -42.11573028564453, "global_step": 279774, "epoch": 2312} {"train_loss": -39.647300720214844, "global_step": 279775, "epoch": 2312} {"train_loss": -38.150848388671875, "global_step": 279776, "epoch": 2312} {"train_loss": -40.08987045288086, "global_step": 279777, "epoch": 2312} {"train_loss": -41.58315658569336, "global_step": 279778, "epoch": 2312} {"train_loss": -42.27851486206055, "global_step": 279779, "epoch": 2312} {"train_loss": -41.02207565307617, "global_step": 279780, "epoch": 2312} {"train_loss": -40.2481575012207, "global_step": 279781, "epoch": 2312} {"train_loss": -39.6692008972168, "global_step": 279782, "epoch": 2312} {"train_loss": -41.728755950927734, "global_step": 279783, "epoch": 2312} {"train_loss": -42.19049835205078, "global_step": 279784, "epoch": 2312} {"train_loss": -41.87498092651367, "global_step": 279785, "epoch": 2312} {"train_loss": -42.471126556396484, "global_step": 279786, "epoch": 2312} {"train_loss": -39.564449310302734, "global_step": 279787, "epoch": 2312} {"train_loss": -36.51612091064453, "global_step": 279788, "epoch": 2312} {"train_loss": -38.65787887573242, "global_step": 279789, "epoch": 2312} {"train_loss": -42.70201873779297, "global_step": 279790, "epoch": 2312} {"train_loss": -39.69761276245117, "global_step": 279791, "epoch": 2312} {"train_loss": -37.01528549194336, "global_step": 279792, "epoch": 2312} {"train_loss": -41.10831832885742, "global_step": 279793, "epoch": 2312} {"train_loss": -41.713172912597656, "global_step": 279794, "epoch": 2312} {"train_loss": -39.450897216796875, "global_step": 279795, "epoch": 2312} {"train_loss": -41.21068572998047, "global_step": 279796, "epoch": 2312} {"train_loss": -41.03880310058594, "global_step": 279797, "epoch": 2312} {"train_loss": -41.55181884765625, "global_step": 279798, "epoch": 2312} {"train_loss": -41.856754302978516, "global_step": 279799, "epoch": 2312} {"train_loss": -40.72343063354492, "global_step": 279800, "epoch": 2312} {"train_loss": -42.416439056396484, "global_step": 279801, "epoch": 2312} {"train_loss": -41.38340377807617, "global_step": 279802, "epoch": 2312} {"train_loss": -40.215179443359375, "global_step": 279803, "epoch": 2312} {"train_loss": -42.93634796142578, "global_step": 279804, "epoch": 2312} {"train_loss": -41.22428894042969, "global_step": 279805, "epoch": 2312} {"train_loss": -41.6977653503418, "global_step": 279806, "epoch": 2312} {"train_loss": -42.23357391357422, "global_step": 279807, "epoch": 2312} {"train_loss": -41.21029281616211, "global_step": 279808, "epoch": 2312} {"train_loss": -42.79990768432617, "global_step": 279809, "epoch": 2312} {"train_loss": -41.437049865722656, "global_step": 279810, "epoch": 2312} {"train_loss": -42.97711181640625, "global_step": 279811, "epoch": 2312} {"train_loss": -41.008235931396484, "global_step": 279812, "epoch": 2312} {"train_loss": -41.247283935546875, "global_step": 279813, "epoch": 2312} {"train_loss": -42.76691818237305, "global_step": 279814, "epoch": 2312} {"train_loss": -41.41630554199219, "global_step": 279815, "epoch": 2312} {"train_loss": -42.6508903503418, "global_step": 279816, "epoch": 2312} {"train_loss": -41.533241271972656, "global_step": 279817, "epoch": 2312} {"train_loss": -41.606258392333984, "global_step": 279818, "epoch": 2312} {"train_loss": -41.616058349609375, "global_step": 279819, "epoch": 2312} {"train_loss": -42.28933334350586, "global_step": 279820, "epoch": 2312} {"train_loss": -41.873653411865234, "global_step": 279821, "epoch": 2312} {"train_loss": -42.456298828125, "global_step": 279822, "epoch": 2312} {"train_loss": -42.64044189453125, "global_step": 279823, "epoch": 2312} {"train_loss": -42.819183349609375, "global_step": 279824, "epoch": 2312} {"train_loss": -42.05152893066406, "global_step": 279825, "epoch": 2312} {"train_loss": -42.0541877746582, "global_step": 279826, "epoch": 2312} {"train_loss": -42.308189392089844, "global_step": 279827, "epoch": 2312} {"train_loss": -42.84644317626953, "global_step": 279828, "epoch": 2312} {"train_loss": -42.487361907958984, "global_step": 279829, "epoch": 2312} {"train_loss": -42.59083938598633, "global_step": 279830, "epoch": 2312} {"train_loss": -42.51902389526367, "global_step": 279831, "epoch": 2312} {"train_loss": -43.25323486328125, "global_step": 279832, "epoch": 2312} {"train_loss": -42.322418212890625, "global_step": 279833, "epoch": 2312} {"train_loss": -43.210811614990234, "global_step": 279834, "epoch": 2312} {"train_loss": -43.18388748168945, "global_step": 279835, "epoch": 2312} {"train_loss": -43.37828826904297, "global_step": 279836, "epoch": 2312} {"train_loss": -42.6079216003418, "global_step": 279837, "epoch": 2312} {"train_loss": -43.35073471069336, "global_step": 279838, "epoch": 2312} {"train_loss": -42.79578399658203, "global_step": 279839, "epoch": 2312} {"train_loss": -43.64378356933594, "global_step": 279840, "epoch": 2312} {"train_loss": -42.52864074707031, "global_step": 279841, "epoch": 2312} {"train_loss": -42.6848030090332, "global_step": 279842, "epoch": 2312} {"train_loss": -42.403076171875, "global_step": 279843, "epoch": 2312} {"train_loss": -42.9752082824707, "global_step": 279844, "epoch": 2312} {"train_loss": -43.71453094482422, "global_step": 279845, "epoch": 2312} {"train_loss": -42.46644973754883, "global_step": 279846, "epoch": 2312} {"train_loss": -43.061737060546875, "global_step": 279847, "epoch": 2312} {"train_loss": -42.552825927734375, "global_step": 279848, "epoch": 2312} {"train_loss": -42.82942581176758, "global_step": 279849, "epoch": 2312} {"train_loss": -42.58586502075195, "global_step": 279850, "epoch": 2312} {"train_loss": -42.81568145751953, "global_step": 279851, "epoch": 2312} {"train_loss": -42.33156204223633, "global_step": 279852, "epoch": 2312} {"train_loss": -42.905494689941406, "global_step": 279853, "epoch": 2312} {"train_loss": -43.04494857788086, "global_step": 279854, "epoch": 2312} {"train_loss": -42.13497543334961, "global_step": 279855, "epoch": 2312} {"train_loss": -43.10087966918945, "global_step": 279856, "epoch": 2312} {"train_loss": -43.07624435424805, "global_step": 279857, "epoch": 2312} {"train_loss": -43.79688262939453, "global_step": 279858, "epoch": 2312} {"train_loss": -42.837974548339844, "global_step": 279859, "epoch": 2312} {"train_loss": -42.750362396240234, "global_step": 279860, "epoch": 2312} {"train_loss": -43.36772918701172, "global_step": 279861, "epoch": 2312} {"train_loss": -43.36588668823242, "global_step": 279862, "epoch": 2312} {"train_loss": -43.05591583251953, "global_step": 279863, "epoch": 2312} {"train_loss": -43.57624053955078, "global_step": 279864, "epoch": 2312} {"train_loss": -43.128074645996094, "global_step": 279865, "epoch": 2312} {"train_loss": -43.31733322143555, "global_step": 279866, "epoch": 2312} {"train_loss": -43.364837646484375, "global_step": 279867, "epoch": 2312} {"train_loss": -42.98142623901367, "global_step": 279868, "epoch": 2312} {"train_loss": -43.061092376708984, "global_step": 279869, "epoch": 2312} {"train_loss": -42.93906784057617, "global_step": 279870, "epoch": 2312} {"train_loss": -43.01225662231445, "global_step": 279871, "epoch": 2312} {"train_loss": -42.10338955083169, "global_step": 279872, "epoch": 2312, "val_loss": 2476894.5} {"train_loss": -43.24544906616211, "global_step": 279873, "epoch": 2313} {"train_loss": -42.387943267822266, "global_step": 279874, "epoch": 2313} {"train_loss": -41.63090896606445, "global_step": 279875, "epoch": 2313} {"train_loss": -42.28564453125, "global_step": 279876, "epoch": 2313} {"train_loss": -43.25471115112305, "global_step": 279877, "epoch": 2313} {"train_loss": -42.509090423583984, "global_step": 279878, "epoch": 2313} {"train_loss": -39.96710205078125, "global_step": 279879, "epoch": 2313} {"train_loss": -40.91895294189453, "global_step": 279880, "epoch": 2313} {"train_loss": -42.45572280883789, "global_step": 279881, "epoch": 2313} {"train_loss": -41.74003219604492, "global_step": 279882, "epoch": 2313} {"train_loss": -41.26613235473633, "global_step": 279883, "epoch": 2313} {"train_loss": -40.326107025146484, "global_step": 279884, "epoch": 2313} {"train_loss": -40.640316009521484, "global_step": 279885, "epoch": 2313} {"train_loss": -40.805538177490234, "global_step": 279886, "epoch": 2313} {"train_loss": -40.871761322021484, "global_step": 279887, "epoch": 2313} {"train_loss": -41.149208068847656, "global_step": 279888, "epoch": 2313} {"train_loss": -41.705562591552734, "global_step": 279889, "epoch": 2313} {"train_loss": -41.08933639526367, "global_step": 279890, "epoch": 2313} {"train_loss": -41.94103240966797, "global_step": 279891, "epoch": 2313} {"train_loss": -41.2224235534668, "global_step": 279892, "epoch": 2313} {"train_loss": -42.4946403503418, "global_step": 279893, "epoch": 2313} {"train_loss": -41.47860336303711, "global_step": 279894, "epoch": 2313} {"train_loss": -41.824493408203125, "global_step": 279895, "epoch": 2313} {"train_loss": -42.00275421142578, "global_step": 279896, "epoch": 2313} {"train_loss": -41.99886703491211, "global_step": 279897, "epoch": 2313} {"train_loss": -42.117347717285156, "global_step": 279898, "epoch": 2313} {"train_loss": -42.357452392578125, "global_step": 279899, "epoch": 2313} {"train_loss": -40.74837112426758, "global_step": 279900, "epoch": 2313} {"train_loss": -42.11091232299805, "global_step": 279901, "epoch": 2313} {"train_loss": -41.75673294067383, "global_step": 279902, "epoch": 2313} {"train_loss": -42.2506103515625, "global_step": 279903, "epoch": 2313} {"train_loss": -41.004859924316406, "global_step": 279904, "epoch": 2313} {"train_loss": -42.61338424682617, "global_step": 279905, "epoch": 2313} {"train_loss": -41.3989372253418, "global_step": 279906, "epoch": 2313} {"train_loss": -41.39899826049805, "global_step": 279907, "epoch": 2313} {"train_loss": -41.473018646240234, "global_step": 279908, "epoch": 2313} {"train_loss": -41.4046516418457, "global_step": 279909, "epoch": 2313} {"train_loss": -40.56953048706055, "global_step": 279910, "epoch": 2313} {"train_loss": -42.28607940673828, "global_step": 279911, "epoch": 2313} {"train_loss": -40.23732376098633, "global_step": 279912, "epoch": 2313} {"train_loss": -41.27317428588867, "global_step": 279913, "epoch": 2313} {"train_loss": -41.53276062011719, "global_step": 279914, "epoch": 2313} {"train_loss": -40.38639450073242, "global_step": 279915, "epoch": 2313} {"train_loss": -41.68931198120117, "global_step": 279916, "epoch": 2313} {"train_loss": -40.11223220825195, "global_step": 279917, "epoch": 2313} {"train_loss": -41.170204162597656, "global_step": 279918, "epoch": 2313} {"train_loss": -41.19762420654297, "global_step": 279919, "epoch": 2313} {"train_loss": -41.35160446166992, "global_step": 279920, "epoch": 2313} {"train_loss": -41.29791259765625, "global_step": 279921, "epoch": 2313} {"train_loss": -42.457855224609375, "global_step": 279922, "epoch": 2313} {"train_loss": -41.2347526550293, "global_step": 279923, "epoch": 2313} {"train_loss": -41.4528923034668, "global_step": 279924, "epoch": 2313} {"train_loss": -41.71159744262695, "global_step": 279925, "epoch": 2313} {"train_loss": -41.67191696166992, "global_step": 279926, "epoch": 2313} {"train_loss": -42.38250732421875, "global_step": 279927, "epoch": 2313} {"train_loss": -41.48495101928711, "global_step": 279928, "epoch": 2313} {"train_loss": -42.74049758911133, "global_step": 279929, "epoch": 2313} {"train_loss": -41.50386428833008, "global_step": 279930, "epoch": 2313} {"train_loss": -42.8132438659668, "global_step": 279931, "epoch": 2313} {"train_loss": -42.22152328491211, "global_step": 279932, "epoch": 2313} {"train_loss": -42.27737045288086, "global_step": 279933, "epoch": 2313} {"train_loss": -42.402069091796875, "global_step": 279934, "epoch": 2313} {"train_loss": -41.7059440612793, "global_step": 279935, "epoch": 2313} {"train_loss": -43.06763458251953, "global_step": 279936, "epoch": 2313} {"train_loss": -42.447792053222656, "global_step": 279937, "epoch": 2313} {"train_loss": -43.237548828125, "global_step": 279938, "epoch": 2313} {"train_loss": -42.78253173828125, "global_step": 279939, "epoch": 2313} {"train_loss": -41.9393310546875, "global_step": 279940, "epoch": 2313} {"train_loss": -43.316436767578125, "global_step": 279941, "epoch": 2313} {"train_loss": -42.688026428222656, "global_step": 279942, "epoch": 2313} {"train_loss": -42.867164611816406, "global_step": 279943, "epoch": 2313} {"train_loss": -42.640743255615234, "global_step": 279944, "epoch": 2313} {"train_loss": -43.12005615234375, "global_step": 279945, "epoch": 2313} {"train_loss": -43.231483459472656, "global_step": 279946, "epoch": 2313} {"train_loss": -43.02543258666992, "global_step": 279947, "epoch": 2313} {"train_loss": -43.02702331542969, "global_step": 279948, "epoch": 2313} {"train_loss": -42.64109420776367, "global_step": 279949, "epoch": 2313} {"train_loss": -43.021671295166016, "global_step": 279950, "epoch": 2313} {"train_loss": -43.19855880737305, "global_step": 279951, "epoch": 2313} {"train_loss": -43.27996826171875, "global_step": 279952, "epoch": 2313} {"train_loss": -43.10145568847656, "global_step": 279953, "epoch": 2313} {"train_loss": -43.45951461791992, "global_step": 279954, "epoch": 2313} {"train_loss": -43.38767623901367, "global_step": 279955, "epoch": 2313} {"train_loss": -43.25550079345703, "global_step": 279956, "epoch": 2313} {"train_loss": -43.30158996582031, "global_step": 279957, "epoch": 2313} {"train_loss": -43.34536361694336, "global_step": 279958, "epoch": 2313} {"train_loss": -43.12364196777344, "global_step": 279959, "epoch": 2313} {"train_loss": -43.56310272216797, "global_step": 279960, "epoch": 2313} {"train_loss": -43.39403533935547, "global_step": 279961, "epoch": 2313} {"train_loss": -43.22505569458008, "global_step": 279962, "epoch": 2313} {"train_loss": -43.451900482177734, "global_step": 279963, "epoch": 2313} {"train_loss": -44.223873138427734, "global_step": 279964, "epoch": 2313} {"train_loss": -43.352474212646484, "global_step": 279965, "epoch": 2313} {"train_loss": -43.94260787963867, "global_step": 279966, "epoch": 2313} {"train_loss": -43.88276290893555, "global_step": 279967, "epoch": 2313} {"train_loss": -43.66434860229492, "global_step": 279968, "epoch": 2313} {"train_loss": -43.50423049926758, "global_step": 279969, "epoch": 2313} {"train_loss": -43.50274658203125, "global_step": 279970, "epoch": 2313} {"train_loss": -43.62581253051758, "global_step": 279971, "epoch": 2313} {"train_loss": -43.405967712402344, "global_step": 279972, "epoch": 2313} {"train_loss": -43.832698822021484, "global_step": 279973, "epoch": 2313} {"train_loss": -42.901512145996094, "global_step": 279974, "epoch": 2313} {"train_loss": -43.614501953125, "global_step": 279975, "epoch": 2313} {"train_loss": -43.22575759887695, "global_step": 279976, "epoch": 2313} {"train_loss": -43.37236404418945, "global_step": 279977, "epoch": 2313} {"train_loss": -43.2224235534668, "global_step": 279978, "epoch": 2313} {"train_loss": -43.994022369384766, "global_step": 279979, "epoch": 2313} {"train_loss": -43.30668258666992, "global_step": 279980, "epoch": 2313} {"train_loss": -43.31415939331055, "global_step": 279981, "epoch": 2313} {"train_loss": -43.09077835083008, "global_step": 279982, "epoch": 2313} {"train_loss": -42.3535041809082, "global_step": 279983, "epoch": 2313} {"train_loss": -43.187774658203125, "global_step": 279984, "epoch": 2313} {"train_loss": -43.154266357421875, "global_step": 279985, "epoch": 2313} {"train_loss": -43.985877990722656, "global_step": 279986, "epoch": 2313} {"train_loss": -43.72245788574219, "global_step": 279987, "epoch": 2313} {"train_loss": -43.13173294067383, "global_step": 279988, "epoch": 2313} {"train_loss": -42.19942092895508, "global_step": 279989, "epoch": 2313} {"train_loss": -41.552650451660156, "global_step": 279990, "epoch": 2313} {"train_loss": -42.54853820800781, "global_step": 279991, "epoch": 2313} {"train_loss": -42.86800003051758, "global_step": 279992, "epoch": 2313} {"train_loss": -42.3721792047674, "global_step": 279993, "epoch": 2313, "val_loss": 2499287.0} {"train_loss": -41.981964111328125, "global_step": 279994, "epoch": 2314} {"train_loss": -42.6033821105957, "global_step": 279995, "epoch": 2314} {"train_loss": -41.63779830932617, "global_step": 279996, "epoch": 2314} {"train_loss": -42.273502349853516, "global_step": 279997, "epoch": 2314} {"train_loss": -42.562957763671875, "global_step": 279998, "epoch": 2314} {"train_loss": -40.19343185424805, "global_step": 279999, "epoch": 2314} {"train_loss": -43.47011947631836, "global_step": 280000, "epoch": 2314} {"train_loss": -42.93845748901367, "global_step": 280001, "epoch": 2314} {"train_loss": -42.787811279296875, "global_step": 280002, "epoch": 2314} {"train_loss": -42.26841735839844, "global_step": 280003, "epoch": 2314} {"train_loss": -40.64996337890625, "global_step": 280004, "epoch": 2314} {"train_loss": -42.74318313598633, "global_step": 280005, "epoch": 2314} {"train_loss": -43.58171463012695, "global_step": 280006, "epoch": 2314} {"train_loss": -43.0595703125, "global_step": 280007, "epoch": 2314} {"train_loss": -39.17490768432617, "global_step": 280008, "epoch": 2314} {"train_loss": -40.18857192993164, "global_step": 280009, "epoch": 2314} {"train_loss": -37.27973556518555, "global_step": 280010, "epoch": 2314} {"train_loss": -43.07598114013672, "global_step": 280011, "epoch": 2314} {"train_loss": -36.68381118774414, "global_step": 280012, "epoch": 2314} {"train_loss": -40.266632080078125, "global_step": 280013, "epoch": 2314} {"train_loss": -41.931190490722656, "global_step": 280014, "epoch": 2314} {"train_loss": -40.87358093261719, "global_step": 280015, "epoch": 2314} {"train_loss": -38.524932861328125, "global_step": 280016, "epoch": 2314} {"train_loss": -41.76717758178711, "global_step": 280017, "epoch": 2314} {"train_loss": -42.30133819580078, "global_step": 280018, "epoch": 2314} {"train_loss": -28.35944938659668, "global_step": 280019, "epoch": 2314} {"train_loss": -32.22605514526367, "global_step": 280020, "epoch": 2314} {"train_loss": -40.1560173034668, "global_step": 280021, "epoch": 2314} {"train_loss": -40.597164154052734, "global_step": 280022, "epoch": 2314} {"train_loss": -36.651309967041016, "global_step": 280023, "epoch": 2314} {"train_loss": -41.17343521118164, "global_step": 280024, "epoch": 2314} {"train_loss": -37.17822265625, "global_step": 280025, "epoch": 2314} {"train_loss": -38.04813003540039, "global_step": 280026, "epoch": 2314} {"train_loss": -37.40509796142578, "global_step": 280027, "epoch": 2314} {"train_loss": -38.7558479309082, "global_step": 280028, "epoch": 2314} {"train_loss": -38.28164291381836, "global_step": 280029, "epoch": 2314} {"train_loss": -37.07869338989258, "global_step": 280030, "epoch": 2314} {"train_loss": -39.85786819458008, "global_step": 280031, "epoch": 2314} {"train_loss": -39.64134979248047, "global_step": 280032, "epoch": 2314} {"train_loss": -35.804264068603516, "global_step": 280033, "epoch": 2314} {"train_loss": -32.295162200927734, "global_step": 280034, "epoch": 2314} {"train_loss": -39.907474517822266, "global_step": 280035, "epoch": 2314} {"train_loss": -40.95164108276367, "global_step": 280036, "epoch": 2314} {"train_loss": -41.171382904052734, "global_step": 280037, "epoch": 2314} {"train_loss": -39.0064582824707, "global_step": 280038, "epoch": 2314} {"train_loss": -39.55442428588867, "global_step": 280039, "epoch": 2314} {"train_loss": -39.7365837097168, "global_step": 280040, "epoch": 2314} {"train_loss": -35.8315315246582, "global_step": 280041, "epoch": 2314} {"train_loss": -38.011043548583984, "global_step": 280042, "epoch": 2314} {"train_loss": -38.6997184753418, "global_step": 280043, "epoch": 2314} {"train_loss": -38.088714599609375, "global_step": 280044, "epoch": 2314} {"train_loss": -38.5693359375, "global_step": 280045, "epoch": 2314} {"train_loss": -37.375240325927734, "global_step": 280046, "epoch": 2314} {"train_loss": -40.296390533447266, "global_step": 280047, "epoch": 2314} {"train_loss": -41.82160568237305, "global_step": 280048, "epoch": 2314} {"train_loss": -30.7092342376709, "global_step": 280049, "epoch": 2314} {"train_loss": -37.33050537109375, "global_step": 280050, "epoch": 2314} {"train_loss": -40.904327392578125, "global_step": 280051, "epoch": 2314} {"train_loss": -37.24007797241211, "global_step": 280052, "epoch": 2314} {"train_loss": -40.89858627319336, "global_step": 280053, "epoch": 2314} {"train_loss": -37.757423400878906, "global_step": 280054, "epoch": 2314} {"train_loss": -40.60704803466797, "global_step": 280055, "epoch": 2314} {"train_loss": -39.3353157043457, "global_step": 280056, "epoch": 2314} {"train_loss": -38.6053581237793, "global_step": 280057, "epoch": 2314} {"train_loss": -40.97947311401367, "global_step": 280058, "epoch": 2314} {"train_loss": -39.95528793334961, "global_step": 280059, "epoch": 2314} {"train_loss": -40.54518508911133, "global_step": 280060, "epoch": 2314} {"train_loss": -38.94736862182617, "global_step": 280061, "epoch": 2314} {"train_loss": -40.063262939453125, "global_step": 280062, "epoch": 2314} {"train_loss": -40.809993743896484, "global_step": 280063, "epoch": 2314} {"train_loss": -40.092262268066406, "global_step": 280064, "epoch": 2314} {"train_loss": -39.90401840209961, "global_step": 280065, "epoch": 2314} {"train_loss": -41.60136032104492, "global_step": 280066, "epoch": 2314} {"train_loss": -37.43804168701172, "global_step": 280067, "epoch": 2314} {"train_loss": -41.49336624145508, "global_step": 280068, "epoch": 2314} {"train_loss": -41.093223571777344, "global_step": 280069, "epoch": 2314} {"train_loss": -41.80432891845703, "global_step": 280070, "epoch": 2314} {"train_loss": -40.7953987121582, "global_step": 280071, "epoch": 2314} {"train_loss": -40.35831832885742, "global_step": 280072, "epoch": 2314} {"train_loss": -41.34823226928711, "global_step": 280073, "epoch": 2314} {"train_loss": -41.25988006591797, "global_step": 280074, "epoch": 2314} {"train_loss": -41.82548141479492, "global_step": 280075, "epoch": 2314} {"train_loss": -40.09029006958008, "global_step": 280076, "epoch": 2314} {"train_loss": -39.46216583251953, "global_step": 280077, "epoch": 2314} {"train_loss": -40.90726852416992, "global_step": 280078, "epoch": 2314} {"train_loss": -38.751808166503906, "global_step": 280079, "epoch": 2314} {"train_loss": -41.97037124633789, "global_step": 280080, "epoch": 2314} {"train_loss": -39.16463851928711, "global_step": 280081, "epoch": 2314} {"train_loss": -41.18609619140625, "global_step": 280082, "epoch": 2314} {"train_loss": -42.01681137084961, "global_step": 280083, "epoch": 2314} {"train_loss": -40.47737503051758, "global_step": 280084, "epoch": 2314} {"train_loss": -41.645877838134766, "global_step": 280085, "epoch": 2314} {"train_loss": -42.07781982421875, "global_step": 280086, "epoch": 2314} {"train_loss": -41.88975524902344, "global_step": 280087, "epoch": 2314} {"train_loss": -41.000160217285156, "global_step": 280088, "epoch": 2314} {"train_loss": -41.515594482421875, "global_step": 280089, "epoch": 2314} {"train_loss": -41.45114517211914, "global_step": 280090, "epoch": 2314} {"train_loss": -41.3497428894043, "global_step": 280091, "epoch": 2314} {"train_loss": -41.100921630859375, "global_step": 280092, "epoch": 2314} {"train_loss": -42.15087127685547, "global_step": 280093, "epoch": 2314} {"train_loss": -41.5848503112793, "global_step": 280094, "epoch": 2314} {"train_loss": -41.4369010925293, "global_step": 280095, "epoch": 2314} {"train_loss": -41.528316497802734, "global_step": 280096, "epoch": 2314} {"train_loss": -42.89620590209961, "global_step": 280097, "epoch": 2314} {"train_loss": -39.779754638671875, "global_step": 280098, "epoch": 2314} {"train_loss": -41.97129440307617, "global_step": 280099, "epoch": 2314} {"train_loss": -41.80670928955078, "global_step": 280100, "epoch": 2314} {"train_loss": -41.059104919433594, "global_step": 280101, "epoch": 2314} {"train_loss": -42.24238586425781, "global_step": 280102, "epoch": 2314} {"train_loss": -42.39570236206055, "global_step": 280103, "epoch": 2314} {"train_loss": -40.02398681640625, "global_step": 280104, "epoch": 2314} {"train_loss": -42.848838806152344, "global_step": 280105, "epoch": 2314} {"train_loss": -42.333160400390625, "global_step": 280106, "epoch": 2314} {"train_loss": -42.614070892333984, "global_step": 280107, "epoch": 2314} {"train_loss": -41.9673957824707, "global_step": 280108, "epoch": 2314} {"train_loss": -42.66860580444336, "global_step": 280109, "epoch": 2314} {"train_loss": -42.07637405395508, "global_step": 280110, "epoch": 2314} {"train_loss": -42.80533981323242, "global_step": 280111, "epoch": 2314} {"train_loss": -42.372989654541016, "global_step": 280112, "epoch": 2314} {"train_loss": -42.30413818359375, "global_step": 280113, "epoch": 2314} {"train_loss": -40.25346560517618, "global_step": 280114, "epoch": 2314, "val_loss": 2469118.0} {"train_loss": -42.391845703125, "global_step": 280115, "epoch": 2315} {"train_loss": -42.674530029296875, "global_step": 280116, "epoch": 2315} {"train_loss": -42.40361785888672, "global_step": 280117, "epoch": 2315} {"train_loss": -42.45291519165039, "global_step": 280118, "epoch": 2315} {"train_loss": -42.182464599609375, "global_step": 280119, "epoch": 2315} {"train_loss": -42.05399703979492, "global_step": 280120, "epoch": 2315} {"train_loss": -42.91486358642578, "global_step": 280121, "epoch": 2315} {"train_loss": -42.3641471862793, "global_step": 280122, "epoch": 2315} {"train_loss": -42.025718688964844, "global_step": 280123, "epoch": 2315} {"train_loss": -40.905303955078125, "global_step": 280124, "epoch": 2315} {"train_loss": -41.22553253173828, "global_step": 280125, "epoch": 2315} {"train_loss": -42.31980514526367, "global_step": 280126, "epoch": 2315} {"train_loss": -42.164730072021484, "global_step": 280127, "epoch": 2315} {"train_loss": -41.73005294799805, "global_step": 280128, "epoch": 2315} {"train_loss": -42.96720504760742, "global_step": 280129, "epoch": 2315} {"train_loss": -43.082000732421875, "global_step": 280130, "epoch": 2315} {"train_loss": -42.85013961791992, "global_step": 280131, "epoch": 2315} {"train_loss": -42.76223373413086, "global_step": 280132, "epoch": 2315} {"train_loss": -42.4428825378418, "global_step": 280133, "epoch": 2315} {"train_loss": -42.6400032043457, "global_step": 280134, "epoch": 2315} {"train_loss": -43.40772247314453, "global_step": 280135, "epoch": 2315} {"train_loss": -43.18972396850586, "global_step": 280136, "epoch": 2315} {"train_loss": -42.77299499511719, "global_step": 280137, "epoch": 2315} {"train_loss": -43.14702224731445, "global_step": 280138, "epoch": 2315} {"train_loss": -43.4368782043457, "global_step": 280139, "epoch": 2315} {"train_loss": -43.03145980834961, "global_step": 280140, "epoch": 2315} {"train_loss": -42.98210906982422, "global_step": 280141, "epoch": 2315} {"train_loss": -41.83604049682617, "global_step": 280142, "epoch": 2315} {"train_loss": -43.66045379638672, "global_step": 280143, "epoch": 2315} {"train_loss": -43.23571014404297, "global_step": 280144, "epoch": 2315} {"train_loss": -41.379390716552734, "global_step": 280145, "epoch": 2315} {"train_loss": -43.021968841552734, "global_step": 280146, "epoch": 2315} {"train_loss": -42.649505615234375, "global_step": 280147, "epoch": 2315} {"train_loss": -43.05323791503906, "global_step": 280148, "epoch": 2315} {"train_loss": -42.7343864440918, "global_step": 280149, "epoch": 2315} {"train_loss": -41.79081344604492, "global_step": 280150, "epoch": 2315} {"train_loss": -43.20648956298828, "global_step": 280151, "epoch": 2315} {"train_loss": -43.30628204345703, "global_step": 280152, "epoch": 2315} {"train_loss": -42.41141891479492, "global_step": 280153, "epoch": 2315} {"train_loss": -43.36201095581055, "global_step": 280154, "epoch": 2315} {"train_loss": -43.29764175415039, "global_step": 280155, "epoch": 2315} {"train_loss": -41.239952087402344, "global_step": 280156, "epoch": 2315} {"train_loss": -42.7700309753418, "global_step": 280157, "epoch": 2315} {"train_loss": -43.12700271606445, "global_step": 280158, "epoch": 2315} {"train_loss": -41.966487884521484, "global_step": 280159, "epoch": 2315} {"train_loss": -43.33663558959961, "global_step": 280160, "epoch": 2315} {"train_loss": -42.292640686035156, "global_step": 280161, "epoch": 2315} {"train_loss": -42.462677001953125, "global_step": 280162, "epoch": 2315} {"train_loss": -42.5037841796875, "global_step": 280163, "epoch": 2315} {"train_loss": -42.166656494140625, "global_step": 280164, "epoch": 2315} {"train_loss": -43.29325866699219, "global_step": 280165, "epoch": 2315} {"train_loss": -42.666011810302734, "global_step": 280166, "epoch": 2315} {"train_loss": -41.97719192504883, "global_step": 280167, "epoch": 2315} {"train_loss": -42.48432540893555, "global_step": 280168, "epoch": 2315} {"train_loss": -42.4842643737793, "global_step": 280169, "epoch": 2315} {"train_loss": -43.043209075927734, "global_step": 280170, "epoch": 2315} {"train_loss": -42.97758865356445, "global_step": 280171, "epoch": 2315} {"train_loss": -41.84406661987305, "global_step": 280172, "epoch": 2315} {"train_loss": -42.736202239990234, "global_step": 280173, "epoch": 2315} {"train_loss": -43.1891975402832, "global_step": 280174, "epoch": 2315} {"train_loss": -42.9755973815918, "global_step": 280175, "epoch": 2315} {"train_loss": -41.858943939208984, "global_step": 280176, "epoch": 2315} {"train_loss": -42.949222564697266, "global_step": 280177, "epoch": 2315} {"train_loss": -43.039546966552734, "global_step": 280178, "epoch": 2315} {"train_loss": -41.855892181396484, "global_step": 280179, "epoch": 2315} {"train_loss": -42.21122360229492, "global_step": 280180, "epoch": 2315} {"train_loss": -41.225013732910156, "global_step": 280181, "epoch": 2315} {"train_loss": -40.865509033203125, "global_step": 280182, "epoch": 2315} {"train_loss": -41.014583587646484, "global_step": 280183, "epoch": 2315} {"train_loss": -41.7701416015625, "global_step": 280184, "epoch": 2315} {"train_loss": -41.64227294921875, "global_step": 280185, "epoch": 2315} {"train_loss": -41.84182357788086, "global_step": 280186, "epoch": 2315} {"train_loss": -42.56657791137695, "global_step": 280187, "epoch": 2315} {"train_loss": -42.23268508911133, "global_step": 280188, "epoch": 2315} {"train_loss": -42.72343826293945, "global_step": 280189, "epoch": 2315} {"train_loss": -42.35392379760742, "global_step": 280190, "epoch": 2315} {"train_loss": -42.48305130004883, "global_step": 280191, "epoch": 2315} {"train_loss": -42.850067138671875, "global_step": 280192, "epoch": 2315} {"train_loss": -42.19812774658203, "global_step": 280193, "epoch": 2315} {"train_loss": -42.60436248779297, "global_step": 280194, "epoch": 2315} {"train_loss": -40.678443908691406, "global_step": 280195, "epoch": 2315} {"train_loss": -39.607383728027344, "global_step": 280196, "epoch": 2315} {"train_loss": -43.39847946166992, "global_step": 280197, "epoch": 2315} {"train_loss": -40.67863464355469, "global_step": 280198, "epoch": 2315} {"train_loss": -41.64272689819336, "global_step": 280199, "epoch": 2315} {"train_loss": -41.80643844604492, "global_step": 280200, "epoch": 2315} {"train_loss": -41.67946243286133, "global_step": 280201, "epoch": 2315} {"train_loss": -40.89875411987305, "global_step": 280202, "epoch": 2315} {"train_loss": -40.6285514831543, "global_step": 280203, "epoch": 2315} {"train_loss": -42.40821075439453, "global_step": 280204, "epoch": 2315} {"train_loss": -40.38125228881836, "global_step": 280205, "epoch": 2315} {"train_loss": -38.66294860839844, "global_step": 280206, "epoch": 2315} {"train_loss": -39.27253341674805, "global_step": 280207, "epoch": 2315} {"train_loss": -38.0252799987793, "global_step": 280208, "epoch": 2315} {"train_loss": -40.30585479736328, "global_step": 280209, "epoch": 2315} {"train_loss": -40.17679977416992, "global_step": 280210, "epoch": 2315} {"train_loss": -41.15444564819336, "global_step": 280211, "epoch": 2315} {"train_loss": -41.427215576171875, "global_step": 280212, "epoch": 2315} {"train_loss": -40.922176361083984, "global_step": 280213, "epoch": 2315} {"train_loss": -40.811092376708984, "global_step": 280214, "epoch": 2315} {"train_loss": -40.34159469604492, "global_step": 280215, "epoch": 2315} {"train_loss": -41.484962463378906, "global_step": 280216, "epoch": 2315} {"train_loss": -40.5333366394043, "global_step": 280217, "epoch": 2315} {"train_loss": -40.57722091674805, "global_step": 280218, "epoch": 2315} {"train_loss": -41.28813171386719, "global_step": 280219, "epoch": 2315} {"train_loss": -41.675289154052734, "global_step": 280220, "epoch": 2315} {"train_loss": -41.52768325805664, "global_step": 280221, "epoch": 2315} {"train_loss": -41.02993392944336, "global_step": 280222, "epoch": 2315} {"train_loss": -40.93941116333008, "global_step": 280223, "epoch": 2315} {"train_loss": -41.38616180419922, "global_step": 280224, "epoch": 2315} {"train_loss": -42.54024124145508, "global_step": 280225, "epoch": 2315} {"train_loss": -41.127052307128906, "global_step": 280226, "epoch": 2315} {"train_loss": -37.34651184082031, "global_step": 280227, "epoch": 2315} {"train_loss": -39.0826301574707, "global_step": 280228, "epoch": 2315} {"train_loss": -41.1756706237793, "global_step": 280229, "epoch": 2315} {"train_loss": -41.99984359741211, "global_step": 280230, "epoch": 2315} {"train_loss": -41.340877532958984, "global_step": 280231, "epoch": 2315} {"train_loss": -39.96122360229492, "global_step": 280232, "epoch": 2315} {"train_loss": -40.36736297607422, "global_step": 280233, "epoch": 2315} {"train_loss": -41.80159378051758, "global_step": 280234, "epoch": 2315} {"train_loss": -41.91995018572847, "global_step": 280235, "epoch": 2315, "val_loss": 2382146.25} {"train_loss": -40.5159797668457, "global_step": 280236, "epoch": 2316} {"train_loss": -38.58852767944336, "global_step": 280237, "epoch": 2316} {"train_loss": -41.75006866455078, "global_step": 280238, "epoch": 2316} {"train_loss": -41.55305862426758, "global_step": 280239, "epoch": 2316} {"train_loss": -41.91626739501953, "global_step": 280240, "epoch": 2316} {"train_loss": -42.42805099487305, "global_step": 280241, "epoch": 2316} {"train_loss": -41.76898193359375, "global_step": 280242, "epoch": 2316} {"train_loss": -42.4724006652832, "global_step": 280243, "epoch": 2316} {"train_loss": -41.94389724731445, "global_step": 280244, "epoch": 2316} {"train_loss": -42.614479064941406, "global_step": 280245, "epoch": 2316} {"train_loss": -42.85319137573242, "global_step": 280246, "epoch": 2316} {"train_loss": -42.38594436645508, "global_step": 280247, "epoch": 2316} {"train_loss": -42.002166748046875, "global_step": 280248, "epoch": 2316} {"train_loss": -41.603084564208984, "global_step": 280249, "epoch": 2316} {"train_loss": -42.27675247192383, "global_step": 280250, "epoch": 2316} {"train_loss": -42.3150749206543, "global_step": 280251, "epoch": 2316} {"train_loss": -42.28702926635742, "global_step": 280252, "epoch": 2316} {"train_loss": -42.52303695678711, "global_step": 280253, "epoch": 2316} {"train_loss": -42.39723587036133, "global_step": 280254, "epoch": 2316} {"train_loss": -42.10557556152344, "global_step": 280255, "epoch": 2316} {"train_loss": -42.26954650878906, "global_step": 280256, "epoch": 2316} {"train_loss": -42.45212173461914, "global_step": 280257, "epoch": 2316} {"train_loss": -42.86527633666992, "global_step": 280258, "epoch": 2316} {"train_loss": -42.929386138916016, "global_step": 280259, "epoch": 2316} {"train_loss": -42.62404251098633, "global_step": 280260, "epoch": 2316} {"train_loss": -42.746341705322266, "global_step": 280261, "epoch": 2316} {"train_loss": -42.790279388427734, "global_step": 280262, "epoch": 2316} {"train_loss": -39.76430130004883, "global_step": 280263, "epoch": 2316} {"train_loss": -43.1472282409668, "global_step": 280264, "epoch": 2316} {"train_loss": -42.24091720581055, "global_step": 280265, "epoch": 2316} {"train_loss": -43.02268600463867, "global_step": 280266, "epoch": 2316} {"train_loss": -42.98057556152344, "global_step": 280267, "epoch": 2316} {"train_loss": -42.81562042236328, "global_step": 280268, "epoch": 2316} {"train_loss": -43.494998931884766, "global_step": 280269, "epoch": 2316} {"train_loss": -43.43032455444336, "global_step": 280270, "epoch": 2316} {"train_loss": -43.54110336303711, "global_step": 280271, "epoch": 2316} {"train_loss": -43.483394622802734, "global_step": 280272, "epoch": 2316} {"train_loss": -43.600833892822266, "global_step": 280273, "epoch": 2316} {"train_loss": -43.59636306762695, "global_step": 280274, "epoch": 2316} {"train_loss": -42.21936798095703, "global_step": 280275, "epoch": 2316} {"train_loss": -43.90758514404297, "global_step": 280276, "epoch": 2316} {"train_loss": -43.45729064941406, "global_step": 280277, "epoch": 2316} {"train_loss": -42.11766052246094, "global_step": 280278, "epoch": 2316} {"train_loss": -43.303001403808594, "global_step": 280279, "epoch": 2316} {"train_loss": -43.038936614990234, "global_step": 280280, "epoch": 2316} {"train_loss": -43.24250411987305, "global_step": 280281, "epoch": 2316} {"train_loss": -43.17427444458008, "global_step": 280282, "epoch": 2316} {"train_loss": -41.92192459106445, "global_step": 280283, "epoch": 2316} {"train_loss": -43.657249450683594, "global_step": 280284, "epoch": 2316} {"train_loss": -43.4743537902832, "global_step": 280285, "epoch": 2316} {"train_loss": -43.382564544677734, "global_step": 280286, "epoch": 2316} {"train_loss": -42.993133544921875, "global_step": 280287, "epoch": 2316} {"train_loss": -43.34062957763672, "global_step": 280288, "epoch": 2316} {"train_loss": -43.67327880859375, "global_step": 280289, "epoch": 2316} {"train_loss": -43.64797592163086, "global_step": 280290, "epoch": 2316} {"train_loss": -43.42603302001953, "global_step": 280291, "epoch": 2316} {"train_loss": -42.59722137451172, "global_step": 280292, "epoch": 2316} {"train_loss": -42.503482818603516, "global_step": 280293, "epoch": 2316} {"train_loss": -43.87641525268555, "global_step": 280294, "epoch": 2316} {"train_loss": -42.75945281982422, "global_step": 280295, "epoch": 2316} {"train_loss": -42.26300048828125, "global_step": 280296, "epoch": 2316} {"train_loss": -41.807342529296875, "global_step": 280297, "epoch": 2316} {"train_loss": -42.057151794433594, "global_step": 280298, "epoch": 2316} {"train_loss": -42.81406784057617, "global_step": 280299, "epoch": 2316} {"train_loss": -42.4044189453125, "global_step": 280300, "epoch": 2316} {"train_loss": -43.43184280395508, "global_step": 280301, "epoch": 2316} {"train_loss": -40.85476303100586, "global_step": 280302, "epoch": 2316} {"train_loss": -41.67869186401367, "global_step": 280303, "epoch": 2316} {"train_loss": -41.87286376953125, "global_step": 280304, "epoch": 2316} {"train_loss": -42.95998001098633, "global_step": 280305, "epoch": 2316} {"train_loss": -42.69047164916992, "global_step": 280306, "epoch": 2316} {"train_loss": -43.026546478271484, "global_step": 280307, "epoch": 2316} {"train_loss": -42.70936965942383, "global_step": 280308, "epoch": 2316} {"train_loss": -43.452919006347656, "global_step": 280309, "epoch": 2316} {"train_loss": -43.27438735961914, "global_step": 280310, "epoch": 2316} {"train_loss": -43.27006912231445, "global_step": 280311, "epoch": 2316} {"train_loss": -43.02490234375, "global_step": 280312, "epoch": 2316} {"train_loss": -42.822696685791016, "global_step": 280313, "epoch": 2316} {"train_loss": -42.818084716796875, "global_step": 280314, "epoch": 2316} {"train_loss": -42.956661224365234, "global_step": 280315, "epoch": 2316} {"train_loss": -43.685333251953125, "global_step": 280316, "epoch": 2316} {"train_loss": -43.101688385009766, "global_step": 280317, "epoch": 2316} {"train_loss": -43.270023345947266, "global_step": 280318, "epoch": 2316} {"train_loss": -41.677146911621094, "global_step": 280319, "epoch": 2316} {"train_loss": -42.85833740234375, "global_step": 280320, "epoch": 2316} {"train_loss": -42.8768310546875, "global_step": 280321, "epoch": 2316} {"train_loss": -43.595088958740234, "global_step": 280322, "epoch": 2316} {"train_loss": -42.31455612182617, "global_step": 280323, "epoch": 2316} {"train_loss": -40.874019622802734, "global_step": 280324, "epoch": 2316} {"train_loss": -41.7491569519043, "global_step": 280325, "epoch": 2316} {"train_loss": -42.29603576660156, "global_step": 280326, "epoch": 2316} {"train_loss": -42.57755661010742, "global_step": 280327, "epoch": 2316} {"train_loss": -42.22231674194336, "global_step": 280328, "epoch": 2316} {"train_loss": -43.78704833984375, "global_step": 280329, "epoch": 2316} {"train_loss": -42.703670501708984, "global_step": 280330, "epoch": 2316} {"train_loss": -41.81783676147461, "global_step": 280331, "epoch": 2316} {"train_loss": -42.980796813964844, "global_step": 280332, "epoch": 2316} {"train_loss": -41.871273040771484, "global_step": 280333, "epoch": 2316} {"train_loss": -41.544952392578125, "global_step": 280334, "epoch": 2316} {"train_loss": -43.23102569580078, "global_step": 280335, "epoch": 2316} {"train_loss": -41.03480529785156, "global_step": 280336, "epoch": 2316} {"train_loss": -40.28449249267578, "global_step": 280337, "epoch": 2316} {"train_loss": -41.831298828125, "global_step": 280338, "epoch": 2316} {"train_loss": -40.37069320678711, "global_step": 280339, "epoch": 2316} {"train_loss": -40.38532257080078, "global_step": 280340, "epoch": 2316} {"train_loss": -41.34408187866211, "global_step": 280341, "epoch": 2316} {"train_loss": -42.10866928100586, "global_step": 280342, "epoch": 2316} {"train_loss": -42.162132263183594, "global_step": 280343, "epoch": 2316} {"train_loss": -41.48862838745117, "global_step": 280344, "epoch": 2316} {"train_loss": -40.13105010986328, "global_step": 280345, "epoch": 2316} {"train_loss": -42.72248077392578, "global_step": 280346, "epoch": 2316} {"train_loss": -41.29156494140625, "global_step": 280347, "epoch": 2316} {"train_loss": -43.225948333740234, "global_step": 280348, "epoch": 2316} {"train_loss": -41.35028076171875, "global_step": 280349, "epoch": 2316} {"train_loss": -38.159271240234375, "global_step": 280350, "epoch": 2316} {"train_loss": -39.313575744628906, "global_step": 280351, "epoch": 2316} {"train_loss": -37.717430114746094, "global_step": 280352, "epoch": 2316} {"train_loss": -41.01597595214844, "global_step": 280353, "epoch": 2316} {"train_loss": -37.93728256225586, "global_step": 280354, "epoch": 2316} {"train_loss": -42.02071762084961, "global_step": 280355, "epoch": 2316} {"train_loss": -42.295769652059256, "global_step": 280356, "epoch": 2316, "val_loss": 2376243.25} {"train_loss": -41.28986740112305, "global_step": 280357, "epoch": 2317} {"train_loss": -40.14556121826172, "global_step": 280358, "epoch": 2317} {"train_loss": -41.231258392333984, "global_step": 280359, "epoch": 2317} {"train_loss": -41.224910736083984, "global_step": 280360, "epoch": 2317} {"train_loss": -40.81558609008789, "global_step": 280361, "epoch": 2317} {"train_loss": -39.98223876953125, "global_step": 280362, "epoch": 2317} {"train_loss": -40.647674560546875, "global_step": 280363, "epoch": 2317} {"train_loss": -40.00122833251953, "global_step": 280364, "epoch": 2317} {"train_loss": -38.33477783203125, "global_step": 280365, "epoch": 2317} {"train_loss": -39.86898422241211, "global_step": 280366, "epoch": 2317} {"train_loss": -40.4488525390625, "global_step": 280367, "epoch": 2317} {"train_loss": -40.899574279785156, "global_step": 280368, "epoch": 2317} {"train_loss": -36.14443588256836, "global_step": 280369, "epoch": 2317} {"train_loss": -39.524173736572266, "global_step": 280370, "epoch": 2317} {"train_loss": -41.42919158935547, "global_step": 280371, "epoch": 2317} {"train_loss": -40.45620346069336, "global_step": 280372, "epoch": 2317} {"train_loss": -40.31838607788086, "global_step": 280373, "epoch": 2317} {"train_loss": -39.71162033081055, "global_step": 280374, "epoch": 2317} {"train_loss": -41.721343994140625, "global_step": 280375, "epoch": 2317} {"train_loss": -41.95941925048828, "global_step": 280376, "epoch": 2317} {"train_loss": -40.17581558227539, "global_step": 280377, "epoch": 2317} {"train_loss": -41.10771560668945, "global_step": 280378, "epoch": 2317} {"train_loss": -41.43368148803711, "global_step": 280379, "epoch": 2317} {"train_loss": -40.39010238647461, "global_step": 280380, "epoch": 2317} {"train_loss": -39.87980270385742, "global_step": 280381, "epoch": 2317} {"train_loss": -39.858604431152344, "global_step": 280382, "epoch": 2317} {"train_loss": -40.17938232421875, "global_step": 280383, "epoch": 2317} {"train_loss": -38.489845275878906, "global_step": 280384, "epoch": 2317} {"train_loss": -40.13360595703125, "global_step": 280385, "epoch": 2317} {"train_loss": -41.66023635864258, "global_step": 280386, "epoch": 2317} {"train_loss": -40.502315521240234, "global_step": 280387, "epoch": 2317} {"train_loss": -40.052093505859375, "global_step": 280388, "epoch": 2317} {"train_loss": -41.74404525756836, "global_step": 280389, "epoch": 2317} {"train_loss": -40.698604583740234, "global_step": 280390, "epoch": 2317} {"train_loss": -41.7598991394043, "global_step": 280391, "epoch": 2317} {"train_loss": -41.51456832885742, "global_step": 280392, "epoch": 2317} {"train_loss": -41.38966751098633, "global_step": 280393, "epoch": 2317} {"train_loss": -41.907012939453125, "global_step": 280394, "epoch": 2317} {"train_loss": -41.948097229003906, "global_step": 280395, "epoch": 2317} {"train_loss": -41.59579086303711, "global_step": 280396, "epoch": 2317} {"train_loss": -41.7528076171875, "global_step": 280397, "epoch": 2317} {"train_loss": -40.84527587890625, "global_step": 280398, "epoch": 2317} {"train_loss": -42.12953567504883, "global_step": 280399, "epoch": 2317} {"train_loss": -41.61941146850586, "global_step": 280400, "epoch": 2317} {"train_loss": -41.673091888427734, "global_step": 280401, "epoch": 2317} {"train_loss": -42.197750091552734, "global_step": 280402, "epoch": 2317} {"train_loss": -41.61283493041992, "global_step": 280403, "epoch": 2317} {"train_loss": -42.164146423339844, "global_step": 280404, "epoch": 2317} {"train_loss": -41.53304672241211, "global_step": 280405, "epoch": 2317} {"train_loss": -41.89958190917969, "global_step": 280406, "epoch": 2317} {"train_loss": -42.42207717895508, "global_step": 280407, "epoch": 2317} {"train_loss": -41.600460052490234, "global_step": 280408, "epoch": 2317} {"train_loss": -42.11276626586914, "global_step": 280409, "epoch": 2317} {"train_loss": -41.89797592163086, "global_step": 280410, "epoch": 2317} {"train_loss": -41.73701477050781, "global_step": 280411, "epoch": 2317} {"train_loss": -42.12534713745117, "global_step": 280412, "epoch": 2317} {"train_loss": -42.34880065917969, "global_step": 280413, "epoch": 2317} {"train_loss": -42.16434860229492, "global_step": 280414, "epoch": 2317} {"train_loss": -42.17912673950195, "global_step": 280415, "epoch": 2317} {"train_loss": -42.0032844543457, "global_step": 280416, "epoch": 2317} {"train_loss": -41.9923210144043, "global_step": 280417, "epoch": 2317} {"train_loss": -41.60514450073242, "global_step": 280418, "epoch": 2317} {"train_loss": -43.06386947631836, "global_step": 280419, "epoch": 2317} {"train_loss": -42.41844940185547, "global_step": 280420, "epoch": 2317} {"train_loss": -42.693050384521484, "global_step": 280421, "epoch": 2317} {"train_loss": -42.49246597290039, "global_step": 280422, "epoch": 2317} {"train_loss": -42.21589279174805, "global_step": 280423, "epoch": 2317} {"train_loss": -43.49575424194336, "global_step": 280424, "epoch": 2317} {"train_loss": -42.130348205566406, "global_step": 280425, "epoch": 2317} {"train_loss": -42.67156982421875, "global_step": 280426, "epoch": 2317} {"train_loss": -43.05170440673828, "global_step": 280427, "epoch": 2317} {"train_loss": -43.40421676635742, "global_step": 280428, "epoch": 2317} {"train_loss": -42.72552490234375, "global_step": 280429, "epoch": 2317} {"train_loss": -42.68606185913086, "global_step": 280430, "epoch": 2317} {"train_loss": -42.606658935546875, "global_step": 280431, "epoch": 2317} {"train_loss": -42.67379379272461, "global_step": 280432, "epoch": 2317} {"train_loss": -42.69871139526367, "global_step": 280433, "epoch": 2317} {"train_loss": -43.13655471801758, "global_step": 280434, "epoch": 2317} {"train_loss": -43.44965362548828, "global_step": 280435, "epoch": 2317} {"train_loss": -43.161678314208984, "global_step": 280436, "epoch": 2317} {"train_loss": -42.67034912109375, "global_step": 280437, "epoch": 2317} {"train_loss": -43.477325439453125, "global_step": 280438, "epoch": 2317} {"train_loss": -43.170806884765625, "global_step": 280439, "epoch": 2317} {"train_loss": -42.55525588989258, "global_step": 280440, "epoch": 2317} {"train_loss": -43.18986129760742, "global_step": 280441, "epoch": 2317} {"train_loss": -43.11955261230469, "global_step": 280442, "epoch": 2317} {"train_loss": -42.76249313354492, "global_step": 280443, "epoch": 2317} {"train_loss": -43.493133544921875, "global_step": 280444, "epoch": 2317} {"train_loss": -43.33435821533203, "global_step": 280445, "epoch": 2317} {"train_loss": -41.78878402709961, "global_step": 280446, "epoch": 2317} {"train_loss": -42.795040130615234, "global_step": 280447, "epoch": 2317} {"train_loss": -43.01771926879883, "global_step": 280448, "epoch": 2317} {"train_loss": -43.600013732910156, "global_step": 280449, "epoch": 2317} {"train_loss": -43.27790451049805, "global_step": 280450, "epoch": 2317} {"train_loss": -43.919151306152344, "global_step": 280451, "epoch": 2317} {"train_loss": -43.4173469543457, "global_step": 280452, "epoch": 2317} {"train_loss": -42.51844024658203, "global_step": 280453, "epoch": 2317} {"train_loss": -42.999305725097656, "global_step": 280454, "epoch": 2317} {"train_loss": -43.05345916748047, "global_step": 280455, "epoch": 2317} {"train_loss": -43.70241928100586, "global_step": 280456, "epoch": 2317} {"train_loss": -41.69970703125, "global_step": 280457, "epoch": 2317} {"train_loss": -42.706573486328125, "global_step": 280458, "epoch": 2317} {"train_loss": -43.01288986206055, "global_step": 280459, "epoch": 2317} {"train_loss": -42.710899353027344, "global_step": 280460, "epoch": 2317} {"train_loss": -43.001216888427734, "global_step": 280461, "epoch": 2317} {"train_loss": -42.765560150146484, "global_step": 280462, "epoch": 2317} {"train_loss": -41.73814010620117, "global_step": 280463, "epoch": 2317} {"train_loss": -41.8568229675293, "global_step": 280464, "epoch": 2317} {"train_loss": -41.61533737182617, "global_step": 280465, "epoch": 2317} {"train_loss": -43.32559585571289, "global_step": 280466, "epoch": 2317} {"train_loss": -42.74189376831055, "global_step": 280467, "epoch": 2317} {"train_loss": -41.42975616455078, "global_step": 280468, "epoch": 2317} {"train_loss": -41.897987365722656, "global_step": 280469, "epoch": 2317} {"train_loss": -43.1705207824707, "global_step": 280470, "epoch": 2317} {"train_loss": -42.215633392333984, "global_step": 280471, "epoch": 2317} {"train_loss": -41.63869857788086, "global_step": 280472, "epoch": 2317} {"train_loss": -41.06596755981445, "global_step": 280473, "epoch": 2317} {"train_loss": -40.48744583129883, "global_step": 280474, "epoch": 2317} {"train_loss": -41.93107223510742, "global_step": 280475, "epoch": 2317} {"train_loss": -42.43385696411133, "global_step": 280476, "epoch": 2317} {"train_loss": -41.83902598609609, "global_step": 280477, "epoch": 2317, "val_loss": 2493700.75} {"train_loss": -40.50640869140625, "global_step": 280478, "epoch": 2318} {"train_loss": -41.269039154052734, "global_step": 280479, "epoch": 2318} {"train_loss": -42.703460693359375, "global_step": 280480, "epoch": 2318} {"train_loss": -42.0722770690918, "global_step": 280481, "epoch": 2318} {"train_loss": -41.57009506225586, "global_step": 280482, "epoch": 2318} {"train_loss": -42.04343032836914, "global_step": 280483, "epoch": 2318} {"train_loss": -43.2448616027832, "global_step": 280484, "epoch": 2318} {"train_loss": -42.179176330566406, "global_step": 280485, "epoch": 2318} {"train_loss": -41.72658157348633, "global_step": 280486, "epoch": 2318} {"train_loss": -42.919673919677734, "global_step": 280487, "epoch": 2318} {"train_loss": -42.95354080200195, "global_step": 280488, "epoch": 2318} {"train_loss": -42.51593780517578, "global_step": 280489, "epoch": 2318} {"train_loss": -42.768951416015625, "global_step": 280490, "epoch": 2318} {"train_loss": -42.8490104675293, "global_step": 280491, "epoch": 2318} {"train_loss": -41.28043746948242, "global_step": 280492, "epoch": 2318} {"train_loss": -42.485015869140625, "global_step": 280493, "epoch": 2318} {"train_loss": -42.981658935546875, "global_step": 280494, "epoch": 2318} {"train_loss": -42.609519958496094, "global_step": 280495, "epoch": 2318} {"train_loss": -41.66825485229492, "global_step": 280496, "epoch": 2318} {"train_loss": -41.08388137817383, "global_step": 280497, "epoch": 2318} {"train_loss": -43.01992416381836, "global_step": 280498, "epoch": 2318} {"train_loss": -42.20479965209961, "global_step": 280499, "epoch": 2318} {"train_loss": -42.849143981933594, "global_step": 280500, "epoch": 2318} {"train_loss": -42.66447830200195, "global_step": 280501, "epoch": 2318} {"train_loss": -43.281490325927734, "global_step": 280502, "epoch": 2318} {"train_loss": -43.18783187866211, "global_step": 280503, "epoch": 2318} {"train_loss": -43.087825775146484, "global_step": 280504, "epoch": 2318} {"train_loss": -43.65608596801758, "global_step": 280505, "epoch": 2318} {"train_loss": -42.960872650146484, "global_step": 280506, "epoch": 2318} {"train_loss": -40.14179611206055, "global_step": 280507, "epoch": 2318} {"train_loss": -43.066184997558594, "global_step": 280508, "epoch": 2318} {"train_loss": -42.73215866088867, "global_step": 280509, "epoch": 2318} {"train_loss": -42.5062370300293, "global_step": 280510, "epoch": 2318} {"train_loss": -42.935787200927734, "global_step": 280511, "epoch": 2318} {"train_loss": -43.45540237426758, "global_step": 280512, "epoch": 2318} {"train_loss": -43.19259262084961, "global_step": 280513, "epoch": 2318} {"train_loss": -42.95286560058594, "global_step": 280514, "epoch": 2318} {"train_loss": -43.07169723510742, "global_step": 280515, "epoch": 2318} {"train_loss": -43.4535026550293, "global_step": 280516, "epoch": 2318} {"train_loss": -43.24131774902344, "global_step": 280517, "epoch": 2318} {"train_loss": -42.10444259643555, "global_step": 280518, "epoch": 2318} {"train_loss": -42.53084945678711, "global_step": 280519, "epoch": 2318} {"train_loss": -43.243587493896484, "global_step": 280520, "epoch": 2318} {"train_loss": -42.52263641357422, "global_step": 280521, "epoch": 2318} {"train_loss": -42.19024658203125, "global_step": 280522, "epoch": 2318} {"train_loss": -42.340980529785156, "global_step": 280523, "epoch": 2318} {"train_loss": -42.940853118896484, "global_step": 280524, "epoch": 2318} {"train_loss": -42.18478012084961, "global_step": 280525, "epoch": 2318} {"train_loss": -41.80940246582031, "global_step": 280526, "epoch": 2318} {"train_loss": -42.73366165161133, "global_step": 280527, "epoch": 2318} {"train_loss": -41.91518783569336, "global_step": 280528, "epoch": 2318} {"train_loss": -41.48491668701172, "global_step": 280529, "epoch": 2318} {"train_loss": -41.74135208129883, "global_step": 280530, "epoch": 2318} {"train_loss": -42.0743408203125, "global_step": 280531, "epoch": 2318} {"train_loss": -41.84896469116211, "global_step": 280532, "epoch": 2318} {"train_loss": -42.471248626708984, "global_step": 280533, "epoch": 2318} {"train_loss": -41.3154296875, "global_step": 280534, "epoch": 2318} {"train_loss": -42.57261276245117, "global_step": 280535, "epoch": 2318} {"train_loss": -41.27593994140625, "global_step": 280536, "epoch": 2318} {"train_loss": -41.25425338745117, "global_step": 280537, "epoch": 2318} {"train_loss": -43.573822021484375, "global_step": 280538, "epoch": 2318} {"train_loss": -41.90090560913086, "global_step": 280539, "epoch": 2318} {"train_loss": -42.7276611328125, "global_step": 280540, "epoch": 2318} {"train_loss": -42.9383544921875, "global_step": 280541, "epoch": 2318} {"train_loss": -41.86255645751953, "global_step": 280542, "epoch": 2318} {"train_loss": -43.09721755981445, "global_step": 280543, "epoch": 2318} {"train_loss": -41.71406936645508, "global_step": 280544, "epoch": 2318} {"train_loss": -43.292327880859375, "global_step": 280545, "epoch": 2318} {"train_loss": -42.30593490600586, "global_step": 280546, "epoch": 2318} {"train_loss": -42.567665100097656, "global_step": 280547, "epoch": 2318} {"train_loss": -42.246490478515625, "global_step": 280548, "epoch": 2318} {"train_loss": -41.339900970458984, "global_step": 280549, "epoch": 2318} {"train_loss": -42.757205963134766, "global_step": 280550, "epoch": 2318} {"train_loss": -42.850730895996094, "global_step": 280551, "epoch": 2318} {"train_loss": -42.262123107910156, "global_step": 280552, "epoch": 2318} {"train_loss": -42.73746109008789, "global_step": 280553, "epoch": 2318} {"train_loss": -42.86298751831055, "global_step": 280554, "epoch": 2318} {"train_loss": -42.08909606933594, "global_step": 280555, "epoch": 2318} {"train_loss": -42.42725372314453, "global_step": 280556, "epoch": 2318} {"train_loss": -39.846553802490234, "global_step": 280557, "epoch": 2318} {"train_loss": -39.566707611083984, "global_step": 280558, "epoch": 2318} {"train_loss": -41.83100509643555, "global_step": 280559, "epoch": 2318} {"train_loss": -40.39253234863281, "global_step": 280560, "epoch": 2318} {"train_loss": -39.65702438354492, "global_step": 280561, "epoch": 2318} {"train_loss": -41.30060958862305, "global_step": 280562, "epoch": 2318} {"train_loss": -40.417049407958984, "global_step": 280563, "epoch": 2318} {"train_loss": -38.80236053466797, "global_step": 280564, "epoch": 2318} {"train_loss": -41.21146774291992, "global_step": 280565, "epoch": 2318} {"train_loss": -41.211360931396484, "global_step": 280566, "epoch": 2318} {"train_loss": -39.40879440307617, "global_step": 280567, "epoch": 2318} {"train_loss": -42.036956787109375, "global_step": 280568, "epoch": 2318} {"train_loss": -39.92145919799805, "global_step": 280569, "epoch": 2318} {"train_loss": -41.8978271484375, "global_step": 280570, "epoch": 2318} {"train_loss": -40.91495895385742, "global_step": 280571, "epoch": 2318} {"train_loss": -40.47565460205078, "global_step": 280572, "epoch": 2318} {"train_loss": -42.35191345214844, "global_step": 280573, "epoch": 2318} {"train_loss": -40.74536895751953, "global_step": 280574, "epoch": 2318} {"train_loss": -42.08051681518555, "global_step": 280575, "epoch": 2318} {"train_loss": -41.487483978271484, "global_step": 280576, "epoch": 2318} {"train_loss": -42.76263427734375, "global_step": 280577, "epoch": 2318} {"train_loss": -42.565834045410156, "global_step": 280578, "epoch": 2318} {"train_loss": -42.05621337890625, "global_step": 280579, "epoch": 2318} {"train_loss": -42.76288604736328, "global_step": 280580, "epoch": 2318} {"train_loss": -42.773189544677734, "global_step": 280581, "epoch": 2318} {"train_loss": -41.86983871459961, "global_step": 280582, "epoch": 2318} {"train_loss": -42.49148941040039, "global_step": 280583, "epoch": 2318} {"train_loss": -42.764469146728516, "global_step": 280584, "epoch": 2318} {"train_loss": -42.823795318603516, "global_step": 280585, "epoch": 2318} {"train_loss": -43.026424407958984, "global_step": 280586, "epoch": 2318} {"train_loss": -42.554683685302734, "global_step": 280587, "epoch": 2318} {"train_loss": -41.845279693603516, "global_step": 280588, "epoch": 2318} {"train_loss": -42.70918655395508, "global_step": 280589, "epoch": 2318} {"train_loss": -42.96433639526367, "global_step": 280590, "epoch": 2318} {"train_loss": -42.07965850830078, "global_step": 280591, "epoch": 2318} {"train_loss": -43.20463943481445, "global_step": 280592, "epoch": 2318} {"train_loss": -42.953128814697266, "global_step": 280593, "epoch": 2318} {"train_loss": -43.338138580322266, "global_step": 280594, "epoch": 2318} {"train_loss": -43.4382209777832, "global_step": 280595, "epoch": 2318} {"train_loss": -42.94979476928711, "global_step": 280596, "epoch": 2318} {"train_loss": -43.71425247192383, "global_step": 280597, "epoch": 2318} {"train_loss": -42.19966125488281, "global_step": 280598, "epoch": 2318, "val_loss": 2443022.0} {"train_loss": -43.304691314697266, "global_step": 280599, "epoch": 2319} {"train_loss": -42.25295639038086, "global_step": 280600, "epoch": 2319} {"train_loss": -42.58319091796875, "global_step": 280601, "epoch": 2319} {"train_loss": -43.59153366088867, "global_step": 280602, "epoch": 2319} {"train_loss": -43.044368743896484, "global_step": 280603, "epoch": 2319} {"train_loss": -43.15658187866211, "global_step": 280604, "epoch": 2319} {"train_loss": -43.1181640625, "global_step": 280605, "epoch": 2319} {"train_loss": -43.41913986206055, "global_step": 280606, "epoch": 2319} {"train_loss": -43.420166015625, "global_step": 280607, "epoch": 2319} {"train_loss": -43.7469596862793, "global_step": 280608, "epoch": 2319} {"train_loss": -43.390724182128906, "global_step": 280609, "epoch": 2319} {"train_loss": -43.52509689331055, "global_step": 280610, "epoch": 2319} {"train_loss": -43.1658821105957, "global_step": 280611, "epoch": 2319} {"train_loss": -43.34811782836914, "global_step": 280612, "epoch": 2319} {"train_loss": -43.5186653137207, "global_step": 280613, "epoch": 2319} {"train_loss": -43.1024284362793, "global_step": 280614, "epoch": 2319} {"train_loss": -43.98855209350586, "global_step": 280615, "epoch": 2319} {"train_loss": -43.6106071472168, "global_step": 280616, "epoch": 2319} {"train_loss": -44.025482177734375, "global_step": 280617, "epoch": 2319} {"train_loss": -43.443241119384766, "global_step": 280618, "epoch": 2319} {"train_loss": -42.85248565673828, "global_step": 280619, "epoch": 2319} {"train_loss": -43.784889221191406, "global_step": 280620, "epoch": 2319} {"train_loss": -43.39262008666992, "global_step": 280621, "epoch": 2319} {"train_loss": -44.07844924926758, "global_step": 280622, "epoch": 2319} {"train_loss": -43.82630157470703, "global_step": 280623, "epoch": 2319} {"train_loss": -43.66953659057617, "global_step": 280624, "epoch": 2319} {"train_loss": -42.79619598388672, "global_step": 280625, "epoch": 2319} {"train_loss": -43.346858978271484, "global_step": 280626, "epoch": 2319} {"train_loss": -43.02997589111328, "global_step": 280627, "epoch": 2319} {"train_loss": -43.74188995361328, "global_step": 280628, "epoch": 2319} {"train_loss": -43.42144775390625, "global_step": 280629, "epoch": 2319} {"train_loss": -43.471920013427734, "global_step": 280630, "epoch": 2319} {"train_loss": -42.97726058959961, "global_step": 280631, "epoch": 2319} {"train_loss": -43.395263671875, "global_step": 280632, "epoch": 2319} {"train_loss": -44.21240997314453, "global_step": 280633, "epoch": 2319} {"train_loss": -43.233436584472656, "global_step": 280634, "epoch": 2319} {"train_loss": -42.28342819213867, "global_step": 280635, "epoch": 2319} {"train_loss": -40.78773880004883, "global_step": 280636, "epoch": 2319} {"train_loss": -40.977359771728516, "global_step": 280637, "epoch": 2319} {"train_loss": -42.399227142333984, "global_step": 280638, "epoch": 2319} {"train_loss": -43.96828079223633, "global_step": 280639, "epoch": 2319} {"train_loss": -42.869441986083984, "global_step": 280640, "epoch": 2319} {"train_loss": -41.44498062133789, "global_step": 280641, "epoch": 2319} {"train_loss": -43.17745590209961, "global_step": 280642, "epoch": 2319} {"train_loss": -42.96493148803711, "global_step": 280643, "epoch": 2319} {"train_loss": -40.76152801513672, "global_step": 280644, "epoch": 2319} {"train_loss": -41.446083068847656, "global_step": 280645, "epoch": 2319} {"train_loss": -43.022743225097656, "global_step": 280646, "epoch": 2319} {"train_loss": -43.333892822265625, "global_step": 280647, "epoch": 2319} {"train_loss": -39.67645263671875, "global_step": 280648, "epoch": 2319} {"train_loss": -42.00922775268555, "global_step": 280649, "epoch": 2319} {"train_loss": -42.932613372802734, "global_step": 280650, "epoch": 2319} {"train_loss": -41.9765739440918, "global_step": 280651, "epoch": 2319} {"train_loss": -42.20522689819336, "global_step": 280652, "epoch": 2319} {"train_loss": -42.99947738647461, "global_step": 280653, "epoch": 2319} {"train_loss": -42.41379928588867, "global_step": 280654, "epoch": 2319} {"train_loss": -42.79264450073242, "global_step": 280655, "epoch": 2319} {"train_loss": -41.910369873046875, "global_step": 280656, "epoch": 2319} {"train_loss": -42.74567413330078, "global_step": 280657, "epoch": 2319} {"train_loss": -42.36250686645508, "global_step": 280658, "epoch": 2319} {"train_loss": -41.910160064697266, "global_step": 280659, "epoch": 2319} {"train_loss": -42.484588623046875, "global_step": 280660, "epoch": 2319} {"train_loss": -41.72459030151367, "global_step": 280661, "epoch": 2319} {"train_loss": -41.617515563964844, "global_step": 280662, "epoch": 2319} {"train_loss": -42.170204162597656, "global_step": 280663, "epoch": 2319} {"train_loss": -41.14055633544922, "global_step": 280664, "epoch": 2319} {"train_loss": -43.39243698120117, "global_step": 280665, "epoch": 2319} {"train_loss": -41.29661178588867, "global_step": 280666, "epoch": 2319} {"train_loss": -42.59661865234375, "global_step": 280667, "epoch": 2319} {"train_loss": -42.77317428588867, "global_step": 280668, "epoch": 2319} {"train_loss": -42.183135986328125, "global_step": 280669, "epoch": 2319} {"train_loss": -43.14075469970703, "global_step": 280670, "epoch": 2319} {"train_loss": -40.62187576293945, "global_step": 280671, "epoch": 2319} {"train_loss": -41.90312957763672, "global_step": 280672, "epoch": 2319} {"train_loss": -41.5187873840332, "global_step": 280673, "epoch": 2319} {"train_loss": -41.51076889038086, "global_step": 280674, "epoch": 2319} {"train_loss": -40.923583984375, "global_step": 280675, "epoch": 2319} {"train_loss": -42.59443283081055, "global_step": 280676, "epoch": 2319} {"train_loss": -42.95821762084961, "global_step": 280677, "epoch": 2319} {"train_loss": -41.723304748535156, "global_step": 280678, "epoch": 2319} {"train_loss": -43.09575653076172, "global_step": 280679, "epoch": 2319} {"train_loss": -42.1500358581543, "global_step": 280680, "epoch": 2319} {"train_loss": -43.03426742553711, "global_step": 280681, "epoch": 2319} {"train_loss": -43.272377014160156, "global_step": 280682, "epoch": 2319} {"train_loss": -42.23360824584961, "global_step": 280683, "epoch": 2319} {"train_loss": -42.8847541809082, "global_step": 280684, "epoch": 2319} {"train_loss": -42.35299301147461, "global_step": 280685, "epoch": 2319} {"train_loss": -42.966915130615234, "global_step": 280686, "epoch": 2319} {"train_loss": -42.06727981567383, "global_step": 280687, "epoch": 2319} {"train_loss": -43.20463180541992, "global_step": 280688, "epoch": 2319} {"train_loss": -42.667236328125, "global_step": 280689, "epoch": 2319} {"train_loss": -43.40559005737305, "global_step": 280690, "epoch": 2319} {"train_loss": -42.78089141845703, "global_step": 280691, "epoch": 2319} {"train_loss": -43.097415924072266, "global_step": 280692, "epoch": 2319} {"train_loss": -43.611297607421875, "global_step": 280693, "epoch": 2319} {"train_loss": -42.828041076660156, "global_step": 280694, "epoch": 2319} {"train_loss": -43.22637939453125, "global_step": 280695, "epoch": 2319} {"train_loss": -43.08445739746094, "global_step": 280696, "epoch": 2319} {"train_loss": -44.192771911621094, "global_step": 280697, "epoch": 2319} {"train_loss": -42.960445404052734, "global_step": 280698, "epoch": 2319} {"train_loss": -43.8520622253418, "global_step": 280699, "epoch": 2319} {"train_loss": -43.548770904541016, "global_step": 280700, "epoch": 2319} {"train_loss": -43.716670989990234, "global_step": 280701, "epoch": 2319} {"train_loss": -43.79813766479492, "global_step": 280702, "epoch": 2319} {"train_loss": -43.28658676147461, "global_step": 280703, "epoch": 2319} {"train_loss": -43.45223617553711, "global_step": 280704, "epoch": 2319} {"train_loss": -43.229549407958984, "global_step": 280705, "epoch": 2319} {"train_loss": -43.52898025512695, "global_step": 280706, "epoch": 2319} {"train_loss": -43.970252990722656, "global_step": 280707, "epoch": 2319} {"train_loss": -43.446533203125, "global_step": 280708, "epoch": 2319} {"train_loss": -43.90421676635742, "global_step": 280709, "epoch": 2319} {"train_loss": -43.7667121887207, "global_step": 280710, "epoch": 2319} {"train_loss": -43.7907829284668, "global_step": 280711, "epoch": 2319} {"train_loss": -43.66303634643555, "global_step": 280712, "epoch": 2319} {"train_loss": -43.99259567260742, "global_step": 280713, "epoch": 2319} {"train_loss": -43.955318450927734, "global_step": 280714, "epoch": 2319} {"train_loss": -42.930477142333984, "global_step": 280715, "epoch": 2319} {"train_loss": -43.02284622192383, "global_step": 280716, "epoch": 2319} {"train_loss": -43.459957122802734, "global_step": 280717, "epoch": 2319} {"train_loss": -43.30057144165039, "global_step": 280718, "epoch": 2319} {"train_loss": -42.88595814350223, "global_step": 280719, "epoch": 2319, "val_loss": 2479720.0} {"train_loss": -43.205162048339844, "global_step": 280720, "epoch": 2320} {"train_loss": -43.87357711791992, "global_step": 280721, "epoch": 2320} {"train_loss": -43.72883987426758, "global_step": 280722, "epoch": 2320} {"train_loss": -44.41259765625, "global_step": 280723, "epoch": 2320} {"train_loss": -43.73688888549805, "global_step": 280724, "epoch": 2320} {"train_loss": -43.63686752319336, "global_step": 280725, "epoch": 2320} {"train_loss": -43.69346237182617, "global_step": 280726, "epoch": 2320} {"train_loss": -43.74978256225586, "global_step": 280727, "epoch": 2320} {"train_loss": -43.48817825317383, "global_step": 280728, "epoch": 2320} {"train_loss": -43.32164001464844, "global_step": 280729, "epoch": 2320} {"train_loss": -43.255001068115234, "global_step": 280730, "epoch": 2320} {"train_loss": -43.328983306884766, "global_step": 280731, "epoch": 2320} {"train_loss": -43.9128532409668, "global_step": 280732, "epoch": 2320} {"train_loss": -42.51681137084961, "global_step": 280733, "epoch": 2320} {"train_loss": -43.08612823486328, "global_step": 280734, "epoch": 2320} {"train_loss": -43.701812744140625, "global_step": 280735, "epoch": 2320} {"train_loss": -43.307735443115234, "global_step": 280736, "epoch": 2320} {"train_loss": -43.19074249267578, "global_step": 280737, "epoch": 2320} {"train_loss": -42.8405876159668, "global_step": 280738, "epoch": 2320} {"train_loss": -43.311058044433594, "global_step": 280739, "epoch": 2320} {"train_loss": -43.540016174316406, "global_step": 280740, "epoch": 2320} {"train_loss": -42.01530075073242, "global_step": 280741, "epoch": 2320} {"train_loss": -40.85233688354492, "global_step": 280742, "epoch": 2320} {"train_loss": -42.505828857421875, "global_step": 280743, "epoch": 2320} {"train_loss": -41.88885498046875, "global_step": 280744, "epoch": 2320} {"train_loss": -42.609310150146484, "global_step": 280745, "epoch": 2320} {"train_loss": -40.25800323486328, "global_step": 280746, "epoch": 2320} {"train_loss": -39.38481521606445, "global_step": 280747, "epoch": 2320} {"train_loss": -37.58023452758789, "global_step": 280748, "epoch": 2320} {"train_loss": -37.943538665771484, "global_step": 280749, "epoch": 2320} {"train_loss": -37.2738037109375, "global_step": 280750, "epoch": 2320} {"train_loss": -38.49985122680664, "global_step": 280751, "epoch": 2320} {"train_loss": -40.028533935546875, "global_step": 280752, "epoch": 2320} {"train_loss": -41.05942916870117, "global_step": 280753, "epoch": 2320} {"train_loss": -41.9436149597168, "global_step": 280754, "epoch": 2320} {"train_loss": -38.513031005859375, "global_step": 280755, "epoch": 2320} {"train_loss": -40.7713623046875, "global_step": 280756, "epoch": 2320} {"train_loss": -40.9404296875, "global_step": 280757, "epoch": 2320} {"train_loss": -39.95868682861328, "global_step": 280758, "epoch": 2320} {"train_loss": -41.520565032958984, "global_step": 280759, "epoch": 2320} {"train_loss": -40.317989349365234, "global_step": 280760, "epoch": 2320} {"train_loss": -40.543148040771484, "global_step": 280761, "epoch": 2320} {"train_loss": -40.95064926147461, "global_step": 280762, "epoch": 2320} {"train_loss": -41.59741973876953, "global_step": 280763, "epoch": 2320} {"train_loss": -42.18443298339844, "global_step": 280764, "epoch": 2320} {"train_loss": -42.04670333862305, "global_step": 280765, "epoch": 2320} {"train_loss": -40.9306640625, "global_step": 280766, "epoch": 2320} {"train_loss": -42.43717575073242, "global_step": 280767, "epoch": 2320} {"train_loss": -41.67905044555664, "global_step": 280768, "epoch": 2320} {"train_loss": -42.049072265625, "global_step": 280769, "epoch": 2320} {"train_loss": -42.123043060302734, "global_step": 280770, "epoch": 2320} {"train_loss": -41.99424362182617, "global_step": 280771, "epoch": 2320} {"train_loss": -42.6234245300293, "global_step": 280772, "epoch": 2320} {"train_loss": -42.3558464050293, "global_step": 280773, "epoch": 2320} {"train_loss": -43.27901840209961, "global_step": 280774, "epoch": 2320} {"train_loss": -42.836360931396484, "global_step": 280775, "epoch": 2320} {"train_loss": -43.13418197631836, "global_step": 280776, "epoch": 2320} {"train_loss": -42.654571533203125, "global_step": 280777, "epoch": 2320} {"train_loss": -42.28062057495117, "global_step": 280778, "epoch": 2320} {"train_loss": -43.29240036010742, "global_step": 280779, "epoch": 2320} {"train_loss": -43.08369064331055, "global_step": 280780, "epoch": 2320} {"train_loss": -43.50921630859375, "global_step": 280781, "epoch": 2320} {"train_loss": -43.0455322265625, "global_step": 280782, "epoch": 2320} {"train_loss": -42.65342330932617, "global_step": 280783, "epoch": 2320} {"train_loss": -43.02268600463867, "global_step": 280784, "epoch": 2320} {"train_loss": -42.583168029785156, "global_step": 280785, "epoch": 2320} {"train_loss": -43.092742919921875, "global_step": 280786, "epoch": 2320} {"train_loss": -42.0261116027832, "global_step": 280787, "epoch": 2320} {"train_loss": -41.63338851928711, "global_step": 280788, "epoch": 2320} {"train_loss": -42.6437873840332, "global_step": 280789, "epoch": 2320} {"train_loss": -42.76043701171875, "global_step": 280790, "epoch": 2320} {"train_loss": -42.59564208984375, "global_step": 280791, "epoch": 2320} {"train_loss": -42.446434020996094, "global_step": 280792, "epoch": 2320} {"train_loss": -42.59297561645508, "global_step": 280793, "epoch": 2320} {"train_loss": -43.212921142578125, "global_step": 280794, "epoch": 2320} {"train_loss": -42.0259895324707, "global_step": 280795, "epoch": 2320} {"train_loss": -43.2332878112793, "global_step": 280796, "epoch": 2320} {"train_loss": -43.4305534362793, "global_step": 280797, "epoch": 2320} {"train_loss": -42.89955520629883, "global_step": 280798, "epoch": 2320} {"train_loss": -43.553070068359375, "global_step": 280799, "epoch": 2320} {"train_loss": -42.90839385986328, "global_step": 280800, "epoch": 2320} {"train_loss": -43.03522491455078, "global_step": 280801, "epoch": 2320} {"train_loss": -43.84194564819336, "global_step": 280802, "epoch": 2320} {"train_loss": -43.312744140625, "global_step": 280803, "epoch": 2320} {"train_loss": -44.00400924682617, "global_step": 280804, "epoch": 2320} {"train_loss": -44.090126037597656, "global_step": 280805, "epoch": 2320} {"train_loss": -43.75442886352539, "global_step": 280806, "epoch": 2320} {"train_loss": -43.772377014160156, "global_step": 280807, "epoch": 2320} {"train_loss": -43.979583740234375, "global_step": 280808, "epoch": 2320} {"train_loss": -43.912288665771484, "global_step": 280809, "epoch": 2320} {"train_loss": -43.58798599243164, "global_step": 280810, "epoch": 2320} {"train_loss": -43.99616241455078, "global_step": 280811, "epoch": 2320} {"train_loss": -43.254432678222656, "global_step": 280812, "epoch": 2320} {"train_loss": -43.94430923461914, "global_step": 280813, "epoch": 2320} {"train_loss": -43.66493606567383, "global_step": 280814, "epoch": 2320} {"train_loss": -43.504459381103516, "global_step": 280815, "epoch": 2320} {"train_loss": -43.91064453125, "global_step": 280816, "epoch": 2320} {"train_loss": -44.078365325927734, "global_step": 280817, "epoch": 2320} {"train_loss": -44.22755432128906, "global_step": 280818, "epoch": 2320} {"train_loss": -43.71775436401367, "global_step": 280819, "epoch": 2320} {"train_loss": -43.5095329284668, "global_step": 280820, "epoch": 2320} {"train_loss": -43.370018005371094, "global_step": 280821, "epoch": 2320} {"train_loss": -43.40735626220703, "global_step": 280822, "epoch": 2320} {"train_loss": -44.090118408203125, "global_step": 280823, "epoch": 2320} {"train_loss": -43.64491271972656, "global_step": 280824, "epoch": 2320} {"train_loss": -43.38288116455078, "global_step": 280825, "epoch": 2320} {"train_loss": -43.39638900756836, "global_step": 280826, "epoch": 2320} {"train_loss": -40.489322662353516, "global_step": 280827, "epoch": 2320} {"train_loss": -44.01008224487305, "global_step": 280828, "epoch": 2320} {"train_loss": -42.86184310913086, "global_step": 280829, "epoch": 2320} {"train_loss": -41.4557991027832, "global_step": 280830, "epoch": 2320} {"train_loss": -42.280982971191406, "global_step": 280831, "epoch": 2320} {"train_loss": -43.568450927734375, "global_step": 280832, "epoch": 2320} {"train_loss": -44.022159576416016, "global_step": 280833, "epoch": 2320} {"train_loss": -42.8812141418457, "global_step": 280834, "epoch": 2320} {"train_loss": -42.89339828491211, "global_step": 280835, "epoch": 2320} {"train_loss": -42.823585510253906, "global_step": 280836, "epoch": 2320} {"train_loss": -42.514427185058594, "global_step": 280837, "epoch": 2320} {"train_loss": -43.36581039428711, "global_step": 280838, "epoch": 2320} {"train_loss": -43.94306564331055, "global_step": 280839, "epoch": 2320} {"train_loss": -42.61144701114371, "global_step": 280840, "epoch": 2320, "val_loss": 2543523.0} {"train_loss": -43.13867950439453, "global_step": 280841, "epoch": 2321} {"train_loss": -36.432762145996094, "global_step": 280842, "epoch": 2321} {"train_loss": -42.66428756713867, "global_step": 280843, "epoch": 2321} {"train_loss": -43.597381591796875, "global_step": 280844, "epoch": 2321} {"train_loss": -43.670753479003906, "global_step": 280845, "epoch": 2321} {"train_loss": -43.6043815612793, "global_step": 280846, "epoch": 2321} {"train_loss": -43.2130241394043, "global_step": 280847, "epoch": 2321} {"train_loss": -43.81629180908203, "global_step": 280848, "epoch": 2321} {"train_loss": -41.65389633178711, "global_step": 280849, "epoch": 2321} {"train_loss": -43.79140853881836, "global_step": 280850, "epoch": 2321} {"train_loss": -43.7534294128418, "global_step": 280851, "epoch": 2321} {"train_loss": -43.58491897583008, "global_step": 280852, "epoch": 2321} {"train_loss": -43.839935302734375, "global_step": 280853, "epoch": 2321} {"train_loss": -43.92216110229492, "global_step": 280854, "epoch": 2321} {"train_loss": -43.74644470214844, "global_step": 280855, "epoch": 2321} {"train_loss": -43.989192962646484, "global_step": 280856, "epoch": 2321} {"train_loss": -34.1096305847168, "global_step": 280857, "epoch": 2321} {"train_loss": -42.38218307495117, "global_step": 280858, "epoch": 2321} {"train_loss": -39.74528503417969, "global_step": 280859, "epoch": 2321} {"train_loss": -42.02570343017578, "global_step": 280860, "epoch": 2321} {"train_loss": -42.977630615234375, "global_step": 280861, "epoch": 2321} {"train_loss": -41.55605697631836, "global_step": 280862, "epoch": 2321} {"train_loss": -41.183135986328125, "global_step": 280863, "epoch": 2321} {"train_loss": -43.17039108276367, "global_step": 280864, "epoch": 2321} {"train_loss": -41.81434631347656, "global_step": 280865, "epoch": 2321} {"train_loss": -42.08250045776367, "global_step": 280866, "epoch": 2321} {"train_loss": -43.577491760253906, "global_step": 280867, "epoch": 2321} {"train_loss": -42.939144134521484, "global_step": 280868, "epoch": 2321} {"train_loss": -42.92356491088867, "global_step": 280869, "epoch": 2321} {"train_loss": -43.76007080078125, "global_step": 280870, "epoch": 2321} {"train_loss": -40.02704620361328, "global_step": 280871, "epoch": 2321} {"train_loss": -43.100276947021484, "global_step": 280872, "epoch": 2321} {"train_loss": -42.699039459228516, "global_step": 280873, "epoch": 2321} {"train_loss": -43.09519577026367, "global_step": 280874, "epoch": 2321} {"train_loss": -41.33805847167969, "global_step": 280875, "epoch": 2321} {"train_loss": -42.47963333129883, "global_step": 280876, "epoch": 2321} {"train_loss": -43.979095458984375, "global_step": 280877, "epoch": 2321} {"train_loss": -42.57379913330078, "global_step": 280878, "epoch": 2321} {"train_loss": -42.31765365600586, "global_step": 280879, "epoch": 2321} {"train_loss": -42.71940994262695, "global_step": 280880, "epoch": 2321} {"train_loss": -43.51229476928711, "global_step": 280881, "epoch": 2321} {"train_loss": -42.82554244995117, "global_step": 280882, "epoch": 2321} {"train_loss": -39.841766357421875, "global_step": 280883, "epoch": 2321} {"train_loss": -43.719783782958984, "global_step": 280884, "epoch": 2321} {"train_loss": -40.43989944458008, "global_step": 280885, "epoch": 2321} {"train_loss": -42.037818908691406, "global_step": 280886, "epoch": 2321} {"train_loss": -41.936256408691406, "global_step": 280887, "epoch": 2321} {"train_loss": -42.043853759765625, "global_step": 280888, "epoch": 2321} {"train_loss": -43.34391784667969, "global_step": 280889, "epoch": 2321} {"train_loss": -43.105438232421875, "global_step": 280890, "epoch": 2321} {"train_loss": -41.798072814941406, "global_step": 280891, "epoch": 2321} {"train_loss": -42.66278839111328, "global_step": 280892, "epoch": 2321} {"train_loss": -43.15116500854492, "global_step": 280893, "epoch": 2321} {"train_loss": -37.91221618652344, "global_step": 280894, "epoch": 2321} {"train_loss": -42.82805633544922, "global_step": 280895, "epoch": 2321} {"train_loss": -41.804866790771484, "global_step": 280896, "epoch": 2321} {"train_loss": -42.7620964050293, "global_step": 280897, "epoch": 2321} {"train_loss": -42.488216400146484, "global_step": 280898, "epoch": 2321} {"train_loss": -41.27767562866211, "global_step": 280899, "epoch": 2321} {"train_loss": -41.297706604003906, "global_step": 280900, "epoch": 2321} {"train_loss": -41.54400634765625, "global_step": 280901, "epoch": 2321} {"train_loss": -40.79555892944336, "global_step": 280902, "epoch": 2321} {"train_loss": -34.39303207397461, "global_step": 280903, "epoch": 2321} {"train_loss": -42.67591094970703, "global_step": 280904, "epoch": 2321} {"train_loss": -39.31318664550781, "global_step": 280905, "epoch": 2321} {"train_loss": -41.94221115112305, "global_step": 280906, "epoch": 2321} {"train_loss": -42.97309494018555, "global_step": 280907, "epoch": 2321} {"train_loss": -41.8360481262207, "global_step": 280908, "epoch": 2321} {"train_loss": -42.0380744934082, "global_step": 280909, "epoch": 2321} {"train_loss": -41.446590423583984, "global_step": 280910, "epoch": 2321} {"train_loss": -40.44692611694336, "global_step": 280911, "epoch": 2321} {"train_loss": -36.251502990722656, "global_step": 280912, "epoch": 2321} {"train_loss": -41.68812942504883, "global_step": 280913, "epoch": 2321} {"train_loss": -42.159629821777344, "global_step": 280914, "epoch": 2321} {"train_loss": -40.93882369995117, "global_step": 280915, "epoch": 2321} {"train_loss": -42.590492248535156, "global_step": 280916, "epoch": 2321} {"train_loss": -42.82191848754883, "global_step": 280917, "epoch": 2321} {"train_loss": -40.844940185546875, "global_step": 280918, "epoch": 2321} {"train_loss": -42.735504150390625, "global_step": 280919, "epoch": 2321} {"train_loss": -38.51820373535156, "global_step": 280920, "epoch": 2321} {"train_loss": -41.76298141479492, "global_step": 280921, "epoch": 2321} {"train_loss": -42.60585403442383, "global_step": 280922, "epoch": 2321} {"train_loss": -40.70474624633789, "global_step": 280923, "epoch": 2321} {"train_loss": -41.64960479736328, "global_step": 280924, "epoch": 2321} {"train_loss": -39.1937255859375, "global_step": 280925, "epoch": 2321} {"train_loss": -41.62306594848633, "global_step": 280926, "epoch": 2321} {"train_loss": -41.30100631713867, "global_step": 280927, "epoch": 2321} {"train_loss": -41.93264389038086, "global_step": 280928, "epoch": 2321} {"train_loss": -41.626953125, "global_step": 280929, "epoch": 2321} {"train_loss": -42.24408721923828, "global_step": 280930, "epoch": 2321} {"train_loss": -41.405086517333984, "global_step": 280931, "epoch": 2321} {"train_loss": -41.70024490356445, "global_step": 280932, "epoch": 2321} {"train_loss": -43.14809799194336, "global_step": 280933, "epoch": 2321} {"train_loss": -42.489776611328125, "global_step": 280934, "epoch": 2321} {"train_loss": -42.70321273803711, "global_step": 280935, "epoch": 2321} {"train_loss": -41.87490463256836, "global_step": 280936, "epoch": 2321} {"train_loss": -42.97534942626953, "global_step": 280937, "epoch": 2321} {"train_loss": -41.59408187866211, "global_step": 280938, "epoch": 2321} {"train_loss": -42.54320526123047, "global_step": 280939, "epoch": 2321} {"train_loss": -42.692413330078125, "global_step": 280940, "epoch": 2321} {"train_loss": -40.999359130859375, "global_step": 280941, "epoch": 2321} {"train_loss": -42.393157958984375, "global_step": 280942, "epoch": 2321} {"train_loss": -42.78289794921875, "global_step": 280943, "epoch": 2321} {"train_loss": -42.23097229003906, "global_step": 280944, "epoch": 2321} {"train_loss": -43.33494186401367, "global_step": 280945, "epoch": 2321} {"train_loss": -42.7251091003418, "global_step": 280946, "epoch": 2321} {"train_loss": -43.35262680053711, "global_step": 280947, "epoch": 2321} {"train_loss": -42.964759826660156, "global_step": 280948, "epoch": 2321} {"train_loss": -42.760231018066406, "global_step": 280949, "epoch": 2321} {"train_loss": -42.66987228393555, "global_step": 280950, "epoch": 2321} {"train_loss": -42.28968048095703, "global_step": 280951, "epoch": 2321} {"train_loss": -43.03110885620117, "global_step": 280952, "epoch": 2321} {"train_loss": -43.17177963256836, "global_step": 280953, "epoch": 2321} {"train_loss": -42.20158767700195, "global_step": 280954, "epoch": 2321} {"train_loss": -42.8381233215332, "global_step": 280955, "epoch": 2321} {"train_loss": -43.16025924682617, "global_step": 280956, "epoch": 2321} {"train_loss": -42.385921478271484, "global_step": 280957, "epoch": 2321} {"train_loss": -43.535057067871094, "global_step": 280958, "epoch": 2321} {"train_loss": -42.42974853515625, "global_step": 280959, "epoch": 2321} {"train_loss": -42.48108673095703, "global_step": 280960, "epoch": 2321} {"train_loss": -42.07157024667283, "global_step": 280961, "epoch": 2321, "val_loss": 2498194.25} {"train_loss": -43.13063430786133, "global_step": 280962, "epoch": 2322} {"train_loss": -41.54156494140625, "global_step": 280963, "epoch": 2322} {"train_loss": -42.79328155517578, "global_step": 280964, "epoch": 2322} {"train_loss": -42.6165885925293, "global_step": 280965, "epoch": 2322} {"train_loss": -41.956298828125, "global_step": 280966, "epoch": 2322} {"train_loss": -43.354244232177734, "global_step": 280967, "epoch": 2322} {"train_loss": -43.265907287597656, "global_step": 280968, "epoch": 2322} {"train_loss": -41.173439025878906, "global_step": 280969, "epoch": 2322} {"train_loss": -42.284759521484375, "global_step": 280970, "epoch": 2322} {"train_loss": -41.60973358154297, "global_step": 280971, "epoch": 2322} {"train_loss": -43.7215690612793, "global_step": 280972, "epoch": 2322} {"train_loss": -43.21348571777344, "global_step": 280973, "epoch": 2322} {"train_loss": -42.827796936035156, "global_step": 280974, "epoch": 2322} {"train_loss": -43.64082717895508, "global_step": 280975, "epoch": 2322} {"train_loss": -43.363372802734375, "global_step": 280976, "epoch": 2322} {"train_loss": -42.987911224365234, "global_step": 280977, "epoch": 2322} {"train_loss": -43.72381591796875, "global_step": 280978, "epoch": 2322} {"train_loss": -43.310489654541016, "global_step": 280979, "epoch": 2322} {"train_loss": -43.54749298095703, "global_step": 280980, "epoch": 2322} {"train_loss": -43.75940704345703, "global_step": 280981, "epoch": 2322} {"train_loss": -43.57859420776367, "global_step": 280982, "epoch": 2322} {"train_loss": -43.62887191772461, "global_step": 280983, "epoch": 2322} {"train_loss": -42.25428771972656, "global_step": 280984, "epoch": 2322} {"train_loss": -43.06264114379883, "global_step": 280985, "epoch": 2322} {"train_loss": -44.02035140991211, "global_step": 280986, "epoch": 2322} {"train_loss": -43.320518493652344, "global_step": 280987, "epoch": 2322} {"train_loss": -41.892391204833984, "global_step": 280988, "epoch": 2322} {"train_loss": -42.32954788208008, "global_step": 280989, "epoch": 2322} {"train_loss": -42.62323760986328, "global_step": 280990, "epoch": 2322} {"train_loss": -41.579280853271484, "global_step": 280991, "epoch": 2322} {"train_loss": -41.36385726928711, "global_step": 280992, "epoch": 2322} {"train_loss": -42.363887786865234, "global_step": 280993, "epoch": 2322} {"train_loss": -43.166603088378906, "global_step": 280994, "epoch": 2322} {"train_loss": -42.07351303100586, "global_step": 280995, "epoch": 2322} {"train_loss": -42.17932891845703, "global_step": 280996, "epoch": 2322} {"train_loss": -43.15693283081055, "global_step": 280997, "epoch": 2322} {"train_loss": -41.408016204833984, "global_step": 280998, "epoch": 2322} {"train_loss": -40.356502532958984, "global_step": 280999, "epoch": 2322} {"train_loss": -40.75138473510742, "global_step": 281000, "epoch": 2322} {"train_loss": -41.287235260009766, "global_step": 281001, "epoch": 2322} {"train_loss": -43.132240295410156, "global_step": 281002, "epoch": 2322} {"train_loss": -39.89073944091797, "global_step": 281003, "epoch": 2322} {"train_loss": -40.26350021362305, "global_step": 281004, "epoch": 2322} {"train_loss": -39.546661376953125, "global_step": 281005, "epoch": 2322} {"train_loss": -42.017784118652344, "global_step": 281006, "epoch": 2322} {"train_loss": -42.78139877319336, "global_step": 281007, "epoch": 2322} {"train_loss": -40.910980224609375, "global_step": 281008, "epoch": 2322} {"train_loss": -40.104923248291016, "global_step": 281009, "epoch": 2322} {"train_loss": -42.1245231628418, "global_step": 281010, "epoch": 2322} {"train_loss": -40.54832077026367, "global_step": 281011, "epoch": 2322} {"train_loss": -40.089107513427734, "global_step": 281012, "epoch": 2322} {"train_loss": -41.93917465209961, "global_step": 281013, "epoch": 2322} {"train_loss": -41.4973030090332, "global_step": 281014, "epoch": 2322} {"train_loss": -42.4354362487793, "global_step": 281015, "epoch": 2322} {"train_loss": -42.02084732055664, "global_step": 281016, "epoch": 2322} {"train_loss": -42.52117156982422, "global_step": 281017, "epoch": 2322} {"train_loss": -42.14240264892578, "global_step": 281018, "epoch": 2322} {"train_loss": -42.7915153503418, "global_step": 281019, "epoch": 2322} {"train_loss": -43.36188888549805, "global_step": 281020, "epoch": 2322} {"train_loss": -43.69146728515625, "global_step": 281021, "epoch": 2322} {"train_loss": -43.07596969604492, "global_step": 281022, "epoch": 2322} {"train_loss": -43.18880844116211, "global_step": 281023, "epoch": 2322} {"train_loss": -43.277366638183594, "global_step": 281024, "epoch": 2322} {"train_loss": -43.11103820800781, "global_step": 281025, "epoch": 2322} {"train_loss": -43.13147735595703, "global_step": 281026, "epoch": 2322} {"train_loss": -43.45634460449219, "global_step": 281027, "epoch": 2322} {"train_loss": -43.236122131347656, "global_step": 281028, "epoch": 2322} {"train_loss": -43.535255432128906, "global_step": 281029, "epoch": 2322} {"train_loss": -43.611812591552734, "global_step": 281030, "epoch": 2322} {"train_loss": -43.07052230834961, "global_step": 281031, "epoch": 2322} {"train_loss": -43.40446853637695, "global_step": 281032, "epoch": 2322} {"train_loss": -43.71946334838867, "global_step": 281033, "epoch": 2322} {"train_loss": -43.268978118896484, "global_step": 281034, "epoch": 2322} {"train_loss": -43.376155853271484, "global_step": 281035, "epoch": 2322} {"train_loss": -43.523529052734375, "global_step": 281036, "epoch": 2322} {"train_loss": -43.44624328613281, "global_step": 281037, "epoch": 2322} {"train_loss": -44.143592834472656, "global_step": 281038, "epoch": 2322} {"train_loss": -43.07719802856445, "global_step": 281039, "epoch": 2322} {"train_loss": -43.3947639465332, "global_step": 281040, "epoch": 2322} {"train_loss": -43.6678581237793, "global_step": 281041, "epoch": 2322} {"train_loss": -43.713844299316406, "global_step": 281042, "epoch": 2322} {"train_loss": -43.419891357421875, "global_step": 281043, "epoch": 2322} {"train_loss": -43.53952407836914, "global_step": 281044, "epoch": 2322} {"train_loss": -43.14109420776367, "global_step": 281045, "epoch": 2322} {"train_loss": -44.304988861083984, "global_step": 281046, "epoch": 2322} {"train_loss": -43.9567985534668, "global_step": 281047, "epoch": 2322} {"train_loss": -43.975250244140625, "global_step": 281048, "epoch": 2322} {"train_loss": -43.9282341003418, "global_step": 281049, "epoch": 2322} {"train_loss": -43.96476745605469, "global_step": 281050, "epoch": 2322} {"train_loss": -44.3709716796875, "global_step": 281051, "epoch": 2322} {"train_loss": -43.72768783569336, "global_step": 281052, "epoch": 2322} {"train_loss": -43.63477325439453, "global_step": 281053, "epoch": 2322} {"train_loss": -43.63262939453125, "global_step": 281054, "epoch": 2322} {"train_loss": -43.316558837890625, "global_step": 281055, "epoch": 2322} {"train_loss": -44.03413009643555, "global_step": 281056, "epoch": 2322} {"train_loss": -43.76235580444336, "global_step": 281057, "epoch": 2322} {"train_loss": -42.60139846801758, "global_step": 281058, "epoch": 2322} {"train_loss": -43.36800003051758, "global_step": 281059, "epoch": 2322} {"train_loss": -43.41891098022461, "global_step": 281060, "epoch": 2322} {"train_loss": -44.093292236328125, "global_step": 281061, "epoch": 2322} {"train_loss": -43.91097640991211, "global_step": 281062, "epoch": 2322} {"train_loss": -43.906410217285156, "global_step": 281063, "epoch": 2322} {"train_loss": -44.43430709838867, "global_step": 281064, "epoch": 2322} {"train_loss": -44.487972259521484, "global_step": 281065, "epoch": 2322} {"train_loss": -44.31224060058594, "global_step": 281066, "epoch": 2322} {"train_loss": -43.315887451171875, "global_step": 281067, "epoch": 2322} {"train_loss": -43.857566833496094, "global_step": 281068, "epoch": 2322} {"train_loss": -44.479610443115234, "global_step": 281069, "epoch": 2322} {"train_loss": -43.93471908569336, "global_step": 281070, "epoch": 2322} {"train_loss": -44.135223388671875, "global_step": 281071, "epoch": 2322} {"train_loss": -43.52682113647461, "global_step": 281072, "epoch": 2322} {"train_loss": -43.5980339050293, "global_step": 281073, "epoch": 2322} {"train_loss": -43.72700881958008, "global_step": 281074, "epoch": 2322} {"train_loss": -43.55103302001953, "global_step": 281075, "epoch": 2322} {"train_loss": -42.44208908081055, "global_step": 281076, "epoch": 2322} {"train_loss": -43.681617736816406, "global_step": 281077, "epoch": 2322} {"train_loss": -43.68700408935547, "global_step": 281078, "epoch": 2322} {"train_loss": -42.479305267333984, "global_step": 281079, "epoch": 2322} {"train_loss": -43.182090759277344, "global_step": 281080, "epoch": 2322} {"train_loss": -43.04951095581055, "global_step": 281081, "epoch": 2322} {"train_loss": -42.94581484203496, "global_step": 281082, "epoch": 2322, "val_loss": 2453111.25} {"train_loss": -43.679603576660156, "global_step": 281083, "epoch": 2323} {"train_loss": -42.29838943481445, "global_step": 281084, "epoch": 2323} {"train_loss": -41.25529098510742, "global_step": 281085, "epoch": 2323} {"train_loss": -41.7195930480957, "global_step": 281086, "epoch": 2323} {"train_loss": -43.1567497253418, "global_step": 281087, "epoch": 2323} {"train_loss": -43.01041793823242, "global_step": 281088, "epoch": 2323} {"train_loss": -40.93958282470703, "global_step": 281089, "epoch": 2323} {"train_loss": -42.17774200439453, "global_step": 281090, "epoch": 2323} {"train_loss": -41.29536056518555, "global_step": 281091, "epoch": 2323} {"train_loss": -37.8805046081543, "global_step": 281092, "epoch": 2323} {"train_loss": -42.273590087890625, "global_step": 281093, "epoch": 2323} {"train_loss": -38.81785583496094, "global_step": 281094, "epoch": 2323} {"train_loss": -40.20707702636719, "global_step": 281095, "epoch": 2323} {"train_loss": -42.46126937866211, "global_step": 281096, "epoch": 2323} {"train_loss": -36.928646087646484, "global_step": 281097, "epoch": 2323} {"train_loss": -37.800533294677734, "global_step": 281098, "epoch": 2323} {"train_loss": -41.65336227416992, "global_step": 281099, "epoch": 2323} {"train_loss": -38.98405075073242, "global_step": 281100, "epoch": 2323} {"train_loss": -42.02649688720703, "global_step": 281101, "epoch": 2323} {"train_loss": -37.66450881958008, "global_step": 281102, "epoch": 2323} {"train_loss": -35.45463943481445, "global_step": 281103, "epoch": 2323} {"train_loss": -40.189239501953125, "global_step": 281104, "epoch": 2323} {"train_loss": -36.7895393371582, "global_step": 281105, "epoch": 2323} {"train_loss": -40.05421829223633, "global_step": 281106, "epoch": 2323} {"train_loss": -33.96588134765625, "global_step": 281107, "epoch": 2323} {"train_loss": -37.237667083740234, "global_step": 281108, "epoch": 2323} {"train_loss": -39.004608154296875, "global_step": 281109, "epoch": 2323} {"train_loss": -37.49160385131836, "global_step": 281110, "epoch": 2323} {"train_loss": -37.569427490234375, "global_step": 281111, "epoch": 2323} {"train_loss": -39.52895736694336, "global_step": 281112, "epoch": 2323} {"train_loss": -38.463478088378906, "global_step": 281113, "epoch": 2323} {"train_loss": -38.62069320678711, "global_step": 281114, "epoch": 2323} {"train_loss": -39.362247467041016, "global_step": 281115, "epoch": 2323} {"train_loss": -39.809661865234375, "global_step": 281116, "epoch": 2323} {"train_loss": -39.13067626953125, "global_step": 281117, "epoch": 2323} {"train_loss": -40.996788024902344, "global_step": 281118, "epoch": 2323} {"train_loss": -41.48737335205078, "global_step": 281119, "epoch": 2323} {"train_loss": -41.201534271240234, "global_step": 281120, "epoch": 2323} {"train_loss": -40.928157806396484, "global_step": 281121, "epoch": 2323} {"train_loss": -41.745574951171875, "global_step": 281122, "epoch": 2323} {"train_loss": -41.89716339111328, "global_step": 281123, "epoch": 2323} {"train_loss": -41.417301177978516, "global_step": 281124, "epoch": 2323} {"train_loss": -41.724159240722656, "global_step": 281125, "epoch": 2323} {"train_loss": -41.79026794433594, "global_step": 281126, "epoch": 2323} {"train_loss": -41.43024826049805, "global_step": 281127, "epoch": 2323} {"train_loss": -41.5460319519043, "global_step": 281128, "epoch": 2323} {"train_loss": -41.725189208984375, "global_step": 281129, "epoch": 2323} {"train_loss": -41.72532272338867, "global_step": 281130, "epoch": 2323} {"train_loss": -41.711090087890625, "global_step": 281131, "epoch": 2323} {"train_loss": -42.12984848022461, "global_step": 281132, "epoch": 2323} {"train_loss": -42.26917266845703, "global_step": 281133, "epoch": 2323} {"train_loss": -42.3041877746582, "global_step": 281134, "epoch": 2323} {"train_loss": -42.7818717956543, "global_step": 281135, "epoch": 2323} {"train_loss": -42.58452224731445, "global_step": 281136, "epoch": 2323} {"train_loss": -42.39497756958008, "global_step": 281137, "epoch": 2323} {"train_loss": -42.60572052001953, "global_step": 281138, "epoch": 2323} {"train_loss": -42.558406829833984, "global_step": 281139, "epoch": 2323} {"train_loss": -42.32405090332031, "global_step": 281140, "epoch": 2323} {"train_loss": -42.16704559326172, "global_step": 281141, "epoch": 2323} {"train_loss": -42.98334884643555, "global_step": 281142, "epoch": 2323} {"train_loss": -42.291717529296875, "global_step": 281143, "epoch": 2323} {"train_loss": -43.08515167236328, "global_step": 281144, "epoch": 2323} {"train_loss": -42.99726104736328, "global_step": 281145, "epoch": 2323} {"train_loss": -42.855525970458984, "global_step": 281146, "epoch": 2323} {"train_loss": -43.087371826171875, "global_step": 281147, "epoch": 2323} {"train_loss": -42.977962493896484, "global_step": 281148, "epoch": 2323} {"train_loss": -42.57319259643555, "global_step": 281149, "epoch": 2323} {"train_loss": -43.01090621948242, "global_step": 281150, "epoch": 2323} {"train_loss": -43.00653076171875, "global_step": 281151, "epoch": 2323} {"train_loss": -43.1628532409668, "global_step": 281152, "epoch": 2323} {"train_loss": -43.32261657714844, "global_step": 281153, "epoch": 2323} {"train_loss": -42.75056076049805, "global_step": 281154, "epoch": 2323} {"train_loss": -43.27114486694336, "global_step": 281155, "epoch": 2323} {"train_loss": -43.78007125854492, "global_step": 281156, "epoch": 2323} {"train_loss": -43.803829193115234, "global_step": 281157, "epoch": 2323} {"train_loss": -43.946109771728516, "global_step": 281158, "epoch": 2323} {"train_loss": -43.76118850708008, "global_step": 281159, "epoch": 2323} {"train_loss": -43.33076858520508, "global_step": 281160, "epoch": 2323} {"train_loss": -43.684364318847656, "global_step": 281161, "epoch": 2323} {"train_loss": -43.61928939819336, "global_step": 281162, "epoch": 2323} {"train_loss": -43.73036575317383, "global_step": 281163, "epoch": 2323} {"train_loss": -43.32456970214844, "global_step": 281164, "epoch": 2323} {"train_loss": -43.56681442260742, "global_step": 281165, "epoch": 2323} {"train_loss": -43.680824279785156, "global_step": 281166, "epoch": 2323} {"train_loss": -43.911102294921875, "global_step": 281167, "epoch": 2323} {"train_loss": -43.91560745239258, "global_step": 281168, "epoch": 2323} {"train_loss": -44.125736236572266, "global_step": 281169, "epoch": 2323} {"train_loss": -43.791988372802734, "global_step": 281170, "epoch": 2323} {"train_loss": -44.25779342651367, "global_step": 281171, "epoch": 2323} {"train_loss": -43.83869552612305, "global_step": 281172, "epoch": 2323} {"train_loss": -43.96370315551758, "global_step": 281173, "epoch": 2323} {"train_loss": -44.24574279785156, "global_step": 281174, "epoch": 2323} {"train_loss": -44.21175003051758, "global_step": 281175, "epoch": 2323} {"train_loss": -44.35056686401367, "global_step": 281176, "epoch": 2323} {"train_loss": -44.42338943481445, "global_step": 281177, "epoch": 2323} {"train_loss": -44.06430435180664, "global_step": 281178, "epoch": 2323} {"train_loss": -44.14619445800781, "global_step": 281179, "epoch": 2323} {"train_loss": -44.488502502441406, "global_step": 281180, "epoch": 2323} {"train_loss": -44.04243087768555, "global_step": 281181, "epoch": 2323} {"train_loss": -44.4373893737793, "global_step": 281182, "epoch": 2323} {"train_loss": -44.343658447265625, "global_step": 281183, "epoch": 2323} {"train_loss": -44.109310150146484, "global_step": 281184, "epoch": 2323} {"train_loss": -44.40464401245117, "global_step": 281185, "epoch": 2323} {"train_loss": -44.081153869628906, "global_step": 281186, "epoch": 2323} {"train_loss": -44.22011184692383, "global_step": 281187, "epoch": 2323} {"train_loss": -44.63557434082031, "global_step": 281188, "epoch": 2323} {"train_loss": -44.42460632324219, "global_step": 281189, "epoch": 2323} {"train_loss": -43.685604095458984, "global_step": 281190, "epoch": 2323} {"train_loss": -43.87864303588867, "global_step": 281191, "epoch": 2323} {"train_loss": -44.31599807739258, "global_step": 281192, "epoch": 2323} {"train_loss": -44.21053695678711, "global_step": 281193, "epoch": 2323} {"train_loss": -44.818790435791016, "global_step": 281194, "epoch": 2323} {"train_loss": -44.421791076660156, "global_step": 281195, "epoch": 2323} {"train_loss": -43.95519256591797, "global_step": 281196, "epoch": 2323} {"train_loss": -44.179012298583984, "global_step": 281197, "epoch": 2323} {"train_loss": -44.05859375, "global_step": 281198, "epoch": 2323} {"train_loss": -44.05439376831055, "global_step": 281199, "epoch": 2323} {"train_loss": -43.641971588134766, "global_step": 281200, "epoch": 2323} {"train_loss": -43.4600944519043, "global_step": 281201, "epoch": 2323} {"train_loss": -42.41712188720703, "global_step": 281202, "epoch": 2323} {"train_loss": -42.198631286621094, "global_step": 281203, "epoch": 2323, "val_loss": 2491052.75} {"train_loss": -44.702293395996094, "global_step": 281204, "epoch": 2324} {"train_loss": -43.434730529785156, "global_step": 281205, "epoch": 2324} {"train_loss": -42.80129623413086, "global_step": 281206, "epoch": 2324} {"train_loss": -41.15058135986328, "global_step": 281207, "epoch": 2324} {"train_loss": -42.7252082824707, "global_step": 281208, "epoch": 2324} {"train_loss": -44.191219329833984, "global_step": 281209, "epoch": 2324} {"train_loss": -43.76327133178711, "global_step": 281210, "epoch": 2324} {"train_loss": -42.89139938354492, "global_step": 281211, "epoch": 2324} {"train_loss": -41.24019241333008, "global_step": 281212, "epoch": 2324} {"train_loss": -40.281192779541016, "global_step": 281213, "epoch": 2324} {"train_loss": -42.96837615966797, "global_step": 281214, "epoch": 2324} {"train_loss": -39.07563781738281, "global_step": 281215, "epoch": 2324} {"train_loss": -41.72842025756836, "global_step": 281216, "epoch": 2324} {"train_loss": -43.15806198120117, "global_step": 281217, "epoch": 2324} {"train_loss": -38.04609298706055, "global_step": 281218, "epoch": 2324} {"train_loss": -37.67349624633789, "global_step": 281219, "epoch": 2324} {"train_loss": -42.23564529418945, "global_step": 281220, "epoch": 2324} {"train_loss": -32.64165496826172, "global_step": 281221, "epoch": 2324} {"train_loss": -31.136627197265625, "global_step": 281222, "epoch": 2324} {"train_loss": -41.2446403503418, "global_step": 281223, "epoch": 2324} {"train_loss": -37.56048583984375, "global_step": 281224, "epoch": 2324} {"train_loss": -37.63337326049805, "global_step": 281225, "epoch": 2324} {"train_loss": -40.25698471069336, "global_step": 281226, "epoch": 2324} {"train_loss": -41.08641815185547, "global_step": 281227, "epoch": 2324} {"train_loss": -39.9989128112793, "global_step": 281228, "epoch": 2324} {"train_loss": -39.2747688293457, "global_step": 281229, "epoch": 2324} {"train_loss": -41.536808013916016, "global_step": 281230, "epoch": 2324} {"train_loss": -41.98720932006836, "global_step": 281231, "epoch": 2324} {"train_loss": -36.640525817871094, "global_step": 281232, "epoch": 2324} {"train_loss": -39.644073486328125, "global_step": 281233, "epoch": 2324} {"train_loss": -41.75555419921875, "global_step": 281234, "epoch": 2324} {"train_loss": -39.82400131225586, "global_step": 281235, "epoch": 2324} {"train_loss": -42.470184326171875, "global_step": 281236, "epoch": 2324} {"train_loss": -39.68178939819336, "global_step": 281237, "epoch": 2324} {"train_loss": -40.57229232788086, "global_step": 281238, "epoch": 2324} {"train_loss": -41.80683517456055, "global_step": 281239, "epoch": 2324} {"train_loss": -39.9643440246582, "global_step": 281240, "epoch": 2324} {"train_loss": -41.939788818359375, "global_step": 281241, "epoch": 2324} {"train_loss": -39.897098541259766, "global_step": 281242, "epoch": 2324} {"train_loss": -39.377803802490234, "global_step": 281243, "epoch": 2324} {"train_loss": -41.89933395385742, "global_step": 281244, "epoch": 2324} {"train_loss": -39.64925765991211, "global_step": 281245, "epoch": 2324} {"train_loss": -42.41481399536133, "global_step": 281246, "epoch": 2324} {"train_loss": -41.409603118896484, "global_step": 281247, "epoch": 2324} {"train_loss": -42.40431594848633, "global_step": 281248, "epoch": 2324} {"train_loss": -42.13956832885742, "global_step": 281249, "epoch": 2324} {"train_loss": -42.10132598876953, "global_step": 281250, "epoch": 2324} {"train_loss": -42.38624954223633, "global_step": 281251, "epoch": 2324} {"train_loss": -41.5038948059082, "global_step": 281252, "epoch": 2324} {"train_loss": -42.686092376708984, "global_step": 281253, "epoch": 2324} {"train_loss": -42.27055358886719, "global_step": 281254, "epoch": 2324} {"train_loss": -42.77044677734375, "global_step": 281255, "epoch": 2324} {"train_loss": -42.849891662597656, "global_step": 281256, "epoch": 2324} {"train_loss": -42.80941390991211, "global_step": 281257, "epoch": 2324} {"train_loss": -42.36320114135742, "global_step": 281258, "epoch": 2324} {"train_loss": -43.03660202026367, "global_step": 281259, "epoch": 2324} {"train_loss": -43.210418701171875, "global_step": 281260, "epoch": 2324} {"train_loss": -42.64991760253906, "global_step": 281261, "epoch": 2324} {"train_loss": -42.98406982421875, "global_step": 281262, "epoch": 2324} {"train_loss": -42.24917984008789, "global_step": 281263, "epoch": 2324} {"train_loss": -42.907508850097656, "global_step": 281264, "epoch": 2324} {"train_loss": -42.82778549194336, "global_step": 281265, "epoch": 2324} {"train_loss": -42.64754867553711, "global_step": 281266, "epoch": 2324} {"train_loss": -43.209285736083984, "global_step": 281267, "epoch": 2324} {"train_loss": -42.5380744934082, "global_step": 281268, "epoch": 2324} {"train_loss": -43.18424606323242, "global_step": 281269, "epoch": 2324} {"train_loss": -42.54978561401367, "global_step": 281270, "epoch": 2324} {"train_loss": -41.90345001220703, "global_step": 281271, "epoch": 2324} {"train_loss": -42.90846633911133, "global_step": 281272, "epoch": 2324} {"train_loss": -42.187068939208984, "global_step": 281273, "epoch": 2324} {"train_loss": -43.44175338745117, "global_step": 281274, "epoch": 2324} {"train_loss": -43.133636474609375, "global_step": 281275, "epoch": 2324} {"train_loss": -43.568321228027344, "global_step": 281276, "epoch": 2324} {"train_loss": -42.8407096862793, "global_step": 281277, "epoch": 2324} {"train_loss": -43.29732894897461, "global_step": 281278, "epoch": 2324} {"train_loss": -43.34660720825195, "global_step": 281279, "epoch": 2324} {"train_loss": -43.014007568359375, "global_step": 281280, "epoch": 2324} {"train_loss": -42.92384719848633, "global_step": 281281, "epoch": 2324} {"train_loss": -42.75631332397461, "global_step": 281282, "epoch": 2324} {"train_loss": -43.738826751708984, "global_step": 281283, "epoch": 2324} {"train_loss": -43.088706970214844, "global_step": 281284, "epoch": 2324} {"train_loss": -43.58765411376953, "global_step": 281285, "epoch": 2324} {"train_loss": -43.22331619262695, "global_step": 281286, "epoch": 2324} {"train_loss": -43.50859832763672, "global_step": 281287, "epoch": 2324} {"train_loss": -43.16614532470703, "global_step": 281288, "epoch": 2324} {"train_loss": -43.414676666259766, "global_step": 281289, "epoch": 2324} {"train_loss": -43.45732498168945, "global_step": 281290, "epoch": 2324} {"train_loss": -43.523860931396484, "global_step": 281291, "epoch": 2324} {"train_loss": -43.06312942504883, "global_step": 281292, "epoch": 2324} {"train_loss": -43.365142822265625, "global_step": 281293, "epoch": 2324} {"train_loss": -43.841121673583984, "global_step": 281294, "epoch": 2324} {"train_loss": -44.02082443237305, "global_step": 281295, "epoch": 2324} {"train_loss": -43.74250030517578, "global_step": 281296, "epoch": 2324} {"train_loss": -43.54779052734375, "global_step": 281297, "epoch": 2324} {"train_loss": -43.989227294921875, "global_step": 281298, "epoch": 2324} {"train_loss": -44.19883346557617, "global_step": 281299, "epoch": 2324} {"train_loss": -43.94441223144531, "global_step": 281300, "epoch": 2324} {"train_loss": -43.50864791870117, "global_step": 281301, "epoch": 2324} {"train_loss": -44.065494537353516, "global_step": 281302, "epoch": 2324} {"train_loss": -43.469947814941406, "global_step": 281303, "epoch": 2324} {"train_loss": -43.76390838623047, "global_step": 281304, "epoch": 2324} {"train_loss": -43.5467529296875, "global_step": 281305, "epoch": 2324} {"train_loss": -43.78230667114258, "global_step": 281306, "epoch": 2324} {"train_loss": -43.49824142456055, "global_step": 281307, "epoch": 2324} {"train_loss": -43.96072006225586, "global_step": 281308, "epoch": 2324} {"train_loss": -43.24471664428711, "global_step": 281309, "epoch": 2324} {"train_loss": -43.9105339050293, "global_step": 281310, "epoch": 2324} {"train_loss": -44.05335998535156, "global_step": 281311, "epoch": 2324} {"train_loss": -43.6922492980957, "global_step": 281312, "epoch": 2324} {"train_loss": -43.28437805175781, "global_step": 281313, "epoch": 2324} {"train_loss": -44.26313400268555, "global_step": 281314, "epoch": 2324} {"train_loss": -44.00566482543945, "global_step": 281315, "epoch": 2324} {"train_loss": -43.65237808227539, "global_step": 281316, "epoch": 2324} {"train_loss": -43.859867095947266, "global_step": 281317, "epoch": 2324} {"train_loss": -43.99635696411133, "global_step": 281318, "epoch": 2324} {"train_loss": -43.60943603515625, "global_step": 281319, "epoch": 2324} {"train_loss": -44.14429473876953, "global_step": 281320, "epoch": 2324} {"train_loss": -44.1849250793457, "global_step": 281321, "epoch": 2324} {"train_loss": -44.21449661254883, "global_step": 281322, "epoch": 2324} {"train_loss": -44.5414924621582, "global_step": 281323, "epoch": 2324} {"train_loss": -42.293234170960986, "global_step": 281324, "epoch": 2324, "val_loss": 2524355.75} {"train_loss": -44.096031188964844, "global_step": 281325, "epoch": 2325} {"train_loss": -44.40763473510742, "global_step": 281326, "epoch": 2325} {"train_loss": -43.845882415771484, "global_step": 281327, "epoch": 2325} {"train_loss": -43.35282516479492, "global_step": 281328, "epoch": 2325} {"train_loss": -44.68281936645508, "global_step": 281329, "epoch": 2325} {"train_loss": -43.861045837402344, "global_step": 281330, "epoch": 2325} {"train_loss": -43.13812255859375, "global_step": 281331, "epoch": 2325} {"train_loss": -44.082210540771484, "global_step": 281332, "epoch": 2325} {"train_loss": -44.177486419677734, "global_step": 281333, "epoch": 2325} {"train_loss": -43.73181915283203, "global_step": 281334, "epoch": 2325} {"train_loss": -43.1829719543457, "global_step": 281335, "epoch": 2325} {"train_loss": -43.865272521972656, "global_step": 281336, "epoch": 2325} {"train_loss": -43.44525146484375, "global_step": 281337, "epoch": 2325} {"train_loss": -43.76850128173828, "global_step": 281338, "epoch": 2325} {"train_loss": -43.436309814453125, "global_step": 281339, "epoch": 2325} {"train_loss": -43.23530197143555, "global_step": 281340, "epoch": 2325} {"train_loss": -41.58834457397461, "global_step": 281341, "epoch": 2325} {"train_loss": -40.69181442260742, "global_step": 281342, "epoch": 2325} {"train_loss": -38.64291763305664, "global_step": 281343, "epoch": 2325} {"train_loss": -38.033695220947266, "global_step": 281344, "epoch": 2325} {"train_loss": -40.572235107421875, "global_step": 281345, "epoch": 2325} {"train_loss": -31.331329345703125, "global_step": 281346, "epoch": 2325} {"train_loss": -37.30706787109375, "global_step": 281347, "epoch": 2325} {"train_loss": -36.081268310546875, "global_step": 281348, "epoch": 2325} {"train_loss": -33.08739471435547, "global_step": 281349, "epoch": 2325} {"train_loss": -37.757354736328125, "global_step": 281350, "epoch": 2325} {"train_loss": -33.397003173828125, "global_step": 281351, "epoch": 2325} {"train_loss": -37.52863693237305, "global_step": 281352, "epoch": 2325} {"train_loss": -34.41718673706055, "global_step": 281353, "epoch": 2325} {"train_loss": -38.10248565673828, "global_step": 281354, "epoch": 2325} {"train_loss": -37.10789108276367, "global_step": 281355, "epoch": 2325} {"train_loss": -39.48751449584961, "global_step": 281356, "epoch": 2325} {"train_loss": -38.45117950439453, "global_step": 281357, "epoch": 2325} {"train_loss": -39.7547607421875, "global_step": 281358, "epoch": 2325} {"train_loss": -39.94162368774414, "global_step": 281359, "epoch": 2325} {"train_loss": -36.964988708496094, "global_step": 281360, "epoch": 2325} {"train_loss": -40.89724349975586, "global_step": 281361, "epoch": 2325} {"train_loss": -38.82845687866211, "global_step": 281362, "epoch": 2325} {"train_loss": -41.88190841674805, "global_step": 281363, "epoch": 2325} {"train_loss": -40.76709747314453, "global_step": 281364, "epoch": 2325} {"train_loss": -41.103851318359375, "global_step": 281365, "epoch": 2325} {"train_loss": -41.862640380859375, "global_step": 281366, "epoch": 2325} {"train_loss": -41.38555145263672, "global_step": 281367, "epoch": 2325} {"train_loss": -40.342376708984375, "global_step": 281368, "epoch": 2325} {"train_loss": -42.20996856689453, "global_step": 281369, "epoch": 2325} {"train_loss": -41.20595169067383, "global_step": 281370, "epoch": 2325} {"train_loss": -41.88438415527344, "global_step": 281371, "epoch": 2325} {"train_loss": -42.141822814941406, "global_step": 281372, "epoch": 2325} {"train_loss": -41.49614715576172, "global_step": 281373, "epoch": 2325} {"train_loss": -42.4368896484375, "global_step": 281374, "epoch": 2325} {"train_loss": -42.597259521484375, "global_step": 281375, "epoch": 2325} {"train_loss": -41.86517333984375, "global_step": 281376, "epoch": 2325} {"train_loss": -42.13985824584961, "global_step": 281377, "epoch": 2325} {"train_loss": -42.32512664794922, "global_step": 281378, "epoch": 2325} {"train_loss": -41.895347595214844, "global_step": 281379, "epoch": 2325} {"train_loss": -42.56343460083008, "global_step": 281380, "epoch": 2325} {"train_loss": -42.806488037109375, "global_step": 281381, "epoch": 2325} {"train_loss": -42.69835662841797, "global_step": 281382, "epoch": 2325} {"train_loss": -42.82719039916992, "global_step": 281383, "epoch": 2325} {"train_loss": -42.77203369140625, "global_step": 281384, "epoch": 2325} {"train_loss": -42.6447868347168, "global_step": 281385, "epoch": 2325} {"train_loss": -42.65278244018555, "global_step": 281386, "epoch": 2325} {"train_loss": -43.08062744140625, "global_step": 281387, "epoch": 2325} {"train_loss": -42.441558837890625, "global_step": 281388, "epoch": 2325} {"train_loss": -42.94135665893555, "global_step": 281389, "epoch": 2325} {"train_loss": -43.100284576416016, "global_step": 281390, "epoch": 2325} {"train_loss": -42.440643310546875, "global_step": 281391, "epoch": 2325} {"train_loss": -43.0037956237793, "global_step": 281392, "epoch": 2325} {"train_loss": -43.08191680908203, "global_step": 281393, "epoch": 2325} {"train_loss": -43.40645217895508, "global_step": 281394, "epoch": 2325} {"train_loss": -43.1580810546875, "global_step": 281395, "epoch": 2325} {"train_loss": -43.81077194213867, "global_step": 281396, "epoch": 2325} {"train_loss": -43.37624740600586, "global_step": 281397, "epoch": 2325} {"train_loss": -43.34939956665039, "global_step": 281398, "epoch": 2325} {"train_loss": -43.5015983581543, "global_step": 281399, "epoch": 2325} {"train_loss": -43.50460433959961, "global_step": 281400, "epoch": 2325} {"train_loss": -43.92877197265625, "global_step": 281401, "epoch": 2325} {"train_loss": -43.53176498413086, "global_step": 281402, "epoch": 2325} {"train_loss": -43.55411911010742, "global_step": 281403, "epoch": 2325} {"train_loss": -43.10722732543945, "global_step": 281404, "epoch": 2325} {"train_loss": -43.657161712646484, "global_step": 281405, "epoch": 2325} {"train_loss": -43.76032638549805, "global_step": 281406, "epoch": 2325} {"train_loss": -43.48936462402344, "global_step": 281407, "epoch": 2325} {"train_loss": -42.90180969238281, "global_step": 281408, "epoch": 2325} {"train_loss": -43.155452728271484, "global_step": 281409, "epoch": 2325} {"train_loss": -43.78542709350586, "global_step": 281410, "epoch": 2325} {"train_loss": -43.28300857543945, "global_step": 281411, "epoch": 2325} {"train_loss": -43.71339416503906, "global_step": 281412, "epoch": 2325} {"train_loss": -43.2335090637207, "global_step": 281413, "epoch": 2325} {"train_loss": -41.70853805541992, "global_step": 281414, "epoch": 2325} {"train_loss": -43.52568435668945, "global_step": 281415, "epoch": 2325} {"train_loss": -42.897216796875, "global_step": 281416, "epoch": 2325} {"train_loss": -43.24111557006836, "global_step": 281417, "epoch": 2325} {"train_loss": -43.603878021240234, "global_step": 281418, "epoch": 2325} {"train_loss": -43.863983154296875, "global_step": 281419, "epoch": 2325} {"train_loss": -42.85860824584961, "global_step": 281420, "epoch": 2325} {"train_loss": -42.96604537963867, "global_step": 281421, "epoch": 2325} {"train_loss": -43.42011642456055, "global_step": 281422, "epoch": 2325} {"train_loss": -43.77869415283203, "global_step": 281423, "epoch": 2325} {"train_loss": -42.94137191772461, "global_step": 281424, "epoch": 2325} {"train_loss": -43.44350814819336, "global_step": 281425, "epoch": 2325} {"train_loss": -43.848018646240234, "global_step": 281426, "epoch": 2325} {"train_loss": -43.68803405761719, "global_step": 281427, "epoch": 2325} {"train_loss": -42.882808685302734, "global_step": 281428, "epoch": 2325} {"train_loss": -43.255531311035156, "global_step": 281429, "epoch": 2325} {"train_loss": -43.98542022705078, "global_step": 281430, "epoch": 2325} {"train_loss": -43.93739700317383, "global_step": 281431, "epoch": 2325} {"train_loss": -43.6990852355957, "global_step": 281432, "epoch": 2325} {"train_loss": -44.206932067871094, "global_step": 281433, "epoch": 2325} {"train_loss": -43.82020950317383, "global_step": 281434, "epoch": 2325} {"train_loss": -43.858917236328125, "global_step": 281435, "epoch": 2325} {"train_loss": -43.610103607177734, "global_step": 281436, "epoch": 2325} {"train_loss": -42.6772575378418, "global_step": 281437, "epoch": 2325} {"train_loss": -42.61536407470703, "global_step": 281438, "epoch": 2325} {"train_loss": -43.41121292114258, "global_step": 281439, "epoch": 2325} {"train_loss": -43.613861083984375, "global_step": 281440, "epoch": 2325} {"train_loss": -42.522315979003906, "global_step": 281441, "epoch": 2325} {"train_loss": -43.780513763427734, "global_step": 281442, "epoch": 2325} {"train_loss": -42.834041595458984, "global_step": 281443, "epoch": 2325} {"train_loss": -42.88711166381836, "global_step": 281444, "epoch": 2325} {"train_loss": -42.109554385350755, "global_step": 281445, "epoch": 2325, "val_loss": 2509835.75} {"train_loss": -42.06473922729492, "global_step": 281446, "epoch": 2326} {"train_loss": -41.388771057128906, "global_step": 281447, "epoch": 2326} {"train_loss": -43.43560791015625, "global_step": 281448, "epoch": 2326} {"train_loss": -42.06483459472656, "global_step": 281449, "epoch": 2326} {"train_loss": -41.660701751708984, "global_step": 281450, "epoch": 2326} {"train_loss": -41.90125274658203, "global_step": 281451, "epoch": 2326} {"train_loss": -41.89335250854492, "global_step": 281452, "epoch": 2326} {"train_loss": -41.8160285949707, "global_step": 281453, "epoch": 2326} {"train_loss": -42.460166931152344, "global_step": 281454, "epoch": 2326} {"train_loss": -42.160396575927734, "global_step": 281455, "epoch": 2326} {"train_loss": -42.234798431396484, "global_step": 281456, "epoch": 2326} {"train_loss": -42.6135139465332, "global_step": 281457, "epoch": 2326} {"train_loss": -39.881134033203125, "global_step": 281458, "epoch": 2326} {"train_loss": -42.300209045410156, "global_step": 281459, "epoch": 2326} {"train_loss": -43.080650329589844, "global_step": 281460, "epoch": 2326} {"train_loss": -42.19757843017578, "global_step": 281461, "epoch": 2326} {"train_loss": -42.25457000732422, "global_step": 281462, "epoch": 2326} {"train_loss": -42.22013854980469, "global_step": 281463, "epoch": 2326} {"train_loss": -42.60956573486328, "global_step": 281464, "epoch": 2326} {"train_loss": -43.199378967285156, "global_step": 281465, "epoch": 2326} {"train_loss": -42.947906494140625, "global_step": 281466, "epoch": 2326} {"train_loss": -42.759857177734375, "global_step": 281467, "epoch": 2326} {"train_loss": -41.67304611206055, "global_step": 281468, "epoch": 2326} {"train_loss": -42.539608001708984, "global_step": 281469, "epoch": 2326} {"train_loss": -43.541622161865234, "global_step": 281470, "epoch": 2326} {"train_loss": -42.67522430419922, "global_step": 281471, "epoch": 2326} {"train_loss": -43.186309814453125, "global_step": 281472, "epoch": 2326} {"train_loss": -43.512062072753906, "global_step": 281473, "epoch": 2326} {"train_loss": -43.200233459472656, "global_step": 281474, "epoch": 2326} {"train_loss": -42.78650665283203, "global_step": 281475, "epoch": 2326} {"train_loss": -42.55450439453125, "global_step": 281476, "epoch": 2326} {"train_loss": -42.194129943847656, "global_step": 281477, "epoch": 2326} {"train_loss": -42.518245697021484, "global_step": 281478, "epoch": 2326} {"train_loss": -43.002777099609375, "global_step": 281479, "epoch": 2326} {"train_loss": -42.32510757446289, "global_step": 281480, "epoch": 2326} {"train_loss": -42.94704055786133, "global_step": 281481, "epoch": 2326} {"train_loss": -43.20455551147461, "global_step": 281482, "epoch": 2326} {"train_loss": -42.451175689697266, "global_step": 281483, "epoch": 2326} {"train_loss": -43.285850524902344, "global_step": 281484, "epoch": 2326} {"train_loss": -42.53013610839844, "global_step": 281485, "epoch": 2326} {"train_loss": -43.113868713378906, "global_step": 281486, "epoch": 2326} {"train_loss": -42.956756591796875, "global_step": 281487, "epoch": 2326} {"train_loss": -42.91657638549805, "global_step": 281488, "epoch": 2326} {"train_loss": -43.8125, "global_step": 281489, "epoch": 2326} {"train_loss": -43.046504974365234, "global_step": 281490, "epoch": 2326} {"train_loss": -43.388763427734375, "global_step": 281491, "epoch": 2326} {"train_loss": -43.2381591796875, "global_step": 281492, "epoch": 2326} {"train_loss": -42.30207443237305, "global_step": 281493, "epoch": 2326} {"train_loss": -44.09312057495117, "global_step": 281494, "epoch": 2326} {"train_loss": -42.971954345703125, "global_step": 281495, "epoch": 2326} {"train_loss": -43.52384567260742, "global_step": 281496, "epoch": 2326} {"train_loss": -43.416900634765625, "global_step": 281497, "epoch": 2326} {"train_loss": -43.11009216308594, "global_step": 281498, "epoch": 2326} {"train_loss": -43.39858627319336, "global_step": 281499, "epoch": 2326} {"train_loss": -43.57455062866211, "global_step": 281500, "epoch": 2326} {"train_loss": -43.556575775146484, "global_step": 281501, "epoch": 2326} {"train_loss": -43.35539245605469, "global_step": 281502, "epoch": 2326} {"train_loss": -43.75334167480469, "global_step": 281503, "epoch": 2326} {"train_loss": -43.52293014526367, "global_step": 281504, "epoch": 2326} {"train_loss": -43.32450485229492, "global_step": 281505, "epoch": 2326} {"train_loss": -43.548866271972656, "global_step": 281506, "epoch": 2326} {"train_loss": -43.708370208740234, "global_step": 281507, "epoch": 2326} {"train_loss": -43.43634033203125, "global_step": 281508, "epoch": 2326} {"train_loss": -43.963619232177734, "global_step": 281509, "epoch": 2326} {"train_loss": -43.66273880004883, "global_step": 281510, "epoch": 2326} {"train_loss": -43.50849533081055, "global_step": 281511, "epoch": 2326} {"train_loss": -43.15757751464844, "global_step": 281512, "epoch": 2326} {"train_loss": -43.984619140625, "global_step": 281513, "epoch": 2326} {"train_loss": -43.35828399658203, "global_step": 281514, "epoch": 2326} {"train_loss": -43.712745666503906, "global_step": 281515, "epoch": 2326} {"train_loss": -43.51969909667969, "global_step": 281516, "epoch": 2326} {"train_loss": -43.30125045776367, "global_step": 281517, "epoch": 2326} {"train_loss": -43.63261032104492, "global_step": 281518, "epoch": 2326} {"train_loss": -43.997291564941406, "global_step": 281519, "epoch": 2326} {"train_loss": -43.77368927001953, "global_step": 281520, "epoch": 2326} {"train_loss": -43.8393440246582, "global_step": 281521, "epoch": 2326} {"train_loss": -43.71092987060547, "global_step": 281522, "epoch": 2326} {"train_loss": -44.1051139831543, "global_step": 281523, "epoch": 2326} {"train_loss": -43.96464920043945, "global_step": 281524, "epoch": 2326} {"train_loss": -43.848506927490234, "global_step": 281525, "epoch": 2326} {"train_loss": -42.735347747802734, "global_step": 281526, "epoch": 2326} {"train_loss": -43.75214767456055, "global_step": 281527, "epoch": 2326} {"train_loss": -44.140323638916016, "global_step": 281528, "epoch": 2326} {"train_loss": -44.12901306152344, "global_step": 281529, "epoch": 2326} {"train_loss": -43.92382049560547, "global_step": 281530, "epoch": 2326} {"train_loss": -44.266807556152344, "global_step": 281531, "epoch": 2326} {"train_loss": -44.180728912353516, "global_step": 281532, "epoch": 2326} {"train_loss": -43.49522018432617, "global_step": 281533, "epoch": 2326} {"train_loss": -43.985530853271484, "global_step": 281534, "epoch": 2326} {"train_loss": -44.27944564819336, "global_step": 281535, "epoch": 2326} {"train_loss": -44.026611328125, "global_step": 281536, "epoch": 2326} {"train_loss": -44.140193939208984, "global_step": 281537, "epoch": 2326} {"train_loss": -43.814613342285156, "global_step": 281538, "epoch": 2326} {"train_loss": -44.241390228271484, "global_step": 281539, "epoch": 2326} {"train_loss": -43.74117660522461, "global_step": 281540, "epoch": 2326} {"train_loss": -43.60963439941406, "global_step": 281541, "epoch": 2326} {"train_loss": -43.61570358276367, "global_step": 281542, "epoch": 2326} {"train_loss": -44.040016174316406, "global_step": 281543, "epoch": 2326} {"train_loss": -44.00020217895508, "global_step": 281544, "epoch": 2326} {"train_loss": -43.96429443359375, "global_step": 281545, "epoch": 2326} {"train_loss": -44.28908920288086, "global_step": 281546, "epoch": 2326} {"train_loss": -43.56190872192383, "global_step": 281547, "epoch": 2326} {"train_loss": -41.91663360595703, "global_step": 281548, "epoch": 2326} {"train_loss": -41.1844596862793, "global_step": 281549, "epoch": 2326} {"train_loss": -41.37297439575195, "global_step": 281550, "epoch": 2326} {"train_loss": -42.250282287597656, "global_step": 281551, "epoch": 2326} {"train_loss": -42.56873321533203, "global_step": 281552, "epoch": 2326} {"train_loss": -42.0484619140625, "global_step": 281553, "epoch": 2326} {"train_loss": -42.99734115600586, "global_step": 281554, "epoch": 2326} {"train_loss": -42.46871566772461, "global_step": 281555, "epoch": 2326} {"train_loss": -42.7440071105957, "global_step": 281556, "epoch": 2326} {"train_loss": -43.58986282348633, "global_step": 281557, "epoch": 2326} {"train_loss": -43.241939544677734, "global_step": 281558, "epoch": 2326} {"train_loss": -42.959407806396484, "global_step": 281559, "epoch": 2326} {"train_loss": -43.472808837890625, "global_step": 281560, "epoch": 2326} {"train_loss": -42.08052444458008, "global_step": 281561, "epoch": 2326} {"train_loss": -41.54218673706055, "global_step": 281562, "epoch": 2326} {"train_loss": -42.51690673828125, "global_step": 281563, "epoch": 2326} {"train_loss": -41.96892547607422, "global_step": 281564, "epoch": 2326} {"train_loss": -41.81082534790039, "global_step": 281565, "epoch": 2326} {"train_loss": -43.05530128794268, "global_step": 281566, "epoch": 2326, "val_loss": 2516043.25} {"train_loss": -42.91565704345703, "global_step": 281567, "epoch": 2327} {"train_loss": -42.2735481262207, "global_step": 281568, "epoch": 2327} {"train_loss": -41.78251266479492, "global_step": 281569, "epoch": 2327} {"train_loss": -41.974239349365234, "global_step": 281570, "epoch": 2327} {"train_loss": -43.06415939331055, "global_step": 281571, "epoch": 2327} {"train_loss": -40.993343353271484, "global_step": 281572, "epoch": 2327} {"train_loss": -41.07461166381836, "global_step": 281573, "epoch": 2327} {"train_loss": -42.60580062866211, "global_step": 281574, "epoch": 2327} {"train_loss": -42.439510345458984, "global_step": 281575, "epoch": 2327} {"train_loss": -40.78793716430664, "global_step": 281576, "epoch": 2327} {"train_loss": -42.237457275390625, "global_step": 281577, "epoch": 2327} {"train_loss": -42.1949577331543, "global_step": 281578, "epoch": 2327} {"train_loss": -41.69296646118164, "global_step": 281579, "epoch": 2327} {"train_loss": -42.69942855834961, "global_step": 281580, "epoch": 2327} {"train_loss": -41.997596740722656, "global_step": 281581, "epoch": 2327} {"train_loss": -42.57609176635742, "global_step": 281582, "epoch": 2327} {"train_loss": -43.145259857177734, "global_step": 281583, "epoch": 2327} {"train_loss": -41.68120574951172, "global_step": 281584, "epoch": 2327} {"train_loss": -43.49119186401367, "global_step": 281585, "epoch": 2327} {"train_loss": -42.63189697265625, "global_step": 281586, "epoch": 2327} {"train_loss": -42.47102355957031, "global_step": 281587, "epoch": 2327} {"train_loss": -43.085208892822266, "global_step": 281588, "epoch": 2327} {"train_loss": -43.1661262512207, "global_step": 281589, "epoch": 2327} {"train_loss": -43.86981964111328, "global_step": 281590, "epoch": 2327} {"train_loss": -43.00879669189453, "global_step": 281591, "epoch": 2327} {"train_loss": -43.45729064941406, "global_step": 281592, "epoch": 2327} {"train_loss": -43.7008056640625, "global_step": 281593, "epoch": 2327} {"train_loss": -43.52006149291992, "global_step": 281594, "epoch": 2327} {"train_loss": -44.074031829833984, "global_step": 281595, "epoch": 2327} {"train_loss": -43.717079162597656, "global_step": 281596, "epoch": 2327} {"train_loss": -43.53582000732422, "global_step": 281597, "epoch": 2327} {"train_loss": -43.76643753051758, "global_step": 281598, "epoch": 2327} {"train_loss": -43.59272003173828, "global_step": 281599, "epoch": 2327} {"train_loss": -43.69145584106445, "global_step": 281600, "epoch": 2327} {"train_loss": -43.44874954223633, "global_step": 281601, "epoch": 2327} {"train_loss": -43.643245697021484, "global_step": 281602, "epoch": 2327} {"train_loss": -43.85670852661133, "global_step": 281603, "epoch": 2327} {"train_loss": -43.89406967163086, "global_step": 281604, "epoch": 2327} {"train_loss": -44.10163497924805, "global_step": 281605, "epoch": 2327} {"train_loss": -43.909664154052734, "global_step": 281606, "epoch": 2327} {"train_loss": -44.00052261352539, "global_step": 281607, "epoch": 2327} {"train_loss": -44.18290328979492, "global_step": 281608, "epoch": 2327} {"train_loss": -43.821495056152344, "global_step": 281609, "epoch": 2327} {"train_loss": -44.08657455444336, "global_step": 281610, "epoch": 2327} {"train_loss": -43.971439361572266, "global_step": 281611, "epoch": 2327} {"train_loss": -44.32216262817383, "global_step": 281612, "epoch": 2327} {"train_loss": -44.0760498046875, "global_step": 281613, "epoch": 2327} {"train_loss": -44.1290283203125, "global_step": 281614, "epoch": 2327} {"train_loss": -44.40727233886719, "global_step": 281615, "epoch": 2327} {"train_loss": -44.10628890991211, "global_step": 281616, "epoch": 2327} {"train_loss": -44.1409912109375, "global_step": 281617, "epoch": 2327} {"train_loss": -44.47379684448242, "global_step": 281618, "epoch": 2327} {"train_loss": -44.276405334472656, "global_step": 281619, "epoch": 2327} {"train_loss": -44.0472297668457, "global_step": 281620, "epoch": 2327} {"train_loss": -44.398555755615234, "global_step": 281621, "epoch": 2327} {"train_loss": -43.854854583740234, "global_step": 281622, "epoch": 2327} {"train_loss": -43.77297592163086, "global_step": 281623, "epoch": 2327} {"train_loss": -43.88983917236328, "global_step": 281624, "epoch": 2327} {"train_loss": -43.57625961303711, "global_step": 281625, "epoch": 2327} {"train_loss": -43.627132415771484, "global_step": 281626, "epoch": 2327} {"train_loss": -44.24109649658203, "global_step": 281627, "epoch": 2327} {"train_loss": -44.02506637573242, "global_step": 281628, "epoch": 2327} {"train_loss": -43.65520095825195, "global_step": 281629, "epoch": 2327} {"train_loss": -43.06312942504883, "global_step": 281630, "epoch": 2327} {"train_loss": -42.75020980834961, "global_step": 281631, "epoch": 2327} {"train_loss": -43.57789993286133, "global_step": 281632, "epoch": 2327} {"train_loss": -44.1268424987793, "global_step": 281633, "epoch": 2327} {"train_loss": -43.091854095458984, "global_step": 281634, "epoch": 2327} {"train_loss": -43.361934661865234, "global_step": 281635, "epoch": 2327} {"train_loss": -43.84425735473633, "global_step": 281636, "epoch": 2327} {"train_loss": -43.3887939453125, "global_step": 281637, "epoch": 2327} {"train_loss": -43.88991165161133, "global_step": 281638, "epoch": 2327} {"train_loss": -43.323699951171875, "global_step": 281639, "epoch": 2327} {"train_loss": -43.67043685913086, "global_step": 281640, "epoch": 2327} {"train_loss": -43.713600158691406, "global_step": 281641, "epoch": 2327} {"train_loss": -43.99141311645508, "global_step": 281642, "epoch": 2327} {"train_loss": -43.838836669921875, "global_step": 281643, "epoch": 2327} {"train_loss": -43.84192657470703, "global_step": 281644, "epoch": 2327} {"train_loss": -43.97239303588867, "global_step": 281645, "epoch": 2327} {"train_loss": -43.584869384765625, "global_step": 281646, "epoch": 2327} {"train_loss": -42.98330307006836, "global_step": 281647, "epoch": 2327} {"train_loss": -43.56123352050781, "global_step": 281648, "epoch": 2327} {"train_loss": -41.97040557861328, "global_step": 281649, "epoch": 2327} {"train_loss": -42.54520797729492, "global_step": 281650, "epoch": 2327} {"train_loss": -42.68622589111328, "global_step": 281651, "epoch": 2327} {"train_loss": -43.743988037109375, "global_step": 281652, "epoch": 2327} {"train_loss": -42.52217483520508, "global_step": 281653, "epoch": 2327} {"train_loss": -43.2966194152832, "global_step": 281654, "epoch": 2327} {"train_loss": -42.27604293823242, "global_step": 281655, "epoch": 2327} {"train_loss": -42.62398910522461, "global_step": 281656, "epoch": 2327} {"train_loss": -41.697994232177734, "global_step": 281657, "epoch": 2327} {"train_loss": -41.70259475708008, "global_step": 281658, "epoch": 2327} {"train_loss": -40.697025299072266, "global_step": 281659, "epoch": 2327} {"train_loss": -40.48211669921875, "global_step": 281660, "epoch": 2327} {"train_loss": -42.324928283691406, "global_step": 281661, "epoch": 2327} {"train_loss": -43.04508590698242, "global_step": 281662, "epoch": 2327} {"train_loss": -41.484642028808594, "global_step": 281663, "epoch": 2327} {"train_loss": -42.59845733642578, "global_step": 281664, "epoch": 2327} {"train_loss": -42.27187728881836, "global_step": 281665, "epoch": 2327} {"train_loss": -41.532554626464844, "global_step": 281666, "epoch": 2327} {"train_loss": -43.150062561035156, "global_step": 281667, "epoch": 2327} {"train_loss": -41.85811996459961, "global_step": 281668, "epoch": 2327} {"train_loss": -42.254981994628906, "global_step": 281669, "epoch": 2327} {"train_loss": -43.00838088989258, "global_step": 281670, "epoch": 2327} {"train_loss": -42.8580207824707, "global_step": 281671, "epoch": 2327} {"train_loss": -42.50527572631836, "global_step": 281672, "epoch": 2327} {"train_loss": -43.38522720336914, "global_step": 281673, "epoch": 2327} {"train_loss": -42.94382858276367, "global_step": 281674, "epoch": 2327} {"train_loss": -42.32170867919922, "global_step": 281675, "epoch": 2327} {"train_loss": -43.215457916259766, "global_step": 281676, "epoch": 2327} {"train_loss": -43.74726486206055, "global_step": 281677, "epoch": 2327} {"train_loss": -43.9387321472168, "global_step": 281678, "epoch": 2327} {"train_loss": -43.52126693725586, "global_step": 281679, "epoch": 2327} {"train_loss": -43.204315185546875, "global_step": 281680, "epoch": 2327} {"train_loss": -43.47774887084961, "global_step": 281681, "epoch": 2327} {"train_loss": -43.41691589355469, "global_step": 281682, "epoch": 2327} {"train_loss": -43.8786506652832, "global_step": 281683, "epoch": 2327} {"train_loss": -43.27560043334961, "global_step": 281684, "epoch": 2327} {"train_loss": -43.768550872802734, "global_step": 281685, "epoch": 2327} {"train_loss": -44.49433135986328, "global_step": 281686, "epoch": 2327} {"train_loss": -43.176317451414, "global_step": 281687, "epoch": 2327, "val_loss": 2490169.25} {"train_loss": -44.14372253417969, "global_step": 281688, "epoch": 2328} {"train_loss": -44.26593017578125, "global_step": 281689, "epoch": 2328} {"train_loss": -44.24787521362305, "global_step": 281690, "epoch": 2328} {"train_loss": -43.950592041015625, "global_step": 281691, "epoch": 2328} {"train_loss": -43.67456817626953, "global_step": 281692, "epoch": 2328} {"train_loss": -44.2586555480957, "global_step": 281693, "epoch": 2328} {"train_loss": -43.896583557128906, "global_step": 281694, "epoch": 2328} {"train_loss": -44.047515869140625, "global_step": 281695, "epoch": 2328} {"train_loss": -43.93416976928711, "global_step": 281696, "epoch": 2328} {"train_loss": -43.574066162109375, "global_step": 281697, "epoch": 2328} {"train_loss": -44.08936309814453, "global_step": 281698, "epoch": 2328} {"train_loss": -44.0265998840332, "global_step": 281699, "epoch": 2328} {"train_loss": -43.801265716552734, "global_step": 281700, "epoch": 2328} {"train_loss": -44.072242736816406, "global_step": 281701, "epoch": 2328} {"train_loss": -44.08905792236328, "global_step": 281702, "epoch": 2328} {"train_loss": -43.7088508605957, "global_step": 281703, "epoch": 2328} {"train_loss": -42.3874626159668, "global_step": 281704, "epoch": 2328} {"train_loss": -42.358516693115234, "global_step": 281705, "epoch": 2328} {"train_loss": -43.76545333862305, "global_step": 281706, "epoch": 2328} {"train_loss": -44.607032775878906, "global_step": 281707, "epoch": 2328} {"train_loss": -42.759368896484375, "global_step": 281708, "epoch": 2328} {"train_loss": -43.05831527709961, "global_step": 281709, "epoch": 2328} {"train_loss": -44.03403854370117, "global_step": 281710, "epoch": 2328} {"train_loss": -44.2960319519043, "global_step": 281711, "epoch": 2328} {"train_loss": -43.165374755859375, "global_step": 281712, "epoch": 2328} {"train_loss": -42.176639556884766, "global_step": 281713, "epoch": 2328} {"train_loss": -43.0059814453125, "global_step": 281714, "epoch": 2328} {"train_loss": -43.3615608215332, "global_step": 281715, "epoch": 2328} {"train_loss": -43.69390106201172, "global_step": 281716, "epoch": 2328} {"train_loss": -44.11289978027344, "global_step": 281717, "epoch": 2328} {"train_loss": -43.430763244628906, "global_step": 281718, "epoch": 2328} {"train_loss": -43.66569137573242, "global_step": 281719, "epoch": 2328} {"train_loss": -44.57355880737305, "global_step": 281720, "epoch": 2328} {"train_loss": -43.77088165283203, "global_step": 281721, "epoch": 2328} {"train_loss": -43.99860382080078, "global_step": 281722, "epoch": 2328} {"train_loss": -44.127960205078125, "global_step": 281723, "epoch": 2328} {"train_loss": -43.79148483276367, "global_step": 281724, "epoch": 2328} {"train_loss": -43.24068832397461, "global_step": 281725, "epoch": 2328} {"train_loss": -43.30963134765625, "global_step": 281726, "epoch": 2328} {"train_loss": -43.592960357666016, "global_step": 281727, "epoch": 2328} {"train_loss": -44.53310012817383, "global_step": 281728, "epoch": 2328} {"train_loss": -43.49314880371094, "global_step": 281729, "epoch": 2328} {"train_loss": -43.22105026245117, "global_step": 281730, "epoch": 2328} {"train_loss": -43.05122375488281, "global_step": 281731, "epoch": 2328} {"train_loss": -43.966102600097656, "global_step": 281732, "epoch": 2328} {"train_loss": -43.813262939453125, "global_step": 281733, "epoch": 2328} {"train_loss": -44.200164794921875, "global_step": 281734, "epoch": 2328} {"train_loss": -43.814666748046875, "global_step": 281735, "epoch": 2328} {"train_loss": -43.783809661865234, "global_step": 281736, "epoch": 2328} {"train_loss": -43.70095443725586, "global_step": 281737, "epoch": 2328} {"train_loss": -43.599544525146484, "global_step": 281738, "epoch": 2328} {"train_loss": -44.18625259399414, "global_step": 281739, "epoch": 2328} {"train_loss": -43.86635208129883, "global_step": 281740, "epoch": 2328} {"train_loss": -43.3428840637207, "global_step": 281741, "epoch": 2328} {"train_loss": -43.31058883666992, "global_step": 281742, "epoch": 2328} {"train_loss": -43.75748825073242, "global_step": 281743, "epoch": 2328} {"train_loss": -43.979835510253906, "global_step": 281744, "epoch": 2328} {"train_loss": -43.83652114868164, "global_step": 281745, "epoch": 2328} {"train_loss": -43.05720901489258, "global_step": 281746, "epoch": 2328} {"train_loss": -42.59834671020508, "global_step": 281747, "epoch": 2328} {"train_loss": -43.36842727661133, "global_step": 281748, "epoch": 2328} {"train_loss": -43.40802764892578, "global_step": 281749, "epoch": 2328} {"train_loss": -42.839874267578125, "global_step": 281750, "epoch": 2328} {"train_loss": -43.563167572021484, "global_step": 281751, "epoch": 2328} {"train_loss": -44.17812728881836, "global_step": 281752, "epoch": 2328} {"train_loss": -43.160133361816406, "global_step": 281753, "epoch": 2328} {"train_loss": -43.24721908569336, "global_step": 281754, "epoch": 2328} {"train_loss": -43.40471649169922, "global_step": 281755, "epoch": 2328} {"train_loss": -42.249691009521484, "global_step": 281756, "epoch": 2328} {"train_loss": -41.358848571777344, "global_step": 281757, "epoch": 2328} {"train_loss": -42.548583984375, "global_step": 281758, "epoch": 2328} {"train_loss": -42.55153274536133, "global_step": 281759, "epoch": 2328} {"train_loss": -43.02302169799805, "global_step": 281760, "epoch": 2328} {"train_loss": -42.402462005615234, "global_step": 281761, "epoch": 2328} {"train_loss": -39.16017532348633, "global_step": 281762, "epoch": 2328} {"train_loss": -42.03782272338867, "global_step": 281763, "epoch": 2328} {"train_loss": -40.53894805908203, "global_step": 281764, "epoch": 2328} {"train_loss": -39.96040344238281, "global_step": 281765, "epoch": 2328} {"train_loss": -39.9176025390625, "global_step": 281766, "epoch": 2328} {"train_loss": -41.36354446411133, "global_step": 281767, "epoch": 2328} {"train_loss": -42.21016311645508, "global_step": 281768, "epoch": 2328} {"train_loss": -41.76753616333008, "global_step": 281769, "epoch": 2328} {"train_loss": -39.01099395751953, "global_step": 281770, "epoch": 2328} {"train_loss": -42.9606819152832, "global_step": 281771, "epoch": 2328} {"train_loss": -42.95812225341797, "global_step": 281772, "epoch": 2328} {"train_loss": -41.62986373901367, "global_step": 281773, "epoch": 2328} {"train_loss": -41.22602844238281, "global_step": 281774, "epoch": 2328} {"train_loss": -42.329158782958984, "global_step": 281775, "epoch": 2328} {"train_loss": -42.614585876464844, "global_step": 281776, "epoch": 2328} {"train_loss": -41.76436233520508, "global_step": 281777, "epoch": 2328} {"train_loss": -38.75053787231445, "global_step": 281778, "epoch": 2328} {"train_loss": -43.44081115722656, "global_step": 281779, "epoch": 2328} {"train_loss": -42.20088195800781, "global_step": 281780, "epoch": 2328} {"train_loss": -42.73649215698242, "global_step": 281781, "epoch": 2328} {"train_loss": -42.536476135253906, "global_step": 281782, "epoch": 2328} {"train_loss": -41.45051574707031, "global_step": 281783, "epoch": 2328} {"train_loss": -41.13389205932617, "global_step": 281784, "epoch": 2328} {"train_loss": -41.91582489013672, "global_step": 281785, "epoch": 2328} {"train_loss": -41.07477569580078, "global_step": 281786, "epoch": 2328} {"train_loss": -41.30929183959961, "global_step": 281787, "epoch": 2328} {"train_loss": -42.85909652709961, "global_step": 281788, "epoch": 2328} {"train_loss": -41.01784896850586, "global_step": 281789, "epoch": 2328} {"train_loss": -40.00418472290039, "global_step": 281790, "epoch": 2328} {"train_loss": -42.95267868041992, "global_step": 281791, "epoch": 2328} {"train_loss": -41.58735275268555, "global_step": 281792, "epoch": 2328} {"train_loss": -39.752872467041016, "global_step": 281793, "epoch": 2328} {"train_loss": -42.553955078125, "global_step": 281794, "epoch": 2328} {"train_loss": -42.185420989990234, "global_step": 281795, "epoch": 2328} {"train_loss": -41.847023010253906, "global_step": 281796, "epoch": 2328} {"train_loss": -43.02891159057617, "global_step": 281797, "epoch": 2328} {"train_loss": -42.01226806640625, "global_step": 281798, "epoch": 2328} {"train_loss": -41.9379997253418, "global_step": 281799, "epoch": 2328} {"train_loss": -42.34223175048828, "global_step": 281800, "epoch": 2328} {"train_loss": -41.93508529663086, "global_step": 281801, "epoch": 2328} {"train_loss": -42.906124114990234, "global_step": 281802, "epoch": 2328} {"train_loss": -41.70351791381836, "global_step": 281803, "epoch": 2328} {"train_loss": -41.171234130859375, "global_step": 281804, "epoch": 2328} {"train_loss": -42.722381591796875, "global_step": 281805, "epoch": 2328} {"train_loss": -42.46562957763672, "global_step": 281806, "epoch": 2328} {"train_loss": -43.29046630859375, "global_step": 281807, "epoch": 2328} {"train_loss": -42.843453588564536, "global_step": 281808, "epoch": 2328, "val_loss": 2477649.75} {"train_loss": -42.12635040283203, "global_step": 281809, "epoch": 2329} {"train_loss": -43.47015380859375, "global_step": 281810, "epoch": 2329} {"train_loss": -42.40550231933594, "global_step": 281811, "epoch": 2329} {"train_loss": -42.800453186035156, "global_step": 281812, "epoch": 2329} {"train_loss": -41.41255569458008, "global_step": 281813, "epoch": 2329} {"train_loss": -42.595130920410156, "global_step": 281814, "epoch": 2329} {"train_loss": -42.572444915771484, "global_step": 281815, "epoch": 2329} {"train_loss": -43.04376983642578, "global_step": 281816, "epoch": 2329} {"train_loss": -41.82423400878906, "global_step": 281817, "epoch": 2329} {"train_loss": -43.172786712646484, "global_step": 281818, "epoch": 2329} {"train_loss": -42.494503021240234, "global_step": 281819, "epoch": 2329} {"train_loss": -43.1546516418457, "global_step": 281820, "epoch": 2329} {"train_loss": -42.57729721069336, "global_step": 281821, "epoch": 2329} {"train_loss": -43.20981979370117, "global_step": 281822, "epoch": 2329} {"train_loss": -42.91096115112305, "global_step": 281823, "epoch": 2329} {"train_loss": -43.3696174621582, "global_step": 281824, "epoch": 2329} {"train_loss": -43.6051025390625, "global_step": 281825, "epoch": 2329} {"train_loss": -41.4102668762207, "global_step": 281826, "epoch": 2329} {"train_loss": -43.46700668334961, "global_step": 281827, "epoch": 2329} {"train_loss": -42.562744140625, "global_step": 281828, "epoch": 2329} {"train_loss": -43.01773452758789, "global_step": 281829, "epoch": 2329} {"train_loss": -43.455467224121094, "global_step": 281830, "epoch": 2329} {"train_loss": -43.44898223876953, "global_step": 281831, "epoch": 2329} {"train_loss": -42.337520599365234, "global_step": 281832, "epoch": 2329} {"train_loss": -43.38340377807617, "global_step": 281833, "epoch": 2329} {"train_loss": -43.6190299987793, "global_step": 281834, "epoch": 2329} {"train_loss": -42.86903762817383, "global_step": 281835, "epoch": 2329} {"train_loss": -42.51485824584961, "global_step": 281836, "epoch": 2329} {"train_loss": -44.00542449951172, "global_step": 281837, "epoch": 2329} {"train_loss": -43.43696594238281, "global_step": 281838, "epoch": 2329} {"train_loss": -43.1348876953125, "global_step": 281839, "epoch": 2329} {"train_loss": -43.50786209106445, "global_step": 281840, "epoch": 2329} {"train_loss": -38.91362380981445, "global_step": 281841, "epoch": 2329} {"train_loss": -37.35211944580078, "global_step": 281842, "epoch": 2329} {"train_loss": -38.863887786865234, "global_step": 281843, "epoch": 2329} {"train_loss": -43.04052734375, "global_step": 281844, "epoch": 2329} {"train_loss": -42.1256103515625, "global_step": 281845, "epoch": 2329} {"train_loss": -42.890682220458984, "global_step": 281846, "epoch": 2329} {"train_loss": -42.70573043823242, "global_step": 281847, "epoch": 2329} {"train_loss": -42.329986572265625, "global_step": 281848, "epoch": 2329} {"train_loss": -39.292442321777344, "global_step": 281849, "epoch": 2329} {"train_loss": -34.49317932128906, "global_step": 281850, "epoch": 2329} {"train_loss": -42.05758285522461, "global_step": 281851, "epoch": 2329} {"train_loss": -37.72344207763672, "global_step": 281852, "epoch": 2329} {"train_loss": -43.2822380065918, "global_step": 281853, "epoch": 2329} {"train_loss": -42.2210807800293, "global_step": 281854, "epoch": 2329} {"train_loss": -40.17695236206055, "global_step": 281855, "epoch": 2329} {"train_loss": -41.33818817138672, "global_step": 281856, "epoch": 2329} {"train_loss": -41.70878219604492, "global_step": 281857, "epoch": 2329} {"train_loss": -41.168704986572266, "global_step": 281858, "epoch": 2329} {"train_loss": -39.17078399658203, "global_step": 281859, "epoch": 2329} {"train_loss": -41.78841018676758, "global_step": 281860, "epoch": 2329} {"train_loss": -39.99699020385742, "global_step": 281861, "epoch": 2329} {"train_loss": -38.53135299682617, "global_step": 281862, "epoch": 2329} {"train_loss": -42.50167465209961, "global_step": 281863, "epoch": 2329} {"train_loss": -41.62166976928711, "global_step": 281864, "epoch": 2329} {"train_loss": -42.08584213256836, "global_step": 281865, "epoch": 2329} {"train_loss": -39.28388214111328, "global_step": 281866, "epoch": 2329} {"train_loss": -41.52520751953125, "global_step": 281867, "epoch": 2329} {"train_loss": -39.84552001953125, "global_step": 281868, "epoch": 2329} {"train_loss": -41.766048431396484, "global_step": 281869, "epoch": 2329} {"train_loss": -41.0700798034668, "global_step": 281870, "epoch": 2329} {"train_loss": -42.457279205322266, "global_step": 281871, "epoch": 2329} {"train_loss": -39.95998764038086, "global_step": 281872, "epoch": 2329} {"train_loss": -40.80710983276367, "global_step": 281873, "epoch": 2329} {"train_loss": -40.65610885620117, "global_step": 281874, "epoch": 2329} {"train_loss": -42.253700256347656, "global_step": 281875, "epoch": 2329} {"train_loss": -41.315589904785156, "global_step": 281876, "epoch": 2329} {"train_loss": -42.110382080078125, "global_step": 281877, "epoch": 2329} {"train_loss": -42.2557487487793, "global_step": 281878, "epoch": 2329} {"train_loss": -41.52602005004883, "global_step": 281879, "epoch": 2329} {"train_loss": -42.09072494506836, "global_step": 281880, "epoch": 2329} {"train_loss": -42.4602165222168, "global_step": 281881, "epoch": 2329} {"train_loss": -40.68229675292969, "global_step": 281882, "epoch": 2329} {"train_loss": -41.7516975402832, "global_step": 281883, "epoch": 2329} {"train_loss": -41.85030746459961, "global_step": 281884, "epoch": 2329} {"train_loss": -42.35480499267578, "global_step": 281885, "epoch": 2329} {"train_loss": -40.58047103881836, "global_step": 281886, "epoch": 2329} {"train_loss": -42.59841537475586, "global_step": 281887, "epoch": 2329} {"train_loss": -42.04121017456055, "global_step": 281888, "epoch": 2329} {"train_loss": -41.906028747558594, "global_step": 281889, "epoch": 2329} {"train_loss": -41.93611145019531, "global_step": 281890, "epoch": 2329} {"train_loss": -41.500633239746094, "global_step": 281891, "epoch": 2329} {"train_loss": -43.56686019897461, "global_step": 281892, "epoch": 2329} {"train_loss": -41.889686584472656, "global_step": 281893, "epoch": 2329} {"train_loss": -42.172664642333984, "global_step": 281894, "epoch": 2329} {"train_loss": -42.661251068115234, "global_step": 281895, "epoch": 2329} {"train_loss": -41.90958023071289, "global_step": 281896, "epoch": 2329} {"train_loss": -41.81545639038086, "global_step": 281897, "epoch": 2329} {"train_loss": -42.68632888793945, "global_step": 281898, "epoch": 2329} {"train_loss": -42.910003662109375, "global_step": 281899, "epoch": 2329} {"train_loss": -42.4343376159668, "global_step": 281900, "epoch": 2329} {"train_loss": -42.45612716674805, "global_step": 281901, "epoch": 2329} {"train_loss": -42.37392807006836, "global_step": 281902, "epoch": 2329} {"train_loss": -43.19514083862305, "global_step": 281903, "epoch": 2329} {"train_loss": -43.364559173583984, "global_step": 281904, "epoch": 2329} {"train_loss": -43.274452209472656, "global_step": 281905, "epoch": 2329} {"train_loss": -43.46030807495117, "global_step": 281906, "epoch": 2329} {"train_loss": -42.62922286987305, "global_step": 281907, "epoch": 2329} {"train_loss": -42.852901458740234, "global_step": 281908, "epoch": 2329} {"train_loss": -43.316307067871094, "global_step": 281909, "epoch": 2329} {"train_loss": -42.88155746459961, "global_step": 281910, "epoch": 2329} {"train_loss": -43.454444885253906, "global_step": 281911, "epoch": 2329} {"train_loss": -42.91048812866211, "global_step": 281912, "epoch": 2329} {"train_loss": -42.80120086669922, "global_step": 281913, "epoch": 2329} {"train_loss": -43.79460525512695, "global_step": 281914, "epoch": 2329} {"train_loss": -42.71200180053711, "global_step": 281915, "epoch": 2329} {"train_loss": -42.89815902709961, "global_step": 281916, "epoch": 2329} {"train_loss": -43.00474166870117, "global_step": 281917, "epoch": 2329} {"train_loss": -43.221710205078125, "global_step": 281918, "epoch": 2329} {"train_loss": -42.920841217041016, "global_step": 281919, "epoch": 2329} {"train_loss": -42.90536117553711, "global_step": 281920, "epoch": 2329} {"train_loss": -43.466121673583984, "global_step": 281921, "epoch": 2329} {"train_loss": -43.39242172241211, "global_step": 281922, "epoch": 2329} {"train_loss": -43.35373306274414, "global_step": 281923, "epoch": 2329} {"train_loss": -43.6240348815918, "global_step": 281924, "epoch": 2329} {"train_loss": -43.45467758178711, "global_step": 281925, "epoch": 2329} {"train_loss": -43.276241302490234, "global_step": 281926, "epoch": 2329} {"train_loss": -43.53984451293945, "global_step": 281927, "epoch": 2329} {"train_loss": -43.954898834228516, "global_step": 281928, "epoch": 2329} {"train_loss": -42.166274015568504, "global_step": 281929, "epoch": 2329, "val_loss": 2404186.0} {"train_loss": -44.117835998535156, "global_step": 281930, "epoch": 2330} {"train_loss": -43.18465805053711, "global_step": 281931, "epoch": 2330} {"train_loss": -41.920318603515625, "global_step": 281932, "epoch": 2330} {"train_loss": -43.216758728027344, "global_step": 281933, "epoch": 2330} {"train_loss": -42.31126022338867, "global_step": 281934, "epoch": 2330} {"train_loss": -42.81232833862305, "global_step": 281935, "epoch": 2330} {"train_loss": -43.410884857177734, "global_step": 281936, "epoch": 2330} {"train_loss": -42.33897018432617, "global_step": 281937, "epoch": 2330} {"train_loss": -43.144439697265625, "global_step": 281938, "epoch": 2330} {"train_loss": -42.841922760009766, "global_step": 281939, "epoch": 2330} {"train_loss": -42.64724349975586, "global_step": 281940, "epoch": 2330} {"train_loss": -43.190467834472656, "global_step": 281941, "epoch": 2330} {"train_loss": -42.7501335144043, "global_step": 281942, "epoch": 2330} {"train_loss": -43.52511215209961, "global_step": 281943, "epoch": 2330} {"train_loss": -42.755367279052734, "global_step": 281944, "epoch": 2330} {"train_loss": -42.203800201416016, "global_step": 281945, "epoch": 2330} {"train_loss": -41.96455001831055, "global_step": 281946, "epoch": 2330} {"train_loss": -41.1013069152832, "global_step": 281947, "epoch": 2330} {"train_loss": -42.51945114135742, "global_step": 281948, "epoch": 2330} {"train_loss": -42.78888702392578, "global_step": 281949, "epoch": 2330} {"train_loss": -42.01264572143555, "global_step": 281950, "epoch": 2330} {"train_loss": -42.82697677612305, "global_step": 281951, "epoch": 2330} {"train_loss": -40.5667610168457, "global_step": 281952, "epoch": 2330} {"train_loss": -42.87188720703125, "global_step": 281953, "epoch": 2330} {"train_loss": -42.7975959777832, "global_step": 281954, "epoch": 2330} {"train_loss": -41.69239044189453, "global_step": 281955, "epoch": 2330} {"train_loss": -42.569801330566406, "global_step": 281956, "epoch": 2330} {"train_loss": -43.23250961303711, "global_step": 281957, "epoch": 2330} {"train_loss": -42.1373405456543, "global_step": 281958, "epoch": 2330} {"train_loss": -43.43953323364258, "global_step": 281959, "epoch": 2330} {"train_loss": -43.67824935913086, "global_step": 281960, "epoch": 2330} {"train_loss": -42.240806579589844, "global_step": 281961, "epoch": 2330} {"train_loss": -41.239627838134766, "global_step": 281962, "epoch": 2330} {"train_loss": -41.791534423828125, "global_step": 281963, "epoch": 2330} {"train_loss": -42.4960823059082, "global_step": 281964, "epoch": 2330} {"train_loss": -42.66620635986328, "global_step": 281965, "epoch": 2330} {"train_loss": -42.590293884277344, "global_step": 281966, "epoch": 2330} {"train_loss": -40.040870666503906, "global_step": 281967, "epoch": 2330} {"train_loss": -42.149723052978516, "global_step": 281968, "epoch": 2330} {"train_loss": -41.776065826416016, "global_step": 281969, "epoch": 2330} {"train_loss": -39.428985595703125, "global_step": 281970, "epoch": 2330} {"train_loss": -38.55923080444336, "global_step": 281971, "epoch": 2330} {"train_loss": -41.97077560424805, "global_step": 281972, "epoch": 2330} {"train_loss": -41.1948127746582, "global_step": 281973, "epoch": 2330} {"train_loss": -41.42832565307617, "global_step": 281974, "epoch": 2330} {"train_loss": -42.68722915649414, "global_step": 281975, "epoch": 2330} {"train_loss": -41.954444885253906, "global_step": 281976, "epoch": 2330} {"train_loss": -42.651004791259766, "global_step": 281977, "epoch": 2330} {"train_loss": -42.41645050048828, "global_step": 281978, "epoch": 2330} {"train_loss": -43.24728012084961, "global_step": 281979, "epoch": 2330} {"train_loss": -42.41978073120117, "global_step": 281980, "epoch": 2330} {"train_loss": -42.881927490234375, "global_step": 281981, "epoch": 2330} {"train_loss": -43.39079284667969, "global_step": 281982, "epoch": 2330} {"train_loss": -42.72468185424805, "global_step": 281983, "epoch": 2330} {"train_loss": -43.58325958251953, "global_step": 281984, "epoch": 2330} {"train_loss": -42.629764556884766, "global_step": 281985, "epoch": 2330} {"train_loss": -42.729122161865234, "global_step": 281986, "epoch": 2330} {"train_loss": -42.958038330078125, "global_step": 281987, "epoch": 2330} {"train_loss": -43.557891845703125, "global_step": 281988, "epoch": 2330} {"train_loss": -43.252685546875, "global_step": 281989, "epoch": 2330} {"train_loss": -42.303524017333984, "global_step": 281990, "epoch": 2330} {"train_loss": -43.49542999267578, "global_step": 281991, "epoch": 2330} {"train_loss": -43.8013916015625, "global_step": 281992, "epoch": 2330} {"train_loss": -43.27170944213867, "global_step": 281993, "epoch": 2330} {"train_loss": -43.57914352416992, "global_step": 281994, "epoch": 2330} {"train_loss": -43.44132995605469, "global_step": 281995, "epoch": 2330} {"train_loss": -43.21637725830078, "global_step": 281996, "epoch": 2330} {"train_loss": -43.13277816772461, "global_step": 281997, "epoch": 2330} {"train_loss": -43.88480758666992, "global_step": 281998, "epoch": 2330} {"train_loss": -43.70481491088867, "global_step": 281999, "epoch": 2330} {"train_loss": -43.439781188964844, "global_step": 282000, "epoch": 2330} {"train_loss": -40.7392692565918, "global_step": 282001, "epoch": 2330} {"train_loss": -43.33570098876953, "global_step": 282002, "epoch": 2330} {"train_loss": -43.752498626708984, "global_step": 282003, "epoch": 2330} {"train_loss": -42.861412048339844, "global_step": 282004, "epoch": 2330} {"train_loss": -43.40970993041992, "global_step": 282005, "epoch": 2330} {"train_loss": -43.85914993286133, "global_step": 282006, "epoch": 2330} {"train_loss": -43.82487869262695, "global_step": 282007, "epoch": 2330} {"train_loss": -43.57790756225586, "global_step": 282008, "epoch": 2330} {"train_loss": -43.924617767333984, "global_step": 282009, "epoch": 2330} {"train_loss": -43.905029296875, "global_step": 282010, "epoch": 2330} {"train_loss": -44.489742279052734, "global_step": 282011, "epoch": 2330} {"train_loss": -43.94894790649414, "global_step": 282012, "epoch": 2330} {"train_loss": -43.460758209228516, "global_step": 282013, "epoch": 2330} {"train_loss": -44.13725662231445, "global_step": 282014, "epoch": 2330} {"train_loss": -44.09994125366211, "global_step": 282015, "epoch": 2330} {"train_loss": -43.62336730957031, "global_step": 282016, "epoch": 2330} {"train_loss": -44.3398323059082, "global_step": 282017, "epoch": 2330} {"train_loss": -44.32583999633789, "global_step": 282018, "epoch": 2330} {"train_loss": -44.355037689208984, "global_step": 282019, "epoch": 2330} {"train_loss": -43.89539337158203, "global_step": 282020, "epoch": 2330} {"train_loss": -44.115142822265625, "global_step": 282021, "epoch": 2330} {"train_loss": -44.27036666870117, "global_step": 282022, "epoch": 2330} {"train_loss": -44.381771087646484, "global_step": 282023, "epoch": 2330} {"train_loss": -44.31899642944336, "global_step": 282024, "epoch": 2330} {"train_loss": -44.3328971862793, "global_step": 282025, "epoch": 2330} {"train_loss": -43.83488845825195, "global_step": 282026, "epoch": 2330} {"train_loss": -43.97761154174805, "global_step": 282027, "epoch": 2330} {"train_loss": -44.02012252807617, "global_step": 282028, "epoch": 2330} {"train_loss": -43.9160270690918, "global_step": 282029, "epoch": 2330} {"train_loss": -44.26555252075195, "global_step": 282030, "epoch": 2330} {"train_loss": -43.90415954589844, "global_step": 282031, "epoch": 2330} {"train_loss": -43.713008880615234, "global_step": 282032, "epoch": 2330} {"train_loss": -41.753910064697266, "global_step": 282033, "epoch": 2330} {"train_loss": -40.18901443481445, "global_step": 282034, "epoch": 2330} {"train_loss": -43.02187728881836, "global_step": 282035, "epoch": 2330} {"train_loss": -43.7640495300293, "global_step": 282036, "epoch": 2330} {"train_loss": -44.482093811035156, "global_step": 282037, "epoch": 2330} {"train_loss": -41.673622131347656, "global_step": 282038, "epoch": 2330} {"train_loss": -40.76361083984375, "global_step": 282039, "epoch": 2330} {"train_loss": -41.94824981689453, "global_step": 282040, "epoch": 2330} {"train_loss": -43.162628173828125, "global_step": 282041, "epoch": 2330} {"train_loss": -44.02524185180664, "global_step": 282042, "epoch": 2330} {"train_loss": -41.39857864379883, "global_step": 282043, "epoch": 2330} {"train_loss": -41.728755950927734, "global_step": 282044, "epoch": 2330} {"train_loss": -44.159034729003906, "global_step": 282045, "epoch": 2330} {"train_loss": -42.96168899536133, "global_step": 282046, "epoch": 2330} {"train_loss": -42.39216232299805, "global_step": 282047, "epoch": 2330} {"train_loss": -43.671630859375, "global_step": 282048, "epoch": 2330} {"train_loss": -43.72613525390625, "global_step": 282049, "epoch": 2330} {"train_loss": -42.91288842445563, "global_step": 282050, "epoch": 2330, "val_loss": 2450262.0} {"train_loss": -43.8748664855957, "global_step": 282051, "epoch": 2331} {"train_loss": -42.857093811035156, "global_step": 282052, "epoch": 2331} {"train_loss": -41.315704345703125, "global_step": 282053, "epoch": 2331} {"train_loss": -43.179412841796875, "global_step": 282054, "epoch": 2331} {"train_loss": -43.11164855957031, "global_step": 282055, "epoch": 2331} {"train_loss": -42.22515869140625, "global_step": 282056, "epoch": 2331} {"train_loss": -43.5782585144043, "global_step": 282057, "epoch": 2331} {"train_loss": -42.1904411315918, "global_step": 282058, "epoch": 2331} {"train_loss": -41.942718505859375, "global_step": 282059, "epoch": 2331} {"train_loss": -43.16016387939453, "global_step": 282060, "epoch": 2331} {"train_loss": -41.77485275268555, "global_step": 282061, "epoch": 2331} {"train_loss": -41.659664154052734, "global_step": 282062, "epoch": 2331} {"train_loss": -38.79429626464844, "global_step": 282063, "epoch": 2331} {"train_loss": -40.398345947265625, "global_step": 282064, "epoch": 2331} {"train_loss": -42.959964752197266, "global_step": 282065, "epoch": 2331} {"train_loss": -42.09870529174805, "global_step": 282066, "epoch": 2331} {"train_loss": -39.187557220458984, "global_step": 282067, "epoch": 2331} {"train_loss": -40.754024505615234, "global_step": 282068, "epoch": 2331} {"train_loss": -42.11042022705078, "global_step": 282069, "epoch": 2331} {"train_loss": -41.9535026550293, "global_step": 282070, "epoch": 2331} {"train_loss": -41.30817794799805, "global_step": 282071, "epoch": 2331} {"train_loss": -41.31816101074219, "global_step": 282072, "epoch": 2331} {"train_loss": -40.713844299316406, "global_step": 282073, "epoch": 2331} {"train_loss": -42.7342643737793, "global_step": 282074, "epoch": 2331} {"train_loss": -41.27817153930664, "global_step": 282075, "epoch": 2331} {"train_loss": -41.63701248168945, "global_step": 282076, "epoch": 2331} {"train_loss": -41.85539627075195, "global_step": 282077, "epoch": 2331} {"train_loss": -42.151756286621094, "global_step": 282078, "epoch": 2331} {"train_loss": -41.5609016418457, "global_step": 282079, "epoch": 2331} {"train_loss": -39.8656120300293, "global_step": 282080, "epoch": 2331} {"train_loss": -39.82666778564453, "global_step": 282081, "epoch": 2331} {"train_loss": -39.77924728393555, "global_step": 282082, "epoch": 2331} {"train_loss": -40.576690673828125, "global_step": 282083, "epoch": 2331} {"train_loss": -38.98298263549805, "global_step": 282084, "epoch": 2331} {"train_loss": -40.67324447631836, "global_step": 282085, "epoch": 2331} {"train_loss": -39.832820892333984, "global_step": 282086, "epoch": 2331} {"train_loss": -38.91630935668945, "global_step": 282087, "epoch": 2331} {"train_loss": -38.94447708129883, "global_step": 282088, "epoch": 2331} {"train_loss": -41.99752426147461, "global_step": 282089, "epoch": 2331} {"train_loss": -39.97488021850586, "global_step": 282090, "epoch": 2331} {"train_loss": -42.15009307861328, "global_step": 282091, "epoch": 2331} {"train_loss": -40.63514709472656, "global_step": 282092, "epoch": 2331} {"train_loss": -41.23666000366211, "global_step": 282093, "epoch": 2331} {"train_loss": -42.013824462890625, "global_step": 282094, "epoch": 2331} {"train_loss": -40.525428771972656, "global_step": 282095, "epoch": 2331} {"train_loss": -42.01275634765625, "global_step": 282096, "epoch": 2331} {"train_loss": -40.87592697143555, "global_step": 282097, "epoch": 2331} {"train_loss": -42.40387725830078, "global_step": 282098, "epoch": 2331} {"train_loss": -42.76755142211914, "global_step": 282099, "epoch": 2331} {"train_loss": -42.202083587646484, "global_step": 282100, "epoch": 2331} {"train_loss": -42.66175079345703, "global_step": 282101, "epoch": 2331} {"train_loss": -41.533447265625, "global_step": 282102, "epoch": 2331} {"train_loss": -42.59107208251953, "global_step": 282103, "epoch": 2331} {"train_loss": -42.85775375366211, "global_step": 282104, "epoch": 2331} {"train_loss": -42.32563400268555, "global_step": 282105, "epoch": 2331} {"train_loss": -43.17327880859375, "global_step": 282106, "epoch": 2331} {"train_loss": -41.844791412353516, "global_step": 282107, "epoch": 2331} {"train_loss": -42.976966857910156, "global_step": 282108, "epoch": 2331} {"train_loss": -42.824501037597656, "global_step": 282109, "epoch": 2331} {"train_loss": -43.05839920043945, "global_step": 282110, "epoch": 2331} {"train_loss": -42.86049270629883, "global_step": 282111, "epoch": 2331} {"train_loss": -43.10972213745117, "global_step": 282112, "epoch": 2331} {"train_loss": -43.33379364013672, "global_step": 282113, "epoch": 2331} {"train_loss": -43.308807373046875, "global_step": 282114, "epoch": 2331} {"train_loss": -43.57646560668945, "global_step": 282115, "epoch": 2331} {"train_loss": -43.210044860839844, "global_step": 282116, "epoch": 2331} {"train_loss": -43.591796875, "global_step": 282117, "epoch": 2331} {"train_loss": -43.13859176635742, "global_step": 282118, "epoch": 2331} {"train_loss": -43.70622253417969, "global_step": 282119, "epoch": 2331} {"train_loss": -43.35313034057617, "global_step": 282120, "epoch": 2331} {"train_loss": -43.395484924316406, "global_step": 282121, "epoch": 2331} {"train_loss": -43.779144287109375, "global_step": 282122, "epoch": 2331} {"train_loss": -43.543697357177734, "global_step": 282123, "epoch": 2331} {"train_loss": -43.60630798339844, "global_step": 282124, "epoch": 2331} {"train_loss": -44.04574203491211, "global_step": 282125, "epoch": 2331} {"train_loss": -44.02455520629883, "global_step": 282126, "epoch": 2331} {"train_loss": -43.29941940307617, "global_step": 282127, "epoch": 2331} {"train_loss": -43.74794387817383, "global_step": 282128, "epoch": 2331} {"train_loss": -43.4412727355957, "global_step": 282129, "epoch": 2331} {"train_loss": -43.36993408203125, "global_step": 282130, "epoch": 2331} {"train_loss": -43.67866897583008, "global_step": 282131, "epoch": 2331} {"train_loss": -43.74318313598633, "global_step": 282132, "epoch": 2331} {"train_loss": -43.74452590942383, "global_step": 282133, "epoch": 2331} {"train_loss": -44.379150390625, "global_step": 282134, "epoch": 2331} {"train_loss": -43.98637008666992, "global_step": 282135, "epoch": 2331} {"train_loss": -43.65353012084961, "global_step": 282136, "epoch": 2331} {"train_loss": -44.272850036621094, "global_step": 282137, "epoch": 2331} {"train_loss": -44.31716537475586, "global_step": 282138, "epoch": 2331} {"train_loss": -44.086463928222656, "global_step": 282139, "epoch": 2331} {"train_loss": -43.6981315612793, "global_step": 282140, "epoch": 2331} {"train_loss": -44.001216888427734, "global_step": 282141, "epoch": 2331} {"train_loss": -44.411842346191406, "global_step": 282142, "epoch": 2331} {"train_loss": -44.35866165161133, "global_step": 282143, "epoch": 2331} {"train_loss": -43.90476989746094, "global_step": 282144, "epoch": 2331} {"train_loss": -44.126033782958984, "global_step": 282145, "epoch": 2331} {"train_loss": -44.01567077636719, "global_step": 282146, "epoch": 2331} {"train_loss": -43.90864944458008, "global_step": 282147, "epoch": 2331} {"train_loss": -43.97366714477539, "global_step": 282148, "epoch": 2331} {"train_loss": -44.579593658447266, "global_step": 282149, "epoch": 2331} {"train_loss": -43.328514099121094, "global_step": 282150, "epoch": 2331} {"train_loss": -44.04695510864258, "global_step": 282151, "epoch": 2331} {"train_loss": -44.59355545043945, "global_step": 282152, "epoch": 2331} {"train_loss": -43.652957916259766, "global_step": 282153, "epoch": 2331} {"train_loss": -44.19875717163086, "global_step": 282154, "epoch": 2331} {"train_loss": -44.184120178222656, "global_step": 282155, "epoch": 2331} {"train_loss": -43.9411735534668, "global_step": 282156, "epoch": 2331} {"train_loss": -43.77200698852539, "global_step": 282157, "epoch": 2331} {"train_loss": -43.30295181274414, "global_step": 282158, "epoch": 2331} {"train_loss": -43.5148811340332, "global_step": 282159, "epoch": 2331} {"train_loss": -43.1453742980957, "global_step": 282160, "epoch": 2331} {"train_loss": -43.4150276184082, "global_step": 282161, "epoch": 2331} {"train_loss": -43.73572540283203, "global_step": 282162, "epoch": 2331} {"train_loss": -41.78162384033203, "global_step": 282163, "epoch": 2331} {"train_loss": -41.369319915771484, "global_step": 282164, "epoch": 2331} {"train_loss": -42.85026931762695, "global_step": 282165, "epoch": 2331} {"train_loss": -43.09735107421875, "global_step": 282166, "epoch": 2331} {"train_loss": -43.40281677246094, "global_step": 282167, "epoch": 2331} {"train_loss": -42.47425842285156, "global_step": 282168, "epoch": 2331} {"train_loss": -41.68647003173828, "global_step": 282169, "epoch": 2331} {"train_loss": -43.16450881958008, "global_step": 282170, "epoch": 2331} {"train_loss": -42.59378225153143, "global_step": 282171, "epoch": 2331, "val_loss": 2455106.75} {"train_loss": -43.3831672668457, "global_step": 282172, "epoch": 2332} {"train_loss": -42.913818359375, "global_step": 282173, "epoch": 2332} {"train_loss": -41.538753509521484, "global_step": 282174, "epoch": 2332} {"train_loss": -40.500396728515625, "global_step": 282175, "epoch": 2332} {"train_loss": -43.06391143798828, "global_step": 282176, "epoch": 2332} {"train_loss": -41.2985954284668, "global_step": 282177, "epoch": 2332} {"train_loss": -40.714027404785156, "global_step": 282178, "epoch": 2332} {"train_loss": -40.11367416381836, "global_step": 282179, "epoch": 2332} {"train_loss": -43.179901123046875, "global_step": 282180, "epoch": 2332} {"train_loss": -41.85901641845703, "global_step": 282181, "epoch": 2332} {"train_loss": -39.59186935424805, "global_step": 282182, "epoch": 2332} {"train_loss": -43.30527877807617, "global_step": 282183, "epoch": 2332} {"train_loss": -42.38075637817383, "global_step": 282184, "epoch": 2332} {"train_loss": -42.067012786865234, "global_step": 282185, "epoch": 2332} {"train_loss": -43.330604553222656, "global_step": 282186, "epoch": 2332} {"train_loss": -41.68546676635742, "global_step": 282187, "epoch": 2332} {"train_loss": -42.60196304321289, "global_step": 282188, "epoch": 2332} {"train_loss": -42.93870162963867, "global_step": 282189, "epoch": 2332} {"train_loss": -42.407711029052734, "global_step": 282190, "epoch": 2332} {"train_loss": -43.04729080200195, "global_step": 282191, "epoch": 2332} {"train_loss": -42.54209518432617, "global_step": 282192, "epoch": 2332} {"train_loss": -42.8839111328125, "global_step": 282193, "epoch": 2332} {"train_loss": -43.527549743652344, "global_step": 282194, "epoch": 2332} {"train_loss": -42.616363525390625, "global_step": 282195, "epoch": 2332} {"train_loss": -40.98435974121094, "global_step": 282196, "epoch": 2332} {"train_loss": -43.5197868347168, "global_step": 282197, "epoch": 2332} {"train_loss": -41.57253646850586, "global_step": 282198, "epoch": 2332} {"train_loss": -42.257381439208984, "global_step": 282199, "epoch": 2332} {"train_loss": -42.71712112426758, "global_step": 282200, "epoch": 2332} {"train_loss": -42.72188949584961, "global_step": 282201, "epoch": 2332} {"train_loss": -42.1515007019043, "global_step": 282202, "epoch": 2332} {"train_loss": -43.46140670776367, "global_step": 282203, "epoch": 2332} {"train_loss": -42.93009567260742, "global_step": 282204, "epoch": 2332} {"train_loss": -42.563690185546875, "global_step": 282205, "epoch": 2332} {"train_loss": -43.8589973449707, "global_step": 282206, "epoch": 2332} {"train_loss": -43.22708511352539, "global_step": 282207, "epoch": 2332} {"train_loss": -43.17170333862305, "global_step": 282208, "epoch": 2332} {"train_loss": -43.528656005859375, "global_step": 282209, "epoch": 2332} {"train_loss": -43.54015350341797, "global_step": 282210, "epoch": 2332} {"train_loss": -43.1390380859375, "global_step": 282211, "epoch": 2332} {"train_loss": -43.27812576293945, "global_step": 282212, "epoch": 2332} {"train_loss": -42.9565315246582, "global_step": 282213, "epoch": 2332} {"train_loss": -43.13784408569336, "global_step": 282214, "epoch": 2332} {"train_loss": -43.57284164428711, "global_step": 282215, "epoch": 2332} {"train_loss": -43.15106201171875, "global_step": 282216, "epoch": 2332} {"train_loss": -43.460914611816406, "global_step": 282217, "epoch": 2332} {"train_loss": -43.5726203918457, "global_step": 282218, "epoch": 2332} {"train_loss": -43.83641815185547, "global_step": 282219, "epoch": 2332} {"train_loss": -43.253318786621094, "global_step": 282220, "epoch": 2332} {"train_loss": -43.93136215209961, "global_step": 282221, "epoch": 2332} {"train_loss": -44.15718460083008, "global_step": 282222, "epoch": 2332} {"train_loss": -43.824676513671875, "global_step": 282223, "epoch": 2332} {"train_loss": -43.72650146484375, "global_step": 282224, "epoch": 2332} {"train_loss": -42.932884216308594, "global_step": 282225, "epoch": 2332} {"train_loss": -43.59346008300781, "global_step": 282226, "epoch": 2332} {"train_loss": -44.07479476928711, "global_step": 282227, "epoch": 2332} {"train_loss": -42.68825912475586, "global_step": 282228, "epoch": 2332} {"train_loss": -43.63044357299805, "global_step": 282229, "epoch": 2332} {"train_loss": -43.27525329589844, "global_step": 282230, "epoch": 2332} {"train_loss": -43.425960540771484, "global_step": 282231, "epoch": 2332} {"train_loss": -43.59162521362305, "global_step": 282232, "epoch": 2332} {"train_loss": -42.64487838745117, "global_step": 282233, "epoch": 2332} {"train_loss": -43.85151290893555, "global_step": 282234, "epoch": 2332} {"train_loss": -42.936668395996094, "global_step": 282235, "epoch": 2332} {"train_loss": -41.57029724121094, "global_step": 282236, "epoch": 2332} {"train_loss": -42.498046875, "global_step": 282237, "epoch": 2332} {"train_loss": -42.71818161010742, "global_step": 282238, "epoch": 2332} {"train_loss": -42.125762939453125, "global_step": 282239, "epoch": 2332} {"train_loss": -42.02480697631836, "global_step": 282240, "epoch": 2332} {"train_loss": -43.33388137817383, "global_step": 282241, "epoch": 2332} {"train_loss": -42.363494873046875, "global_step": 282242, "epoch": 2332} {"train_loss": -42.865142822265625, "global_step": 282243, "epoch": 2332} {"train_loss": -42.5511360168457, "global_step": 282244, "epoch": 2332} {"train_loss": -42.98746871948242, "global_step": 282245, "epoch": 2332} {"train_loss": -43.0357780456543, "global_step": 282246, "epoch": 2332} {"train_loss": -42.206783294677734, "global_step": 282247, "epoch": 2332} {"train_loss": -43.41815185546875, "global_step": 282248, "epoch": 2332} {"train_loss": -42.319183349609375, "global_step": 282249, "epoch": 2332} {"train_loss": -43.69076156616211, "global_step": 282250, "epoch": 2332} {"train_loss": -43.42344284057617, "global_step": 282251, "epoch": 2332} {"train_loss": -43.43381881713867, "global_step": 282252, "epoch": 2332} {"train_loss": -43.41685104370117, "global_step": 282253, "epoch": 2332} {"train_loss": -43.56730651855469, "global_step": 282254, "epoch": 2332} {"train_loss": -43.05170822143555, "global_step": 282255, "epoch": 2332} {"train_loss": -43.308509826660156, "global_step": 282256, "epoch": 2332} {"train_loss": -42.754981994628906, "global_step": 282257, "epoch": 2332} {"train_loss": -43.72362518310547, "global_step": 282258, "epoch": 2332} {"train_loss": -43.25712966918945, "global_step": 282259, "epoch": 2332} {"train_loss": -43.792816162109375, "global_step": 282260, "epoch": 2332} {"train_loss": -43.146888732910156, "global_step": 282261, "epoch": 2332} {"train_loss": -43.99815368652344, "global_step": 282262, "epoch": 2332} {"train_loss": -43.453102111816406, "global_step": 282263, "epoch": 2332} {"train_loss": -44.223819732666016, "global_step": 282264, "epoch": 2332} {"train_loss": -43.49393844604492, "global_step": 282265, "epoch": 2332} {"train_loss": -44.14842224121094, "global_step": 282266, "epoch": 2332} {"train_loss": -43.52488327026367, "global_step": 282267, "epoch": 2332} {"train_loss": -43.504051208496094, "global_step": 282268, "epoch": 2332} {"train_loss": -43.29417037963867, "global_step": 282269, "epoch": 2332} {"train_loss": -44.045143127441406, "global_step": 282270, "epoch": 2332} {"train_loss": -43.81985092163086, "global_step": 282271, "epoch": 2332} {"train_loss": -43.76958465576172, "global_step": 282272, "epoch": 2332} {"train_loss": -43.55951690673828, "global_step": 282273, "epoch": 2332} {"train_loss": -43.647518157958984, "global_step": 282274, "epoch": 2332} {"train_loss": -44.05642318725586, "global_step": 282275, "epoch": 2332} {"train_loss": -44.14394760131836, "global_step": 282276, "epoch": 2332} {"train_loss": -44.02921676635742, "global_step": 282277, "epoch": 2332} {"train_loss": -44.30489730834961, "global_step": 282278, "epoch": 2332} {"train_loss": -43.92401885986328, "global_step": 282279, "epoch": 2332} {"train_loss": -44.17182540893555, "global_step": 282280, "epoch": 2332} {"train_loss": -43.9797477722168, "global_step": 282281, "epoch": 2332} {"train_loss": -43.49879455566406, "global_step": 282282, "epoch": 2332} {"train_loss": -44.18037796020508, "global_step": 282283, "epoch": 2332} {"train_loss": -44.141510009765625, "global_step": 282284, "epoch": 2332} {"train_loss": -43.7874755859375, "global_step": 282285, "epoch": 2332} {"train_loss": -43.505489349365234, "global_step": 282286, "epoch": 2332} {"train_loss": -43.533931732177734, "global_step": 282287, "epoch": 2332} {"train_loss": -44.65355682373047, "global_step": 282288, "epoch": 2332} {"train_loss": -42.63393020629883, "global_step": 282289, "epoch": 2332} {"train_loss": -43.4287109375, "global_step": 282290, "epoch": 2332} {"train_loss": -43.46001052856445, "global_step": 282291, "epoch": 2332} {"train_loss": -43.10428865290871, "global_step": 282292, "epoch": 2332, "val_loss": 2409469.75} {"train_loss": -44.43548583984375, "global_step": 282293, "epoch": 2333} {"train_loss": -43.25985336303711, "global_step": 282294, "epoch": 2333} {"train_loss": -40.068267822265625, "global_step": 282295, "epoch": 2333} {"train_loss": -40.98777389526367, "global_step": 282296, "epoch": 2333} {"train_loss": -42.132667541503906, "global_step": 282297, "epoch": 2333} {"train_loss": -43.22764205932617, "global_step": 282298, "epoch": 2333} {"train_loss": -41.97414016723633, "global_step": 282299, "epoch": 2333} {"train_loss": -40.1548957824707, "global_step": 282300, "epoch": 2333} {"train_loss": -42.245849609375, "global_step": 282301, "epoch": 2333} {"train_loss": -41.34077835083008, "global_step": 282302, "epoch": 2333} {"train_loss": -43.31007766723633, "global_step": 282303, "epoch": 2333} {"train_loss": -42.65938186645508, "global_step": 282304, "epoch": 2333} {"train_loss": -41.599708557128906, "global_step": 282305, "epoch": 2333} {"train_loss": -42.73400115966797, "global_step": 282306, "epoch": 2333} {"train_loss": -43.78907012939453, "global_step": 282307, "epoch": 2333} {"train_loss": -42.26203536987305, "global_step": 282308, "epoch": 2333} {"train_loss": -42.2641487121582, "global_step": 282309, "epoch": 2333} {"train_loss": -42.404876708984375, "global_step": 282310, "epoch": 2333} {"train_loss": -42.69021224975586, "global_step": 282311, "epoch": 2333} {"train_loss": -42.45856475830078, "global_step": 282312, "epoch": 2333} {"train_loss": -44.31367874145508, "global_step": 282313, "epoch": 2333} {"train_loss": -43.172706604003906, "global_step": 282314, "epoch": 2333} {"train_loss": -42.77765655517578, "global_step": 282315, "epoch": 2333} {"train_loss": -43.64266586303711, "global_step": 282316, "epoch": 2333} {"train_loss": -43.55335235595703, "global_step": 282317, "epoch": 2333} {"train_loss": -43.7962760925293, "global_step": 282318, "epoch": 2333} {"train_loss": -43.63533020019531, "global_step": 282319, "epoch": 2333} {"train_loss": -43.282691955566406, "global_step": 282320, "epoch": 2333} {"train_loss": -42.8106575012207, "global_step": 282321, "epoch": 2333} {"train_loss": -42.577796936035156, "global_step": 282322, "epoch": 2333} {"train_loss": -42.85380554199219, "global_step": 282323, "epoch": 2333} {"train_loss": -43.51343536376953, "global_step": 282324, "epoch": 2333} {"train_loss": -43.601009368896484, "global_step": 282325, "epoch": 2333} {"train_loss": -42.14401626586914, "global_step": 282326, "epoch": 2333} {"train_loss": -43.1141471862793, "global_step": 282327, "epoch": 2333} {"train_loss": -43.31220626831055, "global_step": 282328, "epoch": 2333} {"train_loss": -43.054527282714844, "global_step": 282329, "epoch": 2333} {"train_loss": -43.633785247802734, "global_step": 282330, "epoch": 2333} {"train_loss": -42.097801208496094, "global_step": 282331, "epoch": 2333} {"train_loss": -43.883811950683594, "global_step": 282332, "epoch": 2333} {"train_loss": -43.01372528076172, "global_step": 282333, "epoch": 2333} {"train_loss": -42.49039840698242, "global_step": 282334, "epoch": 2333} {"train_loss": -43.560523986816406, "global_step": 282335, "epoch": 2333} {"train_loss": -43.058563232421875, "global_step": 282336, "epoch": 2333} {"train_loss": -42.580841064453125, "global_step": 282337, "epoch": 2333} {"train_loss": -43.70656967163086, "global_step": 282338, "epoch": 2333} {"train_loss": -43.50178909301758, "global_step": 282339, "epoch": 2333} {"train_loss": -43.08927536010742, "global_step": 282340, "epoch": 2333} {"train_loss": -43.70063781738281, "global_step": 282341, "epoch": 2333} {"train_loss": -42.82244873046875, "global_step": 282342, "epoch": 2333} {"train_loss": -43.52797317504883, "global_step": 282343, "epoch": 2333} {"train_loss": -41.647891998291016, "global_step": 282344, "epoch": 2333} {"train_loss": -40.70853805541992, "global_step": 282345, "epoch": 2333} {"train_loss": -42.39210891723633, "global_step": 282346, "epoch": 2333} {"train_loss": -43.101863861083984, "global_step": 282347, "epoch": 2333} {"train_loss": -41.06143569946289, "global_step": 282348, "epoch": 2333} {"train_loss": -41.3211784362793, "global_step": 282349, "epoch": 2333} {"train_loss": -43.286067962646484, "global_step": 282350, "epoch": 2333} {"train_loss": -41.35923385620117, "global_step": 282351, "epoch": 2333} {"train_loss": -42.478858947753906, "global_step": 282352, "epoch": 2333} {"train_loss": -42.660770416259766, "global_step": 282353, "epoch": 2333} {"train_loss": -41.862388610839844, "global_step": 282354, "epoch": 2333} {"train_loss": -43.041622161865234, "global_step": 282355, "epoch": 2333} {"train_loss": -41.49662399291992, "global_step": 282356, "epoch": 2333} {"train_loss": -39.68885040283203, "global_step": 282357, "epoch": 2333} {"train_loss": -41.6200065612793, "global_step": 282358, "epoch": 2333} {"train_loss": -42.12383270263672, "global_step": 282359, "epoch": 2333} {"train_loss": -39.46588897705078, "global_step": 282360, "epoch": 2333} {"train_loss": -42.334259033203125, "global_step": 282361, "epoch": 2333} {"train_loss": -41.80177688598633, "global_step": 282362, "epoch": 2333} {"train_loss": -41.25818634033203, "global_step": 282363, "epoch": 2333} {"train_loss": -41.98878860473633, "global_step": 282364, "epoch": 2333} {"train_loss": -41.0336799621582, "global_step": 282365, "epoch": 2333} {"train_loss": -42.41587448120117, "global_step": 282366, "epoch": 2333} {"train_loss": -43.03055953979492, "global_step": 282367, "epoch": 2333} {"train_loss": -43.055904388427734, "global_step": 282368, "epoch": 2333} {"train_loss": -42.54014205932617, "global_step": 282369, "epoch": 2333} {"train_loss": -43.40208053588867, "global_step": 282370, "epoch": 2333} {"train_loss": -43.057865142822266, "global_step": 282371, "epoch": 2333} {"train_loss": -43.2309684753418, "global_step": 282372, "epoch": 2333} {"train_loss": -42.45984649658203, "global_step": 282373, "epoch": 2333} {"train_loss": -42.07831954956055, "global_step": 282374, "epoch": 2333} {"train_loss": -43.34745407104492, "global_step": 282375, "epoch": 2333} {"train_loss": -43.2861328125, "global_step": 282376, "epoch": 2333} {"train_loss": -43.13507843017578, "global_step": 282377, "epoch": 2333} {"train_loss": -43.60137176513672, "global_step": 282378, "epoch": 2333} {"train_loss": -43.02028274536133, "global_step": 282379, "epoch": 2333} {"train_loss": -43.75173568725586, "global_step": 282380, "epoch": 2333} {"train_loss": -43.0915641784668, "global_step": 282381, "epoch": 2333} {"train_loss": -43.120765686035156, "global_step": 282382, "epoch": 2333} {"train_loss": -43.06679916381836, "global_step": 282383, "epoch": 2333} {"train_loss": -43.83571243286133, "global_step": 282384, "epoch": 2333} {"train_loss": -43.33891677856445, "global_step": 282385, "epoch": 2333} {"train_loss": -43.75235366821289, "global_step": 282386, "epoch": 2333} {"train_loss": -43.98933792114258, "global_step": 282387, "epoch": 2333} {"train_loss": -43.71342849731445, "global_step": 282388, "epoch": 2333} {"train_loss": -43.616432189941406, "global_step": 282389, "epoch": 2333} {"train_loss": -43.899261474609375, "global_step": 282390, "epoch": 2333} {"train_loss": -43.584938049316406, "global_step": 282391, "epoch": 2333} {"train_loss": -43.820858001708984, "global_step": 282392, "epoch": 2333} {"train_loss": -43.992454528808594, "global_step": 282393, "epoch": 2333} {"train_loss": -43.01052474975586, "global_step": 282394, "epoch": 2333} {"train_loss": -43.84708786010742, "global_step": 282395, "epoch": 2333} {"train_loss": -43.199928283691406, "global_step": 282396, "epoch": 2333} {"train_loss": -43.745174407958984, "global_step": 282397, "epoch": 2333} {"train_loss": -42.78398895263672, "global_step": 282398, "epoch": 2333} {"train_loss": -43.57419967651367, "global_step": 282399, "epoch": 2333} {"train_loss": -43.25764846801758, "global_step": 282400, "epoch": 2333} {"train_loss": -43.476253509521484, "global_step": 282401, "epoch": 2333} {"train_loss": -44.11189651489258, "global_step": 282402, "epoch": 2333} {"train_loss": -43.85512924194336, "global_step": 282403, "epoch": 2333} {"train_loss": -43.86969757080078, "global_step": 282404, "epoch": 2333} {"train_loss": -44.13032531738281, "global_step": 282405, "epoch": 2333} {"train_loss": -43.918792724609375, "global_step": 282406, "epoch": 2333} {"train_loss": -43.614803314208984, "global_step": 282407, "epoch": 2333} {"train_loss": -43.889862060546875, "global_step": 282408, "epoch": 2333} {"train_loss": -44.00958251953125, "global_step": 282409, "epoch": 2333} {"train_loss": -44.16123580932617, "global_step": 282410, "epoch": 2333} {"train_loss": -43.28534698486328, "global_step": 282411, "epoch": 2333} {"train_loss": -44.0914306640625, "global_step": 282412, "epoch": 2333} {"train_loss": -42.88798031137009, "global_step": 282413, "epoch": 2333, "val_loss": 2448951.0} {"train_loss": -40.619815826416016, "global_step": 282414, "epoch": 2334} {"train_loss": -40.472076416015625, "global_step": 282415, "epoch": 2334} {"train_loss": -43.44449996948242, "global_step": 282416, "epoch": 2334} {"train_loss": -41.99654006958008, "global_step": 282417, "epoch": 2334} {"train_loss": -41.594058990478516, "global_step": 282418, "epoch": 2334} {"train_loss": -43.65704345703125, "global_step": 282419, "epoch": 2334} {"train_loss": -40.40761947631836, "global_step": 282420, "epoch": 2334} {"train_loss": -43.01032257080078, "global_step": 282421, "epoch": 2334} {"train_loss": -42.674766540527344, "global_step": 282422, "epoch": 2334} {"train_loss": -41.27312469482422, "global_step": 282423, "epoch": 2334} {"train_loss": -43.533138275146484, "global_step": 282424, "epoch": 2334} {"train_loss": -41.676063537597656, "global_step": 282425, "epoch": 2334} {"train_loss": -41.92116165161133, "global_step": 282426, "epoch": 2334} {"train_loss": -43.812129974365234, "global_step": 282427, "epoch": 2334} {"train_loss": -40.783443450927734, "global_step": 282428, "epoch": 2334} {"train_loss": -43.37104797363281, "global_step": 282429, "epoch": 2334} {"train_loss": -42.4338493347168, "global_step": 282430, "epoch": 2334} {"train_loss": -41.6966438293457, "global_step": 282431, "epoch": 2334} {"train_loss": -43.76933670043945, "global_step": 282432, "epoch": 2334} {"train_loss": -42.015384674072266, "global_step": 282433, "epoch": 2334} {"train_loss": -42.6512336730957, "global_step": 282434, "epoch": 2334} {"train_loss": -42.61228942871094, "global_step": 282435, "epoch": 2334} {"train_loss": -43.52574920654297, "global_step": 282436, "epoch": 2334} {"train_loss": -43.87772750854492, "global_step": 282437, "epoch": 2334} {"train_loss": -43.26949691772461, "global_step": 282438, "epoch": 2334} {"train_loss": -43.67262649536133, "global_step": 282439, "epoch": 2334} {"train_loss": -43.69834899902344, "global_step": 282440, "epoch": 2334} {"train_loss": -43.5372200012207, "global_step": 282441, "epoch": 2334} {"train_loss": -43.31732177734375, "global_step": 282442, "epoch": 2334} {"train_loss": -43.5729866027832, "global_step": 282443, "epoch": 2334} {"train_loss": -43.38017654418945, "global_step": 282444, "epoch": 2334} {"train_loss": -43.095184326171875, "global_step": 282445, "epoch": 2334} {"train_loss": -42.673973083496094, "global_step": 282446, "epoch": 2334} {"train_loss": -43.32863998413086, "global_step": 282447, "epoch": 2334} {"train_loss": -42.377925872802734, "global_step": 282448, "epoch": 2334} {"train_loss": -43.2348747253418, "global_step": 282449, "epoch": 2334} {"train_loss": -43.57301330566406, "global_step": 282450, "epoch": 2334} {"train_loss": -43.68381881713867, "global_step": 282451, "epoch": 2334} {"train_loss": -43.381107330322266, "global_step": 282452, "epoch": 2334} {"train_loss": -43.19805908203125, "global_step": 282453, "epoch": 2334} {"train_loss": -42.40850067138672, "global_step": 282454, "epoch": 2334} {"train_loss": -43.736053466796875, "global_step": 282455, "epoch": 2334} {"train_loss": -43.709442138671875, "global_step": 282456, "epoch": 2334} {"train_loss": -43.23525619506836, "global_step": 282457, "epoch": 2334} {"train_loss": -44.15765380859375, "global_step": 282458, "epoch": 2334} {"train_loss": -42.76594161987305, "global_step": 282459, "epoch": 2334} {"train_loss": -43.374794006347656, "global_step": 282460, "epoch": 2334} {"train_loss": -43.49801254272461, "global_step": 282461, "epoch": 2334} {"train_loss": -43.15073013305664, "global_step": 282462, "epoch": 2334} {"train_loss": -43.513671875, "global_step": 282463, "epoch": 2334} {"train_loss": -44.26911544799805, "global_step": 282464, "epoch": 2334} {"train_loss": -42.31239700317383, "global_step": 282465, "epoch": 2334} {"train_loss": -43.38994598388672, "global_step": 282466, "epoch": 2334} {"train_loss": -44.048011779785156, "global_step": 282467, "epoch": 2334} {"train_loss": -43.29906463623047, "global_step": 282468, "epoch": 2334} {"train_loss": -43.9558219909668, "global_step": 282469, "epoch": 2334} {"train_loss": -43.57801818847656, "global_step": 282470, "epoch": 2334} {"train_loss": -43.66545867919922, "global_step": 282471, "epoch": 2334} {"train_loss": -43.79024124145508, "global_step": 282472, "epoch": 2334} {"train_loss": -43.84017562866211, "global_step": 282473, "epoch": 2334} {"train_loss": -43.27327346801758, "global_step": 282474, "epoch": 2334} {"train_loss": -43.74824905395508, "global_step": 282475, "epoch": 2334} {"train_loss": -44.11661911010742, "global_step": 282476, "epoch": 2334} {"train_loss": -43.94952392578125, "global_step": 282477, "epoch": 2334} {"train_loss": -44.1917610168457, "global_step": 282478, "epoch": 2334} {"train_loss": -44.36520004272461, "global_step": 282479, "epoch": 2334} {"train_loss": -44.457088470458984, "global_step": 282480, "epoch": 2334} {"train_loss": -44.43156814575195, "global_step": 282481, "epoch": 2334} {"train_loss": -44.37771224975586, "global_step": 282482, "epoch": 2334} {"train_loss": -44.235591888427734, "global_step": 282483, "epoch": 2334} {"train_loss": -44.07297897338867, "global_step": 282484, "epoch": 2334} {"train_loss": -44.60340881347656, "global_step": 282485, "epoch": 2334} {"train_loss": -43.39338302612305, "global_step": 282486, "epoch": 2334} {"train_loss": -42.8455810546875, "global_step": 282487, "epoch": 2334} {"train_loss": -43.289161682128906, "global_step": 282488, "epoch": 2334} {"train_loss": -43.08082580566406, "global_step": 282489, "epoch": 2334} {"train_loss": -42.39864730834961, "global_step": 282490, "epoch": 2334} {"train_loss": -42.88788986206055, "global_step": 282491, "epoch": 2334} {"train_loss": -42.48505401611328, "global_step": 282492, "epoch": 2334} {"train_loss": -43.456687927246094, "global_step": 282493, "epoch": 2334} {"train_loss": -43.650691986083984, "global_step": 282494, "epoch": 2334} {"train_loss": -43.935035705566406, "global_step": 282495, "epoch": 2334} {"train_loss": -43.43857955932617, "global_step": 282496, "epoch": 2334} {"train_loss": -43.46027374267578, "global_step": 282497, "epoch": 2334} {"train_loss": -43.32792663574219, "global_step": 282498, "epoch": 2334} {"train_loss": -43.700504302978516, "global_step": 282499, "epoch": 2334} {"train_loss": -43.965415954589844, "global_step": 282500, "epoch": 2334} {"train_loss": -43.211097717285156, "global_step": 282501, "epoch": 2334} {"train_loss": -43.58993148803711, "global_step": 282502, "epoch": 2334} {"train_loss": -43.13471984863281, "global_step": 282503, "epoch": 2334} {"train_loss": -44.177669525146484, "global_step": 282504, "epoch": 2334} {"train_loss": -43.832881927490234, "global_step": 282505, "epoch": 2334} {"train_loss": -42.876399993896484, "global_step": 282506, "epoch": 2334} {"train_loss": -43.50632858276367, "global_step": 282507, "epoch": 2334} {"train_loss": -44.25674819946289, "global_step": 282508, "epoch": 2334} {"train_loss": -44.22260665893555, "global_step": 282509, "epoch": 2334} {"train_loss": -43.609596252441406, "global_step": 282510, "epoch": 2334} {"train_loss": -43.8328742980957, "global_step": 282511, "epoch": 2334} {"train_loss": -43.41775131225586, "global_step": 282512, "epoch": 2334} {"train_loss": -43.77082061767578, "global_step": 282513, "epoch": 2334} {"train_loss": -44.0205192565918, "global_step": 282514, "epoch": 2334} {"train_loss": -43.74337387084961, "global_step": 282515, "epoch": 2334} {"train_loss": -44.05770492553711, "global_step": 282516, "epoch": 2334} {"train_loss": -42.85543441772461, "global_step": 282517, "epoch": 2334} {"train_loss": -43.528297424316406, "global_step": 282518, "epoch": 2334} {"train_loss": -43.97770309448242, "global_step": 282519, "epoch": 2334} {"train_loss": -44.234474182128906, "global_step": 282520, "epoch": 2334} {"train_loss": -43.70674133300781, "global_step": 282521, "epoch": 2334} {"train_loss": -43.492916107177734, "global_step": 282522, "epoch": 2334} {"train_loss": -44.0219612121582, "global_step": 282523, "epoch": 2334} {"train_loss": -43.46444320678711, "global_step": 282524, "epoch": 2334} {"train_loss": -44.60801315307617, "global_step": 282525, "epoch": 2334} {"train_loss": -43.30995559692383, "global_step": 282526, "epoch": 2334} {"train_loss": -43.4066162109375, "global_step": 282527, "epoch": 2334} {"train_loss": -43.986427307128906, "global_step": 282528, "epoch": 2334} {"train_loss": -44.646095275878906, "global_step": 282529, "epoch": 2334} {"train_loss": -43.7269287109375, "global_step": 282530, "epoch": 2334} {"train_loss": -44.05996322631836, "global_step": 282531, "epoch": 2334} {"train_loss": -43.934688568115234, "global_step": 282532, "epoch": 2334} {"train_loss": -43.93137741088867, "global_step": 282533, "epoch": 2334} {"train_loss": -43.35946191835009, "global_step": 282534, "epoch": 2334, "val_loss": 2486884.25} {"train_loss": -44.622047424316406, "global_step": 282535, "epoch": 2335} {"train_loss": -42.88344955444336, "global_step": 282536, "epoch": 2335} {"train_loss": -44.14312744140625, "global_step": 282537, "epoch": 2335} {"train_loss": -43.60536575317383, "global_step": 282538, "epoch": 2335} {"train_loss": -42.34379959106445, "global_step": 282539, "epoch": 2335} {"train_loss": -43.85393142700195, "global_step": 282540, "epoch": 2335} {"train_loss": -42.8021354675293, "global_step": 282541, "epoch": 2335} {"train_loss": -42.64396286010742, "global_step": 282542, "epoch": 2335} {"train_loss": -43.625877380371094, "global_step": 282543, "epoch": 2335} {"train_loss": -42.47269821166992, "global_step": 282544, "epoch": 2335} {"train_loss": -42.029232025146484, "global_step": 282545, "epoch": 2335} {"train_loss": -42.74922561645508, "global_step": 282546, "epoch": 2335} {"train_loss": -43.48991775512695, "global_step": 282547, "epoch": 2335} {"train_loss": -42.575740814208984, "global_step": 282548, "epoch": 2335} {"train_loss": -42.43742752075195, "global_step": 282549, "epoch": 2335} {"train_loss": -41.827659606933594, "global_step": 282550, "epoch": 2335} {"train_loss": -42.14827346801758, "global_step": 282551, "epoch": 2335} {"train_loss": -42.702152252197266, "global_step": 282552, "epoch": 2335} {"train_loss": -41.497406005859375, "global_step": 282553, "epoch": 2335} {"train_loss": -41.932865142822266, "global_step": 282554, "epoch": 2335} {"train_loss": -42.72773361206055, "global_step": 282555, "epoch": 2335} {"train_loss": -42.63492965698242, "global_step": 282556, "epoch": 2335} {"train_loss": -41.6374397277832, "global_step": 282557, "epoch": 2335} {"train_loss": -42.20824432373047, "global_step": 282558, "epoch": 2335} {"train_loss": -42.94023895263672, "global_step": 282559, "epoch": 2335} {"train_loss": -41.16097640991211, "global_step": 282560, "epoch": 2335} {"train_loss": -41.91082763671875, "global_step": 282561, "epoch": 2335} {"train_loss": -42.1360969543457, "global_step": 282562, "epoch": 2335} {"train_loss": -41.21590805053711, "global_step": 282563, "epoch": 2335} {"train_loss": -42.2365837097168, "global_step": 282564, "epoch": 2335} {"train_loss": -41.919368743896484, "global_step": 282565, "epoch": 2335} {"train_loss": -41.72117233276367, "global_step": 282566, "epoch": 2335} {"train_loss": -40.996490478515625, "global_step": 282567, "epoch": 2335} {"train_loss": -41.61921691894531, "global_step": 282568, "epoch": 2335} {"train_loss": -39.24399185180664, "global_step": 282569, "epoch": 2335} {"train_loss": -42.724098205566406, "global_step": 282570, "epoch": 2335} {"train_loss": -38.743988037109375, "global_step": 282571, "epoch": 2335} {"train_loss": -41.81988525390625, "global_step": 282572, "epoch": 2335} {"train_loss": -35.65237045288086, "global_step": 282573, "epoch": 2335} {"train_loss": -42.66402816772461, "global_step": 282574, "epoch": 2335} {"train_loss": -39.46829605102539, "global_step": 282575, "epoch": 2335} {"train_loss": -39.73558807373047, "global_step": 282576, "epoch": 2335} {"train_loss": -40.3427848815918, "global_step": 282577, "epoch": 2335} {"train_loss": -40.42536926269531, "global_step": 282578, "epoch": 2335} {"train_loss": -39.86854934692383, "global_step": 282579, "epoch": 2335} {"train_loss": -41.551692962646484, "global_step": 282580, "epoch": 2335} {"train_loss": -38.99677658081055, "global_step": 282581, "epoch": 2335} {"train_loss": -42.04071044921875, "global_step": 282582, "epoch": 2335} {"train_loss": -39.88645553588867, "global_step": 282583, "epoch": 2335} {"train_loss": -42.45537567138672, "global_step": 282584, "epoch": 2335} {"train_loss": -40.86137771606445, "global_step": 282585, "epoch": 2335} {"train_loss": -42.538936614990234, "global_step": 282586, "epoch": 2335} {"train_loss": -40.71645736694336, "global_step": 282587, "epoch": 2335} {"train_loss": -41.05242156982422, "global_step": 282588, "epoch": 2335} {"train_loss": -41.527931213378906, "global_step": 282589, "epoch": 2335} {"train_loss": -42.51059341430664, "global_step": 282590, "epoch": 2335} {"train_loss": -41.50424575805664, "global_step": 282591, "epoch": 2335} {"train_loss": -42.89689254760742, "global_step": 282592, "epoch": 2335} {"train_loss": -42.09140396118164, "global_step": 282593, "epoch": 2335} {"train_loss": -42.68793487548828, "global_step": 282594, "epoch": 2335} {"train_loss": -19.64674186706543, "global_step": 282595, "epoch": 2335} {"train_loss": -41.109161376953125, "global_step": 282596, "epoch": 2335} {"train_loss": -42.10071563720703, "global_step": 282597, "epoch": 2335} {"train_loss": -39.73225784301758, "global_step": 282598, "epoch": 2335} {"train_loss": -41.169918060302734, "global_step": 282599, "epoch": 2335} {"train_loss": -41.22384262084961, "global_step": 282600, "epoch": 2335} {"train_loss": -39.75299072265625, "global_step": 282601, "epoch": 2335} {"train_loss": -41.70915222167969, "global_step": 282602, "epoch": 2335} {"train_loss": -41.28242874145508, "global_step": 282603, "epoch": 2335} {"train_loss": -40.12943649291992, "global_step": 282604, "epoch": 2335} {"train_loss": -40.28899002075195, "global_step": 282605, "epoch": 2335} {"train_loss": -41.6356201171875, "global_step": 282606, "epoch": 2335} {"train_loss": -34.01877212524414, "global_step": 282607, "epoch": 2335} {"train_loss": -41.93349838256836, "global_step": 282608, "epoch": 2335} {"train_loss": -29.0701904296875, "global_step": 282609, "epoch": 2335} {"train_loss": -41.55549240112305, "global_step": 282610, "epoch": 2335} {"train_loss": -31.859512329101562, "global_step": 282611, "epoch": 2335} {"train_loss": -39.968013763427734, "global_step": 282612, "epoch": 2335} {"train_loss": -42.01618576049805, "global_step": 282613, "epoch": 2335} {"train_loss": -41.92070007324219, "global_step": 282614, "epoch": 2335} {"train_loss": -40.329219818115234, "global_step": 282615, "epoch": 2335} {"train_loss": -41.479736328125, "global_step": 282616, "epoch": 2335} {"train_loss": -41.58561325073242, "global_step": 282617, "epoch": 2335} {"train_loss": -39.465545654296875, "global_step": 282618, "epoch": 2335} {"train_loss": -42.81790542602539, "global_step": 282619, "epoch": 2335} {"train_loss": -41.969085693359375, "global_step": 282620, "epoch": 2335} {"train_loss": -41.30695724487305, "global_step": 282621, "epoch": 2335} {"train_loss": -42.019287109375, "global_step": 282622, "epoch": 2335} {"train_loss": -42.355037689208984, "global_step": 282623, "epoch": 2335} {"train_loss": -42.36678695678711, "global_step": 282624, "epoch": 2335} {"train_loss": -39.77064895629883, "global_step": 282625, "epoch": 2335} {"train_loss": -42.10380172729492, "global_step": 282626, "epoch": 2335} {"train_loss": -36.96021270751953, "global_step": 282627, "epoch": 2335} {"train_loss": -41.21212387084961, "global_step": 282628, "epoch": 2335} {"train_loss": -42.57061004638672, "global_step": 282629, "epoch": 2335} {"train_loss": -42.33545684814453, "global_step": 282630, "epoch": 2335} {"train_loss": -42.74465560913086, "global_step": 282631, "epoch": 2335} {"train_loss": -42.612728118896484, "global_step": 282632, "epoch": 2335} {"train_loss": -43.17465591430664, "global_step": 282633, "epoch": 2335} {"train_loss": -37.955955505371094, "global_step": 282634, "epoch": 2335} {"train_loss": -43.09735107421875, "global_step": 282635, "epoch": 2335} {"train_loss": -42.248695373535156, "global_step": 282636, "epoch": 2335} {"train_loss": -42.673885345458984, "global_step": 282637, "epoch": 2335} {"train_loss": -41.090049743652344, "global_step": 282638, "epoch": 2335} {"train_loss": -41.62070846557617, "global_step": 282639, "epoch": 2335} {"train_loss": -43.32143783569336, "global_step": 282640, "epoch": 2335} {"train_loss": -42.8781852722168, "global_step": 282641, "epoch": 2335} {"train_loss": -40.278594970703125, "global_step": 282642, "epoch": 2335} {"train_loss": -42.81466293334961, "global_step": 282643, "epoch": 2335} {"train_loss": -42.363250732421875, "global_step": 282644, "epoch": 2335} {"train_loss": -40.93335723876953, "global_step": 282645, "epoch": 2335} {"train_loss": -41.62831115722656, "global_step": 282646, "epoch": 2335} {"train_loss": -42.04899978637695, "global_step": 282647, "epoch": 2335} {"train_loss": -43.40917205810547, "global_step": 282648, "epoch": 2335} {"train_loss": -42.8499755859375, "global_step": 282649, "epoch": 2335} {"train_loss": -42.66355514526367, "global_step": 282650, "epoch": 2335} {"train_loss": -43.158199310302734, "global_step": 282651, "epoch": 2335} {"train_loss": -43.6744384765625, "global_step": 282652, "epoch": 2335} {"train_loss": -42.69190216064453, "global_step": 282653, "epoch": 2335} {"train_loss": -42.973384857177734, "global_step": 282654, "epoch": 2335} {"train_loss": -41.30237997070817, "global_step": 282655, "epoch": 2335, "val_loss": 2867373.0} {"train_loss": -42.13096618652344, "global_step": 282656, "epoch": 2336} {"train_loss": -43.295127868652344, "global_step": 282657, "epoch": 2336} {"train_loss": -43.17816162109375, "global_step": 282658, "epoch": 2336} {"train_loss": -43.13320541381836, "global_step": 282659, "epoch": 2336} {"train_loss": -43.78489685058594, "global_step": 282660, "epoch": 2336} {"train_loss": -43.678375244140625, "global_step": 282661, "epoch": 2336} {"train_loss": -43.75919723510742, "global_step": 282662, "epoch": 2336} {"train_loss": -43.278594970703125, "global_step": 282663, "epoch": 2336} {"train_loss": -42.84489059448242, "global_step": 282664, "epoch": 2336} {"train_loss": -43.30347442626953, "global_step": 282665, "epoch": 2336} {"train_loss": -43.34458541870117, "global_step": 282666, "epoch": 2336} {"train_loss": -43.92591094970703, "global_step": 282667, "epoch": 2336} {"train_loss": -43.771663665771484, "global_step": 282668, "epoch": 2336} {"train_loss": -42.3832893371582, "global_step": 282669, "epoch": 2336} {"train_loss": -43.18886184692383, "global_step": 282670, "epoch": 2336} {"train_loss": -43.7445068359375, "global_step": 282671, "epoch": 2336} {"train_loss": -39.332027435302734, "global_step": 282672, "epoch": 2336} {"train_loss": -42.82523727416992, "global_step": 282673, "epoch": 2336} {"train_loss": -44.159725189208984, "global_step": 282674, "epoch": 2336} {"train_loss": -42.87605667114258, "global_step": 282675, "epoch": 2336} {"train_loss": -44.06914138793945, "global_step": 282676, "epoch": 2336} {"train_loss": -44.099029541015625, "global_step": 282677, "epoch": 2336} {"train_loss": -43.950992584228516, "global_step": 282678, "epoch": 2336} {"train_loss": -44.04476547241211, "global_step": 282679, "epoch": 2336} {"train_loss": -43.489654541015625, "global_step": 282680, "epoch": 2336} {"train_loss": -43.99386215209961, "global_step": 282681, "epoch": 2336} {"train_loss": -44.4189338684082, "global_step": 282682, "epoch": 2336} {"train_loss": -44.0868034362793, "global_step": 282683, "epoch": 2336} {"train_loss": -42.89031982421875, "global_step": 282684, "epoch": 2336} {"train_loss": -42.11855697631836, "global_step": 282685, "epoch": 2336} {"train_loss": -43.553382873535156, "global_step": 282686, "epoch": 2336} {"train_loss": -42.78230667114258, "global_step": 282687, "epoch": 2336} {"train_loss": -41.880027770996094, "global_step": 282688, "epoch": 2336} {"train_loss": -43.21030807495117, "global_step": 282689, "epoch": 2336} {"train_loss": -44.2029914855957, "global_step": 282690, "epoch": 2336} {"train_loss": -42.56425094604492, "global_step": 282691, "epoch": 2336} {"train_loss": -44.23551559448242, "global_step": 282692, "epoch": 2336} {"train_loss": -43.64955520629883, "global_step": 282693, "epoch": 2336} {"train_loss": -44.60708236694336, "global_step": 282694, "epoch": 2336} {"train_loss": -43.23612976074219, "global_step": 282695, "epoch": 2336} {"train_loss": -41.39992141723633, "global_step": 282696, "epoch": 2336} {"train_loss": -43.74762725830078, "global_step": 282697, "epoch": 2336} {"train_loss": -42.99067306518555, "global_step": 282698, "epoch": 2336} {"train_loss": -43.64999008178711, "global_step": 282699, "epoch": 2336} {"train_loss": -42.778602600097656, "global_step": 282700, "epoch": 2336} {"train_loss": -43.388999938964844, "global_step": 282701, "epoch": 2336} {"train_loss": -43.29473876953125, "global_step": 282702, "epoch": 2336} {"train_loss": -43.93069076538086, "global_step": 282703, "epoch": 2336} {"train_loss": -42.47669219970703, "global_step": 282704, "epoch": 2336} {"train_loss": -42.19851303100586, "global_step": 282705, "epoch": 2336} {"train_loss": -41.3965950012207, "global_step": 282706, "epoch": 2336} {"train_loss": -40.73719024658203, "global_step": 282707, "epoch": 2336} {"train_loss": -41.206268310546875, "global_step": 282708, "epoch": 2336} {"train_loss": -41.10559844970703, "global_step": 282709, "epoch": 2336} {"train_loss": -40.76613998413086, "global_step": 282710, "epoch": 2336} {"train_loss": -39.94210433959961, "global_step": 282711, "epoch": 2336} {"train_loss": -40.14809799194336, "global_step": 282712, "epoch": 2336} {"train_loss": -41.37642288208008, "global_step": 282713, "epoch": 2336} {"train_loss": -40.251792907714844, "global_step": 282714, "epoch": 2336} {"train_loss": -40.787899017333984, "global_step": 282715, "epoch": 2336} {"train_loss": -42.82419967651367, "global_step": 282716, "epoch": 2336} {"train_loss": -38.66188430786133, "global_step": 282717, "epoch": 2336} {"train_loss": -42.083106994628906, "global_step": 282718, "epoch": 2336} {"train_loss": -35.37484359741211, "global_step": 282719, "epoch": 2336} {"train_loss": -41.78316879272461, "global_step": 282720, "epoch": 2336} {"train_loss": -36.99273681640625, "global_step": 282721, "epoch": 2336} {"train_loss": -36.273231506347656, "global_step": 282722, "epoch": 2336} {"train_loss": -41.509334564208984, "global_step": 282723, "epoch": 2336} {"train_loss": -35.749141693115234, "global_step": 282724, "epoch": 2336} {"train_loss": -38.9796142578125, "global_step": 282725, "epoch": 2336} {"train_loss": -39.05228805541992, "global_step": 282726, "epoch": 2336} {"train_loss": -39.40271759033203, "global_step": 282727, "epoch": 2336} {"train_loss": -40.82764434814453, "global_step": 282728, "epoch": 2336} {"train_loss": -38.35129928588867, "global_step": 282729, "epoch": 2336} {"train_loss": -41.8888053894043, "global_step": 282730, "epoch": 2336} {"train_loss": -37.76666259765625, "global_step": 282731, "epoch": 2336} {"train_loss": -41.133602142333984, "global_step": 282732, "epoch": 2336} {"train_loss": -35.532718658447266, "global_step": 282733, "epoch": 2336} {"train_loss": -40.82419967651367, "global_step": 282734, "epoch": 2336} {"train_loss": -40.46796798706055, "global_step": 282735, "epoch": 2336} {"train_loss": -41.46403121948242, "global_step": 282736, "epoch": 2336} {"train_loss": -40.129024505615234, "global_step": 282737, "epoch": 2336} {"train_loss": -42.1715087890625, "global_step": 282738, "epoch": 2336} {"train_loss": -38.7081413269043, "global_step": 282739, "epoch": 2336} {"train_loss": -42.50863265991211, "global_step": 282740, "epoch": 2336} {"train_loss": -39.33359909057617, "global_step": 282741, "epoch": 2336} {"train_loss": -41.300350189208984, "global_step": 282742, "epoch": 2336} {"train_loss": -40.48688888549805, "global_step": 282743, "epoch": 2336} {"train_loss": -42.98189926147461, "global_step": 282744, "epoch": 2336} {"train_loss": -42.123046875, "global_step": 282745, "epoch": 2336} {"train_loss": -40.04059982299805, "global_step": 282746, "epoch": 2336} {"train_loss": -41.92600631713867, "global_step": 282747, "epoch": 2336} {"train_loss": -42.03123092651367, "global_step": 282748, "epoch": 2336} {"train_loss": -42.20431137084961, "global_step": 282749, "epoch": 2336} {"train_loss": -42.3869514465332, "global_step": 282750, "epoch": 2336} {"train_loss": -41.88347625732422, "global_step": 282751, "epoch": 2336} {"train_loss": -42.227691650390625, "global_step": 282752, "epoch": 2336} {"train_loss": -42.90700912475586, "global_step": 282753, "epoch": 2336} {"train_loss": -42.68672561645508, "global_step": 282754, "epoch": 2336} {"train_loss": -42.37660598754883, "global_step": 282755, "epoch": 2336} {"train_loss": -41.0975341796875, "global_step": 282756, "epoch": 2336} {"train_loss": -42.67699432373047, "global_step": 282757, "epoch": 2336} {"train_loss": -38.80960464477539, "global_step": 282758, "epoch": 2336} {"train_loss": -42.30486297607422, "global_step": 282759, "epoch": 2336} {"train_loss": -42.970516204833984, "global_step": 282760, "epoch": 2336} {"train_loss": -42.446205139160156, "global_step": 282761, "epoch": 2336} {"train_loss": -42.95941925048828, "global_step": 282762, "epoch": 2336} {"train_loss": -42.99314498901367, "global_step": 282763, "epoch": 2336} {"train_loss": -43.0352668762207, "global_step": 282764, "epoch": 2336} {"train_loss": -43.19686508178711, "global_step": 282765, "epoch": 2336} {"train_loss": -43.03567123413086, "global_step": 282766, "epoch": 2336} {"train_loss": -43.206050872802734, "global_step": 282767, "epoch": 2336} {"train_loss": -43.121665954589844, "global_step": 282768, "epoch": 2336} {"train_loss": -43.2767219543457, "global_step": 282769, "epoch": 2336} {"train_loss": -43.567588806152344, "global_step": 282770, "epoch": 2336} {"train_loss": -43.41291046142578, "global_step": 282771, "epoch": 2336} {"train_loss": -42.76424789428711, "global_step": 282772, "epoch": 2336} {"train_loss": -43.106868743896484, "global_step": 282773, "epoch": 2336} {"train_loss": -43.06257629394531, "global_step": 282774, "epoch": 2336} {"train_loss": -42.8724365234375, "global_step": 282775, "epoch": 2336} {"train_loss": -42.02721026712213, "global_step": 282776, "epoch": 2336, "val_loss": 2691777.75} {"train_loss": -43.24774932861328, "global_step": 282777, "epoch": 2337} {"train_loss": -43.67969512939453, "global_step": 282778, "epoch": 2337} {"train_loss": -43.24323654174805, "global_step": 282779, "epoch": 2337} {"train_loss": -43.29929733276367, "global_step": 282780, "epoch": 2337} {"train_loss": -42.684539794921875, "global_step": 282781, "epoch": 2337} {"train_loss": -43.66604232788086, "global_step": 282782, "epoch": 2337} {"train_loss": -43.834442138671875, "global_step": 282783, "epoch": 2337} {"train_loss": -43.4189453125, "global_step": 282784, "epoch": 2337} {"train_loss": -44.009010314941406, "global_step": 282785, "epoch": 2337} {"train_loss": -43.26194381713867, "global_step": 282786, "epoch": 2337} {"train_loss": -42.99007797241211, "global_step": 282787, "epoch": 2337} {"train_loss": -43.43012237548828, "global_step": 282788, "epoch": 2337} {"train_loss": -43.185516357421875, "global_step": 282789, "epoch": 2337} {"train_loss": -43.49937438964844, "global_step": 282790, "epoch": 2337} {"train_loss": -43.438133239746094, "global_step": 282791, "epoch": 2337} {"train_loss": -43.25294876098633, "global_step": 282792, "epoch": 2337} {"train_loss": -43.23957443237305, "global_step": 282793, "epoch": 2337} {"train_loss": -42.74932098388672, "global_step": 282794, "epoch": 2337} {"train_loss": -42.112892150878906, "global_step": 282795, "epoch": 2337} {"train_loss": -42.56438446044922, "global_step": 282796, "epoch": 2337} {"train_loss": -43.68810272216797, "global_step": 282797, "epoch": 2337} {"train_loss": -43.043392181396484, "global_step": 282798, "epoch": 2337} {"train_loss": -40.22654342651367, "global_step": 282799, "epoch": 2337} {"train_loss": -38.14168167114258, "global_step": 282800, "epoch": 2337} {"train_loss": -43.03957748413086, "global_step": 282801, "epoch": 2337} {"train_loss": -38.14199447631836, "global_step": 282802, "epoch": 2337} {"train_loss": -42.784549713134766, "global_step": 282803, "epoch": 2337} {"train_loss": -38.664520263671875, "global_step": 282804, "epoch": 2337} {"train_loss": -35.52853012084961, "global_step": 282805, "epoch": 2337} {"train_loss": -41.77429962158203, "global_step": 282806, "epoch": 2337} {"train_loss": -38.29313659667969, "global_step": 282807, "epoch": 2337} {"train_loss": -38.91767501831055, "global_step": 282808, "epoch": 2337} {"train_loss": -39.57613754272461, "global_step": 282809, "epoch": 2337} {"train_loss": -39.19301986694336, "global_step": 282810, "epoch": 2337} {"train_loss": -40.51541519165039, "global_step": 282811, "epoch": 2337} {"train_loss": -38.67135238647461, "global_step": 282812, "epoch": 2337} {"train_loss": -38.845252990722656, "global_step": 282813, "epoch": 2337} {"train_loss": -40.23225021362305, "global_step": 282814, "epoch": 2337} {"train_loss": -41.03174591064453, "global_step": 282815, "epoch": 2337} {"train_loss": -40.157371520996094, "global_step": 282816, "epoch": 2337} {"train_loss": -41.281883239746094, "global_step": 282817, "epoch": 2337} {"train_loss": -39.925201416015625, "global_step": 282818, "epoch": 2337} {"train_loss": -42.77796173095703, "global_step": 282819, "epoch": 2337} {"train_loss": -40.92953872680664, "global_step": 282820, "epoch": 2337} {"train_loss": -42.13161849975586, "global_step": 282821, "epoch": 2337} {"train_loss": -40.49509811401367, "global_step": 282822, "epoch": 2337} {"train_loss": -42.22079086303711, "global_step": 282823, "epoch": 2337} {"train_loss": -41.87595748901367, "global_step": 282824, "epoch": 2337} {"train_loss": -42.590309143066406, "global_step": 282825, "epoch": 2337} {"train_loss": -41.30595016479492, "global_step": 282826, "epoch": 2337} {"train_loss": -42.7751579284668, "global_step": 282827, "epoch": 2337} {"train_loss": -42.59086608886719, "global_step": 282828, "epoch": 2337} {"train_loss": -42.635009765625, "global_step": 282829, "epoch": 2337} {"train_loss": -42.20193099975586, "global_step": 282830, "epoch": 2337} {"train_loss": -42.22389602661133, "global_step": 282831, "epoch": 2337} {"train_loss": -42.117462158203125, "global_step": 282832, "epoch": 2337} {"train_loss": -42.5223503112793, "global_step": 282833, "epoch": 2337} {"train_loss": -42.6818733215332, "global_step": 282834, "epoch": 2337} {"train_loss": -42.898983001708984, "global_step": 282835, "epoch": 2337} {"train_loss": -42.84235763549805, "global_step": 282836, "epoch": 2337} {"train_loss": -42.8282470703125, "global_step": 282837, "epoch": 2337} {"train_loss": -42.9283447265625, "global_step": 282838, "epoch": 2337} {"train_loss": -42.809017181396484, "global_step": 282839, "epoch": 2337} {"train_loss": -43.05025100708008, "global_step": 282840, "epoch": 2337} {"train_loss": -42.992733001708984, "global_step": 282841, "epoch": 2337} {"train_loss": -42.80845642089844, "global_step": 282842, "epoch": 2337} {"train_loss": -42.93944549560547, "global_step": 282843, "epoch": 2337} {"train_loss": -43.4267692565918, "global_step": 282844, "epoch": 2337} {"train_loss": -42.4470329284668, "global_step": 282845, "epoch": 2337} {"train_loss": -43.12932586669922, "global_step": 282846, "epoch": 2337} {"train_loss": -42.953392028808594, "global_step": 282847, "epoch": 2337} {"train_loss": -43.50606155395508, "global_step": 282848, "epoch": 2337} {"train_loss": -43.50454330444336, "global_step": 282849, "epoch": 2337} {"train_loss": -43.52077865600586, "global_step": 282850, "epoch": 2337} {"train_loss": -43.387691497802734, "global_step": 282851, "epoch": 2337} {"train_loss": -43.5103874206543, "global_step": 282852, "epoch": 2337} {"train_loss": -43.6536979675293, "global_step": 282853, "epoch": 2337} {"train_loss": -43.63152313232422, "global_step": 282854, "epoch": 2337} {"train_loss": -43.85018539428711, "global_step": 282855, "epoch": 2337} {"train_loss": -43.95161819458008, "global_step": 282856, "epoch": 2337} {"train_loss": -43.41276931762695, "global_step": 282857, "epoch": 2337} {"train_loss": -44.1796875, "global_step": 282858, "epoch": 2337} {"train_loss": -43.86042022705078, "global_step": 282859, "epoch": 2337} {"train_loss": -44.29022216796875, "global_step": 282860, "epoch": 2337} {"train_loss": -43.888423919677734, "global_step": 282861, "epoch": 2337} {"train_loss": -44.132179260253906, "global_step": 282862, "epoch": 2337} {"train_loss": -44.03434371948242, "global_step": 282863, "epoch": 2337} {"train_loss": -43.226478576660156, "global_step": 282864, "epoch": 2337} {"train_loss": -43.893585205078125, "global_step": 282865, "epoch": 2337} {"train_loss": -43.92280960083008, "global_step": 282866, "epoch": 2337} {"train_loss": -43.82066345214844, "global_step": 282867, "epoch": 2337} {"train_loss": -43.823848724365234, "global_step": 282868, "epoch": 2337} {"train_loss": -43.817440032958984, "global_step": 282869, "epoch": 2337} {"train_loss": -42.776123046875, "global_step": 282870, "epoch": 2337} {"train_loss": -44.29473114013672, "global_step": 282871, "epoch": 2337} {"train_loss": -44.00105667114258, "global_step": 282872, "epoch": 2337} {"train_loss": -42.740394592285156, "global_step": 282873, "epoch": 2337} {"train_loss": -43.64087677001953, "global_step": 282874, "epoch": 2337} {"train_loss": -43.56983947753906, "global_step": 282875, "epoch": 2337} {"train_loss": -44.131805419921875, "global_step": 282876, "epoch": 2337} {"train_loss": -43.66432571411133, "global_step": 282877, "epoch": 2337} {"train_loss": -44.027278900146484, "global_step": 282878, "epoch": 2337} {"train_loss": -44.2483024597168, "global_step": 282879, "epoch": 2337} {"train_loss": -43.734066009521484, "global_step": 282880, "epoch": 2337} {"train_loss": -42.56049346923828, "global_step": 282881, "epoch": 2337} {"train_loss": -42.7336540222168, "global_step": 282882, "epoch": 2337} {"train_loss": -43.5548210144043, "global_step": 282883, "epoch": 2337} {"train_loss": -43.07960510253906, "global_step": 282884, "epoch": 2337} {"train_loss": -42.33182907104492, "global_step": 282885, "epoch": 2337} {"train_loss": -43.269927978515625, "global_step": 282886, "epoch": 2337} {"train_loss": -43.14925003051758, "global_step": 282887, "epoch": 2337} {"train_loss": -43.16171646118164, "global_step": 282888, "epoch": 2337} {"train_loss": -41.86405563354492, "global_step": 282889, "epoch": 2337} {"train_loss": -42.36013412475586, "global_step": 282890, "epoch": 2337} {"train_loss": -41.46538162231445, "global_step": 282891, "epoch": 2337} {"train_loss": -42.436275482177734, "global_step": 282892, "epoch": 2337} {"train_loss": -42.60546875, "global_step": 282893, "epoch": 2337} {"train_loss": -42.57347106933594, "global_step": 282894, "epoch": 2337} {"train_loss": -42.2517204284668, "global_step": 282895, "epoch": 2337} {"train_loss": -42.26941680908203, "global_step": 282896, "epoch": 2337} {"train_loss": -42.5300604449816, "global_step": 282897, "epoch": 2337, "val_loss": 2556978.75} {"train_loss": -42.27210235595703, "global_step": 282898, "epoch": 2338} {"train_loss": -41.19588088989258, "global_step": 282899, "epoch": 2338} {"train_loss": -41.86568069458008, "global_step": 282900, "epoch": 2338} {"train_loss": -42.34528350830078, "global_step": 282901, "epoch": 2338} {"train_loss": -41.201683044433594, "global_step": 282902, "epoch": 2338} {"train_loss": -42.52383041381836, "global_step": 282903, "epoch": 2338} {"train_loss": -40.9468879699707, "global_step": 282904, "epoch": 2338} {"train_loss": -42.75706100463867, "global_step": 282905, "epoch": 2338} {"train_loss": -42.769222259521484, "global_step": 282906, "epoch": 2338} {"train_loss": -41.94287872314453, "global_step": 282907, "epoch": 2338} {"train_loss": -42.86433792114258, "global_step": 282908, "epoch": 2338} {"train_loss": -40.90321350097656, "global_step": 282909, "epoch": 2338} {"train_loss": -42.19957733154297, "global_step": 282910, "epoch": 2338} {"train_loss": -40.82598876953125, "global_step": 282911, "epoch": 2338} {"train_loss": -39.36576461791992, "global_step": 282912, "epoch": 2338} {"train_loss": -41.33225631713867, "global_step": 282913, "epoch": 2338} {"train_loss": -36.92461395263672, "global_step": 282914, "epoch": 2338} {"train_loss": -38.089542388916016, "global_step": 282915, "epoch": 2338} {"train_loss": -40.695064544677734, "global_step": 282916, "epoch": 2338} {"train_loss": -36.69089889526367, "global_step": 282917, "epoch": 2338} {"train_loss": -38.5395622253418, "global_step": 282918, "epoch": 2338} {"train_loss": -41.253204345703125, "global_step": 282919, "epoch": 2338} {"train_loss": -39.61151885986328, "global_step": 282920, "epoch": 2338} {"train_loss": -40.272769927978516, "global_step": 282921, "epoch": 2338} {"train_loss": -40.70208740234375, "global_step": 282922, "epoch": 2338} {"train_loss": -39.40185546875, "global_step": 282923, "epoch": 2338} {"train_loss": -41.02621078491211, "global_step": 282924, "epoch": 2338} {"train_loss": -38.8202018737793, "global_step": 282925, "epoch": 2338} {"train_loss": -41.897216796875, "global_step": 282926, "epoch": 2338} {"train_loss": -40.52064895629883, "global_step": 282927, "epoch": 2338} {"train_loss": -42.041255950927734, "global_step": 282928, "epoch": 2338} {"train_loss": -41.811275482177734, "global_step": 282929, "epoch": 2338} {"train_loss": -40.67143630981445, "global_step": 282930, "epoch": 2338} {"train_loss": -42.879737854003906, "global_step": 282931, "epoch": 2338} {"train_loss": -41.13981246948242, "global_step": 282932, "epoch": 2338} {"train_loss": -41.625667572021484, "global_step": 282933, "epoch": 2338} {"train_loss": -42.03059005737305, "global_step": 282934, "epoch": 2338} {"train_loss": -41.98088455200195, "global_step": 282935, "epoch": 2338} {"train_loss": -42.676185607910156, "global_step": 282936, "epoch": 2338} {"train_loss": -42.467010498046875, "global_step": 282937, "epoch": 2338} {"train_loss": -42.423946380615234, "global_step": 282938, "epoch": 2338} {"train_loss": -42.62526321411133, "global_step": 282939, "epoch": 2338} {"train_loss": -42.97740173339844, "global_step": 282940, "epoch": 2338} {"train_loss": -41.41236114501953, "global_step": 282941, "epoch": 2338} {"train_loss": -42.85468673706055, "global_step": 282942, "epoch": 2338} {"train_loss": -42.61579513549805, "global_step": 282943, "epoch": 2338} {"train_loss": -43.49955368041992, "global_step": 282944, "epoch": 2338} {"train_loss": -43.111724853515625, "global_step": 282945, "epoch": 2338} {"train_loss": -43.1296501159668, "global_step": 282946, "epoch": 2338} {"train_loss": -43.101253509521484, "global_step": 282947, "epoch": 2338} {"train_loss": -43.3442497253418, "global_step": 282948, "epoch": 2338} {"train_loss": -43.511451721191406, "global_step": 282949, "epoch": 2338} {"train_loss": -42.84113693237305, "global_step": 282950, "epoch": 2338} {"train_loss": -43.236778259277344, "global_step": 282951, "epoch": 2338} {"train_loss": -43.089046478271484, "global_step": 282952, "epoch": 2338} {"train_loss": -43.088497161865234, "global_step": 282953, "epoch": 2338} {"train_loss": -43.50901412963867, "global_step": 282954, "epoch": 2338} {"train_loss": -43.541507720947266, "global_step": 282955, "epoch": 2338} {"train_loss": -43.956783294677734, "global_step": 282956, "epoch": 2338} {"train_loss": -43.54231643676758, "global_step": 282957, "epoch": 2338} {"train_loss": -43.606136322021484, "global_step": 282958, "epoch": 2338} {"train_loss": -43.65330123901367, "global_step": 282959, "epoch": 2338} {"train_loss": -43.88452911376953, "global_step": 282960, "epoch": 2338} {"train_loss": -43.95234298706055, "global_step": 282961, "epoch": 2338} {"train_loss": -43.90313720703125, "global_step": 282962, "epoch": 2338} {"train_loss": -43.631370544433594, "global_step": 282963, "epoch": 2338} {"train_loss": -43.399471282958984, "global_step": 282964, "epoch": 2338} {"train_loss": -43.81406784057617, "global_step": 282965, "epoch": 2338} {"train_loss": -44.14105987548828, "global_step": 282966, "epoch": 2338} {"train_loss": -43.929508209228516, "global_step": 282967, "epoch": 2338} {"train_loss": -43.741554260253906, "global_step": 282968, "epoch": 2338} {"train_loss": -44.53702926635742, "global_step": 282969, "epoch": 2338} {"train_loss": -42.11784362792969, "global_step": 282970, "epoch": 2338} {"train_loss": -44.088680267333984, "global_step": 282971, "epoch": 2338} {"train_loss": -43.13541793823242, "global_step": 282972, "epoch": 2338} {"train_loss": -43.72726058959961, "global_step": 282973, "epoch": 2338} {"train_loss": -44.15604782104492, "global_step": 282974, "epoch": 2338} {"train_loss": -44.25048828125, "global_step": 282975, "epoch": 2338} {"train_loss": -44.238067626953125, "global_step": 282976, "epoch": 2338} {"train_loss": -44.103355407714844, "global_step": 282977, "epoch": 2338} {"train_loss": -44.27811050415039, "global_step": 282978, "epoch": 2338} {"train_loss": -44.35993194580078, "global_step": 282979, "epoch": 2338} {"train_loss": -44.36040115356445, "global_step": 282980, "epoch": 2338} {"train_loss": -44.27507400512695, "global_step": 282981, "epoch": 2338} {"train_loss": -43.72683334350586, "global_step": 282982, "epoch": 2338} {"train_loss": -44.268760681152344, "global_step": 282983, "epoch": 2338} {"train_loss": -43.96208572387695, "global_step": 282984, "epoch": 2338} {"train_loss": -43.44868087768555, "global_step": 282985, "epoch": 2338} {"train_loss": -43.75498962402344, "global_step": 282986, "epoch": 2338} {"train_loss": -43.52355194091797, "global_step": 282987, "epoch": 2338} {"train_loss": -43.90442657470703, "global_step": 282988, "epoch": 2338} {"train_loss": -43.990631103515625, "global_step": 282989, "epoch": 2338} {"train_loss": -43.37160873413086, "global_step": 282990, "epoch": 2338} {"train_loss": -43.10214614868164, "global_step": 282991, "epoch": 2338} {"train_loss": -42.930389404296875, "global_step": 282992, "epoch": 2338} {"train_loss": -43.33811950683594, "global_step": 282993, "epoch": 2338} {"train_loss": -43.93292236328125, "global_step": 282994, "epoch": 2338} {"train_loss": -41.939666748046875, "global_step": 282995, "epoch": 2338} {"train_loss": -41.3214111328125, "global_step": 282996, "epoch": 2338} {"train_loss": -39.74944305419922, "global_step": 282997, "epoch": 2338} {"train_loss": -37.486454010009766, "global_step": 282998, "epoch": 2338} {"train_loss": -36.836891174316406, "global_step": 282999, "epoch": 2338} {"train_loss": -37.852291107177734, "global_step": 283000, "epoch": 2338} {"train_loss": -37.08955001831055, "global_step": 283001, "epoch": 2338} {"train_loss": -39.96649932861328, "global_step": 283002, "epoch": 2338} {"train_loss": -37.35200881958008, "global_step": 283003, "epoch": 2338} {"train_loss": -37.23282241821289, "global_step": 283004, "epoch": 2338} {"train_loss": -38.68062210083008, "global_step": 283005, "epoch": 2338} {"train_loss": -38.30474853515625, "global_step": 283006, "epoch": 2338} {"train_loss": -37.58742904663086, "global_step": 283007, "epoch": 2338} {"train_loss": -37.56023406982422, "global_step": 283008, "epoch": 2338} {"train_loss": -37.68353271484375, "global_step": 283009, "epoch": 2338} {"train_loss": -37.321136474609375, "global_step": 283010, "epoch": 2338} {"train_loss": -37.19965744018555, "global_step": 283011, "epoch": 2338} {"train_loss": -38.51925277709961, "global_step": 283012, "epoch": 2338} {"train_loss": -39.70659637451172, "global_step": 283013, "epoch": 2338} {"train_loss": -39.11743927001953, "global_step": 283014, "epoch": 2338} {"train_loss": -40.162105560302734, "global_step": 283015, "epoch": 2338} {"train_loss": -40.1943473815918, "global_step": 283016, "epoch": 2338} {"train_loss": -41.861202239990234, "global_step": 283017, "epoch": 2338} {"train_loss": -41.76685153551338, "global_step": 283018, "epoch": 2338, "val_loss": 2642882.75} {"train_loss": -41.501304626464844, "global_step": 283019, "epoch": 2339} {"train_loss": -40.357906341552734, "global_step": 283020, "epoch": 2339} {"train_loss": -41.37202072143555, "global_step": 283021, "epoch": 2339} {"train_loss": -37.68389892578125, "global_step": 283022, "epoch": 2339} {"train_loss": -39.2833137512207, "global_step": 283023, "epoch": 2339} {"train_loss": -38.875728607177734, "global_step": 283024, "epoch": 2339} {"train_loss": -39.296051025390625, "global_step": 283025, "epoch": 2339} {"train_loss": -38.559635162353516, "global_step": 283026, "epoch": 2339} {"train_loss": -40.19585037231445, "global_step": 283027, "epoch": 2339} {"train_loss": -36.41953659057617, "global_step": 283028, "epoch": 2339} {"train_loss": -41.74905014038086, "global_step": 283029, "epoch": 2339} {"train_loss": -37.15386962890625, "global_step": 283030, "epoch": 2339} {"train_loss": -40.71936798095703, "global_step": 283031, "epoch": 2339} {"train_loss": -37.557674407958984, "global_step": 283032, "epoch": 2339} {"train_loss": -40.851287841796875, "global_step": 283033, "epoch": 2339} {"train_loss": -36.73756408691406, "global_step": 283034, "epoch": 2339} {"train_loss": -40.128211975097656, "global_step": 283035, "epoch": 2339} {"train_loss": -39.91303253173828, "global_step": 283036, "epoch": 2339} {"train_loss": -38.24343490600586, "global_step": 283037, "epoch": 2339} {"train_loss": -41.556739807128906, "global_step": 283038, "epoch": 2339} {"train_loss": -39.18720626831055, "global_step": 283039, "epoch": 2339} {"train_loss": -41.77883529663086, "global_step": 283040, "epoch": 2339} {"train_loss": -40.11062240600586, "global_step": 283041, "epoch": 2339} {"train_loss": -41.8769645690918, "global_step": 283042, "epoch": 2339} {"train_loss": -39.914302825927734, "global_step": 283043, "epoch": 2339} {"train_loss": -41.6408805847168, "global_step": 283044, "epoch": 2339} {"train_loss": -40.43245315551758, "global_step": 283045, "epoch": 2339} {"train_loss": -42.27523422241211, "global_step": 283046, "epoch": 2339} {"train_loss": -39.47241973876953, "global_step": 283047, "epoch": 2339} {"train_loss": -42.11674118041992, "global_step": 283048, "epoch": 2339} {"train_loss": -40.679283142089844, "global_step": 283049, "epoch": 2339} {"train_loss": -42.15519332885742, "global_step": 283050, "epoch": 2339} {"train_loss": -41.54594802856445, "global_step": 283051, "epoch": 2339} {"train_loss": -42.016746520996094, "global_step": 283052, "epoch": 2339} {"train_loss": -41.95271301269531, "global_step": 283053, "epoch": 2339} {"train_loss": -41.964195251464844, "global_step": 283054, "epoch": 2339} {"train_loss": -41.81351852416992, "global_step": 283055, "epoch": 2339} {"train_loss": -42.61936569213867, "global_step": 283056, "epoch": 2339} {"train_loss": -42.02054214477539, "global_step": 283057, "epoch": 2339} {"train_loss": -42.51192092895508, "global_step": 283058, "epoch": 2339} {"train_loss": -42.914703369140625, "global_step": 283059, "epoch": 2339} {"train_loss": -42.87617492675781, "global_step": 283060, "epoch": 2339} {"train_loss": -42.54636764526367, "global_step": 283061, "epoch": 2339} {"train_loss": -42.290836334228516, "global_step": 283062, "epoch": 2339} {"train_loss": -43.531002044677734, "global_step": 283063, "epoch": 2339} {"train_loss": -42.778743743896484, "global_step": 283064, "epoch": 2339} {"train_loss": -43.47292709350586, "global_step": 283065, "epoch": 2339} {"train_loss": -43.30671310424805, "global_step": 283066, "epoch": 2339} {"train_loss": -42.62098693847656, "global_step": 283067, "epoch": 2339} {"train_loss": -43.26420593261719, "global_step": 283068, "epoch": 2339} {"train_loss": -43.184139251708984, "global_step": 283069, "epoch": 2339} {"train_loss": -43.7783317565918, "global_step": 283070, "epoch": 2339} {"train_loss": -43.45209884643555, "global_step": 283071, "epoch": 2339} {"train_loss": -43.80259323120117, "global_step": 283072, "epoch": 2339} {"train_loss": -43.54976272583008, "global_step": 283073, "epoch": 2339} {"train_loss": -43.53400802612305, "global_step": 283074, "epoch": 2339} {"train_loss": -43.344600677490234, "global_step": 283075, "epoch": 2339} {"train_loss": -43.627960205078125, "global_step": 283076, "epoch": 2339} {"train_loss": -43.34357833862305, "global_step": 283077, "epoch": 2339} {"train_loss": -43.8654670715332, "global_step": 283078, "epoch": 2339} {"train_loss": -43.65210723876953, "global_step": 283079, "epoch": 2339} {"train_loss": -43.85842514038086, "global_step": 283080, "epoch": 2339} {"train_loss": -43.908260345458984, "global_step": 283081, "epoch": 2339} {"train_loss": -43.56134796142578, "global_step": 283082, "epoch": 2339} {"train_loss": -44.076148986816406, "global_step": 283083, "epoch": 2339} {"train_loss": -44.11168670654297, "global_step": 283084, "epoch": 2339} {"train_loss": -43.8426513671875, "global_step": 283085, "epoch": 2339} {"train_loss": -44.12184524536133, "global_step": 283086, "epoch": 2339} {"train_loss": -44.05909729003906, "global_step": 283087, "epoch": 2339} {"train_loss": -44.28852462768555, "global_step": 283088, "epoch": 2339} {"train_loss": -43.98002243041992, "global_step": 283089, "epoch": 2339} {"train_loss": -44.177181243896484, "global_step": 283090, "epoch": 2339} {"train_loss": -43.987911224365234, "global_step": 283091, "epoch": 2339} {"train_loss": -44.16384506225586, "global_step": 283092, "epoch": 2339} {"train_loss": -43.83870315551758, "global_step": 283093, "epoch": 2339} {"train_loss": -43.5898551940918, "global_step": 283094, "epoch": 2339} {"train_loss": -44.506134033203125, "global_step": 283095, "epoch": 2339} {"train_loss": -44.02056121826172, "global_step": 283096, "epoch": 2339} {"train_loss": -44.6856803894043, "global_step": 283097, "epoch": 2339} {"train_loss": -44.19184112548828, "global_step": 283098, "epoch": 2339} {"train_loss": -44.69884490966797, "global_step": 283099, "epoch": 2339} {"train_loss": -43.688358306884766, "global_step": 283100, "epoch": 2339} {"train_loss": -43.68461990356445, "global_step": 283101, "epoch": 2339} {"train_loss": -44.29708480834961, "global_step": 283102, "epoch": 2339} {"train_loss": -44.18666458129883, "global_step": 283103, "epoch": 2339} {"train_loss": -44.26936721801758, "global_step": 283104, "epoch": 2339} {"train_loss": -42.99076843261719, "global_step": 283105, "epoch": 2339} {"train_loss": -42.82881546020508, "global_step": 283106, "epoch": 2339} {"train_loss": -42.090972900390625, "global_step": 283107, "epoch": 2339} {"train_loss": -41.31477737426758, "global_step": 283108, "epoch": 2339} {"train_loss": -42.84450149536133, "global_step": 283109, "epoch": 2339} {"train_loss": -44.14308547973633, "global_step": 283110, "epoch": 2339} {"train_loss": -42.601131439208984, "global_step": 283111, "epoch": 2339} {"train_loss": -42.45878601074219, "global_step": 283112, "epoch": 2339} {"train_loss": -43.074554443359375, "global_step": 283113, "epoch": 2339} {"train_loss": -43.75617599487305, "global_step": 283114, "epoch": 2339} {"train_loss": -43.89604949951172, "global_step": 283115, "epoch": 2339} {"train_loss": -43.317386627197266, "global_step": 283116, "epoch": 2339} {"train_loss": -42.52268981933594, "global_step": 283117, "epoch": 2339} {"train_loss": -42.816341400146484, "global_step": 283118, "epoch": 2339} {"train_loss": -43.20980453491211, "global_step": 283119, "epoch": 2339} {"train_loss": -44.0490837097168, "global_step": 283120, "epoch": 2339} {"train_loss": -43.7907829284668, "global_step": 283121, "epoch": 2339} {"train_loss": -43.89706039428711, "global_step": 283122, "epoch": 2339} {"train_loss": -43.87838363647461, "global_step": 283123, "epoch": 2339} {"train_loss": -43.64901351928711, "global_step": 283124, "epoch": 2339} {"train_loss": -43.926414489746094, "global_step": 283125, "epoch": 2339} {"train_loss": -43.083187103271484, "global_step": 283126, "epoch": 2339} {"train_loss": -42.9803466796875, "global_step": 283127, "epoch": 2339} {"train_loss": -44.23716735839844, "global_step": 283128, "epoch": 2339} {"train_loss": -43.8538703918457, "global_step": 283129, "epoch": 2339} {"train_loss": -43.16688537597656, "global_step": 283130, "epoch": 2339} {"train_loss": -42.97706985473633, "global_step": 283131, "epoch": 2339} {"train_loss": -42.43365478515625, "global_step": 283132, "epoch": 2339} {"train_loss": -43.1544303894043, "global_step": 283133, "epoch": 2339} {"train_loss": -44.176849365234375, "global_step": 283134, "epoch": 2339} {"train_loss": -44.153778076171875, "global_step": 283135, "epoch": 2339} {"train_loss": -43.809871673583984, "global_step": 283136, "epoch": 2339} {"train_loss": -44.28108215332031, "global_step": 283137, "epoch": 2339} {"train_loss": -44.08460235595703, "global_step": 283138, "epoch": 2339} {"train_loss": -42.51711881653336, "global_step": 283139, "epoch": 2339, "val_loss": 2550824.75} {"train_loss": -44.46307373046875, "global_step": 283140, "epoch": 2340} {"train_loss": -44.6104850769043, "global_step": 283141, "epoch": 2340} {"train_loss": -44.4786376953125, "global_step": 283142, "epoch": 2340} {"train_loss": -44.34607696533203, "global_step": 283143, "epoch": 2340} {"train_loss": -44.113746643066406, "global_step": 283144, "epoch": 2340} {"train_loss": -44.05927276611328, "global_step": 283145, "epoch": 2340} {"train_loss": -44.83706283569336, "global_step": 283146, "epoch": 2340} {"train_loss": -43.70768356323242, "global_step": 283147, "epoch": 2340} {"train_loss": -44.556453704833984, "global_step": 283148, "epoch": 2340} {"train_loss": -44.401363372802734, "global_step": 283149, "epoch": 2340} {"train_loss": -44.70881271362305, "global_step": 283150, "epoch": 2340} {"train_loss": -44.3289794921875, "global_step": 283151, "epoch": 2340} {"train_loss": -44.0250358581543, "global_step": 283152, "epoch": 2340} {"train_loss": -44.2529411315918, "global_step": 283153, "epoch": 2340} {"train_loss": -44.296810150146484, "global_step": 283154, "epoch": 2340} {"train_loss": -43.884830474853516, "global_step": 283155, "epoch": 2340} {"train_loss": -43.962764739990234, "global_step": 283156, "epoch": 2340} {"train_loss": -43.85844039916992, "global_step": 283157, "epoch": 2340} {"train_loss": -43.05772018432617, "global_step": 283158, "epoch": 2340} {"train_loss": -43.819271087646484, "global_step": 283159, "epoch": 2340} {"train_loss": -44.485748291015625, "global_step": 283160, "epoch": 2340} {"train_loss": -44.43054962158203, "global_step": 283161, "epoch": 2340} {"train_loss": -44.072261810302734, "global_step": 283162, "epoch": 2340} {"train_loss": -44.133968353271484, "global_step": 283163, "epoch": 2340} {"train_loss": -43.42243194580078, "global_step": 283164, "epoch": 2340} {"train_loss": -42.987422943115234, "global_step": 283165, "epoch": 2340} {"train_loss": -42.94248580932617, "global_step": 283166, "epoch": 2340} {"train_loss": -43.5432243347168, "global_step": 283167, "epoch": 2340} {"train_loss": -43.445037841796875, "global_step": 283168, "epoch": 2340} {"train_loss": -43.5279426574707, "global_step": 283169, "epoch": 2340} {"train_loss": -42.525760650634766, "global_step": 283170, "epoch": 2340} {"train_loss": -41.83223342895508, "global_step": 283171, "epoch": 2340} {"train_loss": -42.43946075439453, "global_step": 283172, "epoch": 2340} {"train_loss": -41.82713317871094, "global_step": 283173, "epoch": 2340} {"train_loss": -38.435142517089844, "global_step": 283174, "epoch": 2340} {"train_loss": -39.91164016723633, "global_step": 283175, "epoch": 2340} {"train_loss": -40.88481521606445, "global_step": 283176, "epoch": 2340} {"train_loss": -41.150909423828125, "global_step": 283177, "epoch": 2340} {"train_loss": -40.60350036621094, "global_step": 283178, "epoch": 2340} {"train_loss": -41.793853759765625, "global_step": 283179, "epoch": 2340} {"train_loss": -41.94904327392578, "global_step": 283180, "epoch": 2340} {"train_loss": -40.14015197753906, "global_step": 283181, "epoch": 2340} {"train_loss": -41.75889205932617, "global_step": 283182, "epoch": 2340} {"train_loss": -40.64624786376953, "global_step": 283183, "epoch": 2340} {"train_loss": -40.3381462097168, "global_step": 283184, "epoch": 2340} {"train_loss": -43.016334533691406, "global_step": 283185, "epoch": 2340} {"train_loss": -41.15950393676758, "global_step": 283186, "epoch": 2340} {"train_loss": -41.95278549194336, "global_step": 283187, "epoch": 2340} {"train_loss": -41.35586929321289, "global_step": 283188, "epoch": 2340} {"train_loss": -41.877105712890625, "global_step": 283189, "epoch": 2340} {"train_loss": -43.07597732543945, "global_step": 283190, "epoch": 2340} {"train_loss": -41.18091583251953, "global_step": 283191, "epoch": 2340} {"train_loss": -41.81904983520508, "global_step": 283192, "epoch": 2340} {"train_loss": -42.253936767578125, "global_step": 283193, "epoch": 2340} {"train_loss": -42.76579666137695, "global_step": 283194, "epoch": 2340} {"train_loss": -42.418853759765625, "global_step": 283195, "epoch": 2340} {"train_loss": -42.42607498168945, "global_step": 283196, "epoch": 2340} {"train_loss": -42.61968994140625, "global_step": 283197, "epoch": 2340} {"train_loss": -43.53902816772461, "global_step": 283198, "epoch": 2340} {"train_loss": -42.679176330566406, "global_step": 283199, "epoch": 2340} {"train_loss": -42.85935592651367, "global_step": 283200, "epoch": 2340} {"train_loss": -43.01849365234375, "global_step": 283201, "epoch": 2340} {"train_loss": -42.39368438720703, "global_step": 283202, "epoch": 2340} {"train_loss": -43.353668212890625, "global_step": 283203, "epoch": 2340} {"train_loss": -42.97944259643555, "global_step": 283204, "epoch": 2340} {"train_loss": -42.62611389160156, "global_step": 283205, "epoch": 2340} {"train_loss": -42.96818923950195, "global_step": 283206, "epoch": 2340} {"train_loss": -43.5058708190918, "global_step": 283207, "epoch": 2340} {"train_loss": -42.93882369995117, "global_step": 283208, "epoch": 2340} {"train_loss": -43.2269287109375, "global_step": 283209, "epoch": 2340} {"train_loss": -43.38505172729492, "global_step": 283210, "epoch": 2340} {"train_loss": -42.3536262512207, "global_step": 283211, "epoch": 2340} {"train_loss": -43.74858474731445, "global_step": 283212, "epoch": 2340} {"train_loss": -42.76872253417969, "global_step": 283213, "epoch": 2340} {"train_loss": -42.726585388183594, "global_step": 283214, "epoch": 2340} {"train_loss": -43.0372428894043, "global_step": 283215, "epoch": 2340} {"train_loss": -42.367889404296875, "global_step": 283216, "epoch": 2340} {"train_loss": -41.33260726928711, "global_step": 283217, "epoch": 2340} {"train_loss": -42.939849853515625, "global_step": 283218, "epoch": 2340} {"train_loss": -42.1771125793457, "global_step": 283219, "epoch": 2340} {"train_loss": -42.53553771972656, "global_step": 283220, "epoch": 2340} {"train_loss": -43.21335983276367, "global_step": 283221, "epoch": 2340} {"train_loss": -43.14844512939453, "global_step": 283222, "epoch": 2340} {"train_loss": -42.827117919921875, "global_step": 283223, "epoch": 2340} {"train_loss": -43.36122512817383, "global_step": 283224, "epoch": 2340} {"train_loss": -42.44005584716797, "global_step": 283225, "epoch": 2340} {"train_loss": -43.727752685546875, "global_step": 283226, "epoch": 2340} {"train_loss": -43.438392639160156, "global_step": 283227, "epoch": 2340} {"train_loss": -43.18099594116211, "global_step": 283228, "epoch": 2340} {"train_loss": -43.150142669677734, "global_step": 283229, "epoch": 2340} {"train_loss": -43.5126953125, "global_step": 283230, "epoch": 2340} {"train_loss": -43.44731521606445, "global_step": 283231, "epoch": 2340} {"train_loss": -42.57551193237305, "global_step": 283232, "epoch": 2340} {"train_loss": -43.14229965209961, "global_step": 283233, "epoch": 2340} {"train_loss": -44.31241226196289, "global_step": 283234, "epoch": 2340} {"train_loss": -42.690486907958984, "global_step": 283235, "epoch": 2340} {"train_loss": -43.338069915771484, "global_step": 283236, "epoch": 2340} {"train_loss": -44.174049377441406, "global_step": 283237, "epoch": 2340} {"train_loss": -43.59251022338867, "global_step": 283238, "epoch": 2340} {"train_loss": -44.01762008666992, "global_step": 283239, "epoch": 2340} {"train_loss": -44.37984848022461, "global_step": 283240, "epoch": 2340} {"train_loss": -43.69975662231445, "global_step": 283241, "epoch": 2340} {"train_loss": -44.02848434448242, "global_step": 283242, "epoch": 2340} {"train_loss": -43.833560943603516, "global_step": 283243, "epoch": 2340} {"train_loss": -44.25526809692383, "global_step": 283244, "epoch": 2340} {"train_loss": -44.273616790771484, "global_step": 283245, "epoch": 2340} {"train_loss": -44.20864486694336, "global_step": 283246, "epoch": 2340} {"train_loss": -44.26829528808594, "global_step": 283247, "epoch": 2340} {"train_loss": -44.13930892944336, "global_step": 283248, "epoch": 2340} {"train_loss": -43.854061126708984, "global_step": 283249, "epoch": 2340} {"train_loss": -44.144744873046875, "global_step": 283250, "epoch": 2340} {"train_loss": -43.718482971191406, "global_step": 283251, "epoch": 2340} {"train_loss": -43.71869659423828, "global_step": 283252, "epoch": 2340} {"train_loss": -43.82963180541992, "global_step": 283253, "epoch": 2340} {"train_loss": -43.922698974609375, "global_step": 283254, "epoch": 2340} {"train_loss": -42.85121536254883, "global_step": 283255, "epoch": 2340} {"train_loss": -43.437957763671875, "global_step": 283256, "epoch": 2340} {"train_loss": -43.3932991027832, "global_step": 283257, "epoch": 2340} {"train_loss": -43.559051513671875, "global_step": 283258, "epoch": 2340} {"train_loss": -43.94735336303711, "global_step": 283259, "epoch": 2340} {"train_loss": -43.098489556430785, "global_step": 283260, "epoch": 2340, "val_loss": 2503660.25} {"train_loss": -44.064453125, "global_step": 283261, "epoch": 2341} {"train_loss": -43.310821533203125, "global_step": 283262, "epoch": 2341} {"train_loss": -43.91652297973633, "global_step": 283263, "epoch": 2341} {"train_loss": -43.65725326538086, "global_step": 283264, "epoch": 2341} {"train_loss": -43.60567855834961, "global_step": 283265, "epoch": 2341} {"train_loss": -44.063228607177734, "global_step": 283266, "epoch": 2341} {"train_loss": -43.06943130493164, "global_step": 283267, "epoch": 2341} {"train_loss": -43.55302047729492, "global_step": 283268, "epoch": 2341} {"train_loss": -43.3328971862793, "global_step": 283269, "epoch": 2341} {"train_loss": -43.57160568237305, "global_step": 283270, "epoch": 2341} {"train_loss": -44.08784103393555, "global_step": 283271, "epoch": 2341} {"train_loss": -43.808692932128906, "global_step": 283272, "epoch": 2341} {"train_loss": -43.74142074584961, "global_step": 283273, "epoch": 2341} {"train_loss": -44.4624137878418, "global_step": 283274, "epoch": 2341} {"train_loss": -42.922142028808594, "global_step": 283275, "epoch": 2341} {"train_loss": -43.823829650878906, "global_step": 283276, "epoch": 2341} {"train_loss": -44.1731071472168, "global_step": 283277, "epoch": 2341} {"train_loss": -43.09031295776367, "global_step": 283278, "epoch": 2341} {"train_loss": -43.47461700439453, "global_step": 283279, "epoch": 2341} {"train_loss": -43.05317687988281, "global_step": 283280, "epoch": 2341} {"train_loss": -42.93154525756836, "global_step": 283281, "epoch": 2341} {"train_loss": -43.559871673583984, "global_step": 283282, "epoch": 2341} {"train_loss": -41.14957809448242, "global_step": 283283, "epoch": 2341} {"train_loss": -43.32070541381836, "global_step": 283284, "epoch": 2341} {"train_loss": -42.9085578918457, "global_step": 283285, "epoch": 2341} {"train_loss": -41.13190460205078, "global_step": 283286, "epoch": 2341} {"train_loss": -41.1093635559082, "global_step": 283287, "epoch": 2341} {"train_loss": -43.542903900146484, "global_step": 283288, "epoch": 2341} {"train_loss": -43.098602294921875, "global_step": 283289, "epoch": 2341} {"train_loss": -41.42341232299805, "global_step": 283290, "epoch": 2341} {"train_loss": -42.618465423583984, "global_step": 283291, "epoch": 2341} {"train_loss": -43.067134857177734, "global_step": 283292, "epoch": 2341} {"train_loss": -41.396629333496094, "global_step": 283293, "epoch": 2341} {"train_loss": -41.3964729309082, "global_step": 283294, "epoch": 2341} {"train_loss": -42.325923919677734, "global_step": 283295, "epoch": 2341} {"train_loss": -42.26567840576172, "global_step": 283296, "epoch": 2341} {"train_loss": -41.965423583984375, "global_step": 283297, "epoch": 2341} {"train_loss": -43.84000778198242, "global_step": 283298, "epoch": 2341} {"train_loss": -42.742645263671875, "global_step": 283299, "epoch": 2341} {"train_loss": -41.7987174987793, "global_step": 283300, "epoch": 2341} {"train_loss": -43.98490524291992, "global_step": 283301, "epoch": 2341} {"train_loss": -42.19337844848633, "global_step": 283302, "epoch": 2341} {"train_loss": -41.0338020324707, "global_step": 283303, "epoch": 2341} {"train_loss": -43.07476806640625, "global_step": 283304, "epoch": 2341} {"train_loss": -43.06464385986328, "global_step": 283305, "epoch": 2341} {"train_loss": -42.39290237426758, "global_step": 283306, "epoch": 2341} {"train_loss": -43.94409942626953, "global_step": 283307, "epoch": 2341} {"train_loss": -42.04399108886719, "global_step": 283308, "epoch": 2341} {"train_loss": -43.10185623168945, "global_step": 283309, "epoch": 2341} {"train_loss": -43.478878021240234, "global_step": 283310, "epoch": 2341} {"train_loss": -42.808067321777344, "global_step": 283311, "epoch": 2341} {"train_loss": -42.84113311767578, "global_step": 283312, "epoch": 2341} {"train_loss": -42.976871490478516, "global_step": 283313, "epoch": 2341} {"train_loss": -42.87398910522461, "global_step": 283314, "epoch": 2341} {"train_loss": -42.419410705566406, "global_step": 283315, "epoch": 2341} {"train_loss": -43.57125473022461, "global_step": 283316, "epoch": 2341} {"train_loss": -42.541908264160156, "global_step": 283317, "epoch": 2341} {"train_loss": -42.773433685302734, "global_step": 283318, "epoch": 2341} {"train_loss": -43.32285690307617, "global_step": 283319, "epoch": 2341} {"train_loss": -43.357330322265625, "global_step": 283320, "epoch": 2341} {"train_loss": -43.1203727722168, "global_step": 283321, "epoch": 2341} {"train_loss": -43.29439926147461, "global_step": 283322, "epoch": 2341} {"train_loss": -44.15403747558594, "global_step": 283323, "epoch": 2341} {"train_loss": -42.644771575927734, "global_step": 283324, "epoch": 2341} {"train_loss": -43.34088897705078, "global_step": 283325, "epoch": 2341} {"train_loss": -43.187557220458984, "global_step": 283326, "epoch": 2341} {"train_loss": -44.05185317993164, "global_step": 283327, "epoch": 2341} {"train_loss": -43.628082275390625, "global_step": 283328, "epoch": 2341} {"train_loss": -43.75938415527344, "global_step": 283329, "epoch": 2341} {"train_loss": -43.900970458984375, "global_step": 283330, "epoch": 2341} {"train_loss": -43.710784912109375, "global_step": 283331, "epoch": 2341} {"train_loss": -42.7392463684082, "global_step": 283332, "epoch": 2341} {"train_loss": -44.11948776245117, "global_step": 283333, "epoch": 2341} {"train_loss": -42.15717697143555, "global_step": 283334, "epoch": 2341} {"train_loss": -41.66773223876953, "global_step": 283335, "epoch": 2341} {"train_loss": -43.28377914428711, "global_step": 283336, "epoch": 2341} {"train_loss": -42.131614685058594, "global_step": 283337, "epoch": 2341} {"train_loss": -42.55989456176758, "global_step": 283338, "epoch": 2341} {"train_loss": -43.2532844543457, "global_step": 283339, "epoch": 2341} {"train_loss": -42.963134765625, "global_step": 283340, "epoch": 2341} {"train_loss": -42.42708969116211, "global_step": 283341, "epoch": 2341} {"train_loss": -43.079566955566406, "global_step": 283342, "epoch": 2341} {"train_loss": -41.81582260131836, "global_step": 283343, "epoch": 2341} {"train_loss": -42.144073486328125, "global_step": 283344, "epoch": 2341} {"train_loss": -42.712074279785156, "global_step": 283345, "epoch": 2341} {"train_loss": -43.32324981689453, "global_step": 283346, "epoch": 2341} {"train_loss": -42.44240951538086, "global_step": 283347, "epoch": 2341} {"train_loss": -43.189064025878906, "global_step": 283348, "epoch": 2341} {"train_loss": -43.7645263671875, "global_step": 283349, "epoch": 2341} {"train_loss": -43.76958084106445, "global_step": 283350, "epoch": 2341} {"train_loss": -42.97342300415039, "global_step": 283351, "epoch": 2341} {"train_loss": -43.6429557800293, "global_step": 283352, "epoch": 2341} {"train_loss": -43.150482177734375, "global_step": 283353, "epoch": 2341} {"train_loss": -42.7745246887207, "global_step": 283354, "epoch": 2341} {"train_loss": -43.60211944580078, "global_step": 283355, "epoch": 2341} {"train_loss": -42.75370788574219, "global_step": 283356, "epoch": 2341} {"train_loss": -44.26863479614258, "global_step": 283357, "epoch": 2341} {"train_loss": -43.77705001831055, "global_step": 283358, "epoch": 2341} {"train_loss": -43.2668571472168, "global_step": 283359, "epoch": 2341} {"train_loss": -44.322200775146484, "global_step": 283360, "epoch": 2341} {"train_loss": -43.9355583190918, "global_step": 283361, "epoch": 2341} {"train_loss": -43.60466384887695, "global_step": 283362, "epoch": 2341} {"train_loss": -43.63021469116211, "global_step": 283363, "epoch": 2341} {"train_loss": -44.02717208862305, "global_step": 283364, "epoch": 2341} {"train_loss": -43.2611198425293, "global_step": 283365, "epoch": 2341} {"train_loss": -44.16926193237305, "global_step": 283366, "epoch": 2341} {"train_loss": -43.201778411865234, "global_step": 283367, "epoch": 2341} {"train_loss": -43.51130294799805, "global_step": 283368, "epoch": 2341} {"train_loss": -43.494136810302734, "global_step": 283369, "epoch": 2341} {"train_loss": -42.92694854736328, "global_step": 283370, "epoch": 2341} {"train_loss": -43.30464553833008, "global_step": 283371, "epoch": 2341} {"train_loss": -42.75472640991211, "global_step": 283372, "epoch": 2341} {"train_loss": -43.11717224121094, "global_step": 283373, "epoch": 2341} {"train_loss": -43.189212799072266, "global_step": 283374, "epoch": 2341} {"train_loss": -42.89963150024414, "global_step": 283375, "epoch": 2341} {"train_loss": -43.211429595947266, "global_step": 283376, "epoch": 2341} {"train_loss": -42.98804473876953, "global_step": 283377, "epoch": 2341} {"train_loss": -43.099884033203125, "global_step": 283378, "epoch": 2341} {"train_loss": -43.903499603271484, "global_step": 283379, "epoch": 2341} {"train_loss": -42.722503662109375, "global_step": 283380, "epoch": 2341} {"train_loss": -43.104622233997695, "global_step": 283381, "epoch": 2341, "val_loss": 2451606.75} {"train_loss": -44.11517333984375, "global_step": 283382, "epoch": 2342} {"train_loss": -42.44425964355469, "global_step": 283383, "epoch": 2342} {"train_loss": -43.738277435302734, "global_step": 283384, "epoch": 2342} {"train_loss": -43.071205139160156, "global_step": 283385, "epoch": 2342} {"train_loss": -43.287635803222656, "global_step": 283386, "epoch": 2342} {"train_loss": -43.346988677978516, "global_step": 283387, "epoch": 2342} {"train_loss": -43.08969497680664, "global_step": 283388, "epoch": 2342} {"train_loss": -43.79328536987305, "global_step": 283389, "epoch": 2342} {"train_loss": -44.1405143737793, "global_step": 283390, "epoch": 2342} {"train_loss": -40.28870391845703, "global_step": 283391, "epoch": 2342} {"train_loss": -43.872344970703125, "global_step": 283392, "epoch": 2342} {"train_loss": -43.44429016113281, "global_step": 283393, "epoch": 2342} {"train_loss": -42.54270553588867, "global_step": 283394, "epoch": 2342} {"train_loss": -44.056007385253906, "global_step": 283395, "epoch": 2342} {"train_loss": -43.28443145751953, "global_step": 283396, "epoch": 2342} {"train_loss": -43.77116012573242, "global_step": 283397, "epoch": 2342} {"train_loss": -44.039424896240234, "global_step": 283398, "epoch": 2342} {"train_loss": -42.06486129760742, "global_step": 283399, "epoch": 2342} {"train_loss": -43.62845993041992, "global_step": 283400, "epoch": 2342} {"train_loss": -42.85980987548828, "global_step": 283401, "epoch": 2342} {"train_loss": -43.789093017578125, "global_step": 283402, "epoch": 2342} {"train_loss": -42.41555404663086, "global_step": 283403, "epoch": 2342} {"train_loss": -42.81334686279297, "global_step": 283404, "epoch": 2342} {"train_loss": -43.12109375, "global_step": 283405, "epoch": 2342} {"train_loss": -43.49860763549805, "global_step": 283406, "epoch": 2342} {"train_loss": -43.52875518798828, "global_step": 283407, "epoch": 2342} {"train_loss": -41.72457504272461, "global_step": 283408, "epoch": 2342} {"train_loss": -42.474266052246094, "global_step": 283409, "epoch": 2342} {"train_loss": -42.02850341796875, "global_step": 283410, "epoch": 2342} {"train_loss": -42.101951599121094, "global_step": 283411, "epoch": 2342} {"train_loss": -40.888587951660156, "global_step": 283412, "epoch": 2342} {"train_loss": -42.312931060791016, "global_step": 283413, "epoch": 2342} {"train_loss": -42.936248779296875, "global_step": 283414, "epoch": 2342} {"train_loss": -40.48161315917969, "global_step": 283415, "epoch": 2342} {"train_loss": -42.973976135253906, "global_step": 283416, "epoch": 2342} {"train_loss": -43.58696365356445, "global_step": 283417, "epoch": 2342} {"train_loss": -42.32371139526367, "global_step": 283418, "epoch": 2342} {"train_loss": -43.03811264038086, "global_step": 283419, "epoch": 2342} {"train_loss": -43.71791458129883, "global_step": 283420, "epoch": 2342} {"train_loss": -42.94932174682617, "global_step": 283421, "epoch": 2342} {"train_loss": -43.12356185913086, "global_step": 283422, "epoch": 2342} {"train_loss": -44.18709182739258, "global_step": 283423, "epoch": 2342} {"train_loss": -43.6467170715332, "global_step": 283424, "epoch": 2342} {"train_loss": -43.38816452026367, "global_step": 283425, "epoch": 2342} {"train_loss": -42.8370475769043, "global_step": 283426, "epoch": 2342} {"train_loss": -35.44152069091797, "global_step": 283427, "epoch": 2342} {"train_loss": -43.3503303527832, "global_step": 283428, "epoch": 2342} {"train_loss": -42.822994232177734, "global_step": 283429, "epoch": 2342} {"train_loss": -43.36955261230469, "global_step": 283430, "epoch": 2342} {"train_loss": -43.72895431518555, "global_step": 283431, "epoch": 2342} {"train_loss": -42.03387451171875, "global_step": 283432, "epoch": 2342} {"train_loss": -41.98974609375, "global_step": 283433, "epoch": 2342} {"train_loss": -42.288631439208984, "global_step": 283434, "epoch": 2342} {"train_loss": -43.43199157714844, "global_step": 283435, "epoch": 2342} {"train_loss": -42.42340850830078, "global_step": 283436, "epoch": 2342} {"train_loss": -42.967933654785156, "global_step": 283437, "epoch": 2342} {"train_loss": -42.82246017456055, "global_step": 283438, "epoch": 2342} {"train_loss": -42.89678955078125, "global_step": 283439, "epoch": 2342} {"train_loss": -43.77262496948242, "global_step": 283440, "epoch": 2342} {"train_loss": -43.05733108520508, "global_step": 283441, "epoch": 2342} {"train_loss": -42.8721809387207, "global_step": 283442, "epoch": 2342} {"train_loss": -43.29814910888672, "global_step": 283443, "epoch": 2342} {"train_loss": -42.51585006713867, "global_step": 283444, "epoch": 2342} {"train_loss": -43.923377990722656, "global_step": 283445, "epoch": 2342} {"train_loss": -43.558631896972656, "global_step": 283446, "epoch": 2342} {"train_loss": -42.155574798583984, "global_step": 283447, "epoch": 2342} {"train_loss": -42.61746597290039, "global_step": 283448, "epoch": 2342} {"train_loss": -37.72113800048828, "global_step": 283449, "epoch": 2342} {"train_loss": -41.586055755615234, "global_step": 283450, "epoch": 2342} {"train_loss": -42.09798049926758, "global_step": 283451, "epoch": 2342} {"train_loss": -41.1209831237793, "global_step": 283452, "epoch": 2342} {"train_loss": -41.04342269897461, "global_step": 283453, "epoch": 2342} {"train_loss": -40.73502731323242, "global_step": 283454, "epoch": 2342} {"train_loss": -41.19783401489258, "global_step": 283455, "epoch": 2342} {"train_loss": -38.58695983886719, "global_step": 283456, "epoch": 2342} {"train_loss": -38.935115814208984, "global_step": 283457, "epoch": 2342} {"train_loss": -41.39979934692383, "global_step": 283458, "epoch": 2342} {"train_loss": -39.720191955566406, "global_step": 283459, "epoch": 2342} {"train_loss": -40.774044036865234, "global_step": 283460, "epoch": 2342} {"train_loss": -40.754207611083984, "global_step": 283461, "epoch": 2342} {"train_loss": -41.83003616333008, "global_step": 283462, "epoch": 2342} {"train_loss": -40.61967086791992, "global_step": 283463, "epoch": 2342} {"train_loss": -38.1984977722168, "global_step": 283464, "epoch": 2342} {"train_loss": -41.3170051574707, "global_step": 283465, "epoch": 2342} {"train_loss": -39.969173431396484, "global_step": 283466, "epoch": 2342} {"train_loss": -40.08515548706055, "global_step": 283467, "epoch": 2342} {"train_loss": -41.0603141784668, "global_step": 283468, "epoch": 2342} {"train_loss": -40.00366973876953, "global_step": 283469, "epoch": 2342} {"train_loss": -38.0937614440918, "global_step": 283470, "epoch": 2342} {"train_loss": -39.68701171875, "global_step": 283471, "epoch": 2342} {"train_loss": -40.80168533325195, "global_step": 283472, "epoch": 2342} {"train_loss": -42.18926239013672, "global_step": 283473, "epoch": 2342} {"train_loss": -39.90980911254883, "global_step": 283474, "epoch": 2342} {"train_loss": -42.47900390625, "global_step": 283475, "epoch": 2342} {"train_loss": -41.087528228759766, "global_step": 283476, "epoch": 2342} {"train_loss": -41.76824951171875, "global_step": 283477, "epoch": 2342} {"train_loss": -41.6766242980957, "global_step": 283478, "epoch": 2342} {"train_loss": -40.37898635864258, "global_step": 283479, "epoch": 2342} {"train_loss": -37.67996597290039, "global_step": 283480, "epoch": 2342} {"train_loss": -41.0511589050293, "global_step": 283481, "epoch": 2342} {"train_loss": -41.013397216796875, "global_step": 283482, "epoch": 2342} {"train_loss": -41.042999267578125, "global_step": 283483, "epoch": 2342} {"train_loss": -42.538246154785156, "global_step": 283484, "epoch": 2342} {"train_loss": -41.892398834228516, "global_step": 283485, "epoch": 2342} {"train_loss": -41.739864349365234, "global_step": 283486, "epoch": 2342} {"train_loss": -41.89750671386719, "global_step": 283487, "epoch": 2342} {"train_loss": -42.26642990112305, "global_step": 283488, "epoch": 2342} {"train_loss": -41.330196380615234, "global_step": 283489, "epoch": 2342} {"train_loss": -41.70268630981445, "global_step": 283490, "epoch": 2342} {"train_loss": -42.3156623840332, "global_step": 283491, "epoch": 2342} {"train_loss": -42.734798431396484, "global_step": 283492, "epoch": 2342} {"train_loss": -42.2090950012207, "global_step": 283493, "epoch": 2342} {"train_loss": -41.913700103759766, "global_step": 283494, "epoch": 2342} {"train_loss": -42.239471435546875, "global_step": 283495, "epoch": 2342} {"train_loss": -42.402191162109375, "global_step": 283496, "epoch": 2342} {"train_loss": -41.96674728393555, "global_step": 283497, "epoch": 2342} {"train_loss": -43.26703643798828, "global_step": 283498, "epoch": 2342} {"train_loss": -43.212364196777344, "global_step": 283499, "epoch": 2342} {"train_loss": -42.595680236816406, "global_step": 283500, "epoch": 2342} {"train_loss": -42.4351692199707, "global_step": 283501, "epoch": 2342} {"train_loss": -42.09211853910084, "global_step": 283502, "epoch": 2342, "val_loss": 2536091.0} {"train_loss": -42.64426803588867, "global_step": 283503, "epoch": 2343} {"train_loss": -42.7001838684082, "global_step": 283504, "epoch": 2343} {"train_loss": -43.00551223754883, "global_step": 283505, "epoch": 2343} {"train_loss": -42.915653228759766, "global_step": 283506, "epoch": 2343} {"train_loss": -42.890174865722656, "global_step": 283507, "epoch": 2343} {"train_loss": -43.08012771606445, "global_step": 283508, "epoch": 2343} {"train_loss": -42.542640686035156, "global_step": 283509, "epoch": 2343} {"train_loss": -43.0449104309082, "global_step": 283510, "epoch": 2343} {"train_loss": -42.40427017211914, "global_step": 283511, "epoch": 2343} {"train_loss": -43.15272903442383, "global_step": 283512, "epoch": 2343} {"train_loss": -43.301998138427734, "global_step": 283513, "epoch": 2343} {"train_loss": -43.44488525390625, "global_step": 283514, "epoch": 2343} {"train_loss": -42.80946731567383, "global_step": 283515, "epoch": 2343} {"train_loss": -43.17455291748047, "global_step": 283516, "epoch": 2343} {"train_loss": -43.2875862121582, "global_step": 283517, "epoch": 2343} {"train_loss": -43.30773162841797, "global_step": 283518, "epoch": 2343} {"train_loss": -42.883399963378906, "global_step": 283519, "epoch": 2343} {"train_loss": -42.81319808959961, "global_step": 283520, "epoch": 2343} {"train_loss": -43.65665817260742, "global_step": 283521, "epoch": 2343} {"train_loss": -43.43006134033203, "global_step": 283522, "epoch": 2343} {"train_loss": -42.61806869506836, "global_step": 283523, "epoch": 2343} {"train_loss": -43.833011627197266, "global_step": 283524, "epoch": 2343} {"train_loss": -43.02753829956055, "global_step": 283525, "epoch": 2343} {"train_loss": -43.43209457397461, "global_step": 283526, "epoch": 2343} {"train_loss": -43.290218353271484, "global_step": 283527, "epoch": 2343} {"train_loss": -44.05991744995117, "global_step": 283528, "epoch": 2343} {"train_loss": -43.95001220703125, "global_step": 283529, "epoch": 2343} {"train_loss": -42.77079391479492, "global_step": 283530, "epoch": 2343} {"train_loss": -44.30548858642578, "global_step": 283531, "epoch": 2343} {"train_loss": -43.195491790771484, "global_step": 283532, "epoch": 2343} {"train_loss": -43.95359802246094, "global_step": 283533, "epoch": 2343} {"train_loss": -43.42995071411133, "global_step": 283534, "epoch": 2343} {"train_loss": -42.96854782104492, "global_step": 283535, "epoch": 2343} {"train_loss": -43.50203323364258, "global_step": 283536, "epoch": 2343} {"train_loss": -43.92593002319336, "global_step": 283537, "epoch": 2343} {"train_loss": -43.81459045410156, "global_step": 283538, "epoch": 2343} {"train_loss": -43.1011962890625, "global_step": 283539, "epoch": 2343} {"train_loss": -43.31557846069336, "global_step": 283540, "epoch": 2343} {"train_loss": -43.2027702331543, "global_step": 283541, "epoch": 2343} {"train_loss": -43.945884704589844, "global_step": 283542, "epoch": 2343} {"train_loss": -43.90250015258789, "global_step": 283543, "epoch": 2343} {"train_loss": -43.745155334472656, "global_step": 283544, "epoch": 2343} {"train_loss": -44.34553146362305, "global_step": 283545, "epoch": 2343} {"train_loss": -43.53489685058594, "global_step": 283546, "epoch": 2343} {"train_loss": -44.03972244262695, "global_step": 283547, "epoch": 2343} {"train_loss": -43.75383377075195, "global_step": 283548, "epoch": 2343} {"train_loss": -43.610660552978516, "global_step": 283549, "epoch": 2343} {"train_loss": -44.3857307434082, "global_step": 283550, "epoch": 2343} {"train_loss": -43.599361419677734, "global_step": 283551, "epoch": 2343} {"train_loss": -44.297515869140625, "global_step": 283552, "epoch": 2343} {"train_loss": -44.59660720825195, "global_step": 283553, "epoch": 2343} {"train_loss": -43.90760040283203, "global_step": 283554, "epoch": 2343} {"train_loss": -44.21390914916992, "global_step": 283555, "epoch": 2343} {"train_loss": -44.49043655395508, "global_step": 283556, "epoch": 2343} {"train_loss": -44.11285400390625, "global_step": 283557, "epoch": 2343} {"train_loss": -44.841651916503906, "global_step": 283558, "epoch": 2343} {"train_loss": -44.04309844970703, "global_step": 283559, "epoch": 2343} {"train_loss": -44.120399475097656, "global_step": 283560, "epoch": 2343} {"train_loss": -44.62543869018555, "global_step": 283561, "epoch": 2343} {"train_loss": -44.09990310668945, "global_step": 283562, "epoch": 2343} {"train_loss": -43.960384368896484, "global_step": 283563, "epoch": 2343} {"train_loss": -42.48417282104492, "global_step": 283564, "epoch": 2343} {"train_loss": -43.036659240722656, "global_step": 283565, "epoch": 2343} {"train_loss": -41.55415725708008, "global_step": 283566, "epoch": 2343} {"train_loss": -42.6617431640625, "global_step": 283567, "epoch": 2343} {"train_loss": -43.93161392211914, "global_step": 283568, "epoch": 2343} {"train_loss": -42.83492660522461, "global_step": 283569, "epoch": 2343} {"train_loss": -44.55659866333008, "global_step": 283570, "epoch": 2343} {"train_loss": -43.845550537109375, "global_step": 283571, "epoch": 2343} {"train_loss": -44.0323486328125, "global_step": 283572, "epoch": 2343} {"train_loss": -43.13169479370117, "global_step": 283573, "epoch": 2343} {"train_loss": -42.879032135009766, "global_step": 283574, "epoch": 2343} {"train_loss": -43.35262680053711, "global_step": 283575, "epoch": 2343} {"train_loss": -44.4825325012207, "global_step": 283576, "epoch": 2343} {"train_loss": -43.03657150268555, "global_step": 283577, "epoch": 2343} {"train_loss": -43.3380241394043, "global_step": 283578, "epoch": 2343} {"train_loss": -43.77674865722656, "global_step": 283579, "epoch": 2343} {"train_loss": -43.8375358581543, "global_step": 283580, "epoch": 2343} {"train_loss": -43.044464111328125, "global_step": 283581, "epoch": 2343} {"train_loss": -44.23859786987305, "global_step": 283582, "epoch": 2343} {"train_loss": -43.51321792602539, "global_step": 283583, "epoch": 2343} {"train_loss": -42.51902389526367, "global_step": 283584, "epoch": 2343} {"train_loss": -43.39884567260742, "global_step": 283585, "epoch": 2343} {"train_loss": -43.62685775756836, "global_step": 283586, "epoch": 2343} {"train_loss": -43.195404052734375, "global_step": 283587, "epoch": 2343} {"train_loss": -42.7354621887207, "global_step": 283588, "epoch": 2343} {"train_loss": -43.99940872192383, "global_step": 283589, "epoch": 2343} {"train_loss": -43.8475227355957, "global_step": 283590, "epoch": 2343} {"train_loss": -43.425086975097656, "global_step": 283591, "epoch": 2343} {"train_loss": -43.76939010620117, "global_step": 283592, "epoch": 2343} {"train_loss": -43.45521926879883, "global_step": 283593, "epoch": 2343} {"train_loss": -42.3049430847168, "global_step": 283594, "epoch": 2343} {"train_loss": -43.39370346069336, "global_step": 283595, "epoch": 2343} {"train_loss": -42.65995407104492, "global_step": 283596, "epoch": 2343} {"train_loss": -41.9287223815918, "global_step": 283597, "epoch": 2343} {"train_loss": -43.130882263183594, "global_step": 283598, "epoch": 2343} {"train_loss": -42.156982421875, "global_step": 283599, "epoch": 2343} {"train_loss": -40.95296859741211, "global_step": 283600, "epoch": 2343} {"train_loss": -41.11564636230469, "global_step": 283601, "epoch": 2343} {"train_loss": -43.26589584350586, "global_step": 283602, "epoch": 2343} {"train_loss": -42.94258499145508, "global_step": 283603, "epoch": 2343} {"train_loss": -39.593666076660156, "global_step": 283604, "epoch": 2343} {"train_loss": -42.27410888671875, "global_step": 283605, "epoch": 2343} {"train_loss": -35.04231643676758, "global_step": 283606, "epoch": 2343} {"train_loss": -30.6662654876709, "global_step": 283607, "epoch": 2343} {"train_loss": -38.52920913696289, "global_step": 283608, "epoch": 2343} {"train_loss": -37.23971176147461, "global_step": 283609, "epoch": 2343} {"train_loss": -37.97858810424805, "global_step": 283610, "epoch": 2343} {"train_loss": -40.371456146240234, "global_step": 283611, "epoch": 2343} {"train_loss": -34.8597526550293, "global_step": 283612, "epoch": 2343} {"train_loss": -41.10175704956055, "global_step": 283613, "epoch": 2343} {"train_loss": -38.1751594543457, "global_step": 283614, "epoch": 2343} {"train_loss": -40.070682525634766, "global_step": 283615, "epoch": 2343} {"train_loss": -39.6879997253418, "global_step": 283616, "epoch": 2343} {"train_loss": -40.126434326171875, "global_step": 283617, "epoch": 2343} {"train_loss": -41.16731643676758, "global_step": 283618, "epoch": 2343} {"train_loss": -41.09124755859375, "global_step": 283619, "epoch": 2343} {"train_loss": -41.5269889831543, "global_step": 283620, "epoch": 2343} {"train_loss": -42.01369857788086, "global_step": 283621, "epoch": 2343} {"train_loss": -42.209835052490234, "global_step": 283622, "epoch": 2343} {"train_loss": -42.71236585191459, "global_step": 283623, "epoch": 2343, "val_loss": 2434452.5} {"train_loss": -41.85758590698242, "global_step": 283624, "epoch": 2344} {"train_loss": -42.12165069580078, "global_step": 283625, "epoch": 2344} {"train_loss": -42.13955307006836, "global_step": 283626, "epoch": 2344} {"train_loss": -43.04261016845703, "global_step": 283627, "epoch": 2344} {"train_loss": -42.44544219970703, "global_step": 283628, "epoch": 2344} {"train_loss": -42.323307037353516, "global_step": 283629, "epoch": 2344} {"train_loss": -41.69497299194336, "global_step": 283630, "epoch": 2344} {"train_loss": -42.341400146484375, "global_step": 283631, "epoch": 2344} {"train_loss": -42.58209991455078, "global_step": 283632, "epoch": 2344} {"train_loss": -42.978214263916016, "global_step": 283633, "epoch": 2344} {"train_loss": -42.23093795776367, "global_step": 283634, "epoch": 2344} {"train_loss": -42.55998229980469, "global_step": 283635, "epoch": 2344} {"train_loss": -42.80636215209961, "global_step": 283636, "epoch": 2344} {"train_loss": -41.61737060546875, "global_step": 283637, "epoch": 2344} {"train_loss": -42.337867736816406, "global_step": 283638, "epoch": 2344} {"train_loss": -42.52280807495117, "global_step": 283639, "epoch": 2344} {"train_loss": -41.955440521240234, "global_step": 283640, "epoch": 2344} {"train_loss": -42.835113525390625, "global_step": 283641, "epoch": 2344} {"train_loss": -42.4466552734375, "global_step": 283642, "epoch": 2344} {"train_loss": -42.180423736572266, "global_step": 283643, "epoch": 2344} {"train_loss": -42.63616943359375, "global_step": 283644, "epoch": 2344} {"train_loss": -42.95603561401367, "global_step": 283645, "epoch": 2344} {"train_loss": -42.85889434814453, "global_step": 283646, "epoch": 2344} {"train_loss": -42.65763854980469, "global_step": 283647, "epoch": 2344} {"train_loss": -43.5723991394043, "global_step": 283648, "epoch": 2344} {"train_loss": -42.771690368652344, "global_step": 283649, "epoch": 2344} {"train_loss": -42.40311813354492, "global_step": 283650, "epoch": 2344} {"train_loss": -43.830928802490234, "global_step": 283651, "epoch": 2344} {"train_loss": -42.798133850097656, "global_step": 283652, "epoch": 2344} {"train_loss": -42.84188461303711, "global_step": 283653, "epoch": 2344} {"train_loss": -43.36927032470703, "global_step": 283654, "epoch": 2344} {"train_loss": -42.92210388183594, "global_step": 283655, "epoch": 2344} {"train_loss": -42.00234603881836, "global_step": 283656, "epoch": 2344} {"train_loss": -43.45893096923828, "global_step": 283657, "epoch": 2344} {"train_loss": -42.711181640625, "global_step": 283658, "epoch": 2344} {"train_loss": -42.154903411865234, "global_step": 283659, "epoch": 2344} {"train_loss": -43.29745864868164, "global_step": 283660, "epoch": 2344} {"train_loss": -43.443233489990234, "global_step": 283661, "epoch": 2344} {"train_loss": -42.95115280151367, "global_step": 283662, "epoch": 2344} {"train_loss": -43.6031494140625, "global_step": 283663, "epoch": 2344} {"train_loss": -43.11684799194336, "global_step": 283664, "epoch": 2344} {"train_loss": -43.6810417175293, "global_step": 283665, "epoch": 2344} {"train_loss": -44.015663146972656, "global_step": 283666, "epoch": 2344} {"train_loss": -44.088844299316406, "global_step": 283667, "epoch": 2344} {"train_loss": -43.89120101928711, "global_step": 283668, "epoch": 2344} {"train_loss": -44.16324996948242, "global_step": 283669, "epoch": 2344} {"train_loss": -43.89254379272461, "global_step": 283670, "epoch": 2344} {"train_loss": -43.871116638183594, "global_step": 283671, "epoch": 2344} {"train_loss": -44.4716911315918, "global_step": 283672, "epoch": 2344} {"train_loss": -43.47795104980469, "global_step": 283673, "epoch": 2344} {"train_loss": -43.91731643676758, "global_step": 283674, "epoch": 2344} {"train_loss": -43.70160675048828, "global_step": 283675, "epoch": 2344} {"train_loss": -43.91241455078125, "global_step": 283676, "epoch": 2344} {"train_loss": -44.1829948425293, "global_step": 283677, "epoch": 2344} {"train_loss": -44.3298454284668, "global_step": 283678, "epoch": 2344} {"train_loss": -44.35701370239258, "global_step": 283679, "epoch": 2344} {"train_loss": -43.984039306640625, "global_step": 283680, "epoch": 2344} {"train_loss": -43.99500274658203, "global_step": 283681, "epoch": 2344} {"train_loss": -43.78765106201172, "global_step": 283682, "epoch": 2344} {"train_loss": -43.74709701538086, "global_step": 283683, "epoch": 2344} {"train_loss": -44.229366302490234, "global_step": 283684, "epoch": 2344} {"train_loss": -43.62255859375, "global_step": 283685, "epoch": 2344} {"train_loss": -44.29499435424805, "global_step": 283686, "epoch": 2344} {"train_loss": -44.240657806396484, "global_step": 283687, "epoch": 2344} {"train_loss": -44.27543640136719, "global_step": 283688, "epoch": 2344} {"train_loss": -44.332366943359375, "global_step": 283689, "epoch": 2344} {"train_loss": -44.231319427490234, "global_step": 283690, "epoch": 2344} {"train_loss": -43.002193450927734, "global_step": 283691, "epoch": 2344} {"train_loss": -44.75938034057617, "global_step": 283692, "epoch": 2344} {"train_loss": -44.29645919799805, "global_step": 283693, "epoch": 2344} {"train_loss": -44.4628791809082, "global_step": 283694, "epoch": 2344} {"train_loss": -44.49296951293945, "global_step": 283695, "epoch": 2344} {"train_loss": -44.36322021484375, "global_step": 283696, "epoch": 2344} {"train_loss": -44.30842971801758, "global_step": 283697, "epoch": 2344} {"train_loss": -44.16761016845703, "global_step": 283698, "epoch": 2344} {"train_loss": -44.27265167236328, "global_step": 283699, "epoch": 2344} {"train_loss": -44.0281982421875, "global_step": 283700, "epoch": 2344} {"train_loss": -44.01081848144531, "global_step": 283701, "epoch": 2344} {"train_loss": -44.11719512939453, "global_step": 283702, "epoch": 2344} {"train_loss": -43.8896484375, "global_step": 283703, "epoch": 2344} {"train_loss": -44.5611572265625, "global_step": 283704, "epoch": 2344} {"train_loss": -44.33415222167969, "global_step": 283705, "epoch": 2344} {"train_loss": -44.899654388427734, "global_step": 283706, "epoch": 2344} {"train_loss": -44.243263244628906, "global_step": 283707, "epoch": 2344} {"train_loss": -44.49298858642578, "global_step": 283708, "epoch": 2344} {"train_loss": -44.150390625, "global_step": 283709, "epoch": 2344} {"train_loss": -44.21442794799805, "global_step": 283710, "epoch": 2344} {"train_loss": -41.29113006591797, "global_step": 283711, "epoch": 2344} {"train_loss": -38.312164306640625, "global_step": 283712, "epoch": 2344} {"train_loss": -39.1485481262207, "global_step": 283713, "epoch": 2344} {"train_loss": -39.612117767333984, "global_step": 283714, "epoch": 2344} {"train_loss": -41.87862777709961, "global_step": 283715, "epoch": 2344} {"train_loss": -42.596683502197266, "global_step": 283716, "epoch": 2344} {"train_loss": -42.52610397338867, "global_step": 283717, "epoch": 2344} {"train_loss": -40.9335823059082, "global_step": 283718, "epoch": 2344} {"train_loss": -42.91423416137695, "global_step": 283719, "epoch": 2344} {"train_loss": -41.80989456176758, "global_step": 283720, "epoch": 2344} {"train_loss": -43.29903030395508, "global_step": 283721, "epoch": 2344} {"train_loss": -41.09609603881836, "global_step": 283722, "epoch": 2344} {"train_loss": -42.19657897949219, "global_step": 283723, "epoch": 2344} {"train_loss": -42.775508880615234, "global_step": 283724, "epoch": 2344} {"train_loss": -42.47688293457031, "global_step": 283725, "epoch": 2344} {"train_loss": -41.66298294067383, "global_step": 283726, "epoch": 2344} {"train_loss": -38.96194839477539, "global_step": 283727, "epoch": 2344} {"train_loss": -42.471920013427734, "global_step": 283728, "epoch": 2344} {"train_loss": -41.79146957397461, "global_step": 283729, "epoch": 2344} {"train_loss": -41.39287185668945, "global_step": 283730, "epoch": 2344} {"train_loss": -40.35270309448242, "global_step": 283731, "epoch": 2344} {"train_loss": -42.2825927734375, "global_step": 283732, "epoch": 2344} {"train_loss": -41.532806396484375, "global_step": 283733, "epoch": 2344} {"train_loss": -42.1961784362793, "global_step": 283734, "epoch": 2344} {"train_loss": -42.5008544921875, "global_step": 283735, "epoch": 2344} {"train_loss": -41.04029083251953, "global_step": 283736, "epoch": 2344} {"train_loss": -43.45408248901367, "global_step": 283737, "epoch": 2344} {"train_loss": -42.62018585205078, "global_step": 283738, "epoch": 2344} {"train_loss": -41.822566986083984, "global_step": 283739, "epoch": 2344} {"train_loss": -41.872318267822266, "global_step": 283740, "epoch": 2344} {"train_loss": -42.26209259033203, "global_step": 283741, "epoch": 2344} {"train_loss": -41.95418167114258, "global_step": 283742, "epoch": 2344} {"train_loss": -42.67446517944336, "global_step": 283743, "epoch": 2344} {"train_loss": -42.961666012598464, "global_step": 283744, "epoch": 2344, "val_loss": 2480477.25} {"train_loss": -42.02009201049805, "global_step": 283745, "epoch": 2345} {"train_loss": -43.1334342956543, "global_step": 283746, "epoch": 2345} {"train_loss": -42.82898712158203, "global_step": 283747, "epoch": 2345} {"train_loss": -42.753326416015625, "global_step": 283748, "epoch": 2345} {"train_loss": -43.254085540771484, "global_step": 283749, "epoch": 2345} {"train_loss": -41.816322326660156, "global_step": 283750, "epoch": 2345} {"train_loss": -42.30292892456055, "global_step": 283751, "epoch": 2345} {"train_loss": -43.07612228393555, "global_step": 283752, "epoch": 2345} {"train_loss": -42.48623275756836, "global_step": 283753, "epoch": 2345} {"train_loss": -41.81043243408203, "global_step": 283754, "epoch": 2345} {"train_loss": -42.55298614501953, "global_step": 283755, "epoch": 2345} {"train_loss": -43.42959213256836, "global_step": 283756, "epoch": 2345} {"train_loss": -42.634742736816406, "global_step": 283757, "epoch": 2345} {"train_loss": -42.095802307128906, "global_step": 283758, "epoch": 2345} {"train_loss": -43.50889205932617, "global_step": 283759, "epoch": 2345} {"train_loss": -42.28717803955078, "global_step": 283760, "epoch": 2345} {"train_loss": -42.44381332397461, "global_step": 283761, "epoch": 2345} {"train_loss": -43.346805572509766, "global_step": 283762, "epoch": 2345} {"train_loss": -42.948158264160156, "global_step": 283763, "epoch": 2345} {"train_loss": -43.601627349853516, "global_step": 283764, "epoch": 2345} {"train_loss": -43.193050384521484, "global_step": 283765, "epoch": 2345} {"train_loss": -43.09467697143555, "global_step": 283766, "epoch": 2345} {"train_loss": -43.485321044921875, "global_step": 283767, "epoch": 2345} {"train_loss": -42.623573303222656, "global_step": 283768, "epoch": 2345} {"train_loss": -43.5062370300293, "global_step": 283769, "epoch": 2345} {"train_loss": -43.70705795288086, "global_step": 283770, "epoch": 2345} {"train_loss": -42.91117477416992, "global_step": 283771, "epoch": 2345} {"train_loss": -43.69941711425781, "global_step": 283772, "epoch": 2345} {"train_loss": -43.953243255615234, "global_step": 283773, "epoch": 2345} {"train_loss": -43.26314163208008, "global_step": 283774, "epoch": 2345} {"train_loss": -43.31307601928711, "global_step": 283775, "epoch": 2345} {"train_loss": -43.33442306518555, "global_step": 283776, "epoch": 2345} {"train_loss": -42.31538009643555, "global_step": 283777, "epoch": 2345} {"train_loss": -43.680721282958984, "global_step": 283778, "epoch": 2345} {"train_loss": -42.438594818115234, "global_step": 283779, "epoch": 2345} {"train_loss": -43.18003463745117, "global_step": 283780, "epoch": 2345} {"train_loss": -43.50634765625, "global_step": 283781, "epoch": 2345} {"train_loss": -42.234771728515625, "global_step": 283782, "epoch": 2345} {"train_loss": -43.82015609741211, "global_step": 283783, "epoch": 2345} {"train_loss": -41.4096794128418, "global_step": 283784, "epoch": 2345} {"train_loss": -43.17667770385742, "global_step": 283785, "epoch": 2345} {"train_loss": -43.37420654296875, "global_step": 283786, "epoch": 2345} {"train_loss": -42.872188568115234, "global_step": 283787, "epoch": 2345} {"train_loss": -43.1617317199707, "global_step": 283788, "epoch": 2345} {"train_loss": -43.47627639770508, "global_step": 283789, "epoch": 2345} {"train_loss": -43.682735443115234, "global_step": 283790, "epoch": 2345} {"train_loss": -43.12989044189453, "global_step": 283791, "epoch": 2345} {"train_loss": -43.588626861572266, "global_step": 283792, "epoch": 2345} {"train_loss": -43.46895980834961, "global_step": 283793, "epoch": 2345} {"train_loss": -43.6478385925293, "global_step": 283794, "epoch": 2345} {"train_loss": -43.697776794433594, "global_step": 283795, "epoch": 2345} {"train_loss": -43.01860427856445, "global_step": 283796, "epoch": 2345} {"train_loss": -43.709144592285156, "global_step": 283797, "epoch": 2345} {"train_loss": -43.098182678222656, "global_step": 283798, "epoch": 2345} {"train_loss": -43.69902801513672, "global_step": 283799, "epoch": 2345} {"train_loss": -44.26169967651367, "global_step": 283800, "epoch": 2345} {"train_loss": -42.7641716003418, "global_step": 283801, "epoch": 2345} {"train_loss": -43.2602424621582, "global_step": 283802, "epoch": 2345} {"train_loss": -43.33694076538086, "global_step": 283803, "epoch": 2345} {"train_loss": -43.867977142333984, "global_step": 283804, "epoch": 2345} {"train_loss": -43.212825775146484, "global_step": 283805, "epoch": 2345} {"train_loss": -42.58057403564453, "global_step": 283806, "epoch": 2345} {"train_loss": -42.68242645263672, "global_step": 283807, "epoch": 2345} {"train_loss": -42.9942512512207, "global_step": 283808, "epoch": 2345} {"train_loss": -43.37722396850586, "global_step": 283809, "epoch": 2345} {"train_loss": -43.88994216918945, "global_step": 283810, "epoch": 2345} {"train_loss": -42.84650421142578, "global_step": 283811, "epoch": 2345} {"train_loss": -41.99337387084961, "global_step": 283812, "epoch": 2345} {"train_loss": -43.41401672363281, "global_step": 283813, "epoch": 2345} {"train_loss": -42.20469284057617, "global_step": 283814, "epoch": 2345} {"train_loss": -43.75120544433594, "global_step": 283815, "epoch": 2345} {"train_loss": -43.1129035949707, "global_step": 283816, "epoch": 2345} {"train_loss": -42.9864387512207, "global_step": 283817, "epoch": 2345} {"train_loss": -43.35558319091797, "global_step": 283818, "epoch": 2345} {"train_loss": -42.87155532836914, "global_step": 283819, "epoch": 2345} {"train_loss": -43.550453186035156, "global_step": 283820, "epoch": 2345} {"train_loss": -43.456153869628906, "global_step": 283821, "epoch": 2345} {"train_loss": -42.92299270629883, "global_step": 283822, "epoch": 2345} {"train_loss": -43.66111373901367, "global_step": 283823, "epoch": 2345} {"train_loss": -42.197818756103516, "global_step": 283824, "epoch": 2345} {"train_loss": -41.52674102783203, "global_step": 283825, "epoch": 2345} {"train_loss": -41.172298431396484, "global_step": 283826, "epoch": 2345} {"train_loss": -42.5402946472168, "global_step": 283827, "epoch": 2345} {"train_loss": -42.77839279174805, "global_step": 283828, "epoch": 2345} {"train_loss": -42.42684555053711, "global_step": 283829, "epoch": 2345} {"train_loss": -43.05520248413086, "global_step": 283830, "epoch": 2345} {"train_loss": -42.68735885620117, "global_step": 283831, "epoch": 2345} {"train_loss": -42.30706787109375, "global_step": 283832, "epoch": 2345} {"train_loss": -43.24818801879883, "global_step": 283833, "epoch": 2345} {"train_loss": -42.87742233276367, "global_step": 283834, "epoch": 2345} {"train_loss": -42.93674850463867, "global_step": 283835, "epoch": 2345} {"train_loss": -42.747474670410156, "global_step": 283836, "epoch": 2345} {"train_loss": -40.93705368041992, "global_step": 283837, "epoch": 2345} {"train_loss": -42.25187301635742, "global_step": 283838, "epoch": 2345} {"train_loss": -41.12791061401367, "global_step": 283839, "epoch": 2345} {"train_loss": -40.244441986083984, "global_step": 283840, "epoch": 2345} {"train_loss": -42.098567962646484, "global_step": 283841, "epoch": 2345} {"train_loss": -41.495113372802734, "global_step": 283842, "epoch": 2345} {"train_loss": -40.744178771972656, "global_step": 283843, "epoch": 2345} {"train_loss": -42.04783248901367, "global_step": 283844, "epoch": 2345} {"train_loss": -42.19735336303711, "global_step": 283845, "epoch": 2345} {"train_loss": -40.511653900146484, "global_step": 283846, "epoch": 2345} {"train_loss": -42.432491302490234, "global_step": 283847, "epoch": 2345} {"train_loss": -40.15700912475586, "global_step": 283848, "epoch": 2345} {"train_loss": -41.65243148803711, "global_step": 283849, "epoch": 2345} {"train_loss": -42.80936813354492, "global_step": 283850, "epoch": 2345} {"train_loss": -40.77420425415039, "global_step": 283851, "epoch": 2345} {"train_loss": -43.18196487426758, "global_step": 283852, "epoch": 2345} {"train_loss": -40.95712661743164, "global_step": 283853, "epoch": 2345} {"train_loss": -42.89837646484375, "global_step": 283854, "epoch": 2345} {"train_loss": -42.76005172729492, "global_step": 283855, "epoch": 2345} {"train_loss": -42.14079666137695, "global_step": 283856, "epoch": 2345} {"train_loss": -42.59136962890625, "global_step": 283857, "epoch": 2345} {"train_loss": -42.09818649291992, "global_step": 283858, "epoch": 2345} {"train_loss": -43.53375244140625, "global_step": 283859, "epoch": 2345} {"train_loss": -42.54959487915039, "global_step": 283860, "epoch": 2345} {"train_loss": -43.38819122314453, "global_step": 283861, "epoch": 2345} {"train_loss": -42.618648529052734, "global_step": 283862, "epoch": 2345} {"train_loss": -43.052452087402344, "global_step": 283863, "epoch": 2345} {"train_loss": -42.956581115722656, "global_step": 283864, "epoch": 2345} {"train_loss": -42.7807305706434, "global_step": 283865, "epoch": 2345, "val_loss": 2480737.75} {"train_loss": -42.53644943237305, "global_step": 283866, "epoch": 2346} {"train_loss": -43.38527297973633, "global_step": 283867, "epoch": 2346} {"train_loss": -42.41585922241211, "global_step": 283868, "epoch": 2346} {"train_loss": -43.21779251098633, "global_step": 283869, "epoch": 2346} {"train_loss": -42.325477600097656, "global_step": 283870, "epoch": 2346} {"train_loss": -43.402225494384766, "global_step": 283871, "epoch": 2346} {"train_loss": -42.89020538330078, "global_step": 283872, "epoch": 2346} {"train_loss": -43.3409538269043, "global_step": 283873, "epoch": 2346} {"train_loss": -43.4787483215332, "global_step": 283874, "epoch": 2346} {"train_loss": -43.47341537475586, "global_step": 283875, "epoch": 2346} {"train_loss": -43.417171478271484, "global_step": 283876, "epoch": 2346} {"train_loss": -44.0323486328125, "global_step": 283877, "epoch": 2346} {"train_loss": -43.257015228271484, "global_step": 283878, "epoch": 2346} {"train_loss": -43.656646728515625, "global_step": 283879, "epoch": 2346} {"train_loss": -43.860965728759766, "global_step": 283880, "epoch": 2346} {"train_loss": -43.039241790771484, "global_step": 283881, "epoch": 2346} {"train_loss": -43.284095764160156, "global_step": 283882, "epoch": 2346} {"train_loss": -43.8661003112793, "global_step": 283883, "epoch": 2346} {"train_loss": -43.624263763427734, "global_step": 283884, "epoch": 2346} {"train_loss": -42.63747787475586, "global_step": 283885, "epoch": 2346} {"train_loss": -43.21163558959961, "global_step": 283886, "epoch": 2346} {"train_loss": -43.491024017333984, "global_step": 283887, "epoch": 2346} {"train_loss": -42.94154739379883, "global_step": 283888, "epoch": 2346} {"train_loss": -43.69903564453125, "global_step": 283889, "epoch": 2346} {"train_loss": -43.55431365966797, "global_step": 283890, "epoch": 2346} {"train_loss": -43.79650115966797, "global_step": 283891, "epoch": 2346} {"train_loss": -42.81258773803711, "global_step": 283892, "epoch": 2346} {"train_loss": -44.259090423583984, "global_step": 283893, "epoch": 2346} {"train_loss": -43.28915786743164, "global_step": 283894, "epoch": 2346} {"train_loss": -44.14754867553711, "global_step": 283895, "epoch": 2346} {"train_loss": -43.09812545776367, "global_step": 283896, "epoch": 2346} {"train_loss": -43.130001068115234, "global_step": 283897, "epoch": 2346} {"train_loss": -43.824493408203125, "global_step": 283898, "epoch": 2346} {"train_loss": -43.759029388427734, "global_step": 283899, "epoch": 2346} {"train_loss": -44.02544403076172, "global_step": 283900, "epoch": 2346} {"train_loss": -44.133445739746094, "global_step": 283901, "epoch": 2346} {"train_loss": -44.13911437988281, "global_step": 283902, "epoch": 2346} {"train_loss": -43.84148406982422, "global_step": 283903, "epoch": 2346} {"train_loss": -43.94785690307617, "global_step": 283904, "epoch": 2346} {"train_loss": -43.833919525146484, "global_step": 283905, "epoch": 2346} {"train_loss": -43.10467529296875, "global_step": 283906, "epoch": 2346} {"train_loss": -43.669830322265625, "global_step": 283907, "epoch": 2346} {"train_loss": -44.16160202026367, "global_step": 283908, "epoch": 2346} {"train_loss": -42.49616622924805, "global_step": 283909, "epoch": 2346} {"train_loss": -44.052860260009766, "global_step": 283910, "epoch": 2346} {"train_loss": -43.43941879272461, "global_step": 283911, "epoch": 2346} {"train_loss": -42.87063980102539, "global_step": 283912, "epoch": 2346} {"train_loss": -44.050453186035156, "global_step": 283913, "epoch": 2346} {"train_loss": -43.909339904785156, "global_step": 283914, "epoch": 2346} {"train_loss": -44.05491256713867, "global_step": 283915, "epoch": 2346} {"train_loss": -44.0014762878418, "global_step": 283916, "epoch": 2346} {"train_loss": -44.33380126953125, "global_step": 283917, "epoch": 2346} {"train_loss": -44.140602111816406, "global_step": 283918, "epoch": 2346} {"train_loss": -43.40273666381836, "global_step": 283919, "epoch": 2346} {"train_loss": -43.98970413208008, "global_step": 283920, "epoch": 2346} {"train_loss": -44.13074493408203, "global_step": 283921, "epoch": 2346} {"train_loss": -44.145843505859375, "global_step": 283922, "epoch": 2346} {"train_loss": -44.30936813354492, "global_step": 283923, "epoch": 2346} {"train_loss": -44.41657257080078, "global_step": 283924, "epoch": 2346} {"train_loss": -44.12301254272461, "global_step": 283925, "epoch": 2346} {"train_loss": -44.59064865112305, "global_step": 283926, "epoch": 2346} {"train_loss": -44.2645378112793, "global_step": 283927, "epoch": 2346} {"train_loss": -44.92670822143555, "global_step": 283928, "epoch": 2346} {"train_loss": -44.30374526977539, "global_step": 283929, "epoch": 2346} {"train_loss": -44.19167709350586, "global_step": 283930, "epoch": 2346} {"train_loss": -44.63031768798828, "global_step": 283931, "epoch": 2346} {"train_loss": -44.600337982177734, "global_step": 283932, "epoch": 2346} {"train_loss": -44.913917541503906, "global_step": 283933, "epoch": 2346} {"train_loss": -44.761024475097656, "global_step": 283934, "epoch": 2346} {"train_loss": -44.47721481323242, "global_step": 283935, "epoch": 2346} {"train_loss": -44.4340934753418, "global_step": 283936, "epoch": 2346} {"train_loss": -43.953304290771484, "global_step": 283937, "epoch": 2346} {"train_loss": -44.40775680541992, "global_step": 283938, "epoch": 2346} {"train_loss": -44.346290588378906, "global_step": 283939, "epoch": 2346} {"train_loss": -44.39567184448242, "global_step": 283940, "epoch": 2346} {"train_loss": -43.949214935302734, "global_step": 283941, "epoch": 2346} {"train_loss": -44.125099182128906, "global_step": 283942, "epoch": 2346} {"train_loss": -45.07840347290039, "global_step": 283943, "epoch": 2346} {"train_loss": -44.401580810546875, "global_step": 283944, "epoch": 2346} {"train_loss": -44.71586608886719, "global_step": 283945, "epoch": 2346} {"train_loss": -44.990997314453125, "global_step": 283946, "epoch": 2346} {"train_loss": -44.64091873168945, "global_step": 283947, "epoch": 2346} {"train_loss": -44.7636604309082, "global_step": 283948, "epoch": 2346} {"train_loss": -44.51249694824219, "global_step": 283949, "epoch": 2346} {"train_loss": -44.786964416503906, "global_step": 283950, "epoch": 2346} {"train_loss": -44.16439437866211, "global_step": 283951, "epoch": 2346} {"train_loss": -43.99546813964844, "global_step": 283952, "epoch": 2346} {"train_loss": -44.22174072265625, "global_step": 283953, "epoch": 2346} {"train_loss": -43.2411003112793, "global_step": 283954, "epoch": 2346} {"train_loss": -40.4129753112793, "global_step": 283955, "epoch": 2346} {"train_loss": -39.0317497253418, "global_step": 283956, "epoch": 2346} {"train_loss": -44.13857650756836, "global_step": 283957, "epoch": 2346} {"train_loss": -38.72134780883789, "global_step": 283958, "epoch": 2346} {"train_loss": -38.27431106567383, "global_step": 283959, "epoch": 2346} {"train_loss": -33.488739013671875, "global_step": 283960, "epoch": 2346} {"train_loss": -27.13297462463379, "global_step": 283961, "epoch": 2346} {"train_loss": -34.655696868896484, "global_step": 283962, "epoch": 2346} {"train_loss": -33.0984992980957, "global_step": 283963, "epoch": 2346} {"train_loss": -33.24353790283203, "global_step": 283964, "epoch": 2346} {"train_loss": -32.285762786865234, "global_step": 283965, "epoch": 2346} {"train_loss": -34.2456169128418, "global_step": 283966, "epoch": 2346} {"train_loss": -34.8206787109375, "global_step": 283967, "epoch": 2346} {"train_loss": -34.80462646484375, "global_step": 283968, "epoch": 2346} {"train_loss": -35.06010055541992, "global_step": 283969, "epoch": 2346} {"train_loss": -33.90709686279297, "global_step": 283970, "epoch": 2346} {"train_loss": -35.44956588745117, "global_step": 283971, "epoch": 2346} {"train_loss": -34.88828659057617, "global_step": 283972, "epoch": 2346} {"train_loss": -36.64405822753906, "global_step": 283973, "epoch": 2346} {"train_loss": -36.3817138671875, "global_step": 283974, "epoch": 2346} {"train_loss": -36.11494827270508, "global_step": 283975, "epoch": 2346} {"train_loss": -36.37405014038086, "global_step": 283976, "epoch": 2346} {"train_loss": -36.349510192871094, "global_step": 283977, "epoch": 2346} {"train_loss": -36.106868743896484, "global_step": 283978, "epoch": 2346} {"train_loss": -36.517608642578125, "global_step": 283979, "epoch": 2346} {"train_loss": -37.63624572753906, "global_step": 283980, "epoch": 2346} {"train_loss": -37.06321334838867, "global_step": 283981, "epoch": 2346} {"train_loss": -37.43766403198242, "global_step": 283982, "epoch": 2346} {"train_loss": -37.535804748535156, "global_step": 283983, "epoch": 2346} {"train_loss": -37.56867218017578, "global_step": 283984, "epoch": 2346} {"train_loss": -37.44341278076172, "global_step": 283985, "epoch": 2346} {"train_loss": -41.80563056567484, "global_step": 283986, "epoch": 2346, "val_loss": 2447250.5} {"train_loss": -37.38454818725586, "global_step": 283987, "epoch": 2347} {"train_loss": -37.38350296020508, "global_step": 283988, "epoch": 2347} {"train_loss": -37.511940002441406, "global_step": 283989, "epoch": 2347} {"train_loss": -38.598201751708984, "global_step": 283990, "epoch": 2347} {"train_loss": -37.64288330078125, "global_step": 283991, "epoch": 2347} {"train_loss": -38.194759368896484, "global_step": 283992, "epoch": 2347} {"train_loss": -38.192230224609375, "global_step": 283993, "epoch": 2347} {"train_loss": -38.373043060302734, "global_step": 283994, "epoch": 2347} {"train_loss": -38.730003356933594, "global_step": 283995, "epoch": 2347} {"train_loss": -39.146663665771484, "global_step": 283996, "epoch": 2347} {"train_loss": -38.91421127319336, "global_step": 283997, "epoch": 2347} {"train_loss": -39.09247970581055, "global_step": 283998, "epoch": 2347} {"train_loss": -38.71331024169922, "global_step": 283999, "epoch": 2347} {"train_loss": -38.885738372802734, "global_step": 284000, "epoch": 2347} {"train_loss": -38.03535079956055, "global_step": 284001, "epoch": 2347} {"train_loss": -38.44763946533203, "global_step": 284002, "epoch": 2347} {"train_loss": -38.50144577026367, "global_step": 284003, "epoch": 2347} {"train_loss": -40.14610290527344, "global_step": 284004, "epoch": 2347} {"train_loss": -39.795082092285156, "global_step": 284005, "epoch": 2347} {"train_loss": -40.14241027832031, "global_step": 284006, "epoch": 2347} {"train_loss": -39.166160583496094, "global_step": 284007, "epoch": 2347} {"train_loss": -39.8846435546875, "global_step": 284008, "epoch": 2347} {"train_loss": -39.24779510498047, "global_step": 284009, "epoch": 2347} {"train_loss": -39.78007125854492, "global_step": 284010, "epoch": 2347} {"train_loss": -40.135047912597656, "global_step": 284011, "epoch": 2347} {"train_loss": -40.209320068359375, "global_step": 284012, "epoch": 2347} {"train_loss": -40.4759635925293, "global_step": 284013, "epoch": 2347} {"train_loss": -39.894752502441406, "global_step": 284014, "epoch": 2347} {"train_loss": -39.986873626708984, "global_step": 284015, "epoch": 2347} {"train_loss": -40.436607360839844, "global_step": 284016, "epoch": 2347} {"train_loss": -39.56256866455078, "global_step": 284017, "epoch": 2347} {"train_loss": -40.222469329833984, "global_step": 284018, "epoch": 2347} {"train_loss": -39.96696090698242, "global_step": 284019, "epoch": 2347} {"train_loss": -39.84339904785156, "global_step": 284020, "epoch": 2347} {"train_loss": -40.311927795410156, "global_step": 284021, "epoch": 2347} {"train_loss": -39.90299606323242, "global_step": 284022, "epoch": 2347} {"train_loss": -38.32914352416992, "global_step": 284023, "epoch": 2347} {"train_loss": -37.80210876464844, "global_step": 284024, "epoch": 2347} {"train_loss": -39.80587387084961, "global_step": 284025, "epoch": 2347} {"train_loss": -39.70254135131836, "global_step": 284026, "epoch": 2347} {"train_loss": -38.994781494140625, "global_step": 284027, "epoch": 2347} {"train_loss": -39.15869903564453, "global_step": 284028, "epoch": 2347} {"train_loss": -39.71501922607422, "global_step": 284029, "epoch": 2347} {"train_loss": -39.6710319519043, "global_step": 284030, "epoch": 2347} {"train_loss": -38.42202377319336, "global_step": 284031, "epoch": 2347} {"train_loss": -40.7032585144043, "global_step": 284032, "epoch": 2347} {"train_loss": -40.2294807434082, "global_step": 284033, "epoch": 2347} {"train_loss": -39.182857513427734, "global_step": 284034, "epoch": 2347} {"train_loss": -39.1810302734375, "global_step": 284035, "epoch": 2347} {"train_loss": -39.25278091430664, "global_step": 284036, "epoch": 2347} {"train_loss": -40.8151741027832, "global_step": 284037, "epoch": 2347} {"train_loss": -39.662330627441406, "global_step": 284038, "epoch": 2347} {"train_loss": -40.235626220703125, "global_step": 284039, "epoch": 2347} {"train_loss": -40.07986068725586, "global_step": 284040, "epoch": 2347} {"train_loss": -40.485107421875, "global_step": 284041, "epoch": 2347} {"train_loss": -39.000789642333984, "global_step": 284042, "epoch": 2347} {"train_loss": -40.48954391479492, "global_step": 284043, "epoch": 2347} {"train_loss": -40.03943634033203, "global_step": 284044, "epoch": 2347} {"train_loss": -39.81858444213867, "global_step": 284045, "epoch": 2347} {"train_loss": -37.39897918701172, "global_step": 284046, "epoch": 2347} {"train_loss": -39.63525390625, "global_step": 284047, "epoch": 2347} {"train_loss": -38.781429290771484, "global_step": 284048, "epoch": 2347} {"train_loss": -38.73719024658203, "global_step": 284049, "epoch": 2347} {"train_loss": -38.066261291503906, "global_step": 284050, "epoch": 2347} {"train_loss": -36.64500045776367, "global_step": 284051, "epoch": 2347} {"train_loss": -39.559139251708984, "global_step": 284052, "epoch": 2347} {"train_loss": -35.8731803894043, "global_step": 284053, "epoch": 2347} {"train_loss": -37.87845993041992, "global_step": 284054, "epoch": 2347} {"train_loss": -36.333805084228516, "global_step": 284055, "epoch": 2347} {"train_loss": -36.35004806518555, "global_step": 284056, "epoch": 2347} {"train_loss": -37.09092330932617, "global_step": 284057, "epoch": 2347} {"train_loss": -37.06342697143555, "global_step": 284058, "epoch": 2347} {"train_loss": -37.68975830078125, "global_step": 284059, "epoch": 2347} {"train_loss": -35.36573791503906, "global_step": 284060, "epoch": 2347} {"train_loss": -37.249488830566406, "global_step": 284061, "epoch": 2347} {"train_loss": -38.060630798339844, "global_step": 284062, "epoch": 2347} {"train_loss": -37.25291061401367, "global_step": 284063, "epoch": 2347} {"train_loss": -38.346046447753906, "global_step": 284064, "epoch": 2347} {"train_loss": -36.93804931640625, "global_step": 284065, "epoch": 2347} {"train_loss": -37.6600341796875, "global_step": 284066, "epoch": 2347} {"train_loss": -39.09324264526367, "global_step": 284067, "epoch": 2347} {"train_loss": -36.11152648925781, "global_step": 284068, "epoch": 2347} {"train_loss": -31.142065048217773, "global_step": 284069, "epoch": 2347} {"train_loss": -35.409996032714844, "global_step": 284070, "epoch": 2347} {"train_loss": -37.034950256347656, "global_step": 284071, "epoch": 2347} {"train_loss": -37.595458984375, "global_step": 284072, "epoch": 2347} {"train_loss": -36.83108139038086, "global_step": 284073, "epoch": 2347} {"train_loss": -34.45161819458008, "global_step": 284074, "epoch": 2347} {"train_loss": -17.30713653564453, "global_step": 284075, "epoch": 2347} {"train_loss": -37.91914749145508, "global_step": 284076, "epoch": 2347} {"train_loss": -35.45716094970703, "global_step": 284077, "epoch": 2347} {"train_loss": -17.0926513671875, "global_step": 284078, "epoch": 2347} {"train_loss": -12.83642578125, "global_step": 284079, "epoch": 2347} {"train_loss": -34.49915313720703, "global_step": 284080, "epoch": 2347} {"train_loss": -33.98183822631836, "global_step": 284081, "epoch": 2347} {"train_loss": -18.629531860351562, "global_step": 284082, "epoch": 2347} {"train_loss": -24.85218620300293, "global_step": 284083, "epoch": 2347} {"train_loss": -8.62674617767334, "global_step": 284084, "epoch": 2347} {"train_loss": -34.58059310913086, "global_step": 284085, "epoch": 2347} {"train_loss": -34.09648895263672, "global_step": 284086, "epoch": 2347} {"train_loss": -29.677900314331055, "global_step": 284087, "epoch": 2347} {"train_loss": -32.47771453857422, "global_step": 284088, "epoch": 2347} {"train_loss": -27.094755172729492, "global_step": 284089, "epoch": 2347} {"train_loss": -34.72385025024414, "global_step": 284090, "epoch": 2347} {"train_loss": -29.972126007080078, "global_step": 284091, "epoch": 2347} {"train_loss": -32.190834045410156, "global_step": 284092, "epoch": 2347} {"train_loss": -34.89600372314453, "global_step": 284093, "epoch": 2347} {"train_loss": -32.326927185058594, "global_step": 284094, "epoch": 2347} {"train_loss": -35.56824493408203, "global_step": 284095, "epoch": 2347} {"train_loss": -33.106903076171875, "global_step": 284096, "epoch": 2347} {"train_loss": -35.689876556396484, "global_step": 284097, "epoch": 2347} {"train_loss": -34.41229248046875, "global_step": 284098, "epoch": 2347} {"train_loss": -32.36111831665039, "global_step": 284099, "epoch": 2347} {"train_loss": -34.451393127441406, "global_step": 284100, "epoch": 2347} {"train_loss": -34.90469741821289, "global_step": 284101, "epoch": 2347} {"train_loss": -35.60897445678711, "global_step": 284102, "epoch": 2347} {"train_loss": -35.097267150878906, "global_step": 284103, "epoch": 2347} {"train_loss": -33.948917388916016, "global_step": 284104, "epoch": 2347} {"train_loss": -35.8348503112793, "global_step": 284105, "epoch": 2347} {"train_loss": -35.29146957397461, "global_step": 284106, "epoch": 2347} {"train_loss": -36.46502413631471, "global_step": 284107, "epoch": 2347, "val_loss": 2601288.75} {"train_loss": -34.737892150878906, "global_step": 284108, "epoch": 2348} {"train_loss": -36.83401870727539, "global_step": 284109, "epoch": 2348} {"train_loss": -35.75193405151367, "global_step": 284110, "epoch": 2348} {"train_loss": -36.51197052001953, "global_step": 284111, "epoch": 2348} {"train_loss": -37.4967155456543, "global_step": 284112, "epoch": 2348} {"train_loss": -34.989837646484375, "global_step": 284113, "epoch": 2348} {"train_loss": -36.507781982421875, "global_step": 284114, "epoch": 2348} {"train_loss": -36.95128631591797, "global_step": 284115, "epoch": 2348} {"train_loss": -37.38648986816406, "global_step": 284116, "epoch": 2348} {"train_loss": -36.71961212158203, "global_step": 284117, "epoch": 2348} {"train_loss": -37.624366760253906, "global_step": 284118, "epoch": 2348} {"train_loss": -36.81696319580078, "global_step": 284119, "epoch": 2348} {"train_loss": -37.545257568359375, "global_step": 284120, "epoch": 2348} {"train_loss": -38.168617248535156, "global_step": 284121, "epoch": 2348} {"train_loss": -37.46749496459961, "global_step": 284122, "epoch": 2348} {"train_loss": -37.742855072021484, "global_step": 284123, "epoch": 2348} {"train_loss": -37.42170715332031, "global_step": 284124, "epoch": 2348} {"train_loss": -36.47344207763672, "global_step": 284125, "epoch": 2348} {"train_loss": -37.93559646606445, "global_step": 284126, "epoch": 2348} {"train_loss": -37.151123046875, "global_step": 284127, "epoch": 2348} {"train_loss": -37.17924499511719, "global_step": 284128, "epoch": 2348} {"train_loss": -37.32502365112305, "global_step": 284129, "epoch": 2348} {"train_loss": -38.10614013671875, "global_step": 284130, "epoch": 2348} {"train_loss": -38.05399703979492, "global_step": 284131, "epoch": 2348} {"train_loss": -37.24498748779297, "global_step": 284132, "epoch": 2348} {"train_loss": -37.8314323425293, "global_step": 284133, "epoch": 2348} {"train_loss": -37.93661117553711, "global_step": 284134, "epoch": 2348} {"train_loss": -37.75788497924805, "global_step": 284135, "epoch": 2348} {"train_loss": -38.39790725708008, "global_step": 284136, "epoch": 2348} {"train_loss": -38.11734390258789, "global_step": 284137, "epoch": 2348} {"train_loss": -37.424232482910156, "global_step": 284138, "epoch": 2348} {"train_loss": -38.13405227661133, "global_step": 284139, "epoch": 2348} {"train_loss": -37.32517623901367, "global_step": 284140, "epoch": 2348} {"train_loss": -37.77566146850586, "global_step": 284141, "epoch": 2348} {"train_loss": -37.7865104675293, "global_step": 284142, "epoch": 2348} {"train_loss": -38.5662956237793, "global_step": 284143, "epoch": 2348} {"train_loss": -37.83600997924805, "global_step": 284144, "epoch": 2348} {"train_loss": -38.09739303588867, "global_step": 284145, "epoch": 2348} {"train_loss": -38.39262008666992, "global_step": 284146, "epoch": 2348} {"train_loss": -37.2072868347168, "global_step": 284147, "epoch": 2348} {"train_loss": -38.450260162353516, "global_step": 284148, "epoch": 2348} {"train_loss": -38.0948600769043, "global_step": 284149, "epoch": 2348} {"train_loss": -38.942047119140625, "global_step": 284150, "epoch": 2348} {"train_loss": -38.92751693725586, "global_step": 284151, "epoch": 2348} {"train_loss": -38.73360824584961, "global_step": 284152, "epoch": 2348} {"train_loss": -38.57566452026367, "global_step": 284153, "epoch": 2348} {"train_loss": -38.76642990112305, "global_step": 284154, "epoch": 2348} {"train_loss": -38.9606819152832, "global_step": 284155, "epoch": 2348} {"train_loss": -38.64613723754883, "global_step": 284156, "epoch": 2348} {"train_loss": -39.71747589111328, "global_step": 284157, "epoch": 2348} {"train_loss": -38.60593032836914, "global_step": 284158, "epoch": 2348} {"train_loss": -38.450496673583984, "global_step": 284159, "epoch": 2348} {"train_loss": -38.9179801940918, "global_step": 284160, "epoch": 2348} {"train_loss": -39.74419021606445, "global_step": 284161, "epoch": 2348} {"train_loss": -40.17783737182617, "global_step": 284162, "epoch": 2348} {"train_loss": -39.82135772705078, "global_step": 284163, "epoch": 2348} {"train_loss": -38.26675033569336, "global_step": 284164, "epoch": 2348} {"train_loss": -38.399898529052734, "global_step": 284165, "epoch": 2348} {"train_loss": -39.721858978271484, "global_step": 284166, "epoch": 2348} {"train_loss": -39.4404411315918, "global_step": 284167, "epoch": 2348} {"train_loss": -40.5722770690918, "global_step": 284168, "epoch": 2348} {"train_loss": -39.68297576904297, "global_step": 284169, "epoch": 2348} {"train_loss": -39.5911979675293, "global_step": 284170, "epoch": 2348} {"train_loss": -40.139095306396484, "global_step": 284171, "epoch": 2348} {"train_loss": -40.2325439453125, "global_step": 284172, "epoch": 2348} {"train_loss": -39.948448181152344, "global_step": 284173, "epoch": 2348} {"train_loss": -40.30764389038086, "global_step": 284174, "epoch": 2348} {"train_loss": -40.36408233642578, "global_step": 284175, "epoch": 2348} {"train_loss": -40.94290542602539, "global_step": 284176, "epoch": 2348} {"train_loss": -40.50938034057617, "global_step": 284177, "epoch": 2348} {"train_loss": -40.177520751953125, "global_step": 284178, "epoch": 2348} {"train_loss": -41.44697189331055, "global_step": 284179, "epoch": 2348} {"train_loss": -41.56070327758789, "global_step": 284180, "epoch": 2348} {"train_loss": -40.59174346923828, "global_step": 284181, "epoch": 2348} {"train_loss": -40.44927978515625, "global_step": 284182, "epoch": 2348} {"train_loss": -41.45916748046875, "global_step": 284183, "epoch": 2348} {"train_loss": -41.41020202636719, "global_step": 284184, "epoch": 2348} {"train_loss": -41.6932373046875, "global_step": 284185, "epoch": 2348} {"train_loss": -41.76760482788086, "global_step": 284186, "epoch": 2348} {"train_loss": -41.5467643737793, "global_step": 284187, "epoch": 2348} {"train_loss": -41.08004379272461, "global_step": 284188, "epoch": 2348} {"train_loss": -41.605892181396484, "global_step": 284189, "epoch": 2348} {"train_loss": -41.439239501953125, "global_step": 284190, "epoch": 2348} {"train_loss": -41.003902435302734, "global_step": 284191, "epoch": 2348} {"train_loss": -41.78147506713867, "global_step": 284192, "epoch": 2348} {"train_loss": -42.409576416015625, "global_step": 284193, "epoch": 2348} {"train_loss": -41.9598503112793, "global_step": 284194, "epoch": 2348} {"train_loss": -41.51642608642578, "global_step": 284195, "epoch": 2348} {"train_loss": -42.38167953491211, "global_step": 284196, "epoch": 2348} {"train_loss": -41.00790023803711, "global_step": 284197, "epoch": 2348} {"train_loss": -42.72868728637695, "global_step": 284198, "epoch": 2348} {"train_loss": -41.97509765625, "global_step": 284199, "epoch": 2348} {"train_loss": -40.88076400756836, "global_step": 284200, "epoch": 2348} {"train_loss": -41.00899887084961, "global_step": 284201, "epoch": 2348} {"train_loss": -40.42151641845703, "global_step": 284202, "epoch": 2348} {"train_loss": -41.18585968017578, "global_step": 284203, "epoch": 2348} {"train_loss": -42.04814910888672, "global_step": 284204, "epoch": 2348} {"train_loss": -40.58039093017578, "global_step": 284205, "epoch": 2348} {"train_loss": -41.976993560791016, "global_step": 284206, "epoch": 2348} {"train_loss": -39.589168548583984, "global_step": 284207, "epoch": 2348} {"train_loss": -41.31452560424805, "global_step": 284208, "epoch": 2348} {"train_loss": -41.05255126953125, "global_step": 284209, "epoch": 2348} {"train_loss": -40.25411605834961, "global_step": 284210, "epoch": 2348} {"train_loss": -40.551673889160156, "global_step": 284211, "epoch": 2348} {"train_loss": -40.709808349609375, "global_step": 284212, "epoch": 2348} {"train_loss": -40.191131591796875, "global_step": 284213, "epoch": 2348} {"train_loss": -40.880672454833984, "global_step": 284214, "epoch": 2348} {"train_loss": -41.41401290893555, "global_step": 284215, "epoch": 2348} {"train_loss": -39.8787841796875, "global_step": 284216, "epoch": 2348} {"train_loss": -40.560951232910156, "global_step": 284217, "epoch": 2348} {"train_loss": -41.821533203125, "global_step": 284218, "epoch": 2348} {"train_loss": -40.999324798583984, "global_step": 284219, "epoch": 2348} {"train_loss": -41.4156608581543, "global_step": 284220, "epoch": 2348} {"train_loss": -41.71674346923828, "global_step": 284221, "epoch": 2348} {"train_loss": -41.287261962890625, "global_step": 284222, "epoch": 2348} {"train_loss": -40.99973678588867, "global_step": 284223, "epoch": 2348} {"train_loss": -41.51185607910156, "global_step": 284224, "epoch": 2348} {"train_loss": -41.96199417114258, "global_step": 284225, "epoch": 2348} {"train_loss": -41.77505874633789, "global_step": 284226, "epoch": 2348} {"train_loss": -42.53327560424805, "global_step": 284227, "epoch": 2348} {"train_loss": -39.5150134504334, "global_step": 284228, "epoch": 2348, "val_loss": 2591890.0} {"train_loss": -42.798030853271484, "global_step": 284229, "epoch": 2349} {"train_loss": -41.5786018371582, "global_step": 284230, "epoch": 2349} {"train_loss": -42.475440979003906, "global_step": 284231, "epoch": 2349} {"train_loss": -41.407833099365234, "global_step": 284232, "epoch": 2349} {"train_loss": -42.8237419128418, "global_step": 284233, "epoch": 2349} {"train_loss": -41.447418212890625, "global_step": 284234, "epoch": 2349} {"train_loss": -42.525569915771484, "global_step": 284235, "epoch": 2349} {"train_loss": -41.8067512512207, "global_step": 284236, "epoch": 2349} {"train_loss": -41.645484924316406, "global_step": 284237, "epoch": 2349} {"train_loss": -42.32154083251953, "global_step": 284238, "epoch": 2349} {"train_loss": -41.171546936035156, "global_step": 284239, "epoch": 2349} {"train_loss": -42.48771286010742, "global_step": 284240, "epoch": 2349} {"train_loss": -41.833251953125, "global_step": 284241, "epoch": 2349} {"train_loss": -42.823368072509766, "global_step": 284242, "epoch": 2349} {"train_loss": -42.48434066772461, "global_step": 284243, "epoch": 2349} {"train_loss": -42.4330940246582, "global_step": 284244, "epoch": 2349} {"train_loss": -42.72098922729492, "global_step": 284245, "epoch": 2349} {"train_loss": -42.82386016845703, "global_step": 284246, "epoch": 2349} {"train_loss": -42.28496170043945, "global_step": 284247, "epoch": 2349} {"train_loss": -42.11803436279297, "global_step": 284248, "epoch": 2349} {"train_loss": -42.555912017822266, "global_step": 284249, "epoch": 2349} {"train_loss": -41.73587417602539, "global_step": 284250, "epoch": 2349} {"train_loss": -42.68832015991211, "global_step": 284251, "epoch": 2349} {"train_loss": -41.9400634765625, "global_step": 284252, "epoch": 2349} {"train_loss": -42.943145751953125, "global_step": 284253, "epoch": 2349} {"train_loss": -41.123931884765625, "global_step": 284254, "epoch": 2349} {"train_loss": -42.24625778198242, "global_step": 284255, "epoch": 2349} {"train_loss": -41.34548568725586, "global_step": 284256, "epoch": 2349} {"train_loss": -41.92695999145508, "global_step": 284257, "epoch": 2349} {"train_loss": -42.09770202636719, "global_step": 284258, "epoch": 2349} {"train_loss": -42.49755859375, "global_step": 284259, "epoch": 2349} {"train_loss": -42.14480209350586, "global_step": 284260, "epoch": 2349} {"train_loss": -42.63431930541992, "global_step": 284261, "epoch": 2349} {"train_loss": -42.030517578125, "global_step": 284262, "epoch": 2349} {"train_loss": -42.61159896850586, "global_step": 284263, "epoch": 2349} {"train_loss": -41.2248420715332, "global_step": 284264, "epoch": 2349} {"train_loss": -41.530025482177734, "global_step": 284265, "epoch": 2349} {"train_loss": -42.11919021606445, "global_step": 284266, "epoch": 2349} {"train_loss": -41.444061279296875, "global_step": 284267, "epoch": 2349} {"train_loss": -42.33772659301758, "global_step": 284268, "epoch": 2349} {"train_loss": -41.739383697509766, "global_step": 284269, "epoch": 2349} {"train_loss": -42.42232894897461, "global_step": 284270, "epoch": 2349} {"train_loss": -41.68922805786133, "global_step": 284271, "epoch": 2349} {"train_loss": -42.418006896972656, "global_step": 284272, "epoch": 2349} {"train_loss": -42.11611557006836, "global_step": 284273, "epoch": 2349} {"train_loss": -42.353912353515625, "global_step": 284274, "epoch": 2349} {"train_loss": -41.89868927001953, "global_step": 284275, "epoch": 2349} {"train_loss": -42.04612350463867, "global_step": 284276, "epoch": 2349} {"train_loss": -42.74912643432617, "global_step": 284277, "epoch": 2349} {"train_loss": -42.880645751953125, "global_step": 284278, "epoch": 2349} {"train_loss": -42.32880401611328, "global_step": 284279, "epoch": 2349} {"train_loss": -42.735321044921875, "global_step": 284280, "epoch": 2349} {"train_loss": -41.7951545715332, "global_step": 284281, "epoch": 2349} {"train_loss": -42.33683776855469, "global_step": 284282, "epoch": 2349} {"train_loss": -42.36589431762695, "global_step": 284283, "epoch": 2349} {"train_loss": -41.58823013305664, "global_step": 284284, "epoch": 2349} {"train_loss": -42.25163650512695, "global_step": 284285, "epoch": 2349} {"train_loss": -42.461692810058594, "global_step": 284286, "epoch": 2349} {"train_loss": -41.649688720703125, "global_step": 284287, "epoch": 2349} {"train_loss": -42.785743713378906, "global_step": 284288, "epoch": 2349} {"train_loss": -41.26446533203125, "global_step": 284289, "epoch": 2349} {"train_loss": -42.311767578125, "global_step": 284290, "epoch": 2349} {"train_loss": -40.48075485229492, "global_step": 284291, "epoch": 2349} {"train_loss": -42.805084228515625, "global_step": 284292, "epoch": 2349} {"train_loss": -39.44198989868164, "global_step": 284293, "epoch": 2349} {"train_loss": -41.69537353515625, "global_step": 284294, "epoch": 2349} {"train_loss": -40.7401237487793, "global_step": 284295, "epoch": 2349} {"train_loss": -42.1328010559082, "global_step": 284296, "epoch": 2349} {"train_loss": -41.2465705871582, "global_step": 284297, "epoch": 2349} {"train_loss": -39.5356559753418, "global_step": 284298, "epoch": 2349} {"train_loss": -40.56620407104492, "global_step": 284299, "epoch": 2349} {"train_loss": -39.87272262573242, "global_step": 284300, "epoch": 2349} {"train_loss": -41.29774856567383, "global_step": 284301, "epoch": 2349} {"train_loss": -40.08982467651367, "global_step": 284302, "epoch": 2349} {"train_loss": -40.053043365478516, "global_step": 284303, "epoch": 2349} {"train_loss": -40.196502685546875, "global_step": 284304, "epoch": 2349} {"train_loss": -41.39496994018555, "global_step": 284305, "epoch": 2349} {"train_loss": -39.423622131347656, "global_step": 284306, "epoch": 2349} {"train_loss": -41.61066818237305, "global_step": 284307, "epoch": 2349} {"train_loss": -39.56899642944336, "global_step": 284308, "epoch": 2349} {"train_loss": -41.8971061706543, "global_step": 284309, "epoch": 2349} {"train_loss": -39.3223991394043, "global_step": 284310, "epoch": 2349} {"train_loss": -39.616451263427734, "global_step": 284311, "epoch": 2349} {"train_loss": -39.39651107788086, "global_step": 284312, "epoch": 2349} {"train_loss": -39.82943344116211, "global_step": 284313, "epoch": 2349} {"train_loss": -40.56441879272461, "global_step": 284314, "epoch": 2349} {"train_loss": -41.42043685913086, "global_step": 284315, "epoch": 2349} {"train_loss": -39.0494270324707, "global_step": 284316, "epoch": 2349} {"train_loss": -36.66781234741211, "global_step": 284317, "epoch": 2349} {"train_loss": -38.2445182800293, "global_step": 284318, "epoch": 2349} {"train_loss": -39.81895065307617, "global_step": 284319, "epoch": 2349} {"train_loss": -40.09368896484375, "global_step": 284320, "epoch": 2349} {"train_loss": -39.04895782470703, "global_step": 284321, "epoch": 2349} {"train_loss": -33.793983459472656, "global_step": 284322, "epoch": 2349} {"train_loss": -37.25041198730469, "global_step": 284323, "epoch": 2349} {"train_loss": -40.76547622680664, "global_step": 284324, "epoch": 2349} {"train_loss": -37.85359573364258, "global_step": 284325, "epoch": 2349} {"train_loss": -39.10020065307617, "global_step": 284326, "epoch": 2349} {"train_loss": -38.82890319824219, "global_step": 284327, "epoch": 2349} {"train_loss": -38.40559005737305, "global_step": 284328, "epoch": 2349} {"train_loss": -39.1602897644043, "global_step": 284329, "epoch": 2349} {"train_loss": -39.865074157714844, "global_step": 284330, "epoch": 2349} {"train_loss": -38.21090316772461, "global_step": 284331, "epoch": 2349} {"train_loss": -41.35774230957031, "global_step": 284332, "epoch": 2349} {"train_loss": -38.558372497558594, "global_step": 284333, "epoch": 2349} {"train_loss": -40.77606964111328, "global_step": 284334, "epoch": 2349} {"train_loss": -39.916255950927734, "global_step": 284335, "epoch": 2349} {"train_loss": -41.295570373535156, "global_step": 284336, "epoch": 2349} {"train_loss": -41.50250244140625, "global_step": 284337, "epoch": 2349} {"train_loss": -41.643707275390625, "global_step": 284338, "epoch": 2349} {"train_loss": -41.524227142333984, "global_step": 284339, "epoch": 2349} {"train_loss": -41.64617156982422, "global_step": 284340, "epoch": 2349} {"train_loss": -41.3670539855957, "global_step": 284341, "epoch": 2349} {"train_loss": -42.38685607910156, "global_step": 284342, "epoch": 2349} {"train_loss": -42.32746505737305, "global_step": 284343, "epoch": 2349} {"train_loss": -41.84458541870117, "global_step": 284344, "epoch": 2349} {"train_loss": -42.57423782348633, "global_step": 284345, "epoch": 2349} {"train_loss": -41.8031120300293, "global_step": 284346, "epoch": 2349} {"train_loss": -42.31728744506836, "global_step": 284347, "epoch": 2349} {"train_loss": -42.14304733276367, "global_step": 284348, "epoch": 2349} {"train_loss": -41.244558192481676, "global_step": 284349, "epoch": 2349, "val_loss": 2503423.0} {"train_loss": -42.23103713989258, "global_step": 284350, "epoch": 2350} {"train_loss": -42.48286819458008, "global_step": 284351, "epoch": 2350} {"train_loss": -42.7089958190918, "global_step": 284352, "epoch": 2350} {"train_loss": -41.970001220703125, "global_step": 284353, "epoch": 2350} {"train_loss": -42.395408630371094, "global_step": 284354, "epoch": 2350} {"train_loss": -41.83279037475586, "global_step": 284355, "epoch": 2350} {"train_loss": -42.47239303588867, "global_step": 284356, "epoch": 2350} {"train_loss": -42.29755783081055, "global_step": 284357, "epoch": 2350} {"train_loss": -42.89180374145508, "global_step": 284358, "epoch": 2350} {"train_loss": -42.72684860229492, "global_step": 284359, "epoch": 2350} {"train_loss": -42.28825378417969, "global_step": 284360, "epoch": 2350} {"train_loss": -41.87602233886719, "global_step": 284361, "epoch": 2350} {"train_loss": -43.207542419433594, "global_step": 284362, "epoch": 2350} {"train_loss": -42.47795486450195, "global_step": 284363, "epoch": 2350} {"train_loss": -42.99996566772461, "global_step": 284364, "epoch": 2350} {"train_loss": -42.9460334777832, "global_step": 284365, "epoch": 2350} {"train_loss": -43.017032623291016, "global_step": 284366, "epoch": 2350} {"train_loss": -43.06663513183594, "global_step": 284367, "epoch": 2350} {"train_loss": -43.28547286987305, "global_step": 284368, "epoch": 2350} {"train_loss": -43.00227737426758, "global_step": 284369, "epoch": 2350} {"train_loss": -43.36030197143555, "global_step": 284370, "epoch": 2350} {"train_loss": -43.50307846069336, "global_step": 284371, "epoch": 2350} {"train_loss": -43.16152572631836, "global_step": 284372, "epoch": 2350} {"train_loss": -42.88825225830078, "global_step": 284373, "epoch": 2350} {"train_loss": -43.80181884765625, "global_step": 284374, "epoch": 2350} {"train_loss": -42.98101043701172, "global_step": 284375, "epoch": 2350} {"train_loss": -43.0987434387207, "global_step": 284376, "epoch": 2350} {"train_loss": -43.47682571411133, "global_step": 284377, "epoch": 2350} {"train_loss": -43.297908782958984, "global_step": 284378, "epoch": 2350} {"train_loss": -43.1402587890625, "global_step": 284379, "epoch": 2350} {"train_loss": -43.43061447143555, "global_step": 284380, "epoch": 2350} {"train_loss": -41.95680236816406, "global_step": 284381, "epoch": 2350} {"train_loss": -42.97606658935547, "global_step": 284382, "epoch": 2350} {"train_loss": -42.85671615600586, "global_step": 284383, "epoch": 2350} {"train_loss": -42.95905303955078, "global_step": 284384, "epoch": 2350} {"train_loss": -42.7947998046875, "global_step": 284385, "epoch": 2350} {"train_loss": -42.866188049316406, "global_step": 284386, "epoch": 2350} {"train_loss": -41.04230880737305, "global_step": 284387, "epoch": 2350} {"train_loss": -42.9190673828125, "global_step": 284388, "epoch": 2350} {"train_loss": -43.0467643737793, "global_step": 284389, "epoch": 2350} {"train_loss": -42.67363357543945, "global_step": 284390, "epoch": 2350} {"train_loss": -42.386959075927734, "global_step": 284391, "epoch": 2350} {"train_loss": -42.96636199951172, "global_step": 284392, "epoch": 2350} {"train_loss": -42.173072814941406, "global_step": 284393, "epoch": 2350} {"train_loss": -43.66802215576172, "global_step": 284394, "epoch": 2350} {"train_loss": -41.7609748840332, "global_step": 284395, "epoch": 2350} {"train_loss": -42.61275100708008, "global_step": 284396, "epoch": 2350} {"train_loss": -43.205745697021484, "global_step": 284397, "epoch": 2350} {"train_loss": -42.805782318115234, "global_step": 284398, "epoch": 2350} {"train_loss": -43.304805755615234, "global_step": 284399, "epoch": 2350} {"train_loss": -42.962520599365234, "global_step": 284400, "epoch": 2350} {"train_loss": -42.77880859375, "global_step": 284401, "epoch": 2350} {"train_loss": -42.98594284057617, "global_step": 284402, "epoch": 2350} {"train_loss": -43.632198333740234, "global_step": 284403, "epoch": 2350} {"train_loss": -42.9829216003418, "global_step": 284404, "epoch": 2350} {"train_loss": -42.52936935424805, "global_step": 284405, "epoch": 2350} {"train_loss": -43.35606002807617, "global_step": 284406, "epoch": 2350} {"train_loss": -43.17304611206055, "global_step": 284407, "epoch": 2350} {"train_loss": -41.55510711669922, "global_step": 284408, "epoch": 2350} {"train_loss": -44.0859375, "global_step": 284409, "epoch": 2350} {"train_loss": -42.90098571777344, "global_step": 284410, "epoch": 2350} {"train_loss": -43.142696380615234, "global_step": 284411, "epoch": 2350} {"train_loss": -43.571990966796875, "global_step": 284412, "epoch": 2350} {"train_loss": -43.26926803588867, "global_step": 284413, "epoch": 2350} {"train_loss": -42.9682731628418, "global_step": 284414, "epoch": 2350} {"train_loss": -43.495357513427734, "global_step": 284415, "epoch": 2350} {"train_loss": -43.08671951293945, "global_step": 284416, "epoch": 2350} {"train_loss": -42.81616973876953, "global_step": 284417, "epoch": 2350} {"train_loss": -44.428707122802734, "global_step": 284418, "epoch": 2350} {"train_loss": -41.9054069519043, "global_step": 284419, "epoch": 2350} {"train_loss": -42.49186706542969, "global_step": 284420, "epoch": 2350} {"train_loss": -43.24725341796875, "global_step": 284421, "epoch": 2350} {"train_loss": -43.39292526245117, "global_step": 284422, "epoch": 2350} {"train_loss": -42.58247756958008, "global_step": 284423, "epoch": 2350} {"train_loss": -43.22964859008789, "global_step": 284424, "epoch": 2350} {"train_loss": -42.550167083740234, "global_step": 284425, "epoch": 2350} {"train_loss": -42.50582504272461, "global_step": 284426, "epoch": 2350} {"train_loss": -43.06943893432617, "global_step": 284427, "epoch": 2350} {"train_loss": -42.62593460083008, "global_step": 284428, "epoch": 2350} {"train_loss": -42.91898727416992, "global_step": 284429, "epoch": 2350} {"train_loss": -42.9482536315918, "global_step": 284430, "epoch": 2350} {"train_loss": -42.80611038208008, "global_step": 284431, "epoch": 2350} {"train_loss": -43.26797103881836, "global_step": 284432, "epoch": 2350} {"train_loss": -42.84218978881836, "global_step": 284433, "epoch": 2350} {"train_loss": -42.17747116088867, "global_step": 284434, "epoch": 2350} {"train_loss": -43.3939208984375, "global_step": 284435, "epoch": 2350} {"train_loss": -43.22114181518555, "global_step": 284436, "epoch": 2350} {"train_loss": -43.90412139892578, "global_step": 284437, "epoch": 2350} {"train_loss": -43.44145202636719, "global_step": 284438, "epoch": 2350} {"train_loss": -42.19355010986328, "global_step": 284439, "epoch": 2350} {"train_loss": -43.4517822265625, "global_step": 284440, "epoch": 2350} {"train_loss": -42.98910140991211, "global_step": 284441, "epoch": 2350} {"train_loss": -42.72186279296875, "global_step": 284442, "epoch": 2350} {"train_loss": -41.664066314697266, "global_step": 284443, "epoch": 2350} {"train_loss": -42.86725997924805, "global_step": 284444, "epoch": 2350} {"train_loss": -42.187686920166016, "global_step": 284445, "epoch": 2350} {"train_loss": -41.74223709106445, "global_step": 284446, "epoch": 2350} {"train_loss": -43.56882858276367, "global_step": 284447, "epoch": 2350} {"train_loss": -40.208770751953125, "global_step": 284448, "epoch": 2350} {"train_loss": -40.316890716552734, "global_step": 284449, "epoch": 2350} {"train_loss": -41.40867614746094, "global_step": 284450, "epoch": 2350} {"train_loss": -41.79780578613281, "global_step": 284451, "epoch": 2350} {"train_loss": -41.94589614868164, "global_step": 284452, "epoch": 2350} {"train_loss": -42.52283477783203, "global_step": 284453, "epoch": 2350} {"train_loss": -42.00233840942383, "global_step": 284454, "epoch": 2350} {"train_loss": -42.528987884521484, "global_step": 284455, "epoch": 2350} {"train_loss": -41.3194465637207, "global_step": 284456, "epoch": 2350} {"train_loss": -43.05095291137695, "global_step": 284457, "epoch": 2350} {"train_loss": -42.21595001220703, "global_step": 284458, "epoch": 2350} {"train_loss": -40.299617767333984, "global_step": 284459, "epoch": 2350} {"train_loss": -42.594478607177734, "global_step": 284460, "epoch": 2350} {"train_loss": -41.31260299682617, "global_step": 284461, "epoch": 2350} {"train_loss": -41.288509368896484, "global_step": 284462, "epoch": 2350} {"train_loss": -42.1329231262207, "global_step": 284463, "epoch": 2350} {"train_loss": -39.89619827270508, "global_step": 284464, "epoch": 2350} {"train_loss": -40.90748977661133, "global_step": 284465, "epoch": 2350} {"train_loss": -42.913665771484375, "global_step": 284466, "epoch": 2350} {"train_loss": -41.55277633666992, "global_step": 284467, "epoch": 2350} {"train_loss": -39.6837158203125, "global_step": 284468, "epoch": 2350} {"train_loss": -43.105506896972656, "global_step": 284469, "epoch": 2350} {"train_loss": -42.62180426101054, "global_step": 284470, "epoch": 2350, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 0.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.6666666666666666, "test/mean_score": 0.9090909090909091, "val_loss": 2567090.0} {"train_loss": -40.88814926147461, "global_step": 284471, "epoch": 2351} {"train_loss": -41.53634262084961, "global_step": 284472, "epoch": 2351} {"train_loss": -40.37883377075195, "global_step": 284473, "epoch": 2351} {"train_loss": -42.38823318481445, "global_step": 284474, "epoch": 2351} {"train_loss": -41.606964111328125, "global_step": 284475, "epoch": 2351} {"train_loss": -40.96969985961914, "global_step": 284476, "epoch": 2351} {"train_loss": -41.706783294677734, "global_step": 284477, "epoch": 2351} {"train_loss": -41.76978302001953, "global_step": 284478, "epoch": 2351} {"train_loss": -36.74726104736328, "global_step": 284479, "epoch": 2351} {"train_loss": -42.183387756347656, "global_step": 284480, "epoch": 2351} {"train_loss": -39.26076889038086, "global_step": 284481, "epoch": 2351} {"train_loss": -40.82821273803711, "global_step": 284482, "epoch": 2351} {"train_loss": -40.36716842651367, "global_step": 284483, "epoch": 2351} {"train_loss": -40.361080169677734, "global_step": 284484, "epoch": 2351} {"train_loss": -40.08164596557617, "global_step": 284485, "epoch": 2351} {"train_loss": -42.9123420715332, "global_step": 284486, "epoch": 2351} {"train_loss": -40.46342086791992, "global_step": 284487, "epoch": 2351} {"train_loss": -42.354331970214844, "global_step": 284488, "epoch": 2351} {"train_loss": -39.90947341918945, "global_step": 284489, "epoch": 2351} {"train_loss": -41.920501708984375, "global_step": 284490, "epoch": 2351} {"train_loss": -41.4379768371582, "global_step": 284491, "epoch": 2351} {"train_loss": -41.25625228881836, "global_step": 284492, "epoch": 2351} {"train_loss": -41.573089599609375, "global_step": 284493, "epoch": 2351} {"train_loss": -41.42081832885742, "global_step": 284494, "epoch": 2351} {"train_loss": -41.278289794921875, "global_step": 284495, "epoch": 2351} {"train_loss": -41.97308349609375, "global_step": 284496, "epoch": 2351} {"train_loss": -41.9796257019043, "global_step": 284497, "epoch": 2351} {"train_loss": -41.77409744262695, "global_step": 284498, "epoch": 2351} {"train_loss": -41.8861083984375, "global_step": 284499, "epoch": 2351} {"train_loss": -41.6580696105957, "global_step": 284500, "epoch": 2351} {"train_loss": -42.87282943725586, "global_step": 284501, "epoch": 2351} {"train_loss": -42.45033645629883, "global_step": 284502, "epoch": 2351} {"train_loss": -42.33436965942383, "global_step": 284503, "epoch": 2351} {"train_loss": -41.472633361816406, "global_step": 284504, "epoch": 2351} {"train_loss": -41.98665237426758, "global_step": 284505, "epoch": 2351} {"train_loss": -42.08927536010742, "global_step": 284506, "epoch": 2351} {"train_loss": -42.517677307128906, "global_step": 284507, "epoch": 2351} {"train_loss": -42.51091766357422, "global_step": 284508, "epoch": 2351} {"train_loss": -42.14645004272461, "global_step": 284509, "epoch": 2351} {"train_loss": -42.81103515625, "global_step": 284510, "epoch": 2351} {"train_loss": -42.994197845458984, "global_step": 284511, "epoch": 2351} {"train_loss": -42.42499923706055, "global_step": 284512, "epoch": 2351} {"train_loss": -42.809959411621094, "global_step": 284513, "epoch": 2351} {"train_loss": -41.84648895263672, "global_step": 284514, "epoch": 2351} {"train_loss": -42.63715744018555, "global_step": 284515, "epoch": 2351} {"train_loss": -42.595947265625, "global_step": 284516, "epoch": 2351} {"train_loss": -43.04121398925781, "global_step": 284517, "epoch": 2351} {"train_loss": -43.2215690612793, "global_step": 284518, "epoch": 2351} {"train_loss": -42.11385726928711, "global_step": 284519, "epoch": 2351} {"train_loss": -42.80451583862305, "global_step": 284520, "epoch": 2351} {"train_loss": -43.10492706298828, "global_step": 284521, "epoch": 2351} {"train_loss": -42.46879196166992, "global_step": 284522, "epoch": 2351} {"train_loss": -43.41033172607422, "global_step": 284523, "epoch": 2351} {"train_loss": -41.98679733276367, "global_step": 284524, "epoch": 2351} {"train_loss": -43.92226028442383, "global_step": 284525, "epoch": 2351} {"train_loss": -42.792503356933594, "global_step": 284526, "epoch": 2351} {"train_loss": -42.44578552246094, "global_step": 284527, "epoch": 2351} {"train_loss": -43.96506881713867, "global_step": 284528, "epoch": 2351} {"train_loss": -43.13103485107422, "global_step": 284529, "epoch": 2351} {"train_loss": -43.63532638549805, "global_step": 284530, "epoch": 2351} {"train_loss": -43.00012969970703, "global_step": 284531, "epoch": 2351} {"train_loss": -42.38955307006836, "global_step": 284532, "epoch": 2351} {"train_loss": -42.51070022583008, "global_step": 284533, "epoch": 2351} {"train_loss": -43.03618621826172, "global_step": 284534, "epoch": 2351} {"train_loss": -42.626522064208984, "global_step": 284535, "epoch": 2351} {"train_loss": -43.16120147705078, "global_step": 284536, "epoch": 2351} {"train_loss": -43.33206558227539, "global_step": 284537, "epoch": 2351} {"train_loss": -43.68156814575195, "global_step": 284538, "epoch": 2351} {"train_loss": -42.25503158569336, "global_step": 284539, "epoch": 2351} {"train_loss": -43.3354606628418, "global_step": 284540, "epoch": 2351} {"train_loss": -43.16682434082031, "global_step": 284541, "epoch": 2351} {"train_loss": -43.669898986816406, "global_step": 284542, "epoch": 2351} {"train_loss": -43.09762191772461, "global_step": 284543, "epoch": 2351} {"train_loss": -43.41689682006836, "global_step": 284544, "epoch": 2351} {"train_loss": -43.620487213134766, "global_step": 284545, "epoch": 2351} {"train_loss": -43.31706619262695, "global_step": 284546, "epoch": 2351} {"train_loss": -43.708152770996094, "global_step": 284547, "epoch": 2351} {"train_loss": -43.62298583984375, "global_step": 284548, "epoch": 2351} {"train_loss": -43.19077682495117, "global_step": 284549, "epoch": 2351} {"train_loss": -43.60921096801758, "global_step": 284550, "epoch": 2351} {"train_loss": -44.02132797241211, "global_step": 284551, "epoch": 2351} {"train_loss": -44.051856994628906, "global_step": 284552, "epoch": 2351} {"train_loss": -43.969478607177734, "global_step": 284553, "epoch": 2351} {"train_loss": -44.05284881591797, "global_step": 284554, "epoch": 2351} {"train_loss": -44.34507751464844, "global_step": 284555, "epoch": 2351} {"train_loss": -43.48208999633789, "global_step": 284556, "epoch": 2351} {"train_loss": -44.2513313293457, "global_step": 284557, "epoch": 2351} {"train_loss": -43.652339935302734, "global_step": 284558, "epoch": 2351} {"train_loss": -44.20802688598633, "global_step": 284559, "epoch": 2351} {"train_loss": -43.7412223815918, "global_step": 284560, "epoch": 2351} {"train_loss": -43.746315002441406, "global_step": 284561, "epoch": 2351} {"train_loss": -44.075225830078125, "global_step": 284562, "epoch": 2351} {"train_loss": -43.6075553894043, "global_step": 284563, "epoch": 2351} {"train_loss": -44.13637924194336, "global_step": 284564, "epoch": 2351} {"train_loss": -43.62797927856445, "global_step": 284565, "epoch": 2351} {"train_loss": -43.74017333984375, "global_step": 284566, "epoch": 2351} {"train_loss": -43.1617546081543, "global_step": 284567, "epoch": 2351} {"train_loss": -43.98630905151367, "global_step": 284568, "epoch": 2351} {"train_loss": -42.145423889160156, "global_step": 284569, "epoch": 2351} {"train_loss": -43.3909912109375, "global_step": 284570, "epoch": 2351} {"train_loss": -43.29290771484375, "global_step": 284571, "epoch": 2351} {"train_loss": -43.78915023803711, "global_step": 284572, "epoch": 2351} {"train_loss": -43.19813537597656, "global_step": 284573, "epoch": 2351} {"train_loss": -43.367916107177734, "global_step": 284574, "epoch": 2351} {"train_loss": -43.605831146240234, "global_step": 284575, "epoch": 2351} {"train_loss": -43.434818267822266, "global_step": 284576, "epoch": 2351} {"train_loss": -43.98212432861328, "global_step": 284577, "epoch": 2351} {"train_loss": -43.60679244995117, "global_step": 284578, "epoch": 2351} {"train_loss": -43.201255798339844, "global_step": 284579, "epoch": 2351} {"train_loss": -43.409080505371094, "global_step": 284580, "epoch": 2351} {"train_loss": -43.738037109375, "global_step": 284581, "epoch": 2351} {"train_loss": -42.7951545715332, "global_step": 284582, "epoch": 2351} {"train_loss": -43.9296989440918, "global_step": 284583, "epoch": 2351} {"train_loss": -43.52731704711914, "global_step": 284584, "epoch": 2351} {"train_loss": -42.73541259765625, "global_step": 284585, "epoch": 2351} {"train_loss": -43.82159423828125, "global_step": 284586, "epoch": 2351} {"train_loss": -43.10725784301758, "global_step": 284587, "epoch": 2351} {"train_loss": -43.364402770996094, "global_step": 284588, "epoch": 2351} {"train_loss": -43.48208999633789, "global_step": 284589, "epoch": 2351} {"train_loss": -41.5769157409668, "global_step": 284590, "epoch": 2351} {"train_loss": -42.689637491525694, "global_step": 284591, "epoch": 2351, "val_loss": 2476338.25} {"train_loss": -40.986175537109375, "global_step": 284592, "epoch": 2352} {"train_loss": -42.854740142822266, "global_step": 284593, "epoch": 2352} {"train_loss": -43.18335723876953, "global_step": 284594, "epoch": 2352} {"train_loss": -42.20999526977539, "global_step": 284595, "epoch": 2352} {"train_loss": -42.99079513549805, "global_step": 284596, "epoch": 2352} {"train_loss": -42.83232498168945, "global_step": 284597, "epoch": 2352} {"train_loss": -42.220245361328125, "global_step": 284598, "epoch": 2352} {"train_loss": -43.46340560913086, "global_step": 284599, "epoch": 2352} {"train_loss": -42.261024475097656, "global_step": 284600, "epoch": 2352} {"train_loss": -42.41103744506836, "global_step": 284601, "epoch": 2352} {"train_loss": -42.505126953125, "global_step": 284602, "epoch": 2352} {"train_loss": -40.35881042480469, "global_step": 284603, "epoch": 2352} {"train_loss": -40.82225799560547, "global_step": 284604, "epoch": 2352} {"train_loss": -43.06662368774414, "global_step": 284605, "epoch": 2352} {"train_loss": -39.56248474121094, "global_step": 284606, "epoch": 2352} {"train_loss": -42.55134201049805, "global_step": 284607, "epoch": 2352} {"train_loss": -39.04048156738281, "global_step": 284608, "epoch": 2352} {"train_loss": -38.46549987792969, "global_step": 284609, "epoch": 2352} {"train_loss": -40.971107482910156, "global_step": 284610, "epoch": 2352} {"train_loss": -40.51398849487305, "global_step": 284611, "epoch": 2352} {"train_loss": -40.36323547363281, "global_step": 284612, "epoch": 2352} {"train_loss": -41.167049407958984, "global_step": 284613, "epoch": 2352} {"train_loss": -41.24055862426758, "global_step": 284614, "epoch": 2352} {"train_loss": -41.34674835205078, "global_step": 284615, "epoch": 2352} {"train_loss": -41.15739822387695, "global_step": 284616, "epoch": 2352} {"train_loss": -41.02180099487305, "global_step": 284617, "epoch": 2352} {"train_loss": -40.3524055480957, "global_step": 284618, "epoch": 2352} {"train_loss": -39.60755920410156, "global_step": 284619, "epoch": 2352} {"train_loss": -39.71978759765625, "global_step": 284620, "epoch": 2352} {"train_loss": -40.05928039550781, "global_step": 284621, "epoch": 2352} {"train_loss": -41.0333251953125, "global_step": 284622, "epoch": 2352} {"train_loss": -41.83623504638672, "global_step": 284623, "epoch": 2352} {"train_loss": -40.97646713256836, "global_step": 284624, "epoch": 2352} {"train_loss": -42.03322982788086, "global_step": 284625, "epoch": 2352} {"train_loss": -42.229251861572266, "global_step": 284626, "epoch": 2352} {"train_loss": -42.182308197021484, "global_step": 284627, "epoch": 2352} {"train_loss": -40.9461784362793, "global_step": 284628, "epoch": 2352} {"train_loss": -41.39970016479492, "global_step": 284629, "epoch": 2352} {"train_loss": -42.29770278930664, "global_step": 284630, "epoch": 2352} {"train_loss": -42.0426025390625, "global_step": 284631, "epoch": 2352} {"train_loss": -40.98714065551758, "global_step": 284632, "epoch": 2352} {"train_loss": -42.191986083984375, "global_step": 284633, "epoch": 2352} {"train_loss": -39.51318359375, "global_step": 284634, "epoch": 2352} {"train_loss": -40.2520866394043, "global_step": 284635, "epoch": 2352} {"train_loss": -40.86907958984375, "global_step": 284636, "epoch": 2352} {"train_loss": -40.4561653137207, "global_step": 284637, "epoch": 2352} {"train_loss": -41.889808654785156, "global_step": 284638, "epoch": 2352} {"train_loss": -41.18709182739258, "global_step": 284639, "epoch": 2352} {"train_loss": -40.8210334777832, "global_step": 284640, "epoch": 2352} {"train_loss": -39.825042724609375, "global_step": 284641, "epoch": 2352} {"train_loss": -41.28736114501953, "global_step": 284642, "epoch": 2352} {"train_loss": -40.98456573486328, "global_step": 284643, "epoch": 2352} {"train_loss": -41.163055419921875, "global_step": 284644, "epoch": 2352} {"train_loss": -40.06476974487305, "global_step": 284645, "epoch": 2352} {"train_loss": -42.09678649902344, "global_step": 284646, "epoch": 2352} {"train_loss": -41.2200813293457, "global_step": 284647, "epoch": 2352} {"train_loss": -42.40824508666992, "global_step": 284648, "epoch": 2352} {"train_loss": -41.493221282958984, "global_step": 284649, "epoch": 2352} {"train_loss": -42.671653747558594, "global_step": 284650, "epoch": 2352} {"train_loss": -43.02085876464844, "global_step": 284651, "epoch": 2352} {"train_loss": -42.49862289428711, "global_step": 284652, "epoch": 2352} {"train_loss": -43.04460144042969, "global_step": 284653, "epoch": 2352} {"train_loss": -42.89358139038086, "global_step": 284654, "epoch": 2352} {"train_loss": -42.69271469116211, "global_step": 284655, "epoch": 2352} {"train_loss": -42.75014877319336, "global_step": 284656, "epoch": 2352} {"train_loss": -43.448787689208984, "global_step": 284657, "epoch": 2352} {"train_loss": -43.393619537353516, "global_step": 284658, "epoch": 2352} {"train_loss": -43.532470703125, "global_step": 284659, "epoch": 2352} {"train_loss": -43.000099182128906, "global_step": 284660, "epoch": 2352} {"train_loss": -43.3288459777832, "global_step": 284661, "epoch": 2352} {"train_loss": -43.11833190917969, "global_step": 284662, "epoch": 2352} {"train_loss": -43.138282775878906, "global_step": 284663, "epoch": 2352} {"train_loss": -43.421974182128906, "global_step": 284664, "epoch": 2352} {"train_loss": -42.893463134765625, "global_step": 284665, "epoch": 2352} {"train_loss": -43.12520980834961, "global_step": 284666, "epoch": 2352} {"train_loss": -42.839500427246094, "global_step": 284667, "epoch": 2352} {"train_loss": -43.486358642578125, "global_step": 284668, "epoch": 2352} {"train_loss": -42.759578704833984, "global_step": 284669, "epoch": 2352} {"train_loss": -43.84205627441406, "global_step": 284670, "epoch": 2352} {"train_loss": -43.954750061035156, "global_step": 284671, "epoch": 2352} {"train_loss": -43.25553512573242, "global_step": 284672, "epoch": 2352} {"train_loss": -42.88642883300781, "global_step": 284673, "epoch": 2352} {"train_loss": -43.28168487548828, "global_step": 284674, "epoch": 2352} {"train_loss": -44.16769027709961, "global_step": 284675, "epoch": 2352} {"train_loss": -43.24516677856445, "global_step": 284676, "epoch": 2352} {"train_loss": -43.732295989990234, "global_step": 284677, "epoch": 2352} {"train_loss": -43.88893508911133, "global_step": 284678, "epoch": 2352} {"train_loss": -43.81876754760742, "global_step": 284679, "epoch": 2352} {"train_loss": -43.921260833740234, "global_step": 284680, "epoch": 2352} {"train_loss": -44.046878814697266, "global_step": 284681, "epoch": 2352} {"train_loss": -44.181819915771484, "global_step": 284682, "epoch": 2352} {"train_loss": -43.86274337768555, "global_step": 284683, "epoch": 2352} {"train_loss": -43.6475944519043, "global_step": 284684, "epoch": 2352} {"train_loss": -43.568336486816406, "global_step": 284685, "epoch": 2352} {"train_loss": -43.66741943359375, "global_step": 284686, "epoch": 2352} {"train_loss": -43.59614944458008, "global_step": 284687, "epoch": 2352} {"train_loss": -44.19751739501953, "global_step": 284688, "epoch": 2352} {"train_loss": -43.65187454223633, "global_step": 284689, "epoch": 2352} {"train_loss": -44.093624114990234, "global_step": 284690, "epoch": 2352} {"train_loss": -44.00295639038086, "global_step": 284691, "epoch": 2352} {"train_loss": -44.22675704956055, "global_step": 284692, "epoch": 2352} {"train_loss": -43.0628662109375, "global_step": 284693, "epoch": 2352} {"train_loss": -43.19321823120117, "global_step": 284694, "epoch": 2352} {"train_loss": -43.67672348022461, "global_step": 284695, "epoch": 2352} {"train_loss": -43.44943618774414, "global_step": 284696, "epoch": 2352} {"train_loss": -42.57322311401367, "global_step": 284697, "epoch": 2352} {"train_loss": -43.26741409301758, "global_step": 284698, "epoch": 2352} {"train_loss": -42.695884704589844, "global_step": 284699, "epoch": 2352} {"train_loss": -43.65317916870117, "global_step": 284700, "epoch": 2352} {"train_loss": -43.672157287597656, "global_step": 284701, "epoch": 2352} {"train_loss": -43.662376403808594, "global_step": 284702, "epoch": 2352} {"train_loss": -43.193450927734375, "global_step": 284703, "epoch": 2352} {"train_loss": -43.06977081298828, "global_step": 284704, "epoch": 2352} {"train_loss": -43.81159210205078, "global_step": 284705, "epoch": 2352} {"train_loss": -43.387874603271484, "global_step": 284706, "epoch": 2352} {"train_loss": -42.25104904174805, "global_step": 284707, "epoch": 2352} {"train_loss": -43.692474365234375, "global_step": 284708, "epoch": 2352} {"train_loss": -43.791015625, "global_step": 284709, "epoch": 2352} {"train_loss": -41.991722106933594, "global_step": 284710, "epoch": 2352} {"train_loss": -42.78021240234375, "global_step": 284711, "epoch": 2352} {"train_loss": -42.36882586518595, "global_step": 284712, "epoch": 2352, "val_loss": 2510882.0} {"train_loss": -42.05628967285156, "global_step": 284713, "epoch": 2353} {"train_loss": -43.1706657409668, "global_step": 284714, "epoch": 2353} {"train_loss": -41.86302185058594, "global_step": 284715, "epoch": 2353} {"train_loss": -42.47685623168945, "global_step": 284716, "epoch": 2353} {"train_loss": -40.97954177856445, "global_step": 284717, "epoch": 2353} {"train_loss": -43.61357879638672, "global_step": 284718, "epoch": 2353} {"train_loss": -41.864078521728516, "global_step": 284719, "epoch": 2353} {"train_loss": -42.42283630371094, "global_step": 284720, "epoch": 2353} {"train_loss": -43.345550537109375, "global_step": 284721, "epoch": 2353} {"train_loss": -41.87879180908203, "global_step": 284722, "epoch": 2353} {"train_loss": -42.43248748779297, "global_step": 284723, "epoch": 2353} {"train_loss": -42.35414505004883, "global_step": 284724, "epoch": 2353} {"train_loss": -43.09405517578125, "global_step": 284725, "epoch": 2353} {"train_loss": -41.9583625793457, "global_step": 284726, "epoch": 2353} {"train_loss": -42.59585189819336, "global_step": 284727, "epoch": 2353} {"train_loss": -41.9713134765625, "global_step": 284728, "epoch": 2353} {"train_loss": -41.5770263671875, "global_step": 284729, "epoch": 2353} {"train_loss": -42.60710525512695, "global_step": 284730, "epoch": 2353} {"train_loss": -36.81257247924805, "global_step": 284731, "epoch": 2353} {"train_loss": -42.88153076171875, "global_step": 284732, "epoch": 2353} {"train_loss": -37.75730514526367, "global_step": 284733, "epoch": 2353} {"train_loss": -39.62646484375, "global_step": 284734, "epoch": 2353} {"train_loss": -40.47583770751953, "global_step": 284735, "epoch": 2353} {"train_loss": -40.91793441772461, "global_step": 284736, "epoch": 2353} {"train_loss": -39.294044494628906, "global_step": 284737, "epoch": 2353} {"train_loss": -41.116294860839844, "global_step": 284738, "epoch": 2353} {"train_loss": -40.516197204589844, "global_step": 284739, "epoch": 2353} {"train_loss": -41.09702682495117, "global_step": 284740, "epoch": 2353} {"train_loss": -38.69715118408203, "global_step": 284741, "epoch": 2353} {"train_loss": -41.36918258666992, "global_step": 284742, "epoch": 2353} {"train_loss": -39.98594665527344, "global_step": 284743, "epoch": 2353} {"train_loss": -41.85604476928711, "global_step": 284744, "epoch": 2353} {"train_loss": -41.63037109375, "global_step": 284745, "epoch": 2353} {"train_loss": -40.87165069580078, "global_step": 284746, "epoch": 2353} {"train_loss": -39.15263748168945, "global_step": 284747, "epoch": 2353} {"train_loss": -39.64889144897461, "global_step": 284748, "epoch": 2353} {"train_loss": -39.23905563354492, "global_step": 284749, "epoch": 2353} {"train_loss": -41.12936019897461, "global_step": 284750, "epoch": 2353} {"train_loss": -39.488651275634766, "global_step": 284751, "epoch": 2353} {"train_loss": -40.98047637939453, "global_step": 284752, "epoch": 2353} {"train_loss": -39.05009078979492, "global_step": 284753, "epoch": 2353} {"train_loss": -42.44281005859375, "global_step": 284754, "epoch": 2353} {"train_loss": -40.881282806396484, "global_step": 284755, "epoch": 2353} {"train_loss": -40.51430892944336, "global_step": 284756, "epoch": 2353} {"train_loss": -40.127662658691406, "global_step": 284757, "epoch": 2353} {"train_loss": -40.42592239379883, "global_step": 284758, "epoch": 2353} {"train_loss": -40.08736038208008, "global_step": 284759, "epoch": 2353} {"train_loss": -40.58774948120117, "global_step": 284760, "epoch": 2353} {"train_loss": -41.56138229370117, "global_step": 284761, "epoch": 2353} {"train_loss": -40.833675384521484, "global_step": 284762, "epoch": 2353} {"train_loss": -40.935401916503906, "global_step": 284763, "epoch": 2353} {"train_loss": -42.11690139770508, "global_step": 284764, "epoch": 2353} {"train_loss": -41.340328216552734, "global_step": 284765, "epoch": 2353} {"train_loss": -41.424076080322266, "global_step": 284766, "epoch": 2353} {"train_loss": -42.169654846191406, "global_step": 284767, "epoch": 2353} {"train_loss": -42.40589141845703, "global_step": 284768, "epoch": 2353} {"train_loss": -41.91830062866211, "global_step": 284769, "epoch": 2353} {"train_loss": -41.73923110961914, "global_step": 284770, "epoch": 2353} {"train_loss": -42.4550895690918, "global_step": 284771, "epoch": 2353} {"train_loss": -42.43603515625, "global_step": 284772, "epoch": 2353} {"train_loss": -42.32792282104492, "global_step": 284773, "epoch": 2353} {"train_loss": -42.95474624633789, "global_step": 284774, "epoch": 2353} {"train_loss": -42.98452377319336, "global_step": 284775, "epoch": 2353} {"train_loss": -42.42341232299805, "global_step": 284776, "epoch": 2353} {"train_loss": -43.041831970214844, "global_step": 284777, "epoch": 2353} {"train_loss": -42.75227737426758, "global_step": 284778, "epoch": 2353} {"train_loss": -42.99818801879883, "global_step": 284779, "epoch": 2353} {"train_loss": -43.70486068725586, "global_step": 284780, "epoch": 2353} {"train_loss": -43.1273307800293, "global_step": 284781, "epoch": 2353} {"train_loss": -43.216285705566406, "global_step": 284782, "epoch": 2353} {"train_loss": -43.598114013671875, "global_step": 284783, "epoch": 2353} {"train_loss": -43.35480880737305, "global_step": 284784, "epoch": 2353} {"train_loss": -43.62225341796875, "global_step": 284785, "epoch": 2353} {"train_loss": -43.31343460083008, "global_step": 284786, "epoch": 2353} {"train_loss": -43.74797439575195, "global_step": 284787, "epoch": 2353} {"train_loss": -43.557403564453125, "global_step": 284788, "epoch": 2353} {"train_loss": -43.75608825683594, "global_step": 284789, "epoch": 2353} {"train_loss": -43.607208251953125, "global_step": 284790, "epoch": 2353} {"train_loss": -43.55208969116211, "global_step": 284791, "epoch": 2353} {"train_loss": -43.4862060546875, "global_step": 284792, "epoch": 2353} {"train_loss": -43.35825729370117, "global_step": 284793, "epoch": 2353} {"train_loss": -43.59071350097656, "global_step": 284794, "epoch": 2353} {"train_loss": -42.551212310791016, "global_step": 284795, "epoch": 2353} {"train_loss": -43.54253005981445, "global_step": 284796, "epoch": 2353} {"train_loss": -44.01029586791992, "global_step": 284797, "epoch": 2353} {"train_loss": -43.93111801147461, "global_step": 284798, "epoch": 2353} {"train_loss": -43.93972396850586, "global_step": 284799, "epoch": 2353} {"train_loss": -44.18854522705078, "global_step": 284800, "epoch": 2353} {"train_loss": -43.509544372558594, "global_step": 284801, "epoch": 2353} {"train_loss": -44.47066879272461, "global_step": 284802, "epoch": 2353} {"train_loss": -44.06957244873047, "global_step": 284803, "epoch": 2353} {"train_loss": -44.13823699951172, "global_step": 284804, "epoch": 2353} {"train_loss": -44.59189987182617, "global_step": 284805, "epoch": 2353} {"train_loss": -43.5808219909668, "global_step": 284806, "epoch": 2353} {"train_loss": -43.9810905456543, "global_step": 284807, "epoch": 2353} {"train_loss": -43.84339141845703, "global_step": 284808, "epoch": 2353} {"train_loss": -44.01479721069336, "global_step": 284809, "epoch": 2353} {"train_loss": -44.01020050048828, "global_step": 284810, "epoch": 2353} {"train_loss": -44.387489318847656, "global_step": 284811, "epoch": 2353} {"train_loss": -44.22372055053711, "global_step": 284812, "epoch": 2353} {"train_loss": -44.499664306640625, "global_step": 284813, "epoch": 2353} {"train_loss": -44.005836486816406, "global_step": 284814, "epoch": 2353} {"train_loss": -44.52046585083008, "global_step": 284815, "epoch": 2353} {"train_loss": -44.80073165893555, "global_step": 284816, "epoch": 2353} {"train_loss": -44.01402282714844, "global_step": 284817, "epoch": 2353} {"train_loss": -44.07881546020508, "global_step": 284818, "epoch": 2353} {"train_loss": -44.152099609375, "global_step": 284819, "epoch": 2353} {"train_loss": -44.57897186279297, "global_step": 284820, "epoch": 2353} {"train_loss": -44.11458206176758, "global_step": 284821, "epoch": 2353} {"train_loss": -44.70615768432617, "global_step": 284822, "epoch": 2353} {"train_loss": -44.50626754760742, "global_step": 284823, "epoch": 2353} {"train_loss": -42.7145881652832, "global_step": 284824, "epoch": 2353} {"train_loss": -42.174503326416016, "global_step": 284825, "epoch": 2353} {"train_loss": -43.485816955566406, "global_step": 284826, "epoch": 2353} {"train_loss": -43.495601654052734, "global_step": 284827, "epoch": 2353} {"train_loss": -43.48359298706055, "global_step": 284828, "epoch": 2353} {"train_loss": -44.2139778137207, "global_step": 284829, "epoch": 2353} {"train_loss": -44.37929153442383, "global_step": 284830, "epoch": 2353} {"train_loss": -44.0230827331543, "global_step": 284831, "epoch": 2353} {"train_loss": -43.76831817626953, "global_step": 284832, "epoch": 2353} {"train_loss": -42.467352465164566, "global_step": 284833, "epoch": 2353, "val_loss": 2528562.0} {"train_loss": -43.90049362182617, "global_step": 284834, "epoch": 2354} {"train_loss": -44.27838134765625, "global_step": 284835, "epoch": 2354} {"train_loss": -43.94572830200195, "global_step": 284836, "epoch": 2354} {"train_loss": -44.133785247802734, "global_step": 284837, "epoch": 2354} {"train_loss": -43.649993896484375, "global_step": 284838, "epoch": 2354} {"train_loss": -44.00226593017578, "global_step": 284839, "epoch": 2354} {"train_loss": -43.39768600463867, "global_step": 284840, "epoch": 2354} {"train_loss": -43.56757736206055, "global_step": 284841, "epoch": 2354} {"train_loss": -43.50868225097656, "global_step": 284842, "epoch": 2354} {"train_loss": -42.788856506347656, "global_step": 284843, "epoch": 2354} {"train_loss": -41.98918533325195, "global_step": 284844, "epoch": 2354} {"train_loss": -44.12980270385742, "global_step": 284845, "epoch": 2354} {"train_loss": -43.46848678588867, "global_step": 284846, "epoch": 2354} {"train_loss": -43.00404739379883, "global_step": 284847, "epoch": 2354} {"train_loss": -44.03306198120117, "global_step": 284848, "epoch": 2354} {"train_loss": -43.23884201049805, "global_step": 284849, "epoch": 2354} {"train_loss": -42.21076965332031, "global_step": 284850, "epoch": 2354} {"train_loss": -42.5376091003418, "global_step": 284851, "epoch": 2354} {"train_loss": -44.343257904052734, "global_step": 284852, "epoch": 2354} {"train_loss": -42.410457611083984, "global_step": 284853, "epoch": 2354} {"train_loss": -42.778072357177734, "global_step": 284854, "epoch": 2354} {"train_loss": -43.78434371948242, "global_step": 284855, "epoch": 2354} {"train_loss": -41.63776397705078, "global_step": 284856, "epoch": 2354} {"train_loss": -44.13499069213867, "global_step": 284857, "epoch": 2354} {"train_loss": -39.23374557495117, "global_step": 284858, "epoch": 2354} {"train_loss": -40.16126251220703, "global_step": 284859, "epoch": 2354} {"train_loss": -41.758785247802734, "global_step": 284860, "epoch": 2354} {"train_loss": -40.5461311340332, "global_step": 284861, "epoch": 2354} {"train_loss": -36.96797180175781, "global_step": 284862, "epoch": 2354} {"train_loss": -39.247337341308594, "global_step": 284863, "epoch": 2354} {"train_loss": -40.932491302490234, "global_step": 284864, "epoch": 2354} {"train_loss": -39.04896926879883, "global_step": 284865, "epoch": 2354} {"train_loss": -39.907108306884766, "global_step": 284866, "epoch": 2354} {"train_loss": -40.21574020385742, "global_step": 284867, "epoch": 2354} {"train_loss": -41.806453704833984, "global_step": 284868, "epoch": 2354} {"train_loss": -40.454139709472656, "global_step": 284869, "epoch": 2354} {"train_loss": -36.510498046875, "global_step": 284870, "epoch": 2354} {"train_loss": -24.596914291381836, "global_step": 284871, "epoch": 2354} {"train_loss": -31.828540802001953, "global_step": 284872, "epoch": 2354} {"train_loss": -29.21173095703125, "global_step": 284873, "epoch": 2354} {"train_loss": -33.8654899597168, "global_step": 284874, "epoch": 2354} {"train_loss": -27.58676528930664, "global_step": 284875, "epoch": 2354} {"train_loss": -34.64433670043945, "global_step": 284876, "epoch": 2354} {"train_loss": -29.77144432067871, "global_step": 284877, "epoch": 2354} {"train_loss": -36.28823471069336, "global_step": 284878, "epoch": 2354} {"train_loss": -32.6604118347168, "global_step": 284879, "epoch": 2354} {"train_loss": -35.6049919128418, "global_step": 284880, "epoch": 2354} {"train_loss": -35.779930114746094, "global_step": 284881, "epoch": 2354} {"train_loss": -35.550899505615234, "global_step": 284882, "epoch": 2354} {"train_loss": -37.48054504394531, "global_step": 284883, "epoch": 2354} {"train_loss": -35.696189880371094, "global_step": 284884, "epoch": 2354} {"train_loss": -36.27450180053711, "global_step": 284885, "epoch": 2354} {"train_loss": -37.33991622924805, "global_step": 284886, "epoch": 2354} {"train_loss": -36.5211296081543, "global_step": 284887, "epoch": 2354} {"train_loss": -37.04187774658203, "global_step": 284888, "epoch": 2354} {"train_loss": -38.20060348510742, "global_step": 284889, "epoch": 2354} {"train_loss": -37.173763275146484, "global_step": 284890, "epoch": 2354} {"train_loss": -37.05149459838867, "global_step": 284891, "epoch": 2354} {"train_loss": -38.152435302734375, "global_step": 284892, "epoch": 2354} {"train_loss": -37.965660095214844, "global_step": 284893, "epoch": 2354} {"train_loss": -36.48231506347656, "global_step": 284894, "epoch": 2354} {"train_loss": -37.74148178100586, "global_step": 284895, "epoch": 2354} {"train_loss": -37.94873809814453, "global_step": 284896, "epoch": 2354} {"train_loss": -38.0693359375, "global_step": 284897, "epoch": 2354} {"train_loss": -38.3962287902832, "global_step": 284898, "epoch": 2354} {"train_loss": -38.535274505615234, "global_step": 284899, "epoch": 2354} {"train_loss": -37.82069396972656, "global_step": 284900, "epoch": 2354} {"train_loss": -37.58205795288086, "global_step": 284901, "epoch": 2354} {"train_loss": -38.449249267578125, "global_step": 284902, "epoch": 2354} {"train_loss": -38.93175506591797, "global_step": 284903, "epoch": 2354} {"train_loss": -38.6428337097168, "global_step": 284904, "epoch": 2354} {"train_loss": -38.22624206542969, "global_step": 284905, "epoch": 2354} {"train_loss": -38.889305114746094, "global_step": 284906, "epoch": 2354} {"train_loss": -39.18748092651367, "global_step": 284907, "epoch": 2354} {"train_loss": -39.59333038330078, "global_step": 284908, "epoch": 2354} {"train_loss": -39.4246826171875, "global_step": 284909, "epoch": 2354} {"train_loss": -38.95623016357422, "global_step": 284910, "epoch": 2354} {"train_loss": -39.539398193359375, "global_step": 284911, "epoch": 2354} {"train_loss": -39.74978256225586, "global_step": 284912, "epoch": 2354} {"train_loss": -39.733158111572266, "global_step": 284913, "epoch": 2354} {"train_loss": -39.58618927001953, "global_step": 284914, "epoch": 2354} {"train_loss": -39.36604690551758, "global_step": 284915, "epoch": 2354} {"train_loss": -39.151424407958984, "global_step": 284916, "epoch": 2354} {"train_loss": -40.30513381958008, "global_step": 284917, "epoch": 2354} {"train_loss": -39.840572357177734, "global_step": 284918, "epoch": 2354} {"train_loss": -39.419246673583984, "global_step": 284919, "epoch": 2354} {"train_loss": -39.52573776245117, "global_step": 284920, "epoch": 2354} {"train_loss": -39.94759750366211, "global_step": 284921, "epoch": 2354} {"train_loss": -40.18124771118164, "global_step": 284922, "epoch": 2354} {"train_loss": -40.3099365234375, "global_step": 284923, "epoch": 2354} {"train_loss": -40.105892181396484, "global_step": 284924, "epoch": 2354} {"train_loss": -39.971092224121094, "global_step": 284925, "epoch": 2354} {"train_loss": -39.879173278808594, "global_step": 284926, "epoch": 2354} {"train_loss": -39.415897369384766, "global_step": 284927, "epoch": 2354} {"train_loss": -38.011959075927734, "global_step": 284928, "epoch": 2354} {"train_loss": -35.74288558959961, "global_step": 284929, "epoch": 2354} {"train_loss": -38.971771240234375, "global_step": 284930, "epoch": 2354} {"train_loss": -40.7711181640625, "global_step": 284931, "epoch": 2354} {"train_loss": -38.38888168334961, "global_step": 284932, "epoch": 2354} {"train_loss": -39.92473602294922, "global_step": 284933, "epoch": 2354} {"train_loss": -40.11357116699219, "global_step": 284934, "epoch": 2354} {"train_loss": -39.779720306396484, "global_step": 284935, "epoch": 2354} {"train_loss": -41.18624496459961, "global_step": 284936, "epoch": 2354} {"train_loss": -39.59423828125, "global_step": 284937, "epoch": 2354} {"train_loss": -40.694210052490234, "global_step": 284938, "epoch": 2354} {"train_loss": -40.831817626953125, "global_step": 284939, "epoch": 2354} {"train_loss": -40.70009994506836, "global_step": 284940, "epoch": 2354} {"train_loss": -40.6458740234375, "global_step": 284941, "epoch": 2354} {"train_loss": -40.43070602416992, "global_step": 284942, "epoch": 2354} {"train_loss": -40.221153259277344, "global_step": 284943, "epoch": 2354} {"train_loss": -40.296104431152344, "global_step": 284944, "epoch": 2354} {"train_loss": -40.366817474365234, "global_step": 284945, "epoch": 2354} {"train_loss": -41.07754135131836, "global_step": 284946, "epoch": 2354} {"train_loss": -40.921817779541016, "global_step": 284947, "epoch": 2354} {"train_loss": -40.99292755126953, "global_step": 284948, "epoch": 2354} {"train_loss": -41.19806671142578, "global_step": 284949, "epoch": 2354} {"train_loss": -40.89693832397461, "global_step": 284950, "epoch": 2354} {"train_loss": -41.25121307373047, "global_step": 284951, "epoch": 2354} {"train_loss": -40.60457229614258, "global_step": 284952, "epoch": 2354} {"train_loss": -40.95481491088867, "global_step": 284953, "epoch": 2354} {"train_loss": -39.40765850603088, "global_step": 284954, "epoch": 2354, "val_loss": 2498016.75} {"train_loss": -41.12894821166992, "global_step": 284955, "epoch": 2355} {"train_loss": -40.98821258544922, "global_step": 284956, "epoch": 2355} {"train_loss": -41.337886810302734, "global_step": 284957, "epoch": 2355} {"train_loss": -41.19074249267578, "global_step": 284958, "epoch": 2355} {"train_loss": -41.479862213134766, "global_step": 284959, "epoch": 2355} {"train_loss": -41.324092864990234, "global_step": 284960, "epoch": 2355} {"train_loss": -41.79633331298828, "global_step": 284961, "epoch": 2355} {"train_loss": -41.90358352661133, "global_step": 284962, "epoch": 2355} {"train_loss": -41.081695556640625, "global_step": 284963, "epoch": 2355} {"train_loss": -41.10456466674805, "global_step": 284964, "epoch": 2355} {"train_loss": -41.22907638549805, "global_step": 284965, "epoch": 2355} {"train_loss": -41.633460998535156, "global_step": 284966, "epoch": 2355} {"train_loss": -41.634521484375, "global_step": 284967, "epoch": 2355} {"train_loss": -41.54731369018555, "global_step": 284968, "epoch": 2355} {"train_loss": -41.56180953979492, "global_step": 284969, "epoch": 2355} {"train_loss": -41.42784881591797, "global_step": 284970, "epoch": 2355} {"train_loss": -41.81616973876953, "global_step": 284971, "epoch": 2355} {"train_loss": -42.750038146972656, "global_step": 284972, "epoch": 2355} {"train_loss": -41.86967849731445, "global_step": 284973, "epoch": 2355} {"train_loss": -41.75584030151367, "global_step": 284974, "epoch": 2355} {"train_loss": -41.86888122558594, "global_step": 284975, "epoch": 2355} {"train_loss": -41.983009338378906, "global_step": 284976, "epoch": 2355} {"train_loss": -41.831092834472656, "global_step": 284977, "epoch": 2355} {"train_loss": -42.205665588378906, "global_step": 284978, "epoch": 2355} {"train_loss": -42.73765182495117, "global_step": 284979, "epoch": 2355} {"train_loss": -41.912872314453125, "global_step": 284980, "epoch": 2355} {"train_loss": -42.115966796875, "global_step": 284981, "epoch": 2355} {"train_loss": -41.9323844909668, "global_step": 284982, "epoch": 2355} {"train_loss": -42.52676010131836, "global_step": 284983, "epoch": 2355} {"train_loss": -42.06113815307617, "global_step": 284984, "epoch": 2355} {"train_loss": -41.94271469116211, "global_step": 284985, "epoch": 2355} {"train_loss": -42.079444885253906, "global_step": 284986, "epoch": 2355} {"train_loss": -42.48847579956055, "global_step": 284987, "epoch": 2355} {"train_loss": -42.43488311767578, "global_step": 284988, "epoch": 2355} {"train_loss": -42.04148483276367, "global_step": 284989, "epoch": 2355} {"train_loss": -41.260860443115234, "global_step": 284990, "epoch": 2355} {"train_loss": -42.548866271972656, "global_step": 284991, "epoch": 2355} {"train_loss": -42.478389739990234, "global_step": 284992, "epoch": 2355} {"train_loss": -42.56694412231445, "global_step": 284993, "epoch": 2355} {"train_loss": -40.19752883911133, "global_step": 284994, "epoch": 2355} {"train_loss": -41.88536071777344, "global_step": 284995, "epoch": 2355} {"train_loss": -42.09005355834961, "global_step": 284996, "epoch": 2355} {"train_loss": -42.11562728881836, "global_step": 284997, "epoch": 2355} {"train_loss": -41.5913200378418, "global_step": 284998, "epoch": 2355} {"train_loss": -42.59048080444336, "global_step": 284999, "epoch": 2355} {"train_loss": -42.22066879272461, "global_step": 285000, "epoch": 2355} {"train_loss": -42.39447021484375, "global_step": 285001, "epoch": 2355} {"train_loss": -42.1970329284668, "global_step": 285002, "epoch": 2355} {"train_loss": -42.88210678100586, "global_step": 285003, "epoch": 2355} {"train_loss": -42.439449310302734, "global_step": 285004, "epoch": 2355} {"train_loss": -41.84210205078125, "global_step": 285005, "epoch": 2355} {"train_loss": -39.76301956176758, "global_step": 285006, "epoch": 2355} {"train_loss": -36.33807373046875, "global_step": 285007, "epoch": 2355} {"train_loss": -31.70429039001465, "global_step": 285008, "epoch": 2355} {"train_loss": -39.17116928100586, "global_step": 285009, "epoch": 2355} {"train_loss": -39.87844467163086, "global_step": 285010, "epoch": 2355} {"train_loss": -33.26880645751953, "global_step": 285011, "epoch": 2355} {"train_loss": -39.93154525756836, "global_step": 285012, "epoch": 2355} {"train_loss": -40.25177001953125, "global_step": 285013, "epoch": 2355} {"train_loss": -37.4109992980957, "global_step": 285014, "epoch": 2355} {"train_loss": -41.20363998413086, "global_step": 285015, "epoch": 2355} {"train_loss": -39.56324005126953, "global_step": 285016, "epoch": 2355} {"train_loss": -40.01052474975586, "global_step": 285017, "epoch": 2355} {"train_loss": -40.397857666015625, "global_step": 285018, "epoch": 2355} {"train_loss": -38.74663162231445, "global_step": 285019, "epoch": 2355} {"train_loss": -39.84695053100586, "global_step": 285020, "epoch": 2355} {"train_loss": -39.531005859375, "global_step": 285021, "epoch": 2355} {"train_loss": -40.263282775878906, "global_step": 285022, "epoch": 2355} {"train_loss": -40.35026931762695, "global_step": 285023, "epoch": 2355} {"train_loss": -39.393489837646484, "global_step": 285024, "epoch": 2355} {"train_loss": -39.860694885253906, "global_step": 285025, "epoch": 2355} {"train_loss": -40.694252014160156, "global_step": 285026, "epoch": 2355} {"train_loss": -40.05173110961914, "global_step": 285027, "epoch": 2355} {"train_loss": -40.55338668823242, "global_step": 285028, "epoch": 2355} {"train_loss": -40.15968704223633, "global_step": 285029, "epoch": 2355} {"train_loss": -40.9775505065918, "global_step": 285030, "epoch": 2355} {"train_loss": -40.54913330078125, "global_step": 285031, "epoch": 2355} {"train_loss": -39.75099182128906, "global_step": 285032, "epoch": 2355} {"train_loss": -38.58192825317383, "global_step": 285033, "epoch": 2355} {"train_loss": -40.87174606323242, "global_step": 285034, "epoch": 2355} {"train_loss": -39.7524528503418, "global_step": 285035, "epoch": 2355} {"train_loss": -40.433834075927734, "global_step": 285036, "epoch": 2355} {"train_loss": -39.6697883605957, "global_step": 285037, "epoch": 2355} {"train_loss": -40.889827728271484, "global_step": 285038, "epoch": 2355} {"train_loss": -41.18854522705078, "global_step": 285039, "epoch": 2355} {"train_loss": -40.9058723449707, "global_step": 285040, "epoch": 2355} {"train_loss": -38.80283737182617, "global_step": 285041, "epoch": 2355} {"train_loss": -40.945228576660156, "global_step": 285042, "epoch": 2355} {"train_loss": -40.96259307861328, "global_step": 285043, "epoch": 2355} {"train_loss": -40.597103118896484, "global_step": 285044, "epoch": 2355} {"train_loss": -41.660709381103516, "global_step": 285045, "epoch": 2355} {"train_loss": -41.03152084350586, "global_step": 285046, "epoch": 2355} {"train_loss": -41.5531120300293, "global_step": 285047, "epoch": 2355} {"train_loss": -40.27167892456055, "global_step": 285048, "epoch": 2355} {"train_loss": -41.03007125854492, "global_step": 285049, "epoch": 2355} {"train_loss": -41.730472564697266, "global_step": 285050, "epoch": 2355} {"train_loss": -41.32415771484375, "global_step": 285051, "epoch": 2355} {"train_loss": -41.10183334350586, "global_step": 285052, "epoch": 2355} {"train_loss": -38.891143798828125, "global_step": 285053, "epoch": 2355} {"train_loss": -40.248592376708984, "global_step": 285054, "epoch": 2355} {"train_loss": -41.725128173828125, "global_step": 285055, "epoch": 2355} {"train_loss": -39.99327087402344, "global_step": 285056, "epoch": 2355} {"train_loss": -40.62293243408203, "global_step": 285057, "epoch": 2355} {"train_loss": -39.06679916381836, "global_step": 285058, "epoch": 2355} {"train_loss": -41.167442321777344, "global_step": 285059, "epoch": 2355} {"train_loss": -40.09296798706055, "global_step": 285060, "epoch": 2355} {"train_loss": -40.4630012512207, "global_step": 285061, "epoch": 2355} {"train_loss": -39.99149703979492, "global_step": 285062, "epoch": 2355} {"train_loss": -41.40437698364258, "global_step": 285063, "epoch": 2355} {"train_loss": -41.00438690185547, "global_step": 285064, "epoch": 2355} {"train_loss": -37.97492218017578, "global_step": 285065, "epoch": 2355} {"train_loss": -41.02317428588867, "global_step": 285066, "epoch": 2355} {"train_loss": -41.07984924316406, "global_step": 285067, "epoch": 2355} {"train_loss": -40.43765640258789, "global_step": 285068, "epoch": 2355} {"train_loss": -40.474178314208984, "global_step": 285069, "epoch": 2355} {"train_loss": -40.48621368408203, "global_step": 285070, "epoch": 2355} {"train_loss": -40.27201461791992, "global_step": 285071, "epoch": 2355} {"train_loss": -39.94709396362305, "global_step": 285072, "epoch": 2355} {"train_loss": -39.66560745239258, "global_step": 285073, "epoch": 2355} {"train_loss": -39.0448112487793, "global_step": 285074, "epoch": 2355} {"train_loss": -40.773057811516374, "global_step": 285075, "epoch": 2355, "val_loss": 2567540.25} {"train_loss": -40.63190841674805, "global_step": 285076, "epoch": 2356} {"train_loss": -41.24229049682617, "global_step": 285077, "epoch": 2356} {"train_loss": -41.353424072265625, "global_step": 285078, "epoch": 2356} {"train_loss": -38.55709457397461, "global_step": 285079, "epoch": 2356} {"train_loss": -40.785335540771484, "global_step": 285080, "epoch": 2356} {"train_loss": -39.94448471069336, "global_step": 285081, "epoch": 2356} {"train_loss": -40.86852264404297, "global_step": 285082, "epoch": 2356} {"train_loss": -41.30424118041992, "global_step": 285083, "epoch": 2356} {"train_loss": -40.91038131713867, "global_step": 285084, "epoch": 2356} {"train_loss": -40.6956901550293, "global_step": 285085, "epoch": 2356} {"train_loss": -39.47713851928711, "global_step": 285086, "epoch": 2356} {"train_loss": -37.9623908996582, "global_step": 285087, "epoch": 2356} {"train_loss": -40.96818923950195, "global_step": 285088, "epoch": 2356} {"train_loss": -40.57639694213867, "global_step": 285089, "epoch": 2356} {"train_loss": -38.62880325317383, "global_step": 285090, "epoch": 2356} {"train_loss": -41.0142936706543, "global_step": 285091, "epoch": 2356} {"train_loss": -41.53300857543945, "global_step": 285092, "epoch": 2356} {"train_loss": -41.15104293823242, "global_step": 285093, "epoch": 2356} {"train_loss": -40.07668685913086, "global_step": 285094, "epoch": 2356} {"train_loss": -39.61228561401367, "global_step": 285095, "epoch": 2356} {"train_loss": -24.479795455932617, "global_step": 285096, "epoch": 2356} {"train_loss": -40.661354064941406, "global_step": 285097, "epoch": 2356} {"train_loss": -39.92780685424805, "global_step": 285098, "epoch": 2356} {"train_loss": -35.684261322021484, "global_step": 285099, "epoch": 2356} {"train_loss": -19.495222091674805, "global_step": 285100, "epoch": 2356} {"train_loss": -32.16374969482422, "global_step": 285101, "epoch": 2356} {"train_loss": -34.65580368041992, "global_step": 285102, "epoch": 2356} {"train_loss": -28.820068359375, "global_step": 285103, "epoch": 2356} {"train_loss": -36.16630172729492, "global_step": 285104, "epoch": 2356} {"train_loss": -35.52991485595703, "global_step": 285105, "epoch": 2356} {"train_loss": -36.91487503051758, "global_step": 285106, "epoch": 2356} {"train_loss": -32.4311637878418, "global_step": 285107, "epoch": 2356} {"train_loss": -32.95586013793945, "global_step": 285108, "epoch": 2356} {"train_loss": -36.624393463134766, "global_step": 285109, "epoch": 2356} {"train_loss": -31.431577682495117, "global_step": 285110, "epoch": 2356} {"train_loss": -37.8254280090332, "global_step": 285111, "epoch": 2356} {"train_loss": -37.639251708984375, "global_step": 285112, "epoch": 2356} {"train_loss": -37.313941955566406, "global_step": 285113, "epoch": 2356} {"train_loss": -36.21928024291992, "global_step": 285114, "epoch": 2356} {"train_loss": -35.01274490356445, "global_step": 285115, "epoch": 2356} {"train_loss": -38.11256408691406, "global_step": 285116, "epoch": 2356} {"train_loss": -35.22365951538086, "global_step": 285117, "epoch": 2356} {"train_loss": -38.32316589355469, "global_step": 285118, "epoch": 2356} {"train_loss": -37.84816360473633, "global_step": 285119, "epoch": 2356} {"train_loss": -37.8169059753418, "global_step": 285120, "epoch": 2356} {"train_loss": -36.216766357421875, "global_step": 285121, "epoch": 2356} {"train_loss": -36.88051223754883, "global_step": 285122, "epoch": 2356} {"train_loss": -38.12305450439453, "global_step": 285123, "epoch": 2356} {"train_loss": -36.517616271972656, "global_step": 285124, "epoch": 2356} {"train_loss": -33.18122482299805, "global_step": 285125, "epoch": 2356} {"train_loss": -37.132286071777344, "global_step": 285126, "epoch": 2356} {"train_loss": -38.68421173095703, "global_step": 285127, "epoch": 2356} {"train_loss": -38.6897087097168, "global_step": 285128, "epoch": 2356} {"train_loss": -38.30647659301758, "global_step": 285129, "epoch": 2356} {"train_loss": -38.91086959838867, "global_step": 285130, "epoch": 2356} {"train_loss": -39.04343795776367, "global_step": 285131, "epoch": 2356} {"train_loss": -39.28829574584961, "global_step": 285132, "epoch": 2356} {"train_loss": -36.35166549682617, "global_step": 285133, "epoch": 2356} {"train_loss": -38.816707611083984, "global_step": 285134, "epoch": 2356} {"train_loss": -39.639137268066406, "global_step": 285135, "epoch": 2356} {"train_loss": -38.655799865722656, "global_step": 285136, "epoch": 2356} {"train_loss": -39.58639144897461, "global_step": 285137, "epoch": 2356} {"train_loss": -38.60154342651367, "global_step": 285138, "epoch": 2356} {"train_loss": -39.69732666015625, "global_step": 285139, "epoch": 2356} {"train_loss": -39.105934143066406, "global_step": 285140, "epoch": 2356} {"train_loss": -38.659912109375, "global_step": 285141, "epoch": 2356} {"train_loss": -39.903724670410156, "global_step": 285142, "epoch": 2356} {"train_loss": -40.33469772338867, "global_step": 285143, "epoch": 2356} {"train_loss": -39.73843002319336, "global_step": 285144, "epoch": 2356} {"train_loss": -39.91519546508789, "global_step": 285145, "epoch": 2356} {"train_loss": -39.37051773071289, "global_step": 285146, "epoch": 2356} {"train_loss": -39.58696365356445, "global_step": 285147, "epoch": 2356} {"train_loss": -39.58207321166992, "global_step": 285148, "epoch": 2356} {"train_loss": -39.97304153442383, "global_step": 285149, "epoch": 2356} {"train_loss": -40.425716400146484, "global_step": 285150, "epoch": 2356} {"train_loss": -39.5576286315918, "global_step": 285151, "epoch": 2356} {"train_loss": -39.63980484008789, "global_step": 285152, "epoch": 2356} {"train_loss": -39.88474655151367, "global_step": 285153, "epoch": 2356} {"train_loss": -39.43715286254883, "global_step": 285154, "epoch": 2356} {"train_loss": -40.72188186645508, "global_step": 285155, "epoch": 2356} {"train_loss": -40.25010681152344, "global_step": 285156, "epoch": 2356} {"train_loss": -39.7428092956543, "global_step": 285157, "epoch": 2356} {"train_loss": -38.39496994018555, "global_step": 285158, "epoch": 2356} {"train_loss": -39.4713249206543, "global_step": 285159, "epoch": 2356} {"train_loss": -39.95991897583008, "global_step": 285160, "epoch": 2356} {"train_loss": -40.35457992553711, "global_step": 285161, "epoch": 2356} {"train_loss": -40.12974166870117, "global_step": 285162, "epoch": 2356} {"train_loss": -40.046573638916016, "global_step": 285163, "epoch": 2356} {"train_loss": -39.9921989440918, "global_step": 285164, "epoch": 2356} {"train_loss": -39.66067123413086, "global_step": 285165, "epoch": 2356} {"train_loss": -40.373661041259766, "global_step": 285166, "epoch": 2356} {"train_loss": -41.197330474853516, "global_step": 285167, "epoch": 2356} {"train_loss": -40.505672454833984, "global_step": 285168, "epoch": 2356} {"train_loss": -40.25969314575195, "global_step": 285169, "epoch": 2356} {"train_loss": -40.735225677490234, "global_step": 285170, "epoch": 2356} {"train_loss": -40.39848327636719, "global_step": 285171, "epoch": 2356} {"train_loss": -40.8470573425293, "global_step": 285172, "epoch": 2356} {"train_loss": -40.95772933959961, "global_step": 285173, "epoch": 2356} {"train_loss": -40.801204681396484, "global_step": 285174, "epoch": 2356} {"train_loss": -40.462249755859375, "global_step": 285175, "epoch": 2356} {"train_loss": -40.88473129272461, "global_step": 285176, "epoch": 2356} {"train_loss": -40.83974075317383, "global_step": 285177, "epoch": 2356} {"train_loss": -40.69240951538086, "global_step": 285178, "epoch": 2356} {"train_loss": -40.91083526611328, "global_step": 285179, "epoch": 2356} {"train_loss": -41.4422607421875, "global_step": 285180, "epoch": 2356} {"train_loss": -40.54493713378906, "global_step": 285181, "epoch": 2356} {"train_loss": -41.23002624511719, "global_step": 285182, "epoch": 2356} {"train_loss": -41.45454788208008, "global_step": 285183, "epoch": 2356} {"train_loss": -40.34487533569336, "global_step": 285184, "epoch": 2356} {"train_loss": -41.00410842895508, "global_step": 285185, "epoch": 2356} {"train_loss": -41.4625129699707, "global_step": 285186, "epoch": 2356} {"train_loss": -40.478660583496094, "global_step": 285187, "epoch": 2356} {"train_loss": -41.583580017089844, "global_step": 285188, "epoch": 2356} {"train_loss": -40.04423522949219, "global_step": 285189, "epoch": 2356} {"train_loss": -41.27138137817383, "global_step": 285190, "epoch": 2356} {"train_loss": -41.515724182128906, "global_step": 285191, "epoch": 2356} {"train_loss": -40.8151741027832, "global_step": 285192, "epoch": 2356} {"train_loss": -40.52790451049805, "global_step": 285193, "epoch": 2356} {"train_loss": -41.329612731933594, "global_step": 285194, "epoch": 2356} {"train_loss": -41.88521957397461, "global_step": 285195, "epoch": 2356} {"train_loss": -38.848229069355106, "global_step": 285196, "epoch": 2356, "val_loss": 2554579.25} {"train_loss": -41.74858856201172, "global_step": 285197, "epoch": 2357} {"train_loss": -42.118343353271484, "global_step": 285198, "epoch": 2357} {"train_loss": -41.97018051147461, "global_step": 285199, "epoch": 2357} {"train_loss": -41.4189567565918, "global_step": 285200, "epoch": 2357} {"train_loss": -42.249427795410156, "global_step": 285201, "epoch": 2357} {"train_loss": -40.82350540161133, "global_step": 285202, "epoch": 2357} {"train_loss": -41.51629638671875, "global_step": 285203, "epoch": 2357} {"train_loss": -41.74364471435547, "global_step": 285204, "epoch": 2357} {"train_loss": -41.662288665771484, "global_step": 285205, "epoch": 2357} {"train_loss": -41.70904541015625, "global_step": 285206, "epoch": 2357} {"train_loss": -40.953670501708984, "global_step": 285207, "epoch": 2357} {"train_loss": -40.95647048950195, "global_step": 285208, "epoch": 2357} {"train_loss": -40.066619873046875, "global_step": 285209, "epoch": 2357} {"train_loss": -40.53081130981445, "global_step": 285210, "epoch": 2357} {"train_loss": -40.24990463256836, "global_step": 285211, "epoch": 2357} {"train_loss": -38.97664260864258, "global_step": 285212, "epoch": 2357} {"train_loss": -41.04471206665039, "global_step": 285213, "epoch": 2357} {"train_loss": -42.07707214355469, "global_step": 285214, "epoch": 2357} {"train_loss": -41.496559143066406, "global_step": 285215, "epoch": 2357} {"train_loss": -39.76594924926758, "global_step": 285216, "epoch": 2357} {"train_loss": -40.9434928894043, "global_step": 285217, "epoch": 2357} {"train_loss": -41.126991271972656, "global_step": 285218, "epoch": 2357} {"train_loss": -41.45939254760742, "global_step": 285219, "epoch": 2357} {"train_loss": -41.83783721923828, "global_step": 285220, "epoch": 2357} {"train_loss": -40.78728485107422, "global_step": 285221, "epoch": 2357} {"train_loss": -41.33989715576172, "global_step": 285222, "epoch": 2357} {"train_loss": -41.34521484375, "global_step": 285223, "epoch": 2357} {"train_loss": -42.05275344848633, "global_step": 285224, "epoch": 2357} {"train_loss": -41.7584228515625, "global_step": 285225, "epoch": 2357} {"train_loss": -41.68560028076172, "global_step": 285226, "epoch": 2357} {"train_loss": -41.97004318237305, "global_step": 285227, "epoch": 2357} {"train_loss": -41.90693283081055, "global_step": 285228, "epoch": 2357} {"train_loss": -41.14787673950195, "global_step": 285229, "epoch": 2357} {"train_loss": -41.90305709838867, "global_step": 285230, "epoch": 2357} {"train_loss": -41.98011016845703, "global_step": 285231, "epoch": 2357} {"train_loss": -41.27614974975586, "global_step": 285232, "epoch": 2357} {"train_loss": -40.449256896972656, "global_step": 285233, "epoch": 2357} {"train_loss": -41.87580108642578, "global_step": 285234, "epoch": 2357} {"train_loss": -41.50517654418945, "global_step": 285235, "epoch": 2357} {"train_loss": -41.54282760620117, "global_step": 285236, "epoch": 2357} {"train_loss": -41.708404541015625, "global_step": 285237, "epoch": 2357} {"train_loss": -41.52356719970703, "global_step": 285238, "epoch": 2357} {"train_loss": -41.93006134033203, "global_step": 285239, "epoch": 2357} {"train_loss": -42.191009521484375, "global_step": 285240, "epoch": 2357} {"train_loss": -42.102779388427734, "global_step": 285241, "epoch": 2357} {"train_loss": -42.554237365722656, "global_step": 285242, "epoch": 2357} {"train_loss": -42.17670822143555, "global_step": 285243, "epoch": 2357} {"train_loss": -42.28188705444336, "global_step": 285244, "epoch": 2357} {"train_loss": -42.3615837097168, "global_step": 285245, "epoch": 2357} {"train_loss": -41.85014343261719, "global_step": 285246, "epoch": 2357} {"train_loss": -39.609375, "global_step": 285247, "epoch": 2357} {"train_loss": -39.6535530090332, "global_step": 285248, "epoch": 2357} {"train_loss": -41.50812911987305, "global_step": 285249, "epoch": 2357} {"train_loss": -40.996761322021484, "global_step": 285250, "epoch": 2357} {"train_loss": -40.95942306518555, "global_step": 285251, "epoch": 2357} {"train_loss": -40.620906829833984, "global_step": 285252, "epoch": 2357} {"train_loss": -40.8447380065918, "global_step": 285253, "epoch": 2357} {"train_loss": -40.66701126098633, "global_step": 285254, "epoch": 2357} {"train_loss": -38.86483383178711, "global_step": 285255, "epoch": 2357} {"train_loss": -40.13785934448242, "global_step": 285256, "epoch": 2357} {"train_loss": -41.46281814575195, "global_step": 285257, "epoch": 2357} {"train_loss": -36.87831497192383, "global_step": 285258, "epoch": 2357} {"train_loss": -37.72410202026367, "global_step": 285259, "epoch": 2357} {"train_loss": -41.08587646484375, "global_step": 285260, "epoch": 2357} {"train_loss": -38.583251953125, "global_step": 285261, "epoch": 2357} {"train_loss": -41.09140396118164, "global_step": 285262, "epoch": 2357} {"train_loss": -38.09499740600586, "global_step": 285263, "epoch": 2357} {"train_loss": -40.88397979736328, "global_step": 285264, "epoch": 2357} {"train_loss": -40.550437927246094, "global_step": 285265, "epoch": 2357} {"train_loss": -40.246360778808594, "global_step": 285266, "epoch": 2357} {"train_loss": -41.544464111328125, "global_step": 285267, "epoch": 2357} {"train_loss": -39.527278900146484, "global_step": 285268, "epoch": 2357} {"train_loss": -41.981536865234375, "global_step": 285269, "epoch": 2357} {"train_loss": -40.74846267700195, "global_step": 285270, "epoch": 2357} {"train_loss": -40.001644134521484, "global_step": 285271, "epoch": 2357} {"train_loss": -39.62971496582031, "global_step": 285272, "epoch": 2357} {"train_loss": -42.15045928955078, "global_step": 285273, "epoch": 2357} {"train_loss": -39.83660125732422, "global_step": 285274, "epoch": 2357} {"train_loss": -41.409053802490234, "global_step": 285275, "epoch": 2357} {"train_loss": -41.72623825073242, "global_step": 285276, "epoch": 2357} {"train_loss": -40.611602783203125, "global_step": 285277, "epoch": 2357} {"train_loss": -41.612606048583984, "global_step": 285278, "epoch": 2357} {"train_loss": -41.123260498046875, "global_step": 285279, "epoch": 2357} {"train_loss": -40.879268646240234, "global_step": 285280, "epoch": 2357} {"train_loss": -42.14809799194336, "global_step": 285281, "epoch": 2357} {"train_loss": -40.660194396972656, "global_step": 285282, "epoch": 2357} {"train_loss": -41.697689056396484, "global_step": 285283, "epoch": 2357} {"train_loss": -41.463172912597656, "global_step": 285284, "epoch": 2357} {"train_loss": -41.68235778808594, "global_step": 285285, "epoch": 2357} {"train_loss": -42.215484619140625, "global_step": 285286, "epoch": 2357} {"train_loss": -41.58027648925781, "global_step": 285287, "epoch": 2357} {"train_loss": -40.983951568603516, "global_step": 285288, "epoch": 2357} {"train_loss": -41.97475814819336, "global_step": 285289, "epoch": 2357} {"train_loss": -41.67026901245117, "global_step": 285290, "epoch": 2357} {"train_loss": -42.12287521362305, "global_step": 285291, "epoch": 2357} {"train_loss": -41.54956817626953, "global_step": 285292, "epoch": 2357} {"train_loss": -41.498775482177734, "global_step": 285293, "epoch": 2357} {"train_loss": -42.0208625793457, "global_step": 285294, "epoch": 2357} {"train_loss": -41.223297119140625, "global_step": 285295, "epoch": 2357} {"train_loss": -41.613311767578125, "global_step": 285296, "epoch": 2357} {"train_loss": -41.544471740722656, "global_step": 285297, "epoch": 2357} {"train_loss": -42.04049301147461, "global_step": 285298, "epoch": 2357} {"train_loss": -41.32341384887695, "global_step": 285299, "epoch": 2357} {"train_loss": -41.41761016845703, "global_step": 285300, "epoch": 2357} {"train_loss": -41.76375961303711, "global_step": 285301, "epoch": 2357} {"train_loss": -41.05086898803711, "global_step": 285302, "epoch": 2357} {"train_loss": -41.32697296142578, "global_step": 285303, "epoch": 2357} {"train_loss": -41.64199447631836, "global_step": 285304, "epoch": 2357} {"train_loss": -41.27079772949219, "global_step": 285305, "epoch": 2357} {"train_loss": -42.288265228271484, "global_step": 285306, "epoch": 2357} {"train_loss": -42.27552032470703, "global_step": 285307, "epoch": 2357} {"train_loss": -40.85591506958008, "global_step": 285308, "epoch": 2357} {"train_loss": -41.69196319580078, "global_step": 285309, "epoch": 2357} {"train_loss": -40.37876892089844, "global_step": 285310, "epoch": 2357} {"train_loss": -41.39458084106445, "global_step": 285311, "epoch": 2357} {"train_loss": -41.77588653564453, "global_step": 285312, "epoch": 2357} {"train_loss": -40.65102767944336, "global_step": 285313, "epoch": 2357} {"train_loss": -37.17460250854492, "global_step": 285314, "epoch": 2357} {"train_loss": -38.663272857666016, "global_step": 285315, "epoch": 2357} {"train_loss": -41.707298278808594, "global_step": 285316, "epoch": 2357} {"train_loss": -41.12720212069425, "global_step": 285317, "epoch": 2357, "val_loss": 2608695.25} {"train_loss": -40.883636474609375, "global_step": 285318, "epoch": 2358} {"train_loss": -41.888187408447266, "global_step": 285319, "epoch": 2358} {"train_loss": -42.63176727294922, "global_step": 285320, "epoch": 2358} {"train_loss": -41.66488265991211, "global_step": 285321, "epoch": 2358} {"train_loss": -41.94997787475586, "global_step": 285322, "epoch": 2358} {"train_loss": -42.537757873535156, "global_step": 285323, "epoch": 2358} {"train_loss": -42.18446350097656, "global_step": 285324, "epoch": 2358} {"train_loss": -42.36090087890625, "global_step": 285325, "epoch": 2358} {"train_loss": -42.151885986328125, "global_step": 285326, "epoch": 2358} {"train_loss": -41.3787727355957, "global_step": 285327, "epoch": 2358} {"train_loss": -41.69431686401367, "global_step": 285328, "epoch": 2358} {"train_loss": -41.785701751708984, "global_step": 285329, "epoch": 2358} {"train_loss": -42.230587005615234, "global_step": 285330, "epoch": 2358} {"train_loss": -42.38508987426758, "global_step": 285331, "epoch": 2358} {"train_loss": -42.615875244140625, "global_step": 285332, "epoch": 2358} {"train_loss": -42.309608459472656, "global_step": 285333, "epoch": 2358} {"train_loss": -42.343624114990234, "global_step": 285334, "epoch": 2358} {"train_loss": -42.7547721862793, "global_step": 285335, "epoch": 2358} {"train_loss": -42.29460144042969, "global_step": 285336, "epoch": 2358} {"train_loss": -42.735984802246094, "global_step": 285337, "epoch": 2358} {"train_loss": -42.47447204589844, "global_step": 285338, "epoch": 2358} {"train_loss": -41.49992370605469, "global_step": 285339, "epoch": 2358} {"train_loss": -42.441097259521484, "global_step": 285340, "epoch": 2358} {"train_loss": -42.04338455200195, "global_step": 285341, "epoch": 2358} {"train_loss": -42.75778579711914, "global_step": 285342, "epoch": 2358} {"train_loss": -42.51194381713867, "global_step": 285343, "epoch": 2358} {"train_loss": -42.694210052490234, "global_step": 285344, "epoch": 2358} {"train_loss": -42.5738639831543, "global_step": 285345, "epoch": 2358} {"train_loss": -43.18555450439453, "global_step": 285346, "epoch": 2358} {"train_loss": -42.56592559814453, "global_step": 285347, "epoch": 2358} {"train_loss": -43.25555419921875, "global_step": 285348, "epoch": 2358} {"train_loss": -42.578670501708984, "global_step": 285349, "epoch": 2358} {"train_loss": -43.054054260253906, "global_step": 285350, "epoch": 2358} {"train_loss": -42.7768669128418, "global_step": 285351, "epoch": 2358} {"train_loss": -42.56232833862305, "global_step": 285352, "epoch": 2358} {"train_loss": -42.65647506713867, "global_step": 285353, "epoch": 2358} {"train_loss": -43.01862716674805, "global_step": 285354, "epoch": 2358} {"train_loss": -43.08481979370117, "global_step": 285355, "epoch": 2358} {"train_loss": -42.96059799194336, "global_step": 285356, "epoch": 2358} {"train_loss": -42.79296875, "global_step": 285357, "epoch": 2358} {"train_loss": -42.30534744262695, "global_step": 285358, "epoch": 2358} {"train_loss": -42.22060775756836, "global_step": 285359, "epoch": 2358} {"train_loss": -42.7674674987793, "global_step": 285360, "epoch": 2358} {"train_loss": -42.03030014038086, "global_step": 285361, "epoch": 2358} {"train_loss": -42.050655364990234, "global_step": 285362, "epoch": 2358} {"train_loss": -42.81155014038086, "global_step": 285363, "epoch": 2358} {"train_loss": -43.416568756103516, "global_step": 285364, "epoch": 2358} {"train_loss": -42.75307846069336, "global_step": 285365, "epoch": 2358} {"train_loss": -42.46085739135742, "global_step": 285366, "epoch": 2358} {"train_loss": -42.563106536865234, "global_step": 285367, "epoch": 2358} {"train_loss": -42.00285720825195, "global_step": 285368, "epoch": 2358} {"train_loss": -42.564754486083984, "global_step": 285369, "epoch": 2358} {"train_loss": -42.64374923706055, "global_step": 285370, "epoch": 2358} {"train_loss": -43.53214645385742, "global_step": 285371, "epoch": 2358} {"train_loss": -41.892879486083984, "global_step": 285372, "epoch": 2358} {"train_loss": -43.55329513549805, "global_step": 285373, "epoch": 2358} {"train_loss": -43.270023345947266, "global_step": 285374, "epoch": 2358} {"train_loss": -42.956233978271484, "global_step": 285375, "epoch": 2358} {"train_loss": -43.9567985534668, "global_step": 285376, "epoch": 2358} {"train_loss": -43.506954193115234, "global_step": 285377, "epoch": 2358} {"train_loss": -43.12589645385742, "global_step": 285378, "epoch": 2358} {"train_loss": -42.2574462890625, "global_step": 285379, "epoch": 2358} {"train_loss": -43.56280517578125, "global_step": 285380, "epoch": 2358} {"train_loss": -42.83687210083008, "global_step": 285381, "epoch": 2358} {"train_loss": -42.31033706665039, "global_step": 285382, "epoch": 2358} {"train_loss": -43.029052734375, "global_step": 285383, "epoch": 2358} {"train_loss": -42.85148239135742, "global_step": 285384, "epoch": 2358} {"train_loss": -41.816688537597656, "global_step": 285385, "epoch": 2358} {"train_loss": -42.777366638183594, "global_step": 285386, "epoch": 2358} {"train_loss": -42.50602340698242, "global_step": 285387, "epoch": 2358} {"train_loss": -43.21613693237305, "global_step": 285388, "epoch": 2358} {"train_loss": -43.147621154785156, "global_step": 285389, "epoch": 2358} {"train_loss": -42.993343353271484, "global_step": 285390, "epoch": 2358} {"train_loss": -41.51987838745117, "global_step": 285391, "epoch": 2358} {"train_loss": -41.43254089355469, "global_step": 285392, "epoch": 2358} {"train_loss": -42.13936996459961, "global_step": 285393, "epoch": 2358} {"train_loss": -42.4289665222168, "global_step": 285394, "epoch": 2358} {"train_loss": -42.69438552856445, "global_step": 285395, "epoch": 2358} {"train_loss": -41.45121383666992, "global_step": 285396, "epoch": 2358} {"train_loss": -40.304847717285156, "global_step": 285397, "epoch": 2358} {"train_loss": -42.26840591430664, "global_step": 285398, "epoch": 2358} {"train_loss": -42.77537155151367, "global_step": 285399, "epoch": 2358} {"train_loss": -40.704078674316406, "global_step": 285400, "epoch": 2358} {"train_loss": -39.76179122924805, "global_step": 285401, "epoch": 2358} {"train_loss": -42.16987228393555, "global_step": 285402, "epoch": 2358} {"train_loss": -42.538482666015625, "global_step": 285403, "epoch": 2358} {"train_loss": -39.973873138427734, "global_step": 285404, "epoch": 2358} {"train_loss": -35.013282775878906, "global_step": 285405, "epoch": 2358} {"train_loss": -37.18374252319336, "global_step": 285406, "epoch": 2358} {"train_loss": -41.70574188232422, "global_step": 285407, "epoch": 2358} {"train_loss": -38.64668655395508, "global_step": 285408, "epoch": 2358} {"train_loss": -35.44132614135742, "global_step": 285409, "epoch": 2358} {"train_loss": -42.266822814941406, "global_step": 285410, "epoch": 2358} {"train_loss": -39.39101791381836, "global_step": 285411, "epoch": 2358} {"train_loss": -40.51234817504883, "global_step": 285412, "epoch": 2358} {"train_loss": -41.84820556640625, "global_step": 285413, "epoch": 2358} {"train_loss": -40.961769104003906, "global_step": 285414, "epoch": 2358} {"train_loss": -42.136810302734375, "global_step": 285415, "epoch": 2358} {"train_loss": -39.81241989135742, "global_step": 285416, "epoch": 2358} {"train_loss": -41.881187438964844, "global_step": 285417, "epoch": 2358} {"train_loss": -40.66415786743164, "global_step": 285418, "epoch": 2358} {"train_loss": -40.8475341796875, "global_step": 285419, "epoch": 2358} {"train_loss": -40.40193557739258, "global_step": 285420, "epoch": 2358} {"train_loss": -39.862300872802734, "global_step": 285421, "epoch": 2358} {"train_loss": -42.1643180847168, "global_step": 285422, "epoch": 2358} {"train_loss": -39.828765869140625, "global_step": 285423, "epoch": 2358} {"train_loss": -39.14976119995117, "global_step": 285424, "epoch": 2358} {"train_loss": -38.233638763427734, "global_step": 285425, "epoch": 2358} {"train_loss": -42.25570297241211, "global_step": 285426, "epoch": 2358} {"train_loss": -41.21870803833008, "global_step": 285427, "epoch": 2358} {"train_loss": -42.1900634765625, "global_step": 285428, "epoch": 2358} {"train_loss": -42.00253677368164, "global_step": 285429, "epoch": 2358} {"train_loss": -41.0710563659668, "global_step": 285430, "epoch": 2358} {"train_loss": -42.08590316772461, "global_step": 285431, "epoch": 2358} {"train_loss": -42.2297477722168, "global_step": 285432, "epoch": 2358} {"train_loss": -42.40926742553711, "global_step": 285433, "epoch": 2358} {"train_loss": -41.32533645629883, "global_step": 285434, "epoch": 2358} {"train_loss": -41.74115753173828, "global_step": 285435, "epoch": 2358} {"train_loss": -43.02227783203125, "global_step": 285436, "epoch": 2358} {"train_loss": -41.37086486816406, "global_step": 285437, "epoch": 2358} {"train_loss": -41.92208272760565, "global_step": 285438, "epoch": 2358, "val_loss": 2441637.25} {"train_loss": -42.52161407470703, "global_step": 285439, "epoch": 2359} {"train_loss": -41.71952438354492, "global_step": 285440, "epoch": 2359} {"train_loss": -42.29998016357422, "global_step": 285441, "epoch": 2359} {"train_loss": -42.90926742553711, "global_step": 285442, "epoch": 2359} {"train_loss": -42.57450485229492, "global_step": 285443, "epoch": 2359} {"train_loss": -43.319915771484375, "global_step": 285444, "epoch": 2359} {"train_loss": -43.02539825439453, "global_step": 285445, "epoch": 2359} {"train_loss": -43.3326530456543, "global_step": 285446, "epoch": 2359} {"train_loss": -43.249568939208984, "global_step": 285447, "epoch": 2359} {"train_loss": -42.05730056762695, "global_step": 285448, "epoch": 2359} {"train_loss": -42.80531692504883, "global_step": 285449, "epoch": 2359} {"train_loss": -42.90913772583008, "global_step": 285450, "epoch": 2359} {"train_loss": -43.07932662963867, "global_step": 285451, "epoch": 2359} {"train_loss": -42.62196731567383, "global_step": 285452, "epoch": 2359} {"train_loss": -41.528656005859375, "global_step": 285453, "epoch": 2359} {"train_loss": -42.957244873046875, "global_step": 285454, "epoch": 2359} {"train_loss": -42.712398529052734, "global_step": 285455, "epoch": 2359} {"train_loss": -42.99441146850586, "global_step": 285456, "epoch": 2359} {"train_loss": -43.15966033935547, "global_step": 285457, "epoch": 2359} {"train_loss": -42.913787841796875, "global_step": 285458, "epoch": 2359} {"train_loss": -42.782283782958984, "global_step": 285459, "epoch": 2359} {"train_loss": -43.140045166015625, "global_step": 285460, "epoch": 2359} {"train_loss": -42.478878021240234, "global_step": 285461, "epoch": 2359} {"train_loss": -42.83644104003906, "global_step": 285462, "epoch": 2359} {"train_loss": -43.20234298706055, "global_step": 285463, "epoch": 2359} {"train_loss": -43.4404411315918, "global_step": 285464, "epoch": 2359} {"train_loss": -42.937686920166016, "global_step": 285465, "epoch": 2359} {"train_loss": -43.82143020629883, "global_step": 285466, "epoch": 2359} {"train_loss": -42.833492279052734, "global_step": 285467, "epoch": 2359} {"train_loss": -42.465511322021484, "global_step": 285468, "epoch": 2359} {"train_loss": -41.969295501708984, "global_step": 285469, "epoch": 2359} {"train_loss": -41.76212692260742, "global_step": 285470, "epoch": 2359} {"train_loss": -41.2923698425293, "global_step": 285471, "epoch": 2359} {"train_loss": -41.7426872253418, "global_step": 285472, "epoch": 2359} {"train_loss": -41.710350036621094, "global_step": 285473, "epoch": 2359} {"train_loss": -41.241973876953125, "global_step": 285474, "epoch": 2359} {"train_loss": -40.85963439941406, "global_step": 285475, "epoch": 2359} {"train_loss": -39.023681640625, "global_step": 285476, "epoch": 2359} {"train_loss": -37.85075759887695, "global_step": 285477, "epoch": 2359} {"train_loss": -38.138343811035156, "global_step": 285478, "epoch": 2359} {"train_loss": -42.00856018066406, "global_step": 285479, "epoch": 2359} {"train_loss": -40.86792755126953, "global_step": 285480, "epoch": 2359} {"train_loss": -39.99119186401367, "global_step": 285481, "epoch": 2359} {"train_loss": -41.2222785949707, "global_step": 285482, "epoch": 2359} {"train_loss": -41.785091400146484, "global_step": 285483, "epoch": 2359} {"train_loss": -40.64412307739258, "global_step": 285484, "epoch": 2359} {"train_loss": -42.2525520324707, "global_step": 285485, "epoch": 2359} {"train_loss": -41.16886520385742, "global_step": 285486, "epoch": 2359} {"train_loss": -40.81086349487305, "global_step": 285487, "epoch": 2359} {"train_loss": -41.481693267822266, "global_step": 285488, "epoch": 2359} {"train_loss": -42.508792877197266, "global_step": 285489, "epoch": 2359} {"train_loss": -41.03205490112305, "global_step": 285490, "epoch": 2359} {"train_loss": -42.46404266357422, "global_step": 285491, "epoch": 2359} {"train_loss": -41.887088775634766, "global_step": 285492, "epoch": 2359} {"train_loss": -42.16822052001953, "global_step": 285493, "epoch": 2359} {"train_loss": -42.526912689208984, "global_step": 285494, "epoch": 2359} {"train_loss": -41.820037841796875, "global_step": 285495, "epoch": 2359} {"train_loss": -41.59237289428711, "global_step": 285496, "epoch": 2359} {"train_loss": -41.96208572387695, "global_step": 285497, "epoch": 2359} {"train_loss": -42.75498580932617, "global_step": 285498, "epoch": 2359} {"train_loss": -41.801883697509766, "global_step": 285499, "epoch": 2359} {"train_loss": -42.09544372558594, "global_step": 285500, "epoch": 2359} {"train_loss": -42.225196838378906, "global_step": 285501, "epoch": 2359} {"train_loss": -42.035499572753906, "global_step": 285502, "epoch": 2359} {"train_loss": -42.12514877319336, "global_step": 285503, "epoch": 2359} {"train_loss": -43.25043487548828, "global_step": 285504, "epoch": 2359} {"train_loss": -42.992095947265625, "global_step": 285505, "epoch": 2359} {"train_loss": -42.21176528930664, "global_step": 285506, "epoch": 2359} {"train_loss": -42.79541015625, "global_step": 285507, "epoch": 2359} {"train_loss": -43.0384521484375, "global_step": 285508, "epoch": 2359} {"train_loss": -41.502105712890625, "global_step": 285509, "epoch": 2359} {"train_loss": -43.26959228515625, "global_step": 285510, "epoch": 2359} {"train_loss": -43.32888412475586, "global_step": 285511, "epoch": 2359} {"train_loss": -42.56203079223633, "global_step": 285512, "epoch": 2359} {"train_loss": -43.18966293334961, "global_step": 285513, "epoch": 2359} {"train_loss": -42.697940826416016, "global_step": 285514, "epoch": 2359} {"train_loss": -42.5689582824707, "global_step": 285515, "epoch": 2359} {"train_loss": -43.03211212158203, "global_step": 285516, "epoch": 2359} {"train_loss": -42.7235221862793, "global_step": 285517, "epoch": 2359} {"train_loss": -43.25065994262695, "global_step": 285518, "epoch": 2359} {"train_loss": -43.149078369140625, "global_step": 285519, "epoch": 2359} {"train_loss": -43.0999870300293, "global_step": 285520, "epoch": 2359} {"train_loss": -43.35809326171875, "global_step": 285521, "epoch": 2359} {"train_loss": -42.92448806762695, "global_step": 285522, "epoch": 2359} {"train_loss": -43.22713088989258, "global_step": 285523, "epoch": 2359} {"train_loss": -43.55001449584961, "global_step": 285524, "epoch": 2359} {"train_loss": -41.51394271850586, "global_step": 285525, "epoch": 2359} {"train_loss": -43.09859085083008, "global_step": 285526, "epoch": 2359} {"train_loss": -43.324798583984375, "global_step": 285527, "epoch": 2359} {"train_loss": -43.13529968261719, "global_step": 285528, "epoch": 2359} {"train_loss": -39.51552963256836, "global_step": 285529, "epoch": 2359} {"train_loss": -43.14909362792969, "global_step": 285530, "epoch": 2359} {"train_loss": -37.93451690673828, "global_step": 285531, "epoch": 2359} {"train_loss": -43.31766891479492, "global_step": 285532, "epoch": 2359} {"train_loss": -36.3906135559082, "global_step": 285533, "epoch": 2359} {"train_loss": -43.1871223449707, "global_step": 285534, "epoch": 2359} {"train_loss": -43.55322265625, "global_step": 285535, "epoch": 2359} {"train_loss": -43.0019645690918, "global_step": 285536, "epoch": 2359} {"train_loss": -43.150699615478516, "global_step": 285537, "epoch": 2359} {"train_loss": -40.06546401977539, "global_step": 285538, "epoch": 2359} {"train_loss": -43.03672409057617, "global_step": 285539, "epoch": 2359} {"train_loss": -42.42325973510742, "global_step": 285540, "epoch": 2359} {"train_loss": -42.3433837890625, "global_step": 285541, "epoch": 2359} {"train_loss": -42.885101318359375, "global_step": 285542, "epoch": 2359} {"train_loss": -40.8575553894043, "global_step": 285543, "epoch": 2359} {"train_loss": -41.336509704589844, "global_step": 285544, "epoch": 2359} {"train_loss": -42.589385986328125, "global_step": 285545, "epoch": 2359} {"train_loss": -42.67127227783203, "global_step": 285546, "epoch": 2359} {"train_loss": -41.81905746459961, "global_step": 285547, "epoch": 2359} {"train_loss": -35.0019416809082, "global_step": 285548, "epoch": 2359} {"train_loss": -39.93352508544922, "global_step": 285549, "epoch": 2359} {"train_loss": -41.19465255737305, "global_step": 285550, "epoch": 2359} {"train_loss": -42.03668212890625, "global_step": 285551, "epoch": 2359} {"train_loss": -39.48537826538086, "global_step": 285552, "epoch": 2359} {"train_loss": -41.0611686706543, "global_step": 285553, "epoch": 2359} {"train_loss": -41.61210250854492, "global_step": 285554, "epoch": 2359} {"train_loss": -40.959197998046875, "global_step": 285555, "epoch": 2359} {"train_loss": -39.325103759765625, "global_step": 285556, "epoch": 2359} {"train_loss": -42.44901657104492, "global_step": 285557, "epoch": 2359} {"train_loss": -41.82603454589844, "global_step": 285558, "epoch": 2359} {"train_loss": -42.025964910333805, "global_step": 285559, "epoch": 2359, "val_loss": 2606293.75} {"train_loss": -41.83317565917969, "global_step": 285560, "epoch": 2360} {"train_loss": -39.6146354675293, "global_step": 285561, "epoch": 2360} {"train_loss": -42.18758773803711, "global_step": 285562, "epoch": 2360} {"train_loss": -40.489463806152344, "global_step": 285563, "epoch": 2360} {"train_loss": -41.338653564453125, "global_step": 285564, "epoch": 2360} {"train_loss": -40.83875274658203, "global_step": 285565, "epoch": 2360} {"train_loss": -42.3492431640625, "global_step": 285566, "epoch": 2360} {"train_loss": -40.611263275146484, "global_step": 285567, "epoch": 2360} {"train_loss": -41.9579963684082, "global_step": 285568, "epoch": 2360} {"train_loss": -40.40154266357422, "global_step": 285569, "epoch": 2360} {"train_loss": -38.72542953491211, "global_step": 285570, "epoch": 2360} {"train_loss": -42.09908676147461, "global_step": 285571, "epoch": 2360} {"train_loss": -41.07282638549805, "global_step": 285572, "epoch": 2360} {"train_loss": -39.34138107299805, "global_step": 285573, "epoch": 2360} {"train_loss": -40.96681213378906, "global_step": 285574, "epoch": 2360} {"train_loss": -42.78849792480469, "global_step": 285575, "epoch": 2360} {"train_loss": -41.529296875, "global_step": 285576, "epoch": 2360} {"train_loss": -41.98689651489258, "global_step": 285577, "epoch": 2360} {"train_loss": -42.08991241455078, "global_step": 285578, "epoch": 2360} {"train_loss": -41.7463493347168, "global_step": 285579, "epoch": 2360} {"train_loss": -42.50181198120117, "global_step": 285580, "epoch": 2360} {"train_loss": -41.2697639465332, "global_step": 285581, "epoch": 2360} {"train_loss": -40.07340621948242, "global_step": 285582, "epoch": 2360} {"train_loss": -40.98230743408203, "global_step": 285583, "epoch": 2360} {"train_loss": -40.554012298583984, "global_step": 285584, "epoch": 2360} {"train_loss": -41.79572677612305, "global_step": 285585, "epoch": 2360} {"train_loss": -39.9932746887207, "global_step": 285586, "epoch": 2360} {"train_loss": -42.22576904296875, "global_step": 285587, "epoch": 2360} {"train_loss": -41.62422561645508, "global_step": 285588, "epoch": 2360} {"train_loss": -40.105831146240234, "global_step": 285589, "epoch": 2360} {"train_loss": -41.88813781738281, "global_step": 285590, "epoch": 2360} {"train_loss": -42.32527542114258, "global_step": 285591, "epoch": 2360} {"train_loss": -40.07932662963867, "global_step": 285592, "epoch": 2360} {"train_loss": -42.13067626953125, "global_step": 285593, "epoch": 2360} {"train_loss": -42.1156005859375, "global_step": 285594, "epoch": 2360} {"train_loss": -39.82948303222656, "global_step": 285595, "epoch": 2360} {"train_loss": -39.66563415527344, "global_step": 285596, "epoch": 2360} {"train_loss": -41.38785934448242, "global_step": 285597, "epoch": 2360} {"train_loss": -39.56423568725586, "global_step": 285598, "epoch": 2360} {"train_loss": -42.07011795043945, "global_step": 285599, "epoch": 2360} {"train_loss": -41.92019271850586, "global_step": 285600, "epoch": 2360} {"train_loss": -40.92619705200195, "global_step": 285601, "epoch": 2360} {"train_loss": -42.130733489990234, "global_step": 285602, "epoch": 2360} {"train_loss": -40.705074310302734, "global_step": 285603, "epoch": 2360} {"train_loss": -42.317256927490234, "global_step": 285604, "epoch": 2360} {"train_loss": -41.29593276977539, "global_step": 285605, "epoch": 2360} {"train_loss": -41.35382080078125, "global_step": 285606, "epoch": 2360} {"train_loss": -40.911190032958984, "global_step": 285607, "epoch": 2360} {"train_loss": -38.80186080932617, "global_step": 285608, "epoch": 2360} {"train_loss": -40.81582260131836, "global_step": 285609, "epoch": 2360} {"train_loss": -39.86240768432617, "global_step": 285610, "epoch": 2360} {"train_loss": -40.43123245239258, "global_step": 285611, "epoch": 2360} {"train_loss": -41.81565856933594, "global_step": 285612, "epoch": 2360} {"train_loss": -36.032596588134766, "global_step": 285613, "epoch": 2360} {"train_loss": -39.0539436340332, "global_step": 285614, "epoch": 2360} {"train_loss": -41.148067474365234, "global_step": 285615, "epoch": 2360} {"train_loss": -40.28232955932617, "global_step": 285616, "epoch": 2360} {"train_loss": -40.37185287475586, "global_step": 285617, "epoch": 2360} {"train_loss": -35.065574645996094, "global_step": 285618, "epoch": 2360} {"train_loss": -39.2283935546875, "global_step": 285619, "epoch": 2360} {"train_loss": -39.80221939086914, "global_step": 285620, "epoch": 2360} {"train_loss": -35.56446075439453, "global_step": 285621, "epoch": 2360} {"train_loss": -38.896644592285156, "global_step": 285622, "epoch": 2360} {"train_loss": -40.36311721801758, "global_step": 285623, "epoch": 2360} {"train_loss": -38.4823112487793, "global_step": 285624, "epoch": 2360} {"train_loss": -34.22929763793945, "global_step": 285625, "epoch": 2360} {"train_loss": -40.04250717163086, "global_step": 285626, "epoch": 2360} {"train_loss": -36.763946533203125, "global_step": 285627, "epoch": 2360} {"train_loss": -39.5178108215332, "global_step": 285628, "epoch": 2360} {"train_loss": -35.98212432861328, "global_step": 285629, "epoch": 2360} {"train_loss": -40.222721099853516, "global_step": 285630, "epoch": 2360} {"train_loss": -39.097496032714844, "global_step": 285631, "epoch": 2360} {"train_loss": -38.752037048339844, "global_step": 285632, "epoch": 2360} {"train_loss": -36.53105163574219, "global_step": 285633, "epoch": 2360} {"train_loss": -38.90740966796875, "global_step": 285634, "epoch": 2360} {"train_loss": -37.32218551635742, "global_step": 285635, "epoch": 2360} {"train_loss": -38.85636520385742, "global_step": 285636, "epoch": 2360} {"train_loss": -36.61709213256836, "global_step": 285637, "epoch": 2360} {"train_loss": -39.65211868286133, "global_step": 285638, "epoch": 2360} {"train_loss": -39.86749267578125, "global_step": 285639, "epoch": 2360} {"train_loss": -39.584835052490234, "global_step": 285640, "epoch": 2360} {"train_loss": -39.23614501953125, "global_step": 285641, "epoch": 2360} {"train_loss": -38.97370147705078, "global_step": 285642, "epoch": 2360} {"train_loss": -39.561309814453125, "global_step": 285643, "epoch": 2360} {"train_loss": -39.22336959838867, "global_step": 285644, "epoch": 2360} {"train_loss": -39.34814453125, "global_step": 285645, "epoch": 2360} {"train_loss": -40.7457160949707, "global_step": 285646, "epoch": 2360} {"train_loss": -39.83417892456055, "global_step": 285647, "epoch": 2360} {"train_loss": -40.086097717285156, "global_step": 285648, "epoch": 2360} {"train_loss": -40.25397872924805, "global_step": 285649, "epoch": 2360} {"train_loss": -40.989593505859375, "global_step": 285650, "epoch": 2360} {"train_loss": -41.195674896240234, "global_step": 285651, "epoch": 2360} {"train_loss": -41.123409271240234, "global_step": 285652, "epoch": 2360} {"train_loss": -39.358497619628906, "global_step": 285653, "epoch": 2360} {"train_loss": -40.97407150268555, "global_step": 285654, "epoch": 2360} {"train_loss": -35.838191986083984, "global_step": 285655, "epoch": 2360} {"train_loss": -39.838409423828125, "global_step": 285656, "epoch": 2360} {"train_loss": -41.46738815307617, "global_step": 285657, "epoch": 2360} {"train_loss": -40.7320671081543, "global_step": 285658, "epoch": 2360} {"train_loss": -39.31483459472656, "global_step": 285659, "epoch": 2360} {"train_loss": -39.82530212402344, "global_step": 285660, "epoch": 2360} {"train_loss": -41.14593505859375, "global_step": 285661, "epoch": 2360} {"train_loss": -41.7783088684082, "global_step": 285662, "epoch": 2360} {"train_loss": -40.74433517456055, "global_step": 285663, "epoch": 2360} {"train_loss": -40.58272933959961, "global_step": 285664, "epoch": 2360} {"train_loss": -37.88508987426758, "global_step": 285665, "epoch": 2360} {"train_loss": -39.28269577026367, "global_step": 285666, "epoch": 2360} {"train_loss": -39.996070861816406, "global_step": 285667, "epoch": 2360} {"train_loss": -40.49739456176758, "global_step": 285668, "epoch": 2360} {"train_loss": -40.245296478271484, "global_step": 285669, "epoch": 2360} {"train_loss": -39.306983947753906, "global_step": 285670, "epoch": 2360} {"train_loss": -41.02601623535156, "global_step": 285671, "epoch": 2360} {"train_loss": -40.40642547607422, "global_step": 285672, "epoch": 2360} {"train_loss": -41.1182746887207, "global_step": 285673, "epoch": 2360} {"train_loss": -40.264556884765625, "global_step": 285674, "epoch": 2360} {"train_loss": -40.98356246948242, "global_step": 285675, "epoch": 2360} {"train_loss": -41.108924865722656, "global_step": 285676, "epoch": 2360} {"train_loss": -40.707672119140625, "global_step": 285677, "epoch": 2360} {"train_loss": -41.596378326416016, "global_step": 285678, "epoch": 2360} {"train_loss": -41.65426254272461, "global_step": 285679, "epoch": 2360} {"train_loss": -40.21163458075405, "global_step": 285680, "epoch": 2360, "val_loss": 3242843.25} {"train_loss": -38.72426986694336, "global_step": 285681, "epoch": 2361} {"train_loss": -41.68162536621094, "global_step": 285682, "epoch": 2361} {"train_loss": -38.89242172241211, "global_step": 285683, "epoch": 2361} {"train_loss": -38.82754135131836, "global_step": 285684, "epoch": 2361} {"train_loss": -40.80626678466797, "global_step": 285685, "epoch": 2361} {"train_loss": -40.74382400512695, "global_step": 285686, "epoch": 2361} {"train_loss": -40.71961212158203, "global_step": 285687, "epoch": 2361} {"train_loss": -41.536537170410156, "global_step": 285688, "epoch": 2361} {"train_loss": -40.99233627319336, "global_step": 285689, "epoch": 2361} {"train_loss": -41.193824768066406, "global_step": 285690, "epoch": 2361} {"train_loss": -39.688087463378906, "global_step": 285691, "epoch": 2361} {"train_loss": -37.7729377746582, "global_step": 285692, "epoch": 2361} {"train_loss": -39.482574462890625, "global_step": 285693, "epoch": 2361} {"train_loss": -40.310298919677734, "global_step": 285694, "epoch": 2361} {"train_loss": -40.935420989990234, "global_step": 285695, "epoch": 2361} {"train_loss": -40.40068435668945, "global_step": 285696, "epoch": 2361} {"train_loss": -38.73823928833008, "global_step": 285697, "epoch": 2361} {"train_loss": -41.36570358276367, "global_step": 285698, "epoch": 2361} {"train_loss": -41.155391693115234, "global_step": 285699, "epoch": 2361} {"train_loss": -40.61436080932617, "global_step": 285700, "epoch": 2361} {"train_loss": -41.19759750366211, "global_step": 285701, "epoch": 2361} {"train_loss": -41.40812301635742, "global_step": 285702, "epoch": 2361} {"train_loss": -41.76338577270508, "global_step": 285703, "epoch": 2361} {"train_loss": -41.2845344543457, "global_step": 285704, "epoch": 2361} {"train_loss": -40.92605209350586, "global_step": 285705, "epoch": 2361} {"train_loss": -41.20388412475586, "global_step": 285706, "epoch": 2361} {"train_loss": -40.8037223815918, "global_step": 285707, "epoch": 2361} {"train_loss": -40.87343215942383, "global_step": 285708, "epoch": 2361} {"train_loss": -39.18376159667969, "global_step": 285709, "epoch": 2361} {"train_loss": -41.46798324584961, "global_step": 285710, "epoch": 2361} {"train_loss": -42.025856018066406, "global_step": 285711, "epoch": 2361} {"train_loss": -41.26892852783203, "global_step": 285712, "epoch": 2361} {"train_loss": -40.46421432495117, "global_step": 285713, "epoch": 2361} {"train_loss": -41.45112991333008, "global_step": 285714, "epoch": 2361} {"train_loss": -40.74640655517578, "global_step": 285715, "epoch": 2361} {"train_loss": -40.924495697021484, "global_step": 285716, "epoch": 2361} {"train_loss": -42.097412109375, "global_step": 285717, "epoch": 2361} {"train_loss": -41.452850341796875, "global_step": 285718, "epoch": 2361} {"train_loss": -41.8758659362793, "global_step": 285719, "epoch": 2361} {"train_loss": -41.884002685546875, "global_step": 285720, "epoch": 2361} {"train_loss": -42.333412170410156, "global_step": 285721, "epoch": 2361} {"train_loss": -41.8613395690918, "global_step": 285722, "epoch": 2361} {"train_loss": -40.97427749633789, "global_step": 285723, "epoch": 2361} {"train_loss": -41.829288482666016, "global_step": 285724, "epoch": 2361} {"train_loss": -39.76264190673828, "global_step": 285725, "epoch": 2361} {"train_loss": -41.76999282836914, "global_step": 285726, "epoch": 2361} {"train_loss": -41.72040557861328, "global_step": 285727, "epoch": 2361} {"train_loss": -41.77143859863281, "global_step": 285728, "epoch": 2361} {"train_loss": -41.72407150268555, "global_step": 285729, "epoch": 2361} {"train_loss": -42.3891716003418, "global_step": 285730, "epoch": 2361} {"train_loss": -40.81287384033203, "global_step": 285731, "epoch": 2361} {"train_loss": -42.07439422607422, "global_step": 285732, "epoch": 2361} {"train_loss": -42.39075469970703, "global_step": 285733, "epoch": 2361} {"train_loss": -39.827266693115234, "global_step": 285734, "epoch": 2361} {"train_loss": -41.09626388549805, "global_step": 285735, "epoch": 2361} {"train_loss": -40.8443489074707, "global_step": 285736, "epoch": 2361} {"train_loss": -41.43878173828125, "global_step": 285737, "epoch": 2361} {"train_loss": -41.8510856628418, "global_step": 285738, "epoch": 2361} {"train_loss": -41.43605422973633, "global_step": 285739, "epoch": 2361} {"train_loss": -41.9912109375, "global_step": 285740, "epoch": 2361} {"train_loss": -42.39970779418945, "global_step": 285741, "epoch": 2361} {"train_loss": -41.9915657043457, "global_step": 285742, "epoch": 2361} {"train_loss": -42.334659576416016, "global_step": 285743, "epoch": 2361} {"train_loss": -42.4123649597168, "global_step": 285744, "epoch": 2361} {"train_loss": -41.81298828125, "global_step": 285745, "epoch": 2361} {"train_loss": -40.618202209472656, "global_step": 285746, "epoch": 2361} {"train_loss": -41.74177932739258, "global_step": 285747, "epoch": 2361} {"train_loss": -42.43977737426758, "global_step": 285748, "epoch": 2361} {"train_loss": -41.309654235839844, "global_step": 285749, "epoch": 2361} {"train_loss": -42.50179672241211, "global_step": 285750, "epoch": 2361} {"train_loss": -42.102657318115234, "global_step": 285751, "epoch": 2361} {"train_loss": -41.87295150756836, "global_step": 285752, "epoch": 2361} {"train_loss": -42.04116439819336, "global_step": 285753, "epoch": 2361} {"train_loss": -41.07118606567383, "global_step": 285754, "epoch": 2361} {"train_loss": -41.01607131958008, "global_step": 285755, "epoch": 2361} {"train_loss": -42.038761138916016, "global_step": 285756, "epoch": 2361} {"train_loss": -41.711421966552734, "global_step": 285757, "epoch": 2361} {"train_loss": -41.122920989990234, "global_step": 285758, "epoch": 2361} {"train_loss": -42.30845260620117, "global_step": 285759, "epoch": 2361} {"train_loss": -42.40254592895508, "global_step": 285760, "epoch": 2361} {"train_loss": -42.39765548706055, "global_step": 285761, "epoch": 2361} {"train_loss": -41.9235954284668, "global_step": 285762, "epoch": 2361} {"train_loss": -42.149940490722656, "global_step": 285763, "epoch": 2361} {"train_loss": -41.92205810546875, "global_step": 285764, "epoch": 2361} {"train_loss": -41.73493194580078, "global_step": 285765, "epoch": 2361} {"train_loss": -42.49079132080078, "global_step": 285766, "epoch": 2361} {"train_loss": -41.393409729003906, "global_step": 285767, "epoch": 2361} {"train_loss": -42.0899772644043, "global_step": 285768, "epoch": 2361} {"train_loss": -42.1660270690918, "global_step": 285769, "epoch": 2361} {"train_loss": -41.8720817565918, "global_step": 285770, "epoch": 2361} {"train_loss": -42.61214065551758, "global_step": 285771, "epoch": 2361} {"train_loss": -41.53947067260742, "global_step": 285772, "epoch": 2361} {"train_loss": -40.58531188964844, "global_step": 285773, "epoch": 2361} {"train_loss": -39.860069274902344, "global_step": 285774, "epoch": 2361} {"train_loss": -39.85070037841797, "global_step": 285775, "epoch": 2361} {"train_loss": -42.0504035949707, "global_step": 285776, "epoch": 2361} {"train_loss": -41.60905075073242, "global_step": 285777, "epoch": 2361} {"train_loss": -40.1060676574707, "global_step": 285778, "epoch": 2361} {"train_loss": -41.54536056518555, "global_step": 285779, "epoch": 2361} {"train_loss": -41.25093460083008, "global_step": 285780, "epoch": 2361} {"train_loss": -42.335365295410156, "global_step": 285781, "epoch": 2361} {"train_loss": -42.005455017089844, "global_step": 285782, "epoch": 2361} {"train_loss": -39.992557525634766, "global_step": 285783, "epoch": 2361} {"train_loss": -41.42647171020508, "global_step": 285784, "epoch": 2361} {"train_loss": -41.46708297729492, "global_step": 285785, "epoch": 2361} {"train_loss": -41.75444030761719, "global_step": 285786, "epoch": 2361} {"train_loss": -40.80427932739258, "global_step": 285787, "epoch": 2361} {"train_loss": -41.987911224365234, "global_step": 285788, "epoch": 2361} {"train_loss": -41.58557891845703, "global_step": 285789, "epoch": 2361} {"train_loss": -41.28315353393555, "global_step": 285790, "epoch": 2361} {"train_loss": -41.059608459472656, "global_step": 285791, "epoch": 2361} {"train_loss": -40.45175552368164, "global_step": 285792, "epoch": 2361} {"train_loss": -42.45634078979492, "global_step": 285793, "epoch": 2361} {"train_loss": -40.343379974365234, "global_step": 285794, "epoch": 2361} {"train_loss": -39.543601989746094, "global_step": 285795, "epoch": 2361} {"train_loss": -40.48748779296875, "global_step": 285796, "epoch": 2361} {"train_loss": -41.43876266479492, "global_step": 285797, "epoch": 2361} {"train_loss": -39.67902374267578, "global_step": 285798, "epoch": 2361} {"train_loss": -39.18351745605469, "global_step": 285799, "epoch": 2361} {"train_loss": -39.395050048828125, "global_step": 285800, "epoch": 2361} {"train_loss": -41.21631407934772, "global_step": 285801, "epoch": 2361, "val_loss": 2562660.0} {"train_loss": -41.92840576171875, "global_step": 285802, "epoch": 2362} {"train_loss": -41.44025802612305, "global_step": 285803, "epoch": 2362} {"train_loss": -41.279232025146484, "global_step": 285804, "epoch": 2362} {"train_loss": -41.76505661010742, "global_step": 285805, "epoch": 2362} {"train_loss": -41.6927375793457, "global_step": 285806, "epoch": 2362} {"train_loss": -41.07846450805664, "global_step": 285807, "epoch": 2362} {"train_loss": -41.65470504760742, "global_step": 285808, "epoch": 2362} {"train_loss": -42.275360107421875, "global_step": 285809, "epoch": 2362} {"train_loss": -42.165252685546875, "global_step": 285810, "epoch": 2362} {"train_loss": -40.82565689086914, "global_step": 285811, "epoch": 2362} {"train_loss": -41.56524658203125, "global_step": 285812, "epoch": 2362} {"train_loss": -41.496307373046875, "global_step": 285813, "epoch": 2362} {"train_loss": -42.05181884765625, "global_step": 285814, "epoch": 2362} {"train_loss": -41.96604537963867, "global_step": 285815, "epoch": 2362} {"train_loss": -41.62656021118164, "global_step": 285816, "epoch": 2362} {"train_loss": -40.506614685058594, "global_step": 285817, "epoch": 2362} {"train_loss": -40.70613479614258, "global_step": 285818, "epoch": 2362} {"train_loss": -41.16910934448242, "global_step": 285819, "epoch": 2362} {"train_loss": -42.025882720947266, "global_step": 285820, "epoch": 2362} {"train_loss": -41.602352142333984, "global_step": 285821, "epoch": 2362} {"train_loss": -41.92374801635742, "global_step": 285822, "epoch": 2362} {"train_loss": -41.90424728393555, "global_step": 285823, "epoch": 2362} {"train_loss": -42.7927360534668, "global_step": 285824, "epoch": 2362} {"train_loss": -42.625179290771484, "global_step": 285825, "epoch": 2362} {"train_loss": -42.30727767944336, "global_step": 285826, "epoch": 2362} {"train_loss": -41.13158416748047, "global_step": 285827, "epoch": 2362} {"train_loss": -42.5682487487793, "global_step": 285828, "epoch": 2362} {"train_loss": -42.20753860473633, "global_step": 285829, "epoch": 2362} {"train_loss": -40.993099212646484, "global_step": 285830, "epoch": 2362} {"train_loss": -41.673553466796875, "global_step": 285831, "epoch": 2362} {"train_loss": -42.05147171020508, "global_step": 285832, "epoch": 2362} {"train_loss": -42.395545959472656, "global_step": 285833, "epoch": 2362} {"train_loss": -42.30134201049805, "global_step": 285834, "epoch": 2362} {"train_loss": -42.86139678955078, "global_step": 285835, "epoch": 2362} {"train_loss": -42.54756546020508, "global_step": 285836, "epoch": 2362} {"train_loss": -42.01604080200195, "global_step": 285837, "epoch": 2362} {"train_loss": -43.42110061645508, "global_step": 285838, "epoch": 2362} {"train_loss": -42.369895935058594, "global_step": 285839, "epoch": 2362} {"train_loss": -42.521602630615234, "global_step": 285840, "epoch": 2362} {"train_loss": -42.82773971557617, "global_step": 285841, "epoch": 2362} {"train_loss": -42.44704818725586, "global_step": 285842, "epoch": 2362} {"train_loss": -42.145606994628906, "global_step": 285843, "epoch": 2362} {"train_loss": -43.24541091918945, "global_step": 285844, "epoch": 2362} {"train_loss": -41.848690032958984, "global_step": 285845, "epoch": 2362} {"train_loss": -42.313209533691406, "global_step": 285846, "epoch": 2362} {"train_loss": -43.07989501953125, "global_step": 285847, "epoch": 2362} {"train_loss": -41.65401840209961, "global_step": 285848, "epoch": 2362} {"train_loss": -42.97438430786133, "global_step": 285849, "epoch": 2362} {"train_loss": -43.23017501831055, "global_step": 285850, "epoch": 2362} {"train_loss": -42.34309768676758, "global_step": 285851, "epoch": 2362} {"train_loss": -42.27057647705078, "global_step": 285852, "epoch": 2362} {"train_loss": -42.89397048950195, "global_step": 285853, "epoch": 2362} {"train_loss": -41.51866149902344, "global_step": 285854, "epoch": 2362} {"train_loss": -41.9463005065918, "global_step": 285855, "epoch": 2362} {"train_loss": -42.643245697021484, "global_step": 285856, "epoch": 2362} {"train_loss": -42.234947204589844, "global_step": 285857, "epoch": 2362} {"train_loss": -42.336788177490234, "global_step": 285858, "epoch": 2362} {"train_loss": -42.86404037475586, "global_step": 285859, "epoch": 2362} {"train_loss": -42.50222396850586, "global_step": 285860, "epoch": 2362} {"train_loss": -39.513389587402344, "global_step": 285861, "epoch": 2362} {"train_loss": -40.591609954833984, "global_step": 285862, "epoch": 2362} {"train_loss": -35.103816986083984, "global_step": 285863, "epoch": 2362} {"train_loss": -36.778907775878906, "global_step": 285864, "epoch": 2362} {"train_loss": -37.3819694519043, "global_step": 285865, "epoch": 2362} {"train_loss": -39.19934844970703, "global_step": 285866, "epoch": 2362} {"train_loss": -37.084041595458984, "global_step": 285867, "epoch": 2362} {"train_loss": -40.8195686340332, "global_step": 285868, "epoch": 2362} {"train_loss": -40.30752944946289, "global_step": 285869, "epoch": 2362} {"train_loss": -39.54231643676758, "global_step": 285870, "epoch": 2362} {"train_loss": -41.63114547729492, "global_step": 285871, "epoch": 2362} {"train_loss": -40.78279495239258, "global_step": 285872, "epoch": 2362} {"train_loss": -40.19084548950195, "global_step": 285873, "epoch": 2362} {"train_loss": -38.782955169677734, "global_step": 285874, "epoch": 2362} {"train_loss": -41.8426628112793, "global_step": 285875, "epoch": 2362} {"train_loss": -41.55699920654297, "global_step": 285876, "epoch": 2362} {"train_loss": -38.919063568115234, "global_step": 285877, "epoch": 2362} {"train_loss": -42.059234619140625, "global_step": 285878, "epoch": 2362} {"train_loss": -40.47954177856445, "global_step": 285879, "epoch": 2362} {"train_loss": -40.450523376464844, "global_step": 285880, "epoch": 2362} {"train_loss": -39.448787689208984, "global_step": 285881, "epoch": 2362} {"train_loss": -42.21087646484375, "global_step": 285882, "epoch": 2362} {"train_loss": -42.15617752075195, "global_step": 285883, "epoch": 2362} {"train_loss": -41.73676681518555, "global_step": 285884, "epoch": 2362} {"train_loss": -41.324562072753906, "global_step": 285885, "epoch": 2362} {"train_loss": -41.25129318237305, "global_step": 285886, "epoch": 2362} {"train_loss": -35.30935287475586, "global_step": 285887, "epoch": 2362} {"train_loss": -40.40232467651367, "global_step": 285888, "epoch": 2362} {"train_loss": -40.10774612426758, "global_step": 285889, "epoch": 2362} {"train_loss": -41.7904052734375, "global_step": 285890, "epoch": 2362} {"train_loss": -41.7586784362793, "global_step": 285891, "epoch": 2362} {"train_loss": -41.623897552490234, "global_step": 285892, "epoch": 2362} {"train_loss": -39.73199462890625, "global_step": 285893, "epoch": 2362} {"train_loss": -41.68272018432617, "global_step": 285894, "epoch": 2362} {"train_loss": -36.227943420410156, "global_step": 285895, "epoch": 2362} {"train_loss": -41.5994873046875, "global_step": 285896, "epoch": 2362} {"train_loss": -41.25078582763672, "global_step": 285897, "epoch": 2362} {"train_loss": -40.70304489135742, "global_step": 285898, "epoch": 2362} {"train_loss": -40.84638595581055, "global_step": 285899, "epoch": 2362} {"train_loss": -40.19776153564453, "global_step": 285900, "epoch": 2362} {"train_loss": -39.97712326049805, "global_step": 285901, "epoch": 2362} {"train_loss": -40.96730422973633, "global_step": 285902, "epoch": 2362} {"train_loss": -41.983299255371094, "global_step": 285903, "epoch": 2362} {"train_loss": -40.28205871582031, "global_step": 285904, "epoch": 2362} {"train_loss": -42.05900192260742, "global_step": 285905, "epoch": 2362} {"train_loss": -41.22016525268555, "global_step": 285906, "epoch": 2362} {"train_loss": -41.53670883178711, "global_step": 285907, "epoch": 2362} {"train_loss": -41.4207878112793, "global_step": 285908, "epoch": 2362} {"train_loss": -41.83449172973633, "global_step": 285909, "epoch": 2362} {"train_loss": -42.10471725463867, "global_step": 285910, "epoch": 2362} {"train_loss": -37.09284591674805, "global_step": 285911, "epoch": 2362} {"train_loss": -39.56899642944336, "global_step": 285912, "epoch": 2362} {"train_loss": -41.16416549682617, "global_step": 285913, "epoch": 2362} {"train_loss": -41.502647399902344, "global_step": 285914, "epoch": 2362} {"train_loss": -39.458309173583984, "global_step": 285915, "epoch": 2362} {"train_loss": -40.74061965942383, "global_step": 285916, "epoch": 2362} {"train_loss": -41.541378021240234, "global_step": 285917, "epoch": 2362} {"train_loss": -41.609474182128906, "global_step": 285918, "epoch": 2362} {"train_loss": -41.50712966918945, "global_step": 285919, "epoch": 2362} {"train_loss": -42.44486618041992, "global_step": 285920, "epoch": 2362} {"train_loss": -41.8439826965332, "global_step": 285921, "epoch": 2362} {"train_loss": -41.22805385747232, "global_step": 285922, "epoch": 2362, "val_loss": 2686513.0} {"train_loss": -40.68669509887695, "global_step": 285923, "epoch": 2363} {"train_loss": -40.57265090942383, "global_step": 285924, "epoch": 2363} {"train_loss": -42.012733459472656, "global_step": 285925, "epoch": 2363} {"train_loss": -40.7787971496582, "global_step": 285926, "epoch": 2363} {"train_loss": -39.7012939453125, "global_step": 285927, "epoch": 2363} {"train_loss": -42.5892219543457, "global_step": 285928, "epoch": 2363} {"train_loss": -42.029212951660156, "global_step": 285929, "epoch": 2363} {"train_loss": -41.22589111328125, "global_step": 285930, "epoch": 2363} {"train_loss": -41.799583435058594, "global_step": 285931, "epoch": 2363} {"train_loss": -42.00551223754883, "global_step": 285932, "epoch": 2363} {"train_loss": -40.14556121826172, "global_step": 285933, "epoch": 2363} {"train_loss": -41.63901901245117, "global_step": 285934, "epoch": 2363} {"train_loss": -40.06399154663086, "global_step": 285935, "epoch": 2363} {"train_loss": -41.849369049072266, "global_step": 285936, "epoch": 2363} {"train_loss": -41.483673095703125, "global_step": 285937, "epoch": 2363} {"train_loss": -40.952754974365234, "global_step": 285938, "epoch": 2363} {"train_loss": -40.85856246948242, "global_step": 285939, "epoch": 2363} {"train_loss": -42.410274505615234, "global_step": 285940, "epoch": 2363} {"train_loss": -41.3176155090332, "global_step": 285941, "epoch": 2363} {"train_loss": -41.771785736083984, "global_step": 285942, "epoch": 2363} {"train_loss": -41.45676803588867, "global_step": 285943, "epoch": 2363} {"train_loss": -40.94343948364258, "global_step": 285944, "epoch": 2363} {"train_loss": -41.37511444091797, "global_step": 285945, "epoch": 2363} {"train_loss": -37.91360092163086, "global_step": 285946, "epoch": 2363} {"train_loss": -42.044288635253906, "global_step": 285947, "epoch": 2363} {"train_loss": -41.47524642944336, "global_step": 285948, "epoch": 2363} {"train_loss": -34.80108642578125, "global_step": 285949, "epoch": 2363} {"train_loss": -41.68671798706055, "global_step": 285950, "epoch": 2363} {"train_loss": -39.213253021240234, "global_step": 285951, "epoch": 2363} {"train_loss": -41.95295333862305, "global_step": 285952, "epoch": 2363} {"train_loss": -42.27470016479492, "global_step": 285953, "epoch": 2363} {"train_loss": -41.22298812866211, "global_step": 285954, "epoch": 2363} {"train_loss": -41.345672607421875, "global_step": 285955, "epoch": 2363} {"train_loss": -40.817466735839844, "global_step": 285956, "epoch": 2363} {"train_loss": -40.65037155151367, "global_step": 285957, "epoch": 2363} {"train_loss": -41.648067474365234, "global_step": 285958, "epoch": 2363} {"train_loss": -42.3746337890625, "global_step": 285959, "epoch": 2363} {"train_loss": -42.108516693115234, "global_step": 285960, "epoch": 2363} {"train_loss": -39.883113861083984, "global_step": 285961, "epoch": 2363} {"train_loss": -41.05957794189453, "global_step": 285962, "epoch": 2363} {"train_loss": -41.82068634033203, "global_step": 285963, "epoch": 2363} {"train_loss": -41.49576187133789, "global_step": 285964, "epoch": 2363} {"train_loss": -40.2273063659668, "global_step": 285965, "epoch": 2363} {"train_loss": -41.520606994628906, "global_step": 285966, "epoch": 2363} {"train_loss": -42.20676803588867, "global_step": 285967, "epoch": 2363} {"train_loss": -39.16672134399414, "global_step": 285968, "epoch": 2363} {"train_loss": -41.60842514038086, "global_step": 285969, "epoch": 2363} {"train_loss": -41.01072311401367, "global_step": 285970, "epoch": 2363} {"train_loss": -39.88145446777344, "global_step": 285971, "epoch": 2363} {"train_loss": -42.28017044067383, "global_step": 285972, "epoch": 2363} {"train_loss": -41.811431884765625, "global_step": 285973, "epoch": 2363} {"train_loss": -41.7722282409668, "global_step": 285974, "epoch": 2363} {"train_loss": -41.7021598815918, "global_step": 285975, "epoch": 2363} {"train_loss": -42.28102111816406, "global_step": 285976, "epoch": 2363} {"train_loss": -42.646629333496094, "global_step": 285977, "epoch": 2363} {"train_loss": -42.489471435546875, "global_step": 285978, "epoch": 2363} {"train_loss": -42.7082633972168, "global_step": 285979, "epoch": 2363} {"train_loss": -42.66921615600586, "global_step": 285980, "epoch": 2363} {"train_loss": -42.85771942138672, "global_step": 285981, "epoch": 2363} {"train_loss": -42.4410285949707, "global_step": 285982, "epoch": 2363} {"train_loss": -42.7122802734375, "global_step": 285983, "epoch": 2363} {"train_loss": -42.102169036865234, "global_step": 285984, "epoch": 2363} {"train_loss": -42.7548713684082, "global_step": 285985, "epoch": 2363} {"train_loss": -42.12116241455078, "global_step": 285986, "epoch": 2363} {"train_loss": -42.31486892700195, "global_step": 285987, "epoch": 2363} {"train_loss": -42.97269058227539, "global_step": 285988, "epoch": 2363} {"train_loss": -41.742061614990234, "global_step": 285989, "epoch": 2363} {"train_loss": -42.327327728271484, "global_step": 285990, "epoch": 2363} {"train_loss": -42.39211654663086, "global_step": 285991, "epoch": 2363} {"train_loss": -42.94342803955078, "global_step": 285992, "epoch": 2363} {"train_loss": -42.883949279785156, "global_step": 285993, "epoch": 2363} {"train_loss": -43.3989372253418, "global_step": 285994, "epoch": 2363} {"train_loss": -42.38740921020508, "global_step": 285995, "epoch": 2363} {"train_loss": -42.82070541381836, "global_step": 285996, "epoch": 2363} {"train_loss": -40.57908248901367, "global_step": 285997, "epoch": 2363} {"train_loss": -37.816341400146484, "global_step": 285998, "epoch": 2363} {"train_loss": -38.06970977783203, "global_step": 285999, "epoch": 2363} {"train_loss": -40.907920837402344, "global_step": 286000, "epoch": 2363} {"train_loss": -41.11931228637695, "global_step": 286001, "epoch": 2363} {"train_loss": -40.86298370361328, "global_step": 286002, "epoch": 2363} {"train_loss": -40.526885986328125, "global_step": 286003, "epoch": 2363} {"train_loss": -39.607540130615234, "global_step": 286004, "epoch": 2363} {"train_loss": -39.65557861328125, "global_step": 286005, "epoch": 2363} {"train_loss": -39.683815002441406, "global_step": 286006, "epoch": 2363} {"train_loss": -39.86207580566406, "global_step": 286007, "epoch": 2363} {"train_loss": -39.866912841796875, "global_step": 286008, "epoch": 2363} {"train_loss": -35.86802291870117, "global_step": 286009, "epoch": 2363} {"train_loss": -40.36738586425781, "global_step": 286010, "epoch": 2363} {"train_loss": -41.80037307739258, "global_step": 286011, "epoch": 2363} {"train_loss": -37.888336181640625, "global_step": 286012, "epoch": 2363} {"train_loss": -39.85127258300781, "global_step": 286013, "epoch": 2363} {"train_loss": -40.43606185913086, "global_step": 286014, "epoch": 2363} {"train_loss": -40.99143981933594, "global_step": 286015, "epoch": 2363} {"train_loss": -37.067501068115234, "global_step": 286016, "epoch": 2363} {"train_loss": -40.39130783081055, "global_step": 286017, "epoch": 2363} {"train_loss": -37.3143196105957, "global_step": 286018, "epoch": 2363} {"train_loss": -38.845123291015625, "global_step": 286019, "epoch": 2363} {"train_loss": -39.681148529052734, "global_step": 286020, "epoch": 2363} {"train_loss": -40.1815299987793, "global_step": 286021, "epoch": 2363} {"train_loss": -35.44586944580078, "global_step": 286022, "epoch": 2363} {"train_loss": -38.6422233581543, "global_step": 286023, "epoch": 2363} {"train_loss": -40.297794342041016, "global_step": 286024, "epoch": 2363} {"train_loss": -40.10222244262695, "global_step": 286025, "epoch": 2363} {"train_loss": -41.37531661987305, "global_step": 286026, "epoch": 2363} {"train_loss": -41.123958587646484, "global_step": 286027, "epoch": 2363} {"train_loss": -41.0985221862793, "global_step": 286028, "epoch": 2363} {"train_loss": -39.624755859375, "global_step": 286029, "epoch": 2363} {"train_loss": -41.615421295166016, "global_step": 286030, "epoch": 2363} {"train_loss": -27.396121978759766, "global_step": 286031, "epoch": 2363} {"train_loss": -39.206939697265625, "global_step": 286032, "epoch": 2363} {"train_loss": -41.3021125793457, "global_step": 286033, "epoch": 2363} {"train_loss": -32.0713996887207, "global_step": 286034, "epoch": 2363} {"train_loss": -41.74174118041992, "global_step": 286035, "epoch": 2363} {"train_loss": -41.68223190307617, "global_step": 286036, "epoch": 2363} {"train_loss": -35.40667724609375, "global_step": 286037, "epoch": 2363} {"train_loss": -38.98936462402344, "global_step": 286038, "epoch": 2363} {"train_loss": -39.75373458862305, "global_step": 286039, "epoch": 2363} {"train_loss": -38.13257598876953, "global_step": 286040, "epoch": 2363} {"train_loss": -40.3177604675293, "global_step": 286041, "epoch": 2363} {"train_loss": -34.79616165161133, "global_step": 286042, "epoch": 2363} {"train_loss": -40.59738944187637, "global_step": 286043, "epoch": 2363, "val_loss": 3020061.75} {"train_loss": -41.12471008300781, "global_step": 286044, "epoch": 2364} {"train_loss": -41.713932037353516, "global_step": 286045, "epoch": 2364} {"train_loss": -41.685142517089844, "global_step": 286046, "epoch": 2364} {"train_loss": -37.30465316772461, "global_step": 286047, "epoch": 2364} {"train_loss": -41.313446044921875, "global_step": 286048, "epoch": 2364} {"train_loss": -39.14667892456055, "global_step": 286049, "epoch": 2364} {"train_loss": -41.43830490112305, "global_step": 286050, "epoch": 2364} {"train_loss": -41.23237228393555, "global_step": 286051, "epoch": 2364} {"train_loss": -42.195098876953125, "global_step": 286052, "epoch": 2364} {"train_loss": -39.2296028137207, "global_step": 286053, "epoch": 2364} {"train_loss": -40.169593811035156, "global_step": 286054, "epoch": 2364} {"train_loss": -41.28297805786133, "global_step": 286055, "epoch": 2364} {"train_loss": -36.51453399658203, "global_step": 286056, "epoch": 2364} {"train_loss": -41.47135543823242, "global_step": 286057, "epoch": 2364} {"train_loss": -41.51649475097656, "global_step": 286058, "epoch": 2364} {"train_loss": -41.531227111816406, "global_step": 286059, "epoch": 2364} {"train_loss": -39.386165618896484, "global_step": 286060, "epoch": 2364} {"train_loss": -41.15160369873047, "global_step": 286061, "epoch": 2364} {"train_loss": -41.711727142333984, "global_step": 286062, "epoch": 2364} {"train_loss": -39.9791374206543, "global_step": 286063, "epoch": 2364} {"train_loss": -41.4869270324707, "global_step": 286064, "epoch": 2364} {"train_loss": -41.38727569580078, "global_step": 286065, "epoch": 2364} {"train_loss": -30.201513290405273, "global_step": 286066, "epoch": 2364} {"train_loss": -37.533958435058594, "global_step": 286067, "epoch": 2364} {"train_loss": -39.21015548706055, "global_step": 286068, "epoch": 2364} {"train_loss": -38.21688461303711, "global_step": 286069, "epoch": 2364} {"train_loss": -40.54222106933594, "global_step": 286070, "epoch": 2364} {"train_loss": -40.44834899902344, "global_step": 286071, "epoch": 2364} {"train_loss": -36.05904769897461, "global_step": 286072, "epoch": 2364} {"train_loss": -41.25715255737305, "global_step": 286073, "epoch": 2364} {"train_loss": -39.81385803222656, "global_step": 286074, "epoch": 2364} {"train_loss": -39.46271896362305, "global_step": 286075, "epoch": 2364} {"train_loss": -40.378902435302734, "global_step": 286076, "epoch": 2364} {"train_loss": -40.56451416015625, "global_step": 286077, "epoch": 2364} {"train_loss": -41.084468841552734, "global_step": 286078, "epoch": 2364} {"train_loss": -38.58298110961914, "global_step": 286079, "epoch": 2364} {"train_loss": -40.1372184753418, "global_step": 286080, "epoch": 2364} {"train_loss": -39.02994155883789, "global_step": 286081, "epoch": 2364} {"train_loss": -40.932003021240234, "global_step": 286082, "epoch": 2364} {"train_loss": -39.09226608276367, "global_step": 286083, "epoch": 2364} {"train_loss": -39.590938568115234, "global_step": 286084, "epoch": 2364} {"train_loss": -41.487491607666016, "global_step": 286085, "epoch": 2364} {"train_loss": -34.298824310302734, "global_step": 286086, "epoch": 2364} {"train_loss": -41.1845588684082, "global_step": 286087, "epoch": 2364} {"train_loss": -40.93380355834961, "global_step": 286088, "epoch": 2364} {"train_loss": -39.93925094604492, "global_step": 286089, "epoch": 2364} {"train_loss": -37.4345703125, "global_step": 286090, "epoch": 2364} {"train_loss": -40.67902374267578, "global_step": 286091, "epoch": 2364} {"train_loss": -41.39005661010742, "global_step": 286092, "epoch": 2364} {"train_loss": -38.58574676513672, "global_step": 286093, "epoch": 2364} {"train_loss": -41.835140228271484, "global_step": 286094, "epoch": 2364} {"train_loss": -41.170894622802734, "global_step": 286095, "epoch": 2364} {"train_loss": -39.31234359741211, "global_step": 286096, "epoch": 2364} {"train_loss": -39.90274429321289, "global_step": 286097, "epoch": 2364} {"train_loss": -40.76987075805664, "global_step": 286098, "epoch": 2364} {"train_loss": -37.471229553222656, "global_step": 286099, "epoch": 2364} {"train_loss": -41.379966735839844, "global_step": 286100, "epoch": 2364} {"train_loss": -40.092342376708984, "global_step": 286101, "epoch": 2364} {"train_loss": -39.301918029785156, "global_step": 286102, "epoch": 2364} {"train_loss": -40.83608627319336, "global_step": 286103, "epoch": 2364} {"train_loss": -39.22111892700195, "global_step": 286104, "epoch": 2364} {"train_loss": -40.731746673583984, "global_step": 286105, "epoch": 2364} {"train_loss": -40.738319396972656, "global_step": 286106, "epoch": 2364} {"train_loss": -40.379112243652344, "global_step": 286107, "epoch": 2364} {"train_loss": -40.69852828979492, "global_step": 286108, "epoch": 2364} {"train_loss": -41.129878997802734, "global_step": 286109, "epoch": 2364} {"train_loss": -41.70621871948242, "global_step": 286110, "epoch": 2364} {"train_loss": -39.6712646484375, "global_step": 286111, "epoch": 2364} {"train_loss": -41.59035110473633, "global_step": 286112, "epoch": 2364} {"train_loss": -41.59856033325195, "global_step": 286113, "epoch": 2364} {"train_loss": -41.91277313232422, "global_step": 286114, "epoch": 2364} {"train_loss": -41.44169235229492, "global_step": 286115, "epoch": 2364} {"train_loss": -41.840179443359375, "global_step": 286116, "epoch": 2364} {"train_loss": -40.438716888427734, "global_step": 286117, "epoch": 2364} {"train_loss": -41.751129150390625, "global_step": 286118, "epoch": 2364} {"train_loss": -41.34637451171875, "global_step": 286119, "epoch": 2364} {"train_loss": -41.141597747802734, "global_step": 286120, "epoch": 2364} {"train_loss": -40.47526168823242, "global_step": 286121, "epoch": 2364} {"train_loss": -40.993377685546875, "global_step": 286122, "epoch": 2364} {"train_loss": -41.55847930908203, "global_step": 286123, "epoch": 2364} {"train_loss": -41.6681022644043, "global_step": 286124, "epoch": 2364} {"train_loss": -41.55215835571289, "global_step": 286125, "epoch": 2364} {"train_loss": -39.94135665893555, "global_step": 286126, "epoch": 2364} {"train_loss": -41.657196044921875, "global_step": 286127, "epoch": 2364} {"train_loss": -41.532588958740234, "global_step": 286128, "epoch": 2364} {"train_loss": -41.44051742553711, "global_step": 286129, "epoch": 2364} {"train_loss": -41.1295280456543, "global_step": 286130, "epoch": 2364} {"train_loss": -41.088172912597656, "global_step": 286131, "epoch": 2364} {"train_loss": -41.16901779174805, "global_step": 286132, "epoch": 2364} {"train_loss": -40.03987503051758, "global_step": 286133, "epoch": 2364} {"train_loss": -41.85966110229492, "global_step": 286134, "epoch": 2364} {"train_loss": -41.44983673095703, "global_step": 286135, "epoch": 2364} {"train_loss": -41.331607818603516, "global_step": 286136, "epoch": 2364} {"train_loss": -41.62125778198242, "global_step": 286137, "epoch": 2364} {"train_loss": -40.76206970214844, "global_step": 286138, "epoch": 2364} {"train_loss": -41.01272964477539, "global_step": 286139, "epoch": 2364} {"train_loss": -41.73371124267578, "global_step": 286140, "epoch": 2364} {"train_loss": -41.41401290893555, "global_step": 286141, "epoch": 2364} {"train_loss": -41.57121658325195, "global_step": 286142, "epoch": 2364} {"train_loss": -41.60873031616211, "global_step": 286143, "epoch": 2364} {"train_loss": -42.04597854614258, "global_step": 286144, "epoch": 2364} {"train_loss": -41.8722038269043, "global_step": 286145, "epoch": 2364} {"train_loss": -42.13029479980469, "global_step": 286146, "epoch": 2364} {"train_loss": -41.43705368041992, "global_step": 286147, "epoch": 2364} {"train_loss": -41.452789306640625, "global_step": 286148, "epoch": 2364} {"train_loss": -41.126747131347656, "global_step": 286149, "epoch": 2364} {"train_loss": -41.2656364440918, "global_step": 286150, "epoch": 2364} {"train_loss": -41.96680450439453, "global_step": 286151, "epoch": 2364} {"train_loss": -41.141056060791016, "global_step": 286152, "epoch": 2364} {"train_loss": -41.42319869995117, "global_step": 286153, "epoch": 2364} {"train_loss": -41.53324508666992, "global_step": 286154, "epoch": 2364} {"train_loss": -40.74414825439453, "global_step": 286155, "epoch": 2364} {"train_loss": -42.433589935302734, "global_step": 286156, "epoch": 2364} {"train_loss": -40.67129135131836, "global_step": 286157, "epoch": 2364} {"train_loss": -41.27824020385742, "global_step": 286158, "epoch": 2364} {"train_loss": -41.75262451171875, "global_step": 286159, "epoch": 2364} {"train_loss": -41.76472854614258, "global_step": 286160, "epoch": 2364} {"train_loss": -41.906776428222656, "global_step": 286161, "epoch": 2364} {"train_loss": -41.65552520751953, "global_step": 286162, "epoch": 2364} {"train_loss": -42.4836311340332, "global_step": 286163, "epoch": 2364} {"train_loss": -40.616049380341835, "global_step": 286164, "epoch": 2364, "val_loss": 2521026.25} {"train_loss": -41.94063186645508, "global_step": 286165, "epoch": 2365} {"train_loss": -42.184051513671875, "global_step": 286166, "epoch": 2365} {"train_loss": -42.594146728515625, "global_step": 286167, "epoch": 2365} {"train_loss": -42.409114837646484, "global_step": 286168, "epoch": 2365} {"train_loss": -42.37635040283203, "global_step": 286169, "epoch": 2365} {"train_loss": -41.36338424682617, "global_step": 286170, "epoch": 2365} {"train_loss": -42.53030776977539, "global_step": 286171, "epoch": 2365} {"train_loss": -42.70212936401367, "global_step": 286172, "epoch": 2365} {"train_loss": -41.95697021484375, "global_step": 286173, "epoch": 2365} {"train_loss": -41.862545013427734, "global_step": 286174, "epoch": 2365} {"train_loss": -42.15571975708008, "global_step": 286175, "epoch": 2365} {"train_loss": -42.09313201904297, "global_step": 286176, "epoch": 2365} {"train_loss": -41.964473724365234, "global_step": 286177, "epoch": 2365} {"train_loss": -42.71183395385742, "global_step": 286178, "epoch": 2365} {"train_loss": -42.389862060546875, "global_step": 286179, "epoch": 2365} {"train_loss": -42.30231857299805, "global_step": 286180, "epoch": 2365} {"train_loss": -42.5578727722168, "global_step": 286181, "epoch": 2365} {"train_loss": -42.264503479003906, "global_step": 286182, "epoch": 2365} {"train_loss": -42.984798431396484, "global_step": 286183, "epoch": 2365} {"train_loss": -42.213714599609375, "global_step": 286184, "epoch": 2365} {"train_loss": -42.14488220214844, "global_step": 286185, "epoch": 2365} {"train_loss": -42.14278793334961, "global_step": 286186, "epoch": 2365} {"train_loss": -41.79393768310547, "global_step": 286187, "epoch": 2365} {"train_loss": -40.23260498046875, "global_step": 286188, "epoch": 2365} {"train_loss": -40.11906051635742, "global_step": 286189, "epoch": 2365} {"train_loss": -38.53804397583008, "global_step": 286190, "epoch": 2365} {"train_loss": -38.6489143371582, "global_step": 286191, "epoch": 2365} {"train_loss": -38.923885345458984, "global_step": 286192, "epoch": 2365} {"train_loss": -40.21577835083008, "global_step": 286193, "epoch": 2365} {"train_loss": -35.132606506347656, "global_step": 286194, "epoch": 2365} {"train_loss": -38.22378158569336, "global_step": 286195, "epoch": 2365} {"train_loss": -40.4943962097168, "global_step": 286196, "epoch": 2365} {"train_loss": -39.267730712890625, "global_step": 286197, "epoch": 2365} {"train_loss": -37.90053176879883, "global_step": 286198, "epoch": 2365} {"train_loss": -39.120338439941406, "global_step": 286199, "epoch": 2365} {"train_loss": -39.66434860229492, "global_step": 286200, "epoch": 2365} {"train_loss": -40.599727630615234, "global_step": 286201, "epoch": 2365} {"train_loss": -40.34857940673828, "global_step": 286202, "epoch": 2365} {"train_loss": -40.0849609375, "global_step": 286203, "epoch": 2365} {"train_loss": -39.641136169433594, "global_step": 286204, "epoch": 2365} {"train_loss": -40.951351165771484, "global_step": 286205, "epoch": 2365} {"train_loss": -38.19698715209961, "global_step": 286206, "epoch": 2365} {"train_loss": -40.955955505371094, "global_step": 286207, "epoch": 2365} {"train_loss": -39.2288932800293, "global_step": 286208, "epoch": 2365} {"train_loss": -39.47682189941406, "global_step": 286209, "epoch": 2365} {"train_loss": -41.137916564941406, "global_step": 286210, "epoch": 2365} {"train_loss": -39.76251220703125, "global_step": 286211, "epoch": 2365} {"train_loss": -40.85745620727539, "global_step": 286212, "epoch": 2365} {"train_loss": -39.80048751831055, "global_step": 286213, "epoch": 2365} {"train_loss": -40.9923210144043, "global_step": 286214, "epoch": 2365} {"train_loss": -40.25990676879883, "global_step": 286215, "epoch": 2365} {"train_loss": -40.87108612060547, "global_step": 286216, "epoch": 2365} {"train_loss": -40.83074188232422, "global_step": 286217, "epoch": 2365} {"train_loss": -40.13639450073242, "global_step": 286218, "epoch": 2365} {"train_loss": -41.79558181762695, "global_step": 286219, "epoch": 2365} {"train_loss": -41.13750076293945, "global_step": 286220, "epoch": 2365} {"train_loss": -42.0112419128418, "global_step": 286221, "epoch": 2365} {"train_loss": -41.369014739990234, "global_step": 286222, "epoch": 2365} {"train_loss": -42.00178909301758, "global_step": 286223, "epoch": 2365} {"train_loss": -41.227962493896484, "global_step": 286224, "epoch": 2365} {"train_loss": -42.07630157470703, "global_step": 286225, "epoch": 2365} {"train_loss": -42.10407638549805, "global_step": 286226, "epoch": 2365} {"train_loss": -41.72630310058594, "global_step": 286227, "epoch": 2365} {"train_loss": -41.441558837890625, "global_step": 286228, "epoch": 2365} {"train_loss": -42.064300537109375, "global_step": 286229, "epoch": 2365} {"train_loss": -41.96529769897461, "global_step": 286230, "epoch": 2365} {"train_loss": -41.53228759765625, "global_step": 286231, "epoch": 2365} {"train_loss": -42.2390251159668, "global_step": 286232, "epoch": 2365} {"train_loss": -42.24094772338867, "global_step": 286233, "epoch": 2365} {"train_loss": -41.52442932128906, "global_step": 286234, "epoch": 2365} {"train_loss": -41.781856536865234, "global_step": 286235, "epoch": 2365} {"train_loss": -42.120784759521484, "global_step": 286236, "epoch": 2365} {"train_loss": -41.11983871459961, "global_step": 286237, "epoch": 2365} {"train_loss": -41.685638427734375, "global_step": 286238, "epoch": 2365} {"train_loss": -42.61787033081055, "global_step": 286239, "epoch": 2365} {"train_loss": -42.11308670043945, "global_step": 286240, "epoch": 2365} {"train_loss": -41.93238830566406, "global_step": 286241, "epoch": 2365} {"train_loss": -41.70858383178711, "global_step": 286242, "epoch": 2365} {"train_loss": -42.84965896606445, "global_step": 286243, "epoch": 2365} {"train_loss": -41.90882110595703, "global_step": 286244, "epoch": 2365} {"train_loss": -41.59806442260742, "global_step": 286245, "epoch": 2365} {"train_loss": -41.919403076171875, "global_step": 286246, "epoch": 2365} {"train_loss": -41.97337341308594, "global_step": 286247, "epoch": 2365} {"train_loss": -42.16303253173828, "global_step": 286248, "epoch": 2365} {"train_loss": -41.814979553222656, "global_step": 286249, "epoch": 2365} {"train_loss": -42.00942611694336, "global_step": 286250, "epoch": 2365} {"train_loss": -42.993465423583984, "global_step": 286251, "epoch": 2365} {"train_loss": -41.31171798706055, "global_step": 286252, "epoch": 2365} {"train_loss": -41.87277603149414, "global_step": 286253, "epoch": 2365} {"train_loss": -42.7769775390625, "global_step": 286254, "epoch": 2365} {"train_loss": -42.244667053222656, "global_step": 286255, "epoch": 2365} {"train_loss": -39.6161003112793, "global_step": 286256, "epoch": 2365} {"train_loss": -40.43136215209961, "global_step": 286257, "epoch": 2365} {"train_loss": -42.868682861328125, "global_step": 286258, "epoch": 2365} {"train_loss": -41.32087326049805, "global_step": 286259, "epoch": 2365} {"train_loss": -41.85423278808594, "global_step": 286260, "epoch": 2365} {"train_loss": -41.968448638916016, "global_step": 286261, "epoch": 2365} {"train_loss": -43.00177001953125, "global_step": 286262, "epoch": 2365} {"train_loss": -42.65324783325195, "global_step": 286263, "epoch": 2365} {"train_loss": -41.648433685302734, "global_step": 286264, "epoch": 2365} {"train_loss": -42.75151443481445, "global_step": 286265, "epoch": 2365} {"train_loss": -43.11566925048828, "global_step": 286266, "epoch": 2365} {"train_loss": -42.792091369628906, "global_step": 286267, "epoch": 2365} {"train_loss": -42.71734619140625, "global_step": 286268, "epoch": 2365} {"train_loss": -41.76607894897461, "global_step": 286269, "epoch": 2365} {"train_loss": -42.66777420043945, "global_step": 286270, "epoch": 2365} {"train_loss": -42.635406494140625, "global_step": 286271, "epoch": 2365} {"train_loss": -43.28428268432617, "global_step": 286272, "epoch": 2365} {"train_loss": -40.5430908203125, "global_step": 286273, "epoch": 2365} {"train_loss": -40.32451248168945, "global_step": 286274, "epoch": 2365} {"train_loss": -42.97847366333008, "global_step": 286275, "epoch": 2365} {"train_loss": -42.472129821777344, "global_step": 286276, "epoch": 2365} {"train_loss": -42.46427536010742, "global_step": 286277, "epoch": 2365} {"train_loss": -42.78447341918945, "global_step": 286278, "epoch": 2365} {"train_loss": -41.659698486328125, "global_step": 286279, "epoch": 2365} {"train_loss": -43.28506088256836, "global_step": 286280, "epoch": 2365} {"train_loss": -43.37141799926758, "global_step": 286281, "epoch": 2365} {"train_loss": -43.1054573059082, "global_step": 286282, "epoch": 2365} {"train_loss": -42.78792953491211, "global_step": 286283, "epoch": 2365} {"train_loss": -42.84684371948242, "global_step": 286284, "epoch": 2365} {"train_loss": -41.4527043429288, "global_step": 286285, "epoch": 2365, "val_loss": 2885655.25} {"train_loss": -41.19443893432617, "global_step": 286286, "epoch": 2366} {"train_loss": -42.516448974609375, "global_step": 286287, "epoch": 2366} {"train_loss": -41.92325210571289, "global_step": 286288, "epoch": 2366} {"train_loss": -38.3947639465332, "global_step": 286289, "epoch": 2366} {"train_loss": -39.61054611206055, "global_step": 286290, "epoch": 2366} {"train_loss": -40.619815826416016, "global_step": 286291, "epoch": 2366} {"train_loss": -41.98070526123047, "global_step": 286292, "epoch": 2366} {"train_loss": -42.40065383911133, "global_step": 286293, "epoch": 2366} {"train_loss": -40.1074333190918, "global_step": 286294, "epoch": 2366} {"train_loss": -40.52851486206055, "global_step": 286295, "epoch": 2366} {"train_loss": -40.924678802490234, "global_step": 286296, "epoch": 2366} {"train_loss": -40.4373893737793, "global_step": 286297, "epoch": 2366} {"train_loss": -42.53280258178711, "global_step": 286298, "epoch": 2366} {"train_loss": -42.136253356933594, "global_step": 286299, "epoch": 2366} {"train_loss": -41.83972930908203, "global_step": 286300, "epoch": 2366} {"train_loss": -41.84075927734375, "global_step": 286301, "epoch": 2366} {"train_loss": -40.6265983581543, "global_step": 286302, "epoch": 2366} {"train_loss": -41.916812896728516, "global_step": 286303, "epoch": 2366} {"train_loss": -40.80942916870117, "global_step": 286304, "epoch": 2366} {"train_loss": -42.647483825683594, "global_step": 286305, "epoch": 2366} {"train_loss": -41.34132385253906, "global_step": 286306, "epoch": 2366} {"train_loss": -42.11810302734375, "global_step": 286307, "epoch": 2366} {"train_loss": -40.642757415771484, "global_step": 286308, "epoch": 2366} {"train_loss": -42.12066650390625, "global_step": 286309, "epoch": 2366} {"train_loss": -41.75701904296875, "global_step": 286310, "epoch": 2366} {"train_loss": -41.30581283569336, "global_step": 286311, "epoch": 2366} {"train_loss": -42.2354850769043, "global_step": 286312, "epoch": 2366} {"train_loss": -42.60477828979492, "global_step": 286313, "epoch": 2366} {"train_loss": -41.94623565673828, "global_step": 286314, "epoch": 2366} {"train_loss": -42.54124450683594, "global_step": 286315, "epoch": 2366} {"train_loss": -42.66317367553711, "global_step": 286316, "epoch": 2366} {"train_loss": -41.97407913208008, "global_step": 286317, "epoch": 2366} {"train_loss": -41.540828704833984, "global_step": 286318, "epoch": 2366} {"train_loss": -42.41341781616211, "global_step": 286319, "epoch": 2366} {"train_loss": -41.38228988647461, "global_step": 286320, "epoch": 2366} {"train_loss": -42.08149719238281, "global_step": 286321, "epoch": 2366} {"train_loss": -42.78668212890625, "global_step": 286322, "epoch": 2366} {"train_loss": -42.393497467041016, "global_step": 286323, "epoch": 2366} {"train_loss": -42.58943557739258, "global_step": 286324, "epoch": 2366} {"train_loss": -42.22903060913086, "global_step": 286325, "epoch": 2366} {"train_loss": -42.67256546020508, "global_step": 286326, "epoch": 2366} {"train_loss": -42.92182922363281, "global_step": 286327, "epoch": 2366} {"train_loss": -42.108062744140625, "global_step": 286328, "epoch": 2366} {"train_loss": -42.770782470703125, "global_step": 286329, "epoch": 2366} {"train_loss": -42.88832092285156, "global_step": 286330, "epoch": 2366} {"train_loss": -41.89932632446289, "global_step": 286331, "epoch": 2366} {"train_loss": -41.35275650024414, "global_step": 286332, "epoch": 2366} {"train_loss": -42.63604736328125, "global_step": 286333, "epoch": 2366} {"train_loss": -43.26877212524414, "global_step": 286334, "epoch": 2366} {"train_loss": -42.68782424926758, "global_step": 286335, "epoch": 2366} {"train_loss": -42.23295974731445, "global_step": 286336, "epoch": 2366} {"train_loss": -41.433815002441406, "global_step": 286337, "epoch": 2366} {"train_loss": -42.63158416748047, "global_step": 286338, "epoch": 2366} {"train_loss": -42.48424530029297, "global_step": 286339, "epoch": 2366} {"train_loss": -43.15332794189453, "global_step": 286340, "epoch": 2366} {"train_loss": -42.382328033447266, "global_step": 286341, "epoch": 2366} {"train_loss": -41.880462646484375, "global_step": 286342, "epoch": 2366} {"train_loss": -42.74209213256836, "global_step": 286343, "epoch": 2366} {"train_loss": -41.58074951171875, "global_step": 286344, "epoch": 2366} {"train_loss": -42.47213363647461, "global_step": 286345, "epoch": 2366} {"train_loss": -42.050479888916016, "global_step": 286346, "epoch": 2366} {"train_loss": -42.554443359375, "global_step": 286347, "epoch": 2366} {"train_loss": -41.96910858154297, "global_step": 286348, "epoch": 2366} {"train_loss": -42.836517333984375, "global_step": 286349, "epoch": 2366} {"train_loss": -42.232421875, "global_step": 286350, "epoch": 2366} {"train_loss": -40.5430908203125, "global_step": 286351, "epoch": 2366} {"train_loss": -42.34706497192383, "global_step": 286352, "epoch": 2366} {"train_loss": -41.9476318359375, "global_step": 286353, "epoch": 2366} {"train_loss": -43.079803466796875, "global_step": 286354, "epoch": 2366} {"train_loss": -42.79716110229492, "global_step": 286355, "epoch": 2366} {"train_loss": -42.974002838134766, "global_step": 286356, "epoch": 2366} {"train_loss": -43.26385498046875, "global_step": 286357, "epoch": 2366} {"train_loss": -42.33600997924805, "global_step": 286358, "epoch": 2366} {"train_loss": -42.255714416503906, "global_step": 286359, "epoch": 2366} {"train_loss": -42.173980712890625, "global_step": 286360, "epoch": 2366} {"train_loss": -40.1140251159668, "global_step": 286361, "epoch": 2366} {"train_loss": -42.47466278076172, "global_step": 286362, "epoch": 2366} {"train_loss": -41.99079132080078, "global_step": 286363, "epoch": 2366} {"train_loss": -42.31987380981445, "global_step": 286364, "epoch": 2366} {"train_loss": -42.98942947387695, "global_step": 286365, "epoch": 2366} {"train_loss": -41.301361083984375, "global_step": 286366, "epoch": 2366} {"train_loss": -43.2525520324707, "global_step": 286367, "epoch": 2366} {"train_loss": -42.22953414916992, "global_step": 286368, "epoch": 2366} {"train_loss": -41.87180709838867, "global_step": 286369, "epoch": 2366} {"train_loss": -42.2729606628418, "global_step": 286370, "epoch": 2366} {"train_loss": -41.2451171875, "global_step": 286371, "epoch": 2366} {"train_loss": -42.60737228393555, "global_step": 286372, "epoch": 2366} {"train_loss": -42.18157958984375, "global_step": 286373, "epoch": 2366} {"train_loss": -40.42407989501953, "global_step": 286374, "epoch": 2366} {"train_loss": -42.107398986816406, "global_step": 286375, "epoch": 2366} {"train_loss": -43.15543746948242, "global_step": 286376, "epoch": 2366} {"train_loss": -42.79692459106445, "global_step": 286377, "epoch": 2366} {"train_loss": -41.99520492553711, "global_step": 286378, "epoch": 2366} {"train_loss": -38.72040939331055, "global_step": 286379, "epoch": 2366} {"train_loss": -42.29964828491211, "global_step": 286380, "epoch": 2366} {"train_loss": -41.201942443847656, "global_step": 286381, "epoch": 2366} {"train_loss": -37.82124710083008, "global_step": 286382, "epoch": 2366} {"train_loss": -41.004859924316406, "global_step": 286383, "epoch": 2366} {"train_loss": -42.733367919921875, "global_step": 286384, "epoch": 2366} {"train_loss": -42.49285888671875, "global_step": 286385, "epoch": 2366} {"train_loss": -42.82412338256836, "global_step": 286386, "epoch": 2366} {"train_loss": -41.95858383178711, "global_step": 286387, "epoch": 2366} {"train_loss": -42.29106521606445, "global_step": 286388, "epoch": 2366} {"train_loss": -40.84457778930664, "global_step": 286389, "epoch": 2366} {"train_loss": -41.66852569580078, "global_step": 286390, "epoch": 2366} {"train_loss": -39.586177825927734, "global_step": 286391, "epoch": 2366} {"train_loss": -34.40999221801758, "global_step": 286392, "epoch": 2366} {"train_loss": -41.52710723876953, "global_step": 286393, "epoch": 2366} {"train_loss": -39.80662155151367, "global_step": 286394, "epoch": 2366} {"train_loss": -40.919315338134766, "global_step": 286395, "epoch": 2366} {"train_loss": -40.70526885986328, "global_step": 286396, "epoch": 2366} {"train_loss": -29.3817138671875, "global_step": 286397, "epoch": 2366} {"train_loss": -41.372859954833984, "global_step": 286398, "epoch": 2366} {"train_loss": -41.90542984008789, "global_step": 286399, "epoch": 2366} {"train_loss": -41.653045654296875, "global_step": 286400, "epoch": 2366} {"train_loss": -41.91416931152344, "global_step": 286401, "epoch": 2366} {"train_loss": -31.295063018798828, "global_step": 286402, "epoch": 2366} {"train_loss": -40.42139434814453, "global_step": 286403, "epoch": 2366} {"train_loss": -38.138397216796875, "global_step": 286404, "epoch": 2366} {"train_loss": -40.40507125854492, "global_step": 286405, "epoch": 2366} {"train_loss": -41.5382494020068, "global_step": 286406, "epoch": 2366, "val_loss": 2732014.25} {"train_loss": -40.66718673706055, "global_step": 286407, "epoch": 2367} {"train_loss": -39.16270446777344, "global_step": 286408, "epoch": 2367} {"train_loss": -35.42292022705078, "global_step": 286409, "epoch": 2367} {"train_loss": -38.018306732177734, "global_step": 286410, "epoch": 2367} {"train_loss": -39.38230895996094, "global_step": 286411, "epoch": 2367} {"train_loss": -39.961849212646484, "global_step": 286412, "epoch": 2367} {"train_loss": -39.16254806518555, "global_step": 286413, "epoch": 2367} {"train_loss": -39.9940299987793, "global_step": 286414, "epoch": 2367} {"train_loss": -38.13231658935547, "global_step": 286415, "epoch": 2367} {"train_loss": -40.582916259765625, "global_step": 286416, "epoch": 2367} {"train_loss": -39.48252487182617, "global_step": 286417, "epoch": 2367} {"train_loss": -40.51285171508789, "global_step": 286418, "epoch": 2367} {"train_loss": -40.96891403198242, "global_step": 286419, "epoch": 2367} {"train_loss": -40.403526306152344, "global_step": 286420, "epoch": 2367} {"train_loss": -37.14332580566406, "global_step": 286421, "epoch": 2367} {"train_loss": -41.01532745361328, "global_step": 286422, "epoch": 2367} {"train_loss": -41.23500442504883, "global_step": 286423, "epoch": 2367} {"train_loss": -41.26455307006836, "global_step": 286424, "epoch": 2367} {"train_loss": -40.21376419067383, "global_step": 286425, "epoch": 2367} {"train_loss": -41.218257904052734, "global_step": 286426, "epoch": 2367} {"train_loss": -40.855987548828125, "global_step": 286427, "epoch": 2367} {"train_loss": -34.4713249206543, "global_step": 286428, "epoch": 2367} {"train_loss": -41.08779525756836, "global_step": 286429, "epoch": 2367} {"train_loss": -38.131309509277344, "global_step": 286430, "epoch": 2367} {"train_loss": -40.778167724609375, "global_step": 286431, "epoch": 2367} {"train_loss": -39.8775634765625, "global_step": 286432, "epoch": 2367} {"train_loss": -41.1263542175293, "global_step": 286433, "epoch": 2367} {"train_loss": -41.710208892822266, "global_step": 286434, "epoch": 2367} {"train_loss": -39.5057487487793, "global_step": 286435, "epoch": 2367} {"train_loss": -39.98762893676758, "global_step": 286436, "epoch": 2367} {"train_loss": -41.949256896972656, "global_step": 286437, "epoch": 2367} {"train_loss": -39.65838623046875, "global_step": 286438, "epoch": 2367} {"train_loss": -41.570335388183594, "global_step": 286439, "epoch": 2367} {"train_loss": -41.3436279296875, "global_step": 286440, "epoch": 2367} {"train_loss": -40.585060119628906, "global_step": 286441, "epoch": 2367} {"train_loss": -40.847042083740234, "global_step": 286442, "epoch": 2367} {"train_loss": -41.590145111083984, "global_step": 286443, "epoch": 2367} {"train_loss": -41.771728515625, "global_step": 286444, "epoch": 2367} {"train_loss": -38.68004608154297, "global_step": 286445, "epoch": 2367} {"train_loss": -39.33586502075195, "global_step": 286446, "epoch": 2367} {"train_loss": -40.94696807861328, "global_step": 286447, "epoch": 2367} {"train_loss": -41.40829086303711, "global_step": 286448, "epoch": 2367} {"train_loss": -41.52632522583008, "global_step": 286449, "epoch": 2367} {"train_loss": -41.95707702636719, "global_step": 286450, "epoch": 2367} {"train_loss": -42.77329635620117, "global_step": 286451, "epoch": 2367} {"train_loss": -42.087982177734375, "global_step": 286452, "epoch": 2367} {"train_loss": -41.86511993408203, "global_step": 286453, "epoch": 2367} {"train_loss": -41.669002532958984, "global_step": 286454, "epoch": 2367} {"train_loss": -40.6784553527832, "global_step": 286455, "epoch": 2367} {"train_loss": -41.740325927734375, "global_step": 286456, "epoch": 2367} {"train_loss": -42.361141204833984, "global_step": 286457, "epoch": 2367} {"train_loss": -41.77056884765625, "global_step": 286458, "epoch": 2367} {"train_loss": -41.537879943847656, "global_step": 286459, "epoch": 2367} {"train_loss": -42.5558967590332, "global_step": 286460, "epoch": 2367} {"train_loss": -41.63740158081055, "global_step": 286461, "epoch": 2367} {"train_loss": -41.98160934448242, "global_step": 286462, "epoch": 2367} {"train_loss": -42.045623779296875, "global_step": 286463, "epoch": 2367} {"train_loss": -40.24264144897461, "global_step": 286464, "epoch": 2367} {"train_loss": -42.62177658081055, "global_step": 286465, "epoch": 2367} {"train_loss": -39.92280197143555, "global_step": 286466, "epoch": 2367} {"train_loss": -41.482295989990234, "global_step": 286467, "epoch": 2367} {"train_loss": -40.94179916381836, "global_step": 286468, "epoch": 2367} {"train_loss": -41.776153564453125, "global_step": 286469, "epoch": 2367} {"train_loss": -41.57402801513672, "global_step": 286470, "epoch": 2367} {"train_loss": -41.6096076965332, "global_step": 286471, "epoch": 2367} {"train_loss": -42.4517822265625, "global_step": 286472, "epoch": 2367} {"train_loss": -42.178035736083984, "global_step": 286473, "epoch": 2367} {"train_loss": -41.927276611328125, "global_step": 286474, "epoch": 2367} {"train_loss": -42.59450912475586, "global_step": 286475, "epoch": 2367} {"train_loss": -41.54354476928711, "global_step": 286476, "epoch": 2367} {"train_loss": -40.24068832397461, "global_step": 286477, "epoch": 2367} {"train_loss": -42.68050003051758, "global_step": 286478, "epoch": 2367} {"train_loss": -42.76968002319336, "global_step": 286479, "epoch": 2367} {"train_loss": -41.676239013671875, "global_step": 286480, "epoch": 2367} {"train_loss": -42.464881896972656, "global_step": 286481, "epoch": 2367} {"train_loss": -42.71393966674805, "global_step": 286482, "epoch": 2367} {"train_loss": -42.63059616088867, "global_step": 286483, "epoch": 2367} {"train_loss": -42.82646179199219, "global_step": 286484, "epoch": 2367} {"train_loss": -42.04587936401367, "global_step": 286485, "epoch": 2367} {"train_loss": -42.29397201538086, "global_step": 286486, "epoch": 2367} {"train_loss": -40.7517204284668, "global_step": 286487, "epoch": 2367} {"train_loss": -41.81050491333008, "global_step": 286488, "epoch": 2367} {"train_loss": -41.736690521240234, "global_step": 286489, "epoch": 2367} {"train_loss": -41.854347229003906, "global_step": 286490, "epoch": 2367} {"train_loss": -42.213050842285156, "global_step": 286491, "epoch": 2367} {"train_loss": -42.64125061035156, "global_step": 286492, "epoch": 2367} {"train_loss": -42.97883224487305, "global_step": 286493, "epoch": 2367} {"train_loss": -42.63792037963867, "global_step": 286494, "epoch": 2367} {"train_loss": -41.239845275878906, "global_step": 286495, "epoch": 2367} {"train_loss": -43.0147705078125, "global_step": 286496, "epoch": 2367} {"train_loss": -42.786170959472656, "global_step": 286497, "epoch": 2367} {"train_loss": -40.1514778137207, "global_step": 286498, "epoch": 2367} {"train_loss": -42.07587814331055, "global_step": 286499, "epoch": 2367} {"train_loss": -42.291866302490234, "global_step": 286500, "epoch": 2367} {"train_loss": -41.578609466552734, "global_step": 286501, "epoch": 2367} {"train_loss": -40.20807647705078, "global_step": 286502, "epoch": 2367} {"train_loss": -40.972991943359375, "global_step": 286503, "epoch": 2367} {"train_loss": -41.159767150878906, "global_step": 286504, "epoch": 2367} {"train_loss": -42.036373138427734, "global_step": 286505, "epoch": 2367} {"train_loss": -39.139373779296875, "global_step": 286506, "epoch": 2367} {"train_loss": -38.827423095703125, "global_step": 286507, "epoch": 2367} {"train_loss": -41.930023193359375, "global_step": 286508, "epoch": 2367} {"train_loss": -41.882240295410156, "global_step": 286509, "epoch": 2367} {"train_loss": -40.04172134399414, "global_step": 286510, "epoch": 2367} {"train_loss": -38.729366302490234, "global_step": 286511, "epoch": 2367} {"train_loss": -41.672664642333984, "global_step": 286512, "epoch": 2367} {"train_loss": -41.97766876220703, "global_step": 286513, "epoch": 2367} {"train_loss": -40.62860107421875, "global_step": 286514, "epoch": 2367} {"train_loss": -40.87481689453125, "global_step": 286515, "epoch": 2367} {"train_loss": -41.77884292602539, "global_step": 286516, "epoch": 2367} {"train_loss": -41.67967224121094, "global_step": 286517, "epoch": 2367} {"train_loss": -40.09857177734375, "global_step": 286518, "epoch": 2367} {"train_loss": -41.325008392333984, "global_step": 286519, "epoch": 2367} {"train_loss": -41.20882797241211, "global_step": 286520, "epoch": 2367} {"train_loss": -40.50589370727539, "global_step": 286521, "epoch": 2367} {"train_loss": -42.03729248046875, "global_step": 286522, "epoch": 2367} {"train_loss": -40.393550872802734, "global_step": 286523, "epoch": 2367} {"train_loss": -39.55865478515625, "global_step": 286524, "epoch": 2367} {"train_loss": -40.56504821777344, "global_step": 286525, "epoch": 2367} {"train_loss": -41.84687423706055, "global_step": 286526, "epoch": 2367} {"train_loss": -41.02375071501929, "global_step": 286527, "epoch": 2367, "val_loss": 2457333.25} {"train_loss": -40.262306213378906, "global_step": 286528, "epoch": 2368} {"train_loss": -41.23784255981445, "global_step": 286529, "epoch": 2368} {"train_loss": -42.227210998535156, "global_step": 286530, "epoch": 2368} {"train_loss": -41.29417037963867, "global_step": 286531, "epoch": 2368} {"train_loss": -39.885738372802734, "global_step": 286532, "epoch": 2368} {"train_loss": -42.1318359375, "global_step": 286533, "epoch": 2368} {"train_loss": -42.12607955932617, "global_step": 286534, "epoch": 2368} {"train_loss": -41.68272018432617, "global_step": 286535, "epoch": 2368} {"train_loss": -41.5241813659668, "global_step": 286536, "epoch": 2368} {"train_loss": -41.82250213623047, "global_step": 286537, "epoch": 2368} {"train_loss": -42.487579345703125, "global_step": 286538, "epoch": 2368} {"train_loss": -41.99857711791992, "global_step": 286539, "epoch": 2368} {"train_loss": -42.72693634033203, "global_step": 286540, "epoch": 2368} {"train_loss": -41.545265197753906, "global_step": 286541, "epoch": 2368} {"train_loss": -42.17717361450195, "global_step": 286542, "epoch": 2368} {"train_loss": -42.314456939697266, "global_step": 286543, "epoch": 2368} {"train_loss": -42.31130599975586, "global_step": 286544, "epoch": 2368} {"train_loss": -41.68775939941406, "global_step": 286545, "epoch": 2368} {"train_loss": -42.157012939453125, "global_step": 286546, "epoch": 2368} {"train_loss": -42.65107345581055, "global_step": 286547, "epoch": 2368} {"train_loss": -42.78801345825195, "global_step": 286548, "epoch": 2368} {"train_loss": -42.60869216918945, "global_step": 286549, "epoch": 2368} {"train_loss": -41.49011993408203, "global_step": 286550, "epoch": 2368} {"train_loss": -43.1596565246582, "global_step": 286551, "epoch": 2368} {"train_loss": -42.39348220825195, "global_step": 286552, "epoch": 2368} {"train_loss": -42.537330627441406, "global_step": 286553, "epoch": 2368} {"train_loss": -43.648921966552734, "global_step": 286554, "epoch": 2368} {"train_loss": -41.6177978515625, "global_step": 286555, "epoch": 2368} {"train_loss": -42.5074577331543, "global_step": 286556, "epoch": 2368} {"train_loss": -42.73990249633789, "global_step": 286557, "epoch": 2368} {"train_loss": -42.819759368896484, "global_step": 286558, "epoch": 2368} {"train_loss": -42.72030258178711, "global_step": 286559, "epoch": 2368} {"train_loss": -43.04843521118164, "global_step": 286560, "epoch": 2368} {"train_loss": -43.48211669921875, "global_step": 286561, "epoch": 2368} {"train_loss": -42.454986572265625, "global_step": 286562, "epoch": 2368} {"train_loss": -42.215240478515625, "global_step": 286563, "epoch": 2368} {"train_loss": -43.373783111572266, "global_step": 286564, "epoch": 2368} {"train_loss": -41.9868278503418, "global_step": 286565, "epoch": 2368} {"train_loss": -42.76831817626953, "global_step": 286566, "epoch": 2368} {"train_loss": -43.009002685546875, "global_step": 286567, "epoch": 2368} {"train_loss": -42.941139221191406, "global_step": 286568, "epoch": 2368} {"train_loss": -42.72328567504883, "global_step": 286569, "epoch": 2368} {"train_loss": -43.01539611816406, "global_step": 286570, "epoch": 2368} {"train_loss": -42.879573822021484, "global_step": 286571, "epoch": 2368} {"train_loss": -42.47309112548828, "global_step": 286572, "epoch": 2368} {"train_loss": -42.41514205932617, "global_step": 286573, "epoch": 2368} {"train_loss": -42.370174407958984, "global_step": 286574, "epoch": 2368} {"train_loss": -41.3319206237793, "global_step": 286575, "epoch": 2368} {"train_loss": -42.16394805908203, "global_step": 286576, "epoch": 2368} {"train_loss": -43.01860427856445, "global_step": 286577, "epoch": 2368} {"train_loss": -42.281097412109375, "global_step": 286578, "epoch": 2368} {"train_loss": -41.681819915771484, "global_step": 286579, "epoch": 2368} {"train_loss": -42.46818923950195, "global_step": 286580, "epoch": 2368} {"train_loss": -43.08913803100586, "global_step": 286581, "epoch": 2368} {"train_loss": -42.85506820678711, "global_step": 286582, "epoch": 2368} {"train_loss": -41.978057861328125, "global_step": 286583, "epoch": 2368} {"train_loss": -42.672447204589844, "global_step": 286584, "epoch": 2368} {"train_loss": -43.14645004272461, "global_step": 286585, "epoch": 2368} {"train_loss": -42.2729606628418, "global_step": 286586, "epoch": 2368} {"train_loss": -40.26710891723633, "global_step": 286587, "epoch": 2368} {"train_loss": -41.80348205566406, "global_step": 286588, "epoch": 2368} {"train_loss": -42.12617111206055, "global_step": 286589, "epoch": 2368} {"train_loss": -38.05671691894531, "global_step": 286590, "epoch": 2368} {"train_loss": -39.41990280151367, "global_step": 286591, "epoch": 2368} {"train_loss": -42.41373825073242, "global_step": 286592, "epoch": 2368} {"train_loss": -41.37773132324219, "global_step": 286593, "epoch": 2368} {"train_loss": -40.03068923950195, "global_step": 286594, "epoch": 2368} {"train_loss": -40.34531784057617, "global_step": 286595, "epoch": 2368} {"train_loss": -42.051063537597656, "global_step": 286596, "epoch": 2368} {"train_loss": -40.959632873535156, "global_step": 286597, "epoch": 2368} {"train_loss": -41.00730514526367, "global_step": 286598, "epoch": 2368} {"train_loss": -40.18082809448242, "global_step": 286599, "epoch": 2368} {"train_loss": -40.65867233276367, "global_step": 286600, "epoch": 2368} {"train_loss": -40.29331970214844, "global_step": 286601, "epoch": 2368} {"train_loss": -40.078182220458984, "global_step": 286602, "epoch": 2368} {"train_loss": -39.09283447265625, "global_step": 286603, "epoch": 2368} {"train_loss": -41.242279052734375, "global_step": 286604, "epoch": 2368} {"train_loss": -41.5740852355957, "global_step": 286605, "epoch": 2368} {"train_loss": -40.60219955444336, "global_step": 286606, "epoch": 2368} {"train_loss": -41.42643356323242, "global_step": 286607, "epoch": 2368} {"train_loss": -41.6163215637207, "global_step": 286608, "epoch": 2368} {"train_loss": -41.98759078979492, "global_step": 286609, "epoch": 2368} {"train_loss": -39.619564056396484, "global_step": 286610, "epoch": 2368} {"train_loss": -40.03751754760742, "global_step": 286611, "epoch": 2368} {"train_loss": -39.368377685546875, "global_step": 286612, "epoch": 2368} {"train_loss": -42.19332504272461, "global_step": 286613, "epoch": 2368} {"train_loss": -40.8558464050293, "global_step": 286614, "epoch": 2368} {"train_loss": -41.32672882080078, "global_step": 286615, "epoch": 2368} {"train_loss": -41.33351516723633, "global_step": 286616, "epoch": 2368} {"train_loss": -36.21157455444336, "global_step": 286617, "epoch": 2368} {"train_loss": -41.599395751953125, "global_step": 286618, "epoch": 2368} {"train_loss": -42.61110305786133, "global_step": 286619, "epoch": 2368} {"train_loss": -41.388179779052734, "global_step": 286620, "epoch": 2368} {"train_loss": -42.377655029296875, "global_step": 286621, "epoch": 2368} {"train_loss": -41.61699295043945, "global_step": 286622, "epoch": 2368} {"train_loss": -42.035186767578125, "global_step": 286623, "epoch": 2368} {"train_loss": -42.053466796875, "global_step": 286624, "epoch": 2368} {"train_loss": -42.23318099975586, "global_step": 286625, "epoch": 2368} {"train_loss": -42.5584602355957, "global_step": 286626, "epoch": 2368} {"train_loss": -42.51328659057617, "global_step": 286627, "epoch": 2368} {"train_loss": -41.58341598510742, "global_step": 286628, "epoch": 2368} {"train_loss": -41.70496368408203, "global_step": 286629, "epoch": 2368} {"train_loss": -42.741634368896484, "global_step": 286630, "epoch": 2368} {"train_loss": -42.28818893432617, "global_step": 286631, "epoch": 2368} {"train_loss": -42.91794204711914, "global_step": 286632, "epoch": 2368} {"train_loss": -42.74372100830078, "global_step": 286633, "epoch": 2368} {"train_loss": -42.49445724487305, "global_step": 286634, "epoch": 2368} {"train_loss": -42.595027923583984, "global_step": 286635, "epoch": 2368} {"train_loss": -42.705894470214844, "global_step": 286636, "epoch": 2368} {"train_loss": -42.63550567626953, "global_step": 286637, "epoch": 2368} {"train_loss": -42.46523666381836, "global_step": 286638, "epoch": 2368} {"train_loss": -42.927398681640625, "global_step": 286639, "epoch": 2368} {"train_loss": -42.656124114990234, "global_step": 286640, "epoch": 2368} {"train_loss": -42.68284225463867, "global_step": 286641, "epoch": 2368} {"train_loss": -42.088958740234375, "global_step": 286642, "epoch": 2368} {"train_loss": -42.61408996582031, "global_step": 286643, "epoch": 2368} {"train_loss": -42.173152923583984, "global_step": 286644, "epoch": 2368} {"train_loss": -42.88369369506836, "global_step": 286645, "epoch": 2368} {"train_loss": -42.790096282958984, "global_step": 286646, "epoch": 2368} {"train_loss": -42.24699020385742, "global_step": 286647, "epoch": 2368} {"train_loss": -41.902459704186306, "global_step": 286648, "epoch": 2368, "val_loss": 2538790.75} {"train_loss": -42.68528366088867, "global_step": 286649, "epoch": 2369} {"train_loss": -42.50102233886719, "global_step": 286650, "epoch": 2369} {"train_loss": -42.9178466796875, "global_step": 286651, "epoch": 2369} {"train_loss": -42.292537689208984, "global_step": 286652, "epoch": 2369} {"train_loss": -42.8698844909668, "global_step": 286653, "epoch": 2369} {"train_loss": -42.55482864379883, "global_step": 286654, "epoch": 2369} {"train_loss": -42.551673889160156, "global_step": 286655, "epoch": 2369} {"train_loss": -43.14742660522461, "global_step": 286656, "epoch": 2369} {"train_loss": -42.268489837646484, "global_step": 286657, "epoch": 2369} {"train_loss": -42.721736907958984, "global_step": 286658, "epoch": 2369} {"train_loss": -42.985267639160156, "global_step": 286659, "epoch": 2369} {"train_loss": -42.21122360229492, "global_step": 286660, "epoch": 2369} {"train_loss": -41.44546127319336, "global_step": 286661, "epoch": 2369} {"train_loss": -43.03818130493164, "global_step": 286662, "epoch": 2369} {"train_loss": -43.07486343383789, "global_step": 286663, "epoch": 2369} {"train_loss": -43.28708267211914, "global_step": 286664, "epoch": 2369} {"train_loss": -42.98161697387695, "global_step": 286665, "epoch": 2369} {"train_loss": -42.499874114990234, "global_step": 286666, "epoch": 2369} {"train_loss": -42.75112533569336, "global_step": 286667, "epoch": 2369} {"train_loss": -42.634681701660156, "global_step": 286668, "epoch": 2369} {"train_loss": -43.264644622802734, "global_step": 286669, "epoch": 2369} {"train_loss": -43.07280731201172, "global_step": 286670, "epoch": 2369} {"train_loss": -42.34775924682617, "global_step": 286671, "epoch": 2369} {"train_loss": -43.10487747192383, "global_step": 286672, "epoch": 2369} {"train_loss": -42.93376159667969, "global_step": 286673, "epoch": 2369} {"train_loss": -42.63917922973633, "global_step": 286674, "epoch": 2369} {"train_loss": -42.54305648803711, "global_step": 286675, "epoch": 2369} {"train_loss": -43.038814544677734, "global_step": 286676, "epoch": 2369} {"train_loss": -42.99991226196289, "global_step": 286677, "epoch": 2369} {"train_loss": -42.96872329711914, "global_step": 286678, "epoch": 2369} {"train_loss": -42.59012985229492, "global_step": 286679, "epoch": 2369} {"train_loss": -43.14973068237305, "global_step": 286680, "epoch": 2369} {"train_loss": -43.40119552612305, "global_step": 286681, "epoch": 2369} {"train_loss": -43.02250289916992, "global_step": 286682, "epoch": 2369} {"train_loss": -42.72426223754883, "global_step": 286683, "epoch": 2369} {"train_loss": -43.66215515136719, "global_step": 286684, "epoch": 2369} {"train_loss": -42.147098541259766, "global_step": 286685, "epoch": 2369} {"train_loss": -41.65975570678711, "global_step": 286686, "epoch": 2369} {"train_loss": -41.98873519897461, "global_step": 286687, "epoch": 2369} {"train_loss": -43.154502868652344, "global_step": 286688, "epoch": 2369} {"train_loss": -42.90238571166992, "global_step": 286689, "epoch": 2369} {"train_loss": -42.84648132324219, "global_step": 286690, "epoch": 2369} {"train_loss": -42.37459945678711, "global_step": 286691, "epoch": 2369} {"train_loss": -42.32674026489258, "global_step": 286692, "epoch": 2369} {"train_loss": -41.31223678588867, "global_step": 286693, "epoch": 2369} {"train_loss": -41.15998077392578, "global_step": 286694, "epoch": 2369} {"train_loss": -40.490570068359375, "global_step": 286695, "epoch": 2369} {"train_loss": -40.87521743774414, "global_step": 286696, "epoch": 2369} {"train_loss": -41.66010665893555, "global_step": 286697, "epoch": 2369} {"train_loss": -42.02105712890625, "global_step": 286698, "epoch": 2369} {"train_loss": -41.43746566772461, "global_step": 286699, "epoch": 2369} {"train_loss": -41.547603607177734, "global_step": 286700, "epoch": 2369} {"train_loss": -42.1609001159668, "global_step": 286701, "epoch": 2369} {"train_loss": -41.566776275634766, "global_step": 286702, "epoch": 2369} {"train_loss": -42.873355865478516, "global_step": 286703, "epoch": 2369} {"train_loss": -42.12856674194336, "global_step": 286704, "epoch": 2369} {"train_loss": -41.71405029296875, "global_step": 286705, "epoch": 2369} {"train_loss": -41.823768615722656, "global_step": 286706, "epoch": 2369} {"train_loss": -42.643348693847656, "global_step": 286707, "epoch": 2369} {"train_loss": -42.95479965209961, "global_step": 286708, "epoch": 2369} {"train_loss": -42.08614730834961, "global_step": 286709, "epoch": 2369} {"train_loss": -42.804786682128906, "global_step": 286710, "epoch": 2369} {"train_loss": -42.06525802612305, "global_step": 286711, "epoch": 2369} {"train_loss": -42.311038970947266, "global_step": 286712, "epoch": 2369} {"train_loss": -41.556095123291016, "global_step": 286713, "epoch": 2369} {"train_loss": -41.98725509643555, "global_step": 286714, "epoch": 2369} {"train_loss": -42.895591735839844, "global_step": 286715, "epoch": 2369} {"train_loss": -42.378143310546875, "global_step": 286716, "epoch": 2369} {"train_loss": -42.618106842041016, "global_step": 286717, "epoch": 2369} {"train_loss": -42.63371658325195, "global_step": 286718, "epoch": 2369} {"train_loss": -42.257564544677734, "global_step": 286719, "epoch": 2369} {"train_loss": -41.60692596435547, "global_step": 286720, "epoch": 2369} {"train_loss": -41.022865295410156, "global_step": 286721, "epoch": 2369} {"train_loss": -43.334144592285156, "global_step": 286722, "epoch": 2369} {"train_loss": -42.59840393066406, "global_step": 286723, "epoch": 2369} {"train_loss": -41.695396423339844, "global_step": 286724, "epoch": 2369} {"train_loss": -43.01552963256836, "global_step": 286725, "epoch": 2369} {"train_loss": -42.438289642333984, "global_step": 286726, "epoch": 2369} {"train_loss": -42.859527587890625, "global_step": 286727, "epoch": 2369} {"train_loss": -43.42287063598633, "global_step": 286728, "epoch": 2369} {"train_loss": -43.141761779785156, "global_step": 286729, "epoch": 2369} {"train_loss": -42.75840377807617, "global_step": 286730, "epoch": 2369} {"train_loss": -43.0181999206543, "global_step": 286731, "epoch": 2369} {"train_loss": -43.73012924194336, "global_step": 286732, "epoch": 2369} {"train_loss": -42.8496208190918, "global_step": 286733, "epoch": 2369} {"train_loss": -38.98222732543945, "global_step": 286734, "epoch": 2369} {"train_loss": -42.783546447753906, "global_step": 286735, "epoch": 2369} {"train_loss": -42.53767013549805, "global_step": 286736, "epoch": 2369} {"train_loss": -43.437103271484375, "global_step": 286737, "epoch": 2369} {"train_loss": -43.16669845581055, "global_step": 286738, "epoch": 2369} {"train_loss": -42.18756866455078, "global_step": 286739, "epoch": 2369} {"train_loss": -41.07050323486328, "global_step": 286740, "epoch": 2369} {"train_loss": -41.711029052734375, "global_step": 286741, "epoch": 2369} {"train_loss": -43.270633697509766, "global_step": 286742, "epoch": 2369} {"train_loss": -42.10377883911133, "global_step": 286743, "epoch": 2369} {"train_loss": -37.74467849731445, "global_step": 286744, "epoch": 2369} {"train_loss": -42.03921890258789, "global_step": 286745, "epoch": 2369} {"train_loss": -42.00001907348633, "global_step": 286746, "epoch": 2369} {"train_loss": -40.43479537963867, "global_step": 286747, "epoch": 2369} {"train_loss": -38.54065704345703, "global_step": 286748, "epoch": 2369} {"train_loss": -38.37073516845703, "global_step": 286749, "epoch": 2369} {"train_loss": -41.458351135253906, "global_step": 286750, "epoch": 2369} {"train_loss": -42.14461135864258, "global_step": 286751, "epoch": 2369} {"train_loss": -41.2283935546875, "global_step": 286752, "epoch": 2369} {"train_loss": -40.441768646240234, "global_step": 286753, "epoch": 2369} {"train_loss": -42.34712219238281, "global_step": 286754, "epoch": 2369} {"train_loss": -42.3830451965332, "global_step": 286755, "epoch": 2369} {"train_loss": -40.35683822631836, "global_step": 286756, "epoch": 2369} {"train_loss": -41.10584259033203, "global_step": 286757, "epoch": 2369} {"train_loss": -42.62797164916992, "global_step": 286758, "epoch": 2369} {"train_loss": -39.97553253173828, "global_step": 286759, "epoch": 2369} {"train_loss": -41.048851013183594, "global_step": 286760, "epoch": 2369} {"train_loss": -41.82512664794922, "global_step": 286761, "epoch": 2369} {"train_loss": -41.7917366027832, "global_step": 286762, "epoch": 2369} {"train_loss": -42.221065521240234, "global_step": 286763, "epoch": 2369} {"train_loss": -40.839534759521484, "global_step": 286764, "epoch": 2369} {"train_loss": -42.1873779296875, "global_step": 286765, "epoch": 2369} {"train_loss": -42.51731491088867, "global_step": 286766, "epoch": 2369} {"train_loss": -42.03516387939453, "global_step": 286767, "epoch": 2369} {"train_loss": -42.61255645751953, "global_step": 286768, "epoch": 2369} {"train_loss": -42.1881486876937, "global_step": 286769, "epoch": 2369, "val_loss": 2500524.75} {"train_loss": -41.8621940612793, "global_step": 286770, "epoch": 2370} {"train_loss": -42.04270553588867, "global_step": 286771, "epoch": 2370} {"train_loss": -41.19279098510742, "global_step": 286772, "epoch": 2370} {"train_loss": -42.54569625854492, "global_step": 286773, "epoch": 2370} {"train_loss": -40.4797248840332, "global_step": 286774, "epoch": 2370} {"train_loss": -40.32184600830078, "global_step": 286775, "epoch": 2370} {"train_loss": -42.34012222290039, "global_step": 286776, "epoch": 2370} {"train_loss": -41.48017501831055, "global_step": 286777, "epoch": 2370} {"train_loss": -42.961856842041016, "global_step": 286778, "epoch": 2370} {"train_loss": -40.852928161621094, "global_step": 286779, "epoch": 2370} {"train_loss": -42.02734375, "global_step": 286780, "epoch": 2370} {"train_loss": -41.61167907714844, "global_step": 286781, "epoch": 2370} {"train_loss": -42.167354583740234, "global_step": 286782, "epoch": 2370} {"train_loss": -43.25006866455078, "global_step": 286783, "epoch": 2370} {"train_loss": -42.49507522583008, "global_step": 286784, "epoch": 2370} {"train_loss": -43.143455505371094, "global_step": 286785, "epoch": 2370} {"train_loss": -42.521514892578125, "global_step": 286786, "epoch": 2370} {"train_loss": -42.90291976928711, "global_step": 286787, "epoch": 2370} {"train_loss": -43.08369827270508, "global_step": 286788, "epoch": 2370} {"train_loss": -42.48059844970703, "global_step": 286789, "epoch": 2370} {"train_loss": -43.21623611450195, "global_step": 286790, "epoch": 2370} {"train_loss": -43.29703140258789, "global_step": 286791, "epoch": 2370} {"train_loss": -42.84043884277344, "global_step": 286792, "epoch": 2370} {"train_loss": -43.166786193847656, "global_step": 286793, "epoch": 2370} {"train_loss": -42.773284912109375, "global_step": 286794, "epoch": 2370} {"train_loss": -42.1920280456543, "global_step": 286795, "epoch": 2370} {"train_loss": -43.69124221801758, "global_step": 286796, "epoch": 2370} {"train_loss": -42.833194732666016, "global_step": 286797, "epoch": 2370} {"train_loss": -43.62691879272461, "global_step": 286798, "epoch": 2370} {"train_loss": -43.31081008911133, "global_step": 286799, "epoch": 2370} {"train_loss": -43.1615104675293, "global_step": 286800, "epoch": 2370} {"train_loss": -42.530086517333984, "global_step": 286801, "epoch": 2370} {"train_loss": -43.23651123046875, "global_step": 286802, "epoch": 2370} {"train_loss": -43.1336784362793, "global_step": 286803, "epoch": 2370} {"train_loss": -42.79703903198242, "global_step": 286804, "epoch": 2370} {"train_loss": -43.608001708984375, "global_step": 286805, "epoch": 2370} {"train_loss": -43.51279830932617, "global_step": 286806, "epoch": 2370} {"train_loss": -42.74032211303711, "global_step": 286807, "epoch": 2370} {"train_loss": -43.01366424560547, "global_step": 286808, "epoch": 2370} {"train_loss": -43.32666015625, "global_step": 286809, "epoch": 2370} {"train_loss": -43.13703918457031, "global_step": 286810, "epoch": 2370} {"train_loss": -41.845001220703125, "global_step": 286811, "epoch": 2370} {"train_loss": -42.86975860595703, "global_step": 286812, "epoch": 2370} {"train_loss": -42.046348571777344, "global_step": 286813, "epoch": 2370} {"train_loss": -42.06582260131836, "global_step": 286814, "epoch": 2370} {"train_loss": -41.906578063964844, "global_step": 286815, "epoch": 2370} {"train_loss": -43.244747161865234, "global_step": 286816, "epoch": 2370} {"train_loss": -41.77279281616211, "global_step": 286817, "epoch": 2370} {"train_loss": -41.99391555786133, "global_step": 286818, "epoch": 2370} {"train_loss": -42.21730422973633, "global_step": 286819, "epoch": 2370} {"train_loss": -42.41838836669922, "global_step": 286820, "epoch": 2370} {"train_loss": -42.00760269165039, "global_step": 286821, "epoch": 2370} {"train_loss": -42.771297454833984, "global_step": 286822, "epoch": 2370} {"train_loss": -43.28904342651367, "global_step": 286823, "epoch": 2370} {"train_loss": -42.97639846801758, "global_step": 286824, "epoch": 2370} {"train_loss": -41.9243049621582, "global_step": 286825, "epoch": 2370} {"train_loss": -42.51936721801758, "global_step": 286826, "epoch": 2370} {"train_loss": -42.36539840698242, "global_step": 286827, "epoch": 2370} {"train_loss": -41.317378997802734, "global_step": 286828, "epoch": 2370} {"train_loss": -42.84267807006836, "global_step": 286829, "epoch": 2370} {"train_loss": -41.58382797241211, "global_step": 286830, "epoch": 2370} {"train_loss": -42.0338249206543, "global_step": 286831, "epoch": 2370} {"train_loss": -42.30420684814453, "global_step": 286832, "epoch": 2370} {"train_loss": -42.167903900146484, "global_step": 286833, "epoch": 2370} {"train_loss": -41.939971923828125, "global_step": 286834, "epoch": 2370} {"train_loss": -42.93923568725586, "global_step": 286835, "epoch": 2370} {"train_loss": -43.23292922973633, "global_step": 286836, "epoch": 2370} {"train_loss": -42.681610107421875, "global_step": 286837, "epoch": 2370} {"train_loss": -43.20649719238281, "global_step": 286838, "epoch": 2370} {"train_loss": -43.1884880065918, "global_step": 286839, "epoch": 2370} {"train_loss": -42.80126190185547, "global_step": 286840, "epoch": 2370} {"train_loss": -42.06527328491211, "global_step": 286841, "epoch": 2370} {"train_loss": -42.17810821533203, "global_step": 286842, "epoch": 2370} {"train_loss": -42.022377014160156, "global_step": 286843, "epoch": 2370} {"train_loss": -42.559906005859375, "global_step": 286844, "epoch": 2370} {"train_loss": -43.1218147277832, "global_step": 286845, "epoch": 2370} {"train_loss": -43.55454635620117, "global_step": 286846, "epoch": 2370} {"train_loss": -42.7906494140625, "global_step": 286847, "epoch": 2370} {"train_loss": -41.49656295776367, "global_step": 286848, "epoch": 2370} {"train_loss": -43.119197845458984, "global_step": 286849, "epoch": 2370} {"train_loss": -43.01929473876953, "global_step": 286850, "epoch": 2370} {"train_loss": -42.642948150634766, "global_step": 286851, "epoch": 2370} {"train_loss": -43.147796630859375, "global_step": 286852, "epoch": 2370} {"train_loss": -42.473236083984375, "global_step": 286853, "epoch": 2370} {"train_loss": -42.491939544677734, "global_step": 286854, "epoch": 2370} {"train_loss": -42.529964447021484, "global_step": 286855, "epoch": 2370} {"train_loss": -43.104427337646484, "global_step": 286856, "epoch": 2370} {"train_loss": -42.75127410888672, "global_step": 286857, "epoch": 2370} {"train_loss": -43.10708236694336, "global_step": 286858, "epoch": 2370} {"train_loss": -43.22180938720703, "global_step": 286859, "epoch": 2370} {"train_loss": -42.95691680908203, "global_step": 286860, "epoch": 2370} {"train_loss": -41.90298080444336, "global_step": 286861, "epoch": 2370} {"train_loss": -43.65009307861328, "global_step": 286862, "epoch": 2370} {"train_loss": -42.35863494873047, "global_step": 286863, "epoch": 2370} {"train_loss": -42.52069854736328, "global_step": 286864, "epoch": 2370} {"train_loss": -42.47291946411133, "global_step": 286865, "epoch": 2370} {"train_loss": -41.5719108581543, "global_step": 286866, "epoch": 2370} {"train_loss": -42.019344329833984, "global_step": 286867, "epoch": 2370} {"train_loss": -41.44227600097656, "global_step": 286868, "epoch": 2370} {"train_loss": -42.28672790527344, "global_step": 286869, "epoch": 2370} {"train_loss": -41.094451904296875, "global_step": 286870, "epoch": 2370} {"train_loss": -42.149837493896484, "global_step": 286871, "epoch": 2370} {"train_loss": -42.49099349975586, "global_step": 286872, "epoch": 2370} {"train_loss": -42.5247917175293, "global_step": 286873, "epoch": 2370} {"train_loss": -41.65205383300781, "global_step": 286874, "epoch": 2370} {"train_loss": -41.85163497924805, "global_step": 286875, "epoch": 2370} {"train_loss": -42.45803451538086, "global_step": 286876, "epoch": 2370} {"train_loss": -42.10022735595703, "global_step": 286877, "epoch": 2370} {"train_loss": -40.622005462646484, "global_step": 286878, "epoch": 2370} {"train_loss": -38.13576889038086, "global_step": 286879, "epoch": 2370} {"train_loss": -38.95468521118164, "global_step": 286880, "epoch": 2370} {"train_loss": -42.25697708129883, "global_step": 286881, "epoch": 2370} {"train_loss": -39.33232879638672, "global_step": 286882, "epoch": 2370} {"train_loss": -40.383399963378906, "global_step": 286883, "epoch": 2370} {"train_loss": -38.711971282958984, "global_step": 286884, "epoch": 2370} {"train_loss": -34.56880569458008, "global_step": 286885, "epoch": 2370} {"train_loss": -36.081546783447266, "global_step": 286886, "epoch": 2370} {"train_loss": -30.063831329345703, "global_step": 286887, "epoch": 2370} {"train_loss": -34.48067855834961, "global_step": 286888, "epoch": 2370} {"train_loss": -34.878047943115234, "global_step": 286889, "epoch": 2370} {"train_loss": -41.92920101575615, "global_step": 286890, "epoch": 2370, "val_loss": 3104047.25} {"train_loss": -37.61369323730469, "global_step": 286891, "epoch": 2371} {"train_loss": -35.433284759521484, "global_step": 286892, "epoch": 2371} {"train_loss": -38.45096969604492, "global_step": 286893, "epoch": 2371} {"train_loss": -28.938465118408203, "global_step": 286894, "epoch": 2371} {"train_loss": -38.30989456176758, "global_step": 286895, "epoch": 2371} {"train_loss": -35.0308723449707, "global_step": 286896, "epoch": 2371} {"train_loss": -34.191524505615234, "global_step": 286897, "epoch": 2371} {"train_loss": -35.99209213256836, "global_step": 286898, "epoch": 2371} {"train_loss": -35.837982177734375, "global_step": 286899, "epoch": 2371} {"train_loss": -39.478721618652344, "global_step": 286900, "epoch": 2371} {"train_loss": -33.03340530395508, "global_step": 286901, "epoch": 2371} {"train_loss": -40.2657585144043, "global_step": 286902, "epoch": 2371} {"train_loss": -38.54247283935547, "global_step": 286903, "epoch": 2371} {"train_loss": -36.774139404296875, "global_step": 286904, "epoch": 2371} {"train_loss": -39.56797409057617, "global_step": 286905, "epoch": 2371} {"train_loss": -35.98939895629883, "global_step": 286906, "epoch": 2371} {"train_loss": -37.01900863647461, "global_step": 286907, "epoch": 2371} {"train_loss": -35.18500900268555, "global_step": 286908, "epoch": 2371} {"train_loss": -38.30890655517578, "global_step": 286909, "epoch": 2371} {"train_loss": -31.00433921813965, "global_step": 286910, "epoch": 2371} {"train_loss": -39.3005485534668, "global_step": 286911, "epoch": 2371} {"train_loss": -39.502681732177734, "global_step": 286912, "epoch": 2371} {"train_loss": -37.95866012573242, "global_step": 286913, "epoch": 2371} {"train_loss": -38.0737190246582, "global_step": 286914, "epoch": 2371} {"train_loss": -38.937007904052734, "global_step": 286915, "epoch": 2371} {"train_loss": -37.52785110473633, "global_step": 286916, "epoch": 2371} {"train_loss": -38.84183120727539, "global_step": 286917, "epoch": 2371} {"train_loss": -34.4818115234375, "global_step": 286918, "epoch": 2371} {"train_loss": -40.18193817138672, "global_step": 286919, "epoch": 2371} {"train_loss": -39.015159606933594, "global_step": 286920, "epoch": 2371} {"train_loss": -40.50635528564453, "global_step": 286921, "epoch": 2371} {"train_loss": -40.954280853271484, "global_step": 286922, "epoch": 2371} {"train_loss": -38.0954704284668, "global_step": 286923, "epoch": 2371} {"train_loss": -39.461692810058594, "global_step": 286924, "epoch": 2371} {"train_loss": -38.19560623168945, "global_step": 286925, "epoch": 2371} {"train_loss": -39.30708694458008, "global_step": 286926, "epoch": 2371} {"train_loss": -39.466426849365234, "global_step": 286927, "epoch": 2371} {"train_loss": -40.49281692504883, "global_step": 286928, "epoch": 2371} {"train_loss": -39.8872184753418, "global_step": 286929, "epoch": 2371} {"train_loss": -40.43156814575195, "global_step": 286930, "epoch": 2371} {"train_loss": -39.08150100708008, "global_step": 286931, "epoch": 2371} {"train_loss": -40.666080474853516, "global_step": 286932, "epoch": 2371} {"train_loss": -40.28535461425781, "global_step": 286933, "epoch": 2371} {"train_loss": -40.777767181396484, "global_step": 286934, "epoch": 2371} {"train_loss": -41.06589889526367, "global_step": 286935, "epoch": 2371} {"train_loss": -40.441463470458984, "global_step": 286936, "epoch": 2371} {"train_loss": -39.35382843017578, "global_step": 286937, "epoch": 2371} {"train_loss": -41.09075927734375, "global_step": 286938, "epoch": 2371} {"train_loss": -40.059776306152344, "global_step": 286939, "epoch": 2371} {"train_loss": -40.58112335205078, "global_step": 286940, "epoch": 2371} {"train_loss": -41.0382080078125, "global_step": 286941, "epoch": 2371} {"train_loss": -41.51520919799805, "global_step": 286942, "epoch": 2371} {"train_loss": -41.33125305175781, "global_step": 286943, "epoch": 2371} {"train_loss": -39.09822082519531, "global_step": 286944, "epoch": 2371} {"train_loss": -41.52035140991211, "global_step": 286945, "epoch": 2371} {"train_loss": -40.554351806640625, "global_step": 286946, "epoch": 2371} {"train_loss": -37.326263427734375, "global_step": 286947, "epoch": 2371} {"train_loss": -41.60063171386719, "global_step": 286948, "epoch": 2371} {"train_loss": -41.17412185668945, "global_step": 286949, "epoch": 2371} {"train_loss": -40.81687927246094, "global_step": 286950, "epoch": 2371} {"train_loss": -41.62996292114258, "global_step": 286951, "epoch": 2371} {"train_loss": -42.16395568847656, "global_step": 286952, "epoch": 2371} {"train_loss": -40.606258392333984, "global_step": 286953, "epoch": 2371} {"train_loss": -41.101009368896484, "global_step": 286954, "epoch": 2371} {"train_loss": -41.3772087097168, "global_step": 286955, "epoch": 2371} {"train_loss": -41.579830169677734, "global_step": 286956, "epoch": 2371} {"train_loss": -41.24885177612305, "global_step": 286957, "epoch": 2371} {"train_loss": -42.0538444519043, "global_step": 286958, "epoch": 2371} {"train_loss": -41.395755767822266, "global_step": 286959, "epoch": 2371} {"train_loss": -40.94822311401367, "global_step": 286960, "epoch": 2371} {"train_loss": -42.3887825012207, "global_step": 286961, "epoch": 2371} {"train_loss": -38.4046516418457, "global_step": 286962, "epoch": 2371} {"train_loss": -40.652400970458984, "global_step": 286963, "epoch": 2371} {"train_loss": -41.89738082885742, "global_step": 286964, "epoch": 2371} {"train_loss": -41.86172866821289, "global_step": 286965, "epoch": 2371} {"train_loss": -42.275550842285156, "global_step": 286966, "epoch": 2371} {"train_loss": -42.346946716308594, "global_step": 286967, "epoch": 2371} {"train_loss": -40.58763122558594, "global_step": 286968, "epoch": 2371} {"train_loss": -39.35787582397461, "global_step": 286969, "epoch": 2371} {"train_loss": -42.221946716308594, "global_step": 286970, "epoch": 2371} {"train_loss": -41.97733688354492, "global_step": 286971, "epoch": 2371} {"train_loss": -41.74884796142578, "global_step": 286972, "epoch": 2371} {"train_loss": -41.409507751464844, "global_step": 286973, "epoch": 2371} {"train_loss": -42.14070510864258, "global_step": 286974, "epoch": 2371} {"train_loss": -41.942909240722656, "global_step": 286975, "epoch": 2371} {"train_loss": -41.702999114990234, "global_step": 286976, "epoch": 2371} {"train_loss": -41.85700225830078, "global_step": 286977, "epoch": 2371} {"train_loss": -42.568416595458984, "global_step": 286978, "epoch": 2371} {"train_loss": -41.69252395629883, "global_step": 286979, "epoch": 2371} {"train_loss": -41.62844467163086, "global_step": 286980, "epoch": 2371} {"train_loss": -41.963531494140625, "global_step": 286981, "epoch": 2371} {"train_loss": -42.48169708251953, "global_step": 286982, "epoch": 2371} {"train_loss": -41.676361083984375, "global_step": 286983, "epoch": 2371} {"train_loss": -42.674468994140625, "global_step": 286984, "epoch": 2371} {"train_loss": -39.4102897644043, "global_step": 286985, "epoch": 2371} {"train_loss": -41.513153076171875, "global_step": 286986, "epoch": 2371} {"train_loss": -42.204811096191406, "global_step": 286987, "epoch": 2371} {"train_loss": -42.029563903808594, "global_step": 286988, "epoch": 2371} {"train_loss": -42.402565002441406, "global_step": 286989, "epoch": 2371} {"train_loss": -42.846099853515625, "global_step": 286990, "epoch": 2371} {"train_loss": -42.20108413696289, "global_step": 286991, "epoch": 2371} {"train_loss": -42.03471755981445, "global_step": 286992, "epoch": 2371} {"train_loss": -42.20345687866211, "global_step": 286993, "epoch": 2371} {"train_loss": -42.367027282714844, "global_step": 286994, "epoch": 2371} {"train_loss": -42.68122482299805, "global_step": 286995, "epoch": 2371} {"train_loss": -43.03116226196289, "global_step": 286996, "epoch": 2371} {"train_loss": -42.81209945678711, "global_step": 286997, "epoch": 2371} {"train_loss": -39.48598098754883, "global_step": 286998, "epoch": 2371} {"train_loss": -42.621429443359375, "global_step": 286999, "epoch": 2371} {"train_loss": -40.348201751708984, "global_step": 287000, "epoch": 2371} {"train_loss": -42.78025817871094, "global_step": 287001, "epoch": 2371} {"train_loss": -41.89485168457031, "global_step": 287002, "epoch": 2371} {"train_loss": -42.394779205322266, "global_step": 287003, "epoch": 2371} {"train_loss": -43.336334228515625, "global_step": 287004, "epoch": 2371} {"train_loss": -41.297576904296875, "global_step": 287005, "epoch": 2371} {"train_loss": -41.61334991455078, "global_step": 287006, "epoch": 2371} {"train_loss": -41.942405700683594, "global_step": 287007, "epoch": 2371} {"train_loss": -42.08945846557617, "global_step": 287008, "epoch": 2371} {"train_loss": -43.08240509033203, "global_step": 287009, "epoch": 2371} {"train_loss": -41.27242660522461, "global_step": 287010, "epoch": 2371} {"train_loss": -40.181491962149124, "global_step": 287011, "epoch": 2371, "val_loss": 2436654.0} {"train_loss": -42.6355094909668, "global_step": 287012, "epoch": 2372} {"train_loss": -41.816871643066406, "global_step": 287013, "epoch": 2372} {"train_loss": -42.76631546020508, "global_step": 287014, "epoch": 2372} {"train_loss": -42.95025634765625, "global_step": 287015, "epoch": 2372} {"train_loss": -43.31959915161133, "global_step": 287016, "epoch": 2372} {"train_loss": -42.71149826049805, "global_step": 287017, "epoch": 2372} {"train_loss": -40.32535934448242, "global_step": 287018, "epoch": 2372} {"train_loss": -39.38557815551758, "global_step": 287019, "epoch": 2372} {"train_loss": -41.43062210083008, "global_step": 287020, "epoch": 2372} {"train_loss": -43.22957992553711, "global_step": 287021, "epoch": 2372} {"train_loss": -40.60291290283203, "global_step": 287022, "epoch": 2372} {"train_loss": -41.7879753112793, "global_step": 287023, "epoch": 2372} {"train_loss": -41.61750411987305, "global_step": 287024, "epoch": 2372} {"train_loss": -43.01551818847656, "global_step": 287025, "epoch": 2372} {"train_loss": -42.94706344604492, "global_step": 287026, "epoch": 2372} {"train_loss": -38.94419860839844, "global_step": 287027, "epoch": 2372} {"train_loss": -43.30161666870117, "global_step": 287028, "epoch": 2372} {"train_loss": -42.6036376953125, "global_step": 287029, "epoch": 2372} {"train_loss": -42.8425178527832, "global_step": 287030, "epoch": 2372} {"train_loss": -41.420936584472656, "global_step": 287031, "epoch": 2372} {"train_loss": -43.1427116394043, "global_step": 287032, "epoch": 2372} {"train_loss": -42.692501068115234, "global_step": 287033, "epoch": 2372} {"train_loss": -41.6982536315918, "global_step": 287034, "epoch": 2372} {"train_loss": -41.37607955932617, "global_step": 287035, "epoch": 2372} {"train_loss": -41.364013671875, "global_step": 287036, "epoch": 2372} {"train_loss": -40.43109893798828, "global_step": 287037, "epoch": 2372} {"train_loss": -41.080970764160156, "global_step": 287038, "epoch": 2372} {"train_loss": -40.39486312866211, "global_step": 287039, "epoch": 2372} {"train_loss": -42.71187973022461, "global_step": 287040, "epoch": 2372} {"train_loss": -41.81583786010742, "global_step": 287041, "epoch": 2372} {"train_loss": -41.204097747802734, "global_step": 287042, "epoch": 2372} {"train_loss": -41.2345085144043, "global_step": 287043, "epoch": 2372} {"train_loss": -42.325111389160156, "global_step": 287044, "epoch": 2372} {"train_loss": -42.23445510864258, "global_step": 287045, "epoch": 2372} {"train_loss": -41.66704177856445, "global_step": 287046, "epoch": 2372} {"train_loss": -42.763153076171875, "global_step": 287047, "epoch": 2372} {"train_loss": -41.042076110839844, "global_step": 287048, "epoch": 2372} {"train_loss": -40.55888366699219, "global_step": 287049, "epoch": 2372} {"train_loss": -41.13407516479492, "global_step": 287050, "epoch": 2372} {"train_loss": -41.53944778442383, "global_step": 287051, "epoch": 2372} {"train_loss": -41.74473190307617, "global_step": 287052, "epoch": 2372} {"train_loss": -41.975284576416016, "global_step": 287053, "epoch": 2372} {"train_loss": -41.20265197753906, "global_step": 287054, "epoch": 2372} {"train_loss": -39.60060119628906, "global_step": 287055, "epoch": 2372} {"train_loss": -40.8973274230957, "global_step": 287056, "epoch": 2372} {"train_loss": -41.8441047668457, "global_step": 287057, "epoch": 2372} {"train_loss": -42.06673049926758, "global_step": 287058, "epoch": 2372} {"train_loss": -40.68221664428711, "global_step": 287059, "epoch": 2372} {"train_loss": -40.50843048095703, "global_step": 287060, "epoch": 2372} {"train_loss": -42.19587326049805, "global_step": 287061, "epoch": 2372} {"train_loss": -41.66627502441406, "global_step": 287062, "epoch": 2372} {"train_loss": -41.953521728515625, "global_step": 287063, "epoch": 2372} {"train_loss": -42.036163330078125, "global_step": 287064, "epoch": 2372} {"train_loss": -41.53839874267578, "global_step": 287065, "epoch": 2372} {"train_loss": -41.25803756713867, "global_step": 287066, "epoch": 2372} {"train_loss": -42.340484619140625, "global_step": 287067, "epoch": 2372} {"train_loss": -41.94316864013672, "global_step": 287068, "epoch": 2372} {"train_loss": -40.865779876708984, "global_step": 287069, "epoch": 2372} {"train_loss": -41.820858001708984, "global_step": 287070, "epoch": 2372} {"train_loss": -42.40767288208008, "global_step": 287071, "epoch": 2372} {"train_loss": -38.92572784423828, "global_step": 287072, "epoch": 2372} {"train_loss": -41.172237396240234, "global_step": 287073, "epoch": 2372} {"train_loss": -41.62726974487305, "global_step": 287074, "epoch": 2372} {"train_loss": -40.06922912597656, "global_step": 287075, "epoch": 2372} {"train_loss": -42.664405822753906, "global_step": 287076, "epoch": 2372} {"train_loss": -41.79370880126953, "global_step": 287077, "epoch": 2372} {"train_loss": -40.83277130126953, "global_step": 287078, "epoch": 2372} {"train_loss": -41.98133087158203, "global_step": 287079, "epoch": 2372} {"train_loss": -41.3189697265625, "global_step": 287080, "epoch": 2372} {"train_loss": -42.1994743347168, "global_step": 287081, "epoch": 2372} {"train_loss": -41.486629486083984, "global_step": 287082, "epoch": 2372} {"train_loss": -42.277252197265625, "global_step": 287083, "epoch": 2372} {"train_loss": -42.244232177734375, "global_step": 287084, "epoch": 2372} {"train_loss": -41.23098373413086, "global_step": 287085, "epoch": 2372} {"train_loss": -43.19026565551758, "global_step": 287086, "epoch": 2372} {"train_loss": -41.38741683959961, "global_step": 287087, "epoch": 2372} {"train_loss": -42.848140716552734, "global_step": 287088, "epoch": 2372} {"train_loss": -42.0196533203125, "global_step": 287089, "epoch": 2372} {"train_loss": -42.36048126220703, "global_step": 287090, "epoch": 2372} {"train_loss": -42.34273910522461, "global_step": 287091, "epoch": 2372} {"train_loss": -42.1237678527832, "global_step": 287092, "epoch": 2372} {"train_loss": -41.49988555908203, "global_step": 287093, "epoch": 2372} {"train_loss": -41.80094528198242, "global_step": 287094, "epoch": 2372} {"train_loss": -42.06821823120117, "global_step": 287095, "epoch": 2372} {"train_loss": -41.57405471801758, "global_step": 287096, "epoch": 2372} {"train_loss": -42.52731704711914, "global_step": 287097, "epoch": 2372} {"train_loss": -42.140342712402344, "global_step": 287098, "epoch": 2372} {"train_loss": -42.43207931518555, "global_step": 287099, "epoch": 2372} {"train_loss": -41.78359603881836, "global_step": 287100, "epoch": 2372} {"train_loss": -42.63936996459961, "global_step": 287101, "epoch": 2372} {"train_loss": -41.98017501831055, "global_step": 287102, "epoch": 2372} {"train_loss": -42.083168029785156, "global_step": 287103, "epoch": 2372} {"train_loss": -42.55891799926758, "global_step": 287104, "epoch": 2372} {"train_loss": -40.715003967285156, "global_step": 287105, "epoch": 2372} {"train_loss": -42.35023880004883, "global_step": 287106, "epoch": 2372} {"train_loss": -42.37128829956055, "global_step": 287107, "epoch": 2372} {"train_loss": -41.5451545715332, "global_step": 287108, "epoch": 2372} {"train_loss": -42.70810317993164, "global_step": 287109, "epoch": 2372} {"train_loss": -42.09394836425781, "global_step": 287110, "epoch": 2372} {"train_loss": -42.86494064331055, "global_step": 287111, "epoch": 2372} {"train_loss": -42.3697624206543, "global_step": 287112, "epoch": 2372} {"train_loss": -42.67599105834961, "global_step": 287113, "epoch": 2372} {"train_loss": -42.551029205322266, "global_step": 287114, "epoch": 2372} {"train_loss": -42.70862579345703, "global_step": 287115, "epoch": 2372} {"train_loss": -42.14727783203125, "global_step": 287116, "epoch": 2372} {"train_loss": -42.38006591796875, "global_step": 287117, "epoch": 2372} {"train_loss": -43.162269592285156, "global_step": 287118, "epoch": 2372} {"train_loss": -41.711402893066406, "global_step": 287119, "epoch": 2372} {"train_loss": -42.36857223510742, "global_step": 287120, "epoch": 2372} {"train_loss": -41.60258865356445, "global_step": 287121, "epoch": 2372} {"train_loss": -42.677608489990234, "global_step": 287122, "epoch": 2372} {"train_loss": -42.71668243408203, "global_step": 287123, "epoch": 2372} {"train_loss": -42.62465286254883, "global_step": 287124, "epoch": 2372} {"train_loss": -42.359375, "global_step": 287125, "epoch": 2372} {"train_loss": -42.9249382019043, "global_step": 287126, "epoch": 2372} {"train_loss": -42.936580657958984, "global_step": 287127, "epoch": 2372} {"train_loss": -41.3990364074707, "global_step": 287128, "epoch": 2372} {"train_loss": -43.166561126708984, "global_step": 287129, "epoch": 2372} {"train_loss": -42.72095489501953, "global_step": 287130, "epoch": 2372} {"train_loss": -42.668941497802734, "global_step": 287131, "epoch": 2372} {"train_loss": -41.90687258381489, "global_step": 287132, "epoch": 2372, "val_loss": 2511299.25} {"train_loss": -43.01144027709961, "global_step": 287133, "epoch": 2373} {"train_loss": -42.31751251220703, "global_step": 287134, "epoch": 2373} {"train_loss": -41.805633544921875, "global_step": 287135, "epoch": 2373} {"train_loss": -43.269100189208984, "global_step": 287136, "epoch": 2373} {"train_loss": -41.90812301635742, "global_step": 287137, "epoch": 2373} {"train_loss": -42.611236572265625, "global_step": 287138, "epoch": 2373} {"train_loss": -42.72743606567383, "global_step": 287139, "epoch": 2373} {"train_loss": -43.26186752319336, "global_step": 287140, "epoch": 2373} {"train_loss": -43.43606185913086, "global_step": 287141, "epoch": 2373} {"train_loss": -43.07731246948242, "global_step": 287142, "epoch": 2373} {"train_loss": -43.32650375366211, "global_step": 287143, "epoch": 2373} {"train_loss": -43.11977767944336, "global_step": 287144, "epoch": 2373} {"train_loss": -43.05632781982422, "global_step": 287145, "epoch": 2373} {"train_loss": -42.648189544677734, "global_step": 287146, "epoch": 2373} {"train_loss": -42.30847930908203, "global_step": 287147, "epoch": 2373} {"train_loss": -39.920166015625, "global_step": 287148, "epoch": 2373} {"train_loss": -31.768665313720703, "global_step": 287149, "epoch": 2373} {"train_loss": -27.203948974609375, "global_step": 287150, "epoch": 2373} {"train_loss": -28.084457397460938, "global_step": 287151, "epoch": 2373} {"train_loss": -37.64689254760742, "global_step": 287152, "epoch": 2373} {"train_loss": -41.61210250854492, "global_step": 287153, "epoch": 2373} {"train_loss": -40.89208984375, "global_step": 287154, "epoch": 2373} {"train_loss": -38.08915328979492, "global_step": 287155, "epoch": 2373} {"train_loss": -41.27222442626953, "global_step": 287156, "epoch": 2373} {"train_loss": -40.57756423950195, "global_step": 287157, "epoch": 2373} {"train_loss": -40.661865234375, "global_step": 287158, "epoch": 2373} {"train_loss": -41.97793197631836, "global_step": 287159, "epoch": 2373} {"train_loss": -42.06608200073242, "global_step": 287160, "epoch": 2373} {"train_loss": -41.25059127807617, "global_step": 287161, "epoch": 2373} {"train_loss": -41.0443229675293, "global_step": 287162, "epoch": 2373} {"train_loss": -41.63882827758789, "global_step": 287163, "epoch": 2373} {"train_loss": -41.89339065551758, "global_step": 287164, "epoch": 2373} {"train_loss": -41.853187561035156, "global_step": 287165, "epoch": 2373} {"train_loss": -41.980621337890625, "global_step": 287166, "epoch": 2373} {"train_loss": -41.78296661376953, "global_step": 287167, "epoch": 2373} {"train_loss": -40.79868698120117, "global_step": 287168, "epoch": 2373} {"train_loss": -41.90101623535156, "global_step": 287169, "epoch": 2373} {"train_loss": -42.15835189819336, "global_step": 287170, "epoch": 2373} {"train_loss": -41.96403884887695, "global_step": 287171, "epoch": 2373} {"train_loss": -42.98124313354492, "global_step": 287172, "epoch": 2373} {"train_loss": -40.64915084838867, "global_step": 287173, "epoch": 2373} {"train_loss": -42.59754180908203, "global_step": 287174, "epoch": 2373} {"train_loss": -41.01161193847656, "global_step": 287175, "epoch": 2373} {"train_loss": -42.67263412475586, "global_step": 287176, "epoch": 2373} {"train_loss": -41.66172409057617, "global_step": 287177, "epoch": 2373} {"train_loss": -42.617794036865234, "global_step": 287178, "epoch": 2373} {"train_loss": -42.60532760620117, "global_step": 287179, "epoch": 2373} {"train_loss": -42.66596221923828, "global_step": 287180, "epoch": 2373} {"train_loss": -42.61945724487305, "global_step": 287181, "epoch": 2373} {"train_loss": -42.672706604003906, "global_step": 287182, "epoch": 2373} {"train_loss": -43.01091384887695, "global_step": 287183, "epoch": 2373} {"train_loss": -43.24885177612305, "global_step": 287184, "epoch": 2373} {"train_loss": -42.55351638793945, "global_step": 287185, "epoch": 2373} {"train_loss": -43.13763427734375, "global_step": 287186, "epoch": 2373} {"train_loss": -43.34428024291992, "global_step": 287187, "epoch": 2373} {"train_loss": -43.04878616333008, "global_step": 287188, "epoch": 2373} {"train_loss": -43.10798263549805, "global_step": 287189, "epoch": 2373} {"train_loss": -43.3068962097168, "global_step": 287190, "epoch": 2373} {"train_loss": -42.6087646484375, "global_step": 287191, "epoch": 2373} {"train_loss": -43.07158279418945, "global_step": 287192, "epoch": 2373} {"train_loss": -43.06916809082031, "global_step": 287193, "epoch": 2373} {"train_loss": -43.36635208129883, "global_step": 287194, "epoch": 2373} {"train_loss": -42.3922004699707, "global_step": 287195, "epoch": 2373} {"train_loss": -43.40467071533203, "global_step": 287196, "epoch": 2373} {"train_loss": -43.47758102416992, "global_step": 287197, "epoch": 2373} {"train_loss": -43.05641555786133, "global_step": 287198, "epoch": 2373} {"train_loss": -42.83952713012695, "global_step": 287199, "epoch": 2373} {"train_loss": -43.50446701049805, "global_step": 287200, "epoch": 2373} {"train_loss": -43.313533782958984, "global_step": 287201, "epoch": 2373} {"train_loss": -43.4880485534668, "global_step": 287202, "epoch": 2373} {"train_loss": -43.28449249267578, "global_step": 287203, "epoch": 2373} {"train_loss": -43.267913818359375, "global_step": 287204, "epoch": 2373} {"train_loss": -43.5125846862793, "global_step": 287205, "epoch": 2373} {"train_loss": -43.11389923095703, "global_step": 287206, "epoch": 2373} {"train_loss": -43.51770782470703, "global_step": 287207, "epoch": 2373} {"train_loss": -43.65122604370117, "global_step": 287208, "epoch": 2373} {"train_loss": -43.68585968017578, "global_step": 287209, "epoch": 2373} {"train_loss": -43.72651672363281, "global_step": 287210, "epoch": 2373} {"train_loss": -43.54579544067383, "global_step": 287211, "epoch": 2373} {"train_loss": -43.261775970458984, "global_step": 287212, "epoch": 2373} {"train_loss": -44.00816345214844, "global_step": 287213, "epoch": 2373} {"train_loss": -42.92473602294922, "global_step": 287214, "epoch": 2373} {"train_loss": -42.91596221923828, "global_step": 287215, "epoch": 2373} {"train_loss": -43.538021087646484, "global_step": 287216, "epoch": 2373} {"train_loss": -43.77376174926758, "global_step": 287217, "epoch": 2373} {"train_loss": -42.618797302246094, "global_step": 287218, "epoch": 2373} {"train_loss": -42.7087287902832, "global_step": 287219, "epoch": 2373} {"train_loss": -43.0511589050293, "global_step": 287220, "epoch": 2373} {"train_loss": -42.97170639038086, "global_step": 287221, "epoch": 2373} {"train_loss": -43.173282623291016, "global_step": 287222, "epoch": 2373} {"train_loss": -43.31766891479492, "global_step": 287223, "epoch": 2373} {"train_loss": -43.73154830932617, "global_step": 287224, "epoch": 2373} {"train_loss": -43.794124603271484, "global_step": 287225, "epoch": 2373} {"train_loss": -43.96018981933594, "global_step": 287226, "epoch": 2373} {"train_loss": -42.57304763793945, "global_step": 287227, "epoch": 2373} {"train_loss": -43.6512565612793, "global_step": 287228, "epoch": 2373} {"train_loss": -43.83442306518555, "global_step": 287229, "epoch": 2373} {"train_loss": -43.71760177612305, "global_step": 287230, "epoch": 2373} {"train_loss": -42.690975189208984, "global_step": 287231, "epoch": 2373} {"train_loss": -43.3184700012207, "global_step": 287232, "epoch": 2373} {"train_loss": -42.21893310546875, "global_step": 287233, "epoch": 2373} {"train_loss": -42.59995651245117, "global_step": 287234, "epoch": 2373} {"train_loss": -42.944679260253906, "global_step": 287235, "epoch": 2373} {"train_loss": -43.18776321411133, "global_step": 287236, "epoch": 2373} {"train_loss": -42.62987518310547, "global_step": 287237, "epoch": 2373} {"train_loss": -42.77867126464844, "global_step": 287238, "epoch": 2373} {"train_loss": -42.24129867553711, "global_step": 287239, "epoch": 2373} {"train_loss": -39.339324951171875, "global_step": 287240, "epoch": 2373} {"train_loss": -34.14241027832031, "global_step": 287241, "epoch": 2373} {"train_loss": -25.058135986328125, "global_step": 287242, "epoch": 2373} {"train_loss": -18.465229034423828, "global_step": 287243, "epoch": 2373} {"train_loss": -23.800186157226562, "global_step": 287244, "epoch": 2373} {"train_loss": -40.02248764038086, "global_step": 287245, "epoch": 2373} {"train_loss": -33.51959228515625, "global_step": 287246, "epoch": 2373} {"train_loss": -30.652902603149414, "global_step": 287247, "epoch": 2373} {"train_loss": -38.83872985839844, "global_step": 287248, "epoch": 2373} {"train_loss": -31.45458984375, "global_step": 287249, "epoch": 2373} {"train_loss": -36.536766052246094, "global_step": 287250, "epoch": 2373} {"train_loss": -37.70769119262695, "global_step": 287251, "epoch": 2373} {"train_loss": -37.944129943847656, "global_step": 287252, "epoch": 2373} {"train_loss": -41.20209630855844, "global_step": 287253, "epoch": 2373, "val_loss": 2374867.0} {"train_loss": -38.91274642944336, "global_step": 287254, "epoch": 2374} {"train_loss": -39.63866424560547, "global_step": 287255, "epoch": 2374} {"train_loss": -39.39779281616211, "global_step": 287256, "epoch": 2374} {"train_loss": -40.14121627807617, "global_step": 287257, "epoch": 2374} {"train_loss": -39.96158981323242, "global_step": 287258, "epoch": 2374} {"train_loss": -41.04497146606445, "global_step": 287259, "epoch": 2374} {"train_loss": -40.370750427246094, "global_step": 287260, "epoch": 2374} {"train_loss": -41.294490814208984, "global_step": 287261, "epoch": 2374} {"train_loss": -41.679420471191406, "global_step": 287262, "epoch": 2374} {"train_loss": -41.32666778564453, "global_step": 287263, "epoch": 2374} {"train_loss": -39.73508071899414, "global_step": 287264, "epoch": 2374} {"train_loss": -39.40813064575195, "global_step": 287265, "epoch": 2374} {"train_loss": -41.873592376708984, "global_step": 287266, "epoch": 2374} {"train_loss": -40.35897445678711, "global_step": 287267, "epoch": 2374} {"train_loss": -41.218685150146484, "global_step": 287268, "epoch": 2374} {"train_loss": -41.8382453918457, "global_step": 287269, "epoch": 2374} {"train_loss": -40.570220947265625, "global_step": 287270, "epoch": 2374} {"train_loss": -41.419219970703125, "global_step": 287271, "epoch": 2374} {"train_loss": -41.94552230834961, "global_step": 287272, "epoch": 2374} {"train_loss": -41.73271560668945, "global_step": 287273, "epoch": 2374} {"train_loss": -41.927154541015625, "global_step": 287274, "epoch": 2374} {"train_loss": -41.884517669677734, "global_step": 287275, "epoch": 2374} {"train_loss": -41.763248443603516, "global_step": 287276, "epoch": 2374} {"train_loss": -42.02499008178711, "global_step": 287277, "epoch": 2374} {"train_loss": -41.91981887817383, "global_step": 287278, "epoch": 2374} {"train_loss": -42.12989044189453, "global_step": 287279, "epoch": 2374} {"train_loss": -42.24025344848633, "global_step": 287280, "epoch": 2374} {"train_loss": -41.93475341796875, "global_step": 287281, "epoch": 2374} {"train_loss": -42.577301025390625, "global_step": 287282, "epoch": 2374} {"train_loss": -42.23679733276367, "global_step": 287283, "epoch": 2374} {"train_loss": -42.55880355834961, "global_step": 287284, "epoch": 2374} {"train_loss": -42.317176818847656, "global_step": 287285, "epoch": 2374} {"train_loss": -41.68965530395508, "global_step": 287286, "epoch": 2374} {"train_loss": -42.84663009643555, "global_step": 287287, "epoch": 2374} {"train_loss": -42.5870361328125, "global_step": 287288, "epoch": 2374} {"train_loss": -42.49972152709961, "global_step": 287289, "epoch": 2374} {"train_loss": -41.87222671508789, "global_step": 287290, "epoch": 2374} {"train_loss": -41.65644454956055, "global_step": 287291, "epoch": 2374} {"train_loss": -42.76104736328125, "global_step": 287292, "epoch": 2374} {"train_loss": -42.9473762512207, "global_step": 287293, "epoch": 2374} {"train_loss": -42.49546813964844, "global_step": 287294, "epoch": 2374} {"train_loss": -42.766319274902344, "global_step": 287295, "epoch": 2374} {"train_loss": -42.598506927490234, "global_step": 287296, "epoch": 2374} {"train_loss": -43.3338508605957, "global_step": 287297, "epoch": 2374} {"train_loss": -42.64011764526367, "global_step": 287298, "epoch": 2374} {"train_loss": -43.35305404663086, "global_step": 287299, "epoch": 2374} {"train_loss": -43.30131149291992, "global_step": 287300, "epoch": 2374} {"train_loss": -42.414241790771484, "global_step": 287301, "epoch": 2374} {"train_loss": -42.80304718017578, "global_step": 287302, "epoch": 2374} {"train_loss": -42.735652923583984, "global_step": 287303, "epoch": 2374} {"train_loss": -43.061214447021484, "global_step": 287304, "epoch": 2374} {"train_loss": -42.338348388671875, "global_step": 287305, "epoch": 2374} {"train_loss": -43.1904296875, "global_step": 287306, "epoch": 2374} {"train_loss": -43.500308990478516, "global_step": 287307, "epoch": 2374} {"train_loss": -42.727630615234375, "global_step": 287308, "epoch": 2374} {"train_loss": -43.582820892333984, "global_step": 287309, "epoch": 2374} {"train_loss": -42.19535446166992, "global_step": 287310, "epoch": 2374} {"train_loss": -43.58085250854492, "global_step": 287311, "epoch": 2374} {"train_loss": -42.9331169128418, "global_step": 287312, "epoch": 2374} {"train_loss": -42.93394088745117, "global_step": 287313, "epoch": 2374} {"train_loss": -43.39490509033203, "global_step": 287314, "epoch": 2374} {"train_loss": -43.140594482421875, "global_step": 287315, "epoch": 2374} {"train_loss": -43.4036865234375, "global_step": 287316, "epoch": 2374} {"train_loss": -43.79540252685547, "global_step": 287317, "epoch": 2374} {"train_loss": -43.78767776489258, "global_step": 287318, "epoch": 2374} {"train_loss": -44.0195426940918, "global_step": 287319, "epoch": 2374} {"train_loss": -43.23602294921875, "global_step": 287320, "epoch": 2374} {"train_loss": -43.42698669433594, "global_step": 287321, "epoch": 2374} {"train_loss": -43.64430236816406, "global_step": 287322, "epoch": 2374} {"train_loss": -43.92483139038086, "global_step": 287323, "epoch": 2374} {"train_loss": -43.31385040283203, "global_step": 287324, "epoch": 2374} {"train_loss": -44.01491928100586, "global_step": 287325, "epoch": 2374} {"train_loss": -43.764713287353516, "global_step": 287326, "epoch": 2374} {"train_loss": -43.61176681518555, "global_step": 287327, "epoch": 2374} {"train_loss": -43.75362777709961, "global_step": 287328, "epoch": 2374} {"train_loss": -43.63562774658203, "global_step": 287329, "epoch": 2374} {"train_loss": -44.198150634765625, "global_step": 287330, "epoch": 2374} {"train_loss": -44.003814697265625, "global_step": 287331, "epoch": 2374} {"train_loss": -43.297584533691406, "global_step": 287332, "epoch": 2374} {"train_loss": -43.57557678222656, "global_step": 287333, "epoch": 2374} {"train_loss": -43.73916244506836, "global_step": 287334, "epoch": 2374} {"train_loss": -43.79783248901367, "global_step": 287335, "epoch": 2374} {"train_loss": -43.640960693359375, "global_step": 287336, "epoch": 2374} {"train_loss": -43.59449005126953, "global_step": 287337, "epoch": 2374} {"train_loss": -44.07297897338867, "global_step": 287338, "epoch": 2374} {"train_loss": -43.140926361083984, "global_step": 287339, "epoch": 2374} {"train_loss": -44.1345329284668, "global_step": 287340, "epoch": 2374} {"train_loss": -43.571712493896484, "global_step": 287341, "epoch": 2374} {"train_loss": -43.089412689208984, "global_step": 287342, "epoch": 2374} {"train_loss": -43.76420211791992, "global_step": 287343, "epoch": 2374} {"train_loss": -43.46881103515625, "global_step": 287344, "epoch": 2374} {"train_loss": -43.800018310546875, "global_step": 287345, "epoch": 2374} {"train_loss": -43.42414474487305, "global_step": 287346, "epoch": 2374} {"train_loss": -42.13534164428711, "global_step": 287347, "epoch": 2374} {"train_loss": -43.701576232910156, "global_step": 287348, "epoch": 2374} {"train_loss": -43.470458984375, "global_step": 287349, "epoch": 2374} {"train_loss": -43.836761474609375, "global_step": 287350, "epoch": 2374} {"train_loss": -43.59446716308594, "global_step": 287351, "epoch": 2374} {"train_loss": -43.25687789916992, "global_step": 287352, "epoch": 2374} {"train_loss": -43.486053466796875, "global_step": 287353, "epoch": 2374} {"train_loss": -43.325435638427734, "global_step": 287354, "epoch": 2374} {"train_loss": -43.0639533996582, "global_step": 287355, "epoch": 2374} {"train_loss": -44.009498596191406, "global_step": 287356, "epoch": 2374} {"train_loss": -44.0171012878418, "global_step": 287357, "epoch": 2374} {"train_loss": -43.81139373779297, "global_step": 287358, "epoch": 2374} {"train_loss": -43.91944122314453, "global_step": 287359, "epoch": 2374} {"train_loss": -43.77082443237305, "global_step": 287360, "epoch": 2374} {"train_loss": -42.911190032958984, "global_step": 287361, "epoch": 2374} {"train_loss": -42.76527786254883, "global_step": 287362, "epoch": 2374} {"train_loss": -42.324214935302734, "global_step": 287363, "epoch": 2374} {"train_loss": -43.80717849731445, "global_step": 287364, "epoch": 2374} {"train_loss": -43.3417854309082, "global_step": 287365, "epoch": 2374} {"train_loss": -41.93856430053711, "global_step": 287366, "epoch": 2374} {"train_loss": -42.3494987487793, "global_step": 287367, "epoch": 2374} {"train_loss": -42.17424392700195, "global_step": 287368, "epoch": 2374} {"train_loss": -43.53633117675781, "global_step": 287369, "epoch": 2374} {"train_loss": -43.3858642578125, "global_step": 287370, "epoch": 2374} {"train_loss": -43.273990631103516, "global_step": 287371, "epoch": 2374} {"train_loss": -42.97518539428711, "global_step": 287372, "epoch": 2374} {"train_loss": -41.85903549194336, "global_step": 287373, "epoch": 2374} {"train_loss": -42.6729000186132, "global_step": 287374, "epoch": 2374, "val_loss": 2465787.75} {"train_loss": -43.614315032958984, "global_step": 287375, "epoch": 2375} {"train_loss": -41.4410285949707, "global_step": 287376, "epoch": 2375} {"train_loss": -39.603511810302734, "global_step": 287377, "epoch": 2375} {"train_loss": -41.894073486328125, "global_step": 287378, "epoch": 2375} {"train_loss": -42.49154281616211, "global_step": 287379, "epoch": 2375} {"train_loss": -42.82416915893555, "global_step": 287380, "epoch": 2375} {"train_loss": -43.276424407958984, "global_step": 287381, "epoch": 2375} {"train_loss": -42.62323760986328, "global_step": 287382, "epoch": 2375} {"train_loss": -42.71588134765625, "global_step": 287383, "epoch": 2375} {"train_loss": -42.15859603881836, "global_step": 287384, "epoch": 2375} {"train_loss": -43.303592681884766, "global_step": 287385, "epoch": 2375} {"train_loss": -42.95854568481445, "global_step": 287386, "epoch": 2375} {"train_loss": -43.13772964477539, "global_step": 287387, "epoch": 2375} {"train_loss": -42.86781692504883, "global_step": 287388, "epoch": 2375} {"train_loss": -42.92841339111328, "global_step": 287389, "epoch": 2375} {"train_loss": -43.7276496887207, "global_step": 287390, "epoch": 2375} {"train_loss": -43.36812210083008, "global_step": 287391, "epoch": 2375} {"train_loss": -43.25020980834961, "global_step": 287392, "epoch": 2375} {"train_loss": -43.65375900268555, "global_step": 287393, "epoch": 2375} {"train_loss": -43.33645248413086, "global_step": 287394, "epoch": 2375} {"train_loss": -43.46937942504883, "global_step": 287395, "epoch": 2375} {"train_loss": -43.55835723876953, "global_step": 287396, "epoch": 2375} {"train_loss": -42.86346435546875, "global_step": 287397, "epoch": 2375} {"train_loss": -42.74857711791992, "global_step": 287398, "epoch": 2375} {"train_loss": -43.03379821777344, "global_step": 287399, "epoch": 2375} {"train_loss": -43.02704620361328, "global_step": 287400, "epoch": 2375} {"train_loss": -42.6884880065918, "global_step": 287401, "epoch": 2375} {"train_loss": -42.106197357177734, "global_step": 287402, "epoch": 2375} {"train_loss": -43.14420700073242, "global_step": 287403, "epoch": 2375} {"train_loss": -41.87891387939453, "global_step": 287404, "epoch": 2375} {"train_loss": -40.659645080566406, "global_step": 287405, "epoch": 2375} {"train_loss": -42.49851608276367, "global_step": 287406, "epoch": 2375} {"train_loss": -41.93286895751953, "global_step": 287407, "epoch": 2375} {"train_loss": -41.85805892944336, "global_step": 287408, "epoch": 2375} {"train_loss": -40.94306564331055, "global_step": 287409, "epoch": 2375} {"train_loss": -40.98928451538086, "global_step": 287410, "epoch": 2375} {"train_loss": -38.308502197265625, "global_step": 287411, "epoch": 2375} {"train_loss": -41.85652542114258, "global_step": 287412, "epoch": 2375} {"train_loss": -42.78510665893555, "global_step": 287413, "epoch": 2375} {"train_loss": -41.68524169921875, "global_step": 287414, "epoch": 2375} {"train_loss": -41.94428634643555, "global_step": 287415, "epoch": 2375} {"train_loss": -42.13821029663086, "global_step": 287416, "epoch": 2375} {"train_loss": -41.74607467651367, "global_step": 287417, "epoch": 2375} {"train_loss": -42.993587493896484, "global_step": 287418, "epoch": 2375} {"train_loss": -41.65069580078125, "global_step": 287419, "epoch": 2375} {"train_loss": -42.519081115722656, "global_step": 287420, "epoch": 2375} {"train_loss": -42.67974853515625, "global_step": 287421, "epoch": 2375} {"train_loss": -42.23284149169922, "global_step": 287422, "epoch": 2375} {"train_loss": -42.84955978393555, "global_step": 287423, "epoch": 2375} {"train_loss": -42.6702766418457, "global_step": 287424, "epoch": 2375} {"train_loss": -43.58612823486328, "global_step": 287425, "epoch": 2375} {"train_loss": -43.2313346862793, "global_step": 287426, "epoch": 2375} {"train_loss": -42.62052917480469, "global_step": 287427, "epoch": 2375} {"train_loss": -42.45478439331055, "global_step": 287428, "epoch": 2375} {"train_loss": -43.25221252441406, "global_step": 287429, "epoch": 2375} {"train_loss": -42.572357177734375, "global_step": 287430, "epoch": 2375} {"train_loss": -41.9375114440918, "global_step": 287431, "epoch": 2375} {"train_loss": -43.07259750366211, "global_step": 287432, "epoch": 2375} {"train_loss": -42.89170455932617, "global_step": 287433, "epoch": 2375} {"train_loss": -41.580299377441406, "global_step": 287434, "epoch": 2375} {"train_loss": -43.04441833496094, "global_step": 287435, "epoch": 2375} {"train_loss": -42.531681060791016, "global_step": 287436, "epoch": 2375} {"train_loss": -42.03596878051758, "global_step": 287437, "epoch": 2375} {"train_loss": -41.986000061035156, "global_step": 287438, "epoch": 2375} {"train_loss": -42.015357971191406, "global_step": 287439, "epoch": 2375} {"train_loss": -43.4827995300293, "global_step": 287440, "epoch": 2375} {"train_loss": -42.472198486328125, "global_step": 287441, "epoch": 2375} {"train_loss": -42.82173538208008, "global_step": 287442, "epoch": 2375} {"train_loss": -42.51308059692383, "global_step": 287443, "epoch": 2375} {"train_loss": -43.12250900268555, "global_step": 287444, "epoch": 2375} {"train_loss": -42.375953674316406, "global_step": 287445, "epoch": 2375} {"train_loss": -42.75554275512695, "global_step": 287446, "epoch": 2375} {"train_loss": -42.31528854370117, "global_step": 287447, "epoch": 2375} {"train_loss": -41.871212005615234, "global_step": 287448, "epoch": 2375} {"train_loss": -42.78117752075195, "global_step": 287449, "epoch": 2375} {"train_loss": -41.557403564453125, "global_step": 287450, "epoch": 2375} {"train_loss": -42.496212005615234, "global_step": 287451, "epoch": 2375} {"train_loss": -42.77223587036133, "global_step": 287452, "epoch": 2375} {"train_loss": -43.636409759521484, "global_step": 287453, "epoch": 2375} {"train_loss": -42.42655563354492, "global_step": 287454, "epoch": 2375} {"train_loss": -43.387908935546875, "global_step": 287455, "epoch": 2375} {"train_loss": -43.05472946166992, "global_step": 287456, "epoch": 2375} {"train_loss": -43.51894760131836, "global_step": 287457, "epoch": 2375} {"train_loss": -42.4614372253418, "global_step": 287458, "epoch": 2375} {"train_loss": -43.47259521484375, "global_step": 287459, "epoch": 2375} {"train_loss": -43.08384323120117, "global_step": 287460, "epoch": 2375} {"train_loss": -42.32204055786133, "global_step": 287461, "epoch": 2375} {"train_loss": -43.05959701538086, "global_step": 287462, "epoch": 2375} {"train_loss": -43.54884719848633, "global_step": 287463, "epoch": 2375} {"train_loss": -41.662315368652344, "global_step": 287464, "epoch": 2375} {"train_loss": -42.627254486083984, "global_step": 287465, "epoch": 2375} {"train_loss": -42.63399887084961, "global_step": 287466, "epoch": 2375} {"train_loss": -42.83159637451172, "global_step": 287467, "epoch": 2375} {"train_loss": -42.76117706298828, "global_step": 287468, "epoch": 2375} {"train_loss": -43.53290939331055, "global_step": 287469, "epoch": 2375} {"train_loss": -42.672264099121094, "global_step": 287470, "epoch": 2375} {"train_loss": -43.17227554321289, "global_step": 287471, "epoch": 2375} {"train_loss": -43.304168701171875, "global_step": 287472, "epoch": 2375} {"train_loss": -42.776973724365234, "global_step": 287473, "epoch": 2375} {"train_loss": -42.003204345703125, "global_step": 287474, "epoch": 2375} {"train_loss": -41.82307052612305, "global_step": 287475, "epoch": 2375} {"train_loss": -41.80522537231445, "global_step": 287476, "epoch": 2375} {"train_loss": -43.28242874145508, "global_step": 287477, "epoch": 2375} {"train_loss": -43.01087188720703, "global_step": 287478, "epoch": 2375} {"train_loss": -43.515846252441406, "global_step": 287479, "epoch": 2375} {"train_loss": -42.96331787109375, "global_step": 287480, "epoch": 2375} {"train_loss": -43.466156005859375, "global_step": 287481, "epoch": 2375} {"train_loss": -43.15330123901367, "global_step": 287482, "epoch": 2375} {"train_loss": -40.264896392822266, "global_step": 287483, "epoch": 2375} {"train_loss": -43.37646484375, "global_step": 287484, "epoch": 2375} {"train_loss": -42.36893844604492, "global_step": 287485, "epoch": 2375} {"train_loss": -42.89252853393555, "global_step": 287486, "epoch": 2375} {"train_loss": -43.08610153198242, "global_step": 287487, "epoch": 2375} {"train_loss": -43.622440338134766, "global_step": 287488, "epoch": 2375} {"train_loss": -43.449623107910156, "global_step": 287489, "epoch": 2375} {"train_loss": -43.61250686645508, "global_step": 287490, "epoch": 2375} {"train_loss": -43.75492477416992, "global_step": 287491, "epoch": 2375} {"train_loss": -42.82487106323242, "global_step": 287492, "epoch": 2375} {"train_loss": -42.19443130493164, "global_step": 287493, "epoch": 2375} {"train_loss": -43.282081604003906, "global_step": 287494, "epoch": 2375} {"train_loss": -42.60814420841942, "global_step": 287495, "epoch": 2375, "val_loss": 2469768.25} {"train_loss": -41.47737121582031, "global_step": 287496, "epoch": 2376} {"train_loss": -43.11520767211914, "global_step": 287497, "epoch": 2376} {"train_loss": -42.52515411376953, "global_step": 287498, "epoch": 2376} {"train_loss": -41.31732177734375, "global_step": 287499, "epoch": 2376} {"train_loss": -43.1565055847168, "global_step": 287500, "epoch": 2376} {"train_loss": -43.04076385498047, "global_step": 287501, "epoch": 2376} {"train_loss": -43.798274993896484, "global_step": 287502, "epoch": 2376} {"train_loss": -43.67006301879883, "global_step": 287503, "epoch": 2376} {"train_loss": -40.939849853515625, "global_step": 287504, "epoch": 2376} {"train_loss": -43.58838653564453, "global_step": 287505, "epoch": 2376} {"train_loss": -43.79258728027344, "global_step": 287506, "epoch": 2376} {"train_loss": -42.334503173828125, "global_step": 287507, "epoch": 2376} {"train_loss": -42.24029541015625, "global_step": 287508, "epoch": 2376} {"train_loss": -43.44929504394531, "global_step": 287509, "epoch": 2376} {"train_loss": -40.34330368041992, "global_step": 287510, "epoch": 2376} {"train_loss": -40.458377838134766, "global_step": 287511, "epoch": 2376} {"train_loss": -43.61161422729492, "global_step": 287512, "epoch": 2376} {"train_loss": -42.110877990722656, "global_step": 287513, "epoch": 2376} {"train_loss": -43.68299102783203, "global_step": 287514, "epoch": 2376} {"train_loss": -42.604461669921875, "global_step": 287515, "epoch": 2376} {"train_loss": -42.8319206237793, "global_step": 287516, "epoch": 2376} {"train_loss": -41.58590316772461, "global_step": 287517, "epoch": 2376} {"train_loss": -39.96104049682617, "global_step": 287518, "epoch": 2376} {"train_loss": -38.6761589050293, "global_step": 287519, "epoch": 2376} {"train_loss": -41.97550582885742, "global_step": 287520, "epoch": 2376} {"train_loss": -42.22080612182617, "global_step": 287521, "epoch": 2376} {"train_loss": -40.70653533935547, "global_step": 287522, "epoch": 2376} {"train_loss": -39.901180267333984, "global_step": 287523, "epoch": 2376} {"train_loss": -41.85858154296875, "global_step": 287524, "epoch": 2376} {"train_loss": -38.53178024291992, "global_step": 287525, "epoch": 2376} {"train_loss": -42.97003936767578, "global_step": 287526, "epoch": 2376} {"train_loss": -40.1002311706543, "global_step": 287527, "epoch": 2376} {"train_loss": -37.37586212158203, "global_step": 287528, "epoch": 2376} {"train_loss": -40.804054260253906, "global_step": 287529, "epoch": 2376} {"train_loss": -35.62616729736328, "global_step": 287530, "epoch": 2376} {"train_loss": -40.40909957885742, "global_step": 287531, "epoch": 2376} {"train_loss": -40.417240142822266, "global_step": 287532, "epoch": 2376} {"train_loss": -37.920875549316406, "global_step": 287533, "epoch": 2376} {"train_loss": -40.307762145996094, "global_step": 287534, "epoch": 2376} {"train_loss": -36.54608154296875, "global_step": 287535, "epoch": 2376} {"train_loss": -37.54313278198242, "global_step": 287536, "epoch": 2376} {"train_loss": -35.82171630859375, "global_step": 287537, "epoch": 2376} {"train_loss": -38.679195404052734, "global_step": 287538, "epoch": 2376} {"train_loss": -38.099327087402344, "global_step": 287539, "epoch": 2376} {"train_loss": -40.120845794677734, "global_step": 287540, "epoch": 2376} {"train_loss": -36.8098258972168, "global_step": 287541, "epoch": 2376} {"train_loss": -39.24074935913086, "global_step": 287542, "epoch": 2376} {"train_loss": -40.105743408203125, "global_step": 287543, "epoch": 2376} {"train_loss": -40.65568161010742, "global_step": 287544, "epoch": 2376} {"train_loss": -34.007293701171875, "global_step": 287545, "epoch": 2376} {"train_loss": -37.75284194946289, "global_step": 287546, "epoch": 2376} {"train_loss": -38.34572219848633, "global_step": 287547, "epoch": 2376} {"train_loss": -38.90150833129883, "global_step": 287548, "epoch": 2376} {"train_loss": -38.607688903808594, "global_step": 287549, "epoch": 2376} {"train_loss": -38.85438919067383, "global_step": 287550, "epoch": 2376} {"train_loss": -39.177520751953125, "global_step": 287551, "epoch": 2376} {"train_loss": -38.33525466918945, "global_step": 287552, "epoch": 2376} {"train_loss": -39.85650634765625, "global_step": 287553, "epoch": 2376} {"train_loss": -40.892608642578125, "global_step": 287554, "epoch": 2376} {"train_loss": -40.006832122802734, "global_step": 287555, "epoch": 2376} {"train_loss": -33.388938903808594, "global_step": 287556, "epoch": 2376} {"train_loss": -40.49387741088867, "global_step": 287557, "epoch": 2376} {"train_loss": -40.60805892944336, "global_step": 287558, "epoch": 2376} {"train_loss": -39.416744232177734, "global_step": 287559, "epoch": 2376} {"train_loss": -37.696136474609375, "global_step": 287560, "epoch": 2376} {"train_loss": -40.239158630371094, "global_step": 287561, "epoch": 2376} {"train_loss": -39.92671203613281, "global_step": 287562, "epoch": 2376} {"train_loss": -39.43947982788086, "global_step": 287563, "epoch": 2376} {"train_loss": -40.2209587097168, "global_step": 287564, "epoch": 2376} {"train_loss": -40.06367492675781, "global_step": 287565, "epoch": 2376} {"train_loss": -38.85041046142578, "global_step": 287566, "epoch": 2376} {"train_loss": -39.909706115722656, "global_step": 287567, "epoch": 2376} {"train_loss": -41.391639709472656, "global_step": 287568, "epoch": 2376} {"train_loss": -36.10268783569336, "global_step": 287569, "epoch": 2376} {"train_loss": -39.8064079284668, "global_step": 287570, "epoch": 2376} {"train_loss": -41.878326416015625, "global_step": 287571, "epoch": 2376} {"train_loss": -40.648780822753906, "global_step": 287572, "epoch": 2376} {"train_loss": -40.342281341552734, "global_step": 287573, "epoch": 2376} {"train_loss": -41.17607116699219, "global_step": 287574, "epoch": 2376} {"train_loss": -41.51127243041992, "global_step": 287575, "epoch": 2376} {"train_loss": -41.535274505615234, "global_step": 287576, "epoch": 2376} {"train_loss": -39.359981536865234, "global_step": 287577, "epoch": 2376} {"train_loss": -41.465675354003906, "global_step": 287578, "epoch": 2376} {"train_loss": -41.713287353515625, "global_step": 287579, "epoch": 2376} {"train_loss": -40.40227127075195, "global_step": 287580, "epoch": 2376} {"train_loss": -41.26687240600586, "global_step": 287581, "epoch": 2376} {"train_loss": -39.21504211425781, "global_step": 287582, "epoch": 2376} {"train_loss": -40.52655792236328, "global_step": 287583, "epoch": 2376} {"train_loss": -41.30796432495117, "global_step": 287584, "epoch": 2376} {"train_loss": -40.631160736083984, "global_step": 287585, "epoch": 2376} {"train_loss": -41.193965911865234, "global_step": 287586, "epoch": 2376} {"train_loss": -40.48681640625, "global_step": 287587, "epoch": 2376} {"train_loss": -41.90914535522461, "global_step": 287588, "epoch": 2376} {"train_loss": -40.34123611450195, "global_step": 287589, "epoch": 2376} {"train_loss": -41.25927734375, "global_step": 287590, "epoch": 2376} {"train_loss": -42.171546936035156, "global_step": 287591, "epoch": 2376} {"train_loss": -41.220916748046875, "global_step": 287592, "epoch": 2376} {"train_loss": -41.68667221069336, "global_step": 287593, "epoch": 2376} {"train_loss": -41.880367279052734, "global_step": 287594, "epoch": 2376} {"train_loss": -42.461875915527344, "global_step": 287595, "epoch": 2376} {"train_loss": -42.07772445678711, "global_step": 287596, "epoch": 2376} {"train_loss": -42.11652755737305, "global_step": 287597, "epoch": 2376} {"train_loss": -41.97377395629883, "global_step": 287598, "epoch": 2376} {"train_loss": -42.48582458496094, "global_step": 287599, "epoch": 2376} {"train_loss": -41.24728012084961, "global_step": 287600, "epoch": 2376} {"train_loss": -41.72861862182617, "global_step": 287601, "epoch": 2376} {"train_loss": -42.64408874511719, "global_step": 287602, "epoch": 2376} {"train_loss": -42.26414108276367, "global_step": 287603, "epoch": 2376} {"train_loss": -42.12404251098633, "global_step": 287604, "epoch": 2376} {"train_loss": -42.03361511230469, "global_step": 287605, "epoch": 2376} {"train_loss": -43.04827117919922, "global_step": 287606, "epoch": 2376} {"train_loss": -41.86103057861328, "global_step": 287607, "epoch": 2376} {"train_loss": -42.201759338378906, "global_step": 287608, "epoch": 2376} {"train_loss": -41.9654541015625, "global_step": 287609, "epoch": 2376} {"train_loss": -42.59125900268555, "global_step": 287610, "epoch": 2376} {"train_loss": -41.580039978027344, "global_step": 287611, "epoch": 2376} {"train_loss": -41.776729583740234, "global_step": 287612, "epoch": 2376} {"train_loss": -42.100830078125, "global_step": 287613, "epoch": 2376} {"train_loss": -42.39107894897461, "global_step": 287614, "epoch": 2376} {"train_loss": -42.67030715942383, "global_step": 287615, "epoch": 2376} {"train_loss": -40.69613206091006, "global_step": 287616, "epoch": 2376, "val_loss": 2445400.75} {"train_loss": -42.60721969604492, "global_step": 287617, "epoch": 2377} {"train_loss": -42.49514389038086, "global_step": 287618, "epoch": 2377} {"train_loss": -42.66518783569336, "global_step": 287619, "epoch": 2377} {"train_loss": -42.79775619506836, "global_step": 287620, "epoch": 2377} {"train_loss": -42.88344955444336, "global_step": 287621, "epoch": 2377} {"train_loss": -43.53684616088867, "global_step": 287622, "epoch": 2377} {"train_loss": -42.22037887573242, "global_step": 287623, "epoch": 2377} {"train_loss": -42.410789489746094, "global_step": 287624, "epoch": 2377} {"train_loss": -42.70192337036133, "global_step": 287625, "epoch": 2377} {"train_loss": -41.97456741333008, "global_step": 287626, "epoch": 2377} {"train_loss": -41.610748291015625, "global_step": 287627, "epoch": 2377} {"train_loss": -43.20634841918945, "global_step": 287628, "epoch": 2377} {"train_loss": -42.537776947021484, "global_step": 287629, "epoch": 2377} {"train_loss": -40.62777328491211, "global_step": 287630, "epoch": 2377} {"train_loss": -43.418426513671875, "global_step": 287631, "epoch": 2377} {"train_loss": -42.67354965209961, "global_step": 287632, "epoch": 2377} {"train_loss": -42.640316009521484, "global_step": 287633, "epoch": 2377} {"train_loss": -42.9774055480957, "global_step": 287634, "epoch": 2377} {"train_loss": -42.52888107299805, "global_step": 287635, "epoch": 2377} {"train_loss": -42.89710998535156, "global_step": 287636, "epoch": 2377} {"train_loss": -43.34279251098633, "global_step": 287637, "epoch": 2377} {"train_loss": -42.97383499145508, "global_step": 287638, "epoch": 2377} {"train_loss": -43.3400993347168, "global_step": 287639, "epoch": 2377} {"train_loss": -42.14876937866211, "global_step": 287640, "epoch": 2377} {"train_loss": -43.043209075927734, "global_step": 287641, "epoch": 2377} {"train_loss": -43.18124008178711, "global_step": 287642, "epoch": 2377} {"train_loss": -42.59905242919922, "global_step": 287643, "epoch": 2377} {"train_loss": -43.122108459472656, "global_step": 287644, "epoch": 2377} {"train_loss": -42.86660385131836, "global_step": 287645, "epoch": 2377} {"train_loss": -43.29783630371094, "global_step": 287646, "epoch": 2377} {"train_loss": -43.621944427490234, "global_step": 287647, "epoch": 2377} {"train_loss": -43.4650993347168, "global_step": 287648, "epoch": 2377} {"train_loss": -42.5503044128418, "global_step": 287649, "epoch": 2377} {"train_loss": -43.742347717285156, "global_step": 287650, "epoch": 2377} {"train_loss": -43.06472396850586, "global_step": 287651, "epoch": 2377} {"train_loss": -43.80678939819336, "global_step": 287652, "epoch": 2377} {"train_loss": -43.17096710205078, "global_step": 287653, "epoch": 2377} {"train_loss": -42.873046875, "global_step": 287654, "epoch": 2377} {"train_loss": -43.04852294921875, "global_step": 287655, "epoch": 2377} {"train_loss": -43.553466796875, "global_step": 287656, "epoch": 2377} {"train_loss": -41.91237258911133, "global_step": 287657, "epoch": 2377} {"train_loss": -42.43046188354492, "global_step": 287658, "epoch": 2377} {"train_loss": -42.189857482910156, "global_step": 287659, "epoch": 2377} {"train_loss": -43.86058044433594, "global_step": 287660, "epoch": 2377} {"train_loss": -42.12639617919922, "global_step": 287661, "epoch": 2377} {"train_loss": -43.480323791503906, "global_step": 287662, "epoch": 2377} {"train_loss": -43.050968170166016, "global_step": 287663, "epoch": 2377} {"train_loss": -42.93882369995117, "global_step": 287664, "epoch": 2377} {"train_loss": -42.405548095703125, "global_step": 287665, "epoch": 2377} {"train_loss": -44.04473114013672, "global_step": 287666, "epoch": 2377} {"train_loss": -43.11100769042969, "global_step": 287667, "epoch": 2377} {"train_loss": -43.3350715637207, "global_step": 287668, "epoch": 2377} {"train_loss": -42.9161491394043, "global_step": 287669, "epoch": 2377} {"train_loss": -43.12751388549805, "global_step": 287670, "epoch": 2377} {"train_loss": -41.55636215209961, "global_step": 287671, "epoch": 2377} {"train_loss": -42.99577713012695, "global_step": 287672, "epoch": 2377} {"train_loss": -43.357460021972656, "global_step": 287673, "epoch": 2377} {"train_loss": -43.420501708984375, "global_step": 287674, "epoch": 2377} {"train_loss": -42.22053146362305, "global_step": 287675, "epoch": 2377} {"train_loss": -42.22026062011719, "global_step": 287676, "epoch": 2377} {"train_loss": -42.89683151245117, "global_step": 287677, "epoch": 2377} {"train_loss": -42.17221450805664, "global_step": 287678, "epoch": 2377} {"train_loss": -42.74258041381836, "global_step": 287679, "epoch": 2377} {"train_loss": -38.100555419921875, "global_step": 287680, "epoch": 2377} {"train_loss": -41.52412796020508, "global_step": 287681, "epoch": 2377} {"train_loss": -42.887630462646484, "global_step": 287682, "epoch": 2377} {"train_loss": -42.080867767333984, "global_step": 287683, "epoch": 2377} {"train_loss": -42.11768341064453, "global_step": 287684, "epoch": 2377} {"train_loss": -43.1961784362793, "global_step": 287685, "epoch": 2377} {"train_loss": -42.863460540771484, "global_step": 287686, "epoch": 2377} {"train_loss": -43.0236701965332, "global_step": 287687, "epoch": 2377} {"train_loss": -43.182064056396484, "global_step": 287688, "epoch": 2377} {"train_loss": -43.18421936035156, "global_step": 287689, "epoch": 2377} {"train_loss": -42.190547943115234, "global_step": 287690, "epoch": 2377} {"train_loss": -42.41209030151367, "global_step": 287691, "epoch": 2377} {"train_loss": -43.30998611450195, "global_step": 287692, "epoch": 2377} {"train_loss": -42.80232620239258, "global_step": 287693, "epoch": 2377} {"train_loss": -43.04138946533203, "global_step": 287694, "epoch": 2377} {"train_loss": -43.07597351074219, "global_step": 287695, "epoch": 2377} {"train_loss": -43.045833587646484, "global_step": 287696, "epoch": 2377} {"train_loss": -43.122493743896484, "global_step": 287697, "epoch": 2377} {"train_loss": -42.50474166870117, "global_step": 287698, "epoch": 2377} {"train_loss": -43.342987060546875, "global_step": 287699, "epoch": 2377} {"train_loss": -42.96773910522461, "global_step": 287700, "epoch": 2377} {"train_loss": -42.58393096923828, "global_step": 287701, "epoch": 2377} {"train_loss": -42.83187484741211, "global_step": 287702, "epoch": 2377} {"train_loss": -42.97163772583008, "global_step": 287703, "epoch": 2377} {"train_loss": -41.4177360534668, "global_step": 287704, "epoch": 2377} {"train_loss": -41.057010650634766, "global_step": 287705, "epoch": 2377} {"train_loss": -42.353111267089844, "global_step": 287706, "epoch": 2377} {"train_loss": -39.37386703491211, "global_step": 287707, "epoch": 2377} {"train_loss": -37.328041076660156, "global_step": 287708, "epoch": 2377} {"train_loss": -35.30356979370117, "global_step": 287709, "epoch": 2377} {"train_loss": -39.8910026550293, "global_step": 287710, "epoch": 2377} {"train_loss": -41.90910720825195, "global_step": 287711, "epoch": 2377} {"train_loss": -37.71852111816406, "global_step": 287712, "epoch": 2377} {"train_loss": -36.955780029296875, "global_step": 287713, "epoch": 2377} {"train_loss": -40.20646667480469, "global_step": 287714, "epoch": 2377} {"train_loss": -36.61574935913086, "global_step": 287715, "epoch": 2377} {"train_loss": -39.64939498901367, "global_step": 287716, "epoch": 2377} {"train_loss": -41.515724182128906, "global_step": 287717, "epoch": 2377} {"train_loss": -38.5121955871582, "global_step": 287718, "epoch": 2377} {"train_loss": -41.66948318481445, "global_step": 287719, "epoch": 2377} {"train_loss": -38.46682357788086, "global_step": 287720, "epoch": 2377} {"train_loss": -40.268924713134766, "global_step": 287721, "epoch": 2377} {"train_loss": -41.88176727294922, "global_step": 287722, "epoch": 2377} {"train_loss": -41.23025131225586, "global_step": 287723, "epoch": 2377} {"train_loss": -41.169334411621094, "global_step": 287724, "epoch": 2377} {"train_loss": -41.74116516113281, "global_step": 287725, "epoch": 2377} {"train_loss": -40.856990814208984, "global_step": 287726, "epoch": 2377} {"train_loss": -41.09628677368164, "global_step": 287727, "epoch": 2377} {"train_loss": -42.425941467285156, "global_step": 287728, "epoch": 2377} {"train_loss": -40.952857971191406, "global_step": 287729, "epoch": 2377} {"train_loss": -41.715633392333984, "global_step": 287730, "epoch": 2377} {"train_loss": -40.12530517578125, "global_step": 287731, "epoch": 2377} {"train_loss": -35.78228759765625, "global_step": 287732, "epoch": 2377} {"train_loss": -41.17204284667969, "global_step": 287733, "epoch": 2377} {"train_loss": -41.00692367553711, "global_step": 287734, "epoch": 2377} {"train_loss": -41.13778305053711, "global_step": 287735, "epoch": 2377} {"train_loss": -42.5046501159668, "global_step": 287736, "epoch": 2377} {"train_loss": -42.05103305154596, "global_step": 287737, "epoch": 2377, "val_loss": 2927816.75} {"train_loss": -41.763545989990234, "global_step": 287738, "epoch": 2378} {"train_loss": -42.77627182006836, "global_step": 287739, "epoch": 2378} {"train_loss": -42.72672653198242, "global_step": 287740, "epoch": 2378} {"train_loss": -42.44743728637695, "global_step": 287741, "epoch": 2378} {"train_loss": -41.64405059814453, "global_step": 287742, "epoch": 2378} {"train_loss": -42.458106994628906, "global_step": 287743, "epoch": 2378} {"train_loss": -41.99775314331055, "global_step": 287744, "epoch": 2378} {"train_loss": -41.592041015625, "global_step": 287745, "epoch": 2378} {"train_loss": -42.28056716918945, "global_step": 287746, "epoch": 2378} {"train_loss": -43.03343963623047, "global_step": 287747, "epoch": 2378} {"train_loss": -42.293636322021484, "global_step": 287748, "epoch": 2378} {"train_loss": -42.376216888427734, "global_step": 287749, "epoch": 2378} {"train_loss": -42.88523483276367, "global_step": 287750, "epoch": 2378} {"train_loss": -42.33658981323242, "global_step": 287751, "epoch": 2378} {"train_loss": -40.95774459838867, "global_step": 287752, "epoch": 2378} {"train_loss": -42.47467803955078, "global_step": 287753, "epoch": 2378} {"train_loss": -42.11451721191406, "global_step": 287754, "epoch": 2378} {"train_loss": -42.54402542114258, "global_step": 287755, "epoch": 2378} {"train_loss": -42.37413787841797, "global_step": 287756, "epoch": 2378} {"train_loss": -42.34011459350586, "global_step": 287757, "epoch": 2378} {"train_loss": -42.366981506347656, "global_step": 287758, "epoch": 2378} {"train_loss": -42.8818244934082, "global_step": 287759, "epoch": 2378} {"train_loss": -42.09646987915039, "global_step": 287760, "epoch": 2378} {"train_loss": -42.585350036621094, "global_step": 287761, "epoch": 2378} {"train_loss": -42.65910720825195, "global_step": 287762, "epoch": 2378} {"train_loss": -41.560546875, "global_step": 287763, "epoch": 2378} {"train_loss": -42.719783782958984, "global_step": 287764, "epoch": 2378} {"train_loss": -41.648353576660156, "global_step": 287765, "epoch": 2378} {"train_loss": -41.677879333496094, "global_step": 287766, "epoch": 2378} {"train_loss": -42.02857208251953, "global_step": 287767, "epoch": 2378} {"train_loss": -42.71018600463867, "global_step": 287768, "epoch": 2378} {"train_loss": -42.640132904052734, "global_step": 287769, "epoch": 2378} {"train_loss": -42.20478439331055, "global_step": 287770, "epoch": 2378} {"train_loss": -42.75095748901367, "global_step": 287771, "epoch": 2378} {"train_loss": -42.91317367553711, "global_step": 287772, "epoch": 2378} {"train_loss": -42.88174057006836, "global_step": 287773, "epoch": 2378} {"train_loss": -43.570003509521484, "global_step": 287774, "epoch": 2378} {"train_loss": -43.366390228271484, "global_step": 287775, "epoch": 2378} {"train_loss": -43.72136306762695, "global_step": 287776, "epoch": 2378} {"train_loss": -42.85670852661133, "global_step": 287777, "epoch": 2378} {"train_loss": -41.64223861694336, "global_step": 287778, "epoch": 2378} {"train_loss": -43.10493469238281, "global_step": 287779, "epoch": 2378} {"train_loss": -42.63776397705078, "global_step": 287780, "epoch": 2378} {"train_loss": -43.00806427001953, "global_step": 287781, "epoch": 2378} {"train_loss": -43.698734283447266, "global_step": 287782, "epoch": 2378} {"train_loss": -43.30488967895508, "global_step": 287783, "epoch": 2378} {"train_loss": -42.89345169067383, "global_step": 287784, "epoch": 2378} {"train_loss": -43.53987503051758, "global_step": 287785, "epoch": 2378} {"train_loss": -43.472816467285156, "global_step": 287786, "epoch": 2378} {"train_loss": -43.21694564819336, "global_step": 287787, "epoch": 2378} {"train_loss": -43.22285842895508, "global_step": 287788, "epoch": 2378} {"train_loss": -42.07075119018555, "global_step": 287789, "epoch": 2378} {"train_loss": -43.281307220458984, "global_step": 287790, "epoch": 2378} {"train_loss": -43.659061431884766, "global_step": 287791, "epoch": 2378} {"train_loss": -43.51884841918945, "global_step": 287792, "epoch": 2378} {"train_loss": -43.5149040222168, "global_step": 287793, "epoch": 2378} {"train_loss": -43.558406829833984, "global_step": 287794, "epoch": 2378} {"train_loss": -43.100440979003906, "global_step": 287795, "epoch": 2378} {"train_loss": -44.1627082824707, "global_step": 287796, "epoch": 2378} {"train_loss": -43.361629486083984, "global_step": 287797, "epoch": 2378} {"train_loss": -43.11602020263672, "global_step": 287798, "epoch": 2378} {"train_loss": -43.640804290771484, "global_step": 287799, "epoch": 2378} {"train_loss": -43.74894332885742, "global_step": 287800, "epoch": 2378} {"train_loss": -43.77809524536133, "global_step": 287801, "epoch": 2378} {"train_loss": -43.84930419921875, "global_step": 287802, "epoch": 2378} {"train_loss": -42.65790939331055, "global_step": 287803, "epoch": 2378} {"train_loss": -42.572296142578125, "global_step": 287804, "epoch": 2378} {"train_loss": -43.99135971069336, "global_step": 287805, "epoch": 2378} {"train_loss": -43.29011535644531, "global_step": 287806, "epoch": 2378} {"train_loss": -43.243568420410156, "global_step": 287807, "epoch": 2378} {"train_loss": -43.54829788208008, "global_step": 287808, "epoch": 2378} {"train_loss": -42.605979919433594, "global_step": 287809, "epoch": 2378} {"train_loss": -42.626216888427734, "global_step": 287810, "epoch": 2378} {"train_loss": -43.55570602416992, "global_step": 287811, "epoch": 2378} {"train_loss": -43.28426742553711, "global_step": 287812, "epoch": 2378} {"train_loss": -41.728492736816406, "global_step": 287813, "epoch": 2378} {"train_loss": -39.843971252441406, "global_step": 287814, "epoch": 2378} {"train_loss": -40.54160690307617, "global_step": 287815, "epoch": 2378} {"train_loss": -42.46390914916992, "global_step": 287816, "epoch": 2378} {"train_loss": -43.50911331176758, "global_step": 287817, "epoch": 2378} {"train_loss": -44.109798431396484, "global_step": 287818, "epoch": 2378} {"train_loss": -42.964595794677734, "global_step": 287819, "epoch": 2378} {"train_loss": -43.094696044921875, "global_step": 287820, "epoch": 2378} {"train_loss": -41.411354064941406, "global_step": 287821, "epoch": 2378} {"train_loss": -43.1175422668457, "global_step": 287822, "epoch": 2378} {"train_loss": -42.505245208740234, "global_step": 287823, "epoch": 2378} {"train_loss": -42.26616287231445, "global_step": 287824, "epoch": 2378} {"train_loss": -42.41663360595703, "global_step": 287825, "epoch": 2378} {"train_loss": -42.64677810668945, "global_step": 287826, "epoch": 2378} {"train_loss": -42.46732711791992, "global_step": 287827, "epoch": 2378} {"train_loss": -42.0227165222168, "global_step": 287828, "epoch": 2378} {"train_loss": -42.76070785522461, "global_step": 287829, "epoch": 2378} {"train_loss": -41.716060638427734, "global_step": 287830, "epoch": 2378} {"train_loss": -40.425106048583984, "global_step": 287831, "epoch": 2378} {"train_loss": -41.40082931518555, "global_step": 287832, "epoch": 2378} {"train_loss": -42.19757843017578, "global_step": 287833, "epoch": 2378} {"train_loss": -43.51237869262695, "global_step": 287834, "epoch": 2378} {"train_loss": -43.102508544921875, "global_step": 287835, "epoch": 2378} {"train_loss": -42.62333297729492, "global_step": 287836, "epoch": 2378} {"train_loss": -40.35512161254883, "global_step": 287837, "epoch": 2378} {"train_loss": -39.26724624633789, "global_step": 287838, "epoch": 2378} {"train_loss": -36.746620178222656, "global_step": 287839, "epoch": 2378} {"train_loss": -38.58015060424805, "global_step": 287840, "epoch": 2378} {"train_loss": -40.359397888183594, "global_step": 287841, "epoch": 2378} {"train_loss": -42.94059371948242, "global_step": 287842, "epoch": 2378} {"train_loss": -40.217620849609375, "global_step": 287843, "epoch": 2378} {"train_loss": -36.90433883666992, "global_step": 287844, "epoch": 2378} {"train_loss": -37.00228500366211, "global_step": 287845, "epoch": 2378} {"train_loss": -41.58815383911133, "global_step": 287846, "epoch": 2378} {"train_loss": -41.22426986694336, "global_step": 287847, "epoch": 2378} {"train_loss": -38.58666229248047, "global_step": 287848, "epoch": 2378} {"train_loss": -41.07090377807617, "global_step": 287849, "epoch": 2378} {"train_loss": -42.286251068115234, "global_step": 287850, "epoch": 2378} {"train_loss": -41.01092529296875, "global_step": 287851, "epoch": 2378} {"train_loss": -42.128597259521484, "global_step": 287852, "epoch": 2378} {"train_loss": -41.42762756347656, "global_step": 287853, "epoch": 2378} {"train_loss": -41.213253021240234, "global_step": 287854, "epoch": 2378} {"train_loss": -41.830238342285156, "global_step": 287855, "epoch": 2378} {"train_loss": -41.927276611328125, "global_step": 287856, "epoch": 2378} {"train_loss": -42.344173431396484, "global_step": 287857, "epoch": 2378} {"train_loss": -42.27969912063977, "global_step": 287858, "epoch": 2378, "val_loss": 2556948.25} {"train_loss": -39.491943359375, "global_step": 287859, "epoch": 2379} {"train_loss": -39.84613037109375, "global_step": 287860, "epoch": 2379} {"train_loss": -39.838497161865234, "global_step": 287861, "epoch": 2379} {"train_loss": -42.69224166870117, "global_step": 287862, "epoch": 2379} {"train_loss": -41.055946350097656, "global_step": 287863, "epoch": 2379} {"train_loss": -41.78889465332031, "global_step": 287864, "epoch": 2379} {"train_loss": -36.587074279785156, "global_step": 287865, "epoch": 2379} {"train_loss": -41.22260665893555, "global_step": 287866, "epoch": 2379} {"train_loss": -40.60378646850586, "global_step": 287867, "epoch": 2379} {"train_loss": -41.58268356323242, "global_step": 287868, "epoch": 2379} {"train_loss": -41.883323669433594, "global_step": 287869, "epoch": 2379} {"train_loss": -41.76414489746094, "global_step": 287870, "epoch": 2379} {"train_loss": -41.40393829345703, "global_step": 287871, "epoch": 2379} {"train_loss": -40.94651412963867, "global_step": 287872, "epoch": 2379} {"train_loss": -40.947784423828125, "global_step": 287873, "epoch": 2379} {"train_loss": -42.61249923706055, "global_step": 287874, "epoch": 2379} {"train_loss": -40.31260299682617, "global_step": 287875, "epoch": 2379} {"train_loss": -42.29702377319336, "global_step": 287876, "epoch": 2379} {"train_loss": -42.11748123168945, "global_step": 287877, "epoch": 2379} {"train_loss": -42.746986389160156, "global_step": 287878, "epoch": 2379} {"train_loss": -41.639686584472656, "global_step": 287879, "epoch": 2379} {"train_loss": -41.3412971496582, "global_step": 287880, "epoch": 2379} {"train_loss": -42.40420150756836, "global_step": 287881, "epoch": 2379} {"train_loss": -42.76164627075195, "global_step": 287882, "epoch": 2379} {"train_loss": -42.67396926879883, "global_step": 287883, "epoch": 2379} {"train_loss": -42.240604400634766, "global_step": 287884, "epoch": 2379} {"train_loss": -42.395774841308594, "global_step": 287885, "epoch": 2379} {"train_loss": -40.94009780883789, "global_step": 287886, "epoch": 2379} {"train_loss": -41.9218635559082, "global_step": 287887, "epoch": 2379} {"train_loss": -42.43265914916992, "global_step": 287888, "epoch": 2379} {"train_loss": -42.389949798583984, "global_step": 287889, "epoch": 2379} {"train_loss": -41.13896560668945, "global_step": 287890, "epoch": 2379} {"train_loss": -42.84610366821289, "global_step": 287891, "epoch": 2379} {"train_loss": -42.11355972290039, "global_step": 287892, "epoch": 2379} {"train_loss": -41.65788650512695, "global_step": 287893, "epoch": 2379} {"train_loss": -42.36058044433594, "global_step": 287894, "epoch": 2379} {"train_loss": -41.4487419128418, "global_step": 287895, "epoch": 2379} {"train_loss": -42.41090393066406, "global_step": 287896, "epoch": 2379} {"train_loss": -41.18852615356445, "global_step": 287897, "epoch": 2379} {"train_loss": -41.96466064453125, "global_step": 287898, "epoch": 2379} {"train_loss": -42.64557647705078, "global_step": 287899, "epoch": 2379} {"train_loss": -38.14974594116211, "global_step": 287900, "epoch": 2379} {"train_loss": -42.213253021240234, "global_step": 287901, "epoch": 2379} {"train_loss": -42.73545455932617, "global_step": 287902, "epoch": 2379} {"train_loss": -41.03031539916992, "global_step": 287903, "epoch": 2379} {"train_loss": -42.78200912475586, "global_step": 287904, "epoch": 2379} {"train_loss": -42.293418884277344, "global_step": 287905, "epoch": 2379} {"train_loss": -42.28156661987305, "global_step": 287906, "epoch": 2379} {"train_loss": -42.83516311645508, "global_step": 287907, "epoch": 2379} {"train_loss": -42.94647216796875, "global_step": 287908, "epoch": 2379} {"train_loss": -42.89595413208008, "global_step": 287909, "epoch": 2379} {"train_loss": -43.1246452331543, "global_step": 287910, "epoch": 2379} {"train_loss": -40.496185302734375, "global_step": 287911, "epoch": 2379} {"train_loss": -42.52766036987305, "global_step": 287912, "epoch": 2379} {"train_loss": -40.7134895324707, "global_step": 287913, "epoch": 2379} {"train_loss": -42.04433059692383, "global_step": 287914, "epoch": 2379} {"train_loss": -43.277252197265625, "global_step": 287915, "epoch": 2379} {"train_loss": -42.61521530151367, "global_step": 287916, "epoch": 2379} {"train_loss": -42.958099365234375, "global_step": 287917, "epoch": 2379} {"train_loss": -42.20998764038086, "global_step": 287918, "epoch": 2379} {"train_loss": -42.763404846191406, "global_step": 287919, "epoch": 2379} {"train_loss": -40.2760124206543, "global_step": 287920, "epoch": 2379} {"train_loss": -42.817867279052734, "global_step": 287921, "epoch": 2379} {"train_loss": -42.46892166137695, "global_step": 287922, "epoch": 2379} {"train_loss": -41.20124053955078, "global_step": 287923, "epoch": 2379} {"train_loss": -42.5822639465332, "global_step": 287924, "epoch": 2379} {"train_loss": -42.39453125, "global_step": 287925, "epoch": 2379} {"train_loss": -42.885475158691406, "global_step": 287926, "epoch": 2379} {"train_loss": -38.537353515625, "global_step": 287927, "epoch": 2379} {"train_loss": -42.190284729003906, "global_step": 287928, "epoch": 2379} {"train_loss": -42.232460021972656, "global_step": 287929, "epoch": 2379} {"train_loss": -42.278839111328125, "global_step": 287930, "epoch": 2379} {"train_loss": -40.99824142456055, "global_step": 287931, "epoch": 2379} {"train_loss": -40.599056243896484, "global_step": 287932, "epoch": 2379} {"train_loss": -42.778255462646484, "global_step": 287933, "epoch": 2379} {"train_loss": -42.91351318359375, "global_step": 287934, "epoch": 2379} {"train_loss": -41.43354034423828, "global_step": 287935, "epoch": 2379} {"train_loss": -42.181556701660156, "global_step": 287936, "epoch": 2379} {"train_loss": -40.374202728271484, "global_step": 287937, "epoch": 2379} {"train_loss": -41.78424835205078, "global_step": 287938, "epoch": 2379} {"train_loss": -41.7412109375, "global_step": 287939, "epoch": 2379} {"train_loss": -41.52427291870117, "global_step": 287940, "epoch": 2379} {"train_loss": -39.27666091918945, "global_step": 287941, "epoch": 2379} {"train_loss": -39.3857421875, "global_step": 287942, "epoch": 2379} {"train_loss": -41.29109573364258, "global_step": 287943, "epoch": 2379} {"train_loss": -40.4246826171875, "global_step": 287944, "epoch": 2379} {"train_loss": -39.68031692504883, "global_step": 287945, "epoch": 2379} {"train_loss": -40.838844299316406, "global_step": 287946, "epoch": 2379} {"train_loss": -39.642578125, "global_step": 287947, "epoch": 2379} {"train_loss": -41.51011276245117, "global_step": 287948, "epoch": 2379} {"train_loss": -38.21043014526367, "global_step": 287949, "epoch": 2379} {"train_loss": -40.68196105957031, "global_step": 287950, "epoch": 2379} {"train_loss": -39.9140510559082, "global_step": 287951, "epoch": 2379} {"train_loss": -41.086910247802734, "global_step": 287952, "epoch": 2379} {"train_loss": -38.701507568359375, "global_step": 287953, "epoch": 2379} {"train_loss": -41.82723617553711, "global_step": 287954, "epoch": 2379} {"train_loss": -39.21950149536133, "global_step": 287955, "epoch": 2379} {"train_loss": -40.36075973510742, "global_step": 287956, "epoch": 2379} {"train_loss": -39.46039581298828, "global_step": 287957, "epoch": 2379} {"train_loss": -38.43595886230469, "global_step": 287958, "epoch": 2379} {"train_loss": -29.16144371032715, "global_step": 287959, "epoch": 2379} {"train_loss": -35.97397232055664, "global_step": 287960, "epoch": 2379} {"train_loss": -35.88429641723633, "global_step": 287961, "epoch": 2379} {"train_loss": -38.52040481567383, "global_step": 287962, "epoch": 2379} {"train_loss": -39.185752868652344, "global_step": 287963, "epoch": 2379} {"train_loss": -40.62197494506836, "global_step": 287964, "epoch": 2379} {"train_loss": -36.56737518310547, "global_step": 287965, "epoch": 2379} {"train_loss": -40.2053337097168, "global_step": 287966, "epoch": 2379} {"train_loss": -39.621002197265625, "global_step": 287967, "epoch": 2379} {"train_loss": -36.616512298583984, "global_step": 287968, "epoch": 2379} {"train_loss": -36.75197219848633, "global_step": 287969, "epoch": 2379} {"train_loss": -40.788978576660156, "global_step": 287970, "epoch": 2379} {"train_loss": -37.414791107177734, "global_step": 287971, "epoch": 2379} {"train_loss": -37.707069396972656, "global_step": 287972, "epoch": 2379} {"train_loss": -38.13374328613281, "global_step": 287973, "epoch": 2379} {"train_loss": -38.34119415283203, "global_step": 287974, "epoch": 2379} {"train_loss": -40.09100341796875, "global_step": 287975, "epoch": 2379} {"train_loss": -38.24093246459961, "global_step": 287976, "epoch": 2379} {"train_loss": -40.685306549072266, "global_step": 287977, "epoch": 2379} {"train_loss": -40.7119140625, "global_step": 287978, "epoch": 2379} {"train_loss": -40.861958038708394, "global_step": 287979, "epoch": 2379, "val_loss": 2538198.25} {"train_loss": -40.80918502807617, "global_step": 287980, "epoch": 2380} {"train_loss": -39.28179168701172, "global_step": 287981, "epoch": 2380} {"train_loss": -39.779842376708984, "global_step": 287982, "epoch": 2380} {"train_loss": -40.302459716796875, "global_step": 287983, "epoch": 2380} {"train_loss": -39.980926513671875, "global_step": 287984, "epoch": 2380} {"train_loss": -40.501644134521484, "global_step": 287985, "epoch": 2380} {"train_loss": -39.01496124267578, "global_step": 287986, "epoch": 2380} {"train_loss": -39.505699157714844, "global_step": 287987, "epoch": 2380} {"train_loss": -41.131752014160156, "global_step": 287988, "epoch": 2380} {"train_loss": -40.383670806884766, "global_step": 287989, "epoch": 2380} {"train_loss": -40.76541519165039, "global_step": 287990, "epoch": 2380} {"train_loss": -41.144561767578125, "global_step": 287991, "epoch": 2380} {"train_loss": -41.25461959838867, "global_step": 287992, "epoch": 2380} {"train_loss": -42.297706604003906, "global_step": 287993, "epoch": 2380} {"train_loss": -41.045738220214844, "global_step": 287994, "epoch": 2380} {"train_loss": -41.9028434753418, "global_step": 287995, "epoch": 2380} {"train_loss": -41.28355026245117, "global_step": 287996, "epoch": 2380} {"train_loss": -39.9951286315918, "global_step": 287997, "epoch": 2380} {"train_loss": -41.67884826660156, "global_step": 287998, "epoch": 2380} {"train_loss": -40.66650390625, "global_step": 287999, "epoch": 2380} {"train_loss": -40.7775993347168, "global_step": 288000, "epoch": 2380} {"train_loss": -41.62603759765625, "global_step": 288001, "epoch": 2380} {"train_loss": -41.39499282836914, "global_step": 288002, "epoch": 2380} {"train_loss": -42.144081115722656, "global_step": 288003, "epoch": 2380} {"train_loss": -42.1139030456543, "global_step": 288004, "epoch": 2380} {"train_loss": -41.70150375366211, "global_step": 288005, "epoch": 2380} {"train_loss": -41.881282806396484, "global_step": 288006, "epoch": 2380} {"train_loss": -41.527462005615234, "global_step": 288007, "epoch": 2380} {"train_loss": -40.19181823730469, "global_step": 288008, "epoch": 2380} {"train_loss": -41.9901008605957, "global_step": 288009, "epoch": 2380} {"train_loss": -42.34148406982422, "global_step": 288010, "epoch": 2380} {"train_loss": -42.036739349365234, "global_step": 288011, "epoch": 2380} {"train_loss": -41.745697021484375, "global_step": 288012, "epoch": 2380} {"train_loss": -41.940059661865234, "global_step": 288013, "epoch": 2380} {"train_loss": -41.6220817565918, "global_step": 288014, "epoch": 2380} {"train_loss": -40.53744125366211, "global_step": 288015, "epoch": 2380} {"train_loss": -42.12714767456055, "global_step": 288016, "epoch": 2380} {"train_loss": -41.84046173095703, "global_step": 288017, "epoch": 2380} {"train_loss": -41.963863372802734, "global_step": 288018, "epoch": 2380} {"train_loss": -41.078956604003906, "global_step": 288019, "epoch": 2380} {"train_loss": -41.658260345458984, "global_step": 288020, "epoch": 2380} {"train_loss": -42.1204948425293, "global_step": 288021, "epoch": 2380} {"train_loss": -41.756072998046875, "global_step": 288022, "epoch": 2380} {"train_loss": -41.06648635864258, "global_step": 288023, "epoch": 2380} {"train_loss": -41.66533660888672, "global_step": 288024, "epoch": 2380} {"train_loss": -42.121864318847656, "global_step": 288025, "epoch": 2380} {"train_loss": -42.47270965576172, "global_step": 288026, "epoch": 2380} {"train_loss": -42.22046661376953, "global_step": 288027, "epoch": 2380} {"train_loss": -42.63670349121094, "global_step": 288028, "epoch": 2380} {"train_loss": -40.537837982177734, "global_step": 288029, "epoch": 2380} {"train_loss": -42.16482162475586, "global_step": 288030, "epoch": 2380} {"train_loss": -41.89382553100586, "global_step": 288031, "epoch": 2380} {"train_loss": -37.817291259765625, "global_step": 288032, "epoch": 2380} {"train_loss": -41.29293441772461, "global_step": 288033, "epoch": 2380} {"train_loss": -41.2471923828125, "global_step": 288034, "epoch": 2380} {"train_loss": -41.8439826965332, "global_step": 288035, "epoch": 2380} {"train_loss": -42.15370559692383, "global_step": 288036, "epoch": 2380} {"train_loss": -42.00251007080078, "global_step": 288037, "epoch": 2380} {"train_loss": -41.487613677978516, "global_step": 288038, "epoch": 2380} {"train_loss": -42.27216720581055, "global_step": 288039, "epoch": 2380} {"train_loss": -42.12722396850586, "global_step": 288040, "epoch": 2380} {"train_loss": -42.25655746459961, "global_step": 288041, "epoch": 2380} {"train_loss": -41.95784378051758, "global_step": 288042, "epoch": 2380} {"train_loss": -42.12879943847656, "global_step": 288043, "epoch": 2380} {"train_loss": -42.3011360168457, "global_step": 288044, "epoch": 2380} {"train_loss": -41.897560119628906, "global_step": 288045, "epoch": 2380} {"train_loss": -41.832489013671875, "global_step": 288046, "epoch": 2380} {"train_loss": -39.78974151611328, "global_step": 288047, "epoch": 2380} {"train_loss": -42.19247055053711, "global_step": 288048, "epoch": 2380} {"train_loss": -42.92596435546875, "global_step": 288049, "epoch": 2380} {"train_loss": -40.647090911865234, "global_step": 288050, "epoch": 2380} {"train_loss": -41.69993209838867, "global_step": 288051, "epoch": 2380} {"train_loss": -42.44947052001953, "global_step": 288052, "epoch": 2380} {"train_loss": -42.74772262573242, "global_step": 288053, "epoch": 2380} {"train_loss": -42.07603073120117, "global_step": 288054, "epoch": 2380} {"train_loss": -42.9291877746582, "global_step": 288055, "epoch": 2380} {"train_loss": -42.4490966796875, "global_step": 288056, "epoch": 2380} {"train_loss": -41.69934844970703, "global_step": 288057, "epoch": 2380} {"train_loss": -43.076210021972656, "global_step": 288058, "epoch": 2380} {"train_loss": -40.57974624633789, "global_step": 288059, "epoch": 2380} {"train_loss": -37.0627555847168, "global_step": 288060, "epoch": 2380} {"train_loss": -41.3436279296875, "global_step": 288061, "epoch": 2380} {"train_loss": -39.93720245361328, "global_step": 288062, "epoch": 2380} {"train_loss": -41.08689498901367, "global_step": 288063, "epoch": 2380} {"train_loss": -41.22540283203125, "global_step": 288064, "epoch": 2380} {"train_loss": -41.72615432739258, "global_step": 288065, "epoch": 2380} {"train_loss": -42.362030029296875, "global_step": 288066, "epoch": 2380} {"train_loss": -42.16873550415039, "global_step": 288067, "epoch": 2380} {"train_loss": -41.862525939941406, "global_step": 288068, "epoch": 2380} {"train_loss": -39.48264694213867, "global_step": 288069, "epoch": 2380} {"train_loss": -41.47119140625, "global_step": 288070, "epoch": 2380} {"train_loss": -42.22916793823242, "global_step": 288071, "epoch": 2380} {"train_loss": -40.67416000366211, "global_step": 288072, "epoch": 2380} {"train_loss": -41.77859115600586, "global_step": 288073, "epoch": 2380} {"train_loss": -42.09370422363281, "global_step": 288074, "epoch": 2380} {"train_loss": -42.768978118896484, "global_step": 288075, "epoch": 2380} {"train_loss": -41.143795013427734, "global_step": 288076, "epoch": 2380} {"train_loss": -41.89857482910156, "global_step": 288077, "epoch": 2380} {"train_loss": -41.11513137817383, "global_step": 288078, "epoch": 2380} {"train_loss": -42.07695388793945, "global_step": 288079, "epoch": 2380} {"train_loss": -42.201995849609375, "global_step": 288080, "epoch": 2380} {"train_loss": -42.584190368652344, "global_step": 288081, "epoch": 2380} {"train_loss": -41.4410400390625, "global_step": 288082, "epoch": 2380} {"train_loss": -41.315711975097656, "global_step": 288083, "epoch": 2380} {"train_loss": -40.168556213378906, "global_step": 288084, "epoch": 2380} {"train_loss": -42.454627990722656, "global_step": 288085, "epoch": 2380} {"train_loss": -42.83304214477539, "global_step": 288086, "epoch": 2380} {"train_loss": -42.06889724731445, "global_step": 288087, "epoch": 2380} {"train_loss": -40.924251556396484, "global_step": 288088, "epoch": 2380} {"train_loss": -42.09830856323242, "global_step": 288089, "epoch": 2380} {"train_loss": -41.7319450378418, "global_step": 288090, "epoch": 2380} {"train_loss": -40.96244812011719, "global_step": 288091, "epoch": 2380} {"train_loss": -41.12557601928711, "global_step": 288092, "epoch": 2380} {"train_loss": -41.66730880737305, "global_step": 288093, "epoch": 2380} {"train_loss": -41.96510696411133, "global_step": 288094, "epoch": 2380} {"train_loss": -41.48518371582031, "global_step": 288095, "epoch": 2380} {"train_loss": -41.07025146484375, "global_step": 288096, "epoch": 2380} {"train_loss": -41.14430618286133, "global_step": 288097, "epoch": 2380} {"train_loss": -36.209617614746094, "global_step": 288098, "epoch": 2380} {"train_loss": -42.3106803894043, "global_step": 288099, "epoch": 2380} {"train_loss": -41.42212421637921, "global_step": 288100, "epoch": 2380, "val_loss": 2426268.75} {"train_loss": -41.801353454589844, "global_step": 288101, "epoch": 2381} {"train_loss": -40.21826171875, "global_step": 288102, "epoch": 2381} {"train_loss": -40.94154739379883, "global_step": 288103, "epoch": 2381} {"train_loss": -40.75858688354492, "global_step": 288104, "epoch": 2381} {"train_loss": -42.33148956298828, "global_step": 288105, "epoch": 2381} {"train_loss": -41.99178695678711, "global_step": 288106, "epoch": 2381} {"train_loss": -40.37069320678711, "global_step": 288107, "epoch": 2381} {"train_loss": -41.90920639038086, "global_step": 288108, "epoch": 2381} {"train_loss": -41.97205352783203, "global_step": 288109, "epoch": 2381} {"train_loss": -39.337799072265625, "global_step": 288110, "epoch": 2381} {"train_loss": -41.99620056152344, "global_step": 288111, "epoch": 2381} {"train_loss": -40.53242874145508, "global_step": 288112, "epoch": 2381} {"train_loss": -41.6184196472168, "global_step": 288113, "epoch": 2381} {"train_loss": -41.76933670043945, "global_step": 288114, "epoch": 2381} {"train_loss": -41.95734786987305, "global_step": 288115, "epoch": 2381} {"train_loss": -39.6069221496582, "global_step": 288116, "epoch": 2381} {"train_loss": -42.08960723876953, "global_step": 288117, "epoch": 2381} {"train_loss": -40.48427963256836, "global_step": 288118, "epoch": 2381} {"train_loss": -39.899574279785156, "global_step": 288119, "epoch": 2381} {"train_loss": -39.32551956176758, "global_step": 288120, "epoch": 2381} {"train_loss": -41.50289535522461, "global_step": 288121, "epoch": 2381} {"train_loss": -39.29916000366211, "global_step": 288122, "epoch": 2381} {"train_loss": -41.83314895629883, "global_step": 288123, "epoch": 2381} {"train_loss": -39.38087844848633, "global_step": 288124, "epoch": 2381} {"train_loss": -40.97774124145508, "global_step": 288125, "epoch": 2381} {"train_loss": -40.76374435424805, "global_step": 288126, "epoch": 2381} {"train_loss": -41.544063568115234, "global_step": 288127, "epoch": 2381} {"train_loss": -39.97380065917969, "global_step": 288128, "epoch": 2381} {"train_loss": -41.88425827026367, "global_step": 288129, "epoch": 2381} {"train_loss": -41.075958251953125, "global_step": 288130, "epoch": 2381} {"train_loss": -42.525596618652344, "global_step": 288131, "epoch": 2381} {"train_loss": -41.1229248046875, "global_step": 288132, "epoch": 2381} {"train_loss": -41.7432861328125, "global_step": 288133, "epoch": 2381} {"train_loss": -40.27916717529297, "global_step": 288134, "epoch": 2381} {"train_loss": -42.525917053222656, "global_step": 288135, "epoch": 2381} {"train_loss": -40.96245193481445, "global_step": 288136, "epoch": 2381} {"train_loss": -40.22146224975586, "global_step": 288137, "epoch": 2381} {"train_loss": -42.67534255981445, "global_step": 288138, "epoch": 2381} {"train_loss": -41.535377502441406, "global_step": 288139, "epoch": 2381} {"train_loss": -41.074432373046875, "global_step": 288140, "epoch": 2381} {"train_loss": -41.863914489746094, "global_step": 288141, "epoch": 2381} {"train_loss": -41.6783561706543, "global_step": 288142, "epoch": 2381} {"train_loss": -41.32329559326172, "global_step": 288143, "epoch": 2381} {"train_loss": -37.82880783081055, "global_step": 288144, "epoch": 2381} {"train_loss": -41.49301528930664, "global_step": 288145, "epoch": 2381} {"train_loss": -41.505287170410156, "global_step": 288146, "epoch": 2381} {"train_loss": -41.08209991455078, "global_step": 288147, "epoch": 2381} {"train_loss": -38.96206283569336, "global_step": 288148, "epoch": 2381} {"train_loss": -41.67253875732422, "global_step": 288149, "epoch": 2381} {"train_loss": -40.14632797241211, "global_step": 288150, "epoch": 2381} {"train_loss": -41.97608947753906, "global_step": 288151, "epoch": 2381} {"train_loss": -41.701595306396484, "global_step": 288152, "epoch": 2381} {"train_loss": -41.371944427490234, "global_step": 288153, "epoch": 2381} {"train_loss": -41.93330001831055, "global_step": 288154, "epoch": 2381} {"train_loss": -41.9548225402832, "global_step": 288155, "epoch": 2381} {"train_loss": -41.99512481689453, "global_step": 288156, "epoch": 2381} {"train_loss": -41.773738861083984, "global_step": 288157, "epoch": 2381} {"train_loss": -41.10927200317383, "global_step": 288158, "epoch": 2381} {"train_loss": -42.19868087768555, "global_step": 288159, "epoch": 2381} {"train_loss": -41.73244857788086, "global_step": 288160, "epoch": 2381} {"train_loss": -42.215877532958984, "global_step": 288161, "epoch": 2381} {"train_loss": -40.944190979003906, "global_step": 288162, "epoch": 2381} {"train_loss": -41.73923873901367, "global_step": 288163, "epoch": 2381} {"train_loss": -42.066226959228516, "global_step": 288164, "epoch": 2381} {"train_loss": -42.61124801635742, "global_step": 288165, "epoch": 2381} {"train_loss": -40.58076095581055, "global_step": 288166, "epoch": 2381} {"train_loss": -42.413448333740234, "global_step": 288167, "epoch": 2381} {"train_loss": -42.61274337768555, "global_step": 288168, "epoch": 2381} {"train_loss": -41.959388732910156, "global_step": 288169, "epoch": 2381} {"train_loss": -42.3305549621582, "global_step": 288170, "epoch": 2381} {"train_loss": -42.223236083984375, "global_step": 288171, "epoch": 2381} {"train_loss": -41.38091278076172, "global_step": 288172, "epoch": 2381} {"train_loss": -42.105831146240234, "global_step": 288173, "epoch": 2381} {"train_loss": -42.078731536865234, "global_step": 288174, "epoch": 2381} {"train_loss": -42.31201171875, "global_step": 288175, "epoch": 2381} {"train_loss": -42.3358154296875, "global_step": 288176, "epoch": 2381} {"train_loss": -41.53702926635742, "global_step": 288177, "epoch": 2381} {"train_loss": -41.39825439453125, "global_step": 288178, "epoch": 2381} {"train_loss": -42.72880935668945, "global_step": 288179, "epoch": 2381} {"train_loss": -42.60641098022461, "global_step": 288180, "epoch": 2381} {"train_loss": -42.39470291137695, "global_step": 288181, "epoch": 2381} {"train_loss": -42.75996780395508, "global_step": 288182, "epoch": 2381} {"train_loss": -42.15009689331055, "global_step": 288183, "epoch": 2381} {"train_loss": -41.9052619934082, "global_step": 288184, "epoch": 2381} {"train_loss": -43.350196838378906, "global_step": 288185, "epoch": 2381} {"train_loss": -42.694759368896484, "global_step": 288186, "epoch": 2381} {"train_loss": -41.239662170410156, "global_step": 288187, "epoch": 2381} {"train_loss": -42.07179641723633, "global_step": 288188, "epoch": 2381} {"train_loss": -42.17734909057617, "global_step": 288189, "epoch": 2381} {"train_loss": -42.22519302368164, "global_step": 288190, "epoch": 2381} {"train_loss": -42.85108184814453, "global_step": 288191, "epoch": 2381} {"train_loss": -42.475337982177734, "global_step": 288192, "epoch": 2381} {"train_loss": -42.205726623535156, "global_step": 288193, "epoch": 2381} {"train_loss": -41.88662338256836, "global_step": 288194, "epoch": 2381} {"train_loss": -43.23752212524414, "global_step": 288195, "epoch": 2381} {"train_loss": -42.35469436645508, "global_step": 288196, "epoch": 2381} {"train_loss": -42.86245346069336, "global_step": 288197, "epoch": 2381} {"train_loss": -42.99420928955078, "global_step": 288198, "epoch": 2381} {"train_loss": -43.204254150390625, "global_step": 288199, "epoch": 2381} {"train_loss": -42.62677001953125, "global_step": 288200, "epoch": 2381} {"train_loss": -42.34043502807617, "global_step": 288201, "epoch": 2381} {"train_loss": -42.82578659057617, "global_step": 288202, "epoch": 2381} {"train_loss": -42.34117126464844, "global_step": 288203, "epoch": 2381} {"train_loss": -41.86982727050781, "global_step": 288204, "epoch": 2381} {"train_loss": -42.639461517333984, "global_step": 288205, "epoch": 2381} {"train_loss": -42.968441009521484, "global_step": 288206, "epoch": 2381} {"train_loss": -43.006221771240234, "global_step": 288207, "epoch": 2381} {"train_loss": -43.32802963256836, "global_step": 288208, "epoch": 2381} {"train_loss": -41.705223083496094, "global_step": 288209, "epoch": 2381} {"train_loss": -42.302608489990234, "global_step": 288210, "epoch": 2381} {"train_loss": -41.818660736083984, "global_step": 288211, "epoch": 2381} {"train_loss": -42.94196701049805, "global_step": 288212, "epoch": 2381} {"train_loss": -42.63166427612305, "global_step": 288213, "epoch": 2381} {"train_loss": -41.42424392700195, "global_step": 288214, "epoch": 2381} {"train_loss": -42.4697151184082, "global_step": 288215, "epoch": 2381} {"train_loss": -41.3577880859375, "global_step": 288216, "epoch": 2381} {"train_loss": -41.58622360229492, "global_step": 288217, "epoch": 2381} {"train_loss": -42.111534118652344, "global_step": 288218, "epoch": 2381} {"train_loss": -42.28408432006836, "global_step": 288219, "epoch": 2381} {"train_loss": -40.7802848815918, "global_step": 288220, "epoch": 2381} {"train_loss": -41.707924992584985, "global_step": 288221, "epoch": 2381, "val_loss": 2397864.5} {"train_loss": -41.956817626953125, "global_step": 288222, "epoch": 2382} {"train_loss": -41.858646392822266, "global_step": 288223, "epoch": 2382} {"train_loss": -41.73634719848633, "global_step": 288224, "epoch": 2382} {"train_loss": -39.70056915283203, "global_step": 288225, "epoch": 2382} {"train_loss": -39.296417236328125, "global_step": 288226, "epoch": 2382} {"train_loss": -40.9390869140625, "global_step": 288227, "epoch": 2382} {"train_loss": -39.71601104736328, "global_step": 288228, "epoch": 2382} {"train_loss": -41.367855072021484, "global_step": 288229, "epoch": 2382} {"train_loss": -39.459129333496094, "global_step": 288230, "epoch": 2382} {"train_loss": -40.34954833984375, "global_step": 288231, "epoch": 2382} {"train_loss": -41.272586822509766, "global_step": 288232, "epoch": 2382} {"train_loss": -42.072147369384766, "global_step": 288233, "epoch": 2382} {"train_loss": -41.05698776245117, "global_step": 288234, "epoch": 2382} {"train_loss": -41.1187744140625, "global_step": 288235, "epoch": 2382} {"train_loss": -37.224483489990234, "global_step": 288236, "epoch": 2382} {"train_loss": -37.91769027709961, "global_step": 288237, "epoch": 2382} {"train_loss": -41.60044479370117, "global_step": 288238, "epoch": 2382} {"train_loss": -41.122657775878906, "global_step": 288239, "epoch": 2382} {"train_loss": -40.19867706298828, "global_step": 288240, "epoch": 2382} {"train_loss": -40.549312591552734, "global_step": 288241, "epoch": 2382} {"train_loss": -41.67753219604492, "global_step": 288242, "epoch": 2382} {"train_loss": -39.681461334228516, "global_step": 288243, "epoch": 2382} {"train_loss": -41.34487533569336, "global_step": 288244, "epoch": 2382} {"train_loss": -38.14255905151367, "global_step": 288245, "epoch": 2382} {"train_loss": -41.96658706665039, "global_step": 288246, "epoch": 2382} {"train_loss": -41.26186752319336, "global_step": 288247, "epoch": 2382} {"train_loss": -42.16022491455078, "global_step": 288248, "epoch": 2382} {"train_loss": -41.305904388427734, "global_step": 288249, "epoch": 2382} {"train_loss": -35.884578704833984, "global_step": 288250, "epoch": 2382} {"train_loss": -42.029014587402344, "global_step": 288251, "epoch": 2382} {"train_loss": -39.7162971496582, "global_step": 288252, "epoch": 2382} {"train_loss": -40.92402648925781, "global_step": 288253, "epoch": 2382} {"train_loss": -39.708492279052734, "global_step": 288254, "epoch": 2382} {"train_loss": -40.60699462890625, "global_step": 288255, "epoch": 2382} {"train_loss": -41.84391784667969, "global_step": 288256, "epoch": 2382} {"train_loss": -41.71554946899414, "global_step": 288257, "epoch": 2382} {"train_loss": -41.29462814331055, "global_step": 288258, "epoch": 2382} {"train_loss": -41.591732025146484, "global_step": 288259, "epoch": 2382} {"train_loss": -41.95209503173828, "global_step": 288260, "epoch": 2382} {"train_loss": -41.67247772216797, "global_step": 288261, "epoch": 2382} {"train_loss": -41.7698860168457, "global_step": 288262, "epoch": 2382} {"train_loss": -42.351783752441406, "global_step": 288263, "epoch": 2382} {"train_loss": -41.70026779174805, "global_step": 288264, "epoch": 2382} {"train_loss": -40.73444366455078, "global_step": 288265, "epoch": 2382} {"train_loss": -41.99978256225586, "global_step": 288266, "epoch": 2382} {"train_loss": -41.107112884521484, "global_step": 288267, "epoch": 2382} {"train_loss": -42.32035446166992, "global_step": 288268, "epoch": 2382} {"train_loss": -41.93486022949219, "global_step": 288269, "epoch": 2382} {"train_loss": -40.946075439453125, "global_step": 288270, "epoch": 2382} {"train_loss": -41.9289436340332, "global_step": 288271, "epoch": 2382} {"train_loss": -42.6151008605957, "global_step": 288272, "epoch": 2382} {"train_loss": -41.95104217529297, "global_step": 288273, "epoch": 2382} {"train_loss": -42.81757736206055, "global_step": 288274, "epoch": 2382} {"train_loss": -42.699073791503906, "global_step": 288275, "epoch": 2382} {"train_loss": -41.76154327392578, "global_step": 288276, "epoch": 2382} {"train_loss": -42.33274841308594, "global_step": 288277, "epoch": 2382} {"train_loss": -42.09142303466797, "global_step": 288278, "epoch": 2382} {"train_loss": -41.999324798583984, "global_step": 288279, "epoch": 2382} {"train_loss": -41.78253173828125, "global_step": 288280, "epoch": 2382} {"train_loss": -42.15972900390625, "global_step": 288281, "epoch": 2382} {"train_loss": -41.206172943115234, "global_step": 288282, "epoch": 2382} {"train_loss": -43.088356018066406, "global_step": 288283, "epoch": 2382} {"train_loss": -42.66268539428711, "global_step": 288284, "epoch": 2382} {"train_loss": -40.791812896728516, "global_step": 288285, "epoch": 2382} {"train_loss": -41.88607406616211, "global_step": 288286, "epoch": 2382} {"train_loss": -42.108333587646484, "global_step": 288287, "epoch": 2382} {"train_loss": -42.37126922607422, "global_step": 288288, "epoch": 2382} {"train_loss": -42.29806137084961, "global_step": 288289, "epoch": 2382} {"train_loss": -42.96270751953125, "global_step": 288290, "epoch": 2382} {"train_loss": -40.8934211730957, "global_step": 288291, "epoch": 2382} {"train_loss": -42.2803955078125, "global_step": 288292, "epoch": 2382} {"train_loss": -42.189208984375, "global_step": 288293, "epoch": 2382} {"train_loss": -41.3848991394043, "global_step": 288294, "epoch": 2382} {"train_loss": -41.02394485473633, "global_step": 288295, "epoch": 2382} {"train_loss": -43.20220947265625, "global_step": 288296, "epoch": 2382} {"train_loss": -42.27950668334961, "global_step": 288297, "epoch": 2382} {"train_loss": -42.2470817565918, "global_step": 288298, "epoch": 2382} {"train_loss": -41.71446228027344, "global_step": 288299, "epoch": 2382} {"train_loss": -42.29970932006836, "global_step": 288300, "epoch": 2382} {"train_loss": -42.553688049316406, "global_step": 288301, "epoch": 2382} {"train_loss": -42.35938262939453, "global_step": 288302, "epoch": 2382} {"train_loss": -41.108001708984375, "global_step": 288303, "epoch": 2382} {"train_loss": -42.636287689208984, "global_step": 288304, "epoch": 2382} {"train_loss": -42.787715911865234, "global_step": 288305, "epoch": 2382} {"train_loss": -42.0522575378418, "global_step": 288306, "epoch": 2382} {"train_loss": -43.16550827026367, "global_step": 288307, "epoch": 2382} {"train_loss": -41.61720657348633, "global_step": 288308, "epoch": 2382} {"train_loss": -40.8134651184082, "global_step": 288309, "epoch": 2382} {"train_loss": -42.85372543334961, "global_step": 288310, "epoch": 2382} {"train_loss": -42.58810043334961, "global_step": 288311, "epoch": 2382} {"train_loss": -39.26310348510742, "global_step": 288312, "epoch": 2382} {"train_loss": -42.50989532470703, "global_step": 288313, "epoch": 2382} {"train_loss": -41.8520622253418, "global_step": 288314, "epoch": 2382} {"train_loss": -42.76738357543945, "global_step": 288315, "epoch": 2382} {"train_loss": -40.65182113647461, "global_step": 288316, "epoch": 2382} {"train_loss": -42.80288314819336, "global_step": 288317, "epoch": 2382} {"train_loss": -42.76111602783203, "global_step": 288318, "epoch": 2382} {"train_loss": -42.26482009887695, "global_step": 288319, "epoch": 2382} {"train_loss": -41.9008903503418, "global_step": 288320, "epoch": 2382} {"train_loss": -42.86307907104492, "global_step": 288321, "epoch": 2382} {"train_loss": -42.51769256591797, "global_step": 288322, "epoch": 2382} {"train_loss": -42.01959991455078, "global_step": 288323, "epoch": 2382} {"train_loss": -42.30388641357422, "global_step": 288324, "epoch": 2382} {"train_loss": -42.40444564819336, "global_step": 288325, "epoch": 2382} {"train_loss": -43.00533676147461, "global_step": 288326, "epoch": 2382} {"train_loss": -42.68681335449219, "global_step": 288327, "epoch": 2382} {"train_loss": -42.61866760253906, "global_step": 288328, "epoch": 2382} {"train_loss": -42.18142318725586, "global_step": 288329, "epoch": 2382} {"train_loss": -42.31651306152344, "global_step": 288330, "epoch": 2382} {"train_loss": -42.53001022338867, "global_step": 288331, "epoch": 2382} {"train_loss": -42.75056838989258, "global_step": 288332, "epoch": 2382} {"train_loss": -43.29863357543945, "global_step": 288333, "epoch": 2382} {"train_loss": -41.6845588684082, "global_step": 288334, "epoch": 2382} {"train_loss": -42.78237533569336, "global_step": 288335, "epoch": 2382} {"train_loss": -42.422119140625, "global_step": 288336, "epoch": 2382} {"train_loss": -42.76727294921875, "global_step": 288337, "epoch": 2382} {"train_loss": -42.45066452026367, "global_step": 288338, "epoch": 2382} {"train_loss": -42.51325988769531, "global_step": 288339, "epoch": 2382} {"train_loss": -42.50822830200195, "global_step": 288340, "epoch": 2382} {"train_loss": -43.0892333984375, "global_step": 288341, "epoch": 2382} {"train_loss": -41.67398903586648, "global_step": 288342, "epoch": 2382, "val_loss": 2450624.75} {"train_loss": -42.805049896240234, "global_step": 288343, "epoch": 2383} {"train_loss": -43.04057693481445, "global_step": 288344, "epoch": 2383} {"train_loss": -43.16596221923828, "global_step": 288345, "epoch": 2383} {"train_loss": -43.71284103393555, "global_step": 288346, "epoch": 2383} {"train_loss": -42.238990783691406, "global_step": 288347, "epoch": 2383} {"train_loss": -40.98053741455078, "global_step": 288348, "epoch": 2383} {"train_loss": -42.3448371887207, "global_step": 288349, "epoch": 2383} {"train_loss": -42.862335205078125, "global_step": 288350, "epoch": 2383} {"train_loss": -43.13533401489258, "global_step": 288351, "epoch": 2383} {"train_loss": -40.51436996459961, "global_step": 288352, "epoch": 2383} {"train_loss": -39.658447265625, "global_step": 288353, "epoch": 2383} {"train_loss": -40.837432861328125, "global_step": 288354, "epoch": 2383} {"train_loss": -42.313720703125, "global_step": 288355, "epoch": 2383} {"train_loss": -42.4952507019043, "global_step": 288356, "epoch": 2383} {"train_loss": -40.36309814453125, "global_step": 288357, "epoch": 2383} {"train_loss": -41.14225769042969, "global_step": 288358, "epoch": 2383} {"train_loss": -42.0591926574707, "global_step": 288359, "epoch": 2383} {"train_loss": -41.426185607910156, "global_step": 288360, "epoch": 2383} {"train_loss": -41.57064437866211, "global_step": 288361, "epoch": 2383} {"train_loss": -42.41200637817383, "global_step": 288362, "epoch": 2383} {"train_loss": -41.00170135498047, "global_step": 288363, "epoch": 2383} {"train_loss": -39.60633087158203, "global_step": 288364, "epoch": 2383} {"train_loss": -39.29681396484375, "global_step": 288365, "epoch": 2383} {"train_loss": -41.08742904663086, "global_step": 288366, "epoch": 2383} {"train_loss": -38.950592041015625, "global_step": 288367, "epoch": 2383} {"train_loss": -40.15388107299805, "global_step": 288368, "epoch": 2383} {"train_loss": -41.29656982421875, "global_step": 288369, "epoch": 2383} {"train_loss": -40.741920471191406, "global_step": 288370, "epoch": 2383} {"train_loss": -41.773681640625, "global_step": 288371, "epoch": 2383} {"train_loss": -42.14741134643555, "global_step": 288372, "epoch": 2383} {"train_loss": -41.52843475341797, "global_step": 288373, "epoch": 2383} {"train_loss": -42.88300704956055, "global_step": 288374, "epoch": 2383} {"train_loss": -42.53157043457031, "global_step": 288375, "epoch": 2383} {"train_loss": -40.90645217895508, "global_step": 288376, "epoch": 2383} {"train_loss": -42.50297164916992, "global_step": 288377, "epoch": 2383} {"train_loss": -41.13189697265625, "global_step": 288378, "epoch": 2383} {"train_loss": -42.47140121459961, "global_step": 288379, "epoch": 2383} {"train_loss": -41.40013122558594, "global_step": 288380, "epoch": 2383} {"train_loss": -42.44589614868164, "global_step": 288381, "epoch": 2383} {"train_loss": -41.632667541503906, "global_step": 288382, "epoch": 2383} {"train_loss": -41.89057540893555, "global_step": 288383, "epoch": 2383} {"train_loss": -41.49763107299805, "global_step": 288384, "epoch": 2383} {"train_loss": -41.39820098876953, "global_step": 288385, "epoch": 2383} {"train_loss": -41.416561126708984, "global_step": 288386, "epoch": 2383} {"train_loss": -41.77044677734375, "global_step": 288387, "epoch": 2383} {"train_loss": -41.434444427490234, "global_step": 288388, "epoch": 2383} {"train_loss": -42.488643646240234, "global_step": 288389, "epoch": 2383} {"train_loss": -41.88424301147461, "global_step": 288390, "epoch": 2383} {"train_loss": -42.191890716552734, "global_step": 288391, "epoch": 2383} {"train_loss": -42.05091857910156, "global_step": 288392, "epoch": 2383} {"train_loss": -40.834510803222656, "global_step": 288393, "epoch": 2383} {"train_loss": -42.84434127807617, "global_step": 288394, "epoch": 2383} {"train_loss": -42.62142562866211, "global_step": 288395, "epoch": 2383} {"train_loss": -41.46425247192383, "global_step": 288396, "epoch": 2383} {"train_loss": -43.119815826416016, "global_step": 288397, "epoch": 2383} {"train_loss": -42.46486282348633, "global_step": 288398, "epoch": 2383} {"train_loss": -42.726409912109375, "global_step": 288399, "epoch": 2383} {"train_loss": -43.16192626953125, "global_step": 288400, "epoch": 2383} {"train_loss": -42.394020080566406, "global_step": 288401, "epoch": 2383} {"train_loss": -42.93571472167969, "global_step": 288402, "epoch": 2383} {"train_loss": -42.54200744628906, "global_step": 288403, "epoch": 2383} {"train_loss": -43.148860931396484, "global_step": 288404, "epoch": 2383} {"train_loss": -43.03845977783203, "global_step": 288405, "epoch": 2383} {"train_loss": -42.933963775634766, "global_step": 288406, "epoch": 2383} {"train_loss": -42.8223876953125, "global_step": 288407, "epoch": 2383} {"train_loss": -43.04731369018555, "global_step": 288408, "epoch": 2383} {"train_loss": -43.60329055786133, "global_step": 288409, "epoch": 2383} {"train_loss": -43.28458023071289, "global_step": 288410, "epoch": 2383} {"train_loss": -43.271053314208984, "global_step": 288411, "epoch": 2383} {"train_loss": -43.01723098754883, "global_step": 288412, "epoch": 2383} {"train_loss": -43.41159439086914, "global_step": 288413, "epoch": 2383} {"train_loss": -43.10403060913086, "global_step": 288414, "epoch": 2383} {"train_loss": -42.45682907104492, "global_step": 288415, "epoch": 2383} {"train_loss": -43.39264678955078, "global_step": 288416, "epoch": 2383} {"train_loss": -42.847843170166016, "global_step": 288417, "epoch": 2383} {"train_loss": -43.112762451171875, "global_step": 288418, "epoch": 2383} {"train_loss": -43.8881950378418, "global_step": 288419, "epoch": 2383} {"train_loss": -43.07039260864258, "global_step": 288420, "epoch": 2383} {"train_loss": -43.8990592956543, "global_step": 288421, "epoch": 2383} {"train_loss": -43.14864730834961, "global_step": 288422, "epoch": 2383} {"train_loss": -43.642337799072266, "global_step": 288423, "epoch": 2383} {"train_loss": -43.5828971862793, "global_step": 288424, "epoch": 2383} {"train_loss": -43.14460372924805, "global_step": 288425, "epoch": 2383} {"train_loss": -42.962764739990234, "global_step": 288426, "epoch": 2383} {"train_loss": -43.01392364501953, "global_step": 288427, "epoch": 2383} {"train_loss": -43.114742279052734, "global_step": 288428, "epoch": 2383} {"train_loss": -43.13238525390625, "global_step": 288429, "epoch": 2383} {"train_loss": -43.62919998168945, "global_step": 288430, "epoch": 2383} {"train_loss": -44.115638732910156, "global_step": 288431, "epoch": 2383} {"train_loss": -39.8302116394043, "global_step": 288432, "epoch": 2383} {"train_loss": -43.570526123046875, "global_step": 288433, "epoch": 2383} {"train_loss": -43.88919448852539, "global_step": 288434, "epoch": 2383} {"train_loss": -43.27070236206055, "global_step": 288435, "epoch": 2383} {"train_loss": -43.15876007080078, "global_step": 288436, "epoch": 2383} {"train_loss": -43.617469787597656, "global_step": 288437, "epoch": 2383} {"train_loss": -43.45157241821289, "global_step": 288438, "epoch": 2383} {"train_loss": -42.7132453918457, "global_step": 288439, "epoch": 2383} {"train_loss": -41.445003509521484, "global_step": 288440, "epoch": 2383} {"train_loss": -42.12130355834961, "global_step": 288441, "epoch": 2383} {"train_loss": -42.65847396850586, "global_step": 288442, "epoch": 2383} {"train_loss": -43.74366760253906, "global_step": 288443, "epoch": 2383} {"train_loss": -42.065834045410156, "global_step": 288444, "epoch": 2383} {"train_loss": -41.831172943115234, "global_step": 288445, "epoch": 2383} {"train_loss": -42.273860931396484, "global_step": 288446, "epoch": 2383} {"train_loss": -43.161231994628906, "global_step": 288447, "epoch": 2383} {"train_loss": -43.112464904785156, "global_step": 288448, "epoch": 2383} {"train_loss": -43.05460739135742, "global_step": 288449, "epoch": 2383} {"train_loss": -43.40988540649414, "global_step": 288450, "epoch": 2383} {"train_loss": -43.22550964355469, "global_step": 288451, "epoch": 2383} {"train_loss": -43.815765380859375, "global_step": 288452, "epoch": 2383} {"train_loss": -43.22208786010742, "global_step": 288453, "epoch": 2383} {"train_loss": -43.15485763549805, "global_step": 288454, "epoch": 2383} {"train_loss": -43.23117446899414, "global_step": 288455, "epoch": 2383} {"train_loss": -43.359222412109375, "global_step": 288456, "epoch": 2383} {"train_loss": -43.472049713134766, "global_step": 288457, "epoch": 2383} {"train_loss": -44.02880859375, "global_step": 288458, "epoch": 2383} {"train_loss": -43.34467697143555, "global_step": 288459, "epoch": 2383} {"train_loss": -42.428382873535156, "global_step": 288460, "epoch": 2383} {"train_loss": -43.18744659423828, "global_step": 288461, "epoch": 2383} {"train_loss": -43.24784469604492, "global_step": 288462, "epoch": 2383} {"train_loss": -42.443090391553135, "global_step": 288463, "epoch": 2383, "val_loss": 2410516.75} {"train_loss": -41.9888801574707, "global_step": 288464, "epoch": 2384} {"train_loss": -42.12408447265625, "global_step": 288465, "epoch": 2384} {"train_loss": -43.003108978271484, "global_step": 288466, "epoch": 2384} {"train_loss": -39.947662353515625, "global_step": 288467, "epoch": 2384} {"train_loss": -36.066280364990234, "global_step": 288468, "epoch": 2384} {"train_loss": -39.117984771728516, "global_step": 288469, "epoch": 2384} {"train_loss": -40.49302291870117, "global_step": 288470, "epoch": 2384} {"train_loss": -40.028663635253906, "global_step": 288471, "epoch": 2384} {"train_loss": -40.6593132019043, "global_step": 288472, "epoch": 2384} {"train_loss": -34.45452880859375, "global_step": 288473, "epoch": 2384} {"train_loss": -40.433685302734375, "global_step": 288474, "epoch": 2384} {"train_loss": -36.68838119506836, "global_step": 288475, "epoch": 2384} {"train_loss": -39.229766845703125, "global_step": 288476, "epoch": 2384} {"train_loss": -40.30979919433594, "global_step": 288477, "epoch": 2384} {"train_loss": -37.60203170776367, "global_step": 288478, "epoch": 2384} {"train_loss": -41.353424072265625, "global_step": 288479, "epoch": 2384} {"train_loss": -37.760433197021484, "global_step": 288480, "epoch": 2384} {"train_loss": -41.47197723388672, "global_step": 288481, "epoch": 2384} {"train_loss": -39.74617385864258, "global_step": 288482, "epoch": 2384} {"train_loss": -41.86079788208008, "global_step": 288483, "epoch": 2384} {"train_loss": -39.20655822753906, "global_step": 288484, "epoch": 2384} {"train_loss": -42.290706634521484, "global_step": 288485, "epoch": 2384} {"train_loss": -41.08155059814453, "global_step": 288486, "epoch": 2384} {"train_loss": -41.7022819519043, "global_step": 288487, "epoch": 2384} {"train_loss": -41.54661178588867, "global_step": 288488, "epoch": 2384} {"train_loss": -41.3765983581543, "global_step": 288489, "epoch": 2384} {"train_loss": -42.46644592285156, "global_step": 288490, "epoch": 2384} {"train_loss": -41.583072662353516, "global_step": 288491, "epoch": 2384} {"train_loss": -42.606781005859375, "global_step": 288492, "epoch": 2384} {"train_loss": -41.37348937988281, "global_step": 288493, "epoch": 2384} {"train_loss": -42.44913864135742, "global_step": 288494, "epoch": 2384} {"train_loss": -42.55465316772461, "global_step": 288495, "epoch": 2384} {"train_loss": -41.817657470703125, "global_step": 288496, "epoch": 2384} {"train_loss": -42.9815559387207, "global_step": 288497, "epoch": 2384} {"train_loss": -42.27954864501953, "global_step": 288498, "epoch": 2384} {"train_loss": -42.30062484741211, "global_step": 288499, "epoch": 2384} {"train_loss": -42.3956413269043, "global_step": 288500, "epoch": 2384} {"train_loss": -42.84763717651367, "global_step": 288501, "epoch": 2384} {"train_loss": -42.49365234375, "global_step": 288502, "epoch": 2384} {"train_loss": -42.76922607421875, "global_step": 288503, "epoch": 2384} {"train_loss": -41.09185791015625, "global_step": 288504, "epoch": 2384} {"train_loss": -42.68418502807617, "global_step": 288505, "epoch": 2384} {"train_loss": -42.236610412597656, "global_step": 288506, "epoch": 2384} {"train_loss": -42.82265090942383, "global_step": 288507, "epoch": 2384} {"train_loss": -42.77995300292969, "global_step": 288508, "epoch": 2384} {"train_loss": -42.586177825927734, "global_step": 288509, "epoch": 2384} {"train_loss": -42.88416290283203, "global_step": 288510, "epoch": 2384} {"train_loss": -42.57036209106445, "global_step": 288511, "epoch": 2384} {"train_loss": -42.63526916503906, "global_step": 288512, "epoch": 2384} {"train_loss": -40.962364196777344, "global_step": 288513, "epoch": 2384} {"train_loss": -43.05105209350586, "global_step": 288514, "epoch": 2384} {"train_loss": -43.005245208740234, "global_step": 288515, "epoch": 2384} {"train_loss": -42.73781204223633, "global_step": 288516, "epoch": 2384} {"train_loss": -42.8344612121582, "global_step": 288517, "epoch": 2384} {"train_loss": -43.304412841796875, "global_step": 288518, "epoch": 2384} {"train_loss": -42.83219528198242, "global_step": 288519, "epoch": 2384} {"train_loss": -42.8907470703125, "global_step": 288520, "epoch": 2384} {"train_loss": -42.89194869995117, "global_step": 288521, "epoch": 2384} {"train_loss": -43.346317291259766, "global_step": 288522, "epoch": 2384} {"train_loss": -43.38026809692383, "global_step": 288523, "epoch": 2384} {"train_loss": -43.135921478271484, "global_step": 288524, "epoch": 2384} {"train_loss": -43.080413818359375, "global_step": 288525, "epoch": 2384} {"train_loss": -42.57533645629883, "global_step": 288526, "epoch": 2384} {"train_loss": -43.50336837768555, "global_step": 288527, "epoch": 2384} {"train_loss": -42.86617660522461, "global_step": 288528, "epoch": 2384} {"train_loss": -42.655513763427734, "global_step": 288529, "epoch": 2384} {"train_loss": -43.4645881652832, "global_step": 288530, "epoch": 2384} {"train_loss": -42.679073333740234, "global_step": 288531, "epoch": 2384} {"train_loss": -42.491607666015625, "global_step": 288532, "epoch": 2384} {"train_loss": -40.876495361328125, "global_step": 288533, "epoch": 2384} {"train_loss": -40.51328659057617, "global_step": 288534, "epoch": 2384} {"train_loss": -42.99186325073242, "global_step": 288535, "epoch": 2384} {"train_loss": -41.87201690673828, "global_step": 288536, "epoch": 2384} {"train_loss": -41.10102081298828, "global_step": 288537, "epoch": 2384} {"train_loss": -38.6280403137207, "global_step": 288538, "epoch": 2384} {"train_loss": -42.1871452331543, "global_step": 288539, "epoch": 2384} {"train_loss": -41.56132888793945, "global_step": 288540, "epoch": 2384} {"train_loss": -39.89120101928711, "global_step": 288541, "epoch": 2384} {"train_loss": -39.43303298950195, "global_step": 288542, "epoch": 2384} {"train_loss": -41.70426559448242, "global_step": 288543, "epoch": 2384} {"train_loss": -40.45347595214844, "global_step": 288544, "epoch": 2384} {"train_loss": -39.473445892333984, "global_step": 288545, "epoch": 2384} {"train_loss": -42.184326171875, "global_step": 288546, "epoch": 2384} {"train_loss": -41.13136291503906, "global_step": 288547, "epoch": 2384} {"train_loss": -42.18096923828125, "global_step": 288548, "epoch": 2384} {"train_loss": -42.27220916748047, "global_step": 288549, "epoch": 2384} {"train_loss": -41.936859130859375, "global_step": 288550, "epoch": 2384} {"train_loss": -42.78828811645508, "global_step": 288551, "epoch": 2384} {"train_loss": -42.616424560546875, "global_step": 288552, "epoch": 2384} {"train_loss": -41.8375129699707, "global_step": 288553, "epoch": 2384} {"train_loss": -43.085731506347656, "global_step": 288554, "epoch": 2384} {"train_loss": -42.34086227416992, "global_step": 288555, "epoch": 2384} {"train_loss": -42.833740234375, "global_step": 288556, "epoch": 2384} {"train_loss": -42.822532653808594, "global_step": 288557, "epoch": 2384} {"train_loss": -42.260475158691406, "global_step": 288558, "epoch": 2384} {"train_loss": -42.95768356323242, "global_step": 288559, "epoch": 2384} {"train_loss": -42.800472259521484, "global_step": 288560, "epoch": 2384} {"train_loss": -43.24778747558594, "global_step": 288561, "epoch": 2384} {"train_loss": -42.646331787109375, "global_step": 288562, "epoch": 2384} {"train_loss": -43.43300247192383, "global_step": 288563, "epoch": 2384} {"train_loss": -43.42055892944336, "global_step": 288564, "epoch": 2384} {"train_loss": -43.000953674316406, "global_step": 288565, "epoch": 2384} {"train_loss": -43.564735412597656, "global_step": 288566, "epoch": 2384} {"train_loss": -43.4532585144043, "global_step": 288567, "epoch": 2384} {"train_loss": -43.16562271118164, "global_step": 288568, "epoch": 2384} {"train_loss": -43.16375732421875, "global_step": 288569, "epoch": 2384} {"train_loss": -43.64832305908203, "global_step": 288570, "epoch": 2384} {"train_loss": -43.322566986083984, "global_step": 288571, "epoch": 2384} {"train_loss": -43.56439208984375, "global_step": 288572, "epoch": 2384} {"train_loss": -43.734947204589844, "global_step": 288573, "epoch": 2384} {"train_loss": -43.724300384521484, "global_step": 288574, "epoch": 2384} {"train_loss": -43.620723724365234, "global_step": 288575, "epoch": 2384} {"train_loss": -44.0874137878418, "global_step": 288576, "epoch": 2384} {"train_loss": -44.12749099731445, "global_step": 288577, "epoch": 2384} {"train_loss": -43.303279876708984, "global_step": 288578, "epoch": 2384} {"train_loss": -43.60797119140625, "global_step": 288579, "epoch": 2384} {"train_loss": -43.44658279418945, "global_step": 288580, "epoch": 2384} {"train_loss": -43.01643753051758, "global_step": 288581, "epoch": 2384} {"train_loss": -43.821041107177734, "global_step": 288582, "epoch": 2384} {"train_loss": -44.18960189819336, "global_step": 288583, "epoch": 2384} {"train_loss": -42.02699979671762, "global_step": 288584, "epoch": 2384, "val_loss": 2434830.25} {"train_loss": -43.24443435668945, "global_step": 288585, "epoch": 2385} {"train_loss": -43.57612228393555, "global_step": 288586, "epoch": 2385} {"train_loss": -43.431331634521484, "global_step": 288587, "epoch": 2385} {"train_loss": -43.848751068115234, "global_step": 288588, "epoch": 2385} {"train_loss": -44.028255462646484, "global_step": 288589, "epoch": 2385} {"train_loss": -43.8716926574707, "global_step": 288590, "epoch": 2385} {"train_loss": -44.07319259643555, "global_step": 288591, "epoch": 2385} {"train_loss": -43.78635025024414, "global_step": 288592, "epoch": 2385} {"train_loss": -43.51760482788086, "global_step": 288593, "epoch": 2385} {"train_loss": -43.47098922729492, "global_step": 288594, "epoch": 2385} {"train_loss": -43.8662223815918, "global_step": 288595, "epoch": 2385} {"train_loss": -43.42191696166992, "global_step": 288596, "epoch": 2385} {"train_loss": -43.74703598022461, "global_step": 288597, "epoch": 2385} {"train_loss": -43.928070068359375, "global_step": 288598, "epoch": 2385} {"train_loss": -43.62611770629883, "global_step": 288599, "epoch": 2385} {"train_loss": -43.821006774902344, "global_step": 288600, "epoch": 2385} {"train_loss": -43.87934494018555, "global_step": 288601, "epoch": 2385} {"train_loss": -43.96546173095703, "global_step": 288602, "epoch": 2385} {"train_loss": -44.1299934387207, "global_step": 288603, "epoch": 2385} {"train_loss": -44.196224212646484, "global_step": 288604, "epoch": 2385} {"train_loss": -44.04965591430664, "global_step": 288605, "epoch": 2385} {"train_loss": -44.59608840942383, "global_step": 288606, "epoch": 2385} {"train_loss": -44.19350051879883, "global_step": 288607, "epoch": 2385} {"train_loss": -44.124420166015625, "global_step": 288608, "epoch": 2385} {"train_loss": -43.5618896484375, "global_step": 288609, "epoch": 2385} {"train_loss": -43.98749923706055, "global_step": 288610, "epoch": 2385} {"train_loss": -43.56196212768555, "global_step": 288611, "epoch": 2385} {"train_loss": -43.011817932128906, "global_step": 288612, "epoch": 2385} {"train_loss": -40.527587890625, "global_step": 288613, "epoch": 2385} {"train_loss": -35.16866683959961, "global_step": 288614, "epoch": 2385} {"train_loss": -35.8604621887207, "global_step": 288615, "epoch": 2385} {"train_loss": -42.43756866455078, "global_step": 288616, "epoch": 2385} {"train_loss": -41.946632385253906, "global_step": 288617, "epoch": 2385} {"train_loss": -32.51816940307617, "global_step": 288618, "epoch": 2385} {"train_loss": -24.566213607788086, "global_step": 288619, "epoch": 2385} {"train_loss": -30.466215133666992, "global_step": 288620, "epoch": 2385} {"train_loss": -39.710323333740234, "global_step": 288621, "epoch": 2385} {"train_loss": -33.844390869140625, "global_step": 288622, "epoch": 2385} {"train_loss": -38.34918212890625, "global_step": 288623, "epoch": 2385} {"train_loss": -39.936485290527344, "global_step": 288624, "epoch": 2385} {"train_loss": -39.35053634643555, "global_step": 288625, "epoch": 2385} {"train_loss": -42.07558822631836, "global_step": 288626, "epoch": 2385} {"train_loss": -40.45139694213867, "global_step": 288627, "epoch": 2385} {"train_loss": -41.492149353027344, "global_step": 288628, "epoch": 2385} {"train_loss": -41.126216888427734, "global_step": 288629, "epoch": 2385} {"train_loss": -42.8746223449707, "global_step": 288630, "epoch": 2385} {"train_loss": -41.79132080078125, "global_step": 288631, "epoch": 2385} {"train_loss": -42.11538314819336, "global_step": 288632, "epoch": 2385} {"train_loss": -41.73319625854492, "global_step": 288633, "epoch": 2385} {"train_loss": -42.21407699584961, "global_step": 288634, "epoch": 2385} {"train_loss": -41.473995208740234, "global_step": 288635, "epoch": 2385} {"train_loss": -42.77003479003906, "global_step": 288636, "epoch": 2385} {"train_loss": -40.82868194580078, "global_step": 288637, "epoch": 2385} {"train_loss": -42.29557418823242, "global_step": 288638, "epoch": 2385} {"train_loss": -41.048377990722656, "global_step": 288639, "epoch": 2385} {"train_loss": -41.67997360229492, "global_step": 288640, "epoch": 2385} {"train_loss": -42.26856231689453, "global_step": 288641, "epoch": 2385} {"train_loss": -40.99074935913086, "global_step": 288642, "epoch": 2385} {"train_loss": -42.55219650268555, "global_step": 288643, "epoch": 2385} {"train_loss": -40.59079360961914, "global_step": 288644, "epoch": 2385} {"train_loss": -42.4425048828125, "global_step": 288645, "epoch": 2385} {"train_loss": -40.99343490600586, "global_step": 288646, "epoch": 2385} {"train_loss": -40.63019943237305, "global_step": 288647, "epoch": 2385} {"train_loss": -42.15619659423828, "global_step": 288648, "epoch": 2385} {"train_loss": -40.79175567626953, "global_step": 288649, "epoch": 2385} {"train_loss": -43.03965377807617, "global_step": 288650, "epoch": 2385} {"train_loss": -41.32985305786133, "global_step": 288651, "epoch": 2385} {"train_loss": -41.08712387084961, "global_step": 288652, "epoch": 2385} {"train_loss": -42.240840911865234, "global_step": 288653, "epoch": 2385} {"train_loss": -41.11507034301758, "global_step": 288654, "epoch": 2385} {"train_loss": -42.09348678588867, "global_step": 288655, "epoch": 2385} {"train_loss": -42.59608840942383, "global_step": 288656, "epoch": 2385} {"train_loss": -41.983707427978516, "global_step": 288657, "epoch": 2385} {"train_loss": -42.733402252197266, "global_step": 288658, "epoch": 2385} {"train_loss": -42.020320892333984, "global_step": 288659, "epoch": 2385} {"train_loss": -42.918853759765625, "global_step": 288660, "epoch": 2385} {"train_loss": -41.92911911010742, "global_step": 288661, "epoch": 2385} {"train_loss": -41.9259147644043, "global_step": 288662, "epoch": 2385} {"train_loss": -43.226566314697266, "global_step": 288663, "epoch": 2385} {"train_loss": -42.38047409057617, "global_step": 288664, "epoch": 2385} {"train_loss": -42.964210510253906, "global_step": 288665, "epoch": 2385} {"train_loss": -42.9557991027832, "global_step": 288666, "epoch": 2385} {"train_loss": -42.55904006958008, "global_step": 288667, "epoch": 2385} {"train_loss": -43.18503952026367, "global_step": 288668, "epoch": 2385} {"train_loss": -42.92774200439453, "global_step": 288669, "epoch": 2385} {"train_loss": -42.74247360229492, "global_step": 288670, "epoch": 2385} {"train_loss": -43.567596435546875, "global_step": 288671, "epoch": 2385} {"train_loss": -42.37425231933594, "global_step": 288672, "epoch": 2385} {"train_loss": -43.12946701049805, "global_step": 288673, "epoch": 2385} {"train_loss": -43.34870529174805, "global_step": 288674, "epoch": 2385} {"train_loss": -42.62089920043945, "global_step": 288675, "epoch": 2385} {"train_loss": -43.34291076660156, "global_step": 288676, "epoch": 2385} {"train_loss": -43.030757904052734, "global_step": 288677, "epoch": 2385} {"train_loss": -42.40425109863281, "global_step": 288678, "epoch": 2385} {"train_loss": -43.87876510620117, "global_step": 288679, "epoch": 2385} {"train_loss": -43.09520721435547, "global_step": 288680, "epoch": 2385} {"train_loss": -43.48321533203125, "global_step": 288681, "epoch": 2385} {"train_loss": -43.22563171386719, "global_step": 288682, "epoch": 2385} {"train_loss": -43.309051513671875, "global_step": 288683, "epoch": 2385} {"train_loss": -43.85557174682617, "global_step": 288684, "epoch": 2385} {"train_loss": -43.6379280090332, "global_step": 288685, "epoch": 2385} {"train_loss": -43.70632553100586, "global_step": 288686, "epoch": 2385} {"train_loss": -43.65761947631836, "global_step": 288687, "epoch": 2385} {"train_loss": -44.018104553222656, "global_step": 288688, "epoch": 2385} {"train_loss": -43.099365234375, "global_step": 288689, "epoch": 2385} {"train_loss": -43.98143768310547, "global_step": 288690, "epoch": 2385} {"train_loss": -43.3725471496582, "global_step": 288691, "epoch": 2385} {"train_loss": -43.26705551147461, "global_step": 288692, "epoch": 2385} {"train_loss": -43.93838119506836, "global_step": 288693, "epoch": 2385} {"train_loss": -43.611549377441406, "global_step": 288694, "epoch": 2385} {"train_loss": -43.80251693725586, "global_step": 288695, "epoch": 2385} {"train_loss": -43.863304138183594, "global_step": 288696, "epoch": 2385} {"train_loss": -43.36616897583008, "global_step": 288697, "epoch": 2385} {"train_loss": -43.828548431396484, "global_step": 288698, "epoch": 2385} {"train_loss": -43.833717346191406, "global_step": 288699, "epoch": 2385} {"train_loss": -43.951011657714844, "global_step": 288700, "epoch": 2385} {"train_loss": -43.850372314453125, "global_step": 288701, "epoch": 2385} {"train_loss": -44.0374870300293, "global_step": 288702, "epoch": 2385} {"train_loss": -43.90343475341797, "global_step": 288703, "epoch": 2385} {"train_loss": -44.125667572021484, "global_step": 288704, "epoch": 2385} {"train_loss": -42.26890434706507, "global_step": 288705, "epoch": 2385, "val_loss": 2387050.75} {"train_loss": -44.58933639526367, "global_step": 288706, "epoch": 2386} {"train_loss": -44.1044807434082, "global_step": 288707, "epoch": 2386} {"train_loss": -44.04763412475586, "global_step": 288708, "epoch": 2386} {"train_loss": -42.94422149658203, "global_step": 288709, "epoch": 2386} {"train_loss": -42.19808578491211, "global_step": 288710, "epoch": 2386} {"train_loss": -41.70478439331055, "global_step": 288711, "epoch": 2386} {"train_loss": -43.87109375, "global_step": 288712, "epoch": 2386} {"train_loss": -43.72306442260742, "global_step": 288713, "epoch": 2386} {"train_loss": -41.79060363769531, "global_step": 288714, "epoch": 2386} {"train_loss": -39.43642807006836, "global_step": 288715, "epoch": 2386} {"train_loss": -40.02386474609375, "global_step": 288716, "epoch": 2386} {"train_loss": -42.93156051635742, "global_step": 288717, "epoch": 2386} {"train_loss": -43.51703643798828, "global_step": 288718, "epoch": 2386} {"train_loss": -42.07841873168945, "global_step": 288719, "epoch": 2386} {"train_loss": -40.41128158569336, "global_step": 288720, "epoch": 2386} {"train_loss": -42.82876205444336, "global_step": 288721, "epoch": 2386} {"train_loss": -43.416481018066406, "global_step": 288722, "epoch": 2386} {"train_loss": -43.04246139526367, "global_step": 288723, "epoch": 2386} {"train_loss": -43.716278076171875, "global_step": 288724, "epoch": 2386} {"train_loss": -42.91624069213867, "global_step": 288725, "epoch": 2386} {"train_loss": -43.17368698120117, "global_step": 288726, "epoch": 2386} {"train_loss": -43.61936569213867, "global_step": 288727, "epoch": 2386} {"train_loss": -43.28732681274414, "global_step": 288728, "epoch": 2386} {"train_loss": -42.07313919067383, "global_step": 288729, "epoch": 2386} {"train_loss": -43.118648529052734, "global_step": 288730, "epoch": 2386} {"train_loss": -42.156124114990234, "global_step": 288731, "epoch": 2386} {"train_loss": -42.07085418701172, "global_step": 288732, "epoch": 2386} {"train_loss": -42.813385009765625, "global_step": 288733, "epoch": 2386} {"train_loss": -42.40802001953125, "global_step": 288734, "epoch": 2386} {"train_loss": -43.080020904541016, "global_step": 288735, "epoch": 2386} {"train_loss": -42.87437057495117, "global_step": 288736, "epoch": 2386} {"train_loss": -42.700706481933594, "global_step": 288737, "epoch": 2386} {"train_loss": -43.06763458251953, "global_step": 288738, "epoch": 2386} {"train_loss": -42.07904052734375, "global_step": 288739, "epoch": 2386} {"train_loss": -42.19862747192383, "global_step": 288740, "epoch": 2386} {"train_loss": -42.32160568237305, "global_step": 288741, "epoch": 2386} {"train_loss": -42.842323303222656, "global_step": 288742, "epoch": 2386} {"train_loss": -42.72119140625, "global_step": 288743, "epoch": 2386} {"train_loss": -43.05608367919922, "global_step": 288744, "epoch": 2386} {"train_loss": -41.373779296875, "global_step": 288745, "epoch": 2386} {"train_loss": -41.088722229003906, "global_step": 288746, "epoch": 2386} {"train_loss": -39.19561767578125, "global_step": 288747, "epoch": 2386} {"train_loss": -41.9797248840332, "global_step": 288748, "epoch": 2386} {"train_loss": -38.71662139892578, "global_step": 288749, "epoch": 2386} {"train_loss": -38.09920883178711, "global_step": 288750, "epoch": 2386} {"train_loss": -38.45015335083008, "global_step": 288751, "epoch": 2386} {"train_loss": -40.9486198425293, "global_step": 288752, "epoch": 2386} {"train_loss": -40.41575241088867, "global_step": 288753, "epoch": 2386} {"train_loss": -40.0460319519043, "global_step": 288754, "epoch": 2386} {"train_loss": -39.864410400390625, "global_step": 288755, "epoch": 2386} {"train_loss": -39.896514892578125, "global_step": 288756, "epoch": 2386} {"train_loss": -37.23023223876953, "global_step": 288757, "epoch": 2386} {"train_loss": -38.17672348022461, "global_step": 288758, "epoch": 2386} {"train_loss": -41.85175704956055, "global_step": 288759, "epoch": 2386} {"train_loss": -39.31642532348633, "global_step": 288760, "epoch": 2386} {"train_loss": -42.15095520019531, "global_step": 288761, "epoch": 2386} {"train_loss": -40.14336013793945, "global_step": 288762, "epoch": 2386} {"train_loss": -39.69076156616211, "global_step": 288763, "epoch": 2386} {"train_loss": -41.73640060424805, "global_step": 288764, "epoch": 2386} {"train_loss": -40.02968978881836, "global_step": 288765, "epoch": 2386} {"train_loss": -41.08584213256836, "global_step": 288766, "epoch": 2386} {"train_loss": -41.354549407958984, "global_step": 288767, "epoch": 2386} {"train_loss": -40.54354476928711, "global_step": 288768, "epoch": 2386} {"train_loss": -42.27000045776367, "global_step": 288769, "epoch": 2386} {"train_loss": -39.935054779052734, "global_step": 288770, "epoch": 2386} {"train_loss": -41.566688537597656, "global_step": 288771, "epoch": 2386} {"train_loss": -41.572784423828125, "global_step": 288772, "epoch": 2386} {"train_loss": -41.296077728271484, "global_step": 288773, "epoch": 2386} {"train_loss": -42.07958221435547, "global_step": 288774, "epoch": 2386} {"train_loss": -41.315242767333984, "global_step": 288775, "epoch": 2386} {"train_loss": -42.376190185546875, "global_step": 288776, "epoch": 2386} {"train_loss": -41.14109420776367, "global_step": 288777, "epoch": 2386} {"train_loss": -42.7781982421875, "global_step": 288778, "epoch": 2386} {"train_loss": -41.37406539916992, "global_step": 288779, "epoch": 2386} {"train_loss": -42.60063934326172, "global_step": 288780, "epoch": 2386} {"train_loss": -42.19875717163086, "global_step": 288781, "epoch": 2386} {"train_loss": -42.71338653564453, "global_step": 288782, "epoch": 2386} {"train_loss": -41.783626556396484, "global_step": 288783, "epoch": 2386} {"train_loss": -40.737457275390625, "global_step": 288784, "epoch": 2386} {"train_loss": -42.62591552734375, "global_step": 288785, "epoch": 2386} {"train_loss": -41.24513626098633, "global_step": 288786, "epoch": 2386} {"train_loss": -43.37220001220703, "global_step": 288787, "epoch": 2386} {"train_loss": -42.02212142944336, "global_step": 288788, "epoch": 2386} {"train_loss": -42.84937286376953, "global_step": 288789, "epoch": 2386} {"train_loss": -42.49174118041992, "global_step": 288790, "epoch": 2386} {"train_loss": -43.187679290771484, "global_step": 288791, "epoch": 2386} {"train_loss": -42.5369758605957, "global_step": 288792, "epoch": 2386} {"train_loss": -43.09783935546875, "global_step": 288793, "epoch": 2386} {"train_loss": -43.31169509887695, "global_step": 288794, "epoch": 2386} {"train_loss": -42.8990364074707, "global_step": 288795, "epoch": 2386} {"train_loss": -42.937129974365234, "global_step": 288796, "epoch": 2386} {"train_loss": -43.14971923828125, "global_step": 288797, "epoch": 2386} {"train_loss": -42.807861328125, "global_step": 288798, "epoch": 2386} {"train_loss": -42.6801872253418, "global_step": 288799, "epoch": 2386} {"train_loss": -42.566383361816406, "global_step": 288800, "epoch": 2386} {"train_loss": -43.19102478027344, "global_step": 288801, "epoch": 2386} {"train_loss": -42.983917236328125, "global_step": 288802, "epoch": 2386} {"train_loss": -42.91206359863281, "global_step": 288803, "epoch": 2386} {"train_loss": -43.7857780456543, "global_step": 288804, "epoch": 2386} {"train_loss": -42.877254486083984, "global_step": 288805, "epoch": 2386} {"train_loss": -43.128780364990234, "global_step": 288806, "epoch": 2386} {"train_loss": -42.50027084350586, "global_step": 288807, "epoch": 2386} {"train_loss": -43.70502471923828, "global_step": 288808, "epoch": 2386} {"train_loss": -42.42460632324219, "global_step": 288809, "epoch": 2386} {"train_loss": -43.566768646240234, "global_step": 288810, "epoch": 2386} {"train_loss": -43.087684631347656, "global_step": 288811, "epoch": 2386} {"train_loss": -43.2309684753418, "global_step": 288812, "epoch": 2386} {"train_loss": -43.29671859741211, "global_step": 288813, "epoch": 2386} {"train_loss": -43.0731086730957, "global_step": 288814, "epoch": 2386} {"train_loss": -43.17106246948242, "global_step": 288815, "epoch": 2386} {"train_loss": -42.392635345458984, "global_step": 288816, "epoch": 2386} {"train_loss": -43.42054748535156, "global_step": 288817, "epoch": 2386} {"train_loss": -43.526424407958984, "global_step": 288818, "epoch": 2386} {"train_loss": -42.994258880615234, "global_step": 288819, "epoch": 2386} {"train_loss": -43.70210266113281, "global_step": 288820, "epoch": 2386} {"train_loss": -43.135189056396484, "global_step": 288821, "epoch": 2386} {"train_loss": -43.663482666015625, "global_step": 288822, "epoch": 2386} {"train_loss": -43.77149200439453, "global_step": 288823, "epoch": 2386} {"train_loss": -44.03239822387695, "global_step": 288824, "epoch": 2386} {"train_loss": -43.8459358215332, "global_step": 288825, "epoch": 2386} {"train_loss": -42.19301094496546, "global_step": 288826, "epoch": 2386, "val_loss": 2418412.0} {"train_loss": -43.05922317504883, "global_step": 288827, "epoch": 2387} {"train_loss": -43.71485137939453, "global_step": 288828, "epoch": 2387} {"train_loss": -43.67238235473633, "global_step": 288829, "epoch": 2387} {"train_loss": -44.070716857910156, "global_step": 288830, "epoch": 2387} {"train_loss": -43.832515716552734, "global_step": 288831, "epoch": 2387} {"train_loss": -44.187721252441406, "global_step": 288832, "epoch": 2387} {"train_loss": -43.67812728881836, "global_step": 288833, "epoch": 2387} {"train_loss": -43.65327072143555, "global_step": 288834, "epoch": 2387} {"train_loss": -43.665283203125, "global_step": 288835, "epoch": 2387} {"train_loss": -43.15287780761719, "global_step": 288836, "epoch": 2387} {"train_loss": -43.50750732421875, "global_step": 288837, "epoch": 2387} {"train_loss": -44.3200798034668, "global_step": 288838, "epoch": 2387} {"train_loss": -42.98710250854492, "global_step": 288839, "epoch": 2387} {"train_loss": -43.749271392822266, "global_step": 288840, "epoch": 2387} {"train_loss": -43.868099212646484, "global_step": 288841, "epoch": 2387} {"train_loss": -42.91016387939453, "global_step": 288842, "epoch": 2387} {"train_loss": -43.395198822021484, "global_step": 288843, "epoch": 2387} {"train_loss": -42.9018669128418, "global_step": 288844, "epoch": 2387} {"train_loss": -43.95256423950195, "global_step": 288845, "epoch": 2387} {"train_loss": -44.46052169799805, "global_step": 288846, "epoch": 2387} {"train_loss": -43.55420684814453, "global_step": 288847, "epoch": 2387} {"train_loss": -43.15421676635742, "global_step": 288848, "epoch": 2387} {"train_loss": -44.03276062011719, "global_step": 288849, "epoch": 2387} {"train_loss": -43.3856086730957, "global_step": 288850, "epoch": 2387} {"train_loss": -43.70290756225586, "global_step": 288851, "epoch": 2387} {"train_loss": -44.21845626831055, "global_step": 288852, "epoch": 2387} {"train_loss": -43.32573699951172, "global_step": 288853, "epoch": 2387} {"train_loss": -43.45197677612305, "global_step": 288854, "epoch": 2387} {"train_loss": -44.39345932006836, "global_step": 288855, "epoch": 2387} {"train_loss": -42.39789962768555, "global_step": 288856, "epoch": 2387} {"train_loss": -42.780242919921875, "global_step": 288857, "epoch": 2387} {"train_loss": -43.233428955078125, "global_step": 288858, "epoch": 2387} {"train_loss": -41.600975036621094, "global_step": 288859, "epoch": 2387} {"train_loss": -41.1632080078125, "global_step": 288860, "epoch": 2387} {"train_loss": -43.60971450805664, "global_step": 288861, "epoch": 2387} {"train_loss": -40.23390579223633, "global_step": 288862, "epoch": 2387} {"train_loss": -37.3116569519043, "global_step": 288863, "epoch": 2387} {"train_loss": -40.26488494873047, "global_step": 288864, "epoch": 2387} {"train_loss": -40.366424560546875, "global_step": 288865, "epoch": 2387} {"train_loss": -40.9965934753418, "global_step": 288866, "epoch": 2387} {"train_loss": -43.92815017700195, "global_step": 288867, "epoch": 2387} {"train_loss": -39.3093376159668, "global_step": 288868, "epoch": 2387} {"train_loss": -40.69804763793945, "global_step": 288869, "epoch": 2387} {"train_loss": -42.4900016784668, "global_step": 288870, "epoch": 2387} {"train_loss": -38.85367202758789, "global_step": 288871, "epoch": 2387} {"train_loss": -39.70124816894531, "global_step": 288872, "epoch": 2387} {"train_loss": -38.769596099853516, "global_step": 288873, "epoch": 2387} {"train_loss": -41.1753044128418, "global_step": 288874, "epoch": 2387} {"train_loss": -41.99543762207031, "global_step": 288875, "epoch": 2387} {"train_loss": -40.58952713012695, "global_step": 288876, "epoch": 2387} {"train_loss": -42.89385223388672, "global_step": 288877, "epoch": 2387} {"train_loss": -40.282222747802734, "global_step": 288878, "epoch": 2387} {"train_loss": -40.736812591552734, "global_step": 288879, "epoch": 2387} {"train_loss": -42.944580078125, "global_step": 288880, "epoch": 2387} {"train_loss": -41.85215377807617, "global_step": 288881, "epoch": 2387} {"train_loss": -42.482460021972656, "global_step": 288882, "epoch": 2387} {"train_loss": -42.11851119995117, "global_step": 288883, "epoch": 2387} {"train_loss": -40.97012710571289, "global_step": 288884, "epoch": 2387} {"train_loss": -42.86110305786133, "global_step": 288885, "epoch": 2387} {"train_loss": -42.077056884765625, "global_step": 288886, "epoch": 2387} {"train_loss": -42.84832763671875, "global_step": 288887, "epoch": 2387} {"train_loss": -42.86524963378906, "global_step": 288888, "epoch": 2387} {"train_loss": -42.21772766113281, "global_step": 288889, "epoch": 2387} {"train_loss": -43.56437683105469, "global_step": 288890, "epoch": 2387} {"train_loss": -42.750343322753906, "global_step": 288891, "epoch": 2387} {"train_loss": -42.77191925048828, "global_step": 288892, "epoch": 2387} {"train_loss": -43.45098114013672, "global_step": 288893, "epoch": 2387} {"train_loss": -42.421302795410156, "global_step": 288894, "epoch": 2387} {"train_loss": -43.56614685058594, "global_step": 288895, "epoch": 2387} {"train_loss": -42.522743225097656, "global_step": 288896, "epoch": 2387} {"train_loss": -42.8045768737793, "global_step": 288897, "epoch": 2387} {"train_loss": -43.29401779174805, "global_step": 288898, "epoch": 2387} {"train_loss": -41.229042053222656, "global_step": 288899, "epoch": 2387} {"train_loss": -43.098915100097656, "global_step": 288900, "epoch": 2387} {"train_loss": -39.65135955810547, "global_step": 288901, "epoch": 2387} {"train_loss": -42.7537727355957, "global_step": 288902, "epoch": 2387} {"train_loss": -43.64899826049805, "global_step": 288903, "epoch": 2387} {"train_loss": -43.152320861816406, "global_step": 288904, "epoch": 2387} {"train_loss": -43.59428787231445, "global_step": 288905, "epoch": 2387} {"train_loss": -43.19512939453125, "global_step": 288906, "epoch": 2387} {"train_loss": -43.4980583190918, "global_step": 288907, "epoch": 2387} {"train_loss": -43.045936584472656, "global_step": 288908, "epoch": 2387} {"train_loss": -43.08066940307617, "global_step": 288909, "epoch": 2387} {"train_loss": -43.7535285949707, "global_step": 288910, "epoch": 2387} {"train_loss": -43.277137756347656, "global_step": 288911, "epoch": 2387} {"train_loss": -43.86564254760742, "global_step": 288912, "epoch": 2387} {"train_loss": -43.82545471191406, "global_step": 288913, "epoch": 2387} {"train_loss": -41.48368835449219, "global_step": 288914, "epoch": 2387} {"train_loss": -43.12099838256836, "global_step": 288915, "epoch": 2387} {"train_loss": -42.88442611694336, "global_step": 288916, "epoch": 2387} {"train_loss": -43.4979248046875, "global_step": 288917, "epoch": 2387} {"train_loss": -43.42543029785156, "global_step": 288918, "epoch": 2387} {"train_loss": -43.336402893066406, "global_step": 288919, "epoch": 2387} {"train_loss": -43.43597412109375, "global_step": 288920, "epoch": 2387} {"train_loss": -43.38878631591797, "global_step": 288921, "epoch": 2387} {"train_loss": -37.53459167480469, "global_step": 288922, "epoch": 2387} {"train_loss": -43.72321701049805, "global_step": 288923, "epoch": 2387} {"train_loss": -43.666969299316406, "global_step": 288924, "epoch": 2387} {"train_loss": -44.154415130615234, "global_step": 288925, "epoch": 2387} {"train_loss": -43.432281494140625, "global_step": 288926, "epoch": 2387} {"train_loss": -43.80442428588867, "global_step": 288927, "epoch": 2387} {"train_loss": -43.107051849365234, "global_step": 288928, "epoch": 2387} {"train_loss": -41.243072509765625, "global_step": 288929, "epoch": 2387} {"train_loss": -43.49577713012695, "global_step": 288930, "epoch": 2387} {"train_loss": -42.77468490600586, "global_step": 288931, "epoch": 2387} {"train_loss": -13.595901489257812, "global_step": 288932, "epoch": 2387} {"train_loss": -41.83824157714844, "global_step": 288933, "epoch": 2387} {"train_loss": -41.12313461303711, "global_step": 288934, "epoch": 2387} {"train_loss": -33.868839263916016, "global_step": 288935, "epoch": 2387} {"train_loss": -35.57241439819336, "global_step": 288936, "epoch": 2387} {"train_loss": -42.278968811035156, "global_step": 288937, "epoch": 2387} {"train_loss": -41.87663269042969, "global_step": 288938, "epoch": 2387} {"train_loss": -41.69527816772461, "global_step": 288939, "epoch": 2387} {"train_loss": -39.1984748840332, "global_step": 288940, "epoch": 2387} {"train_loss": -41.06388473510742, "global_step": 288941, "epoch": 2387} {"train_loss": -41.7181510925293, "global_step": 288942, "epoch": 2387} {"train_loss": -34.04091262817383, "global_step": 288943, "epoch": 2387} {"train_loss": -34.09806823730469, "global_step": 288944, "epoch": 2387} {"train_loss": -39.252479553222656, "global_step": 288945, "epoch": 2387} {"train_loss": -37.72615432739258, "global_step": 288946, "epoch": 2387} {"train_loss": -41.917686052558835, "global_step": 288947, "epoch": 2387, "val_loss": 2542074.25} {"train_loss": -39.68800354003906, "global_step": 288948, "epoch": 2388} {"train_loss": -37.736167907714844, "global_step": 288949, "epoch": 2388} {"train_loss": -1.1953308582305908, "global_step": 288950, "epoch": 2388} {"train_loss": -37.98716735839844, "global_step": 288951, "epoch": 2388} {"train_loss": -30.21636390686035, "global_step": 288952, "epoch": 2388} {"train_loss": -33.12983322143555, "global_step": 288953, "epoch": 2388} {"train_loss": -36.63544464111328, "global_step": 288954, "epoch": 2388} {"train_loss": -33.498878479003906, "global_step": 288955, "epoch": 2388} {"train_loss": -32.71950912475586, "global_step": 288956, "epoch": 2388} {"train_loss": -37.31604766845703, "global_step": 288957, "epoch": 2388} {"train_loss": -39.38896560668945, "global_step": 288958, "epoch": 2388} {"train_loss": -37.92310333251953, "global_step": 288959, "epoch": 2388} {"train_loss": -37.9962043762207, "global_step": 288960, "epoch": 2388} {"train_loss": -37.91217803955078, "global_step": 288961, "epoch": 2388} {"train_loss": -35.98918914794922, "global_step": 288962, "epoch": 2388} {"train_loss": -38.070674896240234, "global_step": 288963, "epoch": 2388} {"train_loss": -32.976661682128906, "global_step": 288964, "epoch": 2388} {"train_loss": -35.667144775390625, "global_step": 288965, "epoch": 2388} {"train_loss": -37.4882926940918, "global_step": 288966, "epoch": 2388} {"train_loss": -38.1146240234375, "global_step": 288967, "epoch": 2388} {"train_loss": -39.364601135253906, "global_step": 288968, "epoch": 2388} {"train_loss": -39.43527603149414, "global_step": 288969, "epoch": 2388} {"train_loss": -40.38203430175781, "global_step": 288970, "epoch": 2388} {"train_loss": -39.236793518066406, "global_step": 288971, "epoch": 2388} {"train_loss": -39.09022903442383, "global_step": 288972, "epoch": 2388} {"train_loss": -38.8543586730957, "global_step": 288973, "epoch": 2388} {"train_loss": -39.667171478271484, "global_step": 288974, "epoch": 2388} {"train_loss": -39.72318649291992, "global_step": 288975, "epoch": 2388} {"train_loss": -39.964900970458984, "global_step": 288976, "epoch": 2388} {"train_loss": -38.51975631713867, "global_step": 288977, "epoch": 2388} {"train_loss": -39.7524528503418, "global_step": 288978, "epoch": 2388} {"train_loss": -39.78857421875, "global_step": 288979, "epoch": 2388} {"train_loss": -38.456050872802734, "global_step": 288980, "epoch": 2388} {"train_loss": -39.00727081298828, "global_step": 288981, "epoch": 2388} {"train_loss": -39.99224853515625, "global_step": 288982, "epoch": 2388} {"train_loss": -40.47848129272461, "global_step": 288983, "epoch": 2388} {"train_loss": -40.672969818115234, "global_step": 288984, "epoch": 2388} {"train_loss": -40.940513610839844, "global_step": 288985, "epoch": 2388} {"train_loss": -40.64102554321289, "global_step": 288986, "epoch": 2388} {"train_loss": -40.40255355834961, "global_step": 288987, "epoch": 2388} {"train_loss": -40.63985061645508, "global_step": 288988, "epoch": 2388} {"train_loss": -39.330039978027344, "global_step": 288989, "epoch": 2388} {"train_loss": -40.238502502441406, "global_step": 288990, "epoch": 2388} {"train_loss": -40.23797607421875, "global_step": 288991, "epoch": 2388} {"train_loss": -41.04177474975586, "global_step": 288992, "epoch": 2388} {"train_loss": -41.3087043762207, "global_step": 288993, "epoch": 2388} {"train_loss": -41.235652923583984, "global_step": 288994, "epoch": 2388} {"train_loss": -40.517601013183594, "global_step": 288995, "epoch": 2388} {"train_loss": -41.264801025390625, "global_step": 288996, "epoch": 2388} {"train_loss": -40.80745315551758, "global_step": 288997, "epoch": 2388} {"train_loss": -41.25120544433594, "global_step": 288998, "epoch": 2388} {"train_loss": -40.65591049194336, "global_step": 288999, "epoch": 2388} {"train_loss": -40.87624740600586, "global_step": 289000, "epoch": 2388} {"train_loss": -41.35826110839844, "global_step": 289001, "epoch": 2388} {"train_loss": -41.53215789794922, "global_step": 289002, "epoch": 2388} {"train_loss": -41.42822265625, "global_step": 289003, "epoch": 2388} {"train_loss": -41.69559860229492, "global_step": 289004, "epoch": 2388} {"train_loss": -41.124691009521484, "global_step": 289005, "epoch": 2388} {"train_loss": -41.49151611328125, "global_step": 289006, "epoch": 2388} {"train_loss": -41.97637176513672, "global_step": 289007, "epoch": 2388} {"train_loss": -41.527095794677734, "global_step": 289008, "epoch": 2388} {"train_loss": -40.96332931518555, "global_step": 289009, "epoch": 2388} {"train_loss": -42.016658782958984, "global_step": 289010, "epoch": 2388} {"train_loss": -41.43059158325195, "global_step": 289011, "epoch": 2388} {"train_loss": -41.728485107421875, "global_step": 289012, "epoch": 2388} {"train_loss": -41.46090316772461, "global_step": 289013, "epoch": 2388} {"train_loss": -41.608978271484375, "global_step": 289014, "epoch": 2388} {"train_loss": -42.254032135009766, "global_step": 289015, "epoch": 2388} {"train_loss": -41.787349700927734, "global_step": 289016, "epoch": 2388} {"train_loss": -42.222747802734375, "global_step": 289017, "epoch": 2388} {"train_loss": -41.64764404296875, "global_step": 289018, "epoch": 2388} {"train_loss": -42.2794075012207, "global_step": 289019, "epoch": 2388} {"train_loss": -41.97581100463867, "global_step": 289020, "epoch": 2388} {"train_loss": -42.3134765625, "global_step": 289021, "epoch": 2388} {"train_loss": -40.92112731933594, "global_step": 289022, "epoch": 2388} {"train_loss": -42.04642868041992, "global_step": 289023, "epoch": 2388} {"train_loss": -42.60311508178711, "global_step": 289024, "epoch": 2388} {"train_loss": -41.90681076049805, "global_step": 289025, "epoch": 2388} {"train_loss": -42.320289611816406, "global_step": 289026, "epoch": 2388} {"train_loss": -41.790794372558594, "global_step": 289027, "epoch": 2388} {"train_loss": -42.08709716796875, "global_step": 289028, "epoch": 2388} {"train_loss": -42.01800537109375, "global_step": 289029, "epoch": 2388} {"train_loss": -42.3042106628418, "global_step": 289030, "epoch": 2388} {"train_loss": -42.142547607421875, "global_step": 289031, "epoch": 2388} {"train_loss": -42.9428596496582, "global_step": 289032, "epoch": 2388} {"train_loss": -42.793216705322266, "global_step": 289033, "epoch": 2388} {"train_loss": -42.5344352722168, "global_step": 289034, "epoch": 2388} {"train_loss": -41.9935417175293, "global_step": 289035, "epoch": 2388} {"train_loss": -41.69157791137695, "global_step": 289036, "epoch": 2388} {"train_loss": -42.804256439208984, "global_step": 289037, "epoch": 2388} {"train_loss": -42.44831085205078, "global_step": 289038, "epoch": 2388} {"train_loss": -43.05328369140625, "global_step": 289039, "epoch": 2388} {"train_loss": -42.53745651245117, "global_step": 289040, "epoch": 2388} {"train_loss": -42.20164108276367, "global_step": 289041, "epoch": 2388} {"train_loss": -42.70064163208008, "global_step": 289042, "epoch": 2388} {"train_loss": -42.75968551635742, "global_step": 289043, "epoch": 2388} {"train_loss": -42.968013763427734, "global_step": 289044, "epoch": 2388} {"train_loss": -42.975616455078125, "global_step": 289045, "epoch": 2388} {"train_loss": -42.46938705444336, "global_step": 289046, "epoch": 2388} {"train_loss": -42.80416488647461, "global_step": 289047, "epoch": 2388} {"train_loss": -43.117916107177734, "global_step": 289048, "epoch": 2388} {"train_loss": -42.50777053833008, "global_step": 289049, "epoch": 2388} {"train_loss": -42.65838623046875, "global_step": 289050, "epoch": 2388} {"train_loss": -42.34727096557617, "global_step": 289051, "epoch": 2388} {"train_loss": -42.61967468261719, "global_step": 289052, "epoch": 2388} {"train_loss": -43.138946533203125, "global_step": 289053, "epoch": 2388} {"train_loss": -41.91180419921875, "global_step": 289054, "epoch": 2388} {"train_loss": -41.712677001953125, "global_step": 289055, "epoch": 2388} {"train_loss": -43.13905715942383, "global_step": 289056, "epoch": 2388} {"train_loss": -42.09889602661133, "global_step": 289057, "epoch": 2388} {"train_loss": -42.88147735595703, "global_step": 289058, "epoch": 2388} {"train_loss": -41.917972564697266, "global_step": 289059, "epoch": 2388} {"train_loss": -43.204689025878906, "global_step": 289060, "epoch": 2388} {"train_loss": -43.1116943359375, "global_step": 289061, "epoch": 2388} {"train_loss": -42.831905364990234, "global_step": 289062, "epoch": 2388} {"train_loss": -41.15021514892578, "global_step": 289063, "epoch": 2388} {"train_loss": -42.96859359741211, "global_step": 289064, "epoch": 2388} {"train_loss": -42.7868537902832, "global_step": 289065, "epoch": 2388} {"train_loss": -43.285667419433594, "global_step": 289066, "epoch": 2388} {"train_loss": -42.52394485473633, "global_step": 289067, "epoch": 2388} {"train_loss": -40.39535655857118, "global_step": 289068, "epoch": 2388, "val_loss": 2500163.5} {"train_loss": -42.13109588623047, "global_step": 289069, "epoch": 2389} {"train_loss": -42.91687774658203, "global_step": 289070, "epoch": 2389} {"train_loss": -43.22015380859375, "global_step": 289071, "epoch": 2389} {"train_loss": -43.446739196777344, "global_step": 289072, "epoch": 2389} {"train_loss": -43.1953239440918, "global_step": 289073, "epoch": 2389} {"train_loss": -43.414974212646484, "global_step": 289074, "epoch": 2389} {"train_loss": -43.393585205078125, "global_step": 289075, "epoch": 2389} {"train_loss": -43.69424057006836, "global_step": 289076, "epoch": 2389} {"train_loss": -43.54827117919922, "global_step": 289077, "epoch": 2389} {"train_loss": -43.24462890625, "global_step": 289078, "epoch": 2389} {"train_loss": -43.37856674194336, "global_step": 289079, "epoch": 2389} {"train_loss": -42.60630416870117, "global_step": 289080, "epoch": 2389} {"train_loss": -43.34661865234375, "global_step": 289081, "epoch": 2389} {"train_loss": -42.79130554199219, "global_step": 289082, "epoch": 2389} {"train_loss": -43.15803146362305, "global_step": 289083, "epoch": 2389} {"train_loss": -43.436431884765625, "global_step": 289084, "epoch": 2389} {"train_loss": -43.009033203125, "global_step": 289085, "epoch": 2389} {"train_loss": -43.46261215209961, "global_step": 289086, "epoch": 2389} {"train_loss": -43.22047805786133, "global_step": 289087, "epoch": 2389} {"train_loss": -43.83565902709961, "global_step": 289088, "epoch": 2389} {"train_loss": -42.68268966674805, "global_step": 289089, "epoch": 2389} {"train_loss": -43.13376235961914, "global_step": 289090, "epoch": 2389} {"train_loss": -42.50584411621094, "global_step": 289091, "epoch": 2389} {"train_loss": -43.676143646240234, "global_step": 289092, "epoch": 2389} {"train_loss": -43.981536865234375, "global_step": 289093, "epoch": 2389} {"train_loss": -43.49751663208008, "global_step": 289094, "epoch": 2389} {"train_loss": -43.651668548583984, "global_step": 289095, "epoch": 2389} {"train_loss": -43.52839660644531, "global_step": 289096, "epoch": 2389} {"train_loss": -43.38837432861328, "global_step": 289097, "epoch": 2389} {"train_loss": -43.19125747680664, "global_step": 289098, "epoch": 2389} {"train_loss": -44.10273742675781, "global_step": 289099, "epoch": 2389} {"train_loss": -42.668067932128906, "global_step": 289100, "epoch": 2389} {"train_loss": -43.83219528198242, "global_step": 289101, "epoch": 2389} {"train_loss": -43.54553985595703, "global_step": 289102, "epoch": 2389} {"train_loss": -42.9723014831543, "global_step": 289103, "epoch": 2389} {"train_loss": -42.756256103515625, "global_step": 289104, "epoch": 2389} {"train_loss": -42.56913375854492, "global_step": 289105, "epoch": 2389} {"train_loss": -43.88959884643555, "global_step": 289106, "epoch": 2389} {"train_loss": -43.16978073120117, "global_step": 289107, "epoch": 2389} {"train_loss": -42.90281295776367, "global_step": 289108, "epoch": 2389} {"train_loss": -43.39535140991211, "global_step": 289109, "epoch": 2389} {"train_loss": -42.97673416137695, "global_step": 289110, "epoch": 2389} {"train_loss": -43.7594108581543, "global_step": 289111, "epoch": 2389} {"train_loss": -43.0665397644043, "global_step": 289112, "epoch": 2389} {"train_loss": -43.025787353515625, "global_step": 289113, "epoch": 2389} {"train_loss": -44.01227951049805, "global_step": 289114, "epoch": 2389} {"train_loss": -43.64180374145508, "global_step": 289115, "epoch": 2389} {"train_loss": -43.96870040893555, "global_step": 289116, "epoch": 2389} {"train_loss": -43.75020217895508, "global_step": 289117, "epoch": 2389} {"train_loss": -43.03817367553711, "global_step": 289118, "epoch": 2389} {"train_loss": -43.39971923828125, "global_step": 289119, "epoch": 2389} {"train_loss": -43.687740325927734, "global_step": 289120, "epoch": 2389} {"train_loss": -43.55084228515625, "global_step": 289121, "epoch": 2389} {"train_loss": -44.170772552490234, "global_step": 289122, "epoch": 2389} {"train_loss": -43.9366569519043, "global_step": 289123, "epoch": 2389} {"train_loss": -44.1037483215332, "global_step": 289124, "epoch": 2389} {"train_loss": -43.122859954833984, "global_step": 289125, "epoch": 2389} {"train_loss": -42.712947845458984, "global_step": 289126, "epoch": 2389} {"train_loss": -40.88114929199219, "global_step": 289127, "epoch": 2389} {"train_loss": -39.27659225463867, "global_step": 289128, "epoch": 2389} {"train_loss": -39.08674621582031, "global_step": 289129, "epoch": 2389} {"train_loss": -38.02421188354492, "global_step": 289130, "epoch": 2389} {"train_loss": -38.08773422241211, "global_step": 289131, "epoch": 2389} {"train_loss": -40.30597686767578, "global_step": 289132, "epoch": 2389} {"train_loss": -42.36140060424805, "global_step": 289133, "epoch": 2389} {"train_loss": -40.657222747802734, "global_step": 289134, "epoch": 2389} {"train_loss": -37.262718200683594, "global_step": 289135, "epoch": 2389} {"train_loss": -41.13839340209961, "global_step": 289136, "epoch": 2389} {"train_loss": -40.83488845825195, "global_step": 289137, "epoch": 2389} {"train_loss": -41.00834655761719, "global_step": 289138, "epoch": 2389} {"train_loss": -39.59270095825195, "global_step": 289139, "epoch": 2389} {"train_loss": -41.85894775390625, "global_step": 289140, "epoch": 2389} {"train_loss": -39.829952239990234, "global_step": 289141, "epoch": 2389} {"train_loss": -36.613739013671875, "global_step": 289142, "epoch": 2389} {"train_loss": -39.622371673583984, "global_step": 289143, "epoch": 2389} {"train_loss": -41.26972579956055, "global_step": 289144, "epoch": 2389} {"train_loss": -38.85696029663086, "global_step": 289145, "epoch": 2389} {"train_loss": -42.21808624267578, "global_step": 289146, "epoch": 2389} {"train_loss": -40.991947174072266, "global_step": 289147, "epoch": 2389} {"train_loss": -40.90041732788086, "global_step": 289148, "epoch": 2389} {"train_loss": -41.36109161376953, "global_step": 289149, "epoch": 2389} {"train_loss": -40.9720573425293, "global_step": 289150, "epoch": 2389} {"train_loss": -41.18815231323242, "global_step": 289151, "epoch": 2389} {"train_loss": -38.46628952026367, "global_step": 289152, "epoch": 2389} {"train_loss": -41.66510009765625, "global_step": 289153, "epoch": 2389} {"train_loss": -37.96015167236328, "global_step": 289154, "epoch": 2389} {"train_loss": -40.79139709472656, "global_step": 289155, "epoch": 2389} {"train_loss": -41.47829055786133, "global_step": 289156, "epoch": 2389} {"train_loss": -41.4219856262207, "global_step": 289157, "epoch": 2389} {"train_loss": -42.04900360107422, "global_step": 289158, "epoch": 2389} {"train_loss": -40.06950378417969, "global_step": 289159, "epoch": 2389} {"train_loss": -41.86049270629883, "global_step": 289160, "epoch": 2389} {"train_loss": -42.7061882019043, "global_step": 289161, "epoch": 2389} {"train_loss": -42.06284713745117, "global_step": 289162, "epoch": 2389} {"train_loss": -42.61875534057617, "global_step": 289163, "epoch": 2389} {"train_loss": -41.73031234741211, "global_step": 289164, "epoch": 2389} {"train_loss": -42.73771286010742, "global_step": 289165, "epoch": 2389} {"train_loss": -41.86099624633789, "global_step": 289166, "epoch": 2389} {"train_loss": -31.837987899780273, "global_step": 289167, "epoch": 2389} {"train_loss": -41.986785888671875, "global_step": 289168, "epoch": 2389} {"train_loss": -42.41947555541992, "global_step": 289169, "epoch": 2389} {"train_loss": -42.36091995239258, "global_step": 289170, "epoch": 2389} {"train_loss": -41.017425537109375, "global_step": 289171, "epoch": 2389} {"train_loss": -41.76493453979492, "global_step": 289172, "epoch": 2389} {"train_loss": -40.992584228515625, "global_step": 289173, "epoch": 2389} {"train_loss": -42.064762115478516, "global_step": 289174, "epoch": 2389} {"train_loss": -41.30918884277344, "global_step": 289175, "epoch": 2389} {"train_loss": -42.67424011230469, "global_step": 289176, "epoch": 2389} {"train_loss": -40.925689697265625, "global_step": 289177, "epoch": 2389} {"train_loss": -39.92876052856445, "global_step": 289178, "epoch": 2389} {"train_loss": -41.5463981628418, "global_step": 289179, "epoch": 2389} {"train_loss": -40.933441162109375, "global_step": 289180, "epoch": 2389} {"train_loss": -41.23556137084961, "global_step": 289181, "epoch": 2389} {"train_loss": -40.19584655761719, "global_step": 289182, "epoch": 2389} {"train_loss": -41.68634033203125, "global_step": 289183, "epoch": 2389} {"train_loss": -41.808921813964844, "global_step": 289184, "epoch": 2389} {"train_loss": -41.48524856567383, "global_step": 289185, "epoch": 2389} {"train_loss": -41.65102767944336, "global_step": 289186, "epoch": 2389} {"train_loss": -40.766136169433594, "global_step": 289187, "epoch": 2389} {"train_loss": -42.22119903564453, "global_step": 289188, "epoch": 2389} {"train_loss": -41.99896244963339, "global_step": 289189, "epoch": 2389, "val_loss": 2431261.25} {"train_loss": -42.42625045776367, "global_step": 289190, "epoch": 2390} {"train_loss": -42.75012969970703, "global_step": 289191, "epoch": 2390} {"train_loss": -41.27328872680664, "global_step": 289192, "epoch": 2390} {"train_loss": -42.34495162963867, "global_step": 289193, "epoch": 2390} {"train_loss": -42.785797119140625, "global_step": 289194, "epoch": 2390} {"train_loss": -42.70425033569336, "global_step": 289195, "epoch": 2390} {"train_loss": -42.69845199584961, "global_step": 289196, "epoch": 2390} {"train_loss": -42.59444808959961, "global_step": 289197, "epoch": 2390} {"train_loss": -41.95637893676758, "global_step": 289198, "epoch": 2390} {"train_loss": -42.3541374206543, "global_step": 289199, "epoch": 2390} {"train_loss": -42.76316833496094, "global_step": 289200, "epoch": 2390} {"train_loss": -42.71924591064453, "global_step": 289201, "epoch": 2390} {"train_loss": -42.49728012084961, "global_step": 289202, "epoch": 2390} {"train_loss": -41.997413635253906, "global_step": 289203, "epoch": 2390} {"train_loss": -42.731422424316406, "global_step": 289204, "epoch": 2390} {"train_loss": -42.28186798095703, "global_step": 289205, "epoch": 2390} {"train_loss": -42.51743698120117, "global_step": 289206, "epoch": 2390} {"train_loss": -42.80270004272461, "global_step": 289207, "epoch": 2390} {"train_loss": -42.03297805786133, "global_step": 289208, "epoch": 2390} {"train_loss": -43.0969123840332, "global_step": 289209, "epoch": 2390} {"train_loss": -42.24058151245117, "global_step": 289210, "epoch": 2390} {"train_loss": -42.20018768310547, "global_step": 289211, "epoch": 2390} {"train_loss": -42.1921501159668, "global_step": 289212, "epoch": 2390} {"train_loss": -42.89494705200195, "global_step": 289213, "epoch": 2390} {"train_loss": -40.385616302490234, "global_step": 289214, "epoch": 2390} {"train_loss": -42.06219482421875, "global_step": 289215, "epoch": 2390} {"train_loss": -42.30349349975586, "global_step": 289216, "epoch": 2390} {"train_loss": -43.16066360473633, "global_step": 289217, "epoch": 2390} {"train_loss": -42.69575881958008, "global_step": 289218, "epoch": 2390} {"train_loss": -43.07410430908203, "global_step": 289219, "epoch": 2390} {"train_loss": -42.00761032104492, "global_step": 289220, "epoch": 2390} {"train_loss": -41.51882553100586, "global_step": 289221, "epoch": 2390} {"train_loss": -43.5794792175293, "global_step": 289222, "epoch": 2390} {"train_loss": -41.43026351928711, "global_step": 289223, "epoch": 2390} {"train_loss": -42.70692443847656, "global_step": 289224, "epoch": 2390} {"train_loss": -42.24967575073242, "global_step": 289225, "epoch": 2390} {"train_loss": -41.84209442138672, "global_step": 289226, "epoch": 2390} {"train_loss": -42.49494934082031, "global_step": 289227, "epoch": 2390} {"train_loss": -41.71026611328125, "global_step": 289228, "epoch": 2390} {"train_loss": -42.291439056396484, "global_step": 289229, "epoch": 2390} {"train_loss": -40.08269500732422, "global_step": 289230, "epoch": 2390} {"train_loss": -43.3049430847168, "global_step": 289231, "epoch": 2390} {"train_loss": -42.84788131713867, "global_step": 289232, "epoch": 2390} {"train_loss": -42.494606018066406, "global_step": 289233, "epoch": 2390} {"train_loss": -41.098419189453125, "global_step": 289234, "epoch": 2390} {"train_loss": -41.28391647338867, "global_step": 289235, "epoch": 2390} {"train_loss": -42.773170471191406, "global_step": 289236, "epoch": 2390} {"train_loss": -41.528507232666016, "global_step": 289237, "epoch": 2390} {"train_loss": -43.28472900390625, "global_step": 289238, "epoch": 2390} {"train_loss": -40.79586410522461, "global_step": 289239, "epoch": 2390} {"train_loss": -42.68351364135742, "global_step": 289240, "epoch": 2390} {"train_loss": -41.76487731933594, "global_step": 289241, "epoch": 2390} {"train_loss": -42.13286209106445, "global_step": 289242, "epoch": 2390} {"train_loss": -43.04140853881836, "global_step": 289243, "epoch": 2390} {"train_loss": -42.93866729736328, "global_step": 289244, "epoch": 2390} {"train_loss": -42.8069953918457, "global_step": 289245, "epoch": 2390} {"train_loss": -41.62845993041992, "global_step": 289246, "epoch": 2390} {"train_loss": -43.050899505615234, "global_step": 289247, "epoch": 2390} {"train_loss": -41.44111633300781, "global_step": 289248, "epoch": 2390} {"train_loss": -41.31172180175781, "global_step": 289249, "epoch": 2390} {"train_loss": -41.857479095458984, "global_step": 289250, "epoch": 2390} {"train_loss": -41.54888153076172, "global_step": 289251, "epoch": 2390} {"train_loss": -43.561851501464844, "global_step": 289252, "epoch": 2390} {"train_loss": -42.16203689575195, "global_step": 289253, "epoch": 2390} {"train_loss": -43.46200942993164, "global_step": 289254, "epoch": 2390} {"train_loss": -43.053382873535156, "global_step": 289255, "epoch": 2390} {"train_loss": -42.6595458984375, "global_step": 289256, "epoch": 2390} {"train_loss": -42.70215606689453, "global_step": 289257, "epoch": 2390} {"train_loss": -43.49517059326172, "global_step": 289258, "epoch": 2390} {"train_loss": -42.398250579833984, "global_step": 289259, "epoch": 2390} {"train_loss": -42.464149475097656, "global_step": 289260, "epoch": 2390} {"train_loss": -42.495174407958984, "global_step": 289261, "epoch": 2390} {"train_loss": -41.396148681640625, "global_step": 289262, "epoch": 2390} {"train_loss": -42.95868682861328, "global_step": 289263, "epoch": 2390} {"train_loss": -43.3691291809082, "global_step": 289264, "epoch": 2390} {"train_loss": -40.36172103881836, "global_step": 289265, "epoch": 2390} {"train_loss": -41.213783264160156, "global_step": 289266, "epoch": 2390} {"train_loss": -42.86040115356445, "global_step": 289267, "epoch": 2390} {"train_loss": -42.482059478759766, "global_step": 289268, "epoch": 2390} {"train_loss": -42.13019943237305, "global_step": 289269, "epoch": 2390} {"train_loss": -42.830997467041016, "global_step": 289270, "epoch": 2390} {"train_loss": -42.221893310546875, "global_step": 289271, "epoch": 2390} {"train_loss": -43.20237350463867, "global_step": 289272, "epoch": 2390} {"train_loss": -41.73291778564453, "global_step": 289273, "epoch": 2390} {"train_loss": -41.829776763916016, "global_step": 289274, "epoch": 2390} {"train_loss": -41.677490234375, "global_step": 289275, "epoch": 2390} {"train_loss": -42.8300666809082, "global_step": 289276, "epoch": 2390} {"train_loss": -43.48287582397461, "global_step": 289277, "epoch": 2390} {"train_loss": -42.67051696777344, "global_step": 289278, "epoch": 2390} {"train_loss": -42.190528869628906, "global_step": 289279, "epoch": 2390} {"train_loss": -42.81620407104492, "global_step": 289280, "epoch": 2390} {"train_loss": -41.8804817199707, "global_step": 289281, "epoch": 2390} {"train_loss": -40.58718490600586, "global_step": 289282, "epoch": 2390} {"train_loss": -43.06708908081055, "global_step": 289283, "epoch": 2390} {"train_loss": -42.1728515625, "global_step": 289284, "epoch": 2390} {"train_loss": -40.722747802734375, "global_step": 289285, "epoch": 2390} {"train_loss": -41.87569808959961, "global_step": 289286, "epoch": 2390} {"train_loss": -41.143951416015625, "global_step": 289287, "epoch": 2390} {"train_loss": -37.88837814331055, "global_step": 289288, "epoch": 2390} {"train_loss": -42.67374801635742, "global_step": 289289, "epoch": 2390} {"train_loss": -42.5056266784668, "global_step": 289290, "epoch": 2390} {"train_loss": -41.99577713012695, "global_step": 289291, "epoch": 2390} {"train_loss": -42.96395492553711, "global_step": 289292, "epoch": 2390} {"train_loss": -40.5702018737793, "global_step": 289293, "epoch": 2390} {"train_loss": -40.13348388671875, "global_step": 289294, "epoch": 2390} {"train_loss": -42.844844818115234, "global_step": 289295, "epoch": 2390} {"train_loss": -39.87678146362305, "global_step": 289296, "epoch": 2390} {"train_loss": -41.766963958740234, "global_step": 289297, "epoch": 2390} {"train_loss": -42.59361267089844, "global_step": 289298, "epoch": 2390} {"train_loss": -39.93732833862305, "global_step": 289299, "epoch": 2390} {"train_loss": -42.13005447387695, "global_step": 289300, "epoch": 2390} {"train_loss": -41.772682189941406, "global_step": 289301, "epoch": 2390} {"train_loss": -40.68169021606445, "global_step": 289302, "epoch": 2390} {"train_loss": -42.94768524169922, "global_step": 289303, "epoch": 2390} {"train_loss": -42.63083267211914, "global_step": 289304, "epoch": 2390} {"train_loss": -41.84919738769531, "global_step": 289305, "epoch": 2390} {"train_loss": -42.49158477783203, "global_step": 289306, "epoch": 2390} {"train_loss": -41.1418342590332, "global_step": 289307, "epoch": 2390} {"train_loss": -38.90267562866211, "global_step": 289308, "epoch": 2390} {"train_loss": -42.01577377319336, "global_step": 289309, "epoch": 2390} {"train_loss": -42.1325414673356, "global_step": 289310, "epoch": 2390, "val_loss": 2771325.0} {"train_loss": -41.837440490722656, "global_step": 289311, "epoch": 2391} {"train_loss": -42.70857620239258, "global_step": 289312, "epoch": 2391} {"train_loss": -42.950260162353516, "global_step": 289313, "epoch": 2391} {"train_loss": -42.595916748046875, "global_step": 289314, "epoch": 2391} {"train_loss": -42.95707321166992, "global_step": 289315, "epoch": 2391} {"train_loss": -41.75069808959961, "global_step": 289316, "epoch": 2391} {"train_loss": -42.82501983642578, "global_step": 289317, "epoch": 2391} {"train_loss": -42.9012336730957, "global_step": 289318, "epoch": 2391} {"train_loss": -43.05065155029297, "global_step": 289319, "epoch": 2391} {"train_loss": -42.81856918334961, "global_step": 289320, "epoch": 2391} {"train_loss": -42.87984085083008, "global_step": 289321, "epoch": 2391} {"train_loss": -42.92407989501953, "global_step": 289322, "epoch": 2391} {"train_loss": -42.3614616394043, "global_step": 289323, "epoch": 2391} {"train_loss": -43.405479431152344, "global_step": 289324, "epoch": 2391} {"train_loss": -43.16440963745117, "global_step": 289325, "epoch": 2391} {"train_loss": -42.39335250854492, "global_step": 289326, "epoch": 2391} {"train_loss": -41.52782440185547, "global_step": 289327, "epoch": 2391} {"train_loss": -42.755165100097656, "global_step": 289328, "epoch": 2391} {"train_loss": -42.72738265991211, "global_step": 289329, "epoch": 2391} {"train_loss": -41.88755416870117, "global_step": 289330, "epoch": 2391} {"train_loss": -42.48018264770508, "global_step": 289331, "epoch": 2391} {"train_loss": -43.161434173583984, "global_step": 289332, "epoch": 2391} {"train_loss": -43.60529708862305, "global_step": 289333, "epoch": 2391} {"train_loss": -42.40985107421875, "global_step": 289334, "epoch": 2391} {"train_loss": -42.7998161315918, "global_step": 289335, "epoch": 2391} {"train_loss": -43.15340805053711, "global_step": 289336, "epoch": 2391} {"train_loss": -42.899085998535156, "global_step": 289337, "epoch": 2391} {"train_loss": -43.25779342651367, "global_step": 289338, "epoch": 2391} {"train_loss": -43.663509368896484, "global_step": 289339, "epoch": 2391} {"train_loss": -42.640892028808594, "global_step": 289340, "epoch": 2391} {"train_loss": -43.63618469238281, "global_step": 289341, "epoch": 2391} {"train_loss": -43.375091552734375, "global_step": 289342, "epoch": 2391} {"train_loss": -43.555416107177734, "global_step": 289343, "epoch": 2391} {"train_loss": -41.67053985595703, "global_step": 289344, "epoch": 2391} {"train_loss": -43.05950927734375, "global_step": 289345, "epoch": 2391} {"train_loss": -42.68949508666992, "global_step": 289346, "epoch": 2391} {"train_loss": -42.94969177246094, "global_step": 289347, "epoch": 2391} {"train_loss": -41.691280364990234, "global_step": 289348, "epoch": 2391} {"train_loss": -42.148536682128906, "global_step": 289349, "epoch": 2391} {"train_loss": -38.422916412353516, "global_step": 289350, "epoch": 2391} {"train_loss": -42.761817932128906, "global_step": 289351, "epoch": 2391} {"train_loss": -43.19527816772461, "global_step": 289352, "epoch": 2391} {"train_loss": -41.889892578125, "global_step": 289353, "epoch": 2391} {"train_loss": -42.296138763427734, "global_step": 289354, "epoch": 2391} {"train_loss": -40.83694076538086, "global_step": 289355, "epoch": 2391} {"train_loss": -42.7736930847168, "global_step": 289356, "epoch": 2391} {"train_loss": -41.525753021240234, "global_step": 289357, "epoch": 2391} {"train_loss": -43.03095245361328, "global_step": 289358, "epoch": 2391} {"train_loss": -42.52773666381836, "global_step": 289359, "epoch": 2391} {"train_loss": -43.07190704345703, "global_step": 289360, "epoch": 2391} {"train_loss": -42.422080993652344, "global_step": 289361, "epoch": 2391} {"train_loss": -41.18037796020508, "global_step": 289362, "epoch": 2391} {"train_loss": -41.80512619018555, "global_step": 289363, "epoch": 2391} {"train_loss": -42.66941833496094, "global_step": 289364, "epoch": 2391} {"train_loss": -39.61853790283203, "global_step": 289365, "epoch": 2391} {"train_loss": -38.1972541809082, "global_step": 289366, "epoch": 2391} {"train_loss": -42.63096237182617, "global_step": 289367, "epoch": 2391} {"train_loss": -41.699676513671875, "global_step": 289368, "epoch": 2391} {"train_loss": -42.19576644897461, "global_step": 289369, "epoch": 2391} {"train_loss": -39.18675994873047, "global_step": 289370, "epoch": 2391} {"train_loss": -42.57203674316406, "global_step": 289371, "epoch": 2391} {"train_loss": -41.984859466552734, "global_step": 289372, "epoch": 2391} {"train_loss": -42.46952438354492, "global_step": 289373, "epoch": 2391} {"train_loss": -40.81697463989258, "global_step": 289374, "epoch": 2391} {"train_loss": -41.61743927001953, "global_step": 289375, "epoch": 2391} {"train_loss": -42.184078216552734, "global_step": 289376, "epoch": 2391} {"train_loss": -38.40460205078125, "global_step": 289377, "epoch": 2391} {"train_loss": -40.645259857177734, "global_step": 289378, "epoch": 2391} {"train_loss": -40.16530990600586, "global_step": 289379, "epoch": 2391} {"train_loss": -42.754058837890625, "global_step": 289380, "epoch": 2391} {"train_loss": -41.70313262939453, "global_step": 289381, "epoch": 2391} {"train_loss": -41.15410232543945, "global_step": 289382, "epoch": 2391} {"train_loss": -42.25551986694336, "global_step": 289383, "epoch": 2391} {"train_loss": -39.766990661621094, "global_step": 289384, "epoch": 2391} {"train_loss": -41.37351608276367, "global_step": 289385, "epoch": 2391} {"train_loss": -42.50907897949219, "global_step": 289386, "epoch": 2391} {"train_loss": -41.36623764038086, "global_step": 289387, "epoch": 2391} {"train_loss": -42.75124740600586, "global_step": 289388, "epoch": 2391} {"train_loss": -41.184932708740234, "global_step": 289389, "epoch": 2391} {"train_loss": -41.81378173828125, "global_step": 289390, "epoch": 2391} {"train_loss": -40.9980354309082, "global_step": 289391, "epoch": 2391} {"train_loss": -40.05348587036133, "global_step": 289392, "epoch": 2391} {"train_loss": -40.89971160888672, "global_step": 289393, "epoch": 2391} {"train_loss": -42.06234359741211, "global_step": 289394, "epoch": 2391} {"train_loss": -39.81998825073242, "global_step": 289395, "epoch": 2391} {"train_loss": -40.54629135131836, "global_step": 289396, "epoch": 2391} {"train_loss": -41.33427429199219, "global_step": 289397, "epoch": 2391} {"train_loss": -40.15902328491211, "global_step": 289398, "epoch": 2391} {"train_loss": -40.20355987548828, "global_step": 289399, "epoch": 2391} {"train_loss": -40.5071907043457, "global_step": 289400, "epoch": 2391} {"train_loss": -40.38759231567383, "global_step": 289401, "epoch": 2391} {"train_loss": -41.56256866455078, "global_step": 289402, "epoch": 2391} {"train_loss": -40.894107818603516, "global_step": 289403, "epoch": 2391} {"train_loss": -41.292083740234375, "global_step": 289404, "epoch": 2391} {"train_loss": -41.24027633666992, "global_step": 289405, "epoch": 2391} {"train_loss": -41.63650894165039, "global_step": 289406, "epoch": 2391} {"train_loss": -40.749244689941406, "global_step": 289407, "epoch": 2391} {"train_loss": -41.064327239990234, "global_step": 289408, "epoch": 2391} {"train_loss": -41.98299789428711, "global_step": 289409, "epoch": 2391} {"train_loss": -42.31488037109375, "global_step": 289410, "epoch": 2391} {"train_loss": -41.61735153198242, "global_step": 289411, "epoch": 2391} {"train_loss": -42.808502197265625, "global_step": 289412, "epoch": 2391} {"train_loss": -40.583473205566406, "global_step": 289413, "epoch": 2391} {"train_loss": -42.50715255737305, "global_step": 289414, "epoch": 2391} {"train_loss": -42.0223388671875, "global_step": 289415, "epoch": 2391} {"train_loss": -41.255611419677734, "global_step": 289416, "epoch": 2391} {"train_loss": -41.695613861083984, "global_step": 289417, "epoch": 2391} {"train_loss": -42.63790512084961, "global_step": 289418, "epoch": 2391} {"train_loss": -42.44023513793945, "global_step": 289419, "epoch": 2391} {"train_loss": -42.697265625, "global_step": 289420, "epoch": 2391} {"train_loss": -42.806556701660156, "global_step": 289421, "epoch": 2391} {"train_loss": -42.60136032104492, "global_step": 289422, "epoch": 2391} {"train_loss": -42.47581100463867, "global_step": 289423, "epoch": 2391} {"train_loss": -41.832191467285156, "global_step": 289424, "epoch": 2391} {"train_loss": -43.0263786315918, "global_step": 289425, "epoch": 2391} {"train_loss": -43.299171447753906, "global_step": 289426, "epoch": 2391} {"train_loss": -42.27977752685547, "global_step": 289427, "epoch": 2391} {"train_loss": -43.38148880004883, "global_step": 289428, "epoch": 2391} {"train_loss": -42.62058639526367, "global_step": 289429, "epoch": 2391} {"train_loss": -43.222084045410156, "global_step": 289430, "epoch": 2391} {"train_loss": -41.99479249686249, "global_step": 289431, "epoch": 2391, "val_loss": 2488535.75} {"train_loss": -41.118873596191406, "global_step": 289432, "epoch": 2392} {"train_loss": -43.364620208740234, "global_step": 289433, "epoch": 2392} {"train_loss": -42.94972610473633, "global_step": 289434, "epoch": 2392} {"train_loss": -42.62776565551758, "global_step": 289435, "epoch": 2392} {"train_loss": -43.3948860168457, "global_step": 289436, "epoch": 2392} {"train_loss": -42.74774932861328, "global_step": 289437, "epoch": 2392} {"train_loss": -43.58671188354492, "global_step": 289438, "epoch": 2392} {"train_loss": -42.933406829833984, "global_step": 289439, "epoch": 2392} {"train_loss": -43.03731918334961, "global_step": 289440, "epoch": 2392} {"train_loss": -42.65110397338867, "global_step": 289441, "epoch": 2392} {"train_loss": -43.59121322631836, "global_step": 289442, "epoch": 2392} {"train_loss": -43.156551361083984, "global_step": 289443, "epoch": 2392} {"train_loss": -43.03020095825195, "global_step": 289444, "epoch": 2392} {"train_loss": -42.627052307128906, "global_step": 289445, "epoch": 2392} {"train_loss": -43.40525436401367, "global_step": 289446, "epoch": 2392} {"train_loss": -43.31687927246094, "global_step": 289447, "epoch": 2392} {"train_loss": -43.68708801269531, "global_step": 289448, "epoch": 2392} {"train_loss": -39.26630783081055, "global_step": 289449, "epoch": 2392} {"train_loss": -41.01087951660156, "global_step": 289450, "epoch": 2392} {"train_loss": -42.7871208190918, "global_step": 289451, "epoch": 2392} {"train_loss": -43.326820373535156, "global_step": 289452, "epoch": 2392} {"train_loss": -42.05317306518555, "global_step": 289453, "epoch": 2392} {"train_loss": -42.32039260864258, "global_step": 289454, "epoch": 2392} {"train_loss": -42.541847229003906, "global_step": 289455, "epoch": 2392} {"train_loss": -42.98053741455078, "global_step": 289456, "epoch": 2392} {"train_loss": -42.9563102722168, "global_step": 289457, "epoch": 2392} {"train_loss": -42.793697357177734, "global_step": 289458, "epoch": 2392} {"train_loss": -43.68825912475586, "global_step": 289459, "epoch": 2392} {"train_loss": -43.389339447021484, "global_step": 289460, "epoch": 2392} {"train_loss": -42.51768493652344, "global_step": 289461, "epoch": 2392} {"train_loss": -43.59000778198242, "global_step": 289462, "epoch": 2392} {"train_loss": -42.5750732421875, "global_step": 289463, "epoch": 2392} {"train_loss": -43.449092864990234, "global_step": 289464, "epoch": 2392} {"train_loss": -42.75490951538086, "global_step": 289465, "epoch": 2392} {"train_loss": -43.70578384399414, "global_step": 289466, "epoch": 2392} {"train_loss": -43.19587326049805, "global_step": 289467, "epoch": 2392} {"train_loss": -42.46885299682617, "global_step": 289468, "epoch": 2392} {"train_loss": -42.62944412231445, "global_step": 289469, "epoch": 2392} {"train_loss": -42.92905807495117, "global_step": 289470, "epoch": 2392} {"train_loss": -42.083858489990234, "global_step": 289471, "epoch": 2392} {"train_loss": -39.184730529785156, "global_step": 289472, "epoch": 2392} {"train_loss": -40.96869659423828, "global_step": 289473, "epoch": 2392} {"train_loss": -42.20777130126953, "global_step": 289474, "epoch": 2392} {"train_loss": -40.45916748046875, "global_step": 289475, "epoch": 2392} {"train_loss": -41.08711624145508, "global_step": 289476, "epoch": 2392} {"train_loss": -43.20904541015625, "global_step": 289477, "epoch": 2392} {"train_loss": -42.49076843261719, "global_step": 289478, "epoch": 2392} {"train_loss": -41.333656311035156, "global_step": 289479, "epoch": 2392} {"train_loss": -40.4501838684082, "global_step": 289480, "epoch": 2392} {"train_loss": -42.46106719970703, "global_step": 289481, "epoch": 2392} {"train_loss": -41.94144821166992, "global_step": 289482, "epoch": 2392} {"train_loss": -40.64127731323242, "global_step": 289483, "epoch": 2392} {"train_loss": -42.731380462646484, "global_step": 289484, "epoch": 2392} {"train_loss": -40.446041107177734, "global_step": 289485, "epoch": 2392} {"train_loss": -39.160335540771484, "global_step": 289486, "epoch": 2392} {"train_loss": -38.82070541381836, "global_step": 289487, "epoch": 2392} {"train_loss": -42.46696090698242, "global_step": 289488, "epoch": 2392} {"train_loss": -38.97710037231445, "global_step": 289489, "epoch": 2392} {"train_loss": -38.41585159301758, "global_step": 289490, "epoch": 2392} {"train_loss": -41.442745208740234, "global_step": 289491, "epoch": 2392} {"train_loss": -41.49496078491211, "global_step": 289492, "epoch": 2392} {"train_loss": -38.749855041503906, "global_step": 289493, "epoch": 2392} {"train_loss": -42.307979583740234, "global_step": 289494, "epoch": 2392} {"train_loss": -40.89468002319336, "global_step": 289495, "epoch": 2392} {"train_loss": -41.37791061401367, "global_step": 289496, "epoch": 2392} {"train_loss": -40.3856201171875, "global_step": 289497, "epoch": 2392} {"train_loss": -38.022701263427734, "global_step": 289498, "epoch": 2392} {"train_loss": -42.058860778808594, "global_step": 289499, "epoch": 2392} {"train_loss": -40.85725021362305, "global_step": 289500, "epoch": 2392} {"train_loss": -40.39741134643555, "global_step": 289501, "epoch": 2392} {"train_loss": -42.11865997314453, "global_step": 289502, "epoch": 2392} {"train_loss": -40.27722930908203, "global_step": 289503, "epoch": 2392} {"train_loss": -41.58994674682617, "global_step": 289504, "epoch": 2392} {"train_loss": -41.215576171875, "global_step": 289505, "epoch": 2392} {"train_loss": -42.89051055908203, "global_step": 289506, "epoch": 2392} {"train_loss": -42.20209884643555, "global_step": 289507, "epoch": 2392} {"train_loss": -41.127723693847656, "global_step": 289508, "epoch": 2392} {"train_loss": -41.527915954589844, "global_step": 289509, "epoch": 2392} {"train_loss": -41.06392288208008, "global_step": 289510, "epoch": 2392} {"train_loss": -41.517147064208984, "global_step": 289511, "epoch": 2392} {"train_loss": -42.16680908203125, "global_step": 289512, "epoch": 2392} {"train_loss": -42.8390998840332, "global_step": 289513, "epoch": 2392} {"train_loss": -42.191280364990234, "global_step": 289514, "epoch": 2392} {"train_loss": -42.74020004272461, "global_step": 289515, "epoch": 2392} {"train_loss": -43.39677047729492, "global_step": 289516, "epoch": 2392} {"train_loss": -42.165313720703125, "global_step": 289517, "epoch": 2392} {"train_loss": -42.90204620361328, "global_step": 289518, "epoch": 2392} {"train_loss": -42.21151351928711, "global_step": 289519, "epoch": 2392} {"train_loss": -39.66634750366211, "global_step": 289520, "epoch": 2392} {"train_loss": -42.92994689941406, "global_step": 289521, "epoch": 2392} {"train_loss": -42.8288688659668, "global_step": 289522, "epoch": 2392} {"train_loss": -42.905853271484375, "global_step": 289523, "epoch": 2392} {"train_loss": -42.1811408996582, "global_step": 289524, "epoch": 2392} {"train_loss": -42.86421585083008, "global_step": 289525, "epoch": 2392} {"train_loss": -42.6708869934082, "global_step": 289526, "epoch": 2392} {"train_loss": -43.4039421081543, "global_step": 289527, "epoch": 2392} {"train_loss": -42.991363525390625, "global_step": 289528, "epoch": 2392} {"train_loss": -42.47756576538086, "global_step": 289529, "epoch": 2392} {"train_loss": -43.27375411987305, "global_step": 289530, "epoch": 2392} {"train_loss": -43.891937255859375, "global_step": 289531, "epoch": 2392} {"train_loss": -43.88674545288086, "global_step": 289532, "epoch": 2392} {"train_loss": -41.123985290527344, "global_step": 289533, "epoch": 2392} {"train_loss": -43.715450286865234, "global_step": 289534, "epoch": 2392} {"train_loss": -42.83334732055664, "global_step": 289535, "epoch": 2392} {"train_loss": -43.402992248535156, "global_step": 289536, "epoch": 2392} {"train_loss": -43.4036979675293, "global_step": 289537, "epoch": 2392} {"train_loss": -43.08989334106445, "global_step": 289538, "epoch": 2392} {"train_loss": -43.391273498535156, "global_step": 289539, "epoch": 2392} {"train_loss": -43.45567321777344, "global_step": 289540, "epoch": 2392} {"train_loss": -42.80154800415039, "global_step": 289541, "epoch": 2392} {"train_loss": -43.561737060546875, "global_step": 289542, "epoch": 2392} {"train_loss": -43.439697265625, "global_step": 289543, "epoch": 2392} {"train_loss": -43.74219512939453, "global_step": 289544, "epoch": 2392} {"train_loss": -43.36946487426758, "global_step": 289545, "epoch": 2392} {"train_loss": -43.88431930541992, "global_step": 289546, "epoch": 2392} {"train_loss": -41.940956115722656, "global_step": 289547, "epoch": 2392} {"train_loss": -43.80226135253906, "global_step": 289548, "epoch": 2392} {"train_loss": -42.39227294921875, "global_step": 289549, "epoch": 2392} {"train_loss": -43.802921295166016, "global_step": 289550, "epoch": 2392} {"train_loss": -43.6453742980957, "global_step": 289551, "epoch": 2392} {"train_loss": -42.26805918669898, "global_step": 289552, "epoch": 2392, "val_loss": 2434215.75} {"train_loss": -43.57111740112305, "global_step": 289553, "epoch": 2393} {"train_loss": -44.33869552612305, "global_step": 289554, "epoch": 2393} {"train_loss": -42.863433837890625, "global_step": 289555, "epoch": 2393} {"train_loss": -41.608699798583984, "global_step": 289556, "epoch": 2393} {"train_loss": -43.90432357788086, "global_step": 289557, "epoch": 2393} {"train_loss": -42.71506118774414, "global_step": 289558, "epoch": 2393} {"train_loss": -43.6882209777832, "global_step": 289559, "epoch": 2393} {"train_loss": -44.105377197265625, "global_step": 289560, "epoch": 2393} {"train_loss": -43.61552047729492, "global_step": 289561, "epoch": 2393} {"train_loss": -43.806243896484375, "global_step": 289562, "epoch": 2393} {"train_loss": -43.767887115478516, "global_step": 289563, "epoch": 2393} {"train_loss": -43.5794792175293, "global_step": 289564, "epoch": 2393} {"train_loss": -43.470882415771484, "global_step": 289565, "epoch": 2393} {"train_loss": -43.03365707397461, "global_step": 289566, "epoch": 2393} {"train_loss": -41.4210319519043, "global_step": 289567, "epoch": 2393} {"train_loss": -43.37282943725586, "global_step": 289568, "epoch": 2393} {"train_loss": -43.70907211303711, "global_step": 289569, "epoch": 2393} {"train_loss": -43.951656341552734, "global_step": 289570, "epoch": 2393} {"train_loss": -43.514774322509766, "global_step": 289571, "epoch": 2393} {"train_loss": -42.85793685913086, "global_step": 289572, "epoch": 2393} {"train_loss": -43.00532150268555, "global_step": 289573, "epoch": 2393} {"train_loss": -40.790313720703125, "global_step": 289574, "epoch": 2393} {"train_loss": -41.54508972167969, "global_step": 289575, "epoch": 2393} {"train_loss": -43.1008415222168, "global_step": 289576, "epoch": 2393} {"train_loss": -41.496578216552734, "global_step": 289577, "epoch": 2393} {"train_loss": -42.708003997802734, "global_step": 289578, "epoch": 2393} {"train_loss": -42.28718185424805, "global_step": 289579, "epoch": 2393} {"train_loss": -43.41823959350586, "global_step": 289580, "epoch": 2393} {"train_loss": -42.761505126953125, "global_step": 289581, "epoch": 2393} {"train_loss": -42.45314407348633, "global_step": 289582, "epoch": 2393} {"train_loss": -41.88957214355469, "global_step": 289583, "epoch": 2393} {"train_loss": -42.16312789916992, "global_step": 289584, "epoch": 2393} {"train_loss": -41.41035842895508, "global_step": 289585, "epoch": 2393} {"train_loss": -38.651424407958984, "global_step": 289586, "epoch": 2393} {"train_loss": -43.204097747802734, "global_step": 289587, "epoch": 2393} {"train_loss": -42.95854949951172, "global_step": 289588, "epoch": 2393} {"train_loss": -40.059635162353516, "global_step": 289589, "epoch": 2393} {"train_loss": -40.763641357421875, "global_step": 289590, "epoch": 2393} {"train_loss": -40.358802795410156, "global_step": 289591, "epoch": 2393} {"train_loss": -42.665828704833984, "global_step": 289592, "epoch": 2393} {"train_loss": -42.461082458496094, "global_step": 289593, "epoch": 2393} {"train_loss": -38.992191314697266, "global_step": 289594, "epoch": 2393} {"train_loss": -36.715702056884766, "global_step": 289595, "epoch": 2393} {"train_loss": -41.72157287597656, "global_step": 289596, "epoch": 2393} {"train_loss": -42.35633087158203, "global_step": 289597, "epoch": 2393} {"train_loss": -41.826080322265625, "global_step": 289598, "epoch": 2393} {"train_loss": -40.66478729248047, "global_step": 289599, "epoch": 2393} {"train_loss": -41.02711868286133, "global_step": 289600, "epoch": 2393} {"train_loss": -41.487518310546875, "global_step": 289601, "epoch": 2393} {"train_loss": -40.706417083740234, "global_step": 289602, "epoch": 2393} {"train_loss": -36.27874755859375, "global_step": 289603, "epoch": 2393} {"train_loss": -39.13337707519531, "global_step": 289604, "epoch": 2393} {"train_loss": -40.86283493041992, "global_step": 289605, "epoch": 2393} {"train_loss": -37.030548095703125, "global_step": 289606, "epoch": 2393} {"train_loss": -42.265380859375, "global_step": 289607, "epoch": 2393} {"train_loss": -40.085567474365234, "global_step": 289608, "epoch": 2393} {"train_loss": -36.62949752807617, "global_step": 289609, "epoch": 2393} {"train_loss": -38.09629440307617, "global_step": 289610, "epoch": 2393} {"train_loss": -38.14051055908203, "global_step": 289611, "epoch": 2393} {"train_loss": -39.781803131103516, "global_step": 289612, "epoch": 2393} {"train_loss": -36.04526901245117, "global_step": 289613, "epoch": 2393} {"train_loss": -40.22397994995117, "global_step": 289614, "epoch": 2393} {"train_loss": -39.969459533691406, "global_step": 289615, "epoch": 2393} {"train_loss": -41.57465362548828, "global_step": 289616, "epoch": 2393} {"train_loss": -41.47731018066406, "global_step": 289617, "epoch": 2393} {"train_loss": -37.87462615966797, "global_step": 289618, "epoch": 2393} {"train_loss": -40.92576599121094, "global_step": 289619, "epoch": 2393} {"train_loss": -37.0401611328125, "global_step": 289620, "epoch": 2393} {"train_loss": -38.73342514038086, "global_step": 289621, "epoch": 2393} {"train_loss": -40.9891242980957, "global_step": 289622, "epoch": 2393} {"train_loss": -37.48783874511719, "global_step": 289623, "epoch": 2393} {"train_loss": -41.3071403503418, "global_step": 289624, "epoch": 2393} {"train_loss": -39.25936508178711, "global_step": 289625, "epoch": 2393} {"train_loss": -37.82790756225586, "global_step": 289626, "epoch": 2393} {"train_loss": -38.317848205566406, "global_step": 289627, "epoch": 2393} {"train_loss": -39.79262924194336, "global_step": 289628, "epoch": 2393} {"train_loss": -40.9006233215332, "global_step": 289629, "epoch": 2393} {"train_loss": -37.615272521972656, "global_step": 289630, "epoch": 2393} {"train_loss": -39.937774658203125, "global_step": 289631, "epoch": 2393} {"train_loss": -39.95647048950195, "global_step": 289632, "epoch": 2393} {"train_loss": -39.88630294799805, "global_step": 289633, "epoch": 2393} {"train_loss": -42.278438568115234, "global_step": 289634, "epoch": 2393} {"train_loss": -40.50642776489258, "global_step": 289635, "epoch": 2393} {"train_loss": -42.06150436401367, "global_step": 289636, "epoch": 2393} {"train_loss": -40.215938568115234, "global_step": 289637, "epoch": 2393} {"train_loss": -42.1098747253418, "global_step": 289638, "epoch": 2393} {"train_loss": -40.369659423828125, "global_step": 289639, "epoch": 2393} {"train_loss": -41.475807189941406, "global_step": 289640, "epoch": 2393} {"train_loss": -39.88507080078125, "global_step": 289641, "epoch": 2393} {"train_loss": -40.86833572387695, "global_step": 289642, "epoch": 2393} {"train_loss": -41.90625, "global_step": 289643, "epoch": 2393} {"train_loss": -41.34184646606445, "global_step": 289644, "epoch": 2393} {"train_loss": -40.83845138549805, "global_step": 289645, "epoch": 2393} {"train_loss": -42.053375244140625, "global_step": 289646, "epoch": 2393} {"train_loss": -41.415401458740234, "global_step": 289647, "epoch": 2393} {"train_loss": -41.51179504394531, "global_step": 289648, "epoch": 2393} {"train_loss": -39.58906173706055, "global_step": 289649, "epoch": 2393} {"train_loss": -41.64240264892578, "global_step": 289650, "epoch": 2393} {"train_loss": -40.74958038330078, "global_step": 289651, "epoch": 2393} {"train_loss": -41.76093292236328, "global_step": 289652, "epoch": 2393} {"train_loss": -39.814125061035156, "global_step": 289653, "epoch": 2393} {"train_loss": -39.7829475402832, "global_step": 289654, "epoch": 2393} {"train_loss": -40.42429733276367, "global_step": 289655, "epoch": 2393} {"train_loss": -41.46791076660156, "global_step": 289656, "epoch": 2393} {"train_loss": -42.11444854736328, "global_step": 289657, "epoch": 2393} {"train_loss": -42.67550277709961, "global_step": 289658, "epoch": 2393} {"train_loss": -42.158775329589844, "global_step": 289659, "epoch": 2393} {"train_loss": -41.810726165771484, "global_step": 289660, "epoch": 2393} {"train_loss": -42.49714660644531, "global_step": 289661, "epoch": 2393} {"train_loss": -40.62299728393555, "global_step": 289662, "epoch": 2393} {"train_loss": -41.577327728271484, "global_step": 289663, "epoch": 2393} {"train_loss": -42.762474060058594, "global_step": 289664, "epoch": 2393} {"train_loss": -41.6494255065918, "global_step": 289665, "epoch": 2393} {"train_loss": -41.96671676635742, "global_step": 289666, "epoch": 2393} {"train_loss": -42.32355499267578, "global_step": 289667, "epoch": 2393} {"train_loss": -42.04011154174805, "global_step": 289668, "epoch": 2393} {"train_loss": -40.24001693725586, "global_step": 289669, "epoch": 2393} {"train_loss": -40.81144714355469, "global_step": 289670, "epoch": 2393} {"train_loss": -42.39793014526367, "global_step": 289671, "epoch": 2393} {"train_loss": -42.4853515625, "global_step": 289672, "epoch": 2393} {"train_loss": -41.19715663815333, "global_step": 289673, "epoch": 2393, "val_loss": 2587681.0} {"train_loss": -41.666255950927734, "global_step": 289674, "epoch": 2394} {"train_loss": -42.660888671875, "global_step": 289675, "epoch": 2394} {"train_loss": -42.778751373291016, "global_step": 289676, "epoch": 2394} {"train_loss": -42.7913932800293, "global_step": 289677, "epoch": 2394} {"train_loss": -42.649452209472656, "global_step": 289678, "epoch": 2394} {"train_loss": -42.60193634033203, "global_step": 289679, "epoch": 2394} {"train_loss": -38.55702209472656, "global_step": 289680, "epoch": 2394} {"train_loss": -42.05154037475586, "global_step": 289681, "epoch": 2394} {"train_loss": -42.7805290222168, "global_step": 289682, "epoch": 2394} {"train_loss": -42.08468246459961, "global_step": 289683, "epoch": 2394} {"train_loss": -42.45235824584961, "global_step": 289684, "epoch": 2394} {"train_loss": -43.15298843383789, "global_step": 289685, "epoch": 2394} {"train_loss": -42.79197311401367, "global_step": 289686, "epoch": 2394} {"train_loss": -42.136131286621094, "global_step": 289687, "epoch": 2394} {"train_loss": -43.159114837646484, "global_step": 289688, "epoch": 2394} {"train_loss": -41.402191162109375, "global_step": 289689, "epoch": 2394} {"train_loss": -43.058040618896484, "global_step": 289690, "epoch": 2394} {"train_loss": -42.213008880615234, "global_step": 289691, "epoch": 2394} {"train_loss": -40.573944091796875, "global_step": 289692, "epoch": 2394} {"train_loss": -42.53333282470703, "global_step": 289693, "epoch": 2394} {"train_loss": -42.62732696533203, "global_step": 289694, "epoch": 2394} {"train_loss": -42.26277542114258, "global_step": 289695, "epoch": 2394} {"train_loss": -41.087345123291016, "global_step": 289696, "epoch": 2394} {"train_loss": -43.09316635131836, "global_step": 289697, "epoch": 2394} {"train_loss": -42.83320236206055, "global_step": 289698, "epoch": 2394} {"train_loss": -42.78520965576172, "global_step": 289699, "epoch": 2394} {"train_loss": -42.89113998413086, "global_step": 289700, "epoch": 2394} {"train_loss": -43.41188430786133, "global_step": 289701, "epoch": 2394} {"train_loss": -42.9842643737793, "global_step": 289702, "epoch": 2394} {"train_loss": -41.8390007019043, "global_step": 289703, "epoch": 2394} {"train_loss": -42.54085922241211, "global_step": 289704, "epoch": 2394} {"train_loss": -42.41522216796875, "global_step": 289705, "epoch": 2394} {"train_loss": -42.166194915771484, "global_step": 289706, "epoch": 2394} {"train_loss": -40.43952941894531, "global_step": 289707, "epoch": 2394} {"train_loss": -43.10122299194336, "global_step": 289708, "epoch": 2394} {"train_loss": -43.2307243347168, "global_step": 289709, "epoch": 2394} {"train_loss": -43.22247314453125, "global_step": 289710, "epoch": 2394} {"train_loss": -42.86418533325195, "global_step": 289711, "epoch": 2394} {"train_loss": -43.066158294677734, "global_step": 289712, "epoch": 2394} {"train_loss": -43.08966827392578, "global_step": 289713, "epoch": 2394} {"train_loss": -42.64716720581055, "global_step": 289714, "epoch": 2394} {"train_loss": -42.74387741088867, "global_step": 289715, "epoch": 2394} {"train_loss": -43.51797103881836, "global_step": 289716, "epoch": 2394} {"train_loss": -43.09107971191406, "global_step": 289717, "epoch": 2394} {"train_loss": -40.55059814453125, "global_step": 289718, "epoch": 2394} {"train_loss": -43.0930061340332, "global_step": 289719, "epoch": 2394} {"train_loss": -42.61701965332031, "global_step": 289720, "epoch": 2394} {"train_loss": -42.122249603271484, "global_step": 289721, "epoch": 2394} {"train_loss": -42.4468994140625, "global_step": 289722, "epoch": 2394} {"train_loss": -43.54045486450195, "global_step": 289723, "epoch": 2394} {"train_loss": -42.976051330566406, "global_step": 289724, "epoch": 2394} {"train_loss": -41.86739730834961, "global_step": 289725, "epoch": 2394} {"train_loss": -42.85919952392578, "global_step": 289726, "epoch": 2394} {"train_loss": -43.01283264160156, "global_step": 289727, "epoch": 2394} {"train_loss": -43.116878509521484, "global_step": 289728, "epoch": 2394} {"train_loss": -43.685001373291016, "global_step": 289729, "epoch": 2394} {"train_loss": -43.006065368652344, "global_step": 289730, "epoch": 2394} {"train_loss": -43.138893127441406, "global_step": 289731, "epoch": 2394} {"train_loss": -43.22636032104492, "global_step": 289732, "epoch": 2394} {"train_loss": -43.372657775878906, "global_step": 289733, "epoch": 2394} {"train_loss": -43.824432373046875, "global_step": 289734, "epoch": 2394} {"train_loss": -43.37736129760742, "global_step": 289735, "epoch": 2394} {"train_loss": -43.33036422729492, "global_step": 289736, "epoch": 2394} {"train_loss": -43.40974807739258, "global_step": 289737, "epoch": 2394} {"train_loss": -43.46529006958008, "global_step": 289738, "epoch": 2394} {"train_loss": -43.477420806884766, "global_step": 289739, "epoch": 2394} {"train_loss": -43.662567138671875, "global_step": 289740, "epoch": 2394} {"train_loss": -43.855125427246094, "global_step": 289741, "epoch": 2394} {"train_loss": -42.82617950439453, "global_step": 289742, "epoch": 2394} {"train_loss": -44.093116760253906, "global_step": 289743, "epoch": 2394} {"train_loss": -43.867977142333984, "global_step": 289744, "epoch": 2394} {"train_loss": -43.31827926635742, "global_step": 289745, "epoch": 2394} {"train_loss": -43.90538024902344, "global_step": 289746, "epoch": 2394} {"train_loss": -44.32747268676758, "global_step": 289747, "epoch": 2394} {"train_loss": -43.32327651977539, "global_step": 289748, "epoch": 2394} {"train_loss": -43.7427978515625, "global_step": 289749, "epoch": 2394} {"train_loss": -43.71031951904297, "global_step": 289750, "epoch": 2394} {"train_loss": -42.77478790283203, "global_step": 289751, "epoch": 2394} {"train_loss": -43.07499313354492, "global_step": 289752, "epoch": 2394} {"train_loss": -43.02539825439453, "global_step": 289753, "epoch": 2394} {"train_loss": -41.981712341308594, "global_step": 289754, "epoch": 2394} {"train_loss": -43.10903549194336, "global_step": 289755, "epoch": 2394} {"train_loss": -43.50796890258789, "global_step": 289756, "epoch": 2394} {"train_loss": -43.68337631225586, "global_step": 289757, "epoch": 2394} {"train_loss": -42.63033676147461, "global_step": 289758, "epoch": 2394} {"train_loss": -43.57500076293945, "global_step": 289759, "epoch": 2394} {"train_loss": -42.570526123046875, "global_step": 289760, "epoch": 2394} {"train_loss": -44.11033248901367, "global_step": 289761, "epoch": 2394} {"train_loss": -43.59530258178711, "global_step": 289762, "epoch": 2394} {"train_loss": -42.487178802490234, "global_step": 289763, "epoch": 2394} {"train_loss": -41.30354690551758, "global_step": 289764, "epoch": 2394} {"train_loss": -40.961334228515625, "global_step": 289765, "epoch": 2394} {"train_loss": -43.195491790771484, "global_step": 289766, "epoch": 2394} {"train_loss": -43.48961639404297, "global_step": 289767, "epoch": 2394} {"train_loss": -41.8946647644043, "global_step": 289768, "epoch": 2394} {"train_loss": -41.70595932006836, "global_step": 289769, "epoch": 2394} {"train_loss": -41.74872970581055, "global_step": 289770, "epoch": 2394} {"train_loss": -43.320533752441406, "global_step": 289771, "epoch": 2394} {"train_loss": -42.636356353759766, "global_step": 289772, "epoch": 2394} {"train_loss": -42.62919616699219, "global_step": 289773, "epoch": 2394} {"train_loss": -43.69901657104492, "global_step": 289774, "epoch": 2394} {"train_loss": -43.749305725097656, "global_step": 289775, "epoch": 2394} {"train_loss": -43.880184173583984, "global_step": 289776, "epoch": 2394} {"train_loss": -42.75147247314453, "global_step": 289777, "epoch": 2394} {"train_loss": -42.272064208984375, "global_step": 289778, "epoch": 2394} {"train_loss": -43.025146484375, "global_step": 289779, "epoch": 2394} {"train_loss": -43.168182373046875, "global_step": 289780, "epoch": 2394} {"train_loss": -43.45636749267578, "global_step": 289781, "epoch": 2394} {"train_loss": -43.51830291748047, "global_step": 289782, "epoch": 2394} {"train_loss": -42.9295654296875, "global_step": 289783, "epoch": 2394} {"train_loss": -41.79037094116211, "global_step": 289784, "epoch": 2394} {"train_loss": -41.41282272338867, "global_step": 289785, "epoch": 2394} {"train_loss": -42.06752395629883, "global_step": 289786, "epoch": 2394} {"train_loss": -43.12710189819336, "global_step": 289787, "epoch": 2394} {"train_loss": -42.26620864868164, "global_step": 289788, "epoch": 2394} {"train_loss": -37.208961486816406, "global_step": 289789, "epoch": 2394} {"train_loss": -40.97860336303711, "global_step": 289790, "epoch": 2394} {"train_loss": -41.240047454833984, "global_step": 289791, "epoch": 2394} {"train_loss": -41.1431770324707, "global_step": 289792, "epoch": 2394} {"train_loss": -37.22959518432617, "global_step": 289793, "epoch": 2394} {"train_loss": -42.620668742282334, "global_step": 289794, "epoch": 2394, "val_loss": 2497196.0} {"train_loss": -38.27389144897461, "global_step": 289795, "epoch": 2395} {"train_loss": -41.65083312988281, "global_step": 289796, "epoch": 2395} {"train_loss": -39.52170944213867, "global_step": 289797, "epoch": 2395} {"train_loss": -36.40947723388672, "global_step": 289798, "epoch": 2395} {"train_loss": -38.17523193359375, "global_step": 289799, "epoch": 2395} {"train_loss": -38.27727127075195, "global_step": 289800, "epoch": 2395} {"train_loss": -40.57612228393555, "global_step": 289801, "epoch": 2395} {"train_loss": -39.83882522583008, "global_step": 289802, "epoch": 2395} {"train_loss": -41.088836669921875, "global_step": 289803, "epoch": 2395} {"train_loss": -41.92937088012695, "global_step": 289804, "epoch": 2395} {"train_loss": -40.38262176513672, "global_step": 289805, "epoch": 2395} {"train_loss": -42.261322021484375, "global_step": 289806, "epoch": 2395} {"train_loss": -41.8236083984375, "global_step": 289807, "epoch": 2395} {"train_loss": -42.04572677612305, "global_step": 289808, "epoch": 2395} {"train_loss": -42.93941116333008, "global_step": 289809, "epoch": 2395} {"train_loss": -41.18058395385742, "global_step": 289810, "epoch": 2395} {"train_loss": -42.448951721191406, "global_step": 289811, "epoch": 2395} {"train_loss": -42.343929290771484, "global_step": 289812, "epoch": 2395} {"train_loss": -41.985328674316406, "global_step": 289813, "epoch": 2395} {"train_loss": -42.21126937866211, "global_step": 289814, "epoch": 2395} {"train_loss": -41.752906799316406, "global_step": 289815, "epoch": 2395} {"train_loss": -42.974666595458984, "global_step": 289816, "epoch": 2395} {"train_loss": -42.5744514465332, "global_step": 289817, "epoch": 2395} {"train_loss": -41.45530319213867, "global_step": 289818, "epoch": 2395} {"train_loss": -42.60072326660156, "global_step": 289819, "epoch": 2395} {"train_loss": -41.58767318725586, "global_step": 289820, "epoch": 2395} {"train_loss": -42.86827087402344, "global_step": 289821, "epoch": 2395} {"train_loss": -42.770484924316406, "global_step": 289822, "epoch": 2395} {"train_loss": -42.31972885131836, "global_step": 289823, "epoch": 2395} {"train_loss": -42.61642074584961, "global_step": 289824, "epoch": 2395} {"train_loss": -41.95315170288086, "global_step": 289825, "epoch": 2395} {"train_loss": -42.64906692504883, "global_step": 289826, "epoch": 2395} {"train_loss": -42.8448486328125, "global_step": 289827, "epoch": 2395} {"train_loss": -42.47834014892578, "global_step": 289828, "epoch": 2395} {"train_loss": -42.18497848510742, "global_step": 289829, "epoch": 2395} {"train_loss": -43.05685043334961, "global_step": 289830, "epoch": 2395} {"train_loss": -42.850013732910156, "global_step": 289831, "epoch": 2395} {"train_loss": -42.90304183959961, "global_step": 289832, "epoch": 2395} {"train_loss": -43.261474609375, "global_step": 289833, "epoch": 2395} {"train_loss": -42.58720397949219, "global_step": 289834, "epoch": 2395} {"train_loss": -43.08146286010742, "global_step": 289835, "epoch": 2395} {"train_loss": -43.01325988769531, "global_step": 289836, "epoch": 2395} {"train_loss": -43.68251419067383, "global_step": 289837, "epoch": 2395} {"train_loss": -43.20676803588867, "global_step": 289838, "epoch": 2395} {"train_loss": -43.524898529052734, "global_step": 289839, "epoch": 2395} {"train_loss": -43.577980041503906, "global_step": 289840, "epoch": 2395} {"train_loss": -44.076454162597656, "global_step": 289841, "epoch": 2395} {"train_loss": -43.661407470703125, "global_step": 289842, "epoch": 2395} {"train_loss": -43.42066192626953, "global_step": 289843, "epoch": 2395} {"train_loss": -43.33763122558594, "global_step": 289844, "epoch": 2395} {"train_loss": -43.736122131347656, "global_step": 289845, "epoch": 2395} {"train_loss": -42.22805404663086, "global_step": 289846, "epoch": 2395} {"train_loss": -42.77237319946289, "global_step": 289847, "epoch": 2395} {"train_loss": -43.25798416137695, "global_step": 289848, "epoch": 2395} {"train_loss": -43.59538650512695, "global_step": 289849, "epoch": 2395} {"train_loss": -43.13957595825195, "global_step": 289850, "epoch": 2395} {"train_loss": -43.34821701049805, "global_step": 289851, "epoch": 2395} {"train_loss": -41.97750473022461, "global_step": 289852, "epoch": 2395} {"train_loss": -43.691612243652344, "global_step": 289853, "epoch": 2395} {"train_loss": -42.44388198852539, "global_step": 289854, "epoch": 2395} {"train_loss": -42.97123336791992, "global_step": 289855, "epoch": 2395} {"train_loss": -43.08486557006836, "global_step": 289856, "epoch": 2395} {"train_loss": -43.78072738647461, "global_step": 289857, "epoch": 2395} {"train_loss": -43.01776885986328, "global_step": 289858, "epoch": 2395} {"train_loss": -42.46767044067383, "global_step": 289859, "epoch": 2395} {"train_loss": -43.2962646484375, "global_step": 289860, "epoch": 2395} {"train_loss": -43.33781051635742, "global_step": 289861, "epoch": 2395} {"train_loss": -42.64138412475586, "global_step": 289862, "epoch": 2395} {"train_loss": -43.695709228515625, "global_step": 289863, "epoch": 2395} {"train_loss": -43.06023025512695, "global_step": 289864, "epoch": 2395} {"train_loss": -42.084693908691406, "global_step": 289865, "epoch": 2395} {"train_loss": -43.21547317504883, "global_step": 289866, "epoch": 2395} {"train_loss": -42.979034423828125, "global_step": 289867, "epoch": 2395} {"train_loss": -43.40971755981445, "global_step": 289868, "epoch": 2395} {"train_loss": -42.4529914855957, "global_step": 289869, "epoch": 2395} {"train_loss": -43.699031829833984, "global_step": 289870, "epoch": 2395} {"train_loss": -42.49088668823242, "global_step": 289871, "epoch": 2395} {"train_loss": -40.538917541503906, "global_step": 289872, "epoch": 2395} {"train_loss": -41.836647033691406, "global_step": 289873, "epoch": 2395} {"train_loss": -43.034420013427734, "global_step": 289874, "epoch": 2395} {"train_loss": -43.974788665771484, "global_step": 289875, "epoch": 2395} {"train_loss": -42.5675163269043, "global_step": 289876, "epoch": 2395} {"train_loss": -43.397666931152344, "global_step": 289877, "epoch": 2395} {"train_loss": -43.04278564453125, "global_step": 289878, "epoch": 2395} {"train_loss": -42.85627365112305, "global_step": 289879, "epoch": 2395} {"train_loss": -42.59857940673828, "global_step": 289880, "epoch": 2395} {"train_loss": -43.70527267456055, "global_step": 289881, "epoch": 2395} {"train_loss": -42.83950424194336, "global_step": 289882, "epoch": 2395} {"train_loss": -41.0280647277832, "global_step": 289883, "epoch": 2395} {"train_loss": -43.125282287597656, "global_step": 289884, "epoch": 2395} {"train_loss": -43.341644287109375, "global_step": 289885, "epoch": 2395} {"train_loss": -42.30765914916992, "global_step": 289886, "epoch": 2395} {"train_loss": -43.21317672729492, "global_step": 289887, "epoch": 2395} {"train_loss": -43.562217712402344, "global_step": 289888, "epoch": 2395} {"train_loss": -43.204280853271484, "global_step": 289889, "epoch": 2395} {"train_loss": -43.64711380004883, "global_step": 289890, "epoch": 2395} {"train_loss": -42.909393310546875, "global_step": 289891, "epoch": 2395} {"train_loss": -43.009944915771484, "global_step": 289892, "epoch": 2395} {"train_loss": -42.79130172729492, "global_step": 289893, "epoch": 2395} {"train_loss": -43.17367172241211, "global_step": 289894, "epoch": 2395} {"train_loss": -43.0278434753418, "global_step": 289895, "epoch": 2395} {"train_loss": -43.05231857299805, "global_step": 289896, "epoch": 2395} {"train_loss": -43.72296905517578, "global_step": 289897, "epoch": 2395} {"train_loss": -42.86750411987305, "global_step": 289898, "epoch": 2395} {"train_loss": -42.897926330566406, "global_step": 289899, "epoch": 2395} {"train_loss": -42.33319854736328, "global_step": 289900, "epoch": 2395} {"train_loss": -44.095882415771484, "global_step": 289901, "epoch": 2395} {"train_loss": -41.976436614990234, "global_step": 289902, "epoch": 2395} {"train_loss": -43.74045181274414, "global_step": 289903, "epoch": 2395} {"train_loss": -42.10022735595703, "global_step": 289904, "epoch": 2395} {"train_loss": -42.273616790771484, "global_step": 289905, "epoch": 2395} {"train_loss": -42.718990325927734, "global_step": 289906, "epoch": 2395} {"train_loss": -42.41259765625, "global_step": 289907, "epoch": 2395} {"train_loss": -42.99309158325195, "global_step": 289908, "epoch": 2395} {"train_loss": -42.84040451049805, "global_step": 289909, "epoch": 2395} {"train_loss": -42.0976676940918, "global_step": 289910, "epoch": 2395} {"train_loss": -42.28840255737305, "global_step": 289911, "epoch": 2395} {"train_loss": -42.3286018371582, "global_step": 289912, "epoch": 2395} {"train_loss": -42.296226501464844, "global_step": 289913, "epoch": 2395} {"train_loss": -43.113685607910156, "global_step": 289914, "epoch": 2395} {"train_loss": -42.52818301492486, "global_step": 289915, "epoch": 2395, "val_loss": 2509352.25} {"train_loss": -42.55587387084961, "global_step": 289916, "epoch": 2396} {"train_loss": -43.06869125366211, "global_step": 289917, "epoch": 2396} {"train_loss": -42.64389419555664, "global_step": 289918, "epoch": 2396} {"train_loss": -41.708770751953125, "global_step": 289919, "epoch": 2396} {"train_loss": -43.1627311706543, "global_step": 289920, "epoch": 2396} {"train_loss": -42.310821533203125, "global_step": 289921, "epoch": 2396} {"train_loss": -42.94677734375, "global_step": 289922, "epoch": 2396} {"train_loss": -42.951473236083984, "global_step": 289923, "epoch": 2396} {"train_loss": -42.42497634887695, "global_step": 289924, "epoch": 2396} {"train_loss": -42.49893569946289, "global_step": 289925, "epoch": 2396} {"train_loss": -42.79397964477539, "global_step": 289926, "epoch": 2396} {"train_loss": -43.03811264038086, "global_step": 289927, "epoch": 2396} {"train_loss": -43.000274658203125, "global_step": 289928, "epoch": 2396} {"train_loss": -42.26435470581055, "global_step": 289929, "epoch": 2396} {"train_loss": -42.06924057006836, "global_step": 289930, "epoch": 2396} {"train_loss": -43.31269454956055, "global_step": 289931, "epoch": 2396} {"train_loss": -42.076324462890625, "global_step": 289932, "epoch": 2396} {"train_loss": -42.39531326293945, "global_step": 289933, "epoch": 2396} {"train_loss": -42.49905014038086, "global_step": 289934, "epoch": 2396} {"train_loss": -42.43891525268555, "global_step": 289935, "epoch": 2396} {"train_loss": -41.436431884765625, "global_step": 289936, "epoch": 2396} {"train_loss": -40.76725387573242, "global_step": 289937, "epoch": 2396} {"train_loss": -42.38856887817383, "global_step": 289938, "epoch": 2396} {"train_loss": -40.85091018676758, "global_step": 289939, "epoch": 2396} {"train_loss": -42.42045974731445, "global_step": 289940, "epoch": 2396} {"train_loss": -41.475101470947266, "global_step": 289941, "epoch": 2396} {"train_loss": -40.56175231933594, "global_step": 289942, "epoch": 2396} {"train_loss": -43.080265045166016, "global_step": 289943, "epoch": 2396} {"train_loss": -39.82340621948242, "global_step": 289944, "epoch": 2396} {"train_loss": -41.24289321899414, "global_step": 289945, "epoch": 2396} {"train_loss": -43.189754486083984, "global_step": 289946, "epoch": 2396} {"train_loss": -41.69416427612305, "global_step": 289947, "epoch": 2396} {"train_loss": -42.56382751464844, "global_step": 289948, "epoch": 2396} {"train_loss": -43.1139030456543, "global_step": 289949, "epoch": 2396} {"train_loss": -40.477603912353516, "global_step": 289950, "epoch": 2396} {"train_loss": -41.731327056884766, "global_step": 289951, "epoch": 2396} {"train_loss": -41.935054779052734, "global_step": 289952, "epoch": 2396} {"train_loss": -42.00710678100586, "global_step": 289953, "epoch": 2396} {"train_loss": -43.23429489135742, "global_step": 289954, "epoch": 2396} {"train_loss": -42.54103469848633, "global_step": 289955, "epoch": 2396} {"train_loss": -42.57405471801758, "global_step": 289956, "epoch": 2396} {"train_loss": -42.8347053527832, "global_step": 289957, "epoch": 2396} {"train_loss": -42.98673629760742, "global_step": 289958, "epoch": 2396} {"train_loss": -42.47938919067383, "global_step": 289959, "epoch": 2396} {"train_loss": -40.87807846069336, "global_step": 289960, "epoch": 2396} {"train_loss": -42.55168533325195, "global_step": 289961, "epoch": 2396} {"train_loss": -42.758914947509766, "global_step": 289962, "epoch": 2396} {"train_loss": -41.034698486328125, "global_step": 289963, "epoch": 2396} {"train_loss": -42.26551055908203, "global_step": 289964, "epoch": 2396} {"train_loss": -42.15386962890625, "global_step": 289965, "epoch": 2396} {"train_loss": -40.68525314331055, "global_step": 289966, "epoch": 2396} {"train_loss": -41.95509338378906, "global_step": 289967, "epoch": 2396} {"train_loss": -43.12055206298828, "global_step": 289968, "epoch": 2396} {"train_loss": -42.36782455444336, "global_step": 289969, "epoch": 2396} {"train_loss": -42.780784606933594, "global_step": 289970, "epoch": 2396} {"train_loss": -41.97530746459961, "global_step": 289971, "epoch": 2396} {"train_loss": -41.27560043334961, "global_step": 289972, "epoch": 2396} {"train_loss": -43.380367279052734, "global_step": 289973, "epoch": 2396} {"train_loss": -41.84130096435547, "global_step": 289974, "epoch": 2396} {"train_loss": -40.18101119995117, "global_step": 289975, "epoch": 2396} {"train_loss": -42.245975494384766, "global_step": 289976, "epoch": 2396} {"train_loss": -42.70951461791992, "global_step": 289977, "epoch": 2396} {"train_loss": -42.58344268798828, "global_step": 289978, "epoch": 2396} {"train_loss": -42.470123291015625, "global_step": 289979, "epoch": 2396} {"train_loss": -42.76552963256836, "global_step": 289980, "epoch": 2396} {"train_loss": -43.633056640625, "global_step": 289981, "epoch": 2396} {"train_loss": -42.485626220703125, "global_step": 289982, "epoch": 2396} {"train_loss": -43.07814025878906, "global_step": 289983, "epoch": 2396} {"train_loss": -43.095516204833984, "global_step": 289984, "epoch": 2396} {"train_loss": -43.03837585449219, "global_step": 289985, "epoch": 2396} {"train_loss": -43.3284797668457, "global_step": 289986, "epoch": 2396} {"train_loss": -43.27848434448242, "global_step": 289987, "epoch": 2396} {"train_loss": -43.78205108642578, "global_step": 289988, "epoch": 2396} {"train_loss": -43.470237731933594, "global_step": 289989, "epoch": 2396} {"train_loss": -43.22829818725586, "global_step": 289990, "epoch": 2396} {"train_loss": -43.85041809082031, "global_step": 289991, "epoch": 2396} {"train_loss": -43.098384857177734, "global_step": 289992, "epoch": 2396} {"train_loss": -43.77070236206055, "global_step": 289993, "epoch": 2396} {"train_loss": -43.0271110534668, "global_step": 289994, "epoch": 2396} {"train_loss": -43.602386474609375, "global_step": 289995, "epoch": 2396} {"train_loss": -42.68292999267578, "global_step": 289996, "epoch": 2396} {"train_loss": -43.4472770690918, "global_step": 289997, "epoch": 2396} {"train_loss": -43.49130630493164, "global_step": 289998, "epoch": 2396} {"train_loss": -42.37302780151367, "global_step": 289999, "epoch": 2396} {"train_loss": -43.90253448486328, "global_step": 290000, "epoch": 2396} {"train_loss": -43.10634994506836, "global_step": 290001, "epoch": 2396} {"train_loss": -43.093994140625, "global_step": 290002, "epoch": 2396} {"train_loss": -42.7372932434082, "global_step": 290003, "epoch": 2396} {"train_loss": -43.54423141479492, "global_step": 290004, "epoch": 2396} {"train_loss": -43.06522750854492, "global_step": 290005, "epoch": 2396} {"train_loss": -42.940181732177734, "global_step": 290006, "epoch": 2396} {"train_loss": -43.37896728515625, "global_step": 290007, "epoch": 2396} {"train_loss": -42.41242599487305, "global_step": 290008, "epoch": 2396} {"train_loss": -43.120826721191406, "global_step": 290009, "epoch": 2396} {"train_loss": -43.67424392700195, "global_step": 290010, "epoch": 2396} {"train_loss": -42.954139709472656, "global_step": 290011, "epoch": 2396} {"train_loss": -42.462615966796875, "global_step": 290012, "epoch": 2396} {"train_loss": -43.96640396118164, "global_step": 290013, "epoch": 2396} {"train_loss": -42.9369010925293, "global_step": 290014, "epoch": 2396} {"train_loss": -43.33121871948242, "global_step": 290015, "epoch": 2396} {"train_loss": -43.96025848388672, "global_step": 290016, "epoch": 2396} {"train_loss": -43.41217041015625, "global_step": 290017, "epoch": 2396} {"train_loss": -43.698394775390625, "global_step": 290018, "epoch": 2396} {"train_loss": -43.793800354003906, "global_step": 290019, "epoch": 2396} {"train_loss": -43.23258590698242, "global_step": 290020, "epoch": 2396} {"train_loss": -43.83048629760742, "global_step": 290021, "epoch": 2396} {"train_loss": -43.45891189575195, "global_step": 290022, "epoch": 2396} {"train_loss": -43.56330490112305, "global_step": 290023, "epoch": 2396} {"train_loss": -43.35945129394531, "global_step": 290024, "epoch": 2396} {"train_loss": -43.642120361328125, "global_step": 290025, "epoch": 2396} {"train_loss": -42.84659957885742, "global_step": 290026, "epoch": 2396} {"train_loss": -43.330081939697266, "global_step": 290027, "epoch": 2396} {"train_loss": -44.04401397705078, "global_step": 290028, "epoch": 2396} {"train_loss": -42.92910385131836, "global_step": 290029, "epoch": 2396} {"train_loss": -39.42954635620117, "global_step": 290030, "epoch": 2396} {"train_loss": -42.9804801940918, "global_step": 290031, "epoch": 2396} {"train_loss": -42.98634338378906, "global_step": 290032, "epoch": 2396} {"train_loss": -42.46026611328125, "global_step": 290033, "epoch": 2396} {"train_loss": -41.83125686645508, "global_step": 290034, "epoch": 2396} {"train_loss": -41.812652587890625, "global_step": 290035, "epoch": 2396} {"train_loss": -42.631599174058145, "global_step": 290036, "epoch": 2396, "val_loss": 2505835.0} {"train_loss": -42.17506408691406, "global_step": 290037, "epoch": 2397} {"train_loss": -41.40641403198242, "global_step": 290038, "epoch": 2397} {"train_loss": -42.71889877319336, "global_step": 290039, "epoch": 2397} {"train_loss": -41.394798278808594, "global_step": 290040, "epoch": 2397} {"train_loss": -41.93953323364258, "global_step": 290041, "epoch": 2397} {"train_loss": -42.35210037231445, "global_step": 290042, "epoch": 2397} {"train_loss": -42.096412658691406, "global_step": 290043, "epoch": 2397} {"train_loss": -32.77024459838867, "global_step": 290044, "epoch": 2397} {"train_loss": -39.68855667114258, "global_step": 290045, "epoch": 2397} {"train_loss": -42.56000900268555, "global_step": 290046, "epoch": 2397} {"train_loss": -42.00748825073242, "global_step": 290047, "epoch": 2397} {"train_loss": -40.621795654296875, "global_step": 290048, "epoch": 2397} {"train_loss": -42.954036712646484, "global_step": 290049, "epoch": 2397} {"train_loss": -41.25727081298828, "global_step": 290050, "epoch": 2397} {"train_loss": -41.11988067626953, "global_step": 290051, "epoch": 2397} {"train_loss": -41.752197265625, "global_step": 290052, "epoch": 2397} {"train_loss": -40.90904998779297, "global_step": 290053, "epoch": 2397} {"train_loss": -41.43037796020508, "global_step": 290054, "epoch": 2397} {"train_loss": -41.7685546875, "global_step": 290055, "epoch": 2397} {"train_loss": -41.62519073486328, "global_step": 290056, "epoch": 2397} {"train_loss": -42.20317459106445, "global_step": 290057, "epoch": 2397} {"train_loss": -42.11391830444336, "global_step": 290058, "epoch": 2397} {"train_loss": -41.77669143676758, "global_step": 290059, "epoch": 2397} {"train_loss": -32.97034454345703, "global_step": 290060, "epoch": 2397} {"train_loss": -41.787776947021484, "global_step": 290061, "epoch": 2397} {"train_loss": -41.00077438354492, "global_step": 290062, "epoch": 2397} {"train_loss": -39.059906005859375, "global_step": 290063, "epoch": 2397} {"train_loss": -41.77717208862305, "global_step": 290064, "epoch": 2397} {"train_loss": -41.40107727050781, "global_step": 290065, "epoch": 2397} {"train_loss": -42.409400939941406, "global_step": 290066, "epoch": 2397} {"train_loss": -42.44190979003906, "global_step": 290067, "epoch": 2397} {"train_loss": -42.24492645263672, "global_step": 290068, "epoch": 2397} {"train_loss": -41.92851257324219, "global_step": 290069, "epoch": 2397} {"train_loss": -41.21961975097656, "global_step": 290070, "epoch": 2397} {"train_loss": -42.06815719604492, "global_step": 290071, "epoch": 2397} {"train_loss": -41.927833557128906, "global_step": 290072, "epoch": 2397} {"train_loss": -41.784461975097656, "global_step": 290073, "epoch": 2397} {"train_loss": -42.06972122192383, "global_step": 290074, "epoch": 2397} {"train_loss": -41.1182975769043, "global_step": 290075, "epoch": 2397} {"train_loss": -41.968849182128906, "global_step": 290076, "epoch": 2397} {"train_loss": -42.636661529541016, "global_step": 290077, "epoch": 2397} {"train_loss": -41.94828414916992, "global_step": 290078, "epoch": 2397} {"train_loss": -42.18878936767578, "global_step": 290079, "epoch": 2397} {"train_loss": -41.835243225097656, "global_step": 290080, "epoch": 2397} {"train_loss": -42.02354049682617, "global_step": 290081, "epoch": 2397} {"train_loss": -42.65591049194336, "global_step": 290082, "epoch": 2397} {"train_loss": -42.465003967285156, "global_step": 290083, "epoch": 2397} {"train_loss": -43.39182662963867, "global_step": 290084, "epoch": 2397} {"train_loss": -41.90794372558594, "global_step": 290085, "epoch": 2397} {"train_loss": -40.1544075012207, "global_step": 290086, "epoch": 2397} {"train_loss": -43.032222747802734, "global_step": 290087, "epoch": 2397} {"train_loss": -42.198116302490234, "global_step": 290088, "epoch": 2397} {"train_loss": -41.66972732543945, "global_step": 290089, "epoch": 2397} {"train_loss": -43.51515579223633, "global_step": 290090, "epoch": 2397} {"train_loss": -42.654415130615234, "global_step": 290091, "epoch": 2397} {"train_loss": -43.37458038330078, "global_step": 290092, "epoch": 2397} {"train_loss": -43.34366989135742, "global_step": 290093, "epoch": 2397} {"train_loss": -43.17290115356445, "global_step": 290094, "epoch": 2397} {"train_loss": -42.68574142456055, "global_step": 290095, "epoch": 2397} {"train_loss": -42.16297149658203, "global_step": 290096, "epoch": 2397} {"train_loss": -43.091243743896484, "global_step": 290097, "epoch": 2397} {"train_loss": -42.50262451171875, "global_step": 290098, "epoch": 2397} {"train_loss": -43.475894927978516, "global_step": 290099, "epoch": 2397} {"train_loss": -43.436885833740234, "global_step": 290100, "epoch": 2397} {"train_loss": -42.80120849609375, "global_step": 290101, "epoch": 2397} {"train_loss": -41.85097885131836, "global_step": 290102, "epoch": 2397} {"train_loss": -43.421260833740234, "global_step": 290103, "epoch": 2397} {"train_loss": -43.391273498535156, "global_step": 290104, "epoch": 2397} {"train_loss": -43.14752960205078, "global_step": 290105, "epoch": 2397} {"train_loss": -43.77679443359375, "global_step": 290106, "epoch": 2397} {"train_loss": -43.27928924560547, "global_step": 290107, "epoch": 2397} {"train_loss": -43.70309066772461, "global_step": 290108, "epoch": 2397} {"train_loss": -43.61673355102539, "global_step": 290109, "epoch": 2397} {"train_loss": -42.85708999633789, "global_step": 290110, "epoch": 2397} {"train_loss": -44.15847396850586, "global_step": 290111, "epoch": 2397} {"train_loss": -43.56932830810547, "global_step": 290112, "epoch": 2397} {"train_loss": -43.7156867980957, "global_step": 290113, "epoch": 2397} {"train_loss": -43.8116569519043, "global_step": 290114, "epoch": 2397} {"train_loss": -43.880043029785156, "global_step": 290115, "epoch": 2397} {"train_loss": -43.60938262939453, "global_step": 290116, "epoch": 2397} {"train_loss": -43.88371658325195, "global_step": 290117, "epoch": 2397} {"train_loss": -42.50011444091797, "global_step": 290118, "epoch": 2397} {"train_loss": -43.77193069458008, "global_step": 290119, "epoch": 2397} {"train_loss": -43.84406280517578, "global_step": 290120, "epoch": 2397} {"train_loss": -44.27740478515625, "global_step": 290121, "epoch": 2397} {"train_loss": -43.5614013671875, "global_step": 290122, "epoch": 2397} {"train_loss": -43.22520065307617, "global_step": 290123, "epoch": 2397} {"train_loss": -43.98727035522461, "global_step": 290124, "epoch": 2397} {"train_loss": -43.58435821533203, "global_step": 290125, "epoch": 2397} {"train_loss": -43.68143844604492, "global_step": 290126, "epoch": 2397} {"train_loss": -42.8812141418457, "global_step": 290127, "epoch": 2397} {"train_loss": -41.71458053588867, "global_step": 290128, "epoch": 2397} {"train_loss": -41.81099319458008, "global_step": 290129, "epoch": 2397} {"train_loss": -42.45380783081055, "global_step": 290130, "epoch": 2397} {"train_loss": -42.9370002746582, "global_step": 290131, "epoch": 2397} {"train_loss": -43.989601135253906, "global_step": 290132, "epoch": 2397} {"train_loss": -43.2610969543457, "global_step": 290133, "epoch": 2397} {"train_loss": -43.822628021240234, "global_step": 290134, "epoch": 2397} {"train_loss": -42.66535949707031, "global_step": 290135, "epoch": 2397} {"train_loss": -43.257110595703125, "global_step": 290136, "epoch": 2397} {"train_loss": -42.677730560302734, "global_step": 290137, "epoch": 2397} {"train_loss": -43.466041564941406, "global_step": 290138, "epoch": 2397} {"train_loss": -42.7147331237793, "global_step": 290139, "epoch": 2397} {"train_loss": -42.79024887084961, "global_step": 290140, "epoch": 2397} {"train_loss": -43.442508697509766, "global_step": 290141, "epoch": 2397} {"train_loss": -42.426673889160156, "global_step": 290142, "epoch": 2397} {"train_loss": -43.58123779296875, "global_step": 290143, "epoch": 2397} {"train_loss": -43.21565628051758, "global_step": 290144, "epoch": 2397} {"train_loss": -43.34157943725586, "global_step": 290145, "epoch": 2397} {"train_loss": -43.827980041503906, "global_step": 290146, "epoch": 2397} {"train_loss": -43.0971565246582, "global_step": 290147, "epoch": 2397} {"train_loss": -42.972591400146484, "global_step": 290148, "epoch": 2397} {"train_loss": -43.70389938354492, "global_step": 290149, "epoch": 2397} {"train_loss": -43.24142074584961, "global_step": 290150, "epoch": 2397} {"train_loss": -42.87443161010742, "global_step": 290151, "epoch": 2397} {"train_loss": -44.08465576171875, "global_step": 290152, "epoch": 2397} {"train_loss": -43.76569366455078, "global_step": 290153, "epoch": 2397} {"train_loss": -43.20573806762695, "global_step": 290154, "epoch": 2397} {"train_loss": -43.91410446166992, "global_step": 290155, "epoch": 2397} {"train_loss": -43.789546966552734, "global_step": 290156, "epoch": 2397} {"train_loss": -42.482155855036964, "global_step": 290157, "epoch": 2397, "val_loss": 2511445.25} {"train_loss": -43.33425521850586, "global_step": 290158, "epoch": 2398} {"train_loss": -43.712547302246094, "global_step": 290159, "epoch": 2398} {"train_loss": -42.81573486328125, "global_step": 290160, "epoch": 2398} {"train_loss": -43.96170425415039, "global_step": 290161, "epoch": 2398} {"train_loss": -42.21255111694336, "global_step": 290162, "epoch": 2398} {"train_loss": -42.8889274597168, "global_step": 290163, "epoch": 2398} {"train_loss": -43.9455680847168, "global_step": 290164, "epoch": 2398} {"train_loss": -42.2712516784668, "global_step": 290165, "epoch": 2398} {"train_loss": -42.20009994506836, "global_step": 290166, "epoch": 2398} {"train_loss": -43.74203109741211, "global_step": 290167, "epoch": 2398} {"train_loss": -42.66145706176758, "global_step": 290168, "epoch": 2398} {"train_loss": -42.1173095703125, "global_step": 290169, "epoch": 2398} {"train_loss": -42.87153244018555, "global_step": 290170, "epoch": 2398} {"train_loss": -43.007564544677734, "global_step": 290171, "epoch": 2398} {"train_loss": -43.55769729614258, "global_step": 290172, "epoch": 2398} {"train_loss": -43.816280364990234, "global_step": 290173, "epoch": 2398} {"train_loss": -42.87592697143555, "global_step": 290174, "epoch": 2398} {"train_loss": -44.08934783935547, "global_step": 290175, "epoch": 2398} {"train_loss": -43.759307861328125, "global_step": 290176, "epoch": 2398} {"train_loss": -43.8242073059082, "global_step": 290177, "epoch": 2398} {"train_loss": -43.556758880615234, "global_step": 290178, "epoch": 2398} {"train_loss": -44.456905364990234, "global_step": 290179, "epoch": 2398} {"train_loss": -43.10505294799805, "global_step": 290180, "epoch": 2398} {"train_loss": -43.41825485229492, "global_step": 290181, "epoch": 2398} {"train_loss": -43.43864059448242, "global_step": 290182, "epoch": 2398} {"train_loss": -43.03717041015625, "global_step": 290183, "epoch": 2398} {"train_loss": -42.19007873535156, "global_step": 290184, "epoch": 2398} {"train_loss": -41.92648696899414, "global_step": 290185, "epoch": 2398} {"train_loss": -43.39805221557617, "global_step": 290186, "epoch": 2398} {"train_loss": -42.74009323120117, "global_step": 290187, "epoch": 2398} {"train_loss": -41.16189193725586, "global_step": 290188, "epoch": 2398} {"train_loss": -42.63296127319336, "global_step": 290189, "epoch": 2398} {"train_loss": -43.15509796142578, "global_step": 290190, "epoch": 2398} {"train_loss": -42.44790267944336, "global_step": 290191, "epoch": 2398} {"train_loss": -41.347625732421875, "global_step": 290192, "epoch": 2398} {"train_loss": -42.830162048339844, "global_step": 290193, "epoch": 2398} {"train_loss": -43.047245025634766, "global_step": 290194, "epoch": 2398} {"train_loss": -41.569305419921875, "global_step": 290195, "epoch": 2398} {"train_loss": -43.257728576660156, "global_step": 290196, "epoch": 2398} {"train_loss": -43.02116775512695, "global_step": 290197, "epoch": 2398} {"train_loss": -42.3160514831543, "global_step": 290198, "epoch": 2398} {"train_loss": -42.59040069580078, "global_step": 290199, "epoch": 2398} {"train_loss": -42.53586959838867, "global_step": 290200, "epoch": 2398} {"train_loss": -43.392066955566406, "global_step": 290201, "epoch": 2398} {"train_loss": -43.14838790893555, "global_step": 290202, "epoch": 2398} {"train_loss": -42.11714553833008, "global_step": 290203, "epoch": 2398} {"train_loss": -43.24582290649414, "global_step": 290204, "epoch": 2398} {"train_loss": -43.64296340942383, "global_step": 290205, "epoch": 2398} {"train_loss": -43.363521575927734, "global_step": 290206, "epoch": 2398} {"train_loss": -42.395599365234375, "global_step": 290207, "epoch": 2398} {"train_loss": -43.66933822631836, "global_step": 290208, "epoch": 2398} {"train_loss": -43.85438919067383, "global_step": 290209, "epoch": 2398} {"train_loss": -43.640010833740234, "global_step": 290210, "epoch": 2398} {"train_loss": -43.31380844116211, "global_step": 290211, "epoch": 2398} {"train_loss": -41.244380950927734, "global_step": 290212, "epoch": 2398} {"train_loss": -42.31413650512695, "global_step": 290213, "epoch": 2398} {"train_loss": -43.03166580200195, "global_step": 290214, "epoch": 2398} {"train_loss": -43.2412223815918, "global_step": 290215, "epoch": 2398} {"train_loss": -43.40729904174805, "global_step": 290216, "epoch": 2398} {"train_loss": -42.6226692199707, "global_step": 290217, "epoch": 2398} {"train_loss": -43.460723876953125, "global_step": 290218, "epoch": 2398} {"train_loss": -43.617591857910156, "global_step": 290219, "epoch": 2398} {"train_loss": -42.797298431396484, "global_step": 290220, "epoch": 2398} {"train_loss": -42.27753448486328, "global_step": 290221, "epoch": 2398} {"train_loss": -42.401363372802734, "global_step": 290222, "epoch": 2398} {"train_loss": -41.951663970947266, "global_step": 290223, "epoch": 2398} {"train_loss": -41.38178253173828, "global_step": 290224, "epoch": 2398} {"train_loss": -43.655155181884766, "global_step": 290225, "epoch": 2398} {"train_loss": -42.93141555786133, "global_step": 290226, "epoch": 2398} {"train_loss": -41.9309196472168, "global_step": 290227, "epoch": 2398} {"train_loss": -41.843658447265625, "global_step": 290228, "epoch": 2398} {"train_loss": -43.364784240722656, "global_step": 290229, "epoch": 2398} {"train_loss": -42.35990524291992, "global_step": 290230, "epoch": 2398} {"train_loss": -42.15560531616211, "global_step": 290231, "epoch": 2398} {"train_loss": -43.91062545776367, "global_step": 290232, "epoch": 2398} {"train_loss": -41.44976806640625, "global_step": 290233, "epoch": 2398} {"train_loss": -42.22822189331055, "global_step": 290234, "epoch": 2398} {"train_loss": -43.337989807128906, "global_step": 290235, "epoch": 2398} {"train_loss": -39.95518112182617, "global_step": 290236, "epoch": 2398} {"train_loss": -43.59074783325195, "global_step": 290237, "epoch": 2398} {"train_loss": -40.942176818847656, "global_step": 290238, "epoch": 2398} {"train_loss": -41.259735107421875, "global_step": 290239, "epoch": 2398} {"train_loss": -42.22773742675781, "global_step": 290240, "epoch": 2398} {"train_loss": -40.52783203125, "global_step": 290241, "epoch": 2398} {"train_loss": -43.370643615722656, "global_step": 290242, "epoch": 2398} {"train_loss": -40.69462203979492, "global_step": 290243, "epoch": 2398} {"train_loss": -41.662410736083984, "global_step": 290244, "epoch": 2398} {"train_loss": -41.988582611083984, "global_step": 290245, "epoch": 2398} {"train_loss": -41.768714904785156, "global_step": 290246, "epoch": 2398} {"train_loss": -42.290679931640625, "global_step": 290247, "epoch": 2398} {"train_loss": -42.6397590637207, "global_step": 290248, "epoch": 2398} {"train_loss": -42.138092041015625, "global_step": 290249, "epoch": 2398} {"train_loss": -43.19242477416992, "global_step": 290250, "epoch": 2398} {"train_loss": -42.980743408203125, "global_step": 290251, "epoch": 2398} {"train_loss": -42.65235137939453, "global_step": 290252, "epoch": 2398} {"train_loss": -43.364784240722656, "global_step": 290253, "epoch": 2398} {"train_loss": -42.6248664855957, "global_step": 290254, "epoch": 2398} {"train_loss": -43.35334396362305, "global_step": 290255, "epoch": 2398} {"train_loss": -43.37242126464844, "global_step": 290256, "epoch": 2398} {"train_loss": -43.28131103515625, "global_step": 290257, "epoch": 2398} {"train_loss": -43.322235107421875, "global_step": 290258, "epoch": 2398} {"train_loss": -43.39377975463867, "global_step": 290259, "epoch": 2398} {"train_loss": -43.77708053588867, "global_step": 290260, "epoch": 2398} {"train_loss": -43.43976974487305, "global_step": 290261, "epoch": 2398} {"train_loss": -43.461631774902344, "global_step": 290262, "epoch": 2398} {"train_loss": -42.740478515625, "global_step": 290263, "epoch": 2398} {"train_loss": -43.443050384521484, "global_step": 290264, "epoch": 2398} {"train_loss": -43.93998336791992, "global_step": 290265, "epoch": 2398} {"train_loss": -43.114200592041016, "global_step": 290266, "epoch": 2398} {"train_loss": -43.94528579711914, "global_step": 290267, "epoch": 2398} {"train_loss": -43.68201446533203, "global_step": 290268, "epoch": 2398} {"train_loss": -43.17578887939453, "global_step": 290269, "epoch": 2398} {"train_loss": -42.961544036865234, "global_step": 290270, "epoch": 2398} {"train_loss": -43.16317367553711, "global_step": 290271, "epoch": 2398} {"train_loss": -43.38934326171875, "global_step": 290272, "epoch": 2398} {"train_loss": -42.5916862487793, "global_step": 290273, "epoch": 2398} {"train_loss": -43.183780670166016, "global_step": 290274, "epoch": 2398} {"train_loss": -43.62786865234375, "global_step": 290275, "epoch": 2398} {"train_loss": -43.66474151611328, "global_step": 290276, "epoch": 2398} {"train_loss": -43.282928466796875, "global_step": 290277, "epoch": 2398} {"train_loss": -42.85995013654725, "global_step": 290278, "epoch": 2398, "val_loss": 2456342.0} {"train_loss": -42.570465087890625, "global_step": 290279, "epoch": 2399} {"train_loss": -42.9471321105957, "global_step": 290280, "epoch": 2399} {"train_loss": -44.081172943115234, "global_step": 290281, "epoch": 2399} {"train_loss": -43.17258834838867, "global_step": 290282, "epoch": 2399} {"train_loss": -41.429771423339844, "global_step": 290283, "epoch": 2399} {"train_loss": -43.722564697265625, "global_step": 290284, "epoch": 2399} {"train_loss": -40.635013580322266, "global_step": 290285, "epoch": 2399} {"train_loss": -39.80820846557617, "global_step": 290286, "epoch": 2399} {"train_loss": -42.63150405883789, "global_step": 290287, "epoch": 2399} {"train_loss": -39.40424346923828, "global_step": 290288, "epoch": 2399} {"train_loss": -42.80548858642578, "global_step": 290289, "epoch": 2399} {"train_loss": -39.744895935058594, "global_step": 290290, "epoch": 2399} {"train_loss": -43.33988571166992, "global_step": 290291, "epoch": 2399} {"train_loss": -40.81196975708008, "global_step": 290292, "epoch": 2399} {"train_loss": -41.464271545410156, "global_step": 290293, "epoch": 2399} {"train_loss": -42.79062271118164, "global_step": 290294, "epoch": 2399} {"train_loss": -40.62189483642578, "global_step": 290295, "epoch": 2399} {"train_loss": -42.915382385253906, "global_step": 290296, "epoch": 2399} {"train_loss": -41.42159652709961, "global_step": 290297, "epoch": 2399} {"train_loss": -40.49127960205078, "global_step": 290298, "epoch": 2399} {"train_loss": -43.17439651489258, "global_step": 290299, "epoch": 2399} {"train_loss": -41.42325973510742, "global_step": 290300, "epoch": 2399} {"train_loss": -41.91529083251953, "global_step": 290301, "epoch": 2399} {"train_loss": -41.95764923095703, "global_step": 290302, "epoch": 2399} {"train_loss": -42.50429153442383, "global_step": 290303, "epoch": 2399} {"train_loss": -42.48417282104492, "global_step": 290304, "epoch": 2399} {"train_loss": -42.22688674926758, "global_step": 290305, "epoch": 2399} {"train_loss": -43.238094329833984, "global_step": 290306, "epoch": 2399} {"train_loss": -43.058536529541016, "global_step": 290307, "epoch": 2399} {"train_loss": -42.18464279174805, "global_step": 290308, "epoch": 2399} {"train_loss": -43.373695373535156, "global_step": 290309, "epoch": 2399} {"train_loss": -43.271480560302734, "global_step": 290310, "epoch": 2399} {"train_loss": -43.42568588256836, "global_step": 290311, "epoch": 2399} {"train_loss": -43.28004455566406, "global_step": 290312, "epoch": 2399} {"train_loss": -43.08460235595703, "global_step": 290313, "epoch": 2399} {"train_loss": -42.97854232788086, "global_step": 290314, "epoch": 2399} {"train_loss": -43.243038177490234, "global_step": 290315, "epoch": 2399} {"train_loss": -43.4580192565918, "global_step": 290316, "epoch": 2399} {"train_loss": -43.67818832397461, "global_step": 290317, "epoch": 2399} {"train_loss": -42.773189544677734, "global_step": 290318, "epoch": 2399} {"train_loss": -42.689674377441406, "global_step": 290319, "epoch": 2399} {"train_loss": -43.517513275146484, "global_step": 290320, "epoch": 2399} {"train_loss": -43.67830276489258, "global_step": 290321, "epoch": 2399} {"train_loss": -42.837799072265625, "global_step": 290322, "epoch": 2399} {"train_loss": -40.2713737487793, "global_step": 290323, "epoch": 2399} {"train_loss": -43.471736907958984, "global_step": 290324, "epoch": 2399} {"train_loss": -42.886714935302734, "global_step": 290325, "epoch": 2399} {"train_loss": -41.86021423339844, "global_step": 290326, "epoch": 2399} {"train_loss": -37.548179626464844, "global_step": 290327, "epoch": 2399} {"train_loss": -42.7113151550293, "global_step": 290328, "epoch": 2399} {"train_loss": -42.19091796875, "global_step": 290329, "epoch": 2399} {"train_loss": -42.86065673828125, "global_step": 290330, "epoch": 2399} {"train_loss": -40.82748794555664, "global_step": 290331, "epoch": 2399} {"train_loss": -42.48232650756836, "global_step": 290332, "epoch": 2399} {"train_loss": -43.14823532104492, "global_step": 290333, "epoch": 2399} {"train_loss": -32.89801788330078, "global_step": 290334, "epoch": 2399} {"train_loss": -41.51847457885742, "global_step": 290335, "epoch": 2399} {"train_loss": -42.3625602722168, "global_step": 290336, "epoch": 2399} {"train_loss": -42.8392448425293, "global_step": 290337, "epoch": 2399} {"train_loss": -43.222957611083984, "global_step": 290338, "epoch": 2399} {"train_loss": -41.0565071105957, "global_step": 290339, "epoch": 2399} {"train_loss": -42.499000549316406, "global_step": 290340, "epoch": 2399} {"train_loss": -38.16476058959961, "global_step": 290341, "epoch": 2399} {"train_loss": -42.090328216552734, "global_step": 290342, "epoch": 2399} {"train_loss": -41.9774055480957, "global_step": 290343, "epoch": 2399} {"train_loss": -42.811378479003906, "global_step": 290344, "epoch": 2399} {"train_loss": -42.39726638793945, "global_step": 290345, "epoch": 2399} {"train_loss": -43.14398956298828, "global_step": 290346, "epoch": 2399} {"train_loss": -42.20899963378906, "global_step": 290347, "epoch": 2399} {"train_loss": -40.986656188964844, "global_step": 290348, "epoch": 2399} {"train_loss": -42.90153121948242, "global_step": 290349, "epoch": 2399} {"train_loss": -42.63404083251953, "global_step": 290350, "epoch": 2399} {"train_loss": -42.11210250854492, "global_step": 290351, "epoch": 2399} {"train_loss": -42.87593460083008, "global_step": 290352, "epoch": 2399} {"train_loss": -42.9112434387207, "global_step": 290353, "epoch": 2399} {"train_loss": -42.66919708251953, "global_step": 290354, "epoch": 2399} {"train_loss": -42.93017578125, "global_step": 290355, "epoch": 2399} {"train_loss": -43.31877136230469, "global_step": 290356, "epoch": 2399} {"train_loss": -43.182796478271484, "global_step": 290357, "epoch": 2399} {"train_loss": -42.019466400146484, "global_step": 290358, "epoch": 2399} {"train_loss": -43.486427307128906, "global_step": 290359, "epoch": 2399} {"train_loss": -43.06719970703125, "global_step": 290360, "epoch": 2399} {"train_loss": -42.3095817565918, "global_step": 290361, "epoch": 2399} {"train_loss": -43.59687805175781, "global_step": 290362, "epoch": 2399} {"train_loss": -43.43294906616211, "global_step": 290363, "epoch": 2399} {"train_loss": -43.4500846862793, "global_step": 290364, "epoch": 2399} {"train_loss": -41.71216583251953, "global_step": 290365, "epoch": 2399} {"train_loss": -43.37456130981445, "global_step": 290366, "epoch": 2399} {"train_loss": -44.078224182128906, "global_step": 290367, "epoch": 2399} {"train_loss": -43.12115478515625, "global_step": 290368, "epoch": 2399} {"train_loss": -43.68387985229492, "global_step": 290369, "epoch": 2399} {"train_loss": -43.72774887084961, "global_step": 290370, "epoch": 2399} {"train_loss": -43.71819305419922, "global_step": 290371, "epoch": 2399} {"train_loss": -43.9243049621582, "global_step": 290372, "epoch": 2399} {"train_loss": -43.895790100097656, "global_step": 290373, "epoch": 2399} {"train_loss": -43.94301223754883, "global_step": 290374, "epoch": 2399} {"train_loss": -43.81890106201172, "global_step": 290375, "epoch": 2399} {"train_loss": -42.753700256347656, "global_step": 290376, "epoch": 2399} {"train_loss": -44.25392150878906, "global_step": 290377, "epoch": 2399} {"train_loss": -42.591552734375, "global_step": 290378, "epoch": 2399} {"train_loss": -43.79461669921875, "global_step": 290379, "epoch": 2399} {"train_loss": -42.55796813964844, "global_step": 290380, "epoch": 2399} {"train_loss": -43.836830139160156, "global_step": 290381, "epoch": 2399} {"train_loss": -43.676116943359375, "global_step": 290382, "epoch": 2399} {"train_loss": -43.91824722290039, "global_step": 290383, "epoch": 2399} {"train_loss": -44.14531707763672, "global_step": 290384, "epoch": 2399} {"train_loss": -43.743099212646484, "global_step": 290385, "epoch": 2399} {"train_loss": -44.30348587036133, "global_step": 290386, "epoch": 2399} {"train_loss": -43.78916931152344, "global_step": 290387, "epoch": 2399} {"train_loss": -44.0789680480957, "global_step": 290388, "epoch": 2399} {"train_loss": -43.99253463745117, "global_step": 290389, "epoch": 2399} {"train_loss": -43.729549407958984, "global_step": 290390, "epoch": 2399} {"train_loss": -44.28361129760742, "global_step": 290391, "epoch": 2399} {"train_loss": -44.00606918334961, "global_step": 290392, "epoch": 2399} {"train_loss": -43.94971466064453, "global_step": 290393, "epoch": 2399} {"train_loss": -43.66901779174805, "global_step": 290394, "epoch": 2399} {"train_loss": -43.817054748535156, "global_step": 290395, "epoch": 2399} {"train_loss": -42.451812744140625, "global_step": 290396, "epoch": 2399} {"train_loss": -42.788055419921875, "global_step": 290397, "epoch": 2399} {"train_loss": -43.58588409423828, "global_step": 290398, "epoch": 2399} {"train_loss": -42.63501594480404, "global_step": 290399, "epoch": 2399, "val_loss": 2461121.75} {"train_loss": -41.76412582397461, "global_step": 290400, "epoch": 2400} {"train_loss": -41.77567672729492, "global_step": 290401, "epoch": 2400} {"train_loss": -42.097408294677734, "global_step": 290402, "epoch": 2400} {"train_loss": -43.13458251953125, "global_step": 290403, "epoch": 2400} {"train_loss": -43.321563720703125, "global_step": 290404, "epoch": 2400} {"train_loss": -41.96828842163086, "global_step": 290405, "epoch": 2400} {"train_loss": -41.28989791870117, "global_step": 290406, "epoch": 2400} {"train_loss": -40.246334075927734, "global_step": 290407, "epoch": 2400} {"train_loss": -41.8903923034668, "global_step": 290408, "epoch": 2400} {"train_loss": -43.86330032348633, "global_step": 290409, "epoch": 2400} {"train_loss": -43.57251739501953, "global_step": 290410, "epoch": 2400} {"train_loss": -42.47119903564453, "global_step": 290411, "epoch": 2400} {"train_loss": -43.54512405395508, "global_step": 290412, "epoch": 2400} {"train_loss": -43.896644592285156, "global_step": 290413, "epoch": 2400} {"train_loss": -43.66971969604492, "global_step": 290414, "epoch": 2400} {"train_loss": -43.5614013671875, "global_step": 290415, "epoch": 2400} {"train_loss": -43.4393424987793, "global_step": 290416, "epoch": 2400} {"train_loss": -43.74443435668945, "global_step": 290417, "epoch": 2400} {"train_loss": -44.097530364990234, "global_step": 290418, "epoch": 2400} {"train_loss": -43.60590362548828, "global_step": 290419, "epoch": 2400} {"train_loss": -43.624576568603516, "global_step": 290420, "epoch": 2400} {"train_loss": -43.433929443359375, "global_step": 290421, "epoch": 2400} {"train_loss": -42.962249755859375, "global_step": 290422, "epoch": 2400} {"train_loss": -43.072052001953125, "global_step": 290423, "epoch": 2400} {"train_loss": -43.0359001159668, "global_step": 290424, "epoch": 2400} {"train_loss": -41.90940475463867, "global_step": 290425, "epoch": 2400} {"train_loss": -43.31005859375, "global_step": 290426, "epoch": 2400} {"train_loss": -42.36599349975586, "global_step": 290427, "epoch": 2400} {"train_loss": -42.14516830444336, "global_step": 290428, "epoch": 2400} {"train_loss": -40.849220275878906, "global_step": 290429, "epoch": 2400} {"train_loss": -41.97723388671875, "global_step": 290430, "epoch": 2400} {"train_loss": -42.17140579223633, "global_step": 290431, "epoch": 2400} {"train_loss": -40.4099006652832, "global_step": 290432, "epoch": 2400} {"train_loss": -40.61267852783203, "global_step": 290433, "epoch": 2400} {"train_loss": -43.076080322265625, "global_step": 290434, "epoch": 2400} {"train_loss": -39.13150405883789, "global_step": 290435, "epoch": 2400} {"train_loss": -42.979583740234375, "global_step": 290436, "epoch": 2400} {"train_loss": -40.55242156982422, "global_step": 290437, "epoch": 2400} {"train_loss": -37.31208801269531, "global_step": 290438, "epoch": 2400} {"train_loss": -42.83427429199219, "global_step": 290439, "epoch": 2400} {"train_loss": -38.88346481323242, "global_step": 290440, "epoch": 2400} {"train_loss": -39.245174407958984, "global_step": 290441, "epoch": 2400} {"train_loss": -39.06229019165039, "global_step": 290442, "epoch": 2400} {"train_loss": -39.82582473754883, "global_step": 290443, "epoch": 2400} {"train_loss": -42.35465621948242, "global_step": 290444, "epoch": 2400} {"train_loss": -42.123512268066406, "global_step": 290445, "epoch": 2400} {"train_loss": -40.48087692260742, "global_step": 290446, "epoch": 2400} {"train_loss": -43.07173538208008, "global_step": 290447, "epoch": 2400} {"train_loss": -39.53005599975586, "global_step": 290448, "epoch": 2400} {"train_loss": -40.76560592651367, "global_step": 290449, "epoch": 2400} {"train_loss": -42.10509490966797, "global_step": 290450, "epoch": 2400} {"train_loss": -39.43706512451172, "global_step": 290451, "epoch": 2400} {"train_loss": -41.58637237548828, "global_step": 290452, "epoch": 2400} {"train_loss": -40.931358337402344, "global_step": 290453, "epoch": 2400} {"train_loss": -40.20497512817383, "global_step": 290454, "epoch": 2400} {"train_loss": -42.84462356567383, "global_step": 290455, "epoch": 2400} {"train_loss": -41.095638275146484, "global_step": 290456, "epoch": 2400} {"train_loss": -41.83982467651367, "global_step": 290457, "epoch": 2400} {"train_loss": -41.9260368347168, "global_step": 290458, "epoch": 2400} {"train_loss": -40.864959716796875, "global_step": 290459, "epoch": 2400} {"train_loss": -42.5321044921875, "global_step": 290460, "epoch": 2400} {"train_loss": -41.144683837890625, "global_step": 290461, "epoch": 2400} {"train_loss": -42.285186767578125, "global_step": 290462, "epoch": 2400} {"train_loss": -41.334571838378906, "global_step": 290463, "epoch": 2400} {"train_loss": -41.76465606689453, "global_step": 290464, "epoch": 2400} {"train_loss": -42.903194427490234, "global_step": 290465, "epoch": 2400} {"train_loss": -41.51893997192383, "global_step": 290466, "epoch": 2400} {"train_loss": -42.34320068359375, "global_step": 290467, "epoch": 2400} {"train_loss": -42.30754852294922, "global_step": 290468, "epoch": 2400} {"train_loss": -42.15930938720703, "global_step": 290469, "epoch": 2400} {"train_loss": -42.98240280151367, "global_step": 290470, "epoch": 2400} {"train_loss": -41.642574310302734, "global_step": 290471, "epoch": 2400} {"train_loss": -43.00834274291992, "global_step": 290472, "epoch": 2400} {"train_loss": -42.95472717285156, "global_step": 290473, "epoch": 2400} {"train_loss": -42.359527587890625, "global_step": 290474, "epoch": 2400} {"train_loss": -43.0643424987793, "global_step": 290475, "epoch": 2400} {"train_loss": -43.49636459350586, "global_step": 290476, "epoch": 2400} {"train_loss": -42.67951202392578, "global_step": 290477, "epoch": 2400} {"train_loss": -43.0494270324707, "global_step": 290478, "epoch": 2400} {"train_loss": -42.57174301147461, "global_step": 290479, "epoch": 2400} {"train_loss": -43.3437614440918, "global_step": 290480, "epoch": 2400} {"train_loss": -43.65255355834961, "global_step": 290481, "epoch": 2400} {"train_loss": -43.06733703613281, "global_step": 290482, "epoch": 2400} {"train_loss": -43.868141174316406, "global_step": 290483, "epoch": 2400} {"train_loss": -43.27459716796875, "global_step": 290484, "epoch": 2400} {"train_loss": -43.65754699707031, "global_step": 290485, "epoch": 2400} {"train_loss": -43.690673828125, "global_step": 290486, "epoch": 2400} {"train_loss": -43.46340560913086, "global_step": 290487, "epoch": 2400} {"train_loss": -43.54372787475586, "global_step": 290488, "epoch": 2400} {"train_loss": -43.22932815551758, "global_step": 290489, "epoch": 2400} {"train_loss": -44.19208908081055, "global_step": 290490, "epoch": 2400} {"train_loss": -42.97111892700195, "global_step": 290491, "epoch": 2400} {"train_loss": -43.77253341674805, "global_step": 290492, "epoch": 2400} {"train_loss": -43.20595169067383, "global_step": 290493, "epoch": 2400} {"train_loss": -44.07464599609375, "global_step": 290494, "epoch": 2400} {"train_loss": -43.91355514526367, "global_step": 290495, "epoch": 2400} {"train_loss": -43.92900085449219, "global_step": 290496, "epoch": 2400} {"train_loss": -43.700782775878906, "global_step": 290497, "epoch": 2400} {"train_loss": -43.93400192260742, "global_step": 290498, "epoch": 2400} {"train_loss": -43.57224655151367, "global_step": 290499, "epoch": 2400} {"train_loss": -43.609642028808594, "global_step": 290500, "epoch": 2400} {"train_loss": -43.87620162963867, "global_step": 290501, "epoch": 2400} {"train_loss": -43.840553283691406, "global_step": 290502, "epoch": 2400} {"train_loss": -44.25447082519531, "global_step": 290503, "epoch": 2400} {"train_loss": -44.463993072509766, "global_step": 290504, "epoch": 2400} {"train_loss": -44.1595458984375, "global_step": 290505, "epoch": 2400} {"train_loss": -44.42609786987305, "global_step": 290506, "epoch": 2400} {"train_loss": -44.57685470581055, "global_step": 290507, "epoch": 2400} {"train_loss": -44.45647048950195, "global_step": 290508, "epoch": 2400} {"train_loss": -44.114959716796875, "global_step": 290509, "epoch": 2400} {"train_loss": -44.4026985168457, "global_step": 290510, "epoch": 2400} {"train_loss": -44.47898483276367, "global_step": 290511, "epoch": 2400} {"train_loss": -44.5644416809082, "global_step": 290512, "epoch": 2400} {"train_loss": -44.39231491088867, "global_step": 290513, "epoch": 2400} {"train_loss": -44.59560012817383, "global_step": 290514, "epoch": 2400} {"train_loss": -43.93966293334961, "global_step": 290515, "epoch": 2400} {"train_loss": -44.369361877441406, "global_step": 290516, "epoch": 2400} {"train_loss": -44.65876388549805, "global_step": 290517, "epoch": 2400} {"train_loss": -44.660430908203125, "global_step": 290518, "epoch": 2400} {"train_loss": -44.55526351928711, "global_step": 290519, "epoch": 2400} {"train_loss": -42.682642723903186, "global_step": 290520, "epoch": 2400, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2434304.25} {"train_loss": -44.416927337646484, "global_step": 290521, "epoch": 2401} {"train_loss": -44.324588775634766, "global_step": 290522, "epoch": 2401} {"train_loss": -44.540042877197266, "global_step": 290523, "epoch": 2401} {"train_loss": -44.03192901611328, "global_step": 290524, "epoch": 2401} {"train_loss": -44.71080017089844, "global_step": 290525, "epoch": 2401} {"train_loss": -44.969642639160156, "global_step": 290526, "epoch": 2401} {"train_loss": -44.03550338745117, "global_step": 290527, "epoch": 2401} {"train_loss": -44.48789596557617, "global_step": 290528, "epoch": 2401} {"train_loss": -44.612274169921875, "global_step": 290529, "epoch": 2401} {"train_loss": -43.975250244140625, "global_step": 290530, "epoch": 2401} {"train_loss": -44.168766021728516, "global_step": 290531, "epoch": 2401} {"train_loss": -44.21792984008789, "global_step": 290532, "epoch": 2401} {"train_loss": -43.944496154785156, "global_step": 290533, "epoch": 2401} {"train_loss": -42.897884368896484, "global_step": 290534, "epoch": 2401} {"train_loss": -41.558536529541016, "global_step": 290535, "epoch": 2401} {"train_loss": -42.89805221557617, "global_step": 290536, "epoch": 2401} {"train_loss": -43.373470306396484, "global_step": 290537, "epoch": 2401} {"train_loss": -43.912452697753906, "global_step": 290538, "epoch": 2401} {"train_loss": -43.982933044433594, "global_step": 290539, "epoch": 2401} {"train_loss": -43.29214096069336, "global_step": 290540, "epoch": 2401} {"train_loss": -42.472591400146484, "global_step": 290541, "epoch": 2401} {"train_loss": -43.07535934448242, "global_step": 290542, "epoch": 2401} {"train_loss": -44.372039794921875, "global_step": 290543, "epoch": 2401} {"train_loss": -44.326637268066406, "global_step": 290544, "epoch": 2401} {"train_loss": -42.923866271972656, "global_step": 290545, "epoch": 2401} {"train_loss": -42.929107666015625, "global_step": 290546, "epoch": 2401} {"train_loss": -43.25484848022461, "global_step": 290547, "epoch": 2401} {"train_loss": -44.041996002197266, "global_step": 290548, "epoch": 2401} {"train_loss": -43.530025482177734, "global_step": 290549, "epoch": 2401} {"train_loss": -43.20176315307617, "global_step": 290550, "epoch": 2401} {"train_loss": -42.96635818481445, "global_step": 290551, "epoch": 2401} {"train_loss": -43.393394470214844, "global_step": 290552, "epoch": 2401} {"train_loss": -44.57241439819336, "global_step": 290553, "epoch": 2401} {"train_loss": -43.381343841552734, "global_step": 290554, "epoch": 2401} {"train_loss": -42.84426498413086, "global_step": 290555, "epoch": 2401} {"train_loss": -42.739131927490234, "global_step": 290556, "epoch": 2401} {"train_loss": -43.279998779296875, "global_step": 290557, "epoch": 2401} {"train_loss": -42.4488410949707, "global_step": 290558, "epoch": 2401} {"train_loss": -42.37222671508789, "global_step": 290559, "epoch": 2401} {"train_loss": -41.44289779663086, "global_step": 290560, "epoch": 2401} {"train_loss": -41.43911361694336, "global_step": 290561, "epoch": 2401} {"train_loss": -42.79431915283203, "global_step": 290562, "epoch": 2401} {"train_loss": -42.16775131225586, "global_step": 290563, "epoch": 2401} {"train_loss": -42.8356819152832, "global_step": 290564, "epoch": 2401} {"train_loss": -43.08185958862305, "global_step": 290565, "epoch": 2401} {"train_loss": -43.1835823059082, "global_step": 290566, "epoch": 2401} {"train_loss": -43.404754638671875, "global_step": 290567, "epoch": 2401} {"train_loss": -41.3044319152832, "global_step": 290568, "epoch": 2401} {"train_loss": -41.80722427368164, "global_step": 290569, "epoch": 2401} {"train_loss": -43.803321838378906, "global_step": 290570, "epoch": 2401} {"train_loss": -42.94855499267578, "global_step": 290571, "epoch": 2401} {"train_loss": -41.935890197753906, "global_step": 290572, "epoch": 2401} {"train_loss": -42.102840423583984, "global_step": 290573, "epoch": 2401} {"train_loss": -42.47085189819336, "global_step": 290574, "epoch": 2401} {"train_loss": -43.10349655151367, "global_step": 290575, "epoch": 2401} {"train_loss": -42.67758560180664, "global_step": 290576, "epoch": 2401} {"train_loss": -41.98958206176758, "global_step": 290577, "epoch": 2401} {"train_loss": -42.91916275024414, "global_step": 290578, "epoch": 2401} {"train_loss": -43.403282165527344, "global_step": 290579, "epoch": 2401} {"train_loss": -41.987396240234375, "global_step": 290580, "epoch": 2401} {"train_loss": -42.66218185424805, "global_step": 290581, "epoch": 2401} {"train_loss": -43.78242874145508, "global_step": 290582, "epoch": 2401} {"train_loss": -41.58207321166992, "global_step": 290583, "epoch": 2401} {"train_loss": -42.77804183959961, "global_step": 290584, "epoch": 2401} {"train_loss": -42.916988372802734, "global_step": 290585, "epoch": 2401} {"train_loss": -41.92683029174805, "global_step": 290586, "epoch": 2401} {"train_loss": -42.33991622924805, "global_step": 290587, "epoch": 2401} {"train_loss": -43.60066604614258, "global_step": 290588, "epoch": 2401} {"train_loss": -43.28908157348633, "global_step": 290589, "epoch": 2401} {"train_loss": -42.12209701538086, "global_step": 290590, "epoch": 2401} {"train_loss": -43.02845001220703, "global_step": 290591, "epoch": 2401} {"train_loss": -42.416542053222656, "global_step": 290592, "epoch": 2401} {"train_loss": -42.8969841003418, "global_step": 290593, "epoch": 2401} {"train_loss": -43.403594970703125, "global_step": 290594, "epoch": 2401} {"train_loss": -41.793174743652344, "global_step": 290595, "epoch": 2401} {"train_loss": -42.87067794799805, "global_step": 290596, "epoch": 2401} {"train_loss": -43.26579284667969, "global_step": 290597, "epoch": 2401} {"train_loss": -42.544857025146484, "global_step": 290598, "epoch": 2401} {"train_loss": -42.21794509887695, "global_step": 290599, "epoch": 2401} {"train_loss": -42.57027053833008, "global_step": 290600, "epoch": 2401} {"train_loss": -42.89901351928711, "global_step": 290601, "epoch": 2401} {"train_loss": -42.06526184082031, "global_step": 290602, "epoch": 2401} {"train_loss": -43.02728271484375, "global_step": 290603, "epoch": 2401} {"train_loss": -42.51911163330078, "global_step": 290604, "epoch": 2401} {"train_loss": -43.77946853637695, "global_step": 290605, "epoch": 2401} {"train_loss": -43.32545471191406, "global_step": 290606, "epoch": 2401} {"train_loss": -43.05631637573242, "global_step": 290607, "epoch": 2401} {"train_loss": -43.794647216796875, "global_step": 290608, "epoch": 2401} {"train_loss": -43.236968994140625, "global_step": 290609, "epoch": 2401} {"train_loss": -43.96253204345703, "global_step": 290610, "epoch": 2401} {"train_loss": -43.20296096801758, "global_step": 290611, "epoch": 2401} {"train_loss": -43.13557052612305, "global_step": 290612, "epoch": 2401} {"train_loss": -43.59008026123047, "global_step": 290613, "epoch": 2401} {"train_loss": -43.48686218261719, "global_step": 290614, "epoch": 2401} {"train_loss": -42.57952117919922, "global_step": 290615, "epoch": 2401} {"train_loss": -43.088958740234375, "global_step": 290616, "epoch": 2401} {"train_loss": -44.321041107177734, "global_step": 290617, "epoch": 2401} {"train_loss": -43.4539794921875, "global_step": 290618, "epoch": 2401} {"train_loss": -43.96089553833008, "global_step": 290619, "epoch": 2401} {"train_loss": -43.95899200439453, "global_step": 290620, "epoch": 2401} {"train_loss": -43.79182052612305, "global_step": 290621, "epoch": 2401} {"train_loss": -43.51427459716797, "global_step": 290622, "epoch": 2401} {"train_loss": -44.16231918334961, "global_step": 290623, "epoch": 2401} {"train_loss": -43.89566421508789, "global_step": 290624, "epoch": 2401} {"train_loss": -44.20426940917969, "global_step": 290625, "epoch": 2401} {"train_loss": -43.87512969970703, "global_step": 290626, "epoch": 2401} {"train_loss": -44.20547103881836, "global_step": 290627, "epoch": 2401} {"train_loss": -43.862545013427734, "global_step": 290628, "epoch": 2401} {"train_loss": -43.40786361694336, "global_step": 290629, "epoch": 2401} {"train_loss": -43.272254943847656, "global_step": 290630, "epoch": 2401} {"train_loss": -44.00553894042969, "global_step": 290631, "epoch": 2401} {"train_loss": -42.919410705566406, "global_step": 290632, "epoch": 2401} {"train_loss": -43.857086181640625, "global_step": 290633, "epoch": 2401} {"train_loss": -42.88393020629883, "global_step": 290634, "epoch": 2401} {"train_loss": -42.999298095703125, "global_step": 290635, "epoch": 2401} {"train_loss": -42.50398254394531, "global_step": 290636, "epoch": 2401} {"train_loss": -43.22809982299805, "global_step": 290637, "epoch": 2401} {"train_loss": -44.642578125, "global_step": 290638, "epoch": 2401} {"train_loss": -44.47866439819336, "global_step": 290639, "epoch": 2401} {"train_loss": -43.590919494628906, "global_step": 290640, "epoch": 2401} {"train_loss": -43.226161988313535, "global_step": 290641, "epoch": 2401, "val_loss": 2500145.0} {"train_loss": -42.72065734863281, "global_step": 290642, "epoch": 2402} {"train_loss": -44.08080291748047, "global_step": 290643, "epoch": 2402} {"train_loss": -42.896705627441406, "global_step": 290644, "epoch": 2402} {"train_loss": -41.905845642089844, "global_step": 290645, "epoch": 2402} {"train_loss": -43.51041793823242, "global_step": 290646, "epoch": 2402} {"train_loss": -43.37883758544922, "global_step": 290647, "epoch": 2402} {"train_loss": -42.795654296875, "global_step": 290648, "epoch": 2402} {"train_loss": -42.131587982177734, "global_step": 290649, "epoch": 2402} {"train_loss": -43.362091064453125, "global_step": 290650, "epoch": 2402} {"train_loss": -43.630008697509766, "global_step": 290651, "epoch": 2402} {"train_loss": -43.08376693725586, "global_step": 290652, "epoch": 2402} {"train_loss": -43.44085693359375, "global_step": 290653, "epoch": 2402} {"train_loss": -43.96339797973633, "global_step": 290654, "epoch": 2402} {"train_loss": -44.22328186035156, "global_step": 290655, "epoch": 2402} {"train_loss": -43.329734802246094, "global_step": 290656, "epoch": 2402} {"train_loss": -43.018619537353516, "global_step": 290657, "epoch": 2402} {"train_loss": -43.675350189208984, "global_step": 290658, "epoch": 2402} {"train_loss": -43.79402542114258, "global_step": 290659, "epoch": 2402} {"train_loss": -43.13233184814453, "global_step": 290660, "epoch": 2402} {"train_loss": -42.88496017456055, "global_step": 290661, "epoch": 2402} {"train_loss": -42.42267990112305, "global_step": 290662, "epoch": 2402} {"train_loss": -44.340938568115234, "global_step": 290663, "epoch": 2402} {"train_loss": -44.02099609375, "global_step": 290664, "epoch": 2402} {"train_loss": -43.02762985229492, "global_step": 290665, "epoch": 2402} {"train_loss": -43.11552047729492, "global_step": 290666, "epoch": 2402} {"train_loss": -43.554100036621094, "global_step": 290667, "epoch": 2402} {"train_loss": -44.32353591918945, "global_step": 290668, "epoch": 2402} {"train_loss": -43.264305114746094, "global_step": 290669, "epoch": 2402} {"train_loss": -43.33729934692383, "global_step": 290670, "epoch": 2402} {"train_loss": -43.50534439086914, "global_step": 290671, "epoch": 2402} {"train_loss": -44.03034591674805, "global_step": 290672, "epoch": 2402} {"train_loss": -43.87984848022461, "global_step": 290673, "epoch": 2402} {"train_loss": -42.697818756103516, "global_step": 290674, "epoch": 2402} {"train_loss": -43.51351547241211, "global_step": 290675, "epoch": 2402} {"train_loss": -43.90767288208008, "global_step": 290676, "epoch": 2402} {"train_loss": -43.72725296020508, "global_step": 290677, "epoch": 2402} {"train_loss": -43.95624923706055, "global_step": 290678, "epoch": 2402} {"train_loss": -44.04448318481445, "global_step": 290679, "epoch": 2402} {"train_loss": -42.98418426513672, "global_step": 290680, "epoch": 2402} {"train_loss": -42.73970413208008, "global_step": 290681, "epoch": 2402} {"train_loss": -43.67521286010742, "global_step": 290682, "epoch": 2402} {"train_loss": -41.91342544555664, "global_step": 290683, "epoch": 2402} {"train_loss": -42.0858154296875, "global_step": 290684, "epoch": 2402} {"train_loss": -43.69089126586914, "global_step": 290685, "epoch": 2402} {"train_loss": -42.619937896728516, "global_step": 290686, "epoch": 2402} {"train_loss": -40.73641586303711, "global_step": 290687, "epoch": 2402} {"train_loss": -43.42812728881836, "global_step": 290688, "epoch": 2402} {"train_loss": -43.510616302490234, "global_step": 290689, "epoch": 2402} {"train_loss": -43.72370529174805, "global_step": 290690, "epoch": 2402} {"train_loss": -43.565303802490234, "global_step": 290691, "epoch": 2402} {"train_loss": -43.27798080444336, "global_step": 290692, "epoch": 2402} {"train_loss": -42.457733154296875, "global_step": 290693, "epoch": 2402} {"train_loss": -43.61077880859375, "global_step": 290694, "epoch": 2402} {"train_loss": -43.64141845703125, "global_step": 290695, "epoch": 2402} {"train_loss": -42.018184661865234, "global_step": 290696, "epoch": 2402} {"train_loss": -42.57979965209961, "global_step": 290697, "epoch": 2402} {"train_loss": -43.79914093017578, "global_step": 290698, "epoch": 2402} {"train_loss": -42.843353271484375, "global_step": 290699, "epoch": 2402} {"train_loss": -42.79431915283203, "global_step": 290700, "epoch": 2402} {"train_loss": -43.100921630859375, "global_step": 290701, "epoch": 2402} {"train_loss": -43.471702575683594, "global_step": 290702, "epoch": 2402} {"train_loss": -42.905479431152344, "global_step": 290703, "epoch": 2402} {"train_loss": -42.869789123535156, "global_step": 290704, "epoch": 2402} {"train_loss": -43.60812759399414, "global_step": 290705, "epoch": 2402} {"train_loss": -42.31962203979492, "global_step": 290706, "epoch": 2402} {"train_loss": -39.532413482666016, "global_step": 290707, "epoch": 2402} {"train_loss": -41.07790756225586, "global_step": 290708, "epoch": 2402} {"train_loss": -42.81386184692383, "global_step": 290709, "epoch": 2402} {"train_loss": -41.6727180480957, "global_step": 290710, "epoch": 2402} {"train_loss": -42.480464935302734, "global_step": 290711, "epoch": 2402} {"train_loss": -42.36220932006836, "global_step": 290712, "epoch": 2402} {"train_loss": -42.23410415649414, "global_step": 290713, "epoch": 2402} {"train_loss": -41.34564208984375, "global_step": 290714, "epoch": 2402} {"train_loss": -43.27376174926758, "global_step": 290715, "epoch": 2402} {"train_loss": -42.18081283569336, "global_step": 290716, "epoch": 2402} {"train_loss": -43.1199836730957, "global_step": 290717, "epoch": 2402} {"train_loss": -42.34507369995117, "global_step": 290718, "epoch": 2402} {"train_loss": -43.967559814453125, "global_step": 290719, "epoch": 2402} {"train_loss": -41.31291961669922, "global_step": 290720, "epoch": 2402} {"train_loss": -42.620635986328125, "global_step": 290721, "epoch": 2402} {"train_loss": -42.940765380859375, "global_step": 290722, "epoch": 2402} {"train_loss": -41.8903923034668, "global_step": 290723, "epoch": 2402} {"train_loss": -41.01606369018555, "global_step": 290724, "epoch": 2402} {"train_loss": -42.79883575439453, "global_step": 290725, "epoch": 2402} {"train_loss": -42.0317497253418, "global_step": 290726, "epoch": 2402} {"train_loss": -42.92464828491211, "global_step": 290727, "epoch": 2402} {"train_loss": -42.69033432006836, "global_step": 290728, "epoch": 2402} {"train_loss": -42.836219787597656, "global_step": 290729, "epoch": 2402} {"train_loss": -42.24628829956055, "global_step": 290730, "epoch": 2402} {"train_loss": -43.05656051635742, "global_step": 290731, "epoch": 2402} {"train_loss": -42.61088943481445, "global_step": 290732, "epoch": 2402} {"train_loss": -43.003719329833984, "global_step": 290733, "epoch": 2402} {"train_loss": -41.813453674316406, "global_step": 290734, "epoch": 2402} {"train_loss": -42.448486328125, "global_step": 290735, "epoch": 2402} {"train_loss": -42.695980072021484, "global_step": 290736, "epoch": 2402} {"train_loss": -42.82817077636719, "global_step": 290737, "epoch": 2402} {"train_loss": -42.739803314208984, "global_step": 290738, "epoch": 2402} {"train_loss": -43.4737548828125, "global_step": 290739, "epoch": 2402} {"train_loss": -42.49892044067383, "global_step": 290740, "epoch": 2402} {"train_loss": -42.78852844238281, "global_step": 290741, "epoch": 2402} {"train_loss": -43.346588134765625, "global_step": 290742, "epoch": 2402} {"train_loss": -42.297935485839844, "global_step": 290743, "epoch": 2402} {"train_loss": -43.727272033691406, "global_step": 290744, "epoch": 2402} {"train_loss": -42.9106559753418, "global_step": 290745, "epoch": 2402} {"train_loss": -42.8955078125, "global_step": 290746, "epoch": 2402} {"train_loss": -44.028560638427734, "global_step": 290747, "epoch": 2402} {"train_loss": -42.31033706665039, "global_step": 290748, "epoch": 2402} {"train_loss": -43.635257720947266, "global_step": 290749, "epoch": 2402} {"train_loss": -42.79697036743164, "global_step": 290750, "epoch": 2402} {"train_loss": -43.4703369140625, "global_step": 290751, "epoch": 2402} {"train_loss": -43.62858581542969, "global_step": 290752, "epoch": 2402} {"train_loss": -42.0003776550293, "global_step": 290753, "epoch": 2402} {"train_loss": -44.12836456298828, "global_step": 290754, "epoch": 2402} {"train_loss": -42.2011833190918, "global_step": 290755, "epoch": 2402} {"train_loss": -43.354671478271484, "global_step": 290756, "epoch": 2402} {"train_loss": -43.3773307800293, "global_step": 290757, "epoch": 2402} {"train_loss": -43.109703063964844, "global_step": 290758, "epoch": 2402} {"train_loss": -44.33441925048828, "global_step": 290759, "epoch": 2402} {"train_loss": -43.286556243896484, "global_step": 290760, "epoch": 2402} {"train_loss": -43.83478546142578, "global_step": 290761, "epoch": 2402} {"train_loss": -42.980664812828884, "global_step": 290762, "epoch": 2402, "val_loss": 2464534.75} {"train_loss": -43.59556579589844, "global_step": 290763, "epoch": 2403} {"train_loss": -43.64762496948242, "global_step": 290764, "epoch": 2403} {"train_loss": -43.78988265991211, "global_step": 290765, "epoch": 2403} {"train_loss": -44.01231002807617, "global_step": 290766, "epoch": 2403} {"train_loss": -43.79902267456055, "global_step": 290767, "epoch": 2403} {"train_loss": -43.89971923828125, "global_step": 290768, "epoch": 2403} {"train_loss": -43.96368408203125, "global_step": 290769, "epoch": 2403} {"train_loss": -44.79716110229492, "global_step": 290770, "epoch": 2403} {"train_loss": -43.83135986328125, "global_step": 290771, "epoch": 2403} {"train_loss": -43.84857177734375, "global_step": 290772, "epoch": 2403} {"train_loss": -44.10200119018555, "global_step": 290773, "epoch": 2403} {"train_loss": -43.99855041503906, "global_step": 290774, "epoch": 2403} {"train_loss": -44.224082946777344, "global_step": 290775, "epoch": 2403} {"train_loss": -42.91615676879883, "global_step": 290776, "epoch": 2403} {"train_loss": -42.84231948852539, "global_step": 290777, "epoch": 2403} {"train_loss": -44.02708053588867, "global_step": 290778, "epoch": 2403} {"train_loss": -44.112857818603516, "global_step": 290779, "epoch": 2403} {"train_loss": -43.647972106933594, "global_step": 290780, "epoch": 2403} {"train_loss": -44.06778335571289, "global_step": 290781, "epoch": 2403} {"train_loss": -43.95353317260742, "global_step": 290782, "epoch": 2403} {"train_loss": -43.20981979370117, "global_step": 290783, "epoch": 2403} {"train_loss": -44.08002471923828, "global_step": 290784, "epoch": 2403} {"train_loss": -43.63408279418945, "global_step": 290785, "epoch": 2403} {"train_loss": -44.34150314331055, "global_step": 290786, "epoch": 2403} {"train_loss": -43.93435287475586, "global_step": 290787, "epoch": 2403} {"train_loss": -42.49618148803711, "global_step": 290788, "epoch": 2403} {"train_loss": -43.934715270996094, "global_step": 290789, "epoch": 2403} {"train_loss": -43.059322357177734, "global_step": 290790, "epoch": 2403} {"train_loss": -43.396949768066406, "global_step": 290791, "epoch": 2403} {"train_loss": -44.08466720581055, "global_step": 290792, "epoch": 2403} {"train_loss": -43.29063034057617, "global_step": 290793, "epoch": 2403} {"train_loss": -44.27344512939453, "global_step": 290794, "epoch": 2403} {"train_loss": -44.33706283569336, "global_step": 290795, "epoch": 2403} {"train_loss": -43.023292541503906, "global_step": 290796, "epoch": 2403} {"train_loss": -44.00582504272461, "global_step": 290797, "epoch": 2403} {"train_loss": -43.616790771484375, "global_step": 290798, "epoch": 2403} {"train_loss": -44.41802978515625, "global_step": 290799, "epoch": 2403} {"train_loss": -43.683773040771484, "global_step": 290800, "epoch": 2403} {"train_loss": -43.488887786865234, "global_step": 290801, "epoch": 2403} {"train_loss": -44.13924026489258, "global_step": 290802, "epoch": 2403} {"train_loss": -43.70035934448242, "global_step": 290803, "epoch": 2403} {"train_loss": -43.56018829345703, "global_step": 290804, "epoch": 2403} {"train_loss": -43.082157135009766, "global_step": 290805, "epoch": 2403} {"train_loss": -43.777313232421875, "global_step": 290806, "epoch": 2403} {"train_loss": -44.13788604736328, "global_step": 290807, "epoch": 2403} {"train_loss": -44.51658248901367, "global_step": 290808, "epoch": 2403} {"train_loss": -43.902645111083984, "global_step": 290809, "epoch": 2403} {"train_loss": -44.027278900146484, "global_step": 290810, "epoch": 2403} {"train_loss": -44.10408401489258, "global_step": 290811, "epoch": 2403} {"train_loss": -44.05434036254883, "global_step": 290812, "epoch": 2403} {"train_loss": -44.09638214111328, "global_step": 290813, "epoch": 2403} {"train_loss": -43.88908004760742, "global_step": 290814, "epoch": 2403} {"train_loss": -44.603328704833984, "global_step": 290815, "epoch": 2403} {"train_loss": -43.94567108154297, "global_step": 290816, "epoch": 2403} {"train_loss": -44.24192428588867, "global_step": 290817, "epoch": 2403} {"train_loss": -44.52519607543945, "global_step": 290818, "epoch": 2403} {"train_loss": -44.22603988647461, "global_step": 290819, "epoch": 2403} {"train_loss": -43.94546127319336, "global_step": 290820, "epoch": 2403} {"train_loss": -43.747314453125, "global_step": 290821, "epoch": 2403} {"train_loss": -44.09821701049805, "global_step": 290822, "epoch": 2403} {"train_loss": -44.26525115966797, "global_step": 290823, "epoch": 2403} {"train_loss": -43.94346618652344, "global_step": 290824, "epoch": 2403} {"train_loss": -44.085289001464844, "global_step": 290825, "epoch": 2403} {"train_loss": -44.110328674316406, "global_step": 290826, "epoch": 2403} {"train_loss": -43.25892639160156, "global_step": 290827, "epoch": 2403} {"train_loss": -43.7608528137207, "global_step": 290828, "epoch": 2403} {"train_loss": -44.172080993652344, "global_step": 290829, "epoch": 2403} {"train_loss": -41.708187103271484, "global_step": 290830, "epoch": 2403} {"train_loss": -42.713653564453125, "global_step": 290831, "epoch": 2403} {"train_loss": -43.489871978759766, "global_step": 290832, "epoch": 2403} {"train_loss": -43.655517578125, "global_step": 290833, "epoch": 2403} {"train_loss": -42.52305221557617, "global_step": 290834, "epoch": 2403} {"train_loss": -41.88468933105469, "global_step": 290835, "epoch": 2403} {"train_loss": -43.881710052490234, "global_step": 290836, "epoch": 2403} {"train_loss": -43.497188568115234, "global_step": 290837, "epoch": 2403} {"train_loss": -44.16718673706055, "global_step": 290838, "epoch": 2403} {"train_loss": -42.712947845458984, "global_step": 290839, "epoch": 2403} {"train_loss": -43.50416946411133, "global_step": 290840, "epoch": 2403} {"train_loss": -42.842987060546875, "global_step": 290841, "epoch": 2403} {"train_loss": -43.93856430053711, "global_step": 290842, "epoch": 2403} {"train_loss": -43.637420654296875, "global_step": 290843, "epoch": 2403} {"train_loss": -43.88605880737305, "global_step": 290844, "epoch": 2403} {"train_loss": -42.602718353271484, "global_step": 290845, "epoch": 2403} {"train_loss": -42.15956497192383, "global_step": 290846, "epoch": 2403} {"train_loss": -43.98635482788086, "global_step": 290847, "epoch": 2403} {"train_loss": -43.954376220703125, "global_step": 290848, "epoch": 2403} {"train_loss": -43.2418212890625, "global_step": 290849, "epoch": 2403} {"train_loss": -43.993934631347656, "global_step": 290850, "epoch": 2403} {"train_loss": -43.86211013793945, "global_step": 290851, "epoch": 2403} {"train_loss": -43.5980339050293, "global_step": 290852, "epoch": 2403} {"train_loss": -43.22041702270508, "global_step": 290853, "epoch": 2403} {"train_loss": -43.99025344848633, "global_step": 290854, "epoch": 2403} {"train_loss": -43.240413665771484, "global_step": 290855, "epoch": 2403} {"train_loss": -44.07175827026367, "global_step": 290856, "epoch": 2403} {"train_loss": -42.8748779296875, "global_step": 290857, "epoch": 2403} {"train_loss": -43.223873138427734, "global_step": 290858, "epoch": 2403} {"train_loss": -43.266448974609375, "global_step": 290859, "epoch": 2403} {"train_loss": -43.39786911010742, "global_step": 290860, "epoch": 2403} {"train_loss": -43.80506896972656, "global_step": 290861, "epoch": 2403} {"train_loss": -43.4849739074707, "global_step": 290862, "epoch": 2403} {"train_loss": -42.56126022338867, "global_step": 290863, "epoch": 2403} {"train_loss": -41.9552116394043, "global_step": 290864, "epoch": 2403} {"train_loss": -43.1065559387207, "global_step": 290865, "epoch": 2403} {"train_loss": -40.9542121887207, "global_step": 290866, "epoch": 2403} {"train_loss": -42.41796875, "global_step": 290867, "epoch": 2403} {"train_loss": -42.395286560058594, "global_step": 290868, "epoch": 2403} {"train_loss": -40.81354522705078, "global_step": 290869, "epoch": 2403} {"train_loss": -42.61370849609375, "global_step": 290870, "epoch": 2403} {"train_loss": -39.71257400512695, "global_step": 290871, "epoch": 2403} {"train_loss": -42.67342758178711, "global_step": 290872, "epoch": 2403} {"train_loss": -40.77920913696289, "global_step": 290873, "epoch": 2403} {"train_loss": -41.853397369384766, "global_step": 290874, "epoch": 2403} {"train_loss": -43.399253845214844, "global_step": 290875, "epoch": 2403} {"train_loss": -41.4321403503418, "global_step": 290876, "epoch": 2403} {"train_loss": -42.27855682373047, "global_step": 290877, "epoch": 2403} {"train_loss": -43.52358627319336, "global_step": 290878, "epoch": 2403} {"train_loss": -42.00940704345703, "global_step": 290879, "epoch": 2403} {"train_loss": -41.2035026550293, "global_step": 290880, "epoch": 2403} {"train_loss": -43.51327133178711, "global_step": 290881, "epoch": 2403} {"train_loss": -40.85952377319336, "global_step": 290882, "epoch": 2403} {"train_loss": -43.39740151019136, "global_step": 290883, "epoch": 2403, "val_loss": 2483933.75} {"train_loss": -42.35260009765625, "global_step": 290884, "epoch": 2404} {"train_loss": -43.433013916015625, "global_step": 290885, "epoch": 2404} {"train_loss": -43.42829132080078, "global_step": 290886, "epoch": 2404} {"train_loss": -42.93353271484375, "global_step": 290887, "epoch": 2404} {"train_loss": -43.30046463012695, "global_step": 290888, "epoch": 2404} {"train_loss": -43.234676361083984, "global_step": 290889, "epoch": 2404} {"train_loss": -42.61002731323242, "global_step": 290890, "epoch": 2404} {"train_loss": -42.90583801269531, "global_step": 290891, "epoch": 2404} {"train_loss": -43.83181381225586, "global_step": 290892, "epoch": 2404} {"train_loss": -43.14736557006836, "global_step": 290893, "epoch": 2404} {"train_loss": -41.95139694213867, "global_step": 290894, "epoch": 2404} {"train_loss": -42.3296012878418, "global_step": 290895, "epoch": 2404} {"train_loss": -42.98711395263672, "global_step": 290896, "epoch": 2404} {"train_loss": -42.08351516723633, "global_step": 290897, "epoch": 2404} {"train_loss": -42.45579147338867, "global_step": 290898, "epoch": 2404} {"train_loss": -42.53120040893555, "global_step": 290899, "epoch": 2404} {"train_loss": -43.26704025268555, "global_step": 290900, "epoch": 2404} {"train_loss": -43.366973876953125, "global_step": 290901, "epoch": 2404} {"train_loss": -43.012081146240234, "global_step": 290902, "epoch": 2404} {"train_loss": -43.32828140258789, "global_step": 290903, "epoch": 2404} {"train_loss": -43.24277877807617, "global_step": 290904, "epoch": 2404} {"train_loss": -42.86750030517578, "global_step": 290905, "epoch": 2404} {"train_loss": -43.4447021484375, "global_step": 290906, "epoch": 2404} {"train_loss": -43.51418685913086, "global_step": 290907, "epoch": 2404} {"train_loss": -43.31480026245117, "global_step": 290908, "epoch": 2404} {"train_loss": -43.84986877441406, "global_step": 290909, "epoch": 2404} {"train_loss": -43.604434967041016, "global_step": 290910, "epoch": 2404} {"train_loss": -43.6513557434082, "global_step": 290911, "epoch": 2404} {"train_loss": -43.50699234008789, "global_step": 290912, "epoch": 2404} {"train_loss": -43.4535026550293, "global_step": 290913, "epoch": 2404} {"train_loss": -44.23651885986328, "global_step": 290914, "epoch": 2404} {"train_loss": -42.88810729980469, "global_step": 290915, "epoch": 2404} {"train_loss": -43.40450668334961, "global_step": 290916, "epoch": 2404} {"train_loss": -43.065589904785156, "global_step": 290917, "epoch": 2404} {"train_loss": -43.47629165649414, "global_step": 290918, "epoch": 2404} {"train_loss": -43.06963348388672, "global_step": 290919, "epoch": 2404} {"train_loss": -42.85945510864258, "global_step": 290920, "epoch": 2404} {"train_loss": -44.004783630371094, "global_step": 290921, "epoch": 2404} {"train_loss": -42.914058685302734, "global_step": 290922, "epoch": 2404} {"train_loss": -44.043785095214844, "global_step": 290923, "epoch": 2404} {"train_loss": -43.343170166015625, "global_step": 290924, "epoch": 2404} {"train_loss": -43.09321212768555, "global_step": 290925, "epoch": 2404} {"train_loss": -44.09176254272461, "global_step": 290926, "epoch": 2404} {"train_loss": -43.62330627441406, "global_step": 290927, "epoch": 2404} {"train_loss": -44.0446662902832, "global_step": 290928, "epoch": 2404} {"train_loss": -43.67082595825195, "global_step": 290929, "epoch": 2404} {"train_loss": -44.290462493896484, "global_step": 290930, "epoch": 2404} {"train_loss": -43.35226058959961, "global_step": 290931, "epoch": 2404} {"train_loss": -44.226768493652344, "global_step": 290932, "epoch": 2404} {"train_loss": -44.13729476928711, "global_step": 290933, "epoch": 2404} {"train_loss": -43.52617645263672, "global_step": 290934, "epoch": 2404} {"train_loss": -43.86509323120117, "global_step": 290935, "epoch": 2404} {"train_loss": -43.297080993652344, "global_step": 290936, "epoch": 2404} {"train_loss": -43.895957946777344, "global_step": 290937, "epoch": 2404} {"train_loss": -43.45203399658203, "global_step": 290938, "epoch": 2404} {"train_loss": -43.568519592285156, "global_step": 290939, "epoch": 2404} {"train_loss": -44.031551361083984, "global_step": 290940, "epoch": 2404} {"train_loss": -43.37769317626953, "global_step": 290941, "epoch": 2404} {"train_loss": -44.36115646362305, "global_step": 290942, "epoch": 2404} {"train_loss": -43.65491485595703, "global_step": 290943, "epoch": 2404} {"train_loss": -43.73429489135742, "global_step": 290944, "epoch": 2404} {"train_loss": -44.19086837768555, "global_step": 290945, "epoch": 2404} {"train_loss": -42.68923568725586, "global_step": 290946, "epoch": 2404} {"train_loss": -44.232723236083984, "global_step": 290947, "epoch": 2404} {"train_loss": -42.83386993408203, "global_step": 290948, "epoch": 2404} {"train_loss": -43.07307815551758, "global_step": 290949, "epoch": 2404} {"train_loss": -44.29522705078125, "global_step": 290950, "epoch": 2404} {"train_loss": -43.37433624267578, "global_step": 290951, "epoch": 2404} {"train_loss": -43.00836944580078, "global_step": 290952, "epoch": 2404} {"train_loss": -43.19144821166992, "global_step": 290953, "epoch": 2404} {"train_loss": -43.3385124206543, "global_step": 290954, "epoch": 2404} {"train_loss": -43.173702239990234, "global_step": 290955, "epoch": 2404} {"train_loss": -41.64118194580078, "global_step": 290956, "epoch": 2404} {"train_loss": -42.62394332885742, "global_step": 290957, "epoch": 2404} {"train_loss": -44.1656379699707, "global_step": 290958, "epoch": 2404} {"train_loss": -42.588985443115234, "global_step": 290959, "epoch": 2404} {"train_loss": -41.15291976928711, "global_step": 290960, "epoch": 2404} {"train_loss": -43.531715393066406, "global_step": 290961, "epoch": 2404} {"train_loss": -43.270870208740234, "global_step": 290962, "epoch": 2404} {"train_loss": -41.218910217285156, "global_step": 290963, "epoch": 2404} {"train_loss": -43.86524963378906, "global_step": 290964, "epoch": 2404} {"train_loss": -41.225772857666016, "global_step": 290965, "epoch": 2404} {"train_loss": -41.59726333618164, "global_step": 290966, "epoch": 2404} {"train_loss": -43.18721389770508, "global_step": 290967, "epoch": 2404} {"train_loss": -42.59572982788086, "global_step": 290968, "epoch": 2404} {"train_loss": -42.19809341430664, "global_step": 290969, "epoch": 2404} {"train_loss": -41.90150833129883, "global_step": 290970, "epoch": 2404} {"train_loss": -43.39712905883789, "global_step": 290971, "epoch": 2404} {"train_loss": -43.136688232421875, "global_step": 290972, "epoch": 2404} {"train_loss": -42.42701721191406, "global_step": 290973, "epoch": 2404} {"train_loss": -42.89624786376953, "global_step": 290974, "epoch": 2404} {"train_loss": -43.34185791015625, "global_step": 290975, "epoch": 2404} {"train_loss": -43.26497268676758, "global_step": 290976, "epoch": 2404} {"train_loss": -43.63074493408203, "global_step": 290977, "epoch": 2404} {"train_loss": -43.89826202392578, "global_step": 290978, "epoch": 2404} {"train_loss": -43.773372650146484, "global_step": 290979, "epoch": 2404} {"train_loss": -43.97372055053711, "global_step": 290980, "epoch": 2404} {"train_loss": -43.41136169433594, "global_step": 290981, "epoch": 2404} {"train_loss": -44.2325325012207, "global_step": 290982, "epoch": 2404} {"train_loss": -43.08835983276367, "global_step": 290983, "epoch": 2404} {"train_loss": -44.608375549316406, "global_step": 290984, "epoch": 2404} {"train_loss": -43.80535888671875, "global_step": 290985, "epoch": 2404} {"train_loss": -43.56972885131836, "global_step": 290986, "epoch": 2404} {"train_loss": -44.35468673706055, "global_step": 290987, "epoch": 2404} {"train_loss": -42.970741271972656, "global_step": 290988, "epoch": 2404} {"train_loss": -43.61825180053711, "global_step": 290989, "epoch": 2404} {"train_loss": -43.87188720703125, "global_step": 290990, "epoch": 2404} {"train_loss": -44.45827865600586, "global_step": 290991, "epoch": 2404} {"train_loss": -43.547115325927734, "global_step": 290992, "epoch": 2404} {"train_loss": -42.32684326171875, "global_step": 290993, "epoch": 2404} {"train_loss": -43.01866912841797, "global_step": 290994, "epoch": 2404} {"train_loss": -42.72381591796875, "global_step": 290995, "epoch": 2404} {"train_loss": -43.38667678833008, "global_step": 290996, "epoch": 2404} {"train_loss": -43.07318115234375, "global_step": 290997, "epoch": 2404} {"train_loss": -41.4810791015625, "global_step": 290998, "epoch": 2404} {"train_loss": -42.324058532714844, "global_step": 290999, "epoch": 2404} {"train_loss": -43.187721252441406, "global_step": 291000, "epoch": 2404} {"train_loss": -43.10071563720703, "global_step": 291001, "epoch": 2404} {"train_loss": -43.60970687866211, "global_step": 291002, "epoch": 2404} {"train_loss": -42.651729583740234, "global_step": 291003, "epoch": 2404} {"train_loss": -43.24333673272251, "global_step": 291004, "epoch": 2404, "val_loss": 2603599.0} {"train_loss": -42.75434494018555, "global_step": 291005, "epoch": 2405} {"train_loss": -43.5546875, "global_step": 291006, "epoch": 2405} {"train_loss": -42.73393630981445, "global_step": 291007, "epoch": 2405} {"train_loss": -42.14400863647461, "global_step": 291008, "epoch": 2405} {"train_loss": -42.59945297241211, "global_step": 291009, "epoch": 2405} {"train_loss": -43.127967834472656, "global_step": 291010, "epoch": 2405} {"train_loss": -43.65420150756836, "global_step": 291011, "epoch": 2405} {"train_loss": -43.21821212768555, "global_step": 291012, "epoch": 2405} {"train_loss": -43.01063919067383, "global_step": 291013, "epoch": 2405} {"train_loss": -44.1838493347168, "global_step": 291014, "epoch": 2405} {"train_loss": -43.224308013916016, "global_step": 291015, "epoch": 2405} {"train_loss": -43.08758544921875, "global_step": 291016, "epoch": 2405} {"train_loss": -43.248390197753906, "global_step": 291017, "epoch": 2405} {"train_loss": -43.75862121582031, "global_step": 291018, "epoch": 2405} {"train_loss": -43.715206146240234, "global_step": 291019, "epoch": 2405} {"train_loss": -43.33364486694336, "global_step": 291020, "epoch": 2405} {"train_loss": -44.099876403808594, "global_step": 291021, "epoch": 2405} {"train_loss": -44.108951568603516, "global_step": 291022, "epoch": 2405} {"train_loss": -43.280941009521484, "global_step": 291023, "epoch": 2405} {"train_loss": -44.2833366394043, "global_step": 291024, "epoch": 2405} {"train_loss": -43.98602294921875, "global_step": 291025, "epoch": 2405} {"train_loss": -44.02861785888672, "global_step": 291026, "epoch": 2405} {"train_loss": -44.28805160522461, "global_step": 291027, "epoch": 2405} {"train_loss": -44.00899124145508, "global_step": 291028, "epoch": 2405} {"train_loss": -44.339881896972656, "global_step": 291029, "epoch": 2405} {"train_loss": -43.88280487060547, "global_step": 291030, "epoch": 2405} {"train_loss": -44.55229187011719, "global_step": 291031, "epoch": 2405} {"train_loss": -44.200687408447266, "global_step": 291032, "epoch": 2405} {"train_loss": -44.468055725097656, "global_step": 291033, "epoch": 2405} {"train_loss": -43.58583450317383, "global_step": 291034, "epoch": 2405} {"train_loss": -44.17442321777344, "global_step": 291035, "epoch": 2405} {"train_loss": -44.2494010925293, "global_step": 291036, "epoch": 2405} {"train_loss": -43.58759307861328, "global_step": 291037, "epoch": 2405} {"train_loss": -43.95864486694336, "global_step": 291038, "epoch": 2405} {"train_loss": -44.31525421142578, "global_step": 291039, "epoch": 2405} {"train_loss": -44.24514389038086, "global_step": 291040, "epoch": 2405} {"train_loss": -44.2204475402832, "global_step": 291041, "epoch": 2405} {"train_loss": -44.350582122802734, "global_step": 291042, "epoch": 2405} {"train_loss": -44.374488830566406, "global_step": 291043, "epoch": 2405} {"train_loss": -43.68476104736328, "global_step": 291044, "epoch": 2405} {"train_loss": -43.440574645996094, "global_step": 291045, "epoch": 2405} {"train_loss": -43.43683624267578, "global_step": 291046, "epoch": 2405} {"train_loss": -44.179683685302734, "global_step": 291047, "epoch": 2405} {"train_loss": -44.42096710205078, "global_step": 291048, "epoch": 2405} {"train_loss": -43.698795318603516, "global_step": 291049, "epoch": 2405} {"train_loss": -43.74040222167969, "global_step": 291050, "epoch": 2405} {"train_loss": -44.05230712890625, "global_step": 291051, "epoch": 2405} {"train_loss": -43.70565414428711, "global_step": 291052, "epoch": 2405} {"train_loss": -43.71285629272461, "global_step": 291053, "epoch": 2405} {"train_loss": -43.7295036315918, "global_step": 291054, "epoch": 2405} {"train_loss": -44.53849411010742, "global_step": 291055, "epoch": 2405} {"train_loss": -44.33831024169922, "global_step": 291056, "epoch": 2405} {"train_loss": -44.69495391845703, "global_step": 291057, "epoch": 2405} {"train_loss": -43.98942565917969, "global_step": 291058, "epoch": 2405} {"train_loss": -43.91593551635742, "global_step": 291059, "epoch": 2405} {"train_loss": -43.988704681396484, "global_step": 291060, "epoch": 2405} {"train_loss": -44.10327911376953, "global_step": 291061, "epoch": 2405} {"train_loss": -43.63043212890625, "global_step": 291062, "epoch": 2405} {"train_loss": -44.0357780456543, "global_step": 291063, "epoch": 2405} {"train_loss": -43.370452880859375, "global_step": 291064, "epoch": 2405} {"train_loss": -43.59381866455078, "global_step": 291065, "epoch": 2405} {"train_loss": -44.44576644897461, "global_step": 291066, "epoch": 2405} {"train_loss": -43.73106002807617, "global_step": 291067, "epoch": 2405} {"train_loss": -43.85598373413086, "global_step": 291068, "epoch": 2405} {"train_loss": -44.11256408691406, "global_step": 291069, "epoch": 2405} {"train_loss": -43.61260986328125, "global_step": 291070, "epoch": 2405} {"train_loss": -44.552894592285156, "global_step": 291071, "epoch": 2405} {"train_loss": -44.89356994628906, "global_step": 291072, "epoch": 2405} {"train_loss": -43.6800537109375, "global_step": 291073, "epoch": 2405} {"train_loss": -44.20538330078125, "global_step": 291074, "epoch": 2405} {"train_loss": -44.52642822265625, "global_step": 291075, "epoch": 2405} {"train_loss": -44.18793869018555, "global_step": 291076, "epoch": 2405} {"train_loss": -43.67584228515625, "global_step": 291077, "epoch": 2405} {"train_loss": -43.69355392456055, "global_step": 291078, "epoch": 2405} {"train_loss": -43.3590202331543, "global_step": 291079, "epoch": 2405} {"train_loss": -44.78983688354492, "global_step": 291080, "epoch": 2405} {"train_loss": -43.3819465637207, "global_step": 291081, "epoch": 2405} {"train_loss": -41.88547897338867, "global_step": 291082, "epoch": 2405} {"train_loss": -44.33905029296875, "global_step": 291083, "epoch": 2405} {"train_loss": -43.718441009521484, "global_step": 291084, "epoch": 2405} {"train_loss": -42.43365478515625, "global_step": 291085, "epoch": 2405} {"train_loss": -44.10152816772461, "global_step": 291086, "epoch": 2405} {"train_loss": -43.3875846862793, "global_step": 291087, "epoch": 2405} {"train_loss": -42.59788131713867, "global_step": 291088, "epoch": 2405} {"train_loss": -43.1875, "global_step": 291089, "epoch": 2405} {"train_loss": -44.00931930541992, "global_step": 291090, "epoch": 2405} {"train_loss": -43.83552551269531, "global_step": 291091, "epoch": 2405} {"train_loss": -41.9796257019043, "global_step": 291092, "epoch": 2405} {"train_loss": -43.05946731567383, "global_step": 291093, "epoch": 2405} {"train_loss": -43.49024200439453, "global_step": 291094, "epoch": 2405} {"train_loss": -42.66794967651367, "global_step": 291095, "epoch": 2405} {"train_loss": -43.0703239440918, "global_step": 291096, "epoch": 2405} {"train_loss": -41.952693939208984, "global_step": 291097, "epoch": 2405} {"train_loss": -43.621803283691406, "global_step": 291098, "epoch": 2405} {"train_loss": -42.6556396484375, "global_step": 291099, "epoch": 2405} {"train_loss": -41.50448226928711, "global_step": 291100, "epoch": 2405} {"train_loss": -42.84572219848633, "global_step": 291101, "epoch": 2405} {"train_loss": -42.810150146484375, "global_step": 291102, "epoch": 2405} {"train_loss": -42.27381134033203, "global_step": 291103, "epoch": 2405} {"train_loss": -42.82854080200195, "global_step": 291104, "epoch": 2405} {"train_loss": -42.4437255859375, "global_step": 291105, "epoch": 2405} {"train_loss": -43.334678649902344, "global_step": 291106, "epoch": 2405} {"train_loss": -44.039039611816406, "global_step": 291107, "epoch": 2405} {"train_loss": -43.6251335144043, "global_step": 291108, "epoch": 2405} {"train_loss": -43.27920150756836, "global_step": 291109, "epoch": 2405} {"train_loss": -44.03021240234375, "global_step": 291110, "epoch": 2405} {"train_loss": -43.482784271240234, "global_step": 291111, "epoch": 2405} {"train_loss": -43.7481575012207, "global_step": 291112, "epoch": 2405} {"train_loss": -43.25765609741211, "global_step": 291113, "epoch": 2405} {"train_loss": -43.775325775146484, "global_step": 291114, "epoch": 2405} {"train_loss": -43.2669563293457, "global_step": 291115, "epoch": 2405} {"train_loss": -43.68598175048828, "global_step": 291116, "epoch": 2405} {"train_loss": -43.50490188598633, "global_step": 291117, "epoch": 2405} {"train_loss": -43.32215118408203, "global_step": 291118, "epoch": 2405} {"train_loss": -43.263587951660156, "global_step": 291119, "epoch": 2405} {"train_loss": -43.37278366088867, "global_step": 291120, "epoch": 2405} {"train_loss": -43.47953414916992, "global_step": 291121, "epoch": 2405} {"train_loss": -43.933162689208984, "global_step": 291122, "epoch": 2405} {"train_loss": -43.70050048828125, "global_step": 291123, "epoch": 2405} {"train_loss": -43.33799362182617, "global_step": 291124, "epoch": 2405} {"train_loss": -43.621967441779525, "global_step": 291125, "epoch": 2405, "val_loss": 2478351.0} {"train_loss": -42.57161331176758, "global_step": 291126, "epoch": 2406} {"train_loss": -42.37041473388672, "global_step": 291127, "epoch": 2406} {"train_loss": -43.95246124267578, "global_step": 291128, "epoch": 2406} {"train_loss": -42.32809066772461, "global_step": 291129, "epoch": 2406} {"train_loss": -42.74998474121094, "global_step": 291130, "epoch": 2406} {"train_loss": -42.99013900756836, "global_step": 291131, "epoch": 2406} {"train_loss": -42.30410385131836, "global_step": 291132, "epoch": 2406} {"train_loss": -42.75718307495117, "global_step": 291133, "epoch": 2406} {"train_loss": -42.71209716796875, "global_step": 291134, "epoch": 2406} {"train_loss": -42.44919967651367, "global_step": 291135, "epoch": 2406} {"train_loss": -42.870025634765625, "global_step": 291136, "epoch": 2406} {"train_loss": -42.46159744262695, "global_step": 291137, "epoch": 2406} {"train_loss": -43.379634857177734, "global_step": 291138, "epoch": 2406} {"train_loss": -42.2987174987793, "global_step": 291139, "epoch": 2406} {"train_loss": -42.95682907104492, "global_step": 291140, "epoch": 2406} {"train_loss": -43.2176513671875, "global_step": 291141, "epoch": 2406} {"train_loss": -41.97140121459961, "global_step": 291142, "epoch": 2406} {"train_loss": -43.25879669189453, "global_step": 291143, "epoch": 2406} {"train_loss": -43.14128112792969, "global_step": 291144, "epoch": 2406} {"train_loss": -43.003700256347656, "global_step": 291145, "epoch": 2406} {"train_loss": -43.7027587890625, "global_step": 291146, "epoch": 2406} {"train_loss": -42.763153076171875, "global_step": 291147, "epoch": 2406} {"train_loss": -43.45296096801758, "global_step": 291148, "epoch": 2406} {"train_loss": -42.86385726928711, "global_step": 291149, "epoch": 2406} {"train_loss": -43.2580451965332, "global_step": 291150, "epoch": 2406} {"train_loss": -44.05562210083008, "global_step": 291151, "epoch": 2406} {"train_loss": -42.98088455200195, "global_step": 291152, "epoch": 2406} {"train_loss": -43.67121887207031, "global_step": 291153, "epoch": 2406} {"train_loss": -43.42011642456055, "global_step": 291154, "epoch": 2406} {"train_loss": -44.230342864990234, "global_step": 291155, "epoch": 2406} {"train_loss": -44.20705795288086, "global_step": 291156, "epoch": 2406} {"train_loss": -44.04237365722656, "global_step": 291157, "epoch": 2406} {"train_loss": -43.826515197753906, "global_step": 291158, "epoch": 2406} {"train_loss": -43.9273681640625, "global_step": 291159, "epoch": 2406} {"train_loss": -44.5656852722168, "global_step": 291160, "epoch": 2406} {"train_loss": -44.11222839355469, "global_step": 291161, "epoch": 2406} {"train_loss": -43.116390228271484, "global_step": 291162, "epoch": 2406} {"train_loss": -44.216346740722656, "global_step": 291163, "epoch": 2406} {"train_loss": -44.061336517333984, "global_step": 291164, "epoch": 2406} {"train_loss": -43.423397064208984, "global_step": 291165, "epoch": 2406} {"train_loss": -44.0339241027832, "global_step": 291166, "epoch": 2406} {"train_loss": -43.67082977294922, "global_step": 291167, "epoch": 2406} {"train_loss": -44.30747985839844, "global_step": 291168, "epoch": 2406} {"train_loss": -44.50286865234375, "global_step": 291169, "epoch": 2406} {"train_loss": -44.31501388549805, "global_step": 291170, "epoch": 2406} {"train_loss": -44.57196807861328, "global_step": 291171, "epoch": 2406} {"train_loss": -44.652488708496094, "global_step": 291172, "epoch": 2406} {"train_loss": -44.58480453491211, "global_step": 291173, "epoch": 2406} {"train_loss": -44.931148529052734, "global_step": 291174, "epoch": 2406} {"train_loss": -44.5040397644043, "global_step": 291175, "epoch": 2406} {"train_loss": -44.39703369140625, "global_step": 291176, "epoch": 2406} {"train_loss": -44.9410400390625, "global_step": 291177, "epoch": 2406} {"train_loss": -44.82223129272461, "global_step": 291178, "epoch": 2406} {"train_loss": -44.91999435424805, "global_step": 291179, "epoch": 2406} {"train_loss": -44.76476287841797, "global_step": 291180, "epoch": 2406} {"train_loss": -44.769805908203125, "global_step": 291181, "epoch": 2406} {"train_loss": -43.85116195678711, "global_step": 291182, "epoch": 2406} {"train_loss": -42.90327835083008, "global_step": 291183, "epoch": 2406} {"train_loss": -41.4112434387207, "global_step": 291184, "epoch": 2406} {"train_loss": -42.305747985839844, "global_step": 291185, "epoch": 2406} {"train_loss": -43.56487274169922, "global_step": 291186, "epoch": 2406} {"train_loss": -43.92413330078125, "global_step": 291187, "epoch": 2406} {"train_loss": -44.128517150878906, "global_step": 291188, "epoch": 2406} {"train_loss": -42.96232604980469, "global_step": 291189, "epoch": 2406} {"train_loss": -39.99247360229492, "global_step": 291190, "epoch": 2406} {"train_loss": -44.34846878051758, "global_step": 291191, "epoch": 2406} {"train_loss": -42.10372543334961, "global_step": 291192, "epoch": 2406} {"train_loss": -37.0451774597168, "global_step": 291193, "epoch": 2406} {"train_loss": -31.2313232421875, "global_step": 291194, "epoch": 2406} {"train_loss": -26.77667236328125, "global_step": 291195, "epoch": 2406} {"train_loss": -32.754634857177734, "global_step": 291196, "epoch": 2406} {"train_loss": -42.72341537475586, "global_step": 291197, "epoch": 2406} {"train_loss": -31.897363662719727, "global_step": 291198, "epoch": 2406} {"train_loss": -33.065547943115234, "global_step": 291199, "epoch": 2406} {"train_loss": -40.36477279663086, "global_step": 291200, "epoch": 2406} {"train_loss": -38.799964904785156, "global_step": 291201, "epoch": 2406} {"train_loss": -38.544464111328125, "global_step": 291202, "epoch": 2406} {"train_loss": -41.77907180786133, "global_step": 291203, "epoch": 2406} {"train_loss": -38.6353874206543, "global_step": 291204, "epoch": 2406} {"train_loss": -42.6354866027832, "global_step": 291205, "epoch": 2406} {"train_loss": -39.8952751159668, "global_step": 291206, "epoch": 2406} {"train_loss": -41.4042854309082, "global_step": 291207, "epoch": 2406} {"train_loss": -41.428016662597656, "global_step": 291208, "epoch": 2406} {"train_loss": -41.73310089111328, "global_step": 291209, "epoch": 2406} {"train_loss": -41.9250602722168, "global_step": 291210, "epoch": 2406} {"train_loss": -41.800933837890625, "global_step": 291211, "epoch": 2406} {"train_loss": -39.98503875732422, "global_step": 291212, "epoch": 2406} {"train_loss": -42.09464645385742, "global_step": 291213, "epoch": 2406} {"train_loss": -40.92789077758789, "global_step": 291214, "epoch": 2406} {"train_loss": -42.607173919677734, "global_step": 291215, "epoch": 2406} {"train_loss": -42.159423828125, "global_step": 291216, "epoch": 2406} {"train_loss": -42.135311126708984, "global_step": 291217, "epoch": 2406} {"train_loss": -42.09951400756836, "global_step": 291218, "epoch": 2406} {"train_loss": -42.76101303100586, "global_step": 291219, "epoch": 2406} {"train_loss": -43.21547317504883, "global_step": 291220, "epoch": 2406} {"train_loss": -43.20554733276367, "global_step": 291221, "epoch": 2406} {"train_loss": -42.53672409057617, "global_step": 291222, "epoch": 2406} {"train_loss": -42.34346389770508, "global_step": 291223, "epoch": 2406} {"train_loss": -42.712520599365234, "global_step": 291224, "epoch": 2406} {"train_loss": -43.10319137573242, "global_step": 291225, "epoch": 2406} {"train_loss": -43.58526611328125, "global_step": 291226, "epoch": 2406} {"train_loss": -42.81170654296875, "global_step": 291227, "epoch": 2406} {"train_loss": -43.588104248046875, "global_step": 291228, "epoch": 2406} {"train_loss": -43.70321273803711, "global_step": 291229, "epoch": 2406} {"train_loss": -43.12947463989258, "global_step": 291230, "epoch": 2406} {"train_loss": -43.537166595458984, "global_step": 291231, "epoch": 2406} {"train_loss": -43.219966888427734, "global_step": 291232, "epoch": 2406} {"train_loss": -43.71223068237305, "global_step": 291233, "epoch": 2406} {"train_loss": -43.02132034301758, "global_step": 291234, "epoch": 2406} {"train_loss": -43.46470642089844, "global_step": 291235, "epoch": 2406} {"train_loss": -44.0780029296875, "global_step": 291236, "epoch": 2406} {"train_loss": -43.412879943847656, "global_step": 291237, "epoch": 2406} {"train_loss": -43.875885009765625, "global_step": 291238, "epoch": 2406} {"train_loss": -43.85981369018555, "global_step": 291239, "epoch": 2406} {"train_loss": -43.58937072753906, "global_step": 291240, "epoch": 2406} {"train_loss": -43.89390182495117, "global_step": 291241, "epoch": 2406} {"train_loss": -43.69808578491211, "global_step": 291242, "epoch": 2406} {"train_loss": -43.83163070678711, "global_step": 291243, "epoch": 2406} {"train_loss": -44.221126556396484, "global_step": 291244, "epoch": 2406} {"train_loss": -43.78396224975586, "global_step": 291245, "epoch": 2406} {"train_loss": -42.534107823017216, "global_step": 291246, "epoch": 2406, "val_loss": 2444906.5} {"train_loss": -44.15717697143555, "global_step": 291247, "epoch": 2407} {"train_loss": -43.953147888183594, "global_step": 291248, "epoch": 2407} {"train_loss": -44.24471664428711, "global_step": 291249, "epoch": 2407} {"train_loss": -44.28260803222656, "global_step": 291250, "epoch": 2407} {"train_loss": -44.25543212890625, "global_step": 291251, "epoch": 2407} {"train_loss": -44.10691452026367, "global_step": 291252, "epoch": 2407} {"train_loss": -44.45134353637695, "global_step": 291253, "epoch": 2407} {"train_loss": -44.24562454223633, "global_step": 291254, "epoch": 2407} {"train_loss": -44.39863204956055, "global_step": 291255, "epoch": 2407} {"train_loss": -44.3836555480957, "global_step": 291256, "epoch": 2407} {"train_loss": -44.45845413208008, "global_step": 291257, "epoch": 2407} {"train_loss": -44.552581787109375, "global_step": 291258, "epoch": 2407} {"train_loss": -44.57566452026367, "global_step": 291259, "epoch": 2407} {"train_loss": -44.34150695800781, "global_step": 291260, "epoch": 2407} {"train_loss": -44.47867965698242, "global_step": 291261, "epoch": 2407} {"train_loss": -44.39472579956055, "global_step": 291262, "epoch": 2407} {"train_loss": -44.89539337158203, "global_step": 291263, "epoch": 2407} {"train_loss": -44.31171798706055, "global_step": 291264, "epoch": 2407} {"train_loss": -44.79779052734375, "global_step": 291265, "epoch": 2407} {"train_loss": -44.545387268066406, "global_step": 291266, "epoch": 2407} {"train_loss": -44.45372772216797, "global_step": 291267, "epoch": 2407} {"train_loss": -44.36430358886719, "global_step": 291268, "epoch": 2407} {"train_loss": -44.56727600097656, "global_step": 291269, "epoch": 2407} {"train_loss": -44.0363883972168, "global_step": 291270, "epoch": 2407} {"train_loss": -44.74509048461914, "global_step": 291271, "epoch": 2407} {"train_loss": -44.727630615234375, "global_step": 291272, "epoch": 2407} {"train_loss": -44.01618576049805, "global_step": 291273, "epoch": 2407} {"train_loss": -44.701751708984375, "global_step": 291274, "epoch": 2407} {"train_loss": -44.60738754272461, "global_step": 291275, "epoch": 2407} {"train_loss": -44.6413459777832, "global_step": 291276, "epoch": 2407} {"train_loss": -44.89847183227539, "global_step": 291277, "epoch": 2407} {"train_loss": -44.79793930053711, "global_step": 291278, "epoch": 2407} {"train_loss": -45.199886322021484, "global_step": 291279, "epoch": 2407} {"train_loss": -44.86259078979492, "global_step": 291280, "epoch": 2407} {"train_loss": -44.56214141845703, "global_step": 291281, "epoch": 2407} {"train_loss": -44.77029800415039, "global_step": 291282, "epoch": 2407} {"train_loss": -44.26723861694336, "global_step": 291283, "epoch": 2407} {"train_loss": -44.51316452026367, "global_step": 291284, "epoch": 2407} {"train_loss": -44.628089904785156, "global_step": 291285, "epoch": 2407} {"train_loss": -44.528289794921875, "global_step": 291286, "epoch": 2407} {"train_loss": -44.689208984375, "global_step": 291287, "epoch": 2407} {"train_loss": -44.4827995300293, "global_step": 291288, "epoch": 2407} {"train_loss": -44.56234359741211, "global_step": 291289, "epoch": 2407} {"train_loss": -44.9278564453125, "global_step": 291290, "epoch": 2407} {"train_loss": -44.54840850830078, "global_step": 291291, "epoch": 2407} {"train_loss": -44.39356231689453, "global_step": 291292, "epoch": 2407} {"train_loss": -43.61347198486328, "global_step": 291293, "epoch": 2407} {"train_loss": -41.96662902832031, "global_step": 291294, "epoch": 2407} {"train_loss": -43.219791412353516, "global_step": 291295, "epoch": 2407} {"train_loss": -43.625213623046875, "global_step": 291296, "epoch": 2407} {"train_loss": -44.86252975463867, "global_step": 291297, "epoch": 2407} {"train_loss": -43.3327751159668, "global_step": 291298, "epoch": 2407} {"train_loss": -41.49056625366211, "global_step": 291299, "epoch": 2407} {"train_loss": -43.106441497802734, "global_step": 291300, "epoch": 2407} {"train_loss": -42.32502365112305, "global_step": 291301, "epoch": 2407} {"train_loss": -41.92319869995117, "global_step": 291302, "epoch": 2407} {"train_loss": -42.2418212890625, "global_step": 291303, "epoch": 2407} {"train_loss": -41.78241729736328, "global_step": 291304, "epoch": 2407} {"train_loss": -41.323158264160156, "global_step": 291305, "epoch": 2407} {"train_loss": -43.75490951538086, "global_step": 291306, "epoch": 2407} {"train_loss": -40.919795989990234, "global_step": 291307, "epoch": 2407} {"train_loss": -41.4815788269043, "global_step": 291308, "epoch": 2407} {"train_loss": -43.849761962890625, "global_step": 291309, "epoch": 2407} {"train_loss": -41.42937088012695, "global_step": 291310, "epoch": 2407} {"train_loss": -42.95005798339844, "global_step": 291311, "epoch": 2407} {"train_loss": -41.93375778198242, "global_step": 291312, "epoch": 2407} {"train_loss": -42.87767028808594, "global_step": 291313, "epoch": 2407} {"train_loss": -42.619075775146484, "global_step": 291314, "epoch": 2407} {"train_loss": -41.008846282958984, "global_step": 291315, "epoch": 2407} {"train_loss": -43.48134994506836, "global_step": 291316, "epoch": 2407} {"train_loss": -42.8185920715332, "global_step": 291317, "epoch": 2407} {"train_loss": -42.54659652709961, "global_step": 291318, "epoch": 2407} {"train_loss": -42.51543426513672, "global_step": 291319, "epoch": 2407} {"train_loss": -43.315914154052734, "global_step": 291320, "epoch": 2407} {"train_loss": -41.85496139526367, "global_step": 291321, "epoch": 2407} {"train_loss": -42.12508773803711, "global_step": 291322, "epoch": 2407} {"train_loss": -43.102108001708984, "global_step": 291323, "epoch": 2407} {"train_loss": -43.10921096801758, "global_step": 291324, "epoch": 2407} {"train_loss": -42.467674255371094, "global_step": 291325, "epoch": 2407} {"train_loss": -43.69385528564453, "global_step": 291326, "epoch": 2407} {"train_loss": -43.08435821533203, "global_step": 291327, "epoch": 2407} {"train_loss": -42.8126220703125, "global_step": 291328, "epoch": 2407} {"train_loss": -43.394100189208984, "global_step": 291329, "epoch": 2407} {"train_loss": -43.00031661987305, "global_step": 291330, "epoch": 2407} {"train_loss": -43.2092170715332, "global_step": 291331, "epoch": 2407} {"train_loss": -43.2316780090332, "global_step": 291332, "epoch": 2407} {"train_loss": -42.70310592651367, "global_step": 291333, "epoch": 2407} {"train_loss": -43.1799430847168, "global_step": 291334, "epoch": 2407} {"train_loss": -43.4908332824707, "global_step": 291335, "epoch": 2407} {"train_loss": -43.72024917602539, "global_step": 291336, "epoch": 2407} {"train_loss": -44.014217376708984, "global_step": 291337, "epoch": 2407} {"train_loss": -43.430450439453125, "global_step": 291338, "epoch": 2407} {"train_loss": -43.27996826171875, "global_step": 291339, "epoch": 2407} {"train_loss": -43.15568923950195, "global_step": 291340, "epoch": 2407} {"train_loss": -44.50497055053711, "global_step": 291341, "epoch": 2407} {"train_loss": -43.1953010559082, "global_step": 291342, "epoch": 2407} {"train_loss": -43.96735763549805, "global_step": 291343, "epoch": 2407} {"train_loss": -43.6772575378418, "global_step": 291344, "epoch": 2407} {"train_loss": -43.882328033447266, "global_step": 291345, "epoch": 2407} {"train_loss": -42.98270797729492, "global_step": 291346, "epoch": 2407} {"train_loss": -43.85020065307617, "global_step": 291347, "epoch": 2407} {"train_loss": -43.8832893371582, "global_step": 291348, "epoch": 2407} {"train_loss": -43.91905975341797, "global_step": 291349, "epoch": 2407} {"train_loss": -44.24540328979492, "global_step": 291350, "epoch": 2407} {"train_loss": -43.803688049316406, "global_step": 291351, "epoch": 2407} {"train_loss": -44.01821517944336, "global_step": 291352, "epoch": 2407} {"train_loss": -44.011531829833984, "global_step": 291353, "epoch": 2407} {"train_loss": -44.12217330932617, "global_step": 291354, "epoch": 2407} {"train_loss": -43.97100830078125, "global_step": 291355, "epoch": 2407} {"train_loss": -43.9648323059082, "global_step": 291356, "epoch": 2407} {"train_loss": -44.17444610595703, "global_step": 291357, "epoch": 2407} {"train_loss": -43.770851135253906, "global_step": 291358, "epoch": 2407} {"train_loss": -44.12946701049805, "global_step": 291359, "epoch": 2407} {"train_loss": -44.39760208129883, "global_step": 291360, "epoch": 2407} {"train_loss": -44.415122985839844, "global_step": 291361, "epoch": 2407} {"train_loss": -43.624916076660156, "global_step": 291362, "epoch": 2407} {"train_loss": -44.15966033935547, "global_step": 291363, "epoch": 2407} {"train_loss": -42.78105545043945, "global_step": 291364, "epoch": 2407} {"train_loss": -43.185394287109375, "global_step": 291365, "epoch": 2407} {"train_loss": -43.48141098022461, "global_step": 291366, "epoch": 2407} {"train_loss": -43.679348118049056, "global_step": 291367, "epoch": 2407, "val_loss": 2471850.0} {"train_loss": -43.323116302490234, "global_step": 291368, "epoch": 2408} {"train_loss": -43.96088409423828, "global_step": 291369, "epoch": 2408} {"train_loss": -42.38567352294922, "global_step": 291370, "epoch": 2408} {"train_loss": -44.07113265991211, "global_step": 291371, "epoch": 2408} {"train_loss": -42.17727279663086, "global_step": 291372, "epoch": 2408} {"train_loss": -43.52315902709961, "global_step": 291373, "epoch": 2408} {"train_loss": -42.94916915893555, "global_step": 291374, "epoch": 2408} {"train_loss": -43.223270416259766, "global_step": 291375, "epoch": 2408} {"train_loss": -43.14565658569336, "global_step": 291376, "epoch": 2408} {"train_loss": -41.2103385925293, "global_step": 291377, "epoch": 2408} {"train_loss": -42.30182647705078, "global_step": 291378, "epoch": 2408} {"train_loss": -42.92245864868164, "global_step": 291379, "epoch": 2408} {"train_loss": -42.93903350830078, "global_step": 291380, "epoch": 2408} {"train_loss": -43.375370025634766, "global_step": 291381, "epoch": 2408} {"train_loss": -42.39374923706055, "global_step": 291382, "epoch": 2408} {"train_loss": -42.68438720703125, "global_step": 291383, "epoch": 2408} {"train_loss": -43.429744720458984, "global_step": 291384, "epoch": 2408} {"train_loss": -43.02045440673828, "global_step": 291385, "epoch": 2408} {"train_loss": -43.343379974365234, "global_step": 291386, "epoch": 2408} {"train_loss": -43.126319885253906, "global_step": 291387, "epoch": 2408} {"train_loss": -43.48504638671875, "global_step": 291388, "epoch": 2408} {"train_loss": -42.33857345581055, "global_step": 291389, "epoch": 2408} {"train_loss": -41.8643798828125, "global_step": 291390, "epoch": 2408} {"train_loss": -43.855804443359375, "global_step": 291391, "epoch": 2408} {"train_loss": -43.14090347290039, "global_step": 291392, "epoch": 2408} {"train_loss": -42.904232025146484, "global_step": 291393, "epoch": 2408} {"train_loss": -43.539207458496094, "global_step": 291394, "epoch": 2408} {"train_loss": -43.1611213684082, "global_step": 291395, "epoch": 2408} {"train_loss": -42.050933837890625, "global_step": 291396, "epoch": 2408} {"train_loss": -43.140621185302734, "global_step": 291397, "epoch": 2408} {"train_loss": -43.092105865478516, "global_step": 291398, "epoch": 2408} {"train_loss": -43.01361083984375, "global_step": 291399, "epoch": 2408} {"train_loss": -43.26896667480469, "global_step": 291400, "epoch": 2408} {"train_loss": -43.650184631347656, "global_step": 291401, "epoch": 2408} {"train_loss": -44.057586669921875, "global_step": 291402, "epoch": 2408} {"train_loss": -42.55984115600586, "global_step": 291403, "epoch": 2408} {"train_loss": -43.20168685913086, "global_step": 291404, "epoch": 2408} {"train_loss": -43.00313186645508, "global_step": 291405, "epoch": 2408} {"train_loss": -43.03062438964844, "global_step": 291406, "epoch": 2408} {"train_loss": -44.27091979980469, "global_step": 291407, "epoch": 2408} {"train_loss": -43.54631042480469, "global_step": 291408, "epoch": 2408} {"train_loss": -44.43528366088867, "global_step": 291409, "epoch": 2408} {"train_loss": -43.96977615356445, "global_step": 291410, "epoch": 2408} {"train_loss": -43.749324798583984, "global_step": 291411, "epoch": 2408} {"train_loss": -44.187801361083984, "global_step": 291412, "epoch": 2408} {"train_loss": -43.0460090637207, "global_step": 291413, "epoch": 2408} {"train_loss": -43.53884506225586, "global_step": 291414, "epoch": 2408} {"train_loss": -44.472991943359375, "global_step": 291415, "epoch": 2408} {"train_loss": -43.523250579833984, "global_step": 291416, "epoch": 2408} {"train_loss": -43.73323440551758, "global_step": 291417, "epoch": 2408} {"train_loss": -43.67912673950195, "global_step": 291418, "epoch": 2408} {"train_loss": -44.27288818359375, "global_step": 291419, "epoch": 2408} {"train_loss": -43.938236236572266, "global_step": 291420, "epoch": 2408} {"train_loss": -43.696346282958984, "global_step": 291421, "epoch": 2408} {"train_loss": -44.2166633605957, "global_step": 291422, "epoch": 2408} {"train_loss": -44.402191162109375, "global_step": 291423, "epoch": 2408} {"train_loss": -44.408077239990234, "global_step": 291424, "epoch": 2408} {"train_loss": -44.218910217285156, "global_step": 291425, "epoch": 2408} {"train_loss": -44.35189437866211, "global_step": 291426, "epoch": 2408} {"train_loss": -43.851295471191406, "global_step": 291427, "epoch": 2408} {"train_loss": -44.23722457885742, "global_step": 291428, "epoch": 2408} {"train_loss": -44.281341552734375, "global_step": 291429, "epoch": 2408} {"train_loss": -44.80027389526367, "global_step": 291430, "epoch": 2408} {"train_loss": -44.31086349487305, "global_step": 291431, "epoch": 2408} {"train_loss": -44.85980987548828, "global_step": 291432, "epoch": 2408} {"train_loss": -44.40925216674805, "global_step": 291433, "epoch": 2408} {"train_loss": -44.108314514160156, "global_step": 291434, "epoch": 2408} {"train_loss": -44.091121673583984, "global_step": 291435, "epoch": 2408} {"train_loss": -44.08558654785156, "global_step": 291436, "epoch": 2408} {"train_loss": -44.29827117919922, "global_step": 291437, "epoch": 2408} {"train_loss": -44.93177032470703, "global_step": 291438, "epoch": 2408} {"train_loss": -44.279457092285156, "global_step": 291439, "epoch": 2408} {"train_loss": -44.309844970703125, "global_step": 291440, "epoch": 2408} {"train_loss": -44.328182220458984, "global_step": 291441, "epoch": 2408} {"train_loss": -44.59295654296875, "global_step": 291442, "epoch": 2408} {"train_loss": -44.459259033203125, "global_step": 291443, "epoch": 2408} {"train_loss": -44.84054946899414, "global_step": 291444, "epoch": 2408} {"train_loss": -44.242889404296875, "global_step": 291445, "epoch": 2408} {"train_loss": -44.01179504394531, "global_step": 291446, "epoch": 2408} {"train_loss": -43.622039794921875, "global_step": 291447, "epoch": 2408} {"train_loss": -41.44148254394531, "global_step": 291448, "epoch": 2408} {"train_loss": -42.54969787597656, "global_step": 291449, "epoch": 2408} {"train_loss": -43.49195098876953, "global_step": 291450, "epoch": 2408} {"train_loss": -42.88142013549805, "global_step": 291451, "epoch": 2408} {"train_loss": -41.228790283203125, "global_step": 291452, "epoch": 2408} {"train_loss": -40.997745513916016, "global_step": 291453, "epoch": 2408} {"train_loss": -44.07752227783203, "global_step": 291454, "epoch": 2408} {"train_loss": -39.62847900390625, "global_step": 291455, "epoch": 2408} {"train_loss": -43.137813568115234, "global_step": 291456, "epoch": 2408} {"train_loss": -37.2640380859375, "global_step": 291457, "epoch": 2408} {"train_loss": -38.90641403198242, "global_step": 291458, "epoch": 2408} {"train_loss": -41.29952621459961, "global_step": 291459, "epoch": 2408} {"train_loss": -41.348018646240234, "global_step": 291460, "epoch": 2408} {"train_loss": -41.421607971191406, "global_step": 291461, "epoch": 2408} {"train_loss": -42.4045295715332, "global_step": 291462, "epoch": 2408} {"train_loss": -42.116912841796875, "global_step": 291463, "epoch": 2408} {"train_loss": -42.42555236816406, "global_step": 291464, "epoch": 2408} {"train_loss": -41.33685302734375, "global_step": 291465, "epoch": 2408} {"train_loss": -41.950077056884766, "global_step": 291466, "epoch": 2408} {"train_loss": -42.6275749206543, "global_step": 291467, "epoch": 2408} {"train_loss": -41.158477783203125, "global_step": 291468, "epoch": 2408} {"train_loss": -42.642364501953125, "global_step": 291469, "epoch": 2408} {"train_loss": -42.739253997802734, "global_step": 291470, "epoch": 2408} {"train_loss": -40.42179489135742, "global_step": 291471, "epoch": 2408} {"train_loss": -43.261470794677734, "global_step": 291472, "epoch": 2408} {"train_loss": -40.4445686340332, "global_step": 291473, "epoch": 2408} {"train_loss": -40.76958084106445, "global_step": 291474, "epoch": 2408} {"train_loss": -42.63423538208008, "global_step": 291475, "epoch": 2408} {"train_loss": -41.03640365600586, "global_step": 291476, "epoch": 2408} {"train_loss": -43.01803207397461, "global_step": 291477, "epoch": 2408} {"train_loss": -40.65534210205078, "global_step": 291478, "epoch": 2408} {"train_loss": -40.526588439941406, "global_step": 291479, "epoch": 2408} {"train_loss": -41.61201858520508, "global_step": 291480, "epoch": 2408} {"train_loss": -40.37723922729492, "global_step": 291481, "epoch": 2408} {"train_loss": -41.573143005371094, "global_step": 291482, "epoch": 2408} {"train_loss": -40.60490798950195, "global_step": 291483, "epoch": 2408} {"train_loss": -40.715187072753906, "global_step": 291484, "epoch": 2408} {"train_loss": -41.52470016479492, "global_step": 291485, "epoch": 2408} {"train_loss": -42.058284759521484, "global_step": 291486, "epoch": 2408} {"train_loss": -42.15911102294922, "global_step": 291487, "epoch": 2408} {"train_loss": -42.90584387661012, "global_step": 291488, "epoch": 2408, "val_loss": 2534337.75} {"train_loss": -42.84687042236328, "global_step": 291489, "epoch": 2409} {"train_loss": -42.45595932006836, "global_step": 291490, "epoch": 2409} {"train_loss": -42.320858001708984, "global_step": 291491, "epoch": 2409} {"train_loss": -39.1615104675293, "global_step": 291492, "epoch": 2409} {"train_loss": -42.559322357177734, "global_step": 291493, "epoch": 2409} {"train_loss": -25.50750160217285, "global_step": 291494, "epoch": 2409} {"train_loss": -40.53817367553711, "global_step": 291495, "epoch": 2409} {"train_loss": -38.94724655151367, "global_step": 291496, "epoch": 2409} {"train_loss": -41.58354568481445, "global_step": 291497, "epoch": 2409} {"train_loss": -42.42501449584961, "global_step": 291498, "epoch": 2409} {"train_loss": -42.26579666137695, "global_step": 291499, "epoch": 2409} {"train_loss": -42.02815628051758, "global_step": 291500, "epoch": 2409} {"train_loss": -42.0462760925293, "global_step": 291501, "epoch": 2409} {"train_loss": -40.90807342529297, "global_step": 291502, "epoch": 2409} {"train_loss": -42.47793197631836, "global_step": 291503, "epoch": 2409} {"train_loss": -42.38922882080078, "global_step": 291504, "epoch": 2409} {"train_loss": -42.37229919433594, "global_step": 291505, "epoch": 2409} {"train_loss": -42.65366744995117, "global_step": 291506, "epoch": 2409} {"train_loss": -42.133087158203125, "global_step": 291507, "epoch": 2409} {"train_loss": -41.987125396728516, "global_step": 291508, "epoch": 2409} {"train_loss": -42.83074951171875, "global_step": 291509, "epoch": 2409} {"train_loss": -39.37660598754883, "global_step": 291510, "epoch": 2409} {"train_loss": -41.45672607421875, "global_step": 291511, "epoch": 2409} {"train_loss": -42.99850845336914, "global_step": 291512, "epoch": 2409} {"train_loss": -42.80453109741211, "global_step": 291513, "epoch": 2409} {"train_loss": -40.90264129638672, "global_step": 291514, "epoch": 2409} {"train_loss": -42.27362823486328, "global_step": 291515, "epoch": 2409} {"train_loss": -42.293243408203125, "global_step": 291516, "epoch": 2409} {"train_loss": -42.83368682861328, "global_step": 291517, "epoch": 2409} {"train_loss": -40.18874740600586, "global_step": 291518, "epoch": 2409} {"train_loss": -42.95726013183594, "global_step": 291519, "epoch": 2409} {"train_loss": -42.931270599365234, "global_step": 291520, "epoch": 2409} {"train_loss": -42.92208480834961, "global_step": 291521, "epoch": 2409} {"train_loss": -43.22547149658203, "global_step": 291522, "epoch": 2409} {"train_loss": -41.31342697143555, "global_step": 291523, "epoch": 2409} {"train_loss": -41.2896614074707, "global_step": 291524, "epoch": 2409} {"train_loss": -43.23698043823242, "global_step": 291525, "epoch": 2409} {"train_loss": -42.2650146484375, "global_step": 291526, "epoch": 2409} {"train_loss": -42.83193588256836, "global_step": 291527, "epoch": 2409} {"train_loss": -43.34092330932617, "global_step": 291528, "epoch": 2409} {"train_loss": -42.505001068115234, "global_step": 291529, "epoch": 2409} {"train_loss": -43.44332504272461, "global_step": 291530, "epoch": 2409} {"train_loss": -42.769012451171875, "global_step": 291531, "epoch": 2409} {"train_loss": -41.66607666015625, "global_step": 291532, "epoch": 2409} {"train_loss": -43.5474967956543, "global_step": 291533, "epoch": 2409} {"train_loss": -42.771087646484375, "global_step": 291534, "epoch": 2409} {"train_loss": -42.608943939208984, "global_step": 291535, "epoch": 2409} {"train_loss": -42.03109359741211, "global_step": 291536, "epoch": 2409} {"train_loss": -43.155120849609375, "global_step": 291537, "epoch": 2409} {"train_loss": -41.400936126708984, "global_step": 291538, "epoch": 2409} {"train_loss": -43.367488861083984, "global_step": 291539, "epoch": 2409} {"train_loss": -43.05241012573242, "global_step": 291540, "epoch": 2409} {"train_loss": -43.78317642211914, "global_step": 291541, "epoch": 2409} {"train_loss": -42.22276306152344, "global_step": 291542, "epoch": 2409} {"train_loss": -40.640380859375, "global_step": 291543, "epoch": 2409} {"train_loss": -41.53022384643555, "global_step": 291544, "epoch": 2409} {"train_loss": -44.26658248901367, "global_step": 291545, "epoch": 2409} {"train_loss": -43.3253173828125, "global_step": 291546, "epoch": 2409} {"train_loss": -42.99788284301758, "global_step": 291547, "epoch": 2409} {"train_loss": -43.90055465698242, "global_step": 291548, "epoch": 2409} {"train_loss": -43.26061248779297, "global_step": 291549, "epoch": 2409} {"train_loss": -42.91837692260742, "global_step": 291550, "epoch": 2409} {"train_loss": -43.72616195678711, "global_step": 291551, "epoch": 2409} {"train_loss": -43.32286071777344, "global_step": 291552, "epoch": 2409} {"train_loss": -40.38682174682617, "global_step": 291553, "epoch": 2409} {"train_loss": -44.05229568481445, "global_step": 291554, "epoch": 2409} {"train_loss": -43.31653594970703, "global_step": 291555, "epoch": 2409} {"train_loss": -43.25989532470703, "global_step": 291556, "epoch": 2409} {"train_loss": -40.90546417236328, "global_step": 291557, "epoch": 2409} {"train_loss": -42.13680648803711, "global_step": 291558, "epoch": 2409} {"train_loss": -42.220237731933594, "global_step": 291559, "epoch": 2409} {"train_loss": -43.7594108581543, "global_step": 291560, "epoch": 2409} {"train_loss": -43.55577850341797, "global_step": 291561, "epoch": 2409} {"train_loss": -42.63026428222656, "global_step": 291562, "epoch": 2409} {"train_loss": -42.467769622802734, "global_step": 291563, "epoch": 2409} {"train_loss": -43.4338264465332, "global_step": 291564, "epoch": 2409} {"train_loss": -43.90279006958008, "global_step": 291565, "epoch": 2409} {"train_loss": -43.488853454589844, "global_step": 291566, "epoch": 2409} {"train_loss": -43.070674896240234, "global_step": 291567, "epoch": 2409} {"train_loss": -42.416175842285156, "global_step": 291568, "epoch": 2409} {"train_loss": -42.1110954284668, "global_step": 291569, "epoch": 2409} {"train_loss": -43.7533073425293, "global_step": 291570, "epoch": 2409} {"train_loss": -40.006900787353516, "global_step": 291571, "epoch": 2409} {"train_loss": -24.03948211669922, "global_step": 291572, "epoch": 2409} {"train_loss": -44.15214920043945, "global_step": 291573, "epoch": 2409} {"train_loss": -41.21480941772461, "global_step": 291574, "epoch": 2409} {"train_loss": -40.74488830566406, "global_step": 291575, "epoch": 2409} {"train_loss": -42.89994430541992, "global_step": 291576, "epoch": 2409} {"train_loss": -20.968244552612305, "global_step": 291577, "epoch": 2409} {"train_loss": -39.88080978393555, "global_step": 291578, "epoch": 2409} {"train_loss": -41.566932678222656, "global_step": 291579, "epoch": 2409} {"train_loss": -38.328182220458984, "global_step": 291580, "epoch": 2409} {"train_loss": -41.66327667236328, "global_step": 291581, "epoch": 2409} {"train_loss": -39.8420524597168, "global_step": 291582, "epoch": 2409} {"train_loss": -39.77267074584961, "global_step": 291583, "epoch": 2409} {"train_loss": -39.868743896484375, "global_step": 291584, "epoch": 2409} {"train_loss": -26.90887451171875, "global_step": 291585, "epoch": 2409} {"train_loss": -42.69034957885742, "global_step": 291586, "epoch": 2409} {"train_loss": -43.182594299316406, "global_step": 291587, "epoch": 2409} {"train_loss": -42.02976608276367, "global_step": 291588, "epoch": 2409} {"train_loss": -42.14058303833008, "global_step": 291589, "epoch": 2409} {"train_loss": -41.2843132019043, "global_step": 291590, "epoch": 2409} {"train_loss": -41.465736389160156, "global_step": 291591, "epoch": 2409} {"train_loss": -40.456573486328125, "global_step": 291592, "epoch": 2409} {"train_loss": -41.55611801147461, "global_step": 291593, "epoch": 2409} {"train_loss": -41.660091400146484, "global_step": 291594, "epoch": 2409} {"train_loss": -42.36259460449219, "global_step": 291595, "epoch": 2409} {"train_loss": -42.06075668334961, "global_step": 291596, "epoch": 2409} {"train_loss": -41.25486373901367, "global_step": 291597, "epoch": 2409} {"train_loss": -42.865577697753906, "global_step": 291598, "epoch": 2409} {"train_loss": -42.7556266784668, "global_step": 291599, "epoch": 2409} {"train_loss": -42.16351318359375, "global_step": 291600, "epoch": 2409} {"train_loss": -40.79248809814453, "global_step": 291601, "epoch": 2409} {"train_loss": -42.403133392333984, "global_step": 291602, "epoch": 2409} {"train_loss": -42.6845817565918, "global_step": 291603, "epoch": 2409} {"train_loss": -43.00112533569336, "global_step": 291604, "epoch": 2409} {"train_loss": -42.823421478271484, "global_step": 291605, "epoch": 2409} {"train_loss": -43.136043548583984, "global_step": 291606, "epoch": 2409} {"train_loss": -42.22180938720703, "global_step": 291607, "epoch": 2409} {"train_loss": -43.126426696777344, "global_step": 291608, "epoch": 2409} {"train_loss": -41.61272417809352, "global_step": 291609, "epoch": 2409, "val_loss": 2515136.0} {"train_loss": -43.065433502197266, "global_step": 291610, "epoch": 2410} {"train_loss": -43.33113479614258, "global_step": 291611, "epoch": 2410} {"train_loss": -43.075584411621094, "global_step": 291612, "epoch": 2410} {"train_loss": -42.82696533203125, "global_step": 291613, "epoch": 2410} {"train_loss": -43.10341262817383, "global_step": 291614, "epoch": 2410} {"train_loss": -43.544952392578125, "global_step": 291615, "epoch": 2410} {"train_loss": -43.662925720214844, "global_step": 291616, "epoch": 2410} {"train_loss": -43.629737854003906, "global_step": 291617, "epoch": 2410} {"train_loss": -43.318214416503906, "global_step": 291618, "epoch": 2410} {"train_loss": -43.247920989990234, "global_step": 291619, "epoch": 2410} {"train_loss": -43.29800033569336, "global_step": 291620, "epoch": 2410} {"train_loss": -43.43535232543945, "global_step": 291621, "epoch": 2410} {"train_loss": -43.36220932006836, "global_step": 291622, "epoch": 2410} {"train_loss": -43.24225997924805, "global_step": 291623, "epoch": 2410} {"train_loss": -43.210594177246094, "global_step": 291624, "epoch": 2410} {"train_loss": -44.01215744018555, "global_step": 291625, "epoch": 2410} {"train_loss": -43.91496658325195, "global_step": 291626, "epoch": 2410} {"train_loss": -43.88330841064453, "global_step": 291627, "epoch": 2410} {"train_loss": -44.01306915283203, "global_step": 291628, "epoch": 2410} {"train_loss": -43.82636260986328, "global_step": 291629, "epoch": 2410} {"train_loss": -43.73469924926758, "global_step": 291630, "epoch": 2410} {"train_loss": -43.549720764160156, "global_step": 291631, "epoch": 2410} {"train_loss": -44.00887680053711, "global_step": 291632, "epoch": 2410} {"train_loss": -43.686309814453125, "global_step": 291633, "epoch": 2410} {"train_loss": -43.64787673950195, "global_step": 291634, "epoch": 2410} {"train_loss": -43.59177017211914, "global_step": 291635, "epoch": 2410} {"train_loss": -44.49808883666992, "global_step": 291636, "epoch": 2410} {"train_loss": -44.17694091796875, "global_step": 291637, "epoch": 2410} {"train_loss": -43.827613830566406, "global_step": 291638, "epoch": 2410} {"train_loss": -44.4576530456543, "global_step": 291639, "epoch": 2410} {"train_loss": -44.01229476928711, "global_step": 291640, "epoch": 2410} {"train_loss": -43.4047966003418, "global_step": 291641, "epoch": 2410} {"train_loss": -43.960235595703125, "global_step": 291642, "epoch": 2410} {"train_loss": -44.38594436645508, "global_step": 291643, "epoch": 2410} {"train_loss": -43.786006927490234, "global_step": 291644, "epoch": 2410} {"train_loss": -43.22833251953125, "global_step": 291645, "epoch": 2410} {"train_loss": -43.4736328125, "global_step": 291646, "epoch": 2410} {"train_loss": -44.264984130859375, "global_step": 291647, "epoch": 2410} {"train_loss": -42.23353576660156, "global_step": 291648, "epoch": 2410} {"train_loss": -41.988990783691406, "global_step": 291649, "epoch": 2410} {"train_loss": -43.47895431518555, "global_step": 291650, "epoch": 2410} {"train_loss": -43.17932891845703, "global_step": 291651, "epoch": 2410} {"train_loss": -41.39590835571289, "global_step": 291652, "epoch": 2410} {"train_loss": -42.865108489990234, "global_step": 291653, "epoch": 2410} {"train_loss": -43.5513801574707, "global_step": 291654, "epoch": 2410} {"train_loss": -42.58498001098633, "global_step": 291655, "epoch": 2410} {"train_loss": -41.95847702026367, "global_step": 291656, "epoch": 2410} {"train_loss": -43.21555709838867, "global_step": 291657, "epoch": 2410} {"train_loss": -41.39120864868164, "global_step": 291658, "epoch": 2410} {"train_loss": -38.794673919677734, "global_step": 291659, "epoch": 2410} {"train_loss": -42.88466262817383, "global_step": 291660, "epoch": 2410} {"train_loss": -41.14714431762695, "global_step": 291661, "epoch": 2410} {"train_loss": -42.24174880981445, "global_step": 291662, "epoch": 2410} {"train_loss": -41.65478515625, "global_step": 291663, "epoch": 2410} {"train_loss": -40.94019317626953, "global_step": 291664, "epoch": 2410} {"train_loss": -42.18047332763672, "global_step": 291665, "epoch": 2410} {"train_loss": -41.941646575927734, "global_step": 291666, "epoch": 2410} {"train_loss": -41.21149826049805, "global_step": 291667, "epoch": 2410} {"train_loss": -41.4875602722168, "global_step": 291668, "epoch": 2410} {"train_loss": -40.552276611328125, "global_step": 291669, "epoch": 2410} {"train_loss": -40.2340202331543, "global_step": 291670, "epoch": 2410} {"train_loss": -41.5204963684082, "global_step": 291671, "epoch": 2410} {"train_loss": -41.95512771606445, "global_step": 291672, "epoch": 2410} {"train_loss": -41.20803451538086, "global_step": 291673, "epoch": 2410} {"train_loss": -41.3475227355957, "global_step": 291674, "epoch": 2410} {"train_loss": -41.00895309448242, "global_step": 291675, "epoch": 2410} {"train_loss": -40.72274398803711, "global_step": 291676, "epoch": 2410} {"train_loss": -41.48603820800781, "global_step": 291677, "epoch": 2410} {"train_loss": -40.8640022277832, "global_step": 291678, "epoch": 2410} {"train_loss": -42.69623947143555, "global_step": 291679, "epoch": 2410} {"train_loss": -40.64325714111328, "global_step": 291680, "epoch": 2410} {"train_loss": -43.00116729736328, "global_step": 291681, "epoch": 2410} {"train_loss": -40.237857818603516, "global_step": 291682, "epoch": 2410} {"train_loss": -41.828697204589844, "global_step": 291683, "epoch": 2410} {"train_loss": -39.93495178222656, "global_step": 291684, "epoch": 2410} {"train_loss": -40.48604965209961, "global_step": 291685, "epoch": 2410} {"train_loss": -41.256263732910156, "global_step": 291686, "epoch": 2410} {"train_loss": -41.371944427490234, "global_step": 291687, "epoch": 2410} {"train_loss": -42.60355758666992, "global_step": 291688, "epoch": 2410} {"train_loss": -42.67127990722656, "global_step": 291689, "epoch": 2410} {"train_loss": -42.70020294189453, "global_step": 291690, "epoch": 2410} {"train_loss": -42.40639114379883, "global_step": 291691, "epoch": 2410} {"train_loss": -42.22072982788086, "global_step": 291692, "epoch": 2410} {"train_loss": -42.213382720947266, "global_step": 291693, "epoch": 2410} {"train_loss": -42.44473648071289, "global_step": 291694, "epoch": 2410} {"train_loss": -42.63064956665039, "global_step": 291695, "epoch": 2410} {"train_loss": -42.34823226928711, "global_step": 291696, "epoch": 2410} {"train_loss": -43.151771545410156, "global_step": 291697, "epoch": 2410} {"train_loss": -42.60768508911133, "global_step": 291698, "epoch": 2410} {"train_loss": -41.81862258911133, "global_step": 291699, "epoch": 2410} {"train_loss": -42.4072380065918, "global_step": 291700, "epoch": 2410} {"train_loss": -42.6249885559082, "global_step": 291701, "epoch": 2410} {"train_loss": -41.99949264526367, "global_step": 291702, "epoch": 2410} {"train_loss": -41.818092346191406, "global_step": 291703, "epoch": 2410} {"train_loss": -42.50889587402344, "global_step": 291704, "epoch": 2410} {"train_loss": -42.82203674316406, "global_step": 291705, "epoch": 2410} {"train_loss": -42.02537155151367, "global_step": 291706, "epoch": 2410} {"train_loss": -42.118343353271484, "global_step": 291707, "epoch": 2410} {"train_loss": -42.57851791381836, "global_step": 291708, "epoch": 2410} {"train_loss": -42.6524543762207, "global_step": 291709, "epoch": 2410} {"train_loss": -42.105567932128906, "global_step": 291710, "epoch": 2410} {"train_loss": -42.64698028564453, "global_step": 291711, "epoch": 2410} {"train_loss": -42.70138931274414, "global_step": 291712, "epoch": 2410} {"train_loss": -43.320594787597656, "global_step": 291713, "epoch": 2410} {"train_loss": -42.889495849609375, "global_step": 291714, "epoch": 2410} {"train_loss": -42.98796081542969, "global_step": 291715, "epoch": 2410} {"train_loss": -43.64887237548828, "global_step": 291716, "epoch": 2410} {"train_loss": -42.27192306518555, "global_step": 291717, "epoch": 2410} {"train_loss": -42.759727478027344, "global_step": 291718, "epoch": 2410} {"train_loss": -43.199684143066406, "global_step": 291719, "epoch": 2410} {"train_loss": -42.923919677734375, "global_step": 291720, "epoch": 2410} {"train_loss": -42.80904769897461, "global_step": 291721, "epoch": 2410} {"train_loss": -43.66605758666992, "global_step": 291722, "epoch": 2410} {"train_loss": -43.71743392944336, "global_step": 291723, "epoch": 2410} {"train_loss": -43.68488311767578, "global_step": 291724, "epoch": 2410} {"train_loss": -42.97188949584961, "global_step": 291725, "epoch": 2410} {"train_loss": -43.194602966308594, "global_step": 291726, "epoch": 2410} {"train_loss": -43.387901306152344, "global_step": 291727, "epoch": 2410} {"train_loss": -42.847835540771484, "global_step": 291728, "epoch": 2410} {"train_loss": -42.89216995239258, "global_step": 291729, "epoch": 2410} {"train_loss": -42.646300512897085, "global_step": 291730, "epoch": 2410, "val_loss": 2517203.25} {"train_loss": -43.76789093017578, "global_step": 291731, "epoch": 2411} {"train_loss": -43.171058654785156, "global_step": 291732, "epoch": 2411} {"train_loss": -42.53007507324219, "global_step": 291733, "epoch": 2411} {"train_loss": -42.38442611694336, "global_step": 291734, "epoch": 2411} {"train_loss": -44.167236328125, "global_step": 291735, "epoch": 2411} {"train_loss": -43.25286865234375, "global_step": 291736, "epoch": 2411} {"train_loss": -43.85028076171875, "global_step": 291737, "epoch": 2411} {"train_loss": -43.32465744018555, "global_step": 291738, "epoch": 2411} {"train_loss": -43.87288284301758, "global_step": 291739, "epoch": 2411} {"train_loss": -44.19370651245117, "global_step": 291740, "epoch": 2411} {"train_loss": -43.36112976074219, "global_step": 291741, "epoch": 2411} {"train_loss": -43.252140045166016, "global_step": 291742, "epoch": 2411} {"train_loss": -44.097023010253906, "global_step": 291743, "epoch": 2411} {"train_loss": -44.33210754394531, "global_step": 291744, "epoch": 2411} {"train_loss": -43.88774108886719, "global_step": 291745, "epoch": 2411} {"train_loss": -43.753273010253906, "global_step": 291746, "epoch": 2411} {"train_loss": -44.0081787109375, "global_step": 291747, "epoch": 2411} {"train_loss": -43.412174224853516, "global_step": 291748, "epoch": 2411} {"train_loss": -42.783626556396484, "global_step": 291749, "epoch": 2411} {"train_loss": -44.19052505493164, "global_step": 291750, "epoch": 2411} {"train_loss": -44.25004196166992, "global_step": 291751, "epoch": 2411} {"train_loss": -42.98323440551758, "global_step": 291752, "epoch": 2411} {"train_loss": -44.36738204956055, "global_step": 291753, "epoch": 2411} {"train_loss": -43.8239631652832, "global_step": 291754, "epoch": 2411} {"train_loss": -43.2410888671875, "global_step": 291755, "epoch": 2411} {"train_loss": -42.47469711303711, "global_step": 291756, "epoch": 2411} {"train_loss": -42.951419830322266, "global_step": 291757, "epoch": 2411} {"train_loss": -43.82170104980469, "global_step": 291758, "epoch": 2411} {"train_loss": -42.7894401550293, "global_step": 291759, "epoch": 2411} {"train_loss": -43.36389923095703, "global_step": 291760, "epoch": 2411} {"train_loss": -44.12004089355469, "global_step": 291761, "epoch": 2411} {"train_loss": -44.207027435302734, "global_step": 291762, "epoch": 2411} {"train_loss": -43.86428451538086, "global_step": 291763, "epoch": 2411} {"train_loss": -43.02315902709961, "global_step": 291764, "epoch": 2411} {"train_loss": -43.052303314208984, "global_step": 291765, "epoch": 2411} {"train_loss": -43.61350631713867, "global_step": 291766, "epoch": 2411} {"train_loss": -44.147308349609375, "global_step": 291767, "epoch": 2411} {"train_loss": -43.939300537109375, "global_step": 291768, "epoch": 2411} {"train_loss": -43.86304473876953, "global_step": 291769, "epoch": 2411} {"train_loss": -43.531856536865234, "global_step": 291770, "epoch": 2411} {"train_loss": -43.594764709472656, "global_step": 291771, "epoch": 2411} {"train_loss": -42.565006256103516, "global_step": 291772, "epoch": 2411} {"train_loss": -42.68972396850586, "global_step": 291773, "epoch": 2411} {"train_loss": -42.7000846862793, "global_step": 291774, "epoch": 2411} {"train_loss": -43.36058807373047, "global_step": 291775, "epoch": 2411} {"train_loss": -42.91802978515625, "global_step": 291776, "epoch": 2411} {"train_loss": -42.50486373901367, "global_step": 291777, "epoch": 2411} {"train_loss": -42.43151092529297, "global_step": 291778, "epoch": 2411} {"train_loss": -43.4765510559082, "global_step": 291779, "epoch": 2411} {"train_loss": -43.74759292602539, "global_step": 291780, "epoch": 2411} {"train_loss": -44.20554733276367, "global_step": 291781, "epoch": 2411} {"train_loss": -42.02677917480469, "global_step": 291782, "epoch": 2411} {"train_loss": -42.04977035522461, "global_step": 291783, "epoch": 2411} {"train_loss": -43.70161437988281, "global_step": 291784, "epoch": 2411} {"train_loss": -42.104915618896484, "global_step": 291785, "epoch": 2411} {"train_loss": -42.706085205078125, "global_step": 291786, "epoch": 2411} {"train_loss": -43.41748809814453, "global_step": 291787, "epoch": 2411} {"train_loss": -42.73373031616211, "global_step": 291788, "epoch": 2411} {"train_loss": -42.891944885253906, "global_step": 291789, "epoch": 2411} {"train_loss": -42.42491149902344, "global_step": 291790, "epoch": 2411} {"train_loss": -42.64018630981445, "global_step": 291791, "epoch": 2411} {"train_loss": -44.04761505126953, "global_step": 291792, "epoch": 2411} {"train_loss": -42.995304107666016, "global_step": 291793, "epoch": 2411} {"train_loss": -41.68326950073242, "global_step": 291794, "epoch": 2411} {"train_loss": -42.92013168334961, "global_step": 291795, "epoch": 2411} {"train_loss": -43.95024871826172, "global_step": 291796, "epoch": 2411} {"train_loss": -43.031288146972656, "global_step": 291797, "epoch": 2411} {"train_loss": -41.980674743652344, "global_step": 291798, "epoch": 2411} {"train_loss": -43.1763801574707, "global_step": 291799, "epoch": 2411} {"train_loss": -43.794612884521484, "global_step": 291800, "epoch": 2411} {"train_loss": -42.21723175048828, "global_step": 291801, "epoch": 2411} {"train_loss": -42.49283981323242, "global_step": 291802, "epoch": 2411} {"train_loss": -44.068695068359375, "global_step": 291803, "epoch": 2411} {"train_loss": -42.17826461791992, "global_step": 291804, "epoch": 2411} {"train_loss": -41.40285110473633, "global_step": 291805, "epoch": 2411} {"train_loss": -43.9527473449707, "global_step": 291806, "epoch": 2411} {"train_loss": -42.93062973022461, "global_step": 291807, "epoch": 2411} {"train_loss": -41.7057991027832, "global_step": 291808, "epoch": 2411} {"train_loss": -44.1248779296875, "global_step": 291809, "epoch": 2411} {"train_loss": -43.13395309448242, "global_step": 291810, "epoch": 2411} {"train_loss": -43.08719253540039, "global_step": 291811, "epoch": 2411} {"train_loss": -43.30149841308594, "global_step": 291812, "epoch": 2411} {"train_loss": -41.853851318359375, "global_step": 291813, "epoch": 2411} {"train_loss": -43.62888717651367, "global_step": 291814, "epoch": 2411} {"train_loss": -40.800743103027344, "global_step": 291815, "epoch": 2411} {"train_loss": -42.92159652709961, "global_step": 291816, "epoch": 2411} {"train_loss": -42.64655685424805, "global_step": 291817, "epoch": 2411} {"train_loss": -39.50552749633789, "global_step": 291818, "epoch": 2411} {"train_loss": -43.47343826293945, "global_step": 291819, "epoch": 2411} {"train_loss": -42.427425384521484, "global_step": 291820, "epoch": 2411} {"train_loss": -40.95571517944336, "global_step": 291821, "epoch": 2411} {"train_loss": -43.03461456298828, "global_step": 291822, "epoch": 2411} {"train_loss": -42.78510665893555, "global_step": 291823, "epoch": 2411} {"train_loss": -41.87168502807617, "global_step": 291824, "epoch": 2411} {"train_loss": -43.59796142578125, "global_step": 291825, "epoch": 2411} {"train_loss": -43.29366683959961, "global_step": 291826, "epoch": 2411} {"train_loss": -42.42659378051758, "global_step": 291827, "epoch": 2411} {"train_loss": -43.364315032958984, "global_step": 291828, "epoch": 2411} {"train_loss": -43.547576904296875, "global_step": 291829, "epoch": 2411} {"train_loss": -43.22438430786133, "global_step": 291830, "epoch": 2411} {"train_loss": -43.11758804321289, "global_step": 291831, "epoch": 2411} {"train_loss": -43.672977447509766, "global_step": 291832, "epoch": 2411} {"train_loss": -43.29087448120117, "global_step": 291833, "epoch": 2411} {"train_loss": -42.499664306640625, "global_step": 291834, "epoch": 2411} {"train_loss": -43.350791931152344, "global_step": 291835, "epoch": 2411} {"train_loss": -43.45792770385742, "global_step": 291836, "epoch": 2411} {"train_loss": -43.21533203125, "global_step": 291837, "epoch": 2411} {"train_loss": -43.744510650634766, "global_step": 291838, "epoch": 2411} {"train_loss": -43.69586181640625, "global_step": 291839, "epoch": 2411} {"train_loss": -42.9240608215332, "global_step": 291840, "epoch": 2411} {"train_loss": -43.761619567871094, "global_step": 291841, "epoch": 2411} {"train_loss": -43.387569427490234, "global_step": 291842, "epoch": 2411} {"train_loss": -43.997100830078125, "global_step": 291843, "epoch": 2411} {"train_loss": -43.487979888916016, "global_step": 291844, "epoch": 2411} {"train_loss": -44.2818489074707, "global_step": 291845, "epoch": 2411} {"train_loss": -43.444881439208984, "global_step": 291846, "epoch": 2411} {"train_loss": -43.404598236083984, "global_step": 291847, "epoch": 2411} {"train_loss": -43.09025573730469, "global_step": 291848, "epoch": 2411} {"train_loss": -44.17763137817383, "global_step": 291849, "epoch": 2411} {"train_loss": -43.4843635559082, "global_step": 291850, "epoch": 2411} {"train_loss": -43.176051210766, "global_step": 291851, "epoch": 2411, "val_loss": 2414463.75} {"train_loss": -43.86800003051758, "global_step": 291852, "epoch": 2412} {"train_loss": -44.246612548828125, "global_step": 291853, "epoch": 2412} {"train_loss": -43.949623107910156, "global_step": 291854, "epoch": 2412} {"train_loss": -43.56060791015625, "global_step": 291855, "epoch": 2412} {"train_loss": -44.06355285644531, "global_step": 291856, "epoch": 2412} {"train_loss": -44.27177810668945, "global_step": 291857, "epoch": 2412} {"train_loss": -44.04373550415039, "global_step": 291858, "epoch": 2412} {"train_loss": -42.81858825683594, "global_step": 291859, "epoch": 2412} {"train_loss": -43.28190231323242, "global_step": 291860, "epoch": 2412} {"train_loss": -43.916988372802734, "global_step": 291861, "epoch": 2412} {"train_loss": -42.22758865356445, "global_step": 291862, "epoch": 2412} {"train_loss": -42.576759338378906, "global_step": 291863, "epoch": 2412} {"train_loss": -43.99638748168945, "global_step": 291864, "epoch": 2412} {"train_loss": -43.99228286743164, "global_step": 291865, "epoch": 2412} {"train_loss": -44.23049545288086, "global_step": 291866, "epoch": 2412} {"train_loss": -43.87360763549805, "global_step": 291867, "epoch": 2412} {"train_loss": -43.84536361694336, "global_step": 291868, "epoch": 2412} {"train_loss": -44.46156311035156, "global_step": 291869, "epoch": 2412} {"train_loss": -44.60467529296875, "global_step": 291870, "epoch": 2412} {"train_loss": -43.02877426147461, "global_step": 291871, "epoch": 2412} {"train_loss": -41.5691032409668, "global_step": 291872, "epoch": 2412} {"train_loss": -41.06474685668945, "global_step": 291873, "epoch": 2412} {"train_loss": -42.80130386352539, "global_step": 291874, "epoch": 2412} {"train_loss": -43.80994415283203, "global_step": 291875, "epoch": 2412} {"train_loss": -42.95927047729492, "global_step": 291876, "epoch": 2412} {"train_loss": -42.43701171875, "global_step": 291877, "epoch": 2412} {"train_loss": -43.94973373413086, "global_step": 291878, "epoch": 2412} {"train_loss": -44.384220123291016, "global_step": 291879, "epoch": 2412} {"train_loss": -43.48563766479492, "global_step": 291880, "epoch": 2412} {"train_loss": -43.33137512207031, "global_step": 291881, "epoch": 2412} {"train_loss": -44.176673889160156, "global_step": 291882, "epoch": 2412} {"train_loss": -43.83015823364258, "global_step": 291883, "epoch": 2412} {"train_loss": -43.87955856323242, "global_step": 291884, "epoch": 2412} {"train_loss": -43.74214172363281, "global_step": 291885, "epoch": 2412} {"train_loss": -43.49129867553711, "global_step": 291886, "epoch": 2412} {"train_loss": -44.244903564453125, "global_step": 291887, "epoch": 2412} {"train_loss": -43.89156723022461, "global_step": 291888, "epoch": 2412} {"train_loss": -44.09773635864258, "global_step": 291889, "epoch": 2412} {"train_loss": -43.51089096069336, "global_step": 291890, "epoch": 2412} {"train_loss": -44.24703598022461, "global_step": 291891, "epoch": 2412} {"train_loss": -43.96944046020508, "global_step": 291892, "epoch": 2412} {"train_loss": -43.02125930786133, "global_step": 291893, "epoch": 2412} {"train_loss": -44.0446662902832, "global_step": 291894, "epoch": 2412} {"train_loss": -44.257301330566406, "global_step": 291895, "epoch": 2412} {"train_loss": -43.87827682495117, "global_step": 291896, "epoch": 2412} {"train_loss": -44.230770111083984, "global_step": 291897, "epoch": 2412} {"train_loss": -44.33347702026367, "global_step": 291898, "epoch": 2412} {"train_loss": -44.26917266845703, "global_step": 291899, "epoch": 2412} {"train_loss": -44.22917175292969, "global_step": 291900, "epoch": 2412} {"train_loss": -44.226322174072266, "global_step": 291901, "epoch": 2412} {"train_loss": -43.8018798828125, "global_step": 291902, "epoch": 2412} {"train_loss": -43.63704299926758, "global_step": 291903, "epoch": 2412} {"train_loss": -43.89863204956055, "global_step": 291904, "epoch": 2412} {"train_loss": -44.63410186767578, "global_step": 291905, "epoch": 2412} {"train_loss": -43.680843353271484, "global_step": 291906, "epoch": 2412} {"train_loss": -43.22774124145508, "global_step": 291907, "epoch": 2412} {"train_loss": -44.16495895385742, "global_step": 291908, "epoch": 2412} {"train_loss": -43.989681243896484, "global_step": 291909, "epoch": 2412} {"train_loss": -43.4354133605957, "global_step": 291910, "epoch": 2412} {"train_loss": -43.716304779052734, "global_step": 291911, "epoch": 2412} {"train_loss": -44.2296028137207, "global_step": 291912, "epoch": 2412} {"train_loss": -43.50139617919922, "global_step": 291913, "epoch": 2412} {"train_loss": -43.96971893310547, "global_step": 291914, "epoch": 2412} {"train_loss": -43.89544677734375, "global_step": 291915, "epoch": 2412} {"train_loss": -44.36009216308594, "global_step": 291916, "epoch": 2412} {"train_loss": -44.63822937011719, "global_step": 291917, "epoch": 2412} {"train_loss": -44.255516052246094, "global_step": 291918, "epoch": 2412} {"train_loss": -43.079559326171875, "global_step": 291919, "epoch": 2412} {"train_loss": -43.44155502319336, "global_step": 291920, "epoch": 2412} {"train_loss": -43.76678466796875, "global_step": 291921, "epoch": 2412} {"train_loss": -42.01148223876953, "global_step": 291922, "epoch": 2412} {"train_loss": -42.4573974609375, "global_step": 291923, "epoch": 2412} {"train_loss": -44.44011306762695, "global_step": 291924, "epoch": 2412} {"train_loss": -44.08774948120117, "global_step": 291925, "epoch": 2412} {"train_loss": -43.5912971496582, "global_step": 291926, "epoch": 2412} {"train_loss": -44.105682373046875, "global_step": 291927, "epoch": 2412} {"train_loss": -44.36162185668945, "global_step": 291928, "epoch": 2412} {"train_loss": -42.85398864746094, "global_step": 291929, "epoch": 2412} {"train_loss": -43.57731246948242, "global_step": 291930, "epoch": 2412} {"train_loss": -44.71684265136719, "global_step": 291931, "epoch": 2412} {"train_loss": -42.77798080444336, "global_step": 291932, "epoch": 2412} {"train_loss": -42.46372985839844, "global_step": 291933, "epoch": 2412} {"train_loss": -44.92718505859375, "global_step": 291934, "epoch": 2412} {"train_loss": -43.20749282836914, "global_step": 291935, "epoch": 2412} {"train_loss": -43.17369079589844, "global_step": 291936, "epoch": 2412} {"train_loss": -43.79608154296875, "global_step": 291937, "epoch": 2412} {"train_loss": -43.4512825012207, "global_step": 291938, "epoch": 2412} {"train_loss": -42.68885040283203, "global_step": 291939, "epoch": 2412} {"train_loss": -44.00019454956055, "global_step": 291940, "epoch": 2412} {"train_loss": -44.21946334838867, "global_step": 291941, "epoch": 2412} {"train_loss": -43.14801025390625, "global_step": 291942, "epoch": 2412} {"train_loss": -43.892059326171875, "global_step": 291943, "epoch": 2412} {"train_loss": -43.00177764892578, "global_step": 291944, "epoch": 2412} {"train_loss": -43.44300842285156, "global_step": 291945, "epoch": 2412} {"train_loss": -43.005130767822266, "global_step": 291946, "epoch": 2412} {"train_loss": -42.641021728515625, "global_step": 291947, "epoch": 2412} {"train_loss": -44.109127044677734, "global_step": 291948, "epoch": 2412} {"train_loss": -44.22170639038086, "global_step": 291949, "epoch": 2412} {"train_loss": -43.57417297363281, "global_step": 291950, "epoch": 2412} {"train_loss": -44.356380462646484, "global_step": 291951, "epoch": 2412} {"train_loss": -43.06380844116211, "global_step": 291952, "epoch": 2412} {"train_loss": -44.06083297729492, "global_step": 291953, "epoch": 2412} {"train_loss": -44.09022521972656, "global_step": 291954, "epoch": 2412} {"train_loss": -43.45146179199219, "global_step": 291955, "epoch": 2412} {"train_loss": -44.223140716552734, "global_step": 291956, "epoch": 2412} {"train_loss": -43.62899398803711, "global_step": 291957, "epoch": 2412} {"train_loss": -43.8996696472168, "global_step": 291958, "epoch": 2412} {"train_loss": -43.382415771484375, "global_step": 291959, "epoch": 2412} {"train_loss": -43.25458526611328, "global_step": 291960, "epoch": 2412} {"train_loss": -44.1087646484375, "global_step": 291961, "epoch": 2412} {"train_loss": -43.412086486816406, "global_step": 291962, "epoch": 2412} {"train_loss": -43.7361946105957, "global_step": 291963, "epoch": 2412} {"train_loss": -42.869075775146484, "global_step": 291964, "epoch": 2412} {"train_loss": -42.76498031616211, "global_step": 291965, "epoch": 2412} {"train_loss": -43.60205078125, "global_step": 291966, "epoch": 2412} {"train_loss": -43.57968521118164, "global_step": 291967, "epoch": 2412} {"train_loss": -41.96622848510742, "global_step": 291968, "epoch": 2412} {"train_loss": -41.11518478393555, "global_step": 291969, "epoch": 2412} {"train_loss": -42.56288528442383, "global_step": 291970, "epoch": 2412} {"train_loss": -43.17173385620117, "global_step": 291971, "epoch": 2412} {"train_loss": -43.60462201331273, "global_step": 291972, "epoch": 2412, "val_loss": 2420326.25} {"train_loss": -41.82038497924805, "global_step": 291973, "epoch": 2413} {"train_loss": -42.905643463134766, "global_step": 291974, "epoch": 2413} {"train_loss": -43.502376556396484, "global_step": 291975, "epoch": 2413} {"train_loss": -43.48883056640625, "global_step": 291976, "epoch": 2413} {"train_loss": -43.73988342285156, "global_step": 291977, "epoch": 2413} {"train_loss": -43.05513000488281, "global_step": 291978, "epoch": 2413} {"train_loss": -43.561920166015625, "global_step": 291979, "epoch": 2413} {"train_loss": -42.98174285888672, "global_step": 291980, "epoch": 2413} {"train_loss": -43.526397705078125, "global_step": 291981, "epoch": 2413} {"train_loss": -43.83763122558594, "global_step": 291982, "epoch": 2413} {"train_loss": -42.780494689941406, "global_step": 291983, "epoch": 2413} {"train_loss": -41.49892807006836, "global_step": 291984, "epoch": 2413} {"train_loss": -43.40372848510742, "global_step": 291985, "epoch": 2413} {"train_loss": -43.52498245239258, "global_step": 291986, "epoch": 2413} {"train_loss": -43.31526565551758, "global_step": 291987, "epoch": 2413} {"train_loss": -43.20600128173828, "global_step": 291988, "epoch": 2413} {"train_loss": -43.35175704956055, "global_step": 291989, "epoch": 2413} {"train_loss": -44.09017562866211, "global_step": 291990, "epoch": 2413} {"train_loss": -41.701602935791016, "global_step": 291991, "epoch": 2413} {"train_loss": -41.78957748413086, "global_step": 291992, "epoch": 2413} {"train_loss": -43.456905364990234, "global_step": 291993, "epoch": 2413} {"train_loss": -41.25416946411133, "global_step": 291994, "epoch": 2413} {"train_loss": -43.17940139770508, "global_step": 291995, "epoch": 2413} {"train_loss": -43.35087203979492, "global_step": 291996, "epoch": 2413} {"train_loss": -42.657657623291016, "global_step": 291997, "epoch": 2413} {"train_loss": -43.15448760986328, "global_step": 291998, "epoch": 2413} {"train_loss": -43.78313064575195, "global_step": 291999, "epoch": 2413} {"train_loss": -43.2976188659668, "global_step": 292000, "epoch": 2413} {"train_loss": -42.713775634765625, "global_step": 292001, "epoch": 2413} {"train_loss": -42.83812713623047, "global_step": 292002, "epoch": 2413} {"train_loss": -43.74842071533203, "global_step": 292003, "epoch": 2413} {"train_loss": -43.151859283447266, "global_step": 292004, "epoch": 2413} {"train_loss": -43.0450439453125, "global_step": 292005, "epoch": 2413} {"train_loss": -43.88844680786133, "global_step": 292006, "epoch": 2413} {"train_loss": -43.51875686645508, "global_step": 292007, "epoch": 2413} {"train_loss": -43.52047348022461, "global_step": 292008, "epoch": 2413} {"train_loss": -43.37250900268555, "global_step": 292009, "epoch": 2413} {"train_loss": -43.6283073425293, "global_step": 292010, "epoch": 2413} {"train_loss": -43.6431884765625, "global_step": 292011, "epoch": 2413} {"train_loss": -42.91533279418945, "global_step": 292012, "epoch": 2413} {"train_loss": -41.4164924621582, "global_step": 292013, "epoch": 2413} {"train_loss": -43.45261001586914, "global_step": 292014, "epoch": 2413} {"train_loss": -42.729190826416016, "global_step": 292015, "epoch": 2413} {"train_loss": -42.6277961730957, "global_step": 292016, "epoch": 2413} {"train_loss": -44.202022552490234, "global_step": 292017, "epoch": 2413} {"train_loss": -44.026424407958984, "global_step": 292018, "epoch": 2413} {"train_loss": -43.89825439453125, "global_step": 292019, "epoch": 2413} {"train_loss": -43.7375602722168, "global_step": 292020, "epoch": 2413} {"train_loss": -43.80432891845703, "global_step": 292021, "epoch": 2413} {"train_loss": -44.13850402832031, "global_step": 292022, "epoch": 2413} {"train_loss": -43.245140075683594, "global_step": 292023, "epoch": 2413} {"train_loss": -42.75398635864258, "global_step": 292024, "epoch": 2413} {"train_loss": -44.004905700683594, "global_step": 292025, "epoch": 2413} {"train_loss": -43.65159225463867, "global_step": 292026, "epoch": 2413} {"train_loss": -43.976539611816406, "global_step": 292027, "epoch": 2413} {"train_loss": -43.295875549316406, "global_step": 292028, "epoch": 2413} {"train_loss": -42.61177444458008, "global_step": 292029, "epoch": 2413} {"train_loss": -41.847618103027344, "global_step": 292030, "epoch": 2413} {"train_loss": -41.694698333740234, "global_step": 292031, "epoch": 2413} {"train_loss": -44.02424621582031, "global_step": 292032, "epoch": 2413} {"train_loss": -42.070533752441406, "global_step": 292033, "epoch": 2413} {"train_loss": -41.26353073120117, "global_step": 292034, "epoch": 2413} {"train_loss": -42.22060012817383, "global_step": 292035, "epoch": 2413} {"train_loss": -43.613582611083984, "global_step": 292036, "epoch": 2413} {"train_loss": -41.39194869995117, "global_step": 292037, "epoch": 2413} {"train_loss": -42.1419563293457, "global_step": 292038, "epoch": 2413} {"train_loss": -41.36948776245117, "global_step": 292039, "epoch": 2413} {"train_loss": -42.465511322021484, "global_step": 292040, "epoch": 2413} {"train_loss": -40.45199203491211, "global_step": 292041, "epoch": 2413} {"train_loss": -42.28874588012695, "global_step": 292042, "epoch": 2413} {"train_loss": -39.6448860168457, "global_step": 292043, "epoch": 2413} {"train_loss": -41.71671676635742, "global_step": 292044, "epoch": 2413} {"train_loss": -36.77108383178711, "global_step": 292045, "epoch": 2413} {"train_loss": -41.95528030395508, "global_step": 292046, "epoch": 2413} {"train_loss": -36.53389358520508, "global_step": 292047, "epoch": 2413} {"train_loss": -34.012054443359375, "global_step": 292048, "epoch": 2413} {"train_loss": -37.68345642089844, "global_step": 292049, "epoch": 2413} {"train_loss": -41.17428207397461, "global_step": 292050, "epoch": 2413} {"train_loss": -38.33449935913086, "global_step": 292051, "epoch": 2413} {"train_loss": -41.82680892944336, "global_step": 292052, "epoch": 2413} {"train_loss": -40.4550666809082, "global_step": 292053, "epoch": 2413} {"train_loss": -40.924373626708984, "global_step": 292054, "epoch": 2413} {"train_loss": -41.12331008911133, "global_step": 292055, "epoch": 2413} {"train_loss": -41.645084381103516, "global_step": 292056, "epoch": 2413} {"train_loss": -40.532928466796875, "global_step": 292057, "epoch": 2413} {"train_loss": -42.27384567260742, "global_step": 292058, "epoch": 2413} {"train_loss": -41.42748260498047, "global_step": 292059, "epoch": 2413} {"train_loss": -42.10565185546875, "global_step": 292060, "epoch": 2413} {"train_loss": -41.23584747314453, "global_step": 292061, "epoch": 2413} {"train_loss": -42.22034454345703, "global_step": 292062, "epoch": 2413} {"train_loss": -41.35712814331055, "global_step": 292063, "epoch": 2413} {"train_loss": -42.82741928100586, "global_step": 292064, "epoch": 2413} {"train_loss": -41.64511489868164, "global_step": 292065, "epoch": 2413} {"train_loss": -42.304595947265625, "global_step": 292066, "epoch": 2413} {"train_loss": -42.13681411743164, "global_step": 292067, "epoch": 2413} {"train_loss": -41.54006576538086, "global_step": 292068, "epoch": 2413} {"train_loss": -42.87086868286133, "global_step": 292069, "epoch": 2413} {"train_loss": -42.508480072021484, "global_step": 292070, "epoch": 2413} {"train_loss": -43.185546875, "global_step": 292071, "epoch": 2413} {"train_loss": -42.98356246948242, "global_step": 292072, "epoch": 2413} {"train_loss": -43.197837829589844, "global_step": 292073, "epoch": 2413} {"train_loss": -42.822853088378906, "global_step": 292074, "epoch": 2413} {"train_loss": -42.99445343017578, "global_step": 292075, "epoch": 2413} {"train_loss": -42.6231803894043, "global_step": 292076, "epoch": 2413} {"train_loss": -43.45117950439453, "global_step": 292077, "epoch": 2413} {"train_loss": -42.53168869018555, "global_step": 292078, "epoch": 2413} {"train_loss": -43.220314025878906, "global_step": 292079, "epoch": 2413} {"train_loss": -42.85974884033203, "global_step": 292080, "epoch": 2413} {"train_loss": -42.6689567565918, "global_step": 292081, "epoch": 2413} {"train_loss": -43.10447311401367, "global_step": 292082, "epoch": 2413} {"train_loss": -43.18453598022461, "global_step": 292083, "epoch": 2413} {"train_loss": -42.96977996826172, "global_step": 292084, "epoch": 2413} {"train_loss": -43.4632682800293, "global_step": 292085, "epoch": 2413} {"train_loss": -42.8615608215332, "global_step": 292086, "epoch": 2413} {"train_loss": -40.39424133300781, "global_step": 292087, "epoch": 2413} {"train_loss": -43.452720642089844, "global_step": 292088, "epoch": 2413} {"train_loss": -43.64632034301758, "global_step": 292089, "epoch": 2413} {"train_loss": -43.287269592285156, "global_step": 292090, "epoch": 2413} {"train_loss": -42.7695198059082, "global_step": 292091, "epoch": 2413} {"train_loss": -43.8357048034668, "global_step": 292092, "epoch": 2413} {"train_loss": -42.475776136414076, "global_step": 292093, "epoch": 2413, "val_loss": 2603199.25} {"train_loss": -40.54507827758789, "global_step": 292094, "epoch": 2414} {"train_loss": -43.46277618408203, "global_step": 292095, "epoch": 2414} {"train_loss": -43.23539733886719, "global_step": 292096, "epoch": 2414} {"train_loss": -44.2421989440918, "global_step": 292097, "epoch": 2414} {"train_loss": -42.99369430541992, "global_step": 292098, "epoch": 2414} {"train_loss": -43.481746673583984, "global_step": 292099, "epoch": 2414} {"train_loss": -43.70045852661133, "global_step": 292100, "epoch": 2414} {"train_loss": -43.23737335205078, "global_step": 292101, "epoch": 2414} {"train_loss": -43.7755012512207, "global_step": 292102, "epoch": 2414} {"train_loss": -43.3090705871582, "global_step": 292103, "epoch": 2414} {"train_loss": -44.030067443847656, "global_step": 292104, "epoch": 2414} {"train_loss": -40.8378791809082, "global_step": 292105, "epoch": 2414} {"train_loss": -43.851985931396484, "global_step": 292106, "epoch": 2414} {"train_loss": -40.1585578918457, "global_step": 292107, "epoch": 2414} {"train_loss": -44.411251068115234, "global_step": 292108, "epoch": 2414} {"train_loss": -43.71089553833008, "global_step": 292109, "epoch": 2414} {"train_loss": -40.75533676147461, "global_step": 292110, "epoch": 2414} {"train_loss": -41.32861328125, "global_step": 292111, "epoch": 2414} {"train_loss": -42.63908004760742, "global_step": 292112, "epoch": 2414} {"train_loss": -42.963069915771484, "global_step": 292113, "epoch": 2414} {"train_loss": -42.913414001464844, "global_step": 292114, "epoch": 2414} {"train_loss": -42.7297477722168, "global_step": 292115, "epoch": 2414} {"train_loss": -43.45256805419922, "global_step": 292116, "epoch": 2414} {"train_loss": -43.34711456298828, "global_step": 292117, "epoch": 2414} {"train_loss": -42.5916862487793, "global_step": 292118, "epoch": 2414} {"train_loss": -43.57276916503906, "global_step": 292119, "epoch": 2414} {"train_loss": -42.71296310424805, "global_step": 292120, "epoch": 2414} {"train_loss": -43.22768020629883, "global_step": 292121, "epoch": 2414} {"train_loss": -43.76676559448242, "global_step": 292122, "epoch": 2414} {"train_loss": -44.12437438964844, "global_step": 292123, "epoch": 2414} {"train_loss": -43.339900970458984, "global_step": 292124, "epoch": 2414} {"train_loss": -43.132415771484375, "global_step": 292125, "epoch": 2414} {"train_loss": -41.670066833496094, "global_step": 292126, "epoch": 2414} {"train_loss": -44.031829833984375, "global_step": 292127, "epoch": 2414} {"train_loss": -43.46706771850586, "global_step": 292128, "epoch": 2414} {"train_loss": -43.491268157958984, "global_step": 292129, "epoch": 2414} {"train_loss": -44.1453971862793, "global_step": 292130, "epoch": 2414} {"train_loss": -44.20607376098633, "global_step": 292131, "epoch": 2414} {"train_loss": -43.92732238769531, "global_step": 292132, "epoch": 2414} {"train_loss": -44.0640869140625, "global_step": 292133, "epoch": 2414} {"train_loss": -44.17877197265625, "global_step": 292134, "epoch": 2414} {"train_loss": -43.756263732910156, "global_step": 292135, "epoch": 2414} {"train_loss": -44.12383270263672, "global_step": 292136, "epoch": 2414} {"train_loss": -43.81793212890625, "global_step": 292137, "epoch": 2414} {"train_loss": -43.9444694519043, "global_step": 292138, "epoch": 2414} {"train_loss": -44.390384674072266, "global_step": 292139, "epoch": 2414} {"train_loss": -44.216224670410156, "global_step": 292140, "epoch": 2414} {"train_loss": -43.915584564208984, "global_step": 292141, "epoch": 2414} {"train_loss": -44.545284271240234, "global_step": 292142, "epoch": 2414} {"train_loss": -44.010772705078125, "global_step": 292143, "epoch": 2414} {"train_loss": -43.83014678955078, "global_step": 292144, "epoch": 2414} {"train_loss": -43.90171813964844, "global_step": 292145, "epoch": 2414} {"train_loss": -44.53427505493164, "global_step": 292146, "epoch": 2414} {"train_loss": -44.1881217956543, "global_step": 292147, "epoch": 2414} {"train_loss": -44.045711517333984, "global_step": 292148, "epoch": 2414} {"train_loss": -43.82631301879883, "global_step": 292149, "epoch": 2414} {"train_loss": -43.92436218261719, "global_step": 292150, "epoch": 2414} {"train_loss": -44.61198806762695, "global_step": 292151, "epoch": 2414} {"train_loss": -44.075653076171875, "global_step": 292152, "epoch": 2414} {"train_loss": -44.3299446105957, "global_step": 292153, "epoch": 2414} {"train_loss": -44.4805908203125, "global_step": 292154, "epoch": 2414} {"train_loss": -44.319278717041016, "global_step": 292155, "epoch": 2414} {"train_loss": -44.389461517333984, "global_step": 292156, "epoch": 2414} {"train_loss": -44.349945068359375, "global_step": 292157, "epoch": 2414} {"train_loss": -43.56821823120117, "global_step": 292158, "epoch": 2414} {"train_loss": -44.427467346191406, "global_step": 292159, "epoch": 2414} {"train_loss": -43.48251724243164, "global_step": 292160, "epoch": 2414} {"train_loss": -43.97697448730469, "global_step": 292161, "epoch": 2414} {"train_loss": -44.81687545776367, "global_step": 292162, "epoch": 2414} {"train_loss": -44.347442626953125, "global_step": 292163, "epoch": 2414} {"train_loss": -43.119930267333984, "global_step": 292164, "epoch": 2414} {"train_loss": -40.52228927612305, "global_step": 292165, "epoch": 2414} {"train_loss": -42.1937141418457, "global_step": 292166, "epoch": 2414} {"train_loss": -44.670318603515625, "global_step": 292167, "epoch": 2414} {"train_loss": -42.35327911376953, "global_step": 292168, "epoch": 2414} {"train_loss": -40.606056213378906, "global_step": 292169, "epoch": 2414} {"train_loss": -43.68281555175781, "global_step": 292170, "epoch": 2414} {"train_loss": -42.302528381347656, "global_step": 292171, "epoch": 2414} {"train_loss": -42.21558380126953, "global_step": 292172, "epoch": 2414} {"train_loss": -44.009456634521484, "global_step": 292173, "epoch": 2414} {"train_loss": -41.58461380004883, "global_step": 292174, "epoch": 2414} {"train_loss": -42.0610237121582, "global_step": 292175, "epoch": 2414} {"train_loss": -43.76491165161133, "global_step": 292176, "epoch": 2414} {"train_loss": -42.23554229736328, "global_step": 292177, "epoch": 2414} {"train_loss": -42.64638137817383, "global_step": 292178, "epoch": 2414} {"train_loss": -42.49323654174805, "global_step": 292179, "epoch": 2414} {"train_loss": -42.11422348022461, "global_step": 292180, "epoch": 2414} {"train_loss": -43.218223571777344, "global_step": 292181, "epoch": 2414} {"train_loss": -41.11279296875, "global_step": 292182, "epoch": 2414} {"train_loss": -43.094600677490234, "global_step": 292183, "epoch": 2414} {"train_loss": -42.43865203857422, "global_step": 292184, "epoch": 2414} {"train_loss": -43.46426010131836, "global_step": 292185, "epoch": 2414} {"train_loss": -43.23995590209961, "global_step": 292186, "epoch": 2414} {"train_loss": -42.834503173828125, "global_step": 292187, "epoch": 2414} {"train_loss": -44.169097900390625, "global_step": 292188, "epoch": 2414} {"train_loss": -42.67121505737305, "global_step": 292189, "epoch": 2414} {"train_loss": -43.7822151184082, "global_step": 292190, "epoch": 2414} {"train_loss": -43.35726547241211, "global_step": 292191, "epoch": 2414} {"train_loss": -42.36137008666992, "global_step": 292192, "epoch": 2414} {"train_loss": -43.94584274291992, "global_step": 292193, "epoch": 2414} {"train_loss": -42.2989501953125, "global_step": 292194, "epoch": 2414} {"train_loss": -42.72642135620117, "global_step": 292195, "epoch": 2414} {"train_loss": -43.2784309387207, "global_step": 292196, "epoch": 2414} {"train_loss": -42.735801696777344, "global_step": 292197, "epoch": 2414} {"train_loss": -43.08177185058594, "global_step": 292198, "epoch": 2414} {"train_loss": -42.248470306396484, "global_step": 292199, "epoch": 2414} {"train_loss": -42.51462936401367, "global_step": 292200, "epoch": 2414} {"train_loss": -43.65910720825195, "global_step": 292201, "epoch": 2414} {"train_loss": -43.413204193115234, "global_step": 292202, "epoch": 2414} {"train_loss": -43.59739303588867, "global_step": 292203, "epoch": 2414} {"train_loss": -44.11928176879883, "global_step": 292204, "epoch": 2414} {"train_loss": -43.14799118041992, "global_step": 292205, "epoch": 2414} {"train_loss": -43.99717330932617, "global_step": 292206, "epoch": 2414} {"train_loss": -44.13153076171875, "global_step": 292207, "epoch": 2414} {"train_loss": -43.749874114990234, "global_step": 292208, "epoch": 2414} {"train_loss": -44.01604461669922, "global_step": 292209, "epoch": 2414} {"train_loss": -43.982295989990234, "global_step": 292210, "epoch": 2414} {"train_loss": -43.93356704711914, "global_step": 292211, "epoch": 2414} {"train_loss": -44.14069366455078, "global_step": 292212, "epoch": 2414} {"train_loss": -43.78280258178711, "global_step": 292213, "epoch": 2414} {"train_loss": -43.335998976526184, "global_step": 292214, "epoch": 2414, "val_loss": 2474623.0} {"train_loss": -43.85771942138672, "global_step": 292215, "epoch": 2415} {"train_loss": -43.632904052734375, "global_step": 292216, "epoch": 2415} {"train_loss": -44.532073974609375, "global_step": 292217, "epoch": 2415} {"train_loss": -44.035797119140625, "global_step": 292218, "epoch": 2415} {"train_loss": -44.25716781616211, "global_step": 292219, "epoch": 2415} {"train_loss": -43.90268325805664, "global_step": 292220, "epoch": 2415} {"train_loss": -44.13465881347656, "global_step": 292221, "epoch": 2415} {"train_loss": -44.55002975463867, "global_step": 292222, "epoch": 2415} {"train_loss": -44.160675048828125, "global_step": 292223, "epoch": 2415} {"train_loss": -44.38501739501953, "global_step": 292224, "epoch": 2415} {"train_loss": -44.7244873046875, "global_step": 292225, "epoch": 2415} {"train_loss": -44.51834487915039, "global_step": 292226, "epoch": 2415} {"train_loss": -44.890926361083984, "global_step": 292227, "epoch": 2415} {"train_loss": -44.198760986328125, "global_step": 292228, "epoch": 2415} {"train_loss": -43.91206359863281, "global_step": 292229, "epoch": 2415} {"train_loss": -44.634315490722656, "global_step": 292230, "epoch": 2415} {"train_loss": -44.243858337402344, "global_step": 292231, "epoch": 2415} {"train_loss": -44.32792282104492, "global_step": 292232, "epoch": 2415} {"train_loss": -44.42811965942383, "global_step": 292233, "epoch": 2415} {"train_loss": -43.80683898925781, "global_step": 292234, "epoch": 2415} {"train_loss": -43.77641677856445, "global_step": 292235, "epoch": 2415} {"train_loss": -44.585933685302734, "global_step": 292236, "epoch": 2415} {"train_loss": -44.148555755615234, "global_step": 292237, "epoch": 2415} {"train_loss": -44.1268424987793, "global_step": 292238, "epoch": 2415} {"train_loss": -43.821815490722656, "global_step": 292239, "epoch": 2415} {"train_loss": -44.2406005859375, "global_step": 292240, "epoch": 2415} {"train_loss": -44.99665832519531, "global_step": 292241, "epoch": 2415} {"train_loss": -43.72452926635742, "global_step": 292242, "epoch": 2415} {"train_loss": -43.8858528137207, "global_step": 292243, "epoch": 2415} {"train_loss": -43.94537353515625, "global_step": 292244, "epoch": 2415} {"train_loss": -44.258480072021484, "global_step": 292245, "epoch": 2415} {"train_loss": -44.32782745361328, "global_step": 292246, "epoch": 2415} {"train_loss": -44.247676849365234, "global_step": 292247, "epoch": 2415} {"train_loss": -43.8875617980957, "global_step": 292248, "epoch": 2415} {"train_loss": -43.727718353271484, "global_step": 292249, "epoch": 2415} {"train_loss": -41.76844024658203, "global_step": 292250, "epoch": 2415} {"train_loss": -40.32008743286133, "global_step": 292251, "epoch": 2415} {"train_loss": -43.87621307373047, "global_step": 292252, "epoch": 2415} {"train_loss": -42.41135787963867, "global_step": 292253, "epoch": 2415} {"train_loss": -39.6565055847168, "global_step": 292254, "epoch": 2415} {"train_loss": -44.163482666015625, "global_step": 292255, "epoch": 2415} {"train_loss": -39.26864242553711, "global_step": 292256, "epoch": 2415} {"train_loss": -41.30980682373047, "global_step": 292257, "epoch": 2415} {"train_loss": -42.74306106567383, "global_step": 292258, "epoch": 2415} {"train_loss": -43.1213264465332, "global_step": 292259, "epoch": 2415} {"train_loss": -41.873779296875, "global_step": 292260, "epoch": 2415} {"train_loss": -42.607479095458984, "global_step": 292261, "epoch": 2415} {"train_loss": -42.96112060546875, "global_step": 292262, "epoch": 2415} {"train_loss": -43.8657112121582, "global_step": 292263, "epoch": 2415} {"train_loss": -43.3262939453125, "global_step": 292264, "epoch": 2415} {"train_loss": -42.20063018798828, "global_step": 292265, "epoch": 2415} {"train_loss": -43.392295837402344, "global_step": 292266, "epoch": 2415} {"train_loss": -43.5714225769043, "global_step": 292267, "epoch": 2415} {"train_loss": -43.11757278442383, "global_step": 292268, "epoch": 2415} {"train_loss": -43.83306884765625, "global_step": 292269, "epoch": 2415} {"train_loss": -44.28205108642578, "global_step": 292270, "epoch": 2415} {"train_loss": -43.44671630859375, "global_step": 292271, "epoch": 2415} {"train_loss": -43.65535354614258, "global_step": 292272, "epoch": 2415} {"train_loss": -44.37384033203125, "global_step": 292273, "epoch": 2415} {"train_loss": -43.0283203125, "global_step": 292274, "epoch": 2415} {"train_loss": -42.740413665771484, "global_step": 292275, "epoch": 2415} {"train_loss": -43.90793228149414, "global_step": 292276, "epoch": 2415} {"train_loss": -43.940425872802734, "global_step": 292277, "epoch": 2415} {"train_loss": -44.1558952331543, "global_step": 292278, "epoch": 2415} {"train_loss": -43.756771087646484, "global_step": 292279, "epoch": 2415} {"train_loss": -44.59878158569336, "global_step": 292280, "epoch": 2415} {"train_loss": -43.80208969116211, "global_step": 292281, "epoch": 2415} {"train_loss": -43.52886962890625, "global_step": 292282, "epoch": 2415} {"train_loss": -44.49970245361328, "global_step": 292283, "epoch": 2415} {"train_loss": -43.98612594604492, "global_step": 292284, "epoch": 2415} {"train_loss": -43.939857482910156, "global_step": 292285, "epoch": 2415} {"train_loss": -44.29459762573242, "global_step": 292286, "epoch": 2415} {"train_loss": -43.89449691772461, "global_step": 292287, "epoch": 2415} {"train_loss": -44.14113998413086, "global_step": 292288, "epoch": 2415} {"train_loss": -43.50327682495117, "global_step": 292289, "epoch": 2415} {"train_loss": -42.86965560913086, "global_step": 292290, "epoch": 2415} {"train_loss": -44.272247314453125, "global_step": 292291, "epoch": 2415} {"train_loss": -43.730716705322266, "global_step": 292292, "epoch": 2415} {"train_loss": -43.16992950439453, "global_step": 292293, "epoch": 2415} {"train_loss": -43.92794418334961, "global_step": 292294, "epoch": 2415} {"train_loss": -43.20667266845703, "global_step": 292295, "epoch": 2415} {"train_loss": -43.38911819458008, "global_step": 292296, "epoch": 2415} {"train_loss": -40.79834747314453, "global_step": 292297, "epoch": 2415} {"train_loss": -42.8828010559082, "global_step": 292298, "epoch": 2415} {"train_loss": -42.80340576171875, "global_step": 292299, "epoch": 2415} {"train_loss": -40.84406661987305, "global_step": 292300, "epoch": 2415} {"train_loss": -39.85640335083008, "global_step": 292301, "epoch": 2415} {"train_loss": -42.802520751953125, "global_step": 292302, "epoch": 2415} {"train_loss": -40.00505447387695, "global_step": 292303, "epoch": 2415} {"train_loss": -39.99018859863281, "global_step": 292304, "epoch": 2415} {"train_loss": -42.3664436340332, "global_step": 292305, "epoch": 2415} {"train_loss": -41.0903205871582, "global_step": 292306, "epoch": 2415} {"train_loss": -40.76602554321289, "global_step": 292307, "epoch": 2415} {"train_loss": -42.75130844116211, "global_step": 292308, "epoch": 2415} {"train_loss": -42.24361801147461, "global_step": 292309, "epoch": 2415} {"train_loss": -42.866451263427734, "global_step": 292310, "epoch": 2415} {"train_loss": -43.011444091796875, "global_step": 292311, "epoch": 2415} {"train_loss": -41.744384765625, "global_step": 292312, "epoch": 2415} {"train_loss": -42.06985092163086, "global_step": 292313, "epoch": 2415} {"train_loss": -42.74143600463867, "global_step": 292314, "epoch": 2415} {"train_loss": -40.590023040771484, "global_step": 292315, "epoch": 2415} {"train_loss": -42.39237594604492, "global_step": 292316, "epoch": 2415} {"train_loss": -41.5634880065918, "global_step": 292317, "epoch": 2415} {"train_loss": -42.148468017578125, "global_step": 292318, "epoch": 2415} {"train_loss": -42.67451858520508, "global_step": 292319, "epoch": 2415} {"train_loss": -42.564266204833984, "global_step": 292320, "epoch": 2415} {"train_loss": -42.44231033325195, "global_step": 292321, "epoch": 2415} {"train_loss": -42.54939651489258, "global_step": 292322, "epoch": 2415} {"train_loss": -43.05780792236328, "global_step": 292323, "epoch": 2415} {"train_loss": -43.290828704833984, "global_step": 292324, "epoch": 2415} {"train_loss": -42.70180130004883, "global_step": 292325, "epoch": 2415} {"train_loss": -43.27927780151367, "global_step": 292326, "epoch": 2415} {"train_loss": -42.1043815612793, "global_step": 292327, "epoch": 2415} {"train_loss": -44.248104095458984, "global_step": 292328, "epoch": 2415} {"train_loss": -42.38090133666992, "global_step": 292329, "epoch": 2415} {"train_loss": -43.34578323364258, "global_step": 292330, "epoch": 2415} {"train_loss": -43.335296630859375, "global_step": 292331, "epoch": 2415} {"train_loss": -43.426185607910156, "global_step": 292332, "epoch": 2415} {"train_loss": -43.20668411254883, "global_step": 292333, "epoch": 2415} {"train_loss": -43.42799758911133, "global_step": 292334, "epoch": 2415} {"train_loss": -43.208679546009414, "global_step": 292335, "epoch": 2415, "val_loss": 2479009.75} {"train_loss": -43.627464294433594, "global_step": 292336, "epoch": 2416} {"train_loss": -44.287906646728516, "global_step": 292337, "epoch": 2416} {"train_loss": -43.91840362548828, "global_step": 292338, "epoch": 2416} {"train_loss": -44.13961410522461, "global_step": 292339, "epoch": 2416} {"train_loss": -44.04848098754883, "global_step": 292340, "epoch": 2416} {"train_loss": -44.42431640625, "global_step": 292341, "epoch": 2416} {"train_loss": -44.850135803222656, "global_step": 292342, "epoch": 2416} {"train_loss": -44.12910079956055, "global_step": 292343, "epoch": 2416} {"train_loss": -44.4667854309082, "global_step": 292344, "epoch": 2416} {"train_loss": -44.384151458740234, "global_step": 292345, "epoch": 2416} {"train_loss": -43.97170639038086, "global_step": 292346, "epoch": 2416} {"train_loss": -44.52605056762695, "global_step": 292347, "epoch": 2416} {"train_loss": -43.981658935546875, "global_step": 292348, "epoch": 2416} {"train_loss": -44.32357406616211, "global_step": 292349, "epoch": 2416} {"train_loss": -43.6994743347168, "global_step": 292350, "epoch": 2416} {"train_loss": -44.07299041748047, "global_step": 292351, "epoch": 2416} {"train_loss": -44.32303237915039, "global_step": 292352, "epoch": 2416} {"train_loss": -44.379817962646484, "global_step": 292353, "epoch": 2416} {"train_loss": -44.24422073364258, "global_step": 292354, "epoch": 2416} {"train_loss": -44.12404251098633, "global_step": 292355, "epoch": 2416} {"train_loss": -43.94055938720703, "global_step": 292356, "epoch": 2416} {"train_loss": -44.27346420288086, "global_step": 292357, "epoch": 2416} {"train_loss": -44.38945007324219, "global_step": 292358, "epoch": 2416} {"train_loss": -44.74491500854492, "global_step": 292359, "epoch": 2416} {"train_loss": -44.44759750366211, "global_step": 292360, "epoch": 2416} {"train_loss": -44.4545783996582, "global_step": 292361, "epoch": 2416} {"train_loss": -44.546817779541016, "global_step": 292362, "epoch": 2416} {"train_loss": -45.27883529663086, "global_step": 292363, "epoch": 2416} {"train_loss": -44.636592864990234, "global_step": 292364, "epoch": 2416} {"train_loss": -44.24580764770508, "global_step": 292365, "epoch": 2416} {"train_loss": -43.45417022705078, "global_step": 292366, "epoch": 2416} {"train_loss": -44.044673919677734, "global_step": 292367, "epoch": 2416} {"train_loss": -44.624507904052734, "global_step": 292368, "epoch": 2416} {"train_loss": -44.541358947753906, "global_step": 292369, "epoch": 2416} {"train_loss": -42.05719757080078, "global_step": 292370, "epoch": 2416} {"train_loss": -40.944610595703125, "global_step": 292371, "epoch": 2416} {"train_loss": -42.2303466796875, "global_step": 292372, "epoch": 2416} {"train_loss": -42.3101806640625, "global_step": 292373, "epoch": 2416} {"train_loss": -44.149471282958984, "global_step": 292374, "epoch": 2416} {"train_loss": -44.69025802612305, "global_step": 292375, "epoch": 2416} {"train_loss": -43.210506439208984, "global_step": 292376, "epoch": 2416} {"train_loss": -41.94105529785156, "global_step": 292377, "epoch": 2416} {"train_loss": -43.819122314453125, "global_step": 292378, "epoch": 2416} {"train_loss": -44.628150939941406, "global_step": 292379, "epoch": 2416} {"train_loss": -43.18962478637695, "global_step": 292380, "epoch": 2416} {"train_loss": -43.15354537963867, "global_step": 292381, "epoch": 2416} {"train_loss": -43.200862884521484, "global_step": 292382, "epoch": 2416} {"train_loss": -43.488014221191406, "global_step": 292383, "epoch": 2416} {"train_loss": -40.951473236083984, "global_step": 292384, "epoch": 2416} {"train_loss": -43.71185302734375, "global_step": 292385, "epoch": 2416} {"train_loss": -43.0905647277832, "global_step": 292386, "epoch": 2416} {"train_loss": -40.94150924682617, "global_step": 292387, "epoch": 2416} {"train_loss": -43.07624435424805, "global_step": 292388, "epoch": 2416} {"train_loss": -42.90235137939453, "global_step": 292389, "epoch": 2416} {"train_loss": -38.10334396362305, "global_step": 292390, "epoch": 2416} {"train_loss": -37.45635986328125, "global_step": 292391, "epoch": 2416} {"train_loss": -33.19340133666992, "global_step": 292392, "epoch": 2416} {"train_loss": -23.93187713623047, "global_step": 292393, "epoch": 2416} {"train_loss": -39.631317138671875, "global_step": 292394, "epoch": 2416} {"train_loss": -31.71925163269043, "global_step": 292395, "epoch": 2416} {"train_loss": -40.581912994384766, "global_step": 292396, "epoch": 2416} {"train_loss": -34.33297348022461, "global_step": 292397, "epoch": 2416} {"train_loss": -41.6275749206543, "global_step": 292398, "epoch": 2416} {"train_loss": -37.434303283691406, "global_step": 292399, "epoch": 2416} {"train_loss": -39.85032653808594, "global_step": 292400, "epoch": 2416} {"train_loss": -37.332908630371094, "global_step": 292401, "epoch": 2416} {"train_loss": -40.47196578979492, "global_step": 292402, "epoch": 2416} {"train_loss": -41.59548568725586, "global_step": 292403, "epoch": 2416} {"train_loss": -41.608856201171875, "global_step": 292404, "epoch": 2416} {"train_loss": -40.484737396240234, "global_step": 292405, "epoch": 2416} {"train_loss": -40.707088470458984, "global_step": 292406, "epoch": 2416} {"train_loss": -40.483306884765625, "global_step": 292407, "epoch": 2416} {"train_loss": -41.375728607177734, "global_step": 292408, "epoch": 2416} {"train_loss": -42.55833053588867, "global_step": 292409, "epoch": 2416} {"train_loss": -40.0624885559082, "global_step": 292410, "epoch": 2416} {"train_loss": -41.351741790771484, "global_step": 292411, "epoch": 2416} {"train_loss": -41.7673225402832, "global_step": 292412, "epoch": 2416} {"train_loss": -41.389339447021484, "global_step": 292413, "epoch": 2416} {"train_loss": -42.63112258911133, "global_step": 292414, "epoch": 2416} {"train_loss": -41.659217834472656, "global_step": 292415, "epoch": 2416} {"train_loss": -42.620582580566406, "global_step": 292416, "epoch": 2416} {"train_loss": -41.97331619262695, "global_step": 292417, "epoch": 2416} {"train_loss": -42.44868850708008, "global_step": 292418, "epoch": 2416} {"train_loss": -42.56427001953125, "global_step": 292419, "epoch": 2416} {"train_loss": -42.5300407409668, "global_step": 292420, "epoch": 2416} {"train_loss": -42.837432861328125, "global_step": 292421, "epoch": 2416} {"train_loss": -42.18475341796875, "global_step": 292422, "epoch": 2416} {"train_loss": -42.96614456176758, "global_step": 292423, "epoch": 2416} {"train_loss": -43.299171447753906, "global_step": 292424, "epoch": 2416} {"train_loss": -43.3782958984375, "global_step": 292425, "epoch": 2416} {"train_loss": -43.287391662597656, "global_step": 292426, "epoch": 2416} {"train_loss": -43.21730422973633, "global_step": 292427, "epoch": 2416} {"train_loss": -43.57328414916992, "global_step": 292428, "epoch": 2416} {"train_loss": -42.9703369140625, "global_step": 292429, "epoch": 2416} {"train_loss": -43.60611343383789, "global_step": 292430, "epoch": 2416} {"train_loss": -43.27238082885742, "global_step": 292431, "epoch": 2416} {"train_loss": -43.262630462646484, "global_step": 292432, "epoch": 2416} {"train_loss": -43.75045394897461, "global_step": 292433, "epoch": 2416} {"train_loss": -43.00468826293945, "global_step": 292434, "epoch": 2416} {"train_loss": -42.8422737121582, "global_step": 292435, "epoch": 2416} {"train_loss": -43.68144607543945, "global_step": 292436, "epoch": 2416} {"train_loss": -43.50674057006836, "global_step": 292437, "epoch": 2416} {"train_loss": -43.92702865600586, "global_step": 292438, "epoch": 2416} {"train_loss": -43.780853271484375, "global_step": 292439, "epoch": 2416} {"train_loss": -44.05782699584961, "global_step": 292440, "epoch": 2416} {"train_loss": -44.15012741088867, "global_step": 292441, "epoch": 2416} {"train_loss": -43.786380767822266, "global_step": 292442, "epoch": 2416} {"train_loss": -43.867923736572266, "global_step": 292443, "epoch": 2416} {"train_loss": -44.1048583984375, "global_step": 292444, "epoch": 2416} {"train_loss": -43.933414459228516, "global_step": 292445, "epoch": 2416} {"train_loss": -43.721290588378906, "global_step": 292446, "epoch": 2416} {"train_loss": -44.20335388183594, "global_step": 292447, "epoch": 2416} {"train_loss": -44.40550231933594, "global_step": 292448, "epoch": 2416} {"train_loss": -44.07353591918945, "global_step": 292449, "epoch": 2416} {"train_loss": -44.251888275146484, "global_step": 292450, "epoch": 2416} {"train_loss": -43.887451171875, "global_step": 292451, "epoch": 2416} {"train_loss": -44.51106262207031, "global_step": 292452, "epoch": 2416} {"train_loss": -43.784976959228516, "global_step": 292453, "epoch": 2416} {"train_loss": -44.209651947021484, "global_step": 292454, "epoch": 2416} {"train_loss": -44.3447380065918, "global_step": 292455, "epoch": 2416} {"train_loss": -42.65218408442726, "global_step": 292456, "epoch": 2416, "val_loss": 2495845.25} {"train_loss": -43.91484451293945, "global_step": 292457, "epoch": 2417} {"train_loss": -44.38707733154297, "global_step": 292458, "epoch": 2417} {"train_loss": -44.584373474121094, "global_step": 292459, "epoch": 2417} {"train_loss": -44.335609436035156, "global_step": 292460, "epoch": 2417} {"train_loss": -44.69648742675781, "global_step": 292461, "epoch": 2417} {"train_loss": -44.254329681396484, "global_step": 292462, "epoch": 2417} {"train_loss": -44.83565139770508, "global_step": 292463, "epoch": 2417} {"train_loss": -44.419551849365234, "global_step": 292464, "epoch": 2417} {"train_loss": -44.30845260620117, "global_step": 292465, "epoch": 2417} {"train_loss": -44.73905563354492, "global_step": 292466, "epoch": 2417} {"train_loss": -44.367584228515625, "global_step": 292467, "epoch": 2417} {"train_loss": -44.26634979248047, "global_step": 292468, "epoch": 2417} {"train_loss": -44.492183685302734, "global_step": 292469, "epoch": 2417} {"train_loss": -44.983856201171875, "global_step": 292470, "epoch": 2417} {"train_loss": -44.83834457397461, "global_step": 292471, "epoch": 2417} {"train_loss": -44.751033782958984, "global_step": 292472, "epoch": 2417} {"train_loss": -44.90918731689453, "global_step": 292473, "epoch": 2417} {"train_loss": -44.83232498168945, "global_step": 292474, "epoch": 2417} {"train_loss": -44.392120361328125, "global_step": 292475, "epoch": 2417} {"train_loss": -44.918617248535156, "global_step": 292476, "epoch": 2417} {"train_loss": -42.700531005859375, "global_step": 292477, "epoch": 2417} {"train_loss": -43.94740676879883, "global_step": 292478, "epoch": 2417} {"train_loss": -44.382747650146484, "global_step": 292479, "epoch": 2417} {"train_loss": -44.81834411621094, "global_step": 292480, "epoch": 2417} {"train_loss": -44.6921501159668, "global_step": 292481, "epoch": 2417} {"train_loss": -36.2390251159668, "global_step": 292482, "epoch": 2417} {"train_loss": -43.65349197387695, "global_step": 292483, "epoch": 2417} {"train_loss": -43.832942962646484, "global_step": 292484, "epoch": 2417} {"train_loss": -43.894405364990234, "global_step": 292485, "epoch": 2417} {"train_loss": -44.14665603637695, "global_step": 292486, "epoch": 2417} {"train_loss": -43.44649124145508, "global_step": 292487, "epoch": 2417} {"train_loss": -43.83782958984375, "global_step": 292488, "epoch": 2417} {"train_loss": -43.84283447265625, "global_step": 292489, "epoch": 2417} {"train_loss": -42.686031341552734, "global_step": 292490, "epoch": 2417} {"train_loss": -42.328590393066406, "global_step": 292491, "epoch": 2417} {"train_loss": -41.7153434753418, "global_step": 292492, "epoch": 2417} {"train_loss": -44.61326599121094, "global_step": 292493, "epoch": 2417} {"train_loss": -42.49129104614258, "global_step": 292494, "epoch": 2417} {"train_loss": -44.58363723754883, "global_step": 292495, "epoch": 2417} {"train_loss": -43.49274444580078, "global_step": 292496, "epoch": 2417} {"train_loss": -44.109737396240234, "global_step": 292497, "epoch": 2417} {"train_loss": -42.619049072265625, "global_step": 292498, "epoch": 2417} {"train_loss": -44.538330078125, "global_step": 292499, "epoch": 2417} {"train_loss": -42.46076583862305, "global_step": 292500, "epoch": 2417} {"train_loss": -41.44684600830078, "global_step": 292501, "epoch": 2417} {"train_loss": -44.14011001586914, "global_step": 292502, "epoch": 2417} {"train_loss": -44.05986404418945, "global_step": 292503, "epoch": 2417} {"train_loss": -43.912960052490234, "global_step": 292504, "epoch": 2417} {"train_loss": -43.46750259399414, "global_step": 292505, "epoch": 2417} {"train_loss": -39.916141510009766, "global_step": 292506, "epoch": 2417} {"train_loss": -44.26737594604492, "global_step": 292507, "epoch": 2417} {"train_loss": -43.50831985473633, "global_step": 292508, "epoch": 2417} {"train_loss": -41.45940017700195, "global_step": 292509, "epoch": 2417} {"train_loss": -41.53701400756836, "global_step": 292510, "epoch": 2417} {"train_loss": -42.2318229675293, "global_step": 292511, "epoch": 2417} {"train_loss": -41.5751953125, "global_step": 292512, "epoch": 2417} {"train_loss": -42.14625930786133, "global_step": 292513, "epoch": 2417} {"train_loss": -42.1864013671875, "global_step": 292514, "epoch": 2417} {"train_loss": -43.08076477050781, "global_step": 292515, "epoch": 2417} {"train_loss": -41.146636962890625, "global_step": 292516, "epoch": 2417} {"train_loss": -40.00053024291992, "global_step": 292517, "epoch": 2417} {"train_loss": -42.88859939575195, "global_step": 292518, "epoch": 2417} {"train_loss": -36.61134719848633, "global_step": 292519, "epoch": 2417} {"train_loss": -40.428035736083984, "global_step": 292520, "epoch": 2417} {"train_loss": -35.93071365356445, "global_step": 292521, "epoch": 2417} {"train_loss": -41.760475158691406, "global_step": 292522, "epoch": 2417} {"train_loss": -39.239253997802734, "global_step": 292523, "epoch": 2417} {"train_loss": -38.1685791015625, "global_step": 292524, "epoch": 2417} {"train_loss": -33.75233459472656, "global_step": 292525, "epoch": 2417} {"train_loss": -36.22075271606445, "global_step": 292526, "epoch": 2417} {"train_loss": -40.40105056762695, "global_step": 292527, "epoch": 2417} {"train_loss": -36.03304672241211, "global_step": 292528, "epoch": 2417} {"train_loss": -40.07992172241211, "global_step": 292529, "epoch": 2417} {"train_loss": -37.35049057006836, "global_step": 292530, "epoch": 2417} {"train_loss": -35.14447784423828, "global_step": 292531, "epoch": 2417} {"train_loss": -39.88801574707031, "global_step": 292532, "epoch": 2417} {"train_loss": -34.662994384765625, "global_step": 292533, "epoch": 2417} {"train_loss": -41.33236312866211, "global_step": 292534, "epoch": 2417} {"train_loss": -40.1887321472168, "global_step": 292535, "epoch": 2417} {"train_loss": -41.1637077331543, "global_step": 292536, "epoch": 2417} {"train_loss": -41.69637680053711, "global_step": 292537, "epoch": 2417} {"train_loss": -35.778778076171875, "global_step": 292538, "epoch": 2417} {"train_loss": -41.47275161743164, "global_step": 292539, "epoch": 2417} {"train_loss": -41.19622802734375, "global_step": 292540, "epoch": 2417} {"train_loss": -41.51609802246094, "global_step": 292541, "epoch": 2417} {"train_loss": -40.66687774658203, "global_step": 292542, "epoch": 2417} {"train_loss": -40.90104293823242, "global_step": 292543, "epoch": 2417} {"train_loss": -40.531368255615234, "global_step": 292544, "epoch": 2417} {"train_loss": -40.25251388549805, "global_step": 292545, "epoch": 2417} {"train_loss": -40.733280181884766, "global_step": 292546, "epoch": 2417} {"train_loss": -41.087974548339844, "global_step": 292547, "epoch": 2417} {"train_loss": -40.0047492980957, "global_step": 292548, "epoch": 2417} {"train_loss": -42.262454986572266, "global_step": 292549, "epoch": 2417} {"train_loss": -41.60026931762695, "global_step": 292550, "epoch": 2417} {"train_loss": -40.9576301574707, "global_step": 292551, "epoch": 2417} {"train_loss": -42.33870315551758, "global_step": 292552, "epoch": 2417} {"train_loss": -41.541629791259766, "global_step": 292553, "epoch": 2417} {"train_loss": -42.2198371887207, "global_step": 292554, "epoch": 2417} {"train_loss": -42.65861892700195, "global_step": 292555, "epoch": 2417} {"train_loss": -41.20473861694336, "global_step": 292556, "epoch": 2417} {"train_loss": -42.503379821777344, "global_step": 292557, "epoch": 2417} {"train_loss": -42.664642333984375, "global_step": 292558, "epoch": 2417} {"train_loss": -41.52021026611328, "global_step": 292559, "epoch": 2417} {"train_loss": -42.826881408691406, "global_step": 292560, "epoch": 2417} {"train_loss": -41.111106872558594, "global_step": 292561, "epoch": 2417} {"train_loss": -43.11150360107422, "global_step": 292562, "epoch": 2417} {"train_loss": -43.04691696166992, "global_step": 292563, "epoch": 2417} {"train_loss": -42.759700775146484, "global_step": 292564, "epoch": 2417} {"train_loss": -43.372859954833984, "global_step": 292565, "epoch": 2417} {"train_loss": -42.903297424316406, "global_step": 292566, "epoch": 2417} {"train_loss": -42.6091423034668, "global_step": 292567, "epoch": 2417} {"train_loss": -42.97142028808594, "global_step": 292568, "epoch": 2417} {"train_loss": -44.02616500854492, "global_step": 292569, "epoch": 2417} {"train_loss": -42.348106384277344, "global_step": 292570, "epoch": 2417} {"train_loss": -42.769588470458984, "global_step": 292571, "epoch": 2417} {"train_loss": -42.600521087646484, "global_step": 292572, "epoch": 2417} {"train_loss": -43.57686996459961, "global_step": 292573, "epoch": 2417} {"train_loss": -43.11029052734375, "global_step": 292574, "epoch": 2417} {"train_loss": -43.287349700927734, "global_step": 292575, "epoch": 2417} {"train_loss": -43.58830261230469, "global_step": 292576, "epoch": 2417} {"train_loss": -42.173913498555336, "global_step": 292577, "epoch": 2417, "val_loss": 2415277.0} {"train_loss": -43.807674407958984, "global_step": 292578, "epoch": 2418} {"train_loss": -42.868953704833984, "global_step": 292579, "epoch": 2418} {"train_loss": -43.43770980834961, "global_step": 292580, "epoch": 2418} {"train_loss": -43.54605484008789, "global_step": 292581, "epoch": 2418} {"train_loss": -42.407470703125, "global_step": 292582, "epoch": 2418} {"train_loss": -43.54861068725586, "global_step": 292583, "epoch": 2418} {"train_loss": -43.24343490600586, "global_step": 292584, "epoch": 2418} {"train_loss": -44.02286148071289, "global_step": 292585, "epoch": 2418} {"train_loss": -43.81118392944336, "global_step": 292586, "epoch": 2418} {"train_loss": -43.67604446411133, "global_step": 292587, "epoch": 2418} {"train_loss": -43.63471603393555, "global_step": 292588, "epoch": 2418} {"train_loss": -43.99304962158203, "global_step": 292589, "epoch": 2418} {"train_loss": -43.849647521972656, "global_step": 292590, "epoch": 2418} {"train_loss": -43.69771194458008, "global_step": 292591, "epoch": 2418} {"train_loss": -43.326805114746094, "global_step": 292592, "epoch": 2418} {"train_loss": -43.72762680053711, "global_step": 292593, "epoch": 2418} {"train_loss": -43.24296188354492, "global_step": 292594, "epoch": 2418} {"train_loss": -43.58408737182617, "global_step": 292595, "epoch": 2418} {"train_loss": -43.9673957824707, "global_step": 292596, "epoch": 2418} {"train_loss": -43.96540451049805, "global_step": 292597, "epoch": 2418} {"train_loss": -43.87533187866211, "global_step": 292598, "epoch": 2418} {"train_loss": -43.7170295715332, "global_step": 292599, "epoch": 2418} {"train_loss": -43.864742279052734, "global_step": 292600, "epoch": 2418} {"train_loss": -43.716773986816406, "global_step": 292601, "epoch": 2418} {"train_loss": -43.64065933227539, "global_step": 292602, "epoch": 2418} {"train_loss": -44.08565139770508, "global_step": 292603, "epoch": 2418} {"train_loss": -43.4179801940918, "global_step": 292604, "epoch": 2418} {"train_loss": -44.159786224365234, "global_step": 292605, "epoch": 2418} {"train_loss": -44.47032928466797, "global_step": 292606, "epoch": 2418} {"train_loss": -43.81730270385742, "global_step": 292607, "epoch": 2418} {"train_loss": -43.82435607910156, "global_step": 292608, "epoch": 2418} {"train_loss": -43.77616882324219, "global_step": 292609, "epoch": 2418} {"train_loss": -43.844947814941406, "global_step": 292610, "epoch": 2418} {"train_loss": -43.97552490234375, "global_step": 292611, "epoch": 2418} {"train_loss": -42.9116325378418, "global_step": 292612, "epoch": 2418} {"train_loss": -41.160552978515625, "global_step": 292613, "epoch": 2418} {"train_loss": -39.12765121459961, "global_step": 292614, "epoch": 2418} {"train_loss": -42.71625900268555, "global_step": 292615, "epoch": 2418} {"train_loss": -42.9024772644043, "global_step": 292616, "epoch": 2418} {"train_loss": -43.0228385925293, "global_step": 292617, "epoch": 2418} {"train_loss": -43.49186325073242, "global_step": 292618, "epoch": 2418} {"train_loss": -42.01981735229492, "global_step": 292619, "epoch": 2418} {"train_loss": -43.385066986083984, "global_step": 292620, "epoch": 2418} {"train_loss": -44.100624084472656, "global_step": 292621, "epoch": 2418} {"train_loss": -42.8421745300293, "global_step": 292622, "epoch": 2418} {"train_loss": -43.41084289550781, "global_step": 292623, "epoch": 2418} {"train_loss": -43.908687591552734, "global_step": 292624, "epoch": 2418} {"train_loss": -43.83838653564453, "global_step": 292625, "epoch": 2418} {"train_loss": -42.74122619628906, "global_step": 292626, "epoch": 2418} {"train_loss": -43.48551559448242, "global_step": 292627, "epoch": 2418} {"train_loss": -43.518733978271484, "global_step": 292628, "epoch": 2418} {"train_loss": -43.89470291137695, "global_step": 292629, "epoch": 2418} {"train_loss": -43.631919860839844, "global_step": 292630, "epoch": 2418} {"train_loss": -43.59629440307617, "global_step": 292631, "epoch": 2418} {"train_loss": -43.648895263671875, "global_step": 292632, "epoch": 2418} {"train_loss": -43.31226348876953, "global_step": 292633, "epoch": 2418} {"train_loss": -42.79624557495117, "global_step": 292634, "epoch": 2418} {"train_loss": -43.29743576049805, "global_step": 292635, "epoch": 2418} {"train_loss": -43.38859558105469, "global_step": 292636, "epoch": 2418} {"train_loss": -43.41961669921875, "global_step": 292637, "epoch": 2418} {"train_loss": -42.61967849731445, "global_step": 292638, "epoch": 2418} {"train_loss": -41.81697463989258, "global_step": 292639, "epoch": 2418} {"train_loss": -42.11606216430664, "global_step": 292640, "epoch": 2418} {"train_loss": -41.66838836669922, "global_step": 292641, "epoch": 2418} {"train_loss": -41.47877883911133, "global_step": 292642, "epoch": 2418} {"train_loss": -42.85280990600586, "global_step": 292643, "epoch": 2418} {"train_loss": -38.914852142333984, "global_step": 292644, "epoch": 2418} {"train_loss": -42.26336669921875, "global_step": 292645, "epoch": 2418} {"train_loss": -41.715728759765625, "global_step": 292646, "epoch": 2418} {"train_loss": -39.40677261352539, "global_step": 292647, "epoch": 2418} {"train_loss": -43.1981315612793, "global_step": 292648, "epoch": 2418} {"train_loss": -40.20682907104492, "global_step": 292649, "epoch": 2418} {"train_loss": -40.69480514526367, "global_step": 292650, "epoch": 2418} {"train_loss": -42.84171676635742, "global_step": 292651, "epoch": 2418} {"train_loss": -38.60024642944336, "global_step": 292652, "epoch": 2418} {"train_loss": -41.55398178100586, "global_step": 292653, "epoch": 2418} {"train_loss": -38.80428695678711, "global_step": 292654, "epoch": 2418} {"train_loss": -39.07494354248047, "global_step": 292655, "epoch": 2418} {"train_loss": -39.14219284057617, "global_step": 292656, "epoch": 2418} {"train_loss": -41.634803771972656, "global_step": 292657, "epoch": 2418} {"train_loss": -40.69926834106445, "global_step": 292658, "epoch": 2418} {"train_loss": -42.6845588684082, "global_step": 292659, "epoch": 2418} {"train_loss": -40.18275833129883, "global_step": 292660, "epoch": 2418} {"train_loss": -42.12510299682617, "global_step": 292661, "epoch": 2418} {"train_loss": -41.560672760009766, "global_step": 292662, "epoch": 2418} {"train_loss": -42.84647750854492, "global_step": 292663, "epoch": 2418} {"train_loss": -41.783016204833984, "global_step": 292664, "epoch": 2418} {"train_loss": -42.354881286621094, "global_step": 292665, "epoch": 2418} {"train_loss": -41.705055236816406, "global_step": 292666, "epoch": 2418} {"train_loss": -41.46559524536133, "global_step": 292667, "epoch": 2418} {"train_loss": -43.10288619995117, "global_step": 292668, "epoch": 2418} {"train_loss": -41.976806640625, "global_step": 292669, "epoch": 2418} {"train_loss": -42.27254867553711, "global_step": 292670, "epoch": 2418} {"train_loss": -42.73305892944336, "global_step": 292671, "epoch": 2418} {"train_loss": -43.096343994140625, "global_step": 292672, "epoch": 2418} {"train_loss": -43.042449951171875, "global_step": 292673, "epoch": 2418} {"train_loss": -43.38837814331055, "global_step": 292674, "epoch": 2418} {"train_loss": -43.05961227416992, "global_step": 292675, "epoch": 2418} {"train_loss": -43.2698974609375, "global_step": 292676, "epoch": 2418} {"train_loss": -43.14829635620117, "global_step": 292677, "epoch": 2418} {"train_loss": -43.27753448486328, "global_step": 292678, "epoch": 2418} {"train_loss": -43.668540954589844, "global_step": 292679, "epoch": 2418} {"train_loss": -43.418601989746094, "global_step": 292680, "epoch": 2418} {"train_loss": -43.617095947265625, "global_step": 292681, "epoch": 2418} {"train_loss": -43.425331115722656, "global_step": 292682, "epoch": 2418} {"train_loss": -43.0183219909668, "global_step": 292683, "epoch": 2418} {"train_loss": -43.662025451660156, "global_step": 292684, "epoch": 2418} {"train_loss": -42.796417236328125, "global_step": 292685, "epoch": 2418} {"train_loss": -43.25629425048828, "global_step": 292686, "epoch": 2418} {"train_loss": -44.017860412597656, "global_step": 292687, "epoch": 2418} {"train_loss": -43.00712203979492, "global_step": 292688, "epoch": 2418} {"train_loss": -43.71529006958008, "global_step": 292689, "epoch": 2418} {"train_loss": -43.62767028808594, "global_step": 292690, "epoch": 2418} {"train_loss": -43.613624572753906, "global_step": 292691, "epoch": 2418} {"train_loss": -43.5697135925293, "global_step": 292692, "epoch": 2418} {"train_loss": -42.95377731323242, "global_step": 292693, "epoch": 2418} {"train_loss": -44.05451965332031, "global_step": 292694, "epoch": 2418} {"train_loss": -44.24626541137695, "global_step": 292695, "epoch": 2418} {"train_loss": -43.78179931640625, "global_step": 292696, "epoch": 2418} {"train_loss": -43.66109085083008, "global_step": 292697, "epoch": 2418} {"train_loss": -42.861349216177445, "global_step": 292698, "epoch": 2418, "val_loss": 2504868.75} {"train_loss": -43.66286087036133, "global_step": 292699, "epoch": 2419} {"train_loss": -43.225040435791016, "global_step": 292700, "epoch": 2419} {"train_loss": -43.69565963745117, "global_step": 292701, "epoch": 2419} {"train_loss": -44.3192253112793, "global_step": 292702, "epoch": 2419} {"train_loss": -43.79829025268555, "global_step": 292703, "epoch": 2419} {"train_loss": -43.12372970581055, "global_step": 292704, "epoch": 2419} {"train_loss": -44.42720413208008, "global_step": 292705, "epoch": 2419} {"train_loss": -43.902557373046875, "global_step": 292706, "epoch": 2419} {"train_loss": -42.87732696533203, "global_step": 292707, "epoch": 2419} {"train_loss": -42.134521484375, "global_step": 292708, "epoch": 2419} {"train_loss": -43.249305725097656, "global_step": 292709, "epoch": 2419} {"train_loss": -44.118797302246094, "global_step": 292710, "epoch": 2419} {"train_loss": -42.304115295410156, "global_step": 292711, "epoch": 2419} {"train_loss": -43.517303466796875, "global_step": 292712, "epoch": 2419} {"train_loss": -44.03398132324219, "global_step": 292713, "epoch": 2419} {"train_loss": -44.126041412353516, "global_step": 292714, "epoch": 2419} {"train_loss": -43.10671615600586, "global_step": 292715, "epoch": 2419} {"train_loss": -44.1924934387207, "global_step": 292716, "epoch": 2419} {"train_loss": -43.841407775878906, "global_step": 292717, "epoch": 2419} {"train_loss": -42.58817672729492, "global_step": 292718, "epoch": 2419} {"train_loss": -42.226234436035156, "global_step": 292719, "epoch": 2419} {"train_loss": -44.46635055541992, "global_step": 292720, "epoch": 2419} {"train_loss": -43.947994232177734, "global_step": 292721, "epoch": 2419} {"train_loss": -42.201908111572266, "global_step": 292722, "epoch": 2419} {"train_loss": -42.46440505981445, "global_step": 292723, "epoch": 2419} {"train_loss": -44.14874267578125, "global_step": 292724, "epoch": 2419} {"train_loss": -43.89436721801758, "global_step": 292725, "epoch": 2419} {"train_loss": -43.4387321472168, "global_step": 292726, "epoch": 2419} {"train_loss": -44.05327224731445, "global_step": 292727, "epoch": 2419} {"train_loss": -43.200958251953125, "global_step": 292728, "epoch": 2419} {"train_loss": -43.205631256103516, "global_step": 292729, "epoch": 2419} {"train_loss": -43.853389739990234, "global_step": 292730, "epoch": 2419} {"train_loss": -43.54287338256836, "global_step": 292731, "epoch": 2419} {"train_loss": -43.08857727050781, "global_step": 292732, "epoch": 2419} {"train_loss": -44.51668930053711, "global_step": 292733, "epoch": 2419} {"train_loss": -43.464969635009766, "global_step": 292734, "epoch": 2419} {"train_loss": -43.41972732543945, "global_step": 292735, "epoch": 2419} {"train_loss": -43.4544677734375, "global_step": 292736, "epoch": 2419} {"train_loss": -43.38039016723633, "global_step": 292737, "epoch": 2419} {"train_loss": -43.84855651855469, "global_step": 292738, "epoch": 2419} {"train_loss": -44.07805252075195, "global_step": 292739, "epoch": 2419} {"train_loss": -44.13020706176758, "global_step": 292740, "epoch": 2419} {"train_loss": -43.8376579284668, "global_step": 292741, "epoch": 2419} {"train_loss": -43.63170623779297, "global_step": 292742, "epoch": 2419} {"train_loss": -44.4746208190918, "global_step": 292743, "epoch": 2419} {"train_loss": -44.12290573120117, "global_step": 292744, "epoch": 2419} {"train_loss": -43.893245697021484, "global_step": 292745, "epoch": 2419} {"train_loss": -44.40290451049805, "global_step": 292746, "epoch": 2419} {"train_loss": -43.9375114440918, "global_step": 292747, "epoch": 2419} {"train_loss": -44.17484664916992, "global_step": 292748, "epoch": 2419} {"train_loss": -43.94385528564453, "global_step": 292749, "epoch": 2419} {"train_loss": -44.20125961303711, "global_step": 292750, "epoch": 2419} {"train_loss": -43.81673812866211, "global_step": 292751, "epoch": 2419} {"train_loss": -43.42600631713867, "global_step": 292752, "epoch": 2419} {"train_loss": -44.32155990600586, "global_step": 292753, "epoch": 2419} {"train_loss": -43.525421142578125, "global_step": 292754, "epoch": 2419} {"train_loss": -44.2620964050293, "global_step": 292755, "epoch": 2419} {"train_loss": -44.797889709472656, "global_step": 292756, "epoch": 2419} {"train_loss": -43.74494171142578, "global_step": 292757, "epoch": 2419} {"train_loss": -44.044830322265625, "global_step": 292758, "epoch": 2419} {"train_loss": -43.82037353515625, "global_step": 292759, "epoch": 2419} {"train_loss": -44.31461715698242, "global_step": 292760, "epoch": 2419} {"train_loss": -44.11823654174805, "global_step": 292761, "epoch": 2419} {"train_loss": -44.599403381347656, "global_step": 292762, "epoch": 2419} {"train_loss": -43.91053771972656, "global_step": 292763, "epoch": 2419} {"train_loss": -44.26655197143555, "global_step": 292764, "epoch": 2419} {"train_loss": -44.1357307434082, "global_step": 292765, "epoch": 2419} {"train_loss": -44.24554443359375, "global_step": 292766, "epoch": 2419} {"train_loss": -44.1070556640625, "global_step": 292767, "epoch": 2419} {"train_loss": -43.89631271362305, "global_step": 292768, "epoch": 2419} {"train_loss": -43.3670539855957, "global_step": 292769, "epoch": 2419} {"train_loss": -43.731605529785156, "global_step": 292770, "epoch": 2419} {"train_loss": -43.68426513671875, "global_step": 292771, "epoch": 2419} {"train_loss": -44.91775131225586, "global_step": 292772, "epoch": 2419} {"train_loss": -43.56659698486328, "global_step": 292773, "epoch": 2419} {"train_loss": -43.42333984375, "global_step": 292774, "epoch": 2419} {"train_loss": -43.6948356628418, "global_step": 292775, "epoch": 2419} {"train_loss": -43.9254264831543, "global_step": 292776, "epoch": 2419} {"train_loss": -44.546443939208984, "global_step": 292777, "epoch": 2419} {"train_loss": -44.183773040771484, "global_step": 292778, "epoch": 2419} {"train_loss": -44.45762252807617, "global_step": 292779, "epoch": 2419} {"train_loss": -44.66056442260742, "global_step": 292780, "epoch": 2419} {"train_loss": -43.642967224121094, "global_step": 292781, "epoch": 2419} {"train_loss": -43.703189849853516, "global_step": 292782, "epoch": 2419} {"train_loss": -43.41770553588867, "global_step": 292783, "epoch": 2419} {"train_loss": -43.106876373291016, "global_step": 292784, "epoch": 2419} {"train_loss": -41.65606689453125, "global_step": 292785, "epoch": 2419} {"train_loss": -40.97442626953125, "global_step": 292786, "epoch": 2419} {"train_loss": -42.2601432800293, "global_step": 292787, "epoch": 2419} {"train_loss": -42.66184616088867, "global_step": 292788, "epoch": 2419} {"train_loss": -43.474918365478516, "global_step": 292789, "epoch": 2419} {"train_loss": -43.694190979003906, "global_step": 292790, "epoch": 2419} {"train_loss": -42.78459167480469, "global_step": 292791, "epoch": 2419} {"train_loss": -42.93132781982422, "global_step": 292792, "epoch": 2419} {"train_loss": -43.703365325927734, "global_step": 292793, "epoch": 2419} {"train_loss": -43.105350494384766, "global_step": 292794, "epoch": 2419} {"train_loss": -43.389461517333984, "global_step": 292795, "epoch": 2419} {"train_loss": -43.75209426879883, "global_step": 292796, "epoch": 2419} {"train_loss": -43.81079864501953, "global_step": 292797, "epoch": 2419} {"train_loss": -43.36981201171875, "global_step": 292798, "epoch": 2419} {"train_loss": -44.04150390625, "global_step": 292799, "epoch": 2419} {"train_loss": -43.09666442871094, "global_step": 292800, "epoch": 2419} {"train_loss": -43.23286819458008, "global_step": 292801, "epoch": 2419} {"train_loss": -43.395538330078125, "global_step": 292802, "epoch": 2419} {"train_loss": -43.557167053222656, "global_step": 292803, "epoch": 2419} {"train_loss": -43.26288604736328, "global_step": 292804, "epoch": 2419} {"train_loss": -43.656044006347656, "global_step": 292805, "epoch": 2419} {"train_loss": -44.06620407104492, "global_step": 292806, "epoch": 2419} {"train_loss": -43.960693359375, "global_step": 292807, "epoch": 2419} {"train_loss": -43.82062911987305, "global_step": 292808, "epoch": 2419} {"train_loss": -44.42109298706055, "global_step": 292809, "epoch": 2419} {"train_loss": -44.05682373046875, "global_step": 292810, "epoch": 2419} {"train_loss": -44.507625579833984, "global_step": 292811, "epoch": 2419} {"train_loss": -44.64470291137695, "global_step": 292812, "epoch": 2419} {"train_loss": -43.40418243408203, "global_step": 292813, "epoch": 2419} {"train_loss": -44.25099563598633, "global_step": 292814, "epoch": 2419} {"train_loss": -43.93586349487305, "global_step": 292815, "epoch": 2419} {"train_loss": -44.28462219238281, "global_step": 292816, "epoch": 2419} {"train_loss": -43.758541107177734, "global_step": 292817, "epoch": 2419} {"train_loss": -44.429744720458984, "global_step": 292818, "epoch": 2419} {"train_loss": -43.69743999764939, "global_step": 292819, "epoch": 2419, "val_loss": 2521119.75} {"train_loss": -43.92376708984375, "global_step": 292820, "epoch": 2420} {"train_loss": -43.58289337158203, "global_step": 292821, "epoch": 2420} {"train_loss": -44.530426025390625, "global_step": 292822, "epoch": 2420} {"train_loss": -42.4980583190918, "global_step": 292823, "epoch": 2420} {"train_loss": -42.271644592285156, "global_step": 292824, "epoch": 2420} {"train_loss": -44.47636795043945, "global_step": 292825, "epoch": 2420} {"train_loss": -44.06864547729492, "global_step": 292826, "epoch": 2420} {"train_loss": -42.437904357910156, "global_step": 292827, "epoch": 2420} {"train_loss": -43.79046630859375, "global_step": 292828, "epoch": 2420} {"train_loss": -43.770538330078125, "global_step": 292829, "epoch": 2420} {"train_loss": -43.486385345458984, "global_step": 292830, "epoch": 2420} {"train_loss": -44.080772399902344, "global_step": 292831, "epoch": 2420} {"train_loss": -43.61015701293945, "global_step": 292832, "epoch": 2420} {"train_loss": -43.693992614746094, "global_step": 292833, "epoch": 2420} {"train_loss": -43.87999725341797, "global_step": 292834, "epoch": 2420} {"train_loss": -43.65179443359375, "global_step": 292835, "epoch": 2420} {"train_loss": -44.64799880981445, "global_step": 292836, "epoch": 2420} {"train_loss": -44.19805908203125, "global_step": 292837, "epoch": 2420} {"train_loss": -43.475425720214844, "global_step": 292838, "epoch": 2420} {"train_loss": -43.795772552490234, "global_step": 292839, "epoch": 2420} {"train_loss": -44.16033935546875, "global_step": 292840, "epoch": 2420} {"train_loss": -43.05439376831055, "global_step": 292841, "epoch": 2420} {"train_loss": -43.57659912109375, "global_step": 292842, "epoch": 2420} {"train_loss": -43.37813186645508, "global_step": 292843, "epoch": 2420} {"train_loss": -42.74898147583008, "global_step": 292844, "epoch": 2420} {"train_loss": -42.4387321472168, "global_step": 292845, "epoch": 2420} {"train_loss": -43.64374542236328, "global_step": 292846, "epoch": 2420} {"train_loss": -43.476531982421875, "global_step": 292847, "epoch": 2420} {"train_loss": -43.36288070678711, "global_step": 292848, "epoch": 2420} {"train_loss": -43.71627426147461, "global_step": 292849, "epoch": 2420} {"train_loss": -44.160648345947266, "global_step": 292850, "epoch": 2420} {"train_loss": -42.76906204223633, "global_step": 292851, "epoch": 2420} {"train_loss": -43.86446762084961, "global_step": 292852, "epoch": 2420} {"train_loss": -42.529212951660156, "global_step": 292853, "epoch": 2420} {"train_loss": -42.1524772644043, "global_step": 292854, "epoch": 2420} {"train_loss": -42.02737045288086, "global_step": 292855, "epoch": 2420} {"train_loss": -41.469425201416016, "global_step": 292856, "epoch": 2420} {"train_loss": -40.617794036865234, "global_step": 292857, "epoch": 2420} {"train_loss": -41.74946594238281, "global_step": 292858, "epoch": 2420} {"train_loss": -41.3947868347168, "global_step": 292859, "epoch": 2420} {"train_loss": -43.178955078125, "global_step": 292860, "epoch": 2420} {"train_loss": -42.488670349121094, "global_step": 292861, "epoch": 2420} {"train_loss": -43.74502182006836, "global_step": 292862, "epoch": 2420} {"train_loss": -41.38090133666992, "global_step": 292863, "epoch": 2420} {"train_loss": -42.92316818237305, "global_step": 292864, "epoch": 2420} {"train_loss": -42.271488189697266, "global_step": 292865, "epoch": 2420} {"train_loss": -43.719505310058594, "global_step": 292866, "epoch": 2420} {"train_loss": -43.217376708984375, "global_step": 292867, "epoch": 2420} {"train_loss": -40.71271896362305, "global_step": 292868, "epoch": 2420} {"train_loss": -41.713069915771484, "global_step": 292869, "epoch": 2420} {"train_loss": -42.33506393432617, "global_step": 292870, "epoch": 2420} {"train_loss": -42.470462799072266, "global_step": 292871, "epoch": 2420} {"train_loss": -40.69247055053711, "global_step": 292872, "epoch": 2420} {"train_loss": -43.00696563720703, "global_step": 292873, "epoch": 2420} {"train_loss": -42.30854415893555, "global_step": 292874, "epoch": 2420} {"train_loss": -42.71427917480469, "global_step": 292875, "epoch": 2420} {"train_loss": -43.763179779052734, "global_step": 292876, "epoch": 2420} {"train_loss": -41.9915657043457, "global_step": 292877, "epoch": 2420} {"train_loss": -43.74946212768555, "global_step": 292878, "epoch": 2420} {"train_loss": -42.86663818359375, "global_step": 292879, "epoch": 2420} {"train_loss": -43.24034118652344, "global_step": 292880, "epoch": 2420} {"train_loss": -42.70186996459961, "global_step": 292881, "epoch": 2420} {"train_loss": -43.20992660522461, "global_step": 292882, "epoch": 2420} {"train_loss": -44.052886962890625, "global_step": 292883, "epoch": 2420} {"train_loss": -44.0999641418457, "global_step": 292884, "epoch": 2420} {"train_loss": -43.86093521118164, "global_step": 292885, "epoch": 2420} {"train_loss": -40.451026916503906, "global_step": 292886, "epoch": 2420} {"train_loss": -44.045387268066406, "global_step": 292887, "epoch": 2420} {"train_loss": -43.71259689331055, "global_step": 292888, "epoch": 2420} {"train_loss": -44.198394775390625, "global_step": 292889, "epoch": 2420} {"train_loss": -43.50421142578125, "global_step": 292890, "epoch": 2420} {"train_loss": -44.38246536254883, "global_step": 292891, "epoch": 2420} {"train_loss": -43.047306060791016, "global_step": 292892, "epoch": 2420} {"train_loss": -43.8758659362793, "global_step": 292893, "epoch": 2420} {"train_loss": -44.14937210083008, "global_step": 292894, "epoch": 2420} {"train_loss": -43.24174118041992, "global_step": 292895, "epoch": 2420} {"train_loss": -43.808284759521484, "global_step": 292896, "epoch": 2420} {"train_loss": -44.14360809326172, "global_step": 292897, "epoch": 2420} {"train_loss": -43.65909194946289, "global_step": 292898, "epoch": 2420} {"train_loss": -44.002864837646484, "global_step": 292899, "epoch": 2420} {"train_loss": -43.860984802246094, "global_step": 292900, "epoch": 2420} {"train_loss": -43.233551025390625, "global_step": 292901, "epoch": 2420} {"train_loss": -43.841827392578125, "global_step": 292902, "epoch": 2420} {"train_loss": -44.12499237060547, "global_step": 292903, "epoch": 2420} {"train_loss": -43.266841888427734, "global_step": 292904, "epoch": 2420} {"train_loss": -44.00086212158203, "global_step": 292905, "epoch": 2420} {"train_loss": -44.23933029174805, "global_step": 292906, "epoch": 2420} {"train_loss": -43.86137771606445, "global_step": 292907, "epoch": 2420} {"train_loss": -43.2215690612793, "global_step": 292908, "epoch": 2420} {"train_loss": -44.5012321472168, "global_step": 292909, "epoch": 2420} {"train_loss": -44.36115646362305, "global_step": 292910, "epoch": 2420} {"train_loss": -43.37067794799805, "global_step": 292911, "epoch": 2420} {"train_loss": -41.83463668823242, "global_step": 292912, "epoch": 2420} {"train_loss": -42.89895248413086, "global_step": 292913, "epoch": 2420} {"train_loss": -43.383541107177734, "global_step": 292914, "epoch": 2420} {"train_loss": -42.80573654174805, "global_step": 292915, "epoch": 2420} {"train_loss": -41.88367462158203, "global_step": 292916, "epoch": 2420} {"train_loss": -44.07381057739258, "global_step": 292917, "epoch": 2420} {"train_loss": -43.38011169433594, "global_step": 292918, "epoch": 2420} {"train_loss": -42.99589157104492, "global_step": 292919, "epoch": 2420} {"train_loss": -43.225425720214844, "global_step": 292920, "epoch": 2420} {"train_loss": -43.76362228393555, "global_step": 292921, "epoch": 2420} {"train_loss": -43.19051742553711, "global_step": 292922, "epoch": 2420} {"train_loss": -43.2746696472168, "global_step": 292923, "epoch": 2420} {"train_loss": -43.77539825439453, "global_step": 292924, "epoch": 2420} {"train_loss": -43.03599548339844, "global_step": 292925, "epoch": 2420} {"train_loss": -42.79297637939453, "global_step": 292926, "epoch": 2420} {"train_loss": -43.27875518798828, "global_step": 292927, "epoch": 2420} {"train_loss": -42.89202880859375, "global_step": 292928, "epoch": 2420} {"train_loss": -42.644447326660156, "global_step": 292929, "epoch": 2420} {"train_loss": -42.167510986328125, "global_step": 292930, "epoch": 2420} {"train_loss": -43.773433685302734, "global_step": 292931, "epoch": 2420} {"train_loss": -43.50651168823242, "global_step": 292932, "epoch": 2420} {"train_loss": -42.55672073364258, "global_step": 292933, "epoch": 2420} {"train_loss": -43.01290512084961, "global_step": 292934, "epoch": 2420} {"train_loss": -43.581146240234375, "global_step": 292935, "epoch": 2420} {"train_loss": -42.348060607910156, "global_step": 292936, "epoch": 2420} {"train_loss": -43.52997970581055, "global_step": 292937, "epoch": 2420} {"train_loss": -43.147705078125, "global_step": 292938, "epoch": 2420} {"train_loss": -43.20558547973633, "global_step": 292939, "epoch": 2420} {"train_loss": -43.20857500438848, "global_step": 292940, "epoch": 2420, "val_loss": 2544034.75} {"train_loss": -43.47640609741211, "global_step": 292941, "epoch": 2421} {"train_loss": -42.60294723510742, "global_step": 292942, "epoch": 2421} {"train_loss": -42.606075286865234, "global_step": 292943, "epoch": 2421} {"train_loss": -43.61068344116211, "global_step": 292944, "epoch": 2421} {"train_loss": -43.50710678100586, "global_step": 292945, "epoch": 2421} {"train_loss": -42.60441589355469, "global_step": 292946, "epoch": 2421} {"train_loss": -42.95016098022461, "global_step": 292947, "epoch": 2421} {"train_loss": -43.87398910522461, "global_step": 292948, "epoch": 2421} {"train_loss": -42.26123046875, "global_step": 292949, "epoch": 2421} {"train_loss": -43.169593811035156, "global_step": 292950, "epoch": 2421} {"train_loss": -42.23657989501953, "global_step": 292951, "epoch": 2421} {"train_loss": -41.93368148803711, "global_step": 292952, "epoch": 2421} {"train_loss": -43.28297805786133, "global_step": 292953, "epoch": 2421} {"train_loss": -41.384986877441406, "global_step": 292954, "epoch": 2421} {"train_loss": -42.11470413208008, "global_step": 292955, "epoch": 2421} {"train_loss": -43.25476837158203, "global_step": 292956, "epoch": 2421} {"train_loss": -42.47831726074219, "global_step": 292957, "epoch": 2421} {"train_loss": -43.097015380859375, "global_step": 292958, "epoch": 2421} {"train_loss": -43.214271545410156, "global_step": 292959, "epoch": 2421} {"train_loss": -41.910194396972656, "global_step": 292960, "epoch": 2421} {"train_loss": -43.14873504638672, "global_step": 292961, "epoch": 2421} {"train_loss": -42.8663215637207, "global_step": 292962, "epoch": 2421} {"train_loss": -42.64166259765625, "global_step": 292963, "epoch": 2421} {"train_loss": -42.792701721191406, "global_step": 292964, "epoch": 2421} {"train_loss": -41.69035720825195, "global_step": 292965, "epoch": 2421} {"train_loss": -42.7177734375, "global_step": 292966, "epoch": 2421} {"train_loss": -42.934051513671875, "global_step": 292967, "epoch": 2421} {"train_loss": -43.249244689941406, "global_step": 292968, "epoch": 2421} {"train_loss": -42.960018157958984, "global_step": 292969, "epoch": 2421} {"train_loss": -43.81689453125, "global_step": 292970, "epoch": 2421} {"train_loss": -42.673336029052734, "global_step": 292971, "epoch": 2421} {"train_loss": -43.25172424316406, "global_step": 292972, "epoch": 2421} {"train_loss": -43.32102584838867, "global_step": 292973, "epoch": 2421} {"train_loss": -43.3624382019043, "global_step": 292974, "epoch": 2421} {"train_loss": -43.84442901611328, "global_step": 292975, "epoch": 2421} {"train_loss": -43.255672454833984, "global_step": 292976, "epoch": 2421} {"train_loss": -43.290462493896484, "global_step": 292977, "epoch": 2421} {"train_loss": -44.42085266113281, "global_step": 292978, "epoch": 2421} {"train_loss": -43.469905853271484, "global_step": 292979, "epoch": 2421} {"train_loss": -44.001617431640625, "global_step": 292980, "epoch": 2421} {"train_loss": -44.0942497253418, "global_step": 292981, "epoch": 2421} {"train_loss": -43.63043975830078, "global_step": 292982, "epoch": 2421} {"train_loss": -44.55060577392578, "global_step": 292983, "epoch": 2421} {"train_loss": -43.345558166503906, "global_step": 292984, "epoch": 2421} {"train_loss": -44.27775955200195, "global_step": 292985, "epoch": 2421} {"train_loss": -43.52631378173828, "global_step": 292986, "epoch": 2421} {"train_loss": -43.77565383911133, "global_step": 292987, "epoch": 2421} {"train_loss": -43.45259475708008, "global_step": 292988, "epoch": 2421} {"train_loss": -43.786434173583984, "global_step": 292989, "epoch": 2421} {"train_loss": -43.42317581176758, "global_step": 292990, "epoch": 2421} {"train_loss": -42.85688400268555, "global_step": 292991, "epoch": 2421} {"train_loss": -43.8403434753418, "global_step": 292992, "epoch": 2421} {"train_loss": -44.20707321166992, "global_step": 292993, "epoch": 2421} {"train_loss": -44.201412200927734, "global_step": 292994, "epoch": 2421} {"train_loss": -43.5167121887207, "global_step": 292995, "epoch": 2421} {"train_loss": -43.353450775146484, "global_step": 292996, "epoch": 2421} {"train_loss": -43.59078598022461, "global_step": 292997, "epoch": 2421} {"train_loss": -43.72172927856445, "global_step": 292998, "epoch": 2421} {"train_loss": -44.67844772338867, "global_step": 292999, "epoch": 2421} {"train_loss": -43.305843353271484, "global_step": 293000, "epoch": 2421} {"train_loss": -42.72206497192383, "global_step": 293001, "epoch": 2421} {"train_loss": -43.557350158691406, "global_step": 293002, "epoch": 2421} {"train_loss": -43.98031234741211, "global_step": 293003, "epoch": 2421} {"train_loss": -43.2745246887207, "global_step": 293004, "epoch": 2421} {"train_loss": -43.491363525390625, "global_step": 293005, "epoch": 2421} {"train_loss": -43.48579025268555, "global_step": 293006, "epoch": 2421} {"train_loss": -44.176631927490234, "global_step": 293007, "epoch": 2421} {"train_loss": -43.473731994628906, "global_step": 293008, "epoch": 2421} {"train_loss": -43.343772888183594, "global_step": 293009, "epoch": 2421} {"train_loss": -42.7546501159668, "global_step": 293010, "epoch": 2421} {"train_loss": -41.94109344482422, "global_step": 293011, "epoch": 2421} {"train_loss": -42.51728439331055, "global_step": 293012, "epoch": 2421} {"train_loss": -43.876007080078125, "global_step": 293013, "epoch": 2421} {"train_loss": -42.569740295410156, "global_step": 293014, "epoch": 2421} {"train_loss": -43.24897384643555, "global_step": 293015, "epoch": 2421} {"train_loss": -43.18075942993164, "global_step": 293016, "epoch": 2421} {"train_loss": -44.16579055786133, "global_step": 293017, "epoch": 2421} {"train_loss": -43.202880859375, "global_step": 293018, "epoch": 2421} {"train_loss": -43.3735237121582, "global_step": 293019, "epoch": 2421} {"train_loss": -44.00613021850586, "global_step": 293020, "epoch": 2421} {"train_loss": -43.88370895385742, "global_step": 293021, "epoch": 2421} {"train_loss": -42.614501953125, "global_step": 293022, "epoch": 2421} {"train_loss": -44.36965560913086, "global_step": 293023, "epoch": 2421} {"train_loss": -43.10749053955078, "global_step": 293024, "epoch": 2421} {"train_loss": -43.321468353271484, "global_step": 293025, "epoch": 2421} {"train_loss": -42.58063888549805, "global_step": 293026, "epoch": 2421} {"train_loss": -43.375423431396484, "global_step": 293027, "epoch": 2421} {"train_loss": -44.278865814208984, "global_step": 293028, "epoch": 2421} {"train_loss": -43.700679779052734, "global_step": 293029, "epoch": 2421} {"train_loss": -43.024959564208984, "global_step": 293030, "epoch": 2421} {"train_loss": -43.58055877685547, "global_step": 293031, "epoch": 2421} {"train_loss": -43.156105041503906, "global_step": 293032, "epoch": 2421} {"train_loss": -43.7567253112793, "global_step": 293033, "epoch": 2421} {"train_loss": -43.935604095458984, "global_step": 293034, "epoch": 2421} {"train_loss": -43.18745803833008, "global_step": 293035, "epoch": 2421} {"train_loss": -42.29219436645508, "global_step": 293036, "epoch": 2421} {"train_loss": -42.99304962158203, "global_step": 293037, "epoch": 2421} {"train_loss": -44.422035217285156, "global_step": 293038, "epoch": 2421} {"train_loss": -43.5915412902832, "global_step": 293039, "epoch": 2421} {"train_loss": -43.66315841674805, "global_step": 293040, "epoch": 2421} {"train_loss": -43.95206069946289, "global_step": 293041, "epoch": 2421} {"train_loss": -43.93918228149414, "global_step": 293042, "epoch": 2421} {"train_loss": -43.19009017944336, "global_step": 293043, "epoch": 2421} {"train_loss": -43.751251220703125, "global_step": 293044, "epoch": 2421} {"train_loss": -44.01885986328125, "global_step": 293045, "epoch": 2421} {"train_loss": -44.38302993774414, "global_step": 293046, "epoch": 2421} {"train_loss": -44.37139892578125, "global_step": 293047, "epoch": 2421} {"train_loss": -44.04087448120117, "global_step": 293048, "epoch": 2421} {"train_loss": -44.172603607177734, "global_step": 293049, "epoch": 2421} {"train_loss": -44.2729377746582, "global_step": 293050, "epoch": 2421} {"train_loss": -43.91438674926758, "global_step": 293051, "epoch": 2421} {"train_loss": -44.46601486206055, "global_step": 293052, "epoch": 2421} {"train_loss": -45.05257034301758, "global_step": 293053, "epoch": 2421} {"train_loss": -44.30879592895508, "global_step": 293054, "epoch": 2421} {"train_loss": -43.85183334350586, "global_step": 293055, "epoch": 2421} {"train_loss": -44.35470962524414, "global_step": 293056, "epoch": 2421} {"train_loss": -44.5560417175293, "global_step": 293057, "epoch": 2421} {"train_loss": -44.11196517944336, "global_step": 293058, "epoch": 2421} {"train_loss": -43.88264846801758, "global_step": 293059, "epoch": 2421} {"train_loss": -43.129268646240234, "global_step": 293060, "epoch": 2421} {"train_loss": -43.425449434390735, "global_step": 293061, "epoch": 2421, "val_loss": 2553151.0} {"train_loss": -44.67346954345703, "global_step": 293062, "epoch": 2422} {"train_loss": -42.5518684387207, "global_step": 293063, "epoch": 2422} {"train_loss": -42.67424011230469, "global_step": 293064, "epoch": 2422} {"train_loss": -44.06318664550781, "global_step": 293065, "epoch": 2422} {"train_loss": -44.28607177734375, "global_step": 293066, "epoch": 2422} {"train_loss": -43.4432258605957, "global_step": 293067, "epoch": 2422} {"train_loss": -43.837806701660156, "global_step": 293068, "epoch": 2422} {"train_loss": -43.96916961669922, "global_step": 293069, "epoch": 2422} {"train_loss": -44.110008239746094, "global_step": 293070, "epoch": 2422} {"train_loss": -43.23978042602539, "global_step": 293071, "epoch": 2422} {"train_loss": -44.145870208740234, "global_step": 293072, "epoch": 2422} {"train_loss": -44.26930618286133, "global_step": 293073, "epoch": 2422} {"train_loss": -43.85017013549805, "global_step": 293074, "epoch": 2422} {"train_loss": -43.85075378417969, "global_step": 293075, "epoch": 2422} {"train_loss": -44.65267562866211, "global_step": 293076, "epoch": 2422} {"train_loss": -42.37454605102539, "global_step": 293077, "epoch": 2422} {"train_loss": -44.37507247924805, "global_step": 293078, "epoch": 2422} {"train_loss": -44.09226608276367, "global_step": 293079, "epoch": 2422} {"train_loss": -43.36973190307617, "global_step": 293080, "epoch": 2422} {"train_loss": -43.322200775146484, "global_step": 293081, "epoch": 2422} {"train_loss": -44.47501754760742, "global_step": 293082, "epoch": 2422} {"train_loss": -42.36210632324219, "global_step": 293083, "epoch": 2422} {"train_loss": -44.50411605834961, "global_step": 293084, "epoch": 2422} {"train_loss": -43.14167785644531, "global_step": 293085, "epoch": 2422} {"train_loss": -43.00910568237305, "global_step": 293086, "epoch": 2422} {"train_loss": -43.3845329284668, "global_step": 293087, "epoch": 2422} {"train_loss": -44.679107666015625, "global_step": 293088, "epoch": 2422} {"train_loss": -42.967281341552734, "global_step": 293089, "epoch": 2422} {"train_loss": -44.2751579284668, "global_step": 293090, "epoch": 2422} {"train_loss": -43.84177780151367, "global_step": 293091, "epoch": 2422} {"train_loss": -43.87455368041992, "global_step": 293092, "epoch": 2422} {"train_loss": -44.3473014831543, "global_step": 293093, "epoch": 2422} {"train_loss": -44.13777542114258, "global_step": 293094, "epoch": 2422} {"train_loss": -43.970008850097656, "global_step": 293095, "epoch": 2422} {"train_loss": -43.69175338745117, "global_step": 293096, "epoch": 2422} {"train_loss": -43.132957458496094, "global_step": 293097, "epoch": 2422} {"train_loss": -43.5773811340332, "global_step": 293098, "epoch": 2422} {"train_loss": -43.87763214111328, "global_step": 293099, "epoch": 2422} {"train_loss": -43.110382080078125, "global_step": 293100, "epoch": 2422} {"train_loss": -41.89503860473633, "global_step": 293101, "epoch": 2422} {"train_loss": -43.66190719604492, "global_step": 293102, "epoch": 2422} {"train_loss": -43.70292282104492, "global_step": 293103, "epoch": 2422} {"train_loss": -41.854427337646484, "global_step": 293104, "epoch": 2422} {"train_loss": -43.550838470458984, "global_step": 293105, "epoch": 2422} {"train_loss": -43.65018844604492, "global_step": 293106, "epoch": 2422} {"train_loss": -43.3907356262207, "global_step": 293107, "epoch": 2422} {"train_loss": -43.2706413269043, "global_step": 293108, "epoch": 2422} {"train_loss": -42.127132415771484, "global_step": 293109, "epoch": 2422} {"train_loss": -44.3173713684082, "global_step": 293110, "epoch": 2422} {"train_loss": -42.359153747558594, "global_step": 293111, "epoch": 2422} {"train_loss": -43.220375061035156, "global_step": 293112, "epoch": 2422} {"train_loss": -43.213417053222656, "global_step": 293113, "epoch": 2422} {"train_loss": -43.65909957885742, "global_step": 293114, "epoch": 2422} {"train_loss": -43.441184997558594, "global_step": 293115, "epoch": 2422} {"train_loss": -42.519561767578125, "global_step": 293116, "epoch": 2422} {"train_loss": -44.16032409667969, "global_step": 293117, "epoch": 2422} {"train_loss": -43.30900573730469, "global_step": 293118, "epoch": 2422} {"train_loss": -43.219459533691406, "global_step": 293119, "epoch": 2422} {"train_loss": -43.58018112182617, "global_step": 293120, "epoch": 2422} {"train_loss": -44.02023696899414, "global_step": 293121, "epoch": 2422} {"train_loss": -43.86589050292969, "global_step": 293122, "epoch": 2422} {"train_loss": -43.8447151184082, "global_step": 293123, "epoch": 2422} {"train_loss": -44.482662200927734, "global_step": 293124, "epoch": 2422} {"train_loss": -43.19143295288086, "global_step": 293125, "epoch": 2422} {"train_loss": -43.90412139892578, "global_step": 293126, "epoch": 2422} {"train_loss": -43.2142448425293, "global_step": 293127, "epoch": 2422} {"train_loss": -44.27153396606445, "global_step": 293128, "epoch": 2422} {"train_loss": -42.85801315307617, "global_step": 293129, "epoch": 2422} {"train_loss": -43.620887756347656, "global_step": 293130, "epoch": 2422} {"train_loss": -43.590476989746094, "global_step": 293131, "epoch": 2422} {"train_loss": -44.324920654296875, "global_step": 293132, "epoch": 2422} {"train_loss": -43.147621154785156, "global_step": 293133, "epoch": 2422} {"train_loss": -44.97279739379883, "global_step": 293134, "epoch": 2422} {"train_loss": -43.801021575927734, "global_step": 293135, "epoch": 2422} {"train_loss": -44.31582260131836, "global_step": 293136, "epoch": 2422} {"train_loss": -43.525943756103516, "global_step": 293137, "epoch": 2422} {"train_loss": -44.142791748046875, "global_step": 293138, "epoch": 2422} {"train_loss": -44.1286735534668, "global_step": 293139, "epoch": 2422} {"train_loss": -43.86770248413086, "global_step": 293140, "epoch": 2422} {"train_loss": -43.6272087097168, "global_step": 293141, "epoch": 2422} {"train_loss": -44.015472412109375, "global_step": 293142, "epoch": 2422} {"train_loss": -44.38729476928711, "global_step": 293143, "epoch": 2422} {"train_loss": -44.32506561279297, "global_step": 293144, "epoch": 2422} {"train_loss": -43.50263214111328, "global_step": 293145, "epoch": 2422} {"train_loss": -44.599674224853516, "global_step": 293146, "epoch": 2422} {"train_loss": -44.290313720703125, "global_step": 293147, "epoch": 2422} {"train_loss": -43.79736328125, "global_step": 293148, "epoch": 2422} {"train_loss": -43.91149139404297, "global_step": 293149, "epoch": 2422} {"train_loss": -43.951595306396484, "global_step": 293150, "epoch": 2422} {"train_loss": -43.44507598876953, "global_step": 293151, "epoch": 2422} {"train_loss": -43.811378479003906, "global_step": 293152, "epoch": 2422} {"train_loss": -43.02616500854492, "global_step": 293153, "epoch": 2422} {"train_loss": -43.01819610595703, "global_step": 293154, "epoch": 2422} {"train_loss": -42.63285446166992, "global_step": 293155, "epoch": 2422} {"train_loss": -43.30085372924805, "global_step": 293156, "epoch": 2422} {"train_loss": -43.81980514526367, "global_step": 293157, "epoch": 2422} {"train_loss": -43.21220397949219, "global_step": 293158, "epoch": 2422} {"train_loss": -42.3941764831543, "global_step": 293159, "epoch": 2422} {"train_loss": -42.996009826660156, "global_step": 293160, "epoch": 2422} {"train_loss": -42.95359802246094, "global_step": 293161, "epoch": 2422} {"train_loss": -42.39593505859375, "global_step": 293162, "epoch": 2422} {"train_loss": -42.91444778442383, "global_step": 293163, "epoch": 2422} {"train_loss": -33.40024185180664, "global_step": 293164, "epoch": 2422} {"train_loss": -39.785213470458984, "global_step": 293165, "epoch": 2422} {"train_loss": -42.1981201171875, "global_step": 293166, "epoch": 2422} {"train_loss": -42.257354736328125, "global_step": 293167, "epoch": 2422} {"train_loss": -41.104671478271484, "global_step": 293168, "epoch": 2422} {"train_loss": -40.14249801635742, "global_step": 293169, "epoch": 2422} {"train_loss": -37.75508117675781, "global_step": 293170, "epoch": 2422} {"train_loss": -41.698299407958984, "global_step": 293171, "epoch": 2422} {"train_loss": -41.022335052490234, "global_step": 293172, "epoch": 2422} {"train_loss": -38.48947525024414, "global_step": 293173, "epoch": 2422} {"train_loss": -40.51650619506836, "global_step": 293174, "epoch": 2422} {"train_loss": -37.35022735595703, "global_step": 293175, "epoch": 2422} {"train_loss": -40.66703414916992, "global_step": 293176, "epoch": 2422} {"train_loss": -39.291744232177734, "global_step": 293177, "epoch": 2422} {"train_loss": -39.55678939819336, "global_step": 293178, "epoch": 2422} {"train_loss": -39.05753707885742, "global_step": 293179, "epoch": 2422} {"train_loss": -40.764808654785156, "global_step": 293180, "epoch": 2422} {"train_loss": -39.36572265625, "global_step": 293181, "epoch": 2422} {"train_loss": -42.996893606895256, "global_step": 293182, "epoch": 2422, "val_loss": 2612846.0} {"train_loss": -40.58742904663086, "global_step": 293183, "epoch": 2423} {"train_loss": -41.393646240234375, "global_step": 293184, "epoch": 2423} {"train_loss": -38.6688346862793, "global_step": 293185, "epoch": 2423} {"train_loss": -38.48348617553711, "global_step": 293186, "epoch": 2423} {"train_loss": -39.67981719970703, "global_step": 293187, "epoch": 2423} {"train_loss": -42.01754379272461, "global_step": 293188, "epoch": 2423} {"train_loss": -40.53010559082031, "global_step": 293189, "epoch": 2423} {"train_loss": -37.668190002441406, "global_step": 293190, "epoch": 2423} {"train_loss": -41.696903228759766, "global_step": 293191, "epoch": 2423} {"train_loss": -40.33115768432617, "global_step": 293192, "epoch": 2423} {"train_loss": -41.347740173339844, "global_step": 293193, "epoch": 2423} {"train_loss": -40.7051887512207, "global_step": 293194, "epoch": 2423} {"train_loss": -41.99441146850586, "global_step": 293195, "epoch": 2423} {"train_loss": -41.42808151245117, "global_step": 293196, "epoch": 2423} {"train_loss": -40.759090423583984, "global_step": 293197, "epoch": 2423} {"train_loss": -40.8382453918457, "global_step": 293198, "epoch": 2423} {"train_loss": -39.39524459838867, "global_step": 293199, "epoch": 2423} {"train_loss": -41.45017623901367, "global_step": 293200, "epoch": 2423} {"train_loss": -40.89228439331055, "global_step": 293201, "epoch": 2423} {"train_loss": -40.81761932373047, "global_step": 293202, "epoch": 2423} {"train_loss": -39.71235656738281, "global_step": 293203, "epoch": 2423} {"train_loss": -41.93459701538086, "global_step": 293204, "epoch": 2423} {"train_loss": -42.34421920776367, "global_step": 293205, "epoch": 2423} {"train_loss": -42.161293029785156, "global_step": 293206, "epoch": 2423} {"train_loss": -42.1912841796875, "global_step": 293207, "epoch": 2423} {"train_loss": -41.93762969970703, "global_step": 293208, "epoch": 2423} {"train_loss": -42.01813888549805, "global_step": 293209, "epoch": 2423} {"train_loss": -41.93010330200195, "global_step": 293210, "epoch": 2423} {"train_loss": -42.36176300048828, "global_step": 293211, "epoch": 2423} {"train_loss": -42.326873779296875, "global_step": 293212, "epoch": 2423} {"train_loss": -42.42153549194336, "global_step": 293213, "epoch": 2423} {"train_loss": -43.02474594116211, "global_step": 293214, "epoch": 2423} {"train_loss": -42.39820098876953, "global_step": 293215, "epoch": 2423} {"train_loss": -42.9721794128418, "global_step": 293216, "epoch": 2423} {"train_loss": -41.63254928588867, "global_step": 293217, "epoch": 2423} {"train_loss": -42.51100158691406, "global_step": 293218, "epoch": 2423} {"train_loss": -42.803436279296875, "global_step": 293219, "epoch": 2423} {"train_loss": -43.21198654174805, "global_step": 293220, "epoch": 2423} {"train_loss": -42.97517013549805, "global_step": 293221, "epoch": 2423} {"train_loss": -43.315006256103516, "global_step": 293222, "epoch": 2423} {"train_loss": -43.160343170166016, "global_step": 293223, "epoch": 2423} {"train_loss": -42.696929931640625, "global_step": 293224, "epoch": 2423} {"train_loss": -43.27449417114258, "global_step": 293225, "epoch": 2423} {"train_loss": -43.47519302368164, "global_step": 293226, "epoch": 2423} {"train_loss": -42.66971206665039, "global_step": 293227, "epoch": 2423} {"train_loss": -42.20051956176758, "global_step": 293228, "epoch": 2423} {"train_loss": -43.279632568359375, "global_step": 293229, "epoch": 2423} {"train_loss": -42.8960075378418, "global_step": 293230, "epoch": 2423} {"train_loss": -42.86579513549805, "global_step": 293231, "epoch": 2423} {"train_loss": -43.33087921142578, "global_step": 293232, "epoch": 2423} {"train_loss": -42.85915756225586, "global_step": 293233, "epoch": 2423} {"train_loss": -42.93135452270508, "global_step": 293234, "epoch": 2423} {"train_loss": -42.58382797241211, "global_step": 293235, "epoch": 2423} {"train_loss": -43.74076843261719, "global_step": 293236, "epoch": 2423} {"train_loss": -41.958065032958984, "global_step": 293237, "epoch": 2423} {"train_loss": -43.547523498535156, "global_step": 293238, "epoch": 2423} {"train_loss": -43.046382904052734, "global_step": 293239, "epoch": 2423} {"train_loss": -43.54221725463867, "global_step": 293240, "epoch": 2423} {"train_loss": -43.609161376953125, "global_step": 293241, "epoch": 2423} {"train_loss": -42.639381408691406, "global_step": 293242, "epoch": 2423} {"train_loss": -44.038814544677734, "global_step": 293243, "epoch": 2423} {"train_loss": -43.657161712646484, "global_step": 293244, "epoch": 2423} {"train_loss": -42.84396743774414, "global_step": 293245, "epoch": 2423} {"train_loss": -43.967342376708984, "global_step": 293246, "epoch": 2423} {"train_loss": -43.268898010253906, "global_step": 293247, "epoch": 2423} {"train_loss": -43.822967529296875, "global_step": 293248, "epoch": 2423} {"train_loss": -44.2929801940918, "global_step": 293249, "epoch": 2423} {"train_loss": -43.000328063964844, "global_step": 293250, "epoch": 2423} {"train_loss": -43.34297561645508, "global_step": 293251, "epoch": 2423} {"train_loss": -43.963134765625, "global_step": 293252, "epoch": 2423} {"train_loss": -43.81312942504883, "global_step": 293253, "epoch": 2423} {"train_loss": -43.773475646972656, "global_step": 293254, "epoch": 2423} {"train_loss": -43.85758590698242, "global_step": 293255, "epoch": 2423} {"train_loss": -44.04959487915039, "global_step": 293256, "epoch": 2423} {"train_loss": -44.42514419555664, "global_step": 293257, "epoch": 2423} {"train_loss": -44.18885803222656, "global_step": 293258, "epoch": 2423} {"train_loss": -44.2373046875, "global_step": 293259, "epoch": 2423} {"train_loss": -44.65993118286133, "global_step": 293260, "epoch": 2423} {"train_loss": -44.295204162597656, "global_step": 293261, "epoch": 2423} {"train_loss": -43.978172302246094, "global_step": 293262, "epoch": 2423} {"train_loss": -44.511226654052734, "global_step": 293263, "epoch": 2423} {"train_loss": -45.04862594604492, "global_step": 293264, "epoch": 2423} {"train_loss": -44.16517639160156, "global_step": 293265, "epoch": 2423} {"train_loss": -44.643287658691406, "global_step": 293266, "epoch": 2423} {"train_loss": -43.828834533691406, "global_step": 293267, "epoch": 2423} {"train_loss": -44.4450798034668, "global_step": 293268, "epoch": 2423} {"train_loss": -44.16240310668945, "global_step": 293269, "epoch": 2423} {"train_loss": -44.634803771972656, "global_step": 293270, "epoch": 2423} {"train_loss": -43.77834701538086, "global_step": 293271, "epoch": 2423} {"train_loss": -43.63570785522461, "global_step": 293272, "epoch": 2423} {"train_loss": -43.52362060546875, "global_step": 293273, "epoch": 2423} {"train_loss": -44.14661407470703, "global_step": 293274, "epoch": 2423} {"train_loss": -45.05964279174805, "global_step": 293275, "epoch": 2423} {"train_loss": -44.18059158325195, "global_step": 293276, "epoch": 2423} {"train_loss": -43.3435173034668, "global_step": 293277, "epoch": 2423} {"train_loss": -43.528717041015625, "global_step": 293278, "epoch": 2423} {"train_loss": -44.26443099975586, "global_step": 293279, "epoch": 2423} {"train_loss": -44.84493637084961, "global_step": 293280, "epoch": 2423} {"train_loss": -44.362239837646484, "global_step": 293281, "epoch": 2423} {"train_loss": -43.69839096069336, "global_step": 293282, "epoch": 2423} {"train_loss": -44.06405258178711, "global_step": 293283, "epoch": 2423} {"train_loss": -41.634376525878906, "global_step": 293284, "epoch": 2423} {"train_loss": -39.795475006103516, "global_step": 293285, "epoch": 2423} {"train_loss": -43.10719299316406, "global_step": 293286, "epoch": 2423} {"train_loss": -44.046142578125, "global_step": 293287, "epoch": 2423} {"train_loss": -44.0636100769043, "global_step": 293288, "epoch": 2423} {"train_loss": -44.59016418457031, "global_step": 293289, "epoch": 2423} {"train_loss": -43.87229537963867, "global_step": 293290, "epoch": 2423} {"train_loss": -42.701499938964844, "global_step": 293291, "epoch": 2423} {"train_loss": -43.58515548706055, "global_step": 293292, "epoch": 2423} {"train_loss": -42.085636138916016, "global_step": 293293, "epoch": 2423} {"train_loss": -40.045753479003906, "global_step": 293294, "epoch": 2423} {"train_loss": -41.76304244995117, "global_step": 293295, "epoch": 2423} {"train_loss": -40.2005500793457, "global_step": 293296, "epoch": 2423} {"train_loss": -39.98539733886719, "global_step": 293297, "epoch": 2423} {"train_loss": -42.25405502319336, "global_step": 293298, "epoch": 2423} {"train_loss": -38.4147834777832, "global_step": 293299, "epoch": 2423} {"train_loss": -40.38877487182617, "global_step": 293300, "epoch": 2423} {"train_loss": -38.2867546081543, "global_step": 293301, "epoch": 2423} {"train_loss": -41.51173782348633, "global_step": 293302, "epoch": 2423} {"train_loss": -42.59998696697645, "global_step": 293303, "epoch": 2423, "val_loss": 2495576.25} {"train_loss": -39.938350677490234, "global_step": 293304, "epoch": 2424} {"train_loss": -40.008113861083984, "global_step": 293305, "epoch": 2424} {"train_loss": -38.674102783203125, "global_step": 293306, "epoch": 2424} {"train_loss": -39.594295501708984, "global_step": 293307, "epoch": 2424} {"train_loss": -40.123817443847656, "global_step": 293308, "epoch": 2424} {"train_loss": -38.01118850708008, "global_step": 293309, "epoch": 2424} {"train_loss": -40.53646469116211, "global_step": 293310, "epoch": 2424} {"train_loss": -36.45219039916992, "global_step": 293311, "epoch": 2424} {"train_loss": -40.0675048828125, "global_step": 293312, "epoch": 2424} {"train_loss": -37.73664474487305, "global_step": 293313, "epoch": 2424} {"train_loss": -39.01483917236328, "global_step": 293314, "epoch": 2424} {"train_loss": -39.29740524291992, "global_step": 293315, "epoch": 2424} {"train_loss": -39.558143615722656, "global_step": 293316, "epoch": 2424} {"train_loss": -40.68691635131836, "global_step": 293317, "epoch": 2424} {"train_loss": -39.26057815551758, "global_step": 293318, "epoch": 2424} {"train_loss": -43.052642822265625, "global_step": 293319, "epoch": 2424} {"train_loss": -38.82735824584961, "global_step": 293320, "epoch": 2424} {"train_loss": -42.36859893798828, "global_step": 293321, "epoch": 2424} {"train_loss": -40.54545211791992, "global_step": 293322, "epoch": 2424} {"train_loss": -41.131160736083984, "global_step": 293323, "epoch": 2424} {"train_loss": -42.208702087402344, "global_step": 293324, "epoch": 2424} {"train_loss": -41.75588607788086, "global_step": 293325, "epoch": 2424} {"train_loss": -41.65792465209961, "global_step": 293326, "epoch": 2424} {"train_loss": -41.879268646240234, "global_step": 293327, "epoch": 2424} {"train_loss": -41.63434982299805, "global_step": 293328, "epoch": 2424} {"train_loss": -42.44570541381836, "global_step": 293329, "epoch": 2424} {"train_loss": -41.38715744018555, "global_step": 293330, "epoch": 2424} {"train_loss": -43.35083770751953, "global_step": 293331, "epoch": 2424} {"train_loss": -41.938209533691406, "global_step": 293332, "epoch": 2424} {"train_loss": -42.098121643066406, "global_step": 293333, "epoch": 2424} {"train_loss": -43.12263488769531, "global_step": 293334, "epoch": 2424} {"train_loss": -42.33258056640625, "global_step": 293335, "epoch": 2424} {"train_loss": -43.0949821472168, "global_step": 293336, "epoch": 2424} {"train_loss": -42.606868743896484, "global_step": 293337, "epoch": 2424} {"train_loss": -42.879432678222656, "global_step": 293338, "epoch": 2424} {"train_loss": -42.281593322753906, "global_step": 293339, "epoch": 2424} {"train_loss": -43.52573776245117, "global_step": 293340, "epoch": 2424} {"train_loss": -43.10085678100586, "global_step": 293341, "epoch": 2424} {"train_loss": -42.92596435546875, "global_step": 293342, "epoch": 2424} {"train_loss": -43.008056640625, "global_step": 293343, "epoch": 2424} {"train_loss": -43.27950668334961, "global_step": 293344, "epoch": 2424} {"train_loss": -42.77265167236328, "global_step": 293345, "epoch": 2424} {"train_loss": -42.804752349853516, "global_step": 293346, "epoch": 2424} {"train_loss": -43.30784225463867, "global_step": 293347, "epoch": 2424} {"train_loss": -42.978172302246094, "global_step": 293348, "epoch": 2424} {"train_loss": -43.77730941772461, "global_step": 293349, "epoch": 2424} {"train_loss": -42.19438552856445, "global_step": 293350, "epoch": 2424} {"train_loss": -42.81421661376953, "global_step": 293351, "epoch": 2424} {"train_loss": -42.86955642700195, "global_step": 293352, "epoch": 2424} {"train_loss": -43.67196273803711, "global_step": 293353, "epoch": 2424} {"train_loss": -43.10321807861328, "global_step": 293354, "epoch": 2424} {"train_loss": -43.443477630615234, "global_step": 293355, "epoch": 2424} {"train_loss": -43.82819747924805, "global_step": 293356, "epoch": 2424} {"train_loss": -43.37092971801758, "global_step": 293357, "epoch": 2424} {"train_loss": -43.60720443725586, "global_step": 293358, "epoch": 2424} {"train_loss": -43.268611907958984, "global_step": 293359, "epoch": 2424} {"train_loss": -43.864227294921875, "global_step": 293360, "epoch": 2424} {"train_loss": -43.88086700439453, "global_step": 293361, "epoch": 2424} {"train_loss": -44.17601013183594, "global_step": 293362, "epoch": 2424} {"train_loss": -43.539886474609375, "global_step": 293363, "epoch": 2424} {"train_loss": -43.63387680053711, "global_step": 293364, "epoch": 2424} {"train_loss": -44.32672119140625, "global_step": 293365, "epoch": 2424} {"train_loss": -43.79887771606445, "global_step": 293366, "epoch": 2424} {"train_loss": -44.18076705932617, "global_step": 293367, "epoch": 2424} {"train_loss": -43.79328536987305, "global_step": 293368, "epoch": 2424} {"train_loss": -44.383663177490234, "global_step": 293369, "epoch": 2424} {"train_loss": -44.15777587890625, "global_step": 293370, "epoch": 2424} {"train_loss": -44.54560470581055, "global_step": 293371, "epoch": 2424} {"train_loss": -44.46503829956055, "global_step": 293372, "epoch": 2424} {"train_loss": -44.26564407348633, "global_step": 293373, "epoch": 2424} {"train_loss": -44.57915496826172, "global_step": 293374, "epoch": 2424} {"train_loss": -44.31795883178711, "global_step": 293375, "epoch": 2424} {"train_loss": -44.40549850463867, "global_step": 293376, "epoch": 2424} {"train_loss": -44.89130783081055, "global_step": 293377, "epoch": 2424} {"train_loss": -44.4794921875, "global_step": 293378, "epoch": 2424} {"train_loss": -44.77174758911133, "global_step": 293379, "epoch": 2424} {"train_loss": -44.4793815612793, "global_step": 293380, "epoch": 2424} {"train_loss": -44.51456069946289, "global_step": 293381, "epoch": 2424} {"train_loss": -44.38389587402344, "global_step": 293382, "epoch": 2424} {"train_loss": -44.3708610534668, "global_step": 293383, "epoch": 2424} {"train_loss": -44.367244720458984, "global_step": 293384, "epoch": 2424} {"train_loss": -44.780731201171875, "global_step": 293385, "epoch": 2424} {"train_loss": -44.87180709838867, "global_step": 293386, "epoch": 2424} {"train_loss": -44.22796630859375, "global_step": 293387, "epoch": 2424} {"train_loss": -44.30509567260742, "global_step": 293388, "epoch": 2424} {"train_loss": -44.73295211791992, "global_step": 293389, "epoch": 2424} {"train_loss": -44.74776077270508, "global_step": 293390, "epoch": 2424} {"train_loss": -44.757442474365234, "global_step": 293391, "epoch": 2424} {"train_loss": -44.178157806396484, "global_step": 293392, "epoch": 2424} {"train_loss": -43.2885856628418, "global_step": 293393, "epoch": 2424} {"train_loss": -43.463558197021484, "global_step": 293394, "epoch": 2424} {"train_loss": -42.665771484375, "global_step": 293395, "epoch": 2424} {"train_loss": -41.65365219116211, "global_step": 293396, "epoch": 2424} {"train_loss": -42.87123489379883, "global_step": 293397, "epoch": 2424} {"train_loss": -42.33452606201172, "global_step": 293398, "epoch": 2424} {"train_loss": -43.52993392944336, "global_step": 293399, "epoch": 2424} {"train_loss": -44.656368255615234, "global_step": 293400, "epoch": 2424} {"train_loss": -44.17717361450195, "global_step": 293401, "epoch": 2424} {"train_loss": -44.0444450378418, "global_step": 293402, "epoch": 2424} {"train_loss": -43.27799606323242, "global_step": 293403, "epoch": 2424} {"train_loss": -43.472755432128906, "global_step": 293404, "epoch": 2424} {"train_loss": -44.17176818847656, "global_step": 293405, "epoch": 2424} {"train_loss": -43.7572135925293, "global_step": 293406, "epoch": 2424} {"train_loss": -43.31679916381836, "global_step": 293407, "epoch": 2424} {"train_loss": -42.36183547973633, "global_step": 293408, "epoch": 2424} {"train_loss": -43.376426696777344, "global_step": 293409, "epoch": 2424} {"train_loss": -44.36354446411133, "global_step": 293410, "epoch": 2424} {"train_loss": -41.26424026489258, "global_step": 293411, "epoch": 2424} {"train_loss": -42.860382080078125, "global_step": 293412, "epoch": 2424} {"train_loss": -44.09901809692383, "global_step": 293413, "epoch": 2424} {"train_loss": -43.91643142700195, "global_step": 293414, "epoch": 2424} {"train_loss": -42.775569915771484, "global_step": 293415, "epoch": 2424} {"train_loss": -43.33366775512695, "global_step": 293416, "epoch": 2424} {"train_loss": -44.30112838745117, "global_step": 293417, "epoch": 2424} {"train_loss": -43.533851623535156, "global_step": 293418, "epoch": 2424} {"train_loss": -42.59153747558594, "global_step": 293419, "epoch": 2424} {"train_loss": -44.20083236694336, "global_step": 293420, "epoch": 2424} {"train_loss": -43.60438919067383, "global_step": 293421, "epoch": 2424} {"train_loss": -44.25361633300781, "global_step": 293422, "epoch": 2424} {"train_loss": -43.78351593017578, "global_step": 293423, "epoch": 2424} {"train_loss": -42.87516633341135, "global_step": 293424, "epoch": 2424, "val_loss": 2468529.25} {"train_loss": -44.271976470947266, "global_step": 293425, "epoch": 2425} {"train_loss": -43.3033332824707, "global_step": 293426, "epoch": 2425} {"train_loss": -43.76960372924805, "global_step": 293427, "epoch": 2425} {"train_loss": -42.99592208862305, "global_step": 293428, "epoch": 2425} {"train_loss": -43.49115753173828, "global_step": 293429, "epoch": 2425} {"train_loss": -44.38407516479492, "global_step": 293430, "epoch": 2425} {"train_loss": -44.05686569213867, "global_step": 293431, "epoch": 2425} {"train_loss": -42.88851547241211, "global_step": 293432, "epoch": 2425} {"train_loss": -41.752655029296875, "global_step": 293433, "epoch": 2425} {"train_loss": -43.032291412353516, "global_step": 293434, "epoch": 2425} {"train_loss": -43.23522186279297, "global_step": 293435, "epoch": 2425} {"train_loss": -40.43162155151367, "global_step": 293436, "epoch": 2425} {"train_loss": -43.13343048095703, "global_step": 293437, "epoch": 2425} {"train_loss": -43.57307052612305, "global_step": 293438, "epoch": 2425} {"train_loss": -43.013580322265625, "global_step": 293439, "epoch": 2425} {"train_loss": -42.65996170043945, "global_step": 293440, "epoch": 2425} {"train_loss": -43.3807373046875, "global_step": 293441, "epoch": 2425} {"train_loss": -43.7691535949707, "global_step": 293442, "epoch": 2425} {"train_loss": -42.498626708984375, "global_step": 293443, "epoch": 2425} {"train_loss": -43.61060333251953, "global_step": 293444, "epoch": 2425} {"train_loss": -43.85218811035156, "global_step": 293445, "epoch": 2425} {"train_loss": -42.45969772338867, "global_step": 293446, "epoch": 2425} {"train_loss": -43.17477035522461, "global_step": 293447, "epoch": 2425} {"train_loss": -43.44585418701172, "global_step": 293448, "epoch": 2425} {"train_loss": -42.8204460144043, "global_step": 293449, "epoch": 2425} {"train_loss": -42.24525833129883, "global_step": 293450, "epoch": 2425} {"train_loss": -43.533931732177734, "global_step": 293451, "epoch": 2425} {"train_loss": -43.20063018798828, "global_step": 293452, "epoch": 2425} {"train_loss": -42.701717376708984, "global_step": 293453, "epoch": 2425} {"train_loss": -42.81112289428711, "global_step": 293454, "epoch": 2425} {"train_loss": -44.168861389160156, "global_step": 293455, "epoch": 2425} {"train_loss": -42.798683166503906, "global_step": 293456, "epoch": 2425} {"train_loss": -43.6435661315918, "global_step": 293457, "epoch": 2425} {"train_loss": -43.56780242919922, "global_step": 293458, "epoch": 2425} {"train_loss": -44.54386520385742, "global_step": 293459, "epoch": 2425} {"train_loss": -43.72944259643555, "global_step": 293460, "epoch": 2425} {"train_loss": -43.956817626953125, "global_step": 293461, "epoch": 2425} {"train_loss": -44.08448028564453, "global_step": 293462, "epoch": 2425} {"train_loss": -44.17523193359375, "global_step": 293463, "epoch": 2425} {"train_loss": -43.46200180053711, "global_step": 293464, "epoch": 2425} {"train_loss": -42.51637649536133, "global_step": 293465, "epoch": 2425} {"train_loss": -44.0681037902832, "global_step": 293466, "epoch": 2425} {"train_loss": -43.51576614379883, "global_step": 293467, "epoch": 2425} {"train_loss": -43.05787658691406, "global_step": 293468, "epoch": 2425} {"train_loss": -43.021358489990234, "global_step": 293469, "epoch": 2425} {"train_loss": -43.810604095458984, "global_step": 293470, "epoch": 2425} {"train_loss": -43.518348693847656, "global_step": 293471, "epoch": 2425} {"train_loss": -43.89808654785156, "global_step": 293472, "epoch": 2425} {"train_loss": -44.13410568237305, "global_step": 293473, "epoch": 2425} {"train_loss": -41.90808868408203, "global_step": 293474, "epoch": 2425} {"train_loss": -42.5516471862793, "global_step": 293475, "epoch": 2425} {"train_loss": -43.46694564819336, "global_step": 293476, "epoch": 2425} {"train_loss": -42.59302520751953, "global_step": 293477, "epoch": 2425} {"train_loss": -43.23656463623047, "global_step": 293478, "epoch": 2425} {"train_loss": -43.5107421875, "global_step": 293479, "epoch": 2425} {"train_loss": -43.209781646728516, "global_step": 293480, "epoch": 2425} {"train_loss": -42.43832778930664, "global_step": 293481, "epoch": 2425} {"train_loss": -44.08969497680664, "global_step": 293482, "epoch": 2425} {"train_loss": -43.948490142822266, "global_step": 293483, "epoch": 2425} {"train_loss": -43.282981872558594, "global_step": 293484, "epoch": 2425} {"train_loss": -43.060333251953125, "global_step": 293485, "epoch": 2425} {"train_loss": -44.178829193115234, "global_step": 293486, "epoch": 2425} {"train_loss": -43.29609680175781, "global_step": 293487, "epoch": 2425} {"train_loss": -43.348506927490234, "global_step": 293488, "epoch": 2425} {"train_loss": -43.32160568237305, "global_step": 293489, "epoch": 2425} {"train_loss": -44.431026458740234, "global_step": 293490, "epoch": 2425} {"train_loss": -43.52507400512695, "global_step": 293491, "epoch": 2425} {"train_loss": -43.85304641723633, "global_step": 293492, "epoch": 2425} {"train_loss": -43.46207809448242, "global_step": 293493, "epoch": 2425} {"train_loss": -43.27617263793945, "global_step": 293494, "epoch": 2425} {"train_loss": -43.62959671020508, "global_step": 293495, "epoch": 2425} {"train_loss": -43.9909782409668, "global_step": 293496, "epoch": 2425} {"train_loss": -43.92328643798828, "global_step": 293497, "epoch": 2425} {"train_loss": -43.75635528564453, "global_step": 293498, "epoch": 2425} {"train_loss": -44.465087890625, "global_step": 293499, "epoch": 2425} {"train_loss": -43.518707275390625, "global_step": 293500, "epoch": 2425} {"train_loss": -43.81663131713867, "global_step": 293501, "epoch": 2425} {"train_loss": -43.4395866394043, "global_step": 293502, "epoch": 2425} {"train_loss": -42.9167594909668, "global_step": 293503, "epoch": 2425} {"train_loss": -43.208900451660156, "global_step": 293504, "epoch": 2425} {"train_loss": -43.72357940673828, "global_step": 293505, "epoch": 2425} {"train_loss": -44.287078857421875, "global_step": 293506, "epoch": 2425} {"train_loss": -42.80691909790039, "global_step": 293507, "epoch": 2425} {"train_loss": -43.82832717895508, "global_step": 293508, "epoch": 2425} {"train_loss": -44.098182678222656, "global_step": 293509, "epoch": 2425} {"train_loss": -44.118621826171875, "global_step": 293510, "epoch": 2425} {"train_loss": -44.0516471862793, "global_step": 293511, "epoch": 2425} {"train_loss": -44.6811637878418, "global_step": 293512, "epoch": 2425} {"train_loss": -44.25386428833008, "global_step": 293513, "epoch": 2425} {"train_loss": -44.242679595947266, "global_step": 293514, "epoch": 2425} {"train_loss": -43.704193115234375, "global_step": 293515, "epoch": 2425} {"train_loss": -44.079341888427734, "global_step": 293516, "epoch": 2425} {"train_loss": -43.222259521484375, "global_step": 293517, "epoch": 2425} {"train_loss": -44.189422607421875, "global_step": 293518, "epoch": 2425} {"train_loss": -44.501461029052734, "global_step": 293519, "epoch": 2425} {"train_loss": -44.475852966308594, "global_step": 293520, "epoch": 2425} {"train_loss": -43.858245849609375, "global_step": 293521, "epoch": 2425} {"train_loss": -43.66858673095703, "global_step": 293522, "epoch": 2425} {"train_loss": -44.652400970458984, "global_step": 293523, "epoch": 2425} {"train_loss": -44.299434661865234, "global_step": 293524, "epoch": 2425} {"train_loss": -44.03268814086914, "global_step": 293525, "epoch": 2425} {"train_loss": -44.0672607421875, "global_step": 293526, "epoch": 2425} {"train_loss": -43.987518310546875, "global_step": 293527, "epoch": 2425} {"train_loss": -43.51625061035156, "global_step": 293528, "epoch": 2425} {"train_loss": -42.458335876464844, "global_step": 293529, "epoch": 2425} {"train_loss": -43.320396423339844, "global_step": 293530, "epoch": 2425} {"train_loss": -43.86973571777344, "global_step": 293531, "epoch": 2425} {"train_loss": -43.13970947265625, "global_step": 293532, "epoch": 2425} {"train_loss": -42.97713851928711, "global_step": 293533, "epoch": 2425} {"train_loss": -43.052978515625, "global_step": 293534, "epoch": 2425} {"train_loss": -42.10041427612305, "global_step": 293535, "epoch": 2425} {"train_loss": -44.334510803222656, "global_step": 293536, "epoch": 2425} {"train_loss": -43.1857795715332, "global_step": 293537, "epoch": 2425} {"train_loss": -40.29618453979492, "global_step": 293538, "epoch": 2425} {"train_loss": -44.08165740966797, "global_step": 293539, "epoch": 2425} {"train_loss": -43.04806137084961, "global_step": 293540, "epoch": 2425} {"train_loss": -40.622501373291016, "global_step": 293541, "epoch": 2425} {"train_loss": -43.839324951171875, "global_step": 293542, "epoch": 2425} {"train_loss": -40.819664001464844, "global_step": 293543, "epoch": 2425} {"train_loss": -42.9483757019043, "global_step": 293544, "epoch": 2425} {"train_loss": -43.415237994233436, "global_step": 293545, "epoch": 2425, "val_loss": 2548027.25} {"train_loss": -41.968929290771484, "global_step": 293546, "epoch": 2426} {"train_loss": -43.43976593017578, "global_step": 293547, "epoch": 2426} {"train_loss": -42.54785919189453, "global_step": 293548, "epoch": 2426} {"train_loss": -43.3274040222168, "global_step": 293549, "epoch": 2426} {"train_loss": -43.89973831176758, "global_step": 293550, "epoch": 2426} {"train_loss": -43.68976974487305, "global_step": 293551, "epoch": 2426} {"train_loss": -43.638484954833984, "global_step": 293552, "epoch": 2426} {"train_loss": -43.282344818115234, "global_step": 293553, "epoch": 2426} {"train_loss": -42.93131637573242, "global_step": 293554, "epoch": 2426} {"train_loss": -44.00592041015625, "global_step": 293555, "epoch": 2426} {"train_loss": -43.602535247802734, "global_step": 293556, "epoch": 2426} {"train_loss": -43.46328353881836, "global_step": 293557, "epoch": 2426} {"train_loss": -44.11469268798828, "global_step": 293558, "epoch": 2426} {"train_loss": -43.933441162109375, "global_step": 293559, "epoch": 2426} {"train_loss": -43.097930908203125, "global_step": 293560, "epoch": 2426} {"train_loss": -43.547607421875, "global_step": 293561, "epoch": 2426} {"train_loss": -44.05165481567383, "global_step": 293562, "epoch": 2426} {"train_loss": -43.80945587158203, "global_step": 293563, "epoch": 2426} {"train_loss": -43.733551025390625, "global_step": 293564, "epoch": 2426} {"train_loss": -44.01028060913086, "global_step": 293565, "epoch": 2426} {"train_loss": -43.61525344848633, "global_step": 293566, "epoch": 2426} {"train_loss": -43.66750717163086, "global_step": 293567, "epoch": 2426} {"train_loss": -44.143001556396484, "global_step": 293568, "epoch": 2426} {"train_loss": -44.13032913208008, "global_step": 293569, "epoch": 2426} {"train_loss": -43.080055236816406, "global_step": 293570, "epoch": 2426} {"train_loss": -43.69981002807617, "global_step": 293571, "epoch": 2426} {"train_loss": -43.4600715637207, "global_step": 293572, "epoch": 2426} {"train_loss": -43.59357452392578, "global_step": 293573, "epoch": 2426} {"train_loss": -44.13325881958008, "global_step": 293574, "epoch": 2426} {"train_loss": -43.794349670410156, "global_step": 293575, "epoch": 2426} {"train_loss": -44.405982971191406, "global_step": 293576, "epoch": 2426} {"train_loss": -44.404518127441406, "global_step": 293577, "epoch": 2426} {"train_loss": -44.1121711730957, "global_step": 293578, "epoch": 2426} {"train_loss": -44.421730041503906, "global_step": 293579, "epoch": 2426} {"train_loss": -44.82058334350586, "global_step": 293580, "epoch": 2426} {"train_loss": -44.37031173706055, "global_step": 293581, "epoch": 2426} {"train_loss": -44.69049072265625, "global_step": 293582, "epoch": 2426} {"train_loss": -44.98268508911133, "global_step": 293583, "epoch": 2426} {"train_loss": -44.52445602416992, "global_step": 293584, "epoch": 2426} {"train_loss": -44.69216537475586, "global_step": 293585, "epoch": 2426} {"train_loss": -44.629634857177734, "global_step": 293586, "epoch": 2426} {"train_loss": -44.130859375, "global_step": 293587, "epoch": 2426} {"train_loss": -45.04453659057617, "global_step": 293588, "epoch": 2426} {"train_loss": -44.42292022705078, "global_step": 293589, "epoch": 2426} {"train_loss": -44.76679229736328, "global_step": 293590, "epoch": 2426} {"train_loss": -44.35542678833008, "global_step": 293591, "epoch": 2426} {"train_loss": -44.40191650390625, "global_step": 293592, "epoch": 2426} {"train_loss": -44.88357162475586, "global_step": 293593, "epoch": 2426} {"train_loss": -44.51708221435547, "global_step": 293594, "epoch": 2426} {"train_loss": -44.179378509521484, "global_step": 293595, "epoch": 2426} {"train_loss": -44.36035919189453, "global_step": 293596, "epoch": 2426} {"train_loss": -44.50970458984375, "global_step": 293597, "epoch": 2426} {"train_loss": -43.587032318115234, "global_step": 293598, "epoch": 2426} {"train_loss": -44.63853073120117, "global_step": 293599, "epoch": 2426} {"train_loss": -44.21996307373047, "global_step": 293600, "epoch": 2426} {"train_loss": -43.38007354736328, "global_step": 293601, "epoch": 2426} {"train_loss": -44.123233795166016, "global_step": 293602, "epoch": 2426} {"train_loss": -43.942718505859375, "global_step": 293603, "epoch": 2426} {"train_loss": -43.02385330200195, "global_step": 293604, "epoch": 2426} {"train_loss": -43.81735610961914, "global_step": 293605, "epoch": 2426} {"train_loss": -43.93540573120117, "global_step": 293606, "epoch": 2426} {"train_loss": -41.818206787109375, "global_step": 293607, "epoch": 2426} {"train_loss": -42.38201904296875, "global_step": 293608, "epoch": 2426} {"train_loss": -43.37420654296875, "global_step": 293609, "epoch": 2426} {"train_loss": -43.57903289794922, "global_step": 293610, "epoch": 2426} {"train_loss": -43.90131378173828, "global_step": 293611, "epoch": 2426} {"train_loss": -42.81304931640625, "global_step": 293612, "epoch": 2426} {"train_loss": -44.297176361083984, "global_step": 293613, "epoch": 2426} {"train_loss": -43.58259963989258, "global_step": 293614, "epoch": 2426} {"train_loss": -44.09274673461914, "global_step": 293615, "epoch": 2426} {"train_loss": -43.771358489990234, "global_step": 293616, "epoch": 2426} {"train_loss": -43.174903869628906, "global_step": 293617, "epoch": 2426} {"train_loss": -44.06620788574219, "global_step": 293618, "epoch": 2426} {"train_loss": -43.16111755371094, "global_step": 293619, "epoch": 2426} {"train_loss": -42.362998962402344, "global_step": 293620, "epoch": 2426} {"train_loss": -42.51798629760742, "global_step": 293621, "epoch": 2426} {"train_loss": -43.94352340698242, "global_step": 293622, "epoch": 2426} {"train_loss": -42.550899505615234, "global_step": 293623, "epoch": 2426} {"train_loss": -43.51548385620117, "global_step": 293624, "epoch": 2426} {"train_loss": -43.85810089111328, "global_step": 293625, "epoch": 2426} {"train_loss": -43.1639404296875, "global_step": 293626, "epoch": 2426} {"train_loss": -44.462677001953125, "global_step": 293627, "epoch": 2426} {"train_loss": -42.980648040771484, "global_step": 293628, "epoch": 2426} {"train_loss": -43.06815719604492, "global_step": 293629, "epoch": 2426} {"train_loss": -44.07157897949219, "global_step": 293630, "epoch": 2426} {"train_loss": -42.879844665527344, "global_step": 293631, "epoch": 2426} {"train_loss": -42.113136291503906, "global_step": 293632, "epoch": 2426} {"train_loss": -44.418609619140625, "global_step": 293633, "epoch": 2426} {"train_loss": -43.065792083740234, "global_step": 293634, "epoch": 2426} {"train_loss": -42.5728874206543, "global_step": 293635, "epoch": 2426} {"train_loss": -44.09253692626953, "global_step": 293636, "epoch": 2426} {"train_loss": -43.144744873046875, "global_step": 293637, "epoch": 2426} {"train_loss": -43.72563171386719, "global_step": 293638, "epoch": 2426} {"train_loss": -44.15147018432617, "global_step": 293639, "epoch": 2426} {"train_loss": -43.000431060791016, "global_step": 293640, "epoch": 2426} {"train_loss": -43.24351501464844, "global_step": 293641, "epoch": 2426} {"train_loss": -44.438194274902344, "global_step": 293642, "epoch": 2426} {"train_loss": -43.0947265625, "global_step": 293643, "epoch": 2426} {"train_loss": -42.015777587890625, "global_step": 293644, "epoch": 2426} {"train_loss": -42.19187545776367, "global_step": 293645, "epoch": 2426} {"train_loss": -43.9183464050293, "global_step": 293646, "epoch": 2426} {"train_loss": -43.646724700927734, "global_step": 293647, "epoch": 2426} {"train_loss": -43.80027389526367, "global_step": 293648, "epoch": 2426} {"train_loss": -43.80531692504883, "global_step": 293649, "epoch": 2426} {"train_loss": -43.073612213134766, "global_step": 293650, "epoch": 2426} {"train_loss": -43.5814208984375, "global_step": 293651, "epoch": 2426} {"train_loss": -43.37083053588867, "global_step": 293652, "epoch": 2426} {"train_loss": -42.853965759277344, "global_step": 293653, "epoch": 2426} {"train_loss": -43.492008209228516, "global_step": 293654, "epoch": 2426} {"train_loss": -43.194358825683594, "global_step": 293655, "epoch": 2426} {"train_loss": -43.21039581298828, "global_step": 293656, "epoch": 2426} {"train_loss": -43.54814529418945, "global_step": 293657, "epoch": 2426} {"train_loss": -42.97683334350586, "global_step": 293658, "epoch": 2426} {"train_loss": -43.58026123046875, "global_step": 293659, "epoch": 2426} {"train_loss": -43.92631912231445, "global_step": 293660, "epoch": 2426} {"train_loss": -43.37965393066406, "global_step": 293661, "epoch": 2426} {"train_loss": -44.05170440673828, "global_step": 293662, "epoch": 2426} {"train_loss": -44.29983139038086, "global_step": 293663, "epoch": 2426} {"train_loss": -43.395137786865234, "global_step": 293664, "epoch": 2426} {"train_loss": -41.82764434814453, "global_step": 293665, "epoch": 2426} {"train_loss": -43.65862520076027, "global_step": 293666, "epoch": 2426, "val_loss": 2528268.5} {"train_loss": -42.40056610107422, "global_step": 293667, "epoch": 2427} {"train_loss": -39.33541488647461, "global_step": 293668, "epoch": 2427} {"train_loss": -43.438499450683594, "global_step": 293669, "epoch": 2427} {"train_loss": -39.07926559448242, "global_step": 293670, "epoch": 2427} {"train_loss": -43.40841293334961, "global_step": 293671, "epoch": 2427} {"train_loss": -38.7416877746582, "global_step": 293672, "epoch": 2427} {"train_loss": -41.23232650756836, "global_step": 293673, "epoch": 2427} {"train_loss": -39.24727249145508, "global_step": 293674, "epoch": 2427} {"train_loss": -38.887489318847656, "global_step": 293675, "epoch": 2427} {"train_loss": -40.70902633666992, "global_step": 293676, "epoch": 2427} {"train_loss": -41.18790817260742, "global_step": 293677, "epoch": 2427} {"train_loss": -42.46413803100586, "global_step": 293678, "epoch": 2427} {"train_loss": -42.55428695678711, "global_step": 293679, "epoch": 2427} {"train_loss": -42.004493713378906, "global_step": 293680, "epoch": 2427} {"train_loss": -43.258235931396484, "global_step": 293681, "epoch": 2427} {"train_loss": -42.88783264160156, "global_step": 293682, "epoch": 2427} {"train_loss": -43.595821380615234, "global_step": 293683, "epoch": 2427} {"train_loss": -42.460933685302734, "global_step": 293684, "epoch": 2427} {"train_loss": -43.6619758605957, "global_step": 293685, "epoch": 2427} {"train_loss": -42.4547233581543, "global_step": 293686, "epoch": 2427} {"train_loss": -43.894527435302734, "global_step": 293687, "epoch": 2427} {"train_loss": -42.565635681152344, "global_step": 293688, "epoch": 2427} {"train_loss": -43.73495101928711, "global_step": 293689, "epoch": 2427} {"train_loss": -43.09098434448242, "global_step": 293690, "epoch": 2427} {"train_loss": -43.441402435302734, "global_step": 293691, "epoch": 2427} {"train_loss": -43.3658561706543, "global_step": 293692, "epoch": 2427} {"train_loss": -43.87040328979492, "global_step": 293693, "epoch": 2427} {"train_loss": -42.32197952270508, "global_step": 293694, "epoch": 2427} {"train_loss": -43.92277145385742, "global_step": 293695, "epoch": 2427} {"train_loss": -43.25023651123047, "global_step": 293696, "epoch": 2427} {"train_loss": -43.712921142578125, "global_step": 293697, "epoch": 2427} {"train_loss": -43.537872314453125, "global_step": 293698, "epoch": 2427} {"train_loss": -43.50214767456055, "global_step": 293699, "epoch": 2427} {"train_loss": -43.61631393432617, "global_step": 293700, "epoch": 2427} {"train_loss": -44.31254577636719, "global_step": 293701, "epoch": 2427} {"train_loss": -43.37199020385742, "global_step": 293702, "epoch": 2427} {"train_loss": -43.791805267333984, "global_step": 293703, "epoch": 2427} {"train_loss": -43.85865783691406, "global_step": 293704, "epoch": 2427} {"train_loss": -44.7704963684082, "global_step": 293705, "epoch": 2427} {"train_loss": -44.05404281616211, "global_step": 293706, "epoch": 2427} {"train_loss": -44.22996139526367, "global_step": 293707, "epoch": 2427} {"train_loss": -43.8086051940918, "global_step": 293708, "epoch": 2427} {"train_loss": -44.41808319091797, "global_step": 293709, "epoch": 2427} {"train_loss": -43.960140228271484, "global_step": 293710, "epoch": 2427} {"train_loss": -44.329833984375, "global_step": 293711, "epoch": 2427} {"train_loss": -44.28369903564453, "global_step": 293712, "epoch": 2427} {"train_loss": -43.95276641845703, "global_step": 293713, "epoch": 2427} {"train_loss": -44.635826110839844, "global_step": 293714, "epoch": 2427} {"train_loss": -42.93949508666992, "global_step": 293715, "epoch": 2427} {"train_loss": -44.86146926879883, "global_step": 293716, "epoch": 2427} {"train_loss": -44.05704116821289, "global_step": 293717, "epoch": 2427} {"train_loss": -43.742286682128906, "global_step": 293718, "epoch": 2427} {"train_loss": -44.882606506347656, "global_step": 293719, "epoch": 2427} {"train_loss": -44.53022003173828, "global_step": 293720, "epoch": 2427} {"train_loss": -44.94935989379883, "global_step": 293721, "epoch": 2427} {"train_loss": -43.94059371948242, "global_step": 293722, "epoch": 2427} {"train_loss": -44.70207595825195, "global_step": 293723, "epoch": 2427} {"train_loss": -44.553924560546875, "global_step": 293724, "epoch": 2427} {"train_loss": -44.747188568115234, "global_step": 293725, "epoch": 2427} {"train_loss": -45.058345794677734, "global_step": 293726, "epoch": 2427} {"train_loss": -44.8228645324707, "global_step": 293727, "epoch": 2427} {"train_loss": -44.602439880371094, "global_step": 293728, "epoch": 2427} {"train_loss": -44.759857177734375, "global_step": 293729, "epoch": 2427} {"train_loss": -37.81732177734375, "global_step": 293730, "epoch": 2427} {"train_loss": -44.54555892944336, "global_step": 293731, "epoch": 2427} {"train_loss": -43.87881088256836, "global_step": 293732, "epoch": 2427} {"train_loss": -43.58033752441406, "global_step": 293733, "epoch": 2427} {"train_loss": -44.79225158691406, "global_step": 293734, "epoch": 2427} {"train_loss": -44.258872985839844, "global_step": 293735, "epoch": 2427} {"train_loss": -43.96113967895508, "global_step": 293736, "epoch": 2427} {"train_loss": -43.377010345458984, "global_step": 293737, "epoch": 2427} {"train_loss": -42.26696014404297, "global_step": 293738, "epoch": 2427} {"train_loss": -43.127071380615234, "global_step": 293739, "epoch": 2427} {"train_loss": -42.6546630859375, "global_step": 293740, "epoch": 2427} {"train_loss": -44.7080078125, "global_step": 293741, "epoch": 2427} {"train_loss": -43.9276237487793, "global_step": 293742, "epoch": 2427} {"train_loss": -41.86008834838867, "global_step": 293743, "epoch": 2427} {"train_loss": -42.5565185546875, "global_step": 293744, "epoch": 2427} {"train_loss": -39.49581527709961, "global_step": 293745, "epoch": 2427} {"train_loss": -41.51063919067383, "global_step": 293746, "epoch": 2427} {"train_loss": -42.60553741455078, "global_step": 293747, "epoch": 2427} {"train_loss": -42.84682083129883, "global_step": 293748, "epoch": 2427} {"train_loss": -43.77988815307617, "global_step": 293749, "epoch": 2427} {"train_loss": -44.09988021850586, "global_step": 293750, "epoch": 2427} {"train_loss": -43.72377395629883, "global_step": 293751, "epoch": 2427} {"train_loss": -42.54164123535156, "global_step": 293752, "epoch": 2427} {"train_loss": -44.17612838745117, "global_step": 293753, "epoch": 2427} {"train_loss": -43.95389938354492, "global_step": 293754, "epoch": 2427} {"train_loss": -39.40692138671875, "global_step": 293755, "epoch": 2427} {"train_loss": -42.324859619140625, "global_step": 293756, "epoch": 2427} {"train_loss": -43.24984359741211, "global_step": 293757, "epoch": 2427} {"train_loss": -41.68019104003906, "global_step": 293758, "epoch": 2427} {"train_loss": -41.97727584838867, "global_step": 293759, "epoch": 2427} {"train_loss": -43.562862396240234, "global_step": 293760, "epoch": 2427} {"train_loss": -44.16102981567383, "global_step": 293761, "epoch": 2427} {"train_loss": -43.78809356689453, "global_step": 293762, "epoch": 2427} {"train_loss": -43.26481246948242, "global_step": 293763, "epoch": 2427} {"train_loss": -42.45344924926758, "global_step": 293764, "epoch": 2427} {"train_loss": -43.22957229614258, "global_step": 293765, "epoch": 2427} {"train_loss": -42.55057144165039, "global_step": 293766, "epoch": 2427} {"train_loss": -41.59033203125, "global_step": 293767, "epoch": 2427} {"train_loss": -43.487648010253906, "global_step": 293768, "epoch": 2427} {"train_loss": -43.77901840209961, "global_step": 293769, "epoch": 2427} {"train_loss": -43.337005615234375, "global_step": 293770, "epoch": 2427} {"train_loss": -42.10488510131836, "global_step": 293771, "epoch": 2427} {"train_loss": -41.98512649536133, "global_step": 293772, "epoch": 2427} {"train_loss": -29.754810333251953, "global_step": 293773, "epoch": 2427} {"train_loss": -40.647682189941406, "global_step": 293774, "epoch": 2427} {"train_loss": -39.87005615234375, "global_step": 293775, "epoch": 2427} {"train_loss": -42.721073150634766, "global_step": 293776, "epoch": 2427} {"train_loss": -39.796630859375, "global_step": 293777, "epoch": 2427} {"train_loss": -36.555938720703125, "global_step": 293778, "epoch": 2427} {"train_loss": -41.42744827270508, "global_step": 293779, "epoch": 2427} {"train_loss": -42.70244598388672, "global_step": 293780, "epoch": 2427} {"train_loss": -41.13121795654297, "global_step": 293781, "epoch": 2427} {"train_loss": -39.828895568847656, "global_step": 293782, "epoch": 2427} {"train_loss": -41.363746643066406, "global_step": 293783, "epoch": 2427} {"train_loss": -41.11762619018555, "global_step": 293784, "epoch": 2427} {"train_loss": -41.3964958190918, "global_step": 293785, "epoch": 2427} {"train_loss": -42.025150299072266, "global_step": 293786, "epoch": 2427} {"train_loss": -42.72519557732196, "global_step": 293787, "epoch": 2427, "val_loss": 2491680.25} {"train_loss": -41.405765533447266, "global_step": 293788, "epoch": 2428} {"train_loss": -42.54568099975586, "global_step": 293789, "epoch": 2428} {"train_loss": -42.33313751220703, "global_step": 293790, "epoch": 2428} {"train_loss": -39.931697845458984, "global_step": 293791, "epoch": 2428} {"train_loss": -41.88179397583008, "global_step": 293792, "epoch": 2428} {"train_loss": -40.405513763427734, "global_step": 293793, "epoch": 2428} {"train_loss": -42.39617919921875, "global_step": 293794, "epoch": 2428} {"train_loss": -34.79010772705078, "global_step": 293795, "epoch": 2428} {"train_loss": -41.11231994628906, "global_step": 293796, "epoch": 2428} {"train_loss": -38.6309700012207, "global_step": 293797, "epoch": 2428} {"train_loss": -42.50996780395508, "global_step": 293798, "epoch": 2428} {"train_loss": -42.18156814575195, "global_step": 293799, "epoch": 2428} {"train_loss": -41.01566696166992, "global_step": 293800, "epoch": 2428} {"train_loss": -41.099674224853516, "global_step": 293801, "epoch": 2428} {"train_loss": -42.089630126953125, "global_step": 293802, "epoch": 2428} {"train_loss": -41.28263854980469, "global_step": 293803, "epoch": 2428} {"train_loss": -40.99229431152344, "global_step": 293804, "epoch": 2428} {"train_loss": -43.396095275878906, "global_step": 293805, "epoch": 2428} {"train_loss": -42.37775421142578, "global_step": 293806, "epoch": 2428} {"train_loss": -42.104549407958984, "global_step": 293807, "epoch": 2428} {"train_loss": -42.709407806396484, "global_step": 293808, "epoch": 2428} {"train_loss": -41.97321319580078, "global_step": 293809, "epoch": 2428} {"train_loss": -42.85909652709961, "global_step": 293810, "epoch": 2428} {"train_loss": -42.31191635131836, "global_step": 293811, "epoch": 2428} {"train_loss": -42.822566986083984, "global_step": 293812, "epoch": 2428} {"train_loss": -41.722713470458984, "global_step": 293813, "epoch": 2428} {"train_loss": -43.262977600097656, "global_step": 293814, "epoch": 2428} {"train_loss": -43.27549362182617, "global_step": 293815, "epoch": 2428} {"train_loss": -42.57448959350586, "global_step": 293816, "epoch": 2428} {"train_loss": -42.07387924194336, "global_step": 293817, "epoch": 2428} {"train_loss": -43.35174560546875, "global_step": 293818, "epoch": 2428} {"train_loss": -43.314571380615234, "global_step": 293819, "epoch": 2428} {"train_loss": -43.79058837890625, "global_step": 293820, "epoch": 2428} {"train_loss": -42.526611328125, "global_step": 293821, "epoch": 2428} {"train_loss": -42.901912689208984, "global_step": 293822, "epoch": 2428} {"train_loss": -43.04153060913086, "global_step": 293823, "epoch": 2428} {"train_loss": -43.84257125854492, "global_step": 293824, "epoch": 2428} {"train_loss": -43.284114837646484, "global_step": 293825, "epoch": 2428} {"train_loss": -43.54441452026367, "global_step": 293826, "epoch": 2428} {"train_loss": -44.120967864990234, "global_step": 293827, "epoch": 2428} {"train_loss": -42.867916107177734, "global_step": 293828, "epoch": 2428} {"train_loss": -43.449954986572266, "global_step": 293829, "epoch": 2428} {"train_loss": -43.609275817871094, "global_step": 293830, "epoch": 2428} {"train_loss": -43.73073196411133, "global_step": 293831, "epoch": 2428} {"train_loss": -43.09052658081055, "global_step": 293832, "epoch": 2428} {"train_loss": -43.75708770751953, "global_step": 293833, "epoch": 2428} {"train_loss": -43.58903121948242, "global_step": 293834, "epoch": 2428} {"train_loss": -43.51752853393555, "global_step": 293835, "epoch": 2428} {"train_loss": -43.47956466674805, "global_step": 293836, "epoch": 2428} {"train_loss": -43.787837982177734, "global_step": 293837, "epoch": 2428} {"train_loss": -44.176204681396484, "global_step": 293838, "epoch": 2428} {"train_loss": -43.691566467285156, "global_step": 293839, "epoch": 2428} {"train_loss": -44.2822265625, "global_step": 293840, "epoch": 2428} {"train_loss": -44.14036178588867, "global_step": 293841, "epoch": 2428} {"train_loss": -43.86798095703125, "global_step": 293842, "epoch": 2428} {"train_loss": -44.26057052612305, "global_step": 293843, "epoch": 2428} {"train_loss": -43.65824508666992, "global_step": 293844, "epoch": 2428} {"train_loss": -44.48812484741211, "global_step": 293845, "epoch": 2428} {"train_loss": -44.178016662597656, "global_step": 293846, "epoch": 2428} {"train_loss": -43.940731048583984, "global_step": 293847, "epoch": 2428} {"train_loss": -43.75409698486328, "global_step": 293848, "epoch": 2428} {"train_loss": -43.9123420715332, "global_step": 293849, "epoch": 2428} {"train_loss": -43.88916778564453, "global_step": 293850, "epoch": 2428} {"train_loss": -44.62629318237305, "global_step": 293851, "epoch": 2428} {"train_loss": -44.32710647583008, "global_step": 293852, "epoch": 2428} {"train_loss": -44.17745590209961, "global_step": 293853, "epoch": 2428} {"train_loss": -43.76131820678711, "global_step": 293854, "epoch": 2428} {"train_loss": -44.388343811035156, "global_step": 293855, "epoch": 2428} {"train_loss": -44.412506103515625, "global_step": 293856, "epoch": 2428} {"train_loss": -43.59172821044922, "global_step": 293857, "epoch": 2428} {"train_loss": -44.42427444458008, "global_step": 293858, "epoch": 2428} {"train_loss": -44.1781120300293, "global_step": 293859, "epoch": 2428} {"train_loss": -43.653526306152344, "global_step": 293860, "epoch": 2428} {"train_loss": -43.6523551940918, "global_step": 293861, "epoch": 2428} {"train_loss": -44.216400146484375, "global_step": 293862, "epoch": 2428} {"train_loss": -44.039649963378906, "global_step": 293863, "epoch": 2428} {"train_loss": -43.7507438659668, "global_step": 293864, "epoch": 2428} {"train_loss": -44.60608673095703, "global_step": 293865, "epoch": 2428} {"train_loss": -44.28492736816406, "global_step": 293866, "epoch": 2428} {"train_loss": -43.991207122802734, "global_step": 293867, "epoch": 2428} {"train_loss": -43.879188537597656, "global_step": 293868, "epoch": 2428} {"train_loss": -44.35721969604492, "global_step": 293869, "epoch": 2428} {"train_loss": -44.84634017944336, "global_step": 293870, "epoch": 2428} {"train_loss": -44.23350143432617, "global_step": 293871, "epoch": 2428} {"train_loss": -44.35848617553711, "global_step": 293872, "epoch": 2428} {"train_loss": -44.785396575927734, "global_step": 293873, "epoch": 2428} {"train_loss": -44.75204086303711, "global_step": 293874, "epoch": 2428} {"train_loss": -43.310482025146484, "global_step": 293875, "epoch": 2428} {"train_loss": -40.53902816772461, "global_step": 293876, "epoch": 2428} {"train_loss": -39.41809844970703, "global_step": 293877, "epoch": 2428} {"train_loss": -44.01392364501953, "global_step": 293878, "epoch": 2428} {"train_loss": -40.78388595581055, "global_step": 293879, "epoch": 2428} {"train_loss": -38.29331588745117, "global_step": 293880, "epoch": 2428} {"train_loss": -33.050106048583984, "global_step": 293881, "epoch": 2428} {"train_loss": -34.51010513305664, "global_step": 293882, "epoch": 2428} {"train_loss": -36.072505950927734, "global_step": 293883, "epoch": 2428} {"train_loss": -38.731895446777344, "global_step": 293884, "epoch": 2428} {"train_loss": -34.194698333740234, "global_step": 293885, "epoch": 2428} {"train_loss": -30.040990829467773, "global_step": 293886, "epoch": 2428} {"train_loss": -34.65858840942383, "global_step": 293887, "epoch": 2428} {"train_loss": -32.82497024536133, "global_step": 293888, "epoch": 2428} {"train_loss": -34.154354095458984, "global_step": 293889, "epoch": 2428} {"train_loss": -35.77529525756836, "global_step": 293890, "epoch": 2428} {"train_loss": -35.92414093017578, "global_step": 293891, "epoch": 2428} {"train_loss": -34.754146575927734, "global_step": 293892, "epoch": 2428} {"train_loss": -35.60403060913086, "global_step": 293893, "epoch": 2428} {"train_loss": -36.56478500366211, "global_step": 293894, "epoch": 2428} {"train_loss": -35.708900451660156, "global_step": 293895, "epoch": 2428} {"train_loss": -36.10909652709961, "global_step": 293896, "epoch": 2428} {"train_loss": -36.60126876831055, "global_step": 293897, "epoch": 2428} {"train_loss": -36.60466766357422, "global_step": 293898, "epoch": 2428} {"train_loss": -36.75408172607422, "global_step": 293899, "epoch": 2428} {"train_loss": -37.366214752197266, "global_step": 293900, "epoch": 2428} {"train_loss": -36.6531867980957, "global_step": 293901, "epoch": 2428} {"train_loss": -36.24335861206055, "global_step": 293902, "epoch": 2428} {"train_loss": -37.4184455871582, "global_step": 293903, "epoch": 2428} {"train_loss": -37.9316291809082, "global_step": 293904, "epoch": 2428} {"train_loss": -38.05583572387695, "global_step": 293905, "epoch": 2428} {"train_loss": -37.53020477294922, "global_step": 293906, "epoch": 2428} {"train_loss": -38.6071891784668, "global_step": 293907, "epoch": 2428} {"train_loss": -41.36033445941515, "global_step": 293908, "epoch": 2428, "val_loss": 2565155.0} {"train_loss": -38.3707389831543, "global_step": 293909, "epoch": 2429} {"train_loss": -38.68452072143555, "global_step": 293910, "epoch": 2429} {"train_loss": -37.52727508544922, "global_step": 293911, "epoch": 2429} {"train_loss": -37.46100997924805, "global_step": 293912, "epoch": 2429} {"train_loss": -38.22522735595703, "global_step": 293913, "epoch": 2429} {"train_loss": -39.06256103515625, "global_step": 293914, "epoch": 2429} {"train_loss": -39.27545166015625, "global_step": 293915, "epoch": 2429} {"train_loss": -38.63526153564453, "global_step": 293916, "epoch": 2429} {"train_loss": -38.50824737548828, "global_step": 293917, "epoch": 2429} {"train_loss": -38.767269134521484, "global_step": 293918, "epoch": 2429} {"train_loss": -39.298030853271484, "global_step": 293919, "epoch": 2429} {"train_loss": -38.955718994140625, "global_step": 293920, "epoch": 2429} {"train_loss": -39.7712516784668, "global_step": 293921, "epoch": 2429} {"train_loss": -38.77756118774414, "global_step": 293922, "epoch": 2429} {"train_loss": -39.54728698730469, "global_step": 293923, "epoch": 2429} {"train_loss": -39.32749557495117, "global_step": 293924, "epoch": 2429} {"train_loss": -38.962974548339844, "global_step": 293925, "epoch": 2429} {"train_loss": -39.82694625854492, "global_step": 293926, "epoch": 2429} {"train_loss": -39.250770568847656, "global_step": 293927, "epoch": 2429} {"train_loss": -39.60421371459961, "global_step": 293928, "epoch": 2429} {"train_loss": -39.60820770263672, "global_step": 293929, "epoch": 2429} {"train_loss": -39.73228454589844, "global_step": 293930, "epoch": 2429} {"train_loss": -39.671356201171875, "global_step": 293931, "epoch": 2429} {"train_loss": -39.642948150634766, "global_step": 293932, "epoch": 2429} {"train_loss": -40.43364334106445, "global_step": 293933, "epoch": 2429} {"train_loss": -39.61760330200195, "global_step": 293934, "epoch": 2429} {"train_loss": -40.3988037109375, "global_step": 293935, "epoch": 2429} {"train_loss": -40.5345344543457, "global_step": 293936, "epoch": 2429} {"train_loss": -40.148345947265625, "global_step": 293937, "epoch": 2429} {"train_loss": -39.99510955810547, "global_step": 293938, "epoch": 2429} {"train_loss": -39.35201644897461, "global_step": 293939, "epoch": 2429} {"train_loss": -39.57447052001953, "global_step": 293940, "epoch": 2429} {"train_loss": -40.644771575927734, "global_step": 293941, "epoch": 2429} {"train_loss": -40.149566650390625, "global_step": 293942, "epoch": 2429} {"train_loss": -39.4381103515625, "global_step": 293943, "epoch": 2429} {"train_loss": -39.76682662963867, "global_step": 293944, "epoch": 2429} {"train_loss": -39.59334945678711, "global_step": 293945, "epoch": 2429} {"train_loss": -40.25946044921875, "global_step": 293946, "epoch": 2429} {"train_loss": -39.726661682128906, "global_step": 293947, "epoch": 2429} {"train_loss": -40.70180130004883, "global_step": 293948, "epoch": 2429} {"train_loss": -40.42267608642578, "global_step": 293949, "epoch": 2429} {"train_loss": -41.653724670410156, "global_step": 293950, "epoch": 2429} {"train_loss": -40.41181564331055, "global_step": 293951, "epoch": 2429} {"train_loss": -40.704978942871094, "global_step": 293952, "epoch": 2429} {"train_loss": -41.3298454284668, "global_step": 293953, "epoch": 2429} {"train_loss": -40.86465835571289, "global_step": 293954, "epoch": 2429} {"train_loss": -41.3446044921875, "global_step": 293955, "epoch": 2429} {"train_loss": -41.468605041503906, "global_step": 293956, "epoch": 2429} {"train_loss": -41.30349349975586, "global_step": 293957, "epoch": 2429} {"train_loss": -41.78968811035156, "global_step": 293958, "epoch": 2429} {"train_loss": -40.81155014038086, "global_step": 293959, "epoch": 2429} {"train_loss": -40.8341178894043, "global_step": 293960, "epoch": 2429} {"train_loss": -40.61997604370117, "global_step": 293961, "epoch": 2429} {"train_loss": -41.21023941040039, "global_step": 293962, "epoch": 2429} {"train_loss": -41.32619094848633, "global_step": 293963, "epoch": 2429} {"train_loss": -41.583831787109375, "global_step": 293964, "epoch": 2429} {"train_loss": -41.23984146118164, "global_step": 293965, "epoch": 2429} {"train_loss": -41.365848541259766, "global_step": 293966, "epoch": 2429} {"train_loss": -41.56473922729492, "global_step": 293967, "epoch": 2429} {"train_loss": -41.67653274536133, "global_step": 293968, "epoch": 2429} {"train_loss": -41.18304443359375, "global_step": 293969, "epoch": 2429} {"train_loss": -41.48850631713867, "global_step": 293970, "epoch": 2429} {"train_loss": -41.68900680541992, "global_step": 293971, "epoch": 2429} {"train_loss": -41.30371856689453, "global_step": 293972, "epoch": 2429} {"train_loss": -41.78181076049805, "global_step": 293973, "epoch": 2429} {"train_loss": -41.730403900146484, "global_step": 293974, "epoch": 2429} {"train_loss": -41.26198959350586, "global_step": 293975, "epoch": 2429} {"train_loss": -40.75434112548828, "global_step": 293976, "epoch": 2429} {"train_loss": -41.205955505371094, "global_step": 293977, "epoch": 2429} {"train_loss": -41.34086227416992, "global_step": 293978, "epoch": 2429} {"train_loss": -41.55464553833008, "global_step": 293979, "epoch": 2429} {"train_loss": -41.15243148803711, "global_step": 293980, "epoch": 2429} {"train_loss": -40.374874114990234, "global_step": 293981, "epoch": 2429} {"train_loss": -40.05990219116211, "global_step": 293982, "epoch": 2429} {"train_loss": -39.06715393066406, "global_step": 293983, "epoch": 2429} {"train_loss": -37.714107513427734, "global_step": 293984, "epoch": 2429} {"train_loss": -40.608192443847656, "global_step": 293985, "epoch": 2429} {"train_loss": -39.88981628417969, "global_step": 293986, "epoch": 2429} {"train_loss": -39.287322998046875, "global_step": 293987, "epoch": 2429} {"train_loss": -41.26784896850586, "global_step": 293988, "epoch": 2429} {"train_loss": -41.234649658203125, "global_step": 293989, "epoch": 2429} {"train_loss": -37.17612838745117, "global_step": 293990, "epoch": 2429} {"train_loss": -39.302734375, "global_step": 293991, "epoch": 2429} {"train_loss": -40.5585823059082, "global_step": 293992, "epoch": 2429} {"train_loss": -41.40227127075195, "global_step": 293993, "epoch": 2429} {"train_loss": -39.536834716796875, "global_step": 293994, "epoch": 2429} {"train_loss": -40.28338623046875, "global_step": 293995, "epoch": 2429} {"train_loss": -42.0553092956543, "global_step": 293996, "epoch": 2429} {"train_loss": -40.62736129760742, "global_step": 293997, "epoch": 2429} {"train_loss": -41.000221252441406, "global_step": 293998, "epoch": 2429} {"train_loss": -41.102481842041016, "global_step": 293999, "epoch": 2429} {"train_loss": -41.52073287963867, "global_step": 294000, "epoch": 2429} {"train_loss": -41.782081604003906, "global_step": 294001, "epoch": 2429} {"train_loss": -41.29328536987305, "global_step": 294002, "epoch": 2429} {"train_loss": -40.74423599243164, "global_step": 294003, "epoch": 2429} {"train_loss": -41.7668342590332, "global_step": 294004, "epoch": 2429} {"train_loss": -41.91889572143555, "global_step": 294005, "epoch": 2429} {"train_loss": -41.73799514770508, "global_step": 294006, "epoch": 2429} {"train_loss": -42.22758102416992, "global_step": 294007, "epoch": 2429} {"train_loss": -41.99993896484375, "global_step": 294008, "epoch": 2429} {"train_loss": -42.121761322021484, "global_step": 294009, "epoch": 2429} {"train_loss": -42.14242172241211, "global_step": 294010, "epoch": 2429} {"train_loss": -42.10669708251953, "global_step": 294011, "epoch": 2429} {"train_loss": -42.37710189819336, "global_step": 294012, "epoch": 2429} {"train_loss": -42.0374755859375, "global_step": 294013, "epoch": 2429} {"train_loss": -40.31755447387695, "global_step": 294014, "epoch": 2429} {"train_loss": -41.697181701660156, "global_step": 294015, "epoch": 2429} {"train_loss": -42.37523651123047, "global_step": 294016, "epoch": 2429} {"train_loss": -42.51044845581055, "global_step": 294017, "epoch": 2429} {"train_loss": -42.11049270629883, "global_step": 294018, "epoch": 2429} {"train_loss": -42.57265853881836, "global_step": 294019, "epoch": 2429} {"train_loss": -42.04404067993164, "global_step": 294020, "epoch": 2429} {"train_loss": -42.65791320800781, "global_step": 294021, "epoch": 2429} {"train_loss": -42.41478729248047, "global_step": 294022, "epoch": 2429} {"train_loss": -41.715248107910156, "global_step": 294023, "epoch": 2429} {"train_loss": -42.22848129272461, "global_step": 294024, "epoch": 2429} {"train_loss": -42.057132720947266, "global_step": 294025, "epoch": 2429} {"train_loss": -42.76792907714844, "global_step": 294026, "epoch": 2429} {"train_loss": -41.958621978759766, "global_step": 294027, "epoch": 2429} {"train_loss": -41.57866287231445, "global_step": 294028, "epoch": 2429} {"train_loss": -40.63990994918445, "global_step": 294029, "epoch": 2429, "val_loss": 2553970.25} {"train_loss": -39.61880874633789, "global_step": 294030, "epoch": 2430} {"train_loss": -40.2525749206543, "global_step": 294031, "epoch": 2430} {"train_loss": -41.56669998168945, "global_step": 294032, "epoch": 2430} {"train_loss": -40.591609954833984, "global_step": 294033, "epoch": 2430} {"train_loss": -40.49361801147461, "global_step": 294034, "epoch": 2430} {"train_loss": -41.505367279052734, "global_step": 294035, "epoch": 2430} {"train_loss": -42.28017807006836, "global_step": 294036, "epoch": 2430} {"train_loss": -41.355064392089844, "global_step": 294037, "epoch": 2430} {"train_loss": -41.79472732543945, "global_step": 294038, "epoch": 2430} {"train_loss": -41.29459762573242, "global_step": 294039, "epoch": 2430} {"train_loss": -40.589595794677734, "global_step": 294040, "epoch": 2430} {"train_loss": -41.92983627319336, "global_step": 294041, "epoch": 2430} {"train_loss": -42.14773178100586, "global_step": 294042, "epoch": 2430} {"train_loss": -40.560394287109375, "global_step": 294043, "epoch": 2430} {"train_loss": -40.17675018310547, "global_step": 294044, "epoch": 2430} {"train_loss": -42.10952377319336, "global_step": 294045, "epoch": 2430} {"train_loss": -41.96049880981445, "global_step": 294046, "epoch": 2430} {"train_loss": -41.459686279296875, "global_step": 294047, "epoch": 2430} {"train_loss": -38.28877639770508, "global_step": 294048, "epoch": 2430} {"train_loss": -41.99552917480469, "global_step": 294049, "epoch": 2430} {"train_loss": -41.50764083862305, "global_step": 294050, "epoch": 2430} {"train_loss": -42.41019058227539, "global_step": 294051, "epoch": 2430} {"train_loss": -42.3558235168457, "global_step": 294052, "epoch": 2430} {"train_loss": -42.0262565612793, "global_step": 294053, "epoch": 2430} {"train_loss": -41.99864959716797, "global_step": 294054, "epoch": 2430} {"train_loss": -41.827518463134766, "global_step": 294055, "epoch": 2430} {"train_loss": -42.64760971069336, "global_step": 294056, "epoch": 2430} {"train_loss": -42.30500411987305, "global_step": 294057, "epoch": 2430} {"train_loss": -42.28300094604492, "global_step": 294058, "epoch": 2430} {"train_loss": -42.48371124267578, "global_step": 294059, "epoch": 2430} {"train_loss": -42.8529052734375, "global_step": 294060, "epoch": 2430} {"train_loss": -42.81817626953125, "global_step": 294061, "epoch": 2430} {"train_loss": -42.96942901611328, "global_step": 294062, "epoch": 2430} {"train_loss": -41.87480926513672, "global_step": 294063, "epoch": 2430} {"train_loss": -42.8033447265625, "global_step": 294064, "epoch": 2430} {"train_loss": -41.40475082397461, "global_step": 294065, "epoch": 2430} {"train_loss": -42.4641227722168, "global_step": 294066, "epoch": 2430} {"train_loss": -42.28840255737305, "global_step": 294067, "epoch": 2430} {"train_loss": -41.8360481262207, "global_step": 294068, "epoch": 2430} {"train_loss": -40.72878646850586, "global_step": 294069, "epoch": 2430} {"train_loss": -42.18281173706055, "global_step": 294070, "epoch": 2430} {"train_loss": -42.36996841430664, "global_step": 294071, "epoch": 2430} {"train_loss": -41.97797775268555, "global_step": 294072, "epoch": 2430} {"train_loss": -42.740020751953125, "global_step": 294073, "epoch": 2430} {"train_loss": -41.48478698730469, "global_step": 294074, "epoch": 2430} {"train_loss": -42.522987365722656, "global_step": 294075, "epoch": 2430} {"train_loss": -42.161895751953125, "global_step": 294076, "epoch": 2430} {"train_loss": -42.28894805908203, "global_step": 294077, "epoch": 2430} {"train_loss": -41.4691047668457, "global_step": 294078, "epoch": 2430} {"train_loss": -42.80790710449219, "global_step": 294079, "epoch": 2430} {"train_loss": -42.00053024291992, "global_step": 294080, "epoch": 2430} {"train_loss": -42.52484893798828, "global_step": 294081, "epoch": 2430} {"train_loss": -42.34121322631836, "global_step": 294082, "epoch": 2430} {"train_loss": -41.69959259033203, "global_step": 294083, "epoch": 2430} {"train_loss": -42.34434509277344, "global_step": 294084, "epoch": 2430} {"train_loss": -41.19166946411133, "global_step": 294085, "epoch": 2430} {"train_loss": -40.68954086303711, "global_step": 294086, "epoch": 2430} {"train_loss": -42.9375114440918, "global_step": 294087, "epoch": 2430} {"train_loss": -42.16044998168945, "global_step": 294088, "epoch": 2430} {"train_loss": -41.4156608581543, "global_step": 294089, "epoch": 2430} {"train_loss": -39.053462982177734, "global_step": 294090, "epoch": 2430} {"train_loss": -36.964630126953125, "global_step": 294091, "epoch": 2430} {"train_loss": -36.42507553100586, "global_step": 294092, "epoch": 2430} {"train_loss": -40.8493766784668, "global_step": 294093, "epoch": 2430} {"train_loss": -40.3276481628418, "global_step": 294094, "epoch": 2430} {"train_loss": -35.29232406616211, "global_step": 294095, "epoch": 2430} {"train_loss": -41.04638671875, "global_step": 294096, "epoch": 2430} {"train_loss": -38.672027587890625, "global_step": 294097, "epoch": 2430} {"train_loss": -40.86295700073242, "global_step": 294098, "epoch": 2430} {"train_loss": -40.54056930541992, "global_step": 294099, "epoch": 2430} {"train_loss": -37.31912612915039, "global_step": 294100, "epoch": 2430} {"train_loss": -42.00136184692383, "global_step": 294101, "epoch": 2430} {"train_loss": -40.9042854309082, "global_step": 294102, "epoch": 2430} {"train_loss": -41.644161224365234, "global_step": 294103, "epoch": 2430} {"train_loss": -39.885284423828125, "global_step": 294104, "epoch": 2430} {"train_loss": -41.333797454833984, "global_step": 294105, "epoch": 2430} {"train_loss": -39.72459030151367, "global_step": 294106, "epoch": 2430} {"train_loss": -41.38228988647461, "global_step": 294107, "epoch": 2430} {"train_loss": -39.87177276611328, "global_step": 294108, "epoch": 2430} {"train_loss": -39.66438674926758, "global_step": 294109, "epoch": 2430} {"train_loss": -38.39699172973633, "global_step": 294110, "epoch": 2430} {"train_loss": -38.69639205932617, "global_step": 294111, "epoch": 2430} {"train_loss": -39.02724838256836, "global_step": 294112, "epoch": 2430} {"train_loss": -40.382041931152344, "global_step": 294113, "epoch": 2430} {"train_loss": -39.89616012573242, "global_step": 294114, "epoch": 2430} {"train_loss": -39.78878402709961, "global_step": 294115, "epoch": 2430} {"train_loss": -34.706939697265625, "global_step": 294116, "epoch": 2430} {"train_loss": -37.58320236206055, "global_step": 294117, "epoch": 2430} {"train_loss": -42.260902404785156, "global_step": 294118, "epoch": 2430} {"train_loss": -37.47256088256836, "global_step": 294119, "epoch": 2430} {"train_loss": -36.58028793334961, "global_step": 294120, "epoch": 2430} {"train_loss": -38.45237350463867, "global_step": 294121, "epoch": 2430} {"train_loss": -34.87978744506836, "global_step": 294122, "epoch": 2430} {"train_loss": -38.9750862121582, "global_step": 294123, "epoch": 2430} {"train_loss": -32.553321838378906, "global_step": 294124, "epoch": 2430} {"train_loss": -36.702056884765625, "global_step": 294125, "epoch": 2430} {"train_loss": -34.60972213745117, "global_step": 294126, "epoch": 2430} {"train_loss": -30.207128524780273, "global_step": 294127, "epoch": 2430} {"train_loss": -36.11182403564453, "global_step": 294128, "epoch": 2430} {"train_loss": -38.72282028198242, "global_step": 294129, "epoch": 2430} {"train_loss": -34.06147766113281, "global_step": 294130, "epoch": 2430} {"train_loss": -37.949676513671875, "global_step": 294131, "epoch": 2430} {"train_loss": -34.85755157470703, "global_step": 294132, "epoch": 2430} {"train_loss": -34.79609298706055, "global_step": 294133, "epoch": 2430} {"train_loss": -38.815391540527344, "global_step": 294134, "epoch": 2430} {"train_loss": -38.06916427612305, "global_step": 294135, "epoch": 2430} {"train_loss": -32.780216217041016, "global_step": 294136, "epoch": 2430} {"train_loss": -38.34846115112305, "global_step": 294137, "epoch": 2430} {"train_loss": -37.99164581298828, "global_step": 294138, "epoch": 2430} {"train_loss": -36.708038330078125, "global_step": 294139, "epoch": 2430} {"train_loss": -36.455108642578125, "global_step": 294140, "epoch": 2430} {"train_loss": -38.141754150390625, "global_step": 294141, "epoch": 2430} {"train_loss": -38.38662338256836, "global_step": 294142, "epoch": 2430} {"train_loss": -39.74119186401367, "global_step": 294143, "epoch": 2430} {"train_loss": -39.53162384033203, "global_step": 294144, "epoch": 2430} {"train_loss": -38.938804626464844, "global_step": 294145, "epoch": 2430} {"train_loss": -39.02626419067383, "global_step": 294146, "epoch": 2430} {"train_loss": -39.32026290893555, "global_step": 294147, "epoch": 2430} {"train_loss": -37.709693908691406, "global_step": 294148, "epoch": 2430} {"train_loss": -39.857994079589844, "global_step": 294149, "epoch": 2430} {"train_loss": -39.989909447914314, "global_step": 294150, "epoch": 2430, "val_loss": 2978810.0} {"train_loss": -39.947288513183594, "global_step": 294151, "epoch": 2431} {"train_loss": -39.66946029663086, "global_step": 294152, "epoch": 2431} {"train_loss": -39.1201286315918, "global_step": 294153, "epoch": 2431} {"train_loss": -39.81386947631836, "global_step": 294154, "epoch": 2431} {"train_loss": -37.61408233642578, "global_step": 294155, "epoch": 2431} {"train_loss": -39.80434799194336, "global_step": 294156, "epoch": 2431} {"train_loss": -38.44649124145508, "global_step": 294157, "epoch": 2431} {"train_loss": -39.36160659790039, "global_step": 294158, "epoch": 2431} {"train_loss": -38.23518753051758, "global_step": 294159, "epoch": 2431} {"train_loss": -36.641761779785156, "global_step": 294160, "epoch": 2431} {"train_loss": -36.7569694519043, "global_step": 294161, "epoch": 2431} {"train_loss": -38.963130950927734, "global_step": 294162, "epoch": 2431} {"train_loss": -40.20734405517578, "global_step": 294163, "epoch": 2431} {"train_loss": -40.16701889038086, "global_step": 294164, "epoch": 2431} {"train_loss": -39.67551803588867, "global_step": 294165, "epoch": 2431} {"train_loss": -39.27003860473633, "global_step": 294166, "epoch": 2431} {"train_loss": -40.498573303222656, "global_step": 294167, "epoch": 2431} {"train_loss": -40.821632385253906, "global_step": 294168, "epoch": 2431} {"train_loss": -40.32499313354492, "global_step": 294169, "epoch": 2431} {"train_loss": -40.166015625, "global_step": 294170, "epoch": 2431} {"train_loss": -40.59132766723633, "global_step": 294171, "epoch": 2431} {"train_loss": -40.760040283203125, "global_step": 294172, "epoch": 2431} {"train_loss": -40.47860336303711, "global_step": 294173, "epoch": 2431} {"train_loss": -40.63077926635742, "global_step": 294174, "epoch": 2431} {"train_loss": -40.52201461791992, "global_step": 294175, "epoch": 2431} {"train_loss": -40.69561767578125, "global_step": 294176, "epoch": 2431} {"train_loss": -39.730926513671875, "global_step": 294177, "epoch": 2431} {"train_loss": -40.19736862182617, "global_step": 294178, "epoch": 2431} {"train_loss": -40.58622360229492, "global_step": 294179, "epoch": 2431} {"train_loss": -40.891841888427734, "global_step": 294180, "epoch": 2431} {"train_loss": -40.256256103515625, "global_step": 294181, "epoch": 2431} {"train_loss": -39.69430923461914, "global_step": 294182, "epoch": 2431} {"train_loss": -40.055599212646484, "global_step": 294183, "epoch": 2431} {"train_loss": -39.30488586425781, "global_step": 294184, "epoch": 2431} {"train_loss": -39.392364501953125, "global_step": 294185, "epoch": 2431} {"train_loss": -41.317291259765625, "global_step": 294186, "epoch": 2431} {"train_loss": -40.78031539916992, "global_step": 294187, "epoch": 2431} {"train_loss": -40.74094009399414, "global_step": 294188, "epoch": 2431} {"train_loss": -39.41978073120117, "global_step": 294189, "epoch": 2431} {"train_loss": -40.393455505371094, "global_step": 294190, "epoch": 2431} {"train_loss": -41.04127502441406, "global_step": 294191, "epoch": 2431} {"train_loss": -40.301143646240234, "global_step": 294192, "epoch": 2431} {"train_loss": -40.35863494873047, "global_step": 294193, "epoch": 2431} {"train_loss": -40.81205368041992, "global_step": 294194, "epoch": 2431} {"train_loss": -40.1898307800293, "global_step": 294195, "epoch": 2431} {"train_loss": -41.2205696105957, "global_step": 294196, "epoch": 2431} {"train_loss": -41.32523727416992, "global_step": 294197, "epoch": 2431} {"train_loss": -40.80216598510742, "global_step": 294198, "epoch": 2431} {"train_loss": -41.39138412475586, "global_step": 294199, "epoch": 2431} {"train_loss": -41.4146842956543, "global_step": 294200, "epoch": 2431} {"train_loss": -40.06594467163086, "global_step": 294201, "epoch": 2431} {"train_loss": -42.03712844848633, "global_step": 294202, "epoch": 2431} {"train_loss": -41.51066970825195, "global_step": 294203, "epoch": 2431} {"train_loss": -40.96736526489258, "global_step": 294204, "epoch": 2431} {"train_loss": -41.96628952026367, "global_step": 294205, "epoch": 2431} {"train_loss": -40.749874114990234, "global_step": 294206, "epoch": 2431} {"train_loss": -41.37876892089844, "global_step": 294207, "epoch": 2431} {"train_loss": -42.04862976074219, "global_step": 294208, "epoch": 2431} {"train_loss": -41.530250549316406, "global_step": 294209, "epoch": 2431} {"train_loss": -41.60316467285156, "global_step": 294210, "epoch": 2431} {"train_loss": -41.47846984863281, "global_step": 294211, "epoch": 2431} {"train_loss": -41.99745559692383, "global_step": 294212, "epoch": 2431} {"train_loss": -41.303585052490234, "global_step": 294213, "epoch": 2431} {"train_loss": -41.172306060791016, "global_step": 294214, "epoch": 2431} {"train_loss": -41.38993453979492, "global_step": 294215, "epoch": 2431} {"train_loss": -41.82182312011719, "global_step": 294216, "epoch": 2431} {"train_loss": -41.560546875, "global_step": 294217, "epoch": 2431} {"train_loss": -42.17958450317383, "global_step": 294218, "epoch": 2431} {"train_loss": -42.42142105102539, "global_step": 294219, "epoch": 2431} {"train_loss": -41.435791015625, "global_step": 294220, "epoch": 2431} {"train_loss": -41.47492599487305, "global_step": 294221, "epoch": 2431} {"train_loss": -41.62889862060547, "global_step": 294222, "epoch": 2431} {"train_loss": -41.10184860229492, "global_step": 294223, "epoch": 2431} {"train_loss": -42.0837287902832, "global_step": 294224, "epoch": 2431} {"train_loss": -41.64625930786133, "global_step": 294225, "epoch": 2431} {"train_loss": -41.22933578491211, "global_step": 294226, "epoch": 2431} {"train_loss": -39.1500244140625, "global_step": 294227, "epoch": 2431} {"train_loss": -37.80892562866211, "global_step": 294228, "epoch": 2431} {"train_loss": -35.958160400390625, "global_step": 294229, "epoch": 2431} {"train_loss": -34.075401306152344, "global_step": 294230, "epoch": 2431} {"train_loss": -40.63096237182617, "global_step": 294231, "epoch": 2431} {"train_loss": -37.56222152709961, "global_step": 294232, "epoch": 2431} {"train_loss": -35.06319046020508, "global_step": 294233, "epoch": 2431} {"train_loss": -41.35789108276367, "global_step": 294234, "epoch": 2431} {"train_loss": -37.0719108581543, "global_step": 294235, "epoch": 2431} {"train_loss": -40.45384979248047, "global_step": 294236, "epoch": 2431} {"train_loss": -40.1693229675293, "global_step": 294237, "epoch": 2431} {"train_loss": -40.92616271972656, "global_step": 294238, "epoch": 2431} {"train_loss": -38.61519241333008, "global_step": 294239, "epoch": 2431} {"train_loss": -41.00484848022461, "global_step": 294240, "epoch": 2431} {"train_loss": -39.72222137451172, "global_step": 294241, "epoch": 2431} {"train_loss": -41.20735549926758, "global_step": 294242, "epoch": 2431} {"train_loss": -41.071773529052734, "global_step": 294243, "epoch": 2431} {"train_loss": -36.38743209838867, "global_step": 294244, "epoch": 2431} {"train_loss": -40.152320861816406, "global_step": 294245, "epoch": 2431} {"train_loss": -41.16756820678711, "global_step": 294246, "epoch": 2431} {"train_loss": -40.964698791503906, "global_step": 294247, "epoch": 2431} {"train_loss": -40.6947135925293, "global_step": 294248, "epoch": 2431} {"train_loss": -40.79148483276367, "global_step": 294249, "epoch": 2431} {"train_loss": -39.477352142333984, "global_step": 294250, "epoch": 2431} {"train_loss": -40.7723503112793, "global_step": 294251, "epoch": 2431} {"train_loss": -39.8331413269043, "global_step": 294252, "epoch": 2431} {"train_loss": -40.146942138671875, "global_step": 294253, "epoch": 2431} {"train_loss": -39.19511032104492, "global_step": 294254, "epoch": 2431} {"train_loss": -40.00822067260742, "global_step": 294255, "epoch": 2431} {"train_loss": -39.934444427490234, "global_step": 294256, "epoch": 2431} {"train_loss": -41.28003692626953, "global_step": 294257, "epoch": 2431} {"train_loss": -40.71268844604492, "global_step": 294258, "epoch": 2431} {"train_loss": -40.4280891418457, "global_step": 294259, "epoch": 2431} {"train_loss": -40.44982147216797, "global_step": 294260, "epoch": 2431} {"train_loss": -40.02964782714844, "global_step": 294261, "epoch": 2431} {"train_loss": -40.657691955566406, "global_step": 294262, "epoch": 2431} {"train_loss": -41.44694519042969, "global_step": 294263, "epoch": 2431} {"train_loss": -41.3772087097168, "global_step": 294264, "epoch": 2431} {"train_loss": -41.09493637084961, "global_step": 294265, "epoch": 2431} {"train_loss": -40.434844970703125, "global_step": 294266, "epoch": 2431} {"train_loss": -40.18865966796875, "global_step": 294267, "epoch": 2431} {"train_loss": -41.38591384887695, "global_step": 294268, "epoch": 2431} {"train_loss": -38.42196273803711, "global_step": 294269, "epoch": 2431} {"train_loss": -41.052730560302734, "global_step": 294270, "epoch": 2431} {"train_loss": -40.26955038653917, "global_step": 294271, "epoch": 2431, "val_loss": 2697440.5} {"train_loss": -41.3877067565918, "global_step": 294272, "epoch": 2432} {"train_loss": -39.406036376953125, "global_step": 294273, "epoch": 2432} {"train_loss": -39.47652053833008, "global_step": 294274, "epoch": 2432} {"train_loss": -41.13137435913086, "global_step": 294275, "epoch": 2432} {"train_loss": -40.07911682128906, "global_step": 294276, "epoch": 2432} {"train_loss": -41.15312957763672, "global_step": 294277, "epoch": 2432} {"train_loss": -39.67081069946289, "global_step": 294278, "epoch": 2432} {"train_loss": -41.01039505004883, "global_step": 294279, "epoch": 2432} {"train_loss": -40.94981002807617, "global_step": 294280, "epoch": 2432} {"train_loss": -40.09517288208008, "global_step": 294281, "epoch": 2432} {"train_loss": -41.377132415771484, "global_step": 294282, "epoch": 2432} {"train_loss": -41.12192916870117, "global_step": 294283, "epoch": 2432} {"train_loss": -39.60124588012695, "global_step": 294284, "epoch": 2432} {"train_loss": -40.1512565612793, "global_step": 294285, "epoch": 2432} {"train_loss": -41.69864273071289, "global_step": 294286, "epoch": 2432} {"train_loss": -40.00146484375, "global_step": 294287, "epoch": 2432} {"train_loss": -41.47357940673828, "global_step": 294288, "epoch": 2432} {"train_loss": -39.46744918823242, "global_step": 294289, "epoch": 2432} {"train_loss": -41.47907638549805, "global_step": 294290, "epoch": 2432} {"train_loss": -40.594356536865234, "global_step": 294291, "epoch": 2432} {"train_loss": -40.0887451171875, "global_step": 294292, "epoch": 2432} {"train_loss": -41.322086334228516, "global_step": 294293, "epoch": 2432} {"train_loss": -42.39272689819336, "global_step": 294294, "epoch": 2432} {"train_loss": -40.86431121826172, "global_step": 294295, "epoch": 2432} {"train_loss": -40.71133041381836, "global_step": 294296, "epoch": 2432} {"train_loss": -40.26225280761719, "global_step": 294297, "epoch": 2432} {"train_loss": -41.19956588745117, "global_step": 294298, "epoch": 2432} {"train_loss": -42.056549072265625, "global_step": 294299, "epoch": 2432} {"train_loss": -34.86528396606445, "global_step": 294300, "epoch": 2432} {"train_loss": -41.41185760498047, "global_step": 294301, "epoch": 2432} {"train_loss": -41.2740364074707, "global_step": 294302, "epoch": 2432} {"train_loss": -41.45613479614258, "global_step": 294303, "epoch": 2432} {"train_loss": -41.69912338256836, "global_step": 294304, "epoch": 2432} {"train_loss": -39.86124038696289, "global_step": 294305, "epoch": 2432} {"train_loss": -41.015724182128906, "global_step": 294306, "epoch": 2432} {"train_loss": -41.887386322021484, "global_step": 294307, "epoch": 2432} {"train_loss": -41.56748580932617, "global_step": 294308, "epoch": 2432} {"train_loss": -40.9485969543457, "global_step": 294309, "epoch": 2432} {"train_loss": -40.6197395324707, "global_step": 294310, "epoch": 2432} {"train_loss": -41.836849212646484, "global_step": 294311, "epoch": 2432} {"train_loss": -41.45532989501953, "global_step": 294312, "epoch": 2432} {"train_loss": -42.0078125, "global_step": 294313, "epoch": 2432} {"train_loss": -40.29437255859375, "global_step": 294314, "epoch": 2432} {"train_loss": -40.720947265625, "global_step": 294315, "epoch": 2432} {"train_loss": -41.39314270019531, "global_step": 294316, "epoch": 2432} {"train_loss": -40.88478088378906, "global_step": 294317, "epoch": 2432} {"train_loss": -41.28950881958008, "global_step": 294318, "epoch": 2432} {"train_loss": -41.65540313720703, "global_step": 294319, "epoch": 2432} {"train_loss": -39.60288619995117, "global_step": 294320, "epoch": 2432} {"train_loss": -41.47736358642578, "global_step": 294321, "epoch": 2432} {"train_loss": -41.98456573486328, "global_step": 294322, "epoch": 2432} {"train_loss": -40.85771179199219, "global_step": 294323, "epoch": 2432} {"train_loss": -41.333248138427734, "global_step": 294324, "epoch": 2432} {"train_loss": -41.069087982177734, "global_step": 294325, "epoch": 2432} {"train_loss": -42.01530075073242, "global_step": 294326, "epoch": 2432} {"train_loss": -41.04365158081055, "global_step": 294327, "epoch": 2432} {"train_loss": -42.100704193115234, "global_step": 294328, "epoch": 2432} {"train_loss": -42.3281364440918, "global_step": 294329, "epoch": 2432} {"train_loss": -42.2780876159668, "global_step": 294330, "epoch": 2432} {"train_loss": -41.5008659362793, "global_step": 294331, "epoch": 2432} {"train_loss": -41.23401641845703, "global_step": 294332, "epoch": 2432} {"train_loss": -42.04273223876953, "global_step": 294333, "epoch": 2432} {"train_loss": -42.47391128540039, "global_step": 294334, "epoch": 2432} {"train_loss": -40.98688888549805, "global_step": 294335, "epoch": 2432} {"train_loss": -41.924560546875, "global_step": 294336, "epoch": 2432} {"train_loss": -41.47687911987305, "global_step": 294337, "epoch": 2432} {"train_loss": -42.29648208618164, "global_step": 294338, "epoch": 2432} {"train_loss": -40.17977523803711, "global_step": 294339, "epoch": 2432} {"train_loss": -42.565948486328125, "global_step": 294340, "epoch": 2432} {"train_loss": -41.502071380615234, "global_step": 294341, "epoch": 2432} {"train_loss": -42.56818771362305, "global_step": 294342, "epoch": 2432} {"train_loss": -42.10807800292969, "global_step": 294343, "epoch": 2432} {"train_loss": -41.479766845703125, "global_step": 294344, "epoch": 2432} {"train_loss": -40.16996383666992, "global_step": 294345, "epoch": 2432} {"train_loss": -41.512298583984375, "global_step": 294346, "epoch": 2432} {"train_loss": -40.58015823364258, "global_step": 294347, "epoch": 2432} {"train_loss": -38.242591857910156, "global_step": 294348, "epoch": 2432} {"train_loss": -40.37091064453125, "global_step": 294349, "epoch": 2432} {"train_loss": -40.9982795715332, "global_step": 294350, "epoch": 2432} {"train_loss": -42.073448181152344, "global_step": 294351, "epoch": 2432} {"train_loss": -41.670997619628906, "global_step": 294352, "epoch": 2432} {"train_loss": -39.745208740234375, "global_step": 294353, "epoch": 2432} {"train_loss": -42.003662109375, "global_step": 294354, "epoch": 2432} {"train_loss": -39.61232376098633, "global_step": 294355, "epoch": 2432} {"train_loss": -39.50846481323242, "global_step": 294356, "epoch": 2432} {"train_loss": -38.00156021118164, "global_step": 294357, "epoch": 2432} {"train_loss": -41.37946319580078, "global_step": 294358, "epoch": 2432} {"train_loss": -38.99007797241211, "global_step": 294359, "epoch": 2432} {"train_loss": -38.78133010864258, "global_step": 294360, "epoch": 2432} {"train_loss": -40.08867263793945, "global_step": 294361, "epoch": 2432} {"train_loss": -37.90530014038086, "global_step": 294362, "epoch": 2432} {"train_loss": -30.160343170166016, "global_step": 294363, "epoch": 2432} {"train_loss": -40.14984893798828, "global_step": 294364, "epoch": 2432} {"train_loss": -41.478885650634766, "global_step": 294365, "epoch": 2432} {"train_loss": -41.393611907958984, "global_step": 294366, "epoch": 2432} {"train_loss": -40.54713821411133, "global_step": 294367, "epoch": 2432} {"train_loss": -41.20827102661133, "global_step": 294368, "epoch": 2432} {"train_loss": -41.139869689941406, "global_step": 294369, "epoch": 2432} {"train_loss": -38.72167205810547, "global_step": 294370, "epoch": 2432} {"train_loss": -41.23893356323242, "global_step": 294371, "epoch": 2432} {"train_loss": -41.12954330444336, "global_step": 294372, "epoch": 2432} {"train_loss": -41.116737365722656, "global_step": 294373, "epoch": 2432} {"train_loss": -41.55860900878906, "global_step": 294374, "epoch": 2432} {"train_loss": -39.067195892333984, "global_step": 294375, "epoch": 2432} {"train_loss": -41.95581817626953, "global_step": 294376, "epoch": 2432} {"train_loss": -41.85382843017578, "global_step": 294377, "epoch": 2432} {"train_loss": -40.1168327331543, "global_step": 294378, "epoch": 2432} {"train_loss": -41.62469482421875, "global_step": 294379, "epoch": 2432} {"train_loss": -41.56428909301758, "global_step": 294380, "epoch": 2432} {"train_loss": -40.11878967285156, "global_step": 294381, "epoch": 2432} {"train_loss": -40.63045120239258, "global_step": 294382, "epoch": 2432} {"train_loss": -41.34080123901367, "global_step": 294383, "epoch": 2432} {"train_loss": -41.073360443115234, "global_step": 294384, "epoch": 2432} {"train_loss": -41.649593353271484, "global_step": 294385, "epoch": 2432} {"train_loss": -40.98696517944336, "global_step": 294386, "epoch": 2432} {"train_loss": -38.013668060302734, "global_step": 294387, "epoch": 2432} {"train_loss": -40.03036117553711, "global_step": 294388, "epoch": 2432} {"train_loss": -40.998382568359375, "global_step": 294389, "epoch": 2432} {"train_loss": -39.977779388427734, "global_step": 294390, "epoch": 2432} {"train_loss": -41.4008674621582, "global_step": 294391, "epoch": 2432} {"train_loss": -40.76747966797884, "global_step": 294392, "epoch": 2432, "val_loss": 3147802.0} {"train_loss": -40.410919189453125, "global_step": 294393, "epoch": 2433} {"train_loss": -40.73374557495117, "global_step": 294394, "epoch": 2433} {"train_loss": -41.12921905517578, "global_step": 294395, "epoch": 2433} {"train_loss": -40.36298370361328, "global_step": 294396, "epoch": 2433} {"train_loss": -40.15861129760742, "global_step": 294397, "epoch": 2433} {"train_loss": -41.19709014892578, "global_step": 294398, "epoch": 2433} {"train_loss": -39.8156852722168, "global_step": 294399, "epoch": 2433} {"train_loss": -40.98154830932617, "global_step": 294400, "epoch": 2433} {"train_loss": -42.13822555541992, "global_step": 294401, "epoch": 2433} {"train_loss": -39.17033004760742, "global_step": 294402, "epoch": 2433} {"train_loss": -40.32000732421875, "global_step": 294403, "epoch": 2433} {"train_loss": -41.50770950317383, "global_step": 294404, "epoch": 2433} {"train_loss": -39.645259857177734, "global_step": 294405, "epoch": 2433} {"train_loss": -41.55902099609375, "global_step": 294406, "epoch": 2433} {"train_loss": -40.9641227722168, "global_step": 294407, "epoch": 2433} {"train_loss": -41.91848373413086, "global_step": 294408, "epoch": 2433} {"train_loss": -41.754302978515625, "global_step": 294409, "epoch": 2433} {"train_loss": -41.86075973510742, "global_step": 294410, "epoch": 2433} {"train_loss": -41.15912628173828, "global_step": 294411, "epoch": 2433} {"train_loss": -35.266082763671875, "global_step": 294412, "epoch": 2433} {"train_loss": -41.61056137084961, "global_step": 294413, "epoch": 2433} {"train_loss": -39.33369827270508, "global_step": 294414, "epoch": 2433} {"train_loss": -41.68123245239258, "global_step": 294415, "epoch": 2433} {"train_loss": -41.45240783691406, "global_step": 294416, "epoch": 2433} {"train_loss": -40.675411224365234, "global_step": 294417, "epoch": 2433} {"train_loss": -40.38332748413086, "global_step": 294418, "epoch": 2433} {"train_loss": -38.10005569458008, "global_step": 294419, "epoch": 2433} {"train_loss": -40.76422119140625, "global_step": 294420, "epoch": 2433} {"train_loss": -39.9503288269043, "global_step": 294421, "epoch": 2433} {"train_loss": -38.30350875854492, "global_step": 294422, "epoch": 2433} {"train_loss": -40.433536529541016, "global_step": 294423, "epoch": 2433} {"train_loss": -41.82196807861328, "global_step": 294424, "epoch": 2433} {"train_loss": -40.86170196533203, "global_step": 294425, "epoch": 2433} {"train_loss": -38.96638870239258, "global_step": 294426, "epoch": 2433} {"train_loss": -38.45779800415039, "global_step": 294427, "epoch": 2433} {"train_loss": -41.57723617553711, "global_step": 294428, "epoch": 2433} {"train_loss": -41.30177688598633, "global_step": 294429, "epoch": 2433} {"train_loss": -40.43044662475586, "global_step": 294430, "epoch": 2433} {"train_loss": -40.64229965209961, "global_step": 294431, "epoch": 2433} {"train_loss": -41.732086181640625, "global_step": 294432, "epoch": 2433} {"train_loss": -40.99918746948242, "global_step": 294433, "epoch": 2433} {"train_loss": -42.21697998046875, "global_step": 294434, "epoch": 2433} {"train_loss": -39.42645263671875, "global_step": 294435, "epoch": 2433} {"train_loss": -41.36924362182617, "global_step": 294436, "epoch": 2433} {"train_loss": -40.75621032714844, "global_step": 294437, "epoch": 2433} {"train_loss": -35.23347854614258, "global_step": 294438, "epoch": 2433} {"train_loss": -41.57108688354492, "global_step": 294439, "epoch": 2433} {"train_loss": -40.54607009887695, "global_step": 294440, "epoch": 2433} {"train_loss": -41.01505661010742, "global_step": 294441, "epoch": 2433} {"train_loss": -39.997772216796875, "global_step": 294442, "epoch": 2433} {"train_loss": -40.296531677246094, "global_step": 294443, "epoch": 2433} {"train_loss": -39.64177322387695, "global_step": 294444, "epoch": 2433} {"train_loss": -40.57225036621094, "global_step": 294445, "epoch": 2433} {"train_loss": -37.949440002441406, "global_step": 294446, "epoch": 2433} {"train_loss": -41.039886474609375, "global_step": 294447, "epoch": 2433} {"train_loss": -40.35527801513672, "global_step": 294448, "epoch": 2433} {"train_loss": -38.43806076049805, "global_step": 294449, "epoch": 2433} {"train_loss": -39.84052276611328, "global_step": 294450, "epoch": 2433} {"train_loss": -38.080745697021484, "global_step": 294451, "epoch": 2433} {"train_loss": -33.75367736816406, "global_step": 294452, "epoch": 2433} {"train_loss": -39.685943603515625, "global_step": 294453, "epoch": 2433} {"train_loss": -37.999149322509766, "global_step": 294454, "epoch": 2433} {"train_loss": -40.66997528076172, "global_step": 294455, "epoch": 2433} {"train_loss": -36.971858978271484, "global_step": 294456, "epoch": 2433} {"train_loss": -24.3617000579834, "global_step": 294457, "epoch": 2433} {"train_loss": -33.01983642578125, "global_step": 294458, "epoch": 2433} {"train_loss": -19.886747360229492, "global_step": 294459, "epoch": 2433} {"train_loss": -38.861236572265625, "global_step": 294460, "epoch": 2433} {"train_loss": -15.457844734191895, "global_step": 294461, "epoch": 2433} {"train_loss": -30.238574981689453, "global_step": 294462, "epoch": 2433} {"train_loss": -33.13953399658203, "global_step": 294463, "epoch": 2433} {"train_loss": -36.985721588134766, "global_step": 294464, "epoch": 2433} {"train_loss": -36.67031478881836, "global_step": 294465, "epoch": 2433} {"train_loss": -34.52012634277344, "global_step": 294466, "epoch": 2433} {"train_loss": -35.46241760253906, "global_step": 294467, "epoch": 2433} {"train_loss": -37.17751693725586, "global_step": 294468, "epoch": 2433} {"train_loss": -37.82072830200195, "global_step": 294469, "epoch": 2433} {"train_loss": -33.77450942993164, "global_step": 294470, "epoch": 2433} {"train_loss": -37.686344146728516, "global_step": 294471, "epoch": 2433} {"train_loss": -38.43559265136719, "global_step": 294472, "epoch": 2433} {"train_loss": -38.39448928833008, "global_step": 294473, "epoch": 2433} {"train_loss": -36.31663131713867, "global_step": 294474, "epoch": 2433} {"train_loss": -38.442420959472656, "global_step": 294475, "epoch": 2433} {"train_loss": -38.303955078125, "global_step": 294476, "epoch": 2433} {"train_loss": -39.06850051879883, "global_step": 294477, "epoch": 2433} {"train_loss": -38.549312591552734, "global_step": 294478, "epoch": 2433} {"train_loss": -39.27199935913086, "global_step": 294479, "epoch": 2433} {"train_loss": -38.35823440551758, "global_step": 294480, "epoch": 2433} {"train_loss": -38.50786209106445, "global_step": 294481, "epoch": 2433} {"train_loss": -39.6861686706543, "global_step": 294482, "epoch": 2433} {"train_loss": -38.39181900024414, "global_step": 294483, "epoch": 2433} {"train_loss": -38.885406494140625, "global_step": 294484, "epoch": 2433} {"train_loss": -38.77989959716797, "global_step": 294485, "epoch": 2433} {"train_loss": -39.51203536987305, "global_step": 294486, "epoch": 2433} {"train_loss": -39.32889938354492, "global_step": 294487, "epoch": 2433} {"train_loss": -39.014076232910156, "global_step": 294488, "epoch": 2433} {"train_loss": -39.44487380981445, "global_step": 294489, "epoch": 2433} {"train_loss": -38.196258544921875, "global_step": 294490, "epoch": 2433} {"train_loss": -38.9620475769043, "global_step": 294491, "epoch": 2433} {"train_loss": -39.45307922363281, "global_step": 294492, "epoch": 2433} {"train_loss": -39.968257904052734, "global_step": 294493, "epoch": 2433} {"train_loss": -39.81200408935547, "global_step": 294494, "epoch": 2433} {"train_loss": -39.23786926269531, "global_step": 294495, "epoch": 2433} {"train_loss": -40.1347541809082, "global_step": 294496, "epoch": 2433} {"train_loss": -39.895809173583984, "global_step": 294497, "epoch": 2433} {"train_loss": -40.098854064941406, "global_step": 294498, "epoch": 2433} {"train_loss": -40.417999267578125, "global_step": 294499, "epoch": 2433} {"train_loss": -40.1656379699707, "global_step": 294500, "epoch": 2433} {"train_loss": -39.98495101928711, "global_step": 294501, "epoch": 2433} {"train_loss": -39.97213363647461, "global_step": 294502, "epoch": 2433} {"train_loss": -39.99277877807617, "global_step": 294503, "epoch": 2433} {"train_loss": -40.255775451660156, "global_step": 294504, "epoch": 2433} {"train_loss": -39.796356201171875, "global_step": 294505, "epoch": 2433} {"train_loss": -40.41645431518555, "global_step": 294506, "epoch": 2433} {"train_loss": -39.79320526123047, "global_step": 294507, "epoch": 2433} {"train_loss": -40.318275451660156, "global_step": 294508, "epoch": 2433} {"train_loss": -40.58644104003906, "global_step": 294509, "epoch": 2433} {"train_loss": -40.6067008972168, "global_step": 294510, "epoch": 2433} {"train_loss": -40.7913932800293, "global_step": 294511, "epoch": 2433} {"train_loss": -40.86391830444336, "global_step": 294512, "epoch": 2433} {"train_loss": -38.91908419427793, "global_step": 294513, "epoch": 2433, "val_loss": 2516410.75} {"train_loss": -40.83961868286133, "global_step": 294514, "epoch": 2434} {"train_loss": -41.039329528808594, "global_step": 294515, "epoch": 2434} {"train_loss": -40.335811614990234, "global_step": 294516, "epoch": 2434} {"train_loss": -40.725311279296875, "global_step": 294517, "epoch": 2434} {"train_loss": -40.06440353393555, "global_step": 294518, "epoch": 2434} {"train_loss": -41.02592468261719, "global_step": 294519, "epoch": 2434} {"train_loss": -40.9400634765625, "global_step": 294520, "epoch": 2434} {"train_loss": -39.73568344116211, "global_step": 294521, "epoch": 2434} {"train_loss": -40.90827178955078, "global_step": 294522, "epoch": 2434} {"train_loss": -40.4791259765625, "global_step": 294523, "epoch": 2434} {"train_loss": -41.37318801879883, "global_step": 294524, "epoch": 2434} {"train_loss": -41.33504867553711, "global_step": 294525, "epoch": 2434} {"train_loss": -41.23618698120117, "global_step": 294526, "epoch": 2434} {"train_loss": -41.49360275268555, "global_step": 294527, "epoch": 2434} {"train_loss": -41.612815856933594, "global_step": 294528, "epoch": 2434} {"train_loss": -41.210784912109375, "global_step": 294529, "epoch": 2434} {"train_loss": -41.283966064453125, "global_step": 294530, "epoch": 2434} {"train_loss": -41.18040084838867, "global_step": 294531, "epoch": 2434} {"train_loss": -41.14226531982422, "global_step": 294532, "epoch": 2434} {"train_loss": -41.3535270690918, "global_step": 294533, "epoch": 2434} {"train_loss": -40.70537185668945, "global_step": 294534, "epoch": 2434} {"train_loss": -41.01646041870117, "global_step": 294535, "epoch": 2434} {"train_loss": -41.05765914916992, "global_step": 294536, "epoch": 2434} {"train_loss": -41.540767669677734, "global_step": 294537, "epoch": 2434} {"train_loss": -40.835506439208984, "global_step": 294538, "epoch": 2434} {"train_loss": -42.035457611083984, "global_step": 294539, "epoch": 2434} {"train_loss": -41.80575942993164, "global_step": 294540, "epoch": 2434} {"train_loss": -41.42205810546875, "global_step": 294541, "epoch": 2434} {"train_loss": -41.2457275390625, "global_step": 294542, "epoch": 2434} {"train_loss": -41.32598114013672, "global_step": 294543, "epoch": 2434} {"train_loss": -41.385684967041016, "global_step": 294544, "epoch": 2434} {"train_loss": -41.64191436767578, "global_step": 294545, "epoch": 2434} {"train_loss": -41.51240158081055, "global_step": 294546, "epoch": 2434} {"train_loss": -41.70844268798828, "global_step": 294547, "epoch": 2434} {"train_loss": -41.64198303222656, "global_step": 294548, "epoch": 2434} {"train_loss": -42.116268157958984, "global_step": 294549, "epoch": 2434} {"train_loss": -41.582359313964844, "global_step": 294550, "epoch": 2434} {"train_loss": -41.85432052612305, "global_step": 294551, "epoch": 2434} {"train_loss": -41.07538986206055, "global_step": 294552, "epoch": 2434} {"train_loss": -41.681983947753906, "global_step": 294553, "epoch": 2434} {"train_loss": -41.6103401184082, "global_step": 294554, "epoch": 2434} {"train_loss": -41.69355010986328, "global_step": 294555, "epoch": 2434} {"train_loss": -42.2529182434082, "global_step": 294556, "epoch": 2434} {"train_loss": -42.281314849853516, "global_step": 294557, "epoch": 2434} {"train_loss": -42.09530258178711, "global_step": 294558, "epoch": 2434} {"train_loss": -42.22683334350586, "global_step": 294559, "epoch": 2434} {"train_loss": -42.196510314941406, "global_step": 294560, "epoch": 2434} {"train_loss": -41.481834411621094, "global_step": 294561, "epoch": 2434} {"train_loss": -41.7857780456543, "global_step": 294562, "epoch": 2434} {"train_loss": -42.1783447265625, "global_step": 294563, "epoch": 2434} {"train_loss": -42.182491302490234, "global_step": 294564, "epoch": 2434} {"train_loss": -42.17317581176758, "global_step": 294565, "epoch": 2434} {"train_loss": -41.753231048583984, "global_step": 294566, "epoch": 2434} {"train_loss": -41.67802047729492, "global_step": 294567, "epoch": 2434} {"train_loss": -41.42779541015625, "global_step": 294568, "epoch": 2434} {"train_loss": -42.05592727661133, "global_step": 294569, "epoch": 2434} {"train_loss": -42.44940948486328, "global_step": 294570, "epoch": 2434} {"train_loss": -41.84670639038086, "global_step": 294571, "epoch": 2434} {"train_loss": -40.49795150756836, "global_step": 294572, "epoch": 2434} {"train_loss": -42.199562072753906, "global_step": 294573, "epoch": 2434} {"train_loss": -42.028018951416016, "global_step": 294574, "epoch": 2434} {"train_loss": -41.95388412475586, "global_step": 294575, "epoch": 2434} {"train_loss": -40.988861083984375, "global_step": 294576, "epoch": 2434} {"train_loss": -41.75680160522461, "global_step": 294577, "epoch": 2434} {"train_loss": -41.50777816772461, "global_step": 294578, "epoch": 2434} {"train_loss": -38.331783294677734, "global_step": 294579, "epoch": 2434} {"train_loss": -39.21411895751953, "global_step": 294580, "epoch": 2434} {"train_loss": -41.31510925292969, "global_step": 294581, "epoch": 2434} {"train_loss": -39.18268966674805, "global_step": 294582, "epoch": 2434} {"train_loss": -40.915618896484375, "global_step": 294583, "epoch": 2434} {"train_loss": -40.18623733520508, "global_step": 294584, "epoch": 2434} {"train_loss": -41.343257904052734, "global_step": 294585, "epoch": 2434} {"train_loss": -42.06039810180664, "global_step": 294586, "epoch": 2434} {"train_loss": -41.17429733276367, "global_step": 294587, "epoch": 2434} {"train_loss": -41.999454498291016, "global_step": 294588, "epoch": 2434} {"train_loss": -41.040164947509766, "global_step": 294589, "epoch": 2434} {"train_loss": -40.93293380737305, "global_step": 294590, "epoch": 2434} {"train_loss": -40.90760040283203, "global_step": 294591, "epoch": 2434} {"train_loss": -41.26629638671875, "global_step": 294592, "epoch": 2434} {"train_loss": -41.531524658203125, "global_step": 294593, "epoch": 2434} {"train_loss": -40.06956100463867, "global_step": 294594, "epoch": 2434} {"train_loss": -40.59592056274414, "global_step": 294595, "epoch": 2434} {"train_loss": -41.47494125366211, "global_step": 294596, "epoch": 2434} {"train_loss": -41.28579330444336, "global_step": 294597, "epoch": 2434} {"train_loss": -39.99198913574219, "global_step": 294598, "epoch": 2434} {"train_loss": -39.08584213256836, "global_step": 294599, "epoch": 2434} {"train_loss": -41.00621032714844, "global_step": 294600, "epoch": 2434} {"train_loss": -41.46439743041992, "global_step": 294601, "epoch": 2434} {"train_loss": -39.585201263427734, "global_step": 294602, "epoch": 2434} {"train_loss": -39.52547073364258, "global_step": 294603, "epoch": 2434} {"train_loss": -41.1186408996582, "global_step": 294604, "epoch": 2434} {"train_loss": -40.95178985595703, "global_step": 294605, "epoch": 2434} {"train_loss": -39.940826416015625, "global_step": 294606, "epoch": 2434} {"train_loss": -39.91376495361328, "global_step": 294607, "epoch": 2434} {"train_loss": -42.14960479736328, "global_step": 294608, "epoch": 2434} {"train_loss": -41.0552978515625, "global_step": 294609, "epoch": 2434} {"train_loss": -41.14973831176758, "global_step": 294610, "epoch": 2434} {"train_loss": -41.53298568725586, "global_step": 294611, "epoch": 2434} {"train_loss": -41.15132522583008, "global_step": 294612, "epoch": 2434} {"train_loss": -39.90911865234375, "global_step": 294613, "epoch": 2434} {"train_loss": -42.377540588378906, "global_step": 294614, "epoch": 2434} {"train_loss": -41.01594924926758, "global_step": 294615, "epoch": 2434} {"train_loss": -41.7556266784668, "global_step": 294616, "epoch": 2434} {"train_loss": -41.54273223876953, "global_step": 294617, "epoch": 2434} {"train_loss": -41.20028305053711, "global_step": 294618, "epoch": 2434} {"train_loss": -41.955718994140625, "global_step": 294619, "epoch": 2434} {"train_loss": -40.99086380004883, "global_step": 294620, "epoch": 2434} {"train_loss": -40.86192321777344, "global_step": 294621, "epoch": 2434} {"train_loss": -41.68532180786133, "global_step": 294622, "epoch": 2434} {"train_loss": -41.116729736328125, "global_step": 294623, "epoch": 2434} {"train_loss": -41.92164993286133, "global_step": 294624, "epoch": 2434} {"train_loss": -41.60447311401367, "global_step": 294625, "epoch": 2434} {"train_loss": -42.7520866394043, "global_step": 294626, "epoch": 2434} {"train_loss": -41.81025314331055, "global_step": 294627, "epoch": 2434} {"train_loss": -42.7102165222168, "global_step": 294628, "epoch": 2434} {"train_loss": -41.75831604003906, "global_step": 294629, "epoch": 2434} {"train_loss": -41.98078536987305, "global_step": 294630, "epoch": 2434} {"train_loss": -41.63943099975586, "global_step": 294631, "epoch": 2434} {"train_loss": -42.40891647338867, "global_step": 294632, "epoch": 2434} {"train_loss": -42.59449005126953, "global_step": 294633, "epoch": 2434} {"train_loss": -41.302631409700254, "global_step": 294634, "epoch": 2434, "val_loss": 2514840.25} {"train_loss": -41.67677307128906, "global_step": 294635, "epoch": 2435} {"train_loss": -42.32632064819336, "global_step": 294636, "epoch": 2435} {"train_loss": -42.062294006347656, "global_step": 294637, "epoch": 2435} {"train_loss": -42.653316497802734, "global_step": 294638, "epoch": 2435} {"train_loss": -42.42222213745117, "global_step": 294639, "epoch": 2435} {"train_loss": -42.472232818603516, "global_step": 294640, "epoch": 2435} {"train_loss": -42.681793212890625, "global_step": 294641, "epoch": 2435} {"train_loss": -42.57661437988281, "global_step": 294642, "epoch": 2435} {"train_loss": -41.540489196777344, "global_step": 294643, "epoch": 2435} {"train_loss": -41.40350341796875, "global_step": 294644, "epoch": 2435} {"train_loss": -42.42750549316406, "global_step": 294645, "epoch": 2435} {"train_loss": -42.20310592651367, "global_step": 294646, "epoch": 2435} {"train_loss": -42.52256393432617, "global_step": 294647, "epoch": 2435} {"train_loss": -43.09544372558594, "global_step": 294648, "epoch": 2435} {"train_loss": -42.451263427734375, "global_step": 294649, "epoch": 2435} {"train_loss": -42.35163116455078, "global_step": 294650, "epoch": 2435} {"train_loss": -42.401092529296875, "global_step": 294651, "epoch": 2435} {"train_loss": -41.07578659057617, "global_step": 294652, "epoch": 2435} {"train_loss": -39.992618560791016, "global_step": 294653, "epoch": 2435} {"train_loss": -40.42753219604492, "global_step": 294654, "epoch": 2435} {"train_loss": -42.84596633911133, "global_step": 294655, "epoch": 2435} {"train_loss": -42.69248580932617, "global_step": 294656, "epoch": 2435} {"train_loss": -41.18120574951172, "global_step": 294657, "epoch": 2435} {"train_loss": -41.20002365112305, "global_step": 294658, "epoch": 2435} {"train_loss": -36.172542572021484, "global_step": 294659, "epoch": 2435} {"train_loss": -41.53443145751953, "global_step": 294660, "epoch": 2435} {"train_loss": -42.045631408691406, "global_step": 294661, "epoch": 2435} {"train_loss": -42.44838333129883, "global_step": 294662, "epoch": 2435} {"train_loss": -41.88808059692383, "global_step": 294663, "epoch": 2435} {"train_loss": -41.875343322753906, "global_step": 294664, "epoch": 2435} {"train_loss": -42.898433685302734, "global_step": 294665, "epoch": 2435} {"train_loss": -42.47970199584961, "global_step": 294666, "epoch": 2435} {"train_loss": -42.41337203979492, "global_step": 294667, "epoch": 2435} {"train_loss": -42.546817779541016, "global_step": 294668, "epoch": 2435} {"train_loss": -42.40693283081055, "global_step": 294669, "epoch": 2435} {"train_loss": -42.57713317871094, "global_step": 294670, "epoch": 2435} {"train_loss": -42.05271530151367, "global_step": 294671, "epoch": 2435} {"train_loss": -43.07682418823242, "global_step": 294672, "epoch": 2435} {"train_loss": -42.52311325073242, "global_step": 294673, "epoch": 2435} {"train_loss": -42.33367919921875, "global_step": 294674, "epoch": 2435} {"train_loss": -41.99897003173828, "global_step": 294675, "epoch": 2435} {"train_loss": -42.5861930847168, "global_step": 294676, "epoch": 2435} {"train_loss": -42.293888092041016, "global_step": 294677, "epoch": 2435} {"train_loss": -41.181148529052734, "global_step": 294678, "epoch": 2435} {"train_loss": -42.90005111694336, "global_step": 294679, "epoch": 2435} {"train_loss": -42.478614807128906, "global_step": 294680, "epoch": 2435} {"train_loss": -41.569068908691406, "global_step": 294681, "epoch": 2435} {"train_loss": -42.75032424926758, "global_step": 294682, "epoch": 2435} {"train_loss": -42.836280822753906, "global_step": 294683, "epoch": 2435} {"train_loss": -42.537654876708984, "global_step": 294684, "epoch": 2435} {"train_loss": -42.4704704284668, "global_step": 294685, "epoch": 2435} {"train_loss": -42.88788986206055, "global_step": 294686, "epoch": 2435} {"train_loss": -42.75368881225586, "global_step": 294687, "epoch": 2435} {"train_loss": -42.48072814941406, "global_step": 294688, "epoch": 2435} {"train_loss": -42.612770080566406, "global_step": 294689, "epoch": 2435} {"train_loss": -41.74342727661133, "global_step": 294690, "epoch": 2435} {"train_loss": -42.922767639160156, "global_step": 294691, "epoch": 2435} {"train_loss": -43.23125076293945, "global_step": 294692, "epoch": 2435} {"train_loss": -43.774898529052734, "global_step": 294693, "epoch": 2435} {"train_loss": -41.467262268066406, "global_step": 294694, "epoch": 2435} {"train_loss": -42.25135040283203, "global_step": 294695, "epoch": 2435} {"train_loss": -40.64324188232422, "global_step": 294696, "epoch": 2435} {"train_loss": -42.426509857177734, "global_step": 294697, "epoch": 2435} {"train_loss": -42.45310592651367, "global_step": 294698, "epoch": 2435} {"train_loss": -42.23102569580078, "global_step": 294699, "epoch": 2435} {"train_loss": -43.12266540527344, "global_step": 294700, "epoch": 2435} {"train_loss": -42.919525146484375, "global_step": 294701, "epoch": 2435} {"train_loss": -41.889076232910156, "global_step": 294702, "epoch": 2435} {"train_loss": -42.42748260498047, "global_step": 294703, "epoch": 2435} {"train_loss": -43.12251663208008, "global_step": 294704, "epoch": 2435} {"train_loss": -42.8162956237793, "global_step": 294705, "epoch": 2435} {"train_loss": -43.238616943359375, "global_step": 294706, "epoch": 2435} {"train_loss": -40.553985595703125, "global_step": 294707, "epoch": 2435} {"train_loss": -42.59046173095703, "global_step": 294708, "epoch": 2435} {"train_loss": -41.798763275146484, "global_step": 294709, "epoch": 2435} {"train_loss": -41.714263916015625, "global_step": 294710, "epoch": 2435} {"train_loss": -42.3421630859375, "global_step": 294711, "epoch": 2435} {"train_loss": -42.75840377807617, "global_step": 294712, "epoch": 2435} {"train_loss": -42.4149284362793, "global_step": 294713, "epoch": 2435} {"train_loss": -41.39192581176758, "global_step": 294714, "epoch": 2435} {"train_loss": -42.2358512878418, "global_step": 294715, "epoch": 2435} {"train_loss": -39.072879791259766, "global_step": 294716, "epoch": 2435} {"train_loss": -41.305824279785156, "global_step": 294717, "epoch": 2435} {"train_loss": -41.90507125854492, "global_step": 294718, "epoch": 2435} {"train_loss": -42.52275466918945, "global_step": 294719, "epoch": 2435} {"train_loss": -43.04171371459961, "global_step": 294720, "epoch": 2435} {"train_loss": -42.548519134521484, "global_step": 294721, "epoch": 2435} {"train_loss": -42.038848876953125, "global_step": 294722, "epoch": 2435} {"train_loss": -42.76213836669922, "global_step": 294723, "epoch": 2435} {"train_loss": -40.28053665161133, "global_step": 294724, "epoch": 2435} {"train_loss": -42.1585807800293, "global_step": 294725, "epoch": 2435} {"train_loss": -41.62771987915039, "global_step": 294726, "epoch": 2435} {"train_loss": -41.88129425048828, "global_step": 294727, "epoch": 2435} {"train_loss": -41.98688507080078, "global_step": 294728, "epoch": 2435} {"train_loss": -40.855560302734375, "global_step": 294729, "epoch": 2435} {"train_loss": -39.02065658569336, "global_step": 294730, "epoch": 2435} {"train_loss": -36.752071380615234, "global_step": 294731, "epoch": 2435} {"train_loss": -41.11882400512695, "global_step": 294732, "epoch": 2435} {"train_loss": -42.20162582397461, "global_step": 294733, "epoch": 2435} {"train_loss": -41.092098236083984, "global_step": 294734, "epoch": 2435} {"train_loss": -41.04808044433594, "global_step": 294735, "epoch": 2435} {"train_loss": -42.01804733276367, "global_step": 294736, "epoch": 2435} {"train_loss": -42.10903549194336, "global_step": 294737, "epoch": 2435} {"train_loss": -42.007686614990234, "global_step": 294738, "epoch": 2435} {"train_loss": -41.13182830810547, "global_step": 294739, "epoch": 2435} {"train_loss": -42.465145111083984, "global_step": 294740, "epoch": 2435} {"train_loss": -41.070613861083984, "global_step": 294741, "epoch": 2435} {"train_loss": -41.714088439941406, "global_step": 294742, "epoch": 2435} {"train_loss": -42.3955078125, "global_step": 294743, "epoch": 2435} {"train_loss": -42.94175720214844, "global_step": 294744, "epoch": 2435} {"train_loss": -42.92816925048828, "global_step": 294745, "epoch": 2435} {"train_loss": -42.625450134277344, "global_step": 294746, "epoch": 2435} {"train_loss": -43.01514434814453, "global_step": 294747, "epoch": 2435} {"train_loss": -42.37321853637695, "global_step": 294748, "epoch": 2435} {"train_loss": -42.11306381225586, "global_step": 294749, "epoch": 2435} {"train_loss": -42.44403076171875, "global_step": 294750, "epoch": 2435} {"train_loss": -42.61283493041992, "global_step": 294751, "epoch": 2435} {"train_loss": -42.03269577026367, "global_step": 294752, "epoch": 2435} {"train_loss": -42.132652282714844, "global_step": 294753, "epoch": 2435} {"train_loss": -42.5755729675293, "global_step": 294754, "epoch": 2435} {"train_loss": -42.04949178774495, "global_step": 294755, "epoch": 2435, "val_loss": 2464555.5} {"train_loss": -43.04999542236328, "global_step": 294756, "epoch": 2436} {"train_loss": -41.657711029052734, "global_step": 294757, "epoch": 2436} {"train_loss": -43.0572395324707, "global_step": 294758, "epoch": 2436} {"train_loss": -43.41608810424805, "global_step": 294759, "epoch": 2436} {"train_loss": -42.4904899597168, "global_step": 294760, "epoch": 2436} {"train_loss": -42.290584564208984, "global_step": 294761, "epoch": 2436} {"train_loss": -42.97042465209961, "global_step": 294762, "epoch": 2436} {"train_loss": -42.475189208984375, "global_step": 294763, "epoch": 2436} {"train_loss": -40.39472579956055, "global_step": 294764, "epoch": 2436} {"train_loss": -42.2648811340332, "global_step": 294765, "epoch": 2436} {"train_loss": -43.45309066772461, "global_step": 294766, "epoch": 2436} {"train_loss": -42.5181884765625, "global_step": 294767, "epoch": 2436} {"train_loss": -42.56111526489258, "global_step": 294768, "epoch": 2436} {"train_loss": -40.94120788574219, "global_step": 294769, "epoch": 2436} {"train_loss": -40.96742630004883, "global_step": 294770, "epoch": 2436} {"train_loss": -42.456966400146484, "global_step": 294771, "epoch": 2436} {"train_loss": -42.99795150756836, "global_step": 294772, "epoch": 2436} {"train_loss": -41.736083984375, "global_step": 294773, "epoch": 2436} {"train_loss": -40.213951110839844, "global_step": 294774, "epoch": 2436} {"train_loss": -40.935394287109375, "global_step": 294775, "epoch": 2436} {"train_loss": -42.5726318359375, "global_step": 294776, "epoch": 2436} {"train_loss": -40.40114212036133, "global_step": 294777, "epoch": 2436} {"train_loss": -41.85264205932617, "global_step": 294778, "epoch": 2436} {"train_loss": -42.473472595214844, "global_step": 294779, "epoch": 2436} {"train_loss": -43.030609130859375, "global_step": 294780, "epoch": 2436} {"train_loss": -41.82017135620117, "global_step": 294781, "epoch": 2436} {"train_loss": -40.15766143798828, "global_step": 294782, "epoch": 2436} {"train_loss": -40.61461639404297, "global_step": 294783, "epoch": 2436} {"train_loss": -41.22589111328125, "global_step": 294784, "epoch": 2436} {"train_loss": -42.65052032470703, "global_step": 294785, "epoch": 2436} {"train_loss": -42.78857421875, "global_step": 294786, "epoch": 2436} {"train_loss": -42.48873519897461, "global_step": 294787, "epoch": 2436} {"train_loss": -41.40947341918945, "global_step": 294788, "epoch": 2436} {"train_loss": -43.15359878540039, "global_step": 294789, "epoch": 2436} {"train_loss": -43.0885124206543, "global_step": 294790, "epoch": 2436} {"train_loss": -41.43842697143555, "global_step": 294791, "epoch": 2436} {"train_loss": -41.98816680908203, "global_step": 294792, "epoch": 2436} {"train_loss": -43.362098693847656, "global_step": 294793, "epoch": 2436} {"train_loss": -42.09351348876953, "global_step": 294794, "epoch": 2436} {"train_loss": -41.71326446533203, "global_step": 294795, "epoch": 2436} {"train_loss": -42.387733459472656, "global_step": 294796, "epoch": 2436} {"train_loss": -43.522491455078125, "global_step": 294797, "epoch": 2436} {"train_loss": -42.697689056396484, "global_step": 294798, "epoch": 2436} {"train_loss": -41.67100143432617, "global_step": 294799, "epoch": 2436} {"train_loss": -42.805091857910156, "global_step": 294800, "epoch": 2436} {"train_loss": -42.92360305786133, "global_step": 294801, "epoch": 2436} {"train_loss": -41.58857345581055, "global_step": 294802, "epoch": 2436} {"train_loss": -43.08150863647461, "global_step": 294803, "epoch": 2436} {"train_loss": -42.30359649658203, "global_step": 294804, "epoch": 2436} {"train_loss": -43.00728988647461, "global_step": 294805, "epoch": 2436} {"train_loss": -43.04673385620117, "global_step": 294806, "epoch": 2436} {"train_loss": -43.6027946472168, "global_step": 294807, "epoch": 2436} {"train_loss": -42.805721282958984, "global_step": 294808, "epoch": 2436} {"train_loss": -39.75312423706055, "global_step": 294809, "epoch": 2436} {"train_loss": -42.21961212158203, "global_step": 294810, "epoch": 2436} {"train_loss": -42.64617156982422, "global_step": 294811, "epoch": 2436} {"train_loss": -43.1926155090332, "global_step": 294812, "epoch": 2436} {"train_loss": -43.3471794128418, "global_step": 294813, "epoch": 2436} {"train_loss": -41.023773193359375, "global_step": 294814, "epoch": 2436} {"train_loss": -43.19439697265625, "global_step": 294815, "epoch": 2436} {"train_loss": -43.266719818115234, "global_step": 294816, "epoch": 2436} {"train_loss": -42.51365280151367, "global_step": 294817, "epoch": 2436} {"train_loss": -42.556251525878906, "global_step": 294818, "epoch": 2436} {"train_loss": -42.947174072265625, "global_step": 294819, "epoch": 2436} {"train_loss": -41.73676300048828, "global_step": 294820, "epoch": 2436} {"train_loss": -43.22490310668945, "global_step": 294821, "epoch": 2436} {"train_loss": -42.876922607421875, "global_step": 294822, "epoch": 2436} {"train_loss": -42.2154426574707, "global_step": 294823, "epoch": 2436} {"train_loss": -42.85145568847656, "global_step": 294824, "epoch": 2436} {"train_loss": -41.203277587890625, "global_step": 294825, "epoch": 2436} {"train_loss": -42.07883834838867, "global_step": 294826, "epoch": 2436} {"train_loss": -42.48639678955078, "global_step": 294827, "epoch": 2436} {"train_loss": -43.38388442993164, "global_step": 294828, "epoch": 2436} {"train_loss": -43.16352081298828, "global_step": 294829, "epoch": 2436} {"train_loss": -43.07740783691406, "global_step": 294830, "epoch": 2436} {"train_loss": -41.26129913330078, "global_step": 294831, "epoch": 2436} {"train_loss": -43.01177215576172, "global_step": 294832, "epoch": 2436} {"train_loss": -43.21152114868164, "global_step": 294833, "epoch": 2436} {"train_loss": -37.656517028808594, "global_step": 294834, "epoch": 2436} {"train_loss": -41.64362716674805, "global_step": 294835, "epoch": 2436} {"train_loss": -41.84513473510742, "global_step": 294836, "epoch": 2436} {"train_loss": -41.984130859375, "global_step": 294837, "epoch": 2436} {"train_loss": -35.535701751708984, "global_step": 294838, "epoch": 2436} {"train_loss": -37.71699905395508, "global_step": 294839, "epoch": 2436} {"train_loss": -39.24968338012695, "global_step": 294840, "epoch": 2436} {"train_loss": -40.118709564208984, "global_step": 294841, "epoch": 2436} {"train_loss": -37.21476364135742, "global_step": 294842, "epoch": 2436} {"train_loss": -38.98778533935547, "global_step": 294843, "epoch": 2436} {"train_loss": -39.412906646728516, "global_step": 294844, "epoch": 2436} {"train_loss": -36.482513427734375, "global_step": 294845, "epoch": 2436} {"train_loss": -35.88096618652344, "global_step": 294846, "epoch": 2436} {"train_loss": -38.38135528564453, "global_step": 294847, "epoch": 2436} {"train_loss": -39.08285140991211, "global_step": 294848, "epoch": 2436} {"train_loss": -40.7857551574707, "global_step": 294849, "epoch": 2436} {"train_loss": -37.75086212158203, "global_step": 294850, "epoch": 2436} {"train_loss": -39.07194900512695, "global_step": 294851, "epoch": 2436} {"train_loss": -35.57402801513672, "global_step": 294852, "epoch": 2436} {"train_loss": -40.80101776123047, "global_step": 294853, "epoch": 2436} {"train_loss": -40.53192901611328, "global_step": 294854, "epoch": 2436} {"train_loss": -39.13530731201172, "global_step": 294855, "epoch": 2436} {"train_loss": -38.59889221191406, "global_step": 294856, "epoch": 2436} {"train_loss": -38.57835006713867, "global_step": 294857, "epoch": 2436} {"train_loss": -41.0002555847168, "global_step": 294858, "epoch": 2436} {"train_loss": -39.95970916748047, "global_step": 294859, "epoch": 2436} {"train_loss": -40.55422592163086, "global_step": 294860, "epoch": 2436} {"train_loss": -39.694820404052734, "global_step": 294861, "epoch": 2436} {"train_loss": -40.38117599487305, "global_step": 294862, "epoch": 2436} {"train_loss": -39.70164108276367, "global_step": 294863, "epoch": 2436} {"train_loss": -37.05695724487305, "global_step": 294864, "epoch": 2436} {"train_loss": -38.9649543762207, "global_step": 294865, "epoch": 2436} {"train_loss": -41.14421463012695, "global_step": 294866, "epoch": 2436} {"train_loss": -38.87688064575195, "global_step": 294867, "epoch": 2436} {"train_loss": -40.0799560546875, "global_step": 294868, "epoch": 2436} {"train_loss": -39.17696762084961, "global_step": 294869, "epoch": 2436} {"train_loss": -38.71364974975586, "global_step": 294870, "epoch": 2436} {"train_loss": -41.335792541503906, "global_step": 294871, "epoch": 2436} {"train_loss": -39.477046966552734, "global_step": 294872, "epoch": 2436} {"train_loss": -40.602787017822266, "global_step": 294873, "epoch": 2436} {"train_loss": -40.28921127319336, "global_step": 294874, "epoch": 2436} {"train_loss": -39.50071716308594, "global_step": 294875, "epoch": 2436} {"train_loss": -41.24279454128801, "global_step": 294876, "epoch": 2436, "val_loss": 2511737.75} {"train_loss": -40.818260192871094, "global_step": 294877, "epoch": 2437} {"train_loss": -40.68961715698242, "global_step": 294878, "epoch": 2437} {"train_loss": -41.85966110229492, "global_step": 294879, "epoch": 2437} {"train_loss": -41.0623779296875, "global_step": 294880, "epoch": 2437} {"train_loss": -40.867523193359375, "global_step": 294881, "epoch": 2437} {"train_loss": -38.27987289428711, "global_step": 294882, "epoch": 2437} {"train_loss": -41.50581741333008, "global_step": 294883, "epoch": 2437} {"train_loss": -41.21956253051758, "global_step": 294884, "epoch": 2437} {"train_loss": -41.38850021362305, "global_step": 294885, "epoch": 2437} {"train_loss": -41.16792297363281, "global_step": 294886, "epoch": 2437} {"train_loss": -41.22683334350586, "global_step": 294887, "epoch": 2437} {"train_loss": -41.867977142333984, "global_step": 294888, "epoch": 2437} {"train_loss": -40.57783126831055, "global_step": 294889, "epoch": 2437} {"train_loss": -39.98109436035156, "global_step": 294890, "epoch": 2437} {"train_loss": -39.30224609375, "global_step": 294891, "epoch": 2437} {"train_loss": -40.87396240234375, "global_step": 294892, "epoch": 2437} {"train_loss": -39.15559005737305, "global_step": 294893, "epoch": 2437} {"train_loss": -40.934783935546875, "global_step": 294894, "epoch": 2437} {"train_loss": -40.45612335205078, "global_step": 294895, "epoch": 2437} {"train_loss": -41.508113861083984, "global_step": 294896, "epoch": 2437} {"train_loss": -42.18525314331055, "global_step": 294897, "epoch": 2437} {"train_loss": -41.145362854003906, "global_step": 294898, "epoch": 2437} {"train_loss": -40.56349182128906, "global_step": 294899, "epoch": 2437} {"train_loss": -41.61002731323242, "global_step": 294900, "epoch": 2437} {"train_loss": -41.76042556762695, "global_step": 294901, "epoch": 2437} {"train_loss": -42.161643981933594, "global_step": 294902, "epoch": 2437} {"train_loss": -41.27519607543945, "global_step": 294903, "epoch": 2437} {"train_loss": -41.664772033691406, "global_step": 294904, "epoch": 2437} {"train_loss": -41.87028503417969, "global_step": 294905, "epoch": 2437} {"train_loss": -42.01595687866211, "global_step": 294906, "epoch": 2437} {"train_loss": -41.028690338134766, "global_step": 294907, "epoch": 2437} {"train_loss": -42.178462982177734, "global_step": 294908, "epoch": 2437} {"train_loss": -43.004249572753906, "global_step": 294909, "epoch": 2437} {"train_loss": -42.02408218383789, "global_step": 294910, "epoch": 2437} {"train_loss": -42.418392181396484, "global_step": 294911, "epoch": 2437} {"train_loss": -41.80105209350586, "global_step": 294912, "epoch": 2437} {"train_loss": -41.140541076660156, "global_step": 294913, "epoch": 2437} {"train_loss": -42.12543869018555, "global_step": 294914, "epoch": 2437} {"train_loss": -41.379730224609375, "global_step": 294915, "epoch": 2437} {"train_loss": -41.59910583496094, "global_step": 294916, "epoch": 2437} {"train_loss": -41.71100997924805, "global_step": 294917, "epoch": 2437} {"train_loss": -41.61068344116211, "global_step": 294918, "epoch": 2437} {"train_loss": -41.90580368041992, "global_step": 294919, "epoch": 2437} {"train_loss": -42.993865966796875, "global_step": 294920, "epoch": 2437} {"train_loss": -39.474491119384766, "global_step": 294921, "epoch": 2437} {"train_loss": -42.298248291015625, "global_step": 294922, "epoch": 2437} {"train_loss": -41.89609909057617, "global_step": 294923, "epoch": 2437} {"train_loss": -42.5678596496582, "global_step": 294924, "epoch": 2437} {"train_loss": -39.762081146240234, "global_step": 294925, "epoch": 2437} {"train_loss": -39.10689163208008, "global_step": 294926, "epoch": 2437} {"train_loss": -42.00603485107422, "global_step": 294927, "epoch": 2437} {"train_loss": -41.14841842651367, "global_step": 294928, "epoch": 2437} {"train_loss": -40.96879196166992, "global_step": 294929, "epoch": 2437} {"train_loss": -41.18053436279297, "global_step": 294930, "epoch": 2437} {"train_loss": -42.628868103027344, "global_step": 294931, "epoch": 2437} {"train_loss": -41.4300651550293, "global_step": 294932, "epoch": 2437} {"train_loss": -41.6965446472168, "global_step": 294933, "epoch": 2437} {"train_loss": -41.069698333740234, "global_step": 294934, "epoch": 2437} {"train_loss": -41.40493392944336, "global_step": 294935, "epoch": 2437} {"train_loss": -41.96745681762695, "global_step": 294936, "epoch": 2437} {"train_loss": -41.61213302612305, "global_step": 294937, "epoch": 2437} {"train_loss": -41.269012451171875, "global_step": 294938, "epoch": 2437} {"train_loss": -41.43114471435547, "global_step": 294939, "epoch": 2437} {"train_loss": -43.05802536010742, "global_step": 294940, "epoch": 2437} {"train_loss": -41.77143096923828, "global_step": 294941, "epoch": 2437} {"train_loss": -41.58770751953125, "global_step": 294942, "epoch": 2437} {"train_loss": -42.06413650512695, "global_step": 294943, "epoch": 2437} {"train_loss": -40.313720703125, "global_step": 294944, "epoch": 2437} {"train_loss": -42.08047103881836, "global_step": 294945, "epoch": 2437} {"train_loss": -42.38420486450195, "global_step": 294946, "epoch": 2437} {"train_loss": -41.9610481262207, "global_step": 294947, "epoch": 2437} {"train_loss": -42.241554260253906, "global_step": 294948, "epoch": 2437} {"train_loss": -41.86246871948242, "global_step": 294949, "epoch": 2437} {"train_loss": -42.02585983276367, "global_step": 294950, "epoch": 2437} {"train_loss": -42.656768798828125, "global_step": 294951, "epoch": 2437} {"train_loss": -41.5831184387207, "global_step": 294952, "epoch": 2437} {"train_loss": -40.797637939453125, "global_step": 294953, "epoch": 2437} {"train_loss": -42.307369232177734, "global_step": 294954, "epoch": 2437} {"train_loss": -42.888362884521484, "global_step": 294955, "epoch": 2437} {"train_loss": -43.03413009643555, "global_step": 294956, "epoch": 2437} {"train_loss": -42.278324127197266, "global_step": 294957, "epoch": 2437} {"train_loss": -41.685638427734375, "global_step": 294958, "epoch": 2437} {"train_loss": -42.732295989990234, "global_step": 294959, "epoch": 2437} {"train_loss": -42.71645736694336, "global_step": 294960, "epoch": 2437} {"train_loss": -42.16594696044922, "global_step": 294961, "epoch": 2437} {"train_loss": -42.30390930175781, "global_step": 294962, "epoch": 2437} {"train_loss": -42.98389434814453, "global_step": 294963, "epoch": 2437} {"train_loss": -41.325042724609375, "global_step": 294964, "epoch": 2437} {"train_loss": -42.71012496948242, "global_step": 294965, "epoch": 2437} {"train_loss": -42.177494049072266, "global_step": 294966, "epoch": 2437} {"train_loss": -42.47990036010742, "global_step": 294967, "epoch": 2437} {"train_loss": -43.063533782958984, "global_step": 294968, "epoch": 2437} {"train_loss": -41.32553482055664, "global_step": 294969, "epoch": 2437} {"train_loss": -42.403358459472656, "global_step": 294970, "epoch": 2437} {"train_loss": -41.68784713745117, "global_step": 294971, "epoch": 2437} {"train_loss": -42.89858627319336, "global_step": 294972, "epoch": 2437} {"train_loss": -42.64288330078125, "global_step": 294973, "epoch": 2437} {"train_loss": -41.659019470214844, "global_step": 294974, "epoch": 2437} {"train_loss": -42.99648666381836, "global_step": 294975, "epoch": 2437} {"train_loss": -42.42240524291992, "global_step": 294976, "epoch": 2437} {"train_loss": -42.21389389038086, "global_step": 294977, "epoch": 2437} {"train_loss": -41.65380096435547, "global_step": 294978, "epoch": 2437} {"train_loss": -42.04636001586914, "global_step": 294979, "epoch": 2437} {"train_loss": -41.75932693481445, "global_step": 294980, "epoch": 2437} {"train_loss": -41.599365234375, "global_step": 294981, "epoch": 2437} {"train_loss": -41.05073165893555, "global_step": 294982, "epoch": 2437} {"train_loss": -41.90591049194336, "global_step": 294983, "epoch": 2437} {"train_loss": -42.528526306152344, "global_step": 294984, "epoch": 2437} {"train_loss": -42.08824157714844, "global_step": 294985, "epoch": 2437} {"train_loss": -42.91280746459961, "global_step": 294986, "epoch": 2437} {"train_loss": -41.77241134643555, "global_step": 294987, "epoch": 2437} {"train_loss": -43.04960250854492, "global_step": 294988, "epoch": 2437} {"train_loss": -42.20718765258789, "global_step": 294989, "epoch": 2437} {"train_loss": -41.043331146240234, "global_step": 294990, "epoch": 2437} {"train_loss": -41.687496185302734, "global_step": 294991, "epoch": 2437} {"train_loss": -42.53728485107422, "global_step": 294992, "epoch": 2437} {"train_loss": -42.53269577026367, "global_step": 294993, "epoch": 2437} {"train_loss": -42.917476654052734, "global_step": 294994, "epoch": 2437} {"train_loss": -43.067325592041016, "global_step": 294995, "epoch": 2437} {"train_loss": -41.64284133911133, "global_step": 294996, "epoch": 2437} {"train_loss": -41.720179250417665, "global_step": 294997, "epoch": 2437, "val_loss": 2501230.75} {"train_loss": -42.03016662597656, "global_step": 294998, "epoch": 2438} {"train_loss": -42.1079216003418, "global_step": 294999, "epoch": 2438} {"train_loss": -42.84823226928711, "global_step": 295000, "epoch": 2438} {"train_loss": -41.03779220581055, "global_step": 295001, "epoch": 2438} {"train_loss": -41.694793701171875, "global_step": 295002, "epoch": 2438} {"train_loss": -42.13726806640625, "global_step": 295003, "epoch": 2438} {"train_loss": -40.41704177856445, "global_step": 295004, "epoch": 2438} {"train_loss": -41.23603439331055, "global_step": 295005, "epoch": 2438} {"train_loss": -41.683929443359375, "global_step": 295006, "epoch": 2438} {"train_loss": -41.49374008178711, "global_step": 295007, "epoch": 2438} {"train_loss": -41.31374740600586, "global_step": 295008, "epoch": 2438} {"train_loss": -42.04340744018555, "global_step": 295009, "epoch": 2438} {"train_loss": -40.27204132080078, "global_step": 295010, "epoch": 2438} {"train_loss": -41.35136413574219, "global_step": 295011, "epoch": 2438} {"train_loss": -38.98832321166992, "global_step": 295012, "epoch": 2438} {"train_loss": -36.74225997924805, "global_step": 295013, "epoch": 2438} {"train_loss": -36.098262786865234, "global_step": 295014, "epoch": 2438} {"train_loss": -39.071231842041016, "global_step": 295015, "epoch": 2438} {"train_loss": -40.11615753173828, "global_step": 295016, "epoch": 2438} {"train_loss": -41.64657211303711, "global_step": 295017, "epoch": 2438} {"train_loss": -37.26191329956055, "global_step": 295018, "epoch": 2438} {"train_loss": -39.53238296508789, "global_step": 295019, "epoch": 2438} {"train_loss": -40.67771911621094, "global_step": 295020, "epoch": 2438} {"train_loss": -40.67932891845703, "global_step": 295021, "epoch": 2438} {"train_loss": -39.60269546508789, "global_step": 295022, "epoch": 2438} {"train_loss": -42.00272750854492, "global_step": 295023, "epoch": 2438} {"train_loss": -41.18197250366211, "global_step": 295024, "epoch": 2438} {"train_loss": -41.24557113647461, "global_step": 295025, "epoch": 2438} {"train_loss": -41.8871955871582, "global_step": 295026, "epoch": 2438} {"train_loss": -39.61764144897461, "global_step": 295027, "epoch": 2438} {"train_loss": -42.087955474853516, "global_step": 295028, "epoch": 2438} {"train_loss": -39.45721435546875, "global_step": 295029, "epoch": 2438} {"train_loss": -41.07950973510742, "global_step": 295030, "epoch": 2438} {"train_loss": -41.36735153198242, "global_step": 295031, "epoch": 2438} {"train_loss": -40.631900787353516, "global_step": 295032, "epoch": 2438} {"train_loss": -41.421932220458984, "global_step": 295033, "epoch": 2438} {"train_loss": -41.60311508178711, "global_step": 295034, "epoch": 2438} {"train_loss": -41.21588134765625, "global_step": 295035, "epoch": 2438} {"train_loss": -40.64989471435547, "global_step": 295036, "epoch": 2438} {"train_loss": -41.27994918823242, "global_step": 295037, "epoch": 2438} {"train_loss": -42.27962112426758, "global_step": 295038, "epoch": 2438} {"train_loss": -41.99440383911133, "global_step": 295039, "epoch": 2438} {"train_loss": -42.55522918701172, "global_step": 295040, "epoch": 2438} {"train_loss": -41.0411491394043, "global_step": 295041, "epoch": 2438} {"train_loss": -43.02206039428711, "global_step": 295042, "epoch": 2438} {"train_loss": -42.217533111572266, "global_step": 295043, "epoch": 2438} {"train_loss": -42.47062301635742, "global_step": 295044, "epoch": 2438} {"train_loss": -42.73386764526367, "global_step": 295045, "epoch": 2438} {"train_loss": -41.50232696533203, "global_step": 295046, "epoch": 2438} {"train_loss": -42.15778732299805, "global_step": 295047, "epoch": 2438} {"train_loss": -40.98029327392578, "global_step": 295048, "epoch": 2438} {"train_loss": -42.098976135253906, "global_step": 295049, "epoch": 2438} {"train_loss": -41.8778190612793, "global_step": 295050, "epoch": 2438} {"train_loss": -41.696197509765625, "global_step": 295051, "epoch": 2438} {"train_loss": -42.4951286315918, "global_step": 295052, "epoch": 2438} {"train_loss": -42.409645080566406, "global_step": 295053, "epoch": 2438} {"train_loss": -42.442604064941406, "global_step": 295054, "epoch": 2438} {"train_loss": -39.50883102416992, "global_step": 295055, "epoch": 2438} {"train_loss": -42.18513870239258, "global_step": 295056, "epoch": 2438} {"train_loss": -42.21234893798828, "global_step": 295057, "epoch": 2438} {"train_loss": -41.82368850708008, "global_step": 295058, "epoch": 2438} {"train_loss": -42.811500549316406, "global_step": 295059, "epoch": 2438} {"train_loss": -42.756065368652344, "global_step": 295060, "epoch": 2438} {"train_loss": -42.190364837646484, "global_step": 295061, "epoch": 2438} {"train_loss": -42.23331832885742, "global_step": 295062, "epoch": 2438} {"train_loss": -42.59530258178711, "global_step": 295063, "epoch": 2438} {"train_loss": -42.9331169128418, "global_step": 295064, "epoch": 2438} {"train_loss": -43.00981903076172, "global_step": 295065, "epoch": 2438} {"train_loss": -42.844024658203125, "global_step": 295066, "epoch": 2438} {"train_loss": -42.934993743896484, "global_step": 295067, "epoch": 2438} {"train_loss": -42.670188903808594, "global_step": 295068, "epoch": 2438} {"train_loss": -42.55034255981445, "global_step": 295069, "epoch": 2438} {"train_loss": -42.4730224609375, "global_step": 295070, "epoch": 2438} {"train_loss": -43.3237419128418, "global_step": 295071, "epoch": 2438} {"train_loss": -42.776824951171875, "global_step": 295072, "epoch": 2438} {"train_loss": -40.72194290161133, "global_step": 295073, "epoch": 2438} {"train_loss": -43.257747650146484, "global_step": 295074, "epoch": 2438} {"train_loss": -43.046932220458984, "global_step": 295075, "epoch": 2438} {"train_loss": -42.90250778198242, "global_step": 295076, "epoch": 2438} {"train_loss": -43.17527389526367, "global_step": 295077, "epoch": 2438} {"train_loss": -42.55524444580078, "global_step": 295078, "epoch": 2438} {"train_loss": -43.370723724365234, "global_step": 295079, "epoch": 2438} {"train_loss": -41.73859786987305, "global_step": 295080, "epoch": 2438} {"train_loss": -42.33382797241211, "global_step": 295081, "epoch": 2438} {"train_loss": -42.4789924621582, "global_step": 295082, "epoch": 2438} {"train_loss": -43.24471664428711, "global_step": 295083, "epoch": 2438} {"train_loss": -42.634395599365234, "global_step": 295084, "epoch": 2438} {"train_loss": -41.95341110229492, "global_step": 295085, "epoch": 2438} {"train_loss": -42.037750244140625, "global_step": 295086, "epoch": 2438} {"train_loss": -42.99058151245117, "global_step": 295087, "epoch": 2438} {"train_loss": -42.65817642211914, "global_step": 295088, "epoch": 2438} {"train_loss": -42.7552604675293, "global_step": 295089, "epoch": 2438} {"train_loss": -42.25345230102539, "global_step": 295090, "epoch": 2438} {"train_loss": -41.85615158081055, "global_step": 295091, "epoch": 2438} {"train_loss": -39.47589111328125, "global_step": 295092, "epoch": 2438} {"train_loss": -43.544002532958984, "global_step": 295093, "epoch": 2438} {"train_loss": -43.385284423828125, "global_step": 295094, "epoch": 2438} {"train_loss": -42.6488037109375, "global_step": 295095, "epoch": 2438} {"train_loss": -40.791194915771484, "global_step": 295096, "epoch": 2438} {"train_loss": -41.938899993896484, "global_step": 295097, "epoch": 2438} {"train_loss": -42.018070220947266, "global_step": 295098, "epoch": 2438} {"train_loss": -40.64971923828125, "global_step": 295099, "epoch": 2438} {"train_loss": -43.06632614135742, "global_step": 295100, "epoch": 2438} {"train_loss": -41.830745697021484, "global_step": 295101, "epoch": 2438} {"train_loss": -43.19138717651367, "global_step": 295102, "epoch": 2438} {"train_loss": -42.06672668457031, "global_step": 295103, "epoch": 2438} {"train_loss": -42.864013671875, "global_step": 295104, "epoch": 2438} {"train_loss": -43.225215911865234, "global_step": 295105, "epoch": 2438} {"train_loss": -42.87539291381836, "global_step": 295106, "epoch": 2438} {"train_loss": -42.02111053466797, "global_step": 295107, "epoch": 2438} {"train_loss": -36.23096466064453, "global_step": 295108, "epoch": 2438} {"train_loss": -42.148521423339844, "global_step": 295109, "epoch": 2438} {"train_loss": -42.12943649291992, "global_step": 295110, "epoch": 2438} {"train_loss": -42.7173957824707, "global_step": 295111, "epoch": 2438} {"train_loss": -38.928504943847656, "global_step": 295112, "epoch": 2438} {"train_loss": -43.1252555847168, "global_step": 295113, "epoch": 2438} {"train_loss": -42.26049041748047, "global_step": 295114, "epoch": 2438} {"train_loss": -42.84865188598633, "global_step": 295115, "epoch": 2438} {"train_loss": -40.165260314941406, "global_step": 295116, "epoch": 2438} {"train_loss": -40.65626907348633, "global_step": 295117, "epoch": 2438} {"train_loss": -41.69277165940971, "global_step": 295118, "epoch": 2438, "val_loss": 2491497.25} {"train_loss": -41.514930725097656, "global_step": 295119, "epoch": 2439} {"train_loss": -41.269039154052734, "global_step": 295120, "epoch": 2439} {"train_loss": -41.65940475463867, "global_step": 295121, "epoch": 2439} {"train_loss": -42.406707763671875, "global_step": 295122, "epoch": 2439} {"train_loss": -42.25761032104492, "global_step": 295123, "epoch": 2439} {"train_loss": -39.88056182861328, "global_step": 295124, "epoch": 2439} {"train_loss": -41.125606536865234, "global_step": 295125, "epoch": 2439} {"train_loss": -39.37078857421875, "global_step": 295126, "epoch": 2439} {"train_loss": -40.20383834838867, "global_step": 295127, "epoch": 2439} {"train_loss": -41.09779739379883, "global_step": 295128, "epoch": 2439} {"train_loss": -41.79281234741211, "global_step": 295129, "epoch": 2439} {"train_loss": -39.665252685546875, "global_step": 295130, "epoch": 2439} {"train_loss": -42.00562286376953, "global_step": 295131, "epoch": 2439} {"train_loss": -42.559974670410156, "global_step": 295132, "epoch": 2439} {"train_loss": -42.35791015625, "global_step": 295133, "epoch": 2439} {"train_loss": -42.42849349975586, "global_step": 295134, "epoch": 2439} {"train_loss": -42.682369232177734, "global_step": 295135, "epoch": 2439} {"train_loss": -40.25274658203125, "global_step": 295136, "epoch": 2439} {"train_loss": -40.34103012084961, "global_step": 295137, "epoch": 2439} {"train_loss": -41.543704986572266, "global_step": 295138, "epoch": 2439} {"train_loss": -42.038124084472656, "global_step": 295139, "epoch": 2439} {"train_loss": -41.575843811035156, "global_step": 295140, "epoch": 2439} {"train_loss": -41.211421966552734, "global_step": 295141, "epoch": 2439} {"train_loss": -40.92600631713867, "global_step": 295142, "epoch": 2439} {"train_loss": -37.660316467285156, "global_step": 295143, "epoch": 2439} {"train_loss": -40.9481315612793, "global_step": 295144, "epoch": 2439} {"train_loss": -41.377933502197266, "global_step": 295145, "epoch": 2439} {"train_loss": -35.918861389160156, "global_step": 295146, "epoch": 2439} {"train_loss": -41.658790588378906, "global_step": 295147, "epoch": 2439} {"train_loss": -41.944854736328125, "global_step": 295148, "epoch": 2439} {"train_loss": -39.78761291503906, "global_step": 295149, "epoch": 2439} {"train_loss": -42.334869384765625, "global_step": 295150, "epoch": 2439} {"train_loss": -41.91021728515625, "global_step": 295151, "epoch": 2439} {"train_loss": -41.68770980834961, "global_step": 295152, "epoch": 2439} {"train_loss": -42.16191482543945, "global_step": 295153, "epoch": 2439} {"train_loss": -41.47624969482422, "global_step": 295154, "epoch": 2439} {"train_loss": -41.88523483276367, "global_step": 295155, "epoch": 2439} {"train_loss": -41.60311508178711, "global_step": 295156, "epoch": 2439} {"train_loss": -42.498329162597656, "global_step": 295157, "epoch": 2439} {"train_loss": -39.87211608886719, "global_step": 295158, "epoch": 2439} {"train_loss": -42.420955657958984, "global_step": 295159, "epoch": 2439} {"train_loss": -38.718807220458984, "global_step": 295160, "epoch": 2439} {"train_loss": -41.81328201293945, "global_step": 295161, "epoch": 2439} {"train_loss": -40.082618713378906, "global_step": 295162, "epoch": 2439} {"train_loss": -41.98354721069336, "global_step": 295163, "epoch": 2439} {"train_loss": -42.76031494140625, "global_step": 295164, "epoch": 2439} {"train_loss": -41.668697357177734, "global_step": 295165, "epoch": 2439} {"train_loss": -41.983821868896484, "global_step": 295166, "epoch": 2439} {"train_loss": -42.1368293762207, "global_step": 295167, "epoch": 2439} {"train_loss": -41.82821273803711, "global_step": 295168, "epoch": 2439} {"train_loss": -42.650238037109375, "global_step": 295169, "epoch": 2439} {"train_loss": -39.641754150390625, "global_step": 295170, "epoch": 2439} {"train_loss": -41.17661666870117, "global_step": 295171, "epoch": 2439} {"train_loss": -41.76400375366211, "global_step": 295172, "epoch": 2439} {"train_loss": -41.99047088623047, "global_step": 295173, "epoch": 2439} {"train_loss": -41.56513595581055, "global_step": 295174, "epoch": 2439} {"train_loss": -42.690914154052734, "global_step": 295175, "epoch": 2439} {"train_loss": -38.48613357543945, "global_step": 295176, "epoch": 2439} {"train_loss": -40.6837158203125, "global_step": 295177, "epoch": 2439} {"train_loss": -42.41779708862305, "global_step": 295178, "epoch": 2439} {"train_loss": -40.9767951965332, "global_step": 295179, "epoch": 2439} {"train_loss": -40.907981872558594, "global_step": 295180, "epoch": 2439} {"train_loss": -42.990535736083984, "global_step": 295181, "epoch": 2439} {"train_loss": -41.59886932373047, "global_step": 295182, "epoch": 2439} {"train_loss": -42.36896896362305, "global_step": 295183, "epoch": 2439} {"train_loss": -38.859798431396484, "global_step": 295184, "epoch": 2439} {"train_loss": -42.06333541870117, "global_step": 295185, "epoch": 2439} {"train_loss": -40.220516204833984, "global_step": 295186, "epoch": 2439} {"train_loss": -41.37985610961914, "global_step": 295187, "epoch": 2439} {"train_loss": -42.246253967285156, "global_step": 295188, "epoch": 2439} {"train_loss": -39.13410186767578, "global_step": 295189, "epoch": 2439} {"train_loss": -42.79859161376953, "global_step": 295190, "epoch": 2439} {"train_loss": -42.679935455322266, "global_step": 295191, "epoch": 2439} {"train_loss": -41.92132568359375, "global_step": 295192, "epoch": 2439} {"train_loss": -42.56473159790039, "global_step": 295193, "epoch": 2439} {"train_loss": -42.645565032958984, "global_step": 295194, "epoch": 2439} {"train_loss": -42.4263801574707, "global_step": 295195, "epoch": 2439} {"train_loss": -41.902442932128906, "global_step": 295196, "epoch": 2439} {"train_loss": -42.26255798339844, "global_step": 295197, "epoch": 2439} {"train_loss": -42.62232208251953, "global_step": 295198, "epoch": 2439} {"train_loss": -42.3606071472168, "global_step": 295199, "epoch": 2439} {"train_loss": -42.72393798828125, "global_step": 295200, "epoch": 2439} {"train_loss": -42.75699996948242, "global_step": 295201, "epoch": 2439} {"train_loss": -42.72634506225586, "global_step": 295202, "epoch": 2439} {"train_loss": -43.08913803100586, "global_step": 295203, "epoch": 2439} {"train_loss": -41.89581298828125, "global_step": 295204, "epoch": 2439} {"train_loss": -43.030418395996094, "global_step": 295205, "epoch": 2439} {"train_loss": -43.23978042602539, "global_step": 295206, "epoch": 2439} {"train_loss": -42.92793273925781, "global_step": 295207, "epoch": 2439} {"train_loss": -43.24402618408203, "global_step": 295208, "epoch": 2439} {"train_loss": -43.14625930786133, "global_step": 295209, "epoch": 2439} {"train_loss": -41.87602996826172, "global_step": 295210, "epoch": 2439} {"train_loss": -43.22794723510742, "global_step": 295211, "epoch": 2439} {"train_loss": -43.260555267333984, "global_step": 295212, "epoch": 2439} {"train_loss": -42.90462875366211, "global_step": 295213, "epoch": 2439} {"train_loss": -43.2313232421875, "global_step": 295214, "epoch": 2439} {"train_loss": -42.7727165222168, "global_step": 295215, "epoch": 2439} {"train_loss": -42.948875427246094, "global_step": 295216, "epoch": 2439} {"train_loss": -43.092201232910156, "global_step": 295217, "epoch": 2439} {"train_loss": -43.03900909423828, "global_step": 295218, "epoch": 2439} {"train_loss": -42.72068786621094, "global_step": 295219, "epoch": 2439} {"train_loss": -42.053768157958984, "global_step": 295220, "epoch": 2439} {"train_loss": -42.55023956298828, "global_step": 295221, "epoch": 2439} {"train_loss": -42.84873962402344, "global_step": 295222, "epoch": 2439} {"train_loss": -43.46409225463867, "global_step": 295223, "epoch": 2439} {"train_loss": -43.43056869506836, "global_step": 295224, "epoch": 2439} {"train_loss": -42.56863021850586, "global_step": 295225, "epoch": 2439} {"train_loss": -42.68196487426758, "global_step": 295226, "epoch": 2439} {"train_loss": -43.265193939208984, "global_step": 295227, "epoch": 2439} {"train_loss": -42.147865295410156, "global_step": 295228, "epoch": 2439} {"train_loss": -42.88601303100586, "global_step": 295229, "epoch": 2439} {"train_loss": -42.756431579589844, "global_step": 295230, "epoch": 2439} {"train_loss": -42.891815185546875, "global_step": 295231, "epoch": 2439} {"train_loss": -41.458290100097656, "global_step": 295232, "epoch": 2439} {"train_loss": -41.0527229309082, "global_step": 295233, "epoch": 2439} {"train_loss": -42.180721282958984, "global_step": 295234, "epoch": 2439} {"train_loss": -42.104400634765625, "global_step": 295235, "epoch": 2439} {"train_loss": -42.33575439453125, "global_step": 295236, "epoch": 2439} {"train_loss": -43.152748107910156, "global_step": 295237, "epoch": 2439} {"train_loss": -42.83631134033203, "global_step": 295238, "epoch": 2439} {"train_loss": -41.826135934877, "global_step": 295239, "epoch": 2439, "val_loss": 2555597.75} {"train_loss": -42.445945739746094, "global_step": 295240, "epoch": 2440} {"train_loss": -42.3380241394043, "global_step": 295241, "epoch": 2440} {"train_loss": -42.18263626098633, "global_step": 295242, "epoch": 2440} {"train_loss": -42.220489501953125, "global_step": 295243, "epoch": 2440} {"train_loss": -42.06355667114258, "global_step": 295244, "epoch": 2440} {"train_loss": -42.4245491027832, "global_step": 295245, "epoch": 2440} {"train_loss": -42.674861907958984, "global_step": 295246, "epoch": 2440} {"train_loss": -42.792503356933594, "global_step": 295247, "epoch": 2440} {"train_loss": -41.75259780883789, "global_step": 295248, "epoch": 2440} {"train_loss": -40.913272857666016, "global_step": 295249, "epoch": 2440} {"train_loss": -42.75481414794922, "global_step": 295250, "epoch": 2440} {"train_loss": -42.435035705566406, "global_step": 295251, "epoch": 2440} {"train_loss": -40.139869689941406, "global_step": 295252, "epoch": 2440} {"train_loss": -37.686851501464844, "global_step": 295253, "epoch": 2440} {"train_loss": -36.665096282958984, "global_step": 295254, "epoch": 2440} {"train_loss": -33.11669921875, "global_step": 295255, "epoch": 2440} {"train_loss": -33.0556755065918, "global_step": 295256, "epoch": 2440} {"train_loss": -41.325199127197266, "global_step": 295257, "epoch": 2440} {"train_loss": -41.49340057373047, "global_step": 295258, "epoch": 2440} {"train_loss": -37.08781051635742, "global_step": 295259, "epoch": 2440} {"train_loss": -36.37007522583008, "global_step": 295260, "epoch": 2440} {"train_loss": -41.29402542114258, "global_step": 295261, "epoch": 2440} {"train_loss": -40.4406852722168, "global_step": 295262, "epoch": 2440} {"train_loss": -41.652076721191406, "global_step": 295263, "epoch": 2440} {"train_loss": -41.121925354003906, "global_step": 295264, "epoch": 2440} {"train_loss": -40.76354217529297, "global_step": 295265, "epoch": 2440} {"train_loss": -40.64344787597656, "global_step": 295266, "epoch": 2440} {"train_loss": -41.65177536010742, "global_step": 295267, "epoch": 2440} {"train_loss": -37.06460952758789, "global_step": 295268, "epoch": 2440} {"train_loss": -40.68104934692383, "global_step": 295269, "epoch": 2440} {"train_loss": -40.34941482543945, "global_step": 295270, "epoch": 2440} {"train_loss": -41.98735427856445, "global_step": 295271, "epoch": 2440} {"train_loss": -39.7766227722168, "global_step": 295272, "epoch": 2440} {"train_loss": -41.97724914550781, "global_step": 295273, "epoch": 2440} {"train_loss": -40.813255310058594, "global_step": 295274, "epoch": 2440} {"train_loss": -41.33659744262695, "global_step": 295275, "epoch": 2440} {"train_loss": -41.54426956176758, "global_step": 295276, "epoch": 2440} {"train_loss": -41.116615295410156, "global_step": 295277, "epoch": 2440} {"train_loss": -40.40216064453125, "global_step": 295278, "epoch": 2440} {"train_loss": -40.71246337890625, "global_step": 295279, "epoch": 2440} {"train_loss": -41.69248580932617, "global_step": 295280, "epoch": 2440} {"train_loss": -42.25897979736328, "global_step": 295281, "epoch": 2440} {"train_loss": -41.580806732177734, "global_step": 295282, "epoch": 2440} {"train_loss": -42.3993034362793, "global_step": 295283, "epoch": 2440} {"train_loss": -41.07856750488281, "global_step": 295284, "epoch": 2440} {"train_loss": -42.58135986328125, "global_step": 295285, "epoch": 2440} {"train_loss": -41.79630661010742, "global_step": 295286, "epoch": 2440} {"train_loss": -42.738277435302734, "global_step": 295287, "epoch": 2440} {"train_loss": -41.87238693237305, "global_step": 295288, "epoch": 2440} {"train_loss": -42.67958068847656, "global_step": 295289, "epoch": 2440} {"train_loss": -42.38794708251953, "global_step": 295290, "epoch": 2440} {"train_loss": -42.55738067626953, "global_step": 295291, "epoch": 2440} {"train_loss": -42.64419174194336, "global_step": 295292, "epoch": 2440} {"train_loss": -41.69804763793945, "global_step": 295293, "epoch": 2440} {"train_loss": -42.55122756958008, "global_step": 295294, "epoch": 2440} {"train_loss": -42.6290397644043, "global_step": 295295, "epoch": 2440} {"train_loss": -42.68269729614258, "global_step": 295296, "epoch": 2440} {"train_loss": -42.49730682373047, "global_step": 295297, "epoch": 2440} {"train_loss": -42.30460739135742, "global_step": 295298, "epoch": 2440} {"train_loss": -42.827362060546875, "global_step": 295299, "epoch": 2440} {"train_loss": -42.64387893676758, "global_step": 295300, "epoch": 2440} {"train_loss": -42.49235916137695, "global_step": 295301, "epoch": 2440} {"train_loss": -42.90131759643555, "global_step": 295302, "epoch": 2440} {"train_loss": -42.9101676940918, "global_step": 295303, "epoch": 2440} {"train_loss": -42.29217529296875, "global_step": 295304, "epoch": 2440} {"train_loss": -42.66112518310547, "global_step": 295305, "epoch": 2440} {"train_loss": -43.23965072631836, "global_step": 295306, "epoch": 2440} {"train_loss": -43.00982666015625, "global_step": 295307, "epoch": 2440} {"train_loss": -42.94211959838867, "global_step": 295308, "epoch": 2440} {"train_loss": -43.2369270324707, "global_step": 295309, "epoch": 2440} {"train_loss": -43.23453903198242, "global_step": 295310, "epoch": 2440} {"train_loss": -43.22562789916992, "global_step": 295311, "epoch": 2440} {"train_loss": -43.1490592956543, "global_step": 295312, "epoch": 2440} {"train_loss": -43.215450286865234, "global_step": 295313, "epoch": 2440} {"train_loss": -43.456153869628906, "global_step": 295314, "epoch": 2440} {"train_loss": -43.46128463745117, "global_step": 295315, "epoch": 2440} {"train_loss": -42.46554946899414, "global_step": 295316, "epoch": 2440} {"train_loss": -43.731201171875, "global_step": 295317, "epoch": 2440} {"train_loss": -43.66414260864258, "global_step": 295318, "epoch": 2440} {"train_loss": -43.63545608520508, "global_step": 295319, "epoch": 2440} {"train_loss": -43.47312927246094, "global_step": 295320, "epoch": 2440} {"train_loss": -43.71406555175781, "global_step": 295321, "epoch": 2440} {"train_loss": -44.02714920043945, "global_step": 295322, "epoch": 2440} {"train_loss": -43.389015197753906, "global_step": 295323, "epoch": 2440} {"train_loss": -43.85115051269531, "global_step": 295324, "epoch": 2440} {"train_loss": -43.123756408691406, "global_step": 295325, "epoch": 2440} {"train_loss": -43.69956588745117, "global_step": 295326, "epoch": 2440} {"train_loss": -43.679134368896484, "global_step": 295327, "epoch": 2440} {"train_loss": -43.50035095214844, "global_step": 295328, "epoch": 2440} {"train_loss": -43.854915618896484, "global_step": 295329, "epoch": 2440} {"train_loss": -43.58134841918945, "global_step": 295330, "epoch": 2440} {"train_loss": -43.77070617675781, "global_step": 295331, "epoch": 2440} {"train_loss": -42.86833572387695, "global_step": 295332, "epoch": 2440} {"train_loss": -43.80891799926758, "global_step": 295333, "epoch": 2440} {"train_loss": -43.88192367553711, "global_step": 295334, "epoch": 2440} {"train_loss": -43.85636520385742, "global_step": 295335, "epoch": 2440} {"train_loss": -44.2260856628418, "global_step": 295336, "epoch": 2440} {"train_loss": -42.80244064331055, "global_step": 295337, "epoch": 2440} {"train_loss": -43.313873291015625, "global_step": 295338, "epoch": 2440} {"train_loss": -43.14155960083008, "global_step": 295339, "epoch": 2440} {"train_loss": -43.73706817626953, "global_step": 295340, "epoch": 2440} {"train_loss": -44.002437591552734, "global_step": 295341, "epoch": 2440} {"train_loss": -43.67206573486328, "global_step": 295342, "epoch": 2440} {"train_loss": -43.82765197753906, "global_step": 295343, "epoch": 2440} {"train_loss": -43.62574768066406, "global_step": 295344, "epoch": 2440} {"train_loss": -42.32728958129883, "global_step": 295345, "epoch": 2440} {"train_loss": -43.1749267578125, "global_step": 295346, "epoch": 2440} {"train_loss": -42.55878829956055, "global_step": 295347, "epoch": 2440} {"train_loss": -42.94645690917969, "global_step": 295348, "epoch": 2440} {"train_loss": -43.22581100463867, "global_step": 295349, "epoch": 2440} {"train_loss": -42.18635559082031, "global_step": 295350, "epoch": 2440} {"train_loss": -41.908626556396484, "global_step": 295351, "epoch": 2440} {"train_loss": -38.439510345458984, "global_step": 295352, "epoch": 2440} {"train_loss": -36.467041015625, "global_step": 295353, "epoch": 2440} {"train_loss": -37.37546920776367, "global_step": 295354, "epoch": 2440} {"train_loss": -41.030006408691406, "global_step": 295355, "epoch": 2440} {"train_loss": -42.757625579833984, "global_step": 295356, "epoch": 2440} {"train_loss": -41.39173126220703, "global_step": 295357, "epoch": 2440} {"train_loss": -40.18000411987305, "global_step": 295358, "epoch": 2440} {"train_loss": -41.925140380859375, "global_step": 295359, "epoch": 2440} {"train_loss": -41.96152515253745, "global_step": 295360, "epoch": 2440, "val_loss": 2534921.5} {"train_loss": -41.51569747924805, "global_step": 295361, "epoch": 2441} {"train_loss": -42.2393684387207, "global_step": 295362, "epoch": 2441} {"train_loss": -42.93433380126953, "global_step": 295363, "epoch": 2441} {"train_loss": -43.150997161865234, "global_step": 295364, "epoch": 2441} {"train_loss": -42.71097946166992, "global_step": 295365, "epoch": 2441} {"train_loss": -42.760581970214844, "global_step": 295366, "epoch": 2441} {"train_loss": -43.148075103759766, "global_step": 295367, "epoch": 2441} {"train_loss": -42.25667953491211, "global_step": 295368, "epoch": 2441} {"train_loss": -42.521888732910156, "global_step": 295369, "epoch": 2441} {"train_loss": -40.7734489440918, "global_step": 295370, "epoch": 2441} {"train_loss": -42.4798698425293, "global_step": 295371, "epoch": 2441} {"train_loss": -41.41748809814453, "global_step": 295372, "epoch": 2441} {"train_loss": -42.131385803222656, "global_step": 295373, "epoch": 2441} {"train_loss": -42.03402328491211, "global_step": 295374, "epoch": 2441} {"train_loss": -42.34133529663086, "global_step": 295375, "epoch": 2441} {"train_loss": -41.6151237487793, "global_step": 295376, "epoch": 2441} {"train_loss": -41.988677978515625, "global_step": 295377, "epoch": 2441} {"train_loss": -41.09515380859375, "global_step": 295378, "epoch": 2441} {"train_loss": -39.964229583740234, "global_step": 295379, "epoch": 2441} {"train_loss": -42.13492965698242, "global_step": 295380, "epoch": 2441} {"train_loss": -39.756629943847656, "global_step": 295381, "epoch": 2441} {"train_loss": -42.16735076904297, "global_step": 295382, "epoch": 2441} {"train_loss": -42.626739501953125, "global_step": 295383, "epoch": 2441} {"train_loss": -42.31789016723633, "global_step": 295384, "epoch": 2441} {"train_loss": -42.44208908081055, "global_step": 295385, "epoch": 2441} {"train_loss": -42.66427230834961, "global_step": 295386, "epoch": 2441} {"train_loss": -42.238189697265625, "global_step": 295387, "epoch": 2441} {"train_loss": -42.10805130004883, "global_step": 295388, "epoch": 2441} {"train_loss": -42.842220306396484, "global_step": 295389, "epoch": 2441} {"train_loss": -42.458858489990234, "global_step": 295390, "epoch": 2441} {"train_loss": -42.6448974609375, "global_step": 295391, "epoch": 2441} {"train_loss": -40.3177604675293, "global_step": 295392, "epoch": 2441} {"train_loss": -41.083839416503906, "global_step": 295393, "epoch": 2441} {"train_loss": -42.68452072143555, "global_step": 295394, "epoch": 2441} {"train_loss": -41.972900390625, "global_step": 295395, "epoch": 2441} {"train_loss": -42.50494384765625, "global_step": 295396, "epoch": 2441} {"train_loss": -41.343406677246094, "global_step": 295397, "epoch": 2441} {"train_loss": -42.32808303833008, "global_step": 295398, "epoch": 2441} {"train_loss": -43.01206970214844, "global_step": 295399, "epoch": 2441} {"train_loss": -42.684688568115234, "global_step": 295400, "epoch": 2441} {"train_loss": -42.0999870300293, "global_step": 295401, "epoch": 2441} {"train_loss": -41.8635368347168, "global_step": 295402, "epoch": 2441} {"train_loss": -42.91876983642578, "global_step": 295403, "epoch": 2441} {"train_loss": -43.456600189208984, "global_step": 295404, "epoch": 2441} {"train_loss": -43.16122817993164, "global_step": 295405, "epoch": 2441} {"train_loss": -42.78366470336914, "global_step": 295406, "epoch": 2441} {"train_loss": -42.50520324707031, "global_step": 295407, "epoch": 2441} {"train_loss": -43.064632415771484, "global_step": 295408, "epoch": 2441} {"train_loss": -43.32267379760742, "global_step": 295409, "epoch": 2441} {"train_loss": -43.70998764038086, "global_step": 295410, "epoch": 2441} {"train_loss": -43.368499755859375, "global_step": 295411, "epoch": 2441} {"train_loss": -43.09971237182617, "global_step": 295412, "epoch": 2441} {"train_loss": -41.6523551940918, "global_step": 295413, "epoch": 2441} {"train_loss": -43.701534271240234, "global_step": 295414, "epoch": 2441} {"train_loss": -43.40771484375, "global_step": 295415, "epoch": 2441} {"train_loss": -42.00140380859375, "global_step": 295416, "epoch": 2441} {"train_loss": -43.52253341674805, "global_step": 295417, "epoch": 2441} {"train_loss": -42.5816764831543, "global_step": 295418, "epoch": 2441} {"train_loss": -43.283634185791016, "global_step": 295419, "epoch": 2441} {"train_loss": -43.154022216796875, "global_step": 295420, "epoch": 2441} {"train_loss": -43.77251052856445, "global_step": 295421, "epoch": 2441} {"train_loss": -42.74421691894531, "global_step": 295422, "epoch": 2441} {"train_loss": -43.61488723754883, "global_step": 295423, "epoch": 2441} {"train_loss": -42.551700592041016, "global_step": 295424, "epoch": 2441} {"train_loss": -43.45858383178711, "global_step": 295425, "epoch": 2441} {"train_loss": -43.14603805541992, "global_step": 295426, "epoch": 2441} {"train_loss": -43.09719467163086, "global_step": 295427, "epoch": 2441} {"train_loss": -43.4627685546875, "global_step": 295428, "epoch": 2441} {"train_loss": -43.10093307495117, "global_step": 295429, "epoch": 2441} {"train_loss": -43.18809127807617, "global_step": 295430, "epoch": 2441} {"train_loss": -42.9171257019043, "global_step": 295431, "epoch": 2441} {"train_loss": -43.37924575805664, "global_step": 295432, "epoch": 2441} {"train_loss": -43.79154586791992, "global_step": 295433, "epoch": 2441} {"train_loss": -43.31852722167969, "global_step": 295434, "epoch": 2441} {"train_loss": -43.32400894165039, "global_step": 295435, "epoch": 2441} {"train_loss": -43.71303176879883, "global_step": 295436, "epoch": 2441} {"train_loss": -43.50966262817383, "global_step": 295437, "epoch": 2441} {"train_loss": -42.71859359741211, "global_step": 295438, "epoch": 2441} {"train_loss": -42.8826904296875, "global_step": 295439, "epoch": 2441} {"train_loss": -42.20515060424805, "global_step": 295440, "epoch": 2441} {"train_loss": -43.724365234375, "global_step": 295441, "epoch": 2441} {"train_loss": -43.469337463378906, "global_step": 295442, "epoch": 2441} {"train_loss": -42.79732894897461, "global_step": 295443, "epoch": 2441} {"train_loss": -43.561832427978516, "global_step": 295444, "epoch": 2441} {"train_loss": -42.24726486206055, "global_step": 295445, "epoch": 2441} {"train_loss": -42.17625045776367, "global_step": 295446, "epoch": 2441} {"train_loss": -42.33125686645508, "global_step": 295447, "epoch": 2441} {"train_loss": -42.857662200927734, "global_step": 295448, "epoch": 2441} {"train_loss": -42.709163665771484, "global_step": 295449, "epoch": 2441} {"train_loss": -43.2893180847168, "global_step": 295450, "epoch": 2441} {"train_loss": -42.6513786315918, "global_step": 295451, "epoch": 2441} {"train_loss": -43.00564193725586, "global_step": 295452, "epoch": 2441} {"train_loss": -38.78253936767578, "global_step": 295453, "epoch": 2441} {"train_loss": -43.04213333129883, "global_step": 295454, "epoch": 2441} {"train_loss": -42.20088577270508, "global_step": 295455, "epoch": 2441} {"train_loss": -42.6966552734375, "global_step": 295456, "epoch": 2441} {"train_loss": -42.63417434692383, "global_step": 295457, "epoch": 2441} {"train_loss": -41.16425323486328, "global_step": 295458, "epoch": 2441} {"train_loss": -42.368988037109375, "global_step": 295459, "epoch": 2441} {"train_loss": -43.06283187866211, "global_step": 295460, "epoch": 2441} {"train_loss": -42.45661926269531, "global_step": 295461, "epoch": 2441} {"train_loss": -42.6872444152832, "global_step": 295462, "epoch": 2441} {"train_loss": -42.984886169433594, "global_step": 295463, "epoch": 2441} {"train_loss": -42.16294479370117, "global_step": 295464, "epoch": 2441} {"train_loss": -42.406551361083984, "global_step": 295465, "epoch": 2441} {"train_loss": -43.1288948059082, "global_step": 295466, "epoch": 2441} {"train_loss": -42.182979583740234, "global_step": 295467, "epoch": 2441} {"train_loss": -41.699581146240234, "global_step": 295468, "epoch": 2441} {"train_loss": -42.780941009521484, "global_step": 295469, "epoch": 2441} {"train_loss": -40.8653678894043, "global_step": 295470, "epoch": 2441} {"train_loss": -42.375877380371094, "global_step": 295471, "epoch": 2441} {"train_loss": -41.447425842285156, "global_step": 295472, "epoch": 2441} {"train_loss": -42.933753967285156, "global_step": 295473, "epoch": 2441} {"train_loss": -39.290950775146484, "global_step": 295474, "epoch": 2441} {"train_loss": -40.96372604370117, "global_step": 295475, "epoch": 2441} {"train_loss": -42.28189468383789, "global_step": 295476, "epoch": 2441} {"train_loss": -41.97035598754883, "global_step": 295477, "epoch": 2441} {"train_loss": -40.4578971862793, "global_step": 295478, "epoch": 2441} {"train_loss": -41.27958297729492, "global_step": 295479, "epoch": 2441} {"train_loss": -42.42548370361328, "global_step": 295480, "epoch": 2441} {"train_loss": -42.46312117773639, "global_step": 295481, "epoch": 2441, "val_loss": 2452583.25} {"train_loss": -42.89755630493164, "global_step": 295482, "epoch": 2442} {"train_loss": -40.983089447021484, "global_step": 295483, "epoch": 2442} {"train_loss": -41.61609649658203, "global_step": 295484, "epoch": 2442} {"train_loss": -41.434356689453125, "global_step": 295485, "epoch": 2442} {"train_loss": -39.152374267578125, "global_step": 295486, "epoch": 2442} {"train_loss": -41.54925537109375, "global_step": 295487, "epoch": 2442} {"train_loss": -41.0234489440918, "global_step": 295488, "epoch": 2442} {"train_loss": -41.87411117553711, "global_step": 295489, "epoch": 2442} {"train_loss": -41.36076736450195, "global_step": 295490, "epoch": 2442} {"train_loss": -42.408058166503906, "global_step": 295491, "epoch": 2442} {"train_loss": -42.00746536254883, "global_step": 295492, "epoch": 2442} {"train_loss": -42.19987106323242, "global_step": 295493, "epoch": 2442} {"train_loss": -43.08990478515625, "global_step": 295494, "epoch": 2442} {"train_loss": -41.20537185668945, "global_step": 295495, "epoch": 2442} {"train_loss": -42.92466354370117, "global_step": 295496, "epoch": 2442} {"train_loss": -41.671260833740234, "global_step": 295497, "epoch": 2442} {"train_loss": -39.43397903442383, "global_step": 295498, "epoch": 2442} {"train_loss": -39.29248809814453, "global_step": 295499, "epoch": 2442} {"train_loss": -40.77390670776367, "global_step": 295500, "epoch": 2442} {"train_loss": -40.41788101196289, "global_step": 295501, "epoch": 2442} {"train_loss": -37.17190170288086, "global_step": 295502, "epoch": 2442} {"train_loss": -40.520294189453125, "global_step": 295503, "epoch": 2442} {"train_loss": -35.25044250488281, "global_step": 295504, "epoch": 2442} {"train_loss": -36.87696075439453, "global_step": 295505, "epoch": 2442} {"train_loss": -41.968318939208984, "global_step": 295506, "epoch": 2442} {"train_loss": -38.971351623535156, "global_step": 295507, "epoch": 2442} {"train_loss": -41.451988220214844, "global_step": 295508, "epoch": 2442} {"train_loss": -40.067867279052734, "global_step": 295509, "epoch": 2442} {"train_loss": -40.224525451660156, "global_step": 295510, "epoch": 2442} {"train_loss": -41.57351303100586, "global_step": 295511, "epoch": 2442} {"train_loss": -35.918460845947266, "global_step": 295512, "epoch": 2442} {"train_loss": -41.190673828125, "global_step": 295513, "epoch": 2442} {"train_loss": -41.84172821044922, "global_step": 295514, "epoch": 2442} {"train_loss": -41.50045394897461, "global_step": 295515, "epoch": 2442} {"train_loss": -41.27120590209961, "global_step": 295516, "epoch": 2442} {"train_loss": -40.86519241333008, "global_step": 295517, "epoch": 2442} {"train_loss": -42.21505355834961, "global_step": 295518, "epoch": 2442} {"train_loss": -41.17102813720703, "global_step": 295519, "epoch": 2442} {"train_loss": -39.619056701660156, "global_step": 295520, "epoch": 2442} {"train_loss": -41.19820022583008, "global_step": 295521, "epoch": 2442} {"train_loss": -42.48250198364258, "global_step": 295522, "epoch": 2442} {"train_loss": -41.785186767578125, "global_step": 295523, "epoch": 2442} {"train_loss": -40.6239128112793, "global_step": 295524, "epoch": 2442} {"train_loss": -42.355804443359375, "global_step": 295525, "epoch": 2442} {"train_loss": -41.865325927734375, "global_step": 295526, "epoch": 2442} {"train_loss": -42.390567779541016, "global_step": 295527, "epoch": 2442} {"train_loss": -42.41984558105469, "global_step": 295528, "epoch": 2442} {"train_loss": -39.099884033203125, "global_step": 295529, "epoch": 2442} {"train_loss": -42.25167465209961, "global_step": 295530, "epoch": 2442} {"train_loss": -40.410911560058594, "global_step": 295531, "epoch": 2442} {"train_loss": -40.89984893798828, "global_step": 295532, "epoch": 2442} {"train_loss": -41.63289260864258, "global_step": 295533, "epoch": 2442} {"train_loss": -38.948246002197266, "global_step": 295534, "epoch": 2442} {"train_loss": -42.7324333190918, "global_step": 295535, "epoch": 2442} {"train_loss": -36.53536605834961, "global_step": 295536, "epoch": 2442} {"train_loss": -40.1397590637207, "global_step": 295537, "epoch": 2442} {"train_loss": -39.47298812866211, "global_step": 295538, "epoch": 2442} {"train_loss": -41.66668701171875, "global_step": 295539, "epoch": 2442} {"train_loss": -38.4829216003418, "global_step": 295540, "epoch": 2442} {"train_loss": -41.32792663574219, "global_step": 295541, "epoch": 2442} {"train_loss": -41.67684555053711, "global_step": 295542, "epoch": 2442} {"train_loss": -41.51316452026367, "global_step": 295543, "epoch": 2442} {"train_loss": -41.280948638916016, "global_step": 295544, "epoch": 2442} {"train_loss": -39.05855941772461, "global_step": 295545, "epoch": 2442} {"train_loss": -36.90729522705078, "global_step": 295546, "epoch": 2442} {"train_loss": -40.31277084350586, "global_step": 295547, "epoch": 2442} {"train_loss": -40.15584945678711, "global_step": 295548, "epoch": 2442} {"train_loss": -39.407596588134766, "global_step": 295549, "epoch": 2442} {"train_loss": -40.62836456298828, "global_step": 295550, "epoch": 2442} {"train_loss": -39.982852935791016, "global_step": 295551, "epoch": 2442} {"train_loss": -38.65556716918945, "global_step": 295552, "epoch": 2442} {"train_loss": -40.14860153198242, "global_step": 295553, "epoch": 2442} {"train_loss": -38.667842864990234, "global_step": 295554, "epoch": 2442} {"train_loss": -40.83126449584961, "global_step": 295555, "epoch": 2442} {"train_loss": -41.24750900268555, "global_step": 295556, "epoch": 2442} {"train_loss": -38.20258331298828, "global_step": 295557, "epoch": 2442} {"train_loss": -41.54517364501953, "global_step": 295558, "epoch": 2442} {"train_loss": -41.639434814453125, "global_step": 295559, "epoch": 2442} {"train_loss": -42.1761360168457, "global_step": 295560, "epoch": 2442} {"train_loss": -39.80377197265625, "global_step": 295561, "epoch": 2442} {"train_loss": -40.348960876464844, "global_step": 295562, "epoch": 2442} {"train_loss": -41.651363372802734, "global_step": 295563, "epoch": 2442} {"train_loss": -42.019317626953125, "global_step": 295564, "epoch": 2442} {"train_loss": -40.455543518066406, "global_step": 295565, "epoch": 2442} {"train_loss": -41.687129974365234, "global_step": 295566, "epoch": 2442} {"train_loss": -37.66157150268555, "global_step": 295567, "epoch": 2442} {"train_loss": -41.36359405517578, "global_step": 295568, "epoch": 2442} {"train_loss": -40.7380256652832, "global_step": 295569, "epoch": 2442} {"train_loss": -39.21052169799805, "global_step": 295570, "epoch": 2442} {"train_loss": -41.75588607788086, "global_step": 295571, "epoch": 2442} {"train_loss": -41.3869743347168, "global_step": 295572, "epoch": 2442} {"train_loss": -42.041236877441406, "global_step": 295573, "epoch": 2442} {"train_loss": -41.9114990234375, "global_step": 295574, "epoch": 2442} {"train_loss": -40.9918212890625, "global_step": 295575, "epoch": 2442} {"train_loss": -42.12654495239258, "global_step": 295576, "epoch": 2442} {"train_loss": -41.44467544555664, "global_step": 295577, "epoch": 2442} {"train_loss": -41.71989822387695, "global_step": 295578, "epoch": 2442} {"train_loss": -41.6849479675293, "global_step": 295579, "epoch": 2442} {"train_loss": -42.58451461791992, "global_step": 295580, "epoch": 2442} {"train_loss": -42.46718215942383, "global_step": 295581, "epoch": 2442} {"train_loss": -42.920814514160156, "global_step": 295582, "epoch": 2442} {"train_loss": -42.405635833740234, "global_step": 295583, "epoch": 2442} {"train_loss": -41.94158935546875, "global_step": 295584, "epoch": 2442} {"train_loss": -42.40825271606445, "global_step": 295585, "epoch": 2442} {"train_loss": -42.11434555053711, "global_step": 295586, "epoch": 2442} {"train_loss": -40.662235260009766, "global_step": 295587, "epoch": 2442} {"train_loss": -42.515907287597656, "global_step": 295588, "epoch": 2442} {"train_loss": -42.4903564453125, "global_step": 295589, "epoch": 2442} {"train_loss": -41.58417510986328, "global_step": 295590, "epoch": 2442} {"train_loss": -42.2628288269043, "global_step": 295591, "epoch": 2442} {"train_loss": -41.78727340698242, "global_step": 295592, "epoch": 2442} {"train_loss": -42.85349655151367, "global_step": 295593, "epoch": 2442} {"train_loss": -42.97164535522461, "global_step": 295594, "epoch": 2442} {"train_loss": -42.98859405517578, "global_step": 295595, "epoch": 2442} {"train_loss": -42.754512786865234, "global_step": 295596, "epoch": 2442} {"train_loss": -43.250885009765625, "global_step": 295597, "epoch": 2442} {"train_loss": -40.31719207763672, "global_step": 295598, "epoch": 2442} {"train_loss": -43.240325927734375, "global_step": 295599, "epoch": 2442} {"train_loss": -43.23809051513672, "global_step": 295600, "epoch": 2442} {"train_loss": -42.15949630737305, "global_step": 295601, "epoch": 2442} {"train_loss": -41.02802960734722, "global_step": 295602, "epoch": 2442, "val_loss": 2693966.5} {"train_loss": -42.98341751098633, "global_step": 295603, "epoch": 2443} {"train_loss": -41.148677825927734, "global_step": 295604, "epoch": 2443} {"train_loss": -42.179054260253906, "global_step": 295605, "epoch": 2443} {"train_loss": -43.09453201293945, "global_step": 295606, "epoch": 2443} {"train_loss": -42.372352600097656, "global_step": 295607, "epoch": 2443} {"train_loss": -42.75709915161133, "global_step": 295608, "epoch": 2443} {"train_loss": -43.19606399536133, "global_step": 295609, "epoch": 2443} {"train_loss": -42.6041374206543, "global_step": 295610, "epoch": 2443} {"train_loss": -42.863460540771484, "global_step": 295611, "epoch": 2443} {"train_loss": -43.20295333862305, "global_step": 295612, "epoch": 2443} {"train_loss": -42.4027214050293, "global_step": 295613, "epoch": 2443} {"train_loss": -42.52651596069336, "global_step": 295614, "epoch": 2443} {"train_loss": -43.3464241027832, "global_step": 295615, "epoch": 2443} {"train_loss": -41.600582122802734, "global_step": 295616, "epoch": 2443} {"train_loss": -41.427894592285156, "global_step": 295617, "epoch": 2443} {"train_loss": -42.66121292114258, "global_step": 295618, "epoch": 2443} {"train_loss": -43.0163688659668, "global_step": 295619, "epoch": 2443} {"train_loss": -42.7457160949707, "global_step": 295620, "epoch": 2443} {"train_loss": -40.319034576416016, "global_step": 295621, "epoch": 2443} {"train_loss": -41.910701751708984, "global_step": 295622, "epoch": 2443} {"train_loss": -42.845672607421875, "global_step": 295623, "epoch": 2443} {"train_loss": -41.730892181396484, "global_step": 295624, "epoch": 2443} {"train_loss": -42.64038848876953, "global_step": 295625, "epoch": 2443} {"train_loss": -42.15317916870117, "global_step": 295626, "epoch": 2443} {"train_loss": -42.66400909423828, "global_step": 295627, "epoch": 2443} {"train_loss": -42.10883331298828, "global_step": 295628, "epoch": 2443} {"train_loss": -42.70355987548828, "global_step": 295629, "epoch": 2443} {"train_loss": -42.64430236816406, "global_step": 295630, "epoch": 2443} {"train_loss": -42.778812408447266, "global_step": 295631, "epoch": 2443} {"train_loss": -43.04348373413086, "global_step": 295632, "epoch": 2443} {"train_loss": -42.739845275878906, "global_step": 295633, "epoch": 2443} {"train_loss": -43.345306396484375, "global_step": 295634, "epoch": 2443} {"train_loss": -42.83616256713867, "global_step": 295635, "epoch": 2443} {"train_loss": -42.88383102416992, "global_step": 295636, "epoch": 2443} {"train_loss": -42.67936325073242, "global_step": 295637, "epoch": 2443} {"train_loss": -42.95693588256836, "global_step": 295638, "epoch": 2443} {"train_loss": -42.93701171875, "global_step": 295639, "epoch": 2443} {"train_loss": -42.33177185058594, "global_step": 295640, "epoch": 2443} {"train_loss": -43.251949310302734, "global_step": 295641, "epoch": 2443} {"train_loss": -42.396018981933594, "global_step": 295642, "epoch": 2443} {"train_loss": -41.40022659301758, "global_step": 295643, "epoch": 2443} {"train_loss": -43.560482025146484, "global_step": 295644, "epoch": 2443} {"train_loss": -42.767154693603516, "global_step": 295645, "epoch": 2443} {"train_loss": -39.841758728027344, "global_step": 295646, "epoch": 2443} {"train_loss": -38.38406753540039, "global_step": 295647, "epoch": 2443} {"train_loss": -42.569698333740234, "global_step": 295648, "epoch": 2443} {"train_loss": -37.32847213745117, "global_step": 295649, "epoch": 2443} {"train_loss": -30.399301528930664, "global_step": 295650, "epoch": 2443} {"train_loss": -35.20841979980469, "global_step": 295651, "epoch": 2443} {"train_loss": -41.67618942260742, "global_step": 295652, "epoch": 2443} {"train_loss": -34.01716232299805, "global_step": 295653, "epoch": 2443} {"train_loss": -39.34910202026367, "global_step": 295654, "epoch": 2443} {"train_loss": -40.3354377746582, "global_step": 295655, "epoch": 2443} {"train_loss": -37.54323959350586, "global_step": 295656, "epoch": 2443} {"train_loss": -40.57243728637695, "global_step": 295657, "epoch": 2443} {"train_loss": -38.988189697265625, "global_step": 295658, "epoch": 2443} {"train_loss": -40.383052825927734, "global_step": 295659, "epoch": 2443} {"train_loss": -40.3462028503418, "global_step": 295660, "epoch": 2443} {"train_loss": -40.555843353271484, "global_step": 295661, "epoch": 2443} {"train_loss": -41.70268630981445, "global_step": 295662, "epoch": 2443} {"train_loss": -40.0139045715332, "global_step": 295663, "epoch": 2443} {"train_loss": -41.85755157470703, "global_step": 295664, "epoch": 2443} {"train_loss": -41.28634262084961, "global_step": 295665, "epoch": 2443} {"train_loss": -40.61711502075195, "global_step": 295666, "epoch": 2443} {"train_loss": -41.75802993774414, "global_step": 295667, "epoch": 2443} {"train_loss": -39.654090881347656, "global_step": 295668, "epoch": 2443} {"train_loss": -40.80332565307617, "global_step": 295669, "epoch": 2443} {"train_loss": -41.3813591003418, "global_step": 295670, "epoch": 2443} {"train_loss": -41.245357513427734, "global_step": 295671, "epoch": 2443} {"train_loss": -41.62981033325195, "global_step": 295672, "epoch": 2443} {"train_loss": -40.997314453125, "global_step": 295673, "epoch": 2443} {"train_loss": -41.9865608215332, "global_step": 295674, "epoch": 2443} {"train_loss": -41.57943344116211, "global_step": 295675, "epoch": 2443} {"train_loss": -41.54842758178711, "global_step": 295676, "epoch": 2443} {"train_loss": -42.80150604248047, "global_step": 295677, "epoch": 2443} {"train_loss": -41.5330924987793, "global_step": 295678, "epoch": 2443} {"train_loss": -42.4604606628418, "global_step": 295679, "epoch": 2443} {"train_loss": -41.282691955566406, "global_step": 295680, "epoch": 2443} {"train_loss": -42.683231353759766, "global_step": 295681, "epoch": 2443} {"train_loss": -41.87676239013672, "global_step": 295682, "epoch": 2443} {"train_loss": -42.68276596069336, "global_step": 295683, "epoch": 2443} {"train_loss": -41.528743743896484, "global_step": 295684, "epoch": 2443} {"train_loss": -42.1176872253418, "global_step": 295685, "epoch": 2443} {"train_loss": -42.61574935913086, "global_step": 295686, "epoch": 2443} {"train_loss": -42.76815414428711, "global_step": 295687, "epoch": 2443} {"train_loss": -43.05742263793945, "global_step": 295688, "epoch": 2443} {"train_loss": -43.031185150146484, "global_step": 295689, "epoch": 2443} {"train_loss": -42.329891204833984, "global_step": 295690, "epoch": 2443} {"train_loss": -42.500732421875, "global_step": 295691, "epoch": 2443} {"train_loss": -42.476436614990234, "global_step": 295692, "epoch": 2443} {"train_loss": -43.295101165771484, "global_step": 295693, "epoch": 2443} {"train_loss": -40.42966842651367, "global_step": 295694, "epoch": 2443} {"train_loss": -43.241886138916016, "global_step": 295695, "epoch": 2443} {"train_loss": -41.77923583984375, "global_step": 295696, "epoch": 2443} {"train_loss": -43.186241149902344, "global_step": 295697, "epoch": 2443} {"train_loss": -43.42637634277344, "global_step": 295698, "epoch": 2443} {"train_loss": -42.62385177612305, "global_step": 295699, "epoch": 2443} {"train_loss": -42.9201774597168, "global_step": 295700, "epoch": 2443} {"train_loss": -43.74882888793945, "global_step": 295701, "epoch": 2443} {"train_loss": -43.530242919921875, "global_step": 295702, "epoch": 2443} {"train_loss": -43.17611312866211, "global_step": 295703, "epoch": 2443} {"train_loss": -43.42972946166992, "global_step": 295704, "epoch": 2443} {"train_loss": -43.135372161865234, "global_step": 295705, "epoch": 2443} {"train_loss": -43.04206085205078, "global_step": 295706, "epoch": 2443} {"train_loss": -43.70271682739258, "global_step": 295707, "epoch": 2443} {"train_loss": -43.61385726928711, "global_step": 295708, "epoch": 2443} {"train_loss": -43.25750732421875, "global_step": 295709, "epoch": 2443} {"train_loss": -43.09724044799805, "global_step": 295710, "epoch": 2443} {"train_loss": -43.510398864746094, "global_step": 295711, "epoch": 2443} {"train_loss": -43.69138717651367, "global_step": 295712, "epoch": 2443} {"train_loss": -43.89948272705078, "global_step": 295713, "epoch": 2443} {"train_loss": -43.784942626953125, "global_step": 295714, "epoch": 2443} {"train_loss": -43.34601974487305, "global_step": 295715, "epoch": 2443} {"train_loss": -43.78290939331055, "global_step": 295716, "epoch": 2443} {"train_loss": -41.987953186035156, "global_step": 295717, "epoch": 2443} {"train_loss": -43.88862991333008, "global_step": 295718, "epoch": 2443} {"train_loss": -43.292781829833984, "global_step": 295719, "epoch": 2443} {"train_loss": -43.028236389160156, "global_step": 295720, "epoch": 2443} {"train_loss": -43.89789962768555, "global_step": 295721, "epoch": 2443} {"train_loss": -43.18636703491211, "global_step": 295722, "epoch": 2443} {"train_loss": -42.005507776559874, "global_step": 295723, "epoch": 2443, "val_loss": 2478776.5} {"train_loss": -43.106929779052734, "global_step": 295724, "epoch": 2444} {"train_loss": -43.649993896484375, "global_step": 295725, "epoch": 2444} {"train_loss": -43.68196105957031, "global_step": 295726, "epoch": 2444} {"train_loss": -42.1893424987793, "global_step": 295727, "epoch": 2444} {"train_loss": -44.00300216674805, "global_step": 295728, "epoch": 2444} {"train_loss": -43.72739791870117, "global_step": 295729, "epoch": 2444} {"train_loss": -44.03846740722656, "global_step": 295730, "epoch": 2444} {"train_loss": -43.593265533447266, "global_step": 295731, "epoch": 2444} {"train_loss": -43.155601501464844, "global_step": 295732, "epoch": 2444} {"train_loss": -43.99671936035156, "global_step": 295733, "epoch": 2444} {"train_loss": -43.546546936035156, "global_step": 295734, "epoch": 2444} {"train_loss": -43.47315216064453, "global_step": 295735, "epoch": 2444} {"train_loss": -44.00202560424805, "global_step": 295736, "epoch": 2444} {"train_loss": -43.48214340209961, "global_step": 295737, "epoch": 2444} {"train_loss": -43.37725830078125, "global_step": 295738, "epoch": 2444} {"train_loss": -42.8555793762207, "global_step": 295739, "epoch": 2444} {"train_loss": -43.99542999267578, "global_step": 295740, "epoch": 2444} {"train_loss": -43.83367156982422, "global_step": 295741, "epoch": 2444} {"train_loss": -44.22391891479492, "global_step": 295742, "epoch": 2444} {"train_loss": -43.55023956298828, "global_step": 295743, "epoch": 2444} {"train_loss": -43.91731262207031, "global_step": 295744, "epoch": 2444} {"train_loss": -43.6263313293457, "global_step": 295745, "epoch": 2444} {"train_loss": -43.94483947753906, "global_step": 295746, "epoch": 2444} {"train_loss": -42.9242057800293, "global_step": 295747, "epoch": 2444} {"train_loss": -42.4705810546875, "global_step": 295748, "epoch": 2444} {"train_loss": -41.47722244262695, "global_step": 295749, "epoch": 2444} {"train_loss": -41.40653610229492, "global_step": 295750, "epoch": 2444} {"train_loss": -42.37113571166992, "global_step": 295751, "epoch": 2444} {"train_loss": -41.97370529174805, "global_step": 295752, "epoch": 2444} {"train_loss": -42.32992172241211, "global_step": 295753, "epoch": 2444} {"train_loss": -42.744388580322266, "global_step": 295754, "epoch": 2444} {"train_loss": -43.433589935302734, "global_step": 295755, "epoch": 2444} {"train_loss": -42.97245788574219, "global_step": 295756, "epoch": 2444} {"train_loss": -42.01681900024414, "global_step": 295757, "epoch": 2444} {"train_loss": -40.47098922729492, "global_step": 295758, "epoch": 2444} {"train_loss": -43.34059524536133, "global_step": 295759, "epoch": 2444} {"train_loss": -40.710323333740234, "global_step": 295760, "epoch": 2444} {"train_loss": -39.58024597167969, "global_step": 295761, "epoch": 2444} {"train_loss": -40.5400505065918, "global_step": 295762, "epoch": 2444} {"train_loss": -42.27517318725586, "global_step": 295763, "epoch": 2444} {"train_loss": -40.91314697265625, "global_step": 295764, "epoch": 2444} {"train_loss": -37.933998107910156, "global_step": 295765, "epoch": 2444} {"train_loss": -37.16314697265625, "global_step": 295766, "epoch": 2444} {"train_loss": -40.367069244384766, "global_step": 295767, "epoch": 2444} {"train_loss": -42.10663986206055, "global_step": 295768, "epoch": 2444} {"train_loss": -39.933372497558594, "global_step": 295769, "epoch": 2444} {"train_loss": -41.167694091796875, "global_step": 295770, "epoch": 2444} {"train_loss": -41.899776458740234, "global_step": 295771, "epoch": 2444} {"train_loss": -41.27582931518555, "global_step": 295772, "epoch": 2444} {"train_loss": -42.17129135131836, "global_step": 295773, "epoch": 2444} {"train_loss": -41.856380462646484, "global_step": 295774, "epoch": 2444} {"train_loss": -40.638328552246094, "global_step": 295775, "epoch": 2444} {"train_loss": -42.489986419677734, "global_step": 295776, "epoch": 2444} {"train_loss": -41.471595764160156, "global_step": 295777, "epoch": 2444} {"train_loss": -42.038570404052734, "global_step": 295778, "epoch": 2444} {"train_loss": -41.06855392456055, "global_step": 295779, "epoch": 2444} {"train_loss": -42.0709228515625, "global_step": 295780, "epoch": 2444} {"train_loss": -42.55497360229492, "global_step": 295781, "epoch": 2444} {"train_loss": -42.58980941772461, "global_step": 295782, "epoch": 2444} {"train_loss": -42.79977798461914, "global_step": 295783, "epoch": 2444} {"train_loss": -42.267730712890625, "global_step": 295784, "epoch": 2444} {"train_loss": -42.64895248413086, "global_step": 295785, "epoch": 2444} {"train_loss": -42.53955841064453, "global_step": 295786, "epoch": 2444} {"train_loss": -42.602256774902344, "global_step": 295787, "epoch": 2444} {"train_loss": -41.92255401611328, "global_step": 295788, "epoch": 2444} {"train_loss": -42.69374465942383, "global_step": 295789, "epoch": 2444} {"train_loss": -42.34693908691406, "global_step": 295790, "epoch": 2444} {"train_loss": -43.10797119140625, "global_step": 295791, "epoch": 2444} {"train_loss": -42.49908447265625, "global_step": 295792, "epoch": 2444} {"train_loss": -43.05073928833008, "global_step": 295793, "epoch": 2444} {"train_loss": -43.12158203125, "global_step": 295794, "epoch": 2444} {"train_loss": -42.1966552734375, "global_step": 295795, "epoch": 2444} {"train_loss": -42.638641357421875, "global_step": 295796, "epoch": 2444} {"train_loss": -43.41504669189453, "global_step": 295797, "epoch": 2444} {"train_loss": -42.779701232910156, "global_step": 295798, "epoch": 2444} {"train_loss": -42.738197326660156, "global_step": 295799, "epoch": 2444} {"train_loss": -42.79962921142578, "global_step": 295800, "epoch": 2444} {"train_loss": -42.7209587097168, "global_step": 295801, "epoch": 2444} {"train_loss": -42.89018630981445, "global_step": 295802, "epoch": 2444} {"train_loss": -43.2900390625, "global_step": 295803, "epoch": 2444} {"train_loss": -42.941864013671875, "global_step": 295804, "epoch": 2444} {"train_loss": -43.204681396484375, "global_step": 295805, "epoch": 2444} {"train_loss": -43.00992965698242, "global_step": 295806, "epoch": 2444} {"train_loss": -43.47601318359375, "global_step": 295807, "epoch": 2444} {"train_loss": -42.4736328125, "global_step": 295808, "epoch": 2444} {"train_loss": -43.21744918823242, "global_step": 295809, "epoch": 2444} {"train_loss": -43.61475372314453, "global_step": 295810, "epoch": 2444} {"train_loss": -43.545711517333984, "global_step": 295811, "epoch": 2444} {"train_loss": -43.25691604614258, "global_step": 295812, "epoch": 2444} {"train_loss": -43.019264221191406, "global_step": 295813, "epoch": 2444} {"train_loss": -43.5195198059082, "global_step": 295814, "epoch": 2444} {"train_loss": -43.43291091918945, "global_step": 295815, "epoch": 2444} {"train_loss": -43.42156219482422, "global_step": 295816, "epoch": 2444} {"train_loss": -43.64575958251953, "global_step": 295817, "epoch": 2444} {"train_loss": -43.074607849121094, "global_step": 295818, "epoch": 2444} {"train_loss": -43.62655258178711, "global_step": 295819, "epoch": 2444} {"train_loss": -41.8102912902832, "global_step": 295820, "epoch": 2444} {"train_loss": -43.092716217041016, "global_step": 295821, "epoch": 2444} {"train_loss": -42.932212829589844, "global_step": 295822, "epoch": 2444} {"train_loss": -42.91819381713867, "global_step": 295823, "epoch": 2444} {"train_loss": -42.859107971191406, "global_step": 295824, "epoch": 2444} {"train_loss": -43.141231536865234, "global_step": 295825, "epoch": 2444} {"train_loss": -42.70209884643555, "global_step": 295826, "epoch": 2444} {"train_loss": -41.50147247314453, "global_step": 295827, "epoch": 2444} {"train_loss": -43.20811462402344, "global_step": 295828, "epoch": 2444} {"train_loss": -43.06028366088867, "global_step": 295829, "epoch": 2444} {"train_loss": -42.58278274536133, "global_step": 295830, "epoch": 2444} {"train_loss": -42.432159423828125, "global_step": 295831, "epoch": 2444} {"train_loss": -43.21125793457031, "global_step": 295832, "epoch": 2444} {"train_loss": -42.6175537109375, "global_step": 295833, "epoch": 2444} {"train_loss": -42.74239730834961, "global_step": 295834, "epoch": 2444} {"train_loss": -42.903743743896484, "global_step": 295835, "epoch": 2444} {"train_loss": -42.5257682800293, "global_step": 295836, "epoch": 2444} {"train_loss": -42.00114059448242, "global_step": 295837, "epoch": 2444} {"train_loss": -43.800636291503906, "global_step": 295838, "epoch": 2444} {"train_loss": -42.66799545288086, "global_step": 295839, "epoch": 2444} {"train_loss": -42.2238655090332, "global_step": 295840, "epoch": 2444} {"train_loss": -43.166072845458984, "global_step": 295841, "epoch": 2444} {"train_loss": -41.949546813964844, "global_step": 295842, "epoch": 2444} {"train_loss": -41.34249496459961, "global_step": 295843, "epoch": 2444} {"train_loss": -42.592658744370645, "global_step": 295844, "epoch": 2444, "val_loss": 2551672.75} {"train_loss": -41.94300079345703, "global_step": 295845, "epoch": 2445} {"train_loss": -41.959014892578125, "global_step": 295846, "epoch": 2445} {"train_loss": -43.196563720703125, "global_step": 295847, "epoch": 2445} {"train_loss": -40.99609375, "global_step": 295848, "epoch": 2445} {"train_loss": -42.94218063354492, "global_step": 295849, "epoch": 2445} {"train_loss": -42.446224212646484, "global_step": 295850, "epoch": 2445} {"train_loss": -42.173709869384766, "global_step": 295851, "epoch": 2445} {"train_loss": -42.97021484375, "global_step": 295852, "epoch": 2445} {"train_loss": -41.33686065673828, "global_step": 295853, "epoch": 2445} {"train_loss": -41.0785026550293, "global_step": 295854, "epoch": 2445} {"train_loss": -42.867713928222656, "global_step": 295855, "epoch": 2445} {"train_loss": -41.74951934814453, "global_step": 295856, "epoch": 2445} {"train_loss": -40.56473922729492, "global_step": 295857, "epoch": 2445} {"train_loss": -41.80869674682617, "global_step": 295858, "epoch": 2445} {"train_loss": -42.24442672729492, "global_step": 295859, "epoch": 2445} {"train_loss": -40.68050765991211, "global_step": 295860, "epoch": 2445} {"train_loss": -41.83619689941406, "global_step": 295861, "epoch": 2445} {"train_loss": -41.6420783996582, "global_step": 295862, "epoch": 2445} {"train_loss": -42.38520050048828, "global_step": 295863, "epoch": 2445} {"train_loss": -42.49578094482422, "global_step": 295864, "epoch": 2445} {"train_loss": -42.75798416137695, "global_step": 295865, "epoch": 2445} {"train_loss": -42.535030364990234, "global_step": 295866, "epoch": 2445} {"train_loss": -43.40168380737305, "global_step": 295867, "epoch": 2445} {"train_loss": -42.555625915527344, "global_step": 295868, "epoch": 2445} {"train_loss": -42.65322494506836, "global_step": 295869, "epoch": 2445} {"train_loss": -43.29264450073242, "global_step": 295870, "epoch": 2445} {"train_loss": -42.620460510253906, "global_step": 295871, "epoch": 2445} {"train_loss": -42.997493743896484, "global_step": 295872, "epoch": 2445} {"train_loss": -43.314632415771484, "global_step": 295873, "epoch": 2445} {"train_loss": -42.27920150756836, "global_step": 295874, "epoch": 2445} {"train_loss": -43.16355514526367, "global_step": 295875, "epoch": 2445} {"train_loss": -42.485267639160156, "global_step": 295876, "epoch": 2445} {"train_loss": -43.160247802734375, "global_step": 295877, "epoch": 2445} {"train_loss": -42.887962341308594, "global_step": 295878, "epoch": 2445} {"train_loss": -43.54885482788086, "global_step": 295879, "epoch": 2445} {"train_loss": -42.7801513671875, "global_step": 295880, "epoch": 2445} {"train_loss": -43.06039047241211, "global_step": 295881, "epoch": 2445} {"train_loss": -43.27227783203125, "global_step": 295882, "epoch": 2445} {"train_loss": -43.33243179321289, "global_step": 295883, "epoch": 2445} {"train_loss": -43.60714340209961, "global_step": 295884, "epoch": 2445} {"train_loss": -43.46133041381836, "global_step": 295885, "epoch": 2445} {"train_loss": -43.09513473510742, "global_step": 295886, "epoch": 2445} {"train_loss": -43.66453170776367, "global_step": 295887, "epoch": 2445} {"train_loss": -43.18285369873047, "global_step": 295888, "epoch": 2445} {"train_loss": -43.20331573486328, "global_step": 295889, "epoch": 2445} {"train_loss": -42.90270233154297, "global_step": 295890, "epoch": 2445} {"train_loss": -43.583316802978516, "global_step": 295891, "epoch": 2445} {"train_loss": -42.93122482299805, "global_step": 295892, "epoch": 2445} {"train_loss": -43.48421096801758, "global_step": 295893, "epoch": 2445} {"train_loss": -43.79343795776367, "global_step": 295894, "epoch": 2445} {"train_loss": -44.137447357177734, "global_step": 295895, "epoch": 2445} {"train_loss": -43.9150276184082, "global_step": 295896, "epoch": 2445} {"train_loss": -44.010780334472656, "global_step": 295897, "epoch": 2445} {"train_loss": -43.771514892578125, "global_step": 295898, "epoch": 2445} {"train_loss": -43.9349479675293, "global_step": 295899, "epoch": 2445} {"train_loss": -43.99851989746094, "global_step": 295900, "epoch": 2445} {"train_loss": -44.15665817260742, "global_step": 295901, "epoch": 2445} {"train_loss": -42.4798583984375, "global_step": 295902, "epoch": 2445} {"train_loss": -41.91107177734375, "global_step": 295903, "epoch": 2445} {"train_loss": -43.374324798583984, "global_step": 295904, "epoch": 2445} {"train_loss": -42.41483688354492, "global_step": 295905, "epoch": 2445} {"train_loss": -41.484188079833984, "global_step": 295906, "epoch": 2445} {"train_loss": -41.633338928222656, "global_step": 295907, "epoch": 2445} {"train_loss": -43.76945877075195, "global_step": 295908, "epoch": 2445} {"train_loss": -41.21156692504883, "global_step": 295909, "epoch": 2445} {"train_loss": -43.30707550048828, "global_step": 295910, "epoch": 2445} {"train_loss": -43.479671478271484, "global_step": 295911, "epoch": 2445} {"train_loss": -41.429405212402344, "global_step": 295912, "epoch": 2445} {"train_loss": -41.30727767944336, "global_step": 295913, "epoch": 2445} {"train_loss": -43.16059112548828, "global_step": 295914, "epoch": 2445} {"train_loss": -43.0407600402832, "global_step": 295915, "epoch": 2445} {"train_loss": -42.67792892456055, "global_step": 295916, "epoch": 2445} {"train_loss": -43.942012786865234, "global_step": 295917, "epoch": 2445} {"train_loss": -43.11967086791992, "global_step": 295918, "epoch": 2445} {"train_loss": -43.630062103271484, "global_step": 295919, "epoch": 2445} {"train_loss": -43.245601654052734, "global_step": 295920, "epoch": 2445} {"train_loss": -43.81174850463867, "global_step": 295921, "epoch": 2445} {"train_loss": -43.71809005737305, "global_step": 295922, "epoch": 2445} {"train_loss": -43.70725631713867, "global_step": 295923, "epoch": 2445} {"train_loss": -43.68037033081055, "global_step": 295924, "epoch": 2445} {"train_loss": -43.46662139892578, "global_step": 295925, "epoch": 2445} {"train_loss": -43.616493225097656, "global_step": 295926, "epoch": 2445} {"train_loss": -43.39059066772461, "global_step": 295927, "epoch": 2445} {"train_loss": -43.65109634399414, "global_step": 295928, "epoch": 2445} {"train_loss": -43.68320846557617, "global_step": 295929, "epoch": 2445} {"train_loss": -43.75942611694336, "global_step": 295930, "epoch": 2445} {"train_loss": -44.08417510986328, "global_step": 295931, "epoch": 2445} {"train_loss": -43.76308822631836, "global_step": 295932, "epoch": 2445} {"train_loss": -43.49531173706055, "global_step": 295933, "epoch": 2445} {"train_loss": -43.13605499267578, "global_step": 295934, "epoch": 2445} {"train_loss": -43.6484375, "global_step": 295935, "epoch": 2445} {"train_loss": -43.91179275512695, "global_step": 295936, "epoch": 2445} {"train_loss": -43.80733871459961, "global_step": 295937, "epoch": 2445} {"train_loss": -43.58718490600586, "global_step": 295938, "epoch": 2445} {"train_loss": -43.32038116455078, "global_step": 295939, "epoch": 2445} {"train_loss": -43.50486373901367, "global_step": 295940, "epoch": 2445} {"train_loss": -43.354339599609375, "global_step": 295941, "epoch": 2445} {"train_loss": -43.7993278503418, "global_step": 295942, "epoch": 2445} {"train_loss": -44.28904342651367, "global_step": 295943, "epoch": 2445} {"train_loss": -43.19343948364258, "global_step": 295944, "epoch": 2445} {"train_loss": -42.003997802734375, "global_step": 295945, "epoch": 2445} {"train_loss": -42.737091064453125, "global_step": 295946, "epoch": 2445} {"train_loss": -43.68384552001953, "global_step": 295947, "epoch": 2445} {"train_loss": -43.84688949584961, "global_step": 295948, "epoch": 2445} {"train_loss": -42.70553207397461, "global_step": 295949, "epoch": 2445} {"train_loss": -42.5276985168457, "global_step": 295950, "epoch": 2445} {"train_loss": -42.451255798339844, "global_step": 295951, "epoch": 2445} {"train_loss": -42.876731872558594, "global_step": 295952, "epoch": 2445} {"train_loss": -42.207069396972656, "global_step": 295953, "epoch": 2445} {"train_loss": -43.90190124511719, "global_step": 295954, "epoch": 2445} {"train_loss": -42.516788482666016, "global_step": 295955, "epoch": 2445} {"train_loss": -40.47127151489258, "global_step": 295956, "epoch": 2445} {"train_loss": -42.05039596557617, "global_step": 295957, "epoch": 2445} {"train_loss": -42.681941986083984, "global_step": 295958, "epoch": 2445} {"train_loss": -42.06650924682617, "global_step": 295959, "epoch": 2445} {"train_loss": -43.09797286987305, "global_step": 295960, "epoch": 2445} {"train_loss": -43.20166015625, "global_step": 295961, "epoch": 2445} {"train_loss": -41.217952728271484, "global_step": 295962, "epoch": 2445} {"train_loss": -41.88554000854492, "global_step": 295963, "epoch": 2445} {"train_loss": -43.5066032409668, "global_step": 295964, "epoch": 2445} {"train_loss": -42.909965168346055, "global_step": 295965, "epoch": 2445, "val_loss": 2561771.0} {"train_loss": -42.209320068359375, "global_step": 295966, "epoch": 2446} {"train_loss": -43.47150802612305, "global_step": 295967, "epoch": 2446} {"train_loss": -42.56218338012695, "global_step": 295968, "epoch": 2446} {"train_loss": -42.14973831176758, "global_step": 295969, "epoch": 2446} {"train_loss": -42.90190505981445, "global_step": 295970, "epoch": 2446} {"train_loss": -43.38984298706055, "global_step": 295971, "epoch": 2446} {"train_loss": -43.3453483581543, "global_step": 295972, "epoch": 2446} {"train_loss": -42.98966979980469, "global_step": 295973, "epoch": 2446} {"train_loss": -42.66172790527344, "global_step": 295974, "epoch": 2446} {"train_loss": -43.464778900146484, "global_step": 295975, "epoch": 2446} {"train_loss": -43.639991760253906, "global_step": 295976, "epoch": 2446} {"train_loss": -43.403743743896484, "global_step": 295977, "epoch": 2446} {"train_loss": -43.62083053588867, "global_step": 295978, "epoch": 2446} {"train_loss": -43.84657669067383, "global_step": 295979, "epoch": 2446} {"train_loss": -43.27381896972656, "global_step": 295980, "epoch": 2446} {"train_loss": -43.87849044799805, "global_step": 295981, "epoch": 2446} {"train_loss": -40.60847854614258, "global_step": 295982, "epoch": 2446} {"train_loss": -43.82696533203125, "global_step": 295983, "epoch": 2446} {"train_loss": -43.749996185302734, "global_step": 295984, "epoch": 2446} {"train_loss": -43.90129089355469, "global_step": 295985, "epoch": 2446} {"train_loss": -43.504573822021484, "global_step": 295986, "epoch": 2446} {"train_loss": -43.22583770751953, "global_step": 295987, "epoch": 2446} {"train_loss": -37.845298767089844, "global_step": 295988, "epoch": 2446} {"train_loss": -43.32882308959961, "global_step": 295989, "epoch": 2446} {"train_loss": -42.64150619506836, "global_step": 295990, "epoch": 2446} {"train_loss": -43.21357345581055, "global_step": 295991, "epoch": 2446} {"train_loss": -41.86346435546875, "global_step": 295992, "epoch": 2446} {"train_loss": -42.76251220703125, "global_step": 295993, "epoch": 2446} {"train_loss": -42.906768798828125, "global_step": 295994, "epoch": 2446} {"train_loss": -43.476776123046875, "global_step": 295995, "epoch": 2446} {"train_loss": -42.7645378112793, "global_step": 295996, "epoch": 2446} {"train_loss": -43.53706741333008, "global_step": 295997, "epoch": 2446} {"train_loss": -41.850399017333984, "global_step": 295998, "epoch": 2446} {"train_loss": -43.07206344604492, "global_step": 295999, "epoch": 2446} {"train_loss": -43.59943389892578, "global_step": 296000, "epoch": 2446} {"train_loss": -43.33595657348633, "global_step": 296001, "epoch": 2446} {"train_loss": -42.21958541870117, "global_step": 296002, "epoch": 2446} {"train_loss": -42.49539566040039, "global_step": 296003, "epoch": 2446} {"train_loss": -42.6278190612793, "global_step": 296004, "epoch": 2446} {"train_loss": -42.374969482421875, "global_step": 296005, "epoch": 2446} {"train_loss": -41.90020751953125, "global_step": 296006, "epoch": 2446} {"train_loss": -41.23689270019531, "global_step": 296007, "epoch": 2446} {"train_loss": -42.63549041748047, "global_step": 296008, "epoch": 2446} {"train_loss": -43.497047424316406, "global_step": 296009, "epoch": 2446} {"train_loss": -43.35591506958008, "global_step": 296010, "epoch": 2446} {"train_loss": -42.18501663208008, "global_step": 296011, "epoch": 2446} {"train_loss": -40.938720703125, "global_step": 296012, "epoch": 2446} {"train_loss": -43.304222106933594, "global_step": 296013, "epoch": 2446} {"train_loss": -43.31407165527344, "global_step": 296014, "epoch": 2446} {"train_loss": -42.45973205566406, "global_step": 296015, "epoch": 2446} {"train_loss": -42.78135299682617, "global_step": 296016, "epoch": 2446} {"train_loss": -42.80795669555664, "global_step": 296017, "epoch": 2446} {"train_loss": -42.1463737487793, "global_step": 296018, "epoch": 2446} {"train_loss": -42.74185562133789, "global_step": 296019, "epoch": 2446} {"train_loss": -42.74603271484375, "global_step": 296020, "epoch": 2446} {"train_loss": -42.92210006713867, "global_step": 296021, "epoch": 2446} {"train_loss": -43.24674606323242, "global_step": 296022, "epoch": 2446} {"train_loss": -34.77804183959961, "global_step": 296023, "epoch": 2446} {"train_loss": -43.04489517211914, "global_step": 296024, "epoch": 2446} {"train_loss": -41.039703369140625, "global_step": 296025, "epoch": 2446} {"train_loss": -42.4347038269043, "global_step": 296026, "epoch": 2446} {"train_loss": -43.249473571777344, "global_step": 296027, "epoch": 2446} {"train_loss": -42.72568893432617, "global_step": 296028, "epoch": 2446} {"train_loss": -41.39441680908203, "global_step": 296029, "epoch": 2446} {"train_loss": -40.8374137878418, "global_step": 296030, "epoch": 2446} {"train_loss": -42.743377685546875, "global_step": 296031, "epoch": 2446} {"train_loss": -42.77708053588867, "global_step": 296032, "epoch": 2446} {"train_loss": -43.449798583984375, "global_step": 296033, "epoch": 2446} {"train_loss": -40.35779571533203, "global_step": 296034, "epoch": 2446} {"train_loss": -40.132667541503906, "global_step": 296035, "epoch": 2446} {"train_loss": -39.78661346435547, "global_step": 296036, "epoch": 2446} {"train_loss": -42.1099739074707, "global_step": 296037, "epoch": 2446} {"train_loss": -31.540790557861328, "global_step": 296038, "epoch": 2446} {"train_loss": -39.1904411315918, "global_step": 296039, "epoch": 2446} {"train_loss": -37.468772888183594, "global_step": 296040, "epoch": 2446} {"train_loss": -37.31582260131836, "global_step": 296041, "epoch": 2446} {"train_loss": -40.34096908569336, "global_step": 296042, "epoch": 2446} {"train_loss": -39.017642974853516, "global_step": 296043, "epoch": 2446} {"train_loss": -39.1215934753418, "global_step": 296044, "epoch": 2446} {"train_loss": -38.4253044128418, "global_step": 296045, "epoch": 2446} {"train_loss": -38.7009391784668, "global_step": 296046, "epoch": 2446} {"train_loss": -40.81882095336914, "global_step": 296047, "epoch": 2446} {"train_loss": -40.3394889831543, "global_step": 296048, "epoch": 2446} {"train_loss": -37.61098861694336, "global_step": 296049, "epoch": 2446} {"train_loss": -37.81620788574219, "global_step": 296050, "epoch": 2446} {"train_loss": -32.37560272216797, "global_step": 296051, "epoch": 2446} {"train_loss": -41.26609802246094, "global_step": 296052, "epoch": 2446} {"train_loss": -40.44599151611328, "global_step": 296053, "epoch": 2446} {"train_loss": -41.14095687866211, "global_step": 296054, "epoch": 2446} {"train_loss": -39.147972106933594, "global_step": 296055, "epoch": 2446} {"train_loss": -39.68650436401367, "global_step": 296056, "epoch": 2446} {"train_loss": -36.502132415771484, "global_step": 296057, "epoch": 2446} {"train_loss": -35.91265869140625, "global_step": 296058, "epoch": 2446} {"train_loss": -38.88099670410156, "global_step": 296059, "epoch": 2446} {"train_loss": -41.79914093017578, "global_step": 296060, "epoch": 2446} {"train_loss": -40.72861862182617, "global_step": 296061, "epoch": 2446} {"train_loss": -41.25025939941406, "global_step": 296062, "epoch": 2446} {"train_loss": -39.17976760864258, "global_step": 296063, "epoch": 2446} {"train_loss": -40.91496658325195, "global_step": 296064, "epoch": 2446} {"train_loss": -39.31083297729492, "global_step": 296065, "epoch": 2446} {"train_loss": -40.288970947265625, "global_step": 296066, "epoch": 2446} {"train_loss": -39.95977783203125, "global_step": 296067, "epoch": 2446} {"train_loss": -38.907135009765625, "global_step": 296068, "epoch": 2446} {"train_loss": -40.739227294921875, "global_step": 296069, "epoch": 2446} {"train_loss": -42.09477615356445, "global_step": 296070, "epoch": 2446} {"train_loss": -41.98732376098633, "global_step": 296071, "epoch": 2446} {"train_loss": -41.718109130859375, "global_step": 296072, "epoch": 2446} {"train_loss": -35.604774475097656, "global_step": 296073, "epoch": 2446} {"train_loss": -41.2614631652832, "global_step": 296074, "epoch": 2446} {"train_loss": -40.96625518798828, "global_step": 296075, "epoch": 2446} {"train_loss": -40.6478157043457, "global_step": 296076, "epoch": 2446} {"train_loss": -41.27494430541992, "global_step": 296077, "epoch": 2446} {"train_loss": -39.68121337890625, "global_step": 296078, "epoch": 2446} {"train_loss": -41.39688491821289, "global_step": 296079, "epoch": 2446} {"train_loss": -40.868408203125, "global_step": 296080, "epoch": 2446} {"train_loss": -41.70390701293945, "global_step": 296081, "epoch": 2446} {"train_loss": -40.442352294921875, "global_step": 296082, "epoch": 2446} {"train_loss": -40.80381774902344, "global_step": 296083, "epoch": 2446} {"train_loss": -41.21067428588867, "global_step": 296084, "epoch": 2446} {"train_loss": -42.23401641845703, "global_step": 296085, "epoch": 2446} {"train_loss": -41.340849537494755, "global_step": 296086, "epoch": 2446, "val_loss": 2482610.25} {"train_loss": -41.71314239501953, "global_step": 296087, "epoch": 2447} {"train_loss": -40.835506439208984, "global_step": 296088, "epoch": 2447} {"train_loss": -41.488216400146484, "global_step": 296089, "epoch": 2447} {"train_loss": -41.845924377441406, "global_step": 296090, "epoch": 2447} {"train_loss": -41.3929557800293, "global_step": 296091, "epoch": 2447} {"train_loss": -42.16995620727539, "global_step": 296092, "epoch": 2447} {"train_loss": -40.382972717285156, "global_step": 296093, "epoch": 2447} {"train_loss": -42.13505172729492, "global_step": 296094, "epoch": 2447} {"train_loss": -41.178260803222656, "global_step": 296095, "epoch": 2447} {"train_loss": -41.606842041015625, "global_step": 296096, "epoch": 2447} {"train_loss": -41.94922637939453, "global_step": 296097, "epoch": 2447} {"train_loss": -39.65858840942383, "global_step": 296098, "epoch": 2447} {"train_loss": -40.674251556396484, "global_step": 296099, "epoch": 2447} {"train_loss": -41.77633285522461, "global_step": 296100, "epoch": 2447} {"train_loss": -41.21610641479492, "global_step": 296101, "epoch": 2447} {"train_loss": -42.141700744628906, "global_step": 296102, "epoch": 2447} {"train_loss": -42.28525924682617, "global_step": 296103, "epoch": 2447} {"train_loss": -42.15372848510742, "global_step": 296104, "epoch": 2447} {"train_loss": -41.925941467285156, "global_step": 296105, "epoch": 2447} {"train_loss": -41.57282257080078, "global_step": 296106, "epoch": 2447} {"train_loss": -41.419105529785156, "global_step": 296107, "epoch": 2447} {"train_loss": -42.25299835205078, "global_step": 296108, "epoch": 2447} {"train_loss": -41.59000778198242, "global_step": 296109, "epoch": 2447} {"train_loss": -41.8062629699707, "global_step": 296110, "epoch": 2447} {"train_loss": -42.36379623413086, "global_step": 296111, "epoch": 2447} {"train_loss": -40.995479583740234, "global_step": 296112, "epoch": 2447} {"train_loss": -42.098907470703125, "global_step": 296113, "epoch": 2447} {"train_loss": -41.89741897583008, "global_step": 296114, "epoch": 2447} {"train_loss": -42.2438850402832, "global_step": 296115, "epoch": 2447} {"train_loss": -42.153594970703125, "global_step": 296116, "epoch": 2447} {"train_loss": -41.25019836425781, "global_step": 296117, "epoch": 2447} {"train_loss": -42.27178955078125, "global_step": 296118, "epoch": 2447} {"train_loss": -42.38455581665039, "global_step": 296119, "epoch": 2447} {"train_loss": -41.80773162841797, "global_step": 296120, "epoch": 2447} {"train_loss": -42.890316009521484, "global_step": 296121, "epoch": 2447} {"train_loss": -42.11821746826172, "global_step": 296122, "epoch": 2447} {"train_loss": -41.619110107421875, "global_step": 296123, "epoch": 2447} {"train_loss": -42.948089599609375, "global_step": 296124, "epoch": 2447} {"train_loss": -42.49578094482422, "global_step": 296125, "epoch": 2447} {"train_loss": -41.38407516479492, "global_step": 296126, "epoch": 2447} {"train_loss": -41.90921401977539, "global_step": 296127, "epoch": 2447} {"train_loss": -42.66721725463867, "global_step": 296128, "epoch": 2447} {"train_loss": -42.69847106933594, "global_step": 296129, "epoch": 2447} {"train_loss": -42.59619140625, "global_step": 296130, "epoch": 2447} {"train_loss": -43.15989303588867, "global_step": 296131, "epoch": 2447} {"train_loss": -42.7229118347168, "global_step": 296132, "epoch": 2447} {"train_loss": -42.761592864990234, "global_step": 296133, "epoch": 2447} {"train_loss": -42.571998596191406, "global_step": 296134, "epoch": 2447} {"train_loss": -43.771663665771484, "global_step": 296135, "epoch": 2447} {"train_loss": -42.35368347167969, "global_step": 296136, "epoch": 2447} {"train_loss": -43.48268508911133, "global_step": 296137, "epoch": 2447} {"train_loss": -43.43680953979492, "global_step": 296138, "epoch": 2447} {"train_loss": -43.5584831237793, "global_step": 296139, "epoch": 2447} {"train_loss": -42.85921096801758, "global_step": 296140, "epoch": 2447} {"train_loss": -43.166805267333984, "global_step": 296141, "epoch": 2447} {"train_loss": -43.25120162963867, "global_step": 296142, "epoch": 2447} {"train_loss": -43.675777435302734, "global_step": 296143, "epoch": 2447} {"train_loss": -42.45210266113281, "global_step": 296144, "epoch": 2447} {"train_loss": -41.95039749145508, "global_step": 296145, "epoch": 2447} {"train_loss": -43.2097282409668, "global_step": 296146, "epoch": 2447} {"train_loss": -43.573543548583984, "global_step": 296147, "epoch": 2447} {"train_loss": -42.88412094116211, "global_step": 296148, "epoch": 2447} {"train_loss": -42.84572982788086, "global_step": 296149, "epoch": 2447} {"train_loss": -43.1834716796875, "global_step": 296150, "epoch": 2447} {"train_loss": -42.9620361328125, "global_step": 296151, "epoch": 2447} {"train_loss": -43.40851593017578, "global_step": 296152, "epoch": 2447} {"train_loss": -43.624969482421875, "global_step": 296153, "epoch": 2447} {"train_loss": -43.63307571411133, "global_step": 296154, "epoch": 2447} {"train_loss": -43.09832763671875, "global_step": 296155, "epoch": 2447} {"train_loss": -43.97452926635742, "global_step": 296156, "epoch": 2447} {"train_loss": -43.385250091552734, "global_step": 296157, "epoch": 2447} {"train_loss": -43.78105163574219, "global_step": 296158, "epoch": 2447} {"train_loss": -43.790401458740234, "global_step": 296159, "epoch": 2447} {"train_loss": -42.716182708740234, "global_step": 296160, "epoch": 2447} {"train_loss": -43.924903869628906, "global_step": 296161, "epoch": 2447} {"train_loss": -41.610042572021484, "global_step": 296162, "epoch": 2447} {"train_loss": -42.36610794067383, "global_step": 296163, "epoch": 2447} {"train_loss": -42.119869232177734, "global_step": 296164, "epoch": 2447} {"train_loss": -42.11625671386719, "global_step": 296165, "epoch": 2447} {"train_loss": -43.23244857788086, "global_step": 296166, "epoch": 2447} {"train_loss": -43.853858947753906, "global_step": 296167, "epoch": 2447} {"train_loss": -42.27555465698242, "global_step": 296168, "epoch": 2447} {"train_loss": -42.558101654052734, "global_step": 296169, "epoch": 2447} {"train_loss": -42.578407287597656, "global_step": 296170, "epoch": 2447} {"train_loss": -42.680946350097656, "global_step": 296171, "epoch": 2447} {"train_loss": -42.390716552734375, "global_step": 296172, "epoch": 2447} {"train_loss": -40.79376220703125, "global_step": 296173, "epoch": 2447} {"train_loss": -41.89005661010742, "global_step": 296174, "epoch": 2447} {"train_loss": -40.788917541503906, "global_step": 296175, "epoch": 2447} {"train_loss": -41.860450744628906, "global_step": 296176, "epoch": 2447} {"train_loss": -42.69869613647461, "global_step": 296177, "epoch": 2447} {"train_loss": -41.63956069946289, "global_step": 296178, "epoch": 2447} {"train_loss": -41.06239700317383, "global_step": 296179, "epoch": 2447} {"train_loss": -41.5255126953125, "global_step": 296180, "epoch": 2447} {"train_loss": -42.27848434448242, "global_step": 296181, "epoch": 2447} {"train_loss": -42.011680603027344, "global_step": 296182, "epoch": 2447} {"train_loss": -40.93670654296875, "global_step": 296183, "epoch": 2447} {"train_loss": -41.61186599731445, "global_step": 296184, "epoch": 2447} {"train_loss": -42.05270004272461, "global_step": 296185, "epoch": 2447} {"train_loss": -41.37690353393555, "global_step": 296186, "epoch": 2447} {"train_loss": -41.841590881347656, "global_step": 296187, "epoch": 2447} {"train_loss": -42.21664047241211, "global_step": 296188, "epoch": 2447} {"train_loss": -43.22516632080078, "global_step": 296189, "epoch": 2447} {"train_loss": -42.451171875, "global_step": 296190, "epoch": 2447} {"train_loss": -41.941829681396484, "global_step": 296191, "epoch": 2447} {"train_loss": -43.21017074584961, "global_step": 296192, "epoch": 2447} {"train_loss": -42.48026657104492, "global_step": 296193, "epoch": 2447} {"train_loss": -42.79737854003906, "global_step": 296194, "epoch": 2447} {"train_loss": -42.018707275390625, "global_step": 296195, "epoch": 2447} {"train_loss": -43.06570053100586, "global_step": 296196, "epoch": 2447} {"train_loss": -42.5892333984375, "global_step": 296197, "epoch": 2447} {"train_loss": -42.88355255126953, "global_step": 296198, "epoch": 2447} {"train_loss": -42.374412536621094, "global_step": 296199, "epoch": 2447} {"train_loss": -43.20403289794922, "global_step": 296200, "epoch": 2447} {"train_loss": -42.32822036743164, "global_step": 296201, "epoch": 2447} {"train_loss": -42.73769760131836, "global_step": 296202, "epoch": 2447} {"train_loss": -43.10696029663086, "global_step": 296203, "epoch": 2447} {"train_loss": -42.51946258544922, "global_step": 296204, "epoch": 2447} {"train_loss": -42.7835693359375, "global_step": 296205, "epoch": 2447} {"train_loss": -43.645267486572266, "global_step": 296206, "epoch": 2447} {"train_loss": -42.36115949015972, "global_step": 296207, "epoch": 2447, "val_loss": 2665204.75} {"train_loss": -42.9753532409668, "global_step": 296208, "epoch": 2448} {"train_loss": -43.07301712036133, "global_step": 296209, "epoch": 2448} {"train_loss": -43.1174201965332, "global_step": 296210, "epoch": 2448} {"train_loss": -43.07208251953125, "global_step": 296211, "epoch": 2448} {"train_loss": -42.839378356933594, "global_step": 296212, "epoch": 2448} {"train_loss": -42.862247467041016, "global_step": 296213, "epoch": 2448} {"train_loss": -42.60590744018555, "global_step": 296214, "epoch": 2448} {"train_loss": -42.69812774658203, "global_step": 296215, "epoch": 2448} {"train_loss": -43.56237030029297, "global_step": 296216, "epoch": 2448} {"train_loss": -43.51205062866211, "global_step": 296217, "epoch": 2448} {"train_loss": -42.69072723388672, "global_step": 296218, "epoch": 2448} {"train_loss": -41.8148078918457, "global_step": 296219, "epoch": 2448} {"train_loss": -43.31916427612305, "global_step": 296220, "epoch": 2448} {"train_loss": -42.73604965209961, "global_step": 296221, "epoch": 2448} {"train_loss": -41.8426628112793, "global_step": 296222, "epoch": 2448} {"train_loss": -42.14006042480469, "global_step": 296223, "epoch": 2448} {"train_loss": -42.80324172973633, "global_step": 296224, "epoch": 2448} {"train_loss": -43.711669921875, "global_step": 296225, "epoch": 2448} {"train_loss": -43.21609115600586, "global_step": 296226, "epoch": 2448} {"train_loss": -43.333839416503906, "global_step": 296227, "epoch": 2448} {"train_loss": -43.251991271972656, "global_step": 296228, "epoch": 2448} {"train_loss": -43.278709411621094, "global_step": 296229, "epoch": 2448} {"train_loss": -43.44257736206055, "global_step": 296230, "epoch": 2448} {"train_loss": -42.993465423583984, "global_step": 296231, "epoch": 2448} {"train_loss": -43.437843322753906, "global_step": 296232, "epoch": 2448} {"train_loss": -43.5963249206543, "global_step": 296233, "epoch": 2448} {"train_loss": -43.54016876220703, "global_step": 296234, "epoch": 2448} {"train_loss": -43.027610778808594, "global_step": 296235, "epoch": 2448} {"train_loss": -43.38082504272461, "global_step": 296236, "epoch": 2448} {"train_loss": -42.94447708129883, "global_step": 296237, "epoch": 2448} {"train_loss": -43.98495101928711, "global_step": 296238, "epoch": 2448} {"train_loss": -42.805519104003906, "global_step": 296239, "epoch": 2448} {"train_loss": -43.602622985839844, "global_step": 296240, "epoch": 2448} {"train_loss": -43.587947845458984, "global_step": 296241, "epoch": 2448} {"train_loss": -43.64265823364258, "global_step": 296242, "epoch": 2448} {"train_loss": -43.38617706298828, "global_step": 296243, "epoch": 2448} {"train_loss": -43.107940673828125, "global_step": 296244, "epoch": 2448} {"train_loss": -43.63581466674805, "global_step": 296245, "epoch": 2448} {"train_loss": -42.92206954956055, "global_step": 296246, "epoch": 2448} {"train_loss": -42.92772674560547, "global_step": 296247, "epoch": 2448} {"train_loss": -41.61553955078125, "global_step": 296248, "epoch": 2448} {"train_loss": -43.199623107910156, "global_step": 296249, "epoch": 2448} {"train_loss": -41.82833480834961, "global_step": 296250, "epoch": 2448} {"train_loss": -44.01628112792969, "global_step": 296251, "epoch": 2448} {"train_loss": -43.89591598510742, "global_step": 296252, "epoch": 2448} {"train_loss": -44.28985595703125, "global_step": 296253, "epoch": 2448} {"train_loss": -43.945438385009766, "global_step": 296254, "epoch": 2448} {"train_loss": -43.465938568115234, "global_step": 296255, "epoch": 2448} {"train_loss": -43.7432975769043, "global_step": 296256, "epoch": 2448} {"train_loss": -43.917415618896484, "global_step": 296257, "epoch": 2448} {"train_loss": -43.55015182495117, "global_step": 296258, "epoch": 2448} {"train_loss": -43.182613372802734, "global_step": 296259, "epoch": 2448} {"train_loss": -43.6695442199707, "global_step": 296260, "epoch": 2448} {"train_loss": -43.0733642578125, "global_step": 296261, "epoch": 2448} {"train_loss": -43.70016098022461, "global_step": 296262, "epoch": 2448} {"train_loss": -42.124080657958984, "global_step": 296263, "epoch": 2448} {"train_loss": -42.7796630859375, "global_step": 296264, "epoch": 2448} {"train_loss": -42.774349212646484, "global_step": 296265, "epoch": 2448} {"train_loss": -44.37457275390625, "global_step": 296266, "epoch": 2448} {"train_loss": -41.35322189331055, "global_step": 296267, "epoch": 2448} {"train_loss": -43.016700744628906, "global_step": 296268, "epoch": 2448} {"train_loss": -40.75291442871094, "global_step": 296269, "epoch": 2448} {"train_loss": -40.15328598022461, "global_step": 296270, "epoch": 2448} {"train_loss": -40.6190185546875, "global_step": 296271, "epoch": 2448} {"train_loss": -40.08858108520508, "global_step": 296272, "epoch": 2448} {"train_loss": -41.224327087402344, "global_step": 296273, "epoch": 2448} {"train_loss": -42.148681640625, "global_step": 296274, "epoch": 2448} {"train_loss": -42.20882797241211, "global_step": 296275, "epoch": 2448} {"train_loss": -40.404090881347656, "global_step": 296276, "epoch": 2448} {"train_loss": -39.499942779541016, "global_step": 296277, "epoch": 2448} {"train_loss": -42.02859115600586, "global_step": 296278, "epoch": 2448} {"train_loss": -41.14547348022461, "global_step": 296279, "epoch": 2448} {"train_loss": -40.540218353271484, "global_step": 296280, "epoch": 2448} {"train_loss": -42.680782318115234, "global_step": 296281, "epoch": 2448} {"train_loss": -42.320228576660156, "global_step": 296282, "epoch": 2448} {"train_loss": -42.27018737792969, "global_step": 296283, "epoch": 2448} {"train_loss": -42.020259857177734, "global_step": 296284, "epoch": 2448} {"train_loss": -41.88711166381836, "global_step": 296285, "epoch": 2448} {"train_loss": -42.16311264038086, "global_step": 296286, "epoch": 2448} {"train_loss": -42.90131759643555, "global_step": 296287, "epoch": 2448} {"train_loss": -41.81795120239258, "global_step": 296288, "epoch": 2448} {"train_loss": -43.2232780456543, "global_step": 296289, "epoch": 2448} {"train_loss": -43.117340087890625, "global_step": 296290, "epoch": 2448} {"train_loss": -42.40995407104492, "global_step": 296291, "epoch": 2448} {"train_loss": -40.99578094482422, "global_step": 296292, "epoch": 2448} {"train_loss": -42.8993034362793, "global_step": 296293, "epoch": 2448} {"train_loss": -43.39418029785156, "global_step": 296294, "epoch": 2448} {"train_loss": -42.47346878051758, "global_step": 296295, "epoch": 2448} {"train_loss": -43.56283187866211, "global_step": 296296, "epoch": 2448} {"train_loss": -42.56551742553711, "global_step": 296297, "epoch": 2448} {"train_loss": -41.34897232055664, "global_step": 296298, "epoch": 2448} {"train_loss": -42.45754623413086, "global_step": 296299, "epoch": 2448} {"train_loss": -43.388710021972656, "global_step": 296300, "epoch": 2448} {"train_loss": -42.488643646240234, "global_step": 296301, "epoch": 2448} {"train_loss": -43.37678909301758, "global_step": 296302, "epoch": 2448} {"train_loss": -43.04621505737305, "global_step": 296303, "epoch": 2448} {"train_loss": -41.97328567504883, "global_step": 296304, "epoch": 2448} {"train_loss": -42.55746078491211, "global_step": 296305, "epoch": 2448} {"train_loss": -42.74177551269531, "global_step": 296306, "epoch": 2448} {"train_loss": -43.00666046142578, "global_step": 296307, "epoch": 2448} {"train_loss": -42.671485900878906, "global_step": 296308, "epoch": 2448} {"train_loss": -42.72316360473633, "global_step": 296309, "epoch": 2448} {"train_loss": -43.622764587402344, "global_step": 296310, "epoch": 2448} {"train_loss": -43.24398422241211, "global_step": 296311, "epoch": 2448} {"train_loss": -42.81547927856445, "global_step": 296312, "epoch": 2448} {"train_loss": -43.20499801635742, "global_step": 296313, "epoch": 2448} {"train_loss": -42.32258987426758, "global_step": 296314, "epoch": 2448} {"train_loss": -42.201969146728516, "global_step": 296315, "epoch": 2448} {"train_loss": -43.16004943847656, "global_step": 296316, "epoch": 2448} {"train_loss": -42.98418426513672, "global_step": 296317, "epoch": 2448} {"train_loss": -42.1044807434082, "global_step": 296318, "epoch": 2448} {"train_loss": -43.256980895996094, "global_step": 296319, "epoch": 2448} {"train_loss": -42.442073822021484, "global_step": 296320, "epoch": 2448} {"train_loss": -43.249507904052734, "global_step": 296321, "epoch": 2448} {"train_loss": -43.118656158447266, "global_step": 296322, "epoch": 2448} {"train_loss": -42.47566223144531, "global_step": 296323, "epoch": 2448} {"train_loss": -43.63373565673828, "global_step": 296324, "epoch": 2448} {"train_loss": -43.297996520996094, "global_step": 296325, "epoch": 2448} {"train_loss": -43.99082565307617, "global_step": 296326, "epoch": 2448} {"train_loss": -43.35299301147461, "global_step": 296327, "epoch": 2448} {"train_loss": -42.77011433120602, "global_step": 296328, "epoch": 2448, "val_loss": 2639730.25} {"train_loss": -43.15796661376953, "global_step": 296329, "epoch": 2449} {"train_loss": -43.22443389892578, "global_step": 296330, "epoch": 2449} {"train_loss": -43.10185241699219, "global_step": 296331, "epoch": 2449} {"train_loss": -43.106685638427734, "global_step": 296332, "epoch": 2449} {"train_loss": -43.02234649658203, "global_step": 296333, "epoch": 2449} {"train_loss": -43.25180435180664, "global_step": 296334, "epoch": 2449} {"train_loss": -42.87519454956055, "global_step": 296335, "epoch": 2449} {"train_loss": -43.24039077758789, "global_step": 296336, "epoch": 2449} {"train_loss": -43.687904357910156, "global_step": 296337, "epoch": 2449} {"train_loss": -43.33488082885742, "global_step": 296338, "epoch": 2449} {"train_loss": -43.30394744873047, "global_step": 296339, "epoch": 2449} {"train_loss": -43.32235336303711, "global_step": 296340, "epoch": 2449} {"train_loss": -42.913421630859375, "global_step": 296341, "epoch": 2449} {"train_loss": -42.479244232177734, "global_step": 296342, "epoch": 2449} {"train_loss": -29.987058639526367, "global_step": 296343, "epoch": 2449} {"train_loss": -42.426841735839844, "global_step": 296344, "epoch": 2449} {"train_loss": -41.78705978393555, "global_step": 296345, "epoch": 2449} {"train_loss": -28.367002487182617, "global_step": 296346, "epoch": 2449} {"train_loss": -35.85055160522461, "global_step": 296347, "epoch": 2449} {"train_loss": -13.845885276794434, "global_step": 296348, "epoch": 2449} {"train_loss": -35.880218505859375, "global_step": 296349, "epoch": 2449} {"train_loss": -39.83231735229492, "global_step": 296350, "epoch": 2449} {"train_loss": -38.53900909423828, "global_step": 296351, "epoch": 2449} {"train_loss": -35.67832565307617, "global_step": 296352, "epoch": 2449} {"train_loss": -32.74116897583008, "global_step": 296353, "epoch": 2449} {"train_loss": -37.4945182800293, "global_step": 296354, "epoch": 2449} {"train_loss": -26.606786727905273, "global_step": 296355, "epoch": 2449} {"train_loss": -34.68549728393555, "global_step": 296356, "epoch": 2449} {"train_loss": -37.66718673706055, "global_step": 296357, "epoch": 2449} {"train_loss": -38.111934661865234, "global_step": 296358, "epoch": 2449} {"train_loss": -39.2008171081543, "global_step": 296359, "epoch": 2449} {"train_loss": -36.32482147216797, "global_step": 296360, "epoch": 2449} {"train_loss": -38.98484420776367, "global_step": 296361, "epoch": 2449} {"train_loss": -34.120399475097656, "global_step": 296362, "epoch": 2449} {"train_loss": -37.59326171875, "global_step": 296363, "epoch": 2449} {"train_loss": -35.36019515991211, "global_step": 296364, "epoch": 2449} {"train_loss": -36.20257568359375, "global_step": 296365, "epoch": 2449} {"train_loss": -25.0493221282959, "global_step": 296366, "epoch": 2449} {"train_loss": -37.81121826171875, "global_step": 296367, "epoch": 2449} {"train_loss": -38.83596420288086, "global_step": 296368, "epoch": 2449} {"train_loss": -36.339149475097656, "global_step": 296369, "epoch": 2449} {"train_loss": -35.589637756347656, "global_step": 296370, "epoch": 2449} {"train_loss": -35.77455520629883, "global_step": 296371, "epoch": 2449} {"train_loss": -38.35224151611328, "global_step": 296372, "epoch": 2449} {"train_loss": -38.86431121826172, "global_step": 296373, "epoch": 2449} {"train_loss": -37.643280029296875, "global_step": 296374, "epoch": 2449} {"train_loss": -35.170143127441406, "global_step": 296375, "epoch": 2449} {"train_loss": -37.21181869506836, "global_step": 296376, "epoch": 2449} {"train_loss": -33.97634506225586, "global_step": 296377, "epoch": 2449} {"train_loss": -39.520477294921875, "global_step": 296378, "epoch": 2449} {"train_loss": -37.50443649291992, "global_step": 296379, "epoch": 2449} {"train_loss": -39.13540267944336, "global_step": 296380, "epoch": 2449} {"train_loss": -37.928321838378906, "global_step": 296381, "epoch": 2449} {"train_loss": -40.03782272338867, "global_step": 296382, "epoch": 2449} {"train_loss": -39.77152633666992, "global_step": 296383, "epoch": 2449} {"train_loss": -39.25791549682617, "global_step": 296384, "epoch": 2449} {"train_loss": -40.714134216308594, "global_step": 296385, "epoch": 2449} {"train_loss": -38.770599365234375, "global_step": 296386, "epoch": 2449} {"train_loss": -40.02153396606445, "global_step": 296387, "epoch": 2449} {"train_loss": -39.07326889038086, "global_step": 296388, "epoch": 2449} {"train_loss": -39.13154602050781, "global_step": 296389, "epoch": 2449} {"train_loss": -38.6971435546875, "global_step": 296390, "epoch": 2449} {"train_loss": -38.64788818359375, "global_step": 296391, "epoch": 2449} {"train_loss": -40.15058517456055, "global_step": 296392, "epoch": 2449} {"train_loss": -40.65399169921875, "global_step": 296393, "epoch": 2449} {"train_loss": -39.1209602355957, "global_step": 296394, "epoch": 2449} {"train_loss": -40.45386505126953, "global_step": 296395, "epoch": 2449} {"train_loss": -40.35792541503906, "global_step": 296396, "epoch": 2449} {"train_loss": -40.01988220214844, "global_step": 296397, "epoch": 2449} {"train_loss": -39.996734619140625, "global_step": 296398, "epoch": 2449} {"train_loss": -39.623924255371094, "global_step": 296399, "epoch": 2449} {"train_loss": -40.67264938354492, "global_step": 296400, "epoch": 2449} {"train_loss": -40.25667953491211, "global_step": 296401, "epoch": 2449} {"train_loss": -40.11704635620117, "global_step": 296402, "epoch": 2449} {"train_loss": -40.3107795715332, "global_step": 296403, "epoch": 2449} {"train_loss": -40.16645431518555, "global_step": 296404, "epoch": 2449} {"train_loss": -41.11300277709961, "global_step": 296405, "epoch": 2449} {"train_loss": -40.74263381958008, "global_step": 296406, "epoch": 2449} {"train_loss": -41.257171630859375, "global_step": 296407, "epoch": 2449} {"train_loss": -41.31864547729492, "global_step": 296408, "epoch": 2449} {"train_loss": -41.164894104003906, "global_step": 296409, "epoch": 2449} {"train_loss": -41.0345344543457, "global_step": 296410, "epoch": 2449} {"train_loss": -41.27897262573242, "global_step": 296411, "epoch": 2449} {"train_loss": -40.89994430541992, "global_step": 296412, "epoch": 2449} {"train_loss": -40.28428268432617, "global_step": 296413, "epoch": 2449} {"train_loss": -41.270973205566406, "global_step": 296414, "epoch": 2449} {"train_loss": -41.44895935058594, "global_step": 296415, "epoch": 2449} {"train_loss": -40.89515686035156, "global_step": 296416, "epoch": 2449} {"train_loss": -40.83033752441406, "global_step": 296417, "epoch": 2449} {"train_loss": -41.42795944213867, "global_step": 296418, "epoch": 2449} {"train_loss": -41.09519577026367, "global_step": 296419, "epoch": 2449} {"train_loss": -41.5495719909668, "global_step": 296420, "epoch": 2449} {"train_loss": -42.27088165283203, "global_step": 296421, "epoch": 2449} {"train_loss": -41.74813461303711, "global_step": 296422, "epoch": 2449} {"train_loss": -41.70589065551758, "global_step": 296423, "epoch": 2449} {"train_loss": -40.96749496459961, "global_step": 296424, "epoch": 2449} {"train_loss": -42.36260223388672, "global_step": 296425, "epoch": 2449} {"train_loss": -42.53334045410156, "global_step": 296426, "epoch": 2449} {"train_loss": -41.93976974487305, "global_step": 296427, "epoch": 2449} {"train_loss": -41.24507141113281, "global_step": 296428, "epoch": 2449} {"train_loss": -41.81587600708008, "global_step": 296429, "epoch": 2449} {"train_loss": -41.42678451538086, "global_step": 296430, "epoch": 2449} {"train_loss": -42.73606491088867, "global_step": 296431, "epoch": 2449} {"train_loss": -41.27802658081055, "global_step": 296432, "epoch": 2449} {"train_loss": -42.44169998168945, "global_step": 296433, "epoch": 2449} {"train_loss": -41.55534362792969, "global_step": 296434, "epoch": 2449} {"train_loss": -42.55494689941406, "global_step": 296435, "epoch": 2449} {"train_loss": -41.936012268066406, "global_step": 296436, "epoch": 2449} {"train_loss": -42.068233489990234, "global_step": 296437, "epoch": 2449} {"train_loss": -41.56209945678711, "global_step": 296438, "epoch": 2449} {"train_loss": -42.02587890625, "global_step": 296439, "epoch": 2449} {"train_loss": -41.81145477294922, "global_step": 296440, "epoch": 2449} {"train_loss": -41.82917404174805, "global_step": 296441, "epoch": 2449} {"train_loss": -42.01349639892578, "global_step": 296442, "epoch": 2449} {"train_loss": -42.37128829956055, "global_step": 296443, "epoch": 2449} {"train_loss": -42.4223518371582, "global_step": 296444, "epoch": 2449} {"train_loss": -42.56673812866211, "global_step": 296445, "epoch": 2449} {"train_loss": -43.321407318115234, "global_step": 296446, "epoch": 2449} {"train_loss": -42.57366943359375, "global_step": 296447, "epoch": 2449} {"train_loss": -42.00002670288086, "global_step": 296448, "epoch": 2449} {"train_loss": -39.581448413123766, "global_step": 296449, "epoch": 2449, "val_loss": 2512915.75} {"train_loss": -42.10539627075195, "global_step": 296450, "epoch": 2450} {"train_loss": -42.03998565673828, "global_step": 296451, "epoch": 2450} {"train_loss": -41.98604202270508, "global_step": 296452, "epoch": 2450} {"train_loss": -42.340248107910156, "global_step": 296453, "epoch": 2450} {"train_loss": -42.447723388671875, "global_step": 296454, "epoch": 2450} {"train_loss": -43.15512466430664, "global_step": 296455, "epoch": 2450} {"train_loss": -43.26619338989258, "global_step": 296456, "epoch": 2450} {"train_loss": -42.82461166381836, "global_step": 296457, "epoch": 2450} {"train_loss": -43.454769134521484, "global_step": 296458, "epoch": 2450} {"train_loss": -42.34443283081055, "global_step": 296459, "epoch": 2450} {"train_loss": -41.380489349365234, "global_step": 296460, "epoch": 2450} {"train_loss": -41.92079544067383, "global_step": 296461, "epoch": 2450} {"train_loss": -43.31501388549805, "global_step": 296462, "epoch": 2450} {"train_loss": -43.071624755859375, "global_step": 296463, "epoch": 2450} {"train_loss": -43.27166748046875, "global_step": 296464, "epoch": 2450} {"train_loss": -42.82906723022461, "global_step": 296465, "epoch": 2450} {"train_loss": -42.401588439941406, "global_step": 296466, "epoch": 2450} {"train_loss": -43.38386154174805, "global_step": 296467, "epoch": 2450} {"train_loss": -42.611690521240234, "global_step": 296468, "epoch": 2450} {"train_loss": -42.99880599975586, "global_step": 296469, "epoch": 2450} {"train_loss": -42.87934494018555, "global_step": 296470, "epoch": 2450} {"train_loss": -42.39915084838867, "global_step": 296471, "epoch": 2450} {"train_loss": -42.821407318115234, "global_step": 296472, "epoch": 2450} {"train_loss": -42.16494369506836, "global_step": 296473, "epoch": 2450} {"train_loss": -42.7572135925293, "global_step": 296474, "epoch": 2450} {"train_loss": -43.040672302246094, "global_step": 296475, "epoch": 2450} {"train_loss": -42.70610427856445, "global_step": 296476, "epoch": 2450} {"train_loss": -42.47706985473633, "global_step": 296477, "epoch": 2450} {"train_loss": -43.07184982299805, "global_step": 296478, "epoch": 2450} {"train_loss": -42.97184371948242, "global_step": 296479, "epoch": 2450} {"train_loss": -42.9536247253418, "global_step": 296480, "epoch": 2450} {"train_loss": -43.5866813659668, "global_step": 296481, "epoch": 2450} {"train_loss": -43.16423416137695, "global_step": 296482, "epoch": 2450} {"train_loss": -43.0795783996582, "global_step": 296483, "epoch": 2450} {"train_loss": -43.22408676147461, "global_step": 296484, "epoch": 2450} {"train_loss": -42.79420852661133, "global_step": 296485, "epoch": 2450} {"train_loss": -43.07974624633789, "global_step": 296486, "epoch": 2450} {"train_loss": -43.23405838012695, "global_step": 296487, "epoch": 2450} {"train_loss": -43.80905532836914, "global_step": 296488, "epoch": 2450} {"train_loss": -43.51780700683594, "global_step": 296489, "epoch": 2450} {"train_loss": -43.29841232299805, "global_step": 296490, "epoch": 2450} {"train_loss": -43.65625, "global_step": 296491, "epoch": 2450} {"train_loss": -43.633338928222656, "global_step": 296492, "epoch": 2450} {"train_loss": -43.52791976928711, "global_step": 296493, "epoch": 2450} {"train_loss": -43.416725158691406, "global_step": 296494, "epoch": 2450} {"train_loss": -43.41731262207031, "global_step": 296495, "epoch": 2450} {"train_loss": -43.13098907470703, "global_step": 296496, "epoch": 2450} {"train_loss": -43.4248046875, "global_step": 296497, "epoch": 2450} {"train_loss": -43.396541595458984, "global_step": 296498, "epoch": 2450} {"train_loss": -44.11588668823242, "global_step": 296499, "epoch": 2450} {"train_loss": -43.7608642578125, "global_step": 296500, "epoch": 2450} {"train_loss": -43.397186279296875, "global_step": 296501, "epoch": 2450} {"train_loss": -41.644996643066406, "global_step": 296502, "epoch": 2450} {"train_loss": -43.12327194213867, "global_step": 296503, "epoch": 2450} {"train_loss": -42.98203659057617, "global_step": 296504, "epoch": 2450} {"train_loss": -42.767852783203125, "global_step": 296505, "epoch": 2450} {"train_loss": -42.79619216918945, "global_step": 296506, "epoch": 2450} {"train_loss": -43.393245697021484, "global_step": 296507, "epoch": 2450} {"train_loss": -43.09602737426758, "global_step": 296508, "epoch": 2450} {"train_loss": -43.378456115722656, "global_step": 296509, "epoch": 2450} {"train_loss": -42.39564895629883, "global_step": 296510, "epoch": 2450} {"train_loss": -40.82612228393555, "global_step": 296511, "epoch": 2450} {"train_loss": -37.14066696166992, "global_step": 296512, "epoch": 2450} {"train_loss": -29.230792999267578, "global_step": 296513, "epoch": 2450} {"train_loss": -23.46527671813965, "global_step": 296514, "epoch": 2450} {"train_loss": -35.620975494384766, "global_step": 296515, "epoch": 2450} {"train_loss": -38.231685638427734, "global_step": 296516, "epoch": 2450} {"train_loss": -39.32874298095703, "global_step": 296517, "epoch": 2450} {"train_loss": -35.23387908935547, "global_step": 296518, "epoch": 2450} {"train_loss": -41.19260787963867, "global_step": 296519, "epoch": 2450} {"train_loss": -37.18781661987305, "global_step": 296520, "epoch": 2450} {"train_loss": -39.53996276855469, "global_step": 296521, "epoch": 2450} {"train_loss": -39.35246276855469, "global_step": 296522, "epoch": 2450} {"train_loss": -36.99748229980469, "global_step": 296523, "epoch": 2450} {"train_loss": -40.15653610229492, "global_step": 296524, "epoch": 2450} {"train_loss": -35.49211502075195, "global_step": 296525, "epoch": 2450} {"train_loss": -39.58882522583008, "global_step": 296526, "epoch": 2450} {"train_loss": -37.48464584350586, "global_step": 296527, "epoch": 2450} {"train_loss": -39.254180908203125, "global_step": 296528, "epoch": 2450} {"train_loss": -40.46546936035156, "global_step": 296529, "epoch": 2450} {"train_loss": -37.8203010559082, "global_step": 296530, "epoch": 2450} {"train_loss": -41.659271240234375, "global_step": 296531, "epoch": 2450} {"train_loss": -39.509765625, "global_step": 296532, "epoch": 2450} {"train_loss": -39.754085540771484, "global_step": 296533, "epoch": 2450} {"train_loss": -41.924560546875, "global_step": 296534, "epoch": 2450} {"train_loss": -39.894832611083984, "global_step": 296535, "epoch": 2450} {"train_loss": -40.98011016845703, "global_step": 296536, "epoch": 2450} {"train_loss": -42.00249481201172, "global_step": 296537, "epoch": 2450} {"train_loss": -41.23542404174805, "global_step": 296538, "epoch": 2450} {"train_loss": -41.3554801940918, "global_step": 296539, "epoch": 2450} {"train_loss": -42.11414337158203, "global_step": 296540, "epoch": 2450} {"train_loss": -42.037105560302734, "global_step": 296541, "epoch": 2450} {"train_loss": -41.00774002075195, "global_step": 296542, "epoch": 2450} {"train_loss": -41.942955017089844, "global_step": 296543, "epoch": 2450} {"train_loss": -42.710906982421875, "global_step": 296544, "epoch": 2450} {"train_loss": -41.65644454956055, "global_step": 296545, "epoch": 2450} {"train_loss": -42.30451202392578, "global_step": 296546, "epoch": 2450} {"train_loss": -42.228424072265625, "global_step": 296547, "epoch": 2450} {"train_loss": -41.295318603515625, "global_step": 296548, "epoch": 2450} {"train_loss": -42.14823913574219, "global_step": 296549, "epoch": 2450} {"train_loss": -41.827274322509766, "global_step": 296550, "epoch": 2450} {"train_loss": -41.96826934814453, "global_step": 296551, "epoch": 2450} {"train_loss": -42.60858154296875, "global_step": 296552, "epoch": 2450} {"train_loss": -42.89089584350586, "global_step": 296553, "epoch": 2450} {"train_loss": -42.688880920410156, "global_step": 296554, "epoch": 2450} {"train_loss": -42.27365493774414, "global_step": 296555, "epoch": 2450} {"train_loss": -41.996891021728516, "global_step": 296556, "epoch": 2450} {"train_loss": -41.56641387939453, "global_step": 296557, "epoch": 2450} {"train_loss": -42.33864212036133, "global_step": 296558, "epoch": 2450} {"train_loss": -42.24892044067383, "global_step": 296559, "epoch": 2450} {"train_loss": -43.017295837402344, "global_step": 296560, "epoch": 2450} {"train_loss": -42.49283981323242, "global_step": 296561, "epoch": 2450} {"train_loss": -42.45963668823242, "global_step": 296562, "epoch": 2450} {"train_loss": -43.2684440612793, "global_step": 296563, "epoch": 2450} {"train_loss": -42.8496208190918, "global_step": 296564, "epoch": 2450} {"train_loss": -42.55424118041992, "global_step": 296565, "epoch": 2450} {"train_loss": -43.38082504272461, "global_step": 296566, "epoch": 2450} {"train_loss": -42.89644241333008, "global_step": 296567, "epoch": 2450} {"train_loss": -42.987831115722656, "global_step": 296568, "epoch": 2450} {"train_loss": -42.99482345581055, "global_step": 296569, "epoch": 2450} {"train_loss": -41.71026407982692, "global_step": 296570, "epoch": 2450, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2596634.0} {"train_loss": -43.206233978271484, "global_step": 296571, "epoch": 2451} {"train_loss": -43.18333053588867, "global_step": 296572, "epoch": 2451} {"train_loss": -43.697383880615234, "global_step": 296573, "epoch": 2451} {"train_loss": -43.22304916381836, "global_step": 296574, "epoch": 2451} {"train_loss": -42.811004638671875, "global_step": 296575, "epoch": 2451} {"train_loss": -43.626426696777344, "global_step": 296576, "epoch": 2451} {"train_loss": -43.414798736572266, "global_step": 296577, "epoch": 2451} {"train_loss": -42.919456481933594, "global_step": 296578, "epoch": 2451} {"train_loss": -43.7744255065918, "global_step": 296579, "epoch": 2451} {"train_loss": -43.61483383178711, "global_step": 296580, "epoch": 2451} {"train_loss": -43.587215423583984, "global_step": 296581, "epoch": 2451} {"train_loss": -42.96317672729492, "global_step": 296582, "epoch": 2451} {"train_loss": -43.58889389038086, "global_step": 296583, "epoch": 2451} {"train_loss": -43.70874786376953, "global_step": 296584, "epoch": 2451} {"train_loss": -44.38872146606445, "global_step": 296585, "epoch": 2451} {"train_loss": -44.07606506347656, "global_step": 296586, "epoch": 2451} {"train_loss": -44.13743209838867, "global_step": 296587, "epoch": 2451} {"train_loss": -43.4525032043457, "global_step": 296588, "epoch": 2451} {"train_loss": -43.437679290771484, "global_step": 296589, "epoch": 2451} {"train_loss": -44.144989013671875, "global_step": 296590, "epoch": 2451} {"train_loss": -43.69731521606445, "global_step": 296591, "epoch": 2451} {"train_loss": -43.17037582397461, "global_step": 296592, "epoch": 2451} {"train_loss": -44.120426177978516, "global_step": 296593, "epoch": 2451} {"train_loss": -43.64945602416992, "global_step": 296594, "epoch": 2451} {"train_loss": -43.545021057128906, "global_step": 296595, "epoch": 2451} {"train_loss": -43.748043060302734, "global_step": 296596, "epoch": 2451} {"train_loss": -43.03763961791992, "global_step": 296597, "epoch": 2451} {"train_loss": -44.00740432739258, "global_step": 296598, "epoch": 2451} {"train_loss": -44.34212875366211, "global_step": 296599, "epoch": 2451} {"train_loss": -42.76224899291992, "global_step": 296600, "epoch": 2451} {"train_loss": -42.755855560302734, "global_step": 296601, "epoch": 2451} {"train_loss": -40.7154541015625, "global_step": 296602, "epoch": 2451} {"train_loss": -39.251277923583984, "global_step": 296603, "epoch": 2451} {"train_loss": -39.105926513671875, "global_step": 296604, "epoch": 2451} {"train_loss": -39.64231491088867, "global_step": 296605, "epoch": 2451} {"train_loss": -40.58835983276367, "global_step": 296606, "epoch": 2451} {"train_loss": -41.65249252319336, "global_step": 296607, "epoch": 2451} {"train_loss": -41.96418380737305, "global_step": 296608, "epoch": 2451} {"train_loss": -42.41259765625, "global_step": 296609, "epoch": 2451} {"train_loss": -41.53092575073242, "global_step": 296610, "epoch": 2451} {"train_loss": -39.16230392456055, "global_step": 296611, "epoch": 2451} {"train_loss": -35.17684555053711, "global_step": 296612, "epoch": 2451} {"train_loss": -39.09123992919922, "global_step": 296613, "epoch": 2451} {"train_loss": -40.20846176147461, "global_step": 296614, "epoch": 2451} {"train_loss": -41.72571563720703, "global_step": 296615, "epoch": 2451} {"train_loss": -37.329185485839844, "global_step": 296616, "epoch": 2451} {"train_loss": -41.779415130615234, "global_step": 296617, "epoch": 2451} {"train_loss": -40.88652038574219, "global_step": 296618, "epoch": 2451} {"train_loss": -40.70095443725586, "global_step": 296619, "epoch": 2451} {"train_loss": -40.500404357910156, "global_step": 296620, "epoch": 2451} {"train_loss": -42.658424377441406, "global_step": 296621, "epoch": 2451} {"train_loss": -40.683773040771484, "global_step": 296622, "epoch": 2451} {"train_loss": -41.664546966552734, "global_step": 296623, "epoch": 2451} {"train_loss": -41.724945068359375, "global_step": 296624, "epoch": 2451} {"train_loss": -39.8241081237793, "global_step": 296625, "epoch": 2451} {"train_loss": -42.67424392700195, "global_step": 296626, "epoch": 2451} {"train_loss": -39.63444900512695, "global_step": 296627, "epoch": 2451} {"train_loss": -40.505889892578125, "global_step": 296628, "epoch": 2451} {"train_loss": -41.7492790222168, "global_step": 296629, "epoch": 2451} {"train_loss": -38.668190002441406, "global_step": 296630, "epoch": 2451} {"train_loss": -42.0973014831543, "global_step": 296631, "epoch": 2451} {"train_loss": -39.37345504760742, "global_step": 296632, "epoch": 2451} {"train_loss": -41.58747482299805, "global_step": 296633, "epoch": 2451} {"train_loss": -40.72722244262695, "global_step": 296634, "epoch": 2451} {"train_loss": -40.29290771484375, "global_step": 296635, "epoch": 2451} {"train_loss": -41.61724853515625, "global_step": 296636, "epoch": 2451} {"train_loss": -41.80632400512695, "global_step": 296637, "epoch": 2451} {"train_loss": -41.37221908569336, "global_step": 296638, "epoch": 2451} {"train_loss": -42.630332946777344, "global_step": 296639, "epoch": 2451} {"train_loss": -42.00798797607422, "global_step": 296640, "epoch": 2451} {"train_loss": -42.10679244995117, "global_step": 296641, "epoch": 2451} {"train_loss": -42.50381851196289, "global_step": 296642, "epoch": 2451} {"train_loss": -42.77346420288086, "global_step": 296643, "epoch": 2451} {"train_loss": -43.019500732421875, "global_step": 296644, "epoch": 2451} {"train_loss": -41.9085807800293, "global_step": 296645, "epoch": 2451} {"train_loss": -43.00310134887695, "global_step": 296646, "epoch": 2451} {"train_loss": -42.400142669677734, "global_step": 296647, "epoch": 2451} {"train_loss": -42.54016876220703, "global_step": 296648, "epoch": 2451} {"train_loss": -42.77311325073242, "global_step": 296649, "epoch": 2451} {"train_loss": -42.262916564941406, "global_step": 296650, "epoch": 2451} {"train_loss": -43.12268829345703, "global_step": 296651, "epoch": 2451} {"train_loss": -43.00990295410156, "global_step": 296652, "epoch": 2451} {"train_loss": -43.25930404663086, "global_step": 296653, "epoch": 2451} {"train_loss": -43.07171630859375, "global_step": 296654, "epoch": 2451} {"train_loss": -43.157264709472656, "global_step": 296655, "epoch": 2451} {"train_loss": -42.86885452270508, "global_step": 296656, "epoch": 2451} {"train_loss": -43.67615509033203, "global_step": 296657, "epoch": 2451} {"train_loss": -43.04597091674805, "global_step": 296658, "epoch": 2451} {"train_loss": -42.92818832397461, "global_step": 296659, "epoch": 2451} {"train_loss": -42.991661071777344, "global_step": 296660, "epoch": 2451} {"train_loss": -44.17240524291992, "global_step": 296661, "epoch": 2451} {"train_loss": -43.42987060546875, "global_step": 296662, "epoch": 2451} {"train_loss": -43.07928466796875, "global_step": 296663, "epoch": 2451} {"train_loss": -43.688987731933594, "global_step": 296664, "epoch": 2451} {"train_loss": -44.334415435791016, "global_step": 296665, "epoch": 2451} {"train_loss": -43.51303482055664, "global_step": 296666, "epoch": 2451} {"train_loss": -43.73622131347656, "global_step": 296667, "epoch": 2451} {"train_loss": -43.83298873901367, "global_step": 296668, "epoch": 2451} {"train_loss": -43.48298263549805, "global_step": 296669, "epoch": 2451} {"train_loss": -43.59220504760742, "global_step": 296670, "epoch": 2451} {"train_loss": -43.5251579284668, "global_step": 296671, "epoch": 2451} {"train_loss": -43.84124755859375, "global_step": 296672, "epoch": 2451} {"train_loss": -43.6128044128418, "global_step": 296673, "epoch": 2451} {"train_loss": -44.394256591796875, "global_step": 296674, "epoch": 2451} {"train_loss": -44.291770935058594, "global_step": 296675, "epoch": 2451} {"train_loss": -43.422237396240234, "global_step": 296676, "epoch": 2451} {"train_loss": -43.544952392578125, "global_step": 296677, "epoch": 2451} {"train_loss": -44.25435256958008, "global_step": 296678, "epoch": 2451} {"train_loss": -44.091121673583984, "global_step": 296679, "epoch": 2451} {"train_loss": -44.03580856323242, "global_step": 296680, "epoch": 2451} {"train_loss": -43.95510482788086, "global_step": 296681, "epoch": 2451} {"train_loss": -44.06147003173828, "global_step": 296682, "epoch": 2451} {"train_loss": -44.152000427246094, "global_step": 296683, "epoch": 2451} {"train_loss": -43.93073654174805, "global_step": 296684, "epoch": 2451} {"train_loss": -43.77180480957031, "global_step": 296685, "epoch": 2451} {"train_loss": -44.106929779052734, "global_step": 296686, "epoch": 2451} {"train_loss": -44.00250244140625, "global_step": 296687, "epoch": 2451} {"train_loss": -43.60450744628906, "global_step": 296688, "epoch": 2451} {"train_loss": -42.77901840209961, "global_step": 296689, "epoch": 2451} {"train_loss": -42.11155319213867, "global_step": 296690, "epoch": 2451} {"train_loss": -42.54127225008878, "global_step": 296691, "epoch": 2451, "val_loss": 2587451.0} {"train_loss": -42.04341125488281, "global_step": 296692, "epoch": 2452} {"train_loss": -41.111480712890625, "global_step": 296693, "epoch": 2452} {"train_loss": -41.07859420776367, "global_step": 296694, "epoch": 2452} {"train_loss": -40.88193130493164, "global_step": 296695, "epoch": 2452} {"train_loss": -42.7627067565918, "global_step": 296696, "epoch": 2452} {"train_loss": -43.671241760253906, "global_step": 296697, "epoch": 2452} {"train_loss": -43.921627044677734, "global_step": 296698, "epoch": 2452} {"train_loss": -42.66816329956055, "global_step": 296699, "epoch": 2452} {"train_loss": -43.285213470458984, "global_step": 296700, "epoch": 2452} {"train_loss": -43.31404113769531, "global_step": 296701, "epoch": 2452} {"train_loss": -43.52676010131836, "global_step": 296702, "epoch": 2452} {"train_loss": -42.7770881652832, "global_step": 296703, "epoch": 2452} {"train_loss": -42.94382858276367, "global_step": 296704, "epoch": 2452} {"train_loss": -43.601844787597656, "global_step": 296705, "epoch": 2452} {"train_loss": -43.39432144165039, "global_step": 296706, "epoch": 2452} {"train_loss": -43.26567459106445, "global_step": 296707, "epoch": 2452} {"train_loss": -43.379112243652344, "global_step": 296708, "epoch": 2452} {"train_loss": -43.67609786987305, "global_step": 296709, "epoch": 2452} {"train_loss": -42.697349548339844, "global_step": 296710, "epoch": 2452} {"train_loss": -42.54374313354492, "global_step": 296711, "epoch": 2452} {"train_loss": -43.426483154296875, "global_step": 296712, "epoch": 2452} {"train_loss": -42.48158264160156, "global_step": 296713, "epoch": 2452} {"train_loss": -41.80002975463867, "global_step": 296714, "epoch": 2452} {"train_loss": -42.790103912353516, "global_step": 296715, "epoch": 2452} {"train_loss": -43.16559600830078, "global_step": 296716, "epoch": 2452} {"train_loss": -42.466102600097656, "global_step": 296717, "epoch": 2452} {"train_loss": -42.41193771362305, "global_step": 296718, "epoch": 2452} {"train_loss": -42.81631088256836, "global_step": 296719, "epoch": 2452} {"train_loss": -42.259769439697266, "global_step": 296720, "epoch": 2452} {"train_loss": -40.086605072021484, "global_step": 296721, "epoch": 2452} {"train_loss": -40.73175048828125, "global_step": 296722, "epoch": 2452} {"train_loss": -42.71187210083008, "global_step": 296723, "epoch": 2452} {"train_loss": -40.7763557434082, "global_step": 296724, "epoch": 2452} {"train_loss": -40.21580123901367, "global_step": 296725, "epoch": 2452} {"train_loss": -40.93601989746094, "global_step": 296726, "epoch": 2452} {"train_loss": -42.71993637084961, "global_step": 296727, "epoch": 2452} {"train_loss": -42.0269660949707, "global_step": 296728, "epoch": 2452} {"train_loss": -41.600215911865234, "global_step": 296729, "epoch": 2452} {"train_loss": -43.36991500854492, "global_step": 296730, "epoch": 2452} {"train_loss": -43.20796203613281, "global_step": 296731, "epoch": 2452} {"train_loss": -42.79841232299805, "global_step": 296732, "epoch": 2452} {"train_loss": -42.47955322265625, "global_step": 296733, "epoch": 2452} {"train_loss": -43.27299880981445, "global_step": 296734, "epoch": 2452} {"train_loss": -41.71610641479492, "global_step": 296735, "epoch": 2452} {"train_loss": -39.95997619628906, "global_step": 296736, "epoch": 2452} {"train_loss": -42.91080856323242, "global_step": 296737, "epoch": 2452} {"train_loss": -40.13724899291992, "global_step": 296738, "epoch": 2452} {"train_loss": -42.2376823425293, "global_step": 296739, "epoch": 2452} {"train_loss": -42.268245697021484, "global_step": 296740, "epoch": 2452} {"train_loss": -41.74125289916992, "global_step": 296741, "epoch": 2452} {"train_loss": -42.654266357421875, "global_step": 296742, "epoch": 2452} {"train_loss": -42.96029281616211, "global_step": 296743, "epoch": 2452} {"train_loss": -42.4368782043457, "global_step": 296744, "epoch": 2452} {"train_loss": -42.655189514160156, "global_step": 296745, "epoch": 2452} {"train_loss": -43.76263427734375, "global_step": 296746, "epoch": 2452} {"train_loss": -41.56779098510742, "global_step": 296747, "epoch": 2452} {"train_loss": -42.5888557434082, "global_step": 296748, "epoch": 2452} {"train_loss": -43.23369216918945, "global_step": 296749, "epoch": 2452} {"train_loss": -41.32859420776367, "global_step": 296750, "epoch": 2452} {"train_loss": -43.168914794921875, "global_step": 296751, "epoch": 2452} {"train_loss": -43.34450912475586, "global_step": 296752, "epoch": 2452} {"train_loss": -42.39860916137695, "global_step": 296753, "epoch": 2452} {"train_loss": -41.30803298950195, "global_step": 296754, "epoch": 2452} {"train_loss": -43.26081466674805, "global_step": 296755, "epoch": 2452} {"train_loss": -41.39436721801758, "global_step": 296756, "epoch": 2452} {"train_loss": -43.01789474487305, "global_step": 296757, "epoch": 2452} {"train_loss": -42.9066047668457, "global_step": 296758, "epoch": 2452} {"train_loss": -41.83388137817383, "global_step": 296759, "epoch": 2452} {"train_loss": -42.50193405151367, "global_step": 296760, "epoch": 2452} {"train_loss": -42.33274459838867, "global_step": 296761, "epoch": 2452} {"train_loss": -41.17909240722656, "global_step": 296762, "epoch": 2452} {"train_loss": -42.621742248535156, "global_step": 296763, "epoch": 2452} {"train_loss": -42.103759765625, "global_step": 296764, "epoch": 2452} {"train_loss": -42.57611846923828, "global_step": 296765, "epoch": 2452} {"train_loss": -42.87111282348633, "global_step": 296766, "epoch": 2452} {"train_loss": -42.52157974243164, "global_step": 296767, "epoch": 2452} {"train_loss": -42.89173126220703, "global_step": 296768, "epoch": 2452} {"train_loss": -43.79213333129883, "global_step": 296769, "epoch": 2452} {"train_loss": -42.302223205566406, "global_step": 296770, "epoch": 2452} {"train_loss": -42.167999267578125, "global_step": 296771, "epoch": 2452} {"train_loss": -42.298866271972656, "global_step": 296772, "epoch": 2452} {"train_loss": -42.32778549194336, "global_step": 296773, "epoch": 2452} {"train_loss": -41.93424606323242, "global_step": 296774, "epoch": 2452} {"train_loss": -42.10595703125, "global_step": 296775, "epoch": 2452} {"train_loss": -42.630340576171875, "global_step": 296776, "epoch": 2452} {"train_loss": -41.96754837036133, "global_step": 296777, "epoch": 2452} {"train_loss": -42.57328414916992, "global_step": 296778, "epoch": 2452} {"train_loss": -42.28406524658203, "global_step": 296779, "epoch": 2452} {"train_loss": -42.130855560302734, "global_step": 296780, "epoch": 2452} {"train_loss": -42.26229476928711, "global_step": 296781, "epoch": 2452} {"train_loss": -43.3660774230957, "global_step": 296782, "epoch": 2452} {"train_loss": -42.54032516479492, "global_step": 296783, "epoch": 2452} {"train_loss": -42.49801254272461, "global_step": 296784, "epoch": 2452} {"train_loss": -42.79374313354492, "global_step": 296785, "epoch": 2452} {"train_loss": -42.95787811279297, "global_step": 296786, "epoch": 2452} {"train_loss": -43.08940505981445, "global_step": 296787, "epoch": 2452} {"train_loss": -43.4318733215332, "global_step": 296788, "epoch": 2452} {"train_loss": -43.27164840698242, "global_step": 296789, "epoch": 2452} {"train_loss": -43.356380462646484, "global_step": 296790, "epoch": 2452} {"train_loss": -43.50632858276367, "global_step": 296791, "epoch": 2452} {"train_loss": -43.33694076538086, "global_step": 296792, "epoch": 2452} {"train_loss": -43.11313247680664, "global_step": 296793, "epoch": 2452} {"train_loss": -43.5869140625, "global_step": 296794, "epoch": 2452} {"train_loss": -43.72101974487305, "global_step": 296795, "epoch": 2452} {"train_loss": -43.20016860961914, "global_step": 296796, "epoch": 2452} {"train_loss": -43.12818145751953, "global_step": 296797, "epoch": 2452} {"train_loss": -43.231563568115234, "global_step": 296798, "epoch": 2452} {"train_loss": -43.76597213745117, "global_step": 296799, "epoch": 2452} {"train_loss": -43.337677001953125, "global_step": 296800, "epoch": 2452} {"train_loss": -42.98007583618164, "global_step": 296801, "epoch": 2452} {"train_loss": -43.597991943359375, "global_step": 296802, "epoch": 2452} {"train_loss": -43.580440521240234, "global_step": 296803, "epoch": 2452} {"train_loss": -43.88296890258789, "global_step": 296804, "epoch": 2452} {"train_loss": -43.44059371948242, "global_step": 296805, "epoch": 2452} {"train_loss": -43.55292892456055, "global_step": 296806, "epoch": 2452} {"train_loss": -43.90349197387695, "global_step": 296807, "epoch": 2452} {"train_loss": -44.018798828125, "global_step": 296808, "epoch": 2452} {"train_loss": -43.46723556518555, "global_step": 296809, "epoch": 2452} {"train_loss": -43.453697204589844, "global_step": 296810, "epoch": 2452} {"train_loss": -43.891910552978516, "global_step": 296811, "epoch": 2452} {"train_loss": -42.652682627528165, "global_step": 296812, "epoch": 2452, "val_loss": 2559527.25} {"train_loss": -43.47683334350586, "global_step": 296813, "epoch": 2453} {"train_loss": -44.094451904296875, "global_step": 296814, "epoch": 2453} {"train_loss": -44.036251068115234, "global_step": 296815, "epoch": 2453} {"train_loss": -44.28234100341797, "global_step": 296816, "epoch": 2453} {"train_loss": -44.003875732421875, "global_step": 296817, "epoch": 2453} {"train_loss": -43.6016845703125, "global_step": 296818, "epoch": 2453} {"train_loss": -43.797576904296875, "global_step": 296819, "epoch": 2453} {"train_loss": -44.31691360473633, "global_step": 296820, "epoch": 2453} {"train_loss": -44.11520004272461, "global_step": 296821, "epoch": 2453} {"train_loss": -43.7427978515625, "global_step": 296822, "epoch": 2453} {"train_loss": -44.105194091796875, "global_step": 296823, "epoch": 2453} {"train_loss": -44.10698318481445, "global_step": 296824, "epoch": 2453} {"train_loss": -43.609920501708984, "global_step": 296825, "epoch": 2453} {"train_loss": -43.323631286621094, "global_step": 296826, "epoch": 2453} {"train_loss": -43.39052963256836, "global_step": 296827, "epoch": 2453} {"train_loss": -43.3341064453125, "global_step": 296828, "epoch": 2453} {"train_loss": -44.24993133544922, "global_step": 296829, "epoch": 2453} {"train_loss": -43.58292770385742, "global_step": 296830, "epoch": 2453} {"train_loss": -43.7100944519043, "global_step": 296831, "epoch": 2453} {"train_loss": -43.55224609375, "global_step": 296832, "epoch": 2453} {"train_loss": -40.750213623046875, "global_step": 296833, "epoch": 2453} {"train_loss": -35.8962287902832, "global_step": 296834, "epoch": 2453} {"train_loss": -38.45929718017578, "global_step": 296835, "epoch": 2453} {"train_loss": -42.940895080566406, "global_step": 296836, "epoch": 2453} {"train_loss": -40.128421783447266, "global_step": 296837, "epoch": 2453} {"train_loss": -37.5113639831543, "global_step": 296838, "epoch": 2453} {"train_loss": -34.75086975097656, "global_step": 296839, "epoch": 2453} {"train_loss": -39.490413665771484, "global_step": 296840, "epoch": 2453} {"train_loss": -41.75542068481445, "global_step": 296841, "epoch": 2453} {"train_loss": -38.17600631713867, "global_step": 296842, "epoch": 2453} {"train_loss": -41.53584671020508, "global_step": 296843, "epoch": 2453} {"train_loss": -42.23027038574219, "global_step": 296844, "epoch": 2453} {"train_loss": -41.7053337097168, "global_step": 296845, "epoch": 2453} {"train_loss": -41.539974212646484, "global_step": 296846, "epoch": 2453} {"train_loss": -43.69259262084961, "global_step": 296847, "epoch": 2453} {"train_loss": -42.528385162353516, "global_step": 296848, "epoch": 2453} {"train_loss": -43.26831817626953, "global_step": 296849, "epoch": 2453} {"train_loss": -42.178890228271484, "global_step": 296850, "epoch": 2453} {"train_loss": -42.53499984741211, "global_step": 296851, "epoch": 2453} {"train_loss": -43.595130920410156, "global_step": 296852, "epoch": 2453} {"train_loss": -42.878841400146484, "global_step": 296853, "epoch": 2453} {"train_loss": -43.326236724853516, "global_step": 296854, "epoch": 2453} {"train_loss": -43.62794494628906, "global_step": 296855, "epoch": 2453} {"train_loss": -43.53457260131836, "global_step": 296856, "epoch": 2453} {"train_loss": -43.33349609375, "global_step": 296857, "epoch": 2453} {"train_loss": -43.46855163574219, "global_step": 296858, "epoch": 2453} {"train_loss": -42.99233627319336, "global_step": 296859, "epoch": 2453} {"train_loss": -43.80056381225586, "global_step": 296860, "epoch": 2453} {"train_loss": -43.30900573730469, "global_step": 296861, "epoch": 2453} {"train_loss": -43.334712982177734, "global_step": 296862, "epoch": 2453} {"train_loss": -43.100215911865234, "global_step": 296863, "epoch": 2453} {"train_loss": -43.33845901489258, "global_step": 296864, "epoch": 2453} {"train_loss": -43.95730209350586, "global_step": 296865, "epoch": 2453} {"train_loss": -43.51701736450195, "global_step": 296866, "epoch": 2453} {"train_loss": -43.85555648803711, "global_step": 296867, "epoch": 2453} {"train_loss": -43.36711883544922, "global_step": 296868, "epoch": 2453} {"train_loss": -43.55051040649414, "global_step": 296869, "epoch": 2453} {"train_loss": -43.9227294921875, "global_step": 296870, "epoch": 2453} {"train_loss": -43.00739288330078, "global_step": 296871, "epoch": 2453} {"train_loss": -42.66073989868164, "global_step": 296872, "epoch": 2453} {"train_loss": -44.066890716552734, "global_step": 296873, "epoch": 2453} {"train_loss": -43.31254577636719, "global_step": 296874, "epoch": 2453} {"train_loss": -43.83457565307617, "global_step": 296875, "epoch": 2453} {"train_loss": -43.788551330566406, "global_step": 296876, "epoch": 2453} {"train_loss": -43.39681625366211, "global_step": 296877, "epoch": 2453} {"train_loss": -43.67524337768555, "global_step": 296878, "epoch": 2453} {"train_loss": -43.84121322631836, "global_step": 296879, "epoch": 2453} {"train_loss": -44.02328872680664, "global_step": 296880, "epoch": 2453} {"train_loss": -43.3465690612793, "global_step": 296881, "epoch": 2453} {"train_loss": -44.03564453125, "global_step": 296882, "epoch": 2453} {"train_loss": -43.890357971191406, "global_step": 296883, "epoch": 2453} {"train_loss": -44.097312927246094, "global_step": 296884, "epoch": 2453} {"train_loss": -44.03921127319336, "global_step": 296885, "epoch": 2453} {"train_loss": -44.48735427856445, "global_step": 296886, "epoch": 2453} {"train_loss": -44.1817512512207, "global_step": 296887, "epoch": 2453} {"train_loss": -43.980560302734375, "global_step": 296888, "epoch": 2453} {"train_loss": -43.855560302734375, "global_step": 296889, "epoch": 2453} {"train_loss": -44.33543395996094, "global_step": 296890, "epoch": 2453} {"train_loss": -44.164485931396484, "global_step": 296891, "epoch": 2453} {"train_loss": -43.74666976928711, "global_step": 296892, "epoch": 2453} {"train_loss": -44.00445556640625, "global_step": 296893, "epoch": 2453} {"train_loss": -44.35987091064453, "global_step": 296894, "epoch": 2453} {"train_loss": -44.29019546508789, "global_step": 296895, "epoch": 2453} {"train_loss": -43.76539993286133, "global_step": 296896, "epoch": 2453} {"train_loss": -44.17664337158203, "global_step": 296897, "epoch": 2453} {"train_loss": -44.183406829833984, "global_step": 296898, "epoch": 2453} {"train_loss": -44.475730895996094, "global_step": 296899, "epoch": 2453} {"train_loss": -44.468563079833984, "global_step": 296900, "epoch": 2453} {"train_loss": -43.96136474609375, "global_step": 296901, "epoch": 2453} {"train_loss": -44.5808219909668, "global_step": 296902, "epoch": 2453} {"train_loss": -44.41822052001953, "global_step": 296903, "epoch": 2453} {"train_loss": -45.010467529296875, "global_step": 296904, "epoch": 2453} {"train_loss": -44.1324462890625, "global_step": 296905, "epoch": 2453} {"train_loss": -44.663482666015625, "global_step": 296906, "epoch": 2453} {"train_loss": -44.670310974121094, "global_step": 296907, "epoch": 2453} {"train_loss": -44.52274703979492, "global_step": 296908, "epoch": 2453} {"train_loss": -44.27900314331055, "global_step": 296909, "epoch": 2453} {"train_loss": -43.84231185913086, "global_step": 296910, "epoch": 2453} {"train_loss": -44.40243148803711, "global_step": 296911, "epoch": 2453} {"train_loss": -43.94147872924805, "global_step": 296912, "epoch": 2453} {"train_loss": -44.00653076171875, "global_step": 296913, "epoch": 2453} {"train_loss": -44.14059066772461, "global_step": 296914, "epoch": 2453} {"train_loss": -44.684478759765625, "global_step": 296915, "epoch": 2453} {"train_loss": -44.304569244384766, "global_step": 296916, "epoch": 2453} {"train_loss": -44.2247314453125, "global_step": 296917, "epoch": 2453} {"train_loss": -43.70760726928711, "global_step": 296918, "epoch": 2453} {"train_loss": -44.07804489135742, "global_step": 296919, "epoch": 2453} {"train_loss": -44.2314567565918, "global_step": 296920, "epoch": 2453} {"train_loss": -43.39350891113281, "global_step": 296921, "epoch": 2453} {"train_loss": -41.77770233154297, "global_step": 296922, "epoch": 2453} {"train_loss": -43.937767028808594, "global_step": 296923, "epoch": 2453} {"train_loss": -42.090423583984375, "global_step": 296924, "epoch": 2453} {"train_loss": -34.78725814819336, "global_step": 296925, "epoch": 2453} {"train_loss": -20.514408111572266, "global_step": 296926, "epoch": 2453} {"train_loss": -22.40506362915039, "global_step": 296927, "epoch": 2453} {"train_loss": -33.39435958862305, "global_step": 296928, "epoch": 2453} {"train_loss": -28.255956649780273, "global_step": 296929, "epoch": 2453} {"train_loss": -39.697349548339844, "global_step": 296930, "epoch": 2453} {"train_loss": -34.74325180053711, "global_step": 296931, "epoch": 2453} {"train_loss": -39.94424819946289, "global_step": 296932, "epoch": 2453} {"train_loss": -42.47215840048041, "global_step": 296933, "epoch": 2453, "val_loss": 2559696.75} {"train_loss": -39.77757263183594, "global_step": 296934, "epoch": 2454} {"train_loss": -39.100162506103516, "global_step": 296935, "epoch": 2454} {"train_loss": -40.84407424926758, "global_step": 296936, "epoch": 2454} {"train_loss": -39.49947738647461, "global_step": 296937, "epoch": 2454} {"train_loss": -40.70762252807617, "global_step": 296938, "epoch": 2454} {"train_loss": -40.248291015625, "global_step": 296939, "epoch": 2454} {"train_loss": -39.90863037109375, "global_step": 296940, "epoch": 2454} {"train_loss": -40.4920539855957, "global_step": 296941, "epoch": 2454} {"train_loss": -40.8075065612793, "global_step": 296942, "epoch": 2454} {"train_loss": -41.49232864379883, "global_step": 296943, "epoch": 2454} {"train_loss": -40.96905517578125, "global_step": 296944, "epoch": 2454} {"train_loss": -41.92988967895508, "global_step": 296945, "epoch": 2454} {"train_loss": -41.39411163330078, "global_step": 296946, "epoch": 2454} {"train_loss": -40.68788528442383, "global_step": 296947, "epoch": 2454} {"train_loss": -42.32877731323242, "global_step": 296948, "epoch": 2454} {"train_loss": -41.97153091430664, "global_step": 296949, "epoch": 2454} {"train_loss": -42.208595275878906, "global_step": 296950, "epoch": 2454} {"train_loss": -42.703670501708984, "global_step": 296951, "epoch": 2454} {"train_loss": -42.10746765136719, "global_step": 296952, "epoch": 2454} {"train_loss": -42.242431640625, "global_step": 296953, "epoch": 2454} {"train_loss": -42.659114837646484, "global_step": 296954, "epoch": 2454} {"train_loss": -42.77388000488281, "global_step": 296955, "epoch": 2454} {"train_loss": -42.07578659057617, "global_step": 296956, "epoch": 2454} {"train_loss": -42.345149993896484, "global_step": 296957, "epoch": 2454} {"train_loss": -42.16557693481445, "global_step": 296958, "epoch": 2454} {"train_loss": -42.61375045776367, "global_step": 296959, "epoch": 2454} {"train_loss": -42.229488372802734, "global_step": 296960, "epoch": 2454} {"train_loss": -42.49913787841797, "global_step": 296961, "epoch": 2454} {"train_loss": -42.56026840209961, "global_step": 296962, "epoch": 2454} {"train_loss": -42.90230941772461, "global_step": 296963, "epoch": 2454} {"train_loss": -42.44773864746094, "global_step": 296964, "epoch": 2454} {"train_loss": -42.65434646606445, "global_step": 296965, "epoch": 2454} {"train_loss": -42.55125427246094, "global_step": 296966, "epoch": 2454} {"train_loss": -43.25368118286133, "global_step": 296967, "epoch": 2454} {"train_loss": -42.9649543762207, "global_step": 296968, "epoch": 2454} {"train_loss": -43.480682373046875, "global_step": 296969, "epoch": 2454} {"train_loss": -42.99589538574219, "global_step": 296970, "epoch": 2454} {"train_loss": -43.3721923828125, "global_step": 296971, "epoch": 2454} {"train_loss": -43.44603729248047, "global_step": 296972, "epoch": 2454} {"train_loss": -43.2801628112793, "global_step": 296973, "epoch": 2454} {"train_loss": -43.395469665527344, "global_step": 296974, "epoch": 2454} {"train_loss": -43.79924774169922, "global_step": 296975, "epoch": 2454} {"train_loss": -43.1921501159668, "global_step": 296976, "epoch": 2454} {"train_loss": -43.97468948364258, "global_step": 296977, "epoch": 2454} {"train_loss": -43.73626708984375, "global_step": 296978, "epoch": 2454} {"train_loss": -43.746124267578125, "global_step": 296979, "epoch": 2454} {"train_loss": -44.146034240722656, "global_step": 296980, "epoch": 2454} {"train_loss": -44.10748291015625, "global_step": 296981, "epoch": 2454} {"train_loss": -44.21748733520508, "global_step": 296982, "epoch": 2454} {"train_loss": -43.82722473144531, "global_step": 296983, "epoch": 2454} {"train_loss": -43.84123992919922, "global_step": 296984, "epoch": 2454} {"train_loss": -44.196624755859375, "global_step": 296985, "epoch": 2454} {"train_loss": -43.55247116088867, "global_step": 296986, "epoch": 2454} {"train_loss": -44.11198043823242, "global_step": 296987, "epoch": 2454} {"train_loss": -44.02425765991211, "global_step": 296988, "epoch": 2454} {"train_loss": -44.489925384521484, "global_step": 296989, "epoch": 2454} {"train_loss": -44.011573791503906, "global_step": 296990, "epoch": 2454} {"train_loss": -43.99870681762695, "global_step": 296991, "epoch": 2454} {"train_loss": -44.38404083251953, "global_step": 296992, "epoch": 2454} {"train_loss": -43.83829879760742, "global_step": 296993, "epoch": 2454} {"train_loss": -44.35260772705078, "global_step": 296994, "epoch": 2454} {"train_loss": -43.800819396972656, "global_step": 296995, "epoch": 2454} {"train_loss": -44.27683639526367, "global_step": 296996, "epoch": 2454} {"train_loss": -43.723236083984375, "global_step": 296997, "epoch": 2454} {"train_loss": -43.75328063964844, "global_step": 296998, "epoch": 2454} {"train_loss": -44.45184326171875, "global_step": 296999, "epoch": 2454} {"train_loss": -44.6356086730957, "global_step": 297000, "epoch": 2454} {"train_loss": -44.260921478271484, "global_step": 297001, "epoch": 2454} {"train_loss": -44.29365158081055, "global_step": 297002, "epoch": 2454} {"train_loss": -44.205562591552734, "global_step": 297003, "epoch": 2454} {"train_loss": -44.40788269042969, "global_step": 297004, "epoch": 2454} {"train_loss": -44.22744369506836, "global_step": 297005, "epoch": 2454} {"train_loss": -44.41998291015625, "global_step": 297006, "epoch": 2454} {"train_loss": -44.83163070678711, "global_step": 297007, "epoch": 2454} {"train_loss": -44.151824951171875, "global_step": 297008, "epoch": 2454} {"train_loss": -44.125728607177734, "global_step": 297009, "epoch": 2454} {"train_loss": -44.674903869628906, "global_step": 297010, "epoch": 2454} {"train_loss": -44.26687240600586, "global_step": 297011, "epoch": 2454} {"train_loss": -44.31257247924805, "global_step": 297012, "epoch": 2454} {"train_loss": -44.287513732910156, "global_step": 297013, "epoch": 2454} {"train_loss": -44.85710525512695, "global_step": 297014, "epoch": 2454} {"train_loss": -44.52131652832031, "global_step": 297015, "epoch": 2454} {"train_loss": -44.29997634887695, "global_step": 297016, "epoch": 2454} {"train_loss": -44.20306396484375, "global_step": 297017, "epoch": 2454} {"train_loss": -44.4893798828125, "global_step": 297018, "epoch": 2454} {"train_loss": -43.42439651489258, "global_step": 297019, "epoch": 2454} {"train_loss": -44.52373504638672, "global_step": 297020, "epoch": 2454} {"train_loss": -44.62050247192383, "global_step": 297021, "epoch": 2454} {"train_loss": -44.46146774291992, "global_step": 297022, "epoch": 2454} {"train_loss": -44.450374603271484, "global_step": 297023, "epoch": 2454} {"train_loss": -43.58185958862305, "global_step": 297024, "epoch": 2454} {"train_loss": -43.314117431640625, "global_step": 297025, "epoch": 2454} {"train_loss": -42.243377685546875, "global_step": 297026, "epoch": 2454} {"train_loss": -43.648746490478516, "global_step": 297027, "epoch": 2454} {"train_loss": -43.139739990234375, "global_step": 297028, "epoch": 2454} {"train_loss": -42.49152755737305, "global_step": 297029, "epoch": 2454} {"train_loss": -43.3001708984375, "global_step": 297030, "epoch": 2454} {"train_loss": -44.118839263916016, "global_step": 297031, "epoch": 2454} {"train_loss": -43.024261474609375, "global_step": 297032, "epoch": 2454} {"train_loss": -42.1807861328125, "global_step": 297033, "epoch": 2454} {"train_loss": -40.90883255004883, "global_step": 297034, "epoch": 2454} {"train_loss": -39.42824935913086, "global_step": 297035, "epoch": 2454} {"train_loss": -42.257625579833984, "global_step": 297036, "epoch": 2454} {"train_loss": -43.434051513671875, "global_step": 297037, "epoch": 2454} {"train_loss": -40.126800537109375, "global_step": 297038, "epoch": 2454} {"train_loss": -39.53876495361328, "global_step": 297039, "epoch": 2454} {"train_loss": -43.773040771484375, "global_step": 297040, "epoch": 2454} {"train_loss": -42.54622268676758, "global_step": 297041, "epoch": 2454} {"train_loss": -39.80989456176758, "global_step": 297042, "epoch": 2454} {"train_loss": -42.35477828979492, "global_step": 297043, "epoch": 2454} {"train_loss": -43.11631393432617, "global_step": 297044, "epoch": 2454} {"train_loss": -41.97239303588867, "global_step": 297045, "epoch": 2454} {"train_loss": -43.05625534057617, "global_step": 297046, "epoch": 2454} {"train_loss": -43.47755432128906, "global_step": 297047, "epoch": 2454} {"train_loss": -43.323036193847656, "global_step": 297048, "epoch": 2454} {"train_loss": -42.93829345703125, "global_step": 297049, "epoch": 2454} {"train_loss": -43.620601654052734, "global_step": 297050, "epoch": 2454} {"train_loss": -40.87018585205078, "global_step": 297051, "epoch": 2454} {"train_loss": -42.842037200927734, "global_step": 297052, "epoch": 2454} {"train_loss": -43.15699005126953, "global_step": 297053, "epoch": 2454} {"train_loss": -42.99092849227023, "global_step": 297054, "epoch": 2454, "val_loss": 2797380.0} {"train_loss": -42.73164749145508, "global_step": 297055, "epoch": 2455} {"train_loss": -43.29752731323242, "global_step": 297056, "epoch": 2455} {"train_loss": -42.80392074584961, "global_step": 297057, "epoch": 2455} {"train_loss": -42.225433349609375, "global_step": 297058, "epoch": 2455} {"train_loss": -42.28595733642578, "global_step": 297059, "epoch": 2455} {"train_loss": -42.61189270019531, "global_step": 297060, "epoch": 2455} {"train_loss": -40.6588134765625, "global_step": 297061, "epoch": 2455} {"train_loss": -39.51245880126953, "global_step": 297062, "epoch": 2455} {"train_loss": -38.65795135498047, "global_step": 297063, "epoch": 2455} {"train_loss": -41.771728515625, "global_step": 297064, "epoch": 2455} {"train_loss": -40.76263427734375, "global_step": 297065, "epoch": 2455} {"train_loss": -33.426856994628906, "global_step": 297066, "epoch": 2455} {"train_loss": -37.493080139160156, "global_step": 297067, "epoch": 2455} {"train_loss": -40.114131927490234, "global_step": 297068, "epoch": 2455} {"train_loss": -33.47803497314453, "global_step": 297069, "epoch": 2455} {"train_loss": -40.2651481628418, "global_step": 297070, "epoch": 2455} {"train_loss": -40.248775482177734, "global_step": 297071, "epoch": 2455} {"train_loss": -36.54551315307617, "global_step": 297072, "epoch": 2455} {"train_loss": -37.05241012573242, "global_step": 297073, "epoch": 2455} {"train_loss": -36.16791915893555, "global_step": 297074, "epoch": 2455} {"train_loss": -36.606903076171875, "global_step": 297075, "epoch": 2455} {"train_loss": -40.40089797973633, "global_step": 297076, "epoch": 2455} {"train_loss": -36.91970443725586, "global_step": 297077, "epoch": 2455} {"train_loss": -26.883581161499023, "global_step": 297078, "epoch": 2455} {"train_loss": -29.202869415283203, "global_step": 297079, "epoch": 2455} {"train_loss": -37.59855651855469, "global_step": 297080, "epoch": 2455} {"train_loss": -35.27381134033203, "global_step": 297081, "epoch": 2455} {"train_loss": -33.05843734741211, "global_step": 297082, "epoch": 2455} {"train_loss": -35.85616683959961, "global_step": 297083, "epoch": 2455} {"train_loss": -34.91385269165039, "global_step": 297084, "epoch": 2455} {"train_loss": -24.888639450073242, "global_step": 297085, "epoch": 2455} {"train_loss": -31.203649520874023, "global_step": 297086, "epoch": 2455} {"train_loss": -38.50603103637695, "global_step": 297087, "epoch": 2455} {"train_loss": -35.550697326660156, "global_step": 297088, "epoch": 2455} {"train_loss": -30.9219970703125, "global_step": 297089, "epoch": 2455} {"train_loss": -38.81287384033203, "global_step": 297090, "epoch": 2455} {"train_loss": -36.31641387939453, "global_step": 297091, "epoch": 2455} {"train_loss": -40.31072998046875, "global_step": 297092, "epoch": 2455} {"train_loss": -37.87457275390625, "global_step": 297093, "epoch": 2455} {"train_loss": -38.042236328125, "global_step": 297094, "epoch": 2455} {"train_loss": -29.800846099853516, "global_step": 297095, "epoch": 2455} {"train_loss": -37.624244689941406, "global_step": 297096, "epoch": 2455} {"train_loss": -35.20473098754883, "global_step": 297097, "epoch": 2455} {"train_loss": -38.961814880371094, "global_step": 297098, "epoch": 2455} {"train_loss": -39.86096954345703, "global_step": 297099, "epoch": 2455} {"train_loss": -39.058387756347656, "global_step": 297100, "epoch": 2455} {"train_loss": -39.064491271972656, "global_step": 297101, "epoch": 2455} {"train_loss": -37.37434768676758, "global_step": 297102, "epoch": 2455} {"train_loss": -38.77230453491211, "global_step": 297103, "epoch": 2455} {"train_loss": -38.755855560302734, "global_step": 297104, "epoch": 2455} {"train_loss": -40.1792106628418, "global_step": 297105, "epoch": 2455} {"train_loss": -36.997764587402344, "global_step": 297106, "epoch": 2455} {"train_loss": -38.34946823120117, "global_step": 297107, "epoch": 2455} {"train_loss": -39.57730484008789, "global_step": 297108, "epoch": 2455} {"train_loss": -39.469783782958984, "global_step": 297109, "epoch": 2455} {"train_loss": -39.310401916503906, "global_step": 297110, "epoch": 2455} {"train_loss": -40.575767517089844, "global_step": 297111, "epoch": 2455} {"train_loss": -38.843963623046875, "global_step": 297112, "epoch": 2455} {"train_loss": -38.026763916015625, "global_step": 297113, "epoch": 2455} {"train_loss": -40.315399169921875, "global_step": 297114, "epoch": 2455} {"train_loss": -39.430599212646484, "global_step": 297115, "epoch": 2455} {"train_loss": -39.15959167480469, "global_step": 297116, "epoch": 2455} {"train_loss": -41.210697174072266, "global_step": 297117, "epoch": 2455} {"train_loss": -40.209716796875, "global_step": 297118, "epoch": 2455} {"train_loss": -40.2674560546875, "global_step": 297119, "epoch": 2455} {"train_loss": -39.801788330078125, "global_step": 297120, "epoch": 2455} {"train_loss": -39.68403244018555, "global_step": 297121, "epoch": 2455} {"train_loss": -40.505367279052734, "global_step": 297122, "epoch": 2455} {"train_loss": -40.89022445678711, "global_step": 297123, "epoch": 2455} {"train_loss": -39.88686752319336, "global_step": 297124, "epoch": 2455} {"train_loss": -41.58320999145508, "global_step": 297125, "epoch": 2455} {"train_loss": -41.6873664855957, "global_step": 297126, "epoch": 2455} {"train_loss": -40.8995361328125, "global_step": 297127, "epoch": 2455} {"train_loss": -41.11703872680664, "global_step": 297128, "epoch": 2455} {"train_loss": -41.39644241333008, "global_step": 297129, "epoch": 2455} {"train_loss": -40.4442253112793, "global_step": 297130, "epoch": 2455} {"train_loss": -41.19775390625, "global_step": 297131, "epoch": 2455} {"train_loss": -40.132625579833984, "global_step": 297132, "epoch": 2455} {"train_loss": -41.551124572753906, "global_step": 297133, "epoch": 2455} {"train_loss": -41.82802963256836, "global_step": 297134, "epoch": 2455} {"train_loss": -41.85197067260742, "global_step": 297135, "epoch": 2455} {"train_loss": -41.37303161621094, "global_step": 297136, "epoch": 2455} {"train_loss": -40.443023681640625, "global_step": 297137, "epoch": 2455} {"train_loss": -40.19535446166992, "global_step": 297138, "epoch": 2455} {"train_loss": -41.77799606323242, "global_step": 297139, "epoch": 2455} {"train_loss": -40.96221923828125, "global_step": 297140, "epoch": 2455} {"train_loss": -41.2765007019043, "global_step": 297141, "epoch": 2455} {"train_loss": -41.91624069213867, "global_step": 297142, "epoch": 2455} {"train_loss": -41.940494537353516, "global_step": 297143, "epoch": 2455} {"train_loss": -41.954219818115234, "global_step": 297144, "epoch": 2455} {"train_loss": -41.53017807006836, "global_step": 297145, "epoch": 2455} {"train_loss": -42.059993743896484, "global_step": 297146, "epoch": 2455} {"train_loss": -41.72492599487305, "global_step": 297147, "epoch": 2455} {"train_loss": -41.5888671875, "global_step": 297148, "epoch": 2455} {"train_loss": -41.8248176574707, "global_step": 297149, "epoch": 2455} {"train_loss": -41.916255950927734, "global_step": 297150, "epoch": 2455} {"train_loss": -41.53037643432617, "global_step": 297151, "epoch": 2455} {"train_loss": -42.110321044921875, "global_step": 297152, "epoch": 2455} {"train_loss": -41.90663146972656, "global_step": 297153, "epoch": 2455} {"train_loss": -42.272247314453125, "global_step": 297154, "epoch": 2455} {"train_loss": -42.47421646118164, "global_step": 297155, "epoch": 2455} {"train_loss": -41.65589141845703, "global_step": 297156, "epoch": 2455} {"train_loss": -41.95624923706055, "global_step": 297157, "epoch": 2455} {"train_loss": -42.389610290527344, "global_step": 297158, "epoch": 2455} {"train_loss": -42.401920318603516, "global_step": 297159, "epoch": 2455} {"train_loss": -42.1761474609375, "global_step": 297160, "epoch": 2455} {"train_loss": -41.90278244018555, "global_step": 297161, "epoch": 2455} {"train_loss": -42.30434799194336, "global_step": 297162, "epoch": 2455} {"train_loss": -42.59328079223633, "global_step": 297163, "epoch": 2455} {"train_loss": -43.092952728271484, "global_step": 297164, "epoch": 2455} {"train_loss": -42.098609924316406, "global_step": 297165, "epoch": 2455} {"train_loss": -42.644439697265625, "global_step": 297166, "epoch": 2455} {"train_loss": -42.32624053955078, "global_step": 297167, "epoch": 2455} {"train_loss": -42.723388671875, "global_step": 297168, "epoch": 2455} {"train_loss": -43.252723693847656, "global_step": 297169, "epoch": 2455} {"train_loss": -42.89516830444336, "global_step": 297170, "epoch": 2455} {"train_loss": -42.01027297973633, "global_step": 297171, "epoch": 2455} {"train_loss": -43.0517692565918, "global_step": 297172, "epoch": 2455} {"train_loss": -41.95618438720703, "global_step": 297173, "epoch": 2455} {"train_loss": -43.173011779785156, "global_step": 297174, "epoch": 2455} {"train_loss": -39.612064503441175, "global_step": 297175, "epoch": 2455, "val_loss": 2543028.0} {"train_loss": -42.562103271484375, "global_step": 297176, "epoch": 2456} {"train_loss": -42.81591796875, "global_step": 297177, "epoch": 2456} {"train_loss": -42.775447845458984, "global_step": 297178, "epoch": 2456} {"train_loss": -43.19236755371094, "global_step": 297179, "epoch": 2456} {"train_loss": -42.794227600097656, "global_step": 297180, "epoch": 2456} {"train_loss": -42.981266021728516, "global_step": 297181, "epoch": 2456} {"train_loss": -42.54594039916992, "global_step": 297182, "epoch": 2456} {"train_loss": -43.50380325317383, "global_step": 297183, "epoch": 2456} {"train_loss": -43.17295455932617, "global_step": 297184, "epoch": 2456} {"train_loss": -43.17825698852539, "global_step": 297185, "epoch": 2456} {"train_loss": -43.364253997802734, "global_step": 297186, "epoch": 2456} {"train_loss": -43.533729553222656, "global_step": 297187, "epoch": 2456} {"train_loss": -43.05170440673828, "global_step": 297188, "epoch": 2456} {"train_loss": -42.88501739501953, "global_step": 297189, "epoch": 2456} {"train_loss": -42.99820327758789, "global_step": 297190, "epoch": 2456} {"train_loss": -43.41508102416992, "global_step": 297191, "epoch": 2456} {"train_loss": -43.46029281616211, "global_step": 297192, "epoch": 2456} {"train_loss": -43.511009216308594, "global_step": 297193, "epoch": 2456} {"train_loss": -43.327816009521484, "global_step": 297194, "epoch": 2456} {"train_loss": -42.93362045288086, "global_step": 297195, "epoch": 2456} {"train_loss": -43.71171951293945, "global_step": 297196, "epoch": 2456} {"train_loss": -42.310970306396484, "global_step": 297197, "epoch": 2456} {"train_loss": -43.123897552490234, "global_step": 297198, "epoch": 2456} {"train_loss": -42.73151779174805, "global_step": 297199, "epoch": 2456} {"train_loss": -43.36198043823242, "global_step": 297200, "epoch": 2456} {"train_loss": -43.027034759521484, "global_step": 297201, "epoch": 2456} {"train_loss": -43.599853515625, "global_step": 297202, "epoch": 2456} {"train_loss": -43.38534164428711, "global_step": 297203, "epoch": 2456} {"train_loss": -43.45115280151367, "global_step": 297204, "epoch": 2456} {"train_loss": -43.11528778076172, "global_step": 297205, "epoch": 2456} {"train_loss": -43.178646087646484, "global_step": 297206, "epoch": 2456} {"train_loss": -43.3979606628418, "global_step": 297207, "epoch": 2456} {"train_loss": -43.95292282104492, "global_step": 297208, "epoch": 2456} {"train_loss": -43.831703186035156, "global_step": 297209, "epoch": 2456} {"train_loss": -43.43148422241211, "global_step": 297210, "epoch": 2456} {"train_loss": -43.70783233642578, "global_step": 297211, "epoch": 2456} {"train_loss": -43.2520637512207, "global_step": 297212, "epoch": 2456} {"train_loss": -43.369171142578125, "global_step": 297213, "epoch": 2456} {"train_loss": -43.31025695800781, "global_step": 297214, "epoch": 2456} {"train_loss": -42.65454864501953, "global_step": 297215, "epoch": 2456} {"train_loss": -43.39406204223633, "global_step": 297216, "epoch": 2456} {"train_loss": -43.12290573120117, "global_step": 297217, "epoch": 2456} {"train_loss": -42.899227142333984, "global_step": 297218, "epoch": 2456} {"train_loss": -43.04084014892578, "global_step": 297219, "epoch": 2456} {"train_loss": -43.990604400634766, "global_step": 297220, "epoch": 2456} {"train_loss": -42.80835723876953, "global_step": 297221, "epoch": 2456} {"train_loss": -43.080623626708984, "global_step": 297222, "epoch": 2456} {"train_loss": -43.4128532409668, "global_step": 297223, "epoch": 2456} {"train_loss": -42.713722229003906, "global_step": 297224, "epoch": 2456} {"train_loss": -43.320796966552734, "global_step": 297225, "epoch": 2456} {"train_loss": -43.70800018310547, "global_step": 297226, "epoch": 2456} {"train_loss": -42.57757568359375, "global_step": 297227, "epoch": 2456} {"train_loss": -43.2902946472168, "global_step": 297228, "epoch": 2456} {"train_loss": -43.103031158447266, "global_step": 297229, "epoch": 2456} {"train_loss": -42.53973388671875, "global_step": 297230, "epoch": 2456} {"train_loss": -43.859039306640625, "global_step": 297231, "epoch": 2456} {"train_loss": -42.57633590698242, "global_step": 297232, "epoch": 2456} {"train_loss": -43.71298599243164, "global_step": 297233, "epoch": 2456} {"train_loss": -42.09821701049805, "global_step": 297234, "epoch": 2456} {"train_loss": -43.5755500793457, "global_step": 297235, "epoch": 2456} {"train_loss": -42.524200439453125, "global_step": 297236, "epoch": 2456} {"train_loss": -43.59650802612305, "global_step": 297237, "epoch": 2456} {"train_loss": -41.758544921875, "global_step": 297238, "epoch": 2456} {"train_loss": -43.60310745239258, "global_step": 297239, "epoch": 2456} {"train_loss": -42.38508605957031, "global_step": 297240, "epoch": 2456} {"train_loss": -43.95621871948242, "global_step": 297241, "epoch": 2456} {"train_loss": -43.67348098754883, "global_step": 297242, "epoch": 2456} {"train_loss": -43.9438362121582, "global_step": 297243, "epoch": 2456} {"train_loss": -42.72956466674805, "global_step": 297244, "epoch": 2456} {"train_loss": -43.46588897705078, "global_step": 297245, "epoch": 2456} {"train_loss": -42.678218841552734, "global_step": 297246, "epoch": 2456} {"train_loss": -42.97880935668945, "global_step": 297247, "epoch": 2456} {"train_loss": -43.9439582824707, "global_step": 297248, "epoch": 2456} {"train_loss": -43.7050895690918, "global_step": 297249, "epoch": 2456} {"train_loss": -43.32192611694336, "global_step": 297250, "epoch": 2456} {"train_loss": -43.41963577270508, "global_step": 297251, "epoch": 2456} {"train_loss": -43.92240524291992, "global_step": 297252, "epoch": 2456} {"train_loss": -44.236328125, "global_step": 297253, "epoch": 2456} {"train_loss": -44.04789352416992, "global_step": 297254, "epoch": 2456} {"train_loss": -44.441925048828125, "global_step": 297255, "epoch": 2456} {"train_loss": -42.99837875366211, "global_step": 297256, "epoch": 2456} {"train_loss": -43.926143646240234, "global_step": 297257, "epoch": 2456} {"train_loss": -43.44590377807617, "global_step": 297258, "epoch": 2456} {"train_loss": -43.4415397644043, "global_step": 297259, "epoch": 2456} {"train_loss": -43.905941009521484, "global_step": 297260, "epoch": 2456} {"train_loss": -43.35418701171875, "global_step": 297261, "epoch": 2456} {"train_loss": -43.167694091796875, "global_step": 297262, "epoch": 2456} {"train_loss": -43.44161605834961, "global_step": 297263, "epoch": 2456} {"train_loss": -43.26838302612305, "global_step": 297264, "epoch": 2456} {"train_loss": -44.37723159790039, "global_step": 297265, "epoch": 2456} {"train_loss": -43.19308853149414, "global_step": 297266, "epoch": 2456} {"train_loss": -41.54005432128906, "global_step": 297267, "epoch": 2456} {"train_loss": -40.25083541870117, "global_step": 297268, "epoch": 2456} {"train_loss": -36.31695556640625, "global_step": 297269, "epoch": 2456} {"train_loss": -32.617855072021484, "global_step": 297270, "epoch": 2456} {"train_loss": -30.235305786132812, "global_step": 297271, "epoch": 2456} {"train_loss": -42.37656784057617, "global_step": 297272, "epoch": 2456} {"train_loss": -39.964351654052734, "global_step": 297273, "epoch": 2456} {"train_loss": -34.852394104003906, "global_step": 297274, "epoch": 2456} {"train_loss": -41.13844299316406, "global_step": 297275, "epoch": 2456} {"train_loss": -40.566070556640625, "global_step": 297276, "epoch": 2456} {"train_loss": -38.004085540771484, "global_step": 297277, "epoch": 2456} {"train_loss": -42.1993408203125, "global_step": 297278, "epoch": 2456} {"train_loss": -40.82223129272461, "global_step": 297279, "epoch": 2456} {"train_loss": -40.831687927246094, "global_step": 297280, "epoch": 2456} {"train_loss": -42.613624572753906, "global_step": 297281, "epoch": 2456} {"train_loss": -42.179508209228516, "global_step": 297282, "epoch": 2456} {"train_loss": -42.76805114746094, "global_step": 297283, "epoch": 2456} {"train_loss": -42.2885856628418, "global_step": 297284, "epoch": 2456} {"train_loss": -42.506221771240234, "global_step": 297285, "epoch": 2456} {"train_loss": -41.700439453125, "global_step": 297286, "epoch": 2456} {"train_loss": -43.17908477783203, "global_step": 297287, "epoch": 2456} {"train_loss": -42.50535202026367, "global_step": 297288, "epoch": 2456} {"train_loss": -43.43208694458008, "global_step": 297289, "epoch": 2456} {"train_loss": -43.29151153564453, "global_step": 297290, "epoch": 2456} {"train_loss": -42.74549102783203, "global_step": 297291, "epoch": 2456} {"train_loss": -43.66091537475586, "global_step": 297292, "epoch": 2456} {"train_loss": -41.3648567199707, "global_step": 297293, "epoch": 2456} {"train_loss": -43.28229904174805, "global_step": 297294, "epoch": 2456} {"train_loss": -42.775238037109375, "global_step": 297295, "epoch": 2456} {"train_loss": -42.66366451042743, "global_step": 297296, "epoch": 2456, "val_loss": 2466760.25} {"train_loss": -43.68446731567383, "global_step": 297297, "epoch": 2457} {"train_loss": -42.84035110473633, "global_step": 297298, "epoch": 2457} {"train_loss": -43.54255294799805, "global_step": 297299, "epoch": 2457} {"train_loss": -43.128936767578125, "global_step": 297300, "epoch": 2457} {"train_loss": -43.493404388427734, "global_step": 297301, "epoch": 2457} {"train_loss": -43.55780029296875, "global_step": 297302, "epoch": 2457} {"train_loss": -43.659828186035156, "global_step": 297303, "epoch": 2457} {"train_loss": -43.43709945678711, "global_step": 297304, "epoch": 2457} {"train_loss": -43.31416702270508, "global_step": 297305, "epoch": 2457} {"train_loss": -43.50189208984375, "global_step": 297306, "epoch": 2457} {"train_loss": -43.659629821777344, "global_step": 297307, "epoch": 2457} {"train_loss": -43.48554229736328, "global_step": 297308, "epoch": 2457} {"train_loss": -43.3499870300293, "global_step": 297309, "epoch": 2457} {"train_loss": -43.787410736083984, "global_step": 297310, "epoch": 2457} {"train_loss": -43.224308013916016, "global_step": 297311, "epoch": 2457} {"train_loss": -43.64469528198242, "global_step": 297312, "epoch": 2457} {"train_loss": -43.561767578125, "global_step": 297313, "epoch": 2457} {"train_loss": -42.91089630126953, "global_step": 297314, "epoch": 2457} {"train_loss": -43.43449783325195, "global_step": 297315, "epoch": 2457} {"train_loss": -44.011165618896484, "global_step": 297316, "epoch": 2457} {"train_loss": -43.284034729003906, "global_step": 297317, "epoch": 2457} {"train_loss": -43.6423454284668, "global_step": 297318, "epoch": 2457} {"train_loss": -43.84627914428711, "global_step": 297319, "epoch": 2457} {"train_loss": -42.99013900756836, "global_step": 297320, "epoch": 2457} {"train_loss": -43.48905944824219, "global_step": 297321, "epoch": 2457} {"train_loss": -43.94208908081055, "global_step": 297322, "epoch": 2457} {"train_loss": -43.501407623291016, "global_step": 297323, "epoch": 2457} {"train_loss": -43.77208709716797, "global_step": 297324, "epoch": 2457} {"train_loss": -43.88016891479492, "global_step": 297325, "epoch": 2457} {"train_loss": -43.467628479003906, "global_step": 297326, "epoch": 2457} {"train_loss": -43.80995559692383, "global_step": 297327, "epoch": 2457} {"train_loss": -43.70771408081055, "global_step": 297328, "epoch": 2457} {"train_loss": -43.5887451171875, "global_step": 297329, "epoch": 2457} {"train_loss": -44.21428680419922, "global_step": 297330, "epoch": 2457} {"train_loss": -43.720672607421875, "global_step": 297331, "epoch": 2457} {"train_loss": -43.45746994018555, "global_step": 297332, "epoch": 2457} {"train_loss": -43.8975944519043, "global_step": 297333, "epoch": 2457} {"train_loss": -43.06559371948242, "global_step": 297334, "epoch": 2457} {"train_loss": -43.30955505371094, "global_step": 297335, "epoch": 2457} {"train_loss": -43.8065299987793, "global_step": 297336, "epoch": 2457} {"train_loss": -43.00380325317383, "global_step": 297337, "epoch": 2457} {"train_loss": -41.527889251708984, "global_step": 297338, "epoch": 2457} {"train_loss": -41.98476791381836, "global_step": 297339, "epoch": 2457} {"train_loss": -42.0852165222168, "global_step": 297340, "epoch": 2457} {"train_loss": -42.62470245361328, "global_step": 297341, "epoch": 2457} {"train_loss": -43.4027099609375, "global_step": 297342, "epoch": 2457} {"train_loss": -43.03961944580078, "global_step": 297343, "epoch": 2457} {"train_loss": -41.330474853515625, "global_step": 297344, "epoch": 2457} {"train_loss": -39.71964645385742, "global_step": 297345, "epoch": 2457} {"train_loss": -41.9354362487793, "global_step": 297346, "epoch": 2457} {"train_loss": -43.139034271240234, "global_step": 297347, "epoch": 2457} {"train_loss": -42.95256042480469, "global_step": 297348, "epoch": 2457} {"train_loss": -41.13241958618164, "global_step": 297349, "epoch": 2457} {"train_loss": -42.158203125, "global_step": 297350, "epoch": 2457} {"train_loss": -40.542198181152344, "global_step": 297351, "epoch": 2457} {"train_loss": -41.47747039794922, "global_step": 297352, "epoch": 2457} {"train_loss": -41.226593017578125, "global_step": 297353, "epoch": 2457} {"train_loss": -41.62085723876953, "global_step": 297354, "epoch": 2457} {"train_loss": -42.09043502807617, "global_step": 297355, "epoch": 2457} {"train_loss": -41.89127731323242, "global_step": 297356, "epoch": 2457} {"train_loss": -43.138938903808594, "global_step": 297357, "epoch": 2457} {"train_loss": -41.754329681396484, "global_step": 297358, "epoch": 2457} {"train_loss": -42.28357696533203, "global_step": 297359, "epoch": 2457} {"train_loss": -42.396907806396484, "global_step": 297360, "epoch": 2457} {"train_loss": -41.88079833984375, "global_step": 297361, "epoch": 2457} {"train_loss": -43.158653259277344, "global_step": 297362, "epoch": 2457} {"train_loss": -41.7762451171875, "global_step": 297363, "epoch": 2457} {"train_loss": -43.24374008178711, "global_step": 297364, "epoch": 2457} {"train_loss": -43.00873947143555, "global_step": 297365, "epoch": 2457} {"train_loss": -43.25922775268555, "global_step": 297366, "epoch": 2457} {"train_loss": -42.825927734375, "global_step": 297367, "epoch": 2457} {"train_loss": -42.8925666809082, "global_step": 297368, "epoch": 2457} {"train_loss": -42.3607292175293, "global_step": 297369, "epoch": 2457} {"train_loss": -42.8057975769043, "global_step": 297370, "epoch": 2457} {"train_loss": -42.46804428100586, "global_step": 297371, "epoch": 2457} {"train_loss": -42.98823165893555, "global_step": 297372, "epoch": 2457} {"train_loss": -41.635005950927734, "global_step": 297373, "epoch": 2457} {"train_loss": -41.39789962768555, "global_step": 297374, "epoch": 2457} {"train_loss": -42.983089447021484, "global_step": 297375, "epoch": 2457} {"train_loss": -40.538753509521484, "global_step": 297376, "epoch": 2457} {"train_loss": -41.4769401550293, "global_step": 297377, "epoch": 2457} {"train_loss": -42.56708908081055, "global_step": 297378, "epoch": 2457} {"train_loss": -41.86859893798828, "global_step": 297379, "epoch": 2457} {"train_loss": -41.45457077026367, "global_step": 297380, "epoch": 2457} {"train_loss": -43.232276916503906, "global_step": 297381, "epoch": 2457} {"train_loss": -42.086402893066406, "global_step": 297382, "epoch": 2457} {"train_loss": -42.1047248840332, "global_step": 297383, "epoch": 2457} {"train_loss": -43.28469467163086, "global_step": 297384, "epoch": 2457} {"train_loss": -42.06449508666992, "global_step": 297385, "epoch": 2457} {"train_loss": -42.99903106689453, "global_step": 297386, "epoch": 2457} {"train_loss": -41.3536376953125, "global_step": 297387, "epoch": 2457} {"train_loss": -42.82819747924805, "global_step": 297388, "epoch": 2457} {"train_loss": -41.92197799682617, "global_step": 297389, "epoch": 2457} {"train_loss": -42.201385498046875, "global_step": 297390, "epoch": 2457} {"train_loss": -42.55244064331055, "global_step": 297391, "epoch": 2457} {"train_loss": -41.66341781616211, "global_step": 297392, "epoch": 2457} {"train_loss": -42.72065734863281, "global_step": 297393, "epoch": 2457} {"train_loss": -41.59470748901367, "global_step": 297394, "epoch": 2457} {"train_loss": -42.99972152709961, "global_step": 297395, "epoch": 2457} {"train_loss": -42.52138900756836, "global_step": 297396, "epoch": 2457} {"train_loss": -42.951690673828125, "global_step": 297397, "epoch": 2457} {"train_loss": -42.12553787231445, "global_step": 297398, "epoch": 2457} {"train_loss": -43.30451202392578, "global_step": 297399, "epoch": 2457} {"train_loss": -43.12820053100586, "global_step": 297400, "epoch": 2457} {"train_loss": -42.74592590332031, "global_step": 297401, "epoch": 2457} {"train_loss": -43.49763107299805, "global_step": 297402, "epoch": 2457} {"train_loss": -42.79926681518555, "global_step": 297403, "epoch": 2457} {"train_loss": -42.89674758911133, "global_step": 297404, "epoch": 2457} {"train_loss": -43.43674850463867, "global_step": 297405, "epoch": 2457} {"train_loss": -42.907100677490234, "global_step": 297406, "epoch": 2457} {"train_loss": -43.4451904296875, "global_step": 297407, "epoch": 2457} {"train_loss": -43.36836242675781, "global_step": 297408, "epoch": 2457} {"train_loss": -43.2604866027832, "global_step": 297409, "epoch": 2457} {"train_loss": -43.658504486083984, "global_step": 297410, "epoch": 2457} {"train_loss": -43.6107177734375, "global_step": 297411, "epoch": 2457} {"train_loss": -42.663368225097656, "global_step": 297412, "epoch": 2457} {"train_loss": -43.27585983276367, "global_step": 297413, "epoch": 2457} {"train_loss": -43.74935531616211, "global_step": 297414, "epoch": 2457} {"train_loss": -42.87541961669922, "global_step": 297415, "epoch": 2457} {"train_loss": -43.35624313354492, "global_step": 297416, "epoch": 2457} {"train_loss": -42.82165896202907, "global_step": 297417, "epoch": 2457, "val_loss": 2618033.0} {"train_loss": -43.16268539428711, "global_step": 297418, "epoch": 2458} {"train_loss": -44.0406379699707, "global_step": 297419, "epoch": 2458} {"train_loss": -43.028656005859375, "global_step": 297420, "epoch": 2458} {"train_loss": -43.84588623046875, "global_step": 297421, "epoch": 2458} {"train_loss": -43.820220947265625, "global_step": 297422, "epoch": 2458} {"train_loss": -43.80018615722656, "global_step": 297423, "epoch": 2458} {"train_loss": -44.22093963623047, "global_step": 297424, "epoch": 2458} {"train_loss": -43.87530517578125, "global_step": 297425, "epoch": 2458} {"train_loss": -43.553646087646484, "global_step": 297426, "epoch": 2458} {"train_loss": -44.08644104003906, "global_step": 297427, "epoch": 2458} {"train_loss": -43.804290771484375, "global_step": 297428, "epoch": 2458} {"train_loss": -44.247833251953125, "global_step": 297429, "epoch": 2458} {"train_loss": -44.092132568359375, "global_step": 297430, "epoch": 2458} {"train_loss": -44.485782623291016, "global_step": 297431, "epoch": 2458} {"train_loss": -43.49074172973633, "global_step": 297432, "epoch": 2458} {"train_loss": -42.7269401550293, "global_step": 297433, "epoch": 2458} {"train_loss": -41.146175384521484, "global_step": 297434, "epoch": 2458} {"train_loss": -40.54134750366211, "global_step": 297435, "epoch": 2458} {"train_loss": -43.12044143676758, "global_step": 297436, "epoch": 2458} {"train_loss": -43.90314865112305, "global_step": 297437, "epoch": 2458} {"train_loss": -43.66302490234375, "global_step": 297438, "epoch": 2458} {"train_loss": -43.68013000488281, "global_step": 297439, "epoch": 2458} {"train_loss": -43.992435455322266, "global_step": 297440, "epoch": 2458} {"train_loss": -44.25044250488281, "global_step": 297441, "epoch": 2458} {"train_loss": -43.9873161315918, "global_step": 297442, "epoch": 2458} {"train_loss": -43.706058502197266, "global_step": 297443, "epoch": 2458} {"train_loss": -44.04958724975586, "global_step": 297444, "epoch": 2458} {"train_loss": -43.88051986694336, "global_step": 297445, "epoch": 2458} {"train_loss": -44.48153305053711, "global_step": 297446, "epoch": 2458} {"train_loss": -43.96572494506836, "global_step": 297447, "epoch": 2458} {"train_loss": -44.204078674316406, "global_step": 297448, "epoch": 2458} {"train_loss": -44.50738525390625, "global_step": 297449, "epoch": 2458} {"train_loss": -43.60780334472656, "global_step": 297450, "epoch": 2458} {"train_loss": -43.17182922363281, "global_step": 297451, "epoch": 2458} {"train_loss": -43.56388473510742, "global_step": 297452, "epoch": 2458} {"train_loss": -44.02183151245117, "global_step": 297453, "epoch": 2458} {"train_loss": -43.7552375793457, "global_step": 297454, "epoch": 2458} {"train_loss": -44.12171936035156, "global_step": 297455, "epoch": 2458} {"train_loss": -44.166194915771484, "global_step": 297456, "epoch": 2458} {"train_loss": -43.3863525390625, "global_step": 297457, "epoch": 2458} {"train_loss": -42.19328689575195, "global_step": 297458, "epoch": 2458} {"train_loss": -42.13620376586914, "global_step": 297459, "epoch": 2458} {"train_loss": -43.62800216674805, "global_step": 297460, "epoch": 2458} {"train_loss": -40.77987289428711, "global_step": 297461, "epoch": 2458} {"train_loss": -36.95548629760742, "global_step": 297462, "epoch": 2458} {"train_loss": -40.623680114746094, "global_step": 297463, "epoch": 2458} {"train_loss": -43.14094543457031, "global_step": 297464, "epoch": 2458} {"train_loss": -39.85171127319336, "global_step": 297465, "epoch": 2458} {"train_loss": -40.28373336791992, "global_step": 297466, "epoch": 2458} {"train_loss": -42.391265869140625, "global_step": 297467, "epoch": 2458} {"train_loss": -41.4791259765625, "global_step": 297468, "epoch": 2458} {"train_loss": -40.5919075012207, "global_step": 297469, "epoch": 2458} {"train_loss": -42.24129104614258, "global_step": 297470, "epoch": 2458} {"train_loss": -43.28703689575195, "global_step": 297471, "epoch": 2458} {"train_loss": -42.22300338745117, "global_step": 297472, "epoch": 2458} {"train_loss": -43.54024887084961, "global_step": 297473, "epoch": 2458} {"train_loss": -43.348812103271484, "global_step": 297474, "epoch": 2458} {"train_loss": -43.52426528930664, "global_step": 297475, "epoch": 2458} {"train_loss": -43.39105224609375, "global_step": 297476, "epoch": 2458} {"train_loss": -43.44939422607422, "global_step": 297477, "epoch": 2458} {"train_loss": -43.538883209228516, "global_step": 297478, "epoch": 2458} {"train_loss": -43.794471740722656, "global_step": 297479, "epoch": 2458} {"train_loss": -43.7420539855957, "global_step": 297480, "epoch": 2458} {"train_loss": -43.06827926635742, "global_step": 297481, "epoch": 2458} {"train_loss": -43.352455139160156, "global_step": 297482, "epoch": 2458} {"train_loss": -42.78697967529297, "global_step": 297483, "epoch": 2458} {"train_loss": -42.70529556274414, "global_step": 297484, "epoch": 2458} {"train_loss": -43.30160140991211, "global_step": 297485, "epoch": 2458} {"train_loss": -43.2005615234375, "global_step": 297486, "epoch": 2458} {"train_loss": -43.31216049194336, "global_step": 297487, "epoch": 2458} {"train_loss": -43.26906967163086, "global_step": 297488, "epoch": 2458} {"train_loss": -43.56068420410156, "global_step": 297489, "epoch": 2458} {"train_loss": -43.71089553833008, "global_step": 297490, "epoch": 2458} {"train_loss": -43.636714935302734, "global_step": 297491, "epoch": 2458} {"train_loss": -43.850433349609375, "global_step": 297492, "epoch": 2458} {"train_loss": -43.65395736694336, "global_step": 297493, "epoch": 2458} {"train_loss": -43.41488265991211, "global_step": 297494, "epoch": 2458} {"train_loss": -43.67244338989258, "global_step": 297495, "epoch": 2458} {"train_loss": -43.96871566772461, "global_step": 297496, "epoch": 2458} {"train_loss": -44.00126647949219, "global_step": 297497, "epoch": 2458} {"train_loss": -44.09550094604492, "global_step": 297498, "epoch": 2458} {"train_loss": -44.14573287963867, "global_step": 297499, "epoch": 2458} {"train_loss": -43.880897521972656, "global_step": 297500, "epoch": 2458} {"train_loss": -43.99558639526367, "global_step": 297501, "epoch": 2458} {"train_loss": -44.40623092651367, "global_step": 297502, "epoch": 2458} {"train_loss": -44.403785705566406, "global_step": 297503, "epoch": 2458} {"train_loss": -44.30344772338867, "global_step": 297504, "epoch": 2458} {"train_loss": -44.45972442626953, "global_step": 297505, "epoch": 2458} {"train_loss": -44.159908294677734, "global_step": 297506, "epoch": 2458} {"train_loss": -44.224361419677734, "global_step": 297507, "epoch": 2458} {"train_loss": -44.536354064941406, "global_step": 297508, "epoch": 2458} {"train_loss": -44.2750244140625, "global_step": 297509, "epoch": 2458} {"train_loss": -44.03142166137695, "global_step": 297510, "epoch": 2458} {"train_loss": -44.25996780395508, "global_step": 297511, "epoch": 2458} {"train_loss": -44.05747985839844, "global_step": 297512, "epoch": 2458} {"train_loss": -44.0715217590332, "global_step": 297513, "epoch": 2458} {"train_loss": -44.00582504272461, "global_step": 297514, "epoch": 2458} {"train_loss": -44.49721908569336, "global_step": 297515, "epoch": 2458} {"train_loss": -43.51652908325195, "global_step": 297516, "epoch": 2458} {"train_loss": -43.71876907348633, "global_step": 297517, "epoch": 2458} {"train_loss": -43.827022552490234, "global_step": 297518, "epoch": 2458} {"train_loss": -44.03750991821289, "global_step": 297519, "epoch": 2458} {"train_loss": -42.99420166015625, "global_step": 297520, "epoch": 2458} {"train_loss": -44.10500717163086, "global_step": 297521, "epoch": 2458} {"train_loss": -44.0195426940918, "global_step": 297522, "epoch": 2458} {"train_loss": -42.36572265625, "global_step": 297523, "epoch": 2458} {"train_loss": -41.02459716796875, "global_step": 297524, "epoch": 2458} {"train_loss": -42.21689224243164, "global_step": 297525, "epoch": 2458} {"train_loss": -43.28280258178711, "global_step": 297526, "epoch": 2458} {"train_loss": -43.8857536315918, "global_step": 297527, "epoch": 2458} {"train_loss": -40.92267608642578, "global_step": 297528, "epoch": 2458} {"train_loss": -41.624507904052734, "global_step": 297529, "epoch": 2458} {"train_loss": -43.03838348388672, "global_step": 297530, "epoch": 2458} {"train_loss": -44.31438064575195, "global_step": 297531, "epoch": 2458} {"train_loss": -43.23568344116211, "global_step": 297532, "epoch": 2458} {"train_loss": -43.7071418762207, "global_step": 297533, "epoch": 2458} {"train_loss": -42.9725341796875, "global_step": 297534, "epoch": 2458} {"train_loss": -43.74373245239258, "global_step": 297535, "epoch": 2458} {"train_loss": -43.029640197753906, "global_step": 297536, "epoch": 2458} {"train_loss": -43.40450668334961, "global_step": 297537, "epoch": 2458} {"train_loss": -43.33812912239516, "global_step": 297538, "epoch": 2458, "val_loss": 2579263.25} {"train_loss": -42.965126037597656, "global_step": 297539, "epoch": 2459} {"train_loss": -44.287391662597656, "global_step": 297540, "epoch": 2459} {"train_loss": -43.403568267822266, "global_step": 297541, "epoch": 2459} {"train_loss": -44.05089569091797, "global_step": 297542, "epoch": 2459} {"train_loss": -43.06330108642578, "global_step": 297543, "epoch": 2459} {"train_loss": -42.562744140625, "global_step": 297544, "epoch": 2459} {"train_loss": -43.774505615234375, "global_step": 297545, "epoch": 2459} {"train_loss": -43.8866081237793, "global_step": 297546, "epoch": 2459} {"train_loss": -43.7124137878418, "global_step": 297547, "epoch": 2459} {"train_loss": -44.291297912597656, "global_step": 297548, "epoch": 2459} {"train_loss": -43.8555908203125, "global_step": 297549, "epoch": 2459} {"train_loss": -43.89324951171875, "global_step": 297550, "epoch": 2459} {"train_loss": -44.203285217285156, "global_step": 297551, "epoch": 2459} {"train_loss": -43.59477615356445, "global_step": 297552, "epoch": 2459} {"train_loss": -42.91139221191406, "global_step": 297553, "epoch": 2459} {"train_loss": -43.84572219848633, "global_step": 297554, "epoch": 2459} {"train_loss": -43.6103515625, "global_step": 297555, "epoch": 2459} {"train_loss": -43.53510665893555, "global_step": 297556, "epoch": 2459} {"train_loss": -44.0440559387207, "global_step": 297557, "epoch": 2459} {"train_loss": -43.941402435302734, "global_step": 297558, "epoch": 2459} {"train_loss": -43.26405715942383, "global_step": 297559, "epoch": 2459} {"train_loss": -43.74195098876953, "global_step": 297560, "epoch": 2459} {"train_loss": -44.54965591430664, "global_step": 297561, "epoch": 2459} {"train_loss": -43.50819396972656, "global_step": 297562, "epoch": 2459} {"train_loss": -44.137271881103516, "global_step": 297563, "epoch": 2459} {"train_loss": -43.90135192871094, "global_step": 297564, "epoch": 2459} {"train_loss": -43.91460037231445, "global_step": 297565, "epoch": 2459} {"train_loss": -44.21573257446289, "global_step": 297566, "epoch": 2459} {"train_loss": -43.714080810546875, "global_step": 297567, "epoch": 2459} {"train_loss": -44.20186233520508, "global_step": 297568, "epoch": 2459} {"train_loss": -43.38761520385742, "global_step": 297569, "epoch": 2459} {"train_loss": -44.016963958740234, "global_step": 297570, "epoch": 2459} {"train_loss": -44.260005950927734, "global_step": 297571, "epoch": 2459} {"train_loss": -43.956119537353516, "global_step": 297572, "epoch": 2459} {"train_loss": -44.3946647644043, "global_step": 297573, "epoch": 2459} {"train_loss": -43.9466667175293, "global_step": 297574, "epoch": 2459} {"train_loss": -44.3931999206543, "global_step": 297575, "epoch": 2459} {"train_loss": -43.82855987548828, "global_step": 297576, "epoch": 2459} {"train_loss": -44.333980560302734, "global_step": 297577, "epoch": 2459} {"train_loss": -44.36603927612305, "global_step": 297578, "epoch": 2459} {"train_loss": -43.778709411621094, "global_step": 297579, "epoch": 2459} {"train_loss": -43.687679290771484, "global_step": 297580, "epoch": 2459} {"train_loss": -43.787193298339844, "global_step": 297581, "epoch": 2459} {"train_loss": -44.241329193115234, "global_step": 297582, "epoch": 2459} {"train_loss": -42.78169631958008, "global_step": 297583, "epoch": 2459} {"train_loss": -42.40996551513672, "global_step": 297584, "epoch": 2459} {"train_loss": -43.54263687133789, "global_step": 297585, "epoch": 2459} {"train_loss": -44.25335693359375, "global_step": 297586, "epoch": 2459} {"train_loss": -43.7866096496582, "global_step": 297587, "epoch": 2459} {"train_loss": -43.5130729675293, "global_step": 297588, "epoch": 2459} {"train_loss": -44.6577262878418, "global_step": 297589, "epoch": 2459} {"train_loss": -44.44013595581055, "global_step": 297590, "epoch": 2459} {"train_loss": -43.814720153808594, "global_step": 297591, "epoch": 2459} {"train_loss": -44.108028411865234, "global_step": 297592, "epoch": 2459} {"train_loss": -44.212989807128906, "global_step": 297593, "epoch": 2459} {"train_loss": -43.914886474609375, "global_step": 297594, "epoch": 2459} {"train_loss": -43.26761245727539, "global_step": 297595, "epoch": 2459} {"train_loss": -43.49824142456055, "global_step": 297596, "epoch": 2459} {"train_loss": -44.53853988647461, "global_step": 297597, "epoch": 2459} {"train_loss": -43.95441436767578, "global_step": 297598, "epoch": 2459} {"train_loss": -43.578250885009766, "global_step": 297599, "epoch": 2459} {"train_loss": -43.3951530456543, "global_step": 297600, "epoch": 2459} {"train_loss": -43.29316711425781, "global_step": 297601, "epoch": 2459} {"train_loss": -44.33740997314453, "global_step": 297602, "epoch": 2459} {"train_loss": -44.391456604003906, "global_step": 297603, "epoch": 2459} {"train_loss": -44.12897491455078, "global_step": 297604, "epoch": 2459} {"train_loss": -44.74888229370117, "global_step": 297605, "epoch": 2459} {"train_loss": -43.9240608215332, "global_step": 297606, "epoch": 2459} {"train_loss": -43.80402374267578, "global_step": 297607, "epoch": 2459} {"train_loss": -44.22906494140625, "global_step": 297608, "epoch": 2459} {"train_loss": -43.971378326416016, "global_step": 297609, "epoch": 2459} {"train_loss": -43.677852630615234, "global_step": 297610, "epoch": 2459} {"train_loss": -43.85749053955078, "global_step": 297611, "epoch": 2459} {"train_loss": -43.87456130981445, "global_step": 297612, "epoch": 2459} {"train_loss": -44.0407829284668, "global_step": 297613, "epoch": 2459} {"train_loss": -44.479671478271484, "global_step": 297614, "epoch": 2459} {"train_loss": -44.08017349243164, "global_step": 297615, "epoch": 2459} {"train_loss": -44.252132415771484, "global_step": 297616, "epoch": 2459} {"train_loss": -43.5050048828125, "global_step": 297617, "epoch": 2459} {"train_loss": -44.24400329589844, "global_step": 297618, "epoch": 2459} {"train_loss": -44.68717956542969, "global_step": 297619, "epoch": 2459} {"train_loss": -43.54985809326172, "global_step": 297620, "epoch": 2459} {"train_loss": -42.4984016418457, "global_step": 297621, "epoch": 2459} {"train_loss": -43.8501091003418, "global_step": 297622, "epoch": 2459} {"train_loss": -44.22842025756836, "global_step": 297623, "epoch": 2459} {"train_loss": -43.088348388671875, "global_step": 297624, "epoch": 2459} {"train_loss": -42.3470573425293, "global_step": 297625, "epoch": 2459} {"train_loss": -42.844520568847656, "global_step": 297626, "epoch": 2459} {"train_loss": -43.10329055786133, "global_step": 297627, "epoch": 2459} {"train_loss": -43.436763763427734, "global_step": 297628, "epoch": 2459} {"train_loss": -42.50742721557617, "global_step": 297629, "epoch": 2459} {"train_loss": -40.82735824584961, "global_step": 297630, "epoch": 2459} {"train_loss": -42.7088737487793, "global_step": 297631, "epoch": 2459} {"train_loss": -43.696815490722656, "global_step": 297632, "epoch": 2459} {"train_loss": -42.94782257080078, "global_step": 297633, "epoch": 2459} {"train_loss": -41.93404769897461, "global_step": 297634, "epoch": 2459} {"train_loss": -42.49897766113281, "global_step": 297635, "epoch": 2459} {"train_loss": -43.15406036376953, "global_step": 297636, "epoch": 2459} {"train_loss": -43.4897346496582, "global_step": 297637, "epoch": 2459} {"train_loss": -42.588531494140625, "global_step": 297638, "epoch": 2459} {"train_loss": -43.23981475830078, "global_step": 297639, "epoch": 2459} {"train_loss": -43.58083724975586, "global_step": 297640, "epoch": 2459} {"train_loss": -42.674339294433594, "global_step": 297641, "epoch": 2459} {"train_loss": -42.66773223876953, "global_step": 297642, "epoch": 2459} {"train_loss": -43.17031478881836, "global_step": 297643, "epoch": 2459} {"train_loss": -41.09529495239258, "global_step": 297644, "epoch": 2459} {"train_loss": -43.79580307006836, "global_step": 297645, "epoch": 2459} {"train_loss": -42.26357650756836, "global_step": 297646, "epoch": 2459} {"train_loss": -42.831642150878906, "global_step": 297647, "epoch": 2459} {"train_loss": -42.77650451660156, "global_step": 297648, "epoch": 2459} {"train_loss": -42.70152282714844, "global_step": 297649, "epoch": 2459} {"train_loss": -43.495635986328125, "global_step": 297650, "epoch": 2459} {"train_loss": -42.3599739074707, "global_step": 297651, "epoch": 2459} {"train_loss": -43.66057205200195, "global_step": 297652, "epoch": 2459} {"train_loss": -43.30703353881836, "global_step": 297653, "epoch": 2459} {"train_loss": -43.057308197021484, "global_step": 297654, "epoch": 2459} {"train_loss": -43.208492279052734, "global_step": 297655, "epoch": 2459} {"train_loss": -43.12369918823242, "global_step": 297656, "epoch": 2459} {"train_loss": -42.47743606567383, "global_step": 297657, "epoch": 2459} {"train_loss": -43.40210723876953, "global_step": 297658, "epoch": 2459} {"train_loss": -43.56546487098883, "global_step": 297659, "epoch": 2459, "val_loss": 2572831.75} {"train_loss": -43.05907440185547, "global_step": 297660, "epoch": 2460} {"train_loss": -43.32672882080078, "global_step": 297661, "epoch": 2460} {"train_loss": -43.66123580932617, "global_step": 297662, "epoch": 2460} {"train_loss": -43.56400680541992, "global_step": 297663, "epoch": 2460} {"train_loss": -44.19769287109375, "global_step": 297664, "epoch": 2460} {"train_loss": -44.138038635253906, "global_step": 297665, "epoch": 2460} {"train_loss": -43.71546173095703, "global_step": 297666, "epoch": 2460} {"train_loss": -43.623783111572266, "global_step": 297667, "epoch": 2460} {"train_loss": -43.68508529663086, "global_step": 297668, "epoch": 2460} {"train_loss": -44.24017333984375, "global_step": 297669, "epoch": 2460} {"train_loss": -43.52766036987305, "global_step": 297670, "epoch": 2460} {"train_loss": -43.989986419677734, "global_step": 297671, "epoch": 2460} {"train_loss": -44.596412658691406, "global_step": 297672, "epoch": 2460} {"train_loss": -43.57401657104492, "global_step": 297673, "epoch": 2460} {"train_loss": -42.68085479736328, "global_step": 297674, "epoch": 2460} {"train_loss": -43.97999572753906, "global_step": 297675, "epoch": 2460} {"train_loss": -44.22333908081055, "global_step": 297676, "epoch": 2460} {"train_loss": -43.46751403808594, "global_step": 297677, "epoch": 2460} {"train_loss": -43.92022705078125, "global_step": 297678, "epoch": 2460} {"train_loss": -44.20191192626953, "global_step": 297679, "epoch": 2460} {"train_loss": -42.7457160949707, "global_step": 297680, "epoch": 2460} {"train_loss": -44.29978561401367, "global_step": 297681, "epoch": 2460} {"train_loss": -44.06732177734375, "global_step": 297682, "epoch": 2460} {"train_loss": -43.952850341796875, "global_step": 297683, "epoch": 2460} {"train_loss": -44.06794738769531, "global_step": 297684, "epoch": 2460} {"train_loss": -43.90897750854492, "global_step": 297685, "epoch": 2460} {"train_loss": -43.79815673828125, "global_step": 297686, "epoch": 2460} {"train_loss": -43.770973205566406, "global_step": 297687, "epoch": 2460} {"train_loss": -44.22673034667969, "global_step": 297688, "epoch": 2460} {"train_loss": -43.912559509277344, "global_step": 297689, "epoch": 2460} {"train_loss": -44.47649002075195, "global_step": 297690, "epoch": 2460} {"train_loss": -44.32224655151367, "global_step": 297691, "epoch": 2460} {"train_loss": -43.775814056396484, "global_step": 297692, "epoch": 2460} {"train_loss": -43.703948974609375, "global_step": 297693, "epoch": 2460} {"train_loss": -44.05066680908203, "global_step": 297694, "epoch": 2460} {"train_loss": -43.32938003540039, "global_step": 297695, "epoch": 2460} {"train_loss": -43.3422737121582, "global_step": 297696, "epoch": 2460} {"train_loss": -44.29989242553711, "global_step": 297697, "epoch": 2460} {"train_loss": -43.5706672668457, "global_step": 297698, "epoch": 2460} {"train_loss": -42.994659423828125, "global_step": 297699, "epoch": 2460} {"train_loss": -41.045684814453125, "global_step": 297700, "epoch": 2460} {"train_loss": -43.003623962402344, "global_step": 297701, "epoch": 2460} {"train_loss": -41.85508728027344, "global_step": 297702, "epoch": 2460} {"train_loss": -42.43555450439453, "global_step": 297703, "epoch": 2460} {"train_loss": -43.51884078979492, "global_step": 297704, "epoch": 2460} {"train_loss": -43.059749603271484, "global_step": 297705, "epoch": 2460} {"train_loss": -40.82676315307617, "global_step": 297706, "epoch": 2460} {"train_loss": -39.2606315612793, "global_step": 297707, "epoch": 2460} {"train_loss": -40.45790100097656, "global_step": 297708, "epoch": 2460} {"train_loss": -41.65464401245117, "global_step": 297709, "epoch": 2460} {"train_loss": -42.73926544189453, "global_step": 297710, "epoch": 2460} {"train_loss": -43.202877044677734, "global_step": 297711, "epoch": 2460} {"train_loss": -41.52431106567383, "global_step": 297712, "epoch": 2460} {"train_loss": -41.8120002746582, "global_step": 297713, "epoch": 2460} {"train_loss": -42.608821868896484, "global_step": 297714, "epoch": 2460} {"train_loss": -42.7064094543457, "global_step": 297715, "epoch": 2460} {"train_loss": -42.8516731262207, "global_step": 297716, "epoch": 2460} {"train_loss": -42.52952194213867, "global_step": 297717, "epoch": 2460} {"train_loss": -42.310794830322266, "global_step": 297718, "epoch": 2460} {"train_loss": -39.770469665527344, "global_step": 297719, "epoch": 2460} {"train_loss": -41.94932174682617, "global_step": 297720, "epoch": 2460} {"train_loss": -41.52937698364258, "global_step": 297721, "epoch": 2460} {"train_loss": -43.5609016418457, "global_step": 297722, "epoch": 2460} {"train_loss": -40.90514373779297, "global_step": 297723, "epoch": 2460} {"train_loss": -43.326026916503906, "global_step": 297724, "epoch": 2460} {"train_loss": -42.371864318847656, "global_step": 297725, "epoch": 2460} {"train_loss": -42.44883346557617, "global_step": 297726, "epoch": 2460} {"train_loss": -42.12863540649414, "global_step": 297727, "epoch": 2460} {"train_loss": -43.162349700927734, "global_step": 297728, "epoch": 2460} {"train_loss": -41.92719650268555, "global_step": 297729, "epoch": 2460} {"train_loss": -40.0393180847168, "global_step": 297730, "epoch": 2460} {"train_loss": -42.941001892089844, "global_step": 297731, "epoch": 2460} {"train_loss": -41.39035415649414, "global_step": 297732, "epoch": 2460} {"train_loss": -43.2561149597168, "global_step": 297733, "epoch": 2460} {"train_loss": -42.946510314941406, "global_step": 297734, "epoch": 2460} {"train_loss": -40.792354583740234, "global_step": 297735, "epoch": 2460} {"train_loss": -43.354434967041016, "global_step": 297736, "epoch": 2460} {"train_loss": -40.136207580566406, "global_step": 297737, "epoch": 2460} {"train_loss": -43.27211380004883, "global_step": 297738, "epoch": 2460} {"train_loss": -42.08750534057617, "global_step": 297739, "epoch": 2460} {"train_loss": -42.10681915283203, "global_step": 297740, "epoch": 2460} {"train_loss": -43.16875457763672, "global_step": 297741, "epoch": 2460} {"train_loss": -42.482421875, "global_step": 297742, "epoch": 2460} {"train_loss": -42.89632034301758, "global_step": 297743, "epoch": 2460} {"train_loss": -44.07551193237305, "global_step": 297744, "epoch": 2460} {"train_loss": -42.549442291259766, "global_step": 297745, "epoch": 2460} {"train_loss": -42.657814025878906, "global_step": 297746, "epoch": 2460} {"train_loss": -44.0048713684082, "global_step": 297747, "epoch": 2460} {"train_loss": -42.42530059814453, "global_step": 297748, "epoch": 2460} {"train_loss": -43.494930267333984, "global_step": 297749, "epoch": 2460} {"train_loss": -44.18501663208008, "global_step": 297750, "epoch": 2460} {"train_loss": -43.45841979980469, "global_step": 297751, "epoch": 2460} {"train_loss": -43.885555267333984, "global_step": 297752, "epoch": 2460} {"train_loss": -43.4906005859375, "global_step": 297753, "epoch": 2460} {"train_loss": -44.183746337890625, "global_step": 297754, "epoch": 2460} {"train_loss": -43.610313415527344, "global_step": 297755, "epoch": 2460} {"train_loss": -42.24766159057617, "global_step": 297756, "epoch": 2460} {"train_loss": -44.16440963745117, "global_step": 297757, "epoch": 2460} {"train_loss": -44.53875732421875, "global_step": 297758, "epoch": 2460} {"train_loss": -44.163448333740234, "global_step": 297759, "epoch": 2460} {"train_loss": -44.42778396606445, "global_step": 297760, "epoch": 2460} {"train_loss": -44.059139251708984, "global_step": 297761, "epoch": 2460} {"train_loss": -44.3935661315918, "global_step": 297762, "epoch": 2460} {"train_loss": -44.60053253173828, "global_step": 297763, "epoch": 2460} {"train_loss": -43.52056884765625, "global_step": 297764, "epoch": 2460} {"train_loss": -44.63252639770508, "global_step": 297765, "epoch": 2460} {"train_loss": -44.20905685424805, "global_step": 297766, "epoch": 2460} {"train_loss": -44.38534164428711, "global_step": 297767, "epoch": 2460} {"train_loss": -44.27260208129883, "global_step": 297768, "epoch": 2460} {"train_loss": -44.37916946411133, "global_step": 297769, "epoch": 2460} {"train_loss": -43.97249984741211, "global_step": 297770, "epoch": 2460} {"train_loss": -44.51648712158203, "global_step": 297771, "epoch": 2460} {"train_loss": -44.77490997314453, "global_step": 297772, "epoch": 2460} {"train_loss": -44.23044204711914, "global_step": 297773, "epoch": 2460} {"train_loss": -44.75210952758789, "global_step": 297774, "epoch": 2460} {"train_loss": -44.20390701293945, "global_step": 297775, "epoch": 2460} {"train_loss": -44.30589294433594, "global_step": 297776, "epoch": 2460} {"train_loss": -44.666568756103516, "global_step": 297777, "epoch": 2460} {"train_loss": -44.31510543823242, "global_step": 297778, "epoch": 2460} {"train_loss": -44.51570510864258, "global_step": 297779, "epoch": 2460} {"train_loss": -43.25976821016674, "global_step": 297780, "epoch": 2460, "val_loss": 2584970.25} {"train_loss": -44.5334358215332, "global_step": 297781, "epoch": 2461} {"train_loss": -44.266143798828125, "global_step": 297782, "epoch": 2461} {"train_loss": -44.46906661987305, "global_step": 297783, "epoch": 2461} {"train_loss": -44.48743438720703, "global_step": 297784, "epoch": 2461} {"train_loss": -43.90195846557617, "global_step": 297785, "epoch": 2461} {"train_loss": -44.26398849487305, "global_step": 297786, "epoch": 2461} {"train_loss": -44.62066650390625, "global_step": 297787, "epoch": 2461} {"train_loss": -44.575225830078125, "global_step": 297788, "epoch": 2461} {"train_loss": -44.242401123046875, "global_step": 297789, "epoch": 2461} {"train_loss": -43.95044708251953, "global_step": 297790, "epoch": 2461} {"train_loss": -42.65465545654297, "global_step": 297791, "epoch": 2461} {"train_loss": -42.803199768066406, "global_step": 297792, "epoch": 2461} {"train_loss": -44.54280471801758, "global_step": 297793, "epoch": 2461} {"train_loss": -43.977413177490234, "global_step": 297794, "epoch": 2461} {"train_loss": -43.5020866394043, "global_step": 297795, "epoch": 2461} {"train_loss": -43.14753341674805, "global_step": 297796, "epoch": 2461} {"train_loss": -44.05758285522461, "global_step": 297797, "epoch": 2461} {"train_loss": -43.95496368408203, "global_step": 297798, "epoch": 2461} {"train_loss": -43.897865295410156, "global_step": 297799, "epoch": 2461} {"train_loss": -43.510433197021484, "global_step": 297800, "epoch": 2461} {"train_loss": -44.156734466552734, "global_step": 297801, "epoch": 2461} {"train_loss": -42.0504150390625, "global_step": 297802, "epoch": 2461} {"train_loss": -40.39735794067383, "global_step": 297803, "epoch": 2461} {"train_loss": -42.811458587646484, "global_step": 297804, "epoch": 2461} {"train_loss": -43.608116149902344, "global_step": 297805, "epoch": 2461} {"train_loss": -41.916812896728516, "global_step": 297806, "epoch": 2461} {"train_loss": -42.293861389160156, "global_step": 297807, "epoch": 2461} {"train_loss": -43.98956298828125, "global_step": 297808, "epoch": 2461} {"train_loss": -43.89240264892578, "global_step": 297809, "epoch": 2461} {"train_loss": -43.4578857421875, "global_step": 297810, "epoch": 2461} {"train_loss": -44.108184814453125, "global_step": 297811, "epoch": 2461} {"train_loss": -43.80772018432617, "global_step": 297812, "epoch": 2461} {"train_loss": -42.21299362182617, "global_step": 297813, "epoch": 2461} {"train_loss": -41.655635833740234, "global_step": 297814, "epoch": 2461} {"train_loss": -42.61503601074219, "global_step": 297815, "epoch": 2461} {"train_loss": -43.39984893798828, "global_step": 297816, "epoch": 2461} {"train_loss": -41.20417404174805, "global_step": 297817, "epoch": 2461} {"train_loss": -40.292091369628906, "global_step": 297818, "epoch": 2461} {"train_loss": -42.74851608276367, "global_step": 297819, "epoch": 2461} {"train_loss": -43.35809326171875, "global_step": 297820, "epoch": 2461} {"train_loss": -43.167877197265625, "global_step": 297821, "epoch": 2461} {"train_loss": -41.658912658691406, "global_step": 297822, "epoch": 2461} {"train_loss": -42.13460159301758, "global_step": 297823, "epoch": 2461} {"train_loss": -43.6959228515625, "global_step": 297824, "epoch": 2461} {"train_loss": -42.35688018798828, "global_step": 297825, "epoch": 2461} {"train_loss": -43.28528594970703, "global_step": 297826, "epoch": 2461} {"train_loss": -42.91544723510742, "global_step": 297827, "epoch": 2461} {"train_loss": -43.51003646850586, "global_step": 297828, "epoch": 2461} {"train_loss": -43.57169723510742, "global_step": 297829, "epoch": 2461} {"train_loss": -43.26713943481445, "global_step": 297830, "epoch": 2461} {"train_loss": -43.706764221191406, "global_step": 297831, "epoch": 2461} {"train_loss": -43.1598014831543, "global_step": 297832, "epoch": 2461} {"train_loss": -43.595794677734375, "global_step": 297833, "epoch": 2461} {"train_loss": -43.97156524658203, "global_step": 297834, "epoch": 2461} {"train_loss": -43.84745788574219, "global_step": 297835, "epoch": 2461} {"train_loss": -43.42469787597656, "global_step": 297836, "epoch": 2461} {"train_loss": -43.1448860168457, "global_step": 297837, "epoch": 2461} {"train_loss": -43.378944396972656, "global_step": 297838, "epoch": 2461} {"train_loss": -43.50230026245117, "global_step": 297839, "epoch": 2461} {"train_loss": -43.8420524597168, "global_step": 297840, "epoch": 2461} {"train_loss": -42.853607177734375, "global_step": 297841, "epoch": 2461} {"train_loss": -43.9288444519043, "global_step": 297842, "epoch": 2461} {"train_loss": -42.79740524291992, "global_step": 297843, "epoch": 2461} {"train_loss": -43.3368034362793, "global_step": 297844, "epoch": 2461} {"train_loss": -44.57548904418945, "global_step": 297845, "epoch": 2461} {"train_loss": -43.37797164916992, "global_step": 297846, "epoch": 2461} {"train_loss": -43.15826416015625, "global_step": 297847, "epoch": 2461} {"train_loss": -43.25413131713867, "global_step": 297848, "epoch": 2461} {"train_loss": -43.748104095458984, "global_step": 297849, "epoch": 2461} {"train_loss": -43.55507278442383, "global_step": 297850, "epoch": 2461} {"train_loss": -43.5225944519043, "global_step": 297851, "epoch": 2461} {"train_loss": -43.946956634521484, "global_step": 297852, "epoch": 2461} {"train_loss": -43.15232467651367, "global_step": 297853, "epoch": 2461} {"train_loss": -44.1756706237793, "global_step": 297854, "epoch": 2461} {"train_loss": -43.94724655151367, "global_step": 297855, "epoch": 2461} {"train_loss": -43.43388748168945, "global_step": 297856, "epoch": 2461} {"train_loss": -43.59001541137695, "global_step": 297857, "epoch": 2461} {"train_loss": -43.58585739135742, "global_step": 297858, "epoch": 2461} {"train_loss": -43.55595397949219, "global_step": 297859, "epoch": 2461} {"train_loss": -44.178924560546875, "global_step": 297860, "epoch": 2461} {"train_loss": -43.620357513427734, "global_step": 297861, "epoch": 2461} {"train_loss": -43.96916580200195, "global_step": 297862, "epoch": 2461} {"train_loss": -43.602577209472656, "global_step": 297863, "epoch": 2461} {"train_loss": -43.92369079589844, "global_step": 297864, "epoch": 2461} {"train_loss": -42.83131790161133, "global_step": 297865, "epoch": 2461} {"train_loss": -42.95155715942383, "global_step": 297866, "epoch": 2461} {"train_loss": -43.662330627441406, "global_step": 297867, "epoch": 2461} {"train_loss": -43.53159713745117, "global_step": 297868, "epoch": 2461} {"train_loss": -42.75985336303711, "global_step": 297869, "epoch": 2461} {"train_loss": -42.245826721191406, "global_step": 297870, "epoch": 2461} {"train_loss": -42.928558349609375, "global_step": 297871, "epoch": 2461} {"train_loss": -42.52462387084961, "global_step": 297872, "epoch": 2461} {"train_loss": -41.925350189208984, "global_step": 297873, "epoch": 2461} {"train_loss": -44.142452239990234, "global_step": 297874, "epoch": 2461} {"train_loss": -43.100830078125, "global_step": 297875, "epoch": 2461} {"train_loss": -42.343048095703125, "global_step": 297876, "epoch": 2461} {"train_loss": -42.73094940185547, "global_step": 297877, "epoch": 2461} {"train_loss": -41.35783004760742, "global_step": 297878, "epoch": 2461} {"train_loss": -43.076568603515625, "global_step": 297879, "epoch": 2461} {"train_loss": -40.78443145751953, "global_step": 297880, "epoch": 2461} {"train_loss": -40.43115234375, "global_step": 297881, "epoch": 2461} {"train_loss": -41.41619873046875, "global_step": 297882, "epoch": 2461} {"train_loss": -41.59737777709961, "global_step": 297883, "epoch": 2461} {"train_loss": -42.458980560302734, "global_step": 297884, "epoch": 2461} {"train_loss": -41.16868591308594, "global_step": 297885, "epoch": 2461} {"train_loss": -43.169677734375, "global_step": 297886, "epoch": 2461} {"train_loss": -42.649776458740234, "global_step": 297887, "epoch": 2461} {"train_loss": -42.481746673583984, "global_step": 297888, "epoch": 2461} {"train_loss": -44.012733459472656, "global_step": 297889, "epoch": 2461} {"train_loss": -42.4491081237793, "global_step": 297890, "epoch": 2461} {"train_loss": -44.003814697265625, "global_step": 297891, "epoch": 2461} {"train_loss": -43.36166000366211, "global_step": 297892, "epoch": 2461} {"train_loss": -43.598480224609375, "global_step": 297893, "epoch": 2461} {"train_loss": -43.66254806518555, "global_step": 297894, "epoch": 2461} {"train_loss": -42.83072280883789, "global_step": 297895, "epoch": 2461} {"train_loss": -43.60321044921875, "global_step": 297896, "epoch": 2461} {"train_loss": -43.53229904174805, "global_step": 297897, "epoch": 2461} {"train_loss": -44.09592819213867, "global_step": 297898, "epoch": 2461} {"train_loss": -42.645565032958984, "global_step": 297899, "epoch": 2461} {"train_loss": -43.93203353881836, "global_step": 297900, "epoch": 2461} {"train_loss": -43.21135327047553, "global_step": 297901, "epoch": 2461, "val_loss": 2587266.0} {"train_loss": -44.28403854370117, "global_step": 297902, "epoch": 2462} {"train_loss": -43.79659652709961, "global_step": 297903, "epoch": 2462} {"train_loss": -44.42018508911133, "global_step": 297904, "epoch": 2462} {"train_loss": -44.395545959472656, "global_step": 297905, "epoch": 2462} {"train_loss": -44.166500091552734, "global_step": 297906, "epoch": 2462} {"train_loss": -43.992252349853516, "global_step": 297907, "epoch": 2462} {"train_loss": -44.53195571899414, "global_step": 297908, "epoch": 2462} {"train_loss": -44.2285270690918, "global_step": 297909, "epoch": 2462} {"train_loss": -44.17558670043945, "global_step": 297910, "epoch": 2462} {"train_loss": -44.748634338378906, "global_step": 297911, "epoch": 2462} {"train_loss": -44.2893180847168, "global_step": 297912, "epoch": 2462} {"train_loss": -44.58921813964844, "global_step": 297913, "epoch": 2462} {"train_loss": -44.738582611083984, "global_step": 297914, "epoch": 2462} {"train_loss": -44.32435989379883, "global_step": 297915, "epoch": 2462} {"train_loss": -44.58600997924805, "global_step": 297916, "epoch": 2462} {"train_loss": -44.530765533447266, "global_step": 297917, "epoch": 2462} {"train_loss": -44.54121017456055, "global_step": 297918, "epoch": 2462} {"train_loss": -44.70817184448242, "global_step": 297919, "epoch": 2462} {"train_loss": -44.26079177856445, "global_step": 297920, "epoch": 2462} {"train_loss": -44.17966842651367, "global_step": 297921, "epoch": 2462} {"train_loss": -44.092994689941406, "global_step": 297922, "epoch": 2462} {"train_loss": -44.30306625366211, "global_step": 297923, "epoch": 2462} {"train_loss": -44.29897689819336, "global_step": 297924, "epoch": 2462} {"train_loss": -44.870662689208984, "global_step": 297925, "epoch": 2462} {"train_loss": -44.35478210449219, "global_step": 297926, "epoch": 2462} {"train_loss": -44.808006286621094, "global_step": 297927, "epoch": 2462} {"train_loss": -44.2072639465332, "global_step": 297928, "epoch": 2462} {"train_loss": -43.97414779663086, "global_step": 297929, "epoch": 2462} {"train_loss": -44.377471923828125, "global_step": 297930, "epoch": 2462} {"train_loss": -43.742122650146484, "global_step": 297931, "epoch": 2462} {"train_loss": -44.199764251708984, "global_step": 297932, "epoch": 2462} {"train_loss": -43.576385498046875, "global_step": 297933, "epoch": 2462} {"train_loss": -43.91324234008789, "global_step": 297934, "epoch": 2462} {"train_loss": -43.13966751098633, "global_step": 297935, "epoch": 2462} {"train_loss": -43.69284439086914, "global_step": 297936, "epoch": 2462} {"train_loss": -42.614410400390625, "global_step": 297937, "epoch": 2462} {"train_loss": -43.477054595947266, "global_step": 297938, "epoch": 2462} {"train_loss": -44.25065994262695, "global_step": 297939, "epoch": 2462} {"train_loss": -41.4916877746582, "global_step": 297940, "epoch": 2462} {"train_loss": -43.6876106262207, "global_step": 297941, "epoch": 2462} {"train_loss": -39.71236801147461, "global_step": 297942, "epoch": 2462} {"train_loss": -42.78517532348633, "global_step": 297943, "epoch": 2462} {"train_loss": -39.7066535949707, "global_step": 297944, "epoch": 2462} {"train_loss": -42.00080490112305, "global_step": 297945, "epoch": 2462} {"train_loss": -42.15455627441406, "global_step": 297946, "epoch": 2462} {"train_loss": -42.44703674316406, "global_step": 297947, "epoch": 2462} {"train_loss": -39.7359504699707, "global_step": 297948, "epoch": 2462} {"train_loss": -39.64887619018555, "global_step": 297949, "epoch": 2462} {"train_loss": -40.4443473815918, "global_step": 297950, "epoch": 2462} {"train_loss": -42.91597366333008, "global_step": 297951, "epoch": 2462} {"train_loss": -41.86701965332031, "global_step": 297952, "epoch": 2462} {"train_loss": -43.46253204345703, "global_step": 297953, "epoch": 2462} {"train_loss": -41.37874984741211, "global_step": 297954, "epoch": 2462} {"train_loss": -43.12522506713867, "global_step": 297955, "epoch": 2462} {"train_loss": -43.54006576538086, "global_step": 297956, "epoch": 2462} {"train_loss": -43.06687545776367, "global_step": 297957, "epoch": 2462} {"train_loss": -43.05727767944336, "global_step": 297958, "epoch": 2462} {"train_loss": -44.388614654541016, "global_step": 297959, "epoch": 2462} {"train_loss": -43.646873474121094, "global_step": 297960, "epoch": 2462} {"train_loss": -42.83528518676758, "global_step": 297961, "epoch": 2462} {"train_loss": -43.714149475097656, "global_step": 297962, "epoch": 2462} {"train_loss": -43.674560546875, "global_step": 297963, "epoch": 2462} {"train_loss": -42.418575286865234, "global_step": 297964, "epoch": 2462} {"train_loss": -40.31852722167969, "global_step": 297965, "epoch": 2462} {"train_loss": -42.99221420288086, "global_step": 297966, "epoch": 2462} {"train_loss": -43.34907913208008, "global_step": 297967, "epoch": 2462} {"train_loss": -41.95747756958008, "global_step": 297968, "epoch": 2462} {"train_loss": -42.540489196777344, "global_step": 297969, "epoch": 2462} {"train_loss": -43.76213455200195, "global_step": 297970, "epoch": 2462} {"train_loss": -43.4903564453125, "global_step": 297971, "epoch": 2462} {"train_loss": -42.7907600402832, "global_step": 297972, "epoch": 2462} {"train_loss": -43.28266525268555, "global_step": 297973, "epoch": 2462} {"train_loss": -44.289642333984375, "global_step": 297974, "epoch": 2462} {"train_loss": -42.5692024230957, "global_step": 297975, "epoch": 2462} {"train_loss": -43.857337951660156, "global_step": 297976, "epoch": 2462} {"train_loss": -44.02166748046875, "global_step": 297977, "epoch": 2462} {"train_loss": -43.41769027709961, "global_step": 297978, "epoch": 2462} {"train_loss": -43.91483688354492, "global_step": 297979, "epoch": 2462} {"train_loss": -44.24935531616211, "global_step": 297980, "epoch": 2462} {"train_loss": -44.36796188354492, "global_step": 297981, "epoch": 2462} {"train_loss": -43.59850311279297, "global_step": 297982, "epoch": 2462} {"train_loss": -43.98981857299805, "global_step": 297983, "epoch": 2462} {"train_loss": -44.22599792480469, "global_step": 297984, "epoch": 2462} {"train_loss": -43.9054069519043, "global_step": 297985, "epoch": 2462} {"train_loss": -44.191162109375, "global_step": 297986, "epoch": 2462} {"train_loss": -44.31990432739258, "global_step": 297987, "epoch": 2462} {"train_loss": -44.19424057006836, "global_step": 297988, "epoch": 2462} {"train_loss": -44.18864059448242, "global_step": 297989, "epoch": 2462} {"train_loss": -44.390296936035156, "global_step": 297990, "epoch": 2462} {"train_loss": -44.17319869995117, "global_step": 297991, "epoch": 2462} {"train_loss": -44.413734436035156, "global_step": 297992, "epoch": 2462} {"train_loss": -44.11930465698242, "global_step": 297993, "epoch": 2462} {"train_loss": -43.935401916503906, "global_step": 297994, "epoch": 2462} {"train_loss": -44.116146087646484, "global_step": 297995, "epoch": 2462} {"train_loss": -44.55184555053711, "global_step": 297996, "epoch": 2462} {"train_loss": -44.53001022338867, "global_step": 297997, "epoch": 2462} {"train_loss": -44.908199310302734, "global_step": 297998, "epoch": 2462} {"train_loss": -44.3523063659668, "global_step": 297999, "epoch": 2462} {"train_loss": -44.51509094238281, "global_step": 298000, "epoch": 2462} {"train_loss": -44.377174377441406, "global_step": 298001, "epoch": 2462} {"train_loss": -44.74325180053711, "global_step": 298002, "epoch": 2462} {"train_loss": -44.41284942626953, "global_step": 298003, "epoch": 2462} {"train_loss": -44.01036834716797, "global_step": 298004, "epoch": 2462} {"train_loss": -44.65367126464844, "global_step": 298005, "epoch": 2462} {"train_loss": -44.9797248840332, "global_step": 298006, "epoch": 2462} {"train_loss": -44.632442474365234, "global_step": 298007, "epoch": 2462} {"train_loss": -44.741432189941406, "global_step": 298008, "epoch": 2462} {"train_loss": -44.61591720581055, "global_step": 298009, "epoch": 2462} {"train_loss": -44.43104934692383, "global_step": 298010, "epoch": 2462} {"train_loss": -44.6601448059082, "global_step": 298011, "epoch": 2462} {"train_loss": -45.19868850708008, "global_step": 298012, "epoch": 2462} {"train_loss": -44.91108322143555, "global_step": 298013, "epoch": 2462} {"train_loss": -44.649024963378906, "global_step": 298014, "epoch": 2462} {"train_loss": -45.16146469116211, "global_step": 298015, "epoch": 2462} {"train_loss": -44.11897659301758, "global_step": 298016, "epoch": 2462} {"train_loss": -43.72783279418945, "global_step": 298017, "epoch": 2462} {"train_loss": -44.645809173583984, "global_step": 298018, "epoch": 2462} {"train_loss": -45.20513916015625, "global_step": 298019, "epoch": 2462} {"train_loss": -44.41171646118164, "global_step": 298020, "epoch": 2462} {"train_loss": -43.90031051635742, "global_step": 298021, "epoch": 2462} {"train_loss": -43.73648582017126, "global_step": 298022, "epoch": 2462, "val_loss": 2655932.25} {"train_loss": -44.37758255004883, "global_step": 298023, "epoch": 2463} {"train_loss": -44.4774055480957, "global_step": 298024, "epoch": 2463} {"train_loss": -44.419769287109375, "global_step": 298025, "epoch": 2463} {"train_loss": -44.35810470581055, "global_step": 298026, "epoch": 2463} {"train_loss": -43.865325927734375, "global_step": 298027, "epoch": 2463} {"train_loss": -41.61981964111328, "global_step": 298028, "epoch": 2463} {"train_loss": -39.28971481323242, "global_step": 298029, "epoch": 2463} {"train_loss": -38.990699768066406, "global_step": 298030, "epoch": 2463} {"train_loss": -40.299781799316406, "global_step": 298031, "epoch": 2463} {"train_loss": -43.58415603637695, "global_step": 298032, "epoch": 2463} {"train_loss": -38.42333984375, "global_step": 298033, "epoch": 2463} {"train_loss": -36.2635383605957, "global_step": 298034, "epoch": 2463} {"train_loss": -39.15098571777344, "global_step": 298035, "epoch": 2463} {"train_loss": -38.35517501831055, "global_step": 298036, "epoch": 2463} {"train_loss": -38.68994903564453, "global_step": 298037, "epoch": 2463} {"train_loss": -37.71268844604492, "global_step": 298038, "epoch": 2463} {"train_loss": -40.39310836791992, "global_step": 298039, "epoch": 2463} {"train_loss": -36.72582244873047, "global_step": 298040, "epoch": 2463} {"train_loss": -41.618831634521484, "global_step": 298041, "epoch": 2463} {"train_loss": -37.72744369506836, "global_step": 298042, "epoch": 2463} {"train_loss": -35.1456184387207, "global_step": 298043, "epoch": 2463} {"train_loss": -41.54133605957031, "global_step": 298044, "epoch": 2463} {"train_loss": -39.794918060302734, "global_step": 298045, "epoch": 2463} {"train_loss": -39.77383041381836, "global_step": 298046, "epoch": 2463} {"train_loss": -41.1352653503418, "global_step": 298047, "epoch": 2463} {"train_loss": -40.545509338378906, "global_step": 298048, "epoch": 2463} {"train_loss": -40.79743576049805, "global_step": 298049, "epoch": 2463} {"train_loss": -40.8399658203125, "global_step": 298050, "epoch": 2463} {"train_loss": -41.62312316894531, "global_step": 298051, "epoch": 2463} {"train_loss": -40.233978271484375, "global_step": 298052, "epoch": 2463} {"train_loss": -41.80196762084961, "global_step": 298053, "epoch": 2463} {"train_loss": -41.045413970947266, "global_step": 298054, "epoch": 2463} {"train_loss": -42.6002082824707, "global_step": 298055, "epoch": 2463} {"train_loss": -42.31507110595703, "global_step": 298056, "epoch": 2463} {"train_loss": -42.410560607910156, "global_step": 298057, "epoch": 2463} {"train_loss": -42.175838470458984, "global_step": 298058, "epoch": 2463} {"train_loss": -42.80097579956055, "global_step": 298059, "epoch": 2463} {"train_loss": -42.73138427734375, "global_step": 298060, "epoch": 2463} {"train_loss": -42.60308074951172, "global_step": 298061, "epoch": 2463} {"train_loss": -42.69839096069336, "global_step": 298062, "epoch": 2463} {"train_loss": -42.845619201660156, "global_step": 298063, "epoch": 2463} {"train_loss": -43.31288146972656, "global_step": 298064, "epoch": 2463} {"train_loss": -42.93041229248047, "global_step": 298065, "epoch": 2463} {"train_loss": -43.342079162597656, "global_step": 298066, "epoch": 2463} {"train_loss": -43.151615142822266, "global_step": 298067, "epoch": 2463} {"train_loss": -43.27849197387695, "global_step": 298068, "epoch": 2463} {"train_loss": -43.65194320678711, "global_step": 298069, "epoch": 2463} {"train_loss": -43.45719528198242, "global_step": 298070, "epoch": 2463} {"train_loss": -43.459877014160156, "global_step": 298071, "epoch": 2463} {"train_loss": -43.31663131713867, "global_step": 298072, "epoch": 2463} {"train_loss": -43.19339370727539, "global_step": 298073, "epoch": 2463} {"train_loss": -43.551422119140625, "global_step": 298074, "epoch": 2463} {"train_loss": -43.723506927490234, "global_step": 298075, "epoch": 2463} {"train_loss": -43.75715255737305, "global_step": 298076, "epoch": 2463} {"train_loss": -43.335391998291016, "global_step": 298077, "epoch": 2463} {"train_loss": -43.99409103393555, "global_step": 298078, "epoch": 2463} {"train_loss": -43.28664016723633, "global_step": 298079, "epoch": 2463} {"train_loss": -44.201053619384766, "global_step": 298080, "epoch": 2463} {"train_loss": -43.25834274291992, "global_step": 298081, "epoch": 2463} {"train_loss": -43.8645133972168, "global_step": 298082, "epoch": 2463} {"train_loss": -43.45560073852539, "global_step": 298083, "epoch": 2463} {"train_loss": -42.971256256103516, "global_step": 298084, "epoch": 2463} {"train_loss": -43.4813346862793, "global_step": 298085, "epoch": 2463} {"train_loss": -43.04604721069336, "global_step": 298086, "epoch": 2463} {"train_loss": -43.90302658081055, "global_step": 298087, "epoch": 2463} {"train_loss": -43.43196105957031, "global_step": 298088, "epoch": 2463} {"train_loss": -43.5901985168457, "global_step": 298089, "epoch": 2463} {"train_loss": -43.58750534057617, "global_step": 298090, "epoch": 2463} {"train_loss": -43.4693603515625, "global_step": 298091, "epoch": 2463} {"train_loss": -44.203025817871094, "global_step": 298092, "epoch": 2463} {"train_loss": -43.39992904663086, "global_step": 298093, "epoch": 2463} {"train_loss": -44.110328674316406, "global_step": 298094, "epoch": 2463} {"train_loss": -43.59270477294922, "global_step": 298095, "epoch": 2463} {"train_loss": -44.35293197631836, "global_step": 298096, "epoch": 2463} {"train_loss": -43.57780456542969, "global_step": 298097, "epoch": 2463} {"train_loss": -43.87233352661133, "global_step": 298098, "epoch": 2463} {"train_loss": -44.273502349853516, "global_step": 298099, "epoch": 2463} {"train_loss": -43.46944046020508, "global_step": 298100, "epoch": 2463} {"train_loss": -44.68407440185547, "global_step": 298101, "epoch": 2463} {"train_loss": -43.5340461730957, "global_step": 298102, "epoch": 2463} {"train_loss": -43.303932189941406, "global_step": 298103, "epoch": 2463} {"train_loss": -44.04316329956055, "global_step": 298104, "epoch": 2463} {"train_loss": -43.476112365722656, "global_step": 298105, "epoch": 2463} {"train_loss": -44.3848991394043, "global_step": 298106, "epoch": 2463} {"train_loss": -43.10133361816406, "global_step": 298107, "epoch": 2463} {"train_loss": -43.98490524291992, "global_step": 298108, "epoch": 2463} {"train_loss": -43.915496826171875, "global_step": 298109, "epoch": 2463} {"train_loss": -42.972412109375, "global_step": 298110, "epoch": 2463} {"train_loss": -43.629150390625, "global_step": 298111, "epoch": 2463} {"train_loss": -44.3421630859375, "global_step": 298112, "epoch": 2463} {"train_loss": -43.6866569519043, "global_step": 298113, "epoch": 2463} {"train_loss": -44.27874755859375, "global_step": 298114, "epoch": 2463} {"train_loss": -44.43586349487305, "global_step": 298115, "epoch": 2463} {"train_loss": -43.5971794128418, "global_step": 298116, "epoch": 2463} {"train_loss": -44.17833709716797, "global_step": 298117, "epoch": 2463} {"train_loss": -44.332820892333984, "global_step": 298118, "epoch": 2463} {"train_loss": -43.88917922973633, "global_step": 298119, "epoch": 2463} {"train_loss": -43.66986083984375, "global_step": 298120, "epoch": 2463} {"train_loss": -44.366416931152344, "global_step": 298121, "epoch": 2463} {"train_loss": -44.33758544921875, "global_step": 298122, "epoch": 2463} {"train_loss": -44.60818099975586, "global_step": 298123, "epoch": 2463} {"train_loss": -43.8490104675293, "global_step": 298124, "epoch": 2463} {"train_loss": -44.92018508911133, "global_step": 298125, "epoch": 2463} {"train_loss": -44.70719528198242, "global_step": 298126, "epoch": 2463} {"train_loss": -44.53115463256836, "global_step": 298127, "epoch": 2463} {"train_loss": -44.87398910522461, "global_step": 298128, "epoch": 2463} {"train_loss": -44.747352600097656, "global_step": 298129, "epoch": 2463} {"train_loss": -44.9460563659668, "global_step": 298130, "epoch": 2463} {"train_loss": -44.29697799682617, "global_step": 298131, "epoch": 2463} {"train_loss": -44.68798828125, "global_step": 298132, "epoch": 2463} {"train_loss": -44.466304779052734, "global_step": 298133, "epoch": 2463} {"train_loss": -44.92330551147461, "global_step": 298134, "epoch": 2463} {"train_loss": -44.2348518371582, "global_step": 298135, "epoch": 2463} {"train_loss": -43.843204498291016, "global_step": 298136, "epoch": 2463} {"train_loss": -44.74876022338867, "global_step": 298137, "epoch": 2463} {"train_loss": -44.82571029663086, "global_step": 298138, "epoch": 2463} {"train_loss": -44.64197540283203, "global_step": 298139, "epoch": 2463} {"train_loss": -44.695068359375, "global_step": 298140, "epoch": 2463} {"train_loss": -44.8614387512207, "global_step": 298141, "epoch": 2463} {"train_loss": -44.97951126098633, "global_step": 298142, "epoch": 2463} {"train_loss": -42.91787804847907, "global_step": 298143, "epoch": 2463, "val_loss": 2588525.75} {"train_loss": -44.12748336791992, "global_step": 298144, "epoch": 2464} {"train_loss": -44.84272384643555, "global_step": 298145, "epoch": 2464} {"train_loss": -44.82448959350586, "global_step": 298146, "epoch": 2464} {"train_loss": -44.8327522277832, "global_step": 298147, "epoch": 2464} {"train_loss": -44.957149505615234, "global_step": 298148, "epoch": 2464} {"train_loss": -44.25914001464844, "global_step": 298149, "epoch": 2464} {"train_loss": -44.19301986694336, "global_step": 298150, "epoch": 2464} {"train_loss": -44.787147521972656, "global_step": 298151, "epoch": 2464} {"train_loss": -44.28387451171875, "global_step": 298152, "epoch": 2464} {"train_loss": -44.5436897277832, "global_step": 298153, "epoch": 2464} {"train_loss": -44.65724563598633, "global_step": 298154, "epoch": 2464} {"train_loss": -44.698429107666016, "global_step": 298155, "epoch": 2464} {"train_loss": -44.10947799682617, "global_step": 298156, "epoch": 2464} {"train_loss": -44.68037796020508, "global_step": 298157, "epoch": 2464} {"train_loss": -45.00089645385742, "global_step": 298158, "epoch": 2464} {"train_loss": -43.51261901855469, "global_step": 298159, "epoch": 2464} {"train_loss": -44.09922409057617, "global_step": 298160, "epoch": 2464} {"train_loss": -43.728736877441406, "global_step": 298161, "epoch": 2464} {"train_loss": -43.196876525878906, "global_step": 298162, "epoch": 2464} {"train_loss": -42.749603271484375, "global_step": 298163, "epoch": 2464} {"train_loss": -43.4793815612793, "global_step": 298164, "epoch": 2464} {"train_loss": -43.559844970703125, "global_step": 298165, "epoch": 2464} {"train_loss": -43.22976303100586, "global_step": 298166, "epoch": 2464} {"train_loss": -43.447505950927734, "global_step": 298167, "epoch": 2464} {"train_loss": -42.603824615478516, "global_step": 298168, "epoch": 2464} {"train_loss": -40.72028732299805, "global_step": 298169, "epoch": 2464} {"train_loss": -42.50338363647461, "global_step": 298170, "epoch": 2464} {"train_loss": -43.792816162109375, "global_step": 298171, "epoch": 2464} {"train_loss": -36.97257614135742, "global_step": 298172, "epoch": 2464} {"train_loss": -38.35523223876953, "global_step": 298173, "epoch": 2464} {"train_loss": -41.50336456298828, "global_step": 298174, "epoch": 2464} {"train_loss": -38.70616912841797, "global_step": 298175, "epoch": 2464} {"train_loss": -38.79769515991211, "global_step": 298176, "epoch": 2464} {"train_loss": -41.40550231933594, "global_step": 298177, "epoch": 2464} {"train_loss": -41.75956344604492, "global_step": 298178, "epoch": 2464} {"train_loss": -40.03791427612305, "global_step": 298179, "epoch": 2464} {"train_loss": -40.673988342285156, "global_step": 298180, "epoch": 2464} {"train_loss": -42.72099685668945, "global_step": 298181, "epoch": 2464} {"train_loss": -40.25183868408203, "global_step": 298182, "epoch": 2464} {"train_loss": -39.3624153137207, "global_step": 298183, "epoch": 2464} {"train_loss": -41.85706329345703, "global_step": 298184, "epoch": 2464} {"train_loss": -42.20890808105469, "global_step": 298185, "epoch": 2464} {"train_loss": -40.54151153564453, "global_step": 298186, "epoch": 2464} {"train_loss": -42.67573928833008, "global_step": 298187, "epoch": 2464} {"train_loss": -42.95136260986328, "global_step": 298188, "epoch": 2464} {"train_loss": -41.90694808959961, "global_step": 298189, "epoch": 2464} {"train_loss": -42.58320236206055, "global_step": 298190, "epoch": 2464} {"train_loss": -42.61590576171875, "global_step": 298191, "epoch": 2464} {"train_loss": -42.60696029663086, "global_step": 298192, "epoch": 2464} {"train_loss": -43.010292053222656, "global_step": 298193, "epoch": 2464} {"train_loss": -43.5217399597168, "global_step": 298194, "epoch": 2464} {"train_loss": -43.02260971069336, "global_step": 298195, "epoch": 2464} {"train_loss": -43.10325241088867, "global_step": 298196, "epoch": 2464} {"train_loss": -43.44564437866211, "global_step": 298197, "epoch": 2464} {"train_loss": -43.35688400268555, "global_step": 298198, "epoch": 2464} {"train_loss": -44.2930908203125, "global_step": 298199, "epoch": 2464} {"train_loss": -43.01205825805664, "global_step": 298200, "epoch": 2464} {"train_loss": -43.29914474487305, "global_step": 298201, "epoch": 2464} {"train_loss": -43.94710159301758, "global_step": 298202, "epoch": 2464} {"train_loss": -42.71799850463867, "global_step": 298203, "epoch": 2464} {"train_loss": -44.571441650390625, "global_step": 298204, "epoch": 2464} {"train_loss": -43.47111129760742, "global_step": 298205, "epoch": 2464} {"train_loss": -44.061702728271484, "global_step": 298206, "epoch": 2464} {"train_loss": -43.427738189697266, "global_step": 298207, "epoch": 2464} {"train_loss": -43.736854553222656, "global_step": 298208, "epoch": 2464} {"train_loss": -43.501888275146484, "global_step": 298209, "epoch": 2464} {"train_loss": -43.73527908325195, "global_step": 298210, "epoch": 2464} {"train_loss": -43.64626693725586, "global_step": 298211, "epoch": 2464} {"train_loss": -43.954017639160156, "global_step": 298212, "epoch": 2464} {"train_loss": -44.07710647583008, "global_step": 298213, "epoch": 2464} {"train_loss": -43.483863830566406, "global_step": 298214, "epoch": 2464} {"train_loss": -43.432254791259766, "global_step": 298215, "epoch": 2464} {"train_loss": -43.89365768432617, "global_step": 298216, "epoch": 2464} {"train_loss": -43.95174789428711, "global_step": 298217, "epoch": 2464} {"train_loss": -44.02431869506836, "global_step": 298218, "epoch": 2464} {"train_loss": -44.19819259643555, "global_step": 298219, "epoch": 2464} {"train_loss": -44.21137619018555, "global_step": 298220, "epoch": 2464} {"train_loss": -43.8616943359375, "global_step": 298221, "epoch": 2464} {"train_loss": -43.2677116394043, "global_step": 298222, "epoch": 2464} {"train_loss": -44.076416015625, "global_step": 298223, "epoch": 2464} {"train_loss": -44.08632278442383, "global_step": 298224, "epoch": 2464} {"train_loss": -44.32062911987305, "global_step": 298225, "epoch": 2464} {"train_loss": -44.36880111694336, "global_step": 298226, "epoch": 2464} {"train_loss": -44.01321792602539, "global_step": 298227, "epoch": 2464} {"train_loss": -44.08062744140625, "global_step": 298228, "epoch": 2464} {"train_loss": -44.724178314208984, "global_step": 298229, "epoch": 2464} {"train_loss": -44.31417465209961, "global_step": 298230, "epoch": 2464} {"train_loss": -44.531982421875, "global_step": 298231, "epoch": 2464} {"train_loss": -44.601802825927734, "global_step": 298232, "epoch": 2464} {"train_loss": -44.7431526184082, "global_step": 298233, "epoch": 2464} {"train_loss": -44.875301361083984, "global_step": 298234, "epoch": 2464} {"train_loss": -44.7507209777832, "global_step": 298235, "epoch": 2464} {"train_loss": -44.7232666015625, "global_step": 298236, "epoch": 2464} {"train_loss": -44.28451156616211, "global_step": 298237, "epoch": 2464} {"train_loss": -44.54935836791992, "global_step": 298238, "epoch": 2464} {"train_loss": -44.83482360839844, "global_step": 298239, "epoch": 2464} {"train_loss": -44.824005126953125, "global_step": 298240, "epoch": 2464} {"train_loss": -44.957054138183594, "global_step": 298241, "epoch": 2464} {"train_loss": -44.92231750488281, "global_step": 298242, "epoch": 2464} {"train_loss": -44.53411865234375, "global_step": 298243, "epoch": 2464} {"train_loss": -44.980918884277344, "global_step": 298244, "epoch": 2464} {"train_loss": -44.535369873046875, "global_step": 298245, "epoch": 2464} {"train_loss": -45.09608840942383, "global_step": 298246, "epoch": 2464} {"train_loss": -45.09443283081055, "global_step": 298247, "epoch": 2464} {"train_loss": -43.887630462646484, "global_step": 298248, "epoch": 2464} {"train_loss": -44.58362579345703, "global_step": 298249, "epoch": 2464} {"train_loss": -45.20502471923828, "global_step": 298250, "epoch": 2464} {"train_loss": -44.90277099609375, "global_step": 298251, "epoch": 2464} {"train_loss": -45.42385482788086, "global_step": 298252, "epoch": 2464} {"train_loss": -44.86983108520508, "global_step": 298253, "epoch": 2464} {"train_loss": -44.7711067199707, "global_step": 298254, "epoch": 2464} {"train_loss": -44.182029724121094, "global_step": 298255, "epoch": 2464} {"train_loss": -44.464664459228516, "global_step": 298256, "epoch": 2464} {"train_loss": -45.09926986694336, "global_step": 298257, "epoch": 2464} {"train_loss": -45.10411834716797, "global_step": 298258, "epoch": 2464} {"train_loss": -44.31582260131836, "global_step": 298259, "epoch": 2464} {"train_loss": -42.13146209716797, "global_step": 298260, "epoch": 2464} {"train_loss": -41.2439079284668, "global_step": 298261, "epoch": 2464} {"train_loss": -41.77786636352539, "global_step": 298262, "epoch": 2464} {"train_loss": -44.4892692565918, "global_step": 298263, "epoch": 2464} {"train_loss": -43.49060969707394, "global_step": 298264, "epoch": 2464, "val_loss": 2680199.0} {"train_loss": -42.01885986328125, "global_step": 298265, "epoch": 2465} {"train_loss": -42.7473258972168, "global_step": 298266, "epoch": 2465} {"train_loss": -42.04518508911133, "global_step": 298267, "epoch": 2465} {"train_loss": -43.28489685058594, "global_step": 298268, "epoch": 2465} {"train_loss": -43.122779846191406, "global_step": 298269, "epoch": 2465} {"train_loss": -41.329280853271484, "global_step": 298270, "epoch": 2465} {"train_loss": -43.3361930847168, "global_step": 298271, "epoch": 2465} {"train_loss": -42.03876495361328, "global_step": 298272, "epoch": 2465} {"train_loss": -41.62904739379883, "global_step": 298273, "epoch": 2465} {"train_loss": -41.849998474121094, "global_step": 298274, "epoch": 2465} {"train_loss": -40.80347442626953, "global_step": 298275, "epoch": 2465} {"train_loss": -43.361083984375, "global_step": 298276, "epoch": 2465} {"train_loss": -42.95820236206055, "global_step": 298277, "epoch": 2465} {"train_loss": -42.0069580078125, "global_step": 298278, "epoch": 2465} {"train_loss": -42.122039794921875, "global_step": 298279, "epoch": 2465} {"train_loss": -42.0286865234375, "global_step": 298280, "epoch": 2465} {"train_loss": -43.6873779296875, "global_step": 298281, "epoch": 2465} {"train_loss": -42.614166259765625, "global_step": 298282, "epoch": 2465} {"train_loss": -43.58039474487305, "global_step": 298283, "epoch": 2465} {"train_loss": -43.62776565551758, "global_step": 298284, "epoch": 2465} {"train_loss": -42.821041107177734, "global_step": 298285, "epoch": 2465} {"train_loss": -43.98188400268555, "global_step": 298286, "epoch": 2465} {"train_loss": -44.13104248046875, "global_step": 298287, "epoch": 2465} {"train_loss": -43.263916015625, "global_step": 298288, "epoch": 2465} {"train_loss": -43.87837600708008, "global_step": 298289, "epoch": 2465} {"train_loss": -43.81540298461914, "global_step": 298290, "epoch": 2465} {"train_loss": -43.433937072753906, "global_step": 298291, "epoch": 2465} {"train_loss": -44.47369384765625, "global_step": 298292, "epoch": 2465} {"train_loss": -43.342586517333984, "global_step": 298293, "epoch": 2465} {"train_loss": -43.19332504272461, "global_step": 298294, "epoch": 2465} {"train_loss": -43.34819793701172, "global_step": 298295, "epoch": 2465} {"train_loss": -43.80671310424805, "global_step": 298296, "epoch": 2465} {"train_loss": -44.15365219116211, "global_step": 298297, "epoch": 2465} {"train_loss": -44.08289337158203, "global_step": 298298, "epoch": 2465} {"train_loss": -43.3928337097168, "global_step": 298299, "epoch": 2465} {"train_loss": -44.0745849609375, "global_step": 298300, "epoch": 2465} {"train_loss": -44.0181999206543, "global_step": 298301, "epoch": 2465} {"train_loss": -42.88946533203125, "global_step": 298302, "epoch": 2465} {"train_loss": -43.658721923828125, "global_step": 298303, "epoch": 2465} {"train_loss": -44.20159912109375, "global_step": 298304, "epoch": 2465} {"train_loss": -43.362178802490234, "global_step": 298305, "epoch": 2465} {"train_loss": -43.826751708984375, "global_step": 298306, "epoch": 2465} {"train_loss": -43.89762878417969, "global_step": 298307, "epoch": 2465} {"train_loss": -42.21015548706055, "global_step": 298308, "epoch": 2465} {"train_loss": -44.389408111572266, "global_step": 298309, "epoch": 2465} {"train_loss": -43.6784782409668, "global_step": 298310, "epoch": 2465} {"train_loss": -42.86296463012695, "global_step": 298311, "epoch": 2465} {"train_loss": -44.19044876098633, "global_step": 298312, "epoch": 2465} {"train_loss": -44.70866012573242, "global_step": 298313, "epoch": 2465} {"train_loss": -43.92181396484375, "global_step": 298314, "epoch": 2465} {"train_loss": -44.02138137817383, "global_step": 298315, "epoch": 2465} {"train_loss": -44.53937911987305, "global_step": 298316, "epoch": 2465} {"train_loss": -44.085205078125, "global_step": 298317, "epoch": 2465} {"train_loss": -43.535457611083984, "global_step": 298318, "epoch": 2465} {"train_loss": -43.48542404174805, "global_step": 298319, "epoch": 2465} {"train_loss": -44.27739334106445, "global_step": 298320, "epoch": 2465} {"train_loss": -44.27108383178711, "global_step": 298321, "epoch": 2465} {"train_loss": -43.76774978637695, "global_step": 298322, "epoch": 2465} {"train_loss": -43.04783630371094, "global_step": 298323, "epoch": 2465} {"train_loss": -43.094966888427734, "global_step": 298324, "epoch": 2465} {"train_loss": -43.908443450927734, "global_step": 298325, "epoch": 2465} {"train_loss": -43.44374084472656, "global_step": 298326, "epoch": 2465} {"train_loss": -42.59233474731445, "global_step": 298327, "epoch": 2465} {"train_loss": -42.928199768066406, "global_step": 298328, "epoch": 2465} {"train_loss": -43.08989334106445, "global_step": 298329, "epoch": 2465} {"train_loss": -43.954463958740234, "global_step": 298330, "epoch": 2465} {"train_loss": -43.689605712890625, "global_step": 298331, "epoch": 2465} {"train_loss": -43.71735382080078, "global_step": 298332, "epoch": 2465} {"train_loss": -44.068599700927734, "global_step": 298333, "epoch": 2465} {"train_loss": -44.08603286743164, "global_step": 298334, "epoch": 2465} {"train_loss": -43.765499114990234, "global_step": 298335, "epoch": 2465} {"train_loss": -43.86033248901367, "global_step": 298336, "epoch": 2465} {"train_loss": -43.979339599609375, "global_step": 298337, "epoch": 2465} {"train_loss": -42.64835739135742, "global_step": 298338, "epoch": 2465} {"train_loss": -42.21141815185547, "global_step": 298339, "epoch": 2465} {"train_loss": -44.5457878112793, "global_step": 298340, "epoch": 2465} {"train_loss": -43.35502243041992, "global_step": 298341, "epoch": 2465} {"train_loss": -41.553279876708984, "global_step": 298342, "epoch": 2465} {"train_loss": -43.656288146972656, "global_step": 298343, "epoch": 2465} {"train_loss": -43.48727035522461, "global_step": 298344, "epoch": 2465} {"train_loss": -42.73845291137695, "global_step": 298345, "epoch": 2465} {"train_loss": -44.07276916503906, "global_step": 298346, "epoch": 2465} {"train_loss": -43.856266021728516, "global_step": 298347, "epoch": 2465} {"train_loss": -43.07499313354492, "global_step": 298348, "epoch": 2465} {"train_loss": -43.92110824584961, "global_step": 298349, "epoch": 2465} {"train_loss": -43.63349533081055, "global_step": 298350, "epoch": 2465} {"train_loss": -42.933258056640625, "global_step": 298351, "epoch": 2465} {"train_loss": -44.1430549621582, "global_step": 298352, "epoch": 2465} {"train_loss": -43.89190673828125, "global_step": 298353, "epoch": 2465} {"train_loss": -43.76697540283203, "global_step": 298354, "epoch": 2465} {"train_loss": -43.77959442138672, "global_step": 298355, "epoch": 2465} {"train_loss": -42.80458068847656, "global_step": 298356, "epoch": 2465} {"train_loss": -43.58122634887695, "global_step": 298357, "epoch": 2465} {"train_loss": -43.51142501831055, "global_step": 298358, "epoch": 2465} {"train_loss": -44.23102951049805, "global_step": 298359, "epoch": 2465} {"train_loss": -43.5888557434082, "global_step": 298360, "epoch": 2465} {"train_loss": -44.064613342285156, "global_step": 298361, "epoch": 2465} {"train_loss": -43.86982727050781, "global_step": 298362, "epoch": 2465} {"train_loss": -43.016204833984375, "global_step": 298363, "epoch": 2465} {"train_loss": -43.222721099853516, "global_step": 298364, "epoch": 2465} {"train_loss": -43.67873001098633, "global_step": 298365, "epoch": 2465} {"train_loss": -42.466766357421875, "global_step": 298366, "epoch": 2465} {"train_loss": -42.72929382324219, "global_step": 298367, "epoch": 2465} {"train_loss": -43.5421257019043, "global_step": 298368, "epoch": 2465} {"train_loss": -43.481441497802734, "global_step": 298369, "epoch": 2465} {"train_loss": -42.535362243652344, "global_step": 298370, "epoch": 2465} {"train_loss": -42.07085418701172, "global_step": 298371, "epoch": 2465} {"train_loss": -42.91669845581055, "global_step": 298372, "epoch": 2465} {"train_loss": -42.58183670043945, "global_step": 298373, "epoch": 2465} {"train_loss": -42.29486846923828, "global_step": 298374, "epoch": 2465} {"train_loss": -41.19380569458008, "global_step": 298375, "epoch": 2465} {"train_loss": -41.69193649291992, "global_step": 298376, "epoch": 2465} {"train_loss": -42.870155334472656, "global_step": 298377, "epoch": 2465} {"train_loss": -42.34503936767578, "global_step": 298378, "epoch": 2465} {"train_loss": -42.29304122924805, "global_step": 298379, "epoch": 2465} {"train_loss": -42.84760284423828, "global_step": 298380, "epoch": 2465} {"train_loss": -42.973838806152344, "global_step": 298381, "epoch": 2465} {"train_loss": -40.55277633666992, "global_step": 298382, "epoch": 2465} {"train_loss": -43.97431564331055, "global_step": 298383, "epoch": 2465} {"train_loss": -40.63604736328125, "global_step": 298384, "epoch": 2465} {"train_loss": -43.24940077726506, "global_step": 298385, "epoch": 2465, "val_loss": 2698770.5} {"train_loss": -41.47043991088867, "global_step": 298386, "epoch": 2466} {"train_loss": -43.367427825927734, "global_step": 298387, "epoch": 2466} {"train_loss": -43.4104118347168, "global_step": 298388, "epoch": 2466} {"train_loss": -42.02630615234375, "global_step": 298389, "epoch": 2466} {"train_loss": -43.79972457885742, "global_step": 298390, "epoch": 2466} {"train_loss": -42.106624603271484, "global_step": 298391, "epoch": 2466} {"train_loss": -43.845333099365234, "global_step": 298392, "epoch": 2466} {"train_loss": -43.11683654785156, "global_step": 298393, "epoch": 2466} {"train_loss": -41.898765563964844, "global_step": 298394, "epoch": 2466} {"train_loss": -43.410804748535156, "global_step": 298395, "epoch": 2466} {"train_loss": -42.25337600708008, "global_step": 298396, "epoch": 2466} {"train_loss": -42.43770980834961, "global_step": 298397, "epoch": 2466} {"train_loss": -42.78626251220703, "global_step": 298398, "epoch": 2466} {"train_loss": -40.874568939208984, "global_step": 298399, "epoch": 2466} {"train_loss": -43.69707107543945, "global_step": 298400, "epoch": 2466} {"train_loss": -41.196590423583984, "global_step": 298401, "epoch": 2466} {"train_loss": -42.5556526184082, "global_step": 298402, "epoch": 2466} {"train_loss": -42.90460205078125, "global_step": 298403, "epoch": 2466} {"train_loss": -43.2330207824707, "global_step": 298404, "epoch": 2466} {"train_loss": -42.1392936706543, "global_step": 298405, "epoch": 2466} {"train_loss": -43.47975540161133, "global_step": 298406, "epoch": 2466} {"train_loss": -42.4322395324707, "global_step": 298407, "epoch": 2466} {"train_loss": -43.122222900390625, "global_step": 298408, "epoch": 2466} {"train_loss": -42.785640716552734, "global_step": 298409, "epoch": 2466} {"train_loss": -41.94865417480469, "global_step": 298410, "epoch": 2466} {"train_loss": -42.1124267578125, "global_step": 298411, "epoch": 2466} {"train_loss": -43.7739372253418, "global_step": 298412, "epoch": 2466} {"train_loss": -41.8176383972168, "global_step": 298413, "epoch": 2466} {"train_loss": -43.14844512939453, "global_step": 298414, "epoch": 2466} {"train_loss": -42.38169479370117, "global_step": 298415, "epoch": 2466} {"train_loss": -42.72581481933594, "global_step": 298416, "epoch": 2466} {"train_loss": -43.794429779052734, "global_step": 298417, "epoch": 2466} {"train_loss": -43.09756088256836, "global_step": 298418, "epoch": 2466} {"train_loss": -42.127559661865234, "global_step": 298419, "epoch": 2466} {"train_loss": -43.36376190185547, "global_step": 298420, "epoch": 2466} {"train_loss": -41.311885833740234, "global_step": 298421, "epoch": 2466} {"train_loss": -42.92904281616211, "global_step": 298422, "epoch": 2466} {"train_loss": -42.85075759887695, "global_step": 298423, "epoch": 2466} {"train_loss": -40.6952018737793, "global_step": 298424, "epoch": 2466} {"train_loss": -42.6739501953125, "global_step": 298425, "epoch": 2466} {"train_loss": -42.76631164550781, "global_step": 298426, "epoch": 2466} {"train_loss": -42.55939483642578, "global_step": 298427, "epoch": 2466} {"train_loss": -42.7448616027832, "global_step": 298428, "epoch": 2466} {"train_loss": -43.78303146362305, "global_step": 298429, "epoch": 2466} {"train_loss": -42.2823600769043, "global_step": 298430, "epoch": 2466} {"train_loss": -42.57126998901367, "global_step": 298431, "epoch": 2466} {"train_loss": -42.53602981567383, "global_step": 298432, "epoch": 2466} {"train_loss": -41.099552154541016, "global_step": 298433, "epoch": 2466} {"train_loss": -43.716304779052734, "global_step": 298434, "epoch": 2466} {"train_loss": -42.497161865234375, "global_step": 298435, "epoch": 2466} {"train_loss": -43.48531723022461, "global_step": 298436, "epoch": 2466} {"train_loss": -42.78722381591797, "global_step": 298437, "epoch": 2466} {"train_loss": -43.333412170410156, "global_step": 298438, "epoch": 2466} {"train_loss": -43.33037185668945, "global_step": 298439, "epoch": 2466} {"train_loss": -43.38767623901367, "global_step": 298440, "epoch": 2466} {"train_loss": -42.38628005981445, "global_step": 298441, "epoch": 2466} {"train_loss": -42.99134063720703, "global_step": 298442, "epoch": 2466} {"train_loss": -42.62227249145508, "global_step": 298443, "epoch": 2466} {"train_loss": -43.037471771240234, "global_step": 298444, "epoch": 2466} {"train_loss": -43.43305206298828, "global_step": 298445, "epoch": 2466} {"train_loss": -42.84995651245117, "global_step": 298446, "epoch": 2466} {"train_loss": -44.227500915527344, "global_step": 298447, "epoch": 2466} {"train_loss": -42.86127471923828, "global_step": 298448, "epoch": 2466} {"train_loss": -43.562686920166016, "global_step": 298449, "epoch": 2466} {"train_loss": -43.7456169128418, "global_step": 298450, "epoch": 2466} {"train_loss": -44.11673355102539, "global_step": 298451, "epoch": 2466} {"train_loss": -43.86738204956055, "global_step": 298452, "epoch": 2466} {"train_loss": -43.39303207397461, "global_step": 298453, "epoch": 2466} {"train_loss": -43.19648361206055, "global_step": 298454, "epoch": 2466} {"train_loss": -44.138092041015625, "global_step": 298455, "epoch": 2466} {"train_loss": -43.3604621887207, "global_step": 298456, "epoch": 2466} {"train_loss": -43.5374641418457, "global_step": 298457, "epoch": 2466} {"train_loss": -44.21686935424805, "global_step": 298458, "epoch": 2466} {"train_loss": -44.17469787597656, "global_step": 298459, "epoch": 2466} {"train_loss": -43.29368209838867, "global_step": 298460, "epoch": 2466} {"train_loss": -43.72249221801758, "global_step": 298461, "epoch": 2466} {"train_loss": -43.99247360229492, "global_step": 298462, "epoch": 2466} {"train_loss": -44.52429962158203, "global_step": 298463, "epoch": 2466} {"train_loss": -43.89848709106445, "global_step": 298464, "epoch": 2466} {"train_loss": -44.25361251831055, "global_step": 298465, "epoch": 2466} {"train_loss": -44.19729232788086, "global_step": 298466, "epoch": 2466} {"train_loss": -44.253047943115234, "global_step": 298467, "epoch": 2466} {"train_loss": -44.12725830078125, "global_step": 298468, "epoch": 2466} {"train_loss": -44.23066329956055, "global_step": 298469, "epoch": 2466} {"train_loss": -44.37508010864258, "global_step": 298470, "epoch": 2466} {"train_loss": -44.3681755065918, "global_step": 298471, "epoch": 2466} {"train_loss": -44.67084884643555, "global_step": 298472, "epoch": 2466} {"train_loss": -44.242469787597656, "global_step": 298473, "epoch": 2466} {"train_loss": -44.36033630371094, "global_step": 298474, "epoch": 2466} {"train_loss": -44.537593841552734, "global_step": 298475, "epoch": 2466} {"train_loss": -44.67420959472656, "global_step": 298476, "epoch": 2466} {"train_loss": -44.77733612060547, "global_step": 298477, "epoch": 2466} {"train_loss": -44.39662170410156, "global_step": 298478, "epoch": 2466} {"train_loss": -44.62189483642578, "global_step": 298479, "epoch": 2466} {"train_loss": -44.897789001464844, "global_step": 298480, "epoch": 2466} {"train_loss": -45.173763275146484, "global_step": 298481, "epoch": 2466} {"train_loss": -44.71696472167969, "global_step": 298482, "epoch": 2466} {"train_loss": -44.49345016479492, "global_step": 298483, "epoch": 2466} {"train_loss": -44.8214225769043, "global_step": 298484, "epoch": 2466} {"train_loss": -44.61623764038086, "global_step": 298485, "epoch": 2466} {"train_loss": -44.875083923339844, "global_step": 298486, "epoch": 2466} {"train_loss": -44.76203155517578, "global_step": 298487, "epoch": 2466} {"train_loss": -44.0371208190918, "global_step": 298488, "epoch": 2466} {"train_loss": -44.91096496582031, "global_step": 298489, "epoch": 2466} {"train_loss": -45.232208251953125, "global_step": 298490, "epoch": 2466} {"train_loss": -44.92456817626953, "global_step": 298491, "epoch": 2466} {"train_loss": -44.91355514526367, "global_step": 298492, "epoch": 2466} {"train_loss": -44.79374313354492, "global_step": 298493, "epoch": 2466} {"train_loss": -44.88886642456055, "global_step": 298494, "epoch": 2466} {"train_loss": -44.098487854003906, "global_step": 298495, "epoch": 2466} {"train_loss": -45.110748291015625, "global_step": 298496, "epoch": 2466} {"train_loss": -44.510887145996094, "global_step": 298497, "epoch": 2466} {"train_loss": -44.67813491821289, "global_step": 298498, "epoch": 2466} {"train_loss": -43.409202575683594, "global_step": 298499, "epoch": 2466} {"train_loss": -44.23209762573242, "global_step": 298500, "epoch": 2466} {"train_loss": -43.944881439208984, "global_step": 298501, "epoch": 2466} {"train_loss": -43.34852981567383, "global_step": 298502, "epoch": 2466} {"train_loss": -41.831451416015625, "global_step": 298503, "epoch": 2466} {"train_loss": -43.03363037109375, "global_step": 298504, "epoch": 2466} {"train_loss": -43.8789176940918, "global_step": 298505, "epoch": 2466} {"train_loss": -43.45462077117163, "global_step": 298506, "epoch": 2466, "val_loss": 2653633.0} {"train_loss": -44.83238983154297, "global_step": 298507, "epoch": 2467} {"train_loss": -44.00996017456055, "global_step": 298508, "epoch": 2467} {"train_loss": -43.090553283691406, "global_step": 298509, "epoch": 2467} {"train_loss": -42.24703598022461, "global_step": 298510, "epoch": 2467} {"train_loss": -42.908546447753906, "global_step": 298511, "epoch": 2467} {"train_loss": -43.1749153137207, "global_step": 298512, "epoch": 2467} {"train_loss": -44.314842224121094, "global_step": 298513, "epoch": 2467} {"train_loss": -43.86773681640625, "global_step": 298514, "epoch": 2467} {"train_loss": -43.782833099365234, "global_step": 298515, "epoch": 2467} {"train_loss": -43.196754455566406, "global_step": 298516, "epoch": 2467} {"train_loss": -43.473384857177734, "global_step": 298517, "epoch": 2467} {"train_loss": -44.41865921020508, "global_step": 298518, "epoch": 2467} {"train_loss": -43.627925872802734, "global_step": 298519, "epoch": 2467} {"train_loss": -44.83088684082031, "global_step": 298520, "epoch": 2467} {"train_loss": -42.333282470703125, "global_step": 298521, "epoch": 2467} {"train_loss": -43.02922821044922, "global_step": 298522, "epoch": 2467} {"train_loss": -43.843360900878906, "global_step": 298523, "epoch": 2467} {"train_loss": -40.535133361816406, "global_step": 298524, "epoch": 2467} {"train_loss": -42.95603561401367, "global_step": 298525, "epoch": 2467} {"train_loss": -42.47029113769531, "global_step": 298526, "epoch": 2467} {"train_loss": -42.8840446472168, "global_step": 298527, "epoch": 2467} {"train_loss": -42.305599212646484, "global_step": 298528, "epoch": 2467} {"train_loss": -41.93940353393555, "global_step": 298529, "epoch": 2467} {"train_loss": -43.53377151489258, "global_step": 298530, "epoch": 2467} {"train_loss": -43.26203155517578, "global_step": 298531, "epoch": 2467} {"train_loss": -39.957759857177734, "global_step": 298532, "epoch": 2467} {"train_loss": -42.95664596557617, "global_step": 298533, "epoch": 2467} {"train_loss": -34.73077392578125, "global_step": 298534, "epoch": 2467} {"train_loss": -39.48435592651367, "global_step": 298535, "epoch": 2467} {"train_loss": -37.85647201538086, "global_step": 298536, "epoch": 2467} {"train_loss": -35.18320846557617, "global_step": 298537, "epoch": 2467} {"train_loss": -40.55636215209961, "global_step": 298538, "epoch": 2467} {"train_loss": -37.62557601928711, "global_step": 298539, "epoch": 2467} {"train_loss": -34.57356262207031, "global_step": 298540, "epoch": 2467} {"train_loss": -37.3300895690918, "global_step": 298541, "epoch": 2467} {"train_loss": -38.481746673583984, "global_step": 298542, "epoch": 2467} {"train_loss": -37.167842864990234, "global_step": 298543, "epoch": 2467} {"train_loss": -36.72452926635742, "global_step": 298544, "epoch": 2467} {"train_loss": -38.94923782348633, "global_step": 298545, "epoch": 2467} {"train_loss": -37.490882873535156, "global_step": 298546, "epoch": 2467} {"train_loss": -39.282135009765625, "global_step": 298547, "epoch": 2467} {"train_loss": -39.912837982177734, "global_step": 298548, "epoch": 2467} {"train_loss": -40.41585159301758, "global_step": 298549, "epoch": 2467} {"train_loss": -40.279598236083984, "global_step": 298550, "epoch": 2467} {"train_loss": -42.00897979736328, "global_step": 298551, "epoch": 2467} {"train_loss": -39.76089096069336, "global_step": 298552, "epoch": 2467} {"train_loss": -40.70872497558594, "global_step": 298553, "epoch": 2467} {"train_loss": -38.98855209350586, "global_step": 298554, "epoch": 2467} {"train_loss": -41.945068359375, "global_step": 298555, "epoch": 2467} {"train_loss": -42.003623962402344, "global_step": 298556, "epoch": 2467} {"train_loss": -41.5623893737793, "global_step": 298557, "epoch": 2467} {"train_loss": -42.74277877807617, "global_step": 298558, "epoch": 2467} {"train_loss": -42.13855743408203, "global_step": 298559, "epoch": 2467} {"train_loss": -42.28288650512695, "global_step": 298560, "epoch": 2467} {"train_loss": -42.45381546020508, "global_step": 298561, "epoch": 2467} {"train_loss": -42.81395721435547, "global_step": 298562, "epoch": 2467} {"train_loss": -42.690372467041016, "global_step": 298563, "epoch": 2467} {"train_loss": -43.391685485839844, "global_step": 298564, "epoch": 2467} {"train_loss": -42.353824615478516, "global_step": 298565, "epoch": 2467} {"train_loss": -42.72420120239258, "global_step": 298566, "epoch": 2467} {"train_loss": -43.239070892333984, "global_step": 298567, "epoch": 2467} {"train_loss": -43.187129974365234, "global_step": 298568, "epoch": 2467} {"train_loss": -42.90959930419922, "global_step": 298569, "epoch": 2467} {"train_loss": -43.15071105957031, "global_step": 298570, "epoch": 2467} {"train_loss": -43.507423400878906, "global_step": 298571, "epoch": 2467} {"train_loss": -43.654510498046875, "global_step": 298572, "epoch": 2467} {"train_loss": -43.58175277709961, "global_step": 298573, "epoch": 2467} {"train_loss": -43.03237533569336, "global_step": 298574, "epoch": 2467} {"train_loss": -43.30241394042969, "global_step": 298575, "epoch": 2467} {"train_loss": -43.745548248291016, "global_step": 298576, "epoch": 2467} {"train_loss": -43.83474349975586, "global_step": 298577, "epoch": 2467} {"train_loss": -44.03418731689453, "global_step": 298578, "epoch": 2467} {"train_loss": -44.235450744628906, "global_step": 298579, "epoch": 2467} {"train_loss": -43.90410232543945, "global_step": 298580, "epoch": 2467} {"train_loss": -43.72989273071289, "global_step": 298581, "epoch": 2467} {"train_loss": -43.964969635009766, "global_step": 298582, "epoch": 2467} {"train_loss": -44.082130432128906, "global_step": 298583, "epoch": 2467} {"train_loss": -44.38159942626953, "global_step": 298584, "epoch": 2467} {"train_loss": -44.19260025024414, "global_step": 298585, "epoch": 2467} {"train_loss": -43.681053161621094, "global_step": 298586, "epoch": 2467} {"train_loss": -43.57378005981445, "global_step": 298587, "epoch": 2467} {"train_loss": -43.41581344604492, "global_step": 298588, "epoch": 2467} {"train_loss": -44.395015716552734, "global_step": 298589, "epoch": 2467} {"train_loss": -43.942726135253906, "global_step": 298590, "epoch": 2467} {"train_loss": -44.53524398803711, "global_step": 298591, "epoch": 2467} {"train_loss": -44.137264251708984, "global_step": 298592, "epoch": 2467} {"train_loss": -44.13866424560547, "global_step": 298593, "epoch": 2467} {"train_loss": -44.31838607788086, "global_step": 298594, "epoch": 2467} {"train_loss": -44.66351318359375, "global_step": 298595, "epoch": 2467} {"train_loss": -44.419185638427734, "global_step": 298596, "epoch": 2467} {"train_loss": -44.226863861083984, "global_step": 298597, "epoch": 2467} {"train_loss": -44.64359664916992, "global_step": 298598, "epoch": 2467} {"train_loss": -44.627811431884766, "global_step": 298599, "epoch": 2467} {"train_loss": -44.673667907714844, "global_step": 298600, "epoch": 2467} {"train_loss": -44.89188766479492, "global_step": 298601, "epoch": 2467} {"train_loss": -44.70551681518555, "global_step": 298602, "epoch": 2467} {"train_loss": -44.872100830078125, "global_step": 298603, "epoch": 2467} {"train_loss": -44.98781967163086, "global_step": 298604, "epoch": 2467} {"train_loss": -44.85709762573242, "global_step": 298605, "epoch": 2467} {"train_loss": -44.83002853393555, "global_step": 298606, "epoch": 2467} {"train_loss": -44.822750091552734, "global_step": 298607, "epoch": 2467} {"train_loss": -44.685035705566406, "global_step": 298608, "epoch": 2467} {"train_loss": -45.17673873901367, "global_step": 298609, "epoch": 2467} {"train_loss": -44.817195892333984, "global_step": 298610, "epoch": 2467} {"train_loss": -44.9423942565918, "global_step": 298611, "epoch": 2467} {"train_loss": -44.42583084106445, "global_step": 298612, "epoch": 2467} {"train_loss": -44.592742919921875, "global_step": 298613, "epoch": 2467} {"train_loss": -43.818885803222656, "global_step": 298614, "epoch": 2467} {"train_loss": -44.322200775146484, "global_step": 298615, "epoch": 2467} {"train_loss": -44.51708984375, "global_step": 298616, "epoch": 2467} {"train_loss": -45.09547424316406, "global_step": 298617, "epoch": 2467} {"train_loss": -44.4491081237793, "global_step": 298618, "epoch": 2467} {"train_loss": -44.63251495361328, "global_step": 298619, "epoch": 2467} {"train_loss": -44.64619064331055, "global_step": 298620, "epoch": 2467} {"train_loss": -44.43646240234375, "global_step": 298621, "epoch": 2467} {"train_loss": -44.64760971069336, "global_step": 298622, "epoch": 2467} {"train_loss": -44.88241195678711, "global_step": 298623, "epoch": 2467} {"train_loss": -44.89226150512695, "global_step": 298624, "epoch": 2467} {"train_loss": -44.79594802856445, "global_step": 298625, "epoch": 2467} {"train_loss": -44.7304801940918, "global_step": 298626, "epoch": 2467} {"train_loss": -42.814251923364054, "global_step": 298627, "epoch": 2467, "val_loss": 2518355.5} {"train_loss": -44.843990325927734, "global_step": 298628, "epoch": 2468} {"train_loss": -44.350929260253906, "global_step": 298629, "epoch": 2468} {"train_loss": -44.2801399230957, "global_step": 298630, "epoch": 2468} {"train_loss": -44.66900634765625, "global_step": 298631, "epoch": 2468} {"train_loss": -45.03957748413086, "global_step": 298632, "epoch": 2468} {"train_loss": -44.581703186035156, "global_step": 298633, "epoch": 2468} {"train_loss": -43.62917709350586, "global_step": 298634, "epoch": 2468} {"train_loss": -43.67816925048828, "global_step": 298635, "epoch": 2468} {"train_loss": -43.95991897583008, "global_step": 298636, "epoch": 2468} {"train_loss": -44.77936935424805, "global_step": 298637, "epoch": 2468} {"train_loss": -45.00646209716797, "global_step": 298638, "epoch": 2468} {"train_loss": -43.9157829284668, "global_step": 298639, "epoch": 2468} {"train_loss": -43.0785026550293, "global_step": 298640, "epoch": 2468} {"train_loss": -42.238563537597656, "global_step": 298641, "epoch": 2468} {"train_loss": -40.99245071411133, "global_step": 298642, "epoch": 2468} {"train_loss": -42.5670280456543, "global_step": 298643, "epoch": 2468} {"train_loss": -44.80439376831055, "global_step": 298644, "epoch": 2468} {"train_loss": -42.83646011352539, "global_step": 298645, "epoch": 2468} {"train_loss": -42.26686477661133, "global_step": 298646, "epoch": 2468} {"train_loss": -42.564945220947266, "global_step": 298647, "epoch": 2468} {"train_loss": -43.271095275878906, "global_step": 298648, "epoch": 2468} {"train_loss": -42.237091064453125, "global_step": 298649, "epoch": 2468} {"train_loss": -42.55508041381836, "global_step": 298650, "epoch": 2468} {"train_loss": -43.08993148803711, "global_step": 298651, "epoch": 2468} {"train_loss": -42.878963470458984, "global_step": 298652, "epoch": 2468} {"train_loss": -43.40733337402344, "global_step": 298653, "epoch": 2468} {"train_loss": -43.55715560913086, "global_step": 298654, "epoch": 2468} {"train_loss": -41.54465866088867, "global_step": 298655, "epoch": 2468} {"train_loss": -44.319637298583984, "global_step": 298656, "epoch": 2468} {"train_loss": -42.23185348510742, "global_step": 298657, "epoch": 2468} {"train_loss": -41.452152252197266, "global_step": 298658, "epoch": 2468} {"train_loss": -43.73280715942383, "global_step": 298659, "epoch": 2468} {"train_loss": -41.11204147338867, "global_step": 298660, "epoch": 2468} {"train_loss": -42.68147659301758, "global_step": 298661, "epoch": 2468} {"train_loss": -42.380821228027344, "global_step": 298662, "epoch": 2468} {"train_loss": -42.141693115234375, "global_step": 298663, "epoch": 2468} {"train_loss": -42.856285095214844, "global_step": 298664, "epoch": 2468} {"train_loss": -42.3371696472168, "global_step": 298665, "epoch": 2468} {"train_loss": -43.42186737060547, "global_step": 298666, "epoch": 2468} {"train_loss": -42.597503662109375, "global_step": 298667, "epoch": 2468} {"train_loss": -43.91582107543945, "global_step": 298668, "epoch": 2468} {"train_loss": -44.20035171508789, "global_step": 298669, "epoch": 2468} {"train_loss": -43.68024826049805, "global_step": 298670, "epoch": 2468} {"train_loss": -44.056922912597656, "global_step": 298671, "epoch": 2468} {"train_loss": -43.79092025756836, "global_step": 298672, "epoch": 2468} {"train_loss": -43.86447525024414, "global_step": 298673, "epoch": 2468} {"train_loss": -43.4465217590332, "global_step": 298674, "epoch": 2468} {"train_loss": -44.03242111206055, "global_step": 298675, "epoch": 2468} {"train_loss": -43.41975402832031, "global_step": 298676, "epoch": 2468} {"train_loss": -43.43989181518555, "global_step": 298677, "epoch": 2468} {"train_loss": -44.63161849975586, "global_step": 298678, "epoch": 2468} {"train_loss": -43.55022430419922, "global_step": 298679, "epoch": 2468} {"train_loss": -42.32741928100586, "global_step": 298680, "epoch": 2468} {"train_loss": -42.3614501953125, "global_step": 298681, "epoch": 2468} {"train_loss": -42.53562545776367, "global_step": 298682, "epoch": 2468} {"train_loss": -43.6860237121582, "global_step": 298683, "epoch": 2468} {"train_loss": -42.315670013427734, "global_step": 298684, "epoch": 2468} {"train_loss": -43.437381744384766, "global_step": 298685, "epoch": 2468} {"train_loss": -43.372798919677734, "global_step": 298686, "epoch": 2468} {"train_loss": -43.589134216308594, "global_step": 298687, "epoch": 2468} {"train_loss": -44.206024169921875, "global_step": 298688, "epoch": 2468} {"train_loss": -44.02198028564453, "global_step": 298689, "epoch": 2468} {"train_loss": -44.225887298583984, "global_step": 298690, "epoch": 2468} {"train_loss": -43.8283576965332, "global_step": 298691, "epoch": 2468} {"train_loss": -43.75779342651367, "global_step": 298692, "epoch": 2468} {"train_loss": -44.28263854980469, "global_step": 298693, "epoch": 2468} {"train_loss": -43.60445022583008, "global_step": 298694, "epoch": 2468} {"train_loss": -44.20569610595703, "global_step": 298695, "epoch": 2468} {"train_loss": -43.517616271972656, "global_step": 298696, "epoch": 2468} {"train_loss": -43.46797561645508, "global_step": 298697, "epoch": 2468} {"train_loss": -43.45521926879883, "global_step": 298698, "epoch": 2468} {"train_loss": -43.977264404296875, "global_step": 298699, "epoch": 2468} {"train_loss": -44.10773849487305, "global_step": 298700, "epoch": 2468} {"train_loss": -43.222381591796875, "global_step": 298701, "epoch": 2468} {"train_loss": -44.23707962036133, "global_step": 298702, "epoch": 2468} {"train_loss": -44.60740280151367, "global_step": 298703, "epoch": 2468} {"train_loss": -44.11634063720703, "global_step": 298704, "epoch": 2468} {"train_loss": -43.9568977355957, "global_step": 298705, "epoch": 2468} {"train_loss": -44.5874137878418, "global_step": 298706, "epoch": 2468} {"train_loss": -43.660640716552734, "global_step": 298707, "epoch": 2468} {"train_loss": -44.54066848754883, "global_step": 298708, "epoch": 2468} {"train_loss": -43.34004592895508, "global_step": 298709, "epoch": 2468} {"train_loss": -44.47750473022461, "global_step": 298710, "epoch": 2468} {"train_loss": -44.18449783325195, "global_step": 298711, "epoch": 2468} {"train_loss": -44.63792037963867, "global_step": 298712, "epoch": 2468} {"train_loss": -44.139095306396484, "global_step": 298713, "epoch": 2468} {"train_loss": -44.7546501159668, "global_step": 298714, "epoch": 2468} {"train_loss": -44.50156784057617, "global_step": 298715, "epoch": 2468} {"train_loss": -44.86244583129883, "global_step": 298716, "epoch": 2468} {"train_loss": -44.324180603027344, "global_step": 298717, "epoch": 2468} {"train_loss": -44.595767974853516, "global_step": 298718, "epoch": 2468} {"train_loss": -44.523460388183594, "global_step": 298719, "epoch": 2468} {"train_loss": -44.96441650390625, "global_step": 298720, "epoch": 2468} {"train_loss": -44.837738037109375, "global_step": 298721, "epoch": 2468} {"train_loss": -44.50910568237305, "global_step": 298722, "epoch": 2468} {"train_loss": -44.79718017578125, "global_step": 298723, "epoch": 2468} {"train_loss": -45.03205108642578, "global_step": 298724, "epoch": 2468} {"train_loss": -44.871456146240234, "global_step": 298725, "epoch": 2468} {"train_loss": -44.8083381652832, "global_step": 298726, "epoch": 2468} {"train_loss": -44.93744659423828, "global_step": 298727, "epoch": 2468} {"train_loss": -44.48276901245117, "global_step": 298728, "epoch": 2468} {"train_loss": -44.3954963684082, "global_step": 298729, "epoch": 2468} {"train_loss": -45.08305740356445, "global_step": 298730, "epoch": 2468} {"train_loss": -44.792457580566406, "global_step": 298731, "epoch": 2468} {"train_loss": -45.174560546875, "global_step": 298732, "epoch": 2468} {"train_loss": -43.75277328491211, "global_step": 298733, "epoch": 2468} {"train_loss": -44.491947174072266, "global_step": 298734, "epoch": 2468} {"train_loss": -44.399227142333984, "global_step": 298735, "epoch": 2468} {"train_loss": -44.751708984375, "global_step": 298736, "epoch": 2468} {"train_loss": -44.58488082885742, "global_step": 298737, "epoch": 2468} {"train_loss": -44.43061447143555, "global_step": 298738, "epoch": 2468} {"train_loss": -43.335018157958984, "global_step": 298739, "epoch": 2468} {"train_loss": -44.62138366699219, "global_step": 298740, "epoch": 2468} {"train_loss": -43.692440032958984, "global_step": 298741, "epoch": 2468} {"train_loss": -42.66707992553711, "global_step": 298742, "epoch": 2468} {"train_loss": -43.102725982666016, "global_step": 298743, "epoch": 2468} {"train_loss": -43.05377960205078, "global_step": 298744, "epoch": 2468} {"train_loss": -44.190338134765625, "global_step": 298745, "epoch": 2468} {"train_loss": -44.43404006958008, "global_step": 298746, "epoch": 2468} {"train_loss": -44.56911849975586, "global_step": 298747, "epoch": 2468} {"train_loss": -43.7763695835082, "global_step": 298748, "epoch": 2468, "val_loss": 2618537.25} {"train_loss": -44.124298095703125, "global_step": 298749, "epoch": 2469} {"train_loss": -45.021202087402344, "global_step": 298750, "epoch": 2469} {"train_loss": -44.58683395385742, "global_step": 298751, "epoch": 2469} {"train_loss": -44.62458419799805, "global_step": 298752, "epoch": 2469} {"train_loss": -44.17119598388672, "global_step": 298753, "epoch": 2469} {"train_loss": -44.28680419921875, "global_step": 298754, "epoch": 2469} {"train_loss": -44.43272018432617, "global_step": 298755, "epoch": 2469} {"train_loss": -44.63690948486328, "global_step": 298756, "epoch": 2469} {"train_loss": -44.17090606689453, "global_step": 298757, "epoch": 2469} {"train_loss": -42.92646408081055, "global_step": 298758, "epoch": 2469} {"train_loss": -43.77363204956055, "global_step": 298759, "epoch": 2469} {"train_loss": -43.96211624145508, "global_step": 298760, "epoch": 2469} {"train_loss": -43.89290237426758, "global_step": 298761, "epoch": 2469} {"train_loss": -42.54883575439453, "global_step": 298762, "epoch": 2469} {"train_loss": -43.28144454956055, "global_step": 298763, "epoch": 2469} {"train_loss": -44.66542434692383, "global_step": 298764, "epoch": 2469} {"train_loss": -44.57887649536133, "global_step": 298765, "epoch": 2469} {"train_loss": -42.56879806518555, "global_step": 298766, "epoch": 2469} {"train_loss": -41.92510986328125, "global_step": 298767, "epoch": 2469} {"train_loss": -44.266075134277344, "global_step": 298768, "epoch": 2469} {"train_loss": -44.87714385986328, "global_step": 298769, "epoch": 2469} {"train_loss": -43.76483917236328, "global_step": 298770, "epoch": 2469} {"train_loss": -43.57843780517578, "global_step": 298771, "epoch": 2469} {"train_loss": -44.05332565307617, "global_step": 298772, "epoch": 2469} {"train_loss": -44.989200592041016, "global_step": 298773, "epoch": 2469} {"train_loss": -44.35728073120117, "global_step": 298774, "epoch": 2469} {"train_loss": -44.20293045043945, "global_step": 298775, "epoch": 2469} {"train_loss": -42.919734954833984, "global_step": 298776, "epoch": 2469} {"train_loss": -43.61155319213867, "global_step": 298777, "epoch": 2469} {"train_loss": -44.71485137939453, "global_step": 298778, "epoch": 2469} {"train_loss": -44.19672775268555, "global_step": 298779, "epoch": 2469} {"train_loss": -43.71382522583008, "global_step": 298780, "epoch": 2469} {"train_loss": -43.89101028442383, "global_step": 298781, "epoch": 2469} {"train_loss": -43.5898323059082, "global_step": 298782, "epoch": 2469} {"train_loss": -42.26321029663086, "global_step": 298783, "epoch": 2469} {"train_loss": -43.52341079711914, "global_step": 298784, "epoch": 2469} {"train_loss": -44.2728157043457, "global_step": 298785, "epoch": 2469} {"train_loss": -43.29213333129883, "global_step": 298786, "epoch": 2469} {"train_loss": -43.79281234741211, "global_step": 298787, "epoch": 2469} {"train_loss": -44.49256896972656, "global_step": 298788, "epoch": 2469} {"train_loss": -44.348167419433594, "global_step": 298789, "epoch": 2469} {"train_loss": -43.6621208190918, "global_step": 298790, "epoch": 2469} {"train_loss": -44.058956146240234, "global_step": 298791, "epoch": 2469} {"train_loss": -44.39199447631836, "global_step": 298792, "epoch": 2469} {"train_loss": -44.16142654418945, "global_step": 298793, "epoch": 2469} {"train_loss": -42.51302719116211, "global_step": 298794, "epoch": 2469} {"train_loss": -43.637996673583984, "global_step": 298795, "epoch": 2469} {"train_loss": -44.70308303833008, "global_step": 298796, "epoch": 2469} {"train_loss": -43.41838073730469, "global_step": 298797, "epoch": 2469} {"train_loss": -43.39072799682617, "global_step": 298798, "epoch": 2469} {"train_loss": -44.30437088012695, "global_step": 298799, "epoch": 2469} {"train_loss": -44.43125534057617, "global_step": 298800, "epoch": 2469} {"train_loss": -43.79246139526367, "global_step": 298801, "epoch": 2469} {"train_loss": -43.76784133911133, "global_step": 298802, "epoch": 2469} {"train_loss": -44.70339584350586, "global_step": 298803, "epoch": 2469} {"train_loss": -43.67449951171875, "global_step": 298804, "epoch": 2469} {"train_loss": -43.54182815551758, "global_step": 298805, "epoch": 2469} {"train_loss": -43.97865295410156, "global_step": 298806, "epoch": 2469} {"train_loss": -44.20243453979492, "global_step": 298807, "epoch": 2469} {"train_loss": -43.91725540161133, "global_step": 298808, "epoch": 2469} {"train_loss": -44.363948822021484, "global_step": 298809, "epoch": 2469} {"train_loss": -44.411861419677734, "global_step": 298810, "epoch": 2469} {"train_loss": -44.66776657104492, "global_step": 298811, "epoch": 2469} {"train_loss": -43.89213180541992, "global_step": 298812, "epoch": 2469} {"train_loss": -42.48911666870117, "global_step": 298813, "epoch": 2469} {"train_loss": -43.47935485839844, "global_step": 298814, "epoch": 2469} {"train_loss": -44.289608001708984, "global_step": 298815, "epoch": 2469} {"train_loss": -44.661067962646484, "global_step": 298816, "epoch": 2469} {"train_loss": -44.15407180786133, "global_step": 298817, "epoch": 2469} {"train_loss": -44.26797103881836, "global_step": 298818, "epoch": 2469} {"train_loss": -44.739009857177734, "global_step": 298819, "epoch": 2469} {"train_loss": -44.92734909057617, "global_step": 298820, "epoch": 2469} {"train_loss": -44.565914154052734, "global_step": 298821, "epoch": 2469} {"train_loss": -44.09018325805664, "global_step": 298822, "epoch": 2469} {"train_loss": -43.93352508544922, "global_step": 298823, "epoch": 2469} {"train_loss": -44.524234771728516, "global_step": 298824, "epoch": 2469} {"train_loss": -44.525489807128906, "global_step": 298825, "epoch": 2469} {"train_loss": -43.04425811767578, "global_step": 298826, "epoch": 2469} {"train_loss": -43.969512939453125, "global_step": 298827, "epoch": 2469} {"train_loss": -42.73590850830078, "global_step": 298828, "epoch": 2469} {"train_loss": -42.753353118896484, "global_step": 298829, "epoch": 2469} {"train_loss": -42.910762786865234, "global_step": 298830, "epoch": 2469} {"train_loss": -43.924495697021484, "global_step": 298831, "epoch": 2469} {"train_loss": -42.17171096801758, "global_step": 298832, "epoch": 2469} {"train_loss": -43.831153869628906, "global_step": 298833, "epoch": 2469} {"train_loss": -43.296234130859375, "global_step": 298834, "epoch": 2469} {"train_loss": -42.041629791259766, "global_step": 298835, "epoch": 2469} {"train_loss": -44.403289794921875, "global_step": 298836, "epoch": 2469} {"train_loss": -41.91096115112305, "global_step": 298837, "epoch": 2469} {"train_loss": -42.20524215698242, "global_step": 298838, "epoch": 2469} {"train_loss": -43.737205505371094, "global_step": 298839, "epoch": 2469} {"train_loss": -42.519493103027344, "global_step": 298840, "epoch": 2469} {"train_loss": -43.66553497314453, "global_step": 298841, "epoch": 2469} {"train_loss": -43.5086784362793, "global_step": 298842, "epoch": 2469} {"train_loss": -43.383052825927734, "global_step": 298843, "epoch": 2469} {"train_loss": -43.9433708190918, "global_step": 298844, "epoch": 2469} {"train_loss": -44.29758834838867, "global_step": 298845, "epoch": 2469} {"train_loss": -42.94306945800781, "global_step": 298846, "epoch": 2469} {"train_loss": -43.23844528198242, "global_step": 298847, "epoch": 2469} {"train_loss": -44.129737854003906, "global_step": 298848, "epoch": 2469} {"train_loss": -43.92268753051758, "global_step": 298849, "epoch": 2469} {"train_loss": -43.60855484008789, "global_step": 298850, "epoch": 2469} {"train_loss": -43.96166229248047, "global_step": 298851, "epoch": 2469} {"train_loss": -44.39980697631836, "global_step": 298852, "epoch": 2469} {"train_loss": -43.167457580566406, "global_step": 298853, "epoch": 2469} {"train_loss": -43.740962982177734, "global_step": 298854, "epoch": 2469} {"train_loss": -44.3486442565918, "global_step": 298855, "epoch": 2469} {"train_loss": -44.577388763427734, "global_step": 298856, "epoch": 2469} {"train_loss": -43.883262634277344, "global_step": 298857, "epoch": 2469} {"train_loss": -43.8519401550293, "global_step": 298858, "epoch": 2469} {"train_loss": -43.49039840698242, "global_step": 298859, "epoch": 2469} {"train_loss": -43.62970733642578, "global_step": 298860, "epoch": 2469} {"train_loss": -44.78124237060547, "global_step": 298861, "epoch": 2469} {"train_loss": -43.46760940551758, "global_step": 298862, "epoch": 2469} {"train_loss": -43.604583740234375, "global_step": 298863, "epoch": 2469} {"train_loss": -43.647666931152344, "global_step": 298864, "epoch": 2469} {"train_loss": -43.47067642211914, "global_step": 298865, "epoch": 2469} {"train_loss": -43.964820861816406, "global_step": 298866, "epoch": 2469} {"train_loss": -44.10948944091797, "global_step": 298867, "epoch": 2469} {"train_loss": -42.721351623535156, "global_step": 298868, "epoch": 2469} {"train_loss": -43.807043595747515, "global_step": 298869, "epoch": 2469, "val_loss": 2690310.25} {"train_loss": -44.15837097167969, "global_step": 298870, "epoch": 2470} {"train_loss": -42.6701545715332, "global_step": 298871, "epoch": 2470} {"train_loss": -42.10258102416992, "global_step": 298872, "epoch": 2470} {"train_loss": -42.73838424682617, "global_step": 298873, "epoch": 2470} {"train_loss": -43.74589157104492, "global_step": 298874, "epoch": 2470} {"train_loss": -42.676177978515625, "global_step": 298875, "epoch": 2470} {"train_loss": -43.67192840576172, "global_step": 298876, "epoch": 2470} {"train_loss": -43.377952575683594, "global_step": 298877, "epoch": 2470} {"train_loss": -43.47814178466797, "global_step": 298878, "epoch": 2470} {"train_loss": -43.92070388793945, "global_step": 298879, "epoch": 2470} {"train_loss": -43.26091384887695, "global_step": 298880, "epoch": 2470} {"train_loss": -43.39765548706055, "global_step": 298881, "epoch": 2470} {"train_loss": -43.14957809448242, "global_step": 298882, "epoch": 2470} {"train_loss": -42.87264633178711, "global_step": 298883, "epoch": 2470} {"train_loss": -43.475135803222656, "global_step": 298884, "epoch": 2470} {"train_loss": -41.93732452392578, "global_step": 298885, "epoch": 2470} {"train_loss": -42.411991119384766, "global_step": 298886, "epoch": 2470} {"train_loss": -43.089603424072266, "global_step": 298887, "epoch": 2470} {"train_loss": -43.06962966918945, "global_step": 298888, "epoch": 2470} {"train_loss": -43.347312927246094, "global_step": 298889, "epoch": 2470} {"train_loss": -42.72401809692383, "global_step": 298890, "epoch": 2470} {"train_loss": -42.594032287597656, "global_step": 298891, "epoch": 2470} {"train_loss": -43.17570877075195, "global_step": 298892, "epoch": 2470} {"train_loss": -42.29862594604492, "global_step": 298893, "epoch": 2470} {"train_loss": -44.24442672729492, "global_step": 298894, "epoch": 2470} {"train_loss": -42.73186111450195, "global_step": 298895, "epoch": 2470} {"train_loss": -43.67402267456055, "global_step": 298896, "epoch": 2470} {"train_loss": -43.66986083984375, "global_step": 298897, "epoch": 2470} {"train_loss": -42.05909729003906, "global_step": 298898, "epoch": 2470} {"train_loss": -43.18171310424805, "global_step": 298899, "epoch": 2470} {"train_loss": -42.100135803222656, "global_step": 298900, "epoch": 2470} {"train_loss": -41.19995880126953, "global_step": 298901, "epoch": 2470} {"train_loss": -42.289058685302734, "global_step": 298902, "epoch": 2470} {"train_loss": -38.682586669921875, "global_step": 298903, "epoch": 2470} {"train_loss": -30.010639190673828, "global_step": 298904, "epoch": 2470} {"train_loss": -37.92564010620117, "global_step": 298905, "epoch": 2470} {"train_loss": -36.925899505615234, "global_step": 298906, "epoch": 2470} {"train_loss": -41.38898849487305, "global_step": 298907, "epoch": 2470} {"train_loss": -42.1230583190918, "global_step": 298908, "epoch": 2470} {"train_loss": -38.39999008178711, "global_step": 298909, "epoch": 2470} {"train_loss": -35.51754379272461, "global_step": 298910, "epoch": 2470} {"train_loss": -31.118131637573242, "global_step": 298911, "epoch": 2470} {"train_loss": -25.140836715698242, "global_step": 298912, "epoch": 2470} {"train_loss": -36.53956985473633, "global_step": 298913, "epoch": 2470} {"train_loss": -36.62936019897461, "global_step": 298914, "epoch": 2470} {"train_loss": -38.7581901550293, "global_step": 298915, "epoch": 2470} {"train_loss": -39.9011344909668, "global_step": 298916, "epoch": 2470} {"train_loss": -38.55664825439453, "global_step": 298917, "epoch": 2470} {"train_loss": -34.999942779541016, "global_step": 298918, "epoch": 2470} {"train_loss": -37.073184967041016, "global_step": 298919, "epoch": 2470} {"train_loss": -34.285247802734375, "global_step": 298920, "epoch": 2470} {"train_loss": -34.80900955200195, "global_step": 298921, "epoch": 2470} {"train_loss": -34.22262191772461, "global_step": 298922, "epoch": 2470} {"train_loss": -30.418943405151367, "global_step": 298923, "epoch": 2470} {"train_loss": -32.4802131652832, "global_step": 298924, "epoch": 2470} {"train_loss": -39.01337814331055, "global_step": 298925, "epoch": 2470} {"train_loss": -29.4450740814209, "global_step": 298926, "epoch": 2470} {"train_loss": -38.62553787231445, "global_step": 298927, "epoch": 2470} {"train_loss": -37.58061599731445, "global_step": 298928, "epoch": 2470} {"train_loss": -39.57933044433594, "global_step": 298929, "epoch": 2470} {"train_loss": -39.50528335571289, "global_step": 298930, "epoch": 2470} {"train_loss": -41.141273498535156, "global_step": 298931, "epoch": 2470} {"train_loss": -39.62588119506836, "global_step": 298932, "epoch": 2470} {"train_loss": -37.259857177734375, "global_step": 298933, "epoch": 2470} {"train_loss": -39.987545013427734, "global_step": 298934, "epoch": 2470} {"train_loss": -39.15935134887695, "global_step": 298935, "epoch": 2470} {"train_loss": -40.13175582885742, "global_step": 298936, "epoch": 2470} {"train_loss": -40.393035888671875, "global_step": 298937, "epoch": 2470} {"train_loss": -38.16602325439453, "global_step": 298938, "epoch": 2470} {"train_loss": -38.49439239501953, "global_step": 298939, "epoch": 2470} {"train_loss": -41.70011520385742, "global_step": 298940, "epoch": 2470} {"train_loss": -39.65424728393555, "global_step": 298941, "epoch": 2470} {"train_loss": -40.08418655395508, "global_step": 298942, "epoch": 2470} {"train_loss": -40.38676834106445, "global_step": 298943, "epoch": 2470} {"train_loss": -41.648536682128906, "global_step": 298944, "epoch": 2470} {"train_loss": -40.591552734375, "global_step": 298945, "epoch": 2470} {"train_loss": -40.3485107421875, "global_step": 298946, "epoch": 2470} {"train_loss": -41.09654998779297, "global_step": 298947, "epoch": 2470} {"train_loss": -41.48627853393555, "global_step": 298948, "epoch": 2470} {"train_loss": -41.5859489440918, "global_step": 298949, "epoch": 2470} {"train_loss": -42.377906799316406, "global_step": 298950, "epoch": 2470} {"train_loss": -42.56926727294922, "global_step": 298951, "epoch": 2470} {"train_loss": -41.68171310424805, "global_step": 298952, "epoch": 2470} {"train_loss": -41.85233688354492, "global_step": 298953, "epoch": 2470} {"train_loss": -40.74477767944336, "global_step": 298954, "epoch": 2470} {"train_loss": -42.48773193359375, "global_step": 298955, "epoch": 2470} {"train_loss": -41.893672943115234, "global_step": 298956, "epoch": 2470} {"train_loss": -40.83633041381836, "global_step": 298957, "epoch": 2470} {"train_loss": -42.40566635131836, "global_step": 298958, "epoch": 2470} {"train_loss": -42.28799057006836, "global_step": 298959, "epoch": 2470} {"train_loss": -42.30812454223633, "global_step": 298960, "epoch": 2470} {"train_loss": -41.95368576049805, "global_step": 298961, "epoch": 2470} {"train_loss": -41.663673400878906, "global_step": 298962, "epoch": 2470} {"train_loss": -42.43008041381836, "global_step": 298963, "epoch": 2470} {"train_loss": -42.0906867980957, "global_step": 298964, "epoch": 2470} {"train_loss": -41.98136520385742, "global_step": 298965, "epoch": 2470} {"train_loss": -42.639034271240234, "global_step": 298966, "epoch": 2470} {"train_loss": -42.58053207397461, "global_step": 298967, "epoch": 2470} {"train_loss": -42.625579833984375, "global_step": 298968, "epoch": 2470} {"train_loss": -41.8147087097168, "global_step": 298969, "epoch": 2470} {"train_loss": -42.68136978149414, "global_step": 298970, "epoch": 2470} {"train_loss": -41.834590911865234, "global_step": 298971, "epoch": 2470} {"train_loss": -43.07232666015625, "global_step": 298972, "epoch": 2470} {"train_loss": -43.29510498046875, "global_step": 298973, "epoch": 2470} {"train_loss": -42.70960235595703, "global_step": 298974, "epoch": 2470} {"train_loss": -40.83835983276367, "global_step": 298975, "epoch": 2470} {"train_loss": -42.57635498046875, "global_step": 298976, "epoch": 2470} {"train_loss": -42.72003173828125, "global_step": 298977, "epoch": 2470} {"train_loss": -42.75041580200195, "global_step": 298978, "epoch": 2470} {"train_loss": -42.18818283081055, "global_step": 298979, "epoch": 2470} {"train_loss": -42.90663528442383, "global_step": 298980, "epoch": 2470} {"train_loss": -42.74034881591797, "global_step": 298981, "epoch": 2470} {"train_loss": -43.31298065185547, "global_step": 298982, "epoch": 2470} {"train_loss": -42.13713455200195, "global_step": 298983, "epoch": 2470} {"train_loss": -42.3875732421875, "global_step": 298984, "epoch": 2470} {"train_loss": -43.48445129394531, "global_step": 298985, "epoch": 2470} {"train_loss": -43.17546081542969, "global_step": 298986, "epoch": 2470} {"train_loss": -43.29911804199219, "global_step": 298987, "epoch": 2470} {"train_loss": -43.08543014526367, "global_step": 298988, "epoch": 2470} {"train_loss": -42.78171157836914, "global_step": 298989, "epoch": 2470} {"train_loss": -40.72875834693593, "global_step": 298990, "epoch": 2470, "val_loss": 2563637.75} {"train_loss": -43.354366302490234, "global_step": 298991, "epoch": 2471} {"train_loss": -43.427154541015625, "global_step": 298992, "epoch": 2471} {"train_loss": -43.31935501098633, "global_step": 298993, "epoch": 2471} {"train_loss": -43.5374755859375, "global_step": 298994, "epoch": 2471} {"train_loss": -42.679100036621094, "global_step": 298995, "epoch": 2471} {"train_loss": -43.62299728393555, "global_step": 298996, "epoch": 2471} {"train_loss": -43.40423583984375, "global_step": 298997, "epoch": 2471} {"train_loss": -42.57157516479492, "global_step": 298998, "epoch": 2471} {"train_loss": -43.824764251708984, "global_step": 298999, "epoch": 2471} {"train_loss": -43.9365348815918, "global_step": 299000, "epoch": 2471} {"train_loss": -42.27613830566406, "global_step": 299001, "epoch": 2471} {"train_loss": -43.73897933959961, "global_step": 299002, "epoch": 2471} {"train_loss": -43.499549865722656, "global_step": 299003, "epoch": 2471} {"train_loss": -44.206600189208984, "global_step": 299004, "epoch": 2471} {"train_loss": -42.98773193359375, "global_step": 299005, "epoch": 2471} {"train_loss": -43.12923812866211, "global_step": 299006, "epoch": 2471} {"train_loss": -42.57026290893555, "global_step": 299007, "epoch": 2471} {"train_loss": -43.815589904785156, "global_step": 299008, "epoch": 2471} {"train_loss": -42.94963836669922, "global_step": 299009, "epoch": 2471} {"train_loss": -43.163604736328125, "global_step": 299010, "epoch": 2471} {"train_loss": -43.61737823486328, "global_step": 299011, "epoch": 2471} {"train_loss": -43.709877014160156, "global_step": 299012, "epoch": 2471} {"train_loss": -43.08522033691406, "global_step": 299013, "epoch": 2471} {"train_loss": -44.251220703125, "global_step": 299014, "epoch": 2471} {"train_loss": -44.776336669921875, "global_step": 299015, "epoch": 2471} {"train_loss": -42.93387985229492, "global_step": 299016, "epoch": 2471} {"train_loss": -42.601463317871094, "global_step": 299017, "epoch": 2471} {"train_loss": -44.198001861572266, "global_step": 299018, "epoch": 2471} {"train_loss": -44.02054977416992, "global_step": 299019, "epoch": 2471} {"train_loss": -43.53622055053711, "global_step": 299020, "epoch": 2471} {"train_loss": -43.04985427856445, "global_step": 299021, "epoch": 2471} {"train_loss": -43.92306137084961, "global_step": 299022, "epoch": 2471} {"train_loss": -42.565792083740234, "global_step": 299023, "epoch": 2471} {"train_loss": -43.4284553527832, "global_step": 299024, "epoch": 2471} {"train_loss": -43.68435287475586, "global_step": 299025, "epoch": 2471} {"train_loss": -43.61296463012695, "global_step": 299026, "epoch": 2471} {"train_loss": -41.691986083984375, "global_step": 299027, "epoch": 2471} {"train_loss": -43.26953887939453, "global_step": 299028, "epoch": 2471} {"train_loss": -44.103126525878906, "global_step": 299029, "epoch": 2471} {"train_loss": -43.69203567504883, "global_step": 299030, "epoch": 2471} {"train_loss": -41.4175910949707, "global_step": 299031, "epoch": 2471} {"train_loss": -39.15571594238281, "global_step": 299032, "epoch": 2471} {"train_loss": -42.41762161254883, "global_step": 299033, "epoch": 2471} {"train_loss": -41.57163619995117, "global_step": 299034, "epoch": 2471} {"train_loss": -42.58022689819336, "global_step": 299035, "epoch": 2471} {"train_loss": -42.08207321166992, "global_step": 299036, "epoch": 2471} {"train_loss": -39.260738372802734, "global_step": 299037, "epoch": 2471} {"train_loss": -41.533260345458984, "global_step": 299038, "epoch": 2471} {"train_loss": -36.77364730834961, "global_step": 299039, "epoch": 2471} {"train_loss": -36.79155349731445, "global_step": 299040, "epoch": 2471} {"train_loss": -36.84505844116211, "global_step": 299041, "epoch": 2471} {"train_loss": -36.11890411376953, "global_step": 299042, "epoch": 2471} {"train_loss": -36.406982421875, "global_step": 299043, "epoch": 2471} {"train_loss": -35.611846923828125, "global_step": 299044, "epoch": 2471} {"train_loss": -35.940032958984375, "global_step": 299045, "epoch": 2471} {"train_loss": -34.299652099609375, "global_step": 299046, "epoch": 2471} {"train_loss": -32.57209014892578, "global_step": 299047, "epoch": 2471} {"train_loss": -36.43378829956055, "global_step": 299048, "epoch": 2471} {"train_loss": -35.94130325317383, "global_step": 299049, "epoch": 2471} {"train_loss": -34.13125228881836, "global_step": 299050, "epoch": 2471} {"train_loss": -36.85625076293945, "global_step": 299051, "epoch": 2471} {"train_loss": -35.395389556884766, "global_step": 299052, "epoch": 2471} {"train_loss": -37.44135665893555, "global_step": 299053, "epoch": 2471} {"train_loss": -36.55680465698242, "global_step": 299054, "epoch": 2471} {"train_loss": -36.3987922668457, "global_step": 299055, "epoch": 2471} {"train_loss": -37.69662094116211, "global_step": 299056, "epoch": 2471} {"train_loss": -36.936279296875, "global_step": 299057, "epoch": 2471} {"train_loss": -38.180782318115234, "global_step": 299058, "epoch": 2471} {"train_loss": -37.17924880981445, "global_step": 299059, "epoch": 2471} {"train_loss": -38.74633026123047, "global_step": 299060, "epoch": 2471} {"train_loss": -37.992000579833984, "global_step": 299061, "epoch": 2471} {"train_loss": -38.481319427490234, "global_step": 299062, "epoch": 2471} {"train_loss": -37.8393440246582, "global_step": 299063, "epoch": 2471} {"train_loss": -38.43120193481445, "global_step": 299064, "epoch": 2471} {"train_loss": -38.74983215332031, "global_step": 299065, "epoch": 2471} {"train_loss": -39.523685455322266, "global_step": 299066, "epoch": 2471} {"train_loss": -39.3859748840332, "global_step": 299067, "epoch": 2471} {"train_loss": -38.901153564453125, "global_step": 299068, "epoch": 2471} {"train_loss": -39.479366302490234, "global_step": 299069, "epoch": 2471} {"train_loss": -39.271480560302734, "global_step": 299070, "epoch": 2471} {"train_loss": -39.57727813720703, "global_step": 299071, "epoch": 2471} {"train_loss": -39.7122917175293, "global_step": 299072, "epoch": 2471} {"train_loss": -40.01540756225586, "global_step": 299073, "epoch": 2471} {"train_loss": -39.4376106262207, "global_step": 299074, "epoch": 2471} {"train_loss": -40.18821334838867, "global_step": 299075, "epoch": 2471} {"train_loss": -40.0391960144043, "global_step": 299076, "epoch": 2471} {"train_loss": -40.4376106262207, "global_step": 299077, "epoch": 2471} {"train_loss": -39.858245849609375, "global_step": 299078, "epoch": 2471} {"train_loss": -40.3142204284668, "global_step": 299079, "epoch": 2471} {"train_loss": -40.8293342590332, "global_step": 299080, "epoch": 2471} {"train_loss": -40.413875579833984, "global_step": 299081, "epoch": 2471} {"train_loss": -40.87336349487305, "global_step": 299082, "epoch": 2471} {"train_loss": -41.042152404785156, "global_step": 299083, "epoch": 2471} {"train_loss": -40.411563873291016, "global_step": 299084, "epoch": 2471} {"train_loss": -40.49250411987305, "global_step": 299085, "epoch": 2471} {"train_loss": -40.59539794921875, "global_step": 299086, "epoch": 2471} {"train_loss": -41.55752944946289, "global_step": 299087, "epoch": 2471} {"train_loss": -41.140113830566406, "global_step": 299088, "epoch": 2471} {"train_loss": -41.44968795776367, "global_step": 299089, "epoch": 2471} {"train_loss": -41.580780029296875, "global_step": 299090, "epoch": 2471} {"train_loss": -41.5143928527832, "global_step": 299091, "epoch": 2471} {"train_loss": -41.049076080322266, "global_step": 299092, "epoch": 2471} {"train_loss": -41.571407318115234, "global_step": 299093, "epoch": 2471} {"train_loss": -42.09257888793945, "global_step": 299094, "epoch": 2471} {"train_loss": -41.7555046081543, "global_step": 299095, "epoch": 2471} {"train_loss": -41.921077728271484, "global_step": 299096, "epoch": 2471} {"train_loss": -41.535457611083984, "global_step": 299097, "epoch": 2471} {"train_loss": -41.01601791381836, "global_step": 299098, "epoch": 2471} {"train_loss": -40.68388366699219, "global_step": 299099, "epoch": 2471} {"train_loss": -41.12260818481445, "global_step": 299100, "epoch": 2471} {"train_loss": -40.671268463134766, "global_step": 299101, "epoch": 2471} {"train_loss": -41.67803955078125, "global_step": 299102, "epoch": 2471} {"train_loss": -41.98369216918945, "global_step": 299103, "epoch": 2471} {"train_loss": -40.76701736450195, "global_step": 299104, "epoch": 2471} {"train_loss": -41.279476165771484, "global_step": 299105, "epoch": 2471} {"train_loss": -40.71427917480469, "global_step": 299106, "epoch": 2471} {"train_loss": -41.521644592285156, "global_step": 299107, "epoch": 2471} {"train_loss": -41.83030319213867, "global_step": 299108, "epoch": 2471} {"train_loss": -41.20089340209961, "global_step": 299109, "epoch": 2471} {"train_loss": -42.39157485961914, "global_step": 299110, "epoch": 2471} {"train_loss": -40.77907161870279, "global_step": 299111, "epoch": 2471, "val_loss": 2740901.5} {"train_loss": -42.02158737182617, "global_step": 299112, "epoch": 2472} {"train_loss": -39.24442672729492, "global_step": 299113, "epoch": 2472} {"train_loss": -42.57316589355469, "global_step": 299114, "epoch": 2472} {"train_loss": -41.47211456298828, "global_step": 299115, "epoch": 2472} {"train_loss": -42.53059387207031, "global_step": 299116, "epoch": 2472} {"train_loss": -42.85325241088867, "global_step": 299117, "epoch": 2472} {"train_loss": -42.40370178222656, "global_step": 299118, "epoch": 2472} {"train_loss": -43.10395431518555, "global_step": 299119, "epoch": 2472} {"train_loss": -42.05166244506836, "global_step": 299120, "epoch": 2472} {"train_loss": -42.373165130615234, "global_step": 299121, "epoch": 2472} {"train_loss": -37.7633056640625, "global_step": 299122, "epoch": 2472} {"train_loss": -41.46910858154297, "global_step": 299123, "epoch": 2472} {"train_loss": -39.751888275146484, "global_step": 299124, "epoch": 2472} {"train_loss": -40.665748596191406, "global_step": 299125, "epoch": 2472} {"train_loss": -41.055599212646484, "global_step": 299126, "epoch": 2472} {"train_loss": -39.65730667114258, "global_step": 299127, "epoch": 2472} {"train_loss": -41.87655258178711, "global_step": 299128, "epoch": 2472} {"train_loss": -39.62701416015625, "global_step": 299129, "epoch": 2472} {"train_loss": -40.150360107421875, "global_step": 299130, "epoch": 2472} {"train_loss": -40.111610412597656, "global_step": 299131, "epoch": 2472} {"train_loss": -40.7484016418457, "global_step": 299132, "epoch": 2472} {"train_loss": -41.162841796875, "global_step": 299133, "epoch": 2472} {"train_loss": -40.13005065917969, "global_step": 299134, "epoch": 2472} {"train_loss": -41.45692825317383, "global_step": 299135, "epoch": 2472} {"train_loss": -40.32424545288086, "global_step": 299136, "epoch": 2472} {"train_loss": -40.64037322998047, "global_step": 299137, "epoch": 2472} {"train_loss": -41.96550369262695, "global_step": 299138, "epoch": 2472} {"train_loss": -40.92988586425781, "global_step": 299139, "epoch": 2472} {"train_loss": -40.92267990112305, "global_step": 299140, "epoch": 2472} {"train_loss": -42.45743942260742, "global_step": 299141, "epoch": 2472} {"train_loss": -41.426002502441406, "global_step": 299142, "epoch": 2472} {"train_loss": -42.724178314208984, "global_step": 299143, "epoch": 2472} {"train_loss": -41.67719650268555, "global_step": 299144, "epoch": 2472} {"train_loss": -41.87481689453125, "global_step": 299145, "epoch": 2472} {"train_loss": -41.77716064453125, "global_step": 299146, "epoch": 2472} {"train_loss": -42.38214874267578, "global_step": 299147, "epoch": 2472} {"train_loss": -42.04047775268555, "global_step": 299148, "epoch": 2472} {"train_loss": -42.064144134521484, "global_step": 299149, "epoch": 2472} {"train_loss": -41.71163558959961, "global_step": 299150, "epoch": 2472} {"train_loss": -42.763763427734375, "global_step": 299151, "epoch": 2472} {"train_loss": -41.46479415893555, "global_step": 299152, "epoch": 2472} {"train_loss": -40.93833541870117, "global_step": 299153, "epoch": 2472} {"train_loss": -41.71243667602539, "global_step": 299154, "epoch": 2472} {"train_loss": -41.74949645996094, "global_step": 299155, "epoch": 2472} {"train_loss": -42.314674377441406, "global_step": 299156, "epoch": 2472} {"train_loss": -41.96702194213867, "global_step": 299157, "epoch": 2472} {"train_loss": -42.17763900756836, "global_step": 299158, "epoch": 2472} {"train_loss": -42.68113708496094, "global_step": 299159, "epoch": 2472} {"train_loss": -42.1374626159668, "global_step": 299160, "epoch": 2472} {"train_loss": -42.370670318603516, "global_step": 299161, "epoch": 2472} {"train_loss": -42.10963821411133, "global_step": 299162, "epoch": 2472} {"train_loss": -40.8896369934082, "global_step": 299163, "epoch": 2472} {"train_loss": -40.92860412597656, "global_step": 299164, "epoch": 2472} {"train_loss": -39.67378616333008, "global_step": 299165, "epoch": 2472} {"train_loss": -39.57756042480469, "global_step": 299166, "epoch": 2472} {"train_loss": -41.352230072021484, "global_step": 299167, "epoch": 2472} {"train_loss": -41.61231994628906, "global_step": 299168, "epoch": 2472} {"train_loss": -39.86511993408203, "global_step": 299169, "epoch": 2472} {"train_loss": -42.50333023071289, "global_step": 299170, "epoch": 2472} {"train_loss": -40.381195068359375, "global_step": 299171, "epoch": 2472} {"train_loss": -41.53515625, "global_step": 299172, "epoch": 2472} {"train_loss": -41.108375549316406, "global_step": 299173, "epoch": 2472} {"train_loss": -41.181148529052734, "global_step": 299174, "epoch": 2472} {"train_loss": -41.73787307739258, "global_step": 299175, "epoch": 2472} {"train_loss": -38.975284576416016, "global_step": 299176, "epoch": 2472} {"train_loss": -41.352848052978516, "global_step": 299177, "epoch": 2472} {"train_loss": -38.68391036987305, "global_step": 299178, "epoch": 2472} {"train_loss": -40.79615783691406, "global_step": 299179, "epoch": 2472} {"train_loss": -41.09041976928711, "global_step": 299180, "epoch": 2472} {"train_loss": -36.58820343017578, "global_step": 299181, "epoch": 2472} {"train_loss": -35.81575393676758, "global_step": 299182, "epoch": 2472} {"train_loss": -38.55183029174805, "global_step": 299183, "epoch": 2472} {"train_loss": -41.73263168334961, "global_step": 299184, "epoch": 2472} {"train_loss": -36.778350830078125, "global_step": 299185, "epoch": 2472} {"train_loss": -34.264644622802734, "global_step": 299186, "epoch": 2472} {"train_loss": -38.54148864746094, "global_step": 299187, "epoch": 2472} {"train_loss": -41.1901969909668, "global_step": 299188, "epoch": 2472} {"train_loss": -37.74494552612305, "global_step": 299189, "epoch": 2472} {"train_loss": -35.21246337890625, "global_step": 299190, "epoch": 2472} {"train_loss": -41.84368896484375, "global_step": 299191, "epoch": 2472} {"train_loss": -37.5278434753418, "global_step": 299192, "epoch": 2472} {"train_loss": -38.744834899902344, "global_step": 299193, "epoch": 2472} {"train_loss": -40.77939987182617, "global_step": 299194, "epoch": 2472} {"train_loss": -39.587276458740234, "global_step": 299195, "epoch": 2472} {"train_loss": -40.47675323486328, "global_step": 299196, "epoch": 2472} {"train_loss": -38.94955062866211, "global_step": 299197, "epoch": 2472} {"train_loss": -40.517974853515625, "global_step": 299198, "epoch": 2472} {"train_loss": -41.030181884765625, "global_step": 299199, "epoch": 2472} {"train_loss": -40.5504150390625, "global_step": 299200, "epoch": 2472} {"train_loss": -41.731964111328125, "global_step": 299201, "epoch": 2472} {"train_loss": -41.13608169555664, "global_step": 299202, "epoch": 2472} {"train_loss": -39.187339782714844, "global_step": 299203, "epoch": 2472} {"train_loss": -40.50997543334961, "global_step": 299204, "epoch": 2472} {"train_loss": -40.046661376953125, "global_step": 299205, "epoch": 2472} {"train_loss": -41.6162109375, "global_step": 299206, "epoch": 2472} {"train_loss": -39.31106948852539, "global_step": 299207, "epoch": 2472} {"train_loss": -41.84614944458008, "global_step": 299208, "epoch": 2472} {"train_loss": -39.64951705932617, "global_step": 299209, "epoch": 2472} {"train_loss": -41.61124801635742, "global_step": 299210, "epoch": 2472} {"train_loss": -40.64947509765625, "global_step": 299211, "epoch": 2472} {"train_loss": -41.77492904663086, "global_step": 299212, "epoch": 2472} {"train_loss": -40.9269905090332, "global_step": 299213, "epoch": 2472} {"train_loss": -41.49683380126953, "global_step": 299214, "epoch": 2472} {"train_loss": -42.158321380615234, "global_step": 299215, "epoch": 2472} {"train_loss": -41.42789077758789, "global_step": 299216, "epoch": 2472} {"train_loss": -42.32120895385742, "global_step": 299217, "epoch": 2472} {"train_loss": -40.752532958984375, "global_step": 299218, "epoch": 2472} {"train_loss": -43.12565994262695, "global_step": 299219, "epoch": 2472} {"train_loss": -41.781124114990234, "global_step": 299220, "epoch": 2472} {"train_loss": -42.78214645385742, "global_step": 299221, "epoch": 2472} {"train_loss": -42.279964447021484, "global_step": 299222, "epoch": 2472} {"train_loss": -42.323795318603516, "global_step": 299223, "epoch": 2472} {"train_loss": -42.792938232421875, "global_step": 299224, "epoch": 2472} {"train_loss": -42.73311996459961, "global_step": 299225, "epoch": 2472} {"train_loss": -42.624908447265625, "global_step": 299226, "epoch": 2472} {"train_loss": -42.570247650146484, "global_step": 299227, "epoch": 2472} {"train_loss": -41.83085250854492, "global_step": 299228, "epoch": 2472} {"train_loss": -43.09043884277344, "global_step": 299229, "epoch": 2472} {"train_loss": -42.931880950927734, "global_step": 299230, "epoch": 2472} {"train_loss": -43.148006439208984, "global_step": 299231, "epoch": 2472} {"train_loss": -40.99270901010056, "global_step": 299232, "epoch": 2472, "val_loss": 2684980.75} {"train_loss": -42.00241470336914, "global_step": 299233, "epoch": 2473} {"train_loss": -42.95675277709961, "global_step": 299234, "epoch": 2473} {"train_loss": -42.88522720336914, "global_step": 299235, "epoch": 2473} {"train_loss": -43.1170539855957, "global_step": 299236, "epoch": 2473} {"train_loss": -43.060970306396484, "global_step": 299237, "epoch": 2473} {"train_loss": -43.181941986083984, "global_step": 299238, "epoch": 2473} {"train_loss": -42.790462493896484, "global_step": 299239, "epoch": 2473} {"train_loss": -43.34383010864258, "global_step": 299240, "epoch": 2473} {"train_loss": -43.74369430541992, "global_step": 299241, "epoch": 2473} {"train_loss": -43.77085494995117, "global_step": 299242, "epoch": 2473} {"train_loss": -43.47714614868164, "global_step": 299243, "epoch": 2473} {"train_loss": -43.7562370300293, "global_step": 299244, "epoch": 2473} {"train_loss": -43.61787796020508, "global_step": 299245, "epoch": 2473} {"train_loss": -43.753597259521484, "global_step": 299246, "epoch": 2473} {"train_loss": -43.62897872924805, "global_step": 299247, "epoch": 2473} {"train_loss": -44.10042190551758, "global_step": 299248, "epoch": 2473} {"train_loss": -43.23005294799805, "global_step": 299249, "epoch": 2473} {"train_loss": -43.9076042175293, "global_step": 299250, "epoch": 2473} {"train_loss": -43.6640739440918, "global_step": 299251, "epoch": 2473} {"train_loss": -44.01023483276367, "global_step": 299252, "epoch": 2473} {"train_loss": -44.06624221801758, "global_step": 299253, "epoch": 2473} {"train_loss": -44.198333740234375, "global_step": 299254, "epoch": 2473} {"train_loss": -44.246864318847656, "global_step": 299255, "epoch": 2473} {"train_loss": -43.85164260864258, "global_step": 299256, "epoch": 2473} {"train_loss": -43.6669921875, "global_step": 299257, "epoch": 2473} {"train_loss": -43.897884368896484, "global_step": 299258, "epoch": 2473} {"train_loss": -43.53596115112305, "global_step": 299259, "epoch": 2473} {"train_loss": -43.63155746459961, "global_step": 299260, "epoch": 2473} {"train_loss": -43.94073486328125, "global_step": 299261, "epoch": 2473} {"train_loss": -43.7053337097168, "global_step": 299262, "epoch": 2473} {"train_loss": -44.28047561645508, "global_step": 299263, "epoch": 2473} {"train_loss": -44.282413482666016, "global_step": 299264, "epoch": 2473} {"train_loss": -44.66183090209961, "global_step": 299265, "epoch": 2473} {"train_loss": -44.379207611083984, "global_step": 299266, "epoch": 2473} {"train_loss": -44.53605270385742, "global_step": 299267, "epoch": 2473} {"train_loss": -43.804283142089844, "global_step": 299268, "epoch": 2473} {"train_loss": -44.60315704345703, "global_step": 299269, "epoch": 2473} {"train_loss": -44.195701599121094, "global_step": 299270, "epoch": 2473} {"train_loss": -44.29488754272461, "global_step": 299271, "epoch": 2473} {"train_loss": -44.13322067260742, "global_step": 299272, "epoch": 2473} {"train_loss": -44.01304244995117, "global_step": 299273, "epoch": 2473} {"train_loss": -43.56158447265625, "global_step": 299274, "epoch": 2473} {"train_loss": -44.18839645385742, "global_step": 299275, "epoch": 2473} {"train_loss": -44.59035110473633, "global_step": 299276, "epoch": 2473} {"train_loss": -44.128089904785156, "global_step": 299277, "epoch": 2473} {"train_loss": -44.35001754760742, "global_step": 299278, "epoch": 2473} {"train_loss": -44.82160186767578, "global_step": 299279, "epoch": 2473} {"train_loss": -44.578792572021484, "global_step": 299280, "epoch": 2473} {"train_loss": -45.35982894897461, "global_step": 299281, "epoch": 2473} {"train_loss": -44.01377487182617, "global_step": 299282, "epoch": 2473} {"train_loss": -44.748714447021484, "global_step": 299283, "epoch": 2473} {"train_loss": -44.64424514770508, "global_step": 299284, "epoch": 2473} {"train_loss": -43.308387756347656, "global_step": 299285, "epoch": 2473} {"train_loss": -41.97735595703125, "global_step": 299286, "epoch": 2473} {"train_loss": -44.26555633544922, "global_step": 299287, "epoch": 2473} {"train_loss": -44.3957405090332, "global_step": 299288, "epoch": 2473} {"train_loss": -43.22661209106445, "global_step": 299289, "epoch": 2473} {"train_loss": -42.30317306518555, "global_step": 299290, "epoch": 2473} {"train_loss": -43.29353713989258, "global_step": 299291, "epoch": 2473} {"train_loss": -43.7204475402832, "global_step": 299292, "epoch": 2473} {"train_loss": -44.51239776611328, "global_step": 299293, "epoch": 2473} {"train_loss": -43.83943557739258, "global_step": 299294, "epoch": 2473} {"train_loss": -42.6771354675293, "global_step": 299295, "epoch": 2473} {"train_loss": -43.572505950927734, "global_step": 299296, "epoch": 2473} {"train_loss": -43.7352294921875, "global_step": 299297, "epoch": 2473} {"train_loss": -43.9141960144043, "global_step": 299298, "epoch": 2473} {"train_loss": -41.38247299194336, "global_step": 299299, "epoch": 2473} {"train_loss": -43.6038932800293, "global_step": 299300, "epoch": 2473} {"train_loss": -43.67451095581055, "global_step": 299301, "epoch": 2473} {"train_loss": -41.95581817626953, "global_step": 299302, "epoch": 2473} {"train_loss": -41.05601119995117, "global_step": 299303, "epoch": 2473} {"train_loss": -42.91875076293945, "global_step": 299304, "epoch": 2473} {"train_loss": -43.03411865234375, "global_step": 299305, "epoch": 2473} {"train_loss": -43.26765060424805, "global_step": 299306, "epoch": 2473} {"train_loss": -43.4956169128418, "global_step": 299307, "epoch": 2473} {"train_loss": -42.83015823364258, "global_step": 299308, "epoch": 2473} {"train_loss": -40.26753616333008, "global_step": 299309, "epoch": 2473} {"train_loss": -41.01689147949219, "global_step": 299310, "epoch": 2473} {"train_loss": -42.47846603393555, "global_step": 299311, "epoch": 2473} {"train_loss": -40.296852111816406, "global_step": 299312, "epoch": 2473} {"train_loss": -41.42509841918945, "global_step": 299313, "epoch": 2473} {"train_loss": -41.760223388671875, "global_step": 299314, "epoch": 2473} {"train_loss": -42.575679779052734, "global_step": 299315, "epoch": 2473} {"train_loss": -41.873287200927734, "global_step": 299316, "epoch": 2473} {"train_loss": -41.140045166015625, "global_step": 299317, "epoch": 2473} {"train_loss": -42.515262603759766, "global_step": 299318, "epoch": 2473} {"train_loss": -43.09490966796875, "global_step": 299319, "epoch": 2473} {"train_loss": -41.192745208740234, "global_step": 299320, "epoch": 2473} {"train_loss": -43.30839157104492, "global_step": 299321, "epoch": 2473} {"train_loss": -42.51488494873047, "global_step": 299322, "epoch": 2473} {"train_loss": -41.25569534301758, "global_step": 299323, "epoch": 2473} {"train_loss": -41.603057861328125, "global_step": 299324, "epoch": 2473} {"train_loss": -41.89186477661133, "global_step": 299325, "epoch": 2473} {"train_loss": -41.793373107910156, "global_step": 299326, "epoch": 2473} {"train_loss": -43.149017333984375, "global_step": 299327, "epoch": 2473} {"train_loss": -40.881866455078125, "global_step": 299328, "epoch": 2473} {"train_loss": -43.518882751464844, "global_step": 299329, "epoch": 2473} {"train_loss": -41.74570083618164, "global_step": 299330, "epoch": 2473} {"train_loss": -41.43475341796875, "global_step": 299331, "epoch": 2473} {"train_loss": -41.63882064819336, "global_step": 299332, "epoch": 2473} {"train_loss": -41.058475494384766, "global_step": 299333, "epoch": 2473} {"train_loss": -41.827735900878906, "global_step": 299334, "epoch": 2473} {"train_loss": -41.88090896606445, "global_step": 299335, "epoch": 2473} {"train_loss": -40.404090881347656, "global_step": 299336, "epoch": 2473} {"train_loss": -43.03912353515625, "global_step": 299337, "epoch": 2473} {"train_loss": -40.082515716552734, "global_step": 299338, "epoch": 2473} {"train_loss": -40.54997253417969, "global_step": 299339, "epoch": 2473} {"train_loss": -42.74607467651367, "global_step": 299340, "epoch": 2473} {"train_loss": -40.6834831237793, "global_step": 299341, "epoch": 2473} {"train_loss": -42.50215530395508, "global_step": 299342, "epoch": 2473} {"train_loss": -41.901485443115234, "global_step": 299343, "epoch": 2473} {"train_loss": -42.818267822265625, "global_step": 299344, "epoch": 2473} {"train_loss": -40.219058990478516, "global_step": 299345, "epoch": 2473} {"train_loss": -42.83456039428711, "global_step": 299346, "epoch": 2473} {"train_loss": -40.0225715637207, "global_step": 299347, "epoch": 2473} {"train_loss": -42.94904327392578, "global_step": 299348, "epoch": 2473} {"train_loss": -41.42817306518555, "global_step": 299349, "epoch": 2473} {"train_loss": -42.12114715576172, "global_step": 299350, "epoch": 2473} {"train_loss": -42.4243278503418, "global_step": 299351, "epoch": 2473} {"train_loss": -41.618865966796875, "global_step": 299352, "epoch": 2473} {"train_loss": -42.97290243984254, "global_step": 299353, "epoch": 2473, "val_loss": 2653220.0} {"train_loss": -42.5941276550293, "global_step": 299354, "epoch": 2474} {"train_loss": -42.084556579589844, "global_step": 299355, "epoch": 2474} {"train_loss": -42.81107711791992, "global_step": 299356, "epoch": 2474} {"train_loss": -43.05686569213867, "global_step": 299357, "epoch": 2474} {"train_loss": -41.1357307434082, "global_step": 299358, "epoch": 2474} {"train_loss": -42.84706497192383, "global_step": 299359, "epoch": 2474} {"train_loss": -42.80287551879883, "global_step": 299360, "epoch": 2474} {"train_loss": -43.1839714050293, "global_step": 299361, "epoch": 2474} {"train_loss": -42.868690490722656, "global_step": 299362, "epoch": 2474} {"train_loss": -43.66010665893555, "global_step": 299363, "epoch": 2474} {"train_loss": -42.99671936035156, "global_step": 299364, "epoch": 2474} {"train_loss": -43.75978088378906, "global_step": 299365, "epoch": 2474} {"train_loss": -42.570369720458984, "global_step": 299366, "epoch": 2474} {"train_loss": -43.81441879272461, "global_step": 299367, "epoch": 2474} {"train_loss": -42.95722198486328, "global_step": 299368, "epoch": 2474} {"train_loss": -42.967830657958984, "global_step": 299369, "epoch": 2474} {"train_loss": -42.23221206665039, "global_step": 299370, "epoch": 2474} {"train_loss": -42.095706939697266, "global_step": 299371, "epoch": 2474} {"train_loss": -43.25813674926758, "global_step": 299372, "epoch": 2474} {"train_loss": -43.135772705078125, "global_step": 299373, "epoch": 2474} {"train_loss": -43.2780647277832, "global_step": 299374, "epoch": 2474} {"train_loss": -43.06675338745117, "global_step": 299375, "epoch": 2474} {"train_loss": -44.1396598815918, "global_step": 299376, "epoch": 2474} {"train_loss": -43.38494873046875, "global_step": 299377, "epoch": 2474} {"train_loss": -43.57101058959961, "global_step": 299378, "epoch": 2474} {"train_loss": -44.35123062133789, "global_step": 299379, "epoch": 2474} {"train_loss": -43.693824768066406, "global_step": 299380, "epoch": 2474} {"train_loss": -44.11128616333008, "global_step": 299381, "epoch": 2474} {"train_loss": -44.146175384521484, "global_step": 299382, "epoch": 2474} {"train_loss": -43.577857971191406, "global_step": 299383, "epoch": 2474} {"train_loss": -43.34221267700195, "global_step": 299384, "epoch": 2474} {"train_loss": -43.8011474609375, "global_step": 299385, "epoch": 2474} {"train_loss": -43.74009323120117, "global_step": 299386, "epoch": 2474} {"train_loss": -44.284114837646484, "global_step": 299387, "epoch": 2474} {"train_loss": -44.3419303894043, "global_step": 299388, "epoch": 2474} {"train_loss": -43.67753219604492, "global_step": 299389, "epoch": 2474} {"train_loss": -44.23868179321289, "global_step": 299390, "epoch": 2474} {"train_loss": -44.428993225097656, "global_step": 299391, "epoch": 2474} {"train_loss": -44.5188102722168, "global_step": 299392, "epoch": 2474} {"train_loss": -44.298919677734375, "global_step": 299393, "epoch": 2474} {"train_loss": -44.026058197021484, "global_step": 299394, "epoch": 2474} {"train_loss": -44.39304733276367, "global_step": 299395, "epoch": 2474} {"train_loss": -44.47478485107422, "global_step": 299396, "epoch": 2474} {"train_loss": -43.70502471923828, "global_step": 299397, "epoch": 2474} {"train_loss": -44.405517578125, "global_step": 299398, "epoch": 2474} {"train_loss": -44.52133560180664, "global_step": 299399, "epoch": 2474} {"train_loss": -44.28779983520508, "global_step": 299400, "epoch": 2474} {"train_loss": -44.56502151489258, "global_step": 299401, "epoch": 2474} {"train_loss": -44.18099594116211, "global_step": 299402, "epoch": 2474} {"train_loss": -43.552364349365234, "global_step": 299403, "epoch": 2474} {"train_loss": -43.18085479736328, "global_step": 299404, "epoch": 2474} {"train_loss": -41.994873046875, "global_step": 299405, "epoch": 2474} {"train_loss": -44.490196228027344, "global_step": 299406, "epoch": 2474} {"train_loss": -43.7229118347168, "global_step": 299407, "epoch": 2474} {"train_loss": -43.1013298034668, "global_step": 299408, "epoch": 2474} {"train_loss": -43.51129913330078, "global_step": 299409, "epoch": 2474} {"train_loss": -42.15342712402344, "global_step": 299410, "epoch": 2474} {"train_loss": -44.44789123535156, "global_step": 299411, "epoch": 2474} {"train_loss": -44.27315902709961, "global_step": 299412, "epoch": 2474} {"train_loss": -43.15876388549805, "global_step": 299413, "epoch": 2474} {"train_loss": -42.37781524658203, "global_step": 299414, "epoch": 2474} {"train_loss": -43.956329345703125, "global_step": 299415, "epoch": 2474} {"train_loss": -42.76099395751953, "global_step": 299416, "epoch": 2474} {"train_loss": -44.45808792114258, "global_step": 299417, "epoch": 2474} {"train_loss": -42.56713104248047, "global_step": 299418, "epoch": 2474} {"train_loss": -43.94609451293945, "global_step": 299419, "epoch": 2474} {"train_loss": -44.53329086303711, "global_step": 299420, "epoch": 2474} {"train_loss": -43.91773223876953, "global_step": 299421, "epoch": 2474} {"train_loss": -43.90336990356445, "global_step": 299422, "epoch": 2474} {"train_loss": -44.102020263671875, "global_step": 299423, "epoch": 2474} {"train_loss": -44.277740478515625, "global_step": 299424, "epoch": 2474} {"train_loss": -44.0015983581543, "global_step": 299425, "epoch": 2474} {"train_loss": -44.23814010620117, "global_step": 299426, "epoch": 2474} {"train_loss": -43.79134750366211, "global_step": 299427, "epoch": 2474} {"train_loss": -44.6837272644043, "global_step": 299428, "epoch": 2474} {"train_loss": -44.001007080078125, "global_step": 299429, "epoch": 2474} {"train_loss": -44.30938720703125, "global_step": 299430, "epoch": 2474} {"train_loss": -42.894378662109375, "global_step": 299431, "epoch": 2474} {"train_loss": -43.86561965942383, "global_step": 299432, "epoch": 2474} {"train_loss": -44.04922103881836, "global_step": 299433, "epoch": 2474} {"train_loss": -42.86333465576172, "global_step": 299434, "epoch": 2474} {"train_loss": -43.783172607421875, "global_step": 299435, "epoch": 2474} {"train_loss": -42.4433708190918, "global_step": 299436, "epoch": 2474} {"train_loss": -44.520084381103516, "global_step": 299437, "epoch": 2474} {"train_loss": -42.9119758605957, "global_step": 299438, "epoch": 2474} {"train_loss": -44.69374465942383, "global_step": 299439, "epoch": 2474} {"train_loss": -42.49464416503906, "global_step": 299440, "epoch": 2474} {"train_loss": -43.91236114501953, "global_step": 299441, "epoch": 2474} {"train_loss": -42.98366165161133, "global_step": 299442, "epoch": 2474} {"train_loss": -44.27293014526367, "global_step": 299443, "epoch": 2474} {"train_loss": -43.259700775146484, "global_step": 299444, "epoch": 2474} {"train_loss": -43.40422821044922, "global_step": 299445, "epoch": 2474} {"train_loss": -43.40449142456055, "global_step": 299446, "epoch": 2474} {"train_loss": -42.965431213378906, "global_step": 299447, "epoch": 2474} {"train_loss": -43.7336311340332, "global_step": 299448, "epoch": 2474} {"train_loss": -42.8480339050293, "global_step": 299449, "epoch": 2474} {"train_loss": -43.719398498535156, "global_step": 299450, "epoch": 2474} {"train_loss": -42.39112091064453, "global_step": 299451, "epoch": 2474} {"train_loss": -44.16986846923828, "global_step": 299452, "epoch": 2474} {"train_loss": -43.3697395324707, "global_step": 299453, "epoch": 2474} {"train_loss": -43.71123123168945, "global_step": 299454, "epoch": 2474} {"train_loss": -42.4255256652832, "global_step": 299455, "epoch": 2474} {"train_loss": -44.15156173706055, "global_step": 299456, "epoch": 2474} {"train_loss": -42.50288391113281, "global_step": 299457, "epoch": 2474} {"train_loss": -43.49856185913086, "global_step": 299458, "epoch": 2474} {"train_loss": -43.719276428222656, "global_step": 299459, "epoch": 2474} {"train_loss": -44.07008743286133, "global_step": 299460, "epoch": 2474} {"train_loss": -43.51419448852539, "global_step": 299461, "epoch": 2474} {"train_loss": -43.119911193847656, "global_step": 299462, "epoch": 2474} {"train_loss": -44.14679718017578, "global_step": 299463, "epoch": 2474} {"train_loss": -44.02964401245117, "global_step": 299464, "epoch": 2474} {"train_loss": -42.86526107788086, "global_step": 299465, "epoch": 2474} {"train_loss": -43.547672271728516, "global_step": 299466, "epoch": 2474} {"train_loss": -43.54008102416992, "global_step": 299467, "epoch": 2474} {"train_loss": -41.34791564941406, "global_step": 299468, "epoch": 2474} {"train_loss": -44.04145050048828, "global_step": 299469, "epoch": 2474} {"train_loss": -40.38301467895508, "global_step": 299470, "epoch": 2474} {"train_loss": -43.52988815307617, "global_step": 299471, "epoch": 2474} {"train_loss": -38.01560592651367, "global_step": 299472, "epoch": 2474} {"train_loss": -42.86882781982422, "global_step": 299473, "epoch": 2474} {"train_loss": -43.395518468431206, "global_step": 299474, "epoch": 2474, "val_loss": 2613629.75} {"train_loss": -36.412841796875, "global_step": 299475, "epoch": 2475} {"train_loss": -39.064022064208984, "global_step": 299476, "epoch": 2475} {"train_loss": -38.44135665893555, "global_step": 299477, "epoch": 2475} {"train_loss": -36.46978759765625, "global_step": 299478, "epoch": 2475} {"train_loss": -37.266170501708984, "global_step": 299479, "epoch": 2475} {"train_loss": -39.59355926513672, "global_step": 299480, "epoch": 2475} {"train_loss": -37.787200927734375, "global_step": 299481, "epoch": 2475} {"train_loss": -40.73739242553711, "global_step": 299482, "epoch": 2475} {"train_loss": -39.65169906616211, "global_step": 299483, "epoch": 2475} {"train_loss": -37.63740158081055, "global_step": 299484, "epoch": 2475} {"train_loss": -38.94831466674805, "global_step": 299485, "epoch": 2475} {"train_loss": -39.716339111328125, "global_step": 299486, "epoch": 2475} {"train_loss": -40.81582260131836, "global_step": 299487, "epoch": 2475} {"train_loss": -38.9874382019043, "global_step": 299488, "epoch": 2475} {"train_loss": -40.118038177490234, "global_step": 299489, "epoch": 2475} {"train_loss": -40.99559020996094, "global_step": 299490, "epoch": 2475} {"train_loss": -40.92047119140625, "global_step": 299491, "epoch": 2475} {"train_loss": -42.31855010986328, "global_step": 299492, "epoch": 2475} {"train_loss": -40.4589958190918, "global_step": 299493, "epoch": 2475} {"train_loss": -42.31838607788086, "global_step": 299494, "epoch": 2475} {"train_loss": -40.509193420410156, "global_step": 299495, "epoch": 2475} {"train_loss": -41.51457595825195, "global_step": 299496, "epoch": 2475} {"train_loss": -41.929405212402344, "global_step": 299497, "epoch": 2475} {"train_loss": -41.41118240356445, "global_step": 299498, "epoch": 2475} {"train_loss": -42.428558349609375, "global_step": 299499, "epoch": 2475} {"train_loss": -42.12836837768555, "global_step": 299500, "epoch": 2475} {"train_loss": -42.381378173828125, "global_step": 299501, "epoch": 2475} {"train_loss": -42.34016036987305, "global_step": 299502, "epoch": 2475} {"train_loss": -42.362213134765625, "global_step": 299503, "epoch": 2475} {"train_loss": -42.72992706298828, "global_step": 299504, "epoch": 2475} {"train_loss": -41.82701110839844, "global_step": 299505, "epoch": 2475} {"train_loss": -42.53752517700195, "global_step": 299506, "epoch": 2475} {"train_loss": -42.60994338989258, "global_step": 299507, "epoch": 2475} {"train_loss": -42.10113525390625, "global_step": 299508, "epoch": 2475} {"train_loss": -43.4040641784668, "global_step": 299509, "epoch": 2475} {"train_loss": -42.466896057128906, "global_step": 299510, "epoch": 2475} {"train_loss": -42.87379837036133, "global_step": 299511, "epoch": 2475} {"train_loss": -43.04636764526367, "global_step": 299512, "epoch": 2475} {"train_loss": -43.7277717590332, "global_step": 299513, "epoch": 2475} {"train_loss": -43.033592224121094, "global_step": 299514, "epoch": 2475} {"train_loss": -42.855918884277344, "global_step": 299515, "epoch": 2475} {"train_loss": -43.380043029785156, "global_step": 299516, "epoch": 2475} {"train_loss": -43.36036682128906, "global_step": 299517, "epoch": 2475} {"train_loss": -43.530914306640625, "global_step": 299518, "epoch": 2475} {"train_loss": -42.81629180908203, "global_step": 299519, "epoch": 2475} {"train_loss": -44.053611755371094, "global_step": 299520, "epoch": 2475} {"train_loss": -43.51581573486328, "global_step": 299521, "epoch": 2475} {"train_loss": -44.05631637573242, "global_step": 299522, "epoch": 2475} {"train_loss": -43.246612548828125, "global_step": 299523, "epoch": 2475} {"train_loss": -43.93214416503906, "global_step": 299524, "epoch": 2475} {"train_loss": -43.33378601074219, "global_step": 299525, "epoch": 2475} {"train_loss": -43.05694580078125, "global_step": 299526, "epoch": 2475} {"train_loss": -43.61533737182617, "global_step": 299527, "epoch": 2475} {"train_loss": -42.33972930908203, "global_step": 299528, "epoch": 2475} {"train_loss": -43.05221176147461, "global_step": 299529, "epoch": 2475} {"train_loss": -43.32442092895508, "global_step": 299530, "epoch": 2475} {"train_loss": -43.60276412963867, "global_step": 299531, "epoch": 2475} {"train_loss": -42.9422721862793, "global_step": 299532, "epoch": 2475} {"train_loss": -43.80683135986328, "global_step": 299533, "epoch": 2475} {"train_loss": -43.396297454833984, "global_step": 299534, "epoch": 2475} {"train_loss": -42.41093063354492, "global_step": 299535, "epoch": 2475} {"train_loss": -43.83443832397461, "global_step": 299536, "epoch": 2475} {"train_loss": -41.55367660522461, "global_step": 299537, "epoch": 2475} {"train_loss": -43.04784393310547, "global_step": 299538, "epoch": 2475} {"train_loss": -43.01278305053711, "global_step": 299539, "epoch": 2475} {"train_loss": -42.15238952636719, "global_step": 299540, "epoch": 2475} {"train_loss": -44.14670944213867, "global_step": 299541, "epoch": 2475} {"train_loss": -41.875823974609375, "global_step": 299542, "epoch": 2475} {"train_loss": -43.54012680053711, "global_step": 299543, "epoch": 2475} {"train_loss": -42.374080657958984, "global_step": 299544, "epoch": 2475} {"train_loss": -42.25074768066406, "global_step": 299545, "epoch": 2475} {"train_loss": -43.568077087402344, "global_step": 299546, "epoch": 2475} {"train_loss": -43.065608978271484, "global_step": 299547, "epoch": 2475} {"train_loss": -44.09968185424805, "global_step": 299548, "epoch": 2475} {"train_loss": -43.43337631225586, "global_step": 299549, "epoch": 2475} {"train_loss": -42.54520034790039, "global_step": 299550, "epoch": 2475} {"train_loss": -44.01598358154297, "global_step": 299551, "epoch": 2475} {"train_loss": -42.66362380981445, "global_step": 299552, "epoch": 2475} {"train_loss": -43.8197135925293, "global_step": 299553, "epoch": 2475} {"train_loss": -43.8061408996582, "global_step": 299554, "epoch": 2475} {"train_loss": -43.13344955444336, "global_step": 299555, "epoch": 2475} {"train_loss": -43.97463607788086, "global_step": 299556, "epoch": 2475} {"train_loss": -42.30355453491211, "global_step": 299557, "epoch": 2475} {"train_loss": -43.69504928588867, "global_step": 299558, "epoch": 2475} {"train_loss": -43.276790618896484, "global_step": 299559, "epoch": 2475} {"train_loss": -42.82358932495117, "global_step": 299560, "epoch": 2475} {"train_loss": -44.228736877441406, "global_step": 299561, "epoch": 2475} {"train_loss": -43.1029167175293, "global_step": 299562, "epoch": 2475} {"train_loss": -44.4044189453125, "global_step": 299563, "epoch": 2475} {"train_loss": -43.78131866455078, "global_step": 299564, "epoch": 2475} {"train_loss": -42.697261810302734, "global_step": 299565, "epoch": 2475} {"train_loss": -43.48991012573242, "global_step": 299566, "epoch": 2475} {"train_loss": -43.6005973815918, "global_step": 299567, "epoch": 2475} {"train_loss": -44.177886962890625, "global_step": 299568, "epoch": 2475} {"train_loss": -43.783443450927734, "global_step": 299569, "epoch": 2475} {"train_loss": -43.77287673950195, "global_step": 299570, "epoch": 2475} {"train_loss": -43.705421447753906, "global_step": 299571, "epoch": 2475} {"train_loss": -42.915679931640625, "global_step": 299572, "epoch": 2475} {"train_loss": -43.2982063293457, "global_step": 299573, "epoch": 2475} {"train_loss": -43.37933349609375, "global_step": 299574, "epoch": 2475} {"train_loss": -43.78937911987305, "global_step": 299575, "epoch": 2475} {"train_loss": -44.22241973876953, "global_step": 299576, "epoch": 2475} {"train_loss": -42.85416793823242, "global_step": 299577, "epoch": 2475} {"train_loss": -44.34305953979492, "global_step": 299578, "epoch": 2475} {"train_loss": -44.27333450317383, "global_step": 299579, "epoch": 2475} {"train_loss": -43.07501983642578, "global_step": 299580, "epoch": 2475} {"train_loss": -42.85193634033203, "global_step": 299581, "epoch": 2475} {"train_loss": -43.11593246459961, "global_step": 299582, "epoch": 2475} {"train_loss": -43.425392150878906, "global_step": 299583, "epoch": 2475} {"train_loss": -44.33639144897461, "global_step": 299584, "epoch": 2475} {"train_loss": -43.83658981323242, "global_step": 299585, "epoch": 2475} {"train_loss": -43.10375213623047, "global_step": 299586, "epoch": 2475} {"train_loss": -43.3232307434082, "global_step": 299587, "epoch": 2475} {"train_loss": -43.83414077758789, "global_step": 299588, "epoch": 2475} {"train_loss": -44.425750732421875, "global_step": 299589, "epoch": 2475} {"train_loss": -44.33661651611328, "global_step": 299590, "epoch": 2475} {"train_loss": -44.5489387512207, "global_step": 299591, "epoch": 2475} {"train_loss": -44.3270263671875, "global_step": 299592, "epoch": 2475} {"train_loss": -44.08424758911133, "global_step": 299593, "epoch": 2475} {"train_loss": -43.799739837646484, "global_step": 299594, "epoch": 2475} {"train_loss": -42.58834198880787, "global_step": 299595, "epoch": 2475, "val_loss": 2614517.75} {"train_loss": -44.65072250366211, "global_step": 299596, "epoch": 2476} {"train_loss": -43.71321487426758, "global_step": 299597, "epoch": 2476} {"train_loss": -44.293907165527344, "global_step": 299598, "epoch": 2476} {"train_loss": -44.15085983276367, "global_step": 299599, "epoch": 2476} {"train_loss": -44.150001525878906, "global_step": 299600, "epoch": 2476} {"train_loss": -43.721595764160156, "global_step": 299601, "epoch": 2476} {"train_loss": -43.898338317871094, "global_step": 299602, "epoch": 2476} {"train_loss": -44.41825866699219, "global_step": 299603, "epoch": 2476} {"train_loss": -43.64553451538086, "global_step": 299604, "epoch": 2476} {"train_loss": -43.75031661987305, "global_step": 299605, "epoch": 2476} {"train_loss": -43.84284591674805, "global_step": 299606, "epoch": 2476} {"train_loss": -43.60565948486328, "global_step": 299607, "epoch": 2476} {"train_loss": -42.97608184814453, "global_step": 299608, "epoch": 2476} {"train_loss": -44.121429443359375, "global_step": 299609, "epoch": 2476} {"train_loss": -43.475372314453125, "global_step": 299610, "epoch": 2476} {"train_loss": -42.44894027709961, "global_step": 299611, "epoch": 2476} {"train_loss": -44.43374252319336, "global_step": 299612, "epoch": 2476} {"train_loss": -44.03032302856445, "global_step": 299613, "epoch": 2476} {"train_loss": -42.08309555053711, "global_step": 299614, "epoch": 2476} {"train_loss": -44.58095169067383, "global_step": 299615, "epoch": 2476} {"train_loss": -43.01375961303711, "global_step": 299616, "epoch": 2476} {"train_loss": -43.2567253112793, "global_step": 299617, "epoch": 2476} {"train_loss": -43.927425384521484, "global_step": 299618, "epoch": 2476} {"train_loss": -42.33768844604492, "global_step": 299619, "epoch": 2476} {"train_loss": -43.10171890258789, "global_step": 299620, "epoch": 2476} {"train_loss": -42.78050994873047, "global_step": 299621, "epoch": 2476} {"train_loss": -41.59810256958008, "global_step": 299622, "epoch": 2476} {"train_loss": -43.19649124145508, "global_step": 299623, "epoch": 2476} {"train_loss": -41.06608581542969, "global_step": 299624, "epoch": 2476} {"train_loss": -43.51229476928711, "global_step": 299625, "epoch": 2476} {"train_loss": -41.78803634643555, "global_step": 299626, "epoch": 2476} {"train_loss": -41.93087387084961, "global_step": 299627, "epoch": 2476} {"train_loss": -42.6099967956543, "global_step": 299628, "epoch": 2476} {"train_loss": -41.75782012939453, "global_step": 299629, "epoch": 2476} {"train_loss": -43.0716438293457, "global_step": 299630, "epoch": 2476} {"train_loss": -43.960323333740234, "global_step": 299631, "epoch": 2476} {"train_loss": -41.98237991333008, "global_step": 299632, "epoch": 2476} {"train_loss": -42.958900451660156, "global_step": 299633, "epoch": 2476} {"train_loss": -42.666748046875, "global_step": 299634, "epoch": 2476} {"train_loss": -43.89374542236328, "global_step": 299635, "epoch": 2476} {"train_loss": -42.30356979370117, "global_step": 299636, "epoch": 2476} {"train_loss": -44.368473052978516, "global_step": 299637, "epoch": 2476} {"train_loss": -43.03818893432617, "global_step": 299638, "epoch": 2476} {"train_loss": -43.61737060546875, "global_step": 299639, "epoch": 2476} {"train_loss": -43.965614318847656, "global_step": 299640, "epoch": 2476} {"train_loss": -44.291622161865234, "global_step": 299641, "epoch": 2476} {"train_loss": -43.60077667236328, "global_step": 299642, "epoch": 2476} {"train_loss": -43.59233474731445, "global_step": 299643, "epoch": 2476} {"train_loss": -44.41229248046875, "global_step": 299644, "epoch": 2476} {"train_loss": -44.2364501953125, "global_step": 299645, "epoch": 2476} {"train_loss": -44.216094970703125, "global_step": 299646, "epoch": 2476} {"train_loss": -44.33761215209961, "global_step": 299647, "epoch": 2476} {"train_loss": -44.64328384399414, "global_step": 299648, "epoch": 2476} {"train_loss": -44.0754508972168, "global_step": 299649, "epoch": 2476} {"train_loss": -43.61509323120117, "global_step": 299650, "epoch": 2476} {"train_loss": -42.661800384521484, "global_step": 299651, "epoch": 2476} {"train_loss": -43.803016662597656, "global_step": 299652, "epoch": 2476} {"train_loss": -44.39832305908203, "global_step": 299653, "epoch": 2476} {"train_loss": -43.642127990722656, "global_step": 299654, "epoch": 2476} {"train_loss": -43.46234130859375, "global_step": 299655, "epoch": 2476} {"train_loss": -43.033931732177734, "global_step": 299656, "epoch": 2476} {"train_loss": -44.28891372680664, "global_step": 299657, "epoch": 2476} {"train_loss": -44.24739456176758, "global_step": 299658, "epoch": 2476} {"train_loss": -41.91486740112305, "global_step": 299659, "epoch": 2476} {"train_loss": -44.384849548339844, "global_step": 299660, "epoch": 2476} {"train_loss": -42.92379379272461, "global_step": 299661, "epoch": 2476} {"train_loss": -40.974853515625, "global_step": 299662, "epoch": 2476} {"train_loss": -39.84392547607422, "global_step": 299663, "epoch": 2476} {"train_loss": -42.50800704956055, "global_step": 299664, "epoch": 2476} {"train_loss": -39.827266693115234, "global_step": 299665, "epoch": 2476} {"train_loss": -42.598079681396484, "global_step": 299666, "epoch": 2476} {"train_loss": -42.1672248840332, "global_step": 299667, "epoch": 2476} {"train_loss": -42.63186264038086, "global_step": 299668, "epoch": 2476} {"train_loss": -42.51091003417969, "global_step": 299669, "epoch": 2476} {"train_loss": -42.96199035644531, "global_step": 299670, "epoch": 2476} {"train_loss": -43.63662338256836, "global_step": 299671, "epoch": 2476} {"train_loss": -43.406349182128906, "global_step": 299672, "epoch": 2476} {"train_loss": -42.743526458740234, "global_step": 299673, "epoch": 2476} {"train_loss": -43.02632522583008, "global_step": 299674, "epoch": 2476} {"train_loss": -43.45771408081055, "global_step": 299675, "epoch": 2476} {"train_loss": -43.89786911010742, "global_step": 299676, "epoch": 2476} {"train_loss": -43.07722091674805, "global_step": 299677, "epoch": 2476} {"train_loss": -42.93130111694336, "global_step": 299678, "epoch": 2476} {"train_loss": -43.415802001953125, "global_step": 299679, "epoch": 2476} {"train_loss": -43.16746520996094, "global_step": 299680, "epoch": 2476} {"train_loss": -41.65568161010742, "global_step": 299681, "epoch": 2476} {"train_loss": -44.01618957519531, "global_step": 299682, "epoch": 2476} {"train_loss": -43.19938278198242, "global_step": 299683, "epoch": 2476} {"train_loss": -42.17586898803711, "global_step": 299684, "epoch": 2476} {"train_loss": -43.5761833190918, "global_step": 299685, "epoch": 2476} {"train_loss": -43.76594161987305, "global_step": 299686, "epoch": 2476} {"train_loss": -43.29115676879883, "global_step": 299687, "epoch": 2476} {"train_loss": -43.132511138916016, "global_step": 299688, "epoch": 2476} {"train_loss": -43.204776763916016, "global_step": 299689, "epoch": 2476} {"train_loss": -42.336971282958984, "global_step": 299690, "epoch": 2476} {"train_loss": -40.639892578125, "global_step": 299691, "epoch": 2476} {"train_loss": -41.43312454223633, "global_step": 299692, "epoch": 2476} {"train_loss": -42.0125617980957, "global_step": 299693, "epoch": 2476} {"train_loss": -41.31099319458008, "global_step": 299694, "epoch": 2476} {"train_loss": -41.934181213378906, "global_step": 299695, "epoch": 2476} {"train_loss": -42.810821533203125, "global_step": 299696, "epoch": 2476} {"train_loss": -42.3271598815918, "global_step": 299697, "epoch": 2476} {"train_loss": -43.086483001708984, "global_step": 299698, "epoch": 2476} {"train_loss": -43.22505569458008, "global_step": 299699, "epoch": 2476} {"train_loss": -43.47589111328125, "global_step": 299700, "epoch": 2476} {"train_loss": -43.4366569519043, "global_step": 299701, "epoch": 2476} {"train_loss": -42.936214447021484, "global_step": 299702, "epoch": 2476} {"train_loss": -44.22734069824219, "global_step": 299703, "epoch": 2476} {"train_loss": -43.605377197265625, "global_step": 299704, "epoch": 2476} {"train_loss": -43.48411178588867, "global_step": 299705, "epoch": 2476} {"train_loss": -42.8199462890625, "global_step": 299706, "epoch": 2476} {"train_loss": -41.84366989135742, "global_step": 299707, "epoch": 2476} {"train_loss": -43.73920822143555, "global_step": 299708, "epoch": 2476} {"train_loss": -43.051795959472656, "global_step": 299709, "epoch": 2476} {"train_loss": -43.677913665771484, "global_step": 299710, "epoch": 2476} {"train_loss": -43.329734802246094, "global_step": 299711, "epoch": 2476} {"train_loss": -43.83453369140625, "global_step": 299712, "epoch": 2476} {"train_loss": -43.64421081542969, "global_step": 299713, "epoch": 2476} {"train_loss": -42.08887481689453, "global_step": 299714, "epoch": 2476} {"train_loss": -44.42769241333008, "global_step": 299715, "epoch": 2476} {"train_loss": -43.1543458670624, "global_step": 299716, "epoch": 2476, "val_loss": 2606913.0} {"train_loss": -42.10651397705078, "global_step": 299717, "epoch": 2477} {"train_loss": -43.82875442504883, "global_step": 299718, "epoch": 2477} {"train_loss": -41.95841598510742, "global_step": 299719, "epoch": 2477} {"train_loss": -43.551326751708984, "global_step": 299720, "epoch": 2477} {"train_loss": -42.30256271362305, "global_step": 299721, "epoch": 2477} {"train_loss": -43.07831573486328, "global_step": 299722, "epoch": 2477} {"train_loss": -42.89872360229492, "global_step": 299723, "epoch": 2477} {"train_loss": -43.511932373046875, "global_step": 299724, "epoch": 2477} {"train_loss": -42.44038772583008, "global_step": 299725, "epoch": 2477} {"train_loss": -42.96729278564453, "global_step": 299726, "epoch": 2477} {"train_loss": -43.18446350097656, "global_step": 299727, "epoch": 2477} {"train_loss": -42.10584259033203, "global_step": 299728, "epoch": 2477} {"train_loss": -43.91727828979492, "global_step": 299729, "epoch": 2477} {"train_loss": -42.3808708190918, "global_step": 299730, "epoch": 2477} {"train_loss": -44.033294677734375, "global_step": 299731, "epoch": 2477} {"train_loss": -42.765472412109375, "global_step": 299732, "epoch": 2477} {"train_loss": -43.31055450439453, "global_step": 299733, "epoch": 2477} {"train_loss": -44.4144172668457, "global_step": 299734, "epoch": 2477} {"train_loss": -43.53078842163086, "global_step": 299735, "epoch": 2477} {"train_loss": -44.23017120361328, "global_step": 299736, "epoch": 2477} {"train_loss": -43.55628204345703, "global_step": 299737, "epoch": 2477} {"train_loss": -43.14211654663086, "global_step": 299738, "epoch": 2477} {"train_loss": -43.34979248046875, "global_step": 299739, "epoch": 2477} {"train_loss": -44.264278411865234, "global_step": 299740, "epoch": 2477} {"train_loss": -43.55842971801758, "global_step": 299741, "epoch": 2477} {"train_loss": -44.34003448486328, "global_step": 299742, "epoch": 2477} {"train_loss": -44.435997009277344, "global_step": 299743, "epoch": 2477} {"train_loss": -44.08579635620117, "global_step": 299744, "epoch": 2477} {"train_loss": -44.15421676635742, "global_step": 299745, "epoch": 2477} {"train_loss": -44.140625, "global_step": 299746, "epoch": 2477} {"train_loss": -43.929237365722656, "global_step": 299747, "epoch": 2477} {"train_loss": -44.55754470825195, "global_step": 299748, "epoch": 2477} {"train_loss": -44.130104064941406, "global_step": 299749, "epoch": 2477} {"train_loss": -44.37417221069336, "global_step": 299750, "epoch": 2477} {"train_loss": -44.48308181762695, "global_step": 299751, "epoch": 2477} {"train_loss": -44.46369934082031, "global_step": 299752, "epoch": 2477} {"train_loss": -44.3865852355957, "global_step": 299753, "epoch": 2477} {"train_loss": -43.55976486206055, "global_step": 299754, "epoch": 2477} {"train_loss": -43.71516799926758, "global_step": 299755, "epoch": 2477} {"train_loss": -44.13697814941406, "global_step": 299756, "epoch": 2477} {"train_loss": -42.81132888793945, "global_step": 299757, "epoch": 2477} {"train_loss": -43.273441314697266, "global_step": 299758, "epoch": 2477} {"train_loss": -43.17034912109375, "global_step": 299759, "epoch": 2477} {"train_loss": -43.48513412475586, "global_step": 299760, "epoch": 2477} {"train_loss": -43.155391693115234, "global_step": 299761, "epoch": 2477} {"train_loss": -43.986167907714844, "global_step": 299762, "epoch": 2477} {"train_loss": -43.264686584472656, "global_step": 299763, "epoch": 2477} {"train_loss": -43.6532096862793, "global_step": 299764, "epoch": 2477} {"train_loss": -44.114723205566406, "global_step": 299765, "epoch": 2477} {"train_loss": -42.32954025268555, "global_step": 299766, "epoch": 2477} {"train_loss": -44.042030334472656, "global_step": 299767, "epoch": 2477} {"train_loss": -43.37727737426758, "global_step": 299768, "epoch": 2477} {"train_loss": -43.18369674682617, "global_step": 299769, "epoch": 2477} {"train_loss": -43.84821701049805, "global_step": 299770, "epoch": 2477} {"train_loss": -43.629451751708984, "global_step": 299771, "epoch": 2477} {"train_loss": -43.880775451660156, "global_step": 299772, "epoch": 2477} {"train_loss": -43.75239181518555, "global_step": 299773, "epoch": 2477} {"train_loss": -43.81820297241211, "global_step": 299774, "epoch": 2477} {"train_loss": -44.125892639160156, "global_step": 299775, "epoch": 2477} {"train_loss": -43.42903518676758, "global_step": 299776, "epoch": 2477} {"train_loss": -44.32233810424805, "global_step": 299777, "epoch": 2477} {"train_loss": -43.52077865600586, "global_step": 299778, "epoch": 2477} {"train_loss": -43.2325439453125, "global_step": 299779, "epoch": 2477} {"train_loss": -43.62826919555664, "global_step": 299780, "epoch": 2477} {"train_loss": -43.93294143676758, "global_step": 299781, "epoch": 2477} {"train_loss": -41.91239547729492, "global_step": 299782, "epoch": 2477} {"train_loss": -43.68538284301758, "global_step": 299783, "epoch": 2477} {"train_loss": -43.77744674682617, "global_step": 299784, "epoch": 2477} {"train_loss": -44.120399475097656, "global_step": 299785, "epoch": 2477} {"train_loss": -43.248023986816406, "global_step": 299786, "epoch": 2477} {"train_loss": -44.031856536865234, "global_step": 299787, "epoch": 2477} {"train_loss": -44.481258392333984, "global_step": 299788, "epoch": 2477} {"train_loss": -42.93999481201172, "global_step": 299789, "epoch": 2477} {"train_loss": -42.210514068603516, "global_step": 299790, "epoch": 2477} {"train_loss": -43.716304779052734, "global_step": 299791, "epoch": 2477} {"train_loss": -43.587127685546875, "global_step": 299792, "epoch": 2477} {"train_loss": -43.72306823730469, "global_step": 299793, "epoch": 2477} {"train_loss": -43.005313873291016, "global_step": 299794, "epoch": 2477} {"train_loss": -44.32843780517578, "global_step": 299795, "epoch": 2477} {"train_loss": -43.16665267944336, "global_step": 299796, "epoch": 2477} {"train_loss": -39.83327102661133, "global_step": 299797, "epoch": 2477} {"train_loss": -43.26852035522461, "global_step": 299798, "epoch": 2477} {"train_loss": -43.22369384765625, "global_step": 299799, "epoch": 2477} {"train_loss": -43.86605453491211, "global_step": 299800, "epoch": 2477} {"train_loss": -43.3546028137207, "global_step": 299801, "epoch": 2477} {"train_loss": -44.34270095825195, "global_step": 299802, "epoch": 2477} {"train_loss": -43.619667053222656, "global_step": 299803, "epoch": 2477} {"train_loss": -44.238494873046875, "global_step": 299804, "epoch": 2477} {"train_loss": -44.64313507080078, "global_step": 299805, "epoch": 2477} {"train_loss": -44.28652572631836, "global_step": 299806, "epoch": 2477} {"train_loss": -43.78828048706055, "global_step": 299807, "epoch": 2477} {"train_loss": -43.304908752441406, "global_step": 299808, "epoch": 2477} {"train_loss": -43.95695114135742, "global_step": 299809, "epoch": 2477} {"train_loss": -44.6834716796875, "global_step": 299810, "epoch": 2477} {"train_loss": -44.121028900146484, "global_step": 299811, "epoch": 2477} {"train_loss": -44.30924606323242, "global_step": 299812, "epoch": 2477} {"train_loss": -44.1329345703125, "global_step": 299813, "epoch": 2477} {"train_loss": -43.99620056152344, "global_step": 299814, "epoch": 2477} {"train_loss": -43.58901596069336, "global_step": 299815, "epoch": 2477} {"train_loss": -43.69058609008789, "global_step": 299816, "epoch": 2477} {"train_loss": -44.52915954589844, "global_step": 299817, "epoch": 2477} {"train_loss": -44.23103332519531, "global_step": 299818, "epoch": 2477} {"train_loss": -44.69881057739258, "global_step": 299819, "epoch": 2477} {"train_loss": -44.205970764160156, "global_step": 299820, "epoch": 2477} {"train_loss": -44.78044509887695, "global_step": 299821, "epoch": 2477} {"train_loss": -44.12794876098633, "global_step": 299822, "epoch": 2477} {"train_loss": -43.3189697265625, "global_step": 299823, "epoch": 2477} {"train_loss": -44.114295959472656, "global_step": 299824, "epoch": 2477} {"train_loss": -44.47941207885742, "global_step": 299825, "epoch": 2477} {"train_loss": -44.20379638671875, "global_step": 299826, "epoch": 2477} {"train_loss": -43.476497650146484, "global_step": 299827, "epoch": 2477} {"train_loss": -44.667362213134766, "global_step": 299828, "epoch": 2477} {"train_loss": -43.65174865722656, "global_step": 299829, "epoch": 2477} {"train_loss": -37.9852409362793, "global_step": 299830, "epoch": 2477} {"train_loss": -41.683528900146484, "global_step": 299831, "epoch": 2477} {"train_loss": -42.652835845947266, "global_step": 299832, "epoch": 2477} {"train_loss": -42.537208557128906, "global_step": 299833, "epoch": 2477} {"train_loss": -43.335506439208984, "global_step": 299834, "epoch": 2477} {"train_loss": -42.34291458129883, "global_step": 299835, "epoch": 2477} {"train_loss": -43.01605224609375, "global_step": 299836, "epoch": 2477} {"train_loss": -43.55545397041258, "global_step": 299837, "epoch": 2477, "val_loss": 2665535.0} {"train_loss": -41.674659729003906, "global_step": 299838, "epoch": 2478} {"train_loss": -43.61385726928711, "global_step": 299839, "epoch": 2478} {"train_loss": -40.918819427490234, "global_step": 299840, "epoch": 2478} {"train_loss": -42.07163619995117, "global_step": 299841, "epoch": 2478} {"train_loss": -40.6322135925293, "global_step": 299842, "epoch": 2478} {"train_loss": -40.608314514160156, "global_step": 299843, "epoch": 2478} {"train_loss": -43.7421989440918, "global_step": 299844, "epoch": 2478} {"train_loss": -42.40857696533203, "global_step": 299845, "epoch": 2478} {"train_loss": -42.712100982666016, "global_step": 299846, "epoch": 2478} {"train_loss": -42.3516960144043, "global_step": 299847, "epoch": 2478} {"train_loss": -42.19679641723633, "global_step": 299848, "epoch": 2478} {"train_loss": -42.26579666137695, "global_step": 299849, "epoch": 2478} {"train_loss": -42.898277282714844, "global_step": 299850, "epoch": 2478} {"train_loss": -42.24717330932617, "global_step": 299851, "epoch": 2478} {"train_loss": -41.729393005371094, "global_step": 299852, "epoch": 2478} {"train_loss": -41.32546615600586, "global_step": 299853, "epoch": 2478} {"train_loss": -41.684627532958984, "global_step": 299854, "epoch": 2478} {"train_loss": -44.243629455566406, "global_step": 299855, "epoch": 2478} {"train_loss": -40.004051208496094, "global_step": 299856, "epoch": 2478} {"train_loss": -42.60527038574219, "global_step": 299857, "epoch": 2478} {"train_loss": -41.417213439941406, "global_step": 299858, "epoch": 2478} {"train_loss": -41.936431884765625, "global_step": 299859, "epoch": 2478} {"train_loss": -40.97581481933594, "global_step": 299860, "epoch": 2478} {"train_loss": -41.741180419921875, "global_step": 299861, "epoch": 2478} {"train_loss": -40.031612396240234, "global_step": 299862, "epoch": 2478} {"train_loss": -41.71993637084961, "global_step": 299863, "epoch": 2478} {"train_loss": -42.08565902709961, "global_step": 299864, "epoch": 2478} {"train_loss": -42.314449310302734, "global_step": 299865, "epoch": 2478} {"train_loss": -40.59711837768555, "global_step": 299866, "epoch": 2478} {"train_loss": -43.026248931884766, "global_step": 299867, "epoch": 2478} {"train_loss": -41.29428482055664, "global_step": 299868, "epoch": 2478} {"train_loss": -41.48169708251953, "global_step": 299869, "epoch": 2478} {"train_loss": -42.38412857055664, "global_step": 299870, "epoch": 2478} {"train_loss": -43.35614776611328, "global_step": 299871, "epoch": 2478} {"train_loss": -42.905853271484375, "global_step": 299872, "epoch": 2478} {"train_loss": -43.29830551147461, "global_step": 299873, "epoch": 2478} {"train_loss": -43.290191650390625, "global_step": 299874, "epoch": 2478} {"train_loss": -43.33271408081055, "global_step": 299875, "epoch": 2478} {"train_loss": -42.99479293823242, "global_step": 299876, "epoch": 2478} {"train_loss": -42.952693939208984, "global_step": 299877, "epoch": 2478} {"train_loss": -42.56814193725586, "global_step": 299878, "epoch": 2478} {"train_loss": -43.115360260009766, "global_step": 299879, "epoch": 2478} {"train_loss": -43.66545867919922, "global_step": 299880, "epoch": 2478} {"train_loss": -43.100460052490234, "global_step": 299881, "epoch": 2478} {"train_loss": -43.11152267456055, "global_step": 299882, "epoch": 2478} {"train_loss": -42.57554244995117, "global_step": 299883, "epoch": 2478} {"train_loss": -43.214271545410156, "global_step": 299884, "epoch": 2478} {"train_loss": -43.02431106567383, "global_step": 299885, "epoch": 2478} {"train_loss": -43.65914535522461, "global_step": 299886, "epoch": 2478} {"train_loss": -43.741943359375, "global_step": 299887, "epoch": 2478} {"train_loss": -42.274078369140625, "global_step": 299888, "epoch": 2478} {"train_loss": -43.66830062866211, "global_step": 299889, "epoch": 2478} {"train_loss": -43.47210693359375, "global_step": 299890, "epoch": 2478} {"train_loss": -43.64531326293945, "global_step": 299891, "epoch": 2478} {"train_loss": -43.991661071777344, "global_step": 299892, "epoch": 2478} {"train_loss": -43.798675537109375, "global_step": 299893, "epoch": 2478} {"train_loss": -43.89702224731445, "global_step": 299894, "epoch": 2478} {"train_loss": -42.7924690246582, "global_step": 299895, "epoch": 2478} {"train_loss": -42.742733001708984, "global_step": 299896, "epoch": 2478} {"train_loss": -43.74659729003906, "global_step": 299897, "epoch": 2478} {"train_loss": -44.05037307739258, "global_step": 299898, "epoch": 2478} {"train_loss": -43.03013229370117, "global_step": 299899, "epoch": 2478} {"train_loss": -43.830501556396484, "global_step": 299900, "epoch": 2478} {"train_loss": -44.4786376953125, "global_step": 299901, "epoch": 2478} {"train_loss": -43.826507568359375, "global_step": 299902, "epoch": 2478} {"train_loss": -43.482421875, "global_step": 299903, "epoch": 2478} {"train_loss": -44.04135513305664, "global_step": 299904, "epoch": 2478} {"train_loss": -44.238277435302734, "global_step": 299905, "epoch": 2478} {"train_loss": -44.121482849121094, "global_step": 299906, "epoch": 2478} {"train_loss": -43.441707611083984, "global_step": 299907, "epoch": 2478} {"train_loss": -43.255615234375, "global_step": 299908, "epoch": 2478} {"train_loss": -44.01241683959961, "global_step": 299909, "epoch": 2478} {"train_loss": -43.9460563659668, "global_step": 299910, "epoch": 2478} {"train_loss": -42.73895263671875, "global_step": 299911, "epoch": 2478} {"train_loss": -43.21794509887695, "global_step": 299912, "epoch": 2478} {"train_loss": -40.33220672607422, "global_step": 299913, "epoch": 2478} {"train_loss": -44.3612174987793, "global_step": 299914, "epoch": 2478} {"train_loss": -43.19265365600586, "global_step": 299915, "epoch": 2478} {"train_loss": -43.257572174072266, "global_step": 299916, "epoch": 2478} {"train_loss": -42.99746322631836, "global_step": 299917, "epoch": 2478} {"train_loss": -42.06623458862305, "global_step": 299918, "epoch": 2478} {"train_loss": -43.13793182373047, "global_step": 299919, "epoch": 2478} {"train_loss": -42.46786117553711, "global_step": 299920, "epoch": 2478} {"train_loss": -43.664024353027344, "global_step": 299921, "epoch": 2478} {"train_loss": -43.96584701538086, "global_step": 299922, "epoch": 2478} {"train_loss": -43.88648223876953, "global_step": 299923, "epoch": 2478} {"train_loss": -43.36172866821289, "global_step": 299924, "epoch": 2478} {"train_loss": -42.518768310546875, "global_step": 299925, "epoch": 2478} {"train_loss": -44.20339584350586, "global_step": 299926, "epoch": 2478} {"train_loss": -43.727081298828125, "global_step": 299927, "epoch": 2478} {"train_loss": -42.78535079956055, "global_step": 299928, "epoch": 2478} {"train_loss": -42.17562484741211, "global_step": 299929, "epoch": 2478} {"train_loss": -42.894683837890625, "global_step": 299930, "epoch": 2478} {"train_loss": -44.14398193359375, "global_step": 299931, "epoch": 2478} {"train_loss": -43.086753845214844, "global_step": 299932, "epoch": 2478} {"train_loss": -43.6764030456543, "global_step": 299933, "epoch": 2478} {"train_loss": -42.283119201660156, "global_step": 299934, "epoch": 2478} {"train_loss": -42.0316276550293, "global_step": 299935, "epoch": 2478} {"train_loss": -43.61517333984375, "global_step": 299936, "epoch": 2478} {"train_loss": -42.98653030395508, "global_step": 299937, "epoch": 2478} {"train_loss": -41.14674758911133, "global_step": 299938, "epoch": 2478} {"train_loss": -43.19426727294922, "global_step": 299939, "epoch": 2478} {"train_loss": -40.448177337646484, "global_step": 299940, "epoch": 2478} {"train_loss": -42.7862663269043, "global_step": 299941, "epoch": 2478} {"train_loss": -35.64731979370117, "global_step": 299942, "epoch": 2478} {"train_loss": -40.50142288208008, "global_step": 299943, "epoch": 2478} {"train_loss": -38.750518798828125, "global_step": 299944, "epoch": 2478} {"train_loss": -40.84132385253906, "global_step": 299945, "epoch": 2478} {"train_loss": -40.63246536254883, "global_step": 299946, "epoch": 2478} {"train_loss": -39.46598434448242, "global_step": 299947, "epoch": 2478} {"train_loss": -41.5471305847168, "global_step": 299948, "epoch": 2478} {"train_loss": -39.497310638427734, "global_step": 299949, "epoch": 2478} {"train_loss": -42.10773468017578, "global_step": 299950, "epoch": 2478} {"train_loss": -37.56465530395508, "global_step": 299951, "epoch": 2478} {"train_loss": -41.199581146240234, "global_step": 299952, "epoch": 2478} {"train_loss": -39.090919494628906, "global_step": 299953, "epoch": 2478} {"train_loss": -41.02812194824219, "global_step": 299954, "epoch": 2478} {"train_loss": -37.788665771484375, "global_step": 299955, "epoch": 2478} {"train_loss": -40.3834342956543, "global_step": 299956, "epoch": 2478} {"train_loss": -38.350860595703125, "global_step": 299957, "epoch": 2478} {"train_loss": -42.35273783660132, "global_step": 299958, "epoch": 2478, "val_loss": 2441062.0} {"train_loss": -40.876930236816406, "global_step": 299959, "epoch": 2479} {"train_loss": -38.78369903564453, "global_step": 299960, "epoch": 2479} {"train_loss": -39.114967346191406, "global_step": 299961, "epoch": 2479} {"train_loss": -40.4582633972168, "global_step": 299962, "epoch": 2479} {"train_loss": -39.68158721923828, "global_step": 299963, "epoch": 2479} {"train_loss": -40.82375717163086, "global_step": 299964, "epoch": 2479} {"train_loss": -40.743499755859375, "global_step": 299965, "epoch": 2479} {"train_loss": -40.66279220581055, "global_step": 299966, "epoch": 2479} {"train_loss": -40.590545654296875, "global_step": 299967, "epoch": 2479} {"train_loss": -40.7601203918457, "global_step": 299968, "epoch": 2479} {"train_loss": -42.30133819580078, "global_step": 299969, "epoch": 2479} {"train_loss": -40.58515548706055, "global_step": 299970, "epoch": 2479} {"train_loss": -40.92424774169922, "global_step": 299971, "epoch": 2479} {"train_loss": -42.476192474365234, "global_step": 299972, "epoch": 2479} {"train_loss": -41.52092361450195, "global_step": 299973, "epoch": 2479} {"train_loss": -41.70014572143555, "global_step": 299974, "epoch": 2479} {"train_loss": -41.24553298950195, "global_step": 299975, "epoch": 2479} {"train_loss": -41.64152145385742, "global_step": 299976, "epoch": 2479} {"train_loss": -42.03327178955078, "global_step": 299977, "epoch": 2479} {"train_loss": -42.407928466796875, "global_step": 299978, "epoch": 2479} {"train_loss": -43.00912094116211, "global_step": 299979, "epoch": 2479} {"train_loss": -42.160438537597656, "global_step": 299980, "epoch": 2479} {"train_loss": -42.84088897705078, "global_step": 299981, "epoch": 2479} {"train_loss": -42.61671829223633, "global_step": 299982, "epoch": 2479} {"train_loss": -43.682857513427734, "global_step": 299983, "epoch": 2479} {"train_loss": -42.66653060913086, "global_step": 299984, "epoch": 2479} {"train_loss": -43.18861389160156, "global_step": 299985, "epoch": 2479} {"train_loss": -43.3857307434082, "global_step": 299986, "epoch": 2479} {"train_loss": -43.262245178222656, "global_step": 299987, "epoch": 2479} {"train_loss": -43.699588775634766, "global_step": 299988, "epoch": 2479} {"train_loss": -43.196754455566406, "global_step": 299989, "epoch": 2479} {"train_loss": -43.01548385620117, "global_step": 299990, "epoch": 2479} {"train_loss": -43.722408294677734, "global_step": 299991, "epoch": 2479} {"train_loss": -43.4875373840332, "global_step": 299992, "epoch": 2479} {"train_loss": -43.68075180053711, "global_step": 299993, "epoch": 2479} {"train_loss": -43.626827239990234, "global_step": 299994, "epoch": 2479} {"train_loss": -44.03200149536133, "global_step": 299995, "epoch": 2479} {"train_loss": -43.38715744018555, "global_step": 299996, "epoch": 2479} {"train_loss": -43.42657470703125, "global_step": 299997, "epoch": 2479} {"train_loss": -43.33526611328125, "global_step": 299998, "epoch": 2479} {"train_loss": -43.77128219604492, "global_step": 299999, "epoch": 2479} {"train_loss": -43.71992111206055, "global_step": 300000, "epoch": 2479} {"train_loss": -44.02286911010742, "global_step": 300001, "epoch": 2479} {"train_loss": -43.031490325927734, "global_step": 300002, "epoch": 2479} {"train_loss": -43.006309509277344, "global_step": 300003, "epoch": 2479} {"train_loss": -43.4061279296875, "global_step": 300004, "epoch": 2479} {"train_loss": -43.72686767578125, "global_step": 300005, "epoch": 2479} {"train_loss": -42.56440734863281, "global_step": 300006, "epoch": 2479} {"train_loss": -42.35546875, "global_step": 300007, "epoch": 2479} {"train_loss": -43.956363677978516, "global_step": 300008, "epoch": 2479} {"train_loss": -43.104576110839844, "global_step": 300009, "epoch": 2479} {"train_loss": -42.145015716552734, "global_step": 300010, "epoch": 2479} {"train_loss": -42.86383819580078, "global_step": 300011, "epoch": 2479} {"train_loss": -43.65420150756836, "global_step": 300012, "epoch": 2479} {"train_loss": -41.9132194519043, "global_step": 300013, "epoch": 2479} {"train_loss": -43.811378479003906, "global_step": 300014, "epoch": 2479} {"train_loss": -43.802066802978516, "global_step": 300015, "epoch": 2479} {"train_loss": -43.0903205871582, "global_step": 300016, "epoch": 2479} {"train_loss": -44.04594421386719, "global_step": 300017, "epoch": 2479} {"train_loss": -43.15140914916992, "global_step": 300018, "epoch": 2479} {"train_loss": -43.803035736083984, "global_step": 300019, "epoch": 2479} {"train_loss": -43.96238708496094, "global_step": 300020, "epoch": 2479} {"train_loss": -43.359397888183594, "global_step": 300021, "epoch": 2479} {"train_loss": -43.3616828918457, "global_step": 300022, "epoch": 2479} {"train_loss": -43.85966110229492, "global_step": 300023, "epoch": 2479} {"train_loss": -43.5233039855957, "global_step": 300024, "epoch": 2479} {"train_loss": -44.13533020019531, "global_step": 300025, "epoch": 2479} {"train_loss": -44.19123458862305, "global_step": 300026, "epoch": 2479} {"train_loss": -43.82075119018555, "global_step": 300027, "epoch": 2479} {"train_loss": -44.05769348144531, "global_step": 300028, "epoch": 2479} {"train_loss": -44.275115966796875, "global_step": 300029, "epoch": 2479} {"train_loss": -42.96271514892578, "global_step": 300030, "epoch": 2479} {"train_loss": -44.587379455566406, "global_step": 300031, "epoch": 2479} {"train_loss": -44.29522705078125, "global_step": 300032, "epoch": 2479} {"train_loss": -43.79887771606445, "global_step": 300033, "epoch": 2479} {"train_loss": -43.879920959472656, "global_step": 300034, "epoch": 2479} {"train_loss": -43.43214797973633, "global_step": 300035, "epoch": 2479} {"train_loss": -43.47090530395508, "global_step": 300036, "epoch": 2479} {"train_loss": -43.87728500366211, "global_step": 300037, "epoch": 2479} {"train_loss": -43.467742919921875, "global_step": 300038, "epoch": 2479} {"train_loss": -43.910884857177734, "global_step": 300039, "epoch": 2479} {"train_loss": -43.63970184326172, "global_step": 300040, "epoch": 2479} {"train_loss": -42.53315353393555, "global_step": 300041, "epoch": 2479} {"train_loss": -43.71039962768555, "global_step": 300042, "epoch": 2479} {"train_loss": -44.07930374145508, "global_step": 300043, "epoch": 2479} {"train_loss": -44.929683685302734, "global_step": 300044, "epoch": 2479} {"train_loss": -43.530391693115234, "global_step": 300045, "epoch": 2479} {"train_loss": -42.860652923583984, "global_step": 300046, "epoch": 2479} {"train_loss": -44.53318405151367, "global_step": 300047, "epoch": 2479} {"train_loss": -43.16077423095703, "global_step": 300048, "epoch": 2479} {"train_loss": -41.8860969543457, "global_step": 300049, "epoch": 2479} {"train_loss": -44.1689338684082, "global_step": 300050, "epoch": 2479} {"train_loss": -43.55059814453125, "global_step": 300051, "epoch": 2479} {"train_loss": -43.137996673583984, "global_step": 300052, "epoch": 2479} {"train_loss": -43.71126174926758, "global_step": 300053, "epoch": 2479} {"train_loss": -43.30192947387695, "global_step": 300054, "epoch": 2479} {"train_loss": -43.31887435913086, "global_step": 300055, "epoch": 2479} {"train_loss": -44.26530075073242, "global_step": 300056, "epoch": 2479} {"train_loss": -43.812923431396484, "global_step": 300057, "epoch": 2479} {"train_loss": -44.11273193359375, "global_step": 300058, "epoch": 2479} {"train_loss": -44.33299255371094, "global_step": 300059, "epoch": 2479} {"train_loss": -44.17649459838867, "global_step": 300060, "epoch": 2479} {"train_loss": -44.3184928894043, "global_step": 300061, "epoch": 2479} {"train_loss": -44.2589111328125, "global_step": 300062, "epoch": 2479} {"train_loss": -44.62428665161133, "global_step": 300063, "epoch": 2479} {"train_loss": -42.42904281616211, "global_step": 300064, "epoch": 2479} {"train_loss": -44.2833366394043, "global_step": 300065, "epoch": 2479} {"train_loss": -44.62699508666992, "global_step": 300066, "epoch": 2479} {"train_loss": -44.157188415527344, "global_step": 300067, "epoch": 2479} {"train_loss": -44.314125061035156, "global_step": 300068, "epoch": 2479} {"train_loss": -44.115562438964844, "global_step": 300069, "epoch": 2479} {"train_loss": -44.0530891418457, "global_step": 300070, "epoch": 2479} {"train_loss": -41.45005416870117, "global_step": 300071, "epoch": 2479} {"train_loss": -43.58152389526367, "global_step": 300072, "epoch": 2479} {"train_loss": -42.01462173461914, "global_step": 300073, "epoch": 2479} {"train_loss": -43.410762786865234, "global_step": 300074, "epoch": 2479} {"train_loss": -44.02679443359375, "global_step": 300075, "epoch": 2479} {"train_loss": -43.50735092163086, "global_step": 300076, "epoch": 2479} {"train_loss": -42.74061584472656, "global_step": 300077, "epoch": 2479} {"train_loss": -42.941314697265625, "global_step": 300078, "epoch": 2479} {"train_loss": -43.04951962557706, "global_step": 300079, "epoch": 2479, "val_loss": 2618165.25} {"train_loss": -39.14070510864258, "global_step": 300080, "epoch": 2480} {"train_loss": -43.07878875732422, "global_step": 300081, "epoch": 2480} {"train_loss": -41.22817611694336, "global_step": 300082, "epoch": 2480} {"train_loss": -42.58414840698242, "global_step": 300083, "epoch": 2480} {"train_loss": -43.1379508972168, "global_step": 300084, "epoch": 2480} {"train_loss": -42.9630241394043, "global_step": 300085, "epoch": 2480} {"train_loss": -43.093414306640625, "global_step": 300086, "epoch": 2480} {"train_loss": -41.95313262939453, "global_step": 300087, "epoch": 2480} {"train_loss": -40.84735870361328, "global_step": 300088, "epoch": 2480} {"train_loss": -41.06229782104492, "global_step": 300089, "epoch": 2480} {"train_loss": -41.572486877441406, "global_step": 300090, "epoch": 2480} {"train_loss": -43.70754623413086, "global_step": 300091, "epoch": 2480} {"train_loss": -41.25265884399414, "global_step": 300092, "epoch": 2480} {"train_loss": -43.46697998046875, "global_step": 300093, "epoch": 2480} {"train_loss": -41.61317825317383, "global_step": 300094, "epoch": 2480} {"train_loss": -42.716087341308594, "global_step": 300095, "epoch": 2480} {"train_loss": -42.43818283081055, "global_step": 300096, "epoch": 2480} {"train_loss": -41.84259796142578, "global_step": 300097, "epoch": 2480} {"train_loss": -42.05788040161133, "global_step": 300098, "epoch": 2480} {"train_loss": -42.7939567565918, "global_step": 300099, "epoch": 2480} {"train_loss": -42.01839065551758, "global_step": 300100, "epoch": 2480} {"train_loss": -43.15239334106445, "global_step": 300101, "epoch": 2480} {"train_loss": -42.16621780395508, "global_step": 300102, "epoch": 2480} {"train_loss": -42.088775634765625, "global_step": 300103, "epoch": 2480} {"train_loss": -42.6483268737793, "global_step": 300104, "epoch": 2480} {"train_loss": -41.99430847167969, "global_step": 300105, "epoch": 2480} {"train_loss": -42.813255310058594, "global_step": 300106, "epoch": 2480} {"train_loss": -42.42232894897461, "global_step": 300107, "epoch": 2480} {"train_loss": -43.20856475830078, "global_step": 300108, "epoch": 2480} {"train_loss": -40.49699783325195, "global_step": 300109, "epoch": 2480} {"train_loss": -42.76911163330078, "global_step": 300110, "epoch": 2480} {"train_loss": -42.8816032409668, "global_step": 300111, "epoch": 2480} {"train_loss": -42.268333435058594, "global_step": 300112, "epoch": 2480} {"train_loss": -41.45436096191406, "global_step": 300113, "epoch": 2480} {"train_loss": -42.633941650390625, "global_step": 300114, "epoch": 2480} {"train_loss": -43.34181594848633, "global_step": 300115, "epoch": 2480} {"train_loss": -42.43888473510742, "global_step": 300116, "epoch": 2480} {"train_loss": -43.178367614746094, "global_step": 300117, "epoch": 2480} {"train_loss": -43.8540153503418, "global_step": 300118, "epoch": 2480} {"train_loss": -43.109066009521484, "global_step": 300119, "epoch": 2480} {"train_loss": -44.1051139831543, "global_step": 300120, "epoch": 2480} {"train_loss": -43.75228500366211, "global_step": 300121, "epoch": 2480} {"train_loss": -42.86923599243164, "global_step": 300122, "epoch": 2480} {"train_loss": -43.15279006958008, "global_step": 300123, "epoch": 2480} {"train_loss": -43.56789779663086, "global_step": 300124, "epoch": 2480} {"train_loss": -43.11697006225586, "global_step": 300125, "epoch": 2480} {"train_loss": -44.06532669067383, "global_step": 300126, "epoch": 2480} {"train_loss": -43.73353958129883, "global_step": 300127, "epoch": 2480} {"train_loss": -43.638092041015625, "global_step": 300128, "epoch": 2480} {"train_loss": -42.09653854370117, "global_step": 300129, "epoch": 2480} {"train_loss": -40.4300537109375, "global_step": 300130, "epoch": 2480} {"train_loss": -43.784603118896484, "global_step": 300131, "epoch": 2480} {"train_loss": -43.81935501098633, "global_step": 300132, "epoch": 2480} {"train_loss": -43.613136291503906, "global_step": 300133, "epoch": 2480} {"train_loss": -43.49296951293945, "global_step": 300134, "epoch": 2480} {"train_loss": -44.01887893676758, "global_step": 300135, "epoch": 2480} {"train_loss": -44.53654861450195, "global_step": 300136, "epoch": 2480} {"train_loss": -44.2811279296875, "global_step": 300137, "epoch": 2480} {"train_loss": -44.00790786743164, "global_step": 300138, "epoch": 2480} {"train_loss": -44.00959396362305, "global_step": 300139, "epoch": 2480} {"train_loss": -44.20961380004883, "global_step": 300140, "epoch": 2480} {"train_loss": -44.18037033081055, "global_step": 300141, "epoch": 2480} {"train_loss": -42.15132522583008, "global_step": 300142, "epoch": 2480} {"train_loss": -44.2065315246582, "global_step": 300143, "epoch": 2480} {"train_loss": -44.21833419799805, "global_step": 300144, "epoch": 2480} {"train_loss": -42.008056640625, "global_step": 300145, "epoch": 2480} {"train_loss": -42.7697639465332, "global_step": 300146, "epoch": 2480} {"train_loss": -44.39445495605469, "global_step": 300147, "epoch": 2480} {"train_loss": -43.975345611572266, "global_step": 300148, "epoch": 2480} {"train_loss": -43.512508392333984, "global_step": 300149, "epoch": 2480} {"train_loss": -41.11782455444336, "global_step": 300150, "epoch": 2480} {"train_loss": -43.65092849731445, "global_step": 300151, "epoch": 2480} {"train_loss": -43.944679260253906, "global_step": 300152, "epoch": 2480} {"train_loss": -37.7342414855957, "global_step": 300153, "epoch": 2480} {"train_loss": -43.318214416503906, "global_step": 300154, "epoch": 2480} {"train_loss": -43.61704635620117, "global_step": 300155, "epoch": 2480} {"train_loss": -44.07606506347656, "global_step": 300156, "epoch": 2480} {"train_loss": -44.100154876708984, "global_step": 300157, "epoch": 2480} {"train_loss": -43.41083526611328, "global_step": 300158, "epoch": 2480} {"train_loss": -42.20506286621094, "global_step": 300159, "epoch": 2480} {"train_loss": -41.2767448425293, "global_step": 300160, "epoch": 2480} {"train_loss": -44.12815856933594, "global_step": 300161, "epoch": 2480} {"train_loss": -42.333187103271484, "global_step": 300162, "epoch": 2480} {"train_loss": -44.855533599853516, "global_step": 300163, "epoch": 2480} {"train_loss": -43.264892578125, "global_step": 300164, "epoch": 2480} {"train_loss": -44.026023864746094, "global_step": 300165, "epoch": 2480} {"train_loss": -43.68593978881836, "global_step": 300166, "epoch": 2480} {"train_loss": -43.1529541015625, "global_step": 300167, "epoch": 2480} {"train_loss": -43.54669189453125, "global_step": 300168, "epoch": 2480} {"train_loss": -43.01101303100586, "global_step": 300169, "epoch": 2480} {"train_loss": -43.264095306396484, "global_step": 300170, "epoch": 2480} {"train_loss": -42.18788146972656, "global_step": 300171, "epoch": 2480} {"train_loss": -41.215999603271484, "global_step": 300172, "epoch": 2480} {"train_loss": -43.42814254760742, "global_step": 300173, "epoch": 2480} {"train_loss": -40.93655776977539, "global_step": 300174, "epoch": 2480} {"train_loss": -37.81938934326172, "global_step": 300175, "epoch": 2480} {"train_loss": -39.29204177856445, "global_step": 300176, "epoch": 2480} {"train_loss": -40.58643341064453, "global_step": 300177, "epoch": 2480} {"train_loss": -38.442691802978516, "global_step": 300178, "epoch": 2480} {"train_loss": -39.047584533691406, "global_step": 300179, "epoch": 2480} {"train_loss": -40.93250274658203, "global_step": 300180, "epoch": 2480} {"train_loss": -38.20443344116211, "global_step": 300181, "epoch": 2480} {"train_loss": -40.00299835205078, "global_step": 300182, "epoch": 2480} {"train_loss": -41.032508850097656, "global_step": 300183, "epoch": 2480} {"train_loss": -41.47465133666992, "global_step": 300184, "epoch": 2480} {"train_loss": -41.043148040771484, "global_step": 300185, "epoch": 2480} {"train_loss": -40.134132385253906, "global_step": 300186, "epoch": 2480} {"train_loss": -41.974849700927734, "global_step": 300187, "epoch": 2480} {"train_loss": -43.191856384277344, "global_step": 300188, "epoch": 2480} {"train_loss": -38.8554801940918, "global_step": 300189, "epoch": 2480} {"train_loss": -42.04193878173828, "global_step": 300190, "epoch": 2480} {"train_loss": -41.361305236816406, "global_step": 300191, "epoch": 2480} {"train_loss": -43.08710479736328, "global_step": 300192, "epoch": 2480} {"train_loss": -42.976837158203125, "global_step": 300193, "epoch": 2480} {"train_loss": -42.008514404296875, "global_step": 300194, "epoch": 2480} {"train_loss": -42.3547477722168, "global_step": 300195, "epoch": 2480} {"train_loss": -42.02249526977539, "global_step": 300196, "epoch": 2480} {"train_loss": -39.2462272644043, "global_step": 300197, "epoch": 2480} {"train_loss": -43.71370315551758, "global_step": 300198, "epoch": 2480} {"train_loss": -42.8983268737793, "global_step": 300199, "epoch": 2480} {"train_loss": -42.44920538279636, "global_step": 300200, "epoch": 2480, "val_loss": 3303450.0} {"train_loss": -42.99418258666992, "global_step": 300201, "epoch": 2481} {"train_loss": -43.12079620361328, "global_step": 300202, "epoch": 2481} {"train_loss": -43.22682571411133, "global_step": 300203, "epoch": 2481} {"train_loss": -42.339359283447266, "global_step": 300204, "epoch": 2481} {"train_loss": -42.925193786621094, "global_step": 300205, "epoch": 2481} {"train_loss": -42.8324089050293, "global_step": 300206, "epoch": 2481} {"train_loss": -42.11402130126953, "global_step": 300207, "epoch": 2481} {"train_loss": -43.68603515625, "global_step": 300208, "epoch": 2481} {"train_loss": -42.920223236083984, "global_step": 300209, "epoch": 2481} {"train_loss": -43.31414031982422, "global_step": 300210, "epoch": 2481} {"train_loss": -43.321590423583984, "global_step": 300211, "epoch": 2481} {"train_loss": -43.2299919128418, "global_step": 300212, "epoch": 2481} {"train_loss": -43.51395797729492, "global_step": 300213, "epoch": 2481} {"train_loss": -43.99325180053711, "global_step": 300214, "epoch": 2481} {"train_loss": -42.773189544677734, "global_step": 300215, "epoch": 2481} {"train_loss": -43.41070556640625, "global_step": 300216, "epoch": 2481} {"train_loss": -44.058929443359375, "global_step": 300217, "epoch": 2481} {"train_loss": -42.180423736572266, "global_step": 300218, "epoch": 2481} {"train_loss": -43.731597900390625, "global_step": 300219, "epoch": 2481} {"train_loss": -43.03873825073242, "global_step": 300220, "epoch": 2481} {"train_loss": -43.85836410522461, "global_step": 300221, "epoch": 2481} {"train_loss": -43.52694320678711, "global_step": 300222, "epoch": 2481} {"train_loss": -43.89583969116211, "global_step": 300223, "epoch": 2481} {"train_loss": -43.681217193603516, "global_step": 300224, "epoch": 2481} {"train_loss": -43.81110382080078, "global_step": 300225, "epoch": 2481} {"train_loss": -43.53285598754883, "global_step": 300226, "epoch": 2481} {"train_loss": -43.623531341552734, "global_step": 300227, "epoch": 2481} {"train_loss": -44.356197357177734, "global_step": 300228, "epoch": 2481} {"train_loss": -44.13947677612305, "global_step": 300229, "epoch": 2481} {"train_loss": -43.58233642578125, "global_step": 300230, "epoch": 2481} {"train_loss": -43.96043014526367, "global_step": 300231, "epoch": 2481} {"train_loss": -43.22190475463867, "global_step": 300232, "epoch": 2481} {"train_loss": -42.07867431640625, "global_step": 300233, "epoch": 2481} {"train_loss": -43.87704086303711, "global_step": 300234, "epoch": 2481} {"train_loss": -43.204307556152344, "global_step": 300235, "epoch": 2481} {"train_loss": -43.372528076171875, "global_step": 300236, "epoch": 2481} {"train_loss": -43.63456344604492, "global_step": 300237, "epoch": 2481} {"train_loss": -43.872371673583984, "global_step": 300238, "epoch": 2481} {"train_loss": -43.89189529418945, "global_step": 300239, "epoch": 2481} {"train_loss": -43.0635986328125, "global_step": 300240, "epoch": 2481} {"train_loss": -42.51245880126953, "global_step": 300241, "epoch": 2481} {"train_loss": -43.9925651550293, "global_step": 300242, "epoch": 2481} {"train_loss": -44.3070068359375, "global_step": 300243, "epoch": 2481} {"train_loss": -43.99985885620117, "global_step": 300244, "epoch": 2481} {"train_loss": -44.569419860839844, "global_step": 300245, "epoch": 2481} {"train_loss": -44.757144927978516, "global_step": 300246, "epoch": 2481} {"train_loss": -43.86261749267578, "global_step": 300247, "epoch": 2481} {"train_loss": -44.225284576416016, "global_step": 300248, "epoch": 2481} {"train_loss": -44.661312103271484, "global_step": 300249, "epoch": 2481} {"train_loss": -43.757911682128906, "global_step": 300250, "epoch": 2481} {"train_loss": -43.54324722290039, "global_step": 300251, "epoch": 2481} {"train_loss": -42.50518035888672, "global_step": 300252, "epoch": 2481} {"train_loss": -43.00761032104492, "global_step": 300253, "epoch": 2481} {"train_loss": -43.43197250366211, "global_step": 300254, "epoch": 2481} {"train_loss": -44.504310607910156, "global_step": 300255, "epoch": 2481} {"train_loss": -44.01313400268555, "global_step": 300256, "epoch": 2481} {"train_loss": -43.3380012512207, "global_step": 300257, "epoch": 2481} {"train_loss": -42.6446647644043, "global_step": 300258, "epoch": 2481} {"train_loss": -43.60549545288086, "global_step": 300259, "epoch": 2481} {"train_loss": -44.31513595581055, "global_step": 300260, "epoch": 2481} {"train_loss": -43.55542755126953, "global_step": 300261, "epoch": 2481} {"train_loss": -43.7264404296875, "global_step": 300262, "epoch": 2481} {"train_loss": -43.45082473754883, "global_step": 300263, "epoch": 2481} {"train_loss": -44.12018966674805, "global_step": 300264, "epoch": 2481} {"train_loss": -43.99555587768555, "global_step": 300265, "epoch": 2481} {"train_loss": -42.6389274597168, "global_step": 300266, "epoch": 2481} {"train_loss": -43.62484359741211, "global_step": 300267, "epoch": 2481} {"train_loss": -44.438018798828125, "global_step": 300268, "epoch": 2481} {"train_loss": -44.13335418701172, "global_step": 300269, "epoch": 2481} {"train_loss": -42.27320098876953, "global_step": 300270, "epoch": 2481} {"train_loss": -43.37517547607422, "global_step": 300271, "epoch": 2481} {"train_loss": -44.20048141479492, "global_step": 300272, "epoch": 2481} {"train_loss": -42.362342834472656, "global_step": 300273, "epoch": 2481} {"train_loss": -41.24617385864258, "global_step": 300274, "epoch": 2481} {"train_loss": -42.85793685913086, "global_step": 300275, "epoch": 2481} {"train_loss": -41.40620803833008, "global_step": 300276, "epoch": 2481} {"train_loss": -43.908851623535156, "global_step": 300277, "epoch": 2481} {"train_loss": -42.76539993286133, "global_step": 300278, "epoch": 2481} {"train_loss": -42.55021286010742, "global_step": 300279, "epoch": 2481} {"train_loss": -41.005184173583984, "global_step": 300280, "epoch": 2481} {"train_loss": -41.424800872802734, "global_step": 300281, "epoch": 2481} {"train_loss": -43.56688690185547, "global_step": 300282, "epoch": 2481} {"train_loss": -41.510379791259766, "global_step": 300283, "epoch": 2481} {"train_loss": -42.53617477416992, "global_step": 300284, "epoch": 2481} {"train_loss": -42.7998161315918, "global_step": 300285, "epoch": 2481} {"train_loss": -42.915462493896484, "global_step": 300286, "epoch": 2481} {"train_loss": -43.84235382080078, "global_step": 300287, "epoch": 2481} {"train_loss": -42.53547286987305, "global_step": 300288, "epoch": 2481} {"train_loss": -41.77076721191406, "global_step": 300289, "epoch": 2481} {"train_loss": -43.268890380859375, "global_step": 300290, "epoch": 2481} {"train_loss": -42.15268325805664, "global_step": 300291, "epoch": 2481} {"train_loss": -43.0870475769043, "global_step": 300292, "epoch": 2481} {"train_loss": -43.44272232055664, "global_step": 300293, "epoch": 2481} {"train_loss": -43.698883056640625, "global_step": 300294, "epoch": 2481} {"train_loss": -43.17792892456055, "global_step": 300295, "epoch": 2481} {"train_loss": -44.05097198486328, "global_step": 300296, "epoch": 2481} {"train_loss": -43.147132873535156, "global_step": 300297, "epoch": 2481} {"train_loss": -44.01239776611328, "global_step": 300298, "epoch": 2481} {"train_loss": -43.872432708740234, "global_step": 300299, "epoch": 2481} {"train_loss": -43.19063949584961, "global_step": 300300, "epoch": 2481} {"train_loss": -42.28141784667969, "global_step": 300301, "epoch": 2481} {"train_loss": -43.77381134033203, "global_step": 300302, "epoch": 2481} {"train_loss": -43.18076705932617, "global_step": 300303, "epoch": 2481} {"train_loss": -43.430274963378906, "global_step": 300304, "epoch": 2481} {"train_loss": -43.49374008178711, "global_step": 300305, "epoch": 2481} {"train_loss": -44.36933517456055, "global_step": 300306, "epoch": 2481} {"train_loss": -44.12591552734375, "global_step": 300307, "epoch": 2481} {"train_loss": -43.364501953125, "global_step": 300308, "epoch": 2481} {"train_loss": -43.74011993408203, "global_step": 300309, "epoch": 2481} {"train_loss": -44.08357620239258, "global_step": 300310, "epoch": 2481} {"train_loss": -43.326778411865234, "global_step": 300311, "epoch": 2481} {"train_loss": -43.045997619628906, "global_step": 300312, "epoch": 2481} {"train_loss": -43.932945251464844, "global_step": 300313, "epoch": 2481} {"train_loss": -44.3416633605957, "global_step": 300314, "epoch": 2481} {"train_loss": -43.357330322265625, "global_step": 300315, "epoch": 2481} {"train_loss": -42.96004104614258, "global_step": 300316, "epoch": 2481} {"train_loss": -43.32689666748047, "global_step": 300317, "epoch": 2481} {"train_loss": -44.21581268310547, "global_step": 300318, "epoch": 2481} {"train_loss": -44.039772033691406, "global_step": 300319, "epoch": 2481} {"train_loss": -41.978206634521484, "global_step": 300320, "epoch": 2481} {"train_loss": -43.36034632911367, "global_step": 300321, "epoch": 2481, "val_loss": 2588677.0} {"train_loss": -42.660858154296875, "global_step": 300322, "epoch": 2482} {"train_loss": -42.22627258300781, "global_step": 300323, "epoch": 2482} {"train_loss": -43.639076232910156, "global_step": 300324, "epoch": 2482} {"train_loss": -42.766292572021484, "global_step": 300325, "epoch": 2482} {"train_loss": -44.22595977783203, "global_step": 300326, "epoch": 2482} {"train_loss": -43.83660888671875, "global_step": 300327, "epoch": 2482} {"train_loss": -43.08614730834961, "global_step": 300328, "epoch": 2482} {"train_loss": -44.04547119140625, "global_step": 300329, "epoch": 2482} {"train_loss": -43.131465911865234, "global_step": 300330, "epoch": 2482} {"train_loss": -44.07379150390625, "global_step": 300331, "epoch": 2482} {"train_loss": -44.221858978271484, "global_step": 300332, "epoch": 2482} {"train_loss": -43.20652770996094, "global_step": 300333, "epoch": 2482} {"train_loss": -43.87308883666992, "global_step": 300334, "epoch": 2482} {"train_loss": -43.552669525146484, "global_step": 300335, "epoch": 2482} {"train_loss": -44.078285217285156, "global_step": 300336, "epoch": 2482} {"train_loss": -43.73716354370117, "global_step": 300337, "epoch": 2482} {"train_loss": -42.82749938964844, "global_step": 300338, "epoch": 2482} {"train_loss": -44.355194091796875, "global_step": 300339, "epoch": 2482} {"train_loss": -42.97211456298828, "global_step": 300340, "epoch": 2482} {"train_loss": -43.42045974731445, "global_step": 300341, "epoch": 2482} {"train_loss": -42.841957092285156, "global_step": 300342, "epoch": 2482} {"train_loss": -43.71158981323242, "global_step": 300343, "epoch": 2482} {"train_loss": -44.21873474121094, "global_step": 300344, "epoch": 2482} {"train_loss": -43.671607971191406, "global_step": 300345, "epoch": 2482} {"train_loss": -43.72456741333008, "global_step": 300346, "epoch": 2482} {"train_loss": -44.01876449584961, "global_step": 300347, "epoch": 2482} {"train_loss": -43.62490463256836, "global_step": 300348, "epoch": 2482} {"train_loss": -44.16054153442383, "global_step": 300349, "epoch": 2482} {"train_loss": -43.583797454833984, "global_step": 300350, "epoch": 2482} {"train_loss": -44.05808639526367, "global_step": 300351, "epoch": 2482} {"train_loss": -43.93056869506836, "global_step": 300352, "epoch": 2482} {"train_loss": -43.39384078979492, "global_step": 300353, "epoch": 2482} {"train_loss": -43.77199935913086, "global_step": 300354, "epoch": 2482} {"train_loss": -43.41112518310547, "global_step": 300355, "epoch": 2482} {"train_loss": -44.1773567199707, "global_step": 300356, "epoch": 2482} {"train_loss": -43.569305419921875, "global_step": 300357, "epoch": 2482} {"train_loss": -44.36200714111328, "global_step": 300358, "epoch": 2482} {"train_loss": -44.2571907043457, "global_step": 300359, "epoch": 2482} {"train_loss": -44.04360580444336, "global_step": 300360, "epoch": 2482} {"train_loss": -44.339210510253906, "global_step": 300361, "epoch": 2482} {"train_loss": -43.87955856323242, "global_step": 300362, "epoch": 2482} {"train_loss": -43.65877914428711, "global_step": 300363, "epoch": 2482} {"train_loss": -44.152137756347656, "global_step": 300364, "epoch": 2482} {"train_loss": -44.40086364746094, "global_step": 300365, "epoch": 2482} {"train_loss": -43.20559310913086, "global_step": 300366, "epoch": 2482} {"train_loss": -40.9681282043457, "global_step": 300367, "epoch": 2482} {"train_loss": -44.00818634033203, "global_step": 300368, "epoch": 2482} {"train_loss": -41.541175842285156, "global_step": 300369, "epoch": 2482} {"train_loss": -42.87052536010742, "global_step": 300370, "epoch": 2482} {"train_loss": -43.88368606567383, "global_step": 300371, "epoch": 2482} {"train_loss": -42.308387756347656, "global_step": 300372, "epoch": 2482} {"train_loss": -42.91276168823242, "global_step": 300373, "epoch": 2482} {"train_loss": -43.61237335205078, "global_step": 300374, "epoch": 2482} {"train_loss": -43.69737243652344, "global_step": 300375, "epoch": 2482} {"train_loss": -42.492332458496094, "global_step": 300376, "epoch": 2482} {"train_loss": -42.690120697021484, "global_step": 300377, "epoch": 2482} {"train_loss": -44.01837158203125, "global_step": 300378, "epoch": 2482} {"train_loss": -44.203399658203125, "global_step": 300379, "epoch": 2482} {"train_loss": -43.84975814819336, "global_step": 300380, "epoch": 2482} {"train_loss": -43.751258850097656, "global_step": 300381, "epoch": 2482} {"train_loss": -43.983306884765625, "global_step": 300382, "epoch": 2482} {"train_loss": -43.76494216918945, "global_step": 300383, "epoch": 2482} {"train_loss": -43.15827560424805, "global_step": 300384, "epoch": 2482} {"train_loss": -44.04473114013672, "global_step": 300385, "epoch": 2482} {"train_loss": -43.297096252441406, "global_step": 300386, "epoch": 2482} {"train_loss": -42.90198516845703, "global_step": 300387, "epoch": 2482} {"train_loss": -42.94210433959961, "global_step": 300388, "epoch": 2482} {"train_loss": -43.46781539916992, "global_step": 300389, "epoch": 2482} {"train_loss": -42.61563491821289, "global_step": 300390, "epoch": 2482} {"train_loss": -42.16011428833008, "global_step": 300391, "epoch": 2482} {"train_loss": -42.83453369140625, "global_step": 300392, "epoch": 2482} {"train_loss": -44.19143295288086, "global_step": 300393, "epoch": 2482} {"train_loss": -42.87673568725586, "global_step": 300394, "epoch": 2482} {"train_loss": -43.10786819458008, "global_step": 300395, "epoch": 2482} {"train_loss": -43.72241973876953, "global_step": 300396, "epoch": 2482} {"train_loss": -43.30117416381836, "global_step": 300397, "epoch": 2482} {"train_loss": -43.832489013671875, "global_step": 300398, "epoch": 2482} {"train_loss": -44.18021774291992, "global_step": 300399, "epoch": 2482} {"train_loss": -42.11616134643555, "global_step": 300400, "epoch": 2482} {"train_loss": -44.34349822998047, "global_step": 300401, "epoch": 2482} {"train_loss": -42.76690673828125, "global_step": 300402, "epoch": 2482} {"train_loss": -41.65317916870117, "global_step": 300403, "epoch": 2482} {"train_loss": -43.942527770996094, "global_step": 300404, "epoch": 2482} {"train_loss": -42.02322006225586, "global_step": 300405, "epoch": 2482} {"train_loss": -42.49502944946289, "global_step": 300406, "epoch": 2482} {"train_loss": -43.15167999267578, "global_step": 300407, "epoch": 2482} {"train_loss": -42.610103607177734, "global_step": 300408, "epoch": 2482} {"train_loss": -42.87980270385742, "global_step": 300409, "epoch": 2482} {"train_loss": -43.41316604614258, "global_step": 300410, "epoch": 2482} {"train_loss": -43.466224670410156, "global_step": 300411, "epoch": 2482} {"train_loss": -43.1641960144043, "global_step": 300412, "epoch": 2482} {"train_loss": -41.70960235595703, "global_step": 300413, "epoch": 2482} {"train_loss": -42.683650970458984, "global_step": 300414, "epoch": 2482} {"train_loss": -42.433509826660156, "global_step": 300415, "epoch": 2482} {"train_loss": -43.35777282714844, "global_step": 300416, "epoch": 2482} {"train_loss": -43.58030700683594, "global_step": 300417, "epoch": 2482} {"train_loss": -43.628700256347656, "global_step": 300418, "epoch": 2482} {"train_loss": -43.14577865600586, "global_step": 300419, "epoch": 2482} {"train_loss": -43.363807678222656, "global_step": 300420, "epoch": 2482} {"train_loss": -43.69498825073242, "global_step": 300421, "epoch": 2482} {"train_loss": -42.990814208984375, "global_step": 300422, "epoch": 2482} {"train_loss": -43.320552825927734, "global_step": 300423, "epoch": 2482} {"train_loss": -41.613426208496094, "global_step": 300424, "epoch": 2482} {"train_loss": -43.71918869018555, "global_step": 300425, "epoch": 2482} {"train_loss": -41.44822311401367, "global_step": 300426, "epoch": 2482} {"train_loss": -42.8097038269043, "global_step": 300427, "epoch": 2482} {"train_loss": -41.876983642578125, "global_step": 300428, "epoch": 2482} {"train_loss": -44.00477981567383, "global_step": 300429, "epoch": 2482} {"train_loss": -43.295108795166016, "global_step": 300430, "epoch": 2482} {"train_loss": -43.04354476928711, "global_step": 300431, "epoch": 2482} {"train_loss": -44.048091888427734, "global_step": 300432, "epoch": 2482} {"train_loss": -43.70207595825195, "global_step": 300433, "epoch": 2482} {"train_loss": -43.3591194152832, "global_step": 300434, "epoch": 2482} {"train_loss": -43.58438491821289, "global_step": 300435, "epoch": 2482} {"train_loss": -43.58176803588867, "global_step": 300436, "epoch": 2482} {"train_loss": -44.50272750854492, "global_step": 300437, "epoch": 2482} {"train_loss": -43.709598541259766, "global_step": 300438, "epoch": 2482} {"train_loss": -42.970947265625, "global_step": 300439, "epoch": 2482} {"train_loss": -42.073692321777344, "global_step": 300440, "epoch": 2482} {"train_loss": -43.492679595947266, "global_step": 300441, "epoch": 2482} {"train_loss": -43.35289893662634, "global_step": 300442, "epoch": 2482, "val_loss": 2489158.25} {"train_loss": -42.61497497558594, "global_step": 300443, "epoch": 2483} {"train_loss": -42.77801513671875, "global_step": 300444, "epoch": 2483} {"train_loss": -44.164791107177734, "global_step": 300445, "epoch": 2483} {"train_loss": -41.866668701171875, "global_step": 300446, "epoch": 2483} {"train_loss": -43.49187469482422, "global_step": 300447, "epoch": 2483} {"train_loss": -43.95746612548828, "global_step": 300448, "epoch": 2483} {"train_loss": -43.85687255859375, "global_step": 300449, "epoch": 2483} {"train_loss": -43.09165954589844, "global_step": 300450, "epoch": 2483} {"train_loss": -43.57135772705078, "global_step": 300451, "epoch": 2483} {"train_loss": -43.62729263305664, "global_step": 300452, "epoch": 2483} {"train_loss": -42.952789306640625, "global_step": 300453, "epoch": 2483} {"train_loss": -42.4652214050293, "global_step": 300454, "epoch": 2483} {"train_loss": -44.00962448120117, "global_step": 300455, "epoch": 2483} {"train_loss": -43.53882598876953, "global_step": 300456, "epoch": 2483} {"train_loss": -43.767181396484375, "global_step": 300457, "epoch": 2483} {"train_loss": -42.522216796875, "global_step": 300458, "epoch": 2483} {"train_loss": -43.1285400390625, "global_step": 300459, "epoch": 2483} {"train_loss": -43.979148864746094, "global_step": 300460, "epoch": 2483} {"train_loss": -43.35488510131836, "global_step": 300461, "epoch": 2483} {"train_loss": -43.70926284790039, "global_step": 300462, "epoch": 2483} {"train_loss": -43.827049255371094, "global_step": 300463, "epoch": 2483} {"train_loss": -43.7445068359375, "global_step": 300464, "epoch": 2483} {"train_loss": -43.841609954833984, "global_step": 300465, "epoch": 2483} {"train_loss": -44.047149658203125, "global_step": 300466, "epoch": 2483} {"train_loss": -43.6931037902832, "global_step": 300467, "epoch": 2483} {"train_loss": -43.552268981933594, "global_step": 300468, "epoch": 2483} {"train_loss": -43.924659729003906, "global_step": 300469, "epoch": 2483} {"train_loss": -43.01606750488281, "global_step": 300470, "epoch": 2483} {"train_loss": -43.25962448120117, "global_step": 300471, "epoch": 2483} {"train_loss": -43.58613967895508, "global_step": 300472, "epoch": 2483} {"train_loss": -43.701698303222656, "global_step": 300473, "epoch": 2483} {"train_loss": -43.03242874145508, "global_step": 300474, "epoch": 2483} {"train_loss": -43.6146125793457, "global_step": 300475, "epoch": 2483} {"train_loss": -44.009456634521484, "global_step": 300476, "epoch": 2483} {"train_loss": -44.576839447021484, "global_step": 300477, "epoch": 2483} {"train_loss": -43.601139068603516, "global_step": 300478, "epoch": 2483} {"train_loss": -43.6112174987793, "global_step": 300479, "epoch": 2483} {"train_loss": -44.243255615234375, "global_step": 300480, "epoch": 2483} {"train_loss": -44.3715705871582, "global_step": 300481, "epoch": 2483} {"train_loss": -43.816932678222656, "global_step": 300482, "epoch": 2483} {"train_loss": -43.75916290283203, "global_step": 300483, "epoch": 2483} {"train_loss": -43.3203010559082, "global_step": 300484, "epoch": 2483} {"train_loss": -43.693450927734375, "global_step": 300485, "epoch": 2483} {"train_loss": -42.79773712158203, "global_step": 300486, "epoch": 2483} {"train_loss": -42.37968063354492, "global_step": 300487, "epoch": 2483} {"train_loss": -44.51603317260742, "global_step": 300488, "epoch": 2483} {"train_loss": -42.919307708740234, "global_step": 300489, "epoch": 2483} {"train_loss": -42.237060546875, "global_step": 300490, "epoch": 2483} {"train_loss": -43.44260787963867, "global_step": 300491, "epoch": 2483} {"train_loss": -44.14570236206055, "global_step": 300492, "epoch": 2483} {"train_loss": -43.52533721923828, "global_step": 300493, "epoch": 2483} {"train_loss": -43.350223541259766, "global_step": 300494, "epoch": 2483} {"train_loss": -44.90218734741211, "global_step": 300495, "epoch": 2483} {"train_loss": -43.794654846191406, "global_step": 300496, "epoch": 2483} {"train_loss": -44.20405960083008, "global_step": 300497, "epoch": 2483} {"train_loss": -43.71647262573242, "global_step": 300498, "epoch": 2483} {"train_loss": -43.2285270690918, "global_step": 300499, "epoch": 2483} {"train_loss": -44.187191009521484, "global_step": 300500, "epoch": 2483} {"train_loss": -43.72834014892578, "global_step": 300501, "epoch": 2483} {"train_loss": -42.640865325927734, "global_step": 300502, "epoch": 2483} {"train_loss": -43.09464645385742, "global_step": 300503, "epoch": 2483} {"train_loss": -43.48702621459961, "global_step": 300504, "epoch": 2483} {"train_loss": -43.20964813232422, "global_step": 300505, "epoch": 2483} {"train_loss": -42.8768424987793, "global_step": 300506, "epoch": 2483} {"train_loss": -43.11261749267578, "global_step": 300507, "epoch": 2483} {"train_loss": -43.97825241088867, "global_step": 300508, "epoch": 2483} {"train_loss": -43.55819320678711, "global_step": 300509, "epoch": 2483} {"train_loss": -42.94736099243164, "global_step": 300510, "epoch": 2483} {"train_loss": -42.5472526550293, "global_step": 300511, "epoch": 2483} {"train_loss": -43.07627868652344, "global_step": 300512, "epoch": 2483} {"train_loss": -43.2916374206543, "global_step": 300513, "epoch": 2483} {"train_loss": -43.31757354736328, "global_step": 300514, "epoch": 2483} {"train_loss": -43.56538009643555, "global_step": 300515, "epoch": 2483} {"train_loss": -43.19767761230469, "global_step": 300516, "epoch": 2483} {"train_loss": -41.85346603393555, "global_step": 300517, "epoch": 2483} {"train_loss": -43.40096664428711, "global_step": 300518, "epoch": 2483} {"train_loss": -42.160823822021484, "global_step": 300519, "epoch": 2483} {"train_loss": -44.06498336791992, "global_step": 300520, "epoch": 2483} {"train_loss": -41.57061004638672, "global_step": 300521, "epoch": 2483} {"train_loss": -43.53519058227539, "global_step": 300522, "epoch": 2483} {"train_loss": -43.87092208862305, "global_step": 300523, "epoch": 2483} {"train_loss": -42.91794204711914, "global_step": 300524, "epoch": 2483} {"train_loss": -43.49008560180664, "global_step": 300525, "epoch": 2483} {"train_loss": -43.1710205078125, "global_step": 300526, "epoch": 2483} {"train_loss": -43.01585388183594, "global_step": 300527, "epoch": 2483} {"train_loss": -41.76701736450195, "global_step": 300528, "epoch": 2483} {"train_loss": -43.36385726928711, "global_step": 300529, "epoch": 2483} {"train_loss": -42.83859634399414, "global_step": 300530, "epoch": 2483} {"train_loss": -43.38021469116211, "global_step": 300531, "epoch": 2483} {"train_loss": -42.756011962890625, "global_step": 300532, "epoch": 2483} {"train_loss": -42.59928512573242, "global_step": 300533, "epoch": 2483} {"train_loss": -43.54812240600586, "global_step": 300534, "epoch": 2483} {"train_loss": -43.722530364990234, "global_step": 300535, "epoch": 2483} {"train_loss": -43.67948532104492, "global_step": 300536, "epoch": 2483} {"train_loss": -43.515804290771484, "global_step": 300537, "epoch": 2483} {"train_loss": -43.431575775146484, "global_step": 300538, "epoch": 2483} {"train_loss": -43.7584228515625, "global_step": 300539, "epoch": 2483} {"train_loss": -44.10264587402344, "global_step": 300540, "epoch": 2483} {"train_loss": -43.72234344482422, "global_step": 300541, "epoch": 2483} {"train_loss": -43.49772644042969, "global_step": 300542, "epoch": 2483} {"train_loss": -43.56719207763672, "global_step": 300543, "epoch": 2483} {"train_loss": -43.16707992553711, "global_step": 300544, "epoch": 2483} {"train_loss": -43.894935607910156, "global_step": 300545, "epoch": 2483} {"train_loss": -44.038185119628906, "global_step": 300546, "epoch": 2483} {"train_loss": -44.05356979370117, "global_step": 300547, "epoch": 2483} {"train_loss": -44.300209045410156, "global_step": 300548, "epoch": 2483} {"train_loss": -44.031105041503906, "global_step": 300549, "epoch": 2483} {"train_loss": -44.234737396240234, "global_step": 300550, "epoch": 2483} {"train_loss": -43.62006759643555, "global_step": 300551, "epoch": 2483} {"train_loss": -44.42153549194336, "global_step": 300552, "epoch": 2483} {"train_loss": -43.20949172973633, "global_step": 300553, "epoch": 2483} {"train_loss": -43.4268913269043, "global_step": 300554, "epoch": 2483} {"train_loss": -43.955745697021484, "global_step": 300555, "epoch": 2483} {"train_loss": -44.05662155151367, "global_step": 300556, "epoch": 2483} {"train_loss": -43.00741195678711, "global_step": 300557, "epoch": 2483} {"train_loss": -43.921321868896484, "global_step": 300558, "epoch": 2483} {"train_loss": -43.497352600097656, "global_step": 300559, "epoch": 2483} {"train_loss": -42.919403076171875, "global_step": 300560, "epoch": 2483} {"train_loss": -44.0845947265625, "global_step": 300561, "epoch": 2483} {"train_loss": -41.69967269897461, "global_step": 300562, "epoch": 2483} {"train_loss": -43.44833944651706, "global_step": 300563, "epoch": 2483, "val_loss": 2611374.25} {"train_loss": -43.20964431762695, "global_step": 300564, "epoch": 2484} {"train_loss": -41.72504425048828, "global_step": 300565, "epoch": 2484} {"train_loss": -43.3591194152832, "global_step": 300566, "epoch": 2484} {"train_loss": -42.355106353759766, "global_step": 300567, "epoch": 2484} {"train_loss": -42.4920768737793, "global_step": 300568, "epoch": 2484} {"train_loss": -43.084327697753906, "global_step": 300569, "epoch": 2484} {"train_loss": -43.498653411865234, "global_step": 300570, "epoch": 2484} {"train_loss": -43.470054626464844, "global_step": 300571, "epoch": 2484} {"train_loss": -42.415260314941406, "global_step": 300572, "epoch": 2484} {"train_loss": -43.86521530151367, "global_step": 300573, "epoch": 2484} {"train_loss": -43.84870529174805, "global_step": 300574, "epoch": 2484} {"train_loss": -43.52186965942383, "global_step": 300575, "epoch": 2484} {"train_loss": -43.742286682128906, "global_step": 300576, "epoch": 2484} {"train_loss": -43.981048583984375, "global_step": 300577, "epoch": 2484} {"train_loss": -42.322181701660156, "global_step": 300578, "epoch": 2484} {"train_loss": -42.41715621948242, "global_step": 300579, "epoch": 2484} {"train_loss": -44.18270492553711, "global_step": 300580, "epoch": 2484} {"train_loss": -42.0621452331543, "global_step": 300581, "epoch": 2484} {"train_loss": -44.09901809692383, "global_step": 300582, "epoch": 2484} {"train_loss": -42.75935745239258, "global_step": 300583, "epoch": 2484} {"train_loss": -43.01245880126953, "global_step": 300584, "epoch": 2484} {"train_loss": -44.521663665771484, "global_step": 300585, "epoch": 2484} {"train_loss": -42.52364730834961, "global_step": 300586, "epoch": 2484} {"train_loss": -43.43231964111328, "global_step": 300587, "epoch": 2484} {"train_loss": -43.76603698730469, "global_step": 300588, "epoch": 2484} {"train_loss": -42.52663803100586, "global_step": 300589, "epoch": 2484} {"train_loss": -44.107582092285156, "global_step": 300590, "epoch": 2484} {"train_loss": -43.592594146728516, "global_step": 300591, "epoch": 2484} {"train_loss": -42.6083869934082, "global_step": 300592, "epoch": 2484} {"train_loss": -44.07973861694336, "global_step": 300593, "epoch": 2484} {"train_loss": -42.24580001831055, "global_step": 300594, "epoch": 2484} {"train_loss": -42.73933792114258, "global_step": 300595, "epoch": 2484} {"train_loss": -44.15214920043945, "global_step": 300596, "epoch": 2484} {"train_loss": -41.58086395263672, "global_step": 300597, "epoch": 2484} {"train_loss": -44.530574798583984, "global_step": 300598, "epoch": 2484} {"train_loss": -39.12382125854492, "global_step": 300599, "epoch": 2484} {"train_loss": -44.25358200073242, "global_step": 300600, "epoch": 2484} {"train_loss": -43.50376510620117, "global_step": 300601, "epoch": 2484} {"train_loss": -43.00364303588867, "global_step": 300602, "epoch": 2484} {"train_loss": -43.72704315185547, "global_step": 300603, "epoch": 2484} {"train_loss": -43.14302062988281, "global_step": 300604, "epoch": 2484} {"train_loss": -42.271114349365234, "global_step": 300605, "epoch": 2484} {"train_loss": -42.79317855834961, "global_step": 300606, "epoch": 2484} {"train_loss": -39.22245788574219, "global_step": 300607, "epoch": 2484} {"train_loss": -40.86794662475586, "global_step": 300608, "epoch": 2484} {"train_loss": -43.30685043334961, "global_step": 300609, "epoch": 2484} {"train_loss": -43.41876220703125, "global_step": 300610, "epoch": 2484} {"train_loss": -43.85374069213867, "global_step": 300611, "epoch": 2484} {"train_loss": -43.17626190185547, "global_step": 300612, "epoch": 2484} {"train_loss": -44.10885238647461, "global_step": 300613, "epoch": 2484} {"train_loss": -43.63755416870117, "global_step": 300614, "epoch": 2484} {"train_loss": -41.90937042236328, "global_step": 300615, "epoch": 2484} {"train_loss": -43.23502731323242, "global_step": 300616, "epoch": 2484} {"train_loss": -42.834407806396484, "global_step": 300617, "epoch": 2484} {"train_loss": -43.10901641845703, "global_step": 300618, "epoch": 2484} {"train_loss": -40.15095138549805, "global_step": 300619, "epoch": 2484} {"train_loss": -43.37413024902344, "global_step": 300620, "epoch": 2484} {"train_loss": -32.665618896484375, "global_step": 300621, "epoch": 2484} {"train_loss": -39.355255126953125, "global_step": 300622, "epoch": 2484} {"train_loss": -43.21259307861328, "global_step": 300623, "epoch": 2484} {"train_loss": -42.00063705444336, "global_step": 300624, "epoch": 2484} {"train_loss": -41.990230560302734, "global_step": 300625, "epoch": 2484} {"train_loss": -43.646785736083984, "global_step": 300626, "epoch": 2484} {"train_loss": -42.27399444580078, "global_step": 300627, "epoch": 2484} {"train_loss": -39.82218551635742, "global_step": 300628, "epoch": 2484} {"train_loss": -41.55507278442383, "global_step": 300629, "epoch": 2484} {"train_loss": -40.870357513427734, "global_step": 300630, "epoch": 2484} {"train_loss": -42.119564056396484, "global_step": 300631, "epoch": 2484} {"train_loss": -41.98379135131836, "global_step": 300632, "epoch": 2484} {"train_loss": -43.09879684448242, "global_step": 300633, "epoch": 2484} {"train_loss": -40.659400939941406, "global_step": 300634, "epoch": 2484} {"train_loss": -43.5440673828125, "global_step": 300635, "epoch": 2484} {"train_loss": -41.340633392333984, "global_step": 300636, "epoch": 2484} {"train_loss": -42.728145599365234, "global_step": 300637, "epoch": 2484} {"train_loss": -42.67079544067383, "global_step": 300638, "epoch": 2484} {"train_loss": -42.482704162597656, "global_step": 300639, "epoch": 2484} {"train_loss": -42.36599349975586, "global_step": 300640, "epoch": 2484} {"train_loss": -39.40220260620117, "global_step": 300641, "epoch": 2484} {"train_loss": -43.47262191772461, "global_step": 300642, "epoch": 2484} {"train_loss": -43.67325973510742, "global_step": 300643, "epoch": 2484} {"train_loss": -42.96517562866211, "global_step": 300644, "epoch": 2484} {"train_loss": -43.80811309814453, "global_step": 300645, "epoch": 2484} {"train_loss": -43.335838317871094, "global_step": 300646, "epoch": 2484} {"train_loss": -42.66371536254883, "global_step": 300647, "epoch": 2484} {"train_loss": -43.45966720581055, "global_step": 300648, "epoch": 2484} {"train_loss": -43.38956069946289, "global_step": 300649, "epoch": 2484} {"train_loss": -43.45290756225586, "global_step": 300650, "epoch": 2484} {"train_loss": -43.48977279663086, "global_step": 300651, "epoch": 2484} {"train_loss": -42.206356048583984, "global_step": 300652, "epoch": 2484} {"train_loss": -43.65446090698242, "global_step": 300653, "epoch": 2484} {"train_loss": -43.2337646484375, "global_step": 300654, "epoch": 2484} {"train_loss": -43.584228515625, "global_step": 300655, "epoch": 2484} {"train_loss": -43.811161041259766, "global_step": 300656, "epoch": 2484} {"train_loss": -43.57706832885742, "global_step": 300657, "epoch": 2484} {"train_loss": -43.81169891357422, "global_step": 300658, "epoch": 2484} {"train_loss": -42.287567138671875, "global_step": 300659, "epoch": 2484} {"train_loss": -42.70276641845703, "global_step": 300660, "epoch": 2484} {"train_loss": -43.40018844604492, "global_step": 300661, "epoch": 2484} {"train_loss": -42.66325378417969, "global_step": 300662, "epoch": 2484} {"train_loss": -44.297828674316406, "global_step": 300663, "epoch": 2484} {"train_loss": -44.03413009643555, "global_step": 300664, "epoch": 2484} {"train_loss": -43.909297943115234, "global_step": 300665, "epoch": 2484} {"train_loss": -43.66707229614258, "global_step": 300666, "epoch": 2484} {"train_loss": -43.723995208740234, "global_step": 300667, "epoch": 2484} {"train_loss": -42.85757064819336, "global_step": 300668, "epoch": 2484} {"train_loss": -43.19194030761719, "global_step": 300669, "epoch": 2484} {"train_loss": -43.87885284423828, "global_step": 300670, "epoch": 2484} {"train_loss": -43.45573806762695, "global_step": 300671, "epoch": 2484} {"train_loss": -43.940643310546875, "global_step": 300672, "epoch": 2484} {"train_loss": -43.49414825439453, "global_step": 300673, "epoch": 2484} {"train_loss": -43.04412841796875, "global_step": 300674, "epoch": 2484} {"train_loss": -43.66011428833008, "global_step": 300675, "epoch": 2484} {"train_loss": -43.51805877685547, "global_step": 300676, "epoch": 2484} {"train_loss": -44.252620697021484, "global_step": 300677, "epoch": 2484} {"train_loss": -43.41872024536133, "global_step": 300678, "epoch": 2484} {"train_loss": -44.159305572509766, "global_step": 300679, "epoch": 2484} {"train_loss": -44.12517547607422, "global_step": 300680, "epoch": 2484} {"train_loss": -44.3249397277832, "global_step": 300681, "epoch": 2484} {"train_loss": -44.08034896850586, "global_step": 300682, "epoch": 2484} {"train_loss": -43.72086715698242, "global_step": 300683, "epoch": 2484} {"train_loss": -42.89727890392965, "global_step": 300684, "epoch": 2484, "val_loss": 2506750.25} {"train_loss": -44.60699462890625, "global_step": 300685, "epoch": 2485} {"train_loss": -43.52546691894531, "global_step": 300686, "epoch": 2485} {"train_loss": -43.462615966796875, "global_step": 300687, "epoch": 2485} {"train_loss": -41.68488693237305, "global_step": 300688, "epoch": 2485} {"train_loss": -42.33309555053711, "global_step": 300689, "epoch": 2485} {"train_loss": -43.26541519165039, "global_step": 300690, "epoch": 2485} {"train_loss": -42.35891342163086, "global_step": 300691, "epoch": 2485} {"train_loss": -40.753963470458984, "global_step": 300692, "epoch": 2485} {"train_loss": -42.73618698120117, "global_step": 300693, "epoch": 2485} {"train_loss": -41.05467987060547, "global_step": 300694, "epoch": 2485} {"train_loss": -42.85650634765625, "global_step": 300695, "epoch": 2485} {"train_loss": -40.832767486572266, "global_step": 300696, "epoch": 2485} {"train_loss": -39.60238265991211, "global_step": 300697, "epoch": 2485} {"train_loss": -42.94819259643555, "global_step": 300698, "epoch": 2485} {"train_loss": -41.51202392578125, "global_step": 300699, "epoch": 2485} {"train_loss": -43.04012680053711, "global_step": 300700, "epoch": 2485} {"train_loss": -41.794883728027344, "global_step": 300701, "epoch": 2485} {"train_loss": -44.02598190307617, "global_step": 300702, "epoch": 2485} {"train_loss": -41.99140167236328, "global_step": 300703, "epoch": 2485} {"train_loss": -41.0576171875, "global_step": 300704, "epoch": 2485} {"train_loss": -43.13811111450195, "global_step": 300705, "epoch": 2485} {"train_loss": -42.370361328125, "global_step": 300706, "epoch": 2485} {"train_loss": -43.47730255126953, "global_step": 300707, "epoch": 2485} {"train_loss": -42.15877914428711, "global_step": 300708, "epoch": 2485} {"train_loss": -43.748958587646484, "global_step": 300709, "epoch": 2485} {"train_loss": -42.14353561401367, "global_step": 300710, "epoch": 2485} {"train_loss": -42.649105072021484, "global_step": 300711, "epoch": 2485} {"train_loss": -42.673004150390625, "global_step": 300712, "epoch": 2485} {"train_loss": -43.89887619018555, "global_step": 300713, "epoch": 2485} {"train_loss": -43.608036041259766, "global_step": 300714, "epoch": 2485} {"train_loss": -43.14271926879883, "global_step": 300715, "epoch": 2485} {"train_loss": -43.57118606567383, "global_step": 300716, "epoch": 2485} {"train_loss": -42.73643493652344, "global_step": 300717, "epoch": 2485} {"train_loss": -43.5548210144043, "global_step": 300718, "epoch": 2485} {"train_loss": -43.20820236206055, "global_step": 300719, "epoch": 2485} {"train_loss": -43.30471420288086, "global_step": 300720, "epoch": 2485} {"train_loss": -43.3265266418457, "global_step": 300721, "epoch": 2485} {"train_loss": -41.980682373046875, "global_step": 300722, "epoch": 2485} {"train_loss": -42.60505294799805, "global_step": 300723, "epoch": 2485} {"train_loss": -43.93770217895508, "global_step": 300724, "epoch": 2485} {"train_loss": -43.66944122314453, "global_step": 300725, "epoch": 2485} {"train_loss": -43.52572250366211, "global_step": 300726, "epoch": 2485} {"train_loss": -43.67372512817383, "global_step": 300727, "epoch": 2485} {"train_loss": -41.849605560302734, "global_step": 300728, "epoch": 2485} {"train_loss": -44.01874542236328, "global_step": 300729, "epoch": 2485} {"train_loss": -42.95372772216797, "global_step": 300730, "epoch": 2485} {"train_loss": -43.676265716552734, "global_step": 300731, "epoch": 2485} {"train_loss": -43.69834899902344, "global_step": 300732, "epoch": 2485} {"train_loss": -42.51566696166992, "global_step": 300733, "epoch": 2485} {"train_loss": -43.53533172607422, "global_step": 300734, "epoch": 2485} {"train_loss": -42.8509635925293, "global_step": 300735, "epoch": 2485} {"train_loss": -42.262054443359375, "global_step": 300736, "epoch": 2485} {"train_loss": -44.4935302734375, "global_step": 300737, "epoch": 2485} {"train_loss": -43.404029846191406, "global_step": 300738, "epoch": 2485} {"train_loss": -43.825801849365234, "global_step": 300739, "epoch": 2485} {"train_loss": -43.92280960083008, "global_step": 300740, "epoch": 2485} {"train_loss": -43.56013870239258, "global_step": 300741, "epoch": 2485} {"train_loss": -44.01554489135742, "global_step": 300742, "epoch": 2485} {"train_loss": -42.526363372802734, "global_step": 300743, "epoch": 2485} {"train_loss": -43.383209228515625, "global_step": 300744, "epoch": 2485} {"train_loss": -44.00285339355469, "global_step": 300745, "epoch": 2485} {"train_loss": -43.469844818115234, "global_step": 300746, "epoch": 2485} {"train_loss": -43.06965255737305, "global_step": 300747, "epoch": 2485} {"train_loss": -43.38881301879883, "global_step": 300748, "epoch": 2485} {"train_loss": -43.41996383666992, "global_step": 300749, "epoch": 2485} {"train_loss": -44.12248229980469, "global_step": 300750, "epoch": 2485} {"train_loss": -44.092132568359375, "global_step": 300751, "epoch": 2485} {"train_loss": -44.084835052490234, "global_step": 300752, "epoch": 2485} {"train_loss": -43.938209533691406, "global_step": 300753, "epoch": 2485} {"train_loss": -43.82976150512695, "global_step": 300754, "epoch": 2485} {"train_loss": -43.903709411621094, "global_step": 300755, "epoch": 2485} {"train_loss": -43.76581954956055, "global_step": 300756, "epoch": 2485} {"train_loss": -43.84804153442383, "global_step": 300757, "epoch": 2485} {"train_loss": -44.2055778503418, "global_step": 300758, "epoch": 2485} {"train_loss": -43.69523620605469, "global_step": 300759, "epoch": 2485} {"train_loss": -44.35818099975586, "global_step": 300760, "epoch": 2485} {"train_loss": -43.50735092163086, "global_step": 300761, "epoch": 2485} {"train_loss": -44.72382736206055, "global_step": 300762, "epoch": 2485} {"train_loss": -44.38120651245117, "global_step": 300763, "epoch": 2485} {"train_loss": -43.97078323364258, "global_step": 300764, "epoch": 2485} {"train_loss": -43.74300003051758, "global_step": 300765, "epoch": 2485} {"train_loss": -44.188720703125, "global_step": 300766, "epoch": 2485} {"train_loss": -44.326904296875, "global_step": 300767, "epoch": 2485} {"train_loss": -43.637298583984375, "global_step": 300768, "epoch": 2485} {"train_loss": -42.53609848022461, "global_step": 300769, "epoch": 2485} {"train_loss": -44.347591400146484, "global_step": 300770, "epoch": 2485} {"train_loss": -43.79553985595703, "global_step": 300771, "epoch": 2485} {"train_loss": -44.66025161743164, "global_step": 300772, "epoch": 2485} {"train_loss": -44.292598724365234, "global_step": 300773, "epoch": 2485} {"train_loss": -43.8980827331543, "global_step": 300774, "epoch": 2485} {"train_loss": -43.0500602722168, "global_step": 300775, "epoch": 2485} {"train_loss": -43.771461486816406, "global_step": 300776, "epoch": 2485} {"train_loss": -44.41697311401367, "global_step": 300777, "epoch": 2485} {"train_loss": -43.919891357421875, "global_step": 300778, "epoch": 2485} {"train_loss": -43.91671371459961, "global_step": 300779, "epoch": 2485} {"train_loss": -45.06663131713867, "global_step": 300780, "epoch": 2485} {"train_loss": -42.91329574584961, "global_step": 300781, "epoch": 2485} {"train_loss": -43.89187240600586, "global_step": 300782, "epoch": 2485} {"train_loss": -44.27158737182617, "global_step": 300783, "epoch": 2485} {"train_loss": -44.51957321166992, "global_step": 300784, "epoch": 2485} {"train_loss": -44.760250091552734, "global_step": 300785, "epoch": 2485} {"train_loss": -44.24797058105469, "global_step": 300786, "epoch": 2485} {"train_loss": -44.27014923095703, "global_step": 300787, "epoch": 2485} {"train_loss": -43.329097747802734, "global_step": 300788, "epoch": 2485} {"train_loss": -43.769412994384766, "global_step": 300789, "epoch": 2485} {"train_loss": -43.382381439208984, "global_step": 300790, "epoch": 2485} {"train_loss": -43.62574768066406, "global_step": 300791, "epoch": 2485} {"train_loss": -43.55592727661133, "global_step": 300792, "epoch": 2485} {"train_loss": -43.68955612182617, "global_step": 300793, "epoch": 2485} {"train_loss": -43.16181182861328, "global_step": 300794, "epoch": 2485} {"train_loss": -43.31321334838867, "global_step": 300795, "epoch": 2485} {"train_loss": -42.314910888671875, "global_step": 300796, "epoch": 2485} {"train_loss": -42.50419616699219, "global_step": 300797, "epoch": 2485} {"train_loss": -42.91969680786133, "global_step": 300798, "epoch": 2485} {"train_loss": -42.19618606567383, "global_step": 300799, "epoch": 2485} {"train_loss": -42.51905059814453, "global_step": 300800, "epoch": 2485} {"train_loss": -40.12034225463867, "global_step": 300801, "epoch": 2485} {"train_loss": -42.10185623168945, "global_step": 300802, "epoch": 2485} {"train_loss": -36.78430938720703, "global_step": 300803, "epoch": 2485} {"train_loss": -33.6812858581543, "global_step": 300804, "epoch": 2485} {"train_loss": -43.01657325177153, "global_step": 300805, "epoch": 2485, "val_loss": 2615383.5} {"train_loss": -38.3743896484375, "global_step": 300806, "epoch": 2486} {"train_loss": -40.13310623168945, "global_step": 300807, "epoch": 2486} {"train_loss": -33.54463577270508, "global_step": 300808, "epoch": 2486} {"train_loss": -40.57493209838867, "global_step": 300809, "epoch": 2486} {"train_loss": -36.24821472167969, "global_step": 300810, "epoch": 2486} {"train_loss": -38.60950469970703, "global_step": 300811, "epoch": 2486} {"train_loss": -36.612220764160156, "global_step": 300812, "epoch": 2486} {"train_loss": -40.126792907714844, "global_step": 300813, "epoch": 2486} {"train_loss": -40.737525939941406, "global_step": 300814, "epoch": 2486} {"train_loss": -39.84646987915039, "global_step": 300815, "epoch": 2486} {"train_loss": -41.06679153442383, "global_step": 300816, "epoch": 2486} {"train_loss": -38.772884368896484, "global_step": 300817, "epoch": 2486} {"train_loss": -42.668251037597656, "global_step": 300818, "epoch": 2486} {"train_loss": -41.282737731933594, "global_step": 300819, "epoch": 2486} {"train_loss": -42.35791015625, "global_step": 300820, "epoch": 2486} {"train_loss": -40.15072250366211, "global_step": 300821, "epoch": 2486} {"train_loss": -41.8017463684082, "global_step": 300822, "epoch": 2486} {"train_loss": -40.067604064941406, "global_step": 300823, "epoch": 2486} {"train_loss": -41.529884338378906, "global_step": 300824, "epoch": 2486} {"train_loss": -40.656463623046875, "global_step": 300825, "epoch": 2486} {"train_loss": -40.88017272949219, "global_step": 300826, "epoch": 2486} {"train_loss": -41.305721282958984, "global_step": 300827, "epoch": 2486} {"train_loss": -41.384063720703125, "global_step": 300828, "epoch": 2486} {"train_loss": -41.94440841674805, "global_step": 300829, "epoch": 2486} {"train_loss": -41.844024658203125, "global_step": 300830, "epoch": 2486} {"train_loss": -41.470829010009766, "global_step": 300831, "epoch": 2486} {"train_loss": -42.2030143737793, "global_step": 300832, "epoch": 2486} {"train_loss": -41.430938720703125, "global_step": 300833, "epoch": 2486} {"train_loss": -41.75404739379883, "global_step": 300834, "epoch": 2486} {"train_loss": -42.785743713378906, "global_step": 300835, "epoch": 2486} {"train_loss": -42.300514221191406, "global_step": 300836, "epoch": 2486} {"train_loss": -42.612754821777344, "global_step": 300837, "epoch": 2486} {"train_loss": -42.65918731689453, "global_step": 300838, "epoch": 2486} {"train_loss": -42.51251983642578, "global_step": 300839, "epoch": 2486} {"train_loss": -43.55971908569336, "global_step": 300840, "epoch": 2486} {"train_loss": -42.2401123046875, "global_step": 300841, "epoch": 2486} {"train_loss": -43.0602912902832, "global_step": 300842, "epoch": 2486} {"train_loss": -42.04391098022461, "global_step": 300843, "epoch": 2486} {"train_loss": -43.13309860229492, "global_step": 300844, "epoch": 2486} {"train_loss": -42.58718490600586, "global_step": 300845, "epoch": 2486} {"train_loss": -43.64179611206055, "global_step": 300846, "epoch": 2486} {"train_loss": -42.529903411865234, "global_step": 300847, "epoch": 2486} {"train_loss": -42.415775299072266, "global_step": 300848, "epoch": 2486} {"train_loss": -43.582984924316406, "global_step": 300849, "epoch": 2486} {"train_loss": -42.76631164550781, "global_step": 300850, "epoch": 2486} {"train_loss": -43.50791549682617, "global_step": 300851, "epoch": 2486} {"train_loss": -43.4174690246582, "global_step": 300852, "epoch": 2486} {"train_loss": -43.1208610534668, "global_step": 300853, "epoch": 2486} {"train_loss": -43.7054443359375, "global_step": 300854, "epoch": 2486} {"train_loss": -43.412078857421875, "global_step": 300855, "epoch": 2486} {"train_loss": -43.526729583740234, "global_step": 300856, "epoch": 2486} {"train_loss": -42.89570236206055, "global_step": 300857, "epoch": 2486} {"train_loss": -43.47241973876953, "global_step": 300858, "epoch": 2486} {"train_loss": -43.3082275390625, "global_step": 300859, "epoch": 2486} {"train_loss": -43.96023178100586, "global_step": 300860, "epoch": 2486} {"train_loss": -42.79775619506836, "global_step": 300861, "epoch": 2486} {"train_loss": -43.97132110595703, "global_step": 300862, "epoch": 2486} {"train_loss": -43.5001220703125, "global_step": 300863, "epoch": 2486} {"train_loss": -43.78322982788086, "global_step": 300864, "epoch": 2486} {"train_loss": -43.1168212890625, "global_step": 300865, "epoch": 2486} {"train_loss": -43.80972671508789, "global_step": 300866, "epoch": 2486} {"train_loss": -40.744285583496094, "global_step": 300867, "epoch": 2486} {"train_loss": -43.70711898803711, "global_step": 300868, "epoch": 2486} {"train_loss": -42.458370208740234, "global_step": 300869, "epoch": 2486} {"train_loss": -43.6939582824707, "global_step": 300870, "epoch": 2486} {"train_loss": -42.7057991027832, "global_step": 300871, "epoch": 2486} {"train_loss": -43.92885971069336, "global_step": 300872, "epoch": 2486} {"train_loss": -42.82416915893555, "global_step": 300873, "epoch": 2486} {"train_loss": -42.852542877197266, "global_step": 300874, "epoch": 2486} {"train_loss": -43.487239837646484, "global_step": 300875, "epoch": 2486} {"train_loss": -43.53196716308594, "global_step": 300876, "epoch": 2486} {"train_loss": -42.269832611083984, "global_step": 300877, "epoch": 2486} {"train_loss": -43.035465240478516, "global_step": 300878, "epoch": 2486} {"train_loss": -42.363075256347656, "global_step": 300879, "epoch": 2486} {"train_loss": -41.861572265625, "global_step": 300880, "epoch": 2486} {"train_loss": -44.076961517333984, "global_step": 300881, "epoch": 2486} {"train_loss": -43.26911544799805, "global_step": 300882, "epoch": 2486} {"train_loss": -42.121604919433594, "global_step": 300883, "epoch": 2486} {"train_loss": -43.0319938659668, "global_step": 300884, "epoch": 2486} {"train_loss": -43.60184860229492, "global_step": 300885, "epoch": 2486} {"train_loss": -43.445308685302734, "global_step": 300886, "epoch": 2486} {"train_loss": -43.89323043823242, "global_step": 300887, "epoch": 2486} {"train_loss": -44.34129333496094, "global_step": 300888, "epoch": 2486} {"train_loss": -42.11517333984375, "global_step": 300889, "epoch": 2486} {"train_loss": -43.416839599609375, "global_step": 300890, "epoch": 2486} {"train_loss": -42.0433349609375, "global_step": 300891, "epoch": 2486} {"train_loss": -42.565372467041016, "global_step": 300892, "epoch": 2486} {"train_loss": -41.96001052856445, "global_step": 300893, "epoch": 2486} {"train_loss": -43.079566955566406, "global_step": 300894, "epoch": 2486} {"train_loss": -42.3572998046875, "global_step": 300895, "epoch": 2486} {"train_loss": -42.53728103637695, "global_step": 300896, "epoch": 2486} {"train_loss": -42.99300765991211, "global_step": 300897, "epoch": 2486} {"train_loss": -43.44198226928711, "global_step": 300898, "epoch": 2486} {"train_loss": -42.90434646606445, "global_step": 300899, "epoch": 2486} {"train_loss": -42.43543243408203, "global_step": 300900, "epoch": 2486} {"train_loss": -43.016632080078125, "global_step": 300901, "epoch": 2486} {"train_loss": -42.938446044921875, "global_step": 300902, "epoch": 2486} {"train_loss": -43.02709197998047, "global_step": 300903, "epoch": 2486} {"train_loss": -42.90089416503906, "global_step": 300904, "epoch": 2486} {"train_loss": -43.48546600341797, "global_step": 300905, "epoch": 2486} {"train_loss": -43.79585647583008, "global_step": 300906, "epoch": 2486} {"train_loss": -43.36777877807617, "global_step": 300907, "epoch": 2486} {"train_loss": -42.96161651611328, "global_step": 300908, "epoch": 2486} {"train_loss": -44.264808654785156, "global_step": 300909, "epoch": 2486} {"train_loss": -43.75141143798828, "global_step": 300910, "epoch": 2486} {"train_loss": -43.580413818359375, "global_step": 300911, "epoch": 2486} {"train_loss": -43.89653778076172, "global_step": 300912, "epoch": 2486} {"train_loss": -43.76057434082031, "global_step": 300913, "epoch": 2486} {"train_loss": -42.75144577026367, "global_step": 300914, "epoch": 2486} {"train_loss": -43.488651275634766, "global_step": 300915, "epoch": 2486} {"train_loss": -44.200843811035156, "global_step": 300916, "epoch": 2486} {"train_loss": -44.2307014465332, "global_step": 300917, "epoch": 2486} {"train_loss": -44.1585807800293, "global_step": 300918, "epoch": 2486} {"train_loss": -44.18546676635742, "global_step": 300919, "epoch": 2486} {"train_loss": -44.21485137939453, "global_step": 300920, "epoch": 2486} {"train_loss": -44.37221908569336, "global_step": 300921, "epoch": 2486} {"train_loss": -43.53913879394531, "global_step": 300922, "epoch": 2486} {"train_loss": -44.222225189208984, "global_step": 300923, "epoch": 2486} {"train_loss": -44.538631439208984, "global_step": 300924, "epoch": 2486} {"train_loss": -43.82065963745117, "global_step": 300925, "epoch": 2486} {"train_loss": -42.52326691052145, "global_step": 300926, "epoch": 2486, "val_loss": 2650241.25} {"train_loss": -44.8125114440918, "global_step": 300927, "epoch": 2487} {"train_loss": -44.15848922729492, "global_step": 300928, "epoch": 2487} {"train_loss": -44.08970260620117, "global_step": 300929, "epoch": 2487} {"train_loss": -44.547515869140625, "global_step": 300930, "epoch": 2487} {"train_loss": -44.553260803222656, "global_step": 300931, "epoch": 2487} {"train_loss": -44.286495208740234, "global_step": 300932, "epoch": 2487} {"train_loss": -44.619361877441406, "global_step": 300933, "epoch": 2487} {"train_loss": -44.53459548950195, "global_step": 300934, "epoch": 2487} {"train_loss": -44.348628997802734, "global_step": 300935, "epoch": 2487} {"train_loss": -44.72648239135742, "global_step": 300936, "epoch": 2487} {"train_loss": -43.541988372802734, "global_step": 300937, "epoch": 2487} {"train_loss": -44.16073226928711, "global_step": 300938, "epoch": 2487} {"train_loss": -44.38606262207031, "global_step": 300939, "epoch": 2487} {"train_loss": -44.14251708984375, "global_step": 300940, "epoch": 2487} {"train_loss": -44.88135528564453, "global_step": 300941, "epoch": 2487} {"train_loss": -44.66090774536133, "global_step": 300942, "epoch": 2487} {"train_loss": -44.40409469604492, "global_step": 300943, "epoch": 2487} {"train_loss": -44.42011642456055, "global_step": 300944, "epoch": 2487} {"train_loss": -43.64915084838867, "global_step": 300945, "epoch": 2487} {"train_loss": -44.053260803222656, "global_step": 300946, "epoch": 2487} {"train_loss": -44.96083450317383, "global_step": 300947, "epoch": 2487} {"train_loss": -44.28009033203125, "global_step": 300948, "epoch": 2487} {"train_loss": -43.787933349609375, "global_step": 300949, "epoch": 2487} {"train_loss": -42.144378662109375, "global_step": 300950, "epoch": 2487} {"train_loss": -41.67020797729492, "global_step": 300951, "epoch": 2487} {"train_loss": -40.76303482055664, "global_step": 300952, "epoch": 2487} {"train_loss": -41.40061569213867, "global_step": 300953, "epoch": 2487} {"train_loss": -42.4387092590332, "global_step": 300954, "epoch": 2487} {"train_loss": -44.594112396240234, "global_step": 300955, "epoch": 2487} {"train_loss": -43.72925567626953, "global_step": 300956, "epoch": 2487} {"train_loss": -42.63639450073242, "global_step": 300957, "epoch": 2487} {"train_loss": -43.49853515625, "global_step": 300958, "epoch": 2487} {"train_loss": -43.596378326416016, "global_step": 300959, "epoch": 2487} {"train_loss": -43.848297119140625, "global_step": 300960, "epoch": 2487} {"train_loss": -43.89285659790039, "global_step": 300961, "epoch": 2487} {"train_loss": -44.22688293457031, "global_step": 300962, "epoch": 2487} {"train_loss": -44.09853744506836, "global_step": 300963, "epoch": 2487} {"train_loss": -44.13629150390625, "global_step": 300964, "epoch": 2487} {"train_loss": -44.35186767578125, "global_step": 300965, "epoch": 2487} {"train_loss": -44.601409912109375, "global_step": 300966, "epoch": 2487} {"train_loss": -44.24402618408203, "global_step": 300967, "epoch": 2487} {"train_loss": -44.303035736083984, "global_step": 300968, "epoch": 2487} {"train_loss": -44.375030517578125, "global_step": 300969, "epoch": 2487} {"train_loss": -44.9394416809082, "global_step": 300970, "epoch": 2487} {"train_loss": -45.0992431640625, "global_step": 300971, "epoch": 2487} {"train_loss": -44.22236633300781, "global_step": 300972, "epoch": 2487} {"train_loss": -44.657691955566406, "global_step": 300973, "epoch": 2487} {"train_loss": -44.650814056396484, "global_step": 300974, "epoch": 2487} {"train_loss": -44.541500091552734, "global_step": 300975, "epoch": 2487} {"train_loss": -44.26157760620117, "global_step": 300976, "epoch": 2487} {"train_loss": -44.12158203125, "global_step": 300977, "epoch": 2487} {"train_loss": -44.405269622802734, "global_step": 300978, "epoch": 2487} {"train_loss": -44.18294906616211, "global_step": 300979, "epoch": 2487} {"train_loss": -43.661495208740234, "global_step": 300980, "epoch": 2487} {"train_loss": -44.93806076049805, "global_step": 300981, "epoch": 2487} {"train_loss": -44.62333679199219, "global_step": 300982, "epoch": 2487} {"train_loss": -44.44901657104492, "global_step": 300983, "epoch": 2487} {"train_loss": -44.33856201171875, "global_step": 300984, "epoch": 2487} {"train_loss": -43.57905197143555, "global_step": 300985, "epoch": 2487} {"train_loss": -44.292579650878906, "global_step": 300986, "epoch": 2487} {"train_loss": -43.721256256103516, "global_step": 300987, "epoch": 2487} {"train_loss": -42.450496673583984, "global_step": 300988, "epoch": 2487} {"train_loss": -43.18614959716797, "global_step": 300989, "epoch": 2487} {"train_loss": -38.70134735107422, "global_step": 300990, "epoch": 2487} {"train_loss": -42.425960540771484, "global_step": 300991, "epoch": 2487} {"train_loss": -32.51487350463867, "global_step": 300992, "epoch": 2487} {"train_loss": -41.6715202331543, "global_step": 300993, "epoch": 2487} {"train_loss": -34.13457489013672, "global_step": 300994, "epoch": 2487} {"train_loss": -37.974422454833984, "global_step": 300995, "epoch": 2487} {"train_loss": -37.67655563354492, "global_step": 300996, "epoch": 2487} {"train_loss": -34.96944046020508, "global_step": 300997, "epoch": 2487} {"train_loss": -39.28514862060547, "global_step": 300998, "epoch": 2487} {"train_loss": -34.742156982421875, "global_step": 300999, "epoch": 2487} {"train_loss": -40.855770111083984, "global_step": 301000, "epoch": 2487} {"train_loss": -37.086055755615234, "global_step": 301001, "epoch": 2487} {"train_loss": -38.15565872192383, "global_step": 301002, "epoch": 2487} {"train_loss": -37.41511154174805, "global_step": 301003, "epoch": 2487} {"train_loss": -38.293212890625, "global_step": 301004, "epoch": 2487} {"train_loss": -39.16738510131836, "global_step": 301005, "epoch": 2487} {"train_loss": -38.64368438720703, "global_step": 301006, "epoch": 2487} {"train_loss": -40.541358947753906, "global_step": 301007, "epoch": 2487} {"train_loss": -38.8032112121582, "global_step": 301008, "epoch": 2487} {"train_loss": -39.580989837646484, "global_step": 301009, "epoch": 2487} {"train_loss": -40.74700927734375, "global_step": 301010, "epoch": 2487} {"train_loss": -40.78326416015625, "global_step": 301011, "epoch": 2487} {"train_loss": -40.539398193359375, "global_step": 301012, "epoch": 2487} {"train_loss": -40.51622009277344, "global_step": 301013, "epoch": 2487} {"train_loss": -41.432796478271484, "global_step": 301014, "epoch": 2487} {"train_loss": -40.81095504760742, "global_step": 301015, "epoch": 2487} {"train_loss": -41.66936492919922, "global_step": 301016, "epoch": 2487} {"train_loss": -41.82118225097656, "global_step": 301017, "epoch": 2487} {"train_loss": -40.17161178588867, "global_step": 301018, "epoch": 2487} {"train_loss": -42.555484771728516, "global_step": 301019, "epoch": 2487} {"train_loss": -42.52869415283203, "global_step": 301020, "epoch": 2487} {"train_loss": -41.606719970703125, "global_step": 301021, "epoch": 2487} {"train_loss": -42.12073516845703, "global_step": 301022, "epoch": 2487} {"train_loss": -42.790767669677734, "global_step": 301023, "epoch": 2487} {"train_loss": -42.20995330810547, "global_step": 301024, "epoch": 2487} {"train_loss": -42.4377326965332, "global_step": 301025, "epoch": 2487} {"train_loss": -42.57474899291992, "global_step": 301026, "epoch": 2487} {"train_loss": -42.648067474365234, "global_step": 301027, "epoch": 2487} {"train_loss": -43.28390121459961, "global_step": 301028, "epoch": 2487} {"train_loss": -42.959835052490234, "global_step": 301029, "epoch": 2487} {"train_loss": -42.73563766479492, "global_step": 301030, "epoch": 2487} {"train_loss": -42.99580001831055, "global_step": 301031, "epoch": 2487} {"train_loss": -43.06185531616211, "global_step": 301032, "epoch": 2487} {"train_loss": -43.404659271240234, "global_step": 301033, "epoch": 2487} {"train_loss": -42.811275482177734, "global_step": 301034, "epoch": 2487} {"train_loss": -43.67325973510742, "global_step": 301035, "epoch": 2487} {"train_loss": -42.88503646850586, "global_step": 301036, "epoch": 2487} {"train_loss": -43.461021423339844, "global_step": 301037, "epoch": 2487} {"train_loss": -43.48833084106445, "global_step": 301038, "epoch": 2487} {"train_loss": -43.15359115600586, "global_step": 301039, "epoch": 2487} {"train_loss": -43.880069732666016, "global_step": 301040, "epoch": 2487} {"train_loss": -43.58173751831055, "global_step": 301041, "epoch": 2487} {"train_loss": -43.27643966674805, "global_step": 301042, "epoch": 2487} {"train_loss": -43.67352294921875, "global_step": 301043, "epoch": 2487} {"train_loss": -43.42255783081055, "global_step": 301044, "epoch": 2487} {"train_loss": -44.08760070800781, "global_step": 301045, "epoch": 2487} {"train_loss": -43.18341064453125, "global_step": 301046, "epoch": 2487} {"train_loss": -42.583652937707825, "global_step": 301047, "epoch": 2487, "val_loss": 2544488.0} {"train_loss": -43.9618034362793, "global_step": 301048, "epoch": 2488} {"train_loss": -43.373470306396484, "global_step": 301049, "epoch": 2488} {"train_loss": -44.54098129272461, "global_step": 301050, "epoch": 2488} {"train_loss": -44.12467575073242, "global_step": 301051, "epoch": 2488} {"train_loss": -44.15745162963867, "global_step": 301052, "epoch": 2488} {"train_loss": -44.45925521850586, "global_step": 301053, "epoch": 2488} {"train_loss": -44.100887298583984, "global_step": 301054, "epoch": 2488} {"train_loss": -44.225128173828125, "global_step": 301055, "epoch": 2488} {"train_loss": -44.18952560424805, "global_step": 301056, "epoch": 2488} {"train_loss": -44.19073486328125, "global_step": 301057, "epoch": 2488} {"train_loss": -44.47922897338867, "global_step": 301058, "epoch": 2488} {"train_loss": -44.4783821105957, "global_step": 301059, "epoch": 2488} {"train_loss": -44.28528594970703, "global_step": 301060, "epoch": 2488} {"train_loss": -44.38499450683594, "global_step": 301061, "epoch": 2488} {"train_loss": -44.52095413208008, "global_step": 301062, "epoch": 2488} {"train_loss": -44.24068069458008, "global_step": 301063, "epoch": 2488} {"train_loss": -44.559295654296875, "global_step": 301064, "epoch": 2488} {"train_loss": -44.6552734375, "global_step": 301065, "epoch": 2488} {"train_loss": -44.86350631713867, "global_step": 301066, "epoch": 2488} {"train_loss": -44.747806549072266, "global_step": 301067, "epoch": 2488} {"train_loss": -44.884037017822266, "global_step": 301068, "epoch": 2488} {"train_loss": -45.002349853515625, "global_step": 301069, "epoch": 2488} {"train_loss": -45.0278434753418, "global_step": 301070, "epoch": 2488} {"train_loss": -44.631011962890625, "global_step": 301071, "epoch": 2488} {"train_loss": -44.63905334472656, "global_step": 301072, "epoch": 2488} {"train_loss": -44.840057373046875, "global_step": 301073, "epoch": 2488} {"train_loss": -44.748939514160156, "global_step": 301074, "epoch": 2488} {"train_loss": -44.880462646484375, "global_step": 301075, "epoch": 2488} {"train_loss": -44.98264694213867, "global_step": 301076, "epoch": 2488} {"train_loss": -45.03910446166992, "global_step": 301077, "epoch": 2488} {"train_loss": -44.50025177001953, "global_step": 301078, "epoch": 2488} {"train_loss": -45.34872817993164, "global_step": 301079, "epoch": 2488} {"train_loss": -45.011985778808594, "global_step": 301080, "epoch": 2488} {"train_loss": -45.140384674072266, "global_step": 301081, "epoch": 2488} {"train_loss": -45.06132125854492, "global_step": 301082, "epoch": 2488} {"train_loss": -44.843841552734375, "global_step": 301083, "epoch": 2488} {"train_loss": -44.991268157958984, "global_step": 301084, "epoch": 2488} {"train_loss": -45.336524963378906, "global_step": 301085, "epoch": 2488} {"train_loss": -45.20052719116211, "global_step": 301086, "epoch": 2488} {"train_loss": -44.90277862548828, "global_step": 301087, "epoch": 2488} {"train_loss": -44.65525436401367, "global_step": 301088, "epoch": 2488} {"train_loss": -45.34559631347656, "global_step": 301089, "epoch": 2488} {"train_loss": -45.33246612548828, "global_step": 301090, "epoch": 2488} {"train_loss": -45.00028610229492, "global_step": 301091, "epoch": 2488} {"train_loss": -44.27593994140625, "global_step": 301092, "epoch": 2488} {"train_loss": -42.539058685302734, "global_step": 301093, "epoch": 2488} {"train_loss": -40.25382614135742, "global_step": 301094, "epoch": 2488} {"train_loss": -42.42399215698242, "global_step": 301095, "epoch": 2488} {"train_loss": -44.41288757324219, "global_step": 301096, "epoch": 2488} {"train_loss": -43.88373565673828, "global_step": 301097, "epoch": 2488} {"train_loss": -41.500179290771484, "global_step": 301098, "epoch": 2488} {"train_loss": -43.3139533996582, "global_step": 301099, "epoch": 2488} {"train_loss": -43.00019836425781, "global_step": 301100, "epoch": 2488} {"train_loss": -42.800228118896484, "global_step": 301101, "epoch": 2488} {"train_loss": -44.26862716674805, "global_step": 301102, "epoch": 2488} {"train_loss": -43.63251495361328, "global_step": 301103, "epoch": 2488} {"train_loss": -41.103145599365234, "global_step": 301104, "epoch": 2488} {"train_loss": -43.95330810546875, "global_step": 301105, "epoch": 2488} {"train_loss": -43.23835372924805, "global_step": 301106, "epoch": 2488} {"train_loss": -41.318973541259766, "global_step": 301107, "epoch": 2488} {"train_loss": -43.78516387939453, "global_step": 301108, "epoch": 2488} {"train_loss": -40.40609359741211, "global_step": 301109, "epoch": 2488} {"train_loss": -44.13825225830078, "global_step": 301110, "epoch": 2488} {"train_loss": -41.290157318115234, "global_step": 301111, "epoch": 2488} {"train_loss": -44.007774353027344, "global_step": 301112, "epoch": 2488} {"train_loss": -39.879940032958984, "global_step": 301113, "epoch": 2488} {"train_loss": -43.50874328613281, "global_step": 301114, "epoch": 2488} {"train_loss": -37.95241928100586, "global_step": 301115, "epoch": 2488} {"train_loss": -40.85592269897461, "global_step": 301116, "epoch": 2488} {"train_loss": -42.10553741455078, "global_step": 301117, "epoch": 2488} {"train_loss": -39.99810791015625, "global_step": 301118, "epoch": 2488} {"train_loss": -41.74448776245117, "global_step": 301119, "epoch": 2488} {"train_loss": -40.17406463623047, "global_step": 301120, "epoch": 2488} {"train_loss": -43.509578704833984, "global_step": 301121, "epoch": 2488} {"train_loss": -40.58371353149414, "global_step": 301122, "epoch": 2488} {"train_loss": -43.71039962768555, "global_step": 301123, "epoch": 2488} {"train_loss": -41.11738204956055, "global_step": 301124, "epoch": 2488} {"train_loss": -43.04804611206055, "global_step": 301125, "epoch": 2488} {"train_loss": -41.657020568847656, "global_step": 301126, "epoch": 2488} {"train_loss": -43.22035598754883, "global_step": 301127, "epoch": 2488} {"train_loss": -42.56496047973633, "global_step": 301128, "epoch": 2488} {"train_loss": -43.307167053222656, "global_step": 301129, "epoch": 2488} {"train_loss": -43.3286247253418, "global_step": 301130, "epoch": 2488} {"train_loss": -43.64337921142578, "global_step": 301131, "epoch": 2488} {"train_loss": -43.31037139892578, "global_step": 301132, "epoch": 2488} {"train_loss": -43.671356201171875, "global_step": 301133, "epoch": 2488} {"train_loss": -43.4145393371582, "global_step": 301134, "epoch": 2488} {"train_loss": -43.82039260864258, "global_step": 301135, "epoch": 2488} {"train_loss": -43.443267822265625, "global_step": 301136, "epoch": 2488} {"train_loss": -43.39863967895508, "global_step": 301137, "epoch": 2488} {"train_loss": -42.68561935424805, "global_step": 301138, "epoch": 2488} {"train_loss": -43.95490264892578, "global_step": 301139, "epoch": 2488} {"train_loss": -43.42816162109375, "global_step": 301140, "epoch": 2488} {"train_loss": -43.417842864990234, "global_step": 301141, "epoch": 2488} {"train_loss": -43.55561065673828, "global_step": 301142, "epoch": 2488} {"train_loss": -43.524288177490234, "global_step": 301143, "epoch": 2488} {"train_loss": -43.66429138183594, "global_step": 301144, "epoch": 2488} {"train_loss": -43.79778289794922, "global_step": 301145, "epoch": 2488} {"train_loss": -43.81258010864258, "global_step": 301146, "epoch": 2488} {"train_loss": -43.49392318725586, "global_step": 301147, "epoch": 2488} {"train_loss": -44.28739929199219, "global_step": 301148, "epoch": 2488} {"train_loss": -43.46835708618164, "global_step": 301149, "epoch": 2488} {"train_loss": -44.143211364746094, "global_step": 301150, "epoch": 2488} {"train_loss": -44.305450439453125, "global_step": 301151, "epoch": 2488} {"train_loss": -44.258235931396484, "global_step": 301152, "epoch": 2488} {"train_loss": -43.681026458740234, "global_step": 301153, "epoch": 2488} {"train_loss": -44.07228088378906, "global_step": 301154, "epoch": 2488} {"train_loss": -44.3958740234375, "global_step": 301155, "epoch": 2488} {"train_loss": -44.0936279296875, "global_step": 301156, "epoch": 2488} {"train_loss": -44.08372116088867, "global_step": 301157, "epoch": 2488} {"train_loss": -44.304378509521484, "global_step": 301158, "epoch": 2488} {"train_loss": -43.40013885498047, "global_step": 301159, "epoch": 2488} {"train_loss": -43.815364837646484, "global_step": 301160, "epoch": 2488} {"train_loss": -43.97465133666992, "global_step": 301161, "epoch": 2488} {"train_loss": -44.42618179321289, "global_step": 301162, "epoch": 2488} {"train_loss": -43.86729049682617, "global_step": 301163, "epoch": 2488} {"train_loss": -44.9869384765625, "global_step": 301164, "epoch": 2488} {"train_loss": -44.292388916015625, "global_step": 301165, "epoch": 2488} {"train_loss": -44.4659309387207, "global_step": 301166, "epoch": 2488} {"train_loss": -44.27840042114258, "global_step": 301167, "epoch": 2488} {"train_loss": -43.678079999182835, "global_step": 301168, "epoch": 2488, "val_loss": 2639325.75} {"train_loss": -44.32783126831055, "global_step": 301169, "epoch": 2489} {"train_loss": -44.35517501831055, "global_step": 301170, "epoch": 2489} {"train_loss": -44.98784255981445, "global_step": 301171, "epoch": 2489} {"train_loss": -44.51740264892578, "global_step": 301172, "epoch": 2489} {"train_loss": -43.653656005859375, "global_step": 301173, "epoch": 2489} {"train_loss": -44.186866760253906, "global_step": 301174, "epoch": 2489} {"train_loss": -44.55803680419922, "global_step": 301175, "epoch": 2489} {"train_loss": -43.47162628173828, "global_step": 301176, "epoch": 2489} {"train_loss": -43.596736907958984, "global_step": 301177, "epoch": 2489} {"train_loss": -44.18562698364258, "global_step": 301178, "epoch": 2489} {"train_loss": -43.95207595825195, "global_step": 301179, "epoch": 2489} {"train_loss": -42.48812484741211, "global_step": 301180, "epoch": 2489} {"train_loss": -43.384517669677734, "global_step": 301181, "epoch": 2489} {"train_loss": -43.86355972290039, "global_step": 301182, "epoch": 2489} {"train_loss": -42.652198791503906, "global_step": 301183, "epoch": 2489} {"train_loss": -42.918304443359375, "global_step": 301184, "epoch": 2489} {"train_loss": -43.695289611816406, "global_step": 301185, "epoch": 2489} {"train_loss": -43.553810119628906, "global_step": 301186, "epoch": 2489} {"train_loss": -42.77657699584961, "global_step": 301187, "epoch": 2489} {"train_loss": -43.41362762451172, "global_step": 301188, "epoch": 2489} {"train_loss": -43.86719512939453, "global_step": 301189, "epoch": 2489} {"train_loss": -44.44572448730469, "global_step": 301190, "epoch": 2489} {"train_loss": -43.64811325073242, "global_step": 301191, "epoch": 2489} {"train_loss": -43.87267303466797, "global_step": 301192, "epoch": 2489} {"train_loss": -44.25368881225586, "global_step": 301193, "epoch": 2489} {"train_loss": -44.188690185546875, "global_step": 301194, "epoch": 2489} {"train_loss": -43.90671157836914, "global_step": 301195, "epoch": 2489} {"train_loss": -43.8668098449707, "global_step": 301196, "epoch": 2489} {"train_loss": -43.56240463256836, "global_step": 301197, "epoch": 2489} {"train_loss": -42.86003494262695, "global_step": 301198, "epoch": 2489} {"train_loss": -44.04767990112305, "global_step": 301199, "epoch": 2489} {"train_loss": -43.62275314331055, "global_step": 301200, "epoch": 2489} {"train_loss": -44.625980377197266, "global_step": 301201, "epoch": 2489} {"train_loss": -43.988075256347656, "global_step": 301202, "epoch": 2489} {"train_loss": -43.635040283203125, "global_step": 301203, "epoch": 2489} {"train_loss": -43.881629943847656, "global_step": 301204, "epoch": 2489} {"train_loss": -44.23432540893555, "global_step": 301205, "epoch": 2489} {"train_loss": -43.470035552978516, "global_step": 301206, "epoch": 2489} {"train_loss": -42.80934143066406, "global_step": 301207, "epoch": 2489} {"train_loss": -43.71010208129883, "global_step": 301208, "epoch": 2489} {"train_loss": -43.78995895385742, "global_step": 301209, "epoch": 2489} {"train_loss": -44.43930435180664, "global_step": 301210, "epoch": 2489} {"train_loss": -43.6558723449707, "global_step": 301211, "epoch": 2489} {"train_loss": -43.528141021728516, "global_step": 301212, "epoch": 2489} {"train_loss": -42.63376235961914, "global_step": 301213, "epoch": 2489} {"train_loss": -42.509193420410156, "global_step": 301214, "epoch": 2489} {"train_loss": -43.38250732421875, "global_step": 301215, "epoch": 2489} {"train_loss": -43.801124572753906, "global_step": 301216, "epoch": 2489} {"train_loss": -42.31563949584961, "global_step": 301217, "epoch": 2489} {"train_loss": -43.55048370361328, "global_step": 301218, "epoch": 2489} {"train_loss": -43.35378646850586, "global_step": 301219, "epoch": 2489} {"train_loss": -43.62799835205078, "global_step": 301220, "epoch": 2489} {"train_loss": -44.1551399230957, "global_step": 301221, "epoch": 2489} {"train_loss": -43.060123443603516, "global_step": 301222, "epoch": 2489} {"train_loss": -42.32139205932617, "global_step": 301223, "epoch": 2489} {"train_loss": -43.177974700927734, "global_step": 301224, "epoch": 2489} {"train_loss": -44.14384078979492, "global_step": 301225, "epoch": 2489} {"train_loss": -43.1281852722168, "global_step": 301226, "epoch": 2489} {"train_loss": -41.98753356933594, "global_step": 301227, "epoch": 2489} {"train_loss": -43.06059265136719, "global_step": 301228, "epoch": 2489} {"train_loss": -44.42379379272461, "global_step": 301229, "epoch": 2489} {"train_loss": -43.57090377807617, "global_step": 301230, "epoch": 2489} {"train_loss": -43.14065933227539, "global_step": 301231, "epoch": 2489} {"train_loss": -44.05715560913086, "global_step": 301232, "epoch": 2489} {"train_loss": -43.82015609741211, "global_step": 301233, "epoch": 2489} {"train_loss": -40.72149658203125, "global_step": 301234, "epoch": 2489} {"train_loss": -44.22224044799805, "global_step": 301235, "epoch": 2489} {"train_loss": -41.60908889770508, "global_step": 301236, "epoch": 2489} {"train_loss": -41.32160568237305, "global_step": 301237, "epoch": 2489} {"train_loss": -42.1033821105957, "global_step": 301238, "epoch": 2489} {"train_loss": -41.39543151855469, "global_step": 301239, "epoch": 2489} {"train_loss": -43.11561584472656, "global_step": 301240, "epoch": 2489} {"train_loss": -42.162086486816406, "global_step": 301241, "epoch": 2489} {"train_loss": -42.53704833984375, "global_step": 301242, "epoch": 2489} {"train_loss": -43.38294219970703, "global_step": 301243, "epoch": 2489} {"train_loss": -41.8116455078125, "global_step": 301244, "epoch": 2489} {"train_loss": -42.69963455200195, "global_step": 301245, "epoch": 2489} {"train_loss": -42.21675491333008, "global_step": 301246, "epoch": 2489} {"train_loss": -44.67434310913086, "global_step": 301247, "epoch": 2489} {"train_loss": -42.8571891784668, "global_step": 301248, "epoch": 2489} {"train_loss": -41.06605911254883, "global_step": 301249, "epoch": 2489} {"train_loss": -43.79503631591797, "global_step": 301250, "epoch": 2489} {"train_loss": -43.00568771362305, "global_step": 301251, "epoch": 2489} {"train_loss": -41.8266487121582, "global_step": 301252, "epoch": 2489} {"train_loss": -43.97195053100586, "global_step": 301253, "epoch": 2489} {"train_loss": -41.88508987426758, "global_step": 301254, "epoch": 2489} {"train_loss": -43.83890914916992, "global_step": 301255, "epoch": 2489} {"train_loss": -42.36527633666992, "global_step": 301256, "epoch": 2489} {"train_loss": -42.96717071533203, "global_step": 301257, "epoch": 2489} {"train_loss": -43.9037971496582, "global_step": 301258, "epoch": 2489} {"train_loss": -43.225440979003906, "global_step": 301259, "epoch": 2489} {"train_loss": -43.84795379638672, "global_step": 301260, "epoch": 2489} {"train_loss": -43.93074417114258, "global_step": 301261, "epoch": 2489} {"train_loss": -43.71586990356445, "global_step": 301262, "epoch": 2489} {"train_loss": -44.20078659057617, "global_step": 301263, "epoch": 2489} {"train_loss": -44.31350326538086, "global_step": 301264, "epoch": 2489} {"train_loss": -44.158477783203125, "global_step": 301265, "epoch": 2489} {"train_loss": -44.493316650390625, "global_step": 301266, "epoch": 2489} {"train_loss": -44.19233322143555, "global_step": 301267, "epoch": 2489} {"train_loss": -44.173248291015625, "global_step": 301268, "epoch": 2489} {"train_loss": -44.06077194213867, "global_step": 301269, "epoch": 2489} {"train_loss": -44.20355987548828, "global_step": 301270, "epoch": 2489} {"train_loss": -43.59647750854492, "global_step": 301271, "epoch": 2489} {"train_loss": -44.434871673583984, "global_step": 301272, "epoch": 2489} {"train_loss": -44.123451232910156, "global_step": 301273, "epoch": 2489} {"train_loss": -43.8203010559082, "global_step": 301274, "epoch": 2489} {"train_loss": -44.257591247558594, "global_step": 301275, "epoch": 2489} {"train_loss": -43.79707336425781, "global_step": 301276, "epoch": 2489} {"train_loss": -43.628662109375, "global_step": 301277, "epoch": 2489} {"train_loss": -43.906375885009766, "global_step": 301278, "epoch": 2489} {"train_loss": -44.775360107421875, "global_step": 301279, "epoch": 2489} {"train_loss": -43.60299301147461, "global_step": 301280, "epoch": 2489} {"train_loss": -42.959808349609375, "global_step": 301281, "epoch": 2489} {"train_loss": -43.117713928222656, "global_step": 301282, "epoch": 2489} {"train_loss": -44.14376449584961, "global_step": 301283, "epoch": 2489} {"train_loss": -44.11564636230469, "global_step": 301284, "epoch": 2489} {"train_loss": -43.886905670166016, "global_step": 301285, "epoch": 2489} {"train_loss": -43.94771957397461, "global_step": 301286, "epoch": 2489} {"train_loss": -44.85841751098633, "global_step": 301287, "epoch": 2489} {"train_loss": -43.48728942871094, "global_step": 301288, "epoch": 2489} {"train_loss": -43.50099513156355, "global_step": 301289, "epoch": 2489, "val_loss": 2575074.5} {"train_loss": -44.611114501953125, "global_step": 301290, "epoch": 2490} {"train_loss": -44.39445114135742, "global_step": 301291, "epoch": 2490} {"train_loss": -44.15733337402344, "global_step": 301292, "epoch": 2490} {"train_loss": -44.63922882080078, "global_step": 301293, "epoch": 2490} {"train_loss": -44.27006149291992, "global_step": 301294, "epoch": 2490} {"train_loss": -43.95724105834961, "global_step": 301295, "epoch": 2490} {"train_loss": -44.161537170410156, "global_step": 301296, "epoch": 2490} {"train_loss": -44.68535232543945, "global_step": 301297, "epoch": 2490} {"train_loss": -44.1628532409668, "global_step": 301298, "epoch": 2490} {"train_loss": -44.077613830566406, "global_step": 301299, "epoch": 2490} {"train_loss": -44.6392936706543, "global_step": 301300, "epoch": 2490} {"train_loss": -44.719459533691406, "global_step": 301301, "epoch": 2490} {"train_loss": -44.43598556518555, "global_step": 301302, "epoch": 2490} {"train_loss": -44.2532958984375, "global_step": 301303, "epoch": 2490} {"train_loss": -44.53687286376953, "global_step": 301304, "epoch": 2490} {"train_loss": -44.63705825805664, "global_step": 301305, "epoch": 2490} {"train_loss": -45.02350616455078, "global_step": 301306, "epoch": 2490} {"train_loss": -44.66157150268555, "global_step": 301307, "epoch": 2490} {"train_loss": -44.17375564575195, "global_step": 301308, "epoch": 2490} {"train_loss": -44.706905364990234, "global_step": 301309, "epoch": 2490} {"train_loss": -45.27348709106445, "global_step": 301310, "epoch": 2490} {"train_loss": -44.53586196899414, "global_step": 301311, "epoch": 2490} {"train_loss": -44.99872970581055, "global_step": 301312, "epoch": 2490} {"train_loss": -44.762184143066406, "global_step": 301313, "epoch": 2490} {"train_loss": -44.587947845458984, "global_step": 301314, "epoch": 2490} {"train_loss": -44.44890213012695, "global_step": 301315, "epoch": 2490} {"train_loss": -45.25093078613281, "global_step": 301316, "epoch": 2490} {"train_loss": -44.63332748413086, "global_step": 301317, "epoch": 2490} {"train_loss": -43.295719146728516, "global_step": 301318, "epoch": 2490} {"train_loss": -43.39767074584961, "global_step": 301319, "epoch": 2490} {"train_loss": -44.14076232910156, "global_step": 301320, "epoch": 2490} {"train_loss": -43.498294830322266, "global_step": 301321, "epoch": 2490} {"train_loss": -44.49055099487305, "global_step": 301322, "epoch": 2490} {"train_loss": -43.016876220703125, "global_step": 301323, "epoch": 2490} {"train_loss": -40.572689056396484, "global_step": 301324, "epoch": 2490} {"train_loss": -42.505428314208984, "global_step": 301325, "epoch": 2490} {"train_loss": -38.1465950012207, "global_step": 301326, "epoch": 2490} {"train_loss": -40.77656936645508, "global_step": 301327, "epoch": 2490} {"train_loss": -41.00605010986328, "global_step": 301328, "epoch": 2490} {"train_loss": -40.4180793762207, "global_step": 301329, "epoch": 2490} {"train_loss": -39.268531799316406, "global_step": 301330, "epoch": 2490} {"train_loss": -40.975643157958984, "global_step": 301331, "epoch": 2490} {"train_loss": -39.881011962890625, "global_step": 301332, "epoch": 2490} {"train_loss": -41.289146423339844, "global_step": 301333, "epoch": 2490} {"train_loss": -40.2713623046875, "global_step": 301334, "epoch": 2490} {"train_loss": -42.75885772705078, "global_step": 301335, "epoch": 2490} {"train_loss": -39.8427734375, "global_step": 301336, "epoch": 2490} {"train_loss": -42.3072395324707, "global_step": 301337, "epoch": 2490} {"train_loss": -41.05129623413086, "global_step": 301338, "epoch": 2490} {"train_loss": -41.34514236450195, "global_step": 301339, "epoch": 2490} {"train_loss": -41.05608367919922, "global_step": 301340, "epoch": 2490} {"train_loss": -42.1041259765625, "global_step": 301341, "epoch": 2490} {"train_loss": -40.16524124145508, "global_step": 301342, "epoch": 2490} {"train_loss": -42.3181266784668, "global_step": 301343, "epoch": 2490} {"train_loss": -41.33363723754883, "global_step": 301344, "epoch": 2490} {"train_loss": -41.97159957885742, "global_step": 301345, "epoch": 2490} {"train_loss": -41.79194259643555, "global_step": 301346, "epoch": 2490} {"train_loss": -41.37484359741211, "global_step": 301347, "epoch": 2490} {"train_loss": -42.04763412475586, "global_step": 301348, "epoch": 2490} {"train_loss": -42.7244987487793, "global_step": 301349, "epoch": 2490} {"train_loss": -40.94448471069336, "global_step": 301350, "epoch": 2490} {"train_loss": -42.35801696777344, "global_step": 301351, "epoch": 2490} {"train_loss": -43.1826286315918, "global_step": 301352, "epoch": 2490} {"train_loss": -42.01383590698242, "global_step": 301353, "epoch": 2490} {"train_loss": -42.52632522583008, "global_step": 301354, "epoch": 2490} {"train_loss": -43.6955680847168, "global_step": 301355, "epoch": 2490} {"train_loss": -43.288177490234375, "global_step": 301356, "epoch": 2490} {"train_loss": -43.85398483276367, "global_step": 301357, "epoch": 2490} {"train_loss": -42.804718017578125, "global_step": 301358, "epoch": 2490} {"train_loss": -44.18148422241211, "global_step": 301359, "epoch": 2490} {"train_loss": -42.97482681274414, "global_step": 301360, "epoch": 2490} {"train_loss": -42.65877914428711, "global_step": 301361, "epoch": 2490} {"train_loss": -43.44416427612305, "global_step": 301362, "epoch": 2490} {"train_loss": -43.4525032043457, "global_step": 301363, "epoch": 2490} {"train_loss": -42.61396408081055, "global_step": 301364, "epoch": 2490} {"train_loss": -43.223907470703125, "global_step": 301365, "epoch": 2490} {"train_loss": -44.19374084472656, "global_step": 301366, "epoch": 2490} {"train_loss": -42.75349044799805, "global_step": 301367, "epoch": 2490} {"train_loss": -43.9334716796875, "global_step": 301368, "epoch": 2490} {"train_loss": -43.44203186035156, "global_step": 301369, "epoch": 2490} {"train_loss": -43.88763427734375, "global_step": 301370, "epoch": 2490} {"train_loss": -44.011043548583984, "global_step": 301371, "epoch": 2490} {"train_loss": -43.44465255737305, "global_step": 301372, "epoch": 2490} {"train_loss": -44.01273727416992, "global_step": 301373, "epoch": 2490} {"train_loss": -43.875732421875, "global_step": 301374, "epoch": 2490} {"train_loss": -44.06480407714844, "global_step": 301375, "epoch": 2490} {"train_loss": -44.01427459716797, "global_step": 301376, "epoch": 2490} {"train_loss": -43.83482360839844, "global_step": 301377, "epoch": 2490} {"train_loss": -43.75895309448242, "global_step": 301378, "epoch": 2490} {"train_loss": -43.41011047363281, "global_step": 301379, "epoch": 2490} {"train_loss": -43.76266098022461, "global_step": 301380, "epoch": 2490} {"train_loss": -44.33405685424805, "global_step": 301381, "epoch": 2490} {"train_loss": -44.34309768676758, "global_step": 301382, "epoch": 2490} {"train_loss": -44.670040130615234, "global_step": 301383, "epoch": 2490} {"train_loss": -44.52760314941406, "global_step": 301384, "epoch": 2490} {"train_loss": -43.53273010253906, "global_step": 301385, "epoch": 2490} {"train_loss": -44.10346221923828, "global_step": 301386, "epoch": 2490} {"train_loss": -44.3758544921875, "global_step": 301387, "epoch": 2490} {"train_loss": -43.934688568115234, "global_step": 301388, "epoch": 2490} {"train_loss": -43.629730224609375, "global_step": 301389, "epoch": 2490} {"train_loss": -44.096981048583984, "global_step": 301390, "epoch": 2490} {"train_loss": -44.375831604003906, "global_step": 301391, "epoch": 2490} {"train_loss": -44.213905334472656, "global_step": 301392, "epoch": 2490} {"train_loss": -44.6749382019043, "global_step": 301393, "epoch": 2490} {"train_loss": -44.871273040771484, "global_step": 301394, "epoch": 2490} {"train_loss": -44.20829391479492, "global_step": 301395, "epoch": 2490} {"train_loss": -44.17652130126953, "global_step": 301396, "epoch": 2490} {"train_loss": -44.6505241394043, "global_step": 301397, "epoch": 2490} {"train_loss": -44.32496643066406, "global_step": 301398, "epoch": 2490} {"train_loss": -44.7601432800293, "global_step": 301399, "epoch": 2490} {"train_loss": -44.57069778442383, "global_step": 301400, "epoch": 2490} {"train_loss": -44.54273223876953, "global_step": 301401, "epoch": 2490} {"train_loss": -44.5003547668457, "global_step": 301402, "epoch": 2490} {"train_loss": -44.50393295288086, "global_step": 301403, "epoch": 2490} {"train_loss": -43.96315383911133, "global_step": 301404, "epoch": 2490} {"train_loss": -44.60548782348633, "global_step": 301405, "epoch": 2490} {"train_loss": -45.07892608642578, "global_step": 301406, "epoch": 2490} {"train_loss": -43.99576950073242, "global_step": 301407, "epoch": 2490} {"train_loss": -43.911983489990234, "global_step": 301408, "epoch": 2490} {"train_loss": -42.0870361328125, "global_step": 301409, "epoch": 2490} {"train_loss": -43.38612807092588, "global_step": 301410, "epoch": 2490, "val_loss": 2519190.0} {"train_loss": -44.30898666381836, "global_step": 301411, "epoch": 2491} {"train_loss": -42.99739456176758, "global_step": 301412, "epoch": 2491} {"train_loss": -44.24836349487305, "global_step": 301413, "epoch": 2491} {"train_loss": -43.795692443847656, "global_step": 301414, "epoch": 2491} {"train_loss": -44.24079132080078, "global_step": 301415, "epoch": 2491} {"train_loss": -44.6231689453125, "global_step": 301416, "epoch": 2491} {"train_loss": -43.33502197265625, "global_step": 301417, "epoch": 2491} {"train_loss": -41.531227111816406, "global_step": 301418, "epoch": 2491} {"train_loss": -44.33486557006836, "global_step": 301419, "epoch": 2491} {"train_loss": -40.82598876953125, "global_step": 301420, "epoch": 2491} {"train_loss": -44.10360336303711, "global_step": 301421, "epoch": 2491} {"train_loss": -43.497737884521484, "global_step": 301422, "epoch": 2491} {"train_loss": -41.37984848022461, "global_step": 301423, "epoch": 2491} {"train_loss": -44.14110565185547, "global_step": 301424, "epoch": 2491} {"train_loss": -43.04970169067383, "global_step": 301425, "epoch": 2491} {"train_loss": -41.16279983520508, "global_step": 301426, "epoch": 2491} {"train_loss": -41.65682601928711, "global_step": 301427, "epoch": 2491} {"train_loss": -39.791770935058594, "global_step": 301428, "epoch": 2491} {"train_loss": -40.9443473815918, "global_step": 301429, "epoch": 2491} {"train_loss": -42.92210388183594, "global_step": 301430, "epoch": 2491} {"train_loss": -41.72623825073242, "global_step": 301431, "epoch": 2491} {"train_loss": -40.87986373901367, "global_step": 301432, "epoch": 2491} {"train_loss": -41.62890625, "global_step": 301433, "epoch": 2491} {"train_loss": -41.55842971801758, "global_step": 301434, "epoch": 2491} {"train_loss": -41.82246017456055, "global_step": 301435, "epoch": 2491} {"train_loss": -39.931724548339844, "global_step": 301436, "epoch": 2491} {"train_loss": -41.90336227416992, "global_step": 301437, "epoch": 2491} {"train_loss": -41.175533294677734, "global_step": 301438, "epoch": 2491} {"train_loss": -40.465911865234375, "global_step": 301439, "epoch": 2491} {"train_loss": -42.853538513183594, "global_step": 301440, "epoch": 2491} {"train_loss": -41.09353256225586, "global_step": 301441, "epoch": 2491} {"train_loss": -42.617244720458984, "global_step": 301442, "epoch": 2491} {"train_loss": -42.84498596191406, "global_step": 301443, "epoch": 2491} {"train_loss": -42.487545013427734, "global_step": 301444, "epoch": 2491} {"train_loss": -43.011688232421875, "global_step": 301445, "epoch": 2491} {"train_loss": -42.663414001464844, "global_step": 301446, "epoch": 2491} {"train_loss": -42.80268096923828, "global_step": 301447, "epoch": 2491} {"train_loss": -43.22107696533203, "global_step": 301448, "epoch": 2491} {"train_loss": -43.829036712646484, "global_step": 301449, "epoch": 2491} {"train_loss": -43.00552749633789, "global_step": 301450, "epoch": 2491} {"train_loss": -43.55253219604492, "global_step": 301451, "epoch": 2491} {"train_loss": -42.298160552978516, "global_step": 301452, "epoch": 2491} {"train_loss": -43.607704162597656, "global_step": 301453, "epoch": 2491} {"train_loss": -43.20682907104492, "global_step": 301454, "epoch": 2491} {"train_loss": -43.737892150878906, "global_step": 301455, "epoch": 2491} {"train_loss": -43.34373092651367, "global_step": 301456, "epoch": 2491} {"train_loss": -43.82844543457031, "global_step": 301457, "epoch": 2491} {"train_loss": -43.64644241333008, "global_step": 301458, "epoch": 2491} {"train_loss": -43.34345626831055, "global_step": 301459, "epoch": 2491} {"train_loss": -44.29044723510742, "global_step": 301460, "epoch": 2491} {"train_loss": -43.026302337646484, "global_step": 301461, "epoch": 2491} {"train_loss": -43.68014144897461, "global_step": 301462, "epoch": 2491} {"train_loss": -43.988311767578125, "global_step": 301463, "epoch": 2491} {"train_loss": -43.81711196899414, "global_step": 301464, "epoch": 2491} {"train_loss": -43.84518051147461, "global_step": 301465, "epoch": 2491} {"train_loss": -44.308250427246094, "global_step": 301466, "epoch": 2491} {"train_loss": -43.55828857421875, "global_step": 301467, "epoch": 2491} {"train_loss": -44.29690933227539, "global_step": 301468, "epoch": 2491} {"train_loss": -44.02101516723633, "global_step": 301469, "epoch": 2491} {"train_loss": -44.26694869995117, "global_step": 301470, "epoch": 2491} {"train_loss": -44.20948028564453, "global_step": 301471, "epoch": 2491} {"train_loss": -44.4233283996582, "global_step": 301472, "epoch": 2491} {"train_loss": -44.19646072387695, "global_step": 301473, "epoch": 2491} {"train_loss": -44.7432975769043, "global_step": 301474, "epoch": 2491} {"train_loss": -44.628173828125, "global_step": 301475, "epoch": 2491} {"train_loss": -44.536983489990234, "global_step": 301476, "epoch": 2491} {"train_loss": -44.7757568359375, "global_step": 301477, "epoch": 2491} {"train_loss": -44.442718505859375, "global_step": 301478, "epoch": 2491} {"train_loss": -44.85599899291992, "global_step": 301479, "epoch": 2491} {"train_loss": -44.95693588256836, "global_step": 301480, "epoch": 2491} {"train_loss": -45.031288146972656, "global_step": 301481, "epoch": 2491} {"train_loss": -44.90419387817383, "global_step": 301482, "epoch": 2491} {"train_loss": -44.9787712097168, "global_step": 301483, "epoch": 2491} {"train_loss": -45.09451675415039, "global_step": 301484, "epoch": 2491} {"train_loss": -44.90776443481445, "global_step": 301485, "epoch": 2491} {"train_loss": -44.734352111816406, "global_step": 301486, "epoch": 2491} {"train_loss": -44.96515655517578, "global_step": 301487, "epoch": 2491} {"train_loss": -44.75789260864258, "global_step": 301488, "epoch": 2491} {"train_loss": -44.79539108276367, "global_step": 301489, "epoch": 2491} {"train_loss": -44.58749008178711, "global_step": 301490, "epoch": 2491} {"train_loss": -44.9177131652832, "global_step": 301491, "epoch": 2491} {"train_loss": -45.21217727661133, "global_step": 301492, "epoch": 2491} {"train_loss": -45.06064224243164, "global_step": 301493, "epoch": 2491} {"train_loss": -45.18265914916992, "global_step": 301494, "epoch": 2491} {"train_loss": -45.04533004760742, "global_step": 301495, "epoch": 2491} {"train_loss": -44.88346481323242, "global_step": 301496, "epoch": 2491} {"train_loss": -45.35038375854492, "global_step": 301497, "epoch": 2491} {"train_loss": -45.54290771484375, "global_step": 301498, "epoch": 2491} {"train_loss": -45.3680534362793, "global_step": 301499, "epoch": 2491} {"train_loss": -45.26278305053711, "global_step": 301500, "epoch": 2491} {"train_loss": -45.391082763671875, "global_step": 301501, "epoch": 2491} {"train_loss": -44.93146896362305, "global_step": 301502, "epoch": 2491} {"train_loss": -44.38430404663086, "global_step": 301503, "epoch": 2491} {"train_loss": -45.538330078125, "global_step": 301504, "epoch": 2491} {"train_loss": -44.7889404296875, "global_step": 301505, "epoch": 2491} {"train_loss": -44.902706146240234, "global_step": 301506, "epoch": 2491} {"train_loss": -43.74726104736328, "global_step": 301507, "epoch": 2491} {"train_loss": -42.658023834228516, "global_step": 301508, "epoch": 2491} {"train_loss": -38.9669075012207, "global_step": 301509, "epoch": 2491} {"train_loss": -37.69752883911133, "global_step": 301510, "epoch": 2491} {"train_loss": -40.525909423828125, "global_step": 301511, "epoch": 2491} {"train_loss": -40.598228454589844, "global_step": 301512, "epoch": 2491} {"train_loss": -38.6301383972168, "global_step": 301513, "epoch": 2491} {"train_loss": -40.037410736083984, "global_step": 301514, "epoch": 2491} {"train_loss": -40.01017761230469, "global_step": 301515, "epoch": 2491} {"train_loss": -39.506099700927734, "global_step": 301516, "epoch": 2491} {"train_loss": -41.13804244995117, "global_step": 301517, "epoch": 2491} {"train_loss": -40.96728515625, "global_step": 301518, "epoch": 2491} {"train_loss": -40.29048156738281, "global_step": 301519, "epoch": 2491} {"train_loss": -40.56470489501953, "global_step": 301520, "epoch": 2491} {"train_loss": -40.561763763427734, "global_step": 301521, "epoch": 2491} {"train_loss": -41.646942138671875, "global_step": 301522, "epoch": 2491} {"train_loss": -41.17171096801758, "global_step": 301523, "epoch": 2491} {"train_loss": -40.8691520690918, "global_step": 301524, "epoch": 2491} {"train_loss": -40.9283561706543, "global_step": 301525, "epoch": 2491} {"train_loss": -40.69330596923828, "global_step": 301526, "epoch": 2491} {"train_loss": -40.99916458129883, "global_step": 301527, "epoch": 2491} {"train_loss": -41.375518798828125, "global_step": 301528, "epoch": 2491} {"train_loss": -41.216094970703125, "global_step": 301529, "epoch": 2491} {"train_loss": -41.7266960144043, "global_step": 301530, "epoch": 2491} {"train_loss": -43.02865001583888, "global_step": 301531, "epoch": 2491, "val_loss": 2627601.0} {"train_loss": -42.59881591796875, "global_step": 301532, "epoch": 2492} {"train_loss": -42.09737777709961, "global_step": 301533, "epoch": 2492} {"train_loss": -42.656002044677734, "global_step": 301534, "epoch": 2492} {"train_loss": -42.89297866821289, "global_step": 301535, "epoch": 2492} {"train_loss": -43.22979736328125, "global_step": 301536, "epoch": 2492} {"train_loss": -43.24238967895508, "global_step": 301537, "epoch": 2492} {"train_loss": -43.66822814941406, "global_step": 301538, "epoch": 2492} {"train_loss": -43.0771598815918, "global_step": 301539, "epoch": 2492} {"train_loss": -43.42794418334961, "global_step": 301540, "epoch": 2492} {"train_loss": -43.8128547668457, "global_step": 301541, "epoch": 2492} {"train_loss": -43.2005729675293, "global_step": 301542, "epoch": 2492} {"train_loss": -43.259368896484375, "global_step": 301543, "epoch": 2492} {"train_loss": -44.091285705566406, "global_step": 301544, "epoch": 2492} {"train_loss": -42.95685958862305, "global_step": 301545, "epoch": 2492} {"train_loss": -44.0744514465332, "global_step": 301546, "epoch": 2492} {"train_loss": -43.67853927612305, "global_step": 301547, "epoch": 2492} {"train_loss": -43.996395111083984, "global_step": 301548, "epoch": 2492} {"train_loss": -42.299686431884766, "global_step": 301549, "epoch": 2492} {"train_loss": -43.357704162597656, "global_step": 301550, "epoch": 2492} {"train_loss": -41.863487243652344, "global_step": 301551, "epoch": 2492} {"train_loss": -42.225765228271484, "global_step": 301552, "epoch": 2492} {"train_loss": -43.094810485839844, "global_step": 301553, "epoch": 2492} {"train_loss": -42.058197021484375, "global_step": 301554, "epoch": 2492} {"train_loss": -42.27021408081055, "global_step": 301555, "epoch": 2492} {"train_loss": -42.69974899291992, "global_step": 301556, "epoch": 2492} {"train_loss": -40.275184631347656, "global_step": 301557, "epoch": 2492} {"train_loss": -37.934547424316406, "global_step": 301558, "epoch": 2492} {"train_loss": -39.77836227416992, "global_step": 301559, "epoch": 2492} {"train_loss": -40.39973068237305, "global_step": 301560, "epoch": 2492} {"train_loss": -38.77193069458008, "global_step": 301561, "epoch": 2492} {"train_loss": -41.470848083496094, "global_step": 301562, "epoch": 2492} {"train_loss": -41.48921585083008, "global_step": 301563, "epoch": 2492} {"train_loss": -40.19413375854492, "global_step": 301564, "epoch": 2492} {"train_loss": -36.237003326416016, "global_step": 301565, "epoch": 2492} {"train_loss": -32.91427230834961, "global_step": 301566, "epoch": 2492} {"train_loss": -35.80607604980469, "global_step": 301567, "epoch": 2492} {"train_loss": -38.59376907348633, "global_step": 301568, "epoch": 2492} {"train_loss": -38.38709259033203, "global_step": 301569, "epoch": 2492} {"train_loss": -34.4871826171875, "global_step": 301570, "epoch": 2492} {"train_loss": -37.93040466308594, "global_step": 301571, "epoch": 2492} {"train_loss": -37.040950775146484, "global_step": 301572, "epoch": 2492} {"train_loss": -35.73516082763672, "global_step": 301573, "epoch": 2492} {"train_loss": -37.009220123291016, "global_step": 301574, "epoch": 2492} {"train_loss": -39.27738571166992, "global_step": 301575, "epoch": 2492} {"train_loss": -37.73053741455078, "global_step": 301576, "epoch": 2492} {"train_loss": -40.69633102416992, "global_step": 301577, "epoch": 2492} {"train_loss": -37.425533294677734, "global_step": 301578, "epoch": 2492} {"train_loss": -40.59212112426758, "global_step": 301579, "epoch": 2492} {"train_loss": -37.96732711791992, "global_step": 301580, "epoch": 2492} {"train_loss": -38.69978713989258, "global_step": 301581, "epoch": 2492} {"train_loss": -40.45559310913086, "global_step": 301582, "epoch": 2492} {"train_loss": -38.962799072265625, "global_step": 301583, "epoch": 2492} {"train_loss": -40.13534164428711, "global_step": 301584, "epoch": 2492} {"train_loss": -39.204872131347656, "global_step": 301585, "epoch": 2492} {"train_loss": -41.73234939575195, "global_step": 301586, "epoch": 2492} {"train_loss": -41.02339172363281, "global_step": 301587, "epoch": 2492} {"train_loss": -42.687557220458984, "global_step": 301588, "epoch": 2492} {"train_loss": -41.040279388427734, "global_step": 301589, "epoch": 2492} {"train_loss": -42.092041015625, "global_step": 301590, "epoch": 2492} {"train_loss": -41.74643325805664, "global_step": 301591, "epoch": 2492} {"train_loss": -42.031471252441406, "global_step": 301592, "epoch": 2492} {"train_loss": -42.6256103515625, "global_step": 301593, "epoch": 2492} {"train_loss": -41.900604248046875, "global_step": 301594, "epoch": 2492} {"train_loss": -42.25344467163086, "global_step": 301595, "epoch": 2492} {"train_loss": -42.757118225097656, "global_step": 301596, "epoch": 2492} {"train_loss": -43.42743682861328, "global_step": 301597, "epoch": 2492} {"train_loss": -42.571311950683594, "global_step": 301598, "epoch": 2492} {"train_loss": -43.0218620300293, "global_step": 301599, "epoch": 2492} {"train_loss": -42.57658386230469, "global_step": 301600, "epoch": 2492} {"train_loss": -43.262332916259766, "global_step": 301601, "epoch": 2492} {"train_loss": -43.32273483276367, "global_step": 301602, "epoch": 2492} {"train_loss": -43.453617095947266, "global_step": 301603, "epoch": 2492} {"train_loss": -42.80097579956055, "global_step": 301604, "epoch": 2492} {"train_loss": -42.96281051635742, "global_step": 301605, "epoch": 2492} {"train_loss": -43.3407096862793, "global_step": 301606, "epoch": 2492} {"train_loss": -43.2325439453125, "global_step": 301607, "epoch": 2492} {"train_loss": -43.660457611083984, "global_step": 301608, "epoch": 2492} {"train_loss": -43.02244567871094, "global_step": 301609, "epoch": 2492} {"train_loss": -43.4847412109375, "global_step": 301610, "epoch": 2492} {"train_loss": -43.53390121459961, "global_step": 301611, "epoch": 2492} {"train_loss": -43.57209014892578, "global_step": 301612, "epoch": 2492} {"train_loss": -42.53988265991211, "global_step": 301613, "epoch": 2492} {"train_loss": -43.31703186035156, "global_step": 301614, "epoch": 2492} {"train_loss": -43.8065071105957, "global_step": 301615, "epoch": 2492} {"train_loss": -43.231685638427734, "global_step": 301616, "epoch": 2492} {"train_loss": -43.55703353881836, "global_step": 301617, "epoch": 2492} {"train_loss": -43.4234504699707, "global_step": 301618, "epoch": 2492} {"train_loss": -43.63551712036133, "global_step": 301619, "epoch": 2492} {"train_loss": -44.09303665161133, "global_step": 301620, "epoch": 2492} {"train_loss": -43.72126007080078, "global_step": 301621, "epoch": 2492} {"train_loss": -43.68485641479492, "global_step": 301622, "epoch": 2492} {"train_loss": -43.84550857543945, "global_step": 301623, "epoch": 2492} {"train_loss": -44.10651397705078, "global_step": 301624, "epoch": 2492} {"train_loss": -44.64662551879883, "global_step": 301625, "epoch": 2492} {"train_loss": -43.879310607910156, "global_step": 301626, "epoch": 2492} {"train_loss": -44.06122970581055, "global_step": 301627, "epoch": 2492} {"train_loss": -43.61564636230469, "global_step": 301628, "epoch": 2492} {"train_loss": -44.584197998046875, "global_step": 301629, "epoch": 2492} {"train_loss": -44.648555755615234, "global_step": 301630, "epoch": 2492} {"train_loss": -44.43960189819336, "global_step": 301631, "epoch": 2492} {"train_loss": -44.03446578979492, "global_step": 301632, "epoch": 2492} {"train_loss": -44.477996826171875, "global_step": 301633, "epoch": 2492} {"train_loss": -44.6744384765625, "global_step": 301634, "epoch": 2492} {"train_loss": -44.37571334838867, "global_step": 301635, "epoch": 2492} {"train_loss": -44.698280334472656, "global_step": 301636, "epoch": 2492} {"train_loss": -44.497127532958984, "global_step": 301637, "epoch": 2492} {"train_loss": -44.36458969116211, "global_step": 301638, "epoch": 2492} {"train_loss": -44.65864944458008, "global_step": 301639, "epoch": 2492} {"train_loss": -44.3793830871582, "global_step": 301640, "epoch": 2492} {"train_loss": -44.63850402832031, "global_step": 301641, "epoch": 2492} {"train_loss": -44.71059799194336, "global_step": 301642, "epoch": 2492} {"train_loss": -44.519020080566406, "global_step": 301643, "epoch": 2492} {"train_loss": -44.58980178833008, "global_step": 301644, "epoch": 2492} {"train_loss": -44.71023941040039, "global_step": 301645, "epoch": 2492} {"train_loss": -44.60129928588867, "global_step": 301646, "epoch": 2492} {"train_loss": -44.4671516418457, "global_step": 301647, "epoch": 2492} {"train_loss": -45.01469039916992, "global_step": 301648, "epoch": 2492} {"train_loss": -44.03363800048828, "global_step": 301649, "epoch": 2492} {"train_loss": -44.968135833740234, "global_step": 301650, "epoch": 2492} {"train_loss": -44.89309310913086, "global_step": 301651, "epoch": 2492} {"train_loss": -42.2556984326071, "global_step": 301652, "epoch": 2492, "val_loss": 2629471.75} {"train_loss": -45.1963996887207, "global_step": 301653, "epoch": 2493} {"train_loss": -44.81338882446289, "global_step": 301654, "epoch": 2493} {"train_loss": -45.173675537109375, "global_step": 301655, "epoch": 2493} {"train_loss": -44.56733322143555, "global_step": 301656, "epoch": 2493} {"train_loss": -45.02427291870117, "global_step": 301657, "epoch": 2493} {"train_loss": -45.21426773071289, "global_step": 301658, "epoch": 2493} {"train_loss": -44.625144958496094, "global_step": 301659, "epoch": 2493} {"train_loss": -45.08481979370117, "global_step": 301660, "epoch": 2493} {"train_loss": -45.134559631347656, "global_step": 301661, "epoch": 2493} {"train_loss": -44.3048095703125, "global_step": 301662, "epoch": 2493} {"train_loss": -44.86840057373047, "global_step": 301663, "epoch": 2493} {"train_loss": -44.91375732421875, "global_step": 301664, "epoch": 2493} {"train_loss": -44.80199432373047, "global_step": 301665, "epoch": 2493} {"train_loss": -42.960052490234375, "global_step": 301666, "epoch": 2493} {"train_loss": -42.04294967651367, "global_step": 301667, "epoch": 2493} {"train_loss": -43.58921813964844, "global_step": 301668, "epoch": 2493} {"train_loss": -43.703670501708984, "global_step": 301669, "epoch": 2493} {"train_loss": -43.751434326171875, "global_step": 301670, "epoch": 2493} {"train_loss": -44.441890716552734, "global_step": 301671, "epoch": 2493} {"train_loss": -44.393707275390625, "global_step": 301672, "epoch": 2493} {"train_loss": -43.996795654296875, "global_step": 301673, "epoch": 2493} {"train_loss": -44.097450256347656, "global_step": 301674, "epoch": 2493} {"train_loss": -43.57674789428711, "global_step": 301675, "epoch": 2493} {"train_loss": -43.71039962768555, "global_step": 301676, "epoch": 2493} {"train_loss": -44.37511444091797, "global_step": 301677, "epoch": 2493} {"train_loss": -43.959716796875, "global_step": 301678, "epoch": 2493} {"train_loss": -43.333106994628906, "global_step": 301679, "epoch": 2493} {"train_loss": -44.205806732177734, "global_step": 301680, "epoch": 2493} {"train_loss": -44.675537109375, "global_step": 301681, "epoch": 2493} {"train_loss": -42.909278869628906, "global_step": 301682, "epoch": 2493} {"train_loss": -44.292415618896484, "global_step": 301683, "epoch": 2493} {"train_loss": -43.495872497558594, "global_step": 301684, "epoch": 2493} {"train_loss": -42.09635543823242, "global_step": 301685, "epoch": 2493} {"train_loss": -43.96818923950195, "global_step": 301686, "epoch": 2493} {"train_loss": -43.12257766723633, "global_step": 301687, "epoch": 2493} {"train_loss": -43.786128997802734, "global_step": 301688, "epoch": 2493} {"train_loss": -44.47552490234375, "global_step": 301689, "epoch": 2493} {"train_loss": -42.59914779663086, "global_step": 301690, "epoch": 2493} {"train_loss": -42.84847640991211, "global_step": 301691, "epoch": 2493} {"train_loss": -43.581939697265625, "global_step": 301692, "epoch": 2493} {"train_loss": -42.8513069152832, "global_step": 301693, "epoch": 2493} {"train_loss": -43.55813217163086, "global_step": 301694, "epoch": 2493} {"train_loss": -42.945068359375, "global_step": 301695, "epoch": 2493} {"train_loss": -43.465755462646484, "global_step": 301696, "epoch": 2493} {"train_loss": -43.646427154541016, "global_step": 301697, "epoch": 2493} {"train_loss": -43.7877311706543, "global_step": 301698, "epoch": 2493} {"train_loss": -43.94780731201172, "global_step": 301699, "epoch": 2493} {"train_loss": -43.67286682128906, "global_step": 301700, "epoch": 2493} {"train_loss": -43.97907638549805, "global_step": 301701, "epoch": 2493} {"train_loss": -42.873355865478516, "global_step": 301702, "epoch": 2493} {"train_loss": -43.60810089111328, "global_step": 301703, "epoch": 2493} {"train_loss": -43.41024398803711, "global_step": 301704, "epoch": 2493} {"train_loss": -43.55322265625, "global_step": 301705, "epoch": 2493} {"train_loss": -44.53347396850586, "global_step": 301706, "epoch": 2493} {"train_loss": -44.13145065307617, "global_step": 301707, "epoch": 2493} {"train_loss": -43.83341979980469, "global_step": 301708, "epoch": 2493} {"train_loss": -43.43191146850586, "global_step": 301709, "epoch": 2493} {"train_loss": -44.5517463684082, "global_step": 301710, "epoch": 2493} {"train_loss": -44.42185592651367, "global_step": 301711, "epoch": 2493} {"train_loss": -44.40095138549805, "global_step": 301712, "epoch": 2493} {"train_loss": -44.368709564208984, "global_step": 301713, "epoch": 2493} {"train_loss": -44.16950988769531, "global_step": 301714, "epoch": 2493} {"train_loss": -44.40031051635742, "global_step": 301715, "epoch": 2493} {"train_loss": -44.44874954223633, "global_step": 301716, "epoch": 2493} {"train_loss": -44.322052001953125, "global_step": 301717, "epoch": 2493} {"train_loss": -44.528194427490234, "global_step": 301718, "epoch": 2493} {"train_loss": -44.5074577331543, "global_step": 301719, "epoch": 2493} {"train_loss": -44.7105712890625, "global_step": 301720, "epoch": 2493} {"train_loss": -44.482177734375, "global_step": 301721, "epoch": 2493} {"train_loss": -44.4507942199707, "global_step": 301722, "epoch": 2493} {"train_loss": -43.70830154418945, "global_step": 301723, "epoch": 2493} {"train_loss": -43.37343978881836, "global_step": 301724, "epoch": 2493} {"train_loss": -43.27964401245117, "global_step": 301725, "epoch": 2493} {"train_loss": -44.23560333251953, "global_step": 301726, "epoch": 2493} {"train_loss": -44.18868637084961, "global_step": 301727, "epoch": 2493} {"train_loss": -44.93224334716797, "global_step": 301728, "epoch": 2493} {"train_loss": -45.0609245300293, "global_step": 301729, "epoch": 2493} {"train_loss": -43.4494743347168, "global_step": 301730, "epoch": 2493} {"train_loss": -44.10821533203125, "global_step": 301731, "epoch": 2493} {"train_loss": -44.30150604248047, "global_step": 301732, "epoch": 2493} {"train_loss": -43.49516677856445, "global_step": 301733, "epoch": 2493} {"train_loss": -44.85963821411133, "global_step": 301734, "epoch": 2493} {"train_loss": -43.83732223510742, "global_step": 301735, "epoch": 2493} {"train_loss": -43.99650955200195, "global_step": 301736, "epoch": 2493} {"train_loss": -44.073307037353516, "global_step": 301737, "epoch": 2493} {"train_loss": -43.9224967956543, "global_step": 301738, "epoch": 2493} {"train_loss": -43.93699264526367, "global_step": 301739, "epoch": 2493} {"train_loss": -43.5346794128418, "global_step": 301740, "epoch": 2493} {"train_loss": -43.938655853271484, "global_step": 301741, "epoch": 2493} {"train_loss": -43.28081130981445, "global_step": 301742, "epoch": 2493} {"train_loss": -41.07521057128906, "global_step": 301743, "epoch": 2493} {"train_loss": -43.44328689575195, "global_step": 301744, "epoch": 2493} {"train_loss": -42.02790451049805, "global_step": 301745, "epoch": 2493} {"train_loss": -42.535545349121094, "global_step": 301746, "epoch": 2493} {"train_loss": -41.053680419921875, "global_step": 301747, "epoch": 2493} {"train_loss": -42.59364318847656, "global_step": 301748, "epoch": 2493} {"train_loss": -42.40532302856445, "global_step": 301749, "epoch": 2493} {"train_loss": -41.71258544921875, "global_step": 301750, "epoch": 2493} {"train_loss": -43.469303131103516, "global_step": 301751, "epoch": 2493} {"train_loss": -43.188995361328125, "global_step": 301752, "epoch": 2493} {"train_loss": -44.11904525756836, "global_step": 301753, "epoch": 2493} {"train_loss": -42.15181350708008, "global_step": 301754, "epoch": 2493} {"train_loss": -40.50944900512695, "global_step": 301755, "epoch": 2493} {"train_loss": -43.25104904174805, "global_step": 301756, "epoch": 2493} {"train_loss": -42.79410934448242, "global_step": 301757, "epoch": 2493} {"train_loss": -40.56751251220703, "global_step": 301758, "epoch": 2493} {"train_loss": -42.434478759765625, "global_step": 301759, "epoch": 2493} {"train_loss": -43.163246154785156, "global_step": 301760, "epoch": 2493} {"train_loss": -41.99319076538086, "global_step": 301761, "epoch": 2493} {"train_loss": -42.60369110107422, "global_step": 301762, "epoch": 2493} {"train_loss": -41.10493469238281, "global_step": 301763, "epoch": 2493} {"train_loss": -43.66718673706055, "global_step": 301764, "epoch": 2493} {"train_loss": -40.68817138671875, "global_step": 301765, "epoch": 2493} {"train_loss": -42.95934295654297, "global_step": 301766, "epoch": 2493} {"train_loss": -40.7227783203125, "global_step": 301767, "epoch": 2493} {"train_loss": -42.121482849121094, "global_step": 301768, "epoch": 2493} {"train_loss": -42.0353889465332, "global_step": 301769, "epoch": 2493} {"train_loss": -41.21858215332031, "global_step": 301770, "epoch": 2493} {"train_loss": -41.35160446166992, "global_step": 301771, "epoch": 2493} {"train_loss": -41.91679000854492, "global_step": 301772, "epoch": 2493} {"train_loss": -43.534844958092556, "global_step": 301773, "epoch": 2493, "val_loss": 2553678.75} {"train_loss": -40.54374694824219, "global_step": 301774, "epoch": 2494} {"train_loss": -36.267906188964844, "global_step": 301775, "epoch": 2494} {"train_loss": -40.814720153808594, "global_step": 301776, "epoch": 2494} {"train_loss": -41.40696334838867, "global_step": 301777, "epoch": 2494} {"train_loss": -39.200809478759766, "global_step": 301778, "epoch": 2494} {"train_loss": -40.68412780761719, "global_step": 301779, "epoch": 2494} {"train_loss": -40.255428314208984, "global_step": 301780, "epoch": 2494} {"train_loss": -41.208770751953125, "global_step": 301781, "epoch": 2494} {"train_loss": -41.03342819213867, "global_step": 301782, "epoch": 2494} {"train_loss": -41.28538131713867, "global_step": 301783, "epoch": 2494} {"train_loss": -39.48714065551758, "global_step": 301784, "epoch": 2494} {"train_loss": -40.62441635131836, "global_step": 301785, "epoch": 2494} {"train_loss": -41.246009826660156, "global_step": 301786, "epoch": 2494} {"train_loss": -41.0264892578125, "global_step": 301787, "epoch": 2494} {"train_loss": -40.136409759521484, "global_step": 301788, "epoch": 2494} {"train_loss": -41.84891891479492, "global_step": 301789, "epoch": 2494} {"train_loss": -41.25001907348633, "global_step": 301790, "epoch": 2494} {"train_loss": -41.694969177246094, "global_step": 301791, "epoch": 2494} {"train_loss": -42.023956298828125, "global_step": 301792, "epoch": 2494} {"train_loss": -42.0069465637207, "global_step": 301793, "epoch": 2494} {"train_loss": -40.85691452026367, "global_step": 301794, "epoch": 2494} {"train_loss": -41.7044677734375, "global_step": 301795, "epoch": 2494} {"train_loss": -42.104244232177734, "global_step": 301796, "epoch": 2494} {"train_loss": -42.00774002075195, "global_step": 301797, "epoch": 2494} {"train_loss": -42.49190902709961, "global_step": 301798, "epoch": 2494} {"train_loss": -42.98889923095703, "global_step": 301799, "epoch": 2494} {"train_loss": -42.13412094116211, "global_step": 301800, "epoch": 2494} {"train_loss": -42.050785064697266, "global_step": 301801, "epoch": 2494} {"train_loss": -42.137996673583984, "global_step": 301802, "epoch": 2494} {"train_loss": -39.814979553222656, "global_step": 301803, "epoch": 2494} {"train_loss": -42.35984420776367, "global_step": 301804, "epoch": 2494} {"train_loss": -42.09571838378906, "global_step": 301805, "epoch": 2494} {"train_loss": -42.907135009765625, "global_step": 301806, "epoch": 2494} {"train_loss": -42.82436752319336, "global_step": 301807, "epoch": 2494} {"train_loss": -42.49090576171875, "global_step": 301808, "epoch": 2494} {"train_loss": -42.8387451171875, "global_step": 301809, "epoch": 2494} {"train_loss": -42.703182220458984, "global_step": 301810, "epoch": 2494} {"train_loss": -42.97390365600586, "global_step": 301811, "epoch": 2494} {"train_loss": -42.302734375, "global_step": 301812, "epoch": 2494} {"train_loss": -42.626991271972656, "global_step": 301813, "epoch": 2494} {"train_loss": -42.62967300415039, "global_step": 301814, "epoch": 2494} {"train_loss": -42.209693908691406, "global_step": 301815, "epoch": 2494} {"train_loss": -41.872535705566406, "global_step": 301816, "epoch": 2494} {"train_loss": -42.01259994506836, "global_step": 301817, "epoch": 2494} {"train_loss": -42.812347412109375, "global_step": 301818, "epoch": 2494} {"train_loss": -42.489990234375, "global_step": 301819, "epoch": 2494} {"train_loss": -41.5909423828125, "global_step": 301820, "epoch": 2494} {"train_loss": -42.612972259521484, "global_step": 301821, "epoch": 2494} {"train_loss": -43.161781311035156, "global_step": 301822, "epoch": 2494} {"train_loss": -41.883060455322266, "global_step": 301823, "epoch": 2494} {"train_loss": -43.55786895751953, "global_step": 301824, "epoch": 2494} {"train_loss": -43.334041595458984, "global_step": 301825, "epoch": 2494} {"train_loss": -42.6773567199707, "global_step": 301826, "epoch": 2494} {"train_loss": -42.27656173706055, "global_step": 301827, "epoch": 2494} {"train_loss": -43.00178909301758, "global_step": 301828, "epoch": 2494} {"train_loss": -43.03447341918945, "global_step": 301829, "epoch": 2494} {"train_loss": -43.47991180419922, "global_step": 301830, "epoch": 2494} {"train_loss": -43.06321716308594, "global_step": 301831, "epoch": 2494} {"train_loss": -43.00705337524414, "global_step": 301832, "epoch": 2494} {"train_loss": -43.59638595581055, "global_step": 301833, "epoch": 2494} {"train_loss": -42.74254608154297, "global_step": 301834, "epoch": 2494} {"train_loss": -34.2681999206543, "global_step": 301835, "epoch": 2494} {"train_loss": -43.59590148925781, "global_step": 301836, "epoch": 2494} {"train_loss": -42.27106475830078, "global_step": 301837, "epoch": 2494} {"train_loss": -42.82307052612305, "global_step": 301838, "epoch": 2494} {"train_loss": -43.17287063598633, "global_step": 301839, "epoch": 2494} {"train_loss": -42.10710525512695, "global_step": 301840, "epoch": 2494} {"train_loss": -43.309139251708984, "global_step": 301841, "epoch": 2494} {"train_loss": -43.23866653442383, "global_step": 301842, "epoch": 2494} {"train_loss": -42.88468551635742, "global_step": 301843, "epoch": 2494} {"train_loss": -43.46122360229492, "global_step": 301844, "epoch": 2494} {"train_loss": -43.96805191040039, "global_step": 301845, "epoch": 2494} {"train_loss": -43.77513122558594, "global_step": 301846, "epoch": 2494} {"train_loss": -43.42575454711914, "global_step": 301847, "epoch": 2494} {"train_loss": -42.77095413208008, "global_step": 301848, "epoch": 2494} {"train_loss": -43.92352294921875, "global_step": 301849, "epoch": 2494} {"train_loss": -43.673431396484375, "global_step": 301850, "epoch": 2494} {"train_loss": -43.87263870239258, "global_step": 301851, "epoch": 2494} {"train_loss": -43.52369689941406, "global_step": 301852, "epoch": 2494} {"train_loss": -43.6015625, "global_step": 301853, "epoch": 2494} {"train_loss": -43.54228591918945, "global_step": 301854, "epoch": 2494} {"train_loss": -43.01922607421875, "global_step": 301855, "epoch": 2494} {"train_loss": -43.821075439453125, "global_step": 301856, "epoch": 2494} {"train_loss": -43.115570068359375, "global_step": 301857, "epoch": 2494} {"train_loss": -44.36994552612305, "global_step": 301858, "epoch": 2494} {"train_loss": -44.22567367553711, "global_step": 301859, "epoch": 2494} {"train_loss": -44.24850082397461, "global_step": 301860, "epoch": 2494} {"train_loss": -43.284908294677734, "global_step": 301861, "epoch": 2494} {"train_loss": -43.39244079589844, "global_step": 301862, "epoch": 2494} {"train_loss": -44.06948471069336, "global_step": 301863, "epoch": 2494} {"train_loss": -43.309078216552734, "global_step": 301864, "epoch": 2494} {"train_loss": -44.00227737426758, "global_step": 301865, "epoch": 2494} {"train_loss": -43.618255615234375, "global_step": 301866, "epoch": 2494} {"train_loss": -43.65887451171875, "global_step": 301867, "epoch": 2494} {"train_loss": -43.63979721069336, "global_step": 301868, "epoch": 2494} {"train_loss": -44.28565216064453, "global_step": 301869, "epoch": 2494} {"train_loss": -43.22555923461914, "global_step": 301870, "epoch": 2494} {"train_loss": -41.49087142944336, "global_step": 301871, "epoch": 2494} {"train_loss": -43.986732482910156, "global_step": 301872, "epoch": 2494} {"train_loss": -43.26222229003906, "global_step": 301873, "epoch": 2494} {"train_loss": -42.01868438720703, "global_step": 301874, "epoch": 2494} {"train_loss": -44.27208709716797, "global_step": 301875, "epoch": 2494} {"train_loss": -43.636322021484375, "global_step": 301876, "epoch": 2494} {"train_loss": -41.380462646484375, "global_step": 301877, "epoch": 2494} {"train_loss": -43.27039337158203, "global_step": 301878, "epoch": 2494} {"train_loss": -44.6175537109375, "global_step": 301879, "epoch": 2494} {"train_loss": -42.45263671875, "global_step": 301880, "epoch": 2494} {"train_loss": -42.539546966552734, "global_step": 301881, "epoch": 2494} {"train_loss": -42.576698303222656, "global_step": 301882, "epoch": 2494} {"train_loss": -42.24105453491211, "global_step": 301883, "epoch": 2494} {"train_loss": -41.38774108886719, "global_step": 301884, "epoch": 2494} {"train_loss": -43.7294921875, "global_step": 301885, "epoch": 2494} {"train_loss": -41.341182708740234, "global_step": 301886, "epoch": 2494} {"train_loss": -43.511653900146484, "global_step": 301887, "epoch": 2494} {"train_loss": -40.62900924682617, "global_step": 301888, "epoch": 2494} {"train_loss": -42.614990234375, "global_step": 301889, "epoch": 2494} {"train_loss": -36.6791877746582, "global_step": 301890, "epoch": 2494} {"train_loss": -36.73789596557617, "global_step": 301891, "epoch": 2494} {"train_loss": -38.352630615234375, "global_step": 301892, "epoch": 2494} {"train_loss": -36.70763397216797, "global_step": 301893, "epoch": 2494} {"train_loss": -42.21809913698307, "global_step": 301894, "epoch": 2494, "val_loss": 2594930.25} {"train_loss": -38.79094314575195, "global_step": 301895, "epoch": 2495} {"train_loss": -37.01716613769531, "global_step": 301896, "epoch": 2495} {"train_loss": -38.447853088378906, "global_step": 301897, "epoch": 2495} {"train_loss": -37.91927719116211, "global_step": 301898, "epoch": 2495} {"train_loss": -38.72788619995117, "global_step": 301899, "epoch": 2495} {"train_loss": -38.53055953979492, "global_step": 301900, "epoch": 2495} {"train_loss": -39.205570220947266, "global_step": 301901, "epoch": 2495} {"train_loss": -38.357940673828125, "global_step": 301902, "epoch": 2495} {"train_loss": -39.45866775512695, "global_step": 301903, "epoch": 2495} {"train_loss": -38.8632698059082, "global_step": 301904, "epoch": 2495} {"train_loss": -39.80870056152344, "global_step": 301905, "epoch": 2495} {"train_loss": -39.20216369628906, "global_step": 301906, "epoch": 2495} {"train_loss": -39.907447814941406, "global_step": 301907, "epoch": 2495} {"train_loss": -39.716548919677734, "global_step": 301908, "epoch": 2495} {"train_loss": -39.63556671142578, "global_step": 301909, "epoch": 2495} {"train_loss": -40.05161666870117, "global_step": 301910, "epoch": 2495} {"train_loss": -39.70684814453125, "global_step": 301911, "epoch": 2495} {"train_loss": -39.11664581298828, "global_step": 301912, "epoch": 2495} {"train_loss": -40.654212951660156, "global_step": 301913, "epoch": 2495} {"train_loss": -40.628570556640625, "global_step": 301914, "epoch": 2495} {"train_loss": -39.729915618896484, "global_step": 301915, "epoch": 2495} {"train_loss": -38.92486572265625, "global_step": 301916, "epoch": 2495} {"train_loss": -39.88560485839844, "global_step": 301917, "epoch": 2495} {"train_loss": -40.88556671142578, "global_step": 301918, "epoch": 2495} {"train_loss": -39.48370361328125, "global_step": 301919, "epoch": 2495} {"train_loss": -40.29551315307617, "global_step": 301920, "epoch": 2495} {"train_loss": -41.25997543334961, "global_step": 301921, "epoch": 2495} {"train_loss": -40.517940521240234, "global_step": 301922, "epoch": 2495} {"train_loss": -41.438533782958984, "global_step": 301923, "epoch": 2495} {"train_loss": -41.05554962158203, "global_step": 301924, "epoch": 2495} {"train_loss": -40.776336669921875, "global_step": 301925, "epoch": 2495} {"train_loss": -41.70849609375, "global_step": 301926, "epoch": 2495} {"train_loss": -41.2285270690918, "global_step": 301927, "epoch": 2495} {"train_loss": -40.97616195678711, "global_step": 301928, "epoch": 2495} {"train_loss": -41.8297119140625, "global_step": 301929, "epoch": 2495} {"train_loss": -40.574642181396484, "global_step": 301930, "epoch": 2495} {"train_loss": -41.971195220947266, "global_step": 301931, "epoch": 2495} {"train_loss": -41.27303695678711, "global_step": 301932, "epoch": 2495} {"train_loss": -41.87973403930664, "global_step": 301933, "epoch": 2495} {"train_loss": -41.0543327331543, "global_step": 301934, "epoch": 2495} {"train_loss": -41.752315521240234, "global_step": 301935, "epoch": 2495} {"train_loss": -41.53496170043945, "global_step": 301936, "epoch": 2495} {"train_loss": -41.031471252441406, "global_step": 301937, "epoch": 2495} {"train_loss": -40.314361572265625, "global_step": 301938, "epoch": 2495} {"train_loss": -41.45539474487305, "global_step": 301939, "epoch": 2495} {"train_loss": -41.59123229980469, "global_step": 301940, "epoch": 2495} {"train_loss": -40.609031677246094, "global_step": 301941, "epoch": 2495} {"train_loss": -39.501739501953125, "global_step": 301942, "epoch": 2495} {"train_loss": -41.74782180786133, "global_step": 301943, "epoch": 2495} {"train_loss": -39.371700286865234, "global_step": 301944, "epoch": 2495} {"train_loss": -41.12733840942383, "global_step": 301945, "epoch": 2495} {"train_loss": -40.447505950927734, "global_step": 301946, "epoch": 2495} {"train_loss": -41.0093994140625, "global_step": 301947, "epoch": 2495} {"train_loss": -40.89190673828125, "global_step": 301948, "epoch": 2495} {"train_loss": -40.03753662109375, "global_step": 301949, "epoch": 2495} {"train_loss": -40.60765075683594, "global_step": 301950, "epoch": 2495} {"train_loss": -40.68939971923828, "global_step": 301951, "epoch": 2495} {"train_loss": -41.3452262878418, "global_step": 301952, "epoch": 2495} {"train_loss": -40.557289123535156, "global_step": 301953, "epoch": 2495} {"train_loss": -41.412696838378906, "global_step": 301954, "epoch": 2495} {"train_loss": -41.84495162963867, "global_step": 301955, "epoch": 2495} {"train_loss": -41.13642120361328, "global_step": 301956, "epoch": 2495} {"train_loss": -42.171714782714844, "global_step": 301957, "epoch": 2495} {"train_loss": -40.93243408203125, "global_step": 301958, "epoch": 2495} {"train_loss": -42.629398345947266, "global_step": 301959, "epoch": 2495} {"train_loss": -40.75323486328125, "global_step": 301960, "epoch": 2495} {"train_loss": -42.219093322753906, "global_step": 301961, "epoch": 2495} {"train_loss": -41.69285202026367, "global_step": 301962, "epoch": 2495} {"train_loss": -41.5076904296875, "global_step": 301963, "epoch": 2495} {"train_loss": -42.5259895324707, "global_step": 301964, "epoch": 2495} {"train_loss": -40.18545150756836, "global_step": 301965, "epoch": 2495} {"train_loss": -42.69611740112305, "global_step": 301966, "epoch": 2495} {"train_loss": -40.02830123901367, "global_step": 301967, "epoch": 2495} {"train_loss": -41.985652923583984, "global_step": 301968, "epoch": 2495} {"train_loss": -42.19487762451172, "global_step": 301969, "epoch": 2495} {"train_loss": -40.457271575927734, "global_step": 301970, "epoch": 2495} {"train_loss": -42.07022476196289, "global_step": 301971, "epoch": 2495} {"train_loss": -42.126251220703125, "global_step": 301972, "epoch": 2495} {"train_loss": -40.458099365234375, "global_step": 301973, "epoch": 2495} {"train_loss": -42.097442626953125, "global_step": 301974, "epoch": 2495} {"train_loss": -40.773895263671875, "global_step": 301975, "epoch": 2495} {"train_loss": -42.6273078918457, "global_step": 301976, "epoch": 2495} {"train_loss": -41.90201950073242, "global_step": 301977, "epoch": 2495} {"train_loss": -38.17999267578125, "global_step": 301978, "epoch": 2495} {"train_loss": -36.613555908203125, "global_step": 301979, "epoch": 2495} {"train_loss": -40.83534240722656, "global_step": 301980, "epoch": 2495} {"train_loss": -40.79143142700195, "global_step": 301981, "epoch": 2495} {"train_loss": -38.52824783325195, "global_step": 301982, "epoch": 2495} {"train_loss": -40.204288482666016, "global_step": 301983, "epoch": 2495} {"train_loss": -40.931190490722656, "global_step": 301984, "epoch": 2495} {"train_loss": -38.97864532470703, "global_step": 301985, "epoch": 2495} {"train_loss": -40.34431076049805, "global_step": 301986, "epoch": 2495} {"train_loss": -39.11334991455078, "global_step": 301987, "epoch": 2495} {"train_loss": -41.6204833984375, "global_step": 301988, "epoch": 2495} {"train_loss": -40.47023010253906, "global_step": 301989, "epoch": 2495} {"train_loss": -41.33405303955078, "global_step": 301990, "epoch": 2495} {"train_loss": -39.6347541809082, "global_step": 301991, "epoch": 2495} {"train_loss": -42.58087158203125, "global_step": 301992, "epoch": 2495} {"train_loss": -41.11138916015625, "global_step": 301993, "epoch": 2495} {"train_loss": -41.9592399597168, "global_step": 301994, "epoch": 2495} {"train_loss": -41.6876335144043, "global_step": 301995, "epoch": 2495} {"train_loss": -40.578369140625, "global_step": 301996, "epoch": 2495} {"train_loss": -41.327545166015625, "global_step": 301997, "epoch": 2495} {"train_loss": -41.510711669921875, "global_step": 301998, "epoch": 2495} {"train_loss": -41.7673454284668, "global_step": 301999, "epoch": 2495} {"train_loss": -41.950401306152344, "global_step": 302000, "epoch": 2495} {"train_loss": -41.1199836730957, "global_step": 302001, "epoch": 2495} {"train_loss": -42.08479690551758, "global_step": 302002, "epoch": 2495} {"train_loss": -41.72475051879883, "global_step": 302003, "epoch": 2495} {"train_loss": -41.98380661010742, "global_step": 302004, "epoch": 2495} {"train_loss": -42.30662536621094, "global_step": 302005, "epoch": 2495} {"train_loss": -42.45359420776367, "global_step": 302006, "epoch": 2495} {"train_loss": -42.3115119934082, "global_step": 302007, "epoch": 2495} {"train_loss": -42.297332763671875, "global_step": 302008, "epoch": 2495} {"train_loss": -42.26081466674805, "global_step": 302009, "epoch": 2495} {"train_loss": -42.161678314208984, "global_step": 302010, "epoch": 2495} {"train_loss": -42.81761169433594, "global_step": 302011, "epoch": 2495} {"train_loss": -42.42658615112305, "global_step": 302012, "epoch": 2495} {"train_loss": -42.99201583862305, "global_step": 302013, "epoch": 2495} {"train_loss": -42.32719421386719, "global_step": 302014, "epoch": 2495} {"train_loss": -40.831499746023134, "global_step": 302015, "epoch": 2495, "val_loss": 2662357.75} {"train_loss": -42.602108001708984, "global_step": 302016, "epoch": 2496} {"train_loss": -42.600494384765625, "global_step": 302017, "epoch": 2496} {"train_loss": -43.07106399536133, "global_step": 302018, "epoch": 2496} {"train_loss": -42.43743133544922, "global_step": 302019, "epoch": 2496} {"train_loss": -42.40998458862305, "global_step": 302020, "epoch": 2496} {"train_loss": -42.81658935546875, "global_step": 302021, "epoch": 2496} {"train_loss": -42.9787483215332, "global_step": 302022, "epoch": 2496} {"train_loss": -42.9824333190918, "global_step": 302023, "epoch": 2496} {"train_loss": -43.019744873046875, "global_step": 302024, "epoch": 2496} {"train_loss": -43.13637924194336, "global_step": 302025, "epoch": 2496} {"train_loss": -43.08824157714844, "global_step": 302026, "epoch": 2496} {"train_loss": -43.252506256103516, "global_step": 302027, "epoch": 2496} {"train_loss": -42.22380447387695, "global_step": 302028, "epoch": 2496} {"train_loss": -41.66594696044922, "global_step": 302029, "epoch": 2496} {"train_loss": -42.084468841552734, "global_step": 302030, "epoch": 2496} {"train_loss": -42.96647262573242, "global_step": 302031, "epoch": 2496} {"train_loss": -43.31892776489258, "global_step": 302032, "epoch": 2496} {"train_loss": -43.18496322631836, "global_step": 302033, "epoch": 2496} {"train_loss": -42.864925384521484, "global_step": 302034, "epoch": 2496} {"train_loss": -42.67176818847656, "global_step": 302035, "epoch": 2496} {"train_loss": -43.30332946777344, "global_step": 302036, "epoch": 2496} {"train_loss": -43.1937370300293, "global_step": 302037, "epoch": 2496} {"train_loss": -42.80675506591797, "global_step": 302038, "epoch": 2496} {"train_loss": -43.17171096801758, "global_step": 302039, "epoch": 2496} {"train_loss": -43.49528121948242, "global_step": 302040, "epoch": 2496} {"train_loss": -43.0848274230957, "global_step": 302041, "epoch": 2496} {"train_loss": -42.861106872558594, "global_step": 302042, "epoch": 2496} {"train_loss": -43.27085494995117, "global_step": 302043, "epoch": 2496} {"train_loss": -43.46674728393555, "global_step": 302044, "epoch": 2496} {"train_loss": -43.036109924316406, "global_step": 302045, "epoch": 2496} {"train_loss": -42.72893142700195, "global_step": 302046, "epoch": 2496} {"train_loss": -42.9456672668457, "global_step": 302047, "epoch": 2496} {"train_loss": -43.36906051635742, "global_step": 302048, "epoch": 2496} {"train_loss": -43.49043655395508, "global_step": 302049, "epoch": 2496} {"train_loss": -43.53567123413086, "global_step": 302050, "epoch": 2496} {"train_loss": -43.59377670288086, "global_step": 302051, "epoch": 2496} {"train_loss": -43.8087158203125, "global_step": 302052, "epoch": 2496} {"train_loss": -42.772918701171875, "global_step": 302053, "epoch": 2496} {"train_loss": -41.60026168823242, "global_step": 302054, "epoch": 2496} {"train_loss": -40.55386734008789, "global_step": 302055, "epoch": 2496} {"train_loss": -42.623870849609375, "global_step": 302056, "epoch": 2496} {"train_loss": -43.64949035644531, "global_step": 302057, "epoch": 2496} {"train_loss": -42.40068435668945, "global_step": 302058, "epoch": 2496} {"train_loss": -40.22056198120117, "global_step": 302059, "epoch": 2496} {"train_loss": -40.260826110839844, "global_step": 302060, "epoch": 2496} {"train_loss": -41.497291564941406, "global_step": 302061, "epoch": 2496} {"train_loss": -42.35222244262695, "global_step": 302062, "epoch": 2496} {"train_loss": -42.62876510620117, "global_step": 302063, "epoch": 2496} {"train_loss": -41.823883056640625, "global_step": 302064, "epoch": 2496} {"train_loss": -42.16642761230469, "global_step": 302065, "epoch": 2496} {"train_loss": -42.38054656982422, "global_step": 302066, "epoch": 2496} {"train_loss": -42.93587875366211, "global_step": 302067, "epoch": 2496} {"train_loss": -43.3759651184082, "global_step": 302068, "epoch": 2496} {"train_loss": -42.798072814941406, "global_step": 302069, "epoch": 2496} {"train_loss": -43.03078842163086, "global_step": 302070, "epoch": 2496} {"train_loss": -43.366024017333984, "global_step": 302071, "epoch": 2496} {"train_loss": -42.45524597167969, "global_step": 302072, "epoch": 2496} {"train_loss": -42.95020294189453, "global_step": 302073, "epoch": 2496} {"train_loss": -43.02800369262695, "global_step": 302074, "epoch": 2496} {"train_loss": -43.31185531616211, "global_step": 302075, "epoch": 2496} {"train_loss": -42.337425231933594, "global_step": 302076, "epoch": 2496} {"train_loss": -43.14247512817383, "global_step": 302077, "epoch": 2496} {"train_loss": -42.867652893066406, "global_step": 302078, "epoch": 2496} {"train_loss": -43.4674072265625, "global_step": 302079, "epoch": 2496} {"train_loss": -43.1977653503418, "global_step": 302080, "epoch": 2496} {"train_loss": -43.04732131958008, "global_step": 302081, "epoch": 2496} {"train_loss": -42.53203201293945, "global_step": 302082, "epoch": 2496} {"train_loss": -42.1903076171875, "global_step": 302083, "epoch": 2496} {"train_loss": -40.72539138793945, "global_step": 302084, "epoch": 2496} {"train_loss": -38.41616439819336, "global_step": 302085, "epoch": 2496} {"train_loss": -39.90715789794922, "global_step": 302086, "epoch": 2496} {"train_loss": -42.83701705932617, "global_step": 302087, "epoch": 2496} {"train_loss": -40.31800079345703, "global_step": 302088, "epoch": 2496} {"train_loss": -37.020198822021484, "global_step": 302089, "epoch": 2496} {"train_loss": -39.8635368347168, "global_step": 302090, "epoch": 2496} {"train_loss": -40.79034423828125, "global_step": 302091, "epoch": 2496} {"train_loss": -38.5978889465332, "global_step": 302092, "epoch": 2496} {"train_loss": -41.87763595581055, "global_step": 302093, "epoch": 2496} {"train_loss": -39.4421272277832, "global_step": 302094, "epoch": 2496} {"train_loss": -43.458831787109375, "global_step": 302095, "epoch": 2496} {"train_loss": -39.391292572021484, "global_step": 302096, "epoch": 2496} {"train_loss": -43.01557540893555, "global_step": 302097, "epoch": 2496} {"train_loss": -41.095088958740234, "global_step": 302098, "epoch": 2496} {"train_loss": -42.584964752197266, "global_step": 302099, "epoch": 2496} {"train_loss": -42.06913375854492, "global_step": 302100, "epoch": 2496} {"train_loss": -42.94710922241211, "global_step": 302101, "epoch": 2496} {"train_loss": -42.325164794921875, "global_step": 302102, "epoch": 2496} {"train_loss": -42.98307800292969, "global_step": 302103, "epoch": 2496} {"train_loss": -42.34665298461914, "global_step": 302104, "epoch": 2496} {"train_loss": -43.26933670043945, "global_step": 302105, "epoch": 2496} {"train_loss": -43.09871292114258, "global_step": 302106, "epoch": 2496} {"train_loss": -43.56144332885742, "global_step": 302107, "epoch": 2496} {"train_loss": -42.45995330810547, "global_step": 302108, "epoch": 2496} {"train_loss": -42.93842315673828, "global_step": 302109, "epoch": 2496} {"train_loss": -43.08150863647461, "global_step": 302110, "epoch": 2496} {"train_loss": -42.8068733215332, "global_step": 302111, "epoch": 2496} {"train_loss": -43.507198333740234, "global_step": 302112, "epoch": 2496} {"train_loss": -42.776084899902344, "global_step": 302113, "epoch": 2496} {"train_loss": -43.0157470703125, "global_step": 302114, "epoch": 2496} {"train_loss": -43.106483459472656, "global_step": 302115, "epoch": 2496} {"train_loss": -42.75455856323242, "global_step": 302116, "epoch": 2496} {"train_loss": -42.94489669799805, "global_step": 302117, "epoch": 2496} {"train_loss": -41.79702377319336, "global_step": 302118, "epoch": 2496} {"train_loss": -41.00016403198242, "global_step": 302119, "epoch": 2496} {"train_loss": -42.19231033325195, "global_step": 302120, "epoch": 2496} {"train_loss": -43.26029586791992, "global_step": 302121, "epoch": 2496} {"train_loss": -42.604698181152344, "global_step": 302122, "epoch": 2496} {"train_loss": -40.54054641723633, "global_step": 302123, "epoch": 2496} {"train_loss": -43.0804328918457, "global_step": 302124, "epoch": 2496} {"train_loss": -43.3669548034668, "global_step": 302125, "epoch": 2496} {"train_loss": -40.74148178100586, "global_step": 302126, "epoch": 2496} {"train_loss": -38.292842864990234, "global_step": 302127, "epoch": 2496} {"train_loss": -42.86057662963867, "global_step": 302128, "epoch": 2496} {"train_loss": -43.34598922729492, "global_step": 302129, "epoch": 2496} {"train_loss": -41.138973236083984, "global_step": 302130, "epoch": 2496} {"train_loss": -41.368465423583984, "global_step": 302131, "epoch": 2496} {"train_loss": -41.247901916503906, "global_step": 302132, "epoch": 2496} {"train_loss": -21.4593563079834, "global_step": 302133, "epoch": 2496} {"train_loss": -37.73707962036133, "global_step": 302134, "epoch": 2496} {"train_loss": -42.29352569580078, "global_step": 302135, "epoch": 2496} {"train_loss": -42.138614291987146, "global_step": 302136, "epoch": 2496, "val_loss": 4401985.5} {"train_loss": -15.483197212219238, "global_step": 302137, "epoch": 2497} {"train_loss": -27.902484893798828, "global_step": 302138, "epoch": 2497} {"train_loss": -22.655012130737305, "global_step": 302139, "epoch": 2497} {"train_loss": -35.13579177856445, "global_step": 302140, "epoch": 2497} {"train_loss": -24.750566482543945, "global_step": 302141, "epoch": 2497} {"train_loss": -17.392330169677734, "global_step": 302142, "epoch": 2497} {"train_loss": -27.174774169921875, "global_step": 302143, "epoch": 2497} {"train_loss": -32.22540283203125, "global_step": 302144, "epoch": 2497} {"train_loss": -31.492385864257812, "global_step": 302145, "epoch": 2497} {"train_loss": -27.64165687561035, "global_step": 302146, "epoch": 2497} {"train_loss": -3.0595033168792725, "global_step": 302147, "epoch": 2497} {"train_loss": -35.7500114440918, "global_step": 302148, "epoch": 2497} {"train_loss": -31.75103759765625, "global_step": 302149, "epoch": 2497} {"train_loss": -35.197383880615234, "global_step": 302150, "epoch": 2497} {"train_loss": -30.3065128326416, "global_step": 302151, "epoch": 2497} {"train_loss": -34.685081481933594, "global_step": 302152, "epoch": 2497} {"train_loss": -26.373132705688477, "global_step": 302153, "epoch": 2497} {"train_loss": -30.593460083007812, "global_step": 302154, "epoch": 2497} {"train_loss": -27.262592315673828, "global_step": 302155, "epoch": 2497} {"train_loss": -34.3193473815918, "global_step": 302156, "epoch": 2497} {"train_loss": -35.66200637817383, "global_step": 302157, "epoch": 2497} {"train_loss": -35.57822799682617, "global_step": 302158, "epoch": 2497} {"train_loss": -34.306819915771484, "global_step": 302159, "epoch": 2497} {"train_loss": -33.615360260009766, "global_step": 302160, "epoch": 2497} {"train_loss": -36.472835540771484, "global_step": 302161, "epoch": 2497} {"train_loss": -37.09825134277344, "global_step": 302162, "epoch": 2497} {"train_loss": -36.74531936645508, "global_step": 302163, "epoch": 2497} {"train_loss": -36.99615478515625, "global_step": 302164, "epoch": 2497} {"train_loss": -37.00782012939453, "global_step": 302165, "epoch": 2497} {"train_loss": -37.622039794921875, "global_step": 302166, "epoch": 2497} {"train_loss": -36.67053985595703, "global_step": 302167, "epoch": 2497} {"train_loss": -36.320491790771484, "global_step": 302168, "epoch": 2497} {"train_loss": -37.429649353027344, "global_step": 302169, "epoch": 2497} {"train_loss": -36.85591506958008, "global_step": 302170, "epoch": 2497} {"train_loss": -37.11579132080078, "global_step": 302171, "epoch": 2497} {"train_loss": -38.648555755615234, "global_step": 302172, "epoch": 2497} {"train_loss": -37.47085189819336, "global_step": 302173, "epoch": 2497} {"train_loss": -37.17329025268555, "global_step": 302174, "epoch": 2497} {"train_loss": -36.930335998535156, "global_step": 302175, "epoch": 2497} {"train_loss": -37.93333053588867, "global_step": 302176, "epoch": 2497} {"train_loss": -36.87763595581055, "global_step": 302177, "epoch": 2497} {"train_loss": -37.345123291015625, "global_step": 302178, "epoch": 2497} {"train_loss": -38.68281936645508, "global_step": 302179, "epoch": 2497} {"train_loss": -37.79332733154297, "global_step": 302180, "epoch": 2497} {"train_loss": -37.69315719604492, "global_step": 302181, "epoch": 2497} {"train_loss": -38.430908203125, "global_step": 302182, "epoch": 2497} {"train_loss": -38.58384323120117, "global_step": 302183, "epoch": 2497} {"train_loss": -38.53689193725586, "global_step": 302184, "epoch": 2497} {"train_loss": -37.5275993347168, "global_step": 302185, "epoch": 2497} {"train_loss": -36.42243194580078, "global_step": 302186, "epoch": 2497} {"train_loss": -38.26004409790039, "global_step": 302187, "epoch": 2497} {"train_loss": -38.759521484375, "global_step": 302188, "epoch": 2497} {"train_loss": -37.58613204956055, "global_step": 302189, "epoch": 2497} {"train_loss": -38.3789176940918, "global_step": 302190, "epoch": 2497} {"train_loss": -38.79486083984375, "global_step": 302191, "epoch": 2497} {"train_loss": -38.32284927368164, "global_step": 302192, "epoch": 2497} {"train_loss": -38.17205810546875, "global_step": 302193, "epoch": 2497} {"train_loss": -34.857513427734375, "global_step": 302194, "epoch": 2497} {"train_loss": -39.657569885253906, "global_step": 302195, "epoch": 2497} {"train_loss": -38.61102294921875, "global_step": 302196, "epoch": 2497} {"train_loss": -39.328369140625, "global_step": 302197, "epoch": 2497} {"train_loss": -38.503902435302734, "global_step": 302198, "epoch": 2497} {"train_loss": -38.5625, "global_step": 302199, "epoch": 2497} {"train_loss": -39.11545944213867, "global_step": 302200, "epoch": 2497} {"train_loss": -38.959739685058594, "global_step": 302201, "epoch": 2497} {"train_loss": -39.14677429199219, "global_step": 302202, "epoch": 2497} {"train_loss": -39.70667266845703, "global_step": 302203, "epoch": 2497} {"train_loss": -39.70848846435547, "global_step": 302204, "epoch": 2497} {"train_loss": -38.670223236083984, "global_step": 302205, "epoch": 2497} {"train_loss": -39.4560546875, "global_step": 302206, "epoch": 2497} {"train_loss": -38.333168029785156, "global_step": 302207, "epoch": 2497} {"train_loss": -39.23934555053711, "global_step": 302208, "epoch": 2497} {"train_loss": -40.261451721191406, "global_step": 302209, "epoch": 2497} {"train_loss": -39.641029357910156, "global_step": 302210, "epoch": 2497} {"train_loss": -39.657188415527344, "global_step": 302211, "epoch": 2497} {"train_loss": -39.26496124267578, "global_step": 302212, "epoch": 2497} {"train_loss": -40.28997802734375, "global_step": 302213, "epoch": 2497} {"train_loss": -40.25203323364258, "global_step": 302214, "epoch": 2497} {"train_loss": -39.347713470458984, "global_step": 302215, "epoch": 2497} {"train_loss": -39.19519805908203, "global_step": 302216, "epoch": 2497} {"train_loss": -39.41352844238281, "global_step": 302217, "epoch": 2497} {"train_loss": -40.04499816894531, "global_step": 302218, "epoch": 2497} {"train_loss": -39.565895080566406, "global_step": 302219, "epoch": 2497} {"train_loss": -39.21200180053711, "global_step": 302220, "epoch": 2497} {"train_loss": -38.73857116699219, "global_step": 302221, "epoch": 2497} {"train_loss": -40.327762603759766, "global_step": 302222, "epoch": 2497} {"train_loss": -40.135223388671875, "global_step": 302223, "epoch": 2497} {"train_loss": -39.94710922241211, "global_step": 302224, "epoch": 2497} {"train_loss": -39.84299850463867, "global_step": 302225, "epoch": 2497} {"train_loss": -40.65369415283203, "global_step": 302226, "epoch": 2497} {"train_loss": -39.50480651855469, "global_step": 302227, "epoch": 2497} {"train_loss": -39.20302200317383, "global_step": 302228, "epoch": 2497} {"train_loss": -39.35493850708008, "global_step": 302229, "epoch": 2497} {"train_loss": -39.74043655395508, "global_step": 302230, "epoch": 2497} {"train_loss": -39.74959182739258, "global_step": 302231, "epoch": 2497} {"train_loss": -40.6496467590332, "global_step": 302232, "epoch": 2497} {"train_loss": -40.876373291015625, "global_step": 302233, "epoch": 2497} {"train_loss": -41.13105392456055, "global_step": 302234, "epoch": 2497} {"train_loss": -40.90983200073242, "global_step": 302235, "epoch": 2497} {"train_loss": -39.7130012512207, "global_step": 302236, "epoch": 2497} {"train_loss": -40.75144577026367, "global_step": 302237, "epoch": 2497} {"train_loss": -41.72752380371094, "global_step": 302238, "epoch": 2497} {"train_loss": -40.67499923706055, "global_step": 302239, "epoch": 2497} {"train_loss": -40.66753387451172, "global_step": 302240, "epoch": 2497} {"train_loss": -41.18265914916992, "global_step": 302241, "epoch": 2497} {"train_loss": -40.80950164794922, "global_step": 302242, "epoch": 2497} {"train_loss": -41.41381072998047, "global_step": 302243, "epoch": 2497} {"train_loss": -40.969398498535156, "global_step": 302244, "epoch": 2497} {"train_loss": -40.52911376953125, "global_step": 302245, "epoch": 2497} {"train_loss": -41.98507308959961, "global_step": 302246, "epoch": 2497} {"train_loss": -41.68511962890625, "global_step": 302247, "epoch": 2497} {"train_loss": -42.05111312866211, "global_step": 302248, "epoch": 2497} {"train_loss": -41.17490768432617, "global_step": 302249, "epoch": 2497} {"train_loss": -39.5021858215332, "global_step": 302250, "epoch": 2497} {"train_loss": -40.79054641723633, "global_step": 302251, "epoch": 2497} {"train_loss": -40.336219787597656, "global_step": 302252, "epoch": 2497} {"train_loss": -41.65537643432617, "global_step": 302253, "epoch": 2497} {"train_loss": -41.60775375366211, "global_step": 302254, "epoch": 2497} {"train_loss": -41.547508239746094, "global_step": 302255, "epoch": 2497} {"train_loss": -41.041202545166016, "global_step": 302256, "epoch": 2497} {"train_loss": -37.1280058297244, "global_step": 302257, "epoch": 2497, "val_loss": 2605210.25} {"train_loss": -41.42133331298828, "global_step": 302258, "epoch": 2498} {"train_loss": -41.7730712890625, "global_step": 302259, "epoch": 2498} {"train_loss": -41.082305908203125, "global_step": 302260, "epoch": 2498} {"train_loss": -41.09517288208008, "global_step": 302261, "epoch": 2498} {"train_loss": -41.43112564086914, "global_step": 302262, "epoch": 2498} {"train_loss": -41.59017562866211, "global_step": 302263, "epoch": 2498} {"train_loss": -41.52016830444336, "global_step": 302264, "epoch": 2498} {"train_loss": -42.30241394042969, "global_step": 302265, "epoch": 2498} {"train_loss": -42.037750244140625, "global_step": 302266, "epoch": 2498} {"train_loss": -41.69845199584961, "global_step": 302267, "epoch": 2498} {"train_loss": -42.72023391723633, "global_step": 302268, "epoch": 2498} {"train_loss": -42.110801696777344, "global_step": 302269, "epoch": 2498} {"train_loss": -42.459815979003906, "global_step": 302270, "epoch": 2498} {"train_loss": -41.11433792114258, "global_step": 302271, "epoch": 2498} {"train_loss": -41.79679489135742, "global_step": 302272, "epoch": 2498} {"train_loss": -41.70488357543945, "global_step": 302273, "epoch": 2498} {"train_loss": -41.920921325683594, "global_step": 302274, "epoch": 2498} {"train_loss": -42.169559478759766, "global_step": 302275, "epoch": 2498} {"train_loss": -42.57503128051758, "global_step": 302276, "epoch": 2498} {"train_loss": -42.0653190612793, "global_step": 302277, "epoch": 2498} {"train_loss": -41.99394989013672, "global_step": 302278, "epoch": 2498} {"train_loss": -41.9146842956543, "global_step": 302279, "epoch": 2498} {"train_loss": -42.21482467651367, "global_step": 302280, "epoch": 2498} {"train_loss": -42.25191116333008, "global_step": 302281, "epoch": 2498} {"train_loss": -41.955989837646484, "global_step": 302282, "epoch": 2498} {"train_loss": -41.81685256958008, "global_step": 302283, "epoch": 2498} {"train_loss": -42.19166564941406, "global_step": 302284, "epoch": 2498} {"train_loss": -41.75564956665039, "global_step": 302285, "epoch": 2498} {"train_loss": -41.89365768432617, "global_step": 302286, "epoch": 2498} {"train_loss": -41.904052734375, "global_step": 302287, "epoch": 2498} {"train_loss": -42.63277053833008, "global_step": 302288, "epoch": 2498} {"train_loss": -42.15118408203125, "global_step": 302289, "epoch": 2498} {"train_loss": -42.767982482910156, "global_step": 302290, "epoch": 2498} {"train_loss": -41.571319580078125, "global_step": 302291, "epoch": 2498} {"train_loss": -42.863094329833984, "global_step": 302292, "epoch": 2498} {"train_loss": -42.14306640625, "global_step": 302293, "epoch": 2498} {"train_loss": -42.3129997253418, "global_step": 302294, "epoch": 2498} {"train_loss": -43.09168243408203, "global_step": 302295, "epoch": 2498} {"train_loss": -42.47919464111328, "global_step": 302296, "epoch": 2498} {"train_loss": -42.213966369628906, "global_step": 302297, "epoch": 2498} {"train_loss": -43.356895446777344, "global_step": 302298, "epoch": 2498} {"train_loss": -42.351158142089844, "global_step": 302299, "epoch": 2498} {"train_loss": -41.96520233154297, "global_step": 302300, "epoch": 2498} {"train_loss": -42.501888275146484, "global_step": 302301, "epoch": 2498} {"train_loss": -42.87765121459961, "global_step": 302302, "epoch": 2498} {"train_loss": -41.86501693725586, "global_step": 302303, "epoch": 2498} {"train_loss": -41.24061584472656, "global_step": 302304, "epoch": 2498} {"train_loss": -38.1615104675293, "global_step": 302305, "epoch": 2498} {"train_loss": -39.162445068359375, "global_step": 302306, "epoch": 2498} {"train_loss": -42.27019119262695, "global_step": 302307, "epoch": 2498} {"train_loss": -40.7475700378418, "global_step": 302308, "epoch": 2498} {"train_loss": -38.221805572509766, "global_step": 302309, "epoch": 2498} {"train_loss": -39.12464141845703, "global_step": 302310, "epoch": 2498} {"train_loss": -43.40534591674805, "global_step": 302311, "epoch": 2498} {"train_loss": -39.20843505859375, "global_step": 302312, "epoch": 2498} {"train_loss": -37.4417610168457, "global_step": 302313, "epoch": 2498} {"train_loss": -42.831512451171875, "global_step": 302314, "epoch": 2498} {"train_loss": -38.1164665222168, "global_step": 302315, "epoch": 2498} {"train_loss": -39.54337692260742, "global_step": 302316, "epoch": 2498} {"train_loss": -42.28870391845703, "global_step": 302317, "epoch": 2498} {"train_loss": -40.355140686035156, "global_step": 302318, "epoch": 2498} {"train_loss": -42.08934020996094, "global_step": 302319, "epoch": 2498} {"train_loss": -39.375282287597656, "global_step": 302320, "epoch": 2498} {"train_loss": -41.00234603881836, "global_step": 302321, "epoch": 2498} {"train_loss": -41.976898193359375, "global_step": 302322, "epoch": 2498} {"train_loss": -40.77090072631836, "global_step": 302323, "epoch": 2498} {"train_loss": -42.49058151245117, "global_step": 302324, "epoch": 2498} {"train_loss": -40.56771469116211, "global_step": 302325, "epoch": 2498} {"train_loss": -42.45600128173828, "global_step": 302326, "epoch": 2498} {"train_loss": -41.1380729675293, "global_step": 302327, "epoch": 2498} {"train_loss": -42.3770637512207, "global_step": 302328, "epoch": 2498} {"train_loss": -41.953304290771484, "global_step": 302329, "epoch": 2498} {"train_loss": -42.547908782958984, "global_step": 302330, "epoch": 2498} {"train_loss": -41.494667053222656, "global_step": 302331, "epoch": 2498} {"train_loss": -42.75735855102539, "global_step": 302332, "epoch": 2498} {"train_loss": -41.969974517822266, "global_step": 302333, "epoch": 2498} {"train_loss": -41.514076232910156, "global_step": 302334, "epoch": 2498} {"train_loss": -41.49189758300781, "global_step": 302335, "epoch": 2498} {"train_loss": -41.76943588256836, "global_step": 302336, "epoch": 2498} {"train_loss": -42.8462028503418, "global_step": 302337, "epoch": 2498} {"train_loss": -42.05997848510742, "global_step": 302338, "epoch": 2498} {"train_loss": -41.15707015991211, "global_step": 302339, "epoch": 2498} {"train_loss": -41.94148635864258, "global_step": 302340, "epoch": 2498} {"train_loss": -42.5213737487793, "global_step": 302341, "epoch": 2498} {"train_loss": -42.10107421875, "global_step": 302342, "epoch": 2498} {"train_loss": -42.12305450439453, "global_step": 302343, "epoch": 2498} {"train_loss": -42.4129524230957, "global_step": 302344, "epoch": 2498} {"train_loss": -41.868412017822266, "global_step": 302345, "epoch": 2498} {"train_loss": -42.58095932006836, "global_step": 302346, "epoch": 2498} {"train_loss": -41.71934127807617, "global_step": 302347, "epoch": 2498} {"train_loss": -39.783294677734375, "global_step": 302348, "epoch": 2498} {"train_loss": -42.237831115722656, "global_step": 302349, "epoch": 2498} {"train_loss": -41.981689453125, "global_step": 302350, "epoch": 2498} {"train_loss": -42.17158889770508, "global_step": 302351, "epoch": 2498} {"train_loss": -41.634246826171875, "global_step": 302352, "epoch": 2498} {"train_loss": -43.162288665771484, "global_step": 302353, "epoch": 2498} {"train_loss": -40.78445053100586, "global_step": 302354, "epoch": 2498} {"train_loss": -40.465816497802734, "global_step": 302355, "epoch": 2498} {"train_loss": -41.830787658691406, "global_step": 302356, "epoch": 2498} {"train_loss": -42.052978515625, "global_step": 302357, "epoch": 2498} {"train_loss": -41.18427658081055, "global_step": 302358, "epoch": 2498} {"train_loss": -41.67928695678711, "global_step": 302359, "epoch": 2498} {"train_loss": -42.734527587890625, "global_step": 302360, "epoch": 2498} {"train_loss": -34.89548110961914, "global_step": 302361, "epoch": 2498} {"train_loss": -40.9929084777832, "global_step": 302362, "epoch": 2498} {"train_loss": -41.381771087646484, "global_step": 302363, "epoch": 2498} {"train_loss": -41.72658920288086, "global_step": 302364, "epoch": 2498} {"train_loss": -42.54128646850586, "global_step": 302365, "epoch": 2498} {"train_loss": -41.481876373291016, "global_step": 302366, "epoch": 2498} {"train_loss": -42.05696487426758, "global_step": 302367, "epoch": 2498} {"train_loss": -41.16718292236328, "global_step": 302368, "epoch": 2498} {"train_loss": -40.2651481628418, "global_step": 302369, "epoch": 2498} {"train_loss": -42.01813507080078, "global_step": 302370, "epoch": 2498} {"train_loss": -40.396461486816406, "global_step": 302371, "epoch": 2498} {"train_loss": -41.7534065246582, "global_step": 302372, "epoch": 2498} {"train_loss": -42.0461311340332, "global_step": 302373, "epoch": 2498} {"train_loss": -30.68181800842285, "global_step": 302374, "epoch": 2498} {"train_loss": -41.644439697265625, "global_step": 302375, "epoch": 2498} {"train_loss": -39.79852294921875, "global_step": 302376, "epoch": 2498} {"train_loss": -41.48225784301758, "global_step": 302377, "epoch": 2498} {"train_loss": -41.48909253522384, "global_step": 302378, "epoch": 2498, "val_loss": 2608717.0} {"train_loss": -41.97188949584961, "global_step": 302379, "epoch": 2499} {"train_loss": -42.32964324951172, "global_step": 302380, "epoch": 2499} {"train_loss": -42.02401351928711, "global_step": 302381, "epoch": 2499} {"train_loss": -42.01389694213867, "global_step": 302382, "epoch": 2499} {"train_loss": -41.89875030517578, "global_step": 302383, "epoch": 2499} {"train_loss": -41.412010192871094, "global_step": 302384, "epoch": 2499} {"train_loss": -40.699501037597656, "global_step": 302385, "epoch": 2499} {"train_loss": -41.76986312866211, "global_step": 302386, "epoch": 2499} {"train_loss": -41.941558837890625, "global_step": 302387, "epoch": 2499} {"train_loss": -42.9314079284668, "global_step": 302388, "epoch": 2499} {"train_loss": -42.748046875, "global_step": 302389, "epoch": 2499} {"train_loss": -42.78692626953125, "global_step": 302390, "epoch": 2499} {"train_loss": -41.8071174621582, "global_step": 302391, "epoch": 2499} {"train_loss": -42.34621047973633, "global_step": 302392, "epoch": 2499} {"train_loss": -42.670650482177734, "global_step": 302393, "epoch": 2499} {"train_loss": -41.49135208129883, "global_step": 302394, "epoch": 2499} {"train_loss": -41.481224060058594, "global_step": 302395, "epoch": 2499} {"train_loss": -41.18463897705078, "global_step": 302396, "epoch": 2499} {"train_loss": -42.221553802490234, "global_step": 302397, "epoch": 2499} {"train_loss": -42.137264251708984, "global_step": 302398, "epoch": 2499} {"train_loss": -41.97378921508789, "global_step": 302399, "epoch": 2499} {"train_loss": -42.8034782409668, "global_step": 302400, "epoch": 2499} {"train_loss": -42.5923957824707, "global_step": 302401, "epoch": 2499} {"train_loss": -42.978782653808594, "global_step": 302402, "epoch": 2499} {"train_loss": -42.05106735229492, "global_step": 302403, "epoch": 2499} {"train_loss": -41.833168029785156, "global_step": 302404, "epoch": 2499} {"train_loss": -42.37651443481445, "global_step": 302405, "epoch": 2499} {"train_loss": -42.111297607421875, "global_step": 302406, "epoch": 2499} {"train_loss": -40.988258361816406, "global_step": 302407, "epoch": 2499} {"train_loss": -39.25185012817383, "global_step": 302408, "epoch": 2499} {"train_loss": -41.27165985107422, "global_step": 302409, "epoch": 2499} {"train_loss": -42.01552200317383, "global_step": 302410, "epoch": 2499} {"train_loss": -41.894527435302734, "global_step": 302411, "epoch": 2499} {"train_loss": -42.89785385131836, "global_step": 302412, "epoch": 2499} {"train_loss": -42.399757385253906, "global_step": 302413, "epoch": 2499} {"train_loss": -42.34726333618164, "global_step": 302414, "epoch": 2499} {"train_loss": -42.55577850341797, "global_step": 302415, "epoch": 2499} {"train_loss": -42.98589324951172, "global_step": 302416, "epoch": 2499} {"train_loss": -41.576358795166016, "global_step": 302417, "epoch": 2499} {"train_loss": -41.37629318237305, "global_step": 302418, "epoch": 2499} {"train_loss": -42.44198226928711, "global_step": 302419, "epoch": 2499} {"train_loss": -41.52138137817383, "global_step": 302420, "epoch": 2499} {"train_loss": -40.773780822753906, "global_step": 302421, "epoch": 2499} {"train_loss": -42.46623992919922, "global_step": 302422, "epoch": 2499} {"train_loss": -41.6753044128418, "global_step": 302423, "epoch": 2499} {"train_loss": -41.38239669799805, "global_step": 302424, "epoch": 2499} {"train_loss": -42.3772087097168, "global_step": 302425, "epoch": 2499} {"train_loss": -41.38218307495117, "global_step": 302426, "epoch": 2499} {"train_loss": -41.53261184692383, "global_step": 302427, "epoch": 2499} {"train_loss": -40.591339111328125, "global_step": 302428, "epoch": 2499} {"train_loss": -41.2645149230957, "global_step": 302429, "epoch": 2499} {"train_loss": -41.20394515991211, "global_step": 302430, "epoch": 2499} {"train_loss": -40.42985534667969, "global_step": 302431, "epoch": 2499} {"train_loss": -41.98723220825195, "global_step": 302432, "epoch": 2499} {"train_loss": -42.54157638549805, "global_step": 302433, "epoch": 2499} {"train_loss": -42.08587646484375, "global_step": 302434, "epoch": 2499} {"train_loss": -33.592926025390625, "global_step": 302435, "epoch": 2499} {"train_loss": -42.21137237548828, "global_step": 302436, "epoch": 2499} {"train_loss": -41.73385238647461, "global_step": 302437, "epoch": 2499} {"train_loss": -42.653682708740234, "global_step": 302438, "epoch": 2499} {"train_loss": -42.972103118896484, "global_step": 302439, "epoch": 2499} {"train_loss": -39.178688049316406, "global_step": 302440, "epoch": 2499} {"train_loss": -40.90497589111328, "global_step": 302441, "epoch": 2499} {"train_loss": -40.15015411376953, "global_step": 302442, "epoch": 2499} {"train_loss": -37.134063720703125, "global_step": 302443, "epoch": 2499} {"train_loss": -40.36259078979492, "global_step": 302444, "epoch": 2499} {"train_loss": -40.478065490722656, "global_step": 302445, "epoch": 2499} {"train_loss": -29.350461959838867, "global_step": 302446, "epoch": 2499} {"train_loss": -39.86106491088867, "global_step": 302447, "epoch": 2499} {"train_loss": -40.394378662109375, "global_step": 302448, "epoch": 2499} {"train_loss": -39.47385025024414, "global_step": 302449, "epoch": 2499} {"train_loss": -40.8177604675293, "global_step": 302450, "epoch": 2499} {"train_loss": -39.939449310302734, "global_step": 302451, "epoch": 2499} {"train_loss": -41.139339447021484, "global_step": 302452, "epoch": 2499} {"train_loss": -37.35401153564453, "global_step": 302453, "epoch": 2499} {"train_loss": -39.77518844604492, "global_step": 302454, "epoch": 2499} {"train_loss": -41.544551849365234, "global_step": 302455, "epoch": 2499} {"train_loss": -40.187435150146484, "global_step": 302456, "epoch": 2499} {"train_loss": -39.93119430541992, "global_step": 302457, "epoch": 2499} {"train_loss": -41.1351203918457, "global_step": 302458, "epoch": 2499} {"train_loss": -38.14435577392578, "global_step": 302459, "epoch": 2499} {"train_loss": -41.52724075317383, "global_step": 302460, "epoch": 2499} {"train_loss": -40.59501647949219, "global_step": 302461, "epoch": 2499} {"train_loss": -38.166751861572266, "global_step": 302462, "epoch": 2499} {"train_loss": -42.112449645996094, "global_step": 302463, "epoch": 2499} {"train_loss": -39.75300216674805, "global_step": 302464, "epoch": 2499} {"train_loss": -39.93727493286133, "global_step": 302465, "epoch": 2499} {"train_loss": -41.5838508605957, "global_step": 302466, "epoch": 2499} {"train_loss": -37.99717712402344, "global_step": 302467, "epoch": 2499} {"train_loss": -41.63119888305664, "global_step": 302468, "epoch": 2499} {"train_loss": -41.14545822143555, "global_step": 302469, "epoch": 2499} {"train_loss": -38.839111328125, "global_step": 302470, "epoch": 2499} {"train_loss": -40.10551071166992, "global_step": 302471, "epoch": 2499} {"train_loss": -35.397315979003906, "global_step": 302472, "epoch": 2499} {"train_loss": -35.55707931518555, "global_step": 302473, "epoch": 2499} {"train_loss": -40.382320404052734, "global_step": 302474, "epoch": 2499} {"train_loss": -39.61872863769531, "global_step": 302475, "epoch": 2499} {"train_loss": -41.9412727355957, "global_step": 302476, "epoch": 2499} {"train_loss": -41.07748794555664, "global_step": 302477, "epoch": 2499} {"train_loss": -35.303070068359375, "global_step": 302478, "epoch": 2499} {"train_loss": -40.60245132446289, "global_step": 302479, "epoch": 2499} {"train_loss": -39.72683334350586, "global_step": 302480, "epoch": 2499} {"train_loss": -40.546932220458984, "global_step": 302481, "epoch": 2499} {"train_loss": -38.4246826171875, "global_step": 302482, "epoch": 2499} {"train_loss": -38.9417610168457, "global_step": 302483, "epoch": 2499} {"train_loss": -39.20643997192383, "global_step": 302484, "epoch": 2499} {"train_loss": -31.580503463745117, "global_step": 302485, "epoch": 2499} {"train_loss": -37.221519470214844, "global_step": 302486, "epoch": 2499} {"train_loss": -39.30892562866211, "global_step": 302487, "epoch": 2499} {"train_loss": -37.091697692871094, "global_step": 302488, "epoch": 2499} {"train_loss": -35.385433197021484, "global_step": 302489, "epoch": 2499} {"train_loss": -41.155426025390625, "global_step": 302490, "epoch": 2499} {"train_loss": -39.2119140625, "global_step": 302491, "epoch": 2499} {"train_loss": -41.27360916137695, "global_step": 302492, "epoch": 2499} {"train_loss": -38.43476486206055, "global_step": 302493, "epoch": 2499} {"train_loss": -41.43682861328125, "global_step": 302494, "epoch": 2499} {"train_loss": -39.93937301635742, "global_step": 302495, "epoch": 2499} {"train_loss": -40.36208724975586, "global_step": 302496, "epoch": 2499} {"train_loss": -39.79981994628906, "global_step": 302497, "epoch": 2499} {"train_loss": -40.617652893066406, "global_step": 302498, "epoch": 2499} {"train_loss": -40.56111069356115, "global_step": 302499, "epoch": 2499, "val_loss": 2607347.0} {"train_loss": -41.946388244628906, "global_step": 302500, "epoch": 2500} {"train_loss": -40.18328094482422, "global_step": 302501, "epoch": 2500} {"train_loss": -41.27250671386719, "global_step": 302502, "epoch": 2500} {"train_loss": -32.66524124145508, "global_step": 302503, "epoch": 2500} {"train_loss": -40.855690002441406, "global_step": 302504, "epoch": 2500} {"train_loss": -39.9906120300293, "global_step": 302505, "epoch": 2500} {"train_loss": -40.45612335205078, "global_step": 302506, "epoch": 2500} {"train_loss": -39.4436149597168, "global_step": 302507, "epoch": 2500} {"train_loss": -41.4421501159668, "global_step": 302508, "epoch": 2500} {"train_loss": -39.94451141357422, "global_step": 302509, "epoch": 2500} {"train_loss": -38.88813400268555, "global_step": 302510, "epoch": 2500} {"train_loss": -39.6832275390625, "global_step": 302511, "epoch": 2500} {"train_loss": -41.194515228271484, "global_step": 302512, "epoch": 2500} {"train_loss": -41.307472229003906, "global_step": 302513, "epoch": 2500} {"train_loss": -41.227115631103516, "global_step": 302514, "epoch": 2500} {"train_loss": -41.10326385498047, "global_step": 302515, "epoch": 2500} {"train_loss": -40.65708541870117, "global_step": 302516, "epoch": 2500} {"train_loss": -41.56195068359375, "global_step": 302517, "epoch": 2500} {"train_loss": -40.920467376708984, "global_step": 302518, "epoch": 2500} {"train_loss": -40.545448303222656, "global_step": 302519, "epoch": 2500} {"train_loss": -40.843292236328125, "global_step": 302520, "epoch": 2500} {"train_loss": -35.765220642089844, "global_step": 302521, "epoch": 2500} {"train_loss": -41.63216018676758, "global_step": 302522, "epoch": 2500} {"train_loss": -36.00886154174805, "global_step": 302523, "epoch": 2500} {"train_loss": -40.23777389526367, "global_step": 302524, "epoch": 2500} {"train_loss": -39.458980560302734, "global_step": 302525, "epoch": 2500} {"train_loss": -39.564598083496094, "global_step": 302526, "epoch": 2500} {"train_loss": -41.53778076171875, "global_step": 302527, "epoch": 2500} {"train_loss": -40.90564727783203, "global_step": 302528, "epoch": 2500} {"train_loss": -36.92841339111328, "global_step": 302529, "epoch": 2500} {"train_loss": -40.95869064331055, "global_step": 302530, "epoch": 2500} {"train_loss": -36.50325393676758, "global_step": 302531, "epoch": 2500} {"train_loss": -35.137508392333984, "global_step": 302532, "epoch": 2500} {"train_loss": -38.2110710144043, "global_step": 302533, "epoch": 2500} {"train_loss": -40.266109466552734, "global_step": 302534, "epoch": 2500} {"train_loss": -40.436580657958984, "global_step": 302535, "epoch": 2500} {"train_loss": -40.77604293823242, "global_step": 302536, "epoch": 2500} {"train_loss": -40.72805404663086, "global_step": 302537, "epoch": 2500} {"train_loss": -39.4188117980957, "global_step": 302538, "epoch": 2500} {"train_loss": -40.490108489990234, "global_step": 302539, "epoch": 2500} {"train_loss": -36.25103759765625, "global_step": 302540, "epoch": 2500} {"train_loss": -40.16695785522461, "global_step": 302541, "epoch": 2500} {"train_loss": -40.65127182006836, "global_step": 302542, "epoch": 2500} {"train_loss": -39.39225387573242, "global_step": 302543, "epoch": 2500} {"train_loss": -40.06989669799805, "global_step": 302544, "epoch": 2500} {"train_loss": -39.65715408325195, "global_step": 302545, "epoch": 2500} {"train_loss": -40.826576232910156, "global_step": 302546, "epoch": 2500} {"train_loss": -38.947628021240234, "global_step": 302547, "epoch": 2500} {"train_loss": -40.91667556762695, "global_step": 302548, "epoch": 2500} {"train_loss": -41.456058502197266, "global_step": 302549, "epoch": 2500} {"train_loss": -40.0040168762207, "global_step": 302550, "epoch": 2500} {"train_loss": -40.15255355834961, "global_step": 302551, "epoch": 2500} {"train_loss": -40.44148635864258, "global_step": 302552, "epoch": 2500} {"train_loss": -39.56904220581055, "global_step": 302553, "epoch": 2500} {"train_loss": -41.486602783203125, "global_step": 302554, "epoch": 2500} {"train_loss": -40.936458587646484, "global_step": 302555, "epoch": 2500} {"train_loss": -40.650367736816406, "global_step": 302556, "epoch": 2500} {"train_loss": -40.59111404418945, "global_step": 302557, "epoch": 2500} {"train_loss": -40.383583068847656, "global_step": 302558, "epoch": 2500} {"train_loss": -41.232112884521484, "global_step": 302559, "epoch": 2500} {"train_loss": -41.29179000854492, "global_step": 302560, "epoch": 2500} {"train_loss": -41.195831298828125, "global_step": 302561, "epoch": 2500} {"train_loss": -40.54787826538086, "global_step": 302562, "epoch": 2500} {"train_loss": -40.6595344543457, "global_step": 302563, "epoch": 2500} {"train_loss": -41.30799102783203, "global_step": 302564, "epoch": 2500} {"train_loss": -40.804405212402344, "global_step": 302565, "epoch": 2500} {"train_loss": -42.26747512817383, "global_step": 302566, "epoch": 2500} {"train_loss": -41.44624710083008, "global_step": 302567, "epoch": 2500} {"train_loss": -41.5572624206543, "global_step": 302568, "epoch": 2500} {"train_loss": -40.996177673339844, "global_step": 302569, "epoch": 2500} {"train_loss": -42.05198669433594, "global_step": 302570, "epoch": 2500} {"train_loss": -42.3004035949707, "global_step": 302571, "epoch": 2500} {"train_loss": -41.730499267578125, "global_step": 302572, "epoch": 2500} {"train_loss": -41.031463623046875, "global_step": 302573, "epoch": 2500} {"train_loss": -41.560157775878906, "global_step": 302574, "epoch": 2500} {"train_loss": -42.1840705871582, "global_step": 302575, "epoch": 2500} {"train_loss": -41.11651611328125, "global_step": 302576, "epoch": 2500} {"train_loss": -41.88312530517578, "global_step": 302577, "epoch": 2500} {"train_loss": -41.63625717163086, "global_step": 302578, "epoch": 2500} {"train_loss": -40.731327056884766, "global_step": 302579, "epoch": 2500} {"train_loss": -42.069580078125, "global_step": 302580, "epoch": 2500} {"train_loss": -42.36272048950195, "global_step": 302581, "epoch": 2500} {"train_loss": -40.3519401550293, "global_step": 302582, "epoch": 2500} {"train_loss": -41.63767623901367, "global_step": 302583, "epoch": 2500} {"train_loss": -41.47751998901367, "global_step": 302584, "epoch": 2500} {"train_loss": -41.3098258972168, "global_step": 302585, "epoch": 2500} {"train_loss": -41.60071563720703, "global_step": 302586, "epoch": 2500} {"train_loss": -42.34775924682617, "global_step": 302587, "epoch": 2500} {"train_loss": -41.57296371459961, "global_step": 302588, "epoch": 2500} {"train_loss": -40.578125, "global_step": 302589, "epoch": 2500} {"train_loss": -41.517234802246094, "global_step": 302590, "epoch": 2500} {"train_loss": -41.89045715332031, "global_step": 302591, "epoch": 2500} {"train_loss": -42.03056716918945, "global_step": 302592, "epoch": 2500} {"train_loss": -42.30103302001953, "global_step": 302593, "epoch": 2500} {"train_loss": -42.34101104736328, "global_step": 302594, "epoch": 2500} {"train_loss": -42.440887451171875, "global_step": 302595, "epoch": 2500} {"train_loss": -42.56698989868164, "global_step": 302596, "epoch": 2500} {"train_loss": -41.51715087890625, "global_step": 302597, "epoch": 2500} {"train_loss": -41.12356185913086, "global_step": 302598, "epoch": 2500} {"train_loss": -41.99338912963867, "global_step": 302599, "epoch": 2500} {"train_loss": -41.836639404296875, "global_step": 302600, "epoch": 2500} {"train_loss": -42.503135681152344, "global_step": 302601, "epoch": 2500} {"train_loss": -42.44124984741211, "global_step": 302602, "epoch": 2500} {"train_loss": -42.34333419799805, "global_step": 302603, "epoch": 2500} {"train_loss": -42.952091217041016, "global_step": 302604, "epoch": 2500} {"train_loss": -40.967384338378906, "global_step": 302605, "epoch": 2500} {"train_loss": -42.150325775146484, "global_step": 302606, "epoch": 2500} {"train_loss": -41.425933837890625, "global_step": 302607, "epoch": 2500} {"train_loss": -42.5495491027832, "global_step": 302608, "epoch": 2500} {"train_loss": -41.99836349487305, "global_step": 302609, "epoch": 2500} {"train_loss": -41.95988082885742, "global_step": 302610, "epoch": 2500} {"train_loss": -41.88806915283203, "global_step": 302611, "epoch": 2500} {"train_loss": -42.3122673034668, "global_step": 302612, "epoch": 2500} {"train_loss": -41.66379928588867, "global_step": 302613, "epoch": 2500} {"train_loss": -41.91323471069336, "global_step": 302614, "epoch": 2500} {"train_loss": -43.15407943725586, "global_step": 302615, "epoch": 2500} {"train_loss": -41.354801177978516, "global_step": 302616, "epoch": 2500} {"train_loss": -42.25590133666992, "global_step": 302617, "epoch": 2500} {"train_loss": -42.02814865112305, "global_step": 302618, "epoch": 2500} {"train_loss": -41.97170639038086, "global_step": 302619, "epoch": 2500} {"train_loss": -40.841360170979144, "global_step": 302620, "epoch": 2500, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2461408.75} {"train_loss": -42.505615234375, "global_step": 302621, "epoch": 2501} {"train_loss": -42.507816314697266, "global_step": 302622, "epoch": 2501} {"train_loss": -42.23931884765625, "global_step": 302623, "epoch": 2501} {"train_loss": -41.74132537841797, "global_step": 302624, "epoch": 2501} {"train_loss": -41.09482955932617, "global_step": 302625, "epoch": 2501} {"train_loss": -41.6292610168457, "global_step": 302626, "epoch": 2501} {"train_loss": -42.71798324584961, "global_step": 302627, "epoch": 2501} {"train_loss": -41.54631423950195, "global_step": 302628, "epoch": 2501} {"train_loss": -40.18035125732422, "global_step": 302629, "epoch": 2501} {"train_loss": -39.963687896728516, "global_step": 302630, "epoch": 2501} {"train_loss": -42.563594818115234, "global_step": 302631, "epoch": 2501} {"train_loss": -41.40412139892578, "global_step": 302632, "epoch": 2501} {"train_loss": -41.96755599975586, "global_step": 302633, "epoch": 2501} {"train_loss": -42.001869201660156, "global_step": 302634, "epoch": 2501} {"train_loss": -42.36150360107422, "global_step": 302635, "epoch": 2501} {"train_loss": -42.96073913574219, "global_step": 302636, "epoch": 2501} {"train_loss": -41.66505813598633, "global_step": 302637, "epoch": 2501} {"train_loss": -41.95391082763672, "global_step": 302638, "epoch": 2501} {"train_loss": -42.45429229736328, "global_step": 302639, "epoch": 2501} {"train_loss": -39.316810607910156, "global_step": 302640, "epoch": 2501} {"train_loss": -41.566383361816406, "global_step": 302641, "epoch": 2501} {"train_loss": -40.50362014770508, "global_step": 302642, "epoch": 2501} {"train_loss": -39.86257553100586, "global_step": 302643, "epoch": 2501} {"train_loss": -41.37122344970703, "global_step": 302644, "epoch": 2501} {"train_loss": -42.76668930053711, "global_step": 302645, "epoch": 2501} {"train_loss": -42.5214958190918, "global_step": 302646, "epoch": 2501} {"train_loss": -41.5141716003418, "global_step": 302647, "epoch": 2501} {"train_loss": -36.76297378540039, "global_step": 302648, "epoch": 2501} {"train_loss": -42.14966583251953, "global_step": 302649, "epoch": 2501} {"train_loss": -40.62931442260742, "global_step": 302650, "epoch": 2501} {"train_loss": -40.34843063354492, "global_step": 302651, "epoch": 2501} {"train_loss": -42.13014602661133, "global_step": 302652, "epoch": 2501} {"train_loss": -41.153602600097656, "global_step": 302653, "epoch": 2501} {"train_loss": -41.44370651245117, "global_step": 302654, "epoch": 2501} {"train_loss": -42.18962860107422, "global_step": 302655, "epoch": 2501} {"train_loss": -38.559261322021484, "global_step": 302656, "epoch": 2501} {"train_loss": -31.789026260375977, "global_step": 302657, "epoch": 2501} {"train_loss": -40.02616500854492, "global_step": 302658, "epoch": 2501} {"train_loss": -41.970699310302734, "global_step": 302659, "epoch": 2501} {"train_loss": -41.0450553894043, "global_step": 302660, "epoch": 2501} {"train_loss": -41.475467681884766, "global_step": 302661, "epoch": 2501} {"train_loss": -38.7762451171875, "global_step": 302662, "epoch": 2501} {"train_loss": -41.662933349609375, "global_step": 302663, "epoch": 2501} {"train_loss": -41.705589294433594, "global_step": 302664, "epoch": 2501} {"train_loss": -40.956642150878906, "global_step": 302665, "epoch": 2501} {"train_loss": -41.738189697265625, "global_step": 302666, "epoch": 2501} {"train_loss": -41.41957092285156, "global_step": 302667, "epoch": 2501} {"train_loss": -42.32129669189453, "global_step": 302668, "epoch": 2501} {"train_loss": -42.11076736450195, "global_step": 302669, "epoch": 2501} {"train_loss": -41.62562561035156, "global_step": 302670, "epoch": 2501} {"train_loss": -42.13665771484375, "global_step": 302671, "epoch": 2501} {"train_loss": -41.7976188659668, "global_step": 302672, "epoch": 2501} {"train_loss": -42.135616302490234, "global_step": 302673, "epoch": 2501} {"train_loss": -39.563907623291016, "global_step": 302674, "epoch": 2501} {"train_loss": -41.51142501831055, "global_step": 302675, "epoch": 2501} {"train_loss": -41.15620803833008, "global_step": 302676, "epoch": 2501} {"train_loss": -41.23287582397461, "global_step": 302677, "epoch": 2501} {"train_loss": -42.25672149658203, "global_step": 302678, "epoch": 2501} {"train_loss": -41.9207878112793, "global_step": 302679, "epoch": 2501} {"train_loss": -40.584571838378906, "global_step": 302680, "epoch": 2501} {"train_loss": -41.68365478515625, "global_step": 302681, "epoch": 2501} {"train_loss": -41.877784729003906, "global_step": 302682, "epoch": 2501} {"train_loss": -41.849491119384766, "global_step": 302683, "epoch": 2501} {"train_loss": -41.775814056396484, "global_step": 302684, "epoch": 2501} {"train_loss": -41.466087341308594, "global_step": 302685, "epoch": 2501} {"train_loss": -42.13153076171875, "global_step": 302686, "epoch": 2501} {"train_loss": -41.365787506103516, "global_step": 302687, "epoch": 2501} {"train_loss": -41.590030670166016, "global_step": 302688, "epoch": 2501} {"train_loss": -42.05103302001953, "global_step": 302689, "epoch": 2501} {"train_loss": -41.4772834777832, "global_step": 302690, "epoch": 2501} {"train_loss": -41.469276428222656, "global_step": 302691, "epoch": 2501} {"train_loss": -41.76625442504883, "global_step": 302692, "epoch": 2501} {"train_loss": -41.642818450927734, "global_step": 302693, "epoch": 2501} {"train_loss": -41.19948959350586, "global_step": 302694, "epoch": 2501} {"train_loss": -42.54698944091797, "global_step": 302695, "epoch": 2501} {"train_loss": -42.532867431640625, "global_step": 302696, "epoch": 2501} {"train_loss": -42.54475021362305, "global_step": 302697, "epoch": 2501} {"train_loss": -41.967926025390625, "global_step": 302698, "epoch": 2501} {"train_loss": -42.33942794799805, "global_step": 302699, "epoch": 2501} {"train_loss": -41.8484001159668, "global_step": 302700, "epoch": 2501} {"train_loss": -43.22682571411133, "global_step": 302701, "epoch": 2501} {"train_loss": -42.12097930908203, "global_step": 302702, "epoch": 2501} {"train_loss": -42.13667678833008, "global_step": 302703, "epoch": 2501} {"train_loss": -40.12722396850586, "global_step": 302704, "epoch": 2501} {"train_loss": -42.848365783691406, "global_step": 302705, "epoch": 2501} {"train_loss": -42.65607452392578, "global_step": 302706, "epoch": 2501} {"train_loss": -42.57677459716797, "global_step": 302707, "epoch": 2501} {"train_loss": -43.040584564208984, "global_step": 302708, "epoch": 2501} {"train_loss": -42.04726791381836, "global_step": 302709, "epoch": 2501} {"train_loss": -42.44486618041992, "global_step": 302710, "epoch": 2501} {"train_loss": -42.50202178955078, "global_step": 302711, "epoch": 2501} {"train_loss": -42.45256423950195, "global_step": 302712, "epoch": 2501} {"train_loss": -42.17544174194336, "global_step": 302713, "epoch": 2501} {"train_loss": -41.30802536010742, "global_step": 302714, "epoch": 2501} {"train_loss": -43.03092575073242, "global_step": 302715, "epoch": 2501} {"train_loss": -42.4384651184082, "global_step": 302716, "epoch": 2501} {"train_loss": -42.05802536010742, "global_step": 302717, "epoch": 2501} {"train_loss": -42.67897415161133, "global_step": 302718, "epoch": 2501} {"train_loss": -43.12349319458008, "global_step": 302719, "epoch": 2501} {"train_loss": -42.65407180786133, "global_step": 302720, "epoch": 2501} {"train_loss": -42.902008056640625, "global_step": 302721, "epoch": 2501} {"train_loss": -42.72389602661133, "global_step": 302722, "epoch": 2501} {"train_loss": -42.954036712646484, "global_step": 302723, "epoch": 2501} {"train_loss": -42.60184860229492, "global_step": 302724, "epoch": 2501} {"train_loss": -43.391822814941406, "global_step": 302725, "epoch": 2501} {"train_loss": -42.41729736328125, "global_step": 302726, "epoch": 2501} {"train_loss": -42.464622497558594, "global_step": 302727, "epoch": 2501} {"train_loss": -43.285011291503906, "global_step": 302728, "epoch": 2501} {"train_loss": -42.8499641418457, "global_step": 302729, "epoch": 2501} {"train_loss": -43.316627502441406, "global_step": 302730, "epoch": 2501} {"train_loss": -43.576087951660156, "global_step": 302731, "epoch": 2501} {"train_loss": -43.7601432800293, "global_step": 302732, "epoch": 2501} {"train_loss": -42.78798294067383, "global_step": 302733, "epoch": 2501} {"train_loss": -42.84409713745117, "global_step": 302734, "epoch": 2501} {"train_loss": -43.61967086791992, "global_step": 302735, "epoch": 2501} {"train_loss": -43.75647735595703, "global_step": 302736, "epoch": 2501} {"train_loss": -43.2062873840332, "global_step": 302737, "epoch": 2501} {"train_loss": -42.951412200927734, "global_step": 302738, "epoch": 2501} {"train_loss": -43.00225830078125, "global_step": 302739, "epoch": 2501} {"train_loss": -43.73274230957031, "global_step": 302740, "epoch": 2501} {"train_loss": -41.84389078124496, "global_step": 302741, "epoch": 2501, "val_loss": 2457333.25} {"train_loss": -43.650001525878906, "global_step": 302742, "epoch": 2502} {"train_loss": -43.13003158569336, "global_step": 302743, "epoch": 2502} {"train_loss": -42.94597244262695, "global_step": 302744, "epoch": 2502} {"train_loss": -43.29987716674805, "global_step": 302745, "epoch": 2502} {"train_loss": -41.1136589050293, "global_step": 302746, "epoch": 2502} {"train_loss": -43.4605827331543, "global_step": 302747, "epoch": 2502} {"train_loss": -43.932281494140625, "global_step": 302748, "epoch": 2502} {"train_loss": -42.744606018066406, "global_step": 302749, "epoch": 2502} {"train_loss": -43.11863708496094, "global_step": 302750, "epoch": 2502} {"train_loss": -42.328773498535156, "global_step": 302751, "epoch": 2502} {"train_loss": -40.103851318359375, "global_step": 302752, "epoch": 2502} {"train_loss": -31.281919479370117, "global_step": 302753, "epoch": 2502} {"train_loss": -16.28535270690918, "global_step": 302754, "epoch": 2502} {"train_loss": -19.805112838745117, "global_step": 302755, "epoch": 2502} {"train_loss": -40.83466339111328, "global_step": 302756, "epoch": 2502} {"train_loss": -25.466482162475586, "global_step": 302757, "epoch": 2502} {"train_loss": -32.21620559692383, "global_step": 302758, "epoch": 2502} {"train_loss": -39.480350494384766, "global_step": 302759, "epoch": 2502} {"train_loss": -32.142051696777344, "global_step": 302760, "epoch": 2502} {"train_loss": -41.596214294433594, "global_step": 302761, "epoch": 2502} {"train_loss": -32.38208770751953, "global_step": 302762, "epoch": 2502} {"train_loss": -37.68016815185547, "global_step": 302763, "epoch": 2502} {"train_loss": -34.3982048034668, "global_step": 302764, "epoch": 2502} {"train_loss": -38.52083969116211, "global_step": 302765, "epoch": 2502} {"train_loss": -36.11615753173828, "global_step": 302766, "epoch": 2502} {"train_loss": -40.2752799987793, "global_step": 302767, "epoch": 2502} {"train_loss": -36.77232360839844, "global_step": 302768, "epoch": 2502} {"train_loss": -38.86983871459961, "global_step": 302769, "epoch": 2502} {"train_loss": -40.18592071533203, "global_step": 302770, "epoch": 2502} {"train_loss": -37.346473693847656, "global_step": 302771, "epoch": 2502} {"train_loss": -40.88663864135742, "global_step": 302772, "epoch": 2502} {"train_loss": -39.358219146728516, "global_step": 302773, "epoch": 2502} {"train_loss": -39.676429748535156, "global_step": 302774, "epoch": 2502} {"train_loss": -40.598567962646484, "global_step": 302775, "epoch": 2502} {"train_loss": -40.14502716064453, "global_step": 302776, "epoch": 2502} {"train_loss": -41.171409606933594, "global_step": 302777, "epoch": 2502} {"train_loss": -38.96870803833008, "global_step": 302778, "epoch": 2502} {"train_loss": -41.532283782958984, "global_step": 302779, "epoch": 2502} {"train_loss": -40.396968841552734, "global_step": 302780, "epoch": 2502} {"train_loss": -40.167869567871094, "global_step": 302781, "epoch": 2502} {"train_loss": -41.0013313293457, "global_step": 302782, "epoch": 2502} {"train_loss": -41.703853607177734, "global_step": 302783, "epoch": 2502} {"train_loss": -40.92837142944336, "global_step": 302784, "epoch": 2502} {"train_loss": -41.30082702636719, "global_step": 302785, "epoch": 2502} {"train_loss": -41.861270904541016, "global_step": 302786, "epoch": 2502} {"train_loss": -41.6533088684082, "global_step": 302787, "epoch": 2502} {"train_loss": -41.31804275512695, "global_step": 302788, "epoch": 2502} {"train_loss": -40.55418014526367, "global_step": 302789, "epoch": 2502} {"train_loss": -41.36669158935547, "global_step": 302790, "epoch": 2502} {"train_loss": -41.550106048583984, "global_step": 302791, "epoch": 2502} {"train_loss": -41.39990997314453, "global_step": 302792, "epoch": 2502} {"train_loss": -41.85002899169922, "global_step": 302793, "epoch": 2502} {"train_loss": -41.52988815307617, "global_step": 302794, "epoch": 2502} {"train_loss": -41.51491165161133, "global_step": 302795, "epoch": 2502} {"train_loss": -41.700172424316406, "global_step": 302796, "epoch": 2502} {"train_loss": -42.163875579833984, "global_step": 302797, "epoch": 2502} {"train_loss": -41.94038009643555, "global_step": 302798, "epoch": 2502} {"train_loss": -41.68750762939453, "global_step": 302799, "epoch": 2502} {"train_loss": -42.3488883972168, "global_step": 302800, "epoch": 2502} {"train_loss": -42.73258590698242, "global_step": 302801, "epoch": 2502} {"train_loss": -42.653926849365234, "global_step": 302802, "epoch": 2502} {"train_loss": -41.8887825012207, "global_step": 302803, "epoch": 2502} {"train_loss": -42.50189971923828, "global_step": 302804, "epoch": 2502} {"train_loss": -42.40412139892578, "global_step": 302805, "epoch": 2502} {"train_loss": -42.525997161865234, "global_step": 302806, "epoch": 2502} {"train_loss": -42.868282318115234, "global_step": 302807, "epoch": 2502} {"train_loss": -42.69776153564453, "global_step": 302808, "epoch": 2502} {"train_loss": -42.96309280395508, "global_step": 302809, "epoch": 2502} {"train_loss": -42.57218551635742, "global_step": 302810, "epoch": 2502} {"train_loss": -43.11196517944336, "global_step": 302811, "epoch": 2502} {"train_loss": -42.792972564697266, "global_step": 302812, "epoch": 2502} {"train_loss": -43.0139274597168, "global_step": 302813, "epoch": 2502} {"train_loss": -42.82978820800781, "global_step": 302814, "epoch": 2502} {"train_loss": -42.68915939331055, "global_step": 302815, "epoch": 2502} {"train_loss": -42.7149772644043, "global_step": 302816, "epoch": 2502} {"train_loss": -42.06658935546875, "global_step": 302817, "epoch": 2502} {"train_loss": -43.20392608642578, "global_step": 302818, "epoch": 2502} {"train_loss": -43.03072738647461, "global_step": 302819, "epoch": 2502} {"train_loss": -43.206886291503906, "global_step": 302820, "epoch": 2502} {"train_loss": -43.3532600402832, "global_step": 302821, "epoch": 2502} {"train_loss": -43.12010955810547, "global_step": 302822, "epoch": 2502} {"train_loss": -43.37763595581055, "global_step": 302823, "epoch": 2502} {"train_loss": -42.99619674682617, "global_step": 302824, "epoch": 2502} {"train_loss": -42.94868469238281, "global_step": 302825, "epoch": 2502} {"train_loss": -43.3223876953125, "global_step": 302826, "epoch": 2502} {"train_loss": -43.1635856628418, "global_step": 302827, "epoch": 2502} {"train_loss": -43.599952697753906, "global_step": 302828, "epoch": 2502} {"train_loss": -42.76993942260742, "global_step": 302829, "epoch": 2502} {"train_loss": -43.966041564941406, "global_step": 302830, "epoch": 2502} {"train_loss": -42.66690444946289, "global_step": 302831, "epoch": 2502} {"train_loss": -43.17586898803711, "global_step": 302832, "epoch": 2502} {"train_loss": -43.37385940551758, "global_step": 302833, "epoch": 2502} {"train_loss": -43.51923370361328, "global_step": 302834, "epoch": 2502} {"train_loss": -43.42094039916992, "global_step": 302835, "epoch": 2502} {"train_loss": -43.34239959716797, "global_step": 302836, "epoch": 2502} {"train_loss": -43.29767990112305, "global_step": 302837, "epoch": 2502} {"train_loss": -43.56998825073242, "global_step": 302838, "epoch": 2502} {"train_loss": -43.553096771240234, "global_step": 302839, "epoch": 2502} {"train_loss": -43.47028732299805, "global_step": 302840, "epoch": 2502} {"train_loss": -43.66209030151367, "global_step": 302841, "epoch": 2502} {"train_loss": -43.56772994995117, "global_step": 302842, "epoch": 2502} {"train_loss": -43.428009033203125, "global_step": 302843, "epoch": 2502} {"train_loss": -43.879329681396484, "global_step": 302844, "epoch": 2502} {"train_loss": -43.18056869506836, "global_step": 302845, "epoch": 2502} {"train_loss": -43.944068908691406, "global_step": 302846, "epoch": 2502} {"train_loss": -43.27445602416992, "global_step": 302847, "epoch": 2502} {"train_loss": -43.622859954833984, "global_step": 302848, "epoch": 2502} {"train_loss": -44.05613708496094, "global_step": 302849, "epoch": 2502} {"train_loss": -43.629207611083984, "global_step": 302850, "epoch": 2502} {"train_loss": -43.780494689941406, "global_step": 302851, "epoch": 2502} {"train_loss": -43.602752685546875, "global_step": 302852, "epoch": 2502} {"train_loss": -43.86845016479492, "global_step": 302853, "epoch": 2502} {"train_loss": -43.78020095825195, "global_step": 302854, "epoch": 2502} {"train_loss": -43.197975158691406, "global_step": 302855, "epoch": 2502} {"train_loss": -43.740718841552734, "global_step": 302856, "epoch": 2502} {"train_loss": -43.4498176574707, "global_step": 302857, "epoch": 2502} {"train_loss": -43.131343841552734, "global_step": 302858, "epoch": 2502} {"train_loss": -42.2467041015625, "global_step": 302859, "epoch": 2502} {"train_loss": -40.506404876708984, "global_step": 302860, "epoch": 2502} {"train_loss": -37.510677337646484, "global_step": 302861, "epoch": 2502} {"train_loss": -41.10460246693004, "global_step": 302862, "epoch": 2502, "val_loss": 2562547.75} {"train_loss": -31.731672286987305, "global_step": 302863, "epoch": 2503} {"train_loss": -37.22285079956055, "global_step": 302864, "epoch": 2503} {"train_loss": -42.46710205078125, "global_step": 302865, "epoch": 2503} {"train_loss": -39.42133331298828, "global_step": 302866, "epoch": 2503} {"train_loss": -41.15758514404297, "global_step": 302867, "epoch": 2503} {"train_loss": -40.46954345703125, "global_step": 302868, "epoch": 2503} {"train_loss": -39.894893646240234, "global_step": 302869, "epoch": 2503} {"train_loss": -40.955726623535156, "global_step": 302870, "epoch": 2503} {"train_loss": -37.69356918334961, "global_step": 302871, "epoch": 2503} {"train_loss": -41.36628341674805, "global_step": 302872, "epoch": 2503} {"train_loss": -37.952754974365234, "global_step": 302873, "epoch": 2503} {"train_loss": -41.2666130065918, "global_step": 302874, "epoch": 2503} {"train_loss": -39.74188995361328, "global_step": 302875, "epoch": 2503} {"train_loss": -40.956451416015625, "global_step": 302876, "epoch": 2503} {"train_loss": -40.57326126098633, "global_step": 302877, "epoch": 2503} {"train_loss": -39.69974899291992, "global_step": 302878, "epoch": 2503} {"train_loss": -41.62903594970703, "global_step": 302879, "epoch": 2503} {"train_loss": -39.60012435913086, "global_step": 302880, "epoch": 2503} {"train_loss": -40.543434143066406, "global_step": 302881, "epoch": 2503} {"train_loss": -39.991024017333984, "global_step": 302882, "epoch": 2503} {"train_loss": -41.37284469604492, "global_step": 302883, "epoch": 2503} {"train_loss": -41.57462692260742, "global_step": 302884, "epoch": 2503} {"train_loss": -41.2419319152832, "global_step": 302885, "epoch": 2503} {"train_loss": -42.346405029296875, "global_step": 302886, "epoch": 2503} {"train_loss": -41.1428108215332, "global_step": 302887, "epoch": 2503} {"train_loss": -41.63032913208008, "global_step": 302888, "epoch": 2503} {"train_loss": -41.75562286376953, "global_step": 302889, "epoch": 2503} {"train_loss": -41.17463684082031, "global_step": 302890, "epoch": 2503} {"train_loss": -41.8503532409668, "global_step": 302891, "epoch": 2503} {"train_loss": -42.40070724487305, "global_step": 302892, "epoch": 2503} {"train_loss": -42.18628692626953, "global_step": 302893, "epoch": 2503} {"train_loss": -42.209293365478516, "global_step": 302894, "epoch": 2503} {"train_loss": -41.9755973815918, "global_step": 302895, "epoch": 2503} {"train_loss": -42.565185546875, "global_step": 302896, "epoch": 2503} {"train_loss": -41.43994903564453, "global_step": 302897, "epoch": 2503} {"train_loss": -42.81395721435547, "global_step": 302898, "epoch": 2503} {"train_loss": -42.098506927490234, "global_step": 302899, "epoch": 2503} {"train_loss": -42.75459671020508, "global_step": 302900, "epoch": 2503} {"train_loss": -42.62347412109375, "global_step": 302901, "epoch": 2503} {"train_loss": -42.33980941772461, "global_step": 302902, "epoch": 2503} {"train_loss": -41.998016357421875, "global_step": 302903, "epoch": 2503} {"train_loss": -42.538063049316406, "global_step": 302904, "epoch": 2503} {"train_loss": -43.44584274291992, "global_step": 302905, "epoch": 2503} {"train_loss": -43.18327713012695, "global_step": 302906, "epoch": 2503} {"train_loss": -42.660850524902344, "global_step": 302907, "epoch": 2503} {"train_loss": -42.52737808227539, "global_step": 302908, "epoch": 2503} {"train_loss": -42.70161056518555, "global_step": 302909, "epoch": 2503} {"train_loss": -42.40237808227539, "global_step": 302910, "epoch": 2503} {"train_loss": -43.17637252807617, "global_step": 302911, "epoch": 2503} {"train_loss": -42.72052764892578, "global_step": 302912, "epoch": 2503} {"train_loss": -42.918601989746094, "global_step": 302913, "epoch": 2503} {"train_loss": -43.417789459228516, "global_step": 302914, "epoch": 2503} {"train_loss": -42.964168548583984, "global_step": 302915, "epoch": 2503} {"train_loss": -43.05429458618164, "global_step": 302916, "epoch": 2503} {"train_loss": -43.19847106933594, "global_step": 302917, "epoch": 2503} {"train_loss": -43.025665283203125, "global_step": 302918, "epoch": 2503} {"train_loss": -43.44074630737305, "global_step": 302919, "epoch": 2503} {"train_loss": -43.00590896606445, "global_step": 302920, "epoch": 2503} {"train_loss": -43.330631256103516, "global_step": 302921, "epoch": 2503} {"train_loss": -43.43854904174805, "global_step": 302922, "epoch": 2503} {"train_loss": -43.19249725341797, "global_step": 302923, "epoch": 2503} {"train_loss": -43.098445892333984, "global_step": 302924, "epoch": 2503} {"train_loss": -43.47644805908203, "global_step": 302925, "epoch": 2503} {"train_loss": -42.9821662902832, "global_step": 302926, "epoch": 2503} {"train_loss": -43.129154205322266, "global_step": 302927, "epoch": 2503} {"train_loss": -43.58618927001953, "global_step": 302928, "epoch": 2503} {"train_loss": -42.975791931152344, "global_step": 302929, "epoch": 2503} {"train_loss": -43.961944580078125, "global_step": 302930, "epoch": 2503} {"train_loss": -42.80057907104492, "global_step": 302931, "epoch": 2503} {"train_loss": -43.30583953857422, "global_step": 302932, "epoch": 2503} {"train_loss": -43.079349517822266, "global_step": 302933, "epoch": 2503} {"train_loss": -42.872135162353516, "global_step": 302934, "epoch": 2503} {"train_loss": -43.491249084472656, "global_step": 302935, "epoch": 2503} {"train_loss": -43.2657470703125, "global_step": 302936, "epoch": 2503} {"train_loss": -43.37314987182617, "global_step": 302937, "epoch": 2503} {"train_loss": -43.30735778808594, "global_step": 302938, "epoch": 2503} {"train_loss": -43.3052864074707, "global_step": 302939, "epoch": 2503} {"train_loss": -43.57057571411133, "global_step": 302940, "epoch": 2503} {"train_loss": -44.050559997558594, "global_step": 302941, "epoch": 2503} {"train_loss": -43.45621109008789, "global_step": 302942, "epoch": 2503} {"train_loss": -43.34228515625, "global_step": 302943, "epoch": 2503} {"train_loss": -43.66045379638672, "global_step": 302944, "epoch": 2503} {"train_loss": -43.85620880126953, "global_step": 302945, "epoch": 2503} {"train_loss": -43.01239776611328, "global_step": 302946, "epoch": 2503} {"train_loss": -43.78668975830078, "global_step": 302947, "epoch": 2503} {"train_loss": -43.42463302612305, "global_step": 302948, "epoch": 2503} {"train_loss": -43.539669036865234, "global_step": 302949, "epoch": 2503} {"train_loss": -41.77250289916992, "global_step": 302950, "epoch": 2503} {"train_loss": -43.76960754394531, "global_step": 302951, "epoch": 2503} {"train_loss": -43.92647933959961, "global_step": 302952, "epoch": 2503} {"train_loss": -44.305519104003906, "global_step": 302953, "epoch": 2503} {"train_loss": -43.68284225463867, "global_step": 302954, "epoch": 2503} {"train_loss": -43.561981201171875, "global_step": 302955, "epoch": 2503} {"train_loss": -43.420223236083984, "global_step": 302956, "epoch": 2503} {"train_loss": -44.08359146118164, "global_step": 302957, "epoch": 2503} {"train_loss": -43.31212615966797, "global_step": 302958, "epoch": 2503} {"train_loss": -43.024234771728516, "global_step": 302959, "epoch": 2503} {"train_loss": -44.21603012084961, "global_step": 302960, "epoch": 2503} {"train_loss": -43.88044357299805, "global_step": 302961, "epoch": 2503} {"train_loss": -42.6583251953125, "global_step": 302962, "epoch": 2503} {"train_loss": -42.238121032714844, "global_step": 302963, "epoch": 2503} {"train_loss": -42.32215118408203, "global_step": 302964, "epoch": 2503} {"train_loss": -44.083831787109375, "global_step": 302965, "epoch": 2503} {"train_loss": -44.15584182739258, "global_step": 302966, "epoch": 2503} {"train_loss": -43.031768798828125, "global_step": 302967, "epoch": 2503} {"train_loss": -43.21096420288086, "global_step": 302968, "epoch": 2503} {"train_loss": -42.87215805053711, "global_step": 302969, "epoch": 2503} {"train_loss": -44.06565475463867, "global_step": 302970, "epoch": 2503} {"train_loss": -42.90309143066406, "global_step": 302971, "epoch": 2503} {"train_loss": -42.30961990356445, "global_step": 302972, "epoch": 2503} {"train_loss": -43.37131118774414, "global_step": 302973, "epoch": 2503} {"train_loss": -42.9638786315918, "global_step": 302974, "epoch": 2503} {"train_loss": -40.850852966308594, "global_step": 302975, "epoch": 2503} {"train_loss": -41.54409408569336, "global_step": 302976, "epoch": 2503} {"train_loss": -43.38854217529297, "global_step": 302977, "epoch": 2503} {"train_loss": -41.0463752746582, "global_step": 302978, "epoch": 2503} {"train_loss": -40.9015998840332, "global_step": 302979, "epoch": 2503} {"train_loss": -42.74786376953125, "global_step": 302980, "epoch": 2503} {"train_loss": -40.842403411865234, "global_step": 302981, "epoch": 2503} {"train_loss": -38.799591064453125, "global_step": 302982, "epoch": 2503} {"train_loss": -42.308370464104264, "global_step": 302983, "epoch": 2503, "val_loss": 2580301.0} {"train_loss": -40.98146438598633, "global_step": 302984, "epoch": 2504} {"train_loss": -40.63316345214844, "global_step": 302985, "epoch": 2504} {"train_loss": -41.74824905395508, "global_step": 302986, "epoch": 2504} {"train_loss": -42.88066101074219, "global_step": 302987, "epoch": 2504} {"train_loss": -41.86903762817383, "global_step": 302988, "epoch": 2504} {"train_loss": -40.91330337524414, "global_step": 302989, "epoch": 2504} {"train_loss": -43.08073043823242, "global_step": 302990, "epoch": 2504} {"train_loss": -42.42751693725586, "global_step": 302991, "epoch": 2504} {"train_loss": -42.43745422363281, "global_step": 302992, "epoch": 2504} {"train_loss": -41.8256950378418, "global_step": 302993, "epoch": 2504} {"train_loss": -41.74060821533203, "global_step": 302994, "epoch": 2504} {"train_loss": -42.928749084472656, "global_step": 302995, "epoch": 2504} {"train_loss": -42.614131927490234, "global_step": 302996, "epoch": 2504} {"train_loss": -42.5637092590332, "global_step": 302997, "epoch": 2504} {"train_loss": -42.96178436279297, "global_step": 302998, "epoch": 2504} {"train_loss": -42.99885177612305, "global_step": 302999, "epoch": 2504} {"train_loss": -42.87244415283203, "global_step": 303000, "epoch": 2504} {"train_loss": -41.3531494140625, "global_step": 303001, "epoch": 2504} {"train_loss": -43.073299407958984, "global_step": 303002, "epoch": 2504} {"train_loss": -42.40245056152344, "global_step": 303003, "epoch": 2504} {"train_loss": -41.76982498168945, "global_step": 303004, "epoch": 2504} {"train_loss": -42.44579315185547, "global_step": 303005, "epoch": 2504} {"train_loss": -42.1723518371582, "global_step": 303006, "epoch": 2504} {"train_loss": -42.43398666381836, "global_step": 303007, "epoch": 2504} {"train_loss": -42.59109115600586, "global_step": 303008, "epoch": 2504} {"train_loss": -42.9561882019043, "global_step": 303009, "epoch": 2504} {"train_loss": -42.805660247802734, "global_step": 303010, "epoch": 2504} {"train_loss": -43.02345657348633, "global_step": 303011, "epoch": 2504} {"train_loss": -42.86512756347656, "global_step": 303012, "epoch": 2504} {"train_loss": -43.31586837768555, "global_step": 303013, "epoch": 2504} {"train_loss": -43.28828048706055, "global_step": 303014, "epoch": 2504} {"train_loss": -42.460365295410156, "global_step": 303015, "epoch": 2504} {"train_loss": -43.05493927001953, "global_step": 303016, "epoch": 2504} {"train_loss": -43.02665328979492, "global_step": 303017, "epoch": 2504} {"train_loss": -43.224361419677734, "global_step": 303018, "epoch": 2504} {"train_loss": -42.3310546875, "global_step": 303019, "epoch": 2504} {"train_loss": -43.23663330078125, "global_step": 303020, "epoch": 2504} {"train_loss": -43.0672721862793, "global_step": 303021, "epoch": 2504} {"train_loss": -43.298519134521484, "global_step": 303022, "epoch": 2504} {"train_loss": -42.7083740234375, "global_step": 303023, "epoch": 2504} {"train_loss": -43.20647430419922, "global_step": 303024, "epoch": 2504} {"train_loss": -41.31644058227539, "global_step": 303025, "epoch": 2504} {"train_loss": -42.725189208984375, "global_step": 303026, "epoch": 2504} {"train_loss": -42.77400588989258, "global_step": 303027, "epoch": 2504} {"train_loss": -43.65623092651367, "global_step": 303028, "epoch": 2504} {"train_loss": -42.71906280517578, "global_step": 303029, "epoch": 2504} {"train_loss": -43.474544525146484, "global_step": 303030, "epoch": 2504} {"train_loss": -43.08419418334961, "global_step": 303031, "epoch": 2504} {"train_loss": -43.51044464111328, "global_step": 303032, "epoch": 2504} {"train_loss": -42.44700241088867, "global_step": 303033, "epoch": 2504} {"train_loss": -42.022212982177734, "global_step": 303034, "epoch": 2504} {"train_loss": -43.04011917114258, "global_step": 303035, "epoch": 2504} {"train_loss": -42.010353088378906, "global_step": 303036, "epoch": 2504} {"train_loss": -43.73642349243164, "global_step": 303037, "epoch": 2504} {"train_loss": -43.4187126159668, "global_step": 303038, "epoch": 2504} {"train_loss": -43.36888122558594, "global_step": 303039, "epoch": 2504} {"train_loss": -34.05470657348633, "global_step": 303040, "epoch": 2504} {"train_loss": -43.48579025268555, "global_step": 303041, "epoch": 2504} {"train_loss": -43.621185302734375, "global_step": 303042, "epoch": 2504} {"train_loss": -43.346858978271484, "global_step": 303043, "epoch": 2504} {"train_loss": -42.74993896484375, "global_step": 303044, "epoch": 2504} {"train_loss": -43.59535598754883, "global_step": 303045, "epoch": 2504} {"train_loss": -42.93226623535156, "global_step": 303046, "epoch": 2504} {"train_loss": -39.635101318359375, "global_step": 303047, "epoch": 2504} {"train_loss": -43.40610122680664, "global_step": 303048, "epoch": 2504} {"train_loss": -42.93684005737305, "global_step": 303049, "epoch": 2504} {"train_loss": -42.74560546875, "global_step": 303050, "epoch": 2504} {"train_loss": -36.85724639892578, "global_step": 303051, "epoch": 2504} {"train_loss": -43.03973388671875, "global_step": 303052, "epoch": 2504} {"train_loss": -42.77216720581055, "global_step": 303053, "epoch": 2504} {"train_loss": -42.92277526855469, "global_step": 303054, "epoch": 2504} {"train_loss": -42.70237350463867, "global_step": 303055, "epoch": 2504} {"train_loss": -42.66427230834961, "global_step": 303056, "epoch": 2504} {"train_loss": -43.5021858215332, "global_step": 303057, "epoch": 2504} {"train_loss": -43.20986557006836, "global_step": 303058, "epoch": 2504} {"train_loss": -42.355674743652344, "global_step": 303059, "epoch": 2504} {"train_loss": -43.02717208862305, "global_step": 303060, "epoch": 2504} {"train_loss": -41.939109802246094, "global_step": 303061, "epoch": 2504} {"train_loss": -42.534889221191406, "global_step": 303062, "epoch": 2504} {"train_loss": -42.796958923339844, "global_step": 303063, "epoch": 2504} {"train_loss": -42.970130920410156, "global_step": 303064, "epoch": 2504} {"train_loss": -43.7450065612793, "global_step": 303065, "epoch": 2504} {"train_loss": -43.87984848022461, "global_step": 303066, "epoch": 2504} {"train_loss": -39.6578254699707, "global_step": 303067, "epoch": 2504} {"train_loss": -43.0223503112793, "global_step": 303068, "epoch": 2504} {"train_loss": -41.920684814453125, "global_step": 303069, "epoch": 2504} {"train_loss": -41.01458740234375, "global_step": 303070, "epoch": 2504} {"train_loss": -40.280364990234375, "global_step": 303071, "epoch": 2504} {"train_loss": -42.5668830871582, "global_step": 303072, "epoch": 2504} {"train_loss": -42.231842041015625, "global_step": 303073, "epoch": 2504} {"train_loss": -31.364171981811523, "global_step": 303074, "epoch": 2504} {"train_loss": -40.28142166137695, "global_step": 303075, "epoch": 2504} {"train_loss": -37.0915412902832, "global_step": 303076, "epoch": 2504} {"train_loss": -38.677711486816406, "global_step": 303077, "epoch": 2504} {"train_loss": -33.13172912597656, "global_step": 303078, "epoch": 2504} {"train_loss": -9.126283645629883, "global_step": 303079, "epoch": 2504} {"train_loss": -37.847251892089844, "global_step": 303080, "epoch": 2504} {"train_loss": -34.387569427490234, "global_step": 303081, "epoch": 2504} {"train_loss": -27.83808708190918, "global_step": 303082, "epoch": 2504} {"train_loss": -34.99946212768555, "global_step": 303083, "epoch": 2504} {"train_loss": -34.13572311401367, "global_step": 303084, "epoch": 2504} {"train_loss": -34.6313591003418, "global_step": 303085, "epoch": 2504} {"train_loss": -31.577392578125, "global_step": 303086, "epoch": 2504} {"train_loss": -34.8153076171875, "global_step": 303087, "epoch": 2504} {"train_loss": -35.87948226928711, "global_step": 303088, "epoch": 2504} {"train_loss": -37.216712951660156, "global_step": 303089, "epoch": 2504} {"train_loss": -34.16040802001953, "global_step": 303090, "epoch": 2504} {"train_loss": -31.274572372436523, "global_step": 303091, "epoch": 2504} {"train_loss": -25.543121337890625, "global_step": 303092, "epoch": 2504} {"train_loss": -34.8422966003418, "global_step": 303093, "epoch": 2504} {"train_loss": -37.418495178222656, "global_step": 303094, "epoch": 2504} {"train_loss": -36.913246154785156, "global_step": 303095, "epoch": 2504} {"train_loss": -36.62214279174805, "global_step": 303096, "epoch": 2504} {"train_loss": -31.893335342407227, "global_step": 303097, "epoch": 2504} {"train_loss": -34.24956130981445, "global_step": 303098, "epoch": 2504} {"train_loss": -36.66417694091797, "global_step": 303099, "epoch": 2504} {"train_loss": -28.176162719726562, "global_step": 303100, "epoch": 2504} {"train_loss": -32.81022644042969, "global_step": 303101, "epoch": 2504} {"train_loss": -37.030792236328125, "global_step": 303102, "epoch": 2504} {"train_loss": -37.39268493652344, "global_step": 303103, "epoch": 2504} {"train_loss": -40.1934566813067, "global_step": 303104, "epoch": 2504, "val_loss": 2768698.0} {"train_loss": -37.22178268432617, "global_step": 303105, "epoch": 2505} {"train_loss": -36.83906555175781, "global_step": 303106, "epoch": 2505} {"train_loss": -36.98014831542969, "global_step": 303107, "epoch": 2505} {"train_loss": -36.95463943481445, "global_step": 303108, "epoch": 2505} {"train_loss": -34.865386962890625, "global_step": 303109, "epoch": 2505} {"train_loss": -35.551578521728516, "global_step": 303110, "epoch": 2505} {"train_loss": -36.49580764770508, "global_step": 303111, "epoch": 2505} {"train_loss": -38.20500183105469, "global_step": 303112, "epoch": 2505} {"train_loss": -38.31008529663086, "global_step": 303113, "epoch": 2505} {"train_loss": -38.13181686401367, "global_step": 303114, "epoch": 2505} {"train_loss": -35.108524322509766, "global_step": 303115, "epoch": 2505} {"train_loss": -37.4394416809082, "global_step": 303116, "epoch": 2505} {"train_loss": -37.821197509765625, "global_step": 303117, "epoch": 2505} {"train_loss": -37.22121810913086, "global_step": 303118, "epoch": 2505} {"train_loss": -38.363521575927734, "global_step": 303119, "epoch": 2505} {"train_loss": -38.969539642333984, "global_step": 303120, "epoch": 2505} {"train_loss": -37.26755142211914, "global_step": 303121, "epoch": 2505} {"train_loss": -38.03855514526367, "global_step": 303122, "epoch": 2505} {"train_loss": -36.879241943359375, "global_step": 303123, "epoch": 2505} {"train_loss": -38.3718376159668, "global_step": 303124, "epoch": 2505} {"train_loss": -38.93659591674805, "global_step": 303125, "epoch": 2505} {"train_loss": -39.0233268737793, "global_step": 303126, "epoch": 2505} {"train_loss": -38.49089431762695, "global_step": 303127, "epoch": 2505} {"train_loss": -38.8757209777832, "global_step": 303128, "epoch": 2505} {"train_loss": -39.435176849365234, "global_step": 303129, "epoch": 2505} {"train_loss": -39.60749053955078, "global_step": 303130, "epoch": 2505} {"train_loss": -39.57032012939453, "global_step": 303131, "epoch": 2505} {"train_loss": -39.471797943115234, "global_step": 303132, "epoch": 2505} {"train_loss": -38.52381134033203, "global_step": 303133, "epoch": 2505} {"train_loss": -39.781044006347656, "global_step": 303134, "epoch": 2505} {"train_loss": -38.984859466552734, "global_step": 303135, "epoch": 2505} {"train_loss": -38.4443359375, "global_step": 303136, "epoch": 2505} {"train_loss": -39.40235137939453, "global_step": 303137, "epoch": 2505} {"train_loss": -39.62020492553711, "global_step": 303138, "epoch": 2505} {"train_loss": -39.97365951538086, "global_step": 303139, "epoch": 2505} {"train_loss": -39.730201721191406, "global_step": 303140, "epoch": 2505} {"train_loss": -38.61434555053711, "global_step": 303141, "epoch": 2505} {"train_loss": -39.75825881958008, "global_step": 303142, "epoch": 2505} {"train_loss": -40.01389694213867, "global_step": 303143, "epoch": 2505} {"train_loss": -40.18984603881836, "global_step": 303144, "epoch": 2505} {"train_loss": -40.28037643432617, "global_step": 303145, "epoch": 2505} {"train_loss": -39.297706604003906, "global_step": 303146, "epoch": 2505} {"train_loss": -40.42720413208008, "global_step": 303147, "epoch": 2505} {"train_loss": -40.461097717285156, "global_step": 303148, "epoch": 2505} {"train_loss": -40.18229293823242, "global_step": 303149, "epoch": 2505} {"train_loss": -40.35110092163086, "global_step": 303150, "epoch": 2505} {"train_loss": -40.347389221191406, "global_step": 303151, "epoch": 2505} {"train_loss": -40.410545349121094, "global_step": 303152, "epoch": 2505} {"train_loss": -39.82109451293945, "global_step": 303153, "epoch": 2505} {"train_loss": -39.487060546875, "global_step": 303154, "epoch": 2505} {"train_loss": -40.72536849975586, "global_step": 303155, "epoch": 2505} {"train_loss": -40.78605651855469, "global_step": 303156, "epoch": 2505} {"train_loss": -40.516292572021484, "global_step": 303157, "epoch": 2505} {"train_loss": -40.78001022338867, "global_step": 303158, "epoch": 2505} {"train_loss": -39.74967956542969, "global_step": 303159, "epoch": 2505} {"train_loss": -40.989253997802734, "global_step": 303160, "epoch": 2505} {"train_loss": -40.21257400512695, "global_step": 303161, "epoch": 2505} {"train_loss": -40.96529769897461, "global_step": 303162, "epoch": 2505} {"train_loss": -41.160980224609375, "global_step": 303163, "epoch": 2505} {"train_loss": -40.011959075927734, "global_step": 303164, "epoch": 2505} {"train_loss": -41.10929489135742, "global_step": 303165, "epoch": 2505} {"train_loss": -40.87569808959961, "global_step": 303166, "epoch": 2505} {"train_loss": -41.243473052978516, "global_step": 303167, "epoch": 2505} {"train_loss": -40.7143669128418, "global_step": 303168, "epoch": 2505} {"train_loss": -41.2349739074707, "global_step": 303169, "epoch": 2505} {"train_loss": -41.01810836791992, "global_step": 303170, "epoch": 2505} {"train_loss": -41.43321228027344, "global_step": 303171, "epoch": 2505} {"train_loss": -40.58169174194336, "global_step": 303172, "epoch": 2505} {"train_loss": -41.42414474487305, "global_step": 303173, "epoch": 2505} {"train_loss": -41.343929290771484, "global_step": 303174, "epoch": 2505} {"train_loss": -41.25204086303711, "global_step": 303175, "epoch": 2505} {"train_loss": -40.97014236450195, "global_step": 303176, "epoch": 2505} {"train_loss": -41.44005584716797, "global_step": 303177, "epoch": 2505} {"train_loss": -39.98823928833008, "global_step": 303178, "epoch": 2505} {"train_loss": -42.0018424987793, "global_step": 303179, "epoch": 2505} {"train_loss": -41.2700309753418, "global_step": 303180, "epoch": 2505} {"train_loss": -41.474483489990234, "global_step": 303181, "epoch": 2505} {"train_loss": -40.9122314453125, "global_step": 303182, "epoch": 2505} {"train_loss": -41.38543701171875, "global_step": 303183, "epoch": 2505} {"train_loss": -41.554344177246094, "global_step": 303184, "epoch": 2505} {"train_loss": -40.81575393676758, "global_step": 303185, "epoch": 2505} {"train_loss": -41.86812210083008, "global_step": 303186, "epoch": 2505} {"train_loss": -41.597877502441406, "global_step": 303187, "epoch": 2505} {"train_loss": -41.95219039916992, "global_step": 303188, "epoch": 2505} {"train_loss": -41.3249626159668, "global_step": 303189, "epoch": 2505} {"train_loss": -42.1800651550293, "global_step": 303190, "epoch": 2505} {"train_loss": -41.22884750366211, "global_step": 303191, "epoch": 2505} {"train_loss": -40.074462890625, "global_step": 303192, "epoch": 2505} {"train_loss": -42.04939651489258, "global_step": 303193, "epoch": 2505} {"train_loss": -41.43182373046875, "global_step": 303194, "epoch": 2505} {"train_loss": -41.421905517578125, "global_step": 303195, "epoch": 2505} {"train_loss": -41.79207992553711, "global_step": 303196, "epoch": 2505} {"train_loss": -42.07852554321289, "global_step": 303197, "epoch": 2505} {"train_loss": -42.00239181518555, "global_step": 303198, "epoch": 2505} {"train_loss": -42.0333137512207, "global_step": 303199, "epoch": 2505} {"train_loss": -42.18805694580078, "global_step": 303200, "epoch": 2505} {"train_loss": -42.214691162109375, "global_step": 303201, "epoch": 2505} {"train_loss": -41.99077224731445, "global_step": 303202, "epoch": 2505} {"train_loss": -41.1611213684082, "global_step": 303203, "epoch": 2505} {"train_loss": -41.13591384887695, "global_step": 303204, "epoch": 2505} {"train_loss": -42.19544219970703, "global_step": 303205, "epoch": 2505} {"train_loss": -42.3542594909668, "global_step": 303206, "epoch": 2505} {"train_loss": -41.18584060668945, "global_step": 303207, "epoch": 2505} {"train_loss": -42.5267219543457, "global_step": 303208, "epoch": 2505} {"train_loss": -40.79593276977539, "global_step": 303209, "epoch": 2505} {"train_loss": -42.67153549194336, "global_step": 303210, "epoch": 2505} {"train_loss": -42.4411735534668, "global_step": 303211, "epoch": 2505} {"train_loss": -42.2543830871582, "global_step": 303212, "epoch": 2505} {"train_loss": -42.64445114135742, "global_step": 303213, "epoch": 2505} {"train_loss": -42.3256950378418, "global_step": 303214, "epoch": 2505} {"train_loss": -42.94038772583008, "global_step": 303215, "epoch": 2505} {"train_loss": -42.15659713745117, "global_step": 303216, "epoch": 2505} {"train_loss": -42.844181060791016, "global_step": 303217, "epoch": 2505} {"train_loss": -42.69261932373047, "global_step": 303218, "epoch": 2505} {"train_loss": -42.00827407836914, "global_step": 303219, "epoch": 2505} {"train_loss": -41.8145866394043, "global_step": 303220, "epoch": 2505} {"train_loss": -42.572509765625, "global_step": 303221, "epoch": 2505} {"train_loss": -42.88486862182617, "global_step": 303222, "epoch": 2505} {"train_loss": -42.79982376098633, "global_step": 303223, "epoch": 2505} {"train_loss": -42.046783447265625, "global_step": 303224, "epoch": 2505} {"train_loss": -40.35675099270403, "global_step": 303225, "epoch": 2505, "val_loss": 2540819.25} {"train_loss": -42.6304931640625, "global_step": 303226, "epoch": 2506} {"train_loss": -42.96990966796875, "global_step": 303227, "epoch": 2506} {"train_loss": -42.5895881652832, "global_step": 303228, "epoch": 2506} {"train_loss": -41.766212463378906, "global_step": 303229, "epoch": 2506} {"train_loss": -41.9991455078125, "global_step": 303230, "epoch": 2506} {"train_loss": -42.81998825073242, "global_step": 303231, "epoch": 2506} {"train_loss": -43.11714553833008, "global_step": 303232, "epoch": 2506} {"train_loss": -43.28742980957031, "global_step": 303233, "epoch": 2506} {"train_loss": -41.71424102783203, "global_step": 303234, "epoch": 2506} {"train_loss": -42.52892303466797, "global_step": 303235, "epoch": 2506} {"train_loss": -42.61153030395508, "global_step": 303236, "epoch": 2506} {"train_loss": -41.672908782958984, "global_step": 303237, "epoch": 2506} {"train_loss": -42.14097595214844, "global_step": 303238, "epoch": 2506} {"train_loss": -41.3216552734375, "global_step": 303239, "epoch": 2506} {"train_loss": -42.48281478881836, "global_step": 303240, "epoch": 2506} {"train_loss": -42.83283615112305, "global_step": 303241, "epoch": 2506} {"train_loss": -40.94047927856445, "global_step": 303242, "epoch": 2506} {"train_loss": -41.711421966552734, "global_step": 303243, "epoch": 2506} {"train_loss": -42.83491897583008, "global_step": 303244, "epoch": 2506} {"train_loss": -42.304481506347656, "global_step": 303245, "epoch": 2506} {"train_loss": -42.05367660522461, "global_step": 303246, "epoch": 2506} {"train_loss": -40.53402328491211, "global_step": 303247, "epoch": 2506} {"train_loss": -42.85591506958008, "global_step": 303248, "epoch": 2506} {"train_loss": -42.002960205078125, "global_step": 303249, "epoch": 2506} {"train_loss": -40.85112762451172, "global_step": 303250, "epoch": 2506} {"train_loss": -40.977596282958984, "global_step": 303251, "epoch": 2506} {"train_loss": -42.86982727050781, "global_step": 303252, "epoch": 2506} {"train_loss": -41.59291076660156, "global_step": 303253, "epoch": 2506} {"train_loss": -42.40314483642578, "global_step": 303254, "epoch": 2506} {"train_loss": -42.315303802490234, "global_step": 303255, "epoch": 2506} {"train_loss": -42.94961166381836, "global_step": 303256, "epoch": 2506} {"train_loss": -43.237125396728516, "global_step": 303257, "epoch": 2506} {"train_loss": -42.752254486083984, "global_step": 303258, "epoch": 2506} {"train_loss": -42.50737762451172, "global_step": 303259, "epoch": 2506} {"train_loss": -41.82057189941406, "global_step": 303260, "epoch": 2506} {"train_loss": -42.622314453125, "global_step": 303261, "epoch": 2506} {"train_loss": -41.682960510253906, "global_step": 303262, "epoch": 2506} {"train_loss": -42.920135498046875, "global_step": 303263, "epoch": 2506} {"train_loss": -43.203575134277344, "global_step": 303264, "epoch": 2506} {"train_loss": -42.719356536865234, "global_step": 303265, "epoch": 2506} {"train_loss": -42.82246398925781, "global_step": 303266, "epoch": 2506} {"train_loss": -42.92084503173828, "global_step": 303267, "epoch": 2506} {"train_loss": -43.24455642700195, "global_step": 303268, "epoch": 2506} {"train_loss": -42.22185134887695, "global_step": 303269, "epoch": 2506} {"train_loss": -40.98040008544922, "global_step": 303270, "epoch": 2506} {"train_loss": -42.5134162902832, "global_step": 303271, "epoch": 2506} {"train_loss": -41.748680114746094, "global_step": 303272, "epoch": 2506} {"train_loss": -42.03174591064453, "global_step": 303273, "epoch": 2506} {"train_loss": -42.82832717895508, "global_step": 303274, "epoch": 2506} {"train_loss": -42.59012222290039, "global_step": 303275, "epoch": 2506} {"train_loss": -41.77161407470703, "global_step": 303276, "epoch": 2506} {"train_loss": -41.26805877685547, "global_step": 303277, "epoch": 2506} {"train_loss": -42.592586517333984, "global_step": 303278, "epoch": 2506} {"train_loss": -42.272457122802734, "global_step": 303279, "epoch": 2506} {"train_loss": -41.743812561035156, "global_step": 303280, "epoch": 2506} {"train_loss": -42.44484329223633, "global_step": 303281, "epoch": 2506} {"train_loss": -42.5423698425293, "global_step": 303282, "epoch": 2506} {"train_loss": -42.520626068115234, "global_step": 303283, "epoch": 2506} {"train_loss": -42.609249114990234, "global_step": 303284, "epoch": 2506} {"train_loss": -41.082210540771484, "global_step": 303285, "epoch": 2506} {"train_loss": -41.616146087646484, "global_step": 303286, "epoch": 2506} {"train_loss": -42.43165969848633, "global_step": 303287, "epoch": 2506} {"train_loss": -43.086246490478516, "global_step": 303288, "epoch": 2506} {"train_loss": -42.36381149291992, "global_step": 303289, "epoch": 2506} {"train_loss": -43.28571701049805, "global_step": 303290, "epoch": 2506} {"train_loss": -42.402679443359375, "global_step": 303291, "epoch": 2506} {"train_loss": -41.71357345581055, "global_step": 303292, "epoch": 2506} {"train_loss": -42.36342239379883, "global_step": 303293, "epoch": 2506} {"train_loss": -42.66313552856445, "global_step": 303294, "epoch": 2506} {"train_loss": -42.554073333740234, "global_step": 303295, "epoch": 2506} {"train_loss": -42.345428466796875, "global_step": 303296, "epoch": 2506} {"train_loss": -43.324668884277344, "global_step": 303297, "epoch": 2506} {"train_loss": -41.21759033203125, "global_step": 303298, "epoch": 2506} {"train_loss": -43.25565719604492, "global_step": 303299, "epoch": 2506} {"train_loss": -42.54603958129883, "global_step": 303300, "epoch": 2506} {"train_loss": -42.69851303100586, "global_step": 303301, "epoch": 2506} {"train_loss": -42.79956817626953, "global_step": 303302, "epoch": 2506} {"train_loss": -43.22364044189453, "global_step": 303303, "epoch": 2506} {"train_loss": -43.30400466918945, "global_step": 303304, "epoch": 2506} {"train_loss": -41.938270568847656, "global_step": 303305, "epoch": 2506} {"train_loss": -43.2558479309082, "global_step": 303306, "epoch": 2506} {"train_loss": -43.203094482421875, "global_step": 303307, "epoch": 2506} {"train_loss": -43.02567672729492, "global_step": 303308, "epoch": 2506} {"train_loss": -43.151771545410156, "global_step": 303309, "epoch": 2506} {"train_loss": -42.5427360534668, "global_step": 303310, "epoch": 2506} {"train_loss": -43.27863693237305, "global_step": 303311, "epoch": 2506} {"train_loss": -42.968292236328125, "global_step": 303312, "epoch": 2506} {"train_loss": -42.55537796020508, "global_step": 303313, "epoch": 2506} {"train_loss": -43.22419357299805, "global_step": 303314, "epoch": 2506} {"train_loss": -43.048641204833984, "global_step": 303315, "epoch": 2506} {"train_loss": -43.456600189208984, "global_step": 303316, "epoch": 2506} {"train_loss": -42.417415618896484, "global_step": 303317, "epoch": 2506} {"train_loss": -42.77861785888672, "global_step": 303318, "epoch": 2506} {"train_loss": -41.947444915771484, "global_step": 303319, "epoch": 2506} {"train_loss": -41.359493255615234, "global_step": 303320, "epoch": 2506} {"train_loss": -43.275550842285156, "global_step": 303321, "epoch": 2506} {"train_loss": -42.38895797729492, "global_step": 303322, "epoch": 2506} {"train_loss": -42.438411712646484, "global_step": 303323, "epoch": 2506} {"train_loss": -42.62482833862305, "global_step": 303324, "epoch": 2506} {"train_loss": -40.936256408691406, "global_step": 303325, "epoch": 2506} {"train_loss": -39.47892379760742, "global_step": 303326, "epoch": 2506} {"train_loss": -41.850555419921875, "global_step": 303327, "epoch": 2506} {"train_loss": -39.093711853027344, "global_step": 303328, "epoch": 2506} {"train_loss": -41.34745788574219, "global_step": 303329, "epoch": 2506} {"train_loss": -42.34035873413086, "global_step": 303330, "epoch": 2506} {"train_loss": -41.855384826660156, "global_step": 303331, "epoch": 2506} {"train_loss": -42.191650390625, "global_step": 303332, "epoch": 2506} {"train_loss": -42.775760650634766, "global_step": 303333, "epoch": 2506} {"train_loss": -40.737003326416016, "global_step": 303334, "epoch": 2506} {"train_loss": -40.16963577270508, "global_step": 303335, "epoch": 2506} {"train_loss": -42.37703323364258, "global_step": 303336, "epoch": 2506} {"train_loss": -42.327693939208984, "global_step": 303337, "epoch": 2506} {"train_loss": -39.828182220458984, "global_step": 303338, "epoch": 2506} {"train_loss": -40.41335678100586, "global_step": 303339, "epoch": 2506} {"train_loss": -38.12618637084961, "global_step": 303340, "epoch": 2506} {"train_loss": -41.72263717651367, "global_step": 303341, "epoch": 2506} {"train_loss": -41.98490905761719, "global_step": 303342, "epoch": 2506} {"train_loss": -41.348419189453125, "global_step": 303343, "epoch": 2506} {"train_loss": -41.94113540649414, "global_step": 303344, "epoch": 2506} {"train_loss": -41.491302490234375, "global_step": 303345, "epoch": 2506} {"train_loss": -42.196811013970496, "global_step": 303346, "epoch": 2506, "val_loss": 2647308.25} {"train_loss": -41.70238494873047, "global_step": 303347, "epoch": 2507} {"train_loss": -42.39748764038086, "global_step": 303348, "epoch": 2507} {"train_loss": -38.329158782958984, "global_step": 303349, "epoch": 2507} {"train_loss": -41.42177200317383, "global_step": 303350, "epoch": 2507} {"train_loss": -42.811744689941406, "global_step": 303351, "epoch": 2507} {"train_loss": -37.92038345336914, "global_step": 303352, "epoch": 2507} {"train_loss": -39.7027702331543, "global_step": 303353, "epoch": 2507} {"train_loss": -41.193695068359375, "global_step": 303354, "epoch": 2507} {"train_loss": -41.943214416503906, "global_step": 303355, "epoch": 2507} {"train_loss": -41.981319427490234, "global_step": 303356, "epoch": 2507} {"train_loss": -41.01446533203125, "global_step": 303357, "epoch": 2507} {"train_loss": -41.41781997680664, "global_step": 303358, "epoch": 2507} {"train_loss": -41.79871368408203, "global_step": 303359, "epoch": 2507} {"train_loss": -42.32380676269531, "global_step": 303360, "epoch": 2507} {"train_loss": -41.79181671142578, "global_step": 303361, "epoch": 2507} {"train_loss": -42.66343307495117, "global_step": 303362, "epoch": 2507} {"train_loss": -38.327186584472656, "global_step": 303363, "epoch": 2507} {"train_loss": -42.092079162597656, "global_step": 303364, "epoch": 2507} {"train_loss": -30.537616729736328, "global_step": 303365, "epoch": 2507} {"train_loss": -39.86313247680664, "global_step": 303366, "epoch": 2507} {"train_loss": -40.67048263549805, "global_step": 303367, "epoch": 2507} {"train_loss": -41.413143157958984, "global_step": 303368, "epoch": 2507} {"train_loss": -41.51176071166992, "global_step": 303369, "epoch": 2507} {"train_loss": -41.107421875, "global_step": 303370, "epoch": 2507} {"train_loss": -40.9459114074707, "global_step": 303371, "epoch": 2507} {"train_loss": -41.922576904296875, "global_step": 303372, "epoch": 2507} {"train_loss": -40.19156265258789, "global_step": 303373, "epoch": 2507} {"train_loss": -42.093849182128906, "global_step": 303374, "epoch": 2507} {"train_loss": -37.707645416259766, "global_step": 303375, "epoch": 2507} {"train_loss": -41.567893981933594, "global_step": 303376, "epoch": 2507} {"train_loss": -42.26434326171875, "global_step": 303377, "epoch": 2507} {"train_loss": -39.20473861694336, "global_step": 303378, "epoch": 2507} {"train_loss": -41.5731201171875, "global_step": 303379, "epoch": 2507} {"train_loss": -41.982704162597656, "global_step": 303380, "epoch": 2507} {"train_loss": -41.985313415527344, "global_step": 303381, "epoch": 2507} {"train_loss": -39.85184860229492, "global_step": 303382, "epoch": 2507} {"train_loss": -38.09165573120117, "global_step": 303383, "epoch": 2507} {"train_loss": -42.17336654663086, "global_step": 303384, "epoch": 2507} {"train_loss": -42.171390533447266, "global_step": 303385, "epoch": 2507} {"train_loss": -41.98189163208008, "global_step": 303386, "epoch": 2507} {"train_loss": -39.001502990722656, "global_step": 303387, "epoch": 2507} {"train_loss": -38.51533126831055, "global_step": 303388, "epoch": 2507} {"train_loss": -42.48086166381836, "global_step": 303389, "epoch": 2507} {"train_loss": -40.698768615722656, "global_step": 303390, "epoch": 2507} {"train_loss": -38.779048919677734, "global_step": 303391, "epoch": 2507} {"train_loss": -42.2868766784668, "global_step": 303392, "epoch": 2507} {"train_loss": -41.761566162109375, "global_step": 303393, "epoch": 2507} {"train_loss": -41.046688079833984, "global_step": 303394, "epoch": 2507} {"train_loss": -41.86588668823242, "global_step": 303395, "epoch": 2507} {"train_loss": -41.28800582885742, "global_step": 303396, "epoch": 2507} {"train_loss": -42.48887634277344, "global_step": 303397, "epoch": 2507} {"train_loss": -42.26906204223633, "global_step": 303398, "epoch": 2507} {"train_loss": -41.797698974609375, "global_step": 303399, "epoch": 2507} {"train_loss": -40.221580505371094, "global_step": 303400, "epoch": 2507} {"train_loss": -38.69883346557617, "global_step": 303401, "epoch": 2507} {"train_loss": -39.97895050048828, "global_step": 303402, "epoch": 2507} {"train_loss": -42.13840866088867, "global_step": 303403, "epoch": 2507} {"train_loss": -41.580745697021484, "global_step": 303404, "epoch": 2507} {"train_loss": -41.546688079833984, "global_step": 303405, "epoch": 2507} {"train_loss": -41.976871490478516, "global_step": 303406, "epoch": 2507} {"train_loss": -41.650936126708984, "global_step": 303407, "epoch": 2507} {"train_loss": -41.764625549316406, "global_step": 303408, "epoch": 2507} {"train_loss": -42.82929611206055, "global_step": 303409, "epoch": 2507} {"train_loss": -41.587886810302734, "global_step": 303410, "epoch": 2507} {"train_loss": -42.89457321166992, "global_step": 303411, "epoch": 2507} {"train_loss": -40.84727096557617, "global_step": 303412, "epoch": 2507} {"train_loss": -42.24928283691406, "global_step": 303413, "epoch": 2507} {"train_loss": -43.106441497802734, "global_step": 303414, "epoch": 2507} {"train_loss": -39.9954719543457, "global_step": 303415, "epoch": 2507} {"train_loss": -42.48126220703125, "global_step": 303416, "epoch": 2507} {"train_loss": -42.07509231567383, "global_step": 303417, "epoch": 2507} {"train_loss": -42.013671875, "global_step": 303418, "epoch": 2507} {"train_loss": -39.293827056884766, "global_step": 303419, "epoch": 2507} {"train_loss": -42.95322799682617, "global_step": 303420, "epoch": 2507} {"train_loss": -42.537044525146484, "global_step": 303421, "epoch": 2507} {"train_loss": -42.98323440551758, "global_step": 303422, "epoch": 2507} {"train_loss": -42.89230728149414, "global_step": 303423, "epoch": 2507} {"train_loss": -42.73191452026367, "global_step": 303424, "epoch": 2507} {"train_loss": -42.848724365234375, "global_step": 303425, "epoch": 2507} {"train_loss": -40.44826889038086, "global_step": 303426, "epoch": 2507} {"train_loss": -43.084625244140625, "global_step": 303427, "epoch": 2507} {"train_loss": -42.945037841796875, "global_step": 303428, "epoch": 2507} {"train_loss": -43.10145568847656, "global_step": 303429, "epoch": 2507} {"train_loss": -41.790313720703125, "global_step": 303430, "epoch": 2507} {"train_loss": -42.3072624206543, "global_step": 303431, "epoch": 2507} {"train_loss": -42.38035202026367, "global_step": 303432, "epoch": 2507} {"train_loss": -42.97444534301758, "global_step": 303433, "epoch": 2507} {"train_loss": -42.77676010131836, "global_step": 303434, "epoch": 2507} {"train_loss": -42.750789642333984, "global_step": 303435, "epoch": 2507} {"train_loss": -43.32563400268555, "global_step": 303436, "epoch": 2507} {"train_loss": -41.94169616699219, "global_step": 303437, "epoch": 2507} {"train_loss": -40.55180740356445, "global_step": 303438, "epoch": 2507} {"train_loss": -42.9607048034668, "global_step": 303439, "epoch": 2507} {"train_loss": -43.409847259521484, "global_step": 303440, "epoch": 2507} {"train_loss": -42.964630126953125, "global_step": 303441, "epoch": 2507} {"train_loss": -42.73515701293945, "global_step": 303442, "epoch": 2507} {"train_loss": -43.38130569458008, "global_step": 303443, "epoch": 2507} {"train_loss": -41.361595153808594, "global_step": 303444, "epoch": 2507} {"train_loss": -43.31051254272461, "global_step": 303445, "epoch": 2507} {"train_loss": -42.420162200927734, "global_step": 303446, "epoch": 2507} {"train_loss": -40.64729690551758, "global_step": 303447, "epoch": 2507} {"train_loss": -40.596736907958984, "global_step": 303448, "epoch": 2507} {"train_loss": -41.645057678222656, "global_step": 303449, "epoch": 2507} {"train_loss": -40.970821380615234, "global_step": 303450, "epoch": 2507} {"train_loss": -42.15426254272461, "global_step": 303451, "epoch": 2507} {"train_loss": -42.50685501098633, "global_step": 303452, "epoch": 2507} {"train_loss": -42.724952697753906, "global_step": 303453, "epoch": 2507} {"train_loss": -42.368507385253906, "global_step": 303454, "epoch": 2507} {"train_loss": -42.623538970947266, "global_step": 303455, "epoch": 2507} {"train_loss": -40.91705322265625, "global_step": 303456, "epoch": 2507} {"train_loss": -42.516510009765625, "global_step": 303457, "epoch": 2507} {"train_loss": -40.7851448059082, "global_step": 303458, "epoch": 2507} {"train_loss": -38.34134292602539, "global_step": 303459, "epoch": 2507} {"train_loss": -41.958526611328125, "global_step": 303460, "epoch": 2507} {"train_loss": -40.82146072387695, "global_step": 303461, "epoch": 2507} {"train_loss": -42.96806716918945, "global_step": 303462, "epoch": 2507} {"train_loss": -40.87428665161133, "global_step": 303463, "epoch": 2507} {"train_loss": -41.6202278137207, "global_step": 303464, "epoch": 2507} {"train_loss": -41.9785041809082, "global_step": 303465, "epoch": 2507} {"train_loss": -42.598419189453125, "global_step": 303466, "epoch": 2507} {"train_loss": -41.485002880254065, "global_step": 303467, "epoch": 2507, "val_loss": 2987165.25} {"train_loss": -41.9827880859375, "global_step": 303468, "epoch": 2508} {"train_loss": -42.49154281616211, "global_step": 303469, "epoch": 2508} {"train_loss": -43.46102523803711, "global_step": 303470, "epoch": 2508} {"train_loss": -43.060306549072266, "global_step": 303471, "epoch": 2508} {"train_loss": -41.7574462890625, "global_step": 303472, "epoch": 2508} {"train_loss": -43.34840774536133, "global_step": 303473, "epoch": 2508} {"train_loss": -42.16689682006836, "global_step": 303474, "epoch": 2508} {"train_loss": -42.85160827636719, "global_step": 303475, "epoch": 2508} {"train_loss": -43.201637268066406, "global_step": 303476, "epoch": 2508} {"train_loss": -42.82259750366211, "global_step": 303477, "epoch": 2508} {"train_loss": -42.882930755615234, "global_step": 303478, "epoch": 2508} {"train_loss": -43.40009307861328, "global_step": 303479, "epoch": 2508} {"train_loss": -43.17158126831055, "global_step": 303480, "epoch": 2508} {"train_loss": -43.54885482788086, "global_step": 303481, "epoch": 2508} {"train_loss": -41.62721633911133, "global_step": 303482, "epoch": 2508} {"train_loss": -43.11379623413086, "global_step": 303483, "epoch": 2508} {"train_loss": -43.22349166870117, "global_step": 303484, "epoch": 2508} {"train_loss": -43.57405090332031, "global_step": 303485, "epoch": 2508} {"train_loss": -43.93044662475586, "global_step": 303486, "epoch": 2508} {"train_loss": -43.602516174316406, "global_step": 303487, "epoch": 2508} {"train_loss": -42.721004486083984, "global_step": 303488, "epoch": 2508} {"train_loss": -43.19698715209961, "global_step": 303489, "epoch": 2508} {"train_loss": -43.17056655883789, "global_step": 303490, "epoch": 2508} {"train_loss": -43.149837493896484, "global_step": 303491, "epoch": 2508} {"train_loss": -42.32339096069336, "global_step": 303492, "epoch": 2508} {"train_loss": -43.41166305541992, "global_step": 303493, "epoch": 2508} {"train_loss": -43.63033676147461, "global_step": 303494, "epoch": 2508} {"train_loss": -42.69020462036133, "global_step": 303495, "epoch": 2508} {"train_loss": -41.9998893737793, "global_step": 303496, "epoch": 2508} {"train_loss": -42.34608840942383, "global_step": 303497, "epoch": 2508} {"train_loss": -42.8182258605957, "global_step": 303498, "epoch": 2508} {"train_loss": -41.62318420410156, "global_step": 303499, "epoch": 2508} {"train_loss": -41.95735549926758, "global_step": 303500, "epoch": 2508} {"train_loss": -41.4270133972168, "global_step": 303501, "epoch": 2508} {"train_loss": -42.73722839355469, "global_step": 303502, "epoch": 2508} {"train_loss": -42.4574089050293, "global_step": 303503, "epoch": 2508} {"train_loss": -42.702003479003906, "global_step": 303504, "epoch": 2508} {"train_loss": -43.242000579833984, "global_step": 303505, "epoch": 2508} {"train_loss": -42.63416290283203, "global_step": 303506, "epoch": 2508} {"train_loss": -42.12522506713867, "global_step": 303507, "epoch": 2508} {"train_loss": -42.35443878173828, "global_step": 303508, "epoch": 2508} {"train_loss": -41.608558654785156, "global_step": 303509, "epoch": 2508} {"train_loss": -42.43434524536133, "global_step": 303510, "epoch": 2508} {"train_loss": -42.841915130615234, "global_step": 303511, "epoch": 2508} {"train_loss": -40.70307159423828, "global_step": 303512, "epoch": 2508} {"train_loss": -43.367462158203125, "global_step": 303513, "epoch": 2508} {"train_loss": -42.9947395324707, "global_step": 303514, "epoch": 2508} {"train_loss": -42.88997268676758, "global_step": 303515, "epoch": 2508} {"train_loss": -37.23187255859375, "global_step": 303516, "epoch": 2508} {"train_loss": -41.242645263671875, "global_step": 303517, "epoch": 2508} {"train_loss": -42.0506477355957, "global_step": 303518, "epoch": 2508} {"train_loss": -42.68535614013672, "global_step": 303519, "epoch": 2508} {"train_loss": -42.57694625854492, "global_step": 303520, "epoch": 2508} {"train_loss": -42.822784423828125, "global_step": 303521, "epoch": 2508} {"train_loss": -41.3110466003418, "global_step": 303522, "epoch": 2508} {"train_loss": -42.30154037475586, "global_step": 303523, "epoch": 2508} {"train_loss": -42.126590728759766, "global_step": 303524, "epoch": 2508} {"train_loss": -42.020912170410156, "global_step": 303525, "epoch": 2508} {"train_loss": -37.181007385253906, "global_step": 303526, "epoch": 2508} {"train_loss": -40.55887985229492, "global_step": 303527, "epoch": 2508} {"train_loss": -41.486427307128906, "global_step": 303528, "epoch": 2508} {"train_loss": -41.907596588134766, "global_step": 303529, "epoch": 2508} {"train_loss": -39.05595016479492, "global_step": 303530, "epoch": 2508} {"train_loss": -39.347164154052734, "global_step": 303531, "epoch": 2508} {"train_loss": -39.168296813964844, "global_step": 303532, "epoch": 2508} {"train_loss": -39.59639358520508, "global_step": 303533, "epoch": 2508} {"train_loss": -38.80665969848633, "global_step": 303534, "epoch": 2508} {"train_loss": -39.9094123840332, "global_step": 303535, "epoch": 2508} {"train_loss": -40.58246994018555, "global_step": 303536, "epoch": 2508} {"train_loss": -40.879920959472656, "global_step": 303537, "epoch": 2508} {"train_loss": -39.489891052246094, "global_step": 303538, "epoch": 2508} {"train_loss": -40.33767318725586, "global_step": 303539, "epoch": 2508} {"train_loss": -40.792354583740234, "global_step": 303540, "epoch": 2508} {"train_loss": -37.2308235168457, "global_step": 303541, "epoch": 2508} {"train_loss": -41.09508514404297, "global_step": 303542, "epoch": 2508} {"train_loss": -39.61204147338867, "global_step": 303543, "epoch": 2508} {"train_loss": -41.6363410949707, "global_step": 303544, "epoch": 2508} {"train_loss": -40.37549591064453, "global_step": 303545, "epoch": 2508} {"train_loss": -38.63368606567383, "global_step": 303546, "epoch": 2508} {"train_loss": -40.47491455078125, "global_step": 303547, "epoch": 2508} {"train_loss": -41.81689453125, "global_step": 303548, "epoch": 2508} {"train_loss": -41.9034423828125, "global_step": 303549, "epoch": 2508} {"train_loss": -40.14072799682617, "global_step": 303550, "epoch": 2508} {"train_loss": -42.330379486083984, "global_step": 303551, "epoch": 2508} {"train_loss": -41.794525146484375, "global_step": 303552, "epoch": 2508} {"train_loss": -41.44057083129883, "global_step": 303553, "epoch": 2508} {"train_loss": -42.553497314453125, "global_step": 303554, "epoch": 2508} {"train_loss": -41.76145553588867, "global_step": 303555, "epoch": 2508} {"train_loss": -40.39935302734375, "global_step": 303556, "epoch": 2508} {"train_loss": -42.535457611083984, "global_step": 303557, "epoch": 2508} {"train_loss": -42.022682189941406, "global_step": 303558, "epoch": 2508} {"train_loss": -41.51762008666992, "global_step": 303559, "epoch": 2508} {"train_loss": -41.535614013671875, "global_step": 303560, "epoch": 2508} {"train_loss": -41.86321258544922, "global_step": 303561, "epoch": 2508} {"train_loss": -41.441158294677734, "global_step": 303562, "epoch": 2508} {"train_loss": -42.32266616821289, "global_step": 303563, "epoch": 2508} {"train_loss": -42.083988189697266, "global_step": 303564, "epoch": 2508} {"train_loss": -41.22445297241211, "global_step": 303565, "epoch": 2508} {"train_loss": -41.96592330932617, "global_step": 303566, "epoch": 2508} {"train_loss": -42.23566818237305, "global_step": 303567, "epoch": 2508} {"train_loss": -41.6759033203125, "global_step": 303568, "epoch": 2508} {"train_loss": -42.785186767578125, "global_step": 303569, "epoch": 2508} {"train_loss": -40.62724304199219, "global_step": 303570, "epoch": 2508} {"train_loss": -41.35247802734375, "global_step": 303571, "epoch": 2508} {"train_loss": -41.56175231933594, "global_step": 303572, "epoch": 2508} {"train_loss": -42.009925842285156, "global_step": 303573, "epoch": 2508} {"train_loss": -41.19559860229492, "global_step": 303574, "epoch": 2508} {"train_loss": -41.608463287353516, "global_step": 303575, "epoch": 2508} {"train_loss": -42.502174377441406, "global_step": 303576, "epoch": 2508} {"train_loss": -41.47032928466797, "global_step": 303577, "epoch": 2508} {"train_loss": -41.30906295776367, "global_step": 303578, "epoch": 2508} {"train_loss": -42.703956604003906, "global_step": 303579, "epoch": 2508} {"train_loss": -42.73061752319336, "global_step": 303580, "epoch": 2508} {"train_loss": -41.021575927734375, "global_step": 303581, "epoch": 2508} {"train_loss": -41.59121322631836, "global_step": 303582, "epoch": 2508} {"train_loss": -42.63441848754883, "global_step": 303583, "epoch": 2508} {"train_loss": -42.61609649658203, "global_step": 303584, "epoch": 2508} {"train_loss": -41.62030792236328, "global_step": 303585, "epoch": 2508} {"train_loss": -43.1110954284668, "global_step": 303586, "epoch": 2508} {"train_loss": -42.130279541015625, "global_step": 303587, "epoch": 2508} {"train_loss": -41.81728854849319, "global_step": 303588, "epoch": 2508, "val_loss": 2943664.25} {"train_loss": -42.870731353759766, "global_step": 303589, "epoch": 2509} {"train_loss": -42.2094841003418, "global_step": 303590, "epoch": 2509} {"train_loss": -41.89138412475586, "global_step": 303591, "epoch": 2509} {"train_loss": -41.69857406616211, "global_step": 303592, "epoch": 2509} {"train_loss": -42.16846466064453, "global_step": 303593, "epoch": 2509} {"train_loss": -41.15287780761719, "global_step": 303594, "epoch": 2509} {"train_loss": -42.618858337402344, "global_step": 303595, "epoch": 2509} {"train_loss": -43.226524353027344, "global_step": 303596, "epoch": 2509} {"train_loss": -42.164588928222656, "global_step": 303597, "epoch": 2509} {"train_loss": -41.33861541748047, "global_step": 303598, "epoch": 2509} {"train_loss": -42.71148681640625, "global_step": 303599, "epoch": 2509} {"train_loss": -42.619789123535156, "global_step": 303600, "epoch": 2509} {"train_loss": -43.02077865600586, "global_step": 303601, "epoch": 2509} {"train_loss": -42.11957550048828, "global_step": 303602, "epoch": 2509} {"train_loss": -40.16042709350586, "global_step": 303603, "epoch": 2509} {"train_loss": -41.221920013427734, "global_step": 303604, "epoch": 2509} {"train_loss": -41.798824310302734, "global_step": 303605, "epoch": 2509} {"train_loss": -42.93580627441406, "global_step": 303606, "epoch": 2509} {"train_loss": -43.20979690551758, "global_step": 303607, "epoch": 2509} {"train_loss": -42.97819137573242, "global_step": 303608, "epoch": 2509} {"train_loss": -42.5605354309082, "global_step": 303609, "epoch": 2509} {"train_loss": -42.48170852661133, "global_step": 303610, "epoch": 2509} {"train_loss": -43.42701721191406, "global_step": 303611, "epoch": 2509} {"train_loss": -43.184295654296875, "global_step": 303612, "epoch": 2509} {"train_loss": -42.611663818359375, "global_step": 303613, "epoch": 2509} {"train_loss": -38.44609069824219, "global_step": 303614, "epoch": 2509} {"train_loss": -42.27113723754883, "global_step": 303615, "epoch": 2509} {"train_loss": -43.46310806274414, "global_step": 303616, "epoch": 2509} {"train_loss": -43.070743560791016, "global_step": 303617, "epoch": 2509} {"train_loss": -42.1198844909668, "global_step": 303618, "epoch": 2509} {"train_loss": -42.94754409790039, "global_step": 303619, "epoch": 2509} {"train_loss": -43.39482879638672, "global_step": 303620, "epoch": 2509} {"train_loss": -43.20595932006836, "global_step": 303621, "epoch": 2509} {"train_loss": -43.01496124267578, "global_step": 303622, "epoch": 2509} {"train_loss": -42.428592681884766, "global_step": 303623, "epoch": 2509} {"train_loss": -41.8172607421875, "global_step": 303624, "epoch": 2509} {"train_loss": -43.521549224853516, "global_step": 303625, "epoch": 2509} {"train_loss": -43.713130950927734, "global_step": 303626, "epoch": 2509} {"train_loss": -43.779762268066406, "global_step": 303627, "epoch": 2509} {"train_loss": -42.22613525390625, "global_step": 303628, "epoch": 2509} {"train_loss": -43.32402420043945, "global_step": 303629, "epoch": 2509} {"train_loss": -41.59114456176758, "global_step": 303630, "epoch": 2509} {"train_loss": -41.45196533203125, "global_step": 303631, "epoch": 2509} {"train_loss": -40.761539459228516, "global_step": 303632, "epoch": 2509} {"train_loss": -43.46428298950195, "global_step": 303633, "epoch": 2509} {"train_loss": -42.6889762878418, "global_step": 303634, "epoch": 2509} {"train_loss": -41.896480560302734, "global_step": 303635, "epoch": 2509} {"train_loss": -43.302268981933594, "global_step": 303636, "epoch": 2509} {"train_loss": -43.13838195800781, "global_step": 303637, "epoch": 2509} {"train_loss": -40.96576690673828, "global_step": 303638, "epoch": 2509} {"train_loss": -41.7444953918457, "global_step": 303639, "epoch": 2509} {"train_loss": -42.493927001953125, "global_step": 303640, "epoch": 2509} {"train_loss": -41.82908248901367, "global_step": 303641, "epoch": 2509} {"train_loss": -43.30574035644531, "global_step": 303642, "epoch": 2509} {"train_loss": -42.70310592651367, "global_step": 303643, "epoch": 2509} {"train_loss": -43.25439453125, "global_step": 303644, "epoch": 2509} {"train_loss": -43.47462844848633, "global_step": 303645, "epoch": 2509} {"train_loss": -40.47380447387695, "global_step": 303646, "epoch": 2509} {"train_loss": -42.966548919677734, "global_step": 303647, "epoch": 2509} {"train_loss": -40.78451156616211, "global_step": 303648, "epoch": 2509} {"train_loss": -43.04270935058594, "global_step": 303649, "epoch": 2509} {"train_loss": -42.12382507324219, "global_step": 303650, "epoch": 2509} {"train_loss": -42.79084396362305, "global_step": 303651, "epoch": 2509} {"train_loss": -42.72096633911133, "global_step": 303652, "epoch": 2509} {"train_loss": -41.49542999267578, "global_step": 303653, "epoch": 2509} {"train_loss": -41.63595199584961, "global_step": 303654, "epoch": 2509} {"train_loss": -42.4140739440918, "global_step": 303655, "epoch": 2509} {"train_loss": -42.10563278198242, "global_step": 303656, "epoch": 2509} {"train_loss": -40.75253677368164, "global_step": 303657, "epoch": 2509} {"train_loss": -42.64691162109375, "global_step": 303658, "epoch": 2509} {"train_loss": -39.16193389892578, "global_step": 303659, "epoch": 2509} {"train_loss": -42.194313049316406, "global_step": 303660, "epoch": 2509} {"train_loss": -41.187740325927734, "global_step": 303661, "epoch": 2509} {"train_loss": -40.4491081237793, "global_step": 303662, "epoch": 2509} {"train_loss": -42.23250198364258, "global_step": 303663, "epoch": 2509} {"train_loss": -41.343624114990234, "global_step": 303664, "epoch": 2509} {"train_loss": -39.37263870239258, "global_step": 303665, "epoch": 2509} {"train_loss": -39.39413070678711, "global_step": 303666, "epoch": 2509} {"train_loss": -42.21072006225586, "global_step": 303667, "epoch": 2509} {"train_loss": -42.626129150390625, "global_step": 303668, "epoch": 2509} {"train_loss": -41.60530471801758, "global_step": 303669, "epoch": 2509} {"train_loss": -41.03646469116211, "global_step": 303670, "epoch": 2509} {"train_loss": -40.24053955078125, "global_step": 303671, "epoch": 2509} {"train_loss": -41.35854721069336, "global_step": 303672, "epoch": 2509} {"train_loss": -40.98421859741211, "global_step": 303673, "epoch": 2509} {"train_loss": -39.22739791870117, "global_step": 303674, "epoch": 2509} {"train_loss": -42.56293869018555, "global_step": 303675, "epoch": 2509} {"train_loss": -41.18302536010742, "global_step": 303676, "epoch": 2509} {"train_loss": -43.19971466064453, "global_step": 303677, "epoch": 2509} {"train_loss": -40.84922409057617, "global_step": 303678, "epoch": 2509} {"train_loss": -42.51300811767578, "global_step": 303679, "epoch": 2509} {"train_loss": -42.672332763671875, "global_step": 303680, "epoch": 2509} {"train_loss": -41.75887680053711, "global_step": 303681, "epoch": 2509} {"train_loss": -41.501434326171875, "global_step": 303682, "epoch": 2509} {"train_loss": -42.72865676879883, "global_step": 303683, "epoch": 2509} {"train_loss": -41.54472732543945, "global_step": 303684, "epoch": 2509} {"train_loss": -42.45815658569336, "global_step": 303685, "epoch": 2509} {"train_loss": -42.73627853393555, "global_step": 303686, "epoch": 2509} {"train_loss": -41.19002914428711, "global_step": 303687, "epoch": 2509} {"train_loss": -42.84870147705078, "global_step": 303688, "epoch": 2509} {"train_loss": -42.439571380615234, "global_step": 303689, "epoch": 2509} {"train_loss": -41.786800384521484, "global_step": 303690, "epoch": 2509} {"train_loss": -43.035186767578125, "global_step": 303691, "epoch": 2509} {"train_loss": -40.08639144897461, "global_step": 303692, "epoch": 2509} {"train_loss": -42.82008743286133, "global_step": 303693, "epoch": 2509} {"train_loss": -42.4642333984375, "global_step": 303694, "epoch": 2509} {"train_loss": -42.46925354003906, "global_step": 303695, "epoch": 2509} {"train_loss": -42.94456481933594, "global_step": 303696, "epoch": 2509} {"train_loss": -41.53293228149414, "global_step": 303697, "epoch": 2509} {"train_loss": -42.35244369506836, "global_step": 303698, "epoch": 2509} {"train_loss": -42.9951286315918, "global_step": 303699, "epoch": 2509} {"train_loss": -42.2463493347168, "global_step": 303700, "epoch": 2509} {"train_loss": -41.121299743652344, "global_step": 303701, "epoch": 2509} {"train_loss": -42.356903076171875, "global_step": 303702, "epoch": 2509} {"train_loss": -41.225341796875, "global_step": 303703, "epoch": 2509} {"train_loss": -42.19126510620117, "global_step": 303704, "epoch": 2509} {"train_loss": -41.8718147277832, "global_step": 303705, "epoch": 2509} {"train_loss": -42.20878982543945, "global_step": 303706, "epoch": 2509} {"train_loss": -41.91898727416992, "global_step": 303707, "epoch": 2509} {"train_loss": -42.80928039550781, "global_step": 303708, "epoch": 2509} {"train_loss": -42.10707026079667, "global_step": 303709, "epoch": 2509, "val_loss": 2620476.75} {"train_loss": -41.687461853027344, "global_step": 303710, "epoch": 2510} {"train_loss": -42.3784294128418, "global_step": 303711, "epoch": 2510} {"train_loss": -40.39187240600586, "global_step": 303712, "epoch": 2510} {"train_loss": -43.16927719116211, "global_step": 303713, "epoch": 2510} {"train_loss": -42.8182373046875, "global_step": 303714, "epoch": 2510} {"train_loss": -42.028316497802734, "global_step": 303715, "epoch": 2510} {"train_loss": -42.8941764831543, "global_step": 303716, "epoch": 2510} {"train_loss": -43.461116790771484, "global_step": 303717, "epoch": 2510} {"train_loss": -42.99636459350586, "global_step": 303718, "epoch": 2510} {"train_loss": -42.159202575683594, "global_step": 303719, "epoch": 2510} {"train_loss": -43.702091217041016, "global_step": 303720, "epoch": 2510} {"train_loss": -42.8690299987793, "global_step": 303721, "epoch": 2510} {"train_loss": -43.4404296875, "global_step": 303722, "epoch": 2510} {"train_loss": -43.0307502746582, "global_step": 303723, "epoch": 2510} {"train_loss": -42.75393295288086, "global_step": 303724, "epoch": 2510} {"train_loss": -43.16263198852539, "global_step": 303725, "epoch": 2510} {"train_loss": -41.09171676635742, "global_step": 303726, "epoch": 2510} {"train_loss": -43.297786712646484, "global_step": 303727, "epoch": 2510} {"train_loss": -41.69504928588867, "global_step": 303728, "epoch": 2510} {"train_loss": -43.496620178222656, "global_step": 303729, "epoch": 2510} {"train_loss": -42.1873893737793, "global_step": 303730, "epoch": 2510} {"train_loss": -42.929073333740234, "global_step": 303731, "epoch": 2510} {"train_loss": -42.93564987182617, "global_step": 303732, "epoch": 2510} {"train_loss": -42.4511604309082, "global_step": 303733, "epoch": 2510} {"train_loss": -43.26152420043945, "global_step": 303734, "epoch": 2510} {"train_loss": -42.283050537109375, "global_step": 303735, "epoch": 2510} {"train_loss": -42.46859359741211, "global_step": 303736, "epoch": 2510} {"train_loss": -42.79319381713867, "global_step": 303737, "epoch": 2510} {"train_loss": -41.50358200073242, "global_step": 303738, "epoch": 2510} {"train_loss": -42.18973922729492, "global_step": 303739, "epoch": 2510} {"train_loss": -43.023040771484375, "global_step": 303740, "epoch": 2510} {"train_loss": -40.49274444580078, "global_step": 303741, "epoch": 2510} {"train_loss": -43.31504440307617, "global_step": 303742, "epoch": 2510} {"train_loss": -40.07893371582031, "global_step": 303743, "epoch": 2510} {"train_loss": -42.87564468383789, "global_step": 303744, "epoch": 2510} {"train_loss": -42.415443420410156, "global_step": 303745, "epoch": 2510} {"train_loss": -41.337257385253906, "global_step": 303746, "epoch": 2510} {"train_loss": -43.070770263671875, "global_step": 303747, "epoch": 2510} {"train_loss": -43.043514251708984, "global_step": 303748, "epoch": 2510} {"train_loss": -42.774742126464844, "global_step": 303749, "epoch": 2510} {"train_loss": -42.7828254699707, "global_step": 303750, "epoch": 2510} {"train_loss": -42.825225830078125, "global_step": 303751, "epoch": 2510} {"train_loss": -42.6392822265625, "global_step": 303752, "epoch": 2510} {"train_loss": -43.88999557495117, "global_step": 303753, "epoch": 2510} {"train_loss": -42.13086700439453, "global_step": 303754, "epoch": 2510} {"train_loss": -42.49858474731445, "global_step": 303755, "epoch": 2510} {"train_loss": -43.710750579833984, "global_step": 303756, "epoch": 2510} {"train_loss": -43.00596237182617, "global_step": 303757, "epoch": 2510} {"train_loss": -42.83551025390625, "global_step": 303758, "epoch": 2510} {"train_loss": -42.78466796875, "global_step": 303759, "epoch": 2510} {"train_loss": -41.995216369628906, "global_step": 303760, "epoch": 2510} {"train_loss": -42.12986373901367, "global_step": 303761, "epoch": 2510} {"train_loss": -42.08856964111328, "global_step": 303762, "epoch": 2510} {"train_loss": -43.06892013549805, "global_step": 303763, "epoch": 2510} {"train_loss": -42.844295501708984, "global_step": 303764, "epoch": 2510} {"train_loss": -42.44818878173828, "global_step": 303765, "epoch": 2510} {"train_loss": -43.2334098815918, "global_step": 303766, "epoch": 2510} {"train_loss": -43.5966796875, "global_step": 303767, "epoch": 2510} {"train_loss": -42.60022735595703, "global_step": 303768, "epoch": 2510} {"train_loss": -42.77982711791992, "global_step": 303769, "epoch": 2510} {"train_loss": -43.812103271484375, "global_step": 303770, "epoch": 2510} {"train_loss": -43.540157318115234, "global_step": 303771, "epoch": 2510} {"train_loss": -43.12947082519531, "global_step": 303772, "epoch": 2510} {"train_loss": -43.227237701416016, "global_step": 303773, "epoch": 2510} {"train_loss": -42.93726348876953, "global_step": 303774, "epoch": 2510} {"train_loss": -41.792823791503906, "global_step": 303775, "epoch": 2510} {"train_loss": -43.30048751831055, "global_step": 303776, "epoch": 2510} {"train_loss": -43.18229675292969, "global_step": 303777, "epoch": 2510} {"train_loss": -43.33296585083008, "global_step": 303778, "epoch": 2510} {"train_loss": -43.31391143798828, "global_step": 303779, "epoch": 2510} {"train_loss": -43.787113189697266, "global_step": 303780, "epoch": 2510} {"train_loss": -42.225013732910156, "global_step": 303781, "epoch": 2510} {"train_loss": -43.778533935546875, "global_step": 303782, "epoch": 2510} {"train_loss": -43.28357696533203, "global_step": 303783, "epoch": 2510} {"train_loss": -42.72482681274414, "global_step": 303784, "epoch": 2510} {"train_loss": -41.42592239379883, "global_step": 303785, "epoch": 2510} {"train_loss": -43.054779052734375, "global_step": 303786, "epoch": 2510} {"train_loss": -43.77445602416992, "global_step": 303787, "epoch": 2510} {"train_loss": -41.12587356567383, "global_step": 303788, "epoch": 2510} {"train_loss": -41.6002197265625, "global_step": 303789, "epoch": 2510} {"train_loss": -39.66769027709961, "global_step": 303790, "epoch": 2510} {"train_loss": -41.687625885009766, "global_step": 303791, "epoch": 2510} {"train_loss": -43.657806396484375, "global_step": 303792, "epoch": 2510} {"train_loss": -40.91683578491211, "global_step": 303793, "epoch": 2510} {"train_loss": -37.19929122924805, "global_step": 303794, "epoch": 2510} {"train_loss": -37.14727783203125, "global_step": 303795, "epoch": 2510} {"train_loss": -42.1386604309082, "global_step": 303796, "epoch": 2510} {"train_loss": -42.579933166503906, "global_step": 303797, "epoch": 2510} {"train_loss": -36.34917068481445, "global_step": 303798, "epoch": 2510} {"train_loss": -38.31032943725586, "global_step": 303799, "epoch": 2510} {"train_loss": -42.69356155395508, "global_step": 303800, "epoch": 2510} {"train_loss": -42.50941848754883, "global_step": 303801, "epoch": 2510} {"train_loss": -41.750762939453125, "global_step": 303802, "epoch": 2510} {"train_loss": -41.90424728393555, "global_step": 303803, "epoch": 2510} {"train_loss": -43.339317321777344, "global_step": 303804, "epoch": 2510} {"train_loss": -42.167015075683594, "global_step": 303805, "epoch": 2510} {"train_loss": -41.2547492980957, "global_step": 303806, "epoch": 2510} {"train_loss": -43.39642333984375, "global_step": 303807, "epoch": 2510} {"train_loss": -42.47088623046875, "global_step": 303808, "epoch": 2510} {"train_loss": -40.746734619140625, "global_step": 303809, "epoch": 2510} {"train_loss": -42.92304611206055, "global_step": 303810, "epoch": 2510} {"train_loss": -40.56880569458008, "global_step": 303811, "epoch": 2510} {"train_loss": -43.22085952758789, "global_step": 303812, "epoch": 2510} {"train_loss": -42.67829513549805, "global_step": 303813, "epoch": 2510} {"train_loss": -41.767677307128906, "global_step": 303814, "epoch": 2510} {"train_loss": -44.030948638916016, "global_step": 303815, "epoch": 2510} {"train_loss": -41.943397521972656, "global_step": 303816, "epoch": 2510} {"train_loss": -43.53205871582031, "global_step": 303817, "epoch": 2510} {"train_loss": -42.99215316772461, "global_step": 303818, "epoch": 2510} {"train_loss": -42.46992111206055, "global_step": 303819, "epoch": 2510} {"train_loss": -43.31991958618164, "global_step": 303820, "epoch": 2510} {"train_loss": -42.64469528198242, "global_step": 303821, "epoch": 2510} {"train_loss": -43.37392807006836, "global_step": 303822, "epoch": 2510} {"train_loss": -42.2022590637207, "global_step": 303823, "epoch": 2510} {"train_loss": -42.4718132019043, "global_step": 303824, "epoch": 2510} {"train_loss": -42.998233795166016, "global_step": 303825, "epoch": 2510} {"train_loss": -42.21379852294922, "global_step": 303826, "epoch": 2510} {"train_loss": -43.54912185668945, "global_step": 303827, "epoch": 2510} {"train_loss": -42.28365707397461, "global_step": 303828, "epoch": 2510} {"train_loss": -43.60224151611328, "global_step": 303829, "epoch": 2510} {"train_loss": -42.42566684060846, "global_step": 303830, "epoch": 2510, "val_loss": 2679024.75} {"train_loss": -43.649539947509766, "global_step": 303831, "epoch": 2511} {"train_loss": -43.619293212890625, "global_step": 303832, "epoch": 2511} {"train_loss": -42.93067169189453, "global_step": 303833, "epoch": 2511} {"train_loss": -43.17629623413086, "global_step": 303834, "epoch": 2511} {"train_loss": -43.65940475463867, "global_step": 303835, "epoch": 2511} {"train_loss": -44.09623718261719, "global_step": 303836, "epoch": 2511} {"train_loss": -43.45106887817383, "global_step": 303837, "epoch": 2511} {"train_loss": -43.0390739440918, "global_step": 303838, "epoch": 2511} {"train_loss": -43.46485137939453, "global_step": 303839, "epoch": 2511} {"train_loss": -43.57060623168945, "global_step": 303840, "epoch": 2511} {"train_loss": -44.04556655883789, "global_step": 303841, "epoch": 2511} {"train_loss": -43.57640838623047, "global_step": 303842, "epoch": 2511} {"train_loss": -43.816646575927734, "global_step": 303843, "epoch": 2511} {"train_loss": -43.67826461791992, "global_step": 303844, "epoch": 2511} {"train_loss": -43.37612533569336, "global_step": 303845, "epoch": 2511} {"train_loss": -43.03499984741211, "global_step": 303846, "epoch": 2511} {"train_loss": -43.85392761230469, "global_step": 303847, "epoch": 2511} {"train_loss": -43.634891510009766, "global_step": 303848, "epoch": 2511} {"train_loss": -43.676353454589844, "global_step": 303849, "epoch": 2511} {"train_loss": -43.46866989135742, "global_step": 303850, "epoch": 2511} {"train_loss": -43.7210578918457, "global_step": 303851, "epoch": 2511} {"train_loss": -43.8917121887207, "global_step": 303852, "epoch": 2511} {"train_loss": -43.02980041503906, "global_step": 303853, "epoch": 2511} {"train_loss": -43.831329345703125, "global_step": 303854, "epoch": 2511} {"train_loss": -43.711463928222656, "global_step": 303855, "epoch": 2511} {"train_loss": -43.51670455932617, "global_step": 303856, "epoch": 2511} {"train_loss": -43.2812614440918, "global_step": 303857, "epoch": 2511} {"train_loss": -43.607479095458984, "global_step": 303858, "epoch": 2511} {"train_loss": -43.626953125, "global_step": 303859, "epoch": 2511} {"train_loss": -43.48405456542969, "global_step": 303860, "epoch": 2511} {"train_loss": -42.294525146484375, "global_step": 303861, "epoch": 2511} {"train_loss": -37.00642776489258, "global_step": 303862, "epoch": 2511} {"train_loss": -35.47146987915039, "global_step": 303863, "epoch": 2511} {"train_loss": -38.050838470458984, "global_step": 303864, "epoch": 2511} {"train_loss": -39.05442810058594, "global_step": 303865, "epoch": 2511} {"train_loss": -42.6821403503418, "global_step": 303866, "epoch": 2511} {"train_loss": -38.98406982421875, "global_step": 303867, "epoch": 2511} {"train_loss": -40.66661071777344, "global_step": 303868, "epoch": 2511} {"train_loss": -43.04044723510742, "global_step": 303869, "epoch": 2511} {"train_loss": -37.452789306640625, "global_step": 303870, "epoch": 2511} {"train_loss": -37.468666076660156, "global_step": 303871, "epoch": 2511} {"train_loss": -41.44166564941406, "global_step": 303872, "epoch": 2511} {"train_loss": -42.350772857666016, "global_step": 303873, "epoch": 2511} {"train_loss": -40.7844352722168, "global_step": 303874, "epoch": 2511} {"train_loss": -42.064632415771484, "global_step": 303875, "epoch": 2511} {"train_loss": -39.921348571777344, "global_step": 303876, "epoch": 2511} {"train_loss": -39.257266998291016, "global_step": 303877, "epoch": 2511} {"train_loss": -42.83784866333008, "global_step": 303878, "epoch": 2511} {"train_loss": -40.45441436767578, "global_step": 303879, "epoch": 2511} {"train_loss": -42.3779411315918, "global_step": 303880, "epoch": 2511} {"train_loss": -42.32428741455078, "global_step": 303881, "epoch": 2511} {"train_loss": -41.913848876953125, "global_step": 303882, "epoch": 2511} {"train_loss": -42.488128662109375, "global_step": 303883, "epoch": 2511} {"train_loss": -43.16328811645508, "global_step": 303884, "epoch": 2511} {"train_loss": -42.72468185424805, "global_step": 303885, "epoch": 2511} {"train_loss": -42.377315521240234, "global_step": 303886, "epoch": 2511} {"train_loss": -42.76595687866211, "global_step": 303887, "epoch": 2511} {"train_loss": -43.30511474609375, "global_step": 303888, "epoch": 2511} {"train_loss": -42.73067855834961, "global_step": 303889, "epoch": 2511} {"train_loss": -43.06925964355469, "global_step": 303890, "epoch": 2511} {"train_loss": -42.602508544921875, "global_step": 303891, "epoch": 2511} {"train_loss": -42.89937973022461, "global_step": 303892, "epoch": 2511} {"train_loss": -43.35371780395508, "global_step": 303893, "epoch": 2511} {"train_loss": -41.451473236083984, "global_step": 303894, "epoch": 2511} {"train_loss": -43.036678314208984, "global_step": 303895, "epoch": 2511} {"train_loss": -43.19171142578125, "global_step": 303896, "epoch": 2511} {"train_loss": -43.264644622802734, "global_step": 303897, "epoch": 2511} {"train_loss": -43.65693283081055, "global_step": 303898, "epoch": 2511} {"train_loss": -43.30489730834961, "global_step": 303899, "epoch": 2511} {"train_loss": -43.13358688354492, "global_step": 303900, "epoch": 2511} {"train_loss": -42.921566009521484, "global_step": 303901, "epoch": 2511} {"train_loss": -43.61295700073242, "global_step": 303902, "epoch": 2511} {"train_loss": -42.9779052734375, "global_step": 303903, "epoch": 2511} {"train_loss": -43.50918197631836, "global_step": 303904, "epoch": 2511} {"train_loss": -43.20286178588867, "global_step": 303905, "epoch": 2511} {"train_loss": -43.65692138671875, "global_step": 303906, "epoch": 2511} {"train_loss": -43.10934066772461, "global_step": 303907, "epoch": 2511} {"train_loss": -43.13102722167969, "global_step": 303908, "epoch": 2511} {"train_loss": -43.99959182739258, "global_step": 303909, "epoch": 2511} {"train_loss": -42.90776824951172, "global_step": 303910, "epoch": 2511} {"train_loss": -43.24830627441406, "global_step": 303911, "epoch": 2511} {"train_loss": -43.09135437011719, "global_step": 303912, "epoch": 2511} {"train_loss": -42.58811569213867, "global_step": 303913, "epoch": 2511} {"train_loss": -43.31234359741211, "global_step": 303914, "epoch": 2511} {"train_loss": -42.845481872558594, "global_step": 303915, "epoch": 2511} {"train_loss": -43.50200271606445, "global_step": 303916, "epoch": 2511} {"train_loss": -43.350643157958984, "global_step": 303917, "epoch": 2511} {"train_loss": -43.30604934692383, "global_step": 303918, "epoch": 2511} {"train_loss": -42.194881439208984, "global_step": 303919, "epoch": 2511} {"train_loss": -43.3949089050293, "global_step": 303920, "epoch": 2511} {"train_loss": -33.44158172607422, "global_step": 303921, "epoch": 2511} {"train_loss": -42.521339416503906, "global_step": 303922, "epoch": 2511} {"train_loss": -42.44178009033203, "global_step": 303923, "epoch": 2511} {"train_loss": -42.45825958251953, "global_step": 303924, "epoch": 2511} {"train_loss": -32.08584976196289, "global_step": 303925, "epoch": 2511} {"train_loss": -42.407894134521484, "global_step": 303926, "epoch": 2511} {"train_loss": -40.376399993896484, "global_step": 303927, "epoch": 2511} {"train_loss": -32.64422607421875, "global_step": 303928, "epoch": 2511} {"train_loss": -41.62790298461914, "global_step": 303929, "epoch": 2511} {"train_loss": -40.94654083251953, "global_step": 303930, "epoch": 2511} {"train_loss": -42.59084701538086, "global_step": 303931, "epoch": 2511} {"train_loss": -42.77647018432617, "global_step": 303932, "epoch": 2511} {"train_loss": -41.912296295166016, "global_step": 303933, "epoch": 2511} {"train_loss": -38.98395919799805, "global_step": 303934, "epoch": 2511} {"train_loss": -38.5371208190918, "global_step": 303935, "epoch": 2511} {"train_loss": -37.77815628051758, "global_step": 303936, "epoch": 2511} {"train_loss": -41.336936950683594, "global_step": 303937, "epoch": 2511} {"train_loss": -37.206398010253906, "global_step": 303938, "epoch": 2511} {"train_loss": -40.414310455322266, "global_step": 303939, "epoch": 2511} {"train_loss": -40.6411018371582, "global_step": 303940, "epoch": 2511} {"train_loss": -41.22784423828125, "global_step": 303941, "epoch": 2511} {"train_loss": -38.04304122924805, "global_step": 303942, "epoch": 2511} {"train_loss": -36.91646194458008, "global_step": 303943, "epoch": 2511} {"train_loss": -36.634132385253906, "global_step": 303944, "epoch": 2511} {"train_loss": -40.26116180419922, "global_step": 303945, "epoch": 2511} {"train_loss": -34.68016815185547, "global_step": 303946, "epoch": 2511} {"train_loss": -39.3829460144043, "global_step": 303947, "epoch": 2511} {"train_loss": -38.71528244018555, "global_step": 303948, "epoch": 2511} {"train_loss": -40.57719421386719, "global_step": 303949, "epoch": 2511} {"train_loss": -40.55601501464844, "global_step": 303950, "epoch": 2511} {"train_loss": -41.74981541278934, "global_step": 303951, "epoch": 2511, "val_loss": 3091099.25} {"train_loss": -40.79120635986328, "global_step": 303952, "epoch": 2512} {"train_loss": -39.87065505981445, "global_step": 303953, "epoch": 2512} {"train_loss": -40.9852409362793, "global_step": 303954, "epoch": 2512} {"train_loss": -41.12533187866211, "global_step": 303955, "epoch": 2512} {"train_loss": -39.64762496948242, "global_step": 303956, "epoch": 2512} {"train_loss": -41.061241149902344, "global_step": 303957, "epoch": 2512} {"train_loss": -40.38253402709961, "global_step": 303958, "epoch": 2512} {"train_loss": -41.48923873901367, "global_step": 303959, "epoch": 2512} {"train_loss": -41.99980163574219, "global_step": 303960, "epoch": 2512} {"train_loss": -41.68778991699219, "global_step": 303961, "epoch": 2512} {"train_loss": -41.48882293701172, "global_step": 303962, "epoch": 2512} {"train_loss": -38.59871292114258, "global_step": 303963, "epoch": 2512} {"train_loss": -42.22498321533203, "global_step": 303964, "epoch": 2512} {"train_loss": -41.054195404052734, "global_step": 303965, "epoch": 2512} {"train_loss": -41.53173828125, "global_step": 303966, "epoch": 2512} {"train_loss": -42.224273681640625, "global_step": 303967, "epoch": 2512} {"train_loss": -41.88124465942383, "global_step": 303968, "epoch": 2512} {"train_loss": -41.57965850830078, "global_step": 303969, "epoch": 2512} {"train_loss": -40.78379440307617, "global_step": 303970, "epoch": 2512} {"train_loss": -40.49787521362305, "global_step": 303971, "epoch": 2512} {"train_loss": -42.091400146484375, "global_step": 303972, "epoch": 2512} {"train_loss": -42.41611862182617, "global_step": 303973, "epoch": 2512} {"train_loss": -39.3488655090332, "global_step": 303974, "epoch": 2512} {"train_loss": -41.003719329833984, "global_step": 303975, "epoch": 2512} {"train_loss": -39.281776428222656, "global_step": 303976, "epoch": 2512} {"train_loss": -42.15085983276367, "global_step": 303977, "epoch": 2512} {"train_loss": -41.06818389892578, "global_step": 303978, "epoch": 2512} {"train_loss": -42.27772903442383, "global_step": 303979, "epoch": 2512} {"train_loss": -41.74787521362305, "global_step": 303980, "epoch": 2512} {"train_loss": -42.32115173339844, "global_step": 303981, "epoch": 2512} {"train_loss": -41.52739334106445, "global_step": 303982, "epoch": 2512} {"train_loss": -41.90902328491211, "global_step": 303983, "epoch": 2512} {"train_loss": -41.29127883911133, "global_step": 303984, "epoch": 2512} {"train_loss": -41.08686828613281, "global_step": 303985, "epoch": 2512} {"train_loss": -42.05664825439453, "global_step": 303986, "epoch": 2512} {"train_loss": -42.54658508300781, "global_step": 303987, "epoch": 2512} {"train_loss": -42.86492919921875, "global_step": 303988, "epoch": 2512} {"train_loss": -42.51152038574219, "global_step": 303989, "epoch": 2512} {"train_loss": -42.212974548339844, "global_step": 303990, "epoch": 2512} {"train_loss": -42.71826934814453, "global_step": 303991, "epoch": 2512} {"train_loss": -42.81449508666992, "global_step": 303992, "epoch": 2512} {"train_loss": -41.35774612426758, "global_step": 303993, "epoch": 2512} {"train_loss": -42.11851119995117, "global_step": 303994, "epoch": 2512} {"train_loss": -43.21735763549805, "global_step": 303995, "epoch": 2512} {"train_loss": -42.85990524291992, "global_step": 303996, "epoch": 2512} {"train_loss": -43.07046890258789, "global_step": 303997, "epoch": 2512} {"train_loss": -42.603721618652344, "global_step": 303998, "epoch": 2512} {"train_loss": -43.31890869140625, "global_step": 303999, "epoch": 2512} {"train_loss": -42.06215286254883, "global_step": 304000, "epoch": 2512} {"train_loss": -43.515838623046875, "global_step": 304001, "epoch": 2512} {"train_loss": -39.36176300048828, "global_step": 304002, "epoch": 2512} {"train_loss": -43.386775970458984, "global_step": 304003, "epoch": 2512} {"train_loss": -42.12776565551758, "global_step": 304004, "epoch": 2512} {"train_loss": -40.96413040161133, "global_step": 304005, "epoch": 2512} {"train_loss": -42.376983642578125, "global_step": 304006, "epoch": 2512} {"train_loss": -43.1090087890625, "global_step": 304007, "epoch": 2512} {"train_loss": -43.68241500854492, "global_step": 304008, "epoch": 2512} {"train_loss": -42.04219055175781, "global_step": 304009, "epoch": 2512} {"train_loss": -42.12827682495117, "global_step": 304010, "epoch": 2512} {"train_loss": -43.09035110473633, "global_step": 304011, "epoch": 2512} {"train_loss": -43.02402877807617, "global_step": 304012, "epoch": 2512} {"train_loss": -43.672664642333984, "global_step": 304013, "epoch": 2512} {"train_loss": -43.48337936401367, "global_step": 304014, "epoch": 2512} {"train_loss": -43.304840087890625, "global_step": 304015, "epoch": 2512} {"train_loss": -42.377376556396484, "global_step": 304016, "epoch": 2512} {"train_loss": -43.460479736328125, "global_step": 304017, "epoch": 2512} {"train_loss": -42.682315826416016, "global_step": 304018, "epoch": 2512} {"train_loss": -42.767005920410156, "global_step": 304019, "epoch": 2512} {"train_loss": -43.41579818725586, "global_step": 304020, "epoch": 2512} {"train_loss": -43.50118637084961, "global_step": 304021, "epoch": 2512} {"train_loss": -40.935935974121094, "global_step": 304022, "epoch": 2512} {"train_loss": -43.326988220214844, "global_step": 304023, "epoch": 2512} {"train_loss": -43.52238082885742, "global_step": 304024, "epoch": 2512} {"train_loss": -43.16804885864258, "global_step": 304025, "epoch": 2512} {"train_loss": -38.17475509643555, "global_step": 304026, "epoch": 2512} {"train_loss": -43.293331146240234, "global_step": 304027, "epoch": 2512} {"train_loss": -43.782894134521484, "global_step": 304028, "epoch": 2512} {"train_loss": -43.183738708496094, "global_step": 304029, "epoch": 2512} {"train_loss": -43.787288665771484, "global_step": 304030, "epoch": 2512} {"train_loss": -43.821815490722656, "global_step": 304031, "epoch": 2512} {"train_loss": -43.46378707885742, "global_step": 304032, "epoch": 2512} {"train_loss": -42.876373291015625, "global_step": 304033, "epoch": 2512} {"train_loss": -42.886749267578125, "global_step": 304034, "epoch": 2512} {"train_loss": -42.75450897216797, "global_step": 304035, "epoch": 2512} {"train_loss": -41.5692138671875, "global_step": 304036, "epoch": 2512} {"train_loss": -43.98856735229492, "global_step": 304037, "epoch": 2512} {"train_loss": -43.61748123168945, "global_step": 304038, "epoch": 2512} {"train_loss": -44.105194091796875, "global_step": 304039, "epoch": 2512} {"train_loss": -43.07591247558594, "global_step": 304040, "epoch": 2512} {"train_loss": -43.70454406738281, "global_step": 304041, "epoch": 2512} {"train_loss": -43.716861724853516, "global_step": 304042, "epoch": 2512} {"train_loss": -43.85462951660156, "global_step": 304043, "epoch": 2512} {"train_loss": -43.55027389526367, "global_step": 304044, "epoch": 2512} {"train_loss": -43.55156326293945, "global_step": 304045, "epoch": 2512} {"train_loss": -42.529781341552734, "global_step": 304046, "epoch": 2512} {"train_loss": -43.8425407409668, "global_step": 304047, "epoch": 2512} {"train_loss": -43.18488311767578, "global_step": 304048, "epoch": 2512} {"train_loss": -42.4201774597168, "global_step": 304049, "epoch": 2512} {"train_loss": -42.518287658691406, "global_step": 304050, "epoch": 2512} {"train_loss": -43.575679779052734, "global_step": 304051, "epoch": 2512} {"train_loss": -43.26600646972656, "global_step": 304052, "epoch": 2512} {"train_loss": -44.05622100830078, "global_step": 304053, "epoch": 2512} {"train_loss": -43.528053283691406, "global_step": 304054, "epoch": 2512} {"train_loss": -42.093055725097656, "global_step": 304055, "epoch": 2512} {"train_loss": -42.88563919067383, "global_step": 304056, "epoch": 2512} {"train_loss": -42.67523956298828, "global_step": 304057, "epoch": 2512} {"train_loss": -42.66119384765625, "global_step": 304058, "epoch": 2512} {"train_loss": -40.61750030517578, "global_step": 304059, "epoch": 2512} {"train_loss": -43.336971282958984, "global_step": 304060, "epoch": 2512} {"train_loss": -37.800628662109375, "global_step": 304061, "epoch": 2512} {"train_loss": -41.4217643737793, "global_step": 304062, "epoch": 2512} {"train_loss": -41.14189529418945, "global_step": 304063, "epoch": 2512} {"train_loss": -42.98802947998047, "global_step": 304064, "epoch": 2512} {"train_loss": -40.75185775756836, "global_step": 304065, "epoch": 2512} {"train_loss": -43.60107421875, "global_step": 304066, "epoch": 2512} {"train_loss": -40.0184326171875, "global_step": 304067, "epoch": 2512} {"train_loss": -41.45362091064453, "global_step": 304068, "epoch": 2512} {"train_loss": -42.67912673950195, "global_step": 304069, "epoch": 2512} {"train_loss": -36.34865951538086, "global_step": 304070, "epoch": 2512} {"train_loss": -39.982398986816406, "global_step": 304071, "epoch": 2512} {"train_loss": -42.181073496164366, "global_step": 304072, "epoch": 2512, "val_loss": 2498691.75} {"train_loss": -43.1396598815918, "global_step": 304073, "epoch": 2513} {"train_loss": -38.305030822753906, "global_step": 304074, "epoch": 2513} {"train_loss": -42.44218063354492, "global_step": 304075, "epoch": 2513} {"train_loss": -42.5656852722168, "global_step": 304076, "epoch": 2513} {"train_loss": -40.90687942504883, "global_step": 304077, "epoch": 2513} {"train_loss": -40.926429748535156, "global_step": 304078, "epoch": 2513} {"train_loss": -42.02546310424805, "global_step": 304079, "epoch": 2513} {"train_loss": -42.560298919677734, "global_step": 304080, "epoch": 2513} {"train_loss": -42.3942756652832, "global_step": 304081, "epoch": 2513} {"train_loss": -42.152191162109375, "global_step": 304082, "epoch": 2513} {"train_loss": -40.60811233520508, "global_step": 304083, "epoch": 2513} {"train_loss": -42.51312255859375, "global_step": 304084, "epoch": 2513} {"train_loss": -41.87888717651367, "global_step": 304085, "epoch": 2513} {"train_loss": -39.23208236694336, "global_step": 304086, "epoch": 2513} {"train_loss": -40.25263595581055, "global_step": 304087, "epoch": 2513} {"train_loss": -42.263301849365234, "global_step": 304088, "epoch": 2513} {"train_loss": -42.95766830444336, "global_step": 304089, "epoch": 2513} {"train_loss": -43.06205749511719, "global_step": 304090, "epoch": 2513} {"train_loss": -42.581356048583984, "global_step": 304091, "epoch": 2513} {"train_loss": -42.76223373413086, "global_step": 304092, "epoch": 2513} {"train_loss": -43.08187484741211, "global_step": 304093, "epoch": 2513} {"train_loss": -42.52118682861328, "global_step": 304094, "epoch": 2513} {"train_loss": -40.40436935424805, "global_step": 304095, "epoch": 2513} {"train_loss": -42.12801742553711, "global_step": 304096, "epoch": 2513} {"train_loss": -40.864418029785156, "global_step": 304097, "epoch": 2513} {"train_loss": -42.86037826538086, "global_step": 304098, "epoch": 2513} {"train_loss": -42.74649429321289, "global_step": 304099, "epoch": 2513} {"train_loss": -41.84919357299805, "global_step": 304100, "epoch": 2513} {"train_loss": -42.016761779785156, "global_step": 304101, "epoch": 2513} {"train_loss": -41.933685302734375, "global_step": 304102, "epoch": 2513} {"train_loss": -40.2791633605957, "global_step": 304103, "epoch": 2513} {"train_loss": -42.4635009765625, "global_step": 304104, "epoch": 2513} {"train_loss": -41.85029220581055, "global_step": 304105, "epoch": 2513} {"train_loss": -43.37559127807617, "global_step": 304106, "epoch": 2513} {"train_loss": -41.68082809448242, "global_step": 304107, "epoch": 2513} {"train_loss": -41.99299240112305, "global_step": 304108, "epoch": 2513} {"train_loss": -41.91196823120117, "global_step": 304109, "epoch": 2513} {"train_loss": -42.47872543334961, "global_step": 304110, "epoch": 2513} {"train_loss": -40.92591094970703, "global_step": 304111, "epoch": 2513} {"train_loss": -42.321937561035156, "global_step": 304112, "epoch": 2513} {"train_loss": -41.996517181396484, "global_step": 304113, "epoch": 2513} {"train_loss": -43.24602127075195, "global_step": 304114, "epoch": 2513} {"train_loss": -41.179595947265625, "global_step": 304115, "epoch": 2513} {"train_loss": -42.79520797729492, "global_step": 304116, "epoch": 2513} {"train_loss": -43.516563415527344, "global_step": 304117, "epoch": 2513} {"train_loss": -42.18330383300781, "global_step": 304118, "epoch": 2513} {"train_loss": -42.30642318725586, "global_step": 304119, "epoch": 2513} {"train_loss": -42.84260177612305, "global_step": 304120, "epoch": 2513} {"train_loss": -41.84395217895508, "global_step": 304121, "epoch": 2513} {"train_loss": -42.889312744140625, "global_step": 304122, "epoch": 2513} {"train_loss": -42.771366119384766, "global_step": 304123, "epoch": 2513} {"train_loss": -43.35013198852539, "global_step": 304124, "epoch": 2513} {"train_loss": -43.45674133300781, "global_step": 304125, "epoch": 2513} {"train_loss": -41.52177047729492, "global_step": 304126, "epoch": 2513} {"train_loss": -43.278724670410156, "global_step": 304127, "epoch": 2513} {"train_loss": -42.74355697631836, "global_step": 304128, "epoch": 2513} {"train_loss": -43.15641403198242, "global_step": 304129, "epoch": 2513} {"train_loss": -43.23530960083008, "global_step": 304130, "epoch": 2513} {"train_loss": -43.17805862426758, "global_step": 304131, "epoch": 2513} {"train_loss": -43.23408889770508, "global_step": 304132, "epoch": 2513} {"train_loss": -42.493385314941406, "global_step": 304133, "epoch": 2513} {"train_loss": -43.37411117553711, "global_step": 304134, "epoch": 2513} {"train_loss": -42.84817123413086, "global_step": 304135, "epoch": 2513} {"train_loss": -43.31685256958008, "global_step": 304136, "epoch": 2513} {"train_loss": -43.013916015625, "global_step": 304137, "epoch": 2513} {"train_loss": -42.75518035888672, "global_step": 304138, "epoch": 2513} {"train_loss": -42.60963439941406, "global_step": 304139, "epoch": 2513} {"train_loss": -43.08149337768555, "global_step": 304140, "epoch": 2513} {"train_loss": -43.23615646362305, "global_step": 304141, "epoch": 2513} {"train_loss": -42.94542694091797, "global_step": 304142, "epoch": 2513} {"train_loss": -43.00046920776367, "global_step": 304143, "epoch": 2513} {"train_loss": -42.57722091674805, "global_step": 304144, "epoch": 2513} {"train_loss": -38.853336334228516, "global_step": 304145, "epoch": 2513} {"train_loss": -41.92816162109375, "global_step": 304146, "epoch": 2513} {"train_loss": -43.27152633666992, "global_step": 304147, "epoch": 2513} {"train_loss": -43.010128021240234, "global_step": 304148, "epoch": 2513} {"train_loss": -43.178558349609375, "global_step": 304149, "epoch": 2513} {"train_loss": -42.27765655517578, "global_step": 304150, "epoch": 2513} {"train_loss": -39.92068862915039, "global_step": 304151, "epoch": 2513} {"train_loss": -42.73029708862305, "global_step": 304152, "epoch": 2513} {"train_loss": -44.0206298828125, "global_step": 304153, "epoch": 2513} {"train_loss": -43.28194808959961, "global_step": 304154, "epoch": 2513} {"train_loss": -42.31501388549805, "global_step": 304155, "epoch": 2513} {"train_loss": -43.27218246459961, "global_step": 304156, "epoch": 2513} {"train_loss": -42.963043212890625, "global_step": 304157, "epoch": 2513} {"train_loss": -43.84750747680664, "global_step": 304158, "epoch": 2513} {"train_loss": -43.60543441772461, "global_step": 304159, "epoch": 2513} {"train_loss": -42.2362174987793, "global_step": 304160, "epoch": 2513} {"train_loss": -42.874000549316406, "global_step": 304161, "epoch": 2513} {"train_loss": -42.60447311401367, "global_step": 304162, "epoch": 2513} {"train_loss": -43.04975891113281, "global_step": 304163, "epoch": 2513} {"train_loss": -41.60182189941406, "global_step": 304164, "epoch": 2513} {"train_loss": -40.75397872924805, "global_step": 304165, "epoch": 2513} {"train_loss": -43.720184326171875, "global_step": 304166, "epoch": 2513} {"train_loss": -43.39411544799805, "global_step": 304167, "epoch": 2513} {"train_loss": -44.21794128417969, "global_step": 304168, "epoch": 2513} {"train_loss": -43.88588333129883, "global_step": 304169, "epoch": 2513} {"train_loss": -43.38502883911133, "global_step": 304170, "epoch": 2513} {"train_loss": -43.9705924987793, "global_step": 304171, "epoch": 2513} {"train_loss": -43.48417663574219, "global_step": 304172, "epoch": 2513} {"train_loss": -40.86983871459961, "global_step": 304173, "epoch": 2513} {"train_loss": -43.4024772644043, "global_step": 304174, "epoch": 2513} {"train_loss": -43.48057174682617, "global_step": 304175, "epoch": 2513} {"train_loss": -42.731990814208984, "global_step": 304176, "epoch": 2513} {"train_loss": -42.29014205932617, "global_step": 304177, "epoch": 2513} {"train_loss": -42.09795379638672, "global_step": 304178, "epoch": 2513} {"train_loss": -42.577213287353516, "global_step": 304179, "epoch": 2513} {"train_loss": -42.344173431396484, "global_step": 304180, "epoch": 2513} {"train_loss": -42.58359909057617, "global_step": 304181, "epoch": 2513} {"train_loss": -43.04212188720703, "global_step": 304182, "epoch": 2513} {"train_loss": -41.13288497924805, "global_step": 304183, "epoch": 2513} {"train_loss": -41.599159240722656, "global_step": 304184, "epoch": 2513} {"train_loss": -42.34724044799805, "global_step": 304185, "epoch": 2513} {"train_loss": -42.85420608520508, "global_step": 304186, "epoch": 2513} {"train_loss": -43.72279357910156, "global_step": 304187, "epoch": 2513} {"train_loss": -42.379119873046875, "global_step": 304188, "epoch": 2513} {"train_loss": -41.29817581176758, "global_step": 304189, "epoch": 2513} {"train_loss": -41.715431213378906, "global_step": 304190, "epoch": 2513} {"train_loss": -42.32927322387695, "global_step": 304191, "epoch": 2513} {"train_loss": -41.525142669677734, "global_step": 304192, "epoch": 2513} {"train_loss": -42.394547391528924, "global_step": 304193, "epoch": 2513, "val_loss": 2532181.75} {"train_loss": -41.48335647583008, "global_step": 304194, "epoch": 2514} {"train_loss": -39.431427001953125, "global_step": 304195, "epoch": 2514} {"train_loss": -38.36188507080078, "global_step": 304196, "epoch": 2514} {"train_loss": -39.285518646240234, "global_step": 304197, "epoch": 2514} {"train_loss": -41.68842697143555, "global_step": 304198, "epoch": 2514} {"train_loss": -39.13262176513672, "global_step": 304199, "epoch": 2514} {"train_loss": -39.203975677490234, "global_step": 304200, "epoch": 2514} {"train_loss": -41.03806686401367, "global_step": 304201, "epoch": 2514} {"train_loss": -41.342803955078125, "global_step": 304202, "epoch": 2514} {"train_loss": -40.01141357421875, "global_step": 304203, "epoch": 2514} {"train_loss": -41.632503509521484, "global_step": 304204, "epoch": 2514} {"train_loss": -41.883270263671875, "global_step": 304205, "epoch": 2514} {"train_loss": -41.577816009521484, "global_step": 304206, "epoch": 2514} {"train_loss": -41.745967864990234, "global_step": 304207, "epoch": 2514} {"train_loss": -40.75648880004883, "global_step": 304208, "epoch": 2514} {"train_loss": -41.2065544128418, "global_step": 304209, "epoch": 2514} {"train_loss": -42.373878479003906, "global_step": 304210, "epoch": 2514} {"train_loss": -42.665504455566406, "global_step": 304211, "epoch": 2514} {"train_loss": -41.638824462890625, "global_step": 304212, "epoch": 2514} {"train_loss": -41.729549407958984, "global_step": 304213, "epoch": 2514} {"train_loss": -42.34368133544922, "global_step": 304214, "epoch": 2514} {"train_loss": -41.686012268066406, "global_step": 304215, "epoch": 2514} {"train_loss": -42.839637756347656, "global_step": 304216, "epoch": 2514} {"train_loss": -43.16652297973633, "global_step": 304217, "epoch": 2514} {"train_loss": -43.10746383666992, "global_step": 304218, "epoch": 2514} {"train_loss": -43.024078369140625, "global_step": 304219, "epoch": 2514} {"train_loss": -43.36841583251953, "global_step": 304220, "epoch": 2514} {"train_loss": -42.35646438598633, "global_step": 304221, "epoch": 2514} {"train_loss": -43.29695510864258, "global_step": 304222, "epoch": 2514} {"train_loss": -43.2639045715332, "global_step": 304223, "epoch": 2514} {"train_loss": -42.380062103271484, "global_step": 304224, "epoch": 2514} {"train_loss": -43.4299430847168, "global_step": 304225, "epoch": 2514} {"train_loss": -42.74453353881836, "global_step": 304226, "epoch": 2514} {"train_loss": -43.250640869140625, "global_step": 304227, "epoch": 2514} {"train_loss": -42.94893264770508, "global_step": 304228, "epoch": 2514} {"train_loss": -39.94951248168945, "global_step": 304229, "epoch": 2514} {"train_loss": -42.439422607421875, "global_step": 304230, "epoch": 2514} {"train_loss": -43.14250946044922, "global_step": 304231, "epoch": 2514} {"train_loss": -42.793941497802734, "global_step": 304232, "epoch": 2514} {"train_loss": -43.898963928222656, "global_step": 304233, "epoch": 2514} {"train_loss": -43.4858283996582, "global_step": 304234, "epoch": 2514} {"train_loss": -43.47415542602539, "global_step": 304235, "epoch": 2514} {"train_loss": -43.451393127441406, "global_step": 304236, "epoch": 2514} {"train_loss": -43.28192138671875, "global_step": 304237, "epoch": 2514} {"train_loss": -42.70172882080078, "global_step": 304238, "epoch": 2514} {"train_loss": -43.034236907958984, "global_step": 304239, "epoch": 2514} {"train_loss": -43.562286376953125, "global_step": 304240, "epoch": 2514} {"train_loss": -42.71569061279297, "global_step": 304241, "epoch": 2514} {"train_loss": -43.817237854003906, "global_step": 304242, "epoch": 2514} {"train_loss": -44.04834747314453, "global_step": 304243, "epoch": 2514} {"train_loss": -43.4958381652832, "global_step": 304244, "epoch": 2514} {"train_loss": -43.55927658081055, "global_step": 304245, "epoch": 2514} {"train_loss": -43.2381706237793, "global_step": 304246, "epoch": 2514} {"train_loss": -43.308475494384766, "global_step": 304247, "epoch": 2514} {"train_loss": -43.22330856323242, "global_step": 304248, "epoch": 2514} {"train_loss": -43.80879592895508, "global_step": 304249, "epoch": 2514} {"train_loss": -44.058895111083984, "global_step": 304250, "epoch": 2514} {"train_loss": -43.33879852294922, "global_step": 304251, "epoch": 2514} {"train_loss": -43.09748077392578, "global_step": 304252, "epoch": 2514} {"train_loss": -43.460487365722656, "global_step": 304253, "epoch": 2514} {"train_loss": -43.94451904296875, "global_step": 304254, "epoch": 2514} {"train_loss": -43.584228515625, "global_step": 304255, "epoch": 2514} {"train_loss": -43.83527374267578, "global_step": 304256, "epoch": 2514} {"train_loss": -43.5422248840332, "global_step": 304257, "epoch": 2514} {"train_loss": -42.87737274169922, "global_step": 304258, "epoch": 2514} {"train_loss": -43.772884368896484, "global_step": 304259, "epoch": 2514} {"train_loss": -43.68571853637695, "global_step": 304260, "epoch": 2514} {"train_loss": -43.85055160522461, "global_step": 304261, "epoch": 2514} {"train_loss": -44.00366973876953, "global_step": 304262, "epoch": 2514} {"train_loss": -44.114044189453125, "global_step": 304263, "epoch": 2514} {"train_loss": -44.045021057128906, "global_step": 304264, "epoch": 2514} {"train_loss": -44.12025833129883, "global_step": 304265, "epoch": 2514} {"train_loss": -44.48728561401367, "global_step": 304266, "epoch": 2514} {"train_loss": -44.05784225463867, "global_step": 304267, "epoch": 2514} {"train_loss": -44.49304962158203, "global_step": 304268, "epoch": 2514} {"train_loss": -43.81456756591797, "global_step": 304269, "epoch": 2514} {"train_loss": -43.65081787109375, "global_step": 304270, "epoch": 2514} {"train_loss": -44.000614166259766, "global_step": 304271, "epoch": 2514} {"train_loss": -43.94670867919922, "global_step": 304272, "epoch": 2514} {"train_loss": -43.75203323364258, "global_step": 304273, "epoch": 2514} {"train_loss": -43.99757385253906, "global_step": 304274, "epoch": 2514} {"train_loss": -44.343719482421875, "global_step": 304275, "epoch": 2514} {"train_loss": -44.6051139831543, "global_step": 304276, "epoch": 2514} {"train_loss": -43.51597213745117, "global_step": 304277, "epoch": 2514} {"train_loss": -42.82957077026367, "global_step": 304278, "epoch": 2514} {"train_loss": -43.0693244934082, "global_step": 304279, "epoch": 2514} {"train_loss": -43.96592330932617, "global_step": 304280, "epoch": 2514} {"train_loss": -44.239437103271484, "global_step": 304281, "epoch": 2514} {"train_loss": -42.981971740722656, "global_step": 304282, "epoch": 2514} {"train_loss": -43.0588493347168, "global_step": 304283, "epoch": 2514} {"train_loss": -43.032859802246094, "global_step": 304284, "epoch": 2514} {"train_loss": -43.554447174072266, "global_step": 304285, "epoch": 2514} {"train_loss": -42.51882553100586, "global_step": 304286, "epoch": 2514} {"train_loss": -41.22724533081055, "global_step": 304287, "epoch": 2514} {"train_loss": -41.45479202270508, "global_step": 304288, "epoch": 2514} {"train_loss": -41.14748001098633, "global_step": 304289, "epoch": 2514} {"train_loss": -41.00080108642578, "global_step": 304290, "epoch": 2514} {"train_loss": -41.0156364440918, "global_step": 304291, "epoch": 2514} {"train_loss": -42.650047302246094, "global_step": 304292, "epoch": 2514} {"train_loss": -40.70137023925781, "global_step": 304293, "epoch": 2514} {"train_loss": -40.27942657470703, "global_step": 304294, "epoch": 2514} {"train_loss": -42.24032974243164, "global_step": 304295, "epoch": 2514} {"train_loss": -42.43508529663086, "global_step": 304296, "epoch": 2514} {"train_loss": -41.626075744628906, "global_step": 304297, "epoch": 2514} {"train_loss": -39.87868881225586, "global_step": 304298, "epoch": 2514} {"train_loss": -41.94377136230469, "global_step": 304299, "epoch": 2514} {"train_loss": -40.3936882019043, "global_step": 304300, "epoch": 2514} {"train_loss": -40.34359359741211, "global_step": 304301, "epoch": 2514} {"train_loss": -42.34773635864258, "global_step": 304302, "epoch": 2514} {"train_loss": -41.38772201538086, "global_step": 304303, "epoch": 2514} {"train_loss": -39.297183990478516, "global_step": 304304, "epoch": 2514} {"train_loss": -38.853302001953125, "global_step": 304305, "epoch": 2514} {"train_loss": -42.49019241333008, "global_step": 304306, "epoch": 2514} {"train_loss": -39.08706283569336, "global_step": 304307, "epoch": 2514} {"train_loss": -39.90565872192383, "global_step": 304308, "epoch": 2514} {"train_loss": -42.29937744140625, "global_step": 304309, "epoch": 2514} {"train_loss": -40.91997146606445, "global_step": 304310, "epoch": 2514} {"train_loss": -42.53886795043945, "global_step": 304311, "epoch": 2514} {"train_loss": -42.497352600097656, "global_step": 304312, "epoch": 2514} {"train_loss": -42.96262741088867, "global_step": 304313, "epoch": 2514} {"train_loss": -42.47898104959283, "global_step": 304314, "epoch": 2514, "val_loss": 2708880.0} {"train_loss": -42.344173431396484, "global_step": 304315, "epoch": 2515} {"train_loss": -42.932220458984375, "global_step": 304316, "epoch": 2515} {"train_loss": -42.586185455322266, "global_step": 304317, "epoch": 2515} {"train_loss": -43.18412399291992, "global_step": 304318, "epoch": 2515} {"train_loss": -42.46209716796875, "global_step": 304319, "epoch": 2515} {"train_loss": -42.76930618286133, "global_step": 304320, "epoch": 2515} {"train_loss": -42.9815559387207, "global_step": 304321, "epoch": 2515} {"train_loss": -43.09670639038086, "global_step": 304322, "epoch": 2515} {"train_loss": -42.875335693359375, "global_step": 304323, "epoch": 2515} {"train_loss": -42.76216506958008, "global_step": 304324, "epoch": 2515} {"train_loss": -42.76215744018555, "global_step": 304325, "epoch": 2515} {"train_loss": -43.086036682128906, "global_step": 304326, "epoch": 2515} {"train_loss": -42.80072021484375, "global_step": 304327, "epoch": 2515} {"train_loss": -43.54989242553711, "global_step": 304328, "epoch": 2515} {"train_loss": -42.45989990234375, "global_step": 304329, "epoch": 2515} {"train_loss": -42.50333023071289, "global_step": 304330, "epoch": 2515} {"train_loss": -43.704925537109375, "global_step": 304331, "epoch": 2515} {"train_loss": -41.870052337646484, "global_step": 304332, "epoch": 2515} {"train_loss": -42.652435302734375, "global_step": 304333, "epoch": 2515} {"train_loss": -43.05707931518555, "global_step": 304334, "epoch": 2515} {"train_loss": -43.1013298034668, "global_step": 304335, "epoch": 2515} {"train_loss": -43.27389144897461, "global_step": 304336, "epoch": 2515} {"train_loss": -43.16815185546875, "global_step": 304337, "epoch": 2515} {"train_loss": -42.84837341308594, "global_step": 304338, "epoch": 2515} {"train_loss": -41.077327728271484, "global_step": 304339, "epoch": 2515} {"train_loss": -43.710845947265625, "global_step": 304340, "epoch": 2515} {"train_loss": -41.8050422668457, "global_step": 304341, "epoch": 2515} {"train_loss": -43.15696334838867, "global_step": 304342, "epoch": 2515} {"train_loss": -43.350067138671875, "global_step": 304343, "epoch": 2515} {"train_loss": -42.7238655090332, "global_step": 304344, "epoch": 2515} {"train_loss": -43.6637077331543, "global_step": 304345, "epoch": 2515} {"train_loss": -43.9473762512207, "global_step": 304346, "epoch": 2515} {"train_loss": -42.52814865112305, "global_step": 304347, "epoch": 2515} {"train_loss": -43.40144348144531, "global_step": 304348, "epoch": 2515} {"train_loss": -43.97744369506836, "global_step": 304349, "epoch": 2515} {"train_loss": -43.09713363647461, "global_step": 304350, "epoch": 2515} {"train_loss": -42.38077163696289, "global_step": 304351, "epoch": 2515} {"train_loss": -43.23344039916992, "global_step": 304352, "epoch": 2515} {"train_loss": -43.38553237915039, "global_step": 304353, "epoch": 2515} {"train_loss": -42.813228607177734, "global_step": 304354, "epoch": 2515} {"train_loss": -43.46187973022461, "global_step": 304355, "epoch": 2515} {"train_loss": -43.01170349121094, "global_step": 304356, "epoch": 2515} {"train_loss": -43.29388427734375, "global_step": 304357, "epoch": 2515} {"train_loss": -41.6522331237793, "global_step": 304358, "epoch": 2515} {"train_loss": -42.33968734741211, "global_step": 304359, "epoch": 2515} {"train_loss": -43.5716438293457, "global_step": 304360, "epoch": 2515} {"train_loss": -43.72703170776367, "global_step": 304361, "epoch": 2515} {"train_loss": -42.79623031616211, "global_step": 304362, "epoch": 2515} {"train_loss": -43.651649475097656, "global_step": 304363, "epoch": 2515} {"train_loss": -42.9355583190918, "global_step": 304364, "epoch": 2515} {"train_loss": -43.3093147277832, "global_step": 304365, "epoch": 2515} {"train_loss": -43.2419319152832, "global_step": 304366, "epoch": 2515} {"train_loss": -43.94254684448242, "global_step": 304367, "epoch": 2515} {"train_loss": -43.6845588684082, "global_step": 304368, "epoch": 2515} {"train_loss": -42.67302322387695, "global_step": 304369, "epoch": 2515} {"train_loss": -43.15869140625, "global_step": 304370, "epoch": 2515} {"train_loss": -44.064552307128906, "global_step": 304371, "epoch": 2515} {"train_loss": -43.08930587768555, "global_step": 304372, "epoch": 2515} {"train_loss": -42.26578903198242, "global_step": 304373, "epoch": 2515} {"train_loss": -43.64590072631836, "global_step": 304374, "epoch": 2515} {"train_loss": -42.56239700317383, "global_step": 304375, "epoch": 2515} {"train_loss": -43.35509490966797, "global_step": 304376, "epoch": 2515} {"train_loss": -43.630821228027344, "global_step": 304377, "epoch": 2515} {"train_loss": -42.886627197265625, "global_step": 304378, "epoch": 2515} {"train_loss": -42.59558868408203, "global_step": 304379, "epoch": 2515} {"train_loss": -43.250640869140625, "global_step": 304380, "epoch": 2515} {"train_loss": -43.974342346191406, "global_step": 304381, "epoch": 2515} {"train_loss": -43.43947219848633, "global_step": 304382, "epoch": 2515} {"train_loss": -43.67015838623047, "global_step": 304383, "epoch": 2515} {"train_loss": -44.07527160644531, "global_step": 304384, "epoch": 2515} {"train_loss": -43.19755172729492, "global_step": 304385, "epoch": 2515} {"train_loss": -42.789649963378906, "global_step": 304386, "epoch": 2515} {"train_loss": -43.9898796081543, "global_step": 304387, "epoch": 2515} {"train_loss": -43.98647689819336, "global_step": 304388, "epoch": 2515} {"train_loss": -42.81147003173828, "global_step": 304389, "epoch": 2515} {"train_loss": -43.70550537109375, "global_step": 304390, "epoch": 2515} {"train_loss": -43.68490219116211, "global_step": 304391, "epoch": 2515} {"train_loss": -43.613258361816406, "global_step": 304392, "epoch": 2515} {"train_loss": -43.44979476928711, "global_step": 304393, "epoch": 2515} {"train_loss": -43.64838790893555, "global_step": 304394, "epoch": 2515} {"train_loss": -43.05264663696289, "global_step": 304395, "epoch": 2515} {"train_loss": -43.14357376098633, "global_step": 304396, "epoch": 2515} {"train_loss": -43.871368408203125, "global_step": 304397, "epoch": 2515} {"train_loss": -43.67527389526367, "global_step": 304398, "epoch": 2515} {"train_loss": -43.579811096191406, "global_step": 304399, "epoch": 2515} {"train_loss": -44.11564254760742, "global_step": 304400, "epoch": 2515} {"train_loss": -41.290103912353516, "global_step": 304401, "epoch": 2515} {"train_loss": -43.41431427001953, "global_step": 304402, "epoch": 2515} {"train_loss": -44.001888275146484, "global_step": 304403, "epoch": 2515} {"train_loss": -43.03175735473633, "global_step": 304404, "epoch": 2515} {"train_loss": -39.77218246459961, "global_step": 304405, "epoch": 2515} {"train_loss": -39.21826934814453, "global_step": 304406, "epoch": 2515} {"train_loss": -38.46718215942383, "global_step": 304407, "epoch": 2515} {"train_loss": -39.4001350402832, "global_step": 304408, "epoch": 2515} {"train_loss": -41.5606575012207, "global_step": 304409, "epoch": 2515} {"train_loss": -43.19829177856445, "global_step": 304410, "epoch": 2515} {"train_loss": -42.121543884277344, "global_step": 304411, "epoch": 2515} {"train_loss": -40.80134201049805, "global_step": 304412, "epoch": 2515} {"train_loss": -42.49421691894531, "global_step": 304413, "epoch": 2515} {"train_loss": -42.60047149658203, "global_step": 304414, "epoch": 2515} {"train_loss": -42.82131576538086, "global_step": 304415, "epoch": 2515} {"train_loss": -43.27266311645508, "global_step": 304416, "epoch": 2515} {"train_loss": -42.633155822753906, "global_step": 304417, "epoch": 2515} {"train_loss": -42.97017288208008, "global_step": 304418, "epoch": 2515} {"train_loss": -43.280391693115234, "global_step": 304419, "epoch": 2515} {"train_loss": -43.15047836303711, "global_step": 304420, "epoch": 2515} {"train_loss": -41.080162048339844, "global_step": 304421, "epoch": 2515} {"train_loss": -43.06124496459961, "global_step": 304422, "epoch": 2515} {"train_loss": -43.620452880859375, "global_step": 304423, "epoch": 2515} {"train_loss": -42.97432327270508, "global_step": 304424, "epoch": 2515} {"train_loss": -43.42549133300781, "global_step": 304425, "epoch": 2515} {"train_loss": -43.40668869018555, "global_step": 304426, "epoch": 2515} {"train_loss": -43.56789779663086, "global_step": 304427, "epoch": 2515} {"train_loss": -42.386741638183594, "global_step": 304428, "epoch": 2515} {"train_loss": -42.88360595703125, "global_step": 304429, "epoch": 2515} {"train_loss": -38.8457145690918, "global_step": 304430, "epoch": 2515} {"train_loss": -41.10225296020508, "global_step": 304431, "epoch": 2515} {"train_loss": -42.210453033447266, "global_step": 304432, "epoch": 2515} {"train_loss": -42.287567138671875, "global_step": 304433, "epoch": 2515} {"train_loss": -42.822669982910156, "global_step": 304434, "epoch": 2515} {"train_loss": -42.86942940704093, "global_step": 304435, "epoch": 2515, "val_loss": 2706613.0} {"train_loss": -41.46516799926758, "global_step": 304436, "epoch": 2516} {"train_loss": -42.48294448852539, "global_step": 304437, "epoch": 2516} {"train_loss": -41.915653228759766, "global_step": 304438, "epoch": 2516} {"train_loss": -43.07963180541992, "global_step": 304439, "epoch": 2516} {"train_loss": -42.46393585205078, "global_step": 304440, "epoch": 2516} {"train_loss": -42.9794807434082, "global_step": 304441, "epoch": 2516} {"train_loss": -42.889217376708984, "global_step": 304442, "epoch": 2516} {"train_loss": -43.52012252807617, "global_step": 304443, "epoch": 2516} {"train_loss": -42.22175979614258, "global_step": 304444, "epoch": 2516} {"train_loss": -41.565128326416016, "global_step": 304445, "epoch": 2516} {"train_loss": -41.462432861328125, "global_step": 304446, "epoch": 2516} {"train_loss": -42.89441680908203, "global_step": 304447, "epoch": 2516} {"train_loss": -43.744956970214844, "global_step": 304448, "epoch": 2516} {"train_loss": -42.748050689697266, "global_step": 304449, "epoch": 2516} {"train_loss": -43.378719329833984, "global_step": 304450, "epoch": 2516} {"train_loss": -42.725502014160156, "global_step": 304451, "epoch": 2516} {"train_loss": -41.99082565307617, "global_step": 304452, "epoch": 2516} {"train_loss": -43.57923889160156, "global_step": 304453, "epoch": 2516} {"train_loss": -39.30414581298828, "global_step": 304454, "epoch": 2516} {"train_loss": -43.52054214477539, "global_step": 304455, "epoch": 2516} {"train_loss": -41.1637077331543, "global_step": 304456, "epoch": 2516} {"train_loss": -42.09794235229492, "global_step": 304457, "epoch": 2516} {"train_loss": -42.55799865722656, "global_step": 304458, "epoch": 2516} {"train_loss": -43.56077194213867, "global_step": 304459, "epoch": 2516} {"train_loss": -43.39471435546875, "global_step": 304460, "epoch": 2516} {"train_loss": -42.50605392456055, "global_step": 304461, "epoch": 2516} {"train_loss": -43.267879486083984, "global_step": 304462, "epoch": 2516} {"train_loss": -43.205055236816406, "global_step": 304463, "epoch": 2516} {"train_loss": -42.801300048828125, "global_step": 304464, "epoch": 2516} {"train_loss": -41.91140365600586, "global_step": 304465, "epoch": 2516} {"train_loss": -42.29026412963867, "global_step": 304466, "epoch": 2516} {"train_loss": -43.631282806396484, "global_step": 304467, "epoch": 2516} {"train_loss": -42.80326461791992, "global_step": 304468, "epoch": 2516} {"train_loss": -42.6158332824707, "global_step": 304469, "epoch": 2516} {"train_loss": -43.2320556640625, "global_step": 304470, "epoch": 2516} {"train_loss": -43.578956604003906, "global_step": 304471, "epoch": 2516} {"train_loss": -43.54340744018555, "global_step": 304472, "epoch": 2516} {"train_loss": -43.46434020996094, "global_step": 304473, "epoch": 2516} {"train_loss": -41.83761215209961, "global_step": 304474, "epoch": 2516} {"train_loss": -42.3008918762207, "global_step": 304475, "epoch": 2516} {"train_loss": -41.89003372192383, "global_step": 304476, "epoch": 2516} {"train_loss": -42.21329116821289, "global_step": 304477, "epoch": 2516} {"train_loss": -40.50603103637695, "global_step": 304478, "epoch": 2516} {"train_loss": -39.600223541259766, "global_step": 304479, "epoch": 2516} {"train_loss": -43.07942199707031, "global_step": 304480, "epoch": 2516} {"train_loss": -42.30303192138672, "global_step": 304481, "epoch": 2516} {"train_loss": -42.838233947753906, "global_step": 304482, "epoch": 2516} {"train_loss": -43.047264099121094, "global_step": 304483, "epoch": 2516} {"train_loss": -42.47799301147461, "global_step": 304484, "epoch": 2516} {"train_loss": -42.6790657043457, "global_step": 304485, "epoch": 2516} {"train_loss": -43.08028030395508, "global_step": 304486, "epoch": 2516} {"train_loss": -42.24584197998047, "global_step": 304487, "epoch": 2516} {"train_loss": -39.4273681640625, "global_step": 304488, "epoch": 2516} {"train_loss": -42.887752532958984, "global_step": 304489, "epoch": 2516} {"train_loss": -41.74817657470703, "global_step": 304490, "epoch": 2516} {"train_loss": -42.046016693115234, "global_step": 304491, "epoch": 2516} {"train_loss": -43.534706115722656, "global_step": 304492, "epoch": 2516} {"train_loss": -42.2525749206543, "global_step": 304493, "epoch": 2516} {"train_loss": -42.03713607788086, "global_step": 304494, "epoch": 2516} {"train_loss": -42.19054412841797, "global_step": 304495, "epoch": 2516} {"train_loss": -42.503997802734375, "global_step": 304496, "epoch": 2516} {"train_loss": -42.975582122802734, "global_step": 304497, "epoch": 2516} {"train_loss": -42.84288024902344, "global_step": 304498, "epoch": 2516} {"train_loss": -42.12492752075195, "global_step": 304499, "epoch": 2516} {"train_loss": -43.241943359375, "global_step": 304500, "epoch": 2516} {"train_loss": -42.500118255615234, "global_step": 304501, "epoch": 2516} {"train_loss": -42.88441848754883, "global_step": 304502, "epoch": 2516} {"train_loss": -43.0472412109375, "global_step": 304503, "epoch": 2516} {"train_loss": -42.359004974365234, "global_step": 304504, "epoch": 2516} {"train_loss": -43.41416549682617, "global_step": 304505, "epoch": 2516} {"train_loss": -43.0933952331543, "global_step": 304506, "epoch": 2516} {"train_loss": -43.15131759643555, "global_step": 304507, "epoch": 2516} {"train_loss": -43.111324310302734, "global_step": 304508, "epoch": 2516} {"train_loss": -43.253108978271484, "global_step": 304509, "epoch": 2516} {"train_loss": -43.108375549316406, "global_step": 304510, "epoch": 2516} {"train_loss": -43.563961029052734, "global_step": 304511, "epoch": 2516} {"train_loss": -43.54958724975586, "global_step": 304512, "epoch": 2516} {"train_loss": -42.56672286987305, "global_step": 304513, "epoch": 2516} {"train_loss": -42.90204620361328, "global_step": 304514, "epoch": 2516} {"train_loss": -42.959354400634766, "global_step": 304515, "epoch": 2516} {"train_loss": -44.23214340209961, "global_step": 304516, "epoch": 2516} {"train_loss": -43.5991325378418, "global_step": 304517, "epoch": 2516} {"train_loss": -41.66542053222656, "global_step": 304518, "epoch": 2516} {"train_loss": -43.010597229003906, "global_step": 304519, "epoch": 2516} {"train_loss": -43.535179138183594, "global_step": 304520, "epoch": 2516} {"train_loss": -42.934295654296875, "global_step": 304521, "epoch": 2516} {"train_loss": -43.440242767333984, "global_step": 304522, "epoch": 2516} {"train_loss": -43.681983947753906, "global_step": 304523, "epoch": 2516} {"train_loss": -43.317012786865234, "global_step": 304524, "epoch": 2516} {"train_loss": -44.013362884521484, "global_step": 304525, "epoch": 2516} {"train_loss": -43.62986755371094, "global_step": 304526, "epoch": 2516} {"train_loss": -43.730709075927734, "global_step": 304527, "epoch": 2516} {"train_loss": -43.5862922668457, "global_step": 304528, "epoch": 2516} {"train_loss": -42.85076904296875, "global_step": 304529, "epoch": 2516} {"train_loss": -43.33705520629883, "global_step": 304530, "epoch": 2516} {"train_loss": -43.7337760925293, "global_step": 304531, "epoch": 2516} {"train_loss": -43.95144271850586, "global_step": 304532, "epoch": 2516} {"train_loss": -43.09601974487305, "global_step": 304533, "epoch": 2516} {"train_loss": -43.36610794067383, "global_step": 304534, "epoch": 2516} {"train_loss": -44.18571853637695, "global_step": 304535, "epoch": 2516} {"train_loss": -43.84331512451172, "global_step": 304536, "epoch": 2516} {"train_loss": -43.66765213012695, "global_step": 304537, "epoch": 2516} {"train_loss": -44.434173583984375, "global_step": 304538, "epoch": 2516} {"train_loss": -44.102874755859375, "global_step": 304539, "epoch": 2516} {"train_loss": -43.353782653808594, "global_step": 304540, "epoch": 2516} {"train_loss": -44.32499313354492, "global_step": 304541, "epoch": 2516} {"train_loss": -42.74235534667969, "global_step": 304542, "epoch": 2516} {"train_loss": -44.05564498901367, "global_step": 304543, "epoch": 2516} {"train_loss": -44.122920989990234, "global_step": 304544, "epoch": 2516} {"train_loss": -43.85215377807617, "global_step": 304545, "epoch": 2516} {"train_loss": -43.73529815673828, "global_step": 304546, "epoch": 2516} {"train_loss": -43.89723587036133, "global_step": 304547, "epoch": 2516} {"train_loss": -43.15153884887695, "global_step": 304548, "epoch": 2516} {"train_loss": -43.14198303222656, "global_step": 304549, "epoch": 2516} {"train_loss": -43.41105270385742, "global_step": 304550, "epoch": 2516} {"train_loss": -44.08768844604492, "global_step": 304551, "epoch": 2516} {"train_loss": -43.897396087646484, "global_step": 304552, "epoch": 2516} {"train_loss": -43.8468132019043, "global_step": 304553, "epoch": 2516} {"train_loss": -43.6331901550293, "global_step": 304554, "epoch": 2516} {"train_loss": -44.12179946899414, "global_step": 304555, "epoch": 2516} {"train_loss": -42.93408054950809, "global_step": 304556, "epoch": 2516, "val_loss": 2673842.25} {"train_loss": -43.92073059082031, "global_step": 304557, "epoch": 2517} {"train_loss": -43.488826751708984, "global_step": 304558, "epoch": 2517} {"train_loss": -44.04555892944336, "global_step": 304559, "epoch": 2517} {"train_loss": -44.04274368286133, "global_step": 304560, "epoch": 2517} {"train_loss": -44.28643798828125, "global_step": 304561, "epoch": 2517} {"train_loss": -43.883705139160156, "global_step": 304562, "epoch": 2517} {"train_loss": -44.00651168823242, "global_step": 304563, "epoch": 2517} {"train_loss": -44.6140022277832, "global_step": 304564, "epoch": 2517} {"train_loss": -43.64722442626953, "global_step": 304565, "epoch": 2517} {"train_loss": -44.092071533203125, "global_step": 304566, "epoch": 2517} {"train_loss": -43.96140670776367, "global_step": 304567, "epoch": 2517} {"train_loss": -44.54294967651367, "global_step": 304568, "epoch": 2517} {"train_loss": -43.844295501708984, "global_step": 304569, "epoch": 2517} {"train_loss": -44.526023864746094, "global_step": 304570, "epoch": 2517} {"train_loss": -43.72512435913086, "global_step": 304571, "epoch": 2517} {"train_loss": -43.38842010498047, "global_step": 304572, "epoch": 2517} {"train_loss": -44.3497428894043, "global_step": 304573, "epoch": 2517} {"train_loss": -42.97444534301758, "global_step": 304574, "epoch": 2517} {"train_loss": -42.24025344848633, "global_step": 304575, "epoch": 2517} {"train_loss": -43.45037841796875, "global_step": 304576, "epoch": 2517} {"train_loss": -43.57465744018555, "global_step": 304577, "epoch": 2517} {"train_loss": -42.641448974609375, "global_step": 304578, "epoch": 2517} {"train_loss": -43.212093353271484, "global_step": 304579, "epoch": 2517} {"train_loss": -44.341941833496094, "global_step": 304580, "epoch": 2517} {"train_loss": -43.32155990600586, "global_step": 304581, "epoch": 2517} {"train_loss": -42.34961700439453, "global_step": 304582, "epoch": 2517} {"train_loss": -43.86831283569336, "global_step": 304583, "epoch": 2517} {"train_loss": -43.079315185546875, "global_step": 304584, "epoch": 2517} {"train_loss": -43.98115539550781, "global_step": 304585, "epoch": 2517} {"train_loss": -43.8416633605957, "global_step": 304586, "epoch": 2517} {"train_loss": -41.96086502075195, "global_step": 304587, "epoch": 2517} {"train_loss": -38.905372619628906, "global_step": 304588, "epoch": 2517} {"train_loss": -37.539466857910156, "global_step": 304589, "epoch": 2517} {"train_loss": -40.99396896362305, "global_step": 304590, "epoch": 2517} {"train_loss": -42.63458251953125, "global_step": 304591, "epoch": 2517} {"train_loss": -41.3468132019043, "global_step": 304592, "epoch": 2517} {"train_loss": -40.99714279174805, "global_step": 304593, "epoch": 2517} {"train_loss": -42.70574188232422, "global_step": 304594, "epoch": 2517} {"train_loss": -38.155548095703125, "global_step": 304595, "epoch": 2517} {"train_loss": -37.0214729309082, "global_step": 304596, "epoch": 2517} {"train_loss": -41.01426696777344, "global_step": 304597, "epoch": 2517} {"train_loss": -42.047725677490234, "global_step": 304598, "epoch": 2517} {"train_loss": -40.67573928833008, "global_step": 304599, "epoch": 2517} {"train_loss": -42.16329574584961, "global_step": 304600, "epoch": 2517} {"train_loss": -41.921897888183594, "global_step": 304601, "epoch": 2517} {"train_loss": -42.40763854980469, "global_step": 304602, "epoch": 2517} {"train_loss": -42.25246047973633, "global_step": 304603, "epoch": 2517} {"train_loss": -40.40781021118164, "global_step": 304604, "epoch": 2517} {"train_loss": -42.24109649658203, "global_step": 304605, "epoch": 2517} {"train_loss": -40.675846099853516, "global_step": 304606, "epoch": 2517} {"train_loss": -42.119625091552734, "global_step": 304607, "epoch": 2517} {"train_loss": -42.29043197631836, "global_step": 304608, "epoch": 2517} {"train_loss": -40.8501091003418, "global_step": 304609, "epoch": 2517} {"train_loss": -39.886512756347656, "global_step": 304610, "epoch": 2517} {"train_loss": -42.71212387084961, "global_step": 304611, "epoch": 2517} {"train_loss": -42.594661712646484, "global_step": 304612, "epoch": 2517} {"train_loss": -43.35682678222656, "global_step": 304613, "epoch": 2517} {"train_loss": -43.1453857421875, "global_step": 304614, "epoch": 2517} {"train_loss": -42.46670913696289, "global_step": 304615, "epoch": 2517} {"train_loss": -42.31557846069336, "global_step": 304616, "epoch": 2517} {"train_loss": -43.16777038574219, "global_step": 304617, "epoch": 2517} {"train_loss": -42.718807220458984, "global_step": 304618, "epoch": 2517} {"train_loss": -38.01633071899414, "global_step": 304619, "epoch": 2517} {"train_loss": -41.483642578125, "global_step": 304620, "epoch": 2517} {"train_loss": -43.61488723754883, "global_step": 304621, "epoch": 2517} {"train_loss": -41.714534759521484, "global_step": 304622, "epoch": 2517} {"train_loss": -41.14600372314453, "global_step": 304623, "epoch": 2517} {"train_loss": -40.67390823364258, "global_step": 304624, "epoch": 2517} {"train_loss": -42.753143310546875, "global_step": 304625, "epoch": 2517} {"train_loss": -41.39955520629883, "global_step": 304626, "epoch": 2517} {"train_loss": -43.306068420410156, "global_step": 304627, "epoch": 2517} {"train_loss": -41.69390869140625, "global_step": 304628, "epoch": 2517} {"train_loss": -43.251014709472656, "global_step": 304629, "epoch": 2517} {"train_loss": -41.28258514404297, "global_step": 304630, "epoch": 2517} {"train_loss": -42.76155471801758, "global_step": 304631, "epoch": 2517} {"train_loss": -43.51823806762695, "global_step": 304632, "epoch": 2517} {"train_loss": -43.36302947998047, "global_step": 304633, "epoch": 2517} {"train_loss": -43.90883255004883, "global_step": 304634, "epoch": 2517} {"train_loss": -43.601905822753906, "global_step": 304635, "epoch": 2517} {"train_loss": -43.37188720703125, "global_step": 304636, "epoch": 2517} {"train_loss": -43.533870697021484, "global_step": 304637, "epoch": 2517} {"train_loss": -42.21862030029297, "global_step": 304638, "epoch": 2517} {"train_loss": -42.835601806640625, "global_step": 304639, "epoch": 2517} {"train_loss": -43.573795318603516, "global_step": 304640, "epoch": 2517} {"train_loss": -43.65396499633789, "global_step": 304641, "epoch": 2517} {"train_loss": -43.45895004272461, "global_step": 304642, "epoch": 2517} {"train_loss": -44.269012451171875, "global_step": 304643, "epoch": 2517} {"train_loss": -42.64639663696289, "global_step": 304644, "epoch": 2517} {"train_loss": -43.80446243286133, "global_step": 304645, "epoch": 2517} {"train_loss": -43.89632797241211, "global_step": 304646, "epoch": 2517} {"train_loss": -43.05573654174805, "global_step": 304647, "epoch": 2517} {"train_loss": -44.1365852355957, "global_step": 304648, "epoch": 2517} {"train_loss": -44.29153823852539, "global_step": 304649, "epoch": 2517} {"train_loss": -43.3389892578125, "global_step": 304650, "epoch": 2517} {"train_loss": -42.98801803588867, "global_step": 304651, "epoch": 2517} {"train_loss": -43.8894157409668, "global_step": 304652, "epoch": 2517} {"train_loss": -43.189537048339844, "global_step": 304653, "epoch": 2517} {"train_loss": -41.984771728515625, "global_step": 304654, "epoch": 2517} {"train_loss": -42.247962951660156, "global_step": 304655, "epoch": 2517} {"train_loss": -41.371246337890625, "global_step": 304656, "epoch": 2517} {"train_loss": -43.8805046081543, "global_step": 304657, "epoch": 2517} {"train_loss": -44.12575149536133, "global_step": 304658, "epoch": 2517} {"train_loss": -43.89993667602539, "global_step": 304659, "epoch": 2517} {"train_loss": -44.43121337890625, "global_step": 304660, "epoch": 2517} {"train_loss": -43.13902282714844, "global_step": 304661, "epoch": 2517} {"train_loss": -44.091346740722656, "global_step": 304662, "epoch": 2517} {"train_loss": -43.09463119506836, "global_step": 304663, "epoch": 2517} {"train_loss": -44.10900115966797, "global_step": 304664, "epoch": 2517} {"train_loss": -44.46493911743164, "global_step": 304665, "epoch": 2517} {"train_loss": -43.711769104003906, "global_step": 304666, "epoch": 2517} {"train_loss": -43.632164001464844, "global_step": 304667, "epoch": 2517} {"train_loss": -44.40818405151367, "global_step": 304668, "epoch": 2517} {"train_loss": -43.921199798583984, "global_step": 304669, "epoch": 2517} {"train_loss": -44.121726989746094, "global_step": 304670, "epoch": 2517} {"train_loss": -43.779396057128906, "global_step": 304671, "epoch": 2517} {"train_loss": -44.433189392089844, "global_step": 304672, "epoch": 2517} {"train_loss": -44.497310638427734, "global_step": 304673, "epoch": 2517} {"train_loss": -44.290157318115234, "global_step": 304674, "epoch": 2517} {"train_loss": -43.995765686035156, "global_step": 304675, "epoch": 2517} {"train_loss": -43.86094284057617, "global_step": 304676, "epoch": 2517} {"train_loss": -42.861928987108975, "global_step": 304677, "epoch": 2517, "val_loss": 2762847.25} {"train_loss": -44.343780517578125, "global_step": 304678, "epoch": 2518} {"train_loss": -43.80430221557617, "global_step": 304679, "epoch": 2518} {"train_loss": -39.513370513916016, "global_step": 304680, "epoch": 2518} {"train_loss": -43.9171257019043, "global_step": 304681, "epoch": 2518} {"train_loss": -42.72369384765625, "global_step": 304682, "epoch": 2518} {"train_loss": -43.02958297729492, "global_step": 304683, "epoch": 2518} {"train_loss": -43.19700241088867, "global_step": 304684, "epoch": 2518} {"train_loss": -40.924381256103516, "global_step": 304685, "epoch": 2518} {"train_loss": -40.77594757080078, "global_step": 304686, "epoch": 2518} {"train_loss": -42.778236389160156, "global_step": 304687, "epoch": 2518} {"train_loss": -43.4870719909668, "global_step": 304688, "epoch": 2518} {"train_loss": -42.18645095825195, "global_step": 304689, "epoch": 2518} {"train_loss": -41.74473190307617, "global_step": 304690, "epoch": 2518} {"train_loss": -42.97825622558594, "global_step": 304691, "epoch": 2518} {"train_loss": -43.1362419128418, "global_step": 304692, "epoch": 2518} {"train_loss": -44.14201354980469, "global_step": 304693, "epoch": 2518} {"train_loss": -43.35968780517578, "global_step": 304694, "epoch": 2518} {"train_loss": -42.82975387573242, "global_step": 304695, "epoch": 2518} {"train_loss": -42.86149978637695, "global_step": 304696, "epoch": 2518} {"train_loss": -43.492488861083984, "global_step": 304697, "epoch": 2518} {"train_loss": -43.572505950927734, "global_step": 304698, "epoch": 2518} {"train_loss": -41.93751907348633, "global_step": 304699, "epoch": 2518} {"train_loss": -42.31593322753906, "global_step": 304700, "epoch": 2518} {"train_loss": -34.84586715698242, "global_step": 304701, "epoch": 2518} {"train_loss": -35.92278289794922, "global_step": 304702, "epoch": 2518} {"train_loss": -42.179988861083984, "global_step": 304703, "epoch": 2518} {"train_loss": -42.01809310913086, "global_step": 304704, "epoch": 2518} {"train_loss": -43.67843246459961, "global_step": 304705, "epoch": 2518} {"train_loss": -42.912899017333984, "global_step": 304706, "epoch": 2518} {"train_loss": -40.4957389831543, "global_step": 304707, "epoch": 2518} {"train_loss": -41.69700241088867, "global_step": 304708, "epoch": 2518} {"train_loss": -43.54008865356445, "global_step": 304709, "epoch": 2518} {"train_loss": -43.1716423034668, "global_step": 304710, "epoch": 2518} {"train_loss": -38.08134078979492, "global_step": 304711, "epoch": 2518} {"train_loss": -39.673736572265625, "global_step": 304712, "epoch": 2518} {"train_loss": -42.64140319824219, "global_step": 304713, "epoch": 2518} {"train_loss": -42.421791076660156, "global_step": 304714, "epoch": 2518} {"train_loss": -41.480960845947266, "global_step": 304715, "epoch": 2518} {"train_loss": -43.07413864135742, "global_step": 304716, "epoch": 2518} {"train_loss": -41.754268646240234, "global_step": 304717, "epoch": 2518} {"train_loss": -43.526947021484375, "global_step": 304718, "epoch": 2518} {"train_loss": -42.5129280090332, "global_step": 304719, "epoch": 2518} {"train_loss": -42.36532974243164, "global_step": 304720, "epoch": 2518} {"train_loss": -35.481266021728516, "global_step": 304721, "epoch": 2518} {"train_loss": -42.30363845825195, "global_step": 304722, "epoch": 2518} {"train_loss": -40.53639602661133, "global_step": 304723, "epoch": 2518} {"train_loss": -42.27352523803711, "global_step": 304724, "epoch": 2518} {"train_loss": -43.489925384521484, "global_step": 304725, "epoch": 2518} {"train_loss": -41.99448776245117, "global_step": 304726, "epoch": 2518} {"train_loss": -43.051361083984375, "global_step": 304727, "epoch": 2518} {"train_loss": -43.040184020996094, "global_step": 304728, "epoch": 2518} {"train_loss": -42.412994384765625, "global_step": 304729, "epoch": 2518} {"train_loss": -42.60435104370117, "global_step": 304730, "epoch": 2518} {"train_loss": -37.574527740478516, "global_step": 304731, "epoch": 2518} {"train_loss": -40.05854415893555, "global_step": 304732, "epoch": 2518} {"train_loss": -42.6853141784668, "global_step": 304733, "epoch": 2518} {"train_loss": -39.89860153198242, "global_step": 304734, "epoch": 2518} {"train_loss": -43.12092208862305, "global_step": 304735, "epoch": 2518} {"train_loss": -42.738311767578125, "global_step": 304736, "epoch": 2518} {"train_loss": -35.31494140625, "global_step": 304737, "epoch": 2518} {"train_loss": -42.881195068359375, "global_step": 304738, "epoch": 2518} {"train_loss": -42.80719757080078, "global_step": 304739, "epoch": 2518} {"train_loss": -43.61399841308594, "global_step": 304740, "epoch": 2518} {"train_loss": -43.341346740722656, "global_step": 304741, "epoch": 2518} {"train_loss": -42.52787780761719, "global_step": 304742, "epoch": 2518} {"train_loss": -43.07281494140625, "global_step": 304743, "epoch": 2518} {"train_loss": -43.84930419921875, "global_step": 304744, "epoch": 2518} {"train_loss": -43.18844223022461, "global_step": 304745, "epoch": 2518} {"train_loss": -42.439632415771484, "global_step": 304746, "epoch": 2518} {"train_loss": -42.92532730102539, "global_step": 304747, "epoch": 2518} {"train_loss": -41.806522369384766, "global_step": 304748, "epoch": 2518} {"train_loss": -40.94614791870117, "global_step": 304749, "epoch": 2518} {"train_loss": -42.638668060302734, "global_step": 304750, "epoch": 2518} {"train_loss": -43.20464324951172, "global_step": 304751, "epoch": 2518} {"train_loss": -43.03761672973633, "global_step": 304752, "epoch": 2518} {"train_loss": -42.07008743286133, "global_step": 304753, "epoch": 2518} {"train_loss": -43.43593978881836, "global_step": 304754, "epoch": 2518} {"train_loss": -43.344764709472656, "global_step": 304755, "epoch": 2518} {"train_loss": -43.2850456237793, "global_step": 304756, "epoch": 2518} {"train_loss": -38.97578430175781, "global_step": 304757, "epoch": 2518} {"train_loss": -42.59791946411133, "global_step": 304758, "epoch": 2518} {"train_loss": -42.62702560424805, "global_step": 304759, "epoch": 2518} {"train_loss": -41.64930725097656, "global_step": 304760, "epoch": 2518} {"train_loss": -42.6784553527832, "global_step": 304761, "epoch": 2518} {"train_loss": -43.77874755859375, "global_step": 304762, "epoch": 2518} {"train_loss": -43.6035270690918, "global_step": 304763, "epoch": 2518} {"train_loss": -43.77375411987305, "global_step": 304764, "epoch": 2518} {"train_loss": -43.344207763671875, "global_step": 304765, "epoch": 2518} {"train_loss": -43.45069122314453, "global_step": 304766, "epoch": 2518} {"train_loss": -42.82016372680664, "global_step": 304767, "epoch": 2518} {"train_loss": -43.249412536621094, "global_step": 304768, "epoch": 2518} {"train_loss": -43.76974105834961, "global_step": 304769, "epoch": 2518} {"train_loss": -43.24457550048828, "global_step": 304770, "epoch": 2518} {"train_loss": -42.75197982788086, "global_step": 304771, "epoch": 2518} {"train_loss": -43.83393859863281, "global_step": 304772, "epoch": 2518} {"train_loss": -43.3763427734375, "global_step": 304773, "epoch": 2518} {"train_loss": -42.38039779663086, "global_step": 304774, "epoch": 2518} {"train_loss": -42.60356903076172, "global_step": 304775, "epoch": 2518} {"train_loss": -42.85835647583008, "global_step": 304776, "epoch": 2518} {"train_loss": -43.574337005615234, "global_step": 304777, "epoch": 2518} {"train_loss": -43.69503402709961, "global_step": 304778, "epoch": 2518} {"train_loss": -44.0072135925293, "global_step": 304779, "epoch": 2518} {"train_loss": -43.65249252319336, "global_step": 304780, "epoch": 2518} {"train_loss": -43.4947509765625, "global_step": 304781, "epoch": 2518} {"train_loss": -41.437461853027344, "global_step": 304782, "epoch": 2518} {"train_loss": -43.45363998413086, "global_step": 304783, "epoch": 2518} {"train_loss": -42.79166793823242, "global_step": 304784, "epoch": 2518} {"train_loss": -43.85618591308594, "global_step": 304785, "epoch": 2518} {"train_loss": -43.61907958984375, "global_step": 304786, "epoch": 2518} {"train_loss": -43.52114486694336, "global_step": 304787, "epoch": 2518} {"train_loss": -44.48066329956055, "global_step": 304788, "epoch": 2518} {"train_loss": -44.134639739990234, "global_step": 304789, "epoch": 2518} {"train_loss": -44.150447845458984, "global_step": 304790, "epoch": 2518} {"train_loss": -43.88206100463867, "global_step": 304791, "epoch": 2518} {"train_loss": -44.107730865478516, "global_step": 304792, "epoch": 2518} {"train_loss": -43.49760055541992, "global_step": 304793, "epoch": 2518} {"train_loss": -40.59470748901367, "global_step": 304794, "epoch": 2518} {"train_loss": -43.338436126708984, "global_step": 304795, "epoch": 2518} {"train_loss": -43.84165573120117, "global_step": 304796, "epoch": 2518} {"train_loss": -43.62321090698242, "global_step": 304797, "epoch": 2518} {"train_loss": -42.46584770896218, "global_step": 304798, "epoch": 2518, "val_loss": 2657671.25} {"train_loss": -43.9466552734375, "global_step": 304799, "epoch": 2519} {"train_loss": -44.56928634643555, "global_step": 304800, "epoch": 2519} {"train_loss": -42.926856994628906, "global_step": 304801, "epoch": 2519} {"train_loss": -43.24601745605469, "global_step": 304802, "epoch": 2519} {"train_loss": -43.844139099121094, "global_step": 304803, "epoch": 2519} {"train_loss": -43.850196838378906, "global_step": 304804, "epoch": 2519} {"train_loss": -44.19734573364258, "global_step": 304805, "epoch": 2519} {"train_loss": -43.47697067260742, "global_step": 304806, "epoch": 2519} {"train_loss": -43.82931137084961, "global_step": 304807, "epoch": 2519} {"train_loss": -42.903499603271484, "global_step": 304808, "epoch": 2519} {"train_loss": -42.60500717163086, "global_step": 304809, "epoch": 2519} {"train_loss": -44.09968185424805, "global_step": 304810, "epoch": 2519} {"train_loss": -44.02766036987305, "global_step": 304811, "epoch": 2519} {"train_loss": -44.01041793823242, "global_step": 304812, "epoch": 2519} {"train_loss": -42.23947525024414, "global_step": 304813, "epoch": 2519} {"train_loss": -44.16557693481445, "global_step": 304814, "epoch": 2519} {"train_loss": -43.48471450805664, "global_step": 304815, "epoch": 2519} {"train_loss": -43.563716888427734, "global_step": 304816, "epoch": 2519} {"train_loss": -44.09952163696289, "global_step": 304817, "epoch": 2519} {"train_loss": -44.139774322509766, "global_step": 304818, "epoch": 2519} {"train_loss": -44.2059211730957, "global_step": 304819, "epoch": 2519} {"train_loss": -41.6949462890625, "global_step": 304820, "epoch": 2519} {"train_loss": -43.152618408203125, "global_step": 304821, "epoch": 2519} {"train_loss": -43.288448333740234, "global_step": 304822, "epoch": 2519} {"train_loss": -42.236305236816406, "global_step": 304823, "epoch": 2519} {"train_loss": -42.724483489990234, "global_step": 304824, "epoch": 2519} {"train_loss": -42.42592239379883, "global_step": 304825, "epoch": 2519} {"train_loss": -40.721656799316406, "global_step": 304826, "epoch": 2519} {"train_loss": -42.71413040161133, "global_step": 304827, "epoch": 2519} {"train_loss": -42.242767333984375, "global_step": 304828, "epoch": 2519} {"train_loss": -42.4822883605957, "global_step": 304829, "epoch": 2519} {"train_loss": -43.052284240722656, "global_step": 304830, "epoch": 2519} {"train_loss": -41.80767059326172, "global_step": 304831, "epoch": 2519} {"train_loss": -40.41341781616211, "global_step": 304832, "epoch": 2519} {"train_loss": -42.14252471923828, "global_step": 304833, "epoch": 2519} {"train_loss": -41.62608337402344, "global_step": 304834, "epoch": 2519} {"train_loss": -42.121212005615234, "global_step": 304835, "epoch": 2519} {"train_loss": -39.871315002441406, "global_step": 304836, "epoch": 2519} {"train_loss": -42.54463577270508, "global_step": 304837, "epoch": 2519} {"train_loss": -42.7330207824707, "global_step": 304838, "epoch": 2519} {"train_loss": -42.616756439208984, "global_step": 304839, "epoch": 2519} {"train_loss": -43.358795166015625, "global_step": 304840, "epoch": 2519} {"train_loss": -41.971012115478516, "global_step": 304841, "epoch": 2519} {"train_loss": -42.536109924316406, "global_step": 304842, "epoch": 2519} {"train_loss": -43.101505279541016, "global_step": 304843, "epoch": 2519} {"train_loss": -41.9127082824707, "global_step": 304844, "epoch": 2519} {"train_loss": -41.514930725097656, "global_step": 304845, "epoch": 2519} {"train_loss": -36.425506591796875, "global_step": 304846, "epoch": 2519} {"train_loss": -42.28321075439453, "global_step": 304847, "epoch": 2519} {"train_loss": -37.87150192260742, "global_step": 304848, "epoch": 2519} {"train_loss": -40.486263275146484, "global_step": 304849, "epoch": 2519} {"train_loss": -37.89417266845703, "global_step": 304850, "epoch": 2519} {"train_loss": -43.128719329833984, "global_step": 304851, "epoch": 2519} {"train_loss": -37.21723175048828, "global_step": 304852, "epoch": 2519} {"train_loss": -41.75584030151367, "global_step": 304853, "epoch": 2519} {"train_loss": -40.595882415771484, "global_step": 304854, "epoch": 2519} {"train_loss": -37.18345260620117, "global_step": 304855, "epoch": 2519} {"train_loss": -41.5754508972168, "global_step": 304856, "epoch": 2519} {"train_loss": -39.04635238647461, "global_step": 304857, "epoch": 2519} {"train_loss": -41.84199523925781, "global_step": 304858, "epoch": 2519} {"train_loss": -38.24801254272461, "global_step": 304859, "epoch": 2519} {"train_loss": -40.4514045715332, "global_step": 304860, "epoch": 2519} {"train_loss": -40.17562484741211, "global_step": 304861, "epoch": 2519} {"train_loss": -41.60604476928711, "global_step": 304862, "epoch": 2519} {"train_loss": -39.449058532714844, "global_step": 304863, "epoch": 2519} {"train_loss": -40.96392059326172, "global_step": 304864, "epoch": 2519} {"train_loss": -40.81716537475586, "global_step": 304865, "epoch": 2519} {"train_loss": -40.60157012939453, "global_step": 304866, "epoch": 2519} {"train_loss": -41.297061920166016, "global_step": 304867, "epoch": 2519} {"train_loss": -41.46566390991211, "global_step": 304868, "epoch": 2519} {"train_loss": -39.29506301879883, "global_step": 304869, "epoch": 2519} {"train_loss": -42.6064567565918, "global_step": 304870, "epoch": 2519} {"train_loss": -39.30879592895508, "global_step": 304871, "epoch": 2519} {"train_loss": -41.35610580444336, "global_step": 304872, "epoch": 2519} {"train_loss": -40.78744125366211, "global_step": 304873, "epoch": 2519} {"train_loss": -42.491363525390625, "global_step": 304874, "epoch": 2519} {"train_loss": -40.537452697753906, "global_step": 304875, "epoch": 2519} {"train_loss": -42.079444885253906, "global_step": 304876, "epoch": 2519} {"train_loss": -41.453765869140625, "global_step": 304877, "epoch": 2519} {"train_loss": -42.214752197265625, "global_step": 304878, "epoch": 2519} {"train_loss": -41.397457122802734, "global_step": 304879, "epoch": 2519} {"train_loss": -41.15865707397461, "global_step": 304880, "epoch": 2519} {"train_loss": -42.330806732177734, "global_step": 304881, "epoch": 2519} {"train_loss": -43.22751998901367, "global_step": 304882, "epoch": 2519} {"train_loss": -42.7857780456543, "global_step": 304883, "epoch": 2519} {"train_loss": -42.63502502441406, "global_step": 304884, "epoch": 2519} {"train_loss": -42.807247161865234, "global_step": 304885, "epoch": 2519} {"train_loss": -42.6748046875, "global_step": 304886, "epoch": 2519} {"train_loss": -43.39284133911133, "global_step": 304887, "epoch": 2519} {"train_loss": -42.849822998046875, "global_step": 304888, "epoch": 2519} {"train_loss": -43.358436584472656, "global_step": 304889, "epoch": 2519} {"train_loss": -43.04254913330078, "global_step": 304890, "epoch": 2519} {"train_loss": -42.77435302734375, "global_step": 304891, "epoch": 2519} {"train_loss": -43.22419738769531, "global_step": 304892, "epoch": 2519} {"train_loss": -43.788082122802734, "global_step": 304893, "epoch": 2519} {"train_loss": -43.288875579833984, "global_step": 304894, "epoch": 2519} {"train_loss": -42.27860641479492, "global_step": 304895, "epoch": 2519} {"train_loss": -42.85869598388672, "global_step": 304896, "epoch": 2519} {"train_loss": -43.09724807739258, "global_step": 304897, "epoch": 2519} {"train_loss": -43.16605758666992, "global_step": 304898, "epoch": 2519} {"train_loss": -43.652191162109375, "global_step": 304899, "epoch": 2519} {"train_loss": -43.775760650634766, "global_step": 304900, "epoch": 2519} {"train_loss": -43.99675369262695, "global_step": 304901, "epoch": 2519} {"train_loss": -43.210540771484375, "global_step": 304902, "epoch": 2519} {"train_loss": -43.2568473815918, "global_step": 304903, "epoch": 2519} {"train_loss": -43.886009216308594, "global_step": 304904, "epoch": 2519} {"train_loss": -44.0728874206543, "global_step": 304905, "epoch": 2519} {"train_loss": -44.177703857421875, "global_step": 304906, "epoch": 2519} {"train_loss": -44.023563385009766, "global_step": 304907, "epoch": 2519} {"train_loss": -44.237327575683594, "global_step": 304908, "epoch": 2519} {"train_loss": -43.99299240112305, "global_step": 304909, "epoch": 2519} {"train_loss": -43.91843032836914, "global_step": 304910, "epoch": 2519} {"train_loss": -44.36355209350586, "global_step": 304911, "epoch": 2519} {"train_loss": -44.17222213745117, "global_step": 304912, "epoch": 2519} {"train_loss": -44.28782272338867, "global_step": 304913, "epoch": 2519} {"train_loss": -44.4459342956543, "global_step": 304914, "epoch": 2519} {"train_loss": -44.22080993652344, "global_step": 304915, "epoch": 2519} {"train_loss": -44.454586029052734, "global_step": 304916, "epoch": 2519} {"train_loss": -44.14913558959961, "global_step": 304917, "epoch": 2519} {"train_loss": -44.28876876831055, "global_step": 304918, "epoch": 2519} {"train_loss": -42.397103806172524, "global_step": 304919, "epoch": 2519, "val_loss": 2589709.0} {"train_loss": -43.895904541015625, "global_step": 304920, "epoch": 2520} {"train_loss": -44.09793472290039, "global_step": 304921, "epoch": 2520} {"train_loss": -44.35091781616211, "global_step": 304922, "epoch": 2520} {"train_loss": -44.5467529296875, "global_step": 304923, "epoch": 2520} {"train_loss": -44.456199645996094, "global_step": 304924, "epoch": 2520} {"train_loss": -44.42570114135742, "global_step": 304925, "epoch": 2520} {"train_loss": -44.702999114990234, "global_step": 304926, "epoch": 2520} {"train_loss": -43.71404266357422, "global_step": 304927, "epoch": 2520} {"train_loss": -44.632938385009766, "global_step": 304928, "epoch": 2520} {"train_loss": -44.89603805541992, "global_step": 304929, "epoch": 2520} {"train_loss": -44.37147903442383, "global_step": 304930, "epoch": 2520} {"train_loss": -44.47383499145508, "global_step": 304931, "epoch": 2520} {"train_loss": -44.76821517944336, "global_step": 304932, "epoch": 2520} {"train_loss": -44.366065979003906, "global_step": 304933, "epoch": 2520} {"train_loss": -44.20558547973633, "global_step": 304934, "epoch": 2520} {"train_loss": -44.03826904296875, "global_step": 304935, "epoch": 2520} {"train_loss": -43.49503707885742, "global_step": 304936, "epoch": 2520} {"train_loss": -42.49264144897461, "global_step": 304937, "epoch": 2520} {"train_loss": -41.19923782348633, "global_step": 304938, "epoch": 2520} {"train_loss": -37.10365676879883, "global_step": 304939, "epoch": 2520} {"train_loss": -32.97869873046875, "global_step": 304940, "epoch": 2520} {"train_loss": -34.839996337890625, "global_step": 304941, "epoch": 2520} {"train_loss": -40.08745193481445, "global_step": 304942, "epoch": 2520} {"train_loss": -42.364051818847656, "global_step": 304943, "epoch": 2520} {"train_loss": -39.35137939453125, "global_step": 304944, "epoch": 2520} {"train_loss": -40.63985061645508, "global_step": 304945, "epoch": 2520} {"train_loss": -42.547821044921875, "global_step": 304946, "epoch": 2520} {"train_loss": -42.07395553588867, "global_step": 304947, "epoch": 2520} {"train_loss": -40.9420166015625, "global_step": 304948, "epoch": 2520} {"train_loss": -43.01205062866211, "global_step": 304949, "epoch": 2520} {"train_loss": -42.069236755371094, "global_step": 304950, "epoch": 2520} {"train_loss": -39.42472457885742, "global_step": 304951, "epoch": 2520} {"train_loss": -41.8422966003418, "global_step": 304952, "epoch": 2520} {"train_loss": -42.011146545410156, "global_step": 304953, "epoch": 2520} {"train_loss": -40.84552001953125, "global_step": 304954, "epoch": 2520} {"train_loss": -40.60197067260742, "global_step": 304955, "epoch": 2520} {"train_loss": -39.92061996459961, "global_step": 304956, "epoch": 2520} {"train_loss": -41.84772491455078, "global_step": 304957, "epoch": 2520} {"train_loss": -41.93635177612305, "global_step": 304958, "epoch": 2520} {"train_loss": -39.890316009521484, "global_step": 304959, "epoch": 2520} {"train_loss": -42.605918884277344, "global_step": 304960, "epoch": 2520} {"train_loss": -41.382381439208984, "global_step": 304961, "epoch": 2520} {"train_loss": -41.882869720458984, "global_step": 304962, "epoch": 2520} {"train_loss": -41.648681640625, "global_step": 304963, "epoch": 2520} {"train_loss": -42.16267776489258, "global_step": 304964, "epoch": 2520} {"train_loss": -42.34345626831055, "global_step": 304965, "epoch": 2520} {"train_loss": -41.92148971557617, "global_step": 304966, "epoch": 2520} {"train_loss": -42.55062484741211, "global_step": 304967, "epoch": 2520} {"train_loss": -42.87815475463867, "global_step": 304968, "epoch": 2520} {"train_loss": -42.72420883178711, "global_step": 304969, "epoch": 2520} {"train_loss": -43.354698181152344, "global_step": 304970, "epoch": 2520} {"train_loss": -42.69927978515625, "global_step": 304971, "epoch": 2520} {"train_loss": -43.1092643737793, "global_step": 304972, "epoch": 2520} {"train_loss": -43.52865219116211, "global_step": 304973, "epoch": 2520} {"train_loss": -43.25287628173828, "global_step": 304974, "epoch": 2520} {"train_loss": -43.429969787597656, "global_step": 304975, "epoch": 2520} {"train_loss": -42.725120544433594, "global_step": 304976, "epoch": 2520} {"train_loss": -43.203529357910156, "global_step": 304977, "epoch": 2520} {"train_loss": -42.32638931274414, "global_step": 304978, "epoch": 2520} {"train_loss": -43.33671569824219, "global_step": 304979, "epoch": 2520} {"train_loss": -43.229942321777344, "global_step": 304980, "epoch": 2520} {"train_loss": -43.4996337890625, "global_step": 304981, "epoch": 2520} {"train_loss": -43.27875518798828, "global_step": 304982, "epoch": 2520} {"train_loss": -43.5821418762207, "global_step": 304983, "epoch": 2520} {"train_loss": -43.0183219909668, "global_step": 304984, "epoch": 2520} {"train_loss": -42.89823532104492, "global_step": 304985, "epoch": 2520} {"train_loss": -43.27797317504883, "global_step": 304986, "epoch": 2520} {"train_loss": -43.03258514404297, "global_step": 304987, "epoch": 2520} {"train_loss": -43.946590423583984, "global_step": 304988, "epoch": 2520} {"train_loss": -43.4005126953125, "global_step": 304989, "epoch": 2520} {"train_loss": -43.8127555847168, "global_step": 304990, "epoch": 2520} {"train_loss": -43.20127487182617, "global_step": 304991, "epoch": 2520} {"train_loss": -43.87789535522461, "global_step": 304992, "epoch": 2520} {"train_loss": -43.4552116394043, "global_step": 304993, "epoch": 2520} {"train_loss": -43.494808197021484, "global_step": 304994, "epoch": 2520} {"train_loss": -43.3515739440918, "global_step": 304995, "epoch": 2520} {"train_loss": -43.54372024536133, "global_step": 304996, "epoch": 2520} {"train_loss": -43.16563034057617, "global_step": 304997, "epoch": 2520} {"train_loss": -43.6911735534668, "global_step": 304998, "epoch": 2520} {"train_loss": -43.825408935546875, "global_step": 304999, "epoch": 2520} {"train_loss": -43.00011444091797, "global_step": 305000, "epoch": 2520} {"train_loss": -43.23734664916992, "global_step": 305001, "epoch": 2520} {"train_loss": -43.31373977661133, "global_step": 305002, "epoch": 2520} {"train_loss": -43.855892181396484, "global_step": 305003, "epoch": 2520} {"train_loss": -43.25071334838867, "global_step": 305004, "epoch": 2520} {"train_loss": -43.46513366699219, "global_step": 305005, "epoch": 2520} {"train_loss": -43.704837799072266, "global_step": 305006, "epoch": 2520} {"train_loss": -42.666175842285156, "global_step": 305007, "epoch": 2520} {"train_loss": -42.74484634399414, "global_step": 305008, "epoch": 2520} {"train_loss": -43.79484176635742, "global_step": 305009, "epoch": 2520} {"train_loss": -43.170467376708984, "global_step": 305010, "epoch": 2520} {"train_loss": -43.61445999145508, "global_step": 305011, "epoch": 2520} {"train_loss": -43.98698806762695, "global_step": 305012, "epoch": 2520} {"train_loss": -43.88608932495117, "global_step": 305013, "epoch": 2520} {"train_loss": -44.407894134521484, "global_step": 305014, "epoch": 2520} {"train_loss": -43.37600326538086, "global_step": 305015, "epoch": 2520} {"train_loss": -44.31441879272461, "global_step": 305016, "epoch": 2520} {"train_loss": -43.399696350097656, "global_step": 305017, "epoch": 2520} {"train_loss": -44.278656005859375, "global_step": 305018, "epoch": 2520} {"train_loss": -43.49904251098633, "global_step": 305019, "epoch": 2520} {"train_loss": -43.718971252441406, "global_step": 305020, "epoch": 2520} {"train_loss": -44.27460479736328, "global_step": 305021, "epoch": 2520} {"train_loss": -44.00362014770508, "global_step": 305022, "epoch": 2520} {"train_loss": -44.434051513671875, "global_step": 305023, "epoch": 2520} {"train_loss": -44.35264587402344, "global_step": 305024, "epoch": 2520} {"train_loss": -44.00522994995117, "global_step": 305025, "epoch": 2520} {"train_loss": -44.55316925048828, "global_step": 305026, "epoch": 2520} {"train_loss": -44.75765609741211, "global_step": 305027, "epoch": 2520} {"train_loss": -43.641029357910156, "global_step": 305028, "epoch": 2520} {"train_loss": -43.98216247558594, "global_step": 305029, "epoch": 2520} {"train_loss": -44.09333801269531, "global_step": 305030, "epoch": 2520} {"train_loss": -43.40436935424805, "global_step": 305031, "epoch": 2520} {"train_loss": -44.16652297973633, "global_step": 305032, "epoch": 2520} {"train_loss": -44.409149169921875, "global_step": 305033, "epoch": 2520} {"train_loss": -44.046627044677734, "global_step": 305034, "epoch": 2520} {"train_loss": -44.03032302856445, "global_step": 305035, "epoch": 2520} {"train_loss": -44.082252502441406, "global_step": 305036, "epoch": 2520} {"train_loss": -43.949432373046875, "global_step": 305037, "epoch": 2520} {"train_loss": -43.87827682495117, "global_step": 305038, "epoch": 2520} {"train_loss": -43.567508697509766, "global_step": 305039, "epoch": 2520} {"train_loss": -42.98685846249919, "global_step": 305040, "epoch": 2520, "val_loss": 2573014.25} {"train_loss": -44.211822509765625, "global_step": 305041, "epoch": 2521} {"train_loss": -43.63888168334961, "global_step": 305042, "epoch": 2521} {"train_loss": -43.75202178955078, "global_step": 305043, "epoch": 2521} {"train_loss": -43.7806510925293, "global_step": 305044, "epoch": 2521} {"train_loss": -43.893348693847656, "global_step": 305045, "epoch": 2521} {"train_loss": -43.472198486328125, "global_step": 305046, "epoch": 2521} {"train_loss": -42.37361145019531, "global_step": 305047, "epoch": 2521} {"train_loss": -41.85640335083008, "global_step": 305048, "epoch": 2521} {"train_loss": -41.55381774902344, "global_step": 305049, "epoch": 2521} {"train_loss": -41.34082794189453, "global_step": 305050, "epoch": 2521} {"train_loss": -43.44475555419922, "global_step": 305051, "epoch": 2521} {"train_loss": -44.143646240234375, "global_step": 305052, "epoch": 2521} {"train_loss": -42.802581787109375, "global_step": 305053, "epoch": 2521} {"train_loss": -42.4470100402832, "global_step": 305054, "epoch": 2521} {"train_loss": -41.67266845703125, "global_step": 305055, "epoch": 2521} {"train_loss": -42.991085052490234, "global_step": 305056, "epoch": 2521} {"train_loss": -43.532073974609375, "global_step": 305057, "epoch": 2521} {"train_loss": -43.846309661865234, "global_step": 305058, "epoch": 2521} {"train_loss": -42.98566436767578, "global_step": 305059, "epoch": 2521} {"train_loss": -43.34198760986328, "global_step": 305060, "epoch": 2521} {"train_loss": -43.9211540222168, "global_step": 305061, "epoch": 2521} {"train_loss": -43.19218444824219, "global_step": 305062, "epoch": 2521} {"train_loss": -43.37205123901367, "global_step": 305063, "epoch": 2521} {"train_loss": -42.12800598144531, "global_step": 305064, "epoch": 2521} {"train_loss": -42.57889938354492, "global_step": 305065, "epoch": 2521} {"train_loss": -43.24066925048828, "global_step": 305066, "epoch": 2521} {"train_loss": -42.92475509643555, "global_step": 305067, "epoch": 2521} {"train_loss": -42.921688079833984, "global_step": 305068, "epoch": 2521} {"train_loss": -44.004940032958984, "global_step": 305069, "epoch": 2521} {"train_loss": -44.07821273803711, "global_step": 305070, "epoch": 2521} {"train_loss": -43.491233825683594, "global_step": 305071, "epoch": 2521} {"train_loss": -41.946781158447266, "global_step": 305072, "epoch": 2521} {"train_loss": -43.0516242980957, "global_step": 305073, "epoch": 2521} {"train_loss": -41.59251022338867, "global_step": 305074, "epoch": 2521} {"train_loss": -42.33143615722656, "global_step": 305075, "epoch": 2521} {"train_loss": -34.708072662353516, "global_step": 305076, "epoch": 2521} {"train_loss": -39.68748092651367, "global_step": 305077, "epoch": 2521} {"train_loss": -42.81510543823242, "global_step": 305078, "epoch": 2521} {"train_loss": -42.204750061035156, "global_step": 305079, "epoch": 2521} {"train_loss": -42.10954666137695, "global_step": 305080, "epoch": 2521} {"train_loss": -43.337677001953125, "global_step": 305081, "epoch": 2521} {"train_loss": -35.61384201049805, "global_step": 305082, "epoch": 2521} {"train_loss": -42.85515213012695, "global_step": 305083, "epoch": 2521} {"train_loss": -43.55057907104492, "global_step": 305084, "epoch": 2521} {"train_loss": -42.77003479003906, "global_step": 305085, "epoch": 2521} {"train_loss": -43.25385665893555, "global_step": 305086, "epoch": 2521} {"train_loss": -42.061458587646484, "global_step": 305087, "epoch": 2521} {"train_loss": -43.10966491699219, "global_step": 305088, "epoch": 2521} {"train_loss": -43.114227294921875, "global_step": 305089, "epoch": 2521} {"train_loss": -42.7508544921875, "global_step": 305090, "epoch": 2521} {"train_loss": -42.746517181396484, "global_step": 305091, "epoch": 2521} {"train_loss": -44.00175476074219, "global_step": 305092, "epoch": 2521} {"train_loss": -43.05226135253906, "global_step": 305093, "epoch": 2521} {"train_loss": -43.53950500488281, "global_step": 305094, "epoch": 2521} {"train_loss": -43.28497314453125, "global_step": 305095, "epoch": 2521} {"train_loss": -42.91108322143555, "global_step": 305096, "epoch": 2521} {"train_loss": -43.816070556640625, "global_step": 305097, "epoch": 2521} {"train_loss": -43.30770492553711, "global_step": 305098, "epoch": 2521} {"train_loss": -43.456790924072266, "global_step": 305099, "epoch": 2521} {"train_loss": -43.616390228271484, "global_step": 305100, "epoch": 2521} {"train_loss": -43.16618347167969, "global_step": 305101, "epoch": 2521} {"train_loss": -43.6201286315918, "global_step": 305102, "epoch": 2521} {"train_loss": -43.483577728271484, "global_step": 305103, "epoch": 2521} {"train_loss": -41.96517562866211, "global_step": 305104, "epoch": 2521} {"train_loss": -42.598114013671875, "global_step": 305105, "epoch": 2521} {"train_loss": -43.517757415771484, "global_step": 305106, "epoch": 2521} {"train_loss": -43.37381362915039, "global_step": 305107, "epoch": 2521} {"train_loss": -43.45029830932617, "global_step": 305108, "epoch": 2521} {"train_loss": -43.954837799072266, "global_step": 305109, "epoch": 2521} {"train_loss": -43.71531295776367, "global_step": 305110, "epoch": 2521} {"train_loss": -44.31980514526367, "global_step": 305111, "epoch": 2521} {"train_loss": -43.82464599609375, "global_step": 305112, "epoch": 2521} {"train_loss": -43.271968841552734, "global_step": 305113, "epoch": 2521} {"train_loss": -43.86836624145508, "global_step": 305114, "epoch": 2521} {"train_loss": -44.02915573120117, "global_step": 305115, "epoch": 2521} {"train_loss": -42.89693069458008, "global_step": 305116, "epoch": 2521} {"train_loss": -43.56387710571289, "global_step": 305117, "epoch": 2521} {"train_loss": -43.394691467285156, "global_step": 305118, "epoch": 2521} {"train_loss": -42.8904914855957, "global_step": 305119, "epoch": 2521} {"train_loss": -42.943153381347656, "global_step": 305120, "epoch": 2521} {"train_loss": -43.4326286315918, "global_step": 305121, "epoch": 2521} {"train_loss": -43.81766891479492, "global_step": 305122, "epoch": 2521} {"train_loss": -43.370792388916016, "global_step": 305123, "epoch": 2521} {"train_loss": -43.844966888427734, "global_step": 305124, "epoch": 2521} {"train_loss": -44.243560791015625, "global_step": 305125, "epoch": 2521} {"train_loss": -43.776702880859375, "global_step": 305126, "epoch": 2521} {"train_loss": -43.79737854003906, "global_step": 305127, "epoch": 2521} {"train_loss": -43.85810089111328, "global_step": 305128, "epoch": 2521} {"train_loss": -44.29386520385742, "global_step": 305129, "epoch": 2521} {"train_loss": -44.15145492553711, "global_step": 305130, "epoch": 2521} {"train_loss": -42.714813232421875, "global_step": 305131, "epoch": 2521} {"train_loss": -43.83024215698242, "global_step": 305132, "epoch": 2521} {"train_loss": -44.464271545410156, "global_step": 305133, "epoch": 2521} {"train_loss": -43.32328414916992, "global_step": 305134, "epoch": 2521} {"train_loss": -43.304588317871094, "global_step": 305135, "epoch": 2521} {"train_loss": -43.90653610229492, "global_step": 305136, "epoch": 2521} {"train_loss": -43.97624206542969, "global_step": 305137, "epoch": 2521} {"train_loss": -43.91213607788086, "global_step": 305138, "epoch": 2521} {"train_loss": -43.88667678833008, "global_step": 305139, "epoch": 2521} {"train_loss": -44.04872512817383, "global_step": 305140, "epoch": 2521} {"train_loss": -43.965572357177734, "global_step": 305141, "epoch": 2521} {"train_loss": -42.71149444580078, "global_step": 305142, "epoch": 2521} {"train_loss": -43.26939010620117, "global_step": 305143, "epoch": 2521} {"train_loss": -43.360286712646484, "global_step": 305144, "epoch": 2521} {"train_loss": -42.32371520996094, "global_step": 305145, "epoch": 2521} {"train_loss": -41.62699508666992, "global_step": 305146, "epoch": 2521} {"train_loss": -43.259056091308594, "global_step": 305147, "epoch": 2521} {"train_loss": -43.35010528564453, "global_step": 305148, "epoch": 2521} {"train_loss": -42.51401901245117, "global_step": 305149, "epoch": 2521} {"train_loss": -42.37739181518555, "global_step": 305150, "epoch": 2521} {"train_loss": -42.61388397216797, "global_step": 305151, "epoch": 2521} {"train_loss": -43.921142578125, "global_step": 305152, "epoch": 2521} {"train_loss": -43.48230743408203, "global_step": 305153, "epoch": 2521} {"train_loss": -42.87173080444336, "global_step": 305154, "epoch": 2521} {"train_loss": -42.780120849609375, "global_step": 305155, "epoch": 2521} {"train_loss": -43.471675872802734, "global_step": 305156, "epoch": 2521} {"train_loss": -43.619136810302734, "global_step": 305157, "epoch": 2521} {"train_loss": -42.95093536376953, "global_step": 305158, "epoch": 2521} {"train_loss": -42.29213333129883, "global_step": 305159, "epoch": 2521} {"train_loss": -43.857093811035156, "global_step": 305160, "epoch": 2521} {"train_loss": -43.06979108447871, "global_step": 305161, "epoch": 2521, "val_loss": 2771995.25} {"train_loss": -42.08383560180664, "global_step": 305162, "epoch": 2522} {"train_loss": -41.365325927734375, "global_step": 305163, "epoch": 2522} {"train_loss": -43.44535446166992, "global_step": 305164, "epoch": 2522} {"train_loss": -43.51176071166992, "global_step": 305165, "epoch": 2522} {"train_loss": -42.82797622680664, "global_step": 305166, "epoch": 2522} {"train_loss": -42.60129928588867, "global_step": 305167, "epoch": 2522} {"train_loss": -43.250572204589844, "global_step": 305168, "epoch": 2522} {"train_loss": -42.4859733581543, "global_step": 305169, "epoch": 2522} {"train_loss": -43.25682830810547, "global_step": 305170, "epoch": 2522} {"train_loss": -44.248016357421875, "global_step": 305171, "epoch": 2522} {"train_loss": -42.152584075927734, "global_step": 305172, "epoch": 2522} {"train_loss": -42.454322814941406, "global_step": 305173, "epoch": 2522} {"train_loss": -43.695926666259766, "global_step": 305174, "epoch": 2522} {"train_loss": -42.91642379760742, "global_step": 305175, "epoch": 2522} {"train_loss": -43.25812530517578, "global_step": 305176, "epoch": 2522} {"train_loss": -43.997802734375, "global_step": 305177, "epoch": 2522} {"train_loss": -43.26279067993164, "global_step": 305178, "epoch": 2522} {"train_loss": -43.89599609375, "global_step": 305179, "epoch": 2522} {"train_loss": -43.976654052734375, "global_step": 305180, "epoch": 2522} {"train_loss": -43.48012924194336, "global_step": 305181, "epoch": 2522} {"train_loss": -43.60603713989258, "global_step": 305182, "epoch": 2522} {"train_loss": -43.51369094848633, "global_step": 305183, "epoch": 2522} {"train_loss": -43.793766021728516, "global_step": 305184, "epoch": 2522} {"train_loss": -44.275535583496094, "global_step": 305185, "epoch": 2522} {"train_loss": -43.67170333862305, "global_step": 305186, "epoch": 2522} {"train_loss": -44.134098052978516, "global_step": 305187, "epoch": 2522} {"train_loss": -44.207313537597656, "global_step": 305188, "epoch": 2522} {"train_loss": -43.918861389160156, "global_step": 305189, "epoch": 2522} {"train_loss": -43.083709716796875, "global_step": 305190, "epoch": 2522} {"train_loss": -43.61922836303711, "global_step": 305191, "epoch": 2522} {"train_loss": -43.92676544189453, "global_step": 305192, "epoch": 2522} {"train_loss": -44.51836013793945, "global_step": 305193, "epoch": 2522} {"train_loss": -44.30499267578125, "global_step": 305194, "epoch": 2522} {"train_loss": -44.24850082397461, "global_step": 305195, "epoch": 2522} {"train_loss": -44.311256408691406, "global_step": 305196, "epoch": 2522} {"train_loss": -44.06917953491211, "global_step": 305197, "epoch": 2522} {"train_loss": -43.4878044128418, "global_step": 305198, "epoch": 2522} {"train_loss": -44.4591178894043, "global_step": 305199, "epoch": 2522} {"train_loss": -44.72446823120117, "global_step": 305200, "epoch": 2522} {"train_loss": -43.61027145385742, "global_step": 305201, "epoch": 2522} {"train_loss": -43.17596435546875, "global_step": 305202, "epoch": 2522} {"train_loss": -43.797325134277344, "global_step": 305203, "epoch": 2522} {"train_loss": -44.59200668334961, "global_step": 305204, "epoch": 2522} {"train_loss": -44.62057113647461, "global_step": 305205, "epoch": 2522} {"train_loss": -44.81441116333008, "global_step": 305206, "epoch": 2522} {"train_loss": -43.846832275390625, "global_step": 305207, "epoch": 2522} {"train_loss": -43.95510482788086, "global_step": 305208, "epoch": 2522} {"train_loss": -44.15061569213867, "global_step": 305209, "epoch": 2522} {"train_loss": -44.242897033691406, "global_step": 305210, "epoch": 2522} {"train_loss": -43.88886260986328, "global_step": 305211, "epoch": 2522} {"train_loss": -44.15131378173828, "global_step": 305212, "epoch": 2522} {"train_loss": -44.381927490234375, "global_step": 305213, "epoch": 2522} {"train_loss": -44.71859359741211, "global_step": 305214, "epoch": 2522} {"train_loss": -43.528133392333984, "global_step": 305215, "epoch": 2522} {"train_loss": -44.26970672607422, "global_step": 305216, "epoch": 2522} {"train_loss": -44.36893844604492, "global_step": 305217, "epoch": 2522} {"train_loss": -44.09177780151367, "global_step": 305218, "epoch": 2522} {"train_loss": -43.97706985473633, "global_step": 305219, "epoch": 2522} {"train_loss": -44.18861389160156, "global_step": 305220, "epoch": 2522} {"train_loss": -42.8145751953125, "global_step": 305221, "epoch": 2522} {"train_loss": -42.89183044433594, "global_step": 305222, "epoch": 2522} {"train_loss": -44.0788688659668, "global_step": 305223, "epoch": 2522} {"train_loss": -43.825992584228516, "global_step": 305224, "epoch": 2522} {"train_loss": -43.019989013671875, "global_step": 305225, "epoch": 2522} {"train_loss": -43.547271728515625, "global_step": 305226, "epoch": 2522} {"train_loss": -43.79314422607422, "global_step": 305227, "epoch": 2522} {"train_loss": -43.19529342651367, "global_step": 305228, "epoch": 2522} {"train_loss": -43.99485397338867, "global_step": 305229, "epoch": 2522} {"train_loss": -43.89118576049805, "global_step": 305230, "epoch": 2522} {"train_loss": -41.826663970947266, "global_step": 305231, "epoch": 2522} {"train_loss": -40.59530258178711, "global_step": 305232, "epoch": 2522} {"train_loss": -42.48659133911133, "global_step": 305233, "epoch": 2522} {"train_loss": -42.575965881347656, "global_step": 305234, "epoch": 2522} {"train_loss": -42.37685012817383, "global_step": 305235, "epoch": 2522} {"train_loss": -41.22793197631836, "global_step": 305236, "epoch": 2522} {"train_loss": -42.76372146606445, "global_step": 305237, "epoch": 2522} {"train_loss": -42.0302734375, "global_step": 305238, "epoch": 2522} {"train_loss": -41.764434814453125, "global_step": 305239, "epoch": 2522} {"train_loss": -42.71487045288086, "global_step": 305240, "epoch": 2522} {"train_loss": -41.18845748901367, "global_step": 305241, "epoch": 2522} {"train_loss": -41.21723556518555, "global_step": 305242, "epoch": 2522} {"train_loss": -42.34482955932617, "global_step": 305243, "epoch": 2522} {"train_loss": -39.29108428955078, "global_step": 305244, "epoch": 2522} {"train_loss": -43.59853744506836, "global_step": 305245, "epoch": 2522} {"train_loss": -40.25957489013672, "global_step": 305246, "epoch": 2522} {"train_loss": -43.08866500854492, "global_step": 305247, "epoch": 2522} {"train_loss": -40.02263259887695, "global_step": 305248, "epoch": 2522} {"train_loss": -43.609092712402344, "global_step": 305249, "epoch": 2522} {"train_loss": -41.4571418762207, "global_step": 305250, "epoch": 2522} {"train_loss": -43.76491928100586, "global_step": 305251, "epoch": 2522} {"train_loss": -41.07743835449219, "global_step": 305252, "epoch": 2522} {"train_loss": -43.36465072631836, "global_step": 305253, "epoch": 2522} {"train_loss": -43.245216369628906, "global_step": 305254, "epoch": 2522} {"train_loss": -43.56199264526367, "global_step": 305255, "epoch": 2522} {"train_loss": -42.66592025756836, "global_step": 305256, "epoch": 2522} {"train_loss": -43.470123291015625, "global_step": 305257, "epoch": 2522} {"train_loss": -42.487060546875, "global_step": 305258, "epoch": 2522} {"train_loss": -43.892662048339844, "global_step": 305259, "epoch": 2522} {"train_loss": -43.186458587646484, "global_step": 305260, "epoch": 2522} {"train_loss": -42.88692092895508, "global_step": 305261, "epoch": 2522} {"train_loss": -42.870765686035156, "global_step": 305262, "epoch": 2522} {"train_loss": -43.2935905456543, "global_step": 305263, "epoch": 2522} {"train_loss": -42.50381851196289, "global_step": 305264, "epoch": 2522} {"train_loss": -43.30327224731445, "global_step": 305265, "epoch": 2522} {"train_loss": -42.84228515625, "global_step": 305266, "epoch": 2522} {"train_loss": -43.781673431396484, "global_step": 305267, "epoch": 2522} {"train_loss": -43.04308319091797, "global_step": 305268, "epoch": 2522} {"train_loss": -43.379150390625, "global_step": 305269, "epoch": 2522} {"train_loss": -43.55308532714844, "global_step": 305270, "epoch": 2522} {"train_loss": -43.5601921081543, "global_step": 305271, "epoch": 2522} {"train_loss": -43.36848449707031, "global_step": 305272, "epoch": 2522} {"train_loss": -42.840606689453125, "global_step": 305273, "epoch": 2522} {"train_loss": -42.47614288330078, "global_step": 305274, "epoch": 2522} {"train_loss": -42.262725830078125, "global_step": 305275, "epoch": 2522} {"train_loss": -42.953887939453125, "global_step": 305276, "epoch": 2522} {"train_loss": -42.33256912231445, "global_step": 305277, "epoch": 2522} {"train_loss": -43.289363861083984, "global_step": 305278, "epoch": 2522} {"train_loss": -41.13985824584961, "global_step": 305279, "epoch": 2522} {"train_loss": -43.11458206176758, "global_step": 305280, "epoch": 2522} {"train_loss": -43.019622802734375, "global_step": 305281, "epoch": 2522} {"train_loss": -43.195820106947714, "global_step": 305282, "epoch": 2522, "val_loss": 2672989.0} {"train_loss": -41.66462326049805, "global_step": 305283, "epoch": 2523} {"train_loss": -43.22964096069336, "global_step": 305284, "epoch": 2523} {"train_loss": -43.018428802490234, "global_step": 305285, "epoch": 2523} {"train_loss": -42.718807220458984, "global_step": 305286, "epoch": 2523} {"train_loss": -42.988582611083984, "global_step": 305287, "epoch": 2523} {"train_loss": -43.39979934692383, "global_step": 305288, "epoch": 2523} {"train_loss": -43.506591796875, "global_step": 305289, "epoch": 2523} {"train_loss": -42.66677474975586, "global_step": 305290, "epoch": 2523} {"train_loss": -43.76933670043945, "global_step": 305291, "epoch": 2523} {"train_loss": -43.5076789855957, "global_step": 305292, "epoch": 2523} {"train_loss": -43.26060485839844, "global_step": 305293, "epoch": 2523} {"train_loss": -43.060787200927734, "global_step": 305294, "epoch": 2523} {"train_loss": -43.23019790649414, "global_step": 305295, "epoch": 2523} {"train_loss": -43.58526611328125, "global_step": 305296, "epoch": 2523} {"train_loss": -43.3731803894043, "global_step": 305297, "epoch": 2523} {"train_loss": -43.40322494506836, "global_step": 305298, "epoch": 2523} {"train_loss": -43.752079010009766, "global_step": 305299, "epoch": 2523} {"train_loss": -43.88381576538086, "global_step": 305300, "epoch": 2523} {"train_loss": -43.1758918762207, "global_step": 305301, "epoch": 2523} {"train_loss": -44.062679290771484, "global_step": 305302, "epoch": 2523} {"train_loss": -44.086368560791016, "global_step": 305303, "epoch": 2523} {"train_loss": -43.63385772705078, "global_step": 305304, "epoch": 2523} {"train_loss": -43.797977447509766, "global_step": 305305, "epoch": 2523} {"train_loss": -43.94953155517578, "global_step": 305306, "epoch": 2523} {"train_loss": -43.6556282043457, "global_step": 305307, "epoch": 2523} {"train_loss": -44.49652099609375, "global_step": 305308, "epoch": 2523} {"train_loss": -43.39820861816406, "global_step": 305309, "epoch": 2523} {"train_loss": -43.239471435546875, "global_step": 305310, "epoch": 2523} {"train_loss": -44.26200485229492, "global_step": 305311, "epoch": 2523} {"train_loss": -43.90338134765625, "global_step": 305312, "epoch": 2523} {"train_loss": -44.18312454223633, "global_step": 305313, "epoch": 2523} {"train_loss": -44.35538864135742, "global_step": 305314, "epoch": 2523} {"train_loss": -43.9148063659668, "global_step": 305315, "epoch": 2523} {"train_loss": -44.34641647338867, "global_step": 305316, "epoch": 2523} {"train_loss": -44.55864334106445, "global_step": 305317, "epoch": 2523} {"train_loss": -44.2523307800293, "global_step": 305318, "epoch": 2523} {"train_loss": -44.33317184448242, "global_step": 305319, "epoch": 2523} {"train_loss": -42.927711486816406, "global_step": 305320, "epoch": 2523} {"train_loss": -43.581031799316406, "global_step": 305321, "epoch": 2523} {"train_loss": -44.074432373046875, "global_step": 305322, "epoch": 2523} {"train_loss": -44.169551849365234, "global_step": 305323, "epoch": 2523} {"train_loss": -43.797203063964844, "global_step": 305324, "epoch": 2523} {"train_loss": -43.65949630737305, "global_step": 305325, "epoch": 2523} {"train_loss": -43.30327224731445, "global_step": 305326, "epoch": 2523} {"train_loss": -43.77872085571289, "global_step": 305327, "epoch": 2523} {"train_loss": -43.99329376220703, "global_step": 305328, "epoch": 2523} {"train_loss": -43.95028305053711, "global_step": 305329, "epoch": 2523} {"train_loss": -43.903499603271484, "global_step": 305330, "epoch": 2523} {"train_loss": -44.596405029296875, "global_step": 305331, "epoch": 2523} {"train_loss": -44.08235549926758, "global_step": 305332, "epoch": 2523} {"train_loss": -43.38462829589844, "global_step": 305333, "epoch": 2523} {"train_loss": -42.6173210144043, "global_step": 305334, "epoch": 2523} {"train_loss": -42.56941604614258, "global_step": 305335, "epoch": 2523} {"train_loss": -43.094295501708984, "global_step": 305336, "epoch": 2523} {"train_loss": -42.708106994628906, "global_step": 305337, "epoch": 2523} {"train_loss": -43.72824478149414, "global_step": 305338, "epoch": 2523} {"train_loss": -44.65821838378906, "global_step": 305339, "epoch": 2523} {"train_loss": -43.72150802612305, "global_step": 305340, "epoch": 2523} {"train_loss": -42.40217971801758, "global_step": 305341, "epoch": 2523} {"train_loss": -44.1000862121582, "global_step": 305342, "epoch": 2523} {"train_loss": -44.347206115722656, "global_step": 305343, "epoch": 2523} {"train_loss": -42.64807891845703, "global_step": 305344, "epoch": 2523} {"train_loss": -43.53139114379883, "global_step": 305345, "epoch": 2523} {"train_loss": -42.92774200439453, "global_step": 305346, "epoch": 2523} {"train_loss": -43.10493087768555, "global_step": 305347, "epoch": 2523} {"train_loss": -43.07046127319336, "global_step": 305348, "epoch": 2523} {"train_loss": -43.79505920410156, "global_step": 305349, "epoch": 2523} {"train_loss": -42.44198226928711, "global_step": 305350, "epoch": 2523} {"train_loss": -41.86198806762695, "global_step": 305351, "epoch": 2523} {"train_loss": -43.9397087097168, "global_step": 305352, "epoch": 2523} {"train_loss": -44.52091979980469, "global_step": 305353, "epoch": 2523} {"train_loss": -42.97725296020508, "global_step": 305354, "epoch": 2523} {"train_loss": -42.50421905517578, "global_step": 305355, "epoch": 2523} {"train_loss": -43.6638069152832, "global_step": 305356, "epoch": 2523} {"train_loss": -44.32880401611328, "global_step": 305357, "epoch": 2523} {"train_loss": -42.94124984741211, "global_step": 305358, "epoch": 2523} {"train_loss": -43.19631576538086, "global_step": 305359, "epoch": 2523} {"train_loss": -44.06400680541992, "global_step": 305360, "epoch": 2523} {"train_loss": -41.77537155151367, "global_step": 305361, "epoch": 2523} {"train_loss": -44.09807586669922, "global_step": 305362, "epoch": 2523} {"train_loss": -44.53977966308594, "global_step": 305363, "epoch": 2523} {"train_loss": -43.61823654174805, "global_step": 305364, "epoch": 2523} {"train_loss": -43.096099853515625, "global_step": 305365, "epoch": 2523} {"train_loss": -42.76078414916992, "global_step": 305366, "epoch": 2523} {"train_loss": -42.333248138427734, "global_step": 305367, "epoch": 2523} {"train_loss": -42.88302230834961, "global_step": 305368, "epoch": 2523} {"train_loss": -43.34699630737305, "global_step": 305369, "epoch": 2523} {"train_loss": -44.29446792602539, "global_step": 305370, "epoch": 2523} {"train_loss": -42.59772872924805, "global_step": 305371, "epoch": 2523} {"train_loss": -41.790340423583984, "global_step": 305372, "epoch": 2523} {"train_loss": -43.761600494384766, "global_step": 305373, "epoch": 2523} {"train_loss": -39.36123275756836, "global_step": 305374, "epoch": 2523} {"train_loss": -43.84017562866211, "global_step": 305375, "epoch": 2523} {"train_loss": -39.72884750366211, "global_step": 305376, "epoch": 2523} {"train_loss": -36.775177001953125, "global_step": 305377, "epoch": 2523} {"train_loss": -40.21803665161133, "global_step": 305378, "epoch": 2523} {"train_loss": -39.812862396240234, "global_step": 305379, "epoch": 2523} {"train_loss": -38.45969772338867, "global_step": 305380, "epoch": 2523} {"train_loss": -41.223236083984375, "global_step": 305381, "epoch": 2523} {"train_loss": -39.42198181152344, "global_step": 305382, "epoch": 2523} {"train_loss": -40.8382453918457, "global_step": 305383, "epoch": 2523} {"train_loss": -38.26668167114258, "global_step": 305384, "epoch": 2523} {"train_loss": -39.45056915283203, "global_step": 305385, "epoch": 2523} {"train_loss": -40.46232223510742, "global_step": 305386, "epoch": 2523} {"train_loss": -39.860694885253906, "global_step": 305387, "epoch": 2523} {"train_loss": -40.904502868652344, "global_step": 305388, "epoch": 2523} {"train_loss": -41.60435104370117, "global_step": 305389, "epoch": 2523} {"train_loss": -41.94819641113281, "global_step": 305390, "epoch": 2523} {"train_loss": -40.43210220336914, "global_step": 305391, "epoch": 2523} {"train_loss": -41.63435745239258, "global_step": 305392, "epoch": 2523} {"train_loss": -40.926063537597656, "global_step": 305393, "epoch": 2523} {"train_loss": -40.615028381347656, "global_step": 305394, "epoch": 2523} {"train_loss": -41.710609436035156, "global_step": 305395, "epoch": 2523} {"train_loss": -39.925804138183594, "global_step": 305396, "epoch": 2523} {"train_loss": -41.763458251953125, "global_step": 305397, "epoch": 2523} {"train_loss": -41.81989288330078, "global_step": 305398, "epoch": 2523} {"train_loss": -41.561561584472656, "global_step": 305399, "epoch": 2523} {"train_loss": -42.41801834106445, "global_step": 305400, "epoch": 2523} {"train_loss": -42.06875228881836, "global_step": 305401, "epoch": 2523} {"train_loss": -42.129852294921875, "global_step": 305402, "epoch": 2523} {"train_loss": -42.80047389889552, "global_step": 305403, "epoch": 2523, "val_loss": 2584600.75} {"train_loss": -41.98765182495117, "global_step": 305404, "epoch": 2524} {"train_loss": -42.681251525878906, "global_step": 305405, "epoch": 2524} {"train_loss": -42.08502197265625, "global_step": 305406, "epoch": 2524} {"train_loss": -42.29399490356445, "global_step": 305407, "epoch": 2524} {"train_loss": -42.88202667236328, "global_step": 305408, "epoch": 2524} {"train_loss": -42.32106018066406, "global_step": 305409, "epoch": 2524} {"train_loss": -42.57261276245117, "global_step": 305410, "epoch": 2524} {"train_loss": -43.1926155090332, "global_step": 305411, "epoch": 2524} {"train_loss": -42.53618240356445, "global_step": 305412, "epoch": 2524} {"train_loss": -42.49972915649414, "global_step": 305413, "epoch": 2524} {"train_loss": -43.5218391418457, "global_step": 305414, "epoch": 2524} {"train_loss": -42.7650260925293, "global_step": 305415, "epoch": 2524} {"train_loss": -43.106689453125, "global_step": 305416, "epoch": 2524} {"train_loss": -42.91245651245117, "global_step": 305417, "epoch": 2524} {"train_loss": -43.67995071411133, "global_step": 305418, "epoch": 2524} {"train_loss": -43.38068389892578, "global_step": 305419, "epoch": 2524} {"train_loss": -43.62766647338867, "global_step": 305420, "epoch": 2524} {"train_loss": -43.25520324707031, "global_step": 305421, "epoch": 2524} {"train_loss": -43.837890625, "global_step": 305422, "epoch": 2524} {"train_loss": -43.8556022644043, "global_step": 305423, "epoch": 2524} {"train_loss": -44.06453323364258, "global_step": 305424, "epoch": 2524} {"train_loss": -43.69332504272461, "global_step": 305425, "epoch": 2524} {"train_loss": -43.66547775268555, "global_step": 305426, "epoch": 2524} {"train_loss": -43.7598762512207, "global_step": 305427, "epoch": 2524} {"train_loss": -43.9775276184082, "global_step": 305428, "epoch": 2524} {"train_loss": -43.684200286865234, "global_step": 305429, "epoch": 2524} {"train_loss": -43.934173583984375, "global_step": 305430, "epoch": 2524} {"train_loss": -43.506263732910156, "global_step": 305431, "epoch": 2524} {"train_loss": -44.06001281738281, "global_step": 305432, "epoch": 2524} {"train_loss": -43.59402847290039, "global_step": 305433, "epoch": 2524} {"train_loss": -43.57029342651367, "global_step": 305434, "epoch": 2524} {"train_loss": -43.42010498046875, "global_step": 305435, "epoch": 2524} {"train_loss": -43.98081588745117, "global_step": 305436, "epoch": 2524} {"train_loss": -44.356170654296875, "global_step": 305437, "epoch": 2524} {"train_loss": -44.05781936645508, "global_step": 305438, "epoch": 2524} {"train_loss": -44.09647750854492, "global_step": 305439, "epoch": 2524} {"train_loss": -44.290157318115234, "global_step": 305440, "epoch": 2524} {"train_loss": -44.57240676879883, "global_step": 305441, "epoch": 2524} {"train_loss": -44.51241683959961, "global_step": 305442, "epoch": 2524} {"train_loss": -44.541969299316406, "global_step": 305443, "epoch": 2524} {"train_loss": -44.32533264160156, "global_step": 305444, "epoch": 2524} {"train_loss": -44.61872100830078, "global_step": 305445, "epoch": 2524} {"train_loss": -44.711883544921875, "global_step": 305446, "epoch": 2524} {"train_loss": -44.52919006347656, "global_step": 305447, "epoch": 2524} {"train_loss": -44.443885803222656, "global_step": 305448, "epoch": 2524} {"train_loss": -44.535518646240234, "global_step": 305449, "epoch": 2524} {"train_loss": -44.51420974731445, "global_step": 305450, "epoch": 2524} {"train_loss": -44.53597640991211, "global_step": 305451, "epoch": 2524} {"train_loss": -44.47383499145508, "global_step": 305452, "epoch": 2524} {"train_loss": -44.69002914428711, "global_step": 305453, "epoch": 2524} {"train_loss": -44.52939987182617, "global_step": 305454, "epoch": 2524} {"train_loss": -44.819217681884766, "global_step": 305455, "epoch": 2524} {"train_loss": -44.78867721557617, "global_step": 305456, "epoch": 2524} {"train_loss": -44.69658660888672, "global_step": 305457, "epoch": 2524} {"train_loss": -44.42104721069336, "global_step": 305458, "epoch": 2524} {"train_loss": -45.06716537475586, "global_step": 305459, "epoch": 2524} {"train_loss": -44.36790084838867, "global_step": 305460, "epoch": 2524} {"train_loss": -43.84499740600586, "global_step": 305461, "epoch": 2524} {"train_loss": -44.34565734863281, "global_step": 305462, "epoch": 2524} {"train_loss": -44.57255172729492, "global_step": 305463, "epoch": 2524} {"train_loss": -44.574180603027344, "global_step": 305464, "epoch": 2524} {"train_loss": -44.46503448486328, "global_step": 305465, "epoch": 2524} {"train_loss": -44.44830322265625, "global_step": 305466, "epoch": 2524} {"train_loss": -44.290340423583984, "global_step": 305467, "epoch": 2524} {"train_loss": -43.643768310546875, "global_step": 305468, "epoch": 2524} {"train_loss": -44.24388885498047, "global_step": 305469, "epoch": 2524} {"train_loss": -44.28594970703125, "global_step": 305470, "epoch": 2524} {"train_loss": -43.76521682739258, "global_step": 305471, "epoch": 2524} {"train_loss": -44.041316986083984, "global_step": 305472, "epoch": 2524} {"train_loss": -44.771358489990234, "global_step": 305473, "epoch": 2524} {"train_loss": -43.9947624206543, "global_step": 305474, "epoch": 2524} {"train_loss": -43.14720916748047, "global_step": 305475, "epoch": 2524} {"train_loss": -44.341617584228516, "global_step": 305476, "epoch": 2524} {"train_loss": -43.918392181396484, "global_step": 305477, "epoch": 2524} {"train_loss": -43.044429779052734, "global_step": 305478, "epoch": 2524} {"train_loss": -43.35533142089844, "global_step": 305479, "epoch": 2524} {"train_loss": -44.133880615234375, "global_step": 305480, "epoch": 2524} {"train_loss": -42.766048431396484, "global_step": 305481, "epoch": 2524} {"train_loss": -43.84556198120117, "global_step": 305482, "epoch": 2524} {"train_loss": -43.772064208984375, "global_step": 305483, "epoch": 2524} {"train_loss": -42.86593246459961, "global_step": 305484, "epoch": 2524} {"train_loss": -42.64458084106445, "global_step": 305485, "epoch": 2524} {"train_loss": -41.91460037231445, "global_step": 305486, "epoch": 2524} {"train_loss": -42.49784469604492, "global_step": 305487, "epoch": 2524} {"train_loss": -43.08890914916992, "global_step": 305488, "epoch": 2524} {"train_loss": -41.8969612121582, "global_step": 305489, "epoch": 2524} {"train_loss": -41.73584747314453, "global_step": 305490, "epoch": 2524} {"train_loss": -43.97815704345703, "global_step": 305491, "epoch": 2524} {"train_loss": -41.869754791259766, "global_step": 305492, "epoch": 2524} {"train_loss": -42.39957809448242, "global_step": 305493, "epoch": 2524} {"train_loss": -43.69961166381836, "global_step": 305494, "epoch": 2524} {"train_loss": -42.58709716796875, "global_step": 305495, "epoch": 2524} {"train_loss": -42.24723434448242, "global_step": 305496, "epoch": 2524} {"train_loss": -43.40470504760742, "global_step": 305497, "epoch": 2524} {"train_loss": -42.34774398803711, "global_step": 305498, "epoch": 2524} {"train_loss": -43.73379898071289, "global_step": 305499, "epoch": 2524} {"train_loss": -43.1946907043457, "global_step": 305500, "epoch": 2524} {"train_loss": -43.174232482910156, "global_step": 305501, "epoch": 2524} {"train_loss": -44.13465118408203, "global_step": 305502, "epoch": 2524} {"train_loss": -43.502986907958984, "global_step": 305503, "epoch": 2524} {"train_loss": -43.71590042114258, "global_step": 305504, "epoch": 2524} {"train_loss": -43.41450881958008, "global_step": 305505, "epoch": 2524} {"train_loss": -43.39509582519531, "global_step": 305506, "epoch": 2524} {"train_loss": -42.810543060302734, "global_step": 305507, "epoch": 2524} {"train_loss": -43.639739990234375, "global_step": 305508, "epoch": 2524} {"train_loss": -43.79541015625, "global_step": 305509, "epoch": 2524} {"train_loss": -43.26179504394531, "global_step": 305510, "epoch": 2524} {"train_loss": -43.201297760009766, "global_step": 305511, "epoch": 2524} {"train_loss": -43.72075271606445, "global_step": 305512, "epoch": 2524} {"train_loss": -43.29602813720703, "global_step": 305513, "epoch": 2524} {"train_loss": -43.646846771240234, "global_step": 305514, "epoch": 2524} {"train_loss": -43.21364212036133, "global_step": 305515, "epoch": 2524} {"train_loss": -42.94700241088867, "global_step": 305516, "epoch": 2524} {"train_loss": -42.95947265625, "global_step": 305517, "epoch": 2524} {"train_loss": -44.353271484375, "global_step": 305518, "epoch": 2524} {"train_loss": -43.214420318603516, "global_step": 305519, "epoch": 2524} {"train_loss": -42.7400016784668, "global_step": 305520, "epoch": 2524} {"train_loss": -43.185546875, "global_step": 305521, "epoch": 2524} {"train_loss": -44.263668060302734, "global_step": 305522, "epoch": 2524} {"train_loss": -42.42676544189453, "global_step": 305523, "epoch": 2524} {"train_loss": -43.60006026591151, "global_step": 305524, "epoch": 2524, "val_loss": 2671690.75} {"train_loss": -43.793575286865234, "global_step": 305525, "epoch": 2525} {"train_loss": -42.3213005065918, "global_step": 305526, "epoch": 2525} {"train_loss": -43.233890533447266, "global_step": 305527, "epoch": 2525} {"train_loss": -42.935211181640625, "global_step": 305528, "epoch": 2525} {"train_loss": -41.517826080322266, "global_step": 305529, "epoch": 2525} {"train_loss": -43.68585968017578, "global_step": 305530, "epoch": 2525} {"train_loss": -41.287269592285156, "global_step": 305531, "epoch": 2525} {"train_loss": -43.94834899902344, "global_step": 305532, "epoch": 2525} {"train_loss": -42.32433319091797, "global_step": 305533, "epoch": 2525} {"train_loss": -42.58602523803711, "global_step": 305534, "epoch": 2525} {"train_loss": -43.453487396240234, "global_step": 305535, "epoch": 2525} {"train_loss": -44.1430778503418, "global_step": 305536, "epoch": 2525} {"train_loss": -43.51951599121094, "global_step": 305537, "epoch": 2525} {"train_loss": -43.608985900878906, "global_step": 305538, "epoch": 2525} {"train_loss": -43.30293273925781, "global_step": 305539, "epoch": 2525} {"train_loss": -44.45566940307617, "global_step": 305540, "epoch": 2525} {"train_loss": -43.62881088256836, "global_step": 305541, "epoch": 2525} {"train_loss": -42.82096481323242, "global_step": 305542, "epoch": 2525} {"train_loss": -43.84464645385742, "global_step": 305543, "epoch": 2525} {"train_loss": -43.77296829223633, "global_step": 305544, "epoch": 2525} {"train_loss": -43.90159606933594, "global_step": 305545, "epoch": 2525} {"train_loss": -43.398956298828125, "global_step": 305546, "epoch": 2525} {"train_loss": -43.976226806640625, "global_step": 305547, "epoch": 2525} {"train_loss": -44.20627975463867, "global_step": 305548, "epoch": 2525} {"train_loss": -44.18564224243164, "global_step": 305549, "epoch": 2525} {"train_loss": -44.64715576171875, "global_step": 305550, "epoch": 2525} {"train_loss": -44.31325912475586, "global_step": 305551, "epoch": 2525} {"train_loss": -43.968936920166016, "global_step": 305552, "epoch": 2525} {"train_loss": -44.29454040527344, "global_step": 305553, "epoch": 2525} {"train_loss": -44.3335075378418, "global_step": 305554, "epoch": 2525} {"train_loss": -44.59220886230469, "global_step": 305555, "epoch": 2525} {"train_loss": -44.45939254760742, "global_step": 305556, "epoch": 2525} {"train_loss": -44.393821716308594, "global_step": 305557, "epoch": 2525} {"train_loss": -44.64524459838867, "global_step": 305558, "epoch": 2525} {"train_loss": -44.45263671875, "global_step": 305559, "epoch": 2525} {"train_loss": -44.42194747924805, "global_step": 305560, "epoch": 2525} {"train_loss": -44.50596237182617, "global_step": 305561, "epoch": 2525} {"train_loss": -43.84174728393555, "global_step": 305562, "epoch": 2525} {"train_loss": -44.87839889526367, "global_step": 305563, "epoch": 2525} {"train_loss": -43.62733459472656, "global_step": 305564, "epoch": 2525} {"train_loss": -43.867042541503906, "global_step": 305565, "epoch": 2525} {"train_loss": -44.73370361328125, "global_step": 305566, "epoch": 2525} {"train_loss": -44.14687728881836, "global_step": 305567, "epoch": 2525} {"train_loss": -44.18267822265625, "global_step": 305568, "epoch": 2525} {"train_loss": -43.586769104003906, "global_step": 305569, "epoch": 2525} {"train_loss": -44.67441940307617, "global_step": 305570, "epoch": 2525} {"train_loss": -44.60332107543945, "global_step": 305571, "epoch": 2525} {"train_loss": -44.075016021728516, "global_step": 305572, "epoch": 2525} {"train_loss": -44.09395217895508, "global_step": 305573, "epoch": 2525} {"train_loss": -43.879364013671875, "global_step": 305574, "epoch": 2525} {"train_loss": -43.61286163330078, "global_step": 305575, "epoch": 2525} {"train_loss": -42.483272552490234, "global_step": 305576, "epoch": 2525} {"train_loss": -41.85627365112305, "global_step": 305577, "epoch": 2525} {"train_loss": -44.576026916503906, "global_step": 305578, "epoch": 2525} {"train_loss": -43.50809097290039, "global_step": 305579, "epoch": 2525} {"train_loss": -42.810585021972656, "global_step": 305580, "epoch": 2525} {"train_loss": -44.11267852783203, "global_step": 305581, "epoch": 2525} {"train_loss": -43.87939453125, "global_step": 305582, "epoch": 2525} {"train_loss": -43.130367279052734, "global_step": 305583, "epoch": 2525} {"train_loss": -43.559104919433594, "global_step": 305584, "epoch": 2525} {"train_loss": -44.30908203125, "global_step": 305585, "epoch": 2525} {"train_loss": -44.316993713378906, "global_step": 305586, "epoch": 2525} {"train_loss": -44.0992431640625, "global_step": 305587, "epoch": 2525} {"train_loss": -44.42069625854492, "global_step": 305588, "epoch": 2525} {"train_loss": -44.194313049316406, "global_step": 305589, "epoch": 2525} {"train_loss": -43.44712829589844, "global_step": 305590, "epoch": 2525} {"train_loss": -44.67257308959961, "global_step": 305591, "epoch": 2525} {"train_loss": -43.919960021972656, "global_step": 305592, "epoch": 2525} {"train_loss": -44.454872131347656, "global_step": 305593, "epoch": 2525} {"train_loss": -44.49386215209961, "global_step": 305594, "epoch": 2525} {"train_loss": -43.94636535644531, "global_step": 305595, "epoch": 2525} {"train_loss": -43.46987533569336, "global_step": 305596, "epoch": 2525} {"train_loss": -43.06405258178711, "global_step": 305597, "epoch": 2525} {"train_loss": -44.417152404785156, "global_step": 305598, "epoch": 2525} {"train_loss": -44.25625228881836, "global_step": 305599, "epoch": 2525} {"train_loss": -44.022891998291016, "global_step": 305600, "epoch": 2525} {"train_loss": -44.12467956542969, "global_step": 305601, "epoch": 2525} {"train_loss": -43.589717864990234, "global_step": 305602, "epoch": 2525} {"train_loss": -43.2702751159668, "global_step": 305603, "epoch": 2525} {"train_loss": -42.81077575683594, "global_step": 305604, "epoch": 2525} {"train_loss": -41.43669509887695, "global_step": 305605, "epoch": 2525} {"train_loss": -42.839141845703125, "global_step": 305606, "epoch": 2525} {"train_loss": -43.049068450927734, "global_step": 305607, "epoch": 2525} {"train_loss": -42.42995834350586, "global_step": 305608, "epoch": 2525} {"train_loss": -43.230438232421875, "global_step": 305609, "epoch": 2525} {"train_loss": -43.8770866394043, "global_step": 305610, "epoch": 2525} {"train_loss": -43.992305755615234, "global_step": 305611, "epoch": 2525} {"train_loss": -42.83217239379883, "global_step": 305612, "epoch": 2525} {"train_loss": -42.702728271484375, "global_step": 305613, "epoch": 2525} {"train_loss": -42.702247619628906, "global_step": 305614, "epoch": 2525} {"train_loss": -40.468055725097656, "global_step": 305615, "epoch": 2525} {"train_loss": -44.05826950073242, "global_step": 305616, "epoch": 2525} {"train_loss": -43.049415588378906, "global_step": 305617, "epoch": 2525} {"train_loss": -41.27651596069336, "global_step": 305618, "epoch": 2525} {"train_loss": -40.59103012084961, "global_step": 305619, "epoch": 2525} {"train_loss": -43.42729187011719, "global_step": 305620, "epoch": 2525} {"train_loss": -41.56962203979492, "global_step": 305621, "epoch": 2525} {"train_loss": -40.474308013916016, "global_step": 305622, "epoch": 2525} {"train_loss": -41.67888259887695, "global_step": 305623, "epoch": 2525} {"train_loss": -43.801292419433594, "global_step": 305624, "epoch": 2525} {"train_loss": -42.69210433959961, "global_step": 305625, "epoch": 2525} {"train_loss": -41.86277389526367, "global_step": 305626, "epoch": 2525} {"train_loss": -43.7935791015625, "global_step": 305627, "epoch": 2525} {"train_loss": -43.05489730834961, "global_step": 305628, "epoch": 2525} {"train_loss": -42.78031539916992, "global_step": 305629, "epoch": 2525} {"train_loss": -42.40012741088867, "global_step": 305630, "epoch": 2525} {"train_loss": -43.982635498046875, "global_step": 305631, "epoch": 2525} {"train_loss": -41.4985466003418, "global_step": 305632, "epoch": 2525} {"train_loss": -43.117767333984375, "global_step": 305633, "epoch": 2525} {"train_loss": -43.0302734375, "global_step": 305634, "epoch": 2525} {"train_loss": -42.64946746826172, "global_step": 305635, "epoch": 2525} {"train_loss": -43.75604248046875, "global_step": 305636, "epoch": 2525} {"train_loss": -43.591217041015625, "global_step": 305637, "epoch": 2525} {"train_loss": -43.75856018066406, "global_step": 305638, "epoch": 2525} {"train_loss": -43.97025680541992, "global_step": 305639, "epoch": 2525} {"train_loss": -43.89506530761719, "global_step": 305640, "epoch": 2525} {"train_loss": -44.004127502441406, "global_step": 305641, "epoch": 2525} {"train_loss": -43.25901794433594, "global_step": 305642, "epoch": 2525} {"train_loss": -44.1905403137207, "global_step": 305643, "epoch": 2525} {"train_loss": -44.123268127441406, "global_step": 305644, "epoch": 2525} {"train_loss": -43.48407426944449, "global_step": 305645, "epoch": 2525, "val_loss": 2640147.25} {"train_loss": -44.23948287963867, "global_step": 305646, "epoch": 2526} {"train_loss": -43.836238861083984, "global_step": 305647, "epoch": 2526} {"train_loss": -43.834964752197266, "global_step": 305648, "epoch": 2526} {"train_loss": -43.99778366088867, "global_step": 305649, "epoch": 2526} {"train_loss": -42.99471664428711, "global_step": 305650, "epoch": 2526} {"train_loss": -44.304649353027344, "global_step": 305651, "epoch": 2526} {"train_loss": -43.038387298583984, "global_step": 305652, "epoch": 2526} {"train_loss": -43.14030075073242, "global_step": 305653, "epoch": 2526} {"train_loss": -44.50316619873047, "global_step": 305654, "epoch": 2526} {"train_loss": -43.111019134521484, "global_step": 305655, "epoch": 2526} {"train_loss": -43.710262298583984, "global_step": 305656, "epoch": 2526} {"train_loss": -43.71913528442383, "global_step": 305657, "epoch": 2526} {"train_loss": -43.332183837890625, "global_step": 305658, "epoch": 2526} {"train_loss": -44.3376350402832, "global_step": 305659, "epoch": 2526} {"train_loss": -44.068050384521484, "global_step": 305660, "epoch": 2526} {"train_loss": -44.085933685302734, "global_step": 305661, "epoch": 2526} {"train_loss": -44.79701614379883, "global_step": 305662, "epoch": 2526} {"train_loss": -44.1044807434082, "global_step": 305663, "epoch": 2526} {"train_loss": -44.401756286621094, "global_step": 305664, "epoch": 2526} {"train_loss": -43.710689544677734, "global_step": 305665, "epoch": 2526} {"train_loss": -44.26670455932617, "global_step": 305666, "epoch": 2526} {"train_loss": -44.564754486083984, "global_step": 305667, "epoch": 2526} {"train_loss": -44.17342758178711, "global_step": 305668, "epoch": 2526} {"train_loss": -43.740142822265625, "global_step": 305669, "epoch": 2526} {"train_loss": -44.12006759643555, "global_step": 305670, "epoch": 2526} {"train_loss": -44.4428825378418, "global_step": 305671, "epoch": 2526} {"train_loss": -44.38077926635742, "global_step": 305672, "epoch": 2526} {"train_loss": -44.54204177856445, "global_step": 305673, "epoch": 2526} {"train_loss": -44.32281494140625, "global_step": 305674, "epoch": 2526} {"train_loss": -43.99003601074219, "global_step": 305675, "epoch": 2526} {"train_loss": -44.72553253173828, "global_step": 305676, "epoch": 2526} {"train_loss": -44.1273078918457, "global_step": 305677, "epoch": 2526} {"train_loss": -43.74005126953125, "global_step": 305678, "epoch": 2526} {"train_loss": -42.8391227722168, "global_step": 305679, "epoch": 2526} {"train_loss": -41.37565612792969, "global_step": 305680, "epoch": 2526} {"train_loss": -42.65999984741211, "global_step": 305681, "epoch": 2526} {"train_loss": -44.43180465698242, "global_step": 305682, "epoch": 2526} {"train_loss": -44.40608596801758, "global_step": 305683, "epoch": 2526} {"train_loss": -42.87820816040039, "global_step": 305684, "epoch": 2526} {"train_loss": -42.88182067871094, "global_step": 305685, "epoch": 2526} {"train_loss": -43.74229049682617, "global_step": 305686, "epoch": 2526} {"train_loss": -44.1078987121582, "global_step": 305687, "epoch": 2526} {"train_loss": -43.53418731689453, "global_step": 305688, "epoch": 2526} {"train_loss": -41.58974838256836, "global_step": 305689, "epoch": 2526} {"train_loss": -42.03068923950195, "global_step": 305690, "epoch": 2526} {"train_loss": -42.35877227783203, "global_step": 305691, "epoch": 2526} {"train_loss": -43.98072052001953, "global_step": 305692, "epoch": 2526} {"train_loss": -43.965126037597656, "global_step": 305693, "epoch": 2526} {"train_loss": -43.4417724609375, "global_step": 305694, "epoch": 2526} {"train_loss": -42.91495895385742, "global_step": 305695, "epoch": 2526} {"train_loss": -43.522422790527344, "global_step": 305696, "epoch": 2526} {"train_loss": -43.25895309448242, "global_step": 305697, "epoch": 2526} {"train_loss": -44.010677337646484, "global_step": 305698, "epoch": 2526} {"train_loss": -44.01035690307617, "global_step": 305699, "epoch": 2526} {"train_loss": -43.96474075317383, "global_step": 305700, "epoch": 2526} {"train_loss": -43.3426513671875, "global_step": 305701, "epoch": 2526} {"train_loss": -42.472206115722656, "global_step": 305702, "epoch": 2526} {"train_loss": -43.85198211669922, "global_step": 305703, "epoch": 2526} {"train_loss": -43.55247116088867, "global_step": 305704, "epoch": 2526} {"train_loss": -42.14231491088867, "global_step": 305705, "epoch": 2526} {"train_loss": -42.55515670776367, "global_step": 305706, "epoch": 2526} {"train_loss": -42.138465881347656, "global_step": 305707, "epoch": 2526} {"train_loss": -42.30597686767578, "global_step": 305708, "epoch": 2526} {"train_loss": -44.17900085449219, "global_step": 305709, "epoch": 2526} {"train_loss": -42.44863510131836, "global_step": 305710, "epoch": 2526} {"train_loss": -42.330345153808594, "global_step": 305711, "epoch": 2526} {"train_loss": -43.61078643798828, "global_step": 305712, "epoch": 2526} {"train_loss": -42.01514434814453, "global_step": 305713, "epoch": 2526} {"train_loss": -43.877288818359375, "global_step": 305714, "epoch": 2526} {"train_loss": -43.02641677856445, "global_step": 305715, "epoch": 2526} {"train_loss": -42.83340072631836, "global_step": 305716, "epoch": 2526} {"train_loss": -43.33013916015625, "global_step": 305717, "epoch": 2526} {"train_loss": -42.9117546081543, "global_step": 305718, "epoch": 2526} {"train_loss": -43.392486572265625, "global_step": 305719, "epoch": 2526} {"train_loss": -42.89780807495117, "global_step": 305720, "epoch": 2526} {"train_loss": -43.409576416015625, "global_step": 305721, "epoch": 2526} {"train_loss": -43.32502746582031, "global_step": 305722, "epoch": 2526} {"train_loss": -43.72103500366211, "global_step": 305723, "epoch": 2526} {"train_loss": -43.914215087890625, "global_step": 305724, "epoch": 2526} {"train_loss": -43.591651916503906, "global_step": 305725, "epoch": 2526} {"train_loss": -43.370784759521484, "global_step": 305726, "epoch": 2526} {"train_loss": -43.23933792114258, "global_step": 305727, "epoch": 2526} {"train_loss": -42.651432037353516, "global_step": 305728, "epoch": 2526} {"train_loss": -43.69865036010742, "global_step": 305729, "epoch": 2526} {"train_loss": -43.4880485534668, "global_step": 305730, "epoch": 2526} {"train_loss": -42.05046844482422, "global_step": 305731, "epoch": 2526} {"train_loss": -43.64805221557617, "global_step": 305732, "epoch": 2526} {"train_loss": -42.826568603515625, "global_step": 305733, "epoch": 2526} {"train_loss": -42.61552047729492, "global_step": 305734, "epoch": 2526} {"train_loss": -44.1482048034668, "global_step": 305735, "epoch": 2526} {"train_loss": -42.46223831176758, "global_step": 305736, "epoch": 2526} {"train_loss": -43.67681121826172, "global_step": 305737, "epoch": 2526} {"train_loss": -43.910888671875, "global_step": 305738, "epoch": 2526} {"train_loss": -43.04909896850586, "global_step": 305739, "epoch": 2526} {"train_loss": -44.13664245605469, "global_step": 305740, "epoch": 2526} {"train_loss": -43.21836471557617, "global_step": 305741, "epoch": 2526} {"train_loss": -44.04731750488281, "global_step": 305742, "epoch": 2526} {"train_loss": -43.9672737121582, "global_step": 305743, "epoch": 2526} {"train_loss": -43.712459564208984, "global_step": 305744, "epoch": 2526} {"train_loss": -43.96310043334961, "global_step": 305745, "epoch": 2526} {"train_loss": -43.965023040771484, "global_step": 305746, "epoch": 2526} {"train_loss": -44.038719177246094, "global_step": 305747, "epoch": 2526} {"train_loss": -43.662601470947266, "global_step": 305748, "epoch": 2526} {"train_loss": -44.237483978271484, "global_step": 305749, "epoch": 2526} {"train_loss": -43.713436126708984, "global_step": 305750, "epoch": 2526} {"train_loss": -43.187904357910156, "global_step": 305751, "epoch": 2526} {"train_loss": -44.25053787231445, "global_step": 305752, "epoch": 2526} {"train_loss": -43.96760177612305, "global_step": 305753, "epoch": 2526} {"train_loss": -44.31034851074219, "global_step": 305754, "epoch": 2526} {"train_loss": -44.07598876953125, "global_step": 305755, "epoch": 2526} {"train_loss": -44.47560501098633, "global_step": 305756, "epoch": 2526} {"train_loss": -43.79401397705078, "global_step": 305757, "epoch": 2526} {"train_loss": -43.94746017456055, "global_step": 305758, "epoch": 2526} {"train_loss": -43.85837936401367, "global_step": 305759, "epoch": 2526} {"train_loss": -44.69072723388672, "global_step": 305760, "epoch": 2526} {"train_loss": -44.7094841003418, "global_step": 305761, "epoch": 2526} {"train_loss": -44.160369873046875, "global_step": 305762, "epoch": 2526} {"train_loss": -44.57014465332031, "global_step": 305763, "epoch": 2526} {"train_loss": -44.371395111083984, "global_step": 305764, "epoch": 2526} {"train_loss": -44.37752151489258, "global_step": 305765, "epoch": 2526} {"train_loss": -43.60430151568956, "global_step": 305766, "epoch": 2526, "val_loss": 2589757.0} {"train_loss": -44.50228500366211, "global_step": 305767, "epoch": 2527} {"train_loss": -44.14036560058594, "global_step": 305768, "epoch": 2527} {"train_loss": -44.330440521240234, "global_step": 305769, "epoch": 2527} {"train_loss": -44.528045654296875, "global_step": 305770, "epoch": 2527} {"train_loss": -44.048641204833984, "global_step": 305771, "epoch": 2527} {"train_loss": -43.30916976928711, "global_step": 305772, "epoch": 2527} {"train_loss": -44.37744903564453, "global_step": 305773, "epoch": 2527} {"train_loss": -44.06843185424805, "global_step": 305774, "epoch": 2527} {"train_loss": -43.69771957397461, "global_step": 305775, "epoch": 2527} {"train_loss": -44.60383224487305, "global_step": 305776, "epoch": 2527} {"train_loss": -44.49105453491211, "global_step": 305777, "epoch": 2527} {"train_loss": -44.29765319824219, "global_step": 305778, "epoch": 2527} {"train_loss": -44.62987518310547, "global_step": 305779, "epoch": 2527} {"train_loss": -44.00540542602539, "global_step": 305780, "epoch": 2527} {"train_loss": -44.09285354614258, "global_step": 305781, "epoch": 2527} {"train_loss": -44.32271957397461, "global_step": 305782, "epoch": 2527} {"train_loss": -44.15686798095703, "global_step": 305783, "epoch": 2527} {"train_loss": -43.81119918823242, "global_step": 305784, "epoch": 2527} {"train_loss": -44.48221969604492, "global_step": 305785, "epoch": 2527} {"train_loss": -43.50056076049805, "global_step": 305786, "epoch": 2527} {"train_loss": -43.75757598876953, "global_step": 305787, "epoch": 2527} {"train_loss": -44.18697738647461, "global_step": 305788, "epoch": 2527} {"train_loss": -43.628570556640625, "global_step": 305789, "epoch": 2527} {"train_loss": -43.192481994628906, "global_step": 305790, "epoch": 2527} {"train_loss": -44.32658386230469, "global_step": 305791, "epoch": 2527} {"train_loss": -44.01613235473633, "global_step": 305792, "epoch": 2527} {"train_loss": -43.22747802734375, "global_step": 305793, "epoch": 2527} {"train_loss": -43.489540100097656, "global_step": 305794, "epoch": 2527} {"train_loss": -43.70978927612305, "global_step": 305795, "epoch": 2527} {"train_loss": -43.41070556640625, "global_step": 305796, "epoch": 2527} {"train_loss": -42.10616683959961, "global_step": 305797, "epoch": 2527} {"train_loss": -42.766212463378906, "global_step": 305798, "epoch": 2527} {"train_loss": -43.9000358581543, "global_step": 305799, "epoch": 2527} {"train_loss": -43.769874572753906, "global_step": 305800, "epoch": 2527} {"train_loss": -43.187007904052734, "global_step": 305801, "epoch": 2527} {"train_loss": -43.446285247802734, "global_step": 305802, "epoch": 2527} {"train_loss": -43.28958511352539, "global_step": 305803, "epoch": 2527} {"train_loss": -42.66574478149414, "global_step": 305804, "epoch": 2527} {"train_loss": -43.37389373779297, "global_step": 305805, "epoch": 2527} {"train_loss": -43.62638473510742, "global_step": 305806, "epoch": 2527} {"train_loss": -43.83869934082031, "global_step": 305807, "epoch": 2527} {"train_loss": -43.41025161743164, "global_step": 305808, "epoch": 2527} {"train_loss": -43.31262969970703, "global_step": 305809, "epoch": 2527} {"train_loss": -43.201171875, "global_step": 305810, "epoch": 2527} {"train_loss": -43.57150650024414, "global_step": 305811, "epoch": 2527} {"train_loss": -44.15871810913086, "global_step": 305812, "epoch": 2527} {"train_loss": -43.40684127807617, "global_step": 305813, "epoch": 2527} {"train_loss": -41.8828010559082, "global_step": 305814, "epoch": 2527} {"train_loss": -43.882484436035156, "global_step": 305815, "epoch": 2527} {"train_loss": -42.747901916503906, "global_step": 305816, "epoch": 2527} {"train_loss": -42.63523483276367, "global_step": 305817, "epoch": 2527} {"train_loss": -43.88967514038086, "global_step": 305818, "epoch": 2527} {"train_loss": -43.859527587890625, "global_step": 305819, "epoch": 2527} {"train_loss": -42.99001693725586, "global_step": 305820, "epoch": 2527} {"train_loss": -41.74513626098633, "global_step": 305821, "epoch": 2527} {"train_loss": -42.617061614990234, "global_step": 305822, "epoch": 2527} {"train_loss": -43.75885772705078, "global_step": 305823, "epoch": 2527} {"train_loss": -42.97943115234375, "global_step": 305824, "epoch": 2527} {"train_loss": -42.46088409423828, "global_step": 305825, "epoch": 2527} {"train_loss": -41.551902770996094, "global_step": 305826, "epoch": 2527} {"train_loss": -43.3473014831543, "global_step": 305827, "epoch": 2527} {"train_loss": -42.98148727416992, "global_step": 305828, "epoch": 2527} {"train_loss": -41.74360656738281, "global_step": 305829, "epoch": 2527} {"train_loss": -43.53517150878906, "global_step": 305830, "epoch": 2527} {"train_loss": -42.41359329223633, "global_step": 305831, "epoch": 2527} {"train_loss": -41.02360916137695, "global_step": 305832, "epoch": 2527} {"train_loss": -42.669532775878906, "global_step": 305833, "epoch": 2527} {"train_loss": -40.152748107910156, "global_step": 305834, "epoch": 2527} {"train_loss": -42.13741683959961, "global_step": 305835, "epoch": 2527} {"train_loss": -40.25394058227539, "global_step": 305836, "epoch": 2527} {"train_loss": -42.581966400146484, "global_step": 305837, "epoch": 2527} {"train_loss": -41.11420440673828, "global_step": 305838, "epoch": 2527} {"train_loss": -42.80134201049805, "global_step": 305839, "epoch": 2527} {"train_loss": -41.4377326965332, "global_step": 305840, "epoch": 2527} {"train_loss": -42.75350570678711, "global_step": 305841, "epoch": 2527} {"train_loss": -41.64331817626953, "global_step": 305842, "epoch": 2527} {"train_loss": -43.27267074584961, "global_step": 305843, "epoch": 2527} {"train_loss": -40.617061614990234, "global_step": 305844, "epoch": 2527} {"train_loss": -42.96116256713867, "global_step": 305845, "epoch": 2527} {"train_loss": -41.00487518310547, "global_step": 305846, "epoch": 2527} {"train_loss": -43.01986312866211, "global_step": 305847, "epoch": 2527} {"train_loss": -41.80937957763672, "global_step": 305848, "epoch": 2527} {"train_loss": -44.270442962646484, "global_step": 305849, "epoch": 2527} {"train_loss": -42.18015670776367, "global_step": 305850, "epoch": 2527} {"train_loss": -42.80234146118164, "global_step": 305851, "epoch": 2527} {"train_loss": -42.05451202392578, "global_step": 305852, "epoch": 2527} {"train_loss": -43.50735092163086, "global_step": 305853, "epoch": 2527} {"train_loss": -42.26356887817383, "global_step": 305854, "epoch": 2527} {"train_loss": -42.822235107421875, "global_step": 305855, "epoch": 2527} {"train_loss": -42.47105026245117, "global_step": 305856, "epoch": 2527} {"train_loss": -42.218509674072266, "global_step": 305857, "epoch": 2527} {"train_loss": -42.02137756347656, "global_step": 305858, "epoch": 2527} {"train_loss": -43.211212158203125, "global_step": 305859, "epoch": 2527} {"train_loss": -41.663822174072266, "global_step": 305860, "epoch": 2527} {"train_loss": -43.48126983642578, "global_step": 305861, "epoch": 2527} {"train_loss": -42.617645263671875, "global_step": 305862, "epoch": 2527} {"train_loss": -41.312442779541016, "global_step": 305863, "epoch": 2527} {"train_loss": -43.465213775634766, "global_step": 305864, "epoch": 2527} {"train_loss": -42.65459060668945, "global_step": 305865, "epoch": 2527} {"train_loss": -43.534358978271484, "global_step": 305866, "epoch": 2527} {"train_loss": -43.58205032348633, "global_step": 305867, "epoch": 2527} {"train_loss": -42.94157791137695, "global_step": 305868, "epoch": 2527} {"train_loss": -43.22357177734375, "global_step": 305869, "epoch": 2527} {"train_loss": -43.349910736083984, "global_step": 305870, "epoch": 2527} {"train_loss": -43.881351470947266, "global_step": 305871, "epoch": 2527} {"train_loss": -43.31617736816406, "global_step": 305872, "epoch": 2527} {"train_loss": -42.9819221496582, "global_step": 305873, "epoch": 2527} {"train_loss": -42.81391143798828, "global_step": 305874, "epoch": 2527} {"train_loss": -43.831233978271484, "global_step": 305875, "epoch": 2527} {"train_loss": -43.403900146484375, "global_step": 305876, "epoch": 2527} {"train_loss": -43.6452751159668, "global_step": 305877, "epoch": 2527} {"train_loss": -43.44071578979492, "global_step": 305878, "epoch": 2527} {"train_loss": -43.78080368041992, "global_step": 305879, "epoch": 2527} {"train_loss": -43.4215202331543, "global_step": 305880, "epoch": 2527} {"train_loss": -42.66425704956055, "global_step": 305881, "epoch": 2527} {"train_loss": -43.308712005615234, "global_step": 305882, "epoch": 2527} {"train_loss": -43.4750862121582, "global_step": 305883, "epoch": 2527} {"train_loss": -43.50425338745117, "global_step": 305884, "epoch": 2527} {"train_loss": -43.59504318237305, "global_step": 305885, "epoch": 2527} {"train_loss": -43.598995208740234, "global_step": 305886, "epoch": 2527} {"train_loss": -43.1348283310567, "global_step": 305887, "epoch": 2527, "val_loss": 2629720.0} {"train_loss": -43.38373565673828, "global_step": 305888, "epoch": 2528} {"train_loss": -43.67190170288086, "global_step": 305889, "epoch": 2528} {"train_loss": -43.02810287475586, "global_step": 305890, "epoch": 2528} {"train_loss": -43.332881927490234, "global_step": 305891, "epoch": 2528} {"train_loss": -43.98521041870117, "global_step": 305892, "epoch": 2528} {"train_loss": -44.11723709106445, "global_step": 305893, "epoch": 2528} {"train_loss": -44.130653381347656, "global_step": 305894, "epoch": 2528} {"train_loss": -44.05605697631836, "global_step": 305895, "epoch": 2528} {"train_loss": -43.91410446166992, "global_step": 305896, "epoch": 2528} {"train_loss": -42.662960052490234, "global_step": 305897, "epoch": 2528} {"train_loss": -44.72589874267578, "global_step": 305898, "epoch": 2528} {"train_loss": -43.274322509765625, "global_step": 305899, "epoch": 2528} {"train_loss": -43.334754943847656, "global_step": 305900, "epoch": 2528} {"train_loss": -43.810543060302734, "global_step": 305901, "epoch": 2528} {"train_loss": -43.59640121459961, "global_step": 305902, "epoch": 2528} {"train_loss": -43.23455810546875, "global_step": 305903, "epoch": 2528} {"train_loss": -43.89529800415039, "global_step": 305904, "epoch": 2528} {"train_loss": -43.38471984863281, "global_step": 305905, "epoch": 2528} {"train_loss": -42.78396224975586, "global_step": 305906, "epoch": 2528} {"train_loss": -44.59088897705078, "global_step": 305907, "epoch": 2528} {"train_loss": -43.75665283203125, "global_step": 305908, "epoch": 2528} {"train_loss": -43.8890495300293, "global_step": 305909, "epoch": 2528} {"train_loss": -44.01528549194336, "global_step": 305910, "epoch": 2528} {"train_loss": -43.8065299987793, "global_step": 305911, "epoch": 2528} {"train_loss": -44.66607666015625, "global_step": 305912, "epoch": 2528} {"train_loss": -43.894798278808594, "global_step": 305913, "epoch": 2528} {"train_loss": -44.3353271484375, "global_step": 305914, "epoch": 2528} {"train_loss": -44.344398498535156, "global_step": 305915, "epoch": 2528} {"train_loss": -44.732181549072266, "global_step": 305916, "epoch": 2528} {"train_loss": -44.246273040771484, "global_step": 305917, "epoch": 2528} {"train_loss": -44.27866744995117, "global_step": 305918, "epoch": 2528} {"train_loss": -44.57625961303711, "global_step": 305919, "epoch": 2528} {"train_loss": -44.50302505493164, "global_step": 305920, "epoch": 2528} {"train_loss": -44.5691032409668, "global_step": 305921, "epoch": 2528} {"train_loss": -44.07868194580078, "global_step": 305922, "epoch": 2528} {"train_loss": -44.68338394165039, "global_step": 305923, "epoch": 2528} {"train_loss": -44.468505859375, "global_step": 305924, "epoch": 2528} {"train_loss": -43.93843460083008, "global_step": 305925, "epoch": 2528} {"train_loss": -44.153682708740234, "global_step": 305926, "epoch": 2528} {"train_loss": -44.50383377075195, "global_step": 305927, "epoch": 2528} {"train_loss": -44.779510498046875, "global_step": 305928, "epoch": 2528} {"train_loss": -44.50935745239258, "global_step": 305929, "epoch": 2528} {"train_loss": -43.872581481933594, "global_step": 305930, "epoch": 2528} {"train_loss": -44.540706634521484, "global_step": 305931, "epoch": 2528} {"train_loss": -44.75754928588867, "global_step": 305932, "epoch": 2528} {"train_loss": -43.87986755371094, "global_step": 305933, "epoch": 2528} {"train_loss": -44.137054443359375, "global_step": 305934, "epoch": 2528} {"train_loss": -44.93559646606445, "global_step": 305935, "epoch": 2528} {"train_loss": -43.765724182128906, "global_step": 305936, "epoch": 2528} {"train_loss": -43.49699020385742, "global_step": 305937, "epoch": 2528} {"train_loss": -43.846736907958984, "global_step": 305938, "epoch": 2528} {"train_loss": -43.64027786254883, "global_step": 305939, "epoch": 2528} {"train_loss": -44.346229553222656, "global_step": 305940, "epoch": 2528} {"train_loss": -44.53416061401367, "global_step": 305941, "epoch": 2528} {"train_loss": -45.04179763793945, "global_step": 305942, "epoch": 2528} {"train_loss": -44.50382614135742, "global_step": 305943, "epoch": 2528} {"train_loss": -44.161720275878906, "global_step": 305944, "epoch": 2528} {"train_loss": -44.473236083984375, "global_step": 305945, "epoch": 2528} {"train_loss": -44.58925247192383, "global_step": 305946, "epoch": 2528} {"train_loss": -45.144989013671875, "global_step": 305947, "epoch": 2528} {"train_loss": -44.46647262573242, "global_step": 305948, "epoch": 2528} {"train_loss": -44.471675872802734, "global_step": 305949, "epoch": 2528} {"train_loss": -43.871578216552734, "global_step": 305950, "epoch": 2528} {"train_loss": -44.07306671142578, "global_step": 305951, "epoch": 2528} {"train_loss": -44.49177932739258, "global_step": 305952, "epoch": 2528} {"train_loss": -43.52576446533203, "global_step": 305953, "epoch": 2528} {"train_loss": -44.21295166015625, "global_step": 305954, "epoch": 2528} {"train_loss": -44.33477783203125, "global_step": 305955, "epoch": 2528} {"train_loss": -43.952632904052734, "global_step": 305956, "epoch": 2528} {"train_loss": -42.1634407043457, "global_step": 305957, "epoch": 2528} {"train_loss": -41.27743911743164, "global_step": 305958, "epoch": 2528} {"train_loss": -43.037696838378906, "global_step": 305959, "epoch": 2528} {"train_loss": -40.3349494934082, "global_step": 305960, "epoch": 2528} {"train_loss": -40.64246368408203, "global_step": 305961, "epoch": 2528} {"train_loss": -42.20295715332031, "global_step": 305962, "epoch": 2528} {"train_loss": -39.48292922973633, "global_step": 305963, "epoch": 2528} {"train_loss": -40.991668701171875, "global_step": 305964, "epoch": 2528} {"train_loss": -40.35866928100586, "global_step": 305965, "epoch": 2528} {"train_loss": -42.13983154296875, "global_step": 305966, "epoch": 2528} {"train_loss": -37.60432815551758, "global_step": 305967, "epoch": 2528} {"train_loss": -36.1134147644043, "global_step": 305968, "epoch": 2528} {"train_loss": -35.66504669189453, "global_step": 305969, "epoch": 2528} {"train_loss": -37.864070892333984, "global_step": 305970, "epoch": 2528} {"train_loss": -35.25339889526367, "global_step": 305971, "epoch": 2528} {"train_loss": -35.97249221801758, "global_step": 305972, "epoch": 2528} {"train_loss": -37.52521514892578, "global_step": 305973, "epoch": 2528} {"train_loss": -36.401405334472656, "global_step": 305974, "epoch": 2528} {"train_loss": -35.48181915283203, "global_step": 305975, "epoch": 2528} {"train_loss": -38.53805160522461, "global_step": 305976, "epoch": 2528} {"train_loss": -35.01059341430664, "global_step": 305977, "epoch": 2528} {"train_loss": -38.70162582397461, "global_step": 305978, "epoch": 2528} {"train_loss": -33.23073959350586, "global_step": 305979, "epoch": 2528} {"train_loss": -40.22324752807617, "global_step": 305980, "epoch": 2528} {"train_loss": -37.692684173583984, "global_step": 305981, "epoch": 2528} {"train_loss": -38.78062438964844, "global_step": 305982, "epoch": 2528} {"train_loss": -41.037940979003906, "global_step": 305983, "epoch": 2528} {"train_loss": -38.81061935424805, "global_step": 305984, "epoch": 2528} {"train_loss": -39.497528076171875, "global_step": 305985, "epoch": 2528} {"train_loss": -41.561031341552734, "global_step": 305986, "epoch": 2528} {"train_loss": -38.607704162597656, "global_step": 305987, "epoch": 2528} {"train_loss": -40.49577713012695, "global_step": 305988, "epoch": 2528} {"train_loss": -41.95497512817383, "global_step": 305989, "epoch": 2528} {"train_loss": -39.675228118896484, "global_step": 305990, "epoch": 2528} {"train_loss": -38.44607162475586, "global_step": 305991, "epoch": 2528} {"train_loss": -42.33420944213867, "global_step": 305992, "epoch": 2528} {"train_loss": -40.68691635131836, "global_step": 305993, "epoch": 2528} {"train_loss": -40.969356536865234, "global_step": 305994, "epoch": 2528} {"train_loss": -39.7442741394043, "global_step": 305995, "epoch": 2528} {"train_loss": -43.18960189819336, "global_step": 305996, "epoch": 2528} {"train_loss": -41.43223190307617, "global_step": 305997, "epoch": 2528} {"train_loss": -40.43406295776367, "global_step": 305998, "epoch": 2528} {"train_loss": -41.940853118896484, "global_step": 305999, "epoch": 2528} {"train_loss": -43.1019401550293, "global_step": 306000, "epoch": 2528} {"train_loss": -41.86220932006836, "global_step": 306001, "epoch": 2528} {"train_loss": -41.64321517944336, "global_step": 306002, "epoch": 2528} {"train_loss": -41.71249008178711, "global_step": 306003, "epoch": 2528} {"train_loss": -43.3950309753418, "global_step": 306004, "epoch": 2528} {"train_loss": -41.95569610595703, "global_step": 306005, "epoch": 2528} {"train_loss": -42.05247116088867, "global_step": 306006, "epoch": 2528} {"train_loss": -42.75809860229492, "global_step": 306007, "epoch": 2528} {"train_loss": -42.299138723326124, "global_step": 306008, "epoch": 2528, "val_loss": 2642824.0} {"train_loss": -43.274635314941406, "global_step": 306009, "epoch": 2529} {"train_loss": -43.16370391845703, "global_step": 306010, "epoch": 2529} {"train_loss": -43.21645736694336, "global_step": 306011, "epoch": 2529} {"train_loss": -43.21668243408203, "global_step": 306012, "epoch": 2529} {"train_loss": -43.88201904296875, "global_step": 306013, "epoch": 2529} {"train_loss": -43.44584655761719, "global_step": 306014, "epoch": 2529} {"train_loss": -43.78992462158203, "global_step": 306015, "epoch": 2529} {"train_loss": -43.357635498046875, "global_step": 306016, "epoch": 2529} {"train_loss": -43.804046630859375, "global_step": 306017, "epoch": 2529} {"train_loss": -44.15559768676758, "global_step": 306018, "epoch": 2529} {"train_loss": -43.71427536010742, "global_step": 306019, "epoch": 2529} {"train_loss": -43.70577621459961, "global_step": 306020, "epoch": 2529} {"train_loss": -43.97085189819336, "global_step": 306021, "epoch": 2529} {"train_loss": -44.08501434326172, "global_step": 306022, "epoch": 2529} {"train_loss": -44.382991790771484, "global_step": 306023, "epoch": 2529} {"train_loss": -44.2685661315918, "global_step": 306024, "epoch": 2529} {"train_loss": -44.09450912475586, "global_step": 306025, "epoch": 2529} {"train_loss": -44.37955856323242, "global_step": 306026, "epoch": 2529} {"train_loss": -44.63080978393555, "global_step": 306027, "epoch": 2529} {"train_loss": -44.393348693847656, "global_step": 306028, "epoch": 2529} {"train_loss": -44.25995635986328, "global_step": 306029, "epoch": 2529} {"train_loss": -44.29572677612305, "global_step": 306030, "epoch": 2529} {"train_loss": -44.41145706176758, "global_step": 306031, "epoch": 2529} {"train_loss": -44.7490234375, "global_step": 306032, "epoch": 2529} {"train_loss": -44.7963752746582, "global_step": 306033, "epoch": 2529} {"train_loss": -44.25149917602539, "global_step": 306034, "epoch": 2529} {"train_loss": -44.54542922973633, "global_step": 306035, "epoch": 2529} {"train_loss": -44.85206985473633, "global_step": 306036, "epoch": 2529} {"train_loss": -44.43225860595703, "global_step": 306037, "epoch": 2529} {"train_loss": -44.95188903808594, "global_step": 306038, "epoch": 2529} {"train_loss": -44.60488510131836, "global_step": 306039, "epoch": 2529} {"train_loss": -44.3721923828125, "global_step": 306040, "epoch": 2529} {"train_loss": -44.9088020324707, "global_step": 306041, "epoch": 2529} {"train_loss": -44.84901809692383, "global_step": 306042, "epoch": 2529} {"train_loss": -45.0444450378418, "global_step": 306043, "epoch": 2529} {"train_loss": -44.888206481933594, "global_step": 306044, "epoch": 2529} {"train_loss": -44.98204040527344, "global_step": 306045, "epoch": 2529} {"train_loss": -44.76166915893555, "global_step": 306046, "epoch": 2529} {"train_loss": -45.089866638183594, "global_step": 306047, "epoch": 2529} {"train_loss": -44.579437255859375, "global_step": 306048, "epoch": 2529} {"train_loss": -45.23324203491211, "global_step": 306049, "epoch": 2529} {"train_loss": -45.24324035644531, "global_step": 306050, "epoch": 2529} {"train_loss": -44.97882080078125, "global_step": 306051, "epoch": 2529} {"train_loss": -44.94950866699219, "global_step": 306052, "epoch": 2529} {"train_loss": -45.04580307006836, "global_step": 306053, "epoch": 2529} {"train_loss": -44.93448257446289, "global_step": 306054, "epoch": 2529} {"train_loss": -45.17261505126953, "global_step": 306055, "epoch": 2529} {"train_loss": -45.035369873046875, "global_step": 306056, "epoch": 2529} {"train_loss": -45.40926742553711, "global_step": 306057, "epoch": 2529} {"train_loss": -45.14122772216797, "global_step": 306058, "epoch": 2529} {"train_loss": -45.540252685546875, "global_step": 306059, "epoch": 2529} {"train_loss": -45.44413375854492, "global_step": 306060, "epoch": 2529} {"train_loss": -45.26450729370117, "global_step": 306061, "epoch": 2529} {"train_loss": -45.39246368408203, "global_step": 306062, "epoch": 2529} {"train_loss": -45.26003646850586, "global_step": 306063, "epoch": 2529} {"train_loss": -45.43424606323242, "global_step": 306064, "epoch": 2529} {"train_loss": -45.4437255859375, "global_step": 306065, "epoch": 2529} {"train_loss": -44.7872428894043, "global_step": 306066, "epoch": 2529} {"train_loss": -44.66157913208008, "global_step": 306067, "epoch": 2529} {"train_loss": -45.02106857299805, "global_step": 306068, "epoch": 2529} {"train_loss": -45.0274772644043, "global_step": 306069, "epoch": 2529} {"train_loss": -45.210235595703125, "global_step": 306070, "epoch": 2529} {"train_loss": -45.33773422241211, "global_step": 306071, "epoch": 2529} {"train_loss": -45.663414001464844, "global_step": 306072, "epoch": 2529} {"train_loss": -45.34568405151367, "global_step": 306073, "epoch": 2529} {"train_loss": -44.96978759765625, "global_step": 306074, "epoch": 2529} {"train_loss": -44.01710510253906, "global_step": 306075, "epoch": 2529} {"train_loss": -40.63758087158203, "global_step": 306076, "epoch": 2529} {"train_loss": -36.560489654541016, "global_step": 306077, "epoch": 2529} {"train_loss": -27.567920684814453, "global_step": 306078, "epoch": 2529} {"train_loss": -39.5374870300293, "global_step": 306079, "epoch": 2529} {"train_loss": -35.43949508666992, "global_step": 306080, "epoch": 2529} {"train_loss": -26.123321533203125, "global_step": 306081, "epoch": 2529} {"train_loss": -37.07045364379883, "global_step": 306082, "epoch": 2529} {"train_loss": -31.677600860595703, "global_step": 306083, "epoch": 2529} {"train_loss": -32.60666275024414, "global_step": 306084, "epoch": 2529} {"train_loss": -36.637489318847656, "global_step": 306085, "epoch": 2529} {"train_loss": -37.597076416015625, "global_step": 306086, "epoch": 2529} {"train_loss": -37.54984664916992, "global_step": 306087, "epoch": 2529} {"train_loss": -37.015052795410156, "global_step": 306088, "epoch": 2529} {"train_loss": -37.95412063598633, "global_step": 306089, "epoch": 2529} {"train_loss": -37.64628219604492, "global_step": 306090, "epoch": 2529} {"train_loss": -37.623382568359375, "global_step": 306091, "epoch": 2529} {"train_loss": -37.619606018066406, "global_step": 306092, "epoch": 2529} {"train_loss": -37.133907318115234, "global_step": 306093, "epoch": 2529} {"train_loss": -39.36565017700195, "global_step": 306094, "epoch": 2529} {"train_loss": -37.96736526489258, "global_step": 306095, "epoch": 2529} {"train_loss": -39.04128646850586, "global_step": 306096, "epoch": 2529} {"train_loss": -39.783782958984375, "global_step": 306097, "epoch": 2529} {"train_loss": -38.439056396484375, "global_step": 306098, "epoch": 2529} {"train_loss": -38.98008728027344, "global_step": 306099, "epoch": 2529} {"train_loss": -38.22333526611328, "global_step": 306100, "epoch": 2529} {"train_loss": -40.138397216796875, "global_step": 306101, "epoch": 2529} {"train_loss": -38.84633255004883, "global_step": 306102, "epoch": 2529} {"train_loss": -38.952880859375, "global_step": 306103, "epoch": 2529} {"train_loss": -39.35721206665039, "global_step": 306104, "epoch": 2529} {"train_loss": -38.780433654785156, "global_step": 306105, "epoch": 2529} {"train_loss": -40.04121398925781, "global_step": 306106, "epoch": 2529} {"train_loss": -39.23073196411133, "global_step": 306107, "epoch": 2529} {"train_loss": -40.73552322387695, "global_step": 306108, "epoch": 2529} {"train_loss": -39.437252044677734, "global_step": 306109, "epoch": 2529} {"train_loss": -40.51506423950195, "global_step": 306110, "epoch": 2529} {"train_loss": -40.01247024536133, "global_step": 306111, "epoch": 2529} {"train_loss": -39.474853515625, "global_step": 306112, "epoch": 2529} {"train_loss": -40.55048751831055, "global_step": 306113, "epoch": 2529} {"train_loss": -40.272010803222656, "global_step": 306114, "epoch": 2529} {"train_loss": -40.647369384765625, "global_step": 306115, "epoch": 2529} {"train_loss": -39.67006301879883, "global_step": 306116, "epoch": 2529} {"train_loss": -39.74565124511719, "global_step": 306117, "epoch": 2529} {"train_loss": -40.59762191772461, "global_step": 306118, "epoch": 2529} {"train_loss": -40.97670364379883, "global_step": 306119, "epoch": 2529} {"train_loss": -41.122554779052734, "global_step": 306120, "epoch": 2529} {"train_loss": -40.494911193847656, "global_step": 306121, "epoch": 2529} {"train_loss": -40.61252975463867, "global_step": 306122, "epoch": 2529} {"train_loss": -41.194786071777344, "global_step": 306123, "epoch": 2529} {"train_loss": -41.03570556640625, "global_step": 306124, "epoch": 2529} {"train_loss": -41.53839874267578, "global_step": 306125, "epoch": 2529} {"train_loss": -41.65459060668945, "global_step": 306126, "epoch": 2529} {"train_loss": -41.316871643066406, "global_step": 306127, "epoch": 2529} {"train_loss": -41.618587493896484, "global_step": 306128, "epoch": 2529} {"train_loss": -41.94938426372433, "global_step": 306129, "epoch": 2529, "val_loss": 2622675.0} {"train_loss": -41.905025482177734, "global_step": 306130, "epoch": 2530} {"train_loss": -41.502769470214844, "global_step": 306131, "epoch": 2530} {"train_loss": -42.36243438720703, "global_step": 306132, "epoch": 2530} {"train_loss": -42.11431121826172, "global_step": 306133, "epoch": 2530} {"train_loss": -42.617431640625, "global_step": 306134, "epoch": 2530} {"train_loss": -42.32069778442383, "global_step": 306135, "epoch": 2530} {"train_loss": -42.3896484375, "global_step": 306136, "epoch": 2530} {"train_loss": -42.486846923828125, "global_step": 306137, "epoch": 2530} {"train_loss": -42.107669830322266, "global_step": 306138, "epoch": 2530} {"train_loss": -42.49300765991211, "global_step": 306139, "epoch": 2530} {"train_loss": -42.559364318847656, "global_step": 306140, "epoch": 2530} {"train_loss": -42.8531494140625, "global_step": 306141, "epoch": 2530} {"train_loss": -43.024993896484375, "global_step": 306142, "epoch": 2530} {"train_loss": -42.240509033203125, "global_step": 306143, "epoch": 2530} {"train_loss": -42.96590805053711, "global_step": 306144, "epoch": 2530} {"train_loss": -43.024757385253906, "global_step": 306145, "epoch": 2530} {"train_loss": -43.137657165527344, "global_step": 306146, "epoch": 2530} {"train_loss": -42.6573600769043, "global_step": 306147, "epoch": 2530} {"train_loss": -42.93547821044922, "global_step": 306148, "epoch": 2530} {"train_loss": -43.316898345947266, "global_step": 306149, "epoch": 2530} {"train_loss": -43.054683685302734, "global_step": 306150, "epoch": 2530} {"train_loss": -43.0706672668457, "global_step": 306151, "epoch": 2530} {"train_loss": -43.35456466674805, "global_step": 306152, "epoch": 2530} {"train_loss": -43.52674102783203, "global_step": 306153, "epoch": 2530} {"train_loss": -43.25773620605469, "global_step": 306154, "epoch": 2530} {"train_loss": -43.83891677856445, "global_step": 306155, "epoch": 2530} {"train_loss": -43.959144592285156, "global_step": 306156, "epoch": 2530} {"train_loss": -43.59463119506836, "global_step": 306157, "epoch": 2530} {"train_loss": -43.77766799926758, "global_step": 306158, "epoch": 2530} {"train_loss": -44.293052673339844, "global_step": 306159, "epoch": 2530} {"train_loss": -44.30628967285156, "global_step": 306160, "epoch": 2530} {"train_loss": -44.39764404296875, "global_step": 306161, "epoch": 2530} {"train_loss": -43.57231903076172, "global_step": 306162, "epoch": 2530} {"train_loss": -44.49892044067383, "global_step": 306163, "epoch": 2530} {"train_loss": -44.61601257324219, "global_step": 306164, "epoch": 2530} {"train_loss": -44.56291198730469, "global_step": 306165, "epoch": 2530} {"train_loss": -44.929603576660156, "global_step": 306166, "epoch": 2530} {"train_loss": -44.84321212768555, "global_step": 306167, "epoch": 2530} {"train_loss": -44.479305267333984, "global_step": 306168, "epoch": 2530} {"train_loss": -43.77708435058594, "global_step": 306169, "epoch": 2530} {"train_loss": -42.96543502807617, "global_step": 306170, "epoch": 2530} {"train_loss": -43.923152923583984, "global_step": 306171, "epoch": 2530} {"train_loss": -44.11796951293945, "global_step": 306172, "epoch": 2530} {"train_loss": -43.58930206298828, "global_step": 306173, "epoch": 2530} {"train_loss": -42.637996673583984, "global_step": 306174, "epoch": 2530} {"train_loss": -43.984718322753906, "global_step": 306175, "epoch": 2530} {"train_loss": -44.48308563232422, "global_step": 306176, "epoch": 2530} {"train_loss": -43.55910873413086, "global_step": 306177, "epoch": 2530} {"train_loss": -44.0992431640625, "global_step": 306178, "epoch": 2530} {"train_loss": -43.83604049682617, "global_step": 306179, "epoch": 2530} {"train_loss": -43.99126052856445, "global_step": 306180, "epoch": 2530} {"train_loss": -43.97452926635742, "global_step": 306181, "epoch": 2530} {"train_loss": -43.88542175292969, "global_step": 306182, "epoch": 2530} {"train_loss": -43.982784271240234, "global_step": 306183, "epoch": 2530} {"train_loss": -43.32089614868164, "global_step": 306184, "epoch": 2530} {"train_loss": -43.6647834777832, "global_step": 306185, "epoch": 2530} {"train_loss": -44.28837203979492, "global_step": 306186, "epoch": 2530} {"train_loss": -43.49796676635742, "global_step": 306187, "epoch": 2530} {"train_loss": -43.92647933959961, "global_step": 306188, "epoch": 2530} {"train_loss": -44.217926025390625, "global_step": 306189, "epoch": 2530} {"train_loss": -43.952449798583984, "global_step": 306190, "epoch": 2530} {"train_loss": -43.789520263671875, "global_step": 306191, "epoch": 2530} {"train_loss": -44.8369026184082, "global_step": 306192, "epoch": 2530} {"train_loss": -41.652408599853516, "global_step": 306193, "epoch": 2530} {"train_loss": -44.1893424987793, "global_step": 306194, "epoch": 2530} {"train_loss": -40.85404968261719, "global_step": 306195, "epoch": 2530} {"train_loss": -43.33002853393555, "global_step": 306196, "epoch": 2530} {"train_loss": -44.445892333984375, "global_step": 306197, "epoch": 2530} {"train_loss": -43.564571380615234, "global_step": 306198, "epoch": 2530} {"train_loss": -43.23927307128906, "global_step": 306199, "epoch": 2530} {"train_loss": -43.4398307800293, "global_step": 306200, "epoch": 2530} {"train_loss": -31.840702056884766, "global_step": 306201, "epoch": 2530} {"train_loss": -43.90644454956055, "global_step": 306202, "epoch": 2530} {"train_loss": -42.86244583129883, "global_step": 306203, "epoch": 2530} {"train_loss": -42.416343688964844, "global_step": 306204, "epoch": 2530} {"train_loss": -43.1246452331543, "global_step": 306205, "epoch": 2530} {"train_loss": -41.68731689453125, "global_step": 306206, "epoch": 2530} {"train_loss": -42.951107025146484, "global_step": 306207, "epoch": 2530} {"train_loss": -39.39282989501953, "global_step": 306208, "epoch": 2530} {"train_loss": -42.543025970458984, "global_step": 306209, "epoch": 2530} {"train_loss": -41.07076644897461, "global_step": 306210, "epoch": 2530} {"train_loss": -42.07279968261719, "global_step": 306211, "epoch": 2530} {"train_loss": -42.3559684753418, "global_step": 306212, "epoch": 2530} {"train_loss": -41.25614547729492, "global_step": 306213, "epoch": 2530} {"train_loss": -41.697017669677734, "global_step": 306214, "epoch": 2530} {"train_loss": -40.834957122802734, "global_step": 306215, "epoch": 2530} {"train_loss": -42.15293502807617, "global_step": 306216, "epoch": 2530} {"train_loss": -39.79694747924805, "global_step": 306217, "epoch": 2530} {"train_loss": -42.73331832885742, "global_step": 306218, "epoch": 2530} {"train_loss": -42.3010139465332, "global_step": 306219, "epoch": 2530} {"train_loss": -38.81549072265625, "global_step": 306220, "epoch": 2530} {"train_loss": -41.186614990234375, "global_step": 306221, "epoch": 2530} {"train_loss": -41.79205322265625, "global_step": 306222, "epoch": 2530} {"train_loss": -41.243770599365234, "global_step": 306223, "epoch": 2530} {"train_loss": -27.502593994140625, "global_step": 306224, "epoch": 2530} {"train_loss": -34.399105072021484, "global_step": 306225, "epoch": 2530} {"train_loss": -36.75626754760742, "global_step": 306226, "epoch": 2530} {"train_loss": -41.046913146972656, "global_step": 306227, "epoch": 2530} {"train_loss": -41.00974655151367, "global_step": 306228, "epoch": 2530} {"train_loss": -40.01357650756836, "global_step": 306229, "epoch": 2530} {"train_loss": -39.90556335449219, "global_step": 306230, "epoch": 2530} {"train_loss": -39.34107208251953, "global_step": 306231, "epoch": 2530} {"train_loss": -35.212562561035156, "global_step": 306232, "epoch": 2530} {"train_loss": -38.0319938659668, "global_step": 306233, "epoch": 2530} {"train_loss": -32.46369171142578, "global_step": 306234, "epoch": 2530} {"train_loss": -39.69105911254883, "global_step": 306235, "epoch": 2530} {"train_loss": -41.37168884277344, "global_step": 306236, "epoch": 2530} {"train_loss": -39.46526336669922, "global_step": 306237, "epoch": 2530} {"train_loss": -40.24968338012695, "global_step": 306238, "epoch": 2530} {"train_loss": -40.3256721496582, "global_step": 306239, "epoch": 2530} {"train_loss": -39.118953704833984, "global_step": 306240, "epoch": 2530} {"train_loss": -42.048824310302734, "global_step": 306241, "epoch": 2530} {"train_loss": -40.67600631713867, "global_step": 306242, "epoch": 2530} {"train_loss": -41.68324279785156, "global_step": 306243, "epoch": 2530} {"train_loss": -41.41175842285156, "global_step": 306244, "epoch": 2530} {"train_loss": -37.59790802001953, "global_step": 306245, "epoch": 2530} {"train_loss": -35.616573333740234, "global_step": 306246, "epoch": 2530} {"train_loss": -37.94459915161133, "global_step": 306247, "epoch": 2530} {"train_loss": -41.23391342163086, "global_step": 306248, "epoch": 2530} {"train_loss": -40.12939453125, "global_step": 306249, "epoch": 2530} {"train_loss": -41.94680515005569, "global_step": 306250, "epoch": 2530, "val_loss": 2473780.0} {"train_loss": -40.18889617919922, "global_step": 306251, "epoch": 2531} {"train_loss": -41.35015869140625, "global_step": 306252, "epoch": 2531} {"train_loss": -40.5689811706543, "global_step": 306253, "epoch": 2531} {"train_loss": -41.80405807495117, "global_step": 306254, "epoch": 2531} {"train_loss": -40.028560638427734, "global_step": 306255, "epoch": 2531} {"train_loss": -41.03926467895508, "global_step": 306256, "epoch": 2531} {"train_loss": -41.725860595703125, "global_step": 306257, "epoch": 2531} {"train_loss": -41.985618591308594, "global_step": 306258, "epoch": 2531} {"train_loss": -40.55377960205078, "global_step": 306259, "epoch": 2531} {"train_loss": -40.23277282714844, "global_step": 306260, "epoch": 2531} {"train_loss": -41.07780075073242, "global_step": 306261, "epoch": 2531} {"train_loss": -41.272274017333984, "global_step": 306262, "epoch": 2531} {"train_loss": -42.02476119995117, "global_step": 306263, "epoch": 2531} {"train_loss": -41.703880310058594, "global_step": 306264, "epoch": 2531} {"train_loss": -41.492950439453125, "global_step": 306265, "epoch": 2531} {"train_loss": -42.88349533081055, "global_step": 306266, "epoch": 2531} {"train_loss": -42.76577377319336, "global_step": 306267, "epoch": 2531} {"train_loss": -41.65875244140625, "global_step": 306268, "epoch": 2531} {"train_loss": -42.124176025390625, "global_step": 306269, "epoch": 2531} {"train_loss": -42.1132698059082, "global_step": 306270, "epoch": 2531} {"train_loss": -43.09345626831055, "global_step": 306271, "epoch": 2531} {"train_loss": -43.0400276184082, "global_step": 306272, "epoch": 2531} {"train_loss": -43.68354415893555, "global_step": 306273, "epoch": 2531} {"train_loss": -43.296241760253906, "global_step": 306274, "epoch": 2531} {"train_loss": -43.04215621948242, "global_step": 306275, "epoch": 2531} {"train_loss": -41.459007263183594, "global_step": 306276, "epoch": 2531} {"train_loss": -43.145904541015625, "global_step": 306277, "epoch": 2531} {"train_loss": -41.33726501464844, "global_step": 306278, "epoch": 2531} {"train_loss": -43.13282775878906, "global_step": 306279, "epoch": 2531} {"train_loss": -43.535369873046875, "global_step": 306280, "epoch": 2531} {"train_loss": -43.5754508972168, "global_step": 306281, "epoch": 2531} {"train_loss": -43.631072998046875, "global_step": 306282, "epoch": 2531} {"train_loss": -43.481327056884766, "global_step": 306283, "epoch": 2531} {"train_loss": -42.85844802856445, "global_step": 306284, "epoch": 2531} {"train_loss": -42.791542053222656, "global_step": 306285, "epoch": 2531} {"train_loss": -43.48573684692383, "global_step": 306286, "epoch": 2531} {"train_loss": -44.20109558105469, "global_step": 306287, "epoch": 2531} {"train_loss": -43.25997543334961, "global_step": 306288, "epoch": 2531} {"train_loss": -42.81201934814453, "global_step": 306289, "epoch": 2531} {"train_loss": -43.51891326904297, "global_step": 306290, "epoch": 2531} {"train_loss": -43.63036346435547, "global_step": 306291, "epoch": 2531} {"train_loss": -43.973026275634766, "global_step": 306292, "epoch": 2531} {"train_loss": -43.48176956176758, "global_step": 306293, "epoch": 2531} {"train_loss": -42.69365310668945, "global_step": 306294, "epoch": 2531} {"train_loss": -43.953792572021484, "global_step": 306295, "epoch": 2531} {"train_loss": -42.969482421875, "global_step": 306296, "epoch": 2531} {"train_loss": -43.375423431396484, "global_step": 306297, "epoch": 2531} {"train_loss": -43.24982833862305, "global_step": 306298, "epoch": 2531} {"train_loss": -43.341522216796875, "global_step": 306299, "epoch": 2531} {"train_loss": -43.701873779296875, "global_step": 306300, "epoch": 2531} {"train_loss": -43.416603088378906, "global_step": 306301, "epoch": 2531} {"train_loss": -43.242034912109375, "global_step": 306302, "epoch": 2531} {"train_loss": -43.132545471191406, "global_step": 306303, "epoch": 2531} {"train_loss": -43.027305603027344, "global_step": 306304, "epoch": 2531} {"train_loss": -43.06559371948242, "global_step": 306305, "epoch": 2531} {"train_loss": -43.075809478759766, "global_step": 306306, "epoch": 2531} {"train_loss": -43.44112777709961, "global_step": 306307, "epoch": 2531} {"train_loss": -44.08613967895508, "global_step": 306308, "epoch": 2531} {"train_loss": -43.40230941772461, "global_step": 306309, "epoch": 2531} {"train_loss": -43.686248779296875, "global_step": 306310, "epoch": 2531} {"train_loss": -43.84858703613281, "global_step": 306311, "epoch": 2531} {"train_loss": -43.95627975463867, "global_step": 306312, "epoch": 2531} {"train_loss": -43.565059661865234, "global_step": 306313, "epoch": 2531} {"train_loss": -44.19361877441406, "global_step": 306314, "epoch": 2531} {"train_loss": -43.944026947021484, "global_step": 306315, "epoch": 2531} {"train_loss": -43.86942672729492, "global_step": 306316, "epoch": 2531} {"train_loss": -42.70014190673828, "global_step": 306317, "epoch": 2531} {"train_loss": -42.88629913330078, "global_step": 306318, "epoch": 2531} {"train_loss": -43.71477127075195, "global_step": 306319, "epoch": 2531} {"train_loss": -43.785438537597656, "global_step": 306320, "epoch": 2531} {"train_loss": -43.440940856933594, "global_step": 306321, "epoch": 2531} {"train_loss": -43.2405891418457, "global_step": 306322, "epoch": 2531} {"train_loss": -44.465065002441406, "global_step": 306323, "epoch": 2531} {"train_loss": -43.82094192504883, "global_step": 306324, "epoch": 2531} {"train_loss": -43.064064025878906, "global_step": 306325, "epoch": 2531} {"train_loss": -43.5809211730957, "global_step": 306326, "epoch": 2531} {"train_loss": -42.801246643066406, "global_step": 306327, "epoch": 2531} {"train_loss": -41.691280364990234, "global_step": 306328, "epoch": 2531} {"train_loss": -41.91548156738281, "global_step": 306329, "epoch": 2531} {"train_loss": -41.74225997924805, "global_step": 306330, "epoch": 2531} {"train_loss": -43.45697784423828, "global_step": 306331, "epoch": 2531} {"train_loss": -43.05302047729492, "global_step": 306332, "epoch": 2531} {"train_loss": -42.37873077392578, "global_step": 306333, "epoch": 2531} {"train_loss": -43.01802062988281, "global_step": 306334, "epoch": 2531} {"train_loss": -42.49230194091797, "global_step": 306335, "epoch": 2531} {"train_loss": -42.70418930053711, "global_step": 306336, "epoch": 2531} {"train_loss": -41.20736312866211, "global_step": 306337, "epoch": 2531} {"train_loss": -42.15290451049805, "global_step": 306338, "epoch": 2531} {"train_loss": -42.11684799194336, "global_step": 306339, "epoch": 2531} {"train_loss": -41.705875396728516, "global_step": 306340, "epoch": 2531} {"train_loss": -43.40322494506836, "global_step": 306341, "epoch": 2531} {"train_loss": -41.272491455078125, "global_step": 306342, "epoch": 2531} {"train_loss": -42.392189025878906, "global_step": 306343, "epoch": 2531} {"train_loss": -41.479408264160156, "global_step": 306344, "epoch": 2531} {"train_loss": -42.768863677978516, "global_step": 306345, "epoch": 2531} {"train_loss": -41.857940673828125, "global_step": 306346, "epoch": 2531} {"train_loss": -43.59819030761719, "global_step": 306347, "epoch": 2531} {"train_loss": -41.69769287109375, "global_step": 306348, "epoch": 2531} {"train_loss": -43.515716552734375, "global_step": 306349, "epoch": 2531} {"train_loss": -42.52788162231445, "global_step": 306350, "epoch": 2531} {"train_loss": -41.49903869628906, "global_step": 306351, "epoch": 2531} {"train_loss": -43.2390251159668, "global_step": 306352, "epoch": 2531} {"train_loss": -40.6357536315918, "global_step": 306353, "epoch": 2531} {"train_loss": -42.306365966796875, "global_step": 306354, "epoch": 2531} {"train_loss": -40.35732650756836, "global_step": 306355, "epoch": 2531} {"train_loss": -40.706092834472656, "global_step": 306356, "epoch": 2531} {"train_loss": -38.96781921386719, "global_step": 306357, "epoch": 2531} {"train_loss": -40.598876953125, "global_step": 306358, "epoch": 2531} {"train_loss": -41.32052230834961, "global_step": 306359, "epoch": 2531} {"train_loss": -41.2741584777832, "global_step": 306360, "epoch": 2531} {"train_loss": -42.60415267944336, "global_step": 306361, "epoch": 2531} {"train_loss": -42.225624084472656, "global_step": 306362, "epoch": 2531} {"train_loss": -42.08557891845703, "global_step": 306363, "epoch": 2531} {"train_loss": -42.73087692260742, "global_step": 306364, "epoch": 2531} {"train_loss": -41.977272033691406, "global_step": 306365, "epoch": 2531} {"train_loss": -43.43831253051758, "global_step": 306366, "epoch": 2531} {"train_loss": -41.57389450073242, "global_step": 306367, "epoch": 2531} {"train_loss": -40.66004180908203, "global_step": 306368, "epoch": 2531} {"train_loss": -41.08927536010742, "global_step": 306369, "epoch": 2531} {"train_loss": -42.038421630859375, "global_step": 306370, "epoch": 2531} {"train_loss": -42.518020503777116, "global_step": 306371, "epoch": 2531, "val_loss": 2496639.75} {"train_loss": -33.96968078613281, "global_step": 306372, "epoch": 2532} {"train_loss": -41.17155838012695, "global_step": 306373, "epoch": 2532} {"train_loss": -41.1750373840332, "global_step": 306374, "epoch": 2532} {"train_loss": -39.31486892700195, "global_step": 306375, "epoch": 2532} {"train_loss": -41.832740783691406, "global_step": 306376, "epoch": 2532} {"train_loss": -40.198204040527344, "global_step": 306377, "epoch": 2532} {"train_loss": -41.43281173706055, "global_step": 306378, "epoch": 2532} {"train_loss": -40.40506362915039, "global_step": 306379, "epoch": 2532} {"train_loss": -41.724857330322266, "global_step": 306380, "epoch": 2532} {"train_loss": -41.3628044128418, "global_step": 306381, "epoch": 2532} {"train_loss": -42.78562545776367, "global_step": 306382, "epoch": 2532} {"train_loss": -41.193973541259766, "global_step": 306383, "epoch": 2532} {"train_loss": -42.508827209472656, "global_step": 306384, "epoch": 2532} {"train_loss": -41.445343017578125, "global_step": 306385, "epoch": 2532} {"train_loss": -42.479671478271484, "global_step": 306386, "epoch": 2532} {"train_loss": -41.71954345703125, "global_step": 306387, "epoch": 2532} {"train_loss": -41.972816467285156, "global_step": 306388, "epoch": 2532} {"train_loss": -42.07689666748047, "global_step": 306389, "epoch": 2532} {"train_loss": -42.70685577392578, "global_step": 306390, "epoch": 2532} {"train_loss": -42.47623825073242, "global_step": 306391, "epoch": 2532} {"train_loss": -43.07548904418945, "global_step": 306392, "epoch": 2532} {"train_loss": -42.59865951538086, "global_step": 306393, "epoch": 2532} {"train_loss": -43.24203872680664, "global_step": 306394, "epoch": 2532} {"train_loss": -42.20161819458008, "global_step": 306395, "epoch": 2532} {"train_loss": -43.04376983642578, "global_step": 306396, "epoch": 2532} {"train_loss": -42.997833251953125, "global_step": 306397, "epoch": 2532} {"train_loss": -43.03339767456055, "global_step": 306398, "epoch": 2532} {"train_loss": -41.873252868652344, "global_step": 306399, "epoch": 2532} {"train_loss": -42.87051010131836, "global_step": 306400, "epoch": 2532} {"train_loss": -43.02777862548828, "global_step": 306401, "epoch": 2532} {"train_loss": -43.63581085205078, "global_step": 306402, "epoch": 2532} {"train_loss": -42.77444076538086, "global_step": 306403, "epoch": 2532} {"train_loss": -43.26656723022461, "global_step": 306404, "epoch": 2532} {"train_loss": -42.443511962890625, "global_step": 306405, "epoch": 2532} {"train_loss": -43.295745849609375, "global_step": 306406, "epoch": 2532} {"train_loss": -42.7447624206543, "global_step": 306407, "epoch": 2532} {"train_loss": -43.69886779785156, "global_step": 306408, "epoch": 2532} {"train_loss": -43.106990814208984, "global_step": 306409, "epoch": 2532} {"train_loss": -43.779903411865234, "global_step": 306410, "epoch": 2532} {"train_loss": -43.153175354003906, "global_step": 306411, "epoch": 2532} {"train_loss": -44.0633430480957, "global_step": 306412, "epoch": 2532} {"train_loss": -43.363983154296875, "global_step": 306413, "epoch": 2532} {"train_loss": -42.91328811645508, "global_step": 306414, "epoch": 2532} {"train_loss": -43.94165802001953, "global_step": 306415, "epoch": 2532} {"train_loss": -43.53830337524414, "global_step": 306416, "epoch": 2532} {"train_loss": -43.48101806640625, "global_step": 306417, "epoch": 2532} {"train_loss": -43.19326400756836, "global_step": 306418, "epoch": 2532} {"train_loss": -43.30323028564453, "global_step": 306419, "epoch": 2532} {"train_loss": -43.70316696166992, "global_step": 306420, "epoch": 2532} {"train_loss": -43.81193923950195, "global_step": 306421, "epoch": 2532} {"train_loss": -43.80391311645508, "global_step": 306422, "epoch": 2532} {"train_loss": -43.81551742553711, "global_step": 306423, "epoch": 2532} {"train_loss": -44.072265625, "global_step": 306424, "epoch": 2532} {"train_loss": -44.06503677368164, "global_step": 306425, "epoch": 2532} {"train_loss": -44.41248321533203, "global_step": 306426, "epoch": 2532} {"train_loss": -43.83945846557617, "global_step": 306427, "epoch": 2532} {"train_loss": -44.25027084350586, "global_step": 306428, "epoch": 2532} {"train_loss": -43.61526107788086, "global_step": 306429, "epoch": 2532} {"train_loss": -44.07538986206055, "global_step": 306430, "epoch": 2532} {"train_loss": -43.56211853027344, "global_step": 306431, "epoch": 2532} {"train_loss": -44.34306716918945, "global_step": 306432, "epoch": 2532} {"train_loss": -43.93404006958008, "global_step": 306433, "epoch": 2532} {"train_loss": -44.248016357421875, "global_step": 306434, "epoch": 2532} {"train_loss": -43.49827194213867, "global_step": 306435, "epoch": 2532} {"train_loss": -44.4099006652832, "global_step": 306436, "epoch": 2532} {"train_loss": -44.51520538330078, "global_step": 306437, "epoch": 2532} {"train_loss": -44.58393096923828, "global_step": 306438, "epoch": 2532} {"train_loss": -44.15910720825195, "global_step": 306439, "epoch": 2532} {"train_loss": -44.25189971923828, "global_step": 306440, "epoch": 2532} {"train_loss": -44.29092025756836, "global_step": 306441, "epoch": 2532} {"train_loss": -44.4218635559082, "global_step": 306442, "epoch": 2532} {"train_loss": -44.76115036010742, "global_step": 306443, "epoch": 2532} {"train_loss": -44.512081146240234, "global_step": 306444, "epoch": 2532} {"train_loss": -44.41841506958008, "global_step": 306445, "epoch": 2532} {"train_loss": -43.52302169799805, "global_step": 306446, "epoch": 2532} {"train_loss": -43.77688217163086, "global_step": 306447, "epoch": 2532} {"train_loss": -44.074153900146484, "global_step": 306448, "epoch": 2532} {"train_loss": -43.862064361572266, "global_step": 306449, "epoch": 2532} {"train_loss": -44.44668197631836, "global_step": 306450, "epoch": 2532} {"train_loss": -44.54568099975586, "global_step": 306451, "epoch": 2532} {"train_loss": -43.578094482421875, "global_step": 306452, "epoch": 2532} {"train_loss": -42.354278564453125, "global_step": 306453, "epoch": 2532} {"train_loss": -43.60860824584961, "global_step": 306454, "epoch": 2532} {"train_loss": -43.851043701171875, "global_step": 306455, "epoch": 2532} {"train_loss": -43.36385726928711, "global_step": 306456, "epoch": 2532} {"train_loss": -42.05457305908203, "global_step": 306457, "epoch": 2532} {"train_loss": -41.57709884643555, "global_step": 306458, "epoch": 2532} {"train_loss": -43.7364616394043, "global_step": 306459, "epoch": 2532} {"train_loss": -41.6789665222168, "global_step": 306460, "epoch": 2532} {"train_loss": -42.146724700927734, "global_step": 306461, "epoch": 2532} {"train_loss": -41.992549896240234, "global_step": 306462, "epoch": 2532} {"train_loss": -43.328495025634766, "global_step": 306463, "epoch": 2532} {"train_loss": -41.53595733642578, "global_step": 306464, "epoch": 2532} {"train_loss": -42.94064712524414, "global_step": 306465, "epoch": 2532} {"train_loss": -43.60580062866211, "global_step": 306466, "epoch": 2532} {"train_loss": -40.69955062866211, "global_step": 306467, "epoch": 2532} {"train_loss": -37.1494140625, "global_step": 306468, "epoch": 2532} {"train_loss": -40.94294357299805, "global_step": 306469, "epoch": 2532} {"train_loss": -42.96305465698242, "global_step": 306470, "epoch": 2532} {"train_loss": -41.546600341796875, "global_step": 306471, "epoch": 2532} {"train_loss": -41.184505462646484, "global_step": 306472, "epoch": 2532} {"train_loss": -42.63853073120117, "global_step": 306473, "epoch": 2532} {"train_loss": -41.204673767089844, "global_step": 306474, "epoch": 2532} {"train_loss": -40.98655700683594, "global_step": 306475, "epoch": 2532} {"train_loss": -43.49428939819336, "global_step": 306476, "epoch": 2532} {"train_loss": -41.70475769042969, "global_step": 306477, "epoch": 2532} {"train_loss": -40.68960189819336, "global_step": 306478, "epoch": 2532} {"train_loss": -41.00508499145508, "global_step": 306479, "epoch": 2532} {"train_loss": -42.233699798583984, "global_step": 306480, "epoch": 2532} {"train_loss": -42.54562759399414, "global_step": 306481, "epoch": 2532} {"train_loss": -42.770111083984375, "global_step": 306482, "epoch": 2532} {"train_loss": -42.500389099121094, "global_step": 306483, "epoch": 2532} {"train_loss": -42.234153747558594, "global_step": 306484, "epoch": 2532} {"train_loss": -43.54425048828125, "global_step": 306485, "epoch": 2532} {"train_loss": -42.56288528442383, "global_step": 306486, "epoch": 2532} {"train_loss": -42.106597900390625, "global_step": 306487, "epoch": 2532} {"train_loss": -43.167518615722656, "global_step": 306488, "epoch": 2532} {"train_loss": -43.160667419433594, "global_step": 306489, "epoch": 2532} {"train_loss": -43.41288375854492, "global_step": 306490, "epoch": 2532} {"train_loss": -42.80016326904297, "global_step": 306491, "epoch": 2532} {"train_loss": -42.78975891869916, "global_step": 306492, "epoch": 2532, "val_loss": 2677641.25} {"train_loss": -44.03894805908203, "global_step": 306493, "epoch": 2533} {"train_loss": -43.288246154785156, "global_step": 306494, "epoch": 2533} {"train_loss": -43.55556106567383, "global_step": 306495, "epoch": 2533} {"train_loss": -44.287025451660156, "global_step": 306496, "epoch": 2533} {"train_loss": -42.86117172241211, "global_step": 306497, "epoch": 2533} {"train_loss": -43.247047424316406, "global_step": 306498, "epoch": 2533} {"train_loss": -44.05473709106445, "global_step": 306499, "epoch": 2533} {"train_loss": -44.105533599853516, "global_step": 306500, "epoch": 2533} {"train_loss": -43.804931640625, "global_step": 306501, "epoch": 2533} {"train_loss": -43.30405807495117, "global_step": 306502, "epoch": 2533} {"train_loss": -44.26621627807617, "global_step": 306503, "epoch": 2533} {"train_loss": -43.829734802246094, "global_step": 306504, "epoch": 2533} {"train_loss": -44.045223236083984, "global_step": 306505, "epoch": 2533} {"train_loss": -43.9867057800293, "global_step": 306506, "epoch": 2533} {"train_loss": -44.37757110595703, "global_step": 306507, "epoch": 2533} {"train_loss": -43.7882194519043, "global_step": 306508, "epoch": 2533} {"train_loss": -44.160335540771484, "global_step": 306509, "epoch": 2533} {"train_loss": -44.28128433227539, "global_step": 306510, "epoch": 2533} {"train_loss": -44.92384719848633, "global_step": 306511, "epoch": 2533} {"train_loss": -44.5388298034668, "global_step": 306512, "epoch": 2533} {"train_loss": -44.09091567993164, "global_step": 306513, "epoch": 2533} {"train_loss": -44.096683502197266, "global_step": 306514, "epoch": 2533} {"train_loss": -44.64158248901367, "global_step": 306515, "epoch": 2533} {"train_loss": -44.2921142578125, "global_step": 306516, "epoch": 2533} {"train_loss": -44.722412109375, "global_step": 306517, "epoch": 2533} {"train_loss": -44.69123458862305, "global_step": 306518, "epoch": 2533} {"train_loss": -43.854000091552734, "global_step": 306519, "epoch": 2533} {"train_loss": -44.44521713256836, "global_step": 306520, "epoch": 2533} {"train_loss": -43.93386459350586, "global_step": 306521, "epoch": 2533} {"train_loss": -43.91238021850586, "global_step": 306522, "epoch": 2533} {"train_loss": -44.43525314331055, "global_step": 306523, "epoch": 2533} {"train_loss": -44.60056686401367, "global_step": 306524, "epoch": 2533} {"train_loss": -44.78006362915039, "global_step": 306525, "epoch": 2533} {"train_loss": -44.3492546081543, "global_step": 306526, "epoch": 2533} {"train_loss": -44.2129020690918, "global_step": 306527, "epoch": 2533} {"train_loss": -44.191802978515625, "global_step": 306528, "epoch": 2533} {"train_loss": -44.01727294921875, "global_step": 306529, "epoch": 2533} {"train_loss": -44.39738845825195, "global_step": 306530, "epoch": 2533} {"train_loss": -44.277523040771484, "global_step": 306531, "epoch": 2533} {"train_loss": -44.92045974731445, "global_step": 306532, "epoch": 2533} {"train_loss": -44.945045471191406, "global_step": 306533, "epoch": 2533} {"train_loss": -44.51975631713867, "global_step": 306534, "epoch": 2533} {"train_loss": -44.513301849365234, "global_step": 306535, "epoch": 2533} {"train_loss": -44.47677230834961, "global_step": 306536, "epoch": 2533} {"train_loss": -43.93091583251953, "global_step": 306537, "epoch": 2533} {"train_loss": -43.23784255981445, "global_step": 306538, "epoch": 2533} {"train_loss": -43.8720817565918, "global_step": 306539, "epoch": 2533} {"train_loss": -43.317909240722656, "global_step": 306540, "epoch": 2533} {"train_loss": -42.18424606323242, "global_step": 306541, "epoch": 2533} {"train_loss": -42.242916107177734, "global_step": 306542, "epoch": 2533} {"train_loss": -42.920654296875, "global_step": 306543, "epoch": 2533} {"train_loss": -43.79128646850586, "global_step": 306544, "epoch": 2533} {"train_loss": -43.92457962036133, "global_step": 306545, "epoch": 2533} {"train_loss": -44.131439208984375, "global_step": 306546, "epoch": 2533} {"train_loss": -43.358882904052734, "global_step": 306547, "epoch": 2533} {"train_loss": -42.82760238647461, "global_step": 306548, "epoch": 2533} {"train_loss": -43.170928955078125, "global_step": 306549, "epoch": 2533} {"train_loss": -43.74868392944336, "global_step": 306550, "epoch": 2533} {"train_loss": -43.371543884277344, "global_step": 306551, "epoch": 2533} {"train_loss": -42.870967864990234, "global_step": 306552, "epoch": 2533} {"train_loss": -43.56511688232422, "global_step": 306553, "epoch": 2533} {"train_loss": -43.890193939208984, "global_step": 306554, "epoch": 2533} {"train_loss": -43.038597106933594, "global_step": 306555, "epoch": 2533} {"train_loss": -42.793487548828125, "global_step": 306556, "epoch": 2533} {"train_loss": -43.70881271362305, "global_step": 306557, "epoch": 2533} {"train_loss": -42.43645095825195, "global_step": 306558, "epoch": 2533} {"train_loss": -42.72271728515625, "global_step": 306559, "epoch": 2533} {"train_loss": -43.632965087890625, "global_step": 306560, "epoch": 2533} {"train_loss": -44.51017761230469, "global_step": 306561, "epoch": 2533} {"train_loss": -43.06329345703125, "global_step": 306562, "epoch": 2533} {"train_loss": -43.47865295410156, "global_step": 306563, "epoch": 2533} {"train_loss": -43.28082275390625, "global_step": 306564, "epoch": 2533} {"train_loss": -43.25200271606445, "global_step": 306565, "epoch": 2533} {"train_loss": -42.77102279663086, "global_step": 306566, "epoch": 2533} {"train_loss": -43.204097747802734, "global_step": 306567, "epoch": 2533} {"train_loss": -43.176239013671875, "global_step": 306568, "epoch": 2533} {"train_loss": -42.06425857543945, "global_step": 306569, "epoch": 2533} {"train_loss": -43.15949630737305, "global_step": 306570, "epoch": 2533} {"train_loss": -41.72842788696289, "global_step": 306571, "epoch": 2533} {"train_loss": -42.637935638427734, "global_step": 306572, "epoch": 2533} {"train_loss": -41.96376419067383, "global_step": 306573, "epoch": 2533} {"train_loss": -42.80072784423828, "global_step": 306574, "epoch": 2533} {"train_loss": -42.05786895751953, "global_step": 306575, "epoch": 2533} {"train_loss": -43.5992317199707, "global_step": 306576, "epoch": 2533} {"train_loss": -42.58753204345703, "global_step": 306577, "epoch": 2533} {"train_loss": -42.79471969604492, "global_step": 306578, "epoch": 2533} {"train_loss": -42.35565948486328, "global_step": 306579, "epoch": 2533} {"train_loss": -43.3446044921875, "global_step": 306580, "epoch": 2533} {"train_loss": -41.93220138549805, "global_step": 306581, "epoch": 2533} {"train_loss": -42.378570556640625, "global_step": 306582, "epoch": 2533} {"train_loss": -43.15640640258789, "global_step": 306583, "epoch": 2533} {"train_loss": -42.91372299194336, "global_step": 306584, "epoch": 2533} {"train_loss": -43.81761169433594, "global_step": 306585, "epoch": 2533} {"train_loss": -43.54935836791992, "global_step": 306586, "epoch": 2533} {"train_loss": -42.576507568359375, "global_step": 306587, "epoch": 2533} {"train_loss": -43.95002365112305, "global_step": 306588, "epoch": 2533} {"train_loss": -42.7582893371582, "global_step": 306589, "epoch": 2533} {"train_loss": -43.94389724731445, "global_step": 306590, "epoch": 2533} {"train_loss": -43.07719039916992, "global_step": 306591, "epoch": 2533} {"train_loss": -43.07975387573242, "global_step": 306592, "epoch": 2533} {"train_loss": -43.39177703857422, "global_step": 306593, "epoch": 2533} {"train_loss": -43.177982330322266, "global_step": 306594, "epoch": 2533} {"train_loss": -43.91086959838867, "global_step": 306595, "epoch": 2533} {"train_loss": -43.9847297668457, "global_step": 306596, "epoch": 2533} {"train_loss": -43.793888092041016, "global_step": 306597, "epoch": 2533} {"train_loss": -43.94462203979492, "global_step": 306598, "epoch": 2533} {"train_loss": -44.244564056396484, "global_step": 306599, "epoch": 2533} {"train_loss": -42.931671142578125, "global_step": 306600, "epoch": 2533} {"train_loss": -43.32709884643555, "global_step": 306601, "epoch": 2533} {"train_loss": -43.09682846069336, "global_step": 306602, "epoch": 2533} {"train_loss": -43.571632385253906, "global_step": 306603, "epoch": 2533} {"train_loss": -43.25816345214844, "global_step": 306604, "epoch": 2533} {"train_loss": -44.19346237182617, "global_step": 306605, "epoch": 2533} {"train_loss": -43.70083999633789, "global_step": 306606, "epoch": 2533} {"train_loss": -43.83681106567383, "global_step": 306607, "epoch": 2533} {"train_loss": -44.07220458984375, "global_step": 306608, "epoch": 2533} {"train_loss": -44.63959884643555, "global_step": 306609, "epoch": 2533} {"train_loss": -44.4306640625, "global_step": 306610, "epoch": 2533} {"train_loss": -43.870635986328125, "global_step": 306611, "epoch": 2533} {"train_loss": -44.15351867675781, "global_step": 306612, "epoch": 2533} {"train_loss": -43.616794460075944, "global_step": 306613, "epoch": 2533, "val_loss": 2619646.75} {"train_loss": -43.464447021484375, "global_step": 306614, "epoch": 2534} {"train_loss": -42.889930725097656, "global_step": 306615, "epoch": 2534} {"train_loss": -43.65598678588867, "global_step": 306616, "epoch": 2534} {"train_loss": -44.01984786987305, "global_step": 306617, "epoch": 2534} {"train_loss": -43.2790412902832, "global_step": 306618, "epoch": 2534} {"train_loss": -43.925533294677734, "global_step": 306619, "epoch": 2534} {"train_loss": -42.6249885559082, "global_step": 306620, "epoch": 2534} {"train_loss": -44.38690185546875, "global_step": 306621, "epoch": 2534} {"train_loss": -44.045936584472656, "global_step": 306622, "epoch": 2534} {"train_loss": -43.384029388427734, "global_step": 306623, "epoch": 2534} {"train_loss": -44.25462341308594, "global_step": 306624, "epoch": 2534} {"train_loss": -43.10752487182617, "global_step": 306625, "epoch": 2534} {"train_loss": -44.52179718017578, "global_step": 306626, "epoch": 2534} {"train_loss": -44.48977279663086, "global_step": 306627, "epoch": 2534} {"train_loss": -43.820709228515625, "global_step": 306628, "epoch": 2534} {"train_loss": -43.5018310546875, "global_step": 306629, "epoch": 2534} {"train_loss": -43.68650436401367, "global_step": 306630, "epoch": 2534} {"train_loss": -43.67217254638672, "global_step": 306631, "epoch": 2534} {"train_loss": -43.790584564208984, "global_step": 306632, "epoch": 2534} {"train_loss": -44.12626266479492, "global_step": 306633, "epoch": 2534} {"train_loss": -44.23987579345703, "global_step": 306634, "epoch": 2534} {"train_loss": -43.934326171875, "global_step": 306635, "epoch": 2534} {"train_loss": -44.251304626464844, "global_step": 306636, "epoch": 2534} {"train_loss": -44.113990783691406, "global_step": 306637, "epoch": 2534} {"train_loss": -44.600608825683594, "global_step": 306638, "epoch": 2534} {"train_loss": -45.09056854248047, "global_step": 306639, "epoch": 2534} {"train_loss": -44.232357025146484, "global_step": 306640, "epoch": 2534} {"train_loss": -44.126564025878906, "global_step": 306641, "epoch": 2534} {"train_loss": -43.552452087402344, "global_step": 306642, "epoch": 2534} {"train_loss": -44.817867279052734, "global_step": 306643, "epoch": 2534} {"train_loss": -44.34765625, "global_step": 306644, "epoch": 2534} {"train_loss": -43.1894645690918, "global_step": 306645, "epoch": 2534} {"train_loss": -44.731990814208984, "global_step": 306646, "epoch": 2534} {"train_loss": -42.400909423828125, "global_step": 306647, "epoch": 2534} {"train_loss": -43.904972076416016, "global_step": 306648, "epoch": 2534} {"train_loss": -44.226295471191406, "global_step": 306649, "epoch": 2534} {"train_loss": -43.39399337768555, "global_step": 306650, "epoch": 2534} {"train_loss": -43.052162170410156, "global_step": 306651, "epoch": 2534} {"train_loss": -43.721595764160156, "global_step": 306652, "epoch": 2534} {"train_loss": -44.444580078125, "global_step": 306653, "epoch": 2534} {"train_loss": -43.99150848388672, "global_step": 306654, "epoch": 2534} {"train_loss": -44.29938507080078, "global_step": 306655, "epoch": 2534} {"train_loss": -44.41189193725586, "global_step": 306656, "epoch": 2534} {"train_loss": -43.41775131225586, "global_step": 306657, "epoch": 2534} {"train_loss": -42.66341781616211, "global_step": 306658, "epoch": 2534} {"train_loss": -44.04435348510742, "global_step": 306659, "epoch": 2534} {"train_loss": -41.65507507324219, "global_step": 306660, "epoch": 2534} {"train_loss": -44.23721694946289, "global_step": 306661, "epoch": 2534} {"train_loss": -40.72329330444336, "global_step": 306662, "epoch": 2534} {"train_loss": -42.82133102416992, "global_step": 306663, "epoch": 2534} {"train_loss": -41.695796966552734, "global_step": 306664, "epoch": 2534} {"train_loss": -41.905635833740234, "global_step": 306665, "epoch": 2534} {"train_loss": -42.4100456237793, "global_step": 306666, "epoch": 2534} {"train_loss": -42.74817657470703, "global_step": 306667, "epoch": 2534} {"train_loss": -42.92277908325195, "global_step": 306668, "epoch": 2534} {"train_loss": -43.3712043762207, "global_step": 306669, "epoch": 2534} {"train_loss": -42.84597396850586, "global_step": 306670, "epoch": 2534} {"train_loss": -41.86029815673828, "global_step": 306671, "epoch": 2534} {"train_loss": -42.578582763671875, "global_step": 306672, "epoch": 2534} {"train_loss": -43.643184661865234, "global_step": 306673, "epoch": 2534} {"train_loss": -42.396175384521484, "global_step": 306674, "epoch": 2534} {"train_loss": -42.61565399169922, "global_step": 306675, "epoch": 2534} {"train_loss": -44.006168365478516, "global_step": 306676, "epoch": 2534} {"train_loss": -43.69081115722656, "global_step": 306677, "epoch": 2534} {"train_loss": -43.64848327636719, "global_step": 306678, "epoch": 2534} {"train_loss": -42.83860778808594, "global_step": 306679, "epoch": 2534} {"train_loss": -43.79268264770508, "global_step": 306680, "epoch": 2534} {"train_loss": -43.71431350708008, "global_step": 306681, "epoch": 2534} {"train_loss": -43.788330078125, "global_step": 306682, "epoch": 2534} {"train_loss": -43.790035247802734, "global_step": 306683, "epoch": 2534} {"train_loss": -44.25519561767578, "global_step": 306684, "epoch": 2534} {"train_loss": -44.29506301879883, "global_step": 306685, "epoch": 2534} {"train_loss": -44.127532958984375, "global_step": 306686, "epoch": 2534} {"train_loss": -44.125160217285156, "global_step": 306687, "epoch": 2534} {"train_loss": -43.07271957397461, "global_step": 306688, "epoch": 2534} {"train_loss": -43.59597396850586, "global_step": 306689, "epoch": 2534} {"train_loss": -43.91889572143555, "global_step": 306690, "epoch": 2534} {"train_loss": -44.077308654785156, "global_step": 306691, "epoch": 2534} {"train_loss": -44.11983871459961, "global_step": 306692, "epoch": 2534} {"train_loss": -43.83563232421875, "global_step": 306693, "epoch": 2534} {"train_loss": -43.73542785644531, "global_step": 306694, "epoch": 2534} {"train_loss": -44.060035705566406, "global_step": 306695, "epoch": 2534} {"train_loss": -44.338077545166016, "global_step": 306696, "epoch": 2534} {"train_loss": -43.68817138671875, "global_step": 306697, "epoch": 2534} {"train_loss": -43.7474479675293, "global_step": 306698, "epoch": 2534} {"train_loss": -44.74153518676758, "global_step": 306699, "epoch": 2534} {"train_loss": -43.962677001953125, "global_step": 306700, "epoch": 2534} {"train_loss": -43.056373596191406, "global_step": 306701, "epoch": 2534} {"train_loss": -44.2586784362793, "global_step": 306702, "epoch": 2534} {"train_loss": -44.59821319580078, "global_step": 306703, "epoch": 2534} {"train_loss": -43.81772232055664, "global_step": 306704, "epoch": 2534} {"train_loss": -43.31262969970703, "global_step": 306705, "epoch": 2534} {"train_loss": -43.43451690673828, "global_step": 306706, "epoch": 2534} {"train_loss": -43.51213073730469, "global_step": 306707, "epoch": 2534} {"train_loss": -44.09347152709961, "global_step": 306708, "epoch": 2534} {"train_loss": -43.720672607421875, "global_step": 306709, "epoch": 2534} {"train_loss": -43.5252685546875, "global_step": 306710, "epoch": 2534} {"train_loss": -42.5620002746582, "global_step": 306711, "epoch": 2534} {"train_loss": -43.51638412475586, "global_step": 306712, "epoch": 2534} {"train_loss": -43.40449142456055, "global_step": 306713, "epoch": 2534} {"train_loss": -42.57257080078125, "global_step": 306714, "epoch": 2534} {"train_loss": -43.761390686035156, "global_step": 306715, "epoch": 2534} {"train_loss": -42.82674026489258, "global_step": 306716, "epoch": 2534} {"train_loss": -42.7187385559082, "global_step": 306717, "epoch": 2534} {"train_loss": -43.422489166259766, "global_step": 306718, "epoch": 2534} {"train_loss": -43.31946563720703, "global_step": 306719, "epoch": 2534} {"train_loss": -43.893653869628906, "global_step": 306720, "epoch": 2534} {"train_loss": -43.872371673583984, "global_step": 306721, "epoch": 2534} {"train_loss": -44.1576042175293, "global_step": 306722, "epoch": 2534} {"train_loss": -44.32393264770508, "global_step": 306723, "epoch": 2534} {"train_loss": -44.69588088989258, "global_step": 306724, "epoch": 2534} {"train_loss": -44.73786544799805, "global_step": 306725, "epoch": 2534} {"train_loss": -44.07088851928711, "global_step": 306726, "epoch": 2534} {"train_loss": -44.63584518432617, "global_step": 306727, "epoch": 2534} {"train_loss": -44.687435150146484, "global_step": 306728, "epoch": 2534} {"train_loss": -44.357666015625, "global_step": 306729, "epoch": 2534} {"train_loss": -44.71023178100586, "global_step": 306730, "epoch": 2534} {"train_loss": -45.167152404785156, "global_step": 306731, "epoch": 2534} {"train_loss": -44.59568405151367, "global_step": 306732, "epoch": 2534} {"train_loss": -44.491756439208984, "global_step": 306733, "epoch": 2534} {"train_loss": -43.70412854911867, "global_step": 306734, "epoch": 2534, "val_loss": 2561984.0} {"train_loss": -44.557533264160156, "global_step": 306735, "epoch": 2535} {"train_loss": -44.0535774230957, "global_step": 306736, "epoch": 2535} {"train_loss": -44.0252571105957, "global_step": 306737, "epoch": 2535} {"train_loss": -43.242244720458984, "global_step": 306738, "epoch": 2535} {"train_loss": -42.80780029296875, "global_step": 306739, "epoch": 2535} {"train_loss": -44.139373779296875, "global_step": 306740, "epoch": 2535} {"train_loss": -44.515045166015625, "global_step": 306741, "epoch": 2535} {"train_loss": -44.768611907958984, "global_step": 306742, "epoch": 2535} {"train_loss": -44.89902114868164, "global_step": 306743, "epoch": 2535} {"train_loss": -45.01152420043945, "global_step": 306744, "epoch": 2535} {"train_loss": -45.23069381713867, "global_step": 306745, "epoch": 2535} {"train_loss": -44.85963821411133, "global_step": 306746, "epoch": 2535} {"train_loss": -44.88560104370117, "global_step": 306747, "epoch": 2535} {"train_loss": -44.7033576965332, "global_step": 306748, "epoch": 2535} {"train_loss": -44.234588623046875, "global_step": 306749, "epoch": 2535} {"train_loss": -44.75199890136719, "global_step": 306750, "epoch": 2535} {"train_loss": -44.908199310302734, "global_step": 306751, "epoch": 2535} {"train_loss": -45.005767822265625, "global_step": 306752, "epoch": 2535} {"train_loss": -44.773014068603516, "global_step": 306753, "epoch": 2535} {"train_loss": -45.607208251953125, "global_step": 306754, "epoch": 2535} {"train_loss": -44.58622360229492, "global_step": 306755, "epoch": 2535} {"train_loss": -45.1180419921875, "global_step": 306756, "epoch": 2535} {"train_loss": -43.96596908569336, "global_step": 306757, "epoch": 2535} {"train_loss": -43.78794479370117, "global_step": 306758, "epoch": 2535} {"train_loss": -44.84218978881836, "global_step": 306759, "epoch": 2535} {"train_loss": -43.70210266113281, "global_step": 306760, "epoch": 2535} {"train_loss": -44.24927520751953, "global_step": 306761, "epoch": 2535} {"train_loss": -43.923580169677734, "global_step": 306762, "epoch": 2535} {"train_loss": -43.903900146484375, "global_step": 306763, "epoch": 2535} {"train_loss": -42.404396057128906, "global_step": 306764, "epoch": 2535} {"train_loss": -43.538047790527344, "global_step": 306765, "epoch": 2535} {"train_loss": -44.33729553222656, "global_step": 306766, "epoch": 2535} {"train_loss": -42.79655456542969, "global_step": 306767, "epoch": 2535} {"train_loss": -44.02053451538086, "global_step": 306768, "epoch": 2535} {"train_loss": -42.406490325927734, "global_step": 306769, "epoch": 2535} {"train_loss": -43.10026168823242, "global_step": 306770, "epoch": 2535} {"train_loss": -42.139015197753906, "global_step": 306771, "epoch": 2535} {"train_loss": -43.4228401184082, "global_step": 306772, "epoch": 2535} {"train_loss": -43.4349365234375, "global_step": 306773, "epoch": 2535} {"train_loss": -42.47397994995117, "global_step": 306774, "epoch": 2535} {"train_loss": -43.563072204589844, "global_step": 306775, "epoch": 2535} {"train_loss": -44.06168746948242, "global_step": 306776, "epoch": 2535} {"train_loss": -41.806827545166016, "global_step": 306777, "epoch": 2535} {"train_loss": -43.85395431518555, "global_step": 306778, "epoch": 2535} {"train_loss": -37.652557373046875, "global_step": 306779, "epoch": 2535} {"train_loss": -41.343082427978516, "global_step": 306780, "epoch": 2535} {"train_loss": -24.797178268432617, "global_step": 306781, "epoch": 2535} {"train_loss": -39.45192337036133, "global_step": 306782, "epoch": 2535} {"train_loss": -31.984907150268555, "global_step": 306783, "epoch": 2535} {"train_loss": -0.21017980575561523, "global_step": 306784, "epoch": 2535} {"train_loss": -17.075387954711914, "global_step": 306785, "epoch": 2535} {"train_loss": -21.159934997558594, "global_step": 306786, "epoch": 2535} {"train_loss": -17.682064056396484, "global_step": 306787, "epoch": 2535} {"train_loss": -25.766986846923828, "global_step": 306788, "epoch": 2535} {"train_loss": -31.0022029876709, "global_step": 306789, "epoch": 2535} {"train_loss": -24.503894805908203, "global_step": 306790, "epoch": 2535} {"train_loss": -36.170555114746094, "global_step": 306791, "epoch": 2535} {"train_loss": -28.137893676757812, "global_step": 306792, "epoch": 2535} {"train_loss": -32.700740814208984, "global_step": 306793, "epoch": 2535} {"train_loss": -35.93365478515625, "global_step": 306794, "epoch": 2535} {"train_loss": -29.841001510620117, "global_step": 306795, "epoch": 2535} {"train_loss": -35.33941650390625, "global_step": 306796, "epoch": 2535} {"train_loss": -37.092376708984375, "global_step": 306797, "epoch": 2535} {"train_loss": -30.77901268005371, "global_step": 306798, "epoch": 2535} {"train_loss": -34.634857177734375, "global_step": 306799, "epoch": 2535} {"train_loss": -37.13203048706055, "global_step": 306800, "epoch": 2535} {"train_loss": -36.333717346191406, "global_step": 306801, "epoch": 2535} {"train_loss": -35.25750732421875, "global_step": 306802, "epoch": 2535} {"train_loss": -36.62955856323242, "global_step": 306803, "epoch": 2535} {"train_loss": -37.67230224609375, "global_step": 306804, "epoch": 2535} {"train_loss": -36.63431930541992, "global_step": 306805, "epoch": 2535} {"train_loss": -37.2689323425293, "global_step": 306806, "epoch": 2535} {"train_loss": -37.19364547729492, "global_step": 306807, "epoch": 2535} {"train_loss": -37.490230560302734, "global_step": 306808, "epoch": 2535} {"train_loss": -37.752254486083984, "global_step": 306809, "epoch": 2535} {"train_loss": -38.05199432373047, "global_step": 306810, "epoch": 2535} {"train_loss": -37.933650970458984, "global_step": 306811, "epoch": 2535} {"train_loss": -37.86063766479492, "global_step": 306812, "epoch": 2535} {"train_loss": -38.53214645385742, "global_step": 306813, "epoch": 2535} {"train_loss": -38.335052490234375, "global_step": 306814, "epoch": 2535} {"train_loss": -39.011146545410156, "global_step": 306815, "epoch": 2535} {"train_loss": -38.36834716796875, "global_step": 306816, "epoch": 2535} {"train_loss": -38.821754455566406, "global_step": 306817, "epoch": 2535} {"train_loss": -38.9062385559082, "global_step": 306818, "epoch": 2535} {"train_loss": -39.23158645629883, "global_step": 306819, "epoch": 2535} {"train_loss": -39.4013557434082, "global_step": 306820, "epoch": 2535} {"train_loss": -39.687747955322266, "global_step": 306821, "epoch": 2535} {"train_loss": -39.042938232421875, "global_step": 306822, "epoch": 2535} {"train_loss": -39.4202880859375, "global_step": 306823, "epoch": 2535} {"train_loss": -39.65185546875, "global_step": 306824, "epoch": 2535} {"train_loss": -39.469905853271484, "global_step": 306825, "epoch": 2535} {"train_loss": -40.15675735473633, "global_step": 306826, "epoch": 2535} {"train_loss": -39.66980743408203, "global_step": 306827, "epoch": 2535} {"train_loss": -39.884613037109375, "global_step": 306828, "epoch": 2535} {"train_loss": -39.96706771850586, "global_step": 306829, "epoch": 2535} {"train_loss": -40.399749755859375, "global_step": 306830, "epoch": 2535} {"train_loss": -40.04851150512695, "global_step": 306831, "epoch": 2535} {"train_loss": -40.16303634643555, "global_step": 306832, "epoch": 2535} {"train_loss": -39.9963493347168, "global_step": 306833, "epoch": 2535} {"train_loss": -40.24861526489258, "global_step": 306834, "epoch": 2535} {"train_loss": -40.05680465698242, "global_step": 306835, "epoch": 2535} {"train_loss": -40.65159225463867, "global_step": 306836, "epoch": 2535} {"train_loss": -40.57659912109375, "global_step": 306837, "epoch": 2535} {"train_loss": -40.43677520751953, "global_step": 306838, "epoch": 2535} {"train_loss": -40.4891471862793, "global_step": 306839, "epoch": 2535} {"train_loss": -40.59835433959961, "global_step": 306840, "epoch": 2535} {"train_loss": -41.03242492675781, "global_step": 306841, "epoch": 2535} {"train_loss": -40.938026428222656, "global_step": 306842, "epoch": 2535} {"train_loss": -41.08445358276367, "global_step": 306843, "epoch": 2535} {"train_loss": -40.90700912475586, "global_step": 306844, "epoch": 2535} {"train_loss": -41.063865661621094, "global_step": 306845, "epoch": 2535} {"train_loss": -40.721614837646484, "global_step": 306846, "epoch": 2535} {"train_loss": -41.24919509887695, "global_step": 306847, "epoch": 2535} {"train_loss": -41.363121032714844, "global_step": 306848, "epoch": 2535} {"train_loss": -41.43714141845703, "global_step": 306849, "epoch": 2535} {"train_loss": -41.319698333740234, "global_step": 306850, "epoch": 2535} {"train_loss": -41.615962982177734, "global_step": 306851, "epoch": 2535} {"train_loss": -41.668148040771484, "global_step": 306852, "epoch": 2535} {"train_loss": -41.72071075439453, "global_step": 306853, "epoch": 2535} {"train_loss": -41.492130279541016, "global_step": 306854, "epoch": 2535} {"train_loss": -39.371116650006, "global_step": 306855, "epoch": 2535, "val_loss": 2554574.75} {"train_loss": -41.9659538269043, "global_step": 306856, "epoch": 2536} {"train_loss": -41.874698638916016, "global_step": 306857, "epoch": 2536} {"train_loss": -42.3979606628418, "global_step": 306858, "epoch": 2536} {"train_loss": -42.298126220703125, "global_step": 306859, "epoch": 2536} {"train_loss": -42.09516525268555, "global_step": 306860, "epoch": 2536} {"train_loss": -42.24613571166992, "global_step": 306861, "epoch": 2536} {"train_loss": -42.317909240722656, "global_step": 306862, "epoch": 2536} {"train_loss": -42.5054931640625, "global_step": 306863, "epoch": 2536} {"train_loss": -42.620574951171875, "global_step": 306864, "epoch": 2536} {"train_loss": -42.4632453918457, "global_step": 306865, "epoch": 2536} {"train_loss": -42.45366287231445, "global_step": 306866, "epoch": 2536} {"train_loss": -42.529842376708984, "global_step": 306867, "epoch": 2536} {"train_loss": -42.62294006347656, "global_step": 306868, "epoch": 2536} {"train_loss": -42.352577209472656, "global_step": 306869, "epoch": 2536} {"train_loss": -42.06604766845703, "global_step": 306870, "epoch": 2536} {"train_loss": -41.22258377075195, "global_step": 306871, "epoch": 2536} {"train_loss": -40.73525619506836, "global_step": 306872, "epoch": 2536} {"train_loss": -42.81305694580078, "global_step": 306873, "epoch": 2536} {"train_loss": -42.21895980834961, "global_step": 306874, "epoch": 2536} {"train_loss": -42.22089385986328, "global_step": 306875, "epoch": 2536} {"train_loss": -42.901309967041016, "global_step": 306876, "epoch": 2536} {"train_loss": -42.57636642456055, "global_step": 306877, "epoch": 2536} {"train_loss": -42.5274658203125, "global_step": 306878, "epoch": 2536} {"train_loss": -42.61529541015625, "global_step": 306879, "epoch": 2536} {"train_loss": -42.50325012207031, "global_step": 306880, "epoch": 2536} {"train_loss": -42.654327392578125, "global_step": 306881, "epoch": 2536} {"train_loss": -42.2767219543457, "global_step": 306882, "epoch": 2536} {"train_loss": -41.866207122802734, "global_step": 306883, "epoch": 2536} {"train_loss": -42.100215911865234, "global_step": 306884, "epoch": 2536} {"train_loss": -42.833152770996094, "global_step": 306885, "epoch": 2536} {"train_loss": -43.04853439331055, "global_step": 306886, "epoch": 2536} {"train_loss": -42.516780853271484, "global_step": 306887, "epoch": 2536} {"train_loss": -42.9820442199707, "global_step": 306888, "epoch": 2536} {"train_loss": -42.578468322753906, "global_step": 306889, "epoch": 2536} {"train_loss": -41.98703384399414, "global_step": 306890, "epoch": 2536} {"train_loss": -42.40312576293945, "global_step": 306891, "epoch": 2536} {"train_loss": -42.186767578125, "global_step": 306892, "epoch": 2536} {"train_loss": -42.116737365722656, "global_step": 306893, "epoch": 2536} {"train_loss": -40.20785140991211, "global_step": 306894, "epoch": 2536} {"train_loss": -36.55691146850586, "global_step": 306895, "epoch": 2536} {"train_loss": -38.652191162109375, "global_step": 306896, "epoch": 2536} {"train_loss": -41.90102005004883, "global_step": 306897, "epoch": 2536} {"train_loss": -40.12118911743164, "global_step": 306898, "epoch": 2536} {"train_loss": -39.17841339111328, "global_step": 306899, "epoch": 2536} {"train_loss": -42.48051071166992, "global_step": 306900, "epoch": 2536} {"train_loss": -40.97014236450195, "global_step": 306901, "epoch": 2536} {"train_loss": -40.86330795288086, "global_step": 306902, "epoch": 2536} {"train_loss": -42.7638053894043, "global_step": 306903, "epoch": 2536} {"train_loss": -40.18050765991211, "global_step": 306904, "epoch": 2536} {"train_loss": -42.64726638793945, "global_step": 306905, "epoch": 2536} {"train_loss": -41.75226974487305, "global_step": 306906, "epoch": 2536} {"train_loss": -42.15515899658203, "global_step": 306907, "epoch": 2536} {"train_loss": -42.48301315307617, "global_step": 306908, "epoch": 2536} {"train_loss": -41.779457092285156, "global_step": 306909, "epoch": 2536} {"train_loss": -41.41886901855469, "global_step": 306910, "epoch": 2536} {"train_loss": -41.061614990234375, "global_step": 306911, "epoch": 2536} {"train_loss": -42.39432907104492, "global_step": 306912, "epoch": 2536} {"train_loss": -42.01192855834961, "global_step": 306913, "epoch": 2536} {"train_loss": -42.819820404052734, "global_step": 306914, "epoch": 2536} {"train_loss": -42.32074737548828, "global_step": 306915, "epoch": 2536} {"train_loss": -43.35988998413086, "global_step": 306916, "epoch": 2536} {"train_loss": -42.31782150268555, "global_step": 306917, "epoch": 2536} {"train_loss": -43.23836898803711, "global_step": 306918, "epoch": 2536} {"train_loss": -42.52297592163086, "global_step": 306919, "epoch": 2536} {"train_loss": -43.1108512878418, "global_step": 306920, "epoch": 2536} {"train_loss": -42.9549674987793, "global_step": 306921, "epoch": 2536} {"train_loss": -42.486175537109375, "global_step": 306922, "epoch": 2536} {"train_loss": -43.07270050048828, "global_step": 306923, "epoch": 2536} {"train_loss": -42.72785568237305, "global_step": 306924, "epoch": 2536} {"train_loss": -42.53042221069336, "global_step": 306925, "epoch": 2536} {"train_loss": -42.99172592163086, "global_step": 306926, "epoch": 2536} {"train_loss": -42.2772331237793, "global_step": 306927, "epoch": 2536} {"train_loss": -43.48145294189453, "global_step": 306928, "epoch": 2536} {"train_loss": -40.71710968017578, "global_step": 306929, "epoch": 2536} {"train_loss": -43.20205307006836, "global_step": 306930, "epoch": 2536} {"train_loss": -42.3525276184082, "global_step": 306931, "epoch": 2536} {"train_loss": -43.042823791503906, "global_step": 306932, "epoch": 2536} {"train_loss": -42.895015716552734, "global_step": 306933, "epoch": 2536} {"train_loss": -43.35729217529297, "global_step": 306934, "epoch": 2536} {"train_loss": -42.07709884643555, "global_step": 306935, "epoch": 2536} {"train_loss": -43.29275894165039, "global_step": 306936, "epoch": 2536} {"train_loss": -42.84609603881836, "global_step": 306937, "epoch": 2536} {"train_loss": -42.85825729370117, "global_step": 306938, "epoch": 2536} {"train_loss": -42.8697624206543, "global_step": 306939, "epoch": 2536} {"train_loss": -43.42927551269531, "global_step": 306940, "epoch": 2536} {"train_loss": -43.23389434814453, "global_step": 306941, "epoch": 2536} {"train_loss": -43.6796760559082, "global_step": 306942, "epoch": 2536} {"train_loss": -43.78052520751953, "global_step": 306943, "epoch": 2536} {"train_loss": -43.55207061767578, "global_step": 306944, "epoch": 2536} {"train_loss": -43.159507751464844, "global_step": 306945, "epoch": 2536} {"train_loss": -43.37004852294922, "global_step": 306946, "epoch": 2536} {"train_loss": -43.2862434387207, "global_step": 306947, "epoch": 2536} {"train_loss": -43.529354095458984, "global_step": 306948, "epoch": 2536} {"train_loss": -43.08095932006836, "global_step": 306949, "epoch": 2536} {"train_loss": -43.28751754760742, "global_step": 306950, "epoch": 2536} {"train_loss": -43.12735366821289, "global_step": 306951, "epoch": 2536} {"train_loss": -43.94611740112305, "global_step": 306952, "epoch": 2536} {"train_loss": -43.88150405883789, "global_step": 306953, "epoch": 2536} {"train_loss": -43.42281723022461, "global_step": 306954, "epoch": 2536} {"train_loss": -43.64048385620117, "global_step": 306955, "epoch": 2536} {"train_loss": -43.28273391723633, "global_step": 306956, "epoch": 2536} {"train_loss": -43.382354736328125, "global_step": 306957, "epoch": 2536} {"train_loss": -42.963478088378906, "global_step": 306958, "epoch": 2536} {"train_loss": -41.751556396484375, "global_step": 306959, "epoch": 2536} {"train_loss": -40.673866271972656, "global_step": 306960, "epoch": 2536} {"train_loss": -42.41793441772461, "global_step": 306961, "epoch": 2536} {"train_loss": -43.18867874145508, "global_step": 306962, "epoch": 2536} {"train_loss": -41.01582717895508, "global_step": 306963, "epoch": 2536} {"train_loss": -42.40044403076172, "global_step": 306964, "epoch": 2536} {"train_loss": -43.42391586303711, "global_step": 306965, "epoch": 2536} {"train_loss": -42.014957427978516, "global_step": 306966, "epoch": 2536} {"train_loss": -41.091957092285156, "global_step": 306967, "epoch": 2536} {"train_loss": -42.723907470703125, "global_step": 306968, "epoch": 2536} {"train_loss": -41.753883361816406, "global_step": 306969, "epoch": 2536} {"train_loss": -41.71124267578125, "global_step": 306970, "epoch": 2536} {"train_loss": -40.4457893371582, "global_step": 306971, "epoch": 2536} {"train_loss": -37.516929626464844, "global_step": 306972, "epoch": 2536} {"train_loss": -40.1068229675293, "global_step": 306973, "epoch": 2536} {"train_loss": -40.15699005126953, "global_step": 306974, "epoch": 2536} {"train_loss": -42.34732437133789, "global_step": 306975, "epoch": 2536} {"train_loss": -42.256933543307724, "global_step": 306976, "epoch": 2536, "val_loss": 2573223.75} {"train_loss": -40.502174377441406, "global_step": 306977, "epoch": 2537} {"train_loss": -40.31697082519531, "global_step": 306978, "epoch": 2537} {"train_loss": -42.02230453491211, "global_step": 306979, "epoch": 2537} {"train_loss": -40.486114501953125, "global_step": 306980, "epoch": 2537} {"train_loss": -41.72502517700195, "global_step": 306981, "epoch": 2537} {"train_loss": -40.86273193359375, "global_step": 306982, "epoch": 2537} {"train_loss": -40.885284423828125, "global_step": 306983, "epoch": 2537} {"train_loss": -40.127708435058594, "global_step": 306984, "epoch": 2537} {"train_loss": -39.57960891723633, "global_step": 306985, "epoch": 2537} {"train_loss": -37.267860412597656, "global_step": 306986, "epoch": 2537} {"train_loss": -40.39124298095703, "global_step": 306987, "epoch": 2537} {"train_loss": -42.069091796875, "global_step": 306988, "epoch": 2537} {"train_loss": -40.256221771240234, "global_step": 306989, "epoch": 2537} {"train_loss": -42.5880126953125, "global_step": 306990, "epoch": 2537} {"train_loss": -41.043663024902344, "global_step": 306991, "epoch": 2537} {"train_loss": -41.075069427490234, "global_step": 306992, "epoch": 2537} {"train_loss": -40.88446044921875, "global_step": 306993, "epoch": 2537} {"train_loss": -41.79875564575195, "global_step": 306994, "epoch": 2537} {"train_loss": -41.038307189941406, "global_step": 306995, "epoch": 2537} {"train_loss": -41.97624969482422, "global_step": 306996, "epoch": 2537} {"train_loss": -41.75339889526367, "global_step": 306997, "epoch": 2537} {"train_loss": -41.675323486328125, "global_step": 306998, "epoch": 2537} {"train_loss": -41.49153137207031, "global_step": 306999, "epoch": 2537} {"train_loss": -41.263790130615234, "global_step": 307000, "epoch": 2537} {"train_loss": -42.087623596191406, "global_step": 307001, "epoch": 2537} {"train_loss": -40.933753967285156, "global_step": 307002, "epoch": 2537} {"train_loss": -41.9159049987793, "global_step": 307003, "epoch": 2537} {"train_loss": -41.4514274597168, "global_step": 307004, "epoch": 2537} {"train_loss": -42.44162368774414, "global_step": 307005, "epoch": 2537} {"train_loss": -40.91520309448242, "global_step": 307006, "epoch": 2537} {"train_loss": -40.85226821899414, "global_step": 307007, "epoch": 2537} {"train_loss": -42.07376480102539, "global_step": 307008, "epoch": 2537} {"train_loss": -42.08903121948242, "global_step": 307009, "epoch": 2537} {"train_loss": -41.921730041503906, "global_step": 307010, "epoch": 2537} {"train_loss": -41.57785415649414, "global_step": 307011, "epoch": 2537} {"train_loss": -42.01406478881836, "global_step": 307012, "epoch": 2537} {"train_loss": -42.351680755615234, "global_step": 307013, "epoch": 2537} {"train_loss": -40.929744720458984, "global_step": 307014, "epoch": 2537} {"train_loss": -40.7889289855957, "global_step": 307015, "epoch": 2537} {"train_loss": -41.34867858886719, "global_step": 307016, "epoch": 2537} {"train_loss": -42.28104782104492, "global_step": 307017, "epoch": 2537} {"train_loss": -42.812744140625, "global_step": 307018, "epoch": 2537} {"train_loss": -42.298885345458984, "global_step": 307019, "epoch": 2537} {"train_loss": -42.34652328491211, "global_step": 307020, "epoch": 2537} {"train_loss": -42.330657958984375, "global_step": 307021, "epoch": 2537} {"train_loss": -42.603633880615234, "global_step": 307022, "epoch": 2537} {"train_loss": -42.66840362548828, "global_step": 307023, "epoch": 2537} {"train_loss": -42.64235305786133, "global_step": 307024, "epoch": 2537} {"train_loss": -42.71930694580078, "global_step": 307025, "epoch": 2537} {"train_loss": -42.84444808959961, "global_step": 307026, "epoch": 2537} {"train_loss": -42.58823013305664, "global_step": 307027, "epoch": 2537} {"train_loss": -41.371341705322266, "global_step": 307028, "epoch": 2537} {"train_loss": -43.47343444824219, "global_step": 307029, "epoch": 2537} {"train_loss": -42.79014205932617, "global_step": 307030, "epoch": 2537} {"train_loss": -43.371917724609375, "global_step": 307031, "epoch": 2537} {"train_loss": -43.150672912597656, "global_step": 307032, "epoch": 2537} {"train_loss": -43.275245666503906, "global_step": 307033, "epoch": 2537} {"train_loss": -43.0194206237793, "global_step": 307034, "epoch": 2537} {"train_loss": -43.4726676940918, "global_step": 307035, "epoch": 2537} {"train_loss": -43.324554443359375, "global_step": 307036, "epoch": 2537} {"train_loss": -43.445552825927734, "global_step": 307037, "epoch": 2537} {"train_loss": -43.652381896972656, "global_step": 307038, "epoch": 2537} {"train_loss": -43.319549560546875, "global_step": 307039, "epoch": 2537} {"train_loss": -43.29701614379883, "global_step": 307040, "epoch": 2537} {"train_loss": -43.01589584350586, "global_step": 307041, "epoch": 2537} {"train_loss": -43.076873779296875, "global_step": 307042, "epoch": 2537} {"train_loss": -43.5291633605957, "global_step": 307043, "epoch": 2537} {"train_loss": -43.26383590698242, "global_step": 307044, "epoch": 2537} {"train_loss": -43.96106719970703, "global_step": 307045, "epoch": 2537} {"train_loss": -43.6829948425293, "global_step": 307046, "epoch": 2537} {"train_loss": -43.93154525756836, "global_step": 307047, "epoch": 2537} {"train_loss": -43.76168441772461, "global_step": 307048, "epoch": 2537} {"train_loss": -43.680233001708984, "global_step": 307049, "epoch": 2537} {"train_loss": -43.569091796875, "global_step": 307050, "epoch": 2537} {"train_loss": -43.47591781616211, "global_step": 307051, "epoch": 2537} {"train_loss": -43.52236557006836, "global_step": 307052, "epoch": 2537} {"train_loss": -43.59939193725586, "global_step": 307053, "epoch": 2537} {"train_loss": -43.8719367980957, "global_step": 307054, "epoch": 2537} {"train_loss": -43.79738998413086, "global_step": 307055, "epoch": 2537} {"train_loss": -42.79218673706055, "global_step": 307056, "epoch": 2537} {"train_loss": -43.317378997802734, "global_step": 307057, "epoch": 2537} {"train_loss": -43.93386459350586, "global_step": 307058, "epoch": 2537} {"train_loss": -43.69285202026367, "global_step": 307059, "epoch": 2537} {"train_loss": -43.324981689453125, "global_step": 307060, "epoch": 2537} {"train_loss": -43.8382682800293, "global_step": 307061, "epoch": 2537} {"train_loss": -43.65952682495117, "global_step": 307062, "epoch": 2537} {"train_loss": -42.99359893798828, "global_step": 307063, "epoch": 2537} {"train_loss": -43.471160888671875, "global_step": 307064, "epoch": 2537} {"train_loss": -43.93133544921875, "global_step": 307065, "epoch": 2537} {"train_loss": -43.651302337646484, "global_step": 307066, "epoch": 2537} {"train_loss": -43.13853073120117, "global_step": 307067, "epoch": 2537} {"train_loss": -43.771759033203125, "global_step": 307068, "epoch": 2537} {"train_loss": -43.83803176879883, "global_step": 307069, "epoch": 2537} {"train_loss": -43.95939254760742, "global_step": 307070, "epoch": 2537} {"train_loss": -43.89126205444336, "global_step": 307071, "epoch": 2537} {"train_loss": -43.986846923828125, "global_step": 307072, "epoch": 2537} {"train_loss": -43.571529388427734, "global_step": 307073, "epoch": 2537} {"train_loss": -43.75908279418945, "global_step": 307074, "epoch": 2537} {"train_loss": -42.92825698852539, "global_step": 307075, "epoch": 2537} {"train_loss": -43.053646087646484, "global_step": 307076, "epoch": 2537} {"train_loss": -43.242393493652344, "global_step": 307077, "epoch": 2537} {"train_loss": -43.5178337097168, "global_step": 307078, "epoch": 2537} {"train_loss": -44.31061935424805, "global_step": 307079, "epoch": 2537} {"train_loss": -43.962947845458984, "global_step": 307080, "epoch": 2537} {"train_loss": -43.804832458496094, "global_step": 307081, "epoch": 2537} {"train_loss": -41.19985580444336, "global_step": 307082, "epoch": 2537} {"train_loss": -41.50140380859375, "global_step": 307083, "epoch": 2537} {"train_loss": -39.286712646484375, "global_step": 307084, "epoch": 2537} {"train_loss": -37.85177230834961, "global_step": 307085, "epoch": 2537} {"train_loss": -40.73255157470703, "global_step": 307086, "epoch": 2537} {"train_loss": -41.85770797729492, "global_step": 307087, "epoch": 2537} {"train_loss": -42.20870590209961, "global_step": 307088, "epoch": 2537} {"train_loss": -42.45220184326172, "global_step": 307089, "epoch": 2537} {"train_loss": -43.02477264404297, "global_step": 307090, "epoch": 2537} {"train_loss": -42.910621643066406, "global_step": 307091, "epoch": 2537} {"train_loss": -41.97157669067383, "global_step": 307092, "epoch": 2537} {"train_loss": -42.374473571777344, "global_step": 307093, "epoch": 2537} {"train_loss": -42.75238800048828, "global_step": 307094, "epoch": 2537} {"train_loss": -42.11783981323242, "global_step": 307095, "epoch": 2537} {"train_loss": -42.01151657104492, "global_step": 307096, "epoch": 2537} {"train_loss": -42.39831145735812, "global_step": 307097, "epoch": 2537, "val_loss": 2578073.0} {"train_loss": -42.43980026245117, "global_step": 307098, "epoch": 2538} {"train_loss": -42.5560302734375, "global_step": 307099, "epoch": 2538} {"train_loss": -42.60145950317383, "global_step": 307100, "epoch": 2538} {"train_loss": -41.68642807006836, "global_step": 307101, "epoch": 2538} {"train_loss": -42.81522750854492, "global_step": 307102, "epoch": 2538} {"train_loss": -40.36440658569336, "global_step": 307103, "epoch": 2538} {"train_loss": -41.592063903808594, "global_step": 307104, "epoch": 2538} {"train_loss": -42.1032829284668, "global_step": 307105, "epoch": 2538} {"train_loss": -42.661312103271484, "global_step": 307106, "epoch": 2538} {"train_loss": -42.72237014770508, "global_step": 307107, "epoch": 2538} {"train_loss": -41.96538162231445, "global_step": 307108, "epoch": 2538} {"train_loss": -41.51325225830078, "global_step": 307109, "epoch": 2538} {"train_loss": -42.068756103515625, "global_step": 307110, "epoch": 2538} {"train_loss": -38.50541305541992, "global_step": 307111, "epoch": 2538} {"train_loss": -37.006492614746094, "global_step": 307112, "epoch": 2538} {"train_loss": -40.65658950805664, "global_step": 307113, "epoch": 2538} {"train_loss": -41.632476806640625, "global_step": 307114, "epoch": 2538} {"train_loss": -42.05966567993164, "global_step": 307115, "epoch": 2538} {"train_loss": -40.892372131347656, "global_step": 307116, "epoch": 2538} {"train_loss": -41.971675872802734, "global_step": 307117, "epoch": 2538} {"train_loss": -42.346405029296875, "global_step": 307118, "epoch": 2538} {"train_loss": -39.20002365112305, "global_step": 307119, "epoch": 2538} {"train_loss": -39.7364387512207, "global_step": 307120, "epoch": 2538} {"train_loss": -40.59120178222656, "global_step": 307121, "epoch": 2538} {"train_loss": -40.91331100463867, "global_step": 307122, "epoch": 2538} {"train_loss": -41.345458984375, "global_step": 307123, "epoch": 2538} {"train_loss": -38.74135208129883, "global_step": 307124, "epoch": 2538} {"train_loss": -33.80125045776367, "global_step": 307125, "epoch": 2538} {"train_loss": -41.27427291870117, "global_step": 307126, "epoch": 2538} {"train_loss": -39.21261978149414, "global_step": 307127, "epoch": 2538} {"train_loss": -36.05390167236328, "global_step": 307128, "epoch": 2538} {"train_loss": -38.97941589355469, "global_step": 307129, "epoch": 2538} {"train_loss": -39.6967658996582, "global_step": 307130, "epoch": 2538} {"train_loss": -41.40720748901367, "global_step": 307131, "epoch": 2538} {"train_loss": -39.451087951660156, "global_step": 307132, "epoch": 2538} {"train_loss": -39.8953971862793, "global_step": 307133, "epoch": 2538} {"train_loss": -33.36509323120117, "global_step": 307134, "epoch": 2538} {"train_loss": -37.445919036865234, "global_step": 307135, "epoch": 2538} {"train_loss": -41.016971588134766, "global_step": 307136, "epoch": 2538} {"train_loss": -27.00131607055664, "global_step": 307137, "epoch": 2538} {"train_loss": -34.10554122924805, "global_step": 307138, "epoch": 2538} {"train_loss": -39.84605026245117, "global_step": 307139, "epoch": 2538} {"train_loss": -33.63086700439453, "global_step": 307140, "epoch": 2538} {"train_loss": -38.5169792175293, "global_step": 307141, "epoch": 2538} {"train_loss": -39.23942184448242, "global_step": 307142, "epoch": 2538} {"train_loss": -39.58115768432617, "global_step": 307143, "epoch": 2538} {"train_loss": -39.43037796020508, "global_step": 307144, "epoch": 2538} {"train_loss": -39.73330307006836, "global_step": 307145, "epoch": 2538} {"train_loss": -36.7265510559082, "global_step": 307146, "epoch": 2538} {"train_loss": -41.49421310424805, "global_step": 307147, "epoch": 2538} {"train_loss": -35.57572555541992, "global_step": 307148, "epoch": 2538} {"train_loss": -40.14579391479492, "global_step": 307149, "epoch": 2538} {"train_loss": -41.27765655517578, "global_step": 307150, "epoch": 2538} {"train_loss": -39.356510162353516, "global_step": 307151, "epoch": 2538} {"train_loss": -39.24285888671875, "global_step": 307152, "epoch": 2538} {"train_loss": -40.275428771972656, "global_step": 307153, "epoch": 2538} {"train_loss": -40.416542053222656, "global_step": 307154, "epoch": 2538} {"train_loss": -39.42130661010742, "global_step": 307155, "epoch": 2538} {"train_loss": -38.60029220581055, "global_step": 307156, "epoch": 2538} {"train_loss": -38.723052978515625, "global_step": 307157, "epoch": 2538} {"train_loss": -40.91699981689453, "global_step": 307158, "epoch": 2538} {"train_loss": -41.848968505859375, "global_step": 307159, "epoch": 2538} {"train_loss": -41.5590934753418, "global_step": 307160, "epoch": 2538} {"train_loss": -41.575313568115234, "global_step": 307161, "epoch": 2538} {"train_loss": -39.74492263793945, "global_step": 307162, "epoch": 2538} {"train_loss": -40.823219299316406, "global_step": 307163, "epoch": 2538} {"train_loss": -40.73600769042969, "global_step": 307164, "epoch": 2538} {"train_loss": -40.32674789428711, "global_step": 307165, "epoch": 2538} {"train_loss": -41.08732604980469, "global_step": 307166, "epoch": 2538} {"train_loss": -37.75751876831055, "global_step": 307167, "epoch": 2538} {"train_loss": -40.80369186401367, "global_step": 307168, "epoch": 2538} {"train_loss": -40.10927200317383, "global_step": 307169, "epoch": 2538} {"train_loss": -40.39997100830078, "global_step": 307170, "epoch": 2538} {"train_loss": -41.71930694580078, "global_step": 307171, "epoch": 2538} {"train_loss": -40.30524826049805, "global_step": 307172, "epoch": 2538} {"train_loss": -38.17216873168945, "global_step": 307173, "epoch": 2538} {"train_loss": -37.9183349609375, "global_step": 307174, "epoch": 2538} {"train_loss": -41.34449005126953, "global_step": 307175, "epoch": 2538} {"train_loss": -39.75312805175781, "global_step": 307176, "epoch": 2538} {"train_loss": -40.070186614990234, "global_step": 307177, "epoch": 2538} {"train_loss": -41.77717208862305, "global_step": 307178, "epoch": 2538} {"train_loss": -40.86611557006836, "global_step": 307179, "epoch": 2538} {"train_loss": -40.89627456665039, "global_step": 307180, "epoch": 2538} {"train_loss": -40.406166076660156, "global_step": 307181, "epoch": 2538} {"train_loss": -41.26885223388672, "global_step": 307182, "epoch": 2538} {"train_loss": -39.222530364990234, "global_step": 307183, "epoch": 2538} {"train_loss": -40.555049896240234, "global_step": 307184, "epoch": 2538} {"train_loss": -41.25883865356445, "global_step": 307185, "epoch": 2538} {"train_loss": -40.4516716003418, "global_step": 307186, "epoch": 2538} {"train_loss": -39.428749084472656, "global_step": 307187, "epoch": 2538} {"train_loss": -40.49592208862305, "global_step": 307188, "epoch": 2538} {"train_loss": -40.36221694946289, "global_step": 307189, "epoch": 2538} {"train_loss": -42.17259216308594, "global_step": 307190, "epoch": 2538} {"train_loss": -41.39906692504883, "global_step": 307191, "epoch": 2538} {"train_loss": -40.417762756347656, "global_step": 307192, "epoch": 2538} {"train_loss": -41.365718841552734, "global_step": 307193, "epoch": 2538} {"train_loss": -41.61317825317383, "global_step": 307194, "epoch": 2538} {"train_loss": -41.77416229248047, "global_step": 307195, "epoch": 2538} {"train_loss": -40.997474670410156, "global_step": 307196, "epoch": 2538} {"train_loss": -40.967193603515625, "global_step": 307197, "epoch": 2538} {"train_loss": -40.76571273803711, "global_step": 307198, "epoch": 2538} {"train_loss": -41.381263732910156, "global_step": 307199, "epoch": 2538} {"train_loss": -41.90690612792969, "global_step": 307200, "epoch": 2538} {"train_loss": -41.792083740234375, "global_step": 307201, "epoch": 2538} {"train_loss": -41.9801139831543, "global_step": 307202, "epoch": 2538} {"train_loss": -40.96543502807617, "global_step": 307203, "epoch": 2538} {"train_loss": -42.069881439208984, "global_step": 307204, "epoch": 2538} {"train_loss": -41.858154296875, "global_step": 307205, "epoch": 2538} {"train_loss": -42.089107513427734, "global_step": 307206, "epoch": 2538} {"train_loss": -42.09444046020508, "global_step": 307207, "epoch": 2538} {"train_loss": -41.70735549926758, "global_step": 307208, "epoch": 2538} {"train_loss": -41.86508560180664, "global_step": 307209, "epoch": 2538} {"train_loss": -42.24845504760742, "global_step": 307210, "epoch": 2538} {"train_loss": -43.09914779663086, "global_step": 307211, "epoch": 2538} {"train_loss": -40.710697174072266, "global_step": 307212, "epoch": 2538} {"train_loss": -41.85665512084961, "global_step": 307213, "epoch": 2538} {"train_loss": -41.36739730834961, "global_step": 307214, "epoch": 2538} {"train_loss": -41.89991760253906, "global_step": 307215, "epoch": 2538} {"train_loss": -40.650177001953125, "global_step": 307216, "epoch": 2538} {"train_loss": -41.80584716796875, "global_step": 307217, "epoch": 2538} {"train_loss": -40.31238864867155, "global_step": 307218, "epoch": 2538, "val_loss": 2752060.25} {"train_loss": -42.25264358520508, "global_step": 307219, "epoch": 2539} {"train_loss": -42.40718460083008, "global_step": 307220, "epoch": 2539} {"train_loss": -43.16762161254883, "global_step": 307221, "epoch": 2539} {"train_loss": -42.445369720458984, "global_step": 307222, "epoch": 2539} {"train_loss": -42.25214767456055, "global_step": 307223, "epoch": 2539} {"train_loss": -42.623016357421875, "global_step": 307224, "epoch": 2539} {"train_loss": -42.328983306884766, "global_step": 307225, "epoch": 2539} {"train_loss": -42.543128967285156, "global_step": 307226, "epoch": 2539} {"train_loss": -43.12237548828125, "global_step": 307227, "epoch": 2539} {"train_loss": -42.941951751708984, "global_step": 307228, "epoch": 2539} {"train_loss": -42.74080276489258, "global_step": 307229, "epoch": 2539} {"train_loss": -42.40534210205078, "global_step": 307230, "epoch": 2539} {"train_loss": -41.41090393066406, "global_step": 307231, "epoch": 2539} {"train_loss": -43.123443603515625, "global_step": 307232, "epoch": 2539} {"train_loss": -42.3593635559082, "global_step": 307233, "epoch": 2539} {"train_loss": -40.418670654296875, "global_step": 307234, "epoch": 2539} {"train_loss": -42.88843536376953, "global_step": 307235, "epoch": 2539} {"train_loss": -42.87565994262695, "global_step": 307236, "epoch": 2539} {"train_loss": -43.052459716796875, "global_step": 307237, "epoch": 2539} {"train_loss": -38.42975616455078, "global_step": 307238, "epoch": 2539} {"train_loss": -42.62256622314453, "global_step": 307239, "epoch": 2539} {"train_loss": -42.68711853027344, "global_step": 307240, "epoch": 2539} {"train_loss": -42.569915771484375, "global_step": 307241, "epoch": 2539} {"train_loss": -42.66672897338867, "global_step": 307242, "epoch": 2539} {"train_loss": -41.86248779296875, "global_step": 307243, "epoch": 2539} {"train_loss": -30.17169761657715, "global_step": 307244, "epoch": 2539} {"train_loss": -42.61884307861328, "global_step": 307245, "epoch": 2539} {"train_loss": -42.587215423583984, "global_step": 307246, "epoch": 2539} {"train_loss": -41.99605941772461, "global_step": 307247, "epoch": 2539} {"train_loss": -40.191505432128906, "global_step": 307248, "epoch": 2539} {"train_loss": -41.985652923583984, "global_step": 307249, "epoch": 2539} {"train_loss": -42.14626693725586, "global_step": 307250, "epoch": 2539} {"train_loss": -41.1536865234375, "global_step": 307251, "epoch": 2539} {"train_loss": -40.76227569580078, "global_step": 307252, "epoch": 2539} {"train_loss": -41.91238021850586, "global_step": 307253, "epoch": 2539} {"train_loss": -41.69580078125, "global_step": 307254, "epoch": 2539} {"train_loss": -32.71516036987305, "global_step": 307255, "epoch": 2539} {"train_loss": -40.6479377746582, "global_step": 307256, "epoch": 2539} {"train_loss": -40.38597869873047, "global_step": 307257, "epoch": 2539} {"train_loss": -41.33740234375, "global_step": 307258, "epoch": 2539} {"train_loss": -42.053890228271484, "global_step": 307259, "epoch": 2539} {"train_loss": -41.060848236083984, "global_step": 307260, "epoch": 2539} {"train_loss": -41.5467529296875, "global_step": 307261, "epoch": 2539} {"train_loss": -41.73965072631836, "global_step": 307262, "epoch": 2539} {"train_loss": -42.810508728027344, "global_step": 307263, "epoch": 2539} {"train_loss": -41.80844497680664, "global_step": 307264, "epoch": 2539} {"train_loss": -40.97318649291992, "global_step": 307265, "epoch": 2539} {"train_loss": -42.177181243896484, "global_step": 307266, "epoch": 2539} {"train_loss": -42.66597366333008, "global_step": 307267, "epoch": 2539} {"train_loss": -40.403419494628906, "global_step": 307268, "epoch": 2539} {"train_loss": -41.51034164428711, "global_step": 307269, "epoch": 2539} {"train_loss": -39.72047805786133, "global_step": 307270, "epoch": 2539} {"train_loss": -41.19227600097656, "global_step": 307271, "epoch": 2539} {"train_loss": -41.63261032104492, "global_step": 307272, "epoch": 2539} {"train_loss": -41.20980453491211, "global_step": 307273, "epoch": 2539} {"train_loss": -33.634700775146484, "global_step": 307274, "epoch": 2539} {"train_loss": -41.03547286987305, "global_step": 307275, "epoch": 2539} {"train_loss": -41.684959411621094, "global_step": 307276, "epoch": 2539} {"train_loss": -36.586055755615234, "global_step": 307277, "epoch": 2539} {"train_loss": -38.756500244140625, "global_step": 307278, "epoch": 2539} {"train_loss": -37.284278869628906, "global_step": 307279, "epoch": 2539} {"train_loss": -37.86135482788086, "global_step": 307280, "epoch": 2539} {"train_loss": -34.476776123046875, "global_step": 307281, "epoch": 2539} {"train_loss": -36.98167037963867, "global_step": 307282, "epoch": 2539} {"train_loss": -35.63340377807617, "global_step": 307283, "epoch": 2539} {"train_loss": -32.865562438964844, "global_step": 307284, "epoch": 2539} {"train_loss": -37.421241760253906, "global_step": 307285, "epoch": 2539} {"train_loss": -29.7623291015625, "global_step": 307286, "epoch": 2539} {"train_loss": -19.02484130859375, "global_step": 307287, "epoch": 2539} {"train_loss": -35.638607025146484, "global_step": 307288, "epoch": 2539} {"train_loss": -26.701696395874023, "global_step": 307289, "epoch": 2539} {"train_loss": -36.2051887512207, "global_step": 307290, "epoch": 2539} {"train_loss": -31.991825103759766, "global_step": 307291, "epoch": 2539} {"train_loss": -33.84511947631836, "global_step": 307292, "epoch": 2539} {"train_loss": -30.065549850463867, "global_step": 307293, "epoch": 2539} {"train_loss": -31.4088134765625, "global_step": 307294, "epoch": 2539} {"train_loss": -29.583541870117188, "global_step": 307295, "epoch": 2539} {"train_loss": -36.74155044555664, "global_step": 307296, "epoch": 2539} {"train_loss": -36.01912307739258, "global_step": 307297, "epoch": 2539} {"train_loss": -35.91408920288086, "global_step": 307298, "epoch": 2539} {"train_loss": -30.784011840820312, "global_step": 307299, "epoch": 2539} {"train_loss": -34.216278076171875, "global_step": 307300, "epoch": 2539} {"train_loss": -35.44247055053711, "global_step": 307301, "epoch": 2539} {"train_loss": -34.093441009521484, "global_step": 307302, "epoch": 2539} {"train_loss": -33.688812255859375, "global_step": 307303, "epoch": 2539} {"train_loss": -20.48430824279785, "global_step": 307304, "epoch": 2539} {"train_loss": -34.97394943237305, "global_step": 307305, "epoch": 2539} {"train_loss": -34.2672004699707, "global_step": 307306, "epoch": 2539} {"train_loss": -33.3930778503418, "global_step": 307307, "epoch": 2539} {"train_loss": -32.78083419799805, "global_step": 307308, "epoch": 2539} {"train_loss": -36.33401107788086, "global_step": 307309, "epoch": 2539} {"train_loss": -31.418701171875, "global_step": 307310, "epoch": 2539} {"train_loss": -37.5303840637207, "global_step": 307311, "epoch": 2539} {"train_loss": -36.41550827026367, "global_step": 307312, "epoch": 2539} {"train_loss": -35.280113220214844, "global_step": 307313, "epoch": 2539} {"train_loss": -36.69643783569336, "global_step": 307314, "epoch": 2539} {"train_loss": -35.5384407043457, "global_step": 307315, "epoch": 2539} {"train_loss": -37.40409851074219, "global_step": 307316, "epoch": 2539} {"train_loss": -36.66461944580078, "global_step": 307317, "epoch": 2539} {"train_loss": -35.16482925415039, "global_step": 307318, "epoch": 2539} {"train_loss": -29.459686279296875, "global_step": 307319, "epoch": 2539} {"train_loss": -36.99298858642578, "global_step": 307320, "epoch": 2539} {"train_loss": -38.026859283447266, "global_step": 307321, "epoch": 2539} {"train_loss": -37.53558349609375, "global_step": 307322, "epoch": 2539} {"train_loss": -37.562774658203125, "global_step": 307323, "epoch": 2539} {"train_loss": -37.38786697387695, "global_step": 307324, "epoch": 2539} {"train_loss": -37.49177169799805, "global_step": 307325, "epoch": 2539} {"train_loss": -35.80611801147461, "global_step": 307326, "epoch": 2539} {"train_loss": -36.91351318359375, "global_step": 307327, "epoch": 2539} {"train_loss": -37.76883316040039, "global_step": 307328, "epoch": 2539} {"train_loss": -37.25262451171875, "global_step": 307329, "epoch": 2539} {"train_loss": -38.631866455078125, "global_step": 307330, "epoch": 2539} {"train_loss": -37.907493591308594, "global_step": 307331, "epoch": 2539} {"train_loss": -37.388710021972656, "global_step": 307332, "epoch": 2539} {"train_loss": -37.502166748046875, "global_step": 307333, "epoch": 2539} {"train_loss": -38.73173904418945, "global_step": 307334, "epoch": 2539} {"train_loss": -37.548309326171875, "global_step": 307335, "epoch": 2539} {"train_loss": -38.830780029296875, "global_step": 307336, "epoch": 2539} {"train_loss": -38.492313385009766, "global_step": 307337, "epoch": 2539} {"train_loss": -38.5174674987793, "global_step": 307338, "epoch": 2539} {"train_loss": -38.07472787021605, "global_step": 307339, "epoch": 2539, "val_loss": 2637391.75} {"train_loss": -39.55854034423828, "global_step": 307340, "epoch": 2540} {"train_loss": -39.12699508666992, "global_step": 307341, "epoch": 2540} {"train_loss": -38.496192932128906, "global_step": 307342, "epoch": 2540} {"train_loss": -39.024574279785156, "global_step": 307343, "epoch": 2540} {"train_loss": -38.0797119140625, "global_step": 307344, "epoch": 2540} {"train_loss": -39.19317626953125, "global_step": 307345, "epoch": 2540} {"train_loss": -38.77873611450195, "global_step": 307346, "epoch": 2540} {"train_loss": -38.980587005615234, "global_step": 307347, "epoch": 2540} {"train_loss": -39.13328170776367, "global_step": 307348, "epoch": 2540} {"train_loss": -39.0545654296875, "global_step": 307349, "epoch": 2540} {"train_loss": -39.6009521484375, "global_step": 307350, "epoch": 2540} {"train_loss": -39.29664993286133, "global_step": 307351, "epoch": 2540} {"train_loss": -40.050148010253906, "global_step": 307352, "epoch": 2540} {"train_loss": -38.72461700439453, "global_step": 307353, "epoch": 2540} {"train_loss": -39.841365814208984, "global_step": 307354, "epoch": 2540} {"train_loss": -40.28706741333008, "global_step": 307355, "epoch": 2540} {"train_loss": -39.86433029174805, "global_step": 307356, "epoch": 2540} {"train_loss": -38.67597579956055, "global_step": 307357, "epoch": 2540} {"train_loss": -39.31892013549805, "global_step": 307358, "epoch": 2540} {"train_loss": -39.11773681640625, "global_step": 307359, "epoch": 2540} {"train_loss": -39.19061279296875, "global_step": 307360, "epoch": 2540} {"train_loss": -40.09029769897461, "global_step": 307361, "epoch": 2540} {"train_loss": -39.57265853881836, "global_step": 307362, "epoch": 2540} {"train_loss": -39.64234161376953, "global_step": 307363, "epoch": 2540} {"train_loss": -39.66561508178711, "global_step": 307364, "epoch": 2540} {"train_loss": -39.59878921508789, "global_step": 307365, "epoch": 2540} {"train_loss": -40.17241287231445, "global_step": 307366, "epoch": 2540} {"train_loss": -40.26567840576172, "global_step": 307367, "epoch": 2540} {"train_loss": -39.28800582885742, "global_step": 307368, "epoch": 2540} {"train_loss": -40.56718444824219, "global_step": 307369, "epoch": 2540} {"train_loss": -40.155879974365234, "global_step": 307370, "epoch": 2540} {"train_loss": -39.579097747802734, "global_step": 307371, "epoch": 2540} {"train_loss": -40.8689079284668, "global_step": 307372, "epoch": 2540} {"train_loss": -40.76454162597656, "global_step": 307373, "epoch": 2540} {"train_loss": -40.54244613647461, "global_step": 307374, "epoch": 2540} {"train_loss": -40.84749984741211, "global_step": 307375, "epoch": 2540} {"train_loss": -39.94244384765625, "global_step": 307376, "epoch": 2540} {"train_loss": -40.37370681762695, "global_step": 307377, "epoch": 2540} {"train_loss": -40.194759368896484, "global_step": 307378, "epoch": 2540} {"train_loss": -39.96723556518555, "global_step": 307379, "epoch": 2540} {"train_loss": -40.527584075927734, "global_step": 307380, "epoch": 2540} {"train_loss": -40.33327865600586, "global_step": 307381, "epoch": 2540} {"train_loss": -40.60221481323242, "global_step": 307382, "epoch": 2540} {"train_loss": -40.678260803222656, "global_step": 307383, "epoch": 2540} {"train_loss": -40.48657989501953, "global_step": 307384, "epoch": 2540} {"train_loss": -41.336509704589844, "global_step": 307385, "epoch": 2540} {"train_loss": -40.80562973022461, "global_step": 307386, "epoch": 2540} {"train_loss": -40.76174545288086, "global_step": 307387, "epoch": 2540} {"train_loss": -40.34524917602539, "global_step": 307388, "epoch": 2540} {"train_loss": -40.852455139160156, "global_step": 307389, "epoch": 2540} {"train_loss": -40.3437614440918, "global_step": 307390, "epoch": 2540} {"train_loss": -40.63671875, "global_step": 307391, "epoch": 2540} {"train_loss": -40.34402847290039, "global_step": 307392, "epoch": 2540} {"train_loss": -40.21837615966797, "global_step": 307393, "epoch": 2540} {"train_loss": -40.770912170410156, "global_step": 307394, "epoch": 2540} {"train_loss": -40.69063186645508, "global_step": 307395, "epoch": 2540} {"train_loss": -41.39998245239258, "global_step": 307396, "epoch": 2540} {"train_loss": -41.0739860534668, "global_step": 307397, "epoch": 2540} {"train_loss": -41.46242141723633, "global_step": 307398, "epoch": 2540} {"train_loss": -40.981597900390625, "global_step": 307399, "epoch": 2540} {"train_loss": -40.92153549194336, "global_step": 307400, "epoch": 2540} {"train_loss": -41.0587272644043, "global_step": 307401, "epoch": 2540} {"train_loss": -41.65597152709961, "global_step": 307402, "epoch": 2540} {"train_loss": -41.63624572753906, "global_step": 307403, "epoch": 2540} {"train_loss": -41.60388946533203, "global_step": 307404, "epoch": 2540} {"train_loss": -41.328609466552734, "global_step": 307405, "epoch": 2540} {"train_loss": -41.27277755737305, "global_step": 307406, "epoch": 2540} {"train_loss": -40.88154220581055, "global_step": 307407, "epoch": 2540} {"train_loss": -41.038299560546875, "global_step": 307408, "epoch": 2540} {"train_loss": -41.29381561279297, "global_step": 307409, "epoch": 2540} {"train_loss": -41.87089157104492, "global_step": 307410, "epoch": 2540} {"train_loss": -40.58271789550781, "global_step": 307411, "epoch": 2540} {"train_loss": -41.59521484375, "global_step": 307412, "epoch": 2540} {"train_loss": -42.125179290771484, "global_step": 307413, "epoch": 2540} {"train_loss": -41.62376022338867, "global_step": 307414, "epoch": 2540} {"train_loss": -41.51108932495117, "global_step": 307415, "epoch": 2540} {"train_loss": -41.52150344848633, "global_step": 307416, "epoch": 2540} {"train_loss": -41.973812103271484, "global_step": 307417, "epoch": 2540} {"train_loss": -41.523311614990234, "global_step": 307418, "epoch": 2540} {"train_loss": -41.707000732421875, "global_step": 307419, "epoch": 2540} {"train_loss": -41.73080062866211, "global_step": 307420, "epoch": 2540} {"train_loss": -42.2124137878418, "global_step": 307421, "epoch": 2540} {"train_loss": -42.009315490722656, "global_step": 307422, "epoch": 2540} {"train_loss": -41.6681022644043, "global_step": 307423, "epoch": 2540} {"train_loss": -40.92265701293945, "global_step": 307424, "epoch": 2540} {"train_loss": -41.56528854370117, "global_step": 307425, "epoch": 2540} {"train_loss": -42.07864761352539, "global_step": 307426, "epoch": 2540} {"train_loss": -41.9612922668457, "global_step": 307427, "epoch": 2540} {"train_loss": -42.093631744384766, "global_step": 307428, "epoch": 2540} {"train_loss": -41.93642044067383, "global_step": 307429, "epoch": 2540} {"train_loss": -42.09199142456055, "global_step": 307430, "epoch": 2540} {"train_loss": -41.99413299560547, "global_step": 307431, "epoch": 2540} {"train_loss": -41.47568893432617, "global_step": 307432, "epoch": 2540} {"train_loss": -42.28650665283203, "global_step": 307433, "epoch": 2540} {"train_loss": -42.17595672607422, "global_step": 307434, "epoch": 2540} {"train_loss": -41.761226654052734, "global_step": 307435, "epoch": 2540} {"train_loss": -42.189659118652344, "global_step": 307436, "epoch": 2540} {"train_loss": -42.133243560791016, "global_step": 307437, "epoch": 2540} {"train_loss": -42.3247184753418, "global_step": 307438, "epoch": 2540} {"train_loss": -42.227882385253906, "global_step": 307439, "epoch": 2540} {"train_loss": -41.800209045410156, "global_step": 307440, "epoch": 2540} {"train_loss": -41.61432647705078, "global_step": 307441, "epoch": 2540} {"train_loss": -42.69092559814453, "global_step": 307442, "epoch": 2540} {"train_loss": -42.28571319580078, "global_step": 307443, "epoch": 2540} {"train_loss": -42.41720199584961, "global_step": 307444, "epoch": 2540} {"train_loss": -41.71045684814453, "global_step": 307445, "epoch": 2540} {"train_loss": -42.32477951049805, "global_step": 307446, "epoch": 2540} {"train_loss": -42.31655502319336, "global_step": 307447, "epoch": 2540} {"train_loss": -42.38237380981445, "global_step": 307448, "epoch": 2540} {"train_loss": -41.97461700439453, "global_step": 307449, "epoch": 2540} {"train_loss": -41.92019271850586, "global_step": 307450, "epoch": 2540} {"train_loss": -42.022857666015625, "global_step": 307451, "epoch": 2540} {"train_loss": -41.8983268737793, "global_step": 307452, "epoch": 2540} {"train_loss": -41.72450637817383, "global_step": 307453, "epoch": 2540} {"train_loss": -41.35660171508789, "global_step": 307454, "epoch": 2540} {"train_loss": -41.6386833190918, "global_step": 307455, "epoch": 2540} {"train_loss": -41.621028900146484, "global_step": 307456, "epoch": 2540} {"train_loss": -41.773677825927734, "global_step": 307457, "epoch": 2540} {"train_loss": -41.778472900390625, "global_step": 307458, "epoch": 2540} {"train_loss": -40.21044921875, "global_step": 307459, "epoch": 2540} {"train_loss": -40.88307123735917, "global_step": 307460, "epoch": 2540, "val_loss": 2709394.5} {"train_loss": -40.56850051879883, "global_step": 307461, "epoch": 2541} {"train_loss": -40.363765716552734, "global_step": 307462, "epoch": 2541} {"train_loss": -40.2470588684082, "global_step": 307463, "epoch": 2541} {"train_loss": -40.00442123413086, "global_step": 307464, "epoch": 2541} {"train_loss": -40.053924560546875, "global_step": 307465, "epoch": 2541} {"train_loss": -39.089599609375, "global_step": 307466, "epoch": 2541} {"train_loss": -39.4632453918457, "global_step": 307467, "epoch": 2541} {"train_loss": -41.5778694152832, "global_step": 307468, "epoch": 2541} {"train_loss": -38.5113639831543, "global_step": 307469, "epoch": 2541} {"train_loss": -41.511505126953125, "global_step": 307470, "epoch": 2541} {"train_loss": -40.521827697753906, "global_step": 307471, "epoch": 2541} {"train_loss": -38.4336051940918, "global_step": 307472, "epoch": 2541} {"train_loss": -38.62245559692383, "global_step": 307473, "epoch": 2541} {"train_loss": -39.21479797363281, "global_step": 307474, "epoch": 2541} {"train_loss": -41.18679428100586, "global_step": 307475, "epoch": 2541} {"train_loss": -40.11857604980469, "global_step": 307476, "epoch": 2541} {"train_loss": -36.05691146850586, "global_step": 307477, "epoch": 2541} {"train_loss": -40.87010955810547, "global_step": 307478, "epoch": 2541} {"train_loss": -40.43922805786133, "global_step": 307479, "epoch": 2541} {"train_loss": -37.7048454284668, "global_step": 307480, "epoch": 2541} {"train_loss": -38.350486755371094, "global_step": 307481, "epoch": 2541} {"train_loss": -40.57474899291992, "global_step": 307482, "epoch": 2541} {"train_loss": -40.03654098510742, "global_step": 307483, "epoch": 2541} {"train_loss": -39.50531768798828, "global_step": 307484, "epoch": 2541} {"train_loss": -41.23093795776367, "global_step": 307485, "epoch": 2541} {"train_loss": -40.79130172729492, "global_step": 307486, "epoch": 2541} {"train_loss": -39.92832565307617, "global_step": 307487, "epoch": 2541} {"train_loss": -40.18303298950195, "global_step": 307488, "epoch": 2541} {"train_loss": -40.595027923583984, "global_step": 307489, "epoch": 2541} {"train_loss": -41.57721710205078, "global_step": 307490, "epoch": 2541} {"train_loss": -39.44973373413086, "global_step": 307491, "epoch": 2541} {"train_loss": -41.4021110534668, "global_step": 307492, "epoch": 2541} {"train_loss": -38.7124137878418, "global_step": 307493, "epoch": 2541} {"train_loss": -40.78578567504883, "global_step": 307494, "epoch": 2541} {"train_loss": -39.616546630859375, "global_step": 307495, "epoch": 2541} {"train_loss": -40.8678092956543, "global_step": 307496, "epoch": 2541} {"train_loss": -39.08122634887695, "global_step": 307497, "epoch": 2541} {"train_loss": -40.6081657409668, "global_step": 307498, "epoch": 2541} {"train_loss": -40.896846771240234, "global_step": 307499, "epoch": 2541} {"train_loss": -40.769962310791016, "global_step": 307500, "epoch": 2541} {"train_loss": -40.83546829223633, "global_step": 307501, "epoch": 2541} {"train_loss": -38.87046432495117, "global_step": 307502, "epoch": 2541} {"train_loss": -41.72344207763672, "global_step": 307503, "epoch": 2541} {"train_loss": -40.69417953491211, "global_step": 307504, "epoch": 2541} {"train_loss": -40.124000549316406, "global_step": 307505, "epoch": 2541} {"train_loss": -41.95737838745117, "global_step": 307506, "epoch": 2541} {"train_loss": -40.65406036376953, "global_step": 307507, "epoch": 2541} {"train_loss": -41.32633590698242, "global_step": 307508, "epoch": 2541} {"train_loss": -40.89815902709961, "global_step": 307509, "epoch": 2541} {"train_loss": -40.55296325683594, "global_step": 307510, "epoch": 2541} {"train_loss": -42.55178451538086, "global_step": 307511, "epoch": 2541} {"train_loss": -40.62314224243164, "global_step": 307512, "epoch": 2541} {"train_loss": -40.70664596557617, "global_step": 307513, "epoch": 2541} {"train_loss": -41.44999694824219, "global_step": 307514, "epoch": 2541} {"train_loss": -41.195762634277344, "global_step": 307515, "epoch": 2541} {"train_loss": -41.9268798828125, "global_step": 307516, "epoch": 2541} {"train_loss": -41.581050872802734, "global_step": 307517, "epoch": 2541} {"train_loss": -41.70650863647461, "global_step": 307518, "epoch": 2541} {"train_loss": -42.43483352661133, "global_step": 307519, "epoch": 2541} {"train_loss": -41.30729293823242, "global_step": 307520, "epoch": 2541} {"train_loss": -41.242591857910156, "global_step": 307521, "epoch": 2541} {"train_loss": -42.10791778564453, "global_step": 307522, "epoch": 2541} {"train_loss": -41.76960372924805, "global_step": 307523, "epoch": 2541} {"train_loss": -42.341915130615234, "global_step": 307524, "epoch": 2541} {"train_loss": -42.55095291137695, "global_step": 307525, "epoch": 2541} {"train_loss": -41.71603012084961, "global_step": 307526, "epoch": 2541} {"train_loss": -42.330345153808594, "global_step": 307527, "epoch": 2541} {"train_loss": -42.62795639038086, "global_step": 307528, "epoch": 2541} {"train_loss": -41.73532485961914, "global_step": 307529, "epoch": 2541} {"train_loss": -42.5340576171875, "global_step": 307530, "epoch": 2541} {"train_loss": -42.30891036987305, "global_step": 307531, "epoch": 2541} {"train_loss": -42.203163146972656, "global_step": 307532, "epoch": 2541} {"train_loss": -42.65863037109375, "global_step": 307533, "epoch": 2541} {"train_loss": -42.06748580932617, "global_step": 307534, "epoch": 2541} {"train_loss": -42.55772018432617, "global_step": 307535, "epoch": 2541} {"train_loss": -42.3606071472168, "global_step": 307536, "epoch": 2541} {"train_loss": -42.42085647583008, "global_step": 307537, "epoch": 2541} {"train_loss": -42.53173828125, "global_step": 307538, "epoch": 2541} {"train_loss": -42.05268859863281, "global_step": 307539, "epoch": 2541} {"train_loss": -42.573699951171875, "global_step": 307540, "epoch": 2541} {"train_loss": -42.363250732421875, "global_step": 307541, "epoch": 2541} {"train_loss": -42.6030158996582, "global_step": 307542, "epoch": 2541} {"train_loss": -42.72744369506836, "global_step": 307543, "epoch": 2541} {"train_loss": -42.2962760925293, "global_step": 307544, "epoch": 2541} {"train_loss": -42.810028076171875, "global_step": 307545, "epoch": 2541} {"train_loss": -42.83039855957031, "global_step": 307546, "epoch": 2541} {"train_loss": -42.123104095458984, "global_step": 307547, "epoch": 2541} {"train_loss": -42.540523529052734, "global_step": 307548, "epoch": 2541} {"train_loss": -42.27164077758789, "global_step": 307549, "epoch": 2541} {"train_loss": -42.412776947021484, "global_step": 307550, "epoch": 2541} {"train_loss": -42.4343376159668, "global_step": 307551, "epoch": 2541} {"train_loss": -42.85163497924805, "global_step": 307552, "epoch": 2541} {"train_loss": -43.175899505615234, "global_step": 307553, "epoch": 2541} {"train_loss": -42.71721267700195, "global_step": 307554, "epoch": 2541} {"train_loss": -42.324398040771484, "global_step": 307555, "epoch": 2541} {"train_loss": -43.255184173583984, "global_step": 307556, "epoch": 2541} {"train_loss": -42.92959213256836, "global_step": 307557, "epoch": 2541} {"train_loss": -42.6839599609375, "global_step": 307558, "epoch": 2541} {"train_loss": -43.278133392333984, "global_step": 307559, "epoch": 2541} {"train_loss": -42.61061477661133, "global_step": 307560, "epoch": 2541} {"train_loss": -42.31820297241211, "global_step": 307561, "epoch": 2541} {"train_loss": -42.958251953125, "global_step": 307562, "epoch": 2541} {"train_loss": -43.228668212890625, "global_step": 307563, "epoch": 2541} {"train_loss": -42.71637725830078, "global_step": 307564, "epoch": 2541} {"train_loss": -43.266117095947266, "global_step": 307565, "epoch": 2541} {"train_loss": -43.10660171508789, "global_step": 307566, "epoch": 2541} {"train_loss": -42.9959831237793, "global_step": 307567, "epoch": 2541} {"train_loss": -43.12099075317383, "global_step": 307568, "epoch": 2541} {"train_loss": -43.21224594116211, "global_step": 307569, "epoch": 2541} {"train_loss": -42.584312438964844, "global_step": 307570, "epoch": 2541} {"train_loss": -42.92611312866211, "global_step": 307571, "epoch": 2541} {"train_loss": -42.82700729370117, "global_step": 307572, "epoch": 2541} {"train_loss": -42.82920837402344, "global_step": 307573, "epoch": 2541} {"train_loss": -43.06221008300781, "global_step": 307574, "epoch": 2541} {"train_loss": -42.113216400146484, "global_step": 307575, "epoch": 2541} {"train_loss": -42.78682327270508, "global_step": 307576, "epoch": 2541} {"train_loss": -43.24843215942383, "global_step": 307577, "epoch": 2541} {"train_loss": -42.86246871948242, "global_step": 307578, "epoch": 2541} {"train_loss": -42.60466003417969, "global_step": 307579, "epoch": 2541} {"train_loss": -43.3421630859375, "global_step": 307580, "epoch": 2541} {"train_loss": -41.505331055191924, "global_step": 307581, "epoch": 2541, "val_loss": 2623900.25} {"train_loss": -43.25756072998047, "global_step": 307582, "epoch": 2542} {"train_loss": -43.549781799316406, "global_step": 307583, "epoch": 2542} {"train_loss": -42.90305709838867, "global_step": 307584, "epoch": 2542} {"train_loss": -43.302181243896484, "global_step": 307585, "epoch": 2542} {"train_loss": -42.397640228271484, "global_step": 307586, "epoch": 2542} {"train_loss": -43.43671798706055, "global_step": 307587, "epoch": 2542} {"train_loss": -42.53596878051758, "global_step": 307588, "epoch": 2542} {"train_loss": -42.74107360839844, "global_step": 307589, "epoch": 2542} {"train_loss": -42.46476364135742, "global_step": 307590, "epoch": 2542} {"train_loss": -41.979644775390625, "global_step": 307591, "epoch": 2542} {"train_loss": -42.615699768066406, "global_step": 307592, "epoch": 2542} {"train_loss": -42.634857177734375, "global_step": 307593, "epoch": 2542} {"train_loss": -42.33039093017578, "global_step": 307594, "epoch": 2542} {"train_loss": -41.34952926635742, "global_step": 307595, "epoch": 2542} {"train_loss": -42.16904830932617, "global_step": 307596, "epoch": 2542} {"train_loss": -43.21802520751953, "global_step": 307597, "epoch": 2542} {"train_loss": -42.67958450317383, "global_step": 307598, "epoch": 2542} {"train_loss": -42.374332427978516, "global_step": 307599, "epoch": 2542} {"train_loss": -42.54598617553711, "global_step": 307600, "epoch": 2542} {"train_loss": -42.9501838684082, "global_step": 307601, "epoch": 2542} {"train_loss": -42.61733627319336, "global_step": 307602, "epoch": 2542} {"train_loss": -42.46697998046875, "global_step": 307603, "epoch": 2542} {"train_loss": -42.401790618896484, "global_step": 307604, "epoch": 2542} {"train_loss": -43.501861572265625, "global_step": 307605, "epoch": 2542} {"train_loss": -43.056331634521484, "global_step": 307606, "epoch": 2542} {"train_loss": -42.928123474121094, "global_step": 307607, "epoch": 2542} {"train_loss": -43.69929122924805, "global_step": 307608, "epoch": 2542} {"train_loss": -43.25962448120117, "global_step": 307609, "epoch": 2542} {"train_loss": -43.66346740722656, "global_step": 307610, "epoch": 2542} {"train_loss": -43.325565338134766, "global_step": 307611, "epoch": 2542} {"train_loss": -43.10343551635742, "global_step": 307612, "epoch": 2542} {"train_loss": -42.50120162963867, "global_step": 307613, "epoch": 2542} {"train_loss": -41.52335739135742, "global_step": 307614, "epoch": 2542} {"train_loss": -42.73731231689453, "global_step": 307615, "epoch": 2542} {"train_loss": -42.21564865112305, "global_step": 307616, "epoch": 2542} {"train_loss": -43.00739288330078, "global_step": 307617, "epoch": 2542} {"train_loss": -43.121620178222656, "global_step": 307618, "epoch": 2542} {"train_loss": -43.446563720703125, "global_step": 307619, "epoch": 2542} {"train_loss": -43.20249557495117, "global_step": 307620, "epoch": 2542} {"train_loss": -42.97251510620117, "global_step": 307621, "epoch": 2542} {"train_loss": -43.4100227355957, "global_step": 307622, "epoch": 2542} {"train_loss": -42.9066162109375, "global_step": 307623, "epoch": 2542} {"train_loss": -42.862911224365234, "global_step": 307624, "epoch": 2542} {"train_loss": -43.080440521240234, "global_step": 307625, "epoch": 2542} {"train_loss": -43.199031829833984, "global_step": 307626, "epoch": 2542} {"train_loss": -42.763458251953125, "global_step": 307627, "epoch": 2542} {"train_loss": -41.353271484375, "global_step": 307628, "epoch": 2542} {"train_loss": -41.16901779174805, "global_step": 307629, "epoch": 2542} {"train_loss": -42.53021240234375, "global_step": 307630, "epoch": 2542} {"train_loss": -41.80549240112305, "global_step": 307631, "epoch": 2542} {"train_loss": -36.628143310546875, "global_step": 307632, "epoch": 2542} {"train_loss": -39.2708625793457, "global_step": 307633, "epoch": 2542} {"train_loss": -38.305294036865234, "global_step": 307634, "epoch": 2542} {"train_loss": -42.70002365112305, "global_step": 307635, "epoch": 2542} {"train_loss": -39.818965911865234, "global_step": 307636, "epoch": 2542} {"train_loss": -38.71285629272461, "global_step": 307637, "epoch": 2542} {"train_loss": -38.82746505737305, "global_step": 307638, "epoch": 2542} {"train_loss": -39.518680572509766, "global_step": 307639, "epoch": 2542} {"train_loss": -40.76188278198242, "global_step": 307640, "epoch": 2542} {"train_loss": -41.6652946472168, "global_step": 307641, "epoch": 2542} {"train_loss": -40.8703727722168, "global_step": 307642, "epoch": 2542} {"train_loss": -40.802852630615234, "global_step": 307643, "epoch": 2542} {"train_loss": -41.132381439208984, "global_step": 307644, "epoch": 2542} {"train_loss": -41.90871810913086, "global_step": 307645, "epoch": 2542} {"train_loss": -41.12041473388672, "global_step": 307646, "epoch": 2542} {"train_loss": -41.95361328125, "global_step": 307647, "epoch": 2542} {"train_loss": -39.87802505493164, "global_step": 307648, "epoch": 2542} {"train_loss": -42.71261978149414, "global_step": 307649, "epoch": 2542} {"train_loss": -41.232200622558594, "global_step": 307650, "epoch": 2542} {"train_loss": -41.2046012878418, "global_step": 307651, "epoch": 2542} {"train_loss": -41.67355728149414, "global_step": 307652, "epoch": 2542} {"train_loss": -42.188720703125, "global_step": 307653, "epoch": 2542} {"train_loss": -42.28608322143555, "global_step": 307654, "epoch": 2542} {"train_loss": -42.31337356567383, "global_step": 307655, "epoch": 2542} {"train_loss": -41.843849182128906, "global_step": 307656, "epoch": 2542} {"train_loss": -41.08338165283203, "global_step": 307657, "epoch": 2542} {"train_loss": -42.2470817565918, "global_step": 307658, "epoch": 2542} {"train_loss": -42.5059928894043, "global_step": 307659, "epoch": 2542} {"train_loss": -41.538330078125, "global_step": 307660, "epoch": 2542} {"train_loss": -43.04878616333008, "global_step": 307661, "epoch": 2542} {"train_loss": -42.313655853271484, "global_step": 307662, "epoch": 2542} {"train_loss": -42.70302963256836, "global_step": 307663, "epoch": 2542} {"train_loss": -42.67028045654297, "global_step": 307664, "epoch": 2542} {"train_loss": -42.74569320678711, "global_step": 307665, "epoch": 2542} {"train_loss": -41.900787353515625, "global_step": 307666, "epoch": 2542} {"train_loss": -42.735774993896484, "global_step": 307667, "epoch": 2542} {"train_loss": -42.4683837890625, "global_step": 307668, "epoch": 2542} {"train_loss": -41.06257247924805, "global_step": 307669, "epoch": 2542} {"train_loss": -43.258338928222656, "global_step": 307670, "epoch": 2542} {"train_loss": -42.90560531616211, "global_step": 307671, "epoch": 2542} {"train_loss": -43.030784606933594, "global_step": 307672, "epoch": 2542} {"train_loss": -43.315731048583984, "global_step": 307673, "epoch": 2542} {"train_loss": -43.223628997802734, "global_step": 307674, "epoch": 2542} {"train_loss": -42.9876594543457, "global_step": 307675, "epoch": 2542} {"train_loss": -42.7105712890625, "global_step": 307676, "epoch": 2542} {"train_loss": -43.72469711303711, "global_step": 307677, "epoch": 2542} {"train_loss": -43.34918975830078, "global_step": 307678, "epoch": 2542} {"train_loss": -43.30268096923828, "global_step": 307679, "epoch": 2542} {"train_loss": -43.271968841552734, "global_step": 307680, "epoch": 2542} {"train_loss": -42.76223373413086, "global_step": 307681, "epoch": 2542} {"train_loss": -43.928367614746094, "global_step": 307682, "epoch": 2542} {"train_loss": -43.019248962402344, "global_step": 307683, "epoch": 2542} {"train_loss": -43.282997131347656, "global_step": 307684, "epoch": 2542} {"train_loss": -43.316673278808594, "global_step": 307685, "epoch": 2542} {"train_loss": -43.905433654785156, "global_step": 307686, "epoch": 2542} {"train_loss": -43.214595794677734, "global_step": 307687, "epoch": 2542} {"train_loss": -44.395198822021484, "global_step": 307688, "epoch": 2542} {"train_loss": -43.02268981933594, "global_step": 307689, "epoch": 2542} {"train_loss": -43.28956985473633, "global_step": 307690, "epoch": 2542} {"train_loss": -42.99563980102539, "global_step": 307691, "epoch": 2542} {"train_loss": -43.36227798461914, "global_step": 307692, "epoch": 2542} {"train_loss": -43.430171966552734, "global_step": 307693, "epoch": 2542} {"train_loss": -43.07673263549805, "global_step": 307694, "epoch": 2542} {"train_loss": -43.71086502075195, "global_step": 307695, "epoch": 2542} {"train_loss": -43.40178298950195, "global_step": 307696, "epoch": 2542} {"train_loss": -43.25532531738281, "global_step": 307697, "epoch": 2542} {"train_loss": -43.57960891723633, "global_step": 307698, "epoch": 2542} {"train_loss": -43.84120559692383, "global_step": 307699, "epoch": 2542} {"train_loss": -43.7439079284668, "global_step": 307700, "epoch": 2542} {"train_loss": -43.770626068115234, "global_step": 307701, "epoch": 2542} {"train_loss": -42.45107742183465, "global_step": 307702, "epoch": 2542, "val_loss": 2706014.0} {"train_loss": -43.90507888793945, "global_step": 307703, "epoch": 2543} {"train_loss": -43.64974594116211, "global_step": 307704, "epoch": 2543} {"train_loss": -44.245147705078125, "global_step": 307705, "epoch": 2543} {"train_loss": -43.5076789855957, "global_step": 307706, "epoch": 2543} {"train_loss": -43.32249450683594, "global_step": 307707, "epoch": 2543} {"train_loss": -43.63119125366211, "global_step": 307708, "epoch": 2543} {"train_loss": -43.1641960144043, "global_step": 307709, "epoch": 2543} {"train_loss": -43.59004592895508, "global_step": 307710, "epoch": 2543} {"train_loss": -42.05010223388672, "global_step": 307711, "epoch": 2543} {"train_loss": -39.14406204223633, "global_step": 307712, "epoch": 2543} {"train_loss": -34.768402099609375, "global_step": 307713, "epoch": 2543} {"train_loss": -23.08125877380371, "global_step": 307714, "epoch": 2543} {"train_loss": -21.307209014892578, "global_step": 307715, "epoch": 2543} {"train_loss": -37.03491973876953, "global_step": 307716, "epoch": 2543} {"train_loss": -39.1478271484375, "global_step": 307717, "epoch": 2543} {"train_loss": -31.9476318359375, "global_step": 307718, "epoch": 2543} {"train_loss": -39.41392135620117, "global_step": 307719, "epoch": 2543} {"train_loss": -32.53030014038086, "global_step": 307720, "epoch": 2543} {"train_loss": -36.76656723022461, "global_step": 307721, "epoch": 2543} {"train_loss": -38.12245178222656, "global_step": 307722, "epoch": 2543} {"train_loss": -38.02777862548828, "global_step": 307723, "epoch": 2543} {"train_loss": -35.53239059448242, "global_step": 307724, "epoch": 2543} {"train_loss": -38.47148513793945, "global_step": 307725, "epoch": 2543} {"train_loss": -37.23545455932617, "global_step": 307726, "epoch": 2543} {"train_loss": -40.32228469848633, "global_step": 307727, "epoch": 2543} {"train_loss": -36.573726654052734, "global_step": 307728, "epoch": 2543} {"train_loss": -40.66829299926758, "global_step": 307729, "epoch": 2543} {"train_loss": -37.981468200683594, "global_step": 307730, "epoch": 2543} {"train_loss": -41.48827362060547, "global_step": 307731, "epoch": 2543} {"train_loss": -38.715450286865234, "global_step": 307732, "epoch": 2543} {"train_loss": -41.546791076660156, "global_step": 307733, "epoch": 2543} {"train_loss": -40.35548782348633, "global_step": 307734, "epoch": 2543} {"train_loss": -40.194190979003906, "global_step": 307735, "epoch": 2543} {"train_loss": -41.532894134521484, "global_step": 307736, "epoch": 2543} {"train_loss": -40.17779541015625, "global_step": 307737, "epoch": 2543} {"train_loss": -40.06243133544922, "global_step": 307738, "epoch": 2543} {"train_loss": -41.840633392333984, "global_step": 307739, "epoch": 2543} {"train_loss": -40.13493728637695, "global_step": 307740, "epoch": 2543} {"train_loss": -41.53416061401367, "global_step": 307741, "epoch": 2543} {"train_loss": -41.672096252441406, "global_step": 307742, "epoch": 2543} {"train_loss": -41.04697799682617, "global_step": 307743, "epoch": 2543} {"train_loss": -41.689666748046875, "global_step": 307744, "epoch": 2543} {"train_loss": -41.09992980957031, "global_step": 307745, "epoch": 2543} {"train_loss": -41.77840042114258, "global_step": 307746, "epoch": 2543} {"train_loss": -42.0089111328125, "global_step": 307747, "epoch": 2543} {"train_loss": -42.12350845336914, "global_step": 307748, "epoch": 2543} {"train_loss": -41.88712692260742, "global_step": 307749, "epoch": 2543} {"train_loss": -40.913570404052734, "global_step": 307750, "epoch": 2543} {"train_loss": -41.108516693115234, "global_step": 307751, "epoch": 2543} {"train_loss": -41.796382904052734, "global_step": 307752, "epoch": 2543} {"train_loss": -41.89100646972656, "global_step": 307753, "epoch": 2543} {"train_loss": -41.13153076171875, "global_step": 307754, "epoch": 2543} {"train_loss": -42.88228225708008, "global_step": 307755, "epoch": 2543} {"train_loss": -42.36013412475586, "global_step": 307756, "epoch": 2543} {"train_loss": -42.50551986694336, "global_step": 307757, "epoch": 2543} {"train_loss": -42.22123336791992, "global_step": 307758, "epoch": 2543} {"train_loss": -41.7750129699707, "global_step": 307759, "epoch": 2543} {"train_loss": -42.3831787109375, "global_step": 307760, "epoch": 2543} {"train_loss": -42.1618537902832, "global_step": 307761, "epoch": 2543} {"train_loss": -42.364723205566406, "global_step": 307762, "epoch": 2543} {"train_loss": -42.427833557128906, "global_step": 307763, "epoch": 2543} {"train_loss": -42.482357025146484, "global_step": 307764, "epoch": 2543} {"train_loss": -42.795387268066406, "global_step": 307765, "epoch": 2543} {"train_loss": -42.76735305786133, "global_step": 307766, "epoch": 2543} {"train_loss": -42.61220932006836, "global_step": 307767, "epoch": 2543} {"train_loss": -42.7066764831543, "global_step": 307768, "epoch": 2543} {"train_loss": -42.49235153198242, "global_step": 307769, "epoch": 2543} {"train_loss": -43.28303146362305, "global_step": 307770, "epoch": 2543} {"train_loss": -43.110801696777344, "global_step": 307771, "epoch": 2543} {"train_loss": -42.57425308227539, "global_step": 307772, "epoch": 2543} {"train_loss": -42.337432861328125, "global_step": 307773, "epoch": 2543} {"train_loss": -42.170867919921875, "global_step": 307774, "epoch": 2543} {"train_loss": -43.027748107910156, "global_step": 307775, "epoch": 2543} {"train_loss": -43.53639221191406, "global_step": 307776, "epoch": 2543} {"train_loss": -42.81654357910156, "global_step": 307777, "epoch": 2543} {"train_loss": -43.326290130615234, "global_step": 307778, "epoch": 2543} {"train_loss": -43.15239715576172, "global_step": 307779, "epoch": 2543} {"train_loss": -42.25606918334961, "global_step": 307780, "epoch": 2543} {"train_loss": -40.559722900390625, "global_step": 307781, "epoch": 2543} {"train_loss": -42.894020080566406, "global_step": 307782, "epoch": 2543} {"train_loss": -43.381591796875, "global_step": 307783, "epoch": 2543} {"train_loss": -42.79226303100586, "global_step": 307784, "epoch": 2543} {"train_loss": -42.161415100097656, "global_step": 307785, "epoch": 2543} {"train_loss": -43.52390670776367, "global_step": 307786, "epoch": 2543} {"train_loss": -43.48163986206055, "global_step": 307787, "epoch": 2543} {"train_loss": -40.374088287353516, "global_step": 307788, "epoch": 2543} {"train_loss": -43.55162811279297, "global_step": 307789, "epoch": 2543} {"train_loss": -43.36274719238281, "global_step": 307790, "epoch": 2543} {"train_loss": -43.316768646240234, "global_step": 307791, "epoch": 2543} {"train_loss": -43.05344772338867, "global_step": 307792, "epoch": 2543} {"train_loss": -42.37729263305664, "global_step": 307793, "epoch": 2543} {"train_loss": -43.06010818481445, "global_step": 307794, "epoch": 2543} {"train_loss": -43.273216247558594, "global_step": 307795, "epoch": 2543} {"train_loss": -43.26182174682617, "global_step": 307796, "epoch": 2543} {"train_loss": -43.510345458984375, "global_step": 307797, "epoch": 2543} {"train_loss": -43.44718551635742, "global_step": 307798, "epoch": 2543} {"train_loss": -43.89951705932617, "global_step": 307799, "epoch": 2543} {"train_loss": -44.051612854003906, "global_step": 307800, "epoch": 2543} {"train_loss": -43.926536560058594, "global_step": 307801, "epoch": 2543} {"train_loss": -43.690673828125, "global_step": 307802, "epoch": 2543} {"train_loss": -43.327327728271484, "global_step": 307803, "epoch": 2543} {"train_loss": -43.26559066772461, "global_step": 307804, "epoch": 2543} {"train_loss": -43.276214599609375, "global_step": 307805, "epoch": 2543} {"train_loss": -43.866519927978516, "global_step": 307806, "epoch": 2543} {"train_loss": -43.878173828125, "global_step": 307807, "epoch": 2543} {"train_loss": -43.751808166503906, "global_step": 307808, "epoch": 2543} {"train_loss": -43.9600830078125, "global_step": 307809, "epoch": 2543} {"train_loss": -43.687660217285156, "global_step": 307810, "epoch": 2543} {"train_loss": -43.082393646240234, "global_step": 307811, "epoch": 2543} {"train_loss": -43.99761199951172, "global_step": 307812, "epoch": 2543} {"train_loss": -43.68537521362305, "global_step": 307813, "epoch": 2543} {"train_loss": -43.58767318725586, "global_step": 307814, "epoch": 2543} {"train_loss": -43.230037689208984, "global_step": 307815, "epoch": 2543} {"train_loss": -44.13737106323242, "global_step": 307816, "epoch": 2543} {"train_loss": -42.00105667114258, "global_step": 307817, "epoch": 2543} {"train_loss": -44.33667755126953, "global_step": 307818, "epoch": 2543} {"train_loss": -43.72309494018555, "global_step": 307819, "epoch": 2543} {"train_loss": -43.550594329833984, "global_step": 307820, "epoch": 2543} {"train_loss": -43.6229248046875, "global_step": 307821, "epoch": 2543} {"train_loss": -43.88246154785156, "global_step": 307822, "epoch": 2543} {"train_loss": -41.554527802900836, "global_step": 307823, "epoch": 2543, "val_loss": 2693783.25} {"train_loss": -44.42601776123047, "global_step": 307824, "epoch": 2544} {"train_loss": -44.0695686340332, "global_step": 307825, "epoch": 2544} {"train_loss": -43.98772048950195, "global_step": 307826, "epoch": 2544} {"train_loss": -42.98631286621094, "global_step": 307827, "epoch": 2544} {"train_loss": -44.064083099365234, "global_step": 307828, "epoch": 2544} {"train_loss": -43.258235931396484, "global_step": 307829, "epoch": 2544} {"train_loss": -43.59392166137695, "global_step": 307830, "epoch": 2544} {"train_loss": -43.738441467285156, "global_step": 307831, "epoch": 2544} {"train_loss": -43.14370346069336, "global_step": 307832, "epoch": 2544} {"train_loss": -43.520751953125, "global_step": 307833, "epoch": 2544} {"train_loss": -43.92123031616211, "global_step": 307834, "epoch": 2544} {"train_loss": -43.87722396850586, "global_step": 307835, "epoch": 2544} {"train_loss": -42.90780258178711, "global_step": 307836, "epoch": 2544} {"train_loss": -41.60207748413086, "global_step": 307837, "epoch": 2544} {"train_loss": -42.255794525146484, "global_step": 307838, "epoch": 2544} {"train_loss": -42.78540802001953, "global_step": 307839, "epoch": 2544} {"train_loss": -39.809322357177734, "global_step": 307840, "epoch": 2544} {"train_loss": -42.92138671875, "global_step": 307841, "epoch": 2544} {"train_loss": -43.3713493347168, "global_step": 307842, "epoch": 2544} {"train_loss": -41.56812286376953, "global_step": 307843, "epoch": 2544} {"train_loss": -42.718326568603516, "global_step": 307844, "epoch": 2544} {"train_loss": -43.559085845947266, "global_step": 307845, "epoch": 2544} {"train_loss": -42.895843505859375, "global_step": 307846, "epoch": 2544} {"train_loss": -42.84530258178711, "global_step": 307847, "epoch": 2544} {"train_loss": -43.816680908203125, "global_step": 307848, "epoch": 2544} {"train_loss": -40.84017562866211, "global_step": 307849, "epoch": 2544} {"train_loss": -43.36908721923828, "global_step": 307850, "epoch": 2544} {"train_loss": -43.0675048828125, "global_step": 307851, "epoch": 2544} {"train_loss": -43.058990478515625, "global_step": 307852, "epoch": 2544} {"train_loss": -40.57362747192383, "global_step": 307853, "epoch": 2544} {"train_loss": -41.72182083129883, "global_step": 307854, "epoch": 2544} {"train_loss": -39.54832077026367, "global_step": 307855, "epoch": 2544} {"train_loss": -38.73487091064453, "global_step": 307856, "epoch": 2544} {"train_loss": -42.79962158203125, "global_step": 307857, "epoch": 2544} {"train_loss": -38.21492385864258, "global_step": 307858, "epoch": 2544} {"train_loss": -40.588775634765625, "global_step": 307859, "epoch": 2544} {"train_loss": -40.81340026855469, "global_step": 307860, "epoch": 2544} {"train_loss": -42.20364761352539, "global_step": 307861, "epoch": 2544} {"train_loss": -42.57182693481445, "global_step": 307862, "epoch": 2544} {"train_loss": -41.791481018066406, "global_step": 307863, "epoch": 2544} {"train_loss": -24.82106590270996, "global_step": 307864, "epoch": 2544} {"train_loss": -37.262474060058594, "global_step": 307865, "epoch": 2544} {"train_loss": -33.664344787597656, "global_step": 307866, "epoch": 2544} {"train_loss": -36.7154426574707, "global_step": 307867, "epoch": 2544} {"train_loss": -37.85744094848633, "global_step": 307868, "epoch": 2544} {"train_loss": -32.761009216308594, "global_step": 307869, "epoch": 2544} {"train_loss": -33.07949447631836, "global_step": 307870, "epoch": 2544} {"train_loss": -38.32334518432617, "global_step": 307871, "epoch": 2544} {"train_loss": -35.68075942993164, "global_step": 307872, "epoch": 2544} {"train_loss": -34.724735260009766, "global_step": 307873, "epoch": 2544} {"train_loss": -37.95180130004883, "global_step": 307874, "epoch": 2544} {"train_loss": -35.7985725402832, "global_step": 307875, "epoch": 2544} {"train_loss": -38.15693283081055, "global_step": 307876, "epoch": 2544} {"train_loss": -21.874652862548828, "global_step": 307877, "epoch": 2544} {"train_loss": -30.80548095703125, "global_step": 307878, "epoch": 2544} {"train_loss": -31.06709861755371, "global_step": 307879, "epoch": 2544} {"train_loss": -37.46793746948242, "global_step": 307880, "epoch": 2544} {"train_loss": -36.8113899230957, "global_step": 307881, "epoch": 2544} {"train_loss": -30.207015991210938, "global_step": 307882, "epoch": 2544} {"train_loss": -37.99919891357422, "global_step": 307883, "epoch": 2544} {"train_loss": -34.271087646484375, "global_step": 307884, "epoch": 2544} {"train_loss": -35.49513626098633, "global_step": 307885, "epoch": 2544} {"train_loss": -37.04810333251953, "global_step": 307886, "epoch": 2544} {"train_loss": -35.79989242553711, "global_step": 307887, "epoch": 2544} {"train_loss": -36.66435623168945, "global_step": 307888, "epoch": 2544} {"train_loss": -37.56565475463867, "global_step": 307889, "epoch": 2544} {"train_loss": -33.82201385498047, "global_step": 307890, "epoch": 2544} {"train_loss": -38.30569839477539, "global_step": 307891, "epoch": 2544} {"train_loss": -39.196903228759766, "global_step": 307892, "epoch": 2544} {"train_loss": -37.65007019042969, "global_step": 307893, "epoch": 2544} {"train_loss": -40.252418518066406, "global_step": 307894, "epoch": 2544} {"train_loss": -37.7053337097168, "global_step": 307895, "epoch": 2544} {"train_loss": -38.68239974975586, "global_step": 307896, "epoch": 2544} {"train_loss": -39.704200744628906, "global_step": 307897, "epoch": 2544} {"train_loss": -38.85029220581055, "global_step": 307898, "epoch": 2544} {"train_loss": -39.892250061035156, "global_step": 307899, "epoch": 2544} {"train_loss": -39.65315628051758, "global_step": 307900, "epoch": 2544} {"train_loss": -39.689491271972656, "global_step": 307901, "epoch": 2544} {"train_loss": -39.71799850463867, "global_step": 307902, "epoch": 2544} {"train_loss": -39.579376220703125, "global_step": 307903, "epoch": 2544} {"train_loss": -40.719966888427734, "global_step": 307904, "epoch": 2544} {"train_loss": -38.95754623413086, "global_step": 307905, "epoch": 2544} {"train_loss": -40.6645622253418, "global_step": 307906, "epoch": 2544} {"train_loss": -40.604888916015625, "global_step": 307907, "epoch": 2544} {"train_loss": -40.139427185058594, "global_step": 307908, "epoch": 2544} {"train_loss": -38.7930908203125, "global_step": 307909, "epoch": 2544} {"train_loss": -40.406761169433594, "global_step": 307910, "epoch": 2544} {"train_loss": -38.765785217285156, "global_step": 307911, "epoch": 2544} {"train_loss": -40.636329650878906, "global_step": 307912, "epoch": 2544} {"train_loss": -40.36553192138672, "global_step": 307913, "epoch": 2544} {"train_loss": -39.7262077331543, "global_step": 307914, "epoch": 2544} {"train_loss": -40.38410568237305, "global_step": 307915, "epoch": 2544} {"train_loss": -40.88059997558594, "global_step": 307916, "epoch": 2544} {"train_loss": -41.01822280883789, "global_step": 307917, "epoch": 2544} {"train_loss": -40.23303985595703, "global_step": 307918, "epoch": 2544} {"train_loss": -40.98711013793945, "global_step": 307919, "epoch": 2544} {"train_loss": -41.35464859008789, "global_step": 307920, "epoch": 2544} {"train_loss": -41.01887130737305, "global_step": 307921, "epoch": 2544} {"train_loss": -41.103004455566406, "global_step": 307922, "epoch": 2544} {"train_loss": -41.01469039916992, "global_step": 307923, "epoch": 2544} {"train_loss": -40.516517639160156, "global_step": 307924, "epoch": 2544} {"train_loss": -40.10517501831055, "global_step": 307925, "epoch": 2544} {"train_loss": -42.1011962890625, "global_step": 307926, "epoch": 2544} {"train_loss": -40.606536865234375, "global_step": 307927, "epoch": 2544} {"train_loss": -41.8380012512207, "global_step": 307928, "epoch": 2544} {"train_loss": -39.98799514770508, "global_step": 307929, "epoch": 2544} {"train_loss": -40.899749755859375, "global_step": 307930, "epoch": 2544} {"train_loss": -41.65607833862305, "global_step": 307931, "epoch": 2544} {"train_loss": -41.94719314575195, "global_step": 307932, "epoch": 2544} {"train_loss": -40.47742462158203, "global_step": 307933, "epoch": 2544} {"train_loss": -41.8445930480957, "global_step": 307934, "epoch": 2544} {"train_loss": -40.75922775268555, "global_step": 307935, "epoch": 2544} {"train_loss": -40.765560150146484, "global_step": 307936, "epoch": 2544} {"train_loss": -41.75075912475586, "global_step": 307937, "epoch": 2544} {"train_loss": -40.735530853271484, "global_step": 307938, "epoch": 2544} {"train_loss": -41.11526107788086, "global_step": 307939, "epoch": 2544} {"train_loss": -42.37555694580078, "global_step": 307940, "epoch": 2544} {"train_loss": -40.397666931152344, "global_step": 307941, "epoch": 2544} {"train_loss": -41.28009796142578, "global_step": 307942, "epoch": 2544} {"train_loss": -40.32537078857422, "global_step": 307943, "epoch": 2544} {"train_loss": -39.75744004683061, "global_step": 307944, "epoch": 2544, "val_loss": 2848262.75} {"train_loss": -42.2539176940918, "global_step": 307945, "epoch": 2545} {"train_loss": -41.71511459350586, "global_step": 307946, "epoch": 2545} {"train_loss": -41.59883499145508, "global_step": 307947, "epoch": 2545} {"train_loss": -41.61536407470703, "global_step": 307948, "epoch": 2545} {"train_loss": -42.066036224365234, "global_step": 307949, "epoch": 2545} {"train_loss": -41.574825286865234, "global_step": 307950, "epoch": 2545} {"train_loss": -42.0551643371582, "global_step": 307951, "epoch": 2545} {"train_loss": -42.32222366333008, "global_step": 307952, "epoch": 2545} {"train_loss": -42.13814926147461, "global_step": 307953, "epoch": 2545} {"train_loss": -42.102783203125, "global_step": 307954, "epoch": 2545} {"train_loss": -42.684574127197266, "global_step": 307955, "epoch": 2545} {"train_loss": -42.15836715698242, "global_step": 307956, "epoch": 2545} {"train_loss": -42.459354400634766, "global_step": 307957, "epoch": 2545} {"train_loss": -42.00341796875, "global_step": 307958, "epoch": 2545} {"train_loss": -41.95377731323242, "global_step": 307959, "epoch": 2545} {"train_loss": -38.837738037109375, "global_step": 307960, "epoch": 2545} {"train_loss": -41.0786018371582, "global_step": 307961, "epoch": 2545} {"train_loss": -42.122676849365234, "global_step": 307962, "epoch": 2545} {"train_loss": -43.0418815612793, "global_step": 307963, "epoch": 2545} {"train_loss": -42.0665283203125, "global_step": 307964, "epoch": 2545} {"train_loss": -41.579280853271484, "global_step": 307965, "epoch": 2545} {"train_loss": -41.744842529296875, "global_step": 307966, "epoch": 2545} {"train_loss": -42.04077911376953, "global_step": 307967, "epoch": 2545} {"train_loss": -42.422122955322266, "global_step": 307968, "epoch": 2545} {"train_loss": -41.52878952026367, "global_step": 307969, "epoch": 2545} {"train_loss": -41.388160705566406, "global_step": 307970, "epoch": 2545} {"train_loss": -42.35134506225586, "global_step": 307971, "epoch": 2545} {"train_loss": -42.821712493896484, "global_step": 307972, "epoch": 2545} {"train_loss": -42.66465377807617, "global_step": 307973, "epoch": 2545} {"train_loss": -41.830810546875, "global_step": 307974, "epoch": 2545} {"train_loss": -41.65081787109375, "global_step": 307975, "epoch": 2545} {"train_loss": -41.5671272277832, "global_step": 307976, "epoch": 2545} {"train_loss": -41.95586013793945, "global_step": 307977, "epoch": 2545} {"train_loss": -42.60084915161133, "global_step": 307978, "epoch": 2545} {"train_loss": -42.77482986450195, "global_step": 307979, "epoch": 2545} {"train_loss": -42.66962432861328, "global_step": 307980, "epoch": 2545} {"train_loss": -43.170440673828125, "global_step": 307981, "epoch": 2545} {"train_loss": -41.53884506225586, "global_step": 307982, "epoch": 2545} {"train_loss": -42.81840896606445, "global_step": 307983, "epoch": 2545} {"train_loss": -41.940982818603516, "global_step": 307984, "epoch": 2545} {"train_loss": -43.07215118408203, "global_step": 307985, "epoch": 2545} {"train_loss": -42.790283203125, "global_step": 307986, "epoch": 2545} {"train_loss": -41.437255859375, "global_step": 307987, "epoch": 2545} {"train_loss": -41.26286315917969, "global_step": 307988, "epoch": 2545} {"train_loss": -42.557212829589844, "global_step": 307989, "epoch": 2545} {"train_loss": -42.845367431640625, "global_step": 307990, "epoch": 2545} {"train_loss": -42.73365783691406, "global_step": 307991, "epoch": 2545} {"train_loss": -43.073482513427734, "global_step": 307992, "epoch": 2545} {"train_loss": -42.707984924316406, "global_step": 307993, "epoch": 2545} {"train_loss": -42.7861213684082, "global_step": 307994, "epoch": 2545} {"train_loss": -43.1102409362793, "global_step": 307995, "epoch": 2545} {"train_loss": -43.165557861328125, "global_step": 307996, "epoch": 2545} {"train_loss": -41.61547088623047, "global_step": 307997, "epoch": 2545} {"train_loss": -42.70878982543945, "global_step": 307998, "epoch": 2545} {"train_loss": -39.029537200927734, "global_step": 307999, "epoch": 2545} {"train_loss": -43.264766693115234, "global_step": 308000, "epoch": 2545} {"train_loss": -42.43993377685547, "global_step": 308001, "epoch": 2545} {"train_loss": -42.9052848815918, "global_step": 308002, "epoch": 2545} {"train_loss": -42.87356185913086, "global_step": 308003, "epoch": 2545} {"train_loss": -42.77589797973633, "global_step": 308004, "epoch": 2545} {"train_loss": -42.83132553100586, "global_step": 308005, "epoch": 2545} {"train_loss": -42.0593376159668, "global_step": 308006, "epoch": 2545} {"train_loss": -42.42417907714844, "global_step": 308007, "epoch": 2545} {"train_loss": -42.8879508972168, "global_step": 308008, "epoch": 2545} {"train_loss": -42.970211029052734, "global_step": 308009, "epoch": 2545} {"train_loss": -43.01952362060547, "global_step": 308010, "epoch": 2545} {"train_loss": -43.20345687866211, "global_step": 308011, "epoch": 2545} {"train_loss": -42.75674057006836, "global_step": 308012, "epoch": 2545} {"train_loss": -42.418006896972656, "global_step": 308013, "epoch": 2545} {"train_loss": -43.11652374267578, "global_step": 308014, "epoch": 2545} {"train_loss": -43.12290573120117, "global_step": 308015, "epoch": 2545} {"train_loss": -42.772499084472656, "global_step": 308016, "epoch": 2545} {"train_loss": -43.3211555480957, "global_step": 308017, "epoch": 2545} {"train_loss": -43.31327438354492, "global_step": 308018, "epoch": 2545} {"train_loss": -43.42398452758789, "global_step": 308019, "epoch": 2545} {"train_loss": -42.89239501953125, "global_step": 308020, "epoch": 2545} {"train_loss": -43.13501739501953, "global_step": 308021, "epoch": 2545} {"train_loss": -43.36850357055664, "global_step": 308022, "epoch": 2545} {"train_loss": -41.798431396484375, "global_step": 308023, "epoch": 2545} {"train_loss": -42.84714889526367, "global_step": 308024, "epoch": 2545} {"train_loss": -42.32683181762695, "global_step": 308025, "epoch": 2545} {"train_loss": -43.0875358581543, "global_step": 308026, "epoch": 2545} {"train_loss": -43.407257080078125, "global_step": 308027, "epoch": 2545} {"train_loss": -43.35994338989258, "global_step": 308028, "epoch": 2545} {"train_loss": -43.30118942260742, "global_step": 308029, "epoch": 2545} {"train_loss": -43.06154251098633, "global_step": 308030, "epoch": 2545} {"train_loss": -42.933326721191406, "global_step": 308031, "epoch": 2545} {"train_loss": -42.73223876953125, "global_step": 308032, "epoch": 2545} {"train_loss": -43.17329025268555, "global_step": 308033, "epoch": 2545} {"train_loss": -42.8286247253418, "global_step": 308034, "epoch": 2545} {"train_loss": -40.83884811401367, "global_step": 308035, "epoch": 2545} {"train_loss": -42.342769622802734, "global_step": 308036, "epoch": 2545} {"train_loss": -42.551513671875, "global_step": 308037, "epoch": 2545} {"train_loss": -42.488521575927734, "global_step": 308038, "epoch": 2545} {"train_loss": -42.796627044677734, "global_step": 308039, "epoch": 2545} {"train_loss": -41.828792572021484, "global_step": 308040, "epoch": 2545} {"train_loss": -42.22422790527344, "global_step": 308041, "epoch": 2545} {"train_loss": -42.00398635864258, "global_step": 308042, "epoch": 2545} {"train_loss": -43.050941467285156, "global_step": 308043, "epoch": 2545} {"train_loss": -42.451419830322266, "global_step": 308044, "epoch": 2545} {"train_loss": -42.721839904785156, "global_step": 308045, "epoch": 2545} {"train_loss": -40.703670501708984, "global_step": 308046, "epoch": 2545} {"train_loss": -39.0473747253418, "global_step": 308047, "epoch": 2545} {"train_loss": -40.926612854003906, "global_step": 308048, "epoch": 2545} {"train_loss": -42.864986419677734, "global_step": 308049, "epoch": 2545} {"train_loss": -40.36727523803711, "global_step": 308050, "epoch": 2545} {"train_loss": -40.367305755615234, "global_step": 308051, "epoch": 2545} {"train_loss": -41.87583541870117, "global_step": 308052, "epoch": 2545} {"train_loss": -42.543819427490234, "global_step": 308053, "epoch": 2545} {"train_loss": -39.62653350830078, "global_step": 308054, "epoch": 2545} {"train_loss": -42.05778121948242, "global_step": 308055, "epoch": 2545} {"train_loss": -42.530643463134766, "global_step": 308056, "epoch": 2545} {"train_loss": -37.819732666015625, "global_step": 308057, "epoch": 2545} {"train_loss": -39.2254524230957, "global_step": 308058, "epoch": 2545} {"train_loss": -41.63309860229492, "global_step": 308059, "epoch": 2545} {"train_loss": -42.78196334838867, "global_step": 308060, "epoch": 2545} {"train_loss": -41.01595687866211, "global_step": 308061, "epoch": 2545} {"train_loss": -39.79378890991211, "global_step": 308062, "epoch": 2545} {"train_loss": -41.33555221557617, "global_step": 308063, "epoch": 2545} {"train_loss": -42.26955795288086, "global_step": 308064, "epoch": 2545} {"train_loss": -42.180556147551734, "global_step": 308065, "epoch": 2545, "val_loss": 2699508.75} {"train_loss": -42.62434005737305, "global_step": 308066, "epoch": 2546} {"train_loss": -42.73106384277344, "global_step": 308067, "epoch": 2546} {"train_loss": -41.96476364135742, "global_step": 308068, "epoch": 2546} {"train_loss": -42.90373611450195, "global_step": 308069, "epoch": 2546} {"train_loss": -42.09791946411133, "global_step": 308070, "epoch": 2546} {"train_loss": -42.34897994995117, "global_step": 308071, "epoch": 2546} {"train_loss": -41.99329376220703, "global_step": 308072, "epoch": 2546} {"train_loss": -42.881378173828125, "global_step": 308073, "epoch": 2546} {"train_loss": -41.89522171020508, "global_step": 308074, "epoch": 2546} {"train_loss": -43.1871452331543, "global_step": 308075, "epoch": 2546} {"train_loss": -42.57261276245117, "global_step": 308076, "epoch": 2546} {"train_loss": -43.04816436767578, "global_step": 308077, "epoch": 2546} {"train_loss": -42.201107025146484, "global_step": 308078, "epoch": 2546} {"train_loss": -43.5614128112793, "global_step": 308079, "epoch": 2546} {"train_loss": -42.281314849853516, "global_step": 308080, "epoch": 2546} {"train_loss": -42.81047439575195, "global_step": 308081, "epoch": 2546} {"train_loss": -42.37538528442383, "global_step": 308082, "epoch": 2546} {"train_loss": -42.729827880859375, "global_step": 308083, "epoch": 2546} {"train_loss": -42.72758483886719, "global_step": 308084, "epoch": 2546} {"train_loss": -42.59599685668945, "global_step": 308085, "epoch": 2546} {"train_loss": -43.12171173095703, "global_step": 308086, "epoch": 2546} {"train_loss": -42.66436767578125, "global_step": 308087, "epoch": 2546} {"train_loss": -42.79903793334961, "global_step": 308088, "epoch": 2546} {"train_loss": -42.8319091796875, "global_step": 308089, "epoch": 2546} {"train_loss": -42.083778381347656, "global_step": 308090, "epoch": 2546} {"train_loss": -43.13684844970703, "global_step": 308091, "epoch": 2546} {"train_loss": -42.5877571105957, "global_step": 308092, "epoch": 2546} {"train_loss": -42.9959831237793, "global_step": 308093, "epoch": 2546} {"train_loss": -43.116363525390625, "global_step": 308094, "epoch": 2546} {"train_loss": -42.81324768066406, "global_step": 308095, "epoch": 2546} {"train_loss": -43.524330139160156, "global_step": 308096, "epoch": 2546} {"train_loss": -43.100399017333984, "global_step": 308097, "epoch": 2546} {"train_loss": -42.70709991455078, "global_step": 308098, "epoch": 2546} {"train_loss": -43.59760284423828, "global_step": 308099, "epoch": 2546} {"train_loss": -42.3737678527832, "global_step": 308100, "epoch": 2546} {"train_loss": -42.504207611083984, "global_step": 308101, "epoch": 2546} {"train_loss": -43.409915924072266, "global_step": 308102, "epoch": 2546} {"train_loss": -43.030757904052734, "global_step": 308103, "epoch": 2546} {"train_loss": -42.182456970214844, "global_step": 308104, "epoch": 2546} {"train_loss": -42.6030387878418, "global_step": 308105, "epoch": 2546} {"train_loss": -40.0151481628418, "global_step": 308106, "epoch": 2546} {"train_loss": -42.75798034667969, "global_step": 308107, "epoch": 2546} {"train_loss": -38.00678253173828, "global_step": 308108, "epoch": 2546} {"train_loss": -38.3867301940918, "global_step": 308109, "epoch": 2546} {"train_loss": -39.82415771484375, "global_step": 308110, "epoch": 2546} {"train_loss": -40.268001556396484, "global_step": 308111, "epoch": 2546} {"train_loss": -42.4370002746582, "global_step": 308112, "epoch": 2546} {"train_loss": -37.10722732543945, "global_step": 308113, "epoch": 2546} {"train_loss": -39.82063674926758, "global_step": 308114, "epoch": 2546} {"train_loss": -42.867774963378906, "global_step": 308115, "epoch": 2546} {"train_loss": -40.07587814331055, "global_step": 308116, "epoch": 2546} {"train_loss": -40.26020431518555, "global_step": 308117, "epoch": 2546} {"train_loss": -42.60389709472656, "global_step": 308118, "epoch": 2546} {"train_loss": -42.26240158081055, "global_step": 308119, "epoch": 2546} {"train_loss": -41.367469787597656, "global_step": 308120, "epoch": 2546} {"train_loss": -42.75057601928711, "global_step": 308121, "epoch": 2546} {"train_loss": -41.963130950927734, "global_step": 308122, "epoch": 2546} {"train_loss": -42.44416046142578, "global_step": 308123, "epoch": 2546} {"train_loss": -42.2436637878418, "global_step": 308124, "epoch": 2546} {"train_loss": -41.12860870361328, "global_step": 308125, "epoch": 2546} {"train_loss": -39.56660079956055, "global_step": 308126, "epoch": 2546} {"train_loss": -42.39398193359375, "global_step": 308127, "epoch": 2546} {"train_loss": -42.985992431640625, "global_step": 308128, "epoch": 2546} {"train_loss": -42.96103286743164, "global_step": 308129, "epoch": 2546} {"train_loss": -43.32130432128906, "global_step": 308130, "epoch": 2546} {"train_loss": -42.401092529296875, "global_step": 308131, "epoch": 2546} {"train_loss": -42.76168441772461, "global_step": 308132, "epoch": 2546} {"train_loss": -43.40052032470703, "global_step": 308133, "epoch": 2546} {"train_loss": -43.62028121948242, "global_step": 308134, "epoch": 2546} {"train_loss": -42.42284393310547, "global_step": 308135, "epoch": 2546} {"train_loss": -42.997615814208984, "global_step": 308136, "epoch": 2546} {"train_loss": -43.225406646728516, "global_step": 308137, "epoch": 2546} {"train_loss": -43.07215118408203, "global_step": 308138, "epoch": 2546} {"train_loss": -43.22080612182617, "global_step": 308139, "epoch": 2546} {"train_loss": -42.830101013183594, "global_step": 308140, "epoch": 2546} {"train_loss": -43.67341232299805, "global_step": 308141, "epoch": 2546} {"train_loss": -42.821746826171875, "global_step": 308142, "epoch": 2546} {"train_loss": -43.31801986694336, "global_step": 308143, "epoch": 2546} {"train_loss": -43.223690032958984, "global_step": 308144, "epoch": 2546} {"train_loss": -43.12418746948242, "global_step": 308145, "epoch": 2546} {"train_loss": -43.62477111816406, "global_step": 308146, "epoch": 2546} {"train_loss": -43.04789352416992, "global_step": 308147, "epoch": 2546} {"train_loss": -42.9937744140625, "global_step": 308148, "epoch": 2546} {"train_loss": -43.42612075805664, "global_step": 308149, "epoch": 2546} {"train_loss": -42.80400466918945, "global_step": 308150, "epoch": 2546} {"train_loss": -40.96408462524414, "global_step": 308151, "epoch": 2546} {"train_loss": -43.33294677734375, "global_step": 308152, "epoch": 2546} {"train_loss": -43.377925872802734, "global_step": 308153, "epoch": 2546} {"train_loss": -43.075836181640625, "global_step": 308154, "epoch": 2546} {"train_loss": -43.86712646484375, "global_step": 308155, "epoch": 2546} {"train_loss": -43.7327995300293, "global_step": 308156, "epoch": 2546} {"train_loss": -43.316959381103516, "global_step": 308157, "epoch": 2546} {"train_loss": -43.569454193115234, "global_step": 308158, "epoch": 2546} {"train_loss": -43.10348129272461, "global_step": 308159, "epoch": 2546} {"train_loss": -43.85514831542969, "global_step": 308160, "epoch": 2546} {"train_loss": -43.666175842285156, "global_step": 308161, "epoch": 2546} {"train_loss": -43.82561111450195, "global_step": 308162, "epoch": 2546} {"train_loss": -42.95676803588867, "global_step": 308163, "epoch": 2546} {"train_loss": -42.41177749633789, "global_step": 308164, "epoch": 2546} {"train_loss": -43.46834945678711, "global_step": 308165, "epoch": 2546} {"train_loss": -41.044593811035156, "global_step": 308166, "epoch": 2546} {"train_loss": -43.31455993652344, "global_step": 308167, "epoch": 2546} {"train_loss": -41.63032913208008, "global_step": 308168, "epoch": 2546} {"train_loss": -43.353431701660156, "global_step": 308169, "epoch": 2546} {"train_loss": -42.88531494140625, "global_step": 308170, "epoch": 2546} {"train_loss": -39.54524230957031, "global_step": 308171, "epoch": 2546} {"train_loss": -42.9888916015625, "global_step": 308172, "epoch": 2546} {"train_loss": -43.33402633666992, "global_step": 308173, "epoch": 2546} {"train_loss": -43.6595573425293, "global_step": 308174, "epoch": 2546} {"train_loss": -43.3213005065918, "global_step": 308175, "epoch": 2546} {"train_loss": -44.06976318359375, "global_step": 308176, "epoch": 2546} {"train_loss": -42.810401916503906, "global_step": 308177, "epoch": 2546} {"train_loss": -43.57816696166992, "global_step": 308178, "epoch": 2546} {"train_loss": -43.29240036010742, "global_step": 308179, "epoch": 2546} {"train_loss": -43.560909271240234, "global_step": 308180, "epoch": 2546} {"train_loss": -43.47077560424805, "global_step": 308181, "epoch": 2546} {"train_loss": -43.0001106262207, "global_step": 308182, "epoch": 2546} {"train_loss": -42.306678771972656, "global_step": 308183, "epoch": 2546} {"train_loss": -43.044612884521484, "global_step": 308184, "epoch": 2546} {"train_loss": -40.69061279296875, "global_step": 308185, "epoch": 2546} {"train_loss": -42.541827209724865, "global_step": 308186, "epoch": 2546, "val_loss": 2656890.0} {"train_loss": -42.93543243408203, "global_step": 308187, "epoch": 2547} {"train_loss": -43.8670768737793, "global_step": 308188, "epoch": 2547} {"train_loss": -42.94321823120117, "global_step": 308189, "epoch": 2547} {"train_loss": -43.24309539794922, "global_step": 308190, "epoch": 2547} {"train_loss": -42.26156997680664, "global_step": 308191, "epoch": 2547} {"train_loss": -41.834495544433594, "global_step": 308192, "epoch": 2547} {"train_loss": -43.01934814453125, "global_step": 308193, "epoch": 2547} {"train_loss": -42.93756103515625, "global_step": 308194, "epoch": 2547} {"train_loss": -40.68424606323242, "global_step": 308195, "epoch": 2547} {"train_loss": -42.139862060546875, "global_step": 308196, "epoch": 2547} {"train_loss": -42.84437942504883, "global_step": 308197, "epoch": 2547} {"train_loss": -40.7456169128418, "global_step": 308198, "epoch": 2547} {"train_loss": -42.1219596862793, "global_step": 308199, "epoch": 2547} {"train_loss": -42.95725631713867, "global_step": 308200, "epoch": 2547} {"train_loss": -38.995765686035156, "global_step": 308201, "epoch": 2547} {"train_loss": -42.78554916381836, "global_step": 308202, "epoch": 2547} {"train_loss": -40.81451416015625, "global_step": 308203, "epoch": 2547} {"train_loss": -42.25910568237305, "global_step": 308204, "epoch": 2547} {"train_loss": -41.47868728637695, "global_step": 308205, "epoch": 2547} {"train_loss": -42.66196823120117, "global_step": 308206, "epoch": 2547} {"train_loss": -39.23664474487305, "global_step": 308207, "epoch": 2547} {"train_loss": -42.946441650390625, "global_step": 308208, "epoch": 2547} {"train_loss": -42.317848205566406, "global_step": 308209, "epoch": 2547} {"train_loss": -40.610260009765625, "global_step": 308210, "epoch": 2547} {"train_loss": -41.75762939453125, "global_step": 308211, "epoch": 2547} {"train_loss": -39.7805290222168, "global_step": 308212, "epoch": 2547} {"train_loss": -42.01179122924805, "global_step": 308213, "epoch": 2547} {"train_loss": -40.95951461791992, "global_step": 308214, "epoch": 2547} {"train_loss": -41.097469329833984, "global_step": 308215, "epoch": 2547} {"train_loss": -40.9356803894043, "global_step": 308216, "epoch": 2547} {"train_loss": -41.63257598876953, "global_step": 308217, "epoch": 2547} {"train_loss": -41.9028434753418, "global_step": 308218, "epoch": 2547} {"train_loss": -41.481021881103516, "global_step": 308219, "epoch": 2547} {"train_loss": -42.25059127807617, "global_step": 308220, "epoch": 2547} {"train_loss": -42.729408264160156, "global_step": 308221, "epoch": 2547} {"train_loss": -41.56589889526367, "global_step": 308222, "epoch": 2547} {"train_loss": -42.17919921875, "global_step": 308223, "epoch": 2547} {"train_loss": -41.730560302734375, "global_step": 308224, "epoch": 2547} {"train_loss": -42.389610290527344, "global_step": 308225, "epoch": 2547} {"train_loss": -42.90001678466797, "global_step": 308226, "epoch": 2547} {"train_loss": -40.36224365234375, "global_step": 308227, "epoch": 2547} {"train_loss": -42.33317184448242, "global_step": 308228, "epoch": 2547} {"train_loss": -42.414939880371094, "global_step": 308229, "epoch": 2547} {"train_loss": -42.234004974365234, "global_step": 308230, "epoch": 2547} {"train_loss": -41.7736701965332, "global_step": 308231, "epoch": 2547} {"train_loss": -43.246028900146484, "global_step": 308232, "epoch": 2547} {"train_loss": -42.225826263427734, "global_step": 308233, "epoch": 2547} {"train_loss": -43.381649017333984, "global_step": 308234, "epoch": 2547} {"train_loss": -40.17768478393555, "global_step": 308235, "epoch": 2547} {"train_loss": -41.293975830078125, "global_step": 308236, "epoch": 2547} {"train_loss": -43.2138786315918, "global_step": 308237, "epoch": 2547} {"train_loss": -42.505489349365234, "global_step": 308238, "epoch": 2547} {"train_loss": -43.30038833618164, "global_step": 308239, "epoch": 2547} {"train_loss": -43.223854064941406, "global_step": 308240, "epoch": 2547} {"train_loss": -41.74491500854492, "global_step": 308241, "epoch": 2547} {"train_loss": -43.15944290161133, "global_step": 308242, "epoch": 2547} {"train_loss": -38.816436767578125, "global_step": 308243, "epoch": 2547} {"train_loss": -42.35187530517578, "global_step": 308244, "epoch": 2547} {"train_loss": -42.62900924682617, "global_step": 308245, "epoch": 2547} {"train_loss": -41.208248138427734, "global_step": 308246, "epoch": 2547} {"train_loss": -40.735694885253906, "global_step": 308247, "epoch": 2547} {"train_loss": -41.552425384521484, "global_step": 308248, "epoch": 2547} {"train_loss": -40.25696563720703, "global_step": 308249, "epoch": 2547} {"train_loss": -42.60231018066406, "global_step": 308250, "epoch": 2547} {"train_loss": -42.78109359741211, "global_step": 308251, "epoch": 2547} {"train_loss": -42.210662841796875, "global_step": 308252, "epoch": 2547} {"train_loss": -42.05561447143555, "global_step": 308253, "epoch": 2547} {"train_loss": -41.736331939697266, "global_step": 308254, "epoch": 2547} {"train_loss": -42.362709045410156, "global_step": 308255, "epoch": 2547} {"train_loss": -34.352638244628906, "global_step": 308256, "epoch": 2547} {"train_loss": -39.58625411987305, "global_step": 308257, "epoch": 2547} {"train_loss": -40.46643829345703, "global_step": 308258, "epoch": 2547} {"train_loss": -39.889766693115234, "global_step": 308259, "epoch": 2547} {"train_loss": -10.862051963806152, "global_step": 308260, "epoch": 2547} {"train_loss": -40.454986572265625, "global_step": 308261, "epoch": 2547} {"train_loss": -37.23008728027344, "global_step": 308262, "epoch": 2547} {"train_loss": -29.66470718383789, "global_step": 308263, "epoch": 2547} {"train_loss": -26.02444839477539, "global_step": 308264, "epoch": 2547} {"train_loss": -32.8620719909668, "global_step": 308265, "epoch": 2547} {"train_loss": -37.84761047363281, "global_step": 308266, "epoch": 2547} {"train_loss": -31.373640060424805, "global_step": 308267, "epoch": 2547} {"train_loss": -20.171823501586914, "global_step": 308268, "epoch": 2547} {"train_loss": -34.13762664794922, "global_step": 308269, "epoch": 2547} {"train_loss": -38.345375061035156, "global_step": 308270, "epoch": 2547} {"train_loss": -36.68505859375, "global_step": 308271, "epoch": 2547} {"train_loss": -21.940807342529297, "global_step": 308272, "epoch": 2547} {"train_loss": -33.483943939208984, "global_step": 308273, "epoch": 2547} {"train_loss": -30.452417373657227, "global_step": 308274, "epoch": 2547} {"train_loss": -37.52193069458008, "global_step": 308275, "epoch": 2547} {"train_loss": -33.41523361206055, "global_step": 308276, "epoch": 2547} {"train_loss": -33.88957977294922, "global_step": 308277, "epoch": 2547} {"train_loss": -34.702239990234375, "global_step": 308278, "epoch": 2547} {"train_loss": -36.412349700927734, "global_step": 308279, "epoch": 2547} {"train_loss": -37.8618278503418, "global_step": 308280, "epoch": 2547} {"train_loss": -36.833675384521484, "global_step": 308281, "epoch": 2547} {"train_loss": -38.24432373046875, "global_step": 308282, "epoch": 2547} {"train_loss": -37.48012161254883, "global_step": 308283, "epoch": 2547} {"train_loss": -35.81354904174805, "global_step": 308284, "epoch": 2547} {"train_loss": -35.792396545410156, "global_step": 308285, "epoch": 2547} {"train_loss": -38.511932373046875, "global_step": 308286, "epoch": 2547} {"train_loss": -31.060989379882812, "global_step": 308287, "epoch": 2547} {"train_loss": -35.37133026123047, "global_step": 308288, "epoch": 2547} {"train_loss": -36.32072448730469, "global_step": 308289, "epoch": 2547} {"train_loss": -38.30718994140625, "global_step": 308290, "epoch": 2547} {"train_loss": -38.70199203491211, "global_step": 308291, "epoch": 2547} {"train_loss": -37.5321159362793, "global_step": 308292, "epoch": 2547} {"train_loss": -38.98811340332031, "global_step": 308293, "epoch": 2547} {"train_loss": -37.66157150268555, "global_step": 308294, "epoch": 2547} {"train_loss": -38.48369216918945, "global_step": 308295, "epoch": 2547} {"train_loss": -39.149715423583984, "global_step": 308296, "epoch": 2547} {"train_loss": -38.895263671875, "global_step": 308297, "epoch": 2547} {"train_loss": -39.59943389892578, "global_step": 308298, "epoch": 2547} {"train_loss": -38.27537155151367, "global_step": 308299, "epoch": 2547} {"train_loss": -38.30886459350586, "global_step": 308300, "epoch": 2547} {"train_loss": -39.344093322753906, "global_step": 308301, "epoch": 2547} {"train_loss": -39.782283782958984, "global_step": 308302, "epoch": 2547} {"train_loss": -39.44819259643555, "global_step": 308303, "epoch": 2547} {"train_loss": -38.33455276489258, "global_step": 308304, "epoch": 2547} {"train_loss": -39.90061569213867, "global_step": 308305, "epoch": 2547} {"train_loss": -39.72168731689453, "global_step": 308306, "epoch": 2547} {"train_loss": -39.24716830450641, "global_step": 308307, "epoch": 2547, "val_loss": 2816462.75} {"train_loss": -39.98025131225586, "global_step": 308308, "epoch": 2548} {"train_loss": -39.825469970703125, "global_step": 308309, "epoch": 2548} {"train_loss": -39.370201110839844, "global_step": 308310, "epoch": 2548} {"train_loss": -39.97522735595703, "global_step": 308311, "epoch": 2548} {"train_loss": -39.38640594482422, "global_step": 308312, "epoch": 2548} {"train_loss": -39.2694206237793, "global_step": 308313, "epoch": 2548} {"train_loss": -39.83818817138672, "global_step": 308314, "epoch": 2548} {"train_loss": -40.44504928588867, "global_step": 308315, "epoch": 2548} {"train_loss": -40.55192184448242, "global_step": 308316, "epoch": 2548} {"train_loss": -40.17196273803711, "global_step": 308317, "epoch": 2548} {"train_loss": -40.287654876708984, "global_step": 308318, "epoch": 2548} {"train_loss": -40.519630432128906, "global_step": 308319, "epoch": 2548} {"train_loss": -40.298805236816406, "global_step": 308320, "epoch": 2548} {"train_loss": -40.292354583740234, "global_step": 308321, "epoch": 2548} {"train_loss": -40.51656723022461, "global_step": 308322, "epoch": 2548} {"train_loss": -40.631927490234375, "global_step": 308323, "epoch": 2548} {"train_loss": -40.50226593017578, "global_step": 308324, "epoch": 2548} {"train_loss": -40.869808197021484, "global_step": 308325, "epoch": 2548} {"train_loss": -40.590675354003906, "global_step": 308326, "epoch": 2548} {"train_loss": -40.667049407958984, "global_step": 308327, "epoch": 2548} {"train_loss": -40.63847351074219, "global_step": 308328, "epoch": 2548} {"train_loss": -40.726661682128906, "global_step": 308329, "epoch": 2548} {"train_loss": -40.99103927612305, "global_step": 308330, "epoch": 2548} {"train_loss": -40.693443298339844, "global_step": 308331, "epoch": 2548} {"train_loss": -40.86930465698242, "global_step": 308332, "epoch": 2548} {"train_loss": -40.937660217285156, "global_step": 308333, "epoch": 2548} {"train_loss": -40.9881591796875, "global_step": 308334, "epoch": 2548} {"train_loss": -41.120155334472656, "global_step": 308335, "epoch": 2548} {"train_loss": -41.08207321166992, "global_step": 308336, "epoch": 2548} {"train_loss": -41.039825439453125, "global_step": 308337, "epoch": 2548} {"train_loss": -41.17718505859375, "global_step": 308338, "epoch": 2548} {"train_loss": -41.68129348754883, "global_step": 308339, "epoch": 2548} {"train_loss": -41.19517135620117, "global_step": 308340, "epoch": 2548} {"train_loss": -41.396461486816406, "global_step": 308341, "epoch": 2548} {"train_loss": -41.42001724243164, "global_step": 308342, "epoch": 2548} {"train_loss": -41.25852966308594, "global_step": 308343, "epoch": 2548} {"train_loss": -41.67958068847656, "global_step": 308344, "epoch": 2548} {"train_loss": -41.643062591552734, "global_step": 308345, "epoch": 2548} {"train_loss": -41.47211456298828, "global_step": 308346, "epoch": 2548} {"train_loss": -41.36233139038086, "global_step": 308347, "epoch": 2548} {"train_loss": -41.75184631347656, "global_step": 308348, "epoch": 2548} {"train_loss": -42.094478607177734, "global_step": 308349, "epoch": 2548} {"train_loss": -41.74752426147461, "global_step": 308350, "epoch": 2548} {"train_loss": -41.757545471191406, "global_step": 308351, "epoch": 2548} {"train_loss": -41.84242248535156, "global_step": 308352, "epoch": 2548} {"train_loss": -41.73414993286133, "global_step": 308353, "epoch": 2548} {"train_loss": -42.12067413330078, "global_step": 308354, "epoch": 2548} {"train_loss": -40.48311233520508, "global_step": 308355, "epoch": 2548} {"train_loss": -42.092994689941406, "global_step": 308356, "epoch": 2548} {"train_loss": -41.91701126098633, "global_step": 308357, "epoch": 2548} {"train_loss": -42.24497604370117, "global_step": 308358, "epoch": 2548} {"train_loss": -41.779109954833984, "global_step": 308359, "epoch": 2548} {"train_loss": -42.088409423828125, "global_step": 308360, "epoch": 2548} {"train_loss": -41.48343276977539, "global_step": 308361, "epoch": 2548} {"train_loss": -42.16059875488281, "global_step": 308362, "epoch": 2548} {"train_loss": -42.28731155395508, "global_step": 308363, "epoch": 2548} {"train_loss": -41.796504974365234, "global_step": 308364, "epoch": 2548} {"train_loss": -42.12814712524414, "global_step": 308365, "epoch": 2548} {"train_loss": -42.23642349243164, "global_step": 308366, "epoch": 2548} {"train_loss": -42.442012786865234, "global_step": 308367, "epoch": 2548} {"train_loss": -42.149959564208984, "global_step": 308368, "epoch": 2548} {"train_loss": -42.456485748291016, "global_step": 308369, "epoch": 2548} {"train_loss": -42.106658935546875, "global_step": 308370, "epoch": 2548} {"train_loss": -42.604122161865234, "global_step": 308371, "epoch": 2548} {"train_loss": -42.298892974853516, "global_step": 308372, "epoch": 2548} {"train_loss": -42.547279357910156, "global_step": 308373, "epoch": 2548} {"train_loss": -42.495601654052734, "global_step": 308374, "epoch": 2548} {"train_loss": -42.27749252319336, "global_step": 308375, "epoch": 2548} {"train_loss": -42.553993225097656, "global_step": 308376, "epoch": 2548} {"train_loss": -42.657772064208984, "global_step": 308377, "epoch": 2548} {"train_loss": -42.77196502685547, "global_step": 308378, "epoch": 2548} {"train_loss": -42.24297332763672, "global_step": 308379, "epoch": 2548} {"train_loss": -42.967628479003906, "global_step": 308380, "epoch": 2548} {"train_loss": -42.94425582885742, "global_step": 308381, "epoch": 2548} {"train_loss": -42.211761474609375, "global_step": 308382, "epoch": 2548} {"train_loss": -42.499027252197266, "global_step": 308383, "epoch": 2548} {"train_loss": -42.301448822021484, "global_step": 308384, "epoch": 2548} {"train_loss": -42.7046012878418, "global_step": 308385, "epoch": 2548} {"train_loss": -43.2532958984375, "global_step": 308386, "epoch": 2548} {"train_loss": -42.77632522583008, "global_step": 308387, "epoch": 2548} {"train_loss": -41.811763763427734, "global_step": 308388, "epoch": 2548} {"train_loss": -43.021095275878906, "global_step": 308389, "epoch": 2548} {"train_loss": -42.84690475463867, "global_step": 308390, "epoch": 2548} {"train_loss": -43.14994430541992, "global_step": 308391, "epoch": 2548} {"train_loss": -43.10040283203125, "global_step": 308392, "epoch": 2548} {"train_loss": -42.797767639160156, "global_step": 308393, "epoch": 2548} {"train_loss": -42.393917083740234, "global_step": 308394, "epoch": 2548} {"train_loss": -43.1089973449707, "global_step": 308395, "epoch": 2548} {"train_loss": -43.1336555480957, "global_step": 308396, "epoch": 2548} {"train_loss": -43.286170959472656, "global_step": 308397, "epoch": 2548} {"train_loss": -42.9504508972168, "global_step": 308398, "epoch": 2548} {"train_loss": -42.95552444458008, "global_step": 308399, "epoch": 2548} {"train_loss": -43.103458404541016, "global_step": 308400, "epoch": 2548} {"train_loss": -43.10647201538086, "global_step": 308401, "epoch": 2548} {"train_loss": -43.13369369506836, "global_step": 308402, "epoch": 2548} {"train_loss": -43.2779655456543, "global_step": 308403, "epoch": 2548} {"train_loss": -43.13606643676758, "global_step": 308404, "epoch": 2548} {"train_loss": -43.1993522644043, "global_step": 308405, "epoch": 2548} {"train_loss": -42.73147201538086, "global_step": 308406, "epoch": 2548} {"train_loss": -42.84688186645508, "global_step": 308407, "epoch": 2548} {"train_loss": -43.33980941772461, "global_step": 308408, "epoch": 2548} {"train_loss": -43.265254974365234, "global_step": 308409, "epoch": 2548} {"train_loss": -43.44443130493164, "global_step": 308410, "epoch": 2548} {"train_loss": -43.04048538208008, "global_step": 308411, "epoch": 2548} {"train_loss": -43.358489990234375, "global_step": 308412, "epoch": 2548} {"train_loss": -42.84033203125, "global_step": 308413, "epoch": 2548} {"train_loss": -43.0936393737793, "global_step": 308414, "epoch": 2548} {"train_loss": -29.880268096923828, "global_step": 308415, "epoch": 2548} {"train_loss": -41.471031188964844, "global_step": 308416, "epoch": 2548} {"train_loss": -39.182838439941406, "global_step": 308417, "epoch": 2548} {"train_loss": -41.50917434692383, "global_step": 308418, "epoch": 2548} {"train_loss": -42.26851272583008, "global_step": 308419, "epoch": 2548} {"train_loss": -34.52366638183594, "global_step": 308420, "epoch": 2548} {"train_loss": -41.86310577392578, "global_step": 308421, "epoch": 2548} {"train_loss": -33.93867111206055, "global_step": 308422, "epoch": 2548} {"train_loss": -32.608943939208984, "global_step": 308423, "epoch": 2548} {"train_loss": -40.99613571166992, "global_step": 308424, "epoch": 2548} {"train_loss": -33.69878005981445, "global_step": 308425, "epoch": 2548} {"train_loss": -33.7563362121582, "global_step": 308426, "epoch": 2548} {"train_loss": -41.94200897216797, "global_step": 308427, "epoch": 2548} {"train_loss": -41.34260332091781, "global_step": 308428, "epoch": 2548, "val_loss": 2703959.75} {"train_loss": -40.44526290893555, "global_step": 308429, "epoch": 2549} {"train_loss": -37.02314376831055, "global_step": 308430, "epoch": 2549} {"train_loss": -40.86781692504883, "global_step": 308431, "epoch": 2549} {"train_loss": -16.640111923217773, "global_step": 308432, "epoch": 2549} {"train_loss": -40.550086975097656, "global_step": 308433, "epoch": 2549} {"train_loss": -40.10432052612305, "global_step": 308434, "epoch": 2549} {"train_loss": -37.40782928466797, "global_step": 308435, "epoch": 2549} {"train_loss": -36.6665153503418, "global_step": 308436, "epoch": 2549} {"train_loss": -37.10298538208008, "global_step": 308437, "epoch": 2549} {"train_loss": -35.38520431518555, "global_step": 308438, "epoch": 2549} {"train_loss": -27.556005477905273, "global_step": 308439, "epoch": 2549} {"train_loss": -33.26821517944336, "global_step": 308440, "epoch": 2549} {"train_loss": -36.75086212158203, "global_step": 308441, "epoch": 2549} {"train_loss": -39.90533447265625, "global_step": 308442, "epoch": 2549} {"train_loss": -39.44950866699219, "global_step": 308443, "epoch": 2549} {"train_loss": -38.59306716918945, "global_step": 308444, "epoch": 2549} {"train_loss": -32.68302536010742, "global_step": 308445, "epoch": 2549} {"train_loss": -27.327030181884766, "global_step": 308446, "epoch": 2549} {"train_loss": -34.75385284423828, "global_step": 308447, "epoch": 2549} {"train_loss": -35.86159133911133, "global_step": 308448, "epoch": 2549} {"train_loss": -36.86275100708008, "global_step": 308449, "epoch": 2549} {"train_loss": -38.7088508605957, "global_step": 308450, "epoch": 2549} {"train_loss": -39.56387710571289, "global_step": 308451, "epoch": 2549} {"train_loss": -40.036930084228516, "global_step": 308452, "epoch": 2549} {"train_loss": -37.41242218017578, "global_step": 308453, "epoch": 2549} {"train_loss": -39.69050979614258, "global_step": 308454, "epoch": 2549} {"train_loss": -39.72297286987305, "global_step": 308455, "epoch": 2549} {"train_loss": -35.99123001098633, "global_step": 308456, "epoch": 2549} {"train_loss": -38.34661865234375, "global_step": 308457, "epoch": 2549} {"train_loss": -39.137569427490234, "global_step": 308458, "epoch": 2549} {"train_loss": -39.44929504394531, "global_step": 308459, "epoch": 2549} {"train_loss": -40.48711395263672, "global_step": 308460, "epoch": 2549} {"train_loss": -38.7225456237793, "global_step": 308461, "epoch": 2549} {"train_loss": -40.030914306640625, "global_step": 308462, "epoch": 2549} {"train_loss": -38.509307861328125, "global_step": 308463, "epoch": 2549} {"train_loss": -38.6413459777832, "global_step": 308464, "epoch": 2549} {"train_loss": -40.056663513183594, "global_step": 308465, "epoch": 2549} {"train_loss": -39.63899612426758, "global_step": 308466, "epoch": 2549} {"train_loss": -38.44226837158203, "global_step": 308467, "epoch": 2549} {"train_loss": -37.18319320678711, "global_step": 308468, "epoch": 2549} {"train_loss": -39.85948181152344, "global_step": 308469, "epoch": 2549} {"train_loss": -40.84194564819336, "global_step": 308470, "epoch": 2549} {"train_loss": -40.579811096191406, "global_step": 308471, "epoch": 2549} {"train_loss": -40.99453353881836, "global_step": 308472, "epoch": 2549} {"train_loss": -40.74154281616211, "global_step": 308473, "epoch": 2549} {"train_loss": -40.5917854309082, "global_step": 308474, "epoch": 2549} {"train_loss": -39.77162170410156, "global_step": 308475, "epoch": 2549} {"train_loss": -40.61082458496094, "global_step": 308476, "epoch": 2549} {"train_loss": -40.695369720458984, "global_step": 308477, "epoch": 2549} {"train_loss": -41.0510368347168, "global_step": 308478, "epoch": 2549} {"train_loss": -41.22050094604492, "global_step": 308479, "epoch": 2549} {"train_loss": -41.44290542602539, "global_step": 308480, "epoch": 2549} {"train_loss": -40.52952194213867, "global_step": 308481, "epoch": 2549} {"train_loss": -40.47898483276367, "global_step": 308482, "epoch": 2549} {"train_loss": -40.669227600097656, "global_step": 308483, "epoch": 2549} {"train_loss": -41.2837028503418, "global_step": 308484, "epoch": 2549} {"train_loss": -40.594940185546875, "global_step": 308485, "epoch": 2549} {"train_loss": -41.527923583984375, "global_step": 308486, "epoch": 2549} {"train_loss": -36.51258087158203, "global_step": 308487, "epoch": 2549} {"train_loss": -41.574153900146484, "global_step": 308488, "epoch": 2549} {"train_loss": -41.4070930480957, "global_step": 308489, "epoch": 2549} {"train_loss": -41.697349548339844, "global_step": 308490, "epoch": 2549} {"train_loss": -42.03129577636719, "global_step": 308491, "epoch": 2549} {"train_loss": -41.13544464111328, "global_step": 308492, "epoch": 2549} {"train_loss": -40.04117965698242, "global_step": 308493, "epoch": 2549} {"train_loss": -41.81128692626953, "global_step": 308494, "epoch": 2549} {"train_loss": -41.05918502807617, "global_step": 308495, "epoch": 2549} {"train_loss": -41.68904495239258, "global_step": 308496, "epoch": 2549} {"train_loss": -41.4930534362793, "global_step": 308497, "epoch": 2549} {"train_loss": -41.2165641784668, "global_step": 308498, "epoch": 2549} {"train_loss": -41.994361877441406, "global_step": 308499, "epoch": 2549} {"train_loss": -41.5067138671875, "global_step": 308500, "epoch": 2549} {"train_loss": -41.631202697753906, "global_step": 308501, "epoch": 2549} {"train_loss": -41.88288497924805, "global_step": 308502, "epoch": 2549} {"train_loss": -41.805267333984375, "global_step": 308503, "epoch": 2549} {"train_loss": -41.83686065673828, "global_step": 308504, "epoch": 2549} {"train_loss": -42.1131591796875, "global_step": 308505, "epoch": 2549} {"train_loss": -42.30465316772461, "global_step": 308506, "epoch": 2549} {"train_loss": -41.135982513427734, "global_step": 308507, "epoch": 2549} {"train_loss": -42.36166000366211, "global_step": 308508, "epoch": 2549} {"train_loss": -42.283180236816406, "global_step": 308509, "epoch": 2549} {"train_loss": -41.29198455810547, "global_step": 308510, "epoch": 2549} {"train_loss": -41.98114776611328, "global_step": 308511, "epoch": 2549} {"train_loss": -42.08292770385742, "global_step": 308512, "epoch": 2549} {"train_loss": -42.29570388793945, "global_step": 308513, "epoch": 2549} {"train_loss": -42.600765228271484, "global_step": 308514, "epoch": 2549} {"train_loss": -42.35309600830078, "global_step": 308515, "epoch": 2549} {"train_loss": -42.14069366455078, "global_step": 308516, "epoch": 2549} {"train_loss": -42.57389450073242, "global_step": 308517, "epoch": 2549} {"train_loss": -42.524200439453125, "global_step": 308518, "epoch": 2549} {"train_loss": -42.2619743347168, "global_step": 308519, "epoch": 2549} {"train_loss": -42.070472717285156, "global_step": 308520, "epoch": 2549} {"train_loss": -42.699554443359375, "global_step": 308521, "epoch": 2549} {"train_loss": -42.244163513183594, "global_step": 308522, "epoch": 2549} {"train_loss": -41.5168571472168, "global_step": 308523, "epoch": 2549} {"train_loss": -42.0865592956543, "global_step": 308524, "epoch": 2549} {"train_loss": -42.621726989746094, "global_step": 308525, "epoch": 2549} {"train_loss": -41.52002716064453, "global_step": 308526, "epoch": 2549} {"train_loss": -42.6389045715332, "global_step": 308527, "epoch": 2549} {"train_loss": -42.10768508911133, "global_step": 308528, "epoch": 2549} {"train_loss": -42.834712982177734, "global_step": 308529, "epoch": 2549} {"train_loss": -42.25412368774414, "global_step": 308530, "epoch": 2549} {"train_loss": -42.92645263671875, "global_step": 308531, "epoch": 2549} {"train_loss": -42.81923294067383, "global_step": 308532, "epoch": 2549} {"train_loss": -42.21966552734375, "global_step": 308533, "epoch": 2549} {"train_loss": -41.91655349731445, "global_step": 308534, "epoch": 2549} {"train_loss": -42.16352844238281, "global_step": 308535, "epoch": 2549} {"train_loss": -42.545963287353516, "global_step": 308536, "epoch": 2549} {"train_loss": -41.800453186035156, "global_step": 308537, "epoch": 2549} {"train_loss": -42.08084487915039, "global_step": 308538, "epoch": 2549} {"train_loss": -42.71900177001953, "global_step": 308539, "epoch": 2549} {"train_loss": -42.34865951538086, "global_step": 308540, "epoch": 2549} {"train_loss": -42.490333557128906, "global_step": 308541, "epoch": 2549} {"train_loss": -43.0111083984375, "global_step": 308542, "epoch": 2549} {"train_loss": -42.4067497253418, "global_step": 308543, "epoch": 2549} {"train_loss": -42.62447738647461, "global_step": 308544, "epoch": 2549} {"train_loss": -42.30886459350586, "global_step": 308545, "epoch": 2549} {"train_loss": -42.805423736572266, "global_step": 308546, "epoch": 2549} {"train_loss": -43.033714294433594, "global_step": 308547, "epoch": 2549} {"train_loss": -40.718727111816406, "global_step": 308548, "epoch": 2549} {"train_loss": -40.19644124054712, "global_step": 308549, "epoch": 2549, "val_loss": 2870732.25} {"train_loss": -42.66267013549805, "global_step": 308550, "epoch": 2550} {"train_loss": -42.78860092163086, "global_step": 308551, "epoch": 2550} {"train_loss": -42.87415313720703, "global_step": 308552, "epoch": 2550} {"train_loss": -41.7260856628418, "global_step": 308553, "epoch": 2550} {"train_loss": -43.49457550048828, "global_step": 308554, "epoch": 2550} {"train_loss": -42.28019332885742, "global_step": 308555, "epoch": 2550} {"train_loss": -43.45780563354492, "global_step": 308556, "epoch": 2550} {"train_loss": -43.05098342895508, "global_step": 308557, "epoch": 2550} {"train_loss": -42.7484245300293, "global_step": 308558, "epoch": 2550} {"train_loss": -43.1722526550293, "global_step": 308559, "epoch": 2550} {"train_loss": -43.31350326538086, "global_step": 308560, "epoch": 2550} {"train_loss": -42.75703048706055, "global_step": 308561, "epoch": 2550} {"train_loss": -43.048301696777344, "global_step": 308562, "epoch": 2550} {"train_loss": -43.11881637573242, "global_step": 308563, "epoch": 2550} {"train_loss": -43.04519271850586, "global_step": 308564, "epoch": 2550} {"train_loss": -43.609310150146484, "global_step": 308565, "epoch": 2550} {"train_loss": -42.89453125, "global_step": 308566, "epoch": 2550} {"train_loss": -42.72111892700195, "global_step": 308567, "epoch": 2550} {"train_loss": -42.66267013549805, "global_step": 308568, "epoch": 2550} {"train_loss": -41.23835372924805, "global_step": 308569, "epoch": 2550} {"train_loss": -42.09568405151367, "global_step": 308570, "epoch": 2550} {"train_loss": -41.47897720336914, "global_step": 308571, "epoch": 2550} {"train_loss": -41.2908935546875, "global_step": 308572, "epoch": 2550} {"train_loss": -41.558082580566406, "global_step": 308573, "epoch": 2550} {"train_loss": -42.75813674926758, "global_step": 308574, "epoch": 2550} {"train_loss": -41.07548141479492, "global_step": 308575, "epoch": 2550} {"train_loss": -39.19023513793945, "global_step": 308576, "epoch": 2550} {"train_loss": -38.42242431640625, "global_step": 308577, "epoch": 2550} {"train_loss": -41.88644790649414, "global_step": 308578, "epoch": 2550} {"train_loss": -42.78070068359375, "global_step": 308579, "epoch": 2550} {"train_loss": -41.208866119384766, "global_step": 308580, "epoch": 2550} {"train_loss": -40.97614669799805, "global_step": 308581, "epoch": 2550} {"train_loss": -43.02189636230469, "global_step": 308582, "epoch": 2550} {"train_loss": -41.38643264770508, "global_step": 308583, "epoch": 2550} {"train_loss": -42.01755142211914, "global_step": 308584, "epoch": 2550} {"train_loss": -40.84575271606445, "global_step": 308585, "epoch": 2550} {"train_loss": -42.32786178588867, "global_step": 308586, "epoch": 2550} {"train_loss": -42.87187576293945, "global_step": 308587, "epoch": 2550} {"train_loss": -41.92656326293945, "global_step": 308588, "epoch": 2550} {"train_loss": -42.1235237121582, "global_step": 308589, "epoch": 2550} {"train_loss": -42.97296142578125, "global_step": 308590, "epoch": 2550} {"train_loss": -42.104225158691406, "global_step": 308591, "epoch": 2550} {"train_loss": -42.584320068359375, "global_step": 308592, "epoch": 2550} {"train_loss": -42.54061508178711, "global_step": 308593, "epoch": 2550} {"train_loss": -41.903099060058594, "global_step": 308594, "epoch": 2550} {"train_loss": -43.005043029785156, "global_step": 308595, "epoch": 2550} {"train_loss": -41.5791130065918, "global_step": 308596, "epoch": 2550} {"train_loss": -43.0897331237793, "global_step": 308597, "epoch": 2550} {"train_loss": -42.4355583190918, "global_step": 308598, "epoch": 2550} {"train_loss": -41.62510299682617, "global_step": 308599, "epoch": 2550} {"train_loss": -43.35634231567383, "global_step": 308600, "epoch": 2550} {"train_loss": -42.75492477416992, "global_step": 308601, "epoch": 2550} {"train_loss": -42.7767219543457, "global_step": 308602, "epoch": 2550} {"train_loss": -42.448402404785156, "global_step": 308603, "epoch": 2550} {"train_loss": -43.06081771850586, "global_step": 308604, "epoch": 2550} {"train_loss": -43.10555648803711, "global_step": 308605, "epoch": 2550} {"train_loss": -42.26253128051758, "global_step": 308606, "epoch": 2550} {"train_loss": -43.01263427734375, "global_step": 308607, "epoch": 2550} {"train_loss": -43.22942352294922, "global_step": 308608, "epoch": 2550} {"train_loss": -42.65449142456055, "global_step": 308609, "epoch": 2550} {"train_loss": -42.722572326660156, "global_step": 308610, "epoch": 2550} {"train_loss": -43.0994987487793, "global_step": 308611, "epoch": 2550} {"train_loss": -43.168365478515625, "global_step": 308612, "epoch": 2550} {"train_loss": -42.9360466003418, "global_step": 308613, "epoch": 2550} {"train_loss": -43.05830383300781, "global_step": 308614, "epoch": 2550} {"train_loss": -43.222110748291016, "global_step": 308615, "epoch": 2550} {"train_loss": -42.149192810058594, "global_step": 308616, "epoch": 2550} {"train_loss": -43.07809066772461, "global_step": 308617, "epoch": 2550} {"train_loss": -41.28631591796875, "global_step": 308618, "epoch": 2550} {"train_loss": -40.973663330078125, "global_step": 308619, "epoch": 2550} {"train_loss": -38.80704879760742, "global_step": 308620, "epoch": 2550} {"train_loss": -38.20208740234375, "global_step": 308621, "epoch": 2550} {"train_loss": -41.676265716552734, "global_step": 308622, "epoch": 2550} {"train_loss": -42.51123046875, "global_step": 308623, "epoch": 2550} {"train_loss": -40.37014389038086, "global_step": 308624, "epoch": 2550} {"train_loss": -39.61399459838867, "global_step": 308625, "epoch": 2550} {"train_loss": -42.39318084716797, "global_step": 308626, "epoch": 2550} {"train_loss": -42.459259033203125, "global_step": 308627, "epoch": 2550} {"train_loss": -38.73088455200195, "global_step": 308628, "epoch": 2550} {"train_loss": -37.57802200317383, "global_step": 308629, "epoch": 2550} {"train_loss": -41.93655014038086, "global_step": 308630, "epoch": 2550} {"train_loss": -38.0003662109375, "global_step": 308631, "epoch": 2550} {"train_loss": -33.772560119628906, "global_step": 308632, "epoch": 2550} {"train_loss": -41.59963607788086, "global_step": 308633, "epoch": 2550} {"train_loss": -37.9543342590332, "global_step": 308634, "epoch": 2550} {"train_loss": -36.962825775146484, "global_step": 308635, "epoch": 2550} {"train_loss": -41.45032501220703, "global_step": 308636, "epoch": 2550} {"train_loss": -37.34212875366211, "global_step": 308637, "epoch": 2550} {"train_loss": -40.31119918823242, "global_step": 308638, "epoch": 2550} {"train_loss": -36.63869857788086, "global_step": 308639, "epoch": 2550} {"train_loss": -38.3697509765625, "global_step": 308640, "epoch": 2550} {"train_loss": -38.963417053222656, "global_step": 308641, "epoch": 2550} {"train_loss": -38.725074768066406, "global_step": 308642, "epoch": 2550} {"train_loss": -41.74365997314453, "global_step": 308643, "epoch": 2550} {"train_loss": -38.58358383178711, "global_step": 308644, "epoch": 2550} {"train_loss": -42.05339050292969, "global_step": 308645, "epoch": 2550} {"train_loss": -39.52523422241211, "global_step": 308646, "epoch": 2550} {"train_loss": -41.492000579833984, "global_step": 308647, "epoch": 2550} {"train_loss": -39.04274368286133, "global_step": 308648, "epoch": 2550} {"train_loss": -41.747406005859375, "global_step": 308649, "epoch": 2550} {"train_loss": -40.06608963012695, "global_step": 308650, "epoch": 2550} {"train_loss": -41.2948112487793, "global_step": 308651, "epoch": 2550} {"train_loss": -40.193511962890625, "global_step": 308652, "epoch": 2550} {"train_loss": -41.900413513183594, "global_step": 308653, "epoch": 2550} {"train_loss": -40.80045700073242, "global_step": 308654, "epoch": 2550} {"train_loss": -41.77524185180664, "global_step": 308655, "epoch": 2550} {"train_loss": -40.74752426147461, "global_step": 308656, "epoch": 2550} {"train_loss": -41.74895477294922, "global_step": 308657, "epoch": 2550} {"train_loss": -41.07916259765625, "global_step": 308658, "epoch": 2550} {"train_loss": -42.53962707519531, "global_step": 308659, "epoch": 2550} {"train_loss": -41.85490036010742, "global_step": 308660, "epoch": 2550} {"train_loss": -41.85302734375, "global_step": 308661, "epoch": 2550} {"train_loss": -42.184356689453125, "global_step": 308662, "epoch": 2550} {"train_loss": -41.598426818847656, "global_step": 308663, "epoch": 2550} {"train_loss": -41.390342712402344, "global_step": 308664, "epoch": 2550} {"train_loss": -42.119529724121094, "global_step": 308665, "epoch": 2550} {"train_loss": -42.37853240966797, "global_step": 308666, "epoch": 2550} {"train_loss": -42.14070129394531, "global_step": 308667, "epoch": 2550} {"train_loss": -42.470035552978516, "global_step": 308668, "epoch": 2550} {"train_loss": -40.48300552368164, "global_step": 308669, "epoch": 2550} {"train_loss": -41.55381825344622, "global_step": 308670, "epoch": 2550, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 0.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 0.9545454545454546, "val_loss": 2988936.75} {"train_loss": -42.49784851074219, "global_step": 308671, "epoch": 2551} {"train_loss": -42.8969841003418, "global_step": 308672, "epoch": 2551} {"train_loss": -41.44379806518555, "global_step": 308673, "epoch": 2551} {"train_loss": -41.56499099731445, "global_step": 308674, "epoch": 2551} {"train_loss": -42.24870681762695, "global_step": 308675, "epoch": 2551} {"train_loss": -42.26521301269531, "global_step": 308676, "epoch": 2551} {"train_loss": -42.7276496887207, "global_step": 308677, "epoch": 2551} {"train_loss": -41.73726272583008, "global_step": 308678, "epoch": 2551} {"train_loss": -42.73933792114258, "global_step": 308679, "epoch": 2551} {"train_loss": -42.73464584350586, "global_step": 308680, "epoch": 2551} {"train_loss": -41.56458282470703, "global_step": 308681, "epoch": 2551} {"train_loss": -42.94519805908203, "global_step": 308682, "epoch": 2551} {"train_loss": -42.18977355957031, "global_step": 308683, "epoch": 2551} {"train_loss": -42.64497756958008, "global_step": 308684, "epoch": 2551} {"train_loss": -42.67643356323242, "global_step": 308685, "epoch": 2551} {"train_loss": -42.86834716796875, "global_step": 308686, "epoch": 2551} {"train_loss": -42.984405517578125, "global_step": 308687, "epoch": 2551} {"train_loss": -43.024803161621094, "global_step": 308688, "epoch": 2551} {"train_loss": -43.41498947143555, "global_step": 308689, "epoch": 2551} {"train_loss": -43.34543991088867, "global_step": 308690, "epoch": 2551} {"train_loss": -42.923736572265625, "global_step": 308691, "epoch": 2551} {"train_loss": -43.53875732421875, "global_step": 308692, "epoch": 2551} {"train_loss": -42.81901931762695, "global_step": 308693, "epoch": 2551} {"train_loss": -43.295230865478516, "global_step": 308694, "epoch": 2551} {"train_loss": -43.30834197998047, "global_step": 308695, "epoch": 2551} {"train_loss": -43.56450653076172, "global_step": 308696, "epoch": 2551} {"train_loss": -43.5457763671875, "global_step": 308697, "epoch": 2551} {"train_loss": -43.5657958984375, "global_step": 308698, "epoch": 2551} {"train_loss": -43.101043701171875, "global_step": 308699, "epoch": 2551} {"train_loss": -43.17582321166992, "global_step": 308700, "epoch": 2551} {"train_loss": -43.90810775756836, "global_step": 308701, "epoch": 2551} {"train_loss": -43.505340576171875, "global_step": 308702, "epoch": 2551} {"train_loss": -43.78034210205078, "global_step": 308703, "epoch": 2551} {"train_loss": -43.28749465942383, "global_step": 308704, "epoch": 2551} {"train_loss": -43.77373504638672, "global_step": 308705, "epoch": 2551} {"train_loss": -43.3009033203125, "global_step": 308706, "epoch": 2551} {"train_loss": -43.55649948120117, "global_step": 308707, "epoch": 2551} {"train_loss": -43.1866340637207, "global_step": 308708, "epoch": 2551} {"train_loss": -43.70305252075195, "global_step": 308709, "epoch": 2551} {"train_loss": -42.90684127807617, "global_step": 308710, "epoch": 2551} {"train_loss": -43.70564651489258, "global_step": 308711, "epoch": 2551} {"train_loss": -43.7164421081543, "global_step": 308712, "epoch": 2551} {"train_loss": -43.7265739440918, "global_step": 308713, "epoch": 2551} {"train_loss": -44.08315658569336, "global_step": 308714, "epoch": 2551} {"train_loss": -43.59188461303711, "global_step": 308715, "epoch": 2551} {"train_loss": -43.70901107788086, "global_step": 308716, "epoch": 2551} {"train_loss": -43.66779708862305, "global_step": 308717, "epoch": 2551} {"train_loss": -43.927791595458984, "global_step": 308718, "epoch": 2551} {"train_loss": -43.668983459472656, "global_step": 308719, "epoch": 2551} {"train_loss": -43.56795883178711, "global_step": 308720, "epoch": 2551} {"train_loss": -43.61351013183594, "global_step": 308721, "epoch": 2551} {"train_loss": -43.780967712402344, "global_step": 308722, "epoch": 2551} {"train_loss": -43.3217887878418, "global_step": 308723, "epoch": 2551} {"train_loss": -43.68598556518555, "global_step": 308724, "epoch": 2551} {"train_loss": -43.489200592041016, "global_step": 308725, "epoch": 2551} {"train_loss": -43.5408821105957, "global_step": 308726, "epoch": 2551} {"train_loss": -43.54835891723633, "global_step": 308727, "epoch": 2551} {"train_loss": -43.49542236328125, "global_step": 308728, "epoch": 2551} {"train_loss": -43.804046630859375, "global_step": 308729, "epoch": 2551} {"train_loss": -43.54719543457031, "global_step": 308730, "epoch": 2551} {"train_loss": -43.81356430053711, "global_step": 308731, "epoch": 2551} {"train_loss": -41.772220611572266, "global_step": 308732, "epoch": 2551} {"train_loss": -43.33889389038086, "global_step": 308733, "epoch": 2551} {"train_loss": -43.620277404785156, "global_step": 308734, "epoch": 2551} {"train_loss": -43.52228927612305, "global_step": 308735, "epoch": 2551} {"train_loss": -42.33283615112305, "global_step": 308736, "epoch": 2551} {"train_loss": -43.536956787109375, "global_step": 308737, "epoch": 2551} {"train_loss": -43.52253341674805, "global_step": 308738, "epoch": 2551} {"train_loss": -42.4514274597168, "global_step": 308739, "epoch": 2551} {"train_loss": -43.32651901245117, "global_step": 308740, "epoch": 2551} {"train_loss": -43.494319915771484, "global_step": 308741, "epoch": 2551} {"train_loss": -38.43425369262695, "global_step": 308742, "epoch": 2551} {"train_loss": -43.83534622192383, "global_step": 308743, "epoch": 2551} {"train_loss": -43.66394805908203, "global_step": 308744, "epoch": 2551} {"train_loss": -42.32571029663086, "global_step": 308745, "epoch": 2551} {"train_loss": -43.07105255126953, "global_step": 308746, "epoch": 2551} {"train_loss": -42.20584487915039, "global_step": 308747, "epoch": 2551} {"train_loss": -38.56129837036133, "global_step": 308748, "epoch": 2551} {"train_loss": -42.73625183105469, "global_step": 308749, "epoch": 2551} {"train_loss": -41.56999969482422, "global_step": 308750, "epoch": 2551} {"train_loss": -40.297969818115234, "global_step": 308751, "epoch": 2551} {"train_loss": -38.74152755737305, "global_step": 308752, "epoch": 2551} {"train_loss": -38.45296096801758, "global_step": 308753, "epoch": 2551} {"train_loss": -39.595706939697266, "global_step": 308754, "epoch": 2551} {"train_loss": -39.96272659301758, "global_step": 308755, "epoch": 2551} {"train_loss": -39.435420989990234, "global_step": 308756, "epoch": 2551} {"train_loss": -42.13962936401367, "global_step": 308757, "epoch": 2551} {"train_loss": -36.76716232299805, "global_step": 308758, "epoch": 2551} {"train_loss": -41.00899124145508, "global_step": 308759, "epoch": 2551} {"train_loss": -41.30145263671875, "global_step": 308760, "epoch": 2551} {"train_loss": -40.4865837097168, "global_step": 308761, "epoch": 2551} {"train_loss": -40.68762969970703, "global_step": 308762, "epoch": 2551} {"train_loss": -40.11068344116211, "global_step": 308763, "epoch": 2551} {"train_loss": -41.8448486328125, "global_step": 308764, "epoch": 2551} {"train_loss": -40.253814697265625, "global_step": 308765, "epoch": 2551} {"train_loss": -39.775333404541016, "global_step": 308766, "epoch": 2551} {"train_loss": -40.753292083740234, "global_step": 308767, "epoch": 2551} {"train_loss": -41.10274887084961, "global_step": 308768, "epoch": 2551} {"train_loss": -38.6994743347168, "global_step": 308769, "epoch": 2551} {"train_loss": -41.0416374206543, "global_step": 308770, "epoch": 2551} {"train_loss": -39.011444091796875, "global_step": 308771, "epoch": 2551} {"train_loss": -40.32989501953125, "global_step": 308772, "epoch": 2551} {"train_loss": -40.87152099609375, "global_step": 308773, "epoch": 2551} {"train_loss": -41.37801742553711, "global_step": 308774, "epoch": 2551} {"train_loss": -41.41605758666992, "global_step": 308775, "epoch": 2551} {"train_loss": -40.51382064819336, "global_step": 308776, "epoch": 2551} {"train_loss": -41.037567138671875, "global_step": 308777, "epoch": 2551} {"train_loss": -42.00704574584961, "global_step": 308778, "epoch": 2551} {"train_loss": -41.284908294677734, "global_step": 308779, "epoch": 2551} {"train_loss": -42.22550582885742, "global_step": 308780, "epoch": 2551} {"train_loss": -42.156471252441406, "global_step": 308781, "epoch": 2551} {"train_loss": -42.3917236328125, "global_step": 308782, "epoch": 2551} {"train_loss": -40.966243743896484, "global_step": 308783, "epoch": 2551} {"train_loss": -42.562782287597656, "global_step": 308784, "epoch": 2551} {"train_loss": -41.646480560302734, "global_step": 308785, "epoch": 2551} {"train_loss": -42.40925216674805, "global_step": 308786, "epoch": 2551} {"train_loss": -42.42329788208008, "global_step": 308787, "epoch": 2551} {"train_loss": -42.641353607177734, "global_step": 308788, "epoch": 2551} {"train_loss": -42.58472442626953, "global_step": 308789, "epoch": 2551} {"train_loss": -41.603511810302734, "global_step": 308790, "epoch": 2551} {"train_loss": -42.29812719802226, "global_step": 308791, "epoch": 2551, "val_loss": 2670384.0} {"train_loss": -42.38075637817383, "global_step": 308792, "epoch": 2552} {"train_loss": -42.56759262084961, "global_step": 308793, "epoch": 2552} {"train_loss": -41.47854232788086, "global_step": 308794, "epoch": 2552} {"train_loss": -42.72663497924805, "global_step": 308795, "epoch": 2552} {"train_loss": -41.913509368896484, "global_step": 308796, "epoch": 2552} {"train_loss": -42.944732666015625, "global_step": 308797, "epoch": 2552} {"train_loss": -42.748565673828125, "global_step": 308798, "epoch": 2552} {"train_loss": -42.72445297241211, "global_step": 308799, "epoch": 2552} {"train_loss": -42.82886505126953, "global_step": 308800, "epoch": 2552} {"train_loss": -42.98463821411133, "global_step": 308801, "epoch": 2552} {"train_loss": -42.496192932128906, "global_step": 308802, "epoch": 2552} {"train_loss": -42.67123031616211, "global_step": 308803, "epoch": 2552} {"train_loss": -42.428436279296875, "global_step": 308804, "epoch": 2552} {"train_loss": -42.7099609375, "global_step": 308805, "epoch": 2552} {"train_loss": -42.988075256347656, "global_step": 308806, "epoch": 2552} {"train_loss": -43.04445266723633, "global_step": 308807, "epoch": 2552} {"train_loss": -42.52747344970703, "global_step": 308808, "epoch": 2552} {"train_loss": -43.60360336303711, "global_step": 308809, "epoch": 2552} {"train_loss": -42.767845153808594, "global_step": 308810, "epoch": 2552} {"train_loss": -43.540626525878906, "global_step": 308811, "epoch": 2552} {"train_loss": -42.7808952331543, "global_step": 308812, "epoch": 2552} {"train_loss": -43.02434158325195, "global_step": 308813, "epoch": 2552} {"train_loss": -43.150386810302734, "global_step": 308814, "epoch": 2552} {"train_loss": -43.15024948120117, "global_step": 308815, "epoch": 2552} {"train_loss": -43.42475128173828, "global_step": 308816, "epoch": 2552} {"train_loss": -42.87580871582031, "global_step": 308817, "epoch": 2552} {"train_loss": -43.13752746582031, "global_step": 308818, "epoch": 2552} {"train_loss": -42.77874755859375, "global_step": 308819, "epoch": 2552} {"train_loss": -43.34128952026367, "global_step": 308820, "epoch": 2552} {"train_loss": -43.35445022583008, "global_step": 308821, "epoch": 2552} {"train_loss": -43.4724006652832, "global_step": 308822, "epoch": 2552} {"train_loss": -43.57794952392578, "global_step": 308823, "epoch": 2552} {"train_loss": -43.34075927734375, "global_step": 308824, "epoch": 2552} {"train_loss": -43.19799041748047, "global_step": 308825, "epoch": 2552} {"train_loss": -43.87116241455078, "global_step": 308826, "epoch": 2552} {"train_loss": -43.5157470703125, "global_step": 308827, "epoch": 2552} {"train_loss": -43.254974365234375, "global_step": 308828, "epoch": 2552} {"train_loss": -42.87272262573242, "global_step": 308829, "epoch": 2552} {"train_loss": -43.00819778442383, "global_step": 308830, "epoch": 2552} {"train_loss": -43.1574821472168, "global_step": 308831, "epoch": 2552} {"train_loss": -43.39863586425781, "global_step": 308832, "epoch": 2552} {"train_loss": -43.87388229370117, "global_step": 308833, "epoch": 2552} {"train_loss": -43.10841751098633, "global_step": 308834, "epoch": 2552} {"train_loss": -44.12321853637695, "global_step": 308835, "epoch": 2552} {"train_loss": -43.19627380371094, "global_step": 308836, "epoch": 2552} {"train_loss": -43.237972259521484, "global_step": 308837, "epoch": 2552} {"train_loss": -43.22944259643555, "global_step": 308838, "epoch": 2552} {"train_loss": -43.852874755859375, "global_step": 308839, "epoch": 2552} {"train_loss": -43.26311111450195, "global_step": 308840, "epoch": 2552} {"train_loss": -43.23649597167969, "global_step": 308841, "epoch": 2552} {"train_loss": -43.67892074584961, "global_step": 308842, "epoch": 2552} {"train_loss": -44.23810958862305, "global_step": 308843, "epoch": 2552} {"train_loss": -43.55257797241211, "global_step": 308844, "epoch": 2552} {"train_loss": -43.09890365600586, "global_step": 308845, "epoch": 2552} {"train_loss": -40.56513214111328, "global_step": 308846, "epoch": 2552} {"train_loss": -42.97127151489258, "global_step": 308847, "epoch": 2552} {"train_loss": -42.97066116333008, "global_step": 308848, "epoch": 2552} {"train_loss": -43.0966682434082, "global_step": 308849, "epoch": 2552} {"train_loss": -43.3607063293457, "global_step": 308850, "epoch": 2552} {"train_loss": -43.75705337524414, "global_step": 308851, "epoch": 2552} {"train_loss": -39.8271369934082, "global_step": 308852, "epoch": 2552} {"train_loss": -41.09782409667969, "global_step": 308853, "epoch": 2552} {"train_loss": -38.42622375488281, "global_step": 308854, "epoch": 2552} {"train_loss": -42.49502944946289, "global_step": 308855, "epoch": 2552} {"train_loss": -42.96453857421875, "global_step": 308856, "epoch": 2552} {"train_loss": -43.381832122802734, "global_step": 308857, "epoch": 2552} {"train_loss": -42.606319427490234, "global_step": 308858, "epoch": 2552} {"train_loss": -42.75016403198242, "global_step": 308859, "epoch": 2552} {"train_loss": -42.228206634521484, "global_step": 308860, "epoch": 2552} {"train_loss": -43.91982650756836, "global_step": 308861, "epoch": 2552} {"train_loss": -42.80691146850586, "global_step": 308862, "epoch": 2552} {"train_loss": -43.29642868041992, "global_step": 308863, "epoch": 2552} {"train_loss": -43.092952728271484, "global_step": 308864, "epoch": 2552} {"train_loss": -42.85980224609375, "global_step": 308865, "epoch": 2552} {"train_loss": -43.58806228637695, "global_step": 308866, "epoch": 2552} {"train_loss": -43.221920013427734, "global_step": 308867, "epoch": 2552} {"train_loss": -37.9775505065918, "global_step": 308868, "epoch": 2552} {"train_loss": -43.078041076660156, "global_step": 308869, "epoch": 2552} {"train_loss": -42.7439079284668, "global_step": 308870, "epoch": 2552} {"train_loss": -42.614986419677734, "global_step": 308871, "epoch": 2552} {"train_loss": -42.445526123046875, "global_step": 308872, "epoch": 2552} {"train_loss": -42.744781494140625, "global_step": 308873, "epoch": 2552} {"train_loss": -42.54132843017578, "global_step": 308874, "epoch": 2552} {"train_loss": -43.27852249145508, "global_step": 308875, "epoch": 2552} {"train_loss": -42.058509826660156, "global_step": 308876, "epoch": 2552} {"train_loss": -41.515533447265625, "global_step": 308877, "epoch": 2552} {"train_loss": -43.29230880737305, "global_step": 308878, "epoch": 2552} {"train_loss": -37.2275505065918, "global_step": 308879, "epoch": 2552} {"train_loss": -43.56028747558594, "global_step": 308880, "epoch": 2552} {"train_loss": -42.66925811767578, "global_step": 308881, "epoch": 2552} {"train_loss": -42.6808967590332, "global_step": 308882, "epoch": 2552} {"train_loss": -43.098182678222656, "global_step": 308883, "epoch": 2552} {"train_loss": -41.92095947265625, "global_step": 308884, "epoch": 2552} {"train_loss": -43.36348342895508, "global_step": 308885, "epoch": 2552} {"train_loss": -42.566505432128906, "global_step": 308886, "epoch": 2552} {"train_loss": -43.3554801940918, "global_step": 308887, "epoch": 2552} {"train_loss": -43.09298324584961, "global_step": 308888, "epoch": 2552} {"train_loss": -43.611602783203125, "global_step": 308889, "epoch": 2552} {"train_loss": -40.430843353271484, "global_step": 308890, "epoch": 2552} {"train_loss": -42.00492477416992, "global_step": 308891, "epoch": 2552} {"train_loss": -42.073341369628906, "global_step": 308892, "epoch": 2552} {"train_loss": -43.65983200073242, "global_step": 308893, "epoch": 2552} {"train_loss": -41.76905822753906, "global_step": 308894, "epoch": 2552} {"train_loss": -42.19976806640625, "global_step": 308895, "epoch": 2552} {"train_loss": -42.88434982299805, "global_step": 308896, "epoch": 2552} {"train_loss": -43.15290451049805, "global_step": 308897, "epoch": 2552} {"train_loss": -43.4976692199707, "global_step": 308898, "epoch": 2552} {"train_loss": -41.45975112915039, "global_step": 308899, "epoch": 2552} {"train_loss": -41.54924392700195, "global_step": 308900, "epoch": 2552} {"train_loss": -41.5863151550293, "global_step": 308901, "epoch": 2552} {"train_loss": -43.64915466308594, "global_step": 308902, "epoch": 2552} {"train_loss": -41.54337692260742, "global_step": 308903, "epoch": 2552} {"train_loss": -43.60067367553711, "global_step": 308904, "epoch": 2552} {"train_loss": -42.1209716796875, "global_step": 308905, "epoch": 2552} {"train_loss": -42.31109619140625, "global_step": 308906, "epoch": 2552} {"train_loss": -41.25063705444336, "global_step": 308907, "epoch": 2552} {"train_loss": -42.896331787109375, "global_step": 308908, "epoch": 2552} {"train_loss": -42.628475189208984, "global_step": 308909, "epoch": 2552} {"train_loss": -42.606441497802734, "global_step": 308910, "epoch": 2552} {"train_loss": -43.31864929199219, "global_step": 308911, "epoch": 2552} {"train_loss": -42.72675143785713, "global_step": 308912, "epoch": 2552, "val_loss": 3087838.25} {"train_loss": -42.12961959838867, "global_step": 308913, "epoch": 2553} {"train_loss": -42.32569885253906, "global_step": 308914, "epoch": 2553} {"train_loss": -43.1505241394043, "global_step": 308915, "epoch": 2553} {"train_loss": -43.48655700683594, "global_step": 308916, "epoch": 2553} {"train_loss": -43.13397216796875, "global_step": 308917, "epoch": 2553} {"train_loss": -42.82050704956055, "global_step": 308918, "epoch": 2553} {"train_loss": -40.63138961791992, "global_step": 308919, "epoch": 2553} {"train_loss": -42.0782585144043, "global_step": 308920, "epoch": 2553} {"train_loss": -40.876556396484375, "global_step": 308921, "epoch": 2553} {"train_loss": -43.144386291503906, "global_step": 308922, "epoch": 2553} {"train_loss": -43.28766632080078, "global_step": 308923, "epoch": 2553} {"train_loss": -43.150691986083984, "global_step": 308924, "epoch": 2553} {"train_loss": -42.972259521484375, "global_step": 308925, "epoch": 2553} {"train_loss": -41.10120391845703, "global_step": 308926, "epoch": 2553} {"train_loss": -40.84204864501953, "global_step": 308927, "epoch": 2553} {"train_loss": -43.60322189331055, "global_step": 308928, "epoch": 2553} {"train_loss": -42.9233283996582, "global_step": 308929, "epoch": 2553} {"train_loss": -41.57133865356445, "global_step": 308930, "epoch": 2553} {"train_loss": -41.87214279174805, "global_step": 308931, "epoch": 2553} {"train_loss": -41.9586067199707, "global_step": 308932, "epoch": 2553} {"train_loss": -42.71136474609375, "global_step": 308933, "epoch": 2553} {"train_loss": -43.16661834716797, "global_step": 308934, "epoch": 2553} {"train_loss": -42.60997772216797, "global_step": 308935, "epoch": 2553} {"train_loss": -40.3599739074707, "global_step": 308936, "epoch": 2553} {"train_loss": -40.720035552978516, "global_step": 308937, "epoch": 2553} {"train_loss": -42.07297897338867, "global_step": 308938, "epoch": 2553} {"train_loss": -42.427364349365234, "global_step": 308939, "epoch": 2553} {"train_loss": -41.52566146850586, "global_step": 308940, "epoch": 2553} {"train_loss": -41.555755615234375, "global_step": 308941, "epoch": 2553} {"train_loss": -42.94234085083008, "global_step": 308942, "epoch": 2553} {"train_loss": -40.8134880065918, "global_step": 308943, "epoch": 2553} {"train_loss": -42.279754638671875, "global_step": 308944, "epoch": 2553} {"train_loss": -40.8723258972168, "global_step": 308945, "epoch": 2553} {"train_loss": -42.74154281616211, "global_step": 308946, "epoch": 2553} {"train_loss": -42.7270622253418, "global_step": 308947, "epoch": 2553} {"train_loss": -43.28873062133789, "global_step": 308948, "epoch": 2553} {"train_loss": -42.15993881225586, "global_step": 308949, "epoch": 2553} {"train_loss": -42.66169357299805, "global_step": 308950, "epoch": 2553} {"train_loss": -42.87921905517578, "global_step": 308951, "epoch": 2553} {"train_loss": -42.88707733154297, "global_step": 308952, "epoch": 2553} {"train_loss": -42.280433654785156, "global_step": 308953, "epoch": 2553} {"train_loss": -42.786590576171875, "global_step": 308954, "epoch": 2553} {"train_loss": -40.46935272216797, "global_step": 308955, "epoch": 2553} {"train_loss": -42.86149215698242, "global_step": 308956, "epoch": 2553} {"train_loss": -42.55422592163086, "global_step": 308957, "epoch": 2553} {"train_loss": -40.474853515625, "global_step": 308958, "epoch": 2553} {"train_loss": -43.18104934692383, "global_step": 308959, "epoch": 2553} {"train_loss": -43.20453643798828, "global_step": 308960, "epoch": 2553} {"train_loss": -40.93368148803711, "global_step": 308961, "epoch": 2553} {"train_loss": -41.942440032958984, "global_step": 308962, "epoch": 2553} {"train_loss": -42.03693389892578, "global_step": 308963, "epoch": 2553} {"train_loss": -42.36663818359375, "global_step": 308964, "epoch": 2553} {"train_loss": -43.04292297363281, "global_step": 308965, "epoch": 2553} {"train_loss": -40.86100387573242, "global_step": 308966, "epoch": 2553} {"train_loss": -43.03749465942383, "global_step": 308967, "epoch": 2553} {"train_loss": -42.15732955932617, "global_step": 308968, "epoch": 2553} {"train_loss": -42.96563720703125, "global_step": 308969, "epoch": 2553} {"train_loss": -42.78385925292969, "global_step": 308970, "epoch": 2553} {"train_loss": -42.434547424316406, "global_step": 308971, "epoch": 2553} {"train_loss": -43.2479362487793, "global_step": 308972, "epoch": 2553} {"train_loss": -42.617095947265625, "global_step": 308973, "epoch": 2553} {"train_loss": -42.46458435058594, "global_step": 308974, "epoch": 2553} {"train_loss": -41.5732307434082, "global_step": 308975, "epoch": 2553} {"train_loss": -42.77088165283203, "global_step": 308976, "epoch": 2553} {"train_loss": -42.20563888549805, "global_step": 308977, "epoch": 2553} {"train_loss": -43.640010833740234, "global_step": 308978, "epoch": 2553} {"train_loss": -42.98727035522461, "global_step": 308979, "epoch": 2553} {"train_loss": -43.1307487487793, "global_step": 308980, "epoch": 2553} {"train_loss": -42.64105224609375, "global_step": 308981, "epoch": 2553} {"train_loss": -43.6809196472168, "global_step": 308982, "epoch": 2553} {"train_loss": -43.2213020324707, "global_step": 308983, "epoch": 2553} {"train_loss": -42.244930267333984, "global_step": 308984, "epoch": 2553} {"train_loss": -43.60495376586914, "global_step": 308985, "epoch": 2553} {"train_loss": -42.7718505859375, "global_step": 308986, "epoch": 2553} {"train_loss": -42.9296760559082, "global_step": 308987, "epoch": 2553} {"train_loss": -42.99459457397461, "global_step": 308988, "epoch": 2553} {"train_loss": -43.29507064819336, "global_step": 308989, "epoch": 2553} {"train_loss": -43.21323776245117, "global_step": 308990, "epoch": 2553} {"train_loss": -42.403465270996094, "global_step": 308991, "epoch": 2553} {"train_loss": -41.6470947265625, "global_step": 308992, "epoch": 2553} {"train_loss": -42.12834167480469, "global_step": 308993, "epoch": 2553} {"train_loss": -43.15301513671875, "global_step": 308994, "epoch": 2553} {"train_loss": -42.310638427734375, "global_step": 308995, "epoch": 2553} {"train_loss": -42.477108001708984, "global_step": 308996, "epoch": 2553} {"train_loss": -42.904754638671875, "global_step": 308997, "epoch": 2553} {"train_loss": -43.12974166870117, "global_step": 308998, "epoch": 2553} {"train_loss": -43.1735954284668, "global_step": 308999, "epoch": 2553} {"train_loss": -43.025630950927734, "global_step": 309000, "epoch": 2553} {"train_loss": -43.492347717285156, "global_step": 309001, "epoch": 2553} {"train_loss": -43.68716812133789, "global_step": 309002, "epoch": 2553} {"train_loss": -43.905696868896484, "global_step": 309003, "epoch": 2553} {"train_loss": -43.34624481201172, "global_step": 309004, "epoch": 2553} {"train_loss": -43.18571853637695, "global_step": 309005, "epoch": 2553} {"train_loss": -44.050941467285156, "global_step": 309006, "epoch": 2553} {"train_loss": -43.288639068603516, "global_step": 309007, "epoch": 2553} {"train_loss": -42.900150299072266, "global_step": 309008, "epoch": 2553} {"train_loss": -42.390625, "global_step": 309009, "epoch": 2553} {"train_loss": -42.53227233886719, "global_step": 309010, "epoch": 2553} {"train_loss": -43.10374069213867, "global_step": 309011, "epoch": 2553} {"train_loss": -41.23210144042969, "global_step": 309012, "epoch": 2553} {"train_loss": -41.44126510620117, "global_step": 309013, "epoch": 2553} {"train_loss": -42.8267707824707, "global_step": 309014, "epoch": 2553} {"train_loss": -42.12596893310547, "global_step": 309015, "epoch": 2553} {"train_loss": -41.24116897583008, "global_step": 309016, "epoch": 2553} {"train_loss": -41.55048370361328, "global_step": 309017, "epoch": 2553} {"train_loss": -41.52766036987305, "global_step": 309018, "epoch": 2553} {"train_loss": -42.20328903198242, "global_step": 309019, "epoch": 2553} {"train_loss": -42.91592788696289, "global_step": 309020, "epoch": 2553} {"train_loss": -42.540016174316406, "global_step": 309021, "epoch": 2553} {"train_loss": -42.03851318359375, "global_step": 309022, "epoch": 2553} {"train_loss": -42.45464324951172, "global_step": 309023, "epoch": 2553} {"train_loss": -42.982177734375, "global_step": 309024, "epoch": 2553} {"train_loss": -41.36787796020508, "global_step": 309025, "epoch": 2553} {"train_loss": -41.8842658996582, "global_step": 309026, "epoch": 2553} {"train_loss": -42.14779281616211, "global_step": 309027, "epoch": 2553} {"train_loss": -43.52283477783203, "global_step": 309028, "epoch": 2553} {"train_loss": -41.703887939453125, "global_step": 309029, "epoch": 2553} {"train_loss": -42.775909423828125, "global_step": 309030, "epoch": 2553} {"train_loss": -43.217529296875, "global_step": 309031, "epoch": 2553} {"train_loss": -41.13276672363281, "global_step": 309032, "epoch": 2553} {"train_loss": -42.462203506595834, "global_step": 309033, "epoch": 2553, "val_loss": 2834806.0} {"train_loss": -42.898155212402344, "global_step": 309034, "epoch": 2554} {"train_loss": -43.04994583129883, "global_step": 309035, "epoch": 2554} {"train_loss": -42.69507598876953, "global_step": 309036, "epoch": 2554} {"train_loss": -42.3612174987793, "global_step": 309037, "epoch": 2554} {"train_loss": -43.0772590637207, "global_step": 309038, "epoch": 2554} {"train_loss": -43.10591506958008, "global_step": 309039, "epoch": 2554} {"train_loss": -42.464447021484375, "global_step": 309040, "epoch": 2554} {"train_loss": -43.60121154785156, "global_step": 309041, "epoch": 2554} {"train_loss": -42.47385787963867, "global_step": 309042, "epoch": 2554} {"train_loss": -43.79655838012695, "global_step": 309043, "epoch": 2554} {"train_loss": -43.24127197265625, "global_step": 309044, "epoch": 2554} {"train_loss": -42.779964447021484, "global_step": 309045, "epoch": 2554} {"train_loss": -42.91606903076172, "global_step": 309046, "epoch": 2554} {"train_loss": -42.512935638427734, "global_step": 309047, "epoch": 2554} {"train_loss": -42.595699310302734, "global_step": 309048, "epoch": 2554} {"train_loss": -43.877532958984375, "global_step": 309049, "epoch": 2554} {"train_loss": -42.99796676635742, "global_step": 309050, "epoch": 2554} {"train_loss": -43.4503059387207, "global_step": 309051, "epoch": 2554} {"train_loss": -42.83772659301758, "global_step": 309052, "epoch": 2554} {"train_loss": -43.8628044128418, "global_step": 309053, "epoch": 2554} {"train_loss": -43.27383804321289, "global_step": 309054, "epoch": 2554} {"train_loss": -43.62266159057617, "global_step": 309055, "epoch": 2554} {"train_loss": -43.46522903442383, "global_step": 309056, "epoch": 2554} {"train_loss": -43.11279296875, "global_step": 309057, "epoch": 2554} {"train_loss": -43.54258346557617, "global_step": 309058, "epoch": 2554} {"train_loss": -43.76898956298828, "global_step": 309059, "epoch": 2554} {"train_loss": -43.58414077758789, "global_step": 309060, "epoch": 2554} {"train_loss": -43.60316848754883, "global_step": 309061, "epoch": 2554} {"train_loss": -43.49180221557617, "global_step": 309062, "epoch": 2554} {"train_loss": -43.43766784667969, "global_step": 309063, "epoch": 2554} {"train_loss": -42.55712890625, "global_step": 309064, "epoch": 2554} {"train_loss": -43.21779251098633, "global_step": 309065, "epoch": 2554} {"train_loss": -43.30953598022461, "global_step": 309066, "epoch": 2554} {"train_loss": -43.48554611206055, "global_step": 309067, "epoch": 2554} {"train_loss": -43.12639617919922, "global_step": 309068, "epoch": 2554} {"train_loss": -43.637176513671875, "global_step": 309069, "epoch": 2554} {"train_loss": -43.0329475402832, "global_step": 309070, "epoch": 2554} {"train_loss": -42.9880485534668, "global_step": 309071, "epoch": 2554} {"train_loss": -42.66646957397461, "global_step": 309072, "epoch": 2554} {"train_loss": -43.757728576660156, "global_step": 309073, "epoch": 2554} {"train_loss": -43.39170455932617, "global_step": 309074, "epoch": 2554} {"train_loss": -42.49665832519531, "global_step": 309075, "epoch": 2554} {"train_loss": -43.283485412597656, "global_step": 309076, "epoch": 2554} {"train_loss": -43.53721237182617, "global_step": 309077, "epoch": 2554} {"train_loss": -40.71181869506836, "global_step": 309078, "epoch": 2554} {"train_loss": -39.581764221191406, "global_step": 309079, "epoch": 2554} {"train_loss": -42.85427474975586, "global_step": 309080, "epoch": 2554} {"train_loss": -43.45954132080078, "global_step": 309081, "epoch": 2554} {"train_loss": -40.92389678955078, "global_step": 309082, "epoch": 2554} {"train_loss": -42.31889343261719, "global_step": 309083, "epoch": 2554} {"train_loss": -43.2847785949707, "global_step": 309084, "epoch": 2554} {"train_loss": -42.020164489746094, "global_step": 309085, "epoch": 2554} {"train_loss": -42.182777404785156, "global_step": 309086, "epoch": 2554} {"train_loss": -42.194740295410156, "global_step": 309087, "epoch": 2554} {"train_loss": -43.16089630126953, "global_step": 309088, "epoch": 2554} {"train_loss": -41.880123138427734, "global_step": 309089, "epoch": 2554} {"train_loss": -41.19852828979492, "global_step": 309090, "epoch": 2554} {"train_loss": -42.272212982177734, "global_step": 309091, "epoch": 2554} {"train_loss": -42.31429672241211, "global_step": 309092, "epoch": 2554} {"train_loss": -42.12995147705078, "global_step": 309093, "epoch": 2554} {"train_loss": -41.59934997558594, "global_step": 309094, "epoch": 2554} {"train_loss": -41.41986083984375, "global_step": 309095, "epoch": 2554} {"train_loss": -41.60982894897461, "global_step": 309096, "epoch": 2554} {"train_loss": -42.7357063293457, "global_step": 309097, "epoch": 2554} {"train_loss": -42.19574737548828, "global_step": 309098, "epoch": 2554} {"train_loss": -42.39509201049805, "global_step": 309099, "epoch": 2554} {"train_loss": -42.27478790283203, "global_step": 309100, "epoch": 2554} {"train_loss": -42.38739776611328, "global_step": 309101, "epoch": 2554} {"train_loss": -42.08335494995117, "global_step": 309102, "epoch": 2554} {"train_loss": -42.5280647277832, "global_step": 309103, "epoch": 2554} {"train_loss": -42.203529357910156, "global_step": 309104, "epoch": 2554} {"train_loss": -42.74471664428711, "global_step": 309105, "epoch": 2554} {"train_loss": -41.70591735839844, "global_step": 309106, "epoch": 2554} {"train_loss": -42.90181350708008, "global_step": 309107, "epoch": 2554} {"train_loss": -42.32529830932617, "global_step": 309108, "epoch": 2554} {"train_loss": -42.51029586791992, "global_step": 309109, "epoch": 2554} {"train_loss": -42.860877990722656, "global_step": 309110, "epoch": 2554} {"train_loss": -43.585487365722656, "global_step": 309111, "epoch": 2554} {"train_loss": -43.154727935791016, "global_step": 309112, "epoch": 2554} {"train_loss": -41.97637939453125, "global_step": 309113, "epoch": 2554} {"train_loss": -42.332550048828125, "global_step": 309114, "epoch": 2554} {"train_loss": -43.14955520629883, "global_step": 309115, "epoch": 2554} {"train_loss": -43.38945388793945, "global_step": 309116, "epoch": 2554} {"train_loss": -43.34321975708008, "global_step": 309117, "epoch": 2554} {"train_loss": -43.30835723876953, "global_step": 309118, "epoch": 2554} {"train_loss": -42.86568069458008, "global_step": 309119, "epoch": 2554} {"train_loss": -43.25529479980469, "global_step": 309120, "epoch": 2554} {"train_loss": -43.48897933959961, "global_step": 309121, "epoch": 2554} {"train_loss": -43.05458450317383, "global_step": 309122, "epoch": 2554} {"train_loss": -43.61899948120117, "global_step": 309123, "epoch": 2554} {"train_loss": -43.618316650390625, "global_step": 309124, "epoch": 2554} {"train_loss": -42.260704040527344, "global_step": 309125, "epoch": 2554} {"train_loss": -43.62413024902344, "global_step": 309126, "epoch": 2554} {"train_loss": -42.72602844238281, "global_step": 309127, "epoch": 2554} {"train_loss": -44.07949447631836, "global_step": 309128, "epoch": 2554} {"train_loss": -43.626461029052734, "global_step": 309129, "epoch": 2554} {"train_loss": -43.679256439208984, "global_step": 309130, "epoch": 2554} {"train_loss": -43.85994338989258, "global_step": 309131, "epoch": 2554} {"train_loss": -43.240699768066406, "global_step": 309132, "epoch": 2554} {"train_loss": -43.66447067260742, "global_step": 309133, "epoch": 2554} {"train_loss": -44.085914611816406, "global_step": 309134, "epoch": 2554} {"train_loss": -43.660831451416016, "global_step": 309135, "epoch": 2554} {"train_loss": -43.53627395629883, "global_step": 309136, "epoch": 2554} {"train_loss": -43.271453857421875, "global_step": 309137, "epoch": 2554} {"train_loss": -43.0847282409668, "global_step": 309138, "epoch": 2554} {"train_loss": -43.814979553222656, "global_step": 309139, "epoch": 2554} {"train_loss": -43.676815032958984, "global_step": 309140, "epoch": 2554} {"train_loss": -43.594722747802734, "global_step": 309141, "epoch": 2554} {"train_loss": -43.136417388916016, "global_step": 309142, "epoch": 2554} {"train_loss": -44.08100509643555, "global_step": 309143, "epoch": 2554} {"train_loss": -43.513893127441406, "global_step": 309144, "epoch": 2554} {"train_loss": -42.8094596862793, "global_step": 309145, "epoch": 2554} {"train_loss": -43.19818878173828, "global_step": 309146, "epoch": 2554} {"train_loss": -44.12228775024414, "global_step": 309147, "epoch": 2554} {"train_loss": -43.08309555053711, "global_step": 309148, "epoch": 2554} {"train_loss": -43.2326774597168, "global_step": 309149, "epoch": 2554} {"train_loss": -43.57072067260742, "global_step": 309150, "epoch": 2554} {"train_loss": -43.865821838378906, "global_step": 309151, "epoch": 2554} {"train_loss": -43.92644119262695, "global_step": 309152, "epoch": 2554} {"train_loss": -43.160797119140625, "global_step": 309153, "epoch": 2554} {"train_loss": -42.979116613214664, "global_step": 309154, "epoch": 2554, "val_loss": 2622751.25} {"train_loss": -43.63788604736328, "global_step": 309155, "epoch": 2555} {"train_loss": -42.5631103515625, "global_step": 309156, "epoch": 2555} {"train_loss": -43.626617431640625, "global_step": 309157, "epoch": 2555} {"train_loss": -43.299964904785156, "global_step": 309158, "epoch": 2555} {"train_loss": -43.060115814208984, "global_step": 309159, "epoch": 2555} {"train_loss": -42.661643981933594, "global_step": 309160, "epoch": 2555} {"train_loss": -43.1679801940918, "global_step": 309161, "epoch": 2555} {"train_loss": -42.2015495300293, "global_step": 309162, "epoch": 2555} {"train_loss": -42.463287353515625, "global_step": 309163, "epoch": 2555} {"train_loss": -42.57693099975586, "global_step": 309164, "epoch": 2555} {"train_loss": -42.309505462646484, "global_step": 309165, "epoch": 2555} {"train_loss": -42.48474884033203, "global_step": 309166, "epoch": 2555} {"train_loss": -41.654781341552734, "global_step": 309167, "epoch": 2555} {"train_loss": -42.37651443481445, "global_step": 309168, "epoch": 2555} {"train_loss": -41.69815444946289, "global_step": 309169, "epoch": 2555} {"train_loss": -43.561180114746094, "global_step": 309170, "epoch": 2555} {"train_loss": -41.355621337890625, "global_step": 309171, "epoch": 2555} {"train_loss": -42.01251220703125, "global_step": 309172, "epoch": 2555} {"train_loss": -42.15475082397461, "global_step": 309173, "epoch": 2555} {"train_loss": -43.15958786010742, "global_step": 309174, "epoch": 2555} {"train_loss": -42.37421417236328, "global_step": 309175, "epoch": 2555} {"train_loss": -41.4547004699707, "global_step": 309176, "epoch": 2555} {"train_loss": -43.211700439453125, "global_step": 309177, "epoch": 2555} {"train_loss": -43.52274703979492, "global_step": 309178, "epoch": 2555} {"train_loss": -42.361141204833984, "global_step": 309179, "epoch": 2555} {"train_loss": -41.26700973510742, "global_step": 309180, "epoch": 2555} {"train_loss": -43.32115936279297, "global_step": 309181, "epoch": 2555} {"train_loss": -42.370521545410156, "global_step": 309182, "epoch": 2555} {"train_loss": -41.51587677001953, "global_step": 309183, "epoch": 2555} {"train_loss": -42.11946105957031, "global_step": 309184, "epoch": 2555} {"train_loss": -43.04670333862305, "global_step": 309185, "epoch": 2555} {"train_loss": -42.78802490234375, "global_step": 309186, "epoch": 2555} {"train_loss": -41.2568359375, "global_step": 309187, "epoch": 2555} {"train_loss": -41.772254943847656, "global_step": 309188, "epoch": 2555} {"train_loss": -43.0281867980957, "global_step": 309189, "epoch": 2555} {"train_loss": -42.23592758178711, "global_step": 309190, "epoch": 2555} {"train_loss": -41.875118255615234, "global_step": 309191, "epoch": 2555} {"train_loss": -43.43703079223633, "global_step": 309192, "epoch": 2555} {"train_loss": -39.99208068847656, "global_step": 309193, "epoch": 2555} {"train_loss": -40.051849365234375, "global_step": 309194, "epoch": 2555} {"train_loss": -42.563899993896484, "global_step": 309195, "epoch": 2555} {"train_loss": -37.977779388427734, "global_step": 309196, "epoch": 2555} {"train_loss": -40.803707122802734, "global_step": 309197, "epoch": 2555} {"train_loss": -41.46945571899414, "global_step": 309198, "epoch": 2555} {"train_loss": -42.131553649902344, "global_step": 309199, "epoch": 2555} {"train_loss": -41.90674591064453, "global_step": 309200, "epoch": 2555} {"train_loss": -42.5153923034668, "global_step": 309201, "epoch": 2555} {"train_loss": -41.16252517700195, "global_step": 309202, "epoch": 2555} {"train_loss": -42.021663665771484, "global_step": 309203, "epoch": 2555} {"train_loss": -42.63080978393555, "global_step": 309204, "epoch": 2555} {"train_loss": -42.58468246459961, "global_step": 309205, "epoch": 2555} {"train_loss": -42.42392349243164, "global_step": 309206, "epoch": 2555} {"train_loss": -42.4080696105957, "global_step": 309207, "epoch": 2555} {"train_loss": -42.4207763671875, "global_step": 309208, "epoch": 2555} {"train_loss": -43.00718307495117, "global_step": 309209, "epoch": 2555} {"train_loss": -42.93425369262695, "global_step": 309210, "epoch": 2555} {"train_loss": -43.45673370361328, "global_step": 309211, "epoch": 2555} {"train_loss": -42.90907669067383, "global_step": 309212, "epoch": 2555} {"train_loss": -43.823970794677734, "global_step": 309213, "epoch": 2555} {"train_loss": -43.049102783203125, "global_step": 309214, "epoch": 2555} {"train_loss": -42.82168197631836, "global_step": 309215, "epoch": 2555} {"train_loss": -43.75095748901367, "global_step": 309216, "epoch": 2555} {"train_loss": -42.82611846923828, "global_step": 309217, "epoch": 2555} {"train_loss": -43.29655838012695, "global_step": 309218, "epoch": 2555} {"train_loss": -42.92838668823242, "global_step": 309219, "epoch": 2555} {"train_loss": -43.032527923583984, "global_step": 309220, "epoch": 2555} {"train_loss": -44.08270263671875, "global_step": 309221, "epoch": 2555} {"train_loss": -42.009918212890625, "global_step": 309222, "epoch": 2555} {"train_loss": -42.50326919555664, "global_step": 309223, "epoch": 2555} {"train_loss": -43.49577331542969, "global_step": 309224, "epoch": 2555} {"train_loss": -42.7303581237793, "global_step": 309225, "epoch": 2555} {"train_loss": -43.12885665893555, "global_step": 309226, "epoch": 2555} {"train_loss": -42.922767639160156, "global_step": 309227, "epoch": 2555} {"train_loss": -43.30674362182617, "global_step": 309228, "epoch": 2555} {"train_loss": -42.51762008666992, "global_step": 309229, "epoch": 2555} {"train_loss": -43.23745346069336, "global_step": 309230, "epoch": 2555} {"train_loss": -43.71071243286133, "global_step": 309231, "epoch": 2555} {"train_loss": -43.26358413696289, "global_step": 309232, "epoch": 2555} {"train_loss": -42.989681243896484, "global_step": 309233, "epoch": 2555} {"train_loss": -43.05076217651367, "global_step": 309234, "epoch": 2555} {"train_loss": -42.86231231689453, "global_step": 309235, "epoch": 2555} {"train_loss": -42.456756591796875, "global_step": 309236, "epoch": 2555} {"train_loss": -43.65224838256836, "global_step": 309237, "epoch": 2555} {"train_loss": -43.689571380615234, "global_step": 309238, "epoch": 2555} {"train_loss": -43.28132247924805, "global_step": 309239, "epoch": 2555} {"train_loss": -44.12778854370117, "global_step": 309240, "epoch": 2555} {"train_loss": -43.45752716064453, "global_step": 309241, "epoch": 2555} {"train_loss": -43.23125076293945, "global_step": 309242, "epoch": 2555} {"train_loss": -43.910396575927734, "global_step": 309243, "epoch": 2555} {"train_loss": -43.55824661254883, "global_step": 309244, "epoch": 2555} {"train_loss": -43.79922103881836, "global_step": 309245, "epoch": 2555} {"train_loss": -43.40468978881836, "global_step": 309246, "epoch": 2555} {"train_loss": -44.07208251953125, "global_step": 309247, "epoch": 2555} {"train_loss": -43.271026611328125, "global_step": 309248, "epoch": 2555} {"train_loss": -43.94318389892578, "global_step": 309249, "epoch": 2555} {"train_loss": -43.182186126708984, "global_step": 309250, "epoch": 2555} {"train_loss": -43.57177734375, "global_step": 309251, "epoch": 2555} {"train_loss": -43.940223693847656, "global_step": 309252, "epoch": 2555} {"train_loss": -42.9943962097168, "global_step": 309253, "epoch": 2555} {"train_loss": -43.51677703857422, "global_step": 309254, "epoch": 2555} {"train_loss": -44.0902214050293, "global_step": 309255, "epoch": 2555} {"train_loss": -43.92112350463867, "global_step": 309256, "epoch": 2555} {"train_loss": -41.876277923583984, "global_step": 309257, "epoch": 2555} {"train_loss": -42.64508056640625, "global_step": 309258, "epoch": 2555} {"train_loss": -43.81483840942383, "global_step": 309259, "epoch": 2555} {"train_loss": -43.1356315612793, "global_step": 309260, "epoch": 2555} {"train_loss": -43.32599639892578, "global_step": 309261, "epoch": 2555} {"train_loss": -43.502681732177734, "global_step": 309262, "epoch": 2555} {"train_loss": -41.28737258911133, "global_step": 309263, "epoch": 2555} {"train_loss": -43.363494873046875, "global_step": 309264, "epoch": 2555} {"train_loss": -42.91123580932617, "global_step": 309265, "epoch": 2555} {"train_loss": -42.53579330444336, "global_step": 309266, "epoch": 2555} {"train_loss": -43.12440872192383, "global_step": 309267, "epoch": 2555} {"train_loss": -43.62935256958008, "global_step": 309268, "epoch": 2555} {"train_loss": -42.863006591796875, "global_step": 309269, "epoch": 2555} {"train_loss": -43.12630081176758, "global_step": 309270, "epoch": 2555} {"train_loss": -43.614112854003906, "global_step": 309271, "epoch": 2555} {"train_loss": -43.2674446105957, "global_step": 309272, "epoch": 2555} {"train_loss": -42.758419036865234, "global_step": 309273, "epoch": 2555} {"train_loss": -43.30517578125, "global_step": 309274, "epoch": 2555} {"train_loss": -42.77307217180236, "global_step": 309275, "epoch": 2555, "val_loss": 2684036.25} {"train_loss": -43.0984001159668, "global_step": 309276, "epoch": 2556} {"train_loss": -43.403846740722656, "global_step": 309277, "epoch": 2556} {"train_loss": -42.66364288330078, "global_step": 309278, "epoch": 2556} {"train_loss": -42.96027755737305, "global_step": 309279, "epoch": 2556} {"train_loss": -43.65166091918945, "global_step": 309280, "epoch": 2556} {"train_loss": -42.89440155029297, "global_step": 309281, "epoch": 2556} {"train_loss": -42.64142608642578, "global_step": 309282, "epoch": 2556} {"train_loss": -41.377376556396484, "global_step": 309283, "epoch": 2556} {"train_loss": -42.67029571533203, "global_step": 309284, "epoch": 2556} {"train_loss": -43.841949462890625, "global_step": 309285, "epoch": 2556} {"train_loss": -42.388160705566406, "global_step": 309286, "epoch": 2556} {"train_loss": -42.399818420410156, "global_step": 309287, "epoch": 2556} {"train_loss": -42.712467193603516, "global_step": 309288, "epoch": 2556} {"train_loss": -42.4461784362793, "global_step": 309289, "epoch": 2556} {"train_loss": -41.128719329833984, "global_step": 309290, "epoch": 2556} {"train_loss": -42.38783264160156, "global_step": 309291, "epoch": 2556} {"train_loss": -42.776641845703125, "global_step": 309292, "epoch": 2556} {"train_loss": -43.725196838378906, "global_step": 309293, "epoch": 2556} {"train_loss": -43.49448776245117, "global_step": 309294, "epoch": 2556} {"train_loss": -43.13695526123047, "global_step": 309295, "epoch": 2556} {"train_loss": -42.464515686035156, "global_step": 309296, "epoch": 2556} {"train_loss": -42.919700622558594, "global_step": 309297, "epoch": 2556} {"train_loss": -43.7336311340332, "global_step": 309298, "epoch": 2556} {"train_loss": -43.355899810791016, "global_step": 309299, "epoch": 2556} {"train_loss": -43.95386505126953, "global_step": 309300, "epoch": 2556} {"train_loss": -44.03705596923828, "global_step": 309301, "epoch": 2556} {"train_loss": -43.632911682128906, "global_step": 309302, "epoch": 2556} {"train_loss": -42.69614791870117, "global_step": 309303, "epoch": 2556} {"train_loss": -43.82493591308594, "global_step": 309304, "epoch": 2556} {"train_loss": -44.09666061401367, "global_step": 309305, "epoch": 2556} {"train_loss": -43.56424331665039, "global_step": 309306, "epoch": 2556} {"train_loss": -43.9718132019043, "global_step": 309307, "epoch": 2556} {"train_loss": -43.60107421875, "global_step": 309308, "epoch": 2556} {"train_loss": -43.63111877441406, "global_step": 309309, "epoch": 2556} {"train_loss": -43.85173416137695, "global_step": 309310, "epoch": 2556} {"train_loss": -43.299415588378906, "global_step": 309311, "epoch": 2556} {"train_loss": -43.694759368896484, "global_step": 309312, "epoch": 2556} {"train_loss": -42.7282600402832, "global_step": 309313, "epoch": 2556} {"train_loss": -43.56355667114258, "global_step": 309314, "epoch": 2556} {"train_loss": -44.094905853271484, "global_step": 309315, "epoch": 2556} {"train_loss": -42.57082748413086, "global_step": 309316, "epoch": 2556} {"train_loss": -44.187713623046875, "global_step": 309317, "epoch": 2556} {"train_loss": -43.71799850463867, "global_step": 309318, "epoch": 2556} {"train_loss": -43.35727310180664, "global_step": 309319, "epoch": 2556} {"train_loss": -43.759979248046875, "global_step": 309320, "epoch": 2556} {"train_loss": -43.9282112121582, "global_step": 309321, "epoch": 2556} {"train_loss": -43.38388442993164, "global_step": 309322, "epoch": 2556} {"train_loss": -43.53913116455078, "global_step": 309323, "epoch": 2556} {"train_loss": -42.39198684692383, "global_step": 309324, "epoch": 2556} {"train_loss": -42.65747833251953, "global_step": 309325, "epoch": 2556} {"train_loss": -43.1451301574707, "global_step": 309326, "epoch": 2556} {"train_loss": -42.75188064575195, "global_step": 309327, "epoch": 2556} {"train_loss": -43.75436019897461, "global_step": 309328, "epoch": 2556} {"train_loss": -42.282772064208984, "global_step": 309329, "epoch": 2556} {"train_loss": -43.6916618347168, "global_step": 309330, "epoch": 2556} {"train_loss": -42.05864334106445, "global_step": 309331, "epoch": 2556} {"train_loss": -41.376991271972656, "global_step": 309332, "epoch": 2556} {"train_loss": -43.41948699951172, "global_step": 309333, "epoch": 2556} {"train_loss": -42.35757827758789, "global_step": 309334, "epoch": 2556} {"train_loss": -41.44423294067383, "global_step": 309335, "epoch": 2556} {"train_loss": -43.46223449707031, "global_step": 309336, "epoch": 2556} {"train_loss": -42.67306137084961, "global_step": 309337, "epoch": 2556} {"train_loss": -42.73430252075195, "global_step": 309338, "epoch": 2556} {"train_loss": -43.27128219604492, "global_step": 309339, "epoch": 2556} {"train_loss": -43.34242630004883, "global_step": 309340, "epoch": 2556} {"train_loss": -41.78102493286133, "global_step": 309341, "epoch": 2556} {"train_loss": -38.31602096557617, "global_step": 309342, "epoch": 2556} {"train_loss": -41.445064544677734, "global_step": 309343, "epoch": 2556} {"train_loss": -43.50284957885742, "global_step": 309344, "epoch": 2556} {"train_loss": -39.8510627746582, "global_step": 309345, "epoch": 2556} {"train_loss": -39.41447448730469, "global_step": 309346, "epoch": 2556} {"train_loss": -40.9825553894043, "global_step": 309347, "epoch": 2556} {"train_loss": -44.029598236083984, "global_step": 309348, "epoch": 2556} {"train_loss": -42.36701965332031, "global_step": 309349, "epoch": 2556} {"train_loss": -41.4296760559082, "global_step": 309350, "epoch": 2556} {"train_loss": -42.594669342041016, "global_step": 309351, "epoch": 2556} {"train_loss": -42.761322021484375, "global_step": 309352, "epoch": 2556} {"train_loss": -42.775184631347656, "global_step": 309353, "epoch": 2556} {"train_loss": -42.07627487182617, "global_step": 309354, "epoch": 2556} {"train_loss": -42.96137237548828, "global_step": 309355, "epoch": 2556} {"train_loss": -43.362648010253906, "global_step": 309356, "epoch": 2556} {"train_loss": -43.13032150268555, "global_step": 309357, "epoch": 2556} {"train_loss": -43.4041633605957, "global_step": 309358, "epoch": 2556} {"train_loss": -43.630645751953125, "global_step": 309359, "epoch": 2556} {"train_loss": -42.73305130004883, "global_step": 309360, "epoch": 2556} {"train_loss": -43.3005485534668, "global_step": 309361, "epoch": 2556} {"train_loss": -41.91726303100586, "global_step": 309362, "epoch": 2556} {"train_loss": -43.2025146484375, "global_step": 309363, "epoch": 2556} {"train_loss": -43.33858108520508, "global_step": 309364, "epoch": 2556} {"train_loss": -43.21432113647461, "global_step": 309365, "epoch": 2556} {"train_loss": -42.968414306640625, "global_step": 309366, "epoch": 2556} {"train_loss": -42.79581832885742, "global_step": 309367, "epoch": 2556} {"train_loss": -43.11671829223633, "global_step": 309368, "epoch": 2556} {"train_loss": -43.061614990234375, "global_step": 309369, "epoch": 2556} {"train_loss": -43.1972770690918, "global_step": 309370, "epoch": 2556} {"train_loss": -43.20841598510742, "global_step": 309371, "epoch": 2556} {"train_loss": -43.8204345703125, "global_step": 309372, "epoch": 2556} {"train_loss": -43.6496696472168, "global_step": 309373, "epoch": 2556} {"train_loss": -43.780921936035156, "global_step": 309374, "epoch": 2556} {"train_loss": -43.9102668762207, "global_step": 309375, "epoch": 2556} {"train_loss": -44.30227279663086, "global_step": 309376, "epoch": 2556} {"train_loss": -44.16655349731445, "global_step": 309377, "epoch": 2556} {"train_loss": -43.805355072021484, "global_step": 309378, "epoch": 2556} {"train_loss": -43.09699249267578, "global_step": 309379, "epoch": 2556} {"train_loss": -43.70896530151367, "global_step": 309380, "epoch": 2556} {"train_loss": -44.05560302734375, "global_step": 309381, "epoch": 2556} {"train_loss": -43.91303634643555, "global_step": 309382, "epoch": 2556} {"train_loss": -43.66743087768555, "global_step": 309383, "epoch": 2556} {"train_loss": -43.5595703125, "global_step": 309384, "epoch": 2556} {"train_loss": -43.74703598022461, "global_step": 309385, "epoch": 2556} {"train_loss": -43.648101806640625, "global_step": 309386, "epoch": 2556} {"train_loss": -44.3116569519043, "global_step": 309387, "epoch": 2556} {"train_loss": -44.25837707519531, "global_step": 309388, "epoch": 2556} {"train_loss": -43.84688949584961, "global_step": 309389, "epoch": 2556} {"train_loss": -43.830379486083984, "global_step": 309390, "epoch": 2556} {"train_loss": -44.2142448425293, "global_step": 309391, "epoch": 2556} {"train_loss": -44.02384567260742, "global_step": 309392, "epoch": 2556} {"train_loss": -43.80486297607422, "global_step": 309393, "epoch": 2556} {"train_loss": -44.40446090698242, "global_step": 309394, "epoch": 2556} {"train_loss": -43.995418548583984, "global_step": 309395, "epoch": 2556} {"train_loss": -43.103649959091314, "global_step": 309396, "epoch": 2556, "val_loss": 2689800.0} {"train_loss": -44.24076843261719, "global_step": 309397, "epoch": 2557} {"train_loss": -44.3724479675293, "global_step": 309398, "epoch": 2557} {"train_loss": -43.89814758300781, "global_step": 309399, "epoch": 2557} {"train_loss": -44.06159591674805, "global_step": 309400, "epoch": 2557} {"train_loss": -44.03054428100586, "global_step": 309401, "epoch": 2557} {"train_loss": -43.57863998413086, "global_step": 309402, "epoch": 2557} {"train_loss": -43.091251373291016, "global_step": 309403, "epoch": 2557} {"train_loss": -42.58905792236328, "global_step": 309404, "epoch": 2557} {"train_loss": -43.59244918823242, "global_step": 309405, "epoch": 2557} {"train_loss": -43.837642669677734, "global_step": 309406, "epoch": 2557} {"train_loss": -43.94430160522461, "global_step": 309407, "epoch": 2557} {"train_loss": -43.9676628112793, "global_step": 309408, "epoch": 2557} {"train_loss": -43.34365463256836, "global_step": 309409, "epoch": 2557} {"train_loss": -42.54220199584961, "global_step": 309410, "epoch": 2557} {"train_loss": -43.86293411254883, "global_step": 309411, "epoch": 2557} {"train_loss": -44.41195297241211, "global_step": 309412, "epoch": 2557} {"train_loss": -43.17864227294922, "global_step": 309413, "epoch": 2557} {"train_loss": -43.85750961303711, "global_step": 309414, "epoch": 2557} {"train_loss": -43.70417404174805, "global_step": 309415, "epoch": 2557} {"train_loss": -43.73553466796875, "global_step": 309416, "epoch": 2557} {"train_loss": -42.81623077392578, "global_step": 309417, "epoch": 2557} {"train_loss": -43.444149017333984, "global_step": 309418, "epoch": 2557} {"train_loss": -43.91040802001953, "global_step": 309419, "epoch": 2557} {"train_loss": -42.0146369934082, "global_step": 309420, "epoch": 2557} {"train_loss": -42.32289123535156, "global_step": 309421, "epoch": 2557} {"train_loss": -42.361751556396484, "global_step": 309422, "epoch": 2557} {"train_loss": -41.445335388183594, "global_step": 309423, "epoch": 2557} {"train_loss": -40.38677978515625, "global_step": 309424, "epoch": 2557} {"train_loss": -41.269378662109375, "global_step": 309425, "epoch": 2557} {"train_loss": -40.633174896240234, "global_step": 309426, "epoch": 2557} {"train_loss": -40.90340805053711, "global_step": 309427, "epoch": 2557} {"train_loss": -40.309059143066406, "global_step": 309428, "epoch": 2557} {"train_loss": -38.88920211791992, "global_step": 309429, "epoch": 2557} {"train_loss": -38.33784103393555, "global_step": 309430, "epoch": 2557} {"train_loss": -38.207942962646484, "global_step": 309431, "epoch": 2557} {"train_loss": -41.07169723510742, "global_step": 309432, "epoch": 2557} {"train_loss": -40.08211898803711, "global_step": 309433, "epoch": 2557} {"train_loss": -40.54865646362305, "global_step": 309434, "epoch": 2557} {"train_loss": -41.28529739379883, "global_step": 309435, "epoch": 2557} {"train_loss": -40.67058181762695, "global_step": 309436, "epoch": 2557} {"train_loss": -41.36823272705078, "global_step": 309437, "epoch": 2557} {"train_loss": -42.19773483276367, "global_step": 309438, "epoch": 2557} {"train_loss": -41.911163330078125, "global_step": 309439, "epoch": 2557} {"train_loss": -41.67832565307617, "global_step": 309440, "epoch": 2557} {"train_loss": -42.511199951171875, "global_step": 309441, "epoch": 2557} {"train_loss": -42.242530822753906, "global_step": 309442, "epoch": 2557} {"train_loss": -42.37050247192383, "global_step": 309443, "epoch": 2557} {"train_loss": -42.32013702392578, "global_step": 309444, "epoch": 2557} {"train_loss": -41.722530364990234, "global_step": 309445, "epoch": 2557} {"train_loss": -43.378753662109375, "global_step": 309446, "epoch": 2557} {"train_loss": -42.617855072021484, "global_step": 309447, "epoch": 2557} {"train_loss": -42.79881286621094, "global_step": 309448, "epoch": 2557} {"train_loss": -42.904239654541016, "global_step": 309449, "epoch": 2557} {"train_loss": -42.09688949584961, "global_step": 309450, "epoch": 2557} {"train_loss": -43.31494903564453, "global_step": 309451, "epoch": 2557} {"train_loss": -42.875850677490234, "global_step": 309452, "epoch": 2557} {"train_loss": -42.48994064331055, "global_step": 309453, "epoch": 2557} {"train_loss": -42.50748062133789, "global_step": 309454, "epoch": 2557} {"train_loss": -42.33256149291992, "global_step": 309455, "epoch": 2557} {"train_loss": -43.09307098388672, "global_step": 309456, "epoch": 2557} {"train_loss": -41.907806396484375, "global_step": 309457, "epoch": 2557} {"train_loss": -42.99312973022461, "global_step": 309458, "epoch": 2557} {"train_loss": -42.123016357421875, "global_step": 309459, "epoch": 2557} {"train_loss": -42.91804885864258, "global_step": 309460, "epoch": 2557} {"train_loss": -42.293006896972656, "global_step": 309461, "epoch": 2557} {"train_loss": -43.66825485229492, "global_step": 309462, "epoch": 2557} {"train_loss": -42.74312210083008, "global_step": 309463, "epoch": 2557} {"train_loss": -43.87235641479492, "global_step": 309464, "epoch": 2557} {"train_loss": -43.41299057006836, "global_step": 309465, "epoch": 2557} {"train_loss": -43.949275970458984, "global_step": 309466, "epoch": 2557} {"train_loss": -43.6120491027832, "global_step": 309467, "epoch": 2557} {"train_loss": -43.796775817871094, "global_step": 309468, "epoch": 2557} {"train_loss": -43.441349029541016, "global_step": 309469, "epoch": 2557} {"train_loss": -43.688175201416016, "global_step": 309470, "epoch": 2557} {"train_loss": -43.58252716064453, "global_step": 309471, "epoch": 2557} {"train_loss": -44.061279296875, "global_step": 309472, "epoch": 2557} {"train_loss": -43.95618438720703, "global_step": 309473, "epoch": 2557} {"train_loss": -43.650142669677734, "global_step": 309474, "epoch": 2557} {"train_loss": -44.128173828125, "global_step": 309475, "epoch": 2557} {"train_loss": -43.85957717895508, "global_step": 309476, "epoch": 2557} {"train_loss": -43.73896789550781, "global_step": 309477, "epoch": 2557} {"train_loss": -43.930355072021484, "global_step": 309478, "epoch": 2557} {"train_loss": -44.32754898071289, "global_step": 309479, "epoch": 2557} {"train_loss": -44.34957504272461, "global_step": 309480, "epoch": 2557} {"train_loss": -44.100746154785156, "global_step": 309481, "epoch": 2557} {"train_loss": -44.268463134765625, "global_step": 309482, "epoch": 2557} {"train_loss": -44.45029830932617, "global_step": 309483, "epoch": 2557} {"train_loss": -44.33437728881836, "global_step": 309484, "epoch": 2557} {"train_loss": -44.615814208984375, "global_step": 309485, "epoch": 2557} {"train_loss": -43.78609848022461, "global_step": 309486, "epoch": 2557} {"train_loss": -44.3883171081543, "global_step": 309487, "epoch": 2557} {"train_loss": -44.04673767089844, "global_step": 309488, "epoch": 2557} {"train_loss": -44.449562072753906, "global_step": 309489, "epoch": 2557} {"train_loss": -44.20531463623047, "global_step": 309490, "epoch": 2557} {"train_loss": -44.147308349609375, "global_step": 309491, "epoch": 2557} {"train_loss": -44.56648635864258, "global_step": 309492, "epoch": 2557} {"train_loss": -44.84831237792969, "global_step": 309493, "epoch": 2557} {"train_loss": -44.631649017333984, "global_step": 309494, "epoch": 2557} {"train_loss": -44.65764236450195, "global_step": 309495, "epoch": 2557} {"train_loss": -44.68123245239258, "global_step": 309496, "epoch": 2557} {"train_loss": -44.31185531616211, "global_step": 309497, "epoch": 2557} {"train_loss": -44.70009994506836, "global_step": 309498, "epoch": 2557} {"train_loss": -44.9442024230957, "global_step": 309499, "epoch": 2557} {"train_loss": -44.13453674316406, "global_step": 309500, "epoch": 2557} {"train_loss": -44.78190994262695, "global_step": 309501, "epoch": 2557} {"train_loss": -44.710960388183594, "global_step": 309502, "epoch": 2557} {"train_loss": -44.9039192199707, "global_step": 309503, "epoch": 2557} {"train_loss": -44.712257385253906, "global_step": 309504, "epoch": 2557} {"train_loss": -44.08694076538086, "global_step": 309505, "epoch": 2557} {"train_loss": -45.14105224609375, "global_step": 309506, "epoch": 2557} {"train_loss": -44.55891418457031, "global_step": 309507, "epoch": 2557} {"train_loss": -44.57209396362305, "global_step": 309508, "epoch": 2557} {"train_loss": -44.927459716796875, "global_step": 309509, "epoch": 2557} {"train_loss": -44.28811264038086, "global_step": 309510, "epoch": 2557} {"train_loss": -44.09894561767578, "global_step": 309511, "epoch": 2557} {"train_loss": -44.46668243408203, "global_step": 309512, "epoch": 2557} {"train_loss": -44.437042236328125, "global_step": 309513, "epoch": 2557} {"train_loss": -43.43174362182617, "global_step": 309514, "epoch": 2557} {"train_loss": -43.366390228271484, "global_step": 309515, "epoch": 2557} {"train_loss": -42.72740936279297, "global_step": 309516, "epoch": 2557} {"train_loss": -43.20882346413352, "global_step": 309517, "epoch": 2557, "val_loss": 2679566.75} {"train_loss": -42.87396240234375, "global_step": 309518, "epoch": 2558} {"train_loss": -41.56303024291992, "global_step": 309519, "epoch": 2558} {"train_loss": -41.94437789916992, "global_step": 309520, "epoch": 2558} {"train_loss": -42.26054000854492, "global_step": 309521, "epoch": 2558} {"train_loss": -41.727752685546875, "global_step": 309522, "epoch": 2558} {"train_loss": -42.14487075805664, "global_step": 309523, "epoch": 2558} {"train_loss": -42.612762451171875, "global_step": 309524, "epoch": 2558} {"train_loss": -43.6098747253418, "global_step": 309525, "epoch": 2558} {"train_loss": -42.708160400390625, "global_step": 309526, "epoch": 2558} {"train_loss": -41.256378173828125, "global_step": 309527, "epoch": 2558} {"train_loss": -41.160125732421875, "global_step": 309528, "epoch": 2558} {"train_loss": -42.61651611328125, "global_step": 309529, "epoch": 2558} {"train_loss": -42.71208190917969, "global_step": 309530, "epoch": 2558} {"train_loss": -39.86328125, "global_step": 309531, "epoch": 2558} {"train_loss": -33.9128532409668, "global_step": 309532, "epoch": 2558} {"train_loss": -31.615400314331055, "global_step": 309533, "epoch": 2558} {"train_loss": -37.61385726928711, "global_step": 309534, "epoch": 2558} {"train_loss": -40.5544319152832, "global_step": 309535, "epoch": 2558} {"train_loss": -38.92963409423828, "global_step": 309536, "epoch": 2558} {"train_loss": -39.37702560424805, "global_step": 309537, "epoch": 2558} {"train_loss": -39.935001373291016, "global_step": 309538, "epoch": 2558} {"train_loss": -35.71298599243164, "global_step": 309539, "epoch": 2558} {"train_loss": -38.8217887878418, "global_step": 309540, "epoch": 2558} {"train_loss": -40.558441162109375, "global_step": 309541, "epoch": 2558} {"train_loss": -39.850852966308594, "global_step": 309542, "epoch": 2558} {"train_loss": -41.58010482788086, "global_step": 309543, "epoch": 2558} {"train_loss": -36.90644454956055, "global_step": 309544, "epoch": 2558} {"train_loss": -40.93498611450195, "global_step": 309545, "epoch": 2558} {"train_loss": -39.106300354003906, "global_step": 309546, "epoch": 2558} {"train_loss": -41.04994583129883, "global_step": 309547, "epoch": 2558} {"train_loss": -38.49496841430664, "global_step": 309548, "epoch": 2558} {"train_loss": -42.24489974975586, "global_step": 309549, "epoch": 2558} {"train_loss": -38.628936767578125, "global_step": 309550, "epoch": 2558} {"train_loss": -41.532676696777344, "global_step": 309551, "epoch": 2558} {"train_loss": -40.66850280761719, "global_step": 309552, "epoch": 2558} {"train_loss": -41.1693000793457, "global_step": 309553, "epoch": 2558} {"train_loss": -40.76180648803711, "global_step": 309554, "epoch": 2558} {"train_loss": -41.69118881225586, "global_step": 309555, "epoch": 2558} {"train_loss": -42.417362213134766, "global_step": 309556, "epoch": 2558} {"train_loss": -41.0384521484375, "global_step": 309557, "epoch": 2558} {"train_loss": -42.89268112182617, "global_step": 309558, "epoch": 2558} {"train_loss": -41.776161193847656, "global_step": 309559, "epoch": 2558} {"train_loss": -42.66962814331055, "global_step": 309560, "epoch": 2558} {"train_loss": -42.116390228271484, "global_step": 309561, "epoch": 2558} {"train_loss": -42.79806900024414, "global_step": 309562, "epoch": 2558} {"train_loss": -42.97175216674805, "global_step": 309563, "epoch": 2558} {"train_loss": -42.35993576049805, "global_step": 309564, "epoch": 2558} {"train_loss": -42.611690521240234, "global_step": 309565, "epoch": 2558} {"train_loss": -42.913063049316406, "global_step": 309566, "epoch": 2558} {"train_loss": -42.33954620361328, "global_step": 309567, "epoch": 2558} {"train_loss": -43.17678451538086, "global_step": 309568, "epoch": 2558} {"train_loss": -42.40503692626953, "global_step": 309569, "epoch": 2558} {"train_loss": -43.511505126953125, "global_step": 309570, "epoch": 2558} {"train_loss": -42.62393569946289, "global_step": 309571, "epoch": 2558} {"train_loss": -43.505489349365234, "global_step": 309572, "epoch": 2558} {"train_loss": -43.0923957824707, "global_step": 309573, "epoch": 2558} {"train_loss": -43.55501174926758, "global_step": 309574, "epoch": 2558} {"train_loss": -43.320892333984375, "global_step": 309575, "epoch": 2558} {"train_loss": -43.80323028564453, "global_step": 309576, "epoch": 2558} {"train_loss": -43.57296371459961, "global_step": 309577, "epoch": 2558} {"train_loss": -43.74789810180664, "global_step": 309578, "epoch": 2558} {"train_loss": -44.11677551269531, "global_step": 309579, "epoch": 2558} {"train_loss": -43.63417434692383, "global_step": 309580, "epoch": 2558} {"train_loss": -43.845333099365234, "global_step": 309581, "epoch": 2558} {"train_loss": -44.15418243408203, "global_step": 309582, "epoch": 2558} {"train_loss": -44.29705810546875, "global_step": 309583, "epoch": 2558} {"train_loss": -43.78562545776367, "global_step": 309584, "epoch": 2558} {"train_loss": -44.05074691772461, "global_step": 309585, "epoch": 2558} {"train_loss": -43.744850158691406, "global_step": 309586, "epoch": 2558} {"train_loss": -44.17192459106445, "global_step": 309587, "epoch": 2558} {"train_loss": -43.848419189453125, "global_step": 309588, "epoch": 2558} {"train_loss": -43.90468978881836, "global_step": 309589, "epoch": 2558} {"train_loss": -44.265926361083984, "global_step": 309590, "epoch": 2558} {"train_loss": -44.251522064208984, "global_step": 309591, "epoch": 2558} {"train_loss": -44.42898941040039, "global_step": 309592, "epoch": 2558} {"train_loss": -43.963382720947266, "global_step": 309593, "epoch": 2558} {"train_loss": -44.14872360229492, "global_step": 309594, "epoch": 2558} {"train_loss": -44.218833923339844, "global_step": 309595, "epoch": 2558} {"train_loss": -44.18702697753906, "global_step": 309596, "epoch": 2558} {"train_loss": -44.338958740234375, "global_step": 309597, "epoch": 2558} {"train_loss": -43.968666076660156, "global_step": 309598, "epoch": 2558} {"train_loss": -44.549625396728516, "global_step": 309599, "epoch": 2558} {"train_loss": -44.41427993774414, "global_step": 309600, "epoch": 2558} {"train_loss": -43.98797607421875, "global_step": 309601, "epoch": 2558} {"train_loss": -44.49283981323242, "global_step": 309602, "epoch": 2558} {"train_loss": -44.704444885253906, "global_step": 309603, "epoch": 2558} {"train_loss": -44.336307525634766, "global_step": 309604, "epoch": 2558} {"train_loss": -44.54024124145508, "global_step": 309605, "epoch": 2558} {"train_loss": -44.59891891479492, "global_step": 309606, "epoch": 2558} {"train_loss": -44.793949127197266, "global_step": 309607, "epoch": 2558} {"train_loss": -44.310638427734375, "global_step": 309608, "epoch": 2558} {"train_loss": -44.47017288208008, "global_step": 309609, "epoch": 2558} {"train_loss": -44.52900314331055, "global_step": 309610, "epoch": 2558} {"train_loss": -44.784820556640625, "global_step": 309611, "epoch": 2558} {"train_loss": -44.677276611328125, "global_step": 309612, "epoch": 2558} {"train_loss": -44.81960678100586, "global_step": 309613, "epoch": 2558} {"train_loss": -44.850521087646484, "global_step": 309614, "epoch": 2558} {"train_loss": -44.777339935302734, "global_step": 309615, "epoch": 2558} {"train_loss": -44.709346771240234, "global_step": 309616, "epoch": 2558} {"train_loss": -45.10118865966797, "global_step": 309617, "epoch": 2558} {"train_loss": -44.867347717285156, "global_step": 309618, "epoch": 2558} {"train_loss": -44.52342224121094, "global_step": 309619, "epoch": 2558} {"train_loss": -44.34913635253906, "global_step": 309620, "epoch": 2558} {"train_loss": -44.51711654663086, "global_step": 309621, "epoch": 2558} {"train_loss": -44.765785217285156, "global_step": 309622, "epoch": 2558} {"train_loss": -44.71073532104492, "global_step": 309623, "epoch": 2558} {"train_loss": -44.537513732910156, "global_step": 309624, "epoch": 2558} {"train_loss": -44.71270751953125, "global_step": 309625, "epoch": 2558} {"train_loss": -44.611183166503906, "global_step": 309626, "epoch": 2558} {"train_loss": -44.52447509765625, "global_step": 309627, "epoch": 2558} {"train_loss": -44.67379379272461, "global_step": 309628, "epoch": 2558} {"train_loss": -44.67002868652344, "global_step": 309629, "epoch": 2558} {"train_loss": -44.32112121582031, "global_step": 309630, "epoch": 2558} {"train_loss": -44.076961517333984, "global_step": 309631, "epoch": 2558} {"train_loss": -44.48394775390625, "global_step": 309632, "epoch": 2558} {"train_loss": -44.25571060180664, "global_step": 309633, "epoch": 2558} {"train_loss": -44.882293701171875, "global_step": 309634, "epoch": 2558} {"train_loss": -44.20429611206055, "global_step": 309635, "epoch": 2558} {"train_loss": -43.937129974365234, "global_step": 309636, "epoch": 2558} {"train_loss": -44.311065673828125, "global_step": 309637, "epoch": 2558} {"train_loss": -42.80081490445728, "global_step": 309638, "epoch": 2558, "val_loss": 2749871.0} {"train_loss": -42.90283966064453, "global_step": 309639, "epoch": 2559} {"train_loss": -41.73779296875, "global_step": 309640, "epoch": 2559} {"train_loss": -35.05501174926758, "global_step": 309641, "epoch": 2559} {"train_loss": -30.707172393798828, "global_step": 309642, "epoch": 2559} {"train_loss": -21.485580444335938, "global_step": 309643, "epoch": 2559} {"train_loss": -8.621837615966797, "global_step": 309644, "epoch": 2559} {"train_loss": -19.552915573120117, "global_step": 309645, "epoch": 2559} {"train_loss": -36.396400451660156, "global_step": 309646, "epoch": 2559} {"train_loss": -33.542327880859375, "global_step": 309647, "epoch": 2559} {"train_loss": -34.25996017456055, "global_step": 309648, "epoch": 2559} {"train_loss": -37.71887969970703, "global_step": 309649, "epoch": 2559} {"train_loss": -33.88957595825195, "global_step": 309650, "epoch": 2559} {"train_loss": -38.842498779296875, "global_step": 309651, "epoch": 2559} {"train_loss": -37.0810546875, "global_step": 309652, "epoch": 2559} {"train_loss": -38.4651985168457, "global_step": 309653, "epoch": 2559} {"train_loss": -37.671993255615234, "global_step": 309654, "epoch": 2559} {"train_loss": -37.475341796875, "global_step": 309655, "epoch": 2559} {"train_loss": -38.05377960205078, "global_step": 309656, "epoch": 2559} {"train_loss": -37.850704193115234, "global_step": 309657, "epoch": 2559} {"train_loss": -40.23381423950195, "global_step": 309658, "epoch": 2559} {"train_loss": -37.98628616333008, "global_step": 309659, "epoch": 2559} {"train_loss": -40.55619430541992, "global_step": 309660, "epoch": 2559} {"train_loss": -39.222835540771484, "global_step": 309661, "epoch": 2559} {"train_loss": -40.63764190673828, "global_step": 309662, "epoch": 2559} {"train_loss": -40.85951232910156, "global_step": 309663, "epoch": 2559} {"train_loss": -40.775672912597656, "global_step": 309664, "epoch": 2559} {"train_loss": -41.1441535949707, "global_step": 309665, "epoch": 2559} {"train_loss": -40.25189208984375, "global_step": 309666, "epoch": 2559} {"train_loss": -41.355018615722656, "global_step": 309667, "epoch": 2559} {"train_loss": -41.15711975097656, "global_step": 309668, "epoch": 2559} {"train_loss": -41.42424392700195, "global_step": 309669, "epoch": 2559} {"train_loss": -40.98321533203125, "global_step": 309670, "epoch": 2559} {"train_loss": -42.036964416503906, "global_step": 309671, "epoch": 2559} {"train_loss": -41.68697738647461, "global_step": 309672, "epoch": 2559} {"train_loss": -42.04566192626953, "global_step": 309673, "epoch": 2559} {"train_loss": -42.14716720581055, "global_step": 309674, "epoch": 2559} {"train_loss": -41.694576263427734, "global_step": 309675, "epoch": 2559} {"train_loss": -42.66679763793945, "global_step": 309676, "epoch": 2559} {"train_loss": -41.07666015625, "global_step": 309677, "epoch": 2559} {"train_loss": -42.31089401245117, "global_step": 309678, "epoch": 2559} {"train_loss": -41.65269088745117, "global_step": 309679, "epoch": 2559} {"train_loss": -42.487213134765625, "global_step": 309680, "epoch": 2559} {"train_loss": -42.74201202392578, "global_step": 309681, "epoch": 2559} {"train_loss": -42.814334869384766, "global_step": 309682, "epoch": 2559} {"train_loss": -42.94099044799805, "global_step": 309683, "epoch": 2559} {"train_loss": -42.710296630859375, "global_step": 309684, "epoch": 2559} {"train_loss": -42.72011947631836, "global_step": 309685, "epoch": 2559} {"train_loss": -42.850830078125, "global_step": 309686, "epoch": 2559} {"train_loss": -42.833316802978516, "global_step": 309687, "epoch": 2559} {"train_loss": -42.988975524902344, "global_step": 309688, "epoch": 2559} {"train_loss": -43.106300354003906, "global_step": 309689, "epoch": 2559} {"train_loss": -43.05644607543945, "global_step": 309690, "epoch": 2559} {"train_loss": -43.307594299316406, "global_step": 309691, "epoch": 2559} {"train_loss": -43.50162887573242, "global_step": 309692, "epoch": 2559} {"train_loss": -43.18046188354492, "global_step": 309693, "epoch": 2559} {"train_loss": -43.2061653137207, "global_step": 309694, "epoch": 2559} {"train_loss": -43.52602005004883, "global_step": 309695, "epoch": 2559} {"train_loss": -43.6087760925293, "global_step": 309696, "epoch": 2559} {"train_loss": -43.742679595947266, "global_step": 309697, "epoch": 2559} {"train_loss": -43.12575912475586, "global_step": 309698, "epoch": 2559} {"train_loss": -43.90095138549805, "global_step": 309699, "epoch": 2559} {"train_loss": -43.539764404296875, "global_step": 309700, "epoch": 2559} {"train_loss": -43.36809158325195, "global_step": 309701, "epoch": 2559} {"train_loss": -43.59279251098633, "global_step": 309702, "epoch": 2559} {"train_loss": -43.624122619628906, "global_step": 309703, "epoch": 2559} {"train_loss": -43.790740966796875, "global_step": 309704, "epoch": 2559} {"train_loss": -43.620849609375, "global_step": 309705, "epoch": 2559} {"train_loss": -43.82994079589844, "global_step": 309706, "epoch": 2559} {"train_loss": -42.728370666503906, "global_step": 309707, "epoch": 2559} {"train_loss": -42.62910842895508, "global_step": 309708, "epoch": 2559} {"train_loss": -42.74385452270508, "global_step": 309709, "epoch": 2559} {"train_loss": -43.8400764465332, "global_step": 309710, "epoch": 2559} {"train_loss": -44.0610466003418, "global_step": 309711, "epoch": 2559} {"train_loss": -44.169307708740234, "global_step": 309712, "epoch": 2559} {"train_loss": -44.21825408935547, "global_step": 309713, "epoch": 2559} {"train_loss": -44.22675704956055, "global_step": 309714, "epoch": 2559} {"train_loss": -43.87363815307617, "global_step": 309715, "epoch": 2559} {"train_loss": -43.74074172973633, "global_step": 309716, "epoch": 2559} {"train_loss": -43.97978591918945, "global_step": 309717, "epoch": 2559} {"train_loss": -44.20906448364258, "global_step": 309718, "epoch": 2559} {"train_loss": -43.83766555786133, "global_step": 309719, "epoch": 2559} {"train_loss": -44.07295227050781, "global_step": 309720, "epoch": 2559} {"train_loss": -44.072845458984375, "global_step": 309721, "epoch": 2559} {"train_loss": -44.262542724609375, "global_step": 309722, "epoch": 2559} {"train_loss": -44.07194900512695, "global_step": 309723, "epoch": 2559} {"train_loss": -43.85017395019531, "global_step": 309724, "epoch": 2559} {"train_loss": -44.348236083984375, "global_step": 309725, "epoch": 2559} {"train_loss": -44.38580322265625, "global_step": 309726, "epoch": 2559} {"train_loss": -44.467124938964844, "global_step": 309727, "epoch": 2559} {"train_loss": -44.467063903808594, "global_step": 309728, "epoch": 2559} {"train_loss": -44.530303955078125, "global_step": 309729, "epoch": 2559} {"train_loss": -44.525543212890625, "global_step": 309730, "epoch": 2559} {"train_loss": -44.251014709472656, "global_step": 309731, "epoch": 2559} {"train_loss": -44.37626266479492, "global_step": 309732, "epoch": 2559} {"train_loss": -44.80463790893555, "global_step": 309733, "epoch": 2559} {"train_loss": -44.55317306518555, "global_step": 309734, "epoch": 2559} {"train_loss": -44.425445556640625, "global_step": 309735, "epoch": 2559} {"train_loss": -44.62007141113281, "global_step": 309736, "epoch": 2559} {"train_loss": -44.46466827392578, "global_step": 309737, "epoch": 2559} {"train_loss": -44.70851135253906, "global_step": 309738, "epoch": 2559} {"train_loss": -44.59666061401367, "global_step": 309739, "epoch": 2559} {"train_loss": -44.7158088684082, "global_step": 309740, "epoch": 2559} {"train_loss": -44.69953536987305, "global_step": 309741, "epoch": 2559} {"train_loss": -44.75985336303711, "global_step": 309742, "epoch": 2559} {"train_loss": -44.59402084350586, "global_step": 309743, "epoch": 2559} {"train_loss": -44.723384857177734, "global_step": 309744, "epoch": 2559} {"train_loss": -44.692832946777344, "global_step": 309745, "epoch": 2559} {"train_loss": -45.022987365722656, "global_step": 309746, "epoch": 2559} {"train_loss": -44.97774887084961, "global_step": 309747, "epoch": 2559} {"train_loss": -45.18325424194336, "global_step": 309748, "epoch": 2559} {"train_loss": -45.127017974853516, "global_step": 309749, "epoch": 2559} {"train_loss": -44.92426681518555, "global_step": 309750, "epoch": 2559} {"train_loss": -44.863487243652344, "global_step": 309751, "epoch": 2559} {"train_loss": -45.10740280151367, "global_step": 309752, "epoch": 2559} {"train_loss": -44.7955207824707, "global_step": 309753, "epoch": 2559} {"train_loss": -44.80490493774414, "global_step": 309754, "epoch": 2559} {"train_loss": -44.788692474365234, "global_step": 309755, "epoch": 2559} {"train_loss": -44.62974548339844, "global_step": 309756, "epoch": 2559} {"train_loss": -44.70766830444336, "global_step": 309757, "epoch": 2559} {"train_loss": -44.84598922729492, "global_step": 309758, "epoch": 2559} {"train_loss": -41.85368014564199, "global_step": 309759, "epoch": 2559, "val_loss": 2828973.75} {"train_loss": -44.549583435058594, "global_step": 309760, "epoch": 2560} {"train_loss": -44.34077072143555, "global_step": 309761, "epoch": 2560} {"train_loss": -44.905189514160156, "global_step": 309762, "epoch": 2560} {"train_loss": -44.4775390625, "global_step": 309763, "epoch": 2560} {"train_loss": -44.87062454223633, "global_step": 309764, "epoch": 2560} {"train_loss": -44.95125198364258, "global_step": 309765, "epoch": 2560} {"train_loss": -44.684879302978516, "global_step": 309766, "epoch": 2560} {"train_loss": -44.764793395996094, "global_step": 309767, "epoch": 2560} {"train_loss": -45.147029876708984, "global_step": 309768, "epoch": 2560} {"train_loss": -45.20491409301758, "global_step": 309769, "epoch": 2560} {"train_loss": -44.3704719543457, "global_step": 309770, "epoch": 2560} {"train_loss": -44.856285095214844, "global_step": 309771, "epoch": 2560} {"train_loss": -45.07084655761719, "global_step": 309772, "epoch": 2560} {"train_loss": -45.21479034423828, "global_step": 309773, "epoch": 2560} {"train_loss": -44.73942565917969, "global_step": 309774, "epoch": 2560} {"train_loss": -44.90114212036133, "global_step": 309775, "epoch": 2560} {"train_loss": -44.7691650390625, "global_step": 309776, "epoch": 2560} {"train_loss": -39.01382064819336, "global_step": 309777, "epoch": 2560} {"train_loss": -44.81170654296875, "global_step": 309778, "epoch": 2560} {"train_loss": -44.28689193725586, "global_step": 309779, "epoch": 2560} {"train_loss": -44.972164154052734, "global_step": 309780, "epoch": 2560} {"train_loss": -44.97050094604492, "global_step": 309781, "epoch": 2560} {"train_loss": -44.41697311401367, "global_step": 309782, "epoch": 2560} {"train_loss": -44.926231384277344, "global_step": 309783, "epoch": 2560} {"train_loss": -44.74505615234375, "global_step": 309784, "epoch": 2560} {"train_loss": -44.19222640991211, "global_step": 309785, "epoch": 2560} {"train_loss": -42.581878662109375, "global_step": 309786, "epoch": 2560} {"train_loss": -37.19600296020508, "global_step": 309787, "epoch": 2560} {"train_loss": -44.869972229003906, "global_step": 309788, "epoch": 2560} {"train_loss": -43.55438995361328, "global_step": 309789, "epoch": 2560} {"train_loss": -42.628639221191406, "global_step": 309790, "epoch": 2560} {"train_loss": -41.37467575073242, "global_step": 309791, "epoch": 2560} {"train_loss": -30.564252853393555, "global_step": 309792, "epoch": 2560} {"train_loss": -31.158010482788086, "global_step": 309793, "epoch": 2560} {"train_loss": -38.52677536010742, "global_step": 309794, "epoch": 2560} {"train_loss": -36.90952682495117, "global_step": 309795, "epoch": 2560} {"train_loss": -41.92555618286133, "global_step": 309796, "epoch": 2560} {"train_loss": -39.27803421020508, "global_step": 309797, "epoch": 2560} {"train_loss": -32.920013427734375, "global_step": 309798, "epoch": 2560} {"train_loss": -36.44157791137695, "global_step": 309799, "epoch": 2560} {"train_loss": -32.2734489440918, "global_step": 309800, "epoch": 2560} {"train_loss": -36.66741943359375, "global_step": 309801, "epoch": 2560} {"train_loss": -39.0672492980957, "global_step": 309802, "epoch": 2560} {"train_loss": -21.04314613342285, "global_step": 309803, "epoch": 2560} {"train_loss": -40.44157409667969, "global_step": 309804, "epoch": 2560} {"train_loss": -33.118648529052734, "global_step": 309805, "epoch": 2560} {"train_loss": -17.968244552612305, "global_step": 309806, "epoch": 2560} {"train_loss": -38.017059326171875, "global_step": 309807, "epoch": 2560} {"train_loss": -37.501773834228516, "global_step": 309808, "epoch": 2560} {"train_loss": -18.590810775756836, "global_step": 309809, "epoch": 2560} {"train_loss": -28.286306381225586, "global_step": 309810, "epoch": 2560} {"train_loss": -38.481868743896484, "global_step": 309811, "epoch": 2560} {"train_loss": -35.05289840698242, "global_step": 309812, "epoch": 2560} {"train_loss": -39.46090316772461, "global_step": 309813, "epoch": 2560} {"train_loss": -31.29249382019043, "global_step": 309814, "epoch": 2560} {"train_loss": -29.8720703125, "global_step": 309815, "epoch": 2560} {"train_loss": -38.01015090942383, "global_step": 309816, "epoch": 2560} {"train_loss": -37.24235534667969, "global_step": 309817, "epoch": 2560} {"train_loss": -35.14994812011719, "global_step": 309818, "epoch": 2560} {"train_loss": -34.842369079589844, "global_step": 309819, "epoch": 2560} {"train_loss": -38.03131866455078, "global_step": 309820, "epoch": 2560} {"train_loss": -35.5373420715332, "global_step": 309821, "epoch": 2560} {"train_loss": -25.03451919555664, "global_step": 309822, "epoch": 2560} {"train_loss": -39.51375961303711, "global_step": 309823, "epoch": 2560} {"train_loss": -39.68769454956055, "global_step": 309824, "epoch": 2560} {"train_loss": -39.90148162841797, "global_step": 309825, "epoch": 2560} {"train_loss": -37.87858581542969, "global_step": 309826, "epoch": 2560} {"train_loss": -39.162837982177734, "global_step": 309827, "epoch": 2560} {"train_loss": -37.198577880859375, "global_step": 309828, "epoch": 2560} {"train_loss": -36.56210708618164, "global_step": 309829, "epoch": 2560} {"train_loss": -38.53079605102539, "global_step": 309830, "epoch": 2560} {"train_loss": -36.8802375793457, "global_step": 309831, "epoch": 2560} {"train_loss": -39.952884674072266, "global_step": 309832, "epoch": 2560} {"train_loss": -39.357017517089844, "global_step": 309833, "epoch": 2560} {"train_loss": -39.006099700927734, "global_step": 309834, "epoch": 2560} {"train_loss": -39.06074905395508, "global_step": 309835, "epoch": 2560} {"train_loss": -38.90165328979492, "global_step": 309836, "epoch": 2560} {"train_loss": -40.251625061035156, "global_step": 309837, "epoch": 2560} {"train_loss": -41.08970260620117, "global_step": 309838, "epoch": 2560} {"train_loss": -27.457258224487305, "global_step": 309839, "epoch": 2560} {"train_loss": -40.01052474975586, "global_step": 309840, "epoch": 2560} {"train_loss": -40.281410217285156, "global_step": 309841, "epoch": 2560} {"train_loss": -41.10113525390625, "global_step": 309842, "epoch": 2560} {"train_loss": -39.631065368652344, "global_step": 309843, "epoch": 2560} {"train_loss": -39.41938400268555, "global_step": 309844, "epoch": 2560} {"train_loss": -40.12289047241211, "global_step": 309845, "epoch": 2560} {"train_loss": -40.96920394897461, "global_step": 309846, "epoch": 2560} {"train_loss": -40.405181884765625, "global_step": 309847, "epoch": 2560} {"train_loss": -40.51478576660156, "global_step": 309848, "epoch": 2560} {"train_loss": -40.608985900878906, "global_step": 309849, "epoch": 2560} {"train_loss": -40.22938919067383, "global_step": 309850, "epoch": 2560} {"train_loss": -39.69867706298828, "global_step": 309851, "epoch": 2560} {"train_loss": -38.22425079345703, "global_step": 309852, "epoch": 2560} {"train_loss": -39.84634017944336, "global_step": 309853, "epoch": 2560} {"train_loss": -41.1336784362793, "global_step": 309854, "epoch": 2560} {"train_loss": -39.967506408691406, "global_step": 309855, "epoch": 2560} {"train_loss": -40.465450286865234, "global_step": 309856, "epoch": 2560} {"train_loss": -41.14008712768555, "global_step": 309857, "epoch": 2560} {"train_loss": -40.30474090576172, "global_step": 309858, "epoch": 2560} {"train_loss": -41.568023681640625, "global_step": 309859, "epoch": 2560} {"train_loss": -40.8798942565918, "global_step": 309860, "epoch": 2560} {"train_loss": -41.302120208740234, "global_step": 309861, "epoch": 2560} {"train_loss": -41.20138168334961, "global_step": 309862, "epoch": 2560} {"train_loss": -41.31589889526367, "global_step": 309863, "epoch": 2560} {"train_loss": -41.22378158569336, "global_step": 309864, "epoch": 2560} {"train_loss": -41.70437240600586, "global_step": 309865, "epoch": 2560} {"train_loss": -41.328067779541016, "global_step": 309866, "epoch": 2560} {"train_loss": -41.27124786376953, "global_step": 309867, "epoch": 2560} {"train_loss": -41.22620391845703, "global_step": 309868, "epoch": 2560} {"train_loss": -41.5704231262207, "global_step": 309869, "epoch": 2560} {"train_loss": -41.03904724121094, "global_step": 309870, "epoch": 2560} {"train_loss": -40.802791595458984, "global_step": 309871, "epoch": 2560} {"train_loss": -40.6242561340332, "global_step": 309872, "epoch": 2560} {"train_loss": -41.745521545410156, "global_step": 309873, "epoch": 2560} {"train_loss": -41.3221435546875, "global_step": 309874, "epoch": 2560} {"train_loss": -41.72028732299805, "global_step": 309875, "epoch": 2560} {"train_loss": -41.2655143737793, "global_step": 309876, "epoch": 2560} {"train_loss": -40.84706115722656, "global_step": 309877, "epoch": 2560} {"train_loss": -41.042362213134766, "global_step": 309878, "epoch": 2560} {"train_loss": -41.285926818847656, "global_step": 309879, "epoch": 2560} {"train_loss": -39.51409473892086, "global_step": 309880, "epoch": 2560, "val_loss": 2671576.5} {"train_loss": -41.37297439575195, "global_step": 309881, "epoch": 2561} {"train_loss": -41.774391174316406, "global_step": 309882, "epoch": 2561} {"train_loss": -42.47096252441406, "global_step": 309883, "epoch": 2561} {"train_loss": -42.14207458496094, "global_step": 309884, "epoch": 2561} {"train_loss": -42.19343566894531, "global_step": 309885, "epoch": 2561} {"train_loss": -39.12704086303711, "global_step": 309886, "epoch": 2561} {"train_loss": -42.232337951660156, "global_step": 309887, "epoch": 2561} {"train_loss": -41.77752685546875, "global_step": 309888, "epoch": 2561} {"train_loss": -41.72164535522461, "global_step": 309889, "epoch": 2561} {"train_loss": -42.504241943359375, "global_step": 309890, "epoch": 2561} {"train_loss": -41.26054000854492, "global_step": 309891, "epoch": 2561} {"train_loss": -42.45270919799805, "global_step": 309892, "epoch": 2561} {"train_loss": -42.074127197265625, "global_step": 309893, "epoch": 2561} {"train_loss": -41.958553314208984, "global_step": 309894, "epoch": 2561} {"train_loss": -41.9669189453125, "global_step": 309895, "epoch": 2561} {"train_loss": -42.72721481323242, "global_step": 309896, "epoch": 2561} {"train_loss": -42.32770919799805, "global_step": 309897, "epoch": 2561} {"train_loss": -42.759212493896484, "global_step": 309898, "epoch": 2561} {"train_loss": -42.402462005615234, "global_step": 309899, "epoch": 2561} {"train_loss": -43.13631057739258, "global_step": 309900, "epoch": 2561} {"train_loss": -43.02700424194336, "global_step": 309901, "epoch": 2561} {"train_loss": -40.907161712646484, "global_step": 309902, "epoch": 2561} {"train_loss": -43.635467529296875, "global_step": 309903, "epoch": 2561} {"train_loss": -40.95954513549805, "global_step": 309904, "epoch": 2561} {"train_loss": -42.351097106933594, "global_step": 309905, "epoch": 2561} {"train_loss": -43.19134521484375, "global_step": 309906, "epoch": 2561} {"train_loss": -42.76852035522461, "global_step": 309907, "epoch": 2561} {"train_loss": -42.69721984863281, "global_step": 309908, "epoch": 2561} {"train_loss": -42.00431442260742, "global_step": 309909, "epoch": 2561} {"train_loss": -42.267242431640625, "global_step": 309910, "epoch": 2561} {"train_loss": -42.555171966552734, "global_step": 309911, "epoch": 2561} {"train_loss": -43.07991027832031, "global_step": 309912, "epoch": 2561} {"train_loss": -43.20198440551758, "global_step": 309913, "epoch": 2561} {"train_loss": -41.94120788574219, "global_step": 309914, "epoch": 2561} {"train_loss": -42.144874572753906, "global_step": 309915, "epoch": 2561} {"train_loss": -42.97275161743164, "global_step": 309916, "epoch": 2561} {"train_loss": -41.9715461730957, "global_step": 309917, "epoch": 2561} {"train_loss": -42.89181137084961, "global_step": 309918, "epoch": 2561} {"train_loss": -42.91645812988281, "global_step": 309919, "epoch": 2561} {"train_loss": -42.89271926879883, "global_step": 309920, "epoch": 2561} {"train_loss": -43.100677490234375, "global_step": 309921, "epoch": 2561} {"train_loss": -42.479286193847656, "global_step": 309922, "epoch": 2561} {"train_loss": -41.94646453857422, "global_step": 309923, "epoch": 2561} {"train_loss": -42.5760612487793, "global_step": 309924, "epoch": 2561} {"train_loss": -43.1446647644043, "global_step": 309925, "epoch": 2561} {"train_loss": -42.98231887817383, "global_step": 309926, "epoch": 2561} {"train_loss": -42.40488815307617, "global_step": 309927, "epoch": 2561} {"train_loss": -43.12496566772461, "global_step": 309928, "epoch": 2561} {"train_loss": -42.38349533081055, "global_step": 309929, "epoch": 2561} {"train_loss": -42.95901870727539, "global_step": 309930, "epoch": 2561} {"train_loss": -42.81526565551758, "global_step": 309931, "epoch": 2561} {"train_loss": -43.502479553222656, "global_step": 309932, "epoch": 2561} {"train_loss": -42.42033004760742, "global_step": 309933, "epoch": 2561} {"train_loss": -43.6511344909668, "global_step": 309934, "epoch": 2561} {"train_loss": -42.69633102416992, "global_step": 309935, "epoch": 2561} {"train_loss": -42.17671585083008, "global_step": 309936, "epoch": 2561} {"train_loss": -43.64275360107422, "global_step": 309937, "epoch": 2561} {"train_loss": -42.56299591064453, "global_step": 309938, "epoch": 2561} {"train_loss": -43.9424934387207, "global_step": 309939, "epoch": 2561} {"train_loss": -43.64944076538086, "global_step": 309940, "epoch": 2561} {"train_loss": -42.377052307128906, "global_step": 309941, "epoch": 2561} {"train_loss": -42.86219787597656, "global_step": 309942, "epoch": 2561} {"train_loss": -43.0516471862793, "global_step": 309943, "epoch": 2561} {"train_loss": -43.46686935424805, "global_step": 309944, "epoch": 2561} {"train_loss": -43.688079833984375, "global_step": 309945, "epoch": 2561} {"train_loss": -43.480655670166016, "global_step": 309946, "epoch": 2561} {"train_loss": -42.56113052368164, "global_step": 309947, "epoch": 2561} {"train_loss": -43.37852096557617, "global_step": 309948, "epoch": 2561} {"train_loss": -43.6331787109375, "global_step": 309949, "epoch": 2561} {"train_loss": -42.853736877441406, "global_step": 309950, "epoch": 2561} {"train_loss": -43.93021774291992, "global_step": 309951, "epoch": 2561} {"train_loss": -43.073272705078125, "global_step": 309952, "epoch": 2561} {"train_loss": -43.61640548706055, "global_step": 309953, "epoch": 2561} {"train_loss": -43.700443267822266, "global_step": 309954, "epoch": 2561} {"train_loss": -43.52799606323242, "global_step": 309955, "epoch": 2561} {"train_loss": -43.439239501953125, "global_step": 309956, "epoch": 2561} {"train_loss": -42.24180221557617, "global_step": 309957, "epoch": 2561} {"train_loss": -43.81699752807617, "global_step": 309958, "epoch": 2561} {"train_loss": -43.53356170654297, "global_step": 309959, "epoch": 2561} {"train_loss": -43.48612594604492, "global_step": 309960, "epoch": 2561} {"train_loss": -43.409034729003906, "global_step": 309961, "epoch": 2561} {"train_loss": -43.4010124206543, "global_step": 309962, "epoch": 2561} {"train_loss": -43.790924072265625, "global_step": 309963, "epoch": 2561} {"train_loss": -43.47642135620117, "global_step": 309964, "epoch": 2561} {"train_loss": -44.15273666381836, "global_step": 309965, "epoch": 2561} {"train_loss": -43.17384338378906, "global_step": 309966, "epoch": 2561} {"train_loss": -43.335018157958984, "global_step": 309967, "epoch": 2561} {"train_loss": -43.21333694458008, "global_step": 309968, "epoch": 2561} {"train_loss": -43.40621566772461, "global_step": 309969, "epoch": 2561} {"train_loss": -41.604759216308594, "global_step": 309970, "epoch": 2561} {"train_loss": -43.5544548034668, "global_step": 309971, "epoch": 2561} {"train_loss": -44.3137321472168, "global_step": 309972, "epoch": 2561} {"train_loss": -44.166542053222656, "global_step": 309973, "epoch": 2561} {"train_loss": -43.246883392333984, "global_step": 309974, "epoch": 2561} {"train_loss": -43.20016098022461, "global_step": 309975, "epoch": 2561} {"train_loss": -43.50521469116211, "global_step": 309976, "epoch": 2561} {"train_loss": -43.7396125793457, "global_step": 309977, "epoch": 2561} {"train_loss": -44.39616775512695, "global_step": 309978, "epoch": 2561} {"train_loss": -43.18734359741211, "global_step": 309979, "epoch": 2561} {"train_loss": -43.904502868652344, "global_step": 309980, "epoch": 2561} {"train_loss": -43.2486572265625, "global_step": 309981, "epoch": 2561} {"train_loss": -43.52470016479492, "global_step": 309982, "epoch": 2561} {"train_loss": -44.11589431762695, "global_step": 309983, "epoch": 2561} {"train_loss": -43.6832160949707, "global_step": 309984, "epoch": 2561} {"train_loss": -43.989376068115234, "global_step": 309985, "epoch": 2561} {"train_loss": -43.146175384521484, "global_step": 309986, "epoch": 2561} {"train_loss": -43.664005279541016, "global_step": 309987, "epoch": 2561} {"train_loss": -42.45534896850586, "global_step": 309988, "epoch": 2561} {"train_loss": -42.58175277709961, "global_step": 309989, "epoch": 2561} {"train_loss": -43.74790573120117, "global_step": 309990, "epoch": 2561} {"train_loss": -43.86555099487305, "global_step": 309991, "epoch": 2561} {"train_loss": -43.22758865356445, "global_step": 309992, "epoch": 2561} {"train_loss": -42.432159423828125, "global_step": 309993, "epoch": 2561} {"train_loss": -43.251075744628906, "global_step": 309994, "epoch": 2561} {"train_loss": -42.52242660522461, "global_step": 309995, "epoch": 2561} {"train_loss": -42.31716537475586, "global_step": 309996, "epoch": 2561} {"train_loss": -43.19657897949219, "global_step": 309997, "epoch": 2561} {"train_loss": -42.004085540771484, "global_step": 309998, "epoch": 2561} {"train_loss": -41.10480499267578, "global_step": 309999, "epoch": 2561} {"train_loss": -41.13605880737305, "global_step": 310000, "epoch": 2561} {"train_loss": -42.84590249810337, "global_step": 310001, "epoch": 2561, "val_loss": 2822719.0} {"train_loss": -41.15898513793945, "global_step": 310002, "epoch": 2562} {"train_loss": -41.495994567871094, "global_step": 310003, "epoch": 2562} {"train_loss": -41.51057434082031, "global_step": 310004, "epoch": 2562} {"train_loss": -42.122798919677734, "global_step": 310005, "epoch": 2562} {"train_loss": -41.30899429321289, "global_step": 310006, "epoch": 2562} {"train_loss": -41.934967041015625, "global_step": 310007, "epoch": 2562} {"train_loss": -42.020294189453125, "global_step": 310008, "epoch": 2562} {"train_loss": -41.988243103027344, "global_step": 310009, "epoch": 2562} {"train_loss": -42.6529655456543, "global_step": 310010, "epoch": 2562} {"train_loss": -40.82802963256836, "global_step": 310011, "epoch": 2562} {"train_loss": -41.86701202392578, "global_step": 310012, "epoch": 2562} {"train_loss": -42.131805419921875, "global_step": 310013, "epoch": 2562} {"train_loss": -42.93464660644531, "global_step": 310014, "epoch": 2562} {"train_loss": -41.7824821472168, "global_step": 310015, "epoch": 2562} {"train_loss": -42.580135345458984, "global_step": 310016, "epoch": 2562} {"train_loss": -41.815673828125, "global_step": 310017, "epoch": 2562} {"train_loss": -41.264583587646484, "global_step": 310018, "epoch": 2562} {"train_loss": -42.82712936401367, "global_step": 310019, "epoch": 2562} {"train_loss": -42.170284271240234, "global_step": 310020, "epoch": 2562} {"train_loss": -42.53662872314453, "global_step": 310021, "epoch": 2562} {"train_loss": -43.173316955566406, "global_step": 310022, "epoch": 2562} {"train_loss": -41.73770523071289, "global_step": 310023, "epoch": 2562} {"train_loss": -41.39559555053711, "global_step": 310024, "epoch": 2562} {"train_loss": -42.86932373046875, "global_step": 310025, "epoch": 2562} {"train_loss": -42.00637435913086, "global_step": 310026, "epoch": 2562} {"train_loss": -41.64374923706055, "global_step": 310027, "epoch": 2562} {"train_loss": -41.42890548706055, "global_step": 310028, "epoch": 2562} {"train_loss": -42.08514404296875, "global_step": 310029, "epoch": 2562} {"train_loss": -42.26959991455078, "global_step": 310030, "epoch": 2562} {"train_loss": -42.87281036376953, "global_step": 310031, "epoch": 2562} {"train_loss": -43.154541015625, "global_step": 310032, "epoch": 2562} {"train_loss": -42.650856018066406, "global_step": 310033, "epoch": 2562} {"train_loss": -42.95664596557617, "global_step": 310034, "epoch": 2562} {"train_loss": -42.1248779296875, "global_step": 310035, "epoch": 2562} {"train_loss": -42.6831169128418, "global_step": 310036, "epoch": 2562} {"train_loss": -43.2475471496582, "global_step": 310037, "epoch": 2562} {"train_loss": -42.7269172668457, "global_step": 310038, "epoch": 2562} {"train_loss": -43.071998596191406, "global_step": 310039, "epoch": 2562} {"train_loss": -42.69350051879883, "global_step": 310040, "epoch": 2562} {"train_loss": -43.23933792114258, "global_step": 310041, "epoch": 2562} {"train_loss": -42.32870101928711, "global_step": 310042, "epoch": 2562} {"train_loss": -42.33987808227539, "global_step": 310043, "epoch": 2562} {"train_loss": -42.86124801635742, "global_step": 310044, "epoch": 2562} {"train_loss": -42.31148910522461, "global_step": 310045, "epoch": 2562} {"train_loss": -42.598934173583984, "global_step": 310046, "epoch": 2562} {"train_loss": -42.8193359375, "global_step": 310047, "epoch": 2562} {"train_loss": -42.27239990234375, "global_step": 310048, "epoch": 2562} {"train_loss": -42.787479400634766, "global_step": 310049, "epoch": 2562} {"train_loss": -41.05875778198242, "global_step": 310050, "epoch": 2562} {"train_loss": -42.571041107177734, "global_step": 310051, "epoch": 2562} {"train_loss": -42.91394805908203, "global_step": 310052, "epoch": 2562} {"train_loss": -42.490901947021484, "global_step": 310053, "epoch": 2562} {"train_loss": -40.836002349853516, "global_step": 310054, "epoch": 2562} {"train_loss": -42.16571807861328, "global_step": 310055, "epoch": 2562} {"train_loss": -41.20339584350586, "global_step": 310056, "epoch": 2562} {"train_loss": -42.776119232177734, "global_step": 310057, "epoch": 2562} {"train_loss": -41.36360549926758, "global_step": 310058, "epoch": 2562} {"train_loss": -43.11251449584961, "global_step": 310059, "epoch": 2562} {"train_loss": -39.75764083862305, "global_step": 310060, "epoch": 2562} {"train_loss": -42.28171920776367, "global_step": 310061, "epoch": 2562} {"train_loss": -42.44083786010742, "global_step": 310062, "epoch": 2562} {"train_loss": -42.0443000793457, "global_step": 310063, "epoch": 2562} {"train_loss": -42.7218132019043, "global_step": 310064, "epoch": 2562} {"train_loss": -43.048439025878906, "global_step": 310065, "epoch": 2562} {"train_loss": -42.65694808959961, "global_step": 310066, "epoch": 2562} {"train_loss": -43.346920013427734, "global_step": 310067, "epoch": 2562} {"train_loss": -43.133697509765625, "global_step": 310068, "epoch": 2562} {"train_loss": -42.625221252441406, "global_step": 310069, "epoch": 2562} {"train_loss": -42.60752487182617, "global_step": 310070, "epoch": 2562} {"train_loss": -43.5628776550293, "global_step": 310071, "epoch": 2562} {"train_loss": -43.11758041381836, "global_step": 310072, "epoch": 2562} {"train_loss": -43.371978759765625, "global_step": 310073, "epoch": 2562} {"train_loss": -43.06728744506836, "global_step": 310074, "epoch": 2562} {"train_loss": -43.356285095214844, "global_step": 310075, "epoch": 2562} {"train_loss": -43.0155143737793, "global_step": 310076, "epoch": 2562} {"train_loss": -43.20402145385742, "global_step": 310077, "epoch": 2562} {"train_loss": -43.44518280029297, "global_step": 310078, "epoch": 2562} {"train_loss": -43.836299896240234, "global_step": 310079, "epoch": 2562} {"train_loss": -43.38558578491211, "global_step": 310080, "epoch": 2562} {"train_loss": -43.308441162109375, "global_step": 310081, "epoch": 2562} {"train_loss": -44.080745697021484, "global_step": 310082, "epoch": 2562} {"train_loss": -43.0826530456543, "global_step": 310083, "epoch": 2562} {"train_loss": -43.57809066772461, "global_step": 310084, "epoch": 2562} {"train_loss": -43.94847869873047, "global_step": 310085, "epoch": 2562} {"train_loss": -44.019954681396484, "global_step": 310086, "epoch": 2562} {"train_loss": -44.110504150390625, "global_step": 310087, "epoch": 2562} {"train_loss": -43.77958297729492, "global_step": 310088, "epoch": 2562} {"train_loss": -44.04806900024414, "global_step": 310089, "epoch": 2562} {"train_loss": -43.968544006347656, "global_step": 310090, "epoch": 2562} {"train_loss": -43.82582473754883, "global_step": 310091, "epoch": 2562} {"train_loss": -43.874629974365234, "global_step": 310092, "epoch": 2562} {"train_loss": -43.297969818115234, "global_step": 310093, "epoch": 2562} {"train_loss": -44.59596633911133, "global_step": 310094, "epoch": 2562} {"train_loss": -44.4047966003418, "global_step": 310095, "epoch": 2562} {"train_loss": -44.836727142333984, "global_step": 310096, "epoch": 2562} {"train_loss": -43.98545455932617, "global_step": 310097, "epoch": 2562} {"train_loss": -43.69186782836914, "global_step": 310098, "epoch": 2562} {"train_loss": -43.486549377441406, "global_step": 310099, "epoch": 2562} {"train_loss": -43.06134796142578, "global_step": 310100, "epoch": 2562} {"train_loss": -43.430145263671875, "global_step": 310101, "epoch": 2562} {"train_loss": -43.1765251159668, "global_step": 310102, "epoch": 2562} {"train_loss": -44.394195556640625, "global_step": 310103, "epoch": 2562} {"train_loss": -43.52128601074219, "global_step": 310104, "epoch": 2562} {"train_loss": -43.02032470703125, "global_step": 310105, "epoch": 2562} {"train_loss": -42.34743118286133, "global_step": 310106, "epoch": 2562} {"train_loss": -41.99231719970703, "global_step": 310107, "epoch": 2562} {"train_loss": -43.260066986083984, "global_step": 310108, "epoch": 2562} {"train_loss": -43.62907409667969, "global_step": 310109, "epoch": 2562} {"train_loss": -42.718414306640625, "global_step": 310110, "epoch": 2562} {"train_loss": -43.34560775756836, "global_step": 310111, "epoch": 2562} {"train_loss": -43.478271484375, "global_step": 310112, "epoch": 2562} {"train_loss": -42.9423942565918, "global_step": 310113, "epoch": 2562} {"train_loss": -42.22428512573242, "global_step": 310114, "epoch": 2562} {"train_loss": -42.12416458129883, "global_step": 310115, "epoch": 2562} {"train_loss": -43.153018951416016, "global_step": 310116, "epoch": 2562} {"train_loss": -44.2186279296875, "global_step": 310117, "epoch": 2562} {"train_loss": -43.4368782043457, "global_step": 310118, "epoch": 2562} {"train_loss": -42.972808837890625, "global_step": 310119, "epoch": 2562} {"train_loss": -42.1454963684082, "global_step": 310120, "epoch": 2562} {"train_loss": -41.12995529174805, "global_step": 310121, "epoch": 2562} {"train_loss": -42.74027015749088, "global_step": 310122, "epoch": 2562, "val_loss": 2663495.25} {"train_loss": -42.815826416015625, "global_step": 310123, "epoch": 2563} {"train_loss": -41.822078704833984, "global_step": 310124, "epoch": 2563} {"train_loss": -40.66852951049805, "global_step": 310125, "epoch": 2563} {"train_loss": -42.7498893737793, "global_step": 310126, "epoch": 2563} {"train_loss": -43.044803619384766, "global_step": 310127, "epoch": 2563} {"train_loss": -41.83774948120117, "global_step": 310128, "epoch": 2563} {"train_loss": -28.82148551940918, "global_step": 310129, "epoch": 2563} {"train_loss": -42.70573425292969, "global_step": 310130, "epoch": 2563} {"train_loss": -38.375946044921875, "global_step": 310131, "epoch": 2563} {"train_loss": -42.872554779052734, "global_step": 310132, "epoch": 2563} {"train_loss": -42.965511322021484, "global_step": 310133, "epoch": 2563} {"train_loss": -42.64545822143555, "global_step": 310134, "epoch": 2563} {"train_loss": -41.04471206665039, "global_step": 310135, "epoch": 2563} {"train_loss": -33.33351516723633, "global_step": 310136, "epoch": 2563} {"train_loss": -42.273658752441406, "global_step": 310137, "epoch": 2563} {"train_loss": -42.83658218383789, "global_step": 310138, "epoch": 2563} {"train_loss": -37.26538848876953, "global_step": 310139, "epoch": 2563} {"train_loss": -42.22566604614258, "global_step": 310140, "epoch": 2563} {"train_loss": -39.160823822021484, "global_step": 310141, "epoch": 2563} {"train_loss": -42.720550537109375, "global_step": 310142, "epoch": 2563} {"train_loss": -42.758182525634766, "global_step": 310143, "epoch": 2563} {"train_loss": -42.23269271850586, "global_step": 310144, "epoch": 2563} {"train_loss": -41.849098205566406, "global_step": 310145, "epoch": 2563} {"train_loss": -43.2536735534668, "global_step": 310146, "epoch": 2563} {"train_loss": -42.49018096923828, "global_step": 310147, "epoch": 2563} {"train_loss": -42.21977615356445, "global_step": 310148, "epoch": 2563} {"train_loss": -42.23235321044922, "global_step": 310149, "epoch": 2563} {"train_loss": -41.11343002319336, "global_step": 310150, "epoch": 2563} {"train_loss": -41.19923782348633, "global_step": 310151, "epoch": 2563} {"train_loss": -39.29437255859375, "global_step": 310152, "epoch": 2563} {"train_loss": -38.92776107788086, "global_step": 310153, "epoch": 2563} {"train_loss": -42.63132858276367, "global_step": 310154, "epoch": 2563} {"train_loss": -40.61354446411133, "global_step": 310155, "epoch": 2563} {"train_loss": -39.5345458984375, "global_step": 310156, "epoch": 2563} {"train_loss": -41.84130859375, "global_step": 310157, "epoch": 2563} {"train_loss": -41.2779655456543, "global_step": 310158, "epoch": 2563} {"train_loss": -41.59003829956055, "global_step": 310159, "epoch": 2563} {"train_loss": -41.6545524597168, "global_step": 310160, "epoch": 2563} {"train_loss": -40.728755950927734, "global_step": 310161, "epoch": 2563} {"train_loss": -40.14169692993164, "global_step": 310162, "epoch": 2563} {"train_loss": -41.63450241088867, "global_step": 310163, "epoch": 2563} {"train_loss": -41.750274658203125, "global_step": 310164, "epoch": 2563} {"train_loss": -38.40906524658203, "global_step": 310165, "epoch": 2563} {"train_loss": -41.76079559326172, "global_step": 310166, "epoch": 2563} {"train_loss": -42.053199768066406, "global_step": 310167, "epoch": 2563} {"train_loss": -42.0806770324707, "global_step": 310168, "epoch": 2563} {"train_loss": -41.89649200439453, "global_step": 310169, "epoch": 2563} {"train_loss": -40.81593704223633, "global_step": 310170, "epoch": 2563} {"train_loss": -41.58417510986328, "global_step": 310171, "epoch": 2563} {"train_loss": -40.18254089355469, "global_step": 310172, "epoch": 2563} {"train_loss": -40.903072357177734, "global_step": 310173, "epoch": 2563} {"train_loss": -41.90272903442383, "global_step": 310174, "epoch": 2563} {"train_loss": -36.713783264160156, "global_step": 310175, "epoch": 2563} {"train_loss": -40.15681838989258, "global_step": 310176, "epoch": 2563} {"train_loss": -39.30257797241211, "global_step": 310177, "epoch": 2563} {"train_loss": -42.32262420654297, "global_step": 310178, "epoch": 2563} {"train_loss": -41.45992660522461, "global_step": 310179, "epoch": 2563} {"train_loss": -41.81622314453125, "global_step": 310180, "epoch": 2563} {"train_loss": -41.74970626831055, "global_step": 310181, "epoch": 2563} {"train_loss": -42.82445526123047, "global_step": 310182, "epoch": 2563} {"train_loss": -41.64033889770508, "global_step": 310183, "epoch": 2563} {"train_loss": -38.45621871948242, "global_step": 310184, "epoch": 2563} {"train_loss": -40.67927169799805, "global_step": 310185, "epoch": 2563} {"train_loss": -42.400814056396484, "global_step": 310186, "epoch": 2563} {"train_loss": -41.28325271606445, "global_step": 310187, "epoch": 2563} {"train_loss": -41.146358489990234, "global_step": 310188, "epoch": 2563} {"train_loss": -40.79450988769531, "global_step": 310189, "epoch": 2563} {"train_loss": -40.916534423828125, "global_step": 310190, "epoch": 2563} {"train_loss": -38.948585510253906, "global_step": 310191, "epoch": 2563} {"train_loss": -37.1113395690918, "global_step": 310192, "epoch": 2563} {"train_loss": -42.03829574584961, "global_step": 310193, "epoch": 2563} {"train_loss": -40.85185623168945, "global_step": 310194, "epoch": 2563} {"train_loss": -40.241268157958984, "global_step": 310195, "epoch": 2563} {"train_loss": -41.81759262084961, "global_step": 310196, "epoch": 2563} {"train_loss": -42.30951690673828, "global_step": 310197, "epoch": 2563} {"train_loss": -40.918006896972656, "global_step": 310198, "epoch": 2563} {"train_loss": -39.296077728271484, "global_step": 310199, "epoch": 2563} {"train_loss": -41.5373420715332, "global_step": 310200, "epoch": 2563} {"train_loss": -38.618770599365234, "global_step": 310201, "epoch": 2563} {"train_loss": -40.0133171081543, "global_step": 310202, "epoch": 2563} {"train_loss": -39.350379943847656, "global_step": 310203, "epoch": 2563} {"train_loss": -42.0526123046875, "global_step": 310204, "epoch": 2563} {"train_loss": -41.56808090209961, "global_step": 310205, "epoch": 2563} {"train_loss": -37.964698791503906, "global_step": 310206, "epoch": 2563} {"train_loss": -41.500465393066406, "global_step": 310207, "epoch": 2563} {"train_loss": -40.55946731567383, "global_step": 310208, "epoch": 2563} {"train_loss": -41.83158493041992, "global_step": 310209, "epoch": 2563} {"train_loss": -40.717262268066406, "global_step": 310210, "epoch": 2563} {"train_loss": -41.613616943359375, "global_step": 310211, "epoch": 2563} {"train_loss": -40.883399963378906, "global_step": 310212, "epoch": 2563} {"train_loss": -41.42830276489258, "global_step": 310213, "epoch": 2563} {"train_loss": -41.796241760253906, "global_step": 310214, "epoch": 2563} {"train_loss": -41.13981628417969, "global_step": 310215, "epoch": 2563} {"train_loss": -39.17511749267578, "global_step": 310216, "epoch": 2563} {"train_loss": -42.10988998413086, "global_step": 310217, "epoch": 2563} {"train_loss": -40.10398483276367, "global_step": 310218, "epoch": 2563} {"train_loss": -40.124671936035156, "global_step": 310219, "epoch": 2563} {"train_loss": -40.465023040771484, "global_step": 310220, "epoch": 2563} {"train_loss": -39.956111907958984, "global_step": 310221, "epoch": 2563} {"train_loss": -41.48086166381836, "global_step": 310222, "epoch": 2563} {"train_loss": -41.420013427734375, "global_step": 310223, "epoch": 2563} {"train_loss": -42.4187126159668, "global_step": 310224, "epoch": 2563} {"train_loss": -38.28349685668945, "global_step": 310225, "epoch": 2563} {"train_loss": -37.28460693359375, "global_step": 310226, "epoch": 2563} {"train_loss": -40.52058029174805, "global_step": 310227, "epoch": 2563} {"train_loss": -40.990806579589844, "global_step": 310228, "epoch": 2563} {"train_loss": -39.29634475708008, "global_step": 310229, "epoch": 2563} {"train_loss": -37.43281173706055, "global_step": 310230, "epoch": 2563} {"train_loss": -40.78446578979492, "global_step": 310231, "epoch": 2563} {"train_loss": -35.36670684814453, "global_step": 310232, "epoch": 2563} {"train_loss": -39.95614242553711, "global_step": 310233, "epoch": 2563} {"train_loss": -40.2655029296875, "global_step": 310234, "epoch": 2563} {"train_loss": -41.24744415283203, "global_step": 310235, "epoch": 2563} {"train_loss": -40.25823974609375, "global_step": 310236, "epoch": 2563} {"train_loss": -40.1348876953125, "global_step": 310237, "epoch": 2563} {"train_loss": -40.24347686767578, "global_step": 310238, "epoch": 2563} {"train_loss": -40.47758102416992, "global_step": 310239, "epoch": 2563} {"train_loss": -41.79757308959961, "global_step": 310240, "epoch": 2563} {"train_loss": -39.72755813598633, "global_step": 310241, "epoch": 2563} {"train_loss": -39.38017654418945, "global_step": 310242, "epoch": 2563} {"train_loss": -40.712630106397896, "global_step": 310243, "epoch": 2563, "val_loss": 2840388.0} {"train_loss": -39.21843338012695, "global_step": 310244, "epoch": 2564} {"train_loss": -39.38209533691406, "global_step": 310245, "epoch": 2564} {"train_loss": -41.321144104003906, "global_step": 310246, "epoch": 2564} {"train_loss": -42.01165771484375, "global_step": 310247, "epoch": 2564} {"train_loss": -42.128963470458984, "global_step": 310248, "epoch": 2564} {"train_loss": -41.800960540771484, "global_step": 310249, "epoch": 2564} {"train_loss": -42.37464904785156, "global_step": 310250, "epoch": 2564} {"train_loss": -39.34905242919922, "global_step": 310251, "epoch": 2564} {"train_loss": -40.77997970581055, "global_step": 310252, "epoch": 2564} {"train_loss": -40.84741973876953, "global_step": 310253, "epoch": 2564} {"train_loss": -40.36861801147461, "global_step": 310254, "epoch": 2564} {"train_loss": -40.93605041503906, "global_step": 310255, "epoch": 2564} {"train_loss": -42.47178268432617, "global_step": 310256, "epoch": 2564} {"train_loss": -41.886573791503906, "global_step": 310257, "epoch": 2564} {"train_loss": -40.308135986328125, "global_step": 310258, "epoch": 2564} {"train_loss": -41.24793243408203, "global_step": 310259, "epoch": 2564} {"train_loss": -39.43574142456055, "global_step": 310260, "epoch": 2564} {"train_loss": -41.082557678222656, "global_step": 310261, "epoch": 2564} {"train_loss": -42.00324249267578, "global_step": 310262, "epoch": 2564} {"train_loss": -42.074607849121094, "global_step": 310263, "epoch": 2564} {"train_loss": -40.087215423583984, "global_step": 310264, "epoch": 2564} {"train_loss": -40.21242904663086, "global_step": 310265, "epoch": 2564} {"train_loss": -41.68857955932617, "global_step": 310266, "epoch": 2564} {"train_loss": -41.86005783081055, "global_step": 310267, "epoch": 2564} {"train_loss": -42.686058044433594, "global_step": 310268, "epoch": 2564} {"train_loss": -41.7438850402832, "global_step": 310269, "epoch": 2564} {"train_loss": -41.07968521118164, "global_step": 310270, "epoch": 2564} {"train_loss": -41.860836029052734, "global_step": 310271, "epoch": 2564} {"train_loss": -41.96577072143555, "global_step": 310272, "epoch": 2564} {"train_loss": -41.92221450805664, "global_step": 310273, "epoch": 2564} {"train_loss": -41.59051513671875, "global_step": 310274, "epoch": 2564} {"train_loss": -42.27024459838867, "global_step": 310275, "epoch": 2564} {"train_loss": -40.69942092895508, "global_step": 310276, "epoch": 2564} {"train_loss": -41.184200286865234, "global_step": 310277, "epoch": 2564} {"train_loss": -41.048980712890625, "global_step": 310278, "epoch": 2564} {"train_loss": -40.280208587646484, "global_step": 310279, "epoch": 2564} {"train_loss": -40.012489318847656, "global_step": 310280, "epoch": 2564} {"train_loss": -42.51972198486328, "global_step": 310281, "epoch": 2564} {"train_loss": -41.54246139526367, "global_step": 310282, "epoch": 2564} {"train_loss": -41.805355072021484, "global_step": 310283, "epoch": 2564} {"train_loss": -40.3863410949707, "global_step": 310284, "epoch": 2564} {"train_loss": -41.35005569458008, "global_step": 310285, "epoch": 2564} {"train_loss": -41.70954895019531, "global_step": 310286, "epoch": 2564} {"train_loss": -39.786521911621094, "global_step": 310287, "epoch": 2564} {"train_loss": -40.83985900878906, "global_step": 310288, "epoch": 2564} {"train_loss": -41.32080841064453, "global_step": 310289, "epoch": 2564} {"train_loss": -42.2134895324707, "global_step": 310290, "epoch": 2564} {"train_loss": -41.88164520263672, "global_step": 310291, "epoch": 2564} {"train_loss": -41.88559341430664, "global_step": 310292, "epoch": 2564} {"train_loss": -38.647865295410156, "global_step": 310293, "epoch": 2564} {"train_loss": -40.82162094116211, "global_step": 310294, "epoch": 2564} {"train_loss": -42.397918701171875, "global_step": 310295, "epoch": 2564} {"train_loss": -41.92039108276367, "global_step": 310296, "epoch": 2564} {"train_loss": -42.50818634033203, "global_step": 310297, "epoch": 2564} {"train_loss": -42.61177444458008, "global_step": 310298, "epoch": 2564} {"train_loss": -41.79085922241211, "global_step": 310299, "epoch": 2564} {"train_loss": -42.53007507324219, "global_step": 310300, "epoch": 2564} {"train_loss": -41.98809814453125, "global_step": 310301, "epoch": 2564} {"train_loss": -42.4561882019043, "global_step": 310302, "epoch": 2564} {"train_loss": -40.92157745361328, "global_step": 310303, "epoch": 2564} {"train_loss": -40.20365524291992, "global_step": 310304, "epoch": 2564} {"train_loss": -41.33977508544922, "global_step": 310305, "epoch": 2564} {"train_loss": -42.63422393798828, "global_step": 310306, "epoch": 2564} {"train_loss": -42.02498245239258, "global_step": 310307, "epoch": 2564} {"train_loss": -42.41148376464844, "global_step": 310308, "epoch": 2564} {"train_loss": -41.801334381103516, "global_step": 310309, "epoch": 2564} {"train_loss": -41.71080780029297, "global_step": 310310, "epoch": 2564} {"train_loss": -41.646724700927734, "global_step": 310311, "epoch": 2564} {"train_loss": -41.17647171020508, "global_step": 310312, "epoch": 2564} {"train_loss": -42.330039978027344, "global_step": 310313, "epoch": 2564} {"train_loss": -42.4283332824707, "global_step": 310314, "epoch": 2564} {"train_loss": -41.85024642944336, "global_step": 310315, "epoch": 2564} {"train_loss": -42.054317474365234, "global_step": 310316, "epoch": 2564} {"train_loss": -38.40449142456055, "global_step": 310317, "epoch": 2564} {"train_loss": -42.451637268066406, "global_step": 310318, "epoch": 2564} {"train_loss": -41.1200065612793, "global_step": 310319, "epoch": 2564} {"train_loss": -41.83916091918945, "global_step": 310320, "epoch": 2564} {"train_loss": -42.05424880981445, "global_step": 310321, "epoch": 2564} {"train_loss": -41.51759338378906, "global_step": 310322, "epoch": 2564} {"train_loss": -41.479331970214844, "global_step": 310323, "epoch": 2564} {"train_loss": -39.26184844970703, "global_step": 310324, "epoch": 2564} {"train_loss": -41.84843444824219, "global_step": 310325, "epoch": 2564} {"train_loss": -40.744686126708984, "global_step": 310326, "epoch": 2564} {"train_loss": -42.004390716552734, "global_step": 310327, "epoch": 2564} {"train_loss": -41.14204788208008, "global_step": 310328, "epoch": 2564} {"train_loss": -40.653480529785156, "global_step": 310329, "epoch": 2564} {"train_loss": -41.81373977661133, "global_step": 310330, "epoch": 2564} {"train_loss": -41.25230407714844, "global_step": 310331, "epoch": 2564} {"train_loss": -41.2019157409668, "global_step": 310332, "epoch": 2564} {"train_loss": -33.8372917175293, "global_step": 310333, "epoch": 2564} {"train_loss": -40.899131774902344, "global_step": 310334, "epoch": 2564} {"train_loss": -41.07624053955078, "global_step": 310335, "epoch": 2564} {"train_loss": -39.7307014465332, "global_step": 310336, "epoch": 2564} {"train_loss": -37.64335250854492, "global_step": 310337, "epoch": 2564} {"train_loss": -41.333343505859375, "global_step": 310338, "epoch": 2564} {"train_loss": -37.15230178833008, "global_step": 310339, "epoch": 2564} {"train_loss": -41.41594314575195, "global_step": 310340, "epoch": 2564} {"train_loss": -36.41333770751953, "global_step": 310341, "epoch": 2564} {"train_loss": -41.086570739746094, "global_step": 310342, "epoch": 2564} {"train_loss": -41.630775451660156, "global_step": 310343, "epoch": 2564} {"train_loss": -35.64234161376953, "global_step": 310344, "epoch": 2564} {"train_loss": -35.14516067504883, "global_step": 310345, "epoch": 2564} {"train_loss": -39.57876968383789, "global_step": 310346, "epoch": 2564} {"train_loss": -41.7839241027832, "global_step": 310347, "epoch": 2564} {"train_loss": -41.64210891723633, "global_step": 310348, "epoch": 2564} {"train_loss": -42.29387283325195, "global_step": 310349, "epoch": 2564} {"train_loss": -41.67804718017578, "global_step": 310350, "epoch": 2564} {"train_loss": -40.31611251831055, "global_step": 310351, "epoch": 2564} {"train_loss": -39.27518844604492, "global_step": 310352, "epoch": 2564} {"train_loss": -41.09060287475586, "global_step": 310353, "epoch": 2564} {"train_loss": -40.33988571166992, "global_step": 310354, "epoch": 2564} {"train_loss": -39.43522262573242, "global_step": 310355, "epoch": 2564} {"train_loss": -40.856056213378906, "global_step": 310356, "epoch": 2564} {"train_loss": -42.14205551147461, "global_step": 310357, "epoch": 2564} {"train_loss": -41.39524841308594, "global_step": 310358, "epoch": 2564} {"train_loss": -42.08232116699219, "global_step": 310359, "epoch": 2564} {"train_loss": -40.21017074584961, "global_step": 310360, "epoch": 2564} {"train_loss": -40.25544357299805, "global_step": 310361, "epoch": 2564} {"train_loss": -42.5003776550293, "global_step": 310362, "epoch": 2564} {"train_loss": -39.63152313232422, "global_step": 310363, "epoch": 2564} {"train_loss": -41.01564382127494, "global_step": 310364, "epoch": 2564, "val_loss": 2708226.25} {"train_loss": -41.85758590698242, "global_step": 310365, "epoch": 2565} {"train_loss": -41.860260009765625, "global_step": 310366, "epoch": 2565} {"train_loss": -41.55167770385742, "global_step": 310367, "epoch": 2565} {"train_loss": -40.94857406616211, "global_step": 310368, "epoch": 2565} {"train_loss": -41.19784164428711, "global_step": 310369, "epoch": 2565} {"train_loss": -41.18583297729492, "global_step": 310370, "epoch": 2565} {"train_loss": -41.3674201965332, "global_step": 310371, "epoch": 2565} {"train_loss": -41.71675491333008, "global_step": 310372, "epoch": 2565} {"train_loss": -35.17616653442383, "global_step": 310373, "epoch": 2565} {"train_loss": -41.61219024658203, "global_step": 310374, "epoch": 2565} {"train_loss": -41.66274642944336, "global_step": 310375, "epoch": 2565} {"train_loss": -42.70345687866211, "global_step": 310376, "epoch": 2565} {"train_loss": -41.35880661010742, "global_step": 310377, "epoch": 2565} {"train_loss": -42.1983642578125, "global_step": 310378, "epoch": 2565} {"train_loss": -41.557186126708984, "global_step": 310379, "epoch": 2565} {"train_loss": -40.754127502441406, "global_step": 310380, "epoch": 2565} {"train_loss": -42.42805099487305, "global_step": 310381, "epoch": 2565} {"train_loss": -42.39519500732422, "global_step": 310382, "epoch": 2565} {"train_loss": -42.922977447509766, "global_step": 310383, "epoch": 2565} {"train_loss": -39.5162353515625, "global_step": 310384, "epoch": 2565} {"train_loss": -42.42619705200195, "global_step": 310385, "epoch": 2565} {"train_loss": -42.63538360595703, "global_step": 310386, "epoch": 2565} {"train_loss": -42.24361801147461, "global_step": 310387, "epoch": 2565} {"train_loss": -42.13912582397461, "global_step": 310388, "epoch": 2565} {"train_loss": -42.6961784362793, "global_step": 310389, "epoch": 2565} {"train_loss": -42.435054779052734, "global_step": 310390, "epoch": 2565} {"train_loss": -41.732635498046875, "global_step": 310391, "epoch": 2565} {"train_loss": -40.551300048828125, "global_step": 310392, "epoch": 2565} {"train_loss": -42.831993103027344, "global_step": 310393, "epoch": 2565} {"train_loss": -42.992210388183594, "global_step": 310394, "epoch": 2565} {"train_loss": -42.92316436767578, "global_step": 310395, "epoch": 2565} {"train_loss": -41.04682159423828, "global_step": 310396, "epoch": 2565} {"train_loss": -42.12915802001953, "global_step": 310397, "epoch": 2565} {"train_loss": -41.83753967285156, "global_step": 310398, "epoch": 2565} {"train_loss": -43.137672424316406, "global_step": 310399, "epoch": 2565} {"train_loss": -42.1940803527832, "global_step": 310400, "epoch": 2565} {"train_loss": -42.84603500366211, "global_step": 310401, "epoch": 2565} {"train_loss": -42.48935317993164, "global_step": 310402, "epoch": 2565} {"train_loss": -42.987117767333984, "global_step": 310403, "epoch": 2565} {"train_loss": -42.53859329223633, "global_step": 310404, "epoch": 2565} {"train_loss": -42.47089767456055, "global_step": 310405, "epoch": 2565} {"train_loss": -42.80607223510742, "global_step": 310406, "epoch": 2565} {"train_loss": -41.932861328125, "global_step": 310407, "epoch": 2565} {"train_loss": -42.899017333984375, "global_step": 310408, "epoch": 2565} {"train_loss": -42.62851333618164, "global_step": 310409, "epoch": 2565} {"train_loss": -42.38206100463867, "global_step": 310410, "epoch": 2565} {"train_loss": -39.86383056640625, "global_step": 310411, "epoch": 2565} {"train_loss": -42.18087387084961, "global_step": 310412, "epoch": 2565} {"train_loss": -42.657264709472656, "global_step": 310413, "epoch": 2565} {"train_loss": -42.79084014892578, "global_step": 310414, "epoch": 2565} {"train_loss": -42.145259857177734, "global_step": 310415, "epoch": 2565} {"train_loss": -42.52143096923828, "global_step": 310416, "epoch": 2565} {"train_loss": -42.32278823852539, "global_step": 310417, "epoch": 2565} {"train_loss": -42.31107711791992, "global_step": 310418, "epoch": 2565} {"train_loss": -40.53810501098633, "global_step": 310419, "epoch": 2565} {"train_loss": -41.81352615356445, "global_step": 310420, "epoch": 2565} {"train_loss": -42.19673156738281, "global_step": 310421, "epoch": 2565} {"train_loss": -42.37803268432617, "global_step": 310422, "epoch": 2565} {"train_loss": -42.84192657470703, "global_step": 310423, "epoch": 2565} {"train_loss": -42.87385177612305, "global_step": 310424, "epoch": 2565} {"train_loss": -43.01882553100586, "global_step": 310425, "epoch": 2565} {"train_loss": -42.722835540771484, "global_step": 310426, "epoch": 2565} {"train_loss": -42.98051834106445, "global_step": 310427, "epoch": 2565} {"train_loss": -42.910621643066406, "global_step": 310428, "epoch": 2565} {"train_loss": -36.47953414916992, "global_step": 310429, "epoch": 2565} {"train_loss": -42.260555267333984, "global_step": 310430, "epoch": 2565} {"train_loss": -43.128047943115234, "global_step": 310431, "epoch": 2565} {"train_loss": -41.77372360229492, "global_step": 310432, "epoch": 2565} {"train_loss": -41.500709533691406, "global_step": 310433, "epoch": 2565} {"train_loss": -42.04718780517578, "global_step": 310434, "epoch": 2565} {"train_loss": -42.40666580200195, "global_step": 310435, "epoch": 2565} {"train_loss": -42.29834747314453, "global_step": 310436, "epoch": 2565} {"train_loss": -41.393272399902344, "global_step": 310437, "epoch": 2565} {"train_loss": -42.73244857788086, "global_step": 310438, "epoch": 2565} {"train_loss": -41.868751525878906, "global_step": 310439, "epoch": 2565} {"train_loss": -42.14321517944336, "global_step": 310440, "epoch": 2565} {"train_loss": -41.98106002807617, "global_step": 310441, "epoch": 2565} {"train_loss": -42.62678146362305, "global_step": 310442, "epoch": 2565} {"train_loss": -42.62580108642578, "global_step": 310443, "epoch": 2565} {"train_loss": -42.686363220214844, "global_step": 310444, "epoch": 2565} {"train_loss": -42.34260177612305, "global_step": 310445, "epoch": 2565} {"train_loss": -43.2418212890625, "global_step": 310446, "epoch": 2565} {"train_loss": -42.706302642822266, "global_step": 310447, "epoch": 2565} {"train_loss": -42.676490783691406, "global_step": 310448, "epoch": 2565} {"train_loss": -42.30831527709961, "global_step": 310449, "epoch": 2565} {"train_loss": -42.761512756347656, "global_step": 310450, "epoch": 2565} {"train_loss": -42.918121337890625, "global_step": 310451, "epoch": 2565} {"train_loss": -42.962188720703125, "global_step": 310452, "epoch": 2565} {"train_loss": -43.38309860229492, "global_step": 310453, "epoch": 2565} {"train_loss": -43.43411636352539, "global_step": 310454, "epoch": 2565} {"train_loss": -42.9132080078125, "global_step": 310455, "epoch": 2565} {"train_loss": -42.71072006225586, "global_step": 310456, "epoch": 2565} {"train_loss": -42.8439826965332, "global_step": 310457, "epoch": 2565} {"train_loss": -43.674964904785156, "global_step": 310458, "epoch": 2565} {"train_loss": -42.42211151123047, "global_step": 310459, "epoch": 2565} {"train_loss": -42.13069534301758, "global_step": 310460, "epoch": 2565} {"train_loss": -42.78430938720703, "global_step": 310461, "epoch": 2565} {"train_loss": -42.78935623168945, "global_step": 310462, "epoch": 2565} {"train_loss": -42.188785552978516, "global_step": 310463, "epoch": 2565} {"train_loss": -42.59386444091797, "global_step": 310464, "epoch": 2565} {"train_loss": -42.464019775390625, "global_step": 310465, "epoch": 2565} {"train_loss": -43.20426559448242, "global_step": 310466, "epoch": 2565} {"train_loss": -42.77470016479492, "global_step": 310467, "epoch": 2565} {"train_loss": -41.95552444458008, "global_step": 310468, "epoch": 2565} {"train_loss": -41.685447692871094, "global_step": 310469, "epoch": 2565} {"train_loss": -42.37603759765625, "global_step": 310470, "epoch": 2565} {"train_loss": -42.79029846191406, "global_step": 310471, "epoch": 2565} {"train_loss": -42.006595611572266, "global_step": 310472, "epoch": 2565} {"train_loss": -41.273658752441406, "global_step": 310473, "epoch": 2565} {"train_loss": -42.685237884521484, "global_step": 310474, "epoch": 2565} {"train_loss": -42.81724166870117, "global_step": 310475, "epoch": 2565} {"train_loss": -42.76483154296875, "global_step": 310476, "epoch": 2565} {"train_loss": -42.96232604980469, "global_step": 310477, "epoch": 2565} {"train_loss": -42.536354064941406, "global_step": 310478, "epoch": 2565} {"train_loss": -41.54279708862305, "global_step": 310479, "epoch": 2565} {"train_loss": -42.289241790771484, "global_step": 310480, "epoch": 2565} {"train_loss": -43.267005920410156, "global_step": 310481, "epoch": 2565} {"train_loss": -42.78884506225586, "global_step": 310482, "epoch": 2565} {"train_loss": -42.886043548583984, "global_step": 310483, "epoch": 2565} {"train_loss": -40.91806411743164, "global_step": 310484, "epoch": 2565} {"train_loss": -42.16694297475263, "global_step": 310485, "epoch": 2565, "val_loss": 2824578.75} {"train_loss": -40.3723258972168, "global_step": 310486, "epoch": 2566} {"train_loss": -42.64525604248047, "global_step": 310487, "epoch": 2566} {"train_loss": -40.91602325439453, "global_step": 310488, "epoch": 2566} {"train_loss": -41.054683685302734, "global_step": 310489, "epoch": 2566} {"train_loss": -42.34055709838867, "global_step": 310490, "epoch": 2566} {"train_loss": -42.288185119628906, "global_step": 310491, "epoch": 2566} {"train_loss": -42.9373664855957, "global_step": 310492, "epoch": 2566} {"train_loss": -42.812538146972656, "global_step": 310493, "epoch": 2566} {"train_loss": -43.02412033081055, "global_step": 310494, "epoch": 2566} {"train_loss": -43.287811279296875, "global_step": 310495, "epoch": 2566} {"train_loss": -42.057533264160156, "global_step": 310496, "epoch": 2566} {"train_loss": -42.632469177246094, "global_step": 310497, "epoch": 2566} {"train_loss": -42.913021087646484, "global_step": 310498, "epoch": 2566} {"train_loss": -43.54850769042969, "global_step": 310499, "epoch": 2566} {"train_loss": -42.23978805541992, "global_step": 310500, "epoch": 2566} {"train_loss": -43.15955352783203, "global_step": 310501, "epoch": 2566} {"train_loss": -43.607933044433594, "global_step": 310502, "epoch": 2566} {"train_loss": -42.59529495239258, "global_step": 310503, "epoch": 2566} {"train_loss": -42.87434005737305, "global_step": 310504, "epoch": 2566} {"train_loss": -43.02203369140625, "global_step": 310505, "epoch": 2566} {"train_loss": -42.82158279418945, "global_step": 310506, "epoch": 2566} {"train_loss": -43.51668930053711, "global_step": 310507, "epoch": 2566} {"train_loss": -42.1525764465332, "global_step": 310508, "epoch": 2566} {"train_loss": -43.45339584350586, "global_step": 310509, "epoch": 2566} {"train_loss": -42.2116584777832, "global_step": 310510, "epoch": 2566} {"train_loss": -43.63181686401367, "global_step": 310511, "epoch": 2566} {"train_loss": -42.97734069824219, "global_step": 310512, "epoch": 2566} {"train_loss": -43.0319709777832, "global_step": 310513, "epoch": 2566} {"train_loss": -42.8302001953125, "global_step": 310514, "epoch": 2566} {"train_loss": -43.42537307739258, "global_step": 310515, "epoch": 2566} {"train_loss": -43.600955963134766, "global_step": 310516, "epoch": 2566} {"train_loss": -43.059295654296875, "global_step": 310517, "epoch": 2566} {"train_loss": -43.7509880065918, "global_step": 310518, "epoch": 2566} {"train_loss": -43.53559494018555, "global_step": 310519, "epoch": 2566} {"train_loss": -43.29777145385742, "global_step": 310520, "epoch": 2566} {"train_loss": -43.948970794677734, "global_step": 310521, "epoch": 2566} {"train_loss": -43.02518844604492, "global_step": 310522, "epoch": 2566} {"train_loss": -43.20132827758789, "global_step": 310523, "epoch": 2566} {"train_loss": -42.94709014892578, "global_step": 310524, "epoch": 2566} {"train_loss": -43.507572174072266, "global_step": 310525, "epoch": 2566} {"train_loss": -43.16651153564453, "global_step": 310526, "epoch": 2566} {"train_loss": -42.55645751953125, "global_step": 310527, "epoch": 2566} {"train_loss": -43.426063537597656, "global_step": 310528, "epoch": 2566} {"train_loss": -43.7718620300293, "global_step": 310529, "epoch": 2566} {"train_loss": -42.9152946472168, "global_step": 310530, "epoch": 2566} {"train_loss": -42.24871063232422, "global_step": 310531, "epoch": 2566} {"train_loss": -43.23014831542969, "global_step": 310532, "epoch": 2566} {"train_loss": -43.45072937011719, "global_step": 310533, "epoch": 2566} {"train_loss": -43.5069465637207, "global_step": 310534, "epoch": 2566} {"train_loss": -42.47528076171875, "global_step": 310535, "epoch": 2566} {"train_loss": -43.80903625488281, "global_step": 310536, "epoch": 2566} {"train_loss": -43.54056167602539, "global_step": 310537, "epoch": 2566} {"train_loss": -43.74576950073242, "global_step": 310538, "epoch": 2566} {"train_loss": -43.23860168457031, "global_step": 310539, "epoch": 2566} {"train_loss": -42.83561325073242, "global_step": 310540, "epoch": 2566} {"train_loss": -43.51292037963867, "global_step": 310541, "epoch": 2566} {"train_loss": -43.48025131225586, "global_step": 310542, "epoch": 2566} {"train_loss": -42.54642868041992, "global_step": 310543, "epoch": 2566} {"train_loss": -43.44157028198242, "global_step": 310544, "epoch": 2566} {"train_loss": -43.11002731323242, "global_step": 310545, "epoch": 2566} {"train_loss": -43.84218978881836, "global_step": 310546, "epoch": 2566} {"train_loss": -43.41485595703125, "global_step": 310547, "epoch": 2566} {"train_loss": -43.80208969116211, "global_step": 310548, "epoch": 2566} {"train_loss": -43.968788146972656, "global_step": 310549, "epoch": 2566} {"train_loss": -44.1019401550293, "global_step": 310550, "epoch": 2566} {"train_loss": -43.83747482299805, "global_step": 310551, "epoch": 2566} {"train_loss": -43.75564193725586, "global_step": 310552, "epoch": 2566} {"train_loss": -43.904388427734375, "global_step": 310553, "epoch": 2566} {"train_loss": -43.3071174621582, "global_step": 310554, "epoch": 2566} {"train_loss": -43.111202239990234, "global_step": 310555, "epoch": 2566} {"train_loss": -42.16169357299805, "global_step": 310556, "epoch": 2566} {"train_loss": -42.530635833740234, "global_step": 310557, "epoch": 2566} {"train_loss": -40.756011962890625, "global_step": 310558, "epoch": 2566} {"train_loss": -39.087772369384766, "global_step": 310559, "epoch": 2566} {"train_loss": -37.92374801635742, "global_step": 310560, "epoch": 2566} {"train_loss": -38.387855529785156, "global_step": 310561, "epoch": 2566} {"train_loss": -39.853607177734375, "global_step": 310562, "epoch": 2566} {"train_loss": -42.201656341552734, "global_step": 310563, "epoch": 2566} {"train_loss": -42.08330154418945, "global_step": 310564, "epoch": 2566} {"train_loss": -40.75605773925781, "global_step": 310565, "epoch": 2566} {"train_loss": -42.22707748413086, "global_step": 310566, "epoch": 2566} {"train_loss": -42.14126205444336, "global_step": 310567, "epoch": 2566} {"train_loss": -39.97053909301758, "global_step": 310568, "epoch": 2566} {"train_loss": -42.066287994384766, "global_step": 310569, "epoch": 2566} {"train_loss": -42.43824005126953, "global_step": 310570, "epoch": 2566} {"train_loss": -41.41816329956055, "global_step": 310571, "epoch": 2566} {"train_loss": -42.06824493408203, "global_step": 310572, "epoch": 2566} {"train_loss": -41.96440124511719, "global_step": 310573, "epoch": 2566} {"train_loss": -41.42716979980469, "global_step": 310574, "epoch": 2566} {"train_loss": -41.87652587890625, "global_step": 310575, "epoch": 2566} {"train_loss": -42.918365478515625, "global_step": 310576, "epoch": 2566} {"train_loss": -42.37053680419922, "global_step": 310577, "epoch": 2566} {"train_loss": -42.75361251831055, "global_step": 310578, "epoch": 2566} {"train_loss": -42.858211517333984, "global_step": 310579, "epoch": 2566} {"train_loss": -42.315589904785156, "global_step": 310580, "epoch": 2566} {"train_loss": -43.11707305908203, "global_step": 310581, "epoch": 2566} {"train_loss": -42.410438537597656, "global_step": 310582, "epoch": 2566} {"train_loss": -42.3059196472168, "global_step": 310583, "epoch": 2566} {"train_loss": -43.1690673828125, "global_step": 310584, "epoch": 2566} {"train_loss": -42.642093658447266, "global_step": 310585, "epoch": 2566} {"train_loss": -42.874576568603516, "global_step": 310586, "epoch": 2566} {"train_loss": -42.587642669677734, "global_step": 310587, "epoch": 2566} {"train_loss": -42.8145866394043, "global_step": 310588, "epoch": 2566} {"train_loss": -43.46885299682617, "global_step": 310589, "epoch": 2566} {"train_loss": -42.46966552734375, "global_step": 310590, "epoch": 2566} {"train_loss": -42.561065673828125, "global_step": 310591, "epoch": 2566} {"train_loss": -42.59609603881836, "global_step": 310592, "epoch": 2566} {"train_loss": -43.09246826171875, "global_step": 310593, "epoch": 2566} {"train_loss": -43.409584045410156, "global_step": 310594, "epoch": 2566} {"train_loss": -43.50809860229492, "global_step": 310595, "epoch": 2566} {"train_loss": -44.0670166015625, "global_step": 310596, "epoch": 2566} {"train_loss": -43.60233688354492, "global_step": 310597, "epoch": 2566} {"train_loss": -43.263587951660156, "global_step": 310598, "epoch": 2566} {"train_loss": -43.34352493286133, "global_step": 310599, "epoch": 2566} {"train_loss": -43.25719451904297, "global_step": 310600, "epoch": 2566} {"train_loss": -42.37965774536133, "global_step": 310601, "epoch": 2566} {"train_loss": -43.25731658935547, "global_step": 310602, "epoch": 2566} {"train_loss": -43.421356201171875, "global_step": 310603, "epoch": 2566} {"train_loss": -43.88588333129883, "global_step": 310604, "epoch": 2566} {"train_loss": -43.45225143432617, "global_step": 310605, "epoch": 2566} {"train_loss": -42.74393636530096, "global_step": 310606, "epoch": 2566, "val_loss": 2755336.0} {"train_loss": -43.794281005859375, "global_step": 310607, "epoch": 2567} {"train_loss": -43.97312545776367, "global_step": 310608, "epoch": 2567} {"train_loss": -43.47746658325195, "global_step": 310609, "epoch": 2567} {"train_loss": -43.56772232055664, "global_step": 310610, "epoch": 2567} {"train_loss": -43.59782791137695, "global_step": 310611, "epoch": 2567} {"train_loss": -43.914283752441406, "global_step": 310612, "epoch": 2567} {"train_loss": -43.68529510498047, "global_step": 310613, "epoch": 2567} {"train_loss": -43.2532958984375, "global_step": 310614, "epoch": 2567} {"train_loss": -43.97639083862305, "global_step": 310615, "epoch": 2567} {"train_loss": -44.139949798583984, "global_step": 310616, "epoch": 2567} {"train_loss": -44.0308952331543, "global_step": 310617, "epoch": 2567} {"train_loss": -43.83976745605469, "global_step": 310618, "epoch": 2567} {"train_loss": -44.01213073730469, "global_step": 310619, "epoch": 2567} {"train_loss": -44.38201141357422, "global_step": 310620, "epoch": 2567} {"train_loss": -43.52174758911133, "global_step": 310621, "epoch": 2567} {"train_loss": -44.23530960083008, "global_step": 310622, "epoch": 2567} {"train_loss": -43.598575592041016, "global_step": 310623, "epoch": 2567} {"train_loss": -44.341487884521484, "global_step": 310624, "epoch": 2567} {"train_loss": -44.39265060424805, "global_step": 310625, "epoch": 2567} {"train_loss": -43.83185958862305, "global_step": 310626, "epoch": 2567} {"train_loss": -43.86756896972656, "global_step": 310627, "epoch": 2567} {"train_loss": -44.363094329833984, "global_step": 310628, "epoch": 2567} {"train_loss": -43.45121383666992, "global_step": 310629, "epoch": 2567} {"train_loss": -44.33979415893555, "global_step": 310630, "epoch": 2567} {"train_loss": -43.61085510253906, "global_step": 310631, "epoch": 2567} {"train_loss": -43.00625228881836, "global_step": 310632, "epoch": 2567} {"train_loss": -44.30863571166992, "global_step": 310633, "epoch": 2567} {"train_loss": -44.322174072265625, "global_step": 310634, "epoch": 2567} {"train_loss": -43.93855667114258, "global_step": 310635, "epoch": 2567} {"train_loss": -44.09169006347656, "global_step": 310636, "epoch": 2567} {"train_loss": -43.98163986206055, "global_step": 310637, "epoch": 2567} {"train_loss": -42.64861297607422, "global_step": 310638, "epoch": 2567} {"train_loss": -40.275306701660156, "global_step": 310639, "epoch": 2567} {"train_loss": -39.11103057861328, "global_step": 310640, "epoch": 2567} {"train_loss": -36.6058349609375, "global_step": 310641, "epoch": 2567} {"train_loss": -39.04372024536133, "global_step": 310642, "epoch": 2567} {"train_loss": -41.67606735229492, "global_step": 310643, "epoch": 2567} {"train_loss": -43.089839935302734, "global_step": 310644, "epoch": 2567} {"train_loss": -41.18963623046875, "global_step": 310645, "epoch": 2567} {"train_loss": -40.460140228271484, "global_step": 310646, "epoch": 2567} {"train_loss": -41.6619987487793, "global_step": 310647, "epoch": 2567} {"train_loss": -43.25028610229492, "global_step": 310648, "epoch": 2567} {"train_loss": -42.4160041809082, "global_step": 310649, "epoch": 2567} {"train_loss": -42.58155059814453, "global_step": 310650, "epoch": 2567} {"train_loss": -41.688289642333984, "global_step": 310651, "epoch": 2567} {"train_loss": -42.54215621948242, "global_step": 310652, "epoch": 2567} {"train_loss": -41.49086380004883, "global_step": 310653, "epoch": 2567} {"train_loss": -42.57050323486328, "global_step": 310654, "epoch": 2567} {"train_loss": -42.441688537597656, "global_step": 310655, "epoch": 2567} {"train_loss": -40.363433837890625, "global_step": 310656, "epoch": 2567} {"train_loss": -42.44500732421875, "global_step": 310657, "epoch": 2567} {"train_loss": -42.470428466796875, "global_step": 310658, "epoch": 2567} {"train_loss": -43.6783332824707, "global_step": 310659, "epoch": 2567} {"train_loss": -42.246089935302734, "global_step": 310660, "epoch": 2567} {"train_loss": -42.8878288269043, "global_step": 310661, "epoch": 2567} {"train_loss": -42.3519287109375, "global_step": 310662, "epoch": 2567} {"train_loss": -41.209747314453125, "global_step": 310663, "epoch": 2567} {"train_loss": -43.249420166015625, "global_step": 310664, "epoch": 2567} {"train_loss": -42.487220764160156, "global_step": 310665, "epoch": 2567} {"train_loss": -42.61087417602539, "global_step": 310666, "epoch": 2567} {"train_loss": -42.751773834228516, "global_step": 310667, "epoch": 2567} {"train_loss": -41.9339485168457, "global_step": 310668, "epoch": 2567} {"train_loss": -42.34701156616211, "global_step": 310669, "epoch": 2567} {"train_loss": -42.34125518798828, "global_step": 310670, "epoch": 2567} {"train_loss": -41.906097412109375, "global_step": 310671, "epoch": 2567} {"train_loss": -42.94702911376953, "global_step": 310672, "epoch": 2567} {"train_loss": -42.53300094604492, "global_step": 310673, "epoch": 2567} {"train_loss": -41.695125579833984, "global_step": 310674, "epoch": 2567} {"train_loss": -42.74619674682617, "global_step": 310675, "epoch": 2567} {"train_loss": -43.66011428833008, "global_step": 310676, "epoch": 2567} {"train_loss": -41.98386764526367, "global_step": 310677, "epoch": 2567} {"train_loss": -42.509769439697266, "global_step": 310678, "epoch": 2567} {"train_loss": -42.24626922607422, "global_step": 310679, "epoch": 2567} {"train_loss": -43.02417755126953, "global_step": 310680, "epoch": 2567} {"train_loss": -43.18415451049805, "global_step": 310681, "epoch": 2567} {"train_loss": -42.861080169677734, "global_step": 310682, "epoch": 2567} {"train_loss": -43.21763229370117, "global_step": 310683, "epoch": 2567} {"train_loss": -43.563045501708984, "global_step": 310684, "epoch": 2567} {"train_loss": -43.2669792175293, "global_step": 310685, "epoch": 2567} {"train_loss": -43.83955001831055, "global_step": 310686, "epoch": 2567} {"train_loss": -42.90399169921875, "global_step": 310687, "epoch": 2567} {"train_loss": -43.8089599609375, "global_step": 310688, "epoch": 2567} {"train_loss": -43.0780143737793, "global_step": 310689, "epoch": 2567} {"train_loss": -43.769317626953125, "global_step": 310690, "epoch": 2567} {"train_loss": -43.7802848815918, "global_step": 310691, "epoch": 2567} {"train_loss": -43.37759017944336, "global_step": 310692, "epoch": 2567} {"train_loss": -43.66880416870117, "global_step": 310693, "epoch": 2567} {"train_loss": -43.873313903808594, "global_step": 310694, "epoch": 2567} {"train_loss": -43.90184783935547, "global_step": 310695, "epoch": 2567} {"train_loss": -43.23737716674805, "global_step": 310696, "epoch": 2567} {"train_loss": -43.71500778198242, "global_step": 310697, "epoch": 2567} {"train_loss": -43.9965934753418, "global_step": 310698, "epoch": 2567} {"train_loss": -44.389461517333984, "global_step": 310699, "epoch": 2567} {"train_loss": -44.02964401245117, "global_step": 310700, "epoch": 2567} {"train_loss": -43.95738220214844, "global_step": 310701, "epoch": 2567} {"train_loss": -43.82119369506836, "global_step": 310702, "epoch": 2567} {"train_loss": -43.62119674682617, "global_step": 310703, "epoch": 2567} {"train_loss": -43.79789733886719, "global_step": 310704, "epoch": 2567} {"train_loss": -43.35188674926758, "global_step": 310705, "epoch": 2567} {"train_loss": -44.08443069458008, "global_step": 310706, "epoch": 2567} {"train_loss": -43.903263092041016, "global_step": 310707, "epoch": 2567} {"train_loss": -44.30128860473633, "global_step": 310708, "epoch": 2567} {"train_loss": -44.09326171875, "global_step": 310709, "epoch": 2567} {"train_loss": -43.618412017822266, "global_step": 310710, "epoch": 2567} {"train_loss": -44.460365295410156, "global_step": 310711, "epoch": 2567} {"train_loss": -44.59763717651367, "global_step": 310712, "epoch": 2567} {"train_loss": -43.673927307128906, "global_step": 310713, "epoch": 2567} {"train_loss": -43.97915267944336, "global_step": 310714, "epoch": 2567} {"train_loss": -44.10639572143555, "global_step": 310715, "epoch": 2567} {"train_loss": -44.522987365722656, "global_step": 310716, "epoch": 2567} {"train_loss": -44.6181755065918, "global_step": 310717, "epoch": 2567} {"train_loss": -43.93907928466797, "global_step": 310718, "epoch": 2567} {"train_loss": -44.592403411865234, "global_step": 310719, "epoch": 2567} {"train_loss": -44.37295150756836, "global_step": 310720, "epoch": 2567} {"train_loss": -44.12921142578125, "global_step": 310721, "epoch": 2567} {"train_loss": -43.69710159301758, "global_step": 310722, "epoch": 2567} {"train_loss": -43.58391189575195, "global_step": 310723, "epoch": 2567} {"train_loss": -44.25651931762695, "global_step": 310724, "epoch": 2567} {"train_loss": -43.09637451171875, "global_step": 310725, "epoch": 2567} {"train_loss": -43.848567962646484, "global_step": 310726, "epoch": 2567} {"train_loss": -43.184169422496446, "global_step": 310727, "epoch": 2567, "val_loss": 2807157.75} {"train_loss": -43.922603607177734, "global_step": 310728, "epoch": 2568} {"train_loss": -43.098819732666016, "global_step": 310729, "epoch": 2568} {"train_loss": -43.40633773803711, "global_step": 310730, "epoch": 2568} {"train_loss": -43.39364242553711, "global_step": 310731, "epoch": 2568} {"train_loss": -43.846435546875, "global_step": 310732, "epoch": 2568} {"train_loss": -43.02493667602539, "global_step": 310733, "epoch": 2568} {"train_loss": -43.93632888793945, "global_step": 310734, "epoch": 2568} {"train_loss": -43.80814743041992, "global_step": 310735, "epoch": 2568} {"train_loss": -43.27720260620117, "global_step": 310736, "epoch": 2568} {"train_loss": -42.699764251708984, "global_step": 310737, "epoch": 2568} {"train_loss": -43.69574737548828, "global_step": 310738, "epoch": 2568} {"train_loss": -41.97983932495117, "global_step": 310739, "epoch": 2568} {"train_loss": -40.459869384765625, "global_step": 310740, "epoch": 2568} {"train_loss": -42.46657943725586, "global_step": 310741, "epoch": 2568} {"train_loss": -42.629512786865234, "global_step": 310742, "epoch": 2568} {"train_loss": -42.595497131347656, "global_step": 310743, "epoch": 2568} {"train_loss": -41.257076263427734, "global_step": 310744, "epoch": 2568} {"train_loss": -42.18984603881836, "global_step": 310745, "epoch": 2568} {"train_loss": -37.951873779296875, "global_step": 310746, "epoch": 2568} {"train_loss": -41.03815841674805, "global_step": 310747, "epoch": 2568} {"train_loss": -40.14073181152344, "global_step": 310748, "epoch": 2568} {"train_loss": -41.36619186401367, "global_step": 310749, "epoch": 2568} {"train_loss": -42.015743255615234, "global_step": 310750, "epoch": 2568} {"train_loss": -41.039669036865234, "global_step": 310751, "epoch": 2568} {"train_loss": -42.360443115234375, "global_step": 310752, "epoch": 2568} {"train_loss": -42.637977600097656, "global_step": 310753, "epoch": 2568} {"train_loss": -41.52370834350586, "global_step": 310754, "epoch": 2568} {"train_loss": -41.75336456298828, "global_step": 310755, "epoch": 2568} {"train_loss": -42.76784133911133, "global_step": 310756, "epoch": 2568} {"train_loss": -41.91474151611328, "global_step": 310757, "epoch": 2568} {"train_loss": -42.87395477294922, "global_step": 310758, "epoch": 2568} {"train_loss": -40.971153259277344, "global_step": 310759, "epoch": 2568} {"train_loss": -41.441097259521484, "global_step": 310760, "epoch": 2568} {"train_loss": -42.13335037231445, "global_step": 310761, "epoch": 2568} {"train_loss": -41.260005950927734, "global_step": 310762, "epoch": 2568} {"train_loss": -41.34003448486328, "global_step": 310763, "epoch": 2568} {"train_loss": -39.652435302734375, "global_step": 310764, "epoch": 2568} {"train_loss": -42.36620330810547, "global_step": 310765, "epoch": 2568} {"train_loss": -41.280025482177734, "global_step": 310766, "epoch": 2568} {"train_loss": -40.5932731628418, "global_step": 310767, "epoch": 2568} {"train_loss": -40.753597259521484, "global_step": 310768, "epoch": 2568} {"train_loss": -42.32633590698242, "global_step": 310769, "epoch": 2568} {"train_loss": -40.986629486083984, "global_step": 310770, "epoch": 2568} {"train_loss": -41.98322677612305, "global_step": 310771, "epoch": 2568} {"train_loss": -41.300445556640625, "global_step": 310772, "epoch": 2568} {"train_loss": -42.10922622680664, "global_step": 310773, "epoch": 2568} {"train_loss": -41.422943115234375, "global_step": 310774, "epoch": 2568} {"train_loss": -42.78181838989258, "global_step": 310775, "epoch": 2568} {"train_loss": -41.52006149291992, "global_step": 310776, "epoch": 2568} {"train_loss": -41.73422622680664, "global_step": 310777, "epoch": 2568} {"train_loss": -42.27766036987305, "global_step": 310778, "epoch": 2568} {"train_loss": -42.35890197753906, "global_step": 310779, "epoch": 2568} {"train_loss": -42.33360290527344, "global_step": 310780, "epoch": 2568} {"train_loss": -42.85858917236328, "global_step": 310781, "epoch": 2568} {"train_loss": -42.402626037597656, "global_step": 310782, "epoch": 2568} {"train_loss": -43.09355926513672, "global_step": 310783, "epoch": 2568} {"train_loss": -43.20243453979492, "global_step": 310784, "epoch": 2568} {"train_loss": -42.8026123046875, "global_step": 310785, "epoch": 2568} {"train_loss": -43.53420639038086, "global_step": 310786, "epoch": 2568} {"train_loss": -43.3558235168457, "global_step": 310787, "epoch": 2568} {"train_loss": -42.69941711425781, "global_step": 310788, "epoch": 2568} {"train_loss": -43.401283264160156, "global_step": 310789, "epoch": 2568} {"train_loss": -43.04679489135742, "global_step": 310790, "epoch": 2568} {"train_loss": -43.85060119628906, "global_step": 310791, "epoch": 2568} {"train_loss": -43.508514404296875, "global_step": 310792, "epoch": 2568} {"train_loss": -43.314517974853516, "global_step": 310793, "epoch": 2568} {"train_loss": -44.076210021972656, "global_step": 310794, "epoch": 2568} {"train_loss": -43.78269577026367, "global_step": 310795, "epoch": 2568} {"train_loss": -43.28049850463867, "global_step": 310796, "epoch": 2568} {"train_loss": -44.050201416015625, "global_step": 310797, "epoch": 2568} {"train_loss": -43.4296760559082, "global_step": 310798, "epoch": 2568} {"train_loss": -43.62800216674805, "global_step": 310799, "epoch": 2568} {"train_loss": -43.72291946411133, "global_step": 310800, "epoch": 2568} {"train_loss": -43.55698776245117, "global_step": 310801, "epoch": 2568} {"train_loss": -43.692501068115234, "global_step": 310802, "epoch": 2568} {"train_loss": -44.1669807434082, "global_step": 310803, "epoch": 2568} {"train_loss": -43.1496467590332, "global_step": 310804, "epoch": 2568} {"train_loss": -43.0516471862793, "global_step": 310805, "epoch": 2568} {"train_loss": -44.3043098449707, "global_step": 310806, "epoch": 2568} {"train_loss": -43.31352615356445, "global_step": 310807, "epoch": 2568} {"train_loss": -43.8054313659668, "global_step": 310808, "epoch": 2568} {"train_loss": -44.01606369018555, "global_step": 310809, "epoch": 2568} {"train_loss": -43.551082611083984, "global_step": 310810, "epoch": 2568} {"train_loss": -43.71174240112305, "global_step": 310811, "epoch": 2568} {"train_loss": -44.545440673828125, "global_step": 310812, "epoch": 2568} {"train_loss": -43.95694351196289, "global_step": 310813, "epoch": 2568} {"train_loss": -44.0219841003418, "global_step": 310814, "epoch": 2568} {"train_loss": -43.98629379272461, "global_step": 310815, "epoch": 2568} {"train_loss": -43.997642517089844, "global_step": 310816, "epoch": 2568} {"train_loss": -44.058692932128906, "global_step": 310817, "epoch": 2568} {"train_loss": -44.292049407958984, "global_step": 310818, "epoch": 2568} {"train_loss": -44.44379806518555, "global_step": 310819, "epoch": 2568} {"train_loss": -44.3981819152832, "global_step": 310820, "epoch": 2568} {"train_loss": -43.80131530761719, "global_step": 310821, "epoch": 2568} {"train_loss": -43.87389373779297, "global_step": 310822, "epoch": 2568} {"train_loss": -44.5283088684082, "global_step": 310823, "epoch": 2568} {"train_loss": -43.88393020629883, "global_step": 310824, "epoch": 2568} {"train_loss": -44.43202209472656, "global_step": 310825, "epoch": 2568} {"train_loss": -44.31768035888672, "global_step": 310826, "epoch": 2568} {"train_loss": -44.306129455566406, "global_step": 310827, "epoch": 2568} {"train_loss": -44.64022445678711, "global_step": 310828, "epoch": 2568} {"train_loss": -44.301979064941406, "global_step": 310829, "epoch": 2568} {"train_loss": -44.18903350830078, "global_step": 310830, "epoch": 2568} {"train_loss": -42.49650192260742, "global_step": 310831, "epoch": 2568} {"train_loss": -43.311683654785156, "global_step": 310832, "epoch": 2568} {"train_loss": -43.718406677246094, "global_step": 310833, "epoch": 2568} {"train_loss": -43.7582893371582, "global_step": 310834, "epoch": 2568} {"train_loss": -43.6829719543457, "global_step": 310835, "epoch": 2568} {"train_loss": -42.89827346801758, "global_step": 310836, "epoch": 2568} {"train_loss": -42.61494064331055, "global_step": 310837, "epoch": 2568} {"train_loss": -43.937862396240234, "global_step": 310838, "epoch": 2568} {"train_loss": -44.14558792114258, "global_step": 310839, "epoch": 2568} {"train_loss": -42.5418815612793, "global_step": 310840, "epoch": 2568} {"train_loss": -40.416011810302734, "global_step": 310841, "epoch": 2568} {"train_loss": -42.17778015136719, "global_step": 310842, "epoch": 2568} {"train_loss": -43.93052291870117, "global_step": 310843, "epoch": 2568} {"train_loss": -41.34275817871094, "global_step": 310844, "epoch": 2568} {"train_loss": -35.47858810424805, "global_step": 310845, "epoch": 2568} {"train_loss": -30.888391494750977, "global_step": 310846, "epoch": 2568} {"train_loss": -35.554805755615234, "global_step": 310847, "epoch": 2568} {"train_loss": -42.63914166600251, "global_step": 310848, "epoch": 2568, "val_loss": 2807634.25} {"train_loss": -40.39335632324219, "global_step": 310849, "epoch": 2569} {"train_loss": -40.66291809082031, "global_step": 310850, "epoch": 2569} {"train_loss": -40.7226676940918, "global_step": 310851, "epoch": 2569} {"train_loss": -40.50835037231445, "global_step": 310852, "epoch": 2569} {"train_loss": -41.03011703491211, "global_step": 310853, "epoch": 2569} {"train_loss": -41.682918548583984, "global_step": 310854, "epoch": 2569} {"train_loss": -40.251502990722656, "global_step": 310855, "epoch": 2569} {"train_loss": -41.24077224731445, "global_step": 310856, "epoch": 2569} {"train_loss": -38.944610595703125, "global_step": 310857, "epoch": 2569} {"train_loss": -42.23886489868164, "global_step": 310858, "epoch": 2569} {"train_loss": -41.96660614013672, "global_step": 310859, "epoch": 2569} {"train_loss": -38.33620834350586, "global_step": 310860, "epoch": 2569} {"train_loss": -42.05200958251953, "global_step": 310861, "epoch": 2569} {"train_loss": -40.64792251586914, "global_step": 310862, "epoch": 2569} {"train_loss": -42.091796875, "global_step": 310863, "epoch": 2569} {"train_loss": -41.11082077026367, "global_step": 310864, "epoch": 2569} {"train_loss": -41.15584945678711, "global_step": 310865, "epoch": 2569} {"train_loss": -41.749595642089844, "global_step": 310866, "epoch": 2569} {"train_loss": -41.55646896362305, "global_step": 310867, "epoch": 2569} {"train_loss": -42.10178756713867, "global_step": 310868, "epoch": 2569} {"train_loss": -40.711769104003906, "global_step": 310869, "epoch": 2569} {"train_loss": -42.125282287597656, "global_step": 310870, "epoch": 2569} {"train_loss": -43.16331100463867, "global_step": 310871, "epoch": 2569} {"train_loss": -42.919837951660156, "global_step": 310872, "epoch": 2569} {"train_loss": -42.841007232666016, "global_step": 310873, "epoch": 2569} {"train_loss": -40.940181732177734, "global_step": 310874, "epoch": 2569} {"train_loss": -43.00349044799805, "global_step": 310875, "epoch": 2569} {"train_loss": -43.610374450683594, "global_step": 310876, "epoch": 2569} {"train_loss": -43.04315185546875, "global_step": 310877, "epoch": 2569} {"train_loss": -43.75881576538086, "global_step": 310878, "epoch": 2569} {"train_loss": -43.21833038330078, "global_step": 310879, "epoch": 2569} {"train_loss": -43.39435577392578, "global_step": 310880, "epoch": 2569} {"train_loss": -43.02836227416992, "global_step": 310881, "epoch": 2569} {"train_loss": -42.84457015991211, "global_step": 310882, "epoch": 2569} {"train_loss": -43.43433380126953, "global_step": 310883, "epoch": 2569} {"train_loss": -43.233577728271484, "global_step": 310884, "epoch": 2569} {"train_loss": -42.445404052734375, "global_step": 310885, "epoch": 2569} {"train_loss": -42.968788146972656, "global_step": 310886, "epoch": 2569} {"train_loss": -41.79030990600586, "global_step": 310887, "epoch": 2569} {"train_loss": -36.61769485473633, "global_step": 310888, "epoch": 2569} {"train_loss": -43.55410385131836, "global_step": 310889, "epoch": 2569} {"train_loss": -42.58798599243164, "global_step": 310890, "epoch": 2569} {"train_loss": -43.10395431518555, "global_step": 310891, "epoch": 2569} {"train_loss": -42.94365692138672, "global_step": 310892, "epoch": 2569} {"train_loss": -43.56288528442383, "global_step": 310893, "epoch": 2569} {"train_loss": -41.9911003112793, "global_step": 310894, "epoch": 2569} {"train_loss": -41.13178634643555, "global_step": 310895, "epoch": 2569} {"train_loss": -42.341407775878906, "global_step": 310896, "epoch": 2569} {"train_loss": -40.793983459472656, "global_step": 310897, "epoch": 2569} {"train_loss": -43.33541488647461, "global_step": 310898, "epoch": 2569} {"train_loss": -43.98065948486328, "global_step": 310899, "epoch": 2569} {"train_loss": -43.41288757324219, "global_step": 310900, "epoch": 2569} {"train_loss": -42.9244499206543, "global_step": 310901, "epoch": 2569} {"train_loss": -43.70133590698242, "global_step": 310902, "epoch": 2569} {"train_loss": -43.86234664916992, "global_step": 310903, "epoch": 2569} {"train_loss": -43.93634796142578, "global_step": 310904, "epoch": 2569} {"train_loss": -43.80294418334961, "global_step": 310905, "epoch": 2569} {"train_loss": -43.94358444213867, "global_step": 310906, "epoch": 2569} {"train_loss": -43.721920013427734, "global_step": 310907, "epoch": 2569} {"train_loss": -44.0800666809082, "global_step": 310908, "epoch": 2569} {"train_loss": -43.42022705078125, "global_step": 310909, "epoch": 2569} {"train_loss": -41.78313064575195, "global_step": 310910, "epoch": 2569} {"train_loss": -42.75647735595703, "global_step": 310911, "epoch": 2569} {"train_loss": -39.57414627075195, "global_step": 310912, "epoch": 2569} {"train_loss": -43.53290557861328, "global_step": 310913, "epoch": 2569} {"train_loss": -43.39994430541992, "global_step": 310914, "epoch": 2569} {"train_loss": -44.21009063720703, "global_step": 310915, "epoch": 2569} {"train_loss": -43.805355072021484, "global_step": 310916, "epoch": 2569} {"train_loss": -30.79364585876465, "global_step": 310917, "epoch": 2569} {"train_loss": -42.805389404296875, "global_step": 310918, "epoch": 2569} {"train_loss": -41.648311614990234, "global_step": 310919, "epoch": 2569} {"train_loss": -43.30689239501953, "global_step": 310920, "epoch": 2569} {"train_loss": -42.48842239379883, "global_step": 310921, "epoch": 2569} {"train_loss": -43.210384368896484, "global_step": 310922, "epoch": 2569} {"train_loss": -41.71701431274414, "global_step": 310923, "epoch": 2569} {"train_loss": -42.17841720581055, "global_step": 310924, "epoch": 2569} {"train_loss": -40.01963424682617, "global_step": 310925, "epoch": 2569} {"train_loss": -42.3581657409668, "global_step": 310926, "epoch": 2569} {"train_loss": -42.84846115112305, "global_step": 310927, "epoch": 2569} {"train_loss": -41.11602783203125, "global_step": 310928, "epoch": 2569} {"train_loss": -42.972808837890625, "global_step": 310929, "epoch": 2569} {"train_loss": -35.875240325927734, "global_step": 310930, "epoch": 2569} {"train_loss": -42.57871627807617, "global_step": 310931, "epoch": 2569} {"train_loss": -41.132667541503906, "global_step": 310932, "epoch": 2569} {"train_loss": -41.089054107666016, "global_step": 310933, "epoch": 2569} {"train_loss": -42.076663970947266, "global_step": 310934, "epoch": 2569} {"train_loss": -42.2849006652832, "global_step": 310935, "epoch": 2569} {"train_loss": -41.06227493286133, "global_step": 310936, "epoch": 2569} {"train_loss": -42.61302185058594, "global_step": 310937, "epoch": 2569} {"train_loss": -41.22447967529297, "global_step": 310938, "epoch": 2569} {"train_loss": -42.9110221862793, "global_step": 310939, "epoch": 2569} {"train_loss": -35.360939025878906, "global_step": 310940, "epoch": 2569} {"train_loss": -41.04970932006836, "global_step": 310941, "epoch": 2569} {"train_loss": -39.914588928222656, "global_step": 310942, "epoch": 2569} {"train_loss": -40.32087326049805, "global_step": 310943, "epoch": 2569} {"train_loss": -40.17668914794922, "global_step": 310944, "epoch": 2569} {"train_loss": -42.0800666809082, "global_step": 310945, "epoch": 2569} {"train_loss": -42.750728607177734, "global_step": 310946, "epoch": 2569} {"train_loss": -43.1621208190918, "global_step": 310947, "epoch": 2569} {"train_loss": -42.486366271972656, "global_step": 310948, "epoch": 2569} {"train_loss": -42.86842727661133, "global_step": 310949, "epoch": 2569} {"train_loss": -35.6679801940918, "global_step": 310950, "epoch": 2569} {"train_loss": -43.03071212768555, "global_step": 310951, "epoch": 2569} {"train_loss": -40.428184509277344, "global_step": 310952, "epoch": 2569} {"train_loss": -42.08988571166992, "global_step": 310953, "epoch": 2569} {"train_loss": -40.636634826660156, "global_step": 310954, "epoch": 2569} {"train_loss": -43.12120819091797, "global_step": 310955, "epoch": 2569} {"train_loss": -38.81606674194336, "global_step": 310956, "epoch": 2569} {"train_loss": -40.784454345703125, "global_step": 310957, "epoch": 2569} {"train_loss": -41.66610336303711, "global_step": 310958, "epoch": 2569} {"train_loss": -42.32904815673828, "global_step": 310959, "epoch": 2569} {"train_loss": -40.49320983886719, "global_step": 310960, "epoch": 2569} {"train_loss": -42.14845657348633, "global_step": 310961, "epoch": 2569} {"train_loss": -41.741973876953125, "global_step": 310962, "epoch": 2569} {"train_loss": -41.940670013427734, "global_step": 310963, "epoch": 2569} {"train_loss": -40.79911422729492, "global_step": 310964, "epoch": 2569} {"train_loss": -42.2337646484375, "global_step": 310965, "epoch": 2569} {"train_loss": -40.71961212158203, "global_step": 310966, "epoch": 2569} {"train_loss": -42.25627136230469, "global_step": 310967, "epoch": 2569} {"train_loss": -40.01463317871094, "global_step": 310968, "epoch": 2569} {"train_loss": -41.80863787122994, "global_step": 310969, "epoch": 2569, "val_loss": 2778972.75} {"train_loss": -40.92985153198242, "global_step": 310970, "epoch": 2570} {"train_loss": -42.422367095947266, "global_step": 310971, "epoch": 2570} {"train_loss": -42.04865646362305, "global_step": 310972, "epoch": 2570} {"train_loss": -42.073150634765625, "global_step": 310973, "epoch": 2570} {"train_loss": -41.71769332885742, "global_step": 310974, "epoch": 2570} {"train_loss": -42.99348068237305, "global_step": 310975, "epoch": 2570} {"train_loss": -42.935752868652344, "global_step": 310976, "epoch": 2570} {"train_loss": -39.76795959472656, "global_step": 310977, "epoch": 2570} {"train_loss": -40.683807373046875, "global_step": 310978, "epoch": 2570} {"train_loss": -41.5162353515625, "global_step": 310979, "epoch": 2570} {"train_loss": -42.073524475097656, "global_step": 310980, "epoch": 2570} {"train_loss": -41.56001281738281, "global_step": 310981, "epoch": 2570} {"train_loss": -43.258460998535156, "global_step": 310982, "epoch": 2570} {"train_loss": -42.91558837890625, "global_step": 310983, "epoch": 2570} {"train_loss": -42.12612533569336, "global_step": 310984, "epoch": 2570} {"train_loss": -38.44092559814453, "global_step": 310985, "epoch": 2570} {"train_loss": -43.05576705932617, "global_step": 310986, "epoch": 2570} {"train_loss": -43.2557258605957, "global_step": 310987, "epoch": 2570} {"train_loss": -42.487674713134766, "global_step": 310988, "epoch": 2570} {"train_loss": -42.79265594482422, "global_step": 310989, "epoch": 2570} {"train_loss": -41.797237396240234, "global_step": 310990, "epoch": 2570} {"train_loss": -41.64773941040039, "global_step": 310991, "epoch": 2570} {"train_loss": -43.44651412963867, "global_step": 310992, "epoch": 2570} {"train_loss": -42.559322357177734, "global_step": 310993, "epoch": 2570} {"train_loss": -42.59108352661133, "global_step": 310994, "epoch": 2570} {"train_loss": -43.08903121948242, "global_step": 310995, "epoch": 2570} {"train_loss": -40.76331329345703, "global_step": 310996, "epoch": 2570} {"train_loss": -39.823760986328125, "global_step": 310997, "epoch": 2570} {"train_loss": -41.34403610229492, "global_step": 310998, "epoch": 2570} {"train_loss": -42.136817932128906, "global_step": 310999, "epoch": 2570} {"train_loss": -43.4262580871582, "global_step": 311000, "epoch": 2570} {"train_loss": -41.2905158996582, "global_step": 311001, "epoch": 2570} {"train_loss": -42.43171310424805, "global_step": 311002, "epoch": 2570} {"train_loss": -43.01798629760742, "global_step": 311003, "epoch": 2570} {"train_loss": -43.17904281616211, "global_step": 311004, "epoch": 2570} {"train_loss": -42.38499069213867, "global_step": 311005, "epoch": 2570} {"train_loss": -42.87229537963867, "global_step": 311006, "epoch": 2570} {"train_loss": -40.943016052246094, "global_step": 311007, "epoch": 2570} {"train_loss": -42.5189208984375, "global_step": 311008, "epoch": 2570} {"train_loss": -43.541595458984375, "global_step": 311009, "epoch": 2570} {"train_loss": -43.096832275390625, "global_step": 311010, "epoch": 2570} {"train_loss": -43.352081298828125, "global_step": 311011, "epoch": 2570} {"train_loss": -42.92974090576172, "global_step": 311012, "epoch": 2570} {"train_loss": -42.627166748046875, "global_step": 311013, "epoch": 2570} {"train_loss": -41.005615234375, "global_step": 311014, "epoch": 2570} {"train_loss": -41.71195983886719, "global_step": 311015, "epoch": 2570} {"train_loss": -43.376121520996094, "global_step": 311016, "epoch": 2570} {"train_loss": -43.100433349609375, "global_step": 311017, "epoch": 2570} {"train_loss": -43.044769287109375, "global_step": 311018, "epoch": 2570} {"train_loss": -42.712074279785156, "global_step": 311019, "epoch": 2570} {"train_loss": -42.22774887084961, "global_step": 311020, "epoch": 2570} {"train_loss": -42.746070861816406, "global_step": 311021, "epoch": 2570} {"train_loss": -41.648834228515625, "global_step": 311022, "epoch": 2570} {"train_loss": -42.5634651184082, "global_step": 311023, "epoch": 2570} {"train_loss": -43.26880645751953, "global_step": 311024, "epoch": 2570} {"train_loss": -42.69370651245117, "global_step": 311025, "epoch": 2570} {"train_loss": -43.45011520385742, "global_step": 311026, "epoch": 2570} {"train_loss": -42.073265075683594, "global_step": 311027, "epoch": 2570} {"train_loss": -40.381011962890625, "global_step": 311028, "epoch": 2570} {"train_loss": -43.193077087402344, "global_step": 311029, "epoch": 2570} {"train_loss": -40.90552520751953, "global_step": 311030, "epoch": 2570} {"train_loss": -42.44362258911133, "global_step": 311031, "epoch": 2570} {"train_loss": -43.31028366088867, "global_step": 311032, "epoch": 2570} {"train_loss": -43.02096939086914, "global_step": 311033, "epoch": 2570} {"train_loss": -41.95685577392578, "global_step": 311034, "epoch": 2570} {"train_loss": -42.5415153503418, "global_step": 311035, "epoch": 2570} {"train_loss": -43.30398178100586, "global_step": 311036, "epoch": 2570} {"train_loss": -43.6080436706543, "global_step": 311037, "epoch": 2570} {"train_loss": -43.60976028442383, "global_step": 311038, "epoch": 2570} {"train_loss": -43.44637680053711, "global_step": 311039, "epoch": 2570} {"train_loss": -43.49250411987305, "global_step": 311040, "epoch": 2570} {"train_loss": -42.2194938659668, "global_step": 311041, "epoch": 2570} {"train_loss": -43.56215286254883, "global_step": 311042, "epoch": 2570} {"train_loss": -42.5684928894043, "global_step": 311043, "epoch": 2570} {"train_loss": -43.06710433959961, "global_step": 311044, "epoch": 2570} {"train_loss": -43.54732894897461, "global_step": 311045, "epoch": 2570} {"train_loss": -43.5324592590332, "global_step": 311046, "epoch": 2570} {"train_loss": -43.851806640625, "global_step": 311047, "epoch": 2570} {"train_loss": -43.466304779052734, "global_step": 311048, "epoch": 2570} {"train_loss": -43.838539123535156, "global_step": 311049, "epoch": 2570} {"train_loss": -43.92476272583008, "global_step": 311050, "epoch": 2570} {"train_loss": -43.143123626708984, "global_step": 311051, "epoch": 2570} {"train_loss": -44.259727478027344, "global_step": 311052, "epoch": 2570} {"train_loss": -43.29298782348633, "global_step": 311053, "epoch": 2570} {"train_loss": -44.19426345825195, "global_step": 311054, "epoch": 2570} {"train_loss": -43.871063232421875, "global_step": 311055, "epoch": 2570} {"train_loss": -44.00324630737305, "global_step": 311056, "epoch": 2570} {"train_loss": -43.98365783691406, "global_step": 311057, "epoch": 2570} {"train_loss": -42.95262908935547, "global_step": 311058, "epoch": 2570} {"train_loss": -44.17654037475586, "global_step": 311059, "epoch": 2570} {"train_loss": -44.58754348754883, "global_step": 311060, "epoch": 2570} {"train_loss": -44.028072357177734, "global_step": 311061, "epoch": 2570} {"train_loss": -43.574371337890625, "global_step": 311062, "epoch": 2570} {"train_loss": -44.40314483642578, "global_step": 311063, "epoch": 2570} {"train_loss": -43.56901931762695, "global_step": 311064, "epoch": 2570} {"train_loss": -43.40678024291992, "global_step": 311065, "epoch": 2570} {"train_loss": -43.562164306640625, "global_step": 311066, "epoch": 2570} {"train_loss": -44.27396011352539, "global_step": 311067, "epoch": 2570} {"train_loss": -44.29245376586914, "global_step": 311068, "epoch": 2570} {"train_loss": -43.39145278930664, "global_step": 311069, "epoch": 2570} {"train_loss": -43.9575309753418, "global_step": 311070, "epoch": 2570} {"train_loss": -43.832759857177734, "global_step": 311071, "epoch": 2570} {"train_loss": -44.330841064453125, "global_step": 311072, "epoch": 2570} {"train_loss": -42.107757568359375, "global_step": 311073, "epoch": 2570} {"train_loss": -44.26323318481445, "global_step": 311074, "epoch": 2570} {"train_loss": -43.58844757080078, "global_step": 311075, "epoch": 2570} {"train_loss": -41.61554718017578, "global_step": 311076, "epoch": 2570} {"train_loss": -43.90608596801758, "global_step": 311077, "epoch": 2570} {"train_loss": -43.573543548583984, "global_step": 311078, "epoch": 2570} {"train_loss": -44.36255645751953, "global_step": 311079, "epoch": 2570} {"train_loss": -43.42530059814453, "global_step": 311080, "epoch": 2570} {"train_loss": -42.40189743041992, "global_step": 311081, "epoch": 2570} {"train_loss": -42.47352981567383, "global_step": 311082, "epoch": 2570} {"train_loss": -41.105438232421875, "global_step": 311083, "epoch": 2570} {"train_loss": -42.631099700927734, "global_step": 311084, "epoch": 2570} {"train_loss": -44.1401481628418, "global_step": 311085, "epoch": 2570} {"train_loss": -42.72465133666992, "global_step": 311086, "epoch": 2570} {"train_loss": -41.62786865234375, "global_step": 311087, "epoch": 2570} {"train_loss": -38.77029800415039, "global_step": 311088, "epoch": 2570} {"train_loss": -39.43088912963867, "global_step": 311089, "epoch": 2570} {"train_loss": -42.71665267313807, "global_step": 311090, "epoch": 2570, "val_loss": 2756920.75} {"train_loss": -42.16437530517578, "global_step": 311091, "epoch": 2571} {"train_loss": -42.76189041137695, "global_step": 311092, "epoch": 2571} {"train_loss": -41.56970977783203, "global_step": 311093, "epoch": 2571} {"train_loss": -41.29658889770508, "global_step": 311094, "epoch": 2571} {"train_loss": -43.31736373901367, "global_step": 311095, "epoch": 2571} {"train_loss": -43.047298431396484, "global_step": 311096, "epoch": 2571} {"train_loss": -41.7150993347168, "global_step": 311097, "epoch": 2571} {"train_loss": -43.50444412231445, "global_step": 311098, "epoch": 2571} {"train_loss": -42.73312759399414, "global_step": 311099, "epoch": 2571} {"train_loss": -40.640193939208984, "global_step": 311100, "epoch": 2571} {"train_loss": -43.3509407043457, "global_step": 311101, "epoch": 2571} {"train_loss": -43.402950286865234, "global_step": 311102, "epoch": 2571} {"train_loss": -41.88132858276367, "global_step": 311103, "epoch": 2571} {"train_loss": -37.18787384033203, "global_step": 311104, "epoch": 2571} {"train_loss": -38.46564865112305, "global_step": 311105, "epoch": 2571} {"train_loss": -42.85285186767578, "global_step": 311106, "epoch": 2571} {"train_loss": -41.85306930541992, "global_step": 311107, "epoch": 2571} {"train_loss": -41.94282913208008, "global_step": 311108, "epoch": 2571} {"train_loss": -38.39478302001953, "global_step": 311109, "epoch": 2571} {"train_loss": -40.80527877807617, "global_step": 311110, "epoch": 2571} {"train_loss": -43.17668533325195, "global_step": 311111, "epoch": 2571} {"train_loss": -40.93963623046875, "global_step": 311112, "epoch": 2571} {"train_loss": -42.399131774902344, "global_step": 311113, "epoch": 2571} {"train_loss": -42.31045150756836, "global_step": 311114, "epoch": 2571} {"train_loss": -42.04793167114258, "global_step": 311115, "epoch": 2571} {"train_loss": -42.70590591430664, "global_step": 311116, "epoch": 2571} {"train_loss": -41.34865951538086, "global_step": 311117, "epoch": 2571} {"train_loss": -39.97359085083008, "global_step": 311118, "epoch": 2571} {"train_loss": -40.84513473510742, "global_step": 311119, "epoch": 2571} {"train_loss": -42.76462936401367, "global_step": 311120, "epoch": 2571} {"train_loss": -39.41733932495117, "global_step": 311121, "epoch": 2571} {"train_loss": -43.104164123535156, "global_step": 311122, "epoch": 2571} {"train_loss": -38.83563995361328, "global_step": 311123, "epoch": 2571} {"train_loss": -38.84225082397461, "global_step": 311124, "epoch": 2571} {"train_loss": -40.594295501708984, "global_step": 311125, "epoch": 2571} {"train_loss": -41.94916534423828, "global_step": 311126, "epoch": 2571} {"train_loss": -41.7152214050293, "global_step": 311127, "epoch": 2571} {"train_loss": -42.55019760131836, "global_step": 311128, "epoch": 2571} {"train_loss": -39.51377487182617, "global_step": 311129, "epoch": 2571} {"train_loss": -39.80035400390625, "global_step": 311130, "epoch": 2571} {"train_loss": -41.55836868286133, "global_step": 311131, "epoch": 2571} {"train_loss": -41.70412063598633, "global_step": 311132, "epoch": 2571} {"train_loss": -41.260616302490234, "global_step": 311133, "epoch": 2571} {"train_loss": -42.433135986328125, "global_step": 311134, "epoch": 2571} {"train_loss": -42.25659942626953, "global_step": 311135, "epoch": 2571} {"train_loss": -42.44161605834961, "global_step": 311136, "epoch": 2571} {"train_loss": -43.41599655151367, "global_step": 311137, "epoch": 2571} {"train_loss": -39.56473922729492, "global_step": 311138, "epoch": 2571} {"train_loss": -42.37348937988281, "global_step": 311139, "epoch": 2571} {"train_loss": -42.42850112915039, "global_step": 311140, "epoch": 2571} {"train_loss": -41.838233947753906, "global_step": 311141, "epoch": 2571} {"train_loss": -40.37683868408203, "global_step": 311142, "epoch": 2571} {"train_loss": -41.70009231567383, "global_step": 311143, "epoch": 2571} {"train_loss": -41.1928825378418, "global_step": 311144, "epoch": 2571} {"train_loss": -36.88584899902344, "global_step": 311145, "epoch": 2571} {"train_loss": -40.77421188354492, "global_step": 311146, "epoch": 2571} {"train_loss": -41.483642578125, "global_step": 311147, "epoch": 2571} {"train_loss": -42.3055305480957, "global_step": 311148, "epoch": 2571} {"train_loss": -42.410221099853516, "global_step": 311149, "epoch": 2571} {"train_loss": -42.14000701904297, "global_step": 311150, "epoch": 2571} {"train_loss": -42.1782112121582, "global_step": 311151, "epoch": 2571} {"train_loss": -42.795982360839844, "global_step": 311152, "epoch": 2571} {"train_loss": -41.4559440612793, "global_step": 311153, "epoch": 2571} {"train_loss": -42.22663879394531, "global_step": 311154, "epoch": 2571} {"train_loss": -43.51782989501953, "global_step": 311155, "epoch": 2571} {"train_loss": -42.96292495727539, "global_step": 311156, "epoch": 2571} {"train_loss": -43.23329544067383, "global_step": 311157, "epoch": 2571} {"train_loss": -42.90127182006836, "global_step": 311158, "epoch": 2571} {"train_loss": -42.25529861450195, "global_step": 311159, "epoch": 2571} {"train_loss": -43.687583923339844, "global_step": 311160, "epoch": 2571} {"train_loss": -42.96623229980469, "global_step": 311161, "epoch": 2571} {"train_loss": -43.43587112426758, "global_step": 311162, "epoch": 2571} {"train_loss": -42.494449615478516, "global_step": 311163, "epoch": 2571} {"train_loss": -43.069210052490234, "global_step": 311164, "epoch": 2571} {"train_loss": -43.09882354736328, "global_step": 311165, "epoch": 2571} {"train_loss": -43.83168411254883, "global_step": 311166, "epoch": 2571} {"train_loss": -41.43085479736328, "global_step": 311167, "epoch": 2571} {"train_loss": -43.26322937011719, "global_step": 311168, "epoch": 2571} {"train_loss": -41.68684005737305, "global_step": 311169, "epoch": 2571} {"train_loss": -41.32204055786133, "global_step": 311170, "epoch": 2571} {"train_loss": -42.948974609375, "global_step": 311171, "epoch": 2571} {"train_loss": -42.66793441772461, "global_step": 311172, "epoch": 2571} {"train_loss": -43.28376007080078, "global_step": 311173, "epoch": 2571} {"train_loss": -43.66231155395508, "global_step": 311174, "epoch": 2571} {"train_loss": -43.088314056396484, "global_step": 311175, "epoch": 2571} {"train_loss": -43.83260726928711, "global_step": 311176, "epoch": 2571} {"train_loss": -43.62648391723633, "global_step": 311177, "epoch": 2571} {"train_loss": -43.09456253051758, "global_step": 311178, "epoch": 2571} {"train_loss": -43.44070053100586, "global_step": 311179, "epoch": 2571} {"train_loss": -40.9156608581543, "global_step": 311180, "epoch": 2571} {"train_loss": -41.90092086791992, "global_step": 311181, "epoch": 2571} {"train_loss": -43.35112380981445, "global_step": 311182, "epoch": 2571} {"train_loss": -43.8971061706543, "global_step": 311183, "epoch": 2571} {"train_loss": -41.312740325927734, "global_step": 311184, "epoch": 2571} {"train_loss": -43.33844757080078, "global_step": 311185, "epoch": 2571} {"train_loss": -43.492637634277344, "global_step": 311186, "epoch": 2571} {"train_loss": -43.6567497253418, "global_step": 311187, "epoch": 2571} {"train_loss": -43.513607025146484, "global_step": 311188, "epoch": 2571} {"train_loss": -42.90825653076172, "global_step": 311189, "epoch": 2571} {"train_loss": -43.70835494995117, "global_step": 311190, "epoch": 2571} {"train_loss": -43.56435012817383, "global_step": 311191, "epoch": 2571} {"train_loss": -41.743831634521484, "global_step": 311192, "epoch": 2571} {"train_loss": -42.996795654296875, "global_step": 311193, "epoch": 2571} {"train_loss": -42.675086975097656, "global_step": 311194, "epoch": 2571} {"train_loss": -43.05817413330078, "global_step": 311195, "epoch": 2571} {"train_loss": -43.551490783691406, "global_step": 311196, "epoch": 2571} {"train_loss": -43.62437057495117, "global_step": 311197, "epoch": 2571} {"train_loss": -43.997623443603516, "global_step": 311198, "epoch": 2571} {"train_loss": -43.078712463378906, "global_step": 311199, "epoch": 2571} {"train_loss": -42.15522384643555, "global_step": 311200, "epoch": 2571} {"train_loss": -42.50139236450195, "global_step": 311201, "epoch": 2571} {"train_loss": -43.837406158447266, "global_step": 311202, "epoch": 2571} {"train_loss": -44.32160186767578, "global_step": 311203, "epoch": 2571} {"train_loss": -43.0785026550293, "global_step": 311204, "epoch": 2571} {"train_loss": -40.05605697631836, "global_step": 311205, "epoch": 2571} {"train_loss": -43.61314010620117, "global_step": 311206, "epoch": 2571} {"train_loss": -43.75988006591797, "global_step": 311207, "epoch": 2571} {"train_loss": -42.8067626953125, "global_step": 311208, "epoch": 2571} {"train_loss": -41.6065559387207, "global_step": 311209, "epoch": 2571} {"train_loss": -43.498390197753906, "global_step": 311210, "epoch": 2571} {"train_loss": -42.200776628226286, "global_step": 311211, "epoch": 2571, "val_loss": 2848943.25} {"train_loss": -41.21821594238281, "global_step": 311212, "epoch": 2572} {"train_loss": -42.056129455566406, "global_step": 311213, "epoch": 2572} {"train_loss": -43.770565032958984, "global_step": 311214, "epoch": 2572} {"train_loss": -41.55868148803711, "global_step": 311215, "epoch": 2572} {"train_loss": -40.21503448486328, "global_step": 311216, "epoch": 2572} {"train_loss": -41.68246078491211, "global_step": 311217, "epoch": 2572} {"train_loss": -42.23086166381836, "global_step": 311218, "epoch": 2572} {"train_loss": -41.21092224121094, "global_step": 311219, "epoch": 2572} {"train_loss": -39.7822380065918, "global_step": 311220, "epoch": 2572} {"train_loss": -42.71118927001953, "global_step": 311221, "epoch": 2572} {"train_loss": -40.90009307861328, "global_step": 311222, "epoch": 2572} {"train_loss": -41.54319381713867, "global_step": 311223, "epoch": 2572} {"train_loss": -42.00884246826172, "global_step": 311224, "epoch": 2572} {"train_loss": -42.46377182006836, "global_step": 311225, "epoch": 2572} {"train_loss": -41.48483657836914, "global_step": 311226, "epoch": 2572} {"train_loss": -43.13609313964844, "global_step": 311227, "epoch": 2572} {"train_loss": -40.411460876464844, "global_step": 311228, "epoch": 2572} {"train_loss": -41.679683685302734, "global_step": 311229, "epoch": 2572} {"train_loss": -43.153350830078125, "global_step": 311230, "epoch": 2572} {"train_loss": -41.514373779296875, "global_step": 311231, "epoch": 2572} {"train_loss": -41.8504753112793, "global_step": 311232, "epoch": 2572} {"train_loss": -43.15650177001953, "global_step": 311233, "epoch": 2572} {"train_loss": -42.6913948059082, "global_step": 311234, "epoch": 2572} {"train_loss": -41.968780517578125, "global_step": 311235, "epoch": 2572} {"train_loss": -42.515846252441406, "global_step": 311236, "epoch": 2572} {"train_loss": -41.99937438964844, "global_step": 311237, "epoch": 2572} {"train_loss": -41.37147521972656, "global_step": 311238, "epoch": 2572} {"train_loss": -41.69942855834961, "global_step": 311239, "epoch": 2572} {"train_loss": -41.48350143432617, "global_step": 311240, "epoch": 2572} {"train_loss": -42.590362548828125, "global_step": 311241, "epoch": 2572} {"train_loss": -42.808963775634766, "global_step": 311242, "epoch": 2572} {"train_loss": -42.66372299194336, "global_step": 311243, "epoch": 2572} {"train_loss": -43.34129333496094, "global_step": 311244, "epoch": 2572} {"train_loss": -41.432350158691406, "global_step": 311245, "epoch": 2572} {"train_loss": -42.2799186706543, "global_step": 311246, "epoch": 2572} {"train_loss": -41.05245590209961, "global_step": 311247, "epoch": 2572} {"train_loss": -40.76300811767578, "global_step": 311248, "epoch": 2572} {"train_loss": -41.28919219970703, "global_step": 311249, "epoch": 2572} {"train_loss": -40.85811233520508, "global_step": 311250, "epoch": 2572} {"train_loss": -41.30392074584961, "global_step": 311251, "epoch": 2572} {"train_loss": -40.70008850097656, "global_step": 311252, "epoch": 2572} {"train_loss": -41.89863967895508, "global_step": 311253, "epoch": 2572} {"train_loss": -42.244911193847656, "global_step": 311254, "epoch": 2572} {"train_loss": -41.677093505859375, "global_step": 311255, "epoch": 2572} {"train_loss": -42.13892364501953, "global_step": 311256, "epoch": 2572} {"train_loss": -42.835567474365234, "global_step": 311257, "epoch": 2572} {"train_loss": -41.61829376220703, "global_step": 311258, "epoch": 2572} {"train_loss": -43.0223274230957, "global_step": 311259, "epoch": 2572} {"train_loss": -42.507774353027344, "global_step": 311260, "epoch": 2572} {"train_loss": -43.236305236816406, "global_step": 311261, "epoch": 2572} {"train_loss": -42.63898468017578, "global_step": 311262, "epoch": 2572} {"train_loss": -43.21199417114258, "global_step": 311263, "epoch": 2572} {"train_loss": -42.89141845703125, "global_step": 311264, "epoch": 2572} {"train_loss": -43.68926239013672, "global_step": 311265, "epoch": 2572} {"train_loss": -42.934566497802734, "global_step": 311266, "epoch": 2572} {"train_loss": -43.196170806884766, "global_step": 311267, "epoch": 2572} {"train_loss": -42.143646240234375, "global_step": 311268, "epoch": 2572} {"train_loss": -42.70138931274414, "global_step": 311269, "epoch": 2572} {"train_loss": -43.80843734741211, "global_step": 311270, "epoch": 2572} {"train_loss": -43.64923858642578, "global_step": 311271, "epoch": 2572} {"train_loss": -43.19183349609375, "global_step": 311272, "epoch": 2572} {"train_loss": -42.573974609375, "global_step": 311273, "epoch": 2572} {"train_loss": -43.776248931884766, "global_step": 311274, "epoch": 2572} {"train_loss": -43.45773696899414, "global_step": 311275, "epoch": 2572} {"train_loss": -43.728736877441406, "global_step": 311276, "epoch": 2572} {"train_loss": -43.514564514160156, "global_step": 311277, "epoch": 2572} {"train_loss": -42.231754302978516, "global_step": 311278, "epoch": 2572} {"train_loss": -43.95719528198242, "global_step": 311279, "epoch": 2572} {"train_loss": -43.99985885620117, "global_step": 311280, "epoch": 2572} {"train_loss": -43.7601432800293, "global_step": 311281, "epoch": 2572} {"train_loss": -43.85091781616211, "global_step": 311282, "epoch": 2572} {"train_loss": -43.36896896362305, "global_step": 311283, "epoch": 2572} {"train_loss": -43.79105758666992, "global_step": 311284, "epoch": 2572} {"train_loss": -42.99306869506836, "global_step": 311285, "epoch": 2572} {"train_loss": -43.26544952392578, "global_step": 311286, "epoch": 2572} {"train_loss": -43.02386474609375, "global_step": 311287, "epoch": 2572} {"train_loss": -42.88582992553711, "global_step": 311288, "epoch": 2572} {"train_loss": -43.57347869873047, "global_step": 311289, "epoch": 2572} {"train_loss": -42.56223678588867, "global_step": 311290, "epoch": 2572} {"train_loss": -44.21315002441406, "global_step": 311291, "epoch": 2572} {"train_loss": -43.53434753417969, "global_step": 311292, "epoch": 2572} {"train_loss": -43.238956451416016, "global_step": 311293, "epoch": 2572} {"train_loss": -42.91536331176758, "global_step": 311294, "epoch": 2572} {"train_loss": -43.43706130981445, "global_step": 311295, "epoch": 2572} {"train_loss": -43.27014923095703, "global_step": 311296, "epoch": 2572} {"train_loss": -43.64765548706055, "global_step": 311297, "epoch": 2572} {"train_loss": -43.25992965698242, "global_step": 311298, "epoch": 2572} {"train_loss": -42.770835876464844, "global_step": 311299, "epoch": 2572} {"train_loss": -43.80216979980469, "global_step": 311300, "epoch": 2572} {"train_loss": -44.076263427734375, "global_step": 311301, "epoch": 2572} {"train_loss": -43.41490173339844, "global_step": 311302, "epoch": 2572} {"train_loss": -43.98469924926758, "global_step": 311303, "epoch": 2572} {"train_loss": -43.71321105957031, "global_step": 311304, "epoch": 2572} {"train_loss": -43.1216926574707, "global_step": 311305, "epoch": 2572} {"train_loss": -43.19620895385742, "global_step": 311306, "epoch": 2572} {"train_loss": -43.29304885864258, "global_step": 311307, "epoch": 2572} {"train_loss": -42.2916374206543, "global_step": 311308, "epoch": 2572} {"train_loss": -43.77528762817383, "global_step": 311309, "epoch": 2572} {"train_loss": -44.028419494628906, "global_step": 311310, "epoch": 2572} {"train_loss": -44.50667190551758, "global_step": 311311, "epoch": 2572} {"train_loss": -43.95269775390625, "global_step": 311312, "epoch": 2572} {"train_loss": -43.81764602661133, "global_step": 311313, "epoch": 2572} {"train_loss": -43.624900817871094, "global_step": 311314, "epoch": 2572} {"train_loss": -43.0290412902832, "global_step": 311315, "epoch": 2572} {"train_loss": -43.075042724609375, "global_step": 311316, "epoch": 2572} {"train_loss": -44.21257019042969, "global_step": 311317, "epoch": 2572} {"train_loss": -43.60688781738281, "global_step": 311318, "epoch": 2572} {"train_loss": -43.96906661987305, "global_step": 311319, "epoch": 2572} {"train_loss": -43.703041076660156, "global_step": 311320, "epoch": 2572} {"train_loss": -43.659912109375, "global_step": 311321, "epoch": 2572} {"train_loss": -44.043182373046875, "global_step": 311322, "epoch": 2572} {"train_loss": -43.671932220458984, "global_step": 311323, "epoch": 2572} {"train_loss": -44.04337692260742, "global_step": 311324, "epoch": 2572} {"train_loss": -42.613258361816406, "global_step": 311325, "epoch": 2572} {"train_loss": -43.667274475097656, "global_step": 311326, "epoch": 2572} {"train_loss": -43.28623962402344, "global_step": 311327, "epoch": 2572} {"train_loss": -44.21603012084961, "global_step": 311328, "epoch": 2572} {"train_loss": -43.66053009033203, "global_step": 311329, "epoch": 2572} {"train_loss": -44.051429748535156, "global_step": 311330, "epoch": 2572} {"train_loss": -42.38466262817383, "global_step": 311331, "epoch": 2572} {"train_loss": -42.81084915035027, "global_step": 311332, "epoch": 2572, "val_loss": 2834284.25} {"train_loss": -43.370819091796875, "global_step": 311333, "epoch": 2573} {"train_loss": -42.161834716796875, "global_step": 311334, "epoch": 2573} {"train_loss": -40.62517166137695, "global_step": 311335, "epoch": 2573} {"train_loss": -44.0605583190918, "global_step": 311336, "epoch": 2573} {"train_loss": -43.94673538208008, "global_step": 311337, "epoch": 2573} {"train_loss": -44.2108039855957, "global_step": 311338, "epoch": 2573} {"train_loss": -43.4030647277832, "global_step": 311339, "epoch": 2573} {"train_loss": -43.014984130859375, "global_step": 311340, "epoch": 2573} {"train_loss": -42.038265228271484, "global_step": 311341, "epoch": 2573} {"train_loss": -43.07685470581055, "global_step": 311342, "epoch": 2573} {"train_loss": -44.191932678222656, "global_step": 311343, "epoch": 2573} {"train_loss": -42.744140625, "global_step": 311344, "epoch": 2573} {"train_loss": -43.14870834350586, "global_step": 311345, "epoch": 2573} {"train_loss": -36.00875473022461, "global_step": 311346, "epoch": 2573} {"train_loss": -43.16474533081055, "global_step": 311347, "epoch": 2573} {"train_loss": -44.00162124633789, "global_step": 311348, "epoch": 2573} {"train_loss": -42.1932373046875, "global_step": 311349, "epoch": 2573} {"train_loss": -41.78448486328125, "global_step": 311350, "epoch": 2573} {"train_loss": -42.13465118408203, "global_step": 311351, "epoch": 2573} {"train_loss": -42.50962448120117, "global_step": 311352, "epoch": 2573} {"train_loss": -42.61259078979492, "global_step": 311353, "epoch": 2573} {"train_loss": -43.4987678527832, "global_step": 311354, "epoch": 2573} {"train_loss": -42.94907760620117, "global_step": 311355, "epoch": 2573} {"train_loss": -43.88142013549805, "global_step": 311356, "epoch": 2573} {"train_loss": -42.70929718017578, "global_step": 311357, "epoch": 2573} {"train_loss": 14.208813667297363, "global_step": 311358, "epoch": 2573} {"train_loss": -40.52421951293945, "global_step": 311359, "epoch": 2573} {"train_loss": -41.66534423828125, "global_step": 311360, "epoch": 2573} {"train_loss": -39.15261459350586, "global_step": 311361, "epoch": 2573} {"train_loss": -41.14442825317383, "global_step": 311362, "epoch": 2573} {"train_loss": -39.72381591796875, "global_step": 311363, "epoch": 2573} {"train_loss": -40.526851654052734, "global_step": 311364, "epoch": 2573} {"train_loss": -41.38767623901367, "global_step": 311365, "epoch": 2573} {"train_loss": -39.774330139160156, "global_step": 311366, "epoch": 2573} {"train_loss": -34.95962142944336, "global_step": 311367, "epoch": 2573} {"train_loss": -39.79799270629883, "global_step": 311368, "epoch": 2573} {"train_loss": -31.773483276367188, "global_step": 311369, "epoch": 2573} {"train_loss": -39.26542282104492, "global_step": 311370, "epoch": 2573} {"train_loss": -40.617488861083984, "global_step": 311371, "epoch": 2573} {"train_loss": -37.78872299194336, "global_step": 311372, "epoch": 2573} {"train_loss": -23.8164005279541, "global_step": 311373, "epoch": 2573} {"train_loss": -39.313629150390625, "global_step": 311374, "epoch": 2573} {"train_loss": -41.06620407104492, "global_step": 311375, "epoch": 2573} {"train_loss": -39.23443603515625, "global_step": 311376, "epoch": 2573} {"train_loss": -41.225704193115234, "global_step": 311377, "epoch": 2573} {"train_loss": -41.425331115722656, "global_step": 311378, "epoch": 2573} {"train_loss": -28.207921981811523, "global_step": 311379, "epoch": 2573} {"train_loss": -41.182430267333984, "global_step": 311380, "epoch": 2573} {"train_loss": -36.08401107788086, "global_step": 311381, "epoch": 2573} {"train_loss": -39.158287048339844, "global_step": 311382, "epoch": 2573} {"train_loss": -40.8066520690918, "global_step": 311383, "epoch": 2573} {"train_loss": -38.76532745361328, "global_step": 311384, "epoch": 2573} {"train_loss": -40.07666015625, "global_step": 311385, "epoch": 2573} {"train_loss": -39.54330062866211, "global_step": 311386, "epoch": 2573} {"train_loss": -39.999019622802734, "global_step": 311387, "epoch": 2573} {"train_loss": -34.86983871459961, "global_step": 311388, "epoch": 2573} {"train_loss": -37.90219497680664, "global_step": 311389, "epoch": 2573} {"train_loss": -39.20388412475586, "global_step": 311390, "epoch": 2573} {"train_loss": -38.266876220703125, "global_step": 311391, "epoch": 2573} {"train_loss": -41.280941009521484, "global_step": 311392, "epoch": 2573} {"train_loss": -41.92216491699219, "global_step": 311393, "epoch": 2573} {"train_loss": -41.29502487182617, "global_step": 311394, "epoch": 2573} {"train_loss": -40.31232452392578, "global_step": 311395, "epoch": 2573} {"train_loss": -42.03981018066406, "global_step": 311396, "epoch": 2573} {"train_loss": -41.87630844116211, "global_step": 311397, "epoch": 2573} {"train_loss": -40.69853591918945, "global_step": 311398, "epoch": 2573} {"train_loss": -41.62008285522461, "global_step": 311399, "epoch": 2573} {"train_loss": -40.97355270385742, "global_step": 311400, "epoch": 2573} {"train_loss": -41.814979553222656, "global_step": 311401, "epoch": 2573} {"train_loss": -41.73468017578125, "global_step": 311402, "epoch": 2573} {"train_loss": -42.25398254394531, "global_step": 311403, "epoch": 2573} {"train_loss": -42.013240814208984, "global_step": 311404, "epoch": 2573} {"train_loss": -42.24980163574219, "global_step": 311405, "epoch": 2573} {"train_loss": -42.04621505737305, "global_step": 311406, "epoch": 2573} {"train_loss": -41.27886962890625, "global_step": 311407, "epoch": 2573} {"train_loss": -41.31340408325195, "global_step": 311408, "epoch": 2573} {"train_loss": -41.72758102416992, "global_step": 311409, "epoch": 2573} {"train_loss": -40.854225158691406, "global_step": 311410, "epoch": 2573} {"train_loss": -42.13014602661133, "global_step": 311411, "epoch": 2573} {"train_loss": -42.355712890625, "global_step": 311412, "epoch": 2573} {"train_loss": -42.486175537109375, "global_step": 311413, "epoch": 2573} {"train_loss": -42.15327072143555, "global_step": 311414, "epoch": 2573} {"train_loss": -42.48934555053711, "global_step": 311415, "epoch": 2573} {"train_loss": -41.535770416259766, "global_step": 311416, "epoch": 2573} {"train_loss": -42.678409576416016, "global_step": 311417, "epoch": 2573} {"train_loss": -42.35224151611328, "global_step": 311418, "epoch": 2573} {"train_loss": -42.68539047241211, "global_step": 311419, "epoch": 2573} {"train_loss": -42.75201416015625, "global_step": 311420, "epoch": 2573} {"train_loss": -42.8620719909668, "global_step": 311421, "epoch": 2573} {"train_loss": -41.862266540527344, "global_step": 311422, "epoch": 2573} {"train_loss": -41.55141830444336, "global_step": 311423, "epoch": 2573} {"train_loss": -42.8852424621582, "global_step": 311424, "epoch": 2573} {"train_loss": -43.06352233886719, "global_step": 311425, "epoch": 2573} {"train_loss": -42.19354248046875, "global_step": 311426, "epoch": 2573} {"train_loss": -42.95760726928711, "global_step": 311427, "epoch": 2573} {"train_loss": -43.005672454833984, "global_step": 311428, "epoch": 2573} {"train_loss": -42.97256088256836, "global_step": 311429, "epoch": 2573} {"train_loss": -42.850364685058594, "global_step": 311430, "epoch": 2573} {"train_loss": -43.179359436035156, "global_step": 311431, "epoch": 2573} {"train_loss": -43.342140197753906, "global_step": 311432, "epoch": 2573} {"train_loss": -42.939208984375, "global_step": 311433, "epoch": 2573} {"train_loss": -42.090946197509766, "global_step": 311434, "epoch": 2573} {"train_loss": -43.117061614990234, "global_step": 311435, "epoch": 2573} {"train_loss": -43.59326934814453, "global_step": 311436, "epoch": 2573} {"train_loss": -42.076454162597656, "global_step": 311437, "epoch": 2573} {"train_loss": -43.479583740234375, "global_step": 311438, "epoch": 2573} {"train_loss": -43.63043212890625, "global_step": 311439, "epoch": 2573} {"train_loss": -43.43600082397461, "global_step": 311440, "epoch": 2573} {"train_loss": -42.55631637573242, "global_step": 311441, "epoch": 2573} {"train_loss": -42.75947189331055, "global_step": 311442, "epoch": 2573} {"train_loss": -43.46333312988281, "global_step": 311443, "epoch": 2573} {"train_loss": -43.78878402709961, "global_step": 311444, "epoch": 2573} {"train_loss": -43.30972671508789, "global_step": 311445, "epoch": 2573} {"train_loss": -43.172584533691406, "global_step": 311446, "epoch": 2573} {"train_loss": -43.21125030517578, "global_step": 311447, "epoch": 2573} {"train_loss": -42.27021408081055, "global_step": 311448, "epoch": 2573} {"train_loss": -43.525821685791016, "global_step": 311449, "epoch": 2573} {"train_loss": -43.06092071533203, "global_step": 311450, "epoch": 2573} {"train_loss": -43.49930953979492, "global_step": 311451, "epoch": 2573} {"train_loss": -43.558929443359375, "global_step": 311452, "epoch": 2573} {"train_loss": -40.932591107266006, "global_step": 311453, "epoch": 2573, "val_loss": 2633135.5} {"train_loss": -43.13666915893555, "global_step": 311454, "epoch": 2574} {"train_loss": -43.594539642333984, "global_step": 311455, "epoch": 2574} {"train_loss": -43.769325256347656, "global_step": 311456, "epoch": 2574} {"train_loss": -43.8369026184082, "global_step": 311457, "epoch": 2574} {"train_loss": -44.17097854614258, "global_step": 311458, "epoch": 2574} {"train_loss": -43.797969818115234, "global_step": 311459, "epoch": 2574} {"train_loss": -44.0920295715332, "global_step": 311460, "epoch": 2574} {"train_loss": -44.07221221923828, "global_step": 311461, "epoch": 2574} {"train_loss": -44.02264404296875, "global_step": 311462, "epoch": 2574} {"train_loss": -43.694766998291016, "global_step": 311463, "epoch": 2574} {"train_loss": -43.90171432495117, "global_step": 311464, "epoch": 2574} {"train_loss": -43.405391693115234, "global_step": 311465, "epoch": 2574} {"train_loss": -44.30521774291992, "global_step": 311466, "epoch": 2574} {"train_loss": -43.8061637878418, "global_step": 311467, "epoch": 2574} {"train_loss": -44.10129928588867, "global_step": 311468, "epoch": 2574} {"train_loss": -43.37039566040039, "global_step": 311469, "epoch": 2574} {"train_loss": -43.44387435913086, "global_step": 311470, "epoch": 2574} {"train_loss": -43.73101043701172, "global_step": 311471, "epoch": 2574} {"train_loss": -43.73435592651367, "global_step": 311472, "epoch": 2574} {"train_loss": -43.986473083496094, "global_step": 311473, "epoch": 2574} {"train_loss": -43.44788360595703, "global_step": 311474, "epoch": 2574} {"train_loss": -42.90089416503906, "global_step": 311475, "epoch": 2574} {"train_loss": -43.76203155517578, "global_step": 311476, "epoch": 2574} {"train_loss": -44.36288070678711, "global_step": 311477, "epoch": 2574} {"train_loss": -43.483463287353516, "global_step": 311478, "epoch": 2574} {"train_loss": -42.16556930541992, "global_step": 311479, "epoch": 2574} {"train_loss": -42.674434661865234, "global_step": 311480, "epoch": 2574} {"train_loss": -43.849647521972656, "global_step": 311481, "epoch": 2574} {"train_loss": -44.0871467590332, "global_step": 311482, "epoch": 2574} {"train_loss": -43.43305206298828, "global_step": 311483, "epoch": 2574} {"train_loss": -42.125057220458984, "global_step": 311484, "epoch": 2574} {"train_loss": -42.96464157104492, "global_step": 311485, "epoch": 2574} {"train_loss": -43.861881256103516, "global_step": 311486, "epoch": 2574} {"train_loss": -43.98850631713867, "global_step": 311487, "epoch": 2574} {"train_loss": -43.855560302734375, "global_step": 311488, "epoch": 2574} {"train_loss": -43.327327728271484, "global_step": 311489, "epoch": 2574} {"train_loss": -42.956695556640625, "global_step": 311490, "epoch": 2574} {"train_loss": -43.175716400146484, "global_step": 311491, "epoch": 2574} {"train_loss": -43.17123031616211, "global_step": 311492, "epoch": 2574} {"train_loss": -43.26955032348633, "global_step": 311493, "epoch": 2574} {"train_loss": -43.694801330566406, "global_step": 311494, "epoch": 2574} {"train_loss": -41.61750030517578, "global_step": 311495, "epoch": 2574} {"train_loss": -37.6806755065918, "global_step": 311496, "epoch": 2574} {"train_loss": -32.94035720825195, "global_step": 311497, "epoch": 2574} {"train_loss": -28.010961532592773, "global_step": 311498, "epoch": 2574} {"train_loss": -20.882055282592773, "global_step": 311499, "epoch": 2574} {"train_loss": -32.082862854003906, "global_step": 311500, "epoch": 2574} {"train_loss": -38.60407638549805, "global_step": 311501, "epoch": 2574} {"train_loss": -20.68507194519043, "global_step": 311502, "epoch": 2574} {"train_loss": -23.49510955810547, "global_step": 311503, "epoch": 2574} {"train_loss": -38.458370208740234, "global_step": 311504, "epoch": 2574} {"train_loss": -20.25265121459961, "global_step": 311505, "epoch": 2574} {"train_loss": -35.17331314086914, "global_step": 311506, "epoch": 2574} {"train_loss": -23.36212730407715, "global_step": 311507, "epoch": 2574} {"train_loss": -38.224605560302734, "global_step": 311508, "epoch": 2574} {"train_loss": -23.123172760009766, "global_step": 311509, "epoch": 2574} {"train_loss": -36.713111877441406, "global_step": 311510, "epoch": 2574} {"train_loss": -27.49232292175293, "global_step": 311511, "epoch": 2574} {"train_loss": -35.30290603637695, "global_step": 311512, "epoch": 2574} {"train_loss": -31.530780792236328, "global_step": 311513, "epoch": 2574} {"train_loss": -36.24660873413086, "global_step": 311514, "epoch": 2574} {"train_loss": -38.55876922607422, "global_step": 311515, "epoch": 2574} {"train_loss": -33.26986312866211, "global_step": 311516, "epoch": 2574} {"train_loss": -37.4403076171875, "global_step": 311517, "epoch": 2574} {"train_loss": -37.870933532714844, "global_step": 311518, "epoch": 2574} {"train_loss": -37.40177536010742, "global_step": 311519, "epoch": 2574} {"train_loss": -37.70758819580078, "global_step": 311520, "epoch": 2574} {"train_loss": -40.494625091552734, "global_step": 311521, "epoch": 2574} {"train_loss": -38.38047409057617, "global_step": 311522, "epoch": 2574} {"train_loss": -38.582069396972656, "global_step": 311523, "epoch": 2574} {"train_loss": -39.418983459472656, "global_step": 311524, "epoch": 2574} {"train_loss": -39.89656448364258, "global_step": 311525, "epoch": 2574} {"train_loss": -39.58061599731445, "global_step": 311526, "epoch": 2574} {"train_loss": -40.073360443115234, "global_step": 311527, "epoch": 2574} {"train_loss": -40.85200119018555, "global_step": 311528, "epoch": 2574} {"train_loss": -40.07478713989258, "global_step": 311529, "epoch": 2574} {"train_loss": -40.163204193115234, "global_step": 311530, "epoch": 2574} {"train_loss": -40.801998138427734, "global_step": 311531, "epoch": 2574} {"train_loss": -40.6906852722168, "global_step": 311532, "epoch": 2574} {"train_loss": -40.225521087646484, "global_step": 311533, "epoch": 2574} {"train_loss": -40.676090240478516, "global_step": 311534, "epoch": 2574} {"train_loss": -40.90450668334961, "global_step": 311535, "epoch": 2574} {"train_loss": -40.906463623046875, "global_step": 311536, "epoch": 2574} {"train_loss": -41.0877571105957, "global_step": 311537, "epoch": 2574} {"train_loss": -41.04341506958008, "global_step": 311538, "epoch": 2574} {"train_loss": -41.74208450317383, "global_step": 311539, "epoch": 2574} {"train_loss": -40.55375289916992, "global_step": 311540, "epoch": 2574} {"train_loss": -41.40705108642578, "global_step": 311541, "epoch": 2574} {"train_loss": -40.81105422973633, "global_step": 311542, "epoch": 2574} {"train_loss": -41.28931427001953, "global_step": 311543, "epoch": 2574} {"train_loss": -41.66353988647461, "global_step": 311544, "epoch": 2574} {"train_loss": -41.64744186401367, "global_step": 311545, "epoch": 2574} {"train_loss": -41.11153793334961, "global_step": 311546, "epoch": 2574} {"train_loss": -41.674922943115234, "global_step": 311547, "epoch": 2574} {"train_loss": -41.56538009643555, "global_step": 311548, "epoch": 2574} {"train_loss": -41.74544906616211, "global_step": 311549, "epoch": 2574} {"train_loss": -41.466461181640625, "global_step": 311550, "epoch": 2574} {"train_loss": -41.553829193115234, "global_step": 311551, "epoch": 2574} {"train_loss": -41.66868591308594, "global_step": 311552, "epoch": 2574} {"train_loss": -41.689178466796875, "global_step": 311553, "epoch": 2574} {"train_loss": -42.1452751159668, "global_step": 311554, "epoch": 2574} {"train_loss": -41.981658935546875, "global_step": 311555, "epoch": 2574} {"train_loss": -42.44343185424805, "global_step": 311556, "epoch": 2574} {"train_loss": -42.1678352355957, "global_step": 311557, "epoch": 2574} {"train_loss": -42.47330093383789, "global_step": 311558, "epoch": 2574} {"train_loss": -42.48491668701172, "global_step": 311559, "epoch": 2574} {"train_loss": -42.112972259521484, "global_step": 311560, "epoch": 2574} {"train_loss": -42.25857925415039, "global_step": 311561, "epoch": 2574} {"train_loss": -42.55282211303711, "global_step": 311562, "epoch": 2574} {"train_loss": -42.4018669128418, "global_step": 311563, "epoch": 2574} {"train_loss": -42.33488082885742, "global_step": 311564, "epoch": 2574} {"train_loss": -42.520599365234375, "global_step": 311565, "epoch": 2574} {"train_loss": -42.79279327392578, "global_step": 311566, "epoch": 2574} {"train_loss": -42.427879333496094, "global_step": 311567, "epoch": 2574} {"train_loss": -42.74300765991211, "global_step": 311568, "epoch": 2574} {"train_loss": -42.89645004272461, "global_step": 311569, "epoch": 2574} {"train_loss": -42.73371124267578, "global_step": 311570, "epoch": 2574} {"train_loss": -42.770668029785156, "global_step": 311571, "epoch": 2574} {"train_loss": -42.8380241394043, "global_step": 311572, "epoch": 2574} {"train_loss": -43.14540481567383, "global_step": 311573, "epoch": 2574} {"train_loss": -40.237064913284684, "global_step": 311574, "epoch": 2574, "val_loss": 2753622.75} {"train_loss": -43.03022003173828, "global_step": 311575, "epoch": 2575} {"train_loss": -42.61381912231445, "global_step": 311576, "epoch": 2575} {"train_loss": -43.17792510986328, "global_step": 311577, "epoch": 2575} {"train_loss": -42.8838005065918, "global_step": 311578, "epoch": 2575} {"train_loss": -43.38869857788086, "global_step": 311579, "epoch": 2575} {"train_loss": -43.30401611328125, "global_step": 311580, "epoch": 2575} {"train_loss": -43.373050689697266, "global_step": 311581, "epoch": 2575} {"train_loss": -42.98759078979492, "global_step": 311582, "epoch": 2575} {"train_loss": -43.433685302734375, "global_step": 311583, "epoch": 2575} {"train_loss": -43.28633499145508, "global_step": 311584, "epoch": 2575} {"train_loss": -42.95668411254883, "global_step": 311585, "epoch": 2575} {"train_loss": -43.930511474609375, "global_step": 311586, "epoch": 2575} {"train_loss": -43.20895004272461, "global_step": 311587, "epoch": 2575} {"train_loss": -43.265987396240234, "global_step": 311588, "epoch": 2575} {"train_loss": -43.83053207397461, "global_step": 311589, "epoch": 2575} {"train_loss": -43.63923263549805, "global_step": 311590, "epoch": 2575} {"train_loss": -43.496376037597656, "global_step": 311591, "epoch": 2575} {"train_loss": -43.241554260253906, "global_step": 311592, "epoch": 2575} {"train_loss": -44.02415466308594, "global_step": 311593, "epoch": 2575} {"train_loss": -43.54340744018555, "global_step": 311594, "epoch": 2575} {"train_loss": -43.745849609375, "global_step": 311595, "epoch": 2575} {"train_loss": -43.99674606323242, "global_step": 311596, "epoch": 2575} {"train_loss": -44.025508880615234, "global_step": 311597, "epoch": 2575} {"train_loss": -43.31289291381836, "global_step": 311598, "epoch": 2575} {"train_loss": -43.84843826293945, "global_step": 311599, "epoch": 2575} {"train_loss": -42.886085510253906, "global_step": 311600, "epoch": 2575} {"train_loss": -43.853858947753906, "global_step": 311601, "epoch": 2575} {"train_loss": -43.95733642578125, "global_step": 311602, "epoch": 2575} {"train_loss": -43.944496154785156, "global_step": 311603, "epoch": 2575} {"train_loss": -43.73504638671875, "global_step": 311604, "epoch": 2575} {"train_loss": -43.66357421875, "global_step": 311605, "epoch": 2575} {"train_loss": -44.14057922363281, "global_step": 311606, "epoch": 2575} {"train_loss": -44.16887664794922, "global_step": 311607, "epoch": 2575} {"train_loss": -43.212440490722656, "global_step": 311608, "epoch": 2575} {"train_loss": -43.87523651123047, "global_step": 311609, "epoch": 2575} {"train_loss": -43.853431701660156, "global_step": 311610, "epoch": 2575} {"train_loss": -44.338069915771484, "global_step": 311611, "epoch": 2575} {"train_loss": -43.61058044433594, "global_step": 311612, "epoch": 2575} {"train_loss": -44.01604080200195, "global_step": 311613, "epoch": 2575} {"train_loss": -44.299983978271484, "global_step": 311614, "epoch": 2575} {"train_loss": -43.81779479980469, "global_step": 311615, "epoch": 2575} {"train_loss": -44.344112396240234, "global_step": 311616, "epoch": 2575} {"train_loss": -44.3795051574707, "global_step": 311617, "epoch": 2575} {"train_loss": -43.382877349853516, "global_step": 311618, "epoch": 2575} {"train_loss": -44.1143684387207, "global_step": 311619, "epoch": 2575} {"train_loss": -43.986602783203125, "global_step": 311620, "epoch": 2575} {"train_loss": -44.369903564453125, "global_step": 311621, "epoch": 2575} {"train_loss": -43.86591339111328, "global_step": 311622, "epoch": 2575} {"train_loss": -44.410491943359375, "global_step": 311623, "epoch": 2575} {"train_loss": -44.25322341918945, "global_step": 311624, "epoch": 2575} {"train_loss": -43.87856674194336, "global_step": 311625, "epoch": 2575} {"train_loss": -44.03715133666992, "global_step": 311626, "epoch": 2575} {"train_loss": -44.456233978271484, "global_step": 311627, "epoch": 2575} {"train_loss": -44.20333480834961, "global_step": 311628, "epoch": 2575} {"train_loss": -44.19517135620117, "global_step": 311629, "epoch": 2575} {"train_loss": -43.90682601928711, "global_step": 311630, "epoch": 2575} {"train_loss": -43.896602630615234, "global_step": 311631, "epoch": 2575} {"train_loss": -44.2838134765625, "global_step": 311632, "epoch": 2575} {"train_loss": -43.9147834777832, "global_step": 311633, "epoch": 2575} {"train_loss": -43.781410217285156, "global_step": 311634, "epoch": 2575} {"train_loss": -43.94843292236328, "global_step": 311635, "epoch": 2575} {"train_loss": -43.9035530090332, "global_step": 311636, "epoch": 2575} {"train_loss": -44.58917236328125, "global_step": 311637, "epoch": 2575} {"train_loss": -44.398746490478516, "global_step": 311638, "epoch": 2575} {"train_loss": -44.11567306518555, "global_step": 311639, "epoch": 2575} {"train_loss": -44.518592834472656, "global_step": 311640, "epoch": 2575} {"train_loss": -44.440425872802734, "global_step": 311641, "epoch": 2575} {"train_loss": -44.17975997924805, "global_step": 311642, "epoch": 2575} {"train_loss": -44.18362808227539, "global_step": 311643, "epoch": 2575} {"train_loss": -44.163143157958984, "global_step": 311644, "epoch": 2575} {"train_loss": -42.989662170410156, "global_step": 311645, "epoch": 2575} {"train_loss": -43.856178283691406, "global_step": 311646, "epoch": 2575} {"train_loss": -44.64600372314453, "global_step": 311647, "epoch": 2575} {"train_loss": -44.31599044799805, "global_step": 311648, "epoch": 2575} {"train_loss": -44.579193115234375, "global_step": 311649, "epoch": 2575} {"train_loss": -44.7704963684082, "global_step": 311650, "epoch": 2575} {"train_loss": -43.97871017456055, "global_step": 311651, "epoch": 2575} {"train_loss": -44.50590133666992, "global_step": 311652, "epoch": 2575} {"train_loss": -44.55379867553711, "global_step": 311653, "epoch": 2575} {"train_loss": -44.0586051940918, "global_step": 311654, "epoch": 2575} {"train_loss": -44.336727142333984, "global_step": 311655, "epoch": 2575} {"train_loss": -42.53239822387695, "global_step": 311656, "epoch": 2575} {"train_loss": -43.735816955566406, "global_step": 311657, "epoch": 2575} {"train_loss": -43.8062858581543, "global_step": 311658, "epoch": 2575} {"train_loss": -43.525047302246094, "global_step": 311659, "epoch": 2575} {"train_loss": -42.50772476196289, "global_step": 311660, "epoch": 2575} {"train_loss": -41.021846771240234, "global_step": 311661, "epoch": 2575} {"train_loss": -40.88156509399414, "global_step": 311662, "epoch": 2575} {"train_loss": -40.407867431640625, "global_step": 311663, "epoch": 2575} {"train_loss": -38.3389778137207, "global_step": 311664, "epoch": 2575} {"train_loss": -36.72673416137695, "global_step": 311665, "epoch": 2575} {"train_loss": -33.535499572753906, "global_step": 311666, "epoch": 2575} {"train_loss": -36.306182861328125, "global_step": 311667, "epoch": 2575} {"train_loss": -38.26634979248047, "global_step": 311668, "epoch": 2575} {"train_loss": -38.8109016418457, "global_step": 311669, "epoch": 2575} {"train_loss": -42.05586242675781, "global_step": 311670, "epoch": 2575} {"train_loss": -40.07900619506836, "global_step": 311671, "epoch": 2575} {"train_loss": -40.33455276489258, "global_step": 311672, "epoch": 2575} {"train_loss": -40.99974060058594, "global_step": 311673, "epoch": 2575} {"train_loss": -43.01800537109375, "global_step": 311674, "epoch": 2575} {"train_loss": -40.57339096069336, "global_step": 311675, "epoch": 2575} {"train_loss": -41.55201721191406, "global_step": 311676, "epoch": 2575} {"train_loss": -41.354976654052734, "global_step": 311677, "epoch": 2575} {"train_loss": -40.674617767333984, "global_step": 311678, "epoch": 2575} {"train_loss": -39.45246505737305, "global_step": 311679, "epoch": 2575} {"train_loss": -42.56020736694336, "global_step": 311680, "epoch": 2575} {"train_loss": -39.96887969970703, "global_step": 311681, "epoch": 2575} {"train_loss": -42.71548080444336, "global_step": 311682, "epoch": 2575} {"train_loss": -41.14216995239258, "global_step": 311683, "epoch": 2575} {"train_loss": -42.61960983276367, "global_step": 311684, "epoch": 2575} {"train_loss": -41.893829345703125, "global_step": 311685, "epoch": 2575} {"train_loss": -42.143367767333984, "global_step": 311686, "epoch": 2575} {"train_loss": -41.42963790893555, "global_step": 311687, "epoch": 2575} {"train_loss": -42.82887649536133, "global_step": 311688, "epoch": 2575} {"train_loss": -41.11187744140625, "global_step": 311689, "epoch": 2575} {"train_loss": -43.399871826171875, "global_step": 311690, "epoch": 2575} {"train_loss": -42.653507232666016, "global_step": 311691, "epoch": 2575} {"train_loss": -42.545143127441406, "global_step": 311692, "epoch": 2575} {"train_loss": -42.846126556396484, "global_step": 311693, "epoch": 2575} {"train_loss": -42.49106979370117, "global_step": 311694, "epoch": 2575} {"train_loss": -42.960073234621156, "global_step": 311695, "epoch": 2575, "val_loss": 2732720.75} {"train_loss": -43.19197082519531, "global_step": 311696, "epoch": 2576} {"train_loss": -42.21343994140625, "global_step": 311697, "epoch": 2576} {"train_loss": -41.973567962646484, "global_step": 311698, "epoch": 2576} {"train_loss": -42.743408203125, "global_step": 311699, "epoch": 2576} {"train_loss": -41.76738357543945, "global_step": 311700, "epoch": 2576} {"train_loss": -42.18081283569336, "global_step": 311701, "epoch": 2576} {"train_loss": -42.21475601196289, "global_step": 311702, "epoch": 2576} {"train_loss": -43.25038528442383, "global_step": 311703, "epoch": 2576} {"train_loss": -42.460384368896484, "global_step": 311704, "epoch": 2576} {"train_loss": -42.145904541015625, "global_step": 311705, "epoch": 2576} {"train_loss": -42.864051818847656, "global_step": 311706, "epoch": 2576} {"train_loss": -42.59503936767578, "global_step": 311707, "epoch": 2576} {"train_loss": -42.62858963012695, "global_step": 311708, "epoch": 2576} {"train_loss": -42.59646224975586, "global_step": 311709, "epoch": 2576} {"train_loss": -43.451637268066406, "global_step": 311710, "epoch": 2576} {"train_loss": -43.009307861328125, "global_step": 311711, "epoch": 2576} {"train_loss": -43.27448654174805, "global_step": 311712, "epoch": 2576} {"train_loss": -43.30851364135742, "global_step": 311713, "epoch": 2576} {"train_loss": -42.578834533691406, "global_step": 311714, "epoch": 2576} {"train_loss": -43.326229095458984, "global_step": 311715, "epoch": 2576} {"train_loss": -42.977783203125, "global_step": 311716, "epoch": 2576} {"train_loss": -43.775611877441406, "global_step": 311717, "epoch": 2576} {"train_loss": -43.643043518066406, "global_step": 311718, "epoch": 2576} {"train_loss": -43.42726516723633, "global_step": 311719, "epoch": 2576} {"train_loss": -43.992027282714844, "global_step": 311720, "epoch": 2576} {"train_loss": -42.178466796875, "global_step": 311721, "epoch": 2576} {"train_loss": -43.76858139038086, "global_step": 311722, "epoch": 2576} {"train_loss": -43.556182861328125, "global_step": 311723, "epoch": 2576} {"train_loss": -43.64174270629883, "global_step": 311724, "epoch": 2576} {"train_loss": -43.6733512878418, "global_step": 311725, "epoch": 2576} {"train_loss": -43.912322998046875, "global_step": 311726, "epoch": 2576} {"train_loss": -43.7650032043457, "global_step": 311727, "epoch": 2576} {"train_loss": -43.98365020751953, "global_step": 311728, "epoch": 2576} {"train_loss": -43.67289733886719, "global_step": 311729, "epoch": 2576} {"train_loss": -43.83567428588867, "global_step": 311730, "epoch": 2576} {"train_loss": -44.432064056396484, "global_step": 311731, "epoch": 2576} {"train_loss": -44.15350341796875, "global_step": 311732, "epoch": 2576} {"train_loss": -44.131507873535156, "global_step": 311733, "epoch": 2576} {"train_loss": -43.86759567260742, "global_step": 311734, "epoch": 2576} {"train_loss": -43.85246276855469, "global_step": 311735, "epoch": 2576} {"train_loss": -43.22017288208008, "global_step": 311736, "epoch": 2576} {"train_loss": -43.823177337646484, "global_step": 311737, "epoch": 2576} {"train_loss": -44.02597427368164, "global_step": 311738, "epoch": 2576} {"train_loss": -43.74203872680664, "global_step": 311739, "epoch": 2576} {"train_loss": -44.20078659057617, "global_step": 311740, "epoch": 2576} {"train_loss": -44.22346115112305, "global_step": 311741, "epoch": 2576} {"train_loss": -43.8731803894043, "global_step": 311742, "epoch": 2576} {"train_loss": -43.95123291015625, "global_step": 311743, "epoch": 2576} {"train_loss": -44.33549499511719, "global_step": 311744, "epoch": 2576} {"train_loss": -43.810157775878906, "global_step": 311745, "epoch": 2576} {"train_loss": -43.86300277709961, "global_step": 311746, "epoch": 2576} {"train_loss": -43.916053771972656, "global_step": 311747, "epoch": 2576} {"train_loss": -44.21066665649414, "global_step": 311748, "epoch": 2576} {"train_loss": -43.38103103637695, "global_step": 311749, "epoch": 2576} {"train_loss": -44.022430419921875, "global_step": 311750, "epoch": 2576} {"train_loss": -44.1917839050293, "global_step": 311751, "epoch": 2576} {"train_loss": -44.0799674987793, "global_step": 311752, "epoch": 2576} {"train_loss": -44.185813903808594, "global_step": 311753, "epoch": 2576} {"train_loss": -44.08930587768555, "global_step": 311754, "epoch": 2576} {"train_loss": -43.804969787597656, "global_step": 311755, "epoch": 2576} {"train_loss": -44.03263473510742, "global_step": 311756, "epoch": 2576} {"train_loss": -39.16785430908203, "global_step": 311757, "epoch": 2576} {"train_loss": -44.26560592651367, "global_step": 311758, "epoch": 2576} {"train_loss": -44.09079360961914, "global_step": 311759, "epoch": 2576} {"train_loss": -42.06901168823242, "global_step": 311760, "epoch": 2576} {"train_loss": -42.118080139160156, "global_step": 311761, "epoch": 2576} {"train_loss": -42.504764556884766, "global_step": 311762, "epoch": 2576} {"train_loss": -44.10108184814453, "global_step": 311763, "epoch": 2576} {"train_loss": -42.732662200927734, "global_step": 311764, "epoch": 2576} {"train_loss": -40.63201904296875, "global_step": 311765, "epoch": 2576} {"train_loss": -41.30922317504883, "global_step": 311766, "epoch": 2576} {"train_loss": -42.444374084472656, "global_step": 311767, "epoch": 2576} {"train_loss": -39.147422790527344, "global_step": 311768, "epoch": 2576} {"train_loss": -38.28861999511719, "global_step": 311769, "epoch": 2576} {"train_loss": -42.74569320678711, "global_step": 311770, "epoch": 2576} {"train_loss": -40.318695068359375, "global_step": 311771, "epoch": 2576} {"train_loss": -38.50786590576172, "global_step": 311772, "epoch": 2576} {"train_loss": -43.30527877807617, "global_step": 311773, "epoch": 2576} {"train_loss": -39.74978256225586, "global_step": 311774, "epoch": 2576} {"train_loss": -40.99008560180664, "global_step": 311775, "epoch": 2576} {"train_loss": -42.70242691040039, "global_step": 311776, "epoch": 2576} {"train_loss": -41.30106735229492, "global_step": 311777, "epoch": 2576} {"train_loss": -41.870121002197266, "global_step": 311778, "epoch": 2576} {"train_loss": -42.36602020263672, "global_step": 311779, "epoch": 2576} {"train_loss": -42.52680587768555, "global_step": 311780, "epoch": 2576} {"train_loss": -42.27820587158203, "global_step": 311781, "epoch": 2576} {"train_loss": -41.14349365234375, "global_step": 311782, "epoch": 2576} {"train_loss": -42.829429626464844, "global_step": 311783, "epoch": 2576} {"train_loss": -41.41366195678711, "global_step": 311784, "epoch": 2576} {"train_loss": -42.61356735229492, "global_step": 311785, "epoch": 2576} {"train_loss": -40.76856994628906, "global_step": 311786, "epoch": 2576} {"train_loss": -42.644134521484375, "global_step": 311787, "epoch": 2576} {"train_loss": -41.25492477416992, "global_step": 311788, "epoch": 2576} {"train_loss": -43.173030853271484, "global_step": 311789, "epoch": 2576} {"train_loss": -41.7532958984375, "global_step": 311790, "epoch": 2576} {"train_loss": -42.81001663208008, "global_step": 311791, "epoch": 2576} {"train_loss": -42.096309661865234, "global_step": 311792, "epoch": 2576} {"train_loss": -42.34608840942383, "global_step": 311793, "epoch": 2576} {"train_loss": -42.4404296875, "global_step": 311794, "epoch": 2576} {"train_loss": -42.92841339111328, "global_step": 311795, "epoch": 2576} {"train_loss": -41.99296188354492, "global_step": 311796, "epoch": 2576} {"train_loss": -42.72944259643555, "global_step": 311797, "epoch": 2576} {"train_loss": -43.1069450378418, "global_step": 311798, "epoch": 2576} {"train_loss": -42.69184494018555, "global_step": 311799, "epoch": 2576} {"train_loss": -43.40841293334961, "global_step": 311800, "epoch": 2576} {"train_loss": -43.6827507019043, "global_step": 311801, "epoch": 2576} {"train_loss": -43.329673767089844, "global_step": 311802, "epoch": 2576} {"train_loss": -43.23359298706055, "global_step": 311803, "epoch": 2576} {"train_loss": -42.99884033203125, "global_step": 311804, "epoch": 2576} {"train_loss": -43.561370849609375, "global_step": 311805, "epoch": 2576} {"train_loss": -43.34870147705078, "global_step": 311806, "epoch": 2576} {"train_loss": -42.91252899169922, "global_step": 311807, "epoch": 2576} {"train_loss": -43.45454025268555, "global_step": 311808, "epoch": 2576} {"train_loss": -43.539764404296875, "global_step": 311809, "epoch": 2576} {"train_loss": -42.16341018676758, "global_step": 311810, "epoch": 2576} {"train_loss": -43.3638916015625, "global_step": 311811, "epoch": 2576} {"train_loss": -44.00334548950195, "global_step": 311812, "epoch": 2576} {"train_loss": -43.63515853881836, "global_step": 311813, "epoch": 2576} {"train_loss": -43.20611572265625, "global_step": 311814, "epoch": 2576} {"train_loss": -43.501155853271484, "global_step": 311815, "epoch": 2576} {"train_loss": -42.89019633521718, "global_step": 311816, "epoch": 2576, "val_loss": 2785901.75} {"train_loss": -43.80778121948242, "global_step": 311817, "epoch": 2577} {"train_loss": -43.5829963684082, "global_step": 311818, "epoch": 2577} {"train_loss": -43.35416030883789, "global_step": 311819, "epoch": 2577} {"train_loss": -43.759212493896484, "global_step": 311820, "epoch": 2577} {"train_loss": -43.84797286987305, "global_step": 311821, "epoch": 2577} {"train_loss": -43.65318298339844, "global_step": 311822, "epoch": 2577} {"train_loss": -42.47809600830078, "global_step": 311823, "epoch": 2577} {"train_loss": -43.83463668823242, "global_step": 311824, "epoch": 2577} {"train_loss": -43.62189483642578, "global_step": 311825, "epoch": 2577} {"train_loss": -43.9011116027832, "global_step": 311826, "epoch": 2577} {"train_loss": -44.04964828491211, "global_step": 311827, "epoch": 2577} {"train_loss": -43.554473876953125, "global_step": 311828, "epoch": 2577} {"train_loss": -44.4198112487793, "global_step": 311829, "epoch": 2577} {"train_loss": -43.718055725097656, "global_step": 311830, "epoch": 2577} {"train_loss": -43.37361526489258, "global_step": 311831, "epoch": 2577} {"train_loss": -43.213134765625, "global_step": 311832, "epoch": 2577} {"train_loss": -43.829254150390625, "global_step": 311833, "epoch": 2577} {"train_loss": -43.54953384399414, "global_step": 311834, "epoch": 2577} {"train_loss": -43.9501953125, "global_step": 311835, "epoch": 2577} {"train_loss": -43.3447380065918, "global_step": 311836, "epoch": 2577} {"train_loss": -44.00799560546875, "global_step": 311837, "epoch": 2577} {"train_loss": -43.57868576049805, "global_step": 311838, "epoch": 2577} {"train_loss": -43.66328811645508, "global_step": 311839, "epoch": 2577} {"train_loss": -44.16305160522461, "global_step": 311840, "epoch": 2577} {"train_loss": -43.99279022216797, "global_step": 311841, "epoch": 2577} {"train_loss": -43.79244613647461, "global_step": 311842, "epoch": 2577} {"train_loss": -43.87818145751953, "global_step": 311843, "epoch": 2577} {"train_loss": -44.405548095703125, "global_step": 311844, "epoch": 2577} {"train_loss": -44.234535217285156, "global_step": 311845, "epoch": 2577} {"train_loss": -44.01357650756836, "global_step": 311846, "epoch": 2577} {"train_loss": -44.119258880615234, "global_step": 311847, "epoch": 2577} {"train_loss": -44.21549606323242, "global_step": 311848, "epoch": 2577} {"train_loss": -44.04255294799805, "global_step": 311849, "epoch": 2577} {"train_loss": -44.02655029296875, "global_step": 311850, "epoch": 2577} {"train_loss": -43.763607025146484, "global_step": 311851, "epoch": 2577} {"train_loss": -43.07417297363281, "global_step": 311852, "epoch": 2577} {"train_loss": -43.08945846557617, "global_step": 311853, "epoch": 2577} {"train_loss": -43.4953498840332, "global_step": 311854, "epoch": 2577} {"train_loss": -44.47657012939453, "global_step": 311855, "epoch": 2577} {"train_loss": -43.87216567993164, "global_step": 311856, "epoch": 2577} {"train_loss": -44.2021369934082, "global_step": 311857, "epoch": 2577} {"train_loss": -44.42397689819336, "global_step": 311858, "epoch": 2577} {"train_loss": -44.18621826171875, "global_step": 311859, "epoch": 2577} {"train_loss": -44.43770980834961, "global_step": 311860, "epoch": 2577} {"train_loss": -44.73876190185547, "global_step": 311861, "epoch": 2577} {"train_loss": -43.65366744995117, "global_step": 311862, "epoch": 2577} {"train_loss": -44.22744369506836, "global_step": 311863, "epoch": 2577} {"train_loss": -43.69422912597656, "global_step": 311864, "epoch": 2577} {"train_loss": -43.98691940307617, "global_step": 311865, "epoch": 2577} {"train_loss": -45.041709899902344, "global_step": 311866, "epoch": 2577} {"train_loss": -43.67055130004883, "global_step": 311867, "epoch": 2577} {"train_loss": -44.73257827758789, "global_step": 311868, "epoch": 2577} {"train_loss": -44.07280731201172, "global_step": 311869, "epoch": 2577} {"train_loss": -44.51329040527344, "global_step": 311870, "epoch": 2577} {"train_loss": -44.229244232177734, "global_step": 311871, "epoch": 2577} {"train_loss": -44.183467864990234, "global_step": 311872, "epoch": 2577} {"train_loss": -43.8665771484375, "global_step": 311873, "epoch": 2577} {"train_loss": -42.09177017211914, "global_step": 311874, "epoch": 2577} {"train_loss": -38.823463439941406, "global_step": 311875, "epoch": 2577} {"train_loss": -35.764827728271484, "global_step": 311876, "epoch": 2577} {"train_loss": -35.9972038269043, "global_step": 311877, "epoch": 2577} {"train_loss": -38.35979080200195, "global_step": 311878, "epoch": 2577} {"train_loss": -40.688926696777344, "global_step": 311879, "epoch": 2577} {"train_loss": -40.98978805541992, "global_step": 311880, "epoch": 2577} {"train_loss": -38.38344192504883, "global_step": 311881, "epoch": 2577} {"train_loss": -40.25486755371094, "global_step": 311882, "epoch": 2577} {"train_loss": -38.892635345458984, "global_step": 311883, "epoch": 2577} {"train_loss": -42.908233642578125, "global_step": 311884, "epoch": 2577} {"train_loss": -40.07966232299805, "global_step": 311885, "epoch": 2577} {"train_loss": -41.4033088684082, "global_step": 311886, "epoch": 2577} {"train_loss": -40.441490173339844, "global_step": 311887, "epoch": 2577} {"train_loss": -40.07428741455078, "global_step": 311888, "epoch": 2577} {"train_loss": -40.746826171875, "global_step": 311889, "epoch": 2577} {"train_loss": -39.88149642944336, "global_step": 311890, "epoch": 2577} {"train_loss": -38.455162048339844, "global_step": 311891, "epoch": 2577} {"train_loss": -39.4934196472168, "global_step": 311892, "epoch": 2577} {"train_loss": -41.758766174316406, "global_step": 311893, "epoch": 2577} {"train_loss": -39.90591049194336, "global_step": 311894, "epoch": 2577} {"train_loss": -41.85874557495117, "global_step": 311895, "epoch": 2577} {"train_loss": -41.37622833251953, "global_step": 311896, "epoch": 2577} {"train_loss": -41.3442268371582, "global_step": 311897, "epoch": 2577} {"train_loss": -41.368831634521484, "global_step": 311898, "epoch": 2577} {"train_loss": -42.031551361083984, "global_step": 311899, "epoch": 2577} {"train_loss": -41.22309112548828, "global_step": 311900, "epoch": 2577} {"train_loss": -42.21622848510742, "global_step": 311901, "epoch": 2577} {"train_loss": -42.47804641723633, "global_step": 311902, "epoch": 2577} {"train_loss": -41.513206481933594, "global_step": 311903, "epoch": 2577} {"train_loss": -43.01748275756836, "global_step": 311904, "epoch": 2577} {"train_loss": -42.30525588989258, "global_step": 311905, "epoch": 2577} {"train_loss": -43.08580780029297, "global_step": 311906, "epoch": 2577} {"train_loss": -41.91590118408203, "global_step": 311907, "epoch": 2577} {"train_loss": -41.54509353637695, "global_step": 311908, "epoch": 2577} {"train_loss": -43.14686584472656, "global_step": 311909, "epoch": 2577} {"train_loss": -42.24430465698242, "global_step": 311910, "epoch": 2577} {"train_loss": -42.754188537597656, "global_step": 311911, "epoch": 2577} {"train_loss": -42.612091064453125, "global_step": 311912, "epoch": 2577} {"train_loss": -42.237545013427734, "global_step": 311913, "epoch": 2577} {"train_loss": -42.324180603027344, "global_step": 311914, "epoch": 2577} {"train_loss": -43.53358840942383, "global_step": 311915, "epoch": 2577} {"train_loss": -42.7244758605957, "global_step": 311916, "epoch": 2577} {"train_loss": -42.81268310546875, "global_step": 311917, "epoch": 2577} {"train_loss": -43.02825927734375, "global_step": 311918, "epoch": 2577} {"train_loss": -42.036869049072266, "global_step": 311919, "epoch": 2577} {"train_loss": -42.22813034057617, "global_step": 311920, "epoch": 2577} {"train_loss": -43.27141189575195, "global_step": 311921, "epoch": 2577} {"train_loss": -42.28337478637695, "global_step": 311922, "epoch": 2577} {"train_loss": -42.840301513671875, "global_step": 311923, "epoch": 2577} {"train_loss": -43.30189895629883, "global_step": 311924, "epoch": 2577} {"train_loss": -42.763648986816406, "global_step": 311925, "epoch": 2577} {"train_loss": -43.178955078125, "global_step": 311926, "epoch": 2577} {"train_loss": -43.63167190551758, "global_step": 311927, "epoch": 2577} {"train_loss": -43.36845016479492, "global_step": 311928, "epoch": 2577} {"train_loss": -42.54253387451172, "global_step": 311929, "epoch": 2577} {"train_loss": -43.42656326293945, "global_step": 311930, "epoch": 2577} {"train_loss": -42.27643585205078, "global_step": 311931, "epoch": 2577} {"train_loss": -43.4655647277832, "global_step": 311932, "epoch": 2577} {"train_loss": -43.52956008911133, "global_step": 311933, "epoch": 2577} {"train_loss": -43.283668518066406, "global_step": 311934, "epoch": 2577} {"train_loss": -43.27975082397461, "global_step": 311935, "epoch": 2577} {"train_loss": -44.33463668823242, "global_step": 311936, "epoch": 2577} {"train_loss": -42.73776440581015, "global_step": 311937, "epoch": 2577, "val_loss": 2730144.75} {"train_loss": -43.79825973510742, "global_step": 311938, "epoch": 2578} {"train_loss": -43.8955192565918, "global_step": 311939, "epoch": 2578} {"train_loss": -43.81753158569336, "global_step": 311940, "epoch": 2578} {"train_loss": -43.84577941894531, "global_step": 311941, "epoch": 2578} {"train_loss": -44.212364196777344, "global_step": 311942, "epoch": 2578} {"train_loss": -42.7661247253418, "global_step": 311943, "epoch": 2578} {"train_loss": -44.28837966918945, "global_step": 311944, "epoch": 2578} {"train_loss": -44.12547302246094, "global_step": 311945, "epoch": 2578} {"train_loss": -43.47967529296875, "global_step": 311946, "epoch": 2578} {"train_loss": -44.19536209106445, "global_step": 311947, "epoch": 2578} {"train_loss": -43.68099594116211, "global_step": 311948, "epoch": 2578} {"train_loss": -43.70656204223633, "global_step": 311949, "epoch": 2578} {"train_loss": -44.04948425292969, "global_step": 311950, "epoch": 2578} {"train_loss": -43.91463851928711, "global_step": 311951, "epoch": 2578} {"train_loss": -44.4395866394043, "global_step": 311952, "epoch": 2578} {"train_loss": -44.38513946533203, "global_step": 311953, "epoch": 2578} {"train_loss": -44.220069885253906, "global_step": 311954, "epoch": 2578} {"train_loss": -43.6036491394043, "global_step": 311955, "epoch": 2578} {"train_loss": -44.027706146240234, "global_step": 311956, "epoch": 2578} {"train_loss": -43.93733215332031, "global_step": 311957, "epoch": 2578} {"train_loss": -43.35036087036133, "global_step": 311958, "epoch": 2578} {"train_loss": -44.40102005004883, "global_step": 311959, "epoch": 2578} {"train_loss": -43.277503967285156, "global_step": 311960, "epoch": 2578} {"train_loss": -44.093963623046875, "global_step": 311961, "epoch": 2578} {"train_loss": -43.922298431396484, "global_step": 311962, "epoch": 2578} {"train_loss": -43.66024398803711, "global_step": 311963, "epoch": 2578} {"train_loss": -44.327327728271484, "global_step": 311964, "epoch": 2578} {"train_loss": -43.52468490600586, "global_step": 311965, "epoch": 2578} {"train_loss": -43.92393112182617, "global_step": 311966, "epoch": 2578} {"train_loss": -43.709625244140625, "global_step": 311967, "epoch": 2578} {"train_loss": -44.041046142578125, "global_step": 311968, "epoch": 2578} {"train_loss": -43.876121520996094, "global_step": 311969, "epoch": 2578} {"train_loss": -44.56256103515625, "global_step": 311970, "epoch": 2578} {"train_loss": -44.188026428222656, "global_step": 311971, "epoch": 2578} {"train_loss": -43.36770248413086, "global_step": 311972, "epoch": 2578} {"train_loss": -44.460811614990234, "global_step": 311973, "epoch": 2578} {"train_loss": -44.59148025512695, "global_step": 311974, "epoch": 2578} {"train_loss": -43.93285369873047, "global_step": 311975, "epoch": 2578} {"train_loss": -44.20125961303711, "global_step": 311976, "epoch": 2578} {"train_loss": -44.65064239501953, "global_step": 311977, "epoch": 2578} {"train_loss": -44.16230392456055, "global_step": 311978, "epoch": 2578} {"train_loss": -42.19281768798828, "global_step": 311979, "epoch": 2578} {"train_loss": -42.07006072998047, "global_step": 311980, "epoch": 2578} {"train_loss": -44.35721969604492, "global_step": 311981, "epoch": 2578} {"train_loss": -44.19379425048828, "global_step": 311982, "epoch": 2578} {"train_loss": -43.25416564941406, "global_step": 311983, "epoch": 2578} {"train_loss": -42.92490768432617, "global_step": 311984, "epoch": 2578} {"train_loss": -43.02744674682617, "global_step": 311985, "epoch": 2578} {"train_loss": -43.44157791137695, "global_step": 311986, "epoch": 2578} {"train_loss": -41.075958251953125, "global_step": 311987, "epoch": 2578} {"train_loss": -41.06745147705078, "global_step": 311988, "epoch": 2578} {"train_loss": -43.25154495239258, "global_step": 311989, "epoch": 2578} {"train_loss": -37.28017807006836, "global_step": 311990, "epoch": 2578} {"train_loss": -36.08069610595703, "global_step": 311991, "epoch": 2578} {"train_loss": -42.61689758300781, "global_step": 311992, "epoch": 2578} {"train_loss": -41.21169662475586, "global_step": 311993, "epoch": 2578} {"train_loss": -42.01559066772461, "global_step": 311994, "epoch": 2578} {"train_loss": -43.150726318359375, "global_step": 311995, "epoch": 2578} {"train_loss": -42.68876647949219, "global_step": 311996, "epoch": 2578} {"train_loss": -43.502349853515625, "global_step": 311997, "epoch": 2578} {"train_loss": -42.703125, "global_step": 311998, "epoch": 2578} {"train_loss": -42.972686767578125, "global_step": 311999, "epoch": 2578} {"train_loss": -42.66394805908203, "global_step": 312000, "epoch": 2578} {"train_loss": -43.821773529052734, "global_step": 312001, "epoch": 2578} {"train_loss": -43.65876007080078, "global_step": 312002, "epoch": 2578} {"train_loss": -43.658626556396484, "global_step": 312003, "epoch": 2578} {"train_loss": -43.48775100708008, "global_step": 312004, "epoch": 2578} {"train_loss": -43.64646911621094, "global_step": 312005, "epoch": 2578} {"train_loss": -43.59112548828125, "global_step": 312006, "epoch": 2578} {"train_loss": -43.28349304199219, "global_step": 312007, "epoch": 2578} {"train_loss": -43.79127883911133, "global_step": 312008, "epoch": 2578} {"train_loss": -43.5604133605957, "global_step": 312009, "epoch": 2578} {"train_loss": -44.16437530517578, "global_step": 312010, "epoch": 2578} {"train_loss": -44.155845642089844, "global_step": 312011, "epoch": 2578} {"train_loss": -43.960540771484375, "global_step": 312012, "epoch": 2578} {"train_loss": -43.82588577270508, "global_step": 312013, "epoch": 2578} {"train_loss": -44.114158630371094, "global_step": 312014, "epoch": 2578} {"train_loss": -44.10029220581055, "global_step": 312015, "epoch": 2578} {"train_loss": -44.051170349121094, "global_step": 312016, "epoch": 2578} {"train_loss": -43.989383697509766, "global_step": 312017, "epoch": 2578} {"train_loss": -44.1895751953125, "global_step": 312018, "epoch": 2578} {"train_loss": -43.773597717285156, "global_step": 312019, "epoch": 2578} {"train_loss": -44.001441955566406, "global_step": 312020, "epoch": 2578} {"train_loss": -44.37844467163086, "global_step": 312021, "epoch": 2578} {"train_loss": -44.00734329223633, "global_step": 312022, "epoch": 2578} {"train_loss": -44.38018035888672, "global_step": 312023, "epoch": 2578} {"train_loss": -44.454288482666016, "global_step": 312024, "epoch": 2578} {"train_loss": -44.25650405883789, "global_step": 312025, "epoch": 2578} {"train_loss": -43.95786666870117, "global_step": 312026, "epoch": 2578} {"train_loss": -44.26862335205078, "global_step": 312027, "epoch": 2578} {"train_loss": -43.81395721435547, "global_step": 312028, "epoch": 2578} {"train_loss": -44.45377731323242, "global_step": 312029, "epoch": 2578} {"train_loss": -44.787532806396484, "global_step": 312030, "epoch": 2578} {"train_loss": -44.29587936401367, "global_step": 312031, "epoch": 2578} {"train_loss": -43.1489372253418, "global_step": 312032, "epoch": 2578} {"train_loss": -44.457759857177734, "global_step": 312033, "epoch": 2578} {"train_loss": -44.517189025878906, "global_step": 312034, "epoch": 2578} {"train_loss": -44.6138801574707, "global_step": 312035, "epoch": 2578} {"train_loss": -44.69956588745117, "global_step": 312036, "epoch": 2578} {"train_loss": -43.713775634765625, "global_step": 312037, "epoch": 2578} {"train_loss": -43.750732421875, "global_step": 312038, "epoch": 2578} {"train_loss": -45.044105529785156, "global_step": 312039, "epoch": 2578} {"train_loss": -43.51873779296875, "global_step": 312040, "epoch": 2578} {"train_loss": -43.15053939819336, "global_step": 312041, "epoch": 2578} {"train_loss": -42.2006950378418, "global_step": 312042, "epoch": 2578} {"train_loss": -43.53072738647461, "global_step": 312043, "epoch": 2578} {"train_loss": -42.813167572021484, "global_step": 312044, "epoch": 2578} {"train_loss": -43.680904388427734, "global_step": 312045, "epoch": 2578} {"train_loss": -44.1364860534668, "global_step": 312046, "epoch": 2578} {"train_loss": -43.739013671875, "global_step": 312047, "epoch": 2578} {"train_loss": -43.749237060546875, "global_step": 312048, "epoch": 2578} {"train_loss": -44.26416015625, "global_step": 312049, "epoch": 2578} {"train_loss": -43.98446273803711, "global_step": 312050, "epoch": 2578} {"train_loss": -43.94645309448242, "global_step": 312051, "epoch": 2578} {"train_loss": -43.43668746948242, "global_step": 312052, "epoch": 2578} {"train_loss": -43.64132308959961, "global_step": 312053, "epoch": 2578} {"train_loss": -43.65498352050781, "global_step": 312054, "epoch": 2578} {"train_loss": -43.91048049926758, "global_step": 312055, "epoch": 2578} {"train_loss": -44.08454513549805, "global_step": 312056, "epoch": 2578} {"train_loss": -43.72400665283203, "global_step": 312057, "epoch": 2578} {"train_loss": -43.611304448655815, "global_step": 312058, "epoch": 2578, "val_loss": 2756884.0} {"train_loss": -43.83626174926758, "global_step": 312059, "epoch": 2579} {"train_loss": -44.018489837646484, "global_step": 312060, "epoch": 2579} {"train_loss": -44.080543518066406, "global_step": 312061, "epoch": 2579} {"train_loss": -43.39616012573242, "global_step": 312062, "epoch": 2579} {"train_loss": -44.2954216003418, "global_step": 312063, "epoch": 2579} {"train_loss": -44.04975509643555, "global_step": 312064, "epoch": 2579} {"train_loss": -44.28923034667969, "global_step": 312065, "epoch": 2579} {"train_loss": -44.46860885620117, "global_step": 312066, "epoch": 2579} {"train_loss": -44.333282470703125, "global_step": 312067, "epoch": 2579} {"train_loss": -44.529361724853516, "global_step": 312068, "epoch": 2579} {"train_loss": -43.881221771240234, "global_step": 312069, "epoch": 2579} {"train_loss": -44.03997039794922, "global_step": 312070, "epoch": 2579} {"train_loss": -43.01792907714844, "global_step": 312071, "epoch": 2579} {"train_loss": -43.6071662902832, "global_step": 312072, "epoch": 2579} {"train_loss": -42.98296356201172, "global_step": 312073, "epoch": 2579} {"train_loss": -40.98976516723633, "global_step": 312074, "epoch": 2579} {"train_loss": -42.87358474731445, "global_step": 312075, "epoch": 2579} {"train_loss": -43.457054138183594, "global_step": 312076, "epoch": 2579} {"train_loss": -43.42610549926758, "global_step": 312077, "epoch": 2579} {"train_loss": -42.7226676940918, "global_step": 312078, "epoch": 2579} {"train_loss": -42.92159652709961, "global_step": 312079, "epoch": 2579} {"train_loss": -43.69646072387695, "global_step": 312080, "epoch": 2579} {"train_loss": -43.77873611450195, "global_step": 312081, "epoch": 2579} {"train_loss": -43.17169189453125, "global_step": 312082, "epoch": 2579} {"train_loss": -43.270240783691406, "global_step": 312083, "epoch": 2579} {"train_loss": -43.89092254638672, "global_step": 312084, "epoch": 2579} {"train_loss": -43.9783935546875, "global_step": 312085, "epoch": 2579} {"train_loss": -44.05117416381836, "global_step": 312086, "epoch": 2579} {"train_loss": -43.8535270690918, "global_step": 312087, "epoch": 2579} {"train_loss": -42.95337677001953, "global_step": 312088, "epoch": 2579} {"train_loss": -43.61025619506836, "global_step": 312089, "epoch": 2579} {"train_loss": -43.84096908569336, "global_step": 312090, "epoch": 2579} {"train_loss": -43.67359161376953, "global_step": 312091, "epoch": 2579} {"train_loss": -43.871131896972656, "global_step": 312092, "epoch": 2579} {"train_loss": -44.49837875366211, "global_step": 312093, "epoch": 2579} {"train_loss": -43.56295394897461, "global_step": 312094, "epoch": 2579} {"train_loss": -43.30781936645508, "global_step": 312095, "epoch": 2579} {"train_loss": -43.508419036865234, "global_step": 312096, "epoch": 2579} {"train_loss": -44.22856903076172, "global_step": 312097, "epoch": 2579} {"train_loss": -41.95280075073242, "global_step": 312098, "epoch": 2579} {"train_loss": -43.34330368041992, "global_step": 312099, "epoch": 2579} {"train_loss": -43.707122802734375, "global_step": 312100, "epoch": 2579} {"train_loss": -43.508399963378906, "global_step": 312101, "epoch": 2579} {"train_loss": -43.449676513671875, "global_step": 312102, "epoch": 2579} {"train_loss": -43.216407775878906, "global_step": 312103, "epoch": 2579} {"train_loss": -43.729244232177734, "global_step": 312104, "epoch": 2579} {"train_loss": -41.0897102355957, "global_step": 312105, "epoch": 2579} {"train_loss": -43.790382385253906, "global_step": 312106, "epoch": 2579} {"train_loss": -42.99911117553711, "global_step": 312107, "epoch": 2579} {"train_loss": -43.38798904418945, "global_step": 312108, "epoch": 2579} {"train_loss": -43.29277038574219, "global_step": 312109, "epoch": 2579} {"train_loss": -43.45935821533203, "global_step": 312110, "epoch": 2579} {"train_loss": -44.01470947265625, "global_step": 312111, "epoch": 2579} {"train_loss": -43.477630615234375, "global_step": 312112, "epoch": 2579} {"train_loss": -43.3753547668457, "global_step": 312113, "epoch": 2579} {"train_loss": -43.902793884277344, "global_step": 312114, "epoch": 2579} {"train_loss": -43.742000579833984, "global_step": 312115, "epoch": 2579} {"train_loss": -43.27910614013672, "global_step": 312116, "epoch": 2579} {"train_loss": -43.70663070678711, "global_step": 312117, "epoch": 2579} {"train_loss": -43.49577331542969, "global_step": 312118, "epoch": 2579} {"train_loss": -43.55337142944336, "global_step": 312119, "epoch": 2579} {"train_loss": -41.4223747253418, "global_step": 312120, "epoch": 2579} {"train_loss": -43.09431457519531, "global_step": 312121, "epoch": 2579} {"train_loss": -43.467254638671875, "global_step": 312122, "epoch": 2579} {"train_loss": -43.77830123901367, "global_step": 312123, "epoch": 2579} {"train_loss": -42.59711456298828, "global_step": 312124, "epoch": 2579} {"train_loss": -42.44571304321289, "global_step": 312125, "epoch": 2579} {"train_loss": -43.9163932800293, "global_step": 312126, "epoch": 2579} {"train_loss": -42.868751525878906, "global_step": 312127, "epoch": 2579} {"train_loss": -42.5058708190918, "global_step": 312128, "epoch": 2579} {"train_loss": -42.2653694152832, "global_step": 312129, "epoch": 2579} {"train_loss": -43.0467643737793, "global_step": 312130, "epoch": 2579} {"train_loss": -43.049415588378906, "global_step": 312131, "epoch": 2579} {"train_loss": -43.60783004760742, "global_step": 312132, "epoch": 2579} {"train_loss": -43.32277297973633, "global_step": 312133, "epoch": 2579} {"train_loss": -43.626075744628906, "global_step": 312134, "epoch": 2579} {"train_loss": -43.297115325927734, "global_step": 312135, "epoch": 2579} {"train_loss": -43.359230041503906, "global_step": 312136, "epoch": 2579} {"train_loss": -43.3990592956543, "global_step": 312137, "epoch": 2579} {"train_loss": -44.00661849975586, "global_step": 312138, "epoch": 2579} {"train_loss": -44.03839111328125, "global_step": 312139, "epoch": 2579} {"train_loss": -42.279502868652344, "global_step": 312140, "epoch": 2579} {"train_loss": -43.17626953125, "global_step": 312141, "epoch": 2579} {"train_loss": -43.57937240600586, "global_step": 312142, "epoch": 2579} {"train_loss": -43.29143142700195, "global_step": 312143, "epoch": 2579} {"train_loss": -42.580787658691406, "global_step": 312144, "epoch": 2579} {"train_loss": -41.8065071105957, "global_step": 312145, "epoch": 2579} {"train_loss": -43.287635803222656, "global_step": 312146, "epoch": 2579} {"train_loss": -43.68498611450195, "global_step": 312147, "epoch": 2579} {"train_loss": -43.29307174682617, "global_step": 312148, "epoch": 2579} {"train_loss": -43.79038619995117, "global_step": 312149, "epoch": 2579} {"train_loss": -43.38654708862305, "global_step": 312150, "epoch": 2579} {"train_loss": -43.83494186401367, "global_step": 312151, "epoch": 2579} {"train_loss": -42.699581146240234, "global_step": 312152, "epoch": 2579} {"train_loss": -41.52958679199219, "global_step": 312153, "epoch": 2579} {"train_loss": -43.08391189575195, "global_step": 312154, "epoch": 2579} {"train_loss": -43.53169250488281, "global_step": 312155, "epoch": 2579} {"train_loss": -41.41428756713867, "global_step": 312156, "epoch": 2579} {"train_loss": -42.27168273925781, "global_step": 312157, "epoch": 2579} {"train_loss": -43.84000778198242, "global_step": 312158, "epoch": 2579} {"train_loss": -42.70859146118164, "global_step": 312159, "epoch": 2579} {"train_loss": -42.096736907958984, "global_step": 312160, "epoch": 2579} {"train_loss": -43.118629455566406, "global_step": 312161, "epoch": 2579} {"train_loss": -43.21516036987305, "global_step": 312162, "epoch": 2579} {"train_loss": -38.92702102661133, "global_step": 312163, "epoch": 2579} {"train_loss": -41.78154754638672, "global_step": 312164, "epoch": 2579} {"train_loss": -43.52193069458008, "global_step": 312165, "epoch": 2579} {"train_loss": -41.68394088745117, "global_step": 312166, "epoch": 2579} {"train_loss": -41.633338928222656, "global_step": 312167, "epoch": 2579} {"train_loss": -43.94627380371094, "global_step": 312168, "epoch": 2579} {"train_loss": -42.272071838378906, "global_step": 312169, "epoch": 2579} {"train_loss": -41.88753128051758, "global_step": 312170, "epoch": 2579} {"train_loss": -43.842079162597656, "global_step": 312171, "epoch": 2579} {"train_loss": -42.339298248291016, "global_step": 312172, "epoch": 2579} {"train_loss": -42.43601608276367, "global_step": 312173, "epoch": 2579} {"train_loss": -42.71380615234375, "global_step": 312174, "epoch": 2579} {"train_loss": -41.658321380615234, "global_step": 312175, "epoch": 2579} {"train_loss": -41.8449592590332, "global_step": 312176, "epoch": 2579} {"train_loss": -42.9354362487793, "global_step": 312177, "epoch": 2579} {"train_loss": -42.35709762573242, "global_step": 312178, "epoch": 2579} {"train_loss": -43.17605675941657, "global_step": 312179, "epoch": 2579, "val_loss": 2723971.75} {"train_loss": -42.64331817626953, "global_step": 312180, "epoch": 2580} {"train_loss": -43.17868423461914, "global_step": 312181, "epoch": 2580} {"train_loss": -42.55500030517578, "global_step": 312182, "epoch": 2580} {"train_loss": -40.65090560913086, "global_step": 312183, "epoch": 2580} {"train_loss": -42.048091888427734, "global_step": 312184, "epoch": 2580} {"train_loss": -42.92863082885742, "global_step": 312185, "epoch": 2580} {"train_loss": -41.37005615234375, "global_step": 312186, "epoch": 2580} {"train_loss": -41.711788177490234, "global_step": 312187, "epoch": 2580} {"train_loss": -43.626502990722656, "global_step": 312188, "epoch": 2580} {"train_loss": -41.793212890625, "global_step": 312189, "epoch": 2580} {"train_loss": -42.98212432861328, "global_step": 312190, "epoch": 2580} {"train_loss": -43.17031478881836, "global_step": 312191, "epoch": 2580} {"train_loss": -43.535274505615234, "global_step": 312192, "epoch": 2580} {"train_loss": -43.054378509521484, "global_step": 312193, "epoch": 2580} {"train_loss": -43.46845245361328, "global_step": 312194, "epoch": 2580} {"train_loss": -43.36444854736328, "global_step": 312195, "epoch": 2580} {"train_loss": -43.96940231323242, "global_step": 312196, "epoch": 2580} {"train_loss": -43.89288330078125, "global_step": 312197, "epoch": 2580} {"train_loss": -43.45530319213867, "global_step": 312198, "epoch": 2580} {"train_loss": -43.33684158325195, "global_step": 312199, "epoch": 2580} {"train_loss": -43.136573791503906, "global_step": 312200, "epoch": 2580} {"train_loss": -43.96429443359375, "global_step": 312201, "epoch": 2580} {"train_loss": -43.52851486206055, "global_step": 312202, "epoch": 2580} {"train_loss": -43.9920654296875, "global_step": 312203, "epoch": 2580} {"train_loss": -44.033241271972656, "global_step": 312204, "epoch": 2580} {"train_loss": -44.49009323120117, "global_step": 312205, "epoch": 2580} {"train_loss": -44.01123046875, "global_step": 312206, "epoch": 2580} {"train_loss": -43.950504302978516, "global_step": 312207, "epoch": 2580} {"train_loss": -43.61396026611328, "global_step": 312208, "epoch": 2580} {"train_loss": -43.93914794921875, "global_step": 312209, "epoch": 2580} {"train_loss": -43.91215515136719, "global_step": 312210, "epoch": 2580} {"train_loss": -44.1727180480957, "global_step": 312211, "epoch": 2580} {"train_loss": -43.77671813964844, "global_step": 312212, "epoch": 2580} {"train_loss": -43.6783561706543, "global_step": 312213, "epoch": 2580} {"train_loss": -43.4935188293457, "global_step": 312214, "epoch": 2580} {"train_loss": -43.74467086791992, "global_step": 312215, "epoch": 2580} {"train_loss": -43.713165283203125, "global_step": 312216, "epoch": 2580} {"train_loss": -43.94550323486328, "global_step": 312217, "epoch": 2580} {"train_loss": -44.20113754272461, "global_step": 312218, "epoch": 2580} {"train_loss": -43.77976608276367, "global_step": 312219, "epoch": 2580} {"train_loss": -44.15776062011719, "global_step": 312220, "epoch": 2580} {"train_loss": -43.868324279785156, "global_step": 312221, "epoch": 2580} {"train_loss": -44.12703323364258, "global_step": 312222, "epoch": 2580} {"train_loss": -44.728981018066406, "global_step": 312223, "epoch": 2580} {"train_loss": -44.2150993347168, "global_step": 312224, "epoch": 2580} {"train_loss": -44.40713882446289, "global_step": 312225, "epoch": 2580} {"train_loss": -44.4007453918457, "global_step": 312226, "epoch": 2580} {"train_loss": -44.226356506347656, "global_step": 312227, "epoch": 2580} {"train_loss": -43.993377685546875, "global_step": 312228, "epoch": 2580} {"train_loss": -44.10334014892578, "global_step": 312229, "epoch": 2580} {"train_loss": -43.81589889526367, "global_step": 312230, "epoch": 2580} {"train_loss": -43.512115478515625, "global_step": 312231, "epoch": 2580} {"train_loss": -43.955318450927734, "global_step": 312232, "epoch": 2580} {"train_loss": -44.3048210144043, "global_step": 312233, "epoch": 2580} {"train_loss": -44.30803298950195, "global_step": 312234, "epoch": 2580} {"train_loss": -44.634742736816406, "global_step": 312235, "epoch": 2580} {"train_loss": -43.21797561645508, "global_step": 312236, "epoch": 2580} {"train_loss": -44.07352828979492, "global_step": 312237, "epoch": 2580} {"train_loss": -43.849361419677734, "global_step": 312238, "epoch": 2580} {"train_loss": -43.876121520996094, "global_step": 312239, "epoch": 2580} {"train_loss": -43.79843521118164, "global_step": 312240, "epoch": 2580} {"train_loss": -44.00284957885742, "global_step": 312241, "epoch": 2580} {"train_loss": -44.47872543334961, "global_step": 312242, "epoch": 2580} {"train_loss": -44.495216369628906, "global_step": 312243, "epoch": 2580} {"train_loss": -43.70646667480469, "global_step": 312244, "epoch": 2580} {"train_loss": -42.903133392333984, "global_step": 312245, "epoch": 2580} {"train_loss": -43.01064682006836, "global_step": 312246, "epoch": 2580} {"train_loss": -44.180519104003906, "global_step": 312247, "epoch": 2580} {"train_loss": -44.16067123413086, "global_step": 312248, "epoch": 2580} {"train_loss": -43.5307731628418, "global_step": 312249, "epoch": 2580} {"train_loss": -43.858154296875, "global_step": 312250, "epoch": 2580} {"train_loss": -43.78251266479492, "global_step": 312251, "epoch": 2580} {"train_loss": -41.802284240722656, "global_step": 312252, "epoch": 2580} {"train_loss": -42.2879753112793, "global_step": 312253, "epoch": 2580} {"train_loss": -43.42889404296875, "global_step": 312254, "epoch": 2580} {"train_loss": -43.63649368286133, "global_step": 312255, "epoch": 2580} {"train_loss": -43.20158767700195, "global_step": 312256, "epoch": 2580} {"train_loss": -43.11840057373047, "global_step": 312257, "epoch": 2580} {"train_loss": -43.400264739990234, "global_step": 312258, "epoch": 2580} {"train_loss": -41.98916244506836, "global_step": 312259, "epoch": 2580} {"train_loss": -42.83528137207031, "global_step": 312260, "epoch": 2580} {"train_loss": -43.35818099975586, "global_step": 312261, "epoch": 2580} {"train_loss": -43.51165771484375, "global_step": 312262, "epoch": 2580} {"train_loss": -44.17266082763672, "global_step": 312263, "epoch": 2580} {"train_loss": -43.43618392944336, "global_step": 312264, "epoch": 2580} {"train_loss": -43.679962158203125, "global_step": 312265, "epoch": 2580} {"train_loss": -44.185604095458984, "global_step": 312266, "epoch": 2580} {"train_loss": -44.271461486816406, "global_step": 312267, "epoch": 2580} {"train_loss": -43.28919219970703, "global_step": 312268, "epoch": 2580} {"train_loss": -43.829132080078125, "global_step": 312269, "epoch": 2580} {"train_loss": -43.511314392089844, "global_step": 312270, "epoch": 2580} {"train_loss": -43.42122268676758, "global_step": 312271, "epoch": 2580} {"train_loss": -44.05829620361328, "global_step": 312272, "epoch": 2580} {"train_loss": -43.9465446472168, "global_step": 312273, "epoch": 2580} {"train_loss": -43.76557540893555, "global_step": 312274, "epoch": 2580} {"train_loss": -43.419612884521484, "global_step": 312275, "epoch": 2580} {"train_loss": -43.71244430541992, "global_step": 312276, "epoch": 2580} {"train_loss": -43.77708435058594, "global_step": 312277, "epoch": 2580} {"train_loss": -43.45790481567383, "global_step": 312278, "epoch": 2580} {"train_loss": -44.59255599975586, "global_step": 312279, "epoch": 2580} {"train_loss": -43.993228912353516, "global_step": 312280, "epoch": 2580} {"train_loss": -44.406246185302734, "global_step": 312281, "epoch": 2580} {"train_loss": -44.018192291259766, "global_step": 312282, "epoch": 2580} {"train_loss": -44.266876220703125, "global_step": 312283, "epoch": 2580} {"train_loss": -43.787384033203125, "global_step": 312284, "epoch": 2580} {"train_loss": -44.02241897583008, "global_step": 312285, "epoch": 2580} {"train_loss": -43.87004852294922, "global_step": 312286, "epoch": 2580} {"train_loss": -43.57106399536133, "global_step": 312287, "epoch": 2580} {"train_loss": -43.23027801513672, "global_step": 312288, "epoch": 2580} {"train_loss": -43.68523025512695, "global_step": 312289, "epoch": 2580} {"train_loss": -44.053340911865234, "global_step": 312290, "epoch": 2580} {"train_loss": -43.943416595458984, "global_step": 312291, "epoch": 2580} {"train_loss": -42.848941802978516, "global_step": 312292, "epoch": 2580} {"train_loss": -43.2697639465332, "global_step": 312293, "epoch": 2580} {"train_loss": -44.19175720214844, "global_step": 312294, "epoch": 2580} {"train_loss": -44.126888275146484, "global_step": 312295, "epoch": 2580} {"train_loss": -43.52037048339844, "global_step": 312296, "epoch": 2580} {"train_loss": -44.0283088684082, "global_step": 312297, "epoch": 2580} {"train_loss": -41.692474365234375, "global_step": 312298, "epoch": 2580} {"train_loss": -41.10587692260742, "global_step": 312299, "epoch": 2580} {"train_loss": -43.58356781636388, "global_step": 312300, "epoch": 2580, "val_loss": 2763131.5} {"train_loss": -42.52309036254883, "global_step": 312301, "epoch": 2581} {"train_loss": -41.02466583251953, "global_step": 312302, "epoch": 2581} {"train_loss": -43.85312271118164, "global_step": 312303, "epoch": 2581} {"train_loss": -40.6603889465332, "global_step": 312304, "epoch": 2581} {"train_loss": -42.89699935913086, "global_step": 312305, "epoch": 2581} {"train_loss": -42.510765075683594, "global_step": 312306, "epoch": 2581} {"train_loss": -40.78292465209961, "global_step": 312307, "epoch": 2581} {"train_loss": -42.608245849609375, "global_step": 312308, "epoch": 2581} {"train_loss": -43.868587493896484, "global_step": 312309, "epoch": 2581} {"train_loss": -42.19375991821289, "global_step": 312310, "epoch": 2581} {"train_loss": -43.186187744140625, "global_step": 312311, "epoch": 2581} {"train_loss": -43.30392837524414, "global_step": 312312, "epoch": 2581} {"train_loss": -42.50309371948242, "global_step": 312313, "epoch": 2581} {"train_loss": -44.00625228881836, "global_step": 312314, "epoch": 2581} {"train_loss": -42.996429443359375, "global_step": 312315, "epoch": 2581} {"train_loss": -42.73747634887695, "global_step": 312316, "epoch": 2581} {"train_loss": -42.81288146972656, "global_step": 312317, "epoch": 2581} {"train_loss": -43.00941848754883, "global_step": 312318, "epoch": 2581} {"train_loss": -43.251800537109375, "global_step": 312319, "epoch": 2581} {"train_loss": -43.352169036865234, "global_step": 312320, "epoch": 2581} {"train_loss": -43.66384506225586, "global_step": 312321, "epoch": 2581} {"train_loss": -42.7020378112793, "global_step": 312322, "epoch": 2581} {"train_loss": -44.29169464111328, "global_step": 312323, "epoch": 2581} {"train_loss": -42.66062545776367, "global_step": 312324, "epoch": 2581} {"train_loss": -43.139801025390625, "global_step": 312325, "epoch": 2581} {"train_loss": -43.45671463012695, "global_step": 312326, "epoch": 2581} {"train_loss": -41.802398681640625, "global_step": 312327, "epoch": 2581} {"train_loss": -43.61103057861328, "global_step": 312328, "epoch": 2581} {"train_loss": -42.116878509521484, "global_step": 312329, "epoch": 2581} {"train_loss": -44.45835494995117, "global_step": 312330, "epoch": 2581} {"train_loss": -42.86153793334961, "global_step": 312331, "epoch": 2581} {"train_loss": -43.252010345458984, "global_step": 312332, "epoch": 2581} {"train_loss": -43.68463134765625, "global_step": 312333, "epoch": 2581} {"train_loss": -42.56414794921875, "global_step": 312334, "epoch": 2581} {"train_loss": -43.584903717041016, "global_step": 312335, "epoch": 2581} {"train_loss": -43.0103874206543, "global_step": 312336, "epoch": 2581} {"train_loss": -43.93851089477539, "global_step": 312337, "epoch": 2581} {"train_loss": -42.58401107788086, "global_step": 312338, "epoch": 2581} {"train_loss": -43.617279052734375, "global_step": 312339, "epoch": 2581} {"train_loss": -39.666290283203125, "global_step": 312340, "epoch": 2581} {"train_loss": -42.612735748291016, "global_step": 312341, "epoch": 2581} {"train_loss": -40.82707214355469, "global_step": 312342, "epoch": 2581} {"train_loss": -42.72529602050781, "global_step": 312343, "epoch": 2581} {"train_loss": -40.963592529296875, "global_step": 312344, "epoch": 2581} {"train_loss": -38.55765914916992, "global_step": 312345, "epoch": 2581} {"train_loss": -32.45806884765625, "global_step": 312346, "epoch": 2581} {"train_loss": -33.71408462524414, "global_step": 312347, "epoch": 2581} {"train_loss": -40.34849548339844, "global_step": 312348, "epoch": 2581} {"train_loss": -38.37443161010742, "global_step": 312349, "epoch": 2581} {"train_loss": -42.099578857421875, "global_step": 312350, "epoch": 2581} {"train_loss": -35.0363883972168, "global_step": 312351, "epoch": 2581} {"train_loss": -36.881996154785156, "global_step": 312352, "epoch": 2581} {"train_loss": -41.57423400878906, "global_step": 312353, "epoch": 2581} {"train_loss": -35.609432220458984, "global_step": 312354, "epoch": 2581} {"train_loss": -36.16334915161133, "global_step": 312355, "epoch": 2581} {"train_loss": -31.20829200744629, "global_step": 312356, "epoch": 2581} {"train_loss": -29.031436920166016, "global_step": 312357, "epoch": 2581} {"train_loss": -37.42387771606445, "global_step": 312358, "epoch": 2581} {"train_loss": -33.25695037841797, "global_step": 312359, "epoch": 2581} {"train_loss": -31.22942543029785, "global_step": 312360, "epoch": 2581} {"train_loss": -33.53156661987305, "global_step": 312361, "epoch": 2581} {"train_loss": -24.345993041992188, "global_step": 312362, "epoch": 2581} {"train_loss": -35.269615173339844, "global_step": 312363, "epoch": 2581} {"train_loss": -22.452123641967773, "global_step": 312364, "epoch": 2581} {"train_loss": -30.551166534423828, "global_step": 312365, "epoch": 2581} {"train_loss": -32.67100143432617, "global_step": 312366, "epoch": 2581} {"train_loss": -27.47524070739746, "global_step": 312367, "epoch": 2581} {"train_loss": -32.352970123291016, "global_step": 312368, "epoch": 2581} {"train_loss": -25.89314079284668, "global_step": 312369, "epoch": 2581} {"train_loss": -34.784706115722656, "global_step": 312370, "epoch": 2581} {"train_loss": -36.6425895690918, "global_step": 312371, "epoch": 2581} {"train_loss": -29.53203773498535, "global_step": 312372, "epoch": 2581} {"train_loss": -34.02429962158203, "global_step": 312373, "epoch": 2581} {"train_loss": -33.07040023803711, "global_step": 312374, "epoch": 2581} {"train_loss": -32.4012336730957, "global_step": 312375, "epoch": 2581} {"train_loss": -29.865772247314453, "global_step": 312376, "epoch": 2581} {"train_loss": -35.76947021484375, "global_step": 312377, "epoch": 2581} {"train_loss": -35.293243408203125, "global_step": 312378, "epoch": 2581} {"train_loss": -37.08845901489258, "global_step": 312379, "epoch": 2581} {"train_loss": -34.07046890258789, "global_step": 312380, "epoch": 2581} {"train_loss": -35.61334228515625, "global_step": 312381, "epoch": 2581} {"train_loss": -34.369239807128906, "global_step": 312382, "epoch": 2581} {"train_loss": -38.43278884887695, "global_step": 312383, "epoch": 2581} {"train_loss": -38.39622116088867, "global_step": 312384, "epoch": 2581} {"train_loss": -37.754600524902344, "global_step": 312385, "epoch": 2581} {"train_loss": -36.25640106201172, "global_step": 312386, "epoch": 2581} {"train_loss": -37.325157165527344, "global_step": 312387, "epoch": 2581} {"train_loss": -37.445980072021484, "global_step": 312388, "epoch": 2581} {"train_loss": -37.74062728881836, "global_step": 312389, "epoch": 2581} {"train_loss": -32.80119705200195, "global_step": 312390, "epoch": 2581} {"train_loss": -39.36271286010742, "global_step": 312391, "epoch": 2581} {"train_loss": -38.52642059326172, "global_step": 312392, "epoch": 2581} {"train_loss": -38.034847259521484, "global_step": 312393, "epoch": 2581} {"train_loss": -38.21406555175781, "global_step": 312394, "epoch": 2581} {"train_loss": -37.716636657714844, "global_step": 312395, "epoch": 2581} {"train_loss": -39.13846969604492, "global_step": 312396, "epoch": 2581} {"train_loss": -38.41899490356445, "global_step": 312397, "epoch": 2581} {"train_loss": -39.62993621826172, "global_step": 312398, "epoch": 2581} {"train_loss": -38.399749755859375, "global_step": 312399, "epoch": 2581} {"train_loss": -39.685787200927734, "global_step": 312400, "epoch": 2581} {"train_loss": -40.67092514038086, "global_step": 312401, "epoch": 2581} {"train_loss": -38.53109359741211, "global_step": 312402, "epoch": 2581} {"train_loss": -39.171844482421875, "global_step": 312403, "epoch": 2581} {"train_loss": -39.873653411865234, "global_step": 312404, "epoch": 2581} {"train_loss": -39.4670295715332, "global_step": 312405, "epoch": 2581} {"train_loss": -39.163387298583984, "global_step": 312406, "epoch": 2581} {"train_loss": -39.469417572021484, "global_step": 312407, "epoch": 2581} {"train_loss": -38.91132354736328, "global_step": 312408, "epoch": 2581} {"train_loss": -39.93037796020508, "global_step": 312409, "epoch": 2581} {"train_loss": -39.62263870239258, "global_step": 312410, "epoch": 2581} {"train_loss": -40.14561462402344, "global_step": 312411, "epoch": 2581} {"train_loss": -40.39844512939453, "global_step": 312412, "epoch": 2581} {"train_loss": -39.40427780151367, "global_step": 312413, "epoch": 2581} {"train_loss": -39.55447006225586, "global_step": 312414, "epoch": 2581} {"train_loss": -39.517906188964844, "global_step": 312415, "epoch": 2581} {"train_loss": -40.384883880615234, "global_step": 312416, "epoch": 2581} {"train_loss": -40.302001953125, "global_step": 312417, "epoch": 2581} {"train_loss": -41.2474365234375, "global_step": 312418, "epoch": 2581} {"train_loss": -39.92072677612305, "global_step": 312419, "epoch": 2581} {"train_loss": -39.20389175415039, "global_step": 312420, "epoch": 2581} {"train_loss": -38.68432626645427, "global_step": 312421, "epoch": 2581, "val_loss": 2794863.0} {"train_loss": -40.720794677734375, "global_step": 312422, "epoch": 2582} {"train_loss": -40.443389892578125, "global_step": 312423, "epoch": 2582} {"train_loss": -40.536720275878906, "global_step": 312424, "epoch": 2582} {"train_loss": -40.618953704833984, "global_step": 312425, "epoch": 2582} {"train_loss": -40.315528869628906, "global_step": 312426, "epoch": 2582} {"train_loss": -40.66181564331055, "global_step": 312427, "epoch": 2582} {"train_loss": -40.65846633911133, "global_step": 312428, "epoch": 2582} {"train_loss": -41.518280029296875, "global_step": 312429, "epoch": 2582} {"train_loss": -41.19953155517578, "global_step": 312430, "epoch": 2582} {"train_loss": -41.082313537597656, "global_step": 312431, "epoch": 2582} {"train_loss": -39.813568115234375, "global_step": 312432, "epoch": 2582} {"train_loss": -40.93510055541992, "global_step": 312433, "epoch": 2582} {"train_loss": -40.903865814208984, "global_step": 312434, "epoch": 2582} {"train_loss": -40.5316047668457, "global_step": 312435, "epoch": 2582} {"train_loss": -41.74465560913086, "global_step": 312436, "epoch": 2582} {"train_loss": -40.4796028137207, "global_step": 312437, "epoch": 2582} {"train_loss": -40.947505950927734, "global_step": 312438, "epoch": 2582} {"train_loss": -41.441383361816406, "global_step": 312439, "epoch": 2582} {"train_loss": -40.727108001708984, "global_step": 312440, "epoch": 2582} {"train_loss": -41.249000549316406, "global_step": 312441, "epoch": 2582} {"train_loss": -41.15188217163086, "global_step": 312442, "epoch": 2582} {"train_loss": -40.8441276550293, "global_step": 312443, "epoch": 2582} {"train_loss": -41.132930755615234, "global_step": 312444, "epoch": 2582} {"train_loss": -40.80561447143555, "global_step": 312445, "epoch": 2582} {"train_loss": -41.65810775756836, "global_step": 312446, "epoch": 2582} {"train_loss": -40.698036193847656, "global_step": 312447, "epoch": 2582} {"train_loss": -41.257965087890625, "global_step": 312448, "epoch": 2582} {"train_loss": -41.7050895690918, "global_step": 312449, "epoch": 2582} {"train_loss": -41.386146545410156, "global_step": 312450, "epoch": 2582} {"train_loss": -41.65938186645508, "global_step": 312451, "epoch": 2582} {"train_loss": -39.990726470947266, "global_step": 312452, "epoch": 2582} {"train_loss": -41.61531448364258, "global_step": 312453, "epoch": 2582} {"train_loss": -41.214378356933594, "global_step": 312454, "epoch": 2582} {"train_loss": -41.6644287109375, "global_step": 312455, "epoch": 2582} {"train_loss": -42.28185272216797, "global_step": 312456, "epoch": 2582} {"train_loss": -42.189903259277344, "global_step": 312457, "epoch": 2582} {"train_loss": -41.61725997924805, "global_step": 312458, "epoch": 2582} {"train_loss": -42.21582794189453, "global_step": 312459, "epoch": 2582} {"train_loss": -42.55693817138672, "global_step": 312460, "epoch": 2582} {"train_loss": -42.08635330200195, "global_step": 312461, "epoch": 2582} {"train_loss": -41.90836715698242, "global_step": 312462, "epoch": 2582} {"train_loss": -42.068294525146484, "global_step": 312463, "epoch": 2582} {"train_loss": -42.19878005981445, "global_step": 312464, "epoch": 2582} {"train_loss": -42.35538864135742, "global_step": 312465, "epoch": 2582} {"train_loss": -42.101253509521484, "global_step": 312466, "epoch": 2582} {"train_loss": -42.21042251586914, "global_step": 312467, "epoch": 2582} {"train_loss": -41.93491744995117, "global_step": 312468, "epoch": 2582} {"train_loss": -42.24974822998047, "global_step": 312469, "epoch": 2582} {"train_loss": -42.910396575927734, "global_step": 312470, "epoch": 2582} {"train_loss": -41.834102630615234, "global_step": 312471, "epoch": 2582} {"train_loss": -42.271575927734375, "global_step": 312472, "epoch": 2582} {"train_loss": -41.9233512878418, "global_step": 312473, "epoch": 2582} {"train_loss": -42.371009826660156, "global_step": 312474, "epoch": 2582} {"train_loss": -42.04421615600586, "global_step": 312475, "epoch": 2582} {"train_loss": -43.3790168762207, "global_step": 312476, "epoch": 2582} {"train_loss": -41.14333724975586, "global_step": 312477, "epoch": 2582} {"train_loss": -42.76984405517578, "global_step": 312478, "epoch": 2582} {"train_loss": -42.1198844909668, "global_step": 312479, "epoch": 2582} {"train_loss": -42.9107666015625, "global_step": 312480, "epoch": 2582} {"train_loss": -42.7827262878418, "global_step": 312481, "epoch": 2582} {"train_loss": -42.43935012817383, "global_step": 312482, "epoch": 2582} {"train_loss": -42.33710479736328, "global_step": 312483, "epoch": 2582} {"train_loss": -41.47679138183594, "global_step": 312484, "epoch": 2582} {"train_loss": -42.067108154296875, "global_step": 312485, "epoch": 2582} {"train_loss": -42.82374954223633, "global_step": 312486, "epoch": 2582} {"train_loss": -43.26163864135742, "global_step": 312487, "epoch": 2582} {"train_loss": -43.188270568847656, "global_step": 312488, "epoch": 2582} {"train_loss": -42.62225341796875, "global_step": 312489, "epoch": 2582} {"train_loss": -42.166194915771484, "global_step": 312490, "epoch": 2582} {"train_loss": -43.070343017578125, "global_step": 312491, "epoch": 2582} {"train_loss": -43.37466049194336, "global_step": 312492, "epoch": 2582} {"train_loss": -42.696407318115234, "global_step": 312493, "epoch": 2582} {"train_loss": -42.97933578491211, "global_step": 312494, "epoch": 2582} {"train_loss": -43.05978012084961, "global_step": 312495, "epoch": 2582} {"train_loss": -43.23678207397461, "global_step": 312496, "epoch": 2582} {"train_loss": -43.00664138793945, "global_step": 312497, "epoch": 2582} {"train_loss": -43.0804328918457, "global_step": 312498, "epoch": 2582} {"train_loss": -43.022220611572266, "global_step": 312499, "epoch": 2582} {"train_loss": -42.82632064819336, "global_step": 312500, "epoch": 2582} {"train_loss": -42.74406814575195, "global_step": 312501, "epoch": 2582} {"train_loss": -43.206092834472656, "global_step": 312502, "epoch": 2582} {"train_loss": -43.21857452392578, "global_step": 312503, "epoch": 2582} {"train_loss": -43.55326461791992, "global_step": 312504, "epoch": 2582} {"train_loss": -43.04985809326172, "global_step": 312505, "epoch": 2582} {"train_loss": -43.6026725769043, "global_step": 312506, "epoch": 2582} {"train_loss": -42.94356918334961, "global_step": 312507, "epoch": 2582} {"train_loss": -43.43943405151367, "global_step": 312508, "epoch": 2582} {"train_loss": -43.361446380615234, "global_step": 312509, "epoch": 2582} {"train_loss": -43.05697250366211, "global_step": 312510, "epoch": 2582} {"train_loss": -43.884117126464844, "global_step": 312511, "epoch": 2582} {"train_loss": -42.86790466308594, "global_step": 312512, "epoch": 2582} {"train_loss": -43.21137619018555, "global_step": 312513, "epoch": 2582} {"train_loss": -43.495296478271484, "global_step": 312514, "epoch": 2582} {"train_loss": -43.16943359375, "global_step": 312515, "epoch": 2582} {"train_loss": -43.08138656616211, "global_step": 312516, "epoch": 2582} {"train_loss": -43.481624603271484, "global_step": 312517, "epoch": 2582} {"train_loss": -42.87411117553711, "global_step": 312518, "epoch": 2582} {"train_loss": -43.69913864135742, "global_step": 312519, "epoch": 2582} {"train_loss": -42.861873626708984, "global_step": 312520, "epoch": 2582} {"train_loss": -43.66971206665039, "global_step": 312521, "epoch": 2582} {"train_loss": -43.634002685546875, "global_step": 312522, "epoch": 2582} {"train_loss": -43.23514938354492, "global_step": 312523, "epoch": 2582} {"train_loss": -42.720306396484375, "global_step": 312524, "epoch": 2582} {"train_loss": -43.97803497314453, "global_step": 312525, "epoch": 2582} {"train_loss": -43.15568161010742, "global_step": 312526, "epoch": 2582} {"train_loss": -43.67329788208008, "global_step": 312527, "epoch": 2582} {"train_loss": -43.78022003173828, "global_step": 312528, "epoch": 2582} {"train_loss": -44.235721588134766, "global_step": 312529, "epoch": 2582} {"train_loss": -42.85673904418945, "global_step": 312530, "epoch": 2582} {"train_loss": -43.766231536865234, "global_step": 312531, "epoch": 2582} {"train_loss": -43.2747917175293, "global_step": 312532, "epoch": 2582} {"train_loss": -43.34943771362305, "global_step": 312533, "epoch": 2582} {"train_loss": -43.677398681640625, "global_step": 312534, "epoch": 2582} {"train_loss": -43.829524993896484, "global_step": 312535, "epoch": 2582} {"train_loss": -43.11140823364258, "global_step": 312536, "epoch": 2582} {"train_loss": -42.98303985595703, "global_step": 312537, "epoch": 2582} {"train_loss": -43.10432052612305, "global_step": 312538, "epoch": 2582} {"train_loss": -43.34859848022461, "global_step": 312539, "epoch": 2582} {"train_loss": -43.73476791381836, "global_step": 312540, "epoch": 2582} {"train_loss": -42.9708366394043, "global_step": 312541, "epoch": 2582} {"train_loss": -42.34147212130964, "global_step": 312542, "epoch": 2582, "val_loss": 2734986.25} {"train_loss": -43.52678298950195, "global_step": 312543, "epoch": 2583} {"train_loss": -42.32889938354492, "global_step": 312544, "epoch": 2583} {"train_loss": -42.9994010925293, "global_step": 312545, "epoch": 2583} {"train_loss": -43.192474365234375, "global_step": 312546, "epoch": 2583} {"train_loss": -43.32611083984375, "global_step": 312547, "epoch": 2583} {"train_loss": -43.187957763671875, "global_step": 312548, "epoch": 2583} {"train_loss": -42.446693420410156, "global_step": 312549, "epoch": 2583} {"train_loss": -42.65141677856445, "global_step": 312550, "epoch": 2583} {"train_loss": -44.03150177001953, "global_step": 312551, "epoch": 2583} {"train_loss": -43.53144454956055, "global_step": 312552, "epoch": 2583} {"train_loss": -42.714359283447266, "global_step": 312553, "epoch": 2583} {"train_loss": -43.25703430175781, "global_step": 312554, "epoch": 2583} {"train_loss": -43.9522590637207, "global_step": 312555, "epoch": 2583} {"train_loss": -43.8643913269043, "global_step": 312556, "epoch": 2583} {"train_loss": -42.07662582397461, "global_step": 312557, "epoch": 2583} {"train_loss": -43.34609603881836, "global_step": 312558, "epoch": 2583} {"train_loss": -43.76754379272461, "global_step": 312559, "epoch": 2583} {"train_loss": -42.74021530151367, "global_step": 312560, "epoch": 2583} {"train_loss": -43.138587951660156, "global_step": 312561, "epoch": 2583} {"train_loss": -43.342464447021484, "global_step": 312562, "epoch": 2583} {"train_loss": -43.531402587890625, "global_step": 312563, "epoch": 2583} {"train_loss": -43.59933090209961, "global_step": 312564, "epoch": 2583} {"train_loss": -43.31574630737305, "global_step": 312565, "epoch": 2583} {"train_loss": -42.697837829589844, "global_step": 312566, "epoch": 2583} {"train_loss": -40.89567947387695, "global_step": 312567, "epoch": 2583} {"train_loss": -42.67338943481445, "global_step": 312568, "epoch": 2583} {"train_loss": -42.34333419799805, "global_step": 312569, "epoch": 2583} {"train_loss": -41.10951614379883, "global_step": 312570, "epoch": 2583} {"train_loss": -39.74009323120117, "global_step": 312571, "epoch": 2583} {"train_loss": -42.138084411621094, "global_step": 312572, "epoch": 2583} {"train_loss": -40.85493087768555, "global_step": 312573, "epoch": 2583} {"train_loss": -39.17379379272461, "global_step": 312574, "epoch": 2583} {"train_loss": -38.30369186401367, "global_step": 312575, "epoch": 2583} {"train_loss": -41.40058135986328, "global_step": 312576, "epoch": 2583} {"train_loss": -40.58803176879883, "global_step": 312577, "epoch": 2583} {"train_loss": -39.58173751831055, "global_step": 312578, "epoch": 2583} {"train_loss": -35.421844482421875, "global_step": 312579, "epoch": 2583} {"train_loss": -40.580745697021484, "global_step": 312580, "epoch": 2583} {"train_loss": -37.20970916748047, "global_step": 312581, "epoch": 2583} {"train_loss": -27.49199867248535, "global_step": 312582, "epoch": 2583} {"train_loss": -40.71784210205078, "global_step": 312583, "epoch": 2583} {"train_loss": -24.096805572509766, "global_step": 312584, "epoch": 2583} {"train_loss": -40.11247253417969, "global_step": 312585, "epoch": 2583} {"train_loss": -30.227325439453125, "global_step": 312586, "epoch": 2583} {"train_loss": -38.22047805786133, "global_step": 312587, "epoch": 2583} {"train_loss": -35.3811149597168, "global_step": 312588, "epoch": 2583} {"train_loss": -39.147518157958984, "global_step": 312589, "epoch": 2583} {"train_loss": -31.449689865112305, "global_step": 312590, "epoch": 2583} {"train_loss": -39.64951705932617, "global_step": 312591, "epoch": 2583} {"train_loss": -38.711463928222656, "global_step": 312592, "epoch": 2583} {"train_loss": -37.97153854370117, "global_step": 312593, "epoch": 2583} {"train_loss": -37.308074951171875, "global_step": 312594, "epoch": 2583} {"train_loss": -41.001155853271484, "global_step": 312595, "epoch": 2583} {"train_loss": -38.71305465698242, "global_step": 312596, "epoch": 2583} {"train_loss": -40.885589599609375, "global_step": 312597, "epoch": 2583} {"train_loss": -38.941932678222656, "global_step": 312598, "epoch": 2583} {"train_loss": -41.34688949584961, "global_step": 312599, "epoch": 2583} {"train_loss": -40.778968811035156, "global_step": 312600, "epoch": 2583} {"train_loss": -41.107078552246094, "global_step": 312601, "epoch": 2583} {"train_loss": -40.409114837646484, "global_step": 312602, "epoch": 2583} {"train_loss": -40.98181915283203, "global_step": 312603, "epoch": 2583} {"train_loss": -41.63238525390625, "global_step": 312604, "epoch": 2583} {"train_loss": -40.40224838256836, "global_step": 312605, "epoch": 2583} {"train_loss": -41.60101318359375, "global_step": 312606, "epoch": 2583} {"train_loss": -41.03028106689453, "global_step": 312607, "epoch": 2583} {"train_loss": -41.19279098510742, "global_step": 312608, "epoch": 2583} {"train_loss": -41.651432037353516, "global_step": 312609, "epoch": 2583} {"train_loss": -41.36117172241211, "global_step": 312610, "epoch": 2583} {"train_loss": -41.671363830566406, "global_step": 312611, "epoch": 2583} {"train_loss": -41.97396469116211, "global_step": 312612, "epoch": 2583} {"train_loss": -42.205848693847656, "global_step": 312613, "epoch": 2583} {"train_loss": -41.53463363647461, "global_step": 312614, "epoch": 2583} {"train_loss": -41.36941146850586, "global_step": 312615, "epoch": 2583} {"train_loss": -42.46394729614258, "global_step": 312616, "epoch": 2583} {"train_loss": -42.169586181640625, "global_step": 312617, "epoch": 2583} {"train_loss": -42.410945892333984, "global_step": 312618, "epoch": 2583} {"train_loss": -42.369869232177734, "global_step": 312619, "epoch": 2583} {"train_loss": -42.113868713378906, "global_step": 312620, "epoch": 2583} {"train_loss": -42.35980224609375, "global_step": 312621, "epoch": 2583} {"train_loss": -42.46173858642578, "global_step": 312622, "epoch": 2583} {"train_loss": -41.92689895629883, "global_step": 312623, "epoch": 2583} {"train_loss": -42.5290641784668, "global_step": 312624, "epoch": 2583} {"train_loss": -43.010223388671875, "global_step": 312625, "epoch": 2583} {"train_loss": -42.34161376953125, "global_step": 312626, "epoch": 2583} {"train_loss": -42.52090835571289, "global_step": 312627, "epoch": 2583} {"train_loss": -42.190338134765625, "global_step": 312628, "epoch": 2583} {"train_loss": -42.300567626953125, "global_step": 312629, "epoch": 2583} {"train_loss": -42.959041595458984, "global_step": 312630, "epoch": 2583} {"train_loss": -43.1856689453125, "global_step": 312631, "epoch": 2583} {"train_loss": -42.510066986083984, "global_step": 312632, "epoch": 2583} {"train_loss": -43.3548583984375, "global_step": 312633, "epoch": 2583} {"train_loss": -43.03467559814453, "global_step": 312634, "epoch": 2583} {"train_loss": -42.8200798034668, "global_step": 312635, "epoch": 2583} {"train_loss": -42.98501205444336, "global_step": 312636, "epoch": 2583} {"train_loss": -43.3729248046875, "global_step": 312637, "epoch": 2583} {"train_loss": -43.32073974609375, "global_step": 312638, "epoch": 2583} {"train_loss": -43.359249114990234, "global_step": 312639, "epoch": 2583} {"train_loss": -42.61381912231445, "global_step": 312640, "epoch": 2583} {"train_loss": -43.02947998046875, "global_step": 312641, "epoch": 2583} {"train_loss": -43.548805236816406, "global_step": 312642, "epoch": 2583} {"train_loss": -43.1612663269043, "global_step": 312643, "epoch": 2583} {"train_loss": -43.4056282043457, "global_step": 312644, "epoch": 2583} {"train_loss": -43.305885314941406, "global_step": 312645, "epoch": 2583} {"train_loss": -43.81825256347656, "global_step": 312646, "epoch": 2583} {"train_loss": -43.6759147644043, "global_step": 312647, "epoch": 2583} {"train_loss": -44.01186752319336, "global_step": 312648, "epoch": 2583} {"train_loss": -43.64868927001953, "global_step": 312649, "epoch": 2583} {"train_loss": -43.35075378417969, "global_step": 312650, "epoch": 2583} {"train_loss": -43.983009338378906, "global_step": 312651, "epoch": 2583} {"train_loss": -43.04010772705078, "global_step": 312652, "epoch": 2583} {"train_loss": -44.09991455078125, "global_step": 312653, "epoch": 2583} {"train_loss": -43.79537582397461, "global_step": 312654, "epoch": 2583} {"train_loss": -43.84955596923828, "global_step": 312655, "epoch": 2583} {"train_loss": -43.51237869262695, "global_step": 312656, "epoch": 2583} {"train_loss": -43.56704330444336, "global_step": 312657, "epoch": 2583} {"train_loss": -43.21148681640625, "global_step": 312658, "epoch": 2583} {"train_loss": -43.61140823364258, "global_step": 312659, "epoch": 2583} {"train_loss": -44.02138137817383, "global_step": 312660, "epoch": 2583} {"train_loss": -43.6096076965332, "global_step": 312661, "epoch": 2583} {"train_loss": -43.95729064941406, "global_step": 312662, "epoch": 2583} {"train_loss": -41.57044737004051, "global_step": 312663, "epoch": 2583, "val_loss": 2819128.0} {"train_loss": -43.924007415771484, "global_step": 312664, "epoch": 2584} {"train_loss": -44.180870056152344, "global_step": 312665, "epoch": 2584} {"train_loss": -44.57535171508789, "global_step": 312666, "epoch": 2584} {"train_loss": -43.6257209777832, "global_step": 312667, "epoch": 2584} {"train_loss": -44.531349182128906, "global_step": 312668, "epoch": 2584} {"train_loss": -43.78062057495117, "global_step": 312669, "epoch": 2584} {"train_loss": -43.103546142578125, "global_step": 312670, "epoch": 2584} {"train_loss": -44.4532356262207, "global_step": 312671, "epoch": 2584} {"train_loss": -44.56409454345703, "global_step": 312672, "epoch": 2584} {"train_loss": -44.24202346801758, "global_step": 312673, "epoch": 2584} {"train_loss": -44.00271987915039, "global_step": 312674, "epoch": 2584} {"train_loss": -43.7548828125, "global_step": 312675, "epoch": 2584} {"train_loss": -44.49471664428711, "global_step": 312676, "epoch": 2584} {"train_loss": -44.14066696166992, "global_step": 312677, "epoch": 2584} {"train_loss": -43.910614013671875, "global_step": 312678, "epoch": 2584} {"train_loss": -44.331111907958984, "global_step": 312679, "epoch": 2584} {"train_loss": -44.01231002807617, "global_step": 312680, "epoch": 2584} {"train_loss": -44.48528289794922, "global_step": 312681, "epoch": 2584} {"train_loss": -44.726016998291016, "global_step": 312682, "epoch": 2584} {"train_loss": -43.77444076538086, "global_step": 312683, "epoch": 2584} {"train_loss": -43.9768180847168, "global_step": 312684, "epoch": 2584} {"train_loss": -44.40037536621094, "global_step": 312685, "epoch": 2584} {"train_loss": -44.47209930419922, "global_step": 312686, "epoch": 2584} {"train_loss": -44.87644577026367, "global_step": 312687, "epoch": 2584} {"train_loss": -44.96335220336914, "global_step": 312688, "epoch": 2584} {"train_loss": -44.37797164916992, "global_step": 312689, "epoch": 2584} {"train_loss": -44.147457122802734, "global_step": 312690, "epoch": 2584} {"train_loss": -44.4886589050293, "global_step": 312691, "epoch": 2584} {"train_loss": -43.6325798034668, "global_step": 312692, "epoch": 2584} {"train_loss": -44.12060546875, "global_step": 312693, "epoch": 2584} {"train_loss": -44.42015075683594, "global_step": 312694, "epoch": 2584} {"train_loss": -43.75374221801758, "global_step": 312695, "epoch": 2584} {"train_loss": -42.941280364990234, "global_step": 312696, "epoch": 2584} {"train_loss": -42.02424621582031, "global_step": 312697, "epoch": 2584} {"train_loss": -39.29104232788086, "global_step": 312698, "epoch": 2584} {"train_loss": -34.05805206298828, "global_step": 312699, "epoch": 2584} {"train_loss": -32.269386291503906, "global_step": 312700, "epoch": 2584} {"train_loss": -38.435150146484375, "global_step": 312701, "epoch": 2584} {"train_loss": -42.39768981933594, "global_step": 312702, "epoch": 2584} {"train_loss": -41.48232650756836, "global_step": 312703, "epoch": 2584} {"train_loss": -41.62642288208008, "global_step": 312704, "epoch": 2584} {"train_loss": -41.87099075317383, "global_step": 312705, "epoch": 2584} {"train_loss": -41.7210807800293, "global_step": 312706, "epoch": 2584} {"train_loss": -42.6888427734375, "global_step": 312707, "epoch": 2584} {"train_loss": -42.44538116455078, "global_step": 312708, "epoch": 2584} {"train_loss": -42.647491455078125, "global_step": 312709, "epoch": 2584} {"train_loss": -42.28953170776367, "global_step": 312710, "epoch": 2584} {"train_loss": -42.62263870239258, "global_step": 312711, "epoch": 2584} {"train_loss": -42.161617279052734, "global_step": 312712, "epoch": 2584} {"train_loss": -42.80860900878906, "global_step": 312713, "epoch": 2584} {"train_loss": -41.47454833984375, "global_step": 312714, "epoch": 2584} {"train_loss": -42.097625732421875, "global_step": 312715, "epoch": 2584} {"train_loss": -43.023834228515625, "global_step": 312716, "epoch": 2584} {"train_loss": -43.482322692871094, "global_step": 312717, "epoch": 2584} {"train_loss": -43.09310531616211, "global_step": 312718, "epoch": 2584} {"train_loss": -43.576690673828125, "global_step": 312719, "epoch": 2584} {"train_loss": -43.14058303833008, "global_step": 312720, "epoch": 2584} {"train_loss": -42.71913146972656, "global_step": 312721, "epoch": 2584} {"train_loss": -43.68335723876953, "global_step": 312722, "epoch": 2584} {"train_loss": -42.16622543334961, "global_step": 312723, "epoch": 2584} {"train_loss": -43.00240707397461, "global_step": 312724, "epoch": 2584} {"train_loss": -42.972259521484375, "global_step": 312725, "epoch": 2584} {"train_loss": -42.05128860473633, "global_step": 312726, "epoch": 2584} {"train_loss": -42.83125686645508, "global_step": 312727, "epoch": 2584} {"train_loss": -42.99786376953125, "global_step": 312728, "epoch": 2584} {"train_loss": -43.380126953125, "global_step": 312729, "epoch": 2584} {"train_loss": -42.74177169799805, "global_step": 312730, "epoch": 2584} {"train_loss": -42.8471794128418, "global_step": 312731, "epoch": 2584} {"train_loss": -42.51252365112305, "global_step": 312732, "epoch": 2584} {"train_loss": -43.5816535949707, "global_step": 312733, "epoch": 2584} {"train_loss": -43.40908432006836, "global_step": 312734, "epoch": 2584} {"train_loss": -42.495338439941406, "global_step": 312735, "epoch": 2584} {"train_loss": -43.56897735595703, "global_step": 312736, "epoch": 2584} {"train_loss": -42.51328659057617, "global_step": 312737, "epoch": 2584} {"train_loss": -40.919681549072266, "global_step": 312738, "epoch": 2584} {"train_loss": -41.034400939941406, "global_step": 312739, "epoch": 2584} {"train_loss": -41.87287521362305, "global_step": 312740, "epoch": 2584} {"train_loss": -43.74811553955078, "global_step": 312741, "epoch": 2584} {"train_loss": -44.06824493408203, "global_step": 312742, "epoch": 2584} {"train_loss": -43.96061325073242, "global_step": 312743, "epoch": 2584} {"train_loss": -43.8604850769043, "global_step": 312744, "epoch": 2584} {"train_loss": -44.04865646362305, "global_step": 312745, "epoch": 2584} {"train_loss": -43.20271682739258, "global_step": 312746, "epoch": 2584} {"train_loss": -44.29962921142578, "global_step": 312747, "epoch": 2584} {"train_loss": -43.601844787597656, "global_step": 312748, "epoch": 2584} {"train_loss": -43.822723388671875, "global_step": 312749, "epoch": 2584} {"train_loss": -43.67435836791992, "global_step": 312750, "epoch": 2584} {"train_loss": -43.78654098510742, "global_step": 312751, "epoch": 2584} {"train_loss": -43.76309585571289, "global_step": 312752, "epoch": 2584} {"train_loss": -43.943572998046875, "global_step": 312753, "epoch": 2584} {"train_loss": -43.40428161621094, "global_step": 312754, "epoch": 2584} {"train_loss": -44.36831283569336, "global_step": 312755, "epoch": 2584} {"train_loss": -43.88677978515625, "global_step": 312756, "epoch": 2584} {"train_loss": -44.01835632324219, "global_step": 312757, "epoch": 2584} {"train_loss": -43.83333206176758, "global_step": 312758, "epoch": 2584} {"train_loss": -42.767547607421875, "global_step": 312759, "epoch": 2584} {"train_loss": -39.250999450683594, "global_step": 312760, "epoch": 2584} {"train_loss": -40.99788284301758, "global_step": 312761, "epoch": 2584} {"train_loss": -43.83529281616211, "global_step": 312762, "epoch": 2584} {"train_loss": -44.3271369934082, "global_step": 312763, "epoch": 2584} {"train_loss": -40.50559616088867, "global_step": 312764, "epoch": 2584} {"train_loss": -29.7943058013916, "global_step": 312765, "epoch": 2584} {"train_loss": -40.417724609375, "global_step": 312766, "epoch": 2584} {"train_loss": -40.545806884765625, "global_step": 312767, "epoch": 2584} {"train_loss": -35.677974700927734, "global_step": 312768, "epoch": 2584} {"train_loss": -33.99412536621094, "global_step": 312769, "epoch": 2584} {"train_loss": -41.299190521240234, "global_step": 312770, "epoch": 2584} {"train_loss": -39.26617431640625, "global_step": 312771, "epoch": 2584} {"train_loss": -29.32175636291504, "global_step": 312772, "epoch": 2584} {"train_loss": -35.39754867553711, "global_step": 312773, "epoch": 2584} {"train_loss": -32.17131042480469, "global_step": 312774, "epoch": 2584} {"train_loss": -39.215057373046875, "global_step": 312775, "epoch": 2584} {"train_loss": -38.269500732421875, "global_step": 312776, "epoch": 2584} {"train_loss": -37.10295486450195, "global_step": 312777, "epoch": 2584} {"train_loss": -35.8725471496582, "global_step": 312778, "epoch": 2584} {"train_loss": -34.93328094482422, "global_step": 312779, "epoch": 2584} {"train_loss": -29.979902267456055, "global_step": 312780, "epoch": 2584} {"train_loss": -33.13398742675781, "global_step": 312781, "epoch": 2584} {"train_loss": -39.02366256713867, "global_step": 312782, "epoch": 2584} {"train_loss": -37.86420822143555, "global_step": 312783, "epoch": 2584} {"train_loss": -41.8398573221254, "global_step": 312784, "epoch": 2584, "val_loss": 2907071.75} {"train_loss": -39.88393020629883, "global_step": 312785, "epoch": 2585} {"train_loss": -37.34210205078125, "global_step": 312786, "epoch": 2585} {"train_loss": -25.8489933013916, "global_step": 312787, "epoch": 2585} {"train_loss": -32.835357666015625, "global_step": 312788, "epoch": 2585} {"train_loss": -33.15285110473633, "global_step": 312789, "epoch": 2585} {"train_loss": -37.94630813598633, "global_step": 312790, "epoch": 2585} {"train_loss": -39.784114837646484, "global_step": 312791, "epoch": 2585} {"train_loss": -34.58852005004883, "global_step": 312792, "epoch": 2585} {"train_loss": -39.99872589111328, "global_step": 312793, "epoch": 2585} {"train_loss": -36.2479248046875, "global_step": 312794, "epoch": 2585} {"train_loss": -38.166934967041016, "global_step": 312795, "epoch": 2585} {"train_loss": -37.80889892578125, "global_step": 312796, "epoch": 2585} {"train_loss": -39.32072067260742, "global_step": 312797, "epoch": 2585} {"train_loss": -40.1330451965332, "global_step": 312798, "epoch": 2585} {"train_loss": -39.358238220214844, "global_step": 312799, "epoch": 2585} {"train_loss": -37.97321319580078, "global_step": 312800, "epoch": 2585} {"train_loss": -38.99927520751953, "global_step": 312801, "epoch": 2585} {"train_loss": -39.19296646118164, "global_step": 312802, "epoch": 2585} {"train_loss": -37.11492919921875, "global_step": 312803, "epoch": 2585} {"train_loss": -38.61249542236328, "global_step": 312804, "epoch": 2585} {"train_loss": -38.2760009765625, "global_step": 312805, "epoch": 2585} {"train_loss": -36.58844757080078, "global_step": 312806, "epoch": 2585} {"train_loss": -38.77783966064453, "global_step": 312807, "epoch": 2585} {"train_loss": -39.61045455932617, "global_step": 312808, "epoch": 2585} {"train_loss": -40.2086181640625, "global_step": 312809, "epoch": 2585} {"train_loss": -39.10429000854492, "global_step": 312810, "epoch": 2585} {"train_loss": -40.422576904296875, "global_step": 312811, "epoch": 2585} {"train_loss": -40.20695877075195, "global_step": 312812, "epoch": 2585} {"train_loss": -40.694522857666016, "global_step": 312813, "epoch": 2585} {"train_loss": -40.64262390136719, "global_step": 312814, "epoch": 2585} {"train_loss": -40.56770706176758, "global_step": 312815, "epoch": 2585} {"train_loss": -40.969268798828125, "global_step": 312816, "epoch": 2585} {"train_loss": -41.40520095825195, "global_step": 312817, "epoch": 2585} {"train_loss": -38.9654426574707, "global_step": 312818, "epoch": 2585} {"train_loss": -40.83353042602539, "global_step": 312819, "epoch": 2585} {"train_loss": -40.910377502441406, "global_step": 312820, "epoch": 2585} {"train_loss": -41.02099609375, "global_step": 312821, "epoch": 2585} {"train_loss": -40.29936218261719, "global_step": 312822, "epoch": 2585} {"train_loss": -41.49748611450195, "global_step": 312823, "epoch": 2585} {"train_loss": -40.34632110595703, "global_step": 312824, "epoch": 2585} {"train_loss": -41.46598434448242, "global_step": 312825, "epoch": 2585} {"train_loss": -40.84503173828125, "global_step": 312826, "epoch": 2585} {"train_loss": -40.936744689941406, "global_step": 312827, "epoch": 2585} {"train_loss": -40.899024963378906, "global_step": 312828, "epoch": 2585} {"train_loss": -41.90052032470703, "global_step": 312829, "epoch": 2585} {"train_loss": -41.85398864746094, "global_step": 312830, "epoch": 2585} {"train_loss": -41.646568298339844, "global_step": 312831, "epoch": 2585} {"train_loss": -41.601375579833984, "global_step": 312832, "epoch": 2585} {"train_loss": -41.865692138671875, "global_step": 312833, "epoch": 2585} {"train_loss": -41.21859359741211, "global_step": 312834, "epoch": 2585} {"train_loss": -41.41669464111328, "global_step": 312835, "epoch": 2585} {"train_loss": -41.79244613647461, "global_step": 312836, "epoch": 2585} {"train_loss": -42.6253547668457, "global_step": 312837, "epoch": 2585} {"train_loss": -42.00852584838867, "global_step": 312838, "epoch": 2585} {"train_loss": -41.683929443359375, "global_step": 312839, "epoch": 2585} {"train_loss": -41.960750579833984, "global_step": 312840, "epoch": 2585} {"train_loss": -42.18131637573242, "global_step": 312841, "epoch": 2585} {"train_loss": -41.50851058959961, "global_step": 312842, "epoch": 2585} {"train_loss": -42.62550354003906, "global_step": 312843, "epoch": 2585} {"train_loss": -42.550148010253906, "global_step": 312844, "epoch": 2585} {"train_loss": -41.99709701538086, "global_step": 312845, "epoch": 2585} {"train_loss": -42.401275634765625, "global_step": 312846, "epoch": 2585} {"train_loss": -42.617210388183594, "global_step": 312847, "epoch": 2585} {"train_loss": -40.90580368041992, "global_step": 312848, "epoch": 2585} {"train_loss": -41.601783752441406, "global_step": 312849, "epoch": 2585} {"train_loss": -42.330196380615234, "global_step": 312850, "epoch": 2585} {"train_loss": -42.52397537231445, "global_step": 312851, "epoch": 2585} {"train_loss": -42.34624099731445, "global_step": 312852, "epoch": 2585} {"train_loss": -42.902530670166016, "global_step": 312853, "epoch": 2585} {"train_loss": -42.45016098022461, "global_step": 312854, "epoch": 2585} {"train_loss": -42.42747116088867, "global_step": 312855, "epoch": 2585} {"train_loss": -42.790016174316406, "global_step": 312856, "epoch": 2585} {"train_loss": -42.2971076965332, "global_step": 312857, "epoch": 2585} {"train_loss": -43.01597213745117, "global_step": 312858, "epoch": 2585} {"train_loss": -42.434547424316406, "global_step": 312859, "epoch": 2585} {"train_loss": -43.247596740722656, "global_step": 312860, "epoch": 2585} {"train_loss": -42.16157150268555, "global_step": 312861, "epoch": 2585} {"train_loss": -42.43490219116211, "global_step": 312862, "epoch": 2585} {"train_loss": -42.754764556884766, "global_step": 312863, "epoch": 2585} {"train_loss": -41.75853729248047, "global_step": 312864, "epoch": 2585} {"train_loss": -42.64662170410156, "global_step": 312865, "epoch": 2585} {"train_loss": -42.24684143066406, "global_step": 312866, "epoch": 2585} {"train_loss": -42.346282958984375, "global_step": 312867, "epoch": 2585} {"train_loss": -42.0654411315918, "global_step": 312868, "epoch": 2585} {"train_loss": -42.868534088134766, "global_step": 312869, "epoch": 2585} {"train_loss": -42.311702728271484, "global_step": 312870, "epoch": 2585} {"train_loss": -42.970947265625, "global_step": 312871, "epoch": 2585} {"train_loss": -42.56048583984375, "global_step": 312872, "epoch": 2585} {"train_loss": -42.75016403198242, "global_step": 312873, "epoch": 2585} {"train_loss": -43.35810470581055, "global_step": 312874, "epoch": 2585} {"train_loss": -42.78334426879883, "global_step": 312875, "epoch": 2585} {"train_loss": -43.48768615722656, "global_step": 312876, "epoch": 2585} {"train_loss": -43.23750686645508, "global_step": 312877, "epoch": 2585} {"train_loss": -43.50245666503906, "global_step": 312878, "epoch": 2585} {"train_loss": -43.37940216064453, "global_step": 312879, "epoch": 2585} {"train_loss": -42.86758041381836, "global_step": 312880, "epoch": 2585} {"train_loss": -43.245079040527344, "global_step": 312881, "epoch": 2585} {"train_loss": -43.46760940551758, "global_step": 312882, "epoch": 2585} {"train_loss": -43.40031051635742, "global_step": 312883, "epoch": 2585} {"train_loss": -42.62357711791992, "global_step": 312884, "epoch": 2585} {"train_loss": -43.46611785888672, "global_step": 312885, "epoch": 2585} {"train_loss": -43.5474967956543, "global_step": 312886, "epoch": 2585} {"train_loss": -43.346988677978516, "global_step": 312887, "epoch": 2585} {"train_loss": -43.072750091552734, "global_step": 312888, "epoch": 2585} {"train_loss": -43.37842559814453, "global_step": 312889, "epoch": 2585} {"train_loss": -43.23136520385742, "global_step": 312890, "epoch": 2585} {"train_loss": -43.65288543701172, "global_step": 312891, "epoch": 2585} {"train_loss": -43.6484260559082, "global_step": 312892, "epoch": 2585} {"train_loss": -43.65987777709961, "global_step": 312893, "epoch": 2585} {"train_loss": -43.752296447753906, "global_step": 312894, "epoch": 2585} {"train_loss": -42.83271408081055, "global_step": 312895, "epoch": 2585} {"train_loss": -42.867679595947266, "global_step": 312896, "epoch": 2585} {"train_loss": -41.68135452270508, "global_step": 312897, "epoch": 2585} {"train_loss": -42.25746536254883, "global_step": 312898, "epoch": 2585} {"train_loss": -43.68270492553711, "global_step": 312899, "epoch": 2585} {"train_loss": -43.537445068359375, "global_step": 312900, "epoch": 2585} {"train_loss": -43.82548141479492, "global_step": 312901, "epoch": 2585} {"train_loss": -43.2746696472168, "global_step": 312902, "epoch": 2585} {"train_loss": -43.61399841308594, "global_step": 312903, "epoch": 2585} {"train_loss": -43.94038391113281, "global_step": 312904, "epoch": 2585} {"train_loss": -41.284871424525235, "global_step": 312905, "epoch": 2585, "val_loss": 2743122.0} {"train_loss": -43.52415084838867, "global_step": 312906, "epoch": 2586} {"train_loss": -43.5842399597168, "global_step": 312907, "epoch": 2586} {"train_loss": -42.92049789428711, "global_step": 312908, "epoch": 2586} {"train_loss": -43.727294921875, "global_step": 312909, "epoch": 2586} {"train_loss": -42.85329055786133, "global_step": 312910, "epoch": 2586} {"train_loss": -43.81202697753906, "global_step": 312911, "epoch": 2586} {"train_loss": -43.31489944458008, "global_step": 312912, "epoch": 2586} {"train_loss": -42.68006134033203, "global_step": 312913, "epoch": 2586} {"train_loss": -43.285945892333984, "global_step": 312914, "epoch": 2586} {"train_loss": -43.360225677490234, "global_step": 312915, "epoch": 2586} {"train_loss": -44.086708068847656, "global_step": 312916, "epoch": 2586} {"train_loss": -43.37813949584961, "global_step": 312917, "epoch": 2586} {"train_loss": -43.722633361816406, "global_step": 312918, "epoch": 2586} {"train_loss": -43.62665557861328, "global_step": 312919, "epoch": 2586} {"train_loss": -43.282623291015625, "global_step": 312920, "epoch": 2586} {"train_loss": -42.95754623413086, "global_step": 312921, "epoch": 2586} {"train_loss": -42.97096633911133, "global_step": 312922, "epoch": 2586} {"train_loss": -43.08057403564453, "global_step": 312923, "epoch": 2586} {"train_loss": -42.65842819213867, "global_step": 312924, "epoch": 2586} {"train_loss": -40.20604705810547, "global_step": 312925, "epoch": 2586} {"train_loss": -42.061092376708984, "global_step": 312926, "epoch": 2586} {"train_loss": -43.65093994140625, "global_step": 312927, "epoch": 2586} {"train_loss": -41.272071838378906, "global_step": 312928, "epoch": 2586} {"train_loss": -40.98320007324219, "global_step": 312929, "epoch": 2586} {"train_loss": -43.12260055541992, "global_step": 312930, "epoch": 2586} {"train_loss": -43.52083206176758, "global_step": 312931, "epoch": 2586} {"train_loss": -42.34008026123047, "global_step": 312932, "epoch": 2586} {"train_loss": -42.20355987548828, "global_step": 312933, "epoch": 2586} {"train_loss": -42.214149475097656, "global_step": 312934, "epoch": 2586} {"train_loss": -43.7123908996582, "global_step": 312935, "epoch": 2586} {"train_loss": -43.468292236328125, "global_step": 312936, "epoch": 2586} {"train_loss": -41.619476318359375, "global_step": 312937, "epoch": 2586} {"train_loss": -37.41676712036133, "global_step": 312938, "epoch": 2586} {"train_loss": -41.43867111206055, "global_step": 312939, "epoch": 2586} {"train_loss": -42.731178283691406, "global_step": 312940, "epoch": 2586} {"train_loss": -38.927364349365234, "global_step": 312941, "epoch": 2586} {"train_loss": -38.73456954956055, "global_step": 312942, "epoch": 2586} {"train_loss": -42.529876708984375, "global_step": 312943, "epoch": 2586} {"train_loss": -42.2557487487793, "global_step": 312944, "epoch": 2586} {"train_loss": -42.44547653198242, "global_step": 312945, "epoch": 2586} {"train_loss": -41.9276123046875, "global_step": 312946, "epoch": 2586} {"train_loss": -42.01540756225586, "global_step": 312947, "epoch": 2586} {"train_loss": -41.34619140625, "global_step": 312948, "epoch": 2586} {"train_loss": -42.169342041015625, "global_step": 312949, "epoch": 2586} {"train_loss": -41.615821838378906, "global_step": 312950, "epoch": 2586} {"train_loss": -41.053245544433594, "global_step": 312951, "epoch": 2586} {"train_loss": -42.815711975097656, "global_step": 312952, "epoch": 2586} {"train_loss": -42.475196838378906, "global_step": 312953, "epoch": 2586} {"train_loss": -42.277950286865234, "global_step": 312954, "epoch": 2586} {"train_loss": -42.26422882080078, "global_step": 312955, "epoch": 2586} {"train_loss": -40.10691833496094, "global_step": 312956, "epoch": 2586} {"train_loss": -43.364479064941406, "global_step": 312957, "epoch": 2586} {"train_loss": -42.152099609375, "global_step": 312958, "epoch": 2586} {"train_loss": -41.51353454589844, "global_step": 312959, "epoch": 2586} {"train_loss": -42.72282409667969, "global_step": 312960, "epoch": 2586} {"train_loss": -42.57536697387695, "global_step": 312961, "epoch": 2586} {"train_loss": -41.830074310302734, "global_step": 312962, "epoch": 2586} {"train_loss": -41.2961311340332, "global_step": 312963, "epoch": 2586} {"train_loss": -42.97792434692383, "global_step": 312964, "epoch": 2586} {"train_loss": -41.81047058105469, "global_step": 312965, "epoch": 2586} {"train_loss": -41.7538948059082, "global_step": 312966, "epoch": 2586} {"train_loss": -43.548728942871094, "global_step": 312967, "epoch": 2586} {"train_loss": -42.645755767822266, "global_step": 312968, "epoch": 2586} {"train_loss": -43.511474609375, "global_step": 312969, "epoch": 2586} {"train_loss": -42.15819549560547, "global_step": 312970, "epoch": 2586} {"train_loss": -43.239261627197266, "global_step": 312971, "epoch": 2586} {"train_loss": -43.18036651611328, "global_step": 312972, "epoch": 2586} {"train_loss": -43.0372314453125, "global_step": 312973, "epoch": 2586} {"train_loss": -43.31627655029297, "global_step": 312974, "epoch": 2586} {"train_loss": -43.08271408081055, "global_step": 312975, "epoch": 2586} {"train_loss": -43.63505172729492, "global_step": 312976, "epoch": 2586} {"train_loss": -42.98283004760742, "global_step": 312977, "epoch": 2586} {"train_loss": -43.75788497924805, "global_step": 312978, "epoch": 2586} {"train_loss": -43.41749954223633, "global_step": 312979, "epoch": 2586} {"train_loss": -43.15825271606445, "global_step": 312980, "epoch": 2586} {"train_loss": -42.89577865600586, "global_step": 312981, "epoch": 2586} {"train_loss": -43.441925048828125, "global_step": 312982, "epoch": 2586} {"train_loss": -43.83881759643555, "global_step": 312983, "epoch": 2586} {"train_loss": -43.90597152709961, "global_step": 312984, "epoch": 2586} {"train_loss": -41.91843032836914, "global_step": 312985, "epoch": 2586} {"train_loss": -43.28392791748047, "global_step": 312986, "epoch": 2586} {"train_loss": -43.80581283569336, "global_step": 312987, "epoch": 2586} {"train_loss": -43.35160446166992, "global_step": 312988, "epoch": 2586} {"train_loss": -43.568973541259766, "global_step": 312989, "epoch": 2586} {"train_loss": -43.80530548095703, "global_step": 312990, "epoch": 2586} {"train_loss": -43.59212875366211, "global_step": 312991, "epoch": 2586} {"train_loss": -43.38296127319336, "global_step": 312992, "epoch": 2586} {"train_loss": -42.944698333740234, "global_step": 312993, "epoch": 2586} {"train_loss": -43.08356857299805, "global_step": 312994, "epoch": 2586} {"train_loss": -43.79612350463867, "global_step": 312995, "epoch": 2586} {"train_loss": -43.603721618652344, "global_step": 312996, "epoch": 2586} {"train_loss": -43.465328216552734, "global_step": 312997, "epoch": 2586} {"train_loss": -43.38195037841797, "global_step": 312998, "epoch": 2586} {"train_loss": -43.675941467285156, "global_step": 312999, "epoch": 2586} {"train_loss": -43.81601333618164, "global_step": 313000, "epoch": 2586} {"train_loss": -43.532466888427734, "global_step": 313001, "epoch": 2586} {"train_loss": -44.03033447265625, "global_step": 313002, "epoch": 2586} {"train_loss": -43.63018798828125, "global_step": 313003, "epoch": 2586} {"train_loss": -43.69466781616211, "global_step": 313004, "epoch": 2586} {"train_loss": -43.678466796875, "global_step": 313005, "epoch": 2586} {"train_loss": -42.7467041015625, "global_step": 313006, "epoch": 2586} {"train_loss": -43.115604400634766, "global_step": 313007, "epoch": 2586} {"train_loss": -43.45500564575195, "global_step": 313008, "epoch": 2586} {"train_loss": -43.430179595947266, "global_step": 313009, "epoch": 2586} {"train_loss": -43.58107376098633, "global_step": 313010, "epoch": 2586} {"train_loss": -44.12417221069336, "global_step": 313011, "epoch": 2586} {"train_loss": -43.63363265991211, "global_step": 313012, "epoch": 2586} {"train_loss": -43.67185592651367, "global_step": 313013, "epoch": 2586} {"train_loss": -43.658016204833984, "global_step": 313014, "epoch": 2586} {"train_loss": -43.49412536621094, "global_step": 313015, "epoch": 2586} {"train_loss": -43.68545150756836, "global_step": 313016, "epoch": 2586} {"train_loss": -40.783477783203125, "global_step": 313017, "epoch": 2586} {"train_loss": -42.6893424987793, "global_step": 313018, "epoch": 2586} {"train_loss": -43.50806427001953, "global_step": 313019, "epoch": 2586} {"train_loss": -42.54197692871094, "global_step": 313020, "epoch": 2586} {"train_loss": -44.09077835083008, "global_step": 313021, "epoch": 2586} {"train_loss": -43.15509796142578, "global_step": 313022, "epoch": 2586} {"train_loss": -43.79206466674805, "global_step": 313023, "epoch": 2586} {"train_loss": -42.83047103881836, "global_step": 313024, "epoch": 2586} {"train_loss": -43.33037185668945, "global_step": 313025, "epoch": 2586} {"train_loss": -42.818420567788365, "global_step": 313026, "epoch": 2586, "val_loss": 2702111.5} {"train_loss": -42.417579650878906, "global_step": 313027, "epoch": 2587} {"train_loss": -39.43197250366211, "global_step": 313028, "epoch": 2587} {"train_loss": -41.35783004760742, "global_step": 313029, "epoch": 2587} {"train_loss": -42.49872970581055, "global_step": 313030, "epoch": 2587} {"train_loss": -43.349571228027344, "global_step": 313031, "epoch": 2587} {"train_loss": -42.741390228271484, "global_step": 313032, "epoch": 2587} {"train_loss": -42.180599212646484, "global_step": 313033, "epoch": 2587} {"train_loss": -40.00788497924805, "global_step": 313034, "epoch": 2587} {"train_loss": -42.05707550048828, "global_step": 313035, "epoch": 2587} {"train_loss": -43.08962631225586, "global_step": 313036, "epoch": 2587} {"train_loss": -42.94391632080078, "global_step": 313037, "epoch": 2587} {"train_loss": -40.85700607299805, "global_step": 313038, "epoch": 2587} {"train_loss": -40.78707504272461, "global_step": 313039, "epoch": 2587} {"train_loss": -41.66604232788086, "global_step": 313040, "epoch": 2587} {"train_loss": -41.444149017333984, "global_step": 313041, "epoch": 2587} {"train_loss": -42.1745719909668, "global_step": 313042, "epoch": 2587} {"train_loss": -41.691280364990234, "global_step": 313043, "epoch": 2587} {"train_loss": -42.26602554321289, "global_step": 313044, "epoch": 2587} {"train_loss": -40.1546630859375, "global_step": 313045, "epoch": 2587} {"train_loss": -42.628387451171875, "global_step": 313046, "epoch": 2587} {"train_loss": -43.19209289550781, "global_step": 313047, "epoch": 2587} {"train_loss": -41.48867416381836, "global_step": 313048, "epoch": 2587} {"train_loss": -41.697654724121094, "global_step": 313049, "epoch": 2587} {"train_loss": -43.21889877319336, "global_step": 313050, "epoch": 2587} {"train_loss": -42.74291229248047, "global_step": 313051, "epoch": 2587} {"train_loss": -42.88352584838867, "global_step": 313052, "epoch": 2587} {"train_loss": -43.1248664855957, "global_step": 313053, "epoch": 2587} {"train_loss": -43.55547332763672, "global_step": 313054, "epoch": 2587} {"train_loss": -43.44960021972656, "global_step": 313055, "epoch": 2587} {"train_loss": -43.1679573059082, "global_step": 313056, "epoch": 2587} {"train_loss": -43.9596061706543, "global_step": 313057, "epoch": 2587} {"train_loss": -43.94675827026367, "global_step": 313058, "epoch": 2587} {"train_loss": -43.49473190307617, "global_step": 313059, "epoch": 2587} {"train_loss": -43.29842758178711, "global_step": 313060, "epoch": 2587} {"train_loss": -41.94016647338867, "global_step": 313061, "epoch": 2587} {"train_loss": -43.083892822265625, "global_step": 313062, "epoch": 2587} {"train_loss": -42.59575271606445, "global_step": 313063, "epoch": 2587} {"train_loss": -43.66292953491211, "global_step": 313064, "epoch": 2587} {"train_loss": -43.76955032348633, "global_step": 313065, "epoch": 2587} {"train_loss": -43.692787170410156, "global_step": 313066, "epoch": 2587} {"train_loss": -43.908687591552734, "global_step": 313067, "epoch": 2587} {"train_loss": -43.475399017333984, "global_step": 313068, "epoch": 2587} {"train_loss": -42.89142608642578, "global_step": 313069, "epoch": 2587} {"train_loss": -43.22935104370117, "global_step": 313070, "epoch": 2587} {"train_loss": -43.12761306762695, "global_step": 313071, "epoch": 2587} {"train_loss": -43.629669189453125, "global_step": 313072, "epoch": 2587} {"train_loss": -43.70573043823242, "global_step": 313073, "epoch": 2587} {"train_loss": -44.128780364990234, "global_step": 313074, "epoch": 2587} {"train_loss": -42.83724594116211, "global_step": 313075, "epoch": 2587} {"train_loss": -43.148231506347656, "global_step": 313076, "epoch": 2587} {"train_loss": -42.3494873046875, "global_step": 313077, "epoch": 2587} {"train_loss": -43.77373123168945, "global_step": 313078, "epoch": 2587} {"train_loss": -42.98236846923828, "global_step": 313079, "epoch": 2587} {"train_loss": -43.93503952026367, "global_step": 313080, "epoch": 2587} {"train_loss": -43.690467834472656, "global_step": 313081, "epoch": 2587} {"train_loss": -41.79227828979492, "global_step": 313082, "epoch": 2587} {"train_loss": -43.91923141479492, "global_step": 313083, "epoch": 2587} {"train_loss": -43.35634231567383, "global_step": 313084, "epoch": 2587} {"train_loss": -44.26603317260742, "global_step": 313085, "epoch": 2587} {"train_loss": -42.33696746826172, "global_step": 313086, "epoch": 2587} {"train_loss": -43.66658401489258, "global_step": 313087, "epoch": 2587} {"train_loss": -42.50630569458008, "global_step": 313088, "epoch": 2587} {"train_loss": -43.66458511352539, "global_step": 313089, "epoch": 2587} {"train_loss": -43.505836486816406, "global_step": 313090, "epoch": 2587} {"train_loss": -43.4567985534668, "global_step": 313091, "epoch": 2587} {"train_loss": -43.306724548339844, "global_step": 313092, "epoch": 2587} {"train_loss": -42.99795913696289, "global_step": 313093, "epoch": 2587} {"train_loss": -42.67881393432617, "global_step": 313094, "epoch": 2587} {"train_loss": -37.9206428527832, "global_step": 313095, "epoch": 2587} {"train_loss": -42.481658935546875, "global_step": 313096, "epoch": 2587} {"train_loss": -39.358673095703125, "global_step": 313097, "epoch": 2587} {"train_loss": -43.46681213378906, "global_step": 313098, "epoch": 2587} {"train_loss": -41.241764068603516, "global_step": 313099, "epoch": 2587} {"train_loss": -41.59269714355469, "global_step": 313100, "epoch": 2587} {"train_loss": -38.062442779541016, "global_step": 313101, "epoch": 2587} {"train_loss": -38.10615539550781, "global_step": 313102, "epoch": 2587} {"train_loss": -40.79421615600586, "global_step": 313103, "epoch": 2587} {"train_loss": -38.32805252075195, "global_step": 313104, "epoch": 2587} {"train_loss": -27.350849151611328, "global_step": 313105, "epoch": 2587} {"train_loss": -38.542903900146484, "global_step": 313106, "epoch": 2587} {"train_loss": -38.1529426574707, "global_step": 313107, "epoch": 2587} {"train_loss": -42.097450256347656, "global_step": 313108, "epoch": 2587} {"train_loss": -40.80308151245117, "global_step": 313109, "epoch": 2587} {"train_loss": -42.54648971557617, "global_step": 313110, "epoch": 2587} {"train_loss": -39.7333984375, "global_step": 313111, "epoch": 2587} {"train_loss": -12.126653671264648, "global_step": 313112, "epoch": 2587} {"train_loss": -38.7936897277832, "global_step": 313113, "epoch": 2587} {"train_loss": -33.7764778137207, "global_step": 313114, "epoch": 2587} {"train_loss": -36.45732498168945, "global_step": 313115, "epoch": 2587} {"train_loss": -40.58428955078125, "global_step": 313116, "epoch": 2587} {"train_loss": -38.375789642333984, "global_step": 313117, "epoch": 2587} {"train_loss": -32.81991195678711, "global_step": 313118, "epoch": 2587} {"train_loss": -32.724117279052734, "global_step": 313119, "epoch": 2587} {"train_loss": -34.8355827331543, "global_step": 313120, "epoch": 2587} {"train_loss": -36.81792068481445, "global_step": 313121, "epoch": 2587} {"train_loss": -35.99831008911133, "global_step": 313122, "epoch": 2587} {"train_loss": -33.23865509033203, "global_step": 313123, "epoch": 2587} {"train_loss": -34.5643424987793, "global_step": 313124, "epoch": 2587} {"train_loss": -34.06311798095703, "global_step": 313125, "epoch": 2587} {"train_loss": -39.44224548339844, "global_step": 313126, "epoch": 2587} {"train_loss": -38.049659729003906, "global_step": 313127, "epoch": 2587} {"train_loss": -38.89039993286133, "global_step": 313128, "epoch": 2587} {"train_loss": -40.05860137939453, "global_step": 313129, "epoch": 2587} {"train_loss": -39.68223190307617, "global_step": 313130, "epoch": 2587} {"train_loss": -38.75996017456055, "global_step": 313131, "epoch": 2587} {"train_loss": -39.31401443481445, "global_step": 313132, "epoch": 2587} {"train_loss": -38.80161666870117, "global_step": 313133, "epoch": 2587} {"train_loss": -39.93918228149414, "global_step": 313134, "epoch": 2587} {"train_loss": -40.6799430847168, "global_step": 313135, "epoch": 2587} {"train_loss": -37.62541198730469, "global_step": 313136, "epoch": 2587} {"train_loss": -40.679317474365234, "global_step": 313137, "epoch": 2587} {"train_loss": -39.81631088256836, "global_step": 313138, "epoch": 2587} {"train_loss": -38.1778678894043, "global_step": 313139, "epoch": 2587} {"train_loss": -39.22273254394531, "global_step": 313140, "epoch": 2587} {"train_loss": -40.17081832885742, "global_step": 313141, "epoch": 2587} {"train_loss": -38.47667694091797, "global_step": 313142, "epoch": 2587} {"train_loss": -40.353668212890625, "global_step": 313143, "epoch": 2587} {"train_loss": -40.79628372192383, "global_step": 313144, "epoch": 2587} {"train_loss": -41.22842025756836, "global_step": 313145, "epoch": 2587} {"train_loss": -41.148651123046875, "global_step": 313146, "epoch": 2587} {"train_loss": -40.72858465210465, "global_step": 313147, "epoch": 2587, "val_loss": 2997083.25} {"train_loss": -41.355323791503906, "global_step": 313148, "epoch": 2588} {"train_loss": -40.64695358276367, "global_step": 313149, "epoch": 2588} {"train_loss": -39.95658493041992, "global_step": 313150, "epoch": 2588} {"train_loss": -38.59292221069336, "global_step": 313151, "epoch": 2588} {"train_loss": -40.3742790222168, "global_step": 313152, "epoch": 2588} {"train_loss": -39.92558670043945, "global_step": 313153, "epoch": 2588} {"train_loss": -40.63142395019531, "global_step": 313154, "epoch": 2588} {"train_loss": -40.599884033203125, "global_step": 313155, "epoch": 2588} {"train_loss": -41.625335693359375, "global_step": 313156, "epoch": 2588} {"train_loss": -41.680419921875, "global_step": 313157, "epoch": 2588} {"train_loss": -40.9500617980957, "global_step": 313158, "epoch": 2588} {"train_loss": -41.01655197143555, "global_step": 313159, "epoch": 2588} {"train_loss": -40.90254592895508, "global_step": 313160, "epoch": 2588} {"train_loss": -41.02309799194336, "global_step": 313161, "epoch": 2588} {"train_loss": -42.07169723510742, "global_step": 313162, "epoch": 2588} {"train_loss": -40.74612045288086, "global_step": 313163, "epoch": 2588} {"train_loss": -41.65446472167969, "global_step": 313164, "epoch": 2588} {"train_loss": -41.64704132080078, "global_step": 313165, "epoch": 2588} {"train_loss": -42.061519622802734, "global_step": 313166, "epoch": 2588} {"train_loss": -40.47292709350586, "global_step": 313167, "epoch": 2588} {"train_loss": -41.675350189208984, "global_step": 313168, "epoch": 2588} {"train_loss": -41.86880111694336, "global_step": 313169, "epoch": 2588} {"train_loss": -41.00484085083008, "global_step": 313170, "epoch": 2588} {"train_loss": -41.8414421081543, "global_step": 313171, "epoch": 2588} {"train_loss": -42.218482971191406, "global_step": 313172, "epoch": 2588} {"train_loss": -41.83972930908203, "global_step": 313173, "epoch": 2588} {"train_loss": -41.60026931762695, "global_step": 313174, "epoch": 2588} {"train_loss": -42.2462043762207, "global_step": 313175, "epoch": 2588} {"train_loss": -42.22990798950195, "global_step": 313176, "epoch": 2588} {"train_loss": -41.69295883178711, "global_step": 313177, "epoch": 2588} {"train_loss": -42.43667221069336, "global_step": 313178, "epoch": 2588} {"train_loss": -42.47819137573242, "global_step": 313179, "epoch": 2588} {"train_loss": -42.39980697631836, "global_step": 313180, "epoch": 2588} {"train_loss": -41.371253967285156, "global_step": 313181, "epoch": 2588} {"train_loss": -41.870025634765625, "global_step": 313182, "epoch": 2588} {"train_loss": -42.40863800048828, "global_step": 313183, "epoch": 2588} {"train_loss": -42.29828643798828, "global_step": 313184, "epoch": 2588} {"train_loss": -42.167476654052734, "global_step": 313185, "epoch": 2588} {"train_loss": -42.97141647338867, "global_step": 313186, "epoch": 2588} {"train_loss": -42.82207107543945, "global_step": 313187, "epoch": 2588} {"train_loss": -42.19012451171875, "global_step": 313188, "epoch": 2588} {"train_loss": -42.571346282958984, "global_step": 313189, "epoch": 2588} {"train_loss": -41.95563888549805, "global_step": 313190, "epoch": 2588} {"train_loss": -42.67692184448242, "global_step": 313191, "epoch": 2588} {"train_loss": -42.600521087646484, "global_step": 313192, "epoch": 2588} {"train_loss": -42.89426803588867, "global_step": 313193, "epoch": 2588} {"train_loss": -42.768218994140625, "global_step": 313194, "epoch": 2588} {"train_loss": -42.89760208129883, "global_step": 313195, "epoch": 2588} {"train_loss": -42.56355667114258, "global_step": 313196, "epoch": 2588} {"train_loss": -42.660430908203125, "global_step": 313197, "epoch": 2588} {"train_loss": -42.9604606628418, "global_step": 313198, "epoch": 2588} {"train_loss": -42.90808868408203, "global_step": 313199, "epoch": 2588} {"train_loss": -42.33175277709961, "global_step": 313200, "epoch": 2588} {"train_loss": -42.93511962890625, "global_step": 313201, "epoch": 2588} {"train_loss": -43.25068283081055, "global_step": 313202, "epoch": 2588} {"train_loss": -42.810611724853516, "global_step": 313203, "epoch": 2588} {"train_loss": -43.092323303222656, "global_step": 313204, "epoch": 2588} {"train_loss": -43.28528594970703, "global_step": 313205, "epoch": 2588} {"train_loss": -42.7853889465332, "global_step": 313206, "epoch": 2588} {"train_loss": -43.595951080322266, "global_step": 313207, "epoch": 2588} {"train_loss": -43.21525192260742, "global_step": 313208, "epoch": 2588} {"train_loss": -43.39699935913086, "global_step": 313209, "epoch": 2588} {"train_loss": -42.863868713378906, "global_step": 313210, "epoch": 2588} {"train_loss": -43.27720260620117, "global_step": 313211, "epoch": 2588} {"train_loss": -43.006622314453125, "global_step": 313212, "epoch": 2588} {"train_loss": -43.67066192626953, "global_step": 313213, "epoch": 2588} {"train_loss": -43.04048538208008, "global_step": 313214, "epoch": 2588} {"train_loss": -43.40764236450195, "global_step": 313215, "epoch": 2588} {"train_loss": -43.25858688354492, "global_step": 313216, "epoch": 2588} {"train_loss": -43.090248107910156, "global_step": 313217, "epoch": 2588} {"train_loss": -43.53036117553711, "global_step": 313218, "epoch": 2588} {"train_loss": -42.89610290527344, "global_step": 313219, "epoch": 2588} {"train_loss": -42.27162551879883, "global_step": 313220, "epoch": 2588} {"train_loss": -43.216766357421875, "global_step": 313221, "epoch": 2588} {"train_loss": -43.0675163269043, "global_step": 313222, "epoch": 2588} {"train_loss": -43.558509826660156, "global_step": 313223, "epoch": 2588} {"train_loss": -43.73666000366211, "global_step": 313224, "epoch": 2588} {"train_loss": -43.51591110229492, "global_step": 313225, "epoch": 2588} {"train_loss": -43.77920913696289, "global_step": 313226, "epoch": 2588} {"train_loss": -43.439369201660156, "global_step": 313227, "epoch": 2588} {"train_loss": -43.743919372558594, "global_step": 313228, "epoch": 2588} {"train_loss": -43.709999084472656, "global_step": 313229, "epoch": 2588} {"train_loss": -43.266876220703125, "global_step": 313230, "epoch": 2588} {"train_loss": -43.41989517211914, "global_step": 313231, "epoch": 2588} {"train_loss": -43.26744842529297, "global_step": 313232, "epoch": 2588} {"train_loss": -43.49927520751953, "global_step": 313233, "epoch": 2588} {"train_loss": -42.86883544921875, "global_step": 313234, "epoch": 2588} {"train_loss": -42.40652084350586, "global_step": 313235, "epoch": 2588} {"train_loss": -43.51827621459961, "global_step": 313236, "epoch": 2588} {"train_loss": -43.328250885009766, "global_step": 313237, "epoch": 2588} {"train_loss": -42.20222091674805, "global_step": 313238, "epoch": 2588} {"train_loss": -42.967491149902344, "global_step": 313239, "epoch": 2588} {"train_loss": -42.58150100708008, "global_step": 313240, "epoch": 2588} {"train_loss": -42.30630111694336, "global_step": 313241, "epoch": 2588} {"train_loss": -42.7842903137207, "global_step": 313242, "epoch": 2588} {"train_loss": -43.69839859008789, "global_step": 313243, "epoch": 2588} {"train_loss": -43.53363800048828, "global_step": 313244, "epoch": 2588} {"train_loss": -42.92891311645508, "global_step": 313245, "epoch": 2588} {"train_loss": -43.24738311767578, "global_step": 313246, "epoch": 2588} {"train_loss": -43.53458023071289, "global_step": 313247, "epoch": 2588} {"train_loss": -42.74711227416992, "global_step": 313248, "epoch": 2588} {"train_loss": -42.477020263671875, "global_step": 313249, "epoch": 2588} {"train_loss": -41.82196807861328, "global_step": 313250, "epoch": 2588} {"train_loss": -41.777687072753906, "global_step": 313251, "epoch": 2588} {"train_loss": -42.621395111083984, "global_step": 313252, "epoch": 2588} {"train_loss": -43.47639846801758, "global_step": 313253, "epoch": 2588} {"train_loss": -41.7571907043457, "global_step": 313254, "epoch": 2588} {"train_loss": -39.02216720581055, "global_step": 313255, "epoch": 2588} {"train_loss": -37.1583251953125, "global_step": 313256, "epoch": 2588} {"train_loss": -42.48989486694336, "global_step": 313257, "epoch": 2588} {"train_loss": -39.831817626953125, "global_step": 313258, "epoch": 2588} {"train_loss": -30.857126235961914, "global_step": 313259, "epoch": 2588} {"train_loss": -27.919601440429688, "global_step": 313260, "epoch": 2588} {"train_loss": -36.85029602050781, "global_step": 313261, "epoch": 2588} {"train_loss": -38.544891357421875, "global_step": 313262, "epoch": 2588} {"train_loss": -22.052967071533203, "global_step": 313263, "epoch": 2588} {"train_loss": -31.801008224487305, "global_step": 313264, "epoch": 2588} {"train_loss": -35.926170349121094, "global_step": 313265, "epoch": 2588} {"train_loss": -29.905059814453125, "global_step": 313266, "epoch": 2588} {"train_loss": -39.68673324584961, "global_step": 313267, "epoch": 2588} {"train_loss": -41.549409346147016, "global_step": 313268, "epoch": 2588, "val_loss": 2691197.5} {"train_loss": -39.974029541015625, "global_step": 313269, "epoch": 2589} {"train_loss": -36.35977554321289, "global_step": 313270, "epoch": 2589} {"train_loss": -39.14297103881836, "global_step": 313271, "epoch": 2589} {"train_loss": -36.11248779296875, "global_step": 313272, "epoch": 2589} {"train_loss": -39.688785552978516, "global_step": 313273, "epoch": 2589} {"train_loss": -38.25504684448242, "global_step": 313274, "epoch": 2589} {"train_loss": -36.63789749145508, "global_step": 313275, "epoch": 2589} {"train_loss": -40.07589340209961, "global_step": 313276, "epoch": 2589} {"train_loss": -37.19536209106445, "global_step": 313277, "epoch": 2589} {"train_loss": -40.510841369628906, "global_step": 313278, "epoch": 2589} {"train_loss": -39.33876037597656, "global_step": 313279, "epoch": 2589} {"train_loss": -39.14549255371094, "global_step": 313280, "epoch": 2589} {"train_loss": -39.69088363647461, "global_step": 313281, "epoch": 2589} {"train_loss": -39.33758544921875, "global_step": 313282, "epoch": 2589} {"train_loss": -39.3358268737793, "global_step": 313283, "epoch": 2589} {"train_loss": -40.332313537597656, "global_step": 313284, "epoch": 2589} {"train_loss": -39.605445861816406, "global_step": 313285, "epoch": 2589} {"train_loss": -41.228111267089844, "global_step": 313286, "epoch": 2589} {"train_loss": -40.2427864074707, "global_step": 313287, "epoch": 2589} {"train_loss": -40.736263275146484, "global_step": 313288, "epoch": 2589} {"train_loss": -41.47691345214844, "global_step": 313289, "epoch": 2589} {"train_loss": -40.83313751220703, "global_step": 313290, "epoch": 2589} {"train_loss": -41.6529426574707, "global_step": 313291, "epoch": 2589} {"train_loss": -41.5288200378418, "global_step": 313292, "epoch": 2589} {"train_loss": -41.06591033935547, "global_step": 313293, "epoch": 2589} {"train_loss": -41.91230392456055, "global_step": 313294, "epoch": 2589} {"train_loss": -41.95219802856445, "global_step": 313295, "epoch": 2589} {"train_loss": -42.19070053100586, "global_step": 313296, "epoch": 2589} {"train_loss": -42.49979782104492, "global_step": 313297, "epoch": 2589} {"train_loss": -41.76244354248047, "global_step": 313298, "epoch": 2589} {"train_loss": -42.17060089111328, "global_step": 313299, "epoch": 2589} {"train_loss": -42.02128601074219, "global_step": 313300, "epoch": 2589} {"train_loss": -41.3549919128418, "global_step": 313301, "epoch": 2589} {"train_loss": -42.44157791137695, "global_step": 313302, "epoch": 2589} {"train_loss": -42.097930908203125, "global_step": 313303, "epoch": 2589} {"train_loss": -42.33573532104492, "global_step": 313304, "epoch": 2589} {"train_loss": -42.47886276245117, "global_step": 313305, "epoch": 2589} {"train_loss": -42.61015319824219, "global_step": 313306, "epoch": 2589} {"train_loss": -42.3237190246582, "global_step": 313307, "epoch": 2589} {"train_loss": -42.819026947021484, "global_step": 313308, "epoch": 2589} {"train_loss": -42.79362487792969, "global_step": 313309, "epoch": 2589} {"train_loss": -42.4797477722168, "global_step": 313310, "epoch": 2589} {"train_loss": -42.301509857177734, "global_step": 313311, "epoch": 2589} {"train_loss": -42.99260330200195, "global_step": 313312, "epoch": 2589} {"train_loss": -42.938133239746094, "global_step": 313313, "epoch": 2589} {"train_loss": -43.098182678222656, "global_step": 313314, "epoch": 2589} {"train_loss": -42.963531494140625, "global_step": 313315, "epoch": 2589} {"train_loss": -43.2453727722168, "global_step": 313316, "epoch": 2589} {"train_loss": -42.9873046875, "global_step": 313317, "epoch": 2589} {"train_loss": -42.74082565307617, "global_step": 313318, "epoch": 2589} {"train_loss": -42.82780456542969, "global_step": 313319, "epoch": 2589} {"train_loss": -43.12692642211914, "global_step": 313320, "epoch": 2589} {"train_loss": -42.9555549621582, "global_step": 313321, "epoch": 2589} {"train_loss": -43.1743278503418, "global_step": 313322, "epoch": 2589} {"train_loss": -43.3984260559082, "global_step": 313323, "epoch": 2589} {"train_loss": -43.09126663208008, "global_step": 313324, "epoch": 2589} {"train_loss": -43.026588439941406, "global_step": 313325, "epoch": 2589} {"train_loss": -43.18867492675781, "global_step": 313326, "epoch": 2589} {"train_loss": -43.1673583984375, "global_step": 313327, "epoch": 2589} {"train_loss": -43.20287322998047, "global_step": 313328, "epoch": 2589} {"train_loss": -43.00307846069336, "global_step": 313329, "epoch": 2589} {"train_loss": -43.47074890136719, "global_step": 313330, "epoch": 2589} {"train_loss": -43.508949279785156, "global_step": 313331, "epoch": 2589} {"train_loss": -42.9670295715332, "global_step": 313332, "epoch": 2589} {"train_loss": -43.49009704589844, "global_step": 313333, "epoch": 2589} {"train_loss": -43.306800842285156, "global_step": 313334, "epoch": 2589} {"train_loss": -42.805912017822266, "global_step": 313335, "epoch": 2589} {"train_loss": -43.43854522705078, "global_step": 313336, "epoch": 2589} {"train_loss": -43.69406509399414, "global_step": 313337, "epoch": 2589} {"train_loss": -43.215003967285156, "global_step": 313338, "epoch": 2589} {"train_loss": -43.52911376953125, "global_step": 313339, "epoch": 2589} {"train_loss": -43.619789123535156, "global_step": 313340, "epoch": 2589} {"train_loss": -43.57719039916992, "global_step": 313341, "epoch": 2589} {"train_loss": -43.706787109375, "global_step": 313342, "epoch": 2589} {"train_loss": -43.678707122802734, "global_step": 313343, "epoch": 2589} {"train_loss": -43.63926315307617, "global_step": 313344, "epoch": 2589} {"train_loss": -43.688350677490234, "global_step": 313345, "epoch": 2589} {"train_loss": -43.28113555908203, "global_step": 313346, "epoch": 2589} {"train_loss": -43.4910888671875, "global_step": 313347, "epoch": 2589} {"train_loss": -43.705814361572266, "global_step": 313348, "epoch": 2589} {"train_loss": -43.69928741455078, "global_step": 313349, "epoch": 2589} {"train_loss": -43.74060821533203, "global_step": 313350, "epoch": 2589} {"train_loss": -43.8128547668457, "global_step": 313351, "epoch": 2589} {"train_loss": -43.27333450317383, "global_step": 313352, "epoch": 2589} {"train_loss": -43.7121696472168, "global_step": 313353, "epoch": 2589} {"train_loss": -43.8816032409668, "global_step": 313354, "epoch": 2589} {"train_loss": -44.0200309753418, "global_step": 313355, "epoch": 2589} {"train_loss": -44.2514762878418, "global_step": 313356, "epoch": 2589} {"train_loss": -43.484676361083984, "global_step": 313357, "epoch": 2589} {"train_loss": -44.083740234375, "global_step": 313358, "epoch": 2589} {"train_loss": -43.617698669433594, "global_step": 313359, "epoch": 2589} {"train_loss": -43.72361373901367, "global_step": 313360, "epoch": 2589} {"train_loss": -43.989994049072266, "global_step": 313361, "epoch": 2589} {"train_loss": -42.23301315307617, "global_step": 313362, "epoch": 2589} {"train_loss": -43.06435012817383, "global_step": 313363, "epoch": 2589} {"train_loss": -43.0374641418457, "global_step": 313364, "epoch": 2589} {"train_loss": -43.36560821533203, "global_step": 313365, "epoch": 2589} {"train_loss": -43.204444885253906, "global_step": 313366, "epoch": 2589} {"train_loss": -43.99251937866211, "global_step": 313367, "epoch": 2589} {"train_loss": -43.35606002807617, "global_step": 313368, "epoch": 2589} {"train_loss": -41.0057258605957, "global_step": 313369, "epoch": 2589} {"train_loss": -43.66947555541992, "global_step": 313370, "epoch": 2589} {"train_loss": -43.36606979370117, "global_step": 313371, "epoch": 2589} {"train_loss": -43.62116622924805, "global_step": 313372, "epoch": 2589} {"train_loss": -43.57688522338867, "global_step": 313373, "epoch": 2589} {"train_loss": -41.98517990112305, "global_step": 313374, "epoch": 2589} {"train_loss": -41.644290924072266, "global_step": 313375, "epoch": 2589} {"train_loss": -41.699275970458984, "global_step": 313376, "epoch": 2589} {"train_loss": -43.4690055847168, "global_step": 313377, "epoch": 2589} {"train_loss": -44.31516647338867, "global_step": 313378, "epoch": 2589} {"train_loss": -42.38402557373047, "global_step": 313379, "epoch": 2589} {"train_loss": -42.07808303833008, "global_step": 313380, "epoch": 2589} {"train_loss": -42.925071716308594, "global_step": 313381, "epoch": 2589} {"train_loss": -43.78718948364258, "global_step": 313382, "epoch": 2589} {"train_loss": -43.196449279785156, "global_step": 313383, "epoch": 2589} {"train_loss": -42.808929443359375, "global_step": 313384, "epoch": 2589} {"train_loss": -42.09661865234375, "global_step": 313385, "epoch": 2589} {"train_loss": -41.936798095703125, "global_step": 313386, "epoch": 2589} {"train_loss": -43.07686996459961, "global_step": 313387, "epoch": 2589} {"train_loss": -44.041656494140625, "global_step": 313388, "epoch": 2589} {"train_loss": -42.32632657516101, "global_step": 313389, "epoch": 2589, "val_loss": 2772718.5} {"train_loss": -41.944217681884766, "global_step": 313390, "epoch": 2590} {"train_loss": -43.356971740722656, "global_step": 313391, "epoch": 2590} {"train_loss": -43.674678802490234, "global_step": 313392, "epoch": 2590} {"train_loss": -42.40424346923828, "global_step": 313393, "epoch": 2590} {"train_loss": -41.80080032348633, "global_step": 313394, "epoch": 2590} {"train_loss": -42.89894104003906, "global_step": 313395, "epoch": 2590} {"train_loss": -43.9280891418457, "global_step": 313396, "epoch": 2590} {"train_loss": -40.80985641479492, "global_step": 313397, "epoch": 2590} {"train_loss": -40.82839584350586, "global_step": 313398, "epoch": 2590} {"train_loss": -42.8878288269043, "global_step": 313399, "epoch": 2590} {"train_loss": -40.78356170654297, "global_step": 313400, "epoch": 2590} {"train_loss": -39.185264587402344, "global_step": 313401, "epoch": 2590} {"train_loss": -41.51474380493164, "global_step": 313402, "epoch": 2590} {"train_loss": -42.625614166259766, "global_step": 313403, "epoch": 2590} {"train_loss": -39.9835319519043, "global_step": 313404, "epoch": 2590} {"train_loss": -40.990413665771484, "global_step": 313405, "epoch": 2590} {"train_loss": -41.462337493896484, "global_step": 313406, "epoch": 2590} {"train_loss": -38.87324142456055, "global_step": 313407, "epoch": 2590} {"train_loss": -40.839107513427734, "global_step": 313408, "epoch": 2590} {"train_loss": -40.620201110839844, "global_step": 313409, "epoch": 2590} {"train_loss": -41.38276290893555, "global_step": 313410, "epoch": 2590} {"train_loss": -42.458351135253906, "global_step": 313411, "epoch": 2590} {"train_loss": -41.12461471557617, "global_step": 313412, "epoch": 2590} {"train_loss": -41.3657112121582, "global_step": 313413, "epoch": 2590} {"train_loss": -42.700660705566406, "global_step": 313414, "epoch": 2590} {"train_loss": -41.34839630126953, "global_step": 313415, "epoch": 2590} {"train_loss": -43.04194259643555, "global_step": 313416, "epoch": 2590} {"train_loss": -41.18916702270508, "global_step": 313417, "epoch": 2590} {"train_loss": -43.06793212890625, "global_step": 313418, "epoch": 2590} {"train_loss": -42.870460510253906, "global_step": 313419, "epoch": 2590} {"train_loss": -41.88678741455078, "global_step": 313420, "epoch": 2590} {"train_loss": -42.93400573730469, "global_step": 313421, "epoch": 2590} {"train_loss": -42.90077590942383, "global_step": 313422, "epoch": 2590} {"train_loss": -42.31758117675781, "global_step": 313423, "epoch": 2590} {"train_loss": -42.875057220458984, "global_step": 313424, "epoch": 2590} {"train_loss": -42.70949935913086, "global_step": 313425, "epoch": 2590} {"train_loss": -42.8890266418457, "global_step": 313426, "epoch": 2590} {"train_loss": -43.393798828125, "global_step": 313427, "epoch": 2590} {"train_loss": -43.287757873535156, "global_step": 313428, "epoch": 2590} {"train_loss": -42.65877914428711, "global_step": 313429, "epoch": 2590} {"train_loss": -43.3408317565918, "global_step": 313430, "epoch": 2590} {"train_loss": -43.36387252807617, "global_step": 313431, "epoch": 2590} {"train_loss": -42.775901794433594, "global_step": 313432, "epoch": 2590} {"train_loss": -42.939632415771484, "global_step": 313433, "epoch": 2590} {"train_loss": -43.049312591552734, "global_step": 313434, "epoch": 2590} {"train_loss": -43.74449157714844, "global_step": 313435, "epoch": 2590} {"train_loss": -42.9377326965332, "global_step": 313436, "epoch": 2590} {"train_loss": -42.50135040283203, "global_step": 313437, "epoch": 2590} {"train_loss": -43.58164596557617, "global_step": 313438, "epoch": 2590} {"train_loss": -43.84487533569336, "global_step": 313439, "epoch": 2590} {"train_loss": -43.7273063659668, "global_step": 313440, "epoch": 2590} {"train_loss": -43.432735443115234, "global_step": 313441, "epoch": 2590} {"train_loss": -43.916534423828125, "global_step": 313442, "epoch": 2590} {"train_loss": -43.0857048034668, "global_step": 313443, "epoch": 2590} {"train_loss": -43.37794876098633, "global_step": 313444, "epoch": 2590} {"train_loss": -43.4845085144043, "global_step": 313445, "epoch": 2590} {"train_loss": -43.4161491394043, "global_step": 313446, "epoch": 2590} {"train_loss": -43.41129684448242, "global_step": 313447, "epoch": 2590} {"train_loss": -42.99298858642578, "global_step": 313448, "epoch": 2590} {"train_loss": -42.62759017944336, "global_step": 313449, "epoch": 2590} {"train_loss": -42.847286224365234, "global_step": 313450, "epoch": 2590} {"train_loss": -42.343292236328125, "global_step": 313451, "epoch": 2590} {"train_loss": -42.60984420776367, "global_step": 313452, "epoch": 2590} {"train_loss": -43.53345489501953, "global_step": 313453, "epoch": 2590} {"train_loss": -43.057518005371094, "global_step": 313454, "epoch": 2590} {"train_loss": -42.835205078125, "global_step": 313455, "epoch": 2590} {"train_loss": -43.14818572998047, "global_step": 313456, "epoch": 2590} {"train_loss": -43.69160842895508, "global_step": 313457, "epoch": 2590} {"train_loss": -43.58659362792969, "global_step": 313458, "epoch": 2590} {"train_loss": -43.32048416137695, "global_step": 313459, "epoch": 2590} {"train_loss": -43.60809326171875, "global_step": 313460, "epoch": 2590} {"train_loss": -43.993995666503906, "global_step": 313461, "epoch": 2590} {"train_loss": -42.99747848510742, "global_step": 313462, "epoch": 2590} {"train_loss": -43.25614929199219, "global_step": 313463, "epoch": 2590} {"train_loss": -43.537349700927734, "global_step": 313464, "epoch": 2590} {"train_loss": -43.807682037353516, "global_step": 313465, "epoch": 2590} {"train_loss": -43.76637649536133, "global_step": 313466, "epoch": 2590} {"train_loss": -43.47777557373047, "global_step": 313467, "epoch": 2590} {"train_loss": -43.539825439453125, "global_step": 313468, "epoch": 2590} {"train_loss": -42.59144592285156, "global_step": 313469, "epoch": 2590} {"train_loss": -42.323974609375, "global_step": 313470, "epoch": 2590} {"train_loss": -43.89044952392578, "global_step": 313471, "epoch": 2590} {"train_loss": -43.16740036010742, "global_step": 313472, "epoch": 2590} {"train_loss": -41.628448486328125, "global_step": 313473, "epoch": 2590} {"train_loss": -41.08163833618164, "global_step": 313474, "epoch": 2590} {"train_loss": -43.443721771240234, "global_step": 313475, "epoch": 2590} {"train_loss": -42.780330657958984, "global_step": 313476, "epoch": 2590} {"train_loss": -41.4948616027832, "global_step": 313477, "epoch": 2590} {"train_loss": -41.7153205871582, "global_step": 313478, "epoch": 2590} {"train_loss": -43.05475616455078, "global_step": 313479, "epoch": 2590} {"train_loss": -43.426300048828125, "global_step": 313480, "epoch": 2590} {"train_loss": -42.95747756958008, "global_step": 313481, "epoch": 2590} {"train_loss": -42.658809661865234, "global_step": 313482, "epoch": 2590} {"train_loss": -43.5526123046875, "global_step": 313483, "epoch": 2590} {"train_loss": -41.4627799987793, "global_step": 313484, "epoch": 2590} {"train_loss": -41.15925216674805, "global_step": 313485, "epoch": 2590} {"train_loss": -40.67545700073242, "global_step": 313486, "epoch": 2590} {"train_loss": -42.11977767944336, "global_step": 313487, "epoch": 2590} {"train_loss": -42.250301361083984, "global_step": 313488, "epoch": 2590} {"train_loss": -41.02326965332031, "global_step": 313489, "epoch": 2590} {"train_loss": -42.693931579589844, "global_step": 313490, "epoch": 2590} {"train_loss": -42.30797576904297, "global_step": 313491, "epoch": 2590} {"train_loss": -41.86698532104492, "global_step": 313492, "epoch": 2590} {"train_loss": -43.37160873413086, "global_step": 313493, "epoch": 2590} {"train_loss": -41.02842330932617, "global_step": 313494, "epoch": 2590} {"train_loss": -41.7989616394043, "global_step": 313495, "epoch": 2590} {"train_loss": -42.257545471191406, "global_step": 313496, "epoch": 2590} {"train_loss": -39.195167541503906, "global_step": 313497, "epoch": 2590} {"train_loss": -41.645843505859375, "global_step": 313498, "epoch": 2590} {"train_loss": -42.440818786621094, "global_step": 313499, "epoch": 2590} {"train_loss": -39.840145111083984, "global_step": 313500, "epoch": 2590} {"train_loss": -42.85769271850586, "global_step": 313501, "epoch": 2590} {"train_loss": -40.40771484375, "global_step": 313502, "epoch": 2590} {"train_loss": -43.48580551147461, "global_step": 313503, "epoch": 2590} {"train_loss": -41.776893615722656, "global_step": 313504, "epoch": 2590} {"train_loss": -43.22665023803711, "global_step": 313505, "epoch": 2590} {"train_loss": -42.273983001708984, "global_step": 313506, "epoch": 2590} {"train_loss": -43.1777229309082, "global_step": 313507, "epoch": 2590} {"train_loss": -42.681270599365234, "global_step": 313508, "epoch": 2590} {"train_loss": -42.697410583496094, "global_step": 313509, "epoch": 2590} {"train_loss": -42.48060191761363, "global_step": 313510, "epoch": 2590, "val_loss": 2772955.0} {"train_loss": -43.07273864746094, "global_step": 313511, "epoch": 2591} {"train_loss": -42.8143196105957, "global_step": 313512, "epoch": 2591} {"train_loss": -43.60732650756836, "global_step": 313513, "epoch": 2591} {"train_loss": -42.45147705078125, "global_step": 313514, "epoch": 2591} {"train_loss": -43.82856369018555, "global_step": 313515, "epoch": 2591} {"train_loss": -43.694854736328125, "global_step": 313516, "epoch": 2591} {"train_loss": -39.03651428222656, "global_step": 313517, "epoch": 2591} {"train_loss": -43.95341873168945, "global_step": 313518, "epoch": 2591} {"train_loss": -43.54547882080078, "global_step": 313519, "epoch": 2591} {"train_loss": -43.513729095458984, "global_step": 313520, "epoch": 2591} {"train_loss": -44.09296798706055, "global_step": 313521, "epoch": 2591} {"train_loss": -43.79548263549805, "global_step": 313522, "epoch": 2591} {"train_loss": -43.82585525512695, "global_step": 313523, "epoch": 2591} {"train_loss": -43.55937576293945, "global_step": 313524, "epoch": 2591} {"train_loss": -43.64295196533203, "global_step": 313525, "epoch": 2591} {"train_loss": -44.053951263427734, "global_step": 313526, "epoch": 2591} {"train_loss": -43.6679801940918, "global_step": 313527, "epoch": 2591} {"train_loss": -44.39854049682617, "global_step": 313528, "epoch": 2591} {"train_loss": -44.0771484375, "global_step": 313529, "epoch": 2591} {"train_loss": -43.78013229370117, "global_step": 313530, "epoch": 2591} {"train_loss": -43.729366302490234, "global_step": 313531, "epoch": 2591} {"train_loss": -43.825355529785156, "global_step": 313532, "epoch": 2591} {"train_loss": -44.30013656616211, "global_step": 313533, "epoch": 2591} {"train_loss": -41.36116409301758, "global_step": 313534, "epoch": 2591} {"train_loss": -43.868648529052734, "global_step": 313535, "epoch": 2591} {"train_loss": -44.04300308227539, "global_step": 313536, "epoch": 2591} {"train_loss": -43.13984298706055, "global_step": 313537, "epoch": 2591} {"train_loss": -43.4820556640625, "global_step": 313538, "epoch": 2591} {"train_loss": -43.95676803588867, "global_step": 313539, "epoch": 2591} {"train_loss": -40.76948165893555, "global_step": 313540, "epoch": 2591} {"train_loss": -43.29353713989258, "global_step": 313541, "epoch": 2591} {"train_loss": -42.94484329223633, "global_step": 313542, "epoch": 2591} {"train_loss": -44.36300277709961, "global_step": 313543, "epoch": 2591} {"train_loss": -43.42311096191406, "global_step": 313544, "epoch": 2591} {"train_loss": -43.991085052490234, "global_step": 313545, "epoch": 2591} {"train_loss": -43.93821334838867, "global_step": 313546, "epoch": 2591} {"train_loss": -43.71073532104492, "global_step": 313547, "epoch": 2591} {"train_loss": -43.52045822143555, "global_step": 313548, "epoch": 2591} {"train_loss": -42.568939208984375, "global_step": 313549, "epoch": 2591} {"train_loss": -43.92180633544922, "global_step": 313550, "epoch": 2591} {"train_loss": -43.58186721801758, "global_step": 313551, "epoch": 2591} {"train_loss": -43.906185150146484, "global_step": 313552, "epoch": 2591} {"train_loss": -42.59143829345703, "global_step": 313553, "epoch": 2591} {"train_loss": -44.41075134277344, "global_step": 313554, "epoch": 2591} {"train_loss": -44.12968063354492, "global_step": 313555, "epoch": 2591} {"train_loss": -44.131446838378906, "global_step": 313556, "epoch": 2591} {"train_loss": -43.65747833251953, "global_step": 313557, "epoch": 2591} {"train_loss": -44.291107177734375, "global_step": 313558, "epoch": 2591} {"train_loss": -43.81596755981445, "global_step": 313559, "epoch": 2591} {"train_loss": -44.05343246459961, "global_step": 313560, "epoch": 2591} {"train_loss": -44.44390106201172, "global_step": 313561, "epoch": 2591} {"train_loss": -44.1892204284668, "global_step": 313562, "epoch": 2591} {"train_loss": -44.27791976928711, "global_step": 313563, "epoch": 2591} {"train_loss": -44.50004959106445, "global_step": 313564, "epoch": 2591} {"train_loss": -43.747379302978516, "global_step": 313565, "epoch": 2591} {"train_loss": -44.61077880859375, "global_step": 313566, "epoch": 2591} {"train_loss": -43.67306137084961, "global_step": 313567, "epoch": 2591} {"train_loss": -44.597198486328125, "global_step": 313568, "epoch": 2591} {"train_loss": -44.48891830444336, "global_step": 313569, "epoch": 2591} {"train_loss": -43.42788314819336, "global_step": 313570, "epoch": 2591} {"train_loss": -43.92015075683594, "global_step": 313571, "epoch": 2591} {"train_loss": -44.12434768676758, "global_step": 313572, "epoch": 2591} {"train_loss": -44.46337890625, "global_step": 313573, "epoch": 2591} {"train_loss": -43.98148727416992, "global_step": 313574, "epoch": 2591} {"train_loss": -44.21613693237305, "global_step": 313575, "epoch": 2591} {"train_loss": -44.28430938720703, "global_step": 313576, "epoch": 2591} {"train_loss": -43.60683822631836, "global_step": 313577, "epoch": 2591} {"train_loss": -43.47234344482422, "global_step": 313578, "epoch": 2591} {"train_loss": -44.1818962097168, "global_step": 313579, "epoch": 2591} {"train_loss": -43.86833572387695, "global_step": 313580, "epoch": 2591} {"train_loss": -43.86073684692383, "global_step": 313581, "epoch": 2591} {"train_loss": -43.4058723449707, "global_step": 313582, "epoch": 2591} {"train_loss": -42.058135986328125, "global_step": 313583, "epoch": 2591} {"train_loss": -43.77610778808594, "global_step": 313584, "epoch": 2591} {"train_loss": -44.2381477355957, "global_step": 313585, "epoch": 2591} {"train_loss": -44.12528610229492, "global_step": 313586, "epoch": 2591} {"train_loss": -43.27732467651367, "global_step": 313587, "epoch": 2591} {"train_loss": -43.539337158203125, "global_step": 313588, "epoch": 2591} {"train_loss": -43.92115020751953, "global_step": 313589, "epoch": 2591} {"train_loss": -42.53440856933594, "global_step": 313590, "epoch": 2591} {"train_loss": -43.737701416015625, "global_step": 313591, "epoch": 2591} {"train_loss": -44.33712387084961, "global_step": 313592, "epoch": 2591} {"train_loss": -43.24110794067383, "global_step": 313593, "epoch": 2591} {"train_loss": -44.34482192993164, "global_step": 313594, "epoch": 2591} {"train_loss": -43.73198318481445, "global_step": 313595, "epoch": 2591} {"train_loss": -43.10222244262695, "global_step": 313596, "epoch": 2591} {"train_loss": -43.597312927246094, "global_step": 313597, "epoch": 2591} {"train_loss": -43.8112907409668, "global_step": 313598, "epoch": 2591} {"train_loss": -41.16746139526367, "global_step": 313599, "epoch": 2591} {"train_loss": -37.835723876953125, "global_step": 313600, "epoch": 2591} {"train_loss": -37.47578048706055, "global_step": 313601, "epoch": 2591} {"train_loss": -40.77885818481445, "global_step": 313602, "epoch": 2591} {"train_loss": -43.39338302612305, "global_step": 313603, "epoch": 2591} {"train_loss": -43.12527847290039, "global_step": 313604, "epoch": 2591} {"train_loss": -42.232486724853516, "global_step": 313605, "epoch": 2591} {"train_loss": -43.17171096801758, "global_step": 313606, "epoch": 2591} {"train_loss": -43.07866287231445, "global_step": 313607, "epoch": 2591} {"train_loss": -43.41006088256836, "global_step": 313608, "epoch": 2591} {"train_loss": -43.39687728881836, "global_step": 313609, "epoch": 2591} {"train_loss": -42.7822151184082, "global_step": 313610, "epoch": 2591} {"train_loss": -43.326629638671875, "global_step": 313611, "epoch": 2591} {"train_loss": -43.122398376464844, "global_step": 313612, "epoch": 2591} {"train_loss": -43.01470184326172, "global_step": 313613, "epoch": 2591} {"train_loss": -43.8753547668457, "global_step": 313614, "epoch": 2591} {"train_loss": -43.35363006591797, "global_step": 313615, "epoch": 2591} {"train_loss": -43.090614318847656, "global_step": 313616, "epoch": 2591} {"train_loss": -43.64384078979492, "global_step": 313617, "epoch": 2591} {"train_loss": -42.65546798706055, "global_step": 313618, "epoch": 2591} {"train_loss": -43.7775993347168, "global_step": 313619, "epoch": 2591} {"train_loss": -43.35523986816406, "global_step": 313620, "epoch": 2591} {"train_loss": -43.74772262573242, "global_step": 313621, "epoch": 2591} {"train_loss": -43.592620849609375, "global_step": 313622, "epoch": 2591} {"train_loss": -43.65913772583008, "global_step": 313623, "epoch": 2591} {"train_loss": -43.44818115234375, "global_step": 313624, "epoch": 2591} {"train_loss": -43.459468841552734, "global_step": 313625, "epoch": 2591} {"train_loss": -43.78681564331055, "global_step": 313626, "epoch": 2591} {"train_loss": -43.559303283691406, "global_step": 313627, "epoch": 2591} {"train_loss": -43.869869232177734, "global_step": 313628, "epoch": 2591} {"train_loss": -44.322444915771484, "global_step": 313629, "epoch": 2591} {"train_loss": -43.509639739990234, "global_step": 313630, "epoch": 2591} {"train_loss": -43.448830060722415, "global_step": 313631, "epoch": 2591, "val_loss": 2730648.0} {"train_loss": -43.6846809387207, "global_step": 313632, "epoch": 2592} {"train_loss": -43.02190399169922, "global_step": 313633, "epoch": 2592} {"train_loss": -42.731895446777344, "global_step": 313634, "epoch": 2592} {"train_loss": -43.05378723144531, "global_step": 313635, "epoch": 2592} {"train_loss": -42.515804290771484, "global_step": 313636, "epoch": 2592} {"train_loss": -44.08523178100586, "global_step": 313637, "epoch": 2592} {"train_loss": -43.2912483215332, "global_step": 313638, "epoch": 2592} {"train_loss": -42.2890625, "global_step": 313639, "epoch": 2592} {"train_loss": -43.930564880371094, "global_step": 313640, "epoch": 2592} {"train_loss": -43.95636749267578, "global_step": 313641, "epoch": 2592} {"train_loss": -43.748695373535156, "global_step": 313642, "epoch": 2592} {"train_loss": -44.20109939575195, "global_step": 313643, "epoch": 2592} {"train_loss": -44.69499969482422, "global_step": 313644, "epoch": 2592} {"train_loss": -42.92954635620117, "global_step": 313645, "epoch": 2592} {"train_loss": -44.42105484008789, "global_step": 313646, "epoch": 2592} {"train_loss": -43.923500061035156, "global_step": 313647, "epoch": 2592} {"train_loss": -42.83817672729492, "global_step": 313648, "epoch": 2592} {"train_loss": -44.59975051879883, "global_step": 313649, "epoch": 2592} {"train_loss": -44.89419174194336, "global_step": 313650, "epoch": 2592} {"train_loss": -44.408729553222656, "global_step": 313651, "epoch": 2592} {"train_loss": -44.45497512817383, "global_step": 313652, "epoch": 2592} {"train_loss": -44.690792083740234, "global_step": 313653, "epoch": 2592} {"train_loss": -43.04658126831055, "global_step": 313654, "epoch": 2592} {"train_loss": -44.4473876953125, "global_step": 313655, "epoch": 2592} {"train_loss": -44.437828063964844, "global_step": 313656, "epoch": 2592} {"train_loss": -44.08466339111328, "global_step": 313657, "epoch": 2592} {"train_loss": -42.00791931152344, "global_step": 313658, "epoch": 2592} {"train_loss": -44.076446533203125, "global_step": 313659, "epoch": 2592} {"train_loss": -43.14902877807617, "global_step": 313660, "epoch": 2592} {"train_loss": -44.07502365112305, "global_step": 313661, "epoch": 2592} {"train_loss": -43.95089340209961, "global_step": 313662, "epoch": 2592} {"train_loss": -43.344749450683594, "global_step": 313663, "epoch": 2592} {"train_loss": -42.99336242675781, "global_step": 313664, "epoch": 2592} {"train_loss": -43.34804916381836, "global_step": 313665, "epoch": 2592} {"train_loss": -43.108726501464844, "global_step": 313666, "epoch": 2592} {"train_loss": -43.84600830078125, "global_step": 313667, "epoch": 2592} {"train_loss": -44.34419631958008, "global_step": 313668, "epoch": 2592} {"train_loss": -43.65388107299805, "global_step": 313669, "epoch": 2592} {"train_loss": -44.355674743652344, "global_step": 313670, "epoch": 2592} {"train_loss": -44.32746124267578, "global_step": 313671, "epoch": 2592} {"train_loss": -44.29274368286133, "global_step": 313672, "epoch": 2592} {"train_loss": -43.96014404296875, "global_step": 313673, "epoch": 2592} {"train_loss": -43.99163818359375, "global_step": 313674, "epoch": 2592} {"train_loss": -44.3077507019043, "global_step": 313675, "epoch": 2592} {"train_loss": -44.303955078125, "global_step": 313676, "epoch": 2592} {"train_loss": -44.473533630371094, "global_step": 313677, "epoch": 2592} {"train_loss": -44.12477493286133, "global_step": 313678, "epoch": 2592} {"train_loss": -41.542110443115234, "global_step": 313679, "epoch": 2592} {"train_loss": -43.538543701171875, "global_step": 313680, "epoch": 2592} {"train_loss": -43.908870697021484, "global_step": 313681, "epoch": 2592} {"train_loss": -43.682064056396484, "global_step": 313682, "epoch": 2592} {"train_loss": -43.52052688598633, "global_step": 313683, "epoch": 2592} {"train_loss": -44.51827621459961, "global_step": 313684, "epoch": 2592} {"train_loss": -43.81955337524414, "global_step": 313685, "epoch": 2592} {"train_loss": -44.14613723754883, "global_step": 313686, "epoch": 2592} {"train_loss": -42.167449951171875, "global_step": 313687, "epoch": 2592} {"train_loss": -44.383541107177734, "global_step": 313688, "epoch": 2592} {"train_loss": -42.790565490722656, "global_step": 313689, "epoch": 2592} {"train_loss": -42.59788513183594, "global_step": 313690, "epoch": 2592} {"train_loss": -41.145362854003906, "global_step": 313691, "epoch": 2592} {"train_loss": -44.05131149291992, "global_step": 313692, "epoch": 2592} {"train_loss": -43.424232482910156, "global_step": 313693, "epoch": 2592} {"train_loss": -44.038631439208984, "global_step": 313694, "epoch": 2592} {"train_loss": -42.91371536254883, "global_step": 313695, "epoch": 2592} {"train_loss": -43.199790954589844, "global_step": 313696, "epoch": 2592} {"train_loss": -43.85490036010742, "global_step": 313697, "epoch": 2592} {"train_loss": -43.16856002807617, "global_step": 313698, "epoch": 2592} {"train_loss": -43.04325485229492, "global_step": 313699, "epoch": 2592} {"train_loss": -42.761322021484375, "global_step": 313700, "epoch": 2592} {"train_loss": -43.00669479370117, "global_step": 313701, "epoch": 2592} {"train_loss": -43.899505615234375, "global_step": 313702, "epoch": 2592} {"train_loss": -43.46049499511719, "global_step": 313703, "epoch": 2592} {"train_loss": -42.52585983276367, "global_step": 313704, "epoch": 2592} {"train_loss": -42.62909698486328, "global_step": 313705, "epoch": 2592} {"train_loss": -41.734493255615234, "global_step": 313706, "epoch": 2592} {"train_loss": -42.44173049926758, "global_step": 313707, "epoch": 2592} {"train_loss": -41.55324935913086, "global_step": 313708, "epoch": 2592} {"train_loss": -42.794185638427734, "global_step": 313709, "epoch": 2592} {"train_loss": -42.1141242980957, "global_step": 313710, "epoch": 2592} {"train_loss": -42.96144485473633, "global_step": 313711, "epoch": 2592} {"train_loss": -43.3636360168457, "global_step": 313712, "epoch": 2592} {"train_loss": -43.11088943481445, "global_step": 313713, "epoch": 2592} {"train_loss": -42.90753936767578, "global_step": 313714, "epoch": 2592} {"train_loss": -43.70937728881836, "global_step": 313715, "epoch": 2592} {"train_loss": -43.63779067993164, "global_step": 313716, "epoch": 2592} {"train_loss": -44.098751068115234, "global_step": 313717, "epoch": 2592} {"train_loss": -44.30375671386719, "global_step": 313718, "epoch": 2592} {"train_loss": -44.05418395996094, "global_step": 313719, "epoch": 2592} {"train_loss": -44.34067916870117, "global_step": 313720, "epoch": 2592} {"train_loss": -43.4743766784668, "global_step": 313721, "epoch": 2592} {"train_loss": -43.15413284301758, "global_step": 313722, "epoch": 2592} {"train_loss": -42.37863540649414, "global_step": 313723, "epoch": 2592} {"train_loss": -43.86845016479492, "global_step": 313724, "epoch": 2592} {"train_loss": -44.33485794067383, "global_step": 313725, "epoch": 2592} {"train_loss": -43.1038932800293, "global_step": 313726, "epoch": 2592} {"train_loss": -43.3184928894043, "global_step": 313727, "epoch": 2592} {"train_loss": -43.750038146972656, "global_step": 313728, "epoch": 2592} {"train_loss": -44.01538848876953, "global_step": 313729, "epoch": 2592} {"train_loss": -44.3902473449707, "global_step": 313730, "epoch": 2592} {"train_loss": -43.118141174316406, "global_step": 313731, "epoch": 2592} {"train_loss": -43.86162185668945, "global_step": 313732, "epoch": 2592} {"train_loss": -43.84050369262695, "global_step": 313733, "epoch": 2592} {"train_loss": -43.51754379272461, "global_step": 313734, "epoch": 2592} {"train_loss": -43.66731643676758, "global_step": 313735, "epoch": 2592} {"train_loss": -44.13631057739258, "global_step": 313736, "epoch": 2592} {"train_loss": -41.128726959228516, "global_step": 313737, "epoch": 2592} {"train_loss": -43.790077209472656, "global_step": 313738, "epoch": 2592} {"train_loss": -44.12109375, "global_step": 313739, "epoch": 2592} {"train_loss": -42.91870880126953, "global_step": 313740, "epoch": 2592} {"train_loss": -44.160797119140625, "global_step": 313741, "epoch": 2592} {"train_loss": -42.733211517333984, "global_step": 313742, "epoch": 2592} {"train_loss": -42.97182846069336, "global_step": 313743, "epoch": 2592} {"train_loss": -43.826751708984375, "global_step": 313744, "epoch": 2592} {"train_loss": -41.59792709350586, "global_step": 313745, "epoch": 2592} {"train_loss": -42.63542556762695, "global_step": 313746, "epoch": 2592} {"train_loss": -44.3984375, "global_step": 313747, "epoch": 2592} {"train_loss": -41.311195373535156, "global_step": 313748, "epoch": 2592} {"train_loss": -43.67879867553711, "global_step": 313749, "epoch": 2592} {"train_loss": -30.0173282623291, "global_step": 313750, "epoch": 2592} {"train_loss": -39.13352966308594, "global_step": 313751, "epoch": 2592} {"train_loss": -43.31774251323101, "global_step": 313752, "epoch": 2592, "val_loss": 2844304.0} {"train_loss": -40.37805938720703, "global_step": 313753, "epoch": 2593} {"train_loss": -42.730281829833984, "global_step": 313754, "epoch": 2593} {"train_loss": -41.405921936035156, "global_step": 313755, "epoch": 2593} {"train_loss": -40.982784271240234, "global_step": 313756, "epoch": 2593} {"train_loss": -40.59980392456055, "global_step": 313757, "epoch": 2593} {"train_loss": -32.11240768432617, "global_step": 313758, "epoch": 2593} {"train_loss": -40.689754486083984, "global_step": 313759, "epoch": 2593} {"train_loss": -40.746429443359375, "global_step": 313760, "epoch": 2593} {"train_loss": -33.569580078125, "global_step": 313761, "epoch": 2593} {"train_loss": -40.78025436401367, "global_step": 313762, "epoch": 2593} {"train_loss": -27.46311378479004, "global_step": 313763, "epoch": 2593} {"train_loss": -28.605112075805664, "global_step": 313764, "epoch": 2593} {"train_loss": -38.55267333984375, "global_step": 313765, "epoch": 2593} {"train_loss": -20.422033309936523, "global_step": 313766, "epoch": 2593} {"train_loss": -37.92820358276367, "global_step": 313767, "epoch": 2593} {"train_loss": -39.90127944946289, "global_step": 313768, "epoch": 2593} {"train_loss": -39.47197341918945, "global_step": 313769, "epoch": 2593} {"train_loss": -39.45395278930664, "global_step": 313770, "epoch": 2593} {"train_loss": -38.23968505859375, "global_step": 313771, "epoch": 2593} {"train_loss": -35.327735900878906, "global_step": 313772, "epoch": 2593} {"train_loss": -38.07816696166992, "global_step": 313773, "epoch": 2593} {"train_loss": -29.96225357055664, "global_step": 313774, "epoch": 2593} {"train_loss": -38.42838668823242, "global_step": 313775, "epoch": 2593} {"train_loss": -36.38873291015625, "global_step": 313776, "epoch": 2593} {"train_loss": -36.874916076660156, "global_step": 313777, "epoch": 2593} {"train_loss": -35.787845611572266, "global_step": 313778, "epoch": 2593} {"train_loss": -36.383697509765625, "global_step": 313779, "epoch": 2593} {"train_loss": -33.79019546508789, "global_step": 313780, "epoch": 2593} {"train_loss": -37.7297477722168, "global_step": 313781, "epoch": 2593} {"train_loss": -36.574562072753906, "global_step": 313782, "epoch": 2593} {"train_loss": -40.67765426635742, "global_step": 313783, "epoch": 2593} {"train_loss": -39.043453216552734, "global_step": 313784, "epoch": 2593} {"train_loss": -38.588539123535156, "global_step": 313785, "epoch": 2593} {"train_loss": -38.99586486816406, "global_step": 313786, "epoch": 2593} {"train_loss": -40.41644287109375, "global_step": 313787, "epoch": 2593} {"train_loss": -39.0487060546875, "global_step": 313788, "epoch": 2593} {"train_loss": -41.11481857299805, "global_step": 313789, "epoch": 2593} {"train_loss": -40.44390106201172, "global_step": 313790, "epoch": 2593} {"train_loss": -39.56131362915039, "global_step": 313791, "epoch": 2593} {"train_loss": -40.517364501953125, "global_step": 313792, "epoch": 2593} {"train_loss": -39.337581634521484, "global_step": 313793, "epoch": 2593} {"train_loss": -36.454261779785156, "global_step": 313794, "epoch": 2593} {"train_loss": -41.59510040283203, "global_step": 313795, "epoch": 2593} {"train_loss": -40.502960205078125, "global_step": 313796, "epoch": 2593} {"train_loss": -40.979278564453125, "global_step": 313797, "epoch": 2593} {"train_loss": -39.24245071411133, "global_step": 313798, "epoch": 2593} {"train_loss": -41.300445556640625, "global_step": 313799, "epoch": 2593} {"train_loss": -37.67269515991211, "global_step": 313800, "epoch": 2593} {"train_loss": -40.63684844970703, "global_step": 313801, "epoch": 2593} {"train_loss": -41.011497497558594, "global_step": 313802, "epoch": 2593} {"train_loss": -41.503997802734375, "global_step": 313803, "epoch": 2593} {"train_loss": -38.21244812011719, "global_step": 313804, "epoch": 2593} {"train_loss": -41.081390380859375, "global_step": 313805, "epoch": 2593} {"train_loss": -41.257232666015625, "global_step": 313806, "epoch": 2593} {"train_loss": -41.0432243347168, "global_step": 313807, "epoch": 2593} {"train_loss": -40.17070388793945, "global_step": 313808, "epoch": 2593} {"train_loss": -41.43465805053711, "global_step": 313809, "epoch": 2593} {"train_loss": -40.96101760864258, "global_step": 313810, "epoch": 2593} {"train_loss": -40.329856872558594, "global_step": 313811, "epoch": 2593} {"train_loss": -41.41965866088867, "global_step": 313812, "epoch": 2593} {"train_loss": -41.60760498046875, "global_step": 313813, "epoch": 2593} {"train_loss": -41.38163757324219, "global_step": 313814, "epoch": 2593} {"train_loss": -42.10850143432617, "global_step": 313815, "epoch": 2593} {"train_loss": -42.21609878540039, "global_step": 313816, "epoch": 2593} {"train_loss": -41.49886703491211, "global_step": 313817, "epoch": 2593} {"train_loss": -42.288612365722656, "global_step": 313818, "epoch": 2593} {"train_loss": -42.26259994506836, "global_step": 313819, "epoch": 2593} {"train_loss": -42.15198516845703, "global_step": 313820, "epoch": 2593} {"train_loss": -42.03580856323242, "global_step": 313821, "epoch": 2593} {"train_loss": -40.846126556396484, "global_step": 313822, "epoch": 2593} {"train_loss": -42.194190979003906, "global_step": 313823, "epoch": 2593} {"train_loss": -40.91542434692383, "global_step": 313824, "epoch": 2593} {"train_loss": -42.46175003051758, "global_step": 313825, "epoch": 2593} {"train_loss": -42.42014694213867, "global_step": 313826, "epoch": 2593} {"train_loss": -41.58268356323242, "global_step": 313827, "epoch": 2593} {"train_loss": -42.53706741333008, "global_step": 313828, "epoch": 2593} {"train_loss": -41.43452072143555, "global_step": 313829, "epoch": 2593} {"train_loss": -41.794193267822266, "global_step": 313830, "epoch": 2593} {"train_loss": -42.313995361328125, "global_step": 313831, "epoch": 2593} {"train_loss": -42.06301498413086, "global_step": 313832, "epoch": 2593} {"train_loss": -41.42974853515625, "global_step": 313833, "epoch": 2593} {"train_loss": -42.80695724487305, "global_step": 313834, "epoch": 2593} {"train_loss": -41.97738265991211, "global_step": 313835, "epoch": 2593} {"train_loss": -42.426212310791016, "global_step": 313836, "epoch": 2593} {"train_loss": -42.6749267578125, "global_step": 313837, "epoch": 2593} {"train_loss": -42.66319274902344, "global_step": 313838, "epoch": 2593} {"train_loss": -42.025856018066406, "global_step": 313839, "epoch": 2593} {"train_loss": -42.79767990112305, "global_step": 313840, "epoch": 2593} {"train_loss": -41.579505920410156, "global_step": 313841, "epoch": 2593} {"train_loss": -42.925228118896484, "global_step": 313842, "epoch": 2593} {"train_loss": -42.81878662109375, "global_step": 313843, "epoch": 2593} {"train_loss": -43.22571563720703, "global_step": 313844, "epoch": 2593} {"train_loss": -43.18169403076172, "global_step": 313845, "epoch": 2593} {"train_loss": -43.3372688293457, "global_step": 313846, "epoch": 2593} {"train_loss": -42.80471420288086, "global_step": 313847, "epoch": 2593} {"train_loss": -42.74850082397461, "global_step": 313848, "epoch": 2593} {"train_loss": -43.481483459472656, "global_step": 313849, "epoch": 2593} {"train_loss": -42.99485778808594, "global_step": 313850, "epoch": 2593} {"train_loss": -43.09841537475586, "global_step": 313851, "epoch": 2593} {"train_loss": -42.72025680541992, "global_step": 313852, "epoch": 2593} {"train_loss": -43.500423431396484, "global_step": 313853, "epoch": 2593} {"train_loss": -43.17045974731445, "global_step": 313854, "epoch": 2593} {"train_loss": -40.39113998413086, "global_step": 313855, "epoch": 2593} {"train_loss": -43.527400970458984, "global_step": 313856, "epoch": 2593} {"train_loss": -42.93574905395508, "global_step": 313857, "epoch": 2593} {"train_loss": -43.61947250366211, "global_step": 313858, "epoch": 2593} {"train_loss": -43.063682556152344, "global_step": 313859, "epoch": 2593} {"train_loss": -43.65583038330078, "global_step": 313860, "epoch": 2593} {"train_loss": -43.46162033081055, "global_step": 313861, "epoch": 2593} {"train_loss": -43.574398040771484, "global_step": 313862, "epoch": 2593} {"train_loss": -43.47248458862305, "global_step": 313863, "epoch": 2593} {"train_loss": -43.229610443115234, "global_step": 313864, "epoch": 2593} {"train_loss": -43.64435577392578, "global_step": 313865, "epoch": 2593} {"train_loss": -43.281246185302734, "global_step": 313866, "epoch": 2593} {"train_loss": -43.34803009033203, "global_step": 313867, "epoch": 2593} {"train_loss": -43.6540641784668, "global_step": 313868, "epoch": 2593} {"train_loss": -43.28017807006836, "global_step": 313869, "epoch": 2593} {"train_loss": -43.598388671875, "global_step": 313870, "epoch": 2593} {"train_loss": -43.20427703857422, "global_step": 313871, "epoch": 2593} {"train_loss": -43.1988410949707, "global_step": 313872, "epoch": 2593} {"train_loss": -40.51520476853552, "global_step": 313873, "epoch": 2593, "val_loss": 2717503.75} {"train_loss": -43.27257537841797, "global_step": 313874, "epoch": 2594} {"train_loss": -44.13965606689453, "global_step": 313875, "epoch": 2594} {"train_loss": -43.62873458862305, "global_step": 313876, "epoch": 2594} {"train_loss": -44.05905532836914, "global_step": 313877, "epoch": 2594} {"train_loss": -43.63466262817383, "global_step": 313878, "epoch": 2594} {"train_loss": -44.01679992675781, "global_step": 313879, "epoch": 2594} {"train_loss": -43.26754379272461, "global_step": 313880, "epoch": 2594} {"train_loss": -43.66071319580078, "global_step": 313881, "epoch": 2594} {"train_loss": -43.86052322387695, "global_step": 313882, "epoch": 2594} {"train_loss": -43.49769973754883, "global_step": 313883, "epoch": 2594} {"train_loss": -43.830787658691406, "global_step": 313884, "epoch": 2594} {"train_loss": -43.97333526611328, "global_step": 313885, "epoch": 2594} {"train_loss": -43.390594482421875, "global_step": 313886, "epoch": 2594} {"train_loss": -43.66327667236328, "global_step": 313887, "epoch": 2594} {"train_loss": -44.1705207824707, "global_step": 313888, "epoch": 2594} {"train_loss": -43.663063049316406, "global_step": 313889, "epoch": 2594} {"train_loss": -44.204444885253906, "global_step": 313890, "epoch": 2594} {"train_loss": -43.61899948120117, "global_step": 313891, "epoch": 2594} {"train_loss": -43.97267532348633, "global_step": 313892, "epoch": 2594} {"train_loss": -43.29911804199219, "global_step": 313893, "epoch": 2594} {"train_loss": -43.85954666137695, "global_step": 313894, "epoch": 2594} {"train_loss": -43.67739486694336, "global_step": 313895, "epoch": 2594} {"train_loss": -43.44371795654297, "global_step": 313896, "epoch": 2594} {"train_loss": -43.86378479003906, "global_step": 313897, "epoch": 2594} {"train_loss": -43.867733001708984, "global_step": 313898, "epoch": 2594} {"train_loss": -44.45595932006836, "global_step": 313899, "epoch": 2594} {"train_loss": -44.26225662231445, "global_step": 313900, "epoch": 2594} {"train_loss": -43.88581085205078, "global_step": 313901, "epoch": 2594} {"train_loss": -42.18538284301758, "global_step": 313902, "epoch": 2594} {"train_loss": -43.99135971069336, "global_step": 313903, "epoch": 2594} {"train_loss": -44.06299591064453, "global_step": 313904, "epoch": 2594} {"train_loss": -43.827003479003906, "global_step": 313905, "epoch": 2594} {"train_loss": -43.399078369140625, "global_step": 313906, "epoch": 2594} {"train_loss": -44.37260055541992, "global_step": 313907, "epoch": 2594} {"train_loss": -43.70804977416992, "global_step": 313908, "epoch": 2594} {"train_loss": -43.66836166381836, "global_step": 313909, "epoch": 2594} {"train_loss": -43.31460189819336, "global_step": 313910, "epoch": 2594} {"train_loss": -43.768306732177734, "global_step": 313911, "epoch": 2594} {"train_loss": -43.60121536254883, "global_step": 313912, "epoch": 2594} {"train_loss": -42.7779426574707, "global_step": 313913, "epoch": 2594} {"train_loss": -42.585384368896484, "global_step": 313914, "epoch": 2594} {"train_loss": -41.62775421142578, "global_step": 313915, "epoch": 2594} {"train_loss": -42.87682342529297, "global_step": 313916, "epoch": 2594} {"train_loss": -42.754432678222656, "global_step": 313917, "epoch": 2594} {"train_loss": -42.183937072753906, "global_step": 313918, "epoch": 2594} {"train_loss": -43.286712646484375, "global_step": 313919, "epoch": 2594} {"train_loss": -42.7576789855957, "global_step": 313920, "epoch": 2594} {"train_loss": -43.73679733276367, "global_step": 313921, "epoch": 2594} {"train_loss": -42.42869186401367, "global_step": 313922, "epoch": 2594} {"train_loss": -41.458534240722656, "global_step": 313923, "epoch": 2594} {"train_loss": -42.703548431396484, "global_step": 313924, "epoch": 2594} {"train_loss": -41.98822021484375, "global_step": 313925, "epoch": 2594} {"train_loss": -42.75639724731445, "global_step": 313926, "epoch": 2594} {"train_loss": -42.27299880981445, "global_step": 313927, "epoch": 2594} {"train_loss": -42.85614776611328, "global_step": 313928, "epoch": 2594} {"train_loss": -42.007102966308594, "global_step": 313929, "epoch": 2594} {"train_loss": -39.86524200439453, "global_step": 313930, "epoch": 2594} {"train_loss": -40.815887451171875, "global_step": 313931, "epoch": 2594} {"train_loss": -42.65520095825195, "global_step": 313932, "epoch": 2594} {"train_loss": -38.381839752197266, "global_step": 313933, "epoch": 2594} {"train_loss": -34.888736724853516, "global_step": 313934, "epoch": 2594} {"train_loss": -37.54584503173828, "global_step": 313935, "epoch": 2594} {"train_loss": -40.09292221069336, "global_step": 313936, "epoch": 2594} {"train_loss": -41.344398498535156, "global_step": 313937, "epoch": 2594} {"train_loss": -40.72038650512695, "global_step": 313938, "epoch": 2594} {"train_loss": -39.16396713256836, "global_step": 313939, "epoch": 2594} {"train_loss": -40.20838165283203, "global_step": 313940, "epoch": 2594} {"train_loss": -40.19643783569336, "global_step": 313941, "epoch": 2594} {"train_loss": -41.90119552612305, "global_step": 313942, "epoch": 2594} {"train_loss": -41.37052536010742, "global_step": 313943, "epoch": 2594} {"train_loss": -42.19292068481445, "global_step": 313944, "epoch": 2594} {"train_loss": -41.34312438964844, "global_step": 313945, "epoch": 2594} {"train_loss": -42.32434844970703, "global_step": 313946, "epoch": 2594} {"train_loss": -41.57405471801758, "global_step": 313947, "epoch": 2594} {"train_loss": -41.58989334106445, "global_step": 313948, "epoch": 2594} {"train_loss": -42.04948806762695, "global_step": 313949, "epoch": 2594} {"train_loss": -41.2735710144043, "global_step": 313950, "epoch": 2594} {"train_loss": -41.25649642944336, "global_step": 313951, "epoch": 2594} {"train_loss": -41.71044158935547, "global_step": 313952, "epoch": 2594} {"train_loss": -42.225032806396484, "global_step": 313953, "epoch": 2594} {"train_loss": -42.05292892456055, "global_step": 313954, "epoch": 2594} {"train_loss": -41.13359832763672, "global_step": 313955, "epoch": 2594} {"train_loss": -42.83147048950195, "global_step": 313956, "epoch": 2594} {"train_loss": -42.227115631103516, "global_step": 313957, "epoch": 2594} {"train_loss": -42.41782760620117, "global_step": 313958, "epoch": 2594} {"train_loss": -43.12264633178711, "global_step": 313959, "epoch": 2594} {"train_loss": -41.47481918334961, "global_step": 313960, "epoch": 2594} {"train_loss": -43.00246810913086, "global_step": 313961, "epoch": 2594} {"train_loss": -42.10319137573242, "global_step": 313962, "epoch": 2594} {"train_loss": -42.55670166015625, "global_step": 313963, "epoch": 2594} {"train_loss": -42.5523567199707, "global_step": 313964, "epoch": 2594} {"train_loss": -43.391448974609375, "global_step": 313965, "epoch": 2594} {"train_loss": -42.0843620300293, "global_step": 313966, "epoch": 2594} {"train_loss": -43.20686340332031, "global_step": 313967, "epoch": 2594} {"train_loss": -42.79998779296875, "global_step": 313968, "epoch": 2594} {"train_loss": -42.72951126098633, "global_step": 313969, "epoch": 2594} {"train_loss": -42.509674072265625, "global_step": 313970, "epoch": 2594} {"train_loss": -43.114871978759766, "global_step": 313971, "epoch": 2594} {"train_loss": -42.7916259765625, "global_step": 313972, "epoch": 2594} {"train_loss": -42.779048919677734, "global_step": 313973, "epoch": 2594} {"train_loss": -43.09080505371094, "global_step": 313974, "epoch": 2594} {"train_loss": -42.17045211791992, "global_step": 313975, "epoch": 2594} {"train_loss": -43.64006423950195, "global_step": 313976, "epoch": 2594} {"train_loss": -41.95003128051758, "global_step": 313977, "epoch": 2594} {"train_loss": -42.1139030456543, "global_step": 313978, "epoch": 2594} {"train_loss": -43.2647590637207, "global_step": 313979, "epoch": 2594} {"train_loss": -42.39299392700195, "global_step": 313980, "epoch": 2594} {"train_loss": -43.119564056396484, "global_step": 313981, "epoch": 2594} {"train_loss": -43.4748649597168, "global_step": 313982, "epoch": 2594} {"train_loss": -42.147701263427734, "global_step": 313983, "epoch": 2594} {"train_loss": -43.9140625, "global_step": 313984, "epoch": 2594} {"train_loss": -42.933319091796875, "global_step": 313985, "epoch": 2594} {"train_loss": -42.700748443603516, "global_step": 313986, "epoch": 2594} {"train_loss": -43.558040618896484, "global_step": 313987, "epoch": 2594} {"train_loss": -41.99422836303711, "global_step": 313988, "epoch": 2594} {"train_loss": -43.26666259765625, "global_step": 313989, "epoch": 2594} {"train_loss": -43.5487174987793, "global_step": 313990, "epoch": 2594} {"train_loss": -42.433067321777344, "global_step": 313991, "epoch": 2594} {"train_loss": -42.771732330322266, "global_step": 313992, "epoch": 2594} {"train_loss": -43.21744918823242, "global_step": 313993, "epoch": 2594} {"train_loss": -42.6259902764943, "global_step": 313994, "epoch": 2594, "val_loss": 2769585.75} {"train_loss": -43.51780319213867, "global_step": 313995, "epoch": 2595} {"train_loss": -42.98521041870117, "global_step": 313996, "epoch": 2595} {"train_loss": -43.289894104003906, "global_step": 313997, "epoch": 2595} {"train_loss": -43.75752258300781, "global_step": 313998, "epoch": 2595} {"train_loss": -43.35113525390625, "global_step": 313999, "epoch": 2595} {"train_loss": -44.07448959350586, "global_step": 314000, "epoch": 2595} {"train_loss": -43.87691879272461, "global_step": 314001, "epoch": 2595} {"train_loss": -43.675331115722656, "global_step": 314002, "epoch": 2595} {"train_loss": -44.02153396606445, "global_step": 314003, "epoch": 2595} {"train_loss": -44.072750091552734, "global_step": 314004, "epoch": 2595} {"train_loss": -43.57343673706055, "global_step": 314005, "epoch": 2595} {"train_loss": -43.72366714477539, "global_step": 314006, "epoch": 2595} {"train_loss": -44.23260498046875, "global_step": 314007, "epoch": 2595} {"train_loss": -43.994686126708984, "global_step": 314008, "epoch": 2595} {"train_loss": -44.147220611572266, "global_step": 314009, "epoch": 2595} {"train_loss": -44.12800979614258, "global_step": 314010, "epoch": 2595} {"train_loss": -43.93319320678711, "global_step": 314011, "epoch": 2595} {"train_loss": -44.28717803955078, "global_step": 314012, "epoch": 2595} {"train_loss": -44.03298568725586, "global_step": 314013, "epoch": 2595} {"train_loss": -44.367156982421875, "global_step": 314014, "epoch": 2595} {"train_loss": -43.993309020996094, "global_step": 314015, "epoch": 2595} {"train_loss": -43.96220016479492, "global_step": 314016, "epoch": 2595} {"train_loss": -44.494384765625, "global_step": 314017, "epoch": 2595} {"train_loss": -44.351016998291016, "global_step": 314018, "epoch": 2595} {"train_loss": -44.24091720581055, "global_step": 314019, "epoch": 2595} {"train_loss": -44.59514236450195, "global_step": 314020, "epoch": 2595} {"train_loss": -44.49989700317383, "global_step": 314021, "epoch": 2595} {"train_loss": -44.45808410644531, "global_step": 314022, "epoch": 2595} {"train_loss": -44.71772384643555, "global_step": 314023, "epoch": 2595} {"train_loss": -44.44613265991211, "global_step": 314024, "epoch": 2595} {"train_loss": -44.578697204589844, "global_step": 314025, "epoch": 2595} {"train_loss": -44.71049118041992, "global_step": 314026, "epoch": 2595} {"train_loss": -44.4245719909668, "global_step": 314027, "epoch": 2595} {"train_loss": -44.70762252807617, "global_step": 314028, "epoch": 2595} {"train_loss": -43.92413330078125, "global_step": 314029, "epoch": 2595} {"train_loss": -44.531288146972656, "global_step": 314030, "epoch": 2595} {"train_loss": -44.7196159362793, "global_step": 314031, "epoch": 2595} {"train_loss": -44.48417282104492, "global_step": 314032, "epoch": 2595} {"train_loss": -44.29935836791992, "global_step": 314033, "epoch": 2595} {"train_loss": -44.231903076171875, "global_step": 314034, "epoch": 2595} {"train_loss": -44.24887466430664, "global_step": 314035, "epoch": 2595} {"train_loss": -43.899288177490234, "global_step": 314036, "epoch": 2595} {"train_loss": -44.1598014831543, "global_step": 314037, "epoch": 2595} {"train_loss": -44.575435638427734, "global_step": 314038, "epoch": 2595} {"train_loss": -44.50533676147461, "global_step": 314039, "epoch": 2595} {"train_loss": -43.802181243896484, "global_step": 314040, "epoch": 2595} {"train_loss": -44.499813079833984, "global_step": 314041, "epoch": 2595} {"train_loss": -44.8209228515625, "global_step": 314042, "epoch": 2595} {"train_loss": -43.25434494018555, "global_step": 314043, "epoch": 2595} {"train_loss": -43.581024169921875, "global_step": 314044, "epoch": 2595} {"train_loss": -43.767234802246094, "global_step": 314045, "epoch": 2595} {"train_loss": -44.51511764526367, "global_step": 314046, "epoch": 2595} {"train_loss": -43.62972640991211, "global_step": 314047, "epoch": 2595} {"train_loss": -42.563289642333984, "global_step": 314048, "epoch": 2595} {"train_loss": -43.5736083984375, "global_step": 314049, "epoch": 2595} {"train_loss": -43.60896301269531, "global_step": 314050, "epoch": 2595} {"train_loss": -43.51277542114258, "global_step": 314051, "epoch": 2595} {"train_loss": -42.27775573730469, "global_step": 314052, "epoch": 2595} {"train_loss": -41.5781135559082, "global_step": 314053, "epoch": 2595} {"train_loss": -41.551971435546875, "global_step": 314054, "epoch": 2595} {"train_loss": -43.48357391357422, "global_step": 314055, "epoch": 2595} {"train_loss": -42.30924987792969, "global_step": 314056, "epoch": 2595} {"train_loss": -37.63907241821289, "global_step": 314057, "epoch": 2595} {"train_loss": -36.82715606689453, "global_step": 314058, "epoch": 2595} {"train_loss": -35.14218521118164, "global_step": 314059, "epoch": 2595} {"train_loss": -36.55266189575195, "global_step": 314060, "epoch": 2595} {"train_loss": -37.74317169189453, "global_step": 314061, "epoch": 2595} {"train_loss": -37.13429641723633, "global_step": 314062, "epoch": 2595} {"train_loss": -29.35760498046875, "global_step": 314063, "epoch": 2595} {"train_loss": -39.382667541503906, "global_step": 314064, "epoch": 2595} {"train_loss": -35.2435417175293, "global_step": 314065, "epoch": 2595} {"train_loss": -34.699073791503906, "global_step": 314066, "epoch": 2595} {"train_loss": -40.09882736206055, "global_step": 314067, "epoch": 2595} {"train_loss": -36.6142692565918, "global_step": 314068, "epoch": 2595} {"train_loss": -37.0256233215332, "global_step": 314069, "epoch": 2595} {"train_loss": -39.434757232666016, "global_step": 314070, "epoch": 2595} {"train_loss": -37.23577880859375, "global_step": 314071, "epoch": 2595} {"train_loss": -38.86131286621094, "global_step": 314072, "epoch": 2595} {"train_loss": -38.53876876831055, "global_step": 314073, "epoch": 2595} {"train_loss": -39.7724609375, "global_step": 314074, "epoch": 2595} {"train_loss": -40.483917236328125, "global_step": 314075, "epoch": 2595} {"train_loss": -39.86273193359375, "global_step": 314076, "epoch": 2595} {"train_loss": -40.76424026489258, "global_step": 314077, "epoch": 2595} {"train_loss": -41.29985427856445, "global_step": 314078, "epoch": 2595} {"train_loss": -40.43071746826172, "global_step": 314079, "epoch": 2595} {"train_loss": -41.41569900512695, "global_step": 314080, "epoch": 2595} {"train_loss": -41.146663665771484, "global_step": 314081, "epoch": 2595} {"train_loss": -42.08547592163086, "global_step": 314082, "epoch": 2595} {"train_loss": -41.415531158447266, "global_step": 314083, "epoch": 2595} {"train_loss": -41.827362060546875, "global_step": 314084, "epoch": 2595} {"train_loss": -42.21813201904297, "global_step": 314085, "epoch": 2595} {"train_loss": -41.88520812988281, "global_step": 314086, "epoch": 2595} {"train_loss": -41.89718246459961, "global_step": 314087, "epoch": 2595} {"train_loss": -41.726131439208984, "global_step": 314088, "epoch": 2595} {"train_loss": -42.44197463989258, "global_step": 314089, "epoch": 2595} {"train_loss": -42.33737564086914, "global_step": 314090, "epoch": 2595} {"train_loss": -42.31671142578125, "global_step": 314091, "epoch": 2595} {"train_loss": -42.6712532043457, "global_step": 314092, "epoch": 2595} {"train_loss": -42.38142013549805, "global_step": 314093, "epoch": 2595} {"train_loss": -42.583187103271484, "global_step": 314094, "epoch": 2595} {"train_loss": -42.908687591552734, "global_step": 314095, "epoch": 2595} {"train_loss": -42.761146545410156, "global_step": 314096, "epoch": 2595} {"train_loss": -42.53908157348633, "global_step": 314097, "epoch": 2595} {"train_loss": -43.11652755737305, "global_step": 314098, "epoch": 2595} {"train_loss": -43.56370162963867, "global_step": 314099, "epoch": 2595} {"train_loss": -42.876441955566406, "global_step": 314100, "epoch": 2595} {"train_loss": -43.2862548828125, "global_step": 314101, "epoch": 2595} {"train_loss": -43.28032302856445, "global_step": 314102, "epoch": 2595} {"train_loss": -43.33674621582031, "global_step": 314103, "epoch": 2595} {"train_loss": -43.27761459350586, "global_step": 314104, "epoch": 2595} {"train_loss": -43.61811065673828, "global_step": 314105, "epoch": 2595} {"train_loss": -43.203182220458984, "global_step": 314106, "epoch": 2595} {"train_loss": -43.02511215209961, "global_step": 314107, "epoch": 2595} {"train_loss": -43.35947799682617, "global_step": 314108, "epoch": 2595} {"train_loss": -43.255699157714844, "global_step": 314109, "epoch": 2595} {"train_loss": -43.32100296020508, "global_step": 314110, "epoch": 2595} {"train_loss": -43.64984893798828, "global_step": 314111, "epoch": 2595} {"train_loss": -43.673492431640625, "global_step": 314112, "epoch": 2595} {"train_loss": -43.794071197509766, "global_step": 314113, "epoch": 2595} {"train_loss": -43.43075180053711, "global_step": 314114, "epoch": 2595} {"train_loss": -42.421442552046344, "global_step": 314115, "epoch": 2595, "val_loss": 2755268.0} {"train_loss": -43.84159469604492, "global_step": 314116, "epoch": 2596} {"train_loss": -43.83716583251953, "global_step": 314117, "epoch": 2596} {"train_loss": -43.81307601928711, "global_step": 314118, "epoch": 2596} {"train_loss": -43.97127914428711, "global_step": 314119, "epoch": 2596} {"train_loss": -44.195220947265625, "global_step": 314120, "epoch": 2596} {"train_loss": -44.102481842041016, "global_step": 314121, "epoch": 2596} {"train_loss": -44.1407470703125, "global_step": 314122, "epoch": 2596} {"train_loss": -43.866512298583984, "global_step": 314123, "epoch": 2596} {"train_loss": -44.388736724853516, "global_step": 314124, "epoch": 2596} {"train_loss": -44.181846618652344, "global_step": 314125, "epoch": 2596} {"train_loss": -44.35939407348633, "global_step": 314126, "epoch": 2596} {"train_loss": -43.55780792236328, "global_step": 314127, "epoch": 2596} {"train_loss": -44.461734771728516, "global_step": 314128, "epoch": 2596} {"train_loss": -44.34551239013672, "global_step": 314129, "epoch": 2596} {"train_loss": -44.131683349609375, "global_step": 314130, "epoch": 2596} {"train_loss": -44.409019470214844, "global_step": 314131, "epoch": 2596} {"train_loss": -44.247135162353516, "global_step": 314132, "epoch": 2596} {"train_loss": -44.656105041503906, "global_step": 314133, "epoch": 2596} {"train_loss": -44.129852294921875, "global_step": 314134, "epoch": 2596} {"train_loss": -44.822425842285156, "global_step": 314135, "epoch": 2596} {"train_loss": -43.91514205932617, "global_step": 314136, "epoch": 2596} {"train_loss": -44.21540069580078, "global_step": 314137, "epoch": 2596} {"train_loss": -44.339439392089844, "global_step": 314138, "epoch": 2596} {"train_loss": -44.404022216796875, "global_step": 314139, "epoch": 2596} {"train_loss": -44.65937423706055, "global_step": 314140, "epoch": 2596} {"train_loss": -44.56357955932617, "global_step": 314141, "epoch": 2596} {"train_loss": -44.45884323120117, "global_step": 314142, "epoch": 2596} {"train_loss": -42.99447250366211, "global_step": 314143, "epoch": 2596} {"train_loss": -44.7815055847168, "global_step": 314144, "epoch": 2596} {"train_loss": -44.48604965209961, "global_step": 314145, "epoch": 2596} {"train_loss": -44.796627044677734, "global_step": 314146, "epoch": 2596} {"train_loss": -44.7838020324707, "global_step": 314147, "epoch": 2596} {"train_loss": -44.03462219238281, "global_step": 314148, "epoch": 2596} {"train_loss": -44.89535140991211, "global_step": 314149, "epoch": 2596} {"train_loss": -44.541988372802734, "global_step": 314150, "epoch": 2596} {"train_loss": -44.756587982177734, "global_step": 314151, "epoch": 2596} {"train_loss": -44.600189208984375, "global_step": 314152, "epoch": 2596} {"train_loss": -44.215694427490234, "global_step": 314153, "epoch": 2596} {"train_loss": -44.96936798095703, "global_step": 314154, "epoch": 2596} {"train_loss": -44.9228630065918, "global_step": 314155, "epoch": 2596} {"train_loss": -44.64570999145508, "global_step": 314156, "epoch": 2596} {"train_loss": -44.48907470703125, "global_step": 314157, "epoch": 2596} {"train_loss": -44.64652633666992, "global_step": 314158, "epoch": 2596} {"train_loss": -44.648006439208984, "global_step": 314159, "epoch": 2596} {"train_loss": -44.90853500366211, "global_step": 314160, "epoch": 2596} {"train_loss": -44.546329498291016, "global_step": 314161, "epoch": 2596} {"train_loss": -44.901947021484375, "global_step": 314162, "epoch": 2596} {"train_loss": -44.41313171386719, "global_step": 314163, "epoch": 2596} {"train_loss": -44.9051513671875, "global_step": 314164, "epoch": 2596} {"train_loss": -44.96917724609375, "global_step": 314165, "epoch": 2596} {"train_loss": -44.915653228759766, "global_step": 314166, "epoch": 2596} {"train_loss": -44.63960647583008, "global_step": 314167, "epoch": 2596} {"train_loss": -44.81867599487305, "global_step": 314168, "epoch": 2596} {"train_loss": -43.94020462036133, "global_step": 314169, "epoch": 2596} {"train_loss": -45.11953353881836, "global_step": 314170, "epoch": 2596} {"train_loss": -44.83476638793945, "global_step": 314171, "epoch": 2596} {"train_loss": -44.51963424682617, "global_step": 314172, "epoch": 2596} {"train_loss": -45.09916305541992, "global_step": 314173, "epoch": 2596} {"train_loss": -44.72125244140625, "global_step": 314174, "epoch": 2596} {"train_loss": -44.8646125793457, "global_step": 314175, "epoch": 2596} {"train_loss": -44.60543441772461, "global_step": 314176, "epoch": 2596} {"train_loss": -44.542884826660156, "global_step": 314177, "epoch": 2596} {"train_loss": -45.02405548095703, "global_step": 314178, "epoch": 2596} {"train_loss": -45.14040756225586, "global_step": 314179, "epoch": 2596} {"train_loss": -44.35453414916992, "global_step": 314180, "epoch": 2596} {"train_loss": -45.14752197265625, "global_step": 314181, "epoch": 2596} {"train_loss": -44.16994857788086, "global_step": 314182, "epoch": 2596} {"train_loss": -43.0057373046875, "global_step": 314183, "epoch": 2596} {"train_loss": -43.372901916503906, "global_step": 314184, "epoch": 2596} {"train_loss": -40.39934158325195, "global_step": 314185, "epoch": 2596} {"train_loss": -34.25267028808594, "global_step": 314186, "epoch": 2596} {"train_loss": -40.26462936401367, "global_step": 314187, "epoch": 2596} {"train_loss": -43.52474594116211, "global_step": 314188, "epoch": 2596} {"train_loss": -39.56194305419922, "global_step": 314189, "epoch": 2596} {"train_loss": -34.08005905151367, "global_step": 314190, "epoch": 2596} {"train_loss": -38.3792724609375, "global_step": 314191, "epoch": 2596} {"train_loss": -41.3268928527832, "global_step": 314192, "epoch": 2596} {"train_loss": -43.274776458740234, "global_step": 314193, "epoch": 2596} {"train_loss": -42.25057601928711, "global_step": 314194, "epoch": 2596} {"train_loss": -41.37017059326172, "global_step": 314195, "epoch": 2596} {"train_loss": -42.279335021972656, "global_step": 314196, "epoch": 2596} {"train_loss": -43.048667907714844, "global_step": 314197, "epoch": 2596} {"train_loss": -43.220436096191406, "global_step": 314198, "epoch": 2596} {"train_loss": -43.5827751159668, "global_step": 314199, "epoch": 2596} {"train_loss": -42.9310188293457, "global_step": 314200, "epoch": 2596} {"train_loss": -43.456092834472656, "global_step": 314201, "epoch": 2596} {"train_loss": -43.6471061706543, "global_step": 314202, "epoch": 2596} {"train_loss": -43.76933670043945, "global_step": 314203, "epoch": 2596} {"train_loss": -43.346473693847656, "global_step": 314204, "epoch": 2596} {"train_loss": -41.91758346557617, "global_step": 314205, "epoch": 2596} {"train_loss": -43.11115646362305, "global_step": 314206, "epoch": 2596} {"train_loss": -43.09733200073242, "global_step": 314207, "epoch": 2596} {"train_loss": -43.54652786254883, "global_step": 314208, "epoch": 2596} {"train_loss": -43.16555404663086, "global_step": 314209, "epoch": 2596} {"train_loss": -42.80847930908203, "global_step": 314210, "epoch": 2596} {"train_loss": -43.1912727355957, "global_step": 314211, "epoch": 2596} {"train_loss": -43.38296890258789, "global_step": 314212, "epoch": 2596} {"train_loss": -43.70576477050781, "global_step": 314213, "epoch": 2596} {"train_loss": -43.55680847167969, "global_step": 314214, "epoch": 2596} {"train_loss": -44.08687973022461, "global_step": 314215, "epoch": 2596} {"train_loss": -43.0301628112793, "global_step": 314216, "epoch": 2596} {"train_loss": -43.12971878051758, "global_step": 314217, "epoch": 2596} {"train_loss": -43.35462188720703, "global_step": 314218, "epoch": 2596} {"train_loss": -42.70658493041992, "global_step": 314219, "epoch": 2596} {"train_loss": -42.66378402709961, "global_step": 314220, "epoch": 2596} {"train_loss": -43.62330627441406, "global_step": 314221, "epoch": 2596} {"train_loss": -43.1875, "global_step": 314222, "epoch": 2596} {"train_loss": -41.75582504272461, "global_step": 314223, "epoch": 2596} {"train_loss": -42.61745071411133, "global_step": 314224, "epoch": 2596} {"train_loss": -43.177127838134766, "global_step": 314225, "epoch": 2596} {"train_loss": -42.4727783203125, "global_step": 314226, "epoch": 2596} {"train_loss": -43.05460739135742, "global_step": 314227, "epoch": 2596} {"train_loss": -43.8075065612793, "global_step": 314228, "epoch": 2596} {"train_loss": -42.96543502807617, "global_step": 314229, "epoch": 2596} {"train_loss": -41.815460205078125, "global_step": 314230, "epoch": 2596} {"train_loss": -43.923824310302734, "global_step": 314231, "epoch": 2596} {"train_loss": -43.60702133178711, "global_step": 314232, "epoch": 2596} {"train_loss": -43.53916931152344, "global_step": 314233, "epoch": 2596} {"train_loss": -43.56147003173828, "global_step": 314234, "epoch": 2596} {"train_loss": -43.74850082397461, "global_step": 314235, "epoch": 2596} {"train_loss": -43.59516906738281, "global_step": 314236, "epoch": 2596, "val_loss": 2757481.75} {"train_loss": -44.051692962646484, "global_step": 314237, "epoch": 2597} {"train_loss": -43.657100677490234, "global_step": 314238, "epoch": 2597} {"train_loss": -43.71453094482422, "global_step": 314239, "epoch": 2597} {"train_loss": -43.44892883300781, "global_step": 314240, "epoch": 2597} {"train_loss": -42.297725677490234, "global_step": 314241, "epoch": 2597} {"train_loss": -44.195045471191406, "global_step": 314242, "epoch": 2597} {"train_loss": -43.609886169433594, "global_step": 314243, "epoch": 2597} {"train_loss": -43.24208450317383, "global_step": 314244, "epoch": 2597} {"train_loss": -42.79644775390625, "global_step": 314245, "epoch": 2597} {"train_loss": -43.96675491333008, "global_step": 314246, "epoch": 2597} {"train_loss": -43.59029769897461, "global_step": 314247, "epoch": 2597} {"train_loss": -44.3691520690918, "global_step": 314248, "epoch": 2597} {"train_loss": -43.84858322143555, "global_step": 314249, "epoch": 2597} {"train_loss": -43.93789291381836, "global_step": 314250, "epoch": 2597} {"train_loss": -44.45339584350586, "global_step": 314251, "epoch": 2597} {"train_loss": -43.58540725708008, "global_step": 314252, "epoch": 2597} {"train_loss": -43.571903228759766, "global_step": 314253, "epoch": 2597} {"train_loss": -44.223819732666016, "global_step": 314254, "epoch": 2597} {"train_loss": -42.22698974609375, "global_step": 314255, "epoch": 2597} {"train_loss": -44.31514358520508, "global_step": 314256, "epoch": 2597} {"train_loss": -44.023040771484375, "global_step": 314257, "epoch": 2597} {"train_loss": -44.14006042480469, "global_step": 314258, "epoch": 2597} {"train_loss": -44.20999526977539, "global_step": 314259, "epoch": 2597} {"train_loss": -44.10354995727539, "global_step": 314260, "epoch": 2597} {"train_loss": -44.589820861816406, "global_step": 314261, "epoch": 2597} {"train_loss": -44.37038040161133, "global_step": 314262, "epoch": 2597} {"train_loss": -44.56260299682617, "global_step": 314263, "epoch": 2597} {"train_loss": -41.660919189453125, "global_step": 314264, "epoch": 2597} {"train_loss": -44.58964538574219, "global_step": 314265, "epoch": 2597} {"train_loss": -38.91679763793945, "global_step": 314266, "epoch": 2597} {"train_loss": -44.3205680847168, "global_step": 314267, "epoch": 2597} {"train_loss": -43.601016998291016, "global_step": 314268, "epoch": 2597} {"train_loss": -42.92730712890625, "global_step": 314269, "epoch": 2597} {"train_loss": -43.89775466918945, "global_step": 314270, "epoch": 2597} {"train_loss": -43.42771530151367, "global_step": 314271, "epoch": 2597} {"train_loss": -37.79679870605469, "global_step": 314272, "epoch": 2597} {"train_loss": -43.628108978271484, "global_step": 314273, "epoch": 2597} {"train_loss": -43.85645294189453, "global_step": 314274, "epoch": 2597} {"train_loss": -43.49953079223633, "global_step": 314275, "epoch": 2597} {"train_loss": -43.179439544677734, "global_step": 314276, "epoch": 2597} {"train_loss": -44.09169006347656, "global_step": 314277, "epoch": 2597} {"train_loss": -43.92753982543945, "global_step": 314278, "epoch": 2597} {"train_loss": -43.439231872558594, "global_step": 314279, "epoch": 2597} {"train_loss": -43.680694580078125, "global_step": 314280, "epoch": 2597} {"train_loss": -43.50428009033203, "global_step": 314281, "epoch": 2597} {"train_loss": -42.135169982910156, "global_step": 314282, "epoch": 2597} {"train_loss": -41.37606430053711, "global_step": 314283, "epoch": 2597} {"train_loss": -43.74447250366211, "global_step": 314284, "epoch": 2597} {"train_loss": -43.60207748413086, "global_step": 314285, "epoch": 2597} {"train_loss": -40.45515823364258, "global_step": 314286, "epoch": 2597} {"train_loss": -40.16548156738281, "global_step": 314287, "epoch": 2597} {"train_loss": -42.95504379272461, "global_step": 314288, "epoch": 2597} {"train_loss": -40.32280349731445, "global_step": 314289, "epoch": 2597} {"train_loss": -44.2564811706543, "global_step": 314290, "epoch": 2597} {"train_loss": -43.58768844604492, "global_step": 314291, "epoch": 2597} {"train_loss": -36.62184524536133, "global_step": 314292, "epoch": 2597} {"train_loss": -42.41448974609375, "global_step": 314293, "epoch": 2597} {"train_loss": -40.723148345947266, "global_step": 314294, "epoch": 2597} {"train_loss": -41.857975006103516, "global_step": 314295, "epoch": 2597} {"train_loss": -42.004127502441406, "global_step": 314296, "epoch": 2597} {"train_loss": -43.285972595214844, "global_step": 314297, "epoch": 2597} {"train_loss": -42.70907211303711, "global_step": 314298, "epoch": 2597} {"train_loss": -38.795475006103516, "global_step": 314299, "epoch": 2597} {"train_loss": -39.835670471191406, "global_step": 314300, "epoch": 2597} {"train_loss": -40.832462310791016, "global_step": 314301, "epoch": 2597} {"train_loss": -42.9038200378418, "global_step": 314302, "epoch": 2597} {"train_loss": -37.90614700317383, "global_step": 314303, "epoch": 2597} {"train_loss": -43.215999603271484, "global_step": 314304, "epoch": 2597} {"train_loss": -42.585716247558594, "global_step": 314305, "epoch": 2597} {"train_loss": -42.76902389526367, "global_step": 314306, "epoch": 2597} {"train_loss": -42.77218246459961, "global_step": 314307, "epoch": 2597} {"train_loss": -42.15119934082031, "global_step": 314308, "epoch": 2597} {"train_loss": -40.287261962890625, "global_step": 314309, "epoch": 2597} {"train_loss": -42.58663558959961, "global_step": 314310, "epoch": 2597} {"train_loss": -41.703548431396484, "global_step": 314311, "epoch": 2597} {"train_loss": -43.43986892700195, "global_step": 314312, "epoch": 2597} {"train_loss": -40.850250244140625, "global_step": 314313, "epoch": 2597} {"train_loss": -43.446319580078125, "global_step": 314314, "epoch": 2597} {"train_loss": -41.78901290893555, "global_step": 314315, "epoch": 2597} {"train_loss": -42.92143630981445, "global_step": 314316, "epoch": 2597} {"train_loss": -43.219886779785156, "global_step": 314317, "epoch": 2597} {"train_loss": -41.304229736328125, "global_step": 314318, "epoch": 2597} {"train_loss": -43.49281692504883, "global_step": 314319, "epoch": 2597} {"train_loss": -42.64885330200195, "global_step": 314320, "epoch": 2597} {"train_loss": -41.937042236328125, "global_step": 314321, "epoch": 2597} {"train_loss": -41.066650390625, "global_step": 314322, "epoch": 2597} {"train_loss": -43.7978401184082, "global_step": 314323, "epoch": 2597} {"train_loss": -43.97506332397461, "global_step": 314324, "epoch": 2597} {"train_loss": -43.29433822631836, "global_step": 314325, "epoch": 2597} {"train_loss": -42.99528121948242, "global_step": 314326, "epoch": 2597} {"train_loss": -44.41474533081055, "global_step": 314327, "epoch": 2597} {"train_loss": -42.86561965942383, "global_step": 314328, "epoch": 2597} {"train_loss": -44.091529846191406, "global_step": 314329, "epoch": 2597} {"train_loss": -40.450069427490234, "global_step": 314330, "epoch": 2597} {"train_loss": -40.16086196899414, "global_step": 314331, "epoch": 2597} {"train_loss": -43.61723709106445, "global_step": 314332, "epoch": 2597} {"train_loss": -43.6141357421875, "global_step": 314333, "epoch": 2597} {"train_loss": -42.90911865234375, "global_step": 314334, "epoch": 2597} {"train_loss": -43.714717864990234, "global_step": 314335, "epoch": 2597} {"train_loss": -42.79256057739258, "global_step": 314336, "epoch": 2597} {"train_loss": -43.92277526855469, "global_step": 314337, "epoch": 2597} {"train_loss": -43.84783172607422, "global_step": 314338, "epoch": 2597} {"train_loss": -41.808040618896484, "global_step": 314339, "epoch": 2597} {"train_loss": -42.37870407104492, "global_step": 314340, "epoch": 2597} {"train_loss": -42.367706298828125, "global_step": 314341, "epoch": 2597} {"train_loss": -43.57780456542969, "global_step": 314342, "epoch": 2597} {"train_loss": -42.82136154174805, "global_step": 314343, "epoch": 2597} {"train_loss": -43.67483901977539, "global_step": 314344, "epoch": 2597} {"train_loss": -43.40251922607422, "global_step": 314345, "epoch": 2597} {"train_loss": -42.207313537597656, "global_step": 314346, "epoch": 2597} {"train_loss": -43.058589935302734, "global_step": 314347, "epoch": 2597} {"train_loss": -42.42768478393555, "global_step": 314348, "epoch": 2597} {"train_loss": -42.75223922729492, "global_step": 314349, "epoch": 2597} {"train_loss": -41.023719787597656, "global_step": 314350, "epoch": 2597} {"train_loss": -43.5859489440918, "global_step": 314351, "epoch": 2597} {"train_loss": -43.08948516845703, "global_step": 314352, "epoch": 2597} {"train_loss": -43.36823272705078, "global_step": 314353, "epoch": 2597} {"train_loss": -42.53611373901367, "global_step": 314354, "epoch": 2597} {"train_loss": -43.54116439819336, "global_step": 314355, "epoch": 2597} {"train_loss": -41.65131759643555, "global_step": 314356, "epoch": 2597} {"train_loss": -42.7909312287638, "global_step": 314357, "epoch": 2597, "val_loss": 2747069.0} {"train_loss": -42.55179214477539, "global_step": 314358, "epoch": 2598} {"train_loss": -43.63148880004883, "global_step": 314359, "epoch": 2598} {"train_loss": -40.49285888671875, "global_step": 314360, "epoch": 2598} {"train_loss": -43.53999328613281, "global_step": 314361, "epoch": 2598} {"train_loss": -43.25359344482422, "global_step": 314362, "epoch": 2598} {"train_loss": -43.66764450073242, "global_step": 314363, "epoch": 2598} {"train_loss": -43.34120559692383, "global_step": 314364, "epoch": 2598} {"train_loss": -42.84697723388672, "global_step": 314365, "epoch": 2598} {"train_loss": -43.973655700683594, "global_step": 314366, "epoch": 2598} {"train_loss": -42.78791427612305, "global_step": 314367, "epoch": 2598} {"train_loss": -43.65376281738281, "global_step": 314368, "epoch": 2598} {"train_loss": -42.95481491088867, "global_step": 314369, "epoch": 2598} {"train_loss": -43.427574157714844, "global_step": 314370, "epoch": 2598} {"train_loss": -43.08070755004883, "global_step": 314371, "epoch": 2598} {"train_loss": -42.8770637512207, "global_step": 314372, "epoch": 2598} {"train_loss": -43.473541259765625, "global_step": 314373, "epoch": 2598} {"train_loss": -43.733455657958984, "global_step": 314374, "epoch": 2598} {"train_loss": -42.9674072265625, "global_step": 314375, "epoch": 2598} {"train_loss": -43.61383056640625, "global_step": 314376, "epoch": 2598} {"train_loss": -43.55253982543945, "global_step": 314377, "epoch": 2598} {"train_loss": -43.7003059387207, "global_step": 314378, "epoch": 2598} {"train_loss": -43.427825927734375, "global_step": 314379, "epoch": 2598} {"train_loss": -43.99138641357422, "global_step": 314380, "epoch": 2598} {"train_loss": -43.42900848388672, "global_step": 314381, "epoch": 2598} {"train_loss": -44.18394470214844, "global_step": 314382, "epoch": 2598} {"train_loss": -44.47508239746094, "global_step": 314383, "epoch": 2598} {"train_loss": -44.0083122253418, "global_step": 314384, "epoch": 2598} {"train_loss": -44.264244079589844, "global_step": 314385, "epoch": 2598} {"train_loss": -43.629722595214844, "global_step": 314386, "epoch": 2598} {"train_loss": -44.54464340209961, "global_step": 314387, "epoch": 2598} {"train_loss": -44.3922004699707, "global_step": 314388, "epoch": 2598} {"train_loss": -43.98101806640625, "global_step": 314389, "epoch": 2598} {"train_loss": -44.41769790649414, "global_step": 314390, "epoch": 2598} {"train_loss": -44.81261444091797, "global_step": 314391, "epoch": 2598} {"train_loss": -44.40701675415039, "global_step": 314392, "epoch": 2598} {"train_loss": -44.88787841796875, "global_step": 314393, "epoch": 2598} {"train_loss": -44.51832962036133, "global_step": 314394, "epoch": 2598} {"train_loss": -44.534297943115234, "global_step": 314395, "epoch": 2598} {"train_loss": -44.68479537963867, "global_step": 314396, "epoch": 2598} {"train_loss": -44.25640106201172, "global_step": 314397, "epoch": 2598} {"train_loss": -44.14646530151367, "global_step": 314398, "epoch": 2598} {"train_loss": -43.917903900146484, "global_step": 314399, "epoch": 2598} {"train_loss": -44.06223678588867, "global_step": 314400, "epoch": 2598} {"train_loss": -42.79553985595703, "global_step": 314401, "epoch": 2598} {"train_loss": -44.113441467285156, "global_step": 314402, "epoch": 2598} {"train_loss": -44.06015396118164, "global_step": 314403, "epoch": 2598} {"train_loss": -43.992591857910156, "global_step": 314404, "epoch": 2598} {"train_loss": -43.635982513427734, "global_step": 314405, "epoch": 2598} {"train_loss": -43.745758056640625, "global_step": 314406, "epoch": 2598} {"train_loss": -42.285614013671875, "global_step": 314407, "epoch": 2598} {"train_loss": -43.04863739013672, "global_step": 314408, "epoch": 2598} {"train_loss": -43.36508560180664, "global_step": 314409, "epoch": 2598} {"train_loss": -43.89750289916992, "global_step": 314410, "epoch": 2598} {"train_loss": -42.07334518432617, "global_step": 314411, "epoch": 2598} {"train_loss": -42.57754135131836, "global_step": 314412, "epoch": 2598} {"train_loss": -43.04975509643555, "global_step": 314413, "epoch": 2598} {"train_loss": -40.82413101196289, "global_step": 314414, "epoch": 2598} {"train_loss": -41.653438568115234, "global_step": 314415, "epoch": 2598} {"train_loss": -43.649288177490234, "global_step": 314416, "epoch": 2598} {"train_loss": -43.75071334838867, "global_step": 314417, "epoch": 2598} {"train_loss": -35.9839973449707, "global_step": 314418, "epoch": 2598} {"train_loss": -38.98784255981445, "global_step": 314419, "epoch": 2598} {"train_loss": -43.35880661010742, "global_step": 314420, "epoch": 2598} {"train_loss": -44.06587600708008, "global_step": 314421, "epoch": 2598} {"train_loss": -42.96855545043945, "global_step": 314422, "epoch": 2598} {"train_loss": -39.844276428222656, "global_step": 314423, "epoch": 2598} {"train_loss": -41.489044189453125, "global_step": 314424, "epoch": 2598} {"train_loss": -42.99226760864258, "global_step": 314425, "epoch": 2598} {"train_loss": -42.22018051147461, "global_step": 314426, "epoch": 2598} {"train_loss": -40.472774505615234, "global_step": 314427, "epoch": 2598} {"train_loss": -42.5557746887207, "global_step": 314428, "epoch": 2598} {"train_loss": -40.40916061401367, "global_step": 314429, "epoch": 2598} {"train_loss": -39.38987350463867, "global_step": 314430, "epoch": 2598} {"train_loss": -42.22014617919922, "global_step": 314431, "epoch": 2598} {"train_loss": -43.15757369995117, "global_step": 314432, "epoch": 2598} {"train_loss": -41.43513107299805, "global_step": 314433, "epoch": 2598} {"train_loss": -42.71276092529297, "global_step": 314434, "epoch": 2598} {"train_loss": -39.776756286621094, "global_step": 314435, "epoch": 2598} {"train_loss": -40.52983474731445, "global_step": 314436, "epoch": 2598} {"train_loss": -42.12425231933594, "global_step": 314437, "epoch": 2598} {"train_loss": -42.08835983276367, "global_step": 314438, "epoch": 2598} {"train_loss": -42.256343841552734, "global_step": 314439, "epoch": 2598} {"train_loss": -43.4529914855957, "global_step": 314440, "epoch": 2598} {"train_loss": -41.17311477661133, "global_step": 314441, "epoch": 2598} {"train_loss": -42.995662689208984, "global_step": 314442, "epoch": 2598} {"train_loss": -41.6220817565918, "global_step": 314443, "epoch": 2598} {"train_loss": -42.548072814941406, "global_step": 314444, "epoch": 2598} {"train_loss": -43.11418151855469, "global_step": 314445, "epoch": 2598} {"train_loss": -41.230560302734375, "global_step": 314446, "epoch": 2598} {"train_loss": -42.877681732177734, "global_step": 314447, "epoch": 2598} {"train_loss": -43.19404220581055, "global_step": 314448, "epoch": 2598} {"train_loss": -42.08913803100586, "global_step": 314449, "epoch": 2598} {"train_loss": -42.8531608581543, "global_step": 314450, "epoch": 2598} {"train_loss": -43.175689697265625, "global_step": 314451, "epoch": 2598} {"train_loss": -41.611637115478516, "global_step": 314452, "epoch": 2598} {"train_loss": -43.13310623168945, "global_step": 314453, "epoch": 2598} {"train_loss": -43.29812240600586, "global_step": 314454, "epoch": 2598} {"train_loss": -43.01978302001953, "global_step": 314455, "epoch": 2598} {"train_loss": -41.70552444458008, "global_step": 314456, "epoch": 2598} {"train_loss": -42.90069580078125, "global_step": 314457, "epoch": 2598} {"train_loss": -42.7798957824707, "global_step": 314458, "epoch": 2598} {"train_loss": -41.35346221923828, "global_step": 314459, "epoch": 2598} {"train_loss": -43.15180206298828, "global_step": 314460, "epoch": 2598} {"train_loss": -43.14238357543945, "global_step": 314461, "epoch": 2598} {"train_loss": -43.25959777832031, "global_step": 314462, "epoch": 2598} {"train_loss": -43.402565002441406, "global_step": 314463, "epoch": 2598} {"train_loss": -43.23661422729492, "global_step": 314464, "epoch": 2598} {"train_loss": -42.83921432495117, "global_step": 314465, "epoch": 2598} {"train_loss": -42.80051803588867, "global_step": 314466, "epoch": 2598} {"train_loss": -43.04372024536133, "global_step": 314467, "epoch": 2598} {"train_loss": -43.42972946166992, "global_step": 314468, "epoch": 2598} {"train_loss": -43.17132568359375, "global_step": 314469, "epoch": 2598} {"train_loss": -43.86708068847656, "global_step": 314470, "epoch": 2598} {"train_loss": -41.45536804199219, "global_step": 314471, "epoch": 2598} {"train_loss": -43.06340408325195, "global_step": 314472, "epoch": 2598} {"train_loss": -43.64089584350586, "global_step": 314473, "epoch": 2598} {"train_loss": -41.20380401611328, "global_step": 314474, "epoch": 2598} {"train_loss": -42.88506317138672, "global_step": 314475, "epoch": 2598} {"train_loss": -43.56847381591797, "global_step": 314476, "epoch": 2598} {"train_loss": -42.304100036621094, "global_step": 314477, "epoch": 2598} {"train_loss": -42.88865570194465, "global_step": 314478, "epoch": 2598, "val_loss": 2776253.75} {"train_loss": -42.57750701904297, "global_step": 314479, "epoch": 2599} {"train_loss": -40.961238861083984, "global_step": 314480, "epoch": 2599} {"train_loss": -41.84807205200195, "global_step": 314481, "epoch": 2599} {"train_loss": -42.26909255981445, "global_step": 314482, "epoch": 2599} {"train_loss": -43.12960433959961, "global_step": 314483, "epoch": 2599} {"train_loss": -43.07159423828125, "global_step": 314484, "epoch": 2599} {"train_loss": -42.135475158691406, "global_step": 314485, "epoch": 2599} {"train_loss": -43.849430084228516, "global_step": 314486, "epoch": 2599} {"train_loss": -42.42515182495117, "global_step": 314487, "epoch": 2599} {"train_loss": -41.8483772277832, "global_step": 314488, "epoch": 2599} {"train_loss": -42.5794792175293, "global_step": 314489, "epoch": 2599} {"train_loss": -43.35488510131836, "global_step": 314490, "epoch": 2599} {"train_loss": -43.027889251708984, "global_step": 314491, "epoch": 2599} {"train_loss": -42.52737045288086, "global_step": 314492, "epoch": 2599} {"train_loss": -43.464900970458984, "global_step": 314493, "epoch": 2599} {"train_loss": -42.67299270629883, "global_step": 314494, "epoch": 2599} {"train_loss": -43.4858512878418, "global_step": 314495, "epoch": 2599} {"train_loss": -43.06550216674805, "global_step": 314496, "epoch": 2599} {"train_loss": -43.65835189819336, "global_step": 314497, "epoch": 2599} {"train_loss": -43.45545196533203, "global_step": 314498, "epoch": 2599} {"train_loss": -43.794673919677734, "global_step": 314499, "epoch": 2599} {"train_loss": -42.88222122192383, "global_step": 314500, "epoch": 2599} {"train_loss": -42.76081085205078, "global_step": 314501, "epoch": 2599} {"train_loss": -43.44211959838867, "global_step": 314502, "epoch": 2599} {"train_loss": -42.404911041259766, "global_step": 314503, "epoch": 2599} {"train_loss": -43.39554977416992, "global_step": 314504, "epoch": 2599} {"train_loss": -43.46285629272461, "global_step": 314505, "epoch": 2599} {"train_loss": -42.1186637878418, "global_step": 314506, "epoch": 2599} {"train_loss": -43.22599411010742, "global_step": 314507, "epoch": 2599} {"train_loss": -43.954864501953125, "global_step": 314508, "epoch": 2599} {"train_loss": -42.76549530029297, "global_step": 314509, "epoch": 2599} {"train_loss": -43.46842575073242, "global_step": 314510, "epoch": 2599} {"train_loss": -43.939491271972656, "global_step": 314511, "epoch": 2599} {"train_loss": -43.06328201293945, "global_step": 314512, "epoch": 2599} {"train_loss": -43.282814025878906, "global_step": 314513, "epoch": 2599} {"train_loss": -43.30195999145508, "global_step": 314514, "epoch": 2599} {"train_loss": -41.5655517578125, "global_step": 314515, "epoch": 2599} {"train_loss": -43.4206428527832, "global_step": 314516, "epoch": 2599} {"train_loss": -43.87820053100586, "global_step": 314517, "epoch": 2599} {"train_loss": -42.70458984375, "global_step": 314518, "epoch": 2599} {"train_loss": -43.13014602661133, "global_step": 314519, "epoch": 2599} {"train_loss": -41.10578918457031, "global_step": 314520, "epoch": 2599} {"train_loss": -43.263153076171875, "global_step": 314521, "epoch": 2599} {"train_loss": -41.39963912963867, "global_step": 314522, "epoch": 2599} {"train_loss": -43.012611389160156, "global_step": 314523, "epoch": 2599} {"train_loss": -42.52085876464844, "global_step": 314524, "epoch": 2599} {"train_loss": -42.85670471191406, "global_step": 314525, "epoch": 2599} {"train_loss": -42.40357208251953, "global_step": 314526, "epoch": 2599} {"train_loss": -41.12934875488281, "global_step": 314527, "epoch": 2599} {"train_loss": -40.09210205078125, "global_step": 314528, "epoch": 2599} {"train_loss": -41.17658615112305, "global_step": 314529, "epoch": 2599} {"train_loss": -42.328731536865234, "global_step": 314530, "epoch": 2599} {"train_loss": -43.31101608276367, "global_step": 314531, "epoch": 2599} {"train_loss": -40.09192657470703, "global_step": 314532, "epoch": 2599} {"train_loss": -41.907958984375, "global_step": 314533, "epoch": 2599} {"train_loss": -43.25069808959961, "global_step": 314534, "epoch": 2599} {"train_loss": -38.203731536865234, "global_step": 314535, "epoch": 2599} {"train_loss": -40.386962890625, "global_step": 314536, "epoch": 2599} {"train_loss": -42.67463302612305, "global_step": 314537, "epoch": 2599} {"train_loss": -39.38375473022461, "global_step": 314538, "epoch": 2599} {"train_loss": -42.59478759765625, "global_step": 314539, "epoch": 2599} {"train_loss": -40.984771728515625, "global_step": 314540, "epoch": 2599} {"train_loss": -40.42865753173828, "global_step": 314541, "epoch": 2599} {"train_loss": -42.12251663208008, "global_step": 314542, "epoch": 2599} {"train_loss": -37.633853912353516, "global_step": 314543, "epoch": 2599} {"train_loss": -41.947669982910156, "global_step": 314544, "epoch": 2599} {"train_loss": -37.174354553222656, "global_step": 314545, "epoch": 2599} {"train_loss": -39.07419967651367, "global_step": 314546, "epoch": 2599} {"train_loss": -40.73533248901367, "global_step": 314547, "epoch": 2599} {"train_loss": -37.77206802368164, "global_step": 314548, "epoch": 2599} {"train_loss": -40.9095458984375, "global_step": 314549, "epoch": 2599} {"train_loss": -40.109779357910156, "global_step": 314550, "epoch": 2599} {"train_loss": -41.61294937133789, "global_step": 314551, "epoch": 2599} {"train_loss": -38.76703643798828, "global_step": 314552, "epoch": 2599} {"train_loss": -40.955657958984375, "global_step": 314553, "epoch": 2599} {"train_loss": -39.8111686706543, "global_step": 314554, "epoch": 2599} {"train_loss": -41.98371505737305, "global_step": 314555, "epoch": 2599} {"train_loss": -40.750240325927734, "global_step": 314556, "epoch": 2599} {"train_loss": -41.063838958740234, "global_step": 314557, "epoch": 2599} {"train_loss": -39.83123779296875, "global_step": 314558, "epoch": 2599} {"train_loss": -41.713531494140625, "global_step": 314559, "epoch": 2599} {"train_loss": -42.386653900146484, "global_step": 314560, "epoch": 2599} {"train_loss": -40.73859405517578, "global_step": 314561, "epoch": 2599} {"train_loss": -39.37324142456055, "global_step": 314562, "epoch": 2599} {"train_loss": -39.87977981567383, "global_step": 314563, "epoch": 2599} {"train_loss": -41.2775993347168, "global_step": 314564, "epoch": 2599} {"train_loss": -40.48505401611328, "global_step": 314565, "epoch": 2599} {"train_loss": -40.070167541503906, "global_step": 314566, "epoch": 2599} {"train_loss": -41.21997833251953, "global_step": 314567, "epoch": 2599} {"train_loss": -39.231178283691406, "global_step": 314568, "epoch": 2599} {"train_loss": -41.74115753173828, "global_step": 314569, "epoch": 2599} {"train_loss": -41.48594665527344, "global_step": 314570, "epoch": 2599} {"train_loss": -41.72280502319336, "global_step": 314571, "epoch": 2599} {"train_loss": -41.66487503051758, "global_step": 314572, "epoch": 2599} {"train_loss": -40.847896575927734, "global_step": 314573, "epoch": 2599} {"train_loss": -41.69328689575195, "global_step": 314574, "epoch": 2599} {"train_loss": -42.84395217895508, "global_step": 314575, "epoch": 2599} {"train_loss": -35.95081329345703, "global_step": 314576, "epoch": 2599} {"train_loss": -39.54544448852539, "global_step": 314577, "epoch": 2599} {"train_loss": -42.37251663208008, "global_step": 314578, "epoch": 2599} {"train_loss": -40.27082443237305, "global_step": 314579, "epoch": 2599} {"train_loss": -40.7878532409668, "global_step": 314580, "epoch": 2599} {"train_loss": -40.578125, "global_step": 314581, "epoch": 2599} {"train_loss": -41.182044982910156, "global_step": 314582, "epoch": 2599} {"train_loss": -41.28474807739258, "global_step": 314583, "epoch": 2599} {"train_loss": -38.241127014160156, "global_step": 314584, "epoch": 2599} {"train_loss": -40.76105499267578, "global_step": 314585, "epoch": 2599} {"train_loss": -41.92676544189453, "global_step": 314586, "epoch": 2599} {"train_loss": -38.02828598022461, "global_step": 314587, "epoch": 2599} {"train_loss": -38.86084747314453, "global_step": 314588, "epoch": 2599} {"train_loss": -41.326141357421875, "global_step": 314589, "epoch": 2599} {"train_loss": -41.59548568725586, "global_step": 314590, "epoch": 2599} {"train_loss": -40.0001220703125, "global_step": 314591, "epoch": 2599} {"train_loss": -40.042938232421875, "global_step": 314592, "epoch": 2599} {"train_loss": -42.4995002746582, "global_step": 314593, "epoch": 2599} {"train_loss": -41.38203811645508, "global_step": 314594, "epoch": 2599} {"train_loss": -41.42433547973633, "global_step": 314595, "epoch": 2599} {"train_loss": -37.68042755126953, "global_step": 314596, "epoch": 2599} {"train_loss": -41.82340621948242, "global_step": 314597, "epoch": 2599} {"train_loss": -40.38225173950195, "global_step": 314598, "epoch": 2599} {"train_loss": -41.52439747960114, "global_step": 314599, "epoch": 2599, "val_loss": 2742469.75} {"train_loss": -39.8831672668457, "global_step": 314600, "epoch": 2600} {"train_loss": -41.72711181640625, "global_step": 314601, "epoch": 2600} {"train_loss": -41.46242904663086, "global_step": 314602, "epoch": 2600} {"train_loss": -39.8912353515625, "global_step": 314603, "epoch": 2600} {"train_loss": -42.63336944580078, "global_step": 314604, "epoch": 2600} {"train_loss": -41.060848236083984, "global_step": 314605, "epoch": 2600} {"train_loss": -41.46504592895508, "global_step": 314606, "epoch": 2600} {"train_loss": -41.49509048461914, "global_step": 314607, "epoch": 2600} {"train_loss": -41.48383712768555, "global_step": 314608, "epoch": 2600} {"train_loss": -41.79645538330078, "global_step": 314609, "epoch": 2600} {"train_loss": -40.64345932006836, "global_step": 314610, "epoch": 2600} {"train_loss": -42.670494079589844, "global_step": 314611, "epoch": 2600} {"train_loss": -42.49216842651367, "global_step": 314612, "epoch": 2600} {"train_loss": -40.666717529296875, "global_step": 314613, "epoch": 2600} {"train_loss": -42.62452697753906, "global_step": 314614, "epoch": 2600} {"train_loss": -42.160518646240234, "global_step": 314615, "epoch": 2600} {"train_loss": -42.247066497802734, "global_step": 314616, "epoch": 2600} {"train_loss": -41.783260345458984, "global_step": 314617, "epoch": 2600} {"train_loss": -40.7391242980957, "global_step": 314618, "epoch": 2600} {"train_loss": -41.475257873535156, "global_step": 314619, "epoch": 2600} {"train_loss": -42.74518966674805, "global_step": 314620, "epoch": 2600} {"train_loss": -42.401283264160156, "global_step": 314621, "epoch": 2600} {"train_loss": -42.792842864990234, "global_step": 314622, "epoch": 2600} {"train_loss": -42.11143112182617, "global_step": 314623, "epoch": 2600} {"train_loss": -42.39051055908203, "global_step": 314624, "epoch": 2600} {"train_loss": -42.87470245361328, "global_step": 314625, "epoch": 2600} {"train_loss": -40.4641227722168, "global_step": 314626, "epoch": 2600} {"train_loss": -41.16592025756836, "global_step": 314627, "epoch": 2600} {"train_loss": -42.85862350463867, "global_step": 314628, "epoch": 2600} {"train_loss": -42.573238372802734, "global_step": 314629, "epoch": 2600} {"train_loss": -41.57257843017578, "global_step": 314630, "epoch": 2600} {"train_loss": -41.971641540527344, "global_step": 314631, "epoch": 2600} {"train_loss": -42.499298095703125, "global_step": 314632, "epoch": 2600} {"train_loss": -41.60273361206055, "global_step": 314633, "epoch": 2600} {"train_loss": -43.1160888671875, "global_step": 314634, "epoch": 2600} {"train_loss": -42.914424896240234, "global_step": 314635, "epoch": 2600} {"train_loss": -39.91921615600586, "global_step": 314636, "epoch": 2600} {"train_loss": -42.82406234741211, "global_step": 314637, "epoch": 2600} {"train_loss": -42.16096878051758, "global_step": 314638, "epoch": 2600} {"train_loss": -42.19075012207031, "global_step": 314639, "epoch": 2600} {"train_loss": -43.5451774597168, "global_step": 314640, "epoch": 2600} {"train_loss": -42.63817596435547, "global_step": 314641, "epoch": 2600} {"train_loss": -43.30483627319336, "global_step": 314642, "epoch": 2600} {"train_loss": -42.60152816772461, "global_step": 314643, "epoch": 2600} {"train_loss": -42.93720245361328, "global_step": 314644, "epoch": 2600} {"train_loss": -43.14290237426758, "global_step": 314645, "epoch": 2600} {"train_loss": -42.564762115478516, "global_step": 314646, "epoch": 2600} {"train_loss": -43.15846633911133, "global_step": 314647, "epoch": 2600} {"train_loss": -43.103755950927734, "global_step": 314648, "epoch": 2600} {"train_loss": -43.3245735168457, "global_step": 314649, "epoch": 2600} {"train_loss": -43.25967025756836, "global_step": 314650, "epoch": 2600} {"train_loss": -43.07227325439453, "global_step": 314651, "epoch": 2600} {"train_loss": -44.07686996459961, "global_step": 314652, "epoch": 2600} {"train_loss": -43.29959487915039, "global_step": 314653, "epoch": 2600} {"train_loss": -43.05164337158203, "global_step": 314654, "epoch": 2600} {"train_loss": -42.41679000854492, "global_step": 314655, "epoch": 2600} {"train_loss": -43.106788635253906, "global_step": 314656, "epoch": 2600} {"train_loss": -43.2871208190918, "global_step": 314657, "epoch": 2600} {"train_loss": -43.38957595825195, "global_step": 314658, "epoch": 2600} {"train_loss": -43.17137145996094, "global_step": 314659, "epoch": 2600} {"train_loss": -42.798500061035156, "global_step": 314660, "epoch": 2600} {"train_loss": -43.76241683959961, "global_step": 314661, "epoch": 2600} {"train_loss": -42.96967315673828, "global_step": 314662, "epoch": 2600} {"train_loss": -43.4630241394043, "global_step": 314663, "epoch": 2600} {"train_loss": -43.420406341552734, "global_step": 314664, "epoch": 2600} {"train_loss": -43.460205078125, "global_step": 314665, "epoch": 2600} {"train_loss": -43.51367950439453, "global_step": 314666, "epoch": 2600} {"train_loss": -43.033084869384766, "global_step": 314667, "epoch": 2600} {"train_loss": -43.762176513671875, "global_step": 314668, "epoch": 2600} {"train_loss": -43.43281936645508, "global_step": 314669, "epoch": 2600} {"train_loss": -43.068363189697266, "global_step": 314670, "epoch": 2600} {"train_loss": -43.58957290649414, "global_step": 314671, "epoch": 2600} {"train_loss": -43.66548538208008, "global_step": 314672, "epoch": 2600} {"train_loss": -43.652137756347656, "global_step": 314673, "epoch": 2600} {"train_loss": -44.3687629699707, "global_step": 314674, "epoch": 2600} {"train_loss": -43.66984176635742, "global_step": 314675, "epoch": 2600} {"train_loss": -44.236629486083984, "global_step": 314676, "epoch": 2600} {"train_loss": -44.007537841796875, "global_step": 314677, "epoch": 2600} {"train_loss": -43.8067741394043, "global_step": 314678, "epoch": 2600} {"train_loss": -43.67771911621094, "global_step": 314679, "epoch": 2600} {"train_loss": -43.263519287109375, "global_step": 314680, "epoch": 2600} {"train_loss": -43.98320770263672, "global_step": 314681, "epoch": 2600} {"train_loss": -43.3530158996582, "global_step": 314682, "epoch": 2600} {"train_loss": -43.30277633666992, "global_step": 314683, "epoch": 2600} {"train_loss": -42.98887634277344, "global_step": 314684, "epoch": 2600} {"train_loss": -43.58848190307617, "global_step": 314685, "epoch": 2600} {"train_loss": -43.27895736694336, "global_step": 314686, "epoch": 2600} {"train_loss": -44.03715133666992, "global_step": 314687, "epoch": 2600} {"train_loss": -43.97649002075195, "global_step": 314688, "epoch": 2600} {"train_loss": -43.79548263549805, "global_step": 314689, "epoch": 2600} {"train_loss": -43.95673751831055, "global_step": 314690, "epoch": 2600} {"train_loss": -44.08353805541992, "global_step": 314691, "epoch": 2600} {"train_loss": -43.271705627441406, "global_step": 314692, "epoch": 2600} {"train_loss": -43.76628494262695, "global_step": 314693, "epoch": 2600} {"train_loss": -42.883888244628906, "global_step": 314694, "epoch": 2600} {"train_loss": -43.87703323364258, "global_step": 314695, "epoch": 2600} {"train_loss": -43.72794723510742, "global_step": 314696, "epoch": 2600} {"train_loss": -43.72455978393555, "global_step": 314697, "epoch": 2600} {"train_loss": -43.89191818237305, "global_step": 314698, "epoch": 2600} {"train_loss": -43.6030158996582, "global_step": 314699, "epoch": 2600} {"train_loss": -42.68950653076172, "global_step": 314700, "epoch": 2600} {"train_loss": -43.49384689331055, "global_step": 314701, "epoch": 2600} {"train_loss": -44.09018325805664, "global_step": 314702, "epoch": 2600} {"train_loss": -43.57792282104492, "global_step": 314703, "epoch": 2600} {"train_loss": -42.30806350708008, "global_step": 314704, "epoch": 2600} {"train_loss": -41.9111328125, "global_step": 314705, "epoch": 2600} {"train_loss": -41.195003509521484, "global_step": 314706, "epoch": 2600} {"train_loss": -41.812068939208984, "global_step": 314707, "epoch": 2600} {"train_loss": -42.54366683959961, "global_step": 314708, "epoch": 2600} {"train_loss": -42.7816047668457, "global_step": 314709, "epoch": 2600} {"train_loss": -43.75388717651367, "global_step": 314710, "epoch": 2600} {"train_loss": -43.1200065612793, "global_step": 314711, "epoch": 2600} {"train_loss": -42.861759185791016, "global_step": 314712, "epoch": 2600} {"train_loss": -41.464229583740234, "global_step": 314713, "epoch": 2600} {"train_loss": -43.31171417236328, "global_step": 314714, "epoch": 2600} {"train_loss": -43.320274353027344, "global_step": 314715, "epoch": 2600} {"train_loss": -43.27574920654297, "global_step": 314716, "epoch": 2600} {"train_loss": -42.25020980834961, "global_step": 314717, "epoch": 2600} {"train_loss": -43.01699447631836, "global_step": 314718, "epoch": 2600} {"train_loss": -43.85184860229492, "global_step": 314719, "epoch": 2600} {"train_loss": -42.803564402682724, "global_step": 314720, "epoch": 2600, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 0.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2681581.5} {"train_loss": -43.26302719116211, "global_step": 314721, "epoch": 2601} {"train_loss": -42.77342224121094, "global_step": 314722, "epoch": 2601} {"train_loss": -42.4107780456543, "global_step": 314723, "epoch": 2601} {"train_loss": -41.8674430847168, "global_step": 314724, "epoch": 2601} {"train_loss": -43.045310974121094, "global_step": 314725, "epoch": 2601} {"train_loss": -42.645145416259766, "global_step": 314726, "epoch": 2601} {"train_loss": -42.019561767578125, "global_step": 314727, "epoch": 2601} {"train_loss": -41.103458404541016, "global_step": 314728, "epoch": 2601} {"train_loss": -42.718536376953125, "global_step": 314729, "epoch": 2601} {"train_loss": -42.701515197753906, "global_step": 314730, "epoch": 2601} {"train_loss": -42.82404327392578, "global_step": 314731, "epoch": 2601} {"train_loss": -42.27729034423828, "global_step": 314732, "epoch": 2601} {"train_loss": -41.73750686645508, "global_step": 314733, "epoch": 2601} {"train_loss": -42.57318115234375, "global_step": 314734, "epoch": 2601} {"train_loss": -42.3343391418457, "global_step": 314735, "epoch": 2601} {"train_loss": -39.98747253417969, "global_step": 314736, "epoch": 2601} {"train_loss": -40.67406463623047, "global_step": 314737, "epoch": 2601} {"train_loss": -42.230098724365234, "global_step": 314738, "epoch": 2601} {"train_loss": -42.181365966796875, "global_step": 314739, "epoch": 2601} {"train_loss": -42.942256927490234, "global_step": 314740, "epoch": 2601} {"train_loss": -41.92202377319336, "global_step": 314741, "epoch": 2601} {"train_loss": -41.893741607666016, "global_step": 314742, "epoch": 2601} {"train_loss": -42.02009201049805, "global_step": 314743, "epoch": 2601} {"train_loss": -42.2234001159668, "global_step": 314744, "epoch": 2601} {"train_loss": -42.3552360534668, "global_step": 314745, "epoch": 2601} {"train_loss": -41.975563049316406, "global_step": 314746, "epoch": 2601} {"train_loss": -42.21745681762695, "global_step": 314747, "epoch": 2601} {"train_loss": -42.94881820678711, "global_step": 314748, "epoch": 2601} {"train_loss": -42.72683334350586, "global_step": 314749, "epoch": 2601} {"train_loss": -43.169185638427734, "global_step": 314750, "epoch": 2601} {"train_loss": -41.77059555053711, "global_step": 314751, "epoch": 2601} {"train_loss": -42.3809928894043, "global_step": 314752, "epoch": 2601} {"train_loss": -42.89892578125, "global_step": 314753, "epoch": 2601} {"train_loss": -42.712257385253906, "global_step": 314754, "epoch": 2601} {"train_loss": -42.87795639038086, "global_step": 314755, "epoch": 2601} {"train_loss": -42.57658004760742, "global_step": 314756, "epoch": 2601} {"train_loss": -42.959407806396484, "global_step": 314757, "epoch": 2601} {"train_loss": -40.5710563659668, "global_step": 314758, "epoch": 2601} {"train_loss": -41.3568229675293, "global_step": 314759, "epoch": 2601} {"train_loss": -42.98946762084961, "global_step": 314760, "epoch": 2601} {"train_loss": -42.59641647338867, "global_step": 314761, "epoch": 2601} {"train_loss": -41.1336669921875, "global_step": 314762, "epoch": 2601} {"train_loss": -35.4091796875, "global_step": 314763, "epoch": 2601} {"train_loss": -40.84211349487305, "global_step": 314764, "epoch": 2601} {"train_loss": -41.542301177978516, "global_step": 314765, "epoch": 2601} {"train_loss": -40.78398513793945, "global_step": 314766, "epoch": 2601} {"train_loss": -42.80062484741211, "global_step": 314767, "epoch": 2601} {"train_loss": -40.2451057434082, "global_step": 314768, "epoch": 2601} {"train_loss": -39.974456787109375, "global_step": 314769, "epoch": 2601} {"train_loss": -40.72428512573242, "global_step": 314770, "epoch": 2601} {"train_loss": -41.8596076965332, "global_step": 314771, "epoch": 2601} {"train_loss": -41.51423263549805, "global_step": 314772, "epoch": 2601} {"train_loss": -42.465763092041016, "global_step": 314773, "epoch": 2601} {"train_loss": -40.577816009521484, "global_step": 314774, "epoch": 2601} {"train_loss": -41.872344970703125, "global_step": 314775, "epoch": 2601} {"train_loss": -42.17548751831055, "global_step": 314776, "epoch": 2601} {"train_loss": -42.3391227722168, "global_step": 314777, "epoch": 2601} {"train_loss": -42.56330108642578, "global_step": 314778, "epoch": 2601} {"train_loss": -43.1400146484375, "global_step": 314779, "epoch": 2601} {"train_loss": -43.01036834716797, "global_step": 314780, "epoch": 2601} {"train_loss": -41.11752700805664, "global_step": 314781, "epoch": 2601} {"train_loss": -41.550838470458984, "global_step": 314782, "epoch": 2601} {"train_loss": -42.908504486083984, "global_step": 314783, "epoch": 2601} {"train_loss": -41.88901901245117, "global_step": 314784, "epoch": 2601} {"train_loss": -43.49214172363281, "global_step": 314785, "epoch": 2601} {"train_loss": -43.24354934692383, "global_step": 314786, "epoch": 2601} {"train_loss": -43.47966766357422, "global_step": 314787, "epoch": 2601} {"train_loss": -43.28937911987305, "global_step": 314788, "epoch": 2601} {"train_loss": -43.79611587524414, "global_step": 314789, "epoch": 2601} {"train_loss": -42.54480743408203, "global_step": 314790, "epoch": 2601} {"train_loss": -43.59154510498047, "global_step": 314791, "epoch": 2601} {"train_loss": -41.64564514160156, "global_step": 314792, "epoch": 2601} {"train_loss": -43.54500198364258, "global_step": 314793, "epoch": 2601} {"train_loss": -43.05071258544922, "global_step": 314794, "epoch": 2601} {"train_loss": -43.62595748901367, "global_step": 314795, "epoch": 2601} {"train_loss": -43.09006881713867, "global_step": 314796, "epoch": 2601} {"train_loss": -43.58989334106445, "global_step": 314797, "epoch": 2601} {"train_loss": -43.26804733276367, "global_step": 314798, "epoch": 2601} {"train_loss": -42.309112548828125, "global_step": 314799, "epoch": 2601} {"train_loss": -43.20298385620117, "global_step": 314800, "epoch": 2601} {"train_loss": -43.89622116088867, "global_step": 314801, "epoch": 2601} {"train_loss": -43.700767517089844, "global_step": 314802, "epoch": 2601} {"train_loss": -43.2021369934082, "global_step": 314803, "epoch": 2601} {"train_loss": -42.74394607543945, "global_step": 314804, "epoch": 2601} {"train_loss": -44.15803909301758, "global_step": 314805, "epoch": 2601} {"train_loss": -43.434078216552734, "global_step": 314806, "epoch": 2601} {"train_loss": -43.628089904785156, "global_step": 314807, "epoch": 2601} {"train_loss": -42.67063522338867, "global_step": 314808, "epoch": 2601} {"train_loss": -42.67250061035156, "global_step": 314809, "epoch": 2601} {"train_loss": -42.676326751708984, "global_step": 314810, "epoch": 2601} {"train_loss": -43.600582122802734, "global_step": 314811, "epoch": 2601} {"train_loss": -42.940792083740234, "global_step": 314812, "epoch": 2601} {"train_loss": -43.94673156738281, "global_step": 314813, "epoch": 2601} {"train_loss": -43.80576705932617, "global_step": 314814, "epoch": 2601} {"train_loss": -43.75587844848633, "global_step": 314815, "epoch": 2601} {"train_loss": -43.37873458862305, "global_step": 314816, "epoch": 2601} {"train_loss": -43.54055404663086, "global_step": 314817, "epoch": 2601} {"train_loss": -44.04542541503906, "global_step": 314818, "epoch": 2601} {"train_loss": -43.787593841552734, "global_step": 314819, "epoch": 2601} {"train_loss": -43.66523361206055, "global_step": 314820, "epoch": 2601} {"train_loss": -44.243873596191406, "global_step": 314821, "epoch": 2601} {"train_loss": -43.58378982543945, "global_step": 314822, "epoch": 2601} {"train_loss": -43.707462310791016, "global_step": 314823, "epoch": 2601} {"train_loss": -43.7276611328125, "global_step": 314824, "epoch": 2601} {"train_loss": -43.635719299316406, "global_step": 314825, "epoch": 2601} {"train_loss": -44.139522552490234, "global_step": 314826, "epoch": 2601} {"train_loss": -42.86948776245117, "global_step": 314827, "epoch": 2601} {"train_loss": -43.20316696166992, "global_step": 314828, "epoch": 2601} {"train_loss": -44.058895111083984, "global_step": 314829, "epoch": 2601} {"train_loss": -43.92611312866211, "global_step": 314830, "epoch": 2601} {"train_loss": -43.760799407958984, "global_step": 314831, "epoch": 2601} {"train_loss": -44.68476867675781, "global_step": 314832, "epoch": 2601} {"train_loss": -42.777339935302734, "global_step": 314833, "epoch": 2601} {"train_loss": -43.54621124267578, "global_step": 314834, "epoch": 2601} {"train_loss": -43.621864318847656, "global_step": 314835, "epoch": 2601} {"train_loss": -43.66242218017578, "global_step": 314836, "epoch": 2601} {"train_loss": -43.13618087768555, "global_step": 314837, "epoch": 2601} {"train_loss": -43.52235794067383, "global_step": 314838, "epoch": 2601} {"train_loss": -42.360836029052734, "global_step": 314839, "epoch": 2601} {"train_loss": -44.105003356933594, "global_step": 314840, "epoch": 2601} {"train_loss": -42.65847226607898, "global_step": 314841, "epoch": 2601, "val_loss": 2695173.5} {"train_loss": -42.931983947753906, "global_step": 314842, "epoch": 2602} {"train_loss": -43.29237747192383, "global_step": 314843, "epoch": 2602} {"train_loss": -43.010982513427734, "global_step": 314844, "epoch": 2602} {"train_loss": -42.27373123168945, "global_step": 314845, "epoch": 2602} {"train_loss": -42.943458557128906, "global_step": 314846, "epoch": 2602} {"train_loss": -42.703590393066406, "global_step": 314847, "epoch": 2602} {"train_loss": -41.597015380859375, "global_step": 314848, "epoch": 2602} {"train_loss": -40.70514678955078, "global_step": 314849, "epoch": 2602} {"train_loss": -43.616878509521484, "global_step": 314850, "epoch": 2602} {"train_loss": -42.528133392333984, "global_step": 314851, "epoch": 2602} {"train_loss": -40.207374572753906, "global_step": 314852, "epoch": 2602} {"train_loss": -42.34663009643555, "global_step": 314853, "epoch": 2602} {"train_loss": -41.8074836730957, "global_step": 314854, "epoch": 2602} {"train_loss": -38.4956169128418, "global_step": 314855, "epoch": 2602} {"train_loss": -36.236183166503906, "global_step": 314856, "epoch": 2602} {"train_loss": -39.82131576538086, "global_step": 314857, "epoch": 2602} {"train_loss": -40.1689567565918, "global_step": 314858, "epoch": 2602} {"train_loss": -36.1699104309082, "global_step": 314859, "epoch": 2602} {"train_loss": -41.183685302734375, "global_step": 314860, "epoch": 2602} {"train_loss": -39.47990417480469, "global_step": 314861, "epoch": 2602} {"train_loss": -41.68059158325195, "global_step": 314862, "epoch": 2602} {"train_loss": -39.688636779785156, "global_step": 314863, "epoch": 2602} {"train_loss": -41.16331481933594, "global_step": 314864, "epoch": 2602} {"train_loss": -42.30733108520508, "global_step": 314865, "epoch": 2602} {"train_loss": -40.494876861572266, "global_step": 314866, "epoch": 2602} {"train_loss": -40.340187072753906, "global_step": 314867, "epoch": 2602} {"train_loss": -41.75325012207031, "global_step": 314868, "epoch": 2602} {"train_loss": -37.4782829284668, "global_step": 314869, "epoch": 2602} {"train_loss": -32.13560104370117, "global_step": 314870, "epoch": 2602} {"train_loss": -40.544734954833984, "global_step": 314871, "epoch": 2602} {"train_loss": -40.492584228515625, "global_step": 314872, "epoch": 2602} {"train_loss": -41.11665725708008, "global_step": 314873, "epoch": 2602} {"train_loss": -39.94594955444336, "global_step": 314874, "epoch": 2602} {"train_loss": -39.40406036376953, "global_step": 314875, "epoch": 2602} {"train_loss": -40.30437088012695, "global_step": 314876, "epoch": 2602} {"train_loss": -41.37421798706055, "global_step": 314877, "epoch": 2602} {"train_loss": -39.06089401245117, "global_step": 314878, "epoch": 2602} {"train_loss": -39.87464141845703, "global_step": 314879, "epoch": 2602} {"train_loss": -40.486724853515625, "global_step": 314880, "epoch": 2602} {"train_loss": -40.27325439453125, "global_step": 314881, "epoch": 2602} {"train_loss": -41.337127685546875, "global_step": 314882, "epoch": 2602} {"train_loss": -41.963233947753906, "global_step": 314883, "epoch": 2602} {"train_loss": -39.95077133178711, "global_step": 314884, "epoch": 2602} {"train_loss": -42.559513092041016, "global_step": 314885, "epoch": 2602} {"train_loss": -40.381134033203125, "global_step": 314886, "epoch": 2602} {"train_loss": -41.63123321533203, "global_step": 314887, "epoch": 2602} {"train_loss": -40.938419342041016, "global_step": 314888, "epoch": 2602} {"train_loss": -41.8570442199707, "global_step": 314889, "epoch": 2602} {"train_loss": -40.634063720703125, "global_step": 314890, "epoch": 2602} {"train_loss": -42.084835052490234, "global_step": 314891, "epoch": 2602} {"train_loss": -41.228641510009766, "global_step": 314892, "epoch": 2602} {"train_loss": -42.235687255859375, "global_step": 314893, "epoch": 2602} {"train_loss": -42.576942443847656, "global_step": 314894, "epoch": 2602} {"train_loss": -42.19581985473633, "global_step": 314895, "epoch": 2602} {"train_loss": -42.26639938354492, "global_step": 314896, "epoch": 2602} {"train_loss": -41.33491897583008, "global_step": 314897, "epoch": 2602} {"train_loss": -42.4363899230957, "global_step": 314898, "epoch": 2602} {"train_loss": -42.05746078491211, "global_step": 314899, "epoch": 2602} {"train_loss": -42.84125900268555, "global_step": 314900, "epoch": 2602} {"train_loss": -41.90644073486328, "global_step": 314901, "epoch": 2602} {"train_loss": -42.842018127441406, "global_step": 314902, "epoch": 2602} {"train_loss": -42.65591049194336, "global_step": 314903, "epoch": 2602} {"train_loss": -42.94199752807617, "global_step": 314904, "epoch": 2602} {"train_loss": -42.998592376708984, "global_step": 314905, "epoch": 2602} {"train_loss": -41.523048400878906, "global_step": 314906, "epoch": 2602} {"train_loss": -42.37542724609375, "global_step": 314907, "epoch": 2602} {"train_loss": -42.69793701171875, "global_step": 314908, "epoch": 2602} {"train_loss": -40.56386947631836, "global_step": 314909, "epoch": 2602} {"train_loss": -42.855037689208984, "global_step": 314910, "epoch": 2602} {"train_loss": -42.23988723754883, "global_step": 314911, "epoch": 2602} {"train_loss": -42.82524871826172, "global_step": 314912, "epoch": 2602} {"train_loss": -42.84626388549805, "global_step": 314913, "epoch": 2602} {"train_loss": -43.148616790771484, "global_step": 314914, "epoch": 2602} {"train_loss": -43.1104850769043, "global_step": 314915, "epoch": 2602} {"train_loss": -43.40511703491211, "global_step": 314916, "epoch": 2602} {"train_loss": -34.830848693847656, "global_step": 314917, "epoch": 2602} {"train_loss": -37.3642463684082, "global_step": 314918, "epoch": 2602} {"train_loss": -42.08406448364258, "global_step": 314919, "epoch": 2602} {"train_loss": -42.264129638671875, "global_step": 314920, "epoch": 2602} {"train_loss": -42.276588439941406, "global_step": 314921, "epoch": 2602} {"train_loss": -40.38642501831055, "global_step": 314922, "epoch": 2602} {"train_loss": -40.96037673950195, "global_step": 314923, "epoch": 2602} {"train_loss": -41.74067306518555, "global_step": 314924, "epoch": 2602} {"train_loss": -41.949493408203125, "global_step": 314925, "epoch": 2602} {"train_loss": -39.26340866088867, "global_step": 314926, "epoch": 2602} {"train_loss": -42.13872528076172, "global_step": 314927, "epoch": 2602} {"train_loss": -39.961212158203125, "global_step": 314928, "epoch": 2602} {"train_loss": -38.99576950073242, "global_step": 314929, "epoch": 2602} {"train_loss": -41.43343734741211, "global_step": 314930, "epoch": 2602} {"train_loss": -41.343658447265625, "global_step": 314931, "epoch": 2602} {"train_loss": -41.82523727416992, "global_step": 314932, "epoch": 2602} {"train_loss": -40.220420837402344, "global_step": 314933, "epoch": 2602} {"train_loss": -39.264564514160156, "global_step": 314934, "epoch": 2602} {"train_loss": -36.84050369262695, "global_step": 314935, "epoch": 2602} {"train_loss": -40.518733978271484, "global_step": 314936, "epoch": 2602} {"train_loss": -41.170833587646484, "global_step": 314937, "epoch": 2602} {"train_loss": -40.96392059326172, "global_step": 314938, "epoch": 2602} {"train_loss": -40.65129089355469, "global_step": 314939, "epoch": 2602} {"train_loss": -39.49058151245117, "global_step": 314940, "epoch": 2602} {"train_loss": -39.08146286010742, "global_step": 314941, "epoch": 2602} {"train_loss": -39.20695114135742, "global_step": 314942, "epoch": 2602} {"train_loss": -36.2359733581543, "global_step": 314943, "epoch": 2602} {"train_loss": -35.89693069458008, "global_step": 314944, "epoch": 2602} {"train_loss": -39.964332580566406, "global_step": 314945, "epoch": 2602} {"train_loss": -37.15803146362305, "global_step": 314946, "epoch": 2602} {"train_loss": -39.15924835205078, "global_step": 314947, "epoch": 2602} {"train_loss": -40.56096649169922, "global_step": 314948, "epoch": 2602} {"train_loss": -36.80906295776367, "global_step": 314949, "epoch": 2602} {"train_loss": -40.413875579833984, "global_step": 314950, "epoch": 2602} {"train_loss": -41.687896728515625, "global_step": 314951, "epoch": 2602} {"train_loss": -36.783973693847656, "global_step": 314952, "epoch": 2602} {"train_loss": -40.79038619995117, "global_step": 314953, "epoch": 2602} {"train_loss": -41.0233268737793, "global_step": 314954, "epoch": 2602} {"train_loss": -37.420631408691406, "global_step": 314955, "epoch": 2602} {"train_loss": -37.244075775146484, "global_step": 314956, "epoch": 2602} {"train_loss": -38.459068298339844, "global_step": 314957, "epoch": 2602} {"train_loss": -39.85792541503906, "global_step": 314958, "epoch": 2602} {"train_loss": -41.511505126953125, "global_step": 314959, "epoch": 2602} {"train_loss": -42.02832794189453, "global_step": 314960, "epoch": 2602} {"train_loss": -40.25611877441406, "global_step": 314961, "epoch": 2602} {"train_loss": -40.70821929175006, "global_step": 314962, "epoch": 2602, "val_loss": 2650619.25} {"train_loss": -40.71687316894531, "global_step": 314963, "epoch": 2603} {"train_loss": -40.7286491394043, "global_step": 314964, "epoch": 2603} {"train_loss": -41.54499053955078, "global_step": 314965, "epoch": 2603} {"train_loss": -41.183815002441406, "global_step": 314966, "epoch": 2603} {"train_loss": -40.716304779052734, "global_step": 314967, "epoch": 2603} {"train_loss": -41.790409088134766, "global_step": 314968, "epoch": 2603} {"train_loss": -40.867977142333984, "global_step": 314969, "epoch": 2603} {"train_loss": -38.33964157104492, "global_step": 314970, "epoch": 2603} {"train_loss": -41.416290283203125, "global_step": 314971, "epoch": 2603} {"train_loss": -41.531307220458984, "global_step": 314972, "epoch": 2603} {"train_loss": -41.65462112426758, "global_step": 314973, "epoch": 2603} {"train_loss": -42.06947708129883, "global_step": 314974, "epoch": 2603} {"train_loss": -41.89990997314453, "global_step": 314975, "epoch": 2603} {"train_loss": -41.4537467956543, "global_step": 314976, "epoch": 2603} {"train_loss": -41.641876220703125, "global_step": 314977, "epoch": 2603} {"train_loss": -41.85626220703125, "global_step": 314978, "epoch": 2603} {"train_loss": -41.86220169067383, "global_step": 314979, "epoch": 2603} {"train_loss": -41.97422409057617, "global_step": 314980, "epoch": 2603} {"train_loss": -41.264068603515625, "global_step": 314981, "epoch": 2603} {"train_loss": -42.154083251953125, "global_step": 314982, "epoch": 2603} {"train_loss": -42.29767990112305, "global_step": 314983, "epoch": 2603} {"train_loss": -42.60270690917969, "global_step": 314984, "epoch": 2603} {"train_loss": -42.83097839355469, "global_step": 314985, "epoch": 2603} {"train_loss": -42.34613037109375, "global_step": 314986, "epoch": 2603} {"train_loss": -41.40277862548828, "global_step": 314987, "epoch": 2603} {"train_loss": -42.316505432128906, "global_step": 314988, "epoch": 2603} {"train_loss": -41.5578727722168, "global_step": 314989, "epoch": 2603} {"train_loss": -42.572242736816406, "global_step": 314990, "epoch": 2603} {"train_loss": -42.33596420288086, "global_step": 314991, "epoch": 2603} {"train_loss": -42.86920928955078, "global_step": 314992, "epoch": 2603} {"train_loss": -42.46333312988281, "global_step": 314993, "epoch": 2603} {"train_loss": -42.79849624633789, "global_step": 314994, "epoch": 2603} {"train_loss": -42.34345245361328, "global_step": 314995, "epoch": 2603} {"train_loss": -42.25027084350586, "global_step": 314996, "epoch": 2603} {"train_loss": -42.81783676147461, "global_step": 314997, "epoch": 2603} {"train_loss": -43.18411636352539, "global_step": 314998, "epoch": 2603} {"train_loss": -42.4373893737793, "global_step": 314999, "epoch": 2603} {"train_loss": -42.84444808959961, "global_step": 315000, "epoch": 2603} {"train_loss": -43.131710052490234, "global_step": 315001, "epoch": 2603} {"train_loss": -40.632667541503906, "global_step": 315002, "epoch": 2603} {"train_loss": -41.96389389038086, "global_step": 315003, "epoch": 2603} {"train_loss": -43.26907730102539, "global_step": 315004, "epoch": 2603} {"train_loss": -42.68255615234375, "global_step": 315005, "epoch": 2603} {"train_loss": -42.2000732421875, "global_step": 315006, "epoch": 2603} {"train_loss": -43.10927963256836, "global_step": 315007, "epoch": 2603} {"train_loss": -43.389808654785156, "global_step": 315008, "epoch": 2603} {"train_loss": -42.679080963134766, "global_step": 315009, "epoch": 2603} {"train_loss": -43.29833221435547, "global_step": 315010, "epoch": 2603} {"train_loss": -43.6870002746582, "global_step": 315011, "epoch": 2603} {"train_loss": -42.8282470703125, "global_step": 315012, "epoch": 2603} {"train_loss": -43.53938293457031, "global_step": 315013, "epoch": 2603} {"train_loss": -43.3221549987793, "global_step": 315014, "epoch": 2603} {"train_loss": -43.73936080932617, "global_step": 315015, "epoch": 2603} {"train_loss": -43.452911376953125, "global_step": 315016, "epoch": 2603} {"train_loss": -43.48940658569336, "global_step": 315017, "epoch": 2603} {"train_loss": -43.67692947387695, "global_step": 315018, "epoch": 2603} {"train_loss": -43.76305389404297, "global_step": 315019, "epoch": 2603} {"train_loss": -43.00501251220703, "global_step": 315020, "epoch": 2603} {"train_loss": -42.83625411987305, "global_step": 315021, "epoch": 2603} {"train_loss": -43.537864685058594, "global_step": 315022, "epoch": 2603} {"train_loss": -43.10288619995117, "global_step": 315023, "epoch": 2603} {"train_loss": -43.816864013671875, "global_step": 315024, "epoch": 2603} {"train_loss": -42.43931198120117, "global_step": 315025, "epoch": 2603} {"train_loss": -43.46379089355469, "global_step": 315026, "epoch": 2603} {"train_loss": -42.89306640625, "global_step": 315027, "epoch": 2603} {"train_loss": -42.861446380615234, "global_step": 315028, "epoch": 2603} {"train_loss": -43.20740509033203, "global_step": 315029, "epoch": 2603} {"train_loss": -42.985225677490234, "global_step": 315030, "epoch": 2603} {"train_loss": -43.429317474365234, "global_step": 315031, "epoch": 2603} {"train_loss": -43.46543502807617, "global_step": 315032, "epoch": 2603} {"train_loss": -43.617977142333984, "global_step": 315033, "epoch": 2603} {"train_loss": -43.76484298706055, "global_step": 315034, "epoch": 2603} {"train_loss": -43.83707809448242, "global_step": 315035, "epoch": 2603} {"train_loss": -42.82025146484375, "global_step": 315036, "epoch": 2603} {"train_loss": -43.91267013549805, "global_step": 315037, "epoch": 2603} {"train_loss": -42.356502532958984, "global_step": 315038, "epoch": 2603} {"train_loss": -43.40028762817383, "global_step": 315039, "epoch": 2603} {"train_loss": -43.69287109375, "global_step": 315040, "epoch": 2603} {"train_loss": -43.63778305053711, "global_step": 315041, "epoch": 2603} {"train_loss": -43.638607025146484, "global_step": 315042, "epoch": 2603} {"train_loss": -43.475311279296875, "global_step": 315043, "epoch": 2603} {"train_loss": -41.8206901550293, "global_step": 315044, "epoch": 2603} {"train_loss": -43.8304328918457, "global_step": 315045, "epoch": 2603} {"train_loss": -43.67268753051758, "global_step": 315046, "epoch": 2603} {"train_loss": -43.15884017944336, "global_step": 315047, "epoch": 2603} {"train_loss": -42.45863723754883, "global_step": 315048, "epoch": 2603} {"train_loss": -41.38251876831055, "global_step": 315049, "epoch": 2603} {"train_loss": -41.01143264770508, "global_step": 315050, "epoch": 2603} {"train_loss": -41.566741943359375, "global_step": 315051, "epoch": 2603} {"train_loss": -42.01949691772461, "global_step": 315052, "epoch": 2603} {"train_loss": -43.39850997924805, "global_step": 315053, "epoch": 2603} {"train_loss": -43.284908294677734, "global_step": 315054, "epoch": 2603} {"train_loss": -43.26646041870117, "global_step": 315055, "epoch": 2603} {"train_loss": -43.68906784057617, "global_step": 315056, "epoch": 2603} {"train_loss": -43.53544616699219, "global_step": 315057, "epoch": 2603} {"train_loss": -42.98504638671875, "global_step": 315058, "epoch": 2603} {"train_loss": -43.67377853393555, "global_step": 315059, "epoch": 2603} {"train_loss": -42.88247299194336, "global_step": 315060, "epoch": 2603} {"train_loss": -43.60139465332031, "global_step": 315061, "epoch": 2603} {"train_loss": -43.16668701171875, "global_step": 315062, "epoch": 2603} {"train_loss": -43.40727233886719, "global_step": 315063, "epoch": 2603} {"train_loss": -43.5567512512207, "global_step": 315064, "epoch": 2603} {"train_loss": -43.48543167114258, "global_step": 315065, "epoch": 2603} {"train_loss": -42.824825286865234, "global_step": 315066, "epoch": 2603} {"train_loss": -43.237892150878906, "global_step": 315067, "epoch": 2603} {"train_loss": -42.295955657958984, "global_step": 315068, "epoch": 2603} {"train_loss": -43.45138168334961, "global_step": 315069, "epoch": 2603} {"train_loss": -43.231597900390625, "global_step": 315070, "epoch": 2603} {"train_loss": -43.476253509521484, "global_step": 315071, "epoch": 2603} {"train_loss": -43.10917282104492, "global_step": 315072, "epoch": 2603} {"train_loss": -41.104740142822266, "global_step": 315073, "epoch": 2603} {"train_loss": -39.1161003112793, "global_step": 315074, "epoch": 2603} {"train_loss": -38.154972076416016, "global_step": 315075, "epoch": 2603} {"train_loss": -37.47265625, "global_step": 315076, "epoch": 2603} {"train_loss": -40.00651931762695, "global_step": 315077, "epoch": 2603} {"train_loss": -43.38393783569336, "global_step": 315078, "epoch": 2603} {"train_loss": -39.77199935913086, "global_step": 315079, "epoch": 2603} {"train_loss": -37.29099655151367, "global_step": 315080, "epoch": 2603} {"train_loss": -41.99964141845703, "global_step": 315081, "epoch": 2603} {"train_loss": -41.83016586303711, "global_step": 315082, "epoch": 2603} {"train_loss": -42.4232860596712, "global_step": 315083, "epoch": 2603, "val_loss": 2707598.75} {"train_loss": -41.91788864135742, "global_step": 315084, "epoch": 2604} {"train_loss": -41.23981475830078, "global_step": 315085, "epoch": 2604} {"train_loss": -40.849266052246094, "global_step": 315086, "epoch": 2604} {"train_loss": -42.1620979309082, "global_step": 315087, "epoch": 2604} {"train_loss": -42.58441162109375, "global_step": 315088, "epoch": 2604} {"train_loss": -41.99884033203125, "global_step": 315089, "epoch": 2604} {"train_loss": -42.56388473510742, "global_step": 315090, "epoch": 2604} {"train_loss": -40.39117431640625, "global_step": 315091, "epoch": 2604} {"train_loss": -42.474365234375, "global_step": 315092, "epoch": 2604} {"train_loss": -42.291378021240234, "global_step": 315093, "epoch": 2604} {"train_loss": -41.377227783203125, "global_step": 315094, "epoch": 2604} {"train_loss": -43.00358963012695, "global_step": 315095, "epoch": 2604} {"train_loss": -41.359283447265625, "global_step": 315096, "epoch": 2604} {"train_loss": -42.515899658203125, "global_step": 315097, "epoch": 2604} {"train_loss": -42.97927474975586, "global_step": 315098, "epoch": 2604} {"train_loss": -42.800052642822266, "global_step": 315099, "epoch": 2604} {"train_loss": -43.26467514038086, "global_step": 315100, "epoch": 2604} {"train_loss": -42.882667541503906, "global_step": 315101, "epoch": 2604} {"train_loss": -43.108428955078125, "global_step": 315102, "epoch": 2604} {"train_loss": -42.901878356933594, "global_step": 315103, "epoch": 2604} {"train_loss": -43.409420013427734, "global_step": 315104, "epoch": 2604} {"train_loss": -43.36520004272461, "global_step": 315105, "epoch": 2604} {"train_loss": -43.16963195800781, "global_step": 315106, "epoch": 2604} {"train_loss": -43.15473556518555, "global_step": 315107, "epoch": 2604} {"train_loss": -43.463653564453125, "global_step": 315108, "epoch": 2604} {"train_loss": -43.25230407714844, "global_step": 315109, "epoch": 2604} {"train_loss": -43.163936614990234, "global_step": 315110, "epoch": 2604} {"train_loss": -43.14557647705078, "global_step": 315111, "epoch": 2604} {"train_loss": -44.10464096069336, "global_step": 315112, "epoch": 2604} {"train_loss": -42.52097702026367, "global_step": 315113, "epoch": 2604} {"train_loss": -43.59226989746094, "global_step": 315114, "epoch": 2604} {"train_loss": -43.413482666015625, "global_step": 315115, "epoch": 2604} {"train_loss": -43.496185302734375, "global_step": 315116, "epoch": 2604} {"train_loss": -43.95270919799805, "global_step": 315117, "epoch": 2604} {"train_loss": -43.32204055786133, "global_step": 315118, "epoch": 2604} {"train_loss": -43.12251281738281, "global_step": 315119, "epoch": 2604} {"train_loss": -44.058982849121094, "global_step": 315120, "epoch": 2604} {"train_loss": -43.43740463256836, "global_step": 315121, "epoch": 2604} {"train_loss": -43.26332473754883, "global_step": 315122, "epoch": 2604} {"train_loss": -43.362945556640625, "global_step": 315123, "epoch": 2604} {"train_loss": -43.37080383300781, "global_step": 315124, "epoch": 2604} {"train_loss": -43.49309539794922, "global_step": 315125, "epoch": 2604} {"train_loss": -43.068538665771484, "global_step": 315126, "epoch": 2604} {"train_loss": -43.93619918823242, "global_step": 315127, "epoch": 2604} {"train_loss": -44.13883590698242, "global_step": 315128, "epoch": 2604} {"train_loss": -43.16154098510742, "global_step": 315129, "epoch": 2604} {"train_loss": -44.08051681518555, "global_step": 315130, "epoch": 2604} {"train_loss": -43.83185958862305, "global_step": 315131, "epoch": 2604} {"train_loss": -44.17266082763672, "global_step": 315132, "epoch": 2604} {"train_loss": -43.99625015258789, "global_step": 315133, "epoch": 2604} {"train_loss": -44.07028579711914, "global_step": 315134, "epoch": 2604} {"train_loss": -43.870235443115234, "global_step": 315135, "epoch": 2604} {"train_loss": -44.03396987915039, "global_step": 315136, "epoch": 2604} {"train_loss": -44.12350082397461, "global_step": 315137, "epoch": 2604} {"train_loss": -43.87807083129883, "global_step": 315138, "epoch": 2604} {"train_loss": -43.85014724731445, "global_step": 315139, "epoch": 2604} {"train_loss": -44.31990432739258, "global_step": 315140, "epoch": 2604} {"train_loss": -43.52213668823242, "global_step": 315141, "epoch": 2604} {"train_loss": -44.27427291870117, "global_step": 315142, "epoch": 2604} {"train_loss": -44.137630462646484, "global_step": 315143, "epoch": 2604} {"train_loss": -44.029964447021484, "global_step": 315144, "epoch": 2604} {"train_loss": -44.46881103515625, "global_step": 315145, "epoch": 2604} {"train_loss": -43.75328826904297, "global_step": 315146, "epoch": 2604} {"train_loss": -44.30971145629883, "global_step": 315147, "epoch": 2604} {"train_loss": -43.884552001953125, "global_step": 315148, "epoch": 2604} {"train_loss": -43.089046478271484, "global_step": 315149, "epoch": 2604} {"train_loss": -43.304786682128906, "global_step": 315150, "epoch": 2604} {"train_loss": -44.31829071044922, "global_step": 315151, "epoch": 2604} {"train_loss": -43.715667724609375, "global_step": 315152, "epoch": 2604} {"train_loss": -44.25346755981445, "global_step": 315153, "epoch": 2604} {"train_loss": -43.580116271972656, "global_step": 315154, "epoch": 2604} {"train_loss": -43.700157165527344, "global_step": 315155, "epoch": 2604} {"train_loss": -44.370052337646484, "global_step": 315156, "epoch": 2604} {"train_loss": -43.73637008666992, "global_step": 315157, "epoch": 2604} {"train_loss": -41.88136291503906, "global_step": 315158, "epoch": 2604} {"train_loss": -43.09132766723633, "global_step": 315159, "epoch": 2604} {"train_loss": -43.34562683105469, "global_step": 315160, "epoch": 2604} {"train_loss": -43.666622161865234, "global_step": 315161, "epoch": 2604} {"train_loss": -43.17205047607422, "global_step": 315162, "epoch": 2604} {"train_loss": -43.409584045410156, "global_step": 315163, "epoch": 2604} {"train_loss": -44.284603118896484, "global_step": 315164, "epoch": 2604} {"train_loss": -43.10254669189453, "global_step": 315165, "epoch": 2604} {"train_loss": -41.49746322631836, "global_step": 315166, "epoch": 2604} {"train_loss": -42.928157806396484, "global_step": 315167, "epoch": 2604} {"train_loss": -43.297428131103516, "global_step": 315168, "epoch": 2604} {"train_loss": -42.243080139160156, "global_step": 315169, "epoch": 2604} {"train_loss": -41.59287643432617, "global_step": 315170, "epoch": 2604} {"train_loss": -43.3862190246582, "global_step": 315171, "epoch": 2604} {"train_loss": -43.64570999145508, "global_step": 315172, "epoch": 2604} {"train_loss": -42.77213668823242, "global_step": 315173, "epoch": 2604} {"train_loss": -42.333980560302734, "global_step": 315174, "epoch": 2604} {"train_loss": -42.86530303955078, "global_step": 315175, "epoch": 2604} {"train_loss": -42.76638412475586, "global_step": 315176, "epoch": 2604} {"train_loss": -41.409454345703125, "global_step": 315177, "epoch": 2604} {"train_loss": -42.779640197753906, "global_step": 315178, "epoch": 2604} {"train_loss": -42.993431091308594, "global_step": 315179, "epoch": 2604} {"train_loss": -41.83723068237305, "global_step": 315180, "epoch": 2604} {"train_loss": -42.81020736694336, "global_step": 315181, "epoch": 2604} {"train_loss": -43.20307922363281, "global_step": 315182, "epoch": 2604} {"train_loss": -42.482643127441406, "global_step": 315183, "epoch": 2604} {"train_loss": -43.71456527709961, "global_step": 315184, "epoch": 2604} {"train_loss": -42.42472457885742, "global_step": 315185, "epoch": 2604} {"train_loss": -41.584510803222656, "global_step": 315186, "epoch": 2604} {"train_loss": -43.402496337890625, "global_step": 315187, "epoch": 2604} {"train_loss": -41.13068389892578, "global_step": 315188, "epoch": 2604} {"train_loss": -40.65188217163086, "global_step": 315189, "epoch": 2604} {"train_loss": -42.44783020019531, "global_step": 315190, "epoch": 2604} {"train_loss": -42.67893600463867, "global_step": 315191, "epoch": 2604} {"train_loss": -42.43999099731445, "global_step": 315192, "epoch": 2604} {"train_loss": -42.42328643798828, "global_step": 315193, "epoch": 2604} {"train_loss": -40.81744384765625, "global_step": 315194, "epoch": 2604} {"train_loss": -43.2718391418457, "global_step": 315195, "epoch": 2604} {"train_loss": -41.96866989135742, "global_step": 315196, "epoch": 2604} {"train_loss": -41.85205841064453, "global_step": 315197, "epoch": 2604} {"train_loss": -42.76311111450195, "global_step": 315198, "epoch": 2604} {"train_loss": -42.52375411987305, "global_step": 315199, "epoch": 2604} {"train_loss": -42.4611930847168, "global_step": 315200, "epoch": 2604} {"train_loss": -42.7476806640625, "global_step": 315201, "epoch": 2604} {"train_loss": -43.4727783203125, "global_step": 315202, "epoch": 2604} {"train_loss": -42.77177047729492, "global_step": 315203, "epoch": 2604} {"train_loss": -43.039632781478, "global_step": 315204, "epoch": 2604, "val_loss": 2759632.25} {"train_loss": -42.86422348022461, "global_step": 315205, "epoch": 2605} {"train_loss": -43.57638931274414, "global_step": 315206, "epoch": 2605} {"train_loss": -42.86639404296875, "global_step": 315207, "epoch": 2605} {"train_loss": -42.95247268676758, "global_step": 315208, "epoch": 2605} {"train_loss": -43.1367073059082, "global_step": 315209, "epoch": 2605} {"train_loss": -43.47637939453125, "global_step": 315210, "epoch": 2605} {"train_loss": -43.540828704833984, "global_step": 315211, "epoch": 2605} {"train_loss": -43.57600784301758, "global_step": 315212, "epoch": 2605} {"train_loss": -43.35331344604492, "global_step": 315213, "epoch": 2605} {"train_loss": -43.42621994018555, "global_step": 315214, "epoch": 2605} {"train_loss": -43.1356086730957, "global_step": 315215, "epoch": 2605} {"train_loss": -43.711177825927734, "global_step": 315216, "epoch": 2605} {"train_loss": -43.45111846923828, "global_step": 315217, "epoch": 2605} {"train_loss": -43.88505554199219, "global_step": 315218, "epoch": 2605} {"train_loss": -43.80410385131836, "global_step": 315219, "epoch": 2605} {"train_loss": -44.097389221191406, "global_step": 315220, "epoch": 2605} {"train_loss": -43.83642578125, "global_step": 315221, "epoch": 2605} {"train_loss": -43.85432815551758, "global_step": 315222, "epoch": 2605} {"train_loss": -44.266456604003906, "global_step": 315223, "epoch": 2605} {"train_loss": -44.15761184692383, "global_step": 315224, "epoch": 2605} {"train_loss": -43.62019729614258, "global_step": 315225, "epoch": 2605} {"train_loss": -44.280517578125, "global_step": 315226, "epoch": 2605} {"train_loss": -43.252620697021484, "global_step": 315227, "epoch": 2605} {"train_loss": -44.215087890625, "global_step": 315228, "epoch": 2605} {"train_loss": -43.962406158447266, "global_step": 315229, "epoch": 2605} {"train_loss": -44.30849075317383, "global_step": 315230, "epoch": 2605} {"train_loss": -44.29533004760742, "global_step": 315231, "epoch": 2605} {"train_loss": -43.71259307861328, "global_step": 315232, "epoch": 2605} {"train_loss": -44.214351654052734, "global_step": 315233, "epoch": 2605} {"train_loss": -44.02829360961914, "global_step": 315234, "epoch": 2605} {"train_loss": -43.9641227722168, "global_step": 315235, "epoch": 2605} {"train_loss": -43.93915939331055, "global_step": 315236, "epoch": 2605} {"train_loss": -44.241947174072266, "global_step": 315237, "epoch": 2605} {"train_loss": -44.3359260559082, "global_step": 315238, "epoch": 2605} {"train_loss": -43.936065673828125, "global_step": 315239, "epoch": 2605} {"train_loss": -44.31282424926758, "global_step": 315240, "epoch": 2605} {"train_loss": -43.86787796020508, "global_step": 315241, "epoch": 2605} {"train_loss": -44.705902099609375, "global_step": 315242, "epoch": 2605} {"train_loss": -44.02681350708008, "global_step": 315243, "epoch": 2605} {"train_loss": -43.34919357299805, "global_step": 315244, "epoch": 2605} {"train_loss": -44.63239288330078, "global_step": 315245, "epoch": 2605} {"train_loss": -44.41656494140625, "global_step": 315246, "epoch": 2605} {"train_loss": -44.45968246459961, "global_step": 315247, "epoch": 2605} {"train_loss": -44.371883392333984, "global_step": 315248, "epoch": 2605} {"train_loss": -44.35525131225586, "global_step": 315249, "epoch": 2605} {"train_loss": -44.66874313354492, "global_step": 315250, "epoch": 2605} {"train_loss": -44.654720306396484, "global_step": 315251, "epoch": 2605} {"train_loss": -44.88859558105469, "global_step": 315252, "epoch": 2605} {"train_loss": -44.09597396850586, "global_step": 315253, "epoch": 2605} {"train_loss": -43.77375030517578, "global_step": 315254, "epoch": 2605} {"train_loss": -43.659305572509766, "global_step": 315255, "epoch": 2605} {"train_loss": -41.76160430908203, "global_step": 315256, "epoch": 2605} {"train_loss": -37.70241165161133, "global_step": 315257, "epoch": 2605} {"train_loss": -29.352930068969727, "global_step": 315258, "epoch": 2605} {"train_loss": -28.26905632019043, "global_step": 315259, "epoch": 2605} {"train_loss": -39.5890998840332, "global_step": 315260, "epoch": 2605} {"train_loss": -39.53688430786133, "global_step": 315261, "epoch": 2605} {"train_loss": -35.63065719604492, "global_step": 315262, "epoch": 2605} {"train_loss": -40.970306396484375, "global_step": 315263, "epoch": 2605} {"train_loss": -39.43743133544922, "global_step": 315264, "epoch": 2605} {"train_loss": -38.02014923095703, "global_step": 315265, "epoch": 2605} {"train_loss": -41.62552261352539, "global_step": 315266, "epoch": 2605} {"train_loss": -39.8091926574707, "global_step": 315267, "epoch": 2605} {"train_loss": -42.2513427734375, "global_step": 315268, "epoch": 2605} {"train_loss": -40.41554641723633, "global_step": 315269, "epoch": 2605} {"train_loss": -41.93912887573242, "global_step": 315270, "epoch": 2605} {"train_loss": -40.3506965637207, "global_step": 315271, "epoch": 2605} {"train_loss": -39.69145584106445, "global_step": 315272, "epoch": 2605} {"train_loss": -42.105934143066406, "global_step": 315273, "epoch": 2605} {"train_loss": -39.96954345703125, "global_step": 315274, "epoch": 2605} {"train_loss": -42.386783599853516, "global_step": 315275, "epoch": 2605} {"train_loss": -39.58686065673828, "global_step": 315276, "epoch": 2605} {"train_loss": -43.05195236206055, "global_step": 315277, "epoch": 2605} {"train_loss": -41.70503234863281, "global_step": 315278, "epoch": 2605} {"train_loss": -42.64402389526367, "global_step": 315279, "epoch": 2605} {"train_loss": -42.05191421508789, "global_step": 315280, "epoch": 2605} {"train_loss": -43.164180755615234, "global_step": 315281, "epoch": 2605} {"train_loss": -43.071414947509766, "global_step": 315282, "epoch": 2605} {"train_loss": -42.76667022705078, "global_step": 315283, "epoch": 2605} {"train_loss": -43.5346794128418, "global_step": 315284, "epoch": 2605} {"train_loss": -43.425331115722656, "global_step": 315285, "epoch": 2605} {"train_loss": -42.742942810058594, "global_step": 315286, "epoch": 2605} {"train_loss": -43.42045211791992, "global_step": 315287, "epoch": 2605} {"train_loss": -43.068153381347656, "global_step": 315288, "epoch": 2605} {"train_loss": -43.58448791503906, "global_step": 315289, "epoch": 2605} {"train_loss": -43.35822296142578, "global_step": 315290, "epoch": 2605} {"train_loss": -43.779109954833984, "global_step": 315291, "epoch": 2605} {"train_loss": -43.62641143798828, "global_step": 315292, "epoch": 2605} {"train_loss": -43.71162033081055, "global_step": 315293, "epoch": 2605} {"train_loss": -43.57271194458008, "global_step": 315294, "epoch": 2605} {"train_loss": -43.98573303222656, "global_step": 315295, "epoch": 2605} {"train_loss": -43.88448715209961, "global_step": 315296, "epoch": 2605} {"train_loss": -43.8376579284668, "global_step": 315297, "epoch": 2605} {"train_loss": -44.0791015625, "global_step": 315298, "epoch": 2605} {"train_loss": -44.08274459838867, "global_step": 315299, "epoch": 2605} {"train_loss": -43.98773956298828, "global_step": 315300, "epoch": 2605} {"train_loss": -44.14677047729492, "global_step": 315301, "epoch": 2605} {"train_loss": -44.33171844482422, "global_step": 315302, "epoch": 2605} {"train_loss": -44.43095016479492, "global_step": 315303, "epoch": 2605} {"train_loss": -44.142547607421875, "global_step": 315304, "epoch": 2605} {"train_loss": -44.7294807434082, "global_step": 315305, "epoch": 2605} {"train_loss": -44.14982986450195, "global_step": 315306, "epoch": 2605} {"train_loss": -44.441585540771484, "global_step": 315307, "epoch": 2605} {"train_loss": -44.73527145385742, "global_step": 315308, "epoch": 2605} {"train_loss": -44.21504592895508, "global_step": 315309, "epoch": 2605} {"train_loss": -44.078792572021484, "global_step": 315310, "epoch": 2605} {"train_loss": -44.49320602416992, "global_step": 315311, "epoch": 2605} {"train_loss": -44.254608154296875, "global_step": 315312, "epoch": 2605} {"train_loss": -44.04004669189453, "global_step": 315313, "epoch": 2605} {"train_loss": -44.6860237121582, "global_step": 315314, "epoch": 2605} {"train_loss": -44.4996337890625, "global_step": 315315, "epoch": 2605} {"train_loss": -44.31814193725586, "global_step": 315316, "epoch": 2605} {"train_loss": -44.83325958251953, "global_step": 315317, "epoch": 2605} {"train_loss": -44.7033805847168, "global_step": 315318, "epoch": 2605} {"train_loss": -44.5903205871582, "global_step": 315319, "epoch": 2605} {"train_loss": -44.5252685546875, "global_step": 315320, "epoch": 2605} {"train_loss": -44.17033767700195, "global_step": 315321, "epoch": 2605} {"train_loss": -44.61531448364258, "global_step": 315322, "epoch": 2605} {"train_loss": -44.664581298828125, "global_step": 315323, "epoch": 2605} {"train_loss": -44.96429443359375, "global_step": 315324, "epoch": 2605} {"train_loss": -43.06794719853677, "global_step": 315325, "epoch": 2605, "val_loss": 2723494.75} {"train_loss": -44.26406478881836, "global_step": 315326, "epoch": 2606} {"train_loss": -44.93119430541992, "global_step": 315327, "epoch": 2606} {"train_loss": -44.64471435546875, "global_step": 315328, "epoch": 2606} {"train_loss": -44.65715408325195, "global_step": 315329, "epoch": 2606} {"train_loss": -44.896827697753906, "global_step": 315330, "epoch": 2606} {"train_loss": -44.29291915893555, "global_step": 315331, "epoch": 2606} {"train_loss": -44.49177932739258, "global_step": 315332, "epoch": 2606} {"train_loss": -44.476226806640625, "global_step": 315333, "epoch": 2606} {"train_loss": -44.135597229003906, "global_step": 315334, "epoch": 2606} {"train_loss": -44.57222366333008, "global_step": 315335, "epoch": 2606} {"train_loss": -44.61699676513672, "global_step": 315336, "epoch": 2606} {"train_loss": -44.80972671508789, "global_step": 315337, "epoch": 2606} {"train_loss": -44.81352615356445, "global_step": 315338, "epoch": 2606} {"train_loss": -44.83481979370117, "global_step": 315339, "epoch": 2606} {"train_loss": -44.758419036865234, "global_step": 315340, "epoch": 2606} {"train_loss": -44.8590087890625, "global_step": 315341, "epoch": 2606} {"train_loss": -44.99330520629883, "global_step": 315342, "epoch": 2606} {"train_loss": -44.996116638183594, "global_step": 315343, "epoch": 2606} {"train_loss": -44.85342788696289, "global_step": 315344, "epoch": 2606} {"train_loss": -45.09090805053711, "global_step": 315345, "epoch": 2606} {"train_loss": -44.36302947998047, "global_step": 315346, "epoch": 2606} {"train_loss": -44.52486801147461, "global_step": 315347, "epoch": 2606} {"train_loss": -43.39498519897461, "global_step": 315348, "epoch": 2606} {"train_loss": -43.461612701416016, "global_step": 315349, "epoch": 2606} {"train_loss": -43.43012619018555, "global_step": 315350, "epoch": 2606} {"train_loss": -44.159481048583984, "global_step": 315351, "epoch": 2606} {"train_loss": -44.45986557006836, "global_step": 315352, "epoch": 2606} {"train_loss": -44.458534240722656, "global_step": 315353, "epoch": 2606} {"train_loss": -44.0648078918457, "global_step": 315354, "epoch": 2606} {"train_loss": -43.76683044433594, "global_step": 315355, "epoch": 2606} {"train_loss": -44.85206985473633, "global_step": 315356, "epoch": 2606} {"train_loss": -43.82639694213867, "global_step": 315357, "epoch": 2606} {"train_loss": -42.801822662353516, "global_step": 315358, "epoch": 2606} {"train_loss": -41.854347229003906, "global_step": 315359, "epoch": 2606} {"train_loss": -41.01467514038086, "global_step": 315360, "epoch": 2606} {"train_loss": -41.808387756347656, "global_step": 315361, "epoch": 2606} {"train_loss": -41.45753479003906, "global_step": 315362, "epoch": 2606} {"train_loss": -43.11317825317383, "global_step": 315363, "epoch": 2606} {"train_loss": -41.790340423583984, "global_step": 315364, "epoch": 2606} {"train_loss": -39.80823516845703, "global_step": 315365, "epoch": 2606} {"train_loss": -37.35512924194336, "global_step": 315366, "epoch": 2606} {"train_loss": -41.20968246459961, "global_step": 315367, "epoch": 2606} {"train_loss": -42.369834899902344, "global_step": 315368, "epoch": 2606} {"train_loss": -39.59029006958008, "global_step": 315369, "epoch": 2606} {"train_loss": -38.22731399536133, "global_step": 315370, "epoch": 2606} {"train_loss": -42.87168502807617, "global_step": 315371, "epoch": 2606} {"train_loss": -41.86981201171875, "global_step": 315372, "epoch": 2606} {"train_loss": -39.71843719482422, "global_step": 315373, "epoch": 2606} {"train_loss": -41.24351501464844, "global_step": 315374, "epoch": 2606} {"train_loss": -41.130523681640625, "global_step": 315375, "epoch": 2606} {"train_loss": -40.61253356933594, "global_step": 315376, "epoch": 2606} {"train_loss": -40.13331604003906, "global_step": 315377, "epoch": 2606} {"train_loss": -40.83732986450195, "global_step": 315378, "epoch": 2606} {"train_loss": -42.537933349609375, "global_step": 315379, "epoch": 2606} {"train_loss": -41.0411376953125, "global_step": 315380, "epoch": 2606} {"train_loss": -41.35187530517578, "global_step": 315381, "epoch": 2606} {"train_loss": -42.17741012573242, "global_step": 315382, "epoch": 2606} {"train_loss": -39.56624221801758, "global_step": 315383, "epoch": 2606} {"train_loss": -42.26980209350586, "global_step": 315384, "epoch": 2606} {"train_loss": -40.764320373535156, "global_step": 315385, "epoch": 2606} {"train_loss": -41.18345260620117, "global_step": 315386, "epoch": 2606} {"train_loss": -42.82524490356445, "global_step": 315387, "epoch": 2606} {"train_loss": -40.9046516418457, "global_step": 315388, "epoch": 2606} {"train_loss": -42.72148132324219, "global_step": 315389, "epoch": 2606} {"train_loss": -41.85868835449219, "global_step": 315390, "epoch": 2606} {"train_loss": -43.43272018432617, "global_step": 315391, "epoch": 2606} {"train_loss": -42.701778411865234, "global_step": 315392, "epoch": 2606} {"train_loss": -43.209842681884766, "global_step": 315393, "epoch": 2606} {"train_loss": -43.06563186645508, "global_step": 315394, "epoch": 2606} {"train_loss": -42.92329788208008, "global_step": 315395, "epoch": 2606} {"train_loss": -42.70644760131836, "global_step": 315396, "epoch": 2606} {"train_loss": -43.32394790649414, "global_step": 315397, "epoch": 2606} {"train_loss": -42.60100555419922, "global_step": 315398, "epoch": 2606} {"train_loss": -43.041664123535156, "global_step": 315399, "epoch": 2606} {"train_loss": -42.7384147644043, "global_step": 315400, "epoch": 2606} {"train_loss": -42.99892807006836, "global_step": 315401, "epoch": 2606} {"train_loss": -43.1409797668457, "global_step": 315402, "epoch": 2606} {"train_loss": -43.72402572631836, "global_step": 315403, "epoch": 2606} {"train_loss": -43.043270111083984, "global_step": 315404, "epoch": 2606} {"train_loss": -43.176727294921875, "global_step": 315405, "epoch": 2606} {"train_loss": -42.622650146484375, "global_step": 315406, "epoch": 2606} {"train_loss": -43.77302169799805, "global_step": 315407, "epoch": 2606} {"train_loss": -42.37888717651367, "global_step": 315408, "epoch": 2606} {"train_loss": -44.050289154052734, "global_step": 315409, "epoch": 2606} {"train_loss": -42.96443557739258, "global_step": 315410, "epoch": 2606} {"train_loss": -43.374202728271484, "global_step": 315411, "epoch": 2606} {"train_loss": -43.57688522338867, "global_step": 315412, "epoch": 2606} {"train_loss": -43.97270965576172, "global_step": 315413, "epoch": 2606} {"train_loss": -43.9962272644043, "global_step": 315414, "epoch": 2606} {"train_loss": -44.027679443359375, "global_step": 315415, "epoch": 2606} {"train_loss": -43.9904899597168, "global_step": 315416, "epoch": 2606} {"train_loss": -44.07750701904297, "global_step": 315417, "epoch": 2606} {"train_loss": -43.501380920410156, "global_step": 315418, "epoch": 2606} {"train_loss": -44.18136215209961, "global_step": 315419, "epoch": 2606} {"train_loss": -43.6128044128418, "global_step": 315420, "epoch": 2606} {"train_loss": -44.1792106628418, "global_step": 315421, "epoch": 2606} {"train_loss": -43.4191780090332, "global_step": 315422, "epoch": 2606} {"train_loss": -43.90679931640625, "global_step": 315423, "epoch": 2606} {"train_loss": -43.89829635620117, "global_step": 315424, "epoch": 2606} {"train_loss": -44.129520416259766, "global_step": 315425, "epoch": 2606} {"train_loss": -43.888729095458984, "global_step": 315426, "epoch": 2606} {"train_loss": -43.70465850830078, "global_step": 315427, "epoch": 2606} {"train_loss": -44.35410690307617, "global_step": 315428, "epoch": 2606} {"train_loss": -43.93048095703125, "global_step": 315429, "epoch": 2606} {"train_loss": -43.686065673828125, "global_step": 315430, "epoch": 2606} {"train_loss": -44.395751953125, "global_step": 315431, "epoch": 2606} {"train_loss": -43.408668518066406, "global_step": 315432, "epoch": 2606} {"train_loss": -44.17269515991211, "global_step": 315433, "epoch": 2606} {"train_loss": -44.25570297241211, "global_step": 315434, "epoch": 2606} {"train_loss": -43.84080123901367, "global_step": 315435, "epoch": 2606} {"train_loss": -44.02937698364258, "global_step": 315436, "epoch": 2606} {"train_loss": -44.428157806396484, "global_step": 315437, "epoch": 2606} {"train_loss": -44.6219596862793, "global_step": 315438, "epoch": 2606} {"train_loss": -44.18026351928711, "global_step": 315439, "epoch": 2606} {"train_loss": -44.759334564208984, "global_step": 315440, "epoch": 2606} {"train_loss": -44.505672454833984, "global_step": 315441, "epoch": 2606} {"train_loss": -44.3972053527832, "global_step": 315442, "epoch": 2606} {"train_loss": -44.69731521606445, "global_step": 315443, "epoch": 2606} {"train_loss": -44.60630416870117, "global_step": 315444, "epoch": 2606} {"train_loss": -44.30332565307617, "global_step": 315445, "epoch": 2606} {"train_loss": -43.23208501516295, "global_step": 315446, "epoch": 2606, "val_loss": 2702571.75} {"train_loss": -43.9891242980957, "global_step": 315447, "epoch": 2607} {"train_loss": -44.215606689453125, "global_step": 315448, "epoch": 2607} {"train_loss": -44.92965316772461, "global_step": 315449, "epoch": 2607} {"train_loss": -44.0799674987793, "global_step": 315450, "epoch": 2607} {"train_loss": -44.26911544799805, "global_step": 315451, "epoch": 2607} {"train_loss": -44.341957092285156, "global_step": 315452, "epoch": 2607} {"train_loss": -44.57758712768555, "global_step": 315453, "epoch": 2607} {"train_loss": -44.632171630859375, "global_step": 315454, "epoch": 2607} {"train_loss": -44.167388916015625, "global_step": 315455, "epoch": 2607} {"train_loss": -44.813568115234375, "global_step": 315456, "epoch": 2607} {"train_loss": -44.78490447998047, "global_step": 315457, "epoch": 2607} {"train_loss": -44.92037582397461, "global_step": 315458, "epoch": 2607} {"train_loss": -44.707740783691406, "global_step": 315459, "epoch": 2607} {"train_loss": -45.141292572021484, "global_step": 315460, "epoch": 2607} {"train_loss": -44.32407760620117, "global_step": 315461, "epoch": 2607} {"train_loss": -44.8129997253418, "global_step": 315462, "epoch": 2607} {"train_loss": -44.5681037902832, "global_step": 315463, "epoch": 2607} {"train_loss": -43.974021911621094, "global_step": 315464, "epoch": 2607} {"train_loss": -43.61274719238281, "global_step": 315465, "epoch": 2607} {"train_loss": -42.64497756958008, "global_step": 315466, "epoch": 2607} {"train_loss": -43.84571838378906, "global_step": 315467, "epoch": 2607} {"train_loss": -44.86936950683594, "global_step": 315468, "epoch": 2607} {"train_loss": -43.92171859741211, "global_step": 315469, "epoch": 2607} {"train_loss": -43.35438537597656, "global_step": 315470, "epoch": 2607} {"train_loss": -43.653194427490234, "global_step": 315471, "epoch": 2607} {"train_loss": -44.48329544067383, "global_step": 315472, "epoch": 2607} {"train_loss": -44.07939529418945, "global_step": 315473, "epoch": 2607} {"train_loss": -43.7768669128418, "global_step": 315474, "epoch": 2607} {"train_loss": -43.797157287597656, "global_step": 315475, "epoch": 2607} {"train_loss": -43.74076843261719, "global_step": 315476, "epoch": 2607} {"train_loss": -42.35405349731445, "global_step": 315477, "epoch": 2607} {"train_loss": -41.775489807128906, "global_step": 315478, "epoch": 2607} {"train_loss": -43.53428268432617, "global_step": 315479, "epoch": 2607} {"train_loss": -43.54304122924805, "global_step": 315480, "epoch": 2607} {"train_loss": -42.65456771850586, "global_step": 315481, "epoch": 2607} {"train_loss": -43.99134063720703, "global_step": 315482, "epoch": 2607} {"train_loss": -40.70246887207031, "global_step": 315483, "epoch": 2607} {"train_loss": -37.43142318725586, "global_step": 315484, "epoch": 2607} {"train_loss": -38.43410110473633, "global_step": 315485, "epoch": 2607} {"train_loss": -40.52417755126953, "global_step": 315486, "epoch": 2607} {"train_loss": -41.27899932861328, "global_step": 315487, "epoch": 2607} {"train_loss": -43.03862380981445, "global_step": 315488, "epoch": 2607} {"train_loss": -41.317020416259766, "global_step": 315489, "epoch": 2607} {"train_loss": -42.18092727661133, "global_step": 315490, "epoch": 2607} {"train_loss": -41.89967727661133, "global_step": 315491, "epoch": 2607} {"train_loss": -40.48114776611328, "global_step": 315492, "epoch": 2607} {"train_loss": -42.137935638427734, "global_step": 315493, "epoch": 2607} {"train_loss": -42.0831298828125, "global_step": 315494, "epoch": 2607} {"train_loss": -40.4046516418457, "global_step": 315495, "epoch": 2607} {"train_loss": -42.07798385620117, "global_step": 315496, "epoch": 2607} {"train_loss": -42.27749252319336, "global_step": 315497, "epoch": 2607} {"train_loss": -41.901573181152344, "global_step": 315498, "epoch": 2607} {"train_loss": -42.279232025146484, "global_step": 315499, "epoch": 2607} {"train_loss": -43.39103317260742, "global_step": 315500, "epoch": 2607} {"train_loss": -41.71350860595703, "global_step": 315501, "epoch": 2607} {"train_loss": -43.59930419921875, "global_step": 315502, "epoch": 2607} {"train_loss": -43.357322692871094, "global_step": 315503, "epoch": 2607} {"train_loss": -43.700557708740234, "global_step": 315504, "epoch": 2607} {"train_loss": -43.98253631591797, "global_step": 315505, "epoch": 2607} {"train_loss": -43.43464279174805, "global_step": 315506, "epoch": 2607} {"train_loss": -43.92769241333008, "global_step": 315507, "epoch": 2607} {"train_loss": -43.94381332397461, "global_step": 315508, "epoch": 2607} {"train_loss": -43.27328109741211, "global_step": 315509, "epoch": 2607} {"train_loss": -44.19009017944336, "global_step": 315510, "epoch": 2607} {"train_loss": -43.70139694213867, "global_step": 315511, "epoch": 2607} {"train_loss": -43.7530632019043, "global_step": 315512, "epoch": 2607} {"train_loss": -44.22085189819336, "global_step": 315513, "epoch": 2607} {"train_loss": -43.44711685180664, "global_step": 315514, "epoch": 2607} {"train_loss": -43.803375244140625, "global_step": 315515, "epoch": 2607} {"train_loss": -43.88827133178711, "global_step": 315516, "epoch": 2607} {"train_loss": -43.67892074584961, "global_step": 315517, "epoch": 2607} {"train_loss": -44.10118865966797, "global_step": 315518, "epoch": 2607} {"train_loss": -43.68825912475586, "global_step": 315519, "epoch": 2607} {"train_loss": -44.306602478027344, "global_step": 315520, "epoch": 2607} {"train_loss": -43.16761016845703, "global_step": 315521, "epoch": 2607} {"train_loss": -44.03341293334961, "global_step": 315522, "epoch": 2607} {"train_loss": -43.972896575927734, "global_step": 315523, "epoch": 2607} {"train_loss": -43.62438201904297, "global_step": 315524, "epoch": 2607} {"train_loss": -44.42108917236328, "global_step": 315525, "epoch": 2607} {"train_loss": -43.63910675048828, "global_step": 315526, "epoch": 2607} {"train_loss": -44.4543571472168, "global_step": 315527, "epoch": 2607} {"train_loss": -44.18059158325195, "global_step": 315528, "epoch": 2607} {"train_loss": -43.72660446166992, "global_step": 315529, "epoch": 2607} {"train_loss": -44.34945297241211, "global_step": 315530, "epoch": 2607} {"train_loss": -43.30055618286133, "global_step": 315531, "epoch": 2607} {"train_loss": -43.572235107421875, "global_step": 315532, "epoch": 2607} {"train_loss": -44.4370231628418, "global_step": 315533, "epoch": 2607} {"train_loss": -43.942420959472656, "global_step": 315534, "epoch": 2607} {"train_loss": -43.48524856567383, "global_step": 315535, "epoch": 2607} {"train_loss": -44.08354949951172, "global_step": 315536, "epoch": 2607} {"train_loss": -44.01447677612305, "global_step": 315537, "epoch": 2607} {"train_loss": -42.92124557495117, "global_step": 315538, "epoch": 2607} {"train_loss": -43.081886291503906, "global_step": 315539, "epoch": 2607} {"train_loss": -43.834014892578125, "global_step": 315540, "epoch": 2607} {"train_loss": -42.48977279663086, "global_step": 315541, "epoch": 2607} {"train_loss": -42.84757614135742, "global_step": 315542, "epoch": 2607} {"train_loss": -44.49713897705078, "global_step": 315543, "epoch": 2607} {"train_loss": -42.99930953979492, "global_step": 315544, "epoch": 2607} {"train_loss": -41.71376419067383, "global_step": 315545, "epoch": 2607} {"train_loss": -43.217647552490234, "global_step": 315546, "epoch": 2607} {"train_loss": -41.896209716796875, "global_step": 315547, "epoch": 2607} {"train_loss": -42.257869720458984, "global_step": 315548, "epoch": 2607} {"train_loss": -42.18684005737305, "global_step": 315549, "epoch": 2607} {"train_loss": -43.485321044921875, "global_step": 315550, "epoch": 2607} {"train_loss": -42.27820587158203, "global_step": 315551, "epoch": 2607} {"train_loss": -42.445491790771484, "global_step": 315552, "epoch": 2607} {"train_loss": -42.770015716552734, "global_step": 315553, "epoch": 2607} {"train_loss": -40.91056442260742, "global_step": 315554, "epoch": 2607} {"train_loss": -43.642459869384766, "global_step": 315555, "epoch": 2607} {"train_loss": -41.775421142578125, "global_step": 315556, "epoch": 2607} {"train_loss": -42.1131706237793, "global_step": 315557, "epoch": 2607} {"train_loss": -42.09934616088867, "global_step": 315558, "epoch": 2607} {"train_loss": -42.82013702392578, "global_step": 315559, "epoch": 2607} {"train_loss": -42.182647705078125, "global_step": 315560, "epoch": 2607} {"train_loss": -42.90407943725586, "global_step": 315561, "epoch": 2607} {"train_loss": -43.50868225097656, "global_step": 315562, "epoch": 2607} {"train_loss": -43.07315444946289, "global_step": 315563, "epoch": 2607} {"train_loss": -43.031715393066406, "global_step": 315564, "epoch": 2607} {"train_loss": -43.853736877441406, "global_step": 315565, "epoch": 2607} {"train_loss": -42.51004409790039, "global_step": 315566, "epoch": 2607} {"train_loss": -43.23649404856784, "global_step": 315567, "epoch": 2607, "val_loss": 2710874.75} {"train_loss": -43.30037307739258, "global_step": 315568, "epoch": 2608} {"train_loss": -43.751121520996094, "global_step": 315569, "epoch": 2608} {"train_loss": -43.70029830932617, "global_step": 315570, "epoch": 2608} {"train_loss": -43.428436279296875, "global_step": 315571, "epoch": 2608} {"train_loss": -43.79673385620117, "global_step": 315572, "epoch": 2608} {"train_loss": -43.55556869506836, "global_step": 315573, "epoch": 2608} {"train_loss": -43.693721771240234, "global_step": 315574, "epoch": 2608} {"train_loss": -43.27242660522461, "global_step": 315575, "epoch": 2608} {"train_loss": -44.040870666503906, "global_step": 315576, "epoch": 2608} {"train_loss": -43.58858871459961, "global_step": 315577, "epoch": 2608} {"train_loss": -43.072444915771484, "global_step": 315578, "epoch": 2608} {"train_loss": -44.70867919921875, "global_step": 315579, "epoch": 2608} {"train_loss": -43.97880172729492, "global_step": 315580, "epoch": 2608} {"train_loss": -43.88468551635742, "global_step": 315581, "epoch": 2608} {"train_loss": -44.51043701171875, "global_step": 315582, "epoch": 2608} {"train_loss": -43.99742889404297, "global_step": 315583, "epoch": 2608} {"train_loss": -44.0545539855957, "global_step": 315584, "epoch": 2608} {"train_loss": -44.111576080322266, "global_step": 315585, "epoch": 2608} {"train_loss": -44.029640197753906, "global_step": 315586, "epoch": 2608} {"train_loss": -43.99176025390625, "global_step": 315587, "epoch": 2608} {"train_loss": -44.523155212402344, "global_step": 315588, "epoch": 2608} {"train_loss": -44.67243194580078, "global_step": 315589, "epoch": 2608} {"train_loss": -44.57617950439453, "global_step": 315590, "epoch": 2608} {"train_loss": -44.60329818725586, "global_step": 315591, "epoch": 2608} {"train_loss": -44.34212112426758, "global_step": 315592, "epoch": 2608} {"train_loss": -44.476417541503906, "global_step": 315593, "epoch": 2608} {"train_loss": -45.013362884521484, "global_step": 315594, "epoch": 2608} {"train_loss": -44.60880661010742, "global_step": 315595, "epoch": 2608} {"train_loss": -44.82351303100586, "global_step": 315596, "epoch": 2608} {"train_loss": -45.15618896484375, "global_step": 315597, "epoch": 2608} {"train_loss": -44.47990417480469, "global_step": 315598, "epoch": 2608} {"train_loss": -44.541927337646484, "global_step": 315599, "epoch": 2608} {"train_loss": -44.53701400756836, "global_step": 315600, "epoch": 2608} {"train_loss": -44.68553161621094, "global_step": 315601, "epoch": 2608} {"train_loss": -44.950069427490234, "global_step": 315602, "epoch": 2608} {"train_loss": -45.021156311035156, "global_step": 315603, "epoch": 2608} {"train_loss": -44.16658020019531, "global_step": 315604, "epoch": 2608} {"train_loss": -45.00550079345703, "global_step": 315605, "epoch": 2608} {"train_loss": -45.179054260253906, "global_step": 315606, "epoch": 2608} {"train_loss": -44.16547393798828, "global_step": 315607, "epoch": 2608} {"train_loss": -44.78220748901367, "global_step": 315608, "epoch": 2608} {"train_loss": -45.05066680908203, "global_step": 315609, "epoch": 2608} {"train_loss": -44.37175369262695, "global_step": 315610, "epoch": 2608} {"train_loss": -44.3030891418457, "global_step": 315611, "epoch": 2608} {"train_loss": -45.09348678588867, "global_step": 315612, "epoch": 2608} {"train_loss": -45.11103439331055, "global_step": 315613, "epoch": 2608} {"train_loss": -44.35633850097656, "global_step": 315614, "epoch": 2608} {"train_loss": -45.07877731323242, "global_step": 315615, "epoch": 2608} {"train_loss": -45.11386489868164, "global_step": 315616, "epoch": 2608} {"train_loss": -44.82174301147461, "global_step": 315617, "epoch": 2608} {"train_loss": -44.209808349609375, "global_step": 315618, "epoch": 2608} {"train_loss": -44.10999298095703, "global_step": 315619, "epoch": 2608} {"train_loss": -44.955806732177734, "global_step": 315620, "epoch": 2608} {"train_loss": -45.30514907836914, "global_step": 315621, "epoch": 2608} {"train_loss": -45.223594665527344, "global_step": 315622, "epoch": 2608} {"train_loss": -45.10685348510742, "global_step": 315623, "epoch": 2608} {"train_loss": -44.862701416015625, "global_step": 315624, "epoch": 2608} {"train_loss": -44.50360870361328, "global_step": 315625, "epoch": 2608} {"train_loss": -44.46684646606445, "global_step": 315626, "epoch": 2608} {"train_loss": -43.296138763427734, "global_step": 315627, "epoch": 2608} {"train_loss": -41.294273376464844, "global_step": 315628, "epoch": 2608} {"train_loss": -42.33877182006836, "global_step": 315629, "epoch": 2608} {"train_loss": -44.09735870361328, "global_step": 315630, "epoch": 2608} {"train_loss": -44.319847106933594, "global_step": 315631, "epoch": 2608} {"train_loss": -43.34617233276367, "global_step": 315632, "epoch": 2608} {"train_loss": -43.50689697265625, "global_step": 315633, "epoch": 2608} {"train_loss": -42.361915588378906, "global_step": 315634, "epoch": 2608} {"train_loss": -41.1276741027832, "global_step": 315635, "epoch": 2608} {"train_loss": -39.4135856628418, "global_step": 315636, "epoch": 2608} {"train_loss": -40.049072265625, "global_step": 315637, "epoch": 2608} {"train_loss": -42.961360931396484, "global_step": 315638, "epoch": 2608} {"train_loss": -41.25318908691406, "global_step": 315639, "epoch": 2608} {"train_loss": -39.73032760620117, "global_step": 315640, "epoch": 2608} {"train_loss": -39.12056350708008, "global_step": 315641, "epoch": 2608} {"train_loss": -40.47344970703125, "global_step": 315642, "epoch": 2608} {"train_loss": -41.87556076049805, "global_step": 315643, "epoch": 2608} {"train_loss": -40.30874252319336, "global_step": 315644, "epoch": 2608} {"train_loss": -41.72058868408203, "global_step": 315645, "epoch": 2608} {"train_loss": -40.86115264892578, "global_step": 315646, "epoch": 2608} {"train_loss": -40.66718673706055, "global_step": 315647, "epoch": 2608} {"train_loss": -42.05348587036133, "global_step": 315648, "epoch": 2608} {"train_loss": -39.79053497314453, "global_step": 315649, "epoch": 2608} {"train_loss": -39.89620590209961, "global_step": 315650, "epoch": 2608} {"train_loss": -39.68771743774414, "global_step": 315651, "epoch": 2608} {"train_loss": -42.69497299194336, "global_step": 315652, "epoch": 2608} {"train_loss": -42.7061882019043, "global_step": 315653, "epoch": 2608} {"train_loss": -42.71923828125, "global_step": 315654, "epoch": 2608} {"train_loss": -43.136714935302734, "global_step": 315655, "epoch": 2608} {"train_loss": -42.58384704589844, "global_step": 315656, "epoch": 2608} {"train_loss": -42.83332443237305, "global_step": 315657, "epoch": 2608} {"train_loss": -43.28827667236328, "global_step": 315658, "epoch": 2608} {"train_loss": -41.4776611328125, "global_step": 315659, "epoch": 2608} {"train_loss": -41.150238037109375, "global_step": 315660, "epoch": 2608} {"train_loss": -43.42641830444336, "global_step": 315661, "epoch": 2608} {"train_loss": -41.843868255615234, "global_step": 315662, "epoch": 2608} {"train_loss": -41.07240295410156, "global_step": 315663, "epoch": 2608} {"train_loss": -43.72487258911133, "global_step": 315664, "epoch": 2608} {"train_loss": -42.49831008911133, "global_step": 315665, "epoch": 2608} {"train_loss": -42.1359748840332, "global_step": 315666, "epoch": 2608} {"train_loss": -43.18099594116211, "global_step": 315667, "epoch": 2608} {"train_loss": -42.9457893371582, "global_step": 315668, "epoch": 2608} {"train_loss": -43.66870880126953, "global_step": 315669, "epoch": 2608} {"train_loss": -43.426753997802734, "global_step": 315670, "epoch": 2608} {"train_loss": -43.08414840698242, "global_step": 315671, "epoch": 2608} {"train_loss": -43.29146957397461, "global_step": 315672, "epoch": 2608} {"train_loss": -43.33528518676758, "global_step": 315673, "epoch": 2608} {"train_loss": -43.340641021728516, "global_step": 315674, "epoch": 2608} {"train_loss": -43.921085357666016, "global_step": 315675, "epoch": 2608} {"train_loss": -44.00657272338867, "global_step": 315676, "epoch": 2608} {"train_loss": -43.891231536865234, "global_step": 315677, "epoch": 2608} {"train_loss": -44.34954833984375, "global_step": 315678, "epoch": 2608} {"train_loss": -43.805519104003906, "global_step": 315679, "epoch": 2608} {"train_loss": -44.14094543457031, "global_step": 315680, "epoch": 2608} {"train_loss": -44.08744812011719, "global_step": 315681, "epoch": 2608} {"train_loss": -43.85280990600586, "global_step": 315682, "epoch": 2608} {"train_loss": -44.19917678833008, "global_step": 315683, "epoch": 2608} {"train_loss": -44.0904426574707, "global_step": 315684, "epoch": 2608} {"train_loss": -44.266273498535156, "global_step": 315685, "epoch": 2608} {"train_loss": -44.283912658691406, "global_step": 315686, "epoch": 2608} {"train_loss": -44.21479415893555, "global_step": 315687, "epoch": 2608} {"train_loss": -43.45205701087132, "global_step": 315688, "epoch": 2608, "val_loss": 2697579.25} {"train_loss": -44.509822845458984, "global_step": 315689, "epoch": 2609} {"train_loss": -44.84632873535156, "global_step": 315690, "epoch": 2609} {"train_loss": -44.27512741088867, "global_step": 315691, "epoch": 2609} {"train_loss": -44.91102981567383, "global_step": 315692, "epoch": 2609} {"train_loss": -44.582271575927734, "global_step": 315693, "epoch": 2609} {"train_loss": -44.745033264160156, "global_step": 315694, "epoch": 2609} {"train_loss": -44.11152267456055, "global_step": 315695, "epoch": 2609} {"train_loss": -45.02128982543945, "global_step": 315696, "epoch": 2609} {"train_loss": -44.70675277709961, "global_step": 315697, "epoch": 2609} {"train_loss": -44.557613372802734, "global_step": 315698, "epoch": 2609} {"train_loss": -45.0104866027832, "global_step": 315699, "epoch": 2609} {"train_loss": -44.786067962646484, "global_step": 315700, "epoch": 2609} {"train_loss": -44.9694938659668, "global_step": 315701, "epoch": 2609} {"train_loss": -45.14807891845703, "global_step": 315702, "epoch": 2609} {"train_loss": -44.56941223144531, "global_step": 315703, "epoch": 2609} {"train_loss": -44.81492233276367, "global_step": 315704, "epoch": 2609} {"train_loss": -45.223350524902344, "global_step": 315705, "epoch": 2609} {"train_loss": -45.17720413208008, "global_step": 315706, "epoch": 2609} {"train_loss": -44.93264389038086, "global_step": 315707, "epoch": 2609} {"train_loss": -44.875244140625, "global_step": 315708, "epoch": 2609} {"train_loss": -44.96843719482422, "global_step": 315709, "epoch": 2609} {"train_loss": -44.7984733581543, "global_step": 315710, "epoch": 2609} {"train_loss": -45.10723876953125, "global_step": 315711, "epoch": 2609} {"train_loss": -44.7875862121582, "global_step": 315712, "epoch": 2609} {"train_loss": -44.891029357910156, "global_step": 315713, "epoch": 2609} {"train_loss": -45.00567626953125, "global_step": 315714, "epoch": 2609} {"train_loss": -44.319801330566406, "global_step": 315715, "epoch": 2609} {"train_loss": -45.13450241088867, "global_step": 315716, "epoch": 2609} {"train_loss": -44.18783187866211, "global_step": 315717, "epoch": 2609} {"train_loss": -43.7054557800293, "global_step": 315718, "epoch": 2609} {"train_loss": -44.70374298095703, "global_step": 315719, "epoch": 2609} {"train_loss": -44.53924560546875, "global_step": 315720, "epoch": 2609} {"train_loss": -45.148006439208984, "global_step": 315721, "epoch": 2609} {"train_loss": -44.05445098876953, "global_step": 315722, "epoch": 2609} {"train_loss": -44.672908782958984, "global_step": 315723, "epoch": 2609} {"train_loss": -44.93433380126953, "global_step": 315724, "epoch": 2609} {"train_loss": -44.70457077026367, "global_step": 315725, "epoch": 2609} {"train_loss": -44.346778869628906, "global_step": 315726, "epoch": 2609} {"train_loss": -44.115753173828125, "global_step": 315727, "epoch": 2609} {"train_loss": -44.905982971191406, "global_step": 315728, "epoch": 2609} {"train_loss": -44.77219772338867, "global_step": 315729, "epoch": 2609} {"train_loss": -44.979183197021484, "global_step": 315730, "epoch": 2609} {"train_loss": -44.579490661621094, "global_step": 315731, "epoch": 2609} {"train_loss": -44.19131088256836, "global_step": 315732, "epoch": 2609} {"train_loss": -44.79728698730469, "global_step": 315733, "epoch": 2609} {"train_loss": -44.372554779052734, "global_step": 315734, "epoch": 2609} {"train_loss": -44.292022705078125, "global_step": 315735, "epoch": 2609} {"train_loss": -44.702510833740234, "global_step": 315736, "epoch": 2609} {"train_loss": -44.53331756591797, "global_step": 315737, "epoch": 2609} {"train_loss": -42.812767028808594, "global_step": 315738, "epoch": 2609} {"train_loss": -42.69537353515625, "global_step": 315739, "epoch": 2609} {"train_loss": -43.687862396240234, "global_step": 315740, "epoch": 2609} {"train_loss": -43.42558288574219, "global_step": 315741, "epoch": 2609} {"train_loss": -42.66478729248047, "global_step": 315742, "epoch": 2609} {"train_loss": -41.83540725708008, "global_step": 315743, "epoch": 2609} {"train_loss": -43.35566329956055, "global_step": 315744, "epoch": 2609} {"train_loss": -43.66067886352539, "global_step": 315745, "epoch": 2609} {"train_loss": -43.38178634643555, "global_step": 315746, "epoch": 2609} {"train_loss": -42.349090576171875, "global_step": 315747, "epoch": 2609} {"train_loss": -43.318992614746094, "global_step": 315748, "epoch": 2609} {"train_loss": -43.58804702758789, "global_step": 315749, "epoch": 2609} {"train_loss": -42.59906005859375, "global_step": 315750, "epoch": 2609} {"train_loss": -42.418113708496094, "global_step": 315751, "epoch": 2609} {"train_loss": -44.450218200683594, "global_step": 315752, "epoch": 2609} {"train_loss": -41.691402435302734, "global_step": 315753, "epoch": 2609} {"train_loss": -39.898311614990234, "global_step": 315754, "epoch": 2609} {"train_loss": -42.280731201171875, "global_step": 315755, "epoch": 2609} {"train_loss": -43.9559326171875, "global_step": 315756, "epoch": 2609} {"train_loss": -42.13126754760742, "global_step": 315757, "epoch": 2609} {"train_loss": -41.63787841796875, "global_step": 315758, "epoch": 2609} {"train_loss": -43.05131149291992, "global_step": 315759, "epoch": 2609} {"train_loss": -41.67140579223633, "global_step": 315760, "epoch": 2609} {"train_loss": -42.491432189941406, "global_step": 315761, "epoch": 2609} {"train_loss": -42.97021484375, "global_step": 315762, "epoch": 2609} {"train_loss": -40.98794937133789, "global_step": 315763, "epoch": 2609} {"train_loss": -42.59174728393555, "global_step": 315764, "epoch": 2609} {"train_loss": -41.2587890625, "global_step": 315765, "epoch": 2609} {"train_loss": -41.470062255859375, "global_step": 315766, "epoch": 2609} {"train_loss": -42.843406677246094, "global_step": 315767, "epoch": 2609} {"train_loss": -41.495635986328125, "global_step": 315768, "epoch": 2609} {"train_loss": -41.694313049316406, "global_step": 315769, "epoch": 2609} {"train_loss": -43.01759338378906, "global_step": 315770, "epoch": 2609} {"train_loss": -43.28768539428711, "global_step": 315771, "epoch": 2609} {"train_loss": -42.688472747802734, "global_step": 315772, "epoch": 2609} {"train_loss": -43.09952163696289, "global_step": 315773, "epoch": 2609} {"train_loss": -43.80524826049805, "global_step": 315774, "epoch": 2609} {"train_loss": -42.71403884887695, "global_step": 315775, "epoch": 2609} {"train_loss": -43.234649658203125, "global_step": 315776, "epoch": 2609} {"train_loss": -43.005123138427734, "global_step": 315777, "epoch": 2609} {"train_loss": -43.82792282104492, "global_step": 315778, "epoch": 2609} {"train_loss": -43.08649826049805, "global_step": 315779, "epoch": 2609} {"train_loss": -43.77691650390625, "global_step": 315780, "epoch": 2609} {"train_loss": -43.76726150512695, "global_step": 315781, "epoch": 2609} {"train_loss": -43.87471008300781, "global_step": 315782, "epoch": 2609} {"train_loss": -43.712337493896484, "global_step": 315783, "epoch": 2609} {"train_loss": -43.94108200073242, "global_step": 315784, "epoch": 2609} {"train_loss": -43.79416275024414, "global_step": 315785, "epoch": 2609} {"train_loss": -43.77874755859375, "global_step": 315786, "epoch": 2609} {"train_loss": -44.14850997924805, "global_step": 315787, "epoch": 2609} {"train_loss": -43.7337646484375, "global_step": 315788, "epoch": 2609} {"train_loss": -44.595733642578125, "global_step": 315789, "epoch": 2609} {"train_loss": -44.13606643676758, "global_step": 315790, "epoch": 2609} {"train_loss": -44.094764709472656, "global_step": 315791, "epoch": 2609} {"train_loss": -44.58620834350586, "global_step": 315792, "epoch": 2609} {"train_loss": -44.37424850463867, "global_step": 315793, "epoch": 2609} {"train_loss": -44.19524002075195, "global_step": 315794, "epoch": 2609} {"train_loss": -44.441837310791016, "global_step": 315795, "epoch": 2609} {"train_loss": -44.301055908203125, "global_step": 315796, "epoch": 2609} {"train_loss": -44.5411491394043, "global_step": 315797, "epoch": 2609} {"train_loss": -44.38743591308594, "global_step": 315798, "epoch": 2609} {"train_loss": -44.34732437133789, "global_step": 315799, "epoch": 2609} {"train_loss": -44.2747802734375, "global_step": 315800, "epoch": 2609} {"train_loss": -44.789642333984375, "global_step": 315801, "epoch": 2609} {"train_loss": -44.48356246948242, "global_step": 315802, "epoch": 2609} {"train_loss": -44.52706527709961, "global_step": 315803, "epoch": 2609} {"train_loss": -45.0498161315918, "global_step": 315804, "epoch": 2609} {"train_loss": -45.031551361083984, "global_step": 315805, "epoch": 2609} {"train_loss": -44.651275634765625, "global_step": 315806, "epoch": 2609} {"train_loss": -45.0883674621582, "global_step": 315807, "epoch": 2609} {"train_loss": -44.61697006225586, "global_step": 315808, "epoch": 2609} {"train_loss": -43.90244476066148, "global_step": 315809, "epoch": 2609, "val_loss": 2717532.75} {"train_loss": -45.13566589355469, "global_step": 315810, "epoch": 2610} {"train_loss": -44.58754348754883, "global_step": 315811, "epoch": 2610} {"train_loss": -44.598838806152344, "global_step": 315812, "epoch": 2610} {"train_loss": -44.9315071105957, "global_step": 315813, "epoch": 2610} {"train_loss": -44.71500778198242, "global_step": 315814, "epoch": 2610} {"train_loss": -44.43889236450195, "global_step": 315815, "epoch": 2610} {"train_loss": -45.15485763549805, "global_step": 315816, "epoch": 2610} {"train_loss": -44.779232025146484, "global_step": 315817, "epoch": 2610} {"train_loss": -44.07546615600586, "global_step": 315818, "epoch": 2610} {"train_loss": -44.29114532470703, "global_step": 315819, "epoch": 2610} {"train_loss": -44.429012298583984, "global_step": 315820, "epoch": 2610} {"train_loss": -45.111392974853516, "global_step": 315821, "epoch": 2610} {"train_loss": -44.42688751220703, "global_step": 315822, "epoch": 2610} {"train_loss": -43.487945556640625, "global_step": 315823, "epoch": 2610} {"train_loss": -44.515193939208984, "global_step": 315824, "epoch": 2610} {"train_loss": -44.57828140258789, "global_step": 315825, "epoch": 2610} {"train_loss": -41.99494171142578, "global_step": 315826, "epoch": 2610} {"train_loss": -43.60373306274414, "global_step": 315827, "epoch": 2610} {"train_loss": -44.99318313598633, "global_step": 315828, "epoch": 2610} {"train_loss": -44.70237350463867, "global_step": 315829, "epoch": 2610} {"train_loss": -44.29935073852539, "global_step": 315830, "epoch": 2610} {"train_loss": -44.258522033691406, "global_step": 315831, "epoch": 2610} {"train_loss": -44.3087043762207, "global_step": 315832, "epoch": 2610} {"train_loss": -44.626556396484375, "global_step": 315833, "epoch": 2610} {"train_loss": -43.9824104309082, "global_step": 315834, "epoch": 2610} {"train_loss": -44.492435455322266, "global_step": 315835, "epoch": 2610} {"train_loss": -45.06989669799805, "global_step": 315836, "epoch": 2610} {"train_loss": -43.84885787963867, "global_step": 315837, "epoch": 2610} {"train_loss": -44.28840637207031, "global_step": 315838, "epoch": 2610} {"train_loss": -43.35935592651367, "global_step": 315839, "epoch": 2610} {"train_loss": -42.12390899658203, "global_step": 315840, "epoch": 2610} {"train_loss": -44.402976989746094, "global_step": 315841, "epoch": 2610} {"train_loss": -43.62189865112305, "global_step": 315842, "epoch": 2610} {"train_loss": -41.04757308959961, "global_step": 315843, "epoch": 2610} {"train_loss": -42.676456451416016, "global_step": 315844, "epoch": 2610} {"train_loss": -43.8292350769043, "global_step": 315845, "epoch": 2610} {"train_loss": -41.704368591308594, "global_step": 315846, "epoch": 2610} {"train_loss": -41.37260055541992, "global_step": 315847, "epoch": 2610} {"train_loss": -43.13886260986328, "global_step": 315848, "epoch": 2610} {"train_loss": -43.181297302246094, "global_step": 315849, "epoch": 2610} {"train_loss": -43.567203521728516, "global_step": 315850, "epoch": 2610} {"train_loss": -42.93429183959961, "global_step": 315851, "epoch": 2610} {"train_loss": -42.86619186401367, "global_step": 315852, "epoch": 2610} {"train_loss": -44.40317916870117, "global_step": 315853, "epoch": 2610} {"train_loss": -43.57576370239258, "global_step": 315854, "epoch": 2610} {"train_loss": -43.04008865356445, "global_step": 315855, "epoch": 2610} {"train_loss": -43.78023910522461, "global_step": 315856, "epoch": 2610} {"train_loss": -43.187660217285156, "global_step": 315857, "epoch": 2610} {"train_loss": -44.21289825439453, "global_step": 315858, "epoch": 2610} {"train_loss": -43.9113655090332, "global_step": 315859, "epoch": 2610} {"train_loss": -43.950462341308594, "global_step": 315860, "epoch": 2610} {"train_loss": -43.4136962890625, "global_step": 315861, "epoch": 2610} {"train_loss": -43.226558685302734, "global_step": 315862, "epoch": 2610} {"train_loss": -44.192501068115234, "global_step": 315863, "epoch": 2610} {"train_loss": -43.40755844116211, "global_step": 315864, "epoch": 2610} {"train_loss": -44.415618896484375, "global_step": 315865, "epoch": 2610} {"train_loss": -43.942813873291016, "global_step": 315866, "epoch": 2610} {"train_loss": -43.94329833984375, "global_step": 315867, "epoch": 2610} {"train_loss": -44.655487060546875, "global_step": 315868, "epoch": 2610} {"train_loss": -43.76773452758789, "global_step": 315869, "epoch": 2610} {"train_loss": -44.40473556518555, "global_step": 315870, "epoch": 2610} {"train_loss": -43.81104278564453, "global_step": 315871, "epoch": 2610} {"train_loss": -44.638832092285156, "global_step": 315872, "epoch": 2610} {"train_loss": -43.97280502319336, "global_step": 315873, "epoch": 2610} {"train_loss": -44.188411712646484, "global_step": 315874, "epoch": 2610} {"train_loss": -44.43156814575195, "global_step": 315875, "epoch": 2610} {"train_loss": -44.139217376708984, "global_step": 315876, "epoch": 2610} {"train_loss": -44.354312896728516, "global_step": 315877, "epoch": 2610} {"train_loss": -44.14105987548828, "global_step": 315878, "epoch": 2610} {"train_loss": -44.50762176513672, "global_step": 315879, "epoch": 2610} {"train_loss": -44.29823684692383, "global_step": 315880, "epoch": 2610} {"train_loss": -44.1433219909668, "global_step": 315881, "epoch": 2610} {"train_loss": -44.2136344909668, "global_step": 315882, "epoch": 2610} {"train_loss": -43.74102020263672, "global_step": 315883, "epoch": 2610} {"train_loss": -44.56814193725586, "global_step": 315884, "epoch": 2610} {"train_loss": -43.66070556640625, "global_step": 315885, "epoch": 2610} {"train_loss": -44.44880294799805, "global_step": 315886, "epoch": 2610} {"train_loss": -43.63953399658203, "global_step": 315887, "epoch": 2610} {"train_loss": -44.558982849121094, "global_step": 315888, "epoch": 2610} {"train_loss": -44.34562301635742, "global_step": 315889, "epoch": 2610} {"train_loss": -44.60018539428711, "global_step": 315890, "epoch": 2610} {"train_loss": -43.8861083984375, "global_step": 315891, "epoch": 2610} {"train_loss": -44.218719482421875, "global_step": 315892, "epoch": 2610} {"train_loss": -44.358638763427734, "global_step": 315893, "epoch": 2610} {"train_loss": -44.35148239135742, "global_step": 315894, "epoch": 2610} {"train_loss": -45.10251998901367, "global_step": 315895, "epoch": 2610} {"train_loss": -44.82344055175781, "global_step": 315896, "epoch": 2610} {"train_loss": -43.60429763793945, "global_step": 315897, "epoch": 2610} {"train_loss": -43.5280876159668, "global_step": 315898, "epoch": 2610} {"train_loss": -44.44804763793945, "global_step": 315899, "epoch": 2610} {"train_loss": -44.562110900878906, "global_step": 315900, "epoch": 2610} {"train_loss": -43.92487335205078, "global_step": 315901, "epoch": 2610} {"train_loss": -43.767513275146484, "global_step": 315902, "epoch": 2610} {"train_loss": -44.77170181274414, "global_step": 315903, "epoch": 2610} {"train_loss": -44.13407516479492, "global_step": 315904, "epoch": 2610} {"train_loss": -43.854461669921875, "global_step": 315905, "epoch": 2610} {"train_loss": -43.40727233886719, "global_step": 315906, "epoch": 2610} {"train_loss": -43.312862396240234, "global_step": 315907, "epoch": 2610} {"train_loss": -43.164100646972656, "global_step": 315908, "epoch": 2610} {"train_loss": -43.68231201171875, "global_step": 315909, "epoch": 2610} {"train_loss": -43.82478332519531, "global_step": 315910, "epoch": 2610} {"train_loss": -44.024654388427734, "global_step": 315911, "epoch": 2610} {"train_loss": -44.44116973876953, "global_step": 315912, "epoch": 2610} {"train_loss": -43.420616149902344, "global_step": 315913, "epoch": 2610} {"train_loss": -43.134029388427734, "global_step": 315914, "epoch": 2610} {"train_loss": -42.621917724609375, "global_step": 315915, "epoch": 2610} {"train_loss": -41.68619918823242, "global_step": 315916, "epoch": 2610} {"train_loss": -41.83968734741211, "global_step": 315917, "epoch": 2610} {"train_loss": -43.13941192626953, "global_step": 315918, "epoch": 2610} {"train_loss": -43.74827194213867, "global_step": 315919, "epoch": 2610} {"train_loss": -42.96229553222656, "global_step": 315920, "epoch": 2610} {"train_loss": -41.511192321777344, "global_step": 315921, "epoch": 2610} {"train_loss": -41.968379974365234, "global_step": 315922, "epoch": 2610} {"train_loss": -42.47711181640625, "global_step": 315923, "epoch": 2610} {"train_loss": -43.91410446166992, "global_step": 315924, "epoch": 2610} {"train_loss": -43.076839447021484, "global_step": 315925, "epoch": 2610} {"train_loss": -41.15668869018555, "global_step": 315926, "epoch": 2610} {"train_loss": -41.279876708984375, "global_step": 315927, "epoch": 2610} {"train_loss": -43.601619720458984, "global_step": 315928, "epoch": 2610} {"train_loss": -43.617950439453125, "global_step": 315929, "epoch": 2610} {"train_loss": -43.80101136136646, "global_step": 315930, "epoch": 2610, "val_loss": 2701601.0} {"train_loss": -43.65095138549805, "global_step": 315931, "epoch": 2611} {"train_loss": -43.645904541015625, "global_step": 315932, "epoch": 2611} {"train_loss": -44.547080993652344, "global_step": 315933, "epoch": 2611} {"train_loss": -43.054317474365234, "global_step": 315934, "epoch": 2611} {"train_loss": -43.57880401611328, "global_step": 315935, "epoch": 2611} {"train_loss": -44.23014450073242, "global_step": 315936, "epoch": 2611} {"train_loss": -43.387489318847656, "global_step": 315937, "epoch": 2611} {"train_loss": -43.4294319152832, "global_step": 315938, "epoch": 2611} {"train_loss": -44.3613166809082, "global_step": 315939, "epoch": 2611} {"train_loss": -43.594844818115234, "global_step": 315940, "epoch": 2611} {"train_loss": -43.86478805541992, "global_step": 315941, "epoch": 2611} {"train_loss": -44.12541198730469, "global_step": 315942, "epoch": 2611} {"train_loss": -43.99843215942383, "global_step": 315943, "epoch": 2611} {"train_loss": -44.32728958129883, "global_step": 315944, "epoch": 2611} {"train_loss": -43.91120910644531, "global_step": 315945, "epoch": 2611} {"train_loss": -44.112239837646484, "global_step": 315946, "epoch": 2611} {"train_loss": -44.60352325439453, "global_step": 315947, "epoch": 2611} {"train_loss": -44.8840446472168, "global_step": 315948, "epoch": 2611} {"train_loss": -44.600894927978516, "global_step": 315949, "epoch": 2611} {"train_loss": -44.77850341796875, "global_step": 315950, "epoch": 2611} {"train_loss": -44.60505294799805, "global_step": 315951, "epoch": 2611} {"train_loss": -45.105709075927734, "global_step": 315952, "epoch": 2611} {"train_loss": -44.99964904785156, "global_step": 315953, "epoch": 2611} {"train_loss": -44.7809944152832, "global_step": 315954, "epoch": 2611} {"train_loss": -44.93292999267578, "global_step": 315955, "epoch": 2611} {"train_loss": -44.862030029296875, "global_step": 315956, "epoch": 2611} {"train_loss": -44.68978500366211, "global_step": 315957, "epoch": 2611} {"train_loss": -45.1698112487793, "global_step": 315958, "epoch": 2611} {"train_loss": -44.34007263183594, "global_step": 315959, "epoch": 2611} {"train_loss": -44.589813232421875, "global_step": 315960, "epoch": 2611} {"train_loss": -44.5710334777832, "global_step": 315961, "epoch": 2611} {"train_loss": -45.02545928955078, "global_step": 315962, "epoch": 2611} {"train_loss": -43.97277069091797, "global_step": 315963, "epoch": 2611} {"train_loss": -44.664764404296875, "global_step": 315964, "epoch": 2611} {"train_loss": -44.948665618896484, "global_step": 315965, "epoch": 2611} {"train_loss": -44.61520767211914, "global_step": 315966, "epoch": 2611} {"train_loss": -44.557613372802734, "global_step": 315967, "epoch": 2611} {"train_loss": -45.182369232177734, "global_step": 315968, "epoch": 2611} {"train_loss": -44.71657180786133, "global_step": 315969, "epoch": 2611} {"train_loss": -44.29829025268555, "global_step": 315970, "epoch": 2611} {"train_loss": -44.20585250854492, "global_step": 315971, "epoch": 2611} {"train_loss": -44.808380126953125, "global_step": 315972, "epoch": 2611} {"train_loss": -45.48538589477539, "global_step": 315973, "epoch": 2611} {"train_loss": -44.81949996948242, "global_step": 315974, "epoch": 2611} {"train_loss": -44.81494903564453, "global_step": 315975, "epoch": 2611} {"train_loss": -44.77618408203125, "global_step": 315976, "epoch": 2611} {"train_loss": -44.83027267456055, "global_step": 315977, "epoch": 2611} {"train_loss": -44.821807861328125, "global_step": 315978, "epoch": 2611} {"train_loss": -44.02668380737305, "global_step": 315979, "epoch": 2611} {"train_loss": -43.69290542602539, "global_step": 315980, "epoch": 2611} {"train_loss": -42.72524642944336, "global_step": 315981, "epoch": 2611} {"train_loss": -43.97772216796875, "global_step": 315982, "epoch": 2611} {"train_loss": -44.55985641479492, "global_step": 315983, "epoch": 2611} {"train_loss": -43.71162033081055, "global_step": 315984, "epoch": 2611} {"train_loss": -42.51838684082031, "global_step": 315985, "epoch": 2611} {"train_loss": -43.996273040771484, "global_step": 315986, "epoch": 2611} {"train_loss": -44.376827239990234, "global_step": 315987, "epoch": 2611} {"train_loss": -42.71494674682617, "global_step": 315988, "epoch": 2611} {"train_loss": -42.130165100097656, "global_step": 315989, "epoch": 2611} {"train_loss": -41.274818420410156, "global_step": 315990, "epoch": 2611} {"train_loss": -42.953025817871094, "global_step": 315991, "epoch": 2611} {"train_loss": -43.550262451171875, "global_step": 315992, "epoch": 2611} {"train_loss": -44.19794464111328, "global_step": 315993, "epoch": 2611} {"train_loss": -43.2414665222168, "global_step": 315994, "epoch": 2611} {"train_loss": -42.9448356628418, "global_step": 315995, "epoch": 2611} {"train_loss": -44.09654998779297, "global_step": 315996, "epoch": 2611} {"train_loss": -42.966304779052734, "global_step": 315997, "epoch": 2611} {"train_loss": -41.42662811279297, "global_step": 315998, "epoch": 2611} {"train_loss": -44.68534469604492, "global_step": 315999, "epoch": 2611} {"train_loss": -43.49934005737305, "global_step": 316000, "epoch": 2611} {"train_loss": -42.20232009887695, "global_step": 316001, "epoch": 2611} {"train_loss": -43.941036224365234, "global_step": 316002, "epoch": 2611} {"train_loss": -42.469730377197266, "global_step": 316003, "epoch": 2611} {"train_loss": -42.34512710571289, "global_step": 316004, "epoch": 2611} {"train_loss": -43.105567932128906, "global_step": 316005, "epoch": 2611} {"train_loss": -43.29281234741211, "global_step": 316006, "epoch": 2611} {"train_loss": -43.349891662597656, "global_step": 316007, "epoch": 2611} {"train_loss": -43.22609329223633, "global_step": 316008, "epoch": 2611} {"train_loss": -43.317108154296875, "global_step": 316009, "epoch": 2611} {"train_loss": -44.017494201660156, "global_step": 316010, "epoch": 2611} {"train_loss": -42.61790084838867, "global_step": 316011, "epoch": 2611} {"train_loss": -42.67649459838867, "global_step": 316012, "epoch": 2611} {"train_loss": -43.11320114135742, "global_step": 316013, "epoch": 2611} {"train_loss": -43.222557067871094, "global_step": 316014, "epoch": 2611} {"train_loss": -42.7746467590332, "global_step": 316015, "epoch": 2611} {"train_loss": -43.83544158935547, "global_step": 316016, "epoch": 2611} {"train_loss": -43.52437210083008, "global_step": 316017, "epoch": 2611} {"train_loss": -43.84330368041992, "global_step": 316018, "epoch": 2611} {"train_loss": -43.9703369140625, "global_step": 316019, "epoch": 2611} {"train_loss": -43.77577209472656, "global_step": 316020, "epoch": 2611} {"train_loss": -43.684932708740234, "global_step": 316021, "epoch": 2611} {"train_loss": -42.08742904663086, "global_step": 316022, "epoch": 2611} {"train_loss": -43.48199462890625, "global_step": 316023, "epoch": 2611} {"train_loss": -42.48075485229492, "global_step": 316024, "epoch": 2611} {"train_loss": -42.734004974365234, "global_step": 316025, "epoch": 2611} {"train_loss": -42.03108596801758, "global_step": 316026, "epoch": 2611} {"train_loss": -43.83723068237305, "global_step": 316027, "epoch": 2611} {"train_loss": -43.420654296875, "global_step": 316028, "epoch": 2611} {"train_loss": -43.57575607299805, "global_step": 316029, "epoch": 2611} {"train_loss": -42.70500564575195, "global_step": 316030, "epoch": 2611} {"train_loss": -43.82001876831055, "global_step": 316031, "epoch": 2611} {"train_loss": -43.770992279052734, "global_step": 316032, "epoch": 2611} {"train_loss": -43.27425765991211, "global_step": 316033, "epoch": 2611} {"train_loss": -44.246238708496094, "global_step": 316034, "epoch": 2611} {"train_loss": -44.337337493896484, "global_step": 316035, "epoch": 2611} {"train_loss": -43.953758239746094, "global_step": 316036, "epoch": 2611} {"train_loss": -44.28807067871094, "global_step": 316037, "epoch": 2611} {"train_loss": -44.611568450927734, "global_step": 316038, "epoch": 2611} {"train_loss": -44.27494430541992, "global_step": 316039, "epoch": 2611} {"train_loss": -43.49188995361328, "global_step": 316040, "epoch": 2611} {"train_loss": -44.48188400268555, "global_step": 316041, "epoch": 2611} {"train_loss": -43.9703369140625, "global_step": 316042, "epoch": 2611} {"train_loss": -42.72471237182617, "global_step": 316043, "epoch": 2611} {"train_loss": -44.20164489746094, "global_step": 316044, "epoch": 2611} {"train_loss": -44.608665466308594, "global_step": 316045, "epoch": 2611} {"train_loss": -42.88460159301758, "global_step": 316046, "epoch": 2611} {"train_loss": -43.76070785522461, "global_step": 316047, "epoch": 2611} {"train_loss": -44.61501693725586, "global_step": 316048, "epoch": 2611} {"train_loss": -43.145484924316406, "global_step": 316049, "epoch": 2611} {"train_loss": -44.4570426940918, "global_step": 316050, "epoch": 2611} {"train_loss": -43.84312735313226, "global_step": 316051, "epoch": 2611, "val_loss": 2716174.75} {"train_loss": -43.62803268432617, "global_step": 316052, "epoch": 2612} {"train_loss": -44.54777145385742, "global_step": 316053, "epoch": 2612} {"train_loss": -44.5693359375, "global_step": 316054, "epoch": 2612} {"train_loss": -43.6762580871582, "global_step": 316055, "epoch": 2612} {"train_loss": -44.65748596191406, "global_step": 316056, "epoch": 2612} {"train_loss": -43.349300384521484, "global_step": 316057, "epoch": 2612} {"train_loss": -44.39980697631836, "global_step": 316058, "epoch": 2612} {"train_loss": -44.14575958251953, "global_step": 316059, "epoch": 2612} {"train_loss": -43.069252014160156, "global_step": 316060, "epoch": 2612} {"train_loss": -44.55976486206055, "global_step": 316061, "epoch": 2612} {"train_loss": -43.800048828125, "global_step": 316062, "epoch": 2612} {"train_loss": -43.825416564941406, "global_step": 316063, "epoch": 2612} {"train_loss": -44.445274353027344, "global_step": 316064, "epoch": 2612} {"train_loss": -44.395057678222656, "global_step": 316065, "epoch": 2612} {"train_loss": -44.706783294677734, "global_step": 316066, "epoch": 2612} {"train_loss": -44.47834396362305, "global_step": 316067, "epoch": 2612} {"train_loss": -44.452999114990234, "global_step": 316068, "epoch": 2612} {"train_loss": -44.60578918457031, "global_step": 316069, "epoch": 2612} {"train_loss": -44.582733154296875, "global_step": 316070, "epoch": 2612} {"train_loss": -45.024837493896484, "global_step": 316071, "epoch": 2612} {"train_loss": -44.17750930786133, "global_step": 316072, "epoch": 2612} {"train_loss": -44.736366271972656, "global_step": 316073, "epoch": 2612} {"train_loss": -44.878997802734375, "global_step": 316074, "epoch": 2612} {"train_loss": -44.75630187988281, "global_step": 316075, "epoch": 2612} {"train_loss": -44.174560546875, "global_step": 316076, "epoch": 2612} {"train_loss": -44.7237663269043, "global_step": 316077, "epoch": 2612} {"train_loss": -40.264949798583984, "global_step": 316078, "epoch": 2612} {"train_loss": -44.40576171875, "global_step": 316079, "epoch": 2612} {"train_loss": -44.56800079345703, "global_step": 316080, "epoch": 2612} {"train_loss": -44.78923797607422, "global_step": 316081, "epoch": 2612} {"train_loss": -44.220890045166016, "global_step": 316082, "epoch": 2612} {"train_loss": -45.028011322021484, "global_step": 316083, "epoch": 2612} {"train_loss": -38.03417205810547, "global_step": 316084, "epoch": 2612} {"train_loss": -30.211851119995117, "global_step": 316085, "epoch": 2612} {"train_loss": -42.0291748046875, "global_step": 316086, "epoch": 2612} {"train_loss": -40.353515625, "global_step": 316087, "epoch": 2612} {"train_loss": -40.6307373046875, "global_step": 316088, "epoch": 2612} {"train_loss": -16.146516799926758, "global_step": 316089, "epoch": 2612} {"train_loss": -40.58018112182617, "global_step": 316090, "epoch": 2612} {"train_loss": -36.454830169677734, "global_step": 316091, "epoch": 2612} {"train_loss": -26.162878036499023, "global_step": 316092, "epoch": 2612} {"train_loss": -36.7916145324707, "global_step": 316093, "epoch": 2612} {"train_loss": -17.250261306762695, "global_step": 316094, "epoch": 2612} {"train_loss": -27.685001373291016, "global_step": 316095, "epoch": 2612} {"train_loss": -36.15932083129883, "global_step": 316096, "epoch": 2612} {"train_loss": -38.0910758972168, "global_step": 316097, "epoch": 2612} {"train_loss": -29.86240005493164, "global_step": 316098, "epoch": 2612} {"train_loss": -34.26997375488281, "global_step": 316099, "epoch": 2612} {"train_loss": -32.259620666503906, "global_step": 316100, "epoch": 2612} {"train_loss": -3.3981308937072754, "global_step": 316101, "epoch": 2612} {"train_loss": -20.8719539642334, "global_step": 316102, "epoch": 2612} {"train_loss": -29.087146759033203, "global_step": 316103, "epoch": 2612} {"train_loss": -36.135658264160156, "global_step": 316104, "epoch": 2612} {"train_loss": -32.23373031616211, "global_step": 316105, "epoch": 2612} {"train_loss": -27.57596206665039, "global_step": 316106, "epoch": 2612} {"train_loss": -30.073087692260742, "global_step": 316107, "epoch": 2612} {"train_loss": -32.87763595581055, "global_step": 316108, "epoch": 2612} {"train_loss": -37.55672073364258, "global_step": 316109, "epoch": 2612} {"train_loss": -35.32170486450195, "global_step": 316110, "epoch": 2612} {"train_loss": -35.48224639892578, "global_step": 316111, "epoch": 2612} {"train_loss": -36.04475021362305, "global_step": 316112, "epoch": 2612} {"train_loss": -35.787288665771484, "global_step": 316113, "epoch": 2612} {"train_loss": -36.78156280517578, "global_step": 316114, "epoch": 2612} {"train_loss": -36.814170837402344, "global_step": 316115, "epoch": 2612} {"train_loss": -37.295658111572266, "global_step": 316116, "epoch": 2612} {"train_loss": -37.551631927490234, "global_step": 316117, "epoch": 2612} {"train_loss": -36.96402359008789, "global_step": 316118, "epoch": 2612} {"train_loss": -36.69797897338867, "global_step": 316119, "epoch": 2612} {"train_loss": -34.84563064575195, "global_step": 316120, "epoch": 2612} {"train_loss": -39.1440544128418, "global_step": 316121, "epoch": 2612} {"train_loss": -38.15153884887695, "global_step": 316122, "epoch": 2612} {"train_loss": -38.798336029052734, "global_step": 316123, "epoch": 2612} {"train_loss": -37.358646392822266, "global_step": 316124, "epoch": 2612} {"train_loss": -39.49412155151367, "global_step": 316125, "epoch": 2612} {"train_loss": -37.39875411987305, "global_step": 316126, "epoch": 2612} {"train_loss": -38.85638427734375, "global_step": 316127, "epoch": 2612} {"train_loss": -38.47754669189453, "global_step": 316128, "epoch": 2612} {"train_loss": -39.13381576538086, "global_step": 316129, "epoch": 2612} {"train_loss": -38.36871337890625, "global_step": 316130, "epoch": 2612} {"train_loss": -39.6531982421875, "global_step": 316131, "epoch": 2612} {"train_loss": -36.31638717651367, "global_step": 316132, "epoch": 2612} {"train_loss": -39.234100341796875, "global_step": 316133, "epoch": 2612} {"train_loss": -40.06150436401367, "global_step": 316134, "epoch": 2612} {"train_loss": -39.720333099365234, "global_step": 316135, "epoch": 2612} {"train_loss": -38.849609375, "global_step": 316136, "epoch": 2612} {"train_loss": -39.61893844604492, "global_step": 316137, "epoch": 2612} {"train_loss": -39.76015090942383, "global_step": 316138, "epoch": 2612} {"train_loss": -39.566062927246094, "global_step": 316139, "epoch": 2612} {"train_loss": -39.07322311401367, "global_step": 316140, "epoch": 2612} {"train_loss": -40.22520065307617, "global_step": 316141, "epoch": 2612} {"train_loss": -39.77803421020508, "global_step": 316142, "epoch": 2612} {"train_loss": -38.963050842285156, "global_step": 316143, "epoch": 2612} {"train_loss": -39.355186462402344, "global_step": 316144, "epoch": 2612} {"train_loss": -39.09669876098633, "global_step": 316145, "epoch": 2612} {"train_loss": -40.40273666381836, "global_step": 316146, "epoch": 2612} {"train_loss": -40.60274124145508, "global_step": 316147, "epoch": 2612} {"train_loss": -40.39695358276367, "global_step": 316148, "epoch": 2612} {"train_loss": -39.51167678833008, "global_step": 316149, "epoch": 2612} {"train_loss": -40.766788482666016, "global_step": 316150, "epoch": 2612} {"train_loss": -40.499366760253906, "global_step": 316151, "epoch": 2612} {"train_loss": -39.90483474731445, "global_step": 316152, "epoch": 2612} {"train_loss": -41.61909866333008, "global_step": 316153, "epoch": 2612} {"train_loss": -41.09480285644531, "global_step": 316154, "epoch": 2612} {"train_loss": -40.04059982299805, "global_step": 316155, "epoch": 2612} {"train_loss": -39.70893096923828, "global_step": 316156, "epoch": 2612} {"train_loss": -41.75746154785156, "global_step": 316157, "epoch": 2612} {"train_loss": -40.6162109375, "global_step": 316158, "epoch": 2612} {"train_loss": -41.34292221069336, "global_step": 316159, "epoch": 2612} {"train_loss": -39.970977783203125, "global_step": 316160, "epoch": 2612} {"train_loss": -39.30116271972656, "global_step": 316161, "epoch": 2612} {"train_loss": -41.529930114746094, "global_step": 316162, "epoch": 2612} {"train_loss": -39.977474212646484, "global_step": 316163, "epoch": 2612} {"train_loss": -41.88833236694336, "global_step": 316164, "epoch": 2612} {"train_loss": -41.466766357421875, "global_step": 316165, "epoch": 2612} {"train_loss": -39.58850860595703, "global_step": 316166, "epoch": 2612} {"train_loss": -41.526832580566406, "global_step": 316167, "epoch": 2612} {"train_loss": -40.97661209106445, "global_step": 316168, "epoch": 2612} {"train_loss": -41.40156936645508, "global_step": 316169, "epoch": 2612} {"train_loss": -40.60299301147461, "global_step": 316170, "epoch": 2612} {"train_loss": -40.70488357543945, "global_step": 316171, "epoch": 2612} {"train_loss": -38.848016049251086, "global_step": 316172, "epoch": 2612, "val_loss": 2579975.25} {"train_loss": -41.59001541137695, "global_step": 316173, "epoch": 2613} {"train_loss": -41.7713737487793, "global_step": 316174, "epoch": 2613} {"train_loss": -41.04705810546875, "global_step": 316175, "epoch": 2613} {"train_loss": -42.185447692871094, "global_step": 316176, "epoch": 2613} {"train_loss": -39.29751205444336, "global_step": 316177, "epoch": 2613} {"train_loss": -41.859413146972656, "global_step": 316178, "epoch": 2613} {"train_loss": -40.33699417114258, "global_step": 316179, "epoch": 2613} {"train_loss": -42.38016891479492, "global_step": 316180, "epoch": 2613} {"train_loss": -42.39697265625, "global_step": 316181, "epoch": 2613} {"train_loss": -41.72587203979492, "global_step": 316182, "epoch": 2613} {"train_loss": -41.31373977661133, "global_step": 316183, "epoch": 2613} {"train_loss": -41.716033935546875, "global_step": 316184, "epoch": 2613} {"train_loss": -42.246097564697266, "global_step": 316185, "epoch": 2613} {"train_loss": -41.85540771484375, "global_step": 316186, "epoch": 2613} {"train_loss": -42.64481735229492, "global_step": 316187, "epoch": 2613} {"train_loss": -42.29165267944336, "global_step": 316188, "epoch": 2613} {"train_loss": -41.891357421875, "global_step": 316189, "epoch": 2613} {"train_loss": -40.60540771484375, "global_step": 316190, "epoch": 2613} {"train_loss": -41.990150451660156, "global_step": 316191, "epoch": 2613} {"train_loss": -41.6097412109375, "global_step": 316192, "epoch": 2613} {"train_loss": -41.654273986816406, "global_step": 316193, "epoch": 2613} {"train_loss": -41.265411376953125, "global_step": 316194, "epoch": 2613} {"train_loss": -42.462440490722656, "global_step": 316195, "epoch": 2613} {"train_loss": -42.28446578979492, "global_step": 316196, "epoch": 2613} {"train_loss": -42.726261138916016, "global_step": 316197, "epoch": 2613} {"train_loss": -41.98596954345703, "global_step": 316198, "epoch": 2613} {"train_loss": -41.96617889404297, "global_step": 316199, "epoch": 2613} {"train_loss": -41.111976623535156, "global_step": 316200, "epoch": 2613} {"train_loss": -41.90704345703125, "global_step": 316201, "epoch": 2613} {"train_loss": -42.677486419677734, "global_step": 316202, "epoch": 2613} {"train_loss": -41.83126449584961, "global_step": 316203, "epoch": 2613} {"train_loss": -42.71338653564453, "global_step": 316204, "epoch": 2613} {"train_loss": -36.84439468383789, "global_step": 316205, "epoch": 2613} {"train_loss": -41.979915618896484, "global_step": 316206, "epoch": 2613} {"train_loss": -42.12276840209961, "global_step": 316207, "epoch": 2613} {"train_loss": -42.830055236816406, "global_step": 316208, "epoch": 2613} {"train_loss": -42.82193374633789, "global_step": 316209, "epoch": 2613} {"train_loss": -42.13496017456055, "global_step": 316210, "epoch": 2613} {"train_loss": -42.41415786743164, "global_step": 316211, "epoch": 2613} {"train_loss": -42.372005462646484, "global_step": 316212, "epoch": 2613} {"train_loss": -42.865421295166016, "global_step": 316213, "epoch": 2613} {"train_loss": -41.44108963012695, "global_step": 316214, "epoch": 2613} {"train_loss": -42.900394439697266, "global_step": 316215, "epoch": 2613} {"train_loss": -41.805763244628906, "global_step": 316216, "epoch": 2613} {"train_loss": -42.97987747192383, "global_step": 316217, "epoch": 2613} {"train_loss": -41.64863204956055, "global_step": 316218, "epoch": 2613} {"train_loss": -41.98782730102539, "global_step": 316219, "epoch": 2613} {"train_loss": -42.02552032470703, "global_step": 316220, "epoch": 2613} {"train_loss": -42.792449951171875, "global_step": 316221, "epoch": 2613} {"train_loss": -41.946746826171875, "global_step": 316222, "epoch": 2613} {"train_loss": -41.3939323425293, "global_step": 316223, "epoch": 2613} {"train_loss": -42.27970886230469, "global_step": 316224, "epoch": 2613} {"train_loss": -42.09650802612305, "global_step": 316225, "epoch": 2613} {"train_loss": -41.891517639160156, "global_step": 316226, "epoch": 2613} {"train_loss": -43.24151611328125, "global_step": 316227, "epoch": 2613} {"train_loss": -43.11956787109375, "global_step": 316228, "epoch": 2613} {"train_loss": -42.6572380065918, "global_step": 316229, "epoch": 2613} {"train_loss": -43.731590270996094, "global_step": 316230, "epoch": 2613} {"train_loss": -43.147640228271484, "global_step": 316231, "epoch": 2613} {"train_loss": -41.58173370361328, "global_step": 316232, "epoch": 2613} {"train_loss": -42.7099494934082, "global_step": 316233, "epoch": 2613} {"train_loss": -43.115150451660156, "global_step": 316234, "epoch": 2613} {"train_loss": -42.61015319824219, "global_step": 316235, "epoch": 2613} {"train_loss": -43.46773910522461, "global_step": 316236, "epoch": 2613} {"train_loss": -43.161834716796875, "global_step": 316237, "epoch": 2613} {"train_loss": -42.16550064086914, "global_step": 316238, "epoch": 2613} {"train_loss": -43.2032470703125, "global_step": 316239, "epoch": 2613} {"train_loss": -42.88190460205078, "global_step": 316240, "epoch": 2613} {"train_loss": -42.971900939941406, "global_step": 316241, "epoch": 2613} {"train_loss": -42.45396041870117, "global_step": 316242, "epoch": 2613} {"train_loss": -43.99281692504883, "global_step": 316243, "epoch": 2613} {"train_loss": -42.66621017456055, "global_step": 316244, "epoch": 2613} {"train_loss": -43.811912536621094, "global_step": 316245, "epoch": 2613} {"train_loss": -42.688045501708984, "global_step": 316246, "epoch": 2613} {"train_loss": -42.22793197631836, "global_step": 316247, "epoch": 2613} {"train_loss": -43.64759826660156, "global_step": 316248, "epoch": 2613} {"train_loss": -43.48922348022461, "global_step": 316249, "epoch": 2613} {"train_loss": -42.01459503173828, "global_step": 316250, "epoch": 2613} {"train_loss": -43.42802429199219, "global_step": 316251, "epoch": 2613} {"train_loss": -42.731971740722656, "global_step": 316252, "epoch": 2613} {"train_loss": -43.7522087097168, "global_step": 316253, "epoch": 2613} {"train_loss": -42.83994674682617, "global_step": 316254, "epoch": 2613} {"train_loss": -43.30120849609375, "global_step": 316255, "epoch": 2613} {"train_loss": -43.56380081176758, "global_step": 316256, "epoch": 2613} {"train_loss": -43.861873626708984, "global_step": 316257, "epoch": 2613} {"train_loss": -43.99702835083008, "global_step": 316258, "epoch": 2613} {"train_loss": -43.49628448486328, "global_step": 316259, "epoch": 2613} {"train_loss": -43.7032470703125, "global_step": 316260, "epoch": 2613} {"train_loss": -43.13058853149414, "global_step": 316261, "epoch": 2613} {"train_loss": -43.73160171508789, "global_step": 316262, "epoch": 2613} {"train_loss": -43.9371337890625, "global_step": 316263, "epoch": 2613} {"train_loss": -43.74153518676758, "global_step": 316264, "epoch": 2613} {"train_loss": -42.93495559692383, "global_step": 316265, "epoch": 2613} {"train_loss": -43.52964401245117, "global_step": 316266, "epoch": 2613} {"train_loss": -43.682308197021484, "global_step": 316267, "epoch": 2613} {"train_loss": -43.63528823852539, "global_step": 316268, "epoch": 2613} {"train_loss": -43.53860092163086, "global_step": 316269, "epoch": 2613} {"train_loss": -43.84697723388672, "global_step": 316270, "epoch": 2613} {"train_loss": -43.620975494384766, "global_step": 316271, "epoch": 2613} {"train_loss": -43.201499938964844, "global_step": 316272, "epoch": 2613} {"train_loss": -43.44172286987305, "global_step": 316273, "epoch": 2613} {"train_loss": -43.044677734375, "global_step": 316274, "epoch": 2613} {"train_loss": -43.47256088256836, "global_step": 316275, "epoch": 2613} {"train_loss": -44.18058776855469, "global_step": 316276, "epoch": 2613} {"train_loss": -43.80485534667969, "global_step": 316277, "epoch": 2613} {"train_loss": -43.73655319213867, "global_step": 316278, "epoch": 2613} {"train_loss": -44.11361312866211, "global_step": 316279, "epoch": 2613} {"train_loss": -43.7811279296875, "global_step": 316280, "epoch": 2613} {"train_loss": -43.74570846557617, "global_step": 316281, "epoch": 2613} {"train_loss": -44.363155364990234, "global_step": 316282, "epoch": 2613} {"train_loss": -42.93675231933594, "global_step": 316283, "epoch": 2613} {"train_loss": -43.31476593017578, "global_step": 316284, "epoch": 2613} {"train_loss": -43.207088470458984, "global_step": 316285, "epoch": 2613} {"train_loss": -43.92710494995117, "global_step": 316286, "epoch": 2613} {"train_loss": -42.721736907958984, "global_step": 316287, "epoch": 2613} {"train_loss": -43.79134750366211, "global_step": 316288, "epoch": 2613} {"train_loss": -44.006439208984375, "global_step": 316289, "epoch": 2613} {"train_loss": -44.52595520019531, "global_step": 316290, "epoch": 2613} {"train_loss": -43.84247970581055, "global_step": 316291, "epoch": 2613} {"train_loss": -43.20730209350586, "global_step": 316292, "epoch": 2613} {"train_loss": -42.69165086352135, "global_step": 316293, "epoch": 2613, "val_loss": 2649931.25} {"train_loss": -44.55670928955078, "global_step": 316294, "epoch": 2614} {"train_loss": -43.981109619140625, "global_step": 316295, "epoch": 2614} {"train_loss": -42.55103302001953, "global_step": 316296, "epoch": 2614} {"train_loss": -43.594451904296875, "global_step": 316297, "epoch": 2614} {"train_loss": -42.05912399291992, "global_step": 316298, "epoch": 2614} {"train_loss": -43.50785446166992, "global_step": 316299, "epoch": 2614} {"train_loss": -42.378231048583984, "global_step": 316300, "epoch": 2614} {"train_loss": -44.000770568847656, "global_step": 316301, "epoch": 2614} {"train_loss": -41.56586837768555, "global_step": 316302, "epoch": 2614} {"train_loss": -42.89200973510742, "global_step": 316303, "epoch": 2614} {"train_loss": -43.18748474121094, "global_step": 316304, "epoch": 2614} {"train_loss": -42.93183135986328, "global_step": 316305, "epoch": 2614} {"train_loss": -43.32014846801758, "global_step": 316306, "epoch": 2614} {"train_loss": -43.45600128173828, "global_step": 316307, "epoch": 2614} {"train_loss": -42.433895111083984, "global_step": 316308, "epoch": 2614} {"train_loss": -44.03386688232422, "global_step": 316309, "epoch": 2614} {"train_loss": -42.86025619506836, "global_step": 316310, "epoch": 2614} {"train_loss": -43.220130920410156, "global_step": 316311, "epoch": 2614} {"train_loss": -43.35575485229492, "global_step": 316312, "epoch": 2614} {"train_loss": -43.75284957885742, "global_step": 316313, "epoch": 2614} {"train_loss": -42.674522399902344, "global_step": 316314, "epoch": 2614} {"train_loss": -43.712646484375, "global_step": 316315, "epoch": 2614} {"train_loss": -42.267120361328125, "global_step": 316316, "epoch": 2614} {"train_loss": -42.89436340332031, "global_step": 316317, "epoch": 2614} {"train_loss": -43.0373649597168, "global_step": 316318, "epoch": 2614} {"train_loss": -43.702064514160156, "global_step": 316319, "epoch": 2614} {"train_loss": -42.80100631713867, "global_step": 316320, "epoch": 2614} {"train_loss": -42.5142936706543, "global_step": 316321, "epoch": 2614} {"train_loss": -42.83112335205078, "global_step": 316322, "epoch": 2614} {"train_loss": -42.4034538269043, "global_step": 316323, "epoch": 2614} {"train_loss": -43.72528839111328, "global_step": 316324, "epoch": 2614} {"train_loss": -43.427005767822266, "global_step": 316325, "epoch": 2614} {"train_loss": -43.08108139038086, "global_step": 316326, "epoch": 2614} {"train_loss": -43.40523910522461, "global_step": 316327, "epoch": 2614} {"train_loss": -42.57723617553711, "global_step": 316328, "epoch": 2614} {"train_loss": -40.44453048706055, "global_step": 316329, "epoch": 2614} {"train_loss": -41.5816764831543, "global_step": 316330, "epoch": 2614} {"train_loss": -42.4310302734375, "global_step": 316331, "epoch": 2614} {"train_loss": -42.7746696472168, "global_step": 316332, "epoch": 2614} {"train_loss": -41.92000198364258, "global_step": 316333, "epoch": 2614} {"train_loss": -41.943145751953125, "global_step": 316334, "epoch": 2614} {"train_loss": -43.63529586791992, "global_step": 316335, "epoch": 2614} {"train_loss": -42.697540283203125, "global_step": 316336, "epoch": 2614} {"train_loss": -40.968841552734375, "global_step": 316337, "epoch": 2614} {"train_loss": -43.21213912963867, "global_step": 316338, "epoch": 2614} {"train_loss": -42.979488372802734, "global_step": 316339, "epoch": 2614} {"train_loss": -42.84487533569336, "global_step": 316340, "epoch": 2614} {"train_loss": -42.221622467041016, "global_step": 316341, "epoch": 2614} {"train_loss": -43.32038497924805, "global_step": 316342, "epoch": 2614} {"train_loss": -42.621883392333984, "global_step": 316343, "epoch": 2614} {"train_loss": -42.77946090698242, "global_step": 316344, "epoch": 2614} {"train_loss": -42.46641540527344, "global_step": 316345, "epoch": 2614} {"train_loss": -42.78335189819336, "global_step": 316346, "epoch": 2614} {"train_loss": -42.32058334350586, "global_step": 316347, "epoch": 2614} {"train_loss": -43.49201202392578, "global_step": 316348, "epoch": 2614} {"train_loss": -42.05038070678711, "global_step": 316349, "epoch": 2614} {"train_loss": -42.961727142333984, "global_step": 316350, "epoch": 2614} {"train_loss": -42.63597106933594, "global_step": 316351, "epoch": 2614} {"train_loss": -41.50214767456055, "global_step": 316352, "epoch": 2614} {"train_loss": -41.59645462036133, "global_step": 316353, "epoch": 2614} {"train_loss": -41.364463806152344, "global_step": 316354, "epoch": 2614} {"train_loss": -41.16903305053711, "global_step": 316355, "epoch": 2614} {"train_loss": -42.24895477294922, "global_step": 316356, "epoch": 2614} {"train_loss": -42.334938049316406, "global_step": 316357, "epoch": 2614} {"train_loss": -42.1441535949707, "global_step": 316358, "epoch": 2614} {"train_loss": -43.059844970703125, "global_step": 316359, "epoch": 2614} {"train_loss": -42.47756576538086, "global_step": 316360, "epoch": 2614} {"train_loss": -42.565860748291016, "global_step": 316361, "epoch": 2614} {"train_loss": -41.96775436401367, "global_step": 316362, "epoch": 2614} {"train_loss": -43.4797248840332, "global_step": 316363, "epoch": 2614} {"train_loss": -41.583377838134766, "global_step": 316364, "epoch": 2614} {"train_loss": -42.772804260253906, "global_step": 316365, "epoch": 2614} {"train_loss": -42.730770111083984, "global_step": 316366, "epoch": 2614} {"train_loss": -41.10221862792969, "global_step": 316367, "epoch": 2614} {"train_loss": -39.353118896484375, "global_step": 316368, "epoch": 2614} {"train_loss": -42.09067153930664, "global_step": 316369, "epoch": 2614} {"train_loss": -42.374446868896484, "global_step": 316370, "epoch": 2614} {"train_loss": -42.1109504699707, "global_step": 316371, "epoch": 2614} {"train_loss": -40.88685607910156, "global_step": 316372, "epoch": 2614} {"train_loss": -42.66440963745117, "global_step": 316373, "epoch": 2614} {"train_loss": -42.355140686035156, "global_step": 316374, "epoch": 2614} {"train_loss": -40.32913589477539, "global_step": 316375, "epoch": 2614} {"train_loss": -42.741947174072266, "global_step": 316376, "epoch": 2614} {"train_loss": -42.342933654785156, "global_step": 316377, "epoch": 2614} {"train_loss": -39.81817626953125, "global_step": 316378, "epoch": 2614} {"train_loss": -40.57322311401367, "global_step": 316379, "epoch": 2614} {"train_loss": -43.03449630737305, "global_step": 316380, "epoch": 2614} {"train_loss": -41.63172149658203, "global_step": 316381, "epoch": 2614} {"train_loss": -42.25051498413086, "global_step": 316382, "epoch": 2614} {"train_loss": -42.72669982910156, "global_step": 316383, "epoch": 2614} {"train_loss": -42.598323822021484, "global_step": 316384, "epoch": 2614} {"train_loss": -42.87897491455078, "global_step": 316385, "epoch": 2614} {"train_loss": -42.44572830200195, "global_step": 316386, "epoch": 2614} {"train_loss": -42.204402923583984, "global_step": 316387, "epoch": 2614} {"train_loss": -43.16847229003906, "global_step": 316388, "epoch": 2614} {"train_loss": -40.987335205078125, "global_step": 316389, "epoch": 2614} {"train_loss": -43.189701080322266, "global_step": 316390, "epoch": 2614} {"train_loss": -41.81196594238281, "global_step": 316391, "epoch": 2614} {"train_loss": -43.46539306640625, "global_step": 316392, "epoch": 2614} {"train_loss": -42.98249435424805, "global_step": 316393, "epoch": 2614} {"train_loss": -42.33880615234375, "global_step": 316394, "epoch": 2614} {"train_loss": -43.779937744140625, "global_step": 316395, "epoch": 2614} {"train_loss": -42.33358383178711, "global_step": 316396, "epoch": 2614} {"train_loss": -43.28791427612305, "global_step": 316397, "epoch": 2614} {"train_loss": -42.5672721862793, "global_step": 316398, "epoch": 2614} {"train_loss": -42.447715759277344, "global_step": 316399, "epoch": 2614} {"train_loss": -43.54084014892578, "global_step": 316400, "epoch": 2614} {"train_loss": -42.124874114990234, "global_step": 316401, "epoch": 2614} {"train_loss": -43.010467529296875, "global_step": 316402, "epoch": 2614} {"train_loss": -42.981956481933594, "global_step": 316403, "epoch": 2614} {"train_loss": -43.304046630859375, "global_step": 316404, "epoch": 2614} {"train_loss": -43.96419906616211, "global_step": 316405, "epoch": 2614} {"train_loss": -43.56290817260742, "global_step": 316406, "epoch": 2614} {"train_loss": -43.61606979370117, "global_step": 316407, "epoch": 2614} {"train_loss": -43.275936126708984, "global_step": 316408, "epoch": 2614} {"train_loss": -43.07571792602539, "global_step": 316409, "epoch": 2614} {"train_loss": -43.25593948364258, "global_step": 316410, "epoch": 2614} {"train_loss": -42.725341796875, "global_step": 316411, "epoch": 2614} {"train_loss": -43.39855194091797, "global_step": 316412, "epoch": 2614} {"train_loss": -43.066165924072266, "global_step": 316413, "epoch": 2614} {"train_loss": -42.63034848930422, "global_step": 316414, "epoch": 2614, "val_loss": 2669602.0} {"train_loss": -43.47334671020508, "global_step": 316415, "epoch": 2615} {"train_loss": -43.657928466796875, "global_step": 316416, "epoch": 2615} {"train_loss": -43.4212532043457, "global_step": 316417, "epoch": 2615} {"train_loss": -43.444515228271484, "global_step": 316418, "epoch": 2615} {"train_loss": -43.599388122558594, "global_step": 316419, "epoch": 2615} {"train_loss": -43.815399169921875, "global_step": 316420, "epoch": 2615} {"train_loss": -43.94256591796875, "global_step": 316421, "epoch": 2615} {"train_loss": -43.1802864074707, "global_step": 316422, "epoch": 2615} {"train_loss": -44.346534729003906, "global_step": 316423, "epoch": 2615} {"train_loss": -42.991943359375, "global_step": 316424, "epoch": 2615} {"train_loss": -44.16827392578125, "global_step": 316425, "epoch": 2615} {"train_loss": -44.065364837646484, "global_step": 316426, "epoch": 2615} {"train_loss": -43.93819808959961, "global_step": 316427, "epoch": 2615} {"train_loss": -44.09455490112305, "global_step": 316428, "epoch": 2615} {"train_loss": -43.48867416381836, "global_step": 316429, "epoch": 2615} {"train_loss": -44.47676467895508, "global_step": 316430, "epoch": 2615} {"train_loss": -43.81154251098633, "global_step": 316431, "epoch": 2615} {"train_loss": -42.93853759765625, "global_step": 316432, "epoch": 2615} {"train_loss": -43.25521469116211, "global_step": 316433, "epoch": 2615} {"train_loss": -43.8139533996582, "global_step": 316434, "epoch": 2615} {"train_loss": -42.98338317871094, "global_step": 316435, "epoch": 2615} {"train_loss": -43.957332611083984, "global_step": 316436, "epoch": 2615} {"train_loss": -43.86695098876953, "global_step": 316437, "epoch": 2615} {"train_loss": -43.456687927246094, "global_step": 316438, "epoch": 2615} {"train_loss": -44.303321838378906, "global_step": 316439, "epoch": 2615} {"train_loss": -44.21388626098633, "global_step": 316440, "epoch": 2615} {"train_loss": -43.30043411254883, "global_step": 316441, "epoch": 2615} {"train_loss": -43.67036056518555, "global_step": 316442, "epoch": 2615} {"train_loss": -44.57326889038086, "global_step": 316443, "epoch": 2615} {"train_loss": -43.69712448120117, "global_step": 316444, "epoch": 2615} {"train_loss": -44.51274490356445, "global_step": 316445, "epoch": 2615} {"train_loss": -44.69538116455078, "global_step": 316446, "epoch": 2615} {"train_loss": -44.118621826171875, "global_step": 316447, "epoch": 2615} {"train_loss": -43.71272659301758, "global_step": 316448, "epoch": 2615} {"train_loss": -44.80831527709961, "global_step": 316449, "epoch": 2615} {"train_loss": -44.17512893676758, "global_step": 316450, "epoch": 2615} {"train_loss": -44.56637954711914, "global_step": 316451, "epoch": 2615} {"train_loss": -44.75830078125, "global_step": 316452, "epoch": 2615} {"train_loss": -43.118343353271484, "global_step": 316453, "epoch": 2615} {"train_loss": -44.38039779663086, "global_step": 316454, "epoch": 2615} {"train_loss": -43.883758544921875, "global_step": 316455, "epoch": 2615} {"train_loss": -42.78157424926758, "global_step": 316456, "epoch": 2615} {"train_loss": -38.21224594116211, "global_step": 316457, "epoch": 2615} {"train_loss": -27.824914932250977, "global_step": 316458, "epoch": 2615} {"train_loss": -42.04478073120117, "global_step": 316459, "epoch": 2615} {"train_loss": -33.824520111083984, "global_step": 316460, "epoch": 2615} {"train_loss": -12.261515617370605, "global_step": 316461, "epoch": 2615} {"train_loss": -28.467609405517578, "global_step": 316462, "epoch": 2615} {"train_loss": -41.417945861816406, "global_step": 316463, "epoch": 2615} {"train_loss": -25.02971649169922, "global_step": 316464, "epoch": 2615} {"train_loss": -32.17279815673828, "global_step": 316465, "epoch": 2615} {"train_loss": -40.68331527709961, "global_step": 316466, "epoch": 2615} {"train_loss": -34.870582580566406, "global_step": 316467, "epoch": 2615} {"train_loss": -40.9510498046875, "global_step": 316468, "epoch": 2615} {"train_loss": -38.06997299194336, "global_step": 316469, "epoch": 2615} {"train_loss": -40.89988708496094, "global_step": 316470, "epoch": 2615} {"train_loss": -37.67082977294922, "global_step": 316471, "epoch": 2615} {"train_loss": -39.5996208190918, "global_step": 316472, "epoch": 2615} {"train_loss": -39.85493469238281, "global_step": 316473, "epoch": 2615} {"train_loss": -40.64702224731445, "global_step": 316474, "epoch": 2615} {"train_loss": -39.57444381713867, "global_step": 316475, "epoch": 2615} {"train_loss": -40.1339225769043, "global_step": 316476, "epoch": 2615} {"train_loss": -39.862918853759766, "global_step": 316477, "epoch": 2615} {"train_loss": -41.83140182495117, "global_step": 316478, "epoch": 2615} {"train_loss": -40.26008605957031, "global_step": 316479, "epoch": 2615} {"train_loss": -42.70693588256836, "global_step": 316480, "epoch": 2615} {"train_loss": -41.16368103027344, "global_step": 316481, "epoch": 2615} {"train_loss": -39.89870071411133, "global_step": 316482, "epoch": 2615} {"train_loss": -41.98335647583008, "global_step": 316483, "epoch": 2615} {"train_loss": -40.478328704833984, "global_step": 316484, "epoch": 2615} {"train_loss": -42.01485824584961, "global_step": 316485, "epoch": 2615} {"train_loss": -41.5611686706543, "global_step": 316486, "epoch": 2615} {"train_loss": -41.725826263427734, "global_step": 316487, "epoch": 2615} {"train_loss": -41.607967376708984, "global_step": 316488, "epoch": 2615} {"train_loss": -41.02455139160156, "global_step": 316489, "epoch": 2615} {"train_loss": -42.200862884521484, "global_step": 316490, "epoch": 2615} {"train_loss": -41.56635284423828, "global_step": 316491, "epoch": 2615} {"train_loss": -41.95623779296875, "global_step": 316492, "epoch": 2615} {"train_loss": -41.10590744018555, "global_step": 316493, "epoch": 2615} {"train_loss": -41.53679656982422, "global_step": 316494, "epoch": 2615} {"train_loss": -43.202030181884766, "global_step": 316495, "epoch": 2615} {"train_loss": -41.647701263427734, "global_step": 316496, "epoch": 2615} {"train_loss": -41.54423141479492, "global_step": 316497, "epoch": 2615} {"train_loss": -41.72304916381836, "global_step": 316498, "epoch": 2615} {"train_loss": -42.607177734375, "global_step": 316499, "epoch": 2615} {"train_loss": -42.10694885253906, "global_step": 316500, "epoch": 2615} {"train_loss": -42.78227233886719, "global_step": 316501, "epoch": 2615} {"train_loss": -40.2621955871582, "global_step": 316502, "epoch": 2615} {"train_loss": -43.01559066772461, "global_step": 316503, "epoch": 2615} {"train_loss": -42.80288314819336, "global_step": 316504, "epoch": 2615} {"train_loss": -42.61122512817383, "global_step": 316505, "epoch": 2615} {"train_loss": -42.36555099487305, "global_step": 316506, "epoch": 2615} {"train_loss": -42.975337982177734, "global_step": 316507, "epoch": 2615} {"train_loss": -43.10415267944336, "global_step": 316508, "epoch": 2615} {"train_loss": -43.49992370605469, "global_step": 316509, "epoch": 2615} {"train_loss": -43.32525634765625, "global_step": 316510, "epoch": 2615} {"train_loss": -43.09652328491211, "global_step": 316511, "epoch": 2615} {"train_loss": -42.53768539428711, "global_step": 316512, "epoch": 2615} {"train_loss": -42.073524475097656, "global_step": 316513, "epoch": 2615} {"train_loss": -42.67129135131836, "global_step": 316514, "epoch": 2615} {"train_loss": -43.225563049316406, "global_step": 316515, "epoch": 2615} {"train_loss": -43.48691940307617, "global_step": 316516, "epoch": 2615} {"train_loss": -43.58928298950195, "global_step": 316517, "epoch": 2615} {"train_loss": -43.15602111816406, "global_step": 316518, "epoch": 2615} {"train_loss": -42.65077590942383, "global_step": 316519, "epoch": 2615} {"train_loss": -42.6758918762207, "global_step": 316520, "epoch": 2615} {"train_loss": -43.502864837646484, "global_step": 316521, "epoch": 2615} {"train_loss": -42.9157829284668, "global_step": 316522, "epoch": 2615} {"train_loss": -43.531593322753906, "global_step": 316523, "epoch": 2615} {"train_loss": -43.09772491455078, "global_step": 316524, "epoch": 2615} {"train_loss": -43.42195129394531, "global_step": 316525, "epoch": 2615} {"train_loss": -43.68681716918945, "global_step": 316526, "epoch": 2615} {"train_loss": -42.67123031616211, "global_step": 316527, "epoch": 2615} {"train_loss": -43.990394592285156, "global_step": 316528, "epoch": 2615} {"train_loss": -43.71566390991211, "global_step": 316529, "epoch": 2615} {"train_loss": -43.635162353515625, "global_step": 316530, "epoch": 2615} {"train_loss": -44.06151580810547, "global_step": 316531, "epoch": 2615} {"train_loss": -43.72629928588867, "global_step": 316532, "epoch": 2615} {"train_loss": -43.774288177490234, "global_step": 316533, "epoch": 2615} {"train_loss": -43.08576583862305, "global_step": 316534, "epoch": 2615} {"train_loss": -41.8314790725708, "global_step": 316535, "epoch": 2615, "val_loss": 2789702.5} {"train_loss": -44.24280548095703, "global_step": 316536, "epoch": 2616} {"train_loss": -43.310638427734375, "global_step": 316537, "epoch": 2616} {"train_loss": -44.16205978393555, "global_step": 316538, "epoch": 2616} {"train_loss": -44.15608596801758, "global_step": 316539, "epoch": 2616} {"train_loss": -44.29606246948242, "global_step": 316540, "epoch": 2616} {"train_loss": -42.26250076293945, "global_step": 316541, "epoch": 2616} {"train_loss": -42.96105194091797, "global_step": 316542, "epoch": 2616} {"train_loss": -43.96200180053711, "global_step": 316543, "epoch": 2616} {"train_loss": -43.48896789550781, "global_step": 316544, "epoch": 2616} {"train_loss": -44.61390686035156, "global_step": 316545, "epoch": 2616} {"train_loss": -43.9508056640625, "global_step": 316546, "epoch": 2616} {"train_loss": -43.319000244140625, "global_step": 316547, "epoch": 2616} {"train_loss": -41.73200225830078, "global_step": 316548, "epoch": 2616} {"train_loss": -42.76015853881836, "global_step": 316549, "epoch": 2616} {"train_loss": -43.67279815673828, "global_step": 316550, "epoch": 2616} {"train_loss": -44.78913116455078, "global_step": 316551, "epoch": 2616} {"train_loss": -43.33220672607422, "global_step": 316552, "epoch": 2616} {"train_loss": -44.31681442260742, "global_step": 316553, "epoch": 2616} {"train_loss": -43.56965255737305, "global_step": 316554, "epoch": 2616} {"train_loss": -44.25283432006836, "global_step": 316555, "epoch": 2616} {"train_loss": -42.89085006713867, "global_step": 316556, "epoch": 2616} {"train_loss": -44.27841567993164, "global_step": 316557, "epoch": 2616} {"train_loss": -43.917686462402344, "global_step": 316558, "epoch": 2616} {"train_loss": -44.09076690673828, "global_step": 316559, "epoch": 2616} {"train_loss": -43.948516845703125, "global_step": 316560, "epoch": 2616} {"train_loss": -43.00532913208008, "global_step": 316561, "epoch": 2616} {"train_loss": -43.39387893676758, "global_step": 316562, "epoch": 2616} {"train_loss": -44.17158126831055, "global_step": 316563, "epoch": 2616} {"train_loss": -43.47635269165039, "global_step": 316564, "epoch": 2616} {"train_loss": -44.556480407714844, "global_step": 316565, "epoch": 2616} {"train_loss": -41.68008041381836, "global_step": 316566, "epoch": 2616} {"train_loss": -41.42305374145508, "global_step": 316567, "epoch": 2616} {"train_loss": -41.017974853515625, "global_step": 316568, "epoch": 2616} {"train_loss": -44.17161178588867, "global_step": 316569, "epoch": 2616} {"train_loss": -43.756263732910156, "global_step": 316570, "epoch": 2616} {"train_loss": -41.25078201293945, "global_step": 316571, "epoch": 2616} {"train_loss": -44.18041229248047, "global_step": 316572, "epoch": 2616} {"train_loss": -43.90229034423828, "global_step": 316573, "epoch": 2616} {"train_loss": -44.441585540771484, "global_step": 316574, "epoch": 2616} {"train_loss": -34.23579788208008, "global_step": 316575, "epoch": 2616} {"train_loss": -44.45174026489258, "global_step": 316576, "epoch": 2616} {"train_loss": -43.901790618896484, "global_step": 316577, "epoch": 2616} {"train_loss": -43.84917068481445, "global_step": 316578, "epoch": 2616} {"train_loss": -43.40169906616211, "global_step": 316579, "epoch": 2616} {"train_loss": -43.92407989501953, "global_step": 316580, "epoch": 2616} {"train_loss": -43.919403076171875, "global_step": 316581, "epoch": 2616} {"train_loss": -43.7619514465332, "global_step": 316582, "epoch": 2616} {"train_loss": -44.607295989990234, "global_step": 316583, "epoch": 2616} {"train_loss": -33.24082946777344, "global_step": 316584, "epoch": 2616} {"train_loss": -40.25808334350586, "global_step": 316585, "epoch": 2616} {"train_loss": -40.431026458740234, "global_step": 316586, "epoch": 2616} {"train_loss": -42.70822525024414, "global_step": 316587, "epoch": 2616} {"train_loss": -43.80379104614258, "global_step": 316588, "epoch": 2616} {"train_loss": -43.51424026489258, "global_step": 316589, "epoch": 2616} {"train_loss": -44.1880989074707, "global_step": 316590, "epoch": 2616} {"train_loss": -43.301090240478516, "global_step": 316591, "epoch": 2616} {"train_loss": -40.78082275390625, "global_step": 316592, "epoch": 2616} {"train_loss": -42.25325393676758, "global_step": 316593, "epoch": 2616} {"train_loss": -39.97144317626953, "global_step": 316594, "epoch": 2616} {"train_loss": -43.37464904785156, "global_step": 316595, "epoch": 2616} {"train_loss": -40.02899932861328, "global_step": 316596, "epoch": 2616} {"train_loss": -42.71771240234375, "global_step": 316597, "epoch": 2616} {"train_loss": -42.13711929321289, "global_step": 316598, "epoch": 2616} {"train_loss": -43.46747970581055, "global_step": 316599, "epoch": 2616} {"train_loss": -42.878597259521484, "global_step": 316600, "epoch": 2616} {"train_loss": -43.235862731933594, "global_step": 316601, "epoch": 2616} {"train_loss": -43.23633575439453, "global_step": 316602, "epoch": 2616} {"train_loss": -43.5098876953125, "global_step": 316603, "epoch": 2616} {"train_loss": -43.16429901123047, "global_step": 316604, "epoch": 2616} {"train_loss": -43.11600875854492, "global_step": 316605, "epoch": 2616} {"train_loss": -43.6728630065918, "global_step": 316606, "epoch": 2616} {"train_loss": -42.880916595458984, "global_step": 316607, "epoch": 2616} {"train_loss": -43.20675277709961, "global_step": 316608, "epoch": 2616} {"train_loss": -43.171913146972656, "global_step": 316609, "epoch": 2616} {"train_loss": -43.42660903930664, "global_step": 316610, "epoch": 2616} {"train_loss": -42.1464958190918, "global_step": 316611, "epoch": 2616} {"train_loss": -42.49892807006836, "global_step": 316612, "epoch": 2616} {"train_loss": -42.7607307434082, "global_step": 316613, "epoch": 2616} {"train_loss": -44.02778244018555, "global_step": 316614, "epoch": 2616} {"train_loss": -40.43267822265625, "global_step": 316615, "epoch": 2616} {"train_loss": -43.353919982910156, "global_step": 316616, "epoch": 2616} {"train_loss": -43.38474655151367, "global_step": 316617, "epoch": 2616} {"train_loss": -44.13819122314453, "global_step": 316618, "epoch": 2616} {"train_loss": -44.037567138671875, "global_step": 316619, "epoch": 2616} {"train_loss": -43.53657150268555, "global_step": 316620, "epoch": 2616} {"train_loss": -43.631507873535156, "global_step": 316621, "epoch": 2616} {"train_loss": -43.61579895019531, "global_step": 316622, "epoch": 2616} {"train_loss": -43.579925537109375, "global_step": 316623, "epoch": 2616} {"train_loss": -42.9870719909668, "global_step": 316624, "epoch": 2616} {"train_loss": -43.82225036621094, "global_step": 316625, "epoch": 2616} {"train_loss": -43.861114501953125, "global_step": 316626, "epoch": 2616} {"train_loss": -42.12202072143555, "global_step": 316627, "epoch": 2616} {"train_loss": -43.2999153137207, "global_step": 316628, "epoch": 2616} {"train_loss": -43.24794387817383, "global_step": 316629, "epoch": 2616} {"train_loss": -42.53975296020508, "global_step": 316630, "epoch": 2616} {"train_loss": -43.84861373901367, "global_step": 316631, "epoch": 2616} {"train_loss": -44.217010498046875, "global_step": 316632, "epoch": 2616} {"train_loss": -43.724422454833984, "global_step": 316633, "epoch": 2616} {"train_loss": -43.54458236694336, "global_step": 316634, "epoch": 2616} {"train_loss": -41.990142822265625, "global_step": 316635, "epoch": 2616} {"train_loss": -43.198814392089844, "global_step": 316636, "epoch": 2616} {"train_loss": -44.07291793823242, "global_step": 316637, "epoch": 2616} {"train_loss": -43.909767150878906, "global_step": 316638, "epoch": 2616} {"train_loss": -42.89628219604492, "global_step": 316639, "epoch": 2616} {"train_loss": -43.607364654541016, "global_step": 316640, "epoch": 2616} {"train_loss": -43.77036666870117, "global_step": 316641, "epoch": 2616} {"train_loss": -43.52417755126953, "global_step": 316642, "epoch": 2616} {"train_loss": -42.92091751098633, "global_step": 316643, "epoch": 2616} {"train_loss": -43.03744125366211, "global_step": 316644, "epoch": 2616} {"train_loss": -43.492252349853516, "global_step": 316645, "epoch": 2616} {"train_loss": -43.720821380615234, "global_step": 316646, "epoch": 2616} {"train_loss": -43.37799072265625, "global_step": 316647, "epoch": 2616} {"train_loss": -43.49917221069336, "global_step": 316648, "epoch": 2616} {"train_loss": -42.70064163208008, "global_step": 316649, "epoch": 2616} {"train_loss": -42.694862365722656, "global_step": 316650, "epoch": 2616} {"train_loss": -43.25198745727539, "global_step": 316651, "epoch": 2616} {"train_loss": -42.48108673095703, "global_step": 316652, "epoch": 2616} {"train_loss": -43.545875549316406, "global_step": 316653, "epoch": 2616} {"train_loss": -43.615657806396484, "global_step": 316654, "epoch": 2616} {"train_loss": -42.724090576171875, "global_step": 316655, "epoch": 2616} {"train_loss": -43.096098151088746, "global_step": 316656, "epoch": 2616, "val_loss": 2594851.75} {"train_loss": -43.74110794067383, "global_step": 316657, "epoch": 2617} {"train_loss": -43.43788528442383, "global_step": 316658, "epoch": 2617} {"train_loss": -42.976375579833984, "global_step": 316659, "epoch": 2617} {"train_loss": -43.04254913330078, "global_step": 316660, "epoch": 2617} {"train_loss": -43.44240951538086, "global_step": 316661, "epoch": 2617} {"train_loss": -43.87136459350586, "global_step": 316662, "epoch": 2617} {"train_loss": -43.512237548828125, "global_step": 316663, "epoch": 2617} {"train_loss": -43.736717224121094, "global_step": 316664, "epoch": 2617} {"train_loss": -43.84114456176758, "global_step": 316665, "epoch": 2617} {"train_loss": -44.11914825439453, "global_step": 316666, "epoch": 2617} {"train_loss": -44.35065841674805, "global_step": 316667, "epoch": 2617} {"train_loss": -43.354774475097656, "global_step": 316668, "epoch": 2617} {"train_loss": -44.9107551574707, "global_step": 316669, "epoch": 2617} {"train_loss": -43.080665588378906, "global_step": 316670, "epoch": 2617} {"train_loss": -42.163822174072266, "global_step": 316671, "epoch": 2617} {"train_loss": -43.77180862426758, "global_step": 316672, "epoch": 2617} {"train_loss": -41.73393630981445, "global_step": 316673, "epoch": 2617} {"train_loss": -42.52743148803711, "global_step": 316674, "epoch": 2617} {"train_loss": -44.173789978027344, "global_step": 316675, "epoch": 2617} {"train_loss": -42.640804290771484, "global_step": 316676, "epoch": 2617} {"train_loss": -41.743465423583984, "global_step": 316677, "epoch": 2617} {"train_loss": -44.2668571472168, "global_step": 316678, "epoch": 2617} {"train_loss": -43.275081634521484, "global_step": 316679, "epoch": 2617} {"train_loss": -43.874629974365234, "global_step": 316680, "epoch": 2617} {"train_loss": -42.78401565551758, "global_step": 316681, "epoch": 2617} {"train_loss": -43.664703369140625, "global_step": 316682, "epoch": 2617} {"train_loss": -43.984066009521484, "global_step": 316683, "epoch": 2617} {"train_loss": -44.04420471191406, "global_step": 316684, "epoch": 2617} {"train_loss": -43.80572509765625, "global_step": 316685, "epoch": 2617} {"train_loss": -44.673458099365234, "global_step": 316686, "epoch": 2617} {"train_loss": -43.73243713378906, "global_step": 316687, "epoch": 2617} {"train_loss": -42.50657272338867, "global_step": 316688, "epoch": 2617} {"train_loss": -43.91035461425781, "global_step": 316689, "epoch": 2617} {"train_loss": -43.65919876098633, "global_step": 316690, "epoch": 2617} {"train_loss": -44.05322265625, "global_step": 316691, "epoch": 2617} {"train_loss": -43.812068939208984, "global_step": 316692, "epoch": 2617} {"train_loss": -43.13286590576172, "global_step": 316693, "epoch": 2617} {"train_loss": -43.7768669128418, "global_step": 316694, "epoch": 2617} {"train_loss": -43.30696105957031, "global_step": 316695, "epoch": 2617} {"train_loss": -42.77239990234375, "global_step": 316696, "epoch": 2617} {"train_loss": -43.774112701416016, "global_step": 316697, "epoch": 2617} {"train_loss": -40.648155212402344, "global_step": 316698, "epoch": 2617} {"train_loss": -41.34206771850586, "global_step": 316699, "epoch": 2617} {"train_loss": -41.83753204345703, "global_step": 316700, "epoch": 2617} {"train_loss": -42.474727630615234, "global_step": 316701, "epoch": 2617} {"train_loss": -44.027565002441406, "global_step": 316702, "epoch": 2617} {"train_loss": -41.620609283447266, "global_step": 316703, "epoch": 2617} {"train_loss": -43.03859329223633, "global_step": 316704, "epoch": 2617} {"train_loss": -42.82288360595703, "global_step": 316705, "epoch": 2617} {"train_loss": -41.737247467041016, "global_step": 316706, "epoch": 2617} {"train_loss": -37.60872268676758, "global_step": 316707, "epoch": 2617} {"train_loss": -42.7095947265625, "global_step": 316708, "epoch": 2617} {"train_loss": -43.42489242553711, "global_step": 316709, "epoch": 2617} {"train_loss": -43.510765075683594, "global_step": 316710, "epoch": 2617} {"train_loss": -32.643367767333984, "global_step": 316711, "epoch": 2617} {"train_loss": -37.13346481323242, "global_step": 316712, "epoch": 2617} {"train_loss": -40.8494873046875, "global_step": 316713, "epoch": 2617} {"train_loss": -38.162349700927734, "global_step": 316714, "epoch": 2617} {"train_loss": -29.2885799407959, "global_step": 316715, "epoch": 2617} {"train_loss": 5.729323863983154, "global_step": 316716, "epoch": 2617} {"train_loss": -14.283187866210938, "global_step": 316717, "epoch": 2617} {"train_loss": -25.040578842163086, "global_step": 316718, "epoch": 2617} {"train_loss": -22.895605087280273, "global_step": 316719, "epoch": 2617} {"train_loss": -21.485645294189453, "global_step": 316720, "epoch": 2617} {"train_loss": -22.44605827331543, "global_step": 316721, "epoch": 2617} {"train_loss": -25.716699600219727, "global_step": 316722, "epoch": 2617} {"train_loss": -26.98356056213379, "global_step": 316723, "epoch": 2617} {"train_loss": -22.758270263671875, "global_step": 316724, "epoch": 2617} {"train_loss": -28.400976181030273, "global_step": 316725, "epoch": 2617} {"train_loss": -16.875736236572266, "global_step": 316726, "epoch": 2617} {"train_loss": -20.650611877441406, "global_step": 316727, "epoch": 2617} {"train_loss": -29.100616455078125, "global_step": 316728, "epoch": 2617} {"train_loss": -34.0637321472168, "global_step": 316729, "epoch": 2617} {"train_loss": -30.828161239624023, "global_step": 316730, "epoch": 2617} {"train_loss": -35.34151840209961, "global_step": 316731, "epoch": 2617} {"train_loss": -28.3626651763916, "global_step": 316732, "epoch": 2617} {"train_loss": -31.826745986938477, "global_step": 316733, "epoch": 2617} {"train_loss": -34.02227783203125, "global_step": 316734, "epoch": 2617} {"train_loss": -33.748199462890625, "global_step": 316735, "epoch": 2617} {"train_loss": -33.74650955200195, "global_step": 316736, "epoch": 2617} {"train_loss": -35.896385192871094, "global_step": 316737, "epoch": 2617} {"train_loss": -33.97905349731445, "global_step": 316738, "epoch": 2617} {"train_loss": -36.17908477783203, "global_step": 316739, "epoch": 2617} {"train_loss": -36.70557403564453, "global_step": 316740, "epoch": 2617} {"train_loss": -37.214576721191406, "global_step": 316741, "epoch": 2617} {"train_loss": -37.717201232910156, "global_step": 316742, "epoch": 2617} {"train_loss": -37.78825759887695, "global_step": 316743, "epoch": 2617} {"train_loss": -36.84502029418945, "global_step": 316744, "epoch": 2617} {"train_loss": -37.96809005737305, "global_step": 316745, "epoch": 2617} {"train_loss": -36.97088623046875, "global_step": 316746, "epoch": 2617} {"train_loss": -36.38837814331055, "global_step": 316747, "epoch": 2617} {"train_loss": -35.14841079711914, "global_step": 316748, "epoch": 2617} {"train_loss": -36.052589416503906, "global_step": 316749, "epoch": 2617} {"train_loss": -35.462772369384766, "global_step": 316750, "epoch": 2617} {"train_loss": -36.77582550048828, "global_step": 316751, "epoch": 2617} {"train_loss": -38.04209518432617, "global_step": 316752, "epoch": 2617} {"train_loss": -37.87052536010742, "global_step": 316753, "epoch": 2617} {"train_loss": -37.66432571411133, "global_step": 316754, "epoch": 2617} {"train_loss": -38.06801223754883, "global_step": 316755, "epoch": 2617} {"train_loss": -38.83512496948242, "global_step": 316756, "epoch": 2617} {"train_loss": -38.0075569152832, "global_step": 316757, "epoch": 2617} {"train_loss": -37.888607025146484, "global_step": 316758, "epoch": 2617} {"train_loss": -38.14590835571289, "global_step": 316759, "epoch": 2617} {"train_loss": -38.02524948120117, "global_step": 316760, "epoch": 2617} {"train_loss": -38.075531005859375, "global_step": 316761, "epoch": 2617} {"train_loss": -39.00069808959961, "global_step": 316762, "epoch": 2617} {"train_loss": -38.84244918823242, "global_step": 316763, "epoch": 2617} {"train_loss": -38.30113220214844, "global_step": 316764, "epoch": 2617} {"train_loss": -37.979122161865234, "global_step": 316765, "epoch": 2617} {"train_loss": -38.70545196533203, "global_step": 316766, "epoch": 2617} {"train_loss": -38.67500686645508, "global_step": 316767, "epoch": 2617} {"train_loss": -39.25164031982422, "global_step": 316768, "epoch": 2617} {"train_loss": -37.85514450073242, "global_step": 316769, "epoch": 2617} {"train_loss": -38.95445251464844, "global_step": 316770, "epoch": 2617} {"train_loss": -38.164154052734375, "global_step": 316771, "epoch": 2617} {"train_loss": -38.95418167114258, "global_step": 316772, "epoch": 2617} {"train_loss": -38.4211540222168, "global_step": 316773, "epoch": 2617} {"train_loss": -38.64936447143555, "global_step": 316774, "epoch": 2617} {"train_loss": -38.33534622192383, "global_step": 316775, "epoch": 2617} {"train_loss": -39.466796875, "global_step": 316776, "epoch": 2617} {"train_loss": -37.916563085288054, "global_step": 316777, "epoch": 2617, "val_loss": 2500763.75} {"train_loss": -38.969730377197266, "global_step": 316778, "epoch": 2618} {"train_loss": -38.97600173950195, "global_step": 316779, "epoch": 2618} {"train_loss": -39.84847640991211, "global_step": 316780, "epoch": 2618} {"train_loss": -38.7367057800293, "global_step": 316781, "epoch": 2618} {"train_loss": -39.76241683959961, "global_step": 316782, "epoch": 2618} {"train_loss": -39.45543670654297, "global_step": 316783, "epoch": 2618} {"train_loss": -39.84486770629883, "global_step": 316784, "epoch": 2618} {"train_loss": -39.733543395996094, "global_step": 316785, "epoch": 2618} {"train_loss": -39.49896240234375, "global_step": 316786, "epoch": 2618} {"train_loss": -39.885433197021484, "global_step": 316787, "epoch": 2618} {"train_loss": -40.10576248168945, "global_step": 316788, "epoch": 2618} {"train_loss": -39.679012298583984, "global_step": 316789, "epoch": 2618} {"train_loss": -39.7431640625, "global_step": 316790, "epoch": 2618} {"train_loss": -39.963966369628906, "global_step": 316791, "epoch": 2618} {"train_loss": -40.29301452636719, "global_step": 316792, "epoch": 2618} {"train_loss": -40.591670989990234, "global_step": 316793, "epoch": 2618} {"train_loss": -39.956790924072266, "global_step": 316794, "epoch": 2618} {"train_loss": -39.432987213134766, "global_step": 316795, "epoch": 2618} {"train_loss": -40.378509521484375, "global_step": 316796, "epoch": 2618} {"train_loss": -40.317161560058594, "global_step": 316797, "epoch": 2618} {"train_loss": -40.46390914916992, "global_step": 316798, "epoch": 2618} {"train_loss": -39.57925033569336, "global_step": 316799, "epoch": 2618} {"train_loss": -40.4229736328125, "global_step": 316800, "epoch": 2618} {"train_loss": -39.44951248168945, "global_step": 316801, "epoch": 2618} {"train_loss": -40.95358657836914, "global_step": 316802, "epoch": 2618} {"train_loss": -40.45814895629883, "global_step": 316803, "epoch": 2618} {"train_loss": -40.26581954956055, "global_step": 316804, "epoch": 2618} {"train_loss": -39.890716552734375, "global_step": 316805, "epoch": 2618} {"train_loss": -39.50954818725586, "global_step": 316806, "epoch": 2618} {"train_loss": -41.27901840209961, "global_step": 316807, "epoch": 2618} {"train_loss": -40.88307571411133, "global_step": 316808, "epoch": 2618} {"train_loss": -40.37009811401367, "global_step": 316809, "epoch": 2618} {"train_loss": -41.381343841552734, "global_step": 316810, "epoch": 2618} {"train_loss": -40.721858978271484, "global_step": 316811, "epoch": 2618} {"train_loss": -40.694271087646484, "global_step": 316812, "epoch": 2618} {"train_loss": -40.45016098022461, "global_step": 316813, "epoch": 2618} {"train_loss": -41.00386047363281, "global_step": 316814, "epoch": 2618} {"train_loss": -40.61307907104492, "global_step": 316815, "epoch": 2618} {"train_loss": -40.550750732421875, "global_step": 316816, "epoch": 2618} {"train_loss": -41.15460205078125, "global_step": 316817, "epoch": 2618} {"train_loss": -41.42784881591797, "global_step": 316818, "epoch": 2618} {"train_loss": -41.12934494018555, "global_step": 316819, "epoch": 2618} {"train_loss": -41.159767150878906, "global_step": 316820, "epoch": 2618} {"train_loss": -40.17626953125, "global_step": 316821, "epoch": 2618} {"train_loss": -41.18449783325195, "global_step": 316822, "epoch": 2618} {"train_loss": -40.86393356323242, "global_step": 316823, "epoch": 2618} {"train_loss": -41.28461456298828, "global_step": 316824, "epoch": 2618} {"train_loss": -40.731727600097656, "global_step": 316825, "epoch": 2618} {"train_loss": -41.25688552856445, "global_step": 316826, "epoch": 2618} {"train_loss": -41.40926742553711, "global_step": 316827, "epoch": 2618} {"train_loss": -41.77263259887695, "global_step": 316828, "epoch": 2618} {"train_loss": -41.794429779052734, "global_step": 316829, "epoch": 2618} {"train_loss": -41.2653923034668, "global_step": 316830, "epoch": 2618} {"train_loss": -41.100399017333984, "global_step": 316831, "epoch": 2618} {"train_loss": -40.79923629760742, "global_step": 316832, "epoch": 2618} {"train_loss": -40.95692825317383, "global_step": 316833, "epoch": 2618} {"train_loss": -41.85535430908203, "global_step": 316834, "epoch": 2618} {"train_loss": -41.63007354736328, "global_step": 316835, "epoch": 2618} {"train_loss": -41.315364837646484, "global_step": 316836, "epoch": 2618} {"train_loss": -41.40298080444336, "global_step": 316837, "epoch": 2618} {"train_loss": -41.564903259277344, "global_step": 316838, "epoch": 2618} {"train_loss": -40.88618087768555, "global_step": 316839, "epoch": 2618} {"train_loss": -41.38473129272461, "global_step": 316840, "epoch": 2618} {"train_loss": -41.55458068847656, "global_step": 316841, "epoch": 2618} {"train_loss": -41.54862976074219, "global_step": 316842, "epoch": 2618} {"train_loss": -41.6729850769043, "global_step": 316843, "epoch": 2618} {"train_loss": -41.60920333862305, "global_step": 316844, "epoch": 2618} {"train_loss": -41.98698806762695, "global_step": 316845, "epoch": 2618} {"train_loss": -42.61027526855469, "global_step": 316846, "epoch": 2618} {"train_loss": -42.09544372558594, "global_step": 316847, "epoch": 2618} {"train_loss": -41.79450225830078, "global_step": 316848, "epoch": 2618} {"train_loss": -42.27561569213867, "global_step": 316849, "epoch": 2618} {"train_loss": -41.60253143310547, "global_step": 316850, "epoch": 2618} {"train_loss": -41.5188102722168, "global_step": 316851, "epoch": 2618} {"train_loss": -41.68983840942383, "global_step": 316852, "epoch": 2618} {"train_loss": -42.20835876464844, "global_step": 316853, "epoch": 2618} {"train_loss": -41.70327377319336, "global_step": 316854, "epoch": 2618} {"train_loss": -42.17368698120117, "global_step": 316855, "epoch": 2618} {"train_loss": -42.467620849609375, "global_step": 316856, "epoch": 2618} {"train_loss": -42.447479248046875, "global_step": 316857, "epoch": 2618} {"train_loss": -41.27925491333008, "global_step": 316858, "epoch": 2618} {"train_loss": -41.87104034423828, "global_step": 316859, "epoch": 2618} {"train_loss": -42.16334915161133, "global_step": 316860, "epoch": 2618} {"train_loss": -42.3714599609375, "global_step": 316861, "epoch": 2618} {"train_loss": -41.74553298950195, "global_step": 316862, "epoch": 2618} {"train_loss": -41.95609664916992, "global_step": 316863, "epoch": 2618} {"train_loss": -42.48067092895508, "global_step": 316864, "epoch": 2618} {"train_loss": -41.69959259033203, "global_step": 316865, "epoch": 2618} {"train_loss": -42.17744827270508, "global_step": 316866, "epoch": 2618} {"train_loss": -41.91483688354492, "global_step": 316867, "epoch": 2618} {"train_loss": -42.92619705200195, "global_step": 316868, "epoch": 2618} {"train_loss": -42.692630767822266, "global_step": 316869, "epoch": 2618} {"train_loss": -42.21302795410156, "global_step": 316870, "epoch": 2618} {"train_loss": -42.229835510253906, "global_step": 316871, "epoch": 2618} {"train_loss": -43.15346908569336, "global_step": 316872, "epoch": 2618} {"train_loss": -42.84946823120117, "global_step": 316873, "epoch": 2618} {"train_loss": -42.15792465209961, "global_step": 316874, "epoch": 2618} {"train_loss": -41.82524490356445, "global_step": 316875, "epoch": 2618} {"train_loss": -42.15426254272461, "global_step": 316876, "epoch": 2618} {"train_loss": -42.39591979980469, "global_step": 316877, "epoch": 2618} {"train_loss": -42.35596466064453, "global_step": 316878, "epoch": 2618} {"train_loss": -42.07941818237305, "global_step": 316879, "epoch": 2618} {"train_loss": -41.87321853637695, "global_step": 316880, "epoch": 2618} {"train_loss": -42.69761276245117, "global_step": 316881, "epoch": 2618} {"train_loss": -42.65279769897461, "global_step": 316882, "epoch": 2618} {"train_loss": -42.95635223388672, "global_step": 316883, "epoch": 2618} {"train_loss": -42.77650833129883, "global_step": 316884, "epoch": 2618} {"train_loss": -41.91331100463867, "global_step": 316885, "epoch": 2618} {"train_loss": -42.34141540527344, "global_step": 316886, "epoch": 2618} {"train_loss": -42.12075424194336, "global_step": 316887, "epoch": 2618} {"train_loss": -42.445648193359375, "global_step": 316888, "epoch": 2618} {"train_loss": -42.80561447143555, "global_step": 316889, "epoch": 2618} {"train_loss": -42.34700393676758, "global_step": 316890, "epoch": 2618} {"train_loss": -42.312652587890625, "global_step": 316891, "epoch": 2618} {"train_loss": -42.988224029541016, "global_step": 316892, "epoch": 2618} {"train_loss": -43.24162292480469, "global_step": 316893, "epoch": 2618} {"train_loss": -42.01264572143555, "global_step": 316894, "epoch": 2618} {"train_loss": -42.63056182861328, "global_step": 316895, "epoch": 2618} {"train_loss": -43.00120162963867, "global_step": 316896, "epoch": 2618} {"train_loss": -42.97159957885742, "global_step": 316897, "epoch": 2618} {"train_loss": -41.36003298798868, "global_step": 316898, "epoch": 2618, "val_loss": 2537069.25} {"train_loss": -42.59925079345703, "global_step": 316899, "epoch": 2619} {"train_loss": -43.019325256347656, "global_step": 316900, "epoch": 2619} {"train_loss": -42.136199951171875, "global_step": 316901, "epoch": 2619} {"train_loss": -43.3564453125, "global_step": 316902, "epoch": 2619} {"train_loss": -42.95991897583008, "global_step": 316903, "epoch": 2619} {"train_loss": -43.877498626708984, "global_step": 316904, "epoch": 2619} {"train_loss": -43.444210052490234, "global_step": 316905, "epoch": 2619} {"train_loss": -43.24333572387695, "global_step": 316906, "epoch": 2619} {"train_loss": -42.65793991088867, "global_step": 316907, "epoch": 2619} {"train_loss": -42.936431884765625, "global_step": 316908, "epoch": 2619} {"train_loss": -43.3091926574707, "global_step": 316909, "epoch": 2619} {"train_loss": -43.07161331176758, "global_step": 316910, "epoch": 2619} {"train_loss": -43.0267333984375, "global_step": 316911, "epoch": 2619} {"train_loss": -44.07905578613281, "global_step": 316912, "epoch": 2619} {"train_loss": -43.03118896484375, "global_step": 316913, "epoch": 2619} {"train_loss": -43.36321258544922, "global_step": 316914, "epoch": 2619} {"train_loss": -42.916385650634766, "global_step": 316915, "epoch": 2619} {"train_loss": -42.40434646606445, "global_step": 316916, "epoch": 2619} {"train_loss": -43.845027923583984, "global_step": 316917, "epoch": 2619} {"train_loss": -42.756710052490234, "global_step": 316918, "epoch": 2619} {"train_loss": -42.96486282348633, "global_step": 316919, "epoch": 2619} {"train_loss": -43.32882308959961, "global_step": 316920, "epoch": 2619} {"train_loss": -42.3661994934082, "global_step": 316921, "epoch": 2619} {"train_loss": -43.1467399597168, "global_step": 316922, "epoch": 2619} {"train_loss": -43.48127365112305, "global_step": 316923, "epoch": 2619} {"train_loss": -43.229427337646484, "global_step": 316924, "epoch": 2619} {"train_loss": -43.93785858154297, "global_step": 316925, "epoch": 2619} {"train_loss": -43.4697265625, "global_step": 316926, "epoch": 2619} {"train_loss": -43.55629348754883, "global_step": 316927, "epoch": 2619} {"train_loss": -42.95722198486328, "global_step": 316928, "epoch": 2619} {"train_loss": -42.51441955566406, "global_step": 316929, "epoch": 2619} {"train_loss": -42.40363693237305, "global_step": 316930, "epoch": 2619} {"train_loss": -43.12820053100586, "global_step": 316931, "epoch": 2619} {"train_loss": -43.623104095458984, "global_step": 316932, "epoch": 2619} {"train_loss": -43.24247360229492, "global_step": 316933, "epoch": 2619} {"train_loss": -42.78082275390625, "global_step": 316934, "epoch": 2619} {"train_loss": -43.0907096862793, "global_step": 316935, "epoch": 2619} {"train_loss": -43.24201583862305, "global_step": 316936, "epoch": 2619} {"train_loss": -43.69772720336914, "global_step": 316937, "epoch": 2619} {"train_loss": -42.849422454833984, "global_step": 316938, "epoch": 2619} {"train_loss": -43.06073760986328, "global_step": 316939, "epoch": 2619} {"train_loss": -42.39609909057617, "global_step": 316940, "epoch": 2619} {"train_loss": -43.58590316772461, "global_step": 316941, "epoch": 2619} {"train_loss": -43.31565475463867, "global_step": 316942, "epoch": 2619} {"train_loss": -42.96290969848633, "global_step": 316943, "epoch": 2619} {"train_loss": -42.27855682373047, "global_step": 316944, "epoch": 2619} {"train_loss": -42.03925323486328, "global_step": 316945, "epoch": 2619} {"train_loss": -42.9564208984375, "global_step": 316946, "epoch": 2619} {"train_loss": -43.03944396972656, "global_step": 316947, "epoch": 2619} {"train_loss": -42.539737701416016, "global_step": 316948, "epoch": 2619} {"train_loss": -43.82255172729492, "global_step": 316949, "epoch": 2619} {"train_loss": -43.47310256958008, "global_step": 316950, "epoch": 2619} {"train_loss": -43.34792709350586, "global_step": 316951, "epoch": 2619} {"train_loss": -40.3271369934082, "global_step": 316952, "epoch": 2619} {"train_loss": -41.897705078125, "global_step": 316953, "epoch": 2619} {"train_loss": -42.05670166015625, "global_step": 316954, "epoch": 2619} {"train_loss": -42.41946029663086, "global_step": 316955, "epoch": 2619} {"train_loss": -41.50175094604492, "global_step": 316956, "epoch": 2619} {"train_loss": -41.01789474487305, "global_step": 316957, "epoch": 2619} {"train_loss": -41.23354721069336, "global_step": 316958, "epoch": 2619} {"train_loss": -42.94770431518555, "global_step": 316959, "epoch": 2619} {"train_loss": -39.4027099609375, "global_step": 316960, "epoch": 2619} {"train_loss": -41.18989944458008, "global_step": 316961, "epoch": 2619} {"train_loss": -43.578792572021484, "global_step": 316962, "epoch": 2619} {"train_loss": -42.0810546875, "global_step": 316963, "epoch": 2619} {"train_loss": -38.55765914916992, "global_step": 316964, "epoch": 2619} {"train_loss": -43.06605911254883, "global_step": 316965, "epoch": 2619} {"train_loss": -41.73063278198242, "global_step": 316966, "epoch": 2619} {"train_loss": -40.33234786987305, "global_step": 316967, "epoch": 2619} {"train_loss": -42.818321228027344, "global_step": 316968, "epoch": 2619} {"train_loss": -42.47719955444336, "global_step": 316969, "epoch": 2619} {"train_loss": -41.7181396484375, "global_step": 316970, "epoch": 2619} {"train_loss": -41.8584098815918, "global_step": 316971, "epoch": 2619} {"train_loss": -42.93634796142578, "global_step": 316972, "epoch": 2619} {"train_loss": -40.78610610961914, "global_step": 316973, "epoch": 2619} {"train_loss": -42.440101623535156, "global_step": 316974, "epoch": 2619} {"train_loss": -42.482208251953125, "global_step": 316975, "epoch": 2619} {"train_loss": -42.74900436401367, "global_step": 316976, "epoch": 2619} {"train_loss": -42.4583854675293, "global_step": 316977, "epoch": 2619} {"train_loss": -41.71229553222656, "global_step": 316978, "epoch": 2619} {"train_loss": -41.51606369018555, "global_step": 316979, "epoch": 2619} {"train_loss": -42.0882682800293, "global_step": 316980, "epoch": 2619} {"train_loss": -42.916385650634766, "global_step": 316981, "epoch": 2619} {"train_loss": -42.60291290283203, "global_step": 316982, "epoch": 2619} {"train_loss": -41.601253509521484, "global_step": 316983, "epoch": 2619} {"train_loss": -42.59871292114258, "global_step": 316984, "epoch": 2619} {"train_loss": -42.38972854614258, "global_step": 316985, "epoch": 2619} {"train_loss": -42.38105010986328, "global_step": 316986, "epoch": 2619} {"train_loss": -43.14431381225586, "global_step": 316987, "epoch": 2619} {"train_loss": -43.13206100463867, "global_step": 316988, "epoch": 2619} {"train_loss": -42.690643310546875, "global_step": 316989, "epoch": 2619} {"train_loss": -43.27034378051758, "global_step": 316990, "epoch": 2619} {"train_loss": -42.35560989379883, "global_step": 316991, "epoch": 2619} {"train_loss": -43.38130187988281, "global_step": 316992, "epoch": 2619} {"train_loss": -43.51064682006836, "global_step": 316993, "epoch": 2619} {"train_loss": -42.75486373901367, "global_step": 316994, "epoch": 2619} {"train_loss": -43.48921585083008, "global_step": 316995, "epoch": 2619} {"train_loss": -43.43312454223633, "global_step": 316996, "epoch": 2619} {"train_loss": -43.370704650878906, "global_step": 316997, "epoch": 2619} {"train_loss": -43.64458084106445, "global_step": 316998, "epoch": 2619} {"train_loss": -43.50982666015625, "global_step": 316999, "epoch": 2619} {"train_loss": -43.06160354614258, "global_step": 317000, "epoch": 2619} {"train_loss": -42.19349670410156, "global_step": 317001, "epoch": 2619} {"train_loss": -43.02554702758789, "global_step": 317002, "epoch": 2619} {"train_loss": -43.016353607177734, "global_step": 317003, "epoch": 2619} {"train_loss": -43.42461395263672, "global_step": 317004, "epoch": 2619} {"train_loss": -43.034908294677734, "global_step": 317005, "epoch": 2619} {"train_loss": -42.661617279052734, "global_step": 317006, "epoch": 2619} {"train_loss": -43.14614486694336, "global_step": 317007, "epoch": 2619} {"train_loss": -42.657196044921875, "global_step": 317008, "epoch": 2619} {"train_loss": -42.82607650756836, "global_step": 317009, "epoch": 2619} {"train_loss": -42.79392623901367, "global_step": 317010, "epoch": 2619} {"train_loss": -43.01261520385742, "global_step": 317011, "epoch": 2619} {"train_loss": -43.179744720458984, "global_step": 317012, "epoch": 2619} {"train_loss": -43.61933898925781, "global_step": 317013, "epoch": 2619} {"train_loss": -43.45962142944336, "global_step": 317014, "epoch": 2619} {"train_loss": -43.67153549194336, "global_step": 317015, "epoch": 2619} {"train_loss": -43.38775634765625, "global_step": 317016, "epoch": 2619} {"train_loss": -43.56610870361328, "global_step": 317017, "epoch": 2619} {"train_loss": -43.298641204833984, "global_step": 317018, "epoch": 2619} {"train_loss": -42.75656175219323, "global_step": 317019, "epoch": 2619, "val_loss": 2494827.25} {"train_loss": -43.20528793334961, "global_step": 317020, "epoch": 2620} {"train_loss": -43.6432991027832, "global_step": 317021, "epoch": 2620} {"train_loss": -42.79777526855469, "global_step": 317022, "epoch": 2620} {"train_loss": -43.39234161376953, "global_step": 317023, "epoch": 2620} {"train_loss": -41.43183517456055, "global_step": 317024, "epoch": 2620} {"train_loss": -40.7533073425293, "global_step": 317025, "epoch": 2620} {"train_loss": -42.72300720214844, "global_step": 317026, "epoch": 2620} {"train_loss": -41.7314567565918, "global_step": 317027, "epoch": 2620} {"train_loss": -39.262508392333984, "global_step": 317028, "epoch": 2620} {"train_loss": -42.20705795288086, "global_step": 317029, "epoch": 2620} {"train_loss": -41.851802825927734, "global_step": 317030, "epoch": 2620} {"train_loss": -41.39472198486328, "global_step": 317031, "epoch": 2620} {"train_loss": -43.08144760131836, "global_step": 317032, "epoch": 2620} {"train_loss": -41.04105758666992, "global_step": 317033, "epoch": 2620} {"train_loss": -42.845516204833984, "global_step": 317034, "epoch": 2620} {"train_loss": -42.568111419677734, "global_step": 317035, "epoch": 2620} {"train_loss": -41.68345260620117, "global_step": 317036, "epoch": 2620} {"train_loss": -42.13786697387695, "global_step": 317037, "epoch": 2620} {"train_loss": -42.08318328857422, "global_step": 317038, "epoch": 2620} {"train_loss": -43.26321029663086, "global_step": 317039, "epoch": 2620} {"train_loss": -42.54328536987305, "global_step": 317040, "epoch": 2620} {"train_loss": -42.0575065612793, "global_step": 317041, "epoch": 2620} {"train_loss": -42.89506149291992, "global_step": 317042, "epoch": 2620} {"train_loss": -42.01656723022461, "global_step": 317043, "epoch": 2620} {"train_loss": -42.48273849487305, "global_step": 317044, "epoch": 2620} {"train_loss": -43.6643180847168, "global_step": 317045, "epoch": 2620} {"train_loss": -43.063411712646484, "global_step": 317046, "epoch": 2620} {"train_loss": -42.4293327331543, "global_step": 317047, "epoch": 2620} {"train_loss": -43.45362091064453, "global_step": 317048, "epoch": 2620} {"train_loss": -42.7487907409668, "global_step": 317049, "epoch": 2620} {"train_loss": -43.195064544677734, "global_step": 317050, "epoch": 2620} {"train_loss": -43.5421142578125, "global_step": 317051, "epoch": 2620} {"train_loss": -43.47041320800781, "global_step": 317052, "epoch": 2620} {"train_loss": -43.583343505859375, "global_step": 317053, "epoch": 2620} {"train_loss": -43.11899948120117, "global_step": 317054, "epoch": 2620} {"train_loss": -43.67155075073242, "global_step": 317055, "epoch": 2620} {"train_loss": -43.90579605102539, "global_step": 317056, "epoch": 2620} {"train_loss": -43.56611251831055, "global_step": 317057, "epoch": 2620} {"train_loss": -44.28475570678711, "global_step": 317058, "epoch": 2620} {"train_loss": -43.44404220581055, "global_step": 317059, "epoch": 2620} {"train_loss": -43.34273147583008, "global_step": 317060, "epoch": 2620} {"train_loss": -43.092994689941406, "global_step": 317061, "epoch": 2620} {"train_loss": -43.35089874267578, "global_step": 317062, "epoch": 2620} {"train_loss": -43.71476364135742, "global_step": 317063, "epoch": 2620} {"train_loss": -44.27275466918945, "global_step": 317064, "epoch": 2620} {"train_loss": -44.13262939453125, "global_step": 317065, "epoch": 2620} {"train_loss": -43.97372055053711, "global_step": 317066, "epoch": 2620} {"train_loss": -44.237056732177734, "global_step": 317067, "epoch": 2620} {"train_loss": -43.55527877807617, "global_step": 317068, "epoch": 2620} {"train_loss": -43.957672119140625, "global_step": 317069, "epoch": 2620} {"train_loss": -43.25381851196289, "global_step": 317070, "epoch": 2620} {"train_loss": -44.048736572265625, "global_step": 317071, "epoch": 2620} {"train_loss": -44.593780517578125, "global_step": 317072, "epoch": 2620} {"train_loss": -43.7818603515625, "global_step": 317073, "epoch": 2620} {"train_loss": -44.41437911987305, "global_step": 317074, "epoch": 2620} {"train_loss": -43.74123001098633, "global_step": 317075, "epoch": 2620} {"train_loss": -43.757137298583984, "global_step": 317076, "epoch": 2620} {"train_loss": -42.4983024597168, "global_step": 317077, "epoch": 2620} {"train_loss": -43.96767807006836, "global_step": 317078, "epoch": 2620} {"train_loss": -43.73026657104492, "global_step": 317079, "epoch": 2620} {"train_loss": -42.85817337036133, "global_step": 317080, "epoch": 2620} {"train_loss": -43.37697982788086, "global_step": 317081, "epoch": 2620} {"train_loss": -43.489295959472656, "global_step": 317082, "epoch": 2620} {"train_loss": -43.525054931640625, "global_step": 317083, "epoch": 2620} {"train_loss": -44.00442123413086, "global_step": 317084, "epoch": 2620} {"train_loss": -43.92232131958008, "global_step": 317085, "epoch": 2620} {"train_loss": -43.1077766418457, "global_step": 317086, "epoch": 2620} {"train_loss": -43.28853988647461, "global_step": 317087, "epoch": 2620} {"train_loss": -43.05964279174805, "global_step": 317088, "epoch": 2620} {"train_loss": -42.6754150390625, "global_step": 317089, "epoch": 2620} {"train_loss": -40.63816452026367, "global_step": 317090, "epoch": 2620} {"train_loss": -41.461944580078125, "global_step": 317091, "epoch": 2620} {"train_loss": -42.066768646240234, "global_step": 317092, "epoch": 2620} {"train_loss": -43.759857177734375, "global_step": 317093, "epoch": 2620} {"train_loss": -43.7154655456543, "global_step": 317094, "epoch": 2620} {"train_loss": -42.93874740600586, "global_step": 317095, "epoch": 2620} {"train_loss": -41.74217987060547, "global_step": 317096, "epoch": 2620} {"train_loss": -43.60715866088867, "global_step": 317097, "epoch": 2620} {"train_loss": -42.813472747802734, "global_step": 317098, "epoch": 2620} {"train_loss": -42.84736251831055, "global_step": 317099, "epoch": 2620} {"train_loss": -41.838348388671875, "global_step": 317100, "epoch": 2620} {"train_loss": -43.95415115356445, "global_step": 317101, "epoch": 2620} {"train_loss": -42.796356201171875, "global_step": 317102, "epoch": 2620} {"train_loss": -43.002967834472656, "global_step": 317103, "epoch": 2620} {"train_loss": -44.055538177490234, "global_step": 317104, "epoch": 2620} {"train_loss": -43.448307037353516, "global_step": 317105, "epoch": 2620} {"train_loss": -43.89535140991211, "global_step": 317106, "epoch": 2620} {"train_loss": -43.68489456176758, "global_step": 317107, "epoch": 2620} {"train_loss": -43.89582443237305, "global_step": 317108, "epoch": 2620} {"train_loss": -43.546836853027344, "global_step": 317109, "epoch": 2620} {"train_loss": -42.6547966003418, "global_step": 317110, "epoch": 2620} {"train_loss": -43.16730880737305, "global_step": 317111, "epoch": 2620} {"train_loss": -43.49724197387695, "global_step": 317112, "epoch": 2620} {"train_loss": -42.65790939331055, "global_step": 317113, "epoch": 2620} {"train_loss": -43.4351921081543, "global_step": 317114, "epoch": 2620} {"train_loss": -43.962310791015625, "global_step": 317115, "epoch": 2620} {"train_loss": -43.680965423583984, "global_step": 317116, "epoch": 2620} {"train_loss": -43.059295654296875, "global_step": 317117, "epoch": 2620} {"train_loss": -43.00202560424805, "global_step": 317118, "epoch": 2620} {"train_loss": -42.967220306396484, "global_step": 317119, "epoch": 2620} {"train_loss": -42.699562072753906, "global_step": 317120, "epoch": 2620} {"train_loss": -44.17115783691406, "global_step": 317121, "epoch": 2620} {"train_loss": -43.40617752075195, "global_step": 317122, "epoch": 2620} {"train_loss": -44.16874694824219, "global_step": 317123, "epoch": 2620} {"train_loss": -43.065345764160156, "global_step": 317124, "epoch": 2620} {"train_loss": -43.110816955566406, "global_step": 317125, "epoch": 2620} {"train_loss": -43.246498107910156, "global_step": 317126, "epoch": 2620} {"train_loss": -42.856990814208984, "global_step": 317127, "epoch": 2620} {"train_loss": -43.25117111206055, "global_step": 317128, "epoch": 2620} {"train_loss": -42.748958587646484, "global_step": 317129, "epoch": 2620} {"train_loss": -43.18806838989258, "global_step": 317130, "epoch": 2620} {"train_loss": -42.00200271606445, "global_step": 317131, "epoch": 2620} {"train_loss": -43.279876708984375, "global_step": 317132, "epoch": 2620} {"train_loss": -43.083309173583984, "global_step": 317133, "epoch": 2620} {"train_loss": -43.28178024291992, "global_step": 317134, "epoch": 2620} {"train_loss": -42.67045593261719, "global_step": 317135, "epoch": 2620} {"train_loss": -42.708126068115234, "global_step": 317136, "epoch": 2620} {"train_loss": -41.97285079956055, "global_step": 317137, "epoch": 2620} {"train_loss": -43.99155807495117, "global_step": 317138, "epoch": 2620} {"train_loss": -43.120628356933594, "global_step": 317139, "epoch": 2620} {"train_loss": -43.072885150751794, "global_step": 317140, "epoch": 2620, "val_loss": 2536086.0} {"train_loss": -43.2873420715332, "global_step": 317141, "epoch": 2621} {"train_loss": -42.93845748901367, "global_step": 317142, "epoch": 2621} {"train_loss": -42.754737854003906, "global_step": 317143, "epoch": 2621} {"train_loss": -41.35227584838867, "global_step": 317144, "epoch": 2621} {"train_loss": -42.08912658691406, "global_step": 317145, "epoch": 2621} {"train_loss": -43.3088493347168, "global_step": 317146, "epoch": 2621} {"train_loss": -42.697235107421875, "global_step": 317147, "epoch": 2621} {"train_loss": -41.9659423828125, "global_step": 317148, "epoch": 2621} {"train_loss": -42.04929733276367, "global_step": 317149, "epoch": 2621} {"train_loss": -42.04582595825195, "global_step": 317150, "epoch": 2621} {"train_loss": -41.7931022644043, "global_step": 317151, "epoch": 2621} {"train_loss": -41.82432174682617, "global_step": 317152, "epoch": 2621} {"train_loss": -41.701454162597656, "global_step": 317153, "epoch": 2621} {"train_loss": -41.141292572021484, "global_step": 317154, "epoch": 2621} {"train_loss": -41.471378326416016, "global_step": 317155, "epoch": 2621} {"train_loss": -41.56779861450195, "global_step": 317156, "epoch": 2621} {"train_loss": -41.750038146972656, "global_step": 317157, "epoch": 2621} {"train_loss": -41.826759338378906, "global_step": 317158, "epoch": 2621} {"train_loss": -41.23713684082031, "global_step": 317159, "epoch": 2621} {"train_loss": -40.85572052001953, "global_step": 317160, "epoch": 2621} {"train_loss": -42.222042083740234, "global_step": 317161, "epoch": 2621} {"train_loss": -43.615394592285156, "global_step": 317162, "epoch": 2621} {"train_loss": -42.532188415527344, "global_step": 317163, "epoch": 2621} {"train_loss": -42.61252975463867, "global_step": 317164, "epoch": 2621} {"train_loss": -43.99748992919922, "global_step": 317165, "epoch": 2621} {"train_loss": -42.16349792480469, "global_step": 317166, "epoch": 2621} {"train_loss": -43.74076461791992, "global_step": 317167, "epoch": 2621} {"train_loss": -43.826988220214844, "global_step": 317168, "epoch": 2621} {"train_loss": -42.99579620361328, "global_step": 317169, "epoch": 2621} {"train_loss": -42.73998260498047, "global_step": 317170, "epoch": 2621} {"train_loss": -43.19569396972656, "global_step": 317171, "epoch": 2621} {"train_loss": -43.33613586425781, "global_step": 317172, "epoch": 2621} {"train_loss": -43.33346176147461, "global_step": 317173, "epoch": 2621} {"train_loss": -43.347198486328125, "global_step": 317174, "epoch": 2621} {"train_loss": -42.73661422729492, "global_step": 317175, "epoch": 2621} {"train_loss": -43.25444412231445, "global_step": 317176, "epoch": 2621} {"train_loss": -44.11591339111328, "global_step": 317177, "epoch": 2621} {"train_loss": -43.1978874206543, "global_step": 317178, "epoch": 2621} {"train_loss": -42.52753829956055, "global_step": 317179, "epoch": 2621} {"train_loss": -43.977752685546875, "global_step": 317180, "epoch": 2621} {"train_loss": -42.8380012512207, "global_step": 317181, "epoch": 2621} {"train_loss": -43.667625427246094, "global_step": 317182, "epoch": 2621} {"train_loss": -42.862918853759766, "global_step": 317183, "epoch": 2621} {"train_loss": -41.58502960205078, "global_step": 317184, "epoch": 2621} {"train_loss": -43.01751708984375, "global_step": 317185, "epoch": 2621} {"train_loss": -42.3852653503418, "global_step": 317186, "epoch": 2621} {"train_loss": -42.77410125732422, "global_step": 317187, "epoch": 2621} {"train_loss": -43.721435546875, "global_step": 317188, "epoch": 2621} {"train_loss": -42.7179069519043, "global_step": 317189, "epoch": 2621} {"train_loss": -43.74355697631836, "global_step": 317190, "epoch": 2621} {"train_loss": -42.15032958984375, "global_step": 317191, "epoch": 2621} {"train_loss": -42.74771499633789, "global_step": 317192, "epoch": 2621} {"train_loss": -43.122493743896484, "global_step": 317193, "epoch": 2621} {"train_loss": -42.46208572387695, "global_step": 317194, "epoch": 2621} {"train_loss": -43.28534698486328, "global_step": 317195, "epoch": 2621} {"train_loss": -41.877235412597656, "global_step": 317196, "epoch": 2621} {"train_loss": -43.069854736328125, "global_step": 317197, "epoch": 2621} {"train_loss": -44.168148040771484, "global_step": 317198, "epoch": 2621} {"train_loss": -41.9439697265625, "global_step": 317199, "epoch": 2621} {"train_loss": -43.31395721435547, "global_step": 317200, "epoch": 2621} {"train_loss": -43.53823471069336, "global_step": 317201, "epoch": 2621} {"train_loss": -42.270118713378906, "global_step": 317202, "epoch": 2621} {"train_loss": -43.60147476196289, "global_step": 317203, "epoch": 2621} {"train_loss": -43.490821838378906, "global_step": 317204, "epoch": 2621} {"train_loss": -43.5265007019043, "global_step": 317205, "epoch": 2621} {"train_loss": -43.483943939208984, "global_step": 317206, "epoch": 2621} {"train_loss": -43.42864990234375, "global_step": 317207, "epoch": 2621} {"train_loss": -43.51877975463867, "global_step": 317208, "epoch": 2621} {"train_loss": -43.47771072387695, "global_step": 317209, "epoch": 2621} {"train_loss": -43.64259338378906, "global_step": 317210, "epoch": 2621} {"train_loss": -43.50587844848633, "global_step": 317211, "epoch": 2621} {"train_loss": -43.5467643737793, "global_step": 317212, "epoch": 2621} {"train_loss": -43.75480270385742, "global_step": 317213, "epoch": 2621} {"train_loss": -42.7940788269043, "global_step": 317214, "epoch": 2621} {"train_loss": -43.510765075683594, "global_step": 317215, "epoch": 2621} {"train_loss": -41.57342529296875, "global_step": 317216, "epoch": 2621} {"train_loss": -42.847328186035156, "global_step": 317217, "epoch": 2621} {"train_loss": -43.93629837036133, "global_step": 317218, "epoch": 2621} {"train_loss": -42.61350631713867, "global_step": 317219, "epoch": 2621} {"train_loss": -44.44771194458008, "global_step": 317220, "epoch": 2621} {"train_loss": -44.011993408203125, "global_step": 317221, "epoch": 2621} {"train_loss": -43.71079635620117, "global_step": 317222, "epoch": 2621} {"train_loss": -42.912628173828125, "global_step": 317223, "epoch": 2621} {"train_loss": -44.06934356689453, "global_step": 317224, "epoch": 2621} {"train_loss": -44.0109977722168, "global_step": 317225, "epoch": 2621} {"train_loss": -43.119300842285156, "global_step": 317226, "epoch": 2621} {"train_loss": -44.109840393066406, "global_step": 317227, "epoch": 2621} {"train_loss": -43.9090461730957, "global_step": 317228, "epoch": 2621} {"train_loss": -42.54839324951172, "global_step": 317229, "epoch": 2621} {"train_loss": -43.419288635253906, "global_step": 317230, "epoch": 2621} {"train_loss": -43.877681732177734, "global_step": 317231, "epoch": 2621} {"train_loss": -41.589962005615234, "global_step": 317232, "epoch": 2621} {"train_loss": -42.673004150390625, "global_step": 317233, "epoch": 2621} {"train_loss": -43.849910736083984, "global_step": 317234, "epoch": 2621} {"train_loss": -42.376312255859375, "global_step": 317235, "epoch": 2621} {"train_loss": -43.30059814453125, "global_step": 317236, "epoch": 2621} {"train_loss": -42.7035026550293, "global_step": 317237, "epoch": 2621} {"train_loss": -42.12038040161133, "global_step": 317238, "epoch": 2621} {"train_loss": -41.99917221069336, "global_step": 317239, "epoch": 2621} {"train_loss": -43.61659622192383, "global_step": 317240, "epoch": 2621} {"train_loss": -41.566585540771484, "global_step": 317241, "epoch": 2621} {"train_loss": -39.64754104614258, "global_step": 317242, "epoch": 2621} {"train_loss": -44.04118728637695, "global_step": 317243, "epoch": 2621} {"train_loss": -40.85149002075195, "global_step": 317244, "epoch": 2621} {"train_loss": -41.94657516479492, "global_step": 317245, "epoch": 2621} {"train_loss": -43.2431755065918, "global_step": 317246, "epoch": 2621} {"train_loss": -39.697120666503906, "global_step": 317247, "epoch": 2621} {"train_loss": -38.22158432006836, "global_step": 317248, "epoch": 2621} {"train_loss": -42.04299545288086, "global_step": 317249, "epoch": 2621} {"train_loss": -41.31020736694336, "global_step": 317250, "epoch": 2621} {"train_loss": -42.03739547729492, "global_step": 317251, "epoch": 2621} {"train_loss": -40.08584213256836, "global_step": 317252, "epoch": 2621} {"train_loss": -39.62800979614258, "global_step": 317253, "epoch": 2621} {"train_loss": -40.65366744995117, "global_step": 317254, "epoch": 2621} {"train_loss": -41.03916549682617, "global_step": 317255, "epoch": 2621} {"train_loss": -41.67664337158203, "global_step": 317256, "epoch": 2621} {"train_loss": -41.44947052001953, "global_step": 317257, "epoch": 2621} {"train_loss": -40.6753044128418, "global_step": 317258, "epoch": 2621} {"train_loss": -42.432884216308594, "global_step": 317259, "epoch": 2621} {"train_loss": -40.322757720947266, "global_step": 317260, "epoch": 2621} {"train_loss": -42.61276078027142, "global_step": 317261, "epoch": 2621, "val_loss": 2527075.25} {"train_loss": -41.95937728881836, "global_step": 317262, "epoch": 2622} {"train_loss": -42.272640228271484, "global_step": 317263, "epoch": 2622} {"train_loss": -43.09839630126953, "global_step": 317264, "epoch": 2622} {"train_loss": -42.45682907104492, "global_step": 317265, "epoch": 2622} {"train_loss": -41.5738525390625, "global_step": 317266, "epoch": 2622} {"train_loss": -42.945064544677734, "global_step": 317267, "epoch": 2622} {"train_loss": -42.94734573364258, "global_step": 317268, "epoch": 2622} {"train_loss": -42.200042724609375, "global_step": 317269, "epoch": 2622} {"train_loss": -43.27893829345703, "global_step": 317270, "epoch": 2622} {"train_loss": -43.094356536865234, "global_step": 317271, "epoch": 2622} {"train_loss": -41.45024490356445, "global_step": 317272, "epoch": 2622} {"train_loss": -41.41726303100586, "global_step": 317273, "epoch": 2622} {"train_loss": -42.98604202270508, "global_step": 317274, "epoch": 2622} {"train_loss": -43.08617401123047, "global_step": 317275, "epoch": 2622} {"train_loss": -43.508750915527344, "global_step": 317276, "epoch": 2622} {"train_loss": -43.09354782104492, "global_step": 317277, "epoch": 2622} {"train_loss": -43.555660247802734, "global_step": 317278, "epoch": 2622} {"train_loss": -43.600135803222656, "global_step": 317279, "epoch": 2622} {"train_loss": -43.863033294677734, "global_step": 317280, "epoch": 2622} {"train_loss": -42.328182220458984, "global_step": 317281, "epoch": 2622} {"train_loss": -43.56809616088867, "global_step": 317282, "epoch": 2622} {"train_loss": -43.5791130065918, "global_step": 317283, "epoch": 2622} {"train_loss": -43.386383056640625, "global_step": 317284, "epoch": 2622} {"train_loss": -43.79261779785156, "global_step": 317285, "epoch": 2622} {"train_loss": -42.24538040161133, "global_step": 317286, "epoch": 2622} {"train_loss": -44.22441482543945, "global_step": 317287, "epoch": 2622} {"train_loss": -42.98442459106445, "global_step": 317288, "epoch": 2622} {"train_loss": -43.94380187988281, "global_step": 317289, "epoch": 2622} {"train_loss": -43.37177276611328, "global_step": 317290, "epoch": 2622} {"train_loss": -42.35631561279297, "global_step": 317291, "epoch": 2622} {"train_loss": -44.291439056396484, "global_step": 317292, "epoch": 2622} {"train_loss": -42.9351806640625, "global_step": 317293, "epoch": 2622} {"train_loss": -44.211055755615234, "global_step": 317294, "epoch": 2622} {"train_loss": -43.61301040649414, "global_step": 317295, "epoch": 2622} {"train_loss": -43.96822738647461, "global_step": 317296, "epoch": 2622} {"train_loss": -44.0985107421875, "global_step": 317297, "epoch": 2622} {"train_loss": -43.62579345703125, "global_step": 317298, "epoch": 2622} {"train_loss": -44.0965461730957, "global_step": 317299, "epoch": 2622} {"train_loss": -43.572750091552734, "global_step": 317300, "epoch": 2622} {"train_loss": -43.38845443725586, "global_step": 317301, "epoch": 2622} {"train_loss": -43.9521598815918, "global_step": 317302, "epoch": 2622} {"train_loss": -43.97833251953125, "global_step": 317303, "epoch": 2622} {"train_loss": -43.9883918762207, "global_step": 317304, "epoch": 2622} {"train_loss": -42.82965850830078, "global_step": 317305, "epoch": 2622} {"train_loss": -42.59904479980469, "global_step": 317306, "epoch": 2622} {"train_loss": -43.80843734741211, "global_step": 317307, "epoch": 2622} {"train_loss": -43.78092956542969, "global_step": 317308, "epoch": 2622} {"train_loss": -43.37165832519531, "global_step": 317309, "epoch": 2622} {"train_loss": -43.171016693115234, "global_step": 317310, "epoch": 2622} {"train_loss": -44.3306999206543, "global_step": 317311, "epoch": 2622} {"train_loss": -43.3209228515625, "global_step": 317312, "epoch": 2622} {"train_loss": -44.54885482788086, "global_step": 317313, "epoch": 2622} {"train_loss": -43.40248489379883, "global_step": 317314, "epoch": 2622} {"train_loss": -43.73604965209961, "global_step": 317315, "epoch": 2622} {"train_loss": -44.018043518066406, "global_step": 317316, "epoch": 2622} {"train_loss": -43.398189544677734, "global_step": 317317, "epoch": 2622} {"train_loss": -43.1183967590332, "global_step": 317318, "epoch": 2622} {"train_loss": -44.0427131652832, "global_step": 317319, "epoch": 2622} {"train_loss": -44.449378967285156, "global_step": 317320, "epoch": 2622} {"train_loss": -44.286258697509766, "global_step": 317321, "epoch": 2622} {"train_loss": -43.48685073852539, "global_step": 317322, "epoch": 2622} {"train_loss": -43.502044677734375, "global_step": 317323, "epoch": 2622} {"train_loss": -43.81161880493164, "global_step": 317324, "epoch": 2622} {"train_loss": -44.156166076660156, "global_step": 317325, "epoch": 2622} {"train_loss": -43.522762298583984, "global_step": 317326, "epoch": 2622} {"train_loss": -42.55369567871094, "global_step": 317327, "epoch": 2622} {"train_loss": -42.57826614379883, "global_step": 317328, "epoch": 2622} {"train_loss": -43.81946563720703, "global_step": 317329, "epoch": 2622} {"train_loss": -44.58148956298828, "global_step": 317330, "epoch": 2622} {"train_loss": -43.01594543457031, "global_step": 317331, "epoch": 2622} {"train_loss": -44.02311325073242, "global_step": 317332, "epoch": 2622} {"train_loss": -42.219215393066406, "global_step": 317333, "epoch": 2622} {"train_loss": -44.239654541015625, "global_step": 317334, "epoch": 2622} {"train_loss": -44.19108963012695, "global_step": 317335, "epoch": 2622} {"train_loss": -44.13935470581055, "global_step": 317336, "epoch": 2622} {"train_loss": -43.51472854614258, "global_step": 317337, "epoch": 2622} {"train_loss": -42.805885314941406, "global_step": 317338, "epoch": 2622} {"train_loss": -43.6942138671875, "global_step": 317339, "epoch": 2622} {"train_loss": -44.424983978271484, "global_step": 317340, "epoch": 2622} {"train_loss": -44.07277297973633, "global_step": 317341, "epoch": 2622} {"train_loss": -42.74274826049805, "global_step": 317342, "epoch": 2622} {"train_loss": -44.19025802612305, "global_step": 317343, "epoch": 2622} {"train_loss": -44.652915954589844, "global_step": 317344, "epoch": 2622} {"train_loss": -43.36198043823242, "global_step": 317345, "epoch": 2622} {"train_loss": -43.65019607543945, "global_step": 317346, "epoch": 2622} {"train_loss": -43.32183837890625, "global_step": 317347, "epoch": 2622} {"train_loss": -43.388519287109375, "global_step": 317348, "epoch": 2622} {"train_loss": -42.08234405517578, "global_step": 317349, "epoch": 2622} {"train_loss": -43.91428756713867, "global_step": 317350, "epoch": 2622} {"train_loss": -43.916439056396484, "global_step": 317351, "epoch": 2622} {"train_loss": -44.37818908691406, "global_step": 317352, "epoch": 2622} {"train_loss": -42.298465728759766, "global_step": 317353, "epoch": 2622} {"train_loss": -43.037445068359375, "global_step": 317354, "epoch": 2622} {"train_loss": -42.8309211730957, "global_step": 317355, "epoch": 2622} {"train_loss": -42.30926513671875, "global_step": 317356, "epoch": 2622} {"train_loss": -43.80921936035156, "global_step": 317357, "epoch": 2622} {"train_loss": -43.90071105957031, "global_step": 317358, "epoch": 2622} {"train_loss": -42.8213005065918, "global_step": 317359, "epoch": 2622} {"train_loss": -42.19610595703125, "global_step": 317360, "epoch": 2622} {"train_loss": -42.1517219543457, "global_step": 317361, "epoch": 2622} {"train_loss": -44.33631134033203, "global_step": 317362, "epoch": 2622} {"train_loss": -43.65707015991211, "global_step": 317363, "epoch": 2622} {"train_loss": -40.465389251708984, "global_step": 317364, "epoch": 2622} {"train_loss": -37.37894821166992, "global_step": 317365, "epoch": 2622} {"train_loss": -35.78780746459961, "global_step": 317366, "epoch": 2622} {"train_loss": -42.28064727783203, "global_step": 317367, "epoch": 2622} {"train_loss": -31.782434463500977, "global_step": 317368, "epoch": 2622} {"train_loss": -42.77534103393555, "global_step": 317369, "epoch": 2622} {"train_loss": -32.6136589050293, "global_step": 317370, "epoch": 2622} {"train_loss": -36.821956634521484, "global_step": 317371, "epoch": 2622} {"train_loss": -40.67867660522461, "global_step": 317372, "epoch": 2622} {"train_loss": -35.603424072265625, "global_step": 317373, "epoch": 2622} {"train_loss": -39.01894760131836, "global_step": 317374, "epoch": 2622} {"train_loss": -40.793121337890625, "global_step": 317375, "epoch": 2622} {"train_loss": -37.67285919189453, "global_step": 317376, "epoch": 2622} {"train_loss": -41.43141555786133, "global_step": 317377, "epoch": 2622} {"train_loss": -37.77154541015625, "global_step": 317378, "epoch": 2622} {"train_loss": -41.22735595703125, "global_step": 317379, "epoch": 2622} {"train_loss": -39.8947639465332, "global_step": 317380, "epoch": 2622} {"train_loss": -36.54277420043945, "global_step": 317381, "epoch": 2622} {"train_loss": -42.616607933990224, "global_step": 317382, "epoch": 2622, "val_loss": 2580072.75} {"train_loss": -39.55258560180664, "global_step": 317383, "epoch": 2623} {"train_loss": -41.22601318359375, "global_step": 317384, "epoch": 2623} {"train_loss": -40.717567443847656, "global_step": 317385, "epoch": 2623} {"train_loss": -41.468624114990234, "global_step": 317386, "epoch": 2623} {"train_loss": -41.921871185302734, "global_step": 317387, "epoch": 2623} {"train_loss": -41.38356018066406, "global_step": 317388, "epoch": 2623} {"train_loss": -40.92346954345703, "global_step": 317389, "epoch": 2623} {"train_loss": -42.33705139160156, "global_step": 317390, "epoch": 2623} {"train_loss": -42.085105895996094, "global_step": 317391, "epoch": 2623} {"train_loss": -42.29448318481445, "global_step": 317392, "epoch": 2623} {"train_loss": -42.018856048583984, "global_step": 317393, "epoch": 2623} {"train_loss": -42.031654357910156, "global_step": 317394, "epoch": 2623} {"train_loss": -43.072181701660156, "global_step": 317395, "epoch": 2623} {"train_loss": -40.01675033569336, "global_step": 317396, "epoch": 2623} {"train_loss": -42.516204833984375, "global_step": 317397, "epoch": 2623} {"train_loss": -42.91636276245117, "global_step": 317398, "epoch": 2623} {"train_loss": -43.27082824707031, "global_step": 317399, "epoch": 2623} {"train_loss": -42.570594787597656, "global_step": 317400, "epoch": 2623} {"train_loss": -42.49940872192383, "global_step": 317401, "epoch": 2623} {"train_loss": -42.97332000732422, "global_step": 317402, "epoch": 2623} {"train_loss": -41.182369232177734, "global_step": 317403, "epoch": 2623} {"train_loss": -43.577877044677734, "global_step": 317404, "epoch": 2623} {"train_loss": -42.30221176147461, "global_step": 317405, "epoch": 2623} {"train_loss": -42.89146423339844, "global_step": 317406, "epoch": 2623} {"train_loss": -42.98532485961914, "global_step": 317407, "epoch": 2623} {"train_loss": -42.8856086730957, "global_step": 317408, "epoch": 2623} {"train_loss": -42.53453063964844, "global_step": 317409, "epoch": 2623} {"train_loss": -43.868099212646484, "global_step": 317410, "epoch": 2623} {"train_loss": -42.8548583984375, "global_step": 317411, "epoch": 2623} {"train_loss": -43.510738372802734, "global_step": 317412, "epoch": 2623} {"train_loss": -42.450965881347656, "global_step": 317413, "epoch": 2623} {"train_loss": -43.605464935302734, "global_step": 317414, "epoch": 2623} {"train_loss": -43.97788619995117, "global_step": 317415, "epoch": 2623} {"train_loss": -43.43633270263672, "global_step": 317416, "epoch": 2623} {"train_loss": -43.69765090942383, "global_step": 317417, "epoch": 2623} {"train_loss": -44.02279281616211, "global_step": 317418, "epoch": 2623} {"train_loss": -43.29341506958008, "global_step": 317419, "epoch": 2623} {"train_loss": -43.68781661987305, "global_step": 317420, "epoch": 2623} {"train_loss": -43.45173645019531, "global_step": 317421, "epoch": 2623} {"train_loss": -44.11654281616211, "global_step": 317422, "epoch": 2623} {"train_loss": -43.65494155883789, "global_step": 317423, "epoch": 2623} {"train_loss": -43.30223846435547, "global_step": 317424, "epoch": 2623} {"train_loss": -43.74552917480469, "global_step": 317425, "epoch": 2623} {"train_loss": -44.39762878417969, "global_step": 317426, "epoch": 2623} {"train_loss": -44.074684143066406, "global_step": 317427, "epoch": 2623} {"train_loss": -44.16136169433594, "global_step": 317428, "epoch": 2623} {"train_loss": -43.75165939331055, "global_step": 317429, "epoch": 2623} {"train_loss": -44.13837432861328, "global_step": 317430, "epoch": 2623} {"train_loss": -43.933895111083984, "global_step": 317431, "epoch": 2623} {"train_loss": -44.05146026611328, "global_step": 317432, "epoch": 2623} {"train_loss": -43.741050720214844, "global_step": 317433, "epoch": 2623} {"train_loss": -44.04902648925781, "global_step": 317434, "epoch": 2623} {"train_loss": -44.3000602722168, "global_step": 317435, "epoch": 2623} {"train_loss": -44.546600341796875, "global_step": 317436, "epoch": 2623} {"train_loss": -44.28207015991211, "global_step": 317437, "epoch": 2623} {"train_loss": -44.39921951293945, "global_step": 317438, "epoch": 2623} {"train_loss": -44.380794525146484, "global_step": 317439, "epoch": 2623} {"train_loss": -42.64167404174805, "global_step": 317440, "epoch": 2623} {"train_loss": -43.575965881347656, "global_step": 317441, "epoch": 2623} {"train_loss": -43.96724319458008, "global_step": 317442, "epoch": 2623} {"train_loss": -44.211055755615234, "global_step": 317443, "epoch": 2623} {"train_loss": -44.76858139038086, "global_step": 317444, "epoch": 2623} {"train_loss": -44.900081634521484, "global_step": 317445, "epoch": 2623} {"train_loss": -41.69047927856445, "global_step": 317446, "epoch": 2623} {"train_loss": -40.33039474487305, "global_step": 317447, "epoch": 2623} {"train_loss": -44.260887145996094, "global_step": 317448, "epoch": 2623} {"train_loss": -44.08205795288086, "global_step": 317449, "epoch": 2623} {"train_loss": -43.94808578491211, "global_step": 317450, "epoch": 2623} {"train_loss": -41.49573516845703, "global_step": 317451, "epoch": 2623} {"train_loss": -43.202266693115234, "global_step": 317452, "epoch": 2623} {"train_loss": -43.857173919677734, "global_step": 317453, "epoch": 2623} {"train_loss": -44.804901123046875, "global_step": 317454, "epoch": 2623} {"train_loss": -44.529579162597656, "global_step": 317455, "epoch": 2623} {"train_loss": -44.27056884765625, "global_step": 317456, "epoch": 2623} {"train_loss": -44.4543342590332, "global_step": 317457, "epoch": 2623} {"train_loss": -44.411773681640625, "global_step": 317458, "epoch": 2623} {"train_loss": -44.82880783081055, "global_step": 317459, "epoch": 2623} {"train_loss": -43.546504974365234, "global_step": 317460, "epoch": 2623} {"train_loss": -44.61664962768555, "global_step": 317461, "epoch": 2623} {"train_loss": -44.5587158203125, "global_step": 317462, "epoch": 2623} {"train_loss": -43.81515884399414, "global_step": 317463, "epoch": 2623} {"train_loss": -44.52639389038086, "global_step": 317464, "epoch": 2623} {"train_loss": -43.99860763549805, "global_step": 317465, "epoch": 2623} {"train_loss": -44.30073928833008, "global_step": 317466, "epoch": 2623} {"train_loss": -44.653541564941406, "global_step": 317467, "epoch": 2623} {"train_loss": -44.29914093017578, "global_step": 317468, "epoch": 2623} {"train_loss": -44.789241790771484, "global_step": 317469, "epoch": 2623} {"train_loss": -44.31995391845703, "global_step": 317470, "epoch": 2623} {"train_loss": -44.58687210083008, "global_step": 317471, "epoch": 2623} {"train_loss": -43.2468147277832, "global_step": 317472, "epoch": 2623} {"train_loss": -43.928619384765625, "global_step": 317473, "epoch": 2623} {"train_loss": -44.314605712890625, "global_step": 317474, "epoch": 2623} {"train_loss": -44.75773239135742, "global_step": 317475, "epoch": 2623} {"train_loss": -44.807830810546875, "global_step": 317476, "epoch": 2623} {"train_loss": -44.32481002807617, "global_step": 317477, "epoch": 2623} {"train_loss": -44.28159713745117, "global_step": 317478, "epoch": 2623} {"train_loss": -43.749263763427734, "global_step": 317479, "epoch": 2623} {"train_loss": -43.63066482543945, "global_step": 317480, "epoch": 2623} {"train_loss": -41.97391891479492, "global_step": 317481, "epoch": 2623} {"train_loss": -43.440093994140625, "global_step": 317482, "epoch": 2623} {"train_loss": -42.6688232421875, "global_step": 317483, "epoch": 2623} {"train_loss": -41.57760238647461, "global_step": 317484, "epoch": 2623} {"train_loss": -40.15761947631836, "global_step": 317485, "epoch": 2623} {"train_loss": -41.69446563720703, "global_step": 317486, "epoch": 2623} {"train_loss": -43.5030632019043, "global_step": 317487, "epoch": 2623} {"train_loss": -42.183815002441406, "global_step": 317488, "epoch": 2623} {"train_loss": -38.67363357543945, "global_step": 317489, "epoch": 2623} {"train_loss": -41.43449020385742, "global_step": 317490, "epoch": 2623} {"train_loss": -43.938106536865234, "global_step": 317491, "epoch": 2623} {"train_loss": -40.70935821533203, "global_step": 317492, "epoch": 2623} {"train_loss": -41.11838912963867, "global_step": 317493, "epoch": 2623} {"train_loss": -44.008628845214844, "global_step": 317494, "epoch": 2623} {"train_loss": -41.757625579833984, "global_step": 317495, "epoch": 2623} {"train_loss": -42.995094299316406, "global_step": 317496, "epoch": 2623} {"train_loss": -44.148799896240234, "global_step": 317497, "epoch": 2623} {"train_loss": -41.63871383666992, "global_step": 317498, "epoch": 2623} {"train_loss": -42.4410514831543, "global_step": 317499, "epoch": 2623} {"train_loss": -43.103729248046875, "global_step": 317500, "epoch": 2623} {"train_loss": -41.23429870605469, "global_step": 317501, "epoch": 2623} {"train_loss": -43.62868881225586, "global_step": 317502, "epoch": 2623} {"train_loss": -43.17154611634814, "global_step": 317503, "epoch": 2623, "val_loss": 2658926.75} {"train_loss": -42.89048385620117, "global_step": 317504, "epoch": 2624} {"train_loss": -42.72066116333008, "global_step": 317505, "epoch": 2624} {"train_loss": -42.52729034423828, "global_step": 317506, "epoch": 2624} {"train_loss": -42.74945068359375, "global_step": 317507, "epoch": 2624} {"train_loss": -41.2490119934082, "global_step": 317508, "epoch": 2624} {"train_loss": -43.01807403564453, "global_step": 317509, "epoch": 2624} {"train_loss": -42.84344482421875, "global_step": 317510, "epoch": 2624} {"train_loss": -41.738525390625, "global_step": 317511, "epoch": 2624} {"train_loss": -42.303585052490234, "global_step": 317512, "epoch": 2624} {"train_loss": -42.41021728515625, "global_step": 317513, "epoch": 2624} {"train_loss": -43.26139450073242, "global_step": 317514, "epoch": 2624} {"train_loss": -41.36365509033203, "global_step": 317515, "epoch": 2624} {"train_loss": -43.47941207885742, "global_step": 317516, "epoch": 2624} {"train_loss": -42.023651123046875, "global_step": 317517, "epoch": 2624} {"train_loss": -42.8471565246582, "global_step": 317518, "epoch": 2624} {"train_loss": -43.59615707397461, "global_step": 317519, "epoch": 2624} {"train_loss": -43.660526275634766, "global_step": 317520, "epoch": 2624} {"train_loss": -43.2242317199707, "global_step": 317521, "epoch": 2624} {"train_loss": -43.54163360595703, "global_step": 317522, "epoch": 2624} {"train_loss": -43.5842170715332, "global_step": 317523, "epoch": 2624} {"train_loss": -43.188716888427734, "global_step": 317524, "epoch": 2624} {"train_loss": -44.07674789428711, "global_step": 317525, "epoch": 2624} {"train_loss": -43.517791748046875, "global_step": 317526, "epoch": 2624} {"train_loss": -44.25701904296875, "global_step": 317527, "epoch": 2624} {"train_loss": -43.93385696411133, "global_step": 317528, "epoch": 2624} {"train_loss": -43.67959976196289, "global_step": 317529, "epoch": 2624} {"train_loss": -43.82697296142578, "global_step": 317530, "epoch": 2624} {"train_loss": -44.07563400268555, "global_step": 317531, "epoch": 2624} {"train_loss": -43.08272933959961, "global_step": 317532, "epoch": 2624} {"train_loss": -44.47053527832031, "global_step": 317533, "epoch": 2624} {"train_loss": -43.58701705932617, "global_step": 317534, "epoch": 2624} {"train_loss": -44.50111770629883, "global_step": 317535, "epoch": 2624} {"train_loss": -44.3477668762207, "global_step": 317536, "epoch": 2624} {"train_loss": -43.97469711303711, "global_step": 317537, "epoch": 2624} {"train_loss": -43.591854095458984, "global_step": 317538, "epoch": 2624} {"train_loss": -43.80220413208008, "global_step": 317539, "epoch": 2624} {"train_loss": -44.34659957885742, "global_step": 317540, "epoch": 2624} {"train_loss": -43.92951965332031, "global_step": 317541, "epoch": 2624} {"train_loss": -44.26649856567383, "global_step": 317542, "epoch": 2624} {"train_loss": -43.71963119506836, "global_step": 317543, "epoch": 2624} {"train_loss": -43.9962158203125, "global_step": 317544, "epoch": 2624} {"train_loss": -43.557621002197266, "global_step": 317545, "epoch": 2624} {"train_loss": -44.75796127319336, "global_step": 317546, "epoch": 2624} {"train_loss": -44.7876091003418, "global_step": 317547, "epoch": 2624} {"train_loss": -44.238624572753906, "global_step": 317548, "epoch": 2624} {"train_loss": -44.520843505859375, "global_step": 317549, "epoch": 2624} {"train_loss": -43.91343307495117, "global_step": 317550, "epoch": 2624} {"train_loss": -44.49920654296875, "global_step": 317551, "epoch": 2624} {"train_loss": -44.2251091003418, "global_step": 317552, "epoch": 2624} {"train_loss": -44.48332595825195, "global_step": 317553, "epoch": 2624} {"train_loss": -44.14482498168945, "global_step": 317554, "epoch": 2624} {"train_loss": -44.328975677490234, "global_step": 317555, "epoch": 2624} {"train_loss": -44.831077575683594, "global_step": 317556, "epoch": 2624} {"train_loss": -44.735477447509766, "global_step": 317557, "epoch": 2624} {"train_loss": -45.0009880065918, "global_step": 317558, "epoch": 2624} {"train_loss": -44.35439682006836, "global_step": 317559, "epoch": 2624} {"train_loss": -44.56245803833008, "global_step": 317560, "epoch": 2624} {"train_loss": -45.01302719116211, "global_step": 317561, "epoch": 2624} {"train_loss": -44.301536560058594, "global_step": 317562, "epoch": 2624} {"train_loss": -44.12471389770508, "global_step": 317563, "epoch": 2624} {"train_loss": -43.90030288696289, "global_step": 317564, "epoch": 2624} {"train_loss": -44.720088958740234, "global_step": 317565, "epoch": 2624} {"train_loss": -44.59284210205078, "global_step": 317566, "epoch": 2624} {"train_loss": -44.39713668823242, "global_step": 317567, "epoch": 2624} {"train_loss": -43.90053939819336, "global_step": 317568, "epoch": 2624} {"train_loss": -44.610103607177734, "global_step": 317569, "epoch": 2624} {"train_loss": -43.7435417175293, "global_step": 317570, "epoch": 2624} {"train_loss": -44.57366180419922, "global_step": 317571, "epoch": 2624} {"train_loss": -44.4031867980957, "global_step": 317572, "epoch": 2624} {"train_loss": -43.807456970214844, "global_step": 317573, "epoch": 2624} {"train_loss": -44.692562103271484, "global_step": 317574, "epoch": 2624} {"train_loss": -44.432857513427734, "global_step": 317575, "epoch": 2624} {"train_loss": -43.70846176147461, "global_step": 317576, "epoch": 2624} {"train_loss": -44.55831527709961, "global_step": 317577, "epoch": 2624} {"train_loss": -43.927490234375, "global_step": 317578, "epoch": 2624} {"train_loss": -44.08531951904297, "global_step": 317579, "epoch": 2624} {"train_loss": -44.4242057800293, "global_step": 317580, "epoch": 2624} {"train_loss": -44.04244613647461, "global_step": 317581, "epoch": 2624} {"train_loss": -44.767147064208984, "global_step": 317582, "epoch": 2624} {"train_loss": -43.82137680053711, "global_step": 317583, "epoch": 2624} {"train_loss": -43.00102615356445, "global_step": 317584, "epoch": 2624} {"train_loss": -43.551292419433594, "global_step": 317585, "epoch": 2624} {"train_loss": -43.86970138549805, "global_step": 317586, "epoch": 2624} {"train_loss": -44.24270248413086, "global_step": 317587, "epoch": 2624} {"train_loss": -44.05331039428711, "global_step": 317588, "epoch": 2624} {"train_loss": -44.1519889831543, "global_step": 317589, "epoch": 2624} {"train_loss": -44.08837890625, "global_step": 317590, "epoch": 2624} {"train_loss": -43.67184829711914, "global_step": 317591, "epoch": 2624} {"train_loss": -44.180477142333984, "global_step": 317592, "epoch": 2624} {"train_loss": -44.22442626953125, "global_step": 317593, "epoch": 2624} {"train_loss": -43.63257598876953, "global_step": 317594, "epoch": 2624} {"train_loss": -44.77151107788086, "global_step": 317595, "epoch": 2624} {"train_loss": -44.07194519042969, "global_step": 317596, "epoch": 2624} {"train_loss": -45.02273941040039, "global_step": 317597, "epoch": 2624} {"train_loss": -43.364803314208984, "global_step": 317598, "epoch": 2624} {"train_loss": -42.79050827026367, "global_step": 317599, "epoch": 2624} {"train_loss": -41.75712203979492, "global_step": 317600, "epoch": 2624} {"train_loss": -38.97832107543945, "global_step": 317601, "epoch": 2624} {"train_loss": -42.873497009277344, "global_step": 317602, "epoch": 2624} {"train_loss": -41.73598861694336, "global_step": 317603, "epoch": 2624} {"train_loss": -42.141780853271484, "global_step": 317604, "epoch": 2624} {"train_loss": -42.472591400146484, "global_step": 317605, "epoch": 2624} {"train_loss": -42.13483810424805, "global_step": 317606, "epoch": 2624} {"train_loss": -39.44866943359375, "global_step": 317607, "epoch": 2624} {"train_loss": -42.5273323059082, "global_step": 317608, "epoch": 2624} {"train_loss": -40.908782958984375, "global_step": 317609, "epoch": 2624} {"train_loss": -40.080352783203125, "global_step": 317610, "epoch": 2624} {"train_loss": -42.2507209777832, "global_step": 317611, "epoch": 2624} {"train_loss": -39.760406494140625, "global_step": 317612, "epoch": 2624} {"train_loss": -41.66935729980469, "global_step": 317613, "epoch": 2624} {"train_loss": -43.04228591918945, "global_step": 317614, "epoch": 2624} {"train_loss": -41.284889221191406, "global_step": 317615, "epoch": 2624} {"train_loss": -41.78731918334961, "global_step": 317616, "epoch": 2624} {"train_loss": -41.61536407470703, "global_step": 317617, "epoch": 2624} {"train_loss": -42.26530075073242, "global_step": 317618, "epoch": 2624} {"train_loss": -39.74386215209961, "global_step": 317619, "epoch": 2624} {"train_loss": -40.88114929199219, "global_step": 317620, "epoch": 2624} {"train_loss": -41.86871337890625, "global_step": 317621, "epoch": 2624} {"train_loss": -40.93684768676758, "global_step": 317622, "epoch": 2624} {"train_loss": -41.874839782714844, "global_step": 317623, "epoch": 2624} {"train_loss": -43.34926346707935, "global_step": 317624, "epoch": 2624, "val_loss": 2656867.0} {"train_loss": -42.72405242919922, "global_step": 317625, "epoch": 2625} {"train_loss": -40.86042022705078, "global_step": 317626, "epoch": 2625} {"train_loss": -42.18912887573242, "global_step": 317627, "epoch": 2625} {"train_loss": -43.33292770385742, "global_step": 317628, "epoch": 2625} {"train_loss": -41.59675216674805, "global_step": 317629, "epoch": 2625} {"train_loss": -42.45838165283203, "global_step": 317630, "epoch": 2625} {"train_loss": -42.7968864440918, "global_step": 317631, "epoch": 2625} {"train_loss": -41.656288146972656, "global_step": 317632, "epoch": 2625} {"train_loss": -42.65953826904297, "global_step": 317633, "epoch": 2625} {"train_loss": -42.4288444519043, "global_step": 317634, "epoch": 2625} {"train_loss": -40.8707160949707, "global_step": 317635, "epoch": 2625} {"train_loss": -43.690574645996094, "global_step": 317636, "epoch": 2625} {"train_loss": -42.47126007080078, "global_step": 317637, "epoch": 2625} {"train_loss": -42.940826416015625, "global_step": 317638, "epoch": 2625} {"train_loss": -42.736812591552734, "global_step": 317639, "epoch": 2625} {"train_loss": -43.53342056274414, "global_step": 317640, "epoch": 2625} {"train_loss": -42.874046325683594, "global_step": 317641, "epoch": 2625} {"train_loss": -43.42237091064453, "global_step": 317642, "epoch": 2625} {"train_loss": -42.799041748046875, "global_step": 317643, "epoch": 2625} {"train_loss": -44.08787536621094, "global_step": 317644, "epoch": 2625} {"train_loss": -43.177162170410156, "global_step": 317645, "epoch": 2625} {"train_loss": -43.88923645019531, "global_step": 317646, "epoch": 2625} {"train_loss": -43.45879364013672, "global_step": 317647, "epoch": 2625} {"train_loss": -43.655521392822266, "global_step": 317648, "epoch": 2625} {"train_loss": -43.813968658447266, "global_step": 317649, "epoch": 2625} {"train_loss": -43.343482971191406, "global_step": 317650, "epoch": 2625} {"train_loss": -43.5495719909668, "global_step": 317651, "epoch": 2625} {"train_loss": -43.916378021240234, "global_step": 317652, "epoch": 2625} {"train_loss": -43.825836181640625, "global_step": 317653, "epoch": 2625} {"train_loss": -44.2048454284668, "global_step": 317654, "epoch": 2625} {"train_loss": -43.7706184387207, "global_step": 317655, "epoch": 2625} {"train_loss": -43.69354248046875, "global_step": 317656, "epoch": 2625} {"train_loss": -43.94179153442383, "global_step": 317657, "epoch": 2625} {"train_loss": -44.070064544677734, "global_step": 317658, "epoch": 2625} {"train_loss": -43.65000534057617, "global_step": 317659, "epoch": 2625} {"train_loss": -44.2148551940918, "global_step": 317660, "epoch": 2625} {"train_loss": -43.76552963256836, "global_step": 317661, "epoch": 2625} {"train_loss": -44.01467514038086, "global_step": 317662, "epoch": 2625} {"train_loss": -44.38740158081055, "global_step": 317663, "epoch": 2625} {"train_loss": -43.27898025512695, "global_step": 317664, "epoch": 2625} {"train_loss": -43.572879791259766, "global_step": 317665, "epoch": 2625} {"train_loss": -44.630836486816406, "global_step": 317666, "epoch": 2625} {"train_loss": -43.77785873413086, "global_step": 317667, "epoch": 2625} {"train_loss": -44.531982421875, "global_step": 317668, "epoch": 2625} {"train_loss": -43.84650802612305, "global_step": 317669, "epoch": 2625} {"train_loss": -44.3801383972168, "global_step": 317670, "epoch": 2625} {"train_loss": -44.763282775878906, "global_step": 317671, "epoch": 2625} {"train_loss": -44.5009880065918, "global_step": 317672, "epoch": 2625} {"train_loss": -44.770137786865234, "global_step": 317673, "epoch": 2625} {"train_loss": -44.7723388671875, "global_step": 317674, "epoch": 2625} {"train_loss": -44.61829376220703, "global_step": 317675, "epoch": 2625} {"train_loss": -44.80707931518555, "global_step": 317676, "epoch": 2625} {"train_loss": -44.65398025512695, "global_step": 317677, "epoch": 2625} {"train_loss": -45.01680374145508, "global_step": 317678, "epoch": 2625} {"train_loss": -44.61595916748047, "global_step": 317679, "epoch": 2625} {"train_loss": -44.851863861083984, "global_step": 317680, "epoch": 2625} {"train_loss": -44.64262771606445, "global_step": 317681, "epoch": 2625} {"train_loss": -44.88161087036133, "global_step": 317682, "epoch": 2625} {"train_loss": -44.74064254760742, "global_step": 317683, "epoch": 2625} {"train_loss": -44.29682540893555, "global_step": 317684, "epoch": 2625} {"train_loss": -43.800289154052734, "global_step": 317685, "epoch": 2625} {"train_loss": -43.32139205932617, "global_step": 317686, "epoch": 2625} {"train_loss": -44.38446044921875, "global_step": 317687, "epoch": 2625} {"train_loss": -43.935951232910156, "global_step": 317688, "epoch": 2625} {"train_loss": -44.62308883666992, "global_step": 317689, "epoch": 2625} {"train_loss": -44.19173812866211, "global_step": 317690, "epoch": 2625} {"train_loss": -44.45317459106445, "global_step": 317691, "epoch": 2625} {"train_loss": -44.373714447021484, "global_step": 317692, "epoch": 2625} {"train_loss": -44.86823654174805, "global_step": 317693, "epoch": 2625} {"train_loss": -44.65955352783203, "global_step": 317694, "epoch": 2625} {"train_loss": -44.37348175048828, "global_step": 317695, "epoch": 2625} {"train_loss": -44.69209671020508, "global_step": 317696, "epoch": 2625} {"train_loss": -44.53348922729492, "global_step": 317697, "epoch": 2625} {"train_loss": -44.40936279296875, "global_step": 317698, "epoch": 2625} {"train_loss": -43.6522102355957, "global_step": 317699, "epoch": 2625} {"train_loss": -44.92780303955078, "global_step": 317700, "epoch": 2625} {"train_loss": -43.50800323486328, "global_step": 317701, "epoch": 2625} {"train_loss": -44.6116943359375, "global_step": 317702, "epoch": 2625} {"train_loss": -44.367671966552734, "global_step": 317703, "epoch": 2625} {"train_loss": -44.10980987548828, "global_step": 317704, "epoch": 2625} {"train_loss": -44.13695526123047, "global_step": 317705, "epoch": 2625} {"train_loss": -44.309688568115234, "global_step": 317706, "epoch": 2625} {"train_loss": -44.50678253173828, "global_step": 317707, "epoch": 2625} {"train_loss": -44.74943542480469, "global_step": 317708, "epoch": 2625} {"train_loss": -44.37264633178711, "global_step": 317709, "epoch": 2625} {"train_loss": -44.74469757080078, "global_step": 317710, "epoch": 2625} {"train_loss": -44.62082290649414, "global_step": 317711, "epoch": 2625} {"train_loss": -44.93860626220703, "global_step": 317712, "epoch": 2625} {"train_loss": -44.2124137878418, "global_step": 317713, "epoch": 2625} {"train_loss": -44.55733108520508, "global_step": 317714, "epoch": 2625} {"train_loss": -43.649330139160156, "global_step": 317715, "epoch": 2625} {"train_loss": -44.12133026123047, "global_step": 317716, "epoch": 2625} {"train_loss": -44.422115325927734, "global_step": 317717, "epoch": 2625} {"train_loss": -44.0161018371582, "global_step": 317718, "epoch": 2625} {"train_loss": -43.564598083496094, "global_step": 317719, "epoch": 2625} {"train_loss": -42.940860748291016, "global_step": 317720, "epoch": 2625} {"train_loss": -41.995906829833984, "global_step": 317721, "epoch": 2625} {"train_loss": -40.690853118896484, "global_step": 317722, "epoch": 2625} {"train_loss": -42.836605072021484, "global_step": 317723, "epoch": 2625} {"train_loss": -43.172210693359375, "global_step": 317724, "epoch": 2625} {"train_loss": -41.91189193725586, "global_step": 317725, "epoch": 2625} {"train_loss": -40.695655822753906, "global_step": 317726, "epoch": 2625} {"train_loss": -42.225433349609375, "global_step": 317727, "epoch": 2625} {"train_loss": -44.076698303222656, "global_step": 317728, "epoch": 2625} {"train_loss": -41.025421142578125, "global_step": 317729, "epoch": 2625} {"train_loss": -39.882747650146484, "global_step": 317730, "epoch": 2625} {"train_loss": -43.72139358520508, "global_step": 317731, "epoch": 2625} {"train_loss": -43.088783264160156, "global_step": 317732, "epoch": 2625} {"train_loss": -40.216548919677734, "global_step": 317733, "epoch": 2625} {"train_loss": -42.33399200439453, "global_step": 317734, "epoch": 2625} {"train_loss": -42.59804153442383, "global_step": 317735, "epoch": 2625} {"train_loss": -38.681148529052734, "global_step": 317736, "epoch": 2625} {"train_loss": -42.341766357421875, "global_step": 317737, "epoch": 2625} {"train_loss": -42.6570930480957, "global_step": 317738, "epoch": 2625} {"train_loss": -43.14846420288086, "global_step": 317739, "epoch": 2625} {"train_loss": -43.65353012084961, "global_step": 317740, "epoch": 2625} {"train_loss": -41.75189208984375, "global_step": 317741, "epoch": 2625} {"train_loss": -42.127220153808594, "global_step": 317742, "epoch": 2625} {"train_loss": -43.70073318481445, "global_step": 317743, "epoch": 2625} {"train_loss": -43.14040756225586, "global_step": 317744, "epoch": 2625} {"train_loss": -43.530708659778945, "global_step": 317745, "epoch": 2625, "val_loss": 2661280.25} {"train_loss": -42.70100784301758, "global_step": 317746, "epoch": 2626} {"train_loss": -42.99073028564453, "global_step": 317747, "epoch": 2626} {"train_loss": -42.76301193237305, "global_step": 317748, "epoch": 2626} {"train_loss": -42.83187484741211, "global_step": 317749, "epoch": 2626} {"train_loss": -43.681373596191406, "global_step": 317750, "epoch": 2626} {"train_loss": -43.15245056152344, "global_step": 317751, "epoch": 2626} {"train_loss": -42.943965911865234, "global_step": 317752, "epoch": 2626} {"train_loss": -42.754302978515625, "global_step": 317753, "epoch": 2626} {"train_loss": -43.4865837097168, "global_step": 317754, "epoch": 2626} {"train_loss": -43.76982879638672, "global_step": 317755, "epoch": 2626} {"train_loss": -43.36269760131836, "global_step": 317756, "epoch": 2626} {"train_loss": -43.91025924682617, "global_step": 317757, "epoch": 2626} {"train_loss": -44.01539611816406, "global_step": 317758, "epoch": 2626} {"train_loss": -43.45949172973633, "global_step": 317759, "epoch": 2626} {"train_loss": -43.932491302490234, "global_step": 317760, "epoch": 2626} {"train_loss": -43.66555404663086, "global_step": 317761, "epoch": 2626} {"train_loss": -43.8283576965332, "global_step": 317762, "epoch": 2626} {"train_loss": -43.848018646240234, "global_step": 317763, "epoch": 2626} {"train_loss": -43.87946701049805, "global_step": 317764, "epoch": 2626} {"train_loss": -44.05942153930664, "global_step": 317765, "epoch": 2626} {"train_loss": -43.64628982543945, "global_step": 317766, "epoch": 2626} {"train_loss": -44.40138244628906, "global_step": 317767, "epoch": 2626} {"train_loss": -43.27451705932617, "global_step": 317768, "epoch": 2626} {"train_loss": -44.02686309814453, "global_step": 317769, "epoch": 2626} {"train_loss": -44.221275329589844, "global_step": 317770, "epoch": 2626} {"train_loss": -44.22042465209961, "global_step": 317771, "epoch": 2626} {"train_loss": -44.146785736083984, "global_step": 317772, "epoch": 2626} {"train_loss": -43.401161193847656, "global_step": 317773, "epoch": 2626} {"train_loss": -44.497596740722656, "global_step": 317774, "epoch": 2626} {"train_loss": -42.042598724365234, "global_step": 317775, "epoch": 2626} {"train_loss": -43.499732971191406, "global_step": 317776, "epoch": 2626} {"train_loss": -43.67280197143555, "global_step": 317777, "epoch": 2626} {"train_loss": -44.16670608520508, "global_step": 317778, "epoch": 2626} {"train_loss": -43.1289176940918, "global_step": 317779, "epoch": 2626} {"train_loss": -43.823463439941406, "global_step": 317780, "epoch": 2626} {"train_loss": -43.791316986083984, "global_step": 317781, "epoch": 2626} {"train_loss": -43.2523307800293, "global_step": 317782, "epoch": 2626} {"train_loss": -44.098594665527344, "global_step": 317783, "epoch": 2626} {"train_loss": -44.17848587036133, "global_step": 317784, "epoch": 2626} {"train_loss": -44.444950103759766, "global_step": 317785, "epoch": 2626} {"train_loss": -44.210723876953125, "global_step": 317786, "epoch": 2626} {"train_loss": -43.79231643676758, "global_step": 317787, "epoch": 2626} {"train_loss": -44.58994674682617, "global_step": 317788, "epoch": 2626} {"train_loss": -44.42931365966797, "global_step": 317789, "epoch": 2626} {"train_loss": -43.8448486328125, "global_step": 317790, "epoch": 2626} {"train_loss": -44.80561447143555, "global_step": 317791, "epoch": 2626} {"train_loss": -43.697906494140625, "global_step": 317792, "epoch": 2626} {"train_loss": -44.29806137084961, "global_step": 317793, "epoch": 2626} {"train_loss": -43.729251861572266, "global_step": 317794, "epoch": 2626} {"train_loss": -44.088260650634766, "global_step": 317795, "epoch": 2626} {"train_loss": -42.604400634765625, "global_step": 317796, "epoch": 2626} {"train_loss": -44.3658332824707, "global_step": 317797, "epoch": 2626} {"train_loss": -43.3898811340332, "global_step": 317798, "epoch": 2626} {"train_loss": -43.22053146362305, "global_step": 317799, "epoch": 2626} {"train_loss": -43.52092361450195, "global_step": 317800, "epoch": 2626} {"train_loss": -44.15794372558594, "global_step": 317801, "epoch": 2626} {"train_loss": -44.063777923583984, "global_step": 317802, "epoch": 2626} {"train_loss": -42.6834716796875, "global_step": 317803, "epoch": 2626} {"train_loss": -42.950897216796875, "global_step": 317804, "epoch": 2626} {"train_loss": -43.5621223449707, "global_step": 317805, "epoch": 2626} {"train_loss": -43.25526809692383, "global_step": 317806, "epoch": 2626} {"train_loss": -42.95195388793945, "global_step": 317807, "epoch": 2626} {"train_loss": -43.2822151184082, "global_step": 317808, "epoch": 2626} {"train_loss": -44.38469696044922, "global_step": 317809, "epoch": 2626} {"train_loss": -43.392879486083984, "global_step": 317810, "epoch": 2626} {"train_loss": -43.77389144897461, "global_step": 317811, "epoch": 2626} {"train_loss": -43.17265319824219, "global_step": 317812, "epoch": 2626} {"train_loss": -42.60839080810547, "global_step": 317813, "epoch": 2626} {"train_loss": -43.53593063354492, "global_step": 317814, "epoch": 2626} {"train_loss": -43.77659225463867, "global_step": 317815, "epoch": 2626} {"train_loss": -42.45162582397461, "global_step": 317816, "epoch": 2626} {"train_loss": -43.46665573120117, "global_step": 317817, "epoch": 2626} {"train_loss": -44.27069091796875, "global_step": 317818, "epoch": 2626} {"train_loss": -43.93510055541992, "global_step": 317819, "epoch": 2626} {"train_loss": -43.366573333740234, "global_step": 317820, "epoch": 2626} {"train_loss": -43.082149505615234, "global_step": 317821, "epoch": 2626} {"train_loss": -44.09835433959961, "global_step": 317822, "epoch": 2626} {"train_loss": -43.076725006103516, "global_step": 317823, "epoch": 2626} {"train_loss": -43.30898666381836, "global_step": 317824, "epoch": 2626} {"train_loss": -43.935970306396484, "global_step": 317825, "epoch": 2626} {"train_loss": -43.335968017578125, "global_step": 317826, "epoch": 2626} {"train_loss": -44.2188606262207, "global_step": 317827, "epoch": 2626} {"train_loss": -43.474605560302734, "global_step": 317828, "epoch": 2626} {"train_loss": -42.81368637084961, "global_step": 317829, "epoch": 2626} {"train_loss": -43.8629264831543, "global_step": 317830, "epoch": 2626} {"train_loss": -43.441890716552734, "global_step": 317831, "epoch": 2626} {"train_loss": -43.205810546875, "global_step": 317832, "epoch": 2626} {"train_loss": -43.464813232421875, "global_step": 317833, "epoch": 2626} {"train_loss": -43.61564254760742, "global_step": 317834, "epoch": 2626} {"train_loss": -43.55022048950195, "global_step": 317835, "epoch": 2626} {"train_loss": -42.523719787597656, "global_step": 317836, "epoch": 2626} {"train_loss": -43.76972579956055, "global_step": 317837, "epoch": 2626} {"train_loss": -42.87643051147461, "global_step": 317838, "epoch": 2626} {"train_loss": -41.88938522338867, "global_step": 317839, "epoch": 2626} {"train_loss": -43.03239059448242, "global_step": 317840, "epoch": 2626} {"train_loss": -43.81659698486328, "global_step": 317841, "epoch": 2626} {"train_loss": -41.67702102661133, "global_step": 317842, "epoch": 2626} {"train_loss": -43.003944396972656, "global_step": 317843, "epoch": 2626} {"train_loss": -43.943809509277344, "global_step": 317844, "epoch": 2626} {"train_loss": -42.56830596923828, "global_step": 317845, "epoch": 2626} {"train_loss": -44.15178680419922, "global_step": 317846, "epoch": 2626} {"train_loss": -43.90262985229492, "global_step": 317847, "epoch": 2626} {"train_loss": -42.59546661376953, "global_step": 317848, "epoch": 2626} {"train_loss": -43.639251708984375, "global_step": 317849, "epoch": 2626} {"train_loss": -43.76673889160156, "global_step": 317850, "epoch": 2626} {"train_loss": -43.25221633911133, "global_step": 317851, "epoch": 2626} {"train_loss": -43.642189025878906, "global_step": 317852, "epoch": 2626} {"train_loss": -43.44746017456055, "global_step": 317853, "epoch": 2626} {"train_loss": -43.86292266845703, "global_step": 317854, "epoch": 2626} {"train_loss": -43.6790657043457, "global_step": 317855, "epoch": 2626} {"train_loss": -44.02836227416992, "global_step": 317856, "epoch": 2626} {"train_loss": -44.53407669067383, "global_step": 317857, "epoch": 2626} {"train_loss": -36.21259689331055, "global_step": 317858, "epoch": 2626} {"train_loss": -44.165706634521484, "global_step": 317859, "epoch": 2626} {"train_loss": -43.657283782958984, "global_step": 317860, "epoch": 2626} {"train_loss": -43.80672073364258, "global_step": 317861, "epoch": 2626} {"train_loss": -43.77975082397461, "global_step": 317862, "epoch": 2626} {"train_loss": -43.719085693359375, "global_step": 317863, "epoch": 2626} {"train_loss": -44.03244400024414, "global_step": 317864, "epoch": 2626} {"train_loss": -43.824378967285156, "global_step": 317865, "epoch": 2626} {"train_loss": -43.512217624128354, "global_step": 317866, "epoch": 2626, "val_loss": 2652274.75} {"train_loss": -42.09627914428711, "global_step": 317867, "epoch": 2627} {"train_loss": -44.10725021362305, "global_step": 317868, "epoch": 2627} {"train_loss": -43.22138595581055, "global_step": 317869, "epoch": 2627} {"train_loss": -43.87066650390625, "global_step": 317870, "epoch": 2627} {"train_loss": -43.17744827270508, "global_step": 317871, "epoch": 2627} {"train_loss": -42.59658432006836, "global_step": 317872, "epoch": 2627} {"train_loss": -43.763702392578125, "global_step": 317873, "epoch": 2627} {"train_loss": -43.04548263549805, "global_step": 317874, "epoch": 2627} {"train_loss": -43.32707214355469, "global_step": 317875, "epoch": 2627} {"train_loss": -44.164825439453125, "global_step": 317876, "epoch": 2627} {"train_loss": -42.759891510009766, "global_step": 317877, "epoch": 2627} {"train_loss": -43.077327728271484, "global_step": 317878, "epoch": 2627} {"train_loss": -43.96854782104492, "global_step": 317879, "epoch": 2627} {"train_loss": -42.94071578979492, "global_step": 317880, "epoch": 2627} {"train_loss": -43.58726119995117, "global_step": 317881, "epoch": 2627} {"train_loss": -42.9277458190918, "global_step": 317882, "epoch": 2627} {"train_loss": -43.70390319824219, "global_step": 317883, "epoch": 2627} {"train_loss": -43.193939208984375, "global_step": 317884, "epoch": 2627} {"train_loss": -43.766029357910156, "global_step": 317885, "epoch": 2627} {"train_loss": -43.00638961791992, "global_step": 317886, "epoch": 2627} {"train_loss": -43.779144287109375, "global_step": 317887, "epoch": 2627} {"train_loss": -43.33821487426758, "global_step": 317888, "epoch": 2627} {"train_loss": -42.28352355957031, "global_step": 317889, "epoch": 2627} {"train_loss": -42.905426025390625, "global_step": 317890, "epoch": 2627} {"train_loss": -44.656158447265625, "global_step": 317891, "epoch": 2627} {"train_loss": -43.71650695800781, "global_step": 317892, "epoch": 2627} {"train_loss": -43.77433395385742, "global_step": 317893, "epoch": 2627} {"train_loss": -44.4022331237793, "global_step": 317894, "epoch": 2627} {"train_loss": -43.79875183105469, "global_step": 317895, "epoch": 2627} {"train_loss": -44.55757522583008, "global_step": 317896, "epoch": 2627} {"train_loss": -44.31092834472656, "global_step": 317897, "epoch": 2627} {"train_loss": -42.372955322265625, "global_step": 317898, "epoch": 2627} {"train_loss": -44.399471282958984, "global_step": 317899, "epoch": 2627} {"train_loss": -42.95554733276367, "global_step": 317900, "epoch": 2627} {"train_loss": -43.725440979003906, "global_step": 317901, "epoch": 2627} {"train_loss": -42.9713249206543, "global_step": 317902, "epoch": 2627} {"train_loss": -44.24781036376953, "global_step": 317903, "epoch": 2627} {"train_loss": -38.50714111328125, "global_step": 317904, "epoch": 2627} {"train_loss": -43.91786575317383, "global_step": 317905, "epoch": 2627} {"train_loss": -44.08765411376953, "global_step": 317906, "epoch": 2627} {"train_loss": -42.2429313659668, "global_step": 317907, "epoch": 2627} {"train_loss": -42.78236770629883, "global_step": 317908, "epoch": 2627} {"train_loss": -43.0454216003418, "global_step": 317909, "epoch": 2627} {"train_loss": -43.514862060546875, "global_step": 317910, "epoch": 2627} {"train_loss": -43.1533317565918, "global_step": 317911, "epoch": 2627} {"train_loss": -44.177833557128906, "global_step": 317912, "epoch": 2627} {"train_loss": -39.45697021484375, "global_step": 317913, "epoch": 2627} {"train_loss": -43.88731002807617, "global_step": 317914, "epoch": 2627} {"train_loss": -43.474464416503906, "global_step": 317915, "epoch": 2627} {"train_loss": -42.239990234375, "global_step": 317916, "epoch": 2627} {"train_loss": -42.71526336669922, "global_step": 317917, "epoch": 2627} {"train_loss": -43.22015380859375, "global_step": 317918, "epoch": 2627} {"train_loss": -41.52353286743164, "global_step": 317919, "epoch": 2627} {"train_loss": -41.6592903137207, "global_step": 317920, "epoch": 2627} {"train_loss": -44.09292221069336, "global_step": 317921, "epoch": 2627} {"train_loss": -42.76649856567383, "global_step": 317922, "epoch": 2627} {"train_loss": -42.87209701538086, "global_step": 317923, "epoch": 2627} {"train_loss": -43.33649444580078, "global_step": 317924, "epoch": 2627} {"train_loss": -42.14018630981445, "global_step": 317925, "epoch": 2627} {"train_loss": -43.64376449584961, "global_step": 317926, "epoch": 2627} {"train_loss": -41.89021682739258, "global_step": 317927, "epoch": 2627} {"train_loss": -44.13640213012695, "global_step": 317928, "epoch": 2627} {"train_loss": -42.254825592041016, "global_step": 317929, "epoch": 2627} {"train_loss": -42.65484619140625, "global_step": 317930, "epoch": 2627} {"train_loss": -37.2846565246582, "global_step": 317931, "epoch": 2627} {"train_loss": -42.19460678100586, "global_step": 317932, "epoch": 2627} {"train_loss": -43.420101165771484, "global_step": 317933, "epoch": 2627} {"train_loss": -43.8841552734375, "global_step": 317934, "epoch": 2627} {"train_loss": -41.84954833984375, "global_step": 317935, "epoch": 2627} {"train_loss": -43.157161712646484, "global_step": 317936, "epoch": 2627} {"train_loss": -43.33243942260742, "global_step": 317937, "epoch": 2627} {"train_loss": -40.78416442871094, "global_step": 317938, "epoch": 2627} {"train_loss": -44.165382385253906, "global_step": 317939, "epoch": 2627} {"train_loss": -41.56399154663086, "global_step": 317940, "epoch": 2627} {"train_loss": -42.12360382080078, "global_step": 317941, "epoch": 2627} {"train_loss": -42.81153869628906, "global_step": 317942, "epoch": 2627} {"train_loss": -43.63576889038086, "global_step": 317943, "epoch": 2627} {"train_loss": -42.99717330932617, "global_step": 317944, "epoch": 2627} {"train_loss": -43.299381256103516, "global_step": 317945, "epoch": 2627} {"train_loss": -43.39657211303711, "global_step": 317946, "epoch": 2627} {"train_loss": -43.00429153442383, "global_step": 317947, "epoch": 2627} {"train_loss": -42.00165557861328, "global_step": 317948, "epoch": 2627} {"train_loss": -44.01650619506836, "global_step": 317949, "epoch": 2627} {"train_loss": -39.38873291015625, "global_step": 317950, "epoch": 2627} {"train_loss": -42.496788024902344, "global_step": 317951, "epoch": 2627} {"train_loss": -43.54752731323242, "global_step": 317952, "epoch": 2627} {"train_loss": -41.17192840576172, "global_step": 317953, "epoch": 2627} {"train_loss": -42.61530685424805, "global_step": 317954, "epoch": 2627} {"train_loss": -43.30099105834961, "global_step": 317955, "epoch": 2627} {"train_loss": -43.83625030517578, "global_step": 317956, "epoch": 2627} {"train_loss": -44.062355041503906, "global_step": 317957, "epoch": 2627} {"train_loss": -44.27920150756836, "global_step": 317958, "epoch": 2627} {"train_loss": -42.54071807861328, "global_step": 317959, "epoch": 2627} {"train_loss": -44.0046501159668, "global_step": 317960, "epoch": 2627} {"train_loss": -42.139835357666016, "global_step": 317961, "epoch": 2627} {"train_loss": -43.67104721069336, "global_step": 317962, "epoch": 2627} {"train_loss": -43.892677307128906, "global_step": 317963, "epoch": 2627} {"train_loss": -43.42267990112305, "global_step": 317964, "epoch": 2627} {"train_loss": -41.66215896606445, "global_step": 317965, "epoch": 2627} {"train_loss": -44.012916564941406, "global_step": 317966, "epoch": 2627} {"train_loss": -43.63499450683594, "global_step": 317967, "epoch": 2627} {"train_loss": -43.70223617553711, "global_step": 317968, "epoch": 2627} {"train_loss": -40.5297966003418, "global_step": 317969, "epoch": 2627} {"train_loss": -36.468257904052734, "global_step": 317970, "epoch": 2627} {"train_loss": -43.817169189453125, "global_step": 317971, "epoch": 2627} {"train_loss": -43.881690979003906, "global_step": 317972, "epoch": 2627} {"train_loss": -43.8208122253418, "global_step": 317973, "epoch": 2627} {"train_loss": -43.65562057495117, "global_step": 317974, "epoch": 2627} {"train_loss": -44.04304885864258, "global_step": 317975, "epoch": 2627} {"train_loss": -43.10395050048828, "global_step": 317976, "epoch": 2627} {"train_loss": -44.05635070800781, "global_step": 317977, "epoch": 2627} {"train_loss": -43.35309600830078, "global_step": 317978, "epoch": 2627} {"train_loss": -43.283077239990234, "global_step": 317979, "epoch": 2627} {"train_loss": -41.94252014160156, "global_step": 317980, "epoch": 2627} {"train_loss": -43.984039306640625, "global_step": 317981, "epoch": 2627} {"train_loss": -43.350311279296875, "global_step": 317982, "epoch": 2627} {"train_loss": -44.71807098388672, "global_step": 317983, "epoch": 2627} {"train_loss": -44.023590087890625, "global_step": 317984, "epoch": 2627} {"train_loss": -42.67727279663086, "global_step": 317985, "epoch": 2627} {"train_loss": -43.70344161987305, "global_step": 317986, "epoch": 2627} {"train_loss": -43.0319884118955, "global_step": 317987, "epoch": 2627, "val_loss": 2532373.25} {"train_loss": -43.8896598815918, "global_step": 317988, "epoch": 2628} {"train_loss": -44.52663040161133, "global_step": 317989, "epoch": 2628} {"train_loss": -44.8387451171875, "global_step": 317990, "epoch": 2628} {"train_loss": -43.82408142089844, "global_step": 317991, "epoch": 2628} {"train_loss": -44.3109130859375, "global_step": 317992, "epoch": 2628} {"train_loss": -43.71278381347656, "global_step": 317993, "epoch": 2628} {"train_loss": -43.8623161315918, "global_step": 317994, "epoch": 2628} {"train_loss": -43.11782455444336, "global_step": 317995, "epoch": 2628} {"train_loss": -43.972503662109375, "global_step": 317996, "epoch": 2628} {"train_loss": -43.65400314331055, "global_step": 317997, "epoch": 2628} {"train_loss": -41.863216400146484, "global_step": 317998, "epoch": 2628} {"train_loss": -43.66068649291992, "global_step": 317999, "epoch": 2628} {"train_loss": -43.02879333496094, "global_step": 318000, "epoch": 2628} {"train_loss": -42.724693298339844, "global_step": 318001, "epoch": 2628} {"train_loss": -43.78232955932617, "global_step": 318002, "epoch": 2628} {"train_loss": -40.599342346191406, "global_step": 318003, "epoch": 2628} {"train_loss": -39.35991668701172, "global_step": 318004, "epoch": 2628} {"train_loss": -41.952796936035156, "global_step": 318005, "epoch": 2628} {"train_loss": -40.947227478027344, "global_step": 318006, "epoch": 2628} {"train_loss": -42.50868225097656, "global_step": 318007, "epoch": 2628} {"train_loss": -41.06747055053711, "global_step": 318008, "epoch": 2628} {"train_loss": -41.17628479003906, "global_step": 318009, "epoch": 2628} {"train_loss": -42.32049560546875, "global_step": 318010, "epoch": 2628} {"train_loss": -39.76810073852539, "global_step": 318011, "epoch": 2628} {"train_loss": -42.19171905517578, "global_step": 318012, "epoch": 2628} {"train_loss": -42.601619720458984, "global_step": 318013, "epoch": 2628} {"train_loss": -42.61654281616211, "global_step": 318014, "epoch": 2628} {"train_loss": -43.296142578125, "global_step": 318015, "epoch": 2628} {"train_loss": -41.39402389526367, "global_step": 318016, "epoch": 2628} {"train_loss": -43.11397933959961, "global_step": 318017, "epoch": 2628} {"train_loss": -43.01639938354492, "global_step": 318018, "epoch": 2628} {"train_loss": -41.24502182006836, "global_step": 318019, "epoch": 2628} {"train_loss": -42.355674743652344, "global_step": 318020, "epoch": 2628} {"train_loss": -43.33697509765625, "global_step": 318021, "epoch": 2628} {"train_loss": -41.3918342590332, "global_step": 318022, "epoch": 2628} {"train_loss": -40.21693801879883, "global_step": 318023, "epoch": 2628} {"train_loss": -41.67958450317383, "global_step": 318024, "epoch": 2628} {"train_loss": -43.79252243041992, "global_step": 318025, "epoch": 2628} {"train_loss": -42.14339828491211, "global_step": 318026, "epoch": 2628} {"train_loss": -42.4671630859375, "global_step": 318027, "epoch": 2628} {"train_loss": -42.537349700927734, "global_step": 318028, "epoch": 2628} {"train_loss": -42.620697021484375, "global_step": 318029, "epoch": 2628} {"train_loss": -43.28520584106445, "global_step": 318030, "epoch": 2628} {"train_loss": -42.4748420715332, "global_step": 318031, "epoch": 2628} {"train_loss": -42.651363372802734, "global_step": 318032, "epoch": 2628} {"train_loss": -43.4110221862793, "global_step": 318033, "epoch": 2628} {"train_loss": -42.8956413269043, "global_step": 318034, "epoch": 2628} {"train_loss": -43.5212516784668, "global_step": 318035, "epoch": 2628} {"train_loss": -42.536293029785156, "global_step": 318036, "epoch": 2628} {"train_loss": -43.76652145385742, "global_step": 318037, "epoch": 2628} {"train_loss": -43.367340087890625, "global_step": 318038, "epoch": 2628} {"train_loss": -42.98236846923828, "global_step": 318039, "epoch": 2628} {"train_loss": -43.50313949584961, "global_step": 318040, "epoch": 2628} {"train_loss": -43.851863861083984, "global_step": 318041, "epoch": 2628} {"train_loss": -43.80462646484375, "global_step": 318042, "epoch": 2628} {"train_loss": -44.288387298583984, "global_step": 318043, "epoch": 2628} {"train_loss": -44.01458740234375, "global_step": 318044, "epoch": 2628} {"train_loss": -44.21501922607422, "global_step": 318045, "epoch": 2628} {"train_loss": -44.52367401123047, "global_step": 318046, "epoch": 2628} {"train_loss": -44.27317428588867, "global_step": 318047, "epoch": 2628} {"train_loss": -44.16908645629883, "global_step": 318048, "epoch": 2628} {"train_loss": -44.59896469116211, "global_step": 318049, "epoch": 2628} {"train_loss": -43.80005645751953, "global_step": 318050, "epoch": 2628} {"train_loss": -43.6722412109375, "global_step": 318051, "epoch": 2628} {"train_loss": -44.47005081176758, "global_step": 318052, "epoch": 2628} {"train_loss": -44.04986572265625, "global_step": 318053, "epoch": 2628} {"train_loss": -44.408870697021484, "global_step": 318054, "epoch": 2628} {"train_loss": -44.55996322631836, "global_step": 318055, "epoch": 2628} {"train_loss": -44.55939483642578, "global_step": 318056, "epoch": 2628} {"train_loss": -44.17981719970703, "global_step": 318057, "epoch": 2628} {"train_loss": -44.9018669128418, "global_step": 318058, "epoch": 2628} {"train_loss": -43.58320236206055, "global_step": 318059, "epoch": 2628} {"train_loss": -44.685821533203125, "global_step": 318060, "epoch": 2628} {"train_loss": -44.66593551635742, "global_step": 318061, "epoch": 2628} {"train_loss": -44.07038879394531, "global_step": 318062, "epoch": 2628} {"train_loss": -43.13286209106445, "global_step": 318063, "epoch": 2628} {"train_loss": -43.29547119140625, "global_step": 318064, "epoch": 2628} {"train_loss": -43.47393035888672, "global_step": 318065, "epoch": 2628} {"train_loss": -43.89365005493164, "global_step": 318066, "epoch": 2628} {"train_loss": -43.59739685058594, "global_step": 318067, "epoch": 2628} {"train_loss": -44.74107360839844, "global_step": 318068, "epoch": 2628} {"train_loss": -44.03908157348633, "global_step": 318069, "epoch": 2628} {"train_loss": -44.14617919921875, "global_step": 318070, "epoch": 2628} {"train_loss": -44.36307907104492, "global_step": 318071, "epoch": 2628} {"train_loss": -43.92525863647461, "global_step": 318072, "epoch": 2628} {"train_loss": -44.04093933105469, "global_step": 318073, "epoch": 2628} {"train_loss": -44.33258056640625, "global_step": 318074, "epoch": 2628} {"train_loss": -44.15900421142578, "global_step": 318075, "epoch": 2628} {"train_loss": -43.31318283081055, "global_step": 318076, "epoch": 2628} {"train_loss": -44.13058090209961, "global_step": 318077, "epoch": 2628} {"train_loss": -44.1445198059082, "global_step": 318078, "epoch": 2628} {"train_loss": -43.12367630004883, "global_step": 318079, "epoch": 2628} {"train_loss": -43.17177200317383, "global_step": 318080, "epoch": 2628} {"train_loss": -43.4535026550293, "global_step": 318081, "epoch": 2628} {"train_loss": -43.02229309082031, "global_step": 318082, "epoch": 2628} {"train_loss": -43.93464279174805, "global_step": 318083, "epoch": 2628} {"train_loss": -43.39213180541992, "global_step": 318084, "epoch": 2628} {"train_loss": -41.703548431396484, "global_step": 318085, "epoch": 2628} {"train_loss": -41.21442794799805, "global_step": 318086, "epoch": 2628} {"train_loss": -41.745452880859375, "global_step": 318087, "epoch": 2628} {"train_loss": -41.824134826660156, "global_step": 318088, "epoch": 2628} {"train_loss": -42.54275131225586, "global_step": 318089, "epoch": 2628} {"train_loss": -43.94082260131836, "global_step": 318090, "epoch": 2628} {"train_loss": -44.44929122924805, "global_step": 318091, "epoch": 2628} {"train_loss": -43.677528381347656, "global_step": 318092, "epoch": 2628} {"train_loss": -44.06681442260742, "global_step": 318093, "epoch": 2628} {"train_loss": -44.52102279663086, "global_step": 318094, "epoch": 2628} {"train_loss": -42.88908386230469, "global_step": 318095, "epoch": 2628} {"train_loss": -42.47220993041992, "global_step": 318096, "epoch": 2628} {"train_loss": -44.00316619873047, "global_step": 318097, "epoch": 2628} {"train_loss": -43.725521087646484, "global_step": 318098, "epoch": 2628} {"train_loss": -42.49467086791992, "global_step": 318099, "epoch": 2628} {"train_loss": -42.95061492919922, "global_step": 318100, "epoch": 2628} {"train_loss": -43.60618591308594, "global_step": 318101, "epoch": 2628} {"train_loss": -41.82665252685547, "global_step": 318102, "epoch": 2628} {"train_loss": -42.85137939453125, "global_step": 318103, "epoch": 2628} {"train_loss": -42.69512176513672, "global_step": 318104, "epoch": 2628} {"train_loss": -42.710262298583984, "global_step": 318105, "epoch": 2628} {"train_loss": -44.33937454223633, "global_step": 318106, "epoch": 2628} {"train_loss": -44.305599212646484, "global_step": 318107, "epoch": 2628} {"train_loss": -43.22411176192859, "global_step": 318108, "epoch": 2628, "val_loss": 2741362.75} {"train_loss": -43.5464973449707, "global_step": 318109, "epoch": 2629} {"train_loss": -44.06754684448242, "global_step": 318110, "epoch": 2629} {"train_loss": -43.295494079589844, "global_step": 318111, "epoch": 2629} {"train_loss": -43.924407958984375, "global_step": 318112, "epoch": 2629} {"train_loss": -42.2921142578125, "global_step": 318113, "epoch": 2629} {"train_loss": -41.7088737487793, "global_step": 318114, "epoch": 2629} {"train_loss": -42.9399528503418, "global_step": 318115, "epoch": 2629} {"train_loss": -43.72209167480469, "global_step": 318116, "epoch": 2629} {"train_loss": -42.44519805908203, "global_step": 318117, "epoch": 2629} {"train_loss": -43.05332565307617, "global_step": 318118, "epoch": 2629} {"train_loss": -43.25084686279297, "global_step": 318119, "epoch": 2629} {"train_loss": -43.3333625793457, "global_step": 318120, "epoch": 2629} {"train_loss": -43.83246612548828, "global_step": 318121, "epoch": 2629} {"train_loss": -42.81748962402344, "global_step": 318122, "epoch": 2629} {"train_loss": -43.81997299194336, "global_step": 318123, "epoch": 2629} {"train_loss": -41.639705657958984, "global_step": 318124, "epoch": 2629} {"train_loss": -43.041439056396484, "global_step": 318125, "epoch": 2629} {"train_loss": -42.184417724609375, "global_step": 318126, "epoch": 2629} {"train_loss": -42.96931457519531, "global_step": 318127, "epoch": 2629} {"train_loss": -43.40071487426758, "global_step": 318128, "epoch": 2629} {"train_loss": -43.47637176513672, "global_step": 318129, "epoch": 2629} {"train_loss": -43.120941162109375, "global_step": 318130, "epoch": 2629} {"train_loss": -43.259090423583984, "global_step": 318131, "epoch": 2629} {"train_loss": -43.18866729736328, "global_step": 318132, "epoch": 2629} {"train_loss": -43.65530014038086, "global_step": 318133, "epoch": 2629} {"train_loss": -43.626888275146484, "global_step": 318134, "epoch": 2629} {"train_loss": -44.311397552490234, "global_step": 318135, "epoch": 2629} {"train_loss": -43.84660720825195, "global_step": 318136, "epoch": 2629} {"train_loss": -43.55964279174805, "global_step": 318137, "epoch": 2629} {"train_loss": -43.520225524902344, "global_step": 318138, "epoch": 2629} {"train_loss": -43.96145248413086, "global_step": 318139, "epoch": 2629} {"train_loss": -44.04767990112305, "global_step": 318140, "epoch": 2629} {"train_loss": -43.73917770385742, "global_step": 318141, "epoch": 2629} {"train_loss": -44.18020248413086, "global_step": 318142, "epoch": 2629} {"train_loss": -44.167667388916016, "global_step": 318143, "epoch": 2629} {"train_loss": -44.05177688598633, "global_step": 318144, "epoch": 2629} {"train_loss": -43.9818115234375, "global_step": 318145, "epoch": 2629} {"train_loss": -43.40135955810547, "global_step": 318146, "epoch": 2629} {"train_loss": -44.81847381591797, "global_step": 318147, "epoch": 2629} {"train_loss": -44.298004150390625, "global_step": 318148, "epoch": 2629} {"train_loss": -44.43424606323242, "global_step": 318149, "epoch": 2629} {"train_loss": -43.99995803833008, "global_step": 318150, "epoch": 2629} {"train_loss": -43.25672149658203, "global_step": 318151, "epoch": 2629} {"train_loss": -44.6290168762207, "global_step": 318152, "epoch": 2629} {"train_loss": -43.253150939941406, "global_step": 318153, "epoch": 2629} {"train_loss": -43.55930709838867, "global_step": 318154, "epoch": 2629} {"train_loss": -44.36530303955078, "global_step": 318155, "epoch": 2629} {"train_loss": -43.65924072265625, "global_step": 318156, "epoch": 2629} {"train_loss": -44.13826370239258, "global_step": 318157, "epoch": 2629} {"train_loss": -43.14606857299805, "global_step": 318158, "epoch": 2629} {"train_loss": -43.93389892578125, "global_step": 318159, "epoch": 2629} {"train_loss": -44.014381408691406, "global_step": 318160, "epoch": 2629} {"train_loss": -44.06113815307617, "global_step": 318161, "epoch": 2629} {"train_loss": -43.15867233276367, "global_step": 318162, "epoch": 2629} {"train_loss": -43.02231979370117, "global_step": 318163, "epoch": 2629} {"train_loss": -44.605804443359375, "global_step": 318164, "epoch": 2629} {"train_loss": -42.943328857421875, "global_step": 318165, "epoch": 2629} {"train_loss": -42.219356536865234, "global_step": 318166, "epoch": 2629} {"train_loss": -41.21295928955078, "global_step": 318167, "epoch": 2629} {"train_loss": -41.472267150878906, "global_step": 318168, "epoch": 2629} {"train_loss": -41.584815979003906, "global_step": 318169, "epoch": 2629} {"train_loss": -43.359981536865234, "global_step": 318170, "epoch": 2629} {"train_loss": -41.632686614990234, "global_step": 318171, "epoch": 2629} {"train_loss": -40.762447357177734, "global_step": 318172, "epoch": 2629} {"train_loss": -41.99807357788086, "global_step": 318173, "epoch": 2629} {"train_loss": -43.13718795776367, "global_step": 318174, "epoch": 2629} {"train_loss": -42.483802795410156, "global_step": 318175, "epoch": 2629} {"train_loss": -43.21857833862305, "global_step": 318176, "epoch": 2629} {"train_loss": -42.98635482788086, "global_step": 318177, "epoch": 2629} {"train_loss": -42.72021484375, "global_step": 318178, "epoch": 2629} {"train_loss": -43.11211013793945, "global_step": 318179, "epoch": 2629} {"train_loss": -43.48002243041992, "global_step": 318180, "epoch": 2629} {"train_loss": -44.113250732421875, "global_step": 318181, "epoch": 2629} {"train_loss": -43.81551742553711, "global_step": 318182, "epoch": 2629} {"train_loss": -44.273895263671875, "global_step": 318183, "epoch": 2629} {"train_loss": -43.98342514038086, "global_step": 318184, "epoch": 2629} {"train_loss": -44.33790588378906, "global_step": 318185, "epoch": 2629} {"train_loss": -43.294349670410156, "global_step": 318186, "epoch": 2629} {"train_loss": -44.289405822753906, "global_step": 318187, "epoch": 2629} {"train_loss": -43.842803955078125, "global_step": 318188, "epoch": 2629} {"train_loss": -43.78011703491211, "global_step": 318189, "epoch": 2629} {"train_loss": -44.473567962646484, "global_step": 318190, "epoch": 2629} {"train_loss": -43.76877975463867, "global_step": 318191, "epoch": 2629} {"train_loss": -44.631778717041016, "global_step": 318192, "epoch": 2629} {"train_loss": -44.243839263916016, "global_step": 318193, "epoch": 2629} {"train_loss": -43.87959671020508, "global_step": 318194, "epoch": 2629} {"train_loss": -44.76223373413086, "global_step": 318195, "epoch": 2629} {"train_loss": -44.27825927734375, "global_step": 318196, "epoch": 2629} {"train_loss": -44.6432991027832, "global_step": 318197, "epoch": 2629} {"train_loss": -44.3474006652832, "global_step": 318198, "epoch": 2629} {"train_loss": -44.650299072265625, "global_step": 318199, "epoch": 2629} {"train_loss": -44.986663818359375, "global_step": 318200, "epoch": 2629} {"train_loss": -43.666133880615234, "global_step": 318201, "epoch": 2629} {"train_loss": -44.06201934814453, "global_step": 318202, "epoch": 2629} {"train_loss": -44.8864860534668, "global_step": 318203, "epoch": 2629} {"train_loss": -43.90787124633789, "global_step": 318204, "epoch": 2629} {"train_loss": -44.12006759643555, "global_step": 318205, "epoch": 2629} {"train_loss": -44.52667236328125, "global_step": 318206, "epoch": 2629} {"train_loss": -44.55314254760742, "global_step": 318207, "epoch": 2629} {"train_loss": -43.95334243774414, "global_step": 318208, "epoch": 2629} {"train_loss": -44.63160705566406, "global_step": 318209, "epoch": 2629} {"train_loss": -44.017555236816406, "global_step": 318210, "epoch": 2629} {"train_loss": -44.218196868896484, "global_step": 318211, "epoch": 2629} {"train_loss": -44.18276596069336, "global_step": 318212, "epoch": 2629} {"train_loss": -44.26740646362305, "global_step": 318213, "epoch": 2629} {"train_loss": -44.8572998046875, "global_step": 318214, "epoch": 2629} {"train_loss": -43.47682571411133, "global_step": 318215, "epoch": 2629} {"train_loss": -44.34674835205078, "global_step": 318216, "epoch": 2629} {"train_loss": -43.47999954223633, "global_step": 318217, "epoch": 2629} {"train_loss": -43.71474838256836, "global_step": 318218, "epoch": 2629} {"train_loss": -43.27180862426758, "global_step": 318219, "epoch": 2629} {"train_loss": -43.37967300415039, "global_step": 318220, "epoch": 2629} {"train_loss": -43.885475158691406, "global_step": 318221, "epoch": 2629} {"train_loss": -42.94095993041992, "global_step": 318222, "epoch": 2629} {"train_loss": -40.58980941772461, "global_step": 318223, "epoch": 2629} {"train_loss": -42.27012252807617, "global_step": 318224, "epoch": 2629} {"train_loss": -43.71166229248047, "global_step": 318225, "epoch": 2629} {"train_loss": -42.03586959838867, "global_step": 318226, "epoch": 2629} {"train_loss": -40.730995178222656, "global_step": 318227, "epoch": 2629} {"train_loss": -43.31370544433594, "global_step": 318228, "epoch": 2629} {"train_loss": -43.52251960817448, "global_step": 318229, "epoch": 2629, "val_loss": 2653892.25} {"train_loss": -42.17906188964844, "global_step": 318230, "epoch": 2630} {"train_loss": -44.20918655395508, "global_step": 318231, "epoch": 2630} {"train_loss": -43.20894241333008, "global_step": 318232, "epoch": 2630} {"train_loss": -42.96881866455078, "global_step": 318233, "epoch": 2630} {"train_loss": -45.33433532714844, "global_step": 318234, "epoch": 2630} {"train_loss": -42.67292404174805, "global_step": 318235, "epoch": 2630} {"train_loss": -44.14059829711914, "global_step": 318236, "epoch": 2630} {"train_loss": -42.480751037597656, "global_step": 318237, "epoch": 2630} {"train_loss": -40.85877227783203, "global_step": 318238, "epoch": 2630} {"train_loss": -43.634517669677734, "global_step": 318239, "epoch": 2630} {"train_loss": -43.78969955444336, "global_step": 318240, "epoch": 2630} {"train_loss": -42.149574279785156, "global_step": 318241, "epoch": 2630} {"train_loss": -43.492279052734375, "global_step": 318242, "epoch": 2630} {"train_loss": -42.086002349853516, "global_step": 318243, "epoch": 2630} {"train_loss": -43.42265701293945, "global_step": 318244, "epoch": 2630} {"train_loss": -44.08526611328125, "global_step": 318245, "epoch": 2630} {"train_loss": -42.7717399597168, "global_step": 318246, "epoch": 2630} {"train_loss": -41.99897766113281, "global_step": 318247, "epoch": 2630} {"train_loss": -43.872352600097656, "global_step": 318248, "epoch": 2630} {"train_loss": -43.05161666870117, "global_step": 318249, "epoch": 2630} {"train_loss": -43.69985580444336, "global_step": 318250, "epoch": 2630} {"train_loss": -42.94260787963867, "global_step": 318251, "epoch": 2630} {"train_loss": -43.55366134643555, "global_step": 318252, "epoch": 2630} {"train_loss": -44.72333908081055, "global_step": 318253, "epoch": 2630} {"train_loss": -43.2843017578125, "global_step": 318254, "epoch": 2630} {"train_loss": -43.25032424926758, "global_step": 318255, "epoch": 2630} {"train_loss": -42.42208480834961, "global_step": 318256, "epoch": 2630} {"train_loss": -43.76642990112305, "global_step": 318257, "epoch": 2630} {"train_loss": -43.82445526123047, "global_step": 318258, "epoch": 2630} {"train_loss": -42.7825927734375, "global_step": 318259, "epoch": 2630} {"train_loss": -43.706787109375, "global_step": 318260, "epoch": 2630} {"train_loss": -43.66895294189453, "global_step": 318261, "epoch": 2630} {"train_loss": -41.721038818359375, "global_step": 318262, "epoch": 2630} {"train_loss": -41.04392623901367, "global_step": 318263, "epoch": 2630} {"train_loss": -44.24781799316406, "global_step": 318264, "epoch": 2630} {"train_loss": -41.663734436035156, "global_step": 318265, "epoch": 2630} {"train_loss": -41.3520622253418, "global_step": 318266, "epoch": 2630} {"train_loss": -44.30776596069336, "global_step": 318267, "epoch": 2630} {"train_loss": -41.907772064208984, "global_step": 318268, "epoch": 2630} {"train_loss": -42.4632453918457, "global_step": 318269, "epoch": 2630} {"train_loss": -42.82546615600586, "global_step": 318270, "epoch": 2630} {"train_loss": -43.11328125, "global_step": 318271, "epoch": 2630} {"train_loss": -42.842037200927734, "global_step": 318272, "epoch": 2630} {"train_loss": -43.588829040527344, "global_step": 318273, "epoch": 2630} {"train_loss": -42.75723648071289, "global_step": 318274, "epoch": 2630} {"train_loss": -43.2534065246582, "global_step": 318275, "epoch": 2630} {"train_loss": -43.515045166015625, "global_step": 318276, "epoch": 2630} {"train_loss": -42.80561447143555, "global_step": 318277, "epoch": 2630} {"train_loss": -43.209503173828125, "global_step": 318278, "epoch": 2630} {"train_loss": -43.702171325683594, "global_step": 318279, "epoch": 2630} {"train_loss": -42.0134391784668, "global_step": 318280, "epoch": 2630} {"train_loss": -43.64394760131836, "global_step": 318281, "epoch": 2630} {"train_loss": -43.76160430908203, "global_step": 318282, "epoch": 2630} {"train_loss": -41.57154846191406, "global_step": 318283, "epoch": 2630} {"train_loss": -43.54207992553711, "global_step": 318284, "epoch": 2630} {"train_loss": -44.10484313964844, "global_step": 318285, "epoch": 2630} {"train_loss": -42.898048400878906, "global_step": 318286, "epoch": 2630} {"train_loss": -44.48293685913086, "global_step": 318287, "epoch": 2630} {"train_loss": -44.542335510253906, "global_step": 318288, "epoch": 2630} {"train_loss": -44.08949279785156, "global_step": 318289, "epoch": 2630} {"train_loss": -44.26015090942383, "global_step": 318290, "epoch": 2630} {"train_loss": -44.60942459106445, "global_step": 318291, "epoch": 2630} {"train_loss": -44.087432861328125, "global_step": 318292, "epoch": 2630} {"train_loss": -44.14203643798828, "global_step": 318293, "epoch": 2630} {"train_loss": -44.16363525390625, "global_step": 318294, "epoch": 2630} {"train_loss": -44.3379020690918, "global_step": 318295, "epoch": 2630} {"train_loss": -43.88617706298828, "global_step": 318296, "epoch": 2630} {"train_loss": -44.38325119018555, "global_step": 318297, "epoch": 2630} {"train_loss": -44.3714485168457, "global_step": 318298, "epoch": 2630} {"train_loss": -44.51801681518555, "global_step": 318299, "epoch": 2630} {"train_loss": -44.34039306640625, "global_step": 318300, "epoch": 2630} {"train_loss": -44.51543045043945, "global_step": 318301, "epoch": 2630} {"train_loss": -44.70858383178711, "global_step": 318302, "epoch": 2630} {"train_loss": -44.328758239746094, "global_step": 318303, "epoch": 2630} {"train_loss": -44.38984298706055, "global_step": 318304, "epoch": 2630} {"train_loss": -44.6897087097168, "global_step": 318305, "epoch": 2630} {"train_loss": -45.1421012878418, "global_step": 318306, "epoch": 2630} {"train_loss": -44.06336212158203, "global_step": 318307, "epoch": 2630} {"train_loss": -44.77832794189453, "global_step": 318308, "epoch": 2630} {"train_loss": -44.49419021606445, "global_step": 318309, "epoch": 2630} {"train_loss": -44.133419036865234, "global_step": 318310, "epoch": 2630} {"train_loss": -44.95954895019531, "global_step": 318311, "epoch": 2630} {"train_loss": -44.61946105957031, "global_step": 318312, "epoch": 2630} {"train_loss": -44.75517654418945, "global_step": 318313, "epoch": 2630} {"train_loss": -45.20186996459961, "global_step": 318314, "epoch": 2630} {"train_loss": -44.36886978149414, "global_step": 318315, "epoch": 2630} {"train_loss": -43.64718246459961, "global_step": 318316, "epoch": 2630} {"train_loss": -44.86180877685547, "global_step": 318317, "epoch": 2630} {"train_loss": -44.3714599609375, "global_step": 318318, "epoch": 2630} {"train_loss": -43.505279541015625, "global_step": 318319, "epoch": 2630} {"train_loss": -44.67950439453125, "global_step": 318320, "epoch": 2630} {"train_loss": -43.63174057006836, "global_step": 318321, "epoch": 2630} {"train_loss": -43.19365310668945, "global_step": 318322, "epoch": 2630} {"train_loss": -44.24072265625, "global_step": 318323, "epoch": 2630} {"train_loss": -42.56539535522461, "global_step": 318324, "epoch": 2630} {"train_loss": -44.09566879272461, "global_step": 318325, "epoch": 2630} {"train_loss": -44.025142669677734, "global_step": 318326, "epoch": 2630} {"train_loss": -43.133419036865234, "global_step": 318327, "epoch": 2630} {"train_loss": -43.02739334106445, "global_step": 318328, "epoch": 2630} {"train_loss": -43.86153793334961, "global_step": 318329, "epoch": 2630} {"train_loss": -43.778079986572266, "global_step": 318330, "epoch": 2630} {"train_loss": -43.220619201660156, "global_step": 318331, "epoch": 2630} {"train_loss": -43.77949142456055, "global_step": 318332, "epoch": 2630} {"train_loss": -43.4851188659668, "global_step": 318333, "epoch": 2630} {"train_loss": -44.58512496948242, "global_step": 318334, "epoch": 2630} {"train_loss": -44.735355377197266, "global_step": 318335, "epoch": 2630} {"train_loss": -43.75973129272461, "global_step": 318336, "epoch": 2630} {"train_loss": -43.8692741394043, "global_step": 318337, "epoch": 2630} {"train_loss": -44.38230514526367, "global_step": 318338, "epoch": 2630} {"train_loss": -44.00679016113281, "global_step": 318339, "epoch": 2630} {"train_loss": -44.62749099731445, "global_step": 318340, "epoch": 2630} {"train_loss": -44.40748977661133, "global_step": 318341, "epoch": 2630} {"train_loss": -44.7773323059082, "global_step": 318342, "epoch": 2630} {"train_loss": -43.8961181640625, "global_step": 318343, "epoch": 2630} {"train_loss": -44.73460006713867, "global_step": 318344, "epoch": 2630} {"train_loss": -44.266029357910156, "global_step": 318345, "epoch": 2630} {"train_loss": -43.1141242980957, "global_step": 318346, "epoch": 2630} {"train_loss": -43.869850158691406, "global_step": 318347, "epoch": 2630} {"train_loss": -44.66044998168945, "global_step": 318348, "epoch": 2630} {"train_loss": -44.01522445678711, "global_step": 318349, "epoch": 2630} {"train_loss": -43.65917382358519, "global_step": 318350, "epoch": 2630, "val_loss": 2737534.0} {"train_loss": -43.224273681640625, "global_step": 318351, "epoch": 2631} {"train_loss": -44.49899673461914, "global_step": 318352, "epoch": 2631} {"train_loss": -44.477928161621094, "global_step": 318353, "epoch": 2631} {"train_loss": -43.493194580078125, "global_step": 318354, "epoch": 2631} {"train_loss": -44.11173629760742, "global_step": 318355, "epoch": 2631} {"train_loss": -44.968788146972656, "global_step": 318356, "epoch": 2631} {"train_loss": -43.5436897277832, "global_step": 318357, "epoch": 2631} {"train_loss": -41.80974197387695, "global_step": 318358, "epoch": 2631} {"train_loss": -43.12199401855469, "global_step": 318359, "epoch": 2631} {"train_loss": -43.64785385131836, "global_step": 318360, "epoch": 2631} {"train_loss": -41.688636779785156, "global_step": 318361, "epoch": 2631} {"train_loss": -43.84406280517578, "global_step": 318362, "epoch": 2631} {"train_loss": -43.64122009277344, "global_step": 318363, "epoch": 2631} {"train_loss": -42.87799072265625, "global_step": 318364, "epoch": 2631} {"train_loss": -41.66081619262695, "global_step": 318365, "epoch": 2631} {"train_loss": -43.8471565246582, "global_step": 318366, "epoch": 2631} {"train_loss": -43.80256271362305, "global_step": 318367, "epoch": 2631} {"train_loss": -42.832664489746094, "global_step": 318368, "epoch": 2631} {"train_loss": -44.02582550048828, "global_step": 318369, "epoch": 2631} {"train_loss": -44.59021759033203, "global_step": 318370, "epoch": 2631} {"train_loss": -44.49568557739258, "global_step": 318371, "epoch": 2631} {"train_loss": -44.72562789916992, "global_step": 318372, "epoch": 2631} {"train_loss": -43.24504852294922, "global_step": 318373, "epoch": 2631} {"train_loss": -44.64683151245117, "global_step": 318374, "epoch": 2631} {"train_loss": -44.4720573425293, "global_step": 318375, "epoch": 2631} {"train_loss": -42.316097259521484, "global_step": 318376, "epoch": 2631} {"train_loss": -44.439491271972656, "global_step": 318377, "epoch": 2631} {"train_loss": -44.24934768676758, "global_step": 318378, "epoch": 2631} {"train_loss": -43.92866134643555, "global_step": 318379, "epoch": 2631} {"train_loss": -44.613407135009766, "global_step": 318380, "epoch": 2631} {"train_loss": -44.33937454223633, "global_step": 318381, "epoch": 2631} {"train_loss": -43.44321060180664, "global_step": 318382, "epoch": 2631} {"train_loss": -44.1671257019043, "global_step": 318383, "epoch": 2631} {"train_loss": -43.908992767333984, "global_step": 318384, "epoch": 2631} {"train_loss": -44.69894027709961, "global_step": 318385, "epoch": 2631} {"train_loss": -43.672847747802734, "global_step": 318386, "epoch": 2631} {"train_loss": -43.56162643432617, "global_step": 318387, "epoch": 2631} {"train_loss": -44.012184143066406, "global_step": 318388, "epoch": 2631} {"train_loss": -44.16044616699219, "global_step": 318389, "epoch": 2631} {"train_loss": -43.5133171081543, "global_step": 318390, "epoch": 2631} {"train_loss": -43.493080139160156, "global_step": 318391, "epoch": 2631} {"train_loss": -44.269287109375, "global_step": 318392, "epoch": 2631} {"train_loss": -44.442909240722656, "global_step": 318393, "epoch": 2631} {"train_loss": -44.14925003051758, "global_step": 318394, "epoch": 2631} {"train_loss": -44.49359130859375, "global_step": 318395, "epoch": 2631} {"train_loss": -44.09849166870117, "global_step": 318396, "epoch": 2631} {"train_loss": -43.934688568115234, "global_step": 318397, "epoch": 2631} {"train_loss": -44.29742431640625, "global_step": 318398, "epoch": 2631} {"train_loss": -44.4157600402832, "global_step": 318399, "epoch": 2631} {"train_loss": -44.01091003417969, "global_step": 318400, "epoch": 2631} {"train_loss": -44.42950439453125, "global_step": 318401, "epoch": 2631} {"train_loss": -44.528690338134766, "global_step": 318402, "epoch": 2631} {"train_loss": -44.209877014160156, "global_step": 318403, "epoch": 2631} {"train_loss": -44.167457580566406, "global_step": 318404, "epoch": 2631} {"train_loss": -43.93378448486328, "global_step": 318405, "epoch": 2631} {"train_loss": -44.5297966003418, "global_step": 318406, "epoch": 2631} {"train_loss": -44.09141540527344, "global_step": 318407, "epoch": 2631} {"train_loss": -44.768707275390625, "global_step": 318408, "epoch": 2631} {"train_loss": -44.502681732177734, "global_step": 318409, "epoch": 2631} {"train_loss": -44.3209342956543, "global_step": 318410, "epoch": 2631} {"train_loss": -44.342323303222656, "global_step": 318411, "epoch": 2631} {"train_loss": -44.36159896850586, "global_step": 318412, "epoch": 2631} {"train_loss": -44.40948486328125, "global_step": 318413, "epoch": 2631} {"train_loss": -44.12804412841797, "global_step": 318414, "epoch": 2631} {"train_loss": -44.943111419677734, "global_step": 318415, "epoch": 2631} {"train_loss": -44.626808166503906, "global_step": 318416, "epoch": 2631} {"train_loss": -44.87097930908203, "global_step": 318417, "epoch": 2631} {"train_loss": -44.791465759277344, "global_step": 318418, "epoch": 2631} {"train_loss": -44.38845443725586, "global_step": 318419, "epoch": 2631} {"train_loss": -43.993343353271484, "global_step": 318420, "epoch": 2631} {"train_loss": -44.45101547241211, "global_step": 318421, "epoch": 2631} {"train_loss": -44.334163665771484, "global_step": 318422, "epoch": 2631} {"train_loss": -43.426448822021484, "global_step": 318423, "epoch": 2631} {"train_loss": -42.831356048583984, "global_step": 318424, "epoch": 2631} {"train_loss": -44.281639099121094, "global_step": 318425, "epoch": 2631} {"train_loss": -43.97787094116211, "global_step": 318426, "epoch": 2631} {"train_loss": -43.567989349365234, "global_step": 318427, "epoch": 2631} {"train_loss": -43.74180221557617, "global_step": 318428, "epoch": 2631} {"train_loss": -44.22661590576172, "global_step": 318429, "epoch": 2631} {"train_loss": -43.769203186035156, "global_step": 318430, "epoch": 2631} {"train_loss": -44.23821258544922, "global_step": 318431, "epoch": 2631} {"train_loss": -43.82467269897461, "global_step": 318432, "epoch": 2631} {"train_loss": -44.0645637512207, "global_step": 318433, "epoch": 2631} {"train_loss": -44.297340393066406, "global_step": 318434, "epoch": 2631} {"train_loss": -43.98959732055664, "global_step": 318435, "epoch": 2631} {"train_loss": -43.554569244384766, "global_step": 318436, "epoch": 2631} {"train_loss": -44.18134689331055, "global_step": 318437, "epoch": 2631} {"train_loss": -44.62346267700195, "global_step": 318438, "epoch": 2631} {"train_loss": -42.79039764404297, "global_step": 318439, "epoch": 2631} {"train_loss": -43.02458953857422, "global_step": 318440, "epoch": 2631} {"train_loss": -44.06663131713867, "global_step": 318441, "epoch": 2631} {"train_loss": -44.68540573120117, "global_step": 318442, "epoch": 2631} {"train_loss": -44.032588958740234, "global_step": 318443, "epoch": 2631} {"train_loss": -44.54841613769531, "global_step": 318444, "epoch": 2631} {"train_loss": -43.600250244140625, "global_step": 318445, "epoch": 2631} {"train_loss": -44.25010299682617, "global_step": 318446, "epoch": 2631} {"train_loss": -44.74186325073242, "global_step": 318447, "epoch": 2631} {"train_loss": -44.53268051147461, "global_step": 318448, "epoch": 2631} {"train_loss": -44.38131332397461, "global_step": 318449, "epoch": 2631} {"train_loss": -44.4591178894043, "global_step": 318450, "epoch": 2631} {"train_loss": -44.782012939453125, "global_step": 318451, "epoch": 2631} {"train_loss": -44.5758171081543, "global_step": 318452, "epoch": 2631} {"train_loss": -43.764312744140625, "global_step": 318453, "epoch": 2631} {"train_loss": -43.709693908691406, "global_step": 318454, "epoch": 2631} {"train_loss": -44.321163177490234, "global_step": 318455, "epoch": 2631} {"train_loss": -44.4311637878418, "global_step": 318456, "epoch": 2631} {"train_loss": -43.72625732421875, "global_step": 318457, "epoch": 2631} {"train_loss": -44.177947998046875, "global_step": 318458, "epoch": 2631} {"train_loss": -39.799007415771484, "global_step": 318459, "epoch": 2631} {"train_loss": -40.07033920288086, "global_step": 318460, "epoch": 2631} {"train_loss": -41.861812591552734, "global_step": 318461, "epoch": 2631} {"train_loss": -43.83218002319336, "global_step": 318462, "epoch": 2631} {"train_loss": -40.898983001708984, "global_step": 318463, "epoch": 2631} {"train_loss": -44.2170524597168, "global_step": 318464, "epoch": 2631} {"train_loss": -39.369049072265625, "global_step": 318465, "epoch": 2631} {"train_loss": -43.73630142211914, "global_step": 318466, "epoch": 2631} {"train_loss": -40.19151306152344, "global_step": 318467, "epoch": 2631} {"train_loss": -42.314361572265625, "global_step": 318468, "epoch": 2631} {"train_loss": -42.726009368896484, "global_step": 318469, "epoch": 2631} {"train_loss": -43.09959411621094, "global_step": 318470, "epoch": 2631} {"train_loss": -43.79401605779474, "global_step": 318471, "epoch": 2631, "val_loss": 2708095.75} {"train_loss": -41.07639694213867, "global_step": 318472, "epoch": 2632} {"train_loss": -42.6492919921875, "global_step": 318473, "epoch": 2632} {"train_loss": -43.755836486816406, "global_step": 318474, "epoch": 2632} {"train_loss": -43.43811798095703, "global_step": 318475, "epoch": 2632} {"train_loss": -43.108985900878906, "global_step": 318476, "epoch": 2632} {"train_loss": -42.76277160644531, "global_step": 318477, "epoch": 2632} {"train_loss": -43.345821380615234, "global_step": 318478, "epoch": 2632} {"train_loss": -43.45505905151367, "global_step": 318479, "epoch": 2632} {"train_loss": -41.95160675048828, "global_step": 318480, "epoch": 2632} {"train_loss": -43.2498893737793, "global_step": 318481, "epoch": 2632} {"train_loss": -43.264461517333984, "global_step": 318482, "epoch": 2632} {"train_loss": -43.75312423706055, "global_step": 318483, "epoch": 2632} {"train_loss": -42.65765380859375, "global_step": 318484, "epoch": 2632} {"train_loss": -43.58407974243164, "global_step": 318485, "epoch": 2632} {"train_loss": -43.903690338134766, "global_step": 318486, "epoch": 2632} {"train_loss": -43.6244010925293, "global_step": 318487, "epoch": 2632} {"train_loss": -42.67827224731445, "global_step": 318488, "epoch": 2632} {"train_loss": -43.268287658691406, "global_step": 318489, "epoch": 2632} {"train_loss": -44.030311584472656, "global_step": 318490, "epoch": 2632} {"train_loss": -43.80686569213867, "global_step": 318491, "epoch": 2632} {"train_loss": -43.35437774658203, "global_step": 318492, "epoch": 2632} {"train_loss": -43.47684860229492, "global_step": 318493, "epoch": 2632} {"train_loss": -43.993709564208984, "global_step": 318494, "epoch": 2632} {"train_loss": -43.7537956237793, "global_step": 318495, "epoch": 2632} {"train_loss": -43.44887161254883, "global_step": 318496, "epoch": 2632} {"train_loss": -42.10905838012695, "global_step": 318497, "epoch": 2632} {"train_loss": -44.06372833251953, "global_step": 318498, "epoch": 2632} {"train_loss": -42.77779006958008, "global_step": 318499, "epoch": 2632} {"train_loss": -43.5424919128418, "global_step": 318500, "epoch": 2632} {"train_loss": -44.35390853881836, "global_step": 318501, "epoch": 2632} {"train_loss": -43.20148849487305, "global_step": 318502, "epoch": 2632} {"train_loss": -43.86221694946289, "global_step": 318503, "epoch": 2632} {"train_loss": -44.329429626464844, "global_step": 318504, "epoch": 2632} {"train_loss": -43.537899017333984, "global_step": 318505, "epoch": 2632} {"train_loss": -44.41215133666992, "global_step": 318506, "epoch": 2632} {"train_loss": -43.63114547729492, "global_step": 318507, "epoch": 2632} {"train_loss": -43.82035446166992, "global_step": 318508, "epoch": 2632} {"train_loss": -44.571815490722656, "global_step": 318509, "epoch": 2632} {"train_loss": -44.2084846496582, "global_step": 318510, "epoch": 2632} {"train_loss": -44.032325744628906, "global_step": 318511, "epoch": 2632} {"train_loss": -44.039283752441406, "global_step": 318512, "epoch": 2632} {"train_loss": -43.48147964477539, "global_step": 318513, "epoch": 2632} {"train_loss": -43.976112365722656, "global_step": 318514, "epoch": 2632} {"train_loss": -44.14231872558594, "global_step": 318515, "epoch": 2632} {"train_loss": -44.2486686706543, "global_step": 318516, "epoch": 2632} {"train_loss": -44.51375961303711, "global_step": 318517, "epoch": 2632} {"train_loss": -44.254730224609375, "global_step": 318518, "epoch": 2632} {"train_loss": -44.36838912963867, "global_step": 318519, "epoch": 2632} {"train_loss": -44.8485221862793, "global_step": 318520, "epoch": 2632} {"train_loss": -44.84412384033203, "global_step": 318521, "epoch": 2632} {"train_loss": -44.599403381347656, "global_step": 318522, "epoch": 2632} {"train_loss": -44.76111602783203, "global_step": 318523, "epoch": 2632} {"train_loss": -44.558837890625, "global_step": 318524, "epoch": 2632} {"train_loss": -43.56148910522461, "global_step": 318525, "epoch": 2632} {"train_loss": -45.119144439697266, "global_step": 318526, "epoch": 2632} {"train_loss": -44.24800491333008, "global_step": 318527, "epoch": 2632} {"train_loss": -43.597225189208984, "global_step": 318528, "epoch": 2632} {"train_loss": -44.33000564575195, "global_step": 318529, "epoch": 2632} {"train_loss": -44.51968765258789, "global_step": 318530, "epoch": 2632} {"train_loss": -44.15800857543945, "global_step": 318531, "epoch": 2632} {"train_loss": -44.91487503051758, "global_step": 318532, "epoch": 2632} {"train_loss": -44.830604553222656, "global_step": 318533, "epoch": 2632} {"train_loss": -44.84821701049805, "global_step": 318534, "epoch": 2632} {"train_loss": -45.063720703125, "global_step": 318535, "epoch": 2632} {"train_loss": -44.51668167114258, "global_step": 318536, "epoch": 2632} {"train_loss": -44.63848876953125, "global_step": 318537, "epoch": 2632} {"train_loss": -44.8455924987793, "global_step": 318538, "epoch": 2632} {"train_loss": -45.23003005981445, "global_step": 318539, "epoch": 2632} {"train_loss": -44.864864349365234, "global_step": 318540, "epoch": 2632} {"train_loss": -44.23537063598633, "global_step": 318541, "epoch": 2632} {"train_loss": -44.700042724609375, "global_step": 318542, "epoch": 2632} {"train_loss": -44.95038604736328, "global_step": 318543, "epoch": 2632} {"train_loss": -44.819950103759766, "global_step": 318544, "epoch": 2632} {"train_loss": -44.139793395996094, "global_step": 318545, "epoch": 2632} {"train_loss": -44.29747772216797, "global_step": 318546, "epoch": 2632} {"train_loss": -44.80048370361328, "global_step": 318547, "epoch": 2632} {"train_loss": -45.327213287353516, "global_step": 318548, "epoch": 2632} {"train_loss": -44.53496170043945, "global_step": 318549, "epoch": 2632} {"train_loss": -44.6871337890625, "global_step": 318550, "epoch": 2632} {"train_loss": -45.06992721557617, "global_step": 318551, "epoch": 2632} {"train_loss": -45.51700973510742, "global_step": 318552, "epoch": 2632} {"train_loss": -45.014278411865234, "global_step": 318553, "epoch": 2632} {"train_loss": -44.962093353271484, "global_step": 318554, "epoch": 2632} {"train_loss": -45.054622650146484, "global_step": 318555, "epoch": 2632} {"train_loss": -44.63653564453125, "global_step": 318556, "epoch": 2632} {"train_loss": -44.5863037109375, "global_step": 318557, "epoch": 2632} {"train_loss": -44.835811614990234, "global_step": 318558, "epoch": 2632} {"train_loss": -44.36849594116211, "global_step": 318559, "epoch": 2632} {"train_loss": -44.96540451049805, "global_step": 318560, "epoch": 2632} {"train_loss": -45.15498733520508, "global_step": 318561, "epoch": 2632} {"train_loss": -44.78703689575195, "global_step": 318562, "epoch": 2632} {"train_loss": -44.820770263671875, "global_step": 318563, "epoch": 2632} {"train_loss": -44.901214599609375, "global_step": 318564, "epoch": 2632} {"train_loss": -44.880184173583984, "global_step": 318565, "epoch": 2632} {"train_loss": -44.763832092285156, "global_step": 318566, "epoch": 2632} {"train_loss": -42.06296920776367, "global_step": 318567, "epoch": 2632} {"train_loss": -45.217498779296875, "global_step": 318568, "epoch": 2632} {"train_loss": -44.5979118347168, "global_step": 318569, "epoch": 2632} {"train_loss": -43.46916580200195, "global_step": 318570, "epoch": 2632} {"train_loss": -43.24843215942383, "global_step": 318571, "epoch": 2632} {"train_loss": -43.13115310668945, "global_step": 318572, "epoch": 2632} {"train_loss": -43.13079833984375, "global_step": 318573, "epoch": 2632} {"train_loss": -43.83901596069336, "global_step": 318574, "epoch": 2632} {"train_loss": -44.03948974609375, "global_step": 318575, "epoch": 2632} {"train_loss": -43.581546783447266, "global_step": 318576, "epoch": 2632} {"train_loss": -43.344966888427734, "global_step": 318577, "epoch": 2632} {"train_loss": -44.64382553100586, "global_step": 318578, "epoch": 2632} {"train_loss": -44.3036994934082, "global_step": 318579, "epoch": 2632} {"train_loss": -43.75993347167969, "global_step": 318580, "epoch": 2632} {"train_loss": -44.122169494628906, "global_step": 318581, "epoch": 2632} {"train_loss": -43.622276306152344, "global_step": 318582, "epoch": 2632} {"train_loss": -42.441810607910156, "global_step": 318583, "epoch": 2632} {"train_loss": -42.683040618896484, "global_step": 318584, "epoch": 2632} {"train_loss": -41.15156173706055, "global_step": 318585, "epoch": 2632} {"train_loss": -42.36764144897461, "global_step": 318586, "epoch": 2632} {"train_loss": -42.2123908996582, "global_step": 318587, "epoch": 2632} {"train_loss": -42.94275665283203, "global_step": 318588, "epoch": 2632} {"train_loss": -41.82123947143555, "global_step": 318589, "epoch": 2632} {"train_loss": -42.03578567504883, "global_step": 318590, "epoch": 2632} {"train_loss": -41.48331832885742, "global_step": 318591, "epoch": 2632} {"train_loss": -43.92145866204884, "global_step": 318592, "epoch": 2632, "val_loss": 2769244.25} {"train_loss": -43.817604064941406, "global_step": 318593, "epoch": 2633} {"train_loss": -41.98868942260742, "global_step": 318594, "epoch": 2633} {"train_loss": -42.35136032104492, "global_step": 318595, "epoch": 2633} {"train_loss": -40.58552169799805, "global_step": 318596, "epoch": 2633} {"train_loss": -43.42108154296875, "global_step": 318597, "epoch": 2633} {"train_loss": -41.786781311035156, "global_step": 318598, "epoch": 2633} {"train_loss": -40.905399322509766, "global_step": 318599, "epoch": 2633} {"train_loss": -41.38286209106445, "global_step": 318600, "epoch": 2633} {"train_loss": -43.28768539428711, "global_step": 318601, "epoch": 2633} {"train_loss": -42.12437057495117, "global_step": 318602, "epoch": 2633} {"train_loss": -43.867584228515625, "global_step": 318603, "epoch": 2633} {"train_loss": -42.22489929199219, "global_step": 318604, "epoch": 2633} {"train_loss": -37.97608184814453, "global_step": 318605, "epoch": 2633} {"train_loss": -43.724090576171875, "global_step": 318606, "epoch": 2633} {"train_loss": -42.14150619506836, "global_step": 318607, "epoch": 2633} {"train_loss": -42.3546028137207, "global_step": 318608, "epoch": 2633} {"train_loss": -43.441768646240234, "global_step": 318609, "epoch": 2633} {"train_loss": -43.84310531616211, "global_step": 318610, "epoch": 2633} {"train_loss": -43.993629455566406, "global_step": 318611, "epoch": 2633} {"train_loss": -42.42168045043945, "global_step": 318612, "epoch": 2633} {"train_loss": -42.16769027709961, "global_step": 318613, "epoch": 2633} {"train_loss": -42.89201354980469, "global_step": 318614, "epoch": 2633} {"train_loss": -43.023414611816406, "global_step": 318615, "epoch": 2633} {"train_loss": -43.2940788269043, "global_step": 318616, "epoch": 2633} {"train_loss": -43.56471633911133, "global_step": 318617, "epoch": 2633} {"train_loss": -41.93088150024414, "global_step": 318618, "epoch": 2633} {"train_loss": -43.2467041015625, "global_step": 318619, "epoch": 2633} {"train_loss": -44.09760665893555, "global_step": 318620, "epoch": 2633} {"train_loss": -43.11497497558594, "global_step": 318621, "epoch": 2633} {"train_loss": -41.28761672973633, "global_step": 318622, "epoch": 2633} {"train_loss": -43.68036651611328, "global_step": 318623, "epoch": 2633} {"train_loss": -43.94956588745117, "global_step": 318624, "epoch": 2633} {"train_loss": -43.22126388549805, "global_step": 318625, "epoch": 2633} {"train_loss": -44.05845260620117, "global_step": 318626, "epoch": 2633} {"train_loss": -43.60059356689453, "global_step": 318627, "epoch": 2633} {"train_loss": -43.81352996826172, "global_step": 318628, "epoch": 2633} {"train_loss": -43.34209060668945, "global_step": 318629, "epoch": 2633} {"train_loss": -44.05935287475586, "global_step": 318630, "epoch": 2633} {"train_loss": -43.38947677612305, "global_step": 318631, "epoch": 2633} {"train_loss": -43.9090461730957, "global_step": 318632, "epoch": 2633} {"train_loss": -44.22733688354492, "global_step": 318633, "epoch": 2633} {"train_loss": -44.243385314941406, "global_step": 318634, "epoch": 2633} {"train_loss": -43.43528366088867, "global_step": 318635, "epoch": 2633} {"train_loss": -44.078399658203125, "global_step": 318636, "epoch": 2633} {"train_loss": -42.59309768676758, "global_step": 318637, "epoch": 2633} {"train_loss": -44.86280059814453, "global_step": 318638, "epoch": 2633} {"train_loss": -43.579830169677734, "global_step": 318639, "epoch": 2633} {"train_loss": -44.0011100769043, "global_step": 318640, "epoch": 2633} {"train_loss": -43.60056686401367, "global_step": 318641, "epoch": 2633} {"train_loss": -43.53276443481445, "global_step": 318642, "epoch": 2633} {"train_loss": -43.94350814819336, "global_step": 318643, "epoch": 2633} {"train_loss": -43.05805206298828, "global_step": 318644, "epoch": 2633} {"train_loss": -44.08954620361328, "global_step": 318645, "epoch": 2633} {"train_loss": -44.50680160522461, "global_step": 318646, "epoch": 2633} {"train_loss": -44.492305755615234, "global_step": 318647, "epoch": 2633} {"train_loss": -44.95722579956055, "global_step": 318648, "epoch": 2633} {"train_loss": -44.562957763671875, "global_step": 318649, "epoch": 2633} {"train_loss": -44.612667083740234, "global_step": 318650, "epoch": 2633} {"train_loss": -44.7032356262207, "global_step": 318651, "epoch": 2633} {"train_loss": -43.09614181518555, "global_step": 318652, "epoch": 2633} {"train_loss": -44.51803207397461, "global_step": 318653, "epoch": 2633} {"train_loss": -44.24730682373047, "global_step": 318654, "epoch": 2633} {"train_loss": -44.40864562988281, "global_step": 318655, "epoch": 2633} {"train_loss": -44.5230827331543, "global_step": 318656, "epoch": 2633} {"train_loss": -42.68413162231445, "global_step": 318657, "epoch": 2633} {"train_loss": -44.31161880493164, "global_step": 318658, "epoch": 2633} {"train_loss": -44.64289474487305, "global_step": 318659, "epoch": 2633} {"train_loss": -44.95717239379883, "global_step": 318660, "epoch": 2633} {"train_loss": -44.26165771484375, "global_step": 318661, "epoch": 2633} {"train_loss": -42.4395751953125, "global_step": 318662, "epoch": 2633} {"train_loss": -44.50818634033203, "global_step": 318663, "epoch": 2633} {"train_loss": -44.611549377441406, "global_step": 318664, "epoch": 2633} {"train_loss": -43.8258171081543, "global_step": 318665, "epoch": 2633} {"train_loss": -44.084259033203125, "global_step": 318666, "epoch": 2633} {"train_loss": -41.288970947265625, "global_step": 318667, "epoch": 2633} {"train_loss": -44.444374084472656, "global_step": 318668, "epoch": 2633} {"train_loss": -44.28193283081055, "global_step": 318669, "epoch": 2633} {"train_loss": -43.78584671020508, "global_step": 318670, "epoch": 2633} {"train_loss": -43.9283447265625, "global_step": 318671, "epoch": 2633} {"train_loss": -45.1906852722168, "global_step": 318672, "epoch": 2633} {"train_loss": -43.37886428833008, "global_step": 318673, "epoch": 2633} {"train_loss": -41.244384765625, "global_step": 318674, "epoch": 2633} {"train_loss": -42.69883346557617, "global_step": 318675, "epoch": 2633} {"train_loss": -43.494789123535156, "global_step": 318676, "epoch": 2633} {"train_loss": -43.806190490722656, "global_step": 318677, "epoch": 2633} {"train_loss": -43.85416030883789, "global_step": 318678, "epoch": 2633} {"train_loss": -41.517147064208984, "global_step": 318679, "epoch": 2633} {"train_loss": -43.85946273803711, "global_step": 318680, "epoch": 2633} {"train_loss": -42.811614990234375, "global_step": 318681, "epoch": 2633} {"train_loss": -44.16647720336914, "global_step": 318682, "epoch": 2633} {"train_loss": -43.14402389526367, "global_step": 318683, "epoch": 2633} {"train_loss": -44.37617874145508, "global_step": 318684, "epoch": 2633} {"train_loss": -44.2608757019043, "global_step": 318685, "epoch": 2633} {"train_loss": -43.0911979675293, "global_step": 318686, "epoch": 2633} {"train_loss": -44.02043533325195, "global_step": 318687, "epoch": 2633} {"train_loss": -44.840702056884766, "global_step": 318688, "epoch": 2633} {"train_loss": -43.60049057006836, "global_step": 318689, "epoch": 2633} {"train_loss": -44.689273834228516, "global_step": 318690, "epoch": 2633} {"train_loss": -43.78728485107422, "global_step": 318691, "epoch": 2633} {"train_loss": -44.414390563964844, "global_step": 318692, "epoch": 2633} {"train_loss": -44.092403411865234, "global_step": 318693, "epoch": 2633} {"train_loss": -44.484073638916016, "global_step": 318694, "epoch": 2633} {"train_loss": -44.26580810546875, "global_step": 318695, "epoch": 2633} {"train_loss": -42.67570877075195, "global_step": 318696, "epoch": 2633} {"train_loss": -43.29517364501953, "global_step": 318697, "epoch": 2633} {"train_loss": -42.3577766418457, "global_step": 318698, "epoch": 2633} {"train_loss": -43.012508392333984, "global_step": 318699, "epoch": 2633} {"train_loss": -42.19441604614258, "global_step": 318700, "epoch": 2633} {"train_loss": -38.66645431518555, "global_step": 318701, "epoch": 2633} {"train_loss": -43.133296966552734, "global_step": 318702, "epoch": 2633} {"train_loss": -41.35081100463867, "global_step": 318703, "epoch": 2633} {"train_loss": -37.37160873413086, "global_step": 318704, "epoch": 2633} {"train_loss": -32.26220703125, "global_step": 318705, "epoch": 2633} {"train_loss": -36.994380950927734, "global_step": 318706, "epoch": 2633} {"train_loss": -41.4693603515625, "global_step": 318707, "epoch": 2633} {"train_loss": -38.12760543823242, "global_step": 318708, "epoch": 2633} {"train_loss": -41.72517395019531, "global_step": 318709, "epoch": 2633} {"train_loss": -33.343299865722656, "global_step": 318710, "epoch": 2633} {"train_loss": -38.45551681518555, "global_step": 318711, "epoch": 2633} {"train_loss": -40.850582122802734, "global_step": 318712, "epoch": 2633} {"train_loss": -42.861664606519966, "global_step": 318713, "epoch": 2633, "val_loss": 2598876.5} {"train_loss": -39.726890563964844, "global_step": 318714, "epoch": 2634} {"train_loss": -36.65228271484375, "global_step": 318715, "epoch": 2634} {"train_loss": -31.439380645751953, "global_step": 318716, "epoch": 2634} {"train_loss": -42.13521957397461, "global_step": 318717, "epoch": 2634} {"train_loss": -32.504608154296875, "global_step": 318718, "epoch": 2634} {"train_loss": -40.98246383666992, "global_step": 318719, "epoch": 2634} {"train_loss": -36.998931884765625, "global_step": 318720, "epoch": 2634} {"train_loss": -40.78404998779297, "global_step": 318721, "epoch": 2634} {"train_loss": -36.03690719604492, "global_step": 318722, "epoch": 2634} {"train_loss": -38.8750114440918, "global_step": 318723, "epoch": 2634} {"train_loss": -38.15583419799805, "global_step": 318724, "epoch": 2634} {"train_loss": -40.08640670776367, "global_step": 318725, "epoch": 2634} {"train_loss": -37.435733795166016, "global_step": 318726, "epoch": 2634} {"train_loss": -40.124725341796875, "global_step": 318727, "epoch": 2634} {"train_loss": -40.308528900146484, "global_step": 318728, "epoch": 2634} {"train_loss": -42.15509796142578, "global_step": 318729, "epoch": 2634} {"train_loss": -39.678802490234375, "global_step": 318730, "epoch": 2634} {"train_loss": -37.308326721191406, "global_step": 318731, "epoch": 2634} {"train_loss": -41.73173141479492, "global_step": 318732, "epoch": 2634} {"train_loss": -41.53599166870117, "global_step": 318733, "epoch": 2634} {"train_loss": -42.03129959106445, "global_step": 318734, "epoch": 2634} {"train_loss": -41.0921630859375, "global_step": 318735, "epoch": 2634} {"train_loss": -42.72324752807617, "global_step": 318736, "epoch": 2634} {"train_loss": -41.49921798706055, "global_step": 318737, "epoch": 2634} {"train_loss": -43.06432342529297, "global_step": 318738, "epoch": 2634} {"train_loss": -41.657596588134766, "global_step": 318739, "epoch": 2634} {"train_loss": -43.029541015625, "global_step": 318740, "epoch": 2634} {"train_loss": -41.64387893676758, "global_step": 318741, "epoch": 2634} {"train_loss": -42.5097541809082, "global_step": 318742, "epoch": 2634} {"train_loss": -42.67173385620117, "global_step": 318743, "epoch": 2634} {"train_loss": -43.22197341918945, "global_step": 318744, "epoch": 2634} {"train_loss": -42.68757247924805, "global_step": 318745, "epoch": 2634} {"train_loss": -42.55550003051758, "global_step": 318746, "epoch": 2634} {"train_loss": -43.17250442504883, "global_step": 318747, "epoch": 2634} {"train_loss": -42.8227653503418, "global_step": 318748, "epoch": 2634} {"train_loss": -43.28307342529297, "global_step": 318749, "epoch": 2634} {"train_loss": -42.294795989990234, "global_step": 318750, "epoch": 2634} {"train_loss": -42.95926284790039, "global_step": 318751, "epoch": 2634} {"train_loss": -43.00288009643555, "global_step": 318752, "epoch": 2634} {"train_loss": -43.05922317504883, "global_step": 318753, "epoch": 2634} {"train_loss": -42.66671371459961, "global_step": 318754, "epoch": 2634} {"train_loss": -43.39337158203125, "global_step": 318755, "epoch": 2634} {"train_loss": -42.76947021484375, "global_step": 318756, "epoch": 2634} {"train_loss": -42.890193939208984, "global_step": 318757, "epoch": 2634} {"train_loss": -43.47941207885742, "global_step": 318758, "epoch": 2634} {"train_loss": -43.43861770629883, "global_step": 318759, "epoch": 2634} {"train_loss": -43.37128829956055, "global_step": 318760, "epoch": 2634} {"train_loss": -42.809410095214844, "global_step": 318761, "epoch": 2634} {"train_loss": -44.40885543823242, "global_step": 318762, "epoch": 2634} {"train_loss": -43.391387939453125, "global_step": 318763, "epoch": 2634} {"train_loss": -43.899635314941406, "global_step": 318764, "epoch": 2634} {"train_loss": -43.8171272277832, "global_step": 318765, "epoch": 2634} {"train_loss": -43.79252243041992, "global_step": 318766, "epoch": 2634} {"train_loss": -43.80476379394531, "global_step": 318767, "epoch": 2634} {"train_loss": -43.482723236083984, "global_step": 318768, "epoch": 2634} {"train_loss": -43.67512893676758, "global_step": 318769, "epoch": 2634} {"train_loss": -44.31605529785156, "global_step": 318770, "epoch": 2634} {"train_loss": -43.85573196411133, "global_step": 318771, "epoch": 2634} {"train_loss": -44.58848571777344, "global_step": 318772, "epoch": 2634} {"train_loss": -44.10033416748047, "global_step": 318773, "epoch": 2634} {"train_loss": -44.31846618652344, "global_step": 318774, "epoch": 2634} {"train_loss": -44.59803009033203, "global_step": 318775, "epoch": 2634} {"train_loss": -44.669490814208984, "global_step": 318776, "epoch": 2634} {"train_loss": -44.52363967895508, "global_step": 318777, "epoch": 2634} {"train_loss": -44.55982208251953, "global_step": 318778, "epoch": 2634} {"train_loss": -44.651851654052734, "global_step": 318779, "epoch": 2634} {"train_loss": -44.397682189941406, "global_step": 318780, "epoch": 2634} {"train_loss": -44.854679107666016, "global_step": 318781, "epoch": 2634} {"train_loss": -44.556819915771484, "global_step": 318782, "epoch": 2634} {"train_loss": -44.09909439086914, "global_step": 318783, "epoch": 2634} {"train_loss": -44.691505432128906, "global_step": 318784, "epoch": 2634} {"train_loss": -44.67620086669922, "global_step": 318785, "epoch": 2634} {"train_loss": -44.579071044921875, "global_step": 318786, "epoch": 2634} {"train_loss": -44.9769401550293, "global_step": 318787, "epoch": 2634} {"train_loss": -44.66181182861328, "global_step": 318788, "epoch": 2634} {"train_loss": -44.78871536254883, "global_step": 318789, "epoch": 2634} {"train_loss": -44.78639221191406, "global_step": 318790, "epoch": 2634} {"train_loss": -44.63739013671875, "global_step": 318791, "epoch": 2634} {"train_loss": -44.62387466430664, "global_step": 318792, "epoch": 2634} {"train_loss": -45.00991439819336, "global_step": 318793, "epoch": 2634} {"train_loss": -44.494895935058594, "global_step": 318794, "epoch": 2634} {"train_loss": -45.068946838378906, "global_step": 318795, "epoch": 2634} {"train_loss": -44.28581619262695, "global_step": 318796, "epoch": 2634} {"train_loss": -44.9307746887207, "global_step": 318797, "epoch": 2634} {"train_loss": -44.5585823059082, "global_step": 318798, "epoch": 2634} {"train_loss": -44.576881408691406, "global_step": 318799, "epoch": 2634} {"train_loss": -44.66179275512695, "global_step": 318800, "epoch": 2634} {"train_loss": -44.91929244995117, "global_step": 318801, "epoch": 2634} {"train_loss": -44.99970245361328, "global_step": 318802, "epoch": 2634} {"train_loss": -44.87421798706055, "global_step": 318803, "epoch": 2634} {"train_loss": -44.263946533203125, "global_step": 318804, "epoch": 2634} {"train_loss": -44.804107666015625, "global_step": 318805, "epoch": 2634} {"train_loss": -44.43059158325195, "global_step": 318806, "epoch": 2634} {"train_loss": -44.7296142578125, "global_step": 318807, "epoch": 2634} {"train_loss": -44.56806564331055, "global_step": 318808, "epoch": 2634} {"train_loss": -44.62993621826172, "global_step": 318809, "epoch": 2634} {"train_loss": -45.05348587036133, "global_step": 318810, "epoch": 2634} {"train_loss": -44.67783737182617, "global_step": 318811, "epoch": 2634} {"train_loss": -44.19782257080078, "global_step": 318812, "epoch": 2634} {"train_loss": -44.9493408203125, "global_step": 318813, "epoch": 2634} {"train_loss": -45.22522735595703, "global_step": 318814, "epoch": 2634} {"train_loss": -44.31922149658203, "global_step": 318815, "epoch": 2634} {"train_loss": -44.656070709228516, "global_step": 318816, "epoch": 2634} {"train_loss": -45.02096176147461, "global_step": 318817, "epoch": 2634} {"train_loss": -45.169525146484375, "global_step": 318818, "epoch": 2634} {"train_loss": -44.56232452392578, "global_step": 318819, "epoch": 2634} {"train_loss": -44.93038558959961, "global_step": 318820, "epoch": 2634} {"train_loss": -45.119136810302734, "global_step": 318821, "epoch": 2634} {"train_loss": -45.350093841552734, "global_step": 318822, "epoch": 2634} {"train_loss": -45.23784255981445, "global_step": 318823, "epoch": 2634} {"train_loss": -44.877845764160156, "global_step": 318824, "epoch": 2634} {"train_loss": -44.47288131713867, "global_step": 318825, "epoch": 2634} {"train_loss": -44.88358688354492, "global_step": 318826, "epoch": 2634} {"train_loss": -45.190670013427734, "global_step": 318827, "epoch": 2634} {"train_loss": -45.087677001953125, "global_step": 318828, "epoch": 2634} {"train_loss": -45.45786666870117, "global_step": 318829, "epoch": 2634} {"train_loss": -44.72581100463867, "global_step": 318830, "epoch": 2634} {"train_loss": -45.061073303222656, "global_step": 318831, "epoch": 2634} {"train_loss": -44.85635757446289, "global_step": 318832, "epoch": 2634} {"train_loss": -44.764827728271484, "global_step": 318833, "epoch": 2634} {"train_loss": -43.199213043717315, "global_step": 318834, "epoch": 2634, "val_loss": 2672893.25} {"train_loss": -43.70035171508789, "global_step": 318835, "epoch": 2635} {"train_loss": -44.01047897338867, "global_step": 318836, "epoch": 2635} {"train_loss": -43.93205642700195, "global_step": 318837, "epoch": 2635} {"train_loss": -44.44365692138672, "global_step": 318838, "epoch": 2635} {"train_loss": -43.56916427612305, "global_step": 318839, "epoch": 2635} {"train_loss": -42.35319137573242, "global_step": 318840, "epoch": 2635} {"train_loss": -43.183013916015625, "global_step": 318841, "epoch": 2635} {"train_loss": -44.06270980834961, "global_step": 318842, "epoch": 2635} {"train_loss": -44.62919235229492, "global_step": 318843, "epoch": 2635} {"train_loss": -42.60034942626953, "global_step": 318844, "epoch": 2635} {"train_loss": -41.57221603393555, "global_step": 318845, "epoch": 2635} {"train_loss": -43.678466796875, "global_step": 318846, "epoch": 2635} {"train_loss": -43.6715087890625, "global_step": 318847, "epoch": 2635} {"train_loss": -39.46425247192383, "global_step": 318848, "epoch": 2635} {"train_loss": -43.40186309814453, "global_step": 318849, "epoch": 2635} {"train_loss": -43.72468566894531, "global_step": 318850, "epoch": 2635} {"train_loss": -41.2172737121582, "global_step": 318851, "epoch": 2635} {"train_loss": -40.74795150756836, "global_step": 318852, "epoch": 2635} {"train_loss": -39.72943115234375, "global_step": 318853, "epoch": 2635} {"train_loss": -39.05778121948242, "global_step": 318854, "epoch": 2635} {"train_loss": -39.86777877807617, "global_step": 318855, "epoch": 2635} {"train_loss": -41.3542594909668, "global_step": 318856, "epoch": 2635} {"train_loss": -41.92873001098633, "global_step": 318857, "epoch": 2635} {"train_loss": -41.20524978637695, "global_step": 318858, "epoch": 2635} {"train_loss": -43.25977325439453, "global_step": 318859, "epoch": 2635} {"train_loss": -42.70193862915039, "global_step": 318860, "epoch": 2635} {"train_loss": -41.91776657104492, "global_step": 318861, "epoch": 2635} {"train_loss": -43.605262756347656, "global_step": 318862, "epoch": 2635} {"train_loss": -42.42048645019531, "global_step": 318863, "epoch": 2635} {"train_loss": -42.71181106567383, "global_step": 318864, "epoch": 2635} {"train_loss": -43.63030242919922, "global_step": 318865, "epoch": 2635} {"train_loss": -41.733558654785156, "global_step": 318866, "epoch": 2635} {"train_loss": -43.29879379272461, "global_step": 318867, "epoch": 2635} {"train_loss": -43.4535026550293, "global_step": 318868, "epoch": 2635} {"train_loss": -42.5731315612793, "global_step": 318869, "epoch": 2635} {"train_loss": -43.777706146240234, "global_step": 318870, "epoch": 2635} {"train_loss": -43.41862106323242, "global_step": 318871, "epoch": 2635} {"train_loss": -43.656795501708984, "global_step": 318872, "epoch": 2635} {"train_loss": -43.1333122253418, "global_step": 318873, "epoch": 2635} {"train_loss": -43.365394592285156, "global_step": 318874, "epoch": 2635} {"train_loss": -43.64935302734375, "global_step": 318875, "epoch": 2635} {"train_loss": -43.40663528442383, "global_step": 318876, "epoch": 2635} {"train_loss": -43.99103546142578, "global_step": 318877, "epoch": 2635} {"train_loss": -43.52509689331055, "global_step": 318878, "epoch": 2635} {"train_loss": -44.4050407409668, "global_step": 318879, "epoch": 2635} {"train_loss": -43.788509368896484, "global_step": 318880, "epoch": 2635} {"train_loss": -44.208187103271484, "global_step": 318881, "epoch": 2635} {"train_loss": -44.488868713378906, "global_step": 318882, "epoch": 2635} {"train_loss": -44.1107177734375, "global_step": 318883, "epoch": 2635} {"train_loss": -43.71390914916992, "global_step": 318884, "epoch": 2635} {"train_loss": -43.63520050048828, "global_step": 318885, "epoch": 2635} {"train_loss": -44.427059173583984, "global_step": 318886, "epoch": 2635} {"train_loss": -43.264522552490234, "global_step": 318887, "epoch": 2635} {"train_loss": -44.31240463256836, "global_step": 318888, "epoch": 2635} {"train_loss": -43.69984817504883, "global_step": 318889, "epoch": 2635} {"train_loss": -44.017181396484375, "global_step": 318890, "epoch": 2635} {"train_loss": -44.067195892333984, "global_step": 318891, "epoch": 2635} {"train_loss": -44.20640182495117, "global_step": 318892, "epoch": 2635} {"train_loss": -44.270606994628906, "global_step": 318893, "epoch": 2635} {"train_loss": -44.7564811706543, "global_step": 318894, "epoch": 2635} {"train_loss": -44.359066009521484, "global_step": 318895, "epoch": 2635} {"train_loss": -44.13104248046875, "global_step": 318896, "epoch": 2635} {"train_loss": -44.707393646240234, "global_step": 318897, "epoch": 2635} {"train_loss": -44.05942916870117, "global_step": 318898, "epoch": 2635} {"train_loss": -44.03498458862305, "global_step": 318899, "epoch": 2635} {"train_loss": -44.76533126831055, "global_step": 318900, "epoch": 2635} {"train_loss": -43.49699783325195, "global_step": 318901, "epoch": 2635} {"train_loss": -44.290653228759766, "global_step": 318902, "epoch": 2635} {"train_loss": -43.629085540771484, "global_step": 318903, "epoch": 2635} {"train_loss": -43.9141845703125, "global_step": 318904, "epoch": 2635} {"train_loss": -43.98777389526367, "global_step": 318905, "epoch": 2635} {"train_loss": -42.624996185302734, "global_step": 318906, "epoch": 2635} {"train_loss": -45.0389404296875, "global_step": 318907, "epoch": 2635} {"train_loss": -43.9862060546875, "global_step": 318908, "epoch": 2635} {"train_loss": -44.94281768798828, "global_step": 318909, "epoch": 2635} {"train_loss": -44.319602966308594, "global_step": 318910, "epoch": 2635} {"train_loss": -44.30180740356445, "global_step": 318911, "epoch": 2635} {"train_loss": -44.8245735168457, "global_step": 318912, "epoch": 2635} {"train_loss": -43.89143753051758, "global_step": 318913, "epoch": 2635} {"train_loss": -44.60187530517578, "global_step": 318914, "epoch": 2635} {"train_loss": -44.18478775024414, "global_step": 318915, "epoch": 2635} {"train_loss": -44.38288497924805, "global_step": 318916, "epoch": 2635} {"train_loss": -44.6991081237793, "global_step": 318917, "epoch": 2635} {"train_loss": -44.15712356567383, "global_step": 318918, "epoch": 2635} {"train_loss": -45.108177185058594, "global_step": 318919, "epoch": 2635} {"train_loss": -44.30735397338867, "global_step": 318920, "epoch": 2635} {"train_loss": -45.19292068481445, "global_step": 318921, "epoch": 2635} {"train_loss": -44.09579849243164, "global_step": 318922, "epoch": 2635} {"train_loss": -44.635353088378906, "global_step": 318923, "epoch": 2635} {"train_loss": -44.72795104980469, "global_step": 318924, "epoch": 2635} {"train_loss": -44.580909729003906, "global_step": 318925, "epoch": 2635} {"train_loss": -44.77264404296875, "global_step": 318926, "epoch": 2635} {"train_loss": -44.54441452026367, "global_step": 318927, "epoch": 2635} {"train_loss": -44.810890197753906, "global_step": 318928, "epoch": 2635} {"train_loss": -44.16801071166992, "global_step": 318929, "epoch": 2635} {"train_loss": -44.44325637817383, "global_step": 318930, "epoch": 2635} {"train_loss": -43.98750686645508, "global_step": 318931, "epoch": 2635} {"train_loss": -44.7147102355957, "global_step": 318932, "epoch": 2635} {"train_loss": -44.30464553833008, "global_step": 318933, "epoch": 2635} {"train_loss": -44.13871765136719, "global_step": 318934, "epoch": 2635} {"train_loss": -44.4149169921875, "global_step": 318935, "epoch": 2635} {"train_loss": -43.5029411315918, "global_step": 318936, "epoch": 2635} {"train_loss": -44.18508529663086, "global_step": 318937, "epoch": 2635} {"train_loss": -43.87641525268555, "global_step": 318938, "epoch": 2635} {"train_loss": -43.78040313720703, "global_step": 318939, "epoch": 2635} {"train_loss": -44.810951232910156, "global_step": 318940, "epoch": 2635} {"train_loss": -43.30412673950195, "global_step": 318941, "epoch": 2635} {"train_loss": -44.34521484375, "global_step": 318942, "epoch": 2635} {"train_loss": -43.56591033935547, "global_step": 318943, "epoch": 2635} {"train_loss": -44.47556686401367, "global_step": 318944, "epoch": 2635} {"train_loss": -44.2161750793457, "global_step": 318945, "epoch": 2635} {"train_loss": -44.278194427490234, "global_step": 318946, "epoch": 2635} {"train_loss": -44.3149299621582, "global_step": 318947, "epoch": 2635} {"train_loss": -44.113441467285156, "global_step": 318948, "epoch": 2635} {"train_loss": -44.111839294433594, "global_step": 318949, "epoch": 2635} {"train_loss": -44.57883071899414, "global_step": 318950, "epoch": 2635} {"train_loss": -44.3140983581543, "global_step": 318951, "epoch": 2635} {"train_loss": -44.85816955566406, "global_step": 318952, "epoch": 2635} {"train_loss": -43.83370590209961, "global_step": 318953, "epoch": 2635} {"train_loss": -45.428367614746094, "global_step": 318954, "epoch": 2635} {"train_loss": -43.70336743819812, "global_step": 318955, "epoch": 2635, "val_loss": 2645598.75} {"train_loss": -44.09530258178711, "global_step": 318956, "epoch": 2636} {"train_loss": -44.20439529418945, "global_step": 318957, "epoch": 2636} {"train_loss": -42.669368743896484, "global_step": 318958, "epoch": 2636} {"train_loss": -44.70357894897461, "global_step": 318959, "epoch": 2636} {"train_loss": -42.9208869934082, "global_step": 318960, "epoch": 2636} {"train_loss": -42.812618255615234, "global_step": 318961, "epoch": 2636} {"train_loss": -43.68795394897461, "global_step": 318962, "epoch": 2636} {"train_loss": -44.26506042480469, "global_step": 318963, "epoch": 2636} {"train_loss": -43.74258041381836, "global_step": 318964, "epoch": 2636} {"train_loss": -42.150943756103516, "global_step": 318965, "epoch": 2636} {"train_loss": -43.69680404663086, "global_step": 318966, "epoch": 2636} {"train_loss": -44.49234390258789, "global_step": 318967, "epoch": 2636} {"train_loss": -43.24729537963867, "global_step": 318968, "epoch": 2636} {"train_loss": -43.955902099609375, "global_step": 318969, "epoch": 2636} {"train_loss": -44.232940673828125, "global_step": 318970, "epoch": 2636} {"train_loss": -41.94068145751953, "global_step": 318971, "epoch": 2636} {"train_loss": -44.15582275390625, "global_step": 318972, "epoch": 2636} {"train_loss": -42.19890213012695, "global_step": 318973, "epoch": 2636} {"train_loss": -42.152976989746094, "global_step": 318974, "epoch": 2636} {"train_loss": -43.16463088989258, "global_step": 318975, "epoch": 2636} {"train_loss": -41.405067443847656, "global_step": 318976, "epoch": 2636} {"train_loss": -43.2831916809082, "global_step": 318977, "epoch": 2636} {"train_loss": -43.33962631225586, "global_step": 318978, "epoch": 2636} {"train_loss": -43.284908294677734, "global_step": 318979, "epoch": 2636} {"train_loss": -44.09503173828125, "global_step": 318980, "epoch": 2636} {"train_loss": -41.140167236328125, "global_step": 318981, "epoch": 2636} {"train_loss": -43.54024887084961, "global_step": 318982, "epoch": 2636} {"train_loss": -42.844444274902344, "global_step": 318983, "epoch": 2636} {"train_loss": -44.15211868286133, "global_step": 318984, "epoch": 2636} {"train_loss": -43.420135498046875, "global_step": 318985, "epoch": 2636} {"train_loss": -43.39022445678711, "global_step": 318986, "epoch": 2636} {"train_loss": -42.92585372924805, "global_step": 318987, "epoch": 2636} {"train_loss": -44.69221115112305, "global_step": 318988, "epoch": 2636} {"train_loss": -43.691871643066406, "global_step": 318989, "epoch": 2636} {"train_loss": -44.60103225708008, "global_step": 318990, "epoch": 2636} {"train_loss": -43.9433479309082, "global_step": 318991, "epoch": 2636} {"train_loss": -44.74752426147461, "global_step": 318992, "epoch": 2636} {"train_loss": -44.09224319458008, "global_step": 318993, "epoch": 2636} {"train_loss": -44.524044036865234, "global_step": 318994, "epoch": 2636} {"train_loss": -43.949981689453125, "global_step": 318995, "epoch": 2636} {"train_loss": -43.643348693847656, "global_step": 318996, "epoch": 2636} {"train_loss": -44.75091552734375, "global_step": 318997, "epoch": 2636} {"train_loss": -40.503456115722656, "global_step": 318998, "epoch": 2636} {"train_loss": -44.83505630493164, "global_step": 318999, "epoch": 2636} {"train_loss": -44.341552734375, "global_step": 319000, "epoch": 2636} {"train_loss": -44.64133834838867, "global_step": 319001, "epoch": 2636} {"train_loss": -38.81096649169922, "global_step": 319002, "epoch": 2636} {"train_loss": -43.72208786010742, "global_step": 319003, "epoch": 2636} {"train_loss": -44.26972579956055, "global_step": 319004, "epoch": 2636} {"train_loss": -44.198036193847656, "global_step": 319005, "epoch": 2636} {"train_loss": -43.44865036010742, "global_step": 319006, "epoch": 2636} {"train_loss": -44.72231674194336, "global_step": 319007, "epoch": 2636} {"train_loss": -43.432945251464844, "global_step": 319008, "epoch": 2636} {"train_loss": -44.334529876708984, "global_step": 319009, "epoch": 2636} {"train_loss": -43.8382568359375, "global_step": 319010, "epoch": 2636} {"train_loss": -44.568214416503906, "global_step": 319011, "epoch": 2636} {"train_loss": -43.29366683959961, "global_step": 319012, "epoch": 2636} {"train_loss": -44.563777923583984, "global_step": 319013, "epoch": 2636} {"train_loss": -43.5413932800293, "global_step": 319014, "epoch": 2636} {"train_loss": -42.783843994140625, "global_step": 319015, "epoch": 2636} {"train_loss": -41.175453186035156, "global_step": 319016, "epoch": 2636} {"train_loss": -43.734432220458984, "global_step": 319017, "epoch": 2636} {"train_loss": -44.19588851928711, "global_step": 319018, "epoch": 2636} {"train_loss": -43.838233947753906, "global_step": 319019, "epoch": 2636} {"train_loss": -43.39815902709961, "global_step": 319020, "epoch": 2636} {"train_loss": -44.693355560302734, "global_step": 319021, "epoch": 2636} {"train_loss": -44.48108673095703, "global_step": 319022, "epoch": 2636} {"train_loss": -40.37689971923828, "global_step": 319023, "epoch": 2636} {"train_loss": -44.36154556274414, "global_step": 319024, "epoch": 2636} {"train_loss": -43.67151641845703, "global_step": 319025, "epoch": 2636} {"train_loss": -44.171913146972656, "global_step": 319026, "epoch": 2636} {"train_loss": -44.04580307006836, "global_step": 319027, "epoch": 2636} {"train_loss": -44.282814025878906, "global_step": 319028, "epoch": 2636} {"train_loss": -44.25616455078125, "global_step": 319029, "epoch": 2636} {"train_loss": -43.20499801635742, "global_step": 319030, "epoch": 2636} {"train_loss": -44.4623908996582, "global_step": 319031, "epoch": 2636} {"train_loss": -44.48447799682617, "global_step": 319032, "epoch": 2636} {"train_loss": -44.27116012573242, "global_step": 319033, "epoch": 2636} {"train_loss": -44.238399505615234, "global_step": 319034, "epoch": 2636} {"train_loss": -44.670196533203125, "global_step": 319035, "epoch": 2636} {"train_loss": -44.25208282470703, "global_step": 319036, "epoch": 2636} {"train_loss": -44.68788146972656, "global_step": 319037, "epoch": 2636} {"train_loss": -44.661922454833984, "global_step": 319038, "epoch": 2636} {"train_loss": -44.044979095458984, "global_step": 319039, "epoch": 2636} {"train_loss": -44.24543380737305, "global_step": 319040, "epoch": 2636} {"train_loss": -44.0257453918457, "global_step": 319041, "epoch": 2636} {"train_loss": -44.2519645690918, "global_step": 319042, "epoch": 2636} {"train_loss": -41.819087982177734, "global_step": 319043, "epoch": 2636} {"train_loss": -43.90679168701172, "global_step": 319044, "epoch": 2636} {"train_loss": -42.95942306518555, "global_step": 319045, "epoch": 2636} {"train_loss": -43.55038070678711, "global_step": 319046, "epoch": 2636} {"train_loss": -43.524105072021484, "global_step": 319047, "epoch": 2636} {"train_loss": -42.37616729736328, "global_step": 319048, "epoch": 2636} {"train_loss": -43.88486862182617, "global_step": 319049, "epoch": 2636} {"train_loss": -44.74845504760742, "global_step": 319050, "epoch": 2636} {"train_loss": -43.209136962890625, "global_step": 319051, "epoch": 2636} {"train_loss": -42.70332336425781, "global_step": 319052, "epoch": 2636} {"train_loss": -43.60588455200195, "global_step": 319053, "epoch": 2636} {"train_loss": -43.76444625854492, "global_step": 319054, "epoch": 2636} {"train_loss": -43.79751205444336, "global_step": 319055, "epoch": 2636} {"train_loss": -44.11135482788086, "global_step": 319056, "epoch": 2636} {"train_loss": -44.515960693359375, "global_step": 319057, "epoch": 2636} {"train_loss": -43.8143424987793, "global_step": 319058, "epoch": 2636} {"train_loss": -42.24333572387695, "global_step": 319059, "epoch": 2636} {"train_loss": -42.562740325927734, "global_step": 319060, "epoch": 2636} {"train_loss": -43.83964157104492, "global_step": 319061, "epoch": 2636} {"train_loss": -42.928340911865234, "global_step": 319062, "epoch": 2636} {"train_loss": -43.477210998535156, "global_step": 319063, "epoch": 2636} {"train_loss": -43.29541015625, "global_step": 319064, "epoch": 2636} {"train_loss": -43.48469543457031, "global_step": 319065, "epoch": 2636} {"train_loss": -44.0614128112793, "global_step": 319066, "epoch": 2636} {"train_loss": -43.17490768432617, "global_step": 319067, "epoch": 2636} {"train_loss": -43.946224212646484, "global_step": 319068, "epoch": 2636} {"train_loss": -43.141578674316406, "global_step": 319069, "epoch": 2636} {"train_loss": -43.78322982788086, "global_step": 319070, "epoch": 2636} {"train_loss": -43.59690475463867, "global_step": 319071, "epoch": 2636} {"train_loss": -43.880062103271484, "global_step": 319072, "epoch": 2636} {"train_loss": -42.87260437011719, "global_step": 319073, "epoch": 2636} {"train_loss": -43.439491271972656, "global_step": 319074, "epoch": 2636} {"train_loss": -43.48240661621094, "global_step": 319075, "epoch": 2636} {"train_loss": -43.601165267061596, "global_step": 319076, "epoch": 2636, "val_loss": 2597384.75} {"train_loss": -41.70206832885742, "global_step": 319077, "epoch": 2637} {"train_loss": -42.94243240356445, "global_step": 319078, "epoch": 2637} {"train_loss": -42.237701416015625, "global_step": 319079, "epoch": 2637} {"train_loss": -43.63492965698242, "global_step": 319080, "epoch": 2637} {"train_loss": -43.93354415893555, "global_step": 319081, "epoch": 2637} {"train_loss": -41.679073333740234, "global_step": 319082, "epoch": 2637} {"train_loss": -43.759803771972656, "global_step": 319083, "epoch": 2637} {"train_loss": -42.84699249267578, "global_step": 319084, "epoch": 2637} {"train_loss": -41.5774040222168, "global_step": 319085, "epoch": 2637} {"train_loss": -42.290252685546875, "global_step": 319086, "epoch": 2637} {"train_loss": -43.70466995239258, "global_step": 319087, "epoch": 2637} {"train_loss": -43.61765670776367, "global_step": 319088, "epoch": 2637} {"train_loss": -43.1129150390625, "global_step": 319089, "epoch": 2637} {"train_loss": -43.68443298339844, "global_step": 319090, "epoch": 2637} {"train_loss": -43.830909729003906, "global_step": 319091, "epoch": 2637} {"train_loss": -44.01880645751953, "global_step": 319092, "epoch": 2637} {"train_loss": -43.218685150146484, "global_step": 319093, "epoch": 2637} {"train_loss": -43.172855377197266, "global_step": 319094, "epoch": 2637} {"train_loss": -44.24109649658203, "global_step": 319095, "epoch": 2637} {"train_loss": -43.94613265991211, "global_step": 319096, "epoch": 2637} {"train_loss": -44.321205139160156, "global_step": 319097, "epoch": 2637} {"train_loss": -44.2968635559082, "global_step": 319098, "epoch": 2637} {"train_loss": -43.76017379760742, "global_step": 319099, "epoch": 2637} {"train_loss": -43.920589447021484, "global_step": 319100, "epoch": 2637} {"train_loss": -44.00165939331055, "global_step": 319101, "epoch": 2637} {"train_loss": -44.721614837646484, "global_step": 319102, "epoch": 2637} {"train_loss": -44.75503921508789, "global_step": 319103, "epoch": 2637} {"train_loss": -44.25596237182617, "global_step": 319104, "epoch": 2637} {"train_loss": -43.91630172729492, "global_step": 319105, "epoch": 2637} {"train_loss": -44.015384674072266, "global_step": 319106, "epoch": 2637} {"train_loss": -44.3884162902832, "global_step": 319107, "epoch": 2637} {"train_loss": -44.72431564331055, "global_step": 319108, "epoch": 2637} {"train_loss": -44.13007736206055, "global_step": 319109, "epoch": 2637} {"train_loss": -44.292964935302734, "global_step": 319110, "epoch": 2637} {"train_loss": -44.769630432128906, "global_step": 319111, "epoch": 2637} {"train_loss": -44.352027893066406, "global_step": 319112, "epoch": 2637} {"train_loss": -44.57328796386719, "global_step": 319113, "epoch": 2637} {"train_loss": -44.26395797729492, "global_step": 319114, "epoch": 2637} {"train_loss": -43.84442138671875, "global_step": 319115, "epoch": 2637} {"train_loss": -44.669673919677734, "global_step": 319116, "epoch": 2637} {"train_loss": -44.9991569519043, "global_step": 319117, "epoch": 2637} {"train_loss": -44.25489044189453, "global_step": 319118, "epoch": 2637} {"train_loss": -44.984004974365234, "global_step": 319119, "epoch": 2637} {"train_loss": -44.747554779052734, "global_step": 319120, "epoch": 2637} {"train_loss": -42.614593505859375, "global_step": 319121, "epoch": 2637} {"train_loss": -44.155067443847656, "global_step": 319122, "epoch": 2637} {"train_loss": -45.05635452270508, "global_step": 319123, "epoch": 2637} {"train_loss": -43.9712028503418, "global_step": 319124, "epoch": 2637} {"train_loss": -40.66034698486328, "global_step": 319125, "epoch": 2637} {"train_loss": -44.7396354675293, "global_step": 319126, "epoch": 2637} {"train_loss": -44.542999267578125, "global_step": 319127, "epoch": 2637} {"train_loss": -44.2265739440918, "global_step": 319128, "epoch": 2637} {"train_loss": -44.167964935302734, "global_step": 319129, "epoch": 2637} {"train_loss": -44.5388298034668, "global_step": 319130, "epoch": 2637} {"train_loss": -44.14459228515625, "global_step": 319131, "epoch": 2637} {"train_loss": -44.25225830078125, "global_step": 319132, "epoch": 2637} {"train_loss": -41.53744125366211, "global_step": 319133, "epoch": 2637} {"train_loss": -43.451515197753906, "global_step": 319134, "epoch": 2637} {"train_loss": -38.21938705444336, "global_step": 319135, "epoch": 2637} {"train_loss": -42.9157600402832, "global_step": 319136, "epoch": 2637} {"train_loss": -44.72853469848633, "global_step": 319137, "epoch": 2637} {"train_loss": -44.29664993286133, "global_step": 319138, "epoch": 2637} {"train_loss": -44.251068115234375, "global_step": 319139, "epoch": 2637} {"train_loss": -44.57634353637695, "global_step": 319140, "epoch": 2637} {"train_loss": -39.097900390625, "global_step": 319141, "epoch": 2637} {"train_loss": -43.63273620605469, "global_step": 319142, "epoch": 2637} {"train_loss": -43.80411911010742, "global_step": 319143, "epoch": 2637} {"train_loss": -43.58059310913086, "global_step": 319144, "epoch": 2637} {"train_loss": -42.72681427001953, "global_step": 319145, "epoch": 2637} {"train_loss": -43.02667999267578, "global_step": 319146, "epoch": 2637} {"train_loss": -43.65849304199219, "global_step": 319147, "epoch": 2637} {"train_loss": -42.72056198120117, "global_step": 319148, "epoch": 2637} {"train_loss": -42.38869857788086, "global_step": 319149, "epoch": 2637} {"train_loss": -42.68270492553711, "global_step": 319150, "epoch": 2637} {"train_loss": -44.09920120239258, "global_step": 319151, "epoch": 2637} {"train_loss": -42.7561149597168, "global_step": 319152, "epoch": 2637} {"train_loss": -41.99453353881836, "global_step": 319153, "epoch": 2637} {"train_loss": -43.135215759277344, "global_step": 319154, "epoch": 2637} {"train_loss": -43.82706832885742, "global_step": 319155, "epoch": 2637} {"train_loss": -44.23257827758789, "global_step": 319156, "epoch": 2637} {"train_loss": -44.45402145385742, "global_step": 319157, "epoch": 2637} {"train_loss": -43.21840286254883, "global_step": 319158, "epoch": 2637} {"train_loss": -43.5211181640625, "global_step": 319159, "epoch": 2637} {"train_loss": -43.15169906616211, "global_step": 319160, "epoch": 2637} {"train_loss": -43.734649658203125, "global_step": 319161, "epoch": 2637} {"train_loss": -42.12825012207031, "global_step": 319162, "epoch": 2637} {"train_loss": -38.45417404174805, "global_step": 319163, "epoch": 2637} {"train_loss": -39.59829330444336, "global_step": 319164, "epoch": 2637} {"train_loss": -41.0521240234375, "global_step": 319165, "epoch": 2637} {"train_loss": -38.68798828125, "global_step": 319166, "epoch": 2637} {"train_loss": -43.44021224975586, "global_step": 319167, "epoch": 2637} {"train_loss": -33.174598693847656, "global_step": 319168, "epoch": 2637} {"train_loss": -24.73351287841797, "global_step": 319169, "epoch": 2637} {"train_loss": -38.70254135131836, "global_step": 319170, "epoch": 2637} {"train_loss": -42.140254974365234, "global_step": 319171, "epoch": 2637} {"train_loss": -36.08222579956055, "global_step": 319172, "epoch": 2637} {"train_loss": -41.22528076171875, "global_step": 319173, "epoch": 2637} {"train_loss": -41.39345932006836, "global_step": 319174, "epoch": 2637} {"train_loss": -39.29365921020508, "global_step": 319175, "epoch": 2637} {"train_loss": -41.780555725097656, "global_step": 319176, "epoch": 2637} {"train_loss": -39.28657913208008, "global_step": 319177, "epoch": 2637} {"train_loss": -40.44240188598633, "global_step": 319178, "epoch": 2637} {"train_loss": -39.8675651550293, "global_step": 319179, "epoch": 2637} {"train_loss": -40.7667121887207, "global_step": 319180, "epoch": 2637} {"train_loss": -41.47845458984375, "global_step": 319181, "epoch": 2637} {"train_loss": -40.624855041503906, "global_step": 319182, "epoch": 2637} {"train_loss": -41.47246170043945, "global_step": 319183, "epoch": 2637} {"train_loss": -40.259212493896484, "global_step": 319184, "epoch": 2637} {"train_loss": -42.30246353149414, "global_step": 319185, "epoch": 2637} {"train_loss": -41.59808349609375, "global_step": 319186, "epoch": 2637} {"train_loss": -41.92316436767578, "global_step": 319187, "epoch": 2637} {"train_loss": -41.62446975708008, "global_step": 319188, "epoch": 2637} {"train_loss": -41.27252197265625, "global_step": 319189, "epoch": 2637} {"train_loss": -40.758785247802734, "global_step": 319190, "epoch": 2637} {"train_loss": -42.74939727783203, "global_step": 319191, "epoch": 2637} {"train_loss": -41.39347457885742, "global_step": 319192, "epoch": 2637} {"train_loss": -43.142181396484375, "global_step": 319193, "epoch": 2637} {"train_loss": -42.290096282958984, "global_step": 319194, "epoch": 2637} {"train_loss": -42.7634391784668, "global_step": 319195, "epoch": 2637} {"train_loss": -41.821632385253906, "global_step": 319196, "epoch": 2637} {"train_loss": -42.62843442554316, "global_step": 319197, "epoch": 2637, "val_loss": 2594460.75} {"train_loss": -42.15289306640625, "global_step": 319198, "epoch": 2638} {"train_loss": -43.04218292236328, "global_step": 319199, "epoch": 2638} {"train_loss": -42.89524841308594, "global_step": 319200, "epoch": 2638} {"train_loss": -43.39656448364258, "global_step": 319201, "epoch": 2638} {"train_loss": -43.23513412475586, "global_step": 319202, "epoch": 2638} {"train_loss": -43.54035186767578, "global_step": 319203, "epoch": 2638} {"train_loss": -42.954872131347656, "global_step": 319204, "epoch": 2638} {"train_loss": -42.91974639892578, "global_step": 319205, "epoch": 2638} {"train_loss": -42.99872970581055, "global_step": 319206, "epoch": 2638} {"train_loss": -43.064876556396484, "global_step": 319207, "epoch": 2638} {"train_loss": -42.90309524536133, "global_step": 319208, "epoch": 2638} {"train_loss": -43.69365310668945, "global_step": 319209, "epoch": 2638} {"train_loss": -42.609432220458984, "global_step": 319210, "epoch": 2638} {"train_loss": -43.29572677612305, "global_step": 319211, "epoch": 2638} {"train_loss": -43.51899719238281, "global_step": 319212, "epoch": 2638} {"train_loss": -42.94131851196289, "global_step": 319213, "epoch": 2638} {"train_loss": -42.939208984375, "global_step": 319214, "epoch": 2638} {"train_loss": -43.34123611450195, "global_step": 319215, "epoch": 2638} {"train_loss": -43.65543746948242, "global_step": 319216, "epoch": 2638} {"train_loss": -43.06991958618164, "global_step": 319217, "epoch": 2638} {"train_loss": -42.82830810546875, "global_step": 319218, "epoch": 2638} {"train_loss": -43.514766693115234, "global_step": 319219, "epoch": 2638} {"train_loss": -42.82001876831055, "global_step": 319220, "epoch": 2638} {"train_loss": -43.65890121459961, "global_step": 319221, "epoch": 2638} {"train_loss": -44.4417839050293, "global_step": 319222, "epoch": 2638} {"train_loss": -43.86167526245117, "global_step": 319223, "epoch": 2638} {"train_loss": -43.870147705078125, "global_step": 319224, "epoch": 2638} {"train_loss": -44.35944747924805, "global_step": 319225, "epoch": 2638} {"train_loss": -43.92671585083008, "global_step": 319226, "epoch": 2638} {"train_loss": -43.959327697753906, "global_step": 319227, "epoch": 2638} {"train_loss": -44.5016975402832, "global_step": 319228, "epoch": 2638} {"train_loss": -44.01485824584961, "global_step": 319229, "epoch": 2638} {"train_loss": -44.2510871887207, "global_step": 319230, "epoch": 2638} {"train_loss": -43.81513214111328, "global_step": 319231, "epoch": 2638} {"train_loss": -44.014617919921875, "global_step": 319232, "epoch": 2638} {"train_loss": -43.9356575012207, "global_step": 319233, "epoch": 2638} {"train_loss": -44.11482620239258, "global_step": 319234, "epoch": 2638} {"train_loss": -44.67314910888672, "global_step": 319235, "epoch": 2638} {"train_loss": -43.93453598022461, "global_step": 319236, "epoch": 2638} {"train_loss": -44.26567077636719, "global_step": 319237, "epoch": 2638} {"train_loss": -44.45283126831055, "global_step": 319238, "epoch": 2638} {"train_loss": -44.218990325927734, "global_step": 319239, "epoch": 2638} {"train_loss": -44.13894271850586, "global_step": 319240, "epoch": 2638} {"train_loss": -43.433345794677734, "global_step": 319241, "epoch": 2638} {"train_loss": -44.90229034423828, "global_step": 319242, "epoch": 2638} {"train_loss": -44.58295440673828, "global_step": 319243, "epoch": 2638} {"train_loss": -44.27133560180664, "global_step": 319244, "epoch": 2638} {"train_loss": -44.657920837402344, "global_step": 319245, "epoch": 2638} {"train_loss": -44.335296630859375, "global_step": 319246, "epoch": 2638} {"train_loss": -44.19480514526367, "global_step": 319247, "epoch": 2638} {"train_loss": -44.43119430541992, "global_step": 319248, "epoch": 2638} {"train_loss": -44.67122268676758, "global_step": 319249, "epoch": 2638} {"train_loss": -44.82344055175781, "global_step": 319250, "epoch": 2638} {"train_loss": -44.69732666015625, "global_step": 319251, "epoch": 2638} {"train_loss": -44.64175033569336, "global_step": 319252, "epoch": 2638} {"train_loss": -44.71440505981445, "global_step": 319253, "epoch": 2638} {"train_loss": -45.02658462524414, "global_step": 319254, "epoch": 2638} {"train_loss": -45.177982330322266, "global_step": 319255, "epoch": 2638} {"train_loss": -44.6085319519043, "global_step": 319256, "epoch": 2638} {"train_loss": -45.459228515625, "global_step": 319257, "epoch": 2638} {"train_loss": -45.30389404296875, "global_step": 319258, "epoch": 2638} {"train_loss": -44.9272575378418, "global_step": 319259, "epoch": 2638} {"train_loss": -45.256370544433594, "global_step": 319260, "epoch": 2638} {"train_loss": -44.26117706298828, "global_step": 319261, "epoch": 2638} {"train_loss": -45.03745651245117, "global_step": 319262, "epoch": 2638} {"train_loss": -44.856136322021484, "global_step": 319263, "epoch": 2638} {"train_loss": -44.915855407714844, "global_step": 319264, "epoch": 2638} {"train_loss": -45.253570556640625, "global_step": 319265, "epoch": 2638} {"train_loss": -45.45212936401367, "global_step": 319266, "epoch": 2638} {"train_loss": -44.905330657958984, "global_step": 319267, "epoch": 2638} {"train_loss": -45.1989631652832, "global_step": 319268, "epoch": 2638} {"train_loss": -45.300662994384766, "global_step": 319269, "epoch": 2638} {"train_loss": -44.73067855834961, "global_step": 319270, "epoch": 2638} {"train_loss": -45.2508659362793, "global_step": 319271, "epoch": 2638} {"train_loss": -45.39107894897461, "global_step": 319272, "epoch": 2638} {"train_loss": -45.39470291137695, "global_step": 319273, "epoch": 2638} {"train_loss": -45.73063278198242, "global_step": 319274, "epoch": 2638} {"train_loss": -44.84751510620117, "global_step": 319275, "epoch": 2638} {"train_loss": -44.783992767333984, "global_step": 319276, "epoch": 2638} {"train_loss": -45.357200622558594, "global_step": 319277, "epoch": 2638} {"train_loss": -45.58293914794922, "global_step": 319278, "epoch": 2638} {"train_loss": -44.6125602722168, "global_step": 319279, "epoch": 2638} {"train_loss": -44.6732063293457, "global_step": 319280, "epoch": 2638} {"train_loss": -45.42240524291992, "global_step": 319281, "epoch": 2638} {"train_loss": -44.5548210144043, "global_step": 319282, "epoch": 2638} {"train_loss": -44.93622970581055, "global_step": 319283, "epoch": 2638} {"train_loss": -45.31428909301758, "global_step": 319284, "epoch": 2638} {"train_loss": -44.872047424316406, "global_step": 319285, "epoch": 2638} {"train_loss": -42.99163055419922, "global_step": 319286, "epoch": 2638} {"train_loss": -41.447471618652344, "global_step": 319287, "epoch": 2638} {"train_loss": -38.69768142700195, "global_step": 319288, "epoch": 2638} {"train_loss": -43.53068923950195, "global_step": 319289, "epoch": 2638} {"train_loss": -30.409040451049805, "global_step": 319290, "epoch": 2638} {"train_loss": -11.29460334777832, "global_step": 319291, "epoch": 2638} {"train_loss": -30.679677963256836, "global_step": 319292, "epoch": 2638} {"train_loss": -34.22181701660156, "global_step": 319293, "epoch": 2638} {"train_loss": -19.209014892578125, "global_step": 319294, "epoch": 2638} {"train_loss": -24.17349624633789, "global_step": 319295, "epoch": 2638} {"train_loss": -29.26725196838379, "global_step": 319296, "epoch": 2638} {"train_loss": -36.222042083740234, "global_step": 319297, "epoch": 2638} {"train_loss": -33.76178741455078, "global_step": 319298, "epoch": 2638} {"train_loss": -37.457332611083984, "global_step": 319299, "epoch": 2638} {"train_loss": -36.268531799316406, "global_step": 319300, "epoch": 2638} {"train_loss": -36.5803337097168, "global_step": 319301, "epoch": 2638} {"train_loss": -38.77144241333008, "global_step": 319302, "epoch": 2638} {"train_loss": -38.448421478271484, "global_step": 319303, "epoch": 2638} {"train_loss": -38.00764846801758, "global_step": 319304, "epoch": 2638} {"train_loss": -39.830047607421875, "global_step": 319305, "epoch": 2638} {"train_loss": -38.63138961791992, "global_step": 319306, "epoch": 2638} {"train_loss": -38.893550872802734, "global_step": 319307, "epoch": 2638} {"train_loss": -40.6961784362793, "global_step": 319308, "epoch": 2638} {"train_loss": -40.77144241333008, "global_step": 319309, "epoch": 2638} {"train_loss": -40.13776397705078, "global_step": 319310, "epoch": 2638} {"train_loss": -40.810462951660156, "global_step": 319311, "epoch": 2638} {"train_loss": -41.51320266723633, "global_step": 319312, "epoch": 2638} {"train_loss": -41.2630500793457, "global_step": 319313, "epoch": 2638} {"train_loss": -42.16657257080078, "global_step": 319314, "epoch": 2638} {"train_loss": -42.031341552734375, "global_step": 319315, "epoch": 2638} {"train_loss": -42.24178695678711, "global_step": 319316, "epoch": 2638} {"train_loss": -41.1401481628418, "global_step": 319317, "epoch": 2638} {"train_loss": -42.224400134126014, "global_step": 319318, "epoch": 2638, "val_loss": 2645923.0} {"train_loss": -41.46730041503906, "global_step": 319319, "epoch": 2639} {"train_loss": -41.589866638183594, "global_step": 319320, "epoch": 2639} {"train_loss": -42.49819564819336, "global_step": 319321, "epoch": 2639} {"train_loss": -43.030372619628906, "global_step": 319322, "epoch": 2639} {"train_loss": -42.22488784790039, "global_step": 319323, "epoch": 2639} {"train_loss": -41.907344818115234, "global_step": 319324, "epoch": 2639} {"train_loss": -42.12519073486328, "global_step": 319325, "epoch": 2639} {"train_loss": -43.06782913208008, "global_step": 319326, "epoch": 2639} {"train_loss": -42.56817626953125, "global_step": 319327, "epoch": 2639} {"train_loss": -43.013755798339844, "global_step": 319328, "epoch": 2639} {"train_loss": -43.05526351928711, "global_step": 319329, "epoch": 2639} {"train_loss": -42.95053482055664, "global_step": 319330, "epoch": 2639} {"train_loss": -43.1655387878418, "global_step": 319331, "epoch": 2639} {"train_loss": -43.27000427246094, "global_step": 319332, "epoch": 2639} {"train_loss": -42.66577911376953, "global_step": 319333, "epoch": 2639} {"train_loss": -43.33308029174805, "global_step": 319334, "epoch": 2639} {"train_loss": -42.959014892578125, "global_step": 319335, "epoch": 2639} {"train_loss": -43.64936447143555, "global_step": 319336, "epoch": 2639} {"train_loss": -42.912506103515625, "global_step": 319337, "epoch": 2639} {"train_loss": -42.98892593383789, "global_step": 319338, "epoch": 2639} {"train_loss": -43.733360290527344, "global_step": 319339, "epoch": 2639} {"train_loss": -43.4416618347168, "global_step": 319340, "epoch": 2639} {"train_loss": -42.93099594116211, "global_step": 319341, "epoch": 2639} {"train_loss": -43.928340911865234, "global_step": 319342, "epoch": 2639} {"train_loss": -43.918243408203125, "global_step": 319343, "epoch": 2639} {"train_loss": -43.36117172241211, "global_step": 319344, "epoch": 2639} {"train_loss": -43.5903205871582, "global_step": 319345, "epoch": 2639} {"train_loss": -43.77973556518555, "global_step": 319346, "epoch": 2639} {"train_loss": -43.961524963378906, "global_step": 319347, "epoch": 2639} {"train_loss": -43.69148635864258, "global_step": 319348, "epoch": 2639} {"train_loss": -43.57965087890625, "global_step": 319349, "epoch": 2639} {"train_loss": -43.947265625, "global_step": 319350, "epoch": 2639} {"train_loss": -44.06851577758789, "global_step": 319351, "epoch": 2639} {"train_loss": -44.53725051879883, "global_step": 319352, "epoch": 2639} {"train_loss": -44.37995529174805, "global_step": 319353, "epoch": 2639} {"train_loss": -44.08504104614258, "global_step": 319354, "epoch": 2639} {"train_loss": -43.972225189208984, "global_step": 319355, "epoch": 2639} {"train_loss": -44.000606536865234, "global_step": 319356, "epoch": 2639} {"train_loss": -44.72890853881836, "global_step": 319357, "epoch": 2639} {"train_loss": -43.808895111083984, "global_step": 319358, "epoch": 2639} {"train_loss": -44.400856018066406, "global_step": 319359, "epoch": 2639} {"train_loss": -44.736637115478516, "global_step": 319360, "epoch": 2639} {"train_loss": -44.69059371948242, "global_step": 319361, "epoch": 2639} {"train_loss": -44.70334243774414, "global_step": 319362, "epoch": 2639} {"train_loss": -44.535736083984375, "global_step": 319363, "epoch": 2639} {"train_loss": -44.25246047973633, "global_step": 319364, "epoch": 2639} {"train_loss": -44.69297409057617, "global_step": 319365, "epoch": 2639} {"train_loss": -44.287357330322266, "global_step": 319366, "epoch": 2639} {"train_loss": -44.41823959350586, "global_step": 319367, "epoch": 2639} {"train_loss": -44.72990036010742, "global_step": 319368, "epoch": 2639} {"train_loss": -44.7225456237793, "global_step": 319369, "epoch": 2639} {"train_loss": -44.70920181274414, "global_step": 319370, "epoch": 2639} {"train_loss": -44.11625289916992, "global_step": 319371, "epoch": 2639} {"train_loss": -45.02260208129883, "global_step": 319372, "epoch": 2639} {"train_loss": -44.87860107421875, "global_step": 319373, "epoch": 2639} {"train_loss": -45.02129364013672, "global_step": 319374, "epoch": 2639} {"train_loss": -44.415035247802734, "global_step": 319375, "epoch": 2639} {"train_loss": -44.60902786254883, "global_step": 319376, "epoch": 2639} {"train_loss": -45.07322311401367, "global_step": 319377, "epoch": 2639} {"train_loss": -45.048362731933594, "global_step": 319378, "epoch": 2639} {"train_loss": -45.07745361328125, "global_step": 319379, "epoch": 2639} {"train_loss": -44.76892852783203, "global_step": 319380, "epoch": 2639} {"train_loss": -45.02840042114258, "global_step": 319381, "epoch": 2639} {"train_loss": -44.73870849609375, "global_step": 319382, "epoch": 2639} {"train_loss": -44.692317962646484, "global_step": 319383, "epoch": 2639} {"train_loss": -45.15803909301758, "global_step": 319384, "epoch": 2639} {"train_loss": -44.152278900146484, "global_step": 319385, "epoch": 2639} {"train_loss": -45.16592025756836, "global_step": 319386, "epoch": 2639} {"train_loss": -44.54465866088867, "global_step": 319387, "epoch": 2639} {"train_loss": -44.8265266418457, "global_step": 319388, "epoch": 2639} {"train_loss": -44.25473403930664, "global_step": 319389, "epoch": 2639} {"train_loss": -45.250789642333984, "global_step": 319390, "epoch": 2639} {"train_loss": -44.463130950927734, "global_step": 319391, "epoch": 2639} {"train_loss": -44.3649787902832, "global_step": 319392, "epoch": 2639} {"train_loss": -44.43977737426758, "global_step": 319393, "epoch": 2639} {"train_loss": -44.257564544677734, "global_step": 319394, "epoch": 2639} {"train_loss": -45.354827880859375, "global_step": 319395, "epoch": 2639} {"train_loss": -44.674983978271484, "global_step": 319396, "epoch": 2639} {"train_loss": -44.64981460571289, "global_step": 319397, "epoch": 2639} {"train_loss": -45.111549377441406, "global_step": 319398, "epoch": 2639} {"train_loss": -44.78165817260742, "global_step": 319399, "epoch": 2639} {"train_loss": -44.364620208740234, "global_step": 319400, "epoch": 2639} {"train_loss": -45.6137809753418, "global_step": 319401, "epoch": 2639} {"train_loss": -45.25935745239258, "global_step": 319402, "epoch": 2639} {"train_loss": -44.83893966674805, "global_step": 319403, "epoch": 2639} {"train_loss": -44.74480056762695, "global_step": 319404, "epoch": 2639} {"train_loss": -45.11017990112305, "global_step": 319405, "epoch": 2639} {"train_loss": -44.663795471191406, "global_step": 319406, "epoch": 2639} {"train_loss": -44.78656005859375, "global_step": 319407, "epoch": 2639} {"train_loss": -45.10787582397461, "global_step": 319408, "epoch": 2639} {"train_loss": -44.504093170166016, "global_step": 319409, "epoch": 2639} {"train_loss": -44.5787353515625, "global_step": 319410, "epoch": 2639} {"train_loss": -45.24053955078125, "global_step": 319411, "epoch": 2639} {"train_loss": -44.76171875, "global_step": 319412, "epoch": 2639} {"train_loss": -45.200592041015625, "global_step": 319413, "epoch": 2639} {"train_loss": -45.17255783081055, "global_step": 319414, "epoch": 2639} {"train_loss": -44.838741302490234, "global_step": 319415, "epoch": 2639} {"train_loss": -44.78466796875, "global_step": 319416, "epoch": 2639} {"train_loss": -44.706905364990234, "global_step": 319417, "epoch": 2639} {"train_loss": -44.70967102050781, "global_step": 319418, "epoch": 2639} {"train_loss": -44.95208740234375, "global_step": 319419, "epoch": 2639} {"train_loss": -45.175811767578125, "global_step": 319420, "epoch": 2639} {"train_loss": -44.80705642700195, "global_step": 319421, "epoch": 2639} {"train_loss": -44.78062057495117, "global_step": 319422, "epoch": 2639} {"train_loss": -44.900978088378906, "global_step": 319423, "epoch": 2639} {"train_loss": -44.51899337768555, "global_step": 319424, "epoch": 2639} {"train_loss": -44.88987731933594, "global_step": 319425, "epoch": 2639} {"train_loss": -45.19350814819336, "global_step": 319426, "epoch": 2639} {"train_loss": -45.07586669921875, "global_step": 319427, "epoch": 2639} {"train_loss": -45.0543098449707, "global_step": 319428, "epoch": 2639} {"train_loss": -45.313106536865234, "global_step": 319429, "epoch": 2639} {"train_loss": -44.24911117553711, "global_step": 319430, "epoch": 2639} {"train_loss": -42.0221061706543, "global_step": 319431, "epoch": 2639} {"train_loss": -38.88257598876953, "global_step": 319432, "epoch": 2639} {"train_loss": -37.050350189208984, "global_step": 319433, "epoch": 2639} {"train_loss": -35.686527252197266, "global_step": 319434, "epoch": 2639} {"train_loss": -38.38201904296875, "global_step": 319435, "epoch": 2639} {"train_loss": -42.56853103637695, "global_step": 319436, "epoch": 2639} {"train_loss": -42.016822814941406, "global_step": 319437, "epoch": 2639} {"train_loss": -40.57223892211914, "global_step": 319438, "epoch": 2639} {"train_loss": -43.94442436911843, "global_step": 319439, "epoch": 2639, "val_loss": 2710467.5} {"train_loss": -41.273902893066406, "global_step": 319440, "epoch": 2640} {"train_loss": -41.728271484375, "global_step": 319441, "epoch": 2640} {"train_loss": -42.86650466918945, "global_step": 319442, "epoch": 2640} {"train_loss": -40.95614242553711, "global_step": 319443, "epoch": 2640} {"train_loss": -42.64559555053711, "global_step": 319444, "epoch": 2640} {"train_loss": -41.996124267578125, "global_step": 319445, "epoch": 2640} {"train_loss": -41.9920654296875, "global_step": 319446, "epoch": 2640} {"train_loss": -42.24641036987305, "global_step": 319447, "epoch": 2640} {"train_loss": -42.337867736816406, "global_step": 319448, "epoch": 2640} {"train_loss": -42.59439468383789, "global_step": 319449, "epoch": 2640} {"train_loss": -42.25584030151367, "global_step": 319450, "epoch": 2640} {"train_loss": -41.92805480957031, "global_step": 319451, "epoch": 2640} {"train_loss": -41.86933135986328, "global_step": 319452, "epoch": 2640} {"train_loss": -42.823368072509766, "global_step": 319453, "epoch": 2640} {"train_loss": -41.996883392333984, "global_step": 319454, "epoch": 2640} {"train_loss": -43.20307159423828, "global_step": 319455, "epoch": 2640} {"train_loss": -42.43473434448242, "global_step": 319456, "epoch": 2640} {"train_loss": -43.54304885864258, "global_step": 319457, "epoch": 2640} {"train_loss": -43.16159439086914, "global_step": 319458, "epoch": 2640} {"train_loss": -43.3121452331543, "global_step": 319459, "epoch": 2640} {"train_loss": -43.43424606323242, "global_step": 319460, "epoch": 2640} {"train_loss": -43.99436569213867, "global_step": 319461, "epoch": 2640} {"train_loss": -43.311737060546875, "global_step": 319462, "epoch": 2640} {"train_loss": -43.39370346069336, "global_step": 319463, "epoch": 2640} {"train_loss": -43.45967483520508, "global_step": 319464, "epoch": 2640} {"train_loss": -43.5158576965332, "global_step": 319465, "epoch": 2640} {"train_loss": -44.36419677734375, "global_step": 319466, "epoch": 2640} {"train_loss": -43.47930908203125, "global_step": 319467, "epoch": 2640} {"train_loss": -43.52216339111328, "global_step": 319468, "epoch": 2640} {"train_loss": -43.72808837890625, "global_step": 319469, "epoch": 2640} {"train_loss": -43.33918380737305, "global_step": 319470, "epoch": 2640} {"train_loss": -43.551815032958984, "global_step": 319471, "epoch": 2640} {"train_loss": -43.304222106933594, "global_step": 319472, "epoch": 2640} {"train_loss": -43.75986099243164, "global_step": 319473, "epoch": 2640} {"train_loss": -44.173614501953125, "global_step": 319474, "epoch": 2640} {"train_loss": -44.0228385925293, "global_step": 319475, "epoch": 2640} {"train_loss": -43.486576080322266, "global_step": 319476, "epoch": 2640} {"train_loss": -43.95664978027344, "global_step": 319477, "epoch": 2640} {"train_loss": -44.40070724487305, "global_step": 319478, "epoch": 2640} {"train_loss": -44.4777717590332, "global_step": 319479, "epoch": 2640} {"train_loss": -44.25620651245117, "global_step": 319480, "epoch": 2640} {"train_loss": -44.45786666870117, "global_step": 319481, "epoch": 2640} {"train_loss": -44.22003173828125, "global_step": 319482, "epoch": 2640} {"train_loss": -44.49851608276367, "global_step": 319483, "epoch": 2640} {"train_loss": -44.326881408691406, "global_step": 319484, "epoch": 2640} {"train_loss": -44.63637161254883, "global_step": 319485, "epoch": 2640} {"train_loss": -44.35952377319336, "global_step": 319486, "epoch": 2640} {"train_loss": -44.232887268066406, "global_step": 319487, "epoch": 2640} {"train_loss": -44.55564498901367, "global_step": 319488, "epoch": 2640} {"train_loss": -44.47831726074219, "global_step": 319489, "epoch": 2640} {"train_loss": -43.96881866455078, "global_step": 319490, "epoch": 2640} {"train_loss": -43.98190689086914, "global_step": 319491, "epoch": 2640} {"train_loss": -44.223628997802734, "global_step": 319492, "epoch": 2640} {"train_loss": -43.99822998046875, "global_step": 319493, "epoch": 2640} {"train_loss": -45.29720687866211, "global_step": 319494, "epoch": 2640} {"train_loss": -44.801063537597656, "global_step": 319495, "epoch": 2640} {"train_loss": -44.44186019897461, "global_step": 319496, "epoch": 2640} {"train_loss": -44.44509506225586, "global_step": 319497, "epoch": 2640} {"train_loss": -44.78596496582031, "global_step": 319498, "epoch": 2640} {"train_loss": -44.70561599731445, "global_step": 319499, "epoch": 2640} {"train_loss": -44.1944465637207, "global_step": 319500, "epoch": 2640} {"train_loss": -44.86470413208008, "global_step": 319501, "epoch": 2640} {"train_loss": -44.635704040527344, "global_step": 319502, "epoch": 2640} {"train_loss": -44.87614822387695, "global_step": 319503, "epoch": 2640} {"train_loss": -44.378501892089844, "global_step": 319504, "epoch": 2640} {"train_loss": -44.4229850769043, "global_step": 319505, "epoch": 2640} {"train_loss": -44.94314193725586, "global_step": 319506, "epoch": 2640} {"train_loss": -44.60744094848633, "global_step": 319507, "epoch": 2640} {"train_loss": -44.71749496459961, "global_step": 319508, "epoch": 2640} {"train_loss": -44.53120040893555, "global_step": 319509, "epoch": 2640} {"train_loss": -44.8093147277832, "global_step": 319510, "epoch": 2640} {"train_loss": -44.272308349609375, "global_step": 319511, "epoch": 2640} {"train_loss": -44.53656005859375, "global_step": 319512, "epoch": 2640} {"train_loss": -45.39606475830078, "global_step": 319513, "epoch": 2640} {"train_loss": -44.93815231323242, "global_step": 319514, "epoch": 2640} {"train_loss": -44.658443450927734, "global_step": 319515, "epoch": 2640} {"train_loss": -44.96439743041992, "global_step": 319516, "epoch": 2640} {"train_loss": -45.16022491455078, "global_step": 319517, "epoch": 2640} {"train_loss": -45.134300231933594, "global_step": 319518, "epoch": 2640} {"train_loss": -44.883575439453125, "global_step": 319519, "epoch": 2640} {"train_loss": -45.08576583862305, "global_step": 319520, "epoch": 2640} {"train_loss": -44.97664260864258, "global_step": 319521, "epoch": 2640} {"train_loss": -45.064083099365234, "global_step": 319522, "epoch": 2640} {"train_loss": -44.912681579589844, "global_step": 319523, "epoch": 2640} {"train_loss": -45.1634635925293, "global_step": 319524, "epoch": 2640} {"train_loss": -45.515472412109375, "global_step": 319525, "epoch": 2640} {"train_loss": -45.410858154296875, "global_step": 319526, "epoch": 2640} {"train_loss": -45.14290237426758, "global_step": 319527, "epoch": 2640} {"train_loss": -44.90946960449219, "global_step": 319528, "epoch": 2640} {"train_loss": -45.18470764160156, "global_step": 319529, "epoch": 2640} {"train_loss": -44.80929183959961, "global_step": 319530, "epoch": 2640} {"train_loss": -45.14652633666992, "global_step": 319531, "epoch": 2640} {"train_loss": -45.047672271728516, "global_step": 319532, "epoch": 2640} {"train_loss": -44.8673095703125, "global_step": 319533, "epoch": 2640} {"train_loss": -44.4976921081543, "global_step": 319534, "epoch": 2640} {"train_loss": -43.16646194458008, "global_step": 319535, "epoch": 2640} {"train_loss": -42.875526428222656, "global_step": 319536, "epoch": 2640} {"train_loss": -43.45809555053711, "global_step": 319537, "epoch": 2640} {"train_loss": -44.814125061035156, "global_step": 319538, "epoch": 2640} {"train_loss": -45.20927047729492, "global_step": 319539, "epoch": 2640} {"train_loss": -44.96157455444336, "global_step": 319540, "epoch": 2640} {"train_loss": -42.679969787597656, "global_step": 319541, "epoch": 2640} {"train_loss": -39.031795501708984, "global_step": 319542, "epoch": 2640} {"train_loss": -40.68106460571289, "global_step": 319543, "epoch": 2640} {"train_loss": -41.65078353881836, "global_step": 319544, "epoch": 2640} {"train_loss": -44.140724182128906, "global_step": 319545, "epoch": 2640} {"train_loss": -44.326107025146484, "global_step": 319546, "epoch": 2640} {"train_loss": -44.287353515625, "global_step": 319547, "epoch": 2640} {"train_loss": -43.64384841918945, "global_step": 319548, "epoch": 2640} {"train_loss": -43.9809684753418, "global_step": 319549, "epoch": 2640} {"train_loss": -42.38228988647461, "global_step": 319550, "epoch": 2640} {"train_loss": -43.52613067626953, "global_step": 319551, "epoch": 2640} {"train_loss": -39.87728500366211, "global_step": 319552, "epoch": 2640} {"train_loss": -39.742794036865234, "global_step": 319553, "epoch": 2640} {"train_loss": -44.30940246582031, "global_step": 319554, "epoch": 2640} {"train_loss": -41.55868148803711, "global_step": 319555, "epoch": 2640} {"train_loss": -41.00705337524414, "global_step": 319556, "epoch": 2640} {"train_loss": -44.16352462768555, "global_step": 319557, "epoch": 2640} {"train_loss": -39.7684211730957, "global_step": 319558, "epoch": 2640} {"train_loss": -41.244781494140625, "global_step": 319559, "epoch": 2640} {"train_loss": -43.707625775297814, "global_step": 319560, "epoch": 2640, "val_loss": 2627787.75} {"train_loss": -40.239105224609375, "global_step": 319561, "epoch": 2641} {"train_loss": -43.478858947753906, "global_step": 319562, "epoch": 2641} {"train_loss": -41.82537841796875, "global_step": 319563, "epoch": 2641} {"train_loss": -43.04458236694336, "global_step": 319564, "epoch": 2641} {"train_loss": -41.00832748413086, "global_step": 319565, "epoch": 2641} {"train_loss": -42.37494659423828, "global_step": 319566, "epoch": 2641} {"train_loss": -42.07217025756836, "global_step": 319567, "epoch": 2641} {"train_loss": -43.67765426635742, "global_step": 319568, "epoch": 2641} {"train_loss": -43.22171401977539, "global_step": 319569, "epoch": 2641} {"train_loss": -43.108516693115234, "global_step": 319570, "epoch": 2641} {"train_loss": -42.94818115234375, "global_step": 319571, "epoch": 2641} {"train_loss": -42.2868766784668, "global_step": 319572, "epoch": 2641} {"train_loss": -42.90606689453125, "global_step": 319573, "epoch": 2641} {"train_loss": -42.79996871948242, "global_step": 319574, "epoch": 2641} {"train_loss": -42.979164123535156, "global_step": 319575, "epoch": 2641} {"train_loss": -42.75834274291992, "global_step": 319576, "epoch": 2641} {"train_loss": -43.81336212158203, "global_step": 319577, "epoch": 2641} {"train_loss": -42.71489715576172, "global_step": 319578, "epoch": 2641} {"train_loss": -43.3995246887207, "global_step": 319579, "epoch": 2641} {"train_loss": -43.11750411987305, "global_step": 319580, "epoch": 2641} {"train_loss": -43.62362289428711, "global_step": 319581, "epoch": 2641} {"train_loss": -43.018035888671875, "global_step": 319582, "epoch": 2641} {"train_loss": -43.73594284057617, "global_step": 319583, "epoch": 2641} {"train_loss": -43.690616607666016, "global_step": 319584, "epoch": 2641} {"train_loss": -43.48531723022461, "global_step": 319585, "epoch": 2641} {"train_loss": -43.897369384765625, "global_step": 319586, "epoch": 2641} {"train_loss": -42.94443893432617, "global_step": 319587, "epoch": 2641} {"train_loss": -44.14751434326172, "global_step": 319588, "epoch": 2641} {"train_loss": -42.74497604370117, "global_step": 319589, "epoch": 2641} {"train_loss": -44.05717849731445, "global_step": 319590, "epoch": 2641} {"train_loss": -43.927425384521484, "global_step": 319591, "epoch": 2641} {"train_loss": -44.27605056762695, "global_step": 319592, "epoch": 2641} {"train_loss": -44.31128692626953, "global_step": 319593, "epoch": 2641} {"train_loss": -43.926204681396484, "global_step": 319594, "epoch": 2641} {"train_loss": -44.2078857421875, "global_step": 319595, "epoch": 2641} {"train_loss": -43.82291030883789, "global_step": 319596, "epoch": 2641} {"train_loss": -43.290565490722656, "global_step": 319597, "epoch": 2641} {"train_loss": -43.70524978637695, "global_step": 319598, "epoch": 2641} {"train_loss": -44.33816146850586, "global_step": 319599, "epoch": 2641} {"train_loss": -43.910057067871094, "global_step": 319600, "epoch": 2641} {"train_loss": -43.41931915283203, "global_step": 319601, "epoch": 2641} {"train_loss": -44.533172607421875, "global_step": 319602, "epoch": 2641} {"train_loss": -44.487823486328125, "global_step": 319603, "epoch": 2641} {"train_loss": -43.13821029663086, "global_step": 319604, "epoch": 2641} {"train_loss": -42.18223190307617, "global_step": 319605, "epoch": 2641} {"train_loss": -44.13441848754883, "global_step": 319606, "epoch": 2641} {"train_loss": -44.383174896240234, "global_step": 319607, "epoch": 2641} {"train_loss": -44.5002555847168, "global_step": 319608, "epoch": 2641} {"train_loss": -43.45328140258789, "global_step": 319609, "epoch": 2641} {"train_loss": -44.28634262084961, "global_step": 319610, "epoch": 2641} {"train_loss": -44.97212219238281, "global_step": 319611, "epoch": 2641} {"train_loss": -44.06367111206055, "global_step": 319612, "epoch": 2641} {"train_loss": -43.5727424621582, "global_step": 319613, "epoch": 2641} {"train_loss": -44.28731155395508, "global_step": 319614, "epoch": 2641} {"train_loss": -45.27039337158203, "global_step": 319615, "epoch": 2641} {"train_loss": -44.1177864074707, "global_step": 319616, "epoch": 2641} {"train_loss": -43.76998519897461, "global_step": 319617, "epoch": 2641} {"train_loss": -44.691768646240234, "global_step": 319618, "epoch": 2641} {"train_loss": -43.65686798095703, "global_step": 319619, "epoch": 2641} {"train_loss": -43.85920715332031, "global_step": 319620, "epoch": 2641} {"train_loss": -43.80751419067383, "global_step": 319621, "epoch": 2641} {"train_loss": -45.204994201660156, "global_step": 319622, "epoch": 2641} {"train_loss": -44.103309631347656, "global_step": 319623, "epoch": 2641} {"train_loss": -44.07172775268555, "global_step": 319624, "epoch": 2641} {"train_loss": -44.90192413330078, "global_step": 319625, "epoch": 2641} {"train_loss": -43.53167724609375, "global_step": 319626, "epoch": 2641} {"train_loss": -44.19965362548828, "global_step": 319627, "epoch": 2641} {"train_loss": -44.85512161254883, "global_step": 319628, "epoch": 2641} {"train_loss": -44.17952346801758, "global_step": 319629, "epoch": 2641} {"train_loss": -43.76643753051758, "global_step": 319630, "epoch": 2641} {"train_loss": -44.438934326171875, "global_step": 319631, "epoch": 2641} {"train_loss": -44.672935485839844, "global_step": 319632, "epoch": 2641} {"train_loss": -43.241207122802734, "global_step": 319633, "epoch": 2641} {"train_loss": -44.48777389526367, "global_step": 319634, "epoch": 2641} {"train_loss": -45.186317443847656, "global_step": 319635, "epoch": 2641} {"train_loss": -43.07441329956055, "global_step": 319636, "epoch": 2641} {"train_loss": -44.27280807495117, "global_step": 319637, "epoch": 2641} {"train_loss": -44.947139739990234, "global_step": 319638, "epoch": 2641} {"train_loss": -43.276123046875, "global_step": 319639, "epoch": 2641} {"train_loss": -44.37116622924805, "global_step": 319640, "epoch": 2641} {"train_loss": -45.1500358581543, "global_step": 319641, "epoch": 2641} {"train_loss": -43.209659576416016, "global_step": 319642, "epoch": 2641} {"train_loss": -42.925636291503906, "global_step": 319643, "epoch": 2641} {"train_loss": -45.12970733642578, "global_step": 319644, "epoch": 2641} {"train_loss": -43.89691162109375, "global_step": 319645, "epoch": 2641} {"train_loss": -43.45475387573242, "global_step": 319646, "epoch": 2641} {"train_loss": -44.52542495727539, "global_step": 319647, "epoch": 2641} {"train_loss": -44.17890167236328, "global_step": 319648, "epoch": 2641} {"train_loss": -43.584808349609375, "global_step": 319649, "epoch": 2641} {"train_loss": -44.95954132080078, "global_step": 319650, "epoch": 2641} {"train_loss": -44.01125717163086, "global_step": 319651, "epoch": 2641} {"train_loss": -44.32108688354492, "global_step": 319652, "epoch": 2641} {"train_loss": -43.91852569580078, "global_step": 319653, "epoch": 2641} {"train_loss": -43.79133224487305, "global_step": 319654, "epoch": 2641} {"train_loss": -43.95722961425781, "global_step": 319655, "epoch": 2641} {"train_loss": -44.774288177490234, "global_step": 319656, "epoch": 2641} {"train_loss": -44.00520706176758, "global_step": 319657, "epoch": 2641} {"train_loss": -43.56667709350586, "global_step": 319658, "epoch": 2641} {"train_loss": -44.25271987915039, "global_step": 319659, "epoch": 2641} {"train_loss": -44.419189453125, "global_step": 319660, "epoch": 2641} {"train_loss": -44.30085372924805, "global_step": 319661, "epoch": 2641} {"train_loss": -44.13928985595703, "global_step": 319662, "epoch": 2641} {"train_loss": -45.2850341796875, "global_step": 319663, "epoch": 2641} {"train_loss": -43.61659622192383, "global_step": 319664, "epoch": 2641} {"train_loss": -44.669166564941406, "global_step": 319665, "epoch": 2641} {"train_loss": -44.87093734741211, "global_step": 319666, "epoch": 2641} {"train_loss": -45.1765251159668, "global_step": 319667, "epoch": 2641} {"train_loss": -45.05778884887695, "global_step": 319668, "epoch": 2641} {"train_loss": -44.923072814941406, "global_step": 319669, "epoch": 2641} {"train_loss": -45.05649185180664, "global_step": 319670, "epoch": 2641} {"train_loss": -44.32403564453125, "global_step": 319671, "epoch": 2641} {"train_loss": -44.60028076171875, "global_step": 319672, "epoch": 2641} {"train_loss": -44.720272064208984, "global_step": 319673, "epoch": 2641} {"train_loss": -44.60848617553711, "global_step": 319674, "epoch": 2641} {"train_loss": -44.611480712890625, "global_step": 319675, "epoch": 2641} {"train_loss": -44.780479431152344, "global_step": 319676, "epoch": 2641} {"train_loss": -43.389827728271484, "global_step": 319677, "epoch": 2641} {"train_loss": -44.8794059753418, "global_step": 319678, "epoch": 2641} {"train_loss": -44.17236328125, "global_step": 319679, "epoch": 2641} {"train_loss": -43.11048126220703, "global_step": 319680, "epoch": 2641} {"train_loss": -43.88916157493907, "global_step": 319681, "epoch": 2641, "val_loss": 2600973.5} {"train_loss": -45.193695068359375, "global_step": 319682, "epoch": 2642} {"train_loss": -43.22201156616211, "global_step": 319683, "epoch": 2642} {"train_loss": -43.243526458740234, "global_step": 319684, "epoch": 2642} {"train_loss": -44.59176254272461, "global_step": 319685, "epoch": 2642} {"train_loss": -44.25844955444336, "global_step": 319686, "epoch": 2642} {"train_loss": -44.048309326171875, "global_step": 319687, "epoch": 2642} {"train_loss": -44.93752670288086, "global_step": 319688, "epoch": 2642} {"train_loss": -43.96689987182617, "global_step": 319689, "epoch": 2642} {"train_loss": -44.60762405395508, "global_step": 319690, "epoch": 2642} {"train_loss": -44.50007247924805, "global_step": 319691, "epoch": 2642} {"train_loss": -43.68394088745117, "global_step": 319692, "epoch": 2642} {"train_loss": -43.4511604309082, "global_step": 319693, "epoch": 2642} {"train_loss": -44.768184661865234, "global_step": 319694, "epoch": 2642} {"train_loss": -44.10203552246094, "global_step": 319695, "epoch": 2642} {"train_loss": -44.050289154052734, "global_step": 319696, "epoch": 2642} {"train_loss": -44.261409759521484, "global_step": 319697, "epoch": 2642} {"train_loss": -44.525508880615234, "global_step": 319698, "epoch": 2642} {"train_loss": -44.4471549987793, "global_step": 319699, "epoch": 2642} {"train_loss": -44.9679069519043, "global_step": 319700, "epoch": 2642} {"train_loss": -44.232975006103516, "global_step": 319701, "epoch": 2642} {"train_loss": -45.165218353271484, "global_step": 319702, "epoch": 2642} {"train_loss": -44.5438232421875, "global_step": 319703, "epoch": 2642} {"train_loss": -43.896175384521484, "global_step": 319704, "epoch": 2642} {"train_loss": -44.006568908691406, "global_step": 319705, "epoch": 2642} {"train_loss": -44.97193145751953, "global_step": 319706, "epoch": 2642} {"train_loss": -43.966548919677734, "global_step": 319707, "epoch": 2642} {"train_loss": -44.52778244018555, "global_step": 319708, "epoch": 2642} {"train_loss": -44.8270149230957, "global_step": 319709, "epoch": 2642} {"train_loss": -43.90838623046875, "global_step": 319710, "epoch": 2642} {"train_loss": -44.78244400024414, "global_step": 319711, "epoch": 2642} {"train_loss": -44.66498947143555, "global_step": 319712, "epoch": 2642} {"train_loss": -43.66688537597656, "global_step": 319713, "epoch": 2642} {"train_loss": -44.199668884277344, "global_step": 319714, "epoch": 2642} {"train_loss": -43.53689193725586, "global_step": 319715, "epoch": 2642} {"train_loss": -43.21065902709961, "global_step": 319716, "epoch": 2642} {"train_loss": -43.92109680175781, "global_step": 319717, "epoch": 2642} {"train_loss": -43.932464599609375, "global_step": 319718, "epoch": 2642} {"train_loss": -43.55132293701172, "global_step": 319719, "epoch": 2642} {"train_loss": -43.394775390625, "global_step": 319720, "epoch": 2642} {"train_loss": -44.204158782958984, "global_step": 319721, "epoch": 2642} {"train_loss": -40.67823028564453, "global_step": 319722, "epoch": 2642} {"train_loss": -39.56064987182617, "global_step": 319723, "epoch": 2642} {"train_loss": -42.29270935058594, "global_step": 319724, "epoch": 2642} {"train_loss": -43.14090347290039, "global_step": 319725, "epoch": 2642} {"train_loss": -38.314735412597656, "global_step": 319726, "epoch": 2642} {"train_loss": -43.785640716552734, "global_step": 319727, "epoch": 2642} {"train_loss": -36.39967346191406, "global_step": 319728, "epoch": 2642} {"train_loss": -42.21254348754883, "global_step": 319729, "epoch": 2642} {"train_loss": -38.822261810302734, "global_step": 319730, "epoch": 2642} {"train_loss": -42.88795852661133, "global_step": 319731, "epoch": 2642} {"train_loss": -40.227783203125, "global_step": 319732, "epoch": 2642} {"train_loss": -42.725547790527344, "global_step": 319733, "epoch": 2642} {"train_loss": -41.95166778564453, "global_step": 319734, "epoch": 2642} {"train_loss": -41.301082611083984, "global_step": 319735, "epoch": 2642} {"train_loss": -42.6909065246582, "global_step": 319736, "epoch": 2642} {"train_loss": -41.427467346191406, "global_step": 319737, "epoch": 2642} {"train_loss": -40.36625289916992, "global_step": 319738, "epoch": 2642} {"train_loss": -42.192657470703125, "global_step": 319739, "epoch": 2642} {"train_loss": -41.23440170288086, "global_step": 319740, "epoch": 2642} {"train_loss": -43.100555419921875, "global_step": 319741, "epoch": 2642} {"train_loss": -40.12653732299805, "global_step": 319742, "epoch": 2642} {"train_loss": -42.63430404663086, "global_step": 319743, "epoch": 2642} {"train_loss": -43.452980041503906, "global_step": 319744, "epoch": 2642} {"train_loss": -42.096412658691406, "global_step": 319745, "epoch": 2642} {"train_loss": -43.12369918823242, "global_step": 319746, "epoch": 2642} {"train_loss": -43.473628997802734, "global_step": 319747, "epoch": 2642} {"train_loss": -42.616390228271484, "global_step": 319748, "epoch": 2642} {"train_loss": -44.141029357910156, "global_step": 319749, "epoch": 2642} {"train_loss": -42.74849319458008, "global_step": 319750, "epoch": 2642} {"train_loss": -44.27323913574219, "global_step": 319751, "epoch": 2642} {"train_loss": -42.80487823486328, "global_step": 319752, "epoch": 2642} {"train_loss": -43.79488754272461, "global_step": 319753, "epoch": 2642} {"train_loss": -42.55011749267578, "global_step": 319754, "epoch": 2642} {"train_loss": -42.52125930786133, "global_step": 319755, "epoch": 2642} {"train_loss": -43.76546859741211, "global_step": 319756, "epoch": 2642} {"train_loss": -43.66478729248047, "global_step": 319757, "epoch": 2642} {"train_loss": -43.20956802368164, "global_step": 319758, "epoch": 2642} {"train_loss": -43.40456008911133, "global_step": 319759, "epoch": 2642} {"train_loss": -43.92604446411133, "global_step": 319760, "epoch": 2642} {"train_loss": -44.05656814575195, "global_step": 319761, "epoch": 2642} {"train_loss": -42.87501525878906, "global_step": 319762, "epoch": 2642} {"train_loss": -44.09960174560547, "global_step": 319763, "epoch": 2642} {"train_loss": -43.898345947265625, "global_step": 319764, "epoch": 2642} {"train_loss": -44.35065460205078, "global_step": 319765, "epoch": 2642} {"train_loss": -43.73019027709961, "global_step": 319766, "epoch": 2642} {"train_loss": -43.9689826965332, "global_step": 319767, "epoch": 2642} {"train_loss": -44.15739059448242, "global_step": 319768, "epoch": 2642} {"train_loss": -43.98468017578125, "global_step": 319769, "epoch": 2642} {"train_loss": -44.360633850097656, "global_step": 319770, "epoch": 2642} {"train_loss": -44.067481994628906, "global_step": 319771, "epoch": 2642} {"train_loss": -43.95787811279297, "global_step": 319772, "epoch": 2642} {"train_loss": -44.363502502441406, "global_step": 319773, "epoch": 2642} {"train_loss": -44.10334396362305, "global_step": 319774, "epoch": 2642} {"train_loss": -44.48381042480469, "global_step": 319775, "epoch": 2642} {"train_loss": -43.745216369628906, "global_step": 319776, "epoch": 2642} {"train_loss": -44.530029296875, "global_step": 319777, "epoch": 2642} {"train_loss": -43.943511962890625, "global_step": 319778, "epoch": 2642} {"train_loss": -44.76673126220703, "global_step": 319779, "epoch": 2642} {"train_loss": -44.63289260864258, "global_step": 319780, "epoch": 2642} {"train_loss": -43.42452621459961, "global_step": 319781, "epoch": 2642} {"train_loss": -44.74250411987305, "global_step": 319782, "epoch": 2642} {"train_loss": -43.660953521728516, "global_step": 319783, "epoch": 2642} {"train_loss": -44.15986251831055, "global_step": 319784, "epoch": 2642} {"train_loss": -43.96430206298828, "global_step": 319785, "epoch": 2642} {"train_loss": -44.807167053222656, "global_step": 319786, "epoch": 2642} {"train_loss": -44.32583236694336, "global_step": 319787, "epoch": 2642} {"train_loss": -44.08766174316406, "global_step": 319788, "epoch": 2642} {"train_loss": -44.06850051879883, "global_step": 319789, "epoch": 2642} {"train_loss": -44.02345657348633, "global_step": 319790, "epoch": 2642} {"train_loss": -44.42202377319336, "global_step": 319791, "epoch": 2642} {"train_loss": -43.14725875854492, "global_step": 319792, "epoch": 2642} {"train_loss": -44.58211898803711, "global_step": 319793, "epoch": 2642} {"train_loss": -43.09401321411133, "global_step": 319794, "epoch": 2642} {"train_loss": -44.892940521240234, "global_step": 319795, "epoch": 2642} {"train_loss": -43.80982208251953, "global_step": 319796, "epoch": 2642} {"train_loss": -44.68465042114258, "global_step": 319797, "epoch": 2642} {"train_loss": -44.437618255615234, "global_step": 319798, "epoch": 2642} {"train_loss": -44.20553207397461, "global_step": 319799, "epoch": 2642} {"train_loss": -44.525325775146484, "global_step": 319800, "epoch": 2642} {"train_loss": -44.7074089050293, "global_step": 319801, "epoch": 2642} {"train_loss": -43.52097588531242, "global_step": 319802, "epoch": 2642, "val_loss": 2756394.25} {"train_loss": -44.08102035522461, "global_step": 319803, "epoch": 2643} {"train_loss": -45.199317932128906, "global_step": 319804, "epoch": 2643} {"train_loss": -44.82196807861328, "global_step": 319805, "epoch": 2643} {"train_loss": -43.93265914916992, "global_step": 319806, "epoch": 2643} {"train_loss": -44.08954620361328, "global_step": 319807, "epoch": 2643} {"train_loss": -44.62726593017578, "global_step": 319808, "epoch": 2643} {"train_loss": -44.171119689941406, "global_step": 319809, "epoch": 2643} {"train_loss": -43.371368408203125, "global_step": 319810, "epoch": 2643} {"train_loss": -44.2331428527832, "global_step": 319811, "epoch": 2643} {"train_loss": -44.53631591796875, "global_step": 319812, "epoch": 2643} {"train_loss": -44.220340728759766, "global_step": 319813, "epoch": 2643} {"train_loss": -44.93941879272461, "global_step": 319814, "epoch": 2643} {"train_loss": -44.89845657348633, "global_step": 319815, "epoch": 2643} {"train_loss": -43.58767318725586, "global_step": 319816, "epoch": 2643} {"train_loss": -44.53463363647461, "global_step": 319817, "epoch": 2643} {"train_loss": -45.68595504760742, "global_step": 319818, "epoch": 2643} {"train_loss": -44.66238784790039, "global_step": 319819, "epoch": 2643} {"train_loss": -44.9970588684082, "global_step": 319820, "epoch": 2643} {"train_loss": -45.1944694519043, "global_step": 319821, "epoch": 2643} {"train_loss": -45.4362678527832, "global_step": 319822, "epoch": 2643} {"train_loss": -45.176231384277344, "global_step": 319823, "epoch": 2643} {"train_loss": -42.82952880859375, "global_step": 319824, "epoch": 2643} {"train_loss": -45.34160232543945, "global_step": 319825, "epoch": 2643} {"train_loss": -45.09830856323242, "global_step": 319826, "epoch": 2643} {"train_loss": -45.034420013427734, "global_step": 319827, "epoch": 2643} {"train_loss": -45.102169036865234, "global_step": 319828, "epoch": 2643} {"train_loss": -43.89852523803711, "global_step": 319829, "epoch": 2643} {"train_loss": -43.21101379394531, "global_step": 319830, "epoch": 2643} {"train_loss": -44.53042221069336, "global_step": 319831, "epoch": 2643} {"train_loss": -40.88142013549805, "global_step": 319832, "epoch": 2643} {"train_loss": -43.71168899536133, "global_step": 319833, "epoch": 2643} {"train_loss": -44.75739288330078, "global_step": 319834, "epoch": 2643} {"train_loss": -43.5111083984375, "global_step": 319835, "epoch": 2643} {"train_loss": -40.13087844848633, "global_step": 319836, "epoch": 2643} {"train_loss": -38.931758880615234, "global_step": 319837, "epoch": 2643} {"train_loss": -37.6171989440918, "global_step": 319838, "epoch": 2643} {"train_loss": -42.3692741394043, "global_step": 319839, "epoch": 2643} {"train_loss": -40.10654830932617, "global_step": 319840, "epoch": 2643} {"train_loss": -16.314481735229492, "global_step": 319841, "epoch": 2643} {"train_loss": -41.920528411865234, "global_step": 319842, "epoch": 2643} {"train_loss": -34.38212966918945, "global_step": 319843, "epoch": 2643} {"train_loss": -38.894195556640625, "global_step": 319844, "epoch": 2643} {"train_loss": -41.36330795288086, "global_step": 319845, "epoch": 2643} {"train_loss": -37.229061126708984, "global_step": 319846, "epoch": 2643} {"train_loss": -39.06122589111328, "global_step": 319847, "epoch": 2643} {"train_loss": -34.97224807739258, "global_step": 319848, "epoch": 2643} {"train_loss": -36.662296295166016, "global_step": 319849, "epoch": 2643} {"train_loss": -38.15046691894531, "global_step": 319850, "epoch": 2643} {"train_loss": -39.28227233886719, "global_step": 319851, "epoch": 2643} {"train_loss": -38.899837493896484, "global_step": 319852, "epoch": 2643} {"train_loss": -40.2990837097168, "global_step": 319853, "epoch": 2643} {"train_loss": -40.216854095458984, "global_step": 319854, "epoch": 2643} {"train_loss": -35.53676986694336, "global_step": 319855, "epoch": 2643} {"train_loss": -40.543739318847656, "global_step": 319856, "epoch": 2643} {"train_loss": -39.86382293701172, "global_step": 319857, "epoch": 2643} {"train_loss": -38.6500358581543, "global_step": 319858, "epoch": 2643} {"train_loss": -38.587886810302734, "global_step": 319859, "epoch": 2643} {"train_loss": -41.0083122253418, "global_step": 319860, "epoch": 2643} {"train_loss": -40.452754974365234, "global_step": 319861, "epoch": 2643} {"train_loss": -40.448429107666016, "global_step": 319862, "epoch": 2643} {"train_loss": -41.535614013671875, "global_step": 319863, "epoch": 2643} {"train_loss": -40.25584030151367, "global_step": 319864, "epoch": 2643} {"train_loss": -42.1895866394043, "global_step": 319865, "epoch": 2643} {"train_loss": -38.4830436706543, "global_step": 319866, "epoch": 2643} {"train_loss": -42.353878021240234, "global_step": 319867, "epoch": 2643} {"train_loss": -39.97505569458008, "global_step": 319868, "epoch": 2643} {"train_loss": -41.46523666381836, "global_step": 319869, "epoch": 2643} {"train_loss": -41.49522018432617, "global_step": 319870, "epoch": 2643} {"train_loss": -41.45187759399414, "global_step": 319871, "epoch": 2643} {"train_loss": -42.851139068603516, "global_step": 319872, "epoch": 2643} {"train_loss": -39.9380989074707, "global_step": 319873, "epoch": 2643} {"train_loss": -40.64445114135742, "global_step": 319874, "epoch": 2643} {"train_loss": -41.19060134887695, "global_step": 319875, "epoch": 2643} {"train_loss": -42.76064682006836, "global_step": 319876, "epoch": 2643} {"train_loss": -42.825172424316406, "global_step": 319877, "epoch": 2643} {"train_loss": -41.84628677368164, "global_step": 319878, "epoch": 2643} {"train_loss": -41.936092376708984, "global_step": 319879, "epoch": 2643} {"train_loss": -42.93791580200195, "global_step": 319880, "epoch": 2643} {"train_loss": -42.23330307006836, "global_step": 319881, "epoch": 2643} {"train_loss": -41.5069580078125, "global_step": 319882, "epoch": 2643} {"train_loss": -42.764766693115234, "global_step": 319883, "epoch": 2643} {"train_loss": -41.579689025878906, "global_step": 319884, "epoch": 2643} {"train_loss": -43.16070556640625, "global_step": 319885, "epoch": 2643} {"train_loss": -43.1616096496582, "global_step": 319886, "epoch": 2643} {"train_loss": -42.099281311035156, "global_step": 319887, "epoch": 2643} {"train_loss": -42.921024322509766, "global_step": 319888, "epoch": 2643} {"train_loss": -41.7961311340332, "global_step": 319889, "epoch": 2643} {"train_loss": -43.35152816772461, "global_step": 319890, "epoch": 2643} {"train_loss": -42.6877555847168, "global_step": 319891, "epoch": 2643} {"train_loss": -41.72779083251953, "global_step": 319892, "epoch": 2643} {"train_loss": -43.41926193237305, "global_step": 319893, "epoch": 2643} {"train_loss": -42.90397262573242, "global_step": 319894, "epoch": 2643} {"train_loss": -43.17600631713867, "global_step": 319895, "epoch": 2643} {"train_loss": -42.00626754760742, "global_step": 319896, "epoch": 2643} {"train_loss": -43.51533126831055, "global_step": 319897, "epoch": 2643} {"train_loss": -43.146263122558594, "global_step": 319898, "epoch": 2643} {"train_loss": -43.06258773803711, "global_step": 319899, "epoch": 2643} {"train_loss": -43.122371673583984, "global_step": 319900, "epoch": 2643} {"train_loss": -43.651039123535156, "global_step": 319901, "epoch": 2643} {"train_loss": -43.768714904785156, "global_step": 319902, "epoch": 2643} {"train_loss": -43.56492233276367, "global_step": 319903, "epoch": 2643} {"train_loss": -43.4315185546875, "global_step": 319904, "epoch": 2643} {"train_loss": -42.77095031738281, "global_step": 319905, "epoch": 2643} {"train_loss": -42.56511306762695, "global_step": 319906, "epoch": 2643} {"train_loss": -43.3037109375, "global_step": 319907, "epoch": 2643} {"train_loss": -42.83412170410156, "global_step": 319908, "epoch": 2643} {"train_loss": -43.048152923583984, "global_step": 319909, "epoch": 2643} {"train_loss": -43.69271469116211, "global_step": 319910, "epoch": 2643} {"train_loss": -42.950531005859375, "global_step": 319911, "epoch": 2643} {"train_loss": -42.90921401977539, "global_step": 319912, "epoch": 2643} {"train_loss": -43.59682083129883, "global_step": 319913, "epoch": 2643} {"train_loss": -43.77447509765625, "global_step": 319914, "epoch": 2643} {"train_loss": -43.99978256225586, "global_step": 319915, "epoch": 2643} {"train_loss": -44.138946533203125, "global_step": 319916, "epoch": 2643} {"train_loss": -43.69765090942383, "global_step": 319917, "epoch": 2643} {"train_loss": -42.40258026123047, "global_step": 319918, "epoch": 2643} {"train_loss": -43.512351989746094, "global_step": 319919, "epoch": 2643} {"train_loss": -43.72846221923828, "global_step": 319920, "epoch": 2643} {"train_loss": -43.8350944519043, "global_step": 319921, "epoch": 2643} {"train_loss": -44.149166107177734, "global_step": 319922, "epoch": 2643} {"train_loss": -42.10395940670297, "global_step": 319923, "epoch": 2643, "val_loss": 2508790.0} {"train_loss": -43.89326477050781, "global_step": 319924, "epoch": 2644} {"train_loss": -43.763214111328125, "global_step": 319925, "epoch": 2644} {"train_loss": -44.30403518676758, "global_step": 319926, "epoch": 2644} {"train_loss": -43.61090850830078, "global_step": 319927, "epoch": 2644} {"train_loss": -44.06096267700195, "global_step": 319928, "epoch": 2644} {"train_loss": -44.555450439453125, "global_step": 319929, "epoch": 2644} {"train_loss": -44.59512710571289, "global_step": 319930, "epoch": 2644} {"train_loss": -43.55219650268555, "global_step": 319931, "epoch": 2644} {"train_loss": -43.87458038330078, "global_step": 319932, "epoch": 2644} {"train_loss": -44.30109786987305, "global_step": 319933, "epoch": 2644} {"train_loss": -43.802555084228516, "global_step": 319934, "epoch": 2644} {"train_loss": -43.71240234375, "global_step": 319935, "epoch": 2644} {"train_loss": -43.8956184387207, "global_step": 319936, "epoch": 2644} {"train_loss": -44.31733703613281, "global_step": 319937, "epoch": 2644} {"train_loss": -44.27741622924805, "global_step": 319938, "epoch": 2644} {"train_loss": -44.54134750366211, "global_step": 319939, "epoch": 2644} {"train_loss": -44.295169830322266, "global_step": 319940, "epoch": 2644} {"train_loss": -44.133270263671875, "global_step": 319941, "epoch": 2644} {"train_loss": -44.34560012817383, "global_step": 319942, "epoch": 2644} {"train_loss": -44.13960266113281, "global_step": 319943, "epoch": 2644} {"train_loss": -44.3090934753418, "global_step": 319944, "epoch": 2644} {"train_loss": -44.061309814453125, "global_step": 319945, "epoch": 2644} {"train_loss": -44.66022491455078, "global_step": 319946, "epoch": 2644} {"train_loss": -43.56546401977539, "global_step": 319947, "epoch": 2644} {"train_loss": -43.92828369140625, "global_step": 319948, "epoch": 2644} {"train_loss": -44.27607345581055, "global_step": 319949, "epoch": 2644} {"train_loss": -44.247215270996094, "global_step": 319950, "epoch": 2644} {"train_loss": -44.0367546081543, "global_step": 319951, "epoch": 2644} {"train_loss": -44.445526123046875, "global_step": 319952, "epoch": 2644} {"train_loss": -44.70669937133789, "global_step": 319953, "epoch": 2644} {"train_loss": -44.36782455444336, "global_step": 319954, "epoch": 2644} {"train_loss": -42.26066207885742, "global_step": 319955, "epoch": 2644} {"train_loss": -44.5277099609375, "global_step": 319956, "epoch": 2644} {"train_loss": -44.08052062988281, "global_step": 319957, "epoch": 2644} {"train_loss": -42.591880798339844, "global_step": 319958, "epoch": 2644} {"train_loss": -43.731651306152344, "global_step": 319959, "epoch": 2644} {"train_loss": -44.29257583618164, "global_step": 319960, "epoch": 2644} {"train_loss": -43.21232604980469, "global_step": 319961, "epoch": 2644} {"train_loss": -43.70703887939453, "global_step": 319962, "epoch": 2644} {"train_loss": -43.88444900512695, "global_step": 319963, "epoch": 2644} {"train_loss": -43.086585998535156, "global_step": 319964, "epoch": 2644} {"train_loss": -43.88502502441406, "global_step": 319965, "epoch": 2644} {"train_loss": -43.616737365722656, "global_step": 319966, "epoch": 2644} {"train_loss": -44.503318786621094, "global_step": 319967, "epoch": 2644} {"train_loss": -44.35494613647461, "global_step": 319968, "epoch": 2644} {"train_loss": -43.74177932739258, "global_step": 319969, "epoch": 2644} {"train_loss": -44.070884704589844, "global_step": 319970, "epoch": 2644} {"train_loss": -43.92517852783203, "global_step": 319971, "epoch": 2644} {"train_loss": -43.03351974487305, "global_step": 319972, "epoch": 2644} {"train_loss": -42.72314453125, "global_step": 319973, "epoch": 2644} {"train_loss": -43.300758361816406, "global_step": 319974, "epoch": 2644} {"train_loss": -44.156333923339844, "global_step": 319975, "epoch": 2644} {"train_loss": -44.09379959106445, "global_step": 319976, "epoch": 2644} {"train_loss": -43.527381896972656, "global_step": 319977, "epoch": 2644} {"train_loss": -43.806819915771484, "global_step": 319978, "epoch": 2644} {"train_loss": -43.3004150390625, "global_step": 319979, "epoch": 2644} {"train_loss": -40.73838806152344, "global_step": 319980, "epoch": 2644} {"train_loss": -40.169647216796875, "global_step": 319981, "epoch": 2644} {"train_loss": -41.794677734375, "global_step": 319982, "epoch": 2644} {"train_loss": -43.43171310424805, "global_step": 319983, "epoch": 2644} {"train_loss": -41.38340377807617, "global_step": 319984, "epoch": 2644} {"train_loss": -41.40576934814453, "global_step": 319985, "epoch": 2644} {"train_loss": -42.948158264160156, "global_step": 319986, "epoch": 2644} {"train_loss": -41.63641357421875, "global_step": 319987, "epoch": 2644} {"train_loss": -42.965938568115234, "global_step": 319988, "epoch": 2644} {"train_loss": -43.01467514038086, "global_step": 319989, "epoch": 2644} {"train_loss": -41.75288009643555, "global_step": 319990, "epoch": 2644} {"train_loss": -42.659324645996094, "global_step": 319991, "epoch": 2644} {"train_loss": -41.531471252441406, "global_step": 319992, "epoch": 2644} {"train_loss": -40.178462982177734, "global_step": 319993, "epoch": 2644} {"train_loss": -41.269954681396484, "global_step": 319994, "epoch": 2644} {"train_loss": -40.9434928894043, "global_step": 319995, "epoch": 2644} {"train_loss": -40.58721923828125, "global_step": 319996, "epoch": 2644} {"train_loss": -43.46883010864258, "global_step": 319997, "epoch": 2644} {"train_loss": -42.40983200073242, "global_step": 319998, "epoch": 2644} {"train_loss": -42.36637496948242, "global_step": 319999, "epoch": 2644} {"train_loss": -42.857784271240234, "global_step": 320000, "epoch": 2644} {"train_loss": -43.65918731689453, "global_step": 320001, "epoch": 2644} {"train_loss": -43.061439514160156, "global_step": 320002, "epoch": 2644} {"train_loss": -44.2332878112793, "global_step": 320003, "epoch": 2644} {"train_loss": -43.231998443603516, "global_step": 320004, "epoch": 2644} {"train_loss": -43.410316467285156, "global_step": 320005, "epoch": 2644} {"train_loss": -42.771541595458984, "global_step": 320006, "epoch": 2644} {"train_loss": -43.37626647949219, "global_step": 320007, "epoch": 2644} {"train_loss": -43.34545135498047, "global_step": 320008, "epoch": 2644} {"train_loss": -43.529502868652344, "global_step": 320009, "epoch": 2644} {"train_loss": -43.73152160644531, "global_step": 320010, "epoch": 2644} {"train_loss": -43.67863082885742, "global_step": 320011, "epoch": 2644} {"train_loss": -44.10941696166992, "global_step": 320012, "epoch": 2644} {"train_loss": -43.37494659423828, "global_step": 320013, "epoch": 2644} {"train_loss": -43.35185241699219, "global_step": 320014, "epoch": 2644} {"train_loss": -43.90525436401367, "global_step": 320015, "epoch": 2644} {"train_loss": -43.65182113647461, "global_step": 320016, "epoch": 2644} {"train_loss": -43.346168518066406, "global_step": 320017, "epoch": 2644} {"train_loss": -43.38227081298828, "global_step": 320018, "epoch": 2644} {"train_loss": -43.74736404418945, "global_step": 320019, "epoch": 2644} {"train_loss": -43.783451080322266, "global_step": 320020, "epoch": 2644} {"train_loss": -43.559139251708984, "global_step": 320021, "epoch": 2644} {"train_loss": -42.811012268066406, "global_step": 320022, "epoch": 2644} {"train_loss": -43.270111083984375, "global_step": 320023, "epoch": 2644} {"train_loss": -43.29989242553711, "global_step": 320024, "epoch": 2644} {"train_loss": -43.041133880615234, "global_step": 320025, "epoch": 2644} {"train_loss": -41.839881896972656, "global_step": 320026, "epoch": 2644} {"train_loss": -43.311641693115234, "global_step": 320027, "epoch": 2644} {"train_loss": -43.41915512084961, "global_step": 320028, "epoch": 2644} {"train_loss": -43.6398811340332, "global_step": 320029, "epoch": 2644} {"train_loss": -43.40904235839844, "global_step": 320030, "epoch": 2644} {"train_loss": -44.2725944519043, "global_step": 320031, "epoch": 2644} {"train_loss": -43.5573616027832, "global_step": 320032, "epoch": 2644} {"train_loss": -43.63602828979492, "global_step": 320033, "epoch": 2644} {"train_loss": -44.057945251464844, "global_step": 320034, "epoch": 2644} {"train_loss": -43.81196212768555, "global_step": 320035, "epoch": 2644} {"train_loss": -43.47500228881836, "global_step": 320036, "epoch": 2644} {"train_loss": -43.7266960144043, "global_step": 320037, "epoch": 2644} {"train_loss": -42.91352081298828, "global_step": 320038, "epoch": 2644} {"train_loss": -42.96828079223633, "global_step": 320039, "epoch": 2644} {"train_loss": -43.99052047729492, "global_step": 320040, "epoch": 2644} {"train_loss": -43.34280014038086, "global_step": 320041, "epoch": 2644} {"train_loss": -43.52396774291992, "global_step": 320042, "epoch": 2644} {"train_loss": -43.88434982299805, "global_step": 320043, "epoch": 2644} {"train_loss": -43.39857173951204, "global_step": 320044, "epoch": 2644, "val_loss": 2406258.0} {"train_loss": -44.37685775756836, "global_step": 320045, "epoch": 2645} {"train_loss": -43.483551025390625, "global_step": 320046, "epoch": 2645} {"train_loss": -43.44832229614258, "global_step": 320047, "epoch": 2645} {"train_loss": -44.05904006958008, "global_step": 320048, "epoch": 2645} {"train_loss": -42.729644775390625, "global_step": 320049, "epoch": 2645} {"train_loss": -43.11332321166992, "global_step": 320050, "epoch": 2645} {"train_loss": -43.33277130126953, "global_step": 320051, "epoch": 2645} {"train_loss": -44.4731330871582, "global_step": 320052, "epoch": 2645} {"train_loss": -42.66903305053711, "global_step": 320053, "epoch": 2645} {"train_loss": -40.329994201660156, "global_step": 320054, "epoch": 2645} {"train_loss": -44.10580062866211, "global_step": 320055, "epoch": 2645} {"train_loss": -41.840267181396484, "global_step": 320056, "epoch": 2645} {"train_loss": -40.76856231689453, "global_step": 320057, "epoch": 2645} {"train_loss": -42.6129035949707, "global_step": 320058, "epoch": 2645} {"train_loss": -43.04838180541992, "global_step": 320059, "epoch": 2645} {"train_loss": -42.56675338745117, "global_step": 320060, "epoch": 2645} {"train_loss": -42.10457992553711, "global_step": 320061, "epoch": 2645} {"train_loss": -42.466041564941406, "global_step": 320062, "epoch": 2645} {"train_loss": -42.48069381713867, "global_step": 320063, "epoch": 2645} {"train_loss": -43.46902084350586, "global_step": 320064, "epoch": 2645} {"train_loss": -43.25295639038086, "global_step": 320065, "epoch": 2645} {"train_loss": -43.0506706237793, "global_step": 320066, "epoch": 2645} {"train_loss": -43.05088424682617, "global_step": 320067, "epoch": 2645} {"train_loss": -43.76050567626953, "global_step": 320068, "epoch": 2645} {"train_loss": -42.63706588745117, "global_step": 320069, "epoch": 2645} {"train_loss": -42.9627799987793, "global_step": 320070, "epoch": 2645} {"train_loss": -42.42780303955078, "global_step": 320071, "epoch": 2645} {"train_loss": -43.7047233581543, "global_step": 320072, "epoch": 2645} {"train_loss": -43.87820053100586, "global_step": 320073, "epoch": 2645} {"train_loss": -42.907745361328125, "global_step": 320074, "epoch": 2645} {"train_loss": -42.5723876953125, "global_step": 320075, "epoch": 2645} {"train_loss": -43.52875900268555, "global_step": 320076, "epoch": 2645} {"train_loss": -43.38450241088867, "global_step": 320077, "epoch": 2645} {"train_loss": -40.50960922241211, "global_step": 320078, "epoch": 2645} {"train_loss": -44.22702407836914, "global_step": 320079, "epoch": 2645} {"train_loss": -42.21961212158203, "global_step": 320080, "epoch": 2645} {"train_loss": -41.13875961303711, "global_step": 320081, "epoch": 2645} {"train_loss": -43.26182556152344, "global_step": 320082, "epoch": 2645} {"train_loss": -41.81339645385742, "global_step": 320083, "epoch": 2645} {"train_loss": -41.169830322265625, "global_step": 320084, "epoch": 2645} {"train_loss": -42.93232345581055, "global_step": 320085, "epoch": 2645} {"train_loss": -42.29360580444336, "global_step": 320086, "epoch": 2645} {"train_loss": -41.806148529052734, "global_step": 320087, "epoch": 2645} {"train_loss": -41.825096130371094, "global_step": 320088, "epoch": 2645} {"train_loss": -43.443153381347656, "global_step": 320089, "epoch": 2645} {"train_loss": -42.81775665283203, "global_step": 320090, "epoch": 2645} {"train_loss": -43.066925048828125, "global_step": 320091, "epoch": 2645} {"train_loss": -43.418399810791016, "global_step": 320092, "epoch": 2645} {"train_loss": -42.67221450805664, "global_step": 320093, "epoch": 2645} {"train_loss": -44.00484085083008, "global_step": 320094, "epoch": 2645} {"train_loss": -42.971961975097656, "global_step": 320095, "epoch": 2645} {"train_loss": -43.4904899597168, "global_step": 320096, "epoch": 2645} {"train_loss": -43.624752044677734, "global_step": 320097, "epoch": 2645} {"train_loss": -42.4495735168457, "global_step": 320098, "epoch": 2645} {"train_loss": -43.860599517822266, "global_step": 320099, "epoch": 2645} {"train_loss": -43.78285598754883, "global_step": 320100, "epoch": 2645} {"train_loss": -43.13670349121094, "global_step": 320101, "epoch": 2645} {"train_loss": -44.449920654296875, "global_step": 320102, "epoch": 2645} {"train_loss": -44.070377349853516, "global_step": 320103, "epoch": 2645} {"train_loss": -43.19163513183594, "global_step": 320104, "epoch": 2645} {"train_loss": -44.19929122924805, "global_step": 320105, "epoch": 2645} {"train_loss": -43.97319030761719, "global_step": 320106, "epoch": 2645} {"train_loss": -44.25872039794922, "global_step": 320107, "epoch": 2645} {"train_loss": -44.220130920410156, "global_step": 320108, "epoch": 2645} {"train_loss": -44.32485580444336, "global_step": 320109, "epoch": 2645} {"train_loss": -44.235870361328125, "global_step": 320110, "epoch": 2645} {"train_loss": -44.451683044433594, "global_step": 320111, "epoch": 2645} {"train_loss": -44.05229568481445, "global_step": 320112, "epoch": 2645} {"train_loss": -44.280574798583984, "global_step": 320113, "epoch": 2645} {"train_loss": -44.374507904052734, "global_step": 320114, "epoch": 2645} {"train_loss": -44.36623764038086, "global_step": 320115, "epoch": 2645} {"train_loss": -44.600563049316406, "global_step": 320116, "epoch": 2645} {"train_loss": -43.64016342163086, "global_step": 320117, "epoch": 2645} {"train_loss": -44.294368743896484, "global_step": 320118, "epoch": 2645} {"train_loss": -44.7581901550293, "global_step": 320119, "epoch": 2645} {"train_loss": -43.87770462036133, "global_step": 320120, "epoch": 2645} {"train_loss": -44.46189498901367, "global_step": 320121, "epoch": 2645} {"train_loss": -43.972049713134766, "global_step": 320122, "epoch": 2645} {"train_loss": -44.668399810791016, "global_step": 320123, "epoch": 2645} {"train_loss": -44.2192497253418, "global_step": 320124, "epoch": 2645} {"train_loss": -44.97157669067383, "global_step": 320125, "epoch": 2645} {"train_loss": -44.98495864868164, "global_step": 320126, "epoch": 2645} {"train_loss": -44.922401428222656, "global_step": 320127, "epoch": 2645} {"train_loss": -44.08555603027344, "global_step": 320128, "epoch": 2645} {"train_loss": -44.98664474487305, "global_step": 320129, "epoch": 2645} {"train_loss": -44.702816009521484, "global_step": 320130, "epoch": 2645} {"train_loss": -44.7382926940918, "global_step": 320131, "epoch": 2645} {"train_loss": -45.35410690307617, "global_step": 320132, "epoch": 2645} {"train_loss": -45.26981735229492, "global_step": 320133, "epoch": 2645} {"train_loss": -44.9727668762207, "global_step": 320134, "epoch": 2645} {"train_loss": -44.60369873046875, "global_step": 320135, "epoch": 2645} {"train_loss": -44.73674011230469, "global_step": 320136, "epoch": 2645} {"train_loss": -44.42678451538086, "global_step": 320137, "epoch": 2645} {"train_loss": -44.32032012939453, "global_step": 320138, "epoch": 2645} {"train_loss": -44.68756866455078, "global_step": 320139, "epoch": 2645} {"train_loss": -45.45201873779297, "global_step": 320140, "epoch": 2645} {"train_loss": -44.07589340209961, "global_step": 320141, "epoch": 2645} {"train_loss": -44.111568450927734, "global_step": 320142, "epoch": 2645} {"train_loss": -45.16974639892578, "global_step": 320143, "epoch": 2645} {"train_loss": -45.231048583984375, "global_step": 320144, "epoch": 2645} {"train_loss": -45.18781661987305, "global_step": 320145, "epoch": 2645} {"train_loss": -45.23617172241211, "global_step": 320146, "epoch": 2645} {"train_loss": -44.94187545776367, "global_step": 320147, "epoch": 2645} {"train_loss": -44.57535934448242, "global_step": 320148, "epoch": 2645} {"train_loss": -45.221099853515625, "global_step": 320149, "epoch": 2645} {"train_loss": -44.986141204833984, "global_step": 320150, "epoch": 2645} {"train_loss": -44.3834114074707, "global_step": 320151, "epoch": 2645} {"train_loss": -44.685237884521484, "global_step": 320152, "epoch": 2645} {"train_loss": -44.80942916870117, "global_step": 320153, "epoch": 2645} {"train_loss": -45.17369079589844, "global_step": 320154, "epoch": 2645} {"train_loss": -44.81350326538086, "global_step": 320155, "epoch": 2645} {"train_loss": -44.95595932006836, "global_step": 320156, "epoch": 2645} {"train_loss": -44.81179428100586, "global_step": 320157, "epoch": 2645} {"train_loss": -45.185054779052734, "global_step": 320158, "epoch": 2645} {"train_loss": -45.30567932128906, "global_step": 320159, "epoch": 2645} {"train_loss": -45.10148239135742, "global_step": 320160, "epoch": 2645} {"train_loss": -44.975608825683594, "global_step": 320161, "epoch": 2645} {"train_loss": -44.09765625, "global_step": 320162, "epoch": 2645} {"train_loss": -44.0208854675293, "global_step": 320163, "epoch": 2645} {"train_loss": -44.8779182434082, "global_step": 320164, "epoch": 2645} {"train_loss": -43.79007052587084, "global_step": 320165, "epoch": 2645, "val_loss": 2545546.25} {"train_loss": -42.3244743347168, "global_step": 320166, "epoch": 2646} {"train_loss": -42.771522521972656, "global_step": 320167, "epoch": 2646} {"train_loss": -44.10976791381836, "global_step": 320168, "epoch": 2646} {"train_loss": -44.139156341552734, "global_step": 320169, "epoch": 2646} {"train_loss": -43.725669860839844, "global_step": 320170, "epoch": 2646} {"train_loss": -43.93264389038086, "global_step": 320171, "epoch": 2646} {"train_loss": -44.490394592285156, "global_step": 320172, "epoch": 2646} {"train_loss": -43.306514739990234, "global_step": 320173, "epoch": 2646} {"train_loss": -43.84667205810547, "global_step": 320174, "epoch": 2646} {"train_loss": -43.77808380126953, "global_step": 320175, "epoch": 2646} {"train_loss": -42.78597640991211, "global_step": 320176, "epoch": 2646} {"train_loss": -43.005489349365234, "global_step": 320177, "epoch": 2646} {"train_loss": -41.19271469116211, "global_step": 320178, "epoch": 2646} {"train_loss": -41.79531478881836, "global_step": 320179, "epoch": 2646} {"train_loss": -43.62295150756836, "global_step": 320180, "epoch": 2646} {"train_loss": -42.53882598876953, "global_step": 320181, "epoch": 2646} {"train_loss": -43.45405960083008, "global_step": 320182, "epoch": 2646} {"train_loss": -43.7533073425293, "global_step": 320183, "epoch": 2646} {"train_loss": -43.122371673583984, "global_step": 320184, "epoch": 2646} {"train_loss": -40.63292694091797, "global_step": 320185, "epoch": 2646} {"train_loss": -39.28399658203125, "global_step": 320186, "epoch": 2646} {"train_loss": -43.23480987548828, "global_step": 320187, "epoch": 2646} {"train_loss": -43.32241439819336, "global_step": 320188, "epoch": 2646} {"train_loss": -41.371925354003906, "global_step": 320189, "epoch": 2646} {"train_loss": -42.61227035522461, "global_step": 320190, "epoch": 2646} {"train_loss": -42.44518280029297, "global_step": 320191, "epoch": 2646} {"train_loss": -43.265811920166016, "global_step": 320192, "epoch": 2646} {"train_loss": -42.99345779418945, "global_step": 320193, "epoch": 2646} {"train_loss": -42.188453674316406, "global_step": 320194, "epoch": 2646} {"train_loss": -42.87881088256836, "global_step": 320195, "epoch": 2646} {"train_loss": -39.151302337646484, "global_step": 320196, "epoch": 2646} {"train_loss": -42.008113861083984, "global_step": 320197, "epoch": 2646} {"train_loss": -42.3624267578125, "global_step": 320198, "epoch": 2646} {"train_loss": -41.038875579833984, "global_step": 320199, "epoch": 2646} {"train_loss": -41.5617790222168, "global_step": 320200, "epoch": 2646} {"train_loss": -41.44519805908203, "global_step": 320201, "epoch": 2646} {"train_loss": -42.55610656738281, "global_step": 320202, "epoch": 2646} {"train_loss": -40.280250549316406, "global_step": 320203, "epoch": 2646} {"train_loss": -42.242958068847656, "global_step": 320204, "epoch": 2646} {"train_loss": -40.927589416503906, "global_step": 320205, "epoch": 2646} {"train_loss": -42.609214782714844, "global_step": 320206, "epoch": 2646} {"train_loss": -41.97206497192383, "global_step": 320207, "epoch": 2646} {"train_loss": -42.25379180908203, "global_step": 320208, "epoch": 2646} {"train_loss": -41.81669998168945, "global_step": 320209, "epoch": 2646} {"train_loss": -42.87337112426758, "global_step": 320210, "epoch": 2646} {"train_loss": -42.192928314208984, "global_step": 320211, "epoch": 2646} {"train_loss": -42.353878021240234, "global_step": 320212, "epoch": 2646} {"train_loss": -42.698875427246094, "global_step": 320213, "epoch": 2646} {"train_loss": -42.079071044921875, "global_step": 320214, "epoch": 2646} {"train_loss": -42.97806930541992, "global_step": 320215, "epoch": 2646} {"train_loss": -43.27970504760742, "global_step": 320216, "epoch": 2646} {"train_loss": -42.65785598754883, "global_step": 320217, "epoch": 2646} {"train_loss": -43.7231330871582, "global_step": 320218, "epoch": 2646} {"train_loss": -42.05591583251953, "global_step": 320219, "epoch": 2646} {"train_loss": -43.39508056640625, "global_step": 320220, "epoch": 2646} {"train_loss": -43.28495407104492, "global_step": 320221, "epoch": 2646} {"train_loss": -42.566131591796875, "global_step": 320222, "epoch": 2646} {"train_loss": -43.364139556884766, "global_step": 320223, "epoch": 2646} {"train_loss": -42.43898391723633, "global_step": 320224, "epoch": 2646} {"train_loss": -41.60433578491211, "global_step": 320225, "epoch": 2646} {"train_loss": -43.310054779052734, "global_step": 320226, "epoch": 2646} {"train_loss": -43.13396453857422, "global_step": 320227, "epoch": 2646} {"train_loss": -42.673946380615234, "global_step": 320228, "epoch": 2646} {"train_loss": -43.93971633911133, "global_step": 320229, "epoch": 2646} {"train_loss": -42.93186950683594, "global_step": 320230, "epoch": 2646} {"train_loss": -43.316864013671875, "global_step": 320231, "epoch": 2646} {"train_loss": -43.5731315612793, "global_step": 320232, "epoch": 2646} {"train_loss": -43.19576644897461, "global_step": 320233, "epoch": 2646} {"train_loss": -44.077056884765625, "global_step": 320234, "epoch": 2646} {"train_loss": -43.7686767578125, "global_step": 320235, "epoch": 2646} {"train_loss": -44.0359001159668, "global_step": 320236, "epoch": 2646} {"train_loss": -43.71307373046875, "global_step": 320237, "epoch": 2646} {"train_loss": -44.0169677734375, "global_step": 320238, "epoch": 2646} {"train_loss": -44.105865478515625, "global_step": 320239, "epoch": 2646} {"train_loss": -43.7905387878418, "global_step": 320240, "epoch": 2646} {"train_loss": -44.66868209838867, "global_step": 320241, "epoch": 2646} {"train_loss": -44.0695915222168, "global_step": 320242, "epoch": 2646} {"train_loss": -44.16252899169922, "global_step": 320243, "epoch": 2646} {"train_loss": -44.4022331237793, "global_step": 320244, "epoch": 2646} {"train_loss": -44.1684455871582, "global_step": 320245, "epoch": 2646} {"train_loss": -44.48543930053711, "global_step": 320246, "epoch": 2646} {"train_loss": -44.45709228515625, "global_step": 320247, "epoch": 2646} {"train_loss": -44.677223205566406, "global_step": 320248, "epoch": 2646} {"train_loss": -44.834983825683594, "global_step": 320249, "epoch": 2646} {"train_loss": -44.45461654663086, "global_step": 320250, "epoch": 2646} {"train_loss": -44.89603805541992, "global_step": 320251, "epoch": 2646} {"train_loss": -44.730682373046875, "global_step": 320252, "epoch": 2646} {"train_loss": -44.214656829833984, "global_step": 320253, "epoch": 2646} {"train_loss": -44.89126205444336, "global_step": 320254, "epoch": 2646} {"train_loss": -44.93636703491211, "global_step": 320255, "epoch": 2646} {"train_loss": -44.5225830078125, "global_step": 320256, "epoch": 2646} {"train_loss": -44.82606506347656, "global_step": 320257, "epoch": 2646} {"train_loss": -44.949806213378906, "global_step": 320258, "epoch": 2646} {"train_loss": -44.96525192260742, "global_step": 320259, "epoch": 2646} {"train_loss": -44.77773666381836, "global_step": 320260, "epoch": 2646} {"train_loss": -45.10332107543945, "global_step": 320261, "epoch": 2646} {"train_loss": -45.08003234863281, "global_step": 320262, "epoch": 2646} {"train_loss": -44.86433792114258, "global_step": 320263, "epoch": 2646} {"train_loss": -45.06640625, "global_step": 320264, "epoch": 2646} {"train_loss": -44.09579086303711, "global_step": 320265, "epoch": 2646} {"train_loss": -44.399444580078125, "global_step": 320266, "epoch": 2646} {"train_loss": -44.790321350097656, "global_step": 320267, "epoch": 2646} {"train_loss": -44.62471008300781, "global_step": 320268, "epoch": 2646} {"train_loss": -43.642333984375, "global_step": 320269, "epoch": 2646} {"train_loss": -44.9978141784668, "global_step": 320270, "epoch": 2646} {"train_loss": -43.9603157043457, "global_step": 320271, "epoch": 2646} {"train_loss": -44.20732116699219, "global_step": 320272, "epoch": 2646} {"train_loss": -44.90312957763672, "global_step": 320273, "epoch": 2646} {"train_loss": -44.48442840576172, "global_step": 320274, "epoch": 2646} {"train_loss": -43.98945999145508, "global_step": 320275, "epoch": 2646} {"train_loss": -44.9417839050293, "global_step": 320276, "epoch": 2646} {"train_loss": -44.979427337646484, "global_step": 320277, "epoch": 2646} {"train_loss": -44.63535690307617, "global_step": 320278, "epoch": 2646} {"train_loss": -45.10944366455078, "global_step": 320279, "epoch": 2646} {"train_loss": -45.153541564941406, "global_step": 320280, "epoch": 2646} {"train_loss": -45.26667404174805, "global_step": 320281, "epoch": 2646} {"train_loss": -45.215003967285156, "global_step": 320282, "epoch": 2646} {"train_loss": -45.156307220458984, "global_step": 320283, "epoch": 2646} {"train_loss": -44.72469711303711, "global_step": 320284, "epoch": 2646} {"train_loss": -44.9103889465332, "global_step": 320285, "epoch": 2646} {"train_loss": -43.47323126044155, "global_step": 320286, "epoch": 2646, "val_loss": 2568736.0} {"train_loss": -45.2640495300293, "global_step": 320287, "epoch": 2647} {"train_loss": -45.0333366394043, "global_step": 320288, "epoch": 2647} {"train_loss": -44.855281829833984, "global_step": 320289, "epoch": 2647} {"train_loss": -45.149776458740234, "global_step": 320290, "epoch": 2647} {"train_loss": -44.932594299316406, "global_step": 320291, "epoch": 2647} {"train_loss": -45.144935607910156, "global_step": 320292, "epoch": 2647} {"train_loss": -45.34199905395508, "global_step": 320293, "epoch": 2647} {"train_loss": -44.97896957397461, "global_step": 320294, "epoch": 2647} {"train_loss": -45.674007415771484, "global_step": 320295, "epoch": 2647} {"train_loss": -45.41701889038086, "global_step": 320296, "epoch": 2647} {"train_loss": -45.05891418457031, "global_step": 320297, "epoch": 2647} {"train_loss": -44.50393295288086, "global_step": 320298, "epoch": 2647} {"train_loss": -44.48250961303711, "global_step": 320299, "epoch": 2647} {"train_loss": -44.0435905456543, "global_step": 320300, "epoch": 2647} {"train_loss": -44.68255615234375, "global_step": 320301, "epoch": 2647} {"train_loss": -45.07528305053711, "global_step": 320302, "epoch": 2647} {"train_loss": -43.2601318359375, "global_step": 320303, "epoch": 2647} {"train_loss": -42.4964599609375, "global_step": 320304, "epoch": 2647} {"train_loss": -42.41070556640625, "global_step": 320305, "epoch": 2647} {"train_loss": -44.796836853027344, "global_step": 320306, "epoch": 2647} {"train_loss": -43.37852096557617, "global_step": 320307, "epoch": 2647} {"train_loss": -42.907833099365234, "global_step": 320308, "epoch": 2647} {"train_loss": -44.0341911315918, "global_step": 320309, "epoch": 2647} {"train_loss": -44.0624885559082, "global_step": 320310, "epoch": 2647} {"train_loss": -42.910667419433594, "global_step": 320311, "epoch": 2647} {"train_loss": -44.05506896972656, "global_step": 320312, "epoch": 2647} {"train_loss": -42.84294891357422, "global_step": 320313, "epoch": 2647} {"train_loss": -44.0543327331543, "global_step": 320314, "epoch": 2647} {"train_loss": -44.77207565307617, "global_step": 320315, "epoch": 2647} {"train_loss": -44.11001205444336, "global_step": 320316, "epoch": 2647} {"train_loss": -43.690853118896484, "global_step": 320317, "epoch": 2647} {"train_loss": -43.68832015991211, "global_step": 320318, "epoch": 2647} {"train_loss": -44.63370895385742, "global_step": 320319, "epoch": 2647} {"train_loss": -43.93258285522461, "global_step": 320320, "epoch": 2647} {"train_loss": -43.392181396484375, "global_step": 320321, "epoch": 2647} {"train_loss": -42.706600189208984, "global_step": 320322, "epoch": 2647} {"train_loss": -43.944725036621094, "global_step": 320323, "epoch": 2647} {"train_loss": -44.3474235534668, "global_step": 320324, "epoch": 2647} {"train_loss": -43.597442626953125, "global_step": 320325, "epoch": 2647} {"train_loss": -43.69172668457031, "global_step": 320326, "epoch": 2647} {"train_loss": -43.567726135253906, "global_step": 320327, "epoch": 2647} {"train_loss": -42.12134552001953, "global_step": 320328, "epoch": 2647} {"train_loss": -41.971614837646484, "global_step": 320329, "epoch": 2647} {"train_loss": -42.672645568847656, "global_step": 320330, "epoch": 2647} {"train_loss": -42.62249755859375, "global_step": 320331, "epoch": 2647} {"train_loss": -42.25896072387695, "global_step": 320332, "epoch": 2647} {"train_loss": -42.169036865234375, "global_step": 320333, "epoch": 2647} {"train_loss": -42.82283401489258, "global_step": 320334, "epoch": 2647} {"train_loss": -39.50960922241211, "global_step": 320335, "epoch": 2647} {"train_loss": -43.047847747802734, "global_step": 320336, "epoch": 2647} {"train_loss": -42.52781295776367, "global_step": 320337, "epoch": 2647} {"train_loss": -41.27903747558594, "global_step": 320338, "epoch": 2647} {"train_loss": -42.43582534790039, "global_step": 320339, "epoch": 2647} {"train_loss": -41.92512893676758, "global_step": 320340, "epoch": 2647} {"train_loss": -41.794612884521484, "global_step": 320341, "epoch": 2647} {"train_loss": -42.017330169677734, "global_step": 320342, "epoch": 2647} {"train_loss": -42.95271682739258, "global_step": 320343, "epoch": 2647} {"train_loss": -41.64868927001953, "global_step": 320344, "epoch": 2647} {"train_loss": -41.4433479309082, "global_step": 320345, "epoch": 2647} {"train_loss": -42.5626220703125, "global_step": 320346, "epoch": 2647} {"train_loss": -42.44023132324219, "global_step": 320347, "epoch": 2647} {"train_loss": -42.04045867919922, "global_step": 320348, "epoch": 2647} {"train_loss": -41.974998474121094, "global_step": 320349, "epoch": 2647} {"train_loss": -43.38581085205078, "global_step": 320350, "epoch": 2647} {"train_loss": -40.4830436706543, "global_step": 320351, "epoch": 2647} {"train_loss": -42.6361198425293, "global_step": 320352, "epoch": 2647} {"train_loss": -41.16939163208008, "global_step": 320353, "epoch": 2647} {"train_loss": -41.64618682861328, "global_step": 320354, "epoch": 2647} {"train_loss": -41.80000686645508, "global_step": 320355, "epoch": 2647} {"train_loss": -41.97953796386719, "global_step": 320356, "epoch": 2647} {"train_loss": -42.09303665161133, "global_step": 320357, "epoch": 2647} {"train_loss": -40.13195037841797, "global_step": 320358, "epoch": 2647} {"train_loss": -39.568572998046875, "global_step": 320359, "epoch": 2647} {"train_loss": -41.21908187866211, "global_step": 320360, "epoch": 2647} {"train_loss": -41.57538986206055, "global_step": 320361, "epoch": 2647} {"train_loss": -41.16791534423828, "global_step": 320362, "epoch": 2647} {"train_loss": -42.94236373901367, "global_step": 320363, "epoch": 2647} {"train_loss": -41.97187423706055, "global_step": 320364, "epoch": 2647} {"train_loss": -40.901588439941406, "global_step": 320365, "epoch": 2647} {"train_loss": -43.222328186035156, "global_step": 320366, "epoch": 2647} {"train_loss": -41.13447952270508, "global_step": 320367, "epoch": 2647} {"train_loss": -43.15092086791992, "global_step": 320368, "epoch": 2647} {"train_loss": -42.71998977661133, "global_step": 320369, "epoch": 2647} {"train_loss": -42.638671875, "global_step": 320370, "epoch": 2647} {"train_loss": -42.7343635559082, "global_step": 320371, "epoch": 2647} {"train_loss": -43.30149459838867, "global_step": 320372, "epoch": 2647} {"train_loss": -43.17683029174805, "global_step": 320373, "epoch": 2647} {"train_loss": -43.73696517944336, "global_step": 320374, "epoch": 2647} {"train_loss": -43.30381393432617, "global_step": 320375, "epoch": 2647} {"train_loss": -43.94132614135742, "global_step": 320376, "epoch": 2647} {"train_loss": -43.266822814941406, "global_step": 320377, "epoch": 2647} {"train_loss": -42.948387145996094, "global_step": 320378, "epoch": 2647} {"train_loss": -42.7401237487793, "global_step": 320379, "epoch": 2647} {"train_loss": -43.21250534057617, "global_step": 320380, "epoch": 2647} {"train_loss": -43.9364013671875, "global_step": 320381, "epoch": 2647} {"train_loss": -43.424049377441406, "global_step": 320382, "epoch": 2647} {"train_loss": -43.01886749267578, "global_step": 320383, "epoch": 2647} {"train_loss": -43.61690139770508, "global_step": 320384, "epoch": 2647} {"train_loss": -43.31105422973633, "global_step": 320385, "epoch": 2647} {"train_loss": -43.06057357788086, "global_step": 320386, "epoch": 2647} {"train_loss": -43.74862289428711, "global_step": 320387, "epoch": 2647} {"train_loss": -43.638301849365234, "global_step": 320388, "epoch": 2647} {"train_loss": -43.37154769897461, "global_step": 320389, "epoch": 2647} {"train_loss": -43.45294952392578, "global_step": 320390, "epoch": 2647} {"train_loss": -42.59131622314453, "global_step": 320391, "epoch": 2647} {"train_loss": -43.70400619506836, "global_step": 320392, "epoch": 2647} {"train_loss": -43.50001907348633, "global_step": 320393, "epoch": 2647} {"train_loss": -43.113868713378906, "global_step": 320394, "epoch": 2647} {"train_loss": -44.10535430908203, "global_step": 320395, "epoch": 2647} {"train_loss": -43.9551887512207, "global_step": 320396, "epoch": 2647} {"train_loss": -43.808326721191406, "global_step": 320397, "epoch": 2647} {"train_loss": -43.92390441894531, "global_step": 320398, "epoch": 2647} {"train_loss": -44.149085998535156, "global_step": 320399, "epoch": 2647} {"train_loss": -43.974578857421875, "global_step": 320400, "epoch": 2647} {"train_loss": -44.21220016479492, "global_step": 320401, "epoch": 2647} {"train_loss": -44.135292053222656, "global_step": 320402, "epoch": 2647} {"train_loss": -44.28093338012695, "global_step": 320403, "epoch": 2647} {"train_loss": -44.31855010986328, "global_step": 320404, "epoch": 2647} {"train_loss": -43.90182113647461, "global_step": 320405, "epoch": 2647} {"train_loss": -43.880943298339844, "global_step": 320406, "epoch": 2647} {"train_loss": -43.20805415634281, "global_step": 320407, "epoch": 2647, "val_loss": 2534454.75} {"train_loss": -43.99208450317383, "global_step": 320408, "epoch": 2648} {"train_loss": -44.750919342041016, "global_step": 320409, "epoch": 2648} {"train_loss": -44.79829788208008, "global_step": 320410, "epoch": 2648} {"train_loss": -43.95734405517578, "global_step": 320411, "epoch": 2648} {"train_loss": -44.89173126220703, "global_step": 320412, "epoch": 2648} {"train_loss": -44.37049102783203, "global_step": 320413, "epoch": 2648} {"train_loss": -44.311553955078125, "global_step": 320414, "epoch": 2648} {"train_loss": -44.831695556640625, "global_step": 320415, "epoch": 2648} {"train_loss": -44.851985931396484, "global_step": 320416, "epoch": 2648} {"train_loss": -44.42515182495117, "global_step": 320417, "epoch": 2648} {"train_loss": -44.74894332885742, "global_step": 320418, "epoch": 2648} {"train_loss": -44.621429443359375, "global_step": 320419, "epoch": 2648} {"train_loss": -44.50968551635742, "global_step": 320420, "epoch": 2648} {"train_loss": -44.464168548583984, "global_step": 320421, "epoch": 2648} {"train_loss": -44.638248443603516, "global_step": 320422, "epoch": 2648} {"train_loss": -44.41385269165039, "global_step": 320423, "epoch": 2648} {"train_loss": -44.3826789855957, "global_step": 320424, "epoch": 2648} {"train_loss": -44.33455276489258, "global_step": 320425, "epoch": 2648} {"train_loss": -44.52374267578125, "global_step": 320426, "epoch": 2648} {"train_loss": -44.573219299316406, "global_step": 320427, "epoch": 2648} {"train_loss": -44.38127517700195, "global_step": 320428, "epoch": 2648} {"train_loss": -44.858062744140625, "global_step": 320429, "epoch": 2648} {"train_loss": -45.3653450012207, "global_step": 320430, "epoch": 2648} {"train_loss": -43.84756088256836, "global_step": 320431, "epoch": 2648} {"train_loss": -44.94025802612305, "global_step": 320432, "epoch": 2648} {"train_loss": -45.139320373535156, "global_step": 320433, "epoch": 2648} {"train_loss": -44.99020767211914, "global_step": 320434, "epoch": 2648} {"train_loss": -45.152793884277344, "global_step": 320435, "epoch": 2648} {"train_loss": -44.856746673583984, "global_step": 320436, "epoch": 2648} {"train_loss": -44.830562591552734, "global_step": 320437, "epoch": 2648} {"train_loss": -45.143428802490234, "global_step": 320438, "epoch": 2648} {"train_loss": -45.28082275390625, "global_step": 320439, "epoch": 2648} {"train_loss": -45.032222747802734, "global_step": 320440, "epoch": 2648} {"train_loss": -45.52403259277344, "global_step": 320441, "epoch": 2648} {"train_loss": -45.18966293334961, "global_step": 320442, "epoch": 2648} {"train_loss": -44.79801559448242, "global_step": 320443, "epoch": 2648} {"train_loss": -45.12315368652344, "global_step": 320444, "epoch": 2648} {"train_loss": -45.32166290283203, "global_step": 320445, "epoch": 2648} {"train_loss": -45.373653411865234, "global_step": 320446, "epoch": 2648} {"train_loss": -45.00069808959961, "global_step": 320447, "epoch": 2648} {"train_loss": -45.11016845703125, "global_step": 320448, "epoch": 2648} {"train_loss": -45.22547912597656, "global_step": 320449, "epoch": 2648} {"train_loss": -45.5776481628418, "global_step": 320450, "epoch": 2648} {"train_loss": -44.95733642578125, "global_step": 320451, "epoch": 2648} {"train_loss": -44.87289047241211, "global_step": 320452, "epoch": 2648} {"train_loss": -45.21883773803711, "global_step": 320453, "epoch": 2648} {"train_loss": -44.92228317260742, "global_step": 320454, "epoch": 2648} {"train_loss": -44.81821823120117, "global_step": 320455, "epoch": 2648} {"train_loss": -45.47148513793945, "global_step": 320456, "epoch": 2648} {"train_loss": -45.596858978271484, "global_step": 320457, "epoch": 2648} {"train_loss": -44.59764862060547, "global_step": 320458, "epoch": 2648} {"train_loss": -44.277889251708984, "global_step": 320459, "epoch": 2648} {"train_loss": -45.351966857910156, "global_step": 320460, "epoch": 2648} {"train_loss": -45.088069915771484, "global_step": 320461, "epoch": 2648} {"train_loss": -44.6180534362793, "global_step": 320462, "epoch": 2648} {"train_loss": -45.80709457397461, "global_step": 320463, "epoch": 2648} {"train_loss": -45.166908264160156, "global_step": 320464, "epoch": 2648} {"train_loss": -44.68396759033203, "global_step": 320465, "epoch": 2648} {"train_loss": -44.70368957519531, "global_step": 320466, "epoch": 2648} {"train_loss": -44.524085998535156, "global_step": 320467, "epoch": 2648} {"train_loss": -45.18536376953125, "global_step": 320468, "epoch": 2648} {"train_loss": -44.626625061035156, "global_step": 320469, "epoch": 2648} {"train_loss": -44.33806610107422, "global_step": 320470, "epoch": 2648} {"train_loss": -44.92466354370117, "global_step": 320471, "epoch": 2648} {"train_loss": -44.048377990722656, "global_step": 320472, "epoch": 2648} {"train_loss": -43.3701057434082, "global_step": 320473, "epoch": 2648} {"train_loss": -43.706764221191406, "global_step": 320474, "epoch": 2648} {"train_loss": -43.76025390625, "global_step": 320475, "epoch": 2648} {"train_loss": -44.91372299194336, "global_step": 320476, "epoch": 2648} {"train_loss": -44.3151969909668, "global_step": 320477, "epoch": 2648} {"train_loss": -42.945003509521484, "global_step": 320478, "epoch": 2648} {"train_loss": -42.217281341552734, "global_step": 320479, "epoch": 2648} {"train_loss": -42.8542594909668, "global_step": 320480, "epoch": 2648} {"train_loss": -42.62295913696289, "global_step": 320481, "epoch": 2648} {"train_loss": -43.41036605834961, "global_step": 320482, "epoch": 2648} {"train_loss": -43.41315841674805, "global_step": 320483, "epoch": 2648} {"train_loss": -43.899017333984375, "global_step": 320484, "epoch": 2648} {"train_loss": -43.76923370361328, "global_step": 320485, "epoch": 2648} {"train_loss": -43.419532775878906, "global_step": 320486, "epoch": 2648} {"train_loss": -42.640052795410156, "global_step": 320487, "epoch": 2648} {"train_loss": -43.75628662109375, "global_step": 320488, "epoch": 2648} {"train_loss": -44.0792121887207, "global_step": 320489, "epoch": 2648} {"train_loss": -42.46204376220703, "global_step": 320490, "epoch": 2648} {"train_loss": -42.973175048828125, "global_step": 320491, "epoch": 2648} {"train_loss": -42.245784759521484, "global_step": 320492, "epoch": 2648} {"train_loss": -40.95207595825195, "global_step": 320493, "epoch": 2648} {"train_loss": -43.66508102416992, "global_step": 320494, "epoch": 2648} {"train_loss": -43.34812545776367, "global_step": 320495, "epoch": 2648} {"train_loss": -41.5710563659668, "global_step": 320496, "epoch": 2648} {"train_loss": -40.9281005859375, "global_step": 320497, "epoch": 2648} {"train_loss": -42.64242172241211, "global_step": 320498, "epoch": 2648} {"train_loss": -41.00090026855469, "global_step": 320499, "epoch": 2648} {"train_loss": -40.50659942626953, "global_step": 320500, "epoch": 2648} {"train_loss": -42.6128044128418, "global_step": 320501, "epoch": 2648} {"train_loss": -41.589698791503906, "global_step": 320502, "epoch": 2648} {"train_loss": -42.170772552490234, "global_step": 320503, "epoch": 2648} {"train_loss": -43.33721923828125, "global_step": 320504, "epoch": 2648} {"train_loss": -42.28662109375, "global_step": 320505, "epoch": 2648} {"train_loss": -41.920555114746094, "global_step": 320506, "epoch": 2648} {"train_loss": -42.75680160522461, "global_step": 320507, "epoch": 2648} {"train_loss": -41.6309928894043, "global_step": 320508, "epoch": 2648} {"train_loss": -42.097869873046875, "global_step": 320509, "epoch": 2648} {"train_loss": -43.6243896484375, "global_step": 320510, "epoch": 2648} {"train_loss": -41.91572189331055, "global_step": 320511, "epoch": 2648} {"train_loss": -42.45610427856445, "global_step": 320512, "epoch": 2648} {"train_loss": -42.51582717895508, "global_step": 320513, "epoch": 2648} {"train_loss": -42.298683166503906, "global_step": 320514, "epoch": 2648} {"train_loss": -43.95154571533203, "global_step": 320515, "epoch": 2648} {"train_loss": -43.50288009643555, "global_step": 320516, "epoch": 2648} {"train_loss": -42.899688720703125, "global_step": 320517, "epoch": 2648} {"train_loss": -43.484615325927734, "global_step": 320518, "epoch": 2648} {"train_loss": -43.46590805053711, "global_step": 320519, "epoch": 2648} {"train_loss": -43.046669006347656, "global_step": 320520, "epoch": 2648} {"train_loss": -43.88442611694336, "global_step": 320521, "epoch": 2648} {"train_loss": -43.326717376708984, "global_step": 320522, "epoch": 2648} {"train_loss": -43.737361907958984, "global_step": 320523, "epoch": 2648} {"train_loss": -43.465789794921875, "global_step": 320524, "epoch": 2648} {"train_loss": -44.2097053527832, "global_step": 320525, "epoch": 2648} {"train_loss": -44.057891845703125, "global_step": 320526, "epoch": 2648} {"train_loss": -44.2864875793457, "global_step": 320527, "epoch": 2648} {"train_loss": -43.96757151075631, "global_step": 320528, "epoch": 2648, "val_loss": 2547098.25} {"train_loss": -44.32929611206055, "global_step": 320529, "epoch": 2649} {"train_loss": -44.686614990234375, "global_step": 320530, "epoch": 2649} {"train_loss": -44.1435546875, "global_step": 320531, "epoch": 2649} {"train_loss": -44.32900619506836, "global_step": 320532, "epoch": 2649} {"train_loss": -44.54127502441406, "global_step": 320533, "epoch": 2649} {"train_loss": -44.133724212646484, "global_step": 320534, "epoch": 2649} {"train_loss": -44.330501556396484, "global_step": 320535, "epoch": 2649} {"train_loss": -44.52528762817383, "global_step": 320536, "epoch": 2649} {"train_loss": -44.639286041259766, "global_step": 320537, "epoch": 2649} {"train_loss": -44.10896301269531, "global_step": 320538, "epoch": 2649} {"train_loss": -44.76310348510742, "global_step": 320539, "epoch": 2649} {"train_loss": -44.423160552978516, "global_step": 320540, "epoch": 2649} {"train_loss": -44.28757858276367, "global_step": 320541, "epoch": 2649} {"train_loss": -44.65433120727539, "global_step": 320542, "epoch": 2649} {"train_loss": -44.6499137878418, "global_step": 320543, "epoch": 2649} {"train_loss": -44.601104736328125, "global_step": 320544, "epoch": 2649} {"train_loss": -44.638763427734375, "global_step": 320545, "epoch": 2649} {"train_loss": -44.52088165283203, "global_step": 320546, "epoch": 2649} {"train_loss": -44.716766357421875, "global_step": 320547, "epoch": 2649} {"train_loss": -44.68773651123047, "global_step": 320548, "epoch": 2649} {"train_loss": -44.8453254699707, "global_step": 320549, "epoch": 2649} {"train_loss": -44.82082748413086, "global_step": 320550, "epoch": 2649} {"train_loss": -45.045654296875, "global_step": 320551, "epoch": 2649} {"train_loss": -44.75252151489258, "global_step": 320552, "epoch": 2649} {"train_loss": -44.344482421875, "global_step": 320553, "epoch": 2649} {"train_loss": -44.47463607788086, "global_step": 320554, "epoch": 2649} {"train_loss": -45.25579833984375, "global_step": 320555, "epoch": 2649} {"train_loss": -43.714393615722656, "global_step": 320556, "epoch": 2649} {"train_loss": -44.709922790527344, "global_step": 320557, "epoch": 2649} {"train_loss": -45.228633880615234, "global_step": 320558, "epoch": 2649} {"train_loss": -44.352134704589844, "global_step": 320559, "epoch": 2649} {"train_loss": -44.34434127807617, "global_step": 320560, "epoch": 2649} {"train_loss": -45.11409378051758, "global_step": 320561, "epoch": 2649} {"train_loss": -44.1889533996582, "global_step": 320562, "epoch": 2649} {"train_loss": -45.28520202636719, "global_step": 320563, "epoch": 2649} {"train_loss": -45.135494232177734, "global_step": 320564, "epoch": 2649} {"train_loss": -44.15699768066406, "global_step": 320565, "epoch": 2649} {"train_loss": -44.3001823425293, "global_step": 320566, "epoch": 2649} {"train_loss": -44.984100341796875, "global_step": 320567, "epoch": 2649} {"train_loss": -44.305667877197266, "global_step": 320568, "epoch": 2649} {"train_loss": -44.4965705871582, "global_step": 320569, "epoch": 2649} {"train_loss": -44.93830871582031, "global_step": 320570, "epoch": 2649} {"train_loss": -44.23089599609375, "global_step": 320571, "epoch": 2649} {"train_loss": -44.56056213378906, "global_step": 320572, "epoch": 2649} {"train_loss": -44.217010498046875, "global_step": 320573, "epoch": 2649} {"train_loss": -44.60250473022461, "global_step": 320574, "epoch": 2649} {"train_loss": -44.6694450378418, "global_step": 320575, "epoch": 2649} {"train_loss": -44.15775680541992, "global_step": 320576, "epoch": 2649} {"train_loss": -43.3056526184082, "global_step": 320577, "epoch": 2649} {"train_loss": -43.89143371582031, "global_step": 320578, "epoch": 2649} {"train_loss": -44.46944046020508, "global_step": 320579, "epoch": 2649} {"train_loss": -44.31229782104492, "global_step": 320580, "epoch": 2649} {"train_loss": -44.370243072509766, "global_step": 320581, "epoch": 2649} {"train_loss": -44.44648361206055, "global_step": 320582, "epoch": 2649} {"train_loss": -44.069725036621094, "global_step": 320583, "epoch": 2649} {"train_loss": -44.524715423583984, "global_step": 320584, "epoch": 2649} {"train_loss": -44.85601043701172, "global_step": 320585, "epoch": 2649} {"train_loss": -43.92654037475586, "global_step": 320586, "epoch": 2649} {"train_loss": -44.78585433959961, "global_step": 320587, "epoch": 2649} {"train_loss": -44.44060516357422, "global_step": 320588, "epoch": 2649} {"train_loss": -44.943992614746094, "global_step": 320589, "epoch": 2649} {"train_loss": -44.85292434692383, "global_step": 320590, "epoch": 2649} {"train_loss": -44.75792694091797, "global_step": 320591, "epoch": 2649} {"train_loss": -45.26613998413086, "global_step": 320592, "epoch": 2649} {"train_loss": -44.779781341552734, "global_step": 320593, "epoch": 2649} {"train_loss": -44.26871871948242, "global_step": 320594, "epoch": 2649} {"train_loss": -44.12397384643555, "global_step": 320595, "epoch": 2649} {"train_loss": -43.52501678466797, "global_step": 320596, "epoch": 2649} {"train_loss": -44.237545013427734, "global_step": 320597, "epoch": 2649} {"train_loss": -44.887569427490234, "global_step": 320598, "epoch": 2649} {"train_loss": -43.90176010131836, "global_step": 320599, "epoch": 2649} {"train_loss": -44.27036666870117, "global_step": 320600, "epoch": 2649} {"train_loss": -44.06256866455078, "global_step": 320601, "epoch": 2649} {"train_loss": -43.61594009399414, "global_step": 320602, "epoch": 2649} {"train_loss": -42.50304412841797, "global_step": 320603, "epoch": 2649} {"train_loss": -43.76839828491211, "global_step": 320604, "epoch": 2649} {"train_loss": -43.372562408447266, "global_step": 320605, "epoch": 2649} {"train_loss": -44.495338439941406, "global_step": 320606, "epoch": 2649} {"train_loss": -42.99753189086914, "global_step": 320607, "epoch": 2649} {"train_loss": -43.82520294189453, "global_step": 320608, "epoch": 2649} {"train_loss": -44.113155364990234, "global_step": 320609, "epoch": 2649} {"train_loss": -43.3281135559082, "global_step": 320610, "epoch": 2649} {"train_loss": -43.90537643432617, "global_step": 320611, "epoch": 2649} {"train_loss": -44.2394905090332, "global_step": 320612, "epoch": 2649} {"train_loss": -41.8112907409668, "global_step": 320613, "epoch": 2649} {"train_loss": -43.54252243041992, "global_step": 320614, "epoch": 2649} {"train_loss": -44.03736877441406, "global_step": 320615, "epoch": 2649} {"train_loss": -43.308345794677734, "global_step": 320616, "epoch": 2649} {"train_loss": -43.50921630859375, "global_step": 320617, "epoch": 2649} {"train_loss": -43.80082321166992, "global_step": 320618, "epoch": 2649} {"train_loss": -43.374000549316406, "global_step": 320619, "epoch": 2649} {"train_loss": -44.46372604370117, "global_step": 320620, "epoch": 2649} {"train_loss": -43.79213333129883, "global_step": 320621, "epoch": 2649} {"train_loss": -44.24093246459961, "global_step": 320622, "epoch": 2649} {"train_loss": -44.4755859375, "global_step": 320623, "epoch": 2649} {"train_loss": -44.13707733154297, "global_step": 320624, "epoch": 2649} {"train_loss": -44.44964599609375, "global_step": 320625, "epoch": 2649} {"train_loss": -44.098365783691406, "global_step": 320626, "epoch": 2649} {"train_loss": -44.86690139770508, "global_step": 320627, "epoch": 2649} {"train_loss": -43.77339553833008, "global_step": 320628, "epoch": 2649} {"train_loss": -43.94537353515625, "global_step": 320629, "epoch": 2649} {"train_loss": -44.3216667175293, "global_step": 320630, "epoch": 2649} {"train_loss": -43.650943756103516, "global_step": 320631, "epoch": 2649} {"train_loss": -43.56266403198242, "global_step": 320632, "epoch": 2649} {"train_loss": -44.07304000854492, "global_step": 320633, "epoch": 2649} {"train_loss": -44.48379135131836, "global_step": 320634, "epoch": 2649} {"train_loss": -43.728179931640625, "global_step": 320635, "epoch": 2649} {"train_loss": -44.3113899230957, "global_step": 320636, "epoch": 2649} {"train_loss": -44.200565338134766, "global_step": 320637, "epoch": 2649} {"train_loss": -44.570125579833984, "global_step": 320638, "epoch": 2649} {"train_loss": -44.30233383178711, "global_step": 320639, "epoch": 2649} {"train_loss": -44.07648468017578, "global_step": 320640, "epoch": 2649} {"train_loss": -44.0820198059082, "global_step": 320641, "epoch": 2649} {"train_loss": -44.14021682739258, "global_step": 320642, "epoch": 2649} {"train_loss": -44.65315628051758, "global_step": 320643, "epoch": 2649} {"train_loss": -43.32514572143555, "global_step": 320644, "epoch": 2649} {"train_loss": -43.702980041503906, "global_step": 320645, "epoch": 2649} {"train_loss": -44.115482330322266, "global_step": 320646, "epoch": 2649} {"train_loss": -44.590126037597656, "global_step": 320647, "epoch": 2649} {"train_loss": -43.472267150878906, "global_step": 320648, "epoch": 2649} {"train_loss": -44.246496531588974, "global_step": 320649, "epoch": 2649, "val_loss": 2482711.5} {"train_loss": -43.47666549682617, "global_step": 320650, "epoch": 2650} {"train_loss": -44.113189697265625, "global_step": 320651, "epoch": 2650} {"train_loss": -44.60558319091797, "global_step": 320652, "epoch": 2650} {"train_loss": -43.26009750366211, "global_step": 320653, "epoch": 2650} {"train_loss": -44.18534469604492, "global_step": 320654, "epoch": 2650} {"train_loss": -45.117000579833984, "global_step": 320655, "epoch": 2650} {"train_loss": -44.736572265625, "global_step": 320656, "epoch": 2650} {"train_loss": -44.14299774169922, "global_step": 320657, "epoch": 2650} {"train_loss": -44.65757751464844, "global_step": 320658, "epoch": 2650} {"train_loss": -44.8308219909668, "global_step": 320659, "epoch": 2650} {"train_loss": -44.61078643798828, "global_step": 320660, "epoch": 2650} {"train_loss": -44.04999542236328, "global_step": 320661, "epoch": 2650} {"train_loss": -44.0790901184082, "global_step": 320662, "epoch": 2650} {"train_loss": -45.031341552734375, "global_step": 320663, "epoch": 2650} {"train_loss": -44.78279113769531, "global_step": 320664, "epoch": 2650} {"train_loss": -43.8782958984375, "global_step": 320665, "epoch": 2650} {"train_loss": -44.39741897583008, "global_step": 320666, "epoch": 2650} {"train_loss": -45.064666748046875, "global_step": 320667, "epoch": 2650} {"train_loss": -43.784828186035156, "global_step": 320668, "epoch": 2650} {"train_loss": -42.46525955200195, "global_step": 320669, "epoch": 2650} {"train_loss": -44.86466598510742, "global_step": 320670, "epoch": 2650} {"train_loss": -43.87559127807617, "global_step": 320671, "epoch": 2650} {"train_loss": -43.4227294921875, "global_step": 320672, "epoch": 2650} {"train_loss": -44.215206146240234, "global_step": 320673, "epoch": 2650} {"train_loss": -44.827327728271484, "global_step": 320674, "epoch": 2650} {"train_loss": -44.34159469604492, "global_step": 320675, "epoch": 2650} {"train_loss": -42.4211311340332, "global_step": 320676, "epoch": 2650} {"train_loss": -44.1651611328125, "global_step": 320677, "epoch": 2650} {"train_loss": -44.278297424316406, "global_step": 320678, "epoch": 2650} {"train_loss": -44.276973724365234, "global_step": 320679, "epoch": 2650} {"train_loss": -44.22479248046875, "global_step": 320680, "epoch": 2650} {"train_loss": -44.5745849609375, "global_step": 320681, "epoch": 2650} {"train_loss": -44.62702560424805, "global_step": 320682, "epoch": 2650} {"train_loss": -44.85614013671875, "global_step": 320683, "epoch": 2650} {"train_loss": -44.7498893737793, "global_step": 320684, "epoch": 2650} {"train_loss": -44.471649169921875, "global_step": 320685, "epoch": 2650} {"train_loss": -44.92689514160156, "global_step": 320686, "epoch": 2650} {"train_loss": -44.437530517578125, "global_step": 320687, "epoch": 2650} {"train_loss": -45.038631439208984, "global_step": 320688, "epoch": 2650} {"train_loss": -44.506465911865234, "global_step": 320689, "epoch": 2650} {"train_loss": -45.04674530029297, "global_step": 320690, "epoch": 2650} {"train_loss": -44.812103271484375, "global_step": 320691, "epoch": 2650} {"train_loss": -44.52961349487305, "global_step": 320692, "epoch": 2650} {"train_loss": -43.748451232910156, "global_step": 320693, "epoch": 2650} {"train_loss": -44.398956298828125, "global_step": 320694, "epoch": 2650} {"train_loss": -44.40298843383789, "global_step": 320695, "epoch": 2650} {"train_loss": -43.9459342956543, "global_step": 320696, "epoch": 2650} {"train_loss": -45.14717483520508, "global_step": 320697, "epoch": 2650} {"train_loss": -44.8210563659668, "global_step": 320698, "epoch": 2650} {"train_loss": -44.083274841308594, "global_step": 320699, "epoch": 2650} {"train_loss": -44.697425842285156, "global_step": 320700, "epoch": 2650} {"train_loss": -45.33845901489258, "global_step": 320701, "epoch": 2650} {"train_loss": -44.339412689208984, "global_step": 320702, "epoch": 2650} {"train_loss": -43.62075424194336, "global_step": 320703, "epoch": 2650} {"train_loss": -43.408660888671875, "global_step": 320704, "epoch": 2650} {"train_loss": -43.7017822265625, "global_step": 320705, "epoch": 2650} {"train_loss": -43.42694091796875, "global_step": 320706, "epoch": 2650} {"train_loss": -43.5808219909668, "global_step": 320707, "epoch": 2650} {"train_loss": -44.410396575927734, "global_step": 320708, "epoch": 2650} {"train_loss": -42.419212341308594, "global_step": 320709, "epoch": 2650} {"train_loss": -42.272789001464844, "global_step": 320710, "epoch": 2650} {"train_loss": -43.821651458740234, "global_step": 320711, "epoch": 2650} {"train_loss": -42.87087631225586, "global_step": 320712, "epoch": 2650} {"train_loss": -42.4741096496582, "global_step": 320713, "epoch": 2650} {"train_loss": -42.73637771606445, "global_step": 320714, "epoch": 2650} {"train_loss": -42.693721771240234, "global_step": 320715, "epoch": 2650} {"train_loss": -43.905208587646484, "global_step": 320716, "epoch": 2650} {"train_loss": -42.472267150878906, "global_step": 320717, "epoch": 2650} {"train_loss": -43.59550094604492, "global_step": 320718, "epoch": 2650} {"train_loss": -42.266422271728516, "global_step": 320719, "epoch": 2650} {"train_loss": -43.50362777709961, "global_step": 320720, "epoch": 2650} {"train_loss": -42.349056243896484, "global_step": 320721, "epoch": 2650} {"train_loss": -41.55778503417969, "global_step": 320722, "epoch": 2650} {"train_loss": -44.30866622924805, "global_step": 320723, "epoch": 2650} {"train_loss": -42.729278564453125, "global_step": 320724, "epoch": 2650} {"train_loss": -40.832618713378906, "global_step": 320725, "epoch": 2650} {"train_loss": -42.564205169677734, "global_step": 320726, "epoch": 2650} {"train_loss": -44.062225341796875, "global_step": 320727, "epoch": 2650} {"train_loss": -41.749752044677734, "global_step": 320728, "epoch": 2650} {"train_loss": -42.556854248046875, "global_step": 320729, "epoch": 2650} {"train_loss": -43.41767501831055, "global_step": 320730, "epoch": 2650} {"train_loss": -41.375972747802734, "global_step": 320731, "epoch": 2650} {"train_loss": -42.09206008911133, "global_step": 320732, "epoch": 2650} {"train_loss": -42.99638748168945, "global_step": 320733, "epoch": 2650} {"train_loss": -42.88650894165039, "global_step": 320734, "epoch": 2650} {"train_loss": -42.99988555908203, "global_step": 320735, "epoch": 2650} {"train_loss": -43.49235916137695, "global_step": 320736, "epoch": 2650} {"train_loss": -41.68140411376953, "global_step": 320737, "epoch": 2650} {"train_loss": -43.84904479980469, "global_step": 320738, "epoch": 2650} {"train_loss": -42.48476028442383, "global_step": 320739, "epoch": 2650} {"train_loss": -41.97173309326172, "global_step": 320740, "epoch": 2650} {"train_loss": -43.666683197021484, "global_step": 320741, "epoch": 2650} {"train_loss": -43.07183074951172, "global_step": 320742, "epoch": 2650} {"train_loss": -42.41887283325195, "global_step": 320743, "epoch": 2650} {"train_loss": -41.42373275756836, "global_step": 320744, "epoch": 2650} {"train_loss": -43.200462341308594, "global_step": 320745, "epoch": 2650} {"train_loss": -42.30595016479492, "global_step": 320746, "epoch": 2650} {"train_loss": -42.27503204345703, "global_step": 320747, "epoch": 2650} {"train_loss": -43.6400146484375, "global_step": 320748, "epoch": 2650} {"train_loss": -42.69009780883789, "global_step": 320749, "epoch": 2650} {"train_loss": -41.48469543457031, "global_step": 320750, "epoch": 2650} {"train_loss": -42.92658615112305, "global_step": 320751, "epoch": 2650} {"train_loss": -42.813594818115234, "global_step": 320752, "epoch": 2650} {"train_loss": -42.97124099731445, "global_step": 320753, "epoch": 2650} {"train_loss": -43.12351608276367, "global_step": 320754, "epoch": 2650} {"train_loss": -43.71389389038086, "global_step": 320755, "epoch": 2650} {"train_loss": -41.609886169433594, "global_step": 320756, "epoch": 2650} {"train_loss": -42.99208068847656, "global_step": 320757, "epoch": 2650} {"train_loss": -43.1489372253418, "global_step": 320758, "epoch": 2650} {"train_loss": -41.71537780761719, "global_step": 320759, "epoch": 2650} {"train_loss": -42.46844482421875, "global_step": 320760, "epoch": 2650} {"train_loss": -41.78467559814453, "global_step": 320761, "epoch": 2650} {"train_loss": -43.58989334106445, "global_step": 320762, "epoch": 2650} {"train_loss": -42.138832092285156, "global_step": 320763, "epoch": 2650} {"train_loss": -43.969749450683594, "global_step": 320764, "epoch": 2650} {"train_loss": -42.7597770690918, "global_step": 320765, "epoch": 2650} {"train_loss": -42.8753547668457, "global_step": 320766, "epoch": 2650} {"train_loss": -42.77070999145508, "global_step": 320767, "epoch": 2650} {"train_loss": -42.81360626220703, "global_step": 320768, "epoch": 2650} {"train_loss": -43.30175018310547, "global_step": 320769, "epoch": 2650} {"train_loss": -43.506565062467715, "global_step": 320770, "epoch": 2650, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2504409.75} {"train_loss": -42.57428741455078, "global_step": 320771, "epoch": 2651} {"train_loss": -43.939453125, "global_step": 320772, "epoch": 2651} {"train_loss": -43.24380111694336, "global_step": 320773, "epoch": 2651} {"train_loss": -43.823341369628906, "global_step": 320774, "epoch": 2651} {"train_loss": -44.482540130615234, "global_step": 320775, "epoch": 2651} {"train_loss": -42.9395637512207, "global_step": 320776, "epoch": 2651} {"train_loss": -43.22759246826172, "global_step": 320777, "epoch": 2651} {"train_loss": -44.346466064453125, "global_step": 320778, "epoch": 2651} {"train_loss": -43.90011215209961, "global_step": 320779, "epoch": 2651} {"train_loss": -44.56740951538086, "global_step": 320780, "epoch": 2651} {"train_loss": -43.79409408569336, "global_step": 320781, "epoch": 2651} {"train_loss": -44.0186882019043, "global_step": 320782, "epoch": 2651} {"train_loss": -44.26756286621094, "global_step": 320783, "epoch": 2651} {"train_loss": -44.5953254699707, "global_step": 320784, "epoch": 2651} {"train_loss": -43.87966537475586, "global_step": 320785, "epoch": 2651} {"train_loss": -43.73125076293945, "global_step": 320786, "epoch": 2651} {"train_loss": -44.002525329589844, "global_step": 320787, "epoch": 2651} {"train_loss": -44.0279541015625, "global_step": 320788, "epoch": 2651} {"train_loss": -43.32680130004883, "global_step": 320789, "epoch": 2651} {"train_loss": -44.848785400390625, "global_step": 320790, "epoch": 2651} {"train_loss": -44.28231430053711, "global_step": 320791, "epoch": 2651} {"train_loss": -44.36865997314453, "global_step": 320792, "epoch": 2651} {"train_loss": -44.54191207885742, "global_step": 320793, "epoch": 2651} {"train_loss": -44.12776565551758, "global_step": 320794, "epoch": 2651} {"train_loss": -44.81637954711914, "global_step": 320795, "epoch": 2651} {"train_loss": -44.18819808959961, "global_step": 320796, "epoch": 2651} {"train_loss": -44.27054977416992, "global_step": 320797, "epoch": 2651} {"train_loss": -44.580230712890625, "global_step": 320798, "epoch": 2651} {"train_loss": -44.553955078125, "global_step": 320799, "epoch": 2651} {"train_loss": -44.236507415771484, "global_step": 320800, "epoch": 2651} {"train_loss": -44.77535629272461, "global_step": 320801, "epoch": 2651} {"train_loss": -44.527339935302734, "global_step": 320802, "epoch": 2651} {"train_loss": -43.65717315673828, "global_step": 320803, "epoch": 2651} {"train_loss": -44.63417434692383, "global_step": 320804, "epoch": 2651} {"train_loss": -44.01001739501953, "global_step": 320805, "epoch": 2651} {"train_loss": -44.79989242553711, "global_step": 320806, "epoch": 2651} {"train_loss": -44.15131378173828, "global_step": 320807, "epoch": 2651} {"train_loss": -44.930206298828125, "global_step": 320808, "epoch": 2651} {"train_loss": -44.769508361816406, "global_step": 320809, "epoch": 2651} {"train_loss": -44.625404357910156, "global_step": 320810, "epoch": 2651} {"train_loss": -44.99174880981445, "global_step": 320811, "epoch": 2651} {"train_loss": -44.50282287597656, "global_step": 320812, "epoch": 2651} {"train_loss": -44.88222122192383, "global_step": 320813, "epoch": 2651} {"train_loss": -45.15152359008789, "global_step": 320814, "epoch": 2651} {"train_loss": -44.54020309448242, "global_step": 320815, "epoch": 2651} {"train_loss": -44.99470138549805, "global_step": 320816, "epoch": 2651} {"train_loss": -44.76145553588867, "global_step": 320817, "epoch": 2651} {"train_loss": -45.10017013549805, "global_step": 320818, "epoch": 2651} {"train_loss": -44.69735336303711, "global_step": 320819, "epoch": 2651} {"train_loss": -45.01463317871094, "global_step": 320820, "epoch": 2651} {"train_loss": -45.33506393432617, "global_step": 320821, "epoch": 2651} {"train_loss": -45.0298957824707, "global_step": 320822, "epoch": 2651} {"train_loss": -45.26250457763672, "global_step": 320823, "epoch": 2651} {"train_loss": -45.3731575012207, "global_step": 320824, "epoch": 2651} {"train_loss": -44.71761703491211, "global_step": 320825, "epoch": 2651} {"train_loss": -45.17363357543945, "global_step": 320826, "epoch": 2651} {"train_loss": -45.37308883666992, "global_step": 320827, "epoch": 2651} {"train_loss": -45.07699203491211, "global_step": 320828, "epoch": 2651} {"train_loss": -45.37335968017578, "global_step": 320829, "epoch": 2651} {"train_loss": -44.80335235595703, "global_step": 320830, "epoch": 2651} {"train_loss": -45.2601318359375, "global_step": 320831, "epoch": 2651} {"train_loss": -45.56722640991211, "global_step": 320832, "epoch": 2651} {"train_loss": -44.75657653808594, "global_step": 320833, "epoch": 2651} {"train_loss": -45.239402770996094, "global_step": 320834, "epoch": 2651} {"train_loss": -44.829036712646484, "global_step": 320835, "epoch": 2651} {"train_loss": -44.9034538269043, "global_step": 320836, "epoch": 2651} {"train_loss": -45.14423370361328, "global_step": 320837, "epoch": 2651} {"train_loss": -44.4306640625, "global_step": 320838, "epoch": 2651} {"train_loss": -44.93716049194336, "global_step": 320839, "epoch": 2651} {"train_loss": -45.28241729736328, "global_step": 320840, "epoch": 2651} {"train_loss": -44.01468276977539, "global_step": 320841, "epoch": 2651} {"train_loss": -43.91689682006836, "global_step": 320842, "epoch": 2651} {"train_loss": -44.8305549621582, "global_step": 320843, "epoch": 2651} {"train_loss": -44.55214309692383, "global_step": 320844, "epoch": 2651} {"train_loss": -44.695457458496094, "global_step": 320845, "epoch": 2651} {"train_loss": -44.77370071411133, "global_step": 320846, "epoch": 2651} {"train_loss": -42.772247314453125, "global_step": 320847, "epoch": 2651} {"train_loss": -43.55839157104492, "global_step": 320848, "epoch": 2651} {"train_loss": -45.352054595947266, "global_step": 320849, "epoch": 2651} {"train_loss": -43.4473762512207, "global_step": 320850, "epoch": 2651} {"train_loss": -43.16270065307617, "global_step": 320851, "epoch": 2651} {"train_loss": -44.633235931396484, "global_step": 320852, "epoch": 2651} {"train_loss": -42.786224365234375, "global_step": 320853, "epoch": 2651} {"train_loss": -40.94380569458008, "global_step": 320854, "epoch": 2651} {"train_loss": -44.24691390991211, "global_step": 320855, "epoch": 2651} {"train_loss": -39.39021682739258, "global_step": 320856, "epoch": 2651} {"train_loss": -43.87776565551758, "global_step": 320857, "epoch": 2651} {"train_loss": -39.62679672241211, "global_step": 320858, "epoch": 2651} {"train_loss": -42.70893096923828, "global_step": 320859, "epoch": 2651} {"train_loss": -42.23107147216797, "global_step": 320860, "epoch": 2651} {"train_loss": -42.209896087646484, "global_step": 320861, "epoch": 2651} {"train_loss": -42.91346740722656, "global_step": 320862, "epoch": 2651} {"train_loss": -41.313106536865234, "global_step": 320863, "epoch": 2651} {"train_loss": -43.140220642089844, "global_step": 320864, "epoch": 2651} {"train_loss": -42.399295806884766, "global_step": 320865, "epoch": 2651} {"train_loss": -43.32246780395508, "global_step": 320866, "epoch": 2651} {"train_loss": -42.57354736328125, "global_step": 320867, "epoch": 2651} {"train_loss": -44.02211380004883, "global_step": 320868, "epoch": 2651} {"train_loss": -43.679141998291016, "global_step": 320869, "epoch": 2651} {"train_loss": -42.905941009521484, "global_step": 320870, "epoch": 2651} {"train_loss": -44.1644172668457, "global_step": 320871, "epoch": 2651} {"train_loss": -43.388023376464844, "global_step": 320872, "epoch": 2651} {"train_loss": -43.6597785949707, "global_step": 320873, "epoch": 2651} {"train_loss": -43.350372314453125, "global_step": 320874, "epoch": 2651} {"train_loss": -43.48299789428711, "global_step": 320875, "epoch": 2651} {"train_loss": -43.5081787109375, "global_step": 320876, "epoch": 2651} {"train_loss": -42.3069953918457, "global_step": 320877, "epoch": 2651} {"train_loss": -43.94586181640625, "global_step": 320878, "epoch": 2651} {"train_loss": -42.9958610534668, "global_step": 320879, "epoch": 2651} {"train_loss": -43.27315902709961, "global_step": 320880, "epoch": 2651} {"train_loss": -43.01844787597656, "global_step": 320881, "epoch": 2651} {"train_loss": -41.81599807739258, "global_step": 320882, "epoch": 2651} {"train_loss": -42.98688507080078, "global_step": 320883, "epoch": 2651} {"train_loss": -43.131797790527344, "global_step": 320884, "epoch": 2651} {"train_loss": -43.1629753112793, "global_step": 320885, "epoch": 2651} {"train_loss": -42.97010040283203, "global_step": 320886, "epoch": 2651} {"train_loss": -43.277252197265625, "global_step": 320887, "epoch": 2651} {"train_loss": -43.997894287109375, "global_step": 320888, "epoch": 2651} {"train_loss": -43.370643615722656, "global_step": 320889, "epoch": 2651} {"train_loss": -44.30903244018555, "global_step": 320890, "epoch": 2651} {"train_loss": -43.97375406312548, "global_step": 320891, "epoch": 2651, "val_loss": 2728983.5} {"train_loss": -44.07900619506836, "global_step": 320892, "epoch": 2652} {"train_loss": -43.9058952331543, "global_step": 320893, "epoch": 2652} {"train_loss": -43.0124626159668, "global_step": 320894, "epoch": 2652} {"train_loss": -44.41916275024414, "global_step": 320895, "epoch": 2652} {"train_loss": -43.98517990112305, "global_step": 320896, "epoch": 2652} {"train_loss": -43.78125762939453, "global_step": 320897, "epoch": 2652} {"train_loss": -43.79444885253906, "global_step": 320898, "epoch": 2652} {"train_loss": -44.247962951660156, "global_step": 320899, "epoch": 2652} {"train_loss": -44.36319351196289, "global_step": 320900, "epoch": 2652} {"train_loss": -44.220001220703125, "global_step": 320901, "epoch": 2652} {"train_loss": -44.59762191772461, "global_step": 320902, "epoch": 2652} {"train_loss": -44.22269821166992, "global_step": 320903, "epoch": 2652} {"train_loss": -44.54269027709961, "global_step": 320904, "epoch": 2652} {"train_loss": -43.937355041503906, "global_step": 320905, "epoch": 2652} {"train_loss": -44.36825180053711, "global_step": 320906, "epoch": 2652} {"train_loss": -44.40654754638672, "global_step": 320907, "epoch": 2652} {"train_loss": -44.529205322265625, "global_step": 320908, "epoch": 2652} {"train_loss": -44.41904830932617, "global_step": 320909, "epoch": 2652} {"train_loss": -44.49174880981445, "global_step": 320910, "epoch": 2652} {"train_loss": -44.52995681762695, "global_step": 320911, "epoch": 2652} {"train_loss": -44.3023796081543, "global_step": 320912, "epoch": 2652} {"train_loss": -44.9385986328125, "global_step": 320913, "epoch": 2652} {"train_loss": -44.78656768798828, "global_step": 320914, "epoch": 2652} {"train_loss": -44.8239860534668, "global_step": 320915, "epoch": 2652} {"train_loss": -44.96034622192383, "global_step": 320916, "epoch": 2652} {"train_loss": -44.90753173828125, "global_step": 320917, "epoch": 2652} {"train_loss": -44.591392517089844, "global_step": 320918, "epoch": 2652} {"train_loss": -44.8408203125, "global_step": 320919, "epoch": 2652} {"train_loss": -45.02239990234375, "global_step": 320920, "epoch": 2652} {"train_loss": -44.91720199584961, "global_step": 320921, "epoch": 2652} {"train_loss": -44.68404769897461, "global_step": 320922, "epoch": 2652} {"train_loss": -45.24998092651367, "global_step": 320923, "epoch": 2652} {"train_loss": -45.24833679199219, "global_step": 320924, "epoch": 2652} {"train_loss": -44.69936752319336, "global_step": 320925, "epoch": 2652} {"train_loss": -45.184749603271484, "global_step": 320926, "epoch": 2652} {"train_loss": -45.395877838134766, "global_step": 320927, "epoch": 2652} {"train_loss": -45.35652542114258, "global_step": 320928, "epoch": 2652} {"train_loss": -45.0183219909668, "global_step": 320929, "epoch": 2652} {"train_loss": -45.05012130737305, "global_step": 320930, "epoch": 2652} {"train_loss": -45.4099006652832, "global_step": 320931, "epoch": 2652} {"train_loss": -45.62496566772461, "global_step": 320932, "epoch": 2652} {"train_loss": -45.51343536376953, "global_step": 320933, "epoch": 2652} {"train_loss": -45.232421875, "global_step": 320934, "epoch": 2652} {"train_loss": -45.63871383666992, "global_step": 320935, "epoch": 2652} {"train_loss": -45.57365798950195, "global_step": 320936, "epoch": 2652} {"train_loss": -44.96026611328125, "global_step": 320937, "epoch": 2652} {"train_loss": -45.26398849487305, "global_step": 320938, "epoch": 2652} {"train_loss": -45.4251823425293, "global_step": 320939, "epoch": 2652} {"train_loss": -45.62095642089844, "global_step": 320940, "epoch": 2652} {"train_loss": -45.085506439208984, "global_step": 320941, "epoch": 2652} {"train_loss": -45.32345199584961, "global_step": 320942, "epoch": 2652} {"train_loss": -45.120330810546875, "global_step": 320943, "epoch": 2652} {"train_loss": -45.537025451660156, "global_step": 320944, "epoch": 2652} {"train_loss": -45.82810974121094, "global_step": 320945, "epoch": 2652} {"train_loss": -45.34379959106445, "global_step": 320946, "epoch": 2652} {"train_loss": -45.50508117675781, "global_step": 320947, "epoch": 2652} {"train_loss": -45.46684646606445, "global_step": 320948, "epoch": 2652} {"train_loss": -45.5452766418457, "global_step": 320949, "epoch": 2652} {"train_loss": -44.57769775390625, "global_step": 320950, "epoch": 2652} {"train_loss": -44.77616882324219, "global_step": 320951, "epoch": 2652} {"train_loss": -45.508182525634766, "global_step": 320952, "epoch": 2652} {"train_loss": -45.35750961303711, "global_step": 320953, "epoch": 2652} {"train_loss": -45.168434143066406, "global_step": 320954, "epoch": 2652} {"train_loss": -44.948936462402344, "global_step": 320955, "epoch": 2652} {"train_loss": -44.66061019897461, "global_step": 320956, "epoch": 2652} {"train_loss": -44.16274642944336, "global_step": 320957, "epoch": 2652} {"train_loss": -43.682701110839844, "global_step": 320958, "epoch": 2652} {"train_loss": -42.92677688598633, "global_step": 320959, "epoch": 2652} {"train_loss": -42.75092697143555, "global_step": 320960, "epoch": 2652} {"train_loss": -44.31919479370117, "global_step": 320961, "epoch": 2652} {"train_loss": -43.1710319519043, "global_step": 320962, "epoch": 2652} {"train_loss": -44.09443664550781, "global_step": 320963, "epoch": 2652} {"train_loss": -44.03527069091797, "global_step": 320964, "epoch": 2652} {"train_loss": -44.85894775390625, "global_step": 320965, "epoch": 2652} {"train_loss": -43.99405288696289, "global_step": 320966, "epoch": 2652} {"train_loss": -43.99037551879883, "global_step": 320967, "epoch": 2652} {"train_loss": -43.40328598022461, "global_step": 320968, "epoch": 2652} {"train_loss": -43.906917572021484, "global_step": 320969, "epoch": 2652} {"train_loss": -44.75348663330078, "global_step": 320970, "epoch": 2652} {"train_loss": -44.42045974731445, "global_step": 320971, "epoch": 2652} {"train_loss": -44.45058059692383, "global_step": 320972, "epoch": 2652} {"train_loss": -45.0030403137207, "global_step": 320973, "epoch": 2652} {"train_loss": -44.204586029052734, "global_step": 320974, "epoch": 2652} {"train_loss": -44.428218841552734, "global_step": 320975, "epoch": 2652} {"train_loss": -45.01019287109375, "global_step": 320976, "epoch": 2652} {"train_loss": -44.10002136230469, "global_step": 320977, "epoch": 2652} {"train_loss": -43.904083251953125, "global_step": 320978, "epoch": 2652} {"train_loss": -44.76884841918945, "global_step": 320979, "epoch": 2652} {"train_loss": -43.90018844604492, "global_step": 320980, "epoch": 2652} {"train_loss": -43.85599899291992, "global_step": 320981, "epoch": 2652} {"train_loss": -44.015953063964844, "global_step": 320982, "epoch": 2652} {"train_loss": -43.82063674926758, "global_step": 320983, "epoch": 2652} {"train_loss": -44.51958084106445, "global_step": 320984, "epoch": 2652} {"train_loss": -43.6615104675293, "global_step": 320985, "epoch": 2652} {"train_loss": -45.135616302490234, "global_step": 320986, "epoch": 2652} {"train_loss": -44.14516067504883, "global_step": 320987, "epoch": 2652} {"train_loss": -44.25307083129883, "global_step": 320988, "epoch": 2652} {"train_loss": -44.51262664794922, "global_step": 320989, "epoch": 2652} {"train_loss": -43.27097702026367, "global_step": 320990, "epoch": 2652} {"train_loss": -44.27740478515625, "global_step": 320991, "epoch": 2652} {"train_loss": -43.13425827026367, "global_step": 320992, "epoch": 2652} {"train_loss": -41.19160079956055, "global_step": 320993, "epoch": 2652} {"train_loss": -42.45551681518555, "global_step": 320994, "epoch": 2652} {"train_loss": -43.008296966552734, "global_step": 320995, "epoch": 2652} {"train_loss": -44.018157958984375, "global_step": 320996, "epoch": 2652} {"train_loss": -43.85517120361328, "global_step": 320997, "epoch": 2652} {"train_loss": -41.69852828979492, "global_step": 320998, "epoch": 2652} {"train_loss": -41.172210693359375, "global_step": 320999, "epoch": 2652} {"train_loss": -42.50715255737305, "global_step": 321000, "epoch": 2652} {"train_loss": -43.417259216308594, "global_step": 321001, "epoch": 2652} {"train_loss": -41.434913635253906, "global_step": 321002, "epoch": 2652} {"train_loss": -41.77610778808594, "global_step": 321003, "epoch": 2652} {"train_loss": -42.985286712646484, "global_step": 321004, "epoch": 2652} {"train_loss": -42.54053497314453, "global_step": 321005, "epoch": 2652} {"train_loss": -40.166748046875, "global_step": 321006, "epoch": 2652} {"train_loss": -43.389835357666016, "global_step": 321007, "epoch": 2652} {"train_loss": -39.696571350097656, "global_step": 321008, "epoch": 2652} {"train_loss": -41.617652893066406, "global_step": 321009, "epoch": 2652} {"train_loss": -42.93502426147461, "global_step": 321010, "epoch": 2652} {"train_loss": -39.5987663269043, "global_step": 321011, "epoch": 2652} {"train_loss": -44.1591850154656, "global_step": 321012, "epoch": 2652, "val_loss": 2495214.75} {"train_loss": -37.836544036865234, "global_step": 321013, "epoch": 2653} {"train_loss": -41.07387924194336, "global_step": 321014, "epoch": 2653} {"train_loss": -39.827205657958984, "global_step": 321015, "epoch": 2653} {"train_loss": -41.083065032958984, "global_step": 321016, "epoch": 2653} {"train_loss": -38.69832992553711, "global_step": 321017, "epoch": 2653} {"train_loss": -42.09352493286133, "global_step": 321018, "epoch": 2653} {"train_loss": -37.20001983642578, "global_step": 321019, "epoch": 2653} {"train_loss": -42.059112548828125, "global_step": 321020, "epoch": 2653} {"train_loss": -39.16654586791992, "global_step": 321021, "epoch": 2653} {"train_loss": -41.0313720703125, "global_step": 321022, "epoch": 2653} {"train_loss": -41.78229904174805, "global_step": 321023, "epoch": 2653} {"train_loss": -40.48890686035156, "global_step": 321024, "epoch": 2653} {"train_loss": -42.04846954345703, "global_step": 321025, "epoch": 2653} {"train_loss": -40.312862396240234, "global_step": 321026, "epoch": 2653} {"train_loss": -42.073204040527344, "global_step": 321027, "epoch": 2653} {"train_loss": -41.2348747253418, "global_step": 321028, "epoch": 2653} {"train_loss": -43.089847564697266, "global_step": 321029, "epoch": 2653} {"train_loss": -41.511043548583984, "global_step": 321030, "epoch": 2653} {"train_loss": -42.8245849609375, "global_step": 321031, "epoch": 2653} {"train_loss": -42.821807861328125, "global_step": 321032, "epoch": 2653} {"train_loss": -42.64459228515625, "global_step": 321033, "epoch": 2653} {"train_loss": -42.995033264160156, "global_step": 321034, "epoch": 2653} {"train_loss": -42.63839340209961, "global_step": 321035, "epoch": 2653} {"train_loss": -43.000003814697266, "global_step": 321036, "epoch": 2653} {"train_loss": -43.26742172241211, "global_step": 321037, "epoch": 2653} {"train_loss": -42.942543029785156, "global_step": 321038, "epoch": 2653} {"train_loss": -43.75025177001953, "global_step": 321039, "epoch": 2653} {"train_loss": -42.88214874267578, "global_step": 321040, "epoch": 2653} {"train_loss": -43.48494338989258, "global_step": 321041, "epoch": 2653} {"train_loss": -43.63798141479492, "global_step": 321042, "epoch": 2653} {"train_loss": -43.593544006347656, "global_step": 321043, "epoch": 2653} {"train_loss": -43.77848434448242, "global_step": 321044, "epoch": 2653} {"train_loss": -43.55683517456055, "global_step": 321045, "epoch": 2653} {"train_loss": -44.295223236083984, "global_step": 321046, "epoch": 2653} {"train_loss": -43.91312026977539, "global_step": 321047, "epoch": 2653} {"train_loss": -44.61953353881836, "global_step": 321048, "epoch": 2653} {"train_loss": -44.26559066772461, "global_step": 321049, "epoch": 2653} {"train_loss": -44.459842681884766, "global_step": 321050, "epoch": 2653} {"train_loss": -44.43911361694336, "global_step": 321051, "epoch": 2653} {"train_loss": -44.4761962890625, "global_step": 321052, "epoch": 2653} {"train_loss": -44.38056945800781, "global_step": 321053, "epoch": 2653} {"train_loss": -44.799476623535156, "global_step": 321054, "epoch": 2653} {"train_loss": -44.8507080078125, "global_step": 321055, "epoch": 2653} {"train_loss": -44.950477600097656, "global_step": 321056, "epoch": 2653} {"train_loss": -44.641334533691406, "global_step": 321057, "epoch": 2653} {"train_loss": -45.4862174987793, "global_step": 321058, "epoch": 2653} {"train_loss": -45.01936721801758, "global_step": 321059, "epoch": 2653} {"train_loss": -44.94026565551758, "global_step": 321060, "epoch": 2653} {"train_loss": -44.93450927734375, "global_step": 321061, "epoch": 2653} {"train_loss": -44.75466537475586, "global_step": 321062, "epoch": 2653} {"train_loss": -45.03640365600586, "global_step": 321063, "epoch": 2653} {"train_loss": -45.01308822631836, "global_step": 321064, "epoch": 2653} {"train_loss": -44.78607940673828, "global_step": 321065, "epoch": 2653} {"train_loss": -45.00775146484375, "global_step": 321066, "epoch": 2653} {"train_loss": -45.07073974609375, "global_step": 321067, "epoch": 2653} {"train_loss": -44.82466506958008, "global_step": 321068, "epoch": 2653} {"train_loss": -44.868812561035156, "global_step": 321069, "epoch": 2653} {"train_loss": -45.43592071533203, "global_step": 321070, "epoch": 2653} {"train_loss": -44.9067497253418, "global_step": 321071, "epoch": 2653} {"train_loss": -45.29643630981445, "global_step": 321072, "epoch": 2653} {"train_loss": -45.08485794067383, "global_step": 321073, "epoch": 2653} {"train_loss": -45.58043670654297, "global_step": 321074, "epoch": 2653} {"train_loss": -44.86517333984375, "global_step": 321075, "epoch": 2653} {"train_loss": -44.7776985168457, "global_step": 321076, "epoch": 2653} {"train_loss": -45.19249725341797, "global_step": 321077, "epoch": 2653} {"train_loss": -45.02196502685547, "global_step": 321078, "epoch": 2653} {"train_loss": -45.323143005371094, "global_step": 321079, "epoch": 2653} {"train_loss": -45.05701446533203, "global_step": 321080, "epoch": 2653} {"train_loss": -45.45347213745117, "global_step": 321081, "epoch": 2653} {"train_loss": -45.20283126831055, "global_step": 321082, "epoch": 2653} {"train_loss": -45.817527770996094, "global_step": 321083, "epoch": 2653} {"train_loss": -45.30420684814453, "global_step": 321084, "epoch": 2653} {"train_loss": -45.79176712036133, "global_step": 321085, "epoch": 2653} {"train_loss": -45.21464920043945, "global_step": 321086, "epoch": 2653} {"train_loss": -45.65104293823242, "global_step": 321087, "epoch": 2653} {"train_loss": -45.12739562988281, "global_step": 321088, "epoch": 2653} {"train_loss": -46.025146484375, "global_step": 321089, "epoch": 2653} {"train_loss": -45.47639083862305, "global_step": 321090, "epoch": 2653} {"train_loss": -45.27040481567383, "global_step": 321091, "epoch": 2653} {"train_loss": -45.35831832885742, "global_step": 321092, "epoch": 2653} {"train_loss": -45.401695251464844, "global_step": 321093, "epoch": 2653} {"train_loss": -45.62284469604492, "global_step": 321094, "epoch": 2653} {"train_loss": -45.0091438293457, "global_step": 321095, "epoch": 2653} {"train_loss": -45.87726593017578, "global_step": 321096, "epoch": 2653} {"train_loss": -45.42930221557617, "global_step": 321097, "epoch": 2653} {"train_loss": -45.47380447387695, "global_step": 321098, "epoch": 2653} {"train_loss": -45.85465621948242, "global_step": 321099, "epoch": 2653} {"train_loss": -45.18936538696289, "global_step": 321100, "epoch": 2653} {"train_loss": -44.97072982788086, "global_step": 321101, "epoch": 2653} {"train_loss": -46.08894348144531, "global_step": 321102, "epoch": 2653} {"train_loss": -45.2293815612793, "global_step": 321103, "epoch": 2653} {"train_loss": -45.49056625366211, "global_step": 321104, "epoch": 2653} {"train_loss": -45.218379974365234, "global_step": 321105, "epoch": 2653} {"train_loss": -44.21958923339844, "global_step": 321106, "epoch": 2653} {"train_loss": -44.67741775512695, "global_step": 321107, "epoch": 2653} {"train_loss": -44.12150192260742, "global_step": 321108, "epoch": 2653} {"train_loss": -44.48490524291992, "global_step": 321109, "epoch": 2653} {"train_loss": -44.2246208190918, "global_step": 321110, "epoch": 2653} {"train_loss": -45.253292083740234, "global_step": 321111, "epoch": 2653} {"train_loss": -45.61894989013672, "global_step": 321112, "epoch": 2653} {"train_loss": -45.05070114135742, "global_step": 321113, "epoch": 2653} {"train_loss": -45.689693450927734, "global_step": 321114, "epoch": 2653} {"train_loss": -45.0903205871582, "global_step": 321115, "epoch": 2653} {"train_loss": -45.0699577331543, "global_step": 321116, "epoch": 2653} {"train_loss": -44.63482666015625, "global_step": 321117, "epoch": 2653} {"train_loss": -44.71049118041992, "global_step": 321118, "epoch": 2653} {"train_loss": -45.108272552490234, "global_step": 321119, "epoch": 2653} {"train_loss": -45.09261703491211, "global_step": 321120, "epoch": 2653} {"train_loss": -44.3730583190918, "global_step": 321121, "epoch": 2653} {"train_loss": -41.672828674316406, "global_step": 321122, "epoch": 2653} {"train_loss": -40.06388473510742, "global_step": 321123, "epoch": 2653} {"train_loss": -43.66701889038086, "global_step": 321124, "epoch": 2653} {"train_loss": -35.12506866455078, "global_step": 321125, "epoch": 2653} {"train_loss": -43.68812561035156, "global_step": 321126, "epoch": 2653} {"train_loss": -36.33960723876953, "global_step": 321127, "epoch": 2653} {"train_loss": -36.12136459350586, "global_step": 321128, "epoch": 2653} {"train_loss": -38.19736862182617, "global_step": 321129, "epoch": 2653} {"train_loss": -39.13151168823242, "global_step": 321130, "epoch": 2653} {"train_loss": -35.098060607910156, "global_step": 321131, "epoch": 2653} {"train_loss": -37.83611297607422, "global_step": 321132, "epoch": 2653} {"train_loss": -43.550154662329305, "global_step": 321133, "epoch": 2653, "val_loss": 2510189.25} {"train_loss": -39.32402420043945, "global_step": 321134, "epoch": 2654} {"train_loss": -40.95662307739258, "global_step": 321135, "epoch": 2654} {"train_loss": -39.81483840942383, "global_step": 321136, "epoch": 2654} {"train_loss": -39.6268424987793, "global_step": 321137, "epoch": 2654} {"train_loss": -39.989070892333984, "global_step": 321138, "epoch": 2654} {"train_loss": -37.9819450378418, "global_step": 321139, "epoch": 2654} {"train_loss": -41.98259353637695, "global_step": 321140, "epoch": 2654} {"train_loss": -39.19471740722656, "global_step": 321141, "epoch": 2654} {"train_loss": -41.40336227416992, "global_step": 321142, "epoch": 2654} {"train_loss": -40.573143005371094, "global_step": 321143, "epoch": 2654} {"train_loss": -41.499691009521484, "global_step": 321144, "epoch": 2654} {"train_loss": -42.18359375, "global_step": 321145, "epoch": 2654} {"train_loss": -40.14498519897461, "global_step": 321146, "epoch": 2654} {"train_loss": -42.595245361328125, "global_step": 321147, "epoch": 2654} {"train_loss": -41.95420837402344, "global_step": 321148, "epoch": 2654} {"train_loss": -41.94184494018555, "global_step": 321149, "epoch": 2654} {"train_loss": -43.502445220947266, "global_step": 321150, "epoch": 2654} {"train_loss": -41.4216423034668, "global_step": 321151, "epoch": 2654} {"train_loss": -42.6741828918457, "global_step": 321152, "epoch": 2654} {"train_loss": -42.53409194946289, "global_step": 321153, "epoch": 2654} {"train_loss": -42.01275634765625, "global_step": 321154, "epoch": 2654} {"train_loss": -43.062984466552734, "global_step": 321155, "epoch": 2654} {"train_loss": -41.5042839050293, "global_step": 321156, "epoch": 2654} {"train_loss": -42.89441680908203, "global_step": 321157, "epoch": 2654} {"train_loss": -42.502445220947266, "global_step": 321158, "epoch": 2654} {"train_loss": -43.391109466552734, "global_step": 321159, "epoch": 2654} {"train_loss": -43.0697021484375, "global_step": 321160, "epoch": 2654} {"train_loss": -43.54359436035156, "global_step": 321161, "epoch": 2654} {"train_loss": -42.99919128417969, "global_step": 321162, "epoch": 2654} {"train_loss": -43.36375045776367, "global_step": 321163, "epoch": 2654} {"train_loss": -43.04762268066406, "global_step": 321164, "epoch": 2654} {"train_loss": -42.915103912353516, "global_step": 321165, "epoch": 2654} {"train_loss": -43.6448860168457, "global_step": 321166, "epoch": 2654} {"train_loss": -43.30527877807617, "global_step": 321167, "epoch": 2654} {"train_loss": -43.050819396972656, "global_step": 321168, "epoch": 2654} {"train_loss": -43.83850860595703, "global_step": 321169, "epoch": 2654} {"train_loss": -43.74237060546875, "global_step": 321170, "epoch": 2654} {"train_loss": -43.7812614440918, "global_step": 321171, "epoch": 2654} {"train_loss": -43.62131881713867, "global_step": 321172, "epoch": 2654} {"train_loss": -43.48560333251953, "global_step": 321173, "epoch": 2654} {"train_loss": -43.65403366088867, "global_step": 321174, "epoch": 2654} {"train_loss": -43.83760452270508, "global_step": 321175, "epoch": 2654} {"train_loss": -43.99750900268555, "global_step": 321176, "epoch": 2654} {"train_loss": -43.89943313598633, "global_step": 321177, "epoch": 2654} {"train_loss": -43.83844757080078, "global_step": 321178, "epoch": 2654} {"train_loss": -44.50046920776367, "global_step": 321179, "epoch": 2654} {"train_loss": -44.22380447387695, "global_step": 321180, "epoch": 2654} {"train_loss": -44.243072509765625, "global_step": 321181, "epoch": 2654} {"train_loss": -44.05335235595703, "global_step": 321182, "epoch": 2654} {"train_loss": -43.95796203613281, "global_step": 321183, "epoch": 2654} {"train_loss": -44.54140090942383, "global_step": 321184, "epoch": 2654} {"train_loss": -43.78601837158203, "global_step": 321185, "epoch": 2654} {"train_loss": -44.053321838378906, "global_step": 321186, "epoch": 2654} {"train_loss": -45.169532775878906, "global_step": 321187, "epoch": 2654} {"train_loss": -44.38248825073242, "global_step": 321188, "epoch": 2654} {"train_loss": -44.45707321166992, "global_step": 321189, "epoch": 2654} {"train_loss": -44.922698974609375, "global_step": 321190, "epoch": 2654} {"train_loss": -44.71094512939453, "global_step": 321191, "epoch": 2654} {"train_loss": -44.98878860473633, "global_step": 321192, "epoch": 2654} {"train_loss": -45.119991302490234, "global_step": 321193, "epoch": 2654} {"train_loss": -44.81484603881836, "global_step": 321194, "epoch": 2654} {"train_loss": -44.87562942504883, "global_step": 321195, "epoch": 2654} {"train_loss": -45.167930603027344, "global_step": 321196, "epoch": 2654} {"train_loss": -44.89633560180664, "global_step": 321197, "epoch": 2654} {"train_loss": -45.47742462158203, "global_step": 321198, "epoch": 2654} {"train_loss": -45.16016387939453, "global_step": 321199, "epoch": 2654} {"train_loss": -45.328765869140625, "global_step": 321200, "epoch": 2654} {"train_loss": -45.27069854736328, "global_step": 321201, "epoch": 2654} {"train_loss": -45.005611419677734, "global_step": 321202, "epoch": 2654} {"train_loss": -45.537208557128906, "global_step": 321203, "epoch": 2654} {"train_loss": -44.903167724609375, "global_step": 321204, "epoch": 2654} {"train_loss": -45.154075622558594, "global_step": 321205, "epoch": 2654} {"train_loss": -45.21113204956055, "global_step": 321206, "epoch": 2654} {"train_loss": -45.16555404663086, "global_step": 321207, "epoch": 2654} {"train_loss": -45.373348236083984, "global_step": 321208, "epoch": 2654} {"train_loss": -45.0499153137207, "global_step": 321209, "epoch": 2654} {"train_loss": -45.65266799926758, "global_step": 321210, "epoch": 2654} {"train_loss": -44.63113021850586, "global_step": 321211, "epoch": 2654} {"train_loss": -44.7844352722168, "global_step": 321212, "epoch": 2654} {"train_loss": -44.58961486816406, "global_step": 321213, "epoch": 2654} {"train_loss": -44.50770950317383, "global_step": 321214, "epoch": 2654} {"train_loss": -42.88558578491211, "global_step": 321215, "epoch": 2654} {"train_loss": -43.500911712646484, "global_step": 321216, "epoch": 2654} {"train_loss": -43.500362396240234, "global_step": 321217, "epoch": 2654} {"train_loss": -42.645442962646484, "global_step": 321218, "epoch": 2654} {"train_loss": -44.238887786865234, "global_step": 321219, "epoch": 2654} {"train_loss": -45.02648162841797, "global_step": 321220, "epoch": 2654} {"train_loss": -44.819496154785156, "global_step": 321221, "epoch": 2654} {"train_loss": -44.803707122802734, "global_step": 321222, "epoch": 2654} {"train_loss": -44.586952209472656, "global_step": 321223, "epoch": 2654} {"train_loss": -45.355438232421875, "global_step": 321224, "epoch": 2654} {"train_loss": -45.12116622924805, "global_step": 321225, "epoch": 2654} {"train_loss": -44.1664924621582, "global_step": 321226, "epoch": 2654} {"train_loss": -44.0556755065918, "global_step": 321227, "epoch": 2654} {"train_loss": -43.022090911865234, "global_step": 321228, "epoch": 2654} {"train_loss": -43.130165100097656, "global_step": 321229, "epoch": 2654} {"train_loss": -44.23556137084961, "global_step": 321230, "epoch": 2654} {"train_loss": -45.521236419677734, "global_step": 321231, "epoch": 2654} {"train_loss": -45.08785629272461, "global_step": 321232, "epoch": 2654} {"train_loss": -44.25263977050781, "global_step": 321233, "epoch": 2654} {"train_loss": -44.73336410522461, "global_step": 321234, "epoch": 2654} {"train_loss": -45.2893180847168, "global_step": 321235, "epoch": 2654} {"train_loss": -44.83723068237305, "global_step": 321236, "epoch": 2654} {"train_loss": -44.20951461791992, "global_step": 321237, "epoch": 2654} {"train_loss": -44.43935012817383, "global_step": 321238, "epoch": 2654} {"train_loss": -45.31142807006836, "global_step": 321239, "epoch": 2654} {"train_loss": -43.94903564453125, "global_step": 321240, "epoch": 2654} {"train_loss": -43.15987014770508, "global_step": 321241, "epoch": 2654} {"train_loss": -44.152496337890625, "global_step": 321242, "epoch": 2654} {"train_loss": -44.77403259277344, "global_step": 321243, "epoch": 2654} {"train_loss": -43.638553619384766, "global_step": 321244, "epoch": 2654} {"train_loss": -43.782142639160156, "global_step": 321245, "epoch": 2654} {"train_loss": -44.17487716674805, "global_step": 321246, "epoch": 2654} {"train_loss": -45.106048583984375, "global_step": 321247, "epoch": 2654} {"train_loss": -44.53253936767578, "global_step": 321248, "epoch": 2654} {"train_loss": -43.721858978271484, "global_step": 321249, "epoch": 2654} {"train_loss": -44.94969177246094, "global_step": 321250, "epoch": 2654} {"train_loss": -45.08620071411133, "global_step": 321251, "epoch": 2654} {"train_loss": -45.52910232543945, "global_step": 321252, "epoch": 2654} {"train_loss": -44.656307220458984, "global_step": 321253, "epoch": 2654} {"train_loss": -43.73226966542646, "global_step": 321254, "epoch": 2654, "val_loss": 2497182.75} {"train_loss": -44.7172966003418, "global_step": 321255, "epoch": 2655} {"train_loss": -44.65813446044922, "global_step": 321256, "epoch": 2655} {"train_loss": -44.73042297363281, "global_step": 321257, "epoch": 2655} {"train_loss": -44.89289474487305, "global_step": 321258, "epoch": 2655} {"train_loss": -44.15303039550781, "global_step": 321259, "epoch": 2655} {"train_loss": -44.212581634521484, "global_step": 321260, "epoch": 2655} {"train_loss": -44.41428756713867, "global_step": 321261, "epoch": 2655} {"train_loss": -44.53736114501953, "global_step": 321262, "epoch": 2655} {"train_loss": -44.612449645996094, "global_step": 321263, "epoch": 2655} {"train_loss": -43.67753982543945, "global_step": 321264, "epoch": 2655} {"train_loss": -43.97502136230469, "global_step": 321265, "epoch": 2655} {"train_loss": -45.30483627319336, "global_step": 321266, "epoch": 2655} {"train_loss": -44.42781448364258, "global_step": 321267, "epoch": 2655} {"train_loss": -44.8778190612793, "global_step": 321268, "epoch": 2655} {"train_loss": -44.994380950927734, "global_step": 321269, "epoch": 2655} {"train_loss": -44.862422943115234, "global_step": 321270, "epoch": 2655} {"train_loss": -45.05585479736328, "global_step": 321271, "epoch": 2655} {"train_loss": -45.054481506347656, "global_step": 321272, "epoch": 2655} {"train_loss": -45.2581901550293, "global_step": 321273, "epoch": 2655} {"train_loss": -45.19858932495117, "global_step": 321274, "epoch": 2655} {"train_loss": -44.98039245605469, "global_step": 321275, "epoch": 2655} {"train_loss": -45.07697677612305, "global_step": 321276, "epoch": 2655} {"train_loss": -44.971656799316406, "global_step": 321277, "epoch": 2655} {"train_loss": -45.05302810668945, "global_step": 321278, "epoch": 2655} {"train_loss": -44.971527099609375, "global_step": 321279, "epoch": 2655} {"train_loss": -45.30647277832031, "global_step": 321280, "epoch": 2655} {"train_loss": -45.42692184448242, "global_step": 321281, "epoch": 2655} {"train_loss": -45.22280502319336, "global_step": 321282, "epoch": 2655} {"train_loss": -45.30127716064453, "global_step": 321283, "epoch": 2655} {"train_loss": -44.651817321777344, "global_step": 321284, "epoch": 2655} {"train_loss": -44.89142990112305, "global_step": 321285, "epoch": 2655} {"train_loss": -44.77687072753906, "global_step": 321286, "epoch": 2655} {"train_loss": -45.07218933105469, "global_step": 321287, "epoch": 2655} {"train_loss": -45.49493408203125, "global_step": 321288, "epoch": 2655} {"train_loss": -45.20219802856445, "global_step": 321289, "epoch": 2655} {"train_loss": -45.23929977416992, "global_step": 321290, "epoch": 2655} {"train_loss": -44.66154098510742, "global_step": 321291, "epoch": 2655} {"train_loss": -44.701873779296875, "global_step": 321292, "epoch": 2655} {"train_loss": -44.75700378417969, "global_step": 321293, "epoch": 2655} {"train_loss": -42.93467330932617, "global_step": 321294, "epoch": 2655} {"train_loss": -44.702980041503906, "global_step": 321295, "epoch": 2655} {"train_loss": -44.569618225097656, "global_step": 321296, "epoch": 2655} {"train_loss": -42.68553924560547, "global_step": 321297, "epoch": 2655} {"train_loss": -41.647396087646484, "global_step": 321298, "epoch": 2655} {"train_loss": -43.791500091552734, "global_step": 321299, "epoch": 2655} {"train_loss": -44.016902923583984, "global_step": 321300, "epoch": 2655} {"train_loss": -43.776180267333984, "global_step": 321301, "epoch": 2655} {"train_loss": -42.1361083984375, "global_step": 321302, "epoch": 2655} {"train_loss": -42.99211502075195, "global_step": 321303, "epoch": 2655} {"train_loss": -43.100013732910156, "global_step": 321304, "epoch": 2655} {"train_loss": -42.418087005615234, "global_step": 321305, "epoch": 2655} {"train_loss": -43.14997482299805, "global_step": 321306, "epoch": 2655} {"train_loss": -43.5201530456543, "global_step": 321307, "epoch": 2655} {"train_loss": -44.26066207885742, "global_step": 321308, "epoch": 2655} {"train_loss": -40.5374641418457, "global_step": 321309, "epoch": 2655} {"train_loss": -40.73869323730469, "global_step": 321310, "epoch": 2655} {"train_loss": -41.56756591796875, "global_step": 321311, "epoch": 2655} {"train_loss": -40.4678840637207, "global_step": 321312, "epoch": 2655} {"train_loss": -41.174156188964844, "global_step": 321313, "epoch": 2655} {"train_loss": -39.78982162475586, "global_step": 321314, "epoch": 2655} {"train_loss": -43.55253219604492, "global_step": 321315, "epoch": 2655} {"train_loss": -41.336483001708984, "global_step": 321316, "epoch": 2655} {"train_loss": -41.71943283081055, "global_step": 321317, "epoch": 2655} {"train_loss": -41.96099853515625, "global_step": 321318, "epoch": 2655} {"train_loss": -41.17871856689453, "global_step": 321319, "epoch": 2655} {"train_loss": -41.88349914550781, "global_step": 321320, "epoch": 2655} {"train_loss": -42.52535629272461, "global_step": 321321, "epoch": 2655} {"train_loss": -41.84220504760742, "global_step": 321322, "epoch": 2655} {"train_loss": -42.90599060058594, "global_step": 321323, "epoch": 2655} {"train_loss": -43.275203704833984, "global_step": 321324, "epoch": 2655} {"train_loss": -42.098960876464844, "global_step": 321325, "epoch": 2655} {"train_loss": -43.61073303222656, "global_step": 321326, "epoch": 2655} {"train_loss": -41.92218780517578, "global_step": 321327, "epoch": 2655} {"train_loss": -43.49433135986328, "global_step": 321328, "epoch": 2655} {"train_loss": -42.69776153564453, "global_step": 321329, "epoch": 2655} {"train_loss": -43.646854400634766, "global_step": 321330, "epoch": 2655} {"train_loss": -43.12672805786133, "global_step": 321331, "epoch": 2655} {"train_loss": -43.10549545288086, "global_step": 321332, "epoch": 2655} {"train_loss": -43.92219161987305, "global_step": 321333, "epoch": 2655} {"train_loss": -43.58347702026367, "global_step": 321334, "epoch": 2655} {"train_loss": -43.64556884765625, "global_step": 321335, "epoch": 2655} {"train_loss": -44.05045700073242, "global_step": 321336, "epoch": 2655} {"train_loss": -43.14699172973633, "global_step": 321337, "epoch": 2655} {"train_loss": -44.31103515625, "global_step": 321338, "epoch": 2655} {"train_loss": -43.89154052734375, "global_step": 321339, "epoch": 2655} {"train_loss": -43.485137939453125, "global_step": 321340, "epoch": 2655} {"train_loss": -44.08039474487305, "global_step": 321341, "epoch": 2655} {"train_loss": -43.93207931518555, "global_step": 321342, "epoch": 2655} {"train_loss": -44.2312126159668, "global_step": 321343, "epoch": 2655} {"train_loss": -44.02322006225586, "global_step": 321344, "epoch": 2655} {"train_loss": -44.04557418823242, "global_step": 321345, "epoch": 2655} {"train_loss": -44.61790084838867, "global_step": 321346, "epoch": 2655} {"train_loss": -44.544647216796875, "global_step": 321347, "epoch": 2655} {"train_loss": -44.50545883178711, "global_step": 321348, "epoch": 2655} {"train_loss": -44.082740783691406, "global_step": 321349, "epoch": 2655} {"train_loss": -44.30522537231445, "global_step": 321350, "epoch": 2655} {"train_loss": -44.71647644042969, "global_step": 321351, "epoch": 2655} {"train_loss": -44.77991485595703, "global_step": 321352, "epoch": 2655} {"train_loss": -44.62112045288086, "global_step": 321353, "epoch": 2655} {"train_loss": -44.70222854614258, "global_step": 321354, "epoch": 2655} {"train_loss": -44.51066970825195, "global_step": 321355, "epoch": 2655} {"train_loss": -44.6203727722168, "global_step": 321356, "epoch": 2655} {"train_loss": -44.40717315673828, "global_step": 321357, "epoch": 2655} {"train_loss": -44.812923431396484, "global_step": 321358, "epoch": 2655} {"train_loss": -44.975135803222656, "global_step": 321359, "epoch": 2655} {"train_loss": -44.40804672241211, "global_step": 321360, "epoch": 2655} {"train_loss": -44.77804183959961, "global_step": 321361, "epoch": 2655} {"train_loss": -44.46746063232422, "global_step": 321362, "epoch": 2655} {"train_loss": -44.47213363647461, "global_step": 321363, "epoch": 2655} {"train_loss": -45.1908073425293, "global_step": 321364, "epoch": 2655} {"train_loss": -44.440711975097656, "global_step": 321365, "epoch": 2655} {"train_loss": -45.01939010620117, "global_step": 321366, "epoch": 2655} {"train_loss": -44.096858978271484, "global_step": 321367, "epoch": 2655} {"train_loss": -45.1850471496582, "global_step": 321368, "epoch": 2655} {"train_loss": -45.26411819458008, "global_step": 321369, "epoch": 2655} {"train_loss": -44.0109748840332, "global_step": 321370, "epoch": 2655} {"train_loss": -45.04460144042969, "global_step": 321371, "epoch": 2655} {"train_loss": -44.739559173583984, "global_step": 321372, "epoch": 2655} {"train_loss": -45.18643569946289, "global_step": 321373, "epoch": 2655} {"train_loss": -44.695613861083984, "global_step": 321374, "epoch": 2655} {"train_loss": -43.964604117653586, "global_step": 321375, "epoch": 2655, "val_loss": 2525391.0} {"train_loss": -45.14559555053711, "global_step": 321376, "epoch": 2656} {"train_loss": -45.3776969909668, "global_step": 321377, "epoch": 2656} {"train_loss": -44.88540267944336, "global_step": 321378, "epoch": 2656} {"train_loss": -45.1243782043457, "global_step": 321379, "epoch": 2656} {"train_loss": -45.33183670043945, "global_step": 321380, "epoch": 2656} {"train_loss": -44.99969482421875, "global_step": 321381, "epoch": 2656} {"train_loss": -45.22842025756836, "global_step": 321382, "epoch": 2656} {"train_loss": -45.01508712768555, "global_step": 321383, "epoch": 2656} {"train_loss": -45.06820297241211, "global_step": 321384, "epoch": 2656} {"train_loss": -44.92433166503906, "global_step": 321385, "epoch": 2656} {"train_loss": -44.85689926147461, "global_step": 321386, "epoch": 2656} {"train_loss": -44.90507507324219, "global_step": 321387, "epoch": 2656} {"train_loss": -44.9556999206543, "global_step": 321388, "epoch": 2656} {"train_loss": -44.366172790527344, "global_step": 321389, "epoch": 2656} {"train_loss": -44.92599105834961, "global_step": 321390, "epoch": 2656} {"train_loss": -45.16402053833008, "global_step": 321391, "epoch": 2656} {"train_loss": -44.78431701660156, "global_step": 321392, "epoch": 2656} {"train_loss": -44.766780853271484, "global_step": 321393, "epoch": 2656} {"train_loss": -44.65418243408203, "global_step": 321394, "epoch": 2656} {"train_loss": -44.36798095703125, "global_step": 321395, "epoch": 2656} {"train_loss": -44.42314147949219, "global_step": 321396, "epoch": 2656} {"train_loss": -44.87258529663086, "global_step": 321397, "epoch": 2656} {"train_loss": -45.383907318115234, "global_step": 321398, "epoch": 2656} {"train_loss": -44.51780319213867, "global_step": 321399, "epoch": 2656} {"train_loss": -44.95808029174805, "global_step": 321400, "epoch": 2656} {"train_loss": -43.964935302734375, "global_step": 321401, "epoch": 2656} {"train_loss": -45.03272247314453, "global_step": 321402, "epoch": 2656} {"train_loss": -44.573665618896484, "global_step": 321403, "epoch": 2656} {"train_loss": -44.9572868347168, "global_step": 321404, "epoch": 2656} {"train_loss": -45.408992767333984, "global_step": 321405, "epoch": 2656} {"train_loss": -44.39864730834961, "global_step": 321406, "epoch": 2656} {"train_loss": -44.4898796081543, "global_step": 321407, "epoch": 2656} {"train_loss": -45.0233039855957, "global_step": 321408, "epoch": 2656} {"train_loss": -44.71830368041992, "global_step": 321409, "epoch": 2656} {"train_loss": -44.65507888793945, "global_step": 321410, "epoch": 2656} {"train_loss": -44.27715301513672, "global_step": 321411, "epoch": 2656} {"train_loss": -44.651737213134766, "global_step": 321412, "epoch": 2656} {"train_loss": -44.01749801635742, "global_step": 321413, "epoch": 2656} {"train_loss": -43.741024017333984, "global_step": 321414, "epoch": 2656} {"train_loss": -43.077857971191406, "global_step": 321415, "epoch": 2656} {"train_loss": -42.69346237182617, "global_step": 321416, "epoch": 2656} {"train_loss": -43.14820098876953, "global_step": 321417, "epoch": 2656} {"train_loss": -44.29582595825195, "global_step": 321418, "epoch": 2656} {"train_loss": -44.30322265625, "global_step": 321419, "epoch": 2656} {"train_loss": -44.599308013916016, "global_step": 321420, "epoch": 2656} {"train_loss": -44.66167449951172, "global_step": 321421, "epoch": 2656} {"train_loss": -44.942527770996094, "global_step": 321422, "epoch": 2656} {"train_loss": -44.185543060302734, "global_step": 321423, "epoch": 2656} {"train_loss": -45.21406936645508, "global_step": 321424, "epoch": 2656} {"train_loss": -44.1599235534668, "global_step": 321425, "epoch": 2656} {"train_loss": -45.04880905151367, "global_step": 321426, "epoch": 2656} {"train_loss": -44.72859191894531, "global_step": 321427, "epoch": 2656} {"train_loss": -44.679359436035156, "global_step": 321428, "epoch": 2656} {"train_loss": -45.207923889160156, "global_step": 321429, "epoch": 2656} {"train_loss": -44.99983215332031, "global_step": 321430, "epoch": 2656} {"train_loss": -44.296077728271484, "global_step": 321431, "epoch": 2656} {"train_loss": -44.23945999145508, "global_step": 321432, "epoch": 2656} {"train_loss": -44.25225067138672, "global_step": 321433, "epoch": 2656} {"train_loss": -44.82761764526367, "global_step": 321434, "epoch": 2656} {"train_loss": -44.61089324951172, "global_step": 321435, "epoch": 2656} {"train_loss": -43.55149459838867, "global_step": 321436, "epoch": 2656} {"train_loss": -43.578250885009766, "global_step": 321437, "epoch": 2656} {"train_loss": -44.60146713256836, "global_step": 321438, "epoch": 2656} {"train_loss": -44.27848434448242, "global_step": 321439, "epoch": 2656} {"train_loss": -43.5117073059082, "global_step": 321440, "epoch": 2656} {"train_loss": -44.27552032470703, "global_step": 321441, "epoch": 2656} {"train_loss": -44.22230911254883, "global_step": 321442, "epoch": 2656} {"train_loss": -44.512508392333984, "global_step": 321443, "epoch": 2656} {"train_loss": -44.14371871948242, "global_step": 321444, "epoch": 2656} {"train_loss": -43.26679992675781, "global_step": 321445, "epoch": 2656} {"train_loss": -41.63638687133789, "global_step": 321446, "epoch": 2656} {"train_loss": -43.316566467285156, "global_step": 321447, "epoch": 2656} {"train_loss": -44.11790084838867, "global_step": 321448, "epoch": 2656} {"train_loss": -42.60035705566406, "global_step": 321449, "epoch": 2656} {"train_loss": -44.64501953125, "global_step": 321450, "epoch": 2656} {"train_loss": -45.24250030517578, "global_step": 321451, "epoch": 2656} {"train_loss": -44.052711486816406, "global_step": 321452, "epoch": 2656} {"train_loss": -44.425724029541016, "global_step": 321453, "epoch": 2656} {"train_loss": -44.88495635986328, "global_step": 321454, "epoch": 2656} {"train_loss": -44.4828987121582, "global_step": 321455, "epoch": 2656} {"train_loss": -44.001251220703125, "global_step": 321456, "epoch": 2656} {"train_loss": -44.5067024230957, "global_step": 321457, "epoch": 2656} {"train_loss": -43.682586669921875, "global_step": 321458, "epoch": 2656} {"train_loss": -43.41787338256836, "global_step": 321459, "epoch": 2656} {"train_loss": -43.06184768676758, "global_step": 321460, "epoch": 2656} {"train_loss": -42.785152435302734, "global_step": 321461, "epoch": 2656} {"train_loss": -43.97310256958008, "global_step": 321462, "epoch": 2656} {"train_loss": -43.779964447021484, "global_step": 321463, "epoch": 2656} {"train_loss": -42.40021514892578, "global_step": 321464, "epoch": 2656} {"train_loss": -42.04941177368164, "global_step": 321465, "epoch": 2656} {"train_loss": -44.182273864746094, "global_step": 321466, "epoch": 2656} {"train_loss": -42.5802001953125, "global_step": 321467, "epoch": 2656} {"train_loss": -44.37656784057617, "global_step": 321468, "epoch": 2656} {"train_loss": -42.68081283569336, "global_step": 321469, "epoch": 2656} {"train_loss": -44.07599639892578, "global_step": 321470, "epoch": 2656} {"train_loss": -42.7293586730957, "global_step": 321471, "epoch": 2656} {"train_loss": -43.295013427734375, "global_step": 321472, "epoch": 2656} {"train_loss": -43.25542449951172, "global_step": 321473, "epoch": 2656} {"train_loss": -43.681968688964844, "global_step": 321474, "epoch": 2656} {"train_loss": -44.014827728271484, "global_step": 321475, "epoch": 2656} {"train_loss": -43.907955169677734, "global_step": 321476, "epoch": 2656} {"train_loss": -44.22892379760742, "global_step": 321477, "epoch": 2656} {"train_loss": -43.28205871582031, "global_step": 321478, "epoch": 2656} {"train_loss": -43.6728401184082, "global_step": 321479, "epoch": 2656} {"train_loss": -43.75152587890625, "global_step": 321480, "epoch": 2656} {"train_loss": -43.12172317504883, "global_step": 321481, "epoch": 2656} {"train_loss": -44.39803695678711, "global_step": 321482, "epoch": 2656} {"train_loss": -44.209754943847656, "global_step": 321483, "epoch": 2656} {"train_loss": -43.125301361083984, "global_step": 321484, "epoch": 2656} {"train_loss": -44.52114486694336, "global_step": 321485, "epoch": 2656} {"train_loss": -42.325870513916016, "global_step": 321486, "epoch": 2656} {"train_loss": -43.96843719482422, "global_step": 321487, "epoch": 2656} {"train_loss": -42.22766876220703, "global_step": 321488, "epoch": 2656} {"train_loss": -42.39483642578125, "global_step": 321489, "epoch": 2656} {"train_loss": -43.396324157714844, "global_step": 321490, "epoch": 2656} {"train_loss": -42.70246505737305, "global_step": 321491, "epoch": 2656} {"train_loss": -43.44730758666992, "global_step": 321492, "epoch": 2656} {"train_loss": -41.51939392089844, "global_step": 321493, "epoch": 2656} {"train_loss": -44.3013916015625, "global_step": 321494, "epoch": 2656} {"train_loss": -41.597660064697266, "global_step": 321495, "epoch": 2656} {"train_loss": -44.09984222916532, "global_step": 321496, "epoch": 2656, "val_loss": 2479004.75} {"train_loss": -41.408103942871094, "global_step": 321497, "epoch": 2657} {"train_loss": -40.96610641479492, "global_step": 321498, "epoch": 2657} {"train_loss": -43.48560333251953, "global_step": 321499, "epoch": 2657} {"train_loss": -42.37311553955078, "global_step": 321500, "epoch": 2657} {"train_loss": -42.331390380859375, "global_step": 321501, "epoch": 2657} {"train_loss": -43.692684173583984, "global_step": 321502, "epoch": 2657} {"train_loss": -43.20135498046875, "global_step": 321503, "epoch": 2657} {"train_loss": -43.548561096191406, "global_step": 321504, "epoch": 2657} {"train_loss": -43.55803298950195, "global_step": 321505, "epoch": 2657} {"train_loss": -43.43552780151367, "global_step": 321506, "epoch": 2657} {"train_loss": -42.40492630004883, "global_step": 321507, "epoch": 2657} {"train_loss": -42.774925231933594, "global_step": 321508, "epoch": 2657} {"train_loss": -43.11581039428711, "global_step": 321509, "epoch": 2657} {"train_loss": -43.045589447021484, "global_step": 321510, "epoch": 2657} {"train_loss": -43.80784225463867, "global_step": 321511, "epoch": 2657} {"train_loss": -42.71931076049805, "global_step": 321512, "epoch": 2657} {"train_loss": -43.62255859375, "global_step": 321513, "epoch": 2657} {"train_loss": -43.501075744628906, "global_step": 321514, "epoch": 2657} {"train_loss": -43.054443359375, "global_step": 321515, "epoch": 2657} {"train_loss": -44.270530700683594, "global_step": 321516, "epoch": 2657} {"train_loss": -42.841888427734375, "global_step": 321517, "epoch": 2657} {"train_loss": -44.46371078491211, "global_step": 321518, "epoch": 2657} {"train_loss": -43.82572555541992, "global_step": 321519, "epoch": 2657} {"train_loss": -44.28498458862305, "global_step": 321520, "epoch": 2657} {"train_loss": -43.20002365112305, "global_step": 321521, "epoch": 2657} {"train_loss": -43.792110443115234, "global_step": 321522, "epoch": 2657} {"train_loss": -43.889034271240234, "global_step": 321523, "epoch": 2657} {"train_loss": -43.62351608276367, "global_step": 321524, "epoch": 2657} {"train_loss": -43.98707580566406, "global_step": 321525, "epoch": 2657} {"train_loss": -43.611392974853516, "global_step": 321526, "epoch": 2657} {"train_loss": -44.62153244018555, "global_step": 321527, "epoch": 2657} {"train_loss": -43.32818603515625, "global_step": 321528, "epoch": 2657} {"train_loss": -44.29751205444336, "global_step": 321529, "epoch": 2657} {"train_loss": -44.773834228515625, "global_step": 321530, "epoch": 2657} {"train_loss": -44.14321517944336, "global_step": 321531, "epoch": 2657} {"train_loss": -44.00699996948242, "global_step": 321532, "epoch": 2657} {"train_loss": -44.72538375854492, "global_step": 321533, "epoch": 2657} {"train_loss": -44.1333122253418, "global_step": 321534, "epoch": 2657} {"train_loss": -43.32353973388672, "global_step": 321535, "epoch": 2657} {"train_loss": -44.75598907470703, "global_step": 321536, "epoch": 2657} {"train_loss": -44.3322868347168, "global_step": 321537, "epoch": 2657} {"train_loss": -44.20872116088867, "global_step": 321538, "epoch": 2657} {"train_loss": -43.9735221862793, "global_step": 321539, "epoch": 2657} {"train_loss": -44.14488220214844, "global_step": 321540, "epoch": 2657} {"train_loss": -44.77961730957031, "global_step": 321541, "epoch": 2657} {"train_loss": -43.51485824584961, "global_step": 321542, "epoch": 2657} {"train_loss": -45.04914474487305, "global_step": 321543, "epoch": 2657} {"train_loss": -44.048458099365234, "global_step": 321544, "epoch": 2657} {"train_loss": -44.960166931152344, "global_step": 321545, "epoch": 2657} {"train_loss": -44.2536506652832, "global_step": 321546, "epoch": 2657} {"train_loss": -44.89349365234375, "global_step": 321547, "epoch": 2657} {"train_loss": -44.47495651245117, "global_step": 321548, "epoch": 2657} {"train_loss": -45.20747756958008, "global_step": 321549, "epoch": 2657} {"train_loss": -44.38452911376953, "global_step": 321550, "epoch": 2657} {"train_loss": -45.07605743408203, "global_step": 321551, "epoch": 2657} {"train_loss": -44.75966262817383, "global_step": 321552, "epoch": 2657} {"train_loss": -44.72159194946289, "global_step": 321553, "epoch": 2657} {"train_loss": -45.39187240600586, "global_step": 321554, "epoch": 2657} {"train_loss": -45.08126449584961, "global_step": 321555, "epoch": 2657} {"train_loss": -45.34926223754883, "global_step": 321556, "epoch": 2657} {"train_loss": -44.8230094909668, "global_step": 321557, "epoch": 2657} {"train_loss": -45.257816314697266, "global_step": 321558, "epoch": 2657} {"train_loss": -44.637535095214844, "global_step": 321559, "epoch": 2657} {"train_loss": -45.39259338378906, "global_step": 321560, "epoch": 2657} {"train_loss": -45.36968994140625, "global_step": 321561, "epoch": 2657} {"train_loss": -45.058837890625, "global_step": 321562, "epoch": 2657} {"train_loss": -45.51292037963867, "global_step": 321563, "epoch": 2657} {"train_loss": -45.324275970458984, "global_step": 321564, "epoch": 2657} {"train_loss": -44.600399017333984, "global_step": 321565, "epoch": 2657} {"train_loss": -45.482460021972656, "global_step": 321566, "epoch": 2657} {"train_loss": -45.28754425048828, "global_step": 321567, "epoch": 2657} {"train_loss": -45.61528015136719, "global_step": 321568, "epoch": 2657} {"train_loss": -45.13463592529297, "global_step": 321569, "epoch": 2657} {"train_loss": -45.46363067626953, "global_step": 321570, "epoch": 2657} {"train_loss": -45.60246658325195, "global_step": 321571, "epoch": 2657} {"train_loss": -45.29071807861328, "global_step": 321572, "epoch": 2657} {"train_loss": -45.528533935546875, "global_step": 321573, "epoch": 2657} {"train_loss": -45.28540802001953, "global_step": 321574, "epoch": 2657} {"train_loss": -44.947689056396484, "global_step": 321575, "epoch": 2657} {"train_loss": -43.56863021850586, "global_step": 321576, "epoch": 2657} {"train_loss": -40.08960723876953, "global_step": 321577, "epoch": 2657} {"train_loss": -42.025142669677734, "global_step": 321578, "epoch": 2657} {"train_loss": -43.84393310546875, "global_step": 321579, "epoch": 2657} {"train_loss": -43.74901580810547, "global_step": 321580, "epoch": 2657} {"train_loss": -40.455909729003906, "global_step": 321581, "epoch": 2657} {"train_loss": -44.54191207885742, "global_step": 321582, "epoch": 2657} {"train_loss": -42.123268127441406, "global_step": 321583, "epoch": 2657} {"train_loss": -41.96599197387695, "global_step": 321584, "epoch": 2657} {"train_loss": -44.24980545043945, "global_step": 321585, "epoch": 2657} {"train_loss": -42.70025634765625, "global_step": 321586, "epoch": 2657} {"train_loss": -41.687076568603516, "global_step": 321587, "epoch": 2657} {"train_loss": -42.50191879272461, "global_step": 321588, "epoch": 2657} {"train_loss": -38.3673095703125, "global_step": 321589, "epoch": 2657} {"train_loss": -39.5890007019043, "global_step": 321590, "epoch": 2657} {"train_loss": -40.93044662475586, "global_step": 321591, "epoch": 2657} {"train_loss": -39.03532791137695, "global_step": 321592, "epoch": 2657} {"train_loss": -42.19281005859375, "global_step": 321593, "epoch": 2657} {"train_loss": -42.00582504272461, "global_step": 321594, "epoch": 2657} {"train_loss": -43.17610168457031, "global_step": 321595, "epoch": 2657} {"train_loss": -42.01858139038086, "global_step": 321596, "epoch": 2657} {"train_loss": -41.584651947021484, "global_step": 321597, "epoch": 2657} {"train_loss": -41.30281448364258, "global_step": 321598, "epoch": 2657} {"train_loss": -42.9094352722168, "global_step": 321599, "epoch": 2657} {"train_loss": -39.33602523803711, "global_step": 321600, "epoch": 2657} {"train_loss": -42.07139205932617, "global_step": 321601, "epoch": 2657} {"train_loss": -42.93061447143555, "global_step": 321602, "epoch": 2657} {"train_loss": -41.91706466674805, "global_step": 321603, "epoch": 2657} {"train_loss": -43.18880844116211, "global_step": 321604, "epoch": 2657} {"train_loss": -43.1768798828125, "global_step": 321605, "epoch": 2657} {"train_loss": -43.120235443115234, "global_step": 321606, "epoch": 2657} {"train_loss": -42.73220443725586, "global_step": 321607, "epoch": 2657} {"train_loss": -43.2802619934082, "global_step": 321608, "epoch": 2657} {"train_loss": -41.23009490966797, "global_step": 321609, "epoch": 2657} {"train_loss": -42.994300842285156, "global_step": 321610, "epoch": 2657} {"train_loss": -40.93263244628906, "global_step": 321611, "epoch": 2657} {"train_loss": -41.11170959472656, "global_step": 321612, "epoch": 2657} {"train_loss": -42.03780746459961, "global_step": 321613, "epoch": 2657} {"train_loss": -42.52669906616211, "global_step": 321614, "epoch": 2657} {"train_loss": -40.9459114074707, "global_step": 321615, "epoch": 2657} {"train_loss": -40.978668212890625, "global_step": 321616, "epoch": 2657} {"train_loss": -43.4432480867244, "global_step": 321617, "epoch": 2657, "val_loss": 2532514.5} {"train_loss": -40.73380661010742, "global_step": 321618, "epoch": 2658} {"train_loss": -41.330718994140625, "global_step": 321619, "epoch": 2658} {"train_loss": -40.694610595703125, "global_step": 321620, "epoch": 2658} {"train_loss": -40.79850387573242, "global_step": 321621, "epoch": 2658} {"train_loss": -42.60219955444336, "global_step": 321622, "epoch": 2658} {"train_loss": -40.07146072387695, "global_step": 321623, "epoch": 2658} {"train_loss": -40.685943603515625, "global_step": 321624, "epoch": 2658} {"train_loss": -40.747432708740234, "global_step": 321625, "epoch": 2658} {"train_loss": -41.7276611328125, "global_step": 321626, "epoch": 2658} {"train_loss": -40.47061538696289, "global_step": 321627, "epoch": 2658} {"train_loss": -40.032569885253906, "global_step": 321628, "epoch": 2658} {"train_loss": -42.44392776489258, "global_step": 321629, "epoch": 2658} {"train_loss": -42.27604293823242, "global_step": 321630, "epoch": 2658} {"train_loss": -40.75098419189453, "global_step": 321631, "epoch": 2658} {"train_loss": -40.87917709350586, "global_step": 321632, "epoch": 2658} {"train_loss": -42.55916213989258, "global_step": 321633, "epoch": 2658} {"train_loss": -42.23377227783203, "global_step": 321634, "epoch": 2658} {"train_loss": -39.10795211791992, "global_step": 321635, "epoch": 2658} {"train_loss": -39.729957580566406, "global_step": 321636, "epoch": 2658} {"train_loss": -41.17487716674805, "global_step": 321637, "epoch": 2658} {"train_loss": -42.87359619140625, "global_step": 321638, "epoch": 2658} {"train_loss": -41.42866516113281, "global_step": 321639, "epoch": 2658} {"train_loss": -40.870269775390625, "global_step": 321640, "epoch": 2658} {"train_loss": -37.56205368041992, "global_step": 321641, "epoch": 2658} {"train_loss": -42.04710388183594, "global_step": 321642, "epoch": 2658} {"train_loss": -41.850250244140625, "global_step": 321643, "epoch": 2658} {"train_loss": -42.71855545043945, "global_step": 321644, "epoch": 2658} {"train_loss": -41.405296325683594, "global_step": 321645, "epoch": 2658} {"train_loss": -42.34340286254883, "global_step": 321646, "epoch": 2658} {"train_loss": -41.23378372192383, "global_step": 321647, "epoch": 2658} {"train_loss": -42.09534454345703, "global_step": 321648, "epoch": 2658} {"train_loss": -42.581912994384766, "global_step": 321649, "epoch": 2658} {"train_loss": -42.675537109375, "global_step": 321650, "epoch": 2658} {"train_loss": -38.550594329833984, "global_step": 321651, "epoch": 2658} {"train_loss": -43.12043380737305, "global_step": 321652, "epoch": 2658} {"train_loss": -43.382850646972656, "global_step": 321653, "epoch": 2658} {"train_loss": -40.149898529052734, "global_step": 321654, "epoch": 2658} {"train_loss": -43.04527282714844, "global_step": 321655, "epoch": 2658} {"train_loss": -42.604103088378906, "global_step": 321656, "epoch": 2658} {"train_loss": -42.63901901245117, "global_step": 321657, "epoch": 2658} {"train_loss": -42.16352462768555, "global_step": 321658, "epoch": 2658} {"train_loss": -41.19487380981445, "global_step": 321659, "epoch": 2658} {"train_loss": -43.48897933959961, "global_step": 321660, "epoch": 2658} {"train_loss": -40.172271728515625, "global_step": 321661, "epoch": 2658} {"train_loss": -43.7520866394043, "global_step": 321662, "epoch": 2658} {"train_loss": -43.177520751953125, "global_step": 321663, "epoch": 2658} {"train_loss": -40.928340911865234, "global_step": 321664, "epoch": 2658} {"train_loss": -43.28764724731445, "global_step": 321665, "epoch": 2658} {"train_loss": -43.28501510620117, "global_step": 321666, "epoch": 2658} {"train_loss": -42.755226135253906, "global_step": 321667, "epoch": 2658} {"train_loss": -43.63269805908203, "global_step": 321668, "epoch": 2658} {"train_loss": -41.48794174194336, "global_step": 321669, "epoch": 2658} {"train_loss": -42.74506759643555, "global_step": 321670, "epoch": 2658} {"train_loss": -41.39967727661133, "global_step": 321671, "epoch": 2658} {"train_loss": -43.03953170776367, "global_step": 321672, "epoch": 2658} {"train_loss": -43.64988327026367, "global_step": 321673, "epoch": 2658} {"train_loss": -43.03338623046875, "global_step": 321674, "epoch": 2658} {"train_loss": -43.15047073364258, "global_step": 321675, "epoch": 2658} {"train_loss": -41.917930603027344, "global_step": 321676, "epoch": 2658} {"train_loss": -43.32179260253906, "global_step": 321677, "epoch": 2658} {"train_loss": -43.36693572998047, "global_step": 321678, "epoch": 2658} {"train_loss": -42.8230094909668, "global_step": 321679, "epoch": 2658} {"train_loss": -43.00895309448242, "global_step": 321680, "epoch": 2658} {"train_loss": -43.7086296081543, "global_step": 321681, "epoch": 2658} {"train_loss": -43.710086822509766, "global_step": 321682, "epoch": 2658} {"train_loss": -40.90425491333008, "global_step": 321683, "epoch": 2658} {"train_loss": -43.18951416015625, "global_step": 321684, "epoch": 2658} {"train_loss": -43.078548431396484, "global_step": 321685, "epoch": 2658} {"train_loss": -43.808902740478516, "global_step": 321686, "epoch": 2658} {"train_loss": -44.25248336791992, "global_step": 321687, "epoch": 2658} {"train_loss": -44.0501708984375, "global_step": 321688, "epoch": 2658} {"train_loss": -44.22246170043945, "global_step": 321689, "epoch": 2658} {"train_loss": -43.344512939453125, "global_step": 321690, "epoch": 2658} {"train_loss": -43.89106750488281, "global_step": 321691, "epoch": 2658} {"train_loss": -43.52059555053711, "global_step": 321692, "epoch": 2658} {"train_loss": -43.7109489440918, "global_step": 321693, "epoch": 2658} {"train_loss": -43.010738372802734, "global_step": 321694, "epoch": 2658} {"train_loss": -44.26395797729492, "global_step": 321695, "epoch": 2658} {"train_loss": -44.012874603271484, "global_step": 321696, "epoch": 2658} {"train_loss": -44.308692932128906, "global_step": 321697, "epoch": 2658} {"train_loss": -42.72697830200195, "global_step": 321698, "epoch": 2658} {"train_loss": -43.907283782958984, "global_step": 321699, "epoch": 2658} {"train_loss": -41.153907775878906, "global_step": 321700, "epoch": 2658} {"train_loss": -44.09749221801758, "global_step": 321701, "epoch": 2658} {"train_loss": -42.072444915771484, "global_step": 321702, "epoch": 2658} {"train_loss": -44.002010345458984, "global_step": 321703, "epoch": 2658} {"train_loss": -44.42953109741211, "global_step": 321704, "epoch": 2658} {"train_loss": -44.42905807495117, "global_step": 321705, "epoch": 2658} {"train_loss": -43.92314910888672, "global_step": 321706, "epoch": 2658} {"train_loss": -44.315982818603516, "global_step": 321707, "epoch": 2658} {"train_loss": -44.12588882446289, "global_step": 321708, "epoch": 2658} {"train_loss": -44.3395881652832, "global_step": 321709, "epoch": 2658} {"train_loss": -44.71918869018555, "global_step": 321710, "epoch": 2658} {"train_loss": -44.23081588745117, "global_step": 321711, "epoch": 2658} {"train_loss": -44.75333023071289, "global_step": 321712, "epoch": 2658} {"train_loss": -44.479896545410156, "global_step": 321713, "epoch": 2658} {"train_loss": -44.75368118286133, "global_step": 321714, "epoch": 2658} {"train_loss": -44.6449089050293, "global_step": 321715, "epoch": 2658} {"train_loss": -44.6942253112793, "global_step": 321716, "epoch": 2658} {"train_loss": -44.99699783325195, "global_step": 321717, "epoch": 2658} {"train_loss": -44.38187026977539, "global_step": 321718, "epoch": 2658} {"train_loss": -44.78654098510742, "global_step": 321719, "epoch": 2658} {"train_loss": -44.84688186645508, "global_step": 321720, "epoch": 2658} {"train_loss": -44.5848503112793, "global_step": 321721, "epoch": 2658} {"train_loss": -45.292755126953125, "global_step": 321722, "epoch": 2658} {"train_loss": -44.27012634277344, "global_step": 321723, "epoch": 2658} {"train_loss": -44.952171325683594, "global_step": 321724, "epoch": 2658} {"train_loss": -45.105037689208984, "global_step": 321725, "epoch": 2658} {"train_loss": -45.014923095703125, "global_step": 321726, "epoch": 2658} {"train_loss": -44.72941207885742, "global_step": 321727, "epoch": 2658} {"train_loss": -45.094661712646484, "global_step": 321728, "epoch": 2658} {"train_loss": -45.04302215576172, "global_step": 321729, "epoch": 2658} {"train_loss": -44.72959518432617, "global_step": 321730, "epoch": 2658} {"train_loss": -45.05663299560547, "global_step": 321731, "epoch": 2658} {"train_loss": -42.89005661010742, "global_step": 321732, "epoch": 2658} {"train_loss": -45.166297912597656, "global_step": 321733, "epoch": 2658} {"train_loss": -44.657833099365234, "global_step": 321734, "epoch": 2658} {"train_loss": -44.3641471862793, "global_step": 321735, "epoch": 2658} {"train_loss": -45.245582580566406, "global_step": 321736, "epoch": 2658} {"train_loss": -45.25392532348633, "global_step": 321737, "epoch": 2658} {"train_loss": -42.96885214561273, "global_step": 321738, "epoch": 2658, "val_loss": 2568870.5} {"train_loss": -45.23430633544922, "global_step": 321739, "epoch": 2659} {"train_loss": -44.69673538208008, "global_step": 321740, "epoch": 2659} {"train_loss": -44.35846710205078, "global_step": 321741, "epoch": 2659} {"train_loss": -45.30135726928711, "global_step": 321742, "epoch": 2659} {"train_loss": -44.946075439453125, "global_step": 321743, "epoch": 2659} {"train_loss": -45.25881576538086, "global_step": 321744, "epoch": 2659} {"train_loss": -44.343318939208984, "global_step": 321745, "epoch": 2659} {"train_loss": -44.979766845703125, "global_step": 321746, "epoch": 2659} {"train_loss": -45.04928970336914, "global_step": 321747, "epoch": 2659} {"train_loss": -44.52387619018555, "global_step": 321748, "epoch": 2659} {"train_loss": -44.11342239379883, "global_step": 321749, "epoch": 2659} {"train_loss": -43.45124435424805, "global_step": 321750, "epoch": 2659} {"train_loss": -44.55085754394531, "global_step": 321751, "epoch": 2659} {"train_loss": -44.57695770263672, "global_step": 321752, "epoch": 2659} {"train_loss": -44.43043899536133, "global_step": 321753, "epoch": 2659} {"train_loss": -42.06597900390625, "global_step": 321754, "epoch": 2659} {"train_loss": -40.64106369018555, "global_step": 321755, "epoch": 2659} {"train_loss": -41.193172454833984, "global_step": 321756, "epoch": 2659} {"train_loss": -41.65791320800781, "global_step": 321757, "epoch": 2659} {"train_loss": -39.48214340209961, "global_step": 321758, "epoch": 2659} {"train_loss": -40.766456604003906, "global_step": 321759, "epoch": 2659} {"train_loss": -40.14200973510742, "global_step": 321760, "epoch": 2659} {"train_loss": -40.568660736083984, "global_step": 321761, "epoch": 2659} {"train_loss": -42.53365707397461, "global_step": 321762, "epoch": 2659} {"train_loss": -41.659088134765625, "global_step": 321763, "epoch": 2659} {"train_loss": -41.206390380859375, "global_step": 321764, "epoch": 2659} {"train_loss": -41.666290283203125, "global_step": 321765, "epoch": 2659} {"train_loss": -44.10232162475586, "global_step": 321766, "epoch": 2659} {"train_loss": -42.2863883972168, "global_step": 321767, "epoch": 2659} {"train_loss": -42.67655944824219, "global_step": 321768, "epoch": 2659} {"train_loss": -43.13359451293945, "global_step": 321769, "epoch": 2659} {"train_loss": -42.41494369506836, "global_step": 321770, "epoch": 2659} {"train_loss": -43.33137130737305, "global_step": 321771, "epoch": 2659} {"train_loss": -42.35094451904297, "global_step": 321772, "epoch": 2659} {"train_loss": -43.074989318847656, "global_step": 321773, "epoch": 2659} {"train_loss": -43.66340255737305, "global_step": 321774, "epoch": 2659} {"train_loss": -42.55305480957031, "global_step": 321775, "epoch": 2659} {"train_loss": -41.12175369262695, "global_step": 321776, "epoch": 2659} {"train_loss": -43.56464385986328, "global_step": 321777, "epoch": 2659} {"train_loss": -43.06936264038086, "global_step": 321778, "epoch": 2659} {"train_loss": -42.17229080200195, "global_step": 321779, "epoch": 2659} {"train_loss": -42.98811721801758, "global_step": 321780, "epoch": 2659} {"train_loss": -43.29262924194336, "global_step": 321781, "epoch": 2659} {"train_loss": -42.66106414794922, "global_step": 321782, "epoch": 2659} {"train_loss": -42.83453369140625, "global_step": 321783, "epoch": 2659} {"train_loss": -44.08015823364258, "global_step": 321784, "epoch": 2659} {"train_loss": -42.51472854614258, "global_step": 321785, "epoch": 2659} {"train_loss": -42.99396896362305, "global_step": 321786, "epoch": 2659} {"train_loss": -42.91481018066406, "global_step": 321787, "epoch": 2659} {"train_loss": -42.92577362060547, "global_step": 321788, "epoch": 2659} {"train_loss": -44.06414794921875, "global_step": 321789, "epoch": 2659} {"train_loss": -43.39603805541992, "global_step": 321790, "epoch": 2659} {"train_loss": -43.53213119506836, "global_step": 321791, "epoch": 2659} {"train_loss": -43.102577209472656, "global_step": 321792, "epoch": 2659} {"train_loss": -43.843841552734375, "global_step": 321793, "epoch": 2659} {"train_loss": -43.38167190551758, "global_step": 321794, "epoch": 2659} {"train_loss": -43.59708786010742, "global_step": 321795, "epoch": 2659} {"train_loss": -43.303367614746094, "global_step": 321796, "epoch": 2659} {"train_loss": -42.769805908203125, "global_step": 321797, "epoch": 2659} {"train_loss": -44.114620208740234, "global_step": 321798, "epoch": 2659} {"train_loss": -43.4437255859375, "global_step": 321799, "epoch": 2659} {"train_loss": -42.91462326049805, "global_step": 321800, "epoch": 2659} {"train_loss": -43.569374084472656, "global_step": 321801, "epoch": 2659} {"train_loss": -42.999813079833984, "global_step": 321802, "epoch": 2659} {"train_loss": -44.18335723876953, "global_step": 321803, "epoch": 2659} {"train_loss": -43.13014221191406, "global_step": 321804, "epoch": 2659} {"train_loss": -43.12187957763672, "global_step": 321805, "epoch": 2659} {"train_loss": -42.91598129272461, "global_step": 321806, "epoch": 2659} {"train_loss": -43.5526237487793, "global_step": 321807, "epoch": 2659} {"train_loss": -43.9082145690918, "global_step": 321808, "epoch": 2659} {"train_loss": -43.15577697753906, "global_step": 321809, "epoch": 2659} {"train_loss": -43.636383056640625, "global_step": 321810, "epoch": 2659} {"train_loss": -44.07817459106445, "global_step": 321811, "epoch": 2659} {"train_loss": -44.24597930908203, "global_step": 321812, "epoch": 2659} {"train_loss": -44.21916961669922, "global_step": 321813, "epoch": 2659} {"train_loss": -44.03096008300781, "global_step": 321814, "epoch": 2659} {"train_loss": -44.11915969848633, "global_step": 321815, "epoch": 2659} {"train_loss": -43.782649993896484, "global_step": 321816, "epoch": 2659} {"train_loss": -44.6854248046875, "global_step": 321817, "epoch": 2659} {"train_loss": -43.6147346496582, "global_step": 321818, "epoch": 2659} {"train_loss": -44.10111618041992, "global_step": 321819, "epoch": 2659} {"train_loss": -43.377777099609375, "global_step": 321820, "epoch": 2659} {"train_loss": -43.57176971435547, "global_step": 321821, "epoch": 2659} {"train_loss": -44.34562301635742, "global_step": 321822, "epoch": 2659} {"train_loss": -43.81734848022461, "global_step": 321823, "epoch": 2659} {"train_loss": -44.34013366699219, "global_step": 321824, "epoch": 2659} {"train_loss": -44.29316329956055, "global_step": 321825, "epoch": 2659} {"train_loss": -43.96031951904297, "global_step": 321826, "epoch": 2659} {"train_loss": -44.59638214111328, "global_step": 321827, "epoch": 2659} {"train_loss": -44.08806228637695, "global_step": 321828, "epoch": 2659} {"train_loss": -43.8679084777832, "global_step": 321829, "epoch": 2659} {"train_loss": -44.482635498046875, "global_step": 321830, "epoch": 2659} {"train_loss": -44.4167594909668, "global_step": 321831, "epoch": 2659} {"train_loss": -44.06866455078125, "global_step": 321832, "epoch": 2659} {"train_loss": -43.626319885253906, "global_step": 321833, "epoch": 2659} {"train_loss": -44.01266098022461, "global_step": 321834, "epoch": 2659} {"train_loss": -43.4976921081543, "global_step": 321835, "epoch": 2659} {"train_loss": -44.83940505981445, "global_step": 321836, "epoch": 2659} {"train_loss": -43.0446891784668, "global_step": 321837, "epoch": 2659} {"train_loss": -43.510902404785156, "global_step": 321838, "epoch": 2659} {"train_loss": -43.76716232299805, "global_step": 321839, "epoch": 2659} {"train_loss": -43.65456008911133, "global_step": 321840, "epoch": 2659} {"train_loss": -44.962493896484375, "global_step": 321841, "epoch": 2659} {"train_loss": -43.86787033081055, "global_step": 321842, "epoch": 2659} {"train_loss": -42.386962890625, "global_step": 321843, "epoch": 2659} {"train_loss": -44.9976692199707, "global_step": 321844, "epoch": 2659} {"train_loss": -44.37014389038086, "global_step": 321845, "epoch": 2659} {"train_loss": -43.71569061279297, "global_step": 321846, "epoch": 2659} {"train_loss": -44.752655029296875, "global_step": 321847, "epoch": 2659} {"train_loss": -44.5306510925293, "global_step": 321848, "epoch": 2659} {"train_loss": -44.46436309814453, "global_step": 321849, "epoch": 2659} {"train_loss": -44.76481628417969, "global_step": 321850, "epoch": 2659} {"train_loss": -44.48347091674805, "global_step": 321851, "epoch": 2659} {"train_loss": -44.7335090637207, "global_step": 321852, "epoch": 2659} {"train_loss": -44.667110443115234, "global_step": 321853, "epoch": 2659} {"train_loss": -44.32001495361328, "global_step": 321854, "epoch": 2659} {"train_loss": -44.495521545410156, "global_step": 321855, "epoch": 2659} {"train_loss": -44.37911605834961, "global_step": 321856, "epoch": 2659} {"train_loss": -43.797306060791016, "global_step": 321857, "epoch": 2659} {"train_loss": -45.14088821411133, "global_step": 321858, "epoch": 2659} {"train_loss": -43.54894612840385, "global_step": 321859, "epoch": 2659, "val_loss": 2589115.5} {"train_loss": -45.030757904052734, "global_step": 321860, "epoch": 2660} {"train_loss": -44.54702377319336, "global_step": 321861, "epoch": 2660} {"train_loss": -44.46544647216797, "global_step": 321862, "epoch": 2660} {"train_loss": -44.7011604309082, "global_step": 321863, "epoch": 2660} {"train_loss": -45.34769821166992, "global_step": 321864, "epoch": 2660} {"train_loss": -44.53059005737305, "global_step": 321865, "epoch": 2660} {"train_loss": -44.83124923706055, "global_step": 321866, "epoch": 2660} {"train_loss": -44.910030364990234, "global_step": 321867, "epoch": 2660} {"train_loss": -44.85015869140625, "global_step": 321868, "epoch": 2660} {"train_loss": -45.478363037109375, "global_step": 321869, "epoch": 2660} {"train_loss": -45.115596771240234, "global_step": 321870, "epoch": 2660} {"train_loss": -44.658992767333984, "global_step": 321871, "epoch": 2660} {"train_loss": -45.15134811401367, "global_step": 321872, "epoch": 2660} {"train_loss": -44.372779846191406, "global_step": 321873, "epoch": 2660} {"train_loss": -44.4303092956543, "global_step": 321874, "epoch": 2660} {"train_loss": -44.237545013427734, "global_step": 321875, "epoch": 2660} {"train_loss": -44.31682205200195, "global_step": 321876, "epoch": 2660} {"train_loss": -44.136512756347656, "global_step": 321877, "epoch": 2660} {"train_loss": -43.820858001708984, "global_step": 321878, "epoch": 2660} {"train_loss": -43.97703170776367, "global_step": 321879, "epoch": 2660} {"train_loss": -45.266841888427734, "global_step": 321880, "epoch": 2660} {"train_loss": -43.95401382446289, "global_step": 321881, "epoch": 2660} {"train_loss": -41.87467575073242, "global_step": 321882, "epoch": 2660} {"train_loss": -43.435543060302734, "global_step": 321883, "epoch": 2660} {"train_loss": -44.366756439208984, "global_step": 321884, "epoch": 2660} {"train_loss": -43.22612380981445, "global_step": 321885, "epoch": 2660} {"train_loss": -41.49234390258789, "global_step": 321886, "epoch": 2660} {"train_loss": -43.06260681152344, "global_step": 321887, "epoch": 2660} {"train_loss": -44.28047561645508, "global_step": 321888, "epoch": 2660} {"train_loss": -43.41035079956055, "global_step": 321889, "epoch": 2660} {"train_loss": -43.24966049194336, "global_step": 321890, "epoch": 2660} {"train_loss": -44.13829803466797, "global_step": 321891, "epoch": 2660} {"train_loss": -43.242855072021484, "global_step": 321892, "epoch": 2660} {"train_loss": -42.58352279663086, "global_step": 321893, "epoch": 2660} {"train_loss": -43.017452239990234, "global_step": 321894, "epoch": 2660} {"train_loss": -43.787960052490234, "global_step": 321895, "epoch": 2660} {"train_loss": -43.963844299316406, "global_step": 321896, "epoch": 2660} {"train_loss": -43.89823532104492, "global_step": 321897, "epoch": 2660} {"train_loss": -42.744625091552734, "global_step": 321898, "epoch": 2660} {"train_loss": -44.52824020385742, "global_step": 321899, "epoch": 2660} {"train_loss": -43.6934928894043, "global_step": 321900, "epoch": 2660} {"train_loss": -43.73185348510742, "global_step": 321901, "epoch": 2660} {"train_loss": -43.33073806762695, "global_step": 321902, "epoch": 2660} {"train_loss": -44.249053955078125, "global_step": 321903, "epoch": 2660} {"train_loss": -44.07888412475586, "global_step": 321904, "epoch": 2660} {"train_loss": -43.93154525756836, "global_step": 321905, "epoch": 2660} {"train_loss": -42.89849853515625, "global_step": 321906, "epoch": 2660} {"train_loss": -43.26567077636719, "global_step": 321907, "epoch": 2660} {"train_loss": -43.845001220703125, "global_step": 321908, "epoch": 2660} {"train_loss": -44.04580307006836, "global_step": 321909, "epoch": 2660} {"train_loss": -42.54035186767578, "global_step": 321910, "epoch": 2660} {"train_loss": -43.324764251708984, "global_step": 321911, "epoch": 2660} {"train_loss": -44.31678009033203, "global_step": 321912, "epoch": 2660} {"train_loss": -43.023738861083984, "global_step": 321913, "epoch": 2660} {"train_loss": -43.342376708984375, "global_step": 321914, "epoch": 2660} {"train_loss": -43.78822326660156, "global_step": 321915, "epoch": 2660} {"train_loss": -43.52651596069336, "global_step": 321916, "epoch": 2660} {"train_loss": -44.0101203918457, "global_step": 321917, "epoch": 2660} {"train_loss": -42.73149490356445, "global_step": 321918, "epoch": 2660} {"train_loss": -43.839752197265625, "global_step": 321919, "epoch": 2660} {"train_loss": -42.50615310668945, "global_step": 321920, "epoch": 2660} {"train_loss": -42.83759307861328, "global_step": 321921, "epoch": 2660} {"train_loss": -41.4031982421875, "global_step": 321922, "epoch": 2660} {"train_loss": -41.95344924926758, "global_step": 321923, "epoch": 2660} {"train_loss": -41.94095993041992, "global_step": 321924, "epoch": 2660} {"train_loss": -42.878135681152344, "global_step": 321925, "epoch": 2660} {"train_loss": -44.546836853027344, "global_step": 321926, "epoch": 2660} {"train_loss": -43.2520637512207, "global_step": 321927, "epoch": 2660} {"train_loss": -43.25334548950195, "global_step": 321928, "epoch": 2660} {"train_loss": -44.023502349853516, "global_step": 321929, "epoch": 2660} {"train_loss": -44.443023681640625, "global_step": 321930, "epoch": 2660} {"train_loss": -44.19537353515625, "global_step": 321931, "epoch": 2660} {"train_loss": -44.4326057434082, "global_step": 321932, "epoch": 2660} {"train_loss": -44.099761962890625, "global_step": 321933, "epoch": 2660} {"train_loss": -43.8475341796875, "global_step": 321934, "epoch": 2660} {"train_loss": -45.21485137939453, "global_step": 321935, "epoch": 2660} {"train_loss": -39.738380432128906, "global_step": 321936, "epoch": 2660} {"train_loss": -42.61541748046875, "global_step": 321937, "epoch": 2660} {"train_loss": -43.6534309387207, "global_step": 321938, "epoch": 2660} {"train_loss": -44.172706604003906, "global_step": 321939, "epoch": 2660} {"train_loss": -43.96804428100586, "global_step": 321940, "epoch": 2660} {"train_loss": -43.907962799072266, "global_step": 321941, "epoch": 2660} {"train_loss": -43.76691818237305, "global_step": 321942, "epoch": 2660} {"train_loss": -39.50431442260742, "global_step": 321943, "epoch": 2660} {"train_loss": -35.016170501708984, "global_step": 321944, "epoch": 2660} {"train_loss": -38.36458969116211, "global_step": 321945, "epoch": 2660} {"train_loss": -43.14432907104492, "global_step": 321946, "epoch": 2660} {"train_loss": -43.055694580078125, "global_step": 321947, "epoch": 2660} {"train_loss": -44.07789993286133, "global_step": 321948, "epoch": 2660} {"train_loss": -44.416629791259766, "global_step": 321949, "epoch": 2660} {"train_loss": -22.98167610168457, "global_step": 321950, "epoch": 2660} {"train_loss": -43.97990036010742, "global_step": 321951, "epoch": 2660} {"train_loss": -42.42209243774414, "global_step": 321952, "epoch": 2660} {"train_loss": -39.33707809448242, "global_step": 321953, "epoch": 2660} {"train_loss": -41.108333587646484, "global_step": 321954, "epoch": 2660} {"train_loss": -39.348358154296875, "global_step": 321955, "epoch": 2660} {"train_loss": -37.86419677734375, "global_step": 321956, "epoch": 2660} {"train_loss": -32.69575881958008, "global_step": 321957, "epoch": 2660} {"train_loss": -34.72541046142578, "global_step": 321958, "epoch": 2660} {"train_loss": -39.8414421081543, "global_step": 321959, "epoch": 2660} {"train_loss": -40.30662536621094, "global_step": 321960, "epoch": 2660} {"train_loss": -41.24654769897461, "global_step": 321961, "epoch": 2660} {"train_loss": -39.184349060058594, "global_step": 321962, "epoch": 2660} {"train_loss": -38.72744369506836, "global_step": 321963, "epoch": 2660} {"train_loss": -40.20023727416992, "global_step": 321964, "epoch": 2660} {"train_loss": -40.73894119262695, "global_step": 321965, "epoch": 2660} {"train_loss": -41.80378723144531, "global_step": 321966, "epoch": 2660} {"train_loss": -39.86479187011719, "global_step": 321967, "epoch": 2660} {"train_loss": -40.833839416503906, "global_step": 321968, "epoch": 2660} {"train_loss": -40.61042785644531, "global_step": 321969, "epoch": 2660} {"train_loss": -41.25220489501953, "global_step": 321970, "epoch": 2660} {"train_loss": -38.406612396240234, "global_step": 321971, "epoch": 2660} {"train_loss": -40.85636520385742, "global_step": 321972, "epoch": 2660} {"train_loss": -41.72030258178711, "global_step": 321973, "epoch": 2660} {"train_loss": -41.63788986206055, "global_step": 321974, "epoch": 2660} {"train_loss": -41.61200714111328, "global_step": 321975, "epoch": 2660} {"train_loss": -41.69956588745117, "global_step": 321976, "epoch": 2660} {"train_loss": -42.55979537963867, "global_step": 321977, "epoch": 2660} {"train_loss": -41.981651306152344, "global_step": 321978, "epoch": 2660} {"train_loss": -42.25415802001953, "global_step": 321979, "epoch": 2660} {"train_loss": -42.58360626283756, "global_step": 321980, "epoch": 2660, "val_loss": 2894735.75} {"train_loss": -43.094844818115234, "global_step": 321981, "epoch": 2661} {"train_loss": -42.87955856323242, "global_step": 321982, "epoch": 2661} {"train_loss": -42.600528717041016, "global_step": 321983, "epoch": 2661} {"train_loss": -42.24811935424805, "global_step": 321984, "epoch": 2661} {"train_loss": -42.32935333251953, "global_step": 321985, "epoch": 2661} {"train_loss": -43.29329299926758, "global_step": 321986, "epoch": 2661} {"train_loss": -41.002655029296875, "global_step": 321987, "epoch": 2661} {"train_loss": -41.0406608581543, "global_step": 321988, "epoch": 2661} {"train_loss": -41.92195510864258, "global_step": 321989, "epoch": 2661} {"train_loss": -43.21921920776367, "global_step": 321990, "epoch": 2661} {"train_loss": -42.73954391479492, "global_step": 321991, "epoch": 2661} {"train_loss": -42.9779167175293, "global_step": 321992, "epoch": 2661} {"train_loss": -42.805843353271484, "global_step": 321993, "epoch": 2661} {"train_loss": -43.83351516723633, "global_step": 321994, "epoch": 2661} {"train_loss": -42.91145706176758, "global_step": 321995, "epoch": 2661} {"train_loss": -42.92243576049805, "global_step": 321996, "epoch": 2661} {"train_loss": -43.0963249206543, "global_step": 321997, "epoch": 2661} {"train_loss": -42.249244689941406, "global_step": 321998, "epoch": 2661} {"train_loss": -44.22595977783203, "global_step": 321999, "epoch": 2661} {"train_loss": -42.94172668457031, "global_step": 322000, "epoch": 2661} {"train_loss": -43.475440979003906, "global_step": 322001, "epoch": 2661} {"train_loss": -44.05784225463867, "global_step": 322002, "epoch": 2661} {"train_loss": -42.68730545043945, "global_step": 322003, "epoch": 2661} {"train_loss": -43.22878646850586, "global_step": 322004, "epoch": 2661} {"train_loss": -43.30653762817383, "global_step": 322005, "epoch": 2661} {"train_loss": -43.48109817504883, "global_step": 322006, "epoch": 2661} {"train_loss": -43.76975631713867, "global_step": 322007, "epoch": 2661} {"train_loss": -43.77111053466797, "global_step": 322008, "epoch": 2661} {"train_loss": -43.45125961303711, "global_step": 322009, "epoch": 2661} {"train_loss": -43.321414947509766, "global_step": 322010, "epoch": 2661} {"train_loss": -42.5118522644043, "global_step": 322011, "epoch": 2661} {"train_loss": -44.49514389038086, "global_step": 322012, "epoch": 2661} {"train_loss": -44.20637893676758, "global_step": 322013, "epoch": 2661} {"train_loss": -43.37220001220703, "global_step": 322014, "epoch": 2661} {"train_loss": -43.56669235229492, "global_step": 322015, "epoch": 2661} {"train_loss": -43.73193359375, "global_step": 322016, "epoch": 2661} {"train_loss": -43.985042572021484, "global_step": 322017, "epoch": 2661} {"train_loss": -43.6323127746582, "global_step": 322018, "epoch": 2661} {"train_loss": -43.93440628051758, "global_step": 322019, "epoch": 2661} {"train_loss": -42.676753997802734, "global_step": 322020, "epoch": 2661} {"train_loss": -44.70698547363281, "global_step": 322021, "epoch": 2661} {"train_loss": -44.29971694946289, "global_step": 322022, "epoch": 2661} {"train_loss": -44.203033447265625, "global_step": 322023, "epoch": 2661} {"train_loss": -44.39213943481445, "global_step": 322024, "epoch": 2661} {"train_loss": -44.03636932373047, "global_step": 322025, "epoch": 2661} {"train_loss": -44.485897064208984, "global_step": 322026, "epoch": 2661} {"train_loss": -44.01951599121094, "global_step": 322027, "epoch": 2661} {"train_loss": -44.29746627807617, "global_step": 322028, "epoch": 2661} {"train_loss": -44.40247344970703, "global_step": 322029, "epoch": 2661} {"train_loss": -43.495994567871094, "global_step": 322030, "epoch": 2661} {"train_loss": -45.10024642944336, "global_step": 322031, "epoch": 2661} {"train_loss": -44.79240798950195, "global_step": 322032, "epoch": 2661} {"train_loss": -44.55512619018555, "global_step": 322033, "epoch": 2661} {"train_loss": -44.97777557373047, "global_step": 322034, "epoch": 2661} {"train_loss": -43.507293701171875, "global_step": 322035, "epoch": 2661} {"train_loss": -45.5563850402832, "global_step": 322036, "epoch": 2661} {"train_loss": -44.45250701904297, "global_step": 322037, "epoch": 2661} {"train_loss": -44.41382598876953, "global_step": 322038, "epoch": 2661} {"train_loss": -44.422149658203125, "global_step": 322039, "epoch": 2661} {"train_loss": -44.64706802368164, "global_step": 322040, "epoch": 2661} {"train_loss": -44.55599594116211, "global_step": 322041, "epoch": 2661} {"train_loss": -44.203765869140625, "global_step": 322042, "epoch": 2661} {"train_loss": -43.94648742675781, "global_step": 322043, "epoch": 2661} {"train_loss": -44.10921859741211, "global_step": 322044, "epoch": 2661} {"train_loss": -42.871009826660156, "global_step": 322045, "epoch": 2661} {"train_loss": -41.47883987426758, "global_step": 322046, "epoch": 2661} {"train_loss": -41.99822998046875, "global_step": 322047, "epoch": 2661} {"train_loss": -42.0500602722168, "global_step": 322048, "epoch": 2661} {"train_loss": -43.515262603759766, "global_step": 322049, "epoch": 2661} {"train_loss": -43.62295150756836, "global_step": 322050, "epoch": 2661} {"train_loss": -42.22269821166992, "global_step": 322051, "epoch": 2661} {"train_loss": -41.004661560058594, "global_step": 322052, "epoch": 2661} {"train_loss": -41.697731018066406, "global_step": 322053, "epoch": 2661} {"train_loss": -41.25680160522461, "global_step": 322054, "epoch": 2661} {"train_loss": -42.144866943359375, "global_step": 322055, "epoch": 2661} {"train_loss": -42.326019287109375, "global_step": 322056, "epoch": 2661} {"train_loss": -40.350379943847656, "global_step": 322057, "epoch": 2661} {"train_loss": -42.012081146240234, "global_step": 322058, "epoch": 2661} {"train_loss": -41.4105339050293, "global_step": 322059, "epoch": 2661} {"train_loss": -42.60361862182617, "global_step": 322060, "epoch": 2661} {"train_loss": -41.15333938598633, "global_step": 322061, "epoch": 2661} {"train_loss": -42.397674560546875, "global_step": 322062, "epoch": 2661} {"train_loss": -41.99746322631836, "global_step": 322063, "epoch": 2661} {"train_loss": -42.24654006958008, "global_step": 322064, "epoch": 2661} {"train_loss": -41.813934326171875, "global_step": 322065, "epoch": 2661} {"train_loss": -42.355709075927734, "global_step": 322066, "epoch": 2661} {"train_loss": -43.68410873413086, "global_step": 322067, "epoch": 2661} {"train_loss": -42.89263916015625, "global_step": 322068, "epoch": 2661} {"train_loss": -43.599220275878906, "global_step": 322069, "epoch": 2661} {"train_loss": -43.98588180541992, "global_step": 322070, "epoch": 2661} {"train_loss": -42.27884292602539, "global_step": 322071, "epoch": 2661} {"train_loss": -43.872920989990234, "global_step": 322072, "epoch": 2661} {"train_loss": -43.06632614135742, "global_step": 322073, "epoch": 2661} {"train_loss": -43.605491638183594, "global_step": 322074, "epoch": 2661} {"train_loss": -42.78419494628906, "global_step": 322075, "epoch": 2661} {"train_loss": -43.6165885925293, "global_step": 322076, "epoch": 2661} {"train_loss": -43.572166442871094, "global_step": 322077, "epoch": 2661} {"train_loss": -44.20359420776367, "global_step": 322078, "epoch": 2661} {"train_loss": -43.44450759887695, "global_step": 322079, "epoch": 2661} {"train_loss": -43.722381591796875, "global_step": 322080, "epoch": 2661} {"train_loss": -44.3883056640625, "global_step": 322081, "epoch": 2661} {"train_loss": -44.553951263427734, "global_step": 322082, "epoch": 2661} {"train_loss": -44.39510726928711, "global_step": 322083, "epoch": 2661} {"train_loss": -43.60865020751953, "global_step": 322084, "epoch": 2661} {"train_loss": -44.160430908203125, "global_step": 322085, "epoch": 2661} {"train_loss": -44.301265716552734, "global_step": 322086, "epoch": 2661} {"train_loss": -43.63560104370117, "global_step": 322087, "epoch": 2661} {"train_loss": -44.80366897583008, "global_step": 322088, "epoch": 2661} {"train_loss": -44.16999435424805, "global_step": 322089, "epoch": 2661} {"train_loss": -43.92293930053711, "global_step": 322090, "epoch": 2661} {"train_loss": -44.80476379394531, "global_step": 322091, "epoch": 2661} {"train_loss": -44.24619674682617, "global_step": 322092, "epoch": 2661} {"train_loss": -43.934532165527344, "global_step": 322093, "epoch": 2661} {"train_loss": -44.613311767578125, "global_step": 322094, "epoch": 2661} {"train_loss": -43.04799270629883, "global_step": 322095, "epoch": 2661} {"train_loss": -43.42863082885742, "global_step": 322096, "epoch": 2661} {"train_loss": -44.419368743896484, "global_step": 322097, "epoch": 2661} {"train_loss": -43.43613052368164, "global_step": 322098, "epoch": 2661} {"train_loss": -44.40838623046875, "global_step": 322099, "epoch": 2661} {"train_loss": -44.05055618286133, "global_step": 322100, "epoch": 2661} {"train_loss": -43.38540926846591, "global_step": 322101, "epoch": 2661, "val_loss": 2709813.0} {"train_loss": -44.30317306518555, "global_step": 322102, "epoch": 2662} {"train_loss": -44.26375961303711, "global_step": 322103, "epoch": 2662} {"train_loss": -45.08056640625, "global_step": 322104, "epoch": 2662} {"train_loss": -45.01606369018555, "global_step": 322105, "epoch": 2662} {"train_loss": -44.70713806152344, "global_step": 322106, "epoch": 2662} {"train_loss": -44.2649040222168, "global_step": 322107, "epoch": 2662} {"train_loss": -44.679229736328125, "global_step": 322108, "epoch": 2662} {"train_loss": -44.76815414428711, "global_step": 322109, "epoch": 2662} {"train_loss": -44.0879020690918, "global_step": 322110, "epoch": 2662} {"train_loss": -43.84326171875, "global_step": 322111, "epoch": 2662} {"train_loss": -44.465511322021484, "global_step": 322112, "epoch": 2662} {"train_loss": -43.90689468383789, "global_step": 322113, "epoch": 2662} {"train_loss": -43.955535888671875, "global_step": 322114, "epoch": 2662} {"train_loss": -44.813968658447266, "global_step": 322115, "epoch": 2662} {"train_loss": -44.2325553894043, "global_step": 322116, "epoch": 2662} {"train_loss": -44.27720642089844, "global_step": 322117, "epoch": 2662} {"train_loss": -44.1230583190918, "global_step": 322118, "epoch": 2662} {"train_loss": -44.87344741821289, "global_step": 322119, "epoch": 2662} {"train_loss": -44.58854293823242, "global_step": 322120, "epoch": 2662} {"train_loss": -44.80424118041992, "global_step": 322121, "epoch": 2662} {"train_loss": -43.54923629760742, "global_step": 322122, "epoch": 2662} {"train_loss": -43.443817138671875, "global_step": 322123, "epoch": 2662} {"train_loss": -43.96965408325195, "global_step": 322124, "epoch": 2662} {"train_loss": -42.617191314697266, "global_step": 322125, "epoch": 2662} {"train_loss": -44.006832122802734, "global_step": 322126, "epoch": 2662} {"train_loss": -44.84163284301758, "global_step": 322127, "epoch": 2662} {"train_loss": -42.98043441772461, "global_step": 322128, "epoch": 2662} {"train_loss": -41.27315902709961, "global_step": 322129, "epoch": 2662} {"train_loss": -43.31055450439453, "global_step": 322130, "epoch": 2662} {"train_loss": -43.00761032104492, "global_step": 322131, "epoch": 2662} {"train_loss": -41.80922317504883, "global_step": 322132, "epoch": 2662} {"train_loss": -43.728477478027344, "global_step": 322133, "epoch": 2662} {"train_loss": -41.21961212158203, "global_step": 322134, "epoch": 2662} {"train_loss": -39.639434814453125, "global_step": 322135, "epoch": 2662} {"train_loss": -43.454071044921875, "global_step": 322136, "epoch": 2662} {"train_loss": -38.54671096801758, "global_step": 322137, "epoch": 2662} {"train_loss": -44.290748596191406, "global_step": 322138, "epoch": 2662} {"train_loss": -39.81175231933594, "global_step": 322139, "epoch": 2662} {"train_loss": -41.5676383972168, "global_step": 322140, "epoch": 2662} {"train_loss": -43.010196685791016, "global_step": 322141, "epoch": 2662} {"train_loss": -43.08742904663086, "global_step": 322142, "epoch": 2662} {"train_loss": -42.95804977416992, "global_step": 322143, "epoch": 2662} {"train_loss": -43.19208908081055, "global_step": 322144, "epoch": 2662} {"train_loss": -42.19260025024414, "global_step": 322145, "epoch": 2662} {"train_loss": -42.81582260131836, "global_step": 322146, "epoch": 2662} {"train_loss": -43.15275573730469, "global_step": 322147, "epoch": 2662} {"train_loss": -41.8294677734375, "global_step": 322148, "epoch": 2662} {"train_loss": -43.83831787109375, "global_step": 322149, "epoch": 2662} {"train_loss": -42.770320892333984, "global_step": 322150, "epoch": 2662} {"train_loss": -42.80630874633789, "global_step": 322151, "epoch": 2662} {"train_loss": -43.66425704956055, "global_step": 322152, "epoch": 2662} {"train_loss": -42.49007797241211, "global_step": 322153, "epoch": 2662} {"train_loss": -42.59786605834961, "global_step": 322154, "epoch": 2662} {"train_loss": -43.47487258911133, "global_step": 322155, "epoch": 2662} {"train_loss": -42.95244216918945, "global_step": 322156, "epoch": 2662} {"train_loss": -42.51925277709961, "global_step": 322157, "epoch": 2662} {"train_loss": -43.75168228149414, "global_step": 322158, "epoch": 2662} {"train_loss": -42.8234977722168, "global_step": 322159, "epoch": 2662} {"train_loss": -44.25734329223633, "global_step": 322160, "epoch": 2662} {"train_loss": -44.00606918334961, "global_step": 322161, "epoch": 2662} {"train_loss": -43.50300216674805, "global_step": 322162, "epoch": 2662} {"train_loss": -44.021751403808594, "global_step": 322163, "epoch": 2662} {"train_loss": -43.220375061035156, "global_step": 322164, "epoch": 2662} {"train_loss": -43.672264099121094, "global_step": 322165, "epoch": 2662} {"train_loss": -43.74480438232422, "global_step": 322166, "epoch": 2662} {"train_loss": -43.523841857910156, "global_step": 322167, "epoch": 2662} {"train_loss": -43.48261260986328, "global_step": 322168, "epoch": 2662} {"train_loss": -44.16960144042969, "global_step": 322169, "epoch": 2662} {"train_loss": -43.53754425048828, "global_step": 322170, "epoch": 2662} {"train_loss": -42.90614700317383, "global_step": 322171, "epoch": 2662} {"train_loss": -44.13202667236328, "global_step": 322172, "epoch": 2662} {"train_loss": -42.89964294433594, "global_step": 322173, "epoch": 2662} {"train_loss": -44.344661712646484, "global_step": 322174, "epoch": 2662} {"train_loss": -43.16056442260742, "global_step": 322175, "epoch": 2662} {"train_loss": -43.3981819152832, "global_step": 322176, "epoch": 2662} {"train_loss": -42.97239303588867, "global_step": 322177, "epoch": 2662} {"train_loss": -43.64056396484375, "global_step": 322178, "epoch": 2662} {"train_loss": -44.146785736083984, "global_step": 322179, "epoch": 2662} {"train_loss": -44.38562774658203, "global_step": 322180, "epoch": 2662} {"train_loss": -44.16352462768555, "global_step": 322181, "epoch": 2662} {"train_loss": -43.945960998535156, "global_step": 322182, "epoch": 2662} {"train_loss": -43.84456253051758, "global_step": 322183, "epoch": 2662} {"train_loss": -43.81193161010742, "global_step": 322184, "epoch": 2662} {"train_loss": -43.692962646484375, "global_step": 322185, "epoch": 2662} {"train_loss": -44.57361602783203, "global_step": 322186, "epoch": 2662} {"train_loss": -44.82379150390625, "global_step": 322187, "epoch": 2662} {"train_loss": -44.183006286621094, "global_step": 322188, "epoch": 2662} {"train_loss": -44.229156494140625, "global_step": 322189, "epoch": 2662} {"train_loss": -44.52616500854492, "global_step": 322190, "epoch": 2662} {"train_loss": -43.980018615722656, "global_step": 322191, "epoch": 2662} {"train_loss": -44.81116485595703, "global_step": 322192, "epoch": 2662} {"train_loss": -44.24253463745117, "global_step": 322193, "epoch": 2662} {"train_loss": -44.3956298828125, "global_step": 322194, "epoch": 2662} {"train_loss": -44.678123474121094, "global_step": 322195, "epoch": 2662} {"train_loss": -44.250030517578125, "global_step": 322196, "epoch": 2662} {"train_loss": -44.25099563598633, "global_step": 322197, "epoch": 2662} {"train_loss": -42.662818908691406, "global_step": 322198, "epoch": 2662} {"train_loss": -43.660579681396484, "global_step": 322199, "epoch": 2662} {"train_loss": -43.7786979675293, "global_step": 322200, "epoch": 2662} {"train_loss": -44.571712493896484, "global_step": 322201, "epoch": 2662} {"train_loss": -43.49506378173828, "global_step": 322202, "epoch": 2662} {"train_loss": -43.778900146484375, "global_step": 322203, "epoch": 2662} {"train_loss": -44.697052001953125, "global_step": 322204, "epoch": 2662} {"train_loss": -44.81106185913086, "global_step": 322205, "epoch": 2662} {"train_loss": -44.39739990234375, "global_step": 322206, "epoch": 2662} {"train_loss": -45.040557861328125, "global_step": 322207, "epoch": 2662} {"train_loss": -44.87384033203125, "global_step": 322208, "epoch": 2662} {"train_loss": -44.1669921875, "global_step": 322209, "epoch": 2662} {"train_loss": -44.7263298034668, "global_step": 322210, "epoch": 2662} {"train_loss": -42.8474235534668, "global_step": 322211, "epoch": 2662} {"train_loss": -44.47467803955078, "global_step": 322212, "epoch": 2662} {"train_loss": -44.49065017700195, "global_step": 322213, "epoch": 2662} {"train_loss": -44.087764739990234, "global_step": 322214, "epoch": 2662} {"train_loss": -44.46957015991211, "global_step": 322215, "epoch": 2662} {"train_loss": -44.70115280151367, "global_step": 322216, "epoch": 2662} {"train_loss": -38.02455139160156, "global_step": 322217, "epoch": 2662} {"train_loss": -43.550533294677734, "global_step": 322218, "epoch": 2662} {"train_loss": -44.51156234741211, "global_step": 322219, "epoch": 2662} {"train_loss": -44.5530891418457, "global_step": 322220, "epoch": 2662} {"train_loss": -44.303401947021484, "global_step": 322221, "epoch": 2662} {"train_loss": -43.63605133561063, "global_step": 322222, "epoch": 2662, "val_loss": 2675065.25} {"train_loss": -44.187232971191406, "global_step": 322223, "epoch": 2663} {"train_loss": -45.09170150756836, "global_step": 322224, "epoch": 2663} {"train_loss": -44.705379486083984, "global_step": 322225, "epoch": 2663} {"train_loss": -43.01999282836914, "global_step": 322226, "epoch": 2663} {"train_loss": -44.31133270263672, "global_step": 322227, "epoch": 2663} {"train_loss": -44.9713020324707, "global_step": 322228, "epoch": 2663} {"train_loss": -44.10136413574219, "global_step": 322229, "epoch": 2663} {"train_loss": -44.35028076171875, "global_step": 322230, "epoch": 2663} {"train_loss": -42.87581253051758, "global_step": 322231, "epoch": 2663} {"train_loss": -44.58835983276367, "global_step": 322232, "epoch": 2663} {"train_loss": -43.979549407958984, "global_step": 322233, "epoch": 2663} {"train_loss": -43.93928146362305, "global_step": 322234, "epoch": 2663} {"train_loss": -43.58098602294922, "global_step": 322235, "epoch": 2663} {"train_loss": -42.6126823425293, "global_step": 322236, "epoch": 2663} {"train_loss": -44.152252197265625, "global_step": 322237, "epoch": 2663} {"train_loss": -44.642024993896484, "global_step": 322238, "epoch": 2663} {"train_loss": -44.80817413330078, "global_step": 322239, "epoch": 2663} {"train_loss": -44.4168701171875, "global_step": 322240, "epoch": 2663} {"train_loss": -44.273651123046875, "global_step": 322241, "epoch": 2663} {"train_loss": -44.008453369140625, "global_step": 322242, "epoch": 2663} {"train_loss": -44.70351028442383, "global_step": 322243, "epoch": 2663} {"train_loss": -43.34418869018555, "global_step": 322244, "epoch": 2663} {"train_loss": -44.070228576660156, "global_step": 322245, "epoch": 2663} {"train_loss": -44.13922882080078, "global_step": 322246, "epoch": 2663} {"train_loss": -44.47201156616211, "global_step": 322247, "epoch": 2663} {"train_loss": -43.71427536010742, "global_step": 322248, "epoch": 2663} {"train_loss": -41.351661682128906, "global_step": 322249, "epoch": 2663} {"train_loss": -38.327083587646484, "global_step": 322250, "epoch": 2663} {"train_loss": -42.660125732421875, "global_step": 322251, "epoch": 2663} {"train_loss": -42.769954681396484, "global_step": 322252, "epoch": 2663} {"train_loss": -41.11051559448242, "global_step": 322253, "epoch": 2663} {"train_loss": -43.19393539428711, "global_step": 322254, "epoch": 2663} {"train_loss": -43.75765609741211, "global_step": 322255, "epoch": 2663} {"train_loss": -41.69441604614258, "global_step": 322256, "epoch": 2663} {"train_loss": -40.535091400146484, "global_step": 322257, "epoch": 2663} {"train_loss": -43.33305358886719, "global_step": 322258, "epoch": 2663} {"train_loss": -42.74274444580078, "global_step": 322259, "epoch": 2663} {"train_loss": -40.68817901611328, "global_step": 322260, "epoch": 2663} {"train_loss": -43.68567657470703, "global_step": 322261, "epoch": 2663} {"train_loss": -40.89814758300781, "global_step": 322262, "epoch": 2663} {"train_loss": -40.6971549987793, "global_step": 322263, "epoch": 2663} {"train_loss": -43.915748596191406, "global_step": 322264, "epoch": 2663} {"train_loss": -42.19924545288086, "global_step": 322265, "epoch": 2663} {"train_loss": -41.79863739013672, "global_step": 322266, "epoch": 2663} {"train_loss": -43.42940902709961, "global_step": 322267, "epoch": 2663} {"train_loss": -42.6171989440918, "global_step": 322268, "epoch": 2663} {"train_loss": -43.742530822753906, "global_step": 322269, "epoch": 2663} {"train_loss": -41.80353927612305, "global_step": 322270, "epoch": 2663} {"train_loss": -42.88772964477539, "global_step": 322271, "epoch": 2663} {"train_loss": -43.80709457397461, "global_step": 322272, "epoch": 2663} {"train_loss": -43.353538513183594, "global_step": 322273, "epoch": 2663} {"train_loss": -43.27305603027344, "global_step": 322274, "epoch": 2663} {"train_loss": -42.12075424194336, "global_step": 322275, "epoch": 2663} {"train_loss": -41.873104095458984, "global_step": 322276, "epoch": 2663} {"train_loss": -42.72613525390625, "global_step": 322277, "epoch": 2663} {"train_loss": -44.41569900512695, "global_step": 322278, "epoch": 2663} {"train_loss": -42.529052734375, "global_step": 322279, "epoch": 2663} {"train_loss": -40.19174575805664, "global_step": 322280, "epoch": 2663} {"train_loss": -43.59559631347656, "global_step": 322281, "epoch": 2663} {"train_loss": -40.112152099609375, "global_step": 322282, "epoch": 2663} {"train_loss": -38.86543655395508, "global_step": 322283, "epoch": 2663} {"train_loss": -42.40739822387695, "global_step": 322284, "epoch": 2663} {"train_loss": -42.442718505859375, "global_step": 322285, "epoch": 2663} {"train_loss": -42.04731369018555, "global_step": 322286, "epoch": 2663} {"train_loss": -42.906070709228516, "global_step": 322287, "epoch": 2663} {"train_loss": -42.791316986083984, "global_step": 322288, "epoch": 2663} {"train_loss": -42.78397750854492, "global_step": 322289, "epoch": 2663} {"train_loss": -43.79452896118164, "global_step": 322290, "epoch": 2663} {"train_loss": -42.194393157958984, "global_step": 322291, "epoch": 2663} {"train_loss": -42.66987228393555, "global_step": 322292, "epoch": 2663} {"train_loss": -44.019508361816406, "global_step": 322293, "epoch": 2663} {"train_loss": -42.431575775146484, "global_step": 322294, "epoch": 2663} {"train_loss": -43.589595794677734, "global_step": 322295, "epoch": 2663} {"train_loss": -43.32068634033203, "global_step": 322296, "epoch": 2663} {"train_loss": -43.6693000793457, "global_step": 322297, "epoch": 2663} {"train_loss": -43.72602462768555, "global_step": 322298, "epoch": 2663} {"train_loss": -43.40690231323242, "global_step": 322299, "epoch": 2663} {"train_loss": -43.4918212890625, "global_step": 322300, "epoch": 2663} {"train_loss": -44.020851135253906, "global_step": 322301, "epoch": 2663} {"train_loss": -43.787681579589844, "global_step": 322302, "epoch": 2663} {"train_loss": -43.799007415771484, "global_step": 322303, "epoch": 2663} {"train_loss": -44.017024993896484, "global_step": 322304, "epoch": 2663} {"train_loss": -43.74934005737305, "global_step": 322305, "epoch": 2663} {"train_loss": -44.23379135131836, "global_step": 322306, "epoch": 2663} {"train_loss": -43.48622131347656, "global_step": 322307, "epoch": 2663} {"train_loss": -43.85831832885742, "global_step": 322308, "epoch": 2663} {"train_loss": -43.43998336791992, "global_step": 322309, "epoch": 2663} {"train_loss": -43.35994338989258, "global_step": 322310, "epoch": 2663} {"train_loss": -43.62397384643555, "global_step": 322311, "epoch": 2663} {"train_loss": -43.77372360229492, "global_step": 322312, "epoch": 2663} {"train_loss": -43.62327194213867, "global_step": 322313, "epoch": 2663} {"train_loss": -43.97896194458008, "global_step": 322314, "epoch": 2663} {"train_loss": -44.273094177246094, "global_step": 322315, "epoch": 2663} {"train_loss": -43.84218215942383, "global_step": 322316, "epoch": 2663} {"train_loss": -43.97666931152344, "global_step": 322317, "epoch": 2663} {"train_loss": -43.666202545166016, "global_step": 322318, "epoch": 2663} {"train_loss": -44.952980041503906, "global_step": 322319, "epoch": 2663} {"train_loss": -44.36061477661133, "global_step": 322320, "epoch": 2663} {"train_loss": -43.81973648071289, "global_step": 322321, "epoch": 2663} {"train_loss": -44.228511810302734, "global_step": 322322, "epoch": 2663} {"train_loss": -44.21759796142578, "global_step": 322323, "epoch": 2663} {"train_loss": -44.004615783691406, "global_step": 322324, "epoch": 2663} {"train_loss": -43.50856399536133, "global_step": 322325, "epoch": 2663} {"train_loss": -44.5831298828125, "global_step": 322326, "epoch": 2663} {"train_loss": -44.15739059448242, "global_step": 322327, "epoch": 2663} {"train_loss": -43.80234909057617, "global_step": 322328, "epoch": 2663} {"train_loss": -43.88186264038086, "global_step": 322329, "epoch": 2663} {"train_loss": -41.78828048706055, "global_step": 322330, "epoch": 2663} {"train_loss": -43.445491790771484, "global_step": 322331, "epoch": 2663} {"train_loss": -43.651405334472656, "global_step": 322332, "epoch": 2663} {"train_loss": -42.664493560791016, "global_step": 322333, "epoch": 2663} {"train_loss": -43.137786865234375, "global_step": 322334, "epoch": 2663} {"train_loss": -43.453182220458984, "global_step": 322335, "epoch": 2663} {"train_loss": -43.31058883666992, "global_step": 322336, "epoch": 2663} {"train_loss": -44.0059814453125, "global_step": 322337, "epoch": 2663} {"train_loss": -43.204750061035156, "global_step": 322338, "epoch": 2663} {"train_loss": -43.674442291259766, "global_step": 322339, "epoch": 2663} {"train_loss": -43.61004638671875, "global_step": 322340, "epoch": 2663} {"train_loss": -43.167816162109375, "global_step": 322341, "epoch": 2663} {"train_loss": -44.1944694519043, "global_step": 322342, "epoch": 2663} {"train_loss": -43.26909842372926, "global_step": 322343, "epoch": 2663, "val_loss": 2661211.25} {"train_loss": -44.34876251220703, "global_step": 322344, "epoch": 2664} {"train_loss": -43.91094970703125, "global_step": 322345, "epoch": 2664} {"train_loss": -44.674537658691406, "global_step": 322346, "epoch": 2664} {"train_loss": -43.866294860839844, "global_step": 322347, "epoch": 2664} {"train_loss": -44.76640701293945, "global_step": 322348, "epoch": 2664} {"train_loss": -44.34125518798828, "global_step": 322349, "epoch": 2664} {"train_loss": -43.95650863647461, "global_step": 322350, "epoch": 2664} {"train_loss": -44.552207946777344, "global_step": 322351, "epoch": 2664} {"train_loss": -44.481082916259766, "global_step": 322352, "epoch": 2664} {"train_loss": -44.028629302978516, "global_step": 322353, "epoch": 2664} {"train_loss": -44.528316497802734, "global_step": 322354, "epoch": 2664} {"train_loss": -44.20698165893555, "global_step": 322355, "epoch": 2664} {"train_loss": -43.744537353515625, "global_step": 322356, "epoch": 2664} {"train_loss": -44.98708724975586, "global_step": 322357, "epoch": 2664} {"train_loss": -44.12689208984375, "global_step": 322358, "epoch": 2664} {"train_loss": -44.98713302612305, "global_step": 322359, "epoch": 2664} {"train_loss": -43.876468658447266, "global_step": 322360, "epoch": 2664} {"train_loss": -44.349239349365234, "global_step": 322361, "epoch": 2664} {"train_loss": -44.37479782104492, "global_step": 322362, "epoch": 2664} {"train_loss": -44.72221755981445, "global_step": 322363, "epoch": 2664} {"train_loss": -44.660980224609375, "global_step": 322364, "epoch": 2664} {"train_loss": -45.05482864379883, "global_step": 322365, "epoch": 2664} {"train_loss": -44.75242614746094, "global_step": 322366, "epoch": 2664} {"train_loss": -44.832420349121094, "global_step": 322367, "epoch": 2664} {"train_loss": -44.85649490356445, "global_step": 322368, "epoch": 2664} {"train_loss": -44.609169006347656, "global_step": 322369, "epoch": 2664} {"train_loss": -44.714046478271484, "global_step": 322370, "epoch": 2664} {"train_loss": -44.4513053894043, "global_step": 322371, "epoch": 2664} {"train_loss": -45.470516204833984, "global_step": 322372, "epoch": 2664} {"train_loss": -44.677330017089844, "global_step": 322373, "epoch": 2664} {"train_loss": -44.98690414428711, "global_step": 322374, "epoch": 2664} {"train_loss": -44.56357955932617, "global_step": 322375, "epoch": 2664} {"train_loss": -44.90190887451172, "global_step": 322376, "epoch": 2664} {"train_loss": -44.445003509521484, "global_step": 322377, "epoch": 2664} {"train_loss": -45.27141189575195, "global_step": 322378, "epoch": 2664} {"train_loss": -44.65555191040039, "global_step": 322379, "epoch": 2664} {"train_loss": -44.43327713012695, "global_step": 322380, "epoch": 2664} {"train_loss": -44.4398193359375, "global_step": 322381, "epoch": 2664} {"train_loss": -44.489585876464844, "global_step": 322382, "epoch": 2664} {"train_loss": -44.4589958190918, "global_step": 322383, "epoch": 2664} {"train_loss": -44.3892822265625, "global_step": 322384, "epoch": 2664} {"train_loss": -44.938941955566406, "global_step": 322385, "epoch": 2664} {"train_loss": -44.48403549194336, "global_step": 322386, "epoch": 2664} {"train_loss": -44.343929290771484, "global_step": 322387, "epoch": 2664} {"train_loss": -42.81498336791992, "global_step": 322388, "epoch": 2664} {"train_loss": -42.325347900390625, "global_step": 322389, "epoch": 2664} {"train_loss": -44.45673370361328, "global_step": 322390, "epoch": 2664} {"train_loss": -41.08121871948242, "global_step": 322391, "epoch": 2664} {"train_loss": -40.9115104675293, "global_step": 322392, "epoch": 2664} {"train_loss": -43.46002960205078, "global_step": 322393, "epoch": 2664} {"train_loss": -43.41098403930664, "global_step": 322394, "epoch": 2664} {"train_loss": -42.84029769897461, "global_step": 322395, "epoch": 2664} {"train_loss": -42.05894088745117, "global_step": 322396, "epoch": 2664} {"train_loss": -43.58026123046875, "global_step": 322397, "epoch": 2664} {"train_loss": -42.7175178527832, "global_step": 322398, "epoch": 2664} {"train_loss": -42.37825393676758, "global_step": 322399, "epoch": 2664} {"train_loss": -43.34768295288086, "global_step": 322400, "epoch": 2664} {"train_loss": -43.48061752319336, "global_step": 322401, "epoch": 2664} {"train_loss": -43.16743087768555, "global_step": 322402, "epoch": 2664} {"train_loss": -43.3202018737793, "global_step": 322403, "epoch": 2664} {"train_loss": -43.62226104736328, "global_step": 322404, "epoch": 2664} {"train_loss": -44.012001037597656, "global_step": 322405, "epoch": 2664} {"train_loss": -44.13942337036133, "global_step": 322406, "epoch": 2664} {"train_loss": -43.274940490722656, "global_step": 322407, "epoch": 2664} {"train_loss": -42.37983322143555, "global_step": 322408, "epoch": 2664} {"train_loss": -44.855098724365234, "global_step": 322409, "epoch": 2664} {"train_loss": -43.038856506347656, "global_step": 322410, "epoch": 2664} {"train_loss": -43.072696685791016, "global_step": 322411, "epoch": 2664} {"train_loss": -44.50619125366211, "global_step": 322412, "epoch": 2664} {"train_loss": -43.94807052612305, "global_step": 322413, "epoch": 2664} {"train_loss": -43.99190139770508, "global_step": 322414, "epoch": 2664} {"train_loss": -44.171356201171875, "global_step": 322415, "epoch": 2664} {"train_loss": -44.06128692626953, "global_step": 322416, "epoch": 2664} {"train_loss": -43.5157470703125, "global_step": 322417, "epoch": 2664} {"train_loss": -43.870845794677734, "global_step": 322418, "epoch": 2664} {"train_loss": -44.44077682495117, "global_step": 322419, "epoch": 2664} {"train_loss": -43.86982727050781, "global_step": 322420, "epoch": 2664} {"train_loss": -44.38666915893555, "global_step": 322421, "epoch": 2664} {"train_loss": -43.668067932128906, "global_step": 322422, "epoch": 2664} {"train_loss": -44.0468635559082, "global_step": 322423, "epoch": 2664} {"train_loss": -44.450172424316406, "global_step": 322424, "epoch": 2664} {"train_loss": -44.61350631713867, "global_step": 322425, "epoch": 2664} {"train_loss": -44.469444274902344, "global_step": 322426, "epoch": 2664} {"train_loss": -44.32387924194336, "global_step": 322427, "epoch": 2664} {"train_loss": -44.72137451171875, "global_step": 322428, "epoch": 2664} {"train_loss": -44.62766647338867, "global_step": 322429, "epoch": 2664} {"train_loss": -44.035987854003906, "global_step": 322430, "epoch": 2664} {"train_loss": -44.606014251708984, "global_step": 322431, "epoch": 2664} {"train_loss": -45.08479309082031, "global_step": 322432, "epoch": 2664} {"train_loss": -44.3289794921875, "global_step": 322433, "epoch": 2664} {"train_loss": -44.5219841003418, "global_step": 322434, "epoch": 2664} {"train_loss": -44.084144592285156, "global_step": 322435, "epoch": 2664} {"train_loss": -44.59299850463867, "global_step": 322436, "epoch": 2664} {"train_loss": -44.533294677734375, "global_step": 322437, "epoch": 2664} {"train_loss": -43.82550811767578, "global_step": 322438, "epoch": 2664} {"train_loss": -44.62274169921875, "global_step": 322439, "epoch": 2664} {"train_loss": -44.537776947021484, "global_step": 322440, "epoch": 2664} {"train_loss": -44.381893157958984, "global_step": 322441, "epoch": 2664} {"train_loss": -44.56300735473633, "global_step": 322442, "epoch": 2664} {"train_loss": -44.11349105834961, "global_step": 322443, "epoch": 2664} {"train_loss": -44.73488235473633, "global_step": 322444, "epoch": 2664} {"train_loss": -44.570919036865234, "global_step": 322445, "epoch": 2664} {"train_loss": -44.883060455322266, "global_step": 322446, "epoch": 2664} {"train_loss": -44.32740020751953, "global_step": 322447, "epoch": 2664} {"train_loss": -43.71950149536133, "global_step": 322448, "epoch": 2664} {"train_loss": -44.65043640136719, "global_step": 322449, "epoch": 2664} {"train_loss": -44.34078598022461, "global_step": 322450, "epoch": 2664} {"train_loss": -44.59601593017578, "global_step": 322451, "epoch": 2664} {"train_loss": -45.01068115234375, "global_step": 322452, "epoch": 2664} {"train_loss": -43.47272491455078, "global_step": 322453, "epoch": 2664} {"train_loss": -43.930870056152344, "global_step": 322454, "epoch": 2664} {"train_loss": -44.84744644165039, "global_step": 322455, "epoch": 2664} {"train_loss": -44.57889938354492, "global_step": 322456, "epoch": 2664} {"train_loss": -44.19908905029297, "global_step": 322457, "epoch": 2664} {"train_loss": -43.96771240234375, "global_step": 322458, "epoch": 2664} {"train_loss": -44.67224884033203, "global_step": 322459, "epoch": 2664} {"train_loss": -44.96726608276367, "global_step": 322460, "epoch": 2664} {"train_loss": -44.81496810913086, "global_step": 322461, "epoch": 2664} {"train_loss": -44.95640182495117, "global_step": 322462, "epoch": 2664} {"train_loss": -45.096717834472656, "global_step": 322463, "epoch": 2664} {"train_loss": -44.17620165485981, "global_step": 322464, "epoch": 2664, "val_loss": 2653567.0} {"train_loss": -44.678016662597656, "global_step": 322465, "epoch": 2665} {"train_loss": -45.02747344970703, "global_step": 322466, "epoch": 2665} {"train_loss": -45.14103317260742, "global_step": 322467, "epoch": 2665} {"train_loss": -44.95670700073242, "global_step": 322468, "epoch": 2665} {"train_loss": -43.8887939453125, "global_step": 322469, "epoch": 2665} {"train_loss": -43.71023178100586, "global_step": 322470, "epoch": 2665} {"train_loss": -43.93559265136719, "global_step": 322471, "epoch": 2665} {"train_loss": -44.70737838745117, "global_step": 322472, "epoch": 2665} {"train_loss": -45.347412109375, "global_step": 322473, "epoch": 2665} {"train_loss": -44.42826843261719, "global_step": 322474, "epoch": 2665} {"train_loss": -43.184852600097656, "global_step": 322475, "epoch": 2665} {"train_loss": -40.98360061645508, "global_step": 322476, "epoch": 2665} {"train_loss": -41.68143081665039, "global_step": 322477, "epoch": 2665} {"train_loss": -43.5247917175293, "global_step": 322478, "epoch": 2665} {"train_loss": -44.7458381652832, "global_step": 322479, "epoch": 2665} {"train_loss": -44.362884521484375, "global_step": 322480, "epoch": 2665} {"train_loss": -43.93610382080078, "global_step": 322481, "epoch": 2665} {"train_loss": -43.795528411865234, "global_step": 322482, "epoch": 2665} {"train_loss": -43.201072692871094, "global_step": 322483, "epoch": 2665} {"train_loss": -44.09943389892578, "global_step": 322484, "epoch": 2665} {"train_loss": -44.50007247924805, "global_step": 322485, "epoch": 2665} {"train_loss": -44.02812957763672, "global_step": 322486, "epoch": 2665} {"train_loss": -44.71648025512695, "global_step": 322487, "epoch": 2665} {"train_loss": -44.91080093383789, "global_step": 322488, "epoch": 2665} {"train_loss": -43.61897277832031, "global_step": 322489, "epoch": 2665} {"train_loss": -44.30927276611328, "global_step": 322490, "epoch": 2665} {"train_loss": -44.333831787109375, "global_step": 322491, "epoch": 2665} {"train_loss": -43.71317672729492, "global_step": 322492, "epoch": 2665} {"train_loss": -43.62786865234375, "global_step": 322493, "epoch": 2665} {"train_loss": -44.943450927734375, "global_step": 322494, "epoch": 2665} {"train_loss": -44.564300537109375, "global_step": 322495, "epoch": 2665} {"train_loss": -44.60154724121094, "global_step": 322496, "epoch": 2665} {"train_loss": -43.799251556396484, "global_step": 322497, "epoch": 2665} {"train_loss": -43.90090560913086, "global_step": 322498, "epoch": 2665} {"train_loss": -44.26744842529297, "global_step": 322499, "epoch": 2665} {"train_loss": -44.474239349365234, "global_step": 322500, "epoch": 2665} {"train_loss": -43.547725677490234, "global_step": 322501, "epoch": 2665} {"train_loss": -43.998390197753906, "global_step": 322502, "epoch": 2665} {"train_loss": -43.71195602416992, "global_step": 322503, "epoch": 2665} {"train_loss": -43.690364837646484, "global_step": 322504, "epoch": 2665} {"train_loss": -40.34769821166992, "global_step": 322505, "epoch": 2665} {"train_loss": -43.35736846923828, "global_step": 322506, "epoch": 2665} {"train_loss": -44.14918518066406, "global_step": 322507, "epoch": 2665} {"train_loss": -43.05575180053711, "global_step": 322508, "epoch": 2665} {"train_loss": -43.282958984375, "global_step": 322509, "epoch": 2665} {"train_loss": -44.50654220581055, "global_step": 322510, "epoch": 2665} {"train_loss": -42.78559494018555, "global_step": 322511, "epoch": 2665} {"train_loss": -43.82401657104492, "global_step": 322512, "epoch": 2665} {"train_loss": -44.52133560180664, "global_step": 322513, "epoch": 2665} {"train_loss": -44.19255447387695, "global_step": 322514, "epoch": 2665} {"train_loss": -44.06633377075195, "global_step": 322515, "epoch": 2665} {"train_loss": -44.40681076049805, "global_step": 322516, "epoch": 2665} {"train_loss": -44.036251068115234, "global_step": 322517, "epoch": 2665} {"train_loss": -44.324459075927734, "global_step": 322518, "epoch": 2665} {"train_loss": -44.338539123535156, "global_step": 322519, "epoch": 2665} {"train_loss": -43.72866439819336, "global_step": 322520, "epoch": 2665} {"train_loss": -44.814361572265625, "global_step": 322521, "epoch": 2665} {"train_loss": -42.49961471557617, "global_step": 322522, "epoch": 2665} {"train_loss": -43.39810562133789, "global_step": 322523, "epoch": 2665} {"train_loss": -44.14664840698242, "global_step": 322524, "epoch": 2665} {"train_loss": -42.31802749633789, "global_step": 322525, "epoch": 2665} {"train_loss": -44.015357971191406, "global_step": 322526, "epoch": 2665} {"train_loss": -42.5020637512207, "global_step": 322527, "epoch": 2665} {"train_loss": -41.8809700012207, "global_step": 322528, "epoch": 2665} {"train_loss": -43.58960723876953, "global_step": 322529, "epoch": 2665} {"train_loss": -44.094642639160156, "global_step": 322530, "epoch": 2665} {"train_loss": -43.77759552001953, "global_step": 322531, "epoch": 2665} {"train_loss": -43.49045944213867, "global_step": 322532, "epoch": 2665} {"train_loss": -44.10174560546875, "global_step": 322533, "epoch": 2665} {"train_loss": -44.56312942504883, "global_step": 322534, "epoch": 2665} {"train_loss": -44.17110824584961, "global_step": 322535, "epoch": 2665} {"train_loss": -43.74674606323242, "global_step": 322536, "epoch": 2665} {"train_loss": -43.07120895385742, "global_step": 322537, "epoch": 2665} {"train_loss": -44.79158020019531, "global_step": 322538, "epoch": 2665} {"train_loss": -44.1597900390625, "global_step": 322539, "epoch": 2665} {"train_loss": -44.073238372802734, "global_step": 322540, "epoch": 2665} {"train_loss": -43.92769241333008, "global_step": 322541, "epoch": 2665} {"train_loss": -44.418212890625, "global_step": 322542, "epoch": 2665} {"train_loss": -44.15399932861328, "global_step": 322543, "epoch": 2665} {"train_loss": -44.13279342651367, "global_step": 322544, "epoch": 2665} {"train_loss": -44.24628829956055, "global_step": 322545, "epoch": 2665} {"train_loss": -44.081642150878906, "global_step": 322546, "epoch": 2665} {"train_loss": -44.27790069580078, "global_step": 322547, "epoch": 2665} {"train_loss": -44.63748550415039, "global_step": 322548, "epoch": 2665} {"train_loss": -44.672054290771484, "global_step": 322549, "epoch": 2665} {"train_loss": -44.79420852661133, "global_step": 322550, "epoch": 2665} {"train_loss": -44.462432861328125, "global_step": 322551, "epoch": 2665} {"train_loss": -44.573238372802734, "global_step": 322552, "epoch": 2665} {"train_loss": -44.86257553100586, "global_step": 322553, "epoch": 2665} {"train_loss": -44.284759521484375, "global_step": 322554, "epoch": 2665} {"train_loss": -44.74653244018555, "global_step": 322555, "epoch": 2665} {"train_loss": -43.99558639526367, "global_step": 322556, "epoch": 2665} {"train_loss": -44.807716369628906, "global_step": 322557, "epoch": 2665} {"train_loss": -43.67885971069336, "global_step": 322558, "epoch": 2665} {"train_loss": -43.154354095458984, "global_step": 322559, "epoch": 2665} {"train_loss": -44.11484909057617, "global_step": 322560, "epoch": 2665} {"train_loss": -44.00982666015625, "global_step": 322561, "epoch": 2665} {"train_loss": -43.8733024597168, "global_step": 322562, "epoch": 2665} {"train_loss": -42.685882568359375, "global_step": 322563, "epoch": 2665} {"train_loss": -42.749855041503906, "global_step": 322564, "epoch": 2665} {"train_loss": -42.794246673583984, "global_step": 322565, "epoch": 2665} {"train_loss": -43.124244689941406, "global_step": 322566, "epoch": 2665} {"train_loss": -44.06509017944336, "global_step": 322567, "epoch": 2665} {"train_loss": -42.88365936279297, "global_step": 322568, "epoch": 2665} {"train_loss": -43.94649887084961, "global_step": 322569, "epoch": 2665} {"train_loss": -44.231666564941406, "global_step": 322570, "epoch": 2665} {"train_loss": -44.1448974609375, "global_step": 322571, "epoch": 2665} {"train_loss": -44.0275764465332, "global_step": 322572, "epoch": 2665} {"train_loss": -43.2729377746582, "global_step": 322573, "epoch": 2665} {"train_loss": -43.51212692260742, "global_step": 322574, "epoch": 2665} {"train_loss": -43.796234130859375, "global_step": 322575, "epoch": 2665} {"train_loss": -43.58393096923828, "global_step": 322576, "epoch": 2665} {"train_loss": -44.52463912963867, "global_step": 322577, "epoch": 2665} {"train_loss": -42.5514030456543, "global_step": 322578, "epoch": 2665} {"train_loss": -44.62522506713867, "global_step": 322579, "epoch": 2665} {"train_loss": -43.90473556518555, "global_step": 322580, "epoch": 2665} {"train_loss": -41.56439971923828, "global_step": 322581, "epoch": 2665} {"train_loss": -44.62370681762695, "global_step": 322582, "epoch": 2665} {"train_loss": -43.487388610839844, "global_step": 322583, "epoch": 2665} {"train_loss": -43.16788864135742, "global_step": 322584, "epoch": 2665} {"train_loss": -43.886011297052555, "global_step": 322585, "epoch": 2665, "val_loss": 2687628.75} {"train_loss": -42.17448806762695, "global_step": 322586, "epoch": 2666} {"train_loss": -44.21797561645508, "global_step": 322587, "epoch": 2666} {"train_loss": -42.184410095214844, "global_step": 322588, "epoch": 2666} {"train_loss": -41.0189094543457, "global_step": 322589, "epoch": 2666} {"train_loss": -44.164466857910156, "global_step": 322590, "epoch": 2666} {"train_loss": -40.85354232788086, "global_step": 322591, "epoch": 2666} {"train_loss": -44.120052337646484, "global_step": 322592, "epoch": 2666} {"train_loss": -41.95003890991211, "global_step": 322593, "epoch": 2666} {"train_loss": -42.69440841674805, "global_step": 322594, "epoch": 2666} {"train_loss": -43.04021453857422, "global_step": 322595, "epoch": 2666} {"train_loss": -42.945716857910156, "global_step": 322596, "epoch": 2666} {"train_loss": -43.39723587036133, "global_step": 322597, "epoch": 2666} {"train_loss": -42.214481353759766, "global_step": 322598, "epoch": 2666} {"train_loss": -43.85416793823242, "global_step": 322599, "epoch": 2666} {"train_loss": -43.017372131347656, "global_step": 322600, "epoch": 2666} {"train_loss": -44.093116760253906, "global_step": 322601, "epoch": 2666} {"train_loss": -42.799537658691406, "global_step": 322602, "epoch": 2666} {"train_loss": -43.81715774536133, "global_step": 322603, "epoch": 2666} {"train_loss": -43.42594528198242, "global_step": 322604, "epoch": 2666} {"train_loss": -42.840240478515625, "global_step": 322605, "epoch": 2666} {"train_loss": -42.27885055541992, "global_step": 322606, "epoch": 2666} {"train_loss": -43.769866943359375, "global_step": 322607, "epoch": 2666} {"train_loss": -42.557701110839844, "global_step": 322608, "epoch": 2666} {"train_loss": -42.07762145996094, "global_step": 322609, "epoch": 2666} {"train_loss": -43.403987884521484, "global_step": 322610, "epoch": 2666} {"train_loss": -42.87913131713867, "global_step": 322611, "epoch": 2666} {"train_loss": -43.83749008178711, "global_step": 322612, "epoch": 2666} {"train_loss": -42.236000061035156, "global_step": 322613, "epoch": 2666} {"train_loss": -44.08171463012695, "global_step": 322614, "epoch": 2666} {"train_loss": -42.673824310302734, "global_step": 322615, "epoch": 2666} {"train_loss": -43.79465866088867, "global_step": 322616, "epoch": 2666} {"train_loss": -43.0792350769043, "global_step": 322617, "epoch": 2666} {"train_loss": -43.01146697998047, "global_step": 322618, "epoch": 2666} {"train_loss": -43.3252067565918, "global_step": 322619, "epoch": 2666} {"train_loss": -43.69142532348633, "global_step": 322620, "epoch": 2666} {"train_loss": -43.66787338256836, "global_step": 322621, "epoch": 2666} {"train_loss": -43.70948791503906, "global_step": 322622, "epoch": 2666} {"train_loss": -44.148223876953125, "global_step": 322623, "epoch": 2666} {"train_loss": -44.30103302001953, "global_step": 322624, "epoch": 2666} {"train_loss": -44.20772171020508, "global_step": 322625, "epoch": 2666} {"train_loss": -44.25994110107422, "global_step": 322626, "epoch": 2666} {"train_loss": -44.509315490722656, "global_step": 322627, "epoch": 2666} {"train_loss": -44.50571823120117, "global_step": 322628, "epoch": 2666} {"train_loss": -44.786441802978516, "global_step": 322629, "epoch": 2666} {"train_loss": -44.730472564697266, "global_step": 322630, "epoch": 2666} {"train_loss": -44.670989990234375, "global_step": 322631, "epoch": 2666} {"train_loss": -44.49900436401367, "global_step": 322632, "epoch": 2666} {"train_loss": -44.932064056396484, "global_step": 322633, "epoch": 2666} {"train_loss": -44.67020034790039, "global_step": 322634, "epoch": 2666} {"train_loss": -44.993865966796875, "global_step": 322635, "epoch": 2666} {"train_loss": -44.97892379760742, "global_step": 322636, "epoch": 2666} {"train_loss": -44.845787048339844, "global_step": 322637, "epoch": 2666} {"train_loss": -44.710784912109375, "global_step": 322638, "epoch": 2666} {"train_loss": -45.04457473754883, "global_step": 322639, "epoch": 2666} {"train_loss": -45.060516357421875, "global_step": 322640, "epoch": 2666} {"train_loss": -45.06290054321289, "global_step": 322641, "epoch": 2666} {"train_loss": -44.86438751220703, "global_step": 322642, "epoch": 2666} {"train_loss": -44.894813537597656, "global_step": 322643, "epoch": 2666} {"train_loss": -45.29647445678711, "global_step": 322644, "epoch": 2666} {"train_loss": -45.0770149230957, "global_step": 322645, "epoch": 2666} {"train_loss": -45.1441650390625, "global_step": 322646, "epoch": 2666} {"train_loss": -45.078556060791016, "global_step": 322647, "epoch": 2666} {"train_loss": -45.325496673583984, "global_step": 322648, "epoch": 2666} {"train_loss": -44.68121337890625, "global_step": 322649, "epoch": 2666} {"train_loss": -45.539730072021484, "global_step": 322650, "epoch": 2666} {"train_loss": -45.0787239074707, "global_step": 322651, "epoch": 2666} {"train_loss": -44.31333923339844, "global_step": 322652, "epoch": 2666} {"train_loss": -43.52728271484375, "global_step": 322653, "epoch": 2666} {"train_loss": -45.36932373046875, "global_step": 322654, "epoch": 2666} {"train_loss": -44.5714225769043, "global_step": 322655, "epoch": 2666} {"train_loss": -44.629798889160156, "global_step": 322656, "epoch": 2666} {"train_loss": -43.917789459228516, "global_step": 322657, "epoch": 2666} {"train_loss": -44.82766342163086, "global_step": 322658, "epoch": 2666} {"train_loss": -44.158260345458984, "global_step": 322659, "epoch": 2666} {"train_loss": -43.49203109741211, "global_step": 322660, "epoch": 2666} {"train_loss": -43.25275802612305, "global_step": 322661, "epoch": 2666} {"train_loss": -44.64287185668945, "global_step": 322662, "epoch": 2666} {"train_loss": -44.62275314331055, "global_step": 322663, "epoch": 2666} {"train_loss": -44.03981018066406, "global_step": 322664, "epoch": 2666} {"train_loss": -43.77719497680664, "global_step": 322665, "epoch": 2666} {"train_loss": -43.52259063720703, "global_step": 322666, "epoch": 2666} {"train_loss": -44.23865509033203, "global_step": 322667, "epoch": 2666} {"train_loss": -44.273841857910156, "global_step": 322668, "epoch": 2666} {"train_loss": -44.373226165771484, "global_step": 322669, "epoch": 2666} {"train_loss": -44.37846755981445, "global_step": 322670, "epoch": 2666} {"train_loss": -44.43361282348633, "global_step": 322671, "epoch": 2666} {"train_loss": -44.47237777709961, "global_step": 322672, "epoch": 2666} {"train_loss": -45.4766960144043, "global_step": 322673, "epoch": 2666} {"train_loss": -44.47994613647461, "global_step": 322674, "epoch": 2666} {"train_loss": -43.27387237548828, "global_step": 322675, "epoch": 2666} {"train_loss": -44.37117385864258, "global_step": 322676, "epoch": 2666} {"train_loss": -44.78831481933594, "global_step": 322677, "epoch": 2666} {"train_loss": -44.1034049987793, "global_step": 322678, "epoch": 2666} {"train_loss": -44.598365783691406, "global_step": 322679, "epoch": 2666} {"train_loss": -45.28023147583008, "global_step": 322680, "epoch": 2666} {"train_loss": -44.5528450012207, "global_step": 322681, "epoch": 2666} {"train_loss": -44.0445556640625, "global_step": 322682, "epoch": 2666} {"train_loss": -44.534427642822266, "global_step": 322683, "epoch": 2666} {"train_loss": -44.76123046875, "global_step": 322684, "epoch": 2666} {"train_loss": -44.653316497802734, "global_step": 322685, "epoch": 2666} {"train_loss": -43.29283142089844, "global_step": 322686, "epoch": 2666} {"train_loss": -43.72322082519531, "global_step": 322687, "epoch": 2666} {"train_loss": -44.03562545776367, "global_step": 322688, "epoch": 2666} {"train_loss": -44.70542526245117, "global_step": 322689, "epoch": 2666} {"train_loss": -43.400634765625, "global_step": 322690, "epoch": 2666} {"train_loss": -43.77238845825195, "global_step": 322691, "epoch": 2666} {"train_loss": -43.6570930480957, "global_step": 322692, "epoch": 2666} {"train_loss": -43.790016174316406, "global_step": 322693, "epoch": 2666} {"train_loss": -44.90776824951172, "global_step": 322694, "epoch": 2666} {"train_loss": -44.74128723144531, "global_step": 322695, "epoch": 2666} {"train_loss": -44.314857482910156, "global_step": 322696, "epoch": 2666} {"train_loss": -44.66938018798828, "global_step": 322697, "epoch": 2666} {"train_loss": -45.20267868041992, "global_step": 322698, "epoch": 2666} {"train_loss": -44.89519119262695, "global_step": 322699, "epoch": 2666} {"train_loss": -44.46949005126953, "global_step": 322700, "epoch": 2666} {"train_loss": -44.88447952270508, "global_step": 322701, "epoch": 2666} {"train_loss": -44.75443649291992, "global_step": 322702, "epoch": 2666} {"train_loss": -44.73615264892578, "global_step": 322703, "epoch": 2666} {"train_loss": -45.33629608154297, "global_step": 322704, "epoch": 2666} {"train_loss": -44.7608757019043, "global_step": 322705, "epoch": 2666} {"train_loss": -44.07219156943077, "global_step": 322706, "epoch": 2666, "val_loss": 2885228.75} {"train_loss": -45.14157485961914, "global_step": 322707, "epoch": 2667} {"train_loss": -44.46355056762695, "global_step": 322708, "epoch": 2667} {"train_loss": -44.47487258911133, "global_step": 322709, "epoch": 2667} {"train_loss": -44.518917083740234, "global_step": 322710, "epoch": 2667} {"train_loss": -44.48280715942383, "global_step": 322711, "epoch": 2667} {"train_loss": -44.853816986083984, "global_step": 322712, "epoch": 2667} {"train_loss": -45.484161376953125, "global_step": 322713, "epoch": 2667} {"train_loss": -44.19219970703125, "global_step": 322714, "epoch": 2667} {"train_loss": -43.69242477416992, "global_step": 322715, "epoch": 2667} {"train_loss": -43.22643280029297, "global_step": 322716, "epoch": 2667} {"train_loss": -43.88572311401367, "global_step": 322717, "epoch": 2667} {"train_loss": -45.175228118896484, "global_step": 322718, "epoch": 2667} {"train_loss": -44.98573684692383, "global_step": 322719, "epoch": 2667} {"train_loss": -43.38924789428711, "global_step": 322720, "epoch": 2667} {"train_loss": -41.905555725097656, "global_step": 322721, "epoch": 2667} {"train_loss": -44.36506271362305, "global_step": 322722, "epoch": 2667} {"train_loss": -40.87062454223633, "global_step": 322723, "epoch": 2667} {"train_loss": -43.08600616455078, "global_step": 322724, "epoch": 2667} {"train_loss": -41.559051513671875, "global_step": 322725, "epoch": 2667} {"train_loss": -42.708892822265625, "global_step": 322726, "epoch": 2667} {"train_loss": -43.65049743652344, "global_step": 322727, "epoch": 2667} {"train_loss": -43.315494537353516, "global_step": 322728, "epoch": 2667} {"train_loss": -39.101314544677734, "global_step": 322729, "epoch": 2667} {"train_loss": -43.47736740112305, "global_step": 322730, "epoch": 2667} {"train_loss": -43.608970642089844, "global_step": 322731, "epoch": 2667} {"train_loss": -43.57126998901367, "global_step": 322732, "epoch": 2667} {"train_loss": -43.18895721435547, "global_step": 322733, "epoch": 2667} {"train_loss": -43.29934310913086, "global_step": 322734, "epoch": 2667} {"train_loss": -43.41044235229492, "global_step": 322735, "epoch": 2667} {"train_loss": -42.02591323852539, "global_step": 322736, "epoch": 2667} {"train_loss": -37.70368194580078, "global_step": 322737, "epoch": 2667} {"train_loss": -39.09841537475586, "global_step": 322738, "epoch": 2667} {"train_loss": -35.972652435302734, "global_step": 322739, "epoch": 2667} {"train_loss": -42.4661750793457, "global_step": 322740, "epoch": 2667} {"train_loss": -37.45071029663086, "global_step": 322741, "epoch": 2667} {"train_loss": -41.31803894042969, "global_step": 322742, "epoch": 2667} {"train_loss": -39.88845443725586, "global_step": 322743, "epoch": 2667} {"train_loss": -41.59906768798828, "global_step": 322744, "epoch": 2667} {"train_loss": -40.78763961791992, "global_step": 322745, "epoch": 2667} {"train_loss": -37.30320358276367, "global_step": 322746, "epoch": 2667} {"train_loss": -41.28184127807617, "global_step": 322747, "epoch": 2667} {"train_loss": -38.085994720458984, "global_step": 322748, "epoch": 2667} {"train_loss": -42.76585388183594, "global_step": 322749, "epoch": 2667} {"train_loss": -40.31074905395508, "global_step": 322750, "epoch": 2667} {"train_loss": -40.50979232788086, "global_step": 322751, "epoch": 2667} {"train_loss": -42.21564865112305, "global_step": 322752, "epoch": 2667} {"train_loss": -41.17967987060547, "global_step": 322753, "epoch": 2667} {"train_loss": -41.728477478027344, "global_step": 322754, "epoch": 2667} {"train_loss": -42.59400177001953, "global_step": 322755, "epoch": 2667} {"train_loss": -43.41902160644531, "global_step": 322756, "epoch": 2667} {"train_loss": -42.52251434326172, "global_step": 322757, "epoch": 2667} {"train_loss": -42.6228141784668, "global_step": 322758, "epoch": 2667} {"train_loss": -42.313560485839844, "global_step": 322759, "epoch": 2667} {"train_loss": -43.21403884887695, "global_step": 322760, "epoch": 2667} {"train_loss": -42.458187103271484, "global_step": 322761, "epoch": 2667} {"train_loss": -43.65163803100586, "global_step": 322762, "epoch": 2667} {"train_loss": -42.37762451171875, "global_step": 322763, "epoch": 2667} {"train_loss": -43.0169792175293, "global_step": 322764, "epoch": 2667} {"train_loss": -43.094764709472656, "global_step": 322765, "epoch": 2667} {"train_loss": -43.41811752319336, "global_step": 322766, "epoch": 2667} {"train_loss": -43.42081832885742, "global_step": 322767, "epoch": 2667} {"train_loss": -43.80183792114258, "global_step": 322768, "epoch": 2667} {"train_loss": -43.4470329284668, "global_step": 322769, "epoch": 2667} {"train_loss": -43.9177131652832, "global_step": 322770, "epoch": 2667} {"train_loss": -43.39045715332031, "global_step": 322771, "epoch": 2667} {"train_loss": -44.135929107666016, "global_step": 322772, "epoch": 2667} {"train_loss": -44.0969352722168, "global_step": 322773, "epoch": 2667} {"train_loss": -43.8001823425293, "global_step": 322774, "epoch": 2667} {"train_loss": -43.69554138183594, "global_step": 322775, "epoch": 2667} {"train_loss": -44.36790084838867, "global_step": 322776, "epoch": 2667} {"train_loss": -42.44316101074219, "global_step": 322777, "epoch": 2667} {"train_loss": -44.70087432861328, "global_step": 322778, "epoch": 2667} {"train_loss": -43.32392883300781, "global_step": 322779, "epoch": 2667} {"train_loss": -43.74686813354492, "global_step": 322780, "epoch": 2667} {"train_loss": -44.0507926940918, "global_step": 322781, "epoch": 2667} {"train_loss": -44.2632942199707, "global_step": 322782, "epoch": 2667} {"train_loss": -43.75779342651367, "global_step": 322783, "epoch": 2667} {"train_loss": -44.50278854370117, "global_step": 322784, "epoch": 2667} {"train_loss": -44.15720748901367, "global_step": 322785, "epoch": 2667} {"train_loss": -43.63521194458008, "global_step": 322786, "epoch": 2667} {"train_loss": -44.01067352294922, "global_step": 322787, "epoch": 2667} {"train_loss": -44.562522888183594, "global_step": 322788, "epoch": 2667} {"train_loss": -43.817962646484375, "global_step": 322789, "epoch": 2667} {"train_loss": -44.544647216796875, "global_step": 322790, "epoch": 2667} {"train_loss": -44.542110443115234, "global_step": 322791, "epoch": 2667} {"train_loss": -44.7156982421875, "global_step": 322792, "epoch": 2667} {"train_loss": -44.79884338378906, "global_step": 322793, "epoch": 2667} {"train_loss": -45.23837661743164, "global_step": 322794, "epoch": 2667} {"train_loss": -44.303916931152344, "global_step": 322795, "epoch": 2667} {"train_loss": -44.713802337646484, "global_step": 322796, "epoch": 2667} {"train_loss": -44.851783752441406, "global_step": 322797, "epoch": 2667} {"train_loss": -45.45741653442383, "global_step": 322798, "epoch": 2667} {"train_loss": -44.796234130859375, "global_step": 322799, "epoch": 2667} {"train_loss": -44.76125717163086, "global_step": 322800, "epoch": 2667} {"train_loss": -45.212257385253906, "global_step": 322801, "epoch": 2667} {"train_loss": -45.122650146484375, "global_step": 322802, "epoch": 2667} {"train_loss": -44.973304748535156, "global_step": 322803, "epoch": 2667} {"train_loss": -45.19777297973633, "global_step": 322804, "epoch": 2667} {"train_loss": -45.5309944152832, "global_step": 322805, "epoch": 2667} {"train_loss": -45.29759216308594, "global_step": 322806, "epoch": 2667} {"train_loss": -44.831180572509766, "global_step": 322807, "epoch": 2667} {"train_loss": -45.118011474609375, "global_step": 322808, "epoch": 2667} {"train_loss": -44.29557418823242, "global_step": 322809, "epoch": 2667} {"train_loss": -44.85227584838867, "global_step": 322810, "epoch": 2667} {"train_loss": -45.01361846923828, "global_step": 322811, "epoch": 2667} {"train_loss": -45.360450744628906, "global_step": 322812, "epoch": 2667} {"train_loss": -44.620399475097656, "global_step": 322813, "epoch": 2667} {"train_loss": -45.03045654296875, "global_step": 322814, "epoch": 2667} {"train_loss": -45.67413330078125, "global_step": 322815, "epoch": 2667} {"train_loss": -45.74837112426758, "global_step": 322816, "epoch": 2667} {"train_loss": -45.189552307128906, "global_step": 322817, "epoch": 2667} {"train_loss": -45.23710250854492, "global_step": 322818, "epoch": 2667} {"train_loss": -45.328922271728516, "global_step": 322819, "epoch": 2667} {"train_loss": -45.02398681640625, "global_step": 322820, "epoch": 2667} {"train_loss": -44.76497268676758, "global_step": 322821, "epoch": 2667} {"train_loss": -45.60218048095703, "global_step": 322822, "epoch": 2667} {"train_loss": -45.25328826904297, "global_step": 322823, "epoch": 2667} {"train_loss": -45.053951263427734, "global_step": 322824, "epoch": 2667} {"train_loss": -45.68478775024414, "global_step": 322825, "epoch": 2667} {"train_loss": -44.7788200378418, "global_step": 322826, "epoch": 2667} {"train_loss": -43.48778294334727, "global_step": 322827, "epoch": 2667, "val_loss": 2666428.0} {"train_loss": -44.633113861083984, "global_step": 322828, "epoch": 2668} {"train_loss": -45.087554931640625, "global_step": 322829, "epoch": 2668} {"train_loss": -45.37388610839844, "global_step": 322830, "epoch": 2668} {"train_loss": -45.32630920410156, "global_step": 322831, "epoch": 2668} {"train_loss": -44.990882873535156, "global_step": 322832, "epoch": 2668} {"train_loss": -43.03843307495117, "global_step": 322833, "epoch": 2668} {"train_loss": -40.70034408569336, "global_step": 322834, "epoch": 2668} {"train_loss": -38.8652458190918, "global_step": 322835, "epoch": 2668} {"train_loss": -41.956565856933594, "global_step": 322836, "epoch": 2668} {"train_loss": -44.925445556640625, "global_step": 322837, "epoch": 2668} {"train_loss": -43.477943420410156, "global_step": 322838, "epoch": 2668} {"train_loss": -43.394710540771484, "global_step": 322839, "epoch": 2668} {"train_loss": -42.37004470825195, "global_step": 322840, "epoch": 2668} {"train_loss": -44.32558822631836, "global_step": 322841, "epoch": 2668} {"train_loss": -44.844818115234375, "global_step": 322842, "epoch": 2668} {"train_loss": -43.37738037109375, "global_step": 322843, "epoch": 2668} {"train_loss": -42.21267318725586, "global_step": 322844, "epoch": 2668} {"train_loss": -43.9493293762207, "global_step": 322845, "epoch": 2668} {"train_loss": -43.917579650878906, "global_step": 322846, "epoch": 2668} {"train_loss": -42.847469329833984, "global_step": 322847, "epoch": 2668} {"train_loss": -43.15530014038086, "global_step": 322848, "epoch": 2668} {"train_loss": -42.5011100769043, "global_step": 322849, "epoch": 2668} {"train_loss": -41.399349212646484, "global_step": 322850, "epoch": 2668} {"train_loss": -43.15351867675781, "global_step": 322851, "epoch": 2668} {"train_loss": -44.610595703125, "global_step": 322852, "epoch": 2668} {"train_loss": -41.43722152709961, "global_step": 322853, "epoch": 2668} {"train_loss": -43.942138671875, "global_step": 322854, "epoch": 2668} {"train_loss": -44.45017623901367, "global_step": 322855, "epoch": 2668} {"train_loss": -42.64848709106445, "global_step": 322856, "epoch": 2668} {"train_loss": -41.8734130859375, "global_step": 322857, "epoch": 2668} {"train_loss": -43.46759033203125, "global_step": 322858, "epoch": 2668} {"train_loss": -43.3775520324707, "global_step": 322859, "epoch": 2668} {"train_loss": -42.898216247558594, "global_step": 322860, "epoch": 2668} {"train_loss": -42.429725646972656, "global_step": 322861, "epoch": 2668} {"train_loss": -43.16960525512695, "global_step": 322862, "epoch": 2668} {"train_loss": -44.32981491088867, "global_step": 322863, "epoch": 2668} {"train_loss": -42.329750061035156, "global_step": 322864, "epoch": 2668} {"train_loss": -42.40703201293945, "global_step": 322865, "epoch": 2668} {"train_loss": -44.01227569580078, "global_step": 322866, "epoch": 2668} {"train_loss": -43.641963958740234, "global_step": 322867, "epoch": 2668} {"train_loss": -42.319393157958984, "global_step": 322868, "epoch": 2668} {"train_loss": -43.885440826416016, "global_step": 322869, "epoch": 2668} {"train_loss": -44.16423416137695, "global_step": 322870, "epoch": 2668} {"train_loss": -44.240291595458984, "global_step": 322871, "epoch": 2668} {"train_loss": -43.67073440551758, "global_step": 322872, "epoch": 2668} {"train_loss": -44.529563903808594, "global_step": 322873, "epoch": 2668} {"train_loss": -44.55636215209961, "global_step": 322874, "epoch": 2668} {"train_loss": -43.167030334472656, "global_step": 322875, "epoch": 2668} {"train_loss": -44.98031997680664, "global_step": 322876, "epoch": 2668} {"train_loss": -43.701148986816406, "global_step": 322877, "epoch": 2668} {"train_loss": -44.01630783081055, "global_step": 322878, "epoch": 2668} {"train_loss": -44.96207809448242, "global_step": 322879, "epoch": 2668} {"train_loss": -44.28977584838867, "global_step": 322880, "epoch": 2668} {"train_loss": -44.2454833984375, "global_step": 322881, "epoch": 2668} {"train_loss": -43.9973030090332, "global_step": 322882, "epoch": 2668} {"train_loss": -44.6027946472168, "global_step": 322883, "epoch": 2668} {"train_loss": -44.62324142456055, "global_step": 322884, "epoch": 2668} {"train_loss": -44.39548873901367, "global_step": 322885, "epoch": 2668} {"train_loss": -43.70555877685547, "global_step": 322886, "epoch": 2668} {"train_loss": -44.255638122558594, "global_step": 322887, "epoch": 2668} {"train_loss": -44.70785903930664, "global_step": 322888, "epoch": 2668} {"train_loss": -43.23690414428711, "global_step": 322889, "epoch": 2668} {"train_loss": -44.6619873046875, "global_step": 322890, "epoch": 2668} {"train_loss": -43.69869613647461, "global_step": 322891, "epoch": 2668} {"train_loss": -44.024574279785156, "global_step": 322892, "epoch": 2668} {"train_loss": -44.67346954345703, "global_step": 322893, "epoch": 2668} {"train_loss": -44.48460006713867, "global_step": 322894, "epoch": 2668} {"train_loss": -44.65018844604492, "global_step": 322895, "epoch": 2668} {"train_loss": -44.32149887084961, "global_step": 322896, "epoch": 2668} {"train_loss": -44.7235221862793, "global_step": 322897, "epoch": 2668} {"train_loss": -44.17824935913086, "global_step": 322898, "epoch": 2668} {"train_loss": -44.600074768066406, "global_step": 322899, "epoch": 2668} {"train_loss": -44.3769416809082, "global_step": 322900, "epoch": 2668} {"train_loss": -43.172306060791016, "global_step": 322901, "epoch": 2668} {"train_loss": -42.51953887939453, "global_step": 322902, "epoch": 2668} {"train_loss": -45.20658493041992, "global_step": 322903, "epoch": 2668} {"train_loss": -43.733028411865234, "global_step": 322904, "epoch": 2668} {"train_loss": -43.35636520385742, "global_step": 322905, "epoch": 2668} {"train_loss": -44.81362533569336, "global_step": 322906, "epoch": 2668} {"train_loss": -43.91493606567383, "global_step": 322907, "epoch": 2668} {"train_loss": -42.53352737426758, "global_step": 322908, "epoch": 2668} {"train_loss": -44.68292236328125, "global_step": 322909, "epoch": 2668} {"train_loss": -42.56489944458008, "global_step": 322910, "epoch": 2668} {"train_loss": -43.227294921875, "global_step": 322911, "epoch": 2668} {"train_loss": -45.4266357421875, "global_step": 322912, "epoch": 2668} {"train_loss": -42.782623291015625, "global_step": 322913, "epoch": 2668} {"train_loss": -42.89632034301758, "global_step": 322914, "epoch": 2668} {"train_loss": -44.814231872558594, "global_step": 322915, "epoch": 2668} {"train_loss": -43.994503021240234, "global_step": 322916, "epoch": 2668} {"train_loss": -43.75444412231445, "global_step": 322917, "epoch": 2668} {"train_loss": -44.55316925048828, "global_step": 322918, "epoch": 2668} {"train_loss": -43.50161361694336, "global_step": 322919, "epoch": 2668} {"train_loss": -44.07235336303711, "global_step": 322920, "epoch": 2668} {"train_loss": -44.37800216674805, "global_step": 322921, "epoch": 2668} {"train_loss": -44.2310676574707, "global_step": 322922, "epoch": 2668} {"train_loss": -44.1329345703125, "global_step": 322923, "epoch": 2668} {"train_loss": -43.473358154296875, "global_step": 322924, "epoch": 2668} {"train_loss": -43.5601921081543, "global_step": 322925, "epoch": 2668} {"train_loss": -43.44276809692383, "global_step": 322926, "epoch": 2668} {"train_loss": -42.99988555908203, "global_step": 322927, "epoch": 2668} {"train_loss": -43.717689514160156, "global_step": 322928, "epoch": 2668} {"train_loss": -44.414405822753906, "global_step": 322929, "epoch": 2668} {"train_loss": -42.9273567199707, "global_step": 322930, "epoch": 2668} {"train_loss": -44.205989837646484, "global_step": 322931, "epoch": 2668} {"train_loss": -44.101043701171875, "global_step": 322932, "epoch": 2668} {"train_loss": -43.77014923095703, "global_step": 322933, "epoch": 2668} {"train_loss": -44.282684326171875, "global_step": 322934, "epoch": 2668} {"train_loss": -44.44911575317383, "global_step": 322935, "epoch": 2668} {"train_loss": -44.16966247558594, "global_step": 322936, "epoch": 2668} {"train_loss": -44.398921966552734, "global_step": 322937, "epoch": 2668} {"train_loss": -44.905208587646484, "global_step": 322938, "epoch": 2668} {"train_loss": -44.67780303955078, "global_step": 322939, "epoch": 2668} {"train_loss": -44.564308166503906, "global_step": 322940, "epoch": 2668} {"train_loss": -44.62154769897461, "global_step": 322941, "epoch": 2668} {"train_loss": -44.609806060791016, "global_step": 322942, "epoch": 2668} {"train_loss": -44.61695098876953, "global_step": 322943, "epoch": 2668} {"train_loss": -44.421592712402344, "global_step": 322944, "epoch": 2668} {"train_loss": -44.456756591796875, "global_step": 322945, "epoch": 2668} {"train_loss": -45.14213180541992, "global_step": 322946, "epoch": 2668} {"train_loss": -44.33406066894531, "global_step": 322947, "epoch": 2668} {"train_loss": -43.822461687828884, "global_step": 322948, "epoch": 2668, "val_loss": 2714856.25} {"train_loss": -44.563716888427734, "global_step": 322949, "epoch": 2669} {"train_loss": -44.581634521484375, "global_step": 322950, "epoch": 2669} {"train_loss": -44.80203628540039, "global_step": 322951, "epoch": 2669} {"train_loss": -44.52532958984375, "global_step": 322952, "epoch": 2669} {"train_loss": -45.188350677490234, "global_step": 322953, "epoch": 2669} {"train_loss": -44.79634475708008, "global_step": 322954, "epoch": 2669} {"train_loss": -44.65229415893555, "global_step": 322955, "epoch": 2669} {"train_loss": -44.78678512573242, "global_step": 322956, "epoch": 2669} {"train_loss": -44.41550064086914, "global_step": 322957, "epoch": 2669} {"train_loss": -44.60950469970703, "global_step": 322958, "epoch": 2669} {"train_loss": -44.03505325317383, "global_step": 322959, "epoch": 2669} {"train_loss": -44.59983444213867, "global_step": 322960, "epoch": 2669} {"train_loss": -44.91134262084961, "global_step": 322961, "epoch": 2669} {"train_loss": -44.8930778503418, "global_step": 322962, "epoch": 2669} {"train_loss": -44.73220443725586, "global_step": 322963, "epoch": 2669} {"train_loss": -44.54177474975586, "global_step": 322964, "epoch": 2669} {"train_loss": -44.85906982421875, "global_step": 322965, "epoch": 2669} {"train_loss": -44.42318344116211, "global_step": 322966, "epoch": 2669} {"train_loss": -44.6754150390625, "global_step": 322967, "epoch": 2669} {"train_loss": -42.50691223144531, "global_step": 322968, "epoch": 2669} {"train_loss": -43.88882064819336, "global_step": 322969, "epoch": 2669} {"train_loss": -44.26047897338867, "global_step": 322970, "epoch": 2669} {"train_loss": -44.6026725769043, "global_step": 322971, "epoch": 2669} {"train_loss": -44.49387741088867, "global_step": 322972, "epoch": 2669} {"train_loss": -44.09303283691406, "global_step": 322973, "epoch": 2669} {"train_loss": -45.39738082885742, "global_step": 322974, "epoch": 2669} {"train_loss": -42.29474639892578, "global_step": 322975, "epoch": 2669} {"train_loss": -44.03478240966797, "global_step": 322976, "epoch": 2669} {"train_loss": -43.75293731689453, "global_step": 322977, "epoch": 2669} {"train_loss": -44.61396026611328, "global_step": 322978, "epoch": 2669} {"train_loss": -43.3527946472168, "global_step": 322979, "epoch": 2669} {"train_loss": -44.50774383544922, "global_step": 322980, "epoch": 2669} {"train_loss": -44.29069519042969, "global_step": 322981, "epoch": 2669} {"train_loss": -43.977508544921875, "global_step": 322982, "epoch": 2669} {"train_loss": -42.911407470703125, "global_step": 322983, "epoch": 2669} {"train_loss": -41.455135345458984, "global_step": 322984, "epoch": 2669} {"train_loss": -43.659942626953125, "global_step": 322985, "epoch": 2669} {"train_loss": -42.700984954833984, "global_step": 322986, "epoch": 2669} {"train_loss": -43.9763069152832, "global_step": 322987, "epoch": 2669} {"train_loss": -41.95768356323242, "global_step": 322988, "epoch": 2669} {"train_loss": -44.14785385131836, "global_step": 322989, "epoch": 2669} {"train_loss": -42.592071533203125, "global_step": 322990, "epoch": 2669} {"train_loss": -42.23762893676758, "global_step": 322991, "epoch": 2669} {"train_loss": -43.442623138427734, "global_step": 322992, "epoch": 2669} {"train_loss": -43.825130462646484, "global_step": 322993, "epoch": 2669} {"train_loss": -43.371429443359375, "global_step": 322994, "epoch": 2669} {"train_loss": -42.742286682128906, "global_step": 322995, "epoch": 2669} {"train_loss": -42.38262176513672, "global_step": 322996, "epoch": 2669} {"train_loss": -42.94767379760742, "global_step": 322997, "epoch": 2669} {"train_loss": -43.59603500366211, "global_step": 322998, "epoch": 2669} {"train_loss": -43.551937103271484, "global_step": 322999, "epoch": 2669} {"train_loss": -40.80483627319336, "global_step": 323000, "epoch": 2669} {"train_loss": -43.2015266418457, "global_step": 323001, "epoch": 2669} {"train_loss": -43.81857681274414, "global_step": 323002, "epoch": 2669} {"train_loss": -42.96260452270508, "global_step": 323003, "epoch": 2669} {"train_loss": -42.608009338378906, "global_step": 323004, "epoch": 2669} {"train_loss": -43.701751708984375, "global_step": 323005, "epoch": 2669} {"train_loss": -42.98628234863281, "global_step": 323006, "epoch": 2669} {"train_loss": -43.157440185546875, "global_step": 323007, "epoch": 2669} {"train_loss": -43.675270080566406, "global_step": 323008, "epoch": 2669} {"train_loss": -43.206459045410156, "global_step": 323009, "epoch": 2669} {"train_loss": -44.308223724365234, "global_step": 323010, "epoch": 2669} {"train_loss": -43.07870101928711, "global_step": 323011, "epoch": 2669} {"train_loss": -43.930171966552734, "global_step": 323012, "epoch": 2669} {"train_loss": -44.452754974365234, "global_step": 323013, "epoch": 2669} {"train_loss": -42.89052200317383, "global_step": 323014, "epoch": 2669} {"train_loss": -43.53746795654297, "global_step": 323015, "epoch": 2669} {"train_loss": -43.649078369140625, "global_step": 323016, "epoch": 2669} {"train_loss": -43.12800979614258, "global_step": 323017, "epoch": 2669} {"train_loss": -43.613460540771484, "global_step": 323018, "epoch": 2669} {"train_loss": -43.4948844909668, "global_step": 323019, "epoch": 2669} {"train_loss": -43.931209564208984, "global_step": 323020, "epoch": 2669} {"train_loss": -42.62897872924805, "global_step": 323021, "epoch": 2669} {"train_loss": -44.09577941894531, "global_step": 323022, "epoch": 2669} {"train_loss": -42.717464447021484, "global_step": 323023, "epoch": 2669} {"train_loss": -43.78813552856445, "global_step": 323024, "epoch": 2669} {"train_loss": -44.15039825439453, "global_step": 323025, "epoch": 2669} {"train_loss": -42.674495697021484, "global_step": 323026, "epoch": 2669} {"train_loss": -44.169769287109375, "global_step": 323027, "epoch": 2669} {"train_loss": -43.62720489501953, "global_step": 323028, "epoch": 2669} {"train_loss": -42.81934356689453, "global_step": 323029, "epoch": 2669} {"train_loss": -44.657989501953125, "global_step": 323030, "epoch": 2669} {"train_loss": -43.05554962158203, "global_step": 323031, "epoch": 2669} {"train_loss": -43.78268814086914, "global_step": 323032, "epoch": 2669} {"train_loss": -44.269283294677734, "global_step": 323033, "epoch": 2669} {"train_loss": -44.36884689331055, "global_step": 323034, "epoch": 2669} {"train_loss": -44.10350036621094, "global_step": 323035, "epoch": 2669} {"train_loss": -44.45469284057617, "global_step": 323036, "epoch": 2669} {"train_loss": -43.8062629699707, "global_step": 323037, "epoch": 2669} {"train_loss": -44.9000358581543, "global_step": 323038, "epoch": 2669} {"train_loss": -43.77157211303711, "global_step": 323039, "epoch": 2669} {"train_loss": -43.34807586669922, "global_step": 323040, "epoch": 2669} {"train_loss": -44.05046844482422, "global_step": 323041, "epoch": 2669} {"train_loss": -44.42321014404297, "global_step": 323042, "epoch": 2669} {"train_loss": -44.64659118652344, "global_step": 323043, "epoch": 2669} {"train_loss": -43.9491081237793, "global_step": 323044, "epoch": 2669} {"train_loss": -44.648292541503906, "global_step": 323045, "epoch": 2669} {"train_loss": -44.26314926147461, "global_step": 323046, "epoch": 2669} {"train_loss": -44.304195404052734, "global_step": 323047, "epoch": 2669} {"train_loss": -44.01640319824219, "global_step": 323048, "epoch": 2669} {"train_loss": -44.5998420715332, "global_step": 323049, "epoch": 2669} {"train_loss": -44.0435676574707, "global_step": 323050, "epoch": 2669} {"train_loss": -43.812957763671875, "global_step": 323051, "epoch": 2669} {"train_loss": -43.98643112182617, "global_step": 323052, "epoch": 2669} {"train_loss": -44.71210861206055, "global_step": 323053, "epoch": 2669} {"train_loss": -43.704833984375, "global_step": 323054, "epoch": 2669} {"train_loss": -44.50008010864258, "global_step": 323055, "epoch": 2669} {"train_loss": -44.36385726928711, "global_step": 323056, "epoch": 2669} {"train_loss": -43.92238235473633, "global_step": 323057, "epoch": 2669} {"train_loss": -44.64009094238281, "global_step": 323058, "epoch": 2669} {"train_loss": -45.018524169921875, "global_step": 323059, "epoch": 2669} {"train_loss": -44.63296127319336, "global_step": 323060, "epoch": 2669} {"train_loss": -44.103939056396484, "global_step": 323061, "epoch": 2669} {"train_loss": -43.87113571166992, "global_step": 323062, "epoch": 2669} {"train_loss": -45.051177978515625, "global_step": 323063, "epoch": 2669} {"train_loss": -44.56441116333008, "global_step": 323064, "epoch": 2669} {"train_loss": -45.00798034667969, "global_step": 323065, "epoch": 2669} {"train_loss": -45.10139846801758, "global_step": 323066, "epoch": 2669} {"train_loss": -44.391231536865234, "global_step": 323067, "epoch": 2669} {"train_loss": -45.27321243286133, "global_step": 323068, "epoch": 2669} {"train_loss": -43.90715433546334, "global_step": 323069, "epoch": 2669, "val_loss": 2683478.75} {"train_loss": -44.638729095458984, "global_step": 323070, "epoch": 2670} {"train_loss": -42.64970016479492, "global_step": 323071, "epoch": 2670} {"train_loss": -43.997310638427734, "global_step": 323072, "epoch": 2670} {"train_loss": -44.22095489501953, "global_step": 323073, "epoch": 2670} {"train_loss": -44.362022399902344, "global_step": 323074, "epoch": 2670} {"train_loss": -44.22370147705078, "global_step": 323075, "epoch": 2670} {"train_loss": -43.871028900146484, "global_step": 323076, "epoch": 2670} {"train_loss": -43.940738677978516, "global_step": 323077, "epoch": 2670} {"train_loss": -42.64027786254883, "global_step": 323078, "epoch": 2670} {"train_loss": -44.76510238647461, "global_step": 323079, "epoch": 2670} {"train_loss": -44.00649642944336, "global_step": 323080, "epoch": 2670} {"train_loss": -45.12739944458008, "global_step": 323081, "epoch": 2670} {"train_loss": -43.849727630615234, "global_step": 323082, "epoch": 2670} {"train_loss": -44.63395309448242, "global_step": 323083, "epoch": 2670} {"train_loss": -43.61037826538086, "global_step": 323084, "epoch": 2670} {"train_loss": -44.413875579833984, "global_step": 323085, "epoch": 2670} {"train_loss": -44.5640983581543, "global_step": 323086, "epoch": 2670} {"train_loss": -44.33425521850586, "global_step": 323087, "epoch": 2670} {"train_loss": -44.53444290161133, "global_step": 323088, "epoch": 2670} {"train_loss": -43.88057327270508, "global_step": 323089, "epoch": 2670} {"train_loss": -43.836334228515625, "global_step": 323090, "epoch": 2670} {"train_loss": -43.39876937866211, "global_step": 323091, "epoch": 2670} {"train_loss": -42.44868087768555, "global_step": 323092, "epoch": 2670} {"train_loss": -44.276302337646484, "global_step": 323093, "epoch": 2670} {"train_loss": -43.588497161865234, "global_step": 323094, "epoch": 2670} {"train_loss": -42.956092834472656, "global_step": 323095, "epoch": 2670} {"train_loss": -43.166290283203125, "global_step": 323096, "epoch": 2670} {"train_loss": -44.58088684082031, "global_step": 323097, "epoch": 2670} {"train_loss": -43.65653991699219, "global_step": 323098, "epoch": 2670} {"train_loss": -44.49647903442383, "global_step": 323099, "epoch": 2670} {"train_loss": -43.668251037597656, "global_step": 323100, "epoch": 2670} {"train_loss": -44.65900802612305, "global_step": 323101, "epoch": 2670} {"train_loss": -44.444252014160156, "global_step": 323102, "epoch": 2670} {"train_loss": -43.368682861328125, "global_step": 323103, "epoch": 2670} {"train_loss": -43.725555419921875, "global_step": 323104, "epoch": 2670} {"train_loss": -43.703487396240234, "global_step": 323105, "epoch": 2670} {"train_loss": -42.57686233520508, "global_step": 323106, "epoch": 2670} {"train_loss": -42.81248092651367, "global_step": 323107, "epoch": 2670} {"train_loss": -43.722591400146484, "global_step": 323108, "epoch": 2670} {"train_loss": -43.93589401245117, "global_step": 323109, "epoch": 2670} {"train_loss": -43.01186752319336, "global_step": 323110, "epoch": 2670} {"train_loss": -43.99730682373047, "global_step": 323111, "epoch": 2670} {"train_loss": -43.65714645385742, "global_step": 323112, "epoch": 2670} {"train_loss": -44.047080993652344, "global_step": 323113, "epoch": 2670} {"train_loss": -43.23099899291992, "global_step": 323114, "epoch": 2670} {"train_loss": -44.593692779541016, "global_step": 323115, "epoch": 2670} {"train_loss": -44.42287826538086, "global_step": 323116, "epoch": 2670} {"train_loss": -42.36932373046875, "global_step": 323117, "epoch": 2670} {"train_loss": -43.19074249267578, "global_step": 323118, "epoch": 2670} {"train_loss": -43.98228454589844, "global_step": 323119, "epoch": 2670} {"train_loss": -43.93111801147461, "global_step": 323120, "epoch": 2670} {"train_loss": -44.477264404296875, "global_step": 323121, "epoch": 2670} {"train_loss": -43.331478118896484, "global_step": 323122, "epoch": 2670} {"train_loss": -43.717525482177734, "global_step": 323123, "epoch": 2670} {"train_loss": -43.74266815185547, "global_step": 323124, "epoch": 2670} {"train_loss": -43.92980194091797, "global_step": 323125, "epoch": 2670} {"train_loss": -44.85830307006836, "global_step": 323126, "epoch": 2670} {"train_loss": -44.26317596435547, "global_step": 323127, "epoch": 2670} {"train_loss": -43.01567840576172, "global_step": 323128, "epoch": 2670} {"train_loss": -44.75635528564453, "global_step": 323129, "epoch": 2670} {"train_loss": -43.69880294799805, "global_step": 323130, "epoch": 2670} {"train_loss": -41.13043975830078, "global_step": 323131, "epoch": 2670} {"train_loss": -42.059471130371094, "global_step": 323132, "epoch": 2670} {"train_loss": -44.60163116455078, "global_step": 323133, "epoch": 2670} {"train_loss": -42.5205078125, "global_step": 323134, "epoch": 2670} {"train_loss": -42.679603576660156, "global_step": 323135, "epoch": 2670} {"train_loss": -44.611507415771484, "global_step": 323136, "epoch": 2670} {"train_loss": -44.53083038330078, "global_step": 323137, "epoch": 2670} {"train_loss": -42.64863967895508, "global_step": 323138, "epoch": 2670} {"train_loss": -43.33214569091797, "global_step": 323139, "epoch": 2670} {"train_loss": -44.09955596923828, "global_step": 323140, "epoch": 2670} {"train_loss": -43.858001708984375, "global_step": 323141, "epoch": 2670} {"train_loss": -44.122169494628906, "global_step": 323142, "epoch": 2670} {"train_loss": -44.2233772277832, "global_step": 323143, "epoch": 2670} {"train_loss": -44.90721130371094, "global_step": 323144, "epoch": 2670} {"train_loss": -44.1362419128418, "global_step": 323145, "epoch": 2670} {"train_loss": -44.974876403808594, "global_step": 323146, "epoch": 2670} {"train_loss": -44.09430694580078, "global_step": 323147, "epoch": 2670} {"train_loss": -44.66444778442383, "global_step": 323148, "epoch": 2670} {"train_loss": -44.98090744018555, "global_step": 323149, "epoch": 2670} {"train_loss": -44.42787551879883, "global_step": 323150, "epoch": 2670} {"train_loss": -44.66019058227539, "global_step": 323151, "epoch": 2670} {"train_loss": -45.26039505004883, "global_step": 323152, "epoch": 2670} {"train_loss": -44.828102111816406, "global_step": 323153, "epoch": 2670} {"train_loss": -44.72127151489258, "global_step": 323154, "epoch": 2670} {"train_loss": -44.4466438293457, "global_step": 323155, "epoch": 2670} {"train_loss": -43.95534896850586, "global_step": 323156, "epoch": 2670} {"train_loss": -43.59545135498047, "global_step": 323157, "epoch": 2670} {"train_loss": -44.56834030151367, "global_step": 323158, "epoch": 2670} {"train_loss": -43.66665267944336, "global_step": 323159, "epoch": 2670} {"train_loss": -39.099082946777344, "global_step": 323160, "epoch": 2670} {"train_loss": -39.70272445678711, "global_step": 323161, "epoch": 2670} {"train_loss": -41.933349609375, "global_step": 323162, "epoch": 2670} {"train_loss": -43.59733200073242, "global_step": 323163, "epoch": 2670} {"train_loss": -43.22831344604492, "global_step": 323164, "epoch": 2670} {"train_loss": -40.3049430847168, "global_step": 323165, "epoch": 2670} {"train_loss": -38.36932373046875, "global_step": 323166, "epoch": 2670} {"train_loss": -42.40810012817383, "global_step": 323167, "epoch": 2670} {"train_loss": -43.57357406616211, "global_step": 323168, "epoch": 2670} {"train_loss": -42.5874137878418, "global_step": 323169, "epoch": 2670} {"train_loss": -42.620582580566406, "global_step": 323170, "epoch": 2670} {"train_loss": -41.964996337890625, "global_step": 323171, "epoch": 2670} {"train_loss": -41.299556732177734, "global_step": 323172, "epoch": 2670} {"train_loss": -43.810646057128906, "global_step": 323173, "epoch": 2670} {"train_loss": -41.50545883178711, "global_step": 323174, "epoch": 2670} {"train_loss": -42.14650344848633, "global_step": 323175, "epoch": 2670} {"train_loss": -41.82365798950195, "global_step": 323176, "epoch": 2670} {"train_loss": -41.87945556640625, "global_step": 323177, "epoch": 2670} {"train_loss": -41.62361526489258, "global_step": 323178, "epoch": 2670} {"train_loss": -42.8486213684082, "global_step": 323179, "epoch": 2670} {"train_loss": -43.88257598876953, "global_step": 323180, "epoch": 2670} {"train_loss": -42.671382904052734, "global_step": 323181, "epoch": 2670} {"train_loss": -42.506134033203125, "global_step": 323182, "epoch": 2670} {"train_loss": -43.77037048339844, "global_step": 323183, "epoch": 2670} {"train_loss": -42.8873405456543, "global_step": 323184, "epoch": 2670} {"train_loss": -42.529476165771484, "global_step": 323185, "epoch": 2670} {"train_loss": -43.380699157714844, "global_step": 323186, "epoch": 2670} {"train_loss": -42.21235275268555, "global_step": 323187, "epoch": 2670} {"train_loss": -43.33234786987305, "global_step": 323188, "epoch": 2670} {"train_loss": -42.45901107788086, "global_step": 323189, "epoch": 2670} {"train_loss": -43.476259247330596, "global_step": 323190, "epoch": 2670, "val_loss": 2726434.75} {"train_loss": -43.39803695678711, "global_step": 323191, "epoch": 2671} {"train_loss": -43.39211654663086, "global_step": 323192, "epoch": 2671} {"train_loss": -43.48905563354492, "global_step": 323193, "epoch": 2671} {"train_loss": -44.012996673583984, "global_step": 323194, "epoch": 2671} {"train_loss": -43.03394317626953, "global_step": 323195, "epoch": 2671} {"train_loss": -42.749114990234375, "global_step": 323196, "epoch": 2671} {"train_loss": -43.57956314086914, "global_step": 323197, "epoch": 2671} {"train_loss": -44.34529495239258, "global_step": 323198, "epoch": 2671} {"train_loss": -43.574554443359375, "global_step": 323199, "epoch": 2671} {"train_loss": -43.6135368347168, "global_step": 323200, "epoch": 2671} {"train_loss": -43.80031967163086, "global_step": 323201, "epoch": 2671} {"train_loss": -43.0760383605957, "global_step": 323202, "epoch": 2671} {"train_loss": -42.90232849121094, "global_step": 323203, "epoch": 2671} {"train_loss": -43.218833923339844, "global_step": 323204, "epoch": 2671} {"train_loss": -43.50642776489258, "global_step": 323205, "epoch": 2671} {"train_loss": -43.13866424560547, "global_step": 323206, "epoch": 2671} {"train_loss": -42.8742561340332, "global_step": 323207, "epoch": 2671} {"train_loss": -43.65742874145508, "global_step": 323208, "epoch": 2671} {"train_loss": -44.23102951049805, "global_step": 323209, "epoch": 2671} {"train_loss": -42.99081802368164, "global_step": 323210, "epoch": 2671} {"train_loss": -44.08991241455078, "global_step": 323211, "epoch": 2671} {"train_loss": -43.8195915222168, "global_step": 323212, "epoch": 2671} {"train_loss": -44.16896438598633, "global_step": 323213, "epoch": 2671} {"train_loss": -43.764930725097656, "global_step": 323214, "epoch": 2671} {"train_loss": -44.00495529174805, "global_step": 323215, "epoch": 2671} {"train_loss": -44.25695037841797, "global_step": 323216, "epoch": 2671} {"train_loss": -44.54399490356445, "global_step": 323217, "epoch": 2671} {"train_loss": -44.38991928100586, "global_step": 323218, "epoch": 2671} {"train_loss": -44.08439254760742, "global_step": 323219, "epoch": 2671} {"train_loss": -44.322898864746094, "global_step": 323220, "epoch": 2671} {"train_loss": -44.646095275878906, "global_step": 323221, "epoch": 2671} {"train_loss": -44.64582443237305, "global_step": 323222, "epoch": 2671} {"train_loss": -44.99746322631836, "global_step": 323223, "epoch": 2671} {"train_loss": -44.634742736816406, "global_step": 323224, "epoch": 2671} {"train_loss": -44.90561294555664, "global_step": 323225, "epoch": 2671} {"train_loss": -45.090816497802734, "global_step": 323226, "epoch": 2671} {"train_loss": -44.03817367553711, "global_step": 323227, "epoch": 2671} {"train_loss": -44.7835807800293, "global_step": 323228, "epoch": 2671} {"train_loss": -44.23575973510742, "global_step": 323229, "epoch": 2671} {"train_loss": -44.565975189208984, "global_step": 323230, "epoch": 2671} {"train_loss": -44.664710998535156, "global_step": 323231, "epoch": 2671} {"train_loss": -44.6497802734375, "global_step": 323232, "epoch": 2671} {"train_loss": -44.63053894042969, "global_step": 323233, "epoch": 2671} {"train_loss": -44.876609802246094, "global_step": 323234, "epoch": 2671} {"train_loss": -44.98452377319336, "global_step": 323235, "epoch": 2671} {"train_loss": -44.565792083740234, "global_step": 323236, "epoch": 2671} {"train_loss": -45.33537673950195, "global_step": 323237, "epoch": 2671} {"train_loss": -45.385677337646484, "global_step": 323238, "epoch": 2671} {"train_loss": -45.11838912963867, "global_step": 323239, "epoch": 2671} {"train_loss": -45.10463333129883, "global_step": 323240, "epoch": 2671} {"train_loss": -45.06499099731445, "global_step": 323241, "epoch": 2671} {"train_loss": -45.2124137878418, "global_step": 323242, "epoch": 2671} {"train_loss": -44.781002044677734, "global_step": 323243, "epoch": 2671} {"train_loss": -45.13867950439453, "global_step": 323244, "epoch": 2671} {"train_loss": -45.521446228027344, "global_step": 323245, "epoch": 2671} {"train_loss": -45.084041595458984, "global_step": 323246, "epoch": 2671} {"train_loss": -44.603118896484375, "global_step": 323247, "epoch": 2671} {"train_loss": -45.2252311706543, "global_step": 323248, "epoch": 2671} {"train_loss": -45.18218994140625, "global_step": 323249, "epoch": 2671} {"train_loss": -44.42103958129883, "global_step": 323250, "epoch": 2671} {"train_loss": -44.65348434448242, "global_step": 323251, "epoch": 2671} {"train_loss": -45.38827133178711, "global_step": 323252, "epoch": 2671} {"train_loss": -45.36758041381836, "global_step": 323253, "epoch": 2671} {"train_loss": -43.632606506347656, "global_step": 323254, "epoch": 2671} {"train_loss": -42.12470245361328, "global_step": 323255, "epoch": 2671} {"train_loss": -43.383026123046875, "global_step": 323256, "epoch": 2671} {"train_loss": -43.2987060546875, "global_step": 323257, "epoch": 2671} {"train_loss": -44.1700439453125, "global_step": 323258, "epoch": 2671} {"train_loss": -44.90717697143555, "global_step": 323259, "epoch": 2671} {"train_loss": -44.9050178527832, "global_step": 323260, "epoch": 2671} {"train_loss": -43.78425216674805, "global_step": 323261, "epoch": 2671} {"train_loss": -43.505611419677734, "global_step": 323262, "epoch": 2671} {"train_loss": -43.04389572143555, "global_step": 323263, "epoch": 2671} {"train_loss": -42.74977493286133, "global_step": 323264, "epoch": 2671} {"train_loss": -44.41357421875, "global_step": 323265, "epoch": 2671} {"train_loss": -44.27511215209961, "global_step": 323266, "epoch": 2671} {"train_loss": -43.777587890625, "global_step": 323267, "epoch": 2671} {"train_loss": -44.525203704833984, "global_step": 323268, "epoch": 2671} {"train_loss": -44.23062515258789, "global_step": 323269, "epoch": 2671} {"train_loss": -44.12823486328125, "global_step": 323270, "epoch": 2671} {"train_loss": -44.7685546875, "global_step": 323271, "epoch": 2671} {"train_loss": -44.3521614074707, "global_step": 323272, "epoch": 2671} {"train_loss": -45.337005615234375, "global_step": 323273, "epoch": 2671} {"train_loss": -44.614112854003906, "global_step": 323274, "epoch": 2671} {"train_loss": -44.68158721923828, "global_step": 323275, "epoch": 2671} {"train_loss": -45.078643798828125, "global_step": 323276, "epoch": 2671} {"train_loss": -43.559173583984375, "global_step": 323277, "epoch": 2671} {"train_loss": -42.4983024597168, "global_step": 323278, "epoch": 2671} {"train_loss": -42.5096435546875, "global_step": 323279, "epoch": 2671} {"train_loss": -44.101558685302734, "global_step": 323280, "epoch": 2671} {"train_loss": -45.08797836303711, "global_step": 323281, "epoch": 2671} {"train_loss": -43.248287200927734, "global_step": 323282, "epoch": 2671} {"train_loss": -44.45842361450195, "global_step": 323283, "epoch": 2671} {"train_loss": -44.91328048706055, "global_step": 323284, "epoch": 2671} {"train_loss": -43.52207565307617, "global_step": 323285, "epoch": 2671} {"train_loss": -44.13063049316406, "global_step": 323286, "epoch": 2671} {"train_loss": -43.854530334472656, "global_step": 323287, "epoch": 2671} {"train_loss": -44.715755462646484, "global_step": 323288, "epoch": 2671} {"train_loss": -44.615169525146484, "global_step": 323289, "epoch": 2671} {"train_loss": -43.71470260620117, "global_step": 323290, "epoch": 2671} {"train_loss": -44.77887725830078, "global_step": 323291, "epoch": 2671} {"train_loss": -44.48627853393555, "global_step": 323292, "epoch": 2671} {"train_loss": -43.942012786865234, "global_step": 323293, "epoch": 2671} {"train_loss": -44.02598190307617, "global_step": 323294, "epoch": 2671} {"train_loss": -44.2629508972168, "global_step": 323295, "epoch": 2671} {"train_loss": -44.70565414428711, "global_step": 323296, "epoch": 2671} {"train_loss": -44.31779861450195, "global_step": 323297, "epoch": 2671} {"train_loss": -44.68067932128906, "global_step": 323298, "epoch": 2671} {"train_loss": -43.99650192260742, "global_step": 323299, "epoch": 2671} {"train_loss": -43.30705642700195, "global_step": 323300, "epoch": 2671} {"train_loss": -43.906898498535156, "global_step": 323301, "epoch": 2671} {"train_loss": -44.03558349609375, "global_step": 323302, "epoch": 2671} {"train_loss": -44.2895622253418, "global_step": 323303, "epoch": 2671} {"train_loss": -44.87933349609375, "global_step": 323304, "epoch": 2671} {"train_loss": -44.2469596862793, "global_step": 323305, "epoch": 2671} {"train_loss": -44.8759765625, "global_step": 323306, "epoch": 2671} {"train_loss": -44.164241790771484, "global_step": 323307, "epoch": 2671} {"train_loss": -43.78995895385742, "global_step": 323308, "epoch": 2671} {"train_loss": -44.964420318603516, "global_step": 323309, "epoch": 2671} {"train_loss": -44.33698654174805, "global_step": 323310, "epoch": 2671} {"train_loss": -44.21327259914934, "global_step": 323311, "epoch": 2671, "val_loss": 2702824.0} {"train_loss": -43.13808822631836, "global_step": 323312, "epoch": 2672} {"train_loss": -43.21564483642578, "global_step": 323313, "epoch": 2672} {"train_loss": -42.95178985595703, "global_step": 323314, "epoch": 2672} {"train_loss": -43.915321350097656, "global_step": 323315, "epoch": 2672} {"train_loss": -44.881202697753906, "global_step": 323316, "epoch": 2672} {"train_loss": -44.272987365722656, "global_step": 323317, "epoch": 2672} {"train_loss": -44.39278793334961, "global_step": 323318, "epoch": 2672} {"train_loss": -44.25007247924805, "global_step": 323319, "epoch": 2672} {"train_loss": -44.164608001708984, "global_step": 323320, "epoch": 2672} {"train_loss": -44.15433883666992, "global_step": 323321, "epoch": 2672} {"train_loss": -44.40949249267578, "global_step": 323322, "epoch": 2672} {"train_loss": -43.49073028564453, "global_step": 323323, "epoch": 2672} {"train_loss": -44.113426208496094, "global_step": 323324, "epoch": 2672} {"train_loss": -45.007144927978516, "global_step": 323325, "epoch": 2672} {"train_loss": -43.43850326538086, "global_step": 323326, "epoch": 2672} {"train_loss": -43.55564498901367, "global_step": 323327, "epoch": 2672} {"train_loss": -43.904048919677734, "global_step": 323328, "epoch": 2672} {"train_loss": -44.1601676940918, "global_step": 323329, "epoch": 2672} {"train_loss": -44.881649017333984, "global_step": 323330, "epoch": 2672} {"train_loss": -43.76967239379883, "global_step": 323331, "epoch": 2672} {"train_loss": -39.69244384765625, "global_step": 323332, "epoch": 2672} {"train_loss": -43.4222297668457, "global_step": 323333, "epoch": 2672} {"train_loss": -43.4959831237793, "global_step": 323334, "epoch": 2672} {"train_loss": -43.1466064453125, "global_step": 323335, "epoch": 2672} {"train_loss": -44.624141693115234, "global_step": 323336, "epoch": 2672} {"train_loss": -43.03003692626953, "global_step": 323337, "epoch": 2672} {"train_loss": -43.89101791381836, "global_step": 323338, "epoch": 2672} {"train_loss": -42.87392044067383, "global_step": 323339, "epoch": 2672} {"train_loss": -43.357967376708984, "global_step": 323340, "epoch": 2672} {"train_loss": -43.167911529541016, "global_step": 323341, "epoch": 2672} {"train_loss": -43.34083557128906, "global_step": 323342, "epoch": 2672} {"train_loss": -42.09994888305664, "global_step": 323343, "epoch": 2672} {"train_loss": -42.29426956176758, "global_step": 323344, "epoch": 2672} {"train_loss": -43.37433624267578, "global_step": 323345, "epoch": 2672} {"train_loss": -41.08170700073242, "global_step": 323346, "epoch": 2672} {"train_loss": -44.19672775268555, "global_step": 323347, "epoch": 2672} {"train_loss": -43.02943801879883, "global_step": 323348, "epoch": 2672} {"train_loss": -43.268428802490234, "global_step": 323349, "epoch": 2672} {"train_loss": -43.554134368896484, "global_step": 323350, "epoch": 2672} {"train_loss": -41.84305953979492, "global_step": 323351, "epoch": 2672} {"train_loss": -44.34362030029297, "global_step": 323352, "epoch": 2672} {"train_loss": -42.70553207397461, "global_step": 323353, "epoch": 2672} {"train_loss": -43.43967056274414, "global_step": 323354, "epoch": 2672} {"train_loss": -43.75696563720703, "global_step": 323355, "epoch": 2672} {"train_loss": -41.63710403442383, "global_step": 323356, "epoch": 2672} {"train_loss": -43.43861770629883, "global_step": 323357, "epoch": 2672} {"train_loss": -42.18996047973633, "global_step": 323358, "epoch": 2672} {"train_loss": -43.137245178222656, "global_step": 323359, "epoch": 2672} {"train_loss": -43.71145248413086, "global_step": 323360, "epoch": 2672} {"train_loss": -42.68118667602539, "global_step": 323361, "epoch": 2672} {"train_loss": -44.68404006958008, "global_step": 323362, "epoch": 2672} {"train_loss": -43.329566955566406, "global_step": 323363, "epoch": 2672} {"train_loss": -43.67059326171875, "global_step": 323364, "epoch": 2672} {"train_loss": -44.28376388549805, "global_step": 323365, "epoch": 2672} {"train_loss": -44.332801818847656, "global_step": 323366, "epoch": 2672} {"train_loss": -44.50913619995117, "global_step": 323367, "epoch": 2672} {"train_loss": -43.40540313720703, "global_step": 323368, "epoch": 2672} {"train_loss": -44.33243942260742, "global_step": 323369, "epoch": 2672} {"train_loss": -44.663108825683594, "global_step": 323370, "epoch": 2672} {"train_loss": -43.986480712890625, "global_step": 323371, "epoch": 2672} {"train_loss": -44.90404510498047, "global_step": 323372, "epoch": 2672} {"train_loss": -43.852638244628906, "global_step": 323373, "epoch": 2672} {"train_loss": -44.96773147583008, "global_step": 323374, "epoch": 2672} {"train_loss": -44.262691497802734, "global_step": 323375, "epoch": 2672} {"train_loss": -45.01962661743164, "global_step": 323376, "epoch": 2672} {"train_loss": -44.10633087158203, "global_step": 323377, "epoch": 2672} {"train_loss": -44.441917419433594, "global_step": 323378, "epoch": 2672} {"train_loss": -44.52595901489258, "global_step": 323379, "epoch": 2672} {"train_loss": -44.12587356567383, "global_step": 323380, "epoch": 2672} {"train_loss": -44.84206771850586, "global_step": 323381, "epoch": 2672} {"train_loss": -44.12778854370117, "global_step": 323382, "epoch": 2672} {"train_loss": -44.6654052734375, "global_step": 323383, "epoch": 2672} {"train_loss": -44.14585876464844, "global_step": 323384, "epoch": 2672} {"train_loss": -44.8061637878418, "global_step": 323385, "epoch": 2672} {"train_loss": -44.45854949951172, "global_step": 323386, "epoch": 2672} {"train_loss": -44.92829132080078, "global_step": 323387, "epoch": 2672} {"train_loss": -44.1578369140625, "global_step": 323388, "epoch": 2672} {"train_loss": -44.25647735595703, "global_step": 323389, "epoch": 2672} {"train_loss": -44.61589050292969, "global_step": 323390, "epoch": 2672} {"train_loss": -44.95664596557617, "global_step": 323391, "epoch": 2672} {"train_loss": -44.70844268798828, "global_step": 323392, "epoch": 2672} {"train_loss": -44.48723220825195, "global_step": 323393, "epoch": 2672} {"train_loss": -44.25058364868164, "global_step": 323394, "epoch": 2672} {"train_loss": -44.534645080566406, "global_step": 323395, "epoch": 2672} {"train_loss": -44.095272064208984, "global_step": 323396, "epoch": 2672} {"train_loss": -44.61113357543945, "global_step": 323397, "epoch": 2672} {"train_loss": -44.798397064208984, "global_step": 323398, "epoch": 2672} {"train_loss": -43.26310348510742, "global_step": 323399, "epoch": 2672} {"train_loss": -42.5760612487793, "global_step": 323400, "epoch": 2672} {"train_loss": -41.84182357788086, "global_step": 323401, "epoch": 2672} {"train_loss": -44.95207214355469, "global_step": 323402, "epoch": 2672} {"train_loss": -43.73385238647461, "global_step": 323403, "epoch": 2672} {"train_loss": -43.90338134765625, "global_step": 323404, "epoch": 2672} {"train_loss": -44.293373107910156, "global_step": 323405, "epoch": 2672} {"train_loss": -44.81884765625, "global_step": 323406, "epoch": 2672} {"train_loss": -45.2393913269043, "global_step": 323407, "epoch": 2672} {"train_loss": -44.45641326904297, "global_step": 323408, "epoch": 2672} {"train_loss": -44.214752197265625, "global_step": 323409, "epoch": 2672} {"train_loss": -44.70069122314453, "global_step": 323410, "epoch": 2672} {"train_loss": -45.47916793823242, "global_step": 323411, "epoch": 2672} {"train_loss": -44.93562316894531, "global_step": 323412, "epoch": 2672} {"train_loss": -45.01357650756836, "global_step": 323413, "epoch": 2672} {"train_loss": -45.04148483276367, "global_step": 323414, "epoch": 2672} {"train_loss": -44.89150619506836, "global_step": 323415, "epoch": 2672} {"train_loss": -44.80548095703125, "global_step": 323416, "epoch": 2672} {"train_loss": -44.84212112426758, "global_step": 323417, "epoch": 2672} {"train_loss": -44.954036712646484, "global_step": 323418, "epoch": 2672} {"train_loss": -44.768062591552734, "global_step": 323419, "epoch": 2672} {"train_loss": -44.14276885986328, "global_step": 323420, "epoch": 2672} {"train_loss": -44.82746505737305, "global_step": 323421, "epoch": 2672} {"train_loss": -44.62803268432617, "global_step": 323422, "epoch": 2672} {"train_loss": -44.11985778808594, "global_step": 323423, "epoch": 2672} {"train_loss": -45.13363265991211, "global_step": 323424, "epoch": 2672} {"train_loss": -45.249794006347656, "global_step": 323425, "epoch": 2672} {"train_loss": -45.27568817138672, "global_step": 323426, "epoch": 2672} {"train_loss": -45.48106002807617, "global_step": 323427, "epoch": 2672} {"train_loss": -45.87697982788086, "global_step": 323428, "epoch": 2672} {"train_loss": -44.94509506225586, "global_step": 323429, "epoch": 2672} {"train_loss": -44.575496673583984, "global_step": 323430, "epoch": 2672} {"train_loss": -44.8399772644043, "global_step": 323431, "epoch": 2672} {"train_loss": -44.047408868458646, "global_step": 323432, "epoch": 2672, "val_loss": 2762157.5} {"train_loss": -44.542171478271484, "global_step": 323433, "epoch": 2673} {"train_loss": -44.0158576965332, "global_step": 323434, "epoch": 2673} {"train_loss": -44.865901947021484, "global_step": 323435, "epoch": 2673} {"train_loss": -44.204139709472656, "global_step": 323436, "epoch": 2673} {"train_loss": -43.48188400268555, "global_step": 323437, "epoch": 2673} {"train_loss": -43.626930236816406, "global_step": 323438, "epoch": 2673} {"train_loss": -44.382625579833984, "global_step": 323439, "epoch": 2673} {"train_loss": -41.436214447021484, "global_step": 323440, "epoch": 2673} {"train_loss": -41.821571350097656, "global_step": 323441, "epoch": 2673} {"train_loss": -44.309078216552734, "global_step": 323442, "epoch": 2673} {"train_loss": -42.52827072143555, "global_step": 323443, "epoch": 2673} {"train_loss": -42.46170425415039, "global_step": 323444, "epoch": 2673} {"train_loss": -43.19816207885742, "global_step": 323445, "epoch": 2673} {"train_loss": -43.43351745605469, "global_step": 323446, "epoch": 2673} {"train_loss": -43.46902084350586, "global_step": 323447, "epoch": 2673} {"train_loss": -41.3113899230957, "global_step": 323448, "epoch": 2673} {"train_loss": -43.3638916015625, "global_step": 323449, "epoch": 2673} {"train_loss": -42.430274963378906, "global_step": 323450, "epoch": 2673} {"train_loss": -43.2615966796875, "global_step": 323451, "epoch": 2673} {"train_loss": -43.84428405761719, "global_step": 323452, "epoch": 2673} {"train_loss": -42.945926666259766, "global_step": 323453, "epoch": 2673} {"train_loss": -36.856197357177734, "global_step": 323454, "epoch": 2673} {"train_loss": -43.62771987915039, "global_step": 323455, "epoch": 2673} {"train_loss": -42.67055892944336, "global_step": 323456, "epoch": 2673} {"train_loss": -42.72853469848633, "global_step": 323457, "epoch": 2673} {"train_loss": -43.4576416015625, "global_step": 323458, "epoch": 2673} {"train_loss": -42.621063232421875, "global_step": 323459, "epoch": 2673} {"train_loss": -43.161170959472656, "global_step": 323460, "epoch": 2673} {"train_loss": -42.79066848754883, "global_step": 323461, "epoch": 2673} {"train_loss": -43.481781005859375, "global_step": 323462, "epoch": 2673} {"train_loss": -44.4530143737793, "global_step": 323463, "epoch": 2673} {"train_loss": -43.84125900268555, "global_step": 323464, "epoch": 2673} {"train_loss": -42.40354537963867, "global_step": 323465, "epoch": 2673} {"train_loss": -43.320526123046875, "global_step": 323466, "epoch": 2673} {"train_loss": -42.518402099609375, "global_step": 323467, "epoch": 2673} {"train_loss": -41.73326873779297, "global_step": 323468, "epoch": 2673} {"train_loss": -42.275691986083984, "global_step": 323469, "epoch": 2673} {"train_loss": -44.32889938354492, "global_step": 323470, "epoch": 2673} {"train_loss": -44.01062774658203, "global_step": 323471, "epoch": 2673} {"train_loss": -42.38339614868164, "global_step": 323472, "epoch": 2673} {"train_loss": -41.49357223510742, "global_step": 323473, "epoch": 2673} {"train_loss": -41.65939712524414, "global_step": 323474, "epoch": 2673} {"train_loss": -38.981380462646484, "global_step": 323475, "epoch": 2673} {"train_loss": -42.62942123413086, "global_step": 323476, "epoch": 2673} {"train_loss": -42.361541748046875, "global_step": 323477, "epoch": 2673} {"train_loss": -43.5299186706543, "global_step": 323478, "epoch": 2673} {"train_loss": -43.10541915893555, "global_step": 323479, "epoch": 2673} {"train_loss": -42.172767639160156, "global_step": 323480, "epoch": 2673} {"train_loss": -42.95125198364258, "global_step": 323481, "epoch": 2673} {"train_loss": -33.66500473022461, "global_step": 323482, "epoch": 2673} {"train_loss": -40.5040397644043, "global_step": 323483, "epoch": 2673} {"train_loss": -38.12148666381836, "global_step": 323484, "epoch": 2673} {"train_loss": -38.11231231689453, "global_step": 323485, "epoch": 2673} {"train_loss": -40.722389221191406, "global_step": 323486, "epoch": 2673} {"train_loss": -41.1154670715332, "global_step": 323487, "epoch": 2673} {"train_loss": -37.03084182739258, "global_step": 323488, "epoch": 2673} {"train_loss": -38.60713577270508, "global_step": 323489, "epoch": 2673} {"train_loss": -39.70094680786133, "global_step": 323490, "epoch": 2673} {"train_loss": -38.2349739074707, "global_step": 323491, "epoch": 2673} {"train_loss": -39.40370178222656, "global_step": 323492, "epoch": 2673} {"train_loss": -41.181819915771484, "global_step": 323493, "epoch": 2673} {"train_loss": -36.888885498046875, "global_step": 323494, "epoch": 2673} {"train_loss": -42.2365837097168, "global_step": 323495, "epoch": 2673} {"train_loss": -38.43571853637695, "global_step": 323496, "epoch": 2673} {"train_loss": -42.864070892333984, "global_step": 323497, "epoch": 2673} {"train_loss": -38.407588958740234, "global_step": 323498, "epoch": 2673} {"train_loss": -42.09425735473633, "global_step": 323499, "epoch": 2673} {"train_loss": -37.88924789428711, "global_step": 323500, "epoch": 2673} {"train_loss": -43.00327682495117, "global_step": 323501, "epoch": 2673} {"train_loss": -39.6747932434082, "global_step": 323502, "epoch": 2673} {"train_loss": -42.61928176879883, "global_step": 323503, "epoch": 2673} {"train_loss": -40.9448127746582, "global_step": 323504, "epoch": 2673} {"train_loss": -41.81393051147461, "global_step": 323505, "epoch": 2673} {"train_loss": -41.866241455078125, "global_step": 323506, "epoch": 2673} {"train_loss": -42.24460220336914, "global_step": 323507, "epoch": 2673} {"train_loss": -42.486366271972656, "global_step": 323508, "epoch": 2673} {"train_loss": -41.819766998291016, "global_step": 323509, "epoch": 2673} {"train_loss": -42.61809158325195, "global_step": 323510, "epoch": 2673} {"train_loss": -43.063907623291016, "global_step": 323511, "epoch": 2673} {"train_loss": -42.52627182006836, "global_step": 323512, "epoch": 2673} {"train_loss": -43.29275131225586, "global_step": 323513, "epoch": 2673} {"train_loss": -43.11614227294922, "global_step": 323514, "epoch": 2673} {"train_loss": -43.38612365722656, "global_step": 323515, "epoch": 2673} {"train_loss": -43.05315399169922, "global_step": 323516, "epoch": 2673} {"train_loss": -41.64731979370117, "global_step": 323517, "epoch": 2673} {"train_loss": -43.327640533447266, "global_step": 323518, "epoch": 2673} {"train_loss": -43.34269714355469, "global_step": 323519, "epoch": 2673} {"train_loss": -41.64290237426758, "global_step": 323520, "epoch": 2673} {"train_loss": -43.315425872802734, "global_step": 323521, "epoch": 2673} {"train_loss": -43.77280807495117, "global_step": 323522, "epoch": 2673} {"train_loss": -43.82358932495117, "global_step": 323523, "epoch": 2673} {"train_loss": -43.7487907409668, "global_step": 323524, "epoch": 2673} {"train_loss": -43.17273712158203, "global_step": 323525, "epoch": 2673} {"train_loss": -43.43242263793945, "global_step": 323526, "epoch": 2673} {"train_loss": -43.99736022949219, "global_step": 323527, "epoch": 2673} {"train_loss": -41.400150299072266, "global_step": 323528, "epoch": 2673} {"train_loss": -43.64344024658203, "global_step": 323529, "epoch": 2673} {"train_loss": -43.61069107055664, "global_step": 323530, "epoch": 2673} {"train_loss": -43.3314094543457, "global_step": 323531, "epoch": 2673} {"train_loss": -43.559566497802734, "global_step": 323532, "epoch": 2673} {"train_loss": -43.41902160644531, "global_step": 323533, "epoch": 2673} {"train_loss": -44.30007553100586, "global_step": 323534, "epoch": 2673} {"train_loss": -42.61005783081055, "global_step": 323535, "epoch": 2673} {"train_loss": -42.698177337646484, "global_step": 323536, "epoch": 2673} {"train_loss": -42.91254806518555, "global_step": 323537, "epoch": 2673} {"train_loss": -43.75532913208008, "global_step": 323538, "epoch": 2673} {"train_loss": -42.8693733215332, "global_step": 323539, "epoch": 2673} {"train_loss": -44.07749938964844, "global_step": 323540, "epoch": 2673} {"train_loss": -43.90772247314453, "global_step": 323541, "epoch": 2673} {"train_loss": -42.3933219909668, "global_step": 323542, "epoch": 2673} {"train_loss": -40.25021743774414, "global_step": 323543, "epoch": 2673} {"train_loss": -43.87604522705078, "global_step": 323544, "epoch": 2673} {"train_loss": -43.86179733276367, "global_step": 323545, "epoch": 2673} {"train_loss": -44.177852630615234, "global_step": 323546, "epoch": 2673} {"train_loss": -42.99123001098633, "global_step": 323547, "epoch": 2673} {"train_loss": -43.64812088012695, "global_step": 323548, "epoch": 2673} {"train_loss": -44.20647048950195, "global_step": 323549, "epoch": 2673} {"train_loss": -44.028228759765625, "global_step": 323550, "epoch": 2673} {"train_loss": -44.90671157836914, "global_step": 323551, "epoch": 2673} {"train_loss": -44.16898727416992, "global_step": 323552, "epoch": 2673} {"train_loss": -42.37137597454481, "global_step": 323553, "epoch": 2673, "val_loss": 2705804.0} {"train_loss": -43.2145881652832, "global_step": 323554, "epoch": 2674} {"train_loss": -44.02482986450195, "global_step": 323555, "epoch": 2674} {"train_loss": -44.13617706298828, "global_step": 323556, "epoch": 2674} {"train_loss": -43.44872283935547, "global_step": 323557, "epoch": 2674} {"train_loss": -43.379451751708984, "global_step": 323558, "epoch": 2674} {"train_loss": -42.97650146484375, "global_step": 323559, "epoch": 2674} {"train_loss": -43.815059661865234, "global_step": 323560, "epoch": 2674} {"train_loss": -43.0294075012207, "global_step": 323561, "epoch": 2674} {"train_loss": -44.58099365234375, "global_step": 323562, "epoch": 2674} {"train_loss": -44.351016998291016, "global_step": 323563, "epoch": 2674} {"train_loss": -43.32381820678711, "global_step": 323564, "epoch": 2674} {"train_loss": -44.4254150390625, "global_step": 323565, "epoch": 2674} {"train_loss": -43.60390853881836, "global_step": 323566, "epoch": 2674} {"train_loss": -43.88565444946289, "global_step": 323567, "epoch": 2674} {"train_loss": -44.2612419128418, "global_step": 323568, "epoch": 2674} {"train_loss": -43.77129364013672, "global_step": 323569, "epoch": 2674} {"train_loss": -44.44778060913086, "global_step": 323570, "epoch": 2674} {"train_loss": -42.755611419677734, "global_step": 323571, "epoch": 2674} {"train_loss": -44.2887077331543, "global_step": 323572, "epoch": 2674} {"train_loss": -44.74062728881836, "global_step": 323573, "epoch": 2674} {"train_loss": -44.60474395751953, "global_step": 323574, "epoch": 2674} {"train_loss": -44.18293762207031, "global_step": 323575, "epoch": 2674} {"train_loss": -44.25231170654297, "global_step": 323576, "epoch": 2674} {"train_loss": -44.811344146728516, "global_step": 323577, "epoch": 2674} {"train_loss": -44.37519073486328, "global_step": 323578, "epoch": 2674} {"train_loss": -44.12431716918945, "global_step": 323579, "epoch": 2674} {"train_loss": -44.272979736328125, "global_step": 323580, "epoch": 2674} {"train_loss": -44.30863952636719, "global_step": 323581, "epoch": 2674} {"train_loss": -44.37635040283203, "global_step": 323582, "epoch": 2674} {"train_loss": -44.93409729003906, "global_step": 323583, "epoch": 2674} {"train_loss": -44.18046188354492, "global_step": 323584, "epoch": 2674} {"train_loss": -44.13705062866211, "global_step": 323585, "epoch": 2674} {"train_loss": -43.65578079223633, "global_step": 323586, "epoch": 2674} {"train_loss": -43.62623977661133, "global_step": 323587, "epoch": 2674} {"train_loss": -44.4863166809082, "global_step": 323588, "epoch": 2674} {"train_loss": -44.165950775146484, "global_step": 323589, "epoch": 2674} {"train_loss": -41.939308166503906, "global_step": 323590, "epoch": 2674} {"train_loss": -42.860328674316406, "global_step": 323591, "epoch": 2674} {"train_loss": -40.74555206298828, "global_step": 323592, "epoch": 2674} {"train_loss": -42.93222427368164, "global_step": 323593, "epoch": 2674} {"train_loss": -43.4249382019043, "global_step": 323594, "epoch": 2674} {"train_loss": -41.6733283996582, "global_step": 323595, "epoch": 2674} {"train_loss": -42.13100051879883, "global_step": 323596, "epoch": 2674} {"train_loss": -41.6996955871582, "global_step": 323597, "epoch": 2674} {"train_loss": -40.452659606933594, "global_step": 323598, "epoch": 2674} {"train_loss": -43.50580978393555, "global_step": 323599, "epoch": 2674} {"train_loss": -43.28980255126953, "global_step": 323600, "epoch": 2674} {"train_loss": -43.006591796875, "global_step": 323601, "epoch": 2674} {"train_loss": -43.241981506347656, "global_step": 323602, "epoch": 2674} {"train_loss": -43.35078048706055, "global_step": 323603, "epoch": 2674} {"train_loss": -42.89722442626953, "global_step": 323604, "epoch": 2674} {"train_loss": -42.26975631713867, "global_step": 323605, "epoch": 2674} {"train_loss": -41.896053314208984, "global_step": 323606, "epoch": 2674} {"train_loss": -43.2365608215332, "global_step": 323607, "epoch": 2674} {"train_loss": -44.09967803955078, "global_step": 323608, "epoch": 2674} {"train_loss": -42.62892532348633, "global_step": 323609, "epoch": 2674} {"train_loss": -42.3925895690918, "global_step": 323610, "epoch": 2674} {"train_loss": -42.49988555908203, "global_step": 323611, "epoch": 2674} {"train_loss": -42.7962532043457, "global_step": 323612, "epoch": 2674} {"train_loss": -43.710872650146484, "global_step": 323613, "epoch": 2674} {"train_loss": -43.485198974609375, "global_step": 323614, "epoch": 2674} {"train_loss": -42.96859359741211, "global_step": 323615, "epoch": 2674} {"train_loss": -43.88190841674805, "global_step": 323616, "epoch": 2674} {"train_loss": -42.53693771362305, "global_step": 323617, "epoch": 2674} {"train_loss": -42.7969970703125, "global_step": 323618, "epoch": 2674} {"train_loss": -42.626014709472656, "global_step": 323619, "epoch": 2674} {"train_loss": -43.70890426635742, "global_step": 323620, "epoch": 2674} {"train_loss": -42.85415267944336, "global_step": 323621, "epoch": 2674} {"train_loss": -42.50087356567383, "global_step": 323622, "epoch": 2674} {"train_loss": -43.37888717651367, "global_step": 323623, "epoch": 2674} {"train_loss": -42.5875244140625, "global_step": 323624, "epoch": 2674} {"train_loss": -39.55977249145508, "global_step": 323625, "epoch": 2674} {"train_loss": -43.590633392333984, "global_step": 323626, "epoch": 2674} {"train_loss": -43.87239074707031, "global_step": 323627, "epoch": 2674} {"train_loss": -42.08638000488281, "global_step": 323628, "epoch": 2674} {"train_loss": -43.43344497680664, "global_step": 323629, "epoch": 2674} {"train_loss": -42.94422912597656, "global_step": 323630, "epoch": 2674} {"train_loss": -43.325191497802734, "global_step": 323631, "epoch": 2674} {"train_loss": -42.05732727050781, "global_step": 323632, "epoch": 2674} {"train_loss": -42.050960540771484, "global_step": 323633, "epoch": 2674} {"train_loss": -44.015716552734375, "global_step": 323634, "epoch": 2674} {"train_loss": -43.64320755004883, "global_step": 323635, "epoch": 2674} {"train_loss": -42.6768798828125, "global_step": 323636, "epoch": 2674} {"train_loss": -42.35589599609375, "global_step": 323637, "epoch": 2674} {"train_loss": -43.6500244140625, "global_step": 323638, "epoch": 2674} {"train_loss": -43.569496154785156, "global_step": 323639, "epoch": 2674} {"train_loss": -42.35325241088867, "global_step": 323640, "epoch": 2674} {"train_loss": -43.48598098754883, "global_step": 323641, "epoch": 2674} {"train_loss": -43.8664436340332, "global_step": 323642, "epoch": 2674} {"train_loss": -44.332210540771484, "global_step": 323643, "epoch": 2674} {"train_loss": -44.43822479248047, "global_step": 323644, "epoch": 2674} {"train_loss": -44.30758285522461, "global_step": 323645, "epoch": 2674} {"train_loss": -44.29781723022461, "global_step": 323646, "epoch": 2674} {"train_loss": -43.953094482421875, "global_step": 323647, "epoch": 2674} {"train_loss": -44.57301330566406, "global_step": 323648, "epoch": 2674} {"train_loss": -44.3018798828125, "global_step": 323649, "epoch": 2674} {"train_loss": -44.060935974121094, "global_step": 323650, "epoch": 2674} {"train_loss": -44.20417022705078, "global_step": 323651, "epoch": 2674} {"train_loss": -44.799007415771484, "global_step": 323652, "epoch": 2674} {"train_loss": -44.06486129760742, "global_step": 323653, "epoch": 2674} {"train_loss": -43.776100158691406, "global_step": 323654, "epoch": 2674} {"train_loss": -44.4881706237793, "global_step": 323655, "epoch": 2674} {"train_loss": -44.23453903198242, "global_step": 323656, "epoch": 2674} {"train_loss": -44.87373733520508, "global_step": 323657, "epoch": 2674} {"train_loss": -44.321529388427734, "global_step": 323658, "epoch": 2674} {"train_loss": -43.20084762573242, "global_step": 323659, "epoch": 2674} {"train_loss": -43.938289642333984, "global_step": 323660, "epoch": 2674} {"train_loss": -43.70620346069336, "global_step": 323661, "epoch": 2674} {"train_loss": -42.53923797607422, "global_step": 323662, "epoch": 2674} {"train_loss": -43.70245361328125, "global_step": 323663, "epoch": 2674} {"train_loss": -43.90053939819336, "global_step": 323664, "epoch": 2674} {"train_loss": -44.88737869262695, "global_step": 323665, "epoch": 2674} {"train_loss": -43.27946090698242, "global_step": 323666, "epoch": 2674} {"train_loss": -43.9124755859375, "global_step": 323667, "epoch": 2674} {"train_loss": -43.83095169067383, "global_step": 323668, "epoch": 2674} {"train_loss": -44.10034942626953, "global_step": 323669, "epoch": 2674} {"train_loss": -44.079193115234375, "global_step": 323670, "epoch": 2674} {"train_loss": -43.67856979370117, "global_step": 323671, "epoch": 2674} {"train_loss": -43.64329147338867, "global_step": 323672, "epoch": 2674} {"train_loss": -44.1192512512207, "global_step": 323673, "epoch": 2674} {"train_loss": -43.49388097337455, "global_step": 323674, "epoch": 2674, "val_loss": 2802451.25} {"train_loss": -43.44797897338867, "global_step": 323675, "epoch": 2675} {"train_loss": -44.22098922729492, "global_step": 323676, "epoch": 2675} {"train_loss": -44.44935989379883, "global_step": 323677, "epoch": 2675} {"train_loss": -43.591835021972656, "global_step": 323678, "epoch": 2675} {"train_loss": -43.943511962890625, "global_step": 323679, "epoch": 2675} {"train_loss": -44.365760803222656, "global_step": 323680, "epoch": 2675} {"train_loss": -43.33420944213867, "global_step": 323681, "epoch": 2675} {"train_loss": -43.104469299316406, "global_step": 323682, "epoch": 2675} {"train_loss": -42.88326644897461, "global_step": 323683, "epoch": 2675} {"train_loss": -42.49076461791992, "global_step": 323684, "epoch": 2675} {"train_loss": -42.626861572265625, "global_step": 323685, "epoch": 2675} {"train_loss": -42.682281494140625, "global_step": 323686, "epoch": 2675} {"train_loss": -44.668861389160156, "global_step": 323687, "epoch": 2675} {"train_loss": -44.144248962402344, "global_step": 323688, "epoch": 2675} {"train_loss": -42.96267318725586, "global_step": 323689, "epoch": 2675} {"train_loss": -44.58961486816406, "global_step": 323690, "epoch": 2675} {"train_loss": -44.4697265625, "global_step": 323691, "epoch": 2675} {"train_loss": -43.48106384277344, "global_step": 323692, "epoch": 2675} {"train_loss": -44.82219314575195, "global_step": 323693, "epoch": 2675} {"train_loss": -43.5452995300293, "global_step": 323694, "epoch": 2675} {"train_loss": -43.1588249206543, "global_step": 323695, "epoch": 2675} {"train_loss": -44.24262619018555, "global_step": 323696, "epoch": 2675} {"train_loss": -43.976402282714844, "global_step": 323697, "epoch": 2675} {"train_loss": -44.212066650390625, "global_step": 323698, "epoch": 2675} {"train_loss": -44.04999923706055, "global_step": 323699, "epoch": 2675} {"train_loss": -44.30783462524414, "global_step": 323700, "epoch": 2675} {"train_loss": -44.638973236083984, "global_step": 323701, "epoch": 2675} {"train_loss": -45.020694732666016, "global_step": 323702, "epoch": 2675} {"train_loss": -43.710060119628906, "global_step": 323703, "epoch": 2675} {"train_loss": -44.68827438354492, "global_step": 323704, "epoch": 2675} {"train_loss": -44.715396881103516, "global_step": 323705, "epoch": 2675} {"train_loss": -44.545345306396484, "global_step": 323706, "epoch": 2675} {"train_loss": -44.74215316772461, "global_step": 323707, "epoch": 2675} {"train_loss": -44.734405517578125, "global_step": 323708, "epoch": 2675} {"train_loss": -44.29670333862305, "global_step": 323709, "epoch": 2675} {"train_loss": -43.6879768371582, "global_step": 323710, "epoch": 2675} {"train_loss": -44.77552032470703, "global_step": 323711, "epoch": 2675} {"train_loss": -44.75613021850586, "global_step": 323712, "epoch": 2675} {"train_loss": -44.858184814453125, "global_step": 323713, "epoch": 2675} {"train_loss": -44.748138427734375, "global_step": 323714, "epoch": 2675} {"train_loss": -44.94102096557617, "global_step": 323715, "epoch": 2675} {"train_loss": -45.04938888549805, "global_step": 323716, "epoch": 2675} {"train_loss": -44.971126556396484, "global_step": 323717, "epoch": 2675} {"train_loss": -45.06120681762695, "global_step": 323718, "epoch": 2675} {"train_loss": -44.90678405761719, "global_step": 323719, "epoch": 2675} {"train_loss": -44.193267822265625, "global_step": 323720, "epoch": 2675} {"train_loss": -44.67097091674805, "global_step": 323721, "epoch": 2675} {"train_loss": -45.059288024902344, "global_step": 323722, "epoch": 2675} {"train_loss": -45.10054397583008, "global_step": 323723, "epoch": 2675} {"train_loss": -45.29524230957031, "global_step": 323724, "epoch": 2675} {"train_loss": -44.627235412597656, "global_step": 323725, "epoch": 2675} {"train_loss": -44.02058029174805, "global_step": 323726, "epoch": 2675} {"train_loss": -43.055397033691406, "global_step": 323727, "epoch": 2675} {"train_loss": -43.79523849487305, "global_step": 323728, "epoch": 2675} {"train_loss": -44.249080657958984, "global_step": 323729, "epoch": 2675} {"train_loss": -44.40522003173828, "global_step": 323730, "epoch": 2675} {"train_loss": -44.97459030151367, "global_step": 323731, "epoch": 2675} {"train_loss": -45.063106536865234, "global_step": 323732, "epoch": 2675} {"train_loss": -44.26316452026367, "global_step": 323733, "epoch": 2675} {"train_loss": -44.9058952331543, "global_step": 323734, "epoch": 2675} {"train_loss": -44.5645751953125, "global_step": 323735, "epoch": 2675} {"train_loss": -44.00706100463867, "global_step": 323736, "epoch": 2675} {"train_loss": -42.402584075927734, "global_step": 323737, "epoch": 2675} {"train_loss": -39.76833724975586, "global_step": 323738, "epoch": 2675} {"train_loss": -42.94517135620117, "global_step": 323739, "epoch": 2675} {"train_loss": -43.258628845214844, "global_step": 323740, "epoch": 2675} {"train_loss": -42.50238037109375, "global_step": 323741, "epoch": 2675} {"train_loss": -44.65639114379883, "global_step": 323742, "epoch": 2675} {"train_loss": -43.04791259765625, "global_step": 323743, "epoch": 2675} {"train_loss": -40.57239532470703, "global_step": 323744, "epoch": 2675} {"train_loss": -42.13875961303711, "global_step": 323745, "epoch": 2675} {"train_loss": -43.6107292175293, "global_step": 323746, "epoch": 2675} {"train_loss": -43.26836013793945, "global_step": 323747, "epoch": 2675} {"train_loss": -42.576759338378906, "global_step": 323748, "epoch": 2675} {"train_loss": -44.07465744018555, "global_step": 323749, "epoch": 2675} {"train_loss": -43.38838577270508, "global_step": 323750, "epoch": 2675} {"train_loss": -40.92392349243164, "global_step": 323751, "epoch": 2675} {"train_loss": -43.88129425048828, "global_step": 323752, "epoch": 2675} {"train_loss": -43.07212448120117, "global_step": 323753, "epoch": 2675} {"train_loss": -42.025386810302734, "global_step": 323754, "epoch": 2675} {"train_loss": -43.36664962768555, "global_step": 323755, "epoch": 2675} {"train_loss": -43.61320114135742, "global_step": 323756, "epoch": 2675} {"train_loss": -43.4336051940918, "global_step": 323757, "epoch": 2675} {"train_loss": -43.27754592895508, "global_step": 323758, "epoch": 2675} {"train_loss": -43.60677719116211, "global_step": 323759, "epoch": 2675} {"train_loss": -43.56429672241211, "global_step": 323760, "epoch": 2675} {"train_loss": -44.65507125854492, "global_step": 323761, "epoch": 2675} {"train_loss": -43.47801208496094, "global_step": 323762, "epoch": 2675} {"train_loss": -43.89350891113281, "global_step": 323763, "epoch": 2675} {"train_loss": -44.484718322753906, "global_step": 323764, "epoch": 2675} {"train_loss": -43.968719482421875, "global_step": 323765, "epoch": 2675} {"train_loss": -43.770381927490234, "global_step": 323766, "epoch": 2675} {"train_loss": -44.418853759765625, "global_step": 323767, "epoch": 2675} {"train_loss": -43.6972541809082, "global_step": 323768, "epoch": 2675} {"train_loss": -42.56129837036133, "global_step": 323769, "epoch": 2675} {"train_loss": -42.86761474609375, "global_step": 323770, "epoch": 2675} {"train_loss": -43.5257682800293, "global_step": 323771, "epoch": 2675} {"train_loss": -42.87741470336914, "global_step": 323772, "epoch": 2675} {"train_loss": -41.70302200317383, "global_step": 323773, "epoch": 2675} {"train_loss": -42.10572052001953, "global_step": 323774, "epoch": 2675} {"train_loss": -43.800716400146484, "global_step": 323775, "epoch": 2675} {"train_loss": -42.04633712768555, "global_step": 323776, "epoch": 2675} {"train_loss": -42.5202751159668, "global_step": 323777, "epoch": 2675} {"train_loss": -44.4409065246582, "global_step": 323778, "epoch": 2675} {"train_loss": -43.66465759277344, "global_step": 323779, "epoch": 2675} {"train_loss": -43.662193298339844, "global_step": 323780, "epoch": 2675} {"train_loss": -43.1943473815918, "global_step": 323781, "epoch": 2675} {"train_loss": -44.233985900878906, "global_step": 323782, "epoch": 2675} {"train_loss": -43.041160583496094, "global_step": 323783, "epoch": 2675} {"train_loss": -44.12704086303711, "global_step": 323784, "epoch": 2675} {"train_loss": -44.21649932861328, "global_step": 323785, "epoch": 2675} {"train_loss": -43.15291976928711, "global_step": 323786, "epoch": 2675} {"train_loss": -44.069454193115234, "global_step": 323787, "epoch": 2675} {"train_loss": -42.915435791015625, "global_step": 323788, "epoch": 2675} {"train_loss": -42.86948776245117, "global_step": 323789, "epoch": 2675} {"train_loss": -44.27506637573242, "global_step": 323790, "epoch": 2675} {"train_loss": -42.41683578491211, "global_step": 323791, "epoch": 2675} {"train_loss": -42.37297439575195, "global_step": 323792, "epoch": 2675} {"train_loss": -43.427852630615234, "global_step": 323793, "epoch": 2675} {"train_loss": -42.9200439453125, "global_step": 323794, "epoch": 2675} {"train_loss": -43.710691625421696, "global_step": 323795, "epoch": 2675, "val_loss": 2689758.25} {"train_loss": -43.71997833251953, "global_step": 323796, "epoch": 2676} {"train_loss": -41.55009078979492, "global_step": 323797, "epoch": 2676} {"train_loss": -43.3071403503418, "global_step": 323798, "epoch": 2676} {"train_loss": -43.547332763671875, "global_step": 323799, "epoch": 2676} {"train_loss": -42.94800567626953, "global_step": 323800, "epoch": 2676} {"train_loss": -43.30453872680664, "global_step": 323801, "epoch": 2676} {"train_loss": -43.867591857910156, "global_step": 323802, "epoch": 2676} {"train_loss": -43.65964889526367, "global_step": 323803, "epoch": 2676} {"train_loss": -44.095272064208984, "global_step": 323804, "epoch": 2676} {"train_loss": -44.0844612121582, "global_step": 323805, "epoch": 2676} {"train_loss": -44.196998596191406, "global_step": 323806, "epoch": 2676} {"train_loss": -44.944313049316406, "global_step": 323807, "epoch": 2676} {"train_loss": -44.21824264526367, "global_step": 323808, "epoch": 2676} {"train_loss": -43.845672607421875, "global_step": 323809, "epoch": 2676} {"train_loss": -44.480262756347656, "global_step": 323810, "epoch": 2676} {"train_loss": -43.85833740234375, "global_step": 323811, "epoch": 2676} {"train_loss": -44.7697639465332, "global_step": 323812, "epoch": 2676} {"train_loss": -44.235107421875, "global_step": 323813, "epoch": 2676} {"train_loss": -43.476966857910156, "global_step": 323814, "epoch": 2676} {"train_loss": -43.70954513549805, "global_step": 323815, "epoch": 2676} {"train_loss": -43.9039306640625, "global_step": 323816, "epoch": 2676} {"train_loss": -43.82191848754883, "global_step": 323817, "epoch": 2676} {"train_loss": -43.9682731628418, "global_step": 323818, "epoch": 2676} {"train_loss": -44.782291412353516, "global_step": 323819, "epoch": 2676} {"train_loss": -43.839752197265625, "global_step": 323820, "epoch": 2676} {"train_loss": -44.08347702026367, "global_step": 323821, "epoch": 2676} {"train_loss": -45.085365295410156, "global_step": 323822, "epoch": 2676} {"train_loss": -43.434078216552734, "global_step": 323823, "epoch": 2676} {"train_loss": -44.4702262878418, "global_step": 323824, "epoch": 2676} {"train_loss": -45.11725616455078, "global_step": 323825, "epoch": 2676} {"train_loss": -43.42597579956055, "global_step": 323826, "epoch": 2676} {"train_loss": -43.401912689208984, "global_step": 323827, "epoch": 2676} {"train_loss": -44.4150276184082, "global_step": 323828, "epoch": 2676} {"train_loss": -43.584346771240234, "global_step": 323829, "epoch": 2676} {"train_loss": -44.66270446777344, "global_step": 323830, "epoch": 2676} {"train_loss": -44.6846923828125, "global_step": 323831, "epoch": 2676} {"train_loss": -44.25536346435547, "global_step": 323832, "epoch": 2676} {"train_loss": -45.26601791381836, "global_step": 323833, "epoch": 2676} {"train_loss": -43.74033737182617, "global_step": 323834, "epoch": 2676} {"train_loss": -44.23350143432617, "global_step": 323835, "epoch": 2676} {"train_loss": -44.74675369262695, "global_step": 323836, "epoch": 2676} {"train_loss": -43.82662582397461, "global_step": 323837, "epoch": 2676} {"train_loss": -43.04109573364258, "global_step": 323838, "epoch": 2676} {"train_loss": -44.86438751220703, "global_step": 323839, "epoch": 2676} {"train_loss": -44.322547912597656, "global_step": 323840, "epoch": 2676} {"train_loss": -45.124935150146484, "global_step": 323841, "epoch": 2676} {"train_loss": -45.09640121459961, "global_step": 323842, "epoch": 2676} {"train_loss": -44.67533493041992, "global_step": 323843, "epoch": 2676} {"train_loss": -44.93310546875, "global_step": 323844, "epoch": 2676} {"train_loss": -44.89609909057617, "global_step": 323845, "epoch": 2676} {"train_loss": -45.178802490234375, "global_step": 323846, "epoch": 2676} {"train_loss": -44.72114181518555, "global_step": 323847, "epoch": 2676} {"train_loss": -44.50669479370117, "global_step": 323848, "epoch": 2676} {"train_loss": -44.898223876953125, "global_step": 323849, "epoch": 2676} {"train_loss": -43.7166633605957, "global_step": 323850, "epoch": 2676} {"train_loss": -44.14033126831055, "global_step": 323851, "epoch": 2676} {"train_loss": -44.78064727783203, "global_step": 323852, "epoch": 2676} {"train_loss": -43.98271560668945, "global_step": 323853, "epoch": 2676} {"train_loss": -44.89970779418945, "global_step": 323854, "epoch": 2676} {"train_loss": -43.7860107421875, "global_step": 323855, "epoch": 2676} {"train_loss": -45.45827102661133, "global_step": 323856, "epoch": 2676} {"train_loss": -43.442501068115234, "global_step": 323857, "epoch": 2676} {"train_loss": -44.960628509521484, "global_step": 323858, "epoch": 2676} {"train_loss": -43.60860061645508, "global_step": 323859, "epoch": 2676} {"train_loss": -44.873748779296875, "global_step": 323860, "epoch": 2676} {"train_loss": -45.05703353881836, "global_step": 323861, "epoch": 2676} {"train_loss": -44.964881896972656, "global_step": 323862, "epoch": 2676} {"train_loss": -45.391475677490234, "global_step": 323863, "epoch": 2676} {"train_loss": -44.79502868652344, "global_step": 323864, "epoch": 2676} {"train_loss": -44.42710876464844, "global_step": 323865, "epoch": 2676} {"train_loss": -44.99016189575195, "global_step": 323866, "epoch": 2676} {"train_loss": -45.43111038208008, "global_step": 323867, "epoch": 2676} {"train_loss": -45.043556213378906, "global_step": 323868, "epoch": 2676} {"train_loss": -45.45589065551758, "global_step": 323869, "epoch": 2676} {"train_loss": -45.03032302856445, "global_step": 323870, "epoch": 2676} {"train_loss": -45.47129440307617, "global_step": 323871, "epoch": 2676} {"train_loss": -44.85369873046875, "global_step": 323872, "epoch": 2676} {"train_loss": -45.21628952026367, "global_step": 323873, "epoch": 2676} {"train_loss": -44.62071990966797, "global_step": 323874, "epoch": 2676} {"train_loss": -45.188232421875, "global_step": 323875, "epoch": 2676} {"train_loss": -45.46165084838867, "global_step": 323876, "epoch": 2676} {"train_loss": -45.600830078125, "global_step": 323877, "epoch": 2676} {"train_loss": -45.368751525878906, "global_step": 323878, "epoch": 2676} {"train_loss": -45.2876091003418, "global_step": 323879, "epoch": 2676} {"train_loss": -45.32119369506836, "global_step": 323880, "epoch": 2676} {"train_loss": -45.19245147705078, "global_step": 323881, "epoch": 2676} {"train_loss": -45.26727294921875, "global_step": 323882, "epoch": 2676} {"train_loss": -45.0656852722168, "global_step": 323883, "epoch": 2676} {"train_loss": -44.82744216918945, "global_step": 323884, "epoch": 2676} {"train_loss": -43.31246566772461, "global_step": 323885, "epoch": 2676} {"train_loss": -39.2433967590332, "global_step": 323886, "epoch": 2676} {"train_loss": -38.71963119506836, "global_step": 323887, "epoch": 2676} {"train_loss": -44.833736419677734, "global_step": 323888, "epoch": 2676} {"train_loss": -38.68883514404297, "global_step": 323889, "epoch": 2676} {"train_loss": -33.699432373046875, "global_step": 323890, "epoch": 2676} {"train_loss": -17.60590934753418, "global_step": 323891, "epoch": 2676} {"train_loss": -32.286903381347656, "global_step": 323892, "epoch": 2676} {"train_loss": -22.479549407958984, "global_step": 323893, "epoch": 2676} {"train_loss": -31.944366455078125, "global_step": 323894, "epoch": 2676} {"train_loss": -32.258113861083984, "global_step": 323895, "epoch": 2676} {"train_loss": -25.81207847595215, "global_step": 323896, "epoch": 2676} {"train_loss": -33.00456619262695, "global_step": 323897, "epoch": 2676} {"train_loss": -33.31634521484375, "global_step": 323898, "epoch": 2676} {"train_loss": -32.0213623046875, "global_step": 323899, "epoch": 2676} {"train_loss": -30.754369735717773, "global_step": 323900, "epoch": 2676} {"train_loss": -34.76398468017578, "global_step": 323901, "epoch": 2676} {"train_loss": -34.44956588745117, "global_step": 323902, "epoch": 2676} {"train_loss": -31.5472354888916, "global_step": 323903, "epoch": 2676} {"train_loss": -33.405941009521484, "global_step": 323904, "epoch": 2676} {"train_loss": -34.95207977294922, "global_step": 323905, "epoch": 2676} {"train_loss": -33.192100524902344, "global_step": 323906, "epoch": 2676} {"train_loss": -32.92753982543945, "global_step": 323907, "epoch": 2676} {"train_loss": -34.03606033325195, "global_step": 323908, "epoch": 2676} {"train_loss": -35.6575813293457, "global_step": 323909, "epoch": 2676} {"train_loss": -35.16813278198242, "global_step": 323910, "epoch": 2676} {"train_loss": -33.77482986450195, "global_step": 323911, "epoch": 2676} {"train_loss": -35.16004180908203, "global_step": 323912, "epoch": 2676} {"train_loss": -35.71997833251953, "global_step": 323913, "epoch": 2676} {"train_loss": -35.908443450927734, "global_step": 323914, "epoch": 2676} {"train_loss": -34.79258728027344, "global_step": 323915, "epoch": 2676} {"train_loss": -41.62595515605832, "global_step": 323916, "epoch": 2676, "val_loss": 2712451.0} {"train_loss": -34.96723556518555, "global_step": 323917, "epoch": 2677} {"train_loss": -36.101966857910156, "global_step": 323918, "epoch": 2677} {"train_loss": -36.16472625732422, "global_step": 323919, "epoch": 2677} {"train_loss": -35.47547149658203, "global_step": 323920, "epoch": 2677} {"train_loss": -35.99931716918945, "global_step": 323921, "epoch": 2677} {"train_loss": -36.58424758911133, "global_step": 323922, "epoch": 2677} {"train_loss": -35.3248176574707, "global_step": 323923, "epoch": 2677} {"train_loss": -35.72799301147461, "global_step": 323924, "epoch": 2677} {"train_loss": -37.13595199584961, "global_step": 323925, "epoch": 2677} {"train_loss": -36.1088752746582, "global_step": 323926, "epoch": 2677} {"train_loss": -36.181060791015625, "global_step": 323927, "epoch": 2677} {"train_loss": -36.46498107910156, "global_step": 323928, "epoch": 2677} {"train_loss": -36.69563293457031, "global_step": 323929, "epoch": 2677} {"train_loss": -37.032508850097656, "global_step": 323930, "epoch": 2677} {"train_loss": -37.41850662231445, "global_step": 323931, "epoch": 2677} {"train_loss": -37.91901779174805, "global_step": 323932, "epoch": 2677} {"train_loss": -37.395870208740234, "global_step": 323933, "epoch": 2677} {"train_loss": -37.16184616088867, "global_step": 323934, "epoch": 2677} {"train_loss": -37.976844787597656, "global_step": 323935, "epoch": 2677} {"train_loss": -38.147613525390625, "global_step": 323936, "epoch": 2677} {"train_loss": -38.189056396484375, "global_step": 323937, "epoch": 2677} {"train_loss": -37.79978561401367, "global_step": 323938, "epoch": 2677} {"train_loss": -38.7733268737793, "global_step": 323939, "epoch": 2677} {"train_loss": -38.328853607177734, "global_step": 323940, "epoch": 2677} {"train_loss": -37.7484130859375, "global_step": 323941, "epoch": 2677} {"train_loss": -38.55459213256836, "global_step": 323942, "epoch": 2677} {"train_loss": -37.64154815673828, "global_step": 323943, "epoch": 2677} {"train_loss": -38.534088134765625, "global_step": 323944, "epoch": 2677} {"train_loss": -39.102291107177734, "global_step": 323945, "epoch": 2677} {"train_loss": -38.4264030456543, "global_step": 323946, "epoch": 2677} {"train_loss": -39.374481201171875, "global_step": 323947, "epoch": 2677} {"train_loss": -38.293243408203125, "global_step": 323948, "epoch": 2677} {"train_loss": -38.759368896484375, "global_step": 323949, "epoch": 2677} {"train_loss": -38.69609451293945, "global_step": 323950, "epoch": 2677} {"train_loss": -39.46014404296875, "global_step": 323951, "epoch": 2677} {"train_loss": -39.5394401550293, "global_step": 323952, "epoch": 2677} {"train_loss": -39.718223571777344, "global_step": 323953, "epoch": 2677} {"train_loss": -39.0744743347168, "global_step": 323954, "epoch": 2677} {"train_loss": -39.22603988647461, "global_step": 323955, "epoch": 2677} {"train_loss": -39.10572052001953, "global_step": 323956, "epoch": 2677} {"train_loss": -39.460670471191406, "global_step": 323957, "epoch": 2677} {"train_loss": -39.43581771850586, "global_step": 323958, "epoch": 2677} {"train_loss": -39.46549606323242, "global_step": 323959, "epoch": 2677} {"train_loss": -39.603878021240234, "global_step": 323960, "epoch": 2677} {"train_loss": -39.896240234375, "global_step": 323961, "epoch": 2677} {"train_loss": -40.34879684448242, "global_step": 323962, "epoch": 2677} {"train_loss": -40.58074951171875, "global_step": 323963, "epoch": 2677} {"train_loss": -40.24773025512695, "global_step": 323964, "epoch": 2677} {"train_loss": -40.17316818237305, "global_step": 323965, "epoch": 2677} {"train_loss": -40.265350341796875, "global_step": 323966, "epoch": 2677} {"train_loss": -40.27131652832031, "global_step": 323967, "epoch": 2677} {"train_loss": -40.750389099121094, "global_step": 323968, "epoch": 2677} {"train_loss": -40.73208236694336, "global_step": 323969, "epoch": 2677} {"train_loss": -40.77415084838867, "global_step": 323970, "epoch": 2677} {"train_loss": -40.525856018066406, "global_step": 323971, "epoch": 2677} {"train_loss": -40.53203582763672, "global_step": 323972, "epoch": 2677} {"train_loss": -40.36551284790039, "global_step": 323973, "epoch": 2677} {"train_loss": -40.789058685302734, "global_step": 323974, "epoch": 2677} {"train_loss": -41.04307174682617, "global_step": 323975, "epoch": 2677} {"train_loss": -41.21449661254883, "global_step": 323976, "epoch": 2677} {"train_loss": -41.1712760925293, "global_step": 323977, "epoch": 2677} {"train_loss": -41.20176315307617, "global_step": 323978, "epoch": 2677} {"train_loss": -40.637855529785156, "global_step": 323979, "epoch": 2677} {"train_loss": -41.17552185058594, "global_step": 323980, "epoch": 2677} {"train_loss": -40.3229866027832, "global_step": 323981, "epoch": 2677} {"train_loss": -40.43699264526367, "global_step": 323982, "epoch": 2677} {"train_loss": -40.206787109375, "global_step": 323983, "epoch": 2677} {"train_loss": -42.138118743896484, "global_step": 323984, "epoch": 2677} {"train_loss": -41.13578414916992, "global_step": 323985, "epoch": 2677} {"train_loss": -39.28169631958008, "global_step": 323986, "epoch": 2677} {"train_loss": -41.72689437866211, "global_step": 323987, "epoch": 2677} {"train_loss": -41.27617263793945, "global_step": 323988, "epoch": 2677} {"train_loss": -40.97674560546875, "global_step": 323989, "epoch": 2677} {"train_loss": -40.14924240112305, "global_step": 323990, "epoch": 2677} {"train_loss": -41.77714538574219, "global_step": 323991, "epoch": 2677} {"train_loss": -40.956756591796875, "global_step": 323992, "epoch": 2677} {"train_loss": -40.8021240234375, "global_step": 323993, "epoch": 2677} {"train_loss": -42.1989631652832, "global_step": 323994, "epoch": 2677} {"train_loss": -41.53557205200195, "global_step": 323995, "epoch": 2677} {"train_loss": -41.87148666381836, "global_step": 323996, "epoch": 2677} {"train_loss": -41.25022888183594, "global_step": 323997, "epoch": 2677} {"train_loss": -41.67818069458008, "global_step": 323998, "epoch": 2677} {"train_loss": -41.91084671020508, "global_step": 323999, "epoch": 2677} {"train_loss": -41.14397430419922, "global_step": 324000, "epoch": 2677} {"train_loss": -41.453548431396484, "global_step": 324001, "epoch": 2677} {"train_loss": -41.618717193603516, "global_step": 324002, "epoch": 2677} {"train_loss": -42.404911041259766, "global_step": 324003, "epoch": 2677} {"train_loss": -41.71621322631836, "global_step": 324004, "epoch": 2677} {"train_loss": -41.56755447387695, "global_step": 324005, "epoch": 2677} {"train_loss": -41.401981353759766, "global_step": 324006, "epoch": 2677} {"train_loss": -41.42681121826172, "global_step": 324007, "epoch": 2677} {"train_loss": -42.57546615600586, "global_step": 324008, "epoch": 2677} {"train_loss": -42.804115295410156, "global_step": 324009, "epoch": 2677} {"train_loss": -42.15676498413086, "global_step": 324010, "epoch": 2677} {"train_loss": -40.3939094543457, "global_step": 324011, "epoch": 2677} {"train_loss": -42.349891662597656, "global_step": 324012, "epoch": 2677} {"train_loss": -42.53068542480469, "global_step": 324013, "epoch": 2677} {"train_loss": -42.491050720214844, "global_step": 324014, "epoch": 2677} {"train_loss": -42.87858200073242, "global_step": 324015, "epoch": 2677} {"train_loss": -42.57330322265625, "global_step": 324016, "epoch": 2677} {"train_loss": -42.258583068847656, "global_step": 324017, "epoch": 2677} {"train_loss": -42.21690368652344, "global_step": 324018, "epoch": 2677} {"train_loss": -42.16071701049805, "global_step": 324019, "epoch": 2677} {"train_loss": -42.44263458251953, "global_step": 324020, "epoch": 2677} {"train_loss": -42.5516242980957, "global_step": 324021, "epoch": 2677} {"train_loss": -42.4286994934082, "global_step": 324022, "epoch": 2677} {"train_loss": -40.56686019897461, "global_step": 324023, "epoch": 2677} {"train_loss": -37.965911865234375, "global_step": 324024, "epoch": 2677} {"train_loss": -40.79951477050781, "global_step": 324025, "epoch": 2677} {"train_loss": -42.13923263549805, "global_step": 324026, "epoch": 2677} {"train_loss": -41.84017562866211, "global_step": 324027, "epoch": 2677} {"train_loss": -42.822364807128906, "global_step": 324028, "epoch": 2677} {"train_loss": -39.24848556518555, "global_step": 324029, "epoch": 2677} {"train_loss": -41.20981979370117, "global_step": 324030, "epoch": 2677} {"train_loss": -41.63856506347656, "global_step": 324031, "epoch": 2677} {"train_loss": -39.691261291503906, "global_step": 324032, "epoch": 2677} {"train_loss": -41.12516403198242, "global_step": 324033, "epoch": 2677} {"train_loss": -40.19428634643555, "global_step": 324034, "epoch": 2677} {"train_loss": -37.54337692260742, "global_step": 324035, "epoch": 2677} {"train_loss": -41.732948303222656, "global_step": 324036, "epoch": 2677} {"train_loss": -39.95369881243745, "global_step": 324037, "epoch": 2677, "val_loss": 2692845.25} {"train_loss": -30.39739418029785, "global_step": 324038, "epoch": 2678} {"train_loss": -42.06123733520508, "global_step": 324039, "epoch": 2678} {"train_loss": -37.8261833190918, "global_step": 324040, "epoch": 2678} {"train_loss": -34.636592864990234, "global_step": 324041, "epoch": 2678} {"train_loss": -23.689226150512695, "global_step": 324042, "epoch": 2678} {"train_loss": -40.039730072021484, "global_step": 324043, "epoch": 2678} {"train_loss": -39.482975006103516, "global_step": 324044, "epoch": 2678} {"train_loss": -34.794063568115234, "global_step": 324045, "epoch": 2678} {"train_loss": -28.220474243164062, "global_step": 324046, "epoch": 2678} {"train_loss": -28.906269073486328, "global_step": 324047, "epoch": 2678} {"train_loss": -17.703296661376953, "global_step": 324048, "epoch": 2678} {"train_loss": -35.60184097290039, "global_step": 324049, "epoch": 2678} {"train_loss": -26.699735641479492, "global_step": 324050, "epoch": 2678} {"train_loss": -33.71012496948242, "global_step": 324051, "epoch": 2678} {"train_loss": -34.67102813720703, "global_step": 324052, "epoch": 2678} {"train_loss": -29.326444625854492, "global_step": 324053, "epoch": 2678} {"train_loss": -35.93156433105469, "global_step": 324054, "epoch": 2678} {"train_loss": -34.32651901245117, "global_step": 324055, "epoch": 2678} {"train_loss": -24.782861709594727, "global_step": 324056, "epoch": 2678} {"train_loss": -34.277442932128906, "global_step": 324057, "epoch": 2678} {"train_loss": -36.655982971191406, "global_step": 324058, "epoch": 2678} {"train_loss": -35.56975173950195, "global_step": 324059, "epoch": 2678} {"train_loss": -34.543006896972656, "global_step": 324060, "epoch": 2678} {"train_loss": -36.39370346069336, "global_step": 324061, "epoch": 2678} {"train_loss": -37.262935638427734, "global_step": 324062, "epoch": 2678} {"train_loss": -35.092838287353516, "global_step": 324063, "epoch": 2678} {"train_loss": -31.865467071533203, "global_step": 324064, "epoch": 2678} {"train_loss": -34.37446975708008, "global_step": 324065, "epoch": 2678} {"train_loss": -35.677486419677734, "global_step": 324066, "epoch": 2678} {"train_loss": -37.260799407958984, "global_step": 324067, "epoch": 2678} {"train_loss": -37.842037200927734, "global_step": 324068, "epoch": 2678} {"train_loss": -37.36354446411133, "global_step": 324069, "epoch": 2678} {"train_loss": -37.97062301635742, "global_step": 324070, "epoch": 2678} {"train_loss": -37.3138313293457, "global_step": 324071, "epoch": 2678} {"train_loss": -36.93817138671875, "global_step": 324072, "epoch": 2678} {"train_loss": -37.627620697021484, "global_step": 324073, "epoch": 2678} {"train_loss": -38.06135177612305, "global_step": 324074, "epoch": 2678} {"train_loss": -37.45594787597656, "global_step": 324075, "epoch": 2678} {"train_loss": -38.220455169677734, "global_step": 324076, "epoch": 2678} {"train_loss": -37.66033935546875, "global_step": 324077, "epoch": 2678} {"train_loss": -38.36807632446289, "global_step": 324078, "epoch": 2678} {"train_loss": -37.714813232421875, "global_step": 324079, "epoch": 2678} {"train_loss": -37.98130416870117, "global_step": 324080, "epoch": 2678} {"train_loss": -38.142791748046875, "global_step": 324081, "epoch": 2678} {"train_loss": -37.8418083190918, "global_step": 324082, "epoch": 2678} {"train_loss": -37.91047286987305, "global_step": 324083, "epoch": 2678} {"train_loss": -38.52713394165039, "global_step": 324084, "epoch": 2678} {"train_loss": -38.52912139892578, "global_step": 324085, "epoch": 2678} {"train_loss": -37.44437789916992, "global_step": 324086, "epoch": 2678} {"train_loss": -38.45907211303711, "global_step": 324087, "epoch": 2678} {"train_loss": -39.36463928222656, "global_step": 324088, "epoch": 2678} {"train_loss": -38.13617706298828, "global_step": 324089, "epoch": 2678} {"train_loss": -39.22468948364258, "global_step": 324090, "epoch": 2678} {"train_loss": -38.41621780395508, "global_step": 324091, "epoch": 2678} {"train_loss": -39.55118942260742, "global_step": 324092, "epoch": 2678} {"train_loss": -37.85276412963867, "global_step": 324093, "epoch": 2678} {"train_loss": -38.97516632080078, "global_step": 324094, "epoch": 2678} {"train_loss": -39.10392379760742, "global_step": 324095, "epoch": 2678} {"train_loss": -39.47495651245117, "global_step": 324096, "epoch": 2678} {"train_loss": -39.54703903198242, "global_step": 324097, "epoch": 2678} {"train_loss": -39.32735824584961, "global_step": 324098, "epoch": 2678} {"train_loss": -39.92667770385742, "global_step": 324099, "epoch": 2678} {"train_loss": -39.56050491333008, "global_step": 324100, "epoch": 2678} {"train_loss": -39.10798263549805, "global_step": 324101, "epoch": 2678} {"train_loss": -40.18440246582031, "global_step": 324102, "epoch": 2678} {"train_loss": -39.25212097167969, "global_step": 324103, "epoch": 2678} {"train_loss": -39.31742477416992, "global_step": 324104, "epoch": 2678} {"train_loss": -39.305572509765625, "global_step": 324105, "epoch": 2678} {"train_loss": -39.7755241394043, "global_step": 324106, "epoch": 2678} {"train_loss": -39.62321472167969, "global_step": 324107, "epoch": 2678} {"train_loss": -39.86367416381836, "global_step": 324108, "epoch": 2678} {"train_loss": -39.953636169433594, "global_step": 324109, "epoch": 2678} {"train_loss": -39.671478271484375, "global_step": 324110, "epoch": 2678} {"train_loss": -39.631378173828125, "global_step": 324111, "epoch": 2678} {"train_loss": -39.50702667236328, "global_step": 324112, "epoch": 2678} {"train_loss": -40.45086669921875, "global_step": 324113, "epoch": 2678} {"train_loss": -39.268348693847656, "global_step": 324114, "epoch": 2678} {"train_loss": -39.34296417236328, "global_step": 324115, "epoch": 2678} {"train_loss": -40.865726470947266, "global_step": 324116, "epoch": 2678} {"train_loss": -40.73652267456055, "global_step": 324117, "epoch": 2678} {"train_loss": -40.17148971557617, "global_step": 324118, "epoch": 2678} {"train_loss": -40.43999099731445, "global_step": 324119, "epoch": 2678} {"train_loss": -40.51150131225586, "global_step": 324120, "epoch": 2678} {"train_loss": -40.24677658081055, "global_step": 324121, "epoch": 2678} {"train_loss": -40.22684860229492, "global_step": 324122, "epoch": 2678} {"train_loss": -40.24852752685547, "global_step": 324123, "epoch": 2678} {"train_loss": -40.61174392700195, "global_step": 324124, "epoch": 2678} {"train_loss": -40.33275604248047, "global_step": 324125, "epoch": 2678} {"train_loss": -40.27511978149414, "global_step": 324126, "epoch": 2678} {"train_loss": -40.4240837097168, "global_step": 324127, "epoch": 2678} {"train_loss": -40.50100326538086, "global_step": 324128, "epoch": 2678} {"train_loss": -40.9179801940918, "global_step": 324129, "epoch": 2678} {"train_loss": -41.03123092651367, "global_step": 324130, "epoch": 2678} {"train_loss": -39.62824630737305, "global_step": 324131, "epoch": 2678} {"train_loss": -40.870357513427734, "global_step": 324132, "epoch": 2678} {"train_loss": -41.28017807006836, "global_step": 324133, "epoch": 2678} {"train_loss": -40.452022552490234, "global_step": 324134, "epoch": 2678} {"train_loss": -39.07967758178711, "global_step": 324135, "epoch": 2678} {"train_loss": -40.95785140991211, "global_step": 324136, "epoch": 2678} {"train_loss": -40.78789520263672, "global_step": 324137, "epoch": 2678} {"train_loss": -40.475704193115234, "global_step": 324138, "epoch": 2678} {"train_loss": -40.81287384033203, "global_step": 324139, "epoch": 2678} {"train_loss": -38.82356262207031, "global_step": 324140, "epoch": 2678} {"train_loss": -40.86103057861328, "global_step": 324141, "epoch": 2678} {"train_loss": -41.56138229370117, "global_step": 324142, "epoch": 2678} {"train_loss": -41.046875, "global_step": 324143, "epoch": 2678} {"train_loss": -40.98929977416992, "global_step": 324144, "epoch": 2678} {"train_loss": -41.455787658691406, "global_step": 324145, "epoch": 2678} {"train_loss": -39.936553955078125, "global_step": 324146, "epoch": 2678} {"train_loss": -41.25300216674805, "global_step": 324147, "epoch": 2678} {"train_loss": -41.05125045776367, "global_step": 324148, "epoch": 2678} {"train_loss": -41.12510299682617, "global_step": 324149, "epoch": 2678} {"train_loss": -41.388946533203125, "global_step": 324150, "epoch": 2678} {"train_loss": -41.36467361450195, "global_step": 324151, "epoch": 2678} {"train_loss": -37.04889678955078, "global_step": 324152, "epoch": 2678} {"train_loss": -40.726806640625, "global_step": 324153, "epoch": 2678} {"train_loss": -41.733123779296875, "global_step": 324154, "epoch": 2678} {"train_loss": -40.715389251708984, "global_step": 324155, "epoch": 2678} {"train_loss": -41.694454193115234, "global_step": 324156, "epoch": 2678} {"train_loss": -41.26936721801758, "global_step": 324157, "epoch": 2678} {"train_loss": -38.092746277486, "global_step": 324158, "epoch": 2678, "val_loss": 2786707.25} {"train_loss": -40.08840560913086, "global_step": 324159, "epoch": 2679} {"train_loss": -39.37943649291992, "global_step": 324160, "epoch": 2679} {"train_loss": -42.18227767944336, "global_step": 324161, "epoch": 2679} {"train_loss": -38.652565002441406, "global_step": 324162, "epoch": 2679} {"train_loss": -40.90371322631836, "global_step": 324163, "epoch": 2679} {"train_loss": -40.34912872314453, "global_step": 324164, "epoch": 2679} {"train_loss": -41.977638244628906, "global_step": 324165, "epoch": 2679} {"train_loss": -42.05598068237305, "global_step": 324166, "epoch": 2679} {"train_loss": -39.83118438720703, "global_step": 324167, "epoch": 2679} {"train_loss": -41.704559326171875, "global_step": 324168, "epoch": 2679} {"train_loss": -40.51310348510742, "global_step": 324169, "epoch": 2679} {"train_loss": -41.00880813598633, "global_step": 324170, "epoch": 2679} {"train_loss": -41.351627349853516, "global_step": 324171, "epoch": 2679} {"train_loss": -38.90791702270508, "global_step": 324172, "epoch": 2679} {"train_loss": -41.45462417602539, "global_step": 324173, "epoch": 2679} {"train_loss": -39.28581619262695, "global_step": 324174, "epoch": 2679} {"train_loss": -41.46751022338867, "global_step": 324175, "epoch": 2679} {"train_loss": -41.513771057128906, "global_step": 324176, "epoch": 2679} {"train_loss": -39.611488342285156, "global_step": 324177, "epoch": 2679} {"train_loss": -40.080841064453125, "global_step": 324178, "epoch": 2679} {"train_loss": -41.32509994506836, "global_step": 324179, "epoch": 2679} {"train_loss": -41.36262893676758, "global_step": 324180, "epoch": 2679} {"train_loss": -39.128273010253906, "global_step": 324181, "epoch": 2679} {"train_loss": -39.52962875366211, "global_step": 324182, "epoch": 2679} {"train_loss": -39.600730895996094, "global_step": 324183, "epoch": 2679} {"train_loss": -36.9846305847168, "global_step": 324184, "epoch": 2679} {"train_loss": -39.20040512084961, "global_step": 324185, "epoch": 2679} {"train_loss": -40.997093200683594, "global_step": 324186, "epoch": 2679} {"train_loss": -39.49436569213867, "global_step": 324187, "epoch": 2679} {"train_loss": -40.38662338256836, "global_step": 324188, "epoch": 2679} {"train_loss": -40.95260238647461, "global_step": 324189, "epoch": 2679} {"train_loss": -40.08144760131836, "global_step": 324190, "epoch": 2679} {"train_loss": -40.969764709472656, "global_step": 324191, "epoch": 2679} {"train_loss": -40.914031982421875, "global_step": 324192, "epoch": 2679} {"train_loss": -41.7958869934082, "global_step": 324193, "epoch": 2679} {"train_loss": -41.779964447021484, "global_step": 324194, "epoch": 2679} {"train_loss": -40.96106719970703, "global_step": 324195, "epoch": 2679} {"train_loss": -41.47978591918945, "global_step": 324196, "epoch": 2679} {"train_loss": -42.20581817626953, "global_step": 324197, "epoch": 2679} {"train_loss": -41.81201171875, "global_step": 324198, "epoch": 2679} {"train_loss": -40.91626739501953, "global_step": 324199, "epoch": 2679} {"train_loss": -41.2435302734375, "global_step": 324200, "epoch": 2679} {"train_loss": -39.94773483276367, "global_step": 324201, "epoch": 2679} {"train_loss": -40.897193908691406, "global_step": 324202, "epoch": 2679} {"train_loss": -41.25832748413086, "global_step": 324203, "epoch": 2679} {"train_loss": -41.286109924316406, "global_step": 324204, "epoch": 2679} {"train_loss": -41.68625259399414, "global_step": 324205, "epoch": 2679} {"train_loss": -41.56611251831055, "global_step": 324206, "epoch": 2679} {"train_loss": -39.793636322021484, "global_step": 324207, "epoch": 2679} {"train_loss": -41.55039596557617, "global_step": 324208, "epoch": 2679} {"train_loss": -40.89408874511719, "global_step": 324209, "epoch": 2679} {"train_loss": -42.59455490112305, "global_step": 324210, "epoch": 2679} {"train_loss": -41.520503997802734, "global_step": 324211, "epoch": 2679} {"train_loss": -40.18754196166992, "global_step": 324212, "epoch": 2679} {"train_loss": -40.242488861083984, "global_step": 324213, "epoch": 2679} {"train_loss": -41.99712371826172, "global_step": 324214, "epoch": 2679} {"train_loss": -41.571937561035156, "global_step": 324215, "epoch": 2679} {"train_loss": -41.822021484375, "global_step": 324216, "epoch": 2679} {"train_loss": -41.39435958862305, "global_step": 324217, "epoch": 2679} {"train_loss": -41.26770782470703, "global_step": 324218, "epoch": 2679} {"train_loss": -42.004058837890625, "global_step": 324219, "epoch": 2679} {"train_loss": -40.86766815185547, "global_step": 324220, "epoch": 2679} {"train_loss": -41.897979736328125, "global_step": 324221, "epoch": 2679} {"train_loss": -40.858062744140625, "global_step": 324222, "epoch": 2679} {"train_loss": -39.43238830566406, "global_step": 324223, "epoch": 2679} {"train_loss": -39.56535720825195, "global_step": 324224, "epoch": 2679} {"train_loss": -40.31415939331055, "global_step": 324225, "epoch": 2679} {"train_loss": -41.55021286010742, "global_step": 324226, "epoch": 2679} {"train_loss": -41.08306884765625, "global_step": 324227, "epoch": 2679} {"train_loss": -39.8474235534668, "global_step": 324228, "epoch": 2679} {"train_loss": -41.24879837036133, "global_step": 324229, "epoch": 2679} {"train_loss": -41.024105072021484, "global_step": 324230, "epoch": 2679} {"train_loss": -40.53573989868164, "global_step": 324231, "epoch": 2679} {"train_loss": -41.76527404785156, "global_step": 324232, "epoch": 2679} {"train_loss": -40.86003875732422, "global_step": 324233, "epoch": 2679} {"train_loss": -42.239898681640625, "global_step": 324234, "epoch": 2679} {"train_loss": -41.66511154174805, "global_step": 324235, "epoch": 2679} {"train_loss": -41.44197463989258, "global_step": 324236, "epoch": 2679} {"train_loss": -41.06462097167969, "global_step": 324237, "epoch": 2679} {"train_loss": -41.63386917114258, "global_step": 324238, "epoch": 2679} {"train_loss": -42.137855529785156, "global_step": 324239, "epoch": 2679} {"train_loss": -41.98622512817383, "global_step": 324240, "epoch": 2679} {"train_loss": -40.98873519897461, "global_step": 324241, "epoch": 2679} {"train_loss": -41.30365753173828, "global_step": 324242, "epoch": 2679} {"train_loss": -41.25031280517578, "global_step": 324243, "epoch": 2679} {"train_loss": -40.597625732421875, "global_step": 324244, "epoch": 2679} {"train_loss": -40.23575973510742, "global_step": 324245, "epoch": 2679} {"train_loss": -41.770145416259766, "global_step": 324246, "epoch": 2679} {"train_loss": -41.2277717590332, "global_step": 324247, "epoch": 2679} {"train_loss": -39.879634857177734, "global_step": 324248, "epoch": 2679} {"train_loss": -41.66617965698242, "global_step": 324249, "epoch": 2679} {"train_loss": -41.89878463745117, "global_step": 324250, "epoch": 2679} {"train_loss": -41.55521774291992, "global_step": 324251, "epoch": 2679} {"train_loss": -41.81022262573242, "global_step": 324252, "epoch": 2679} {"train_loss": -42.023590087890625, "global_step": 324253, "epoch": 2679} {"train_loss": -41.47998046875, "global_step": 324254, "epoch": 2679} {"train_loss": -39.8275260925293, "global_step": 324255, "epoch": 2679} {"train_loss": -41.25444412231445, "global_step": 324256, "epoch": 2679} {"train_loss": -41.91853713989258, "global_step": 324257, "epoch": 2679} {"train_loss": -41.638336181640625, "global_step": 324258, "epoch": 2679} {"train_loss": -42.4420280456543, "global_step": 324259, "epoch": 2679} {"train_loss": -42.57306671142578, "global_step": 324260, "epoch": 2679} {"train_loss": -39.77378463745117, "global_step": 324261, "epoch": 2679} {"train_loss": -41.71206283569336, "global_step": 324262, "epoch": 2679} {"train_loss": -41.784236907958984, "global_step": 324263, "epoch": 2679} {"train_loss": -40.94631576538086, "global_step": 324264, "epoch": 2679} {"train_loss": -42.89665985107422, "global_step": 324265, "epoch": 2679} {"train_loss": -43.143226623535156, "global_step": 324266, "epoch": 2679} {"train_loss": -42.630977630615234, "global_step": 324267, "epoch": 2679} {"train_loss": -42.55438232421875, "global_step": 324268, "epoch": 2679} {"train_loss": -42.67685317993164, "global_step": 324269, "epoch": 2679} {"train_loss": -42.23080062866211, "global_step": 324270, "epoch": 2679} {"train_loss": -41.5588493347168, "global_step": 324271, "epoch": 2679} {"train_loss": -42.80991744995117, "global_step": 324272, "epoch": 2679} {"train_loss": -42.7559814453125, "global_step": 324273, "epoch": 2679} {"train_loss": -41.9227294921875, "global_step": 324274, "epoch": 2679} {"train_loss": -41.67243576049805, "global_step": 324275, "epoch": 2679} {"train_loss": -42.39748001098633, "global_step": 324276, "epoch": 2679} {"train_loss": -41.89594268798828, "global_step": 324277, "epoch": 2679} {"train_loss": -42.841888427734375, "global_step": 324278, "epoch": 2679} {"train_loss": -41.1547749101623, "global_step": 324279, "epoch": 2679, "val_loss": 2813596.75} {"train_loss": -42.49810791015625, "global_step": 324280, "epoch": 2680} {"train_loss": -42.44782638549805, "global_step": 324281, "epoch": 2680} {"train_loss": -42.53403854370117, "global_step": 324282, "epoch": 2680} {"train_loss": -42.326820373535156, "global_step": 324283, "epoch": 2680} {"train_loss": -41.539756774902344, "global_step": 324284, "epoch": 2680} {"train_loss": -43.07514190673828, "global_step": 324285, "epoch": 2680} {"train_loss": -42.60322189331055, "global_step": 324286, "epoch": 2680} {"train_loss": -42.10535430908203, "global_step": 324287, "epoch": 2680} {"train_loss": -41.977577209472656, "global_step": 324288, "epoch": 2680} {"train_loss": -42.46636199951172, "global_step": 324289, "epoch": 2680} {"train_loss": -41.58819580078125, "global_step": 324290, "epoch": 2680} {"train_loss": -40.10836410522461, "global_step": 324291, "epoch": 2680} {"train_loss": -43.55458068847656, "global_step": 324292, "epoch": 2680} {"train_loss": -42.041202545166016, "global_step": 324293, "epoch": 2680} {"train_loss": -43.19005584716797, "global_step": 324294, "epoch": 2680} {"train_loss": -42.91998291015625, "global_step": 324295, "epoch": 2680} {"train_loss": -42.234554290771484, "global_step": 324296, "epoch": 2680} {"train_loss": -39.453426361083984, "global_step": 324297, "epoch": 2680} {"train_loss": -36.9736442565918, "global_step": 324298, "epoch": 2680} {"train_loss": -38.08937454223633, "global_step": 324299, "epoch": 2680} {"train_loss": -42.07964324951172, "global_step": 324300, "epoch": 2680} {"train_loss": -41.268157958984375, "global_step": 324301, "epoch": 2680} {"train_loss": -39.47060012817383, "global_step": 324302, "epoch": 2680} {"train_loss": -40.499847412109375, "global_step": 324303, "epoch": 2680} {"train_loss": -41.579280853271484, "global_step": 324304, "epoch": 2680} {"train_loss": -35.664207458496094, "global_step": 324305, "epoch": 2680} {"train_loss": -41.07965087890625, "global_step": 324306, "epoch": 2680} {"train_loss": -41.01580810546875, "global_step": 324307, "epoch": 2680} {"train_loss": -17.138620376586914, "global_step": 324308, "epoch": 2680} {"train_loss": -42.149959564208984, "global_step": 324309, "epoch": 2680} {"train_loss": -39.01300811767578, "global_step": 324310, "epoch": 2680} {"train_loss": -40.06878662109375, "global_step": 324311, "epoch": 2680} {"train_loss": -39.97239685058594, "global_step": 324312, "epoch": 2680} {"train_loss": -39.87641525268555, "global_step": 324313, "epoch": 2680} {"train_loss": -29.312335968017578, "global_step": 324314, "epoch": 2680} {"train_loss": -40.371456146240234, "global_step": 324315, "epoch": 2680} {"train_loss": -40.870113372802734, "global_step": 324316, "epoch": 2680} {"train_loss": -36.44868087768555, "global_step": 324317, "epoch": 2680} {"train_loss": -40.85651779174805, "global_step": 324318, "epoch": 2680} {"train_loss": -40.5191650390625, "global_step": 324319, "epoch": 2680} {"train_loss": -41.22310256958008, "global_step": 324320, "epoch": 2680} {"train_loss": -40.21107864379883, "global_step": 324321, "epoch": 2680} {"train_loss": -37.59238815307617, "global_step": 324322, "epoch": 2680} {"train_loss": -39.399864196777344, "global_step": 324323, "epoch": 2680} {"train_loss": -36.33864212036133, "global_step": 324324, "epoch": 2680} {"train_loss": -40.41059494018555, "global_step": 324325, "epoch": 2680} {"train_loss": -7.564601898193359, "global_step": 324326, "epoch": 2680} {"train_loss": -39.89900207519531, "global_step": 324327, "epoch": 2680} {"train_loss": -38.62575912475586, "global_step": 324328, "epoch": 2680} {"train_loss": -37.701229095458984, "global_step": 324329, "epoch": 2680} {"train_loss": -38.026939392089844, "global_step": 324330, "epoch": 2680} {"train_loss": -40.47272491455078, "global_step": 324331, "epoch": 2680} {"train_loss": -28.94720458984375, "global_step": 324332, "epoch": 2680} {"train_loss": -39.346553802490234, "global_step": 324333, "epoch": 2680} {"train_loss": -39.43706130981445, "global_step": 324334, "epoch": 2680} {"train_loss": -39.52392578125, "global_step": 324335, "epoch": 2680} {"train_loss": -38.43862533569336, "global_step": 324336, "epoch": 2680} {"train_loss": -39.29351806640625, "global_step": 324337, "epoch": 2680} {"train_loss": -40.390289306640625, "global_step": 324338, "epoch": 2680} {"train_loss": -40.00442886352539, "global_step": 324339, "epoch": 2680} {"train_loss": -39.58441162109375, "global_step": 324340, "epoch": 2680} {"train_loss": -40.22841262817383, "global_step": 324341, "epoch": 2680} {"train_loss": -39.16229248046875, "global_step": 324342, "epoch": 2680} {"train_loss": -39.79167556762695, "global_step": 324343, "epoch": 2680} {"train_loss": -40.584434509277344, "global_step": 324344, "epoch": 2680} {"train_loss": -38.63199996948242, "global_step": 324345, "epoch": 2680} {"train_loss": -40.3405647277832, "global_step": 324346, "epoch": 2680} {"train_loss": -40.60866928100586, "global_step": 324347, "epoch": 2680} {"train_loss": -40.51171112060547, "global_step": 324348, "epoch": 2680} {"train_loss": -37.014957427978516, "global_step": 324349, "epoch": 2680} {"train_loss": -40.123043060302734, "global_step": 324350, "epoch": 2680} {"train_loss": -40.538387298583984, "global_step": 324351, "epoch": 2680} {"train_loss": -40.52650833129883, "global_step": 324352, "epoch": 2680} {"train_loss": -41.50584030151367, "global_step": 324353, "epoch": 2680} {"train_loss": -40.27656173706055, "global_step": 324354, "epoch": 2680} {"train_loss": -41.5409049987793, "global_step": 324355, "epoch": 2680} {"train_loss": -41.30986022949219, "global_step": 324356, "epoch": 2680} {"train_loss": -39.662960052490234, "global_step": 324357, "epoch": 2680} {"train_loss": -39.04954147338867, "global_step": 324358, "epoch": 2680} {"train_loss": -38.26087951660156, "global_step": 324359, "epoch": 2680} {"train_loss": -40.53414535522461, "global_step": 324360, "epoch": 2680} {"train_loss": -40.859901428222656, "global_step": 324361, "epoch": 2680} {"train_loss": -40.79081344604492, "global_step": 324362, "epoch": 2680} {"train_loss": -40.89028549194336, "global_step": 324363, "epoch": 2680} {"train_loss": -40.75797653198242, "global_step": 324364, "epoch": 2680} {"train_loss": -40.450294494628906, "global_step": 324365, "epoch": 2680} {"train_loss": -41.26322555541992, "global_step": 324366, "epoch": 2680} {"train_loss": -41.4720573425293, "global_step": 324367, "epoch": 2680} {"train_loss": -40.977455139160156, "global_step": 324368, "epoch": 2680} {"train_loss": -40.26738357543945, "global_step": 324369, "epoch": 2680} {"train_loss": -41.22339630126953, "global_step": 324370, "epoch": 2680} {"train_loss": -39.688819885253906, "global_step": 324371, "epoch": 2680} {"train_loss": -38.82563018798828, "global_step": 324372, "epoch": 2680} {"train_loss": -40.50313186645508, "global_step": 324373, "epoch": 2680} {"train_loss": -40.82131576538086, "global_step": 324374, "epoch": 2680} {"train_loss": -40.38508987426758, "global_step": 324375, "epoch": 2680} {"train_loss": -41.10918045043945, "global_step": 324376, "epoch": 2680} {"train_loss": -39.88933181762695, "global_step": 324377, "epoch": 2680} {"train_loss": -41.28855514526367, "global_step": 324378, "epoch": 2680} {"train_loss": -40.84124755859375, "global_step": 324379, "epoch": 2680} {"train_loss": -41.72726821899414, "global_step": 324380, "epoch": 2680} {"train_loss": -41.83230209350586, "global_step": 324381, "epoch": 2680} {"train_loss": -41.222816467285156, "global_step": 324382, "epoch": 2680} {"train_loss": -40.449092864990234, "global_step": 324383, "epoch": 2680} {"train_loss": -40.70907974243164, "global_step": 324384, "epoch": 2680} {"train_loss": -41.71638107299805, "global_step": 324385, "epoch": 2680} {"train_loss": -40.36153793334961, "global_step": 324386, "epoch": 2680} {"train_loss": -41.517765045166016, "global_step": 324387, "epoch": 2680} {"train_loss": -41.2776985168457, "global_step": 324388, "epoch": 2680} {"train_loss": -41.47216796875, "global_step": 324389, "epoch": 2680} {"train_loss": -40.4556770324707, "global_step": 324390, "epoch": 2680} {"train_loss": -41.862789154052734, "global_step": 324391, "epoch": 2680} {"train_loss": -41.792823791503906, "global_step": 324392, "epoch": 2680} {"train_loss": -41.48801803588867, "global_step": 324393, "epoch": 2680} {"train_loss": -41.45125961303711, "global_step": 324394, "epoch": 2680} {"train_loss": -42.54621505737305, "global_step": 324395, "epoch": 2680} {"train_loss": -42.08390426635742, "global_step": 324396, "epoch": 2680} {"train_loss": -41.582054138183594, "global_step": 324397, "epoch": 2680} {"train_loss": -42.14478302001953, "global_step": 324398, "epoch": 2680} {"train_loss": -42.06721878051758, "global_step": 324399, "epoch": 2680} {"train_loss": -39.9150375965213, "global_step": 324400, "epoch": 2680, "val_loss": 2706182.0} {"train_loss": -41.64319610595703, "global_step": 324401, "epoch": 2681} {"train_loss": -41.27226638793945, "global_step": 324402, "epoch": 2681} {"train_loss": -41.456451416015625, "global_step": 324403, "epoch": 2681} {"train_loss": -41.00490951538086, "global_step": 324404, "epoch": 2681} {"train_loss": -41.4802360534668, "global_step": 324405, "epoch": 2681} {"train_loss": -42.67839431762695, "global_step": 324406, "epoch": 2681} {"train_loss": -40.155303955078125, "global_step": 324407, "epoch": 2681} {"train_loss": -41.130859375, "global_step": 324408, "epoch": 2681} {"train_loss": -42.05887222290039, "global_step": 324409, "epoch": 2681} {"train_loss": -40.55007553100586, "global_step": 324410, "epoch": 2681} {"train_loss": -42.316009521484375, "global_step": 324411, "epoch": 2681} {"train_loss": -42.403926849365234, "global_step": 324412, "epoch": 2681} {"train_loss": -42.14360427856445, "global_step": 324413, "epoch": 2681} {"train_loss": -42.77820587158203, "global_step": 324414, "epoch": 2681} {"train_loss": -42.67214584350586, "global_step": 324415, "epoch": 2681} {"train_loss": -42.39714813232422, "global_step": 324416, "epoch": 2681} {"train_loss": -42.80947494506836, "global_step": 324417, "epoch": 2681} {"train_loss": -42.451473236083984, "global_step": 324418, "epoch": 2681} {"train_loss": -42.52410125732422, "global_step": 324419, "epoch": 2681} {"train_loss": -41.47017288208008, "global_step": 324420, "epoch": 2681} {"train_loss": -42.80415344238281, "global_step": 324421, "epoch": 2681} {"train_loss": -40.48072052001953, "global_step": 324422, "epoch": 2681} {"train_loss": -42.402339935302734, "global_step": 324423, "epoch": 2681} {"train_loss": -43.08557891845703, "global_step": 324424, "epoch": 2681} {"train_loss": -42.469539642333984, "global_step": 324425, "epoch": 2681} {"train_loss": -42.81317138671875, "global_step": 324426, "epoch": 2681} {"train_loss": -42.748958587646484, "global_step": 324427, "epoch": 2681} {"train_loss": -41.6274528503418, "global_step": 324428, "epoch": 2681} {"train_loss": -42.577144622802734, "global_step": 324429, "epoch": 2681} {"train_loss": -42.26557540893555, "global_step": 324430, "epoch": 2681} {"train_loss": -40.9113883972168, "global_step": 324431, "epoch": 2681} {"train_loss": -41.788970947265625, "global_step": 324432, "epoch": 2681} {"train_loss": -41.99760818481445, "global_step": 324433, "epoch": 2681} {"train_loss": -42.391212463378906, "global_step": 324434, "epoch": 2681} {"train_loss": -42.023067474365234, "global_step": 324435, "epoch": 2681} {"train_loss": -42.63094711303711, "global_step": 324436, "epoch": 2681} {"train_loss": -42.299747467041016, "global_step": 324437, "epoch": 2681} {"train_loss": -42.45193099975586, "global_step": 324438, "epoch": 2681} {"train_loss": -40.40316390991211, "global_step": 324439, "epoch": 2681} {"train_loss": -43.277584075927734, "global_step": 324440, "epoch": 2681} {"train_loss": -41.5712890625, "global_step": 324441, "epoch": 2681} {"train_loss": -40.7078857421875, "global_step": 324442, "epoch": 2681} {"train_loss": -42.42603302001953, "global_step": 324443, "epoch": 2681} {"train_loss": -42.28338623046875, "global_step": 324444, "epoch": 2681} {"train_loss": -43.130428314208984, "global_step": 324445, "epoch": 2681} {"train_loss": -41.884132385253906, "global_step": 324446, "epoch": 2681} {"train_loss": -41.37699508666992, "global_step": 324447, "epoch": 2681} {"train_loss": -41.76361846923828, "global_step": 324448, "epoch": 2681} {"train_loss": -41.18792724609375, "global_step": 324449, "epoch": 2681} {"train_loss": -43.19374465942383, "global_step": 324450, "epoch": 2681} {"train_loss": -42.05381774902344, "global_step": 324451, "epoch": 2681} {"train_loss": -42.13249206542969, "global_step": 324452, "epoch": 2681} {"train_loss": -41.986793518066406, "global_step": 324453, "epoch": 2681} {"train_loss": -42.9224967956543, "global_step": 324454, "epoch": 2681} {"train_loss": -41.8765983581543, "global_step": 324455, "epoch": 2681} {"train_loss": -39.28737258911133, "global_step": 324456, "epoch": 2681} {"train_loss": -37.36416244506836, "global_step": 324457, "epoch": 2681} {"train_loss": -42.21147155761719, "global_step": 324458, "epoch": 2681} {"train_loss": -42.45606994628906, "global_step": 324459, "epoch": 2681} {"train_loss": -39.661231994628906, "global_step": 324460, "epoch": 2681} {"train_loss": -41.88784408569336, "global_step": 324461, "epoch": 2681} {"train_loss": -41.93549346923828, "global_step": 324462, "epoch": 2681} {"train_loss": -42.30781173706055, "global_step": 324463, "epoch": 2681} {"train_loss": -41.5070686340332, "global_step": 324464, "epoch": 2681} {"train_loss": -41.18031692504883, "global_step": 324465, "epoch": 2681} {"train_loss": -41.178672790527344, "global_step": 324466, "epoch": 2681} {"train_loss": -42.53612518310547, "global_step": 324467, "epoch": 2681} {"train_loss": -42.01572799682617, "global_step": 324468, "epoch": 2681} {"train_loss": -41.37772750854492, "global_step": 324469, "epoch": 2681} {"train_loss": -41.6146240234375, "global_step": 324470, "epoch": 2681} {"train_loss": -40.70620346069336, "global_step": 324471, "epoch": 2681} {"train_loss": -41.70649719238281, "global_step": 324472, "epoch": 2681} {"train_loss": -35.751033782958984, "global_step": 324473, "epoch": 2681} {"train_loss": -42.43333053588867, "global_step": 324474, "epoch": 2681} {"train_loss": -42.31110763549805, "global_step": 324475, "epoch": 2681} {"train_loss": -42.354915618896484, "global_step": 324476, "epoch": 2681} {"train_loss": -41.994598388671875, "global_step": 324477, "epoch": 2681} {"train_loss": -42.5173225402832, "global_step": 324478, "epoch": 2681} {"train_loss": -43.007686614990234, "global_step": 324479, "epoch": 2681} {"train_loss": -42.08113479614258, "global_step": 324480, "epoch": 2681} {"train_loss": -41.975887298583984, "global_step": 324481, "epoch": 2681} {"train_loss": -42.30009078979492, "global_step": 324482, "epoch": 2681} {"train_loss": -42.491703033447266, "global_step": 324483, "epoch": 2681} {"train_loss": -36.952308654785156, "global_step": 324484, "epoch": 2681} {"train_loss": -38.85248565673828, "global_step": 324485, "epoch": 2681} {"train_loss": -42.6030158996582, "global_step": 324486, "epoch": 2681} {"train_loss": -42.61409378051758, "global_step": 324487, "epoch": 2681} {"train_loss": -42.6191520690918, "global_step": 324488, "epoch": 2681} {"train_loss": -43.15996551513672, "global_step": 324489, "epoch": 2681} {"train_loss": -42.28831481933594, "global_step": 324490, "epoch": 2681} {"train_loss": -42.070281982421875, "global_step": 324491, "epoch": 2681} {"train_loss": -42.83612823486328, "global_step": 324492, "epoch": 2681} {"train_loss": -42.56633377075195, "global_step": 324493, "epoch": 2681} {"train_loss": -41.73052978515625, "global_step": 324494, "epoch": 2681} {"train_loss": -42.819156646728516, "global_step": 324495, "epoch": 2681} {"train_loss": -41.39654541015625, "global_step": 324496, "epoch": 2681} {"train_loss": -42.035945892333984, "global_step": 324497, "epoch": 2681} {"train_loss": -42.17434310913086, "global_step": 324498, "epoch": 2681} {"train_loss": -42.83031463623047, "global_step": 324499, "epoch": 2681} {"train_loss": -42.6826057434082, "global_step": 324500, "epoch": 2681} {"train_loss": -42.97066879272461, "global_step": 324501, "epoch": 2681} {"train_loss": -42.28004837036133, "global_step": 324502, "epoch": 2681} {"train_loss": -42.58445358276367, "global_step": 324503, "epoch": 2681} {"train_loss": -43.586692810058594, "global_step": 324504, "epoch": 2681} {"train_loss": -41.9171028137207, "global_step": 324505, "epoch": 2681} {"train_loss": -41.54555130004883, "global_step": 324506, "epoch": 2681} {"train_loss": -37.055660247802734, "global_step": 324507, "epoch": 2681} {"train_loss": -39.65593719482422, "global_step": 324508, "epoch": 2681} {"train_loss": -40.10454177856445, "global_step": 324509, "epoch": 2681} {"train_loss": -42.744388580322266, "global_step": 324510, "epoch": 2681} {"train_loss": -43.14786911010742, "global_step": 324511, "epoch": 2681} {"train_loss": -41.692134857177734, "global_step": 324512, "epoch": 2681} {"train_loss": -41.136531829833984, "global_step": 324513, "epoch": 2681} {"train_loss": -42.4481315612793, "global_step": 324514, "epoch": 2681} {"train_loss": -35.053524017333984, "global_step": 324515, "epoch": 2681} {"train_loss": -41.374916076660156, "global_step": 324516, "epoch": 2681} {"train_loss": -41.665645599365234, "global_step": 324517, "epoch": 2681} {"train_loss": -41.82047653198242, "global_step": 324518, "epoch": 2681} {"train_loss": -43.017601013183594, "global_step": 324519, "epoch": 2681} {"train_loss": -41.08957290649414, "global_step": 324520, "epoch": 2681} {"train_loss": -41.72869955015577, "global_step": 324521, "epoch": 2681, "val_loss": 2640368.25} {"train_loss": -42.3470458984375, "global_step": 324522, "epoch": 2682} {"train_loss": -42.43629837036133, "global_step": 324523, "epoch": 2682} {"train_loss": -41.751888275146484, "global_step": 324524, "epoch": 2682} {"train_loss": -40.95859909057617, "global_step": 324525, "epoch": 2682} {"train_loss": -40.79562759399414, "global_step": 324526, "epoch": 2682} {"train_loss": -42.107906341552734, "global_step": 324527, "epoch": 2682} {"train_loss": -41.6661491394043, "global_step": 324528, "epoch": 2682} {"train_loss": -42.709869384765625, "global_step": 324529, "epoch": 2682} {"train_loss": -40.16675567626953, "global_step": 324530, "epoch": 2682} {"train_loss": -39.54623794555664, "global_step": 324531, "epoch": 2682} {"train_loss": -42.33206558227539, "global_step": 324532, "epoch": 2682} {"train_loss": -41.73234939575195, "global_step": 324533, "epoch": 2682} {"train_loss": -42.482444763183594, "global_step": 324534, "epoch": 2682} {"train_loss": -39.16565704345703, "global_step": 324535, "epoch": 2682} {"train_loss": -40.54553985595703, "global_step": 324536, "epoch": 2682} {"train_loss": -36.61977005004883, "global_step": 324537, "epoch": 2682} {"train_loss": -41.63918685913086, "global_step": 324538, "epoch": 2682} {"train_loss": -39.39689254760742, "global_step": 324539, "epoch": 2682} {"train_loss": -41.642913818359375, "global_step": 324540, "epoch": 2682} {"train_loss": -41.25282669067383, "global_step": 324541, "epoch": 2682} {"train_loss": -41.054744720458984, "global_step": 324542, "epoch": 2682} {"train_loss": -42.208187103271484, "global_step": 324543, "epoch": 2682} {"train_loss": -41.901302337646484, "global_step": 324544, "epoch": 2682} {"train_loss": -40.69015121459961, "global_step": 324545, "epoch": 2682} {"train_loss": -42.27947998046875, "global_step": 324546, "epoch": 2682} {"train_loss": -41.784000396728516, "global_step": 324547, "epoch": 2682} {"train_loss": -42.26740264892578, "global_step": 324548, "epoch": 2682} {"train_loss": -42.57796096801758, "global_step": 324549, "epoch": 2682} {"train_loss": -41.636436462402344, "global_step": 324550, "epoch": 2682} {"train_loss": -40.486690521240234, "global_step": 324551, "epoch": 2682} {"train_loss": -41.59540939331055, "global_step": 324552, "epoch": 2682} {"train_loss": -40.2073974609375, "global_step": 324553, "epoch": 2682} {"train_loss": -40.98939514160156, "global_step": 324554, "epoch": 2682} {"train_loss": -41.50791549682617, "global_step": 324555, "epoch": 2682} {"train_loss": -40.58099365234375, "global_step": 324556, "epoch": 2682} {"train_loss": -41.23775863647461, "global_step": 324557, "epoch": 2682} {"train_loss": -42.24372482299805, "global_step": 324558, "epoch": 2682} {"train_loss": -41.98667526245117, "global_step": 324559, "epoch": 2682} {"train_loss": -40.76152038574219, "global_step": 324560, "epoch": 2682} {"train_loss": -41.163787841796875, "global_step": 324561, "epoch": 2682} {"train_loss": -41.48603439331055, "global_step": 324562, "epoch": 2682} {"train_loss": -41.58689498901367, "global_step": 324563, "epoch": 2682} {"train_loss": -41.611541748046875, "global_step": 324564, "epoch": 2682} {"train_loss": -41.49170684814453, "global_step": 324565, "epoch": 2682} {"train_loss": -42.10353469848633, "global_step": 324566, "epoch": 2682} {"train_loss": -42.30186080932617, "global_step": 324567, "epoch": 2682} {"train_loss": -42.41695785522461, "global_step": 324568, "epoch": 2682} {"train_loss": -41.360652923583984, "global_step": 324569, "epoch": 2682} {"train_loss": -41.31370162963867, "global_step": 324570, "epoch": 2682} {"train_loss": -42.287635803222656, "global_step": 324571, "epoch": 2682} {"train_loss": -42.09333038330078, "global_step": 324572, "epoch": 2682} {"train_loss": -41.35895538330078, "global_step": 324573, "epoch": 2682} {"train_loss": -41.96528244018555, "global_step": 324574, "epoch": 2682} {"train_loss": -42.41710662841797, "global_step": 324575, "epoch": 2682} {"train_loss": -42.944034576416016, "global_step": 324576, "epoch": 2682} {"train_loss": -42.531856536865234, "global_step": 324577, "epoch": 2682} {"train_loss": -42.23645782470703, "global_step": 324578, "epoch": 2682} {"train_loss": -42.15983963012695, "global_step": 324579, "epoch": 2682} {"train_loss": -40.925140380859375, "global_step": 324580, "epoch": 2682} {"train_loss": -41.92666244506836, "global_step": 324581, "epoch": 2682} {"train_loss": -41.63357162475586, "global_step": 324582, "epoch": 2682} {"train_loss": -42.083961486816406, "global_step": 324583, "epoch": 2682} {"train_loss": -43.166038513183594, "global_step": 324584, "epoch": 2682} {"train_loss": -42.12935256958008, "global_step": 324585, "epoch": 2682} {"train_loss": -42.46477127075195, "global_step": 324586, "epoch": 2682} {"train_loss": -42.039363861083984, "global_step": 324587, "epoch": 2682} {"train_loss": -42.48928451538086, "global_step": 324588, "epoch": 2682} {"train_loss": -42.74116134643555, "global_step": 324589, "epoch": 2682} {"train_loss": -41.80255126953125, "global_step": 324590, "epoch": 2682} {"train_loss": -42.7895393371582, "global_step": 324591, "epoch": 2682} {"train_loss": -42.31717300415039, "global_step": 324592, "epoch": 2682} {"train_loss": -43.28630828857422, "global_step": 324593, "epoch": 2682} {"train_loss": -42.55601119995117, "global_step": 324594, "epoch": 2682} {"train_loss": -43.04313659667969, "global_step": 324595, "epoch": 2682} {"train_loss": -43.427486419677734, "global_step": 324596, "epoch": 2682} {"train_loss": -42.67631149291992, "global_step": 324597, "epoch": 2682} {"train_loss": -42.6107292175293, "global_step": 324598, "epoch": 2682} {"train_loss": -42.035926818847656, "global_step": 324599, "epoch": 2682} {"train_loss": -41.21181106567383, "global_step": 324600, "epoch": 2682} {"train_loss": -41.45874786376953, "global_step": 324601, "epoch": 2682} {"train_loss": -42.63246154785156, "global_step": 324602, "epoch": 2682} {"train_loss": -42.637081146240234, "global_step": 324603, "epoch": 2682} {"train_loss": -40.01920700073242, "global_step": 324604, "epoch": 2682} {"train_loss": -41.804420471191406, "global_step": 324605, "epoch": 2682} {"train_loss": -43.03529739379883, "global_step": 324606, "epoch": 2682} {"train_loss": -42.7740592956543, "global_step": 324607, "epoch": 2682} {"train_loss": -41.3277702331543, "global_step": 324608, "epoch": 2682} {"train_loss": -36.400611877441406, "global_step": 324609, "epoch": 2682} {"train_loss": -41.42152786254883, "global_step": 324610, "epoch": 2682} {"train_loss": -42.17796325683594, "global_step": 324611, "epoch": 2682} {"train_loss": -41.68363571166992, "global_step": 324612, "epoch": 2682} {"train_loss": -42.32936096191406, "global_step": 324613, "epoch": 2682} {"train_loss": -39.701541900634766, "global_step": 324614, "epoch": 2682} {"train_loss": -41.84066390991211, "global_step": 324615, "epoch": 2682} {"train_loss": -40.733341217041016, "global_step": 324616, "epoch": 2682} {"train_loss": -41.36605453491211, "global_step": 324617, "epoch": 2682} {"train_loss": -40.64253616333008, "global_step": 324618, "epoch": 2682} {"train_loss": -41.959163665771484, "global_step": 324619, "epoch": 2682} {"train_loss": -42.2010498046875, "global_step": 324620, "epoch": 2682} {"train_loss": -40.289485931396484, "global_step": 324621, "epoch": 2682} {"train_loss": -40.997528076171875, "global_step": 324622, "epoch": 2682} {"train_loss": -41.8582649230957, "global_step": 324623, "epoch": 2682} {"train_loss": -40.40882110595703, "global_step": 324624, "epoch": 2682} {"train_loss": -41.31675338745117, "global_step": 324625, "epoch": 2682} {"train_loss": -41.155029296875, "global_step": 324626, "epoch": 2682} {"train_loss": -42.58634948730469, "global_step": 324627, "epoch": 2682} {"train_loss": -42.3525276184082, "global_step": 324628, "epoch": 2682} {"train_loss": -39.9318733215332, "global_step": 324629, "epoch": 2682} {"train_loss": -42.81279754638672, "global_step": 324630, "epoch": 2682} {"train_loss": -41.52996826171875, "global_step": 324631, "epoch": 2682} {"train_loss": -41.972694396972656, "global_step": 324632, "epoch": 2682} {"train_loss": -42.94306182861328, "global_step": 324633, "epoch": 2682} {"train_loss": -41.65336227416992, "global_step": 324634, "epoch": 2682} {"train_loss": -41.92133712768555, "global_step": 324635, "epoch": 2682} {"train_loss": -42.24845504760742, "global_step": 324636, "epoch": 2682} {"train_loss": -42.23004150390625, "global_step": 324637, "epoch": 2682} {"train_loss": -42.578269958496094, "global_step": 324638, "epoch": 2682} {"train_loss": -41.855384826660156, "global_step": 324639, "epoch": 2682} {"train_loss": -43.02768325805664, "global_step": 324640, "epoch": 2682} {"train_loss": -43.33995819091797, "global_step": 324641, "epoch": 2682} {"train_loss": -41.670577656139024, "global_step": 324642, "epoch": 2682, "val_loss": 2683978.0} {"train_loss": -41.609920501708984, "global_step": 324643, "epoch": 2683} {"train_loss": -42.97896957397461, "global_step": 324644, "epoch": 2683} {"train_loss": -42.74433135986328, "global_step": 324645, "epoch": 2683} {"train_loss": -41.71113204956055, "global_step": 324646, "epoch": 2683} {"train_loss": -42.10525131225586, "global_step": 324647, "epoch": 2683} {"train_loss": -42.419620513916016, "global_step": 324648, "epoch": 2683} {"train_loss": -42.5533332824707, "global_step": 324649, "epoch": 2683} {"train_loss": -42.868038177490234, "global_step": 324650, "epoch": 2683} {"train_loss": -41.70472717285156, "global_step": 324651, "epoch": 2683} {"train_loss": -42.485565185546875, "global_step": 324652, "epoch": 2683} {"train_loss": -42.85089874267578, "global_step": 324653, "epoch": 2683} {"train_loss": -42.72648239135742, "global_step": 324654, "epoch": 2683} {"train_loss": -41.97791290283203, "global_step": 324655, "epoch": 2683} {"train_loss": -40.467529296875, "global_step": 324656, "epoch": 2683} {"train_loss": -41.119869232177734, "global_step": 324657, "epoch": 2683} {"train_loss": -42.03635025024414, "global_step": 324658, "epoch": 2683} {"train_loss": -41.92412185668945, "global_step": 324659, "epoch": 2683} {"train_loss": -42.859188079833984, "global_step": 324660, "epoch": 2683} {"train_loss": -40.5853385925293, "global_step": 324661, "epoch": 2683} {"train_loss": -41.71138381958008, "global_step": 324662, "epoch": 2683} {"train_loss": -42.35839080810547, "global_step": 324663, "epoch": 2683} {"train_loss": -42.26224899291992, "global_step": 324664, "epoch": 2683} {"train_loss": -42.48081970214844, "global_step": 324665, "epoch": 2683} {"train_loss": -41.1080436706543, "global_step": 324666, "epoch": 2683} {"train_loss": -40.53913116455078, "global_step": 324667, "epoch": 2683} {"train_loss": -40.19919967651367, "global_step": 324668, "epoch": 2683} {"train_loss": -40.63248825073242, "global_step": 324669, "epoch": 2683} {"train_loss": -41.137691497802734, "global_step": 324670, "epoch": 2683} {"train_loss": -40.596492767333984, "global_step": 324671, "epoch": 2683} {"train_loss": -42.42761993408203, "global_step": 324672, "epoch": 2683} {"train_loss": -42.15735626220703, "global_step": 324673, "epoch": 2683} {"train_loss": -41.6807861328125, "global_step": 324674, "epoch": 2683} {"train_loss": -42.125579833984375, "global_step": 324675, "epoch": 2683} {"train_loss": -41.29595184326172, "global_step": 324676, "epoch": 2683} {"train_loss": -39.91844177246094, "global_step": 324677, "epoch": 2683} {"train_loss": -42.6839599609375, "global_step": 324678, "epoch": 2683} {"train_loss": -42.30855941772461, "global_step": 324679, "epoch": 2683} {"train_loss": -40.77605438232422, "global_step": 324680, "epoch": 2683} {"train_loss": -40.72591781616211, "global_step": 324681, "epoch": 2683} {"train_loss": -42.68905258178711, "global_step": 324682, "epoch": 2683} {"train_loss": -41.155487060546875, "global_step": 324683, "epoch": 2683} {"train_loss": -41.604515075683594, "global_step": 324684, "epoch": 2683} {"train_loss": -41.763343811035156, "global_step": 324685, "epoch": 2683} {"train_loss": -41.99203109741211, "global_step": 324686, "epoch": 2683} {"train_loss": -42.09104537963867, "global_step": 324687, "epoch": 2683} {"train_loss": -41.761714935302734, "global_step": 324688, "epoch": 2683} {"train_loss": -41.29218292236328, "global_step": 324689, "epoch": 2683} {"train_loss": -41.41410446166992, "global_step": 324690, "epoch": 2683} {"train_loss": -42.215999603271484, "global_step": 324691, "epoch": 2683} {"train_loss": -41.75588607788086, "global_step": 324692, "epoch": 2683} {"train_loss": -41.61346435546875, "global_step": 324693, "epoch": 2683} {"train_loss": -41.00328063964844, "global_step": 324694, "epoch": 2683} {"train_loss": -43.269710540771484, "global_step": 324695, "epoch": 2683} {"train_loss": -39.87725830078125, "global_step": 324696, "epoch": 2683} {"train_loss": -42.11315155029297, "global_step": 324697, "epoch": 2683} {"train_loss": -40.299190521240234, "global_step": 324698, "epoch": 2683} {"train_loss": -42.060455322265625, "global_step": 324699, "epoch": 2683} {"train_loss": -39.27570343017578, "global_step": 324700, "epoch": 2683} {"train_loss": -42.22841262817383, "global_step": 324701, "epoch": 2683} {"train_loss": -37.561683654785156, "global_step": 324702, "epoch": 2683} {"train_loss": -40.616695404052734, "global_step": 324703, "epoch": 2683} {"train_loss": -41.4144287109375, "global_step": 324704, "epoch": 2683} {"train_loss": -41.04607009887695, "global_step": 324705, "epoch": 2683} {"train_loss": -40.3538818359375, "global_step": 324706, "epoch": 2683} {"train_loss": -42.10720443725586, "global_step": 324707, "epoch": 2683} {"train_loss": -41.26124954223633, "global_step": 324708, "epoch": 2683} {"train_loss": -40.51526641845703, "global_step": 324709, "epoch": 2683} {"train_loss": -40.94026184082031, "global_step": 324710, "epoch": 2683} {"train_loss": -40.626346588134766, "global_step": 324711, "epoch": 2683} {"train_loss": -40.12346267700195, "global_step": 324712, "epoch": 2683} {"train_loss": -41.39213943481445, "global_step": 324713, "epoch": 2683} {"train_loss": -42.18952560424805, "global_step": 324714, "epoch": 2683} {"train_loss": -41.261722564697266, "global_step": 324715, "epoch": 2683} {"train_loss": -32.744937896728516, "global_step": 324716, "epoch": 2683} {"train_loss": -41.2529411315918, "global_step": 324717, "epoch": 2683} {"train_loss": -39.36656951904297, "global_step": 324718, "epoch": 2683} {"train_loss": -42.426631927490234, "global_step": 324719, "epoch": 2683} {"train_loss": -41.209922790527344, "global_step": 324720, "epoch": 2683} {"train_loss": -41.220123291015625, "global_step": 324721, "epoch": 2683} {"train_loss": -41.568077087402344, "global_step": 324722, "epoch": 2683} {"train_loss": -41.30857467651367, "global_step": 324723, "epoch": 2683} {"train_loss": -42.04999923706055, "global_step": 324724, "epoch": 2683} {"train_loss": -40.683837890625, "global_step": 324725, "epoch": 2683} {"train_loss": -35.9257926940918, "global_step": 324726, "epoch": 2683} {"train_loss": -40.63877868652344, "global_step": 324727, "epoch": 2683} {"train_loss": -38.94357681274414, "global_step": 324728, "epoch": 2683} {"train_loss": -41.23629379272461, "global_step": 324729, "epoch": 2683} {"train_loss": -41.2961311340332, "global_step": 324730, "epoch": 2683} {"train_loss": -41.161617279052734, "global_step": 324731, "epoch": 2683} {"train_loss": -40.69218063354492, "global_step": 324732, "epoch": 2683} {"train_loss": -38.66426467895508, "global_step": 324733, "epoch": 2683} {"train_loss": -41.27433776855469, "global_step": 324734, "epoch": 2683} {"train_loss": -42.247432708740234, "global_step": 324735, "epoch": 2683} {"train_loss": -40.93754196166992, "global_step": 324736, "epoch": 2683} {"train_loss": -42.5679931640625, "global_step": 324737, "epoch": 2683} {"train_loss": -42.54578399658203, "global_step": 324738, "epoch": 2683} {"train_loss": -41.839603424072266, "global_step": 324739, "epoch": 2683} {"train_loss": -39.23318099975586, "global_step": 324740, "epoch": 2683} {"train_loss": -42.61637496948242, "global_step": 324741, "epoch": 2683} {"train_loss": -39.53143310546875, "global_step": 324742, "epoch": 2683} {"train_loss": -40.68074417114258, "global_step": 324743, "epoch": 2683} {"train_loss": -41.2457160949707, "global_step": 324744, "epoch": 2683} {"train_loss": -40.4296875, "global_step": 324745, "epoch": 2683} {"train_loss": -39.88045883178711, "global_step": 324746, "epoch": 2683} {"train_loss": -41.709442138671875, "global_step": 324747, "epoch": 2683} {"train_loss": -42.0555534362793, "global_step": 324748, "epoch": 2683} {"train_loss": -41.82625198364258, "global_step": 324749, "epoch": 2683} {"train_loss": -39.87557601928711, "global_step": 324750, "epoch": 2683} {"train_loss": -41.194847106933594, "global_step": 324751, "epoch": 2683} {"train_loss": -40.372100830078125, "global_step": 324752, "epoch": 2683} {"train_loss": -42.1290283203125, "global_step": 324753, "epoch": 2683} {"train_loss": -40.87363815307617, "global_step": 324754, "epoch": 2683} {"train_loss": -42.70467758178711, "global_step": 324755, "epoch": 2683} {"train_loss": -42.251808166503906, "global_step": 324756, "epoch": 2683} {"train_loss": -41.16926193237305, "global_step": 324757, "epoch": 2683} {"train_loss": -40.39766311645508, "global_step": 324758, "epoch": 2683} {"train_loss": -42.348060607910156, "global_step": 324759, "epoch": 2683} {"train_loss": -41.77015686035156, "global_step": 324760, "epoch": 2683} {"train_loss": -42.54736328125, "global_step": 324761, "epoch": 2683} {"train_loss": -42.87993240356445, "global_step": 324762, "epoch": 2683} {"train_loss": -41.2936107856183, "global_step": 324763, "epoch": 2683, "val_loss": 2653753.75} {"train_loss": -43.14915466308594, "global_step": 324764, "epoch": 2684} {"train_loss": -42.477657318115234, "global_step": 324765, "epoch": 2684} {"train_loss": -41.0730094909668, "global_step": 324766, "epoch": 2684} {"train_loss": -42.565425872802734, "global_step": 324767, "epoch": 2684} {"train_loss": -42.55166244506836, "global_step": 324768, "epoch": 2684} {"train_loss": -42.656436920166016, "global_step": 324769, "epoch": 2684} {"train_loss": -41.14014434814453, "global_step": 324770, "epoch": 2684} {"train_loss": -42.90007400512695, "global_step": 324771, "epoch": 2684} {"train_loss": -42.52975082397461, "global_step": 324772, "epoch": 2684} {"train_loss": -41.8279914855957, "global_step": 324773, "epoch": 2684} {"train_loss": -42.8245849609375, "global_step": 324774, "epoch": 2684} {"train_loss": -42.388641357421875, "global_step": 324775, "epoch": 2684} {"train_loss": -43.0815544128418, "global_step": 324776, "epoch": 2684} {"train_loss": -42.43648147583008, "global_step": 324777, "epoch": 2684} {"train_loss": -42.8377799987793, "global_step": 324778, "epoch": 2684} {"train_loss": -41.90219497680664, "global_step": 324779, "epoch": 2684} {"train_loss": -41.76021194458008, "global_step": 324780, "epoch": 2684} {"train_loss": -41.33870315551758, "global_step": 324781, "epoch": 2684} {"train_loss": -42.67867660522461, "global_step": 324782, "epoch": 2684} {"train_loss": -43.08911895751953, "global_step": 324783, "epoch": 2684} {"train_loss": -42.85798645019531, "global_step": 324784, "epoch": 2684} {"train_loss": -42.78347396850586, "global_step": 324785, "epoch": 2684} {"train_loss": -42.04182052612305, "global_step": 324786, "epoch": 2684} {"train_loss": -43.17399978637695, "global_step": 324787, "epoch": 2684} {"train_loss": -43.48311233520508, "global_step": 324788, "epoch": 2684} {"train_loss": -42.632137298583984, "global_step": 324789, "epoch": 2684} {"train_loss": -43.150020599365234, "global_step": 324790, "epoch": 2684} {"train_loss": -41.8643798828125, "global_step": 324791, "epoch": 2684} {"train_loss": -42.84829330444336, "global_step": 324792, "epoch": 2684} {"train_loss": -43.190303802490234, "global_step": 324793, "epoch": 2684} {"train_loss": -43.1998176574707, "global_step": 324794, "epoch": 2684} {"train_loss": -43.166072845458984, "global_step": 324795, "epoch": 2684} {"train_loss": -43.10931396484375, "global_step": 324796, "epoch": 2684} {"train_loss": -42.40414047241211, "global_step": 324797, "epoch": 2684} {"train_loss": -43.404205322265625, "global_step": 324798, "epoch": 2684} {"train_loss": -43.655609130859375, "global_step": 324799, "epoch": 2684} {"train_loss": -43.43215560913086, "global_step": 324800, "epoch": 2684} {"train_loss": -43.45784378051758, "global_step": 324801, "epoch": 2684} {"train_loss": -42.640357971191406, "global_step": 324802, "epoch": 2684} {"train_loss": -42.5172119140625, "global_step": 324803, "epoch": 2684} {"train_loss": -42.64992904663086, "global_step": 324804, "epoch": 2684} {"train_loss": -43.45965576171875, "global_step": 324805, "epoch": 2684} {"train_loss": -41.914695739746094, "global_step": 324806, "epoch": 2684} {"train_loss": -41.10968780517578, "global_step": 324807, "epoch": 2684} {"train_loss": -43.150848388671875, "global_step": 324808, "epoch": 2684} {"train_loss": -42.55419158935547, "global_step": 324809, "epoch": 2684} {"train_loss": -42.41548156738281, "global_step": 324810, "epoch": 2684} {"train_loss": -42.105384826660156, "global_step": 324811, "epoch": 2684} {"train_loss": -42.681941986083984, "global_step": 324812, "epoch": 2684} {"train_loss": -42.35574722290039, "global_step": 324813, "epoch": 2684} {"train_loss": -42.28581619262695, "global_step": 324814, "epoch": 2684} {"train_loss": -43.323238372802734, "global_step": 324815, "epoch": 2684} {"train_loss": -40.15519332885742, "global_step": 324816, "epoch": 2684} {"train_loss": -42.72860336303711, "global_step": 324817, "epoch": 2684} {"train_loss": -42.5394287109375, "global_step": 324818, "epoch": 2684} {"train_loss": -43.4789924621582, "global_step": 324819, "epoch": 2684} {"train_loss": -43.36680603027344, "global_step": 324820, "epoch": 2684} {"train_loss": -43.462867736816406, "global_step": 324821, "epoch": 2684} {"train_loss": -42.50602340698242, "global_step": 324822, "epoch": 2684} {"train_loss": -42.6287956237793, "global_step": 324823, "epoch": 2684} {"train_loss": -40.651119232177734, "global_step": 324824, "epoch": 2684} {"train_loss": -42.20471954345703, "global_step": 324825, "epoch": 2684} {"train_loss": -42.276981353759766, "global_step": 324826, "epoch": 2684} {"train_loss": -38.8180046081543, "global_step": 324827, "epoch": 2684} {"train_loss": -40.98994064331055, "global_step": 324828, "epoch": 2684} {"train_loss": -40.10100173950195, "global_step": 324829, "epoch": 2684} {"train_loss": -36.576995849609375, "global_step": 324830, "epoch": 2684} {"train_loss": -36.122554779052734, "global_step": 324831, "epoch": 2684} {"train_loss": -38.1093864440918, "global_step": 324832, "epoch": 2684} {"train_loss": -41.79168701171875, "global_step": 324833, "epoch": 2684} {"train_loss": -39.61036682128906, "global_step": 324834, "epoch": 2684} {"train_loss": -39.924800872802734, "global_step": 324835, "epoch": 2684} {"train_loss": -37.4013557434082, "global_step": 324836, "epoch": 2684} {"train_loss": -40.055816650390625, "global_step": 324837, "epoch": 2684} {"train_loss": -39.87898635864258, "global_step": 324838, "epoch": 2684} {"train_loss": -39.73499298095703, "global_step": 324839, "epoch": 2684} {"train_loss": -42.511783599853516, "global_step": 324840, "epoch": 2684} {"train_loss": -39.29604721069336, "global_step": 324841, "epoch": 2684} {"train_loss": -41.08091735839844, "global_step": 324842, "epoch": 2684} {"train_loss": -38.78431701660156, "global_step": 324843, "epoch": 2684} {"train_loss": -41.16295623779297, "global_step": 324844, "epoch": 2684} {"train_loss": -42.436275482177734, "global_step": 324845, "epoch": 2684} {"train_loss": -41.026710510253906, "global_step": 324846, "epoch": 2684} {"train_loss": -39.85862350463867, "global_step": 324847, "epoch": 2684} {"train_loss": -41.2963752746582, "global_step": 324848, "epoch": 2684} {"train_loss": -42.9527587890625, "global_step": 324849, "epoch": 2684} {"train_loss": -41.670955657958984, "global_step": 324850, "epoch": 2684} {"train_loss": -41.64023971557617, "global_step": 324851, "epoch": 2684} {"train_loss": -41.22016525268555, "global_step": 324852, "epoch": 2684} {"train_loss": -42.28835678100586, "global_step": 324853, "epoch": 2684} {"train_loss": -42.02766418457031, "global_step": 324854, "epoch": 2684} {"train_loss": -42.55068588256836, "global_step": 324855, "epoch": 2684} {"train_loss": -42.16194534301758, "global_step": 324856, "epoch": 2684} {"train_loss": -42.26630783081055, "global_step": 324857, "epoch": 2684} {"train_loss": -41.7637939453125, "global_step": 324858, "epoch": 2684} {"train_loss": -42.605098724365234, "global_step": 324859, "epoch": 2684} {"train_loss": -42.205867767333984, "global_step": 324860, "epoch": 2684} {"train_loss": -42.76869201660156, "global_step": 324861, "epoch": 2684} {"train_loss": -42.764373779296875, "global_step": 324862, "epoch": 2684} {"train_loss": -42.59352493286133, "global_step": 324863, "epoch": 2684} {"train_loss": -42.7946662902832, "global_step": 324864, "epoch": 2684} {"train_loss": -41.290000915527344, "global_step": 324865, "epoch": 2684} {"train_loss": -42.95943069458008, "global_step": 324866, "epoch": 2684} {"train_loss": -42.954017639160156, "global_step": 324867, "epoch": 2684} {"train_loss": -40.607723236083984, "global_step": 324868, "epoch": 2684} {"train_loss": -42.40015411376953, "global_step": 324869, "epoch": 2684} {"train_loss": -42.10367965698242, "global_step": 324870, "epoch": 2684} {"train_loss": -41.9978141784668, "global_step": 324871, "epoch": 2684} {"train_loss": -42.790260314941406, "global_step": 324872, "epoch": 2684} {"train_loss": -42.47756576538086, "global_step": 324873, "epoch": 2684} {"train_loss": -42.56545639038086, "global_step": 324874, "epoch": 2684} {"train_loss": -42.77352523803711, "global_step": 324875, "epoch": 2684} {"train_loss": -43.070796966552734, "global_step": 324876, "epoch": 2684} {"train_loss": -43.10698318481445, "global_step": 324877, "epoch": 2684} {"train_loss": -42.69485855102539, "global_step": 324878, "epoch": 2684} {"train_loss": -42.56251907348633, "global_step": 324879, "epoch": 2684} {"train_loss": -43.40475845336914, "global_step": 324880, "epoch": 2684} {"train_loss": -42.357547760009766, "global_step": 324881, "epoch": 2684} {"train_loss": -38.234161376953125, "global_step": 324882, "epoch": 2684} {"train_loss": -41.76677322387695, "global_step": 324883, "epoch": 2684} {"train_loss": -41.98472998753067, "global_step": 324884, "epoch": 2684, "val_loss": 2657076.5} {"train_loss": -42.197078704833984, "global_step": 324885, "epoch": 2685} {"train_loss": -43.02183532714844, "global_step": 324886, "epoch": 2685} {"train_loss": -41.28784942626953, "global_step": 324887, "epoch": 2685} {"train_loss": -43.82041549682617, "global_step": 324888, "epoch": 2685} {"train_loss": -38.77933120727539, "global_step": 324889, "epoch": 2685} {"train_loss": -42.553443908691406, "global_step": 324890, "epoch": 2685} {"train_loss": -42.191856384277344, "global_step": 324891, "epoch": 2685} {"train_loss": -38.6434326171875, "global_step": 324892, "epoch": 2685} {"train_loss": -39.80472946166992, "global_step": 324893, "epoch": 2685} {"train_loss": -41.44034957885742, "global_step": 324894, "epoch": 2685} {"train_loss": -41.39419174194336, "global_step": 324895, "epoch": 2685} {"train_loss": -40.09652328491211, "global_step": 324896, "epoch": 2685} {"train_loss": -41.73696517944336, "global_step": 324897, "epoch": 2685} {"train_loss": -42.429073333740234, "global_step": 324898, "epoch": 2685} {"train_loss": -41.961097717285156, "global_step": 324899, "epoch": 2685} {"train_loss": -42.63204574584961, "global_step": 324900, "epoch": 2685} {"train_loss": -41.5892333984375, "global_step": 324901, "epoch": 2685} {"train_loss": -42.230342864990234, "global_step": 324902, "epoch": 2685} {"train_loss": -40.87727737426758, "global_step": 324903, "epoch": 2685} {"train_loss": -41.93022155761719, "global_step": 324904, "epoch": 2685} {"train_loss": -41.8748779296875, "global_step": 324905, "epoch": 2685} {"train_loss": -41.91417694091797, "global_step": 324906, "epoch": 2685} {"train_loss": -42.216705322265625, "global_step": 324907, "epoch": 2685} {"train_loss": -41.413414001464844, "global_step": 324908, "epoch": 2685} {"train_loss": -43.09074020385742, "global_step": 324909, "epoch": 2685} {"train_loss": -43.00679016113281, "global_step": 324910, "epoch": 2685} {"train_loss": -41.33412170410156, "global_step": 324911, "epoch": 2685} {"train_loss": -41.28347396850586, "global_step": 324912, "epoch": 2685} {"train_loss": -41.24182891845703, "global_step": 324913, "epoch": 2685} {"train_loss": -42.14265060424805, "global_step": 324914, "epoch": 2685} {"train_loss": -42.289588928222656, "global_step": 324915, "epoch": 2685} {"train_loss": -43.43600082397461, "global_step": 324916, "epoch": 2685} {"train_loss": -43.18570327758789, "global_step": 324917, "epoch": 2685} {"train_loss": -41.49092483520508, "global_step": 324918, "epoch": 2685} {"train_loss": -42.96860885620117, "global_step": 324919, "epoch": 2685} {"train_loss": -41.54332733154297, "global_step": 324920, "epoch": 2685} {"train_loss": -42.727012634277344, "global_step": 324921, "epoch": 2685} {"train_loss": -42.08837890625, "global_step": 324922, "epoch": 2685} {"train_loss": -42.35996627807617, "global_step": 324923, "epoch": 2685} {"train_loss": -42.810420989990234, "global_step": 324924, "epoch": 2685} {"train_loss": -43.43864059448242, "global_step": 324925, "epoch": 2685} {"train_loss": -42.89902877807617, "global_step": 324926, "epoch": 2685} {"train_loss": -43.07832336425781, "global_step": 324927, "epoch": 2685} {"train_loss": -42.86930465698242, "global_step": 324928, "epoch": 2685} {"train_loss": -42.77296447753906, "global_step": 324929, "epoch": 2685} {"train_loss": -43.641937255859375, "global_step": 324930, "epoch": 2685} {"train_loss": -41.75157165527344, "global_step": 324931, "epoch": 2685} {"train_loss": -41.55036544799805, "global_step": 324932, "epoch": 2685} {"train_loss": -42.263458251953125, "global_step": 324933, "epoch": 2685} {"train_loss": -42.7963981628418, "global_step": 324934, "epoch": 2685} {"train_loss": -43.28815460205078, "global_step": 324935, "epoch": 2685} {"train_loss": -42.7639045715332, "global_step": 324936, "epoch": 2685} {"train_loss": -43.173526763916016, "global_step": 324937, "epoch": 2685} {"train_loss": -43.26632308959961, "global_step": 324938, "epoch": 2685} {"train_loss": -42.61310577392578, "global_step": 324939, "epoch": 2685} {"train_loss": -42.57621383666992, "global_step": 324940, "epoch": 2685} {"train_loss": -42.95450973510742, "global_step": 324941, "epoch": 2685} {"train_loss": -43.0447883605957, "global_step": 324942, "epoch": 2685} {"train_loss": -42.900062561035156, "global_step": 324943, "epoch": 2685} {"train_loss": -42.5999755859375, "global_step": 324944, "epoch": 2685} {"train_loss": -41.36145782470703, "global_step": 324945, "epoch": 2685} {"train_loss": -42.91972732543945, "global_step": 324946, "epoch": 2685} {"train_loss": -41.466060638427734, "global_step": 324947, "epoch": 2685} {"train_loss": -43.156646728515625, "global_step": 324948, "epoch": 2685} {"train_loss": -43.276363372802734, "global_step": 324949, "epoch": 2685} {"train_loss": -42.42736053466797, "global_step": 324950, "epoch": 2685} {"train_loss": -43.897804260253906, "global_step": 324951, "epoch": 2685} {"train_loss": -41.99211502075195, "global_step": 324952, "epoch": 2685} {"train_loss": -41.90690231323242, "global_step": 324953, "epoch": 2685} {"train_loss": -43.3624267578125, "global_step": 324954, "epoch": 2685} {"train_loss": -42.83723068237305, "global_step": 324955, "epoch": 2685} {"train_loss": -42.33692169189453, "global_step": 324956, "epoch": 2685} {"train_loss": -40.88978958129883, "global_step": 324957, "epoch": 2685} {"train_loss": -42.9332275390625, "global_step": 324958, "epoch": 2685} {"train_loss": -42.4492301940918, "global_step": 324959, "epoch": 2685} {"train_loss": -42.49880599975586, "global_step": 324960, "epoch": 2685} {"train_loss": -39.991703033447266, "global_step": 324961, "epoch": 2685} {"train_loss": -42.222373962402344, "global_step": 324962, "epoch": 2685} {"train_loss": -42.784969329833984, "global_step": 324963, "epoch": 2685} {"train_loss": -42.69562530517578, "global_step": 324964, "epoch": 2685} {"train_loss": -42.3751220703125, "global_step": 324965, "epoch": 2685} {"train_loss": -41.37415313720703, "global_step": 324966, "epoch": 2685} {"train_loss": -42.58729934692383, "global_step": 324967, "epoch": 2685} {"train_loss": -43.23953628540039, "global_step": 324968, "epoch": 2685} {"train_loss": -43.602962493896484, "global_step": 324969, "epoch": 2685} {"train_loss": -42.57902145385742, "global_step": 324970, "epoch": 2685} {"train_loss": -43.200008392333984, "global_step": 324971, "epoch": 2685} {"train_loss": -42.70113754272461, "global_step": 324972, "epoch": 2685} {"train_loss": -41.885040283203125, "global_step": 324973, "epoch": 2685} {"train_loss": -42.1247673034668, "global_step": 324974, "epoch": 2685} {"train_loss": -41.63920974731445, "global_step": 324975, "epoch": 2685} {"train_loss": -41.78252029418945, "global_step": 324976, "epoch": 2685} {"train_loss": -42.426788330078125, "global_step": 324977, "epoch": 2685} {"train_loss": -43.246490478515625, "global_step": 324978, "epoch": 2685} {"train_loss": -42.252349853515625, "global_step": 324979, "epoch": 2685} {"train_loss": -43.121334075927734, "global_step": 324980, "epoch": 2685} {"train_loss": -43.78271484375, "global_step": 324981, "epoch": 2685} {"train_loss": -43.27633285522461, "global_step": 324982, "epoch": 2685} {"train_loss": -43.218353271484375, "global_step": 324983, "epoch": 2685} {"train_loss": -43.09843826293945, "global_step": 324984, "epoch": 2685} {"train_loss": -42.67338180541992, "global_step": 324985, "epoch": 2685} {"train_loss": -42.54392623901367, "global_step": 324986, "epoch": 2685} {"train_loss": -43.47514724731445, "global_step": 324987, "epoch": 2685} {"train_loss": -43.173744201660156, "global_step": 324988, "epoch": 2685} {"train_loss": -43.746002197265625, "global_step": 324989, "epoch": 2685} {"train_loss": -43.96040725708008, "global_step": 324990, "epoch": 2685} {"train_loss": -42.9954719543457, "global_step": 324991, "epoch": 2685} {"train_loss": -43.455116271972656, "global_step": 324992, "epoch": 2685} {"train_loss": -43.1939811706543, "global_step": 324993, "epoch": 2685} {"train_loss": -43.552459716796875, "global_step": 324994, "epoch": 2685} {"train_loss": -43.8521842956543, "global_step": 324995, "epoch": 2685} {"train_loss": -42.74168014526367, "global_step": 324996, "epoch": 2685} {"train_loss": -42.94842529296875, "global_step": 324997, "epoch": 2685} {"train_loss": -42.91842269897461, "global_step": 324998, "epoch": 2685} {"train_loss": -43.40581130981445, "global_step": 324999, "epoch": 2685} {"train_loss": -43.441158294677734, "global_step": 325000, "epoch": 2685} {"train_loss": -38.829036712646484, "global_step": 325001, "epoch": 2685} {"train_loss": -43.04090881347656, "global_step": 325002, "epoch": 2685} {"train_loss": -43.855159759521484, "global_step": 325003, "epoch": 2685} {"train_loss": -43.92684555053711, "global_step": 325004, "epoch": 2685} {"train_loss": -42.448736080453415, "global_step": 325005, "epoch": 2685, "val_loss": 2843666.75} {"train_loss": -43.21442794799805, "global_step": 325006, "epoch": 2686} {"train_loss": -43.5919075012207, "global_step": 325007, "epoch": 2686} {"train_loss": -43.00886917114258, "global_step": 325008, "epoch": 2686} {"train_loss": -42.40389633178711, "global_step": 325009, "epoch": 2686} {"train_loss": -42.64670944213867, "global_step": 325010, "epoch": 2686} {"train_loss": -43.129127502441406, "global_step": 325011, "epoch": 2686} {"train_loss": -42.11783981323242, "global_step": 325012, "epoch": 2686} {"train_loss": -42.423858642578125, "global_step": 325013, "epoch": 2686} {"train_loss": -43.018455505371094, "global_step": 325014, "epoch": 2686} {"train_loss": -43.67879104614258, "global_step": 325015, "epoch": 2686} {"train_loss": -40.951637268066406, "global_step": 325016, "epoch": 2686} {"train_loss": -42.77998733520508, "global_step": 325017, "epoch": 2686} {"train_loss": -42.5710334777832, "global_step": 325018, "epoch": 2686} {"train_loss": -43.3757209777832, "global_step": 325019, "epoch": 2686} {"train_loss": -42.35612106323242, "global_step": 325020, "epoch": 2686} {"train_loss": -43.47200393676758, "global_step": 325021, "epoch": 2686} {"train_loss": -43.231544494628906, "global_step": 325022, "epoch": 2686} {"train_loss": -43.446590423583984, "global_step": 325023, "epoch": 2686} {"train_loss": -42.79572677612305, "global_step": 325024, "epoch": 2686} {"train_loss": -42.4060173034668, "global_step": 325025, "epoch": 2686} {"train_loss": -43.15670394897461, "global_step": 325026, "epoch": 2686} {"train_loss": -43.047115325927734, "global_step": 325027, "epoch": 2686} {"train_loss": -43.72111511230469, "global_step": 325028, "epoch": 2686} {"train_loss": -43.03498077392578, "global_step": 325029, "epoch": 2686} {"train_loss": -42.714111328125, "global_step": 325030, "epoch": 2686} {"train_loss": -41.76662826538086, "global_step": 325031, "epoch": 2686} {"train_loss": -41.811771392822266, "global_step": 325032, "epoch": 2686} {"train_loss": -42.83081817626953, "global_step": 325033, "epoch": 2686} {"train_loss": -43.29893112182617, "global_step": 325034, "epoch": 2686} {"train_loss": -42.49210739135742, "global_step": 325035, "epoch": 2686} {"train_loss": -41.01222610473633, "global_step": 325036, "epoch": 2686} {"train_loss": -39.2673225402832, "global_step": 325037, "epoch": 2686} {"train_loss": -41.505210876464844, "global_step": 325038, "epoch": 2686} {"train_loss": -43.37831497192383, "global_step": 325039, "epoch": 2686} {"train_loss": -40.47209548950195, "global_step": 325040, "epoch": 2686} {"train_loss": -40.78256607055664, "global_step": 325041, "epoch": 2686} {"train_loss": -41.85519027709961, "global_step": 325042, "epoch": 2686} {"train_loss": -41.5267333984375, "global_step": 325043, "epoch": 2686} {"train_loss": -40.4965705871582, "global_step": 325044, "epoch": 2686} {"train_loss": -38.82804489135742, "global_step": 325045, "epoch": 2686} {"train_loss": -41.56279373168945, "global_step": 325046, "epoch": 2686} {"train_loss": -39.96281814575195, "global_step": 325047, "epoch": 2686} {"train_loss": -41.3228874206543, "global_step": 325048, "epoch": 2686} {"train_loss": -40.72401428222656, "global_step": 325049, "epoch": 2686} {"train_loss": -42.31927490234375, "global_step": 325050, "epoch": 2686} {"train_loss": -42.65212631225586, "global_step": 325051, "epoch": 2686} {"train_loss": -40.301055908203125, "global_step": 325052, "epoch": 2686} {"train_loss": -40.93571090698242, "global_step": 325053, "epoch": 2686} {"train_loss": -40.64825439453125, "global_step": 325054, "epoch": 2686} {"train_loss": -38.77287673950195, "global_step": 325055, "epoch": 2686} {"train_loss": -41.17206573486328, "global_step": 325056, "epoch": 2686} {"train_loss": -41.23734664916992, "global_step": 325057, "epoch": 2686} {"train_loss": -40.96826934814453, "global_step": 325058, "epoch": 2686} {"train_loss": -42.73080062866211, "global_step": 325059, "epoch": 2686} {"train_loss": -41.07163619995117, "global_step": 325060, "epoch": 2686} {"train_loss": -42.14911651611328, "global_step": 325061, "epoch": 2686} {"train_loss": -41.25542068481445, "global_step": 325062, "epoch": 2686} {"train_loss": -42.48722457885742, "global_step": 325063, "epoch": 2686} {"train_loss": -41.46661376953125, "global_step": 325064, "epoch": 2686} {"train_loss": -41.93314743041992, "global_step": 325065, "epoch": 2686} {"train_loss": -42.98138427734375, "global_step": 325066, "epoch": 2686} {"train_loss": -41.25797653198242, "global_step": 325067, "epoch": 2686} {"train_loss": -42.72012710571289, "global_step": 325068, "epoch": 2686} {"train_loss": -42.487239837646484, "global_step": 325069, "epoch": 2686} {"train_loss": -42.10321807861328, "global_step": 325070, "epoch": 2686} {"train_loss": -42.73405075073242, "global_step": 325071, "epoch": 2686} {"train_loss": -43.43235778808594, "global_step": 325072, "epoch": 2686} {"train_loss": -43.35588455200195, "global_step": 325073, "epoch": 2686} {"train_loss": -43.04560089111328, "global_step": 325074, "epoch": 2686} {"train_loss": -42.497283935546875, "global_step": 325075, "epoch": 2686} {"train_loss": -43.01878356933594, "global_step": 325076, "epoch": 2686} {"train_loss": -43.286399841308594, "global_step": 325077, "epoch": 2686} {"train_loss": -43.11713409423828, "global_step": 325078, "epoch": 2686} {"train_loss": -43.17064666748047, "global_step": 325079, "epoch": 2686} {"train_loss": -41.04191207885742, "global_step": 325080, "epoch": 2686} {"train_loss": -42.01310348510742, "global_step": 325081, "epoch": 2686} {"train_loss": -43.10023880004883, "global_step": 325082, "epoch": 2686} {"train_loss": -43.21546173095703, "global_step": 325083, "epoch": 2686} {"train_loss": -42.9260368347168, "global_step": 325084, "epoch": 2686} {"train_loss": -41.327510833740234, "global_step": 325085, "epoch": 2686} {"train_loss": -41.744110107421875, "global_step": 325086, "epoch": 2686} {"train_loss": -43.08065414428711, "global_step": 325087, "epoch": 2686} {"train_loss": -43.11777877807617, "global_step": 325088, "epoch": 2686} {"train_loss": -42.006744384765625, "global_step": 325089, "epoch": 2686} {"train_loss": -41.539608001708984, "global_step": 325090, "epoch": 2686} {"train_loss": -43.54983139038086, "global_step": 325091, "epoch": 2686} {"train_loss": -42.66730499267578, "global_step": 325092, "epoch": 2686} {"train_loss": -41.72358322143555, "global_step": 325093, "epoch": 2686} {"train_loss": -42.54698181152344, "global_step": 325094, "epoch": 2686} {"train_loss": -41.796321868896484, "global_step": 325095, "epoch": 2686} {"train_loss": -42.636844635009766, "global_step": 325096, "epoch": 2686} {"train_loss": -42.95149612426758, "global_step": 325097, "epoch": 2686} {"train_loss": -43.53014373779297, "global_step": 325098, "epoch": 2686} {"train_loss": -43.018062591552734, "global_step": 325099, "epoch": 2686} {"train_loss": -41.320919036865234, "global_step": 325100, "epoch": 2686} {"train_loss": -43.189910888671875, "global_step": 325101, "epoch": 2686} {"train_loss": -43.30814743041992, "global_step": 325102, "epoch": 2686} {"train_loss": -41.81319046020508, "global_step": 325103, "epoch": 2686} {"train_loss": -41.36527633666992, "global_step": 325104, "epoch": 2686} {"train_loss": -43.23614501953125, "global_step": 325105, "epoch": 2686} {"train_loss": -43.51055145263672, "global_step": 325106, "epoch": 2686} {"train_loss": -42.75754928588867, "global_step": 325107, "epoch": 2686} {"train_loss": -43.01240539550781, "global_step": 325108, "epoch": 2686} {"train_loss": -43.51420593261719, "global_step": 325109, "epoch": 2686} {"train_loss": -43.57831954956055, "global_step": 325110, "epoch": 2686} {"train_loss": -43.78609848022461, "global_step": 325111, "epoch": 2686} {"train_loss": -43.15118408203125, "global_step": 325112, "epoch": 2686} {"train_loss": -43.8712043762207, "global_step": 325113, "epoch": 2686} {"train_loss": -43.27974319458008, "global_step": 325114, "epoch": 2686} {"train_loss": -43.74867248535156, "global_step": 325115, "epoch": 2686} {"train_loss": -43.512874603271484, "global_step": 325116, "epoch": 2686} {"train_loss": -42.97959518432617, "global_step": 325117, "epoch": 2686} {"train_loss": -42.76475143432617, "global_step": 325118, "epoch": 2686} {"train_loss": -44.045631408691406, "global_step": 325119, "epoch": 2686} {"train_loss": -43.12981033325195, "global_step": 325120, "epoch": 2686} {"train_loss": -43.57012176513672, "global_step": 325121, "epoch": 2686} {"train_loss": -43.61948013305664, "global_step": 325122, "epoch": 2686} {"train_loss": -43.87969207763672, "global_step": 325123, "epoch": 2686} {"train_loss": -43.21403121948242, "global_step": 325124, "epoch": 2686} {"train_loss": -42.6658935546875, "global_step": 325125, "epoch": 2686} {"train_loss": -42.429723566228695, "global_step": 325126, "epoch": 2686, "val_loss": 2935213.25} {"train_loss": -43.74897003173828, "global_step": 325127, "epoch": 2687} {"train_loss": -42.56093978881836, "global_step": 325128, "epoch": 2687} {"train_loss": -42.93523025512695, "global_step": 325129, "epoch": 2687} {"train_loss": -42.819190979003906, "global_step": 325130, "epoch": 2687} {"train_loss": -43.70299530029297, "global_step": 325131, "epoch": 2687} {"train_loss": -43.84845733642578, "global_step": 325132, "epoch": 2687} {"train_loss": -43.05961227416992, "global_step": 325133, "epoch": 2687} {"train_loss": -42.79051208496094, "global_step": 325134, "epoch": 2687} {"train_loss": -43.9756965637207, "global_step": 325135, "epoch": 2687} {"train_loss": -43.553165435791016, "global_step": 325136, "epoch": 2687} {"train_loss": -43.818824768066406, "global_step": 325137, "epoch": 2687} {"train_loss": -43.88665771484375, "global_step": 325138, "epoch": 2687} {"train_loss": -43.509700775146484, "global_step": 325139, "epoch": 2687} {"train_loss": -43.299781799316406, "global_step": 325140, "epoch": 2687} {"train_loss": -42.736228942871094, "global_step": 325141, "epoch": 2687} {"train_loss": -42.06310272216797, "global_step": 325142, "epoch": 2687} {"train_loss": -43.68696975708008, "global_step": 325143, "epoch": 2687} {"train_loss": -42.86419677734375, "global_step": 325144, "epoch": 2687} {"train_loss": -43.902069091796875, "global_step": 325145, "epoch": 2687} {"train_loss": -43.57462692260742, "global_step": 325146, "epoch": 2687} {"train_loss": -42.14127731323242, "global_step": 325147, "epoch": 2687} {"train_loss": -40.191715240478516, "global_step": 325148, "epoch": 2687} {"train_loss": -40.20273971557617, "global_step": 325149, "epoch": 2687} {"train_loss": -41.35646057128906, "global_step": 325150, "epoch": 2687} {"train_loss": -43.43136215209961, "global_step": 325151, "epoch": 2687} {"train_loss": -41.76411056518555, "global_step": 325152, "epoch": 2687} {"train_loss": -40.04572677612305, "global_step": 325153, "epoch": 2687} {"train_loss": -38.87891387939453, "global_step": 325154, "epoch": 2687} {"train_loss": -41.7409553527832, "global_step": 325155, "epoch": 2687} {"train_loss": -42.33696365356445, "global_step": 325156, "epoch": 2687} {"train_loss": -41.66093063354492, "global_step": 325157, "epoch": 2687} {"train_loss": -41.08171463012695, "global_step": 325158, "epoch": 2687} {"train_loss": -43.01081085205078, "global_step": 325159, "epoch": 2687} {"train_loss": -42.42744827270508, "global_step": 325160, "epoch": 2687} {"train_loss": -42.306697845458984, "global_step": 325161, "epoch": 2687} {"train_loss": -43.077850341796875, "global_step": 325162, "epoch": 2687} {"train_loss": -42.978004455566406, "global_step": 325163, "epoch": 2687} {"train_loss": -41.04494094848633, "global_step": 325164, "epoch": 2687} {"train_loss": -41.86611557006836, "global_step": 325165, "epoch": 2687} {"train_loss": -43.07636642456055, "global_step": 325166, "epoch": 2687} {"train_loss": -42.0805778503418, "global_step": 325167, "epoch": 2687} {"train_loss": -41.24540710449219, "global_step": 325168, "epoch": 2687} {"train_loss": -43.10612869262695, "global_step": 325169, "epoch": 2687} {"train_loss": -41.41350173950195, "global_step": 325170, "epoch": 2687} {"train_loss": -41.56767654418945, "global_step": 325171, "epoch": 2687} {"train_loss": -42.332637786865234, "global_step": 325172, "epoch": 2687} {"train_loss": -42.85929489135742, "global_step": 325173, "epoch": 2687} {"train_loss": -41.171913146972656, "global_step": 325174, "epoch": 2687} {"train_loss": -43.509185791015625, "global_step": 325175, "epoch": 2687} {"train_loss": -42.713653564453125, "global_step": 325176, "epoch": 2687} {"train_loss": -40.480098724365234, "global_step": 325177, "epoch": 2687} {"train_loss": -42.98731231689453, "global_step": 325178, "epoch": 2687} {"train_loss": -42.029205322265625, "global_step": 325179, "epoch": 2687} {"train_loss": -42.152076721191406, "global_step": 325180, "epoch": 2687} {"train_loss": -43.08883285522461, "global_step": 325181, "epoch": 2687} {"train_loss": -42.53160095214844, "global_step": 325182, "epoch": 2687} {"train_loss": -42.9892692565918, "global_step": 325183, "epoch": 2687} {"train_loss": -42.889400482177734, "global_step": 325184, "epoch": 2687} {"train_loss": -41.976104736328125, "global_step": 325185, "epoch": 2687} {"train_loss": -43.287750244140625, "global_step": 325186, "epoch": 2687} {"train_loss": -43.10075378417969, "global_step": 325187, "epoch": 2687} {"train_loss": -41.94351577758789, "global_step": 325188, "epoch": 2687} {"train_loss": -43.1370735168457, "global_step": 325189, "epoch": 2687} {"train_loss": -41.83555221557617, "global_step": 325190, "epoch": 2687} {"train_loss": -42.95667266845703, "global_step": 325191, "epoch": 2687} {"train_loss": -42.8962516784668, "global_step": 325192, "epoch": 2687} {"train_loss": -41.83454132080078, "global_step": 325193, "epoch": 2687} {"train_loss": -44.135040283203125, "global_step": 325194, "epoch": 2687} {"train_loss": -42.07596206665039, "global_step": 325195, "epoch": 2687} {"train_loss": -43.14034652709961, "global_step": 325196, "epoch": 2687} {"train_loss": -43.477813720703125, "global_step": 325197, "epoch": 2687} {"train_loss": -42.88826370239258, "global_step": 325198, "epoch": 2687} {"train_loss": -43.25197219848633, "global_step": 325199, "epoch": 2687} {"train_loss": -40.897159576416016, "global_step": 325200, "epoch": 2687} {"train_loss": -43.77587890625, "global_step": 325201, "epoch": 2687} {"train_loss": -42.82503890991211, "global_step": 325202, "epoch": 2687} {"train_loss": -43.24376678466797, "global_step": 325203, "epoch": 2687} {"train_loss": -42.836570739746094, "global_step": 325204, "epoch": 2687} {"train_loss": -43.09796142578125, "global_step": 325205, "epoch": 2687} {"train_loss": -43.60663604736328, "global_step": 325206, "epoch": 2687} {"train_loss": -42.51034164428711, "global_step": 325207, "epoch": 2687} {"train_loss": -43.01411819458008, "global_step": 325208, "epoch": 2687} {"train_loss": -42.817604064941406, "global_step": 325209, "epoch": 2687} {"train_loss": -43.632572174072266, "global_step": 325210, "epoch": 2687} {"train_loss": -43.26711654663086, "global_step": 325211, "epoch": 2687} {"train_loss": -43.439613342285156, "global_step": 325212, "epoch": 2687} {"train_loss": -43.33564376831055, "global_step": 325213, "epoch": 2687} {"train_loss": -42.78678512573242, "global_step": 325214, "epoch": 2687} {"train_loss": -43.48579025268555, "global_step": 325215, "epoch": 2687} {"train_loss": -43.53900146484375, "global_step": 325216, "epoch": 2687} {"train_loss": -43.82291793823242, "global_step": 325217, "epoch": 2687} {"train_loss": -43.42574691772461, "global_step": 325218, "epoch": 2687} {"train_loss": -43.623504638671875, "global_step": 325219, "epoch": 2687} {"train_loss": -43.714576721191406, "global_step": 325220, "epoch": 2687} {"train_loss": -43.30532455444336, "global_step": 325221, "epoch": 2687} {"train_loss": -44.10579299926758, "global_step": 325222, "epoch": 2687} {"train_loss": -43.260406494140625, "global_step": 325223, "epoch": 2687} {"train_loss": -43.94378662109375, "global_step": 325224, "epoch": 2687} {"train_loss": -43.526546478271484, "global_step": 325225, "epoch": 2687} {"train_loss": -43.863094329833984, "global_step": 325226, "epoch": 2687} {"train_loss": -43.641666412353516, "global_step": 325227, "epoch": 2687} {"train_loss": -43.1274299621582, "global_step": 325228, "epoch": 2687} {"train_loss": -43.84915542602539, "global_step": 325229, "epoch": 2687} {"train_loss": -43.88614273071289, "global_step": 325230, "epoch": 2687} {"train_loss": -43.74607467651367, "global_step": 325231, "epoch": 2687} {"train_loss": -44.10826110839844, "global_step": 325232, "epoch": 2687} {"train_loss": -43.64854049682617, "global_step": 325233, "epoch": 2687} {"train_loss": -43.922481536865234, "global_step": 325234, "epoch": 2687} {"train_loss": -43.58036422729492, "global_step": 325235, "epoch": 2687} {"train_loss": -43.9783935546875, "global_step": 325236, "epoch": 2687} {"train_loss": -43.71208572387695, "global_step": 325237, "epoch": 2687} {"train_loss": -43.46116256713867, "global_step": 325238, "epoch": 2687} {"train_loss": -43.980934143066406, "global_step": 325239, "epoch": 2687} {"train_loss": -43.72324752807617, "global_step": 325240, "epoch": 2687} {"train_loss": -43.517181396484375, "global_step": 325241, "epoch": 2687} {"train_loss": -42.8730583190918, "global_step": 325242, "epoch": 2687} {"train_loss": -44.46501541137695, "global_step": 325243, "epoch": 2687} {"train_loss": -42.96409225463867, "global_step": 325244, "epoch": 2687} {"train_loss": -42.16413879394531, "global_step": 325245, "epoch": 2687} {"train_loss": -42.192195892333984, "global_step": 325246, "epoch": 2687} {"train_loss": -42.86392842442536, "global_step": 325247, "epoch": 2687, "val_loss": 2780577.0} {"train_loss": -43.12848663330078, "global_step": 325248, "epoch": 2688} {"train_loss": -43.61806869506836, "global_step": 325249, "epoch": 2688} {"train_loss": -41.69771194458008, "global_step": 325250, "epoch": 2688} {"train_loss": -41.11033248901367, "global_step": 325251, "epoch": 2688} {"train_loss": -42.499481201171875, "global_step": 325252, "epoch": 2688} {"train_loss": -42.49748611450195, "global_step": 325253, "epoch": 2688} {"train_loss": -43.37872314453125, "global_step": 325254, "epoch": 2688} {"train_loss": -41.47871780395508, "global_step": 325255, "epoch": 2688} {"train_loss": -42.82223129272461, "global_step": 325256, "epoch": 2688} {"train_loss": -41.877044677734375, "global_step": 325257, "epoch": 2688} {"train_loss": -42.85723114013672, "global_step": 325258, "epoch": 2688} {"train_loss": -39.694923400878906, "global_step": 325259, "epoch": 2688} {"train_loss": -41.28219223022461, "global_step": 325260, "epoch": 2688} {"train_loss": -41.65567398071289, "global_step": 325261, "epoch": 2688} {"train_loss": -39.47983932495117, "global_step": 325262, "epoch": 2688} {"train_loss": -42.00474548339844, "global_step": 325263, "epoch": 2688} {"train_loss": -42.746700286865234, "global_step": 325264, "epoch": 2688} {"train_loss": -39.327674865722656, "global_step": 325265, "epoch": 2688} {"train_loss": -41.7278938293457, "global_step": 325266, "epoch": 2688} {"train_loss": -40.554473876953125, "global_step": 325267, "epoch": 2688} {"train_loss": -42.10283660888672, "global_step": 325268, "epoch": 2688} {"train_loss": -40.74603271484375, "global_step": 325269, "epoch": 2688} {"train_loss": -40.76992416381836, "global_step": 325270, "epoch": 2688} {"train_loss": -42.363746643066406, "global_step": 325271, "epoch": 2688} {"train_loss": -38.40782928466797, "global_step": 325272, "epoch": 2688} {"train_loss": -42.41435241699219, "global_step": 325273, "epoch": 2688} {"train_loss": -41.76279830932617, "global_step": 325274, "epoch": 2688} {"train_loss": -40.774776458740234, "global_step": 325275, "epoch": 2688} {"train_loss": -43.01998519897461, "global_step": 325276, "epoch": 2688} {"train_loss": -42.8092155456543, "global_step": 325277, "epoch": 2688} {"train_loss": -40.63486862182617, "global_step": 325278, "epoch": 2688} {"train_loss": -42.5676155090332, "global_step": 325279, "epoch": 2688} {"train_loss": -41.876502990722656, "global_step": 325280, "epoch": 2688} {"train_loss": -41.96468734741211, "global_step": 325281, "epoch": 2688} {"train_loss": -43.22663497924805, "global_step": 325282, "epoch": 2688} {"train_loss": -42.60250473022461, "global_step": 325283, "epoch": 2688} {"train_loss": -42.51068115234375, "global_step": 325284, "epoch": 2688} {"train_loss": -42.23414611816406, "global_step": 325285, "epoch": 2688} {"train_loss": -43.006954193115234, "global_step": 325286, "epoch": 2688} {"train_loss": -42.87290573120117, "global_step": 325287, "epoch": 2688} {"train_loss": -42.926002502441406, "global_step": 325288, "epoch": 2688} {"train_loss": -43.06452560424805, "global_step": 325289, "epoch": 2688} {"train_loss": -43.19234085083008, "global_step": 325290, "epoch": 2688} {"train_loss": -43.36870193481445, "global_step": 325291, "epoch": 2688} {"train_loss": -43.66070556640625, "global_step": 325292, "epoch": 2688} {"train_loss": -42.4760856628418, "global_step": 325293, "epoch": 2688} {"train_loss": -43.536659240722656, "global_step": 325294, "epoch": 2688} {"train_loss": -42.81206130981445, "global_step": 325295, "epoch": 2688} {"train_loss": -43.60270690917969, "global_step": 325296, "epoch": 2688} {"train_loss": -43.70746612548828, "global_step": 325297, "epoch": 2688} {"train_loss": -43.37523651123047, "global_step": 325298, "epoch": 2688} {"train_loss": -44.11381149291992, "global_step": 325299, "epoch": 2688} {"train_loss": -42.96282958984375, "global_step": 325300, "epoch": 2688} {"train_loss": -43.91561508178711, "global_step": 325301, "epoch": 2688} {"train_loss": -43.374916076660156, "global_step": 325302, "epoch": 2688} {"train_loss": -42.93933868408203, "global_step": 325303, "epoch": 2688} {"train_loss": -44.13291549682617, "global_step": 325304, "epoch": 2688} {"train_loss": -43.20339584350586, "global_step": 325305, "epoch": 2688} {"train_loss": -43.869991302490234, "global_step": 325306, "epoch": 2688} {"train_loss": -44.17444610595703, "global_step": 325307, "epoch": 2688} {"train_loss": -43.836544036865234, "global_step": 325308, "epoch": 2688} {"train_loss": -44.15877914428711, "global_step": 325309, "epoch": 2688} {"train_loss": -43.88001251220703, "global_step": 325310, "epoch": 2688} {"train_loss": -44.01240921020508, "global_step": 325311, "epoch": 2688} {"train_loss": -44.237586975097656, "global_step": 325312, "epoch": 2688} {"train_loss": -44.55003356933594, "global_step": 325313, "epoch": 2688} {"train_loss": -44.47377395629883, "global_step": 325314, "epoch": 2688} {"train_loss": -44.34724044799805, "global_step": 325315, "epoch": 2688} {"train_loss": -43.90129470825195, "global_step": 325316, "epoch": 2688} {"train_loss": -43.60417938232422, "global_step": 325317, "epoch": 2688} {"train_loss": -44.55567932128906, "global_step": 325318, "epoch": 2688} {"train_loss": -43.79413986206055, "global_step": 325319, "epoch": 2688} {"train_loss": -43.83733367919922, "global_step": 325320, "epoch": 2688} {"train_loss": -42.77903366088867, "global_step": 325321, "epoch": 2688} {"train_loss": -42.773555755615234, "global_step": 325322, "epoch": 2688} {"train_loss": -42.53693389892578, "global_step": 325323, "epoch": 2688} {"train_loss": -41.438232421875, "global_step": 325324, "epoch": 2688} {"train_loss": -42.48398971557617, "global_step": 325325, "epoch": 2688} {"train_loss": -42.857818603515625, "global_step": 325326, "epoch": 2688} {"train_loss": -42.81948471069336, "global_step": 325327, "epoch": 2688} {"train_loss": -41.87517166137695, "global_step": 325328, "epoch": 2688} {"train_loss": -40.00350570678711, "global_step": 325329, "epoch": 2688} {"train_loss": -39.53498458862305, "global_step": 325330, "epoch": 2688} {"train_loss": -43.213714599609375, "global_step": 325331, "epoch": 2688} {"train_loss": -42.17462158203125, "global_step": 325332, "epoch": 2688} {"train_loss": -37.44191360473633, "global_step": 325333, "epoch": 2688} {"train_loss": -41.122676849365234, "global_step": 325334, "epoch": 2688} {"train_loss": -42.375492095947266, "global_step": 325335, "epoch": 2688} {"train_loss": -41.931800842285156, "global_step": 325336, "epoch": 2688} {"train_loss": -41.412147521972656, "global_step": 325337, "epoch": 2688} {"train_loss": -42.87346649169922, "global_step": 325338, "epoch": 2688} {"train_loss": -43.78997039794922, "global_step": 325339, "epoch": 2688} {"train_loss": -43.109039306640625, "global_step": 325340, "epoch": 2688} {"train_loss": -43.44963455200195, "global_step": 325341, "epoch": 2688} {"train_loss": -43.541847229003906, "global_step": 325342, "epoch": 2688} {"train_loss": -42.951168060302734, "global_step": 325343, "epoch": 2688} {"train_loss": -42.877506256103516, "global_step": 325344, "epoch": 2688} {"train_loss": -43.82032012939453, "global_step": 325345, "epoch": 2688} {"train_loss": -43.12077331542969, "global_step": 325346, "epoch": 2688} {"train_loss": -43.13941192626953, "global_step": 325347, "epoch": 2688} {"train_loss": -43.9520378112793, "global_step": 325348, "epoch": 2688} {"train_loss": -43.36585235595703, "global_step": 325349, "epoch": 2688} {"train_loss": -43.20567321777344, "global_step": 325350, "epoch": 2688} {"train_loss": -44.0328254699707, "global_step": 325351, "epoch": 2688} {"train_loss": -43.67927551269531, "global_step": 325352, "epoch": 2688} {"train_loss": -43.68927764892578, "global_step": 325353, "epoch": 2688} {"train_loss": -43.912410736083984, "global_step": 325354, "epoch": 2688} {"train_loss": -44.0710563659668, "global_step": 325355, "epoch": 2688} {"train_loss": -43.45296096801758, "global_step": 325356, "epoch": 2688} {"train_loss": -43.54575729370117, "global_step": 325357, "epoch": 2688} {"train_loss": -41.902366638183594, "global_step": 325358, "epoch": 2688} {"train_loss": -43.83246994018555, "global_step": 325359, "epoch": 2688} {"train_loss": -42.25149917602539, "global_step": 325360, "epoch": 2688} {"train_loss": -42.22907638549805, "global_step": 325361, "epoch": 2688} {"train_loss": -43.25258255004883, "global_step": 325362, "epoch": 2688} {"train_loss": -42.22489547729492, "global_step": 325363, "epoch": 2688} {"train_loss": -39.52192306518555, "global_step": 325364, "epoch": 2688} {"train_loss": -42.999080657958984, "global_step": 325365, "epoch": 2688} {"train_loss": -38.825130462646484, "global_step": 325366, "epoch": 2688} {"train_loss": -42.36005783081055, "global_step": 325367, "epoch": 2688} {"train_loss": -42.61363194993705, "global_step": 325368, "epoch": 2688, "val_loss": 2730232.75} {"train_loss": -32.51750946044922, "global_step": 325369, "epoch": 2689} {"train_loss": -33.82162094116211, "global_step": 325370, "epoch": 2689} {"train_loss": -41.91989517211914, "global_step": 325371, "epoch": 2689} {"train_loss": -41.54384231567383, "global_step": 325372, "epoch": 2689} {"train_loss": -40.717376708984375, "global_step": 325373, "epoch": 2689} {"train_loss": -40.62346267700195, "global_step": 325374, "epoch": 2689} {"train_loss": -37.6712760925293, "global_step": 325375, "epoch": 2689} {"train_loss": -32.01248550415039, "global_step": 325376, "epoch": 2689} {"train_loss": -34.44270324707031, "global_step": 325377, "epoch": 2689} {"train_loss": -36.22399139404297, "global_step": 325378, "epoch": 2689} {"train_loss": -32.339298248291016, "global_step": 325379, "epoch": 2689} {"train_loss": -36.299530029296875, "global_step": 325380, "epoch": 2689} {"train_loss": -38.24940872192383, "global_step": 325381, "epoch": 2689} {"train_loss": -36.86039352416992, "global_step": 325382, "epoch": 2689} {"train_loss": -39.45881652832031, "global_step": 325383, "epoch": 2689} {"train_loss": -36.597267150878906, "global_step": 325384, "epoch": 2689} {"train_loss": -38.509151458740234, "global_step": 325385, "epoch": 2689} {"train_loss": -36.863670349121094, "global_step": 325386, "epoch": 2689} {"train_loss": -26.110937118530273, "global_step": 325387, "epoch": 2689} {"train_loss": -38.65067672729492, "global_step": 325388, "epoch": 2689} {"train_loss": -37.28506088256836, "global_step": 325389, "epoch": 2689} {"train_loss": -36.0990104675293, "global_step": 325390, "epoch": 2689} {"train_loss": -35.19143295288086, "global_step": 325391, "epoch": 2689} {"train_loss": -37.686405181884766, "global_step": 325392, "epoch": 2689} {"train_loss": -36.10321044921875, "global_step": 325393, "epoch": 2689} {"train_loss": -40.3033561706543, "global_step": 325394, "epoch": 2689} {"train_loss": -38.693477630615234, "global_step": 325395, "epoch": 2689} {"train_loss": -37.19575119018555, "global_step": 325396, "epoch": 2689} {"train_loss": -34.61796188354492, "global_step": 325397, "epoch": 2689} {"train_loss": -39.40535354614258, "global_step": 325398, "epoch": 2689} {"train_loss": -37.41524124145508, "global_step": 325399, "epoch": 2689} {"train_loss": -38.054405212402344, "global_step": 325400, "epoch": 2689} {"train_loss": -41.98687744140625, "global_step": 325401, "epoch": 2689} {"train_loss": -38.03704071044922, "global_step": 325402, "epoch": 2689} {"train_loss": -37.63697814941406, "global_step": 325403, "epoch": 2689} {"train_loss": -39.046592712402344, "global_step": 325404, "epoch": 2689} {"train_loss": -36.0959358215332, "global_step": 325405, "epoch": 2689} {"train_loss": -38.61585235595703, "global_step": 325406, "epoch": 2689} {"train_loss": -35.95094680786133, "global_step": 325407, "epoch": 2689} {"train_loss": -40.886165618896484, "global_step": 325408, "epoch": 2689} {"train_loss": -37.66169357299805, "global_step": 325409, "epoch": 2689} {"train_loss": -40.4326286315918, "global_step": 325410, "epoch": 2689} {"train_loss": -40.91722869873047, "global_step": 325411, "epoch": 2689} {"train_loss": -39.75859832763672, "global_step": 325412, "epoch": 2689} {"train_loss": -39.648414611816406, "global_step": 325413, "epoch": 2689} {"train_loss": -41.3380012512207, "global_step": 325414, "epoch": 2689} {"train_loss": -39.24761962890625, "global_step": 325415, "epoch": 2689} {"train_loss": -40.973506927490234, "global_step": 325416, "epoch": 2689} {"train_loss": -40.43682861328125, "global_step": 325417, "epoch": 2689} {"train_loss": -40.0761604309082, "global_step": 325418, "epoch": 2689} {"train_loss": -40.71904373168945, "global_step": 325419, "epoch": 2689} {"train_loss": -40.74434280395508, "global_step": 325420, "epoch": 2689} {"train_loss": -39.64809799194336, "global_step": 325421, "epoch": 2689} {"train_loss": -38.41172409057617, "global_step": 325422, "epoch": 2689} {"train_loss": -40.66706466674805, "global_step": 325423, "epoch": 2689} {"train_loss": -41.52580261230469, "global_step": 325424, "epoch": 2689} {"train_loss": -41.610374450683594, "global_step": 325425, "epoch": 2689} {"train_loss": -41.47849655151367, "global_step": 325426, "epoch": 2689} {"train_loss": -39.724449157714844, "global_step": 325427, "epoch": 2689} {"train_loss": -41.21931076049805, "global_step": 325428, "epoch": 2689} {"train_loss": -41.075172424316406, "global_step": 325429, "epoch": 2689} {"train_loss": -39.070735931396484, "global_step": 325430, "epoch": 2689} {"train_loss": -41.839744567871094, "global_step": 325431, "epoch": 2689} {"train_loss": -40.75741195678711, "global_step": 325432, "epoch": 2689} {"train_loss": -39.01008224487305, "global_step": 325433, "epoch": 2689} {"train_loss": -41.17625045776367, "global_step": 325434, "epoch": 2689} {"train_loss": -42.36991882324219, "global_step": 325435, "epoch": 2689} {"train_loss": -40.685630798339844, "global_step": 325436, "epoch": 2689} {"train_loss": -41.91310501098633, "global_step": 325437, "epoch": 2689} {"train_loss": -41.701412200927734, "global_step": 325438, "epoch": 2689} {"train_loss": -41.63037109375, "global_step": 325439, "epoch": 2689} {"train_loss": -41.819583892822266, "global_step": 325440, "epoch": 2689} {"train_loss": -41.37484359741211, "global_step": 325441, "epoch": 2689} {"train_loss": -42.027252197265625, "global_step": 325442, "epoch": 2689} {"train_loss": -41.451637268066406, "global_step": 325443, "epoch": 2689} {"train_loss": -41.70130920410156, "global_step": 325444, "epoch": 2689} {"train_loss": -41.21271896362305, "global_step": 325445, "epoch": 2689} {"train_loss": -41.467159271240234, "global_step": 325446, "epoch": 2689} {"train_loss": -42.21140670776367, "global_step": 325447, "epoch": 2689} {"train_loss": -41.533695220947266, "global_step": 325448, "epoch": 2689} {"train_loss": -41.35932540893555, "global_step": 325449, "epoch": 2689} {"train_loss": -40.6822624206543, "global_step": 325450, "epoch": 2689} {"train_loss": -41.422908782958984, "global_step": 325451, "epoch": 2689} {"train_loss": -42.4553337097168, "global_step": 325452, "epoch": 2689} {"train_loss": -41.98223876953125, "global_step": 325453, "epoch": 2689} {"train_loss": -42.178428649902344, "global_step": 325454, "epoch": 2689} {"train_loss": -42.01705551147461, "global_step": 325455, "epoch": 2689} {"train_loss": -42.20486068725586, "global_step": 325456, "epoch": 2689} {"train_loss": -42.83339309692383, "global_step": 325457, "epoch": 2689} {"train_loss": -41.744476318359375, "global_step": 325458, "epoch": 2689} {"train_loss": -42.8047981262207, "global_step": 325459, "epoch": 2689} {"train_loss": -42.37775802612305, "global_step": 325460, "epoch": 2689} {"train_loss": -42.740081787109375, "global_step": 325461, "epoch": 2689} {"train_loss": -42.80799102783203, "global_step": 325462, "epoch": 2689} {"train_loss": -42.49538803100586, "global_step": 325463, "epoch": 2689} {"train_loss": -42.88418197631836, "global_step": 325464, "epoch": 2689} {"train_loss": -42.572879791259766, "global_step": 325465, "epoch": 2689} {"train_loss": -42.61418533325195, "global_step": 325466, "epoch": 2689} {"train_loss": -42.553077697753906, "global_step": 325467, "epoch": 2689} {"train_loss": -42.92449951171875, "global_step": 325468, "epoch": 2689} {"train_loss": -42.65452194213867, "global_step": 325469, "epoch": 2689} {"train_loss": -42.626895904541016, "global_step": 325470, "epoch": 2689} {"train_loss": -43.1090202331543, "global_step": 325471, "epoch": 2689} {"train_loss": -42.736083984375, "global_step": 325472, "epoch": 2689} {"train_loss": -42.49720001220703, "global_step": 325473, "epoch": 2689} {"train_loss": -43.33173751831055, "global_step": 325474, "epoch": 2689} {"train_loss": -43.313323974609375, "global_step": 325475, "epoch": 2689} {"train_loss": -42.95903015136719, "global_step": 325476, "epoch": 2689} {"train_loss": -43.32014846801758, "global_step": 325477, "epoch": 2689} {"train_loss": -43.16642761230469, "global_step": 325478, "epoch": 2689} {"train_loss": -42.97624969482422, "global_step": 325479, "epoch": 2689} {"train_loss": -42.663822174072266, "global_step": 325480, "epoch": 2689} {"train_loss": -43.428321838378906, "global_step": 325481, "epoch": 2689} {"train_loss": -42.395416259765625, "global_step": 325482, "epoch": 2689} {"train_loss": -42.05910110473633, "global_step": 325483, "epoch": 2689} {"train_loss": -41.97163772583008, "global_step": 325484, "epoch": 2689} {"train_loss": -42.425235748291016, "global_step": 325485, "epoch": 2689} {"train_loss": -43.44932174682617, "global_step": 325486, "epoch": 2689} {"train_loss": -42.52131271362305, "global_step": 325487, "epoch": 2689} {"train_loss": -42.530242919921875, "global_step": 325488, "epoch": 2689} {"train_loss": -40.20608096477414, "global_step": 325489, "epoch": 2689, "val_loss": 2864248.0} {"train_loss": -42.69293975830078, "global_step": 325490, "epoch": 2690} {"train_loss": -43.38351821899414, "global_step": 325491, "epoch": 2690} {"train_loss": -42.9567756652832, "global_step": 325492, "epoch": 2690} {"train_loss": -42.61843490600586, "global_step": 325493, "epoch": 2690} {"train_loss": -42.26477813720703, "global_step": 325494, "epoch": 2690} {"train_loss": -43.1235237121582, "global_step": 325495, "epoch": 2690} {"train_loss": -43.653560638427734, "global_step": 325496, "epoch": 2690} {"train_loss": -43.3131217956543, "global_step": 325497, "epoch": 2690} {"train_loss": -43.4317741394043, "global_step": 325498, "epoch": 2690} {"train_loss": -43.07057571411133, "global_step": 325499, "epoch": 2690} {"train_loss": -43.988861083984375, "global_step": 325500, "epoch": 2690} {"train_loss": -43.66266632080078, "global_step": 325501, "epoch": 2690} {"train_loss": -43.4920768737793, "global_step": 325502, "epoch": 2690} {"train_loss": -43.5346565246582, "global_step": 325503, "epoch": 2690} {"train_loss": -43.02399826049805, "global_step": 325504, "epoch": 2690} {"train_loss": -44.00474166870117, "global_step": 325505, "epoch": 2690} {"train_loss": -43.48342514038086, "global_step": 325506, "epoch": 2690} {"train_loss": -43.242767333984375, "global_step": 325507, "epoch": 2690} {"train_loss": -42.51365280151367, "global_step": 325508, "epoch": 2690} {"train_loss": -43.603919982910156, "global_step": 325509, "epoch": 2690} {"train_loss": -43.86605453491211, "global_step": 325510, "epoch": 2690} {"train_loss": -43.44873046875, "global_step": 325511, "epoch": 2690} {"train_loss": -43.58211135864258, "global_step": 325512, "epoch": 2690} {"train_loss": -42.84861373901367, "global_step": 325513, "epoch": 2690} {"train_loss": -43.34889602661133, "global_step": 325514, "epoch": 2690} {"train_loss": -43.860477447509766, "global_step": 325515, "epoch": 2690} {"train_loss": -44.1764030456543, "global_step": 325516, "epoch": 2690} {"train_loss": -43.49384307861328, "global_step": 325517, "epoch": 2690} {"train_loss": -44.15088653564453, "global_step": 325518, "epoch": 2690} {"train_loss": -42.9879035949707, "global_step": 325519, "epoch": 2690} {"train_loss": -43.36040115356445, "global_step": 325520, "epoch": 2690} {"train_loss": -42.97331237792969, "global_step": 325521, "epoch": 2690} {"train_loss": -43.691436767578125, "global_step": 325522, "epoch": 2690} {"train_loss": -43.88135528564453, "global_step": 325523, "epoch": 2690} {"train_loss": -43.45151138305664, "global_step": 325524, "epoch": 2690} {"train_loss": -43.092811584472656, "global_step": 325525, "epoch": 2690} {"train_loss": -44.12360763549805, "global_step": 325526, "epoch": 2690} {"train_loss": -43.6623649597168, "global_step": 325527, "epoch": 2690} {"train_loss": -43.897212982177734, "global_step": 325528, "epoch": 2690} {"train_loss": -44.30712127685547, "global_step": 325529, "epoch": 2690} {"train_loss": -44.052032470703125, "global_step": 325530, "epoch": 2690} {"train_loss": -43.56879425048828, "global_step": 325531, "epoch": 2690} {"train_loss": -43.493743896484375, "global_step": 325532, "epoch": 2690} {"train_loss": -44.251808166503906, "global_step": 325533, "epoch": 2690} {"train_loss": -44.29053497314453, "global_step": 325534, "epoch": 2690} {"train_loss": -43.66769027709961, "global_step": 325535, "epoch": 2690} {"train_loss": -44.1134033203125, "global_step": 325536, "epoch": 2690} {"train_loss": -44.29857635498047, "global_step": 325537, "epoch": 2690} {"train_loss": -42.86708450317383, "global_step": 325538, "epoch": 2690} {"train_loss": -41.16255569458008, "global_step": 325539, "epoch": 2690} {"train_loss": -35.02345657348633, "global_step": 325540, "epoch": 2690} {"train_loss": -21.9655704498291, "global_step": 325541, "epoch": 2690} {"train_loss": -22.216869354248047, "global_step": 325542, "epoch": 2690} {"train_loss": -40.3911247253418, "global_step": 325543, "epoch": 2690} {"train_loss": -35.249507904052734, "global_step": 325544, "epoch": 2690} {"train_loss": -13.350494384765625, "global_step": 325545, "epoch": 2690} {"train_loss": -27.646459579467773, "global_step": 325546, "epoch": 2690} {"train_loss": -33.30200958251953, "global_step": 325547, "epoch": 2690} {"train_loss": -17.911399841308594, "global_step": 325548, "epoch": 2690} {"train_loss": -33.73155212402344, "global_step": 325549, "epoch": 2690} {"train_loss": -23.71828842163086, "global_step": 325550, "epoch": 2690} {"train_loss": -32.615814208984375, "global_step": 325551, "epoch": 2690} {"train_loss": -31.91583251953125, "global_step": 325552, "epoch": 2690} {"train_loss": -27.595630645751953, "global_step": 325553, "epoch": 2690} {"train_loss": -39.326351165771484, "global_step": 325554, "epoch": 2690} {"train_loss": -29.8070125579834, "global_step": 325555, "epoch": 2690} {"train_loss": -35.09934616088867, "global_step": 325556, "epoch": 2690} {"train_loss": -37.88932418823242, "global_step": 325557, "epoch": 2690} {"train_loss": -32.32171630859375, "global_step": 325558, "epoch": 2690} {"train_loss": -37.724090576171875, "global_step": 325559, "epoch": 2690} {"train_loss": -38.14359664916992, "global_step": 325560, "epoch": 2690} {"train_loss": -35.89608383178711, "global_step": 325561, "epoch": 2690} {"train_loss": -36.164947509765625, "global_step": 325562, "epoch": 2690} {"train_loss": -39.18637466430664, "global_step": 325563, "epoch": 2690} {"train_loss": -37.550594329833984, "global_step": 325564, "epoch": 2690} {"train_loss": -37.50736618041992, "global_step": 325565, "epoch": 2690} {"train_loss": -39.558658599853516, "global_step": 325566, "epoch": 2690} {"train_loss": -39.08808135986328, "global_step": 325567, "epoch": 2690} {"train_loss": -38.30458450317383, "global_step": 325568, "epoch": 2690} {"train_loss": -38.93052291870117, "global_step": 325569, "epoch": 2690} {"train_loss": -40.08686447143555, "global_step": 325570, "epoch": 2690} {"train_loss": -39.300899505615234, "global_step": 325571, "epoch": 2690} {"train_loss": -38.80364990234375, "global_step": 325572, "epoch": 2690} {"train_loss": -39.93134307861328, "global_step": 325573, "epoch": 2690} {"train_loss": -40.740257263183594, "global_step": 325574, "epoch": 2690} {"train_loss": -40.33960723876953, "global_step": 325575, "epoch": 2690} {"train_loss": -39.883575439453125, "global_step": 325576, "epoch": 2690} {"train_loss": -40.6613655090332, "global_step": 325577, "epoch": 2690} {"train_loss": -41.31032943725586, "global_step": 325578, "epoch": 2690} {"train_loss": -40.542823791503906, "global_step": 325579, "epoch": 2690} {"train_loss": -40.163177490234375, "global_step": 325580, "epoch": 2690} {"train_loss": -41.02193069458008, "global_step": 325581, "epoch": 2690} {"train_loss": -40.95808410644531, "global_step": 325582, "epoch": 2690} {"train_loss": -40.85893249511719, "global_step": 325583, "epoch": 2690} {"train_loss": -41.02694320678711, "global_step": 325584, "epoch": 2690} {"train_loss": -40.98086929321289, "global_step": 325585, "epoch": 2690} {"train_loss": -41.64779281616211, "global_step": 325586, "epoch": 2690} {"train_loss": -41.62032699584961, "global_step": 325587, "epoch": 2690} {"train_loss": -41.46570587158203, "global_step": 325588, "epoch": 2690} {"train_loss": -41.08533477783203, "global_step": 325589, "epoch": 2690} {"train_loss": -41.64332580566406, "global_step": 325590, "epoch": 2690} {"train_loss": -41.93558120727539, "global_step": 325591, "epoch": 2690} {"train_loss": -41.43738555908203, "global_step": 325592, "epoch": 2690} {"train_loss": -41.648494720458984, "global_step": 325593, "epoch": 2690} {"train_loss": -41.46409225463867, "global_step": 325594, "epoch": 2690} {"train_loss": -41.91279220581055, "global_step": 325595, "epoch": 2690} {"train_loss": -41.91366195678711, "global_step": 325596, "epoch": 2690} {"train_loss": -41.80740737915039, "global_step": 325597, "epoch": 2690} {"train_loss": -42.19915771484375, "global_step": 325598, "epoch": 2690} {"train_loss": -41.87647247314453, "global_step": 325599, "epoch": 2690} {"train_loss": -42.37942886352539, "global_step": 325600, "epoch": 2690} {"train_loss": -42.24197006225586, "global_step": 325601, "epoch": 2690} {"train_loss": -42.18745803833008, "global_step": 325602, "epoch": 2690} {"train_loss": -41.92655944824219, "global_step": 325603, "epoch": 2690} {"train_loss": -42.2520751953125, "global_step": 325604, "epoch": 2690} {"train_loss": -42.15279769897461, "global_step": 325605, "epoch": 2690} {"train_loss": -42.250831604003906, "global_step": 325606, "epoch": 2690} {"train_loss": -42.1829948425293, "global_step": 325607, "epoch": 2690} {"train_loss": -42.475074768066406, "global_step": 325608, "epoch": 2690} {"train_loss": -42.76994705200195, "global_step": 325609, "epoch": 2690} {"train_loss": -40.148119319568984, "global_step": 325610, "epoch": 2690, "val_loss": 2728860.75} {"train_loss": -42.6766357421875, "global_step": 325611, "epoch": 2691} {"train_loss": -42.583892822265625, "global_step": 325612, "epoch": 2691} {"train_loss": -42.35354232788086, "global_step": 325613, "epoch": 2691} {"train_loss": -42.471656799316406, "global_step": 325614, "epoch": 2691} {"train_loss": -42.8918571472168, "global_step": 325615, "epoch": 2691} {"train_loss": -42.46709060668945, "global_step": 325616, "epoch": 2691} {"train_loss": -42.703922271728516, "global_step": 325617, "epoch": 2691} {"train_loss": -42.902008056640625, "global_step": 325618, "epoch": 2691} {"train_loss": -43.42741012573242, "global_step": 325619, "epoch": 2691} {"train_loss": -43.14255905151367, "global_step": 325620, "epoch": 2691} {"train_loss": -43.24850082397461, "global_step": 325621, "epoch": 2691} {"train_loss": -43.1648063659668, "global_step": 325622, "epoch": 2691} {"train_loss": -43.23405838012695, "global_step": 325623, "epoch": 2691} {"train_loss": -42.90354537963867, "global_step": 325624, "epoch": 2691} {"train_loss": -43.2436408996582, "global_step": 325625, "epoch": 2691} {"train_loss": -43.330299377441406, "global_step": 325626, "epoch": 2691} {"train_loss": -43.11860656738281, "global_step": 325627, "epoch": 2691} {"train_loss": -43.51662826538086, "global_step": 325628, "epoch": 2691} {"train_loss": -43.43375015258789, "global_step": 325629, "epoch": 2691} {"train_loss": -43.263187408447266, "global_step": 325630, "epoch": 2691} {"train_loss": -43.094783782958984, "global_step": 325631, "epoch": 2691} {"train_loss": -43.39960861206055, "global_step": 325632, "epoch": 2691} {"train_loss": -43.20182418823242, "global_step": 325633, "epoch": 2691} {"train_loss": -43.65234375, "global_step": 325634, "epoch": 2691} {"train_loss": -43.3721923828125, "global_step": 325635, "epoch": 2691} {"train_loss": -43.57527542114258, "global_step": 325636, "epoch": 2691} {"train_loss": -43.465511322021484, "global_step": 325637, "epoch": 2691} {"train_loss": -43.3680534362793, "global_step": 325638, "epoch": 2691} {"train_loss": -43.52992630004883, "global_step": 325639, "epoch": 2691} {"train_loss": -43.78749465942383, "global_step": 325640, "epoch": 2691} {"train_loss": -43.745025634765625, "global_step": 325641, "epoch": 2691} {"train_loss": -43.72860336303711, "global_step": 325642, "epoch": 2691} {"train_loss": -44.03548812866211, "global_step": 325643, "epoch": 2691} {"train_loss": -43.92473220825195, "global_step": 325644, "epoch": 2691} {"train_loss": -43.7895622253418, "global_step": 325645, "epoch": 2691} {"train_loss": -44.035621643066406, "global_step": 325646, "epoch": 2691} {"train_loss": -43.591312408447266, "global_step": 325647, "epoch": 2691} {"train_loss": -43.7959098815918, "global_step": 325648, "epoch": 2691} {"train_loss": -43.701168060302734, "global_step": 325649, "epoch": 2691} {"train_loss": -43.884613037109375, "global_step": 325650, "epoch": 2691} {"train_loss": -43.70941925048828, "global_step": 325651, "epoch": 2691} {"train_loss": -43.7022590637207, "global_step": 325652, "epoch": 2691} {"train_loss": -44.11271286010742, "global_step": 325653, "epoch": 2691} {"train_loss": -44.10686492919922, "global_step": 325654, "epoch": 2691} {"train_loss": -44.15883255004883, "global_step": 325655, "epoch": 2691} {"train_loss": -44.07313537597656, "global_step": 325656, "epoch": 2691} {"train_loss": -43.073944091796875, "global_step": 325657, "epoch": 2691} {"train_loss": -43.890567779541016, "global_step": 325658, "epoch": 2691} {"train_loss": -44.296443939208984, "global_step": 325659, "epoch": 2691} {"train_loss": -44.39799499511719, "global_step": 325660, "epoch": 2691} {"train_loss": -44.32372283935547, "global_step": 325661, "epoch": 2691} {"train_loss": -44.05859375, "global_step": 325662, "epoch": 2691} {"train_loss": -44.20970153808594, "global_step": 325663, "epoch": 2691} {"train_loss": -44.434940338134766, "global_step": 325664, "epoch": 2691} {"train_loss": -44.67245864868164, "global_step": 325665, "epoch": 2691} {"train_loss": -44.10331344604492, "global_step": 325666, "epoch": 2691} {"train_loss": -44.76712417602539, "global_step": 325667, "epoch": 2691} {"train_loss": -43.88718795776367, "global_step": 325668, "epoch": 2691} {"train_loss": -44.26914596557617, "global_step": 325669, "epoch": 2691} {"train_loss": -43.79527282714844, "global_step": 325670, "epoch": 2691} {"train_loss": -43.24386215209961, "global_step": 325671, "epoch": 2691} {"train_loss": -44.09426498413086, "global_step": 325672, "epoch": 2691} {"train_loss": -42.605079650878906, "global_step": 325673, "epoch": 2691} {"train_loss": -42.29604721069336, "global_step": 325674, "epoch": 2691} {"train_loss": -43.095638275146484, "global_step": 325675, "epoch": 2691} {"train_loss": -42.12614059448242, "global_step": 325676, "epoch": 2691} {"train_loss": -42.181636810302734, "global_step": 325677, "epoch": 2691} {"train_loss": -40.6280632019043, "global_step": 325678, "epoch": 2691} {"train_loss": -38.948360443115234, "global_step": 325679, "epoch": 2691} {"train_loss": -38.303707122802734, "global_step": 325680, "epoch": 2691} {"train_loss": -40.441925048828125, "global_step": 325681, "epoch": 2691} {"train_loss": -43.26252746582031, "global_step": 325682, "epoch": 2691} {"train_loss": -43.326778411865234, "global_step": 325683, "epoch": 2691} {"train_loss": -41.0111198425293, "global_step": 325684, "epoch": 2691} {"train_loss": -41.8241081237793, "global_step": 325685, "epoch": 2691} {"train_loss": -43.454307556152344, "global_step": 325686, "epoch": 2691} {"train_loss": -40.06602096557617, "global_step": 325687, "epoch": 2691} {"train_loss": -40.443115234375, "global_step": 325688, "epoch": 2691} {"train_loss": -43.150787353515625, "global_step": 325689, "epoch": 2691} {"train_loss": -43.079158782958984, "global_step": 325690, "epoch": 2691} {"train_loss": -36.41180419921875, "global_step": 325691, "epoch": 2691} {"train_loss": -43.40495681762695, "global_step": 325692, "epoch": 2691} {"train_loss": -42.54436111450195, "global_step": 325693, "epoch": 2691} {"train_loss": -42.28501510620117, "global_step": 325694, "epoch": 2691} {"train_loss": -42.31941604614258, "global_step": 325695, "epoch": 2691} {"train_loss": -39.3228759765625, "global_step": 325696, "epoch": 2691} {"train_loss": -41.88339614868164, "global_step": 325697, "epoch": 2691} {"train_loss": -41.673004150390625, "global_step": 325698, "epoch": 2691} {"train_loss": -41.0672721862793, "global_step": 325699, "epoch": 2691} {"train_loss": -42.43472671508789, "global_step": 325700, "epoch": 2691} {"train_loss": -38.195289611816406, "global_step": 325701, "epoch": 2691} {"train_loss": -40.710079193115234, "global_step": 325702, "epoch": 2691} {"train_loss": -40.852561950683594, "global_step": 325703, "epoch": 2691} {"train_loss": -42.10299301147461, "global_step": 325704, "epoch": 2691} {"train_loss": -41.71100997924805, "global_step": 325705, "epoch": 2691} {"train_loss": -42.63374710083008, "global_step": 325706, "epoch": 2691} {"train_loss": -40.76004409790039, "global_step": 325707, "epoch": 2691} {"train_loss": -41.363224029541016, "global_step": 325708, "epoch": 2691} {"train_loss": -39.189453125, "global_step": 325709, "epoch": 2691} {"train_loss": -40.89683151245117, "global_step": 325710, "epoch": 2691} {"train_loss": -42.46443557739258, "global_step": 325711, "epoch": 2691} {"train_loss": -41.939918518066406, "global_step": 325712, "epoch": 2691} {"train_loss": -39.41648483276367, "global_step": 325713, "epoch": 2691} {"train_loss": -38.766151428222656, "global_step": 325714, "epoch": 2691} {"train_loss": -42.09675216674805, "global_step": 325715, "epoch": 2691} {"train_loss": -42.68313217163086, "global_step": 325716, "epoch": 2691} {"train_loss": -40.55208969116211, "global_step": 325717, "epoch": 2691} {"train_loss": -41.859371185302734, "global_step": 325718, "epoch": 2691} {"train_loss": -42.490753173828125, "global_step": 325719, "epoch": 2691} {"train_loss": -40.79867172241211, "global_step": 325720, "epoch": 2691} {"train_loss": -41.52046585083008, "global_step": 325721, "epoch": 2691} {"train_loss": -41.74334716796875, "global_step": 325722, "epoch": 2691} {"train_loss": -39.58979415893555, "global_step": 325723, "epoch": 2691} {"train_loss": -41.39425277709961, "global_step": 325724, "epoch": 2691} {"train_loss": -42.088069915771484, "global_step": 325725, "epoch": 2691} {"train_loss": -41.66072463989258, "global_step": 325726, "epoch": 2691} {"train_loss": -42.08467483520508, "global_step": 325727, "epoch": 2691} {"train_loss": -42.918495178222656, "global_step": 325728, "epoch": 2691} {"train_loss": -41.46342086791992, "global_step": 325729, "epoch": 2691} {"train_loss": -42.87969970703125, "global_step": 325730, "epoch": 2691} {"train_loss": -42.54459109976272, "global_step": 325731, "epoch": 2691, "val_loss": 2809974.0} {"train_loss": -42.966156005859375, "global_step": 325732, "epoch": 2692} {"train_loss": -42.150169372558594, "global_step": 325733, "epoch": 2692} {"train_loss": -43.01431655883789, "global_step": 325734, "epoch": 2692} {"train_loss": -43.47554397583008, "global_step": 325735, "epoch": 2692} {"train_loss": -42.64976119995117, "global_step": 325736, "epoch": 2692} {"train_loss": -41.41094970703125, "global_step": 325737, "epoch": 2692} {"train_loss": -42.7222900390625, "global_step": 325738, "epoch": 2692} {"train_loss": -42.68310546875, "global_step": 325739, "epoch": 2692} {"train_loss": -41.503414154052734, "global_step": 325740, "epoch": 2692} {"train_loss": -43.06648635864258, "global_step": 325741, "epoch": 2692} {"train_loss": -42.352752685546875, "global_step": 325742, "epoch": 2692} {"train_loss": -43.40180969238281, "global_step": 325743, "epoch": 2692} {"train_loss": -41.98143005371094, "global_step": 325744, "epoch": 2692} {"train_loss": -43.45244216918945, "global_step": 325745, "epoch": 2692} {"train_loss": -43.197998046875, "global_step": 325746, "epoch": 2692} {"train_loss": -43.836605072021484, "global_step": 325747, "epoch": 2692} {"train_loss": -41.46035385131836, "global_step": 325748, "epoch": 2692} {"train_loss": -42.90629959106445, "global_step": 325749, "epoch": 2692} {"train_loss": -41.38058853149414, "global_step": 325750, "epoch": 2692} {"train_loss": -42.513057708740234, "global_step": 325751, "epoch": 2692} {"train_loss": -41.75545883178711, "global_step": 325752, "epoch": 2692} {"train_loss": -43.157691955566406, "global_step": 325753, "epoch": 2692} {"train_loss": -41.03071975708008, "global_step": 325754, "epoch": 2692} {"train_loss": -43.032875061035156, "global_step": 325755, "epoch": 2692} {"train_loss": -40.26414489746094, "global_step": 325756, "epoch": 2692} {"train_loss": -43.58342742919922, "global_step": 325757, "epoch": 2692} {"train_loss": -42.7592887878418, "global_step": 325758, "epoch": 2692} {"train_loss": -43.74952697753906, "global_step": 325759, "epoch": 2692} {"train_loss": -43.76941680908203, "global_step": 325760, "epoch": 2692} {"train_loss": -43.71205520629883, "global_step": 325761, "epoch": 2692} {"train_loss": -43.7615852355957, "global_step": 325762, "epoch": 2692} {"train_loss": -43.2104606628418, "global_step": 325763, "epoch": 2692} {"train_loss": -44.087467193603516, "global_step": 325764, "epoch": 2692} {"train_loss": -42.74808883666992, "global_step": 325765, "epoch": 2692} {"train_loss": -43.2723274230957, "global_step": 325766, "epoch": 2692} {"train_loss": -39.656341552734375, "global_step": 325767, "epoch": 2692} {"train_loss": -42.58939743041992, "global_step": 325768, "epoch": 2692} {"train_loss": -43.73051071166992, "global_step": 325769, "epoch": 2692} {"train_loss": -42.20717239379883, "global_step": 325770, "epoch": 2692} {"train_loss": -43.6659049987793, "global_step": 325771, "epoch": 2692} {"train_loss": -42.7996940612793, "global_step": 325772, "epoch": 2692} {"train_loss": -40.47410202026367, "global_step": 325773, "epoch": 2692} {"train_loss": -43.22237014770508, "global_step": 325774, "epoch": 2692} {"train_loss": -43.218990325927734, "global_step": 325775, "epoch": 2692} {"train_loss": -43.8003044128418, "global_step": 325776, "epoch": 2692} {"train_loss": -43.45071029663086, "global_step": 325777, "epoch": 2692} {"train_loss": -42.96842575073242, "global_step": 325778, "epoch": 2692} {"train_loss": -42.59070587158203, "global_step": 325779, "epoch": 2692} {"train_loss": -42.94301223754883, "global_step": 325780, "epoch": 2692} {"train_loss": -42.7821159362793, "global_step": 325781, "epoch": 2692} {"train_loss": -42.22211456298828, "global_step": 325782, "epoch": 2692} {"train_loss": -43.021751403808594, "global_step": 325783, "epoch": 2692} {"train_loss": -43.81661605834961, "global_step": 325784, "epoch": 2692} {"train_loss": -43.09138870239258, "global_step": 325785, "epoch": 2692} {"train_loss": -43.73226547241211, "global_step": 325786, "epoch": 2692} {"train_loss": -43.74380874633789, "global_step": 325787, "epoch": 2692} {"train_loss": -43.16709518432617, "global_step": 325788, "epoch": 2692} {"train_loss": -43.42289733886719, "global_step": 325789, "epoch": 2692} {"train_loss": -43.75339126586914, "global_step": 325790, "epoch": 2692} {"train_loss": -44.1418342590332, "global_step": 325791, "epoch": 2692} {"train_loss": -42.12563705444336, "global_step": 325792, "epoch": 2692} {"train_loss": -41.917701721191406, "global_step": 325793, "epoch": 2692} {"train_loss": -43.46382522583008, "global_step": 325794, "epoch": 2692} {"train_loss": -43.73863220214844, "global_step": 325795, "epoch": 2692} {"train_loss": -44.04812240600586, "global_step": 325796, "epoch": 2692} {"train_loss": -42.87407684326172, "global_step": 325797, "epoch": 2692} {"train_loss": -44.152828216552734, "global_step": 325798, "epoch": 2692} {"train_loss": -42.89138412475586, "global_step": 325799, "epoch": 2692} {"train_loss": -43.74196243286133, "global_step": 325800, "epoch": 2692} {"train_loss": -44.429840087890625, "global_step": 325801, "epoch": 2692} {"train_loss": -44.03904342651367, "global_step": 325802, "epoch": 2692} {"train_loss": -44.10719299316406, "global_step": 325803, "epoch": 2692} {"train_loss": -43.67570877075195, "global_step": 325804, "epoch": 2692} {"train_loss": -44.042640686035156, "global_step": 325805, "epoch": 2692} {"train_loss": -44.3904914855957, "global_step": 325806, "epoch": 2692} {"train_loss": -43.74104309082031, "global_step": 325807, "epoch": 2692} {"train_loss": -44.421913146972656, "global_step": 325808, "epoch": 2692} {"train_loss": -44.16355514526367, "global_step": 325809, "epoch": 2692} {"train_loss": -44.2189826965332, "global_step": 325810, "epoch": 2692} {"train_loss": -44.196197509765625, "global_step": 325811, "epoch": 2692} {"train_loss": -44.240203857421875, "global_step": 325812, "epoch": 2692} {"train_loss": -42.34515380859375, "global_step": 325813, "epoch": 2692} {"train_loss": -43.87238693237305, "global_step": 325814, "epoch": 2692} {"train_loss": -44.011558532714844, "global_step": 325815, "epoch": 2692} {"train_loss": -43.55320739746094, "global_step": 325816, "epoch": 2692} {"train_loss": -41.1745719909668, "global_step": 325817, "epoch": 2692} {"train_loss": -39.186588287353516, "global_step": 325818, "epoch": 2692} {"train_loss": -41.26986312866211, "global_step": 325819, "epoch": 2692} {"train_loss": -39.99401092529297, "global_step": 325820, "epoch": 2692} {"train_loss": -43.741146087646484, "global_step": 325821, "epoch": 2692} {"train_loss": -36.49406814575195, "global_step": 325822, "epoch": 2692} {"train_loss": -40.96125030517578, "global_step": 325823, "epoch": 2692} {"train_loss": -39.848976135253906, "global_step": 325824, "epoch": 2692} {"train_loss": -42.39703369140625, "global_step": 325825, "epoch": 2692} {"train_loss": -38.95121383666992, "global_step": 325826, "epoch": 2692} {"train_loss": -41.27419662475586, "global_step": 325827, "epoch": 2692} {"train_loss": -41.84366989135742, "global_step": 325828, "epoch": 2692} {"train_loss": -42.73011016845703, "global_step": 325829, "epoch": 2692} {"train_loss": -38.89278793334961, "global_step": 325830, "epoch": 2692} {"train_loss": -41.3228645324707, "global_step": 325831, "epoch": 2692} {"train_loss": -40.61648178100586, "global_step": 325832, "epoch": 2692} {"train_loss": -42.613616943359375, "global_step": 325833, "epoch": 2692} {"train_loss": -38.0853157043457, "global_step": 325834, "epoch": 2692} {"train_loss": -37.362159729003906, "global_step": 325835, "epoch": 2692} {"train_loss": -36.32975769042969, "global_step": 325836, "epoch": 2692} {"train_loss": -32.69012451171875, "global_step": 325837, "epoch": 2692} {"train_loss": -37.42067337036133, "global_step": 325838, "epoch": 2692} {"train_loss": -36.985130310058594, "global_step": 325839, "epoch": 2692} {"train_loss": -39.14898681640625, "global_step": 325840, "epoch": 2692} {"train_loss": -35.851898193359375, "global_step": 325841, "epoch": 2692} {"train_loss": -40.18842315673828, "global_step": 325842, "epoch": 2692} {"train_loss": -39.52654266357422, "global_step": 325843, "epoch": 2692} {"train_loss": -41.68134307861328, "global_step": 325844, "epoch": 2692} {"train_loss": -38.67141342163086, "global_step": 325845, "epoch": 2692} {"train_loss": -40.36198043823242, "global_step": 325846, "epoch": 2692} {"train_loss": -41.93632888793945, "global_step": 325847, "epoch": 2692} {"train_loss": -39.12797164916992, "global_step": 325848, "epoch": 2692} {"train_loss": -38.84577178955078, "global_step": 325849, "epoch": 2692} {"train_loss": -41.32949447631836, "global_step": 325850, "epoch": 2692} {"train_loss": -40.94442367553711, "global_step": 325851, "epoch": 2692} {"train_loss": -42.09934174718936, "global_step": 325852, "epoch": 2692, "val_loss": 3109254.25} {"train_loss": -41.718971252441406, "global_step": 325853, "epoch": 2693} {"train_loss": -42.269142150878906, "global_step": 325854, "epoch": 2693} {"train_loss": -42.80845642089844, "global_step": 325855, "epoch": 2693} {"train_loss": -41.84016799926758, "global_step": 325856, "epoch": 2693} {"train_loss": -41.04075241088867, "global_step": 325857, "epoch": 2693} {"train_loss": -38.745155334472656, "global_step": 325858, "epoch": 2693} {"train_loss": -41.14321517944336, "global_step": 325859, "epoch": 2693} {"train_loss": -41.72479248046875, "global_step": 325860, "epoch": 2693} {"train_loss": -41.21415328979492, "global_step": 325861, "epoch": 2693} {"train_loss": -41.7570686340332, "global_step": 325862, "epoch": 2693} {"train_loss": -41.835487365722656, "global_step": 325863, "epoch": 2693} {"train_loss": -40.88655471801758, "global_step": 325864, "epoch": 2693} {"train_loss": -42.151275634765625, "global_step": 325865, "epoch": 2693} {"train_loss": -41.98539733886719, "global_step": 325866, "epoch": 2693} {"train_loss": -42.419952392578125, "global_step": 325867, "epoch": 2693} {"train_loss": -41.65959548950195, "global_step": 325868, "epoch": 2693} {"train_loss": -41.74178695678711, "global_step": 325869, "epoch": 2693} {"train_loss": -40.186073303222656, "global_step": 325870, "epoch": 2693} {"train_loss": -41.805023193359375, "global_step": 325871, "epoch": 2693} {"train_loss": -42.004554748535156, "global_step": 325872, "epoch": 2693} {"train_loss": -41.60187530517578, "global_step": 325873, "epoch": 2693} {"train_loss": -41.66141891479492, "global_step": 325874, "epoch": 2693} {"train_loss": -41.768943786621094, "global_step": 325875, "epoch": 2693} {"train_loss": -39.77334213256836, "global_step": 325876, "epoch": 2693} {"train_loss": -41.14095687866211, "global_step": 325877, "epoch": 2693} {"train_loss": -37.89920425415039, "global_step": 325878, "epoch": 2693} {"train_loss": -42.41737365722656, "global_step": 325879, "epoch": 2693} {"train_loss": -41.283660888671875, "global_step": 325880, "epoch": 2693} {"train_loss": -42.12862777709961, "global_step": 325881, "epoch": 2693} {"train_loss": -43.234004974365234, "global_step": 325882, "epoch": 2693} {"train_loss": -39.96318435668945, "global_step": 325883, "epoch": 2693} {"train_loss": -42.90778732299805, "global_step": 325884, "epoch": 2693} {"train_loss": -41.67570114135742, "global_step": 325885, "epoch": 2693} {"train_loss": -40.98576736450195, "global_step": 325886, "epoch": 2693} {"train_loss": -41.35645294189453, "global_step": 325887, "epoch": 2693} {"train_loss": -43.09307861328125, "global_step": 325888, "epoch": 2693} {"train_loss": -40.75433349609375, "global_step": 325889, "epoch": 2693} {"train_loss": -42.73246383666992, "global_step": 325890, "epoch": 2693} {"train_loss": -41.32877731323242, "global_step": 325891, "epoch": 2693} {"train_loss": -37.24174118041992, "global_step": 325892, "epoch": 2693} {"train_loss": -42.3390998840332, "global_step": 325893, "epoch": 2693} {"train_loss": -41.882171630859375, "global_step": 325894, "epoch": 2693} {"train_loss": -40.07120895385742, "global_step": 325895, "epoch": 2693} {"train_loss": -42.81696701049805, "global_step": 325896, "epoch": 2693} {"train_loss": -42.10840606689453, "global_step": 325897, "epoch": 2693} {"train_loss": -43.25950241088867, "global_step": 325898, "epoch": 2693} {"train_loss": -40.966121673583984, "global_step": 325899, "epoch": 2693} {"train_loss": -42.320526123046875, "global_step": 325900, "epoch": 2693} {"train_loss": -42.563560485839844, "global_step": 325901, "epoch": 2693} {"train_loss": -42.76585006713867, "global_step": 325902, "epoch": 2693} {"train_loss": -41.5295295715332, "global_step": 325903, "epoch": 2693} {"train_loss": -42.1095085144043, "global_step": 325904, "epoch": 2693} {"train_loss": -42.759857177734375, "global_step": 325905, "epoch": 2693} {"train_loss": -42.10943603515625, "global_step": 325906, "epoch": 2693} {"train_loss": -41.87788772583008, "global_step": 325907, "epoch": 2693} {"train_loss": -42.937957763671875, "global_step": 325908, "epoch": 2693} {"train_loss": -42.560028076171875, "global_step": 325909, "epoch": 2693} {"train_loss": -42.59193801879883, "global_step": 325910, "epoch": 2693} {"train_loss": -42.31954574584961, "global_step": 325911, "epoch": 2693} {"train_loss": -40.98749923706055, "global_step": 325912, "epoch": 2693} {"train_loss": -41.058387756347656, "global_step": 325913, "epoch": 2693} {"train_loss": -41.190818786621094, "global_step": 325914, "epoch": 2693} {"train_loss": -43.321014404296875, "global_step": 325915, "epoch": 2693} {"train_loss": -42.30440902709961, "global_step": 325916, "epoch": 2693} {"train_loss": -43.321510314941406, "global_step": 325917, "epoch": 2693} {"train_loss": -42.963130950927734, "global_step": 325918, "epoch": 2693} {"train_loss": -43.302669525146484, "global_step": 325919, "epoch": 2693} {"train_loss": -42.82046127319336, "global_step": 325920, "epoch": 2693} {"train_loss": -42.03310012817383, "global_step": 325921, "epoch": 2693} {"train_loss": -41.993343353271484, "global_step": 325922, "epoch": 2693} {"train_loss": -42.81343078613281, "global_step": 325923, "epoch": 2693} {"train_loss": -43.24470138549805, "global_step": 325924, "epoch": 2693} {"train_loss": -41.925025939941406, "global_step": 325925, "epoch": 2693} {"train_loss": -41.37968063354492, "global_step": 325926, "epoch": 2693} {"train_loss": -42.04487991333008, "global_step": 325927, "epoch": 2693} {"train_loss": -42.342464447021484, "global_step": 325928, "epoch": 2693} {"train_loss": -42.65407943725586, "global_step": 325929, "epoch": 2693} {"train_loss": -43.11433792114258, "global_step": 325930, "epoch": 2693} {"train_loss": -43.05571365356445, "global_step": 325931, "epoch": 2693} {"train_loss": -43.295440673828125, "global_step": 325932, "epoch": 2693} {"train_loss": -42.85026550292969, "global_step": 325933, "epoch": 2693} {"train_loss": -43.5289421081543, "global_step": 325934, "epoch": 2693} {"train_loss": -43.4134521484375, "global_step": 325935, "epoch": 2693} {"train_loss": -43.41889572143555, "global_step": 325936, "epoch": 2693} {"train_loss": -43.10908508300781, "global_step": 325937, "epoch": 2693} {"train_loss": -43.48421859741211, "global_step": 325938, "epoch": 2693} {"train_loss": -43.85144805908203, "global_step": 325939, "epoch": 2693} {"train_loss": -43.595069885253906, "global_step": 325940, "epoch": 2693} {"train_loss": -42.952091217041016, "global_step": 325941, "epoch": 2693} {"train_loss": -42.72687530517578, "global_step": 325942, "epoch": 2693} {"train_loss": -43.16584396362305, "global_step": 325943, "epoch": 2693} {"train_loss": -43.66132354736328, "global_step": 325944, "epoch": 2693} {"train_loss": -43.82304000854492, "global_step": 325945, "epoch": 2693} {"train_loss": -43.85509490966797, "global_step": 325946, "epoch": 2693} {"train_loss": -43.04154968261719, "global_step": 325947, "epoch": 2693} {"train_loss": -43.10353469848633, "global_step": 325948, "epoch": 2693} {"train_loss": -43.759986877441406, "global_step": 325949, "epoch": 2693} {"train_loss": -43.86784744262695, "global_step": 325950, "epoch": 2693} {"train_loss": -43.722877502441406, "global_step": 325951, "epoch": 2693} {"train_loss": -43.565650939941406, "global_step": 325952, "epoch": 2693} {"train_loss": -43.293514251708984, "global_step": 325953, "epoch": 2693} {"train_loss": -43.87546920776367, "global_step": 325954, "epoch": 2693} {"train_loss": -43.956298828125, "global_step": 325955, "epoch": 2693} {"train_loss": -43.11593246459961, "global_step": 325956, "epoch": 2693} {"train_loss": -43.74026107788086, "global_step": 325957, "epoch": 2693} {"train_loss": -42.80789566040039, "global_step": 325958, "epoch": 2693} {"train_loss": -44.18458557128906, "global_step": 325959, "epoch": 2693} {"train_loss": -43.653255462646484, "global_step": 325960, "epoch": 2693} {"train_loss": -43.22174072265625, "global_step": 325961, "epoch": 2693} {"train_loss": -41.81503677368164, "global_step": 325962, "epoch": 2693} {"train_loss": -43.118682861328125, "global_step": 325963, "epoch": 2693} {"train_loss": -43.71577835083008, "global_step": 325964, "epoch": 2693} {"train_loss": -43.540809631347656, "global_step": 325965, "epoch": 2693} {"train_loss": -43.68339538574219, "global_step": 325966, "epoch": 2693} {"train_loss": -42.969425201416016, "global_step": 325967, "epoch": 2693} {"train_loss": -42.93935012817383, "global_step": 325968, "epoch": 2693} {"train_loss": -43.14651107788086, "global_step": 325969, "epoch": 2693} {"train_loss": -43.81427764892578, "global_step": 325970, "epoch": 2693} {"train_loss": -43.34908676147461, "global_step": 325971, "epoch": 2693} {"train_loss": -43.60908126831055, "global_step": 325972, "epoch": 2693} {"train_loss": -42.381902489780394, "global_step": 325973, "epoch": 2693, "val_loss": 2890524.75} {"train_loss": -43.252593994140625, "global_step": 325974, "epoch": 2694} {"train_loss": -43.52478790283203, "global_step": 325975, "epoch": 2694} {"train_loss": -43.76986312866211, "global_step": 325976, "epoch": 2694} {"train_loss": -43.182899475097656, "global_step": 325977, "epoch": 2694} {"train_loss": -43.89141082763672, "global_step": 325978, "epoch": 2694} {"train_loss": -43.074462890625, "global_step": 325979, "epoch": 2694} {"train_loss": -42.4724006652832, "global_step": 325980, "epoch": 2694} {"train_loss": -42.14801788330078, "global_step": 325981, "epoch": 2694} {"train_loss": -42.31691360473633, "global_step": 325982, "epoch": 2694} {"train_loss": -42.71867370605469, "global_step": 325983, "epoch": 2694} {"train_loss": -42.70262145996094, "global_step": 325984, "epoch": 2694} {"train_loss": -42.70037078857422, "global_step": 325985, "epoch": 2694} {"train_loss": -43.20633316040039, "global_step": 325986, "epoch": 2694} {"train_loss": -43.26411056518555, "global_step": 325987, "epoch": 2694} {"train_loss": -42.724517822265625, "global_step": 325988, "epoch": 2694} {"train_loss": -41.375335693359375, "global_step": 325989, "epoch": 2694} {"train_loss": -36.017330169677734, "global_step": 325990, "epoch": 2694} {"train_loss": -38.806488037109375, "global_step": 325991, "epoch": 2694} {"train_loss": -41.72740173339844, "global_step": 325992, "epoch": 2694} {"train_loss": -42.48801040649414, "global_step": 325993, "epoch": 2694} {"train_loss": -40.25787353515625, "global_step": 325994, "epoch": 2694} {"train_loss": -37.6112060546875, "global_step": 325995, "epoch": 2694} {"train_loss": -40.09922409057617, "global_step": 325996, "epoch": 2694} {"train_loss": -35.716217041015625, "global_step": 325997, "epoch": 2694} {"train_loss": -36.28191375732422, "global_step": 325998, "epoch": 2694} {"train_loss": -41.69350051879883, "global_step": 325999, "epoch": 2694} {"train_loss": -35.18380355834961, "global_step": 326000, "epoch": 2694} {"train_loss": -41.21513748168945, "global_step": 326001, "epoch": 2694} {"train_loss": -38.654483795166016, "global_step": 326002, "epoch": 2694} {"train_loss": -38.6350212097168, "global_step": 326003, "epoch": 2694} {"train_loss": -41.8343620300293, "global_step": 326004, "epoch": 2694} {"train_loss": -38.023658752441406, "global_step": 326005, "epoch": 2694} {"train_loss": -42.31620788574219, "global_step": 326006, "epoch": 2694} {"train_loss": -39.6936149597168, "global_step": 326007, "epoch": 2694} {"train_loss": -41.96200180053711, "global_step": 326008, "epoch": 2694} {"train_loss": -41.25838851928711, "global_step": 326009, "epoch": 2694} {"train_loss": -40.59141159057617, "global_step": 326010, "epoch": 2694} {"train_loss": -41.2371826171875, "global_step": 326011, "epoch": 2694} {"train_loss": -42.51628112792969, "global_step": 326012, "epoch": 2694} {"train_loss": -40.946842193603516, "global_step": 326013, "epoch": 2694} {"train_loss": -42.098262786865234, "global_step": 326014, "epoch": 2694} {"train_loss": -40.79425048828125, "global_step": 326015, "epoch": 2694} {"train_loss": -42.881160736083984, "global_step": 326016, "epoch": 2694} {"train_loss": -41.81086349487305, "global_step": 326017, "epoch": 2694} {"train_loss": -42.27283477783203, "global_step": 326018, "epoch": 2694} {"train_loss": -42.288997650146484, "global_step": 326019, "epoch": 2694} {"train_loss": -41.812103271484375, "global_step": 326020, "epoch": 2694} {"train_loss": -42.29572296142578, "global_step": 326021, "epoch": 2694} {"train_loss": -42.431026458740234, "global_step": 326022, "epoch": 2694} {"train_loss": -43.01685333251953, "global_step": 326023, "epoch": 2694} {"train_loss": -42.29282760620117, "global_step": 326024, "epoch": 2694} {"train_loss": -42.7629508972168, "global_step": 326025, "epoch": 2694} {"train_loss": -42.33452224731445, "global_step": 326026, "epoch": 2694} {"train_loss": -39.948787689208984, "global_step": 326027, "epoch": 2694} {"train_loss": -42.855228424072266, "global_step": 326028, "epoch": 2694} {"train_loss": -43.26594161987305, "global_step": 326029, "epoch": 2694} {"train_loss": -43.34585189819336, "global_step": 326030, "epoch": 2694} {"train_loss": -42.762325286865234, "global_step": 326031, "epoch": 2694} {"train_loss": -43.204280853271484, "global_step": 326032, "epoch": 2694} {"train_loss": -43.32491683959961, "global_step": 326033, "epoch": 2694} {"train_loss": -43.05115509033203, "global_step": 326034, "epoch": 2694} {"train_loss": -41.59674835205078, "global_step": 326035, "epoch": 2694} {"train_loss": -42.543190002441406, "global_step": 326036, "epoch": 2694} {"train_loss": -42.762855529785156, "global_step": 326037, "epoch": 2694} {"train_loss": -43.129600524902344, "global_step": 326038, "epoch": 2694} {"train_loss": -43.42390823364258, "global_step": 326039, "epoch": 2694} {"train_loss": -43.11769485473633, "global_step": 326040, "epoch": 2694} {"train_loss": -43.58184814453125, "global_step": 326041, "epoch": 2694} {"train_loss": -43.377933502197266, "global_step": 326042, "epoch": 2694} {"train_loss": -43.68052291870117, "global_step": 326043, "epoch": 2694} {"train_loss": -43.21900177001953, "global_step": 326044, "epoch": 2694} {"train_loss": -42.347938537597656, "global_step": 326045, "epoch": 2694} {"train_loss": -43.4954833984375, "global_step": 326046, "epoch": 2694} {"train_loss": -43.969642639160156, "global_step": 326047, "epoch": 2694} {"train_loss": -43.7841682434082, "global_step": 326048, "epoch": 2694} {"train_loss": -43.59025955200195, "global_step": 326049, "epoch": 2694} {"train_loss": -43.4478874206543, "global_step": 326050, "epoch": 2694} {"train_loss": -43.63520050048828, "global_step": 326051, "epoch": 2694} {"train_loss": -43.41469192504883, "global_step": 326052, "epoch": 2694} {"train_loss": -43.11737060546875, "global_step": 326053, "epoch": 2694} {"train_loss": -43.62970733642578, "global_step": 326054, "epoch": 2694} {"train_loss": -43.42513656616211, "global_step": 326055, "epoch": 2694} {"train_loss": -43.99363327026367, "global_step": 326056, "epoch": 2694} {"train_loss": -43.520103454589844, "global_step": 326057, "epoch": 2694} {"train_loss": -43.60124206542969, "global_step": 326058, "epoch": 2694} {"train_loss": -43.662757873535156, "global_step": 326059, "epoch": 2694} {"train_loss": -43.93912887573242, "global_step": 326060, "epoch": 2694} {"train_loss": -43.60236358642578, "global_step": 326061, "epoch": 2694} {"train_loss": -43.659698486328125, "global_step": 326062, "epoch": 2694} {"train_loss": -43.8275146484375, "global_step": 326063, "epoch": 2694} {"train_loss": -43.46662139892578, "global_step": 326064, "epoch": 2694} {"train_loss": -43.405269622802734, "global_step": 326065, "epoch": 2694} {"train_loss": -43.33051681518555, "global_step": 326066, "epoch": 2694} {"train_loss": -43.390926361083984, "global_step": 326067, "epoch": 2694} {"train_loss": -43.926517486572266, "global_step": 326068, "epoch": 2694} {"train_loss": -43.60236358642578, "global_step": 326069, "epoch": 2694} {"train_loss": -43.60083770751953, "global_step": 326070, "epoch": 2694} {"train_loss": -42.17698669433594, "global_step": 326071, "epoch": 2694} {"train_loss": -43.78608703613281, "global_step": 326072, "epoch": 2694} {"train_loss": -43.46714401245117, "global_step": 326073, "epoch": 2694} {"train_loss": -44.37775802612305, "global_step": 326074, "epoch": 2694} {"train_loss": -44.17725372314453, "global_step": 326075, "epoch": 2694} {"train_loss": -43.40053939819336, "global_step": 326076, "epoch": 2694} {"train_loss": -43.79266357421875, "global_step": 326077, "epoch": 2694} {"train_loss": -43.90003204345703, "global_step": 326078, "epoch": 2694} {"train_loss": -43.46006393432617, "global_step": 326079, "epoch": 2694} {"train_loss": -44.16315841674805, "global_step": 326080, "epoch": 2694} {"train_loss": -44.08146667480469, "global_step": 326081, "epoch": 2694} {"train_loss": -44.139583587646484, "global_step": 326082, "epoch": 2694} {"train_loss": -44.077728271484375, "global_step": 326083, "epoch": 2694} {"train_loss": -43.61867904663086, "global_step": 326084, "epoch": 2694} {"train_loss": -43.62552261352539, "global_step": 326085, "epoch": 2694} {"train_loss": -42.98926544189453, "global_step": 326086, "epoch": 2694} {"train_loss": -41.04200744628906, "global_step": 326087, "epoch": 2694} {"train_loss": -42.4556884765625, "global_step": 326088, "epoch": 2694} {"train_loss": -42.731109619140625, "global_step": 326089, "epoch": 2694} {"train_loss": -42.70192337036133, "global_step": 326090, "epoch": 2694} {"train_loss": -43.9586067199707, "global_step": 326091, "epoch": 2694} {"train_loss": -44.29711151123047, "global_step": 326092, "epoch": 2694} {"train_loss": -44.27657699584961, "global_step": 326093, "epoch": 2694} {"train_loss": -42.474451049300264, "global_step": 326094, "epoch": 2694, "val_loss": 2832364.0} {"train_loss": -43.160945892333984, "global_step": 326095, "epoch": 2695} {"train_loss": -43.49668502807617, "global_step": 326096, "epoch": 2695} {"train_loss": -42.83590316772461, "global_step": 326097, "epoch": 2695} {"train_loss": -43.4771728515625, "global_step": 326098, "epoch": 2695} {"train_loss": -42.74373245239258, "global_step": 326099, "epoch": 2695} {"train_loss": -40.23690414428711, "global_step": 326100, "epoch": 2695} {"train_loss": -41.22425079345703, "global_step": 326101, "epoch": 2695} {"train_loss": -43.2698860168457, "global_step": 326102, "epoch": 2695} {"train_loss": -43.379940032958984, "global_step": 326103, "epoch": 2695} {"train_loss": -41.405818939208984, "global_step": 326104, "epoch": 2695} {"train_loss": -42.82198715209961, "global_step": 326105, "epoch": 2695} {"train_loss": -43.504112243652344, "global_step": 326106, "epoch": 2695} {"train_loss": -42.812232971191406, "global_step": 326107, "epoch": 2695} {"train_loss": -42.0024528503418, "global_step": 326108, "epoch": 2695} {"train_loss": -39.96499252319336, "global_step": 326109, "epoch": 2695} {"train_loss": -39.24508285522461, "global_step": 326110, "epoch": 2695} {"train_loss": -43.36357498168945, "global_step": 326111, "epoch": 2695} {"train_loss": -43.54774856567383, "global_step": 326112, "epoch": 2695} {"train_loss": -42.353553771972656, "global_step": 326113, "epoch": 2695} {"train_loss": -42.43658447265625, "global_step": 326114, "epoch": 2695} {"train_loss": -42.1820182800293, "global_step": 326115, "epoch": 2695} {"train_loss": -43.27582550048828, "global_step": 326116, "epoch": 2695} {"train_loss": -43.1478271484375, "global_step": 326117, "epoch": 2695} {"train_loss": -39.73507308959961, "global_step": 326118, "epoch": 2695} {"train_loss": -42.656524658203125, "global_step": 326119, "epoch": 2695} {"train_loss": -43.24763107299805, "global_step": 326120, "epoch": 2695} {"train_loss": -43.49396896362305, "global_step": 326121, "epoch": 2695} {"train_loss": -42.41717529296875, "global_step": 326122, "epoch": 2695} {"train_loss": -43.4644889831543, "global_step": 326123, "epoch": 2695} {"train_loss": -43.142452239990234, "global_step": 326124, "epoch": 2695} {"train_loss": -43.32949447631836, "global_step": 326125, "epoch": 2695} {"train_loss": -43.5595817565918, "global_step": 326126, "epoch": 2695} {"train_loss": -43.61646270751953, "global_step": 326127, "epoch": 2695} {"train_loss": -43.52400588989258, "global_step": 326128, "epoch": 2695} {"train_loss": -42.97984313964844, "global_step": 326129, "epoch": 2695} {"train_loss": -43.804542541503906, "global_step": 326130, "epoch": 2695} {"train_loss": -43.34066390991211, "global_step": 326131, "epoch": 2695} {"train_loss": -41.4549674987793, "global_step": 326132, "epoch": 2695} {"train_loss": -39.96863555908203, "global_step": 326133, "epoch": 2695} {"train_loss": -40.49170684814453, "global_step": 326134, "epoch": 2695} {"train_loss": -43.14665222167969, "global_step": 326135, "epoch": 2695} {"train_loss": -43.88985061645508, "global_step": 326136, "epoch": 2695} {"train_loss": -43.46718978881836, "global_step": 326137, "epoch": 2695} {"train_loss": -43.71627426147461, "global_step": 326138, "epoch": 2695} {"train_loss": -39.833560943603516, "global_step": 326139, "epoch": 2695} {"train_loss": -43.4176139831543, "global_step": 326140, "epoch": 2695} {"train_loss": -43.6353759765625, "global_step": 326141, "epoch": 2695} {"train_loss": -43.55463790893555, "global_step": 326142, "epoch": 2695} {"train_loss": -43.12372970581055, "global_step": 326143, "epoch": 2695} {"train_loss": -43.37263107299805, "global_step": 326144, "epoch": 2695} {"train_loss": -43.73115921020508, "global_step": 326145, "epoch": 2695} {"train_loss": -43.3551139831543, "global_step": 326146, "epoch": 2695} {"train_loss": -42.897857666015625, "global_step": 326147, "epoch": 2695} {"train_loss": -42.229217529296875, "global_step": 326148, "epoch": 2695} {"train_loss": -43.39695358276367, "global_step": 326149, "epoch": 2695} {"train_loss": -41.77183151245117, "global_step": 326150, "epoch": 2695} {"train_loss": -43.03629684448242, "global_step": 326151, "epoch": 2695} {"train_loss": -42.85184097290039, "global_step": 326152, "epoch": 2695} {"train_loss": -43.01727294921875, "global_step": 326153, "epoch": 2695} {"train_loss": -43.6026725769043, "global_step": 326154, "epoch": 2695} {"train_loss": -43.9381217956543, "global_step": 326155, "epoch": 2695} {"train_loss": -42.59381866455078, "global_step": 326156, "epoch": 2695} {"train_loss": -42.841346740722656, "global_step": 326157, "epoch": 2695} {"train_loss": -43.088783264160156, "global_step": 326158, "epoch": 2695} {"train_loss": -43.92576599121094, "global_step": 326159, "epoch": 2695} {"train_loss": -43.179901123046875, "global_step": 326160, "epoch": 2695} {"train_loss": -43.1984748840332, "global_step": 326161, "epoch": 2695} {"train_loss": -41.55543518066406, "global_step": 326162, "epoch": 2695} {"train_loss": -43.03445816040039, "global_step": 326163, "epoch": 2695} {"train_loss": -40.355220794677734, "global_step": 326164, "epoch": 2695} {"train_loss": -40.51682662963867, "global_step": 326165, "epoch": 2695} {"train_loss": -43.52822494506836, "global_step": 326166, "epoch": 2695} {"train_loss": -43.5709228515625, "global_step": 326167, "epoch": 2695} {"train_loss": -43.31414031982422, "global_step": 326168, "epoch": 2695} {"train_loss": -41.57839584350586, "global_step": 326169, "epoch": 2695} {"train_loss": -43.42706298828125, "global_step": 326170, "epoch": 2695} {"train_loss": -43.5326042175293, "global_step": 326171, "epoch": 2695} {"train_loss": -43.55678176879883, "global_step": 326172, "epoch": 2695} {"train_loss": -40.934722900390625, "global_step": 326173, "epoch": 2695} {"train_loss": -42.4561882019043, "global_step": 326174, "epoch": 2695} {"train_loss": -34.632080078125, "global_step": 326175, "epoch": 2695} {"train_loss": -41.88285827636719, "global_step": 326176, "epoch": 2695} {"train_loss": -42.71382522583008, "global_step": 326177, "epoch": 2695} {"train_loss": -41.96867752075195, "global_step": 326178, "epoch": 2695} {"train_loss": -39.40362548828125, "global_step": 326179, "epoch": 2695} {"train_loss": -42.566650390625, "global_step": 326180, "epoch": 2695} {"train_loss": -41.927490234375, "global_step": 326181, "epoch": 2695} {"train_loss": -40.31022644042969, "global_step": 326182, "epoch": 2695} {"train_loss": -37.047515869140625, "global_step": 326183, "epoch": 2695} {"train_loss": -39.1191520690918, "global_step": 326184, "epoch": 2695} {"train_loss": -27.314115524291992, "global_step": 326185, "epoch": 2695} {"train_loss": -40.36629867553711, "global_step": 326186, "epoch": 2695} {"train_loss": -40.1320686340332, "global_step": 326187, "epoch": 2695} {"train_loss": -37.23554611206055, "global_step": 326188, "epoch": 2695} {"train_loss": -40.782535552978516, "global_step": 326189, "epoch": 2695} {"train_loss": -38.91499710083008, "global_step": 326190, "epoch": 2695} {"train_loss": -42.15972900390625, "global_step": 326191, "epoch": 2695} {"train_loss": -41.65770721435547, "global_step": 326192, "epoch": 2695} {"train_loss": -41.7480354309082, "global_step": 326193, "epoch": 2695} {"train_loss": -42.00864791870117, "global_step": 326194, "epoch": 2695} {"train_loss": -20.05156898498535, "global_step": 326195, "epoch": 2695} {"train_loss": -42.07477951049805, "global_step": 326196, "epoch": 2695} {"train_loss": -39.09779357910156, "global_step": 326197, "epoch": 2695} {"train_loss": -41.68874740600586, "global_step": 326198, "epoch": 2695} {"train_loss": -41.75123977661133, "global_step": 326199, "epoch": 2695} {"train_loss": -41.907283782958984, "global_step": 326200, "epoch": 2695} {"train_loss": -36.38043212890625, "global_step": 326201, "epoch": 2695} {"train_loss": -37.5626106262207, "global_step": 326202, "epoch": 2695} {"train_loss": -37.83028793334961, "global_step": 326203, "epoch": 2695} {"train_loss": -38.181251525878906, "global_step": 326204, "epoch": 2695} {"train_loss": -30.733509063720703, "global_step": 326205, "epoch": 2695} {"train_loss": -39.87935256958008, "global_step": 326206, "epoch": 2695} {"train_loss": -38.76266098022461, "global_step": 326207, "epoch": 2695} {"train_loss": -40.568355560302734, "global_step": 326208, "epoch": 2695} {"train_loss": -41.00299835205078, "global_step": 326209, "epoch": 2695} {"train_loss": -38.152828216552734, "global_step": 326210, "epoch": 2695} {"train_loss": -32.629547119140625, "global_step": 326211, "epoch": 2695} {"train_loss": -36.906951904296875, "global_step": 326212, "epoch": 2695} {"train_loss": -37.5284538269043, "global_step": 326213, "epoch": 2695} {"train_loss": -37.54698944091797, "global_step": 326214, "epoch": 2695} {"train_loss": -41.28027807188428, "global_step": 326215, "epoch": 2695, "val_loss": 2969088.0} {"train_loss": -39.2199592590332, "global_step": 326216, "epoch": 2696} {"train_loss": -39.05790328979492, "global_step": 326217, "epoch": 2696} {"train_loss": -40.069332122802734, "global_step": 326218, "epoch": 2696} {"train_loss": -39.406490325927734, "global_step": 326219, "epoch": 2696} {"train_loss": -40.48170852661133, "global_step": 326220, "epoch": 2696} {"train_loss": -39.56012725830078, "global_step": 326221, "epoch": 2696} {"train_loss": -39.1385383605957, "global_step": 326222, "epoch": 2696} {"train_loss": -40.96772003173828, "global_step": 326223, "epoch": 2696} {"train_loss": -40.45948028564453, "global_step": 326224, "epoch": 2696} {"train_loss": -41.18832778930664, "global_step": 326225, "epoch": 2696} {"train_loss": -39.60244369506836, "global_step": 326226, "epoch": 2696} {"train_loss": -36.07243728637695, "global_step": 326227, "epoch": 2696} {"train_loss": -41.83103561401367, "global_step": 326228, "epoch": 2696} {"train_loss": -41.7728385925293, "global_step": 326229, "epoch": 2696} {"train_loss": -40.801639556884766, "global_step": 326230, "epoch": 2696} {"train_loss": -41.0389289855957, "global_step": 326231, "epoch": 2696} {"train_loss": -40.45042037963867, "global_step": 326232, "epoch": 2696} {"train_loss": -40.64216995239258, "global_step": 326233, "epoch": 2696} {"train_loss": -40.44240188598633, "global_step": 326234, "epoch": 2696} {"train_loss": -37.02070617675781, "global_step": 326235, "epoch": 2696} {"train_loss": -41.400325775146484, "global_step": 326236, "epoch": 2696} {"train_loss": -41.8805046081543, "global_step": 326237, "epoch": 2696} {"train_loss": -41.09709548950195, "global_step": 326238, "epoch": 2696} {"train_loss": -41.074459075927734, "global_step": 326239, "epoch": 2696} {"train_loss": -41.73111343383789, "global_step": 326240, "epoch": 2696} {"train_loss": -41.705013275146484, "global_step": 326241, "epoch": 2696} {"train_loss": -37.86149215698242, "global_step": 326242, "epoch": 2696} {"train_loss": -39.922889709472656, "global_step": 326243, "epoch": 2696} {"train_loss": -41.53610610961914, "global_step": 326244, "epoch": 2696} {"train_loss": -41.4443244934082, "global_step": 326245, "epoch": 2696} {"train_loss": -40.67460250854492, "global_step": 326246, "epoch": 2696} {"train_loss": -41.855892181396484, "global_step": 326247, "epoch": 2696} {"train_loss": -42.03103256225586, "global_step": 326248, "epoch": 2696} {"train_loss": -41.56574630737305, "global_step": 326249, "epoch": 2696} {"train_loss": -41.82050323486328, "global_step": 326250, "epoch": 2696} {"train_loss": -41.0979118347168, "global_step": 326251, "epoch": 2696} {"train_loss": -41.77915954589844, "global_step": 326252, "epoch": 2696} {"train_loss": -42.32820510864258, "global_step": 326253, "epoch": 2696} {"train_loss": -41.702667236328125, "global_step": 326254, "epoch": 2696} {"train_loss": -34.111572265625, "global_step": 326255, "epoch": 2696} {"train_loss": -42.13722229003906, "global_step": 326256, "epoch": 2696} {"train_loss": -41.51678466796875, "global_step": 326257, "epoch": 2696} {"train_loss": -41.149085998535156, "global_step": 326258, "epoch": 2696} {"train_loss": -41.61277770996094, "global_step": 326259, "epoch": 2696} {"train_loss": -40.416866302490234, "global_step": 326260, "epoch": 2696} {"train_loss": -41.86677169799805, "global_step": 326261, "epoch": 2696} {"train_loss": -41.327857971191406, "global_step": 326262, "epoch": 2696} {"train_loss": -37.12175369262695, "global_step": 326263, "epoch": 2696} {"train_loss": -41.5463981628418, "global_step": 326264, "epoch": 2696} {"train_loss": -41.642459869384766, "global_step": 326265, "epoch": 2696} {"train_loss": -41.33991241455078, "global_step": 326266, "epoch": 2696} {"train_loss": -41.07223129272461, "global_step": 326267, "epoch": 2696} {"train_loss": -40.95608139038086, "global_step": 326268, "epoch": 2696} {"train_loss": -42.3074951171875, "global_step": 326269, "epoch": 2696} {"train_loss": -40.1192626953125, "global_step": 326270, "epoch": 2696} {"train_loss": -41.648529052734375, "global_step": 326271, "epoch": 2696} {"train_loss": -41.43206024169922, "global_step": 326272, "epoch": 2696} {"train_loss": -40.56783676147461, "global_step": 326273, "epoch": 2696} {"train_loss": -41.727630615234375, "global_step": 326274, "epoch": 2696} {"train_loss": -42.09125900268555, "global_step": 326275, "epoch": 2696} {"train_loss": -41.9101676940918, "global_step": 326276, "epoch": 2696} {"train_loss": -42.35213088989258, "global_step": 326277, "epoch": 2696} {"train_loss": -41.23964309692383, "global_step": 326278, "epoch": 2696} {"train_loss": -41.19350814819336, "global_step": 326279, "epoch": 2696} {"train_loss": -42.188880920410156, "global_step": 326280, "epoch": 2696} {"train_loss": -42.205989837646484, "global_step": 326281, "epoch": 2696} {"train_loss": -40.97719955444336, "global_step": 326282, "epoch": 2696} {"train_loss": -42.481441497802734, "global_step": 326283, "epoch": 2696} {"train_loss": -41.871646881103516, "global_step": 326284, "epoch": 2696} {"train_loss": -41.18496322631836, "global_step": 326285, "epoch": 2696} {"train_loss": -41.79219055175781, "global_step": 326286, "epoch": 2696} {"train_loss": -42.2500114440918, "global_step": 326287, "epoch": 2696} {"train_loss": -41.722835540771484, "global_step": 326288, "epoch": 2696} {"train_loss": -37.9551887512207, "global_step": 326289, "epoch": 2696} {"train_loss": -42.712982177734375, "global_step": 326290, "epoch": 2696} {"train_loss": -41.6456413269043, "global_step": 326291, "epoch": 2696} {"train_loss": -41.587379455566406, "global_step": 326292, "epoch": 2696} {"train_loss": -42.68782424926758, "global_step": 326293, "epoch": 2696} {"train_loss": -41.076141357421875, "global_step": 326294, "epoch": 2696} {"train_loss": -42.33366394042969, "global_step": 326295, "epoch": 2696} {"train_loss": -41.45982360839844, "global_step": 326296, "epoch": 2696} {"train_loss": -41.3620719909668, "global_step": 326297, "epoch": 2696} {"train_loss": -41.772918701171875, "global_step": 326298, "epoch": 2696} {"train_loss": -41.90398025512695, "global_step": 326299, "epoch": 2696} {"train_loss": -42.21137619018555, "global_step": 326300, "epoch": 2696} {"train_loss": -42.97507858276367, "global_step": 326301, "epoch": 2696} {"train_loss": -42.283721923828125, "global_step": 326302, "epoch": 2696} {"train_loss": -42.1030158996582, "global_step": 326303, "epoch": 2696} {"train_loss": -42.85233688354492, "global_step": 326304, "epoch": 2696} {"train_loss": -41.974063873291016, "global_step": 326305, "epoch": 2696} {"train_loss": -42.750221252441406, "global_step": 326306, "epoch": 2696} {"train_loss": -42.7270393371582, "global_step": 326307, "epoch": 2696} {"train_loss": -40.98394012451172, "global_step": 326308, "epoch": 2696} {"train_loss": -43.071388244628906, "global_step": 326309, "epoch": 2696} {"train_loss": -42.89361572265625, "global_step": 326310, "epoch": 2696} {"train_loss": -43.01522445678711, "global_step": 326311, "epoch": 2696} {"train_loss": -40.99111557006836, "global_step": 326312, "epoch": 2696} {"train_loss": -41.373653411865234, "global_step": 326313, "epoch": 2696} {"train_loss": -41.26383590698242, "global_step": 326314, "epoch": 2696} {"train_loss": -42.570858001708984, "global_step": 326315, "epoch": 2696} {"train_loss": -41.44794845581055, "global_step": 326316, "epoch": 2696} {"train_loss": -41.90367889404297, "global_step": 326317, "epoch": 2696} {"train_loss": -41.498531341552734, "global_step": 326318, "epoch": 2696} {"train_loss": -42.16428756713867, "global_step": 326319, "epoch": 2696} {"train_loss": -41.80622863769531, "global_step": 326320, "epoch": 2696} {"train_loss": -42.281829833984375, "global_step": 326321, "epoch": 2696} {"train_loss": -42.36994552612305, "global_step": 326322, "epoch": 2696} {"train_loss": -43.32093811035156, "global_step": 326323, "epoch": 2696} {"train_loss": -42.86334991455078, "global_step": 326324, "epoch": 2696} {"train_loss": -43.3083381652832, "global_step": 326325, "epoch": 2696} {"train_loss": -42.6722297668457, "global_step": 326326, "epoch": 2696} {"train_loss": -41.87373733520508, "global_step": 326327, "epoch": 2696} {"train_loss": -42.86574172973633, "global_step": 326328, "epoch": 2696} {"train_loss": -43.2959098815918, "global_step": 326329, "epoch": 2696} {"train_loss": -43.07764434814453, "global_step": 326330, "epoch": 2696} {"train_loss": -42.648834228515625, "global_step": 326331, "epoch": 2696} {"train_loss": -42.89352035522461, "global_step": 326332, "epoch": 2696} {"train_loss": -43.04140090942383, "global_step": 326333, "epoch": 2696} {"train_loss": -43.333892822265625, "global_step": 326334, "epoch": 2696} {"train_loss": -42.7443962097168, "global_step": 326335, "epoch": 2696} {"train_loss": -41.41612363452754, "global_step": 326336, "epoch": 2696, "val_loss": 2655249.0} {"train_loss": -42.36936950683594, "global_step": 326337, "epoch": 2697} {"train_loss": -42.887969970703125, "global_step": 326338, "epoch": 2697} {"train_loss": -42.85393142700195, "global_step": 326339, "epoch": 2697} {"train_loss": -43.02016830444336, "global_step": 326340, "epoch": 2697} {"train_loss": -43.44734573364258, "global_step": 326341, "epoch": 2697} {"train_loss": -43.34120559692383, "global_step": 326342, "epoch": 2697} {"train_loss": -42.24403762817383, "global_step": 326343, "epoch": 2697} {"train_loss": -43.25559616088867, "global_step": 326344, "epoch": 2697} {"train_loss": -43.04063034057617, "global_step": 326345, "epoch": 2697} {"train_loss": -43.0886344909668, "global_step": 326346, "epoch": 2697} {"train_loss": -42.85042190551758, "global_step": 326347, "epoch": 2697} {"train_loss": -43.48124694824219, "global_step": 326348, "epoch": 2697} {"train_loss": -43.2026252746582, "global_step": 326349, "epoch": 2697} {"train_loss": -42.87196731567383, "global_step": 326350, "epoch": 2697} {"train_loss": -42.1872673034668, "global_step": 326351, "epoch": 2697} {"train_loss": -42.14155197143555, "global_step": 326352, "epoch": 2697} {"train_loss": -43.33779525756836, "global_step": 326353, "epoch": 2697} {"train_loss": -41.96428680419922, "global_step": 326354, "epoch": 2697} {"train_loss": -43.10689926147461, "global_step": 326355, "epoch": 2697} {"train_loss": -42.159908294677734, "global_step": 326356, "epoch": 2697} {"train_loss": -43.623626708984375, "global_step": 326357, "epoch": 2697} {"train_loss": -42.90166473388672, "global_step": 326358, "epoch": 2697} {"train_loss": -43.01737594604492, "global_step": 326359, "epoch": 2697} {"train_loss": -43.645957946777344, "global_step": 326360, "epoch": 2697} {"train_loss": -43.53464889526367, "global_step": 326361, "epoch": 2697} {"train_loss": -43.2532958984375, "global_step": 326362, "epoch": 2697} {"train_loss": -42.93662643432617, "global_step": 326363, "epoch": 2697} {"train_loss": -41.54448699951172, "global_step": 326364, "epoch": 2697} {"train_loss": -42.26312255859375, "global_step": 326365, "epoch": 2697} {"train_loss": -43.32709884643555, "global_step": 326366, "epoch": 2697} {"train_loss": -41.55904769897461, "global_step": 326367, "epoch": 2697} {"train_loss": -43.466949462890625, "global_step": 326368, "epoch": 2697} {"train_loss": -41.962764739990234, "global_step": 326369, "epoch": 2697} {"train_loss": -42.540283203125, "global_step": 326370, "epoch": 2697} {"train_loss": -42.770992279052734, "global_step": 326371, "epoch": 2697} {"train_loss": -42.70429229736328, "global_step": 326372, "epoch": 2697} {"train_loss": -43.296180725097656, "global_step": 326373, "epoch": 2697} {"train_loss": -41.69744873046875, "global_step": 326374, "epoch": 2697} {"train_loss": -43.115570068359375, "global_step": 326375, "epoch": 2697} {"train_loss": -42.17362976074219, "global_step": 326376, "epoch": 2697} {"train_loss": -42.68201446533203, "global_step": 326377, "epoch": 2697} {"train_loss": -43.67684555053711, "global_step": 326378, "epoch": 2697} {"train_loss": -42.93855667114258, "global_step": 326379, "epoch": 2697} {"train_loss": -43.24525833129883, "global_step": 326380, "epoch": 2697} {"train_loss": -43.85641098022461, "global_step": 326381, "epoch": 2697} {"train_loss": -43.77515411376953, "global_step": 326382, "epoch": 2697} {"train_loss": -43.91476058959961, "global_step": 326383, "epoch": 2697} {"train_loss": -43.63984298706055, "global_step": 326384, "epoch": 2697} {"train_loss": -43.5377082824707, "global_step": 326385, "epoch": 2697} {"train_loss": -43.38521194458008, "global_step": 326386, "epoch": 2697} {"train_loss": -43.35663986206055, "global_step": 326387, "epoch": 2697} {"train_loss": -42.91352462768555, "global_step": 326388, "epoch": 2697} {"train_loss": -43.29286575317383, "global_step": 326389, "epoch": 2697} {"train_loss": -42.05947494506836, "global_step": 326390, "epoch": 2697} {"train_loss": -43.382137298583984, "global_step": 326391, "epoch": 2697} {"train_loss": -39.93569564819336, "global_step": 326392, "epoch": 2697} {"train_loss": -41.04816818237305, "global_step": 326393, "epoch": 2697} {"train_loss": -43.63859558105469, "global_step": 326394, "epoch": 2697} {"train_loss": -41.559749603271484, "global_step": 326395, "epoch": 2697} {"train_loss": -40.674251556396484, "global_step": 326396, "epoch": 2697} {"train_loss": -41.04460525512695, "global_step": 326397, "epoch": 2697} {"train_loss": -43.048187255859375, "global_step": 326398, "epoch": 2697} {"train_loss": -43.25260543823242, "global_step": 326399, "epoch": 2697} {"train_loss": -43.812355041503906, "global_step": 326400, "epoch": 2697} {"train_loss": -43.49350357055664, "global_step": 326401, "epoch": 2697} {"train_loss": -43.687740325927734, "global_step": 326402, "epoch": 2697} {"train_loss": -42.3579216003418, "global_step": 326403, "epoch": 2697} {"train_loss": -43.202205657958984, "global_step": 326404, "epoch": 2697} {"train_loss": -41.482177734375, "global_step": 326405, "epoch": 2697} {"train_loss": -42.71590042114258, "global_step": 326406, "epoch": 2697} {"train_loss": -40.89618682861328, "global_step": 326407, "epoch": 2697} {"train_loss": -43.48936080932617, "global_step": 326408, "epoch": 2697} {"train_loss": -43.04310989379883, "global_step": 326409, "epoch": 2697} {"train_loss": -43.26557540893555, "global_step": 326410, "epoch": 2697} {"train_loss": -42.446861267089844, "global_step": 326411, "epoch": 2697} {"train_loss": -42.23637771606445, "global_step": 326412, "epoch": 2697} {"train_loss": -40.71760177612305, "global_step": 326413, "epoch": 2697} {"train_loss": -41.23615646362305, "global_step": 326414, "epoch": 2697} {"train_loss": -39.53742218017578, "global_step": 326415, "epoch": 2697} {"train_loss": -36.42605209350586, "global_step": 326416, "epoch": 2697} {"train_loss": -40.49260330200195, "global_step": 326417, "epoch": 2697} {"train_loss": -40.55546951293945, "global_step": 326418, "epoch": 2697} {"train_loss": -39.57477951049805, "global_step": 326419, "epoch": 2697} {"train_loss": -38.12051773071289, "global_step": 326420, "epoch": 2697} {"train_loss": -39.30322265625, "global_step": 326421, "epoch": 2697} {"train_loss": -39.557518005371094, "global_step": 326422, "epoch": 2697} {"train_loss": -41.27336120605469, "global_step": 326423, "epoch": 2697} {"train_loss": -40.947723388671875, "global_step": 326424, "epoch": 2697} {"train_loss": -40.330989837646484, "global_step": 326425, "epoch": 2697} {"train_loss": -41.50962448120117, "global_step": 326426, "epoch": 2697} {"train_loss": -42.38331985473633, "global_step": 326427, "epoch": 2697} {"train_loss": -41.41844177246094, "global_step": 326428, "epoch": 2697} {"train_loss": -41.179744720458984, "global_step": 326429, "epoch": 2697} {"train_loss": -40.9461669921875, "global_step": 326430, "epoch": 2697} {"train_loss": -41.42138671875, "global_step": 326431, "epoch": 2697} {"train_loss": -39.664642333984375, "global_step": 326432, "epoch": 2697} {"train_loss": -42.40251159667969, "global_step": 326433, "epoch": 2697} {"train_loss": -41.8251953125, "global_step": 326434, "epoch": 2697} {"train_loss": -41.99821853637695, "global_step": 326435, "epoch": 2697} {"train_loss": -42.509010314941406, "global_step": 326436, "epoch": 2697} {"train_loss": -41.811317443847656, "global_step": 326437, "epoch": 2697} {"train_loss": -42.47568130493164, "global_step": 326438, "epoch": 2697} {"train_loss": -42.723594665527344, "global_step": 326439, "epoch": 2697} {"train_loss": -42.0450325012207, "global_step": 326440, "epoch": 2697} {"train_loss": -42.77117919921875, "global_step": 326441, "epoch": 2697} {"train_loss": -41.680946350097656, "global_step": 326442, "epoch": 2697} {"train_loss": -42.171321868896484, "global_step": 326443, "epoch": 2697} {"train_loss": -40.855628967285156, "global_step": 326444, "epoch": 2697} {"train_loss": -42.66978073120117, "global_step": 326445, "epoch": 2697} {"train_loss": -43.41402053833008, "global_step": 326446, "epoch": 2697} {"train_loss": -41.45082473754883, "global_step": 326447, "epoch": 2697} {"train_loss": -42.89493942260742, "global_step": 326448, "epoch": 2697} {"train_loss": -42.503028869628906, "global_step": 326449, "epoch": 2697} {"train_loss": -42.92346954345703, "global_step": 326450, "epoch": 2697} {"train_loss": -43.08195877075195, "global_step": 326451, "epoch": 2697} {"train_loss": -42.055152893066406, "global_step": 326452, "epoch": 2697} {"train_loss": -42.96387481689453, "global_step": 326453, "epoch": 2697} {"train_loss": -42.98847961425781, "global_step": 326454, "epoch": 2697} {"train_loss": -43.0910530090332, "global_step": 326455, "epoch": 2697} {"train_loss": -43.47792434692383, "global_step": 326456, "epoch": 2697} {"train_loss": -42.31866206019378, "global_step": 326457, "epoch": 2697, "val_loss": 2646693.0} {"train_loss": -42.7348518371582, "global_step": 326458, "epoch": 2698} {"train_loss": -43.23686599731445, "global_step": 326459, "epoch": 2698} {"train_loss": -43.34254837036133, "global_step": 326460, "epoch": 2698} {"train_loss": -43.329139709472656, "global_step": 326461, "epoch": 2698} {"train_loss": -43.13773727416992, "global_step": 326462, "epoch": 2698} {"train_loss": -43.7337760925293, "global_step": 326463, "epoch": 2698} {"train_loss": -42.97977828979492, "global_step": 326464, "epoch": 2698} {"train_loss": -43.08930969238281, "global_step": 326465, "epoch": 2698} {"train_loss": -42.744930267333984, "global_step": 326466, "epoch": 2698} {"train_loss": -43.63640213012695, "global_step": 326467, "epoch": 2698} {"train_loss": -43.48652267456055, "global_step": 326468, "epoch": 2698} {"train_loss": -43.915748596191406, "global_step": 326469, "epoch": 2698} {"train_loss": -43.52836227416992, "global_step": 326470, "epoch": 2698} {"train_loss": -43.28059005737305, "global_step": 326471, "epoch": 2698} {"train_loss": -43.03480911254883, "global_step": 326472, "epoch": 2698} {"train_loss": -43.8736686706543, "global_step": 326473, "epoch": 2698} {"train_loss": -42.762081146240234, "global_step": 326474, "epoch": 2698} {"train_loss": -43.49369430541992, "global_step": 326475, "epoch": 2698} {"train_loss": -44.094268798828125, "global_step": 326476, "epoch": 2698} {"train_loss": -43.59021759033203, "global_step": 326477, "epoch": 2698} {"train_loss": -43.673973083496094, "global_step": 326478, "epoch": 2698} {"train_loss": -43.257442474365234, "global_step": 326479, "epoch": 2698} {"train_loss": -43.07022476196289, "global_step": 326480, "epoch": 2698} {"train_loss": -43.30225372314453, "global_step": 326481, "epoch": 2698} {"train_loss": -43.78474044799805, "global_step": 326482, "epoch": 2698} {"train_loss": -43.421443939208984, "global_step": 326483, "epoch": 2698} {"train_loss": -44.1091423034668, "global_step": 326484, "epoch": 2698} {"train_loss": -43.06156539916992, "global_step": 326485, "epoch": 2698} {"train_loss": -42.29507064819336, "global_step": 326486, "epoch": 2698} {"train_loss": -43.52462387084961, "global_step": 326487, "epoch": 2698} {"train_loss": -43.52851104736328, "global_step": 326488, "epoch": 2698} {"train_loss": -41.96238327026367, "global_step": 326489, "epoch": 2698} {"train_loss": -43.31917190551758, "global_step": 326490, "epoch": 2698} {"train_loss": -43.700828552246094, "global_step": 326491, "epoch": 2698} {"train_loss": -41.77960205078125, "global_step": 326492, "epoch": 2698} {"train_loss": -44.20250701904297, "global_step": 326493, "epoch": 2698} {"train_loss": -43.56959915161133, "global_step": 326494, "epoch": 2698} {"train_loss": -42.274749755859375, "global_step": 326495, "epoch": 2698} {"train_loss": -42.17977523803711, "global_step": 326496, "epoch": 2698} {"train_loss": -42.32324981689453, "global_step": 326497, "epoch": 2698} {"train_loss": -42.95161056518555, "global_step": 326498, "epoch": 2698} {"train_loss": -43.501922607421875, "global_step": 326499, "epoch": 2698} {"train_loss": -43.359493255615234, "global_step": 326500, "epoch": 2698} {"train_loss": -43.08198165893555, "global_step": 326501, "epoch": 2698} {"train_loss": -43.03693389892578, "global_step": 326502, "epoch": 2698} {"train_loss": -43.3832893371582, "global_step": 326503, "epoch": 2698} {"train_loss": -43.58390426635742, "global_step": 326504, "epoch": 2698} {"train_loss": -43.46055603027344, "global_step": 326505, "epoch": 2698} {"train_loss": -43.18831253051758, "global_step": 326506, "epoch": 2698} {"train_loss": -43.68253707885742, "global_step": 326507, "epoch": 2698} {"train_loss": -43.32586669921875, "global_step": 326508, "epoch": 2698} {"train_loss": -43.13458251953125, "global_step": 326509, "epoch": 2698} {"train_loss": -42.58448028564453, "global_step": 326510, "epoch": 2698} {"train_loss": -40.49910354614258, "global_step": 326511, "epoch": 2698} {"train_loss": -42.557411193847656, "global_step": 326512, "epoch": 2698} {"train_loss": -42.50300598144531, "global_step": 326513, "epoch": 2698} {"train_loss": -43.682281494140625, "global_step": 326514, "epoch": 2698} {"train_loss": -42.26973342895508, "global_step": 326515, "epoch": 2698} {"train_loss": -42.26600646972656, "global_step": 326516, "epoch": 2698} {"train_loss": -41.546104431152344, "global_step": 326517, "epoch": 2698} {"train_loss": -43.112300872802734, "global_step": 326518, "epoch": 2698} {"train_loss": -42.171077728271484, "global_step": 326519, "epoch": 2698} {"train_loss": -41.99384689331055, "global_step": 326520, "epoch": 2698} {"train_loss": -41.63291549682617, "global_step": 326521, "epoch": 2698} {"train_loss": -43.5057487487793, "global_step": 326522, "epoch": 2698} {"train_loss": -41.390811920166016, "global_step": 326523, "epoch": 2698} {"train_loss": -39.13025665283203, "global_step": 326524, "epoch": 2698} {"train_loss": -41.66207504272461, "global_step": 326525, "epoch": 2698} {"train_loss": -39.60832595825195, "global_step": 326526, "epoch": 2698} {"train_loss": -39.26415252685547, "global_step": 326527, "epoch": 2698} {"train_loss": -40.62498092651367, "global_step": 326528, "epoch": 2698} {"train_loss": -40.282875061035156, "global_step": 326529, "epoch": 2698} {"train_loss": -41.33936309814453, "global_step": 326530, "epoch": 2698} {"train_loss": -41.05459213256836, "global_step": 326531, "epoch": 2698} {"train_loss": -41.562355041503906, "global_step": 326532, "epoch": 2698} {"train_loss": -41.72098922729492, "global_step": 326533, "epoch": 2698} {"train_loss": -41.44623947143555, "global_step": 326534, "epoch": 2698} {"train_loss": -41.11970901489258, "global_step": 326535, "epoch": 2698} {"train_loss": -42.87211608886719, "global_step": 326536, "epoch": 2698} {"train_loss": -42.437068939208984, "global_step": 326537, "epoch": 2698} {"train_loss": -42.43929672241211, "global_step": 326538, "epoch": 2698} {"train_loss": -42.129180908203125, "global_step": 326539, "epoch": 2698} {"train_loss": -42.89774703979492, "global_step": 326540, "epoch": 2698} {"train_loss": -43.0506706237793, "global_step": 326541, "epoch": 2698} {"train_loss": -42.93638610839844, "global_step": 326542, "epoch": 2698} {"train_loss": -43.56168746948242, "global_step": 326543, "epoch": 2698} {"train_loss": -43.075565338134766, "global_step": 326544, "epoch": 2698} {"train_loss": -43.5905876159668, "global_step": 326545, "epoch": 2698} {"train_loss": -43.0465202331543, "global_step": 326546, "epoch": 2698} {"train_loss": -43.10390853881836, "global_step": 326547, "epoch": 2698} {"train_loss": -43.82110595703125, "global_step": 326548, "epoch": 2698} {"train_loss": -43.21753692626953, "global_step": 326549, "epoch": 2698} {"train_loss": -43.451385498046875, "global_step": 326550, "epoch": 2698} {"train_loss": -43.05353927612305, "global_step": 326551, "epoch": 2698} {"train_loss": -43.26272201538086, "global_step": 326552, "epoch": 2698} {"train_loss": -43.3275032043457, "global_step": 326553, "epoch": 2698} {"train_loss": -43.02821731567383, "global_step": 326554, "epoch": 2698} {"train_loss": -43.21309280395508, "global_step": 326555, "epoch": 2698} {"train_loss": -43.832698822021484, "global_step": 326556, "epoch": 2698} {"train_loss": -43.183319091796875, "global_step": 326557, "epoch": 2698} {"train_loss": -44.152828216552734, "global_step": 326558, "epoch": 2698} {"train_loss": -43.60810470581055, "global_step": 326559, "epoch": 2698} {"train_loss": -42.8046760559082, "global_step": 326560, "epoch": 2698} {"train_loss": -43.81278610229492, "global_step": 326561, "epoch": 2698} {"train_loss": -43.24666213989258, "global_step": 326562, "epoch": 2698} {"train_loss": -42.99677276611328, "global_step": 326563, "epoch": 2698} {"train_loss": -42.76925277709961, "global_step": 326564, "epoch": 2698} {"train_loss": -42.78575134277344, "global_step": 326565, "epoch": 2698} {"train_loss": -43.05012130737305, "global_step": 326566, "epoch": 2698} {"train_loss": -43.9303092956543, "global_step": 326567, "epoch": 2698} {"train_loss": -43.6599235534668, "global_step": 326568, "epoch": 2698} {"train_loss": -43.67832565307617, "global_step": 326569, "epoch": 2698} {"train_loss": -43.29305648803711, "global_step": 326570, "epoch": 2698} {"train_loss": -42.578033447265625, "global_step": 326571, "epoch": 2698} {"train_loss": -44.08171463012695, "global_step": 326572, "epoch": 2698} {"train_loss": -43.32167434692383, "global_step": 326573, "epoch": 2698} {"train_loss": -42.35687255859375, "global_step": 326574, "epoch": 2698} {"train_loss": -43.71808624267578, "global_step": 326575, "epoch": 2698} {"train_loss": -43.246337890625, "global_step": 326576, "epoch": 2698} {"train_loss": -43.6591682434082, "global_step": 326577, "epoch": 2698} {"train_loss": -42.87665608303606, "global_step": 326578, "epoch": 2698, "val_loss": 2708171.25} {"train_loss": -43.02060317993164, "global_step": 326579, "epoch": 2699} {"train_loss": -43.145790100097656, "global_step": 326580, "epoch": 2699} {"train_loss": -43.750946044921875, "global_step": 326581, "epoch": 2699} {"train_loss": -40.31608200073242, "global_step": 326582, "epoch": 2699} {"train_loss": -44.067115783691406, "global_step": 326583, "epoch": 2699} {"train_loss": -43.32294464111328, "global_step": 326584, "epoch": 2699} {"train_loss": -42.62409591674805, "global_step": 326585, "epoch": 2699} {"train_loss": -41.703792572021484, "global_step": 326586, "epoch": 2699} {"train_loss": -43.65202713012695, "global_step": 326587, "epoch": 2699} {"train_loss": -43.400856018066406, "global_step": 326588, "epoch": 2699} {"train_loss": -43.803428649902344, "global_step": 326589, "epoch": 2699} {"train_loss": -43.63363265991211, "global_step": 326590, "epoch": 2699} {"train_loss": -43.61189651489258, "global_step": 326591, "epoch": 2699} {"train_loss": -42.184810638427734, "global_step": 326592, "epoch": 2699} {"train_loss": -42.68135452270508, "global_step": 326593, "epoch": 2699} {"train_loss": -42.904232025146484, "global_step": 326594, "epoch": 2699} {"train_loss": -43.92739486694336, "global_step": 326595, "epoch": 2699} {"train_loss": -42.83358383178711, "global_step": 326596, "epoch": 2699} {"train_loss": -42.704708099365234, "global_step": 326597, "epoch": 2699} {"train_loss": -43.52589797973633, "global_step": 326598, "epoch": 2699} {"train_loss": -43.4879264831543, "global_step": 326599, "epoch": 2699} {"train_loss": -43.22771453857422, "global_step": 326600, "epoch": 2699} {"train_loss": -43.55231857299805, "global_step": 326601, "epoch": 2699} {"train_loss": -43.38844680786133, "global_step": 326602, "epoch": 2699} {"train_loss": -43.830604553222656, "global_step": 326603, "epoch": 2699} {"train_loss": -44.278907775878906, "global_step": 326604, "epoch": 2699} {"train_loss": -43.125667572021484, "global_step": 326605, "epoch": 2699} {"train_loss": -43.75217819213867, "global_step": 326606, "epoch": 2699} {"train_loss": -43.91177749633789, "global_step": 326607, "epoch": 2699} {"train_loss": -43.20755386352539, "global_step": 326608, "epoch": 2699} {"train_loss": -43.63344192504883, "global_step": 326609, "epoch": 2699} {"train_loss": -43.778076171875, "global_step": 326610, "epoch": 2699} {"train_loss": -43.73209762573242, "global_step": 326611, "epoch": 2699} {"train_loss": -44.11482620239258, "global_step": 326612, "epoch": 2699} {"train_loss": -44.23904800415039, "global_step": 326613, "epoch": 2699} {"train_loss": -44.46156311035156, "global_step": 326614, "epoch": 2699} {"train_loss": -44.31100082397461, "global_step": 326615, "epoch": 2699} {"train_loss": -44.4649543762207, "global_step": 326616, "epoch": 2699} {"train_loss": -43.152706146240234, "global_step": 326617, "epoch": 2699} {"train_loss": -43.83425521850586, "global_step": 326618, "epoch": 2699} {"train_loss": -43.80588150024414, "global_step": 326619, "epoch": 2699} {"train_loss": -44.273193359375, "global_step": 326620, "epoch": 2699} {"train_loss": -43.77338790893555, "global_step": 326621, "epoch": 2699} {"train_loss": -43.955352783203125, "global_step": 326622, "epoch": 2699} {"train_loss": -43.334835052490234, "global_step": 326623, "epoch": 2699} {"train_loss": -43.18455505371094, "global_step": 326624, "epoch": 2699} {"train_loss": -43.7210807800293, "global_step": 326625, "epoch": 2699} {"train_loss": -43.30411911010742, "global_step": 326626, "epoch": 2699} {"train_loss": -43.37651062011719, "global_step": 326627, "epoch": 2699} {"train_loss": -43.396820068359375, "global_step": 326628, "epoch": 2699} {"train_loss": -42.97178268432617, "global_step": 326629, "epoch": 2699} {"train_loss": -42.787227630615234, "global_step": 326630, "epoch": 2699} {"train_loss": -43.25202560424805, "global_step": 326631, "epoch": 2699} {"train_loss": -42.306636810302734, "global_step": 326632, "epoch": 2699} {"train_loss": -42.73435974121094, "global_step": 326633, "epoch": 2699} {"train_loss": -42.66965866088867, "global_step": 326634, "epoch": 2699} {"train_loss": -42.609737396240234, "global_step": 326635, "epoch": 2699} {"train_loss": -42.90883255004883, "global_step": 326636, "epoch": 2699} {"train_loss": -43.0191650390625, "global_step": 326637, "epoch": 2699} {"train_loss": -40.50199508666992, "global_step": 326638, "epoch": 2699} {"train_loss": -43.321380615234375, "global_step": 326639, "epoch": 2699} {"train_loss": -40.49240493774414, "global_step": 326640, "epoch": 2699} {"train_loss": -40.34767150878906, "global_step": 326641, "epoch": 2699} {"train_loss": -42.3979606628418, "global_step": 326642, "epoch": 2699} {"train_loss": -42.21732711791992, "global_step": 326643, "epoch": 2699} {"train_loss": -40.851661682128906, "global_step": 326644, "epoch": 2699} {"train_loss": -41.25211715698242, "global_step": 326645, "epoch": 2699} {"train_loss": -41.86539840698242, "global_step": 326646, "epoch": 2699} {"train_loss": -42.79066467285156, "global_step": 326647, "epoch": 2699} {"train_loss": -41.575897216796875, "global_step": 326648, "epoch": 2699} {"train_loss": -42.915645599365234, "global_step": 326649, "epoch": 2699} {"train_loss": -42.42226028442383, "global_step": 326650, "epoch": 2699} {"train_loss": -42.653682708740234, "global_step": 326651, "epoch": 2699} {"train_loss": -37.583621978759766, "global_step": 326652, "epoch": 2699} {"train_loss": -41.62554931640625, "global_step": 326653, "epoch": 2699} {"train_loss": -35.9614372253418, "global_step": 326654, "epoch": 2699} {"train_loss": -41.80915832519531, "global_step": 326655, "epoch": 2699} {"train_loss": -41.6174430847168, "global_step": 326656, "epoch": 2699} {"train_loss": -42.70832443237305, "global_step": 326657, "epoch": 2699} {"train_loss": -41.762359619140625, "global_step": 326658, "epoch": 2699} {"train_loss": -41.965431213378906, "global_step": 326659, "epoch": 2699} {"train_loss": -42.24882125854492, "global_step": 326660, "epoch": 2699} {"train_loss": -37.212432861328125, "global_step": 326661, "epoch": 2699} {"train_loss": -34.33015823364258, "global_step": 326662, "epoch": 2699} {"train_loss": -41.58824157714844, "global_step": 326663, "epoch": 2699} {"train_loss": -41.398372650146484, "global_step": 326664, "epoch": 2699} {"train_loss": -42.023719787597656, "global_step": 326665, "epoch": 2699} {"train_loss": -40.06875228881836, "global_step": 326666, "epoch": 2699} {"train_loss": -40.350128173828125, "global_step": 326667, "epoch": 2699} {"train_loss": -42.18915557861328, "global_step": 326668, "epoch": 2699} {"train_loss": -40.51906204223633, "global_step": 326669, "epoch": 2699} {"train_loss": -40.7890625, "global_step": 326670, "epoch": 2699} {"train_loss": -37.4931755065918, "global_step": 326671, "epoch": 2699} {"train_loss": -39.387752532958984, "global_step": 326672, "epoch": 2699} {"train_loss": -41.153446197509766, "global_step": 326673, "epoch": 2699} {"train_loss": -38.82276916503906, "global_step": 326674, "epoch": 2699} {"train_loss": -39.48377227783203, "global_step": 326675, "epoch": 2699} {"train_loss": -40.778560638427734, "global_step": 326676, "epoch": 2699} {"train_loss": -40.60614013671875, "global_step": 326677, "epoch": 2699} {"train_loss": -42.66731643676758, "global_step": 326678, "epoch": 2699} {"train_loss": -42.3778076171875, "global_step": 326679, "epoch": 2699} {"train_loss": -41.270320892333984, "global_step": 326680, "epoch": 2699} {"train_loss": -42.54248046875, "global_step": 326681, "epoch": 2699} {"train_loss": -40.040306091308594, "global_step": 326682, "epoch": 2699} {"train_loss": -41.846065521240234, "global_step": 326683, "epoch": 2699} {"train_loss": -41.11981964111328, "global_step": 326684, "epoch": 2699} {"train_loss": -42.0212287902832, "global_step": 326685, "epoch": 2699} {"train_loss": -41.472999572753906, "global_step": 326686, "epoch": 2699} {"train_loss": -43.22502517700195, "global_step": 326687, "epoch": 2699} {"train_loss": -40.666378021240234, "global_step": 326688, "epoch": 2699} {"train_loss": -40.60957717895508, "global_step": 326689, "epoch": 2699} {"train_loss": -41.36619186401367, "global_step": 326690, "epoch": 2699} {"train_loss": -42.26754379272461, "global_step": 326691, "epoch": 2699} {"train_loss": -41.8642463684082, "global_step": 326692, "epoch": 2699} {"train_loss": -43.087623596191406, "global_step": 326693, "epoch": 2699} {"train_loss": -42.97025680541992, "global_step": 326694, "epoch": 2699} {"train_loss": -42.92823028564453, "global_step": 326695, "epoch": 2699} {"train_loss": -41.309139251708984, "global_step": 326696, "epoch": 2699} {"train_loss": -42.601497650146484, "global_step": 326697, "epoch": 2699} {"train_loss": -42.965187072753906, "global_step": 326698, "epoch": 2699} {"train_loss": -42.25697014548562, "global_step": 326699, "epoch": 2699, "val_loss": 2568233.75} {"train_loss": -42.851924896240234, "global_step": 326700, "epoch": 2700} {"train_loss": -43.176170349121094, "global_step": 326701, "epoch": 2700} {"train_loss": -43.34194564819336, "global_step": 326702, "epoch": 2700} {"train_loss": -43.387672424316406, "global_step": 326703, "epoch": 2700} {"train_loss": -43.02690505981445, "global_step": 326704, "epoch": 2700} {"train_loss": -43.29035568237305, "global_step": 326705, "epoch": 2700} {"train_loss": -42.76058578491211, "global_step": 326706, "epoch": 2700} {"train_loss": -43.09566879272461, "global_step": 326707, "epoch": 2700} {"train_loss": -43.22163772583008, "global_step": 326708, "epoch": 2700} {"train_loss": -43.05181884765625, "global_step": 326709, "epoch": 2700} {"train_loss": -43.06008529663086, "global_step": 326710, "epoch": 2700} {"train_loss": -40.649227142333984, "global_step": 326711, "epoch": 2700} {"train_loss": -34.17295455932617, "global_step": 326712, "epoch": 2700} {"train_loss": -42.86464309692383, "global_step": 326713, "epoch": 2700} {"train_loss": -41.03662109375, "global_step": 326714, "epoch": 2700} {"train_loss": -41.97562789916992, "global_step": 326715, "epoch": 2700} {"train_loss": -40.18191146850586, "global_step": 326716, "epoch": 2700} {"train_loss": -42.34116744995117, "global_step": 326717, "epoch": 2700} {"train_loss": -43.37654113769531, "global_step": 326718, "epoch": 2700} {"train_loss": -43.01906967163086, "global_step": 326719, "epoch": 2700} {"train_loss": -41.81826400756836, "global_step": 326720, "epoch": 2700} {"train_loss": -42.9824333190918, "global_step": 326721, "epoch": 2700} {"train_loss": -42.76252365112305, "global_step": 326722, "epoch": 2700} {"train_loss": -42.74947738647461, "global_step": 326723, "epoch": 2700} {"train_loss": -41.79560089111328, "global_step": 326724, "epoch": 2700} {"train_loss": -42.59995651245117, "global_step": 326725, "epoch": 2700} {"train_loss": -43.59522247314453, "global_step": 326726, "epoch": 2700} {"train_loss": -42.55706787109375, "global_step": 326727, "epoch": 2700} {"train_loss": -43.5781135559082, "global_step": 326728, "epoch": 2700} {"train_loss": -41.226287841796875, "global_step": 326729, "epoch": 2700} {"train_loss": -43.58015823364258, "global_step": 326730, "epoch": 2700} {"train_loss": -43.44684982299805, "global_step": 326731, "epoch": 2700} {"train_loss": -43.43050765991211, "global_step": 326732, "epoch": 2700} {"train_loss": -41.862483978271484, "global_step": 326733, "epoch": 2700} {"train_loss": -43.13146209716797, "global_step": 326734, "epoch": 2700} {"train_loss": -42.681983947753906, "global_step": 326735, "epoch": 2700} {"train_loss": -41.51018142700195, "global_step": 326736, "epoch": 2700} {"train_loss": -42.006954193115234, "global_step": 326737, "epoch": 2700} {"train_loss": -43.298072814941406, "global_step": 326738, "epoch": 2700} {"train_loss": -43.7716064453125, "global_step": 326739, "epoch": 2700} {"train_loss": -41.21848678588867, "global_step": 326740, "epoch": 2700} {"train_loss": -43.78515625, "global_step": 326741, "epoch": 2700} {"train_loss": -42.45835494995117, "global_step": 326742, "epoch": 2700} {"train_loss": -43.06761169433594, "global_step": 326743, "epoch": 2700} {"train_loss": -42.579010009765625, "global_step": 326744, "epoch": 2700} {"train_loss": -43.02323532104492, "global_step": 326745, "epoch": 2700} {"train_loss": -43.61881637573242, "global_step": 326746, "epoch": 2700} {"train_loss": -42.58701705932617, "global_step": 326747, "epoch": 2700} {"train_loss": -42.673973083496094, "global_step": 326748, "epoch": 2700} {"train_loss": -43.329837799072266, "global_step": 326749, "epoch": 2700} {"train_loss": -42.55424118041992, "global_step": 326750, "epoch": 2700} {"train_loss": -42.57041549682617, "global_step": 326751, "epoch": 2700} {"train_loss": -43.07573318481445, "global_step": 326752, "epoch": 2700} {"train_loss": -43.494564056396484, "global_step": 326753, "epoch": 2700} {"train_loss": -42.332664489746094, "global_step": 326754, "epoch": 2700} {"train_loss": -43.80183029174805, "global_step": 326755, "epoch": 2700} {"train_loss": -42.78599166870117, "global_step": 326756, "epoch": 2700} {"train_loss": -41.79917526245117, "global_step": 326757, "epoch": 2700} {"train_loss": -42.483760833740234, "global_step": 326758, "epoch": 2700} {"train_loss": -41.933780670166016, "global_step": 326759, "epoch": 2700} {"train_loss": -43.20855712890625, "global_step": 326760, "epoch": 2700} {"train_loss": -38.965126037597656, "global_step": 326761, "epoch": 2700} {"train_loss": -43.11391830444336, "global_step": 326762, "epoch": 2700} {"train_loss": -43.861202239990234, "global_step": 326763, "epoch": 2700} {"train_loss": -41.317623138427734, "global_step": 326764, "epoch": 2700} {"train_loss": -42.516963958740234, "global_step": 326765, "epoch": 2700} {"train_loss": -42.515350341796875, "global_step": 326766, "epoch": 2700} {"train_loss": -42.701080322265625, "global_step": 326767, "epoch": 2700} {"train_loss": -40.81851577758789, "global_step": 326768, "epoch": 2700} {"train_loss": -42.839168548583984, "global_step": 326769, "epoch": 2700} {"train_loss": -42.93528747558594, "global_step": 326770, "epoch": 2700} {"train_loss": -43.2026252746582, "global_step": 326771, "epoch": 2700} {"train_loss": -42.701446533203125, "global_step": 326772, "epoch": 2700} {"train_loss": -43.517738342285156, "global_step": 326773, "epoch": 2700} {"train_loss": -43.34108352661133, "global_step": 326774, "epoch": 2700} {"train_loss": -43.081748962402344, "global_step": 326775, "epoch": 2700} {"train_loss": -41.76613998413086, "global_step": 326776, "epoch": 2700} {"train_loss": -42.626399993896484, "global_step": 326777, "epoch": 2700} {"train_loss": -42.357749938964844, "global_step": 326778, "epoch": 2700} {"train_loss": -43.0185432434082, "global_step": 326779, "epoch": 2700} {"train_loss": -42.47907638549805, "global_step": 326780, "epoch": 2700} {"train_loss": -43.41504669189453, "global_step": 326781, "epoch": 2700} {"train_loss": -42.28866195678711, "global_step": 326782, "epoch": 2700} {"train_loss": -42.56940841674805, "global_step": 326783, "epoch": 2700} {"train_loss": -43.50651168823242, "global_step": 326784, "epoch": 2700} {"train_loss": -43.215057373046875, "global_step": 326785, "epoch": 2700} {"train_loss": -42.55828857421875, "global_step": 326786, "epoch": 2700} {"train_loss": -44.14736557006836, "global_step": 326787, "epoch": 2700} {"train_loss": -38.62122344970703, "global_step": 326788, "epoch": 2700} {"train_loss": -39.48474884033203, "global_step": 326789, "epoch": 2700} {"train_loss": -39.19770812988281, "global_step": 326790, "epoch": 2700} {"train_loss": -42.33393859863281, "global_step": 326791, "epoch": 2700} {"train_loss": -41.94783401489258, "global_step": 326792, "epoch": 2700} {"train_loss": -43.172542572021484, "global_step": 326793, "epoch": 2700} {"train_loss": -41.71088409423828, "global_step": 326794, "epoch": 2700} {"train_loss": -42.44913864135742, "global_step": 326795, "epoch": 2700} {"train_loss": -42.88439178466797, "global_step": 326796, "epoch": 2700} {"train_loss": -43.10517120361328, "global_step": 326797, "epoch": 2700} {"train_loss": -43.10331726074219, "global_step": 326798, "epoch": 2700} {"train_loss": -42.68417739868164, "global_step": 326799, "epoch": 2700} {"train_loss": -43.79548263549805, "global_step": 326800, "epoch": 2700} {"train_loss": -41.59166717529297, "global_step": 326801, "epoch": 2700} {"train_loss": -40.96194076538086, "global_step": 326802, "epoch": 2700} {"train_loss": -42.744667053222656, "global_step": 326803, "epoch": 2700} {"train_loss": -42.844661712646484, "global_step": 326804, "epoch": 2700} {"train_loss": -42.95886993408203, "global_step": 326805, "epoch": 2700} {"train_loss": -43.22605895996094, "global_step": 326806, "epoch": 2700} {"train_loss": -41.95272445678711, "global_step": 326807, "epoch": 2700} {"train_loss": -41.25031280517578, "global_step": 326808, "epoch": 2700} {"train_loss": -41.1068229675293, "global_step": 326809, "epoch": 2700} {"train_loss": -43.17145919799805, "global_step": 326810, "epoch": 2700} {"train_loss": -42.3241081237793, "global_step": 326811, "epoch": 2700} {"train_loss": -41.90485382080078, "global_step": 326812, "epoch": 2700} {"train_loss": -41.209083557128906, "global_step": 326813, "epoch": 2700} {"train_loss": -42.410858154296875, "global_step": 326814, "epoch": 2700} {"train_loss": -41.78770065307617, "global_step": 326815, "epoch": 2700} {"train_loss": -38.39221954345703, "global_step": 326816, "epoch": 2700} {"train_loss": -42.18939208984375, "global_step": 326817, "epoch": 2700} {"train_loss": -42.95370101928711, "global_step": 326818, "epoch": 2700} {"train_loss": -42.123023986816406, "global_step": 326819, "epoch": 2700} {"train_loss": -42.41488363723124, "global_step": 326820, "epoch": 2700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2539716.75} {"train_loss": -43.10072326660156, "global_step": 326821, "epoch": 2701} {"train_loss": -42.07423782348633, "global_step": 326822, "epoch": 2701} {"train_loss": -42.73419189453125, "global_step": 326823, "epoch": 2701} {"train_loss": -43.35848617553711, "global_step": 326824, "epoch": 2701} {"train_loss": -42.789669036865234, "global_step": 326825, "epoch": 2701} {"train_loss": -42.37668991088867, "global_step": 326826, "epoch": 2701} {"train_loss": -43.38326644897461, "global_step": 326827, "epoch": 2701} {"train_loss": -42.8583869934082, "global_step": 326828, "epoch": 2701} {"train_loss": -42.16329574584961, "global_step": 326829, "epoch": 2701} {"train_loss": -42.55221176147461, "global_step": 326830, "epoch": 2701} {"train_loss": -42.93364334106445, "global_step": 326831, "epoch": 2701} {"train_loss": -42.60563278198242, "global_step": 326832, "epoch": 2701} {"train_loss": -42.652488708496094, "global_step": 326833, "epoch": 2701} {"train_loss": -42.542362213134766, "global_step": 326834, "epoch": 2701} {"train_loss": -40.50281524658203, "global_step": 326835, "epoch": 2701} {"train_loss": -42.14290237426758, "global_step": 326836, "epoch": 2701} {"train_loss": -42.45708084106445, "global_step": 326837, "epoch": 2701} {"train_loss": -43.46989440917969, "global_step": 326838, "epoch": 2701} {"train_loss": -43.39120101928711, "global_step": 326839, "epoch": 2701} {"train_loss": -42.12279510498047, "global_step": 326840, "epoch": 2701} {"train_loss": -42.909271240234375, "global_step": 326841, "epoch": 2701} {"train_loss": -43.2073860168457, "global_step": 326842, "epoch": 2701} {"train_loss": -43.9970588684082, "global_step": 326843, "epoch": 2701} {"train_loss": -43.275794982910156, "global_step": 326844, "epoch": 2701} {"train_loss": -42.52958297729492, "global_step": 326845, "epoch": 2701} {"train_loss": -43.2880859375, "global_step": 326846, "epoch": 2701} {"train_loss": -43.18875503540039, "global_step": 326847, "epoch": 2701} {"train_loss": -42.74238204956055, "global_step": 326848, "epoch": 2701} {"train_loss": -43.47311019897461, "global_step": 326849, "epoch": 2701} {"train_loss": -42.63978958129883, "global_step": 326850, "epoch": 2701} {"train_loss": -41.75754165649414, "global_step": 326851, "epoch": 2701} {"train_loss": -43.4342155456543, "global_step": 326852, "epoch": 2701} {"train_loss": -42.962623596191406, "global_step": 326853, "epoch": 2701} {"train_loss": -41.78207015991211, "global_step": 326854, "epoch": 2701} {"train_loss": -41.730857849121094, "global_step": 326855, "epoch": 2701} {"train_loss": -42.2905158996582, "global_step": 326856, "epoch": 2701} {"train_loss": -42.376686096191406, "global_step": 326857, "epoch": 2701} {"train_loss": -41.80055236816406, "global_step": 326858, "epoch": 2701} {"train_loss": -42.994197845458984, "global_step": 326859, "epoch": 2701} {"train_loss": -43.63462829589844, "global_step": 326860, "epoch": 2701} {"train_loss": -43.32435989379883, "global_step": 326861, "epoch": 2701} {"train_loss": -43.145992279052734, "global_step": 326862, "epoch": 2701} {"train_loss": -41.92261505126953, "global_step": 326863, "epoch": 2701} {"train_loss": -43.3072509765625, "global_step": 326864, "epoch": 2701} {"train_loss": -42.55066680908203, "global_step": 326865, "epoch": 2701} {"train_loss": -43.975887298583984, "global_step": 326866, "epoch": 2701} {"train_loss": -43.11323547363281, "global_step": 326867, "epoch": 2701} {"train_loss": -41.9771842956543, "global_step": 326868, "epoch": 2701} {"train_loss": -43.12398910522461, "global_step": 326869, "epoch": 2701} {"train_loss": -43.31032943725586, "global_step": 326870, "epoch": 2701} {"train_loss": -42.875091552734375, "global_step": 326871, "epoch": 2701} {"train_loss": -43.86971664428711, "global_step": 326872, "epoch": 2701} {"train_loss": -42.35111618041992, "global_step": 326873, "epoch": 2701} {"train_loss": -43.42566680908203, "global_step": 326874, "epoch": 2701} {"train_loss": -43.0760612487793, "global_step": 326875, "epoch": 2701} {"train_loss": -43.414794921875, "global_step": 326876, "epoch": 2701} {"train_loss": -43.20321273803711, "global_step": 326877, "epoch": 2701} {"train_loss": -41.49892044067383, "global_step": 326878, "epoch": 2701} {"train_loss": -42.4432487487793, "global_step": 326879, "epoch": 2701} {"train_loss": -43.363800048828125, "global_step": 326880, "epoch": 2701} {"train_loss": -43.68378829956055, "global_step": 326881, "epoch": 2701} {"train_loss": -43.22442626953125, "global_step": 326882, "epoch": 2701} {"train_loss": -43.45132064819336, "global_step": 326883, "epoch": 2701} {"train_loss": -43.2633171081543, "global_step": 326884, "epoch": 2701} {"train_loss": -43.4423713684082, "global_step": 326885, "epoch": 2701} {"train_loss": -43.29798126220703, "global_step": 326886, "epoch": 2701} {"train_loss": -42.916656494140625, "global_step": 326887, "epoch": 2701} {"train_loss": -42.78951644897461, "global_step": 326888, "epoch": 2701} {"train_loss": -42.93947982788086, "global_step": 326889, "epoch": 2701} {"train_loss": -41.97396469116211, "global_step": 326890, "epoch": 2701} {"train_loss": -42.8537483215332, "global_step": 326891, "epoch": 2701} {"train_loss": -42.660369873046875, "global_step": 326892, "epoch": 2701} {"train_loss": -43.19321823120117, "global_step": 326893, "epoch": 2701} {"train_loss": -42.95846176147461, "global_step": 326894, "epoch": 2701} {"train_loss": -42.732452392578125, "global_step": 326895, "epoch": 2701} {"train_loss": -41.7777099609375, "global_step": 326896, "epoch": 2701} {"train_loss": -42.34865188598633, "global_step": 326897, "epoch": 2701} {"train_loss": -41.10300827026367, "global_step": 326898, "epoch": 2701} {"train_loss": -42.422359466552734, "global_step": 326899, "epoch": 2701} {"train_loss": -40.748565673828125, "global_step": 326900, "epoch": 2701} {"train_loss": -41.06324005126953, "global_step": 326901, "epoch": 2701} {"train_loss": -41.06959915161133, "global_step": 326902, "epoch": 2701} {"train_loss": -42.01344680786133, "global_step": 326903, "epoch": 2701} {"train_loss": -41.4289436340332, "global_step": 326904, "epoch": 2701} {"train_loss": -42.15754318237305, "global_step": 326905, "epoch": 2701} {"train_loss": -42.02753448486328, "global_step": 326906, "epoch": 2701} {"train_loss": -41.516357421875, "global_step": 326907, "epoch": 2701} {"train_loss": -41.88300704956055, "global_step": 326908, "epoch": 2701} {"train_loss": -40.69537353515625, "global_step": 326909, "epoch": 2701} {"train_loss": -39.33330154418945, "global_step": 326910, "epoch": 2701} {"train_loss": -42.76544952392578, "global_step": 326911, "epoch": 2701} {"train_loss": -41.189754486083984, "global_step": 326912, "epoch": 2701} {"train_loss": -41.15605163574219, "global_step": 326913, "epoch": 2701} {"train_loss": -42.337947845458984, "global_step": 326914, "epoch": 2701} {"train_loss": -40.42075729370117, "global_step": 326915, "epoch": 2701} {"train_loss": -41.006683349609375, "global_step": 326916, "epoch": 2701} {"train_loss": -41.101844787597656, "global_step": 326917, "epoch": 2701} {"train_loss": -39.72218704223633, "global_step": 326918, "epoch": 2701} {"train_loss": -39.13173294067383, "global_step": 326919, "epoch": 2701} {"train_loss": -40.76668167114258, "global_step": 326920, "epoch": 2701} {"train_loss": -41.48177719116211, "global_step": 326921, "epoch": 2701} {"train_loss": -39.57625198364258, "global_step": 326922, "epoch": 2701} {"train_loss": -42.389095306396484, "global_step": 326923, "epoch": 2701} {"train_loss": -39.46882247924805, "global_step": 326924, "epoch": 2701} {"train_loss": -39.34467697143555, "global_step": 326925, "epoch": 2701} {"train_loss": -41.16160583496094, "global_step": 326926, "epoch": 2701} {"train_loss": -41.853515625, "global_step": 326927, "epoch": 2701} {"train_loss": -40.97308349609375, "global_step": 326928, "epoch": 2701} {"train_loss": -40.63521194458008, "global_step": 326929, "epoch": 2701} {"train_loss": -41.80155944824219, "global_step": 326930, "epoch": 2701} {"train_loss": -41.023250579833984, "global_step": 326931, "epoch": 2701} {"train_loss": -41.685054779052734, "global_step": 326932, "epoch": 2701} {"train_loss": -39.7115364074707, "global_step": 326933, "epoch": 2701} {"train_loss": -42.09269714355469, "global_step": 326934, "epoch": 2701} {"train_loss": -40.17549133300781, "global_step": 326935, "epoch": 2701} {"train_loss": -42.26408004760742, "global_step": 326936, "epoch": 2701} {"train_loss": -39.566829681396484, "global_step": 326937, "epoch": 2701} {"train_loss": -42.01262283325195, "global_step": 326938, "epoch": 2701} {"train_loss": -39.66436767578125, "global_step": 326939, "epoch": 2701} {"train_loss": -41.53815460205078, "global_step": 326940, "epoch": 2701} {"train_loss": -42.180930303148, "global_step": 326941, "epoch": 2701, "val_loss": 2501448.75} {"train_loss": -40.052974700927734, "global_step": 326942, "epoch": 2702} {"train_loss": -42.35834503173828, "global_step": 326943, "epoch": 2702} {"train_loss": -39.97407150268555, "global_step": 326944, "epoch": 2702} {"train_loss": -42.29193878173828, "global_step": 326945, "epoch": 2702} {"train_loss": -38.9350471496582, "global_step": 326946, "epoch": 2702} {"train_loss": -42.5484733581543, "global_step": 326947, "epoch": 2702} {"train_loss": -40.313961029052734, "global_step": 326948, "epoch": 2702} {"train_loss": -42.42366409301758, "global_step": 326949, "epoch": 2702} {"train_loss": -40.70589828491211, "global_step": 326950, "epoch": 2702} {"train_loss": -42.74445343017578, "global_step": 326951, "epoch": 2702} {"train_loss": -40.919952392578125, "global_step": 326952, "epoch": 2702} {"train_loss": -43.093990325927734, "global_step": 326953, "epoch": 2702} {"train_loss": -42.25634765625, "global_step": 326954, "epoch": 2702} {"train_loss": -42.810794830322266, "global_step": 326955, "epoch": 2702} {"train_loss": -43.08699417114258, "global_step": 326956, "epoch": 2702} {"train_loss": -42.86007308959961, "global_step": 326957, "epoch": 2702} {"train_loss": -43.0191650390625, "global_step": 326958, "epoch": 2702} {"train_loss": -42.90282440185547, "global_step": 326959, "epoch": 2702} {"train_loss": -43.051204681396484, "global_step": 326960, "epoch": 2702} {"train_loss": -43.092647552490234, "global_step": 326961, "epoch": 2702} {"train_loss": -43.57069778442383, "global_step": 326962, "epoch": 2702} {"train_loss": -42.44390869140625, "global_step": 326963, "epoch": 2702} {"train_loss": -43.72263717651367, "global_step": 326964, "epoch": 2702} {"train_loss": -43.381954193115234, "global_step": 326965, "epoch": 2702} {"train_loss": -43.83246994018555, "global_step": 326966, "epoch": 2702} {"train_loss": -43.44328308105469, "global_step": 326967, "epoch": 2702} {"train_loss": -43.795284271240234, "global_step": 326968, "epoch": 2702} {"train_loss": -43.64824295043945, "global_step": 326969, "epoch": 2702} {"train_loss": -43.79755401611328, "global_step": 326970, "epoch": 2702} {"train_loss": -43.41149139404297, "global_step": 326971, "epoch": 2702} {"train_loss": -44.189537048339844, "global_step": 326972, "epoch": 2702} {"train_loss": -43.790184020996094, "global_step": 326973, "epoch": 2702} {"train_loss": -43.53118896484375, "global_step": 326974, "epoch": 2702} {"train_loss": -43.74837875366211, "global_step": 326975, "epoch": 2702} {"train_loss": -43.82694625854492, "global_step": 326976, "epoch": 2702} {"train_loss": -44.037532806396484, "global_step": 326977, "epoch": 2702} {"train_loss": -43.58585739135742, "global_step": 326978, "epoch": 2702} {"train_loss": -43.217018127441406, "global_step": 326979, "epoch": 2702} {"train_loss": -43.9807243347168, "global_step": 326980, "epoch": 2702} {"train_loss": -44.02336502075195, "global_step": 326981, "epoch": 2702} {"train_loss": -43.86520767211914, "global_step": 326982, "epoch": 2702} {"train_loss": -44.162330627441406, "global_step": 326983, "epoch": 2702} {"train_loss": -44.28839111328125, "global_step": 326984, "epoch": 2702} {"train_loss": -44.2652587890625, "global_step": 326985, "epoch": 2702} {"train_loss": -44.273712158203125, "global_step": 326986, "epoch": 2702} {"train_loss": -44.36790084838867, "global_step": 326987, "epoch": 2702} {"train_loss": -44.32292938232422, "global_step": 326988, "epoch": 2702} {"train_loss": -44.333282470703125, "global_step": 326989, "epoch": 2702} {"train_loss": -43.93450927734375, "global_step": 326990, "epoch": 2702} {"train_loss": -44.485816955566406, "global_step": 326991, "epoch": 2702} {"train_loss": -44.04627227783203, "global_step": 326992, "epoch": 2702} {"train_loss": -44.39406967163086, "global_step": 326993, "epoch": 2702} {"train_loss": -43.7943229675293, "global_step": 326994, "epoch": 2702} {"train_loss": -44.395137786865234, "global_step": 326995, "epoch": 2702} {"train_loss": -44.36001205444336, "global_step": 326996, "epoch": 2702} {"train_loss": -44.166114807128906, "global_step": 326997, "epoch": 2702} {"train_loss": -44.50272750854492, "global_step": 326998, "epoch": 2702} {"train_loss": -43.92706298828125, "global_step": 326999, "epoch": 2702} {"train_loss": -43.62041473388672, "global_step": 327000, "epoch": 2702} {"train_loss": -43.8008918762207, "global_step": 327001, "epoch": 2702} {"train_loss": -44.21221923828125, "global_step": 327002, "epoch": 2702} {"train_loss": -44.760589599609375, "global_step": 327003, "epoch": 2702} {"train_loss": -44.35645294189453, "global_step": 327004, "epoch": 2702} {"train_loss": -43.957332611083984, "global_step": 327005, "epoch": 2702} {"train_loss": -43.250789642333984, "global_step": 327006, "epoch": 2702} {"train_loss": -41.853607177734375, "global_step": 327007, "epoch": 2702} {"train_loss": -38.58022689819336, "global_step": 327008, "epoch": 2702} {"train_loss": -35.004329681396484, "global_step": 327009, "epoch": 2702} {"train_loss": -36.79279708862305, "global_step": 327010, "epoch": 2702} {"train_loss": -41.382808685302734, "global_step": 327011, "epoch": 2702} {"train_loss": -43.14393997192383, "global_step": 327012, "epoch": 2702} {"train_loss": -42.66083908081055, "global_step": 327013, "epoch": 2702} {"train_loss": -42.43911361694336, "global_step": 327014, "epoch": 2702} {"train_loss": -43.842281341552734, "global_step": 327015, "epoch": 2702} {"train_loss": -42.612064361572266, "global_step": 327016, "epoch": 2702} {"train_loss": -42.13237380981445, "global_step": 327017, "epoch": 2702} {"train_loss": -42.00736999511719, "global_step": 327018, "epoch": 2702} {"train_loss": -43.257381439208984, "global_step": 327019, "epoch": 2702} {"train_loss": -43.08226013183594, "global_step": 327020, "epoch": 2702} {"train_loss": -42.56185531616211, "global_step": 327021, "epoch": 2702} {"train_loss": -44.088497161865234, "global_step": 327022, "epoch": 2702} {"train_loss": -41.74991989135742, "global_step": 327023, "epoch": 2702} {"train_loss": -41.622623443603516, "global_step": 327024, "epoch": 2702} {"train_loss": -43.68791580200195, "global_step": 327025, "epoch": 2702} {"train_loss": -42.91791915893555, "global_step": 327026, "epoch": 2702} {"train_loss": -42.27364730834961, "global_step": 327027, "epoch": 2702} {"train_loss": -43.20278549194336, "global_step": 327028, "epoch": 2702} {"train_loss": -43.11408996582031, "global_step": 327029, "epoch": 2702} {"train_loss": -41.504730224609375, "global_step": 327030, "epoch": 2702} {"train_loss": -43.5887336730957, "global_step": 327031, "epoch": 2702} {"train_loss": -41.42263412475586, "global_step": 327032, "epoch": 2702} {"train_loss": -41.559669494628906, "global_step": 327033, "epoch": 2702} {"train_loss": -43.238807678222656, "global_step": 327034, "epoch": 2702} {"train_loss": -41.72865676879883, "global_step": 327035, "epoch": 2702} {"train_loss": -41.799705505371094, "global_step": 327036, "epoch": 2702} {"train_loss": -42.64685821533203, "global_step": 327037, "epoch": 2702} {"train_loss": -42.19070816040039, "global_step": 327038, "epoch": 2702} {"train_loss": -42.969661712646484, "global_step": 327039, "epoch": 2702} {"train_loss": -43.32069396972656, "global_step": 327040, "epoch": 2702} {"train_loss": -43.37543487548828, "global_step": 327041, "epoch": 2702} {"train_loss": -42.504058837890625, "global_step": 327042, "epoch": 2702} {"train_loss": -42.772857666015625, "global_step": 327043, "epoch": 2702} {"train_loss": -43.56471633911133, "global_step": 327044, "epoch": 2702} {"train_loss": -43.56074142456055, "global_step": 327045, "epoch": 2702} {"train_loss": -42.80256271362305, "global_step": 327046, "epoch": 2702} {"train_loss": -41.65558624267578, "global_step": 327047, "epoch": 2702} {"train_loss": -42.39457321166992, "global_step": 327048, "epoch": 2702} {"train_loss": -43.662818908691406, "global_step": 327049, "epoch": 2702} {"train_loss": -42.275978088378906, "global_step": 327050, "epoch": 2702} {"train_loss": -42.22089767456055, "global_step": 327051, "epoch": 2702} {"train_loss": -42.65644454956055, "global_step": 327052, "epoch": 2702} {"train_loss": -42.73384475708008, "global_step": 327053, "epoch": 2702} {"train_loss": -42.58286666870117, "global_step": 327054, "epoch": 2702} {"train_loss": -42.676883697509766, "global_step": 327055, "epoch": 2702} {"train_loss": -42.15019989013672, "global_step": 327056, "epoch": 2702} {"train_loss": -38.838130950927734, "global_step": 327057, "epoch": 2702} {"train_loss": -44.17505645751953, "global_step": 327058, "epoch": 2702} {"train_loss": -42.75879669189453, "global_step": 327059, "epoch": 2702} {"train_loss": -43.541351318359375, "global_step": 327060, "epoch": 2702} {"train_loss": -43.2843017578125, "global_step": 327061, "epoch": 2702} {"train_loss": -42.84281924539361, "global_step": 327062, "epoch": 2702, "val_loss": 2515375.25} {"train_loss": -43.46311569213867, "global_step": 327063, "epoch": 2703} {"train_loss": -43.286590576171875, "global_step": 327064, "epoch": 2703} {"train_loss": -43.5080451965332, "global_step": 327065, "epoch": 2703} {"train_loss": -43.49613952636719, "global_step": 327066, "epoch": 2703} {"train_loss": -43.79779052734375, "global_step": 327067, "epoch": 2703} {"train_loss": -43.79582595825195, "global_step": 327068, "epoch": 2703} {"train_loss": -43.66057205200195, "global_step": 327069, "epoch": 2703} {"train_loss": -43.63560104370117, "global_step": 327070, "epoch": 2703} {"train_loss": -43.046478271484375, "global_step": 327071, "epoch": 2703} {"train_loss": -43.84995651245117, "global_step": 327072, "epoch": 2703} {"train_loss": -43.26142120361328, "global_step": 327073, "epoch": 2703} {"train_loss": -43.07139205932617, "global_step": 327074, "epoch": 2703} {"train_loss": -41.35633087158203, "global_step": 327075, "epoch": 2703} {"train_loss": -43.81858444213867, "global_step": 327076, "epoch": 2703} {"train_loss": -43.530662536621094, "global_step": 327077, "epoch": 2703} {"train_loss": -43.73974609375, "global_step": 327078, "epoch": 2703} {"train_loss": -41.78758239746094, "global_step": 327079, "epoch": 2703} {"train_loss": -43.26613235473633, "global_step": 327080, "epoch": 2703} {"train_loss": -43.5920295715332, "global_step": 327081, "epoch": 2703} {"train_loss": -43.82819366455078, "global_step": 327082, "epoch": 2703} {"train_loss": -43.716033935546875, "global_step": 327083, "epoch": 2703} {"train_loss": -43.85390853881836, "global_step": 327084, "epoch": 2703} {"train_loss": -42.734134674072266, "global_step": 327085, "epoch": 2703} {"train_loss": -42.85710906982422, "global_step": 327086, "epoch": 2703} {"train_loss": -43.644344329833984, "global_step": 327087, "epoch": 2703} {"train_loss": -43.13448715209961, "global_step": 327088, "epoch": 2703} {"train_loss": -43.312896728515625, "global_step": 327089, "epoch": 2703} {"train_loss": -42.29446792602539, "global_step": 327090, "epoch": 2703} {"train_loss": -43.69239807128906, "global_step": 327091, "epoch": 2703} {"train_loss": -43.125701904296875, "global_step": 327092, "epoch": 2703} {"train_loss": -43.3896369934082, "global_step": 327093, "epoch": 2703} {"train_loss": -44.217369079589844, "global_step": 327094, "epoch": 2703} {"train_loss": -43.566673278808594, "global_step": 327095, "epoch": 2703} {"train_loss": -43.54623031616211, "global_step": 327096, "epoch": 2703} {"train_loss": -44.208526611328125, "global_step": 327097, "epoch": 2703} {"train_loss": -43.868350982666016, "global_step": 327098, "epoch": 2703} {"train_loss": -43.963008880615234, "global_step": 327099, "epoch": 2703} {"train_loss": -35.83315658569336, "global_step": 327100, "epoch": 2703} {"train_loss": -43.99415588378906, "global_step": 327101, "epoch": 2703} {"train_loss": -42.83345413208008, "global_step": 327102, "epoch": 2703} {"train_loss": -43.71295166015625, "global_step": 327103, "epoch": 2703} {"train_loss": -43.98091506958008, "global_step": 327104, "epoch": 2703} {"train_loss": -43.790679931640625, "global_step": 327105, "epoch": 2703} {"train_loss": -42.258201599121094, "global_step": 327106, "epoch": 2703} {"train_loss": -44.05248260498047, "global_step": 327107, "epoch": 2703} {"train_loss": -44.54384994506836, "global_step": 327108, "epoch": 2703} {"train_loss": -43.985015869140625, "global_step": 327109, "epoch": 2703} {"train_loss": -43.382179260253906, "global_step": 327110, "epoch": 2703} {"train_loss": -43.745574951171875, "global_step": 327111, "epoch": 2703} {"train_loss": -42.41495895385742, "global_step": 327112, "epoch": 2703} {"train_loss": -42.91817855834961, "global_step": 327113, "epoch": 2703} {"train_loss": -42.87860107421875, "global_step": 327114, "epoch": 2703} {"train_loss": -42.6844482421875, "global_step": 327115, "epoch": 2703} {"train_loss": -42.79229736328125, "global_step": 327116, "epoch": 2703} {"train_loss": -43.51097869873047, "global_step": 327117, "epoch": 2703} {"train_loss": -43.744869232177734, "global_step": 327118, "epoch": 2703} {"train_loss": -35.71089553833008, "global_step": 327119, "epoch": 2703} {"train_loss": -39.707855224609375, "global_step": 327120, "epoch": 2703} {"train_loss": -41.50815963745117, "global_step": 327121, "epoch": 2703} {"train_loss": -40.85260772705078, "global_step": 327122, "epoch": 2703} {"train_loss": -42.691307067871094, "global_step": 327123, "epoch": 2703} {"train_loss": -42.07009506225586, "global_step": 327124, "epoch": 2703} {"train_loss": -38.90974426269531, "global_step": 327125, "epoch": 2703} {"train_loss": -42.75452423095703, "global_step": 327126, "epoch": 2703} {"train_loss": -41.56489181518555, "global_step": 327127, "epoch": 2703} {"train_loss": -42.14044189453125, "global_step": 327128, "epoch": 2703} {"train_loss": -41.40841293334961, "global_step": 327129, "epoch": 2703} {"train_loss": -40.23940658569336, "global_step": 327130, "epoch": 2703} {"train_loss": -40.15605163574219, "global_step": 327131, "epoch": 2703} {"train_loss": -41.56940460205078, "global_step": 327132, "epoch": 2703} {"train_loss": -30.64313316345215, "global_step": 327133, "epoch": 2703} {"train_loss": -37.52033615112305, "global_step": 327134, "epoch": 2703} {"train_loss": -35.249568939208984, "global_step": 327135, "epoch": 2703} {"train_loss": -40.76398849487305, "global_step": 327136, "epoch": 2703} {"train_loss": -40.84788131713867, "global_step": 327137, "epoch": 2703} {"train_loss": -40.1968994140625, "global_step": 327138, "epoch": 2703} {"train_loss": -38.014259338378906, "global_step": 327139, "epoch": 2703} {"train_loss": -38.274993896484375, "global_step": 327140, "epoch": 2703} {"train_loss": -41.504329681396484, "global_step": 327141, "epoch": 2703} {"train_loss": -39.43284225463867, "global_step": 327142, "epoch": 2703} {"train_loss": -41.550819396972656, "global_step": 327143, "epoch": 2703} {"train_loss": -40.91634750366211, "global_step": 327144, "epoch": 2703} {"train_loss": -39.26554489135742, "global_step": 327145, "epoch": 2703} {"train_loss": -38.38169479370117, "global_step": 327146, "epoch": 2703} {"train_loss": -37.840572357177734, "global_step": 327147, "epoch": 2703} {"train_loss": -38.66773223876953, "global_step": 327148, "epoch": 2703} {"train_loss": -39.96128463745117, "global_step": 327149, "epoch": 2703} {"train_loss": -35.94860076904297, "global_step": 327150, "epoch": 2703} {"train_loss": -41.576904296875, "global_step": 327151, "epoch": 2703} {"train_loss": -38.34133529663086, "global_step": 327152, "epoch": 2703} {"train_loss": -40.6103401184082, "global_step": 327153, "epoch": 2703} {"train_loss": -40.8807258605957, "global_step": 327154, "epoch": 2703} {"train_loss": -40.649322509765625, "global_step": 327155, "epoch": 2703} {"train_loss": -38.87866973876953, "global_step": 327156, "epoch": 2703} {"train_loss": -41.4318962097168, "global_step": 327157, "epoch": 2703} {"train_loss": -40.36835861206055, "global_step": 327158, "epoch": 2703} {"train_loss": -38.8525505065918, "global_step": 327159, "epoch": 2703} {"train_loss": -41.33222198486328, "global_step": 327160, "epoch": 2703} {"train_loss": -40.64316940307617, "global_step": 327161, "epoch": 2703} {"train_loss": -41.957881927490234, "global_step": 327162, "epoch": 2703} {"train_loss": -40.66123580932617, "global_step": 327163, "epoch": 2703} {"train_loss": -40.55312728881836, "global_step": 327164, "epoch": 2703} {"train_loss": -42.428043365478516, "global_step": 327165, "epoch": 2703} {"train_loss": -41.759307861328125, "global_step": 327166, "epoch": 2703} {"train_loss": -40.79526901245117, "global_step": 327167, "epoch": 2703} {"train_loss": -40.1689338684082, "global_step": 327168, "epoch": 2703} {"train_loss": -39.92280197143555, "global_step": 327169, "epoch": 2703} {"train_loss": -42.508575439453125, "global_step": 327170, "epoch": 2703} {"train_loss": -42.70878219604492, "global_step": 327171, "epoch": 2703} {"train_loss": -42.40998077392578, "global_step": 327172, "epoch": 2703} {"train_loss": -41.92086410522461, "global_step": 327173, "epoch": 2703} {"train_loss": -42.047218322753906, "global_step": 327174, "epoch": 2703} {"train_loss": -41.93524169921875, "global_step": 327175, "epoch": 2703} {"train_loss": -39.4897575378418, "global_step": 327176, "epoch": 2703} {"train_loss": -42.281272888183594, "global_step": 327177, "epoch": 2703} {"train_loss": -42.602989196777344, "global_step": 327178, "epoch": 2703} {"train_loss": -42.3150520324707, "global_step": 327179, "epoch": 2703} {"train_loss": -42.31264877319336, "global_step": 327180, "epoch": 2703} {"train_loss": -42.70248031616211, "global_step": 327181, "epoch": 2703} {"train_loss": -41.82857894897461, "global_step": 327182, "epoch": 2703} {"train_loss": -41.729603144748154, "global_step": 327183, "epoch": 2703, "val_loss": 2522403.25} {"train_loss": -42.4252815246582, "global_step": 327184, "epoch": 2704} {"train_loss": -41.8436164855957, "global_step": 327185, "epoch": 2704} {"train_loss": -42.40815353393555, "global_step": 327186, "epoch": 2704} {"train_loss": -42.04874801635742, "global_step": 327187, "epoch": 2704} {"train_loss": -41.70430374145508, "global_step": 327188, "epoch": 2704} {"train_loss": -41.91962814331055, "global_step": 327189, "epoch": 2704} {"train_loss": -42.457820892333984, "global_step": 327190, "epoch": 2704} {"train_loss": -41.69001770019531, "global_step": 327191, "epoch": 2704} {"train_loss": -42.68635940551758, "global_step": 327192, "epoch": 2704} {"train_loss": -42.474449157714844, "global_step": 327193, "epoch": 2704} {"train_loss": -42.0325813293457, "global_step": 327194, "epoch": 2704} {"train_loss": -41.71294021606445, "global_step": 327195, "epoch": 2704} {"train_loss": -42.15373229980469, "global_step": 327196, "epoch": 2704} {"train_loss": -42.05491256713867, "global_step": 327197, "epoch": 2704} {"train_loss": -41.27669906616211, "global_step": 327198, "epoch": 2704} {"train_loss": -42.0965461730957, "global_step": 327199, "epoch": 2704} {"train_loss": -42.99863815307617, "global_step": 327200, "epoch": 2704} {"train_loss": -42.399471282958984, "global_step": 327201, "epoch": 2704} {"train_loss": -42.72492599487305, "global_step": 327202, "epoch": 2704} {"train_loss": -42.51520919799805, "global_step": 327203, "epoch": 2704} {"train_loss": -42.72034454345703, "global_step": 327204, "epoch": 2704} {"train_loss": -43.3336296081543, "global_step": 327205, "epoch": 2704} {"train_loss": -41.33026885986328, "global_step": 327206, "epoch": 2704} {"train_loss": -43.2667121887207, "global_step": 327207, "epoch": 2704} {"train_loss": -42.99391555786133, "global_step": 327208, "epoch": 2704} {"train_loss": -41.75260543823242, "global_step": 327209, "epoch": 2704} {"train_loss": -43.127838134765625, "global_step": 327210, "epoch": 2704} {"train_loss": -42.23578643798828, "global_step": 327211, "epoch": 2704} {"train_loss": -42.07655715942383, "global_step": 327212, "epoch": 2704} {"train_loss": -43.1002311706543, "global_step": 327213, "epoch": 2704} {"train_loss": -42.8922233581543, "global_step": 327214, "epoch": 2704} {"train_loss": -41.840816497802734, "global_step": 327215, "epoch": 2704} {"train_loss": -42.64483642578125, "global_step": 327216, "epoch": 2704} {"train_loss": -43.20417404174805, "global_step": 327217, "epoch": 2704} {"train_loss": -43.266212463378906, "global_step": 327218, "epoch": 2704} {"train_loss": -43.14652633666992, "global_step": 327219, "epoch": 2704} {"train_loss": -42.06980514526367, "global_step": 327220, "epoch": 2704} {"train_loss": -43.598602294921875, "global_step": 327221, "epoch": 2704} {"train_loss": -43.63246536254883, "global_step": 327222, "epoch": 2704} {"train_loss": -43.70058059692383, "global_step": 327223, "epoch": 2704} {"train_loss": -43.500789642333984, "global_step": 327224, "epoch": 2704} {"train_loss": -43.059326171875, "global_step": 327225, "epoch": 2704} {"train_loss": -43.47011947631836, "global_step": 327226, "epoch": 2704} {"train_loss": -43.40793991088867, "global_step": 327227, "epoch": 2704} {"train_loss": -43.942108154296875, "global_step": 327228, "epoch": 2704} {"train_loss": -43.82023239135742, "global_step": 327229, "epoch": 2704} {"train_loss": -43.52804946899414, "global_step": 327230, "epoch": 2704} {"train_loss": -43.28455352783203, "global_step": 327231, "epoch": 2704} {"train_loss": -42.729854583740234, "global_step": 327232, "epoch": 2704} {"train_loss": -43.5410270690918, "global_step": 327233, "epoch": 2704} {"train_loss": -43.62002182006836, "global_step": 327234, "epoch": 2704} {"train_loss": -43.985687255859375, "global_step": 327235, "epoch": 2704} {"train_loss": -43.70435333251953, "global_step": 327236, "epoch": 2704} {"train_loss": -43.90528106689453, "global_step": 327237, "epoch": 2704} {"train_loss": -42.82529830932617, "global_step": 327238, "epoch": 2704} {"train_loss": -43.2783317565918, "global_step": 327239, "epoch": 2704} {"train_loss": -43.55315017700195, "global_step": 327240, "epoch": 2704} {"train_loss": -43.3003044128418, "global_step": 327241, "epoch": 2704} {"train_loss": -41.394935607910156, "global_step": 327242, "epoch": 2704} {"train_loss": -43.66765213012695, "global_step": 327243, "epoch": 2704} {"train_loss": -44.24331283569336, "global_step": 327244, "epoch": 2704} {"train_loss": -44.05742263793945, "global_step": 327245, "epoch": 2704} {"train_loss": -43.03561019897461, "global_step": 327246, "epoch": 2704} {"train_loss": -43.7764892578125, "global_step": 327247, "epoch": 2704} {"train_loss": -43.3032341003418, "global_step": 327248, "epoch": 2704} {"train_loss": -41.695770263671875, "global_step": 327249, "epoch": 2704} {"train_loss": -43.2158088684082, "global_step": 327250, "epoch": 2704} {"train_loss": -43.867244720458984, "global_step": 327251, "epoch": 2704} {"train_loss": -43.5716667175293, "global_step": 327252, "epoch": 2704} {"train_loss": -44.152503967285156, "global_step": 327253, "epoch": 2704} {"train_loss": -43.49404525756836, "global_step": 327254, "epoch": 2704} {"train_loss": -43.848419189453125, "global_step": 327255, "epoch": 2704} {"train_loss": -43.925209045410156, "global_step": 327256, "epoch": 2704} {"train_loss": -43.842201232910156, "global_step": 327257, "epoch": 2704} {"train_loss": -43.9889030456543, "global_step": 327258, "epoch": 2704} {"train_loss": -44.14174270629883, "global_step": 327259, "epoch": 2704} {"train_loss": -44.45185852050781, "global_step": 327260, "epoch": 2704} {"train_loss": -43.57509994506836, "global_step": 327261, "epoch": 2704} {"train_loss": -43.916748046875, "global_step": 327262, "epoch": 2704} {"train_loss": -43.73405838012695, "global_step": 327263, "epoch": 2704} {"train_loss": -43.8736457824707, "global_step": 327264, "epoch": 2704} {"train_loss": -43.8553352355957, "global_step": 327265, "epoch": 2704} {"train_loss": -43.038082122802734, "global_step": 327266, "epoch": 2704} {"train_loss": -43.64927291870117, "global_step": 327267, "epoch": 2704} {"train_loss": -44.00094223022461, "global_step": 327268, "epoch": 2704} {"train_loss": -43.77400588989258, "global_step": 327269, "epoch": 2704} {"train_loss": -43.50107192993164, "global_step": 327270, "epoch": 2704} {"train_loss": -42.63507080078125, "global_step": 327271, "epoch": 2704} {"train_loss": -43.51375198364258, "global_step": 327272, "epoch": 2704} {"train_loss": -43.35459518432617, "global_step": 327273, "epoch": 2704} {"train_loss": -43.40974807739258, "global_step": 327274, "epoch": 2704} {"train_loss": -43.769081115722656, "global_step": 327275, "epoch": 2704} {"train_loss": -43.39764404296875, "global_step": 327276, "epoch": 2704} {"train_loss": -43.761444091796875, "global_step": 327277, "epoch": 2704} {"train_loss": -43.64691925048828, "global_step": 327278, "epoch": 2704} {"train_loss": -43.36178207397461, "global_step": 327279, "epoch": 2704} {"train_loss": -43.153541564941406, "global_step": 327280, "epoch": 2704} {"train_loss": -39.285823822021484, "global_step": 327281, "epoch": 2704} {"train_loss": -34.34199142456055, "global_step": 327282, "epoch": 2704} {"train_loss": -39.55458450317383, "global_step": 327283, "epoch": 2704} {"train_loss": -42.2652473449707, "global_step": 327284, "epoch": 2704} {"train_loss": -37.38133239746094, "global_step": 327285, "epoch": 2704} {"train_loss": -35.417476654052734, "global_step": 327286, "epoch": 2704} {"train_loss": -41.73659896850586, "global_step": 327287, "epoch": 2704} {"train_loss": -37.57929611206055, "global_step": 327288, "epoch": 2704} {"train_loss": -33.527462005615234, "global_step": 327289, "epoch": 2704} {"train_loss": -35.64239501953125, "global_step": 327290, "epoch": 2704} {"train_loss": -41.284461975097656, "global_step": 327291, "epoch": 2704} {"train_loss": -32.100276947021484, "global_step": 327292, "epoch": 2704} {"train_loss": -37.76529312133789, "global_step": 327293, "epoch": 2704} {"train_loss": -40.75510787963867, "global_step": 327294, "epoch": 2704} {"train_loss": -39.62276840209961, "global_step": 327295, "epoch": 2704} {"train_loss": -40.534263610839844, "global_step": 327296, "epoch": 2704} {"train_loss": -38.031394958496094, "global_step": 327297, "epoch": 2704} {"train_loss": -40.05561447143555, "global_step": 327298, "epoch": 2704} {"train_loss": -40.50965118408203, "global_step": 327299, "epoch": 2704} {"train_loss": -40.812042236328125, "global_step": 327300, "epoch": 2704} {"train_loss": -41.05390930175781, "global_step": 327301, "epoch": 2704} {"train_loss": -40.86224365234375, "global_step": 327302, "epoch": 2704} {"train_loss": -41.066864013671875, "global_step": 327303, "epoch": 2704} {"train_loss": -42.247163945978336, "global_step": 327304, "epoch": 2704, "val_loss": 2674708.75} {"train_loss": -41.916744232177734, "global_step": 327305, "epoch": 2705} {"train_loss": -40.1412467956543, "global_step": 327306, "epoch": 2705} {"train_loss": -42.10060501098633, "global_step": 327307, "epoch": 2705} {"train_loss": -41.39673614501953, "global_step": 327308, "epoch": 2705} {"train_loss": -41.5853385925293, "global_step": 327309, "epoch": 2705} {"train_loss": -42.713592529296875, "global_step": 327310, "epoch": 2705} {"train_loss": -40.102718353271484, "global_step": 327311, "epoch": 2705} {"train_loss": -42.39696502685547, "global_step": 327312, "epoch": 2705} {"train_loss": -42.89017868041992, "global_step": 327313, "epoch": 2705} {"train_loss": -42.59700012207031, "global_step": 327314, "epoch": 2705} {"train_loss": -42.70306396484375, "global_step": 327315, "epoch": 2705} {"train_loss": -42.160579681396484, "global_step": 327316, "epoch": 2705} {"train_loss": -42.80006790161133, "global_step": 327317, "epoch": 2705} {"train_loss": -42.4027099609375, "global_step": 327318, "epoch": 2705} {"train_loss": -42.16665267944336, "global_step": 327319, "epoch": 2705} {"train_loss": -43.14898681640625, "global_step": 327320, "epoch": 2705} {"train_loss": -42.82466506958008, "global_step": 327321, "epoch": 2705} {"train_loss": -42.34772872924805, "global_step": 327322, "epoch": 2705} {"train_loss": -43.05146408081055, "global_step": 327323, "epoch": 2705} {"train_loss": -43.33134078979492, "global_step": 327324, "epoch": 2705} {"train_loss": -42.844852447509766, "global_step": 327325, "epoch": 2705} {"train_loss": -43.07577896118164, "global_step": 327326, "epoch": 2705} {"train_loss": -42.20882797241211, "global_step": 327327, "epoch": 2705} {"train_loss": -42.815399169921875, "global_step": 327328, "epoch": 2705} {"train_loss": -43.5739631652832, "global_step": 327329, "epoch": 2705} {"train_loss": -43.51719284057617, "global_step": 327330, "epoch": 2705} {"train_loss": -43.613040924072266, "global_step": 327331, "epoch": 2705} {"train_loss": -43.548980712890625, "global_step": 327332, "epoch": 2705} {"train_loss": -43.18864059448242, "global_step": 327333, "epoch": 2705} {"train_loss": -43.101661682128906, "global_step": 327334, "epoch": 2705} {"train_loss": -43.0602912902832, "global_step": 327335, "epoch": 2705} {"train_loss": -43.69173049926758, "global_step": 327336, "epoch": 2705} {"train_loss": -43.73320388793945, "global_step": 327337, "epoch": 2705} {"train_loss": -43.608299255371094, "global_step": 327338, "epoch": 2705} {"train_loss": -43.17470169067383, "global_step": 327339, "epoch": 2705} {"train_loss": -43.8298454284668, "global_step": 327340, "epoch": 2705} {"train_loss": -44.32473373413086, "global_step": 327341, "epoch": 2705} {"train_loss": -43.57748031616211, "global_step": 327342, "epoch": 2705} {"train_loss": -43.56101608276367, "global_step": 327343, "epoch": 2705} {"train_loss": -44.03685760498047, "global_step": 327344, "epoch": 2705} {"train_loss": -44.155452728271484, "global_step": 327345, "epoch": 2705} {"train_loss": -44.17940902709961, "global_step": 327346, "epoch": 2705} {"train_loss": -43.8584098815918, "global_step": 327347, "epoch": 2705} {"train_loss": -44.43037796020508, "global_step": 327348, "epoch": 2705} {"train_loss": -43.953460693359375, "global_step": 327349, "epoch": 2705} {"train_loss": -43.785301208496094, "global_step": 327350, "epoch": 2705} {"train_loss": -44.00458908081055, "global_step": 327351, "epoch": 2705} {"train_loss": -43.70786666870117, "global_step": 327352, "epoch": 2705} {"train_loss": -44.41083908081055, "global_step": 327353, "epoch": 2705} {"train_loss": -43.592628479003906, "global_step": 327354, "epoch": 2705} {"train_loss": -44.0725212097168, "global_step": 327355, "epoch": 2705} {"train_loss": -44.3397102355957, "global_step": 327356, "epoch": 2705} {"train_loss": -43.76674270629883, "global_step": 327357, "epoch": 2705} {"train_loss": -43.603206634521484, "global_step": 327358, "epoch": 2705} {"train_loss": -44.20829772949219, "global_step": 327359, "epoch": 2705} {"train_loss": -42.16353988647461, "global_step": 327360, "epoch": 2705} {"train_loss": -44.50423049926758, "global_step": 327361, "epoch": 2705} {"train_loss": -44.27299118041992, "global_step": 327362, "epoch": 2705} {"train_loss": -43.75928497314453, "global_step": 327363, "epoch": 2705} {"train_loss": -43.825653076171875, "global_step": 327364, "epoch": 2705} {"train_loss": -41.861427307128906, "global_step": 327365, "epoch": 2705} {"train_loss": -44.344234466552734, "global_step": 327366, "epoch": 2705} {"train_loss": -44.61555480957031, "global_step": 327367, "epoch": 2705} {"train_loss": -44.18342208862305, "global_step": 327368, "epoch": 2705} {"train_loss": -44.02500534057617, "global_step": 327369, "epoch": 2705} {"train_loss": -44.34498977661133, "global_step": 327370, "epoch": 2705} {"train_loss": -44.33776092529297, "global_step": 327371, "epoch": 2705} {"train_loss": -44.048248291015625, "global_step": 327372, "epoch": 2705} {"train_loss": -44.88176345825195, "global_step": 327373, "epoch": 2705} {"train_loss": -44.26321029663086, "global_step": 327374, "epoch": 2705} {"train_loss": -44.761512756347656, "global_step": 327375, "epoch": 2705} {"train_loss": -45.04243850708008, "global_step": 327376, "epoch": 2705} {"train_loss": -44.625465393066406, "global_step": 327377, "epoch": 2705} {"train_loss": -44.691890716552734, "global_step": 327378, "epoch": 2705} {"train_loss": -44.48114013671875, "global_step": 327379, "epoch": 2705} {"train_loss": -43.47861862182617, "global_step": 327380, "epoch": 2705} {"train_loss": -42.073150634765625, "global_step": 327381, "epoch": 2705} {"train_loss": -37.7855339050293, "global_step": 327382, "epoch": 2705} {"train_loss": -35.05827713012695, "global_step": 327383, "epoch": 2705} {"train_loss": -34.528236389160156, "global_step": 327384, "epoch": 2705} {"train_loss": -38.0322151184082, "global_step": 327385, "epoch": 2705} {"train_loss": -42.89352035522461, "global_step": 327386, "epoch": 2705} {"train_loss": -40.53849792480469, "global_step": 327387, "epoch": 2705} {"train_loss": -34.85724639892578, "global_step": 327388, "epoch": 2705} {"train_loss": -39.88690948486328, "global_step": 327389, "epoch": 2705} {"train_loss": -42.97679138183594, "global_step": 327390, "epoch": 2705} {"train_loss": -41.461830139160156, "global_step": 327391, "epoch": 2705} {"train_loss": -42.544918060302734, "global_step": 327392, "epoch": 2705} {"train_loss": -42.33795928955078, "global_step": 327393, "epoch": 2705} {"train_loss": -41.690757751464844, "global_step": 327394, "epoch": 2705} {"train_loss": -42.8248291015625, "global_step": 327395, "epoch": 2705} {"train_loss": -43.15836715698242, "global_step": 327396, "epoch": 2705} {"train_loss": -42.99638748168945, "global_step": 327397, "epoch": 2705} {"train_loss": -42.862972259521484, "global_step": 327398, "epoch": 2705} {"train_loss": -42.86867141723633, "global_step": 327399, "epoch": 2705} {"train_loss": -43.24223327636719, "global_step": 327400, "epoch": 2705} {"train_loss": -43.09021759033203, "global_step": 327401, "epoch": 2705} {"train_loss": -42.7442741394043, "global_step": 327402, "epoch": 2705} {"train_loss": -42.891910552978516, "global_step": 327403, "epoch": 2705} {"train_loss": -42.245262145996094, "global_step": 327404, "epoch": 2705} {"train_loss": -43.625892639160156, "global_step": 327405, "epoch": 2705} {"train_loss": -42.40236282348633, "global_step": 327406, "epoch": 2705} {"train_loss": -43.201358795166016, "global_step": 327407, "epoch": 2705} {"train_loss": -42.778663635253906, "global_step": 327408, "epoch": 2705} {"train_loss": -43.668575286865234, "global_step": 327409, "epoch": 2705} {"train_loss": -42.77567672729492, "global_step": 327410, "epoch": 2705} {"train_loss": -43.45722579956055, "global_step": 327411, "epoch": 2705} {"train_loss": -43.25449752807617, "global_step": 327412, "epoch": 2705} {"train_loss": -42.9036979675293, "global_step": 327413, "epoch": 2705} {"train_loss": -43.22384262084961, "global_step": 327414, "epoch": 2705} {"train_loss": -43.49410629272461, "global_step": 327415, "epoch": 2705} {"train_loss": -43.87229537963867, "global_step": 327416, "epoch": 2705} {"train_loss": -43.828365325927734, "global_step": 327417, "epoch": 2705} {"train_loss": -44.21201705932617, "global_step": 327418, "epoch": 2705} {"train_loss": -43.77384567260742, "global_step": 327419, "epoch": 2705} {"train_loss": -43.65330123901367, "global_step": 327420, "epoch": 2705} {"train_loss": -43.97168731689453, "global_step": 327421, "epoch": 2705} {"train_loss": -44.32991409301758, "global_step": 327422, "epoch": 2705} {"train_loss": -43.85398483276367, "global_step": 327423, "epoch": 2705} {"train_loss": -43.320533752441406, "global_step": 327424, "epoch": 2705} {"train_loss": -42.96731939394612, "global_step": 327425, "epoch": 2705, "val_loss": 2542297.5} {"train_loss": -44.009185791015625, "global_step": 327426, "epoch": 2706} {"train_loss": -44.73259353637695, "global_step": 327427, "epoch": 2706} {"train_loss": -44.25920486450195, "global_step": 327428, "epoch": 2706} {"train_loss": -43.73188400268555, "global_step": 327429, "epoch": 2706} {"train_loss": -44.21841812133789, "global_step": 327430, "epoch": 2706} {"train_loss": -44.449378967285156, "global_step": 327431, "epoch": 2706} {"train_loss": -44.14567184448242, "global_step": 327432, "epoch": 2706} {"train_loss": -44.355712890625, "global_step": 327433, "epoch": 2706} {"train_loss": -44.64640426635742, "global_step": 327434, "epoch": 2706} {"train_loss": -44.363807678222656, "global_step": 327435, "epoch": 2706} {"train_loss": -44.614376068115234, "global_step": 327436, "epoch": 2706} {"train_loss": -44.17495346069336, "global_step": 327437, "epoch": 2706} {"train_loss": -43.68498611450195, "global_step": 327438, "epoch": 2706} {"train_loss": -44.561767578125, "global_step": 327439, "epoch": 2706} {"train_loss": -44.233638763427734, "global_step": 327440, "epoch": 2706} {"train_loss": -44.31870651245117, "global_step": 327441, "epoch": 2706} {"train_loss": -44.591026306152344, "global_step": 327442, "epoch": 2706} {"train_loss": -44.46403121948242, "global_step": 327443, "epoch": 2706} {"train_loss": -44.65597152709961, "global_step": 327444, "epoch": 2706} {"train_loss": -43.78833770751953, "global_step": 327445, "epoch": 2706} {"train_loss": -44.18033981323242, "global_step": 327446, "epoch": 2706} {"train_loss": -43.70093536376953, "global_step": 327447, "epoch": 2706} {"train_loss": -43.9462890625, "global_step": 327448, "epoch": 2706} {"train_loss": -42.28290939331055, "global_step": 327449, "epoch": 2706} {"train_loss": -43.53052520751953, "global_step": 327450, "epoch": 2706} {"train_loss": -42.745399475097656, "global_step": 327451, "epoch": 2706} {"train_loss": -42.49544906616211, "global_step": 327452, "epoch": 2706} {"train_loss": -43.27534103393555, "global_step": 327453, "epoch": 2706} {"train_loss": -43.129859924316406, "global_step": 327454, "epoch": 2706} {"train_loss": -44.35677719116211, "global_step": 327455, "epoch": 2706} {"train_loss": -43.44131088256836, "global_step": 327456, "epoch": 2706} {"train_loss": -37.335472106933594, "global_step": 327457, "epoch": 2706} {"train_loss": -43.1335563659668, "global_step": 327458, "epoch": 2706} {"train_loss": -42.065765380859375, "global_step": 327459, "epoch": 2706} {"train_loss": -41.578285217285156, "global_step": 327460, "epoch": 2706} {"train_loss": -41.821006774902344, "global_step": 327461, "epoch": 2706} {"train_loss": -39.64968490600586, "global_step": 327462, "epoch": 2706} {"train_loss": -36.972686767578125, "global_step": 327463, "epoch": 2706} {"train_loss": -41.06425094604492, "global_step": 327464, "epoch": 2706} {"train_loss": -42.26484298706055, "global_step": 327465, "epoch": 2706} {"train_loss": -43.266502380371094, "global_step": 327466, "epoch": 2706} {"train_loss": -41.817832946777344, "global_step": 327467, "epoch": 2706} {"train_loss": -40.39790344238281, "global_step": 327468, "epoch": 2706} {"train_loss": -40.52236557006836, "global_step": 327469, "epoch": 2706} {"train_loss": -40.46616744995117, "global_step": 327470, "epoch": 2706} {"train_loss": -39.857486724853516, "global_step": 327471, "epoch": 2706} {"train_loss": -40.12614059448242, "global_step": 327472, "epoch": 2706} {"train_loss": -41.156795501708984, "global_step": 327473, "epoch": 2706} {"train_loss": -42.089900970458984, "global_step": 327474, "epoch": 2706} {"train_loss": -37.169593811035156, "global_step": 327475, "epoch": 2706} {"train_loss": -40.484130859375, "global_step": 327476, "epoch": 2706} {"train_loss": -40.394142150878906, "global_step": 327477, "epoch": 2706} {"train_loss": -41.440914154052734, "global_step": 327478, "epoch": 2706} {"train_loss": -42.27786636352539, "global_step": 327479, "epoch": 2706} {"train_loss": -41.142005920410156, "global_step": 327480, "epoch": 2706} {"train_loss": -41.960201263427734, "global_step": 327481, "epoch": 2706} {"train_loss": -41.08308029174805, "global_step": 327482, "epoch": 2706} {"train_loss": -39.17914962768555, "global_step": 327483, "epoch": 2706} {"train_loss": -39.82283401489258, "global_step": 327484, "epoch": 2706} {"train_loss": -32.018341064453125, "global_step": 327485, "epoch": 2706} {"train_loss": -39.08720016479492, "global_step": 327486, "epoch": 2706} {"train_loss": -42.57353591918945, "global_step": 327487, "epoch": 2706} {"train_loss": -38.75674057006836, "global_step": 327488, "epoch": 2706} {"train_loss": -40.530792236328125, "global_step": 327489, "epoch": 2706} {"train_loss": -40.02473068237305, "global_step": 327490, "epoch": 2706} {"train_loss": -41.43658447265625, "global_step": 327491, "epoch": 2706} {"train_loss": -41.060157775878906, "global_step": 327492, "epoch": 2706} {"train_loss": -37.392669677734375, "global_step": 327493, "epoch": 2706} {"train_loss": -37.56206130981445, "global_step": 327494, "epoch": 2706} {"train_loss": -41.42102813720703, "global_step": 327495, "epoch": 2706} {"train_loss": -36.76637649536133, "global_step": 327496, "epoch": 2706} {"train_loss": -41.52082061767578, "global_step": 327497, "epoch": 2706} {"train_loss": -37.722900390625, "global_step": 327498, "epoch": 2706} {"train_loss": -37.388851165771484, "global_step": 327499, "epoch": 2706} {"train_loss": -39.93308639526367, "global_step": 327500, "epoch": 2706} {"train_loss": -41.35760498046875, "global_step": 327501, "epoch": 2706} {"train_loss": -41.51432418823242, "global_step": 327502, "epoch": 2706} {"train_loss": -41.68958282470703, "global_step": 327503, "epoch": 2706} {"train_loss": -41.84532928466797, "global_step": 327504, "epoch": 2706} {"train_loss": -40.821346282958984, "global_step": 327505, "epoch": 2706} {"train_loss": -41.62424850463867, "global_step": 327506, "epoch": 2706} {"train_loss": -41.50623321533203, "global_step": 327507, "epoch": 2706} {"train_loss": -42.60357666015625, "global_step": 327508, "epoch": 2706} {"train_loss": -41.99325942993164, "global_step": 327509, "epoch": 2706} {"train_loss": -40.92494583129883, "global_step": 327510, "epoch": 2706} {"train_loss": -42.25759506225586, "global_step": 327511, "epoch": 2706} {"train_loss": -42.30729293823242, "global_step": 327512, "epoch": 2706} {"train_loss": -41.91885757446289, "global_step": 327513, "epoch": 2706} {"train_loss": -43.01526641845703, "global_step": 327514, "epoch": 2706} {"train_loss": -41.69407272338867, "global_step": 327515, "epoch": 2706} {"train_loss": -42.18821716308594, "global_step": 327516, "epoch": 2706} {"train_loss": -42.092079162597656, "global_step": 327517, "epoch": 2706} {"train_loss": -41.52924346923828, "global_step": 327518, "epoch": 2706} {"train_loss": -41.84853744506836, "global_step": 327519, "epoch": 2706} {"train_loss": -42.72343826293945, "global_step": 327520, "epoch": 2706} {"train_loss": -42.834754943847656, "global_step": 327521, "epoch": 2706} {"train_loss": -42.95790100097656, "global_step": 327522, "epoch": 2706} {"train_loss": -41.93458938598633, "global_step": 327523, "epoch": 2706} {"train_loss": -41.41542053222656, "global_step": 327524, "epoch": 2706} {"train_loss": -32.88959884643555, "global_step": 327525, "epoch": 2706} {"train_loss": -40.5718879699707, "global_step": 327526, "epoch": 2706} {"train_loss": -39.6112174987793, "global_step": 327527, "epoch": 2706} {"train_loss": -41.242942810058594, "global_step": 327528, "epoch": 2706} {"train_loss": -41.795562744140625, "global_step": 327529, "epoch": 2706} {"train_loss": -37.05447006225586, "global_step": 327530, "epoch": 2706} {"train_loss": -42.45311737060547, "global_step": 327531, "epoch": 2706} {"train_loss": -41.81219482421875, "global_step": 327532, "epoch": 2706} {"train_loss": -42.33488464355469, "global_step": 327533, "epoch": 2706} {"train_loss": -40.562435150146484, "global_step": 327534, "epoch": 2706} {"train_loss": -42.13882827758789, "global_step": 327535, "epoch": 2706} {"train_loss": -41.04462814331055, "global_step": 327536, "epoch": 2706} {"train_loss": -41.210472106933594, "global_step": 327537, "epoch": 2706} {"train_loss": -42.2089729309082, "global_step": 327538, "epoch": 2706} {"train_loss": -42.519325256347656, "global_step": 327539, "epoch": 2706} {"train_loss": -42.01054000854492, "global_step": 327540, "epoch": 2706} {"train_loss": -40.88039779663086, "global_step": 327541, "epoch": 2706} {"train_loss": -41.523231506347656, "global_step": 327542, "epoch": 2706} {"train_loss": -42.90784454345703, "global_step": 327543, "epoch": 2706} {"train_loss": -43.299434661865234, "global_step": 327544, "epoch": 2706} {"train_loss": -41.90349197387695, "global_step": 327545, "epoch": 2706} {"train_loss": -41.64942695680729, "global_step": 327546, "epoch": 2706, "val_loss": 2846174.75} {"train_loss": -41.392024993896484, "global_step": 327547, "epoch": 2707} {"train_loss": -42.38515853881836, "global_step": 327548, "epoch": 2707} {"train_loss": -42.91816329956055, "global_step": 327549, "epoch": 2707} {"train_loss": -42.51717758178711, "global_step": 327550, "epoch": 2707} {"train_loss": -42.26472091674805, "global_step": 327551, "epoch": 2707} {"train_loss": -42.7991828918457, "global_step": 327552, "epoch": 2707} {"train_loss": -42.88261032104492, "global_step": 327553, "epoch": 2707} {"train_loss": -41.94271469116211, "global_step": 327554, "epoch": 2707} {"train_loss": -42.586124420166016, "global_step": 327555, "epoch": 2707} {"train_loss": -42.89664840698242, "global_step": 327556, "epoch": 2707} {"train_loss": -42.07890701293945, "global_step": 327557, "epoch": 2707} {"train_loss": -43.35178756713867, "global_step": 327558, "epoch": 2707} {"train_loss": -41.949161529541016, "global_step": 327559, "epoch": 2707} {"train_loss": -40.4173469543457, "global_step": 327560, "epoch": 2707} {"train_loss": -41.20469284057617, "global_step": 327561, "epoch": 2707} {"train_loss": -40.44811248779297, "global_step": 327562, "epoch": 2707} {"train_loss": -42.03640365600586, "global_step": 327563, "epoch": 2707} {"train_loss": -43.25312423706055, "global_step": 327564, "epoch": 2707} {"train_loss": -42.78049850463867, "global_step": 327565, "epoch": 2707} {"train_loss": -43.1414909362793, "global_step": 327566, "epoch": 2707} {"train_loss": -42.26845932006836, "global_step": 327567, "epoch": 2707} {"train_loss": -42.72755432128906, "global_step": 327568, "epoch": 2707} {"train_loss": -42.64314651489258, "global_step": 327569, "epoch": 2707} {"train_loss": -42.27360153198242, "global_step": 327570, "epoch": 2707} {"train_loss": -42.74672317504883, "global_step": 327571, "epoch": 2707} {"train_loss": -42.891605377197266, "global_step": 327572, "epoch": 2707} {"train_loss": -42.73804473876953, "global_step": 327573, "epoch": 2707} {"train_loss": -42.24870681762695, "global_step": 327574, "epoch": 2707} {"train_loss": -42.29433822631836, "global_step": 327575, "epoch": 2707} {"train_loss": -43.02265167236328, "global_step": 327576, "epoch": 2707} {"train_loss": -43.23554992675781, "global_step": 327577, "epoch": 2707} {"train_loss": -43.1855583190918, "global_step": 327578, "epoch": 2707} {"train_loss": -42.70553207397461, "global_step": 327579, "epoch": 2707} {"train_loss": -43.054439544677734, "global_step": 327580, "epoch": 2707} {"train_loss": -43.00932312011719, "global_step": 327581, "epoch": 2707} {"train_loss": -42.04792022705078, "global_step": 327582, "epoch": 2707} {"train_loss": -42.80364990234375, "global_step": 327583, "epoch": 2707} {"train_loss": -41.554534912109375, "global_step": 327584, "epoch": 2707} {"train_loss": -42.1156005859375, "global_step": 327585, "epoch": 2707} {"train_loss": -43.06624221801758, "global_step": 327586, "epoch": 2707} {"train_loss": -42.67013168334961, "global_step": 327587, "epoch": 2707} {"train_loss": -43.23435592651367, "global_step": 327588, "epoch": 2707} {"train_loss": -42.233951568603516, "global_step": 327589, "epoch": 2707} {"train_loss": -43.26162338256836, "global_step": 327590, "epoch": 2707} {"train_loss": -43.21082305908203, "global_step": 327591, "epoch": 2707} {"train_loss": -42.92378616333008, "global_step": 327592, "epoch": 2707} {"train_loss": -43.38286209106445, "global_step": 327593, "epoch": 2707} {"train_loss": -43.07833480834961, "global_step": 327594, "epoch": 2707} {"train_loss": -43.832679748535156, "global_step": 327595, "epoch": 2707} {"train_loss": -43.70610046386719, "global_step": 327596, "epoch": 2707} {"train_loss": -43.61570358276367, "global_step": 327597, "epoch": 2707} {"train_loss": -43.47365951538086, "global_step": 327598, "epoch": 2707} {"train_loss": -42.88131332397461, "global_step": 327599, "epoch": 2707} {"train_loss": -43.66461944580078, "global_step": 327600, "epoch": 2707} {"train_loss": -42.90081787109375, "global_step": 327601, "epoch": 2707} {"train_loss": -44.07123947143555, "global_step": 327602, "epoch": 2707} {"train_loss": -42.38203048706055, "global_step": 327603, "epoch": 2707} {"train_loss": -40.896148681640625, "global_step": 327604, "epoch": 2707} {"train_loss": -44.25794219970703, "global_step": 327605, "epoch": 2707} {"train_loss": -43.4729118347168, "global_step": 327606, "epoch": 2707} {"train_loss": -44.37083435058594, "global_step": 327607, "epoch": 2707} {"train_loss": -43.151187896728516, "global_step": 327608, "epoch": 2707} {"train_loss": -42.85888671875, "global_step": 327609, "epoch": 2707} {"train_loss": -43.818233489990234, "global_step": 327610, "epoch": 2707} {"train_loss": -43.36153030395508, "global_step": 327611, "epoch": 2707} {"train_loss": -44.22617721557617, "global_step": 327612, "epoch": 2707} {"train_loss": -42.60214614868164, "global_step": 327613, "epoch": 2707} {"train_loss": -43.897178649902344, "global_step": 327614, "epoch": 2707} {"train_loss": -42.60504150390625, "global_step": 327615, "epoch": 2707} {"train_loss": -44.2730712890625, "global_step": 327616, "epoch": 2707} {"train_loss": -42.19358825683594, "global_step": 327617, "epoch": 2707} {"train_loss": -37.36271667480469, "global_step": 327618, "epoch": 2707} {"train_loss": -43.305355072021484, "global_step": 327619, "epoch": 2707} {"train_loss": -43.55373001098633, "global_step": 327620, "epoch": 2707} {"train_loss": -42.76503372192383, "global_step": 327621, "epoch": 2707} {"train_loss": -38.6766242980957, "global_step": 327622, "epoch": 2707} {"train_loss": -43.579219818115234, "global_step": 327623, "epoch": 2707} {"train_loss": -43.1066780090332, "global_step": 327624, "epoch": 2707} {"train_loss": -43.22557067871094, "global_step": 327625, "epoch": 2707} {"train_loss": -43.60014724731445, "global_step": 327626, "epoch": 2707} {"train_loss": -43.269874572753906, "global_step": 327627, "epoch": 2707} {"train_loss": -43.12939453125, "global_step": 327628, "epoch": 2707} {"train_loss": -42.67900466918945, "global_step": 327629, "epoch": 2707} {"train_loss": -43.64054489135742, "global_step": 327630, "epoch": 2707} {"train_loss": -43.383636474609375, "global_step": 327631, "epoch": 2707} {"train_loss": -43.49732971191406, "global_step": 327632, "epoch": 2707} {"train_loss": -42.051395416259766, "global_step": 327633, "epoch": 2707} {"train_loss": -34.4127197265625, "global_step": 327634, "epoch": 2707} {"train_loss": -43.34439468383789, "global_step": 327635, "epoch": 2707} {"train_loss": -41.85041427612305, "global_step": 327636, "epoch": 2707} {"train_loss": -42.350746154785156, "global_step": 327637, "epoch": 2707} {"train_loss": -42.82489776611328, "global_step": 327638, "epoch": 2707} {"train_loss": -42.889739990234375, "global_step": 327639, "epoch": 2707} {"train_loss": -41.20326614379883, "global_step": 327640, "epoch": 2707} {"train_loss": -41.669647216796875, "global_step": 327641, "epoch": 2707} {"train_loss": -42.65676498413086, "global_step": 327642, "epoch": 2707} {"train_loss": -38.806793212890625, "global_step": 327643, "epoch": 2707} {"train_loss": -43.600948333740234, "global_step": 327644, "epoch": 2707} {"train_loss": -38.056026458740234, "global_step": 327645, "epoch": 2707} {"train_loss": -41.86346435546875, "global_step": 327646, "epoch": 2707} {"train_loss": -42.5386962890625, "global_step": 327647, "epoch": 2707} {"train_loss": -41.71501541137695, "global_step": 327648, "epoch": 2707} {"train_loss": -42.63271713256836, "global_step": 327649, "epoch": 2707} {"train_loss": -39.93785858154297, "global_step": 327650, "epoch": 2707} {"train_loss": -40.97667694091797, "global_step": 327651, "epoch": 2707} {"train_loss": -40.9151496887207, "global_step": 327652, "epoch": 2707} {"train_loss": -41.60859298706055, "global_step": 327653, "epoch": 2707} {"train_loss": -41.26398849487305, "global_step": 327654, "epoch": 2707} {"train_loss": -42.63960266113281, "global_step": 327655, "epoch": 2707} {"train_loss": -42.2608642578125, "global_step": 327656, "epoch": 2707} {"train_loss": -41.44497299194336, "global_step": 327657, "epoch": 2707} {"train_loss": -40.69385528564453, "global_step": 327658, "epoch": 2707} {"train_loss": -39.31782150268555, "global_step": 327659, "epoch": 2707} {"train_loss": -42.273681640625, "global_step": 327660, "epoch": 2707} {"train_loss": -42.405208587646484, "global_step": 327661, "epoch": 2707} {"train_loss": -42.87031173706055, "global_step": 327662, "epoch": 2707} {"train_loss": -43.008331298828125, "global_step": 327663, "epoch": 2707} {"train_loss": -41.6976432800293, "global_step": 327664, "epoch": 2707} {"train_loss": -42.936737060546875, "global_step": 327665, "epoch": 2707} {"train_loss": -42.62232208251953, "global_step": 327666, "epoch": 2707} {"train_loss": -42.42437091543655, "global_step": 327667, "epoch": 2707, "val_loss": 2655106.75} {"train_loss": -41.923431396484375, "global_step": 327668, "epoch": 2708} {"train_loss": -43.65802001953125, "global_step": 327669, "epoch": 2708} {"train_loss": -42.652069091796875, "global_step": 327670, "epoch": 2708} {"train_loss": -43.5201301574707, "global_step": 327671, "epoch": 2708} {"train_loss": -42.80980682373047, "global_step": 327672, "epoch": 2708} {"train_loss": -42.03972625732422, "global_step": 327673, "epoch": 2708} {"train_loss": -43.170074462890625, "global_step": 327674, "epoch": 2708} {"train_loss": -40.30124282836914, "global_step": 327675, "epoch": 2708} {"train_loss": -42.43559265136719, "global_step": 327676, "epoch": 2708} {"train_loss": -43.366004943847656, "global_step": 327677, "epoch": 2708} {"train_loss": -43.14060592651367, "global_step": 327678, "epoch": 2708} {"train_loss": -42.973140716552734, "global_step": 327679, "epoch": 2708} {"train_loss": -42.461524963378906, "global_step": 327680, "epoch": 2708} {"train_loss": -43.15960693359375, "global_step": 327681, "epoch": 2708} {"train_loss": -41.666194915771484, "global_step": 327682, "epoch": 2708} {"train_loss": -42.191558837890625, "global_step": 327683, "epoch": 2708} {"train_loss": -41.78041458129883, "global_step": 327684, "epoch": 2708} {"train_loss": -42.48573684692383, "global_step": 327685, "epoch": 2708} {"train_loss": -43.357337951660156, "global_step": 327686, "epoch": 2708} {"train_loss": -43.226959228515625, "global_step": 327687, "epoch": 2708} {"train_loss": -43.33102035522461, "global_step": 327688, "epoch": 2708} {"train_loss": -43.529052734375, "global_step": 327689, "epoch": 2708} {"train_loss": -42.57391357421875, "global_step": 327690, "epoch": 2708} {"train_loss": -42.1912727355957, "global_step": 327691, "epoch": 2708} {"train_loss": -38.26434326171875, "global_step": 327692, "epoch": 2708} {"train_loss": -40.61324691772461, "global_step": 327693, "epoch": 2708} {"train_loss": -42.10026168823242, "global_step": 327694, "epoch": 2708} {"train_loss": -42.544132232666016, "global_step": 327695, "epoch": 2708} {"train_loss": -41.064453125, "global_step": 327696, "epoch": 2708} {"train_loss": -41.384273529052734, "global_step": 327697, "epoch": 2708} {"train_loss": -42.4946403503418, "global_step": 327698, "epoch": 2708} {"train_loss": -42.885986328125, "global_step": 327699, "epoch": 2708} {"train_loss": -43.252113342285156, "global_step": 327700, "epoch": 2708} {"train_loss": -36.91631317138672, "global_step": 327701, "epoch": 2708} {"train_loss": -42.376495361328125, "global_step": 327702, "epoch": 2708} {"train_loss": -43.11935806274414, "global_step": 327703, "epoch": 2708} {"train_loss": -42.120033264160156, "global_step": 327704, "epoch": 2708} {"train_loss": -38.79584503173828, "global_step": 327705, "epoch": 2708} {"train_loss": -42.51057815551758, "global_step": 327706, "epoch": 2708} {"train_loss": -41.90238952636719, "global_step": 327707, "epoch": 2708} {"train_loss": -40.37289047241211, "global_step": 327708, "epoch": 2708} {"train_loss": -40.37492370605469, "global_step": 327709, "epoch": 2708} {"train_loss": -40.81429672241211, "global_step": 327710, "epoch": 2708} {"train_loss": -38.251617431640625, "global_step": 327711, "epoch": 2708} {"train_loss": -33.0589714050293, "global_step": 327712, "epoch": 2708} {"train_loss": -37.849910736083984, "global_step": 327713, "epoch": 2708} {"train_loss": -42.762245178222656, "global_step": 327714, "epoch": 2708} {"train_loss": -42.374176025390625, "global_step": 327715, "epoch": 2708} {"train_loss": -38.82147216796875, "global_step": 327716, "epoch": 2708} {"train_loss": -42.25537872314453, "global_step": 327717, "epoch": 2708} {"train_loss": -40.47760772705078, "global_step": 327718, "epoch": 2708} {"train_loss": -41.968894958496094, "global_step": 327719, "epoch": 2708} {"train_loss": -39.27944564819336, "global_step": 327720, "epoch": 2708} {"train_loss": -40.38863754272461, "global_step": 327721, "epoch": 2708} {"train_loss": -40.34794998168945, "global_step": 327722, "epoch": 2708} {"train_loss": -41.11940383911133, "global_step": 327723, "epoch": 2708} {"train_loss": -42.056331634521484, "global_step": 327724, "epoch": 2708} {"train_loss": -42.543800354003906, "global_step": 327725, "epoch": 2708} {"train_loss": -42.54902267456055, "global_step": 327726, "epoch": 2708} {"train_loss": -41.958160400390625, "global_step": 327727, "epoch": 2708} {"train_loss": -39.56842803955078, "global_step": 327728, "epoch": 2708} {"train_loss": -41.1126708984375, "global_step": 327729, "epoch": 2708} {"train_loss": -41.78113555908203, "global_step": 327730, "epoch": 2708} {"train_loss": -41.63075637817383, "global_step": 327731, "epoch": 2708} {"train_loss": -40.349666595458984, "global_step": 327732, "epoch": 2708} {"train_loss": -38.05073928833008, "global_step": 327733, "epoch": 2708} {"train_loss": -40.22756576538086, "global_step": 327734, "epoch": 2708} {"train_loss": -41.57350540161133, "global_step": 327735, "epoch": 2708} {"train_loss": -41.8853645324707, "global_step": 327736, "epoch": 2708} {"train_loss": -41.962432861328125, "global_step": 327737, "epoch": 2708} {"train_loss": -42.084228515625, "global_step": 327738, "epoch": 2708} {"train_loss": -42.21017074584961, "global_step": 327739, "epoch": 2708} {"train_loss": -42.27878952026367, "global_step": 327740, "epoch": 2708} {"train_loss": -42.14485549926758, "global_step": 327741, "epoch": 2708} {"train_loss": -40.90159225463867, "global_step": 327742, "epoch": 2708} {"train_loss": -40.37330627441406, "global_step": 327743, "epoch": 2708} {"train_loss": -38.9932746887207, "global_step": 327744, "epoch": 2708} {"train_loss": -42.54091262817383, "global_step": 327745, "epoch": 2708} {"train_loss": -42.25714874267578, "global_step": 327746, "epoch": 2708} {"train_loss": -41.10895919799805, "global_step": 327747, "epoch": 2708} {"train_loss": -41.79950714111328, "global_step": 327748, "epoch": 2708} {"train_loss": -42.161739349365234, "global_step": 327749, "epoch": 2708} {"train_loss": -40.163307189941406, "global_step": 327750, "epoch": 2708} {"train_loss": -43.32898712158203, "global_step": 327751, "epoch": 2708} {"train_loss": -41.41715621948242, "global_step": 327752, "epoch": 2708} {"train_loss": -42.5197639465332, "global_step": 327753, "epoch": 2708} {"train_loss": -42.0039176940918, "global_step": 327754, "epoch": 2708} {"train_loss": -42.20539093017578, "global_step": 327755, "epoch": 2708} {"train_loss": -42.57786178588867, "global_step": 327756, "epoch": 2708} {"train_loss": -41.61879348754883, "global_step": 327757, "epoch": 2708} {"train_loss": -40.40192794799805, "global_step": 327758, "epoch": 2708} {"train_loss": -41.96192932128906, "global_step": 327759, "epoch": 2708} {"train_loss": -41.651397705078125, "global_step": 327760, "epoch": 2708} {"train_loss": -42.903099060058594, "global_step": 327761, "epoch": 2708} {"train_loss": -41.607383728027344, "global_step": 327762, "epoch": 2708} {"train_loss": -42.829376220703125, "global_step": 327763, "epoch": 2708} {"train_loss": -42.1435546875, "global_step": 327764, "epoch": 2708} {"train_loss": -41.81101608276367, "global_step": 327765, "epoch": 2708} {"train_loss": -40.3973274230957, "global_step": 327766, "epoch": 2708} {"train_loss": -41.25756072998047, "global_step": 327767, "epoch": 2708} {"train_loss": -42.028499603271484, "global_step": 327768, "epoch": 2708} {"train_loss": -42.933048248291016, "global_step": 327769, "epoch": 2708} {"train_loss": -42.733428955078125, "global_step": 327770, "epoch": 2708} {"train_loss": -43.31550216674805, "global_step": 327771, "epoch": 2708} {"train_loss": -42.43326187133789, "global_step": 327772, "epoch": 2708} {"train_loss": -42.73881149291992, "global_step": 327773, "epoch": 2708} {"train_loss": -42.00558853149414, "global_step": 327774, "epoch": 2708} {"train_loss": -42.84006881713867, "global_step": 327775, "epoch": 2708} {"train_loss": -42.4871940612793, "global_step": 327776, "epoch": 2708} {"train_loss": -43.09147262573242, "global_step": 327777, "epoch": 2708} {"train_loss": -41.36555099487305, "global_step": 327778, "epoch": 2708} {"train_loss": -42.6004638671875, "global_step": 327779, "epoch": 2708} {"train_loss": -42.78620910644531, "global_step": 327780, "epoch": 2708} {"train_loss": -42.36133575439453, "global_step": 327781, "epoch": 2708} {"train_loss": -42.50325393676758, "global_step": 327782, "epoch": 2708} {"train_loss": -43.342079162597656, "global_step": 327783, "epoch": 2708} {"train_loss": -43.21895217895508, "global_step": 327784, "epoch": 2708} {"train_loss": -42.94221878051758, "global_step": 327785, "epoch": 2708} {"train_loss": -41.11085891723633, "global_step": 327786, "epoch": 2708} {"train_loss": -42.75141525268555, "global_step": 327787, "epoch": 2708} {"train_loss": -41.7346400426439, "global_step": 327788, "epoch": 2708, "val_loss": 2607169.75} {"train_loss": -42.87641143798828, "global_step": 327789, "epoch": 2709} {"train_loss": -41.92913818359375, "global_step": 327790, "epoch": 2709} {"train_loss": -42.6053581237793, "global_step": 327791, "epoch": 2709} {"train_loss": -43.67554473876953, "global_step": 327792, "epoch": 2709} {"train_loss": -42.08919906616211, "global_step": 327793, "epoch": 2709} {"train_loss": -43.41775131225586, "global_step": 327794, "epoch": 2709} {"train_loss": -38.67053985595703, "global_step": 327795, "epoch": 2709} {"train_loss": -42.80312728881836, "global_step": 327796, "epoch": 2709} {"train_loss": -43.430789947509766, "global_step": 327797, "epoch": 2709} {"train_loss": -43.44119644165039, "global_step": 327798, "epoch": 2709} {"train_loss": -42.390071868896484, "global_step": 327799, "epoch": 2709} {"train_loss": -42.27650451660156, "global_step": 327800, "epoch": 2709} {"train_loss": -43.578582763671875, "global_step": 327801, "epoch": 2709} {"train_loss": -41.93571090698242, "global_step": 327802, "epoch": 2709} {"train_loss": -43.44844055175781, "global_step": 327803, "epoch": 2709} {"train_loss": -42.706905364990234, "global_step": 327804, "epoch": 2709} {"train_loss": -42.61676788330078, "global_step": 327805, "epoch": 2709} {"train_loss": -43.4750862121582, "global_step": 327806, "epoch": 2709} {"train_loss": -41.079769134521484, "global_step": 327807, "epoch": 2709} {"train_loss": -42.868858337402344, "global_step": 327808, "epoch": 2709} {"train_loss": -43.46079635620117, "global_step": 327809, "epoch": 2709} {"train_loss": -39.247344970703125, "global_step": 327810, "epoch": 2709} {"train_loss": -41.86330032348633, "global_step": 327811, "epoch": 2709} {"train_loss": -43.27503204345703, "global_step": 327812, "epoch": 2709} {"train_loss": -43.19352722167969, "global_step": 327813, "epoch": 2709} {"train_loss": -42.24538803100586, "global_step": 327814, "epoch": 2709} {"train_loss": -43.6099853515625, "global_step": 327815, "epoch": 2709} {"train_loss": -42.5308837890625, "global_step": 327816, "epoch": 2709} {"train_loss": -42.54706954956055, "global_step": 327817, "epoch": 2709} {"train_loss": -42.94247055053711, "global_step": 327818, "epoch": 2709} {"train_loss": -43.82241439819336, "global_step": 327819, "epoch": 2709} {"train_loss": -42.841278076171875, "global_step": 327820, "epoch": 2709} {"train_loss": -43.15478515625, "global_step": 327821, "epoch": 2709} {"train_loss": -42.159358978271484, "global_step": 327822, "epoch": 2709} {"train_loss": -42.7820930480957, "global_step": 327823, "epoch": 2709} {"train_loss": -42.64333724975586, "global_step": 327824, "epoch": 2709} {"train_loss": -43.376399993896484, "global_step": 327825, "epoch": 2709} {"train_loss": -42.02216720581055, "global_step": 327826, "epoch": 2709} {"train_loss": -42.069984436035156, "global_step": 327827, "epoch": 2709} {"train_loss": -43.074859619140625, "global_step": 327828, "epoch": 2709} {"train_loss": -42.36772155761719, "global_step": 327829, "epoch": 2709} {"train_loss": -41.790374755859375, "global_step": 327830, "epoch": 2709} {"train_loss": -43.92854690551758, "global_step": 327831, "epoch": 2709} {"train_loss": -43.29098129272461, "global_step": 327832, "epoch": 2709} {"train_loss": -42.6641960144043, "global_step": 327833, "epoch": 2709} {"train_loss": -42.26899337768555, "global_step": 327834, "epoch": 2709} {"train_loss": -41.99707794189453, "global_step": 327835, "epoch": 2709} {"train_loss": -43.77395248413086, "global_step": 327836, "epoch": 2709} {"train_loss": -43.25335693359375, "global_step": 327837, "epoch": 2709} {"train_loss": -42.08076095581055, "global_step": 327838, "epoch": 2709} {"train_loss": -43.47468948364258, "global_step": 327839, "epoch": 2709} {"train_loss": -42.1162109375, "global_step": 327840, "epoch": 2709} {"train_loss": -41.26130294799805, "global_step": 327841, "epoch": 2709} {"train_loss": -43.018924713134766, "global_step": 327842, "epoch": 2709} {"train_loss": -42.48712921142578, "global_step": 327843, "epoch": 2709} {"train_loss": -40.66360855102539, "global_step": 327844, "epoch": 2709} {"train_loss": -43.533931732177734, "global_step": 327845, "epoch": 2709} {"train_loss": -42.2736701965332, "global_step": 327846, "epoch": 2709} {"train_loss": -41.8385009765625, "global_step": 327847, "epoch": 2709} {"train_loss": -43.350093841552734, "global_step": 327848, "epoch": 2709} {"train_loss": -41.468624114990234, "global_step": 327849, "epoch": 2709} {"train_loss": -42.95945358276367, "global_step": 327850, "epoch": 2709} {"train_loss": -43.25333786010742, "global_step": 327851, "epoch": 2709} {"train_loss": -42.773677825927734, "global_step": 327852, "epoch": 2709} {"train_loss": -43.72697067260742, "global_step": 327853, "epoch": 2709} {"train_loss": -42.2392692565918, "global_step": 327854, "epoch": 2709} {"train_loss": -42.91059112548828, "global_step": 327855, "epoch": 2709} {"train_loss": -43.51707077026367, "global_step": 327856, "epoch": 2709} {"train_loss": -43.14936447143555, "global_step": 327857, "epoch": 2709} {"train_loss": -42.6259651184082, "global_step": 327858, "epoch": 2709} {"train_loss": -43.14960861206055, "global_step": 327859, "epoch": 2709} {"train_loss": -42.447391510009766, "global_step": 327860, "epoch": 2709} {"train_loss": -41.78957748413086, "global_step": 327861, "epoch": 2709} {"train_loss": -42.93560028076172, "global_step": 327862, "epoch": 2709} {"train_loss": -39.75957107543945, "global_step": 327863, "epoch": 2709} {"train_loss": -42.31246566772461, "global_step": 327864, "epoch": 2709} {"train_loss": -41.83419418334961, "global_step": 327865, "epoch": 2709} {"train_loss": -42.1107063293457, "global_step": 327866, "epoch": 2709} {"train_loss": -42.224403381347656, "global_step": 327867, "epoch": 2709} {"train_loss": -41.32195281982422, "global_step": 327868, "epoch": 2709} {"train_loss": -40.779869079589844, "global_step": 327869, "epoch": 2709} {"train_loss": -42.30392074584961, "global_step": 327870, "epoch": 2709} {"train_loss": -41.00147247314453, "global_step": 327871, "epoch": 2709} {"train_loss": -43.026546478271484, "global_step": 327872, "epoch": 2709} {"train_loss": -41.71497344970703, "global_step": 327873, "epoch": 2709} {"train_loss": -42.93571853637695, "global_step": 327874, "epoch": 2709} {"train_loss": -41.077632904052734, "global_step": 327875, "epoch": 2709} {"train_loss": -42.7633056640625, "global_step": 327876, "epoch": 2709} {"train_loss": -43.05042266845703, "global_step": 327877, "epoch": 2709} {"train_loss": -42.869972229003906, "global_step": 327878, "epoch": 2709} {"train_loss": -42.312652587890625, "global_step": 327879, "epoch": 2709} {"train_loss": -43.59059524536133, "global_step": 327880, "epoch": 2709} {"train_loss": -42.79740524291992, "global_step": 327881, "epoch": 2709} {"train_loss": -42.942447662353516, "global_step": 327882, "epoch": 2709} {"train_loss": -43.170108795166016, "global_step": 327883, "epoch": 2709} {"train_loss": -43.562801361083984, "global_step": 327884, "epoch": 2709} {"train_loss": -42.82461166381836, "global_step": 327885, "epoch": 2709} {"train_loss": -43.19834518432617, "global_step": 327886, "epoch": 2709} {"train_loss": -43.60786819458008, "global_step": 327887, "epoch": 2709} {"train_loss": -43.75103759765625, "global_step": 327888, "epoch": 2709} {"train_loss": -43.245853424072266, "global_step": 327889, "epoch": 2709} {"train_loss": -43.390411376953125, "global_step": 327890, "epoch": 2709} {"train_loss": -43.82265090942383, "global_step": 327891, "epoch": 2709} {"train_loss": -43.414161682128906, "global_step": 327892, "epoch": 2709} {"train_loss": -43.267311096191406, "global_step": 327893, "epoch": 2709} {"train_loss": -43.54856491088867, "global_step": 327894, "epoch": 2709} {"train_loss": -43.85847473144531, "global_step": 327895, "epoch": 2709} {"train_loss": -42.996761322021484, "global_step": 327896, "epoch": 2709} {"train_loss": -43.4505615234375, "global_step": 327897, "epoch": 2709} {"train_loss": -43.66453170776367, "global_step": 327898, "epoch": 2709} {"train_loss": -43.363128662109375, "global_step": 327899, "epoch": 2709} {"train_loss": -30.191030502319336, "global_step": 327900, "epoch": 2709} {"train_loss": -43.92376708984375, "global_step": 327901, "epoch": 2709} {"train_loss": -43.118507385253906, "global_step": 327902, "epoch": 2709} {"train_loss": -42.94986343383789, "global_step": 327903, "epoch": 2709} {"train_loss": -43.364112854003906, "global_step": 327904, "epoch": 2709} {"train_loss": -42.81150436401367, "global_step": 327905, "epoch": 2709} {"train_loss": -42.658870697021484, "global_step": 327906, "epoch": 2709} {"train_loss": -43.10770797729492, "global_step": 327907, "epoch": 2709} {"train_loss": -43.018157958984375, "global_step": 327908, "epoch": 2709} {"train_loss": -42.59436270028107, "global_step": 327909, "epoch": 2709, "val_loss": 2610115.25} {"train_loss": -40.40468215942383, "global_step": 327910, "epoch": 2710} {"train_loss": -43.389930725097656, "global_step": 327911, "epoch": 2710} {"train_loss": -44.03173828125, "global_step": 327912, "epoch": 2710} {"train_loss": -43.40865707397461, "global_step": 327913, "epoch": 2710} {"train_loss": -43.56400680541992, "global_step": 327914, "epoch": 2710} {"train_loss": -43.84565734863281, "global_step": 327915, "epoch": 2710} {"train_loss": -43.600555419921875, "global_step": 327916, "epoch": 2710} {"train_loss": -42.6790885925293, "global_step": 327917, "epoch": 2710} {"train_loss": -42.79716491699219, "global_step": 327918, "epoch": 2710} {"train_loss": -43.85307312011719, "global_step": 327919, "epoch": 2710} {"train_loss": -43.661216735839844, "global_step": 327920, "epoch": 2710} {"train_loss": -43.620033264160156, "global_step": 327921, "epoch": 2710} {"train_loss": -43.41850662231445, "global_step": 327922, "epoch": 2710} {"train_loss": -40.13006591796875, "global_step": 327923, "epoch": 2710} {"train_loss": -43.438568115234375, "global_step": 327924, "epoch": 2710} {"train_loss": -41.98210144042969, "global_step": 327925, "epoch": 2710} {"train_loss": -42.99675750732422, "global_step": 327926, "epoch": 2710} {"train_loss": -42.46417236328125, "global_step": 327927, "epoch": 2710} {"train_loss": -41.63081741333008, "global_step": 327928, "epoch": 2710} {"train_loss": -42.27810287475586, "global_step": 327929, "epoch": 2710} {"train_loss": -42.6907844543457, "global_step": 327930, "epoch": 2710} {"train_loss": -42.47358322143555, "global_step": 327931, "epoch": 2710} {"train_loss": -43.33164978027344, "global_step": 327932, "epoch": 2710} {"train_loss": -42.2465934753418, "global_step": 327933, "epoch": 2710} {"train_loss": -42.020782470703125, "global_step": 327934, "epoch": 2710} {"train_loss": -40.092403411865234, "global_step": 327935, "epoch": 2710} {"train_loss": -42.05609893798828, "global_step": 327936, "epoch": 2710} {"train_loss": -42.61383819580078, "global_step": 327937, "epoch": 2710} {"train_loss": -41.57613754272461, "global_step": 327938, "epoch": 2710} {"train_loss": -39.775184631347656, "global_step": 327939, "epoch": 2710} {"train_loss": -40.30501937866211, "global_step": 327940, "epoch": 2710} {"train_loss": -42.09697341918945, "global_step": 327941, "epoch": 2710} {"train_loss": -42.98089599609375, "global_step": 327942, "epoch": 2710} {"train_loss": -41.327430725097656, "global_step": 327943, "epoch": 2710} {"train_loss": -43.279022216796875, "global_step": 327944, "epoch": 2710} {"train_loss": -41.869178771972656, "global_step": 327945, "epoch": 2710} {"train_loss": -38.41884231567383, "global_step": 327946, "epoch": 2710} {"train_loss": -36.5537223815918, "global_step": 327947, "epoch": 2710} {"train_loss": -40.813995361328125, "global_step": 327948, "epoch": 2710} {"train_loss": -41.71666717529297, "global_step": 327949, "epoch": 2710} {"train_loss": -39.42742919921875, "global_step": 327950, "epoch": 2710} {"train_loss": -42.401649475097656, "global_step": 327951, "epoch": 2710} {"train_loss": -40.13788604736328, "global_step": 327952, "epoch": 2710} {"train_loss": -40.001216888427734, "global_step": 327953, "epoch": 2710} {"train_loss": -42.0052375793457, "global_step": 327954, "epoch": 2710} {"train_loss": -39.99794387817383, "global_step": 327955, "epoch": 2710} {"train_loss": -41.450103759765625, "global_step": 327956, "epoch": 2710} {"train_loss": -42.0921745300293, "global_step": 327957, "epoch": 2710} {"train_loss": -41.26292037963867, "global_step": 327958, "epoch": 2710} {"train_loss": -42.363094329833984, "global_step": 327959, "epoch": 2710} {"train_loss": -40.75413131713867, "global_step": 327960, "epoch": 2710} {"train_loss": -41.4619026184082, "global_step": 327961, "epoch": 2710} {"train_loss": -42.59200668334961, "global_step": 327962, "epoch": 2710} {"train_loss": -40.77629852294922, "global_step": 327963, "epoch": 2710} {"train_loss": -42.26740646362305, "global_step": 327964, "epoch": 2710} {"train_loss": -42.151607513427734, "global_step": 327965, "epoch": 2710} {"train_loss": -42.15619659423828, "global_step": 327966, "epoch": 2710} {"train_loss": -42.577877044677734, "global_step": 327967, "epoch": 2710} {"train_loss": -42.72639083862305, "global_step": 327968, "epoch": 2710} {"train_loss": -42.830299377441406, "global_step": 327969, "epoch": 2710} {"train_loss": -42.81803894042969, "global_step": 327970, "epoch": 2710} {"train_loss": -43.56113815307617, "global_step": 327971, "epoch": 2710} {"train_loss": -43.41520309448242, "global_step": 327972, "epoch": 2710} {"train_loss": -43.782833099365234, "global_step": 327973, "epoch": 2710} {"train_loss": -43.141090393066406, "global_step": 327974, "epoch": 2710} {"train_loss": -43.37691879272461, "global_step": 327975, "epoch": 2710} {"train_loss": -43.094356536865234, "global_step": 327976, "epoch": 2710} {"train_loss": -42.733882904052734, "global_step": 327977, "epoch": 2710} {"train_loss": -41.523658752441406, "global_step": 327978, "epoch": 2710} {"train_loss": -42.8975830078125, "global_step": 327979, "epoch": 2710} {"train_loss": -43.394508361816406, "global_step": 327980, "epoch": 2710} {"train_loss": -43.567588806152344, "global_step": 327981, "epoch": 2710} {"train_loss": -43.45335006713867, "global_step": 327982, "epoch": 2710} {"train_loss": -43.82859420776367, "global_step": 327983, "epoch": 2710} {"train_loss": -43.44940185546875, "global_step": 327984, "epoch": 2710} {"train_loss": -43.80427169799805, "global_step": 327985, "epoch": 2710} {"train_loss": -43.56470489501953, "global_step": 327986, "epoch": 2710} {"train_loss": -43.79853057861328, "global_step": 327987, "epoch": 2710} {"train_loss": -43.201271057128906, "global_step": 327988, "epoch": 2710} {"train_loss": -42.97669219970703, "global_step": 327989, "epoch": 2710} {"train_loss": -42.93644332885742, "global_step": 327990, "epoch": 2710} {"train_loss": -44.07363510131836, "global_step": 327991, "epoch": 2710} {"train_loss": -42.897735595703125, "global_step": 327992, "epoch": 2710} {"train_loss": -43.65842819213867, "global_step": 327993, "epoch": 2710} {"train_loss": -43.266326904296875, "global_step": 327994, "epoch": 2710} {"train_loss": -43.9134407043457, "global_step": 327995, "epoch": 2710} {"train_loss": -44.07209396362305, "global_step": 327996, "epoch": 2710} {"train_loss": -42.88576889038086, "global_step": 327997, "epoch": 2710} {"train_loss": -44.07975387573242, "global_step": 327998, "epoch": 2710} {"train_loss": -42.33626174926758, "global_step": 327999, "epoch": 2710} {"train_loss": -43.835391998291016, "global_step": 328000, "epoch": 2710} {"train_loss": -44.05463409423828, "global_step": 328001, "epoch": 2710} {"train_loss": -43.20364761352539, "global_step": 328002, "epoch": 2710} {"train_loss": -44.022216796875, "global_step": 328003, "epoch": 2710} {"train_loss": -42.712581634521484, "global_step": 328004, "epoch": 2710} {"train_loss": -43.67231750488281, "global_step": 328005, "epoch": 2710} {"train_loss": -43.16379928588867, "global_step": 328006, "epoch": 2710} {"train_loss": -42.787078857421875, "global_step": 328007, "epoch": 2710} {"train_loss": -44.23002624511719, "global_step": 328008, "epoch": 2710} {"train_loss": -42.81986618041992, "global_step": 328009, "epoch": 2710} {"train_loss": -41.798824310302734, "global_step": 328010, "epoch": 2710} {"train_loss": -43.59177017211914, "global_step": 328011, "epoch": 2710} {"train_loss": -43.444068908691406, "global_step": 328012, "epoch": 2710} {"train_loss": -43.034423828125, "global_step": 328013, "epoch": 2710} {"train_loss": -43.72016525268555, "global_step": 328014, "epoch": 2710} {"train_loss": -43.8059196472168, "global_step": 328015, "epoch": 2710} {"train_loss": -43.76893997192383, "global_step": 328016, "epoch": 2710} {"train_loss": -44.303768157958984, "global_step": 328017, "epoch": 2710} {"train_loss": -44.39324188232422, "global_step": 328018, "epoch": 2710} {"train_loss": -43.91854476928711, "global_step": 328019, "epoch": 2710} {"train_loss": -44.145477294921875, "global_step": 328020, "epoch": 2710} {"train_loss": -43.082271575927734, "global_step": 328021, "epoch": 2710} {"train_loss": -44.16229248046875, "global_step": 328022, "epoch": 2710} {"train_loss": -42.79080581665039, "global_step": 328023, "epoch": 2710} {"train_loss": -44.3677864074707, "global_step": 328024, "epoch": 2710} {"train_loss": -44.07655715942383, "global_step": 328025, "epoch": 2710} {"train_loss": -42.929378509521484, "global_step": 328026, "epoch": 2710} {"train_loss": -44.077171325683594, "global_step": 328027, "epoch": 2710} {"train_loss": -43.942649841308594, "global_step": 328028, "epoch": 2710} {"train_loss": -43.8127326965332, "global_step": 328029, "epoch": 2710} {"train_loss": -42.700155967523244, "global_step": 328030, "epoch": 2710, "val_loss": 2654044.75} {"train_loss": -43.98564910888672, "global_step": 328031, "epoch": 2711} {"train_loss": -43.032291412353516, "global_step": 328032, "epoch": 2711} {"train_loss": -43.46684646606445, "global_step": 328033, "epoch": 2711} {"train_loss": -43.93305206298828, "global_step": 328034, "epoch": 2711} {"train_loss": -43.001983642578125, "global_step": 328035, "epoch": 2711} {"train_loss": -43.45383834838867, "global_step": 328036, "epoch": 2711} {"train_loss": -43.95625305175781, "global_step": 328037, "epoch": 2711} {"train_loss": -43.25162887573242, "global_step": 328038, "epoch": 2711} {"train_loss": -43.937625885009766, "global_step": 328039, "epoch": 2711} {"train_loss": -44.35335922241211, "global_step": 328040, "epoch": 2711} {"train_loss": -44.12377166748047, "global_step": 328041, "epoch": 2711} {"train_loss": -44.1823616027832, "global_step": 328042, "epoch": 2711} {"train_loss": -43.8665771484375, "global_step": 328043, "epoch": 2711} {"train_loss": -43.7196159362793, "global_step": 328044, "epoch": 2711} {"train_loss": -43.87202072143555, "global_step": 328045, "epoch": 2711} {"train_loss": -42.70172119140625, "global_step": 328046, "epoch": 2711} {"train_loss": -43.95598220825195, "global_step": 328047, "epoch": 2711} {"train_loss": -43.341278076171875, "global_step": 328048, "epoch": 2711} {"train_loss": -43.404109954833984, "global_step": 328049, "epoch": 2711} {"train_loss": -42.574913024902344, "global_step": 328050, "epoch": 2711} {"train_loss": -43.392127990722656, "global_step": 328051, "epoch": 2711} {"train_loss": -43.88204574584961, "global_step": 328052, "epoch": 2711} {"train_loss": -41.56317138671875, "global_step": 328053, "epoch": 2711} {"train_loss": -42.78242111206055, "global_step": 328054, "epoch": 2711} {"train_loss": -42.1317024230957, "global_step": 328055, "epoch": 2711} {"train_loss": -43.419673919677734, "global_step": 328056, "epoch": 2711} {"train_loss": -43.08696746826172, "global_step": 328057, "epoch": 2711} {"train_loss": -43.16182327270508, "global_step": 328058, "epoch": 2711} {"train_loss": -43.01301193237305, "global_step": 328059, "epoch": 2711} {"train_loss": -42.03089141845703, "global_step": 328060, "epoch": 2711} {"train_loss": -42.2435302734375, "global_step": 328061, "epoch": 2711} {"train_loss": -41.64392852783203, "global_step": 328062, "epoch": 2711} {"train_loss": -39.37329864501953, "global_step": 328063, "epoch": 2711} {"train_loss": -42.29707336425781, "global_step": 328064, "epoch": 2711} {"train_loss": -43.87803268432617, "global_step": 328065, "epoch": 2711} {"train_loss": -42.75894546508789, "global_step": 328066, "epoch": 2711} {"train_loss": -40.362266540527344, "global_step": 328067, "epoch": 2711} {"train_loss": -42.76671600341797, "global_step": 328068, "epoch": 2711} {"train_loss": -42.09608840942383, "global_step": 328069, "epoch": 2711} {"train_loss": -42.73556137084961, "global_step": 328070, "epoch": 2711} {"train_loss": -42.0497932434082, "global_step": 328071, "epoch": 2711} {"train_loss": -43.1794548034668, "global_step": 328072, "epoch": 2711} {"train_loss": -43.4265251159668, "global_step": 328073, "epoch": 2711} {"train_loss": -42.6672477722168, "global_step": 328074, "epoch": 2711} {"train_loss": -42.5998420715332, "global_step": 328075, "epoch": 2711} {"train_loss": -41.31654739379883, "global_step": 328076, "epoch": 2711} {"train_loss": -42.80689239501953, "global_step": 328077, "epoch": 2711} {"train_loss": -41.03422927856445, "global_step": 328078, "epoch": 2711} {"train_loss": -43.415855407714844, "global_step": 328079, "epoch": 2711} {"train_loss": -43.05076217651367, "global_step": 328080, "epoch": 2711} {"train_loss": -43.30073165893555, "global_step": 328081, "epoch": 2711} {"train_loss": -42.9561882019043, "global_step": 328082, "epoch": 2711} {"train_loss": -42.7860221862793, "global_step": 328083, "epoch": 2711} {"train_loss": -42.26593780517578, "global_step": 328084, "epoch": 2711} {"train_loss": -43.47269821166992, "global_step": 328085, "epoch": 2711} {"train_loss": -43.77424621582031, "global_step": 328086, "epoch": 2711} {"train_loss": -43.51654815673828, "global_step": 328087, "epoch": 2711} {"train_loss": -43.83078384399414, "global_step": 328088, "epoch": 2711} {"train_loss": -43.50749588012695, "global_step": 328089, "epoch": 2711} {"train_loss": -43.17112350463867, "global_step": 328090, "epoch": 2711} {"train_loss": -44.08401107788086, "global_step": 328091, "epoch": 2711} {"train_loss": -42.864776611328125, "global_step": 328092, "epoch": 2711} {"train_loss": -43.05392074584961, "global_step": 328093, "epoch": 2711} {"train_loss": -43.56708526611328, "global_step": 328094, "epoch": 2711} {"train_loss": -43.61566925048828, "global_step": 328095, "epoch": 2711} {"train_loss": -43.249114990234375, "global_step": 328096, "epoch": 2711} {"train_loss": -42.75080490112305, "global_step": 328097, "epoch": 2711} {"train_loss": -42.05268096923828, "global_step": 328098, "epoch": 2711} {"train_loss": -42.742897033691406, "global_step": 328099, "epoch": 2711} {"train_loss": -43.717769622802734, "global_step": 328100, "epoch": 2711} {"train_loss": -42.10350036621094, "global_step": 328101, "epoch": 2711} {"train_loss": -42.81206130981445, "global_step": 328102, "epoch": 2711} {"train_loss": -43.349483489990234, "global_step": 328103, "epoch": 2711} {"train_loss": -43.4307975769043, "global_step": 328104, "epoch": 2711} {"train_loss": -43.404823303222656, "global_step": 328105, "epoch": 2711} {"train_loss": -43.05309295654297, "global_step": 328106, "epoch": 2711} {"train_loss": -43.842567443847656, "global_step": 328107, "epoch": 2711} {"train_loss": -43.78676986694336, "global_step": 328108, "epoch": 2711} {"train_loss": -42.55027389526367, "global_step": 328109, "epoch": 2711} {"train_loss": -43.79995346069336, "global_step": 328110, "epoch": 2711} {"train_loss": -43.97992706298828, "global_step": 328111, "epoch": 2711} {"train_loss": -42.43873596191406, "global_step": 328112, "epoch": 2711} {"train_loss": -42.23040771484375, "global_step": 328113, "epoch": 2711} {"train_loss": -42.7950439453125, "global_step": 328114, "epoch": 2711} {"train_loss": -43.27970504760742, "global_step": 328115, "epoch": 2711} {"train_loss": -42.86119842529297, "global_step": 328116, "epoch": 2711} {"train_loss": -43.46787643432617, "global_step": 328117, "epoch": 2711} {"train_loss": -43.227821350097656, "global_step": 328118, "epoch": 2711} {"train_loss": -42.81234359741211, "global_step": 328119, "epoch": 2711} {"train_loss": -42.75516128540039, "global_step": 328120, "epoch": 2711} {"train_loss": -43.4193115234375, "global_step": 328121, "epoch": 2711} {"train_loss": -42.1732292175293, "global_step": 328122, "epoch": 2711} {"train_loss": -42.761871337890625, "global_step": 328123, "epoch": 2711} {"train_loss": -42.89291000366211, "global_step": 328124, "epoch": 2711} {"train_loss": -43.74453353881836, "global_step": 328125, "epoch": 2711} {"train_loss": -43.03900146484375, "global_step": 328126, "epoch": 2711} {"train_loss": -42.79911422729492, "global_step": 328127, "epoch": 2711} {"train_loss": -44.00542068481445, "global_step": 328128, "epoch": 2711} {"train_loss": -43.11733627319336, "global_step": 328129, "epoch": 2711} {"train_loss": -44.11273956298828, "global_step": 328130, "epoch": 2711} {"train_loss": -42.872955322265625, "global_step": 328131, "epoch": 2711} {"train_loss": -42.826908111572266, "global_step": 328132, "epoch": 2711} {"train_loss": -43.58150100708008, "global_step": 328133, "epoch": 2711} {"train_loss": -42.91908645629883, "global_step": 328134, "epoch": 2711} {"train_loss": -43.30253982543945, "global_step": 328135, "epoch": 2711} {"train_loss": -43.53817367553711, "global_step": 328136, "epoch": 2711} {"train_loss": -43.10498809814453, "global_step": 328137, "epoch": 2711} {"train_loss": -42.80910110473633, "global_step": 328138, "epoch": 2711} {"train_loss": -41.0098762512207, "global_step": 328139, "epoch": 2711} {"train_loss": -43.92041015625, "global_step": 328140, "epoch": 2711} {"train_loss": -43.595558166503906, "global_step": 328141, "epoch": 2711} {"train_loss": -42.9428596496582, "global_step": 328142, "epoch": 2711} {"train_loss": -43.252437591552734, "global_step": 328143, "epoch": 2711} {"train_loss": -43.60161209106445, "global_step": 328144, "epoch": 2711} {"train_loss": -41.7917594909668, "global_step": 328145, "epoch": 2711} {"train_loss": -37.973262786865234, "global_step": 328146, "epoch": 2711} {"train_loss": -37.70085525512695, "global_step": 328147, "epoch": 2711} {"train_loss": -43.12977981567383, "global_step": 328148, "epoch": 2711} {"train_loss": -39.8559684753418, "global_step": 328149, "epoch": 2711} {"train_loss": -40.853328704833984, "global_step": 328150, "epoch": 2711} {"train_loss": -42.89650937545398, "global_step": 328151, "epoch": 2711, "val_loss": 2636210.75} {"train_loss": -41.0400390625, "global_step": 328152, "epoch": 2712} {"train_loss": -41.31173324584961, "global_step": 328153, "epoch": 2712} {"train_loss": -42.25770950317383, "global_step": 328154, "epoch": 2712} {"train_loss": -41.49677658081055, "global_step": 328155, "epoch": 2712} {"train_loss": -41.28913497924805, "global_step": 328156, "epoch": 2712} {"train_loss": -41.895015716552734, "global_step": 328157, "epoch": 2712} {"train_loss": -38.69417953491211, "global_step": 328158, "epoch": 2712} {"train_loss": -42.34699249267578, "global_step": 328159, "epoch": 2712} {"train_loss": -41.96476364135742, "global_step": 328160, "epoch": 2712} {"train_loss": -41.11774444580078, "global_step": 328161, "epoch": 2712} {"train_loss": -43.427066802978516, "global_step": 328162, "epoch": 2712} {"train_loss": -41.771636962890625, "global_step": 328163, "epoch": 2712} {"train_loss": -42.274166107177734, "global_step": 328164, "epoch": 2712} {"train_loss": -42.9896354675293, "global_step": 328165, "epoch": 2712} {"train_loss": -41.77700424194336, "global_step": 328166, "epoch": 2712} {"train_loss": -42.69680404663086, "global_step": 328167, "epoch": 2712} {"train_loss": -41.6284294128418, "global_step": 328168, "epoch": 2712} {"train_loss": -42.130733489990234, "global_step": 328169, "epoch": 2712} {"train_loss": -42.549774169921875, "global_step": 328170, "epoch": 2712} {"train_loss": -42.12903594970703, "global_step": 328171, "epoch": 2712} {"train_loss": -43.46028137207031, "global_step": 328172, "epoch": 2712} {"train_loss": -43.16083526611328, "global_step": 328173, "epoch": 2712} {"train_loss": -43.203975677490234, "global_step": 328174, "epoch": 2712} {"train_loss": -43.01380920410156, "global_step": 328175, "epoch": 2712} {"train_loss": -42.04928207397461, "global_step": 328176, "epoch": 2712} {"train_loss": -43.7017707824707, "global_step": 328177, "epoch": 2712} {"train_loss": -42.892120361328125, "global_step": 328178, "epoch": 2712} {"train_loss": -42.76117706298828, "global_step": 328179, "epoch": 2712} {"train_loss": -43.124916076660156, "global_step": 328180, "epoch": 2712} {"train_loss": -43.934932708740234, "global_step": 328181, "epoch": 2712} {"train_loss": -42.494842529296875, "global_step": 328182, "epoch": 2712} {"train_loss": -42.933074951171875, "global_step": 328183, "epoch": 2712} {"train_loss": -42.913978576660156, "global_step": 328184, "epoch": 2712} {"train_loss": -43.03176498413086, "global_step": 328185, "epoch": 2712} {"train_loss": -42.87706756591797, "global_step": 328186, "epoch": 2712} {"train_loss": -43.272972106933594, "global_step": 328187, "epoch": 2712} {"train_loss": -42.83038330078125, "global_step": 328188, "epoch": 2712} {"train_loss": -43.75870895385742, "global_step": 328189, "epoch": 2712} {"train_loss": -43.11210250854492, "global_step": 328190, "epoch": 2712} {"train_loss": -43.41010665893555, "global_step": 328191, "epoch": 2712} {"train_loss": -43.29989242553711, "global_step": 328192, "epoch": 2712} {"train_loss": -42.49948501586914, "global_step": 328193, "epoch": 2712} {"train_loss": -43.92841339111328, "global_step": 328194, "epoch": 2712} {"train_loss": -43.227638244628906, "global_step": 328195, "epoch": 2712} {"train_loss": -42.5855598449707, "global_step": 328196, "epoch": 2712} {"train_loss": -42.63678741455078, "global_step": 328197, "epoch": 2712} {"train_loss": -43.5073127746582, "global_step": 328198, "epoch": 2712} {"train_loss": -41.97037887573242, "global_step": 328199, "epoch": 2712} {"train_loss": -42.4992790222168, "global_step": 328200, "epoch": 2712} {"train_loss": -44.117923736572266, "global_step": 328201, "epoch": 2712} {"train_loss": -43.056270599365234, "global_step": 328202, "epoch": 2712} {"train_loss": -43.2972526550293, "global_step": 328203, "epoch": 2712} {"train_loss": -44.469085693359375, "global_step": 328204, "epoch": 2712} {"train_loss": -43.71858596801758, "global_step": 328205, "epoch": 2712} {"train_loss": -42.41503143310547, "global_step": 328206, "epoch": 2712} {"train_loss": -43.22700500488281, "global_step": 328207, "epoch": 2712} {"train_loss": -44.2203254699707, "global_step": 328208, "epoch": 2712} {"train_loss": -43.93508529663086, "global_step": 328209, "epoch": 2712} {"train_loss": -43.51338577270508, "global_step": 328210, "epoch": 2712} {"train_loss": -43.68242263793945, "global_step": 328211, "epoch": 2712} {"train_loss": -44.36286544799805, "global_step": 328212, "epoch": 2712} {"train_loss": -43.988162994384766, "global_step": 328213, "epoch": 2712} {"train_loss": -43.11668395996094, "global_step": 328214, "epoch": 2712} {"train_loss": -42.774532318115234, "global_step": 328215, "epoch": 2712} {"train_loss": -43.774391174316406, "global_step": 328216, "epoch": 2712} {"train_loss": -44.90972137451172, "global_step": 328217, "epoch": 2712} {"train_loss": -44.426795959472656, "global_step": 328218, "epoch": 2712} {"train_loss": -44.17717361450195, "global_step": 328219, "epoch": 2712} {"train_loss": -43.75034713745117, "global_step": 328220, "epoch": 2712} {"train_loss": -44.649436950683594, "global_step": 328221, "epoch": 2712} {"train_loss": -43.86846923828125, "global_step": 328222, "epoch": 2712} {"train_loss": -44.20537567138672, "global_step": 328223, "epoch": 2712} {"train_loss": -44.43390655517578, "global_step": 328224, "epoch": 2712} {"train_loss": -44.46405029296875, "global_step": 328225, "epoch": 2712} {"train_loss": -44.89179611206055, "global_step": 328226, "epoch": 2712} {"train_loss": -42.0835075378418, "global_step": 328227, "epoch": 2712} {"train_loss": -44.12977981567383, "global_step": 328228, "epoch": 2712} {"train_loss": -44.899391174316406, "global_step": 328229, "epoch": 2712} {"train_loss": -44.57796859741211, "global_step": 328230, "epoch": 2712} {"train_loss": -43.81311798095703, "global_step": 328231, "epoch": 2712} {"train_loss": -44.66104507446289, "global_step": 328232, "epoch": 2712} {"train_loss": -44.414039611816406, "global_step": 328233, "epoch": 2712} {"train_loss": -43.00812530517578, "global_step": 328234, "epoch": 2712} {"train_loss": -44.64786148071289, "global_step": 328235, "epoch": 2712} {"train_loss": -43.43370819091797, "global_step": 328236, "epoch": 2712} {"train_loss": -37.826168060302734, "global_step": 328237, "epoch": 2712} {"train_loss": -44.251102447509766, "global_step": 328238, "epoch": 2712} {"train_loss": -39.43099594116211, "global_step": 328239, "epoch": 2712} {"train_loss": -30.3380069732666, "global_step": 328240, "epoch": 2712} {"train_loss": -44.50712203979492, "global_step": 328241, "epoch": 2712} {"train_loss": -43.43406295776367, "global_step": 328242, "epoch": 2712} {"train_loss": -38.59378433227539, "global_step": 328243, "epoch": 2712} {"train_loss": -43.2344970703125, "global_step": 328244, "epoch": 2712} {"train_loss": -42.315032958984375, "global_step": 328245, "epoch": 2712} {"train_loss": -41.268123626708984, "global_step": 328246, "epoch": 2712} {"train_loss": -37.1131477355957, "global_step": 328247, "epoch": 2712} {"train_loss": -35.46010208129883, "global_step": 328248, "epoch": 2712} {"train_loss": -40.46659469604492, "global_step": 328249, "epoch": 2712} {"train_loss": -31.1907958984375, "global_step": 328250, "epoch": 2712} {"train_loss": -40.748878479003906, "global_step": 328251, "epoch": 2712} {"train_loss": -41.11887741088867, "global_step": 328252, "epoch": 2712} {"train_loss": -40.161903381347656, "global_step": 328253, "epoch": 2712} {"train_loss": -25.286909103393555, "global_step": 328254, "epoch": 2712} {"train_loss": -39.54060745239258, "global_step": 328255, "epoch": 2712} {"train_loss": -42.889339447021484, "global_step": 328256, "epoch": 2712} {"train_loss": -23.06220054626465, "global_step": 328257, "epoch": 2712} {"train_loss": -36.82942199707031, "global_step": 328258, "epoch": 2712} {"train_loss": -35.834712982177734, "global_step": 328259, "epoch": 2712} {"train_loss": -32.68484115600586, "global_step": 328260, "epoch": 2712} {"train_loss": -37.070491790771484, "global_step": 328261, "epoch": 2712} {"train_loss": -27.539121627807617, "global_step": 328262, "epoch": 2712} {"train_loss": -39.62165832519531, "global_step": 328263, "epoch": 2712} {"train_loss": -33.67500686645508, "global_step": 328264, "epoch": 2712} {"train_loss": -36.71014404296875, "global_step": 328265, "epoch": 2712} {"train_loss": -40.2652473449707, "global_step": 328266, "epoch": 2712} {"train_loss": -41.3129997253418, "global_step": 328267, "epoch": 2712} {"train_loss": -38.72829055786133, "global_step": 328268, "epoch": 2712} {"train_loss": -40.7071647644043, "global_step": 328269, "epoch": 2712} {"train_loss": -40.17428970336914, "global_step": 328270, "epoch": 2712} {"train_loss": -39.47018051147461, "global_step": 328271, "epoch": 2712} {"train_loss": -41.55788913443069, "global_step": 328272, "epoch": 2712, "val_loss": 3933241.75} {"train_loss": -37.75132369995117, "global_step": 328273, "epoch": 2713} {"train_loss": -39.981868743896484, "global_step": 328274, "epoch": 2713} {"train_loss": -40.76572799682617, "global_step": 328275, "epoch": 2713} {"train_loss": -38.419517517089844, "global_step": 328276, "epoch": 2713} {"train_loss": -40.6750602722168, "global_step": 328277, "epoch": 2713} {"train_loss": -40.220027923583984, "global_step": 328278, "epoch": 2713} {"train_loss": -40.265254974365234, "global_step": 328279, "epoch": 2713} {"train_loss": -36.9636344909668, "global_step": 328280, "epoch": 2713} {"train_loss": -40.435211181640625, "global_step": 328281, "epoch": 2713} {"train_loss": -40.970760345458984, "global_step": 328282, "epoch": 2713} {"train_loss": -40.90571594238281, "global_step": 328283, "epoch": 2713} {"train_loss": -40.52467727661133, "global_step": 328284, "epoch": 2713} {"train_loss": -35.97151565551758, "global_step": 328285, "epoch": 2713} {"train_loss": -39.30613327026367, "global_step": 328286, "epoch": 2713} {"train_loss": -41.17361068725586, "global_step": 328287, "epoch": 2713} {"train_loss": -40.48344039916992, "global_step": 328288, "epoch": 2713} {"train_loss": -39.16534423828125, "global_step": 328289, "epoch": 2713} {"train_loss": -41.2641716003418, "global_step": 328290, "epoch": 2713} {"train_loss": -41.44675827026367, "global_step": 328291, "epoch": 2713} {"train_loss": -39.47830581665039, "global_step": 328292, "epoch": 2713} {"train_loss": -42.20679473876953, "global_step": 328293, "epoch": 2713} {"train_loss": -41.26021957397461, "global_step": 328294, "epoch": 2713} {"train_loss": -40.9259033203125, "global_step": 328295, "epoch": 2713} {"train_loss": -38.74629592895508, "global_step": 328296, "epoch": 2713} {"train_loss": -41.223060607910156, "global_step": 328297, "epoch": 2713} {"train_loss": -41.67353439331055, "global_step": 328298, "epoch": 2713} {"train_loss": -41.37897872924805, "global_step": 328299, "epoch": 2713} {"train_loss": -40.816017150878906, "global_step": 328300, "epoch": 2713} {"train_loss": -41.803890228271484, "global_step": 328301, "epoch": 2713} {"train_loss": -42.15946578979492, "global_step": 328302, "epoch": 2713} {"train_loss": -41.86833572387695, "global_step": 328303, "epoch": 2713} {"train_loss": -42.22432327270508, "global_step": 328304, "epoch": 2713} {"train_loss": -41.97943115234375, "global_step": 328305, "epoch": 2713} {"train_loss": -42.5206413269043, "global_step": 328306, "epoch": 2713} {"train_loss": -42.15929412841797, "global_step": 328307, "epoch": 2713} {"train_loss": -42.55134201049805, "global_step": 328308, "epoch": 2713} {"train_loss": -43.31761932373047, "global_step": 328309, "epoch": 2713} {"train_loss": -42.49296188354492, "global_step": 328310, "epoch": 2713} {"train_loss": -42.94575119018555, "global_step": 328311, "epoch": 2713} {"train_loss": -42.74867630004883, "global_step": 328312, "epoch": 2713} {"train_loss": -41.22764205932617, "global_step": 328313, "epoch": 2713} {"train_loss": -42.92837142944336, "global_step": 328314, "epoch": 2713} {"train_loss": -42.94489288330078, "global_step": 328315, "epoch": 2713} {"train_loss": -40.176204681396484, "global_step": 328316, "epoch": 2713} {"train_loss": -42.5517463684082, "global_step": 328317, "epoch": 2713} {"train_loss": -42.22797775268555, "global_step": 328318, "epoch": 2713} {"train_loss": -41.74131393432617, "global_step": 328319, "epoch": 2713} {"train_loss": -41.967124938964844, "global_step": 328320, "epoch": 2713} {"train_loss": -42.029720306396484, "global_step": 328321, "epoch": 2713} {"train_loss": -41.90298080444336, "global_step": 328322, "epoch": 2713} {"train_loss": -42.2357292175293, "global_step": 328323, "epoch": 2713} {"train_loss": -43.20681381225586, "global_step": 328324, "epoch": 2713} {"train_loss": -41.58867645263672, "global_step": 328325, "epoch": 2713} {"train_loss": -42.689701080322266, "global_step": 328326, "epoch": 2713} {"train_loss": -42.32297897338867, "global_step": 328327, "epoch": 2713} {"train_loss": -42.67681884765625, "global_step": 328328, "epoch": 2713} {"train_loss": -41.097652435302734, "global_step": 328329, "epoch": 2713} {"train_loss": -42.82756423950195, "global_step": 328330, "epoch": 2713} {"train_loss": -43.48810577392578, "global_step": 328331, "epoch": 2713} {"train_loss": -42.940650939941406, "global_step": 328332, "epoch": 2713} {"train_loss": -43.36980438232422, "global_step": 328333, "epoch": 2713} {"train_loss": -42.65165328979492, "global_step": 328334, "epoch": 2713} {"train_loss": -43.21063995361328, "global_step": 328335, "epoch": 2713} {"train_loss": -43.025306701660156, "global_step": 328336, "epoch": 2713} {"train_loss": -43.23672103881836, "global_step": 328337, "epoch": 2713} {"train_loss": -42.88407516479492, "global_step": 328338, "epoch": 2713} {"train_loss": -43.05820846557617, "global_step": 328339, "epoch": 2713} {"train_loss": -43.29520797729492, "global_step": 328340, "epoch": 2713} {"train_loss": -43.84468460083008, "global_step": 328341, "epoch": 2713} {"train_loss": -43.61069869995117, "global_step": 328342, "epoch": 2713} {"train_loss": -43.76218795776367, "global_step": 328343, "epoch": 2713} {"train_loss": -43.152191162109375, "global_step": 328344, "epoch": 2713} {"train_loss": -43.145423889160156, "global_step": 328345, "epoch": 2713} {"train_loss": -42.175201416015625, "global_step": 328346, "epoch": 2713} {"train_loss": -43.552528381347656, "global_step": 328347, "epoch": 2713} {"train_loss": -42.36731719970703, "global_step": 328348, "epoch": 2713} {"train_loss": -43.04000473022461, "global_step": 328349, "epoch": 2713} {"train_loss": -42.91364669799805, "global_step": 328350, "epoch": 2713} {"train_loss": -43.10224533081055, "global_step": 328351, "epoch": 2713} {"train_loss": -43.18699264526367, "global_step": 328352, "epoch": 2713} {"train_loss": -44.02656173706055, "global_step": 328353, "epoch": 2713} {"train_loss": -43.88557052612305, "global_step": 328354, "epoch": 2713} {"train_loss": -42.97251510620117, "global_step": 328355, "epoch": 2713} {"train_loss": -43.629024505615234, "global_step": 328356, "epoch": 2713} {"train_loss": -43.446632385253906, "global_step": 328357, "epoch": 2713} {"train_loss": -43.283321380615234, "global_step": 328358, "epoch": 2713} {"train_loss": -43.449520111083984, "global_step": 328359, "epoch": 2713} {"train_loss": -42.90388107299805, "global_step": 328360, "epoch": 2713} {"train_loss": -43.5815544128418, "global_step": 328361, "epoch": 2713} {"train_loss": -43.902069091796875, "global_step": 328362, "epoch": 2713} {"train_loss": -43.51667022705078, "global_step": 328363, "epoch": 2713} {"train_loss": -44.221038818359375, "global_step": 328364, "epoch": 2713} {"train_loss": -43.59062576293945, "global_step": 328365, "epoch": 2713} {"train_loss": -43.62520980834961, "global_step": 328366, "epoch": 2713} {"train_loss": -43.59556579589844, "global_step": 328367, "epoch": 2713} {"train_loss": -43.628936767578125, "global_step": 328368, "epoch": 2713} {"train_loss": -43.88523483276367, "global_step": 328369, "epoch": 2713} {"train_loss": -43.3880729675293, "global_step": 328370, "epoch": 2713} {"train_loss": -42.961334228515625, "global_step": 328371, "epoch": 2713} {"train_loss": -43.72315216064453, "global_step": 328372, "epoch": 2713} {"train_loss": -43.79679489135742, "global_step": 328373, "epoch": 2713} {"train_loss": -43.41047668457031, "global_step": 328374, "epoch": 2713} {"train_loss": -44.29344177246094, "global_step": 328375, "epoch": 2713} {"train_loss": -43.865108489990234, "global_step": 328376, "epoch": 2713} {"train_loss": -44.44544982910156, "global_step": 328377, "epoch": 2713} {"train_loss": -43.196224212646484, "global_step": 328378, "epoch": 2713} {"train_loss": -43.01011657714844, "global_step": 328379, "epoch": 2713} {"train_loss": -42.978736877441406, "global_step": 328380, "epoch": 2713} {"train_loss": -43.46364974975586, "global_step": 328381, "epoch": 2713} {"train_loss": -42.314125061035156, "global_step": 328382, "epoch": 2713} {"train_loss": -43.891963958740234, "global_step": 328383, "epoch": 2713} {"train_loss": -43.437103271484375, "global_step": 328384, "epoch": 2713} {"train_loss": -42.68247604370117, "global_step": 328385, "epoch": 2713} {"train_loss": -41.07322311401367, "global_step": 328386, "epoch": 2713} {"train_loss": -40.27593994140625, "global_step": 328387, "epoch": 2713} {"train_loss": -39.3566780090332, "global_step": 328388, "epoch": 2713} {"train_loss": -41.15948486328125, "global_step": 328389, "epoch": 2713} {"train_loss": -41.79693603515625, "global_step": 328390, "epoch": 2713} {"train_loss": -43.38650131225586, "global_step": 328391, "epoch": 2713} {"train_loss": -41.92009353637695, "global_step": 328392, "epoch": 2713} {"train_loss": -42.211111935702235, "global_step": 328393, "epoch": 2713, "val_loss": 2618610.0} {"train_loss": -42.66899490356445, "global_step": 328394, "epoch": 2714} {"train_loss": -43.25843811035156, "global_step": 328395, "epoch": 2714} {"train_loss": -42.7481689453125, "global_step": 328396, "epoch": 2714} {"train_loss": -42.270652770996094, "global_step": 328397, "epoch": 2714} {"train_loss": -42.65789031982422, "global_step": 328398, "epoch": 2714} {"train_loss": -43.68474197387695, "global_step": 328399, "epoch": 2714} {"train_loss": -42.588130950927734, "global_step": 328400, "epoch": 2714} {"train_loss": -42.18685531616211, "global_step": 328401, "epoch": 2714} {"train_loss": -42.879608154296875, "global_step": 328402, "epoch": 2714} {"train_loss": -42.30477523803711, "global_step": 328403, "epoch": 2714} {"train_loss": -41.8969612121582, "global_step": 328404, "epoch": 2714} {"train_loss": -42.84226989746094, "global_step": 328405, "epoch": 2714} {"train_loss": -43.00310134887695, "global_step": 328406, "epoch": 2714} {"train_loss": -41.979339599609375, "global_step": 328407, "epoch": 2714} {"train_loss": -42.5457763671875, "global_step": 328408, "epoch": 2714} {"train_loss": -43.191097259521484, "global_step": 328409, "epoch": 2714} {"train_loss": -43.42373275756836, "global_step": 328410, "epoch": 2714} {"train_loss": -43.069766998291016, "global_step": 328411, "epoch": 2714} {"train_loss": -42.68999099731445, "global_step": 328412, "epoch": 2714} {"train_loss": -42.60332107543945, "global_step": 328413, "epoch": 2714} {"train_loss": -42.56915283203125, "global_step": 328414, "epoch": 2714} {"train_loss": -43.11025619506836, "global_step": 328415, "epoch": 2714} {"train_loss": -42.751216888427734, "global_step": 328416, "epoch": 2714} {"train_loss": -43.104427337646484, "global_step": 328417, "epoch": 2714} {"train_loss": -43.28660202026367, "global_step": 328418, "epoch": 2714} {"train_loss": -41.771331787109375, "global_step": 328419, "epoch": 2714} {"train_loss": -40.55261993408203, "global_step": 328420, "epoch": 2714} {"train_loss": -42.006256103515625, "global_step": 328421, "epoch": 2714} {"train_loss": -42.257503509521484, "global_step": 328422, "epoch": 2714} {"train_loss": -41.93357467651367, "global_step": 328423, "epoch": 2714} {"train_loss": -42.423553466796875, "global_step": 328424, "epoch": 2714} {"train_loss": -42.14540481567383, "global_step": 328425, "epoch": 2714} {"train_loss": -40.64602279663086, "global_step": 328426, "epoch": 2714} {"train_loss": -42.879920959472656, "global_step": 328427, "epoch": 2714} {"train_loss": -43.18150329589844, "global_step": 328428, "epoch": 2714} {"train_loss": -41.16373825073242, "global_step": 328429, "epoch": 2714} {"train_loss": -42.845428466796875, "global_step": 328430, "epoch": 2714} {"train_loss": -42.147254943847656, "global_step": 328431, "epoch": 2714} {"train_loss": -41.58869552612305, "global_step": 328432, "epoch": 2714} {"train_loss": -42.14307403564453, "global_step": 328433, "epoch": 2714} {"train_loss": -42.626976013183594, "global_step": 328434, "epoch": 2714} {"train_loss": -43.01521682739258, "global_step": 328435, "epoch": 2714} {"train_loss": -41.960174560546875, "global_step": 328436, "epoch": 2714} {"train_loss": -42.542842864990234, "global_step": 328437, "epoch": 2714} {"train_loss": -43.409942626953125, "global_step": 328438, "epoch": 2714} {"train_loss": -42.486629486083984, "global_step": 328439, "epoch": 2714} {"train_loss": -43.662841796875, "global_step": 328440, "epoch": 2714} {"train_loss": -42.221309661865234, "global_step": 328441, "epoch": 2714} {"train_loss": -43.32333755493164, "global_step": 328442, "epoch": 2714} {"train_loss": -42.56172561645508, "global_step": 328443, "epoch": 2714} {"train_loss": -42.31593704223633, "global_step": 328444, "epoch": 2714} {"train_loss": -41.729034423828125, "global_step": 328445, "epoch": 2714} {"train_loss": -42.18600082397461, "global_step": 328446, "epoch": 2714} {"train_loss": -41.623374938964844, "global_step": 328447, "epoch": 2714} {"train_loss": -43.1304931640625, "global_step": 328448, "epoch": 2714} {"train_loss": -40.5324821472168, "global_step": 328449, "epoch": 2714} {"train_loss": -43.53517532348633, "global_step": 328450, "epoch": 2714} {"train_loss": -42.84069061279297, "global_step": 328451, "epoch": 2714} {"train_loss": -42.44355010986328, "global_step": 328452, "epoch": 2714} {"train_loss": -41.9666633605957, "global_step": 328453, "epoch": 2714} {"train_loss": -43.263790130615234, "global_step": 328454, "epoch": 2714} {"train_loss": -40.856746673583984, "global_step": 328455, "epoch": 2714} {"train_loss": -41.560760498046875, "global_step": 328456, "epoch": 2714} {"train_loss": -43.56972885131836, "global_step": 328457, "epoch": 2714} {"train_loss": -41.159080505371094, "global_step": 328458, "epoch": 2714} {"train_loss": -42.51615524291992, "global_step": 328459, "epoch": 2714} {"train_loss": -42.192298889160156, "global_step": 328460, "epoch": 2714} {"train_loss": -42.69985580444336, "global_step": 328461, "epoch": 2714} {"train_loss": -43.29462432861328, "global_step": 328462, "epoch": 2714} {"train_loss": -43.14204025268555, "global_step": 328463, "epoch": 2714} {"train_loss": -42.929176330566406, "global_step": 328464, "epoch": 2714} {"train_loss": -41.82474899291992, "global_step": 328465, "epoch": 2714} {"train_loss": -43.12427520751953, "global_step": 328466, "epoch": 2714} {"train_loss": -42.821712493896484, "global_step": 328467, "epoch": 2714} {"train_loss": -42.63242721557617, "global_step": 328468, "epoch": 2714} {"train_loss": -43.55866622924805, "global_step": 328469, "epoch": 2714} {"train_loss": -42.65665817260742, "global_step": 328470, "epoch": 2714} {"train_loss": -43.14913558959961, "global_step": 328471, "epoch": 2714} {"train_loss": -43.53339385986328, "global_step": 328472, "epoch": 2714} {"train_loss": -43.263893127441406, "global_step": 328473, "epoch": 2714} {"train_loss": -43.12010192871094, "global_step": 328474, "epoch": 2714} {"train_loss": -43.44735336303711, "global_step": 328475, "epoch": 2714} {"train_loss": -43.83938980102539, "global_step": 328476, "epoch": 2714} {"train_loss": -43.338130950927734, "global_step": 328477, "epoch": 2714} {"train_loss": -43.63901901245117, "global_step": 328478, "epoch": 2714} {"train_loss": -44.20327377319336, "global_step": 328479, "epoch": 2714} {"train_loss": -43.82465744018555, "global_step": 328480, "epoch": 2714} {"train_loss": -43.55657958984375, "global_step": 328481, "epoch": 2714} {"train_loss": -43.203765869140625, "global_step": 328482, "epoch": 2714} {"train_loss": -43.900455474853516, "global_step": 328483, "epoch": 2714} {"train_loss": -43.78571319580078, "global_step": 328484, "epoch": 2714} {"train_loss": -43.6413459777832, "global_step": 328485, "epoch": 2714} {"train_loss": -43.936744689941406, "global_step": 328486, "epoch": 2714} {"train_loss": -43.53752517700195, "global_step": 328487, "epoch": 2714} {"train_loss": -43.833736419677734, "global_step": 328488, "epoch": 2714} {"train_loss": -44.14557647705078, "global_step": 328489, "epoch": 2714} {"train_loss": -43.79594039916992, "global_step": 328490, "epoch": 2714} {"train_loss": -44.429107666015625, "global_step": 328491, "epoch": 2714} {"train_loss": -43.9224853515625, "global_step": 328492, "epoch": 2714} {"train_loss": -44.14907455444336, "global_step": 328493, "epoch": 2714} {"train_loss": -44.19474411010742, "global_step": 328494, "epoch": 2714} {"train_loss": -43.29841995239258, "global_step": 328495, "epoch": 2714} {"train_loss": -43.55531692504883, "global_step": 328496, "epoch": 2714} {"train_loss": -44.536800384521484, "global_step": 328497, "epoch": 2714} {"train_loss": -43.77391052246094, "global_step": 328498, "epoch": 2714} {"train_loss": -44.369632720947266, "global_step": 328499, "epoch": 2714} {"train_loss": -43.49146270751953, "global_step": 328500, "epoch": 2714} {"train_loss": -43.74895095825195, "global_step": 328501, "epoch": 2714} {"train_loss": -43.90232467651367, "global_step": 328502, "epoch": 2714} {"train_loss": -44.182613372802734, "global_step": 328503, "epoch": 2714} {"train_loss": -43.25175857543945, "global_step": 328504, "epoch": 2714} {"train_loss": -43.71229934692383, "global_step": 328505, "epoch": 2714} {"train_loss": -44.4780158996582, "global_step": 328506, "epoch": 2714} {"train_loss": -44.34061813354492, "global_step": 328507, "epoch": 2714} {"train_loss": -43.26395797729492, "global_step": 328508, "epoch": 2714} {"train_loss": -41.768123626708984, "global_step": 328509, "epoch": 2714} {"train_loss": -41.26395034790039, "global_step": 328510, "epoch": 2714} {"train_loss": -43.03484344482422, "global_step": 328511, "epoch": 2714} {"train_loss": -43.943904876708984, "global_step": 328512, "epoch": 2714} {"train_loss": -43.69915771484375, "global_step": 328513, "epoch": 2714} {"train_loss": -42.9239998494298, "global_step": 328514, "epoch": 2714, "val_loss": 2672673.75} {"train_loss": -44.2495002746582, "global_step": 328515, "epoch": 2715} {"train_loss": -43.79793930053711, "global_step": 328516, "epoch": 2715} {"train_loss": -43.805538177490234, "global_step": 328517, "epoch": 2715} {"train_loss": -43.13753890991211, "global_step": 328518, "epoch": 2715} {"train_loss": -37.64807891845703, "global_step": 328519, "epoch": 2715} {"train_loss": -41.557193756103516, "global_step": 328520, "epoch": 2715} {"train_loss": -41.31771469116211, "global_step": 328521, "epoch": 2715} {"train_loss": -42.86945724487305, "global_step": 328522, "epoch": 2715} {"train_loss": -9.195199966430664, "global_step": 328523, "epoch": 2715} {"train_loss": -28.706857681274414, "global_step": 328524, "epoch": 2715} {"train_loss": -34.30134201049805, "global_step": 328525, "epoch": 2715} {"train_loss": -38.91328048706055, "global_step": 328526, "epoch": 2715} {"train_loss": -33.87946319580078, "global_step": 328527, "epoch": 2715} {"train_loss": -37.18360900878906, "global_step": 328528, "epoch": 2715} {"train_loss": -38.130802154541016, "global_step": 328529, "epoch": 2715} {"train_loss": -34.040550231933594, "global_step": 328530, "epoch": 2715} {"train_loss": -40.516380310058594, "global_step": 328531, "epoch": 2715} {"train_loss": -34.79652786254883, "global_step": 328532, "epoch": 2715} {"train_loss": -36.94719314575195, "global_step": 328533, "epoch": 2715} {"train_loss": -36.9935302734375, "global_step": 328534, "epoch": 2715} {"train_loss": -40.59123611450195, "global_step": 328535, "epoch": 2715} {"train_loss": -38.416561126708984, "global_step": 328536, "epoch": 2715} {"train_loss": -39.66771697998047, "global_step": 328537, "epoch": 2715} {"train_loss": -39.23434066772461, "global_step": 328538, "epoch": 2715} {"train_loss": -39.56132125854492, "global_step": 328539, "epoch": 2715} {"train_loss": -40.45588302612305, "global_step": 328540, "epoch": 2715} {"train_loss": -40.67295455932617, "global_step": 328541, "epoch": 2715} {"train_loss": -40.904598236083984, "global_step": 328542, "epoch": 2715} {"train_loss": -41.582332611083984, "global_step": 328543, "epoch": 2715} {"train_loss": -40.31203842163086, "global_step": 328544, "epoch": 2715} {"train_loss": -41.41707229614258, "global_step": 328545, "epoch": 2715} {"train_loss": -40.979183197021484, "global_step": 328546, "epoch": 2715} {"train_loss": -40.784912109375, "global_step": 328547, "epoch": 2715} {"train_loss": -40.89632034301758, "global_step": 328548, "epoch": 2715} {"train_loss": -41.45146179199219, "global_step": 328549, "epoch": 2715} {"train_loss": -38.88785171508789, "global_step": 328550, "epoch": 2715} {"train_loss": -41.361114501953125, "global_step": 328551, "epoch": 2715} {"train_loss": -41.91917037963867, "global_step": 328552, "epoch": 2715} {"train_loss": -42.526023864746094, "global_step": 328553, "epoch": 2715} {"train_loss": -41.936500549316406, "global_step": 328554, "epoch": 2715} {"train_loss": -41.70984649658203, "global_step": 328555, "epoch": 2715} {"train_loss": -41.26353454589844, "global_step": 328556, "epoch": 2715} {"train_loss": -42.60361862182617, "global_step": 328557, "epoch": 2715} {"train_loss": -42.03449630737305, "global_step": 328558, "epoch": 2715} {"train_loss": -41.9207649230957, "global_step": 328559, "epoch": 2715} {"train_loss": -42.20198440551758, "global_step": 328560, "epoch": 2715} {"train_loss": -42.48084259033203, "global_step": 328561, "epoch": 2715} {"train_loss": -42.2230339050293, "global_step": 328562, "epoch": 2715} {"train_loss": -41.31209945678711, "global_step": 328563, "epoch": 2715} {"train_loss": -42.84816360473633, "global_step": 328564, "epoch": 2715} {"train_loss": -42.37563705444336, "global_step": 328565, "epoch": 2715} {"train_loss": -42.87746810913086, "global_step": 328566, "epoch": 2715} {"train_loss": -42.234432220458984, "global_step": 328567, "epoch": 2715} {"train_loss": -42.50972366333008, "global_step": 328568, "epoch": 2715} {"train_loss": -42.582679748535156, "global_step": 328569, "epoch": 2715} {"train_loss": -42.94401168823242, "global_step": 328570, "epoch": 2715} {"train_loss": -43.08552932739258, "global_step": 328571, "epoch": 2715} {"train_loss": -42.76599884033203, "global_step": 328572, "epoch": 2715} {"train_loss": -43.08784103393555, "global_step": 328573, "epoch": 2715} {"train_loss": -42.782806396484375, "global_step": 328574, "epoch": 2715} {"train_loss": -43.30194091796875, "global_step": 328575, "epoch": 2715} {"train_loss": -43.36099624633789, "global_step": 328576, "epoch": 2715} {"train_loss": -43.21796417236328, "global_step": 328577, "epoch": 2715} {"train_loss": -43.06269454956055, "global_step": 328578, "epoch": 2715} {"train_loss": -43.35539245605469, "global_step": 328579, "epoch": 2715} {"train_loss": -43.265838623046875, "global_step": 328580, "epoch": 2715} {"train_loss": -43.66695022583008, "global_step": 328581, "epoch": 2715} {"train_loss": -43.7166862487793, "global_step": 328582, "epoch": 2715} {"train_loss": -42.8268928527832, "global_step": 328583, "epoch": 2715} {"train_loss": -42.93597412109375, "global_step": 328584, "epoch": 2715} {"train_loss": -43.133846282958984, "global_step": 328585, "epoch": 2715} {"train_loss": -43.63944625854492, "global_step": 328586, "epoch": 2715} {"train_loss": -43.70938491821289, "global_step": 328587, "epoch": 2715} {"train_loss": -43.84164047241211, "global_step": 328588, "epoch": 2715} {"train_loss": -43.21455764770508, "global_step": 328589, "epoch": 2715} {"train_loss": -43.78468322753906, "global_step": 328590, "epoch": 2715} {"train_loss": -43.8341178894043, "global_step": 328591, "epoch": 2715} {"train_loss": -43.17959213256836, "global_step": 328592, "epoch": 2715} {"train_loss": -43.86427688598633, "global_step": 328593, "epoch": 2715} {"train_loss": -44.1992073059082, "global_step": 328594, "epoch": 2715} {"train_loss": -43.60435485839844, "global_step": 328595, "epoch": 2715} {"train_loss": -42.94818115234375, "global_step": 328596, "epoch": 2715} {"train_loss": -43.9426383972168, "global_step": 328597, "epoch": 2715} {"train_loss": -44.19887161254883, "global_step": 328598, "epoch": 2715} {"train_loss": -44.055320739746094, "global_step": 328599, "epoch": 2715} {"train_loss": -43.99522018432617, "global_step": 328600, "epoch": 2715} {"train_loss": -43.471099853515625, "global_step": 328601, "epoch": 2715} {"train_loss": -44.16470718383789, "global_step": 328602, "epoch": 2715} {"train_loss": -44.04751205444336, "global_step": 328603, "epoch": 2715} {"train_loss": -44.1773796081543, "global_step": 328604, "epoch": 2715} {"train_loss": -44.004112243652344, "global_step": 328605, "epoch": 2715} {"train_loss": -40.12253952026367, "global_step": 328606, "epoch": 2715} {"train_loss": -43.66592025756836, "global_step": 328607, "epoch": 2715} {"train_loss": -44.16114044189453, "global_step": 328608, "epoch": 2715} {"train_loss": -44.072872161865234, "global_step": 328609, "epoch": 2715} {"train_loss": -44.539955139160156, "global_step": 328610, "epoch": 2715} {"train_loss": -44.17694854736328, "global_step": 328611, "epoch": 2715} {"train_loss": -44.04238510131836, "global_step": 328612, "epoch": 2715} {"train_loss": -44.18476867675781, "global_step": 328613, "epoch": 2715} {"train_loss": -44.216068267822266, "global_step": 328614, "epoch": 2715} {"train_loss": -44.21097946166992, "global_step": 328615, "epoch": 2715} {"train_loss": -43.01055908203125, "global_step": 328616, "epoch": 2715} {"train_loss": -44.04597091674805, "global_step": 328617, "epoch": 2715} {"train_loss": -44.1677360534668, "global_step": 328618, "epoch": 2715} {"train_loss": -44.56553268432617, "global_step": 328619, "epoch": 2715} {"train_loss": -44.048954010009766, "global_step": 328620, "epoch": 2715} {"train_loss": -44.37672424316406, "global_step": 328621, "epoch": 2715} {"train_loss": -42.898860931396484, "global_step": 328622, "epoch": 2715} {"train_loss": -44.43120193481445, "global_step": 328623, "epoch": 2715} {"train_loss": -41.97243118286133, "global_step": 328624, "epoch": 2715} {"train_loss": -41.829769134521484, "global_step": 328625, "epoch": 2715} {"train_loss": -40.83828353881836, "global_step": 328626, "epoch": 2715} {"train_loss": -43.877193450927734, "global_step": 328627, "epoch": 2715} {"train_loss": -43.744503021240234, "global_step": 328628, "epoch": 2715} {"train_loss": -43.66323471069336, "global_step": 328629, "epoch": 2715} {"train_loss": -43.92715835571289, "global_step": 328630, "epoch": 2715} {"train_loss": -43.847930908203125, "global_step": 328631, "epoch": 2715} {"train_loss": -44.152587890625, "global_step": 328632, "epoch": 2715} {"train_loss": -44.085052490234375, "global_step": 328633, "epoch": 2715} {"train_loss": -43.529571533203125, "global_step": 328634, "epoch": 2715} {"train_loss": -41.825141654526895, "global_step": 328635, "epoch": 2715, "val_loss": 2670241.0} {"train_loss": -41.7411994934082, "global_step": 328636, "epoch": 2716} {"train_loss": -42.65278244018555, "global_step": 328637, "epoch": 2716} {"train_loss": -43.06644821166992, "global_step": 328638, "epoch": 2716} {"train_loss": -43.835323333740234, "global_step": 328639, "epoch": 2716} {"train_loss": -41.88389205932617, "global_step": 328640, "epoch": 2716} {"train_loss": -42.301124572753906, "global_step": 328641, "epoch": 2716} {"train_loss": -43.37803649902344, "global_step": 328642, "epoch": 2716} {"train_loss": -43.07693099975586, "global_step": 328643, "epoch": 2716} {"train_loss": -40.554473876953125, "global_step": 328644, "epoch": 2716} {"train_loss": -43.135860443115234, "global_step": 328645, "epoch": 2716} {"train_loss": -42.204044342041016, "global_step": 328646, "epoch": 2716} {"train_loss": -40.05664825439453, "global_step": 328647, "epoch": 2716} {"train_loss": -41.38779067993164, "global_step": 328648, "epoch": 2716} {"train_loss": -42.18308639526367, "global_step": 328649, "epoch": 2716} {"train_loss": -42.3378791809082, "global_step": 328650, "epoch": 2716} {"train_loss": -42.71343994140625, "global_step": 328651, "epoch": 2716} {"train_loss": -43.993343353271484, "global_step": 328652, "epoch": 2716} {"train_loss": -42.7567253112793, "global_step": 328653, "epoch": 2716} {"train_loss": -42.95195770263672, "global_step": 328654, "epoch": 2716} {"train_loss": -43.487525939941406, "global_step": 328655, "epoch": 2716} {"train_loss": -42.59149169921875, "global_step": 328656, "epoch": 2716} {"train_loss": -43.49930953979492, "global_step": 328657, "epoch": 2716} {"train_loss": -43.48689270019531, "global_step": 328658, "epoch": 2716} {"train_loss": -43.719573974609375, "global_step": 328659, "epoch": 2716} {"train_loss": -42.65910339355469, "global_step": 328660, "epoch": 2716} {"train_loss": -43.62221908569336, "global_step": 328661, "epoch": 2716} {"train_loss": -35.65949630737305, "global_step": 328662, "epoch": 2716} {"train_loss": -44.08295822143555, "global_step": 328663, "epoch": 2716} {"train_loss": -43.2071533203125, "global_step": 328664, "epoch": 2716} {"train_loss": -42.417030334472656, "global_step": 328665, "epoch": 2716} {"train_loss": -43.5479736328125, "global_step": 328666, "epoch": 2716} {"train_loss": -41.40725326538086, "global_step": 328667, "epoch": 2716} {"train_loss": -43.419734954833984, "global_step": 328668, "epoch": 2716} {"train_loss": -43.28829574584961, "global_step": 328669, "epoch": 2716} {"train_loss": -43.94242477416992, "global_step": 328670, "epoch": 2716} {"train_loss": -42.26887512207031, "global_step": 328671, "epoch": 2716} {"train_loss": -43.554317474365234, "global_step": 328672, "epoch": 2716} {"train_loss": -43.23594284057617, "global_step": 328673, "epoch": 2716} {"train_loss": -42.06846618652344, "global_step": 328674, "epoch": 2716} {"train_loss": -42.83464813232422, "global_step": 328675, "epoch": 2716} {"train_loss": -43.300018310546875, "global_step": 328676, "epoch": 2716} {"train_loss": -42.99160385131836, "global_step": 328677, "epoch": 2716} {"train_loss": -43.16389465332031, "global_step": 328678, "epoch": 2716} {"train_loss": -43.98639678955078, "global_step": 328679, "epoch": 2716} {"train_loss": -43.073856353759766, "global_step": 328680, "epoch": 2716} {"train_loss": -44.38045120239258, "global_step": 328681, "epoch": 2716} {"train_loss": -43.50264358520508, "global_step": 328682, "epoch": 2716} {"train_loss": -43.84769821166992, "global_step": 328683, "epoch": 2716} {"train_loss": -44.05306625366211, "global_step": 328684, "epoch": 2716} {"train_loss": -43.80903244018555, "global_step": 328685, "epoch": 2716} {"train_loss": -43.84122848510742, "global_step": 328686, "epoch": 2716} {"train_loss": -44.074440002441406, "global_step": 328687, "epoch": 2716} {"train_loss": -41.97275161743164, "global_step": 328688, "epoch": 2716} {"train_loss": -41.51741409301758, "global_step": 328689, "epoch": 2716} {"train_loss": -42.603294372558594, "global_step": 328690, "epoch": 2716} {"train_loss": -43.35697937011719, "global_step": 328691, "epoch": 2716} {"train_loss": -43.11869430541992, "global_step": 328692, "epoch": 2716} {"train_loss": -43.314186096191406, "global_step": 328693, "epoch": 2716} {"train_loss": -43.83921432495117, "global_step": 328694, "epoch": 2716} {"train_loss": -43.30974578857422, "global_step": 328695, "epoch": 2716} {"train_loss": -44.561920166015625, "global_step": 328696, "epoch": 2716} {"train_loss": -42.401790618896484, "global_step": 328697, "epoch": 2716} {"train_loss": -42.83576583862305, "global_step": 328698, "epoch": 2716} {"train_loss": -44.528255462646484, "global_step": 328699, "epoch": 2716} {"train_loss": -43.81721878051758, "global_step": 328700, "epoch": 2716} {"train_loss": -43.70253372192383, "global_step": 328701, "epoch": 2716} {"train_loss": -43.76173400878906, "global_step": 328702, "epoch": 2716} {"train_loss": -43.874244689941406, "global_step": 328703, "epoch": 2716} {"train_loss": -43.072601318359375, "global_step": 328704, "epoch": 2716} {"train_loss": -43.92046356201172, "global_step": 328705, "epoch": 2716} {"train_loss": -43.60274887084961, "global_step": 328706, "epoch": 2716} {"train_loss": -43.262699127197266, "global_step": 328707, "epoch": 2716} {"train_loss": -42.15217208862305, "global_step": 328708, "epoch": 2716} {"train_loss": -43.482887268066406, "global_step": 328709, "epoch": 2716} {"train_loss": -43.74776840209961, "global_step": 328710, "epoch": 2716} {"train_loss": -43.098876953125, "global_step": 328711, "epoch": 2716} {"train_loss": -44.407569885253906, "global_step": 328712, "epoch": 2716} {"train_loss": -44.223388671875, "global_step": 328713, "epoch": 2716} {"train_loss": -43.32014846801758, "global_step": 328714, "epoch": 2716} {"train_loss": -43.84017562866211, "global_step": 328715, "epoch": 2716} {"train_loss": -43.49931716918945, "global_step": 328716, "epoch": 2716} {"train_loss": -43.2367057800293, "global_step": 328717, "epoch": 2716} {"train_loss": -43.80645751953125, "global_step": 328718, "epoch": 2716} {"train_loss": -42.95424270629883, "global_step": 328719, "epoch": 2716} {"train_loss": -42.041011810302734, "global_step": 328720, "epoch": 2716} {"train_loss": -43.226661682128906, "global_step": 328721, "epoch": 2716} {"train_loss": -44.30592727661133, "global_step": 328722, "epoch": 2716} {"train_loss": -41.920501708984375, "global_step": 328723, "epoch": 2716} {"train_loss": -43.912899017333984, "global_step": 328724, "epoch": 2716} {"train_loss": -43.705928802490234, "global_step": 328725, "epoch": 2716} {"train_loss": -43.78915023803711, "global_step": 328726, "epoch": 2716} {"train_loss": -43.36693572998047, "global_step": 328727, "epoch": 2716} {"train_loss": -43.560768127441406, "global_step": 328728, "epoch": 2716} {"train_loss": -43.84433364868164, "global_step": 328729, "epoch": 2716} {"train_loss": -41.595794677734375, "global_step": 328730, "epoch": 2716} {"train_loss": -43.72746658325195, "global_step": 328731, "epoch": 2716} {"train_loss": -44.559322357177734, "global_step": 328732, "epoch": 2716} {"train_loss": -42.819637298583984, "global_step": 328733, "epoch": 2716} {"train_loss": -42.87917709350586, "global_step": 328734, "epoch": 2716} {"train_loss": -43.876365661621094, "global_step": 328735, "epoch": 2716} {"train_loss": -42.143409729003906, "global_step": 328736, "epoch": 2716} {"train_loss": -43.74639129638672, "global_step": 328737, "epoch": 2716} {"train_loss": -43.83407211303711, "global_step": 328738, "epoch": 2716} {"train_loss": -44.25727462768555, "global_step": 328739, "epoch": 2716} {"train_loss": -43.88053512573242, "global_step": 328740, "epoch": 2716} {"train_loss": -44.194496154785156, "global_step": 328741, "epoch": 2716} {"train_loss": -43.77701950073242, "global_step": 328742, "epoch": 2716} {"train_loss": -43.6030158996582, "global_step": 328743, "epoch": 2716} {"train_loss": -44.56227493286133, "global_step": 328744, "epoch": 2716} {"train_loss": -43.95444869995117, "global_step": 328745, "epoch": 2716} {"train_loss": -43.3812370300293, "global_step": 328746, "epoch": 2716} {"train_loss": -43.699947357177734, "global_step": 328747, "epoch": 2716} {"train_loss": -44.17464065551758, "global_step": 328748, "epoch": 2716} {"train_loss": -44.14223098754883, "global_step": 328749, "epoch": 2716} {"train_loss": -44.41636276245117, "global_step": 328750, "epoch": 2716} {"train_loss": -44.33060836791992, "global_step": 328751, "epoch": 2716} {"train_loss": -43.85234451293945, "global_step": 328752, "epoch": 2716} {"train_loss": -44.61090850830078, "global_step": 328753, "epoch": 2716} {"train_loss": -43.976593017578125, "global_step": 328754, "epoch": 2716} {"train_loss": -43.3029670715332, "global_step": 328755, "epoch": 2716} {"train_loss": -43.220247757336324, "global_step": 328756, "epoch": 2716, "val_loss": 2695783.75} {"train_loss": -42.797767639160156, "global_step": 328757, "epoch": 2717} {"train_loss": -44.25682830810547, "global_step": 328758, "epoch": 2717} {"train_loss": -42.37211608886719, "global_step": 328759, "epoch": 2717} {"train_loss": -40.41477584838867, "global_step": 328760, "epoch": 2717} {"train_loss": -41.13425064086914, "global_step": 328761, "epoch": 2717} {"train_loss": -42.25046157836914, "global_step": 328762, "epoch": 2717} {"train_loss": -40.98899459838867, "global_step": 328763, "epoch": 2717} {"train_loss": -41.862098693847656, "global_step": 328764, "epoch": 2717} {"train_loss": -43.166099548339844, "global_step": 328765, "epoch": 2717} {"train_loss": -43.330650329589844, "global_step": 328766, "epoch": 2717} {"train_loss": -42.528114318847656, "global_step": 328767, "epoch": 2717} {"train_loss": -43.19135665893555, "global_step": 328768, "epoch": 2717} {"train_loss": -43.45353317260742, "global_step": 328769, "epoch": 2717} {"train_loss": -43.29934310913086, "global_step": 328770, "epoch": 2717} {"train_loss": -43.40367126464844, "global_step": 328771, "epoch": 2717} {"train_loss": -43.087764739990234, "global_step": 328772, "epoch": 2717} {"train_loss": -43.35493087768555, "global_step": 328773, "epoch": 2717} {"train_loss": -43.07990264892578, "global_step": 328774, "epoch": 2717} {"train_loss": -43.23643112182617, "global_step": 328775, "epoch": 2717} {"train_loss": -43.26569366455078, "global_step": 328776, "epoch": 2717} {"train_loss": -43.16534423828125, "global_step": 328777, "epoch": 2717} {"train_loss": -43.596229553222656, "global_step": 328778, "epoch": 2717} {"train_loss": -43.193756103515625, "global_step": 328779, "epoch": 2717} {"train_loss": -43.025146484375, "global_step": 328780, "epoch": 2717} {"train_loss": -44.0823974609375, "global_step": 328781, "epoch": 2717} {"train_loss": -43.59896469116211, "global_step": 328782, "epoch": 2717} {"train_loss": -43.42171859741211, "global_step": 328783, "epoch": 2717} {"train_loss": -43.176177978515625, "global_step": 328784, "epoch": 2717} {"train_loss": -43.622562408447266, "global_step": 328785, "epoch": 2717} {"train_loss": -42.70341110229492, "global_step": 328786, "epoch": 2717} {"train_loss": -43.53092956542969, "global_step": 328787, "epoch": 2717} {"train_loss": -43.692718505859375, "global_step": 328788, "epoch": 2717} {"train_loss": -43.35494613647461, "global_step": 328789, "epoch": 2717} {"train_loss": -43.665470123291016, "global_step": 328790, "epoch": 2717} {"train_loss": -42.7617301940918, "global_step": 328791, "epoch": 2717} {"train_loss": -43.3125114440918, "global_step": 328792, "epoch": 2717} {"train_loss": -43.97189712524414, "global_step": 328793, "epoch": 2717} {"train_loss": -42.004512786865234, "global_step": 328794, "epoch": 2717} {"train_loss": -42.84218215942383, "global_step": 328795, "epoch": 2717} {"train_loss": -43.13381576538086, "global_step": 328796, "epoch": 2717} {"train_loss": -43.28269577026367, "global_step": 328797, "epoch": 2717} {"train_loss": -43.27478790283203, "global_step": 328798, "epoch": 2717} {"train_loss": -43.377349853515625, "global_step": 328799, "epoch": 2717} {"train_loss": -43.12665557861328, "global_step": 328800, "epoch": 2717} {"train_loss": -43.3965950012207, "global_step": 328801, "epoch": 2717} {"train_loss": -43.21333312988281, "global_step": 328802, "epoch": 2717} {"train_loss": -42.94420623779297, "global_step": 328803, "epoch": 2717} {"train_loss": -42.89862823486328, "global_step": 328804, "epoch": 2717} {"train_loss": -43.53752517700195, "global_step": 328805, "epoch": 2717} {"train_loss": -43.119632720947266, "global_step": 328806, "epoch": 2717} {"train_loss": -42.8409423828125, "global_step": 328807, "epoch": 2717} {"train_loss": -42.65058517456055, "global_step": 328808, "epoch": 2717} {"train_loss": -43.528114318847656, "global_step": 328809, "epoch": 2717} {"train_loss": -43.25407791137695, "global_step": 328810, "epoch": 2717} {"train_loss": -41.693599700927734, "global_step": 328811, "epoch": 2717} {"train_loss": -41.47077560424805, "global_step": 328812, "epoch": 2717} {"train_loss": -43.168758392333984, "global_step": 328813, "epoch": 2717} {"train_loss": -43.32427978515625, "global_step": 328814, "epoch": 2717} {"train_loss": -42.93992233276367, "global_step": 328815, "epoch": 2717} {"train_loss": -42.17953109741211, "global_step": 328816, "epoch": 2717} {"train_loss": -43.28947067260742, "global_step": 328817, "epoch": 2717} {"train_loss": -41.250186920166016, "global_step": 328818, "epoch": 2717} {"train_loss": -43.402767181396484, "global_step": 328819, "epoch": 2717} {"train_loss": -40.62852096557617, "global_step": 328820, "epoch": 2717} {"train_loss": -43.62754440307617, "global_step": 328821, "epoch": 2717} {"train_loss": -42.11894226074219, "global_step": 328822, "epoch": 2717} {"train_loss": -42.649715423583984, "global_step": 328823, "epoch": 2717} {"train_loss": -42.185203552246094, "global_step": 328824, "epoch": 2717} {"train_loss": -43.39099884033203, "global_step": 328825, "epoch": 2717} {"train_loss": -42.7346076965332, "global_step": 328826, "epoch": 2717} {"train_loss": -42.27071762084961, "global_step": 328827, "epoch": 2717} {"train_loss": -42.367164611816406, "global_step": 328828, "epoch": 2717} {"train_loss": -41.71720886230469, "global_step": 328829, "epoch": 2717} {"train_loss": -43.3818359375, "global_step": 328830, "epoch": 2717} {"train_loss": -43.04578399658203, "global_step": 328831, "epoch": 2717} {"train_loss": -42.972782135009766, "global_step": 328832, "epoch": 2717} {"train_loss": -43.427940368652344, "global_step": 328833, "epoch": 2717} {"train_loss": -43.478065490722656, "global_step": 328834, "epoch": 2717} {"train_loss": -43.38888168334961, "global_step": 328835, "epoch": 2717} {"train_loss": -43.81549072265625, "global_step": 328836, "epoch": 2717} {"train_loss": -44.02552032470703, "global_step": 328837, "epoch": 2717} {"train_loss": -43.984676361083984, "global_step": 328838, "epoch": 2717} {"train_loss": -43.88239288330078, "global_step": 328839, "epoch": 2717} {"train_loss": -44.09880447387695, "global_step": 328840, "epoch": 2717} {"train_loss": -44.42559814453125, "global_step": 328841, "epoch": 2717} {"train_loss": -43.45270538330078, "global_step": 328842, "epoch": 2717} {"train_loss": -43.97316360473633, "global_step": 328843, "epoch": 2717} {"train_loss": -43.89996337890625, "global_step": 328844, "epoch": 2717} {"train_loss": -44.02363204956055, "global_step": 328845, "epoch": 2717} {"train_loss": -43.71869659423828, "global_step": 328846, "epoch": 2717} {"train_loss": -44.27220153808594, "global_step": 328847, "epoch": 2717} {"train_loss": -44.35335922241211, "global_step": 328848, "epoch": 2717} {"train_loss": -43.78456497192383, "global_step": 328849, "epoch": 2717} {"train_loss": -43.9808235168457, "global_step": 328850, "epoch": 2717} {"train_loss": -44.138973236083984, "global_step": 328851, "epoch": 2717} {"train_loss": -43.265926361083984, "global_step": 328852, "epoch": 2717} {"train_loss": -43.79805374145508, "global_step": 328853, "epoch": 2717} {"train_loss": -43.915550231933594, "global_step": 328854, "epoch": 2717} {"train_loss": -43.63808059692383, "global_step": 328855, "epoch": 2717} {"train_loss": -43.83545684814453, "global_step": 328856, "epoch": 2717} {"train_loss": -43.98579788208008, "global_step": 328857, "epoch": 2717} {"train_loss": -43.96319580078125, "global_step": 328858, "epoch": 2717} {"train_loss": -44.55974578857422, "global_step": 328859, "epoch": 2717} {"train_loss": -43.70058059692383, "global_step": 328860, "epoch": 2717} {"train_loss": -44.02302169799805, "global_step": 328861, "epoch": 2717} {"train_loss": -44.337005615234375, "global_step": 328862, "epoch": 2717} {"train_loss": -44.388851165771484, "global_step": 328863, "epoch": 2717} {"train_loss": -43.81083297729492, "global_step": 328864, "epoch": 2717} {"train_loss": -43.94172668457031, "global_step": 328865, "epoch": 2717} {"train_loss": -43.82557678222656, "global_step": 328866, "epoch": 2717} {"train_loss": -44.76346969604492, "global_step": 328867, "epoch": 2717} {"train_loss": -43.93717575073242, "global_step": 328868, "epoch": 2717} {"train_loss": -44.1113166809082, "global_step": 328869, "epoch": 2717} {"train_loss": -44.15850830078125, "global_step": 328870, "epoch": 2717} {"train_loss": -43.72746276855469, "global_step": 328871, "epoch": 2717} {"train_loss": -43.294795989990234, "global_step": 328872, "epoch": 2717} {"train_loss": -44.46025848388672, "global_step": 328873, "epoch": 2717} {"train_loss": -44.453033447265625, "global_step": 328874, "epoch": 2717} {"train_loss": -43.91179275512695, "global_step": 328875, "epoch": 2717} {"train_loss": -43.953102111816406, "global_step": 328876, "epoch": 2717} {"train_loss": -43.29005252428291, "global_step": 328877, "epoch": 2717, "val_loss": 2584855.25} {"train_loss": -44.39534378051758, "global_step": 328878, "epoch": 2718} {"train_loss": -44.70784378051758, "global_step": 328879, "epoch": 2718} {"train_loss": -43.34212875366211, "global_step": 328880, "epoch": 2718} {"train_loss": -43.50433349609375, "global_step": 328881, "epoch": 2718} {"train_loss": -42.91790008544922, "global_step": 328882, "epoch": 2718} {"train_loss": -43.796112060546875, "global_step": 328883, "epoch": 2718} {"train_loss": -44.36870193481445, "global_step": 328884, "epoch": 2718} {"train_loss": -43.795860290527344, "global_step": 328885, "epoch": 2718} {"train_loss": -43.33787155151367, "global_step": 328886, "epoch": 2718} {"train_loss": -43.81618881225586, "global_step": 328887, "epoch": 2718} {"train_loss": -44.01679992675781, "global_step": 328888, "epoch": 2718} {"train_loss": -44.16567611694336, "global_step": 328889, "epoch": 2718} {"train_loss": -43.94303512573242, "global_step": 328890, "epoch": 2718} {"train_loss": -42.149208068847656, "global_step": 328891, "epoch": 2718} {"train_loss": -43.080963134765625, "global_step": 328892, "epoch": 2718} {"train_loss": -43.9499626159668, "global_step": 328893, "epoch": 2718} {"train_loss": -43.59592056274414, "global_step": 328894, "epoch": 2718} {"train_loss": -41.48377227783203, "global_step": 328895, "epoch": 2718} {"train_loss": -42.18282699584961, "global_step": 328896, "epoch": 2718} {"train_loss": -41.942405700683594, "global_step": 328897, "epoch": 2718} {"train_loss": -42.8806266784668, "global_step": 328898, "epoch": 2718} {"train_loss": -42.792598724365234, "global_step": 328899, "epoch": 2718} {"train_loss": -40.94071578979492, "global_step": 328900, "epoch": 2718} {"train_loss": -41.04440689086914, "global_step": 328901, "epoch": 2718} {"train_loss": -42.1298942565918, "global_step": 328902, "epoch": 2718} {"train_loss": -43.80891418457031, "global_step": 328903, "epoch": 2718} {"train_loss": -42.871986389160156, "global_step": 328904, "epoch": 2718} {"train_loss": -43.02823257446289, "global_step": 328905, "epoch": 2718} {"train_loss": -43.28855514526367, "global_step": 328906, "epoch": 2718} {"train_loss": -42.94023513793945, "global_step": 328907, "epoch": 2718} {"train_loss": -39.07503128051758, "global_step": 328908, "epoch": 2718} {"train_loss": -40.97150802612305, "global_step": 328909, "epoch": 2718} {"train_loss": -42.820159912109375, "global_step": 328910, "epoch": 2718} {"train_loss": -39.292755126953125, "global_step": 328911, "epoch": 2718} {"train_loss": -39.11191940307617, "global_step": 328912, "epoch": 2718} {"train_loss": -42.3101806640625, "global_step": 328913, "epoch": 2718} {"train_loss": -42.03025436401367, "global_step": 328914, "epoch": 2718} {"train_loss": -38.80167770385742, "global_step": 328915, "epoch": 2718} {"train_loss": -41.18210220336914, "global_step": 328916, "epoch": 2718} {"train_loss": -42.143531799316406, "global_step": 328917, "epoch": 2718} {"train_loss": -38.32426452636719, "global_step": 328918, "epoch": 2718} {"train_loss": -41.358070373535156, "global_step": 328919, "epoch": 2718} {"train_loss": -42.296043395996094, "global_step": 328920, "epoch": 2718} {"train_loss": -41.1572380065918, "global_step": 328921, "epoch": 2718} {"train_loss": -42.53074264526367, "global_step": 328922, "epoch": 2718} {"train_loss": -41.58602523803711, "global_step": 328923, "epoch": 2718} {"train_loss": -42.96822738647461, "global_step": 328924, "epoch": 2718} {"train_loss": -41.944698333740234, "global_step": 328925, "epoch": 2718} {"train_loss": -42.13119125366211, "global_step": 328926, "epoch": 2718} {"train_loss": -43.119014739990234, "global_step": 328927, "epoch": 2718} {"train_loss": -42.532508850097656, "global_step": 328928, "epoch": 2718} {"train_loss": -43.36149597167969, "global_step": 328929, "epoch": 2718} {"train_loss": -42.894161224365234, "global_step": 328930, "epoch": 2718} {"train_loss": -42.98398971557617, "global_step": 328931, "epoch": 2718} {"train_loss": -43.50933837890625, "global_step": 328932, "epoch": 2718} {"train_loss": -43.098236083984375, "global_step": 328933, "epoch": 2718} {"train_loss": -42.65056228637695, "global_step": 328934, "epoch": 2718} {"train_loss": -42.7830924987793, "global_step": 328935, "epoch": 2718} {"train_loss": -43.5873908996582, "global_step": 328936, "epoch": 2718} {"train_loss": -43.86690139770508, "global_step": 328937, "epoch": 2718} {"train_loss": -43.164493560791016, "global_step": 328938, "epoch": 2718} {"train_loss": -43.66239547729492, "global_step": 328939, "epoch": 2718} {"train_loss": -42.662349700927734, "global_step": 328940, "epoch": 2718} {"train_loss": -42.624114990234375, "global_step": 328941, "epoch": 2718} {"train_loss": -43.33795928955078, "global_step": 328942, "epoch": 2718} {"train_loss": -43.610958099365234, "global_step": 328943, "epoch": 2718} {"train_loss": -43.157596588134766, "global_step": 328944, "epoch": 2718} {"train_loss": -43.01685333251953, "global_step": 328945, "epoch": 2718} {"train_loss": -43.31830596923828, "global_step": 328946, "epoch": 2718} {"train_loss": -43.16139602661133, "global_step": 328947, "epoch": 2718} {"train_loss": -43.568084716796875, "global_step": 328948, "epoch": 2718} {"train_loss": -42.670833587646484, "global_step": 328949, "epoch": 2718} {"train_loss": -43.62763214111328, "global_step": 328950, "epoch": 2718} {"train_loss": -42.82537078857422, "global_step": 328951, "epoch": 2718} {"train_loss": -43.947872161865234, "global_step": 328952, "epoch": 2718} {"train_loss": -43.64179611206055, "global_step": 328953, "epoch": 2718} {"train_loss": -44.18157958984375, "global_step": 328954, "epoch": 2718} {"train_loss": -42.978206634521484, "global_step": 328955, "epoch": 2718} {"train_loss": -43.20866012573242, "global_step": 328956, "epoch": 2718} {"train_loss": -43.815643310546875, "global_step": 328957, "epoch": 2718} {"train_loss": -43.140357971191406, "global_step": 328958, "epoch": 2718} {"train_loss": -43.67082595825195, "global_step": 328959, "epoch": 2718} {"train_loss": -43.930908203125, "global_step": 328960, "epoch": 2718} {"train_loss": -36.39939498901367, "global_step": 328961, "epoch": 2718} {"train_loss": -43.72840118408203, "global_step": 328962, "epoch": 2718} {"train_loss": -43.9965934753418, "global_step": 328963, "epoch": 2718} {"train_loss": -44.234169006347656, "global_step": 328964, "epoch": 2718} {"train_loss": -42.925445556640625, "global_step": 328965, "epoch": 2718} {"train_loss": -43.956722259521484, "global_step": 328966, "epoch": 2718} {"train_loss": -43.44388961791992, "global_step": 328967, "epoch": 2718} {"train_loss": -43.03382873535156, "global_step": 328968, "epoch": 2718} {"train_loss": -43.17197799682617, "global_step": 328969, "epoch": 2718} {"train_loss": -43.31398010253906, "global_step": 328970, "epoch": 2718} {"train_loss": -44.17934799194336, "global_step": 328971, "epoch": 2718} {"train_loss": -43.39365768432617, "global_step": 328972, "epoch": 2718} {"train_loss": -44.053646087646484, "global_step": 328973, "epoch": 2718} {"train_loss": -43.88136291503906, "global_step": 328974, "epoch": 2718} {"train_loss": -43.06573486328125, "global_step": 328975, "epoch": 2718} {"train_loss": -38.8294792175293, "global_step": 328976, "epoch": 2718} {"train_loss": -43.00929641723633, "global_step": 328977, "epoch": 2718} {"train_loss": -43.83069610595703, "global_step": 328978, "epoch": 2718} {"train_loss": -41.77264404296875, "global_step": 328979, "epoch": 2718} {"train_loss": -43.179481506347656, "global_step": 328980, "epoch": 2718} {"train_loss": -43.498714447021484, "global_step": 328981, "epoch": 2718} {"train_loss": -39.63013458251953, "global_step": 328982, "epoch": 2718} {"train_loss": -43.825923919677734, "global_step": 328983, "epoch": 2718} {"train_loss": -43.11298370361328, "global_step": 328984, "epoch": 2718} {"train_loss": -42.69596481323242, "global_step": 328985, "epoch": 2718} {"train_loss": -37.30434799194336, "global_step": 328986, "epoch": 2718} {"train_loss": -41.62392044067383, "global_step": 328987, "epoch": 2718} {"train_loss": -43.0942268371582, "global_step": 328988, "epoch": 2718} {"train_loss": -38.162593841552734, "global_step": 328989, "epoch": 2718} {"train_loss": -33.38969039916992, "global_step": 328990, "epoch": 2718} {"train_loss": -38.90877151489258, "global_step": 328991, "epoch": 2718} {"train_loss": -39.64613723754883, "global_step": 328992, "epoch": 2718} {"train_loss": -25.898950576782227, "global_step": 328993, "epoch": 2718} {"train_loss": -39.402828216552734, "global_step": 328994, "epoch": 2718} {"train_loss": -40.2019157409668, "global_step": 328995, "epoch": 2718} {"train_loss": -40.813995361328125, "global_step": 328996, "epoch": 2718} {"train_loss": -40.165802001953125, "global_step": 328997, "epoch": 2718} {"train_loss": -42.21667532487349, "global_step": 328998, "epoch": 2718, "val_loss": 2628191.75} {"train_loss": -40.38304901123047, "global_step": 328999, "epoch": 2719} {"train_loss": -37.490753173828125, "global_step": 329000, "epoch": 2719} {"train_loss": -37.4503059387207, "global_step": 329001, "epoch": 2719} {"train_loss": -39.98325729370117, "global_step": 329002, "epoch": 2719} {"train_loss": -41.1141242980957, "global_step": 329003, "epoch": 2719} {"train_loss": -34.191463470458984, "global_step": 329004, "epoch": 2719} {"train_loss": -36.82387924194336, "global_step": 329005, "epoch": 2719} {"train_loss": -39.86349868774414, "global_step": 329006, "epoch": 2719} {"train_loss": -33.989784240722656, "global_step": 329007, "epoch": 2719} {"train_loss": -38.601524353027344, "global_step": 329008, "epoch": 2719} {"train_loss": -38.865478515625, "global_step": 329009, "epoch": 2719} {"train_loss": -41.39828109741211, "global_step": 329010, "epoch": 2719} {"train_loss": -35.98741149902344, "global_step": 329011, "epoch": 2719} {"train_loss": -40.36147689819336, "global_step": 329012, "epoch": 2719} {"train_loss": -38.77888107299805, "global_step": 329013, "epoch": 2719} {"train_loss": -37.88945007324219, "global_step": 329014, "epoch": 2719} {"train_loss": -32.876644134521484, "global_step": 329015, "epoch": 2719} {"train_loss": -38.61562728881836, "global_step": 329016, "epoch": 2719} {"train_loss": -41.22673416137695, "global_step": 329017, "epoch": 2719} {"train_loss": -40.588966369628906, "global_step": 329018, "epoch": 2719} {"train_loss": -33.071502685546875, "global_step": 329019, "epoch": 2719} {"train_loss": -34.05184555053711, "global_step": 329020, "epoch": 2719} {"train_loss": -35.568397521972656, "global_step": 329021, "epoch": 2719} {"train_loss": -35.98072052001953, "global_step": 329022, "epoch": 2719} {"train_loss": -40.6248779296875, "global_step": 329023, "epoch": 2719} {"train_loss": -35.71482849121094, "global_step": 329024, "epoch": 2719} {"train_loss": -40.75980758666992, "global_step": 329025, "epoch": 2719} {"train_loss": -38.669189453125, "global_step": 329026, "epoch": 2719} {"train_loss": -40.88523864746094, "global_step": 329027, "epoch": 2719} {"train_loss": -40.89630126953125, "global_step": 329028, "epoch": 2719} {"train_loss": -40.3395881652832, "global_step": 329029, "epoch": 2719} {"train_loss": -39.65854263305664, "global_step": 329030, "epoch": 2719} {"train_loss": -41.01886749267578, "global_step": 329031, "epoch": 2719} {"train_loss": -38.96653366088867, "global_step": 329032, "epoch": 2719} {"train_loss": -41.66132736206055, "global_step": 329033, "epoch": 2719} {"train_loss": -41.3492431640625, "global_step": 329034, "epoch": 2719} {"train_loss": -40.145423889160156, "global_step": 329035, "epoch": 2719} {"train_loss": -40.852970123291016, "global_step": 329036, "epoch": 2719} {"train_loss": -41.751686096191406, "global_step": 329037, "epoch": 2719} {"train_loss": -40.29880142211914, "global_step": 329038, "epoch": 2719} {"train_loss": -39.787391662597656, "global_step": 329039, "epoch": 2719} {"train_loss": -41.656654357910156, "global_step": 329040, "epoch": 2719} {"train_loss": -41.62104034423828, "global_step": 329041, "epoch": 2719} {"train_loss": -40.660274505615234, "global_step": 329042, "epoch": 2719} {"train_loss": -40.69039535522461, "global_step": 329043, "epoch": 2719} {"train_loss": -41.34487533569336, "global_step": 329044, "epoch": 2719} {"train_loss": -41.196815490722656, "global_step": 329045, "epoch": 2719} {"train_loss": -38.948482513427734, "global_step": 329046, "epoch": 2719} {"train_loss": -41.76857376098633, "global_step": 329047, "epoch": 2719} {"train_loss": -41.35881423950195, "global_step": 329048, "epoch": 2719} {"train_loss": -42.35772705078125, "global_step": 329049, "epoch": 2719} {"train_loss": -41.9337158203125, "global_step": 329050, "epoch": 2719} {"train_loss": -41.51899719238281, "global_step": 329051, "epoch": 2719} {"train_loss": -38.96743392944336, "global_step": 329052, "epoch": 2719} {"train_loss": -41.91986846923828, "global_step": 329053, "epoch": 2719} {"train_loss": -41.526859283447266, "global_step": 329054, "epoch": 2719} {"train_loss": -41.27128601074219, "global_step": 329055, "epoch": 2719} {"train_loss": -42.16669845581055, "global_step": 329056, "epoch": 2719} {"train_loss": -41.755916595458984, "global_step": 329057, "epoch": 2719} {"train_loss": -41.181697845458984, "global_step": 329058, "epoch": 2719} {"train_loss": -41.159847259521484, "global_step": 329059, "epoch": 2719} {"train_loss": -40.85879135131836, "global_step": 329060, "epoch": 2719} {"train_loss": -42.13526153564453, "global_step": 329061, "epoch": 2719} {"train_loss": -41.54197311401367, "global_step": 329062, "epoch": 2719} {"train_loss": -42.25851058959961, "global_step": 329063, "epoch": 2719} {"train_loss": -41.44670486450195, "global_step": 329064, "epoch": 2719} {"train_loss": -42.414100646972656, "global_step": 329065, "epoch": 2719} {"train_loss": -42.46809768676758, "global_step": 329066, "epoch": 2719} {"train_loss": -42.796424865722656, "global_step": 329067, "epoch": 2719} {"train_loss": -42.39459228515625, "global_step": 329068, "epoch": 2719} {"train_loss": -41.99930953979492, "global_step": 329069, "epoch": 2719} {"train_loss": -42.487831115722656, "global_step": 329070, "epoch": 2719} {"train_loss": -42.25710678100586, "global_step": 329071, "epoch": 2719} {"train_loss": -42.44964599609375, "global_step": 329072, "epoch": 2719} {"train_loss": -42.551753997802734, "global_step": 329073, "epoch": 2719} {"train_loss": -41.784881591796875, "global_step": 329074, "epoch": 2719} {"train_loss": -42.17018127441406, "global_step": 329075, "epoch": 2719} {"train_loss": -42.935081481933594, "global_step": 329076, "epoch": 2719} {"train_loss": -43.069435119628906, "global_step": 329077, "epoch": 2719} {"train_loss": -42.58730697631836, "global_step": 329078, "epoch": 2719} {"train_loss": -43.03990936279297, "global_step": 329079, "epoch": 2719} {"train_loss": -43.07355499267578, "global_step": 329080, "epoch": 2719} {"train_loss": -42.40232467651367, "global_step": 329081, "epoch": 2719} {"train_loss": -41.95581817626953, "global_step": 329082, "epoch": 2719} {"train_loss": -43.26028823852539, "global_step": 329083, "epoch": 2719} {"train_loss": -42.68374252319336, "global_step": 329084, "epoch": 2719} {"train_loss": -42.5612678527832, "global_step": 329085, "epoch": 2719} {"train_loss": -42.95723342895508, "global_step": 329086, "epoch": 2719} {"train_loss": -42.89236068725586, "global_step": 329087, "epoch": 2719} {"train_loss": -42.894500732421875, "global_step": 329088, "epoch": 2719} {"train_loss": -42.72868347167969, "global_step": 329089, "epoch": 2719} {"train_loss": -43.22880172729492, "global_step": 329090, "epoch": 2719} {"train_loss": -43.06647872924805, "global_step": 329091, "epoch": 2719} {"train_loss": -43.08234405517578, "global_step": 329092, "epoch": 2719} {"train_loss": -42.86818313598633, "global_step": 329093, "epoch": 2719} {"train_loss": -43.735382080078125, "global_step": 329094, "epoch": 2719} {"train_loss": -41.83536911010742, "global_step": 329095, "epoch": 2719} {"train_loss": -43.184627532958984, "global_step": 329096, "epoch": 2719} {"train_loss": -41.89925765991211, "global_step": 329097, "epoch": 2719} {"train_loss": -42.84037399291992, "global_step": 329098, "epoch": 2719} {"train_loss": -43.45294952392578, "global_step": 329099, "epoch": 2719} {"train_loss": -42.900428771972656, "global_step": 329100, "epoch": 2719} {"train_loss": -42.67842102050781, "global_step": 329101, "epoch": 2719} {"train_loss": -43.42366409301758, "global_step": 329102, "epoch": 2719} {"train_loss": -43.61307907104492, "global_step": 329103, "epoch": 2719} {"train_loss": -42.13898468017578, "global_step": 329104, "epoch": 2719} {"train_loss": -43.246551513671875, "global_step": 329105, "epoch": 2719} {"train_loss": -43.539100646972656, "global_step": 329106, "epoch": 2719} {"train_loss": -43.377052307128906, "global_step": 329107, "epoch": 2719} {"train_loss": -43.60100173950195, "global_step": 329108, "epoch": 2719} {"train_loss": -43.369659423828125, "global_step": 329109, "epoch": 2719} {"train_loss": -43.45268630981445, "global_step": 329110, "epoch": 2719} {"train_loss": -44.24320602416992, "global_step": 329111, "epoch": 2719} {"train_loss": -42.95918655395508, "global_step": 329112, "epoch": 2719} {"train_loss": -43.84816360473633, "global_step": 329113, "epoch": 2719} {"train_loss": -44.07996368408203, "global_step": 329114, "epoch": 2719} {"train_loss": -43.653724670410156, "global_step": 329115, "epoch": 2719} {"train_loss": -43.982418060302734, "global_step": 329116, "epoch": 2719} {"train_loss": -43.598426818847656, "global_step": 329117, "epoch": 2719} {"train_loss": -43.698116302490234, "global_step": 329118, "epoch": 2719} {"train_loss": -41.20056051459194, "global_step": 329119, "epoch": 2719, "val_loss": 2547299.5} {"train_loss": -43.167362213134766, "global_step": 329120, "epoch": 2720} {"train_loss": -43.989898681640625, "global_step": 329121, "epoch": 2720} {"train_loss": -44.28920364379883, "global_step": 329122, "epoch": 2720} {"train_loss": -43.22282791137695, "global_step": 329123, "epoch": 2720} {"train_loss": -43.8922233581543, "global_step": 329124, "epoch": 2720} {"train_loss": -43.991207122802734, "global_step": 329125, "epoch": 2720} {"train_loss": -43.59882736206055, "global_step": 329126, "epoch": 2720} {"train_loss": -44.4173698425293, "global_step": 329127, "epoch": 2720} {"train_loss": -43.81096267700195, "global_step": 329128, "epoch": 2720} {"train_loss": -43.63386917114258, "global_step": 329129, "epoch": 2720} {"train_loss": -43.633819580078125, "global_step": 329130, "epoch": 2720} {"train_loss": -43.98675537109375, "global_step": 329131, "epoch": 2720} {"train_loss": -44.051605224609375, "global_step": 329132, "epoch": 2720} {"train_loss": -43.9358024597168, "global_step": 329133, "epoch": 2720} {"train_loss": -43.7836799621582, "global_step": 329134, "epoch": 2720} {"train_loss": -43.427772521972656, "global_step": 329135, "epoch": 2720} {"train_loss": -44.021480560302734, "global_step": 329136, "epoch": 2720} {"train_loss": -44.24251937866211, "global_step": 329137, "epoch": 2720} {"train_loss": -43.43345260620117, "global_step": 329138, "epoch": 2720} {"train_loss": -43.832088470458984, "global_step": 329139, "epoch": 2720} {"train_loss": -41.77263259887695, "global_step": 329140, "epoch": 2720} {"train_loss": -44.32944107055664, "global_step": 329141, "epoch": 2720} {"train_loss": -42.553855895996094, "global_step": 329142, "epoch": 2720} {"train_loss": -43.7001953125, "global_step": 329143, "epoch": 2720} {"train_loss": -43.49882507324219, "global_step": 329144, "epoch": 2720} {"train_loss": -44.22587966918945, "global_step": 329145, "epoch": 2720} {"train_loss": -44.36311721801758, "global_step": 329146, "epoch": 2720} {"train_loss": -44.47067642211914, "global_step": 329147, "epoch": 2720} {"train_loss": -44.11336135864258, "global_step": 329148, "epoch": 2720} {"train_loss": -43.855255126953125, "global_step": 329149, "epoch": 2720} {"train_loss": -43.26648712158203, "global_step": 329150, "epoch": 2720} {"train_loss": -44.10960388183594, "global_step": 329151, "epoch": 2720} {"train_loss": -43.69733810424805, "global_step": 329152, "epoch": 2720} {"train_loss": -41.301475524902344, "global_step": 329153, "epoch": 2720} {"train_loss": -43.6380729675293, "global_step": 329154, "epoch": 2720} {"train_loss": -43.44974899291992, "global_step": 329155, "epoch": 2720} {"train_loss": -43.82438278198242, "global_step": 329156, "epoch": 2720} {"train_loss": -43.16610336303711, "global_step": 329157, "epoch": 2720} {"train_loss": -40.94224166870117, "global_step": 329158, "epoch": 2720} {"train_loss": -42.69667434692383, "global_step": 329159, "epoch": 2720} {"train_loss": -43.108943939208984, "global_step": 329160, "epoch": 2720} {"train_loss": -42.31251907348633, "global_step": 329161, "epoch": 2720} {"train_loss": -41.82631301879883, "global_step": 329162, "epoch": 2720} {"train_loss": -42.20729064941406, "global_step": 329163, "epoch": 2720} {"train_loss": -41.432960510253906, "global_step": 329164, "epoch": 2720} {"train_loss": -39.34043502807617, "global_step": 329165, "epoch": 2720} {"train_loss": -36.849891662597656, "global_step": 329166, "epoch": 2720} {"train_loss": -42.07149887084961, "global_step": 329167, "epoch": 2720} {"train_loss": -37.4671745300293, "global_step": 329168, "epoch": 2720} {"train_loss": -31.905359268188477, "global_step": 329169, "epoch": 2720} {"train_loss": -29.336912155151367, "global_step": 329170, "epoch": 2720} {"train_loss": -34.18602752685547, "global_step": 329171, "epoch": 2720} {"train_loss": -34.479225158691406, "global_step": 329172, "epoch": 2720} {"train_loss": -32.39353942871094, "global_step": 329173, "epoch": 2720} {"train_loss": -37.23134994506836, "global_step": 329174, "epoch": 2720} {"train_loss": -35.838539123535156, "global_step": 329175, "epoch": 2720} {"train_loss": -37.282100677490234, "global_step": 329176, "epoch": 2720} {"train_loss": -38.226470947265625, "global_step": 329177, "epoch": 2720} {"train_loss": -36.147186279296875, "global_step": 329178, "epoch": 2720} {"train_loss": -37.67695236206055, "global_step": 329179, "epoch": 2720} {"train_loss": -40.0295524597168, "global_step": 329180, "epoch": 2720} {"train_loss": -38.34739303588867, "global_step": 329181, "epoch": 2720} {"train_loss": -40.04920959472656, "global_step": 329182, "epoch": 2720} {"train_loss": -40.63627243041992, "global_step": 329183, "epoch": 2720} {"train_loss": -40.05141830444336, "global_step": 329184, "epoch": 2720} {"train_loss": -41.358367919921875, "global_step": 329185, "epoch": 2720} {"train_loss": -41.69155502319336, "global_step": 329186, "epoch": 2720} {"train_loss": -40.770774841308594, "global_step": 329187, "epoch": 2720} {"train_loss": -40.86420822143555, "global_step": 329188, "epoch": 2720} {"train_loss": -40.07004928588867, "global_step": 329189, "epoch": 2720} {"train_loss": -41.43586349487305, "global_step": 329190, "epoch": 2720} {"train_loss": -41.45295715332031, "global_step": 329191, "epoch": 2720} {"train_loss": -41.47709274291992, "global_step": 329192, "epoch": 2720} {"train_loss": -41.78410720825195, "global_step": 329193, "epoch": 2720} {"train_loss": -41.917152404785156, "global_step": 329194, "epoch": 2720} {"train_loss": -41.013458251953125, "global_step": 329195, "epoch": 2720} {"train_loss": -41.568023681640625, "global_step": 329196, "epoch": 2720} {"train_loss": -42.07666015625, "global_step": 329197, "epoch": 2720} {"train_loss": -41.74896240234375, "global_step": 329198, "epoch": 2720} {"train_loss": -41.814544677734375, "global_step": 329199, "epoch": 2720} {"train_loss": -42.28950119018555, "global_step": 329200, "epoch": 2720} {"train_loss": -42.69752883911133, "global_step": 329201, "epoch": 2720} {"train_loss": -42.719417572021484, "global_step": 329202, "epoch": 2720} {"train_loss": -42.44444274902344, "global_step": 329203, "epoch": 2720} {"train_loss": -42.33917999267578, "global_step": 329204, "epoch": 2720} {"train_loss": -42.540931701660156, "global_step": 329205, "epoch": 2720} {"train_loss": -42.2121467590332, "global_step": 329206, "epoch": 2720} {"train_loss": -42.0297737121582, "global_step": 329207, "epoch": 2720} {"train_loss": -42.42338180541992, "global_step": 329208, "epoch": 2720} {"train_loss": -43.15104293823242, "global_step": 329209, "epoch": 2720} {"train_loss": -41.787086486816406, "global_step": 329210, "epoch": 2720} {"train_loss": -42.715213775634766, "global_step": 329211, "epoch": 2720} {"train_loss": -42.940303802490234, "global_step": 329212, "epoch": 2720} {"train_loss": -42.914794921875, "global_step": 329213, "epoch": 2720} {"train_loss": -43.03388214111328, "global_step": 329214, "epoch": 2720} {"train_loss": -43.006832122802734, "global_step": 329215, "epoch": 2720} {"train_loss": -42.613128662109375, "global_step": 329216, "epoch": 2720} {"train_loss": -42.94093704223633, "global_step": 329217, "epoch": 2720} {"train_loss": -42.9613151550293, "global_step": 329218, "epoch": 2720} {"train_loss": -43.719482421875, "global_step": 329219, "epoch": 2720} {"train_loss": -43.54768753051758, "global_step": 329220, "epoch": 2720} {"train_loss": -43.33122634887695, "global_step": 329221, "epoch": 2720} {"train_loss": -43.662353515625, "global_step": 329222, "epoch": 2720} {"train_loss": -43.31679916381836, "global_step": 329223, "epoch": 2720} {"train_loss": -43.228599548339844, "global_step": 329224, "epoch": 2720} {"train_loss": -42.90392303466797, "global_step": 329225, "epoch": 2720} {"train_loss": -43.7038688659668, "global_step": 329226, "epoch": 2720} {"train_loss": -42.859344482421875, "global_step": 329227, "epoch": 2720} {"train_loss": -43.04151916503906, "global_step": 329228, "epoch": 2720} {"train_loss": -43.958858489990234, "global_step": 329229, "epoch": 2720} {"train_loss": -43.655967712402344, "global_step": 329230, "epoch": 2720} {"train_loss": -43.3549919128418, "global_step": 329231, "epoch": 2720} {"train_loss": -43.92729568481445, "global_step": 329232, "epoch": 2720} {"train_loss": -43.71894073486328, "global_step": 329233, "epoch": 2720} {"train_loss": -44.111366271972656, "global_step": 329234, "epoch": 2720} {"train_loss": -43.18816375732422, "global_step": 329235, "epoch": 2720} {"train_loss": -43.88950729370117, "global_step": 329236, "epoch": 2720} {"train_loss": -43.88496017456055, "global_step": 329237, "epoch": 2720} {"train_loss": -43.9898796081543, "global_step": 329238, "epoch": 2720} {"train_loss": -43.299964904785156, "global_step": 329239, "epoch": 2720} {"train_loss": -42.00140718192108, "global_step": 329240, "epoch": 2720, "val_loss": 2641963.75} {"train_loss": -43.7957878112793, "global_step": 329241, "epoch": 2721} {"train_loss": -44.07029724121094, "global_step": 329242, "epoch": 2721} {"train_loss": -43.97882843017578, "global_step": 329243, "epoch": 2721} {"train_loss": -44.05100631713867, "global_step": 329244, "epoch": 2721} {"train_loss": -44.1579704284668, "global_step": 329245, "epoch": 2721} {"train_loss": -44.00245666503906, "global_step": 329246, "epoch": 2721} {"train_loss": -44.068389892578125, "global_step": 329247, "epoch": 2721} {"train_loss": -43.756221771240234, "global_step": 329248, "epoch": 2721} {"train_loss": -43.7818489074707, "global_step": 329249, "epoch": 2721} {"train_loss": -44.19309616088867, "global_step": 329250, "epoch": 2721} {"train_loss": -44.05512237548828, "global_step": 329251, "epoch": 2721} {"train_loss": -43.76722717285156, "global_step": 329252, "epoch": 2721} {"train_loss": -44.37250900268555, "global_step": 329253, "epoch": 2721} {"train_loss": -44.23046875, "global_step": 329254, "epoch": 2721} {"train_loss": -44.30138397216797, "global_step": 329255, "epoch": 2721} {"train_loss": -44.57379150390625, "global_step": 329256, "epoch": 2721} {"train_loss": -44.24010467529297, "global_step": 329257, "epoch": 2721} {"train_loss": -44.52152633666992, "global_step": 329258, "epoch": 2721} {"train_loss": -43.59212875366211, "global_step": 329259, "epoch": 2721} {"train_loss": -44.142555236816406, "global_step": 329260, "epoch": 2721} {"train_loss": -44.32206344604492, "global_step": 329261, "epoch": 2721} {"train_loss": -44.199806213378906, "global_step": 329262, "epoch": 2721} {"train_loss": -44.50495147705078, "global_step": 329263, "epoch": 2721} {"train_loss": -44.39934158325195, "global_step": 329264, "epoch": 2721} {"train_loss": -44.49442672729492, "global_step": 329265, "epoch": 2721} {"train_loss": -44.360084533691406, "global_step": 329266, "epoch": 2721} {"train_loss": -44.40108108520508, "global_step": 329267, "epoch": 2721} {"train_loss": -44.440467834472656, "global_step": 329268, "epoch": 2721} {"train_loss": -44.7529411315918, "global_step": 329269, "epoch": 2721} {"train_loss": -44.21028137207031, "global_step": 329270, "epoch": 2721} {"train_loss": -44.16997528076172, "global_step": 329271, "epoch": 2721} {"train_loss": -43.85592269897461, "global_step": 329272, "epoch": 2721} {"train_loss": -44.51826095581055, "global_step": 329273, "epoch": 2721} {"train_loss": -44.74393844604492, "global_step": 329274, "epoch": 2721} {"train_loss": -44.81425094604492, "global_step": 329275, "epoch": 2721} {"train_loss": -44.47634506225586, "global_step": 329276, "epoch": 2721} {"train_loss": -44.021949768066406, "global_step": 329277, "epoch": 2721} {"train_loss": -43.83747100830078, "global_step": 329278, "epoch": 2721} {"train_loss": -44.865516662597656, "global_step": 329279, "epoch": 2721} {"train_loss": -44.626583099365234, "global_step": 329280, "epoch": 2721} {"train_loss": -44.91672897338867, "global_step": 329281, "epoch": 2721} {"train_loss": -44.566078186035156, "global_step": 329282, "epoch": 2721} {"train_loss": -43.71494674682617, "global_step": 329283, "epoch": 2721} {"train_loss": -44.355838775634766, "global_step": 329284, "epoch": 2721} {"train_loss": -44.6692008972168, "global_step": 329285, "epoch": 2721} {"train_loss": -44.351478576660156, "global_step": 329286, "epoch": 2721} {"train_loss": -44.64008712768555, "global_step": 329287, "epoch": 2721} {"train_loss": -44.20721435546875, "global_step": 329288, "epoch": 2721} {"train_loss": -44.11393737792969, "global_step": 329289, "epoch": 2721} {"train_loss": -43.33866500854492, "global_step": 329290, "epoch": 2721} {"train_loss": -44.391414642333984, "global_step": 329291, "epoch": 2721} {"train_loss": -44.20521926879883, "global_step": 329292, "epoch": 2721} {"train_loss": -44.029632568359375, "global_step": 329293, "epoch": 2721} {"train_loss": -42.880958557128906, "global_step": 329294, "epoch": 2721} {"train_loss": -42.56233596801758, "global_step": 329295, "epoch": 2721} {"train_loss": -43.69391632080078, "global_step": 329296, "epoch": 2721} {"train_loss": -44.42135238647461, "global_step": 329297, "epoch": 2721} {"train_loss": -43.98610305786133, "global_step": 329298, "epoch": 2721} {"train_loss": -43.341461181640625, "global_step": 329299, "epoch": 2721} {"train_loss": -42.97872543334961, "global_step": 329300, "epoch": 2721} {"train_loss": -42.990760803222656, "global_step": 329301, "epoch": 2721} {"train_loss": -43.583431243896484, "global_step": 329302, "epoch": 2721} {"train_loss": -43.74795150756836, "global_step": 329303, "epoch": 2721} {"train_loss": -43.91828536987305, "global_step": 329304, "epoch": 2721} {"train_loss": -43.2850456237793, "global_step": 329305, "epoch": 2721} {"train_loss": -42.894386291503906, "global_step": 329306, "epoch": 2721} {"train_loss": -42.124717712402344, "global_step": 329307, "epoch": 2721} {"train_loss": -43.73400115966797, "global_step": 329308, "epoch": 2721} {"train_loss": -42.10588836669922, "global_step": 329309, "epoch": 2721} {"train_loss": -43.15258026123047, "global_step": 329310, "epoch": 2721} {"train_loss": -43.29303741455078, "global_step": 329311, "epoch": 2721} {"train_loss": -42.4583854675293, "global_step": 329312, "epoch": 2721} {"train_loss": -42.69558334350586, "global_step": 329313, "epoch": 2721} {"train_loss": -41.717742919921875, "global_step": 329314, "epoch": 2721} {"train_loss": -41.82234191894531, "global_step": 329315, "epoch": 2721} {"train_loss": -39.85203552246094, "global_step": 329316, "epoch": 2721} {"train_loss": -39.06132125854492, "global_step": 329317, "epoch": 2721} {"train_loss": -42.08993148803711, "global_step": 329318, "epoch": 2721} {"train_loss": -42.56410598754883, "global_step": 329319, "epoch": 2721} {"train_loss": -40.27008056640625, "global_step": 329320, "epoch": 2721} {"train_loss": -39.09658432006836, "global_step": 329321, "epoch": 2721} {"train_loss": -41.67521286010742, "global_step": 329322, "epoch": 2721} {"train_loss": -41.83664321899414, "global_step": 329323, "epoch": 2721} {"train_loss": -38.160457611083984, "global_step": 329324, "epoch": 2721} {"train_loss": -40.13749313354492, "global_step": 329325, "epoch": 2721} {"train_loss": -41.42951202392578, "global_step": 329326, "epoch": 2721} {"train_loss": -41.100528717041016, "global_step": 329327, "epoch": 2721} {"train_loss": -40.59178161621094, "global_step": 329328, "epoch": 2721} {"train_loss": -42.2493896484375, "global_step": 329329, "epoch": 2721} {"train_loss": -41.912105560302734, "global_step": 329330, "epoch": 2721} {"train_loss": -42.04537582397461, "global_step": 329331, "epoch": 2721} {"train_loss": -41.39957809448242, "global_step": 329332, "epoch": 2721} {"train_loss": -42.3808479309082, "global_step": 329333, "epoch": 2721} {"train_loss": -41.34952926635742, "global_step": 329334, "epoch": 2721} {"train_loss": -41.41110610961914, "global_step": 329335, "epoch": 2721} {"train_loss": -41.1510009765625, "global_step": 329336, "epoch": 2721} {"train_loss": -43.4075927734375, "global_step": 329337, "epoch": 2721} {"train_loss": -40.74968719482422, "global_step": 329338, "epoch": 2721} {"train_loss": -42.71014404296875, "global_step": 329339, "epoch": 2721} {"train_loss": -40.92898178100586, "global_step": 329340, "epoch": 2721} {"train_loss": -41.90345001220703, "global_step": 329341, "epoch": 2721} {"train_loss": -42.67643356323242, "global_step": 329342, "epoch": 2721} {"train_loss": -41.93791961669922, "global_step": 329343, "epoch": 2721} {"train_loss": -42.22381591796875, "global_step": 329344, "epoch": 2721} {"train_loss": -41.446353912353516, "global_step": 329345, "epoch": 2721} {"train_loss": -41.900203704833984, "global_step": 329346, "epoch": 2721} {"train_loss": -41.58148956298828, "global_step": 329347, "epoch": 2721} {"train_loss": -42.26835250854492, "global_step": 329348, "epoch": 2721} {"train_loss": -42.605587005615234, "global_step": 329349, "epoch": 2721} {"train_loss": -42.982364654541016, "global_step": 329350, "epoch": 2721} {"train_loss": -42.381187438964844, "global_step": 329351, "epoch": 2721} {"train_loss": -43.22841262817383, "global_step": 329352, "epoch": 2721} {"train_loss": -42.44622039794922, "global_step": 329353, "epoch": 2721} {"train_loss": -43.00239181518555, "global_step": 329354, "epoch": 2721} {"train_loss": -42.67808532714844, "global_step": 329355, "epoch": 2721} {"train_loss": -43.06313705444336, "global_step": 329356, "epoch": 2721} {"train_loss": -42.75565719604492, "global_step": 329357, "epoch": 2721} {"train_loss": -43.17680740356445, "global_step": 329358, "epoch": 2721} {"train_loss": -43.20574951171875, "global_step": 329359, "epoch": 2721} {"train_loss": -43.1447639465332, "global_step": 329360, "epoch": 2721} {"train_loss": -43.10592260439534, "global_step": 329361, "epoch": 2721, "val_loss": 2637047.75} {"train_loss": -42.68119430541992, "global_step": 329362, "epoch": 2722} {"train_loss": -43.04051208496094, "global_step": 329363, "epoch": 2722} {"train_loss": -43.15325927734375, "global_step": 329364, "epoch": 2722} {"train_loss": -43.72089767456055, "global_step": 329365, "epoch": 2722} {"train_loss": -43.30851364135742, "global_step": 329366, "epoch": 2722} {"train_loss": -43.275630950927734, "global_step": 329367, "epoch": 2722} {"train_loss": -43.99695587158203, "global_step": 329368, "epoch": 2722} {"train_loss": -43.788997650146484, "global_step": 329369, "epoch": 2722} {"train_loss": -43.662803649902344, "global_step": 329370, "epoch": 2722} {"train_loss": -44.3226432800293, "global_step": 329371, "epoch": 2722} {"train_loss": -43.80047607421875, "global_step": 329372, "epoch": 2722} {"train_loss": -43.894344329833984, "global_step": 329373, "epoch": 2722} {"train_loss": -44.17112731933594, "global_step": 329374, "epoch": 2722} {"train_loss": -43.582637786865234, "global_step": 329375, "epoch": 2722} {"train_loss": -43.905052185058594, "global_step": 329376, "epoch": 2722} {"train_loss": -43.589378356933594, "global_step": 329377, "epoch": 2722} {"train_loss": -43.69887161254883, "global_step": 329378, "epoch": 2722} {"train_loss": -44.203529357910156, "global_step": 329379, "epoch": 2722} {"train_loss": -43.978240966796875, "global_step": 329380, "epoch": 2722} {"train_loss": -44.296119689941406, "global_step": 329381, "epoch": 2722} {"train_loss": -44.018856048583984, "global_step": 329382, "epoch": 2722} {"train_loss": -43.9199104309082, "global_step": 329383, "epoch": 2722} {"train_loss": -44.524383544921875, "global_step": 329384, "epoch": 2722} {"train_loss": -44.09273910522461, "global_step": 329385, "epoch": 2722} {"train_loss": -44.2708740234375, "global_step": 329386, "epoch": 2722} {"train_loss": -44.2691764831543, "global_step": 329387, "epoch": 2722} {"train_loss": -43.67605209350586, "global_step": 329388, "epoch": 2722} {"train_loss": -44.4888801574707, "global_step": 329389, "epoch": 2722} {"train_loss": -44.58268356323242, "global_step": 329390, "epoch": 2722} {"train_loss": -44.5073127746582, "global_step": 329391, "epoch": 2722} {"train_loss": -44.225135803222656, "global_step": 329392, "epoch": 2722} {"train_loss": -43.92701721191406, "global_step": 329393, "epoch": 2722} {"train_loss": -44.72625732421875, "global_step": 329394, "epoch": 2722} {"train_loss": -44.821876525878906, "global_step": 329395, "epoch": 2722} {"train_loss": -44.27614212036133, "global_step": 329396, "epoch": 2722} {"train_loss": -44.19492721557617, "global_step": 329397, "epoch": 2722} {"train_loss": -44.92948532104492, "global_step": 329398, "epoch": 2722} {"train_loss": -43.638343811035156, "global_step": 329399, "epoch": 2722} {"train_loss": -44.30121612548828, "global_step": 329400, "epoch": 2722} {"train_loss": -44.205318450927734, "global_step": 329401, "epoch": 2722} {"train_loss": -45.05773162841797, "global_step": 329402, "epoch": 2722} {"train_loss": -44.430389404296875, "global_step": 329403, "epoch": 2722} {"train_loss": -44.664405822753906, "global_step": 329404, "epoch": 2722} {"train_loss": -44.2874870300293, "global_step": 329405, "epoch": 2722} {"train_loss": -43.03976058959961, "global_step": 329406, "epoch": 2722} {"train_loss": -44.6783332824707, "global_step": 329407, "epoch": 2722} {"train_loss": -41.32024383544922, "global_step": 329408, "epoch": 2722} {"train_loss": -43.89054489135742, "global_step": 329409, "epoch": 2722} {"train_loss": -43.17380905151367, "global_step": 329410, "epoch": 2722} {"train_loss": -43.79449462890625, "global_step": 329411, "epoch": 2722} {"train_loss": -44.33805847167969, "global_step": 329412, "epoch": 2722} {"train_loss": -43.63857650756836, "global_step": 329413, "epoch": 2722} {"train_loss": -41.606842041015625, "global_step": 329414, "epoch": 2722} {"train_loss": -43.762611389160156, "global_step": 329415, "epoch": 2722} {"train_loss": -41.22553634643555, "global_step": 329416, "epoch": 2722} {"train_loss": -43.009521484375, "global_step": 329417, "epoch": 2722} {"train_loss": -40.30329513549805, "global_step": 329418, "epoch": 2722} {"train_loss": -40.66901779174805, "global_step": 329419, "epoch": 2722} {"train_loss": -41.69428253173828, "global_step": 329420, "epoch": 2722} {"train_loss": -44.39618682861328, "global_step": 329421, "epoch": 2722} {"train_loss": -42.91987609863281, "global_step": 329422, "epoch": 2722} {"train_loss": -42.82863235473633, "global_step": 329423, "epoch": 2722} {"train_loss": -43.79264450073242, "global_step": 329424, "epoch": 2722} {"train_loss": -42.75126266479492, "global_step": 329425, "epoch": 2722} {"train_loss": -42.67380905151367, "global_step": 329426, "epoch": 2722} {"train_loss": -43.597206115722656, "global_step": 329427, "epoch": 2722} {"train_loss": -43.506954193115234, "global_step": 329428, "epoch": 2722} {"train_loss": -42.69222640991211, "global_step": 329429, "epoch": 2722} {"train_loss": -43.56071090698242, "global_step": 329430, "epoch": 2722} {"train_loss": -42.45985794067383, "global_step": 329431, "epoch": 2722} {"train_loss": -43.687496185302734, "global_step": 329432, "epoch": 2722} {"train_loss": -42.05757522583008, "global_step": 329433, "epoch": 2722} {"train_loss": -42.007144927978516, "global_step": 329434, "epoch": 2722} {"train_loss": -42.77804183959961, "global_step": 329435, "epoch": 2722} {"train_loss": -44.08525848388672, "global_step": 329436, "epoch": 2722} {"train_loss": -43.944725036621094, "global_step": 329437, "epoch": 2722} {"train_loss": -44.112220764160156, "global_step": 329438, "epoch": 2722} {"train_loss": -43.456600189208984, "global_step": 329439, "epoch": 2722} {"train_loss": -43.15340042114258, "global_step": 329440, "epoch": 2722} {"train_loss": -43.05911636352539, "global_step": 329441, "epoch": 2722} {"train_loss": -44.064476013183594, "global_step": 329442, "epoch": 2722} {"train_loss": -43.49055099487305, "global_step": 329443, "epoch": 2722} {"train_loss": -43.62730026245117, "global_step": 329444, "epoch": 2722} {"train_loss": -43.323036193847656, "global_step": 329445, "epoch": 2722} {"train_loss": -43.58824157714844, "global_step": 329446, "epoch": 2722} {"train_loss": -43.62147903442383, "global_step": 329447, "epoch": 2722} {"train_loss": -42.7684440612793, "global_step": 329448, "epoch": 2722} {"train_loss": -43.4209098815918, "global_step": 329449, "epoch": 2722} {"train_loss": -42.89639663696289, "global_step": 329450, "epoch": 2722} {"train_loss": -41.12933349609375, "global_step": 329451, "epoch": 2722} {"train_loss": -43.40594482421875, "global_step": 329452, "epoch": 2722} {"train_loss": -42.00088882446289, "global_step": 329453, "epoch": 2722} {"train_loss": -43.329708099365234, "global_step": 329454, "epoch": 2722} {"train_loss": -43.705535888671875, "global_step": 329455, "epoch": 2722} {"train_loss": -43.150856018066406, "global_step": 329456, "epoch": 2722} {"train_loss": -44.4342155456543, "global_step": 329457, "epoch": 2722} {"train_loss": -42.81468963623047, "global_step": 329458, "epoch": 2722} {"train_loss": -42.46468734741211, "global_step": 329459, "epoch": 2722} {"train_loss": -43.705745697021484, "global_step": 329460, "epoch": 2722} {"train_loss": -43.67794418334961, "global_step": 329461, "epoch": 2722} {"train_loss": -42.94074630737305, "global_step": 329462, "epoch": 2722} {"train_loss": -44.340633392333984, "global_step": 329463, "epoch": 2722} {"train_loss": -43.473628997802734, "global_step": 329464, "epoch": 2722} {"train_loss": -44.11927032470703, "global_step": 329465, "epoch": 2722} {"train_loss": -44.10466003417969, "global_step": 329466, "epoch": 2722} {"train_loss": -43.42866897583008, "global_step": 329467, "epoch": 2722} {"train_loss": -44.22343063354492, "global_step": 329468, "epoch": 2722} {"train_loss": -44.24787521362305, "global_step": 329469, "epoch": 2722} {"train_loss": -43.445980072021484, "global_step": 329470, "epoch": 2722} {"train_loss": -44.42509841918945, "global_step": 329471, "epoch": 2722} {"train_loss": -44.096710205078125, "global_step": 329472, "epoch": 2722} {"train_loss": -44.1330680847168, "global_step": 329473, "epoch": 2722} {"train_loss": -43.53896713256836, "global_step": 329474, "epoch": 2722} {"train_loss": -44.373863220214844, "global_step": 329475, "epoch": 2722} {"train_loss": -44.92051696777344, "global_step": 329476, "epoch": 2722} {"train_loss": -44.10133743286133, "global_step": 329477, "epoch": 2722} {"train_loss": -43.979732513427734, "global_step": 329478, "epoch": 2722} {"train_loss": -44.2548828125, "global_step": 329479, "epoch": 2722} {"train_loss": -44.08596420288086, "global_step": 329480, "epoch": 2722} {"train_loss": -43.55006790161133, "global_step": 329481, "epoch": 2722} {"train_loss": -43.58150091250081, "global_step": 329482, "epoch": 2722, "val_loss": 2663729.25} {"train_loss": -44.06026840209961, "global_step": 329483, "epoch": 2723} {"train_loss": -44.53852462768555, "global_step": 329484, "epoch": 2723} {"train_loss": -44.1922607421875, "global_step": 329485, "epoch": 2723} {"train_loss": -43.745216369628906, "global_step": 329486, "epoch": 2723} {"train_loss": -44.359432220458984, "global_step": 329487, "epoch": 2723} {"train_loss": -43.90850067138672, "global_step": 329488, "epoch": 2723} {"train_loss": -44.05317687988281, "global_step": 329489, "epoch": 2723} {"train_loss": -44.1781120300293, "global_step": 329490, "epoch": 2723} {"train_loss": -42.52479934692383, "global_step": 329491, "epoch": 2723} {"train_loss": -43.51862335205078, "global_step": 329492, "epoch": 2723} {"train_loss": -43.42715072631836, "global_step": 329493, "epoch": 2723} {"train_loss": -42.745391845703125, "global_step": 329494, "epoch": 2723} {"train_loss": -44.110965728759766, "global_step": 329495, "epoch": 2723} {"train_loss": -43.57935333251953, "global_step": 329496, "epoch": 2723} {"train_loss": -42.31955337524414, "global_step": 329497, "epoch": 2723} {"train_loss": -42.96403503417969, "global_step": 329498, "epoch": 2723} {"train_loss": -42.91786193847656, "global_step": 329499, "epoch": 2723} {"train_loss": -42.66547393798828, "global_step": 329500, "epoch": 2723} {"train_loss": -43.51506423950195, "global_step": 329501, "epoch": 2723} {"train_loss": -42.92193603515625, "global_step": 329502, "epoch": 2723} {"train_loss": -43.236419677734375, "global_step": 329503, "epoch": 2723} {"train_loss": -40.17563247680664, "global_step": 329504, "epoch": 2723} {"train_loss": -43.067745208740234, "global_step": 329505, "epoch": 2723} {"train_loss": -42.4795036315918, "global_step": 329506, "epoch": 2723} {"train_loss": -41.9090690612793, "global_step": 329507, "epoch": 2723} {"train_loss": -43.541812896728516, "global_step": 329508, "epoch": 2723} {"train_loss": -43.132503509521484, "global_step": 329509, "epoch": 2723} {"train_loss": -42.672725677490234, "global_step": 329510, "epoch": 2723} {"train_loss": -41.365657806396484, "global_step": 329511, "epoch": 2723} {"train_loss": -43.38261413574219, "global_step": 329512, "epoch": 2723} {"train_loss": -42.505855560302734, "global_step": 329513, "epoch": 2723} {"train_loss": -44.33419418334961, "global_step": 329514, "epoch": 2723} {"train_loss": -43.748023986816406, "global_step": 329515, "epoch": 2723} {"train_loss": -42.97086715698242, "global_step": 329516, "epoch": 2723} {"train_loss": -41.90644454956055, "global_step": 329517, "epoch": 2723} {"train_loss": -43.423736572265625, "global_step": 329518, "epoch": 2723} {"train_loss": -43.55636215209961, "global_step": 329519, "epoch": 2723} {"train_loss": -43.59572982788086, "global_step": 329520, "epoch": 2723} {"train_loss": -43.7672119140625, "global_step": 329521, "epoch": 2723} {"train_loss": -43.38849639892578, "global_step": 329522, "epoch": 2723} {"train_loss": -43.64964294433594, "global_step": 329523, "epoch": 2723} {"train_loss": -43.18092727661133, "global_step": 329524, "epoch": 2723} {"train_loss": -41.82221603393555, "global_step": 329525, "epoch": 2723} {"train_loss": -42.937713623046875, "global_step": 329526, "epoch": 2723} {"train_loss": -42.955039978027344, "global_step": 329527, "epoch": 2723} {"train_loss": -42.08332443237305, "global_step": 329528, "epoch": 2723} {"train_loss": -42.06257629394531, "global_step": 329529, "epoch": 2723} {"train_loss": -40.807613372802734, "global_step": 329530, "epoch": 2723} {"train_loss": -41.4066276550293, "global_step": 329531, "epoch": 2723} {"train_loss": -42.24172592163086, "global_step": 329532, "epoch": 2723} {"train_loss": -41.07768249511719, "global_step": 329533, "epoch": 2723} {"train_loss": -38.22141647338867, "global_step": 329534, "epoch": 2723} {"train_loss": -39.173423767089844, "global_step": 329535, "epoch": 2723} {"train_loss": -40.405311584472656, "global_step": 329536, "epoch": 2723} {"train_loss": -38.87620162963867, "global_step": 329537, "epoch": 2723} {"train_loss": -39.837032318115234, "global_step": 329538, "epoch": 2723} {"train_loss": -38.68842697143555, "global_step": 329539, "epoch": 2723} {"train_loss": -39.4130973815918, "global_step": 329540, "epoch": 2723} {"train_loss": -40.085533142089844, "global_step": 329541, "epoch": 2723} {"train_loss": -37.3349609375, "global_step": 329542, "epoch": 2723} {"train_loss": -37.44755172729492, "global_step": 329543, "epoch": 2723} {"train_loss": -39.94599533081055, "global_step": 329544, "epoch": 2723} {"train_loss": -31.368886947631836, "global_step": 329545, "epoch": 2723} {"train_loss": -40.359825134277344, "global_step": 329546, "epoch": 2723} {"train_loss": -39.642391204833984, "global_step": 329547, "epoch": 2723} {"train_loss": -38.5349235534668, "global_step": 329548, "epoch": 2723} {"train_loss": -37.03611755371094, "global_step": 329549, "epoch": 2723} {"train_loss": -37.02151107788086, "global_step": 329550, "epoch": 2723} {"train_loss": -32.9691276550293, "global_step": 329551, "epoch": 2723} {"train_loss": -39.457759857177734, "global_step": 329552, "epoch": 2723} {"train_loss": -40.4681510925293, "global_step": 329553, "epoch": 2723} {"train_loss": -41.061466217041016, "global_step": 329554, "epoch": 2723} {"train_loss": -41.268035888671875, "global_step": 329555, "epoch": 2723} {"train_loss": -41.69489669799805, "global_step": 329556, "epoch": 2723} {"train_loss": -41.33747482299805, "global_step": 329557, "epoch": 2723} {"train_loss": -38.55652618408203, "global_step": 329558, "epoch": 2723} {"train_loss": -41.03550338745117, "global_step": 329559, "epoch": 2723} {"train_loss": -37.449127197265625, "global_step": 329560, "epoch": 2723} {"train_loss": -40.33180618286133, "global_step": 329561, "epoch": 2723} {"train_loss": -41.20199203491211, "global_step": 329562, "epoch": 2723} {"train_loss": -41.13920974731445, "global_step": 329563, "epoch": 2723} {"train_loss": -37.70176315307617, "global_step": 329564, "epoch": 2723} {"train_loss": -38.51132583618164, "global_step": 329565, "epoch": 2723} {"train_loss": -40.69922637939453, "global_step": 329566, "epoch": 2723} {"train_loss": -40.64923095703125, "global_step": 329567, "epoch": 2723} {"train_loss": -40.85427474975586, "global_step": 329568, "epoch": 2723} {"train_loss": -40.332855224609375, "global_step": 329569, "epoch": 2723} {"train_loss": -40.73644256591797, "global_step": 329570, "epoch": 2723} {"train_loss": -41.582061767578125, "global_step": 329571, "epoch": 2723} {"train_loss": -39.77622604370117, "global_step": 329572, "epoch": 2723} {"train_loss": -41.37959671020508, "global_step": 329573, "epoch": 2723} {"train_loss": -40.951988220214844, "global_step": 329574, "epoch": 2723} {"train_loss": -39.321468353271484, "global_step": 329575, "epoch": 2723} {"train_loss": -39.76560974121094, "global_step": 329576, "epoch": 2723} {"train_loss": -42.20905685424805, "global_step": 329577, "epoch": 2723} {"train_loss": -39.87765121459961, "global_step": 329578, "epoch": 2723} {"train_loss": -42.38119125366211, "global_step": 329579, "epoch": 2723} {"train_loss": -42.36880111694336, "global_step": 329580, "epoch": 2723} {"train_loss": -41.248046875, "global_step": 329581, "epoch": 2723} {"train_loss": -39.3254508972168, "global_step": 329582, "epoch": 2723} {"train_loss": -42.002933502197266, "global_step": 329583, "epoch": 2723} {"train_loss": -41.41666793823242, "global_step": 329584, "epoch": 2723} {"train_loss": -42.32098388671875, "global_step": 329585, "epoch": 2723} {"train_loss": -40.991302490234375, "global_step": 329586, "epoch": 2723} {"train_loss": -41.24626159667969, "global_step": 329587, "epoch": 2723} {"train_loss": -42.87470245361328, "global_step": 329588, "epoch": 2723} {"train_loss": -42.5439338684082, "global_step": 329589, "epoch": 2723} {"train_loss": -42.927860260009766, "global_step": 329590, "epoch": 2723} {"train_loss": -42.80120849609375, "global_step": 329591, "epoch": 2723} {"train_loss": -42.275760650634766, "global_step": 329592, "epoch": 2723} {"train_loss": -42.5877685546875, "global_step": 329593, "epoch": 2723} {"train_loss": -41.502498626708984, "global_step": 329594, "epoch": 2723} {"train_loss": -42.470497131347656, "global_step": 329595, "epoch": 2723} {"train_loss": -41.25019073486328, "global_step": 329596, "epoch": 2723} {"train_loss": -42.25485610961914, "global_step": 329597, "epoch": 2723} {"train_loss": -43.24964141845703, "global_step": 329598, "epoch": 2723} {"train_loss": -42.92961502075195, "global_step": 329599, "epoch": 2723} {"train_loss": -42.587249755859375, "global_step": 329600, "epoch": 2723} {"train_loss": -42.63950729370117, "global_step": 329601, "epoch": 2723} {"train_loss": -42.80548095703125, "global_step": 329602, "epoch": 2723} {"train_loss": -41.50089861341744, "global_step": 329603, "epoch": 2723, "val_loss": 2614047.25} {"train_loss": -42.59959030151367, "global_step": 329604, "epoch": 2724} {"train_loss": -38.38020706176758, "global_step": 329605, "epoch": 2724} {"train_loss": -42.755401611328125, "global_step": 329606, "epoch": 2724} {"train_loss": -42.09193801879883, "global_step": 329607, "epoch": 2724} {"train_loss": -42.36625289916992, "global_step": 329608, "epoch": 2724} {"train_loss": -43.02085494995117, "global_step": 329609, "epoch": 2724} {"train_loss": -42.29305648803711, "global_step": 329610, "epoch": 2724} {"train_loss": -36.492977142333984, "global_step": 329611, "epoch": 2724} {"train_loss": -43.145668029785156, "global_step": 329612, "epoch": 2724} {"train_loss": -43.15497970581055, "global_step": 329613, "epoch": 2724} {"train_loss": -43.11137008666992, "global_step": 329614, "epoch": 2724} {"train_loss": -41.899574279785156, "global_step": 329615, "epoch": 2724} {"train_loss": -43.473602294921875, "global_step": 329616, "epoch": 2724} {"train_loss": -37.85610580444336, "global_step": 329617, "epoch": 2724} {"train_loss": -42.233642578125, "global_step": 329618, "epoch": 2724} {"train_loss": -42.982757568359375, "global_step": 329619, "epoch": 2724} {"train_loss": -43.71810531616211, "global_step": 329620, "epoch": 2724} {"train_loss": -44.13865661621094, "global_step": 329621, "epoch": 2724} {"train_loss": -41.453094482421875, "global_step": 329622, "epoch": 2724} {"train_loss": -42.92335891723633, "global_step": 329623, "epoch": 2724} {"train_loss": -43.585567474365234, "global_step": 329624, "epoch": 2724} {"train_loss": -43.42707443237305, "global_step": 329625, "epoch": 2724} {"train_loss": -41.32295608520508, "global_step": 329626, "epoch": 2724} {"train_loss": -43.12728500366211, "global_step": 329627, "epoch": 2724} {"train_loss": -42.28513717651367, "global_step": 329628, "epoch": 2724} {"train_loss": -43.13157272338867, "global_step": 329629, "epoch": 2724} {"train_loss": -43.2767333984375, "global_step": 329630, "epoch": 2724} {"train_loss": -43.52680587768555, "global_step": 329631, "epoch": 2724} {"train_loss": -43.27085876464844, "global_step": 329632, "epoch": 2724} {"train_loss": -42.2566032409668, "global_step": 329633, "epoch": 2724} {"train_loss": -43.07603454589844, "global_step": 329634, "epoch": 2724} {"train_loss": -36.85041427612305, "global_step": 329635, "epoch": 2724} {"train_loss": -43.68874740600586, "global_step": 329636, "epoch": 2724} {"train_loss": -43.76810836791992, "global_step": 329637, "epoch": 2724} {"train_loss": -43.518714904785156, "global_step": 329638, "epoch": 2724} {"train_loss": -40.30470275878906, "global_step": 329639, "epoch": 2724} {"train_loss": -40.61286544799805, "global_step": 329640, "epoch": 2724} {"train_loss": -42.54365158081055, "global_step": 329641, "epoch": 2724} {"train_loss": -42.47538375854492, "global_step": 329642, "epoch": 2724} {"train_loss": -42.195770263671875, "global_step": 329643, "epoch": 2724} {"train_loss": -41.944915771484375, "global_step": 329644, "epoch": 2724} {"train_loss": -41.89919662475586, "global_step": 329645, "epoch": 2724} {"train_loss": -42.83262634277344, "global_step": 329646, "epoch": 2724} {"train_loss": -43.01998519897461, "global_step": 329647, "epoch": 2724} {"train_loss": -43.476192474365234, "global_step": 329648, "epoch": 2724} {"train_loss": -42.52812576293945, "global_step": 329649, "epoch": 2724} {"train_loss": -43.09682083129883, "global_step": 329650, "epoch": 2724} {"train_loss": -43.02871322631836, "global_step": 329651, "epoch": 2724} {"train_loss": -41.906856536865234, "global_step": 329652, "epoch": 2724} {"train_loss": -43.300655364990234, "global_step": 329653, "epoch": 2724} {"train_loss": -40.55073928833008, "global_step": 329654, "epoch": 2724} {"train_loss": -43.677425384521484, "global_step": 329655, "epoch": 2724} {"train_loss": -43.33173370361328, "global_step": 329656, "epoch": 2724} {"train_loss": -42.8360481262207, "global_step": 329657, "epoch": 2724} {"train_loss": -43.70363235473633, "global_step": 329658, "epoch": 2724} {"train_loss": -43.36440658569336, "global_step": 329659, "epoch": 2724} {"train_loss": -40.51506423950195, "global_step": 329660, "epoch": 2724} {"train_loss": -43.63508987426758, "global_step": 329661, "epoch": 2724} {"train_loss": -42.5723762512207, "global_step": 329662, "epoch": 2724} {"train_loss": -43.34136962890625, "global_step": 329663, "epoch": 2724} {"train_loss": -42.30860900878906, "global_step": 329664, "epoch": 2724} {"train_loss": -42.6031494140625, "global_step": 329665, "epoch": 2724} {"train_loss": -42.18839645385742, "global_step": 329666, "epoch": 2724} {"train_loss": -43.51696014404297, "global_step": 329667, "epoch": 2724} {"train_loss": -41.49652862548828, "global_step": 329668, "epoch": 2724} {"train_loss": -41.170387268066406, "global_step": 329669, "epoch": 2724} {"train_loss": -42.669586181640625, "global_step": 329670, "epoch": 2724} {"train_loss": -34.14382553100586, "global_step": 329671, "epoch": 2724} {"train_loss": -43.57015609741211, "global_step": 329672, "epoch": 2724} {"train_loss": -43.33529281616211, "global_step": 329673, "epoch": 2724} {"train_loss": -42.461570739746094, "global_step": 329674, "epoch": 2724} {"train_loss": -43.28064727783203, "global_step": 329675, "epoch": 2724} {"train_loss": -42.885643005371094, "global_step": 329676, "epoch": 2724} {"train_loss": -39.83378219604492, "global_step": 329677, "epoch": 2724} {"train_loss": -41.2879524230957, "global_step": 329678, "epoch": 2724} {"train_loss": -42.210784912109375, "global_step": 329679, "epoch": 2724} {"train_loss": -40.03438949584961, "global_step": 329680, "epoch": 2724} {"train_loss": -41.7091064453125, "global_step": 329681, "epoch": 2724} {"train_loss": -42.822845458984375, "global_step": 329682, "epoch": 2724} {"train_loss": -41.56517791748047, "global_step": 329683, "epoch": 2724} {"train_loss": -42.335960388183594, "global_step": 329684, "epoch": 2724} {"train_loss": -39.57841110229492, "global_step": 329685, "epoch": 2724} {"train_loss": -43.10441970825195, "global_step": 329686, "epoch": 2724} {"train_loss": -38.546234130859375, "global_step": 329687, "epoch": 2724} {"train_loss": -42.37269973754883, "global_step": 329688, "epoch": 2724} {"train_loss": -40.53961944580078, "global_step": 329689, "epoch": 2724} {"train_loss": -42.48995590209961, "global_step": 329690, "epoch": 2724} {"train_loss": -41.34126663208008, "global_step": 329691, "epoch": 2724} {"train_loss": -41.395057678222656, "global_step": 329692, "epoch": 2724} {"train_loss": -40.78379440307617, "global_step": 329693, "epoch": 2724} {"train_loss": -40.56399917602539, "global_step": 329694, "epoch": 2724} {"train_loss": -42.62946701049805, "global_step": 329695, "epoch": 2724} {"train_loss": -38.43101119995117, "global_step": 329696, "epoch": 2724} {"train_loss": -41.018890380859375, "global_step": 329697, "epoch": 2724} {"train_loss": -41.58840560913086, "global_step": 329698, "epoch": 2724} {"train_loss": -40.91264343261719, "global_step": 329699, "epoch": 2724} {"train_loss": -42.11763000488281, "global_step": 329700, "epoch": 2724} {"train_loss": -40.874114990234375, "global_step": 329701, "epoch": 2724} {"train_loss": -42.21175765991211, "global_step": 329702, "epoch": 2724} {"train_loss": -41.5284538269043, "global_step": 329703, "epoch": 2724} {"train_loss": -40.940155029296875, "global_step": 329704, "epoch": 2724} {"train_loss": -41.39070129394531, "global_step": 329705, "epoch": 2724} {"train_loss": -41.73703384399414, "global_step": 329706, "epoch": 2724} {"train_loss": -41.95174026489258, "global_step": 329707, "epoch": 2724} {"train_loss": -41.208553314208984, "global_step": 329708, "epoch": 2724} {"train_loss": -42.35653305053711, "global_step": 329709, "epoch": 2724} {"train_loss": -42.56458282470703, "global_step": 329710, "epoch": 2724} {"train_loss": -42.37175369262695, "global_step": 329711, "epoch": 2724} {"train_loss": -41.56008529663086, "global_step": 329712, "epoch": 2724} {"train_loss": -40.93697738647461, "global_step": 329713, "epoch": 2724} {"train_loss": -42.2098388671875, "global_step": 329714, "epoch": 2724} {"train_loss": -41.398719787597656, "global_step": 329715, "epoch": 2724} {"train_loss": -41.23075485229492, "global_step": 329716, "epoch": 2724} {"train_loss": -41.87156295776367, "global_step": 329717, "epoch": 2724} {"train_loss": -36.1085205078125, "global_step": 329718, "epoch": 2724} {"train_loss": -40.665626525878906, "global_step": 329719, "epoch": 2724} {"train_loss": -39.10477066040039, "global_step": 329720, "epoch": 2724} {"train_loss": -41.949371337890625, "global_step": 329721, "epoch": 2724} {"train_loss": -40.226470947265625, "global_step": 329722, "epoch": 2724} {"train_loss": -41.816383361816406, "global_step": 329723, "epoch": 2724} {"train_loss": -41.87986859408292, "global_step": 329724, "epoch": 2724, "val_loss": 2545439.75} {"train_loss": -41.7599983215332, "global_step": 329725, "epoch": 2725} {"train_loss": -42.591392517089844, "global_step": 329726, "epoch": 2725} {"train_loss": -41.56002426147461, "global_step": 329727, "epoch": 2725} {"train_loss": -39.94342041015625, "global_step": 329728, "epoch": 2725} {"train_loss": -42.35520553588867, "global_step": 329729, "epoch": 2725} {"train_loss": -35.595191955566406, "global_step": 329730, "epoch": 2725} {"train_loss": -41.87676239013672, "global_step": 329731, "epoch": 2725} {"train_loss": -42.085105895996094, "global_step": 329732, "epoch": 2725} {"train_loss": -42.7921028137207, "global_step": 329733, "epoch": 2725} {"train_loss": -42.007076263427734, "global_step": 329734, "epoch": 2725} {"train_loss": -42.65675735473633, "global_step": 329735, "epoch": 2725} {"train_loss": -41.96141052246094, "global_step": 329736, "epoch": 2725} {"train_loss": -42.94950485229492, "global_step": 329737, "epoch": 2725} {"train_loss": -42.35251998901367, "global_step": 329738, "epoch": 2725} {"train_loss": -43.33205032348633, "global_step": 329739, "epoch": 2725} {"train_loss": -42.840309143066406, "global_step": 329740, "epoch": 2725} {"train_loss": -42.69974899291992, "global_step": 329741, "epoch": 2725} {"train_loss": -43.394126892089844, "global_step": 329742, "epoch": 2725} {"train_loss": -42.610042572021484, "global_step": 329743, "epoch": 2725} {"train_loss": -42.86414337158203, "global_step": 329744, "epoch": 2725} {"train_loss": -42.7115364074707, "global_step": 329745, "epoch": 2725} {"train_loss": -42.616336822509766, "global_step": 329746, "epoch": 2725} {"train_loss": -41.547218322753906, "global_step": 329747, "epoch": 2725} {"train_loss": -42.02604293823242, "global_step": 329748, "epoch": 2725} {"train_loss": -43.175025939941406, "global_step": 329749, "epoch": 2725} {"train_loss": -43.22970199584961, "global_step": 329750, "epoch": 2725} {"train_loss": -41.72487258911133, "global_step": 329751, "epoch": 2725} {"train_loss": -42.4771842956543, "global_step": 329752, "epoch": 2725} {"train_loss": -43.01420211791992, "global_step": 329753, "epoch": 2725} {"train_loss": -41.646175384521484, "global_step": 329754, "epoch": 2725} {"train_loss": -43.466121673583984, "global_step": 329755, "epoch": 2725} {"train_loss": -41.526458740234375, "global_step": 329756, "epoch": 2725} {"train_loss": -43.466915130615234, "global_step": 329757, "epoch": 2725} {"train_loss": -43.3040771484375, "global_step": 329758, "epoch": 2725} {"train_loss": -41.64316940307617, "global_step": 329759, "epoch": 2725} {"train_loss": -43.548763275146484, "global_step": 329760, "epoch": 2725} {"train_loss": -42.24846267700195, "global_step": 329761, "epoch": 2725} {"train_loss": -43.199188232421875, "global_step": 329762, "epoch": 2725} {"train_loss": -42.783565521240234, "global_step": 329763, "epoch": 2725} {"train_loss": -43.27291488647461, "global_step": 329764, "epoch": 2725} {"train_loss": -43.00233840942383, "global_step": 329765, "epoch": 2725} {"train_loss": -41.6307487487793, "global_step": 329766, "epoch": 2725} {"train_loss": -42.387184143066406, "global_step": 329767, "epoch": 2725} {"train_loss": -42.568031311035156, "global_step": 329768, "epoch": 2725} {"train_loss": -43.03275680541992, "global_step": 329769, "epoch": 2725} {"train_loss": -43.322933197021484, "global_step": 329770, "epoch": 2725} {"train_loss": -43.725582122802734, "global_step": 329771, "epoch": 2725} {"train_loss": -43.57612609863281, "global_step": 329772, "epoch": 2725} {"train_loss": -42.898616790771484, "global_step": 329773, "epoch": 2725} {"train_loss": -43.80926513671875, "global_step": 329774, "epoch": 2725} {"train_loss": -42.85787582397461, "global_step": 329775, "epoch": 2725} {"train_loss": -43.436641693115234, "global_step": 329776, "epoch": 2725} {"train_loss": -43.825008392333984, "global_step": 329777, "epoch": 2725} {"train_loss": -43.0994873046875, "global_step": 329778, "epoch": 2725} {"train_loss": -43.60957717895508, "global_step": 329779, "epoch": 2725} {"train_loss": -43.532474517822266, "global_step": 329780, "epoch": 2725} {"train_loss": -43.288509368896484, "global_step": 329781, "epoch": 2725} {"train_loss": -44.07406234741211, "global_step": 329782, "epoch": 2725} {"train_loss": -43.5984992980957, "global_step": 329783, "epoch": 2725} {"train_loss": -43.777095794677734, "global_step": 329784, "epoch": 2725} {"train_loss": -43.088314056396484, "global_step": 329785, "epoch": 2725} {"train_loss": -41.92544174194336, "global_step": 329786, "epoch": 2725} {"train_loss": -41.56011962890625, "global_step": 329787, "epoch": 2725} {"train_loss": -43.1651496887207, "global_step": 329788, "epoch": 2725} {"train_loss": -43.279022216796875, "global_step": 329789, "epoch": 2725} {"train_loss": -43.23419952392578, "global_step": 329790, "epoch": 2725} {"train_loss": -42.30782699584961, "global_step": 329791, "epoch": 2725} {"train_loss": -43.720947265625, "global_step": 329792, "epoch": 2725} {"train_loss": -44.09756851196289, "global_step": 329793, "epoch": 2725} {"train_loss": -43.886146545410156, "global_step": 329794, "epoch": 2725} {"train_loss": -43.14126968383789, "global_step": 329795, "epoch": 2725} {"train_loss": -42.28365707397461, "global_step": 329796, "epoch": 2725} {"train_loss": -43.0452995300293, "global_step": 329797, "epoch": 2725} {"train_loss": -42.22385787963867, "global_step": 329798, "epoch": 2725} {"train_loss": -43.28117370605469, "global_step": 329799, "epoch": 2725} {"train_loss": -43.01191329956055, "global_step": 329800, "epoch": 2725} {"train_loss": -42.83575439453125, "global_step": 329801, "epoch": 2725} {"train_loss": -43.23971176147461, "global_step": 329802, "epoch": 2725} {"train_loss": -39.792999267578125, "global_step": 329803, "epoch": 2725} {"train_loss": -40.282325744628906, "global_step": 329804, "epoch": 2725} {"train_loss": -41.124267578125, "global_step": 329805, "epoch": 2725} {"train_loss": -42.252418518066406, "global_step": 329806, "epoch": 2725} {"train_loss": -40.478450775146484, "global_step": 329807, "epoch": 2725} {"train_loss": -36.38663864135742, "global_step": 329808, "epoch": 2725} {"train_loss": -41.10538864135742, "global_step": 329809, "epoch": 2725} {"train_loss": -41.651947021484375, "global_step": 329810, "epoch": 2725} {"train_loss": -39.18333053588867, "global_step": 329811, "epoch": 2725} {"train_loss": -42.07075881958008, "global_step": 329812, "epoch": 2725} {"train_loss": -41.765167236328125, "global_step": 329813, "epoch": 2725} {"train_loss": -38.09934616088867, "global_step": 329814, "epoch": 2725} {"train_loss": -42.004852294921875, "global_step": 329815, "epoch": 2725} {"train_loss": -41.940425872802734, "global_step": 329816, "epoch": 2725} {"train_loss": -41.69462585449219, "global_step": 329817, "epoch": 2725} {"train_loss": -42.695274353027344, "global_step": 329818, "epoch": 2725} {"train_loss": -41.54618453979492, "global_step": 329819, "epoch": 2725} {"train_loss": -43.02883529663086, "global_step": 329820, "epoch": 2725} {"train_loss": -42.217803955078125, "global_step": 329821, "epoch": 2725} {"train_loss": -43.02302169799805, "global_step": 329822, "epoch": 2725} {"train_loss": -42.53694152832031, "global_step": 329823, "epoch": 2725} {"train_loss": -42.84004592895508, "global_step": 329824, "epoch": 2725} {"train_loss": -43.87001419067383, "global_step": 329825, "epoch": 2725} {"train_loss": -42.628379821777344, "global_step": 329826, "epoch": 2725} {"train_loss": -41.92506408691406, "global_step": 329827, "epoch": 2725} {"train_loss": -43.476619720458984, "global_step": 329828, "epoch": 2725} {"train_loss": -43.511016845703125, "global_step": 329829, "epoch": 2725} {"train_loss": -43.419898986816406, "global_step": 329830, "epoch": 2725} {"train_loss": -43.656951904296875, "global_step": 329831, "epoch": 2725} {"train_loss": -43.4310188293457, "global_step": 329832, "epoch": 2725} {"train_loss": -42.83522415161133, "global_step": 329833, "epoch": 2725} {"train_loss": -43.24930953979492, "global_step": 329834, "epoch": 2725} {"train_loss": -42.63697814941406, "global_step": 329835, "epoch": 2725} {"train_loss": -43.34980392456055, "global_step": 329836, "epoch": 2725} {"train_loss": -41.52895736694336, "global_step": 329837, "epoch": 2725} {"train_loss": -43.74569320678711, "global_step": 329838, "epoch": 2725} {"train_loss": -43.23883819580078, "global_step": 329839, "epoch": 2725} {"train_loss": -43.5669059753418, "global_step": 329840, "epoch": 2725} {"train_loss": -40.788021087646484, "global_step": 329841, "epoch": 2725} {"train_loss": -43.141883850097656, "global_step": 329842, "epoch": 2725} {"train_loss": -43.7478141784668, "global_step": 329843, "epoch": 2725} {"train_loss": -43.336944580078125, "global_step": 329844, "epoch": 2725} {"train_loss": -42.50765559298933, "global_step": 329845, "epoch": 2725, "val_loss": 2460054.25} {"train_loss": -43.300559997558594, "global_step": 329846, "epoch": 2726} {"train_loss": -42.548316955566406, "global_step": 329847, "epoch": 2726} {"train_loss": -43.26361083984375, "global_step": 329848, "epoch": 2726} {"train_loss": -43.70172119140625, "global_step": 329849, "epoch": 2726} {"train_loss": -42.8497428894043, "global_step": 329850, "epoch": 2726} {"train_loss": -43.19468307495117, "global_step": 329851, "epoch": 2726} {"train_loss": -43.75997543334961, "global_step": 329852, "epoch": 2726} {"train_loss": -43.79930114746094, "global_step": 329853, "epoch": 2726} {"train_loss": -43.19679260253906, "global_step": 329854, "epoch": 2726} {"train_loss": -43.19413757324219, "global_step": 329855, "epoch": 2726} {"train_loss": -43.50615310668945, "global_step": 329856, "epoch": 2726} {"train_loss": -43.767879486083984, "global_step": 329857, "epoch": 2726} {"train_loss": -43.60334396362305, "global_step": 329858, "epoch": 2726} {"train_loss": -43.76624298095703, "global_step": 329859, "epoch": 2726} {"train_loss": -43.26511764526367, "global_step": 329860, "epoch": 2726} {"train_loss": -43.93042755126953, "global_step": 329861, "epoch": 2726} {"train_loss": -43.66199493408203, "global_step": 329862, "epoch": 2726} {"train_loss": -43.28591537475586, "global_step": 329863, "epoch": 2726} {"train_loss": -43.67002487182617, "global_step": 329864, "epoch": 2726} {"train_loss": -43.31549835205078, "global_step": 329865, "epoch": 2726} {"train_loss": -42.9981803894043, "global_step": 329866, "epoch": 2726} {"train_loss": -43.540653228759766, "global_step": 329867, "epoch": 2726} {"train_loss": -43.527034759521484, "global_step": 329868, "epoch": 2726} {"train_loss": -42.94434356689453, "global_step": 329869, "epoch": 2726} {"train_loss": -42.30432891845703, "global_step": 329870, "epoch": 2726} {"train_loss": -42.39686965942383, "global_step": 329871, "epoch": 2726} {"train_loss": -43.48642349243164, "global_step": 329872, "epoch": 2726} {"train_loss": -44.16488265991211, "global_step": 329873, "epoch": 2726} {"train_loss": -39.42243957519531, "global_step": 329874, "epoch": 2726} {"train_loss": -41.161720275878906, "global_step": 329875, "epoch": 2726} {"train_loss": -41.159202575683594, "global_step": 329876, "epoch": 2726} {"train_loss": -43.45066452026367, "global_step": 329877, "epoch": 2726} {"train_loss": -43.626705169677734, "global_step": 329878, "epoch": 2726} {"train_loss": -41.698970794677734, "global_step": 329879, "epoch": 2726} {"train_loss": -42.35555648803711, "global_step": 329880, "epoch": 2726} {"train_loss": -43.33512496948242, "global_step": 329881, "epoch": 2726} {"train_loss": -44.27450942993164, "global_step": 329882, "epoch": 2726} {"train_loss": -43.6246337890625, "global_step": 329883, "epoch": 2726} {"train_loss": -43.376705169677734, "global_step": 329884, "epoch": 2726} {"train_loss": -43.459251403808594, "global_step": 329885, "epoch": 2726} {"train_loss": -43.902034759521484, "global_step": 329886, "epoch": 2726} {"train_loss": -42.92629623413086, "global_step": 329887, "epoch": 2726} {"train_loss": -43.81438064575195, "global_step": 329888, "epoch": 2726} {"train_loss": -43.560543060302734, "global_step": 329889, "epoch": 2726} {"train_loss": -43.67655563354492, "global_step": 329890, "epoch": 2726} {"train_loss": -42.830543518066406, "global_step": 329891, "epoch": 2726} {"train_loss": -42.94077682495117, "global_step": 329892, "epoch": 2726} {"train_loss": -42.9940299987793, "global_step": 329893, "epoch": 2726} {"train_loss": -43.71970748901367, "global_step": 329894, "epoch": 2726} {"train_loss": -43.18253707885742, "global_step": 329895, "epoch": 2726} {"train_loss": -40.980167388916016, "global_step": 329896, "epoch": 2726} {"train_loss": -42.59065628051758, "global_step": 329897, "epoch": 2726} {"train_loss": -43.1595458984375, "global_step": 329898, "epoch": 2726} {"train_loss": -42.080108642578125, "global_step": 329899, "epoch": 2726} {"train_loss": -42.88526153564453, "global_step": 329900, "epoch": 2726} {"train_loss": -42.81541061401367, "global_step": 329901, "epoch": 2726} {"train_loss": -43.8769645690918, "global_step": 329902, "epoch": 2726} {"train_loss": -43.36227035522461, "global_step": 329903, "epoch": 2726} {"train_loss": -43.57727813720703, "global_step": 329904, "epoch": 2726} {"train_loss": -42.65141296386719, "global_step": 329905, "epoch": 2726} {"train_loss": -42.60770797729492, "global_step": 329906, "epoch": 2726} {"train_loss": -43.6451416015625, "global_step": 329907, "epoch": 2726} {"train_loss": -44.27070236206055, "global_step": 329908, "epoch": 2726} {"train_loss": -43.78336715698242, "global_step": 329909, "epoch": 2726} {"train_loss": -43.555320739746094, "global_step": 329910, "epoch": 2726} {"train_loss": -44.018760681152344, "global_step": 329911, "epoch": 2726} {"train_loss": -43.28021240234375, "global_step": 329912, "epoch": 2726} {"train_loss": -43.28830337524414, "global_step": 329913, "epoch": 2726} {"train_loss": -43.887142181396484, "global_step": 329914, "epoch": 2726} {"train_loss": -43.52596664428711, "global_step": 329915, "epoch": 2726} {"train_loss": -43.79951095581055, "global_step": 329916, "epoch": 2726} {"train_loss": -43.895530700683594, "global_step": 329917, "epoch": 2726} {"train_loss": -43.84759521484375, "global_step": 329918, "epoch": 2726} {"train_loss": -42.52932357788086, "global_step": 329919, "epoch": 2726} {"train_loss": -44.25858688354492, "global_step": 329920, "epoch": 2726} {"train_loss": -43.35525131225586, "global_step": 329921, "epoch": 2726} {"train_loss": -44.24663162231445, "global_step": 329922, "epoch": 2726} {"train_loss": -42.98157501220703, "global_step": 329923, "epoch": 2726} {"train_loss": -43.55779266357422, "global_step": 329924, "epoch": 2726} {"train_loss": -43.129432678222656, "global_step": 329925, "epoch": 2726} {"train_loss": -42.919334411621094, "global_step": 329926, "epoch": 2726} {"train_loss": -42.90394973754883, "global_step": 329927, "epoch": 2726} {"train_loss": -43.80182647705078, "global_step": 329928, "epoch": 2726} {"train_loss": -42.98035430908203, "global_step": 329929, "epoch": 2726} {"train_loss": -43.416053771972656, "global_step": 329930, "epoch": 2726} {"train_loss": -43.147125244140625, "global_step": 329931, "epoch": 2726} {"train_loss": -42.915802001953125, "global_step": 329932, "epoch": 2726} {"train_loss": -43.669002532958984, "global_step": 329933, "epoch": 2726} {"train_loss": -43.993282318115234, "global_step": 329934, "epoch": 2726} {"train_loss": -43.151546478271484, "global_step": 329935, "epoch": 2726} {"train_loss": -43.16288375854492, "global_step": 329936, "epoch": 2726} {"train_loss": -43.07778549194336, "global_step": 329937, "epoch": 2726} {"train_loss": -41.70148849487305, "global_step": 329938, "epoch": 2726} {"train_loss": -40.335914611816406, "global_step": 329939, "epoch": 2726} {"train_loss": -41.5030632019043, "global_step": 329940, "epoch": 2726} {"train_loss": -42.2138671875, "global_step": 329941, "epoch": 2726} {"train_loss": -43.52676010131836, "global_step": 329942, "epoch": 2726} {"train_loss": -43.96052169799805, "global_step": 329943, "epoch": 2726} {"train_loss": -43.447792053222656, "global_step": 329944, "epoch": 2726} {"train_loss": -43.48869705200195, "global_step": 329945, "epoch": 2726} {"train_loss": -43.26023483276367, "global_step": 329946, "epoch": 2726} {"train_loss": -44.051536560058594, "global_step": 329947, "epoch": 2726} {"train_loss": -42.38967514038086, "global_step": 329948, "epoch": 2726} {"train_loss": -43.34791946411133, "global_step": 329949, "epoch": 2726} {"train_loss": -43.700958251953125, "global_step": 329950, "epoch": 2726} {"train_loss": -43.3095703125, "global_step": 329951, "epoch": 2726} {"train_loss": -43.764278411865234, "global_step": 329952, "epoch": 2726} {"train_loss": -43.946651458740234, "global_step": 329953, "epoch": 2726} {"train_loss": -40.82589340209961, "global_step": 329954, "epoch": 2726} {"train_loss": -39.52897262573242, "global_step": 329955, "epoch": 2726} {"train_loss": -37.661659240722656, "global_step": 329956, "epoch": 2726} {"train_loss": -41.09444808959961, "global_step": 329957, "epoch": 2726} {"train_loss": -43.50184631347656, "global_step": 329958, "epoch": 2726} {"train_loss": -40.589473724365234, "global_step": 329959, "epoch": 2726} {"train_loss": -39.88703155517578, "global_step": 329960, "epoch": 2726} {"train_loss": -43.45167922973633, "global_step": 329961, "epoch": 2726} {"train_loss": -41.74834060668945, "global_step": 329962, "epoch": 2726} {"train_loss": -41.36454391479492, "global_step": 329963, "epoch": 2726} {"train_loss": -42.47069549560547, "global_step": 329964, "epoch": 2726} {"train_loss": -42.62290573120117, "global_step": 329965, "epoch": 2726} {"train_loss": -42.98702810618503, "global_step": 329966, "epoch": 2726, "val_loss": 2415936.25} {"train_loss": -42.425559997558594, "global_step": 329967, "epoch": 2727} {"train_loss": -43.03035354614258, "global_step": 329968, "epoch": 2727} {"train_loss": -41.96129608154297, "global_step": 329969, "epoch": 2727} {"train_loss": -42.28695297241211, "global_step": 329970, "epoch": 2727} {"train_loss": -43.0653190612793, "global_step": 329971, "epoch": 2727} {"train_loss": -41.06425094604492, "global_step": 329972, "epoch": 2727} {"train_loss": -42.92229080200195, "global_step": 329973, "epoch": 2727} {"train_loss": -42.765621185302734, "global_step": 329974, "epoch": 2727} {"train_loss": -42.339454650878906, "global_step": 329975, "epoch": 2727} {"train_loss": -43.87711715698242, "global_step": 329976, "epoch": 2727} {"train_loss": -41.7998161315918, "global_step": 329977, "epoch": 2727} {"train_loss": -44.15693664550781, "global_step": 329978, "epoch": 2727} {"train_loss": -41.96318435668945, "global_step": 329979, "epoch": 2727} {"train_loss": -42.983680725097656, "global_step": 329980, "epoch": 2727} {"train_loss": -43.67683029174805, "global_step": 329981, "epoch": 2727} {"train_loss": -41.625831604003906, "global_step": 329982, "epoch": 2727} {"train_loss": -43.52693176269531, "global_step": 329983, "epoch": 2727} {"train_loss": -43.69797134399414, "global_step": 329984, "epoch": 2727} {"train_loss": -42.895015716552734, "global_step": 329985, "epoch": 2727} {"train_loss": -42.750244140625, "global_step": 329986, "epoch": 2727} {"train_loss": -42.907833099365234, "global_step": 329987, "epoch": 2727} {"train_loss": -42.861297607421875, "global_step": 329988, "epoch": 2727} {"train_loss": -43.08336639404297, "global_step": 329989, "epoch": 2727} {"train_loss": -43.3459358215332, "global_step": 329990, "epoch": 2727} {"train_loss": -42.968292236328125, "global_step": 329991, "epoch": 2727} {"train_loss": -44.07813262939453, "global_step": 329992, "epoch": 2727} {"train_loss": -43.077816009521484, "global_step": 329993, "epoch": 2727} {"train_loss": -43.496856689453125, "global_step": 329994, "epoch": 2727} {"train_loss": -43.44301986694336, "global_step": 329995, "epoch": 2727} {"train_loss": -43.14506530761719, "global_step": 329996, "epoch": 2727} {"train_loss": -44.519874572753906, "global_step": 329997, "epoch": 2727} {"train_loss": -43.8632698059082, "global_step": 329998, "epoch": 2727} {"train_loss": -43.755943298339844, "global_step": 329999, "epoch": 2727} {"train_loss": -43.565982818603516, "global_step": 330000, "epoch": 2727} {"train_loss": -43.5322151184082, "global_step": 330001, "epoch": 2727} {"train_loss": -44.3568115234375, "global_step": 330002, "epoch": 2727} {"train_loss": -43.8990478515625, "global_step": 330003, "epoch": 2727} {"train_loss": -44.26911544799805, "global_step": 330004, "epoch": 2727} {"train_loss": -44.12028121948242, "global_step": 330005, "epoch": 2727} {"train_loss": -43.213233947753906, "global_step": 330006, "epoch": 2727} {"train_loss": -44.0346565246582, "global_step": 330007, "epoch": 2727} {"train_loss": -44.23835372924805, "global_step": 330008, "epoch": 2727} {"train_loss": -43.84025955200195, "global_step": 330009, "epoch": 2727} {"train_loss": -44.53408432006836, "global_step": 330010, "epoch": 2727} {"train_loss": -44.23170852661133, "global_step": 330011, "epoch": 2727} {"train_loss": -43.81364059448242, "global_step": 330012, "epoch": 2727} {"train_loss": -44.580196380615234, "global_step": 330013, "epoch": 2727} {"train_loss": -44.03473663330078, "global_step": 330014, "epoch": 2727} {"train_loss": -44.1986198425293, "global_step": 330015, "epoch": 2727} {"train_loss": -44.62954330444336, "global_step": 330016, "epoch": 2727} {"train_loss": -44.159976959228516, "global_step": 330017, "epoch": 2727} {"train_loss": -44.37199020385742, "global_step": 330018, "epoch": 2727} {"train_loss": -43.73653793334961, "global_step": 330019, "epoch": 2727} {"train_loss": -43.86615753173828, "global_step": 330020, "epoch": 2727} {"train_loss": -43.98849105834961, "global_step": 330021, "epoch": 2727} {"train_loss": -43.362300872802734, "global_step": 330022, "epoch": 2727} {"train_loss": -44.06956481933594, "global_step": 330023, "epoch": 2727} {"train_loss": -44.64621353149414, "global_step": 330024, "epoch": 2727} {"train_loss": -44.036964416503906, "global_step": 330025, "epoch": 2727} {"train_loss": -43.08323287963867, "global_step": 330026, "epoch": 2727} {"train_loss": -44.6240348815918, "global_step": 330027, "epoch": 2727} {"train_loss": -43.67045974731445, "global_step": 330028, "epoch": 2727} {"train_loss": -44.108306884765625, "global_step": 330029, "epoch": 2727} {"train_loss": -44.044647216796875, "global_step": 330030, "epoch": 2727} {"train_loss": -43.696231842041016, "global_step": 330031, "epoch": 2727} {"train_loss": -44.11211013793945, "global_step": 330032, "epoch": 2727} {"train_loss": -44.37150573730469, "global_step": 330033, "epoch": 2727} {"train_loss": -43.62824630737305, "global_step": 330034, "epoch": 2727} {"train_loss": -42.65005111694336, "global_step": 330035, "epoch": 2727} {"train_loss": -44.58176803588867, "global_step": 330036, "epoch": 2727} {"train_loss": -44.114280700683594, "global_step": 330037, "epoch": 2727} {"train_loss": -42.57572555541992, "global_step": 330038, "epoch": 2727} {"train_loss": -40.684391021728516, "global_step": 330039, "epoch": 2727} {"train_loss": -41.84049606323242, "global_step": 330040, "epoch": 2727} {"train_loss": -43.86210250854492, "global_step": 330041, "epoch": 2727} {"train_loss": -42.7350959777832, "global_step": 330042, "epoch": 2727} {"train_loss": -42.14338302612305, "global_step": 330043, "epoch": 2727} {"train_loss": -44.1031608581543, "global_step": 330044, "epoch": 2727} {"train_loss": -41.679107666015625, "global_step": 330045, "epoch": 2727} {"train_loss": -42.31413650512695, "global_step": 330046, "epoch": 2727} {"train_loss": -43.148414611816406, "global_step": 330047, "epoch": 2727} {"train_loss": -42.67896270751953, "global_step": 330048, "epoch": 2727} {"train_loss": -43.381771087646484, "global_step": 330049, "epoch": 2727} {"train_loss": -43.352149963378906, "global_step": 330050, "epoch": 2727} {"train_loss": -40.5254020690918, "global_step": 330051, "epoch": 2727} {"train_loss": -42.700164794921875, "global_step": 330052, "epoch": 2727} {"train_loss": -43.6109504699707, "global_step": 330053, "epoch": 2727} {"train_loss": -42.81830978393555, "global_step": 330054, "epoch": 2727} {"train_loss": -43.07825469970703, "global_step": 330055, "epoch": 2727} {"train_loss": -43.54343795776367, "global_step": 330056, "epoch": 2727} {"train_loss": -43.34628677368164, "global_step": 330057, "epoch": 2727} {"train_loss": -41.96858596801758, "global_step": 330058, "epoch": 2727} {"train_loss": -42.38157272338867, "global_step": 330059, "epoch": 2727} {"train_loss": -43.5200309753418, "global_step": 330060, "epoch": 2727} {"train_loss": -42.921791076660156, "global_step": 330061, "epoch": 2727} {"train_loss": -42.3539924621582, "global_step": 330062, "epoch": 2727} {"train_loss": -43.45026779174805, "global_step": 330063, "epoch": 2727} {"train_loss": -43.0620002746582, "global_step": 330064, "epoch": 2727} {"train_loss": -42.30878448486328, "global_step": 330065, "epoch": 2727} {"train_loss": -42.465309143066406, "global_step": 330066, "epoch": 2727} {"train_loss": -43.980812072753906, "global_step": 330067, "epoch": 2727} {"train_loss": -42.86235427856445, "global_step": 330068, "epoch": 2727} {"train_loss": -40.0815315246582, "global_step": 330069, "epoch": 2727} {"train_loss": -42.84217071533203, "global_step": 330070, "epoch": 2727} {"train_loss": -43.155757904052734, "global_step": 330071, "epoch": 2727} {"train_loss": -42.96614456176758, "global_step": 330072, "epoch": 2727} {"train_loss": -43.83395004272461, "global_step": 330073, "epoch": 2727} {"train_loss": -43.31509017944336, "global_step": 330074, "epoch": 2727} {"train_loss": -42.80178451538086, "global_step": 330075, "epoch": 2727} {"train_loss": -42.067378997802734, "global_step": 330076, "epoch": 2727} {"train_loss": -43.001991271972656, "global_step": 330077, "epoch": 2727} {"train_loss": -43.08720016479492, "global_step": 330078, "epoch": 2727} {"train_loss": -43.26267623901367, "global_step": 330079, "epoch": 2727} {"train_loss": -42.6552619934082, "global_step": 330080, "epoch": 2727} {"train_loss": -43.20827865600586, "global_step": 330081, "epoch": 2727} {"train_loss": -41.88747787475586, "global_step": 330082, "epoch": 2727} {"train_loss": -43.734554290771484, "global_step": 330083, "epoch": 2727} {"train_loss": -43.54060363769531, "global_step": 330084, "epoch": 2727} {"train_loss": -43.59749984741211, "global_step": 330085, "epoch": 2727} {"train_loss": -44.0079345703125, "global_step": 330086, "epoch": 2727} {"train_loss": -43.253470334139735, "global_step": 330087, "epoch": 2727, "val_loss": 2418784.25} {"train_loss": -42.63541030883789, "global_step": 330088, "epoch": 2728} {"train_loss": -43.39818572998047, "global_step": 330089, "epoch": 2728} {"train_loss": -43.640350341796875, "global_step": 330090, "epoch": 2728} {"train_loss": -43.08665466308594, "global_step": 330091, "epoch": 2728} {"train_loss": -44.22834777832031, "global_step": 330092, "epoch": 2728} {"train_loss": -43.666683197021484, "global_step": 330093, "epoch": 2728} {"train_loss": -44.47047424316406, "global_step": 330094, "epoch": 2728} {"train_loss": -43.77616882324219, "global_step": 330095, "epoch": 2728} {"train_loss": -44.054534912109375, "global_step": 330096, "epoch": 2728} {"train_loss": -43.802406311035156, "global_step": 330097, "epoch": 2728} {"train_loss": -44.48383712768555, "global_step": 330098, "epoch": 2728} {"train_loss": -44.1903190612793, "global_step": 330099, "epoch": 2728} {"train_loss": -44.1639289855957, "global_step": 330100, "epoch": 2728} {"train_loss": -44.47317123413086, "global_step": 330101, "epoch": 2728} {"train_loss": -44.62721633911133, "global_step": 330102, "epoch": 2728} {"train_loss": -43.42369079589844, "global_step": 330103, "epoch": 2728} {"train_loss": -44.67573165893555, "global_step": 330104, "epoch": 2728} {"train_loss": -44.45212936401367, "global_step": 330105, "epoch": 2728} {"train_loss": -43.81829071044922, "global_step": 330106, "epoch": 2728} {"train_loss": -44.85588836669922, "global_step": 330107, "epoch": 2728} {"train_loss": -44.20779800415039, "global_step": 330108, "epoch": 2728} {"train_loss": -44.50545120239258, "global_step": 330109, "epoch": 2728} {"train_loss": -44.24920654296875, "global_step": 330110, "epoch": 2728} {"train_loss": -44.40873336791992, "global_step": 330111, "epoch": 2728} {"train_loss": -44.218719482421875, "global_step": 330112, "epoch": 2728} {"train_loss": -44.22353744506836, "global_step": 330113, "epoch": 2728} {"train_loss": -44.862152099609375, "global_step": 330114, "epoch": 2728} {"train_loss": -43.92238998413086, "global_step": 330115, "epoch": 2728} {"train_loss": -43.343990325927734, "global_step": 330116, "epoch": 2728} {"train_loss": -43.72622299194336, "global_step": 330117, "epoch": 2728} {"train_loss": -44.089969635009766, "global_step": 330118, "epoch": 2728} {"train_loss": -43.81600570678711, "global_step": 330119, "epoch": 2728} {"train_loss": -42.12289047241211, "global_step": 330120, "epoch": 2728} {"train_loss": -42.860164642333984, "global_step": 330121, "epoch": 2728} {"train_loss": -44.48433303833008, "global_step": 330122, "epoch": 2728} {"train_loss": -41.67916488647461, "global_step": 330123, "epoch": 2728} {"train_loss": -41.6337890625, "global_step": 330124, "epoch": 2728} {"train_loss": -42.786094665527344, "global_step": 330125, "epoch": 2728} {"train_loss": -41.511146545410156, "global_step": 330126, "epoch": 2728} {"train_loss": -41.952308654785156, "global_step": 330127, "epoch": 2728} {"train_loss": -40.42241287231445, "global_step": 330128, "epoch": 2728} {"train_loss": -43.508453369140625, "global_step": 330129, "epoch": 2728} {"train_loss": -41.72139358520508, "global_step": 330130, "epoch": 2728} {"train_loss": -41.74398422241211, "global_step": 330131, "epoch": 2728} {"train_loss": -43.3521614074707, "global_step": 330132, "epoch": 2728} {"train_loss": -41.908321380615234, "global_step": 330133, "epoch": 2728} {"train_loss": -43.47115707397461, "global_step": 330134, "epoch": 2728} {"train_loss": -42.77717208862305, "global_step": 330135, "epoch": 2728} {"train_loss": -41.207923889160156, "global_step": 330136, "epoch": 2728} {"train_loss": -42.79436492919922, "global_step": 330137, "epoch": 2728} {"train_loss": -41.922847747802734, "global_step": 330138, "epoch": 2728} {"train_loss": -41.297584533691406, "global_step": 330139, "epoch": 2728} {"train_loss": -41.590065002441406, "global_step": 330140, "epoch": 2728} {"train_loss": -42.427154541015625, "global_step": 330141, "epoch": 2728} {"train_loss": -42.62336349487305, "global_step": 330142, "epoch": 2728} {"train_loss": -41.829811096191406, "global_step": 330143, "epoch": 2728} {"train_loss": -42.54490280151367, "global_step": 330144, "epoch": 2728} {"train_loss": -42.41023635864258, "global_step": 330145, "epoch": 2728} {"train_loss": -42.21648406982422, "global_step": 330146, "epoch": 2728} {"train_loss": -42.5890007019043, "global_step": 330147, "epoch": 2728} {"train_loss": -42.95585250854492, "global_step": 330148, "epoch": 2728} {"train_loss": -42.50014114379883, "global_step": 330149, "epoch": 2728} {"train_loss": -42.41191482543945, "global_step": 330150, "epoch": 2728} {"train_loss": -42.89284896850586, "global_step": 330151, "epoch": 2728} {"train_loss": -42.594539642333984, "global_step": 330152, "epoch": 2728} {"train_loss": -42.86149215698242, "global_step": 330153, "epoch": 2728} {"train_loss": -43.237457275390625, "global_step": 330154, "epoch": 2728} {"train_loss": -42.4219856262207, "global_step": 330155, "epoch": 2728} {"train_loss": -43.205013275146484, "global_step": 330156, "epoch": 2728} {"train_loss": -42.775489807128906, "global_step": 330157, "epoch": 2728} {"train_loss": -43.491878509521484, "global_step": 330158, "epoch": 2728} {"train_loss": -42.9490852355957, "global_step": 330159, "epoch": 2728} {"train_loss": -43.50959014892578, "global_step": 330160, "epoch": 2728} {"train_loss": -43.6044807434082, "global_step": 330161, "epoch": 2728} {"train_loss": -42.8877067565918, "global_step": 330162, "epoch": 2728} {"train_loss": -44.047725677490234, "global_step": 330163, "epoch": 2728} {"train_loss": -43.24617385864258, "global_step": 330164, "epoch": 2728} {"train_loss": -43.07497024536133, "global_step": 330165, "epoch": 2728} {"train_loss": -43.125732421875, "global_step": 330166, "epoch": 2728} {"train_loss": -43.48895263671875, "global_step": 330167, "epoch": 2728} {"train_loss": -43.60893630981445, "global_step": 330168, "epoch": 2728} {"train_loss": -43.8072509765625, "global_step": 330169, "epoch": 2728} {"train_loss": -43.974849700927734, "global_step": 330170, "epoch": 2728} {"train_loss": -43.79328536987305, "global_step": 330171, "epoch": 2728} {"train_loss": -43.51860427856445, "global_step": 330172, "epoch": 2728} {"train_loss": -43.966060638427734, "global_step": 330173, "epoch": 2728} {"train_loss": -43.820491790771484, "global_step": 330174, "epoch": 2728} {"train_loss": -43.9882926940918, "global_step": 330175, "epoch": 2728} {"train_loss": -44.1866569519043, "global_step": 330176, "epoch": 2728} {"train_loss": -43.65193557739258, "global_step": 330177, "epoch": 2728} {"train_loss": -43.79905700683594, "global_step": 330178, "epoch": 2728} {"train_loss": -44.647396087646484, "global_step": 330179, "epoch": 2728} {"train_loss": -44.010555267333984, "global_step": 330180, "epoch": 2728} {"train_loss": -43.6904411315918, "global_step": 330181, "epoch": 2728} {"train_loss": -43.62746047973633, "global_step": 330182, "epoch": 2728} {"train_loss": -43.857704162597656, "global_step": 330183, "epoch": 2728} {"train_loss": -44.3715705871582, "global_step": 330184, "epoch": 2728} {"train_loss": -44.317012786865234, "global_step": 330185, "epoch": 2728} {"train_loss": -43.46113967895508, "global_step": 330186, "epoch": 2728} {"train_loss": -44.54010772705078, "global_step": 330187, "epoch": 2728} {"train_loss": -43.64958190917969, "global_step": 330188, "epoch": 2728} {"train_loss": -43.16659164428711, "global_step": 330189, "epoch": 2728} {"train_loss": -43.5911750793457, "global_step": 330190, "epoch": 2728} {"train_loss": -44.4005126953125, "global_step": 330191, "epoch": 2728} {"train_loss": -43.619380950927734, "global_step": 330192, "epoch": 2728} {"train_loss": -43.53895568847656, "global_step": 330193, "epoch": 2728} {"train_loss": -44.663143157958984, "global_step": 330194, "epoch": 2728} {"train_loss": -44.46649169921875, "global_step": 330195, "epoch": 2728} {"train_loss": -44.0550422668457, "global_step": 330196, "epoch": 2728} {"train_loss": -44.51522445678711, "global_step": 330197, "epoch": 2728} {"train_loss": -44.31527328491211, "global_step": 330198, "epoch": 2728} {"train_loss": -44.545867919921875, "global_step": 330199, "epoch": 2728} {"train_loss": -44.55495834350586, "global_step": 330200, "epoch": 2728} {"train_loss": -44.70406723022461, "global_step": 330201, "epoch": 2728} {"train_loss": -44.89681625366211, "global_step": 330202, "epoch": 2728} {"train_loss": -43.75196075439453, "global_step": 330203, "epoch": 2728} {"train_loss": -44.600799560546875, "global_step": 330204, "epoch": 2728} {"train_loss": -45.02370834350586, "global_step": 330205, "epoch": 2728} {"train_loss": -43.871917724609375, "global_step": 330206, "epoch": 2728} {"train_loss": -44.25209426879883, "global_step": 330207, "epoch": 2728} {"train_loss": -43.48091506958008, "global_step": 330208, "epoch": 2728, "val_loss": 2478653.75} {"train_loss": -44.32099533081055, "global_step": 330209, "epoch": 2729} {"train_loss": -44.07630157470703, "global_step": 330210, "epoch": 2729} {"train_loss": -43.59440994262695, "global_step": 330211, "epoch": 2729} {"train_loss": -44.75980758666992, "global_step": 330212, "epoch": 2729} {"train_loss": -44.31998825073242, "global_step": 330213, "epoch": 2729} {"train_loss": -43.69197463989258, "global_step": 330214, "epoch": 2729} {"train_loss": -43.0546989440918, "global_step": 330215, "epoch": 2729} {"train_loss": -41.4581184387207, "global_step": 330216, "epoch": 2729} {"train_loss": -40.23842239379883, "global_step": 330217, "epoch": 2729} {"train_loss": -42.229766845703125, "global_step": 330218, "epoch": 2729} {"train_loss": -43.725704193115234, "global_step": 330219, "epoch": 2729} {"train_loss": -41.947181701660156, "global_step": 330220, "epoch": 2729} {"train_loss": -41.3486442565918, "global_step": 330221, "epoch": 2729} {"train_loss": -41.55904769897461, "global_step": 330222, "epoch": 2729} {"train_loss": -42.243682861328125, "global_step": 330223, "epoch": 2729} {"train_loss": -40.36159133911133, "global_step": 330224, "epoch": 2729} {"train_loss": -41.39561080932617, "global_step": 330225, "epoch": 2729} {"train_loss": -42.61640930175781, "global_step": 330226, "epoch": 2729} {"train_loss": -43.5588264465332, "global_step": 330227, "epoch": 2729} {"train_loss": -41.18749237060547, "global_step": 330228, "epoch": 2729} {"train_loss": -41.95027542114258, "global_step": 330229, "epoch": 2729} {"train_loss": -42.60970687866211, "global_step": 330230, "epoch": 2729} {"train_loss": -42.24704360961914, "global_step": 330231, "epoch": 2729} {"train_loss": -41.72030258178711, "global_step": 330232, "epoch": 2729} {"train_loss": -42.961910247802734, "global_step": 330233, "epoch": 2729} {"train_loss": -43.42304992675781, "global_step": 330234, "epoch": 2729} {"train_loss": -43.81541442871094, "global_step": 330235, "epoch": 2729} {"train_loss": -43.134422302246094, "global_step": 330236, "epoch": 2729} {"train_loss": -43.66071701049805, "global_step": 330237, "epoch": 2729} {"train_loss": -43.5388298034668, "global_step": 330238, "epoch": 2729} {"train_loss": -43.68973159790039, "global_step": 330239, "epoch": 2729} {"train_loss": -43.196006774902344, "global_step": 330240, "epoch": 2729} {"train_loss": -43.72158432006836, "global_step": 330241, "epoch": 2729} {"train_loss": -43.50774002075195, "global_step": 330242, "epoch": 2729} {"train_loss": -43.977718353271484, "global_step": 330243, "epoch": 2729} {"train_loss": -44.19820022583008, "global_step": 330244, "epoch": 2729} {"train_loss": -44.230770111083984, "global_step": 330245, "epoch": 2729} {"train_loss": -44.078365325927734, "global_step": 330246, "epoch": 2729} {"train_loss": -44.35016632080078, "global_step": 330247, "epoch": 2729} {"train_loss": -44.583736419677734, "global_step": 330248, "epoch": 2729} {"train_loss": -43.844539642333984, "global_step": 330249, "epoch": 2729} {"train_loss": -44.185943603515625, "global_step": 330250, "epoch": 2729} {"train_loss": -44.141822814941406, "global_step": 330251, "epoch": 2729} {"train_loss": -43.440433502197266, "global_step": 330252, "epoch": 2729} {"train_loss": -44.29008102416992, "global_step": 330253, "epoch": 2729} {"train_loss": -44.5727653503418, "global_step": 330254, "epoch": 2729} {"train_loss": -44.096343994140625, "global_step": 330255, "epoch": 2729} {"train_loss": -44.41931915283203, "global_step": 330256, "epoch": 2729} {"train_loss": -44.06686019897461, "global_step": 330257, "epoch": 2729} {"train_loss": -44.34296798706055, "global_step": 330258, "epoch": 2729} {"train_loss": -44.18198776245117, "global_step": 330259, "epoch": 2729} {"train_loss": -43.68998718261719, "global_step": 330260, "epoch": 2729} {"train_loss": -43.555965423583984, "global_step": 330261, "epoch": 2729} {"train_loss": -43.32148361206055, "global_step": 330262, "epoch": 2729} {"train_loss": -42.761287689208984, "global_step": 330263, "epoch": 2729} {"train_loss": -43.25828170776367, "global_step": 330264, "epoch": 2729} {"train_loss": -42.8018798828125, "global_step": 330265, "epoch": 2729} {"train_loss": -42.73508834838867, "global_step": 330266, "epoch": 2729} {"train_loss": -41.341094970703125, "global_step": 330267, "epoch": 2729} {"train_loss": -42.00265121459961, "global_step": 330268, "epoch": 2729} {"train_loss": -42.5413932800293, "global_step": 330269, "epoch": 2729} {"train_loss": -41.61707305908203, "global_step": 330270, "epoch": 2729} {"train_loss": -42.76130294799805, "global_step": 330271, "epoch": 2729} {"train_loss": -42.62877655029297, "global_step": 330272, "epoch": 2729} {"train_loss": -41.961978912353516, "global_step": 330273, "epoch": 2729} {"train_loss": -41.76873779296875, "global_step": 330274, "epoch": 2729} {"train_loss": -42.156551361083984, "global_step": 330275, "epoch": 2729} {"train_loss": -41.6630859375, "global_step": 330276, "epoch": 2729} {"train_loss": -42.24575424194336, "global_step": 330277, "epoch": 2729} {"train_loss": -42.00498580932617, "global_step": 330278, "epoch": 2729} {"train_loss": -40.9824104309082, "global_step": 330279, "epoch": 2729} {"train_loss": -39.63965606689453, "global_step": 330280, "epoch": 2729} {"train_loss": -42.46345901489258, "global_step": 330281, "epoch": 2729} {"train_loss": -39.56317138671875, "global_step": 330282, "epoch": 2729} {"train_loss": -41.33210372924805, "global_step": 330283, "epoch": 2729} {"train_loss": -41.015560150146484, "global_step": 330284, "epoch": 2729} {"train_loss": -40.633602142333984, "global_step": 330285, "epoch": 2729} {"train_loss": -42.34824752807617, "global_step": 330286, "epoch": 2729} {"train_loss": -42.3739128112793, "global_step": 330287, "epoch": 2729} {"train_loss": -42.35431671142578, "global_step": 330288, "epoch": 2729} {"train_loss": -42.32110595703125, "global_step": 330289, "epoch": 2729} {"train_loss": -43.14310836791992, "global_step": 330290, "epoch": 2729} {"train_loss": -42.84627914428711, "global_step": 330291, "epoch": 2729} {"train_loss": -42.561153411865234, "global_step": 330292, "epoch": 2729} {"train_loss": -42.90447998046875, "global_step": 330293, "epoch": 2729} {"train_loss": -42.14406204223633, "global_step": 330294, "epoch": 2729} {"train_loss": -43.0338134765625, "global_step": 330295, "epoch": 2729} {"train_loss": -43.061317443847656, "global_step": 330296, "epoch": 2729} {"train_loss": -42.87498092651367, "global_step": 330297, "epoch": 2729} {"train_loss": -43.77334976196289, "global_step": 330298, "epoch": 2729} {"train_loss": -43.439510345458984, "global_step": 330299, "epoch": 2729} {"train_loss": -43.28389358520508, "global_step": 330300, "epoch": 2729} {"train_loss": -43.348243713378906, "global_step": 330301, "epoch": 2729} {"train_loss": -43.26346969604492, "global_step": 330302, "epoch": 2729} {"train_loss": -44.25355911254883, "global_step": 330303, "epoch": 2729} {"train_loss": -43.18701934814453, "global_step": 330304, "epoch": 2729} {"train_loss": -44.370147705078125, "global_step": 330305, "epoch": 2729} {"train_loss": -43.710594177246094, "global_step": 330306, "epoch": 2729} {"train_loss": -44.0036506652832, "global_step": 330307, "epoch": 2729} {"train_loss": -44.36246871948242, "global_step": 330308, "epoch": 2729} {"train_loss": -44.298118591308594, "global_step": 330309, "epoch": 2729} {"train_loss": -44.318359375, "global_step": 330310, "epoch": 2729} {"train_loss": -44.19657516479492, "global_step": 330311, "epoch": 2729} {"train_loss": -44.14209747314453, "global_step": 330312, "epoch": 2729} {"train_loss": -44.3211784362793, "global_step": 330313, "epoch": 2729} {"train_loss": -43.98762130737305, "global_step": 330314, "epoch": 2729} {"train_loss": -44.082740783691406, "global_step": 330315, "epoch": 2729} {"train_loss": -44.57229232788086, "global_step": 330316, "epoch": 2729} {"train_loss": -44.649349212646484, "global_step": 330317, "epoch": 2729} {"train_loss": -44.2718620300293, "global_step": 330318, "epoch": 2729} {"train_loss": -44.4265251159668, "global_step": 330319, "epoch": 2729} {"train_loss": -44.58526611328125, "global_step": 330320, "epoch": 2729} {"train_loss": -44.33746337890625, "global_step": 330321, "epoch": 2729} {"train_loss": -44.891544342041016, "global_step": 330322, "epoch": 2729} {"train_loss": -44.84550857543945, "global_step": 330323, "epoch": 2729} {"train_loss": -44.81252670288086, "global_step": 330324, "epoch": 2729} {"train_loss": -44.57550048828125, "global_step": 330325, "epoch": 2729} {"train_loss": -44.68651580810547, "global_step": 330326, "epoch": 2729} {"train_loss": -44.15989303588867, "global_step": 330327, "epoch": 2729} {"train_loss": -44.8669319152832, "global_step": 330328, "epoch": 2729} {"train_loss": -43.18028527251945, "global_step": 330329, "epoch": 2729, "val_loss": 2428039.75} {"train_loss": -44.73738479614258, "global_step": 330330, "epoch": 2730} {"train_loss": -44.602027893066406, "global_step": 330331, "epoch": 2730} {"train_loss": -44.420265197753906, "global_step": 330332, "epoch": 2730} {"train_loss": -44.8104362487793, "global_step": 330333, "epoch": 2730} {"train_loss": -44.354000091552734, "global_step": 330334, "epoch": 2730} {"train_loss": -44.75716018676758, "global_step": 330335, "epoch": 2730} {"train_loss": -44.89400863647461, "global_step": 330336, "epoch": 2730} {"train_loss": -44.704002380371094, "global_step": 330337, "epoch": 2730} {"train_loss": -44.86627960205078, "global_step": 330338, "epoch": 2730} {"train_loss": -44.91975021362305, "global_step": 330339, "epoch": 2730} {"train_loss": -44.163326263427734, "global_step": 330340, "epoch": 2730} {"train_loss": -44.4942512512207, "global_step": 330341, "epoch": 2730} {"train_loss": -45.04488754272461, "global_step": 330342, "epoch": 2730} {"train_loss": -44.814117431640625, "global_step": 330343, "epoch": 2730} {"train_loss": -44.80248260498047, "global_step": 330344, "epoch": 2730} {"train_loss": -44.931522369384766, "global_step": 330345, "epoch": 2730} {"train_loss": -43.92695999145508, "global_step": 330346, "epoch": 2730} {"train_loss": -44.78855514526367, "global_step": 330347, "epoch": 2730} {"train_loss": -44.47357940673828, "global_step": 330348, "epoch": 2730} {"train_loss": -44.70705795288086, "global_step": 330349, "epoch": 2730} {"train_loss": -44.93486404418945, "global_step": 330350, "epoch": 2730} {"train_loss": -44.04623031616211, "global_step": 330351, "epoch": 2730} {"train_loss": -44.74287796020508, "global_step": 330352, "epoch": 2730} {"train_loss": -45.23332595825195, "global_step": 330353, "epoch": 2730} {"train_loss": -45.130523681640625, "global_step": 330354, "epoch": 2730} {"train_loss": -44.264835357666016, "global_step": 330355, "epoch": 2730} {"train_loss": -45.06980514526367, "global_step": 330356, "epoch": 2730} {"train_loss": -44.70591354370117, "global_step": 330357, "epoch": 2730} {"train_loss": -44.467227935791016, "global_step": 330358, "epoch": 2730} {"train_loss": -44.38014602661133, "global_step": 330359, "epoch": 2730} {"train_loss": -43.70512771606445, "global_step": 330360, "epoch": 2730} {"train_loss": -44.22121047973633, "global_step": 330361, "epoch": 2730} {"train_loss": -43.822261810302734, "global_step": 330362, "epoch": 2730} {"train_loss": -41.85244369506836, "global_step": 330363, "epoch": 2730} {"train_loss": -39.33130645751953, "global_step": 330364, "epoch": 2730} {"train_loss": -34.449947357177734, "global_step": 330365, "epoch": 2730} {"train_loss": -34.66164016723633, "global_step": 330366, "epoch": 2730} {"train_loss": -37.32160568237305, "global_step": 330367, "epoch": 2730} {"train_loss": -40.218257904052734, "global_step": 330368, "epoch": 2730} {"train_loss": -41.357059478759766, "global_step": 330369, "epoch": 2730} {"train_loss": -36.411495208740234, "global_step": 330370, "epoch": 2730} {"train_loss": -38.52058792114258, "global_step": 330371, "epoch": 2730} {"train_loss": -41.606781005859375, "global_step": 330372, "epoch": 2730} {"train_loss": -40.35356521606445, "global_step": 330373, "epoch": 2730} {"train_loss": -41.17658615112305, "global_step": 330374, "epoch": 2730} {"train_loss": -41.96353530883789, "global_step": 330375, "epoch": 2730} {"train_loss": -40.9716682434082, "global_step": 330376, "epoch": 2730} {"train_loss": -41.357418060302734, "global_step": 330377, "epoch": 2730} {"train_loss": -42.69814682006836, "global_step": 330378, "epoch": 2730} {"train_loss": -41.48201370239258, "global_step": 330379, "epoch": 2730} {"train_loss": -42.988037109375, "global_step": 330380, "epoch": 2730} {"train_loss": -42.441619873046875, "global_step": 330381, "epoch": 2730} {"train_loss": -43.05537033081055, "global_step": 330382, "epoch": 2730} {"train_loss": -43.20710372924805, "global_step": 330383, "epoch": 2730} {"train_loss": -42.6410026550293, "global_step": 330384, "epoch": 2730} {"train_loss": -43.005584716796875, "global_step": 330385, "epoch": 2730} {"train_loss": -43.13682174682617, "global_step": 330386, "epoch": 2730} {"train_loss": -43.47711944580078, "global_step": 330387, "epoch": 2730} {"train_loss": -42.416648864746094, "global_step": 330388, "epoch": 2730} {"train_loss": -43.185787200927734, "global_step": 330389, "epoch": 2730} {"train_loss": -42.75014877319336, "global_step": 330390, "epoch": 2730} {"train_loss": -43.30339050292969, "global_step": 330391, "epoch": 2730} {"train_loss": -43.05998229980469, "global_step": 330392, "epoch": 2730} {"train_loss": -43.06144332885742, "global_step": 330393, "epoch": 2730} {"train_loss": -43.756500244140625, "global_step": 330394, "epoch": 2730} {"train_loss": -43.42613220214844, "global_step": 330395, "epoch": 2730} {"train_loss": -43.932586669921875, "global_step": 330396, "epoch": 2730} {"train_loss": -43.82442092895508, "global_step": 330397, "epoch": 2730} {"train_loss": -43.88294982910156, "global_step": 330398, "epoch": 2730} {"train_loss": -43.669124603271484, "global_step": 330399, "epoch": 2730} {"train_loss": -44.13351058959961, "global_step": 330400, "epoch": 2730} {"train_loss": -43.64585494995117, "global_step": 330401, "epoch": 2730} {"train_loss": -44.26702880859375, "global_step": 330402, "epoch": 2730} {"train_loss": -44.082969665527344, "global_step": 330403, "epoch": 2730} {"train_loss": -44.24078369140625, "global_step": 330404, "epoch": 2730} {"train_loss": -44.256587982177734, "global_step": 330405, "epoch": 2730} {"train_loss": -44.16032028198242, "global_step": 330406, "epoch": 2730} {"train_loss": -44.361446380615234, "global_step": 330407, "epoch": 2730} {"train_loss": -44.40338134765625, "global_step": 330408, "epoch": 2730} {"train_loss": -44.0826301574707, "global_step": 330409, "epoch": 2730} {"train_loss": -44.17255783081055, "global_step": 330410, "epoch": 2730} {"train_loss": -44.22999954223633, "global_step": 330411, "epoch": 2730} {"train_loss": -44.16689682006836, "global_step": 330412, "epoch": 2730} {"train_loss": -44.21820068359375, "global_step": 330413, "epoch": 2730} {"train_loss": -43.95878219604492, "global_step": 330414, "epoch": 2730} {"train_loss": -44.62444305419922, "global_step": 330415, "epoch": 2730} {"train_loss": -44.011077880859375, "global_step": 330416, "epoch": 2730} {"train_loss": -44.82521438598633, "global_step": 330417, "epoch": 2730} {"train_loss": -44.73836898803711, "global_step": 330418, "epoch": 2730} {"train_loss": -44.829341888427734, "global_step": 330419, "epoch": 2730} {"train_loss": -44.636077880859375, "global_step": 330420, "epoch": 2730} {"train_loss": -44.72504806518555, "global_step": 330421, "epoch": 2730} {"train_loss": -44.68092727661133, "global_step": 330422, "epoch": 2730} {"train_loss": -44.546661376953125, "global_step": 330423, "epoch": 2730} {"train_loss": -44.48722457885742, "global_step": 330424, "epoch": 2730} {"train_loss": -44.675392150878906, "global_step": 330425, "epoch": 2730} {"train_loss": -45.27120590209961, "global_step": 330426, "epoch": 2730} {"train_loss": -45.033851623535156, "global_step": 330427, "epoch": 2730} {"train_loss": -44.864723205566406, "global_step": 330428, "epoch": 2730} {"train_loss": -45.00127029418945, "global_step": 330429, "epoch": 2730} {"train_loss": -45.11773681640625, "global_step": 330430, "epoch": 2730} {"train_loss": -45.168636322021484, "global_step": 330431, "epoch": 2730} {"train_loss": -44.67413330078125, "global_step": 330432, "epoch": 2730} {"train_loss": -45.36910629272461, "global_step": 330433, "epoch": 2730} {"train_loss": -45.11757278442383, "global_step": 330434, "epoch": 2730} {"train_loss": -45.04058074951172, "global_step": 330435, "epoch": 2730} {"train_loss": -45.06341552734375, "global_step": 330436, "epoch": 2730} {"train_loss": -44.72861862182617, "global_step": 330437, "epoch": 2730} {"train_loss": -44.859554290771484, "global_step": 330438, "epoch": 2730} {"train_loss": -45.10866165161133, "global_step": 330439, "epoch": 2730} {"train_loss": -45.62821578979492, "global_step": 330440, "epoch": 2730} {"train_loss": -44.644927978515625, "global_step": 330441, "epoch": 2730} {"train_loss": -44.678802490234375, "global_step": 330442, "epoch": 2730} {"train_loss": -44.375972747802734, "global_step": 330443, "epoch": 2730} {"train_loss": -44.88185119628906, "global_step": 330444, "epoch": 2730} {"train_loss": -45.20798873901367, "global_step": 330445, "epoch": 2730} {"train_loss": -45.129539489746094, "global_step": 330446, "epoch": 2730} {"train_loss": -44.9514045715332, "global_step": 330447, "epoch": 2730} {"train_loss": -45.55500411987305, "global_step": 330448, "epoch": 2730} {"train_loss": -45.09001159667969, "global_step": 330449, "epoch": 2730} {"train_loss": -43.72436422552944, "global_step": 330450, "epoch": 2730, "val_loss": 2591654.0} {"train_loss": -44.64944076538086, "global_step": 330451, "epoch": 2731} {"train_loss": -45.455177307128906, "global_step": 330452, "epoch": 2731} {"train_loss": -45.08346939086914, "global_step": 330453, "epoch": 2731} {"train_loss": -45.34454345703125, "global_step": 330454, "epoch": 2731} {"train_loss": -45.203582763671875, "global_step": 330455, "epoch": 2731} {"train_loss": -43.92472457885742, "global_step": 330456, "epoch": 2731} {"train_loss": -44.76343536376953, "global_step": 330457, "epoch": 2731} {"train_loss": -44.7978630065918, "global_step": 330458, "epoch": 2731} {"train_loss": -44.43610763549805, "global_step": 330459, "epoch": 2731} {"train_loss": -44.137962341308594, "global_step": 330460, "epoch": 2731} {"train_loss": -43.7439079284668, "global_step": 330461, "epoch": 2731} {"train_loss": -42.923133850097656, "global_step": 330462, "epoch": 2731} {"train_loss": -40.326595306396484, "global_step": 330463, "epoch": 2731} {"train_loss": -38.90549850463867, "global_step": 330464, "epoch": 2731} {"train_loss": -41.251094818115234, "global_step": 330465, "epoch": 2731} {"train_loss": -44.12251663208008, "global_step": 330466, "epoch": 2731} {"train_loss": -43.84566879272461, "global_step": 330467, "epoch": 2731} {"train_loss": -42.011932373046875, "global_step": 330468, "epoch": 2731} {"train_loss": -42.967464447021484, "global_step": 330469, "epoch": 2731} {"train_loss": -44.3555908203125, "global_step": 330470, "epoch": 2731} {"train_loss": -41.7838134765625, "global_step": 330471, "epoch": 2731} {"train_loss": -40.66482162475586, "global_step": 330472, "epoch": 2731} {"train_loss": -43.17171096801758, "global_step": 330473, "epoch": 2731} {"train_loss": -42.932308197021484, "global_step": 330474, "epoch": 2731} {"train_loss": -41.58191680908203, "global_step": 330475, "epoch": 2731} {"train_loss": -43.01690673828125, "global_step": 330476, "epoch": 2731} {"train_loss": -43.00384521484375, "global_step": 330477, "epoch": 2731} {"train_loss": -42.067169189453125, "global_step": 330478, "epoch": 2731} {"train_loss": -41.05148696899414, "global_step": 330479, "epoch": 2731} {"train_loss": -41.156150817871094, "global_step": 330480, "epoch": 2731} {"train_loss": -41.977787017822266, "global_step": 330481, "epoch": 2731} {"train_loss": -38.73934555053711, "global_step": 330482, "epoch": 2731} {"train_loss": -39.93268966674805, "global_step": 330483, "epoch": 2731} {"train_loss": -43.00675582885742, "global_step": 330484, "epoch": 2731} {"train_loss": -42.24441909790039, "global_step": 330485, "epoch": 2731} {"train_loss": -38.91621780395508, "global_step": 330486, "epoch": 2731} {"train_loss": -41.673519134521484, "global_step": 330487, "epoch": 2731} {"train_loss": -42.5637321472168, "global_step": 330488, "epoch": 2731} {"train_loss": -42.75531768798828, "global_step": 330489, "epoch": 2731} {"train_loss": -42.987098693847656, "global_step": 330490, "epoch": 2731} {"train_loss": -43.36042404174805, "global_step": 330491, "epoch": 2731} {"train_loss": -43.2618522644043, "global_step": 330492, "epoch": 2731} {"train_loss": -43.9317741394043, "global_step": 330493, "epoch": 2731} {"train_loss": -43.96672821044922, "global_step": 330494, "epoch": 2731} {"train_loss": -43.784210205078125, "global_step": 330495, "epoch": 2731} {"train_loss": -43.63353729248047, "global_step": 330496, "epoch": 2731} {"train_loss": -43.79833984375, "global_step": 330497, "epoch": 2731} {"train_loss": -44.21950149536133, "global_step": 330498, "epoch": 2731} {"train_loss": -43.6889533996582, "global_step": 330499, "epoch": 2731} {"train_loss": -44.18219757080078, "global_step": 330500, "epoch": 2731} {"train_loss": -43.90785598754883, "global_step": 330501, "epoch": 2731} {"train_loss": -43.945247650146484, "global_step": 330502, "epoch": 2731} {"train_loss": -43.97895050048828, "global_step": 330503, "epoch": 2731} {"train_loss": -43.76169204711914, "global_step": 330504, "epoch": 2731} {"train_loss": -43.89046096801758, "global_step": 330505, "epoch": 2731} {"train_loss": -44.09280776977539, "global_step": 330506, "epoch": 2731} {"train_loss": -44.4516487121582, "global_step": 330507, "epoch": 2731} {"train_loss": -44.1407356262207, "global_step": 330508, "epoch": 2731} {"train_loss": -44.55109786987305, "global_step": 330509, "epoch": 2731} {"train_loss": -44.151851654052734, "global_step": 330510, "epoch": 2731} {"train_loss": -44.29909896850586, "global_step": 330511, "epoch": 2731} {"train_loss": -44.39583206176758, "global_step": 330512, "epoch": 2731} {"train_loss": -43.933692932128906, "global_step": 330513, "epoch": 2731} {"train_loss": -44.4359016418457, "global_step": 330514, "epoch": 2731} {"train_loss": -44.18783950805664, "global_step": 330515, "epoch": 2731} {"train_loss": -43.89348602294922, "global_step": 330516, "epoch": 2731} {"train_loss": -44.38682174682617, "global_step": 330517, "epoch": 2731} {"train_loss": -44.540435791015625, "global_step": 330518, "epoch": 2731} {"train_loss": -44.71681594848633, "global_step": 330519, "epoch": 2731} {"train_loss": -44.203514099121094, "global_step": 330520, "epoch": 2731} {"train_loss": -43.51338577270508, "global_step": 330521, "epoch": 2731} {"train_loss": -44.256011962890625, "global_step": 330522, "epoch": 2731} {"train_loss": -44.792091369628906, "global_step": 330523, "epoch": 2731} {"train_loss": -44.31769943237305, "global_step": 330524, "epoch": 2731} {"train_loss": -44.75504684448242, "global_step": 330525, "epoch": 2731} {"train_loss": -44.584632873535156, "global_step": 330526, "epoch": 2731} {"train_loss": -44.26401901245117, "global_step": 330527, "epoch": 2731} {"train_loss": -44.74456024169922, "global_step": 330528, "epoch": 2731} {"train_loss": -44.38975524902344, "global_step": 330529, "epoch": 2731} {"train_loss": -44.78684616088867, "global_step": 330530, "epoch": 2731} {"train_loss": -44.87559127807617, "global_step": 330531, "epoch": 2731} {"train_loss": -44.15735626220703, "global_step": 330532, "epoch": 2731} {"train_loss": -44.99531173706055, "global_step": 330533, "epoch": 2731} {"train_loss": -44.83768844604492, "global_step": 330534, "epoch": 2731} {"train_loss": -44.90822982788086, "global_step": 330535, "epoch": 2731} {"train_loss": -44.4547119140625, "global_step": 330536, "epoch": 2731} {"train_loss": -44.69881057739258, "global_step": 330537, "epoch": 2731} {"train_loss": -44.39152145385742, "global_step": 330538, "epoch": 2731} {"train_loss": -44.43021774291992, "global_step": 330539, "epoch": 2731} {"train_loss": -44.70895004272461, "global_step": 330540, "epoch": 2731} {"train_loss": -44.6677360534668, "global_step": 330541, "epoch": 2731} {"train_loss": -44.75251388549805, "global_step": 330542, "epoch": 2731} {"train_loss": -44.70931625366211, "global_step": 330543, "epoch": 2731} {"train_loss": -45.215518951416016, "global_step": 330544, "epoch": 2731} {"train_loss": -45.073482513427734, "global_step": 330545, "epoch": 2731} {"train_loss": -44.9467887878418, "global_step": 330546, "epoch": 2731} {"train_loss": -44.496803283691406, "global_step": 330547, "epoch": 2731} {"train_loss": -44.520206451416016, "global_step": 330548, "epoch": 2731} {"train_loss": -45.04813766479492, "global_step": 330549, "epoch": 2731} {"train_loss": -44.17934036254883, "global_step": 330550, "epoch": 2731} {"train_loss": -44.5147705078125, "global_step": 330551, "epoch": 2731} {"train_loss": -44.90720748901367, "global_step": 330552, "epoch": 2731} {"train_loss": -44.47384262084961, "global_step": 330553, "epoch": 2731} {"train_loss": -44.77288055419922, "global_step": 330554, "epoch": 2731} {"train_loss": -43.9648323059082, "global_step": 330555, "epoch": 2731} {"train_loss": -44.71894454956055, "global_step": 330556, "epoch": 2731} {"train_loss": -44.75679397583008, "global_step": 330557, "epoch": 2731} {"train_loss": -44.349945068359375, "global_step": 330558, "epoch": 2731} {"train_loss": -43.89582824707031, "global_step": 330559, "epoch": 2731} {"train_loss": -44.71149826049805, "global_step": 330560, "epoch": 2731} {"train_loss": -44.88538360595703, "global_step": 330561, "epoch": 2731} {"train_loss": -44.05709457397461, "global_step": 330562, "epoch": 2731} {"train_loss": -44.28449630737305, "global_step": 330563, "epoch": 2731} {"train_loss": -45.0081672668457, "global_step": 330564, "epoch": 2731} {"train_loss": -44.02300262451172, "global_step": 330565, "epoch": 2731} {"train_loss": -44.0231819152832, "global_step": 330566, "epoch": 2731} {"train_loss": -44.31710433959961, "global_step": 330567, "epoch": 2731} {"train_loss": -45.3782844543457, "global_step": 330568, "epoch": 2731} {"train_loss": -44.290626525878906, "global_step": 330569, "epoch": 2731} {"train_loss": -44.672576904296875, "global_step": 330570, "epoch": 2731} {"train_loss": -43.82502746582031, "global_step": 330571, "epoch": 2731, "val_loss": 2430480.25} {"train_loss": -44.66108322143555, "global_step": 330572, "epoch": 2732} {"train_loss": -45.2132453918457, "global_step": 330573, "epoch": 2732} {"train_loss": -44.36423873901367, "global_step": 330574, "epoch": 2732} {"train_loss": -44.07030487060547, "global_step": 330575, "epoch": 2732} {"train_loss": -43.124324798583984, "global_step": 330576, "epoch": 2732} {"train_loss": -44.184112548828125, "global_step": 330577, "epoch": 2732} {"train_loss": -45.28192901611328, "global_step": 330578, "epoch": 2732} {"train_loss": -44.017547607421875, "global_step": 330579, "epoch": 2732} {"train_loss": -44.06907272338867, "global_step": 330580, "epoch": 2732} {"train_loss": -44.2653694152832, "global_step": 330581, "epoch": 2732} {"train_loss": -44.397579193115234, "global_step": 330582, "epoch": 2732} {"train_loss": -44.11878204345703, "global_step": 330583, "epoch": 2732} {"train_loss": -43.8408203125, "global_step": 330584, "epoch": 2732} {"train_loss": -44.90283966064453, "global_step": 330585, "epoch": 2732} {"train_loss": -44.45820999145508, "global_step": 330586, "epoch": 2732} {"train_loss": -43.874671936035156, "global_step": 330587, "epoch": 2732} {"train_loss": -44.19551467895508, "global_step": 330588, "epoch": 2732} {"train_loss": -44.05121994018555, "global_step": 330589, "epoch": 2732} {"train_loss": -44.03940963745117, "global_step": 330590, "epoch": 2732} {"train_loss": -42.8702507019043, "global_step": 330591, "epoch": 2732} {"train_loss": -41.925819396972656, "global_step": 330592, "epoch": 2732} {"train_loss": -42.79688262939453, "global_step": 330593, "epoch": 2732} {"train_loss": -44.265743255615234, "global_step": 330594, "epoch": 2732} {"train_loss": -43.625423431396484, "global_step": 330595, "epoch": 2732} {"train_loss": -43.25046157836914, "global_step": 330596, "epoch": 2732} {"train_loss": -43.912837982177734, "global_step": 330597, "epoch": 2732} {"train_loss": -44.645790100097656, "global_step": 330598, "epoch": 2732} {"train_loss": -43.1510124206543, "global_step": 330599, "epoch": 2732} {"train_loss": -42.59089279174805, "global_step": 330600, "epoch": 2732} {"train_loss": -43.41914749145508, "global_step": 330601, "epoch": 2732} {"train_loss": -42.61322784423828, "global_step": 330602, "epoch": 2732} {"train_loss": -44.02766036987305, "global_step": 330603, "epoch": 2732} {"train_loss": -42.6986083984375, "global_step": 330604, "epoch": 2732} {"train_loss": -41.625423431396484, "global_step": 330605, "epoch": 2732} {"train_loss": -40.035037994384766, "global_step": 330606, "epoch": 2732} {"train_loss": -42.09699249267578, "global_step": 330607, "epoch": 2732} {"train_loss": -42.04536056518555, "global_step": 330608, "epoch": 2732} {"train_loss": -42.74211120605469, "global_step": 330609, "epoch": 2732} {"train_loss": -41.83681869506836, "global_step": 330610, "epoch": 2732} {"train_loss": -41.70667266845703, "global_step": 330611, "epoch": 2732} {"train_loss": -42.814048767089844, "global_step": 330612, "epoch": 2732} {"train_loss": -43.79329299926758, "global_step": 330613, "epoch": 2732} {"train_loss": -42.87565994262695, "global_step": 330614, "epoch": 2732} {"train_loss": -43.497039794921875, "global_step": 330615, "epoch": 2732} {"train_loss": -42.788665771484375, "global_step": 330616, "epoch": 2732} {"train_loss": -41.21576690673828, "global_step": 330617, "epoch": 2732} {"train_loss": -41.781219482421875, "global_step": 330618, "epoch": 2732} {"train_loss": -42.42279052734375, "global_step": 330619, "epoch": 2732} {"train_loss": -42.83753204345703, "global_step": 330620, "epoch": 2732} {"train_loss": -42.62614059448242, "global_step": 330621, "epoch": 2732} {"train_loss": -42.926998138427734, "global_step": 330622, "epoch": 2732} {"train_loss": -42.76043701171875, "global_step": 330623, "epoch": 2732} {"train_loss": -43.216888427734375, "global_step": 330624, "epoch": 2732} {"train_loss": -43.06815719604492, "global_step": 330625, "epoch": 2732} {"train_loss": -42.23079299926758, "global_step": 330626, "epoch": 2732} {"train_loss": -43.24857711791992, "global_step": 330627, "epoch": 2732} {"train_loss": -43.794471740722656, "global_step": 330628, "epoch": 2732} {"train_loss": -43.32938003540039, "global_step": 330629, "epoch": 2732} {"train_loss": -44.2525634765625, "global_step": 330630, "epoch": 2732} {"train_loss": -44.012603759765625, "global_step": 330631, "epoch": 2732} {"train_loss": -43.32735061645508, "global_step": 330632, "epoch": 2732} {"train_loss": -43.996734619140625, "global_step": 330633, "epoch": 2732} {"train_loss": -43.71236801147461, "global_step": 330634, "epoch": 2732} {"train_loss": -43.40019607543945, "global_step": 330635, "epoch": 2732} {"train_loss": -43.52225875854492, "global_step": 330636, "epoch": 2732} {"train_loss": -44.52939987182617, "global_step": 330637, "epoch": 2732} {"train_loss": -43.88725662231445, "global_step": 330638, "epoch": 2732} {"train_loss": -43.51266098022461, "global_step": 330639, "epoch": 2732} {"train_loss": -43.39613342285156, "global_step": 330640, "epoch": 2732} {"train_loss": -42.771358489990234, "global_step": 330641, "epoch": 2732} {"train_loss": -43.858917236328125, "global_step": 330642, "epoch": 2732} {"train_loss": -43.74251937866211, "global_step": 330643, "epoch": 2732} {"train_loss": -44.540889739990234, "global_step": 330644, "epoch": 2732} {"train_loss": -43.93937301635742, "global_step": 330645, "epoch": 2732} {"train_loss": -42.383766174316406, "global_step": 330646, "epoch": 2732} {"train_loss": -43.495994567871094, "global_step": 330647, "epoch": 2732} {"train_loss": -44.14871597290039, "global_step": 330648, "epoch": 2732} {"train_loss": -43.717369079589844, "global_step": 330649, "epoch": 2732} {"train_loss": -43.169795989990234, "global_step": 330650, "epoch": 2732} {"train_loss": -44.01152420043945, "global_step": 330651, "epoch": 2732} {"train_loss": -43.003700256347656, "global_step": 330652, "epoch": 2732} {"train_loss": -43.672828674316406, "global_step": 330653, "epoch": 2732} {"train_loss": -43.79085922241211, "global_step": 330654, "epoch": 2732} {"train_loss": -44.21955490112305, "global_step": 330655, "epoch": 2732} {"train_loss": -43.890663146972656, "global_step": 330656, "epoch": 2732} {"train_loss": -43.57931137084961, "global_step": 330657, "epoch": 2732} {"train_loss": -44.4830207824707, "global_step": 330658, "epoch": 2732} {"train_loss": -43.93976593017578, "global_step": 330659, "epoch": 2732} {"train_loss": -44.419708251953125, "global_step": 330660, "epoch": 2732} {"train_loss": -43.79622268676758, "global_step": 330661, "epoch": 2732} {"train_loss": -44.24509811401367, "global_step": 330662, "epoch": 2732} {"train_loss": -44.609195709228516, "global_step": 330663, "epoch": 2732} {"train_loss": -44.466548919677734, "global_step": 330664, "epoch": 2732} {"train_loss": -44.19327926635742, "global_step": 330665, "epoch": 2732} {"train_loss": -44.28668975830078, "global_step": 330666, "epoch": 2732} {"train_loss": -43.552982330322266, "global_step": 330667, "epoch": 2732} {"train_loss": -44.60313034057617, "global_step": 330668, "epoch": 2732} {"train_loss": -43.62189483642578, "global_step": 330669, "epoch": 2732} {"train_loss": -43.2945556640625, "global_step": 330670, "epoch": 2732} {"train_loss": -43.20313262939453, "global_step": 330671, "epoch": 2732} {"train_loss": -43.05613327026367, "global_step": 330672, "epoch": 2732} {"train_loss": -44.284027099609375, "global_step": 330673, "epoch": 2732} {"train_loss": -43.2994384765625, "global_step": 330674, "epoch": 2732} {"train_loss": -43.788204193115234, "global_step": 330675, "epoch": 2732} {"train_loss": -43.16850662231445, "global_step": 330676, "epoch": 2732} {"train_loss": -44.14482116699219, "global_step": 330677, "epoch": 2732} {"train_loss": -43.964229583740234, "global_step": 330678, "epoch": 2732} {"train_loss": -42.5871696472168, "global_step": 330679, "epoch": 2732} {"train_loss": -43.95668029785156, "global_step": 330680, "epoch": 2732} {"train_loss": -44.348304748535156, "global_step": 330681, "epoch": 2732} {"train_loss": -44.0872688293457, "global_step": 330682, "epoch": 2732} {"train_loss": -43.63764190673828, "global_step": 330683, "epoch": 2732} {"train_loss": -45.155426025390625, "global_step": 330684, "epoch": 2732} {"train_loss": -43.974998474121094, "global_step": 330685, "epoch": 2732} {"train_loss": -44.287899017333984, "global_step": 330686, "epoch": 2732} {"train_loss": -44.26917266845703, "global_step": 330687, "epoch": 2732} {"train_loss": -44.65328598022461, "global_step": 330688, "epoch": 2732} {"train_loss": -44.765071868896484, "global_step": 330689, "epoch": 2732} {"train_loss": -44.35860061645508, "global_step": 330690, "epoch": 2732} {"train_loss": -44.624786376953125, "global_step": 330691, "epoch": 2732} {"train_loss": -43.59223745677097, "global_step": 330692, "epoch": 2732, "val_loss": 2404248.75} {"train_loss": -44.5379753112793, "global_step": 330693, "epoch": 2733} {"train_loss": -44.081199645996094, "global_step": 330694, "epoch": 2733} {"train_loss": -43.802955627441406, "global_step": 330695, "epoch": 2733} {"train_loss": -44.611358642578125, "global_step": 330696, "epoch": 2733} {"train_loss": -43.76810836791992, "global_step": 330697, "epoch": 2733} {"train_loss": -43.7611198425293, "global_step": 330698, "epoch": 2733} {"train_loss": -43.307308197021484, "global_step": 330699, "epoch": 2733} {"train_loss": -43.626651763916016, "global_step": 330700, "epoch": 2733} {"train_loss": -43.656829833984375, "global_step": 330701, "epoch": 2733} {"train_loss": -43.564334869384766, "global_step": 330702, "epoch": 2733} {"train_loss": -43.732810974121094, "global_step": 330703, "epoch": 2733} {"train_loss": -41.758079528808594, "global_step": 330704, "epoch": 2733} {"train_loss": -43.0573844909668, "global_step": 330705, "epoch": 2733} {"train_loss": -42.37086486816406, "global_step": 330706, "epoch": 2733} {"train_loss": -41.466609954833984, "global_step": 330707, "epoch": 2733} {"train_loss": -41.05877685546875, "global_step": 330708, "epoch": 2733} {"train_loss": -43.24815368652344, "global_step": 330709, "epoch": 2733} {"train_loss": -40.63559341430664, "global_step": 330710, "epoch": 2733} {"train_loss": -40.4833984375, "global_step": 330711, "epoch": 2733} {"train_loss": -42.147769927978516, "global_step": 330712, "epoch": 2733} {"train_loss": -40.18505859375, "global_step": 330713, "epoch": 2733} {"train_loss": -41.305328369140625, "global_step": 330714, "epoch": 2733} {"train_loss": -41.34110641479492, "global_step": 330715, "epoch": 2733} {"train_loss": -41.413414001464844, "global_step": 330716, "epoch": 2733} {"train_loss": -40.7258415222168, "global_step": 330717, "epoch": 2733} {"train_loss": -41.976993560791016, "global_step": 330718, "epoch": 2733} {"train_loss": -42.11167907714844, "global_step": 330719, "epoch": 2733} {"train_loss": -42.06333541870117, "global_step": 330720, "epoch": 2733} {"train_loss": -42.46212387084961, "global_step": 330721, "epoch": 2733} {"train_loss": -43.76294708251953, "global_step": 330722, "epoch": 2733} {"train_loss": -41.1282844543457, "global_step": 330723, "epoch": 2733} {"train_loss": -43.27995300292969, "global_step": 330724, "epoch": 2733} {"train_loss": -42.660728454589844, "global_step": 330725, "epoch": 2733} {"train_loss": -42.54985427856445, "global_step": 330726, "epoch": 2733} {"train_loss": -43.28116989135742, "global_step": 330727, "epoch": 2733} {"train_loss": -43.712955474853516, "global_step": 330728, "epoch": 2733} {"train_loss": -43.3005485534668, "global_step": 330729, "epoch": 2733} {"train_loss": -42.935909271240234, "global_step": 330730, "epoch": 2733} {"train_loss": -43.06322479248047, "global_step": 330731, "epoch": 2733} {"train_loss": -43.550228118896484, "global_step": 330732, "epoch": 2733} {"train_loss": -44.10810089111328, "global_step": 330733, "epoch": 2733} {"train_loss": -43.227474212646484, "global_step": 330734, "epoch": 2733} {"train_loss": -44.04568099975586, "global_step": 330735, "epoch": 2733} {"train_loss": -42.77667236328125, "global_step": 330736, "epoch": 2733} {"train_loss": -44.0915412902832, "global_step": 330737, "epoch": 2733} {"train_loss": -43.1062126159668, "global_step": 330738, "epoch": 2733} {"train_loss": -43.94068145751953, "global_step": 330739, "epoch": 2733} {"train_loss": -44.3079833984375, "global_step": 330740, "epoch": 2733} {"train_loss": -43.56325912475586, "global_step": 330741, "epoch": 2733} {"train_loss": -44.75666046142578, "global_step": 330742, "epoch": 2733} {"train_loss": -43.68441390991211, "global_step": 330743, "epoch": 2733} {"train_loss": -44.267120361328125, "global_step": 330744, "epoch": 2733} {"train_loss": -43.1387825012207, "global_step": 330745, "epoch": 2733} {"train_loss": -44.14601516723633, "global_step": 330746, "epoch": 2733} {"train_loss": -44.12078857421875, "global_step": 330747, "epoch": 2733} {"train_loss": -44.03629684448242, "global_step": 330748, "epoch": 2733} {"train_loss": -44.352455139160156, "global_step": 330749, "epoch": 2733} {"train_loss": -44.414791107177734, "global_step": 330750, "epoch": 2733} {"train_loss": -44.880435943603516, "global_step": 330751, "epoch": 2733} {"train_loss": -43.310482025146484, "global_step": 330752, "epoch": 2733} {"train_loss": -44.77436447143555, "global_step": 330753, "epoch": 2733} {"train_loss": -44.72612380981445, "global_step": 330754, "epoch": 2733} {"train_loss": -44.59772491455078, "global_step": 330755, "epoch": 2733} {"train_loss": -44.87775421142578, "global_step": 330756, "epoch": 2733} {"train_loss": -44.68558120727539, "global_step": 330757, "epoch": 2733} {"train_loss": -44.7910270690918, "global_step": 330758, "epoch": 2733} {"train_loss": -45.1533317565918, "global_step": 330759, "epoch": 2733} {"train_loss": -44.99696731567383, "global_step": 330760, "epoch": 2733} {"train_loss": -44.82284927368164, "global_step": 330761, "epoch": 2733} {"train_loss": -44.922035217285156, "global_step": 330762, "epoch": 2733} {"train_loss": -45.15961837768555, "global_step": 330763, "epoch": 2733} {"train_loss": -44.67551803588867, "global_step": 330764, "epoch": 2733} {"train_loss": -45.28448486328125, "global_step": 330765, "epoch": 2733} {"train_loss": -44.57657241821289, "global_step": 330766, "epoch": 2733} {"train_loss": -45.157283782958984, "global_step": 330767, "epoch": 2733} {"train_loss": -44.487274169921875, "global_step": 330768, "epoch": 2733} {"train_loss": -45.24282455444336, "global_step": 330769, "epoch": 2733} {"train_loss": -44.744178771972656, "global_step": 330770, "epoch": 2733} {"train_loss": -44.723487854003906, "global_step": 330771, "epoch": 2733} {"train_loss": -45.088653564453125, "global_step": 330772, "epoch": 2733} {"train_loss": -44.77668762207031, "global_step": 330773, "epoch": 2733} {"train_loss": -44.9011116027832, "global_step": 330774, "epoch": 2733} {"train_loss": -45.33681869506836, "global_step": 330775, "epoch": 2733} {"train_loss": -44.802001953125, "global_step": 330776, "epoch": 2733} {"train_loss": -43.774147033691406, "global_step": 330777, "epoch": 2733} {"train_loss": -44.35003662109375, "global_step": 330778, "epoch": 2733} {"train_loss": -44.60573959350586, "global_step": 330779, "epoch": 2733} {"train_loss": -44.84018325805664, "global_step": 330780, "epoch": 2733} {"train_loss": -43.25344467163086, "global_step": 330781, "epoch": 2733} {"train_loss": -44.53211212158203, "global_step": 330782, "epoch": 2733} {"train_loss": -44.56385803222656, "global_step": 330783, "epoch": 2733} {"train_loss": -44.95283889770508, "global_step": 330784, "epoch": 2733} {"train_loss": -44.663082122802734, "global_step": 330785, "epoch": 2733} {"train_loss": -44.72917556762695, "global_step": 330786, "epoch": 2733} {"train_loss": -43.6932373046875, "global_step": 330787, "epoch": 2733} {"train_loss": -44.04659652709961, "global_step": 330788, "epoch": 2733} {"train_loss": -42.94565963745117, "global_step": 330789, "epoch": 2733} {"train_loss": -44.22675704956055, "global_step": 330790, "epoch": 2733} {"train_loss": -43.480079650878906, "global_step": 330791, "epoch": 2733} {"train_loss": -44.11237335205078, "global_step": 330792, "epoch": 2733} {"train_loss": -43.82267761230469, "global_step": 330793, "epoch": 2733} {"train_loss": -44.94261932373047, "global_step": 330794, "epoch": 2733} {"train_loss": -44.19169235229492, "global_step": 330795, "epoch": 2733} {"train_loss": -44.35082244873047, "global_step": 330796, "epoch": 2733} {"train_loss": -44.48020553588867, "global_step": 330797, "epoch": 2733} {"train_loss": -44.433067321777344, "global_step": 330798, "epoch": 2733} {"train_loss": -44.52358627319336, "global_step": 330799, "epoch": 2733} {"train_loss": -42.99398422241211, "global_step": 330800, "epoch": 2733} {"train_loss": -44.05311965942383, "global_step": 330801, "epoch": 2733} {"train_loss": -44.7154541015625, "global_step": 330802, "epoch": 2733} {"train_loss": -44.25075912475586, "global_step": 330803, "epoch": 2733} {"train_loss": -42.842987060546875, "global_step": 330804, "epoch": 2733} {"train_loss": -43.04410934448242, "global_step": 330805, "epoch": 2733} {"train_loss": -42.79351806640625, "global_step": 330806, "epoch": 2733} {"train_loss": -43.39081954956055, "global_step": 330807, "epoch": 2733} {"train_loss": -44.470279693603516, "global_step": 330808, "epoch": 2733} {"train_loss": -44.694190979003906, "global_step": 330809, "epoch": 2733} {"train_loss": -43.314510345458984, "global_step": 330810, "epoch": 2733} {"train_loss": -43.176918029785156, "global_step": 330811, "epoch": 2733} {"train_loss": -44.30387496948242, "global_step": 330812, "epoch": 2733} {"train_loss": -43.715370083643386, "global_step": 330813, "epoch": 2733, "val_loss": 2516148.0} {"train_loss": -39.81911849975586, "global_step": 330814, "epoch": 2734} {"train_loss": -37.11228561401367, "global_step": 330815, "epoch": 2734} {"train_loss": -37.605560302734375, "global_step": 330816, "epoch": 2734} {"train_loss": -43.18255615234375, "global_step": 330817, "epoch": 2734} {"train_loss": -41.282527923583984, "global_step": 330818, "epoch": 2734} {"train_loss": -37.389305114746094, "global_step": 330819, "epoch": 2734} {"train_loss": -40.89249801635742, "global_step": 330820, "epoch": 2734} {"train_loss": -42.38634490966797, "global_step": 330821, "epoch": 2734} {"train_loss": -42.848609924316406, "global_step": 330822, "epoch": 2734} {"train_loss": -42.64641571044922, "global_step": 330823, "epoch": 2734} {"train_loss": -42.392974853515625, "global_step": 330824, "epoch": 2734} {"train_loss": -42.288509368896484, "global_step": 330825, "epoch": 2734} {"train_loss": -42.07868957519531, "global_step": 330826, "epoch": 2734} {"train_loss": -42.41233444213867, "global_step": 330827, "epoch": 2734} {"train_loss": -41.48493576049805, "global_step": 330828, "epoch": 2734} {"train_loss": -42.481178283691406, "global_step": 330829, "epoch": 2734} {"train_loss": -41.630584716796875, "global_step": 330830, "epoch": 2734} {"train_loss": -42.45341110229492, "global_step": 330831, "epoch": 2734} {"train_loss": -43.50693893432617, "global_step": 330832, "epoch": 2734} {"train_loss": -42.88759231567383, "global_step": 330833, "epoch": 2734} {"train_loss": -43.9739875793457, "global_step": 330834, "epoch": 2734} {"train_loss": -43.46144485473633, "global_step": 330835, "epoch": 2734} {"train_loss": -43.64006423950195, "global_step": 330836, "epoch": 2734} {"train_loss": -43.564491271972656, "global_step": 330837, "epoch": 2734} {"train_loss": -43.1504020690918, "global_step": 330838, "epoch": 2734} {"train_loss": -43.98295974731445, "global_step": 330839, "epoch": 2734} {"train_loss": -43.267940521240234, "global_step": 330840, "epoch": 2734} {"train_loss": -43.923583984375, "global_step": 330841, "epoch": 2734} {"train_loss": -42.893157958984375, "global_step": 330842, "epoch": 2734} {"train_loss": -43.64064407348633, "global_step": 330843, "epoch": 2734} {"train_loss": -44.0566291809082, "global_step": 330844, "epoch": 2734} {"train_loss": -43.59714889526367, "global_step": 330845, "epoch": 2734} {"train_loss": -43.00836944580078, "global_step": 330846, "epoch": 2734} {"train_loss": -43.96427536010742, "global_step": 330847, "epoch": 2734} {"train_loss": -43.58829879760742, "global_step": 330848, "epoch": 2734} {"train_loss": -44.0926628112793, "global_step": 330849, "epoch": 2734} {"train_loss": -44.09369659423828, "global_step": 330850, "epoch": 2734} {"train_loss": -43.9374885559082, "global_step": 330851, "epoch": 2734} {"train_loss": -43.75912094116211, "global_step": 330852, "epoch": 2734} {"train_loss": -44.44203567504883, "global_step": 330853, "epoch": 2734} {"train_loss": -43.7886848449707, "global_step": 330854, "epoch": 2734} {"train_loss": -44.55813217163086, "global_step": 330855, "epoch": 2734} {"train_loss": -44.34969711303711, "global_step": 330856, "epoch": 2734} {"train_loss": -44.487178802490234, "global_step": 330857, "epoch": 2734} {"train_loss": -43.70791244506836, "global_step": 330858, "epoch": 2734} {"train_loss": -44.60769271850586, "global_step": 330859, "epoch": 2734} {"train_loss": -44.70216369628906, "global_step": 330860, "epoch": 2734} {"train_loss": -44.83926773071289, "global_step": 330861, "epoch": 2734} {"train_loss": -44.645809173583984, "global_step": 330862, "epoch": 2734} {"train_loss": -43.78505325317383, "global_step": 330863, "epoch": 2734} {"train_loss": -44.57453918457031, "global_step": 330864, "epoch": 2734} {"train_loss": -44.43888473510742, "global_step": 330865, "epoch": 2734} {"train_loss": -44.587562561035156, "global_step": 330866, "epoch": 2734} {"train_loss": -44.3046989440918, "global_step": 330867, "epoch": 2734} {"train_loss": -43.366973876953125, "global_step": 330868, "epoch": 2734} {"train_loss": -44.75651931762695, "global_step": 330869, "epoch": 2734} {"train_loss": -41.39805221557617, "global_step": 330870, "epoch": 2734} {"train_loss": -42.773983001708984, "global_step": 330871, "epoch": 2734} {"train_loss": -44.4489860534668, "global_step": 330872, "epoch": 2734} {"train_loss": -44.11922836303711, "global_step": 330873, "epoch": 2734} {"train_loss": -43.94045639038086, "global_step": 330874, "epoch": 2734} {"train_loss": -43.461448669433594, "global_step": 330875, "epoch": 2734} {"train_loss": -42.57182693481445, "global_step": 330876, "epoch": 2734} {"train_loss": -44.57674789428711, "global_step": 330877, "epoch": 2734} {"train_loss": -44.46754455566406, "global_step": 330878, "epoch": 2734} {"train_loss": -42.31008529663086, "global_step": 330879, "epoch": 2734} {"train_loss": -41.468467712402344, "global_step": 330880, "epoch": 2734} {"train_loss": -44.20075607299805, "global_step": 330881, "epoch": 2734} {"train_loss": -44.70256423950195, "global_step": 330882, "epoch": 2734} {"train_loss": -43.27582931518555, "global_step": 330883, "epoch": 2734} {"train_loss": -44.63790512084961, "global_step": 330884, "epoch": 2734} {"train_loss": -43.86366653442383, "global_step": 330885, "epoch": 2734} {"train_loss": -44.669898986816406, "global_step": 330886, "epoch": 2734} {"train_loss": -42.546382904052734, "global_step": 330887, "epoch": 2734} {"train_loss": -43.83486557006836, "global_step": 330888, "epoch": 2734} {"train_loss": -44.53499984741211, "global_step": 330889, "epoch": 2734} {"train_loss": -44.486873626708984, "global_step": 330890, "epoch": 2734} {"train_loss": -44.60891342163086, "global_step": 330891, "epoch": 2734} {"train_loss": -44.838653564453125, "global_step": 330892, "epoch": 2734} {"train_loss": -44.176265716552734, "global_step": 330893, "epoch": 2734} {"train_loss": -44.238006591796875, "global_step": 330894, "epoch": 2734} {"train_loss": -44.81673049926758, "global_step": 330895, "epoch": 2734} {"train_loss": -44.50818634033203, "global_step": 330896, "epoch": 2734} {"train_loss": -43.78249740600586, "global_step": 330897, "epoch": 2734} {"train_loss": -44.3104362487793, "global_step": 330898, "epoch": 2734} {"train_loss": -43.18526840209961, "global_step": 330899, "epoch": 2734} {"train_loss": -43.00849533081055, "global_step": 330900, "epoch": 2734} {"train_loss": -44.47672653198242, "global_step": 330901, "epoch": 2734} {"train_loss": -43.433475494384766, "global_step": 330902, "epoch": 2734} {"train_loss": -44.454769134521484, "global_step": 330903, "epoch": 2734} {"train_loss": -43.59001922607422, "global_step": 330904, "epoch": 2734} {"train_loss": -44.214656829833984, "global_step": 330905, "epoch": 2734} {"train_loss": -43.2838020324707, "global_step": 330906, "epoch": 2734} {"train_loss": -42.980159759521484, "global_step": 330907, "epoch": 2734} {"train_loss": -44.08610153198242, "global_step": 330908, "epoch": 2734} {"train_loss": -42.90973663330078, "global_step": 330909, "epoch": 2734} {"train_loss": -42.9714241027832, "global_step": 330910, "epoch": 2734} {"train_loss": -43.6659049987793, "global_step": 330911, "epoch": 2734} {"train_loss": -43.652400970458984, "global_step": 330912, "epoch": 2734} {"train_loss": -43.23209762573242, "global_step": 330913, "epoch": 2734} {"train_loss": -43.66489791870117, "global_step": 330914, "epoch": 2734} {"train_loss": -43.870906829833984, "global_step": 330915, "epoch": 2734} {"train_loss": -44.79998779296875, "global_step": 330916, "epoch": 2734} {"train_loss": -43.17478561401367, "global_step": 330917, "epoch": 2734} {"train_loss": -44.63685989379883, "global_step": 330918, "epoch": 2734} {"train_loss": -42.5515251159668, "global_step": 330919, "epoch": 2734} {"train_loss": -43.51974105834961, "global_step": 330920, "epoch": 2734} {"train_loss": -44.386959075927734, "global_step": 330921, "epoch": 2734} {"train_loss": -41.72125244140625, "global_step": 330922, "epoch": 2734} {"train_loss": -44.0323486328125, "global_step": 330923, "epoch": 2734} {"train_loss": -40.8648681640625, "global_step": 330924, "epoch": 2734} {"train_loss": -41.3734130859375, "global_step": 330925, "epoch": 2734} {"train_loss": -41.21351623535156, "global_step": 330926, "epoch": 2734} {"train_loss": -42.65279006958008, "global_step": 330927, "epoch": 2734} {"train_loss": -42.728271484375, "global_step": 330928, "epoch": 2734} {"train_loss": -40.94683837890625, "global_step": 330929, "epoch": 2734} {"train_loss": -41.706268310546875, "global_step": 330930, "epoch": 2734} {"train_loss": -42.39625930786133, "global_step": 330931, "epoch": 2734} {"train_loss": -43.45484161376953, "global_step": 330932, "epoch": 2734} {"train_loss": -41.74996566772461, "global_step": 330933, "epoch": 2734} {"train_loss": -43.25161071651238, "global_step": 330934, "epoch": 2734, "val_loss": 2562652.75} {"train_loss": -42.84583282470703, "global_step": 330935, "epoch": 2735} {"train_loss": -41.87553024291992, "global_step": 330936, "epoch": 2735} {"train_loss": -43.063995361328125, "global_step": 330937, "epoch": 2735} {"train_loss": -43.342079162597656, "global_step": 330938, "epoch": 2735} {"train_loss": -42.877925872802734, "global_step": 330939, "epoch": 2735} {"train_loss": -41.47965621948242, "global_step": 330940, "epoch": 2735} {"train_loss": -42.254661560058594, "global_step": 330941, "epoch": 2735} {"train_loss": -43.06570053100586, "global_step": 330942, "epoch": 2735} {"train_loss": -42.28003692626953, "global_step": 330943, "epoch": 2735} {"train_loss": -42.375648498535156, "global_step": 330944, "epoch": 2735} {"train_loss": -42.24243927001953, "global_step": 330945, "epoch": 2735} {"train_loss": -43.21751022338867, "global_step": 330946, "epoch": 2735} {"train_loss": -41.63152313232422, "global_step": 330947, "epoch": 2735} {"train_loss": -42.250545501708984, "global_step": 330948, "epoch": 2735} {"train_loss": -40.694679260253906, "global_step": 330949, "epoch": 2735} {"train_loss": -43.149261474609375, "global_step": 330950, "epoch": 2735} {"train_loss": -42.585723876953125, "global_step": 330951, "epoch": 2735} {"train_loss": -43.69467544555664, "global_step": 330952, "epoch": 2735} {"train_loss": -43.772377014160156, "global_step": 330953, "epoch": 2735} {"train_loss": -43.61905288696289, "global_step": 330954, "epoch": 2735} {"train_loss": -42.74632263183594, "global_step": 330955, "epoch": 2735} {"train_loss": -43.26841354370117, "global_step": 330956, "epoch": 2735} {"train_loss": -44.28395462036133, "global_step": 330957, "epoch": 2735} {"train_loss": -43.23088073730469, "global_step": 330958, "epoch": 2735} {"train_loss": -43.7398796081543, "global_step": 330959, "epoch": 2735} {"train_loss": -43.730037689208984, "global_step": 330960, "epoch": 2735} {"train_loss": -44.449989318847656, "global_step": 330961, "epoch": 2735} {"train_loss": -43.831790924072266, "global_step": 330962, "epoch": 2735} {"train_loss": -43.63833236694336, "global_step": 330963, "epoch": 2735} {"train_loss": -43.44062042236328, "global_step": 330964, "epoch": 2735} {"train_loss": -44.08515548706055, "global_step": 330965, "epoch": 2735} {"train_loss": -43.258705139160156, "global_step": 330966, "epoch": 2735} {"train_loss": -44.23896026611328, "global_step": 330967, "epoch": 2735} {"train_loss": -44.00790023803711, "global_step": 330968, "epoch": 2735} {"train_loss": -44.87117385864258, "global_step": 330969, "epoch": 2735} {"train_loss": -43.22140121459961, "global_step": 330970, "epoch": 2735} {"train_loss": -43.58184051513672, "global_step": 330971, "epoch": 2735} {"train_loss": -44.137725830078125, "global_step": 330972, "epoch": 2735} {"train_loss": -43.52321243286133, "global_step": 330973, "epoch": 2735} {"train_loss": -42.48592758178711, "global_step": 330974, "epoch": 2735} {"train_loss": -43.81891632080078, "global_step": 330975, "epoch": 2735} {"train_loss": -43.616146087646484, "global_step": 330976, "epoch": 2735} {"train_loss": -43.84033966064453, "global_step": 330977, "epoch": 2735} {"train_loss": -42.43479537963867, "global_step": 330978, "epoch": 2735} {"train_loss": -40.34052276611328, "global_step": 330979, "epoch": 2735} {"train_loss": -43.44141387939453, "global_step": 330980, "epoch": 2735} {"train_loss": -42.46417999267578, "global_step": 330981, "epoch": 2735} {"train_loss": -42.47370529174805, "global_step": 330982, "epoch": 2735} {"train_loss": -42.40589141845703, "global_step": 330983, "epoch": 2735} {"train_loss": -40.27457809448242, "global_step": 330984, "epoch": 2735} {"train_loss": -43.34768295288086, "global_step": 330985, "epoch": 2735} {"train_loss": -43.02167892456055, "global_step": 330986, "epoch": 2735} {"train_loss": -42.02842712402344, "global_step": 330987, "epoch": 2735} {"train_loss": -44.25895309448242, "global_step": 330988, "epoch": 2735} {"train_loss": -42.87131881713867, "global_step": 330989, "epoch": 2735} {"train_loss": -42.24265670776367, "global_step": 330990, "epoch": 2735} {"train_loss": -43.61129379272461, "global_step": 330991, "epoch": 2735} {"train_loss": -42.01827621459961, "global_step": 330992, "epoch": 2735} {"train_loss": -41.71529769897461, "global_step": 330993, "epoch": 2735} {"train_loss": -42.96509552001953, "global_step": 330994, "epoch": 2735} {"train_loss": -43.14631271362305, "global_step": 330995, "epoch": 2735} {"train_loss": -42.24509811401367, "global_step": 330996, "epoch": 2735} {"train_loss": -42.47905349731445, "global_step": 330997, "epoch": 2735} {"train_loss": -43.30887985229492, "global_step": 330998, "epoch": 2735} {"train_loss": -43.68034744262695, "global_step": 330999, "epoch": 2735} {"train_loss": -42.75172805786133, "global_step": 331000, "epoch": 2735} {"train_loss": -43.79106903076172, "global_step": 331001, "epoch": 2735} {"train_loss": -43.91947937011719, "global_step": 331002, "epoch": 2735} {"train_loss": -42.5221061706543, "global_step": 331003, "epoch": 2735} {"train_loss": -43.68376541137695, "global_step": 331004, "epoch": 2735} {"train_loss": -42.990474700927734, "global_step": 331005, "epoch": 2735} {"train_loss": -41.23472595214844, "global_step": 331006, "epoch": 2735} {"train_loss": -44.55178451538086, "global_step": 331007, "epoch": 2735} {"train_loss": -42.0999641418457, "global_step": 331008, "epoch": 2735} {"train_loss": -41.45595932006836, "global_step": 331009, "epoch": 2735} {"train_loss": -43.0097770690918, "global_step": 331010, "epoch": 2735} {"train_loss": -42.35578155517578, "global_step": 331011, "epoch": 2735} {"train_loss": -42.997615814208984, "global_step": 331012, "epoch": 2735} {"train_loss": -43.476253509521484, "global_step": 331013, "epoch": 2735} {"train_loss": -41.24507522583008, "global_step": 331014, "epoch": 2735} {"train_loss": -42.1292839050293, "global_step": 331015, "epoch": 2735} {"train_loss": -42.55199432373047, "global_step": 331016, "epoch": 2735} {"train_loss": -41.20868682861328, "global_step": 331017, "epoch": 2735} {"train_loss": -41.38626480102539, "global_step": 331018, "epoch": 2735} {"train_loss": -43.73027801513672, "global_step": 331019, "epoch": 2735} {"train_loss": -41.183353424072266, "global_step": 331020, "epoch": 2735} {"train_loss": -42.92869186401367, "global_step": 331021, "epoch": 2735} {"train_loss": -43.43133544921875, "global_step": 331022, "epoch": 2735} {"train_loss": -41.59694290161133, "global_step": 331023, "epoch": 2735} {"train_loss": -42.903343200683594, "global_step": 331024, "epoch": 2735} {"train_loss": -42.537960052490234, "global_step": 331025, "epoch": 2735} {"train_loss": -38.294189453125, "global_step": 331026, "epoch": 2735} {"train_loss": -43.424468994140625, "global_step": 331027, "epoch": 2735} {"train_loss": -40.2445182800293, "global_step": 331028, "epoch": 2735} {"train_loss": -40.51605987548828, "global_step": 331029, "epoch": 2735} {"train_loss": -42.32540512084961, "global_step": 331030, "epoch": 2735} {"train_loss": -42.85103988647461, "global_step": 331031, "epoch": 2735} {"train_loss": -42.41181182861328, "global_step": 331032, "epoch": 2735} {"train_loss": -43.68665313720703, "global_step": 331033, "epoch": 2735} {"train_loss": -41.60160827636719, "global_step": 331034, "epoch": 2735} {"train_loss": -43.61417770385742, "global_step": 331035, "epoch": 2735} {"train_loss": -42.651100158691406, "global_step": 331036, "epoch": 2735} {"train_loss": -43.12872314453125, "global_step": 331037, "epoch": 2735} {"train_loss": -42.65867233276367, "global_step": 331038, "epoch": 2735} {"train_loss": -43.06854248046875, "global_step": 331039, "epoch": 2735} {"train_loss": -43.23099899291992, "global_step": 331040, "epoch": 2735} {"train_loss": -42.38446807861328, "global_step": 331041, "epoch": 2735} {"train_loss": -43.95025634765625, "global_step": 331042, "epoch": 2735} {"train_loss": -43.33430862426758, "global_step": 331043, "epoch": 2735} {"train_loss": -42.75515365600586, "global_step": 331044, "epoch": 2735} {"train_loss": -43.31705093383789, "global_step": 331045, "epoch": 2735} {"train_loss": -42.934993743896484, "global_step": 331046, "epoch": 2735} {"train_loss": -41.36366271972656, "global_step": 331047, "epoch": 2735} {"train_loss": -43.989749908447266, "global_step": 331048, "epoch": 2735} {"train_loss": -43.51368713378906, "global_step": 331049, "epoch": 2735} {"train_loss": -44.042659759521484, "global_step": 331050, "epoch": 2735} {"train_loss": -43.62357711791992, "global_step": 331051, "epoch": 2735} {"train_loss": -44.2761344909668, "global_step": 331052, "epoch": 2735} {"train_loss": -43.69923400878906, "global_step": 331053, "epoch": 2735} {"train_loss": -44.204715728759766, "global_step": 331054, "epoch": 2735} {"train_loss": -42.869467585540015, "global_step": 331055, "epoch": 2735, "val_loss": 2594008.75} {"train_loss": -43.61011505126953, "global_step": 331056, "epoch": 2736} {"train_loss": -44.16510009765625, "global_step": 331057, "epoch": 2736} {"train_loss": -44.0980110168457, "global_step": 331058, "epoch": 2736} {"train_loss": -44.256591796875, "global_step": 331059, "epoch": 2736} {"train_loss": -44.29232406616211, "global_step": 331060, "epoch": 2736} {"train_loss": -44.01712417602539, "global_step": 331061, "epoch": 2736} {"train_loss": -43.970951080322266, "global_step": 331062, "epoch": 2736} {"train_loss": -44.094547271728516, "global_step": 331063, "epoch": 2736} {"train_loss": -44.48240280151367, "global_step": 331064, "epoch": 2736} {"train_loss": -43.72993087768555, "global_step": 331065, "epoch": 2736} {"train_loss": -44.52937316894531, "global_step": 331066, "epoch": 2736} {"train_loss": -43.82605743408203, "global_step": 331067, "epoch": 2736} {"train_loss": -44.17619323730469, "global_step": 331068, "epoch": 2736} {"train_loss": -45.29283142089844, "global_step": 331069, "epoch": 2736} {"train_loss": -44.61652755737305, "global_step": 331070, "epoch": 2736} {"train_loss": -44.78666687011719, "global_step": 331071, "epoch": 2736} {"train_loss": -44.61736297607422, "global_step": 331072, "epoch": 2736} {"train_loss": -44.5671272277832, "global_step": 331073, "epoch": 2736} {"train_loss": -44.41510009765625, "global_step": 331074, "epoch": 2736} {"train_loss": -44.35496139526367, "global_step": 331075, "epoch": 2736} {"train_loss": -44.71651077270508, "global_step": 331076, "epoch": 2736} {"train_loss": -44.37440490722656, "global_step": 331077, "epoch": 2736} {"train_loss": -44.705257415771484, "global_step": 331078, "epoch": 2736} {"train_loss": -45.26264572143555, "global_step": 331079, "epoch": 2736} {"train_loss": -44.456642150878906, "global_step": 331080, "epoch": 2736} {"train_loss": -44.11033248901367, "global_step": 331081, "epoch": 2736} {"train_loss": -44.772029876708984, "global_step": 331082, "epoch": 2736} {"train_loss": -44.67070388793945, "global_step": 331083, "epoch": 2736} {"train_loss": -44.61021423339844, "global_step": 331084, "epoch": 2736} {"train_loss": -44.452415466308594, "global_step": 331085, "epoch": 2736} {"train_loss": -45.221675872802734, "global_step": 331086, "epoch": 2736} {"train_loss": -44.22029113769531, "global_step": 331087, "epoch": 2736} {"train_loss": -44.201961517333984, "global_step": 331088, "epoch": 2736} {"train_loss": -44.7734489440918, "global_step": 331089, "epoch": 2736} {"train_loss": -44.27604675292969, "global_step": 331090, "epoch": 2736} {"train_loss": -44.18217849731445, "global_step": 331091, "epoch": 2736} {"train_loss": -44.297569274902344, "global_step": 331092, "epoch": 2736} {"train_loss": -44.3328857421875, "global_step": 331093, "epoch": 2736} {"train_loss": -44.15145492553711, "global_step": 331094, "epoch": 2736} {"train_loss": -44.03240966796875, "global_step": 331095, "epoch": 2736} {"train_loss": -45.139949798583984, "global_step": 331096, "epoch": 2736} {"train_loss": -44.7043342590332, "global_step": 331097, "epoch": 2736} {"train_loss": -44.998470306396484, "global_step": 331098, "epoch": 2736} {"train_loss": -44.689361572265625, "global_step": 331099, "epoch": 2736} {"train_loss": -44.4761848449707, "global_step": 331100, "epoch": 2736} {"train_loss": -44.15394973754883, "global_step": 331101, "epoch": 2736} {"train_loss": -44.507808685302734, "global_step": 331102, "epoch": 2736} {"train_loss": -43.628875732421875, "global_step": 331103, "epoch": 2736} {"train_loss": -44.250179290771484, "global_step": 331104, "epoch": 2736} {"train_loss": -44.62203598022461, "global_step": 331105, "epoch": 2736} {"train_loss": -44.69634246826172, "global_step": 331106, "epoch": 2736} {"train_loss": -44.59098434448242, "global_step": 331107, "epoch": 2736} {"train_loss": -43.98292922973633, "global_step": 331108, "epoch": 2736} {"train_loss": -44.908626556396484, "global_step": 331109, "epoch": 2736} {"train_loss": -45.02042770385742, "global_step": 331110, "epoch": 2736} {"train_loss": -44.347145080566406, "global_step": 331111, "epoch": 2736} {"train_loss": -45.20433044433594, "global_step": 331112, "epoch": 2736} {"train_loss": -43.67181396484375, "global_step": 331113, "epoch": 2736} {"train_loss": -42.82445526123047, "global_step": 331114, "epoch": 2736} {"train_loss": -42.10773849487305, "global_step": 331115, "epoch": 2736} {"train_loss": -42.13629150390625, "global_step": 331116, "epoch": 2736} {"train_loss": -44.86308670043945, "global_step": 331117, "epoch": 2736} {"train_loss": -43.56710433959961, "global_step": 331118, "epoch": 2736} {"train_loss": -41.643470764160156, "global_step": 331119, "epoch": 2736} {"train_loss": -42.80046463012695, "global_step": 331120, "epoch": 2736} {"train_loss": -44.46480941772461, "global_step": 331121, "epoch": 2736} {"train_loss": -43.05180740356445, "global_step": 331122, "epoch": 2736} {"train_loss": -40.512664794921875, "global_step": 331123, "epoch": 2736} {"train_loss": -41.612823486328125, "global_step": 331124, "epoch": 2736} {"train_loss": -43.30780029296875, "global_step": 331125, "epoch": 2736} {"train_loss": -43.87432861328125, "global_step": 331126, "epoch": 2736} {"train_loss": -43.761192321777344, "global_step": 331127, "epoch": 2736} {"train_loss": -42.81129837036133, "global_step": 331128, "epoch": 2736} {"train_loss": -44.244903564453125, "global_step": 331129, "epoch": 2736} {"train_loss": -43.2223014831543, "global_step": 331130, "epoch": 2736} {"train_loss": -44.03461456298828, "global_step": 331131, "epoch": 2736} {"train_loss": -43.95318603515625, "global_step": 331132, "epoch": 2736} {"train_loss": -41.632057189941406, "global_step": 331133, "epoch": 2736} {"train_loss": -43.262569427490234, "global_step": 331134, "epoch": 2736} {"train_loss": -44.039344787597656, "global_step": 331135, "epoch": 2736} {"train_loss": -43.52215576171875, "global_step": 331136, "epoch": 2736} {"train_loss": -44.06034851074219, "global_step": 331137, "epoch": 2736} {"train_loss": -43.82905197143555, "global_step": 331138, "epoch": 2736} {"train_loss": -42.3618278503418, "global_step": 331139, "epoch": 2736} {"train_loss": -43.298152923583984, "global_step": 331140, "epoch": 2736} {"train_loss": -42.480201721191406, "global_step": 331141, "epoch": 2736} {"train_loss": -42.88542556762695, "global_step": 331142, "epoch": 2736} {"train_loss": -42.155250549316406, "global_step": 331143, "epoch": 2736} {"train_loss": -42.623558044433594, "global_step": 331144, "epoch": 2736} {"train_loss": -43.82677459716797, "global_step": 331145, "epoch": 2736} {"train_loss": -42.905853271484375, "global_step": 331146, "epoch": 2736} {"train_loss": -42.905723571777344, "global_step": 331147, "epoch": 2736} {"train_loss": -43.466163635253906, "global_step": 331148, "epoch": 2736} {"train_loss": -43.390846252441406, "global_step": 331149, "epoch": 2736} {"train_loss": -42.57335662841797, "global_step": 331150, "epoch": 2736} {"train_loss": -43.02484130859375, "global_step": 331151, "epoch": 2736} {"train_loss": -43.33652877807617, "global_step": 331152, "epoch": 2736} {"train_loss": -44.15222930908203, "global_step": 331153, "epoch": 2736} {"train_loss": -43.11367416381836, "global_step": 331154, "epoch": 2736} {"train_loss": -43.57773971557617, "global_step": 331155, "epoch": 2736} {"train_loss": -44.174163818359375, "global_step": 331156, "epoch": 2736} {"train_loss": -42.54730987548828, "global_step": 331157, "epoch": 2736} {"train_loss": -44.05609130859375, "global_step": 331158, "epoch": 2736} {"train_loss": -43.10360336303711, "global_step": 331159, "epoch": 2736} {"train_loss": -42.819725036621094, "global_step": 331160, "epoch": 2736} {"train_loss": -43.26715087890625, "global_step": 331161, "epoch": 2736} {"train_loss": -43.6646842956543, "global_step": 331162, "epoch": 2736} {"train_loss": -43.33945846557617, "global_step": 331163, "epoch": 2736} {"train_loss": -44.293941497802734, "global_step": 331164, "epoch": 2736} {"train_loss": -42.88918685913086, "global_step": 331165, "epoch": 2736} {"train_loss": -44.76090621948242, "global_step": 331166, "epoch": 2736} {"train_loss": -43.812049865722656, "global_step": 331167, "epoch": 2736} {"train_loss": -44.03591537475586, "global_step": 331168, "epoch": 2736} {"train_loss": -43.83250045776367, "global_step": 331169, "epoch": 2736} {"train_loss": -43.95967483520508, "global_step": 331170, "epoch": 2736} {"train_loss": -44.488277435302734, "global_step": 331171, "epoch": 2736} {"train_loss": -43.884857177734375, "global_step": 331172, "epoch": 2736} {"train_loss": -44.5539436340332, "global_step": 331173, "epoch": 2736} {"train_loss": -44.560089111328125, "global_step": 331174, "epoch": 2736} {"train_loss": -44.479000091552734, "global_step": 331175, "epoch": 2736} {"train_loss": -43.877293389690806, "global_step": 331176, "epoch": 2736, "val_loss": 2441958.75} {"train_loss": -44.79218673706055, "global_step": 331177, "epoch": 2737} {"train_loss": -44.29438018798828, "global_step": 331178, "epoch": 2737} {"train_loss": -44.663360595703125, "global_step": 331179, "epoch": 2737} {"train_loss": -44.936912536621094, "global_step": 331180, "epoch": 2737} {"train_loss": -44.5994987487793, "global_step": 331181, "epoch": 2737} {"train_loss": -45.24735641479492, "global_step": 331182, "epoch": 2737} {"train_loss": -44.5174446105957, "global_step": 331183, "epoch": 2737} {"train_loss": -45.04140090942383, "global_step": 331184, "epoch": 2737} {"train_loss": -45.22062301635742, "global_step": 331185, "epoch": 2737} {"train_loss": -45.049320220947266, "global_step": 331186, "epoch": 2737} {"train_loss": -45.0423698425293, "global_step": 331187, "epoch": 2737} {"train_loss": -45.0246696472168, "global_step": 331188, "epoch": 2737} {"train_loss": -44.68410110473633, "global_step": 331189, "epoch": 2737} {"train_loss": -45.111629486083984, "global_step": 331190, "epoch": 2737} {"train_loss": -44.44723129272461, "global_step": 331191, "epoch": 2737} {"train_loss": -44.75640869140625, "global_step": 331192, "epoch": 2737} {"train_loss": -45.26954650878906, "global_step": 331193, "epoch": 2737} {"train_loss": -45.2751579284668, "global_step": 331194, "epoch": 2737} {"train_loss": -45.4657096862793, "global_step": 331195, "epoch": 2737} {"train_loss": -44.80426788330078, "global_step": 331196, "epoch": 2737} {"train_loss": -45.18727493286133, "global_step": 331197, "epoch": 2737} {"train_loss": -45.2980842590332, "global_step": 331198, "epoch": 2737} {"train_loss": -45.02568435668945, "global_step": 331199, "epoch": 2737} {"train_loss": -45.47678756713867, "global_step": 331200, "epoch": 2737} {"train_loss": -45.074058532714844, "global_step": 331201, "epoch": 2737} {"train_loss": -44.824703216552734, "global_step": 331202, "epoch": 2737} {"train_loss": -45.43207931518555, "global_step": 331203, "epoch": 2737} {"train_loss": -44.78376388549805, "global_step": 331204, "epoch": 2737} {"train_loss": -43.06618881225586, "global_step": 331205, "epoch": 2737} {"train_loss": -45.11737823486328, "global_step": 331206, "epoch": 2737} {"train_loss": -44.72092819213867, "global_step": 331207, "epoch": 2737} {"train_loss": -44.08457946777344, "global_step": 331208, "epoch": 2737} {"train_loss": -44.51499938964844, "global_step": 331209, "epoch": 2737} {"train_loss": -43.42136764526367, "global_step": 331210, "epoch": 2737} {"train_loss": -44.039451599121094, "global_step": 331211, "epoch": 2737} {"train_loss": -44.996498107910156, "global_step": 331212, "epoch": 2737} {"train_loss": -44.27737045288086, "global_step": 331213, "epoch": 2737} {"train_loss": -43.41044998168945, "global_step": 331214, "epoch": 2737} {"train_loss": -42.635597229003906, "global_step": 331215, "epoch": 2737} {"train_loss": -43.47127151489258, "global_step": 331216, "epoch": 2737} {"train_loss": -44.818538665771484, "global_step": 331217, "epoch": 2737} {"train_loss": -44.64017105102539, "global_step": 331218, "epoch": 2737} {"train_loss": -44.35370635986328, "global_step": 331219, "epoch": 2737} {"train_loss": -43.214942932128906, "global_step": 331220, "epoch": 2737} {"train_loss": -43.85028076171875, "global_step": 331221, "epoch": 2737} {"train_loss": -43.747772216796875, "global_step": 331222, "epoch": 2737} {"train_loss": -43.43185043334961, "global_step": 331223, "epoch": 2737} {"train_loss": -43.639862060546875, "global_step": 331224, "epoch": 2737} {"train_loss": -43.22107696533203, "global_step": 331225, "epoch": 2737} {"train_loss": -43.9814338684082, "global_step": 331226, "epoch": 2737} {"train_loss": -43.412322998046875, "global_step": 331227, "epoch": 2737} {"train_loss": -44.829139709472656, "global_step": 331228, "epoch": 2737} {"train_loss": -44.16476058959961, "global_step": 331229, "epoch": 2737} {"train_loss": -42.351600646972656, "global_step": 331230, "epoch": 2737} {"train_loss": -42.003875732421875, "global_step": 331231, "epoch": 2737} {"train_loss": -43.47410202026367, "global_step": 331232, "epoch": 2737} {"train_loss": -44.120094299316406, "global_step": 331233, "epoch": 2737} {"train_loss": -44.371498107910156, "global_step": 331234, "epoch": 2737} {"train_loss": -44.53656005859375, "global_step": 331235, "epoch": 2737} {"train_loss": -43.856563568115234, "global_step": 331236, "epoch": 2737} {"train_loss": -44.368011474609375, "global_step": 331237, "epoch": 2737} {"train_loss": -44.045955657958984, "global_step": 331238, "epoch": 2737} {"train_loss": -43.93265914916992, "global_step": 331239, "epoch": 2737} {"train_loss": -44.720157623291016, "global_step": 331240, "epoch": 2737} {"train_loss": -42.10782241821289, "global_step": 331241, "epoch": 2737} {"train_loss": -41.0954475402832, "global_step": 331242, "epoch": 2737} {"train_loss": -42.21138381958008, "global_step": 331243, "epoch": 2737} {"train_loss": -43.24538803100586, "global_step": 331244, "epoch": 2737} {"train_loss": -44.1059684753418, "global_step": 331245, "epoch": 2737} {"train_loss": -43.28377151489258, "global_step": 331246, "epoch": 2737} {"train_loss": -43.189144134521484, "global_step": 331247, "epoch": 2737} {"train_loss": -43.920162200927734, "global_step": 331248, "epoch": 2737} {"train_loss": -42.374176025390625, "global_step": 331249, "epoch": 2737} {"train_loss": -42.91382598876953, "global_step": 331250, "epoch": 2737} {"train_loss": -41.25923156738281, "global_step": 331251, "epoch": 2737} {"train_loss": -43.20254135131836, "global_step": 331252, "epoch": 2737} {"train_loss": -43.151824951171875, "global_step": 331253, "epoch": 2737} {"train_loss": -40.42692947387695, "global_step": 331254, "epoch": 2737} {"train_loss": -41.90966033935547, "global_step": 331255, "epoch": 2737} {"train_loss": -43.7248649597168, "global_step": 331256, "epoch": 2737} {"train_loss": -42.59765625, "global_step": 331257, "epoch": 2737} {"train_loss": -43.3079948425293, "global_step": 331258, "epoch": 2737} {"train_loss": -42.77484130859375, "global_step": 331259, "epoch": 2737} {"train_loss": -42.86320495605469, "global_step": 331260, "epoch": 2737} {"train_loss": -43.144710540771484, "global_step": 331261, "epoch": 2737} {"train_loss": -43.04647445678711, "global_step": 331262, "epoch": 2737} {"train_loss": -42.75776290893555, "global_step": 331263, "epoch": 2737} {"train_loss": -42.50095748901367, "global_step": 331264, "epoch": 2737} {"train_loss": -43.53565979003906, "global_step": 331265, "epoch": 2737} {"train_loss": -41.960514068603516, "global_step": 331266, "epoch": 2737} {"train_loss": -42.00205612182617, "global_step": 331267, "epoch": 2737} {"train_loss": -43.037818908691406, "global_step": 331268, "epoch": 2737} {"train_loss": -42.56342697143555, "global_step": 331269, "epoch": 2737} {"train_loss": -41.73829650878906, "global_step": 331270, "epoch": 2737} {"train_loss": -42.65096664428711, "global_step": 331271, "epoch": 2737} {"train_loss": -42.74849319458008, "global_step": 331272, "epoch": 2737} {"train_loss": -43.569068908691406, "global_step": 331273, "epoch": 2737} {"train_loss": -43.13798522949219, "global_step": 331274, "epoch": 2737} {"train_loss": -41.61396026611328, "global_step": 331275, "epoch": 2737} {"train_loss": -43.69894027709961, "global_step": 331276, "epoch": 2737} {"train_loss": -43.174468994140625, "global_step": 331277, "epoch": 2737} {"train_loss": -43.73215866088867, "global_step": 331278, "epoch": 2737} {"train_loss": -43.57368087768555, "global_step": 331279, "epoch": 2737} {"train_loss": -44.03501510620117, "global_step": 331280, "epoch": 2737} {"train_loss": -43.18075942993164, "global_step": 331281, "epoch": 2737} {"train_loss": -43.63998031616211, "global_step": 331282, "epoch": 2737} {"train_loss": -43.4378776550293, "global_step": 331283, "epoch": 2737} {"train_loss": -43.49596405029297, "global_step": 331284, "epoch": 2737} {"train_loss": -43.137447357177734, "global_step": 331285, "epoch": 2737} {"train_loss": -43.23969268798828, "global_step": 331286, "epoch": 2737} {"train_loss": -43.51266098022461, "global_step": 331287, "epoch": 2737} {"train_loss": -42.332393646240234, "global_step": 331288, "epoch": 2737} {"train_loss": -43.38607406616211, "global_step": 331289, "epoch": 2737} {"train_loss": -43.825233459472656, "global_step": 331290, "epoch": 2737} {"train_loss": -44.03963088989258, "global_step": 331291, "epoch": 2737} {"train_loss": -43.36067199707031, "global_step": 331292, "epoch": 2737} {"train_loss": -43.68256378173828, "global_step": 331293, "epoch": 2737} {"train_loss": -43.73963165283203, "global_step": 331294, "epoch": 2737} {"train_loss": -44.3557243347168, "global_step": 331295, "epoch": 2737} {"train_loss": -42.2116584777832, "global_step": 331296, "epoch": 2737} {"train_loss": -43.72534157619003, "global_step": 331297, "epoch": 2737, "val_loss": 2417006.75} {"train_loss": -44.46212387084961, "global_step": 331298, "epoch": 2738} {"train_loss": -44.196998596191406, "global_step": 331299, "epoch": 2738} {"train_loss": -44.519569396972656, "global_step": 331300, "epoch": 2738} {"train_loss": -44.104061126708984, "global_step": 331301, "epoch": 2738} {"train_loss": -44.47745132446289, "global_step": 331302, "epoch": 2738} {"train_loss": -43.67596435546875, "global_step": 331303, "epoch": 2738} {"train_loss": -43.84977340698242, "global_step": 331304, "epoch": 2738} {"train_loss": -44.30617904663086, "global_step": 331305, "epoch": 2738} {"train_loss": -44.557952880859375, "global_step": 331306, "epoch": 2738} {"train_loss": -44.41526412963867, "global_step": 331307, "epoch": 2738} {"train_loss": -44.822818756103516, "global_step": 331308, "epoch": 2738} {"train_loss": -44.671356201171875, "global_step": 331309, "epoch": 2738} {"train_loss": -44.816280364990234, "global_step": 331310, "epoch": 2738} {"train_loss": -44.977561950683594, "global_step": 331311, "epoch": 2738} {"train_loss": -44.834197998046875, "global_step": 331312, "epoch": 2738} {"train_loss": -44.8777961730957, "global_step": 331313, "epoch": 2738} {"train_loss": -44.9515380859375, "global_step": 331314, "epoch": 2738} {"train_loss": -44.311729431152344, "global_step": 331315, "epoch": 2738} {"train_loss": -44.93526077270508, "global_step": 331316, "epoch": 2738} {"train_loss": -44.636043548583984, "global_step": 331317, "epoch": 2738} {"train_loss": -45.027137756347656, "global_step": 331318, "epoch": 2738} {"train_loss": -44.851165771484375, "global_step": 331319, "epoch": 2738} {"train_loss": -44.619380950927734, "global_step": 331320, "epoch": 2738} {"train_loss": -44.47657012939453, "global_step": 331321, "epoch": 2738} {"train_loss": -44.38279342651367, "global_step": 331322, "epoch": 2738} {"train_loss": -44.80255889892578, "global_step": 331323, "epoch": 2738} {"train_loss": -44.66386032104492, "global_step": 331324, "epoch": 2738} {"train_loss": -44.775203704833984, "global_step": 331325, "epoch": 2738} {"train_loss": -44.19816207885742, "global_step": 331326, "epoch": 2738} {"train_loss": -44.45085525512695, "global_step": 331327, "epoch": 2738} {"train_loss": -44.510841369628906, "global_step": 331328, "epoch": 2738} {"train_loss": -44.83681869506836, "global_step": 331329, "epoch": 2738} {"train_loss": -44.59870529174805, "global_step": 331330, "epoch": 2738} {"train_loss": -44.6959342956543, "global_step": 331331, "epoch": 2738} {"train_loss": -44.866920471191406, "global_step": 331332, "epoch": 2738} {"train_loss": -44.106666564941406, "global_step": 331333, "epoch": 2738} {"train_loss": -44.010101318359375, "global_step": 331334, "epoch": 2738} {"train_loss": -44.51218795776367, "global_step": 331335, "epoch": 2738} {"train_loss": -44.76908493041992, "global_step": 331336, "epoch": 2738} {"train_loss": -44.689178466796875, "global_step": 331337, "epoch": 2738} {"train_loss": -44.114803314208984, "global_step": 331338, "epoch": 2738} {"train_loss": -44.27909851074219, "global_step": 331339, "epoch": 2738} {"train_loss": -44.29948806762695, "global_step": 331340, "epoch": 2738} {"train_loss": -44.36985397338867, "global_step": 331341, "epoch": 2738} {"train_loss": -45.50806427001953, "global_step": 331342, "epoch": 2738} {"train_loss": -45.07339096069336, "global_step": 331343, "epoch": 2738} {"train_loss": -44.48078536987305, "global_step": 331344, "epoch": 2738} {"train_loss": -44.999977111816406, "global_step": 331345, "epoch": 2738} {"train_loss": -43.24813461303711, "global_step": 331346, "epoch": 2738} {"train_loss": -44.32008743286133, "global_step": 331347, "epoch": 2738} {"train_loss": -45.23272705078125, "global_step": 331348, "epoch": 2738} {"train_loss": -44.47160720825195, "global_step": 331349, "epoch": 2738} {"train_loss": -44.360015869140625, "global_step": 331350, "epoch": 2738} {"train_loss": -44.529170989990234, "global_step": 331351, "epoch": 2738} {"train_loss": -45.029972076416016, "global_step": 331352, "epoch": 2738} {"train_loss": -44.5800666809082, "global_step": 331353, "epoch": 2738} {"train_loss": -44.64028549194336, "global_step": 331354, "epoch": 2738} {"train_loss": -44.62664794921875, "global_step": 331355, "epoch": 2738} {"train_loss": -44.36252975463867, "global_step": 331356, "epoch": 2738} {"train_loss": -45.136287689208984, "global_step": 331357, "epoch": 2738} {"train_loss": -44.47304916381836, "global_step": 331358, "epoch": 2738} {"train_loss": -44.82920455932617, "global_step": 331359, "epoch": 2738} {"train_loss": -44.92369079589844, "global_step": 331360, "epoch": 2738} {"train_loss": -44.769657135009766, "global_step": 331361, "epoch": 2738} {"train_loss": -44.27009582519531, "global_step": 331362, "epoch": 2738} {"train_loss": -45.3286247253418, "global_step": 331363, "epoch": 2738} {"train_loss": -44.451534271240234, "global_step": 331364, "epoch": 2738} {"train_loss": -43.39824295043945, "global_step": 331365, "epoch": 2738} {"train_loss": -44.91733932495117, "global_step": 331366, "epoch": 2738} {"train_loss": -44.37825393676758, "global_step": 331367, "epoch": 2738} {"train_loss": -42.99258041381836, "global_step": 331368, "epoch": 2738} {"train_loss": -42.68327713012695, "global_step": 331369, "epoch": 2738} {"train_loss": -43.082698822021484, "global_step": 331370, "epoch": 2738} {"train_loss": -43.56616973876953, "global_step": 331371, "epoch": 2738} {"train_loss": -44.31871032714844, "global_step": 331372, "epoch": 2738} {"train_loss": -43.294639587402344, "global_step": 331373, "epoch": 2738} {"train_loss": -43.67462158203125, "global_step": 331374, "epoch": 2738} {"train_loss": -44.69097900390625, "global_step": 331375, "epoch": 2738} {"train_loss": -44.7417106628418, "global_step": 331376, "epoch": 2738} {"train_loss": -44.26034164428711, "global_step": 331377, "epoch": 2738} {"train_loss": -42.93012237548828, "global_step": 331378, "epoch": 2738} {"train_loss": -44.097599029541016, "global_step": 331379, "epoch": 2738} {"train_loss": -43.96074295043945, "global_step": 331380, "epoch": 2738} {"train_loss": -44.801780700683594, "global_step": 331381, "epoch": 2738} {"train_loss": -43.128353118896484, "global_step": 331382, "epoch": 2738} {"train_loss": -43.26640701293945, "global_step": 331383, "epoch": 2738} {"train_loss": -44.292442321777344, "global_step": 331384, "epoch": 2738} {"train_loss": -43.63546371459961, "global_step": 331385, "epoch": 2738} {"train_loss": -43.11405563354492, "global_step": 331386, "epoch": 2738} {"train_loss": -42.31168746948242, "global_step": 331387, "epoch": 2738} {"train_loss": -44.448768615722656, "global_step": 331388, "epoch": 2738} {"train_loss": -44.370479583740234, "global_step": 331389, "epoch": 2738} {"train_loss": -43.67913055419922, "global_step": 331390, "epoch": 2738} {"train_loss": -43.52994918823242, "global_step": 331391, "epoch": 2738} {"train_loss": -43.948768615722656, "global_step": 331392, "epoch": 2738} {"train_loss": -43.629188537597656, "global_step": 331393, "epoch": 2738} {"train_loss": -42.9832878112793, "global_step": 331394, "epoch": 2738} {"train_loss": -42.32159423828125, "global_step": 331395, "epoch": 2738} {"train_loss": -42.735595703125, "global_step": 331396, "epoch": 2738} {"train_loss": -45.02394485473633, "global_step": 331397, "epoch": 2738} {"train_loss": -43.46767044067383, "global_step": 331398, "epoch": 2738} {"train_loss": -43.93612289428711, "global_step": 331399, "epoch": 2738} {"train_loss": -44.67121124267578, "global_step": 331400, "epoch": 2738} {"train_loss": -44.3059196472168, "global_step": 331401, "epoch": 2738} {"train_loss": -43.63992691040039, "global_step": 331402, "epoch": 2738} {"train_loss": -43.859004974365234, "global_step": 331403, "epoch": 2738} {"train_loss": -44.67783737182617, "global_step": 331404, "epoch": 2738} {"train_loss": -44.373146057128906, "global_step": 331405, "epoch": 2738} {"train_loss": -44.67143630981445, "global_step": 331406, "epoch": 2738} {"train_loss": -44.32361602783203, "global_step": 331407, "epoch": 2738} {"train_loss": -43.61188888549805, "global_step": 331408, "epoch": 2738} {"train_loss": -44.69582748413086, "global_step": 331409, "epoch": 2738} {"train_loss": -44.632381439208984, "global_step": 331410, "epoch": 2738} {"train_loss": -44.8737678527832, "global_step": 331411, "epoch": 2738} {"train_loss": -44.40781021118164, "global_step": 331412, "epoch": 2738} {"train_loss": -44.70488739013672, "global_step": 331413, "epoch": 2738} {"train_loss": -44.59994125366211, "global_step": 331414, "epoch": 2738} {"train_loss": -44.43317794799805, "global_step": 331415, "epoch": 2738} {"train_loss": -44.288414001464844, "global_step": 331416, "epoch": 2738} {"train_loss": -44.42072677612305, "global_step": 331417, "epoch": 2738} {"train_loss": -44.283839738073425, "global_step": 331418, "epoch": 2738, "val_loss": 2584085.75} {"train_loss": -41.324005126953125, "global_step": 331419, "epoch": 2739} {"train_loss": -42.16162109375, "global_step": 331420, "epoch": 2739} {"train_loss": -43.31709289550781, "global_step": 331421, "epoch": 2739} {"train_loss": -42.88380813598633, "global_step": 331422, "epoch": 2739} {"train_loss": -42.5963134765625, "global_step": 331423, "epoch": 2739} {"train_loss": -42.214515686035156, "global_step": 331424, "epoch": 2739} {"train_loss": -42.39506912231445, "global_step": 331425, "epoch": 2739} {"train_loss": -44.21347427368164, "global_step": 331426, "epoch": 2739} {"train_loss": -43.35211944580078, "global_step": 331427, "epoch": 2739} {"train_loss": -43.570289611816406, "global_step": 331428, "epoch": 2739} {"train_loss": -43.33481979370117, "global_step": 331429, "epoch": 2739} {"train_loss": -43.7400016784668, "global_step": 331430, "epoch": 2739} {"train_loss": -43.59952926635742, "global_step": 331431, "epoch": 2739} {"train_loss": -43.56747055053711, "global_step": 331432, "epoch": 2739} {"train_loss": -43.75148391723633, "global_step": 331433, "epoch": 2739} {"train_loss": -43.77037811279297, "global_step": 331434, "epoch": 2739} {"train_loss": -44.14570999145508, "global_step": 331435, "epoch": 2739} {"train_loss": -43.54353713989258, "global_step": 331436, "epoch": 2739} {"train_loss": -44.33223342895508, "global_step": 331437, "epoch": 2739} {"train_loss": -44.21885681152344, "global_step": 331438, "epoch": 2739} {"train_loss": -43.09343338012695, "global_step": 331439, "epoch": 2739} {"train_loss": -43.92238998413086, "global_step": 331440, "epoch": 2739} {"train_loss": -42.895599365234375, "global_step": 331441, "epoch": 2739} {"train_loss": -42.388084411621094, "global_step": 331442, "epoch": 2739} {"train_loss": -43.11508560180664, "global_step": 331443, "epoch": 2739} {"train_loss": -43.13825225830078, "global_step": 331444, "epoch": 2739} {"train_loss": -43.705230712890625, "global_step": 331445, "epoch": 2739} {"train_loss": -44.32558822631836, "global_step": 331446, "epoch": 2739} {"train_loss": -44.099178314208984, "global_step": 331447, "epoch": 2739} {"train_loss": -43.72005081176758, "global_step": 331448, "epoch": 2739} {"train_loss": -44.24560546875, "global_step": 331449, "epoch": 2739} {"train_loss": -44.203487396240234, "global_step": 331450, "epoch": 2739} {"train_loss": -43.96676254272461, "global_step": 331451, "epoch": 2739} {"train_loss": -44.62593460083008, "global_step": 331452, "epoch": 2739} {"train_loss": -42.56083679199219, "global_step": 331453, "epoch": 2739} {"train_loss": -44.76063537597656, "global_step": 331454, "epoch": 2739} {"train_loss": -44.65113830566406, "global_step": 331455, "epoch": 2739} {"train_loss": -44.26512908935547, "global_step": 331456, "epoch": 2739} {"train_loss": -44.5635986328125, "global_step": 331457, "epoch": 2739} {"train_loss": -44.17205047607422, "global_step": 331458, "epoch": 2739} {"train_loss": -44.59217071533203, "global_step": 331459, "epoch": 2739} {"train_loss": -44.96500015258789, "global_step": 331460, "epoch": 2739} {"train_loss": -44.34515380859375, "global_step": 331461, "epoch": 2739} {"train_loss": -44.7755012512207, "global_step": 331462, "epoch": 2739} {"train_loss": -44.77994918823242, "global_step": 331463, "epoch": 2739} {"train_loss": -44.7042121887207, "global_step": 331464, "epoch": 2739} {"train_loss": -44.8675651550293, "global_step": 331465, "epoch": 2739} {"train_loss": -45.24422073364258, "global_step": 331466, "epoch": 2739} {"train_loss": -44.89405822753906, "global_step": 331467, "epoch": 2739} {"train_loss": -44.855690002441406, "global_step": 331468, "epoch": 2739} {"train_loss": -44.99851608276367, "global_step": 331469, "epoch": 2739} {"train_loss": -44.48713302612305, "global_step": 331470, "epoch": 2739} {"train_loss": -44.377620697021484, "global_step": 331471, "epoch": 2739} {"train_loss": -44.32597732543945, "global_step": 331472, "epoch": 2739} {"train_loss": -45.185482025146484, "global_step": 331473, "epoch": 2739} {"train_loss": -44.65536117553711, "global_step": 331474, "epoch": 2739} {"train_loss": -43.99512481689453, "global_step": 331475, "epoch": 2739} {"train_loss": -43.6153678894043, "global_step": 331476, "epoch": 2739} {"train_loss": -43.81266403198242, "global_step": 331477, "epoch": 2739} {"train_loss": -44.35337448120117, "global_step": 331478, "epoch": 2739} {"train_loss": -43.443702697753906, "global_step": 331479, "epoch": 2739} {"train_loss": -44.828487396240234, "global_step": 331480, "epoch": 2739} {"train_loss": -44.8351936340332, "global_step": 331481, "epoch": 2739} {"train_loss": -43.44419479370117, "global_step": 331482, "epoch": 2739} {"train_loss": -42.35948181152344, "global_step": 331483, "epoch": 2739} {"train_loss": -44.12031936645508, "global_step": 331484, "epoch": 2739} {"train_loss": -43.8818473815918, "global_step": 331485, "epoch": 2739} {"train_loss": -41.81673049926758, "global_step": 331486, "epoch": 2739} {"train_loss": -42.353084564208984, "global_step": 331487, "epoch": 2739} {"train_loss": -43.5089111328125, "global_step": 331488, "epoch": 2739} {"train_loss": -42.925193786621094, "global_step": 331489, "epoch": 2739} {"train_loss": -42.91453170776367, "global_step": 331490, "epoch": 2739} {"train_loss": -43.371910095214844, "global_step": 331491, "epoch": 2739} {"train_loss": -41.3485221862793, "global_step": 331492, "epoch": 2739} {"train_loss": -42.35606002807617, "global_step": 331493, "epoch": 2739} {"train_loss": -43.18296432495117, "global_step": 331494, "epoch": 2739} {"train_loss": -43.57026672363281, "global_step": 331495, "epoch": 2739} {"train_loss": -41.841041564941406, "global_step": 331496, "epoch": 2739} {"train_loss": -42.33290481567383, "global_step": 331497, "epoch": 2739} {"train_loss": -36.67068862915039, "global_step": 331498, "epoch": 2739} {"train_loss": -42.551490783691406, "global_step": 331499, "epoch": 2739} {"train_loss": -33.96267318725586, "global_step": 331500, "epoch": 2739} {"train_loss": -37.39678955078125, "global_step": 331501, "epoch": 2739} {"train_loss": -43.237754821777344, "global_step": 331502, "epoch": 2739} {"train_loss": -42.268062591552734, "global_step": 331503, "epoch": 2739} {"train_loss": -36.218284606933594, "global_step": 331504, "epoch": 2739} {"train_loss": -41.011966705322266, "global_step": 331505, "epoch": 2739} {"train_loss": -29.992292404174805, "global_step": 331506, "epoch": 2739} {"train_loss": -41.03934097290039, "global_step": 331507, "epoch": 2739} {"train_loss": -42.436100006103516, "global_step": 331508, "epoch": 2739} {"train_loss": -28.795135498046875, "global_step": 331509, "epoch": 2739} {"train_loss": -41.70280456542969, "global_step": 331510, "epoch": 2739} {"train_loss": -40.83295440673828, "global_step": 331511, "epoch": 2739} {"train_loss": -42.428157806396484, "global_step": 331512, "epoch": 2739} {"train_loss": -41.10590744018555, "global_step": 331513, "epoch": 2739} {"train_loss": -35.07763671875, "global_step": 331514, "epoch": 2739} {"train_loss": -38.70307540893555, "global_step": 331515, "epoch": 2739} {"train_loss": -41.39838409423828, "global_step": 331516, "epoch": 2739} {"train_loss": -40.48435592651367, "global_step": 331517, "epoch": 2739} {"train_loss": -38.65424346923828, "global_step": 331518, "epoch": 2739} {"train_loss": -25.712854385375977, "global_step": 331519, "epoch": 2739} {"train_loss": -40.82788848876953, "global_step": 331520, "epoch": 2739} {"train_loss": -40.97002029418945, "global_step": 331521, "epoch": 2739} {"train_loss": -37.712806701660156, "global_step": 331522, "epoch": 2739} {"train_loss": -41.47426986694336, "global_step": 331523, "epoch": 2739} {"train_loss": -42.00822448730469, "global_step": 331524, "epoch": 2739} {"train_loss": -41.7027702331543, "global_step": 331525, "epoch": 2739} {"train_loss": -42.18029022216797, "global_step": 331526, "epoch": 2739} {"train_loss": -41.67878723144531, "global_step": 331527, "epoch": 2739} {"train_loss": -41.298057556152344, "global_step": 331528, "epoch": 2739} {"train_loss": -43.100624084472656, "global_step": 331529, "epoch": 2739} {"train_loss": -42.60383987426758, "global_step": 331530, "epoch": 2739} {"train_loss": -42.54218673706055, "global_step": 331531, "epoch": 2739} {"train_loss": -42.17688751220703, "global_step": 331532, "epoch": 2739} {"train_loss": -41.172977447509766, "global_step": 331533, "epoch": 2739} {"train_loss": -42.37577438354492, "global_step": 331534, "epoch": 2739} {"train_loss": -43.075355529785156, "global_step": 331535, "epoch": 2739} {"train_loss": -42.536468505859375, "global_step": 331536, "epoch": 2739} {"train_loss": -43.171260833740234, "global_step": 331537, "epoch": 2739} {"train_loss": -43.0634765625, "global_step": 331538, "epoch": 2739} {"train_loss": -42.42181276683965, "global_step": 331539, "epoch": 2739, "val_loss": 2558376.25} {"train_loss": -41.28790283203125, "global_step": 331540, "epoch": 2740} {"train_loss": -42.87942123413086, "global_step": 331541, "epoch": 2740} {"train_loss": -42.531837463378906, "global_step": 331542, "epoch": 2740} {"train_loss": -42.94913864135742, "global_step": 331543, "epoch": 2740} {"train_loss": -42.74376678466797, "global_step": 331544, "epoch": 2740} {"train_loss": -42.49155807495117, "global_step": 331545, "epoch": 2740} {"train_loss": -42.74058532714844, "global_step": 331546, "epoch": 2740} {"train_loss": -42.334049224853516, "global_step": 331547, "epoch": 2740} {"train_loss": -43.069190979003906, "global_step": 331548, "epoch": 2740} {"train_loss": -43.42953109741211, "global_step": 331549, "epoch": 2740} {"train_loss": -41.39010238647461, "global_step": 331550, "epoch": 2740} {"train_loss": -43.11045455932617, "global_step": 331551, "epoch": 2740} {"train_loss": -42.86566925048828, "global_step": 331552, "epoch": 2740} {"train_loss": -43.14380645751953, "global_step": 331553, "epoch": 2740} {"train_loss": -42.62445831298828, "global_step": 331554, "epoch": 2740} {"train_loss": -43.65037155151367, "global_step": 331555, "epoch": 2740} {"train_loss": -43.351051330566406, "global_step": 331556, "epoch": 2740} {"train_loss": -43.72795486450195, "global_step": 331557, "epoch": 2740} {"train_loss": -44.07257080078125, "global_step": 331558, "epoch": 2740} {"train_loss": -42.94666290283203, "global_step": 331559, "epoch": 2740} {"train_loss": -44.2504768371582, "global_step": 331560, "epoch": 2740} {"train_loss": -44.25593948364258, "global_step": 331561, "epoch": 2740} {"train_loss": -43.905067443847656, "global_step": 331562, "epoch": 2740} {"train_loss": -43.5245475769043, "global_step": 331563, "epoch": 2740} {"train_loss": -43.92039489746094, "global_step": 331564, "epoch": 2740} {"train_loss": -43.97834777832031, "global_step": 331565, "epoch": 2740} {"train_loss": -43.79701614379883, "global_step": 331566, "epoch": 2740} {"train_loss": -44.17866897583008, "global_step": 331567, "epoch": 2740} {"train_loss": -42.97185134887695, "global_step": 331568, "epoch": 2740} {"train_loss": -44.1362190246582, "global_step": 331569, "epoch": 2740} {"train_loss": -43.896644592285156, "global_step": 331570, "epoch": 2740} {"train_loss": -44.22197341918945, "global_step": 331571, "epoch": 2740} {"train_loss": -44.1353874206543, "global_step": 331572, "epoch": 2740} {"train_loss": -44.628475189208984, "global_step": 331573, "epoch": 2740} {"train_loss": -44.15228271484375, "global_step": 331574, "epoch": 2740} {"train_loss": -44.385597229003906, "global_step": 331575, "epoch": 2740} {"train_loss": -43.7779655456543, "global_step": 331576, "epoch": 2740} {"train_loss": -44.396026611328125, "global_step": 331577, "epoch": 2740} {"train_loss": -44.365779876708984, "global_step": 331578, "epoch": 2740} {"train_loss": -44.67869567871094, "global_step": 331579, "epoch": 2740} {"train_loss": -44.35995864868164, "global_step": 331580, "epoch": 2740} {"train_loss": -44.05662155151367, "global_step": 331581, "epoch": 2740} {"train_loss": -43.35921859741211, "global_step": 331582, "epoch": 2740} {"train_loss": -44.6353874206543, "global_step": 331583, "epoch": 2740} {"train_loss": -43.6195182800293, "global_step": 331584, "epoch": 2740} {"train_loss": -42.63577651977539, "global_step": 331585, "epoch": 2740} {"train_loss": -42.431766510009766, "global_step": 331586, "epoch": 2740} {"train_loss": -43.536895751953125, "global_step": 331587, "epoch": 2740} {"train_loss": -43.914939880371094, "global_step": 331588, "epoch": 2740} {"train_loss": -42.946571350097656, "global_step": 331589, "epoch": 2740} {"train_loss": -43.784156799316406, "global_step": 331590, "epoch": 2740} {"train_loss": -44.24188995361328, "global_step": 331591, "epoch": 2740} {"train_loss": -43.51723098754883, "global_step": 331592, "epoch": 2740} {"train_loss": -43.849788665771484, "global_step": 331593, "epoch": 2740} {"train_loss": -43.96417999267578, "global_step": 331594, "epoch": 2740} {"train_loss": -44.125083923339844, "global_step": 331595, "epoch": 2740} {"train_loss": -43.33031463623047, "global_step": 331596, "epoch": 2740} {"train_loss": -44.16199493408203, "global_step": 331597, "epoch": 2740} {"train_loss": -43.9917106628418, "global_step": 331598, "epoch": 2740} {"train_loss": -43.5519905090332, "global_step": 331599, "epoch": 2740} {"train_loss": -41.974853515625, "global_step": 331600, "epoch": 2740} {"train_loss": -43.63893508911133, "global_step": 331601, "epoch": 2740} {"train_loss": -43.839637756347656, "global_step": 331602, "epoch": 2740} {"train_loss": -44.15754318237305, "global_step": 331603, "epoch": 2740} {"train_loss": -42.4725341796875, "global_step": 331604, "epoch": 2740} {"train_loss": -43.119422912597656, "global_step": 331605, "epoch": 2740} {"train_loss": -43.874385833740234, "global_step": 331606, "epoch": 2740} {"train_loss": -43.42875289916992, "global_step": 331607, "epoch": 2740} {"train_loss": -43.544769287109375, "global_step": 331608, "epoch": 2740} {"train_loss": -43.96405029296875, "global_step": 331609, "epoch": 2740} {"train_loss": -43.43248748779297, "global_step": 331610, "epoch": 2740} {"train_loss": -42.73733139038086, "global_step": 331611, "epoch": 2740} {"train_loss": -43.756561279296875, "global_step": 331612, "epoch": 2740} {"train_loss": -44.3145866394043, "global_step": 331613, "epoch": 2740} {"train_loss": -43.1318473815918, "global_step": 331614, "epoch": 2740} {"train_loss": -44.01565170288086, "global_step": 331615, "epoch": 2740} {"train_loss": -42.45027160644531, "global_step": 331616, "epoch": 2740} {"train_loss": -43.97975540161133, "global_step": 331617, "epoch": 2740} {"train_loss": -42.25960922241211, "global_step": 331618, "epoch": 2740} {"train_loss": -42.638397216796875, "global_step": 331619, "epoch": 2740} {"train_loss": -42.673458099365234, "global_step": 331620, "epoch": 2740} {"train_loss": -41.63001251220703, "global_step": 331621, "epoch": 2740} {"train_loss": -43.31747055053711, "global_step": 331622, "epoch": 2740} {"train_loss": -42.477378845214844, "global_step": 331623, "epoch": 2740} {"train_loss": -43.03750991821289, "global_step": 331624, "epoch": 2740} {"train_loss": -44.2402229309082, "global_step": 331625, "epoch": 2740} {"train_loss": -42.211669921875, "global_step": 331626, "epoch": 2740} {"train_loss": -41.3154411315918, "global_step": 331627, "epoch": 2740} {"train_loss": -42.720863342285156, "global_step": 331628, "epoch": 2740} {"train_loss": -43.78037643432617, "global_step": 331629, "epoch": 2740} {"train_loss": -41.8908576965332, "global_step": 331630, "epoch": 2740} {"train_loss": -41.34251022338867, "global_step": 331631, "epoch": 2740} {"train_loss": -42.373104095458984, "global_step": 331632, "epoch": 2740} {"train_loss": -38.0342903137207, "global_step": 331633, "epoch": 2740} {"train_loss": -39.06349182128906, "global_step": 331634, "epoch": 2740} {"train_loss": -41.37067413330078, "global_step": 331635, "epoch": 2740} {"train_loss": -41.48749542236328, "global_step": 331636, "epoch": 2740} {"train_loss": -40.80304718017578, "global_step": 331637, "epoch": 2740} {"train_loss": -39.85616683959961, "global_step": 331638, "epoch": 2740} {"train_loss": -42.482357025146484, "global_step": 331639, "epoch": 2740} {"train_loss": -40.032569885253906, "global_step": 331640, "epoch": 2740} {"train_loss": -41.860877990722656, "global_step": 331641, "epoch": 2740} {"train_loss": -41.833900451660156, "global_step": 331642, "epoch": 2740} {"train_loss": -42.112396240234375, "global_step": 331643, "epoch": 2740} {"train_loss": -42.93089294433594, "global_step": 331644, "epoch": 2740} {"train_loss": -39.9292106628418, "global_step": 331645, "epoch": 2740} {"train_loss": -42.759090423583984, "global_step": 331646, "epoch": 2740} {"train_loss": -40.63960647583008, "global_step": 331647, "epoch": 2740} {"train_loss": -42.265438079833984, "global_step": 331648, "epoch": 2740} {"train_loss": -42.74967956542969, "global_step": 331649, "epoch": 2740} {"train_loss": -42.44630813598633, "global_step": 331650, "epoch": 2740} {"train_loss": -42.4293327331543, "global_step": 331651, "epoch": 2740} {"train_loss": -41.37113952636719, "global_step": 331652, "epoch": 2740} {"train_loss": -43.31005096435547, "global_step": 331653, "epoch": 2740} {"train_loss": -42.544105529785156, "global_step": 331654, "epoch": 2740} {"train_loss": -43.52808380126953, "global_step": 331655, "epoch": 2740} {"train_loss": -43.34503173828125, "global_step": 331656, "epoch": 2740} {"train_loss": -43.4539909362793, "global_step": 331657, "epoch": 2740} {"train_loss": -43.59861373901367, "global_step": 331658, "epoch": 2740} {"train_loss": -43.43673324584961, "global_step": 331659, "epoch": 2740} {"train_loss": -43.025701601643206, "global_step": 331660, "epoch": 2740, "val_loss": 2463793.5} {"train_loss": -43.1944694519043, "global_step": 331661, "epoch": 2741} {"train_loss": -44.070167541503906, "global_step": 331662, "epoch": 2741} {"train_loss": -43.958709716796875, "global_step": 331663, "epoch": 2741} {"train_loss": -43.57052230834961, "global_step": 331664, "epoch": 2741} {"train_loss": -44.186519622802734, "global_step": 331665, "epoch": 2741} {"train_loss": -43.505455017089844, "global_step": 331666, "epoch": 2741} {"train_loss": -44.28644943237305, "global_step": 331667, "epoch": 2741} {"train_loss": -43.908447265625, "global_step": 331668, "epoch": 2741} {"train_loss": -44.06794357299805, "global_step": 331669, "epoch": 2741} {"train_loss": -43.79508972167969, "global_step": 331670, "epoch": 2741} {"train_loss": -43.92097854614258, "global_step": 331671, "epoch": 2741} {"train_loss": -44.2223014831543, "global_step": 331672, "epoch": 2741} {"train_loss": -44.47477722167969, "global_step": 331673, "epoch": 2741} {"train_loss": -44.51618576049805, "global_step": 331674, "epoch": 2741} {"train_loss": -44.065208435058594, "global_step": 331675, "epoch": 2741} {"train_loss": -44.235286712646484, "global_step": 331676, "epoch": 2741} {"train_loss": -44.22626876831055, "global_step": 331677, "epoch": 2741} {"train_loss": -44.69527816772461, "global_step": 331678, "epoch": 2741} {"train_loss": -44.03590774536133, "global_step": 331679, "epoch": 2741} {"train_loss": -44.76902770996094, "global_step": 331680, "epoch": 2741} {"train_loss": -44.242549896240234, "global_step": 331681, "epoch": 2741} {"train_loss": -43.48118209838867, "global_step": 331682, "epoch": 2741} {"train_loss": -44.538265228271484, "global_step": 331683, "epoch": 2741} {"train_loss": -44.64723587036133, "global_step": 331684, "epoch": 2741} {"train_loss": -44.91313171386719, "global_step": 331685, "epoch": 2741} {"train_loss": -44.70232391357422, "global_step": 331686, "epoch": 2741} {"train_loss": -43.93662643432617, "global_step": 331687, "epoch": 2741} {"train_loss": -44.71584701538086, "global_step": 331688, "epoch": 2741} {"train_loss": -44.834468841552734, "global_step": 331689, "epoch": 2741} {"train_loss": -44.86016845703125, "global_step": 331690, "epoch": 2741} {"train_loss": -44.073055267333984, "global_step": 331691, "epoch": 2741} {"train_loss": -44.492374420166016, "global_step": 331692, "epoch": 2741} {"train_loss": -44.302833557128906, "global_step": 331693, "epoch": 2741} {"train_loss": -44.2779655456543, "global_step": 331694, "epoch": 2741} {"train_loss": -44.77694320678711, "global_step": 331695, "epoch": 2741} {"train_loss": -44.47595977783203, "global_step": 331696, "epoch": 2741} {"train_loss": -44.36511993408203, "global_step": 331697, "epoch": 2741} {"train_loss": -44.87730026245117, "global_step": 331698, "epoch": 2741} {"train_loss": -44.948936462402344, "global_step": 331699, "epoch": 2741} {"train_loss": -44.52769088745117, "global_step": 331700, "epoch": 2741} {"train_loss": -44.2219352722168, "global_step": 331701, "epoch": 2741} {"train_loss": -44.78691864013672, "global_step": 331702, "epoch": 2741} {"train_loss": -44.71556091308594, "global_step": 331703, "epoch": 2741} {"train_loss": -45.39876174926758, "global_step": 331704, "epoch": 2741} {"train_loss": -45.1056022644043, "global_step": 331705, "epoch": 2741} {"train_loss": -45.1866455078125, "global_step": 331706, "epoch": 2741} {"train_loss": -45.24892807006836, "global_step": 331707, "epoch": 2741} {"train_loss": -45.206581115722656, "global_step": 331708, "epoch": 2741} {"train_loss": -45.065704345703125, "global_step": 331709, "epoch": 2741} {"train_loss": -44.63482666015625, "global_step": 331710, "epoch": 2741} {"train_loss": -44.746429443359375, "global_step": 331711, "epoch": 2741} {"train_loss": -44.80419921875, "global_step": 331712, "epoch": 2741} {"train_loss": -45.10084915161133, "global_step": 331713, "epoch": 2741} {"train_loss": -45.1025390625, "global_step": 331714, "epoch": 2741} {"train_loss": -44.468719482421875, "global_step": 331715, "epoch": 2741} {"train_loss": -44.880645751953125, "global_step": 331716, "epoch": 2741} {"train_loss": -44.93375778198242, "global_step": 331717, "epoch": 2741} {"train_loss": -45.1453971862793, "global_step": 331718, "epoch": 2741} {"train_loss": -43.77177047729492, "global_step": 331719, "epoch": 2741} {"train_loss": -42.130470275878906, "global_step": 331720, "epoch": 2741} {"train_loss": -41.36044692993164, "global_step": 331721, "epoch": 2741} {"train_loss": -42.7768440246582, "global_step": 331722, "epoch": 2741} {"train_loss": -44.5510139465332, "global_step": 331723, "epoch": 2741} {"train_loss": -42.67647933959961, "global_step": 331724, "epoch": 2741} {"train_loss": -39.643558502197266, "global_step": 331725, "epoch": 2741} {"train_loss": -43.725860595703125, "global_step": 331726, "epoch": 2741} {"train_loss": -41.99520492553711, "global_step": 331727, "epoch": 2741} {"train_loss": -40.49460983276367, "global_step": 331728, "epoch": 2741} {"train_loss": -42.23394012451172, "global_step": 331729, "epoch": 2741} {"train_loss": -41.28164291381836, "global_step": 331730, "epoch": 2741} {"train_loss": -43.748111724853516, "global_step": 331731, "epoch": 2741} {"train_loss": -42.47079086303711, "global_step": 331732, "epoch": 2741} {"train_loss": -43.24729537963867, "global_step": 331733, "epoch": 2741} {"train_loss": -42.89594650268555, "global_step": 331734, "epoch": 2741} {"train_loss": -42.774688720703125, "global_step": 331735, "epoch": 2741} {"train_loss": -42.88528060913086, "global_step": 331736, "epoch": 2741} {"train_loss": -42.125911712646484, "global_step": 331737, "epoch": 2741} {"train_loss": -43.516441345214844, "global_step": 331738, "epoch": 2741} {"train_loss": -43.23020935058594, "global_step": 331739, "epoch": 2741} {"train_loss": -42.37890625, "global_step": 331740, "epoch": 2741} {"train_loss": -43.49110794067383, "global_step": 331741, "epoch": 2741} {"train_loss": -42.49320602416992, "global_step": 331742, "epoch": 2741} {"train_loss": -42.45436477661133, "global_step": 331743, "epoch": 2741} {"train_loss": -43.77549362182617, "global_step": 331744, "epoch": 2741} {"train_loss": -41.51409149169922, "global_step": 331745, "epoch": 2741} {"train_loss": -42.777313232421875, "global_step": 331746, "epoch": 2741} {"train_loss": -42.82537841796875, "global_step": 331747, "epoch": 2741} {"train_loss": -41.88591384887695, "global_step": 331748, "epoch": 2741} {"train_loss": -41.715850830078125, "global_step": 331749, "epoch": 2741} {"train_loss": -42.53144454956055, "global_step": 331750, "epoch": 2741} {"train_loss": -41.216758728027344, "global_step": 331751, "epoch": 2741} {"train_loss": -42.23295211791992, "global_step": 331752, "epoch": 2741} {"train_loss": -42.42567443847656, "global_step": 331753, "epoch": 2741} {"train_loss": -41.8265266418457, "global_step": 331754, "epoch": 2741} {"train_loss": -41.95240020751953, "global_step": 331755, "epoch": 2741} {"train_loss": -42.33513259887695, "global_step": 331756, "epoch": 2741} {"train_loss": -43.64881134033203, "global_step": 331757, "epoch": 2741} {"train_loss": -42.79842758178711, "global_step": 331758, "epoch": 2741} {"train_loss": -42.98785400390625, "global_step": 331759, "epoch": 2741} {"train_loss": -43.462337493896484, "global_step": 331760, "epoch": 2741} {"train_loss": -42.690834045410156, "global_step": 331761, "epoch": 2741} {"train_loss": -43.56157302856445, "global_step": 331762, "epoch": 2741} {"train_loss": -43.24836349487305, "global_step": 331763, "epoch": 2741} {"train_loss": -44.03666305541992, "global_step": 331764, "epoch": 2741} {"train_loss": -43.472755432128906, "global_step": 331765, "epoch": 2741} {"train_loss": -43.30399703979492, "global_step": 331766, "epoch": 2741} {"train_loss": -43.79118728637695, "global_step": 331767, "epoch": 2741} {"train_loss": -43.71192169189453, "global_step": 331768, "epoch": 2741} {"train_loss": -43.26200485229492, "global_step": 331769, "epoch": 2741} {"train_loss": -43.56218338012695, "global_step": 331770, "epoch": 2741} {"train_loss": -42.72013473510742, "global_step": 331771, "epoch": 2741} {"train_loss": -43.5234375, "global_step": 331772, "epoch": 2741} {"train_loss": -43.42977523803711, "global_step": 331773, "epoch": 2741} {"train_loss": -44.05204391479492, "global_step": 331774, "epoch": 2741} {"train_loss": -43.3740119934082, "global_step": 331775, "epoch": 2741} {"train_loss": -43.45928955078125, "global_step": 331776, "epoch": 2741} {"train_loss": -43.13735580444336, "global_step": 331777, "epoch": 2741} {"train_loss": -42.85089874267578, "global_step": 331778, "epoch": 2741} {"train_loss": -42.75728988647461, "global_step": 331779, "epoch": 2741} {"train_loss": -42.9742546081543, "global_step": 331780, "epoch": 2741} {"train_loss": -43.61540310441955, "global_step": 331781, "epoch": 2741, "val_loss": 2548358.0} {"train_loss": -43.29520797729492, "global_step": 331782, "epoch": 2742} {"train_loss": -44.061805725097656, "global_step": 331783, "epoch": 2742} {"train_loss": -43.47319030761719, "global_step": 331784, "epoch": 2742} {"train_loss": -43.349666595458984, "global_step": 331785, "epoch": 2742} {"train_loss": -43.76951217651367, "global_step": 331786, "epoch": 2742} {"train_loss": -44.26335144042969, "global_step": 331787, "epoch": 2742} {"train_loss": -43.47027587890625, "global_step": 331788, "epoch": 2742} {"train_loss": -44.05790328979492, "global_step": 331789, "epoch": 2742} {"train_loss": -44.0770263671875, "global_step": 331790, "epoch": 2742} {"train_loss": -43.675811767578125, "global_step": 331791, "epoch": 2742} {"train_loss": -43.935855865478516, "global_step": 331792, "epoch": 2742} {"train_loss": -44.2532844543457, "global_step": 331793, "epoch": 2742} {"train_loss": -44.02610397338867, "global_step": 331794, "epoch": 2742} {"train_loss": -43.918113708496094, "global_step": 331795, "epoch": 2742} {"train_loss": -43.8628044128418, "global_step": 331796, "epoch": 2742} {"train_loss": -44.525115966796875, "global_step": 331797, "epoch": 2742} {"train_loss": -44.069488525390625, "global_step": 331798, "epoch": 2742} {"train_loss": -44.025108337402344, "global_step": 331799, "epoch": 2742} {"train_loss": -43.724483489990234, "global_step": 331800, "epoch": 2742} {"train_loss": -44.15208435058594, "global_step": 331801, "epoch": 2742} {"train_loss": -44.665035247802734, "global_step": 331802, "epoch": 2742} {"train_loss": -44.372718811035156, "global_step": 331803, "epoch": 2742} {"train_loss": -44.613685607910156, "global_step": 331804, "epoch": 2742} {"train_loss": -44.430599212646484, "global_step": 331805, "epoch": 2742} {"train_loss": -44.51802444458008, "global_step": 331806, "epoch": 2742} {"train_loss": -44.543922424316406, "global_step": 331807, "epoch": 2742} {"train_loss": -44.34566879272461, "global_step": 331808, "epoch": 2742} {"train_loss": -43.75823974609375, "global_step": 331809, "epoch": 2742} {"train_loss": -44.151912689208984, "global_step": 331810, "epoch": 2742} {"train_loss": -44.32697677612305, "global_step": 331811, "epoch": 2742} {"train_loss": -44.2672233581543, "global_step": 331812, "epoch": 2742} {"train_loss": -44.78691101074219, "global_step": 331813, "epoch": 2742} {"train_loss": -44.698360443115234, "global_step": 331814, "epoch": 2742} {"train_loss": -44.552734375, "global_step": 331815, "epoch": 2742} {"train_loss": -43.57859420776367, "global_step": 331816, "epoch": 2742} {"train_loss": -43.82790756225586, "global_step": 331817, "epoch": 2742} {"train_loss": -44.88264083862305, "global_step": 331818, "epoch": 2742} {"train_loss": -44.83697509765625, "global_step": 331819, "epoch": 2742} {"train_loss": -44.68045425415039, "global_step": 331820, "epoch": 2742} {"train_loss": -44.46955108642578, "global_step": 331821, "epoch": 2742} {"train_loss": -44.98176574707031, "global_step": 331822, "epoch": 2742} {"train_loss": -44.72001266479492, "global_step": 331823, "epoch": 2742} {"train_loss": -45.0694694519043, "global_step": 331824, "epoch": 2742} {"train_loss": -44.79494857788086, "global_step": 331825, "epoch": 2742} {"train_loss": -44.509193420410156, "global_step": 331826, "epoch": 2742} {"train_loss": -44.58381652832031, "global_step": 331827, "epoch": 2742} {"train_loss": -43.65580368041992, "global_step": 331828, "epoch": 2742} {"train_loss": -44.510887145996094, "global_step": 331829, "epoch": 2742} {"train_loss": -44.80927276611328, "global_step": 331830, "epoch": 2742} {"train_loss": -43.92104721069336, "global_step": 331831, "epoch": 2742} {"train_loss": -43.941219329833984, "global_step": 331832, "epoch": 2742} {"train_loss": -44.2822380065918, "global_step": 331833, "epoch": 2742} {"train_loss": -43.53043746948242, "global_step": 331834, "epoch": 2742} {"train_loss": -44.028282165527344, "global_step": 331835, "epoch": 2742} {"train_loss": -43.338321685791016, "global_step": 331836, "epoch": 2742} {"train_loss": -45.16616439819336, "global_step": 331837, "epoch": 2742} {"train_loss": -44.941856384277344, "global_step": 331838, "epoch": 2742} {"train_loss": -42.28865432739258, "global_step": 331839, "epoch": 2742} {"train_loss": -43.0656623840332, "global_step": 331840, "epoch": 2742} {"train_loss": -43.981483459472656, "global_step": 331841, "epoch": 2742} {"train_loss": -44.957332611083984, "global_step": 331842, "epoch": 2742} {"train_loss": -44.51504135131836, "global_step": 331843, "epoch": 2742} {"train_loss": -44.66608810424805, "global_step": 331844, "epoch": 2742} {"train_loss": -44.60285568237305, "global_step": 331845, "epoch": 2742} {"train_loss": -44.37154006958008, "global_step": 331846, "epoch": 2742} {"train_loss": -44.65153121948242, "global_step": 331847, "epoch": 2742} {"train_loss": -44.69734191894531, "global_step": 331848, "epoch": 2742} {"train_loss": -44.20805740356445, "global_step": 331849, "epoch": 2742} {"train_loss": -44.551513671875, "global_step": 331850, "epoch": 2742} {"train_loss": -44.850013732910156, "global_step": 331851, "epoch": 2742} {"train_loss": -44.202735900878906, "global_step": 331852, "epoch": 2742} {"train_loss": -43.60431671142578, "global_step": 331853, "epoch": 2742} {"train_loss": -44.4201545715332, "global_step": 331854, "epoch": 2742} {"train_loss": -44.60224533081055, "global_step": 331855, "epoch": 2742} {"train_loss": -41.607704162597656, "global_step": 331856, "epoch": 2742} {"train_loss": -41.473873138427734, "global_step": 331857, "epoch": 2742} {"train_loss": -43.57971954345703, "global_step": 331858, "epoch": 2742} {"train_loss": -40.475460052490234, "global_step": 331859, "epoch": 2742} {"train_loss": -43.08088302612305, "global_step": 331860, "epoch": 2742} {"train_loss": -43.65092086791992, "global_step": 331861, "epoch": 2742} {"train_loss": -42.96814727783203, "global_step": 331862, "epoch": 2742} {"train_loss": -44.6589469909668, "global_step": 331863, "epoch": 2742} {"train_loss": -43.70167922973633, "global_step": 331864, "epoch": 2742} {"train_loss": -43.09923553466797, "global_step": 331865, "epoch": 2742} {"train_loss": -41.29842758178711, "global_step": 331866, "epoch": 2742} {"train_loss": -40.8885612487793, "global_step": 331867, "epoch": 2742} {"train_loss": -42.195186614990234, "global_step": 331868, "epoch": 2742} {"train_loss": -43.37759017944336, "global_step": 331869, "epoch": 2742} {"train_loss": -43.71028518676758, "global_step": 331870, "epoch": 2742} {"train_loss": -41.82905197143555, "global_step": 331871, "epoch": 2742} {"train_loss": -42.242610931396484, "global_step": 331872, "epoch": 2742} {"train_loss": -43.120819091796875, "global_step": 331873, "epoch": 2742} {"train_loss": -42.367889404296875, "global_step": 331874, "epoch": 2742} {"train_loss": -43.016971588134766, "global_step": 331875, "epoch": 2742} {"train_loss": -43.984100341796875, "global_step": 331876, "epoch": 2742} {"train_loss": -42.851314544677734, "global_step": 331877, "epoch": 2742} {"train_loss": -42.704986572265625, "global_step": 331878, "epoch": 2742} {"train_loss": -42.76117706298828, "global_step": 331879, "epoch": 2742} {"train_loss": -43.34076690673828, "global_step": 331880, "epoch": 2742} {"train_loss": -44.72022247314453, "global_step": 331881, "epoch": 2742} {"train_loss": -44.048927307128906, "global_step": 331882, "epoch": 2742} {"train_loss": -44.19208908081055, "global_step": 331883, "epoch": 2742} {"train_loss": -43.56349563598633, "global_step": 331884, "epoch": 2742} {"train_loss": -43.5554084777832, "global_step": 331885, "epoch": 2742} {"train_loss": -43.66705322265625, "global_step": 331886, "epoch": 2742} {"train_loss": -44.21354293823242, "global_step": 331887, "epoch": 2742} {"train_loss": -43.986202239990234, "global_step": 331888, "epoch": 2742} {"train_loss": -43.61090087890625, "global_step": 331889, "epoch": 2742} {"train_loss": -44.85011672973633, "global_step": 331890, "epoch": 2742} {"train_loss": -44.241790771484375, "global_step": 331891, "epoch": 2742} {"train_loss": -44.64384841918945, "global_step": 331892, "epoch": 2742} {"train_loss": -43.80302047729492, "global_step": 331893, "epoch": 2742} {"train_loss": -44.09896469116211, "global_step": 331894, "epoch": 2742} {"train_loss": -44.62006759643555, "global_step": 331895, "epoch": 2742} {"train_loss": -44.55756759643555, "global_step": 331896, "epoch": 2742} {"train_loss": -44.124385833740234, "global_step": 331897, "epoch": 2742} {"train_loss": -44.54844284057617, "global_step": 331898, "epoch": 2742} {"train_loss": -43.6227912902832, "global_step": 331899, "epoch": 2742} {"train_loss": -43.781158447265625, "global_step": 331900, "epoch": 2742} {"train_loss": -43.84092330932617, "global_step": 331901, "epoch": 2742} {"train_loss": -43.88920627940785, "global_step": 331902, "epoch": 2742, "val_loss": 2564969.0} {"train_loss": -43.950286865234375, "global_step": 331903, "epoch": 2743} {"train_loss": -44.365509033203125, "global_step": 331904, "epoch": 2743} {"train_loss": -43.933162689208984, "global_step": 331905, "epoch": 2743} {"train_loss": -44.650508880615234, "global_step": 331906, "epoch": 2743} {"train_loss": -43.999141693115234, "global_step": 331907, "epoch": 2743} {"train_loss": -43.219844818115234, "global_step": 331908, "epoch": 2743} {"train_loss": -44.76582717895508, "global_step": 331909, "epoch": 2743} {"train_loss": -43.90977096557617, "global_step": 331910, "epoch": 2743} {"train_loss": -42.52817916870117, "global_step": 331911, "epoch": 2743} {"train_loss": -44.47445297241211, "global_step": 331912, "epoch": 2743} {"train_loss": -43.552642822265625, "global_step": 331913, "epoch": 2743} {"train_loss": -43.565975189208984, "global_step": 331914, "epoch": 2743} {"train_loss": -42.87102127075195, "global_step": 331915, "epoch": 2743} {"train_loss": -44.29362869262695, "global_step": 331916, "epoch": 2743} {"train_loss": -43.657623291015625, "global_step": 331917, "epoch": 2743} {"train_loss": -44.34784698486328, "global_step": 331918, "epoch": 2743} {"train_loss": -42.26557540893555, "global_step": 331919, "epoch": 2743} {"train_loss": -43.90876770019531, "global_step": 331920, "epoch": 2743} {"train_loss": -44.52888870239258, "global_step": 331921, "epoch": 2743} {"train_loss": -43.61738204956055, "global_step": 331922, "epoch": 2743} {"train_loss": -43.794219970703125, "global_step": 331923, "epoch": 2743} {"train_loss": -44.24576187133789, "global_step": 331924, "epoch": 2743} {"train_loss": -43.43666458129883, "global_step": 331925, "epoch": 2743} {"train_loss": -43.899322509765625, "global_step": 331926, "epoch": 2743} {"train_loss": -44.09306335449219, "global_step": 331927, "epoch": 2743} {"train_loss": -43.326019287109375, "global_step": 331928, "epoch": 2743} {"train_loss": -44.436580657958984, "global_step": 331929, "epoch": 2743} {"train_loss": -44.70484161376953, "global_step": 331930, "epoch": 2743} {"train_loss": -42.851593017578125, "global_step": 331931, "epoch": 2743} {"train_loss": -44.8938102722168, "global_step": 331932, "epoch": 2743} {"train_loss": -44.06581115722656, "global_step": 331933, "epoch": 2743} {"train_loss": -43.003578186035156, "global_step": 331934, "epoch": 2743} {"train_loss": -44.2351188659668, "global_step": 331935, "epoch": 2743} {"train_loss": -42.68737030029297, "global_step": 331936, "epoch": 2743} {"train_loss": -42.791725158691406, "global_step": 331937, "epoch": 2743} {"train_loss": -43.50260543823242, "global_step": 331938, "epoch": 2743} {"train_loss": -43.72137451171875, "global_step": 331939, "epoch": 2743} {"train_loss": -42.51184844970703, "global_step": 331940, "epoch": 2743} {"train_loss": -43.839778900146484, "global_step": 331941, "epoch": 2743} {"train_loss": -41.595130920410156, "global_step": 331942, "epoch": 2743} {"train_loss": -41.13315963745117, "global_step": 331943, "epoch": 2743} {"train_loss": -41.05484390258789, "global_step": 331944, "epoch": 2743} {"train_loss": -43.944339752197266, "global_step": 331945, "epoch": 2743} {"train_loss": -41.12678146362305, "global_step": 331946, "epoch": 2743} {"train_loss": -40.633358001708984, "global_step": 331947, "epoch": 2743} {"train_loss": -44.07130432128906, "global_step": 331948, "epoch": 2743} {"train_loss": -41.48114013671875, "global_step": 331949, "epoch": 2743} {"train_loss": -43.05100631713867, "global_step": 331950, "epoch": 2743} {"train_loss": -43.505191802978516, "global_step": 331951, "epoch": 2743} {"train_loss": -42.73613357543945, "global_step": 331952, "epoch": 2743} {"train_loss": -42.208045959472656, "global_step": 331953, "epoch": 2743} {"train_loss": -43.52937698364258, "global_step": 331954, "epoch": 2743} {"train_loss": -42.76113510131836, "global_step": 331955, "epoch": 2743} {"train_loss": -42.708168029785156, "global_step": 331956, "epoch": 2743} {"train_loss": -42.27495193481445, "global_step": 331957, "epoch": 2743} {"train_loss": -43.37826156616211, "global_step": 331958, "epoch": 2743} {"train_loss": -41.920562744140625, "global_step": 331959, "epoch": 2743} {"train_loss": -42.684417724609375, "global_step": 331960, "epoch": 2743} {"train_loss": -42.31734085083008, "global_step": 331961, "epoch": 2743} {"train_loss": -41.8440055847168, "global_step": 331962, "epoch": 2743} {"train_loss": -43.92231369018555, "global_step": 331963, "epoch": 2743} {"train_loss": -42.100467681884766, "global_step": 331964, "epoch": 2743} {"train_loss": -43.37306213378906, "global_step": 331965, "epoch": 2743} {"train_loss": -43.10823440551758, "global_step": 331966, "epoch": 2743} {"train_loss": -43.23119354248047, "global_step": 331967, "epoch": 2743} {"train_loss": -42.80010986328125, "global_step": 331968, "epoch": 2743} {"train_loss": -43.834075927734375, "global_step": 331969, "epoch": 2743} {"train_loss": -43.03483963012695, "global_step": 331970, "epoch": 2743} {"train_loss": -43.39372253417969, "global_step": 331971, "epoch": 2743} {"train_loss": -42.78263473510742, "global_step": 331972, "epoch": 2743} {"train_loss": -43.515743255615234, "global_step": 331973, "epoch": 2743} {"train_loss": -43.13285446166992, "global_step": 331974, "epoch": 2743} {"train_loss": -43.425254821777344, "global_step": 331975, "epoch": 2743} {"train_loss": -43.97898483276367, "global_step": 331976, "epoch": 2743} {"train_loss": -43.35879135131836, "global_step": 331977, "epoch": 2743} {"train_loss": -43.79814147949219, "global_step": 331978, "epoch": 2743} {"train_loss": -43.57007598876953, "global_step": 331979, "epoch": 2743} {"train_loss": -43.79603576660156, "global_step": 331980, "epoch": 2743} {"train_loss": -43.32712936401367, "global_step": 331981, "epoch": 2743} {"train_loss": -43.75437545776367, "global_step": 331982, "epoch": 2743} {"train_loss": -43.89487838745117, "global_step": 331983, "epoch": 2743} {"train_loss": -43.524288177490234, "global_step": 331984, "epoch": 2743} {"train_loss": -43.304012298583984, "global_step": 331985, "epoch": 2743} {"train_loss": -43.693328857421875, "global_step": 331986, "epoch": 2743} {"train_loss": -43.627803802490234, "global_step": 331987, "epoch": 2743} {"train_loss": -43.804466247558594, "global_step": 331988, "epoch": 2743} {"train_loss": -44.16872787475586, "global_step": 331989, "epoch": 2743} {"train_loss": -42.99711990356445, "global_step": 331990, "epoch": 2743} {"train_loss": -44.44447708129883, "global_step": 331991, "epoch": 2743} {"train_loss": -42.655086517333984, "global_step": 331992, "epoch": 2743} {"train_loss": -44.12193298339844, "global_step": 331993, "epoch": 2743} {"train_loss": -43.634822845458984, "global_step": 331994, "epoch": 2743} {"train_loss": -43.33112716674805, "global_step": 331995, "epoch": 2743} {"train_loss": -44.386192321777344, "global_step": 331996, "epoch": 2743} {"train_loss": -42.4743537902832, "global_step": 331997, "epoch": 2743} {"train_loss": -43.839576721191406, "global_step": 331998, "epoch": 2743} {"train_loss": -42.18565368652344, "global_step": 331999, "epoch": 2743} {"train_loss": -43.76385498046875, "global_step": 332000, "epoch": 2743} {"train_loss": -43.0145263671875, "global_step": 332001, "epoch": 2743} {"train_loss": -44.08993148803711, "global_step": 332002, "epoch": 2743} {"train_loss": -42.8294792175293, "global_step": 332003, "epoch": 2743} {"train_loss": -43.7381477355957, "global_step": 332004, "epoch": 2743} {"train_loss": -44.039405822753906, "global_step": 332005, "epoch": 2743} {"train_loss": -44.113216400146484, "global_step": 332006, "epoch": 2743} {"train_loss": -44.5736083984375, "global_step": 332007, "epoch": 2743} {"train_loss": -44.222591400146484, "global_step": 332008, "epoch": 2743} {"train_loss": -44.224334716796875, "global_step": 332009, "epoch": 2743} {"train_loss": -43.838741302490234, "global_step": 332010, "epoch": 2743} {"train_loss": -44.86994171142578, "global_step": 332011, "epoch": 2743} {"train_loss": -44.0970573425293, "global_step": 332012, "epoch": 2743} {"train_loss": -44.3076171875, "global_step": 332013, "epoch": 2743} {"train_loss": -44.34008026123047, "global_step": 332014, "epoch": 2743} {"train_loss": -44.66063690185547, "global_step": 332015, "epoch": 2743} {"train_loss": -44.47423553466797, "global_step": 332016, "epoch": 2743} {"train_loss": -44.36271286010742, "global_step": 332017, "epoch": 2743} {"train_loss": -45.0176887512207, "global_step": 332018, "epoch": 2743} {"train_loss": -44.319244384765625, "global_step": 332019, "epoch": 2743} {"train_loss": -44.45743179321289, "global_step": 332020, "epoch": 2743} {"train_loss": -44.28774642944336, "global_step": 332021, "epoch": 2743} {"train_loss": -44.48484420776367, "global_step": 332022, "epoch": 2743} {"train_loss": -43.506849683020725, "global_step": 332023, "epoch": 2743, "val_loss": 2495655.75} {"train_loss": -44.8716926574707, "global_step": 332024, "epoch": 2744} {"train_loss": -45.269996643066406, "global_step": 332025, "epoch": 2744} {"train_loss": -44.320526123046875, "global_step": 332026, "epoch": 2744} {"train_loss": -44.40422821044922, "global_step": 332027, "epoch": 2744} {"train_loss": -44.693721771240234, "global_step": 332028, "epoch": 2744} {"train_loss": -44.48744201660156, "global_step": 332029, "epoch": 2744} {"train_loss": -44.253204345703125, "global_step": 332030, "epoch": 2744} {"train_loss": -44.963680267333984, "global_step": 332031, "epoch": 2744} {"train_loss": -44.71405792236328, "global_step": 332032, "epoch": 2744} {"train_loss": -43.899925231933594, "global_step": 332033, "epoch": 2744} {"train_loss": -44.76986312866211, "global_step": 332034, "epoch": 2744} {"train_loss": -44.3310661315918, "global_step": 332035, "epoch": 2744} {"train_loss": -43.69936752319336, "global_step": 332036, "epoch": 2744} {"train_loss": -44.0426139831543, "global_step": 332037, "epoch": 2744} {"train_loss": -44.35934066772461, "global_step": 332038, "epoch": 2744} {"train_loss": -44.38645935058594, "global_step": 332039, "epoch": 2744} {"train_loss": -43.6513671875, "global_step": 332040, "epoch": 2744} {"train_loss": -44.286006927490234, "global_step": 332041, "epoch": 2744} {"train_loss": -44.85716247558594, "global_step": 332042, "epoch": 2744} {"train_loss": -44.20906448364258, "global_step": 332043, "epoch": 2744} {"train_loss": -44.22492599487305, "global_step": 332044, "epoch": 2744} {"train_loss": -44.35730743408203, "global_step": 332045, "epoch": 2744} {"train_loss": -44.196590423583984, "global_step": 332046, "epoch": 2744} {"train_loss": -44.623653411865234, "global_step": 332047, "epoch": 2744} {"train_loss": -43.73189926147461, "global_step": 332048, "epoch": 2744} {"train_loss": -43.68516159057617, "global_step": 332049, "epoch": 2744} {"train_loss": -44.60261535644531, "global_step": 332050, "epoch": 2744} {"train_loss": -44.272308349609375, "global_step": 332051, "epoch": 2744} {"train_loss": -42.654518127441406, "global_step": 332052, "epoch": 2744} {"train_loss": -43.69429397583008, "global_step": 332053, "epoch": 2744} {"train_loss": -44.102291107177734, "global_step": 332054, "epoch": 2744} {"train_loss": -44.448116302490234, "global_step": 332055, "epoch": 2744} {"train_loss": -43.1790885925293, "global_step": 332056, "epoch": 2744} {"train_loss": -43.6396369934082, "global_step": 332057, "epoch": 2744} {"train_loss": -43.78888702392578, "global_step": 332058, "epoch": 2744} {"train_loss": -44.14680099487305, "global_step": 332059, "epoch": 2744} {"train_loss": -42.98250198364258, "global_step": 332060, "epoch": 2744} {"train_loss": -43.35879135131836, "global_step": 332061, "epoch": 2744} {"train_loss": -45.00234603881836, "global_step": 332062, "epoch": 2744} {"train_loss": -44.01133728027344, "global_step": 332063, "epoch": 2744} {"train_loss": -43.71307373046875, "global_step": 332064, "epoch": 2744} {"train_loss": -43.75077819824219, "global_step": 332065, "epoch": 2744} {"train_loss": -44.272674560546875, "global_step": 332066, "epoch": 2744} {"train_loss": -43.79345703125, "global_step": 332067, "epoch": 2744} {"train_loss": -43.440303802490234, "global_step": 332068, "epoch": 2744} {"train_loss": -43.00912094116211, "global_step": 332069, "epoch": 2744} {"train_loss": -43.45136260986328, "global_step": 332070, "epoch": 2744} {"train_loss": -44.07862854003906, "global_step": 332071, "epoch": 2744} {"train_loss": -43.420475006103516, "global_step": 332072, "epoch": 2744} {"train_loss": -41.573760986328125, "global_step": 332073, "epoch": 2744} {"train_loss": -42.713623046875, "global_step": 332074, "epoch": 2744} {"train_loss": -44.100563049316406, "global_step": 332075, "epoch": 2744} {"train_loss": -42.57769775390625, "global_step": 332076, "epoch": 2744} {"train_loss": -43.44624710083008, "global_step": 332077, "epoch": 2744} {"train_loss": -43.58692169189453, "global_step": 332078, "epoch": 2744} {"train_loss": -43.35340118408203, "global_step": 332079, "epoch": 2744} {"train_loss": -44.52724075317383, "global_step": 332080, "epoch": 2744} {"train_loss": -43.259864807128906, "global_step": 332081, "epoch": 2744} {"train_loss": -43.50516891479492, "global_step": 332082, "epoch": 2744} {"train_loss": -44.44581985473633, "global_step": 332083, "epoch": 2744} {"train_loss": -44.01072311401367, "global_step": 332084, "epoch": 2744} {"train_loss": -44.34109115600586, "global_step": 332085, "epoch": 2744} {"train_loss": -44.28934860229492, "global_step": 332086, "epoch": 2744} {"train_loss": -44.1771125793457, "global_step": 332087, "epoch": 2744} {"train_loss": -44.23875045776367, "global_step": 332088, "epoch": 2744} {"train_loss": -44.860530853271484, "global_step": 332089, "epoch": 2744} {"train_loss": -44.63582992553711, "global_step": 332090, "epoch": 2744} {"train_loss": -44.37303924560547, "global_step": 332091, "epoch": 2744} {"train_loss": -44.324737548828125, "global_step": 332092, "epoch": 2744} {"train_loss": -44.74263381958008, "global_step": 332093, "epoch": 2744} {"train_loss": -44.77432632446289, "global_step": 332094, "epoch": 2744} {"train_loss": -44.15108871459961, "global_step": 332095, "epoch": 2744} {"train_loss": -45.1508903503418, "global_step": 332096, "epoch": 2744} {"train_loss": -44.797096252441406, "global_step": 332097, "epoch": 2744} {"train_loss": -44.29564666748047, "global_step": 332098, "epoch": 2744} {"train_loss": -45.0474739074707, "global_step": 332099, "epoch": 2744} {"train_loss": -45.0031852722168, "global_step": 332100, "epoch": 2744} {"train_loss": -44.971553802490234, "global_step": 332101, "epoch": 2744} {"train_loss": -45.06882858276367, "global_step": 332102, "epoch": 2744} {"train_loss": -44.769344329833984, "global_step": 332103, "epoch": 2744} {"train_loss": -44.75623321533203, "global_step": 332104, "epoch": 2744} {"train_loss": -45.30336380004883, "global_step": 332105, "epoch": 2744} {"train_loss": -45.1506233215332, "global_step": 332106, "epoch": 2744} {"train_loss": -45.23008346557617, "global_step": 332107, "epoch": 2744} {"train_loss": -44.84639358520508, "global_step": 332108, "epoch": 2744} {"train_loss": -45.457550048828125, "global_step": 332109, "epoch": 2744} {"train_loss": -45.44893264770508, "global_step": 332110, "epoch": 2744} {"train_loss": -43.94072341918945, "global_step": 332111, "epoch": 2744} {"train_loss": -44.89115524291992, "global_step": 332112, "epoch": 2744} {"train_loss": -45.19248962402344, "global_step": 332113, "epoch": 2744} {"train_loss": -45.3780632019043, "global_step": 332114, "epoch": 2744} {"train_loss": -45.1329345703125, "global_step": 332115, "epoch": 2744} {"train_loss": -44.77265548706055, "global_step": 332116, "epoch": 2744} {"train_loss": -45.5188102722168, "global_step": 332117, "epoch": 2744} {"train_loss": -45.45905685424805, "global_step": 332118, "epoch": 2744} {"train_loss": -44.558326721191406, "global_step": 332119, "epoch": 2744} {"train_loss": -44.0667724609375, "global_step": 332120, "epoch": 2744} {"train_loss": -45.211483001708984, "global_step": 332121, "epoch": 2744} {"train_loss": -45.6047477722168, "global_step": 332122, "epoch": 2744} {"train_loss": -44.42847442626953, "global_step": 332123, "epoch": 2744} {"train_loss": -44.15044403076172, "global_step": 332124, "epoch": 2744} {"train_loss": -45.332149505615234, "global_step": 332125, "epoch": 2744} {"train_loss": -45.08533477783203, "global_step": 332126, "epoch": 2744} {"train_loss": -44.73065185546875, "global_step": 332127, "epoch": 2744} {"train_loss": -43.85270690917969, "global_step": 332128, "epoch": 2744} {"train_loss": -43.50602340698242, "global_step": 332129, "epoch": 2744} {"train_loss": -43.992034912109375, "global_step": 332130, "epoch": 2744} {"train_loss": -43.972015380859375, "global_step": 332131, "epoch": 2744} {"train_loss": -44.2048225402832, "global_step": 332132, "epoch": 2744} {"train_loss": -44.120452880859375, "global_step": 332133, "epoch": 2744} {"train_loss": -44.77567672729492, "global_step": 332134, "epoch": 2744} {"train_loss": -44.335750579833984, "global_step": 332135, "epoch": 2744} {"train_loss": -44.190093994140625, "global_step": 332136, "epoch": 2744} {"train_loss": -44.785438537597656, "global_step": 332137, "epoch": 2744} {"train_loss": -44.5496826171875, "global_step": 332138, "epoch": 2744} {"train_loss": -44.4727668762207, "global_step": 332139, "epoch": 2744} {"train_loss": -45.21194076538086, "global_step": 332140, "epoch": 2744} {"train_loss": -44.62455368041992, "global_step": 332141, "epoch": 2744} {"train_loss": -45.27372360229492, "global_step": 332142, "epoch": 2744} {"train_loss": -44.81236267089844, "global_step": 332143, "epoch": 2744} {"train_loss": -44.33549326116388, "global_step": 332144, "epoch": 2744, "val_loss": 2503978.0} {"train_loss": -44.84088897705078, "global_step": 332145, "epoch": 2745} {"train_loss": -44.720558166503906, "global_step": 332146, "epoch": 2745} {"train_loss": -44.03879928588867, "global_step": 332147, "epoch": 2745} {"train_loss": -44.487220764160156, "global_step": 332148, "epoch": 2745} {"train_loss": -44.35342025756836, "global_step": 332149, "epoch": 2745} {"train_loss": -44.1568717956543, "global_step": 332150, "epoch": 2745} {"train_loss": -44.141883850097656, "global_step": 332151, "epoch": 2745} {"train_loss": -44.47195053100586, "global_step": 332152, "epoch": 2745} {"train_loss": -44.68635177612305, "global_step": 332153, "epoch": 2745} {"train_loss": -44.349609375, "global_step": 332154, "epoch": 2745} {"train_loss": -42.47695541381836, "global_step": 332155, "epoch": 2745} {"train_loss": -43.27936935424805, "global_step": 332156, "epoch": 2745} {"train_loss": -43.16099548339844, "global_step": 332157, "epoch": 2745} {"train_loss": -43.04386901855469, "global_step": 332158, "epoch": 2745} {"train_loss": -42.58370590209961, "global_step": 332159, "epoch": 2745} {"train_loss": -43.26167297363281, "global_step": 332160, "epoch": 2745} {"train_loss": -44.12968063354492, "global_step": 332161, "epoch": 2745} {"train_loss": -42.688533782958984, "global_step": 332162, "epoch": 2745} {"train_loss": -44.062660217285156, "global_step": 332163, "epoch": 2745} {"train_loss": -44.72282028198242, "global_step": 332164, "epoch": 2745} {"train_loss": -45.039466857910156, "global_step": 332165, "epoch": 2745} {"train_loss": -44.643463134765625, "global_step": 332166, "epoch": 2745} {"train_loss": -43.31446075439453, "global_step": 332167, "epoch": 2745} {"train_loss": -44.35268783569336, "global_step": 332168, "epoch": 2745} {"train_loss": -44.65196228027344, "global_step": 332169, "epoch": 2745} {"train_loss": -44.16374969482422, "global_step": 332170, "epoch": 2745} {"train_loss": -44.79058837890625, "global_step": 332171, "epoch": 2745} {"train_loss": -44.5434455871582, "global_step": 332172, "epoch": 2745} {"train_loss": -44.103851318359375, "global_step": 332173, "epoch": 2745} {"train_loss": -44.74123764038086, "global_step": 332174, "epoch": 2745} {"train_loss": -43.943092346191406, "global_step": 332175, "epoch": 2745} {"train_loss": -44.46311569213867, "global_step": 332176, "epoch": 2745} {"train_loss": -44.43951416015625, "global_step": 332177, "epoch": 2745} {"train_loss": -43.71023178100586, "global_step": 332178, "epoch": 2745} {"train_loss": -40.91140365600586, "global_step": 332179, "epoch": 2745} {"train_loss": -41.856727600097656, "global_step": 332180, "epoch": 2745} {"train_loss": -42.048465728759766, "global_step": 332181, "epoch": 2745} {"train_loss": -44.35185623168945, "global_step": 332182, "epoch": 2745} {"train_loss": -42.66498947143555, "global_step": 332183, "epoch": 2745} {"train_loss": -42.412811279296875, "global_step": 332184, "epoch": 2745} {"train_loss": -41.038692474365234, "global_step": 332185, "epoch": 2745} {"train_loss": -41.179988861083984, "global_step": 332186, "epoch": 2745} {"train_loss": -41.59647750854492, "global_step": 332187, "epoch": 2745} {"train_loss": -43.09663009643555, "global_step": 332188, "epoch": 2745} {"train_loss": -42.9215087890625, "global_step": 332189, "epoch": 2745} {"train_loss": -40.58642578125, "global_step": 332190, "epoch": 2745} {"train_loss": -43.828590393066406, "global_step": 332191, "epoch": 2745} {"train_loss": -42.258644104003906, "global_step": 332192, "epoch": 2745} {"train_loss": -41.71224594116211, "global_step": 332193, "epoch": 2745} {"train_loss": -43.86056137084961, "global_step": 332194, "epoch": 2745} {"train_loss": -39.72953414916992, "global_step": 332195, "epoch": 2745} {"train_loss": -41.24050521850586, "global_step": 332196, "epoch": 2745} {"train_loss": -43.69749450683594, "global_step": 332197, "epoch": 2745} {"train_loss": -41.616641998291016, "global_step": 332198, "epoch": 2745} {"train_loss": -42.52659606933594, "global_step": 332199, "epoch": 2745} {"train_loss": -42.722076416015625, "global_step": 332200, "epoch": 2745} {"train_loss": -41.024139404296875, "global_step": 332201, "epoch": 2745} {"train_loss": -43.237831115722656, "global_step": 332202, "epoch": 2745} {"train_loss": -43.07130432128906, "global_step": 332203, "epoch": 2745} {"train_loss": -42.617530822753906, "global_step": 332204, "epoch": 2745} {"train_loss": -43.64767074584961, "global_step": 332205, "epoch": 2745} {"train_loss": -43.2614631652832, "global_step": 332206, "epoch": 2745} {"train_loss": -42.952239990234375, "global_step": 332207, "epoch": 2745} {"train_loss": -43.938995361328125, "global_step": 332208, "epoch": 2745} {"train_loss": -42.56856918334961, "global_step": 332209, "epoch": 2745} {"train_loss": -43.990779876708984, "global_step": 332210, "epoch": 2745} {"train_loss": -43.142921447753906, "global_step": 332211, "epoch": 2745} {"train_loss": -43.8519401550293, "global_step": 332212, "epoch": 2745} {"train_loss": -43.30585479736328, "global_step": 332213, "epoch": 2745} {"train_loss": -42.67119598388672, "global_step": 332214, "epoch": 2745} {"train_loss": -43.76831817626953, "global_step": 332215, "epoch": 2745} {"train_loss": -42.2423210144043, "global_step": 332216, "epoch": 2745} {"train_loss": -43.48096466064453, "global_step": 332217, "epoch": 2745} {"train_loss": -42.494747161865234, "global_step": 332218, "epoch": 2745} {"train_loss": -43.20386505126953, "global_step": 332219, "epoch": 2745} {"train_loss": -43.083824157714844, "global_step": 332220, "epoch": 2745} {"train_loss": -43.75144577026367, "global_step": 332221, "epoch": 2745} {"train_loss": -43.882110595703125, "global_step": 332222, "epoch": 2745} {"train_loss": -43.62144088745117, "global_step": 332223, "epoch": 2745} {"train_loss": -44.40767288208008, "global_step": 332224, "epoch": 2745} {"train_loss": -43.394264221191406, "global_step": 332225, "epoch": 2745} {"train_loss": -44.10885238647461, "global_step": 332226, "epoch": 2745} {"train_loss": -44.34052276611328, "global_step": 332227, "epoch": 2745} {"train_loss": -43.565521240234375, "global_step": 332228, "epoch": 2745} {"train_loss": -43.146053314208984, "global_step": 332229, "epoch": 2745} {"train_loss": -43.66806411743164, "global_step": 332230, "epoch": 2745} {"train_loss": -43.41619873046875, "global_step": 332231, "epoch": 2745} {"train_loss": -44.167747497558594, "global_step": 332232, "epoch": 2745} {"train_loss": -43.87380599975586, "global_step": 332233, "epoch": 2745} {"train_loss": -43.49578857421875, "global_step": 332234, "epoch": 2745} {"train_loss": -43.880104064941406, "global_step": 332235, "epoch": 2745} {"train_loss": -44.24867630004883, "global_step": 332236, "epoch": 2745} {"train_loss": -42.71122360229492, "global_step": 332237, "epoch": 2745} {"train_loss": -44.290950775146484, "global_step": 332238, "epoch": 2745} {"train_loss": -43.5108757019043, "global_step": 332239, "epoch": 2745} {"train_loss": -43.448028564453125, "global_step": 332240, "epoch": 2745} {"train_loss": -43.2650260925293, "global_step": 332241, "epoch": 2745} {"train_loss": -43.258338928222656, "global_step": 332242, "epoch": 2745} {"train_loss": -44.132484436035156, "global_step": 332243, "epoch": 2745} {"train_loss": -43.750205993652344, "global_step": 332244, "epoch": 2745} {"train_loss": -43.045013427734375, "global_step": 332245, "epoch": 2745} {"train_loss": -43.84981918334961, "global_step": 332246, "epoch": 2745} {"train_loss": -43.086219787597656, "global_step": 332247, "epoch": 2745} {"train_loss": -43.882057189941406, "global_step": 332248, "epoch": 2745} {"train_loss": -42.935245513916016, "global_step": 332249, "epoch": 2745} {"train_loss": -43.464630126953125, "global_step": 332250, "epoch": 2745} {"train_loss": -43.83211898803711, "global_step": 332251, "epoch": 2745} {"train_loss": -42.61227035522461, "global_step": 332252, "epoch": 2745} {"train_loss": -43.71022415161133, "global_step": 332253, "epoch": 2745} {"train_loss": -41.89718246459961, "global_step": 332254, "epoch": 2745} {"train_loss": -44.442142486572266, "global_step": 332255, "epoch": 2745} {"train_loss": -42.872615814208984, "global_step": 332256, "epoch": 2745} {"train_loss": -43.56930923461914, "global_step": 332257, "epoch": 2745} {"train_loss": -44.13926315307617, "global_step": 332258, "epoch": 2745} {"train_loss": -43.637489318847656, "global_step": 332259, "epoch": 2745} {"train_loss": -44.379459381103516, "global_step": 332260, "epoch": 2745} {"train_loss": -43.74071502685547, "global_step": 332261, "epoch": 2745} {"train_loss": -44.51093292236328, "global_step": 332262, "epoch": 2745} {"train_loss": -44.92148971557617, "global_step": 332263, "epoch": 2745} {"train_loss": -45.03691482543945, "global_step": 332264, "epoch": 2745} {"train_loss": -43.431258682377084, "global_step": 332265, "epoch": 2745, "val_loss": 2549108.25} {"train_loss": -44.95284652709961, "global_step": 332266, "epoch": 2746} {"train_loss": -44.90635299682617, "global_step": 332267, "epoch": 2746} {"train_loss": -44.9104118347168, "global_step": 332268, "epoch": 2746} {"train_loss": -44.71772384643555, "global_step": 332269, "epoch": 2746} {"train_loss": -45.02585983276367, "global_step": 332270, "epoch": 2746} {"train_loss": -44.6944580078125, "global_step": 332271, "epoch": 2746} {"train_loss": -44.729122161865234, "global_step": 332272, "epoch": 2746} {"train_loss": -45.38690948486328, "global_step": 332273, "epoch": 2746} {"train_loss": -44.81696319580078, "global_step": 332274, "epoch": 2746} {"train_loss": -45.27239990234375, "global_step": 332275, "epoch": 2746} {"train_loss": -45.42556381225586, "global_step": 332276, "epoch": 2746} {"train_loss": -45.3055534362793, "global_step": 332277, "epoch": 2746} {"train_loss": -43.452701568603516, "global_step": 332278, "epoch": 2746} {"train_loss": -45.369873046875, "global_step": 332279, "epoch": 2746} {"train_loss": -45.14825439453125, "global_step": 332280, "epoch": 2746} {"train_loss": -45.32491683959961, "global_step": 332281, "epoch": 2746} {"train_loss": -45.2678337097168, "global_step": 332282, "epoch": 2746} {"train_loss": -45.68447494506836, "global_step": 332283, "epoch": 2746} {"train_loss": -45.39248275756836, "global_step": 332284, "epoch": 2746} {"train_loss": -45.571250915527344, "global_step": 332285, "epoch": 2746} {"train_loss": -45.75211715698242, "global_step": 332286, "epoch": 2746} {"train_loss": -45.337188720703125, "global_step": 332287, "epoch": 2746} {"train_loss": -45.224308013916016, "global_step": 332288, "epoch": 2746} {"train_loss": -45.292537689208984, "global_step": 332289, "epoch": 2746} {"train_loss": -45.48896026611328, "global_step": 332290, "epoch": 2746} {"train_loss": -45.809513092041016, "global_step": 332291, "epoch": 2746} {"train_loss": -45.55717086791992, "global_step": 332292, "epoch": 2746} {"train_loss": -45.38442611694336, "global_step": 332293, "epoch": 2746} {"train_loss": -45.503814697265625, "global_step": 332294, "epoch": 2746} {"train_loss": -44.96854782104492, "global_step": 332295, "epoch": 2746} {"train_loss": -45.40327072143555, "global_step": 332296, "epoch": 2746} {"train_loss": -45.46494674682617, "global_step": 332297, "epoch": 2746} {"train_loss": -45.59480285644531, "global_step": 332298, "epoch": 2746} {"train_loss": -45.17892074584961, "global_step": 332299, "epoch": 2746} {"train_loss": -45.76420974731445, "global_step": 332300, "epoch": 2746} {"train_loss": -46.12734603881836, "global_step": 332301, "epoch": 2746} {"train_loss": -45.339603424072266, "global_step": 332302, "epoch": 2746} {"train_loss": -45.210567474365234, "global_step": 332303, "epoch": 2746} {"train_loss": -45.9856071472168, "global_step": 332304, "epoch": 2746} {"train_loss": -45.669464111328125, "global_step": 332305, "epoch": 2746} {"train_loss": -45.116310119628906, "global_step": 332306, "epoch": 2746} {"train_loss": -45.23820877075195, "global_step": 332307, "epoch": 2746} {"train_loss": -45.62981033325195, "global_step": 332308, "epoch": 2746} {"train_loss": -45.56996536254883, "global_step": 332309, "epoch": 2746} {"train_loss": -45.434669494628906, "global_step": 332310, "epoch": 2746} {"train_loss": -44.63917922973633, "global_step": 332311, "epoch": 2746} {"train_loss": -44.26031494140625, "global_step": 332312, "epoch": 2746} {"train_loss": -44.53959655761719, "global_step": 332313, "epoch": 2746} {"train_loss": -45.468563079833984, "global_step": 332314, "epoch": 2746} {"train_loss": -44.751319885253906, "global_step": 332315, "epoch": 2746} {"train_loss": -44.7761344909668, "global_step": 332316, "epoch": 2746} {"train_loss": -44.474945068359375, "global_step": 332317, "epoch": 2746} {"train_loss": -45.1959228515625, "global_step": 332318, "epoch": 2746} {"train_loss": -44.94329833984375, "global_step": 332319, "epoch": 2746} {"train_loss": -44.79106521606445, "global_step": 332320, "epoch": 2746} {"train_loss": -45.457759857177734, "global_step": 332321, "epoch": 2746} {"train_loss": -45.05644607543945, "global_step": 332322, "epoch": 2746} {"train_loss": -45.185333251953125, "global_step": 332323, "epoch": 2746} {"train_loss": -45.23970413208008, "global_step": 332324, "epoch": 2746} {"train_loss": -44.14591598510742, "global_step": 332325, "epoch": 2746} {"train_loss": -43.00034713745117, "global_step": 332326, "epoch": 2746} {"train_loss": -41.7514762878418, "global_step": 332327, "epoch": 2746} {"train_loss": -38.80165481567383, "global_step": 332328, "epoch": 2746} {"train_loss": -38.46541213989258, "global_step": 332329, "epoch": 2746} {"train_loss": -32.02849197387695, "global_step": 332330, "epoch": 2746} {"train_loss": -32.57816696166992, "global_step": 332331, "epoch": 2746} {"train_loss": 4.714444637298584, "global_step": 332332, "epoch": 2746} {"train_loss": -22.351831436157227, "global_step": 332333, "epoch": 2746} {"train_loss": -25.378299713134766, "global_step": 332334, "epoch": 2746} {"train_loss": -11.920807838439941, "global_step": 332335, "epoch": 2746} {"train_loss": -24.891637802124023, "global_step": 332336, "epoch": 2746} {"train_loss": -20.18128776550293, "global_step": 332337, "epoch": 2746} {"train_loss": -13.666356086730957, "global_step": 332338, "epoch": 2746} {"train_loss": -30.880598068237305, "global_step": 332339, "epoch": 2746} {"train_loss": -29.176069259643555, "global_step": 332340, "epoch": 2746} {"train_loss": -24.96558952331543, "global_step": 332341, "epoch": 2746} {"train_loss": -28.145185470581055, "global_step": 332342, "epoch": 2746} {"train_loss": -26.244821548461914, "global_step": 332343, "epoch": 2746} {"train_loss": -34.048831939697266, "global_step": 332344, "epoch": 2746} {"train_loss": -37.00568771362305, "global_step": 332345, "epoch": 2746} {"train_loss": -34.17206954956055, "global_step": 332346, "epoch": 2746} {"train_loss": -34.91321563720703, "global_step": 332347, "epoch": 2746} {"train_loss": -34.71432113647461, "global_step": 332348, "epoch": 2746} {"train_loss": -36.61469650268555, "global_step": 332349, "epoch": 2746} {"train_loss": -37.183837890625, "global_step": 332350, "epoch": 2746} {"train_loss": -36.66622543334961, "global_step": 332351, "epoch": 2746} {"train_loss": -38.544822692871094, "global_step": 332352, "epoch": 2746} {"train_loss": -37.196022033691406, "global_step": 332353, "epoch": 2746} {"train_loss": -37.9107780456543, "global_step": 332354, "epoch": 2746} {"train_loss": -38.3386344909668, "global_step": 332355, "epoch": 2746} {"train_loss": -38.999324798583984, "global_step": 332356, "epoch": 2746} {"train_loss": -39.40873336791992, "global_step": 332357, "epoch": 2746} {"train_loss": -39.656612396240234, "global_step": 332358, "epoch": 2746} {"train_loss": -38.86103439331055, "global_step": 332359, "epoch": 2746} {"train_loss": -39.73765182495117, "global_step": 332360, "epoch": 2746} {"train_loss": -40.35465621948242, "global_step": 332361, "epoch": 2746} {"train_loss": -39.304595947265625, "global_step": 332362, "epoch": 2746} {"train_loss": -39.88663101196289, "global_step": 332363, "epoch": 2746} {"train_loss": -40.33069610595703, "global_step": 332364, "epoch": 2746} {"train_loss": -40.665489196777344, "global_step": 332365, "epoch": 2746} {"train_loss": -40.91343307495117, "global_step": 332366, "epoch": 2746} {"train_loss": -40.64046859741211, "global_step": 332367, "epoch": 2746} {"train_loss": -40.48786544799805, "global_step": 332368, "epoch": 2746} {"train_loss": -40.447486877441406, "global_step": 332369, "epoch": 2746} {"train_loss": -41.00859451293945, "global_step": 332370, "epoch": 2746} {"train_loss": -40.909725189208984, "global_step": 332371, "epoch": 2746} {"train_loss": -41.27039337158203, "global_step": 332372, "epoch": 2746} {"train_loss": -41.050636291503906, "global_step": 332373, "epoch": 2746} {"train_loss": -41.20641326904297, "global_step": 332374, "epoch": 2746} {"train_loss": -41.43476486206055, "global_step": 332375, "epoch": 2746} {"train_loss": -41.285858154296875, "global_step": 332376, "epoch": 2746} {"train_loss": -41.33632278442383, "global_step": 332377, "epoch": 2746} {"train_loss": -41.937957763671875, "global_step": 332378, "epoch": 2746} {"train_loss": -41.587257385253906, "global_step": 332379, "epoch": 2746} {"train_loss": -41.482723236083984, "global_step": 332380, "epoch": 2746} {"train_loss": -41.993595123291016, "global_step": 332381, "epoch": 2746} {"train_loss": -42.1844482421875, "global_step": 332382, "epoch": 2746} {"train_loss": -41.70917892456055, "global_step": 332383, "epoch": 2746} {"train_loss": -42.09194564819336, "global_step": 332384, "epoch": 2746} {"train_loss": -41.89753341674805, "global_step": 332385, "epoch": 2746} {"train_loss": -40.4509487664404, "global_step": 332386, "epoch": 2746, "val_loss": 2362770.0} {"train_loss": -42.22541046142578, "global_step": 332387, "epoch": 2747} {"train_loss": -42.018070220947266, "global_step": 332388, "epoch": 2747} {"train_loss": -41.865413665771484, "global_step": 332389, "epoch": 2747} {"train_loss": -42.18740463256836, "global_step": 332390, "epoch": 2747} {"train_loss": -42.480987548828125, "global_step": 332391, "epoch": 2747} {"train_loss": -41.890193939208984, "global_step": 332392, "epoch": 2747} {"train_loss": -41.7623176574707, "global_step": 332393, "epoch": 2747} {"train_loss": -42.560176849365234, "global_step": 332394, "epoch": 2747} {"train_loss": -42.40842819213867, "global_step": 332395, "epoch": 2747} {"train_loss": -42.38888168334961, "global_step": 332396, "epoch": 2747} {"train_loss": -42.863563537597656, "global_step": 332397, "epoch": 2747} {"train_loss": -42.5092658996582, "global_step": 332398, "epoch": 2747} {"train_loss": -42.554927825927734, "global_step": 332399, "epoch": 2747} {"train_loss": -42.48973846435547, "global_step": 332400, "epoch": 2747} {"train_loss": -42.829681396484375, "global_step": 332401, "epoch": 2747} {"train_loss": -42.680416107177734, "global_step": 332402, "epoch": 2747} {"train_loss": -42.89064407348633, "global_step": 332403, "epoch": 2747} {"train_loss": -42.37356185913086, "global_step": 332404, "epoch": 2747} {"train_loss": -42.765289306640625, "global_step": 332405, "epoch": 2747} {"train_loss": -42.7652702331543, "global_step": 332406, "epoch": 2747} {"train_loss": -43.06410598754883, "global_step": 332407, "epoch": 2747} {"train_loss": -42.817039489746094, "global_step": 332408, "epoch": 2747} {"train_loss": -42.98329544067383, "global_step": 332409, "epoch": 2747} {"train_loss": -42.834266662597656, "global_step": 332410, "epoch": 2747} {"train_loss": -43.31377029418945, "global_step": 332411, "epoch": 2747} {"train_loss": -43.4217529296875, "global_step": 332412, "epoch": 2747} {"train_loss": -43.24140930175781, "global_step": 332413, "epoch": 2747} {"train_loss": -43.29204559326172, "global_step": 332414, "epoch": 2747} {"train_loss": -43.29465103149414, "global_step": 332415, "epoch": 2747} {"train_loss": -43.551631927490234, "global_step": 332416, "epoch": 2747} {"train_loss": -43.21274948120117, "global_step": 332417, "epoch": 2747} {"train_loss": -43.34026336669922, "global_step": 332418, "epoch": 2747} {"train_loss": -43.478084564208984, "global_step": 332419, "epoch": 2747} {"train_loss": -43.90892028808594, "global_step": 332420, "epoch": 2747} {"train_loss": -43.57331466674805, "global_step": 332421, "epoch": 2747} {"train_loss": -43.43595886230469, "global_step": 332422, "epoch": 2747} {"train_loss": -43.7534294128418, "global_step": 332423, "epoch": 2747} {"train_loss": -43.44570541381836, "global_step": 332424, "epoch": 2747} {"train_loss": -43.93779373168945, "global_step": 332425, "epoch": 2747} {"train_loss": -43.72520446777344, "global_step": 332426, "epoch": 2747} {"train_loss": -43.73126983642578, "global_step": 332427, "epoch": 2747} {"train_loss": -43.6142463684082, "global_step": 332428, "epoch": 2747} {"train_loss": -43.5936393737793, "global_step": 332429, "epoch": 2747} {"train_loss": -43.77095413208008, "global_step": 332430, "epoch": 2747} {"train_loss": -43.65652084350586, "global_step": 332431, "epoch": 2747} {"train_loss": -43.67877960205078, "global_step": 332432, "epoch": 2747} {"train_loss": -44.004371643066406, "global_step": 332433, "epoch": 2747} {"train_loss": -44.169124603271484, "global_step": 332434, "epoch": 2747} {"train_loss": -44.102996826171875, "global_step": 332435, "epoch": 2747} {"train_loss": -44.13167953491211, "global_step": 332436, "epoch": 2747} {"train_loss": -43.79187774658203, "global_step": 332437, "epoch": 2747} {"train_loss": -44.06729507446289, "global_step": 332438, "epoch": 2747} {"train_loss": -44.164283752441406, "global_step": 332439, "epoch": 2747} {"train_loss": -43.817134857177734, "global_step": 332440, "epoch": 2747} {"train_loss": -43.853919982910156, "global_step": 332441, "epoch": 2747} {"train_loss": -44.518577575683594, "global_step": 332442, "epoch": 2747} {"train_loss": -43.980628967285156, "global_step": 332443, "epoch": 2747} {"train_loss": -44.40852355957031, "global_step": 332444, "epoch": 2747} {"train_loss": -44.28764343261719, "global_step": 332445, "epoch": 2747} {"train_loss": -44.21502685546875, "global_step": 332446, "epoch": 2747} {"train_loss": -44.212791442871094, "global_step": 332447, "epoch": 2747} {"train_loss": -44.63645935058594, "global_step": 332448, "epoch": 2747} {"train_loss": -44.46296310424805, "global_step": 332449, "epoch": 2747} {"train_loss": -44.25881576538086, "global_step": 332450, "epoch": 2747} {"train_loss": -44.622474670410156, "global_step": 332451, "epoch": 2747} {"train_loss": -44.809574127197266, "global_step": 332452, "epoch": 2747} {"train_loss": -44.270626068115234, "global_step": 332453, "epoch": 2747} {"train_loss": -44.18010711669922, "global_step": 332454, "epoch": 2747} {"train_loss": -44.45766067504883, "global_step": 332455, "epoch": 2747} {"train_loss": -43.822486877441406, "global_step": 332456, "epoch": 2747} {"train_loss": -44.465694427490234, "global_step": 332457, "epoch": 2747} {"train_loss": -43.96085739135742, "global_step": 332458, "epoch": 2747} {"train_loss": -44.3837776184082, "global_step": 332459, "epoch": 2747} {"train_loss": -44.85207748413086, "global_step": 332460, "epoch": 2747} {"train_loss": -45.0498161315918, "global_step": 332461, "epoch": 2747} {"train_loss": -44.828399658203125, "global_step": 332462, "epoch": 2747} {"train_loss": -45.036712646484375, "global_step": 332463, "epoch": 2747} {"train_loss": -44.895660400390625, "global_step": 332464, "epoch": 2747} {"train_loss": -44.8176383972168, "global_step": 332465, "epoch": 2747} {"train_loss": -45.038673400878906, "global_step": 332466, "epoch": 2747} {"train_loss": -44.4478759765625, "global_step": 332467, "epoch": 2747} {"train_loss": -44.90688705444336, "global_step": 332468, "epoch": 2747} {"train_loss": -44.75514602661133, "global_step": 332469, "epoch": 2747} {"train_loss": -45.062904357910156, "global_step": 332470, "epoch": 2747} {"train_loss": -44.96852111816406, "global_step": 332471, "epoch": 2747} {"train_loss": -44.79867172241211, "global_step": 332472, "epoch": 2747} {"train_loss": -45.09223556518555, "global_step": 332473, "epoch": 2747} {"train_loss": -44.8682975769043, "global_step": 332474, "epoch": 2747} {"train_loss": -45.05843734741211, "global_step": 332475, "epoch": 2747} {"train_loss": -44.78632736206055, "global_step": 332476, "epoch": 2747} {"train_loss": -45.346248626708984, "global_step": 332477, "epoch": 2747} {"train_loss": -45.3427734375, "global_step": 332478, "epoch": 2747} {"train_loss": -44.86446762084961, "global_step": 332479, "epoch": 2747} {"train_loss": -44.834476470947266, "global_step": 332480, "epoch": 2747} {"train_loss": -45.116004943847656, "global_step": 332481, "epoch": 2747} {"train_loss": -45.102962493896484, "global_step": 332482, "epoch": 2747} {"train_loss": -45.02689743041992, "global_step": 332483, "epoch": 2747} {"train_loss": -45.316768646240234, "global_step": 332484, "epoch": 2747} {"train_loss": -45.17116165161133, "global_step": 332485, "epoch": 2747} {"train_loss": -45.12723159790039, "global_step": 332486, "epoch": 2747} {"train_loss": -44.81321334838867, "global_step": 332487, "epoch": 2747} {"train_loss": -44.885433197021484, "global_step": 332488, "epoch": 2747} {"train_loss": -45.39692306518555, "global_step": 332489, "epoch": 2747} {"train_loss": -44.75285720825195, "global_step": 332490, "epoch": 2747} {"train_loss": -45.19382858276367, "global_step": 332491, "epoch": 2747} {"train_loss": -45.66093826293945, "global_step": 332492, "epoch": 2747} {"train_loss": -45.23976516723633, "global_step": 332493, "epoch": 2747} {"train_loss": -45.007415771484375, "global_step": 332494, "epoch": 2747} {"train_loss": -45.10176467895508, "global_step": 332495, "epoch": 2747} {"train_loss": -45.19355010986328, "global_step": 332496, "epoch": 2747} {"train_loss": -45.1524543762207, "global_step": 332497, "epoch": 2747} {"train_loss": -44.59019088745117, "global_step": 332498, "epoch": 2747} {"train_loss": -44.811283111572266, "global_step": 332499, "epoch": 2747} {"train_loss": -44.483516693115234, "global_step": 332500, "epoch": 2747} {"train_loss": -43.421382904052734, "global_step": 332501, "epoch": 2747} {"train_loss": -40.431636810302734, "global_step": 332502, "epoch": 2747} {"train_loss": -38.61577224731445, "global_step": 332503, "epoch": 2747} {"train_loss": -33.97874069213867, "global_step": 332504, "epoch": 2747} {"train_loss": -30.361846923828125, "global_step": 332505, "epoch": 2747} {"train_loss": -34.27274703979492, "global_step": 332506, "epoch": 2747} {"train_loss": -43.652284354217784, "global_step": 332507, "epoch": 2747, "val_loss": 2324833.75} {"train_loss": -39.752113342285156, "global_step": 332508, "epoch": 2748} {"train_loss": -32.55904769897461, "global_step": 332509, "epoch": 2748} {"train_loss": -42.81088638305664, "global_step": 332510, "epoch": 2748} {"train_loss": -35.14815139770508, "global_step": 332511, "epoch": 2748} {"train_loss": -33.990962982177734, "global_step": 332512, "epoch": 2748} {"train_loss": -42.355995178222656, "global_step": 332513, "epoch": 2748} {"train_loss": -34.202880859375, "global_step": 332514, "epoch": 2748} {"train_loss": -41.96382522583008, "global_step": 332515, "epoch": 2748} {"train_loss": -37.39669418334961, "global_step": 332516, "epoch": 2748} {"train_loss": -42.64030075073242, "global_step": 332517, "epoch": 2748} {"train_loss": -38.306434631347656, "global_step": 332518, "epoch": 2748} {"train_loss": -40.691280364990234, "global_step": 332519, "epoch": 2748} {"train_loss": -40.7319450378418, "global_step": 332520, "epoch": 2748} {"train_loss": -40.585811614990234, "global_step": 332521, "epoch": 2748} {"train_loss": -41.047603607177734, "global_step": 332522, "epoch": 2748} {"train_loss": -41.0161247253418, "global_step": 332523, "epoch": 2748} {"train_loss": -42.02322769165039, "global_step": 332524, "epoch": 2748} {"train_loss": -42.36198425292969, "global_step": 332525, "epoch": 2748} {"train_loss": -40.12600326538086, "global_step": 332526, "epoch": 2748} {"train_loss": -43.036800384521484, "global_step": 332527, "epoch": 2748} {"train_loss": -40.0714225769043, "global_step": 332528, "epoch": 2748} {"train_loss": -42.83842849731445, "global_step": 332529, "epoch": 2748} {"train_loss": -39.26597213745117, "global_step": 332530, "epoch": 2748} {"train_loss": -41.99040603637695, "global_step": 332531, "epoch": 2748} {"train_loss": -42.19753646850586, "global_step": 332532, "epoch": 2748} {"train_loss": -40.175636291503906, "global_step": 332533, "epoch": 2748} {"train_loss": -43.49951171875, "global_step": 332534, "epoch": 2748} {"train_loss": -40.580692291259766, "global_step": 332535, "epoch": 2748} {"train_loss": -42.47674560546875, "global_step": 332536, "epoch": 2748} {"train_loss": -42.348487854003906, "global_step": 332537, "epoch": 2748} {"train_loss": -42.301307678222656, "global_step": 332538, "epoch": 2748} {"train_loss": -42.81673049926758, "global_step": 332539, "epoch": 2748} {"train_loss": -42.9254150390625, "global_step": 332540, "epoch": 2748} {"train_loss": -43.44450759887695, "global_step": 332541, "epoch": 2748} {"train_loss": -42.75861740112305, "global_step": 332542, "epoch": 2748} {"train_loss": -43.76152420043945, "global_step": 332543, "epoch": 2748} {"train_loss": -43.42024612426758, "global_step": 332544, "epoch": 2748} {"train_loss": -43.65325164794922, "global_step": 332545, "epoch": 2748} {"train_loss": -43.6197395324707, "global_step": 332546, "epoch": 2748} {"train_loss": -44.18086242675781, "global_step": 332547, "epoch": 2748} {"train_loss": -43.6026611328125, "global_step": 332548, "epoch": 2748} {"train_loss": -44.15159225463867, "global_step": 332549, "epoch": 2748} {"train_loss": -43.959564208984375, "global_step": 332550, "epoch": 2748} {"train_loss": -44.366905212402344, "global_step": 332551, "epoch": 2748} {"train_loss": -43.64435958862305, "global_step": 332552, "epoch": 2748} {"train_loss": -43.83258819580078, "global_step": 332553, "epoch": 2748} {"train_loss": -44.08487319946289, "global_step": 332554, "epoch": 2748} {"train_loss": -44.288360595703125, "global_step": 332555, "epoch": 2748} {"train_loss": -43.948726654052734, "global_step": 332556, "epoch": 2748} {"train_loss": -44.28896713256836, "global_step": 332557, "epoch": 2748} {"train_loss": -43.469024658203125, "global_step": 332558, "epoch": 2748} {"train_loss": -44.09720993041992, "global_step": 332559, "epoch": 2748} {"train_loss": -44.105953216552734, "global_step": 332560, "epoch": 2748} {"train_loss": -44.18491744995117, "global_step": 332561, "epoch": 2748} {"train_loss": -43.96041488647461, "global_step": 332562, "epoch": 2748} {"train_loss": -43.89945983886719, "global_step": 332563, "epoch": 2748} {"train_loss": -44.36347579956055, "global_step": 332564, "epoch": 2748} {"train_loss": -43.64366912841797, "global_step": 332565, "epoch": 2748} {"train_loss": -43.87847900390625, "global_step": 332566, "epoch": 2748} {"train_loss": -44.41053009033203, "global_step": 332567, "epoch": 2748} {"train_loss": -42.98308563232422, "global_step": 332568, "epoch": 2748} {"train_loss": -44.30752944946289, "global_step": 332569, "epoch": 2748} {"train_loss": -43.87934494018555, "global_step": 332570, "epoch": 2748} {"train_loss": -44.27873992919922, "global_step": 332571, "epoch": 2748} {"train_loss": -42.936492919921875, "global_step": 332572, "epoch": 2748} {"train_loss": -44.49257278442383, "global_step": 332573, "epoch": 2748} {"train_loss": -43.762325286865234, "global_step": 332574, "epoch": 2748} {"train_loss": -44.039485931396484, "global_step": 332575, "epoch": 2748} {"train_loss": -44.32882308959961, "global_step": 332576, "epoch": 2748} {"train_loss": -44.277462005615234, "global_step": 332577, "epoch": 2748} {"train_loss": -44.32793426513672, "global_step": 332578, "epoch": 2748} {"train_loss": -44.2734489440918, "global_step": 332579, "epoch": 2748} {"train_loss": -44.29070281982422, "global_step": 332580, "epoch": 2748} {"train_loss": -44.458526611328125, "global_step": 332581, "epoch": 2748} {"train_loss": -44.645233154296875, "global_step": 332582, "epoch": 2748} {"train_loss": -44.493404388427734, "global_step": 332583, "epoch": 2748} {"train_loss": -44.624725341796875, "global_step": 332584, "epoch": 2748} {"train_loss": -44.6396369934082, "global_step": 332585, "epoch": 2748} {"train_loss": -44.65929412841797, "global_step": 332586, "epoch": 2748} {"train_loss": -44.60694885253906, "global_step": 332587, "epoch": 2748} {"train_loss": -44.69078063964844, "global_step": 332588, "epoch": 2748} {"train_loss": -44.88125228881836, "global_step": 332589, "epoch": 2748} {"train_loss": -44.92658615112305, "global_step": 332590, "epoch": 2748} {"train_loss": -44.490760803222656, "global_step": 332591, "epoch": 2748} {"train_loss": -44.6091423034668, "global_step": 332592, "epoch": 2748} {"train_loss": -44.66140365600586, "global_step": 332593, "epoch": 2748} {"train_loss": -44.64057922363281, "global_step": 332594, "epoch": 2748} {"train_loss": -44.45563888549805, "global_step": 332595, "epoch": 2748} {"train_loss": -44.74640655517578, "global_step": 332596, "epoch": 2748} {"train_loss": -44.8077507019043, "global_step": 332597, "epoch": 2748} {"train_loss": -43.75010299682617, "global_step": 332598, "epoch": 2748} {"train_loss": -43.87821960449219, "global_step": 332599, "epoch": 2748} {"train_loss": -44.045082092285156, "global_step": 332600, "epoch": 2748} {"train_loss": -44.128997802734375, "global_step": 332601, "epoch": 2748} {"train_loss": -43.964454650878906, "global_step": 332602, "epoch": 2748} {"train_loss": -44.15111541748047, "global_step": 332603, "epoch": 2748} {"train_loss": -44.36582565307617, "global_step": 332604, "epoch": 2748} {"train_loss": -44.3647575378418, "global_step": 332605, "epoch": 2748} {"train_loss": -43.68988800048828, "global_step": 332606, "epoch": 2748} {"train_loss": -42.97797775268555, "global_step": 332607, "epoch": 2748} {"train_loss": -43.71098709106445, "global_step": 332608, "epoch": 2748} {"train_loss": -44.393096923828125, "global_step": 332609, "epoch": 2748} {"train_loss": -44.28023910522461, "global_step": 332610, "epoch": 2748} {"train_loss": -44.74653244018555, "global_step": 332611, "epoch": 2748} {"train_loss": -44.26322555541992, "global_step": 332612, "epoch": 2748} {"train_loss": -43.83127975463867, "global_step": 332613, "epoch": 2748} {"train_loss": -43.8487663269043, "global_step": 332614, "epoch": 2748} {"train_loss": -44.1507682800293, "global_step": 332615, "epoch": 2748} {"train_loss": -44.12336349487305, "global_step": 332616, "epoch": 2748} {"train_loss": -43.506744384765625, "global_step": 332617, "epoch": 2748} {"train_loss": -44.82038497924805, "global_step": 332618, "epoch": 2748} {"train_loss": -44.43606948852539, "global_step": 332619, "epoch": 2748} {"train_loss": -44.1482048034668, "global_step": 332620, "epoch": 2748} {"train_loss": -44.75076675415039, "global_step": 332621, "epoch": 2748} {"train_loss": -44.031982421875, "global_step": 332622, "epoch": 2748} {"train_loss": -44.01417922973633, "global_step": 332623, "epoch": 2748} {"train_loss": -44.97183609008789, "global_step": 332624, "epoch": 2748} {"train_loss": -44.20939254760742, "global_step": 332625, "epoch": 2748} {"train_loss": -44.478363037109375, "global_step": 332626, "epoch": 2748} {"train_loss": -44.931678771972656, "global_step": 332627, "epoch": 2748} {"train_loss": -43.15043914416605, "global_step": 332628, "epoch": 2748, "val_loss": 2440459.25} {"train_loss": -44.491146087646484, "global_step": 332629, "epoch": 2749} {"train_loss": -44.01748275756836, "global_step": 332630, "epoch": 2749} {"train_loss": -44.7943229675293, "global_step": 332631, "epoch": 2749} {"train_loss": -44.880733489990234, "global_step": 332632, "epoch": 2749} {"train_loss": -44.18616485595703, "global_step": 332633, "epoch": 2749} {"train_loss": -44.938045501708984, "global_step": 332634, "epoch": 2749} {"train_loss": -45.06652069091797, "global_step": 332635, "epoch": 2749} {"train_loss": -44.10365676879883, "global_step": 332636, "epoch": 2749} {"train_loss": -45.03711700439453, "global_step": 332637, "epoch": 2749} {"train_loss": -45.2136116027832, "global_step": 332638, "epoch": 2749} {"train_loss": -44.517120361328125, "global_step": 332639, "epoch": 2749} {"train_loss": -43.891292572021484, "global_step": 332640, "epoch": 2749} {"train_loss": -44.359371185302734, "global_step": 332641, "epoch": 2749} {"train_loss": -45.458778381347656, "global_step": 332642, "epoch": 2749} {"train_loss": -44.92546844482422, "global_step": 332643, "epoch": 2749} {"train_loss": -43.82251739501953, "global_step": 332644, "epoch": 2749} {"train_loss": -43.64312744140625, "global_step": 332645, "epoch": 2749} {"train_loss": -44.3785400390625, "global_step": 332646, "epoch": 2749} {"train_loss": -44.845802307128906, "global_step": 332647, "epoch": 2749} {"train_loss": -44.21885299682617, "global_step": 332648, "epoch": 2749} {"train_loss": -44.2360954284668, "global_step": 332649, "epoch": 2749} {"train_loss": -44.87773513793945, "global_step": 332650, "epoch": 2749} {"train_loss": -44.91343307495117, "global_step": 332651, "epoch": 2749} {"train_loss": -45.07096481323242, "global_step": 332652, "epoch": 2749} {"train_loss": -44.32484817504883, "global_step": 332653, "epoch": 2749} {"train_loss": -44.78242111206055, "global_step": 332654, "epoch": 2749} {"train_loss": -44.785396575927734, "global_step": 332655, "epoch": 2749} {"train_loss": -45.05339431762695, "global_step": 332656, "epoch": 2749} {"train_loss": -44.7535514831543, "global_step": 332657, "epoch": 2749} {"train_loss": -45.227840423583984, "global_step": 332658, "epoch": 2749} {"train_loss": -44.286781311035156, "global_step": 332659, "epoch": 2749} {"train_loss": -43.4898681640625, "global_step": 332660, "epoch": 2749} {"train_loss": -43.25828170776367, "global_step": 332661, "epoch": 2749} {"train_loss": -44.15793991088867, "global_step": 332662, "epoch": 2749} {"train_loss": -43.873291015625, "global_step": 332663, "epoch": 2749} {"train_loss": -42.78871536254883, "global_step": 332664, "epoch": 2749} {"train_loss": -42.40549087524414, "global_step": 332665, "epoch": 2749} {"train_loss": -42.17921829223633, "global_step": 332666, "epoch": 2749} {"train_loss": -43.727874755859375, "global_step": 332667, "epoch": 2749} {"train_loss": -43.370513916015625, "global_step": 332668, "epoch": 2749} {"train_loss": -41.7451286315918, "global_step": 332669, "epoch": 2749} {"train_loss": -40.889923095703125, "global_step": 332670, "epoch": 2749} {"train_loss": -42.07020950317383, "global_step": 332671, "epoch": 2749} {"train_loss": -43.84989929199219, "global_step": 332672, "epoch": 2749} {"train_loss": -42.47313690185547, "global_step": 332673, "epoch": 2749} {"train_loss": -42.33746337890625, "global_step": 332674, "epoch": 2749} {"train_loss": -42.21826934814453, "global_step": 332675, "epoch": 2749} {"train_loss": -42.26536178588867, "global_step": 332676, "epoch": 2749} {"train_loss": -42.54642868041992, "global_step": 332677, "epoch": 2749} {"train_loss": -42.721710205078125, "global_step": 332678, "epoch": 2749} {"train_loss": -40.81625747680664, "global_step": 332679, "epoch": 2749} {"train_loss": -43.63788986206055, "global_step": 332680, "epoch": 2749} {"train_loss": -41.80279541015625, "global_step": 332681, "epoch": 2749} {"train_loss": -39.43941879272461, "global_step": 332682, "epoch": 2749} {"train_loss": -42.45026779174805, "global_step": 332683, "epoch": 2749} {"train_loss": -43.358882904052734, "global_step": 332684, "epoch": 2749} {"train_loss": -42.207542419433594, "global_step": 332685, "epoch": 2749} {"train_loss": -43.954097747802734, "global_step": 332686, "epoch": 2749} {"train_loss": -44.18807601928711, "global_step": 332687, "epoch": 2749} {"train_loss": -43.138790130615234, "global_step": 332688, "epoch": 2749} {"train_loss": -43.975242614746094, "global_step": 332689, "epoch": 2749} {"train_loss": -43.34806442260742, "global_step": 332690, "epoch": 2749} {"train_loss": -43.89521026611328, "global_step": 332691, "epoch": 2749} {"train_loss": -44.39706802368164, "global_step": 332692, "epoch": 2749} {"train_loss": -44.23127365112305, "global_step": 332693, "epoch": 2749} {"train_loss": -44.581268310546875, "global_step": 332694, "epoch": 2749} {"train_loss": -44.156524658203125, "global_step": 332695, "epoch": 2749} {"train_loss": -44.3697395324707, "global_step": 332696, "epoch": 2749} {"train_loss": -44.230384826660156, "global_step": 332697, "epoch": 2749} {"train_loss": -44.37247085571289, "global_step": 332698, "epoch": 2749} {"train_loss": -44.13312530517578, "global_step": 332699, "epoch": 2749} {"train_loss": -45.11948776245117, "global_step": 332700, "epoch": 2749} {"train_loss": -44.17898178100586, "global_step": 332701, "epoch": 2749} {"train_loss": -44.38800811767578, "global_step": 332702, "epoch": 2749} {"train_loss": -44.56686019897461, "global_step": 332703, "epoch": 2749} {"train_loss": -44.701087951660156, "global_step": 332704, "epoch": 2749} {"train_loss": -44.82171630859375, "global_step": 332705, "epoch": 2749} {"train_loss": -45.09103012084961, "global_step": 332706, "epoch": 2749} {"train_loss": -44.84938430786133, "global_step": 332707, "epoch": 2749} {"train_loss": -44.56630325317383, "global_step": 332708, "epoch": 2749} {"train_loss": -44.92163848876953, "global_step": 332709, "epoch": 2749} {"train_loss": -44.81390380859375, "global_step": 332710, "epoch": 2749} {"train_loss": -44.50849151611328, "global_step": 332711, "epoch": 2749} {"train_loss": -44.71001052856445, "global_step": 332712, "epoch": 2749} {"train_loss": -44.87051010131836, "global_step": 332713, "epoch": 2749} {"train_loss": -44.81364059448242, "global_step": 332714, "epoch": 2749} {"train_loss": -44.80889892578125, "global_step": 332715, "epoch": 2749} {"train_loss": -44.683753967285156, "global_step": 332716, "epoch": 2749} {"train_loss": -44.49953842163086, "global_step": 332717, "epoch": 2749} {"train_loss": -44.85429382324219, "global_step": 332718, "epoch": 2749} {"train_loss": -43.1724967956543, "global_step": 332719, "epoch": 2749} {"train_loss": -44.829872131347656, "global_step": 332720, "epoch": 2749} {"train_loss": -44.016475677490234, "global_step": 332721, "epoch": 2749} {"train_loss": -44.64387130737305, "global_step": 332722, "epoch": 2749} {"train_loss": -44.40743637084961, "global_step": 332723, "epoch": 2749} {"train_loss": -43.169769287109375, "global_step": 332724, "epoch": 2749} {"train_loss": -43.4190788269043, "global_step": 332725, "epoch": 2749} {"train_loss": -44.380348205566406, "global_step": 332726, "epoch": 2749} {"train_loss": -44.46095657348633, "global_step": 332727, "epoch": 2749} {"train_loss": -42.71428298950195, "global_step": 332728, "epoch": 2749} {"train_loss": -43.6082878112793, "global_step": 332729, "epoch": 2749} {"train_loss": -45.003448486328125, "global_step": 332730, "epoch": 2749} {"train_loss": -41.71964645385742, "global_step": 332731, "epoch": 2749} {"train_loss": -43.29512023925781, "global_step": 332732, "epoch": 2749} {"train_loss": -44.072017669677734, "global_step": 332733, "epoch": 2749} {"train_loss": -38.359859466552734, "global_step": 332734, "epoch": 2749} {"train_loss": -39.47736740112305, "global_step": 332735, "epoch": 2749} {"train_loss": -43.791259765625, "global_step": 332736, "epoch": 2749} {"train_loss": -37.2918815612793, "global_step": 332737, "epoch": 2749} {"train_loss": -40.66541290283203, "global_step": 332738, "epoch": 2749} {"train_loss": -42.48089599609375, "global_step": 332739, "epoch": 2749} {"train_loss": -37.67495346069336, "global_step": 332740, "epoch": 2749} {"train_loss": -42.8187255859375, "global_step": 332741, "epoch": 2749} {"train_loss": -40.01560592651367, "global_step": 332742, "epoch": 2749} {"train_loss": -44.33284378051758, "global_step": 332743, "epoch": 2749} {"train_loss": -40.632015228271484, "global_step": 332744, "epoch": 2749} {"train_loss": -42.1126823425293, "global_step": 332745, "epoch": 2749} {"train_loss": -40.920265197753906, "global_step": 332746, "epoch": 2749} {"train_loss": -40.89689254760742, "global_step": 332747, "epoch": 2749} {"train_loss": -42.53398513793945, "global_step": 332748, "epoch": 2749} {"train_loss": -43.53684587715086, "global_step": 332749, "epoch": 2749, "val_loss": 2576274.75} {"train_loss": -43.68201446533203, "global_step": 332750, "epoch": 2750} {"train_loss": -40.17837905883789, "global_step": 332751, "epoch": 2750} {"train_loss": -42.92927169799805, "global_step": 332752, "epoch": 2750} {"train_loss": -42.71247482299805, "global_step": 332753, "epoch": 2750} {"train_loss": -43.5162467956543, "global_step": 332754, "epoch": 2750} {"train_loss": -43.4523811340332, "global_step": 332755, "epoch": 2750} {"train_loss": -43.97971725463867, "global_step": 332756, "epoch": 2750} {"train_loss": -43.941768646240234, "global_step": 332757, "epoch": 2750} {"train_loss": -43.319793701171875, "global_step": 332758, "epoch": 2750} {"train_loss": -43.858802795410156, "global_step": 332759, "epoch": 2750} {"train_loss": -44.14706039428711, "global_step": 332760, "epoch": 2750} {"train_loss": -43.869380950927734, "global_step": 332761, "epoch": 2750} {"train_loss": -44.363990783691406, "global_step": 332762, "epoch": 2750} {"train_loss": -44.2115478515625, "global_step": 332763, "epoch": 2750} {"train_loss": -44.01133728027344, "global_step": 332764, "epoch": 2750} {"train_loss": -44.82664108276367, "global_step": 332765, "epoch": 2750} {"train_loss": -43.97896957397461, "global_step": 332766, "epoch": 2750} {"train_loss": -44.44480514526367, "global_step": 332767, "epoch": 2750} {"train_loss": -44.54966354370117, "global_step": 332768, "epoch": 2750} {"train_loss": -44.3129997253418, "global_step": 332769, "epoch": 2750} {"train_loss": -44.4388427734375, "global_step": 332770, "epoch": 2750} {"train_loss": -44.326534271240234, "global_step": 332771, "epoch": 2750} {"train_loss": -44.277584075927734, "global_step": 332772, "epoch": 2750} {"train_loss": -44.635894775390625, "global_step": 332773, "epoch": 2750} {"train_loss": -44.75120544433594, "global_step": 332774, "epoch": 2750} {"train_loss": -44.2405891418457, "global_step": 332775, "epoch": 2750} {"train_loss": -44.758209228515625, "global_step": 332776, "epoch": 2750} {"train_loss": -44.5609016418457, "global_step": 332777, "epoch": 2750} {"train_loss": -45.050960540771484, "global_step": 332778, "epoch": 2750} {"train_loss": -44.24821090698242, "global_step": 332779, "epoch": 2750} {"train_loss": -44.99934005737305, "global_step": 332780, "epoch": 2750} {"train_loss": -44.70563507080078, "global_step": 332781, "epoch": 2750} {"train_loss": -45.031856536865234, "global_step": 332782, "epoch": 2750} {"train_loss": -43.8822135925293, "global_step": 332783, "epoch": 2750} {"train_loss": -44.85960388183594, "global_step": 332784, "epoch": 2750} {"train_loss": -45.2271614074707, "global_step": 332785, "epoch": 2750} {"train_loss": -44.74164962768555, "global_step": 332786, "epoch": 2750} {"train_loss": -42.79668426513672, "global_step": 332787, "epoch": 2750} {"train_loss": -44.50586700439453, "global_step": 332788, "epoch": 2750} {"train_loss": -43.71611785888672, "global_step": 332789, "epoch": 2750} {"train_loss": -44.42620849609375, "global_step": 332790, "epoch": 2750} {"train_loss": -44.707244873046875, "global_step": 332791, "epoch": 2750} {"train_loss": -44.295284271240234, "global_step": 332792, "epoch": 2750} {"train_loss": -44.45064163208008, "global_step": 332793, "epoch": 2750} {"train_loss": -44.529335021972656, "global_step": 332794, "epoch": 2750} {"train_loss": -43.08707046508789, "global_step": 332795, "epoch": 2750} {"train_loss": -45.014801025390625, "global_step": 332796, "epoch": 2750} {"train_loss": -43.9610481262207, "global_step": 332797, "epoch": 2750} {"train_loss": -44.85588455200195, "global_step": 332798, "epoch": 2750} {"train_loss": -44.084468841552734, "global_step": 332799, "epoch": 2750} {"train_loss": -44.616661071777344, "global_step": 332800, "epoch": 2750} {"train_loss": -44.935462951660156, "global_step": 332801, "epoch": 2750} {"train_loss": -45.10456085205078, "global_step": 332802, "epoch": 2750} {"train_loss": -44.84542465209961, "global_step": 332803, "epoch": 2750} {"train_loss": -43.91719055175781, "global_step": 332804, "epoch": 2750} {"train_loss": -45.44253158569336, "global_step": 332805, "epoch": 2750} {"train_loss": -44.54853439331055, "global_step": 332806, "epoch": 2750} {"train_loss": -44.64193344116211, "global_step": 332807, "epoch": 2750} {"train_loss": -43.98298645019531, "global_step": 332808, "epoch": 2750} {"train_loss": -45.142738342285156, "global_step": 332809, "epoch": 2750} {"train_loss": -43.76731491088867, "global_step": 332810, "epoch": 2750} {"train_loss": -44.647552490234375, "global_step": 332811, "epoch": 2750} {"train_loss": -44.8016242980957, "global_step": 332812, "epoch": 2750} {"train_loss": -43.59680938720703, "global_step": 332813, "epoch": 2750} {"train_loss": -42.15491485595703, "global_step": 332814, "epoch": 2750} {"train_loss": -44.352027893066406, "global_step": 332815, "epoch": 2750} {"train_loss": -44.774932861328125, "global_step": 332816, "epoch": 2750} {"train_loss": -43.173126220703125, "global_step": 332817, "epoch": 2750} {"train_loss": -43.593719482421875, "global_step": 332818, "epoch": 2750} {"train_loss": -44.15198516845703, "global_step": 332819, "epoch": 2750} {"train_loss": -44.099491119384766, "global_step": 332820, "epoch": 2750} {"train_loss": -43.326087951660156, "global_step": 332821, "epoch": 2750} {"train_loss": -44.471858978271484, "global_step": 332822, "epoch": 2750} {"train_loss": -44.27399826049805, "global_step": 332823, "epoch": 2750} {"train_loss": -43.9334831237793, "global_step": 332824, "epoch": 2750} {"train_loss": -43.85946273803711, "global_step": 332825, "epoch": 2750} {"train_loss": -44.01613235473633, "global_step": 332826, "epoch": 2750} {"train_loss": -44.23661422729492, "global_step": 332827, "epoch": 2750} {"train_loss": -44.8241081237793, "global_step": 332828, "epoch": 2750} {"train_loss": -43.51494216918945, "global_step": 332829, "epoch": 2750} {"train_loss": -44.701358795166016, "global_step": 332830, "epoch": 2750} {"train_loss": -44.541229248046875, "global_step": 332831, "epoch": 2750} {"train_loss": -42.5948600769043, "global_step": 332832, "epoch": 2750} {"train_loss": -44.093990325927734, "global_step": 332833, "epoch": 2750} {"train_loss": -44.904632568359375, "global_step": 332834, "epoch": 2750} {"train_loss": -43.690277099609375, "global_step": 332835, "epoch": 2750} {"train_loss": -44.33950424194336, "global_step": 332836, "epoch": 2750} {"train_loss": -44.79648971557617, "global_step": 332837, "epoch": 2750} {"train_loss": -43.97738265991211, "global_step": 332838, "epoch": 2750} {"train_loss": -44.82403564453125, "global_step": 332839, "epoch": 2750} {"train_loss": -43.59597396850586, "global_step": 332840, "epoch": 2750} {"train_loss": -44.24935531616211, "global_step": 332841, "epoch": 2750} {"train_loss": -45.13622283935547, "global_step": 332842, "epoch": 2750} {"train_loss": -43.9550666809082, "global_step": 332843, "epoch": 2750} {"train_loss": -42.9224967956543, "global_step": 332844, "epoch": 2750} {"train_loss": -44.10029983520508, "global_step": 332845, "epoch": 2750} {"train_loss": -44.68590545654297, "global_step": 332846, "epoch": 2750} {"train_loss": -43.935176849365234, "global_step": 332847, "epoch": 2750} {"train_loss": -44.9827995300293, "global_step": 332848, "epoch": 2750} {"train_loss": -45.32516098022461, "global_step": 332849, "epoch": 2750} {"train_loss": -44.800838470458984, "global_step": 332850, "epoch": 2750} {"train_loss": -44.975006103515625, "global_step": 332851, "epoch": 2750} {"train_loss": -45.062374114990234, "global_step": 332852, "epoch": 2750} {"train_loss": -43.304073333740234, "global_step": 332853, "epoch": 2750} {"train_loss": -44.62004089355469, "global_step": 332854, "epoch": 2750} {"train_loss": -44.76890182495117, "global_step": 332855, "epoch": 2750} {"train_loss": -44.87038040161133, "global_step": 332856, "epoch": 2750} {"train_loss": -45.19154739379883, "global_step": 332857, "epoch": 2750} {"train_loss": -45.074317932128906, "global_step": 332858, "epoch": 2750} {"train_loss": -44.84597396850586, "global_step": 332859, "epoch": 2750} {"train_loss": -44.638832092285156, "global_step": 332860, "epoch": 2750} {"train_loss": -44.91480255126953, "global_step": 332861, "epoch": 2750} {"train_loss": -44.15183639526367, "global_step": 332862, "epoch": 2750} {"train_loss": -44.08521270751953, "global_step": 332863, "epoch": 2750} {"train_loss": -44.95745849609375, "global_step": 332864, "epoch": 2750} {"train_loss": -45.39330291748047, "global_step": 332865, "epoch": 2750} {"train_loss": -45.449581146240234, "global_step": 332866, "epoch": 2750} {"train_loss": -44.645591735839844, "global_step": 332867, "epoch": 2750} {"train_loss": -45.267662048339844, "global_step": 332868, "epoch": 2750} {"train_loss": -45.11640548706055, "global_step": 332869, "epoch": 2750} {"train_loss": -44.29812089273752, "global_step": 332870, "epoch": 2750, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2563486.25} {"train_loss": -44.92953109741211, "global_step": 332871, "epoch": 2751} {"train_loss": -45.270870208740234, "global_step": 332872, "epoch": 2751} {"train_loss": -45.250213623046875, "global_step": 332873, "epoch": 2751} {"train_loss": -44.15887451171875, "global_step": 332874, "epoch": 2751} {"train_loss": -43.49775695800781, "global_step": 332875, "epoch": 2751} {"train_loss": -44.76191329956055, "global_step": 332876, "epoch": 2751} {"train_loss": -44.35926818847656, "global_step": 332877, "epoch": 2751} {"train_loss": -44.569210052490234, "global_step": 332878, "epoch": 2751} {"train_loss": -45.23650360107422, "global_step": 332879, "epoch": 2751} {"train_loss": -44.44895935058594, "global_step": 332880, "epoch": 2751} {"train_loss": -44.74829864501953, "global_step": 332881, "epoch": 2751} {"train_loss": -45.241329193115234, "global_step": 332882, "epoch": 2751} {"train_loss": -44.76190185546875, "global_step": 332883, "epoch": 2751} {"train_loss": -44.013484954833984, "global_step": 332884, "epoch": 2751} {"train_loss": -44.116207122802734, "global_step": 332885, "epoch": 2751} {"train_loss": -44.23291778564453, "global_step": 332886, "epoch": 2751} {"train_loss": -43.93720245361328, "global_step": 332887, "epoch": 2751} {"train_loss": -44.68843078613281, "global_step": 332888, "epoch": 2751} {"train_loss": -44.515342712402344, "global_step": 332889, "epoch": 2751} {"train_loss": -45.05384063720703, "global_step": 332890, "epoch": 2751} {"train_loss": -44.58573913574219, "global_step": 332891, "epoch": 2751} {"train_loss": -44.6406364440918, "global_step": 332892, "epoch": 2751} {"train_loss": -44.80550003051758, "global_step": 332893, "epoch": 2751} {"train_loss": -45.39042282104492, "global_step": 332894, "epoch": 2751} {"train_loss": -45.470008850097656, "global_step": 332895, "epoch": 2751} {"train_loss": -44.85453414916992, "global_step": 332896, "epoch": 2751} {"train_loss": -44.89482498168945, "global_step": 332897, "epoch": 2751} {"train_loss": -44.987850189208984, "global_step": 332898, "epoch": 2751} {"train_loss": -44.717628479003906, "global_step": 332899, "epoch": 2751} {"train_loss": -44.19659423828125, "global_step": 332900, "epoch": 2751} {"train_loss": -45.07054901123047, "global_step": 332901, "epoch": 2751} {"train_loss": -43.13319778442383, "global_step": 332902, "epoch": 2751} {"train_loss": -43.40121841430664, "global_step": 332903, "epoch": 2751} {"train_loss": -44.1739387512207, "global_step": 332904, "epoch": 2751} {"train_loss": -43.82435607910156, "global_step": 332905, "epoch": 2751} {"train_loss": -43.40580368041992, "global_step": 332906, "epoch": 2751} {"train_loss": -43.63674545288086, "global_step": 332907, "epoch": 2751} {"train_loss": -44.71131896972656, "global_step": 332908, "epoch": 2751} {"train_loss": -44.00570297241211, "global_step": 332909, "epoch": 2751} {"train_loss": -43.936336517333984, "global_step": 332910, "epoch": 2751} {"train_loss": -42.73160934448242, "global_step": 332911, "epoch": 2751} {"train_loss": -44.88323974609375, "global_step": 332912, "epoch": 2751} {"train_loss": -44.09943389892578, "global_step": 332913, "epoch": 2751} {"train_loss": -44.672462463378906, "global_step": 332914, "epoch": 2751} {"train_loss": -43.81583786010742, "global_step": 332915, "epoch": 2751} {"train_loss": -40.50416946411133, "global_step": 332916, "epoch": 2751} {"train_loss": -43.37490463256836, "global_step": 332917, "epoch": 2751} {"train_loss": -44.502174377441406, "global_step": 332918, "epoch": 2751} {"train_loss": -42.24836730957031, "global_step": 332919, "epoch": 2751} {"train_loss": -42.49528884887695, "global_step": 332920, "epoch": 2751} {"train_loss": -42.9290885925293, "global_step": 332921, "epoch": 2751} {"train_loss": -43.74594497680664, "global_step": 332922, "epoch": 2751} {"train_loss": -42.2851676940918, "global_step": 332923, "epoch": 2751} {"train_loss": -41.061805725097656, "global_step": 332924, "epoch": 2751} {"train_loss": -43.60923385620117, "global_step": 332925, "epoch": 2751} {"train_loss": -42.45873260498047, "global_step": 332926, "epoch": 2751} {"train_loss": -41.705299377441406, "global_step": 332927, "epoch": 2751} {"train_loss": -42.77279281616211, "global_step": 332928, "epoch": 2751} {"train_loss": -43.184844970703125, "global_step": 332929, "epoch": 2751} {"train_loss": -42.709957122802734, "global_step": 332930, "epoch": 2751} {"train_loss": 24.251066207885742, "global_step": 332931, "epoch": 2751} {"train_loss": -40.072959899902344, "global_step": 332932, "epoch": 2751} {"train_loss": -41.972354888916016, "global_step": 332933, "epoch": 2751} {"train_loss": -42.14055633544922, "global_step": 332934, "epoch": 2751} {"train_loss": -39.93383026123047, "global_step": 332935, "epoch": 2751} {"train_loss": -42.38547897338867, "global_step": 332936, "epoch": 2751} {"train_loss": -39.016273498535156, "global_step": 332937, "epoch": 2751} {"train_loss": -38.781219482421875, "global_step": 332938, "epoch": 2751} {"train_loss": -40.0739631652832, "global_step": 332939, "epoch": 2751} {"train_loss": -29.952686309814453, "global_step": 332940, "epoch": 2751} {"train_loss": -39.95809555053711, "global_step": 332941, "epoch": 2751} {"train_loss": -38.601318359375, "global_step": 332942, "epoch": 2751} {"train_loss": -37.81399917602539, "global_step": 332943, "epoch": 2751} {"train_loss": -29.755542755126953, "global_step": 332944, "epoch": 2751} {"train_loss": -40.093017578125, "global_step": 332945, "epoch": 2751} {"train_loss": -41.36434555053711, "global_step": 332946, "epoch": 2751} {"train_loss": -38.94441604614258, "global_step": 332947, "epoch": 2751} {"train_loss": -39.59511184692383, "global_step": 332948, "epoch": 2751} {"train_loss": -39.28106689453125, "global_step": 332949, "epoch": 2751} {"train_loss": -36.98771286010742, "global_step": 332950, "epoch": 2751} {"train_loss": -40.63509750366211, "global_step": 332951, "epoch": 2751} {"train_loss": -37.77947998046875, "global_step": 332952, "epoch": 2751} {"train_loss": -36.716636657714844, "global_step": 332953, "epoch": 2751} {"train_loss": -41.125301361083984, "global_step": 332954, "epoch": 2751} {"train_loss": -38.91164779663086, "global_step": 332955, "epoch": 2751} {"train_loss": -41.26860427856445, "global_step": 332956, "epoch": 2751} {"train_loss": -41.77323532104492, "global_step": 332957, "epoch": 2751} {"train_loss": -40.21039962768555, "global_step": 332958, "epoch": 2751} {"train_loss": -39.53628921508789, "global_step": 332959, "epoch": 2751} {"train_loss": -40.96938705444336, "global_step": 332960, "epoch": 2751} {"train_loss": -30.408140182495117, "global_step": 332961, "epoch": 2751} {"train_loss": -42.480098724365234, "global_step": 332962, "epoch": 2751} {"train_loss": -37.80763626098633, "global_step": 332963, "epoch": 2751} {"train_loss": -40.627342224121094, "global_step": 332964, "epoch": 2751} {"train_loss": -39.41794967651367, "global_step": 332965, "epoch": 2751} {"train_loss": -41.58924865722656, "global_step": 332966, "epoch": 2751} {"train_loss": -41.20949172973633, "global_step": 332967, "epoch": 2751} {"train_loss": -40.032936096191406, "global_step": 332968, "epoch": 2751} {"train_loss": -42.31841278076172, "global_step": 332969, "epoch": 2751} {"train_loss": -40.72687911987305, "global_step": 332970, "epoch": 2751} {"train_loss": -41.07892608642578, "global_step": 332971, "epoch": 2751} {"train_loss": -41.11000442504883, "global_step": 332972, "epoch": 2751} {"train_loss": -39.07081985473633, "global_step": 332973, "epoch": 2751} {"train_loss": -42.39849853515625, "global_step": 332974, "epoch": 2751} {"train_loss": -41.641845703125, "global_step": 332975, "epoch": 2751} {"train_loss": -41.00571823120117, "global_step": 332976, "epoch": 2751} {"train_loss": -42.19247055053711, "global_step": 332977, "epoch": 2751} {"train_loss": -42.17873001098633, "global_step": 332978, "epoch": 2751} {"train_loss": -43.06248092651367, "global_step": 332979, "epoch": 2751} {"train_loss": -41.13261032104492, "global_step": 332980, "epoch": 2751} {"train_loss": -41.33602523803711, "global_step": 332981, "epoch": 2751} {"train_loss": -42.31337356567383, "global_step": 332982, "epoch": 2751} {"train_loss": -43.13131332397461, "global_step": 332983, "epoch": 2751} {"train_loss": -42.99245834350586, "global_step": 332984, "epoch": 2751} {"train_loss": -43.14771270751953, "global_step": 332985, "epoch": 2751} {"train_loss": -42.398311614990234, "global_step": 332986, "epoch": 2751} {"train_loss": -42.71703338623047, "global_step": 332987, "epoch": 2751} {"train_loss": -43.47209167480469, "global_step": 332988, "epoch": 2751} {"train_loss": -43.05436325073242, "global_step": 332989, "epoch": 2751} {"train_loss": -42.21840286254883, "global_step": 332990, "epoch": 2751} {"train_loss": -41.5859237860057, "global_step": 332991, "epoch": 2751, "val_loss": 2440833.25} {"train_loss": -43.28030014038086, "global_step": 332992, "epoch": 2752} {"train_loss": -43.65104293823242, "global_step": 332993, "epoch": 2752} {"train_loss": -43.1170539855957, "global_step": 332994, "epoch": 2752} {"train_loss": -42.3629150390625, "global_step": 332995, "epoch": 2752} {"train_loss": -43.1471061706543, "global_step": 332996, "epoch": 2752} {"train_loss": -43.56999969482422, "global_step": 332997, "epoch": 2752} {"train_loss": -42.947349548339844, "global_step": 332998, "epoch": 2752} {"train_loss": -43.26533126831055, "global_step": 332999, "epoch": 2752} {"train_loss": -44.14034652709961, "global_step": 333000, "epoch": 2752} {"train_loss": -43.38571548461914, "global_step": 333001, "epoch": 2752} {"train_loss": -43.762874603271484, "global_step": 333002, "epoch": 2752} {"train_loss": -43.9451904296875, "global_step": 333003, "epoch": 2752} {"train_loss": -44.33041000366211, "global_step": 333004, "epoch": 2752} {"train_loss": -43.774513244628906, "global_step": 333005, "epoch": 2752} {"train_loss": -44.320682525634766, "global_step": 333006, "epoch": 2752} {"train_loss": -43.81792068481445, "global_step": 333007, "epoch": 2752} {"train_loss": -43.69890594482422, "global_step": 333008, "epoch": 2752} {"train_loss": -43.91131591796875, "global_step": 333009, "epoch": 2752} {"train_loss": -44.3153076171875, "global_step": 333010, "epoch": 2752} {"train_loss": -43.61688995361328, "global_step": 333011, "epoch": 2752} {"train_loss": -43.2542610168457, "global_step": 333012, "epoch": 2752} {"train_loss": -44.3469352722168, "global_step": 333013, "epoch": 2752} {"train_loss": -44.75710678100586, "global_step": 333014, "epoch": 2752} {"train_loss": -44.13967514038086, "global_step": 333015, "epoch": 2752} {"train_loss": -44.31848907470703, "global_step": 333016, "epoch": 2752} {"train_loss": -43.283382415771484, "global_step": 333017, "epoch": 2752} {"train_loss": -44.625999450683594, "global_step": 333018, "epoch": 2752} {"train_loss": -44.318626403808594, "global_step": 333019, "epoch": 2752} {"train_loss": -43.784549713134766, "global_step": 333020, "epoch": 2752} {"train_loss": -44.08131790161133, "global_step": 333021, "epoch": 2752} {"train_loss": -43.732025146484375, "global_step": 333022, "epoch": 2752} {"train_loss": -44.26319885253906, "global_step": 333023, "epoch": 2752} {"train_loss": -43.949493408203125, "global_step": 333024, "epoch": 2752} {"train_loss": -44.788719177246094, "global_step": 333025, "epoch": 2752} {"train_loss": -43.630733489990234, "global_step": 333026, "epoch": 2752} {"train_loss": -44.13291931152344, "global_step": 333027, "epoch": 2752} {"train_loss": -44.29600143432617, "global_step": 333028, "epoch": 2752} {"train_loss": -44.09423828125, "global_step": 333029, "epoch": 2752} {"train_loss": -44.55121994018555, "global_step": 333030, "epoch": 2752} {"train_loss": -44.8270378112793, "global_step": 333031, "epoch": 2752} {"train_loss": -44.696834564208984, "global_step": 333032, "epoch": 2752} {"train_loss": -44.96432876586914, "global_step": 333033, "epoch": 2752} {"train_loss": -44.33500289916992, "global_step": 333034, "epoch": 2752} {"train_loss": -44.48388671875, "global_step": 333035, "epoch": 2752} {"train_loss": -43.9742546081543, "global_step": 333036, "epoch": 2752} {"train_loss": -44.359222412109375, "global_step": 333037, "epoch": 2752} {"train_loss": -44.762420654296875, "global_step": 333038, "epoch": 2752} {"train_loss": -43.7368278503418, "global_step": 333039, "epoch": 2752} {"train_loss": -44.41587448120117, "global_step": 333040, "epoch": 2752} {"train_loss": -45.33468246459961, "global_step": 333041, "epoch": 2752} {"train_loss": -44.5791130065918, "global_step": 333042, "epoch": 2752} {"train_loss": -44.34468078613281, "global_step": 333043, "epoch": 2752} {"train_loss": -44.81536865234375, "global_step": 333044, "epoch": 2752} {"train_loss": -44.38117599487305, "global_step": 333045, "epoch": 2752} {"train_loss": -43.942378997802734, "global_step": 333046, "epoch": 2752} {"train_loss": -44.986385345458984, "global_step": 333047, "epoch": 2752} {"train_loss": -44.29341506958008, "global_step": 333048, "epoch": 2752} {"train_loss": -43.444671630859375, "global_step": 333049, "epoch": 2752} {"train_loss": -44.93043518066406, "global_step": 333050, "epoch": 2752} {"train_loss": -43.9378776550293, "global_step": 333051, "epoch": 2752} {"train_loss": -43.18877029418945, "global_step": 333052, "epoch": 2752} {"train_loss": -44.60359573364258, "global_step": 333053, "epoch": 2752} {"train_loss": -43.7475700378418, "global_step": 333054, "epoch": 2752} {"train_loss": -43.22976303100586, "global_step": 333055, "epoch": 2752} {"train_loss": -44.44768142700195, "global_step": 333056, "epoch": 2752} {"train_loss": -44.733333587646484, "global_step": 333057, "epoch": 2752} {"train_loss": -43.706939697265625, "global_step": 333058, "epoch": 2752} {"train_loss": -43.0141716003418, "global_step": 333059, "epoch": 2752} {"train_loss": -42.893917083740234, "global_step": 333060, "epoch": 2752} {"train_loss": -42.31999206542969, "global_step": 333061, "epoch": 2752} {"train_loss": -43.73151779174805, "global_step": 333062, "epoch": 2752} {"train_loss": -42.94513702392578, "global_step": 333063, "epoch": 2752} {"train_loss": -43.42725372314453, "global_step": 333064, "epoch": 2752} {"train_loss": -43.32143020629883, "global_step": 333065, "epoch": 2752} {"train_loss": -43.3840446472168, "global_step": 333066, "epoch": 2752} {"train_loss": -42.993804931640625, "global_step": 333067, "epoch": 2752} {"train_loss": -43.73560333251953, "global_step": 333068, "epoch": 2752} {"train_loss": -43.37781524658203, "global_step": 333069, "epoch": 2752} {"train_loss": -41.894561767578125, "global_step": 333070, "epoch": 2752} {"train_loss": -44.17372512817383, "global_step": 333071, "epoch": 2752} {"train_loss": -42.25278854370117, "global_step": 333072, "epoch": 2752} {"train_loss": -41.72575378417969, "global_step": 333073, "epoch": 2752} {"train_loss": -42.65336990356445, "global_step": 333074, "epoch": 2752} {"train_loss": -41.480892181396484, "global_step": 333075, "epoch": 2752} {"train_loss": -43.69028091430664, "global_step": 333076, "epoch": 2752} {"train_loss": -41.845211029052734, "global_step": 333077, "epoch": 2752} {"train_loss": -42.84318923950195, "global_step": 333078, "epoch": 2752} {"train_loss": -42.60893630981445, "global_step": 333079, "epoch": 2752} {"train_loss": -44.0869140625, "global_step": 333080, "epoch": 2752} {"train_loss": -43.487457275390625, "global_step": 333081, "epoch": 2752} {"train_loss": -43.49569320678711, "global_step": 333082, "epoch": 2752} {"train_loss": -43.92024230957031, "global_step": 333083, "epoch": 2752} {"train_loss": -43.08244705200195, "global_step": 333084, "epoch": 2752} {"train_loss": -43.669578552246094, "global_step": 333085, "epoch": 2752} {"train_loss": -42.743499755859375, "global_step": 333086, "epoch": 2752} {"train_loss": -44.325130462646484, "global_step": 333087, "epoch": 2752} {"train_loss": -43.493141174316406, "global_step": 333088, "epoch": 2752} {"train_loss": -42.03182601928711, "global_step": 333089, "epoch": 2752} {"train_loss": -43.667236328125, "global_step": 333090, "epoch": 2752} {"train_loss": -42.17241287231445, "global_step": 333091, "epoch": 2752} {"train_loss": -42.46091842651367, "global_step": 333092, "epoch": 2752} {"train_loss": -43.24243927001953, "global_step": 333093, "epoch": 2752} {"train_loss": -42.76055908203125, "global_step": 333094, "epoch": 2752} {"train_loss": -42.96564483642578, "global_step": 333095, "epoch": 2752} {"train_loss": -43.254512786865234, "global_step": 333096, "epoch": 2752} {"train_loss": -41.811431884765625, "global_step": 333097, "epoch": 2752} {"train_loss": -44.06907272338867, "global_step": 333098, "epoch": 2752} {"train_loss": -41.479915618896484, "global_step": 333099, "epoch": 2752} {"train_loss": -42.502830505371094, "global_step": 333100, "epoch": 2752} {"train_loss": -42.30244064331055, "global_step": 333101, "epoch": 2752} {"train_loss": -42.14321517944336, "global_step": 333102, "epoch": 2752} {"train_loss": -42.2028923034668, "global_step": 333103, "epoch": 2752} {"train_loss": -41.65312957763672, "global_step": 333104, "epoch": 2752} {"train_loss": -43.15716552734375, "global_step": 333105, "epoch": 2752} {"train_loss": -43.013851165771484, "global_step": 333106, "epoch": 2752} {"train_loss": -44.008182525634766, "global_step": 333107, "epoch": 2752} {"train_loss": -42.83744430541992, "global_step": 333108, "epoch": 2752} {"train_loss": -43.822723388671875, "global_step": 333109, "epoch": 2752} {"train_loss": -42.88762664794922, "global_step": 333110, "epoch": 2752} {"train_loss": -44.23330307006836, "global_step": 333111, "epoch": 2752} {"train_loss": -43.57726354047286, "global_step": 333112, "epoch": 2752, "val_loss": 2464524.75} {"train_loss": -44.507179260253906, "global_step": 333113, "epoch": 2753} {"train_loss": -43.723182678222656, "global_step": 333114, "epoch": 2753} {"train_loss": -43.76091766357422, "global_step": 333115, "epoch": 2753} {"train_loss": -43.567989349365234, "global_step": 333116, "epoch": 2753} {"train_loss": -44.380733489990234, "global_step": 333117, "epoch": 2753} {"train_loss": -43.85099792480469, "global_step": 333118, "epoch": 2753} {"train_loss": -44.787513732910156, "global_step": 333119, "epoch": 2753} {"train_loss": -43.97052001953125, "global_step": 333120, "epoch": 2753} {"train_loss": -44.38678741455078, "global_step": 333121, "epoch": 2753} {"train_loss": -44.440364837646484, "global_step": 333122, "epoch": 2753} {"train_loss": -44.15106201171875, "global_step": 333123, "epoch": 2753} {"train_loss": -44.4808235168457, "global_step": 333124, "epoch": 2753} {"train_loss": -45.02398681640625, "global_step": 333125, "epoch": 2753} {"train_loss": -44.19297409057617, "global_step": 333126, "epoch": 2753} {"train_loss": -44.65369415283203, "global_step": 333127, "epoch": 2753} {"train_loss": -44.84096908569336, "global_step": 333128, "epoch": 2753} {"train_loss": -44.734004974365234, "global_step": 333129, "epoch": 2753} {"train_loss": -44.58358383178711, "global_step": 333130, "epoch": 2753} {"train_loss": -44.850826263427734, "global_step": 333131, "epoch": 2753} {"train_loss": -44.93424606323242, "global_step": 333132, "epoch": 2753} {"train_loss": -44.55611801147461, "global_step": 333133, "epoch": 2753} {"train_loss": -44.912776947021484, "global_step": 333134, "epoch": 2753} {"train_loss": -44.84813690185547, "global_step": 333135, "epoch": 2753} {"train_loss": -44.814937591552734, "global_step": 333136, "epoch": 2753} {"train_loss": -45.02921676635742, "global_step": 333137, "epoch": 2753} {"train_loss": -45.09817123413086, "global_step": 333138, "epoch": 2753} {"train_loss": -45.25899887084961, "global_step": 333139, "epoch": 2753} {"train_loss": -43.894649505615234, "global_step": 333140, "epoch": 2753} {"train_loss": -44.57440948486328, "global_step": 333141, "epoch": 2753} {"train_loss": -44.376888275146484, "global_step": 333142, "epoch": 2753} {"train_loss": -44.32157897949219, "global_step": 333143, "epoch": 2753} {"train_loss": -44.74151611328125, "global_step": 333144, "epoch": 2753} {"train_loss": -44.79447555541992, "global_step": 333145, "epoch": 2753} {"train_loss": -44.185508728027344, "global_step": 333146, "epoch": 2753} {"train_loss": -44.451759338378906, "global_step": 333147, "epoch": 2753} {"train_loss": -44.60551071166992, "global_step": 333148, "epoch": 2753} {"train_loss": -45.028507232666016, "global_step": 333149, "epoch": 2753} {"train_loss": -45.14802932739258, "global_step": 333150, "epoch": 2753} {"train_loss": -44.89588928222656, "global_step": 333151, "epoch": 2753} {"train_loss": -45.0389518737793, "global_step": 333152, "epoch": 2753} {"train_loss": -44.648868560791016, "global_step": 333153, "epoch": 2753} {"train_loss": -44.833438873291016, "global_step": 333154, "epoch": 2753} {"train_loss": -43.925750732421875, "global_step": 333155, "epoch": 2753} {"train_loss": -44.589019775390625, "global_step": 333156, "epoch": 2753} {"train_loss": -44.61362838745117, "global_step": 333157, "epoch": 2753} {"train_loss": -45.212730407714844, "global_step": 333158, "epoch": 2753} {"train_loss": -45.14987564086914, "global_step": 333159, "epoch": 2753} {"train_loss": -45.34745407104492, "global_step": 333160, "epoch": 2753} {"train_loss": -44.067317962646484, "global_step": 333161, "epoch": 2753} {"train_loss": -44.28303146362305, "global_step": 333162, "epoch": 2753} {"train_loss": -44.8187370300293, "global_step": 333163, "epoch": 2753} {"train_loss": -44.7692985534668, "global_step": 333164, "epoch": 2753} {"train_loss": -44.724483489990234, "global_step": 333165, "epoch": 2753} {"train_loss": -45.381256103515625, "global_step": 333166, "epoch": 2753} {"train_loss": -45.17742919921875, "global_step": 333167, "epoch": 2753} {"train_loss": -45.07261276245117, "global_step": 333168, "epoch": 2753} {"train_loss": -45.08909225463867, "global_step": 333169, "epoch": 2753} {"train_loss": -45.29236602783203, "global_step": 333170, "epoch": 2753} {"train_loss": -44.819087982177734, "global_step": 333171, "epoch": 2753} {"train_loss": -44.65898895263672, "global_step": 333172, "epoch": 2753} {"train_loss": -45.00779342651367, "global_step": 333173, "epoch": 2753} {"train_loss": -44.698246002197266, "global_step": 333174, "epoch": 2753} {"train_loss": -44.10239791870117, "global_step": 333175, "epoch": 2753} {"train_loss": -43.49920654296875, "global_step": 333176, "epoch": 2753} {"train_loss": -44.19342803955078, "global_step": 333177, "epoch": 2753} {"train_loss": -45.09157180786133, "global_step": 333178, "epoch": 2753} {"train_loss": -45.18174362182617, "global_step": 333179, "epoch": 2753} {"train_loss": -44.766258239746094, "global_step": 333180, "epoch": 2753} {"train_loss": -43.64419174194336, "global_step": 333181, "epoch": 2753} {"train_loss": -43.44342041015625, "global_step": 333182, "epoch": 2753} {"train_loss": -42.15034866333008, "global_step": 333183, "epoch": 2753} {"train_loss": -43.22834014892578, "global_step": 333184, "epoch": 2753} {"train_loss": -44.32242965698242, "global_step": 333185, "epoch": 2753} {"train_loss": -44.86500930786133, "global_step": 333186, "epoch": 2753} {"train_loss": -44.543514251708984, "global_step": 333187, "epoch": 2753} {"train_loss": -44.127384185791016, "global_step": 333188, "epoch": 2753} {"train_loss": -44.81948471069336, "global_step": 333189, "epoch": 2753} {"train_loss": -44.35844802856445, "global_step": 333190, "epoch": 2753} {"train_loss": -42.6633186340332, "global_step": 333191, "epoch": 2753} {"train_loss": -43.37464904785156, "global_step": 333192, "epoch": 2753} {"train_loss": -44.80234909057617, "global_step": 333193, "epoch": 2753} {"train_loss": -43.32935333251953, "global_step": 333194, "epoch": 2753} {"train_loss": -43.73139190673828, "global_step": 333195, "epoch": 2753} {"train_loss": -44.881797790527344, "global_step": 333196, "epoch": 2753} {"train_loss": -43.02622604370117, "global_step": 333197, "epoch": 2753} {"train_loss": -40.485294342041016, "global_step": 333198, "epoch": 2753} {"train_loss": -43.515350341796875, "global_step": 333199, "epoch": 2753} {"train_loss": -42.6508674621582, "global_step": 333200, "epoch": 2753} {"train_loss": -42.4138069152832, "global_step": 333201, "epoch": 2753} {"train_loss": -42.88051986694336, "global_step": 333202, "epoch": 2753} {"train_loss": -42.99164581298828, "global_step": 333203, "epoch": 2753} {"train_loss": -40.12346267700195, "global_step": 333204, "epoch": 2753} {"train_loss": -42.80904006958008, "global_step": 333205, "epoch": 2753} {"train_loss": -40.17512130737305, "global_step": 333206, "epoch": 2753} {"train_loss": -42.98907470703125, "global_step": 333207, "epoch": 2753} {"train_loss": -42.15658187866211, "global_step": 333208, "epoch": 2753} {"train_loss": -41.25498580932617, "global_step": 333209, "epoch": 2753} {"train_loss": -43.13991165161133, "global_step": 333210, "epoch": 2753} {"train_loss": -42.84295654296875, "global_step": 333211, "epoch": 2753} {"train_loss": -43.757869720458984, "global_step": 333212, "epoch": 2753} {"train_loss": -41.24714660644531, "global_step": 333213, "epoch": 2753} {"train_loss": -43.699222564697266, "global_step": 333214, "epoch": 2753} {"train_loss": -43.473201751708984, "global_step": 333215, "epoch": 2753} {"train_loss": -43.60258865356445, "global_step": 333216, "epoch": 2753} {"train_loss": -43.68536376953125, "global_step": 333217, "epoch": 2753} {"train_loss": -42.46303939819336, "global_step": 333218, "epoch": 2753} {"train_loss": -44.51693344116211, "global_step": 333219, "epoch": 2753} {"train_loss": -43.14728546142578, "global_step": 333220, "epoch": 2753} {"train_loss": -43.669742584228516, "global_step": 333221, "epoch": 2753} {"train_loss": -44.308738708496094, "global_step": 333222, "epoch": 2753} {"train_loss": -43.43280792236328, "global_step": 333223, "epoch": 2753} {"train_loss": -43.959938049316406, "global_step": 333224, "epoch": 2753} {"train_loss": -43.4659423828125, "global_step": 333225, "epoch": 2753} {"train_loss": -44.54558181762695, "global_step": 333226, "epoch": 2753} {"train_loss": -42.48125076293945, "global_step": 333227, "epoch": 2753} {"train_loss": -41.5214729309082, "global_step": 333228, "epoch": 2753} {"train_loss": -43.2952995300293, "global_step": 333229, "epoch": 2753} {"train_loss": -43.16482925415039, "global_step": 333230, "epoch": 2753} {"train_loss": -43.075531005859375, "global_step": 333231, "epoch": 2753} {"train_loss": -42.45956039428711, "global_step": 333232, "epoch": 2753} {"train_loss": -43.99014175036722, "global_step": 333233, "epoch": 2753, "val_loss": 2471301.5} {"train_loss": -43.36727523803711, "global_step": 333234, "epoch": 2754} {"train_loss": -44.12997817993164, "global_step": 333235, "epoch": 2754} {"train_loss": -43.1644287109375, "global_step": 333236, "epoch": 2754} {"train_loss": -44.488616943359375, "global_step": 333237, "epoch": 2754} {"train_loss": -43.331459045410156, "global_step": 333238, "epoch": 2754} {"train_loss": -43.73371124267578, "global_step": 333239, "epoch": 2754} {"train_loss": -43.989166259765625, "global_step": 333240, "epoch": 2754} {"train_loss": -43.06596755981445, "global_step": 333241, "epoch": 2754} {"train_loss": -43.25168991088867, "global_step": 333242, "epoch": 2754} {"train_loss": -43.794857025146484, "global_step": 333243, "epoch": 2754} {"train_loss": -40.59430694580078, "global_step": 333244, "epoch": 2754} {"train_loss": -43.181148529052734, "global_step": 333245, "epoch": 2754} {"train_loss": -43.56830596923828, "global_step": 333246, "epoch": 2754} {"train_loss": -41.24560546875, "global_step": 333247, "epoch": 2754} {"train_loss": -43.220619201660156, "global_step": 333248, "epoch": 2754} {"train_loss": -42.98716735839844, "global_step": 333249, "epoch": 2754} {"train_loss": -42.795654296875, "global_step": 333250, "epoch": 2754} {"train_loss": -42.747188568115234, "global_step": 333251, "epoch": 2754} {"train_loss": -44.64924240112305, "global_step": 333252, "epoch": 2754} {"train_loss": -42.68096923828125, "global_step": 333253, "epoch": 2754} {"train_loss": -43.325592041015625, "global_step": 333254, "epoch": 2754} {"train_loss": -44.315425872802734, "global_step": 333255, "epoch": 2754} {"train_loss": -43.03452682495117, "global_step": 333256, "epoch": 2754} {"train_loss": -44.59348678588867, "global_step": 333257, "epoch": 2754} {"train_loss": -43.23340606689453, "global_step": 333258, "epoch": 2754} {"train_loss": -43.19428634643555, "global_step": 333259, "epoch": 2754} {"train_loss": -44.051631927490234, "global_step": 333260, "epoch": 2754} {"train_loss": -43.16383743286133, "global_step": 333261, "epoch": 2754} {"train_loss": -43.650081634521484, "global_step": 333262, "epoch": 2754} {"train_loss": -43.36802291870117, "global_step": 333263, "epoch": 2754} {"train_loss": -43.99353790283203, "global_step": 333264, "epoch": 2754} {"train_loss": -43.467750549316406, "global_step": 333265, "epoch": 2754} {"train_loss": -43.56401443481445, "global_step": 333266, "epoch": 2754} {"train_loss": -43.94511795043945, "global_step": 333267, "epoch": 2754} {"train_loss": -44.096900939941406, "global_step": 333268, "epoch": 2754} {"train_loss": -44.25373840332031, "global_step": 333269, "epoch": 2754} {"train_loss": -44.53961181640625, "global_step": 333270, "epoch": 2754} {"train_loss": -43.91642379760742, "global_step": 333271, "epoch": 2754} {"train_loss": -44.74692916870117, "global_step": 333272, "epoch": 2754} {"train_loss": -43.193153381347656, "global_step": 333273, "epoch": 2754} {"train_loss": -44.40346908569336, "global_step": 333274, "epoch": 2754} {"train_loss": -44.47852325439453, "global_step": 333275, "epoch": 2754} {"train_loss": -44.307525634765625, "global_step": 333276, "epoch": 2754} {"train_loss": -44.280006408691406, "global_step": 333277, "epoch": 2754} {"train_loss": -44.02443313598633, "global_step": 333278, "epoch": 2754} {"train_loss": -44.304866790771484, "global_step": 333279, "epoch": 2754} {"train_loss": -43.9339714050293, "global_step": 333280, "epoch": 2754} {"train_loss": -44.38693618774414, "global_step": 333281, "epoch": 2754} {"train_loss": -44.350914001464844, "global_step": 333282, "epoch": 2754} {"train_loss": -43.95835876464844, "global_step": 333283, "epoch": 2754} {"train_loss": -44.069129943847656, "global_step": 333284, "epoch": 2754} {"train_loss": -45.02769088745117, "global_step": 333285, "epoch": 2754} {"train_loss": -44.25620651245117, "global_step": 333286, "epoch": 2754} {"train_loss": -44.022457122802734, "global_step": 333287, "epoch": 2754} {"train_loss": -44.6684455871582, "global_step": 333288, "epoch": 2754} {"train_loss": -43.75376510620117, "global_step": 333289, "epoch": 2754} {"train_loss": -44.80084991455078, "global_step": 333290, "epoch": 2754} {"train_loss": -44.21345901489258, "global_step": 333291, "epoch": 2754} {"train_loss": -43.781246185302734, "global_step": 333292, "epoch": 2754} {"train_loss": -44.47174835205078, "global_step": 333293, "epoch": 2754} {"train_loss": -44.21167755126953, "global_step": 333294, "epoch": 2754} {"train_loss": -43.7846565246582, "global_step": 333295, "epoch": 2754} {"train_loss": -44.97660446166992, "global_step": 333296, "epoch": 2754} {"train_loss": -44.460968017578125, "global_step": 333297, "epoch": 2754} {"train_loss": -44.001827239990234, "global_step": 333298, "epoch": 2754} {"train_loss": -44.94186782836914, "global_step": 333299, "epoch": 2754} {"train_loss": -45.03768539428711, "global_step": 333300, "epoch": 2754} {"train_loss": -44.03976058959961, "global_step": 333301, "epoch": 2754} {"train_loss": -44.76617431640625, "global_step": 333302, "epoch": 2754} {"train_loss": -44.46690368652344, "global_step": 333303, "epoch": 2754} {"train_loss": -44.971187591552734, "global_step": 333304, "epoch": 2754} {"train_loss": -44.262901306152344, "global_step": 333305, "epoch": 2754} {"train_loss": -44.6818962097168, "global_step": 333306, "epoch": 2754} {"train_loss": -44.713741302490234, "global_step": 333307, "epoch": 2754} {"train_loss": -44.66097640991211, "global_step": 333308, "epoch": 2754} {"train_loss": -45.01558303833008, "global_step": 333309, "epoch": 2754} {"train_loss": -44.544944763183594, "global_step": 333310, "epoch": 2754} {"train_loss": -44.752445220947266, "global_step": 333311, "epoch": 2754} {"train_loss": -44.9817008972168, "global_step": 333312, "epoch": 2754} {"train_loss": -45.61009979248047, "global_step": 333313, "epoch": 2754} {"train_loss": -45.05965805053711, "global_step": 333314, "epoch": 2754} {"train_loss": -44.469520568847656, "global_step": 333315, "epoch": 2754} {"train_loss": -44.81771469116211, "global_step": 333316, "epoch": 2754} {"train_loss": -44.83449172973633, "global_step": 333317, "epoch": 2754} {"train_loss": -45.248199462890625, "global_step": 333318, "epoch": 2754} {"train_loss": -45.006500244140625, "global_step": 333319, "epoch": 2754} {"train_loss": -44.93335723876953, "global_step": 333320, "epoch": 2754} {"train_loss": -45.02252960205078, "global_step": 333321, "epoch": 2754} {"train_loss": -45.2141227722168, "global_step": 333322, "epoch": 2754} {"train_loss": -45.1459846496582, "global_step": 333323, "epoch": 2754} {"train_loss": -44.65975570678711, "global_step": 333324, "epoch": 2754} {"train_loss": -44.78718566894531, "global_step": 333325, "epoch": 2754} {"train_loss": -44.939613342285156, "global_step": 333326, "epoch": 2754} {"train_loss": -45.172550201416016, "global_step": 333327, "epoch": 2754} {"train_loss": -45.33633041381836, "global_step": 333328, "epoch": 2754} {"train_loss": -44.99321365356445, "global_step": 333329, "epoch": 2754} {"train_loss": -45.127540588378906, "global_step": 333330, "epoch": 2754} {"train_loss": -45.028865814208984, "global_step": 333331, "epoch": 2754} {"train_loss": -44.982337951660156, "global_step": 333332, "epoch": 2754} {"train_loss": -44.66954040527344, "global_step": 333333, "epoch": 2754} {"train_loss": -45.01301193237305, "global_step": 333334, "epoch": 2754} {"train_loss": -44.92686462402344, "global_step": 333335, "epoch": 2754} {"train_loss": -44.912349700927734, "global_step": 333336, "epoch": 2754} {"train_loss": -43.77354049682617, "global_step": 333337, "epoch": 2754} {"train_loss": -44.65134811401367, "global_step": 333338, "epoch": 2754} {"train_loss": -45.25724411010742, "global_step": 333339, "epoch": 2754} {"train_loss": -45.06417465209961, "global_step": 333340, "epoch": 2754} {"train_loss": -43.71729278564453, "global_step": 333341, "epoch": 2754} {"train_loss": -44.44266128540039, "global_step": 333342, "epoch": 2754} {"train_loss": -44.2720832824707, "global_step": 333343, "epoch": 2754} {"train_loss": -43.757667541503906, "global_step": 333344, "epoch": 2754} {"train_loss": -44.686100006103516, "global_step": 333345, "epoch": 2754} {"train_loss": -44.62091827392578, "global_step": 333346, "epoch": 2754} {"train_loss": -44.10969161987305, "global_step": 333347, "epoch": 2754} {"train_loss": -44.65522384643555, "global_step": 333348, "epoch": 2754} {"train_loss": -44.47416305541992, "global_step": 333349, "epoch": 2754} {"train_loss": -43.90505599975586, "global_step": 333350, "epoch": 2754} {"train_loss": -45.15950012207031, "global_step": 333351, "epoch": 2754} {"train_loss": -44.864742279052734, "global_step": 333352, "epoch": 2754} {"train_loss": -43.8023681640625, "global_step": 333353, "epoch": 2754} {"train_loss": -44.232876076185995, "global_step": 333354, "epoch": 2754, "val_loss": 2587198.0} {"train_loss": -45.09242630004883, "global_step": 333355, "epoch": 2755} {"train_loss": -44.338985443115234, "global_step": 333356, "epoch": 2755} {"train_loss": -43.53342819213867, "global_step": 333357, "epoch": 2755} {"train_loss": -44.9885368347168, "global_step": 333358, "epoch": 2755} {"train_loss": -44.15798568725586, "global_step": 333359, "epoch": 2755} {"train_loss": -43.7261962890625, "global_step": 333360, "epoch": 2755} {"train_loss": -44.632850646972656, "global_step": 333361, "epoch": 2755} {"train_loss": -45.175235748291016, "global_step": 333362, "epoch": 2755} {"train_loss": -44.19995880126953, "global_step": 333363, "epoch": 2755} {"train_loss": -43.49872589111328, "global_step": 333364, "epoch": 2755} {"train_loss": -44.01588821411133, "global_step": 333365, "epoch": 2755} {"train_loss": -43.37830352783203, "global_step": 333366, "epoch": 2755} {"train_loss": -44.491939544677734, "global_step": 333367, "epoch": 2755} {"train_loss": -43.89925003051758, "global_step": 333368, "epoch": 2755} {"train_loss": -42.09782028198242, "global_step": 333369, "epoch": 2755} {"train_loss": -43.04519271850586, "global_step": 333370, "epoch": 2755} {"train_loss": -43.4565544128418, "global_step": 333371, "epoch": 2755} {"train_loss": -43.88164138793945, "global_step": 333372, "epoch": 2755} {"train_loss": -43.88945007324219, "global_step": 333373, "epoch": 2755} {"train_loss": -43.42686080932617, "global_step": 333374, "epoch": 2755} {"train_loss": -43.75301742553711, "global_step": 333375, "epoch": 2755} {"train_loss": -43.540504455566406, "global_step": 333376, "epoch": 2755} {"train_loss": -43.2238655090332, "global_step": 333377, "epoch": 2755} {"train_loss": -44.151824951171875, "global_step": 333378, "epoch": 2755} {"train_loss": -43.65364456176758, "global_step": 333379, "epoch": 2755} {"train_loss": -44.128841400146484, "global_step": 333380, "epoch": 2755} {"train_loss": -44.00951385498047, "global_step": 333381, "epoch": 2755} {"train_loss": -44.00185775756836, "global_step": 333382, "epoch": 2755} {"train_loss": -44.05768585205078, "global_step": 333383, "epoch": 2755} {"train_loss": -44.855377197265625, "global_step": 333384, "epoch": 2755} {"train_loss": -43.42167282104492, "global_step": 333385, "epoch": 2755} {"train_loss": -43.58700180053711, "global_step": 333386, "epoch": 2755} {"train_loss": -42.91535568237305, "global_step": 333387, "epoch": 2755} {"train_loss": -44.084510803222656, "global_step": 333388, "epoch": 2755} {"train_loss": -44.01333999633789, "global_step": 333389, "epoch": 2755} {"train_loss": -44.47641372680664, "global_step": 333390, "epoch": 2755} {"train_loss": -44.28318405151367, "global_step": 333391, "epoch": 2755} {"train_loss": -44.115360260009766, "global_step": 333392, "epoch": 2755} {"train_loss": -43.5336799621582, "global_step": 333393, "epoch": 2755} {"train_loss": -43.25779342651367, "global_step": 333394, "epoch": 2755} {"train_loss": -45.10190963745117, "global_step": 333395, "epoch": 2755} {"train_loss": -43.746307373046875, "global_step": 333396, "epoch": 2755} {"train_loss": -42.51479721069336, "global_step": 333397, "epoch": 2755} {"train_loss": -41.93180465698242, "global_step": 333398, "epoch": 2755} {"train_loss": -43.474891662597656, "global_step": 333399, "epoch": 2755} {"train_loss": -43.46554946899414, "global_step": 333400, "epoch": 2755} {"train_loss": -43.36662292480469, "global_step": 333401, "epoch": 2755} {"train_loss": -43.509952545166016, "global_step": 333402, "epoch": 2755} {"train_loss": -43.69963455200195, "global_step": 333403, "epoch": 2755} {"train_loss": -43.046424865722656, "global_step": 333404, "epoch": 2755} {"train_loss": -42.66035842895508, "global_step": 333405, "epoch": 2755} {"train_loss": -43.988685607910156, "global_step": 333406, "epoch": 2755} {"train_loss": -43.8589973449707, "global_step": 333407, "epoch": 2755} {"train_loss": -43.670162200927734, "global_step": 333408, "epoch": 2755} {"train_loss": -43.13350296020508, "global_step": 333409, "epoch": 2755} {"train_loss": -44.46371078491211, "global_step": 333410, "epoch": 2755} {"train_loss": -42.555152893066406, "global_step": 333411, "epoch": 2755} {"train_loss": -42.882118225097656, "global_step": 333412, "epoch": 2755} {"train_loss": -44.141944885253906, "global_step": 333413, "epoch": 2755} {"train_loss": -43.117652893066406, "global_step": 333414, "epoch": 2755} {"train_loss": -44.067291259765625, "global_step": 333415, "epoch": 2755} {"train_loss": -43.79007339477539, "global_step": 333416, "epoch": 2755} {"train_loss": -44.60060119628906, "global_step": 333417, "epoch": 2755} {"train_loss": -44.165279388427734, "global_step": 333418, "epoch": 2755} {"train_loss": -43.222232818603516, "global_step": 333419, "epoch": 2755} {"train_loss": -44.26606369018555, "global_step": 333420, "epoch": 2755} {"train_loss": -43.002601623535156, "global_step": 333421, "epoch": 2755} {"train_loss": -43.996124267578125, "global_step": 333422, "epoch": 2755} {"train_loss": -44.255615234375, "global_step": 333423, "epoch": 2755} {"train_loss": -43.90916061401367, "global_step": 333424, "epoch": 2755} {"train_loss": -44.638240814208984, "global_step": 333425, "epoch": 2755} {"train_loss": -43.84538269042969, "global_step": 333426, "epoch": 2755} {"train_loss": -44.1170768737793, "global_step": 333427, "epoch": 2755} {"train_loss": -44.247596740722656, "global_step": 333428, "epoch": 2755} {"train_loss": -44.79170227050781, "global_step": 333429, "epoch": 2755} {"train_loss": -44.6753044128418, "global_step": 333430, "epoch": 2755} {"train_loss": -44.042720794677734, "global_step": 333431, "epoch": 2755} {"train_loss": -45.01423263549805, "global_step": 333432, "epoch": 2755} {"train_loss": -44.708980560302734, "global_step": 333433, "epoch": 2755} {"train_loss": -44.50746154785156, "global_step": 333434, "epoch": 2755} {"train_loss": -45.02431106567383, "global_step": 333435, "epoch": 2755} {"train_loss": -44.997093200683594, "global_step": 333436, "epoch": 2755} {"train_loss": -44.736515045166016, "global_step": 333437, "epoch": 2755} {"train_loss": -44.88836669921875, "global_step": 333438, "epoch": 2755} {"train_loss": -45.213958740234375, "global_step": 333439, "epoch": 2755} {"train_loss": -44.653114318847656, "global_step": 333440, "epoch": 2755} {"train_loss": -44.835453033447266, "global_step": 333441, "epoch": 2755} {"train_loss": -45.29282760620117, "global_step": 333442, "epoch": 2755} {"train_loss": -44.98603439331055, "global_step": 333443, "epoch": 2755} {"train_loss": -45.274391174316406, "global_step": 333444, "epoch": 2755} {"train_loss": -44.809791564941406, "global_step": 333445, "epoch": 2755} {"train_loss": -44.140254974365234, "global_step": 333446, "epoch": 2755} {"train_loss": -45.13881301879883, "global_step": 333447, "epoch": 2755} {"train_loss": -44.8696174621582, "global_step": 333448, "epoch": 2755} {"train_loss": -44.788909912109375, "global_step": 333449, "epoch": 2755} {"train_loss": -44.77431106567383, "global_step": 333450, "epoch": 2755} {"train_loss": -44.86481857299805, "global_step": 333451, "epoch": 2755} {"train_loss": -45.40837097167969, "global_step": 333452, "epoch": 2755} {"train_loss": -45.14617919921875, "global_step": 333453, "epoch": 2755} {"train_loss": -45.08565139770508, "global_step": 333454, "epoch": 2755} {"train_loss": -45.22601318359375, "global_step": 333455, "epoch": 2755} {"train_loss": -45.18681716918945, "global_step": 333456, "epoch": 2755} {"train_loss": -45.09443283081055, "global_step": 333457, "epoch": 2755} {"train_loss": -45.26631546020508, "global_step": 333458, "epoch": 2755} {"train_loss": -45.27692413330078, "global_step": 333459, "epoch": 2755} {"train_loss": -45.016845703125, "global_step": 333460, "epoch": 2755} {"train_loss": -43.946937561035156, "global_step": 333461, "epoch": 2755} {"train_loss": -45.52443313598633, "global_step": 333462, "epoch": 2755} {"train_loss": -44.90899658203125, "global_step": 333463, "epoch": 2755} {"train_loss": -44.05156326293945, "global_step": 333464, "epoch": 2755} {"train_loss": -44.920257568359375, "global_step": 333465, "epoch": 2755} {"train_loss": -45.56855392456055, "global_step": 333466, "epoch": 2755} {"train_loss": -44.03284454345703, "global_step": 333467, "epoch": 2755} {"train_loss": -44.25650405883789, "global_step": 333468, "epoch": 2755} {"train_loss": -44.679866790771484, "global_step": 333469, "epoch": 2755} {"train_loss": -45.00425338745117, "global_step": 333470, "epoch": 2755} {"train_loss": -44.64237594604492, "global_step": 333471, "epoch": 2755} {"train_loss": -43.53445816040039, "global_step": 333472, "epoch": 2755} {"train_loss": -44.08675003051758, "global_step": 333473, "epoch": 2755} {"train_loss": -43.96120834350586, "global_step": 333474, "epoch": 2755} {"train_loss": -44.17950042220187, "global_step": 333475, "epoch": 2755, "val_loss": 2521235.0} {"train_loss": -44.73552703857422, "global_step": 333476, "epoch": 2756} {"train_loss": -44.390533447265625, "global_step": 333477, "epoch": 2756} {"train_loss": -42.622154235839844, "global_step": 333478, "epoch": 2756} {"train_loss": -41.91191482543945, "global_step": 333479, "epoch": 2756} {"train_loss": -41.12057876586914, "global_step": 333480, "epoch": 2756} {"train_loss": -44.0037727355957, "global_step": 333481, "epoch": 2756} {"train_loss": -43.884735107421875, "global_step": 333482, "epoch": 2756} {"train_loss": -44.68938064575195, "global_step": 333483, "epoch": 2756} {"train_loss": -43.25580978393555, "global_step": 333484, "epoch": 2756} {"train_loss": -42.72994613647461, "global_step": 333485, "epoch": 2756} {"train_loss": -43.1859016418457, "global_step": 333486, "epoch": 2756} {"train_loss": -44.110740661621094, "global_step": 333487, "epoch": 2756} {"train_loss": -40.828731536865234, "global_step": 333488, "epoch": 2756} {"train_loss": -41.79948043823242, "global_step": 333489, "epoch": 2756} {"train_loss": -41.95001983642578, "global_step": 333490, "epoch": 2756} {"train_loss": -43.059993743896484, "global_step": 333491, "epoch": 2756} {"train_loss": -43.92777633666992, "global_step": 333492, "epoch": 2756} {"train_loss": -40.795955657958984, "global_step": 333493, "epoch": 2756} {"train_loss": -42.432830810546875, "global_step": 333494, "epoch": 2756} {"train_loss": -43.361366271972656, "global_step": 333495, "epoch": 2756} {"train_loss": -41.369930267333984, "global_step": 333496, "epoch": 2756} {"train_loss": -42.539306640625, "global_step": 333497, "epoch": 2756} {"train_loss": -43.231021881103516, "global_step": 333498, "epoch": 2756} {"train_loss": -42.31795883178711, "global_step": 333499, "epoch": 2756} {"train_loss": -43.0585823059082, "global_step": 333500, "epoch": 2756} {"train_loss": -43.159053802490234, "global_step": 333501, "epoch": 2756} {"train_loss": -42.10239791870117, "global_step": 333502, "epoch": 2756} {"train_loss": -42.25497055053711, "global_step": 333503, "epoch": 2756} {"train_loss": -43.46577072143555, "global_step": 333504, "epoch": 2756} {"train_loss": -41.30426788330078, "global_step": 333505, "epoch": 2756} {"train_loss": -42.50287628173828, "global_step": 333506, "epoch": 2756} {"train_loss": -43.03559494018555, "global_step": 333507, "epoch": 2756} {"train_loss": -41.19490051269531, "global_step": 333508, "epoch": 2756} {"train_loss": -43.19209671020508, "global_step": 333509, "epoch": 2756} {"train_loss": -42.980194091796875, "global_step": 333510, "epoch": 2756} {"train_loss": -40.44205856323242, "global_step": 333511, "epoch": 2756} {"train_loss": -42.57102584838867, "global_step": 333512, "epoch": 2756} {"train_loss": -43.109336853027344, "global_step": 333513, "epoch": 2756} {"train_loss": -42.66349411010742, "global_step": 333514, "epoch": 2756} {"train_loss": -40.59807586669922, "global_step": 333515, "epoch": 2756} {"train_loss": -41.02016830444336, "global_step": 333516, "epoch": 2756} {"train_loss": -40.286434173583984, "global_step": 333517, "epoch": 2756} {"train_loss": -42.96876907348633, "global_step": 333518, "epoch": 2756} {"train_loss": -41.544960021972656, "global_step": 333519, "epoch": 2756} {"train_loss": -41.40044403076172, "global_step": 333520, "epoch": 2756} {"train_loss": -42.9376220703125, "global_step": 333521, "epoch": 2756} {"train_loss": -41.45601272583008, "global_step": 333522, "epoch": 2756} {"train_loss": -43.35612106323242, "global_step": 333523, "epoch": 2756} {"train_loss": -42.23607635498047, "global_step": 333524, "epoch": 2756} {"train_loss": -43.084571838378906, "global_step": 333525, "epoch": 2756} {"train_loss": -41.46787643432617, "global_step": 333526, "epoch": 2756} {"train_loss": -43.1780891418457, "global_step": 333527, "epoch": 2756} {"train_loss": -42.683685302734375, "global_step": 333528, "epoch": 2756} {"train_loss": -41.9660758972168, "global_step": 333529, "epoch": 2756} {"train_loss": -41.67588424682617, "global_step": 333530, "epoch": 2756} {"train_loss": -41.9952507019043, "global_step": 333531, "epoch": 2756} {"train_loss": -42.19063186645508, "global_step": 333532, "epoch": 2756} {"train_loss": -43.726688385009766, "global_step": 333533, "epoch": 2756} {"train_loss": -43.57511520385742, "global_step": 333534, "epoch": 2756} {"train_loss": -43.7996711730957, "global_step": 333535, "epoch": 2756} {"train_loss": -43.361507415771484, "global_step": 333536, "epoch": 2756} {"train_loss": -43.610530853271484, "global_step": 333537, "epoch": 2756} {"train_loss": -44.323848724365234, "global_step": 333538, "epoch": 2756} {"train_loss": -43.38970947265625, "global_step": 333539, "epoch": 2756} {"train_loss": -44.58744430541992, "global_step": 333540, "epoch": 2756} {"train_loss": -43.94731140136719, "global_step": 333541, "epoch": 2756} {"train_loss": -44.351806640625, "global_step": 333542, "epoch": 2756} {"train_loss": -43.55370330810547, "global_step": 333543, "epoch": 2756} {"train_loss": -43.152748107910156, "global_step": 333544, "epoch": 2756} {"train_loss": -43.77478790283203, "global_step": 333545, "epoch": 2756} {"train_loss": -44.459442138671875, "global_step": 333546, "epoch": 2756} {"train_loss": -44.64726638793945, "global_step": 333547, "epoch": 2756} {"train_loss": -44.49098587036133, "global_step": 333548, "epoch": 2756} {"train_loss": -44.652862548828125, "global_step": 333549, "epoch": 2756} {"train_loss": -44.71272659301758, "global_step": 333550, "epoch": 2756} {"train_loss": -44.5164909362793, "global_step": 333551, "epoch": 2756} {"train_loss": -44.95597457885742, "global_step": 333552, "epoch": 2756} {"train_loss": -44.7798957824707, "global_step": 333553, "epoch": 2756} {"train_loss": -44.47032165527344, "global_step": 333554, "epoch": 2756} {"train_loss": -45.097408294677734, "global_step": 333555, "epoch": 2756} {"train_loss": -44.72000503540039, "global_step": 333556, "epoch": 2756} {"train_loss": -44.76268768310547, "global_step": 333557, "epoch": 2756} {"train_loss": -43.8209228515625, "global_step": 333558, "epoch": 2756} {"train_loss": -44.92000198364258, "global_step": 333559, "epoch": 2756} {"train_loss": -44.82164764404297, "global_step": 333560, "epoch": 2756} {"train_loss": -44.86312484741211, "global_step": 333561, "epoch": 2756} {"train_loss": -45.225379943847656, "global_step": 333562, "epoch": 2756} {"train_loss": -44.785614013671875, "global_step": 333563, "epoch": 2756} {"train_loss": -44.92789077758789, "global_step": 333564, "epoch": 2756} {"train_loss": -43.55133819580078, "global_step": 333565, "epoch": 2756} {"train_loss": -44.82190704345703, "global_step": 333566, "epoch": 2756} {"train_loss": -45.13066482543945, "global_step": 333567, "epoch": 2756} {"train_loss": -44.745018005371094, "global_step": 333568, "epoch": 2756} {"train_loss": -45.06756591796875, "global_step": 333569, "epoch": 2756} {"train_loss": -45.229122161865234, "global_step": 333570, "epoch": 2756} {"train_loss": -45.25130844116211, "global_step": 333571, "epoch": 2756} {"train_loss": -45.090309143066406, "global_step": 333572, "epoch": 2756} {"train_loss": -45.145870208740234, "global_step": 333573, "epoch": 2756} {"train_loss": -45.22422409057617, "global_step": 333574, "epoch": 2756} {"train_loss": -45.113494873046875, "global_step": 333575, "epoch": 2756} {"train_loss": -44.12091827392578, "global_step": 333576, "epoch": 2756} {"train_loss": -45.35453414916992, "global_step": 333577, "epoch": 2756} {"train_loss": -44.46928787231445, "global_step": 333578, "epoch": 2756} {"train_loss": -44.19470977783203, "global_step": 333579, "epoch": 2756} {"train_loss": -45.50179672241211, "global_step": 333580, "epoch": 2756} {"train_loss": -44.83466339111328, "global_step": 333581, "epoch": 2756} {"train_loss": -44.877437591552734, "global_step": 333582, "epoch": 2756} {"train_loss": -45.55534362792969, "global_step": 333583, "epoch": 2756} {"train_loss": -45.30585861206055, "global_step": 333584, "epoch": 2756} {"train_loss": -45.27359390258789, "global_step": 333585, "epoch": 2756} {"train_loss": -44.933780670166016, "global_step": 333586, "epoch": 2756} {"train_loss": -45.38780975341797, "global_step": 333587, "epoch": 2756} {"train_loss": -45.03064727783203, "global_step": 333588, "epoch": 2756} {"train_loss": -45.1431999206543, "global_step": 333589, "epoch": 2756} {"train_loss": -44.93374252319336, "global_step": 333590, "epoch": 2756} {"train_loss": -45.00886154174805, "global_step": 333591, "epoch": 2756} {"train_loss": -44.377010345458984, "global_step": 333592, "epoch": 2756} {"train_loss": -44.47733688354492, "global_step": 333593, "epoch": 2756} {"train_loss": -45.39948654174805, "global_step": 333594, "epoch": 2756} {"train_loss": -44.30459213256836, "global_step": 333595, "epoch": 2756} {"train_loss": -43.61470608671835, "global_step": 333596, "epoch": 2756, "val_loss": 2625623.25} {"train_loss": -43.9766845703125, "global_step": 333597, "epoch": 2757} {"train_loss": -43.765289306640625, "global_step": 333598, "epoch": 2757} {"train_loss": -44.11133575439453, "global_step": 333599, "epoch": 2757} {"train_loss": -43.118385314941406, "global_step": 333600, "epoch": 2757} {"train_loss": -42.85224914550781, "global_step": 333601, "epoch": 2757} {"train_loss": -44.66987991333008, "global_step": 333602, "epoch": 2757} {"train_loss": -43.89937210083008, "global_step": 333603, "epoch": 2757} {"train_loss": -44.450504302978516, "global_step": 333604, "epoch": 2757} {"train_loss": -43.20940399169922, "global_step": 333605, "epoch": 2757} {"train_loss": -42.96806335449219, "global_step": 333606, "epoch": 2757} {"train_loss": -42.79170608520508, "global_step": 333607, "epoch": 2757} {"train_loss": -41.992393493652344, "global_step": 333608, "epoch": 2757} {"train_loss": -42.68263626098633, "global_step": 333609, "epoch": 2757} {"train_loss": -44.751190185546875, "global_step": 333610, "epoch": 2757} {"train_loss": -43.20979690551758, "global_step": 333611, "epoch": 2757} {"train_loss": -40.06602096557617, "global_step": 333612, "epoch": 2757} {"train_loss": -44.672943115234375, "global_step": 333613, "epoch": 2757} {"train_loss": -42.930755615234375, "global_step": 333614, "epoch": 2757} {"train_loss": -41.07762908935547, "global_step": 333615, "epoch": 2757} {"train_loss": -42.679298400878906, "global_step": 333616, "epoch": 2757} {"train_loss": -40.47797775268555, "global_step": 333617, "epoch": 2757} {"train_loss": -42.623756408691406, "global_step": 333618, "epoch": 2757} {"train_loss": -41.82184982299805, "global_step": 333619, "epoch": 2757} {"train_loss": -42.49526596069336, "global_step": 333620, "epoch": 2757} {"train_loss": -43.000389099121094, "global_step": 333621, "epoch": 2757} {"train_loss": -41.2090950012207, "global_step": 333622, "epoch": 2757} {"train_loss": -42.5178108215332, "global_step": 333623, "epoch": 2757} {"train_loss": -42.633575439453125, "global_step": 333624, "epoch": 2757} {"train_loss": -43.50522232055664, "global_step": 333625, "epoch": 2757} {"train_loss": -42.39271926879883, "global_step": 333626, "epoch": 2757} {"train_loss": -42.57338333129883, "global_step": 333627, "epoch": 2757} {"train_loss": -42.90884780883789, "global_step": 333628, "epoch": 2757} {"train_loss": -43.649654388427734, "global_step": 333629, "epoch": 2757} {"train_loss": -43.292293548583984, "global_step": 333630, "epoch": 2757} {"train_loss": -43.51620101928711, "global_step": 333631, "epoch": 2757} {"train_loss": -43.02657699584961, "global_step": 333632, "epoch": 2757} {"train_loss": -43.5109748840332, "global_step": 333633, "epoch": 2757} {"train_loss": -43.37925338745117, "global_step": 333634, "epoch": 2757} {"train_loss": -43.612003326416016, "global_step": 333635, "epoch": 2757} {"train_loss": -44.08041000366211, "global_step": 333636, "epoch": 2757} {"train_loss": -44.53504180908203, "global_step": 333637, "epoch": 2757} {"train_loss": -43.42402267456055, "global_step": 333638, "epoch": 2757} {"train_loss": -44.48468017578125, "global_step": 333639, "epoch": 2757} {"train_loss": -44.49017333984375, "global_step": 333640, "epoch": 2757} {"train_loss": -43.310035705566406, "global_step": 333641, "epoch": 2757} {"train_loss": -43.579002380371094, "global_step": 333642, "epoch": 2757} {"train_loss": -43.95398712158203, "global_step": 333643, "epoch": 2757} {"train_loss": -45.1533317565918, "global_step": 333644, "epoch": 2757} {"train_loss": -44.070858001708984, "global_step": 333645, "epoch": 2757} {"train_loss": -42.46352005004883, "global_step": 333646, "epoch": 2757} {"train_loss": -43.49951934814453, "global_step": 333647, "epoch": 2757} {"train_loss": -44.23588180541992, "global_step": 333648, "epoch": 2757} {"train_loss": -44.01808547973633, "global_step": 333649, "epoch": 2757} {"train_loss": -43.588653564453125, "global_step": 333650, "epoch": 2757} {"train_loss": -44.024654388427734, "global_step": 333651, "epoch": 2757} {"train_loss": -44.238792419433594, "global_step": 333652, "epoch": 2757} {"train_loss": -43.961265563964844, "global_step": 333653, "epoch": 2757} {"train_loss": -44.79474639892578, "global_step": 333654, "epoch": 2757} {"train_loss": -44.53424835205078, "global_step": 333655, "epoch": 2757} {"train_loss": -44.11058807373047, "global_step": 333656, "epoch": 2757} {"train_loss": -44.885009765625, "global_step": 333657, "epoch": 2757} {"train_loss": -44.173187255859375, "global_step": 333658, "epoch": 2757} {"train_loss": -44.86149215698242, "global_step": 333659, "epoch": 2757} {"train_loss": -44.794525146484375, "global_step": 333660, "epoch": 2757} {"train_loss": -43.918251037597656, "global_step": 333661, "epoch": 2757} {"train_loss": -44.71268844604492, "global_step": 333662, "epoch": 2757} {"train_loss": -43.743133544921875, "global_step": 333663, "epoch": 2757} {"train_loss": -44.305946350097656, "global_step": 333664, "epoch": 2757} {"train_loss": -44.754207611083984, "global_step": 333665, "epoch": 2757} {"train_loss": -43.96916198730469, "global_step": 333666, "epoch": 2757} {"train_loss": -43.60240936279297, "global_step": 333667, "epoch": 2757} {"train_loss": -45.1314582824707, "global_step": 333668, "epoch": 2757} {"train_loss": -44.498626708984375, "global_step": 333669, "epoch": 2757} {"train_loss": -44.29895782470703, "global_step": 333670, "epoch": 2757} {"train_loss": -45.12642288208008, "global_step": 333671, "epoch": 2757} {"train_loss": -45.25366973876953, "global_step": 333672, "epoch": 2757} {"train_loss": -44.472625732421875, "global_step": 333673, "epoch": 2757} {"train_loss": -44.97951889038086, "global_step": 333674, "epoch": 2757} {"train_loss": -44.507137298583984, "global_step": 333675, "epoch": 2757} {"train_loss": -44.75196838378906, "global_step": 333676, "epoch": 2757} {"train_loss": -45.12296676635742, "global_step": 333677, "epoch": 2757} {"train_loss": -44.321815490722656, "global_step": 333678, "epoch": 2757} {"train_loss": -44.835445404052734, "global_step": 333679, "epoch": 2757} {"train_loss": -45.496463775634766, "global_step": 333680, "epoch": 2757} {"train_loss": -44.938350677490234, "global_step": 333681, "epoch": 2757} {"train_loss": -44.59841537475586, "global_step": 333682, "epoch": 2757} {"train_loss": -45.00397491455078, "global_step": 333683, "epoch": 2757} {"train_loss": -44.209388732910156, "global_step": 333684, "epoch": 2757} {"train_loss": -44.35006332397461, "global_step": 333685, "epoch": 2757} {"train_loss": -44.72225570678711, "global_step": 333686, "epoch": 2757} {"train_loss": -45.16324996948242, "global_step": 333687, "epoch": 2757} {"train_loss": -44.65373611450195, "global_step": 333688, "epoch": 2757} {"train_loss": -44.971553802490234, "global_step": 333689, "epoch": 2757} {"train_loss": -44.89374542236328, "global_step": 333690, "epoch": 2757} {"train_loss": -44.87971878051758, "global_step": 333691, "epoch": 2757} {"train_loss": -44.29741668701172, "global_step": 333692, "epoch": 2757} {"train_loss": -44.364681243896484, "global_step": 333693, "epoch": 2757} {"train_loss": -44.29280471801758, "global_step": 333694, "epoch": 2757} {"train_loss": -44.66079330444336, "global_step": 333695, "epoch": 2757} {"train_loss": -44.922698974609375, "global_step": 333696, "epoch": 2757} {"train_loss": -43.669410705566406, "global_step": 333697, "epoch": 2757} {"train_loss": -44.33955001831055, "global_step": 333698, "epoch": 2757} {"train_loss": -44.67560577392578, "global_step": 333699, "epoch": 2757} {"train_loss": -43.99979782104492, "global_step": 333700, "epoch": 2757} {"train_loss": -44.189369201660156, "global_step": 333701, "epoch": 2757} {"train_loss": -44.538848876953125, "global_step": 333702, "epoch": 2757} {"train_loss": -44.30558395385742, "global_step": 333703, "epoch": 2757} {"train_loss": -43.03715896606445, "global_step": 333704, "epoch": 2757} {"train_loss": -43.190460205078125, "global_step": 333705, "epoch": 2757} {"train_loss": -42.89384078979492, "global_step": 333706, "epoch": 2757} {"train_loss": -44.202327728271484, "global_step": 333707, "epoch": 2757} {"train_loss": -44.68837356567383, "global_step": 333708, "epoch": 2757} {"train_loss": -43.0839958190918, "global_step": 333709, "epoch": 2757} {"train_loss": -44.57635498046875, "global_step": 333710, "epoch": 2757} {"train_loss": -44.88798141479492, "global_step": 333711, "epoch": 2757} {"train_loss": -43.89558029174805, "global_step": 333712, "epoch": 2757} {"train_loss": -44.80947494506836, "global_step": 333713, "epoch": 2757} {"train_loss": -44.890625, "global_step": 333714, "epoch": 2757} {"train_loss": -44.43115234375, "global_step": 333715, "epoch": 2757} {"train_loss": -42.53557586669922, "global_step": 333716, "epoch": 2757} {"train_loss": -43.8797194740989, "global_step": 333717, "epoch": 2757, "val_loss": 2531051.5} {"train_loss": -44.28617858886719, "global_step": 333718, "epoch": 2758} {"train_loss": -44.116615295410156, "global_step": 333719, "epoch": 2758} {"train_loss": -42.38215255737305, "global_step": 333720, "epoch": 2758} {"train_loss": -43.57867431640625, "global_step": 333721, "epoch": 2758} {"train_loss": -44.61552047729492, "global_step": 333722, "epoch": 2758} {"train_loss": -43.501686096191406, "global_step": 333723, "epoch": 2758} {"train_loss": -43.88169479370117, "global_step": 333724, "epoch": 2758} {"train_loss": -44.17939376831055, "global_step": 333725, "epoch": 2758} {"train_loss": -43.48015213012695, "global_step": 333726, "epoch": 2758} {"train_loss": -44.692440032958984, "global_step": 333727, "epoch": 2758} {"train_loss": -44.313331604003906, "global_step": 333728, "epoch": 2758} {"train_loss": -43.976478576660156, "global_step": 333729, "epoch": 2758} {"train_loss": -43.39165115356445, "global_step": 333730, "epoch": 2758} {"train_loss": -44.41563034057617, "global_step": 333731, "epoch": 2758} {"train_loss": -44.547325134277344, "global_step": 333732, "epoch": 2758} {"train_loss": -44.363975524902344, "global_step": 333733, "epoch": 2758} {"train_loss": -44.9160270690918, "global_step": 333734, "epoch": 2758} {"train_loss": -44.731868743896484, "global_step": 333735, "epoch": 2758} {"train_loss": -44.390869140625, "global_step": 333736, "epoch": 2758} {"train_loss": -43.79111099243164, "global_step": 333737, "epoch": 2758} {"train_loss": -44.8380126953125, "global_step": 333738, "epoch": 2758} {"train_loss": -44.69715118408203, "global_step": 333739, "epoch": 2758} {"train_loss": -44.920318603515625, "global_step": 333740, "epoch": 2758} {"train_loss": -45.068477630615234, "global_step": 333741, "epoch": 2758} {"train_loss": -45.01515579223633, "global_step": 333742, "epoch": 2758} {"train_loss": -44.54425811767578, "global_step": 333743, "epoch": 2758} {"train_loss": -44.82661819458008, "global_step": 333744, "epoch": 2758} {"train_loss": -44.96802520751953, "global_step": 333745, "epoch": 2758} {"train_loss": -44.91023254394531, "global_step": 333746, "epoch": 2758} {"train_loss": -44.35284423828125, "global_step": 333747, "epoch": 2758} {"train_loss": -44.60140609741211, "global_step": 333748, "epoch": 2758} {"train_loss": -44.8819465637207, "global_step": 333749, "epoch": 2758} {"train_loss": -45.07694625854492, "global_step": 333750, "epoch": 2758} {"train_loss": -43.954444885253906, "global_step": 333751, "epoch": 2758} {"train_loss": -42.752113342285156, "global_step": 333752, "epoch": 2758} {"train_loss": -44.92226028442383, "global_step": 333753, "epoch": 2758} {"train_loss": -44.810821533203125, "global_step": 333754, "epoch": 2758} {"train_loss": -42.8031120300293, "global_step": 333755, "epoch": 2758} {"train_loss": -42.593746185302734, "global_step": 333756, "epoch": 2758} {"train_loss": -44.34498596191406, "global_step": 333757, "epoch": 2758} {"train_loss": -45.27939987182617, "global_step": 333758, "epoch": 2758} {"train_loss": -43.77072525024414, "global_step": 333759, "epoch": 2758} {"train_loss": -43.7449836730957, "global_step": 333760, "epoch": 2758} {"train_loss": -44.5617790222168, "global_step": 333761, "epoch": 2758} {"train_loss": -45.077266693115234, "global_step": 333762, "epoch": 2758} {"train_loss": -44.630733489990234, "global_step": 333763, "epoch": 2758} {"train_loss": -44.28684616088867, "global_step": 333764, "epoch": 2758} {"train_loss": -45.42536163330078, "global_step": 333765, "epoch": 2758} {"train_loss": -44.202510833740234, "global_step": 333766, "epoch": 2758} {"train_loss": -44.969295501708984, "global_step": 333767, "epoch": 2758} {"train_loss": -45.070980072021484, "global_step": 333768, "epoch": 2758} {"train_loss": -44.81570053100586, "global_step": 333769, "epoch": 2758} {"train_loss": -44.21505355834961, "global_step": 333770, "epoch": 2758} {"train_loss": -44.783172607421875, "global_step": 333771, "epoch": 2758} {"train_loss": -44.385738372802734, "global_step": 333772, "epoch": 2758} {"train_loss": -44.442440032958984, "global_step": 333773, "epoch": 2758} {"train_loss": -44.53293991088867, "global_step": 333774, "epoch": 2758} {"train_loss": -43.573123931884766, "global_step": 333775, "epoch": 2758} {"train_loss": -44.61399459838867, "global_step": 333776, "epoch": 2758} {"train_loss": -43.8410758972168, "global_step": 333777, "epoch": 2758} {"train_loss": -44.75625228881836, "global_step": 333778, "epoch": 2758} {"train_loss": -43.74131393432617, "global_step": 333779, "epoch": 2758} {"train_loss": -43.86814880371094, "global_step": 333780, "epoch": 2758} {"train_loss": -43.58127975463867, "global_step": 333781, "epoch": 2758} {"train_loss": -43.58786392211914, "global_step": 333782, "epoch": 2758} {"train_loss": -42.22710418701172, "global_step": 333783, "epoch": 2758} {"train_loss": -44.367347717285156, "global_step": 333784, "epoch": 2758} {"train_loss": -43.34505844116211, "global_step": 333785, "epoch": 2758} {"train_loss": -42.61772918701172, "global_step": 333786, "epoch": 2758} {"train_loss": -43.10273361206055, "global_step": 333787, "epoch": 2758} {"train_loss": -43.880859375, "global_step": 333788, "epoch": 2758} {"train_loss": -43.60365295410156, "global_step": 333789, "epoch": 2758} {"train_loss": -42.22400665283203, "global_step": 333790, "epoch": 2758} {"train_loss": -43.21564865112305, "global_step": 333791, "epoch": 2758} {"train_loss": -43.17487716674805, "global_step": 333792, "epoch": 2758} {"train_loss": -42.759552001953125, "global_step": 333793, "epoch": 2758} {"train_loss": -40.634613037109375, "global_step": 333794, "epoch": 2758} {"train_loss": -43.52085494995117, "global_step": 333795, "epoch": 2758} {"train_loss": -42.21201705932617, "global_step": 333796, "epoch": 2758} {"train_loss": -39.10573959350586, "global_step": 333797, "epoch": 2758} {"train_loss": -42.81132507324219, "global_step": 333798, "epoch": 2758} {"train_loss": -42.90617752075195, "global_step": 333799, "epoch": 2758} {"train_loss": -40.76777648925781, "global_step": 333800, "epoch": 2758} {"train_loss": -44.12801742553711, "global_step": 333801, "epoch": 2758} {"train_loss": -41.42315673828125, "global_step": 333802, "epoch": 2758} {"train_loss": -43.006935119628906, "global_step": 333803, "epoch": 2758} {"train_loss": -43.658687591552734, "global_step": 333804, "epoch": 2758} {"train_loss": -42.930667877197266, "global_step": 333805, "epoch": 2758} {"train_loss": -42.03135299682617, "global_step": 333806, "epoch": 2758} {"train_loss": -44.61775207519531, "global_step": 333807, "epoch": 2758} {"train_loss": -43.48957824707031, "global_step": 333808, "epoch": 2758} {"train_loss": -43.2409553527832, "global_step": 333809, "epoch": 2758} {"train_loss": -43.534114837646484, "global_step": 333810, "epoch": 2758} {"train_loss": -44.39218521118164, "global_step": 333811, "epoch": 2758} {"train_loss": -42.734100341796875, "global_step": 333812, "epoch": 2758} {"train_loss": -43.81636047363281, "global_step": 333813, "epoch": 2758} {"train_loss": -44.78687286376953, "global_step": 333814, "epoch": 2758} {"train_loss": -44.34166717529297, "global_step": 333815, "epoch": 2758} {"train_loss": -43.32491683959961, "global_step": 333816, "epoch": 2758} {"train_loss": -44.15424346923828, "global_step": 333817, "epoch": 2758} {"train_loss": -44.63489532470703, "global_step": 333818, "epoch": 2758} {"train_loss": -43.045955657958984, "global_step": 333819, "epoch": 2758} {"train_loss": -44.4227294921875, "global_step": 333820, "epoch": 2758} {"train_loss": -44.19460678100586, "global_step": 333821, "epoch": 2758} {"train_loss": -43.15055465698242, "global_step": 333822, "epoch": 2758} {"train_loss": -43.09145736694336, "global_step": 333823, "epoch": 2758} {"train_loss": -43.4128532409668, "global_step": 333824, "epoch": 2758} {"train_loss": -44.363765716552734, "global_step": 333825, "epoch": 2758} {"train_loss": -44.016353607177734, "global_step": 333826, "epoch": 2758} {"train_loss": -44.604644775390625, "global_step": 333827, "epoch": 2758} {"train_loss": -43.371238708496094, "global_step": 333828, "epoch": 2758} {"train_loss": -44.41225051879883, "global_step": 333829, "epoch": 2758} {"train_loss": -43.75385665893555, "global_step": 333830, "epoch": 2758} {"train_loss": -44.10379409790039, "global_step": 333831, "epoch": 2758} {"train_loss": -44.15143966674805, "global_step": 333832, "epoch": 2758} {"train_loss": -43.75083541870117, "global_step": 333833, "epoch": 2758} {"train_loss": -44.89058303833008, "global_step": 333834, "epoch": 2758} {"train_loss": -40.45943069458008, "global_step": 333835, "epoch": 2758} {"train_loss": -42.868865966796875, "global_step": 333836, "epoch": 2758} {"train_loss": -42.177467346191406, "global_step": 333837, "epoch": 2758} {"train_loss": -43.827576030384414, "global_step": 333838, "epoch": 2758, "val_loss": 3206594.0} {"train_loss": -42.74541091918945, "global_step": 333839, "epoch": 2759} {"train_loss": -43.549964904785156, "global_step": 333840, "epoch": 2759} {"train_loss": -42.50212097167969, "global_step": 333841, "epoch": 2759} {"train_loss": -41.731727600097656, "global_step": 333842, "epoch": 2759} {"train_loss": -42.941017150878906, "global_step": 333843, "epoch": 2759} {"train_loss": -43.2418327331543, "global_step": 333844, "epoch": 2759} {"train_loss": -43.22222900390625, "global_step": 333845, "epoch": 2759} {"train_loss": -41.88098907470703, "global_step": 333846, "epoch": 2759} {"train_loss": -43.31911087036133, "global_step": 333847, "epoch": 2759} {"train_loss": -41.854427337646484, "global_step": 333848, "epoch": 2759} {"train_loss": -43.004127502441406, "global_step": 333849, "epoch": 2759} {"train_loss": -43.89658737182617, "global_step": 333850, "epoch": 2759} {"train_loss": -43.704349517822266, "global_step": 333851, "epoch": 2759} {"train_loss": -43.1181640625, "global_step": 333852, "epoch": 2759} {"train_loss": -44.11351013183594, "global_step": 333853, "epoch": 2759} {"train_loss": -43.49973678588867, "global_step": 333854, "epoch": 2759} {"train_loss": -43.015472412109375, "global_step": 333855, "epoch": 2759} {"train_loss": -43.302696228027344, "global_step": 333856, "epoch": 2759} {"train_loss": -43.09646987915039, "global_step": 333857, "epoch": 2759} {"train_loss": -43.18305206298828, "global_step": 333858, "epoch": 2759} {"train_loss": -41.694297790527344, "global_step": 333859, "epoch": 2759} {"train_loss": -40.87861251831055, "global_step": 333860, "epoch": 2759} {"train_loss": -43.628883361816406, "global_step": 333861, "epoch": 2759} {"train_loss": -43.984188079833984, "global_step": 333862, "epoch": 2759} {"train_loss": -42.17295455932617, "global_step": 333863, "epoch": 2759} {"train_loss": -43.449581146240234, "global_step": 333864, "epoch": 2759} {"train_loss": -38.219879150390625, "global_step": 333865, "epoch": 2759} {"train_loss": -42.06849670410156, "global_step": 333866, "epoch": 2759} {"train_loss": -43.53273391723633, "global_step": 333867, "epoch": 2759} {"train_loss": -42.633079528808594, "global_step": 333868, "epoch": 2759} {"train_loss": -43.1695442199707, "global_step": 333869, "epoch": 2759} {"train_loss": -42.57532501220703, "global_step": 333870, "epoch": 2759} {"train_loss": -43.474884033203125, "global_step": 333871, "epoch": 2759} {"train_loss": -43.47005844116211, "global_step": 333872, "epoch": 2759} {"train_loss": -44.04487228393555, "global_step": 333873, "epoch": 2759} {"train_loss": -42.78056716918945, "global_step": 333874, "epoch": 2759} {"train_loss": -40.36635971069336, "global_step": 333875, "epoch": 2759} {"train_loss": -43.0008659362793, "global_step": 333876, "epoch": 2759} {"train_loss": -42.82744216918945, "global_step": 333877, "epoch": 2759} {"train_loss": -41.00984573364258, "global_step": 333878, "epoch": 2759} {"train_loss": -43.3988151550293, "global_step": 333879, "epoch": 2759} {"train_loss": -44.26054000854492, "global_step": 333880, "epoch": 2759} {"train_loss": -42.28809356689453, "global_step": 333881, "epoch": 2759} {"train_loss": -42.49312973022461, "global_step": 333882, "epoch": 2759} {"train_loss": -42.624427795410156, "global_step": 333883, "epoch": 2759} {"train_loss": -43.97149658203125, "global_step": 333884, "epoch": 2759} {"train_loss": -42.4307975769043, "global_step": 333885, "epoch": 2759} {"train_loss": -42.544979095458984, "global_step": 333886, "epoch": 2759} {"train_loss": -42.7353401184082, "global_step": 333887, "epoch": 2759} {"train_loss": -42.69529342651367, "global_step": 333888, "epoch": 2759} {"train_loss": -43.26802444458008, "global_step": 333889, "epoch": 2759} {"train_loss": -41.40232849121094, "global_step": 333890, "epoch": 2759} {"train_loss": -43.64254379272461, "global_step": 333891, "epoch": 2759} {"train_loss": -43.352317810058594, "global_step": 333892, "epoch": 2759} {"train_loss": -39.704246520996094, "global_step": 333893, "epoch": 2759} {"train_loss": -43.249794006347656, "global_step": 333894, "epoch": 2759} {"train_loss": -42.901912689208984, "global_step": 333895, "epoch": 2759} {"train_loss": -42.35041427612305, "global_step": 333896, "epoch": 2759} {"train_loss": -43.38467025756836, "global_step": 333897, "epoch": 2759} {"train_loss": -43.056270599365234, "global_step": 333898, "epoch": 2759} {"train_loss": -43.43819808959961, "global_step": 333899, "epoch": 2759} {"train_loss": -43.61802291870117, "global_step": 333900, "epoch": 2759} {"train_loss": -43.450645446777344, "global_step": 333901, "epoch": 2759} {"train_loss": -44.18815612792969, "global_step": 333902, "epoch": 2759} {"train_loss": -41.86125564575195, "global_step": 333903, "epoch": 2759} {"train_loss": -43.19912338256836, "global_step": 333904, "epoch": 2759} {"train_loss": -43.713314056396484, "global_step": 333905, "epoch": 2759} {"train_loss": -43.572715759277344, "global_step": 333906, "epoch": 2759} {"train_loss": -43.61033248901367, "global_step": 333907, "epoch": 2759} {"train_loss": -43.423091888427734, "global_step": 333908, "epoch": 2759} {"train_loss": -43.06101989746094, "global_step": 333909, "epoch": 2759} {"train_loss": -42.85456466674805, "global_step": 333910, "epoch": 2759} {"train_loss": -42.07603073120117, "global_step": 333911, "epoch": 2759} {"train_loss": -43.635963439941406, "global_step": 333912, "epoch": 2759} {"train_loss": -43.52333068847656, "global_step": 333913, "epoch": 2759} {"train_loss": -43.07194900512695, "global_step": 333914, "epoch": 2759} {"train_loss": -43.15774154663086, "global_step": 333915, "epoch": 2759} {"train_loss": -44.003761291503906, "global_step": 333916, "epoch": 2759} {"train_loss": -43.72733688354492, "global_step": 333917, "epoch": 2759} {"train_loss": -43.87303924560547, "global_step": 333918, "epoch": 2759} {"train_loss": -44.489906311035156, "global_step": 333919, "epoch": 2759} {"train_loss": -43.70170974731445, "global_step": 333920, "epoch": 2759} {"train_loss": -43.333553314208984, "global_step": 333921, "epoch": 2759} {"train_loss": -43.74898147583008, "global_step": 333922, "epoch": 2759} {"train_loss": -44.011871337890625, "global_step": 333923, "epoch": 2759} {"train_loss": -44.18547439575195, "global_step": 333924, "epoch": 2759} {"train_loss": -44.958984375, "global_step": 333925, "epoch": 2759} {"train_loss": -44.64187240600586, "global_step": 333926, "epoch": 2759} {"train_loss": -44.21517562866211, "global_step": 333927, "epoch": 2759} {"train_loss": -43.59051513671875, "global_step": 333928, "epoch": 2759} {"train_loss": -44.2377815246582, "global_step": 333929, "epoch": 2759} {"train_loss": -44.6081657409668, "global_step": 333930, "epoch": 2759} {"train_loss": -44.25859832763672, "global_step": 333931, "epoch": 2759} {"train_loss": -44.223812103271484, "global_step": 333932, "epoch": 2759} {"train_loss": -44.32820510864258, "global_step": 333933, "epoch": 2759} {"train_loss": -44.247432708740234, "global_step": 333934, "epoch": 2759} {"train_loss": -43.90590286254883, "global_step": 333935, "epoch": 2759} {"train_loss": -44.9182243347168, "global_step": 333936, "epoch": 2759} {"train_loss": -43.950252532958984, "global_step": 333937, "epoch": 2759} {"train_loss": -44.60818099975586, "global_step": 333938, "epoch": 2759} {"train_loss": -44.60963821411133, "global_step": 333939, "epoch": 2759} {"train_loss": -43.93149185180664, "global_step": 333940, "epoch": 2759} {"train_loss": -44.99428939819336, "global_step": 333941, "epoch": 2759} {"train_loss": -45.065773010253906, "global_step": 333942, "epoch": 2759} {"train_loss": -44.888912200927734, "global_step": 333943, "epoch": 2759} {"train_loss": -44.32849884033203, "global_step": 333944, "epoch": 2759} {"train_loss": -44.603031158447266, "global_step": 333945, "epoch": 2759} {"train_loss": -45.234588623046875, "global_step": 333946, "epoch": 2759} {"train_loss": -44.17072296142578, "global_step": 333947, "epoch": 2759} {"train_loss": -43.7557258605957, "global_step": 333948, "epoch": 2759} {"train_loss": -43.40568923950195, "global_step": 333949, "epoch": 2759} {"train_loss": -44.57621383666992, "global_step": 333950, "epoch": 2759} {"train_loss": -44.678001403808594, "global_step": 333951, "epoch": 2759} {"train_loss": -44.438053131103516, "global_step": 333952, "epoch": 2759} {"train_loss": -44.3741569519043, "global_step": 333953, "epoch": 2759} {"train_loss": -44.742523193359375, "global_step": 333954, "epoch": 2759} {"train_loss": -42.95699691772461, "global_step": 333955, "epoch": 2759} {"train_loss": -44.12651443481445, "global_step": 333956, "epoch": 2759} {"train_loss": -44.14099884033203, "global_step": 333957, "epoch": 2759} {"train_loss": -43.67489242553711, "global_step": 333958, "epoch": 2759} {"train_loss": -43.37458435563016, "global_step": 333959, "epoch": 2759, "val_loss": 2509521.25} {"train_loss": -44.573848724365234, "global_step": 333960, "epoch": 2760} {"train_loss": -44.49449157714844, "global_step": 333961, "epoch": 2760} {"train_loss": -44.350101470947266, "global_step": 333962, "epoch": 2760} {"train_loss": -44.038970947265625, "global_step": 333963, "epoch": 2760} {"train_loss": -45.000728607177734, "global_step": 333964, "epoch": 2760} {"train_loss": -44.855567932128906, "global_step": 333965, "epoch": 2760} {"train_loss": -43.535926818847656, "global_step": 333966, "epoch": 2760} {"train_loss": -43.98090744018555, "global_step": 333967, "epoch": 2760} {"train_loss": -44.17765426635742, "global_step": 333968, "epoch": 2760} {"train_loss": -44.504276275634766, "global_step": 333969, "epoch": 2760} {"train_loss": -44.02304458618164, "global_step": 333970, "epoch": 2760} {"train_loss": -43.38361740112305, "global_step": 333971, "epoch": 2760} {"train_loss": -40.52394485473633, "global_step": 333972, "epoch": 2760} {"train_loss": -44.257320404052734, "global_step": 333973, "epoch": 2760} {"train_loss": -44.34678649902344, "global_step": 333974, "epoch": 2760} {"train_loss": -43.75724411010742, "global_step": 333975, "epoch": 2760} {"train_loss": -43.065921783447266, "global_step": 333976, "epoch": 2760} {"train_loss": -42.82733154296875, "global_step": 333977, "epoch": 2760} {"train_loss": -43.546871185302734, "global_step": 333978, "epoch": 2760} {"train_loss": -44.034820556640625, "global_step": 333979, "epoch": 2760} {"train_loss": -44.02981948852539, "global_step": 333980, "epoch": 2760} {"train_loss": -43.7165412902832, "global_step": 333981, "epoch": 2760} {"train_loss": -44.38583755493164, "global_step": 333982, "epoch": 2760} {"train_loss": -40.27024841308594, "global_step": 333983, "epoch": 2760} {"train_loss": -44.04803466796875, "global_step": 333984, "epoch": 2760} {"train_loss": -43.66776657104492, "global_step": 333985, "epoch": 2760} {"train_loss": -43.6887321472168, "global_step": 333986, "epoch": 2760} {"train_loss": -44.12941360473633, "global_step": 333987, "epoch": 2760} {"train_loss": -44.113948822021484, "global_step": 333988, "epoch": 2760} {"train_loss": -42.905113220214844, "global_step": 333989, "epoch": 2760} {"train_loss": -40.56998825073242, "global_step": 333990, "epoch": 2760} {"train_loss": -37.12416458129883, "global_step": 333991, "epoch": 2760} {"train_loss": -42.00230026245117, "global_step": 333992, "epoch": 2760} {"train_loss": -43.294036865234375, "global_step": 333993, "epoch": 2760} {"train_loss": -40.94591522216797, "global_step": 333994, "epoch": 2760} {"train_loss": -40.955501556396484, "global_step": 333995, "epoch": 2760} {"train_loss": -43.05316925048828, "global_step": 333996, "epoch": 2760} {"train_loss": -42.7986946105957, "global_step": 333997, "epoch": 2760} {"train_loss": -42.67106246948242, "global_step": 333998, "epoch": 2760} {"train_loss": -43.414058685302734, "global_step": 333999, "epoch": 2760} {"train_loss": -41.303951263427734, "global_step": 334000, "epoch": 2760} {"train_loss": -43.442779541015625, "global_step": 334001, "epoch": 2760} {"train_loss": -41.88507843017578, "global_step": 334002, "epoch": 2760} {"train_loss": -40.576900482177734, "global_step": 334003, "epoch": 2760} {"train_loss": -40.751014709472656, "global_step": 334004, "epoch": 2760} {"train_loss": -42.2498779296875, "global_step": 334005, "epoch": 2760} {"train_loss": -41.22822189331055, "global_step": 334006, "epoch": 2760} {"train_loss": -41.11378860473633, "global_step": 334007, "epoch": 2760} {"train_loss": -42.08949279785156, "global_step": 334008, "epoch": 2760} {"train_loss": -41.066585540771484, "global_step": 334009, "epoch": 2760} {"train_loss": -38.6932258605957, "global_step": 334010, "epoch": 2760} {"train_loss": -43.481842041015625, "global_step": 334011, "epoch": 2760} {"train_loss": -41.367652893066406, "global_step": 334012, "epoch": 2760} {"train_loss": -41.35675811767578, "global_step": 334013, "epoch": 2760} {"train_loss": -42.79750442504883, "global_step": 334014, "epoch": 2760} {"train_loss": -41.59221649169922, "global_step": 334015, "epoch": 2760} {"train_loss": -42.32558059692383, "global_step": 334016, "epoch": 2760} {"train_loss": -41.743255615234375, "global_step": 334017, "epoch": 2760} {"train_loss": -42.213409423828125, "global_step": 334018, "epoch": 2760} {"train_loss": -42.8017692565918, "global_step": 334019, "epoch": 2760} {"train_loss": -42.37258529663086, "global_step": 334020, "epoch": 2760} {"train_loss": -44.15023422241211, "global_step": 334021, "epoch": 2760} {"train_loss": -43.28034591674805, "global_step": 334022, "epoch": 2760} {"train_loss": -43.400611877441406, "global_step": 334023, "epoch": 2760} {"train_loss": -43.740753173828125, "global_step": 334024, "epoch": 2760} {"train_loss": -43.18809509277344, "global_step": 334025, "epoch": 2760} {"train_loss": -43.778778076171875, "global_step": 334026, "epoch": 2760} {"train_loss": -43.46200180053711, "global_step": 334027, "epoch": 2760} {"train_loss": -43.86327362060547, "global_step": 334028, "epoch": 2760} {"train_loss": -44.37070846557617, "global_step": 334029, "epoch": 2760} {"train_loss": -43.55314636230469, "global_step": 334030, "epoch": 2760} {"train_loss": -44.149208068847656, "global_step": 334031, "epoch": 2760} {"train_loss": -44.16141891479492, "global_step": 334032, "epoch": 2760} {"train_loss": -44.06783676147461, "global_step": 334033, "epoch": 2760} {"train_loss": -43.982643127441406, "global_step": 334034, "epoch": 2760} {"train_loss": -43.82503890991211, "global_step": 334035, "epoch": 2760} {"train_loss": -44.178871154785156, "global_step": 334036, "epoch": 2760} {"train_loss": -44.07267379760742, "global_step": 334037, "epoch": 2760} {"train_loss": -44.007232666015625, "global_step": 334038, "epoch": 2760} {"train_loss": -44.3149528503418, "global_step": 334039, "epoch": 2760} {"train_loss": -44.37055206298828, "global_step": 334040, "epoch": 2760} {"train_loss": -44.066810607910156, "global_step": 334041, "epoch": 2760} {"train_loss": -43.26453399658203, "global_step": 334042, "epoch": 2760} {"train_loss": -44.119510650634766, "global_step": 334043, "epoch": 2760} {"train_loss": -44.2296142578125, "global_step": 334044, "epoch": 2760} {"train_loss": -44.417083740234375, "global_step": 334045, "epoch": 2760} {"train_loss": -44.13349533081055, "global_step": 334046, "epoch": 2760} {"train_loss": -44.348140716552734, "global_step": 334047, "epoch": 2760} {"train_loss": -44.25938034057617, "global_step": 334048, "epoch": 2760} {"train_loss": -44.07331466674805, "global_step": 334049, "epoch": 2760} {"train_loss": -43.95389938354492, "global_step": 334050, "epoch": 2760} {"train_loss": -44.83436965942383, "global_step": 334051, "epoch": 2760} {"train_loss": -44.23604965209961, "global_step": 334052, "epoch": 2760} {"train_loss": -43.63541030883789, "global_step": 334053, "epoch": 2760} {"train_loss": -43.53885269165039, "global_step": 334054, "epoch": 2760} {"train_loss": -44.75013732910156, "global_step": 334055, "epoch": 2760} {"train_loss": -44.46247100830078, "global_step": 334056, "epoch": 2760} {"train_loss": -45.16297149658203, "global_step": 334057, "epoch": 2760} {"train_loss": -44.965057373046875, "global_step": 334058, "epoch": 2760} {"train_loss": -44.785160064697266, "global_step": 334059, "epoch": 2760} {"train_loss": -44.56367492675781, "global_step": 334060, "epoch": 2760} {"train_loss": -44.621009826660156, "global_step": 334061, "epoch": 2760} {"train_loss": -45.319149017333984, "global_step": 334062, "epoch": 2760} {"train_loss": -44.795875549316406, "global_step": 334063, "epoch": 2760} {"train_loss": -44.15782928466797, "global_step": 334064, "epoch": 2760} {"train_loss": -44.366275787353516, "global_step": 334065, "epoch": 2760} {"train_loss": -44.43498611450195, "global_step": 334066, "epoch": 2760} {"train_loss": -43.7376823425293, "global_step": 334067, "epoch": 2760} {"train_loss": -43.823089599609375, "global_step": 334068, "epoch": 2760} {"train_loss": -44.55706787109375, "global_step": 334069, "epoch": 2760} {"train_loss": -44.532379150390625, "global_step": 334070, "epoch": 2760} {"train_loss": -44.73640060424805, "global_step": 334071, "epoch": 2760} {"train_loss": -43.13222122192383, "global_step": 334072, "epoch": 2760} {"train_loss": -43.933349609375, "global_step": 334073, "epoch": 2760} {"train_loss": -44.83378219604492, "global_step": 334074, "epoch": 2760} {"train_loss": -44.03719711303711, "global_step": 334075, "epoch": 2760} {"train_loss": -41.42042541503906, "global_step": 334076, "epoch": 2760} {"train_loss": -44.61739730834961, "global_step": 334077, "epoch": 2760} {"train_loss": -43.15353012084961, "global_step": 334078, "epoch": 2760} {"train_loss": -42.191043853759766, "global_step": 334079, "epoch": 2760} {"train_loss": -43.38777800630932, "global_step": 334080, "epoch": 2760, "val_loss": 2505908.75} {"train_loss": -43.0398063659668, "global_step": 334081, "epoch": 2761} {"train_loss": -42.026180267333984, "global_step": 334082, "epoch": 2761} {"train_loss": -43.75140380859375, "global_step": 334083, "epoch": 2761} {"train_loss": -44.75353240966797, "global_step": 334084, "epoch": 2761} {"train_loss": -44.39735412597656, "global_step": 334085, "epoch": 2761} {"train_loss": -44.32792282104492, "global_step": 334086, "epoch": 2761} {"train_loss": -44.94586944580078, "global_step": 334087, "epoch": 2761} {"train_loss": -43.31609344482422, "global_step": 334088, "epoch": 2761} {"train_loss": -44.03960037231445, "global_step": 334089, "epoch": 2761} {"train_loss": -45.18437576293945, "global_step": 334090, "epoch": 2761} {"train_loss": -44.1152229309082, "global_step": 334091, "epoch": 2761} {"train_loss": -44.08366012573242, "global_step": 334092, "epoch": 2761} {"train_loss": -44.75395584106445, "global_step": 334093, "epoch": 2761} {"train_loss": -44.23353958129883, "global_step": 334094, "epoch": 2761} {"train_loss": -43.325225830078125, "global_step": 334095, "epoch": 2761} {"train_loss": -44.017696380615234, "global_step": 334096, "epoch": 2761} {"train_loss": -44.57476806640625, "global_step": 334097, "epoch": 2761} {"train_loss": -41.79471969604492, "global_step": 334098, "epoch": 2761} {"train_loss": -43.382720947265625, "global_step": 334099, "epoch": 2761} {"train_loss": -43.860740661621094, "global_step": 334100, "epoch": 2761} {"train_loss": -43.287925720214844, "global_step": 334101, "epoch": 2761} {"train_loss": -42.573997497558594, "global_step": 334102, "epoch": 2761} {"train_loss": -43.506465911865234, "global_step": 334103, "epoch": 2761} {"train_loss": -43.37693405151367, "global_step": 334104, "epoch": 2761} {"train_loss": -43.36832809448242, "global_step": 334105, "epoch": 2761} {"train_loss": -44.29719161987305, "global_step": 334106, "epoch": 2761} {"train_loss": -43.819984436035156, "global_step": 334107, "epoch": 2761} {"train_loss": -43.214385986328125, "global_step": 334108, "epoch": 2761} {"train_loss": -44.100582122802734, "global_step": 334109, "epoch": 2761} {"train_loss": -43.94101333618164, "global_step": 334110, "epoch": 2761} {"train_loss": -44.27101135253906, "global_step": 334111, "epoch": 2761} {"train_loss": -44.09821319580078, "global_step": 334112, "epoch": 2761} {"train_loss": -44.736454010009766, "global_step": 334113, "epoch": 2761} {"train_loss": -44.18518829345703, "global_step": 334114, "epoch": 2761} {"train_loss": -43.4796028137207, "global_step": 334115, "epoch": 2761} {"train_loss": -44.342803955078125, "global_step": 334116, "epoch": 2761} {"train_loss": -43.61698532104492, "global_step": 334117, "epoch": 2761} {"train_loss": -44.61484909057617, "global_step": 334118, "epoch": 2761} {"train_loss": -44.38993835449219, "global_step": 334119, "epoch": 2761} {"train_loss": -44.345237731933594, "global_step": 334120, "epoch": 2761} {"train_loss": -44.15100860595703, "global_step": 334121, "epoch": 2761} {"train_loss": -44.905330657958984, "global_step": 334122, "epoch": 2761} {"train_loss": -44.720001220703125, "global_step": 334123, "epoch": 2761} {"train_loss": -44.733314514160156, "global_step": 334124, "epoch": 2761} {"train_loss": -44.54986572265625, "global_step": 334125, "epoch": 2761} {"train_loss": -44.33024978637695, "global_step": 334126, "epoch": 2761} {"train_loss": -44.54667663574219, "global_step": 334127, "epoch": 2761} {"train_loss": -45.037933349609375, "global_step": 334128, "epoch": 2761} {"train_loss": -44.82127380371094, "global_step": 334129, "epoch": 2761} {"train_loss": -44.6778450012207, "global_step": 334130, "epoch": 2761} {"train_loss": -45.4593391418457, "global_step": 334131, "epoch": 2761} {"train_loss": -44.51089096069336, "global_step": 334132, "epoch": 2761} {"train_loss": -44.186744689941406, "global_step": 334133, "epoch": 2761} {"train_loss": -44.77466583251953, "global_step": 334134, "epoch": 2761} {"train_loss": -44.63179397583008, "global_step": 334135, "epoch": 2761} {"train_loss": -44.89274215698242, "global_step": 334136, "epoch": 2761} {"train_loss": -45.08765411376953, "global_step": 334137, "epoch": 2761} {"train_loss": -43.47689437866211, "global_step": 334138, "epoch": 2761} {"train_loss": -44.12473678588867, "global_step": 334139, "epoch": 2761} {"train_loss": -44.56183624267578, "global_step": 334140, "epoch": 2761} {"train_loss": -43.0977897644043, "global_step": 334141, "epoch": 2761} {"train_loss": -43.232295989990234, "global_step": 334142, "epoch": 2761} {"train_loss": -43.771785736083984, "global_step": 334143, "epoch": 2761} {"train_loss": -42.147762298583984, "global_step": 334144, "epoch": 2761} {"train_loss": -43.46726989746094, "global_step": 334145, "epoch": 2761} {"train_loss": -42.479610443115234, "global_step": 334146, "epoch": 2761} {"train_loss": -43.61932373046875, "global_step": 334147, "epoch": 2761} {"train_loss": -43.509185791015625, "global_step": 334148, "epoch": 2761} {"train_loss": -43.026611328125, "global_step": 334149, "epoch": 2761} {"train_loss": -43.63912582397461, "global_step": 334150, "epoch": 2761} {"train_loss": -44.31722640991211, "global_step": 334151, "epoch": 2761} {"train_loss": -43.71027755737305, "global_step": 334152, "epoch": 2761} {"train_loss": -43.64712142944336, "global_step": 334153, "epoch": 2761} {"train_loss": -44.148555755615234, "global_step": 334154, "epoch": 2761} {"train_loss": -43.77618408203125, "global_step": 334155, "epoch": 2761} {"train_loss": -43.72419357299805, "global_step": 334156, "epoch": 2761} {"train_loss": -44.500205993652344, "global_step": 334157, "epoch": 2761} {"train_loss": -44.15431594848633, "global_step": 334158, "epoch": 2761} {"train_loss": -44.70717239379883, "global_step": 334159, "epoch": 2761} {"train_loss": -43.928775787353516, "global_step": 334160, "epoch": 2761} {"train_loss": -44.71101760864258, "global_step": 334161, "epoch": 2761} {"train_loss": -44.245731353759766, "global_step": 334162, "epoch": 2761} {"train_loss": -44.12392044067383, "global_step": 334163, "epoch": 2761} {"train_loss": -44.6629638671875, "global_step": 334164, "epoch": 2761} {"train_loss": -44.06974411010742, "global_step": 334165, "epoch": 2761} {"train_loss": -43.88904571533203, "global_step": 334166, "epoch": 2761} {"train_loss": -44.1515998840332, "global_step": 334167, "epoch": 2761} {"train_loss": -44.75688934326172, "global_step": 334168, "epoch": 2761} {"train_loss": -43.825496673583984, "global_step": 334169, "epoch": 2761} {"train_loss": -44.056861877441406, "global_step": 334170, "epoch": 2761} {"train_loss": -43.76261520385742, "global_step": 334171, "epoch": 2761} {"train_loss": -43.26250076293945, "global_step": 334172, "epoch": 2761} {"train_loss": -44.475521087646484, "global_step": 334173, "epoch": 2761} {"train_loss": -43.89799880981445, "global_step": 334174, "epoch": 2761} {"train_loss": -42.862396240234375, "global_step": 334175, "epoch": 2761} {"train_loss": -43.83949661254883, "global_step": 334176, "epoch": 2761} {"train_loss": -45.08865737915039, "global_step": 334177, "epoch": 2761} {"train_loss": -42.46981430053711, "global_step": 334178, "epoch": 2761} {"train_loss": -43.4122428894043, "global_step": 334179, "epoch": 2761} {"train_loss": -43.279327392578125, "global_step": 334180, "epoch": 2761} {"train_loss": -43.564361572265625, "global_step": 334181, "epoch": 2761} {"train_loss": -43.60763168334961, "global_step": 334182, "epoch": 2761} {"train_loss": -43.63193893432617, "global_step": 334183, "epoch": 2761} {"train_loss": -43.35118103027344, "global_step": 334184, "epoch": 2761} {"train_loss": -44.169517517089844, "global_step": 334185, "epoch": 2761} {"train_loss": -44.254371643066406, "global_step": 334186, "epoch": 2761} {"train_loss": -44.1534423828125, "global_step": 334187, "epoch": 2761} {"train_loss": -44.27663803100586, "global_step": 334188, "epoch": 2761} {"train_loss": -44.589717864990234, "global_step": 334189, "epoch": 2761} {"train_loss": -44.30085754394531, "global_step": 334190, "epoch": 2761} {"train_loss": -44.64735794067383, "global_step": 334191, "epoch": 2761} {"train_loss": -44.47307205200195, "global_step": 334192, "epoch": 2761} {"train_loss": -45.01826095581055, "global_step": 334193, "epoch": 2761} {"train_loss": -44.5069580078125, "global_step": 334194, "epoch": 2761} {"train_loss": -45.01313400268555, "global_step": 334195, "epoch": 2761} {"train_loss": -44.50682830810547, "global_step": 334196, "epoch": 2761} {"train_loss": -44.86103439331055, "global_step": 334197, "epoch": 2761} {"train_loss": -45.0256462097168, "global_step": 334198, "epoch": 2761} {"train_loss": -44.403968811035156, "global_step": 334199, "epoch": 2761} {"train_loss": -45.00643539428711, "global_step": 334200, "epoch": 2761} {"train_loss": -44.05993605054115, "global_step": 334201, "epoch": 2761, "val_loss": 2509686.25} {"train_loss": -44.767940521240234, "global_step": 334202, "epoch": 2762} {"train_loss": -44.51457977294922, "global_step": 334203, "epoch": 2762} {"train_loss": -44.41498565673828, "global_step": 334204, "epoch": 2762} {"train_loss": -45.10888671875, "global_step": 334205, "epoch": 2762} {"train_loss": -44.20625686645508, "global_step": 334206, "epoch": 2762} {"train_loss": -44.75260543823242, "global_step": 334207, "epoch": 2762} {"train_loss": -44.52583312988281, "global_step": 334208, "epoch": 2762} {"train_loss": -44.84461212158203, "global_step": 334209, "epoch": 2762} {"train_loss": -45.22480773925781, "global_step": 334210, "epoch": 2762} {"train_loss": -45.02307891845703, "global_step": 334211, "epoch": 2762} {"train_loss": -44.607810974121094, "global_step": 334212, "epoch": 2762} {"train_loss": -44.850059509277344, "global_step": 334213, "epoch": 2762} {"train_loss": -44.84528350830078, "global_step": 334214, "epoch": 2762} {"train_loss": -43.944881439208984, "global_step": 334215, "epoch": 2762} {"train_loss": -44.997589111328125, "global_step": 334216, "epoch": 2762} {"train_loss": -45.0313835144043, "global_step": 334217, "epoch": 2762} {"train_loss": -44.7188606262207, "global_step": 334218, "epoch": 2762} {"train_loss": -44.21204376220703, "global_step": 334219, "epoch": 2762} {"train_loss": -45.40679931640625, "global_step": 334220, "epoch": 2762} {"train_loss": -45.32313919067383, "global_step": 334221, "epoch": 2762} {"train_loss": -44.39487838745117, "global_step": 334222, "epoch": 2762} {"train_loss": -44.02878189086914, "global_step": 334223, "epoch": 2762} {"train_loss": -44.465118408203125, "global_step": 334224, "epoch": 2762} {"train_loss": -44.43367385864258, "global_step": 334225, "epoch": 2762} {"train_loss": -44.41807174682617, "global_step": 334226, "epoch": 2762} {"train_loss": -45.31348419189453, "global_step": 334227, "epoch": 2762} {"train_loss": -44.830318450927734, "global_step": 334228, "epoch": 2762} {"train_loss": -44.913570404052734, "global_step": 334229, "epoch": 2762} {"train_loss": -43.849571228027344, "global_step": 334230, "epoch": 2762} {"train_loss": -44.38176727294922, "global_step": 334231, "epoch": 2762} {"train_loss": -44.03776931762695, "global_step": 334232, "epoch": 2762} {"train_loss": -43.823333740234375, "global_step": 334233, "epoch": 2762} {"train_loss": -44.06480026245117, "global_step": 334234, "epoch": 2762} {"train_loss": -44.67351150512695, "global_step": 334235, "epoch": 2762} {"train_loss": -44.281978607177734, "global_step": 334236, "epoch": 2762} {"train_loss": -44.337833404541016, "global_step": 334237, "epoch": 2762} {"train_loss": -44.27131271362305, "global_step": 334238, "epoch": 2762} {"train_loss": -44.80165481567383, "global_step": 334239, "epoch": 2762} {"train_loss": -45.08912658691406, "global_step": 334240, "epoch": 2762} {"train_loss": -44.46629333496094, "global_step": 334241, "epoch": 2762} {"train_loss": -44.69936752319336, "global_step": 334242, "epoch": 2762} {"train_loss": -44.01318359375, "global_step": 334243, "epoch": 2762} {"train_loss": -44.337276458740234, "global_step": 334244, "epoch": 2762} {"train_loss": -45.106239318847656, "global_step": 334245, "epoch": 2762} {"train_loss": -44.398799896240234, "global_step": 334246, "epoch": 2762} {"train_loss": -43.54536056518555, "global_step": 334247, "epoch": 2762} {"train_loss": -44.619956970214844, "global_step": 334248, "epoch": 2762} {"train_loss": -44.38786697387695, "global_step": 334249, "epoch": 2762} {"train_loss": -43.30646514892578, "global_step": 334250, "epoch": 2762} {"train_loss": -44.18637466430664, "global_step": 334251, "epoch": 2762} {"train_loss": -44.041927337646484, "global_step": 334252, "epoch": 2762} {"train_loss": -44.152565002441406, "global_step": 334253, "epoch": 2762} {"train_loss": -45.03119659423828, "global_step": 334254, "epoch": 2762} {"train_loss": -43.655731201171875, "global_step": 334255, "epoch": 2762} {"train_loss": -44.6939811706543, "global_step": 334256, "epoch": 2762} {"train_loss": -44.79551696777344, "global_step": 334257, "epoch": 2762} {"train_loss": -44.62847137451172, "global_step": 334258, "epoch": 2762} {"train_loss": -44.63186264038086, "global_step": 334259, "epoch": 2762} {"train_loss": -44.82351303100586, "global_step": 334260, "epoch": 2762} {"train_loss": -44.959285736083984, "global_step": 334261, "epoch": 2762} {"train_loss": -44.793636322021484, "global_step": 334262, "epoch": 2762} {"train_loss": -44.302833557128906, "global_step": 334263, "epoch": 2762} {"train_loss": -44.968502044677734, "global_step": 334264, "epoch": 2762} {"train_loss": -44.430824279785156, "global_step": 334265, "epoch": 2762} {"train_loss": -43.48521423339844, "global_step": 334266, "epoch": 2762} {"train_loss": -43.72651290893555, "global_step": 334267, "epoch": 2762} {"train_loss": -43.91641616821289, "global_step": 334268, "epoch": 2762} {"train_loss": -44.724300384521484, "global_step": 334269, "epoch": 2762} {"train_loss": -44.419734954833984, "global_step": 334270, "epoch": 2762} {"train_loss": -43.17477035522461, "global_step": 334271, "epoch": 2762} {"train_loss": -43.41626739501953, "global_step": 334272, "epoch": 2762} {"train_loss": -43.0556755065918, "global_step": 334273, "epoch": 2762} {"train_loss": -44.60313415527344, "global_step": 334274, "epoch": 2762} {"train_loss": -44.68653869628906, "global_step": 334275, "epoch": 2762} {"train_loss": -43.742828369140625, "global_step": 334276, "epoch": 2762} {"train_loss": -42.4535026550293, "global_step": 334277, "epoch": 2762} {"train_loss": -41.538333892822266, "global_step": 334278, "epoch": 2762} {"train_loss": -44.59027099609375, "global_step": 334279, "epoch": 2762} {"train_loss": -42.25236892700195, "global_step": 334280, "epoch": 2762} {"train_loss": -40.27595138549805, "global_step": 334281, "epoch": 2762} {"train_loss": -44.189517974853516, "global_step": 334282, "epoch": 2762} {"train_loss": -39.78767776489258, "global_step": 334283, "epoch": 2762} {"train_loss": -42.506282806396484, "global_step": 334284, "epoch": 2762} {"train_loss": -42.5633659362793, "global_step": 334285, "epoch": 2762} {"train_loss": -40.91996383666992, "global_step": 334286, "epoch": 2762} {"train_loss": -42.0936164855957, "global_step": 334287, "epoch": 2762} {"train_loss": -42.736297607421875, "global_step": 334288, "epoch": 2762} {"train_loss": -43.12514114379883, "global_step": 334289, "epoch": 2762} {"train_loss": -42.50773239135742, "global_step": 334290, "epoch": 2762} {"train_loss": -42.45017623901367, "global_step": 334291, "epoch": 2762} {"train_loss": -43.62765121459961, "global_step": 334292, "epoch": 2762} {"train_loss": -42.91091537475586, "global_step": 334293, "epoch": 2762} {"train_loss": -43.467735290527344, "global_step": 334294, "epoch": 2762} {"train_loss": -44.077091217041016, "global_step": 334295, "epoch": 2762} {"train_loss": -42.5762825012207, "global_step": 334296, "epoch": 2762} {"train_loss": -43.52334213256836, "global_step": 334297, "epoch": 2762} {"train_loss": -43.64457702636719, "global_step": 334298, "epoch": 2762} {"train_loss": -44.00101852416992, "global_step": 334299, "epoch": 2762} {"train_loss": -42.7950553894043, "global_step": 334300, "epoch": 2762} {"train_loss": -44.56458282470703, "global_step": 334301, "epoch": 2762} {"train_loss": -43.721099853515625, "global_step": 334302, "epoch": 2762} {"train_loss": -43.211849212646484, "global_step": 334303, "epoch": 2762} {"train_loss": -43.11399459838867, "global_step": 334304, "epoch": 2762} {"train_loss": -41.911251068115234, "global_step": 334305, "epoch": 2762} {"train_loss": -43.61248779296875, "global_step": 334306, "epoch": 2762} {"train_loss": -43.22185134887695, "global_step": 334307, "epoch": 2762} {"train_loss": -43.025489807128906, "global_step": 334308, "epoch": 2762} {"train_loss": -43.65707015991211, "global_step": 334309, "epoch": 2762} {"train_loss": -44.47111892700195, "global_step": 334310, "epoch": 2762} {"train_loss": -43.96993637084961, "global_step": 334311, "epoch": 2762} {"train_loss": -44.210018157958984, "global_step": 334312, "epoch": 2762} {"train_loss": -45.09854507446289, "global_step": 334313, "epoch": 2762} {"train_loss": -43.60758972167969, "global_step": 334314, "epoch": 2762} {"train_loss": -43.48029327392578, "global_step": 334315, "epoch": 2762} {"train_loss": -44.63813400268555, "global_step": 334316, "epoch": 2762} {"train_loss": -43.76021957397461, "global_step": 334317, "epoch": 2762} {"train_loss": -43.43107986450195, "global_step": 334318, "epoch": 2762} {"train_loss": -44.9549560546875, "global_step": 334319, "epoch": 2762} {"train_loss": -43.71360397338867, "global_step": 334320, "epoch": 2762} {"train_loss": -43.55869674682617, "global_step": 334321, "epoch": 2762} {"train_loss": -43.98185055315002, "global_step": 334322, "epoch": 2762, "val_loss": 2479727.25} {"train_loss": -43.59518051147461, "global_step": 334323, "epoch": 2763} {"train_loss": -40.8213005065918, "global_step": 334324, "epoch": 2763} {"train_loss": -44.17121505737305, "global_step": 334325, "epoch": 2763} {"train_loss": -38.70380783081055, "global_step": 334326, "epoch": 2763} {"train_loss": -44.17954635620117, "global_step": 334327, "epoch": 2763} {"train_loss": -40.25520706176758, "global_step": 334328, "epoch": 2763} {"train_loss": -42.68891525268555, "global_step": 334329, "epoch": 2763} {"train_loss": -42.33018493652344, "global_step": 334330, "epoch": 2763} {"train_loss": -42.552764892578125, "global_step": 334331, "epoch": 2763} {"train_loss": -43.16093063354492, "global_step": 334332, "epoch": 2763} {"train_loss": -42.4548454284668, "global_step": 334333, "epoch": 2763} {"train_loss": -41.09336471557617, "global_step": 334334, "epoch": 2763} {"train_loss": -43.669586181640625, "global_step": 334335, "epoch": 2763} {"train_loss": -42.84864044189453, "global_step": 334336, "epoch": 2763} {"train_loss": -42.85970687866211, "global_step": 334337, "epoch": 2763} {"train_loss": -43.28878402709961, "global_step": 334338, "epoch": 2763} {"train_loss": -43.013179779052734, "global_step": 334339, "epoch": 2763} {"train_loss": -42.77777862548828, "global_step": 334340, "epoch": 2763} {"train_loss": -43.2498779296875, "global_step": 334341, "epoch": 2763} {"train_loss": -44.02296829223633, "global_step": 334342, "epoch": 2763} {"train_loss": -43.65888595581055, "global_step": 334343, "epoch": 2763} {"train_loss": -43.13124465942383, "global_step": 334344, "epoch": 2763} {"train_loss": -44.40620040893555, "global_step": 334345, "epoch": 2763} {"train_loss": -44.20355987548828, "global_step": 334346, "epoch": 2763} {"train_loss": -44.43164825439453, "global_step": 334347, "epoch": 2763} {"train_loss": -44.70613479614258, "global_step": 334348, "epoch": 2763} {"train_loss": -44.0831298828125, "global_step": 334349, "epoch": 2763} {"train_loss": -43.41538619995117, "global_step": 334350, "epoch": 2763} {"train_loss": -44.62662887573242, "global_step": 334351, "epoch": 2763} {"train_loss": -41.4302978515625, "global_step": 334352, "epoch": 2763} {"train_loss": -44.416927337646484, "global_step": 334353, "epoch": 2763} {"train_loss": -44.29138946533203, "global_step": 334354, "epoch": 2763} {"train_loss": -43.70208740234375, "global_step": 334355, "epoch": 2763} {"train_loss": -43.653411865234375, "global_step": 334356, "epoch": 2763} {"train_loss": -43.744667053222656, "global_step": 334357, "epoch": 2763} {"train_loss": -43.685462951660156, "global_step": 334358, "epoch": 2763} {"train_loss": -43.88721466064453, "global_step": 334359, "epoch": 2763} {"train_loss": -43.472129821777344, "global_step": 334360, "epoch": 2763} {"train_loss": -43.86690902709961, "global_step": 334361, "epoch": 2763} {"train_loss": -43.444122314453125, "global_step": 334362, "epoch": 2763} {"train_loss": -43.071556091308594, "global_step": 334363, "epoch": 2763} {"train_loss": -43.382568359375, "global_step": 334364, "epoch": 2763} {"train_loss": -44.189449310302734, "global_step": 334365, "epoch": 2763} {"train_loss": -43.93888473510742, "global_step": 334366, "epoch": 2763} {"train_loss": -43.818965911865234, "global_step": 334367, "epoch": 2763} {"train_loss": -44.3341178894043, "global_step": 334368, "epoch": 2763} {"train_loss": -44.03059005737305, "global_step": 334369, "epoch": 2763} {"train_loss": -44.27685546875, "global_step": 334370, "epoch": 2763} {"train_loss": -43.797523498535156, "global_step": 334371, "epoch": 2763} {"train_loss": -43.25666046142578, "global_step": 334372, "epoch": 2763} {"train_loss": -44.22964859008789, "global_step": 334373, "epoch": 2763} {"train_loss": -44.326229095458984, "global_step": 334374, "epoch": 2763} {"train_loss": -44.20831298828125, "global_step": 334375, "epoch": 2763} {"train_loss": -43.90102767944336, "global_step": 334376, "epoch": 2763} {"train_loss": -44.482666015625, "global_step": 334377, "epoch": 2763} {"train_loss": -44.53522872924805, "global_step": 334378, "epoch": 2763} {"train_loss": -44.6374626159668, "global_step": 334379, "epoch": 2763} {"train_loss": -43.713375091552734, "global_step": 334380, "epoch": 2763} {"train_loss": -44.63661193847656, "global_step": 334381, "epoch": 2763} {"train_loss": -44.66437911987305, "global_step": 334382, "epoch": 2763} {"train_loss": -44.41044235229492, "global_step": 334383, "epoch": 2763} {"train_loss": -44.96548080444336, "global_step": 334384, "epoch": 2763} {"train_loss": -45.07841873168945, "global_step": 334385, "epoch": 2763} {"train_loss": -45.0347785949707, "global_step": 334386, "epoch": 2763} {"train_loss": -43.596038818359375, "global_step": 334387, "epoch": 2763} {"train_loss": -44.03022003173828, "global_step": 334388, "epoch": 2763} {"train_loss": -44.09345626831055, "global_step": 334389, "epoch": 2763} {"train_loss": -44.524314880371094, "global_step": 334390, "epoch": 2763} {"train_loss": -43.88087844848633, "global_step": 334391, "epoch": 2763} {"train_loss": -43.5971794128418, "global_step": 334392, "epoch": 2763} {"train_loss": -44.51359558105469, "global_step": 334393, "epoch": 2763} {"train_loss": -43.706092834472656, "global_step": 334394, "epoch": 2763} {"train_loss": -44.126461029052734, "global_step": 334395, "epoch": 2763} {"train_loss": -43.96013259887695, "global_step": 334396, "epoch": 2763} {"train_loss": -44.85649490356445, "global_step": 334397, "epoch": 2763} {"train_loss": -43.49631881713867, "global_step": 334398, "epoch": 2763} {"train_loss": -44.11881637573242, "global_step": 334399, "epoch": 2763} {"train_loss": -44.5636100769043, "global_step": 334400, "epoch": 2763} {"train_loss": -43.69435501098633, "global_step": 334401, "epoch": 2763} {"train_loss": -44.095947265625, "global_step": 334402, "epoch": 2763} {"train_loss": -44.19091796875, "global_step": 334403, "epoch": 2763} {"train_loss": -44.581661224365234, "global_step": 334404, "epoch": 2763} {"train_loss": -44.88300704956055, "global_step": 334405, "epoch": 2763} {"train_loss": -44.778289794921875, "global_step": 334406, "epoch": 2763} {"train_loss": -44.373626708984375, "global_step": 334407, "epoch": 2763} {"train_loss": -44.59763717651367, "global_step": 334408, "epoch": 2763} {"train_loss": -43.969207763671875, "global_step": 334409, "epoch": 2763} {"train_loss": -44.44318389892578, "global_step": 334410, "epoch": 2763} {"train_loss": -44.957740783691406, "global_step": 334411, "epoch": 2763} {"train_loss": -44.238243103027344, "global_step": 334412, "epoch": 2763} {"train_loss": -44.056270599365234, "global_step": 334413, "epoch": 2763} {"train_loss": -44.84682846069336, "global_step": 334414, "epoch": 2763} {"train_loss": -44.552791595458984, "global_step": 334415, "epoch": 2763} {"train_loss": -42.794410705566406, "global_step": 334416, "epoch": 2763} {"train_loss": -44.5059700012207, "global_step": 334417, "epoch": 2763} {"train_loss": -44.30547332763672, "global_step": 334418, "epoch": 2763} {"train_loss": -43.73891830444336, "global_step": 334419, "epoch": 2763} {"train_loss": -44.63701248168945, "global_step": 334420, "epoch": 2763} {"train_loss": -43.903465270996094, "global_step": 334421, "epoch": 2763} {"train_loss": -44.15729904174805, "global_step": 334422, "epoch": 2763} {"train_loss": -44.753211975097656, "global_step": 334423, "epoch": 2763} {"train_loss": -44.4580078125, "global_step": 334424, "epoch": 2763} {"train_loss": -43.7877197265625, "global_step": 334425, "epoch": 2763} {"train_loss": -44.69388961791992, "global_step": 334426, "epoch": 2763} {"train_loss": -44.95133590698242, "global_step": 334427, "epoch": 2763} {"train_loss": -44.01533889770508, "global_step": 334428, "epoch": 2763} {"train_loss": -44.03160858154297, "global_step": 334429, "epoch": 2763} {"train_loss": -44.47067642211914, "global_step": 334430, "epoch": 2763} {"train_loss": -44.44853210449219, "global_step": 334431, "epoch": 2763} {"train_loss": -44.51753616333008, "global_step": 334432, "epoch": 2763} {"train_loss": -44.454166412353516, "global_step": 334433, "epoch": 2763} {"train_loss": -43.94709396362305, "global_step": 334434, "epoch": 2763} {"train_loss": -44.07004928588867, "global_step": 334435, "epoch": 2763} {"train_loss": -45.02790451049805, "global_step": 334436, "epoch": 2763} {"train_loss": -43.7430534362793, "global_step": 334437, "epoch": 2763} {"train_loss": -43.28690719604492, "global_step": 334438, "epoch": 2763} {"train_loss": -44.6790885925293, "global_step": 334439, "epoch": 2763} {"train_loss": -44.245243072509766, "global_step": 334440, "epoch": 2763} {"train_loss": -44.293697357177734, "global_step": 334441, "epoch": 2763} {"train_loss": -44.274986267089844, "global_step": 334442, "epoch": 2763} {"train_loss": -43.888176878621756, "global_step": 334443, "epoch": 2763, "val_loss": 2564214.5} {"train_loss": -44.46914291381836, "global_step": 334444, "epoch": 2764} {"train_loss": -43.794288635253906, "global_step": 334445, "epoch": 2764} {"train_loss": -44.759849548339844, "global_step": 334446, "epoch": 2764} {"train_loss": -44.35296630859375, "global_step": 334447, "epoch": 2764} {"train_loss": -44.0881233215332, "global_step": 334448, "epoch": 2764} {"train_loss": -43.10293197631836, "global_step": 334449, "epoch": 2764} {"train_loss": -44.0526237487793, "global_step": 334450, "epoch": 2764} {"train_loss": -42.84410858154297, "global_step": 334451, "epoch": 2764} {"train_loss": -37.40285873413086, "global_step": 334452, "epoch": 2764} {"train_loss": -40.4796257019043, "global_step": 334453, "epoch": 2764} {"train_loss": -28.512548446655273, "global_step": 334454, "epoch": 2764} {"train_loss": -17.395551681518555, "global_step": 334455, "epoch": 2764} {"train_loss": -35.08060836791992, "global_step": 334456, "epoch": 2764} {"train_loss": -18.5269718170166, "global_step": 334457, "epoch": 2764} {"train_loss": -33.105751037597656, "global_step": 334458, "epoch": 2764} {"train_loss": -23.14657211303711, "global_step": 334459, "epoch": 2764} {"train_loss": -33.29011154174805, "global_step": 334460, "epoch": 2764} {"train_loss": -31.0799617767334, "global_step": 334461, "epoch": 2764} {"train_loss": -29.473840713500977, "global_step": 334462, "epoch": 2764} {"train_loss": -35.0084114074707, "global_step": 334463, "epoch": 2764} {"train_loss": -31.768918991088867, "global_step": 334464, "epoch": 2764} {"train_loss": -33.894287109375, "global_step": 334465, "epoch": 2764} {"train_loss": -34.96498107910156, "global_step": 334466, "epoch": 2764} {"train_loss": -35.270057678222656, "global_step": 334467, "epoch": 2764} {"train_loss": -35.36442184448242, "global_step": 334468, "epoch": 2764} {"train_loss": -35.361053466796875, "global_step": 334469, "epoch": 2764} {"train_loss": -35.109066009521484, "global_step": 334470, "epoch": 2764} {"train_loss": -35.589229583740234, "global_step": 334471, "epoch": 2764} {"train_loss": -34.86307907104492, "global_step": 334472, "epoch": 2764} {"train_loss": -34.69094467163086, "global_step": 334473, "epoch": 2764} {"train_loss": -36.06927490234375, "global_step": 334474, "epoch": 2764} {"train_loss": -35.882076263427734, "global_step": 334475, "epoch": 2764} {"train_loss": -35.99776840209961, "global_step": 334476, "epoch": 2764} {"train_loss": -36.50105667114258, "global_step": 334477, "epoch": 2764} {"train_loss": -36.952003479003906, "global_step": 334478, "epoch": 2764} {"train_loss": -35.682289123535156, "global_step": 334479, "epoch": 2764} {"train_loss": -36.99039840698242, "global_step": 334480, "epoch": 2764} {"train_loss": -36.22559356689453, "global_step": 334481, "epoch": 2764} {"train_loss": -37.24274826049805, "global_step": 334482, "epoch": 2764} {"train_loss": -38.03460693359375, "global_step": 334483, "epoch": 2764} {"train_loss": -36.54933166503906, "global_step": 334484, "epoch": 2764} {"train_loss": -36.616737365722656, "global_step": 334485, "epoch": 2764} {"train_loss": -38.16506576538086, "global_step": 334486, "epoch": 2764} {"train_loss": -36.954864501953125, "global_step": 334487, "epoch": 2764} {"train_loss": -37.13204574584961, "global_step": 334488, "epoch": 2764} {"train_loss": -37.45185852050781, "global_step": 334489, "epoch": 2764} {"train_loss": -37.78036880493164, "global_step": 334490, "epoch": 2764} {"train_loss": -37.582576751708984, "global_step": 334491, "epoch": 2764} {"train_loss": -38.173213958740234, "global_step": 334492, "epoch": 2764} {"train_loss": -38.466182708740234, "global_step": 334493, "epoch": 2764} {"train_loss": -38.3873176574707, "global_step": 334494, "epoch": 2764} {"train_loss": -38.04664993286133, "global_step": 334495, "epoch": 2764} {"train_loss": -39.30009460449219, "global_step": 334496, "epoch": 2764} {"train_loss": -38.407169342041016, "global_step": 334497, "epoch": 2764} {"train_loss": -39.09777069091797, "global_step": 334498, "epoch": 2764} {"train_loss": -38.57455062866211, "global_step": 334499, "epoch": 2764} {"train_loss": -38.62723159790039, "global_step": 334500, "epoch": 2764} {"train_loss": -38.76837158203125, "global_step": 334501, "epoch": 2764} {"train_loss": -39.141754150390625, "global_step": 334502, "epoch": 2764} {"train_loss": -38.94928741455078, "global_step": 334503, "epoch": 2764} {"train_loss": -38.577430725097656, "global_step": 334504, "epoch": 2764} {"train_loss": -38.89714431762695, "global_step": 334505, "epoch": 2764} {"train_loss": -40.058441162109375, "global_step": 334506, "epoch": 2764} {"train_loss": -39.495887756347656, "global_step": 334507, "epoch": 2764} {"train_loss": -39.842041015625, "global_step": 334508, "epoch": 2764} {"train_loss": -39.650264739990234, "global_step": 334509, "epoch": 2764} {"train_loss": -39.63249969482422, "global_step": 334510, "epoch": 2764} {"train_loss": -40.2714958190918, "global_step": 334511, "epoch": 2764} {"train_loss": -40.096473693847656, "global_step": 334512, "epoch": 2764} {"train_loss": -40.334197998046875, "global_step": 334513, "epoch": 2764} {"train_loss": -40.414344787597656, "global_step": 334514, "epoch": 2764} {"train_loss": -40.79523468017578, "global_step": 334515, "epoch": 2764} {"train_loss": -40.34423065185547, "global_step": 334516, "epoch": 2764} {"train_loss": -40.31862258911133, "global_step": 334517, "epoch": 2764} {"train_loss": -40.75372314453125, "global_step": 334518, "epoch": 2764} {"train_loss": -40.38444137573242, "global_step": 334519, "epoch": 2764} {"train_loss": -40.97835159301758, "global_step": 334520, "epoch": 2764} {"train_loss": -40.36931610107422, "global_step": 334521, "epoch": 2764} {"train_loss": -40.633663177490234, "global_step": 334522, "epoch": 2764} {"train_loss": -40.9342041015625, "global_step": 334523, "epoch": 2764} {"train_loss": -41.13302993774414, "global_step": 334524, "epoch": 2764} {"train_loss": -40.98287582397461, "global_step": 334525, "epoch": 2764} {"train_loss": -41.20394515991211, "global_step": 334526, "epoch": 2764} {"train_loss": -41.14047622680664, "global_step": 334527, "epoch": 2764} {"train_loss": -41.29610824584961, "global_step": 334528, "epoch": 2764} {"train_loss": -41.73704147338867, "global_step": 334529, "epoch": 2764} {"train_loss": -41.74760055541992, "global_step": 334530, "epoch": 2764} {"train_loss": -41.118099212646484, "global_step": 334531, "epoch": 2764} {"train_loss": -41.56114196777344, "global_step": 334532, "epoch": 2764} {"train_loss": -41.00121307373047, "global_step": 334533, "epoch": 2764} {"train_loss": -40.694732666015625, "global_step": 334534, "epoch": 2764} {"train_loss": -39.099918365478516, "global_step": 334535, "epoch": 2764} {"train_loss": -39.502559661865234, "global_step": 334536, "epoch": 2764} {"train_loss": -41.7556266784668, "global_step": 334537, "epoch": 2764} {"train_loss": -40.517364501953125, "global_step": 334538, "epoch": 2764} {"train_loss": -41.142967224121094, "global_step": 334539, "epoch": 2764} {"train_loss": -41.85115432739258, "global_step": 334540, "epoch": 2764} {"train_loss": -41.592445373535156, "global_step": 334541, "epoch": 2764} {"train_loss": -41.307003021240234, "global_step": 334542, "epoch": 2764} {"train_loss": -40.96125411987305, "global_step": 334543, "epoch": 2764} {"train_loss": -41.57472610473633, "global_step": 334544, "epoch": 2764} {"train_loss": -41.60315704345703, "global_step": 334545, "epoch": 2764} {"train_loss": -41.507633209228516, "global_step": 334546, "epoch": 2764} {"train_loss": -41.62787628173828, "global_step": 334547, "epoch": 2764} {"train_loss": -41.60133361816406, "global_step": 334548, "epoch": 2764} {"train_loss": -41.918304443359375, "global_step": 334549, "epoch": 2764} {"train_loss": -42.097232818603516, "global_step": 334550, "epoch": 2764} {"train_loss": -41.85764694213867, "global_step": 334551, "epoch": 2764} {"train_loss": -42.073448181152344, "global_step": 334552, "epoch": 2764} {"train_loss": -42.855224609375, "global_step": 334553, "epoch": 2764} {"train_loss": -42.2012825012207, "global_step": 334554, "epoch": 2764} {"train_loss": -42.3014030456543, "global_step": 334555, "epoch": 2764} {"train_loss": -42.038875579833984, "global_step": 334556, "epoch": 2764} {"train_loss": -42.59526062011719, "global_step": 334557, "epoch": 2764} {"train_loss": -42.881168365478516, "global_step": 334558, "epoch": 2764} {"train_loss": -42.003204345703125, "global_step": 334559, "epoch": 2764} {"train_loss": -41.99525833129883, "global_step": 334560, "epoch": 2764} {"train_loss": -42.95037078857422, "global_step": 334561, "epoch": 2764} {"train_loss": -42.83354568481445, "global_step": 334562, "epoch": 2764} {"train_loss": -42.665184020996094, "global_step": 334563, "epoch": 2764} {"train_loss": -38.82622881172117, "global_step": 334564, "epoch": 2764, "val_loss": 2578486.75} {"train_loss": -42.87592315673828, "global_step": 334565, "epoch": 2765} {"train_loss": -42.639034271240234, "global_step": 334566, "epoch": 2765} {"train_loss": -42.20347213745117, "global_step": 334567, "epoch": 2765} {"train_loss": -40.09720993041992, "global_step": 334568, "epoch": 2765} {"train_loss": -39.812686920166016, "global_step": 334569, "epoch": 2765} {"train_loss": -42.6964225769043, "global_step": 334570, "epoch": 2765} {"train_loss": -41.623653411865234, "global_step": 334571, "epoch": 2765} {"train_loss": -40.6698112487793, "global_step": 334572, "epoch": 2765} {"train_loss": -42.77932357788086, "global_step": 334573, "epoch": 2765} {"train_loss": -40.90391540527344, "global_step": 334574, "epoch": 2765} {"train_loss": -42.995704650878906, "global_step": 334575, "epoch": 2765} {"train_loss": -40.88359069824219, "global_step": 334576, "epoch": 2765} {"train_loss": -42.898555755615234, "global_step": 334577, "epoch": 2765} {"train_loss": -42.53482437133789, "global_step": 334578, "epoch": 2765} {"train_loss": -41.944252014160156, "global_step": 334579, "epoch": 2765} {"train_loss": -42.3593864440918, "global_step": 334580, "epoch": 2765} {"train_loss": -41.058509826660156, "global_step": 334581, "epoch": 2765} {"train_loss": -42.47774887084961, "global_step": 334582, "epoch": 2765} {"train_loss": -42.32854080200195, "global_step": 334583, "epoch": 2765} {"train_loss": -43.13096237182617, "global_step": 334584, "epoch": 2765} {"train_loss": -42.28647994995117, "global_step": 334585, "epoch": 2765} {"train_loss": -42.518367767333984, "global_step": 334586, "epoch": 2765} {"train_loss": -42.358848571777344, "global_step": 334587, "epoch": 2765} {"train_loss": -43.09501266479492, "global_step": 334588, "epoch": 2765} {"train_loss": -41.99467086791992, "global_step": 334589, "epoch": 2765} {"train_loss": -41.89518356323242, "global_step": 334590, "epoch": 2765} {"train_loss": -42.3584098815918, "global_step": 334591, "epoch": 2765} {"train_loss": -43.00324630737305, "global_step": 334592, "epoch": 2765} {"train_loss": -41.7234001159668, "global_step": 334593, "epoch": 2765} {"train_loss": -42.682579040527344, "global_step": 334594, "epoch": 2765} {"train_loss": -41.98988723754883, "global_step": 334595, "epoch": 2765} {"train_loss": -41.94979476928711, "global_step": 334596, "epoch": 2765} {"train_loss": -42.186492919921875, "global_step": 334597, "epoch": 2765} {"train_loss": -41.794342041015625, "global_step": 334598, "epoch": 2765} {"train_loss": -42.341529846191406, "global_step": 334599, "epoch": 2765} {"train_loss": -42.28908920288086, "global_step": 334600, "epoch": 2765} {"train_loss": -42.710445404052734, "global_step": 334601, "epoch": 2765} {"train_loss": -42.21706008911133, "global_step": 334602, "epoch": 2765} {"train_loss": -41.6230583190918, "global_step": 334603, "epoch": 2765} {"train_loss": -42.308128356933594, "global_step": 334604, "epoch": 2765} {"train_loss": -42.4570426940918, "global_step": 334605, "epoch": 2765} {"train_loss": -41.961204528808594, "global_step": 334606, "epoch": 2765} {"train_loss": -42.47268295288086, "global_step": 334607, "epoch": 2765} {"train_loss": -42.400360107421875, "global_step": 334608, "epoch": 2765} {"train_loss": -42.77230453491211, "global_step": 334609, "epoch": 2765} {"train_loss": -42.359840393066406, "global_step": 334610, "epoch": 2765} {"train_loss": -43.09221267700195, "global_step": 334611, "epoch": 2765} {"train_loss": -41.836666107177734, "global_step": 334612, "epoch": 2765} {"train_loss": -41.43526840209961, "global_step": 334613, "epoch": 2765} {"train_loss": -42.31613540649414, "global_step": 334614, "epoch": 2765} {"train_loss": -41.54266357421875, "global_step": 334615, "epoch": 2765} {"train_loss": -42.094879150390625, "global_step": 334616, "epoch": 2765} {"train_loss": -41.089561462402344, "global_step": 334617, "epoch": 2765} {"train_loss": -40.57725524902344, "global_step": 334618, "epoch": 2765} {"train_loss": -42.32126998901367, "global_step": 334619, "epoch": 2765} {"train_loss": -40.59281539916992, "global_step": 334620, "epoch": 2765} {"train_loss": -41.05678939819336, "global_step": 334621, "epoch": 2765} {"train_loss": -42.06467056274414, "global_step": 334622, "epoch": 2765} {"train_loss": -42.034610748291016, "global_step": 334623, "epoch": 2765} {"train_loss": -42.078582763671875, "global_step": 334624, "epoch": 2765} {"train_loss": -41.79053497314453, "global_step": 334625, "epoch": 2765} {"train_loss": -40.58576202392578, "global_step": 334626, "epoch": 2765} {"train_loss": -42.930789947509766, "global_step": 334627, "epoch": 2765} {"train_loss": -41.91130065917969, "global_step": 334628, "epoch": 2765} {"train_loss": -42.00236511230469, "global_step": 334629, "epoch": 2765} {"train_loss": -42.360103607177734, "global_step": 334630, "epoch": 2765} {"train_loss": -38.81507110595703, "global_step": 334631, "epoch": 2765} {"train_loss": -41.67631149291992, "global_step": 334632, "epoch": 2765} {"train_loss": -42.3148307800293, "global_step": 334633, "epoch": 2765} {"train_loss": -41.8308219909668, "global_step": 334634, "epoch": 2765} {"train_loss": -43.17216873168945, "global_step": 334635, "epoch": 2765} {"train_loss": -42.2343635559082, "global_step": 334636, "epoch": 2765} {"train_loss": -42.28125762939453, "global_step": 334637, "epoch": 2765} {"train_loss": -39.050323486328125, "global_step": 334638, "epoch": 2765} {"train_loss": -43.010986328125, "global_step": 334639, "epoch": 2765} {"train_loss": -41.9737434387207, "global_step": 334640, "epoch": 2765} {"train_loss": -42.0609245300293, "global_step": 334641, "epoch": 2765} {"train_loss": -42.748958587646484, "global_step": 334642, "epoch": 2765} {"train_loss": -42.89467239379883, "global_step": 334643, "epoch": 2765} {"train_loss": -42.37518310546875, "global_step": 334644, "epoch": 2765} {"train_loss": -42.64407730102539, "global_step": 334645, "epoch": 2765} {"train_loss": -42.03374481201172, "global_step": 334646, "epoch": 2765} {"train_loss": -41.25600051879883, "global_step": 334647, "epoch": 2765} {"train_loss": -42.815635681152344, "global_step": 334648, "epoch": 2765} {"train_loss": -42.9800910949707, "global_step": 334649, "epoch": 2765} {"train_loss": -43.45070266723633, "global_step": 334650, "epoch": 2765} {"train_loss": -38.24992752075195, "global_step": 334651, "epoch": 2765} {"train_loss": -42.54594039916992, "global_step": 334652, "epoch": 2765} {"train_loss": -43.1311149597168, "global_step": 334653, "epoch": 2765} {"train_loss": -42.441463470458984, "global_step": 334654, "epoch": 2765} {"train_loss": -42.08381652832031, "global_step": 334655, "epoch": 2765} {"train_loss": -42.32133865356445, "global_step": 334656, "epoch": 2765} {"train_loss": -38.71568298339844, "global_step": 334657, "epoch": 2765} {"train_loss": -38.59519577026367, "global_step": 334658, "epoch": 2765} {"train_loss": -42.36359786987305, "global_step": 334659, "epoch": 2765} {"train_loss": -40.082027435302734, "global_step": 334660, "epoch": 2765} {"train_loss": -42.96760940551758, "global_step": 334661, "epoch": 2765} {"train_loss": -36.467063903808594, "global_step": 334662, "epoch": 2765} {"train_loss": -42.3766975402832, "global_step": 334663, "epoch": 2765} {"train_loss": -30.922306060791016, "global_step": 334664, "epoch": 2765} {"train_loss": -34.094764709472656, "global_step": 334665, "epoch": 2765} {"train_loss": -36.21326446533203, "global_step": 334666, "epoch": 2765} {"train_loss": -40.93833541870117, "global_step": 334667, "epoch": 2765} {"train_loss": -35.8608512878418, "global_step": 334668, "epoch": 2765} {"train_loss": -40.358638763427734, "global_step": 334669, "epoch": 2765} {"train_loss": -39.85990524291992, "global_step": 334670, "epoch": 2765} {"train_loss": -41.86371612548828, "global_step": 334671, "epoch": 2765} {"train_loss": -33.8436164855957, "global_step": 334672, "epoch": 2765} {"train_loss": -37.97907257080078, "global_step": 334673, "epoch": 2765} {"train_loss": -40.71107864379883, "global_step": 334674, "epoch": 2765} {"train_loss": -38.86933898925781, "global_step": 334675, "epoch": 2765} {"train_loss": -39.8685188293457, "global_step": 334676, "epoch": 2765} {"train_loss": -39.83275604248047, "global_step": 334677, "epoch": 2765} {"train_loss": -40.157958984375, "global_step": 334678, "epoch": 2765} {"train_loss": -38.04756546020508, "global_step": 334679, "epoch": 2765} {"train_loss": -40.182891845703125, "global_step": 334680, "epoch": 2765} {"train_loss": -40.1579704284668, "global_step": 334681, "epoch": 2765} {"train_loss": -39.428035736083984, "global_step": 334682, "epoch": 2765} {"train_loss": -35.600433349609375, "global_step": 334683, "epoch": 2765} {"train_loss": -37.99872589111328, "global_step": 334684, "epoch": 2765} {"train_loss": -41.24693077654878, "global_step": 334685, "epoch": 2765, "val_loss": 4102178.75} {"train_loss": -39.04837417602539, "global_step": 334686, "epoch": 2766} {"train_loss": -40.057289123535156, "global_step": 334687, "epoch": 2766} {"train_loss": -36.39707565307617, "global_step": 334688, "epoch": 2766} {"train_loss": -39.96633529663086, "global_step": 334689, "epoch": 2766} {"train_loss": -40.09139633178711, "global_step": 334690, "epoch": 2766} {"train_loss": -40.99941635131836, "global_step": 334691, "epoch": 2766} {"train_loss": -40.573883056640625, "global_step": 334692, "epoch": 2766} {"train_loss": -36.41219711303711, "global_step": 334693, "epoch": 2766} {"train_loss": -41.1609992980957, "global_step": 334694, "epoch": 2766} {"train_loss": -40.73051834106445, "global_step": 334695, "epoch": 2766} {"train_loss": -39.46770095825195, "global_step": 334696, "epoch": 2766} {"train_loss": -39.90346145629883, "global_step": 334697, "epoch": 2766} {"train_loss": -39.305992126464844, "global_step": 334698, "epoch": 2766} {"train_loss": -39.728214263916016, "global_step": 334699, "epoch": 2766} {"train_loss": -40.406211853027344, "global_step": 334700, "epoch": 2766} {"train_loss": -39.23588180541992, "global_step": 334701, "epoch": 2766} {"train_loss": -38.464542388916016, "global_step": 334702, "epoch": 2766} {"train_loss": -40.94706344604492, "global_step": 334703, "epoch": 2766} {"train_loss": -39.36617660522461, "global_step": 334704, "epoch": 2766} {"train_loss": -40.295169830322266, "global_step": 334705, "epoch": 2766} {"train_loss": -38.258487701416016, "global_step": 334706, "epoch": 2766} {"train_loss": -39.128055572509766, "global_step": 334707, "epoch": 2766} {"train_loss": -39.5688362121582, "global_step": 334708, "epoch": 2766} {"train_loss": -41.35951614379883, "global_step": 334709, "epoch": 2766} {"train_loss": -39.592140197753906, "global_step": 334710, "epoch": 2766} {"train_loss": -40.57789611816406, "global_step": 334711, "epoch": 2766} {"train_loss": -40.82790756225586, "global_step": 334712, "epoch": 2766} {"train_loss": -41.36025619506836, "global_step": 334713, "epoch": 2766} {"train_loss": -40.72031021118164, "global_step": 334714, "epoch": 2766} {"train_loss": -40.81508255004883, "global_step": 334715, "epoch": 2766} {"train_loss": -42.598785400390625, "global_step": 334716, "epoch": 2766} {"train_loss": -41.79226303100586, "global_step": 334717, "epoch": 2766} {"train_loss": -42.264854431152344, "global_step": 334718, "epoch": 2766} {"train_loss": -39.96230697631836, "global_step": 334719, "epoch": 2766} {"train_loss": -41.937320709228516, "global_step": 334720, "epoch": 2766} {"train_loss": -42.456939697265625, "global_step": 334721, "epoch": 2766} {"train_loss": -42.056026458740234, "global_step": 334722, "epoch": 2766} {"train_loss": -43.08379364013672, "global_step": 334723, "epoch": 2766} {"train_loss": -42.0819091796875, "global_step": 334724, "epoch": 2766} {"train_loss": -41.96413803100586, "global_step": 334725, "epoch": 2766} {"train_loss": -41.77737045288086, "global_step": 334726, "epoch": 2766} {"train_loss": -42.05404281616211, "global_step": 334727, "epoch": 2766} {"train_loss": -41.813655853271484, "global_step": 334728, "epoch": 2766} {"train_loss": -42.1326904296875, "global_step": 334729, "epoch": 2766} {"train_loss": -42.02186965942383, "global_step": 334730, "epoch": 2766} {"train_loss": -41.555641174316406, "global_step": 334731, "epoch": 2766} {"train_loss": -42.790191650390625, "global_step": 334732, "epoch": 2766} {"train_loss": -42.249176025390625, "global_step": 334733, "epoch": 2766} {"train_loss": -42.467201232910156, "global_step": 334734, "epoch": 2766} {"train_loss": -43.129764556884766, "global_step": 334735, "epoch": 2766} {"train_loss": -42.93124008178711, "global_step": 334736, "epoch": 2766} {"train_loss": -42.19344711303711, "global_step": 334737, "epoch": 2766} {"train_loss": -43.73969268798828, "global_step": 334738, "epoch": 2766} {"train_loss": -43.79714584350586, "global_step": 334739, "epoch": 2766} {"train_loss": -42.54085159301758, "global_step": 334740, "epoch": 2766} {"train_loss": -43.284786224365234, "global_step": 334741, "epoch": 2766} {"train_loss": -43.032962799072266, "global_step": 334742, "epoch": 2766} {"train_loss": -43.33973693847656, "global_step": 334743, "epoch": 2766} {"train_loss": -43.77272415161133, "global_step": 334744, "epoch": 2766} {"train_loss": -42.562984466552734, "global_step": 334745, "epoch": 2766} {"train_loss": -43.20735549926758, "global_step": 334746, "epoch": 2766} {"train_loss": -43.418212890625, "global_step": 334747, "epoch": 2766} {"train_loss": -43.435279846191406, "global_step": 334748, "epoch": 2766} {"train_loss": -43.03657150268555, "global_step": 334749, "epoch": 2766} {"train_loss": -43.18679428100586, "global_step": 334750, "epoch": 2766} {"train_loss": -42.56629943847656, "global_step": 334751, "epoch": 2766} {"train_loss": -43.22142028808594, "global_step": 334752, "epoch": 2766} {"train_loss": -43.31425094604492, "global_step": 334753, "epoch": 2766} {"train_loss": -43.99701690673828, "global_step": 334754, "epoch": 2766} {"train_loss": -42.19733810424805, "global_step": 334755, "epoch": 2766} {"train_loss": -44.35861587524414, "global_step": 334756, "epoch": 2766} {"train_loss": -42.73972702026367, "global_step": 334757, "epoch": 2766} {"train_loss": -44.39710235595703, "global_step": 334758, "epoch": 2766} {"train_loss": -43.579708099365234, "global_step": 334759, "epoch": 2766} {"train_loss": -43.372737884521484, "global_step": 334760, "epoch": 2766} {"train_loss": -43.575469970703125, "global_step": 334761, "epoch": 2766} {"train_loss": -43.22199249267578, "global_step": 334762, "epoch": 2766} {"train_loss": -43.108158111572266, "global_step": 334763, "epoch": 2766} {"train_loss": -39.68023681640625, "global_step": 334764, "epoch": 2766} {"train_loss": -44.139747619628906, "global_step": 334765, "epoch": 2766} {"train_loss": -43.676971435546875, "global_step": 334766, "epoch": 2766} {"train_loss": -44.28246307373047, "global_step": 334767, "epoch": 2766} {"train_loss": -43.511756896972656, "global_step": 334768, "epoch": 2766} {"train_loss": -43.604225158691406, "global_step": 334769, "epoch": 2766} {"train_loss": -42.178524017333984, "global_step": 334770, "epoch": 2766} {"train_loss": -44.45122528076172, "global_step": 334771, "epoch": 2766} {"train_loss": -42.006996154785156, "global_step": 334772, "epoch": 2766} {"train_loss": -43.8975715637207, "global_step": 334773, "epoch": 2766} {"train_loss": -43.306888580322266, "global_step": 334774, "epoch": 2766} {"train_loss": -44.25484085083008, "global_step": 334775, "epoch": 2766} {"train_loss": -43.20907211303711, "global_step": 334776, "epoch": 2766} {"train_loss": -43.1906852722168, "global_step": 334777, "epoch": 2766} {"train_loss": -43.30451583862305, "global_step": 334778, "epoch": 2766} {"train_loss": -44.372108459472656, "global_step": 334779, "epoch": 2766} {"train_loss": -43.14324951171875, "global_step": 334780, "epoch": 2766} {"train_loss": -43.8265380859375, "global_step": 334781, "epoch": 2766} {"train_loss": -43.287349700927734, "global_step": 334782, "epoch": 2766} {"train_loss": -43.76680374145508, "global_step": 334783, "epoch": 2766} {"train_loss": -42.99934768676758, "global_step": 334784, "epoch": 2766} {"train_loss": -43.64007568359375, "global_step": 334785, "epoch": 2766} {"train_loss": -44.06737518310547, "global_step": 334786, "epoch": 2766} {"train_loss": -42.767578125, "global_step": 334787, "epoch": 2766} {"train_loss": -42.92292785644531, "global_step": 334788, "epoch": 2766} {"train_loss": -43.211769104003906, "global_step": 334789, "epoch": 2766} {"train_loss": -42.54792022705078, "global_step": 334790, "epoch": 2766} {"train_loss": -44.01640701293945, "global_step": 334791, "epoch": 2766} {"train_loss": -42.58368682861328, "global_step": 334792, "epoch": 2766} {"train_loss": -43.83096694946289, "global_step": 334793, "epoch": 2766} {"train_loss": -43.660823822021484, "global_step": 334794, "epoch": 2766} {"train_loss": -42.447235107421875, "global_step": 334795, "epoch": 2766} {"train_loss": -43.660396575927734, "global_step": 334796, "epoch": 2766} {"train_loss": -40.03623580932617, "global_step": 334797, "epoch": 2766} {"train_loss": -40.69028854370117, "global_step": 334798, "epoch": 2766} {"train_loss": -41.0120735168457, "global_step": 334799, "epoch": 2766} {"train_loss": -40.14205551147461, "global_step": 334800, "epoch": 2766} {"train_loss": -40.841670989990234, "global_step": 334801, "epoch": 2766} {"train_loss": -40.546485900878906, "global_step": 334802, "epoch": 2766} {"train_loss": -40.94026184082031, "global_step": 334803, "epoch": 2766} {"train_loss": -41.39580535888672, "global_step": 334804, "epoch": 2766} {"train_loss": -40.5157585144043, "global_step": 334805, "epoch": 2766} {"train_loss": -42.013000046911316, "global_step": 334806, "epoch": 2766, "val_loss": 2694016.25} {"train_loss": -40.53015899658203, "global_step": 334807, "epoch": 2767} {"train_loss": -39.98310089111328, "global_step": 334808, "epoch": 2767} {"train_loss": -40.38259506225586, "global_step": 334809, "epoch": 2767} {"train_loss": -40.455936431884766, "global_step": 334810, "epoch": 2767} {"train_loss": -38.35040283203125, "global_step": 334811, "epoch": 2767} {"train_loss": -38.793251037597656, "global_step": 334812, "epoch": 2767} {"train_loss": -41.143043518066406, "global_step": 334813, "epoch": 2767} {"train_loss": -40.255592346191406, "global_step": 334814, "epoch": 2767} {"train_loss": -40.64008331298828, "global_step": 334815, "epoch": 2767} {"train_loss": -40.92171096801758, "global_step": 334816, "epoch": 2767} {"train_loss": -40.0456428527832, "global_step": 334817, "epoch": 2767} {"train_loss": -41.35560607910156, "global_step": 334818, "epoch": 2767} {"train_loss": -40.28898239135742, "global_step": 334819, "epoch": 2767} {"train_loss": -41.56216049194336, "global_step": 334820, "epoch": 2767} {"train_loss": -40.823341369628906, "global_step": 334821, "epoch": 2767} {"train_loss": -41.08626937866211, "global_step": 334822, "epoch": 2767} {"train_loss": -41.5341911315918, "global_step": 334823, "epoch": 2767} {"train_loss": -41.81427764892578, "global_step": 334824, "epoch": 2767} {"train_loss": -41.3460807800293, "global_step": 334825, "epoch": 2767} {"train_loss": -42.37758255004883, "global_step": 334826, "epoch": 2767} {"train_loss": -41.27531051635742, "global_step": 334827, "epoch": 2767} {"train_loss": -42.45374298095703, "global_step": 334828, "epoch": 2767} {"train_loss": -41.99490737915039, "global_step": 334829, "epoch": 2767} {"train_loss": -42.0277214050293, "global_step": 334830, "epoch": 2767} {"train_loss": -41.637840270996094, "global_step": 334831, "epoch": 2767} {"train_loss": -42.95626449584961, "global_step": 334832, "epoch": 2767} {"train_loss": -42.67985153198242, "global_step": 334833, "epoch": 2767} {"train_loss": -43.70945358276367, "global_step": 334834, "epoch": 2767} {"train_loss": -42.66109848022461, "global_step": 334835, "epoch": 2767} {"train_loss": -42.635807037353516, "global_step": 334836, "epoch": 2767} {"train_loss": -42.92153549194336, "global_step": 334837, "epoch": 2767} {"train_loss": -42.992313385009766, "global_step": 334838, "epoch": 2767} {"train_loss": -43.48362350463867, "global_step": 334839, "epoch": 2767} {"train_loss": -43.12489700317383, "global_step": 334840, "epoch": 2767} {"train_loss": -42.14362716674805, "global_step": 334841, "epoch": 2767} {"train_loss": -43.440277099609375, "global_step": 334842, "epoch": 2767} {"train_loss": -40.36345291137695, "global_step": 334843, "epoch": 2767} {"train_loss": -42.50334548950195, "global_step": 334844, "epoch": 2767} {"train_loss": -40.535152435302734, "global_step": 334845, "epoch": 2767} {"train_loss": -40.42646408081055, "global_step": 334846, "epoch": 2767} {"train_loss": -41.94443130493164, "global_step": 334847, "epoch": 2767} {"train_loss": -43.60836410522461, "global_step": 334848, "epoch": 2767} {"train_loss": -40.399776458740234, "global_step": 334849, "epoch": 2767} {"train_loss": -42.24037551879883, "global_step": 334850, "epoch": 2767} {"train_loss": -42.72591018676758, "global_step": 334851, "epoch": 2767} {"train_loss": -43.09628677368164, "global_step": 334852, "epoch": 2767} {"train_loss": -41.55524826049805, "global_step": 334853, "epoch": 2767} {"train_loss": -42.9826774597168, "global_step": 334854, "epoch": 2767} {"train_loss": -40.537837982177734, "global_step": 334855, "epoch": 2767} {"train_loss": -40.69477081298828, "global_step": 334856, "epoch": 2767} {"train_loss": -42.079803466796875, "global_step": 334857, "epoch": 2767} {"train_loss": -40.3500862121582, "global_step": 334858, "epoch": 2767} {"train_loss": -41.87592697143555, "global_step": 334859, "epoch": 2767} {"train_loss": -41.137489318847656, "global_step": 334860, "epoch": 2767} {"train_loss": -41.580841064453125, "global_step": 334861, "epoch": 2767} {"train_loss": -41.12984085083008, "global_step": 334862, "epoch": 2767} {"train_loss": -42.564571380615234, "global_step": 334863, "epoch": 2767} {"train_loss": -42.42713165283203, "global_step": 334864, "epoch": 2767} {"train_loss": -41.9268684387207, "global_step": 334865, "epoch": 2767} {"train_loss": -43.09758377075195, "global_step": 334866, "epoch": 2767} {"train_loss": -42.772518157958984, "global_step": 334867, "epoch": 2767} {"train_loss": -42.13004684448242, "global_step": 334868, "epoch": 2767} {"train_loss": -43.13182067871094, "global_step": 334869, "epoch": 2767} {"train_loss": -42.28788375854492, "global_step": 334870, "epoch": 2767} {"train_loss": -42.22829055786133, "global_step": 334871, "epoch": 2767} {"train_loss": -42.457923889160156, "global_step": 334872, "epoch": 2767} {"train_loss": -42.162193298339844, "global_step": 334873, "epoch": 2767} {"train_loss": -43.17295455932617, "global_step": 334874, "epoch": 2767} {"train_loss": -42.56329345703125, "global_step": 334875, "epoch": 2767} {"train_loss": -43.35023498535156, "global_step": 334876, "epoch": 2767} {"train_loss": -42.32535934448242, "global_step": 334877, "epoch": 2767} {"train_loss": -43.063018798828125, "global_step": 334878, "epoch": 2767} {"train_loss": -42.52716064453125, "global_step": 334879, "epoch": 2767} {"train_loss": -44.130348205566406, "global_step": 334880, "epoch": 2767} {"train_loss": -42.43097686767578, "global_step": 334881, "epoch": 2767} {"train_loss": -43.33185577392578, "global_step": 334882, "epoch": 2767} {"train_loss": -42.88112258911133, "global_step": 334883, "epoch": 2767} {"train_loss": -41.36249923706055, "global_step": 334884, "epoch": 2767} {"train_loss": -43.02104568481445, "global_step": 334885, "epoch": 2767} {"train_loss": -42.99812698364258, "global_step": 334886, "epoch": 2767} {"train_loss": -42.79014205932617, "global_step": 334887, "epoch": 2767} {"train_loss": -43.15668869018555, "global_step": 334888, "epoch": 2767} {"train_loss": -43.739845275878906, "global_step": 334889, "epoch": 2767} {"train_loss": -41.809532165527344, "global_step": 334890, "epoch": 2767} {"train_loss": -43.249019622802734, "global_step": 334891, "epoch": 2767} {"train_loss": -42.464107513427734, "global_step": 334892, "epoch": 2767} {"train_loss": -43.403594970703125, "global_step": 334893, "epoch": 2767} {"train_loss": -42.67728805541992, "global_step": 334894, "epoch": 2767} {"train_loss": -43.48653030395508, "global_step": 334895, "epoch": 2767} {"train_loss": -43.55021286010742, "global_step": 334896, "epoch": 2767} {"train_loss": -43.89683151245117, "global_step": 334897, "epoch": 2767} {"train_loss": -42.8773307800293, "global_step": 334898, "epoch": 2767} {"train_loss": -43.50989532470703, "global_step": 334899, "epoch": 2767} {"train_loss": -43.71622085571289, "global_step": 334900, "epoch": 2767} {"train_loss": -43.01980209350586, "global_step": 334901, "epoch": 2767} {"train_loss": -41.98037338256836, "global_step": 334902, "epoch": 2767} {"train_loss": -43.37241744995117, "global_step": 334903, "epoch": 2767} {"train_loss": -43.50175094604492, "global_step": 334904, "epoch": 2767} {"train_loss": -43.11408615112305, "global_step": 334905, "epoch": 2767} {"train_loss": -43.13777160644531, "global_step": 334906, "epoch": 2767} {"train_loss": -44.034828186035156, "global_step": 334907, "epoch": 2767} {"train_loss": -43.88755798339844, "global_step": 334908, "epoch": 2767} {"train_loss": -42.947792053222656, "global_step": 334909, "epoch": 2767} {"train_loss": -43.66738510131836, "global_step": 334910, "epoch": 2767} {"train_loss": -42.95387649536133, "global_step": 334911, "epoch": 2767} {"train_loss": -43.01244354248047, "global_step": 334912, "epoch": 2767} {"train_loss": -42.99799728393555, "global_step": 334913, "epoch": 2767} {"train_loss": -43.87734603881836, "global_step": 334914, "epoch": 2767} {"train_loss": -43.77008819580078, "global_step": 334915, "epoch": 2767} {"train_loss": -43.57343673706055, "global_step": 334916, "epoch": 2767} {"train_loss": -43.98826217651367, "global_step": 334917, "epoch": 2767} {"train_loss": -42.971004486083984, "global_step": 334918, "epoch": 2767} {"train_loss": -43.3631591796875, "global_step": 334919, "epoch": 2767} {"train_loss": -43.770904541015625, "global_step": 334920, "epoch": 2767} {"train_loss": -43.162593841552734, "global_step": 334921, "epoch": 2767} {"train_loss": -43.47473907470703, "global_step": 334922, "epoch": 2767} {"train_loss": -43.57624053955078, "global_step": 334923, "epoch": 2767} {"train_loss": -44.304927825927734, "global_step": 334924, "epoch": 2767} {"train_loss": -43.75541305541992, "global_step": 334925, "epoch": 2767} {"train_loss": -44.20784378051758, "global_step": 334926, "epoch": 2767} {"train_loss": -42.38487568374508, "global_step": 334927, "epoch": 2767, "val_loss": 2515808.5} {"train_loss": -44.243873596191406, "global_step": 334928, "epoch": 2768} {"train_loss": -43.81275177001953, "global_step": 334929, "epoch": 2768} {"train_loss": -44.23110580444336, "global_step": 334930, "epoch": 2768} {"train_loss": -44.340919494628906, "global_step": 334931, "epoch": 2768} {"train_loss": -43.24589920043945, "global_step": 334932, "epoch": 2768} {"train_loss": -44.66437911987305, "global_step": 334933, "epoch": 2768} {"train_loss": -41.486141204833984, "global_step": 334934, "epoch": 2768} {"train_loss": -41.432613372802734, "global_step": 334935, "epoch": 2768} {"train_loss": -42.30295944213867, "global_step": 334936, "epoch": 2768} {"train_loss": -41.293724060058594, "global_step": 334937, "epoch": 2768} {"train_loss": -42.664283752441406, "global_step": 334938, "epoch": 2768} {"train_loss": -41.38546371459961, "global_step": 334939, "epoch": 2768} {"train_loss": -42.771583557128906, "global_step": 334940, "epoch": 2768} {"train_loss": -40.19411849975586, "global_step": 334941, "epoch": 2768} {"train_loss": -41.690059661865234, "global_step": 334942, "epoch": 2768} {"train_loss": -41.652645111083984, "global_step": 334943, "epoch": 2768} {"train_loss": -43.82833480834961, "global_step": 334944, "epoch": 2768} {"train_loss": -41.14060592651367, "global_step": 334945, "epoch": 2768} {"train_loss": -42.871742248535156, "global_step": 334946, "epoch": 2768} {"train_loss": -42.5941162109375, "global_step": 334947, "epoch": 2768} {"train_loss": -42.29480743408203, "global_step": 334948, "epoch": 2768} {"train_loss": -42.83637619018555, "global_step": 334949, "epoch": 2768} {"train_loss": -42.55588150024414, "global_step": 334950, "epoch": 2768} {"train_loss": -42.93376541137695, "global_step": 334951, "epoch": 2768} {"train_loss": -42.282630920410156, "global_step": 334952, "epoch": 2768} {"train_loss": -43.82827377319336, "global_step": 334953, "epoch": 2768} {"train_loss": -41.769535064697266, "global_step": 334954, "epoch": 2768} {"train_loss": -43.3233642578125, "global_step": 334955, "epoch": 2768} {"train_loss": -42.928382873535156, "global_step": 334956, "epoch": 2768} {"train_loss": -44.15852737426758, "global_step": 334957, "epoch": 2768} {"train_loss": -43.52159881591797, "global_step": 334958, "epoch": 2768} {"train_loss": -43.28106689453125, "global_step": 334959, "epoch": 2768} {"train_loss": -43.76670455932617, "global_step": 334960, "epoch": 2768} {"train_loss": -42.50748825073242, "global_step": 334961, "epoch": 2768} {"train_loss": -42.66789627075195, "global_step": 334962, "epoch": 2768} {"train_loss": -41.710208892822266, "global_step": 334963, "epoch": 2768} {"train_loss": -42.87865447998047, "global_step": 334964, "epoch": 2768} {"train_loss": -41.7908821105957, "global_step": 334965, "epoch": 2768} {"train_loss": -41.72732162475586, "global_step": 334966, "epoch": 2768} {"train_loss": -42.581092834472656, "global_step": 334967, "epoch": 2768} {"train_loss": -41.7362174987793, "global_step": 334968, "epoch": 2768} {"train_loss": -42.037025451660156, "global_step": 334969, "epoch": 2768} {"train_loss": -43.351253509521484, "global_step": 334970, "epoch": 2768} {"train_loss": -42.02016067504883, "global_step": 334971, "epoch": 2768} {"train_loss": -43.69554901123047, "global_step": 334972, "epoch": 2768} {"train_loss": -41.99135971069336, "global_step": 334973, "epoch": 2768} {"train_loss": -43.738460540771484, "global_step": 334974, "epoch": 2768} {"train_loss": -43.54620361328125, "global_step": 334975, "epoch": 2768} {"train_loss": -43.12091827392578, "global_step": 334976, "epoch": 2768} {"train_loss": -42.9478874206543, "global_step": 334977, "epoch": 2768} {"train_loss": -43.112483978271484, "global_step": 334978, "epoch": 2768} {"train_loss": -44.013614654541016, "global_step": 334979, "epoch": 2768} {"train_loss": -43.292152404785156, "global_step": 334980, "epoch": 2768} {"train_loss": -43.8707389831543, "global_step": 334981, "epoch": 2768} {"train_loss": -43.94585037231445, "global_step": 334982, "epoch": 2768} {"train_loss": -42.7694091796875, "global_step": 334983, "epoch": 2768} {"train_loss": -43.51856994628906, "global_step": 334984, "epoch": 2768} {"train_loss": -43.299400329589844, "global_step": 334985, "epoch": 2768} {"train_loss": -43.78700637817383, "global_step": 334986, "epoch": 2768} {"train_loss": -43.2495002746582, "global_step": 334987, "epoch": 2768} {"train_loss": -43.89020538330078, "global_step": 334988, "epoch": 2768} {"train_loss": -42.3236198425293, "global_step": 334989, "epoch": 2768} {"train_loss": -44.135250091552734, "global_step": 334990, "epoch": 2768} {"train_loss": -43.44475173950195, "global_step": 334991, "epoch": 2768} {"train_loss": -44.409912109375, "global_step": 334992, "epoch": 2768} {"train_loss": -43.94491195678711, "global_step": 334993, "epoch": 2768} {"train_loss": -43.778724670410156, "global_step": 334994, "epoch": 2768} {"train_loss": -44.17966079711914, "global_step": 334995, "epoch": 2768} {"train_loss": -44.41167068481445, "global_step": 334996, "epoch": 2768} {"train_loss": -43.73705291748047, "global_step": 334997, "epoch": 2768} {"train_loss": -43.95418930053711, "global_step": 334998, "epoch": 2768} {"train_loss": -43.65134048461914, "global_step": 334999, "epoch": 2768} {"train_loss": -43.98914337158203, "global_step": 335000, "epoch": 2768} {"train_loss": -43.8089599609375, "global_step": 335001, "epoch": 2768} {"train_loss": -44.424049377441406, "global_step": 335002, "epoch": 2768} {"train_loss": -32.670448303222656, "global_step": 335003, "epoch": 2768} {"train_loss": -44.419307708740234, "global_step": 335004, "epoch": 2768} {"train_loss": -42.57882308959961, "global_step": 335005, "epoch": 2768} {"train_loss": -43.40888977050781, "global_step": 335006, "epoch": 2768} {"train_loss": -44.507076263427734, "global_step": 335007, "epoch": 2768} {"train_loss": -44.2014274597168, "global_step": 335008, "epoch": 2768} {"train_loss": -43.79524612426758, "global_step": 335009, "epoch": 2768} {"train_loss": -42.497215270996094, "global_step": 335010, "epoch": 2768} {"train_loss": -43.837181091308594, "global_step": 335011, "epoch": 2768} {"train_loss": -41.164485931396484, "global_step": 335012, "epoch": 2768} {"train_loss": -44.01674270629883, "global_step": 335013, "epoch": 2768} {"train_loss": -42.18464279174805, "global_step": 335014, "epoch": 2768} {"train_loss": -44.58177185058594, "global_step": 335015, "epoch": 2768} {"train_loss": -42.82261276245117, "global_step": 335016, "epoch": 2768} {"train_loss": -44.30327606201172, "global_step": 335017, "epoch": 2768} {"train_loss": -43.59015655517578, "global_step": 335018, "epoch": 2768} {"train_loss": -42.452205657958984, "global_step": 335019, "epoch": 2768} {"train_loss": -42.86777877807617, "global_step": 335020, "epoch": 2768} {"train_loss": -43.60111999511719, "global_step": 335021, "epoch": 2768} {"train_loss": -44.335174560546875, "global_step": 335022, "epoch": 2768} {"train_loss": -43.811283111572266, "global_step": 335023, "epoch": 2768} {"train_loss": -43.6450309753418, "global_step": 335024, "epoch": 2768} {"train_loss": -43.5584602355957, "global_step": 335025, "epoch": 2768} {"train_loss": -42.96205139160156, "global_step": 335026, "epoch": 2768} {"train_loss": -43.891963958740234, "global_step": 335027, "epoch": 2768} {"train_loss": -42.43102264404297, "global_step": 335028, "epoch": 2768} {"train_loss": -43.6981201171875, "global_step": 335029, "epoch": 2768} {"train_loss": -41.80241012573242, "global_step": 335030, "epoch": 2768} {"train_loss": -43.157012939453125, "global_step": 335031, "epoch": 2768} {"train_loss": -42.47488021850586, "global_step": 335032, "epoch": 2768} {"train_loss": -42.90239715576172, "global_step": 335033, "epoch": 2768} {"train_loss": -40.9606819152832, "global_step": 335034, "epoch": 2768} {"train_loss": -42.559513092041016, "global_step": 335035, "epoch": 2768} {"train_loss": -41.58002853393555, "global_step": 335036, "epoch": 2768} {"train_loss": -42.143348693847656, "global_step": 335037, "epoch": 2768} {"train_loss": -42.54977035522461, "global_step": 335038, "epoch": 2768} {"train_loss": -42.94617462158203, "global_step": 335039, "epoch": 2768} {"train_loss": -43.33036804199219, "global_step": 335040, "epoch": 2768} {"train_loss": -41.86353302001953, "global_step": 335041, "epoch": 2768} {"train_loss": -43.3202018737793, "global_step": 335042, "epoch": 2768} {"train_loss": -42.7794303894043, "global_step": 335043, "epoch": 2768} {"train_loss": -42.21440887451172, "global_step": 335044, "epoch": 2768} {"train_loss": -43.17122268676758, "global_step": 335045, "epoch": 2768} {"train_loss": -42.2796630859375, "global_step": 335046, "epoch": 2768} {"train_loss": -42.75415802001953, "global_step": 335047, "epoch": 2768} {"train_loss": -42.96266530564994, "global_step": 335048, "epoch": 2768, "val_loss": 2547164.5} {"train_loss": -43.33663558959961, "global_step": 335049, "epoch": 2769} {"train_loss": -42.08677291870117, "global_step": 335050, "epoch": 2769} {"train_loss": -41.65637969970703, "global_step": 335051, "epoch": 2769} {"train_loss": -43.036190032958984, "global_step": 335052, "epoch": 2769} {"train_loss": -40.322540283203125, "global_step": 335053, "epoch": 2769} {"train_loss": -42.30327606201172, "global_step": 335054, "epoch": 2769} {"train_loss": -42.802520751953125, "global_step": 335055, "epoch": 2769} {"train_loss": -42.25447082519531, "global_step": 335056, "epoch": 2769} {"train_loss": -43.20772933959961, "global_step": 335057, "epoch": 2769} {"train_loss": -42.46257019042969, "global_step": 335058, "epoch": 2769} {"train_loss": -43.28208541870117, "global_step": 335059, "epoch": 2769} {"train_loss": -42.225196838378906, "global_step": 335060, "epoch": 2769} {"train_loss": -43.11313247680664, "global_step": 335061, "epoch": 2769} {"train_loss": -42.77705764770508, "global_step": 335062, "epoch": 2769} {"train_loss": -42.82085418701172, "global_step": 335063, "epoch": 2769} {"train_loss": -44.643184661865234, "global_step": 335064, "epoch": 2769} {"train_loss": -43.27516555786133, "global_step": 335065, "epoch": 2769} {"train_loss": -43.60129928588867, "global_step": 335066, "epoch": 2769} {"train_loss": -43.73911666870117, "global_step": 335067, "epoch": 2769} {"train_loss": -43.50771713256836, "global_step": 335068, "epoch": 2769} {"train_loss": -43.98862075805664, "global_step": 335069, "epoch": 2769} {"train_loss": -43.63123321533203, "global_step": 335070, "epoch": 2769} {"train_loss": -43.721099853515625, "global_step": 335071, "epoch": 2769} {"train_loss": -44.66037368774414, "global_step": 335072, "epoch": 2769} {"train_loss": -44.24436569213867, "global_step": 335073, "epoch": 2769} {"train_loss": -42.582523345947266, "global_step": 335074, "epoch": 2769} {"train_loss": -44.512203216552734, "global_step": 335075, "epoch": 2769} {"train_loss": -42.68233871459961, "global_step": 335076, "epoch": 2769} {"train_loss": -44.348602294921875, "global_step": 335077, "epoch": 2769} {"train_loss": -42.1557731628418, "global_step": 335078, "epoch": 2769} {"train_loss": -44.35206985473633, "global_step": 335079, "epoch": 2769} {"train_loss": -42.23453903198242, "global_step": 335080, "epoch": 2769} {"train_loss": -43.65340805053711, "global_step": 335081, "epoch": 2769} {"train_loss": -42.25165939331055, "global_step": 335082, "epoch": 2769} {"train_loss": -43.279640197753906, "global_step": 335083, "epoch": 2769} {"train_loss": -43.190731048583984, "global_step": 335084, "epoch": 2769} {"train_loss": -42.23466873168945, "global_step": 335085, "epoch": 2769} {"train_loss": -43.63546371459961, "global_step": 335086, "epoch": 2769} {"train_loss": -41.19955825805664, "global_step": 335087, "epoch": 2769} {"train_loss": -42.98057174682617, "global_step": 335088, "epoch": 2769} {"train_loss": -41.018394470214844, "global_step": 335089, "epoch": 2769} {"train_loss": -41.829864501953125, "global_step": 335090, "epoch": 2769} {"train_loss": -43.40961837768555, "global_step": 335091, "epoch": 2769} {"train_loss": -40.71493148803711, "global_step": 335092, "epoch": 2769} {"train_loss": -42.13185501098633, "global_step": 335093, "epoch": 2769} {"train_loss": -41.28457260131836, "global_step": 335094, "epoch": 2769} {"train_loss": -42.375614166259766, "global_step": 335095, "epoch": 2769} {"train_loss": -41.817405700683594, "global_step": 335096, "epoch": 2769} {"train_loss": -40.91862106323242, "global_step": 335097, "epoch": 2769} {"train_loss": -41.60943603515625, "global_step": 335098, "epoch": 2769} {"train_loss": -41.59627151489258, "global_step": 335099, "epoch": 2769} {"train_loss": -42.24933624267578, "global_step": 335100, "epoch": 2769} {"train_loss": -41.98334503173828, "global_step": 335101, "epoch": 2769} {"train_loss": -41.78314208984375, "global_step": 335102, "epoch": 2769} {"train_loss": -43.4528694152832, "global_step": 335103, "epoch": 2769} {"train_loss": -42.074745178222656, "global_step": 335104, "epoch": 2769} {"train_loss": -42.98554992675781, "global_step": 335105, "epoch": 2769} {"train_loss": -42.26853942871094, "global_step": 335106, "epoch": 2769} {"train_loss": -41.66651153564453, "global_step": 335107, "epoch": 2769} {"train_loss": -41.60129928588867, "global_step": 335108, "epoch": 2769} {"train_loss": -42.092586517333984, "global_step": 335109, "epoch": 2769} {"train_loss": -42.49738693237305, "global_step": 335110, "epoch": 2769} {"train_loss": -41.83687973022461, "global_step": 335111, "epoch": 2769} {"train_loss": -41.419677734375, "global_step": 335112, "epoch": 2769} {"train_loss": -43.218379974365234, "global_step": 335113, "epoch": 2769} {"train_loss": -43.216121673583984, "global_step": 335114, "epoch": 2769} {"train_loss": -43.36962890625, "global_step": 335115, "epoch": 2769} {"train_loss": -43.24752426147461, "global_step": 335116, "epoch": 2769} {"train_loss": -44.0912971496582, "global_step": 335117, "epoch": 2769} {"train_loss": -43.251914978027344, "global_step": 335118, "epoch": 2769} {"train_loss": -44.4172477722168, "global_step": 335119, "epoch": 2769} {"train_loss": -42.96343231201172, "global_step": 335120, "epoch": 2769} {"train_loss": -43.02191162109375, "global_step": 335121, "epoch": 2769} {"train_loss": -43.88013458251953, "global_step": 335122, "epoch": 2769} {"train_loss": -42.93688201904297, "global_step": 335123, "epoch": 2769} {"train_loss": -43.396484375, "global_step": 335124, "epoch": 2769} {"train_loss": -43.77506637573242, "global_step": 335125, "epoch": 2769} {"train_loss": -43.20729064941406, "global_step": 335126, "epoch": 2769} {"train_loss": -44.04206466674805, "global_step": 335127, "epoch": 2769} {"train_loss": -44.299007415771484, "global_step": 335128, "epoch": 2769} {"train_loss": -44.78672409057617, "global_step": 335129, "epoch": 2769} {"train_loss": -44.59906005859375, "global_step": 335130, "epoch": 2769} {"train_loss": -43.94865036010742, "global_step": 335131, "epoch": 2769} {"train_loss": -44.434356689453125, "global_step": 335132, "epoch": 2769} {"train_loss": -44.02999496459961, "global_step": 335133, "epoch": 2769} {"train_loss": -44.4844856262207, "global_step": 335134, "epoch": 2769} {"train_loss": -44.24481201171875, "global_step": 335135, "epoch": 2769} {"train_loss": -44.87099838256836, "global_step": 335136, "epoch": 2769} {"train_loss": -43.29217529296875, "global_step": 335137, "epoch": 2769} {"train_loss": -44.272220611572266, "global_step": 335138, "epoch": 2769} {"train_loss": -44.337913513183594, "global_step": 335139, "epoch": 2769} {"train_loss": -44.18949508666992, "global_step": 335140, "epoch": 2769} {"train_loss": -44.0513801574707, "global_step": 335141, "epoch": 2769} {"train_loss": -44.516326904296875, "global_step": 335142, "epoch": 2769} {"train_loss": -43.63151168823242, "global_step": 335143, "epoch": 2769} {"train_loss": -44.508419036865234, "global_step": 335144, "epoch": 2769} {"train_loss": -44.07682800292969, "global_step": 335145, "epoch": 2769} {"train_loss": -43.85526657104492, "global_step": 335146, "epoch": 2769} {"train_loss": -42.3419075012207, "global_step": 335147, "epoch": 2769} {"train_loss": -43.62368392944336, "global_step": 335148, "epoch": 2769} {"train_loss": -40.67694854736328, "global_step": 335149, "epoch": 2769} {"train_loss": -41.31427001953125, "global_step": 335150, "epoch": 2769} {"train_loss": -43.137020111083984, "global_step": 335151, "epoch": 2769} {"train_loss": -39.553688049316406, "global_step": 335152, "epoch": 2769} {"train_loss": -41.36774826049805, "global_step": 335153, "epoch": 2769} {"train_loss": -42.363258361816406, "global_step": 335154, "epoch": 2769} {"train_loss": -43.3144416809082, "global_step": 335155, "epoch": 2769} {"train_loss": -42.95629119873047, "global_step": 335156, "epoch": 2769} {"train_loss": -41.003761291503906, "global_step": 335157, "epoch": 2769} {"train_loss": -42.159420013427734, "global_step": 335158, "epoch": 2769} {"train_loss": -43.764007568359375, "global_step": 335159, "epoch": 2769} {"train_loss": -42.757530212402344, "global_step": 335160, "epoch": 2769} {"train_loss": -41.470638275146484, "global_step": 335161, "epoch": 2769} {"train_loss": -39.69533920288086, "global_step": 335162, "epoch": 2769} {"train_loss": -42.39577102661133, "global_step": 335163, "epoch": 2769} {"train_loss": -43.21574020385742, "global_step": 335164, "epoch": 2769} {"train_loss": -42.163787841796875, "global_step": 335165, "epoch": 2769} {"train_loss": -41.639129638671875, "global_step": 335166, "epoch": 2769} {"train_loss": -44.01862335205078, "global_step": 335167, "epoch": 2769} {"train_loss": -41.73670196533203, "global_step": 335168, "epoch": 2769} {"train_loss": -42.900782593025646, "global_step": 335169, "epoch": 2769, "val_loss": 2638890.0} {"train_loss": -43.705169677734375, "global_step": 335170, "epoch": 2770} {"train_loss": -40.709835052490234, "global_step": 335171, "epoch": 2770} {"train_loss": -41.63961410522461, "global_step": 335172, "epoch": 2770} {"train_loss": -42.002601623535156, "global_step": 335173, "epoch": 2770} {"train_loss": -40.7789192199707, "global_step": 335174, "epoch": 2770} {"train_loss": -42.68368148803711, "global_step": 335175, "epoch": 2770} {"train_loss": -43.47491455078125, "global_step": 335176, "epoch": 2770} {"train_loss": -42.53138732910156, "global_step": 335177, "epoch": 2770} {"train_loss": -42.20529556274414, "global_step": 335178, "epoch": 2770} {"train_loss": -44.303245544433594, "global_step": 335179, "epoch": 2770} {"train_loss": -41.58485794067383, "global_step": 335180, "epoch": 2770} {"train_loss": -42.65836715698242, "global_step": 335181, "epoch": 2770} {"train_loss": -41.883514404296875, "global_step": 335182, "epoch": 2770} {"train_loss": -41.95962142944336, "global_step": 335183, "epoch": 2770} {"train_loss": -42.5727424621582, "global_step": 335184, "epoch": 2770} {"train_loss": -42.94936752319336, "global_step": 335185, "epoch": 2770} {"train_loss": -43.532711029052734, "global_step": 335186, "epoch": 2770} {"train_loss": -42.1475944519043, "global_step": 335187, "epoch": 2770} {"train_loss": -43.425472259521484, "global_step": 335188, "epoch": 2770} {"train_loss": -41.50224685668945, "global_step": 335189, "epoch": 2770} {"train_loss": -44.2860107421875, "global_step": 335190, "epoch": 2770} {"train_loss": -42.582820892333984, "global_step": 335191, "epoch": 2770} {"train_loss": -43.7843017578125, "global_step": 335192, "epoch": 2770} {"train_loss": -43.365234375, "global_step": 335193, "epoch": 2770} {"train_loss": -43.61579132080078, "global_step": 335194, "epoch": 2770} {"train_loss": -43.40767288208008, "global_step": 335195, "epoch": 2770} {"train_loss": -43.821414947509766, "global_step": 335196, "epoch": 2770} {"train_loss": -43.30820846557617, "global_step": 335197, "epoch": 2770} {"train_loss": -44.18532180786133, "global_step": 335198, "epoch": 2770} {"train_loss": -43.744258880615234, "global_step": 335199, "epoch": 2770} {"train_loss": -44.118072509765625, "global_step": 335200, "epoch": 2770} {"train_loss": -44.257625579833984, "global_step": 335201, "epoch": 2770} {"train_loss": -44.27517318725586, "global_step": 335202, "epoch": 2770} {"train_loss": -44.04970169067383, "global_step": 335203, "epoch": 2770} {"train_loss": -44.474952697753906, "global_step": 335204, "epoch": 2770} {"train_loss": -44.277278900146484, "global_step": 335205, "epoch": 2770} {"train_loss": -44.3575325012207, "global_step": 335206, "epoch": 2770} {"train_loss": -43.81976318359375, "global_step": 335207, "epoch": 2770} {"train_loss": -44.771480560302734, "global_step": 335208, "epoch": 2770} {"train_loss": -44.81877136230469, "global_step": 335209, "epoch": 2770} {"train_loss": -44.56391143798828, "global_step": 335210, "epoch": 2770} {"train_loss": -44.220733642578125, "global_step": 335211, "epoch": 2770} {"train_loss": -44.79594802856445, "global_step": 335212, "epoch": 2770} {"train_loss": -44.60248565673828, "global_step": 335213, "epoch": 2770} {"train_loss": -43.809322357177734, "global_step": 335214, "epoch": 2770} {"train_loss": -44.63066482543945, "global_step": 335215, "epoch": 2770} {"train_loss": -43.85573196411133, "global_step": 335216, "epoch": 2770} {"train_loss": -44.2602424621582, "global_step": 335217, "epoch": 2770} {"train_loss": -45.0026969909668, "global_step": 335218, "epoch": 2770} {"train_loss": -44.5427131652832, "global_step": 335219, "epoch": 2770} {"train_loss": -44.639686584472656, "global_step": 335220, "epoch": 2770} {"train_loss": -44.61231994628906, "global_step": 335221, "epoch": 2770} {"train_loss": -44.284847259521484, "global_step": 335222, "epoch": 2770} {"train_loss": -44.75830841064453, "global_step": 335223, "epoch": 2770} {"train_loss": -44.78794860839844, "global_step": 335224, "epoch": 2770} {"train_loss": -44.956077575683594, "global_step": 335225, "epoch": 2770} {"train_loss": -44.60833740234375, "global_step": 335226, "epoch": 2770} {"train_loss": -45.25851821899414, "global_step": 335227, "epoch": 2770} {"train_loss": -44.20741653442383, "global_step": 335228, "epoch": 2770} {"train_loss": -44.73759078979492, "global_step": 335229, "epoch": 2770} {"train_loss": -45.61765670776367, "global_step": 335230, "epoch": 2770} {"train_loss": -44.252777099609375, "global_step": 335231, "epoch": 2770} {"train_loss": -44.298255920410156, "global_step": 335232, "epoch": 2770} {"train_loss": -44.05947494506836, "global_step": 335233, "epoch": 2770} {"train_loss": -44.44218063354492, "global_step": 335234, "epoch": 2770} {"train_loss": -45.39628982543945, "global_step": 335235, "epoch": 2770} {"train_loss": -44.781246185302734, "global_step": 335236, "epoch": 2770} {"train_loss": -43.86674118041992, "global_step": 335237, "epoch": 2770} {"train_loss": -45.5272102355957, "global_step": 335238, "epoch": 2770} {"train_loss": -45.49152755737305, "global_step": 335239, "epoch": 2770} {"train_loss": -44.16804122924805, "global_step": 335240, "epoch": 2770} {"train_loss": -44.0738639831543, "global_step": 335241, "epoch": 2770} {"train_loss": -44.62480926513672, "global_step": 335242, "epoch": 2770} {"train_loss": -45.061119079589844, "global_step": 335243, "epoch": 2770} {"train_loss": -43.88898468017578, "global_step": 335244, "epoch": 2770} {"train_loss": -43.88906478881836, "global_step": 335245, "epoch": 2770} {"train_loss": -42.82556915283203, "global_step": 335246, "epoch": 2770} {"train_loss": -43.966148376464844, "global_step": 335247, "epoch": 2770} {"train_loss": -43.635433197021484, "global_step": 335248, "epoch": 2770} {"train_loss": -42.357460021972656, "global_step": 335249, "epoch": 2770} {"train_loss": -43.95770263671875, "global_step": 335250, "epoch": 2770} {"train_loss": -41.197505950927734, "global_step": 335251, "epoch": 2770} {"train_loss": -43.46657943725586, "global_step": 335252, "epoch": 2770} {"train_loss": -41.2330322265625, "global_step": 335253, "epoch": 2770} {"train_loss": -42.59855270385742, "global_step": 335254, "epoch": 2770} {"train_loss": -39.40987777709961, "global_step": 335255, "epoch": 2770} {"train_loss": -40.678977966308594, "global_step": 335256, "epoch": 2770} {"train_loss": -40.253448486328125, "global_step": 335257, "epoch": 2770} {"train_loss": -40.48162841796875, "global_step": 335258, "epoch": 2770} {"train_loss": -38.16838455200195, "global_step": 335259, "epoch": 2770} {"train_loss": -42.3449821472168, "global_step": 335260, "epoch": 2770} {"train_loss": -39.50664138793945, "global_step": 335261, "epoch": 2770} {"train_loss": -41.767005920410156, "global_step": 335262, "epoch": 2770} {"train_loss": -41.46444320678711, "global_step": 335263, "epoch": 2770} {"train_loss": -40.85697555541992, "global_step": 335264, "epoch": 2770} {"train_loss": -40.43980026245117, "global_step": 335265, "epoch": 2770} {"train_loss": -41.008235931396484, "global_step": 335266, "epoch": 2770} {"train_loss": -40.66524887084961, "global_step": 335267, "epoch": 2770} {"train_loss": -43.110530853271484, "global_step": 335268, "epoch": 2770} {"train_loss": -40.85696029663086, "global_step": 335269, "epoch": 2770} {"train_loss": -41.872615814208984, "global_step": 335270, "epoch": 2770} {"train_loss": -42.097267150878906, "global_step": 335271, "epoch": 2770} {"train_loss": -42.23309326171875, "global_step": 335272, "epoch": 2770} {"train_loss": -42.72353744506836, "global_step": 335273, "epoch": 2770} {"train_loss": -43.70693588256836, "global_step": 335274, "epoch": 2770} {"train_loss": -43.16762924194336, "global_step": 335275, "epoch": 2770} {"train_loss": -43.03308868408203, "global_step": 335276, "epoch": 2770} {"train_loss": -43.79819869995117, "global_step": 335277, "epoch": 2770} {"train_loss": -43.244720458984375, "global_step": 335278, "epoch": 2770} {"train_loss": -43.347145080566406, "global_step": 335279, "epoch": 2770} {"train_loss": -43.63753128051758, "global_step": 335280, "epoch": 2770} {"train_loss": -42.83510208129883, "global_step": 335281, "epoch": 2770} {"train_loss": -42.980735778808594, "global_step": 335282, "epoch": 2770} {"train_loss": -44.2131462097168, "global_step": 335283, "epoch": 2770} {"train_loss": -42.02393341064453, "global_step": 335284, "epoch": 2770} {"train_loss": -43.42820358276367, "global_step": 335285, "epoch": 2770} {"train_loss": -43.0713996887207, "global_step": 335286, "epoch": 2770} {"train_loss": -43.49551010131836, "global_step": 335287, "epoch": 2770} {"train_loss": -44.28814697265625, "global_step": 335288, "epoch": 2770} {"train_loss": -43.66787338256836, "global_step": 335289, "epoch": 2770} {"train_loss": -43.26345689631691, "global_step": 335290, "epoch": 2770, "val_loss": 2485255.75} {"train_loss": -43.63651657104492, "global_step": 335291, "epoch": 2771} {"train_loss": -43.93790817260742, "global_step": 335292, "epoch": 2771} {"train_loss": -43.593544006347656, "global_step": 335293, "epoch": 2771} {"train_loss": -43.01760482788086, "global_step": 335294, "epoch": 2771} {"train_loss": -44.1953010559082, "global_step": 335295, "epoch": 2771} {"train_loss": -44.22917556762695, "global_step": 335296, "epoch": 2771} {"train_loss": -43.558013916015625, "global_step": 335297, "epoch": 2771} {"train_loss": -43.53408432006836, "global_step": 335298, "epoch": 2771} {"train_loss": -44.593238830566406, "global_step": 335299, "epoch": 2771} {"train_loss": -44.22180938720703, "global_step": 335300, "epoch": 2771} {"train_loss": -43.079586029052734, "global_step": 335301, "epoch": 2771} {"train_loss": -43.991207122802734, "global_step": 335302, "epoch": 2771} {"train_loss": -44.26396560668945, "global_step": 335303, "epoch": 2771} {"train_loss": -42.240413665771484, "global_step": 335304, "epoch": 2771} {"train_loss": -44.13783264160156, "global_step": 335305, "epoch": 2771} {"train_loss": -41.63441848754883, "global_step": 335306, "epoch": 2771} {"train_loss": -44.067501068115234, "global_step": 335307, "epoch": 2771} {"train_loss": -41.41008377075195, "global_step": 335308, "epoch": 2771} {"train_loss": -42.79764938354492, "global_step": 335309, "epoch": 2771} {"train_loss": -41.0328254699707, "global_step": 335310, "epoch": 2771} {"train_loss": -42.136653900146484, "global_step": 335311, "epoch": 2771} {"train_loss": -42.859169006347656, "global_step": 335312, "epoch": 2771} {"train_loss": -41.47159194946289, "global_step": 335313, "epoch": 2771} {"train_loss": -43.66910934448242, "global_step": 335314, "epoch": 2771} {"train_loss": -41.97787094116211, "global_step": 335315, "epoch": 2771} {"train_loss": -42.32966232299805, "global_step": 335316, "epoch": 2771} {"train_loss": -42.37354278564453, "global_step": 335317, "epoch": 2771} {"train_loss": -43.256710052490234, "global_step": 335318, "epoch": 2771} {"train_loss": -42.38957595825195, "global_step": 335319, "epoch": 2771} {"train_loss": -43.43146896362305, "global_step": 335320, "epoch": 2771} {"train_loss": -40.144569396972656, "global_step": 335321, "epoch": 2771} {"train_loss": -40.963584899902344, "global_step": 335322, "epoch": 2771} {"train_loss": -40.62974166870117, "global_step": 335323, "epoch": 2771} {"train_loss": -41.59047317504883, "global_step": 335324, "epoch": 2771} {"train_loss": -43.00263214111328, "global_step": 335325, "epoch": 2771} {"train_loss": -41.58783721923828, "global_step": 335326, "epoch": 2771} {"train_loss": -43.248531341552734, "global_step": 335327, "epoch": 2771} {"train_loss": -43.09622573852539, "global_step": 335328, "epoch": 2771} {"train_loss": -42.63115310668945, "global_step": 335329, "epoch": 2771} {"train_loss": -42.64309310913086, "global_step": 335330, "epoch": 2771} {"train_loss": -42.723236083984375, "global_step": 335331, "epoch": 2771} {"train_loss": -44.04473876953125, "global_step": 335332, "epoch": 2771} {"train_loss": -44.2153434753418, "global_step": 335333, "epoch": 2771} {"train_loss": -43.68021774291992, "global_step": 335334, "epoch": 2771} {"train_loss": -43.684574127197266, "global_step": 335335, "epoch": 2771} {"train_loss": -44.20793914794922, "global_step": 335336, "epoch": 2771} {"train_loss": -43.7215690612793, "global_step": 335337, "epoch": 2771} {"train_loss": -43.7242317199707, "global_step": 335338, "epoch": 2771} {"train_loss": -43.99666976928711, "global_step": 335339, "epoch": 2771} {"train_loss": -43.524078369140625, "global_step": 335340, "epoch": 2771} {"train_loss": -42.839927673339844, "global_step": 335341, "epoch": 2771} {"train_loss": -42.87724685668945, "global_step": 335342, "epoch": 2771} {"train_loss": -42.72101974487305, "global_step": 335343, "epoch": 2771} {"train_loss": -44.20228576660156, "global_step": 335344, "epoch": 2771} {"train_loss": -40.83000564575195, "global_step": 335345, "epoch": 2771} {"train_loss": -37.3043098449707, "global_step": 335346, "epoch": 2771} {"train_loss": -42.03356170654297, "global_step": 335347, "epoch": 2771} {"train_loss": -43.83012771606445, "global_step": 335348, "epoch": 2771} {"train_loss": -41.976070404052734, "global_step": 335349, "epoch": 2771} {"train_loss": -42.540489196777344, "global_step": 335350, "epoch": 2771} {"train_loss": -43.9094123840332, "global_step": 335351, "epoch": 2771} {"train_loss": -43.08499526977539, "global_step": 335352, "epoch": 2771} {"train_loss": -44.49943161010742, "global_step": 335353, "epoch": 2771} {"train_loss": -42.87221908569336, "global_step": 335354, "epoch": 2771} {"train_loss": -43.99758529663086, "global_step": 335355, "epoch": 2771} {"train_loss": -43.02203369140625, "global_step": 335356, "epoch": 2771} {"train_loss": -43.54916000366211, "global_step": 335357, "epoch": 2771} {"train_loss": -44.76841354370117, "global_step": 335358, "epoch": 2771} {"train_loss": -43.392425537109375, "global_step": 335359, "epoch": 2771} {"train_loss": -43.695003509521484, "global_step": 335360, "epoch": 2771} {"train_loss": -44.164791107177734, "global_step": 335361, "epoch": 2771} {"train_loss": -42.47824478149414, "global_step": 335362, "epoch": 2771} {"train_loss": -43.35524368286133, "global_step": 335363, "epoch": 2771} {"train_loss": -43.91737747192383, "global_step": 335364, "epoch": 2771} {"train_loss": -43.900115966796875, "global_step": 335365, "epoch": 2771} {"train_loss": -42.77559280395508, "global_step": 335366, "epoch": 2771} {"train_loss": -44.17494201660156, "global_step": 335367, "epoch": 2771} {"train_loss": -43.56996536254883, "global_step": 335368, "epoch": 2771} {"train_loss": -43.68916320800781, "global_step": 335369, "epoch": 2771} {"train_loss": -43.567230224609375, "global_step": 335370, "epoch": 2771} {"train_loss": -44.149085998535156, "global_step": 335371, "epoch": 2771} {"train_loss": -43.32601547241211, "global_step": 335372, "epoch": 2771} {"train_loss": -44.30476760864258, "global_step": 335373, "epoch": 2771} {"train_loss": -42.86098098754883, "global_step": 335374, "epoch": 2771} {"train_loss": -43.17277908325195, "global_step": 335375, "epoch": 2771} {"train_loss": -44.36622619628906, "global_step": 335376, "epoch": 2771} {"train_loss": -41.7100715637207, "global_step": 335377, "epoch": 2771} {"train_loss": -42.80294418334961, "global_step": 335378, "epoch": 2771} {"train_loss": -44.51300811767578, "global_step": 335379, "epoch": 2771} {"train_loss": -41.94624328613281, "global_step": 335380, "epoch": 2771} {"train_loss": -44.54339599609375, "global_step": 335381, "epoch": 2771} {"train_loss": -43.737300872802734, "global_step": 335382, "epoch": 2771} {"train_loss": -43.136775970458984, "global_step": 335383, "epoch": 2771} {"train_loss": -44.613037109375, "global_step": 335384, "epoch": 2771} {"train_loss": -43.080039978027344, "global_step": 335385, "epoch": 2771} {"train_loss": -44.08345031738281, "global_step": 335386, "epoch": 2771} {"train_loss": -43.874263763427734, "global_step": 335387, "epoch": 2771} {"train_loss": -43.5439567565918, "global_step": 335388, "epoch": 2771} {"train_loss": -43.5271110534668, "global_step": 335389, "epoch": 2771} {"train_loss": -42.76243591308594, "global_step": 335390, "epoch": 2771} {"train_loss": -44.654048919677734, "global_step": 335391, "epoch": 2771} {"train_loss": -42.47504425048828, "global_step": 335392, "epoch": 2771} {"train_loss": -44.29905319213867, "global_step": 335393, "epoch": 2771} {"train_loss": -44.06044006347656, "global_step": 335394, "epoch": 2771} {"train_loss": -43.96794128417969, "global_step": 335395, "epoch": 2771} {"train_loss": -43.6942024230957, "global_step": 335396, "epoch": 2771} {"train_loss": -44.34540939331055, "global_step": 335397, "epoch": 2771} {"train_loss": -44.00127410888672, "global_step": 335398, "epoch": 2771} {"train_loss": -43.64563751220703, "global_step": 335399, "epoch": 2771} {"train_loss": -43.4190788269043, "global_step": 335400, "epoch": 2771} {"train_loss": -44.828956604003906, "global_step": 335401, "epoch": 2771} {"train_loss": -42.82871627807617, "global_step": 335402, "epoch": 2771} {"train_loss": -44.766719818115234, "global_step": 335403, "epoch": 2771} {"train_loss": -42.51295471191406, "global_step": 335404, "epoch": 2771} {"train_loss": -44.023353576660156, "global_step": 335405, "epoch": 2771} {"train_loss": -43.934391021728516, "global_step": 335406, "epoch": 2771} {"train_loss": -43.18525314331055, "global_step": 335407, "epoch": 2771} {"train_loss": -44.19866943359375, "global_step": 335408, "epoch": 2771} {"train_loss": -43.7795295715332, "global_step": 335409, "epoch": 2771} {"train_loss": -44.4020881652832, "global_step": 335410, "epoch": 2771} {"train_loss": -43.261764337208646, "global_step": 335411, "epoch": 2771, "val_loss": 2587274.25} {"train_loss": -43.26851272583008, "global_step": 335412, "epoch": 2772} {"train_loss": -44.59528732299805, "global_step": 335413, "epoch": 2772} {"train_loss": -43.68122482299805, "global_step": 335414, "epoch": 2772} {"train_loss": -44.05622100830078, "global_step": 335415, "epoch": 2772} {"train_loss": -44.37410354614258, "global_step": 335416, "epoch": 2772} {"train_loss": -43.32795715332031, "global_step": 335417, "epoch": 2772} {"train_loss": -44.460968017578125, "global_step": 335418, "epoch": 2772} {"train_loss": -43.30177688598633, "global_step": 335419, "epoch": 2772} {"train_loss": -44.09531784057617, "global_step": 335420, "epoch": 2772} {"train_loss": -43.63521957397461, "global_step": 335421, "epoch": 2772} {"train_loss": -44.213539123535156, "global_step": 335422, "epoch": 2772} {"train_loss": -44.97035217285156, "global_step": 335423, "epoch": 2772} {"train_loss": -44.019405364990234, "global_step": 335424, "epoch": 2772} {"train_loss": -44.66965866088867, "global_step": 335425, "epoch": 2772} {"train_loss": -44.18543243408203, "global_step": 335426, "epoch": 2772} {"train_loss": -44.740230560302734, "global_step": 335427, "epoch": 2772} {"train_loss": -43.966651916503906, "global_step": 335428, "epoch": 2772} {"train_loss": -45.12614822387695, "global_step": 335429, "epoch": 2772} {"train_loss": -43.13629913330078, "global_step": 335430, "epoch": 2772} {"train_loss": -45.12617111206055, "global_step": 335431, "epoch": 2772} {"train_loss": -43.59676742553711, "global_step": 335432, "epoch": 2772} {"train_loss": -44.44330978393555, "global_step": 335433, "epoch": 2772} {"train_loss": -44.4147834777832, "global_step": 335434, "epoch": 2772} {"train_loss": -44.39199447631836, "global_step": 335435, "epoch": 2772} {"train_loss": -44.20017623901367, "global_step": 335436, "epoch": 2772} {"train_loss": -44.513916015625, "global_step": 335437, "epoch": 2772} {"train_loss": -44.666542053222656, "global_step": 335438, "epoch": 2772} {"train_loss": -43.981353759765625, "global_step": 335439, "epoch": 2772} {"train_loss": -44.63438034057617, "global_step": 335440, "epoch": 2772} {"train_loss": -43.954139709472656, "global_step": 335441, "epoch": 2772} {"train_loss": -44.77518844604492, "global_step": 335442, "epoch": 2772} {"train_loss": -43.78671646118164, "global_step": 335443, "epoch": 2772} {"train_loss": -44.47504806518555, "global_step": 335444, "epoch": 2772} {"train_loss": -44.509429931640625, "global_step": 335445, "epoch": 2772} {"train_loss": -44.425697326660156, "global_step": 335446, "epoch": 2772} {"train_loss": -44.12415313720703, "global_step": 335447, "epoch": 2772} {"train_loss": -44.35858154296875, "global_step": 335448, "epoch": 2772} {"train_loss": -44.16080093383789, "global_step": 335449, "epoch": 2772} {"train_loss": -44.594871520996094, "global_step": 335450, "epoch": 2772} {"train_loss": -43.568111419677734, "global_step": 335451, "epoch": 2772} {"train_loss": -44.76934051513672, "global_step": 335452, "epoch": 2772} {"train_loss": -44.2474479675293, "global_step": 335453, "epoch": 2772} {"train_loss": -44.3359489440918, "global_step": 335454, "epoch": 2772} {"train_loss": -44.83363723754883, "global_step": 335455, "epoch": 2772} {"train_loss": -44.70231246948242, "global_step": 335456, "epoch": 2772} {"train_loss": -44.627105712890625, "global_step": 335457, "epoch": 2772} {"train_loss": -44.3218994140625, "global_step": 335458, "epoch": 2772} {"train_loss": -43.77433395385742, "global_step": 335459, "epoch": 2772} {"train_loss": -44.2723388671875, "global_step": 335460, "epoch": 2772} {"train_loss": -44.405677795410156, "global_step": 335461, "epoch": 2772} {"train_loss": -44.711151123046875, "global_step": 335462, "epoch": 2772} {"train_loss": -43.91302490234375, "global_step": 335463, "epoch": 2772} {"train_loss": -44.40542221069336, "global_step": 335464, "epoch": 2772} {"train_loss": -44.49114990234375, "global_step": 335465, "epoch": 2772} {"train_loss": -44.741783142089844, "global_step": 335466, "epoch": 2772} {"train_loss": -44.145294189453125, "global_step": 335467, "epoch": 2772} {"train_loss": -44.79462432861328, "global_step": 335468, "epoch": 2772} {"train_loss": -44.788814544677734, "global_step": 335469, "epoch": 2772} {"train_loss": -44.038875579833984, "global_step": 335470, "epoch": 2772} {"train_loss": -43.91066360473633, "global_step": 335471, "epoch": 2772} {"train_loss": -43.29502487182617, "global_step": 335472, "epoch": 2772} {"train_loss": -44.476722717285156, "global_step": 335473, "epoch": 2772} {"train_loss": -44.54874801635742, "global_step": 335474, "epoch": 2772} {"train_loss": -43.76641845703125, "global_step": 335475, "epoch": 2772} {"train_loss": -44.771148681640625, "global_step": 335476, "epoch": 2772} {"train_loss": -44.46104431152344, "global_step": 335477, "epoch": 2772} {"train_loss": -43.60930252075195, "global_step": 335478, "epoch": 2772} {"train_loss": -43.68874740600586, "global_step": 335479, "epoch": 2772} {"train_loss": -44.336551666259766, "global_step": 335480, "epoch": 2772} {"train_loss": -44.71726608276367, "global_step": 335481, "epoch": 2772} {"train_loss": -43.79421615600586, "global_step": 335482, "epoch": 2772} {"train_loss": -43.8025016784668, "global_step": 335483, "epoch": 2772} {"train_loss": -43.87174606323242, "global_step": 335484, "epoch": 2772} {"train_loss": -43.784088134765625, "global_step": 335485, "epoch": 2772} {"train_loss": -43.5657958984375, "global_step": 335486, "epoch": 2772} {"train_loss": -43.778236389160156, "global_step": 335487, "epoch": 2772} {"train_loss": -44.63225173950195, "global_step": 335488, "epoch": 2772} {"train_loss": -43.060523986816406, "global_step": 335489, "epoch": 2772} {"train_loss": -43.73823165893555, "global_step": 335490, "epoch": 2772} {"train_loss": -44.40007400512695, "global_step": 335491, "epoch": 2772} {"train_loss": -44.3275260925293, "global_step": 335492, "epoch": 2772} {"train_loss": -43.76689910888672, "global_step": 335493, "epoch": 2772} {"train_loss": -41.82883071899414, "global_step": 335494, "epoch": 2772} {"train_loss": -43.39966583251953, "global_step": 335495, "epoch": 2772} {"train_loss": -41.87793731689453, "global_step": 335496, "epoch": 2772} {"train_loss": -41.398841857910156, "global_step": 335497, "epoch": 2772} {"train_loss": -41.626461029052734, "global_step": 335498, "epoch": 2772} {"train_loss": -42.75437545776367, "global_step": 335499, "epoch": 2772} {"train_loss": -41.97195053100586, "global_step": 335500, "epoch": 2772} {"train_loss": -43.96291732788086, "global_step": 335501, "epoch": 2772} {"train_loss": -42.52099609375, "global_step": 335502, "epoch": 2772} {"train_loss": -43.6025505065918, "global_step": 335503, "epoch": 2772} {"train_loss": -43.92472457885742, "global_step": 335504, "epoch": 2772} {"train_loss": -43.632625579833984, "global_step": 335505, "epoch": 2772} {"train_loss": -42.61151123046875, "global_step": 335506, "epoch": 2772} {"train_loss": -44.23112106323242, "global_step": 335507, "epoch": 2772} {"train_loss": -42.36750411987305, "global_step": 335508, "epoch": 2772} {"train_loss": -43.17502975463867, "global_step": 335509, "epoch": 2772} {"train_loss": -43.62399673461914, "global_step": 335510, "epoch": 2772} {"train_loss": -41.436397552490234, "global_step": 335511, "epoch": 2772} {"train_loss": -43.91748046875, "global_step": 335512, "epoch": 2772} {"train_loss": -39.260494232177734, "global_step": 335513, "epoch": 2772} {"train_loss": -39.85732650756836, "global_step": 335514, "epoch": 2772} {"train_loss": -42.38825607299805, "global_step": 335515, "epoch": 2772} {"train_loss": -37.85274124145508, "global_step": 335516, "epoch": 2772} {"train_loss": -41.53396224975586, "global_step": 335517, "epoch": 2772} {"train_loss": -39.703861236572266, "global_step": 335518, "epoch": 2772} {"train_loss": -41.00986862182617, "global_step": 335519, "epoch": 2772} {"train_loss": -40.99696731567383, "global_step": 335520, "epoch": 2772} {"train_loss": -40.896541595458984, "global_step": 335521, "epoch": 2772} {"train_loss": -42.25968551635742, "global_step": 335522, "epoch": 2772} {"train_loss": -42.25885009765625, "global_step": 335523, "epoch": 2772} {"train_loss": -42.175289154052734, "global_step": 335524, "epoch": 2772} {"train_loss": -39.73226547241211, "global_step": 335525, "epoch": 2772} {"train_loss": -42.7308464050293, "global_step": 335526, "epoch": 2772} {"train_loss": -42.377376556396484, "global_step": 335527, "epoch": 2772} {"train_loss": -43.1895751953125, "global_step": 335528, "epoch": 2772} {"train_loss": -42.87850570678711, "global_step": 335529, "epoch": 2772} {"train_loss": -41.20914077758789, "global_step": 335530, "epoch": 2772} {"train_loss": -42.3139762878418, "global_step": 335531, "epoch": 2772} {"train_loss": -43.52204901324816, "global_step": 335532, "epoch": 2772, "val_loss": 2525709.0} {"train_loss": -43.188629150390625, "global_step": 335533, "epoch": 2773} {"train_loss": -42.320247650146484, "global_step": 335534, "epoch": 2773} {"train_loss": -42.958309173583984, "global_step": 335535, "epoch": 2773} {"train_loss": -43.61198425292969, "global_step": 335536, "epoch": 2773} {"train_loss": -42.6402702331543, "global_step": 335537, "epoch": 2773} {"train_loss": -43.541229248046875, "global_step": 335538, "epoch": 2773} {"train_loss": -43.98552322387695, "global_step": 335539, "epoch": 2773} {"train_loss": -43.396339416503906, "global_step": 335540, "epoch": 2773} {"train_loss": -43.44385528564453, "global_step": 335541, "epoch": 2773} {"train_loss": -43.864662170410156, "global_step": 335542, "epoch": 2773} {"train_loss": -43.6295166015625, "global_step": 335543, "epoch": 2773} {"train_loss": -44.003074645996094, "global_step": 335544, "epoch": 2773} {"train_loss": -43.83523178100586, "global_step": 335545, "epoch": 2773} {"train_loss": -44.286041259765625, "global_step": 335546, "epoch": 2773} {"train_loss": -43.529884338378906, "global_step": 335547, "epoch": 2773} {"train_loss": -44.66504669189453, "global_step": 335548, "epoch": 2773} {"train_loss": -43.364437103271484, "global_step": 335549, "epoch": 2773} {"train_loss": -43.851383209228516, "global_step": 335550, "epoch": 2773} {"train_loss": -45.02277755737305, "global_step": 335551, "epoch": 2773} {"train_loss": -43.06061553955078, "global_step": 335552, "epoch": 2773} {"train_loss": -43.52366256713867, "global_step": 335553, "epoch": 2773} {"train_loss": -44.42026901245117, "global_step": 335554, "epoch": 2773} {"train_loss": -44.236934661865234, "global_step": 335555, "epoch": 2773} {"train_loss": -44.27353286743164, "global_step": 335556, "epoch": 2773} {"train_loss": -43.80366897583008, "global_step": 335557, "epoch": 2773} {"train_loss": -44.550228118896484, "global_step": 335558, "epoch": 2773} {"train_loss": -42.71297836303711, "global_step": 335559, "epoch": 2773} {"train_loss": -43.652034759521484, "global_step": 335560, "epoch": 2773} {"train_loss": -45.004310607910156, "global_step": 335561, "epoch": 2773} {"train_loss": -43.89719009399414, "global_step": 335562, "epoch": 2773} {"train_loss": -44.295555114746094, "global_step": 335563, "epoch": 2773} {"train_loss": -44.1938591003418, "global_step": 335564, "epoch": 2773} {"train_loss": -44.0604248046875, "global_step": 335565, "epoch": 2773} {"train_loss": -44.40529251098633, "global_step": 335566, "epoch": 2773} {"train_loss": -43.86567306518555, "global_step": 335567, "epoch": 2773} {"train_loss": -44.25261306762695, "global_step": 335568, "epoch": 2773} {"train_loss": -44.6683464050293, "global_step": 335569, "epoch": 2773} {"train_loss": -44.338069915771484, "global_step": 335570, "epoch": 2773} {"train_loss": -44.241127014160156, "global_step": 335571, "epoch": 2773} {"train_loss": -44.07270431518555, "global_step": 335572, "epoch": 2773} {"train_loss": -44.234737396240234, "global_step": 335573, "epoch": 2773} {"train_loss": -43.89368438720703, "global_step": 335574, "epoch": 2773} {"train_loss": -42.738277435302734, "global_step": 335575, "epoch": 2773} {"train_loss": -44.96938705444336, "global_step": 335576, "epoch": 2773} {"train_loss": -42.39482498168945, "global_step": 335577, "epoch": 2773} {"train_loss": -42.0683708190918, "global_step": 335578, "epoch": 2773} {"train_loss": -43.28617477416992, "global_step": 335579, "epoch": 2773} {"train_loss": -42.450740814208984, "global_step": 335580, "epoch": 2773} {"train_loss": -44.282588958740234, "global_step": 335581, "epoch": 2773} {"train_loss": -43.95466995239258, "global_step": 335582, "epoch": 2773} {"train_loss": -43.3511848449707, "global_step": 335583, "epoch": 2773} {"train_loss": -42.63153839111328, "global_step": 335584, "epoch": 2773} {"train_loss": -43.84031295776367, "global_step": 335585, "epoch": 2773} {"train_loss": -44.30196762084961, "global_step": 335586, "epoch": 2773} {"train_loss": -42.68561553955078, "global_step": 335587, "epoch": 2773} {"train_loss": -43.28752517700195, "global_step": 335588, "epoch": 2773} {"train_loss": -43.42609786987305, "global_step": 335589, "epoch": 2773} {"train_loss": -43.972537994384766, "global_step": 335590, "epoch": 2773} {"train_loss": -44.28969955444336, "global_step": 335591, "epoch": 2773} {"train_loss": -44.493865966796875, "global_step": 335592, "epoch": 2773} {"train_loss": -44.39675521850586, "global_step": 335593, "epoch": 2773} {"train_loss": -44.6112174987793, "global_step": 335594, "epoch": 2773} {"train_loss": -44.58479309082031, "global_step": 335595, "epoch": 2773} {"train_loss": -44.572933197021484, "global_step": 335596, "epoch": 2773} {"train_loss": -44.29518508911133, "global_step": 335597, "epoch": 2773} {"train_loss": -44.95101547241211, "global_step": 335598, "epoch": 2773} {"train_loss": -45.35063171386719, "global_step": 335599, "epoch": 2773} {"train_loss": -44.869144439697266, "global_step": 335600, "epoch": 2773} {"train_loss": -44.8123893737793, "global_step": 335601, "epoch": 2773} {"train_loss": -44.82160949707031, "global_step": 335602, "epoch": 2773} {"train_loss": -45.030635833740234, "global_step": 335603, "epoch": 2773} {"train_loss": -44.81498718261719, "global_step": 335604, "epoch": 2773} {"train_loss": -44.75208282470703, "global_step": 335605, "epoch": 2773} {"train_loss": -44.61880874633789, "global_step": 335606, "epoch": 2773} {"train_loss": -44.753639221191406, "global_step": 335607, "epoch": 2773} {"train_loss": -45.17514419555664, "global_step": 335608, "epoch": 2773} {"train_loss": -44.65373229980469, "global_step": 335609, "epoch": 2773} {"train_loss": -45.12272644042969, "global_step": 335610, "epoch": 2773} {"train_loss": -45.10310745239258, "global_step": 335611, "epoch": 2773} {"train_loss": -44.96029281616211, "global_step": 335612, "epoch": 2773} {"train_loss": -44.5090217590332, "global_step": 335613, "epoch": 2773} {"train_loss": -45.30025863647461, "global_step": 335614, "epoch": 2773} {"train_loss": -44.170467376708984, "global_step": 335615, "epoch": 2773} {"train_loss": -44.0739860534668, "global_step": 335616, "epoch": 2773} {"train_loss": -45.072357177734375, "global_step": 335617, "epoch": 2773} {"train_loss": -45.1034049987793, "global_step": 335618, "epoch": 2773} {"train_loss": -44.48591232299805, "global_step": 335619, "epoch": 2773} {"train_loss": -44.57008743286133, "global_step": 335620, "epoch": 2773} {"train_loss": -44.81113815307617, "global_step": 335621, "epoch": 2773} {"train_loss": -43.76717758178711, "global_step": 335622, "epoch": 2773} {"train_loss": -44.36367416381836, "global_step": 335623, "epoch": 2773} {"train_loss": -44.95960998535156, "global_step": 335624, "epoch": 2773} {"train_loss": -43.85415267944336, "global_step": 335625, "epoch": 2773} {"train_loss": -44.500484466552734, "global_step": 335626, "epoch": 2773} {"train_loss": -43.005584716796875, "global_step": 335627, "epoch": 2773} {"train_loss": -40.063255310058594, "global_step": 335628, "epoch": 2773} {"train_loss": -42.18625259399414, "global_step": 335629, "epoch": 2773} {"train_loss": -44.75174331665039, "global_step": 335630, "epoch": 2773} {"train_loss": -39.67637634277344, "global_step": 335631, "epoch": 2773} {"train_loss": -42.3241081237793, "global_step": 335632, "epoch": 2773} {"train_loss": -44.4483642578125, "global_step": 335633, "epoch": 2773} {"train_loss": -40.03021240234375, "global_step": 335634, "epoch": 2773} {"train_loss": -43.993988037109375, "global_step": 335635, "epoch": 2773} {"train_loss": -41.04602813720703, "global_step": 335636, "epoch": 2773} {"train_loss": -41.630950927734375, "global_step": 335637, "epoch": 2773} {"train_loss": -42.169925689697266, "global_step": 335638, "epoch": 2773} {"train_loss": -40.3233528137207, "global_step": 335639, "epoch": 2773} {"train_loss": -41.4692497253418, "global_step": 335640, "epoch": 2773} {"train_loss": -41.525264739990234, "global_step": 335641, "epoch": 2773} {"train_loss": -41.119537353515625, "global_step": 335642, "epoch": 2773} {"train_loss": -41.04052734375, "global_step": 335643, "epoch": 2773} {"train_loss": -42.01919174194336, "global_step": 335644, "epoch": 2773} {"train_loss": -41.942047119140625, "global_step": 335645, "epoch": 2773} {"train_loss": -41.80965042114258, "global_step": 335646, "epoch": 2773} {"train_loss": -40.35859298706055, "global_step": 335647, "epoch": 2773} {"train_loss": -42.7535285949707, "global_step": 335648, "epoch": 2773} {"train_loss": -40.69124221801758, "global_step": 335649, "epoch": 2773} {"train_loss": -42.64741516113281, "global_step": 335650, "epoch": 2773} {"train_loss": -40.15431213378906, "global_step": 335651, "epoch": 2773} {"train_loss": -43.57950973510742, "global_step": 335652, "epoch": 2773} {"train_loss": -43.5622103352192, "global_step": 335653, "epoch": 2773, "val_loss": 2576988.75} {"train_loss": -42.705177307128906, "global_step": 335654, "epoch": 2774} {"train_loss": -41.53125762939453, "global_step": 335655, "epoch": 2774} {"train_loss": -42.3673210144043, "global_step": 335656, "epoch": 2774} {"train_loss": -43.35963821411133, "global_step": 335657, "epoch": 2774} {"train_loss": -41.7801513671875, "global_step": 335658, "epoch": 2774} {"train_loss": -43.34746170043945, "global_step": 335659, "epoch": 2774} {"train_loss": -41.022342681884766, "global_step": 335660, "epoch": 2774} {"train_loss": -43.60590362548828, "global_step": 335661, "epoch": 2774} {"train_loss": -42.929603576660156, "global_step": 335662, "epoch": 2774} {"train_loss": -42.44700241088867, "global_step": 335663, "epoch": 2774} {"train_loss": -43.43758773803711, "global_step": 335664, "epoch": 2774} {"train_loss": -42.69575881958008, "global_step": 335665, "epoch": 2774} {"train_loss": -43.86766052246094, "global_step": 335666, "epoch": 2774} {"train_loss": -42.83041000366211, "global_step": 335667, "epoch": 2774} {"train_loss": -43.36616134643555, "global_step": 335668, "epoch": 2774} {"train_loss": -43.173580169677734, "global_step": 335669, "epoch": 2774} {"train_loss": -43.11634063720703, "global_step": 335670, "epoch": 2774} {"train_loss": -43.947410583496094, "global_step": 335671, "epoch": 2774} {"train_loss": -43.769771575927734, "global_step": 335672, "epoch": 2774} {"train_loss": -42.7950439453125, "global_step": 335673, "epoch": 2774} {"train_loss": -43.928653717041016, "global_step": 335674, "epoch": 2774} {"train_loss": -42.839202880859375, "global_step": 335675, "epoch": 2774} {"train_loss": -43.82179641723633, "global_step": 335676, "epoch": 2774} {"train_loss": -43.671409606933594, "global_step": 335677, "epoch": 2774} {"train_loss": -44.40140914916992, "global_step": 335678, "epoch": 2774} {"train_loss": -43.77162551879883, "global_step": 335679, "epoch": 2774} {"train_loss": -44.46003341674805, "global_step": 335680, "epoch": 2774} {"train_loss": -44.01869201660156, "global_step": 335681, "epoch": 2774} {"train_loss": -43.87999725341797, "global_step": 335682, "epoch": 2774} {"train_loss": -44.25930404663086, "global_step": 335683, "epoch": 2774} {"train_loss": -44.16566848754883, "global_step": 335684, "epoch": 2774} {"train_loss": -44.2111701965332, "global_step": 335685, "epoch": 2774} {"train_loss": -44.29484558105469, "global_step": 335686, "epoch": 2774} {"train_loss": -44.22206115722656, "global_step": 335687, "epoch": 2774} {"train_loss": -43.84761047363281, "global_step": 335688, "epoch": 2774} {"train_loss": -43.77313232421875, "global_step": 335689, "epoch": 2774} {"train_loss": -44.049598693847656, "global_step": 335690, "epoch": 2774} {"train_loss": -44.13181686401367, "global_step": 335691, "epoch": 2774} {"train_loss": -44.195186614990234, "global_step": 335692, "epoch": 2774} {"train_loss": -44.402748107910156, "global_step": 335693, "epoch": 2774} {"train_loss": -44.054176330566406, "global_step": 335694, "epoch": 2774} {"train_loss": -44.27656936645508, "global_step": 335695, "epoch": 2774} {"train_loss": -44.299598693847656, "global_step": 335696, "epoch": 2774} {"train_loss": -44.482234954833984, "global_step": 335697, "epoch": 2774} {"train_loss": -44.598201751708984, "global_step": 335698, "epoch": 2774} {"train_loss": -44.353206634521484, "global_step": 335699, "epoch": 2774} {"train_loss": -44.38958740234375, "global_step": 335700, "epoch": 2774} {"train_loss": -44.4604606628418, "global_step": 335701, "epoch": 2774} {"train_loss": -44.29509735107422, "global_step": 335702, "epoch": 2774} {"train_loss": -44.51569747924805, "global_step": 335703, "epoch": 2774} {"train_loss": -44.91495132446289, "global_step": 335704, "epoch": 2774} {"train_loss": -44.21027755737305, "global_step": 335705, "epoch": 2774} {"train_loss": -43.95879364013672, "global_step": 335706, "epoch": 2774} {"train_loss": -44.61426544189453, "global_step": 335707, "epoch": 2774} {"train_loss": -44.6487922668457, "global_step": 335708, "epoch": 2774} {"train_loss": -44.69697952270508, "global_step": 335709, "epoch": 2774} {"train_loss": -44.383583068847656, "global_step": 335710, "epoch": 2774} {"train_loss": -44.95343780517578, "global_step": 335711, "epoch": 2774} {"train_loss": -44.50722885131836, "global_step": 335712, "epoch": 2774} {"train_loss": -44.885494232177734, "global_step": 335713, "epoch": 2774} {"train_loss": -44.65737533569336, "global_step": 335714, "epoch": 2774} {"train_loss": -44.73167037963867, "global_step": 335715, "epoch": 2774} {"train_loss": -44.856632232666016, "global_step": 335716, "epoch": 2774} {"train_loss": -44.425498962402344, "global_step": 335717, "epoch": 2774} {"train_loss": -44.2952995300293, "global_step": 335718, "epoch": 2774} {"train_loss": -44.11865234375, "global_step": 335719, "epoch": 2774} {"train_loss": -44.73834228515625, "global_step": 335720, "epoch": 2774} {"train_loss": -44.34541702270508, "global_step": 335721, "epoch": 2774} {"train_loss": -44.3698844909668, "global_step": 335722, "epoch": 2774} {"train_loss": -43.86194610595703, "global_step": 335723, "epoch": 2774} {"train_loss": -43.62715148925781, "global_step": 335724, "epoch": 2774} {"train_loss": -44.4837760925293, "global_step": 335725, "epoch": 2774} {"train_loss": -41.95138168334961, "global_step": 335726, "epoch": 2774} {"train_loss": -44.467891693115234, "global_step": 335727, "epoch": 2774} {"train_loss": -43.282535552978516, "global_step": 335728, "epoch": 2774} {"train_loss": -43.40720748901367, "global_step": 335729, "epoch": 2774} {"train_loss": -44.73867416381836, "global_step": 335730, "epoch": 2774} {"train_loss": -41.883731842041016, "global_step": 335731, "epoch": 2774} {"train_loss": -43.72394561767578, "global_step": 335732, "epoch": 2774} {"train_loss": -43.948509216308594, "global_step": 335733, "epoch": 2774} {"train_loss": -42.59867858886719, "global_step": 335734, "epoch": 2774} {"train_loss": -44.390865325927734, "global_step": 335735, "epoch": 2774} {"train_loss": -41.730411529541016, "global_step": 335736, "epoch": 2774} {"train_loss": -43.80992126464844, "global_step": 335737, "epoch": 2774} {"train_loss": -44.13593292236328, "global_step": 335738, "epoch": 2774} {"train_loss": -42.4633903503418, "global_step": 335739, "epoch": 2774} {"train_loss": -45.01761245727539, "global_step": 335740, "epoch": 2774} {"train_loss": -41.148311614990234, "global_step": 335741, "epoch": 2774} {"train_loss": -43.539180755615234, "global_step": 335742, "epoch": 2774} {"train_loss": -39.17324447631836, "global_step": 335743, "epoch": 2774} {"train_loss": -39.541831970214844, "global_step": 335744, "epoch": 2774} {"train_loss": -39.47216796875, "global_step": 335745, "epoch": 2774} {"train_loss": -39.58136749267578, "global_step": 335746, "epoch": 2774} {"train_loss": -40.019039154052734, "global_step": 335747, "epoch": 2774} {"train_loss": -38.99762725830078, "global_step": 335748, "epoch": 2774} {"train_loss": -40.581756591796875, "global_step": 335749, "epoch": 2774} {"train_loss": -40.3405647277832, "global_step": 335750, "epoch": 2774} {"train_loss": -40.06678771972656, "global_step": 335751, "epoch": 2774} {"train_loss": -40.49872970581055, "global_step": 335752, "epoch": 2774} {"train_loss": -40.41428756713867, "global_step": 335753, "epoch": 2774} {"train_loss": -40.56428146362305, "global_step": 335754, "epoch": 2774} {"train_loss": -40.466041564941406, "global_step": 335755, "epoch": 2774} {"train_loss": -40.57148361206055, "global_step": 335756, "epoch": 2774} {"train_loss": -41.207679748535156, "global_step": 335757, "epoch": 2774} {"train_loss": -40.604530334472656, "global_step": 335758, "epoch": 2774} {"train_loss": -41.38311767578125, "global_step": 335759, "epoch": 2774} {"train_loss": -41.46879959106445, "global_step": 335760, "epoch": 2774} {"train_loss": -41.28274917602539, "global_step": 335761, "epoch": 2774} {"train_loss": -41.24158477783203, "global_step": 335762, "epoch": 2774} {"train_loss": -41.912391662597656, "global_step": 335763, "epoch": 2774} {"train_loss": -41.596885681152344, "global_step": 335764, "epoch": 2774} {"train_loss": -41.069419860839844, "global_step": 335765, "epoch": 2774} {"train_loss": -41.5941047668457, "global_step": 335766, "epoch": 2774} {"train_loss": -41.73124694824219, "global_step": 335767, "epoch": 2774} {"train_loss": -41.771881103515625, "global_step": 335768, "epoch": 2774} {"train_loss": -41.9846305847168, "global_step": 335769, "epoch": 2774} {"train_loss": -42.667903900146484, "global_step": 335770, "epoch": 2774} {"train_loss": -41.85364532470703, "global_step": 335771, "epoch": 2774} {"train_loss": -42.218788146972656, "global_step": 335772, "epoch": 2774} {"train_loss": -42.94130325317383, "global_step": 335773, "epoch": 2774} {"train_loss": -43.03859707540717, "global_step": 335774, "epoch": 2774, "val_loss": 2467850.0} {"train_loss": -43.164241790771484, "global_step": 335775, "epoch": 2775} {"train_loss": -43.556575775146484, "global_step": 335776, "epoch": 2775} {"train_loss": -44.28657150268555, "global_step": 335777, "epoch": 2775} {"train_loss": -43.79548263549805, "global_step": 335778, "epoch": 2775} {"train_loss": -44.14900588989258, "global_step": 335779, "epoch": 2775} {"train_loss": -44.375038146972656, "global_step": 335780, "epoch": 2775} {"train_loss": -43.70884323120117, "global_step": 335781, "epoch": 2775} {"train_loss": -44.54283905029297, "global_step": 335782, "epoch": 2775} {"train_loss": -44.421871185302734, "global_step": 335783, "epoch": 2775} {"train_loss": -44.08978271484375, "global_step": 335784, "epoch": 2775} {"train_loss": -44.97798156738281, "global_step": 335785, "epoch": 2775} {"train_loss": -44.884620666503906, "global_step": 335786, "epoch": 2775} {"train_loss": -44.74522018432617, "global_step": 335787, "epoch": 2775} {"train_loss": -44.73964309692383, "global_step": 335788, "epoch": 2775} {"train_loss": -44.79336166381836, "global_step": 335789, "epoch": 2775} {"train_loss": -45.0904426574707, "global_step": 335790, "epoch": 2775} {"train_loss": -44.3207893371582, "global_step": 335791, "epoch": 2775} {"train_loss": -44.078643798828125, "global_step": 335792, "epoch": 2775} {"train_loss": -44.50802230834961, "global_step": 335793, "epoch": 2775} {"train_loss": -44.644752502441406, "global_step": 335794, "epoch": 2775} {"train_loss": -45.1585693359375, "global_step": 335795, "epoch": 2775} {"train_loss": -44.336936950683594, "global_step": 335796, "epoch": 2775} {"train_loss": -44.95166015625, "global_step": 335797, "epoch": 2775} {"train_loss": -45.326438903808594, "global_step": 335798, "epoch": 2775} {"train_loss": -44.186397552490234, "global_step": 335799, "epoch": 2775} {"train_loss": -44.80787658691406, "global_step": 335800, "epoch": 2775} {"train_loss": -43.8706169128418, "global_step": 335801, "epoch": 2775} {"train_loss": -43.0625114440918, "global_step": 335802, "epoch": 2775} {"train_loss": -43.265174865722656, "global_step": 335803, "epoch": 2775} {"train_loss": -39.33537292480469, "global_step": 335804, "epoch": 2775} {"train_loss": -41.58342742919922, "global_step": 335805, "epoch": 2775} {"train_loss": -42.362205505371094, "global_step": 335806, "epoch": 2775} {"train_loss": -37.77427291870117, "global_step": 335807, "epoch": 2775} {"train_loss": -41.041744232177734, "global_step": 335808, "epoch": 2775} {"train_loss": -40.62609100341797, "global_step": 335809, "epoch": 2775} {"train_loss": -37.70086669921875, "global_step": 335810, "epoch": 2775} {"train_loss": -42.14927291870117, "global_step": 335811, "epoch": 2775} {"train_loss": -39.85969543457031, "global_step": 335812, "epoch": 2775} {"train_loss": -42.60910415649414, "global_step": 335813, "epoch": 2775} {"train_loss": -40.980899810791016, "global_step": 335814, "epoch": 2775} {"train_loss": -38.9205436706543, "global_step": 335815, "epoch": 2775} {"train_loss": -42.657352447509766, "global_step": 335816, "epoch": 2775} {"train_loss": -39.37997817993164, "global_step": 335817, "epoch": 2775} {"train_loss": -42.67005157470703, "global_step": 335818, "epoch": 2775} {"train_loss": -40.991878509521484, "global_step": 335819, "epoch": 2775} {"train_loss": -43.10561752319336, "global_step": 335820, "epoch": 2775} {"train_loss": -41.23504638671875, "global_step": 335821, "epoch": 2775} {"train_loss": -42.36566162109375, "global_step": 335822, "epoch": 2775} {"train_loss": -42.30029296875, "global_step": 335823, "epoch": 2775} {"train_loss": -42.667022705078125, "global_step": 335824, "epoch": 2775} {"train_loss": -43.6435661315918, "global_step": 335825, "epoch": 2775} {"train_loss": -42.82596969604492, "global_step": 335826, "epoch": 2775} {"train_loss": -43.33890914916992, "global_step": 335827, "epoch": 2775} {"train_loss": -43.38069534301758, "global_step": 335828, "epoch": 2775} {"train_loss": -43.25751876831055, "global_step": 335829, "epoch": 2775} {"train_loss": -43.96810531616211, "global_step": 335830, "epoch": 2775} {"train_loss": -43.15774154663086, "global_step": 335831, "epoch": 2775} {"train_loss": -42.5679817199707, "global_step": 335832, "epoch": 2775} {"train_loss": -43.10468673706055, "global_step": 335833, "epoch": 2775} {"train_loss": -42.88186264038086, "global_step": 335834, "epoch": 2775} {"train_loss": -43.68526840209961, "global_step": 335835, "epoch": 2775} {"train_loss": -43.84364700317383, "global_step": 335836, "epoch": 2775} {"train_loss": -43.09746170043945, "global_step": 335837, "epoch": 2775} {"train_loss": -44.106239318847656, "global_step": 335838, "epoch": 2775} {"train_loss": -43.72805404663086, "global_step": 335839, "epoch": 2775} {"train_loss": -43.478267669677734, "global_step": 335840, "epoch": 2775} {"train_loss": -44.80373764038086, "global_step": 335841, "epoch": 2775} {"train_loss": -43.70913314819336, "global_step": 335842, "epoch": 2775} {"train_loss": -44.30218505859375, "global_step": 335843, "epoch": 2775} {"train_loss": -44.63201904296875, "global_step": 335844, "epoch": 2775} {"train_loss": -44.23801803588867, "global_step": 335845, "epoch": 2775} {"train_loss": -44.32548904418945, "global_step": 335846, "epoch": 2775} {"train_loss": -44.41887283325195, "global_step": 335847, "epoch": 2775} {"train_loss": -44.348201751708984, "global_step": 335848, "epoch": 2775} {"train_loss": -44.340579986572266, "global_step": 335849, "epoch": 2775} {"train_loss": -44.15412521362305, "global_step": 335850, "epoch": 2775} {"train_loss": -44.30826950073242, "global_step": 335851, "epoch": 2775} {"train_loss": -44.4251708984375, "global_step": 335852, "epoch": 2775} {"train_loss": -44.742706298828125, "global_step": 335853, "epoch": 2775} {"train_loss": -44.84503936767578, "global_step": 335854, "epoch": 2775} {"train_loss": -44.31313705444336, "global_step": 335855, "epoch": 2775} {"train_loss": -44.840938568115234, "global_step": 335856, "epoch": 2775} {"train_loss": -44.49734115600586, "global_step": 335857, "epoch": 2775} {"train_loss": -44.78726577758789, "global_step": 335858, "epoch": 2775} {"train_loss": -44.81226348876953, "global_step": 335859, "epoch": 2775} {"train_loss": -44.53909683227539, "global_step": 335860, "epoch": 2775} {"train_loss": -44.898799896240234, "global_step": 335861, "epoch": 2775} {"train_loss": -44.86157989501953, "global_step": 335862, "epoch": 2775} {"train_loss": -44.67927169799805, "global_step": 335863, "epoch": 2775} {"train_loss": -45.1527214050293, "global_step": 335864, "epoch": 2775} {"train_loss": -44.981483459472656, "global_step": 335865, "epoch": 2775} {"train_loss": -44.89572525024414, "global_step": 335866, "epoch": 2775} {"train_loss": -44.63264846801758, "global_step": 335867, "epoch": 2775} {"train_loss": -45.16746139526367, "global_step": 335868, "epoch": 2775} {"train_loss": -44.45047378540039, "global_step": 335869, "epoch": 2775} {"train_loss": -45.44313430786133, "global_step": 335870, "epoch": 2775} {"train_loss": -44.105098724365234, "global_step": 335871, "epoch": 2775} {"train_loss": -45.39567184448242, "global_step": 335872, "epoch": 2775} {"train_loss": -44.4289665222168, "global_step": 335873, "epoch": 2775} {"train_loss": -45.02978515625, "global_step": 335874, "epoch": 2775} {"train_loss": -44.7241325378418, "global_step": 335875, "epoch": 2775} {"train_loss": -45.1277961730957, "global_step": 335876, "epoch": 2775} {"train_loss": -45.67226028442383, "global_step": 335877, "epoch": 2775} {"train_loss": -45.06502914428711, "global_step": 335878, "epoch": 2775} {"train_loss": -45.464988708496094, "global_step": 335879, "epoch": 2775} {"train_loss": -45.22869110107422, "global_step": 335880, "epoch": 2775} {"train_loss": -45.3497428894043, "global_step": 335881, "epoch": 2775} {"train_loss": -45.62312316894531, "global_step": 335882, "epoch": 2775} {"train_loss": -45.44620895385742, "global_step": 335883, "epoch": 2775} {"train_loss": -45.09765625, "global_step": 335884, "epoch": 2775} {"train_loss": -45.157615661621094, "global_step": 335885, "epoch": 2775} {"train_loss": -44.58527374267578, "global_step": 335886, "epoch": 2775} {"train_loss": -45.3973388671875, "global_step": 335887, "epoch": 2775} {"train_loss": -44.90536117553711, "global_step": 335888, "epoch": 2775} {"train_loss": -45.22563552856445, "global_step": 335889, "epoch": 2775} {"train_loss": -45.079227447509766, "global_step": 335890, "epoch": 2775} {"train_loss": -45.549129486083984, "global_step": 335891, "epoch": 2775} {"train_loss": -45.60889434814453, "global_step": 335892, "epoch": 2775} {"train_loss": -45.14634323120117, "global_step": 335893, "epoch": 2775} {"train_loss": -45.31943893432617, "global_step": 335894, "epoch": 2775} {"train_loss": -43.882585761960875, "global_step": 335895, "epoch": 2775, "val_loss": 2604309.5} {"train_loss": -45.10822677612305, "global_step": 335896, "epoch": 2776} {"train_loss": -44.95784378051758, "global_step": 335897, "epoch": 2776} {"train_loss": -44.8521842956543, "global_step": 335898, "epoch": 2776} {"train_loss": -45.38270568847656, "global_step": 335899, "epoch": 2776} {"train_loss": -44.95185089111328, "global_step": 335900, "epoch": 2776} {"train_loss": -44.82658004760742, "global_step": 335901, "epoch": 2776} {"train_loss": -43.814083099365234, "global_step": 335902, "epoch": 2776} {"train_loss": -43.657928466796875, "global_step": 335903, "epoch": 2776} {"train_loss": -43.45623779296875, "global_step": 335904, "epoch": 2776} {"train_loss": -44.01242446899414, "global_step": 335905, "epoch": 2776} {"train_loss": -43.55158615112305, "global_step": 335906, "epoch": 2776} {"train_loss": -43.759132385253906, "global_step": 335907, "epoch": 2776} {"train_loss": -44.371238708496094, "global_step": 335908, "epoch": 2776} {"train_loss": -43.2542724609375, "global_step": 335909, "epoch": 2776} {"train_loss": -44.33758544921875, "global_step": 335910, "epoch": 2776} {"train_loss": -41.8984489440918, "global_step": 335911, "epoch": 2776} {"train_loss": -44.74296951293945, "global_step": 335912, "epoch": 2776} {"train_loss": -42.243431091308594, "global_step": 335913, "epoch": 2776} {"train_loss": -42.635501861572266, "global_step": 335914, "epoch": 2776} {"train_loss": -43.7123908996582, "global_step": 335915, "epoch": 2776} {"train_loss": -39.974178314208984, "global_step": 335916, "epoch": 2776} {"train_loss": -41.77158737182617, "global_step": 335917, "epoch": 2776} {"train_loss": -40.195167541503906, "global_step": 335918, "epoch": 2776} {"train_loss": -42.634647369384766, "global_step": 335919, "epoch": 2776} {"train_loss": -40.439144134521484, "global_step": 335920, "epoch": 2776} {"train_loss": -43.4901008605957, "global_step": 335921, "epoch": 2776} {"train_loss": -41.1849365234375, "global_step": 335922, "epoch": 2776} {"train_loss": -42.725215911865234, "global_step": 335923, "epoch": 2776} {"train_loss": -41.15790939331055, "global_step": 335924, "epoch": 2776} {"train_loss": -39.931724548339844, "global_step": 335925, "epoch": 2776} {"train_loss": -41.56856155395508, "global_step": 335926, "epoch": 2776} {"train_loss": -40.016944885253906, "global_step": 335927, "epoch": 2776} {"train_loss": -42.99522018432617, "global_step": 335928, "epoch": 2776} {"train_loss": -41.2596321105957, "global_step": 335929, "epoch": 2776} {"train_loss": -43.132625579833984, "global_step": 335930, "epoch": 2776} {"train_loss": -40.25483703613281, "global_step": 335931, "epoch": 2776} {"train_loss": -43.272674560546875, "global_step": 335932, "epoch": 2776} {"train_loss": -41.64143371582031, "global_step": 335933, "epoch": 2776} {"train_loss": -43.65470504760742, "global_step": 335934, "epoch": 2776} {"train_loss": -43.00192642211914, "global_step": 335935, "epoch": 2776} {"train_loss": -42.959835052490234, "global_step": 335936, "epoch": 2776} {"train_loss": -43.39014434814453, "global_step": 335937, "epoch": 2776} {"train_loss": -43.07133102416992, "global_step": 335938, "epoch": 2776} {"train_loss": -43.80988693237305, "global_step": 335939, "epoch": 2776} {"train_loss": -43.8372802734375, "global_step": 335940, "epoch": 2776} {"train_loss": -43.72944259643555, "global_step": 335941, "epoch": 2776} {"train_loss": -44.081905364990234, "global_step": 335942, "epoch": 2776} {"train_loss": -44.764713287353516, "global_step": 335943, "epoch": 2776} {"train_loss": -44.3680534362793, "global_step": 335944, "epoch": 2776} {"train_loss": -44.1952018737793, "global_step": 335945, "epoch": 2776} {"train_loss": -44.3535041809082, "global_step": 335946, "epoch": 2776} {"train_loss": -44.27553176879883, "global_step": 335947, "epoch": 2776} {"train_loss": -44.268795013427734, "global_step": 335948, "epoch": 2776} {"train_loss": -44.37581253051758, "global_step": 335949, "epoch": 2776} {"train_loss": -44.4242057800293, "global_step": 335950, "epoch": 2776} {"train_loss": -44.06370162963867, "global_step": 335951, "epoch": 2776} {"train_loss": -43.82786178588867, "global_step": 335952, "epoch": 2776} {"train_loss": -44.71632385253906, "global_step": 335953, "epoch": 2776} {"train_loss": -44.009273529052734, "global_step": 335954, "epoch": 2776} {"train_loss": -44.36615753173828, "global_step": 335955, "epoch": 2776} {"train_loss": -44.56354522705078, "global_step": 335956, "epoch": 2776} {"train_loss": -44.59654998779297, "global_step": 335957, "epoch": 2776} {"train_loss": -44.839717864990234, "global_step": 335958, "epoch": 2776} {"train_loss": -43.934059143066406, "global_step": 335959, "epoch": 2776} {"train_loss": -44.150856018066406, "global_step": 335960, "epoch": 2776} {"train_loss": -44.52711868286133, "global_step": 335961, "epoch": 2776} {"train_loss": -43.11973190307617, "global_step": 335962, "epoch": 2776} {"train_loss": -44.52736282348633, "global_step": 335963, "epoch": 2776} {"train_loss": -43.680233001708984, "global_step": 335964, "epoch": 2776} {"train_loss": -44.9143180847168, "global_step": 335965, "epoch": 2776} {"train_loss": -44.54696273803711, "global_step": 335966, "epoch": 2776} {"train_loss": -44.04052734375, "global_step": 335967, "epoch": 2776} {"train_loss": -44.567543029785156, "global_step": 335968, "epoch": 2776} {"train_loss": -44.773643493652344, "global_step": 335969, "epoch": 2776} {"train_loss": -43.84855270385742, "global_step": 335970, "epoch": 2776} {"train_loss": -44.1802978515625, "global_step": 335971, "epoch": 2776} {"train_loss": -44.489959716796875, "global_step": 335972, "epoch": 2776} {"train_loss": -45.1192512512207, "global_step": 335973, "epoch": 2776} {"train_loss": -44.25572204589844, "global_step": 335974, "epoch": 2776} {"train_loss": -44.76594924926758, "global_step": 335975, "epoch": 2776} {"train_loss": -45.0312614440918, "global_step": 335976, "epoch": 2776} {"train_loss": -43.558956146240234, "global_step": 335977, "epoch": 2776} {"train_loss": -44.11344909667969, "global_step": 335978, "epoch": 2776} {"train_loss": -44.668155670166016, "global_step": 335979, "epoch": 2776} {"train_loss": -43.0744514465332, "global_step": 335980, "epoch": 2776} {"train_loss": -44.24760055541992, "global_step": 335981, "epoch": 2776} {"train_loss": -43.60152816772461, "global_step": 335982, "epoch": 2776} {"train_loss": -44.34401321411133, "global_step": 335983, "epoch": 2776} {"train_loss": -44.46259307861328, "global_step": 335984, "epoch": 2776} {"train_loss": -43.42209243774414, "global_step": 335985, "epoch": 2776} {"train_loss": -44.35355758666992, "global_step": 335986, "epoch": 2776} {"train_loss": -44.16831588745117, "global_step": 335987, "epoch": 2776} {"train_loss": -44.35169219970703, "global_step": 335988, "epoch": 2776} {"train_loss": -44.56379318237305, "global_step": 335989, "epoch": 2776} {"train_loss": -44.2374382019043, "global_step": 335990, "epoch": 2776} {"train_loss": -43.59025192260742, "global_step": 335991, "epoch": 2776} {"train_loss": -45.29884338378906, "global_step": 335992, "epoch": 2776} {"train_loss": -42.842498779296875, "global_step": 335993, "epoch": 2776} {"train_loss": -44.53398513793945, "global_step": 335994, "epoch": 2776} {"train_loss": -44.839561462402344, "global_step": 335995, "epoch": 2776} {"train_loss": -44.14258575439453, "global_step": 335996, "epoch": 2776} {"train_loss": -44.392608642578125, "global_step": 335997, "epoch": 2776} {"train_loss": -45.01192092895508, "global_step": 335998, "epoch": 2776} {"train_loss": -44.90633773803711, "global_step": 335999, "epoch": 2776} {"train_loss": -45.032440185546875, "global_step": 336000, "epoch": 2776} {"train_loss": -45.05660629272461, "global_step": 336001, "epoch": 2776} {"train_loss": -44.99202346801758, "global_step": 336002, "epoch": 2776} {"train_loss": -43.891693115234375, "global_step": 336003, "epoch": 2776} {"train_loss": -45.038330078125, "global_step": 336004, "epoch": 2776} {"train_loss": -44.704872131347656, "global_step": 336005, "epoch": 2776} {"train_loss": -44.35908889770508, "global_step": 336006, "epoch": 2776} {"train_loss": -45.041378021240234, "global_step": 336007, "epoch": 2776} {"train_loss": -44.5018424987793, "global_step": 336008, "epoch": 2776} {"train_loss": -44.70209884643555, "global_step": 336009, "epoch": 2776} {"train_loss": -44.57688522338867, "global_step": 336010, "epoch": 2776} {"train_loss": -45.02668380737305, "global_step": 336011, "epoch": 2776} {"train_loss": -44.62281036376953, "global_step": 336012, "epoch": 2776} {"train_loss": -44.551631927490234, "global_step": 336013, "epoch": 2776} {"train_loss": -44.725032806396484, "global_step": 336014, "epoch": 2776} {"train_loss": -44.234981536865234, "global_step": 336015, "epoch": 2776} {"train_loss": -43.827825625080706, "global_step": 336016, "epoch": 2776, "val_loss": 2495772.25} {"train_loss": -43.71623611450195, "global_step": 336017, "epoch": 2777} {"train_loss": -43.96637725830078, "global_step": 336018, "epoch": 2777} {"train_loss": -44.97117233276367, "global_step": 336019, "epoch": 2777} {"train_loss": -43.178932189941406, "global_step": 336020, "epoch": 2777} {"train_loss": -43.64975357055664, "global_step": 336021, "epoch": 2777} {"train_loss": -41.91147994995117, "global_step": 336022, "epoch": 2777} {"train_loss": -44.50749206542969, "global_step": 336023, "epoch": 2777} {"train_loss": -43.880889892578125, "global_step": 336024, "epoch": 2777} {"train_loss": -40.93560028076172, "global_step": 336025, "epoch": 2777} {"train_loss": -40.881893157958984, "global_step": 336026, "epoch": 2777} {"train_loss": -41.38306427001953, "global_step": 336027, "epoch": 2777} {"train_loss": -41.4974250793457, "global_step": 336028, "epoch": 2777} {"train_loss": -42.340145111083984, "global_step": 336029, "epoch": 2777} {"train_loss": -42.341041564941406, "global_step": 336030, "epoch": 2777} {"train_loss": -42.25919723510742, "global_step": 336031, "epoch": 2777} {"train_loss": -42.258583068847656, "global_step": 336032, "epoch": 2777} {"train_loss": -42.60643768310547, "global_step": 336033, "epoch": 2777} {"train_loss": -42.67274475097656, "global_step": 336034, "epoch": 2777} {"train_loss": -43.48355484008789, "global_step": 336035, "epoch": 2777} {"train_loss": -43.954524993896484, "global_step": 336036, "epoch": 2777} {"train_loss": -44.231544494628906, "global_step": 336037, "epoch": 2777} {"train_loss": -43.209163665771484, "global_step": 336038, "epoch": 2777} {"train_loss": -44.4089469909668, "global_step": 336039, "epoch": 2777} {"train_loss": -43.650508880615234, "global_step": 336040, "epoch": 2777} {"train_loss": -42.51560592651367, "global_step": 336041, "epoch": 2777} {"train_loss": -43.30548858642578, "global_step": 336042, "epoch": 2777} {"train_loss": -42.44783401489258, "global_step": 336043, "epoch": 2777} {"train_loss": -42.61776351928711, "global_step": 336044, "epoch": 2777} {"train_loss": -42.87191390991211, "global_step": 336045, "epoch": 2777} {"train_loss": -43.456214904785156, "global_step": 336046, "epoch": 2777} {"train_loss": -43.936527252197266, "global_step": 336047, "epoch": 2777} {"train_loss": -42.1438102722168, "global_step": 336048, "epoch": 2777} {"train_loss": -43.25185775756836, "global_step": 336049, "epoch": 2777} {"train_loss": -43.52341079711914, "global_step": 336050, "epoch": 2777} {"train_loss": -41.949676513671875, "global_step": 336051, "epoch": 2777} {"train_loss": -43.779212951660156, "global_step": 336052, "epoch": 2777} {"train_loss": -40.208919525146484, "global_step": 336053, "epoch": 2777} {"train_loss": -41.31417465209961, "global_step": 336054, "epoch": 2777} {"train_loss": -42.6192741394043, "global_step": 336055, "epoch": 2777} {"train_loss": -42.39947509765625, "global_step": 336056, "epoch": 2777} {"train_loss": -41.36497497558594, "global_step": 336057, "epoch": 2777} {"train_loss": -42.16097640991211, "global_step": 336058, "epoch": 2777} {"train_loss": -41.30404281616211, "global_step": 336059, "epoch": 2777} {"train_loss": -42.392940521240234, "global_step": 336060, "epoch": 2777} {"train_loss": -40.980567932128906, "global_step": 336061, "epoch": 2777} {"train_loss": -42.704986572265625, "global_step": 336062, "epoch": 2777} {"train_loss": -43.51642990112305, "global_step": 336063, "epoch": 2777} {"train_loss": -43.01499557495117, "global_step": 336064, "epoch": 2777} {"train_loss": -42.74037551879883, "global_step": 336065, "epoch": 2777} {"train_loss": -43.38344955444336, "global_step": 336066, "epoch": 2777} {"train_loss": -43.33894348144531, "global_step": 336067, "epoch": 2777} {"train_loss": -43.96270751953125, "global_step": 336068, "epoch": 2777} {"train_loss": -43.916786193847656, "global_step": 336069, "epoch": 2777} {"train_loss": -44.247249603271484, "global_step": 336070, "epoch": 2777} {"train_loss": -44.37562561035156, "global_step": 336071, "epoch": 2777} {"train_loss": -43.888946533203125, "global_step": 336072, "epoch": 2777} {"train_loss": -43.764156341552734, "global_step": 336073, "epoch": 2777} {"train_loss": -44.64910888671875, "global_step": 336074, "epoch": 2777} {"train_loss": -44.208045959472656, "global_step": 336075, "epoch": 2777} {"train_loss": -44.08222198486328, "global_step": 336076, "epoch": 2777} {"train_loss": -43.78642272949219, "global_step": 336077, "epoch": 2777} {"train_loss": -44.608089447021484, "global_step": 336078, "epoch": 2777} {"train_loss": -43.793861389160156, "global_step": 336079, "epoch": 2777} {"train_loss": -45.211647033691406, "global_step": 336080, "epoch": 2777} {"train_loss": -44.34177780151367, "global_step": 336081, "epoch": 2777} {"train_loss": -45.12250900268555, "global_step": 336082, "epoch": 2777} {"train_loss": -44.75794219970703, "global_step": 336083, "epoch": 2777} {"train_loss": -44.86683654785156, "global_step": 336084, "epoch": 2777} {"train_loss": -44.467529296875, "global_step": 336085, "epoch": 2777} {"train_loss": -45.21283721923828, "global_step": 336086, "epoch": 2777} {"train_loss": -44.22224807739258, "global_step": 336087, "epoch": 2777} {"train_loss": -44.22074508666992, "global_step": 336088, "epoch": 2777} {"train_loss": -44.7608757019043, "global_step": 336089, "epoch": 2777} {"train_loss": -44.65900421142578, "global_step": 336090, "epoch": 2777} {"train_loss": -44.624847412109375, "global_step": 336091, "epoch": 2777} {"train_loss": -43.84431076049805, "global_step": 336092, "epoch": 2777} {"train_loss": -45.15081024169922, "global_step": 336093, "epoch": 2777} {"train_loss": -44.71773910522461, "global_step": 336094, "epoch": 2777} {"train_loss": -44.37141799926758, "global_step": 336095, "epoch": 2777} {"train_loss": -43.54779815673828, "global_step": 336096, "epoch": 2777} {"train_loss": -42.675777435302734, "global_step": 336097, "epoch": 2777} {"train_loss": -45.00372314453125, "global_step": 336098, "epoch": 2777} {"train_loss": -44.9336051940918, "global_step": 336099, "epoch": 2777} {"train_loss": -44.86963653564453, "global_step": 336100, "epoch": 2777} {"train_loss": -44.48373031616211, "global_step": 336101, "epoch": 2777} {"train_loss": -44.626914978027344, "global_step": 336102, "epoch": 2777} {"train_loss": -45.17274856567383, "global_step": 336103, "epoch": 2777} {"train_loss": -45.22829055786133, "global_step": 336104, "epoch": 2777} {"train_loss": -45.07865524291992, "global_step": 336105, "epoch": 2777} {"train_loss": -45.32598114013672, "global_step": 336106, "epoch": 2777} {"train_loss": -44.3296012878418, "global_step": 336107, "epoch": 2777} {"train_loss": -44.4500846862793, "global_step": 336108, "epoch": 2777} {"train_loss": -44.530303955078125, "global_step": 336109, "epoch": 2777} {"train_loss": -45.54718780517578, "global_step": 336110, "epoch": 2777} {"train_loss": -44.66712188720703, "global_step": 336111, "epoch": 2777} {"train_loss": -43.55735397338867, "global_step": 336112, "epoch": 2777} {"train_loss": -44.10667037963867, "global_step": 336113, "epoch": 2777} {"train_loss": -45.34305191040039, "global_step": 336114, "epoch": 2777} {"train_loss": -44.06584548950195, "global_step": 336115, "epoch": 2777} {"train_loss": -43.21625900268555, "global_step": 336116, "epoch": 2777} {"train_loss": -41.508216857910156, "global_step": 336117, "epoch": 2777} {"train_loss": -43.730369567871094, "global_step": 336118, "epoch": 2777} {"train_loss": -43.52723693847656, "global_step": 336119, "epoch": 2777} {"train_loss": -43.130550384521484, "global_step": 336120, "epoch": 2777} {"train_loss": -42.16440963745117, "global_step": 336121, "epoch": 2777} {"train_loss": -43.01533126831055, "global_step": 336122, "epoch": 2777} {"train_loss": -44.24784469604492, "global_step": 336123, "epoch": 2777} {"train_loss": -42.56672286987305, "global_step": 336124, "epoch": 2777} {"train_loss": -42.02878189086914, "global_step": 336125, "epoch": 2777} {"train_loss": -43.88554382324219, "global_step": 336126, "epoch": 2777} {"train_loss": -27.650909423828125, "global_step": 336127, "epoch": 2777} {"train_loss": -38.932960510253906, "global_step": 336128, "epoch": 2777} {"train_loss": -41.558349609375, "global_step": 336129, "epoch": 2777} {"train_loss": -38.57770919799805, "global_step": 336130, "epoch": 2777} {"train_loss": -36.36001205444336, "global_step": 336131, "epoch": 2777} {"train_loss": -37.80713653564453, "global_step": 336132, "epoch": 2777} {"train_loss": -40.4789924621582, "global_step": 336133, "epoch": 2777} {"train_loss": -36.73854446411133, "global_step": 336134, "epoch": 2777} {"train_loss": -41.81146240234375, "global_step": 336135, "epoch": 2777} {"train_loss": -37.31989288330078, "global_step": 336136, "epoch": 2777} {"train_loss": -43.03420588595808, "global_step": 336137, "epoch": 2777, "val_loss": 3151160.75} {"train_loss": -38.82094192504883, "global_step": 336138, "epoch": 2778} {"train_loss": -40.58536911010742, "global_step": 336139, "epoch": 2778} {"train_loss": -38.9246940612793, "global_step": 336140, "epoch": 2778} {"train_loss": -41.22779846191406, "global_step": 336141, "epoch": 2778} {"train_loss": -41.39549255371094, "global_step": 336142, "epoch": 2778} {"train_loss": -37.03494644165039, "global_step": 336143, "epoch": 2778} {"train_loss": -32.438575744628906, "global_step": 336144, "epoch": 2778} {"train_loss": -33.86017990112305, "global_step": 336145, "epoch": 2778} {"train_loss": -37.24367141723633, "global_step": 336146, "epoch": 2778} {"train_loss": -39.880062103271484, "global_step": 336147, "epoch": 2778} {"train_loss": -40.547550201416016, "global_step": 336148, "epoch": 2778} {"train_loss": -39.41455841064453, "global_step": 336149, "epoch": 2778} {"train_loss": -40.98889923095703, "global_step": 336150, "epoch": 2778} {"train_loss": -37.90119552612305, "global_step": 336151, "epoch": 2778} {"train_loss": -40.846412658691406, "global_step": 336152, "epoch": 2778} {"train_loss": -31.778650283813477, "global_step": 336153, "epoch": 2778} {"train_loss": -40.9084587097168, "global_step": 336154, "epoch": 2778} {"train_loss": -40.5172119140625, "global_step": 336155, "epoch": 2778} {"train_loss": -36.847320556640625, "global_step": 336156, "epoch": 2778} {"train_loss": -39.91162872314453, "global_step": 336157, "epoch": 2778} {"train_loss": -24.851058959960938, "global_step": 336158, "epoch": 2778} {"train_loss": -39.41897964477539, "global_step": 336159, "epoch": 2778} {"train_loss": -35.49605178833008, "global_step": 336160, "epoch": 2778} {"train_loss": -39.149757385253906, "global_step": 336161, "epoch": 2778} {"train_loss": -32.42485427856445, "global_step": 336162, "epoch": 2778} {"train_loss": -37.90127182006836, "global_step": 336163, "epoch": 2778} {"train_loss": -39.19302749633789, "global_step": 336164, "epoch": 2778} {"train_loss": -36.095680236816406, "global_step": 336165, "epoch": 2778} {"train_loss": -38.14885711669922, "global_step": 336166, "epoch": 2778} {"train_loss": -39.9351692199707, "global_step": 336167, "epoch": 2778} {"train_loss": -40.998016357421875, "global_step": 336168, "epoch": 2778} {"train_loss": -38.53284454345703, "global_step": 336169, "epoch": 2778} {"train_loss": -39.43292999267578, "global_step": 336170, "epoch": 2778} {"train_loss": -38.006065368652344, "global_step": 336171, "epoch": 2778} {"train_loss": -39.38216781616211, "global_step": 336172, "epoch": 2778} {"train_loss": -41.238033294677734, "global_step": 336173, "epoch": 2778} {"train_loss": -41.584346771240234, "global_step": 336174, "epoch": 2778} {"train_loss": -41.28046798706055, "global_step": 336175, "epoch": 2778} {"train_loss": -41.1963996887207, "global_step": 336176, "epoch": 2778} {"train_loss": -41.04640579223633, "global_step": 336177, "epoch": 2778} {"train_loss": -41.085304260253906, "global_step": 336178, "epoch": 2778} {"train_loss": -40.958072662353516, "global_step": 336179, "epoch": 2778} {"train_loss": -41.385597229003906, "global_step": 336180, "epoch": 2778} {"train_loss": -41.61188507080078, "global_step": 336181, "epoch": 2778} {"train_loss": -40.86842727661133, "global_step": 336182, "epoch": 2778} {"train_loss": -40.42605209350586, "global_step": 336183, "epoch": 2778} {"train_loss": -41.067970275878906, "global_step": 336184, "epoch": 2778} {"train_loss": -41.712646484375, "global_step": 336185, "epoch": 2778} {"train_loss": -40.72379684448242, "global_step": 336186, "epoch": 2778} {"train_loss": -42.048583984375, "global_step": 336187, "epoch": 2778} {"train_loss": -41.85520553588867, "global_step": 336188, "epoch": 2778} {"train_loss": -42.3657341003418, "global_step": 336189, "epoch": 2778} {"train_loss": -42.33539962768555, "global_step": 336190, "epoch": 2778} {"train_loss": -41.70687484741211, "global_step": 336191, "epoch": 2778} {"train_loss": -42.095943450927734, "global_step": 336192, "epoch": 2778} {"train_loss": -42.75687789916992, "global_step": 336193, "epoch": 2778} {"train_loss": -42.2552490234375, "global_step": 336194, "epoch": 2778} {"train_loss": -42.367977142333984, "global_step": 336195, "epoch": 2778} {"train_loss": -41.794219970703125, "global_step": 336196, "epoch": 2778} {"train_loss": -42.59023666381836, "global_step": 336197, "epoch": 2778} {"train_loss": -42.4610481262207, "global_step": 336198, "epoch": 2778} {"train_loss": -42.24409866333008, "global_step": 336199, "epoch": 2778} {"train_loss": -42.717281341552734, "global_step": 336200, "epoch": 2778} {"train_loss": -42.55729293823242, "global_step": 336201, "epoch": 2778} {"train_loss": -42.46521759033203, "global_step": 336202, "epoch": 2778} {"train_loss": -42.63420867919922, "global_step": 336203, "epoch": 2778} {"train_loss": -42.181312561035156, "global_step": 336204, "epoch": 2778} {"train_loss": -43.23583984375, "global_step": 336205, "epoch": 2778} {"train_loss": -42.9926643371582, "global_step": 336206, "epoch": 2778} {"train_loss": -42.91201400756836, "global_step": 336207, "epoch": 2778} {"train_loss": -43.14423370361328, "global_step": 336208, "epoch": 2778} {"train_loss": -43.48756790161133, "global_step": 336209, "epoch": 2778} {"train_loss": -43.300018310546875, "global_step": 336210, "epoch": 2778} {"train_loss": -42.819332122802734, "global_step": 336211, "epoch": 2778} {"train_loss": -43.66162109375, "global_step": 336212, "epoch": 2778} {"train_loss": -43.40192413330078, "global_step": 336213, "epoch": 2778} {"train_loss": -43.47043991088867, "global_step": 336214, "epoch": 2778} {"train_loss": -43.1530876159668, "global_step": 336215, "epoch": 2778} {"train_loss": -43.175209045410156, "global_step": 336216, "epoch": 2778} {"train_loss": -43.45705032348633, "global_step": 336217, "epoch": 2778} {"train_loss": -43.554195404052734, "global_step": 336218, "epoch": 2778} {"train_loss": -44.31117630004883, "global_step": 336219, "epoch": 2778} {"train_loss": -43.4676513671875, "global_step": 336220, "epoch": 2778} {"train_loss": -44.14203643798828, "global_step": 336221, "epoch": 2778} {"train_loss": -43.50288391113281, "global_step": 336222, "epoch": 2778} {"train_loss": -44.055885314941406, "global_step": 336223, "epoch": 2778} {"train_loss": -44.01015090942383, "global_step": 336224, "epoch": 2778} {"train_loss": -44.170082092285156, "global_step": 336225, "epoch": 2778} {"train_loss": -44.03364181518555, "global_step": 336226, "epoch": 2778} {"train_loss": -43.928871154785156, "global_step": 336227, "epoch": 2778} {"train_loss": -44.405982971191406, "global_step": 336228, "epoch": 2778} {"train_loss": -44.560935974121094, "global_step": 336229, "epoch": 2778} {"train_loss": -44.46318817138672, "global_step": 336230, "epoch": 2778} {"train_loss": -44.024169921875, "global_step": 336231, "epoch": 2778} {"train_loss": -43.92470932006836, "global_step": 336232, "epoch": 2778} {"train_loss": -44.25077438354492, "global_step": 336233, "epoch": 2778} {"train_loss": -44.316802978515625, "global_step": 336234, "epoch": 2778} {"train_loss": -44.41788864135742, "global_step": 336235, "epoch": 2778} {"train_loss": -44.47564697265625, "global_step": 336236, "epoch": 2778} {"train_loss": -44.47840118408203, "global_step": 336237, "epoch": 2778} {"train_loss": -44.76359176635742, "global_step": 336238, "epoch": 2778} {"train_loss": -45.06721115112305, "global_step": 336239, "epoch": 2778} {"train_loss": -44.69157791137695, "global_step": 336240, "epoch": 2778} {"train_loss": -43.93990707397461, "global_step": 336241, "epoch": 2778} {"train_loss": -44.41996383666992, "global_step": 336242, "epoch": 2778} {"train_loss": -44.734710693359375, "global_step": 336243, "epoch": 2778} {"train_loss": -44.12118911743164, "global_step": 336244, "epoch": 2778} {"train_loss": -44.105491638183594, "global_step": 336245, "epoch": 2778} {"train_loss": -44.1001091003418, "global_step": 336246, "epoch": 2778} {"train_loss": -45.03601837158203, "global_step": 336247, "epoch": 2778} {"train_loss": -44.89359664916992, "global_step": 336248, "epoch": 2778} {"train_loss": -44.55906677246094, "global_step": 336249, "epoch": 2778} {"train_loss": -44.76913070678711, "global_step": 336250, "epoch": 2778} {"train_loss": -44.51798629760742, "global_step": 336251, "epoch": 2778} {"train_loss": -44.608577728271484, "global_step": 336252, "epoch": 2778} {"train_loss": -43.612037658691406, "global_step": 336253, "epoch": 2778} {"train_loss": -44.24699020385742, "global_step": 336254, "epoch": 2778} {"train_loss": -44.62246322631836, "global_step": 336255, "epoch": 2778} {"train_loss": -44.09890365600586, "global_step": 336256, "epoch": 2778} {"train_loss": -44.68091583251953, "global_step": 336257, "epoch": 2778} {"train_loss": -41.70670209837354, "global_step": 336258, "epoch": 2778, "val_loss": 2478123.25} {"train_loss": -44.288063049316406, "global_step": 336259, "epoch": 2779} {"train_loss": -44.595252990722656, "global_step": 336260, "epoch": 2779} {"train_loss": -44.1242561340332, "global_step": 336261, "epoch": 2779} {"train_loss": -44.03583908081055, "global_step": 336262, "epoch": 2779} {"train_loss": -45.18259811401367, "global_step": 336263, "epoch": 2779} {"train_loss": -43.509239196777344, "global_step": 336264, "epoch": 2779} {"train_loss": -43.723751068115234, "global_step": 336265, "epoch": 2779} {"train_loss": -44.304622650146484, "global_step": 336266, "epoch": 2779} {"train_loss": -43.300079345703125, "global_step": 336267, "epoch": 2779} {"train_loss": -43.944366455078125, "global_step": 336268, "epoch": 2779} {"train_loss": -44.1622428894043, "global_step": 336269, "epoch": 2779} {"train_loss": -43.12729263305664, "global_step": 336270, "epoch": 2779} {"train_loss": -44.4551887512207, "global_step": 336271, "epoch": 2779} {"train_loss": -44.39198684692383, "global_step": 336272, "epoch": 2779} {"train_loss": -44.31595993041992, "global_step": 336273, "epoch": 2779} {"train_loss": -43.8211669921875, "global_step": 336274, "epoch": 2779} {"train_loss": -42.94402313232422, "global_step": 336275, "epoch": 2779} {"train_loss": -42.408626556396484, "global_step": 336276, "epoch": 2779} {"train_loss": -44.02805709838867, "global_step": 336277, "epoch": 2779} {"train_loss": -44.141700744628906, "global_step": 336278, "epoch": 2779} {"train_loss": -44.062660217285156, "global_step": 336279, "epoch": 2779} {"train_loss": -41.936641693115234, "global_step": 336280, "epoch": 2779} {"train_loss": -42.570335388183594, "global_step": 336281, "epoch": 2779} {"train_loss": -44.315120697021484, "global_step": 336282, "epoch": 2779} {"train_loss": -43.403011322021484, "global_step": 336283, "epoch": 2779} {"train_loss": -41.86406707763672, "global_step": 336284, "epoch": 2779} {"train_loss": -41.977413177490234, "global_step": 336285, "epoch": 2779} {"train_loss": -41.63527297973633, "global_step": 336286, "epoch": 2779} {"train_loss": -41.241207122802734, "global_step": 336287, "epoch": 2779} {"train_loss": -42.714698791503906, "global_step": 336288, "epoch": 2779} {"train_loss": -41.483238220214844, "global_step": 336289, "epoch": 2779} {"train_loss": -42.77002716064453, "global_step": 336290, "epoch": 2779} {"train_loss": -43.476112365722656, "global_step": 336291, "epoch": 2779} {"train_loss": -44.116092681884766, "global_step": 336292, "epoch": 2779} {"train_loss": -43.433448791503906, "global_step": 336293, "epoch": 2779} {"train_loss": -43.548423767089844, "global_step": 336294, "epoch": 2779} {"train_loss": -42.169429779052734, "global_step": 336295, "epoch": 2779} {"train_loss": -43.15523910522461, "global_step": 336296, "epoch": 2779} {"train_loss": -43.71822738647461, "global_step": 336297, "epoch": 2779} {"train_loss": -42.27278518676758, "global_step": 336298, "epoch": 2779} {"train_loss": -44.01511764526367, "global_step": 336299, "epoch": 2779} {"train_loss": -41.71186065673828, "global_step": 336300, "epoch": 2779} {"train_loss": -41.37281036376953, "global_step": 336301, "epoch": 2779} {"train_loss": -40.80931091308594, "global_step": 336302, "epoch": 2779} {"train_loss": -43.749202728271484, "global_step": 336303, "epoch": 2779} {"train_loss": -42.06574249267578, "global_step": 336304, "epoch": 2779} {"train_loss": -42.12202072143555, "global_step": 336305, "epoch": 2779} {"train_loss": -40.89897155761719, "global_step": 336306, "epoch": 2779} {"train_loss": -42.242244720458984, "global_step": 336307, "epoch": 2779} {"train_loss": -39.932823181152344, "global_step": 336308, "epoch": 2779} {"train_loss": -39.685028076171875, "global_step": 336309, "epoch": 2779} {"train_loss": -41.6203727722168, "global_step": 336310, "epoch": 2779} {"train_loss": -40.42123794555664, "global_step": 336311, "epoch": 2779} {"train_loss": -41.040653228759766, "global_step": 336312, "epoch": 2779} {"train_loss": -42.60185623168945, "global_step": 336313, "epoch": 2779} {"train_loss": -41.88685989379883, "global_step": 336314, "epoch": 2779} {"train_loss": -42.64955520629883, "global_step": 336315, "epoch": 2779} {"train_loss": -41.82936477661133, "global_step": 336316, "epoch": 2779} {"train_loss": -42.099639892578125, "global_step": 336317, "epoch": 2779} {"train_loss": -42.334407806396484, "global_step": 336318, "epoch": 2779} {"train_loss": -41.25071716308594, "global_step": 336319, "epoch": 2779} {"train_loss": -43.36772918701172, "global_step": 336320, "epoch": 2779} {"train_loss": -40.90219497680664, "global_step": 336321, "epoch": 2779} {"train_loss": -43.04887008666992, "global_step": 336322, "epoch": 2779} {"train_loss": -42.32587432861328, "global_step": 336323, "epoch": 2779} {"train_loss": -42.09548568725586, "global_step": 336324, "epoch": 2779} {"train_loss": -43.86772155761719, "global_step": 336325, "epoch": 2779} {"train_loss": -42.4705810546875, "global_step": 336326, "epoch": 2779} {"train_loss": -42.69312286376953, "global_step": 336327, "epoch": 2779} {"train_loss": -43.4891471862793, "global_step": 336328, "epoch": 2779} {"train_loss": -42.516849517822266, "global_step": 336329, "epoch": 2779} {"train_loss": -44.032230377197266, "global_step": 336330, "epoch": 2779} {"train_loss": -43.5598030090332, "global_step": 336331, "epoch": 2779} {"train_loss": -43.611751556396484, "global_step": 336332, "epoch": 2779} {"train_loss": -43.80473327636719, "global_step": 336333, "epoch": 2779} {"train_loss": -43.206233978271484, "global_step": 336334, "epoch": 2779} {"train_loss": -44.39312744140625, "global_step": 336335, "epoch": 2779} {"train_loss": -43.56104278564453, "global_step": 336336, "epoch": 2779} {"train_loss": -43.804805755615234, "global_step": 336337, "epoch": 2779} {"train_loss": -43.96284866333008, "global_step": 336338, "epoch": 2779} {"train_loss": -43.92392349243164, "global_step": 336339, "epoch": 2779} {"train_loss": -43.16694259643555, "global_step": 336340, "epoch": 2779} {"train_loss": -44.63373947143555, "global_step": 336341, "epoch": 2779} {"train_loss": -43.75879669189453, "global_step": 336342, "epoch": 2779} {"train_loss": -43.96088790893555, "global_step": 336343, "epoch": 2779} {"train_loss": -44.1986198425293, "global_step": 336344, "epoch": 2779} {"train_loss": -44.301963806152344, "global_step": 336345, "epoch": 2779} {"train_loss": -43.97344970703125, "global_step": 336346, "epoch": 2779} {"train_loss": -44.08332061767578, "global_step": 336347, "epoch": 2779} {"train_loss": -44.498634338378906, "global_step": 336348, "epoch": 2779} {"train_loss": -44.12991714477539, "global_step": 336349, "epoch": 2779} {"train_loss": -43.840362548828125, "global_step": 336350, "epoch": 2779} {"train_loss": -43.382965087890625, "global_step": 336351, "epoch": 2779} {"train_loss": -44.94085693359375, "global_step": 336352, "epoch": 2779} {"train_loss": -43.89567184448242, "global_step": 336353, "epoch": 2779} {"train_loss": -43.453346252441406, "global_step": 336354, "epoch": 2779} {"train_loss": -43.63396072387695, "global_step": 336355, "epoch": 2779} {"train_loss": -44.229103088378906, "global_step": 336356, "epoch": 2779} {"train_loss": -44.317718505859375, "global_step": 336357, "epoch": 2779} {"train_loss": -44.5954704284668, "global_step": 336358, "epoch": 2779} {"train_loss": -44.81285858154297, "global_step": 336359, "epoch": 2779} {"train_loss": -44.80092239379883, "global_step": 336360, "epoch": 2779} {"train_loss": -44.555999755859375, "global_step": 336361, "epoch": 2779} {"train_loss": -44.99685287475586, "global_step": 336362, "epoch": 2779} {"train_loss": -44.23231506347656, "global_step": 336363, "epoch": 2779} {"train_loss": -43.996273040771484, "global_step": 336364, "epoch": 2779} {"train_loss": -43.26618576049805, "global_step": 336365, "epoch": 2779} {"train_loss": -43.81205368041992, "global_step": 336366, "epoch": 2779} {"train_loss": -44.27546310424805, "global_step": 336367, "epoch": 2779} {"train_loss": -44.12428665161133, "global_step": 336368, "epoch": 2779} {"train_loss": -43.079952239990234, "global_step": 336369, "epoch": 2779} {"train_loss": -42.80989456176758, "global_step": 336370, "epoch": 2779} {"train_loss": -42.99015426635742, "global_step": 336371, "epoch": 2779} {"train_loss": -43.59922790527344, "global_step": 336372, "epoch": 2779} {"train_loss": -44.35997772216797, "global_step": 336373, "epoch": 2779} {"train_loss": -43.4795036315918, "global_step": 336374, "epoch": 2779} {"train_loss": -43.640953063964844, "global_step": 336375, "epoch": 2779} {"train_loss": -44.6312141418457, "global_step": 336376, "epoch": 2779} {"train_loss": -43.74852752685547, "global_step": 336377, "epoch": 2779} {"train_loss": -44.112361907958984, "global_step": 336378, "epoch": 2779} {"train_loss": -43.27756456107147, "global_step": 336379, "epoch": 2779, "val_loss": 2529428.25} {"train_loss": -43.97779846191406, "global_step": 336380, "epoch": 2780} {"train_loss": -44.575382232666016, "global_step": 336381, "epoch": 2780} {"train_loss": -44.63679885864258, "global_step": 336382, "epoch": 2780} {"train_loss": -44.232234954833984, "global_step": 336383, "epoch": 2780} {"train_loss": -43.66721725463867, "global_step": 336384, "epoch": 2780} {"train_loss": -43.99158477783203, "global_step": 336385, "epoch": 2780} {"train_loss": -43.84086990356445, "global_step": 336386, "epoch": 2780} {"train_loss": -43.88460159301758, "global_step": 336387, "epoch": 2780} {"train_loss": -44.433837890625, "global_step": 336388, "epoch": 2780} {"train_loss": -43.15433120727539, "global_step": 336389, "epoch": 2780} {"train_loss": -43.413150787353516, "global_step": 336390, "epoch": 2780} {"train_loss": -43.84499740600586, "global_step": 336391, "epoch": 2780} {"train_loss": -43.9124870300293, "global_step": 336392, "epoch": 2780} {"train_loss": -44.11981201171875, "global_step": 336393, "epoch": 2780} {"train_loss": -44.327186584472656, "global_step": 336394, "epoch": 2780} {"train_loss": -44.01472091674805, "global_step": 336395, "epoch": 2780} {"train_loss": -43.54120635986328, "global_step": 336396, "epoch": 2780} {"train_loss": -43.8216552734375, "global_step": 336397, "epoch": 2780} {"train_loss": -44.565608978271484, "global_step": 336398, "epoch": 2780} {"train_loss": -44.39661407470703, "global_step": 336399, "epoch": 2780} {"train_loss": -44.26247024536133, "global_step": 336400, "epoch": 2780} {"train_loss": -44.589263916015625, "global_step": 336401, "epoch": 2780} {"train_loss": -44.13271713256836, "global_step": 336402, "epoch": 2780} {"train_loss": -44.3747673034668, "global_step": 336403, "epoch": 2780} {"train_loss": -44.438087463378906, "global_step": 336404, "epoch": 2780} {"train_loss": -43.993934631347656, "global_step": 336405, "epoch": 2780} {"train_loss": -44.484771728515625, "global_step": 336406, "epoch": 2780} {"train_loss": -44.67560577392578, "global_step": 336407, "epoch": 2780} {"train_loss": -44.51524353027344, "global_step": 336408, "epoch": 2780} {"train_loss": -44.63044357299805, "global_step": 336409, "epoch": 2780} {"train_loss": -43.493736267089844, "global_step": 336410, "epoch": 2780} {"train_loss": -44.054412841796875, "global_step": 336411, "epoch": 2780} {"train_loss": -44.38677978515625, "global_step": 336412, "epoch": 2780} {"train_loss": -43.463497161865234, "global_step": 336413, "epoch": 2780} {"train_loss": -43.37651443481445, "global_step": 336414, "epoch": 2780} {"train_loss": -43.20967483520508, "global_step": 336415, "epoch": 2780} {"train_loss": -43.47651672363281, "global_step": 336416, "epoch": 2780} {"train_loss": -43.48383712768555, "global_step": 336417, "epoch": 2780} {"train_loss": -42.3302001953125, "global_step": 336418, "epoch": 2780} {"train_loss": -41.77732849121094, "global_step": 336419, "epoch": 2780} {"train_loss": -43.03827667236328, "global_step": 336420, "epoch": 2780} {"train_loss": -43.19214630126953, "global_step": 336421, "epoch": 2780} {"train_loss": -42.9843635559082, "global_step": 336422, "epoch": 2780} {"train_loss": -43.1807861328125, "global_step": 336423, "epoch": 2780} {"train_loss": -43.130977630615234, "global_step": 336424, "epoch": 2780} {"train_loss": -43.2900390625, "global_step": 336425, "epoch": 2780} {"train_loss": -42.39747619628906, "global_step": 336426, "epoch": 2780} {"train_loss": -43.4182014465332, "global_step": 336427, "epoch": 2780} {"train_loss": -43.46772384643555, "global_step": 336428, "epoch": 2780} {"train_loss": -42.88153839111328, "global_step": 336429, "epoch": 2780} {"train_loss": -44.54726028442383, "global_step": 336430, "epoch": 2780} {"train_loss": -42.63236618041992, "global_step": 336431, "epoch": 2780} {"train_loss": -43.138187408447266, "global_step": 336432, "epoch": 2780} {"train_loss": -43.638301849365234, "global_step": 336433, "epoch": 2780} {"train_loss": -43.33094787597656, "global_step": 336434, "epoch": 2780} {"train_loss": -43.45241928100586, "global_step": 336435, "epoch": 2780} {"train_loss": -43.00496292114258, "global_step": 336436, "epoch": 2780} {"train_loss": -42.583194732666016, "global_step": 336437, "epoch": 2780} {"train_loss": -44.251983642578125, "global_step": 336438, "epoch": 2780} {"train_loss": -42.53924560546875, "global_step": 336439, "epoch": 2780} {"train_loss": -43.77274703979492, "global_step": 336440, "epoch": 2780} {"train_loss": -44.12128448486328, "global_step": 336441, "epoch": 2780} {"train_loss": -43.56342315673828, "global_step": 336442, "epoch": 2780} {"train_loss": -44.469970703125, "global_step": 336443, "epoch": 2780} {"train_loss": -43.348060607910156, "global_step": 336444, "epoch": 2780} {"train_loss": -43.68891143798828, "global_step": 336445, "epoch": 2780} {"train_loss": -44.06229782104492, "global_step": 336446, "epoch": 2780} {"train_loss": -43.57389450073242, "global_step": 336447, "epoch": 2780} {"train_loss": -44.28434753417969, "global_step": 336448, "epoch": 2780} {"train_loss": -43.61793899536133, "global_step": 336449, "epoch": 2780} {"train_loss": -42.91376876831055, "global_step": 336450, "epoch": 2780} {"train_loss": -44.19475173950195, "global_step": 336451, "epoch": 2780} {"train_loss": -44.1451301574707, "global_step": 336452, "epoch": 2780} {"train_loss": -43.483272552490234, "global_step": 336453, "epoch": 2780} {"train_loss": -43.730140686035156, "global_step": 336454, "epoch": 2780} {"train_loss": -43.170562744140625, "global_step": 336455, "epoch": 2780} {"train_loss": -44.17769241333008, "global_step": 336456, "epoch": 2780} {"train_loss": -43.5908317565918, "global_step": 336457, "epoch": 2780} {"train_loss": -43.72352600097656, "global_step": 336458, "epoch": 2780} {"train_loss": -43.6900634765625, "global_step": 336459, "epoch": 2780} {"train_loss": -44.13972091674805, "global_step": 336460, "epoch": 2780} {"train_loss": -44.29909133911133, "global_step": 336461, "epoch": 2780} {"train_loss": -43.898292541503906, "global_step": 336462, "epoch": 2780} {"train_loss": -43.20586395263672, "global_step": 336463, "epoch": 2780} {"train_loss": -43.88716125488281, "global_step": 336464, "epoch": 2780} {"train_loss": -44.206661224365234, "global_step": 336465, "epoch": 2780} {"train_loss": -44.457942962646484, "global_step": 336466, "epoch": 2780} {"train_loss": -44.359493255615234, "global_step": 336467, "epoch": 2780} {"train_loss": -43.93352127075195, "global_step": 336468, "epoch": 2780} {"train_loss": -44.333396911621094, "global_step": 336469, "epoch": 2780} {"train_loss": -44.021568298339844, "global_step": 336470, "epoch": 2780} {"train_loss": -44.26118087768555, "global_step": 336471, "epoch": 2780} {"train_loss": -44.679691314697266, "global_step": 336472, "epoch": 2780} {"train_loss": -44.8975715637207, "global_step": 336473, "epoch": 2780} {"train_loss": -43.84062957763672, "global_step": 336474, "epoch": 2780} {"train_loss": -44.579036712646484, "global_step": 336475, "epoch": 2780} {"train_loss": -44.354312896728516, "global_step": 336476, "epoch": 2780} {"train_loss": -44.955074310302734, "global_step": 336477, "epoch": 2780} {"train_loss": -44.56317901611328, "global_step": 336478, "epoch": 2780} {"train_loss": -43.69428634643555, "global_step": 336479, "epoch": 2780} {"train_loss": -43.78947067260742, "global_step": 336480, "epoch": 2780} {"train_loss": -43.99164962768555, "global_step": 336481, "epoch": 2780} {"train_loss": -41.894649505615234, "global_step": 336482, "epoch": 2780} {"train_loss": -43.32854080200195, "global_step": 336483, "epoch": 2780} {"train_loss": -43.67110824584961, "global_step": 336484, "epoch": 2780} {"train_loss": -44.30048370361328, "global_step": 336485, "epoch": 2780} {"train_loss": -43.92757034301758, "global_step": 336486, "epoch": 2780} {"train_loss": -44.19379806518555, "global_step": 336487, "epoch": 2780} {"train_loss": -43.45033264160156, "global_step": 336488, "epoch": 2780} {"train_loss": -43.14951705932617, "global_step": 336489, "epoch": 2780} {"train_loss": -44.29623031616211, "global_step": 336490, "epoch": 2780} {"train_loss": -44.130889892578125, "global_step": 336491, "epoch": 2780} {"train_loss": -43.070518493652344, "global_step": 336492, "epoch": 2780} {"train_loss": -43.8957633972168, "global_step": 336493, "epoch": 2780} {"train_loss": -44.56059646606445, "global_step": 336494, "epoch": 2780} {"train_loss": -43.53691482543945, "global_step": 336495, "epoch": 2780} {"train_loss": -43.51790237426758, "global_step": 336496, "epoch": 2780} {"train_loss": -44.61670684814453, "global_step": 336497, "epoch": 2780} {"train_loss": -44.09640121459961, "global_step": 336498, "epoch": 2780} {"train_loss": -42.7851676940918, "global_step": 336499, "epoch": 2780} {"train_loss": -43.80808699426572, "global_step": 336500, "epoch": 2780, "val_loss": 2752347.25} {"train_loss": -44.447940826416016, "global_step": 336501, "epoch": 2781} {"train_loss": -44.4208984375, "global_step": 336502, "epoch": 2781} {"train_loss": -44.976417541503906, "global_step": 336503, "epoch": 2781} {"train_loss": -43.961891174316406, "global_step": 336504, "epoch": 2781} {"train_loss": -43.804962158203125, "global_step": 336505, "epoch": 2781} {"train_loss": -44.99876022338867, "global_step": 336506, "epoch": 2781} {"train_loss": -44.15253829956055, "global_step": 336507, "epoch": 2781} {"train_loss": -41.991493225097656, "global_step": 336508, "epoch": 2781} {"train_loss": -42.93739700317383, "global_step": 336509, "epoch": 2781} {"train_loss": -39.10049057006836, "global_step": 336510, "epoch": 2781} {"train_loss": -40.2276496887207, "global_step": 336511, "epoch": 2781} {"train_loss": -39.80216979980469, "global_step": 336512, "epoch": 2781} {"train_loss": -39.89358901977539, "global_step": 336513, "epoch": 2781} {"train_loss": -39.24080276489258, "global_step": 336514, "epoch": 2781} {"train_loss": -40.13081741333008, "global_step": 336515, "epoch": 2781} {"train_loss": -39.748592376708984, "global_step": 336516, "epoch": 2781} {"train_loss": -39.91801452636719, "global_step": 336517, "epoch": 2781} {"train_loss": -39.62259292602539, "global_step": 336518, "epoch": 2781} {"train_loss": -40.488216400146484, "global_step": 336519, "epoch": 2781} {"train_loss": -39.966487884521484, "global_step": 336520, "epoch": 2781} {"train_loss": -40.43442153930664, "global_step": 336521, "epoch": 2781} {"train_loss": -35.1116943359375, "global_step": 336522, "epoch": 2781} {"train_loss": -40.65385055541992, "global_step": 336523, "epoch": 2781} {"train_loss": -40.71238327026367, "global_step": 336524, "epoch": 2781} {"train_loss": -40.59172439575195, "global_step": 336525, "epoch": 2781} {"train_loss": -38.4196891784668, "global_step": 336526, "epoch": 2781} {"train_loss": -36.07441329956055, "global_step": 336527, "epoch": 2781} {"train_loss": -38.135440826416016, "global_step": 336528, "epoch": 2781} {"train_loss": -30.941843032836914, "global_step": 336529, "epoch": 2781} {"train_loss": -39.89432907104492, "global_step": 336530, "epoch": 2781} {"train_loss": -40.150081634521484, "global_step": 336531, "epoch": 2781} {"train_loss": -39.621551513671875, "global_step": 336532, "epoch": 2781} {"train_loss": -38.335079193115234, "global_step": 336533, "epoch": 2781} {"train_loss": -40.19255447387695, "global_step": 336534, "epoch": 2781} {"train_loss": -39.942623138427734, "global_step": 336535, "epoch": 2781} {"train_loss": -40.39970397949219, "global_step": 336536, "epoch": 2781} {"train_loss": -40.41902160644531, "global_step": 336537, "epoch": 2781} {"train_loss": -36.89674758911133, "global_step": 336538, "epoch": 2781} {"train_loss": -40.08317947387695, "global_step": 336539, "epoch": 2781} {"train_loss": -37.60128402709961, "global_step": 336540, "epoch": 2781} {"train_loss": -40.6488151550293, "global_step": 336541, "epoch": 2781} {"train_loss": -40.324974060058594, "global_step": 336542, "epoch": 2781} {"train_loss": -40.38347244262695, "global_step": 336543, "epoch": 2781} {"train_loss": -36.66299057006836, "global_step": 336544, "epoch": 2781} {"train_loss": -40.989097595214844, "global_step": 336545, "epoch": 2781} {"train_loss": -38.42626953125, "global_step": 336546, "epoch": 2781} {"train_loss": -41.22998046875, "global_step": 336547, "epoch": 2781} {"train_loss": -38.95976257324219, "global_step": 336548, "epoch": 2781} {"train_loss": -40.032588958740234, "global_step": 336549, "epoch": 2781} {"train_loss": -36.738861083984375, "global_step": 336550, "epoch": 2781} {"train_loss": -41.10386276245117, "global_step": 336551, "epoch": 2781} {"train_loss": -42.086421966552734, "global_step": 336552, "epoch": 2781} {"train_loss": -39.4495964050293, "global_step": 336553, "epoch": 2781} {"train_loss": -38.94169616699219, "global_step": 336554, "epoch": 2781} {"train_loss": -42.91555404663086, "global_step": 336555, "epoch": 2781} {"train_loss": -39.852413177490234, "global_step": 336556, "epoch": 2781} {"train_loss": -43.1630859375, "global_step": 336557, "epoch": 2781} {"train_loss": -42.69169235229492, "global_step": 336558, "epoch": 2781} {"train_loss": -42.20548629760742, "global_step": 336559, "epoch": 2781} {"train_loss": -41.36579132080078, "global_step": 336560, "epoch": 2781} {"train_loss": -43.028743743896484, "global_step": 336561, "epoch": 2781} {"train_loss": -43.105525970458984, "global_step": 336562, "epoch": 2781} {"train_loss": -41.84818649291992, "global_step": 336563, "epoch": 2781} {"train_loss": -40.75181579589844, "global_step": 336564, "epoch": 2781} {"train_loss": -42.49871826171875, "global_step": 336565, "epoch": 2781} {"train_loss": -42.64997100830078, "global_step": 336566, "epoch": 2781} {"train_loss": -42.96207809448242, "global_step": 336567, "epoch": 2781} {"train_loss": -41.328956604003906, "global_step": 336568, "epoch": 2781} {"train_loss": -40.28891372680664, "global_step": 336569, "epoch": 2781} {"train_loss": -39.47487258911133, "global_step": 336570, "epoch": 2781} {"train_loss": -43.52241134643555, "global_step": 336571, "epoch": 2781} {"train_loss": -41.67384719848633, "global_step": 336572, "epoch": 2781} {"train_loss": -43.573143005371094, "global_step": 336573, "epoch": 2781} {"train_loss": -43.13261032104492, "global_step": 336574, "epoch": 2781} {"train_loss": -43.2042236328125, "global_step": 336575, "epoch": 2781} {"train_loss": -42.5146598815918, "global_step": 336576, "epoch": 2781} {"train_loss": -42.68768310546875, "global_step": 336577, "epoch": 2781} {"train_loss": -43.725685119628906, "global_step": 336578, "epoch": 2781} {"train_loss": -43.58259963989258, "global_step": 336579, "epoch": 2781} {"train_loss": -42.045040130615234, "global_step": 336580, "epoch": 2781} {"train_loss": -44.05063247680664, "global_step": 336581, "epoch": 2781} {"train_loss": -39.841312408447266, "global_step": 336582, "epoch": 2781} {"train_loss": -43.59745407104492, "global_step": 336583, "epoch": 2781} {"train_loss": -42.925445556640625, "global_step": 336584, "epoch": 2781} {"train_loss": -40.71133804321289, "global_step": 336585, "epoch": 2781} {"train_loss": -43.72215270996094, "global_step": 336586, "epoch": 2781} {"train_loss": -42.024051666259766, "global_step": 336587, "epoch": 2781} {"train_loss": -43.655826568603516, "global_step": 336588, "epoch": 2781} {"train_loss": -43.17151641845703, "global_step": 336589, "epoch": 2781} {"train_loss": -42.76814651489258, "global_step": 336590, "epoch": 2781} {"train_loss": -42.863582611083984, "global_step": 336591, "epoch": 2781} {"train_loss": -43.6211051940918, "global_step": 336592, "epoch": 2781} {"train_loss": -42.65975570678711, "global_step": 336593, "epoch": 2781} {"train_loss": -44.27047348022461, "global_step": 336594, "epoch": 2781} {"train_loss": -42.887569427490234, "global_step": 336595, "epoch": 2781} {"train_loss": -43.56121063232422, "global_step": 336596, "epoch": 2781} {"train_loss": -43.00956344604492, "global_step": 336597, "epoch": 2781} {"train_loss": -43.8337287902832, "global_step": 336598, "epoch": 2781} {"train_loss": -43.28554153442383, "global_step": 336599, "epoch": 2781} {"train_loss": -44.22697448730469, "global_step": 336600, "epoch": 2781} {"train_loss": -41.593414306640625, "global_step": 336601, "epoch": 2781} {"train_loss": -43.41120529174805, "global_step": 336602, "epoch": 2781} {"train_loss": -43.4740104675293, "global_step": 336603, "epoch": 2781} {"train_loss": -44.224674224853516, "global_step": 336604, "epoch": 2781} {"train_loss": -43.30845260620117, "global_step": 336605, "epoch": 2781} {"train_loss": -43.494014739990234, "global_step": 336606, "epoch": 2781} {"train_loss": -43.360538482666016, "global_step": 336607, "epoch": 2781} {"train_loss": -43.31931686401367, "global_step": 336608, "epoch": 2781} {"train_loss": -43.422847747802734, "global_step": 336609, "epoch": 2781} {"train_loss": -43.437747955322266, "global_step": 336610, "epoch": 2781} {"train_loss": -43.277870178222656, "global_step": 336611, "epoch": 2781} {"train_loss": -43.89113998413086, "global_step": 336612, "epoch": 2781} {"train_loss": -43.68111038208008, "global_step": 336613, "epoch": 2781} {"train_loss": -42.67488479614258, "global_step": 336614, "epoch": 2781} {"train_loss": -42.98550033569336, "global_step": 336615, "epoch": 2781} {"train_loss": -44.2198600769043, "global_step": 336616, "epoch": 2781} {"train_loss": -43.65153503417969, "global_step": 336617, "epoch": 2781} {"train_loss": -42.62248611450195, "global_step": 336618, "epoch": 2781} {"train_loss": -44.14650344848633, "global_step": 336619, "epoch": 2781} {"train_loss": -43.49290084838867, "global_step": 336620, "epoch": 2781} {"train_loss": -41.6179758339874, "global_step": 336621, "epoch": 2781, "val_loss": 2575575.0} {"train_loss": -43.470314025878906, "global_step": 336622, "epoch": 2782} {"train_loss": -43.98267364501953, "global_step": 336623, "epoch": 2782} {"train_loss": -44.7722053527832, "global_step": 336624, "epoch": 2782} {"train_loss": -43.8360710144043, "global_step": 336625, "epoch": 2782} {"train_loss": -44.0744743347168, "global_step": 336626, "epoch": 2782} {"train_loss": -43.165740966796875, "global_step": 336627, "epoch": 2782} {"train_loss": -43.446144104003906, "global_step": 336628, "epoch": 2782} {"train_loss": -43.69515609741211, "global_step": 336629, "epoch": 2782} {"train_loss": -43.6522216796875, "global_step": 336630, "epoch": 2782} {"train_loss": -44.54384231567383, "global_step": 336631, "epoch": 2782} {"train_loss": -43.3929443359375, "global_step": 336632, "epoch": 2782} {"train_loss": -43.56624221801758, "global_step": 336633, "epoch": 2782} {"train_loss": -41.63405227661133, "global_step": 336634, "epoch": 2782} {"train_loss": -43.51993942260742, "global_step": 336635, "epoch": 2782} {"train_loss": -43.83191680908203, "global_step": 336636, "epoch": 2782} {"train_loss": -42.33372116088867, "global_step": 336637, "epoch": 2782} {"train_loss": -44.144893646240234, "global_step": 336638, "epoch": 2782} {"train_loss": -43.250484466552734, "global_step": 336639, "epoch": 2782} {"train_loss": -43.89888000488281, "global_step": 336640, "epoch": 2782} {"train_loss": -44.08367919921875, "global_step": 336641, "epoch": 2782} {"train_loss": -43.311885833740234, "global_step": 336642, "epoch": 2782} {"train_loss": -41.6553955078125, "global_step": 336643, "epoch": 2782} {"train_loss": -43.54891586303711, "global_step": 336644, "epoch": 2782} {"train_loss": -41.602298736572266, "global_step": 336645, "epoch": 2782} {"train_loss": -43.271018981933594, "global_step": 336646, "epoch": 2782} {"train_loss": -43.8670539855957, "global_step": 336647, "epoch": 2782} {"train_loss": -41.39914321899414, "global_step": 336648, "epoch": 2782} {"train_loss": -40.97213363647461, "global_step": 336649, "epoch": 2782} {"train_loss": -42.29848861694336, "global_step": 336650, "epoch": 2782} {"train_loss": -41.591148376464844, "global_step": 336651, "epoch": 2782} {"train_loss": -41.73790740966797, "global_step": 336652, "epoch": 2782} {"train_loss": -41.994140625, "global_step": 336653, "epoch": 2782} {"train_loss": -42.36692810058594, "global_step": 336654, "epoch": 2782} {"train_loss": -41.202476501464844, "global_step": 336655, "epoch": 2782} {"train_loss": -43.4296989440918, "global_step": 336656, "epoch": 2782} {"train_loss": -41.97684860229492, "global_step": 336657, "epoch": 2782} {"train_loss": -44.097991943359375, "global_step": 336658, "epoch": 2782} {"train_loss": -40.7535514831543, "global_step": 336659, "epoch": 2782} {"train_loss": -41.01729202270508, "global_step": 336660, "epoch": 2782} {"train_loss": -40.9654655456543, "global_step": 336661, "epoch": 2782} {"train_loss": -41.71099090576172, "global_step": 336662, "epoch": 2782} {"train_loss": -43.319610595703125, "global_step": 336663, "epoch": 2782} {"train_loss": -40.95375442504883, "global_step": 336664, "epoch": 2782} {"train_loss": -43.297115325927734, "global_step": 336665, "epoch": 2782} {"train_loss": -42.064571380615234, "global_step": 336666, "epoch": 2782} {"train_loss": -43.137481689453125, "global_step": 336667, "epoch": 2782} {"train_loss": -42.19575119018555, "global_step": 336668, "epoch": 2782} {"train_loss": -42.08112716674805, "global_step": 336669, "epoch": 2782} {"train_loss": -43.043331146240234, "global_step": 336670, "epoch": 2782} {"train_loss": -43.692176818847656, "global_step": 336671, "epoch": 2782} {"train_loss": -42.27458572387695, "global_step": 336672, "epoch": 2782} {"train_loss": -43.181121826171875, "global_step": 336673, "epoch": 2782} {"train_loss": -42.95219039916992, "global_step": 336674, "epoch": 2782} {"train_loss": -42.80670166015625, "global_step": 336675, "epoch": 2782} {"train_loss": -42.8497200012207, "global_step": 336676, "epoch": 2782} {"train_loss": -43.43712615966797, "global_step": 336677, "epoch": 2782} {"train_loss": -42.84689712524414, "global_step": 336678, "epoch": 2782} {"train_loss": -42.97481155395508, "global_step": 336679, "epoch": 2782} {"train_loss": -43.369930267333984, "global_step": 336680, "epoch": 2782} {"train_loss": -43.74805450439453, "global_step": 336681, "epoch": 2782} {"train_loss": -44.29842758178711, "global_step": 336682, "epoch": 2782} {"train_loss": -43.787105560302734, "global_step": 336683, "epoch": 2782} {"train_loss": -43.78719711303711, "global_step": 336684, "epoch": 2782} {"train_loss": -44.596004486083984, "global_step": 336685, "epoch": 2782} {"train_loss": -43.911354064941406, "global_step": 336686, "epoch": 2782} {"train_loss": -44.13384246826172, "global_step": 336687, "epoch": 2782} {"train_loss": -44.17433547973633, "global_step": 336688, "epoch": 2782} {"train_loss": -43.584529876708984, "global_step": 336689, "epoch": 2782} {"train_loss": -44.24111557006836, "global_step": 336690, "epoch": 2782} {"train_loss": -43.8294792175293, "global_step": 336691, "epoch": 2782} {"train_loss": -44.12385940551758, "global_step": 336692, "epoch": 2782} {"train_loss": -43.663211822509766, "global_step": 336693, "epoch": 2782} {"train_loss": -43.90894317626953, "global_step": 336694, "epoch": 2782} {"train_loss": -43.81163024902344, "global_step": 336695, "epoch": 2782} {"train_loss": -42.92485809326172, "global_step": 336696, "epoch": 2782} {"train_loss": -44.47184371948242, "global_step": 336697, "epoch": 2782} {"train_loss": -43.945037841796875, "global_step": 336698, "epoch": 2782} {"train_loss": -43.2867546081543, "global_step": 336699, "epoch": 2782} {"train_loss": -44.3504638671875, "global_step": 336700, "epoch": 2782} {"train_loss": -43.23860168457031, "global_step": 336701, "epoch": 2782} {"train_loss": -43.017879486083984, "global_step": 336702, "epoch": 2782} {"train_loss": -44.225154876708984, "global_step": 336703, "epoch": 2782} {"train_loss": -43.0400390625, "global_step": 336704, "epoch": 2782} {"train_loss": -44.47638702392578, "global_step": 336705, "epoch": 2782} {"train_loss": -43.9779052734375, "global_step": 336706, "epoch": 2782} {"train_loss": -43.91257858276367, "global_step": 336707, "epoch": 2782} {"train_loss": -44.173095703125, "global_step": 336708, "epoch": 2782} {"train_loss": -44.24625015258789, "global_step": 336709, "epoch": 2782} {"train_loss": -44.63640213012695, "global_step": 336710, "epoch": 2782} {"train_loss": -43.239742279052734, "global_step": 336711, "epoch": 2782} {"train_loss": -43.96567153930664, "global_step": 336712, "epoch": 2782} {"train_loss": -44.592708587646484, "global_step": 336713, "epoch": 2782} {"train_loss": -44.00827407836914, "global_step": 336714, "epoch": 2782} {"train_loss": -44.04652786254883, "global_step": 336715, "epoch": 2782} {"train_loss": -42.044090270996094, "global_step": 336716, "epoch": 2782} {"train_loss": -43.320831298828125, "global_step": 336717, "epoch": 2782} {"train_loss": -42.66902160644531, "global_step": 336718, "epoch": 2782} {"train_loss": -43.87379837036133, "global_step": 336719, "epoch": 2782} {"train_loss": -44.31711959838867, "global_step": 336720, "epoch": 2782} {"train_loss": -44.294368743896484, "global_step": 336721, "epoch": 2782} {"train_loss": -44.308502197265625, "global_step": 336722, "epoch": 2782} {"train_loss": -43.69314193725586, "global_step": 336723, "epoch": 2782} {"train_loss": -44.75392150878906, "global_step": 336724, "epoch": 2782} {"train_loss": -43.15726852416992, "global_step": 336725, "epoch": 2782} {"train_loss": -43.45206069946289, "global_step": 336726, "epoch": 2782} {"train_loss": -43.4008674621582, "global_step": 336727, "epoch": 2782} {"train_loss": -43.51216506958008, "global_step": 336728, "epoch": 2782} {"train_loss": -43.49442672729492, "global_step": 336729, "epoch": 2782} {"train_loss": -42.286041259765625, "global_step": 336730, "epoch": 2782} {"train_loss": -42.49092483520508, "global_step": 336731, "epoch": 2782} {"train_loss": -43.63352584838867, "global_step": 336732, "epoch": 2782} {"train_loss": -43.71635818481445, "global_step": 336733, "epoch": 2782} {"train_loss": -43.1407470703125, "global_step": 336734, "epoch": 2782} {"train_loss": -43.959205627441406, "global_step": 336735, "epoch": 2782} {"train_loss": -42.556270599365234, "global_step": 336736, "epoch": 2782} {"train_loss": -43.29108810424805, "global_step": 336737, "epoch": 2782} {"train_loss": -43.46712875366211, "global_step": 336738, "epoch": 2782} {"train_loss": -43.51557159423828, "global_step": 336739, "epoch": 2782} {"train_loss": -43.34203338623047, "global_step": 336740, "epoch": 2782} {"train_loss": -44.088863372802734, "global_step": 336741, "epoch": 2782} {"train_loss": -43.28604835321095, "global_step": 336742, "epoch": 2782, "val_loss": 2603554.25} {"train_loss": -43.748008728027344, "global_step": 336743, "epoch": 2783} {"train_loss": -44.193355560302734, "global_step": 336744, "epoch": 2783} {"train_loss": -43.040279388427734, "global_step": 336745, "epoch": 2783} {"train_loss": -44.00021743774414, "global_step": 336746, "epoch": 2783} {"train_loss": -44.7555046081543, "global_step": 336747, "epoch": 2783} {"train_loss": -43.183467864990234, "global_step": 336748, "epoch": 2783} {"train_loss": -44.180721282958984, "global_step": 336749, "epoch": 2783} {"train_loss": -43.62649154663086, "global_step": 336750, "epoch": 2783} {"train_loss": -42.51265335083008, "global_step": 336751, "epoch": 2783} {"train_loss": -44.4184684753418, "global_step": 336752, "epoch": 2783} {"train_loss": -43.621456146240234, "global_step": 336753, "epoch": 2783} {"train_loss": -44.61961364746094, "global_step": 336754, "epoch": 2783} {"train_loss": -41.85573959350586, "global_step": 336755, "epoch": 2783} {"train_loss": -42.28125, "global_step": 336756, "epoch": 2783} {"train_loss": -41.55386734008789, "global_step": 336757, "epoch": 2783} {"train_loss": -44.007930755615234, "global_step": 336758, "epoch": 2783} {"train_loss": -44.31651306152344, "global_step": 336759, "epoch": 2783} {"train_loss": -42.33197784423828, "global_step": 336760, "epoch": 2783} {"train_loss": -42.221553802490234, "global_step": 336761, "epoch": 2783} {"train_loss": -42.992916107177734, "global_step": 336762, "epoch": 2783} {"train_loss": -44.18020248413086, "global_step": 336763, "epoch": 2783} {"train_loss": -43.342750549316406, "global_step": 336764, "epoch": 2783} {"train_loss": -44.341644287109375, "global_step": 336765, "epoch": 2783} {"train_loss": -42.93341827392578, "global_step": 336766, "epoch": 2783} {"train_loss": -43.5914192199707, "global_step": 336767, "epoch": 2783} {"train_loss": -43.906497955322266, "global_step": 336768, "epoch": 2783} {"train_loss": -42.4909782409668, "global_step": 336769, "epoch": 2783} {"train_loss": -38.357177734375, "global_step": 336770, "epoch": 2783} {"train_loss": -44.1510124206543, "global_step": 336771, "epoch": 2783} {"train_loss": -43.61500930786133, "global_step": 336772, "epoch": 2783} {"train_loss": -44.11601638793945, "global_step": 336773, "epoch": 2783} {"train_loss": -43.85853958129883, "global_step": 336774, "epoch": 2783} {"train_loss": -42.43099594116211, "global_step": 336775, "epoch": 2783} {"train_loss": -43.2931022644043, "global_step": 336776, "epoch": 2783} {"train_loss": -43.63624572753906, "global_step": 336777, "epoch": 2783} {"train_loss": -43.798946380615234, "global_step": 336778, "epoch": 2783} {"train_loss": -44.135433197021484, "global_step": 336779, "epoch": 2783} {"train_loss": -39.77950668334961, "global_step": 336780, "epoch": 2783} {"train_loss": -44.38916015625, "global_step": 336781, "epoch": 2783} {"train_loss": -44.10335159301758, "global_step": 336782, "epoch": 2783} {"train_loss": -42.411476135253906, "global_step": 336783, "epoch": 2783} {"train_loss": -41.22806930541992, "global_step": 336784, "epoch": 2783} {"train_loss": -44.0909309387207, "global_step": 336785, "epoch": 2783} {"train_loss": -44.83168029785156, "global_step": 336786, "epoch": 2783} {"train_loss": -43.59369659423828, "global_step": 336787, "epoch": 2783} {"train_loss": -41.981483459472656, "global_step": 336788, "epoch": 2783} {"train_loss": -42.59397506713867, "global_step": 336789, "epoch": 2783} {"train_loss": -43.47416305541992, "global_step": 336790, "epoch": 2783} {"train_loss": -42.20945358276367, "global_step": 336791, "epoch": 2783} {"train_loss": -43.02783966064453, "global_step": 336792, "epoch": 2783} {"train_loss": -41.58294677734375, "global_step": 336793, "epoch": 2783} {"train_loss": -41.6505241394043, "global_step": 336794, "epoch": 2783} {"train_loss": -43.07070541381836, "global_step": 336795, "epoch": 2783} {"train_loss": -41.096675872802734, "global_step": 336796, "epoch": 2783} {"train_loss": -39.2702751159668, "global_step": 336797, "epoch": 2783} {"train_loss": -41.92596435546875, "global_step": 336798, "epoch": 2783} {"train_loss": -42.926692962646484, "global_step": 336799, "epoch": 2783} {"train_loss": -39.2313346862793, "global_step": 336800, "epoch": 2783} {"train_loss": -40.30863571166992, "global_step": 336801, "epoch": 2783} {"train_loss": -42.9768180847168, "global_step": 336802, "epoch": 2783} {"train_loss": -41.10432052612305, "global_step": 336803, "epoch": 2783} {"train_loss": -42.38005447387695, "global_step": 336804, "epoch": 2783} {"train_loss": -41.87441635131836, "global_step": 336805, "epoch": 2783} {"train_loss": -42.43727111816406, "global_step": 336806, "epoch": 2783} {"train_loss": -41.64840316772461, "global_step": 336807, "epoch": 2783} {"train_loss": -41.7193717956543, "global_step": 336808, "epoch": 2783} {"train_loss": -41.97772216796875, "global_step": 336809, "epoch": 2783} {"train_loss": -40.380252838134766, "global_step": 336810, "epoch": 2783} {"train_loss": -41.887874603271484, "global_step": 336811, "epoch": 2783} {"train_loss": -40.982032775878906, "global_step": 336812, "epoch": 2783} {"train_loss": -42.35197067260742, "global_step": 336813, "epoch": 2783} {"train_loss": -42.37333297729492, "global_step": 336814, "epoch": 2783} {"train_loss": -42.103431701660156, "global_step": 336815, "epoch": 2783} {"train_loss": -41.701114654541016, "global_step": 336816, "epoch": 2783} {"train_loss": -43.70991897583008, "global_step": 336817, "epoch": 2783} {"train_loss": -43.021114349365234, "global_step": 336818, "epoch": 2783} {"train_loss": -43.53544998168945, "global_step": 336819, "epoch": 2783} {"train_loss": -41.34626007080078, "global_step": 336820, "epoch": 2783} {"train_loss": -42.199459075927734, "global_step": 336821, "epoch": 2783} {"train_loss": -43.350860595703125, "global_step": 336822, "epoch": 2783} {"train_loss": -42.82324981689453, "global_step": 336823, "epoch": 2783} {"train_loss": -43.71802520751953, "global_step": 336824, "epoch": 2783} {"train_loss": -42.576045989990234, "global_step": 336825, "epoch": 2783} {"train_loss": -43.661712646484375, "global_step": 336826, "epoch": 2783} {"train_loss": -42.34113311767578, "global_step": 336827, "epoch": 2783} {"train_loss": -43.47164535522461, "global_step": 336828, "epoch": 2783} {"train_loss": -43.55659866333008, "global_step": 336829, "epoch": 2783} {"train_loss": -42.259742736816406, "global_step": 336830, "epoch": 2783} {"train_loss": -43.4452018737793, "global_step": 336831, "epoch": 2783} {"train_loss": -43.74753952026367, "global_step": 336832, "epoch": 2783} {"train_loss": -43.049713134765625, "global_step": 336833, "epoch": 2783} {"train_loss": -42.72819519042969, "global_step": 336834, "epoch": 2783} {"train_loss": -44.40829086303711, "global_step": 336835, "epoch": 2783} {"train_loss": -43.714988708496094, "global_step": 336836, "epoch": 2783} {"train_loss": -43.39179229736328, "global_step": 336837, "epoch": 2783} {"train_loss": -44.30835723876953, "global_step": 336838, "epoch": 2783} {"train_loss": -44.24401092529297, "global_step": 336839, "epoch": 2783} {"train_loss": -43.948238372802734, "global_step": 336840, "epoch": 2783} {"train_loss": -44.191566467285156, "global_step": 336841, "epoch": 2783} {"train_loss": -44.108787536621094, "global_step": 336842, "epoch": 2783} {"train_loss": -44.56964874267578, "global_step": 336843, "epoch": 2783} {"train_loss": -44.4461669921875, "global_step": 336844, "epoch": 2783} {"train_loss": -43.80880355834961, "global_step": 336845, "epoch": 2783} {"train_loss": -44.517208099365234, "global_step": 336846, "epoch": 2783} {"train_loss": -43.351383209228516, "global_step": 336847, "epoch": 2783} {"train_loss": -43.92695236206055, "global_step": 336848, "epoch": 2783} {"train_loss": -43.88398361206055, "global_step": 336849, "epoch": 2783} {"train_loss": -43.638118743896484, "global_step": 336850, "epoch": 2783} {"train_loss": -44.07241439819336, "global_step": 336851, "epoch": 2783} {"train_loss": -43.96982955932617, "global_step": 336852, "epoch": 2783} {"train_loss": -44.43921661376953, "global_step": 336853, "epoch": 2783} {"train_loss": -44.670318603515625, "global_step": 336854, "epoch": 2783} {"train_loss": -43.566253662109375, "global_step": 336855, "epoch": 2783} {"train_loss": -44.6119384765625, "global_step": 336856, "epoch": 2783} {"train_loss": -44.31970977783203, "global_step": 336857, "epoch": 2783} {"train_loss": -43.555274963378906, "global_step": 336858, "epoch": 2783} {"train_loss": -43.91392517089844, "global_step": 336859, "epoch": 2783} {"train_loss": -44.71339797973633, "global_step": 336860, "epoch": 2783} {"train_loss": -44.711544036865234, "global_step": 336861, "epoch": 2783} {"train_loss": -44.26707077026367, "global_step": 336862, "epoch": 2783} {"train_loss": -43.096471423945154, "global_step": 336863, "epoch": 2783, "val_loss": 2608545.0} {"train_loss": -44.411582946777344, "global_step": 336864, "epoch": 2784} {"train_loss": -44.77859115600586, "global_step": 336865, "epoch": 2784} {"train_loss": -44.140357971191406, "global_step": 336866, "epoch": 2784} {"train_loss": -44.70256423950195, "global_step": 336867, "epoch": 2784} {"train_loss": -44.896297454833984, "global_step": 336868, "epoch": 2784} {"train_loss": -45.08364486694336, "global_step": 336869, "epoch": 2784} {"train_loss": -43.810523986816406, "global_step": 336870, "epoch": 2784} {"train_loss": -44.401702880859375, "global_step": 336871, "epoch": 2784} {"train_loss": -44.95458984375, "global_step": 336872, "epoch": 2784} {"train_loss": -44.42145919799805, "global_step": 336873, "epoch": 2784} {"train_loss": -43.26327133178711, "global_step": 336874, "epoch": 2784} {"train_loss": -43.716854095458984, "global_step": 336875, "epoch": 2784} {"train_loss": -44.65885543823242, "global_step": 336876, "epoch": 2784} {"train_loss": -42.16337966918945, "global_step": 336877, "epoch": 2784} {"train_loss": -43.820884704589844, "global_step": 336878, "epoch": 2784} {"train_loss": -43.82395553588867, "global_step": 336879, "epoch": 2784} {"train_loss": -41.209449768066406, "global_step": 336880, "epoch": 2784} {"train_loss": -44.79628372192383, "global_step": 336881, "epoch": 2784} {"train_loss": -39.76273727416992, "global_step": 336882, "epoch": 2784} {"train_loss": -40.0895881652832, "global_step": 336883, "epoch": 2784} {"train_loss": -43.26581573486328, "global_step": 336884, "epoch": 2784} {"train_loss": -40.28843307495117, "global_step": 336885, "epoch": 2784} {"train_loss": -39.4345588684082, "global_step": 336886, "epoch": 2784} {"train_loss": -40.89848709106445, "global_step": 336887, "epoch": 2784} {"train_loss": -40.803932189941406, "global_step": 336888, "epoch": 2784} {"train_loss": -40.265357971191406, "global_step": 336889, "epoch": 2784} {"train_loss": -39.659603118896484, "global_step": 336890, "epoch": 2784} {"train_loss": -38.603118896484375, "global_step": 336891, "epoch": 2784} {"train_loss": -39.7779426574707, "global_step": 336892, "epoch": 2784} {"train_loss": -39.655433654785156, "global_step": 336893, "epoch": 2784} {"train_loss": -39.62101364135742, "global_step": 336894, "epoch": 2784} {"train_loss": -40.73356246948242, "global_step": 336895, "epoch": 2784} {"train_loss": -40.19939041137695, "global_step": 336896, "epoch": 2784} {"train_loss": -40.37850570678711, "global_step": 336897, "epoch": 2784} {"train_loss": -40.35537338256836, "global_step": 336898, "epoch": 2784} {"train_loss": -40.77365493774414, "global_step": 336899, "epoch": 2784} {"train_loss": -40.25846481323242, "global_step": 336900, "epoch": 2784} {"train_loss": -40.23793029785156, "global_step": 336901, "epoch": 2784} {"train_loss": -41.59356689453125, "global_step": 336902, "epoch": 2784} {"train_loss": -41.4537353515625, "global_step": 336903, "epoch": 2784} {"train_loss": -40.15507888793945, "global_step": 336904, "epoch": 2784} {"train_loss": -41.314327239990234, "global_step": 336905, "epoch": 2784} {"train_loss": -40.33552932739258, "global_step": 336906, "epoch": 2784} {"train_loss": -39.84942626953125, "global_step": 336907, "epoch": 2784} {"train_loss": -40.13068771362305, "global_step": 336908, "epoch": 2784} {"train_loss": -40.350013732910156, "global_step": 336909, "epoch": 2784} {"train_loss": -41.0799446105957, "global_step": 336910, "epoch": 2784} {"train_loss": -41.4282341003418, "global_step": 336911, "epoch": 2784} {"train_loss": -41.78126525878906, "global_step": 336912, "epoch": 2784} {"train_loss": -41.84922409057617, "global_step": 336913, "epoch": 2784} {"train_loss": -41.8604736328125, "global_step": 336914, "epoch": 2784} {"train_loss": -41.99494552612305, "global_step": 336915, "epoch": 2784} {"train_loss": -42.44330596923828, "global_step": 336916, "epoch": 2784} {"train_loss": -42.247169494628906, "global_step": 336917, "epoch": 2784} {"train_loss": -43.17295455932617, "global_step": 336918, "epoch": 2784} {"train_loss": -42.47578048706055, "global_step": 336919, "epoch": 2784} {"train_loss": -43.79252243041992, "global_step": 336920, "epoch": 2784} {"train_loss": -43.570533752441406, "global_step": 336921, "epoch": 2784} {"train_loss": -43.42219161987305, "global_step": 336922, "epoch": 2784} {"train_loss": -43.47907638549805, "global_step": 336923, "epoch": 2784} {"train_loss": -43.46269989013672, "global_step": 336924, "epoch": 2784} {"train_loss": -43.938140869140625, "global_step": 336925, "epoch": 2784} {"train_loss": -43.94480514526367, "global_step": 336926, "epoch": 2784} {"train_loss": -43.49817657470703, "global_step": 336927, "epoch": 2784} {"train_loss": -44.10873031616211, "global_step": 336928, "epoch": 2784} {"train_loss": -44.30543899536133, "global_step": 336929, "epoch": 2784} {"train_loss": -43.33796310424805, "global_step": 336930, "epoch": 2784} {"train_loss": -43.653316497802734, "global_step": 336931, "epoch": 2784} {"train_loss": -43.91170883178711, "global_step": 336932, "epoch": 2784} {"train_loss": -44.34798812866211, "global_step": 336933, "epoch": 2784} {"train_loss": -43.898433685302734, "global_step": 336934, "epoch": 2784} {"train_loss": -43.82552719116211, "global_step": 336935, "epoch": 2784} {"train_loss": -44.173553466796875, "global_step": 336936, "epoch": 2784} {"train_loss": -44.04877471923828, "global_step": 336937, "epoch": 2784} {"train_loss": -44.44805908203125, "global_step": 336938, "epoch": 2784} {"train_loss": -43.18023681640625, "global_step": 336939, "epoch": 2784} {"train_loss": -43.35782241821289, "global_step": 336940, "epoch": 2784} {"train_loss": -43.87229919433594, "global_step": 336941, "epoch": 2784} {"train_loss": -44.04661178588867, "global_step": 336942, "epoch": 2784} {"train_loss": -44.188926696777344, "global_step": 336943, "epoch": 2784} {"train_loss": -44.84136199951172, "global_step": 336944, "epoch": 2784} {"train_loss": -44.551368713378906, "global_step": 336945, "epoch": 2784} {"train_loss": -45.18004608154297, "global_step": 336946, "epoch": 2784} {"train_loss": -44.2271614074707, "global_step": 336947, "epoch": 2784} {"train_loss": -44.68428421020508, "global_step": 336948, "epoch": 2784} {"train_loss": -43.98994827270508, "global_step": 336949, "epoch": 2784} {"train_loss": -44.11835479736328, "global_step": 336950, "epoch": 2784} {"train_loss": -44.053768157958984, "global_step": 336951, "epoch": 2784} {"train_loss": -43.163475036621094, "global_step": 336952, "epoch": 2784} {"train_loss": -44.0605583190918, "global_step": 336953, "epoch": 2784} {"train_loss": -41.83640670776367, "global_step": 336954, "epoch": 2784} {"train_loss": -44.50397872924805, "global_step": 336955, "epoch": 2784} {"train_loss": -40.53391647338867, "global_step": 336956, "epoch": 2784} {"train_loss": -44.21923828125, "global_step": 336957, "epoch": 2784} {"train_loss": -42.13800811767578, "global_step": 336958, "epoch": 2784} {"train_loss": -44.2455940246582, "global_step": 336959, "epoch": 2784} {"train_loss": -41.1903076171875, "global_step": 336960, "epoch": 2784} {"train_loss": -43.15351486206055, "global_step": 336961, "epoch": 2784} {"train_loss": -43.305145263671875, "global_step": 336962, "epoch": 2784} {"train_loss": -43.57148361206055, "global_step": 336963, "epoch": 2784} {"train_loss": -43.810157775878906, "global_step": 336964, "epoch": 2784} {"train_loss": -43.24895477294922, "global_step": 336965, "epoch": 2784} {"train_loss": -43.87088394165039, "global_step": 336966, "epoch": 2784} {"train_loss": -42.56626510620117, "global_step": 336967, "epoch": 2784} {"train_loss": -44.71228790283203, "global_step": 336968, "epoch": 2784} {"train_loss": -42.074363708496094, "global_step": 336969, "epoch": 2784} {"train_loss": -44.478515625, "global_step": 336970, "epoch": 2784} {"train_loss": -42.7509651184082, "global_step": 336971, "epoch": 2784} {"train_loss": -43.457305908203125, "global_step": 336972, "epoch": 2784} {"train_loss": -43.74330139160156, "global_step": 336973, "epoch": 2784} {"train_loss": -42.99964141845703, "global_step": 336974, "epoch": 2784} {"train_loss": -44.15629196166992, "global_step": 336975, "epoch": 2784} {"train_loss": -43.73788833618164, "global_step": 336976, "epoch": 2784} {"train_loss": -43.874244689941406, "global_step": 336977, "epoch": 2784} {"train_loss": -44.19222640991211, "global_step": 336978, "epoch": 2784} {"train_loss": -44.39024353027344, "global_step": 336979, "epoch": 2784} {"train_loss": -44.09092712402344, "global_step": 336980, "epoch": 2784} {"train_loss": -42.5527458190918, "global_step": 336981, "epoch": 2784} {"train_loss": -43.616302490234375, "global_step": 336982, "epoch": 2784} {"train_loss": -43.33754348754883, "global_step": 336983, "epoch": 2784} {"train_loss": -42.829449141321106, "global_step": 336984, "epoch": 2784, "val_loss": 2599828.5} {"train_loss": -43.05177688598633, "global_step": 336985, "epoch": 2785} {"train_loss": -43.72672653198242, "global_step": 336986, "epoch": 2785} {"train_loss": -41.84100341796875, "global_step": 336987, "epoch": 2785} {"train_loss": -43.510738372802734, "global_step": 336988, "epoch": 2785} {"train_loss": -42.48153305053711, "global_step": 336989, "epoch": 2785} {"train_loss": -43.74481201171875, "global_step": 336990, "epoch": 2785} {"train_loss": -43.0838737487793, "global_step": 336991, "epoch": 2785} {"train_loss": -43.747005462646484, "global_step": 336992, "epoch": 2785} {"train_loss": -41.67293167114258, "global_step": 336993, "epoch": 2785} {"train_loss": -43.09398651123047, "global_step": 336994, "epoch": 2785} {"train_loss": -41.71317672729492, "global_step": 336995, "epoch": 2785} {"train_loss": -43.76700973510742, "global_step": 336996, "epoch": 2785} {"train_loss": -42.17190170288086, "global_step": 336997, "epoch": 2785} {"train_loss": -43.01278305053711, "global_step": 336998, "epoch": 2785} {"train_loss": -43.461769104003906, "global_step": 336999, "epoch": 2785} {"train_loss": -44.15070343017578, "global_step": 337000, "epoch": 2785} {"train_loss": -43.351131439208984, "global_step": 337001, "epoch": 2785} {"train_loss": -42.41098403930664, "global_step": 337002, "epoch": 2785} {"train_loss": -43.105628967285156, "global_step": 337003, "epoch": 2785} {"train_loss": -44.12032699584961, "global_step": 337004, "epoch": 2785} {"train_loss": -43.940040588378906, "global_step": 337005, "epoch": 2785} {"train_loss": -43.53791046142578, "global_step": 337006, "epoch": 2785} {"train_loss": -43.65626907348633, "global_step": 337007, "epoch": 2785} {"train_loss": -43.725990295410156, "global_step": 337008, "epoch": 2785} {"train_loss": -44.01597213745117, "global_step": 337009, "epoch": 2785} {"train_loss": -44.25160598754883, "global_step": 337010, "epoch": 2785} {"train_loss": -44.202667236328125, "global_step": 337011, "epoch": 2785} {"train_loss": -43.404415130615234, "global_step": 337012, "epoch": 2785} {"train_loss": -44.88285446166992, "global_step": 337013, "epoch": 2785} {"train_loss": -43.54832077026367, "global_step": 337014, "epoch": 2785} {"train_loss": -42.1998291015625, "global_step": 337015, "epoch": 2785} {"train_loss": -44.67985153198242, "global_step": 337016, "epoch": 2785} {"train_loss": -44.01066207885742, "global_step": 337017, "epoch": 2785} {"train_loss": -44.18516540527344, "global_step": 337018, "epoch": 2785} {"train_loss": -43.78451156616211, "global_step": 337019, "epoch": 2785} {"train_loss": -43.95600128173828, "global_step": 337020, "epoch": 2785} {"train_loss": -44.67658615112305, "global_step": 337021, "epoch": 2785} {"train_loss": -43.34383773803711, "global_step": 337022, "epoch": 2785} {"train_loss": -43.84145736694336, "global_step": 337023, "epoch": 2785} {"train_loss": -43.6913948059082, "global_step": 337024, "epoch": 2785} {"train_loss": -44.24927520751953, "global_step": 337025, "epoch": 2785} {"train_loss": -43.55927276611328, "global_step": 337026, "epoch": 2785} {"train_loss": -43.934574127197266, "global_step": 337027, "epoch": 2785} {"train_loss": -43.16609573364258, "global_step": 337028, "epoch": 2785} {"train_loss": -43.6379508972168, "global_step": 337029, "epoch": 2785} {"train_loss": -43.495941162109375, "global_step": 337030, "epoch": 2785} {"train_loss": -42.8390007019043, "global_step": 337031, "epoch": 2785} {"train_loss": -42.37056350708008, "global_step": 337032, "epoch": 2785} {"train_loss": -42.07558059692383, "global_step": 337033, "epoch": 2785} {"train_loss": -42.769744873046875, "global_step": 337034, "epoch": 2785} {"train_loss": -44.220420837402344, "global_step": 337035, "epoch": 2785} {"train_loss": -43.244197845458984, "global_step": 337036, "epoch": 2785} {"train_loss": -43.577423095703125, "global_step": 337037, "epoch": 2785} {"train_loss": -43.60175323486328, "global_step": 337038, "epoch": 2785} {"train_loss": -42.95294952392578, "global_step": 337039, "epoch": 2785} {"train_loss": -43.2713737487793, "global_step": 337040, "epoch": 2785} {"train_loss": -40.30573272705078, "global_step": 337041, "epoch": 2785} {"train_loss": -43.76548385620117, "global_step": 337042, "epoch": 2785} {"train_loss": -41.42609405517578, "global_step": 337043, "epoch": 2785} {"train_loss": -42.57188034057617, "global_step": 337044, "epoch": 2785} {"train_loss": -41.168006896972656, "global_step": 337045, "epoch": 2785} {"train_loss": -42.39229202270508, "global_step": 337046, "epoch": 2785} {"train_loss": -43.05801010131836, "global_step": 337047, "epoch": 2785} {"train_loss": -42.10084533691406, "global_step": 337048, "epoch": 2785} {"train_loss": -42.28740310668945, "global_step": 337049, "epoch": 2785} {"train_loss": -41.9311637878418, "global_step": 337050, "epoch": 2785} {"train_loss": -41.922943115234375, "global_step": 337051, "epoch": 2785} {"train_loss": -43.0037841796875, "global_step": 337052, "epoch": 2785} {"train_loss": -41.808467864990234, "global_step": 337053, "epoch": 2785} {"train_loss": -43.22157669067383, "global_step": 337054, "epoch": 2785} {"train_loss": -41.25373077392578, "global_step": 337055, "epoch": 2785} {"train_loss": -43.84394073486328, "global_step": 337056, "epoch": 2785} {"train_loss": -41.83112716674805, "global_step": 337057, "epoch": 2785} {"train_loss": -42.96242141723633, "global_step": 337058, "epoch": 2785} {"train_loss": -39.0098991394043, "global_step": 337059, "epoch": 2785} {"train_loss": -42.22711181640625, "global_step": 337060, "epoch": 2785} {"train_loss": -43.27313232421875, "global_step": 337061, "epoch": 2785} {"train_loss": -41.25066375732422, "global_step": 337062, "epoch": 2785} {"train_loss": -43.80342483520508, "global_step": 337063, "epoch": 2785} {"train_loss": -42.2739372253418, "global_step": 337064, "epoch": 2785} {"train_loss": -40.56413269042969, "global_step": 337065, "epoch": 2785} {"train_loss": -42.13969039916992, "global_step": 337066, "epoch": 2785} {"train_loss": -43.35065460205078, "global_step": 337067, "epoch": 2785} {"train_loss": -42.23618698120117, "global_step": 337068, "epoch": 2785} {"train_loss": -42.56411361694336, "global_step": 337069, "epoch": 2785} {"train_loss": -43.237342834472656, "global_step": 337070, "epoch": 2785} {"train_loss": -39.47111892700195, "global_step": 337071, "epoch": 2785} {"train_loss": -42.530941009521484, "global_step": 337072, "epoch": 2785} {"train_loss": -40.06046676635742, "global_step": 337073, "epoch": 2785} {"train_loss": -40.84365463256836, "global_step": 337074, "epoch": 2785} {"train_loss": -43.3567008972168, "global_step": 337075, "epoch": 2785} {"train_loss": -41.409236907958984, "global_step": 337076, "epoch": 2785} {"train_loss": -41.93751907348633, "global_step": 337077, "epoch": 2785} {"train_loss": -44.39071273803711, "global_step": 337078, "epoch": 2785} {"train_loss": -41.41904830932617, "global_step": 337079, "epoch": 2785} {"train_loss": -44.00054931640625, "global_step": 337080, "epoch": 2785} {"train_loss": -42.67763137817383, "global_step": 337081, "epoch": 2785} {"train_loss": -42.29637145996094, "global_step": 337082, "epoch": 2785} {"train_loss": -42.80348587036133, "global_step": 337083, "epoch": 2785} {"train_loss": -43.0582275390625, "global_step": 337084, "epoch": 2785} {"train_loss": -44.167911529541016, "global_step": 337085, "epoch": 2785} {"train_loss": -42.90095138549805, "global_step": 337086, "epoch": 2785} {"train_loss": -43.04814529418945, "global_step": 337087, "epoch": 2785} {"train_loss": -42.97719192504883, "global_step": 337088, "epoch": 2785} {"train_loss": -43.17151641845703, "global_step": 337089, "epoch": 2785} {"train_loss": -43.269996643066406, "global_step": 337090, "epoch": 2785} {"train_loss": -44.07685089111328, "global_step": 337091, "epoch": 2785} {"train_loss": -42.90865707397461, "global_step": 337092, "epoch": 2785} {"train_loss": -42.556915283203125, "global_step": 337093, "epoch": 2785} {"train_loss": -44.314693450927734, "global_step": 337094, "epoch": 2785} {"train_loss": -42.79364776611328, "global_step": 337095, "epoch": 2785} {"train_loss": -43.42039108276367, "global_step": 337096, "epoch": 2785} {"train_loss": -43.37417221069336, "global_step": 337097, "epoch": 2785} {"train_loss": -42.6955451965332, "global_step": 337098, "epoch": 2785} {"train_loss": -44.030086517333984, "global_step": 337099, "epoch": 2785} {"train_loss": -43.897071838378906, "global_step": 337100, "epoch": 2785} {"train_loss": -42.72576904296875, "global_step": 337101, "epoch": 2785} {"train_loss": -44.39515686035156, "global_step": 337102, "epoch": 2785} {"train_loss": -44.00362777709961, "global_step": 337103, "epoch": 2785} {"train_loss": -42.8867301940918, "global_step": 337104, "epoch": 2785} {"train_loss": -42.979913632731794, "global_step": 337105, "epoch": 2785, "val_loss": 2793318.5} {"train_loss": -43.79691696166992, "global_step": 337106, "epoch": 2786} {"train_loss": -43.27750015258789, "global_step": 337107, "epoch": 2786} {"train_loss": -44.25222396850586, "global_step": 337108, "epoch": 2786} {"train_loss": -41.907466888427734, "global_step": 337109, "epoch": 2786} {"train_loss": -43.53229522705078, "global_step": 337110, "epoch": 2786} {"train_loss": -42.29648208618164, "global_step": 337111, "epoch": 2786} {"train_loss": -42.95656967163086, "global_step": 337112, "epoch": 2786} {"train_loss": -43.68349838256836, "global_step": 337113, "epoch": 2786} {"train_loss": -42.31528854370117, "global_step": 337114, "epoch": 2786} {"train_loss": -43.7569694519043, "global_step": 337115, "epoch": 2786} {"train_loss": -43.21882629394531, "global_step": 337116, "epoch": 2786} {"train_loss": -43.09160232543945, "global_step": 337117, "epoch": 2786} {"train_loss": -42.927154541015625, "global_step": 337118, "epoch": 2786} {"train_loss": -43.52752685546875, "global_step": 337119, "epoch": 2786} {"train_loss": -43.616756439208984, "global_step": 337120, "epoch": 2786} {"train_loss": -43.82954025268555, "global_step": 337121, "epoch": 2786} {"train_loss": -42.3844108581543, "global_step": 337122, "epoch": 2786} {"train_loss": -42.94099807739258, "global_step": 337123, "epoch": 2786} {"train_loss": -43.843833923339844, "global_step": 337124, "epoch": 2786} {"train_loss": -43.3311767578125, "global_step": 337125, "epoch": 2786} {"train_loss": -43.34713363647461, "global_step": 337126, "epoch": 2786} {"train_loss": -44.041873931884766, "global_step": 337127, "epoch": 2786} {"train_loss": -42.43833541870117, "global_step": 337128, "epoch": 2786} {"train_loss": -44.15641403198242, "global_step": 337129, "epoch": 2786} {"train_loss": -41.67277145385742, "global_step": 337130, "epoch": 2786} {"train_loss": -44.99148178100586, "global_step": 337131, "epoch": 2786} {"train_loss": -42.726661682128906, "global_step": 337132, "epoch": 2786} {"train_loss": -44.551387786865234, "global_step": 337133, "epoch": 2786} {"train_loss": -42.28862762451172, "global_step": 337134, "epoch": 2786} {"train_loss": -43.54271697998047, "global_step": 337135, "epoch": 2786} {"train_loss": -41.85362243652344, "global_step": 337136, "epoch": 2786} {"train_loss": -44.098690032958984, "global_step": 337137, "epoch": 2786} {"train_loss": -42.73012924194336, "global_step": 337138, "epoch": 2786} {"train_loss": -44.3031120300293, "global_step": 337139, "epoch": 2786} {"train_loss": -43.359619140625, "global_step": 337140, "epoch": 2786} {"train_loss": -43.17252731323242, "global_step": 337141, "epoch": 2786} {"train_loss": -44.127830505371094, "global_step": 337142, "epoch": 2786} {"train_loss": -42.00455856323242, "global_step": 337143, "epoch": 2786} {"train_loss": -43.81156539916992, "global_step": 337144, "epoch": 2786} {"train_loss": -42.71866989135742, "global_step": 337145, "epoch": 2786} {"train_loss": -44.216026306152344, "global_step": 337146, "epoch": 2786} {"train_loss": -43.413814544677734, "global_step": 337147, "epoch": 2786} {"train_loss": -43.82011795043945, "global_step": 337148, "epoch": 2786} {"train_loss": -42.2840576171875, "global_step": 337149, "epoch": 2786} {"train_loss": -44.013580322265625, "global_step": 337150, "epoch": 2786} {"train_loss": -43.583370208740234, "global_step": 337151, "epoch": 2786} {"train_loss": -44.86588668823242, "global_step": 337152, "epoch": 2786} {"train_loss": -43.14417266845703, "global_step": 337153, "epoch": 2786} {"train_loss": -43.121158599853516, "global_step": 337154, "epoch": 2786} {"train_loss": -43.89948654174805, "global_step": 337155, "epoch": 2786} {"train_loss": -44.77588653564453, "global_step": 337156, "epoch": 2786} {"train_loss": -43.818843841552734, "global_step": 337157, "epoch": 2786} {"train_loss": -44.27717208862305, "global_step": 337158, "epoch": 2786} {"train_loss": -43.412689208984375, "global_step": 337159, "epoch": 2786} {"train_loss": -44.09223175048828, "global_step": 337160, "epoch": 2786} {"train_loss": -43.753082275390625, "global_step": 337161, "epoch": 2786} {"train_loss": -44.8555793762207, "global_step": 337162, "epoch": 2786} {"train_loss": -43.034847259521484, "global_step": 337163, "epoch": 2786} {"train_loss": -44.18190002441406, "global_step": 337164, "epoch": 2786} {"train_loss": -43.32996368408203, "global_step": 337165, "epoch": 2786} {"train_loss": -44.13531494140625, "global_step": 337166, "epoch": 2786} {"train_loss": -44.48768997192383, "global_step": 337167, "epoch": 2786} {"train_loss": -44.99251174926758, "global_step": 337168, "epoch": 2786} {"train_loss": -44.586971282958984, "global_step": 337169, "epoch": 2786} {"train_loss": -43.3452262878418, "global_step": 337170, "epoch": 2786} {"train_loss": -43.853755950927734, "global_step": 337171, "epoch": 2786} {"train_loss": -42.38957977294922, "global_step": 337172, "epoch": 2786} {"train_loss": -44.341575622558594, "global_step": 337173, "epoch": 2786} {"train_loss": -44.610897064208984, "global_step": 337174, "epoch": 2786} {"train_loss": -42.5485954284668, "global_step": 337175, "epoch": 2786} {"train_loss": -44.49734115600586, "global_step": 337176, "epoch": 2786} {"train_loss": -44.36480712890625, "global_step": 337177, "epoch": 2786} {"train_loss": -41.52651596069336, "global_step": 337178, "epoch": 2786} {"train_loss": -39.64434814453125, "global_step": 337179, "epoch": 2786} {"train_loss": -44.52100372314453, "global_step": 337180, "epoch": 2786} {"train_loss": -40.57609939575195, "global_step": 337181, "epoch": 2786} {"train_loss": -34.71692657470703, "global_step": 337182, "epoch": 2786} {"train_loss": -43.129005432128906, "global_step": 337183, "epoch": 2786} {"train_loss": -40.831050872802734, "global_step": 337184, "epoch": 2786} {"train_loss": -39.32969284057617, "global_step": 337185, "epoch": 2786} {"train_loss": -34.444122314453125, "global_step": 337186, "epoch": 2786} {"train_loss": -34.086822509765625, "global_step": 337187, "epoch": 2786} {"train_loss": -37.11235046386719, "global_step": 337188, "epoch": 2786} {"train_loss": -37.45701217651367, "global_step": 337189, "epoch": 2786} {"train_loss": -36.724491119384766, "global_step": 337190, "epoch": 2786} {"train_loss": -38.9555549621582, "global_step": 337191, "epoch": 2786} {"train_loss": -37.54850769042969, "global_step": 337192, "epoch": 2786} {"train_loss": -39.19797134399414, "global_step": 337193, "epoch": 2786} {"train_loss": -38.08327865600586, "global_step": 337194, "epoch": 2786} {"train_loss": -39.33024215698242, "global_step": 337195, "epoch": 2786} {"train_loss": -37.38336944580078, "global_step": 337196, "epoch": 2786} {"train_loss": -39.575008392333984, "global_step": 337197, "epoch": 2786} {"train_loss": -37.88320541381836, "global_step": 337198, "epoch": 2786} {"train_loss": -40.31905746459961, "global_step": 337199, "epoch": 2786} {"train_loss": -38.91389846801758, "global_step": 337200, "epoch": 2786} {"train_loss": -40.10097885131836, "global_step": 337201, "epoch": 2786} {"train_loss": -39.64065170288086, "global_step": 337202, "epoch": 2786} {"train_loss": -40.409175872802734, "global_step": 337203, "epoch": 2786} {"train_loss": -39.24163055419922, "global_step": 337204, "epoch": 2786} {"train_loss": -39.81459426879883, "global_step": 337205, "epoch": 2786} {"train_loss": -40.39714431762695, "global_step": 337206, "epoch": 2786} {"train_loss": -39.96022415161133, "global_step": 337207, "epoch": 2786} {"train_loss": -40.3170166015625, "global_step": 337208, "epoch": 2786} {"train_loss": -40.293453216552734, "global_step": 337209, "epoch": 2786} {"train_loss": -40.14698791503906, "global_step": 337210, "epoch": 2786} {"train_loss": -40.40464401245117, "global_step": 337211, "epoch": 2786} {"train_loss": -40.28867721557617, "global_step": 337212, "epoch": 2786} {"train_loss": -41.16181182861328, "global_step": 337213, "epoch": 2786} {"train_loss": -40.94123077392578, "global_step": 337214, "epoch": 2786} {"train_loss": -40.395511627197266, "global_step": 337215, "epoch": 2786} {"train_loss": -40.553707122802734, "global_step": 337216, "epoch": 2786} {"train_loss": -40.73432540893555, "global_step": 337217, "epoch": 2786} {"train_loss": -41.02085494995117, "global_step": 337218, "epoch": 2786} {"train_loss": -41.23421859741211, "global_step": 337219, "epoch": 2786} {"train_loss": -41.34248733520508, "global_step": 337220, "epoch": 2786} {"train_loss": -41.125911712646484, "global_step": 337221, "epoch": 2786} {"train_loss": -41.253231048583984, "global_step": 337222, "epoch": 2786} {"train_loss": -41.21297836303711, "global_step": 337223, "epoch": 2786} {"train_loss": -40.817665100097656, "global_step": 337224, "epoch": 2786} {"train_loss": -40.85097885131836, "global_step": 337225, "epoch": 2786} {"train_loss": -41.959372559854806, "global_step": 337226, "epoch": 2786, "val_loss": 2742726.75} {"train_loss": -37.43587875366211, "global_step": 337227, "epoch": 2787} {"train_loss": -40.303688049316406, "global_step": 337228, "epoch": 2787} {"train_loss": -40.45747756958008, "global_step": 337229, "epoch": 2787} {"train_loss": -39.9453125, "global_step": 337230, "epoch": 2787} {"train_loss": -40.9948616027832, "global_step": 337231, "epoch": 2787} {"train_loss": -40.36213684082031, "global_step": 337232, "epoch": 2787} {"train_loss": -40.29353713989258, "global_step": 337233, "epoch": 2787} {"train_loss": -41.771095275878906, "global_step": 337234, "epoch": 2787} {"train_loss": -40.924007415771484, "global_step": 337235, "epoch": 2787} {"train_loss": -42.155696868896484, "global_step": 337236, "epoch": 2787} {"train_loss": -41.35116195678711, "global_step": 337237, "epoch": 2787} {"train_loss": -40.90192413330078, "global_step": 337238, "epoch": 2787} {"train_loss": -41.7627067565918, "global_step": 337239, "epoch": 2787} {"train_loss": -41.05354690551758, "global_step": 337240, "epoch": 2787} {"train_loss": -42.09088897705078, "global_step": 337241, "epoch": 2787} {"train_loss": -41.61263656616211, "global_step": 337242, "epoch": 2787} {"train_loss": -41.5673828125, "global_step": 337243, "epoch": 2787} {"train_loss": -41.302978515625, "global_step": 337244, "epoch": 2787} {"train_loss": -42.13562774658203, "global_step": 337245, "epoch": 2787} {"train_loss": -42.17507553100586, "global_step": 337246, "epoch": 2787} {"train_loss": -41.66999053955078, "global_step": 337247, "epoch": 2787} {"train_loss": -41.7144660949707, "global_step": 337248, "epoch": 2787} {"train_loss": -42.15758514404297, "global_step": 337249, "epoch": 2787} {"train_loss": -42.49314498901367, "global_step": 337250, "epoch": 2787} {"train_loss": -42.088890075683594, "global_step": 337251, "epoch": 2787} {"train_loss": -41.9783935546875, "global_step": 337252, "epoch": 2787} {"train_loss": -41.251590728759766, "global_step": 337253, "epoch": 2787} {"train_loss": -42.20709228515625, "global_step": 337254, "epoch": 2787} {"train_loss": -42.533138275146484, "global_step": 337255, "epoch": 2787} {"train_loss": -41.74295425415039, "global_step": 337256, "epoch": 2787} {"train_loss": -41.29631423950195, "global_step": 337257, "epoch": 2787} {"train_loss": -41.36678695678711, "global_step": 337258, "epoch": 2787} {"train_loss": -42.614723205566406, "global_step": 337259, "epoch": 2787} {"train_loss": -41.701725006103516, "global_step": 337260, "epoch": 2787} {"train_loss": -41.750057220458984, "global_step": 337261, "epoch": 2787} {"train_loss": -42.86384201049805, "global_step": 337262, "epoch": 2787} {"train_loss": -41.54127502441406, "global_step": 337263, "epoch": 2787} {"train_loss": -40.887939453125, "global_step": 337264, "epoch": 2787} {"train_loss": -43.119075775146484, "global_step": 337265, "epoch": 2787} {"train_loss": -41.232872009277344, "global_step": 337266, "epoch": 2787} {"train_loss": -41.6530876159668, "global_step": 337267, "epoch": 2787} {"train_loss": -42.42549514770508, "global_step": 337268, "epoch": 2787} {"train_loss": -41.6088981628418, "global_step": 337269, "epoch": 2787} {"train_loss": -42.850311279296875, "global_step": 337270, "epoch": 2787} {"train_loss": -42.4493522644043, "global_step": 337271, "epoch": 2787} {"train_loss": -41.72700500488281, "global_step": 337272, "epoch": 2787} {"train_loss": -42.80884552001953, "global_step": 337273, "epoch": 2787} {"train_loss": -42.6298713684082, "global_step": 337274, "epoch": 2787} {"train_loss": -42.89442825317383, "global_step": 337275, "epoch": 2787} {"train_loss": -42.686790466308594, "global_step": 337276, "epoch": 2787} {"train_loss": -42.870182037353516, "global_step": 337277, "epoch": 2787} {"train_loss": -42.8884391784668, "global_step": 337278, "epoch": 2787} {"train_loss": -43.1352653503418, "global_step": 337279, "epoch": 2787} {"train_loss": -43.59019088745117, "global_step": 337280, "epoch": 2787} {"train_loss": -42.42960739135742, "global_step": 337281, "epoch": 2787} {"train_loss": -42.506988525390625, "global_step": 337282, "epoch": 2787} {"train_loss": -42.99271011352539, "global_step": 337283, "epoch": 2787} {"train_loss": -43.02845764160156, "global_step": 337284, "epoch": 2787} {"train_loss": -43.151092529296875, "global_step": 337285, "epoch": 2787} {"train_loss": -43.42617416381836, "global_step": 337286, "epoch": 2787} {"train_loss": -43.27120590209961, "global_step": 337287, "epoch": 2787} {"train_loss": -43.51633071899414, "global_step": 337288, "epoch": 2787} {"train_loss": -43.50847244262695, "global_step": 337289, "epoch": 2787} {"train_loss": -35.28885269165039, "global_step": 337290, "epoch": 2787} {"train_loss": -41.644832611083984, "global_step": 337291, "epoch": 2787} {"train_loss": -43.024330139160156, "global_step": 337292, "epoch": 2787} {"train_loss": -42.924598693847656, "global_step": 337293, "epoch": 2787} {"train_loss": -43.023651123046875, "global_step": 337294, "epoch": 2787} {"train_loss": -42.42263412475586, "global_step": 337295, "epoch": 2787} {"train_loss": -43.16443634033203, "global_step": 337296, "epoch": 2787} {"train_loss": -43.11237716674805, "global_step": 337297, "epoch": 2787} {"train_loss": -43.39948272705078, "global_step": 337298, "epoch": 2787} {"train_loss": -43.47768783569336, "global_step": 337299, "epoch": 2787} {"train_loss": -43.26630783081055, "global_step": 337300, "epoch": 2787} {"train_loss": -43.49459457397461, "global_step": 337301, "epoch": 2787} {"train_loss": -42.773677825927734, "global_step": 337302, "epoch": 2787} {"train_loss": -42.151947021484375, "global_step": 337303, "epoch": 2787} {"train_loss": -40.12261199951172, "global_step": 337304, "epoch": 2787} {"train_loss": -38.74629211425781, "global_step": 337305, "epoch": 2787} {"train_loss": -42.73548126220703, "global_step": 337306, "epoch": 2787} {"train_loss": -40.90834426879883, "global_step": 337307, "epoch": 2787} {"train_loss": -32.759376525878906, "global_step": 337308, "epoch": 2787} {"train_loss": -42.59133529663086, "global_step": 337309, "epoch": 2787} {"train_loss": -40.73710250854492, "global_step": 337310, "epoch": 2787} {"train_loss": -40.611881256103516, "global_step": 337311, "epoch": 2787} {"train_loss": -42.861541748046875, "global_step": 337312, "epoch": 2787} {"train_loss": -41.72352981567383, "global_step": 337313, "epoch": 2787} {"train_loss": -41.32059860229492, "global_step": 337314, "epoch": 2787} {"train_loss": -41.57754898071289, "global_step": 337315, "epoch": 2787} {"train_loss": -37.843509674072266, "global_step": 337316, "epoch": 2787} {"train_loss": -41.544490814208984, "global_step": 337317, "epoch": 2787} {"train_loss": -42.28718185424805, "global_step": 337318, "epoch": 2787} {"train_loss": -41.6036262512207, "global_step": 337319, "epoch": 2787} {"train_loss": -41.9473991394043, "global_step": 337320, "epoch": 2787} {"train_loss": -39.494476318359375, "global_step": 337321, "epoch": 2787} {"train_loss": -42.55110549926758, "global_step": 337322, "epoch": 2787} {"train_loss": -40.916622161865234, "global_step": 337323, "epoch": 2787} {"train_loss": -30.232044219970703, "global_step": 337324, "epoch": 2787} {"train_loss": -40.40180206298828, "global_step": 337325, "epoch": 2787} {"train_loss": -43.000484466552734, "global_step": 337326, "epoch": 2787} {"train_loss": -32.25960922241211, "global_step": 337327, "epoch": 2787} {"train_loss": -38.248836517333984, "global_step": 337328, "epoch": 2787} {"train_loss": -39.80652618408203, "global_step": 337329, "epoch": 2787} {"train_loss": -29.41754150390625, "global_step": 337330, "epoch": 2787} {"train_loss": -38.399147033691406, "global_step": 337331, "epoch": 2787} {"train_loss": -39.2016716003418, "global_step": 337332, "epoch": 2787} {"train_loss": -40.88862228393555, "global_step": 337333, "epoch": 2787} {"train_loss": -40.99876022338867, "global_step": 337334, "epoch": 2787} {"train_loss": -35.9728889465332, "global_step": 337335, "epoch": 2787} {"train_loss": -37.88619613647461, "global_step": 337336, "epoch": 2787} {"train_loss": -41.4559326171875, "global_step": 337337, "epoch": 2787} {"train_loss": -39.06948471069336, "global_step": 337338, "epoch": 2787} {"train_loss": -40.28791809082031, "global_step": 337339, "epoch": 2787} {"train_loss": -36.972896575927734, "global_step": 337340, "epoch": 2787} {"train_loss": -36.56666946411133, "global_step": 337341, "epoch": 2787} {"train_loss": -39.260650634765625, "global_step": 337342, "epoch": 2787} {"train_loss": -39.64013671875, "global_step": 337343, "epoch": 2787} {"train_loss": -36.85212326049805, "global_step": 337344, "epoch": 2787} {"train_loss": -39.68061447143555, "global_step": 337345, "epoch": 2787} {"train_loss": -40.40562057495117, "global_step": 337346, "epoch": 2787} {"train_loss": -41.0149314502054, "global_step": 337347, "epoch": 2787, "val_loss": 2600977.25} {"train_loss": -37.65544128417969, "global_step": 337348, "epoch": 2788} {"train_loss": -36.489871978759766, "global_step": 337349, "epoch": 2788} {"train_loss": -39.30466079711914, "global_step": 337350, "epoch": 2788} {"train_loss": -40.74326705932617, "global_step": 337351, "epoch": 2788} {"train_loss": -35.647823333740234, "global_step": 337352, "epoch": 2788} {"train_loss": -37.51634979248047, "global_step": 337353, "epoch": 2788} {"train_loss": -39.0219841003418, "global_step": 337354, "epoch": 2788} {"train_loss": -36.42823028564453, "global_step": 337355, "epoch": 2788} {"train_loss": -36.97658920288086, "global_step": 337356, "epoch": 2788} {"train_loss": -39.28776168823242, "global_step": 337357, "epoch": 2788} {"train_loss": -39.124874114990234, "global_step": 337358, "epoch": 2788} {"train_loss": -39.43849182128906, "global_step": 337359, "epoch": 2788} {"train_loss": -38.91526412963867, "global_step": 337360, "epoch": 2788} {"train_loss": -38.36417007446289, "global_step": 337361, "epoch": 2788} {"train_loss": -36.700355529785156, "global_step": 337362, "epoch": 2788} {"train_loss": -39.31600570678711, "global_step": 337363, "epoch": 2788} {"train_loss": -40.83687973022461, "global_step": 337364, "epoch": 2788} {"train_loss": -34.091346740722656, "global_step": 337365, "epoch": 2788} {"train_loss": -39.8052978515625, "global_step": 337366, "epoch": 2788} {"train_loss": -39.36308670043945, "global_step": 337367, "epoch": 2788} {"train_loss": -39.7317008972168, "global_step": 337368, "epoch": 2788} {"train_loss": -38.55607986450195, "global_step": 337369, "epoch": 2788} {"train_loss": -39.667598724365234, "global_step": 337370, "epoch": 2788} {"train_loss": -41.345558166503906, "global_step": 337371, "epoch": 2788} {"train_loss": -38.5721549987793, "global_step": 337372, "epoch": 2788} {"train_loss": -39.11362838745117, "global_step": 337373, "epoch": 2788} {"train_loss": -38.4127311706543, "global_step": 337374, "epoch": 2788} {"train_loss": -40.64923095703125, "global_step": 337375, "epoch": 2788} {"train_loss": -40.60470199584961, "global_step": 337376, "epoch": 2788} {"train_loss": -40.797855377197266, "global_step": 337377, "epoch": 2788} {"train_loss": -40.71604537963867, "global_step": 337378, "epoch": 2788} {"train_loss": -39.8998908996582, "global_step": 337379, "epoch": 2788} {"train_loss": -40.295841217041016, "global_step": 337380, "epoch": 2788} {"train_loss": -40.97418975830078, "global_step": 337381, "epoch": 2788} {"train_loss": -40.705387115478516, "global_step": 337382, "epoch": 2788} {"train_loss": -39.29214096069336, "global_step": 337383, "epoch": 2788} {"train_loss": -40.14913558959961, "global_step": 337384, "epoch": 2788} {"train_loss": -40.2193717956543, "global_step": 337385, "epoch": 2788} {"train_loss": -40.679443359375, "global_step": 337386, "epoch": 2788} {"train_loss": -40.15149688720703, "global_step": 337387, "epoch": 2788} {"train_loss": -39.21377182006836, "global_step": 337388, "epoch": 2788} {"train_loss": -40.621944427490234, "global_step": 337389, "epoch": 2788} {"train_loss": -39.655025482177734, "global_step": 337390, "epoch": 2788} {"train_loss": -40.75843048095703, "global_step": 337391, "epoch": 2788} {"train_loss": -40.89552688598633, "global_step": 337392, "epoch": 2788} {"train_loss": -40.77782440185547, "global_step": 337393, "epoch": 2788} {"train_loss": -41.8681526184082, "global_step": 337394, "epoch": 2788} {"train_loss": -41.8480339050293, "global_step": 337395, "epoch": 2788} {"train_loss": -40.47572708129883, "global_step": 337396, "epoch": 2788} {"train_loss": -40.10700607299805, "global_step": 337397, "epoch": 2788} {"train_loss": -39.23197937011719, "global_step": 337398, "epoch": 2788} {"train_loss": -40.387813568115234, "global_step": 337399, "epoch": 2788} {"train_loss": -41.39162063598633, "global_step": 337400, "epoch": 2788} {"train_loss": -39.95337677001953, "global_step": 337401, "epoch": 2788} {"train_loss": -41.329586029052734, "global_step": 337402, "epoch": 2788} {"train_loss": -39.774993896484375, "global_step": 337403, "epoch": 2788} {"train_loss": -41.44075393676758, "global_step": 337404, "epoch": 2788} {"train_loss": -41.862667083740234, "global_step": 337405, "epoch": 2788} {"train_loss": -40.61921310424805, "global_step": 337406, "epoch": 2788} {"train_loss": -40.72805404663086, "global_step": 337407, "epoch": 2788} {"train_loss": -41.8340950012207, "global_step": 337408, "epoch": 2788} {"train_loss": -41.82577133178711, "global_step": 337409, "epoch": 2788} {"train_loss": -41.4848747253418, "global_step": 337410, "epoch": 2788} {"train_loss": -40.506710052490234, "global_step": 337411, "epoch": 2788} {"train_loss": -41.65602111816406, "global_step": 337412, "epoch": 2788} {"train_loss": -41.65119171142578, "global_step": 337413, "epoch": 2788} {"train_loss": -41.635589599609375, "global_step": 337414, "epoch": 2788} {"train_loss": -40.70697784423828, "global_step": 337415, "epoch": 2788} {"train_loss": -42.15214920043945, "global_step": 337416, "epoch": 2788} {"train_loss": -39.94866943359375, "global_step": 337417, "epoch": 2788} {"train_loss": -42.374813079833984, "global_step": 337418, "epoch": 2788} {"train_loss": -41.41239547729492, "global_step": 337419, "epoch": 2788} {"train_loss": -41.93830871582031, "global_step": 337420, "epoch": 2788} {"train_loss": -41.60270690917969, "global_step": 337421, "epoch": 2788} {"train_loss": -41.125389099121094, "global_step": 337422, "epoch": 2788} {"train_loss": -41.954505920410156, "global_step": 337423, "epoch": 2788} {"train_loss": -41.80280685424805, "global_step": 337424, "epoch": 2788} {"train_loss": -41.755401611328125, "global_step": 337425, "epoch": 2788} {"train_loss": -41.530025482177734, "global_step": 337426, "epoch": 2788} {"train_loss": -42.757781982421875, "global_step": 337427, "epoch": 2788} {"train_loss": -41.22024154663086, "global_step": 337428, "epoch": 2788} {"train_loss": -40.46577072143555, "global_step": 337429, "epoch": 2788} {"train_loss": -42.54523849487305, "global_step": 337430, "epoch": 2788} {"train_loss": -42.099491119384766, "global_step": 337431, "epoch": 2788} {"train_loss": -42.16767501831055, "global_step": 337432, "epoch": 2788} {"train_loss": -42.306514739990234, "global_step": 337433, "epoch": 2788} {"train_loss": -41.36255645751953, "global_step": 337434, "epoch": 2788} {"train_loss": -42.29151153564453, "global_step": 337435, "epoch": 2788} {"train_loss": -42.828853607177734, "global_step": 337436, "epoch": 2788} {"train_loss": -43.02212142944336, "global_step": 337437, "epoch": 2788} {"train_loss": -42.09556198120117, "global_step": 337438, "epoch": 2788} {"train_loss": -41.784217834472656, "global_step": 337439, "epoch": 2788} {"train_loss": -42.173152923583984, "global_step": 337440, "epoch": 2788} {"train_loss": -41.79769515991211, "global_step": 337441, "epoch": 2788} {"train_loss": -41.64876937866211, "global_step": 337442, "epoch": 2788} {"train_loss": -41.79952621459961, "global_step": 337443, "epoch": 2788} {"train_loss": -41.735877990722656, "global_step": 337444, "epoch": 2788} {"train_loss": -39.60187530517578, "global_step": 337445, "epoch": 2788} {"train_loss": -42.4874267578125, "global_step": 337446, "epoch": 2788} {"train_loss": -42.534332275390625, "global_step": 337447, "epoch": 2788} {"train_loss": -42.774715423583984, "global_step": 337448, "epoch": 2788} {"train_loss": -41.92878723144531, "global_step": 337449, "epoch": 2788} {"train_loss": -41.963321685791016, "global_step": 337450, "epoch": 2788} {"train_loss": -42.96001434326172, "global_step": 337451, "epoch": 2788} {"train_loss": -41.87746810913086, "global_step": 337452, "epoch": 2788} {"train_loss": -41.9687385559082, "global_step": 337453, "epoch": 2788} {"train_loss": -42.877113342285156, "global_step": 337454, "epoch": 2788} {"train_loss": -42.01919174194336, "global_step": 337455, "epoch": 2788} {"train_loss": -42.38818359375, "global_step": 337456, "epoch": 2788} {"train_loss": -41.978309631347656, "global_step": 337457, "epoch": 2788} {"train_loss": -41.9273681640625, "global_step": 337458, "epoch": 2788} {"train_loss": -42.86592483520508, "global_step": 337459, "epoch": 2788} {"train_loss": -42.91058349609375, "global_step": 337460, "epoch": 2788} {"train_loss": -41.547088623046875, "global_step": 337461, "epoch": 2788} {"train_loss": -41.96425247192383, "global_step": 337462, "epoch": 2788} {"train_loss": -43.00739669799805, "global_step": 337463, "epoch": 2788} {"train_loss": -42.78719711303711, "global_step": 337464, "epoch": 2788} {"train_loss": -39.88202667236328, "global_step": 337465, "epoch": 2788} {"train_loss": -42.86465072631836, "global_step": 337466, "epoch": 2788} {"train_loss": -42.43818283081055, "global_step": 337467, "epoch": 2788} {"train_loss": -40.79049490306003, "global_step": 337468, "epoch": 2788, "val_loss": 2591994.75} {"train_loss": -41.753604888916016, "global_step": 337469, "epoch": 2789} {"train_loss": -42.18024826049805, "global_step": 337470, "epoch": 2789} {"train_loss": -42.17898178100586, "global_step": 337471, "epoch": 2789} {"train_loss": -43.09558868408203, "global_step": 337472, "epoch": 2789} {"train_loss": -42.25294876098633, "global_step": 337473, "epoch": 2789} {"train_loss": -42.0863037109375, "global_step": 337474, "epoch": 2789} {"train_loss": -42.11355209350586, "global_step": 337475, "epoch": 2789} {"train_loss": -41.10725021362305, "global_step": 337476, "epoch": 2789} {"train_loss": -40.00904846191406, "global_step": 337477, "epoch": 2789} {"train_loss": -37.71830368041992, "global_step": 337478, "epoch": 2789} {"train_loss": -39.59670639038086, "global_step": 337479, "epoch": 2789} {"train_loss": -42.912322998046875, "global_step": 337480, "epoch": 2789} {"train_loss": -38.72068786621094, "global_step": 337481, "epoch": 2789} {"train_loss": -39.33707809448242, "global_step": 337482, "epoch": 2789} {"train_loss": -42.898983001708984, "global_step": 337483, "epoch": 2789} {"train_loss": -39.936214447021484, "global_step": 337484, "epoch": 2789} {"train_loss": -40.71415328979492, "global_step": 337485, "epoch": 2789} {"train_loss": -42.28486251831055, "global_step": 337486, "epoch": 2789} {"train_loss": -40.13235092163086, "global_step": 337487, "epoch": 2789} {"train_loss": -41.7458610534668, "global_step": 337488, "epoch": 2789} {"train_loss": -42.21220779418945, "global_step": 337489, "epoch": 2789} {"train_loss": -43.048152923583984, "global_step": 337490, "epoch": 2789} {"train_loss": -42.244571685791016, "global_step": 337491, "epoch": 2789} {"train_loss": -41.68769073486328, "global_step": 337492, "epoch": 2789} {"train_loss": -42.71286392211914, "global_step": 337493, "epoch": 2789} {"train_loss": -42.6981086730957, "global_step": 337494, "epoch": 2789} {"train_loss": -42.287479400634766, "global_step": 337495, "epoch": 2789} {"train_loss": -42.67144012451172, "global_step": 337496, "epoch": 2789} {"train_loss": -42.4994010925293, "global_step": 337497, "epoch": 2789} {"train_loss": -42.848052978515625, "global_step": 337498, "epoch": 2789} {"train_loss": -42.847957611083984, "global_step": 337499, "epoch": 2789} {"train_loss": -42.16901397705078, "global_step": 337500, "epoch": 2789} {"train_loss": -42.501075744628906, "global_step": 337501, "epoch": 2789} {"train_loss": -41.941261291503906, "global_step": 337502, "epoch": 2789} {"train_loss": -41.59941864013672, "global_step": 337503, "epoch": 2789} {"train_loss": -41.99030685424805, "global_step": 337504, "epoch": 2789} {"train_loss": -43.064876556396484, "global_step": 337505, "epoch": 2789} {"train_loss": -41.93279266357422, "global_step": 337506, "epoch": 2789} {"train_loss": -43.30230712890625, "global_step": 337507, "epoch": 2789} {"train_loss": -42.00302505493164, "global_step": 337508, "epoch": 2789} {"train_loss": -42.10491943359375, "global_step": 337509, "epoch": 2789} {"train_loss": -41.80826950073242, "global_step": 337510, "epoch": 2789} {"train_loss": -43.269588470458984, "global_step": 337511, "epoch": 2789} {"train_loss": -42.786399841308594, "global_step": 337512, "epoch": 2789} {"train_loss": -42.960235595703125, "global_step": 337513, "epoch": 2789} {"train_loss": -42.58002471923828, "global_step": 337514, "epoch": 2789} {"train_loss": -43.09661865234375, "global_step": 337515, "epoch": 2789} {"train_loss": -42.436279296875, "global_step": 337516, "epoch": 2789} {"train_loss": -43.399169921875, "global_step": 337517, "epoch": 2789} {"train_loss": -42.61509704589844, "global_step": 337518, "epoch": 2789} {"train_loss": -42.995452880859375, "global_step": 337519, "epoch": 2789} {"train_loss": -43.24300765991211, "global_step": 337520, "epoch": 2789} {"train_loss": -42.432769775390625, "global_step": 337521, "epoch": 2789} {"train_loss": -43.32990646362305, "global_step": 337522, "epoch": 2789} {"train_loss": -42.47520446777344, "global_step": 337523, "epoch": 2789} {"train_loss": -43.0663948059082, "global_step": 337524, "epoch": 2789} {"train_loss": -42.97409439086914, "global_step": 337525, "epoch": 2789} {"train_loss": -42.079917907714844, "global_step": 337526, "epoch": 2789} {"train_loss": -39.51249694824219, "global_step": 337527, "epoch": 2789} {"train_loss": -34.79353713989258, "global_step": 337528, "epoch": 2789} {"train_loss": -29.9708251953125, "global_step": 337529, "epoch": 2789} {"train_loss": -36.319496154785156, "global_step": 337530, "epoch": 2789} {"train_loss": -42.8198356628418, "global_step": 337531, "epoch": 2789} {"train_loss": -34.90907669067383, "global_step": 337532, "epoch": 2789} {"train_loss": -39.936885833740234, "global_step": 337533, "epoch": 2789} {"train_loss": -39.20964431762695, "global_step": 337534, "epoch": 2789} {"train_loss": -36.59442901611328, "global_step": 337535, "epoch": 2789} {"train_loss": -41.78294372558594, "global_step": 337536, "epoch": 2789} {"train_loss": -38.0867919921875, "global_step": 337537, "epoch": 2789} {"train_loss": -42.31318283081055, "global_step": 337538, "epoch": 2789} {"train_loss": -38.31593704223633, "global_step": 337539, "epoch": 2789} {"train_loss": -41.905086517333984, "global_step": 337540, "epoch": 2789} {"train_loss": -37.940032958984375, "global_step": 337541, "epoch": 2789} {"train_loss": -42.26826858520508, "global_step": 337542, "epoch": 2789} {"train_loss": -37.84358596801758, "global_step": 337543, "epoch": 2789} {"train_loss": -41.95325469970703, "global_step": 337544, "epoch": 2789} {"train_loss": -39.98170852661133, "global_step": 337545, "epoch": 2789} {"train_loss": -40.26353073120117, "global_step": 337546, "epoch": 2789} {"train_loss": -41.56489181518555, "global_step": 337547, "epoch": 2789} {"train_loss": -41.28809356689453, "global_step": 337548, "epoch": 2789} {"train_loss": -42.704627990722656, "global_step": 337549, "epoch": 2789} {"train_loss": -41.47994613647461, "global_step": 337550, "epoch": 2789} {"train_loss": -42.0286750793457, "global_step": 337551, "epoch": 2789} {"train_loss": -41.927772521972656, "global_step": 337552, "epoch": 2789} {"train_loss": -42.34489059448242, "global_step": 337553, "epoch": 2789} {"train_loss": -41.68621063232422, "global_step": 337554, "epoch": 2789} {"train_loss": -40.85883712768555, "global_step": 337555, "epoch": 2789} {"train_loss": -40.29879379272461, "global_step": 337556, "epoch": 2789} {"train_loss": -42.48011016845703, "global_step": 337557, "epoch": 2789} {"train_loss": -41.5904426574707, "global_step": 337558, "epoch": 2789} {"train_loss": -42.15570068359375, "global_step": 337559, "epoch": 2789} {"train_loss": -41.90690231323242, "global_step": 337560, "epoch": 2789} {"train_loss": -42.59731674194336, "global_step": 337561, "epoch": 2789} {"train_loss": -40.805416107177734, "global_step": 337562, "epoch": 2789} {"train_loss": -42.470794677734375, "global_step": 337563, "epoch": 2789} {"train_loss": -42.02268600463867, "global_step": 337564, "epoch": 2789} {"train_loss": -41.543678283691406, "global_step": 337565, "epoch": 2789} {"train_loss": -42.272090911865234, "global_step": 337566, "epoch": 2789} {"train_loss": -42.47987747192383, "global_step": 337567, "epoch": 2789} {"train_loss": -42.212257385253906, "global_step": 337568, "epoch": 2789} {"train_loss": -42.79034423828125, "global_step": 337569, "epoch": 2789} {"train_loss": -42.87492752075195, "global_step": 337570, "epoch": 2789} {"train_loss": -42.81018829345703, "global_step": 337571, "epoch": 2789} {"train_loss": -42.4801139831543, "global_step": 337572, "epoch": 2789} {"train_loss": -42.371578216552734, "global_step": 337573, "epoch": 2789} {"train_loss": -42.88228988647461, "global_step": 337574, "epoch": 2789} {"train_loss": -42.401573181152344, "global_step": 337575, "epoch": 2789} {"train_loss": -43.40655517578125, "global_step": 337576, "epoch": 2789} {"train_loss": -42.81679153442383, "global_step": 337577, "epoch": 2789} {"train_loss": -43.23067855834961, "global_step": 337578, "epoch": 2789} {"train_loss": -42.904518127441406, "global_step": 337579, "epoch": 2789} {"train_loss": -43.22412109375, "global_step": 337580, "epoch": 2789} {"train_loss": -43.3625602722168, "global_step": 337581, "epoch": 2789} {"train_loss": -43.053470611572266, "global_step": 337582, "epoch": 2789} {"train_loss": -42.149166107177734, "global_step": 337583, "epoch": 2789} {"train_loss": -43.11152267456055, "global_step": 337584, "epoch": 2789} {"train_loss": -43.37636184692383, "global_step": 337585, "epoch": 2789} {"train_loss": -42.81644821166992, "global_step": 337586, "epoch": 2789} {"train_loss": -43.214378356933594, "global_step": 337587, "epoch": 2789} {"train_loss": -43.259254455566406, "global_step": 337588, "epoch": 2789} {"train_loss": -41.655943184844716, "global_step": 337589, "epoch": 2789, "val_loss": 2609264.75} {"train_loss": -43.70044708251953, "global_step": 337590, "epoch": 2790} {"train_loss": -42.65925216674805, "global_step": 337591, "epoch": 2790} {"train_loss": -42.58871078491211, "global_step": 337592, "epoch": 2790} {"train_loss": -43.6513671875, "global_step": 337593, "epoch": 2790} {"train_loss": -43.125885009765625, "global_step": 337594, "epoch": 2790} {"train_loss": -42.2505989074707, "global_step": 337595, "epoch": 2790} {"train_loss": -43.044891357421875, "global_step": 337596, "epoch": 2790} {"train_loss": -43.55128860473633, "global_step": 337597, "epoch": 2790} {"train_loss": -43.45685577392578, "global_step": 337598, "epoch": 2790} {"train_loss": -43.93522644042969, "global_step": 337599, "epoch": 2790} {"train_loss": -43.55522918701172, "global_step": 337600, "epoch": 2790} {"train_loss": -43.59886932373047, "global_step": 337601, "epoch": 2790} {"train_loss": -43.83645248413086, "global_step": 337602, "epoch": 2790} {"train_loss": -41.15048599243164, "global_step": 337603, "epoch": 2790} {"train_loss": -43.66375732421875, "global_step": 337604, "epoch": 2790} {"train_loss": -43.8026237487793, "global_step": 337605, "epoch": 2790} {"train_loss": -43.71273422241211, "global_step": 337606, "epoch": 2790} {"train_loss": -44.1614875793457, "global_step": 337607, "epoch": 2790} {"train_loss": -43.615882873535156, "global_step": 337608, "epoch": 2790} {"train_loss": -43.99320602416992, "global_step": 337609, "epoch": 2790} {"train_loss": -43.33513641357422, "global_step": 337610, "epoch": 2790} {"train_loss": -43.36606979370117, "global_step": 337611, "epoch": 2790} {"train_loss": -42.76852035522461, "global_step": 337612, "epoch": 2790} {"train_loss": -41.93192672729492, "global_step": 337613, "epoch": 2790} {"train_loss": -43.42483139038086, "global_step": 337614, "epoch": 2790} {"train_loss": -44.13056564331055, "global_step": 337615, "epoch": 2790} {"train_loss": -42.57442092895508, "global_step": 337616, "epoch": 2790} {"train_loss": -42.97249221801758, "global_step": 337617, "epoch": 2790} {"train_loss": -41.31561279296875, "global_step": 337618, "epoch": 2790} {"train_loss": -40.2541389465332, "global_step": 337619, "epoch": 2790} {"train_loss": -40.054195404052734, "global_step": 337620, "epoch": 2790} {"train_loss": -34.79362487792969, "global_step": 337621, "epoch": 2790} {"train_loss": -38.170040130615234, "global_step": 337622, "epoch": 2790} {"train_loss": -40.460060119628906, "global_step": 337623, "epoch": 2790} {"train_loss": -40.582069396972656, "global_step": 337624, "epoch": 2790} {"train_loss": -39.416297912597656, "global_step": 337625, "epoch": 2790} {"train_loss": -34.228118896484375, "global_step": 337626, "epoch": 2790} {"train_loss": -40.528995513916016, "global_step": 337627, "epoch": 2790} {"train_loss": -38.843624114990234, "global_step": 337628, "epoch": 2790} {"train_loss": -33.21775436401367, "global_step": 337629, "epoch": 2790} {"train_loss": -29.79633903503418, "global_step": 337630, "epoch": 2790} {"train_loss": -36.60993194580078, "global_step": 337631, "epoch": 2790} {"train_loss": -30.245038986206055, "global_step": 337632, "epoch": 2790} {"train_loss": -38.57401657104492, "global_step": 337633, "epoch": 2790} {"train_loss": -33.55792236328125, "global_step": 337634, "epoch": 2790} {"train_loss": -35.338043212890625, "global_step": 337635, "epoch": 2790} {"train_loss": -35.9075813293457, "global_step": 337636, "epoch": 2790} {"train_loss": -36.06578063964844, "global_step": 337637, "epoch": 2790} {"train_loss": -36.289794921875, "global_step": 337638, "epoch": 2790} {"train_loss": -36.81362533569336, "global_step": 337639, "epoch": 2790} {"train_loss": -37.4200325012207, "global_step": 337640, "epoch": 2790} {"train_loss": -38.8784065246582, "global_step": 337641, "epoch": 2790} {"train_loss": -39.645755767822266, "global_step": 337642, "epoch": 2790} {"train_loss": -38.18491744995117, "global_step": 337643, "epoch": 2790} {"train_loss": -38.952816009521484, "global_step": 337644, "epoch": 2790} {"train_loss": -37.50150680541992, "global_step": 337645, "epoch": 2790} {"train_loss": -40.921504974365234, "global_step": 337646, "epoch": 2790} {"train_loss": -38.43516540527344, "global_step": 337647, "epoch": 2790} {"train_loss": -41.2033805847168, "global_step": 337648, "epoch": 2790} {"train_loss": -40.56200408935547, "global_step": 337649, "epoch": 2790} {"train_loss": -40.278907775878906, "global_step": 337650, "epoch": 2790} {"train_loss": -40.72549057006836, "global_step": 337651, "epoch": 2790} {"train_loss": -39.98414993286133, "global_step": 337652, "epoch": 2790} {"train_loss": -37.089725494384766, "global_step": 337653, "epoch": 2790} {"train_loss": -41.13154220581055, "global_step": 337654, "epoch": 2790} {"train_loss": -41.14701461791992, "global_step": 337655, "epoch": 2790} {"train_loss": -40.9866828918457, "global_step": 337656, "epoch": 2790} {"train_loss": -41.25698471069336, "global_step": 337657, "epoch": 2790} {"train_loss": -41.420318603515625, "global_step": 337658, "epoch": 2790} {"train_loss": -41.887046813964844, "global_step": 337659, "epoch": 2790} {"train_loss": -41.25006866455078, "global_step": 337660, "epoch": 2790} {"train_loss": -39.026973724365234, "global_step": 337661, "epoch": 2790} {"train_loss": -40.18960189819336, "global_step": 337662, "epoch": 2790} {"train_loss": -40.38017654418945, "global_step": 337663, "epoch": 2790} {"train_loss": -41.18927764892578, "global_step": 337664, "epoch": 2790} {"train_loss": -41.15481185913086, "global_step": 337665, "epoch": 2790} {"train_loss": -38.874794006347656, "global_step": 337666, "epoch": 2790} {"train_loss": -41.664833068847656, "global_step": 337667, "epoch": 2790} {"train_loss": -40.86903381347656, "global_step": 337668, "epoch": 2790} {"train_loss": -41.41963195800781, "global_step": 337669, "epoch": 2790} {"train_loss": -41.50028991699219, "global_step": 337670, "epoch": 2790} {"train_loss": -41.92008590698242, "global_step": 337671, "epoch": 2790} {"train_loss": -41.397396087646484, "global_step": 337672, "epoch": 2790} {"train_loss": -41.1474723815918, "global_step": 337673, "epoch": 2790} {"train_loss": -41.9218635559082, "global_step": 337674, "epoch": 2790} {"train_loss": -41.729671478271484, "global_step": 337675, "epoch": 2790} {"train_loss": -41.567665100097656, "global_step": 337676, "epoch": 2790} {"train_loss": -41.814178466796875, "global_step": 337677, "epoch": 2790} {"train_loss": -41.188289642333984, "global_step": 337678, "epoch": 2790} {"train_loss": -42.36684036254883, "global_step": 337679, "epoch": 2790} {"train_loss": -42.14346694946289, "global_step": 337680, "epoch": 2790} {"train_loss": -41.20806884765625, "global_step": 337681, "epoch": 2790} {"train_loss": -41.007545471191406, "global_step": 337682, "epoch": 2790} {"train_loss": -42.179439544677734, "global_step": 337683, "epoch": 2790} {"train_loss": -41.93415451049805, "global_step": 337684, "epoch": 2790} {"train_loss": -41.021385192871094, "global_step": 337685, "epoch": 2790} {"train_loss": -42.28705978393555, "global_step": 337686, "epoch": 2790} {"train_loss": -41.715309143066406, "global_step": 337687, "epoch": 2790} {"train_loss": -42.29621887207031, "global_step": 337688, "epoch": 2790} {"train_loss": -42.5681266784668, "global_step": 337689, "epoch": 2790} {"train_loss": -42.280029296875, "global_step": 337690, "epoch": 2790} {"train_loss": -43.105411529541016, "global_step": 337691, "epoch": 2790} {"train_loss": -42.793548583984375, "global_step": 337692, "epoch": 2790} {"train_loss": -43.14943313598633, "global_step": 337693, "epoch": 2790} {"train_loss": -41.60256576538086, "global_step": 337694, "epoch": 2790} {"train_loss": -42.490779876708984, "global_step": 337695, "epoch": 2790} {"train_loss": -42.8903923034668, "global_step": 337696, "epoch": 2790} {"train_loss": -41.54473876953125, "global_step": 337697, "epoch": 2790} {"train_loss": -42.99101638793945, "global_step": 337698, "epoch": 2790} {"train_loss": -42.58967971801758, "global_step": 337699, "epoch": 2790} {"train_loss": -42.2927131652832, "global_step": 337700, "epoch": 2790} {"train_loss": -41.958160400390625, "global_step": 337701, "epoch": 2790} {"train_loss": -41.53053283691406, "global_step": 337702, "epoch": 2790} {"train_loss": -42.027076721191406, "global_step": 337703, "epoch": 2790} {"train_loss": -43.3465576171875, "global_step": 337704, "epoch": 2790} {"train_loss": -43.40713119506836, "global_step": 337705, "epoch": 2790} {"train_loss": -42.83811950683594, "global_step": 337706, "epoch": 2790} {"train_loss": -42.74365997314453, "global_step": 337707, "epoch": 2790} {"train_loss": -42.81190872192383, "global_step": 337708, "epoch": 2790} {"train_loss": -43.41244125366211, "global_step": 337709, "epoch": 2790} {"train_loss": -40.957799170628064, "global_step": 337710, "epoch": 2790, "val_loss": 2693660.75} {"train_loss": -43.357032775878906, "global_step": 337711, "epoch": 2791} {"train_loss": -42.237091064453125, "global_step": 337712, "epoch": 2791} {"train_loss": -41.5072135925293, "global_step": 337713, "epoch": 2791} {"train_loss": -43.70536422729492, "global_step": 337714, "epoch": 2791} {"train_loss": -43.339473724365234, "global_step": 337715, "epoch": 2791} {"train_loss": -43.08900451660156, "global_step": 337716, "epoch": 2791} {"train_loss": -42.557716369628906, "global_step": 337717, "epoch": 2791} {"train_loss": -43.53711700439453, "global_step": 337718, "epoch": 2791} {"train_loss": -43.42572021484375, "global_step": 337719, "epoch": 2791} {"train_loss": -43.631935119628906, "global_step": 337720, "epoch": 2791} {"train_loss": -43.56382751464844, "global_step": 337721, "epoch": 2791} {"train_loss": -43.18259811401367, "global_step": 337722, "epoch": 2791} {"train_loss": -41.671485900878906, "global_step": 337723, "epoch": 2791} {"train_loss": -43.58498001098633, "global_step": 337724, "epoch": 2791} {"train_loss": -43.035945892333984, "global_step": 337725, "epoch": 2791} {"train_loss": -43.60560989379883, "global_step": 337726, "epoch": 2791} {"train_loss": -43.042903900146484, "global_step": 337727, "epoch": 2791} {"train_loss": -43.57176971435547, "global_step": 337728, "epoch": 2791} {"train_loss": -42.9196891784668, "global_step": 337729, "epoch": 2791} {"train_loss": -43.85641098022461, "global_step": 337730, "epoch": 2791} {"train_loss": -44.118316650390625, "global_step": 337731, "epoch": 2791} {"train_loss": -44.27204895019531, "global_step": 337732, "epoch": 2791} {"train_loss": -43.554359436035156, "global_step": 337733, "epoch": 2791} {"train_loss": -43.23043441772461, "global_step": 337734, "epoch": 2791} {"train_loss": -43.35121536254883, "global_step": 337735, "epoch": 2791} {"train_loss": -43.35697937011719, "global_step": 337736, "epoch": 2791} {"train_loss": -43.81789016723633, "global_step": 337737, "epoch": 2791} {"train_loss": -43.18347930908203, "global_step": 337738, "epoch": 2791} {"train_loss": -43.20640182495117, "global_step": 337739, "epoch": 2791} {"train_loss": -44.29361343383789, "global_step": 337740, "epoch": 2791} {"train_loss": -43.163330078125, "global_step": 337741, "epoch": 2791} {"train_loss": -43.918479919433594, "global_step": 337742, "epoch": 2791} {"train_loss": -41.9014892578125, "global_step": 337743, "epoch": 2791} {"train_loss": -41.162322998046875, "global_step": 337744, "epoch": 2791} {"train_loss": -42.74294662475586, "global_step": 337745, "epoch": 2791} {"train_loss": -42.07624816894531, "global_step": 337746, "epoch": 2791} {"train_loss": -42.531307220458984, "global_step": 337747, "epoch": 2791} {"train_loss": -44.2638053894043, "global_step": 337748, "epoch": 2791} {"train_loss": -43.47768783569336, "global_step": 337749, "epoch": 2791} {"train_loss": -43.519039154052734, "global_step": 337750, "epoch": 2791} {"train_loss": -43.24898147583008, "global_step": 337751, "epoch": 2791} {"train_loss": -41.431087493896484, "global_step": 337752, "epoch": 2791} {"train_loss": -43.730770111083984, "global_step": 337753, "epoch": 2791} {"train_loss": -43.61109924316406, "global_step": 337754, "epoch": 2791} {"train_loss": -43.52958297729492, "global_step": 337755, "epoch": 2791} {"train_loss": -42.61441421508789, "global_step": 337756, "epoch": 2791} {"train_loss": -33.10847854614258, "global_step": 337757, "epoch": 2791} {"train_loss": -42.73930740356445, "global_step": 337758, "epoch": 2791} {"train_loss": -43.50014114379883, "global_step": 337759, "epoch": 2791} {"train_loss": -41.783935546875, "global_step": 337760, "epoch": 2791} {"train_loss": -42.16236877441406, "global_step": 337761, "epoch": 2791} {"train_loss": -42.317955017089844, "global_step": 337762, "epoch": 2791} {"train_loss": -40.78335189819336, "global_step": 337763, "epoch": 2791} {"train_loss": -40.05278396606445, "global_step": 337764, "epoch": 2791} {"train_loss": -42.93351364135742, "global_step": 337765, "epoch": 2791} {"train_loss": -42.072269439697266, "global_step": 337766, "epoch": 2791} {"train_loss": -42.473976135253906, "global_step": 337767, "epoch": 2791} {"train_loss": -42.84973907470703, "global_step": 337768, "epoch": 2791} {"train_loss": -42.36257553100586, "global_step": 337769, "epoch": 2791} {"train_loss": -43.262943267822266, "global_step": 337770, "epoch": 2791} {"train_loss": -42.586669921875, "global_step": 337771, "epoch": 2791} {"train_loss": -42.41608428955078, "global_step": 337772, "epoch": 2791} {"train_loss": -43.145416259765625, "global_step": 337773, "epoch": 2791} {"train_loss": -42.94905090332031, "global_step": 337774, "epoch": 2791} {"train_loss": -43.10565185546875, "global_step": 337775, "epoch": 2791} {"train_loss": -42.998226165771484, "global_step": 337776, "epoch": 2791} {"train_loss": -42.85261917114258, "global_step": 337777, "epoch": 2791} {"train_loss": -43.382015228271484, "global_step": 337778, "epoch": 2791} {"train_loss": -42.86123275756836, "global_step": 337779, "epoch": 2791} {"train_loss": -41.90813064575195, "global_step": 337780, "epoch": 2791} {"train_loss": -41.20817184448242, "global_step": 337781, "epoch": 2791} {"train_loss": -41.51140213012695, "global_step": 337782, "epoch": 2791} {"train_loss": -42.96210861206055, "global_step": 337783, "epoch": 2791} {"train_loss": -39.648006439208984, "global_step": 337784, "epoch": 2791} {"train_loss": -38.69474411010742, "global_step": 337785, "epoch": 2791} {"train_loss": -42.55879592895508, "global_step": 337786, "epoch": 2791} {"train_loss": -36.50303649902344, "global_step": 337787, "epoch": 2791} {"train_loss": -41.891822814941406, "global_step": 337788, "epoch": 2791} {"train_loss": -40.87136459350586, "global_step": 337789, "epoch": 2791} {"train_loss": -41.98588180541992, "global_step": 337790, "epoch": 2791} {"train_loss": -42.29050827026367, "global_step": 337791, "epoch": 2791} {"train_loss": -41.03342819213867, "global_step": 337792, "epoch": 2791} {"train_loss": -42.7085075378418, "global_step": 337793, "epoch": 2791} {"train_loss": -40.87211227416992, "global_step": 337794, "epoch": 2791} {"train_loss": -41.3394889831543, "global_step": 337795, "epoch": 2791} {"train_loss": -42.3053092956543, "global_step": 337796, "epoch": 2791} {"train_loss": -41.92548751831055, "global_step": 337797, "epoch": 2791} {"train_loss": -41.55521774291992, "global_step": 337798, "epoch": 2791} {"train_loss": -41.060054779052734, "global_step": 337799, "epoch": 2791} {"train_loss": -38.28060531616211, "global_step": 337800, "epoch": 2791} {"train_loss": -42.381099700927734, "global_step": 337801, "epoch": 2791} {"train_loss": -41.36996078491211, "global_step": 337802, "epoch": 2791} {"train_loss": -41.25124740600586, "global_step": 337803, "epoch": 2791} {"train_loss": -42.18996810913086, "global_step": 337804, "epoch": 2791} {"train_loss": -42.12295150756836, "global_step": 337805, "epoch": 2791} {"train_loss": -41.06764602661133, "global_step": 337806, "epoch": 2791} {"train_loss": -41.54718017578125, "global_step": 337807, "epoch": 2791} {"train_loss": -41.434242248535156, "global_step": 337808, "epoch": 2791} {"train_loss": -39.46613693237305, "global_step": 337809, "epoch": 2791} {"train_loss": -42.04997634887695, "global_step": 337810, "epoch": 2791} {"train_loss": -38.50613784790039, "global_step": 337811, "epoch": 2791} {"train_loss": -41.67399215698242, "global_step": 337812, "epoch": 2791} {"train_loss": -41.98674392700195, "global_step": 337813, "epoch": 2791} {"train_loss": -40.701751708984375, "global_step": 337814, "epoch": 2791} {"train_loss": -42.50107955932617, "global_step": 337815, "epoch": 2791} {"train_loss": -41.613197326660156, "global_step": 337816, "epoch": 2791} {"train_loss": -42.020538330078125, "global_step": 337817, "epoch": 2791} {"train_loss": -41.21430206298828, "global_step": 337818, "epoch": 2791} {"train_loss": -41.79557418823242, "global_step": 337819, "epoch": 2791} {"train_loss": -40.534358978271484, "global_step": 337820, "epoch": 2791} {"train_loss": -42.31787109375, "global_step": 337821, "epoch": 2791} {"train_loss": -42.11944580078125, "global_step": 337822, "epoch": 2791} {"train_loss": -40.54685592651367, "global_step": 337823, "epoch": 2791} {"train_loss": -42.40800857543945, "global_step": 337824, "epoch": 2791} {"train_loss": -40.84444808959961, "global_step": 337825, "epoch": 2791} {"train_loss": -41.62420654296875, "global_step": 337826, "epoch": 2791} {"train_loss": -42.5243034362793, "global_step": 337827, "epoch": 2791} {"train_loss": -39.85490417480469, "global_step": 337828, "epoch": 2791} {"train_loss": -41.2195930480957, "global_step": 337829, "epoch": 2791} {"train_loss": -41.24019241333008, "global_step": 337830, "epoch": 2791} {"train_loss": -42.14507205427186, "global_step": 337831, "epoch": 2791, "val_loss": 2490856.25} {"train_loss": -40.22138214111328, "global_step": 337832, "epoch": 2792} {"train_loss": -41.5296630859375, "global_step": 337833, "epoch": 2792} {"train_loss": -41.980445861816406, "global_step": 337834, "epoch": 2792} {"train_loss": -42.523921966552734, "global_step": 337835, "epoch": 2792} {"train_loss": -42.02800369262695, "global_step": 337836, "epoch": 2792} {"train_loss": -42.111595153808594, "global_step": 337837, "epoch": 2792} {"train_loss": -40.80277633666992, "global_step": 337838, "epoch": 2792} {"train_loss": -39.09928512573242, "global_step": 337839, "epoch": 2792} {"train_loss": -42.025917053222656, "global_step": 337840, "epoch": 2792} {"train_loss": -40.38093948364258, "global_step": 337841, "epoch": 2792} {"train_loss": -41.453269958496094, "global_step": 337842, "epoch": 2792} {"train_loss": -42.85543441772461, "global_step": 337843, "epoch": 2792} {"train_loss": -40.882423400878906, "global_step": 337844, "epoch": 2792} {"train_loss": -42.46035385131836, "global_step": 337845, "epoch": 2792} {"train_loss": -42.06440353393555, "global_step": 337846, "epoch": 2792} {"train_loss": -42.279170989990234, "global_step": 337847, "epoch": 2792} {"train_loss": -41.84617614746094, "global_step": 337848, "epoch": 2792} {"train_loss": -41.17367172241211, "global_step": 337849, "epoch": 2792} {"train_loss": -42.3937873840332, "global_step": 337850, "epoch": 2792} {"train_loss": -41.46135711669922, "global_step": 337851, "epoch": 2792} {"train_loss": -41.66207504272461, "global_step": 337852, "epoch": 2792} {"train_loss": -40.2238655090332, "global_step": 337853, "epoch": 2792} {"train_loss": -41.9383544921875, "global_step": 337854, "epoch": 2792} {"train_loss": -42.94019317626953, "global_step": 337855, "epoch": 2792} {"train_loss": -41.7057991027832, "global_step": 337856, "epoch": 2792} {"train_loss": -41.905433654785156, "global_step": 337857, "epoch": 2792} {"train_loss": -41.0858268737793, "global_step": 337858, "epoch": 2792} {"train_loss": -42.47237014770508, "global_step": 337859, "epoch": 2792} {"train_loss": -40.570125579833984, "global_step": 337860, "epoch": 2792} {"train_loss": -42.1291618347168, "global_step": 337861, "epoch": 2792} {"train_loss": -42.86164093017578, "global_step": 337862, "epoch": 2792} {"train_loss": -40.99890899658203, "global_step": 337863, "epoch": 2792} {"train_loss": -41.46836853027344, "global_step": 337864, "epoch": 2792} {"train_loss": -42.80628967285156, "global_step": 337865, "epoch": 2792} {"train_loss": -41.516658782958984, "global_step": 337866, "epoch": 2792} {"train_loss": -41.576194763183594, "global_step": 337867, "epoch": 2792} {"train_loss": -40.38277816772461, "global_step": 337868, "epoch": 2792} {"train_loss": -41.768760681152344, "global_step": 337869, "epoch": 2792} {"train_loss": -42.58963394165039, "global_step": 337870, "epoch": 2792} {"train_loss": -39.22428894042969, "global_step": 337871, "epoch": 2792} {"train_loss": -42.13998794555664, "global_step": 337872, "epoch": 2792} {"train_loss": -41.545753479003906, "global_step": 337873, "epoch": 2792} {"train_loss": -40.668209075927734, "global_step": 337874, "epoch": 2792} {"train_loss": -42.90092086791992, "global_step": 337875, "epoch": 2792} {"train_loss": -42.18082809448242, "global_step": 337876, "epoch": 2792} {"train_loss": -41.298004150390625, "global_step": 337877, "epoch": 2792} {"train_loss": -42.711021423339844, "global_step": 337878, "epoch": 2792} {"train_loss": -40.82954788208008, "global_step": 337879, "epoch": 2792} {"train_loss": -42.04949951171875, "global_step": 337880, "epoch": 2792} {"train_loss": -43.19560623168945, "global_step": 337881, "epoch": 2792} {"train_loss": -42.529640197753906, "global_step": 337882, "epoch": 2792} {"train_loss": -41.835426330566406, "global_step": 337883, "epoch": 2792} {"train_loss": -40.55091094970703, "global_step": 337884, "epoch": 2792} {"train_loss": -40.5992546081543, "global_step": 337885, "epoch": 2792} {"train_loss": -40.767520904541016, "global_step": 337886, "epoch": 2792} {"train_loss": -42.491878509521484, "global_step": 337887, "epoch": 2792} {"train_loss": -41.95370101928711, "global_step": 337888, "epoch": 2792} {"train_loss": -41.21235275268555, "global_step": 337889, "epoch": 2792} {"train_loss": -39.5313835144043, "global_step": 337890, "epoch": 2792} {"train_loss": -41.78931427001953, "global_step": 337891, "epoch": 2792} {"train_loss": -41.497806549072266, "global_step": 337892, "epoch": 2792} {"train_loss": -40.94613265991211, "global_step": 337893, "epoch": 2792} {"train_loss": -42.79339599609375, "global_step": 337894, "epoch": 2792} {"train_loss": -42.62362289428711, "global_step": 337895, "epoch": 2792} {"train_loss": -40.48893737792969, "global_step": 337896, "epoch": 2792} {"train_loss": -38.38505172729492, "global_step": 337897, "epoch": 2792} {"train_loss": -41.22494888305664, "global_step": 337898, "epoch": 2792} {"train_loss": -41.75745391845703, "global_step": 337899, "epoch": 2792} {"train_loss": -42.31113815307617, "global_step": 337900, "epoch": 2792} {"train_loss": -40.711788177490234, "global_step": 337901, "epoch": 2792} {"train_loss": -40.77523422241211, "global_step": 337902, "epoch": 2792} {"train_loss": -42.63217544555664, "global_step": 337903, "epoch": 2792} {"train_loss": -40.502418518066406, "global_step": 337904, "epoch": 2792} {"train_loss": -42.76314163208008, "global_step": 337905, "epoch": 2792} {"train_loss": -37.97089767456055, "global_step": 337906, "epoch": 2792} {"train_loss": -41.75368881225586, "global_step": 337907, "epoch": 2792} {"train_loss": -38.11935043334961, "global_step": 337908, "epoch": 2792} {"train_loss": -41.08152770996094, "global_step": 337909, "epoch": 2792} {"train_loss": -42.00558090209961, "global_step": 337910, "epoch": 2792} {"train_loss": -39.76533126831055, "global_step": 337911, "epoch": 2792} {"train_loss": -41.26678466796875, "global_step": 337912, "epoch": 2792} {"train_loss": -41.80939865112305, "global_step": 337913, "epoch": 2792} {"train_loss": -40.44599533081055, "global_step": 337914, "epoch": 2792} {"train_loss": -39.27338790893555, "global_step": 337915, "epoch": 2792} {"train_loss": -41.96656799316406, "global_step": 337916, "epoch": 2792} {"train_loss": -42.01304244995117, "global_step": 337917, "epoch": 2792} {"train_loss": -41.13789367675781, "global_step": 337918, "epoch": 2792} {"train_loss": -34.444801330566406, "global_step": 337919, "epoch": 2792} {"train_loss": -40.900299072265625, "global_step": 337920, "epoch": 2792} {"train_loss": -40.14437484741211, "global_step": 337921, "epoch": 2792} {"train_loss": -38.9558219909668, "global_step": 337922, "epoch": 2792} {"train_loss": -41.1512451171875, "global_step": 337923, "epoch": 2792} {"train_loss": -39.31588363647461, "global_step": 337924, "epoch": 2792} {"train_loss": -42.43195724487305, "global_step": 337925, "epoch": 2792} {"train_loss": -40.77685546875, "global_step": 337926, "epoch": 2792} {"train_loss": -41.40538787841797, "global_step": 337927, "epoch": 2792} {"train_loss": -41.325191497802734, "global_step": 337928, "epoch": 2792} {"train_loss": -42.00300979614258, "global_step": 337929, "epoch": 2792} {"train_loss": -40.3965950012207, "global_step": 337930, "epoch": 2792} {"train_loss": -42.3246955871582, "global_step": 337931, "epoch": 2792} {"train_loss": -40.95083999633789, "global_step": 337932, "epoch": 2792} {"train_loss": -42.3234977722168, "global_step": 337933, "epoch": 2792} {"train_loss": -39.8244743347168, "global_step": 337934, "epoch": 2792} {"train_loss": -42.03712844848633, "global_step": 337935, "epoch": 2792} {"train_loss": -41.229122161865234, "global_step": 337936, "epoch": 2792} {"train_loss": -41.59747314453125, "global_step": 337937, "epoch": 2792} {"train_loss": -40.51910400390625, "global_step": 337938, "epoch": 2792} {"train_loss": -42.05941390991211, "global_step": 337939, "epoch": 2792} {"train_loss": -41.215362548828125, "global_step": 337940, "epoch": 2792} {"train_loss": -40.830116271972656, "global_step": 337941, "epoch": 2792} {"train_loss": -40.98575973510742, "global_step": 337942, "epoch": 2792} {"train_loss": -41.12649154663086, "global_step": 337943, "epoch": 2792} {"train_loss": -42.49639129638672, "global_step": 337944, "epoch": 2792} {"train_loss": -42.15403366088867, "global_step": 337945, "epoch": 2792} {"train_loss": -42.33556365966797, "global_step": 337946, "epoch": 2792} {"train_loss": -42.216957092285156, "global_step": 337947, "epoch": 2792} {"train_loss": -41.843570709228516, "global_step": 337948, "epoch": 2792} {"train_loss": -42.10490036010742, "global_step": 337949, "epoch": 2792} {"train_loss": -41.560546875, "global_step": 337950, "epoch": 2792} {"train_loss": -42.828975677490234, "global_step": 337951, "epoch": 2792} {"train_loss": -41.35938108459977, "global_step": 337952, "epoch": 2792, "val_loss": 2610760.75} {"train_loss": -42.82270431518555, "global_step": 337953, "epoch": 2793} {"train_loss": -42.58223342895508, "global_step": 337954, "epoch": 2793} {"train_loss": -42.21774673461914, "global_step": 337955, "epoch": 2793} {"train_loss": -42.3416633605957, "global_step": 337956, "epoch": 2793} {"train_loss": -42.545772552490234, "global_step": 337957, "epoch": 2793} {"train_loss": -41.88279342651367, "global_step": 337958, "epoch": 2793} {"train_loss": -42.501502990722656, "global_step": 337959, "epoch": 2793} {"train_loss": -41.91886520385742, "global_step": 337960, "epoch": 2793} {"train_loss": -42.58147048950195, "global_step": 337961, "epoch": 2793} {"train_loss": -42.88776779174805, "global_step": 337962, "epoch": 2793} {"train_loss": -42.395137786865234, "global_step": 337963, "epoch": 2793} {"train_loss": -41.787139892578125, "global_step": 337964, "epoch": 2793} {"train_loss": -43.205909729003906, "global_step": 337965, "epoch": 2793} {"train_loss": -41.85772705078125, "global_step": 337966, "epoch": 2793} {"train_loss": -41.660797119140625, "global_step": 337967, "epoch": 2793} {"train_loss": -42.48381805419922, "global_step": 337968, "epoch": 2793} {"train_loss": -42.28224182128906, "global_step": 337969, "epoch": 2793} {"train_loss": -40.99578857421875, "global_step": 337970, "epoch": 2793} {"train_loss": -42.355506896972656, "global_step": 337971, "epoch": 2793} {"train_loss": -41.17422103881836, "global_step": 337972, "epoch": 2793} {"train_loss": -40.86238479614258, "global_step": 337973, "epoch": 2793} {"train_loss": -42.65847396850586, "global_step": 337974, "epoch": 2793} {"train_loss": -41.67655563354492, "global_step": 337975, "epoch": 2793} {"train_loss": -42.9290771484375, "global_step": 337976, "epoch": 2793} {"train_loss": -41.749874114990234, "global_step": 337977, "epoch": 2793} {"train_loss": -42.24796676635742, "global_step": 337978, "epoch": 2793} {"train_loss": -42.62968063354492, "global_step": 337979, "epoch": 2793} {"train_loss": -42.64192581176758, "global_step": 337980, "epoch": 2793} {"train_loss": -41.36509323120117, "global_step": 337981, "epoch": 2793} {"train_loss": -41.754600524902344, "global_step": 337982, "epoch": 2793} {"train_loss": -43.086002349853516, "global_step": 337983, "epoch": 2793} {"train_loss": -42.320899963378906, "global_step": 337984, "epoch": 2793} {"train_loss": -42.87424850463867, "global_step": 337985, "epoch": 2793} {"train_loss": -41.91130447387695, "global_step": 337986, "epoch": 2793} {"train_loss": -42.34419631958008, "global_step": 337987, "epoch": 2793} {"train_loss": -42.755577087402344, "global_step": 337988, "epoch": 2793} {"train_loss": -41.503173828125, "global_step": 337989, "epoch": 2793} {"train_loss": -42.17435836791992, "global_step": 337990, "epoch": 2793} {"train_loss": -42.59961700439453, "global_step": 337991, "epoch": 2793} {"train_loss": -42.415931701660156, "global_step": 337992, "epoch": 2793} {"train_loss": -41.84953689575195, "global_step": 337993, "epoch": 2793} {"train_loss": -42.1493034362793, "global_step": 337994, "epoch": 2793} {"train_loss": -42.962066650390625, "global_step": 337995, "epoch": 2793} {"train_loss": -42.34907150268555, "global_step": 337996, "epoch": 2793} {"train_loss": -41.92496871948242, "global_step": 337997, "epoch": 2793} {"train_loss": -43.03062057495117, "global_step": 337998, "epoch": 2793} {"train_loss": -42.22114944458008, "global_step": 337999, "epoch": 2793} {"train_loss": -42.810890197753906, "global_step": 338000, "epoch": 2793} {"train_loss": -42.86740493774414, "global_step": 338001, "epoch": 2793} {"train_loss": -41.608619689941406, "global_step": 338002, "epoch": 2793} {"train_loss": -42.68587875366211, "global_step": 338003, "epoch": 2793} {"train_loss": -42.44890213012695, "global_step": 338004, "epoch": 2793} {"train_loss": -42.033992767333984, "global_step": 338005, "epoch": 2793} {"train_loss": -43.04156494140625, "global_step": 338006, "epoch": 2793} {"train_loss": -41.85946273803711, "global_step": 338007, "epoch": 2793} {"train_loss": -41.330299377441406, "global_step": 338008, "epoch": 2793} {"train_loss": -42.3150749206543, "global_step": 338009, "epoch": 2793} {"train_loss": -42.72560119628906, "global_step": 338010, "epoch": 2793} {"train_loss": -42.18208694458008, "global_step": 338011, "epoch": 2793} {"train_loss": -43.3177604675293, "global_step": 338012, "epoch": 2793} {"train_loss": -41.81314468383789, "global_step": 338013, "epoch": 2793} {"train_loss": -41.859622955322266, "global_step": 338014, "epoch": 2793} {"train_loss": -42.72029495239258, "global_step": 338015, "epoch": 2793} {"train_loss": -42.058265686035156, "global_step": 338016, "epoch": 2793} {"train_loss": -41.98716354370117, "global_step": 338017, "epoch": 2793} {"train_loss": -43.73708724975586, "global_step": 338018, "epoch": 2793} {"train_loss": -42.21357345581055, "global_step": 338019, "epoch": 2793} {"train_loss": -43.441558837890625, "global_step": 338020, "epoch": 2793} {"train_loss": -42.6958122253418, "global_step": 338021, "epoch": 2793} {"train_loss": -43.17104721069336, "global_step": 338022, "epoch": 2793} {"train_loss": -42.1662483215332, "global_step": 338023, "epoch": 2793} {"train_loss": -43.405086517333984, "global_step": 338024, "epoch": 2793} {"train_loss": -43.2649040222168, "global_step": 338025, "epoch": 2793} {"train_loss": -43.05037307739258, "global_step": 338026, "epoch": 2793} {"train_loss": -43.02653884887695, "global_step": 338027, "epoch": 2793} {"train_loss": -43.27479553222656, "global_step": 338028, "epoch": 2793} {"train_loss": -43.33441925048828, "global_step": 338029, "epoch": 2793} {"train_loss": -42.365264892578125, "global_step": 338030, "epoch": 2793} {"train_loss": -43.41447830200195, "global_step": 338031, "epoch": 2793} {"train_loss": -42.7556037902832, "global_step": 338032, "epoch": 2793} {"train_loss": -42.89460372924805, "global_step": 338033, "epoch": 2793} {"train_loss": -42.83680725097656, "global_step": 338034, "epoch": 2793} {"train_loss": -42.828575134277344, "global_step": 338035, "epoch": 2793} {"train_loss": -42.67827224731445, "global_step": 338036, "epoch": 2793} {"train_loss": -41.19963836669922, "global_step": 338037, "epoch": 2793} {"train_loss": -42.72785568237305, "global_step": 338038, "epoch": 2793} {"train_loss": -41.35908126831055, "global_step": 338039, "epoch": 2793} {"train_loss": -41.988346099853516, "global_step": 338040, "epoch": 2793} {"train_loss": -42.9622688293457, "global_step": 338041, "epoch": 2793} {"train_loss": -42.728572845458984, "global_step": 338042, "epoch": 2793} {"train_loss": -42.70534896850586, "global_step": 338043, "epoch": 2793} {"train_loss": -42.2097282409668, "global_step": 338044, "epoch": 2793} {"train_loss": -39.74872970581055, "global_step": 338045, "epoch": 2793} {"train_loss": -39.472991943359375, "global_step": 338046, "epoch": 2793} {"train_loss": -41.42560577392578, "global_step": 338047, "epoch": 2793} {"train_loss": -42.20398712158203, "global_step": 338048, "epoch": 2793} {"train_loss": -40.16143798828125, "global_step": 338049, "epoch": 2793} {"train_loss": -38.490966796875, "global_step": 338050, "epoch": 2793} {"train_loss": -39.732154846191406, "global_step": 338051, "epoch": 2793} {"train_loss": -42.632049560546875, "global_step": 338052, "epoch": 2793} {"train_loss": -42.4005126953125, "global_step": 338053, "epoch": 2793} {"train_loss": -40.138671875, "global_step": 338054, "epoch": 2793} {"train_loss": -42.11935043334961, "global_step": 338055, "epoch": 2793} {"train_loss": -42.80292892456055, "global_step": 338056, "epoch": 2793} {"train_loss": -41.846412658691406, "global_step": 338057, "epoch": 2793} {"train_loss": -42.766536712646484, "global_step": 338058, "epoch": 2793} {"train_loss": -42.01144027709961, "global_step": 338059, "epoch": 2793} {"train_loss": -42.66962814331055, "global_step": 338060, "epoch": 2793} {"train_loss": -43.38724899291992, "global_step": 338061, "epoch": 2793} {"train_loss": -43.30689239501953, "global_step": 338062, "epoch": 2793} {"train_loss": -43.11590576171875, "global_step": 338063, "epoch": 2793} {"train_loss": -42.574806213378906, "global_step": 338064, "epoch": 2793} {"train_loss": -42.74020004272461, "global_step": 338065, "epoch": 2793} {"train_loss": -43.02088165283203, "global_step": 338066, "epoch": 2793} {"train_loss": -39.709346771240234, "global_step": 338067, "epoch": 2793} {"train_loss": -41.3748893737793, "global_step": 338068, "epoch": 2793} {"train_loss": -43.80012130737305, "global_step": 338069, "epoch": 2793} {"train_loss": -43.392642974853516, "global_step": 338070, "epoch": 2793} {"train_loss": -43.5133056640625, "global_step": 338071, "epoch": 2793} {"train_loss": -42.40558624267578, "global_step": 338072, "epoch": 2793} {"train_loss": -42.28840533169833, "global_step": 338073, "epoch": 2793, "val_loss": 2659698.25} {"train_loss": -43.29810333251953, "global_step": 338074, "epoch": 2794} {"train_loss": -43.60234451293945, "global_step": 338075, "epoch": 2794} {"train_loss": -40.37830352783203, "global_step": 338076, "epoch": 2794} {"train_loss": -43.553035736083984, "global_step": 338077, "epoch": 2794} {"train_loss": -43.58842086791992, "global_step": 338078, "epoch": 2794} {"train_loss": -43.37602615356445, "global_step": 338079, "epoch": 2794} {"train_loss": -43.368263244628906, "global_step": 338080, "epoch": 2794} {"train_loss": -41.22029495239258, "global_step": 338081, "epoch": 2794} {"train_loss": -43.436683654785156, "global_step": 338082, "epoch": 2794} {"train_loss": -41.015380859375, "global_step": 338083, "epoch": 2794} {"train_loss": -41.97835922241211, "global_step": 338084, "epoch": 2794} {"train_loss": -42.910396575927734, "global_step": 338085, "epoch": 2794} {"train_loss": -43.149112701416016, "global_step": 338086, "epoch": 2794} {"train_loss": -43.79108810424805, "global_step": 338087, "epoch": 2794} {"train_loss": -42.82935333251953, "global_step": 338088, "epoch": 2794} {"train_loss": -40.93427658081055, "global_step": 338089, "epoch": 2794} {"train_loss": -41.29305648803711, "global_step": 338090, "epoch": 2794} {"train_loss": -42.99123764038086, "global_step": 338091, "epoch": 2794} {"train_loss": -38.55545425415039, "global_step": 338092, "epoch": 2794} {"train_loss": -43.29933547973633, "global_step": 338093, "epoch": 2794} {"train_loss": -43.424373626708984, "global_step": 338094, "epoch": 2794} {"train_loss": -43.254005432128906, "global_step": 338095, "epoch": 2794} {"train_loss": -42.95670700073242, "global_step": 338096, "epoch": 2794} {"train_loss": -41.0396614074707, "global_step": 338097, "epoch": 2794} {"train_loss": -43.578102111816406, "global_step": 338098, "epoch": 2794} {"train_loss": -43.47660827636719, "global_step": 338099, "epoch": 2794} {"train_loss": -43.67403030395508, "global_step": 338100, "epoch": 2794} {"train_loss": -44.04691696166992, "global_step": 338101, "epoch": 2794} {"train_loss": -43.81550216674805, "global_step": 338102, "epoch": 2794} {"train_loss": -43.544776916503906, "global_step": 338103, "epoch": 2794} {"train_loss": -43.450103759765625, "global_step": 338104, "epoch": 2794} {"train_loss": -43.629188537597656, "global_step": 338105, "epoch": 2794} {"train_loss": -43.54362869262695, "global_step": 338106, "epoch": 2794} {"train_loss": -43.66704177856445, "global_step": 338107, "epoch": 2794} {"train_loss": -43.67576217651367, "global_step": 338108, "epoch": 2794} {"train_loss": -41.38983154296875, "global_step": 338109, "epoch": 2794} {"train_loss": -42.25787353515625, "global_step": 338110, "epoch": 2794} {"train_loss": -42.82122802734375, "global_step": 338111, "epoch": 2794} {"train_loss": -44.156429290771484, "global_step": 338112, "epoch": 2794} {"train_loss": -43.25680160522461, "global_step": 338113, "epoch": 2794} {"train_loss": -43.532466888427734, "global_step": 338114, "epoch": 2794} {"train_loss": -43.220333099365234, "global_step": 338115, "epoch": 2794} {"train_loss": -44.008140563964844, "global_step": 338116, "epoch": 2794} {"train_loss": -43.46358108520508, "global_step": 338117, "epoch": 2794} {"train_loss": -40.93124008178711, "global_step": 338118, "epoch": 2794} {"train_loss": -43.47488021850586, "global_step": 338119, "epoch": 2794} {"train_loss": -42.94126510620117, "global_step": 338120, "epoch": 2794} {"train_loss": -42.1999626159668, "global_step": 338121, "epoch": 2794} {"train_loss": -42.107051849365234, "global_step": 338122, "epoch": 2794} {"train_loss": -44.38842010498047, "global_step": 338123, "epoch": 2794} {"train_loss": -41.25720977783203, "global_step": 338124, "epoch": 2794} {"train_loss": -43.65717697143555, "global_step": 338125, "epoch": 2794} {"train_loss": -42.51436233520508, "global_step": 338126, "epoch": 2794} {"train_loss": -42.188438415527344, "global_step": 338127, "epoch": 2794} {"train_loss": -43.162227630615234, "global_step": 338128, "epoch": 2794} {"train_loss": -44.3679313659668, "global_step": 338129, "epoch": 2794} {"train_loss": -43.480342864990234, "global_step": 338130, "epoch": 2794} {"train_loss": -43.81394577026367, "global_step": 338131, "epoch": 2794} {"train_loss": -43.461177825927734, "global_step": 338132, "epoch": 2794} {"train_loss": -42.740108489990234, "global_step": 338133, "epoch": 2794} {"train_loss": -43.103614807128906, "global_step": 338134, "epoch": 2794} {"train_loss": -43.77848434448242, "global_step": 338135, "epoch": 2794} {"train_loss": -42.582122802734375, "global_step": 338136, "epoch": 2794} {"train_loss": -43.6563835144043, "global_step": 338137, "epoch": 2794} {"train_loss": -43.37112045288086, "global_step": 338138, "epoch": 2794} {"train_loss": -43.473018646240234, "global_step": 338139, "epoch": 2794} {"train_loss": -41.888160705566406, "global_step": 338140, "epoch": 2794} {"train_loss": -44.00494384765625, "global_step": 338141, "epoch": 2794} {"train_loss": -42.77264404296875, "global_step": 338142, "epoch": 2794} {"train_loss": -43.87178039550781, "global_step": 338143, "epoch": 2794} {"train_loss": -41.68323516845703, "global_step": 338144, "epoch": 2794} {"train_loss": -43.725582122802734, "global_step": 338145, "epoch": 2794} {"train_loss": -42.59823226928711, "global_step": 338146, "epoch": 2794} {"train_loss": -42.837562561035156, "global_step": 338147, "epoch": 2794} {"train_loss": -43.196258544921875, "global_step": 338148, "epoch": 2794} {"train_loss": -42.434486389160156, "global_step": 338149, "epoch": 2794} {"train_loss": -41.46057891845703, "global_step": 338150, "epoch": 2794} {"train_loss": -43.4178581237793, "global_step": 338151, "epoch": 2794} {"train_loss": -40.64288330078125, "global_step": 338152, "epoch": 2794} {"train_loss": -40.92914962768555, "global_step": 338153, "epoch": 2794} {"train_loss": -42.24846267700195, "global_step": 338154, "epoch": 2794} {"train_loss": -41.290679931640625, "global_step": 338155, "epoch": 2794} {"train_loss": -39.457618713378906, "global_step": 338156, "epoch": 2794} {"train_loss": -40.6794319152832, "global_step": 338157, "epoch": 2794} {"train_loss": -41.97133255004883, "global_step": 338158, "epoch": 2794} {"train_loss": -40.884395599365234, "global_step": 338159, "epoch": 2794} {"train_loss": -41.24769973754883, "global_step": 338160, "epoch": 2794} {"train_loss": -40.67800521850586, "global_step": 338161, "epoch": 2794} {"train_loss": -41.72199249267578, "global_step": 338162, "epoch": 2794} {"train_loss": -42.65534591674805, "global_step": 338163, "epoch": 2794} {"train_loss": -41.79458236694336, "global_step": 338164, "epoch": 2794} {"train_loss": -39.75272750854492, "global_step": 338165, "epoch": 2794} {"train_loss": -41.28715133666992, "global_step": 338166, "epoch": 2794} {"train_loss": -40.55277633666992, "global_step": 338167, "epoch": 2794} {"train_loss": -40.11802291870117, "global_step": 338168, "epoch": 2794} {"train_loss": -41.64333724975586, "global_step": 338169, "epoch": 2794} {"train_loss": -42.056156158447266, "global_step": 338170, "epoch": 2794} {"train_loss": -41.82877731323242, "global_step": 338171, "epoch": 2794} {"train_loss": -40.71562957763672, "global_step": 338172, "epoch": 2794} {"train_loss": -41.27541732788086, "global_step": 338173, "epoch": 2794} {"train_loss": -40.127586364746094, "global_step": 338174, "epoch": 2794} {"train_loss": -34.7795524597168, "global_step": 338175, "epoch": 2794} {"train_loss": -39.966461181640625, "global_step": 338176, "epoch": 2794} {"train_loss": -40.958675384521484, "global_step": 338177, "epoch": 2794} {"train_loss": -41.19777297973633, "global_step": 338178, "epoch": 2794} {"train_loss": -36.41255569458008, "global_step": 338179, "epoch": 2794} {"train_loss": -41.827781677246094, "global_step": 338180, "epoch": 2794} {"train_loss": -41.816200256347656, "global_step": 338181, "epoch": 2794} {"train_loss": -41.03359603881836, "global_step": 338182, "epoch": 2794} {"train_loss": -35.18385696411133, "global_step": 338183, "epoch": 2794} {"train_loss": -39.36513137817383, "global_step": 338184, "epoch": 2794} {"train_loss": -40.90928649902344, "global_step": 338185, "epoch": 2794} {"train_loss": -39.89609909057617, "global_step": 338186, "epoch": 2794} {"train_loss": -39.768409729003906, "global_step": 338187, "epoch": 2794} {"train_loss": -41.00126647949219, "global_step": 338188, "epoch": 2794} {"train_loss": -40.10494613647461, "global_step": 338189, "epoch": 2794} {"train_loss": -38.15560531616211, "global_step": 338190, "epoch": 2794} {"train_loss": -39.739681243896484, "global_step": 338191, "epoch": 2794} {"train_loss": -39.42661666870117, "global_step": 338192, "epoch": 2794} {"train_loss": -37.49595260620117, "global_step": 338193, "epoch": 2794} {"train_loss": -41.979276010812804, "global_step": 338194, "epoch": 2794, "val_loss": 2580166.75} {"train_loss": -39.4352912902832, "global_step": 338195, "epoch": 2795} {"train_loss": -41.082820892333984, "global_step": 338196, "epoch": 2795} {"train_loss": -40.66572952270508, "global_step": 338197, "epoch": 2795} {"train_loss": -39.89552688598633, "global_step": 338198, "epoch": 2795} {"train_loss": -39.818939208984375, "global_step": 338199, "epoch": 2795} {"train_loss": -40.51128005981445, "global_step": 338200, "epoch": 2795} {"train_loss": -39.2293701171875, "global_step": 338201, "epoch": 2795} {"train_loss": -40.61541748046875, "global_step": 338202, "epoch": 2795} {"train_loss": -39.724796295166016, "global_step": 338203, "epoch": 2795} {"train_loss": -40.65045928955078, "global_step": 338204, "epoch": 2795} {"train_loss": -40.58717727661133, "global_step": 338205, "epoch": 2795} {"train_loss": -38.458797454833984, "global_step": 338206, "epoch": 2795} {"train_loss": -40.967037200927734, "global_step": 338207, "epoch": 2795} {"train_loss": -40.3181266784668, "global_step": 338208, "epoch": 2795} {"train_loss": -41.75509262084961, "global_step": 338209, "epoch": 2795} {"train_loss": -41.803321838378906, "global_step": 338210, "epoch": 2795} {"train_loss": -39.63289260864258, "global_step": 338211, "epoch": 2795} {"train_loss": -41.176856994628906, "global_step": 338212, "epoch": 2795} {"train_loss": -41.19669723510742, "global_step": 338213, "epoch": 2795} {"train_loss": -41.78676223754883, "global_step": 338214, "epoch": 2795} {"train_loss": -40.44465255737305, "global_step": 338215, "epoch": 2795} {"train_loss": -41.24518966674805, "global_step": 338216, "epoch": 2795} {"train_loss": -40.03681182861328, "global_step": 338217, "epoch": 2795} {"train_loss": -41.03593444824219, "global_step": 338218, "epoch": 2795} {"train_loss": -41.92280960083008, "global_step": 338219, "epoch": 2795} {"train_loss": -41.757049560546875, "global_step": 338220, "epoch": 2795} {"train_loss": -41.6254997253418, "global_step": 338221, "epoch": 2795} {"train_loss": -41.65070343017578, "global_step": 338222, "epoch": 2795} {"train_loss": -41.80724334716797, "global_step": 338223, "epoch": 2795} {"train_loss": -42.477081298828125, "global_step": 338224, "epoch": 2795} {"train_loss": -42.3191032409668, "global_step": 338225, "epoch": 2795} {"train_loss": -42.027854919433594, "global_step": 338226, "epoch": 2795} {"train_loss": -41.998573303222656, "global_step": 338227, "epoch": 2795} {"train_loss": -41.00536346435547, "global_step": 338228, "epoch": 2795} {"train_loss": -42.193885803222656, "global_step": 338229, "epoch": 2795} {"train_loss": -41.95636749267578, "global_step": 338230, "epoch": 2795} {"train_loss": -40.93389892578125, "global_step": 338231, "epoch": 2795} {"train_loss": -42.130653381347656, "global_step": 338232, "epoch": 2795} {"train_loss": -41.43321990966797, "global_step": 338233, "epoch": 2795} {"train_loss": -42.687313079833984, "global_step": 338234, "epoch": 2795} {"train_loss": -41.17438888549805, "global_step": 338235, "epoch": 2795} {"train_loss": -42.03422927856445, "global_step": 338236, "epoch": 2795} {"train_loss": -41.480892181396484, "global_step": 338237, "epoch": 2795} {"train_loss": -42.579833984375, "global_step": 338238, "epoch": 2795} {"train_loss": -42.523284912109375, "global_step": 338239, "epoch": 2795} {"train_loss": -42.68084716796875, "global_step": 338240, "epoch": 2795} {"train_loss": -42.6152458190918, "global_step": 338241, "epoch": 2795} {"train_loss": -42.91866683959961, "global_step": 338242, "epoch": 2795} {"train_loss": -42.789573669433594, "global_step": 338243, "epoch": 2795} {"train_loss": -41.688880920410156, "global_step": 338244, "epoch": 2795} {"train_loss": -41.055355072021484, "global_step": 338245, "epoch": 2795} {"train_loss": -41.517608642578125, "global_step": 338246, "epoch": 2795} {"train_loss": -41.94047164916992, "global_step": 338247, "epoch": 2795} {"train_loss": -42.73196029663086, "global_step": 338248, "epoch": 2795} {"train_loss": -42.350135803222656, "global_step": 338249, "epoch": 2795} {"train_loss": -41.87559127807617, "global_step": 338250, "epoch": 2795} {"train_loss": -41.00064468383789, "global_step": 338251, "epoch": 2795} {"train_loss": -42.63432693481445, "global_step": 338252, "epoch": 2795} {"train_loss": -43.06939697265625, "global_step": 338253, "epoch": 2795} {"train_loss": -42.787227630615234, "global_step": 338254, "epoch": 2795} {"train_loss": -43.152259826660156, "global_step": 338255, "epoch": 2795} {"train_loss": -41.78687286376953, "global_step": 338256, "epoch": 2795} {"train_loss": -42.75482177734375, "global_step": 338257, "epoch": 2795} {"train_loss": -42.4301872253418, "global_step": 338258, "epoch": 2795} {"train_loss": -42.98112106323242, "global_step": 338259, "epoch": 2795} {"train_loss": -42.797576904296875, "global_step": 338260, "epoch": 2795} {"train_loss": -43.02396774291992, "global_step": 338261, "epoch": 2795} {"train_loss": -41.607887268066406, "global_step": 338262, "epoch": 2795} {"train_loss": -42.203033447265625, "global_step": 338263, "epoch": 2795} {"train_loss": -42.272674560546875, "global_step": 338264, "epoch": 2795} {"train_loss": -43.18662643432617, "global_step": 338265, "epoch": 2795} {"train_loss": -43.1514892578125, "global_step": 338266, "epoch": 2795} {"train_loss": -43.26848220825195, "global_step": 338267, "epoch": 2795} {"train_loss": -43.13532638549805, "global_step": 338268, "epoch": 2795} {"train_loss": -42.48092269897461, "global_step": 338269, "epoch": 2795} {"train_loss": -43.01732635498047, "global_step": 338270, "epoch": 2795} {"train_loss": -43.034908294677734, "global_step": 338271, "epoch": 2795} {"train_loss": -37.2943115234375, "global_step": 338272, "epoch": 2795} {"train_loss": -43.26252365112305, "global_step": 338273, "epoch": 2795} {"train_loss": -43.21158218383789, "global_step": 338274, "epoch": 2795} {"train_loss": -42.7391471862793, "global_step": 338275, "epoch": 2795} {"train_loss": -42.56599044799805, "global_step": 338276, "epoch": 2795} {"train_loss": -41.299232482910156, "global_step": 338277, "epoch": 2795} {"train_loss": -42.666011810302734, "global_step": 338278, "epoch": 2795} {"train_loss": -43.39093017578125, "global_step": 338279, "epoch": 2795} {"train_loss": -43.262916564941406, "global_step": 338280, "epoch": 2795} {"train_loss": -36.320762634277344, "global_step": 338281, "epoch": 2795} {"train_loss": -42.077571868896484, "global_step": 338282, "epoch": 2795} {"train_loss": -43.05558395385742, "global_step": 338283, "epoch": 2795} {"train_loss": -42.653594970703125, "global_step": 338284, "epoch": 2795} {"train_loss": -42.622737884521484, "global_step": 338285, "epoch": 2795} {"train_loss": -42.99885559082031, "global_step": 338286, "epoch": 2795} {"train_loss": -43.11373519897461, "global_step": 338287, "epoch": 2795} {"train_loss": -43.72980880737305, "global_step": 338288, "epoch": 2795} {"train_loss": -43.16741943359375, "global_step": 338289, "epoch": 2795} {"train_loss": -43.26143264770508, "global_step": 338290, "epoch": 2795} {"train_loss": -43.24824142456055, "global_step": 338291, "epoch": 2795} {"train_loss": -43.726158142089844, "global_step": 338292, "epoch": 2795} {"train_loss": -43.30479049682617, "global_step": 338293, "epoch": 2795} {"train_loss": -42.68755340576172, "global_step": 338294, "epoch": 2795} {"train_loss": -43.81768798828125, "global_step": 338295, "epoch": 2795} {"train_loss": -43.582427978515625, "global_step": 338296, "epoch": 2795} {"train_loss": -43.20819091796875, "global_step": 338297, "epoch": 2795} {"train_loss": -42.6763801574707, "global_step": 338298, "epoch": 2795} {"train_loss": -43.029747009277344, "global_step": 338299, "epoch": 2795} {"train_loss": -42.55727005004883, "global_step": 338300, "epoch": 2795} {"train_loss": -43.254127502441406, "global_step": 338301, "epoch": 2795} {"train_loss": -43.29627990722656, "global_step": 338302, "epoch": 2795} {"train_loss": -43.35769271850586, "global_step": 338303, "epoch": 2795} {"train_loss": -43.17000961303711, "global_step": 338304, "epoch": 2795} {"train_loss": -41.9643669128418, "global_step": 338305, "epoch": 2795} {"train_loss": -43.37063217163086, "global_step": 338306, "epoch": 2795} {"train_loss": -42.83321762084961, "global_step": 338307, "epoch": 2795} {"train_loss": -43.541683197021484, "global_step": 338308, "epoch": 2795} {"train_loss": -43.579471588134766, "global_step": 338309, "epoch": 2795} {"train_loss": -43.486690521240234, "global_step": 338310, "epoch": 2795} {"train_loss": -43.73685073852539, "global_step": 338311, "epoch": 2795} {"train_loss": -43.39303970336914, "global_step": 338312, "epoch": 2795} {"train_loss": -43.87860870361328, "global_step": 338313, "epoch": 2795} {"train_loss": -43.474300384521484, "global_step": 338314, "epoch": 2795} {"train_loss": -42.095387387866815, "global_step": 338315, "epoch": 2795, "val_loss": 2430714.75} {"train_loss": -43.06159210205078, "global_step": 338316, "epoch": 2796} {"train_loss": -43.58601379394531, "global_step": 338317, "epoch": 2796} {"train_loss": -43.40175247192383, "global_step": 338318, "epoch": 2796} {"train_loss": -43.3802375793457, "global_step": 338319, "epoch": 2796} {"train_loss": -43.14634323120117, "global_step": 338320, "epoch": 2796} {"train_loss": -42.10137176513672, "global_step": 338321, "epoch": 2796} {"train_loss": -41.853206634521484, "global_step": 338322, "epoch": 2796} {"train_loss": -38.93760299682617, "global_step": 338323, "epoch": 2796} {"train_loss": -36.86027908325195, "global_step": 338324, "epoch": 2796} {"train_loss": -40.24769973754883, "global_step": 338325, "epoch": 2796} {"train_loss": -41.753292083740234, "global_step": 338326, "epoch": 2796} {"train_loss": -41.12936019897461, "global_step": 338327, "epoch": 2796} {"train_loss": -37.13819122314453, "global_step": 338328, "epoch": 2796} {"train_loss": -37.641517639160156, "global_step": 338329, "epoch": 2796} {"train_loss": -42.8553352355957, "global_step": 338330, "epoch": 2796} {"train_loss": -40.20176315307617, "global_step": 338331, "epoch": 2796} {"train_loss": -41.527671813964844, "global_step": 338332, "epoch": 2796} {"train_loss": -43.18538284301758, "global_step": 338333, "epoch": 2796} {"train_loss": -41.35976028442383, "global_step": 338334, "epoch": 2796} {"train_loss": -41.65877914428711, "global_step": 338335, "epoch": 2796} {"train_loss": -41.782386779785156, "global_step": 338336, "epoch": 2796} {"train_loss": -41.94330978393555, "global_step": 338337, "epoch": 2796} {"train_loss": -43.107933044433594, "global_step": 338338, "epoch": 2796} {"train_loss": -41.991180419921875, "global_step": 338339, "epoch": 2796} {"train_loss": -42.67800521850586, "global_step": 338340, "epoch": 2796} {"train_loss": -40.72341537475586, "global_step": 338341, "epoch": 2796} {"train_loss": -40.96841812133789, "global_step": 338342, "epoch": 2796} {"train_loss": -39.73641586303711, "global_step": 338343, "epoch": 2796} {"train_loss": -41.10481643676758, "global_step": 338344, "epoch": 2796} {"train_loss": -40.704219818115234, "global_step": 338345, "epoch": 2796} {"train_loss": -40.94722366333008, "global_step": 338346, "epoch": 2796} {"train_loss": -41.54655075073242, "global_step": 338347, "epoch": 2796} {"train_loss": -40.31581497192383, "global_step": 338348, "epoch": 2796} {"train_loss": -41.82612991333008, "global_step": 338349, "epoch": 2796} {"train_loss": -38.0030517578125, "global_step": 338350, "epoch": 2796} {"train_loss": -41.458213806152344, "global_step": 338351, "epoch": 2796} {"train_loss": -41.303497314453125, "global_step": 338352, "epoch": 2796} {"train_loss": -42.72310256958008, "global_step": 338353, "epoch": 2796} {"train_loss": -41.733455657958984, "global_step": 338354, "epoch": 2796} {"train_loss": -42.07197952270508, "global_step": 338355, "epoch": 2796} {"train_loss": -42.65424728393555, "global_step": 338356, "epoch": 2796} {"train_loss": -40.61544418334961, "global_step": 338357, "epoch": 2796} {"train_loss": -42.83340072631836, "global_step": 338358, "epoch": 2796} {"train_loss": -41.60710525512695, "global_step": 338359, "epoch": 2796} {"train_loss": -42.88605880737305, "global_step": 338360, "epoch": 2796} {"train_loss": -42.17344284057617, "global_step": 338361, "epoch": 2796} {"train_loss": -42.13332748413086, "global_step": 338362, "epoch": 2796} {"train_loss": -42.07638168334961, "global_step": 338363, "epoch": 2796} {"train_loss": -43.367919921875, "global_step": 338364, "epoch": 2796} {"train_loss": -42.929290771484375, "global_step": 338365, "epoch": 2796} {"train_loss": -43.273460388183594, "global_step": 338366, "epoch": 2796} {"train_loss": -42.661705017089844, "global_step": 338367, "epoch": 2796} {"train_loss": -42.46921920776367, "global_step": 338368, "epoch": 2796} {"train_loss": -43.34390640258789, "global_step": 338369, "epoch": 2796} {"train_loss": -42.578121185302734, "global_step": 338370, "epoch": 2796} {"train_loss": -43.17499923706055, "global_step": 338371, "epoch": 2796} {"train_loss": -43.06616973876953, "global_step": 338372, "epoch": 2796} {"train_loss": -43.27360153198242, "global_step": 338373, "epoch": 2796} {"train_loss": -43.53268051147461, "global_step": 338374, "epoch": 2796} {"train_loss": -43.321529388427734, "global_step": 338375, "epoch": 2796} {"train_loss": -43.707374572753906, "global_step": 338376, "epoch": 2796} {"train_loss": -42.6319694519043, "global_step": 338377, "epoch": 2796} {"train_loss": -42.865699768066406, "global_step": 338378, "epoch": 2796} {"train_loss": -43.729793548583984, "global_step": 338379, "epoch": 2796} {"train_loss": -43.0951042175293, "global_step": 338380, "epoch": 2796} {"train_loss": -43.65479278564453, "global_step": 338381, "epoch": 2796} {"train_loss": -43.50914001464844, "global_step": 338382, "epoch": 2796} {"train_loss": -43.223358154296875, "global_step": 338383, "epoch": 2796} {"train_loss": -44.01184844970703, "global_step": 338384, "epoch": 2796} {"train_loss": -43.967742919921875, "global_step": 338385, "epoch": 2796} {"train_loss": -43.8466796875, "global_step": 338386, "epoch": 2796} {"train_loss": -43.763187408447266, "global_step": 338387, "epoch": 2796} {"train_loss": -43.28799057006836, "global_step": 338388, "epoch": 2796} {"train_loss": -43.66886520385742, "global_step": 338389, "epoch": 2796} {"train_loss": -44.3516731262207, "global_step": 338390, "epoch": 2796} {"train_loss": -43.99638748168945, "global_step": 338391, "epoch": 2796} {"train_loss": -44.08782196044922, "global_step": 338392, "epoch": 2796} {"train_loss": -43.53321075439453, "global_step": 338393, "epoch": 2796} {"train_loss": -43.97216033935547, "global_step": 338394, "epoch": 2796} {"train_loss": -43.8630256652832, "global_step": 338395, "epoch": 2796} {"train_loss": -43.76721954345703, "global_step": 338396, "epoch": 2796} {"train_loss": -43.868743896484375, "global_step": 338397, "epoch": 2796} {"train_loss": -43.76566696166992, "global_step": 338398, "epoch": 2796} {"train_loss": -44.241119384765625, "global_step": 338399, "epoch": 2796} {"train_loss": -43.51276779174805, "global_step": 338400, "epoch": 2796} {"train_loss": -44.241249084472656, "global_step": 338401, "epoch": 2796} {"train_loss": -44.0307502746582, "global_step": 338402, "epoch": 2796} {"train_loss": -44.180419921875, "global_step": 338403, "epoch": 2796} {"train_loss": -43.99446487426758, "global_step": 338404, "epoch": 2796} {"train_loss": -43.65016174316406, "global_step": 338405, "epoch": 2796} {"train_loss": -44.1309700012207, "global_step": 338406, "epoch": 2796} {"train_loss": -43.50638198852539, "global_step": 338407, "epoch": 2796} {"train_loss": -44.25028991699219, "global_step": 338408, "epoch": 2796} {"train_loss": -43.585853576660156, "global_step": 338409, "epoch": 2796} {"train_loss": -44.2808837890625, "global_step": 338410, "epoch": 2796} {"train_loss": -44.3868522644043, "global_step": 338411, "epoch": 2796} {"train_loss": -43.989532470703125, "global_step": 338412, "epoch": 2796} {"train_loss": -43.127532958984375, "global_step": 338413, "epoch": 2796} {"train_loss": -43.874629974365234, "global_step": 338414, "epoch": 2796} {"train_loss": -43.27532958984375, "global_step": 338415, "epoch": 2796} {"train_loss": -44.15253448486328, "global_step": 338416, "epoch": 2796} {"train_loss": -44.45912551879883, "global_step": 338417, "epoch": 2796} {"train_loss": -44.24222946166992, "global_step": 338418, "epoch": 2796} {"train_loss": -44.272613525390625, "global_step": 338419, "epoch": 2796} {"train_loss": -44.2292594909668, "global_step": 338420, "epoch": 2796} {"train_loss": -44.41938400268555, "global_step": 338421, "epoch": 2796} {"train_loss": -43.53778076171875, "global_step": 338422, "epoch": 2796} {"train_loss": -44.44698715209961, "global_step": 338423, "epoch": 2796} {"train_loss": -44.3983154296875, "global_step": 338424, "epoch": 2796} {"train_loss": -43.44500732421875, "global_step": 338425, "epoch": 2796} {"train_loss": -43.96720504760742, "global_step": 338426, "epoch": 2796} {"train_loss": -43.459407806396484, "global_step": 338427, "epoch": 2796} {"train_loss": -43.48118591308594, "global_step": 338428, "epoch": 2796} {"train_loss": -44.32544708251953, "global_step": 338429, "epoch": 2796} {"train_loss": -43.600341796875, "global_step": 338430, "epoch": 2796} {"train_loss": -42.72443771362305, "global_step": 338431, "epoch": 2796} {"train_loss": -41.680965423583984, "global_step": 338432, "epoch": 2796} {"train_loss": -37.72871017456055, "global_step": 338433, "epoch": 2796} {"train_loss": -32.53996658325195, "global_step": 338434, "epoch": 2796} {"train_loss": -37.56105041503906, "global_step": 338435, "epoch": 2796} {"train_loss": -42.55388786378971, "global_step": 338436, "epoch": 2796, "val_loss": 2492515.25} {"train_loss": -42.9960823059082, "global_step": 338437, "epoch": 2797} {"train_loss": -39.42050552368164, "global_step": 338438, "epoch": 2797} {"train_loss": -38.84476089477539, "global_step": 338439, "epoch": 2797} {"train_loss": -40.16526412963867, "global_step": 338440, "epoch": 2797} {"train_loss": -42.884765625, "global_step": 338441, "epoch": 2797} {"train_loss": -40.57595443725586, "global_step": 338442, "epoch": 2797} {"train_loss": -39.90907669067383, "global_step": 338443, "epoch": 2797} {"train_loss": -42.489830017089844, "global_step": 338444, "epoch": 2797} {"train_loss": -41.91915512084961, "global_step": 338445, "epoch": 2797} {"train_loss": -41.25263595581055, "global_step": 338446, "epoch": 2797} {"train_loss": -41.46974563598633, "global_step": 338447, "epoch": 2797} {"train_loss": -42.493465423583984, "global_step": 338448, "epoch": 2797} {"train_loss": -42.39077377319336, "global_step": 338449, "epoch": 2797} {"train_loss": -41.87599563598633, "global_step": 338450, "epoch": 2797} {"train_loss": -42.522308349609375, "global_step": 338451, "epoch": 2797} {"train_loss": -42.0545768737793, "global_step": 338452, "epoch": 2797} {"train_loss": -41.56698989868164, "global_step": 338453, "epoch": 2797} {"train_loss": -42.416259765625, "global_step": 338454, "epoch": 2797} {"train_loss": -41.484981536865234, "global_step": 338455, "epoch": 2797} {"train_loss": -41.937313079833984, "global_step": 338456, "epoch": 2797} {"train_loss": -43.190303802490234, "global_step": 338457, "epoch": 2797} {"train_loss": -42.910316467285156, "global_step": 338458, "epoch": 2797} {"train_loss": -42.21657180786133, "global_step": 338459, "epoch": 2797} {"train_loss": -41.86237716674805, "global_step": 338460, "epoch": 2797} {"train_loss": -42.11279296875, "global_step": 338461, "epoch": 2797} {"train_loss": -42.49997329711914, "global_step": 338462, "epoch": 2797} {"train_loss": -42.47465133666992, "global_step": 338463, "epoch": 2797} {"train_loss": -41.88027572631836, "global_step": 338464, "epoch": 2797} {"train_loss": -42.28642654418945, "global_step": 338465, "epoch": 2797} {"train_loss": -42.481502532958984, "global_step": 338466, "epoch": 2797} {"train_loss": -42.77396774291992, "global_step": 338467, "epoch": 2797} {"train_loss": -42.95691680908203, "global_step": 338468, "epoch": 2797} {"train_loss": -42.693817138671875, "global_step": 338469, "epoch": 2797} {"train_loss": -42.329139709472656, "global_step": 338470, "epoch": 2797} {"train_loss": -43.028621673583984, "global_step": 338471, "epoch": 2797} {"train_loss": -42.82905197143555, "global_step": 338472, "epoch": 2797} {"train_loss": -43.4080924987793, "global_step": 338473, "epoch": 2797} {"train_loss": -43.59758377075195, "global_step": 338474, "epoch": 2797} {"train_loss": -43.060054779052734, "global_step": 338475, "epoch": 2797} {"train_loss": -43.54439163208008, "global_step": 338476, "epoch": 2797} {"train_loss": -42.34487533569336, "global_step": 338477, "epoch": 2797} {"train_loss": -42.80512619018555, "global_step": 338478, "epoch": 2797} {"train_loss": -43.112300872802734, "global_step": 338479, "epoch": 2797} {"train_loss": -42.51729965209961, "global_step": 338480, "epoch": 2797} {"train_loss": -43.478878021240234, "global_step": 338481, "epoch": 2797} {"train_loss": -43.78464889526367, "global_step": 338482, "epoch": 2797} {"train_loss": -42.0923957824707, "global_step": 338483, "epoch": 2797} {"train_loss": -42.75071334838867, "global_step": 338484, "epoch": 2797} {"train_loss": -43.44755935668945, "global_step": 338485, "epoch": 2797} {"train_loss": -43.55424118041992, "global_step": 338486, "epoch": 2797} {"train_loss": -43.79856491088867, "global_step": 338487, "epoch": 2797} {"train_loss": -43.6090202331543, "global_step": 338488, "epoch": 2797} {"train_loss": -44.0434455871582, "global_step": 338489, "epoch": 2797} {"train_loss": -43.49687957763672, "global_step": 338490, "epoch": 2797} {"train_loss": -43.86503219604492, "global_step": 338491, "epoch": 2797} {"train_loss": -43.1545524597168, "global_step": 338492, "epoch": 2797} {"train_loss": -43.52865219116211, "global_step": 338493, "epoch": 2797} {"train_loss": -43.09281539916992, "global_step": 338494, "epoch": 2797} {"train_loss": -43.63069152832031, "global_step": 338495, "epoch": 2797} {"train_loss": -43.549007415771484, "global_step": 338496, "epoch": 2797} {"train_loss": -44.221595764160156, "global_step": 338497, "epoch": 2797} {"train_loss": -42.92670822143555, "global_step": 338498, "epoch": 2797} {"train_loss": -43.57462692260742, "global_step": 338499, "epoch": 2797} {"train_loss": -43.362701416015625, "global_step": 338500, "epoch": 2797} {"train_loss": -43.299015045166016, "global_step": 338501, "epoch": 2797} {"train_loss": -43.02079391479492, "global_step": 338502, "epoch": 2797} {"train_loss": -43.52592086791992, "global_step": 338503, "epoch": 2797} {"train_loss": -43.65258026123047, "global_step": 338504, "epoch": 2797} {"train_loss": -43.4681510925293, "global_step": 338505, "epoch": 2797} {"train_loss": -42.35626220703125, "global_step": 338506, "epoch": 2797} {"train_loss": -42.51581573486328, "global_step": 338507, "epoch": 2797} {"train_loss": -43.490989685058594, "global_step": 338508, "epoch": 2797} {"train_loss": -43.23664474487305, "global_step": 338509, "epoch": 2797} {"train_loss": -43.579689025878906, "global_step": 338510, "epoch": 2797} {"train_loss": -40.43480682373047, "global_step": 338511, "epoch": 2797} {"train_loss": -42.46124267578125, "global_step": 338512, "epoch": 2797} {"train_loss": -43.54764175415039, "global_step": 338513, "epoch": 2797} {"train_loss": -43.769405364990234, "global_step": 338514, "epoch": 2797} {"train_loss": -43.2000732421875, "global_step": 338515, "epoch": 2797} {"train_loss": -44.4105224609375, "global_step": 338516, "epoch": 2797} {"train_loss": -42.147438049316406, "global_step": 338517, "epoch": 2797} {"train_loss": -43.70174026489258, "global_step": 338518, "epoch": 2797} {"train_loss": -43.59724426269531, "global_step": 338519, "epoch": 2797} {"train_loss": -42.920650482177734, "global_step": 338520, "epoch": 2797} {"train_loss": -44.22849655151367, "global_step": 338521, "epoch": 2797} {"train_loss": -43.545467376708984, "global_step": 338522, "epoch": 2797} {"train_loss": -41.02467346191406, "global_step": 338523, "epoch": 2797} {"train_loss": -43.071014404296875, "global_step": 338524, "epoch": 2797} {"train_loss": -41.3885612487793, "global_step": 338525, "epoch": 2797} {"train_loss": -43.3722038269043, "global_step": 338526, "epoch": 2797} {"train_loss": -38.02490234375, "global_step": 338527, "epoch": 2797} {"train_loss": -41.41779708862305, "global_step": 338528, "epoch": 2797} {"train_loss": -42.342952728271484, "global_step": 338529, "epoch": 2797} {"train_loss": -41.01527786254883, "global_step": 338530, "epoch": 2797} {"train_loss": -41.3388557434082, "global_step": 338531, "epoch": 2797} {"train_loss": -41.22005844116211, "global_step": 338532, "epoch": 2797} {"train_loss": -42.09946823120117, "global_step": 338533, "epoch": 2797} {"train_loss": -34.720130920410156, "global_step": 338534, "epoch": 2797} {"train_loss": -36.33942794799805, "global_step": 338535, "epoch": 2797} {"train_loss": -41.22818374633789, "global_step": 338536, "epoch": 2797} {"train_loss": -4.719552516937256, "global_step": 338537, "epoch": 2797} {"train_loss": -41.915313720703125, "global_step": 338538, "epoch": 2797} {"train_loss": -40.148040771484375, "global_step": 338539, "epoch": 2797} {"train_loss": -25.940916061401367, "global_step": 338540, "epoch": 2797} {"train_loss": -39.77808380126953, "global_step": 338541, "epoch": 2797} {"train_loss": -39.67800521850586, "global_step": 338542, "epoch": 2797} {"train_loss": -28.882801055908203, "global_step": 338543, "epoch": 2797} {"train_loss": -40.4334831237793, "global_step": 338544, "epoch": 2797} {"train_loss": -34.927825927734375, "global_step": 338545, "epoch": 2797} {"train_loss": -31.704513549804688, "global_step": 338546, "epoch": 2797} {"train_loss": -33.54117965698242, "global_step": 338547, "epoch": 2797} {"train_loss": -37.07771301269531, "global_step": 338548, "epoch": 2797} {"train_loss": -38.58401107788086, "global_step": 338549, "epoch": 2797} {"train_loss": -37.85742950439453, "global_step": 338550, "epoch": 2797} {"train_loss": -38.51237869262695, "global_step": 338551, "epoch": 2797} {"train_loss": -36.56838607788086, "global_step": 338552, "epoch": 2797} {"train_loss": -40.22196960449219, "global_step": 338553, "epoch": 2797} {"train_loss": -36.8862190246582, "global_step": 338554, "epoch": 2797} {"train_loss": -37.20174026489258, "global_step": 338555, "epoch": 2797} {"train_loss": -39.11395263671875, "global_step": 338556, "epoch": 2797} {"train_loss": -41.182873808647976, "global_step": 338557, "epoch": 2797, "val_loss": 2829411.25} {"train_loss": -39.3959846496582, "global_step": 338558, "epoch": 2798} {"train_loss": -38.06462478637695, "global_step": 338559, "epoch": 2798} {"train_loss": -40.06085968017578, "global_step": 338560, "epoch": 2798} {"train_loss": -39.854129791259766, "global_step": 338561, "epoch": 2798} {"train_loss": -39.53041458129883, "global_step": 338562, "epoch": 2798} {"train_loss": -39.51797103881836, "global_step": 338563, "epoch": 2798} {"train_loss": -40.886287689208984, "global_step": 338564, "epoch": 2798} {"train_loss": -40.165889739990234, "global_step": 338565, "epoch": 2798} {"train_loss": -41.259456634521484, "global_step": 338566, "epoch": 2798} {"train_loss": -40.86259460449219, "global_step": 338567, "epoch": 2798} {"train_loss": -40.39319610595703, "global_step": 338568, "epoch": 2798} {"train_loss": -40.64690017700195, "global_step": 338569, "epoch": 2798} {"train_loss": -40.63422775268555, "global_step": 338570, "epoch": 2798} {"train_loss": -39.9014892578125, "global_step": 338571, "epoch": 2798} {"train_loss": -40.97404861450195, "global_step": 338572, "epoch": 2798} {"train_loss": -40.5659294128418, "global_step": 338573, "epoch": 2798} {"train_loss": -40.39906692504883, "global_step": 338574, "epoch": 2798} {"train_loss": -40.09743881225586, "global_step": 338575, "epoch": 2798} {"train_loss": -40.26056671142578, "global_step": 338576, "epoch": 2798} {"train_loss": -40.37826919555664, "global_step": 338577, "epoch": 2798} {"train_loss": -40.41230010986328, "global_step": 338578, "epoch": 2798} {"train_loss": -41.68085861206055, "global_step": 338579, "epoch": 2798} {"train_loss": -41.34803771972656, "global_step": 338580, "epoch": 2798} {"train_loss": -41.1241340637207, "global_step": 338581, "epoch": 2798} {"train_loss": -41.272491455078125, "global_step": 338582, "epoch": 2798} {"train_loss": -40.976951599121094, "global_step": 338583, "epoch": 2798} {"train_loss": -40.457515716552734, "global_step": 338584, "epoch": 2798} {"train_loss": -41.02873611450195, "global_step": 338585, "epoch": 2798} {"train_loss": -41.56045150756836, "global_step": 338586, "epoch": 2798} {"train_loss": -41.34074401855469, "global_step": 338587, "epoch": 2798} {"train_loss": -42.0452766418457, "global_step": 338588, "epoch": 2798} {"train_loss": -41.56682586669922, "global_step": 338589, "epoch": 2798} {"train_loss": -40.8621826171875, "global_step": 338590, "epoch": 2798} {"train_loss": -41.019134521484375, "global_step": 338591, "epoch": 2798} {"train_loss": -42.02183151245117, "global_step": 338592, "epoch": 2798} {"train_loss": -41.49186325073242, "global_step": 338593, "epoch": 2798} {"train_loss": -42.2788200378418, "global_step": 338594, "epoch": 2798} {"train_loss": -42.01819610595703, "global_step": 338595, "epoch": 2798} {"train_loss": -42.0832633972168, "global_step": 338596, "epoch": 2798} {"train_loss": -41.63869857788086, "global_step": 338597, "epoch": 2798} {"train_loss": -42.497955322265625, "global_step": 338598, "epoch": 2798} {"train_loss": -42.18696594238281, "global_step": 338599, "epoch": 2798} {"train_loss": -41.90620803833008, "global_step": 338600, "epoch": 2798} {"train_loss": -43.12373733520508, "global_step": 338601, "epoch": 2798} {"train_loss": -42.42290115356445, "global_step": 338602, "epoch": 2798} {"train_loss": -42.096961975097656, "global_step": 338603, "epoch": 2798} {"train_loss": -41.1104736328125, "global_step": 338604, "epoch": 2798} {"train_loss": -41.87380599975586, "global_step": 338605, "epoch": 2798} {"train_loss": -41.359840393066406, "global_step": 338606, "epoch": 2798} {"train_loss": -41.30191421508789, "global_step": 338607, "epoch": 2798} {"train_loss": -42.6961555480957, "global_step": 338608, "epoch": 2798} {"train_loss": -40.45025634765625, "global_step": 338609, "epoch": 2798} {"train_loss": -42.46627426147461, "global_step": 338610, "epoch": 2798} {"train_loss": -43.09028625488281, "global_step": 338611, "epoch": 2798} {"train_loss": -42.635345458984375, "global_step": 338612, "epoch": 2798} {"train_loss": -42.12434768676758, "global_step": 338613, "epoch": 2798} {"train_loss": -42.23722457885742, "global_step": 338614, "epoch": 2798} {"train_loss": -42.12800216674805, "global_step": 338615, "epoch": 2798} {"train_loss": -42.479637145996094, "global_step": 338616, "epoch": 2798} {"train_loss": -42.440433502197266, "global_step": 338617, "epoch": 2798} {"train_loss": -41.88475036621094, "global_step": 338618, "epoch": 2798} {"train_loss": -42.13284683227539, "global_step": 338619, "epoch": 2798} {"train_loss": -42.50936508178711, "global_step": 338620, "epoch": 2798} {"train_loss": -41.603126525878906, "global_step": 338621, "epoch": 2798} {"train_loss": -43.5151252746582, "global_step": 338622, "epoch": 2798} {"train_loss": -42.77132797241211, "global_step": 338623, "epoch": 2798} {"train_loss": -42.94427490234375, "global_step": 338624, "epoch": 2798} {"train_loss": -42.574031829833984, "global_step": 338625, "epoch": 2798} {"train_loss": -42.9364128112793, "global_step": 338626, "epoch": 2798} {"train_loss": -42.826045989990234, "global_step": 338627, "epoch": 2798} {"train_loss": -43.0045051574707, "global_step": 338628, "epoch": 2798} {"train_loss": -43.29643630981445, "global_step": 338629, "epoch": 2798} {"train_loss": -43.14710235595703, "global_step": 338630, "epoch": 2798} {"train_loss": -43.01979446411133, "global_step": 338631, "epoch": 2798} {"train_loss": -43.429874420166016, "global_step": 338632, "epoch": 2798} {"train_loss": -43.10102081298828, "global_step": 338633, "epoch": 2798} {"train_loss": -43.19886016845703, "global_step": 338634, "epoch": 2798} {"train_loss": -43.20417785644531, "global_step": 338635, "epoch": 2798} {"train_loss": -43.48830795288086, "global_step": 338636, "epoch": 2798} {"train_loss": -42.99622344970703, "global_step": 338637, "epoch": 2798} {"train_loss": -43.20536422729492, "global_step": 338638, "epoch": 2798} {"train_loss": -43.16474533081055, "global_step": 338639, "epoch": 2798} {"train_loss": -43.8342399597168, "global_step": 338640, "epoch": 2798} {"train_loss": -42.47930908203125, "global_step": 338641, "epoch": 2798} {"train_loss": -43.60469055175781, "global_step": 338642, "epoch": 2798} {"train_loss": -43.26768112182617, "global_step": 338643, "epoch": 2798} {"train_loss": -43.137325286865234, "global_step": 338644, "epoch": 2798} {"train_loss": -43.82099533081055, "global_step": 338645, "epoch": 2798} {"train_loss": -43.633914947509766, "global_step": 338646, "epoch": 2798} {"train_loss": -43.026546478271484, "global_step": 338647, "epoch": 2798} {"train_loss": -43.5448112487793, "global_step": 338648, "epoch": 2798} {"train_loss": -43.41535186767578, "global_step": 338649, "epoch": 2798} {"train_loss": -42.8560905456543, "global_step": 338650, "epoch": 2798} {"train_loss": -42.94940948486328, "global_step": 338651, "epoch": 2798} {"train_loss": -42.95286178588867, "global_step": 338652, "epoch": 2798} {"train_loss": -44.0909538269043, "global_step": 338653, "epoch": 2798} {"train_loss": -43.63093185424805, "global_step": 338654, "epoch": 2798} {"train_loss": -43.077972412109375, "global_step": 338655, "epoch": 2798} {"train_loss": -43.553646087646484, "global_step": 338656, "epoch": 2798} {"train_loss": -43.554046630859375, "global_step": 338657, "epoch": 2798} {"train_loss": -43.282630920410156, "global_step": 338658, "epoch": 2798} {"train_loss": -43.62221145629883, "global_step": 338659, "epoch": 2798} {"train_loss": -43.532379150390625, "global_step": 338660, "epoch": 2798} {"train_loss": -43.29705810546875, "global_step": 338661, "epoch": 2798} {"train_loss": -43.6248893737793, "global_step": 338662, "epoch": 2798} {"train_loss": -43.41964340209961, "global_step": 338663, "epoch": 2798} {"train_loss": -43.93352127075195, "global_step": 338664, "epoch": 2798} {"train_loss": -42.77241134643555, "global_step": 338665, "epoch": 2798} {"train_loss": -43.45343017578125, "global_step": 338666, "epoch": 2798} {"train_loss": -43.344573974609375, "global_step": 338667, "epoch": 2798} {"train_loss": -40.34735107421875, "global_step": 338668, "epoch": 2798} {"train_loss": -42.755157470703125, "global_step": 338669, "epoch": 2798} {"train_loss": -42.320613861083984, "global_step": 338670, "epoch": 2798} {"train_loss": -42.07143783569336, "global_step": 338671, "epoch": 2798} {"train_loss": -42.864532470703125, "global_step": 338672, "epoch": 2798} {"train_loss": -42.86285400390625, "global_step": 338673, "epoch": 2798} {"train_loss": -43.14537048339844, "global_step": 338674, "epoch": 2798} {"train_loss": -43.12176513671875, "global_step": 338675, "epoch": 2798} {"train_loss": -43.291595458984375, "global_step": 338676, "epoch": 2798} {"train_loss": -41.796573638916016, "global_step": 338677, "epoch": 2798} {"train_loss": -42.153685892909024, "global_step": 338678, "epoch": 2798, "val_loss": 2785921.25} {"train_loss": -42.424556732177734, "global_step": 338679, "epoch": 2799} {"train_loss": -42.647972106933594, "global_step": 338680, "epoch": 2799} {"train_loss": -42.81496810913086, "global_step": 338681, "epoch": 2799} {"train_loss": -43.69819259643555, "global_step": 338682, "epoch": 2799} {"train_loss": -42.430442810058594, "global_step": 338683, "epoch": 2799} {"train_loss": -42.81580352783203, "global_step": 338684, "epoch": 2799} {"train_loss": -41.89683151245117, "global_step": 338685, "epoch": 2799} {"train_loss": -41.66228485107422, "global_step": 338686, "epoch": 2799} {"train_loss": -43.1146240234375, "global_step": 338687, "epoch": 2799} {"train_loss": -42.82540512084961, "global_step": 338688, "epoch": 2799} {"train_loss": -42.93844223022461, "global_step": 338689, "epoch": 2799} {"train_loss": -42.092689514160156, "global_step": 338690, "epoch": 2799} {"train_loss": -42.84934997558594, "global_step": 338691, "epoch": 2799} {"train_loss": -42.34444808959961, "global_step": 338692, "epoch": 2799} {"train_loss": -40.65653610229492, "global_step": 338693, "epoch": 2799} {"train_loss": -39.2120361328125, "global_step": 338694, "epoch": 2799} {"train_loss": -40.73218536376953, "global_step": 338695, "epoch": 2799} {"train_loss": -38.91376876831055, "global_step": 338696, "epoch": 2799} {"train_loss": -41.913578033447266, "global_step": 338697, "epoch": 2799} {"train_loss": -39.81424331665039, "global_step": 338698, "epoch": 2799} {"train_loss": -38.44183349609375, "global_step": 338699, "epoch": 2799} {"train_loss": -42.05253219604492, "global_step": 338700, "epoch": 2799} {"train_loss": -40.185726165771484, "global_step": 338701, "epoch": 2799} {"train_loss": -42.096961975097656, "global_step": 338702, "epoch": 2799} {"train_loss": -40.61507797241211, "global_step": 338703, "epoch": 2799} {"train_loss": -41.59033966064453, "global_step": 338704, "epoch": 2799} {"train_loss": -41.75564193725586, "global_step": 338705, "epoch": 2799} {"train_loss": -42.49365234375, "global_step": 338706, "epoch": 2799} {"train_loss": -41.982704162597656, "global_step": 338707, "epoch": 2799} {"train_loss": -43.07328796386719, "global_step": 338708, "epoch": 2799} {"train_loss": -41.28998565673828, "global_step": 338709, "epoch": 2799} {"train_loss": -42.946563720703125, "global_step": 338710, "epoch": 2799} {"train_loss": -42.82929611206055, "global_step": 338711, "epoch": 2799} {"train_loss": -42.663734436035156, "global_step": 338712, "epoch": 2799} {"train_loss": -42.721656799316406, "global_step": 338713, "epoch": 2799} {"train_loss": -39.24610137939453, "global_step": 338714, "epoch": 2799} {"train_loss": -42.245967864990234, "global_step": 338715, "epoch": 2799} {"train_loss": -42.75396728515625, "global_step": 338716, "epoch": 2799} {"train_loss": -42.89044189453125, "global_step": 338717, "epoch": 2799} {"train_loss": -42.51181411743164, "global_step": 338718, "epoch": 2799} {"train_loss": -42.92221450805664, "global_step": 338719, "epoch": 2799} {"train_loss": -41.58143997192383, "global_step": 338720, "epoch": 2799} {"train_loss": -43.26467514038086, "global_step": 338721, "epoch": 2799} {"train_loss": -41.50275421142578, "global_step": 338722, "epoch": 2799} {"train_loss": -42.84797286987305, "global_step": 338723, "epoch": 2799} {"train_loss": -42.5685920715332, "global_step": 338724, "epoch": 2799} {"train_loss": -43.43838882446289, "global_step": 338725, "epoch": 2799} {"train_loss": -42.423580169677734, "global_step": 338726, "epoch": 2799} {"train_loss": -43.020362854003906, "global_step": 338727, "epoch": 2799} {"train_loss": -43.72732162475586, "global_step": 338728, "epoch": 2799} {"train_loss": -43.8339958190918, "global_step": 338729, "epoch": 2799} {"train_loss": -41.99665832519531, "global_step": 338730, "epoch": 2799} {"train_loss": -43.788787841796875, "global_step": 338731, "epoch": 2799} {"train_loss": -43.509361267089844, "global_step": 338732, "epoch": 2799} {"train_loss": -43.0155143737793, "global_step": 338733, "epoch": 2799} {"train_loss": -43.79067611694336, "global_step": 338734, "epoch": 2799} {"train_loss": -35.39414596557617, "global_step": 338735, "epoch": 2799} {"train_loss": -43.70742416381836, "global_step": 338736, "epoch": 2799} {"train_loss": -43.5959358215332, "global_step": 338737, "epoch": 2799} {"train_loss": -43.075313568115234, "global_step": 338738, "epoch": 2799} {"train_loss": -43.24540710449219, "global_step": 338739, "epoch": 2799} {"train_loss": -43.785560607910156, "global_step": 338740, "epoch": 2799} {"train_loss": -43.03364181518555, "global_step": 338741, "epoch": 2799} {"train_loss": -43.63026809692383, "global_step": 338742, "epoch": 2799} {"train_loss": -43.8253059387207, "global_step": 338743, "epoch": 2799} {"train_loss": -42.81173324584961, "global_step": 338744, "epoch": 2799} {"train_loss": -42.87928009033203, "global_step": 338745, "epoch": 2799} {"train_loss": -42.16287612915039, "global_step": 338746, "epoch": 2799} {"train_loss": -42.55587387084961, "global_step": 338747, "epoch": 2799} {"train_loss": -41.3174934387207, "global_step": 338748, "epoch": 2799} {"train_loss": -42.9754638671875, "global_step": 338749, "epoch": 2799} {"train_loss": -43.080745697021484, "global_step": 338750, "epoch": 2799} {"train_loss": -39.60589599609375, "global_step": 338751, "epoch": 2799} {"train_loss": -42.54610824584961, "global_step": 338752, "epoch": 2799} {"train_loss": -42.76237106323242, "global_step": 338753, "epoch": 2799} {"train_loss": -42.3674201965332, "global_step": 338754, "epoch": 2799} {"train_loss": -41.07597732543945, "global_step": 338755, "epoch": 2799} {"train_loss": -41.62177276611328, "global_step": 338756, "epoch": 2799} {"train_loss": -41.08163070678711, "global_step": 338757, "epoch": 2799} {"train_loss": -42.40975570678711, "global_step": 338758, "epoch": 2799} {"train_loss": -41.993404388427734, "global_step": 338759, "epoch": 2799} {"train_loss": -42.75172424316406, "global_step": 338760, "epoch": 2799} {"train_loss": -42.04745101928711, "global_step": 338761, "epoch": 2799} {"train_loss": -41.71646499633789, "global_step": 338762, "epoch": 2799} {"train_loss": -40.77694320678711, "global_step": 338763, "epoch": 2799} {"train_loss": -39.508270263671875, "global_step": 338764, "epoch": 2799} {"train_loss": -40.22866439819336, "global_step": 338765, "epoch": 2799} {"train_loss": -38.10544967651367, "global_step": 338766, "epoch": 2799} {"train_loss": -41.72478485107422, "global_step": 338767, "epoch": 2799} {"train_loss": -40.03916549682617, "global_step": 338768, "epoch": 2799} {"train_loss": -39.068538665771484, "global_step": 338769, "epoch": 2799} {"train_loss": -40.82329177856445, "global_step": 338770, "epoch": 2799} {"train_loss": -38.60527801513672, "global_step": 338771, "epoch": 2799} {"train_loss": -41.177978515625, "global_step": 338772, "epoch": 2799} {"train_loss": -42.2395133972168, "global_step": 338773, "epoch": 2799} {"train_loss": -40.37300491333008, "global_step": 338774, "epoch": 2799} {"train_loss": -41.611183166503906, "global_step": 338775, "epoch": 2799} {"train_loss": -41.491485595703125, "global_step": 338776, "epoch": 2799} {"train_loss": -41.724605560302734, "global_step": 338777, "epoch": 2799} {"train_loss": -42.35099411010742, "global_step": 338778, "epoch": 2799} {"train_loss": -39.769256591796875, "global_step": 338779, "epoch": 2799} {"train_loss": -40.73317337036133, "global_step": 338780, "epoch": 2799} {"train_loss": -42.73108673095703, "global_step": 338781, "epoch": 2799} {"train_loss": -41.236724853515625, "global_step": 338782, "epoch": 2799} {"train_loss": -42.079750061035156, "global_step": 338783, "epoch": 2799} {"train_loss": -37.96430206298828, "global_step": 338784, "epoch": 2799} {"train_loss": -40.59371566772461, "global_step": 338785, "epoch": 2799} {"train_loss": -42.15162658691406, "global_step": 338786, "epoch": 2799} {"train_loss": -35.02351379394531, "global_step": 338787, "epoch": 2799} {"train_loss": -41.81952667236328, "global_step": 338788, "epoch": 2799} {"train_loss": -40.78220748901367, "global_step": 338789, "epoch": 2799} {"train_loss": -42.14284896850586, "global_step": 338790, "epoch": 2799} {"train_loss": -42.33240509033203, "global_step": 338791, "epoch": 2799} {"train_loss": -41.15078353881836, "global_step": 338792, "epoch": 2799} {"train_loss": -42.50606155395508, "global_step": 338793, "epoch": 2799} {"train_loss": -42.01717758178711, "global_step": 338794, "epoch": 2799} {"train_loss": -42.63395309448242, "global_step": 338795, "epoch": 2799} {"train_loss": -41.60890579223633, "global_step": 338796, "epoch": 2799} {"train_loss": -40.920345306396484, "global_step": 338797, "epoch": 2799} {"train_loss": -40.34907150268555, "global_step": 338798, "epoch": 2799} {"train_loss": -41.79459254997821, "global_step": 338799, "epoch": 2799, "val_loss": 2505675.25} {"train_loss": -42.91146469116211, "global_step": 338800, "epoch": 2800} {"train_loss": -41.76255416870117, "global_step": 338801, "epoch": 2800} {"train_loss": -43.04862594604492, "global_step": 338802, "epoch": 2800} {"train_loss": -40.835872650146484, "global_step": 338803, "epoch": 2800} {"train_loss": -42.614559173583984, "global_step": 338804, "epoch": 2800} {"train_loss": -42.84452438354492, "global_step": 338805, "epoch": 2800} {"train_loss": -42.54976272583008, "global_step": 338806, "epoch": 2800} {"train_loss": -43.31239700317383, "global_step": 338807, "epoch": 2800} {"train_loss": -41.955299377441406, "global_step": 338808, "epoch": 2800} {"train_loss": -42.96864318847656, "global_step": 338809, "epoch": 2800} {"train_loss": -41.676368713378906, "global_step": 338810, "epoch": 2800} {"train_loss": -42.99496078491211, "global_step": 338811, "epoch": 2800} {"train_loss": -41.3431396484375, "global_step": 338812, "epoch": 2800} {"train_loss": -43.13986587524414, "global_step": 338813, "epoch": 2800} {"train_loss": -42.69428253173828, "global_step": 338814, "epoch": 2800} {"train_loss": -41.82438278198242, "global_step": 338815, "epoch": 2800} {"train_loss": -43.35710525512695, "global_step": 338816, "epoch": 2800} {"train_loss": -42.9724235534668, "global_step": 338817, "epoch": 2800} {"train_loss": -42.83651351928711, "global_step": 338818, "epoch": 2800} {"train_loss": -43.36528778076172, "global_step": 338819, "epoch": 2800} {"train_loss": -42.700435638427734, "global_step": 338820, "epoch": 2800} {"train_loss": -43.5481071472168, "global_step": 338821, "epoch": 2800} {"train_loss": -40.9892692565918, "global_step": 338822, "epoch": 2800} {"train_loss": -43.54853439331055, "global_step": 338823, "epoch": 2800} {"train_loss": -43.2003059387207, "global_step": 338824, "epoch": 2800} {"train_loss": -42.65627670288086, "global_step": 338825, "epoch": 2800} {"train_loss": -40.274742126464844, "global_step": 338826, "epoch": 2800} {"train_loss": -42.77313232421875, "global_step": 338827, "epoch": 2800} {"train_loss": -43.30666732788086, "global_step": 338828, "epoch": 2800} {"train_loss": -42.60221481323242, "global_step": 338829, "epoch": 2800} {"train_loss": -43.953857421875, "global_step": 338830, "epoch": 2800} {"train_loss": -43.461944580078125, "global_step": 338831, "epoch": 2800} {"train_loss": -42.94154739379883, "global_step": 338832, "epoch": 2800} {"train_loss": -41.65883255004883, "global_step": 338833, "epoch": 2800} {"train_loss": -41.9871826171875, "global_step": 338834, "epoch": 2800} {"train_loss": -43.69094467163086, "global_step": 338835, "epoch": 2800} {"train_loss": -43.69574737548828, "global_step": 338836, "epoch": 2800} {"train_loss": -43.1285400390625, "global_step": 338837, "epoch": 2800} {"train_loss": -43.751216888427734, "global_step": 338838, "epoch": 2800} {"train_loss": -43.36170196533203, "global_step": 338839, "epoch": 2800} {"train_loss": -43.12586212158203, "global_step": 338840, "epoch": 2800} {"train_loss": -42.59853744506836, "global_step": 338841, "epoch": 2800} {"train_loss": -43.228755950927734, "global_step": 338842, "epoch": 2800} {"train_loss": -42.80560302734375, "global_step": 338843, "epoch": 2800} {"train_loss": -42.74158477783203, "global_step": 338844, "epoch": 2800} {"train_loss": -44.20518112182617, "global_step": 338845, "epoch": 2800} {"train_loss": -43.423030853271484, "global_step": 338846, "epoch": 2800} {"train_loss": -42.932830810546875, "global_step": 338847, "epoch": 2800} {"train_loss": -42.83203887939453, "global_step": 338848, "epoch": 2800} {"train_loss": -43.422821044921875, "global_step": 338849, "epoch": 2800} {"train_loss": -43.284454345703125, "global_step": 338850, "epoch": 2800} {"train_loss": -42.45735549926758, "global_step": 338851, "epoch": 2800} {"train_loss": -43.33858871459961, "global_step": 338852, "epoch": 2800} {"train_loss": -43.232418060302734, "global_step": 338853, "epoch": 2800} {"train_loss": -43.49758529663086, "global_step": 338854, "epoch": 2800} {"train_loss": -42.83681106567383, "global_step": 338855, "epoch": 2800} {"train_loss": -43.58504104614258, "global_step": 338856, "epoch": 2800} {"train_loss": -42.22621536254883, "global_step": 338857, "epoch": 2800} {"train_loss": -43.28953552246094, "global_step": 338858, "epoch": 2800} {"train_loss": -42.837886810302734, "global_step": 338859, "epoch": 2800} {"train_loss": -42.763179779052734, "global_step": 338860, "epoch": 2800} {"train_loss": -41.06754684448242, "global_step": 338861, "epoch": 2800} {"train_loss": -42.297733306884766, "global_step": 338862, "epoch": 2800} {"train_loss": -43.341148376464844, "global_step": 338863, "epoch": 2800} {"train_loss": -41.353370666503906, "global_step": 338864, "epoch": 2800} {"train_loss": -41.814727783203125, "global_step": 338865, "epoch": 2800} {"train_loss": -42.71842575073242, "global_step": 338866, "epoch": 2800} {"train_loss": -43.772666931152344, "global_step": 338867, "epoch": 2800} {"train_loss": -41.800987243652344, "global_step": 338868, "epoch": 2800} {"train_loss": -42.40231704711914, "global_step": 338869, "epoch": 2800} {"train_loss": -43.54800796508789, "global_step": 338870, "epoch": 2800} {"train_loss": -42.308345794677734, "global_step": 338871, "epoch": 2800} {"train_loss": -42.223567962646484, "global_step": 338872, "epoch": 2800} {"train_loss": -43.47048568725586, "global_step": 338873, "epoch": 2800} {"train_loss": -43.1467170715332, "global_step": 338874, "epoch": 2800} {"train_loss": -41.932464599609375, "global_step": 338875, "epoch": 2800} {"train_loss": -43.150753021240234, "global_step": 338876, "epoch": 2800} {"train_loss": -42.99589157104492, "global_step": 338877, "epoch": 2800} {"train_loss": -42.484344482421875, "global_step": 338878, "epoch": 2800} {"train_loss": -42.24213409423828, "global_step": 338879, "epoch": 2800} {"train_loss": -42.52075958251953, "global_step": 338880, "epoch": 2800} {"train_loss": -42.9400634765625, "global_step": 338881, "epoch": 2800} {"train_loss": -42.15050506591797, "global_step": 338882, "epoch": 2800} {"train_loss": -42.39781188964844, "global_step": 338883, "epoch": 2800} {"train_loss": -44.03602981567383, "global_step": 338884, "epoch": 2800} {"train_loss": -42.712154388427734, "global_step": 338885, "epoch": 2800} {"train_loss": -43.29172897338867, "global_step": 338886, "epoch": 2800} {"train_loss": -43.4182243347168, "global_step": 338887, "epoch": 2800} {"train_loss": -43.19828414916992, "global_step": 338888, "epoch": 2800} {"train_loss": -43.53214645385742, "global_step": 338889, "epoch": 2800} {"train_loss": -43.53839874267578, "global_step": 338890, "epoch": 2800} {"train_loss": -43.47103500366211, "global_step": 338891, "epoch": 2800} {"train_loss": -43.144798278808594, "global_step": 338892, "epoch": 2800} {"train_loss": -43.60660934448242, "global_step": 338893, "epoch": 2800} {"train_loss": -41.9404182434082, "global_step": 338894, "epoch": 2800} {"train_loss": -41.861114501953125, "global_step": 338895, "epoch": 2800} {"train_loss": -42.38299560546875, "global_step": 338896, "epoch": 2800} {"train_loss": -43.378292083740234, "global_step": 338897, "epoch": 2800} {"train_loss": -42.70868682861328, "global_step": 338898, "epoch": 2800} {"train_loss": -42.820064544677734, "global_step": 338899, "epoch": 2800} {"train_loss": -42.93488311767578, "global_step": 338900, "epoch": 2800} {"train_loss": -43.78067398071289, "global_step": 338901, "epoch": 2800} {"train_loss": -42.817596435546875, "global_step": 338902, "epoch": 2800} {"train_loss": -42.15776443481445, "global_step": 338903, "epoch": 2800} {"train_loss": -41.74408721923828, "global_step": 338904, "epoch": 2800} {"train_loss": -42.43470001220703, "global_step": 338905, "epoch": 2800} {"train_loss": -42.90476608276367, "global_step": 338906, "epoch": 2800} {"train_loss": -43.27524948120117, "global_step": 338907, "epoch": 2800} {"train_loss": -43.50707244873047, "global_step": 338908, "epoch": 2800} {"train_loss": -43.219154357910156, "global_step": 338909, "epoch": 2800} {"train_loss": -43.190250396728516, "global_step": 338910, "epoch": 2800} {"train_loss": -42.76694869995117, "global_step": 338911, "epoch": 2800} {"train_loss": -43.143428802490234, "global_step": 338912, "epoch": 2800} {"train_loss": -43.332698822021484, "global_step": 338913, "epoch": 2800} {"train_loss": -42.185970306396484, "global_step": 338914, "epoch": 2800} {"train_loss": -43.761962890625, "global_step": 338915, "epoch": 2800} {"train_loss": -44.0612678527832, "global_step": 338916, "epoch": 2800} {"train_loss": -42.63608169555664, "global_step": 338917, "epoch": 2800} {"train_loss": -41.80613708496094, "global_step": 338918, "epoch": 2800} {"train_loss": -43.1118278503418, "global_step": 338919, "epoch": 2800} {"train_loss": -42.82583791559393, "global_step": 338920, "epoch": 2800, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2555153.5} {"train_loss": -42.971221923828125, "global_step": 338921, "epoch": 2801} {"train_loss": -42.178375244140625, "global_step": 338922, "epoch": 2801} {"train_loss": -43.0789680480957, "global_step": 338923, "epoch": 2801} {"train_loss": -43.0289192199707, "global_step": 338924, "epoch": 2801} {"train_loss": -42.820072174072266, "global_step": 338925, "epoch": 2801} {"train_loss": -42.98739242553711, "global_step": 338926, "epoch": 2801} {"train_loss": -43.14936065673828, "global_step": 338927, "epoch": 2801} {"train_loss": -43.33417510986328, "global_step": 338928, "epoch": 2801} {"train_loss": -43.044429779052734, "global_step": 338929, "epoch": 2801} {"train_loss": -43.63969802856445, "global_step": 338930, "epoch": 2801} {"train_loss": -43.57354736328125, "global_step": 338931, "epoch": 2801} {"train_loss": -43.92599105834961, "global_step": 338932, "epoch": 2801} {"train_loss": -41.83864212036133, "global_step": 338933, "epoch": 2801} {"train_loss": -42.752811431884766, "global_step": 338934, "epoch": 2801} {"train_loss": -42.622615814208984, "global_step": 338935, "epoch": 2801} {"train_loss": -42.51839828491211, "global_step": 338936, "epoch": 2801} {"train_loss": -43.40332794189453, "global_step": 338937, "epoch": 2801} {"train_loss": -42.51911163330078, "global_step": 338938, "epoch": 2801} {"train_loss": -43.08340072631836, "global_step": 338939, "epoch": 2801} {"train_loss": -43.31187057495117, "global_step": 338940, "epoch": 2801} {"train_loss": -41.93341064453125, "global_step": 338941, "epoch": 2801} {"train_loss": -42.79097366333008, "global_step": 338942, "epoch": 2801} {"train_loss": -43.46611022949219, "global_step": 338943, "epoch": 2801} {"train_loss": -42.564918518066406, "global_step": 338944, "epoch": 2801} {"train_loss": -43.5629997253418, "global_step": 338945, "epoch": 2801} {"train_loss": -42.900142669677734, "global_step": 338946, "epoch": 2801} {"train_loss": -43.93931198120117, "global_step": 338947, "epoch": 2801} {"train_loss": -43.53036117553711, "global_step": 338948, "epoch": 2801} {"train_loss": -43.58443832397461, "global_step": 338949, "epoch": 2801} {"train_loss": -43.9777717590332, "global_step": 338950, "epoch": 2801} {"train_loss": -43.39046859741211, "global_step": 338951, "epoch": 2801} {"train_loss": -43.770263671875, "global_step": 338952, "epoch": 2801} {"train_loss": -42.76301193237305, "global_step": 338953, "epoch": 2801} {"train_loss": -43.03768539428711, "global_step": 338954, "epoch": 2801} {"train_loss": -43.67584991455078, "global_step": 338955, "epoch": 2801} {"train_loss": -43.55655288696289, "global_step": 338956, "epoch": 2801} {"train_loss": -41.9211540222168, "global_step": 338957, "epoch": 2801} {"train_loss": -42.04279708862305, "global_step": 338958, "epoch": 2801} {"train_loss": -43.2374153137207, "global_step": 338959, "epoch": 2801} {"train_loss": -43.592647552490234, "global_step": 338960, "epoch": 2801} {"train_loss": -42.15040969848633, "global_step": 338961, "epoch": 2801} {"train_loss": -43.10565185546875, "global_step": 338962, "epoch": 2801} {"train_loss": -43.68240737915039, "global_step": 338963, "epoch": 2801} {"train_loss": -42.88743591308594, "global_step": 338964, "epoch": 2801} {"train_loss": -42.297088623046875, "global_step": 338965, "epoch": 2801} {"train_loss": -43.22750473022461, "global_step": 338966, "epoch": 2801} {"train_loss": -42.2216796875, "global_step": 338967, "epoch": 2801} {"train_loss": -41.59158706665039, "global_step": 338968, "epoch": 2801} {"train_loss": -43.5289421081543, "global_step": 338969, "epoch": 2801} {"train_loss": -43.28776168823242, "global_step": 338970, "epoch": 2801} {"train_loss": -39.94002914428711, "global_step": 338971, "epoch": 2801} {"train_loss": -43.624515533447266, "global_step": 338972, "epoch": 2801} {"train_loss": -39.63721466064453, "global_step": 338973, "epoch": 2801} {"train_loss": -42.671791076660156, "global_step": 338974, "epoch": 2801} {"train_loss": -43.888790130615234, "global_step": 338975, "epoch": 2801} {"train_loss": -43.473243713378906, "global_step": 338976, "epoch": 2801} {"train_loss": -42.172149658203125, "global_step": 338977, "epoch": 2801} {"train_loss": -43.51184844970703, "global_step": 338978, "epoch": 2801} {"train_loss": -41.8990364074707, "global_step": 338979, "epoch": 2801} {"train_loss": -41.63800811767578, "global_step": 338980, "epoch": 2801} {"train_loss": -42.257080078125, "global_step": 338981, "epoch": 2801} {"train_loss": -43.89592361450195, "global_step": 338982, "epoch": 2801} {"train_loss": -34.41981887817383, "global_step": 338983, "epoch": 2801} {"train_loss": -42.33978271484375, "global_step": 338984, "epoch": 2801} {"train_loss": -39.26611328125, "global_step": 338985, "epoch": 2801} {"train_loss": -43.12604522705078, "global_step": 338986, "epoch": 2801} {"train_loss": -42.74333190917969, "global_step": 338987, "epoch": 2801} {"train_loss": -42.513668060302734, "global_step": 338988, "epoch": 2801} {"train_loss": -41.91939163208008, "global_step": 338989, "epoch": 2801} {"train_loss": -42.9157829284668, "global_step": 338990, "epoch": 2801} {"train_loss": -43.14168930053711, "global_step": 338991, "epoch": 2801} {"train_loss": -43.0026969909668, "global_step": 338992, "epoch": 2801} {"train_loss": -43.0754508972168, "global_step": 338993, "epoch": 2801} {"train_loss": -42.717933654785156, "global_step": 338994, "epoch": 2801} {"train_loss": -43.0020866394043, "global_step": 338995, "epoch": 2801} {"train_loss": -43.014095306396484, "global_step": 338996, "epoch": 2801} {"train_loss": -42.214385986328125, "global_step": 338997, "epoch": 2801} {"train_loss": -43.88650131225586, "global_step": 338998, "epoch": 2801} {"train_loss": -44.040897369384766, "global_step": 338999, "epoch": 2801} {"train_loss": -43.561805725097656, "global_step": 339000, "epoch": 2801} {"train_loss": -43.99026107788086, "global_step": 339001, "epoch": 2801} {"train_loss": -43.74789047241211, "global_step": 339002, "epoch": 2801} {"train_loss": -44.0738639831543, "global_step": 339003, "epoch": 2801} {"train_loss": -43.83449935913086, "global_step": 339004, "epoch": 2801} {"train_loss": -43.63047409057617, "global_step": 339005, "epoch": 2801} {"train_loss": -43.95972442626953, "global_step": 339006, "epoch": 2801} {"train_loss": -43.93746566772461, "global_step": 339007, "epoch": 2801} {"train_loss": -43.90961837768555, "global_step": 339008, "epoch": 2801} {"train_loss": -42.3935432434082, "global_step": 339009, "epoch": 2801} {"train_loss": -43.719390869140625, "global_step": 339010, "epoch": 2801} {"train_loss": -43.35549545288086, "global_step": 339011, "epoch": 2801} {"train_loss": -41.204925537109375, "global_step": 339012, "epoch": 2801} {"train_loss": -43.58264923095703, "global_step": 339013, "epoch": 2801} {"train_loss": -44.120391845703125, "global_step": 339014, "epoch": 2801} {"train_loss": -43.38705062866211, "global_step": 339015, "epoch": 2801} {"train_loss": -43.43436813354492, "global_step": 339016, "epoch": 2801} {"train_loss": -44.19782257080078, "global_step": 339017, "epoch": 2801} {"train_loss": -43.669898986816406, "global_step": 339018, "epoch": 2801} {"train_loss": -44.234954833984375, "global_step": 339019, "epoch": 2801} {"train_loss": -43.27452087402344, "global_step": 339020, "epoch": 2801} {"train_loss": -44.00092697143555, "global_step": 339021, "epoch": 2801} {"train_loss": -43.8637809753418, "global_step": 339022, "epoch": 2801} {"train_loss": -43.96966552734375, "global_step": 339023, "epoch": 2801} {"train_loss": -43.94196319580078, "global_step": 339024, "epoch": 2801} {"train_loss": -43.866432189941406, "global_step": 339025, "epoch": 2801} {"train_loss": -44.220333099365234, "global_step": 339026, "epoch": 2801} {"train_loss": -44.09785842895508, "global_step": 339027, "epoch": 2801} {"train_loss": -43.61128616333008, "global_step": 339028, "epoch": 2801} {"train_loss": -43.68547058105469, "global_step": 339029, "epoch": 2801} {"train_loss": -43.725563049316406, "global_step": 339030, "epoch": 2801} {"train_loss": -44.36334991455078, "global_step": 339031, "epoch": 2801} {"train_loss": -43.35909652709961, "global_step": 339032, "epoch": 2801} {"train_loss": -43.74264144897461, "global_step": 339033, "epoch": 2801} {"train_loss": -43.516944885253906, "global_step": 339034, "epoch": 2801} {"train_loss": -43.106048583984375, "global_step": 339035, "epoch": 2801} {"train_loss": -43.59542465209961, "global_step": 339036, "epoch": 2801} {"train_loss": -43.39889144897461, "global_step": 339037, "epoch": 2801} {"train_loss": -42.63810348510742, "global_step": 339038, "epoch": 2801} {"train_loss": -42.663387298583984, "global_step": 339039, "epoch": 2801} {"train_loss": -43.260719299316406, "global_step": 339040, "epoch": 2801} {"train_loss": -43.03639016269652, "global_step": 339041, "epoch": 2801, "val_loss": 2640367.0} {"train_loss": -43.3475341796875, "global_step": 339042, "epoch": 2802} {"train_loss": -44.19916534423828, "global_step": 339043, "epoch": 2802} {"train_loss": -41.44204330444336, "global_step": 339044, "epoch": 2802} {"train_loss": -42.18037796020508, "global_step": 339045, "epoch": 2802} {"train_loss": -43.1854362487793, "global_step": 339046, "epoch": 2802} {"train_loss": -44.07438278198242, "global_step": 339047, "epoch": 2802} {"train_loss": -43.906856536865234, "global_step": 339048, "epoch": 2802} {"train_loss": -43.946083068847656, "global_step": 339049, "epoch": 2802} {"train_loss": -43.104408264160156, "global_step": 339050, "epoch": 2802} {"train_loss": -43.17156982421875, "global_step": 339051, "epoch": 2802} {"train_loss": -43.91781234741211, "global_step": 339052, "epoch": 2802} {"train_loss": -44.65287399291992, "global_step": 339053, "epoch": 2802} {"train_loss": -44.115230560302734, "global_step": 339054, "epoch": 2802} {"train_loss": -43.62236404418945, "global_step": 339055, "epoch": 2802} {"train_loss": -43.43121337890625, "global_step": 339056, "epoch": 2802} {"train_loss": -43.91709899902344, "global_step": 339057, "epoch": 2802} {"train_loss": -43.57086181640625, "global_step": 339058, "epoch": 2802} {"train_loss": -43.88045883178711, "global_step": 339059, "epoch": 2802} {"train_loss": -43.29572296142578, "global_step": 339060, "epoch": 2802} {"train_loss": -43.336830139160156, "global_step": 339061, "epoch": 2802} {"train_loss": -43.51435470581055, "global_step": 339062, "epoch": 2802} {"train_loss": -43.81673049926758, "global_step": 339063, "epoch": 2802} {"train_loss": -44.17092514038086, "global_step": 339064, "epoch": 2802} {"train_loss": -44.36806106567383, "global_step": 339065, "epoch": 2802} {"train_loss": -43.44472885131836, "global_step": 339066, "epoch": 2802} {"train_loss": -43.668148040771484, "global_step": 339067, "epoch": 2802} {"train_loss": -44.05021667480469, "global_step": 339068, "epoch": 2802} {"train_loss": -43.44287872314453, "global_step": 339069, "epoch": 2802} {"train_loss": -43.8326530456543, "global_step": 339070, "epoch": 2802} {"train_loss": -44.1643180847168, "global_step": 339071, "epoch": 2802} {"train_loss": -44.3034553527832, "global_step": 339072, "epoch": 2802} {"train_loss": -43.88383865356445, "global_step": 339073, "epoch": 2802} {"train_loss": -43.35126495361328, "global_step": 339074, "epoch": 2802} {"train_loss": -44.06405258178711, "global_step": 339075, "epoch": 2802} {"train_loss": -44.723793029785156, "global_step": 339076, "epoch": 2802} {"train_loss": -43.87546157836914, "global_step": 339077, "epoch": 2802} {"train_loss": -43.69390869140625, "global_step": 339078, "epoch": 2802} {"train_loss": -41.81807327270508, "global_step": 339079, "epoch": 2802} {"train_loss": -39.97731399536133, "global_step": 339080, "epoch": 2802} {"train_loss": -41.21036911010742, "global_step": 339081, "epoch": 2802} {"train_loss": -44.49740219116211, "global_step": 339082, "epoch": 2802} {"train_loss": -37.59556198120117, "global_step": 339083, "epoch": 2802} {"train_loss": -41.2215690612793, "global_step": 339084, "epoch": 2802} {"train_loss": -42.10006332397461, "global_step": 339085, "epoch": 2802} {"train_loss": -42.36946105957031, "global_step": 339086, "epoch": 2802} {"train_loss": -41.87779235839844, "global_step": 339087, "epoch": 2802} {"train_loss": -42.6415901184082, "global_step": 339088, "epoch": 2802} {"train_loss": -43.377254486083984, "global_step": 339089, "epoch": 2802} {"train_loss": -42.83272933959961, "global_step": 339090, "epoch": 2802} {"train_loss": -43.33590316772461, "global_step": 339091, "epoch": 2802} {"train_loss": -43.27055740356445, "global_step": 339092, "epoch": 2802} {"train_loss": -43.56510925292969, "global_step": 339093, "epoch": 2802} {"train_loss": -42.87726593017578, "global_step": 339094, "epoch": 2802} {"train_loss": -43.73518753051758, "global_step": 339095, "epoch": 2802} {"train_loss": -43.764766693115234, "global_step": 339096, "epoch": 2802} {"train_loss": -44.31449890136719, "global_step": 339097, "epoch": 2802} {"train_loss": -42.92000961303711, "global_step": 339098, "epoch": 2802} {"train_loss": -43.33982467651367, "global_step": 339099, "epoch": 2802} {"train_loss": -43.34455490112305, "global_step": 339100, "epoch": 2802} {"train_loss": -43.01365280151367, "global_step": 339101, "epoch": 2802} {"train_loss": -42.815494537353516, "global_step": 339102, "epoch": 2802} {"train_loss": -43.14177322387695, "global_step": 339103, "epoch": 2802} {"train_loss": -41.859954833984375, "global_step": 339104, "epoch": 2802} {"train_loss": -42.960975646972656, "global_step": 339105, "epoch": 2802} {"train_loss": -43.40270233154297, "global_step": 339106, "epoch": 2802} {"train_loss": -42.6891975402832, "global_step": 339107, "epoch": 2802} {"train_loss": -41.61328125, "global_step": 339108, "epoch": 2802} {"train_loss": -42.954158782958984, "global_step": 339109, "epoch": 2802} {"train_loss": -43.164974212646484, "global_step": 339110, "epoch": 2802} {"train_loss": -42.94478225708008, "global_step": 339111, "epoch": 2802} {"train_loss": -42.011112213134766, "global_step": 339112, "epoch": 2802} {"train_loss": -41.9496955871582, "global_step": 339113, "epoch": 2802} {"train_loss": -43.7185173034668, "global_step": 339114, "epoch": 2802} {"train_loss": -43.44841766357422, "global_step": 339115, "epoch": 2802} {"train_loss": -43.17433547973633, "global_step": 339116, "epoch": 2802} {"train_loss": -42.40729522705078, "global_step": 339117, "epoch": 2802} {"train_loss": -43.6795539855957, "global_step": 339118, "epoch": 2802} {"train_loss": -41.75708770751953, "global_step": 339119, "epoch": 2802} {"train_loss": -42.57231521606445, "global_step": 339120, "epoch": 2802} {"train_loss": -43.014930725097656, "global_step": 339121, "epoch": 2802} {"train_loss": -42.763694763183594, "global_step": 339122, "epoch": 2802} {"train_loss": -42.649200439453125, "global_step": 339123, "epoch": 2802} {"train_loss": -44.0775032043457, "global_step": 339124, "epoch": 2802} {"train_loss": -43.167232513427734, "global_step": 339125, "epoch": 2802} {"train_loss": -43.088191986083984, "global_step": 339126, "epoch": 2802} {"train_loss": -43.130428314208984, "global_step": 339127, "epoch": 2802} {"train_loss": -43.12428665161133, "global_step": 339128, "epoch": 2802} {"train_loss": -43.10357666015625, "global_step": 339129, "epoch": 2802} {"train_loss": -44.04918670654297, "global_step": 339130, "epoch": 2802} {"train_loss": -43.539649963378906, "global_step": 339131, "epoch": 2802} {"train_loss": -42.749786376953125, "global_step": 339132, "epoch": 2802} {"train_loss": -42.42002487182617, "global_step": 339133, "epoch": 2802} {"train_loss": -43.47254943847656, "global_step": 339134, "epoch": 2802} {"train_loss": -44.05472946166992, "global_step": 339135, "epoch": 2802} {"train_loss": -43.660789489746094, "global_step": 339136, "epoch": 2802} {"train_loss": -44.21790313720703, "global_step": 339137, "epoch": 2802} {"train_loss": -44.046791076660156, "global_step": 339138, "epoch": 2802} {"train_loss": -43.77048873901367, "global_step": 339139, "epoch": 2802} {"train_loss": -43.03049850463867, "global_step": 339140, "epoch": 2802} {"train_loss": -43.76557540893555, "global_step": 339141, "epoch": 2802} {"train_loss": -43.6191291809082, "global_step": 339142, "epoch": 2802} {"train_loss": -43.70284652709961, "global_step": 339143, "epoch": 2802} {"train_loss": -44.05531692504883, "global_step": 339144, "epoch": 2802} {"train_loss": -43.97333908081055, "global_step": 339145, "epoch": 2802} {"train_loss": -44.27606964111328, "global_step": 339146, "epoch": 2802} {"train_loss": -44.07736587524414, "global_step": 339147, "epoch": 2802} {"train_loss": -43.76234436035156, "global_step": 339148, "epoch": 2802} {"train_loss": -44.356056213378906, "global_step": 339149, "epoch": 2802} {"train_loss": -44.79419708251953, "global_step": 339150, "epoch": 2802} {"train_loss": -42.33831787109375, "global_step": 339151, "epoch": 2802} {"train_loss": -41.10422897338867, "global_step": 339152, "epoch": 2802} {"train_loss": -44.11479568481445, "global_step": 339153, "epoch": 2802} {"train_loss": -43.765621185302734, "global_step": 339154, "epoch": 2802} {"train_loss": -43.2402229309082, "global_step": 339155, "epoch": 2802} {"train_loss": -44.05923843383789, "global_step": 339156, "epoch": 2802} {"train_loss": -42.933685302734375, "global_step": 339157, "epoch": 2802} {"train_loss": -43.579036712646484, "global_step": 339158, "epoch": 2802} {"train_loss": -44.29854202270508, "global_step": 339159, "epoch": 2802} {"train_loss": -43.77272033691406, "global_step": 339160, "epoch": 2802} {"train_loss": -43.46180725097656, "global_step": 339161, "epoch": 2802} {"train_loss": -43.27811699859367, "global_step": 339162, "epoch": 2802, "val_loss": 2574692.75} {"train_loss": -43.07008361816406, "global_step": 339163, "epoch": 2803} {"train_loss": -43.15597915649414, "global_step": 339164, "epoch": 2803} {"train_loss": -43.6519889831543, "global_step": 339165, "epoch": 2803} {"train_loss": -43.2159538269043, "global_step": 339166, "epoch": 2803} {"train_loss": -43.85697555541992, "global_step": 339167, "epoch": 2803} {"train_loss": -44.30305862426758, "global_step": 339168, "epoch": 2803} {"train_loss": -43.9148063659668, "global_step": 339169, "epoch": 2803} {"train_loss": -43.74113845825195, "global_step": 339170, "epoch": 2803} {"train_loss": -44.428524017333984, "global_step": 339171, "epoch": 2803} {"train_loss": -44.49839401245117, "global_step": 339172, "epoch": 2803} {"train_loss": -43.92940902709961, "global_step": 339173, "epoch": 2803} {"train_loss": -43.674888610839844, "global_step": 339174, "epoch": 2803} {"train_loss": -44.49465560913086, "global_step": 339175, "epoch": 2803} {"train_loss": -43.71458435058594, "global_step": 339176, "epoch": 2803} {"train_loss": -43.12146759033203, "global_step": 339177, "epoch": 2803} {"train_loss": -44.05173873901367, "global_step": 339178, "epoch": 2803} {"train_loss": -43.45685577392578, "global_step": 339179, "epoch": 2803} {"train_loss": -43.10986328125, "global_step": 339180, "epoch": 2803} {"train_loss": -42.99943161010742, "global_step": 339181, "epoch": 2803} {"train_loss": -42.13882064819336, "global_step": 339182, "epoch": 2803} {"train_loss": -43.30670166015625, "global_step": 339183, "epoch": 2803} {"train_loss": -43.14677810668945, "global_step": 339184, "epoch": 2803} {"train_loss": -42.37973403930664, "global_step": 339185, "epoch": 2803} {"train_loss": -42.839935302734375, "global_step": 339186, "epoch": 2803} {"train_loss": -43.61282730102539, "global_step": 339187, "epoch": 2803} {"train_loss": -43.481807708740234, "global_step": 339188, "epoch": 2803} {"train_loss": -43.425533294677734, "global_step": 339189, "epoch": 2803} {"train_loss": -42.94898223876953, "global_step": 339190, "epoch": 2803} {"train_loss": -42.85235595703125, "global_step": 339191, "epoch": 2803} {"train_loss": -43.9390983581543, "global_step": 339192, "epoch": 2803} {"train_loss": -43.38190841674805, "global_step": 339193, "epoch": 2803} {"train_loss": -43.48845291137695, "global_step": 339194, "epoch": 2803} {"train_loss": -41.94171905517578, "global_step": 339195, "epoch": 2803} {"train_loss": -42.972042083740234, "global_step": 339196, "epoch": 2803} {"train_loss": -43.50051498413086, "global_step": 339197, "epoch": 2803} {"train_loss": -44.241146087646484, "global_step": 339198, "epoch": 2803} {"train_loss": -43.78953170776367, "global_step": 339199, "epoch": 2803} {"train_loss": -42.01535415649414, "global_step": 339200, "epoch": 2803} {"train_loss": -43.76750946044922, "global_step": 339201, "epoch": 2803} {"train_loss": -43.101837158203125, "global_step": 339202, "epoch": 2803} {"train_loss": -42.75313949584961, "global_step": 339203, "epoch": 2803} {"train_loss": -43.62971878051758, "global_step": 339204, "epoch": 2803} {"train_loss": -43.83020782470703, "global_step": 339205, "epoch": 2803} {"train_loss": -42.849666595458984, "global_step": 339206, "epoch": 2803} {"train_loss": -43.311317443847656, "global_step": 339207, "epoch": 2803} {"train_loss": -43.827980041503906, "global_step": 339208, "epoch": 2803} {"train_loss": -43.926544189453125, "global_step": 339209, "epoch": 2803} {"train_loss": -44.2501335144043, "global_step": 339210, "epoch": 2803} {"train_loss": -44.46345520019531, "global_step": 339211, "epoch": 2803} {"train_loss": -43.8835563659668, "global_step": 339212, "epoch": 2803} {"train_loss": -44.09968566894531, "global_step": 339213, "epoch": 2803} {"train_loss": -44.53049850463867, "global_step": 339214, "epoch": 2803} {"train_loss": -44.1447868347168, "global_step": 339215, "epoch": 2803} {"train_loss": -44.37224197387695, "global_step": 339216, "epoch": 2803} {"train_loss": -44.06047439575195, "global_step": 339217, "epoch": 2803} {"train_loss": -43.95294189453125, "global_step": 339218, "epoch": 2803} {"train_loss": -44.395294189453125, "global_step": 339219, "epoch": 2803} {"train_loss": -43.71247100830078, "global_step": 339220, "epoch": 2803} {"train_loss": -43.141075134277344, "global_step": 339221, "epoch": 2803} {"train_loss": -43.44793701171875, "global_step": 339222, "epoch": 2803} {"train_loss": -44.64794158935547, "global_step": 339223, "epoch": 2803} {"train_loss": -44.23623275756836, "global_step": 339224, "epoch": 2803} {"train_loss": -44.16549301147461, "global_step": 339225, "epoch": 2803} {"train_loss": -44.616790771484375, "global_step": 339226, "epoch": 2803} {"train_loss": -42.563262939453125, "global_step": 339227, "epoch": 2803} {"train_loss": -43.48651885986328, "global_step": 339228, "epoch": 2803} {"train_loss": -43.880489349365234, "global_step": 339229, "epoch": 2803} {"train_loss": -41.75520706176758, "global_step": 339230, "epoch": 2803} {"train_loss": -44.53646469116211, "global_step": 339231, "epoch": 2803} {"train_loss": -41.260284423828125, "global_step": 339232, "epoch": 2803} {"train_loss": -43.28109359741211, "global_step": 339233, "epoch": 2803} {"train_loss": -43.55440139770508, "global_step": 339234, "epoch": 2803} {"train_loss": -43.148719787597656, "global_step": 339235, "epoch": 2803} {"train_loss": -42.910552978515625, "global_step": 339236, "epoch": 2803} {"train_loss": -43.23841094970703, "global_step": 339237, "epoch": 2803} {"train_loss": -43.211666107177734, "global_step": 339238, "epoch": 2803} {"train_loss": -42.533260345458984, "global_step": 339239, "epoch": 2803} {"train_loss": -43.2489013671875, "global_step": 339240, "epoch": 2803} {"train_loss": -43.012603759765625, "global_step": 339241, "epoch": 2803} {"train_loss": -43.309852600097656, "global_step": 339242, "epoch": 2803} {"train_loss": -43.03416061401367, "global_step": 339243, "epoch": 2803} {"train_loss": -43.441585540771484, "global_step": 339244, "epoch": 2803} {"train_loss": -43.172508239746094, "global_step": 339245, "epoch": 2803} {"train_loss": -42.673763275146484, "global_step": 339246, "epoch": 2803} {"train_loss": -43.05648422241211, "global_step": 339247, "epoch": 2803} {"train_loss": -43.40212631225586, "global_step": 339248, "epoch": 2803} {"train_loss": -43.777130126953125, "global_step": 339249, "epoch": 2803} {"train_loss": -43.55082321166992, "global_step": 339250, "epoch": 2803} {"train_loss": -44.117897033691406, "global_step": 339251, "epoch": 2803} {"train_loss": -44.184608459472656, "global_step": 339252, "epoch": 2803} {"train_loss": -43.70005798339844, "global_step": 339253, "epoch": 2803} {"train_loss": -44.01831817626953, "global_step": 339254, "epoch": 2803} {"train_loss": -43.701942443847656, "global_step": 339255, "epoch": 2803} {"train_loss": -44.51631546020508, "global_step": 339256, "epoch": 2803} {"train_loss": -43.490840911865234, "global_step": 339257, "epoch": 2803} {"train_loss": -43.900238037109375, "global_step": 339258, "epoch": 2803} {"train_loss": -44.009700775146484, "global_step": 339259, "epoch": 2803} {"train_loss": -44.45998764038086, "global_step": 339260, "epoch": 2803} {"train_loss": -44.07534408569336, "global_step": 339261, "epoch": 2803} {"train_loss": -44.173553466796875, "global_step": 339262, "epoch": 2803} {"train_loss": -44.456233978271484, "global_step": 339263, "epoch": 2803} {"train_loss": -44.03936767578125, "global_step": 339264, "epoch": 2803} {"train_loss": -44.449790954589844, "global_step": 339265, "epoch": 2803} {"train_loss": -43.79081344604492, "global_step": 339266, "epoch": 2803} {"train_loss": -44.4793815612793, "global_step": 339267, "epoch": 2803} {"train_loss": -44.78479766845703, "global_step": 339268, "epoch": 2803} {"train_loss": -44.344520568847656, "global_step": 339269, "epoch": 2803} {"train_loss": -43.85158157348633, "global_step": 339270, "epoch": 2803} {"train_loss": -44.61116027832031, "global_step": 339271, "epoch": 2803} {"train_loss": -44.344356536865234, "global_step": 339272, "epoch": 2803} {"train_loss": -44.62725830078125, "global_step": 339273, "epoch": 2803} {"train_loss": -44.28096389770508, "global_step": 339274, "epoch": 2803} {"train_loss": -43.65485382080078, "global_step": 339275, "epoch": 2803} {"train_loss": -43.2194938659668, "global_step": 339276, "epoch": 2803} {"train_loss": -43.73393630981445, "global_step": 339277, "epoch": 2803} {"train_loss": -42.265743255615234, "global_step": 339278, "epoch": 2803} {"train_loss": -43.08138656616211, "global_step": 339279, "epoch": 2803} {"train_loss": -42.0470085144043, "global_step": 339280, "epoch": 2803} {"train_loss": -43.10543441772461, "global_step": 339281, "epoch": 2803} {"train_loss": -43.4219856262207, "global_step": 339282, "epoch": 2803} {"train_loss": -43.59225984053178, "global_step": 339283, "epoch": 2803, "val_loss": 2626174.0} {"train_loss": -44.184059143066406, "global_step": 339284, "epoch": 2804} {"train_loss": -44.5710563659668, "global_step": 339285, "epoch": 2804} {"train_loss": -44.206241607666016, "global_step": 339286, "epoch": 2804} {"train_loss": -43.380584716796875, "global_step": 339287, "epoch": 2804} {"train_loss": -43.34615707397461, "global_step": 339288, "epoch": 2804} {"train_loss": -43.519935607910156, "global_step": 339289, "epoch": 2804} {"train_loss": -44.06747055053711, "global_step": 339290, "epoch": 2804} {"train_loss": -43.7155876159668, "global_step": 339291, "epoch": 2804} {"train_loss": -43.33172607421875, "global_step": 339292, "epoch": 2804} {"train_loss": -41.7310791015625, "global_step": 339293, "epoch": 2804} {"train_loss": -44.44106674194336, "global_step": 339294, "epoch": 2804} {"train_loss": -42.04924392700195, "global_step": 339295, "epoch": 2804} {"train_loss": -41.66526412963867, "global_step": 339296, "epoch": 2804} {"train_loss": -43.42342758178711, "global_step": 339297, "epoch": 2804} {"train_loss": -40.07474899291992, "global_step": 339298, "epoch": 2804} {"train_loss": -43.88788604736328, "global_step": 339299, "epoch": 2804} {"train_loss": -41.15849685668945, "global_step": 339300, "epoch": 2804} {"train_loss": -42.202754974365234, "global_step": 339301, "epoch": 2804} {"train_loss": -43.003639221191406, "global_step": 339302, "epoch": 2804} {"train_loss": -42.76597213745117, "global_step": 339303, "epoch": 2804} {"train_loss": -41.61236572265625, "global_step": 339304, "epoch": 2804} {"train_loss": -43.49018859863281, "global_step": 339305, "epoch": 2804} {"train_loss": -42.784610748291016, "global_step": 339306, "epoch": 2804} {"train_loss": -42.07740783691406, "global_step": 339307, "epoch": 2804} {"train_loss": -44.17390060424805, "global_step": 339308, "epoch": 2804} {"train_loss": -41.43623352050781, "global_step": 339309, "epoch": 2804} {"train_loss": -42.76125717163086, "global_step": 339310, "epoch": 2804} {"train_loss": -43.645503997802734, "global_step": 339311, "epoch": 2804} {"train_loss": -41.81734085083008, "global_step": 339312, "epoch": 2804} {"train_loss": -44.17185592651367, "global_step": 339313, "epoch": 2804} {"train_loss": -42.37064743041992, "global_step": 339314, "epoch": 2804} {"train_loss": -42.7627067565918, "global_step": 339315, "epoch": 2804} {"train_loss": -43.17824172973633, "global_step": 339316, "epoch": 2804} {"train_loss": -41.64691925048828, "global_step": 339317, "epoch": 2804} {"train_loss": -43.19014358520508, "global_step": 339318, "epoch": 2804} {"train_loss": -42.593910217285156, "global_step": 339319, "epoch": 2804} {"train_loss": -43.475074768066406, "global_step": 339320, "epoch": 2804} {"train_loss": -40.95820236206055, "global_step": 339321, "epoch": 2804} {"train_loss": -43.82827377319336, "global_step": 339322, "epoch": 2804} {"train_loss": -42.941280364990234, "global_step": 339323, "epoch": 2804} {"train_loss": -42.74699020385742, "global_step": 339324, "epoch": 2804} {"train_loss": -43.461273193359375, "global_step": 339325, "epoch": 2804} {"train_loss": -42.71898651123047, "global_step": 339326, "epoch": 2804} {"train_loss": -43.18882751464844, "global_step": 339327, "epoch": 2804} {"train_loss": -42.7713508605957, "global_step": 339328, "epoch": 2804} {"train_loss": -43.506683349609375, "global_step": 339329, "epoch": 2804} {"train_loss": -42.76386642456055, "global_step": 339330, "epoch": 2804} {"train_loss": -44.175697326660156, "global_step": 339331, "epoch": 2804} {"train_loss": -43.12738800048828, "global_step": 339332, "epoch": 2804} {"train_loss": -43.15546798706055, "global_step": 339333, "epoch": 2804} {"train_loss": -42.90814208984375, "global_step": 339334, "epoch": 2804} {"train_loss": -43.03449630737305, "global_step": 339335, "epoch": 2804} {"train_loss": -42.22466278076172, "global_step": 339336, "epoch": 2804} {"train_loss": -43.134376525878906, "global_step": 339337, "epoch": 2804} {"train_loss": -43.243709564208984, "global_step": 339338, "epoch": 2804} {"train_loss": -42.887718200683594, "global_step": 339339, "epoch": 2804} {"train_loss": -43.51118087768555, "global_step": 339340, "epoch": 2804} {"train_loss": -43.6607666015625, "global_step": 339341, "epoch": 2804} {"train_loss": -43.29072189331055, "global_step": 339342, "epoch": 2804} {"train_loss": -44.00864791870117, "global_step": 339343, "epoch": 2804} {"train_loss": -43.49488830566406, "global_step": 339344, "epoch": 2804} {"train_loss": -42.5157585144043, "global_step": 339345, "epoch": 2804} {"train_loss": -43.773193359375, "global_step": 339346, "epoch": 2804} {"train_loss": -43.656105041503906, "global_step": 339347, "epoch": 2804} {"train_loss": -42.61224365234375, "global_step": 339348, "epoch": 2804} {"train_loss": -43.80851745605469, "global_step": 339349, "epoch": 2804} {"train_loss": -43.15830612182617, "global_step": 339350, "epoch": 2804} {"train_loss": -43.59452438354492, "global_step": 339351, "epoch": 2804} {"train_loss": -42.12911605834961, "global_step": 339352, "epoch": 2804} {"train_loss": -43.65816879272461, "global_step": 339353, "epoch": 2804} {"train_loss": -42.990787506103516, "global_step": 339354, "epoch": 2804} {"train_loss": -43.59780502319336, "global_step": 339355, "epoch": 2804} {"train_loss": -42.54376220703125, "global_step": 339356, "epoch": 2804} {"train_loss": -43.93793487548828, "global_step": 339357, "epoch": 2804} {"train_loss": -43.731510162353516, "global_step": 339358, "epoch": 2804} {"train_loss": -43.415740966796875, "global_step": 339359, "epoch": 2804} {"train_loss": -43.33930206298828, "global_step": 339360, "epoch": 2804} {"train_loss": -43.925506591796875, "global_step": 339361, "epoch": 2804} {"train_loss": -43.41511917114258, "global_step": 339362, "epoch": 2804} {"train_loss": -43.67184066772461, "global_step": 339363, "epoch": 2804} {"train_loss": -43.116485595703125, "global_step": 339364, "epoch": 2804} {"train_loss": -44.25822448730469, "global_step": 339365, "epoch": 2804} {"train_loss": -43.2878532409668, "global_step": 339366, "epoch": 2804} {"train_loss": -43.05336380004883, "global_step": 339367, "epoch": 2804} {"train_loss": -43.83707809448242, "global_step": 339368, "epoch": 2804} {"train_loss": -44.391136169433594, "global_step": 339369, "epoch": 2804} {"train_loss": -44.05217742919922, "global_step": 339370, "epoch": 2804} {"train_loss": -43.88732147216797, "global_step": 339371, "epoch": 2804} {"train_loss": -44.27164840698242, "global_step": 339372, "epoch": 2804} {"train_loss": -44.21782302856445, "global_step": 339373, "epoch": 2804} {"train_loss": -44.166255950927734, "global_step": 339374, "epoch": 2804} {"train_loss": -44.54340744018555, "global_step": 339375, "epoch": 2804} {"train_loss": -44.465877532958984, "global_step": 339376, "epoch": 2804} {"train_loss": -44.51374053955078, "global_step": 339377, "epoch": 2804} {"train_loss": -43.22251510620117, "global_step": 339378, "epoch": 2804} {"train_loss": -43.7264518737793, "global_step": 339379, "epoch": 2804} {"train_loss": -44.1588134765625, "global_step": 339380, "epoch": 2804} {"train_loss": -43.825862884521484, "global_step": 339381, "epoch": 2804} {"train_loss": -43.12098693847656, "global_step": 339382, "epoch": 2804} {"train_loss": -44.0012092590332, "global_step": 339383, "epoch": 2804} {"train_loss": -44.41281509399414, "global_step": 339384, "epoch": 2804} {"train_loss": -43.56340026855469, "global_step": 339385, "epoch": 2804} {"train_loss": -43.04598617553711, "global_step": 339386, "epoch": 2804} {"train_loss": -44.35405731201172, "global_step": 339387, "epoch": 2804} {"train_loss": -43.3465690612793, "global_step": 339388, "epoch": 2804} {"train_loss": -43.291690826416016, "global_step": 339389, "epoch": 2804} {"train_loss": -44.01201248168945, "global_step": 339390, "epoch": 2804} {"train_loss": -43.20830535888672, "global_step": 339391, "epoch": 2804} {"train_loss": -44.496734619140625, "global_step": 339392, "epoch": 2804} {"train_loss": -43.995113372802734, "global_step": 339393, "epoch": 2804} {"train_loss": -43.65630340576172, "global_step": 339394, "epoch": 2804} {"train_loss": -44.660762786865234, "global_step": 339395, "epoch": 2804} {"train_loss": -44.40972900390625, "global_step": 339396, "epoch": 2804} {"train_loss": -43.530921936035156, "global_step": 339397, "epoch": 2804} {"train_loss": -44.578826904296875, "global_step": 339398, "epoch": 2804} {"train_loss": -45.09357452392578, "global_step": 339399, "epoch": 2804} {"train_loss": -44.48625564575195, "global_step": 339400, "epoch": 2804} {"train_loss": -44.1452751159668, "global_step": 339401, "epoch": 2804} {"train_loss": -45.028594970703125, "global_step": 339402, "epoch": 2804} {"train_loss": -43.940425872802734, "global_step": 339403, "epoch": 2804} {"train_loss": -43.38237251723108, "global_step": 339404, "epoch": 2804, "val_loss": 2622827.75} {"train_loss": -44.65763473510742, "global_step": 339405, "epoch": 2805} {"train_loss": -44.21247482299805, "global_step": 339406, "epoch": 2805} {"train_loss": -44.58845901489258, "global_step": 339407, "epoch": 2805} {"train_loss": -44.8668098449707, "global_step": 339408, "epoch": 2805} {"train_loss": -44.76337432861328, "global_step": 339409, "epoch": 2805} {"train_loss": -44.98810958862305, "global_step": 339410, "epoch": 2805} {"train_loss": -44.50625228881836, "global_step": 339411, "epoch": 2805} {"train_loss": -45.42500686645508, "global_step": 339412, "epoch": 2805} {"train_loss": -44.535972595214844, "global_step": 339413, "epoch": 2805} {"train_loss": -44.53011703491211, "global_step": 339414, "epoch": 2805} {"train_loss": -45.30609893798828, "global_step": 339415, "epoch": 2805} {"train_loss": -44.68113327026367, "global_step": 339416, "epoch": 2805} {"train_loss": -44.36142349243164, "global_step": 339417, "epoch": 2805} {"train_loss": -44.14594650268555, "global_step": 339418, "epoch": 2805} {"train_loss": -44.76106643676758, "global_step": 339419, "epoch": 2805} {"train_loss": -43.81591796875, "global_step": 339420, "epoch": 2805} {"train_loss": -44.75197982788086, "global_step": 339421, "epoch": 2805} {"train_loss": -44.375587463378906, "global_step": 339422, "epoch": 2805} {"train_loss": -43.05847930908203, "global_step": 339423, "epoch": 2805} {"train_loss": -41.71269226074219, "global_step": 339424, "epoch": 2805} {"train_loss": -43.54429626464844, "global_step": 339425, "epoch": 2805} {"train_loss": -38.58179473876953, "global_step": 339426, "epoch": 2805} {"train_loss": -39.53395462036133, "global_step": 339427, "epoch": 2805} {"train_loss": -39.7467041015625, "global_step": 339428, "epoch": 2805} {"train_loss": -40.71928024291992, "global_step": 339429, "epoch": 2805} {"train_loss": -40.49290084838867, "global_step": 339430, "epoch": 2805} {"train_loss": -41.454158782958984, "global_step": 339431, "epoch": 2805} {"train_loss": -38.29008865356445, "global_step": 339432, "epoch": 2805} {"train_loss": -39.098812103271484, "global_step": 339433, "epoch": 2805} {"train_loss": -42.034786224365234, "global_step": 339434, "epoch": 2805} {"train_loss": -41.61804962158203, "global_step": 339435, "epoch": 2805} {"train_loss": -39.06144332885742, "global_step": 339436, "epoch": 2805} {"train_loss": -37.32769775390625, "global_step": 339437, "epoch": 2805} {"train_loss": -39.72053146362305, "global_step": 339438, "epoch": 2805} {"train_loss": -38.86928939819336, "global_step": 339439, "epoch": 2805} {"train_loss": -41.12969970703125, "global_step": 339440, "epoch": 2805} {"train_loss": -42.24203109741211, "global_step": 339441, "epoch": 2805} {"train_loss": -41.762054443359375, "global_step": 339442, "epoch": 2805} {"train_loss": -40.83958053588867, "global_step": 339443, "epoch": 2805} {"train_loss": -41.63911056518555, "global_step": 339444, "epoch": 2805} {"train_loss": -41.76414108276367, "global_step": 339445, "epoch": 2805} {"train_loss": -42.18254089355469, "global_step": 339446, "epoch": 2805} {"train_loss": -41.92770004272461, "global_step": 339447, "epoch": 2805} {"train_loss": -42.62209701538086, "global_step": 339448, "epoch": 2805} {"train_loss": -42.75323486328125, "global_step": 339449, "epoch": 2805} {"train_loss": -42.71723175048828, "global_step": 339450, "epoch": 2805} {"train_loss": -42.71946334838867, "global_step": 339451, "epoch": 2805} {"train_loss": -41.548160552978516, "global_step": 339452, "epoch": 2805} {"train_loss": -43.497657775878906, "global_step": 339453, "epoch": 2805} {"train_loss": -41.57087326049805, "global_step": 339454, "epoch": 2805} {"train_loss": -43.70235824584961, "global_step": 339455, "epoch": 2805} {"train_loss": -43.065242767333984, "global_step": 339456, "epoch": 2805} {"train_loss": -43.406063079833984, "global_step": 339457, "epoch": 2805} {"train_loss": -43.47080612182617, "global_step": 339458, "epoch": 2805} {"train_loss": -42.97137451171875, "global_step": 339459, "epoch": 2805} {"train_loss": -43.72510528564453, "global_step": 339460, "epoch": 2805} {"train_loss": -43.039581298828125, "global_step": 339461, "epoch": 2805} {"train_loss": -43.65145492553711, "global_step": 339462, "epoch": 2805} {"train_loss": -43.444942474365234, "global_step": 339463, "epoch": 2805} {"train_loss": -44.111854553222656, "global_step": 339464, "epoch": 2805} {"train_loss": -43.17255783081055, "global_step": 339465, "epoch": 2805} {"train_loss": -43.83066940307617, "global_step": 339466, "epoch": 2805} {"train_loss": -43.491493225097656, "global_step": 339467, "epoch": 2805} {"train_loss": -43.50112533569336, "global_step": 339468, "epoch": 2805} {"train_loss": -43.822662353515625, "global_step": 339469, "epoch": 2805} {"train_loss": -43.054412841796875, "global_step": 339470, "epoch": 2805} {"train_loss": -43.7491569519043, "global_step": 339471, "epoch": 2805} {"train_loss": -43.29013442993164, "global_step": 339472, "epoch": 2805} {"train_loss": -43.626708984375, "global_step": 339473, "epoch": 2805} {"train_loss": -43.26481246948242, "global_step": 339474, "epoch": 2805} {"train_loss": -43.48866271972656, "global_step": 339475, "epoch": 2805} {"train_loss": -43.282291412353516, "global_step": 339476, "epoch": 2805} {"train_loss": -44.063289642333984, "global_step": 339477, "epoch": 2805} {"train_loss": -43.21207809448242, "global_step": 339478, "epoch": 2805} {"train_loss": -43.86484909057617, "global_step": 339479, "epoch": 2805} {"train_loss": -43.860069274902344, "global_step": 339480, "epoch": 2805} {"train_loss": -43.667091369628906, "global_step": 339481, "epoch": 2805} {"train_loss": -44.276466369628906, "global_step": 339482, "epoch": 2805} {"train_loss": -44.39934158325195, "global_step": 339483, "epoch": 2805} {"train_loss": -43.805965423583984, "global_step": 339484, "epoch": 2805} {"train_loss": -44.273460388183594, "global_step": 339485, "epoch": 2805} {"train_loss": -44.33298873901367, "global_step": 339486, "epoch": 2805} {"train_loss": -44.76359939575195, "global_step": 339487, "epoch": 2805} {"train_loss": -43.354949951171875, "global_step": 339488, "epoch": 2805} {"train_loss": -44.61117935180664, "global_step": 339489, "epoch": 2805} {"train_loss": -44.06009292602539, "global_step": 339490, "epoch": 2805} {"train_loss": -44.174861907958984, "global_step": 339491, "epoch": 2805} {"train_loss": -44.35299301147461, "global_step": 339492, "epoch": 2805} {"train_loss": -44.76103591918945, "global_step": 339493, "epoch": 2805} {"train_loss": -44.9107551574707, "global_step": 339494, "epoch": 2805} {"train_loss": -44.49372100830078, "global_step": 339495, "epoch": 2805} {"train_loss": -44.60239791870117, "global_step": 339496, "epoch": 2805} {"train_loss": -44.388607025146484, "global_step": 339497, "epoch": 2805} {"train_loss": -44.45258712768555, "global_step": 339498, "epoch": 2805} {"train_loss": -44.953765869140625, "global_step": 339499, "epoch": 2805} {"train_loss": -44.406593322753906, "global_step": 339500, "epoch": 2805} {"train_loss": -44.993717193603516, "global_step": 339501, "epoch": 2805} {"train_loss": -44.91728591918945, "global_step": 339502, "epoch": 2805} {"train_loss": -44.893775939941406, "global_step": 339503, "epoch": 2805} {"train_loss": -44.6905632019043, "global_step": 339504, "epoch": 2805} {"train_loss": -44.65331268310547, "global_step": 339505, "epoch": 2805} {"train_loss": -45.24392318725586, "global_step": 339506, "epoch": 2805} {"train_loss": -45.24106979370117, "global_step": 339507, "epoch": 2805} {"train_loss": -45.00682067871094, "global_step": 339508, "epoch": 2805} {"train_loss": -44.58743667602539, "global_step": 339509, "epoch": 2805} {"train_loss": -45.07782745361328, "global_step": 339510, "epoch": 2805} {"train_loss": -45.388092041015625, "global_step": 339511, "epoch": 2805} {"train_loss": -45.07072448730469, "global_step": 339512, "epoch": 2805} {"train_loss": -44.55926513671875, "global_step": 339513, "epoch": 2805} {"train_loss": -45.09674072265625, "global_step": 339514, "epoch": 2805} {"train_loss": -44.76416015625, "global_step": 339515, "epoch": 2805} {"train_loss": -44.514129638671875, "global_step": 339516, "epoch": 2805} {"train_loss": -45.25172424316406, "global_step": 339517, "epoch": 2805} {"train_loss": -44.9061164855957, "global_step": 339518, "epoch": 2805} {"train_loss": -44.30434799194336, "global_step": 339519, "epoch": 2805} {"train_loss": -44.64613723754883, "global_step": 339520, "epoch": 2805} {"train_loss": -44.73003005981445, "global_step": 339521, "epoch": 2805} {"train_loss": -44.41035079956055, "global_step": 339522, "epoch": 2805} {"train_loss": -44.23185348510742, "global_step": 339523, "epoch": 2805} {"train_loss": -44.9869384765625, "global_step": 339524, "epoch": 2805} {"train_loss": -43.44579252132699, "global_step": 339525, "epoch": 2805, "val_loss": 2587404.25} {"train_loss": -43.23519515991211, "global_step": 339526, "epoch": 2806} {"train_loss": -43.7490348815918, "global_step": 339527, "epoch": 2806} {"train_loss": -43.27342224121094, "global_step": 339528, "epoch": 2806} {"train_loss": -44.58950424194336, "global_step": 339529, "epoch": 2806} {"train_loss": -41.962799072265625, "global_step": 339530, "epoch": 2806} {"train_loss": -40.193939208984375, "global_step": 339531, "epoch": 2806} {"train_loss": -40.371700286865234, "global_step": 339532, "epoch": 2806} {"train_loss": -42.645362854003906, "global_step": 339533, "epoch": 2806} {"train_loss": -42.78255844116211, "global_step": 339534, "epoch": 2806} {"train_loss": -43.935482025146484, "global_step": 339535, "epoch": 2806} {"train_loss": -43.345916748046875, "global_step": 339536, "epoch": 2806} {"train_loss": -38.7596435546875, "global_step": 339537, "epoch": 2806} {"train_loss": -38.907623291015625, "global_step": 339538, "epoch": 2806} {"train_loss": -38.45304489135742, "global_step": 339539, "epoch": 2806} {"train_loss": -40.82487106323242, "global_step": 339540, "epoch": 2806} {"train_loss": -39.24613571166992, "global_step": 339541, "epoch": 2806} {"train_loss": -33.32838439941406, "global_step": 339542, "epoch": 2806} {"train_loss": -41.51888656616211, "global_step": 339543, "epoch": 2806} {"train_loss": -33.46610641479492, "global_step": 339544, "epoch": 2806} {"train_loss": -37.86627960205078, "global_step": 339545, "epoch": 2806} {"train_loss": -37.75187301635742, "global_step": 339546, "epoch": 2806} {"train_loss": -35.35752487182617, "global_step": 339547, "epoch": 2806} {"train_loss": -40.183807373046875, "global_step": 339548, "epoch": 2806} {"train_loss": -38.228370666503906, "global_step": 339549, "epoch": 2806} {"train_loss": -38.41199493408203, "global_step": 339550, "epoch": 2806} {"train_loss": -42.52777099609375, "global_step": 339551, "epoch": 2806} {"train_loss": -39.181819915771484, "global_step": 339552, "epoch": 2806} {"train_loss": -42.14902877807617, "global_step": 339553, "epoch": 2806} {"train_loss": -40.78098678588867, "global_step": 339554, "epoch": 2806} {"train_loss": -42.27338790893555, "global_step": 339555, "epoch": 2806} {"train_loss": -40.30936813354492, "global_step": 339556, "epoch": 2806} {"train_loss": -42.839630126953125, "global_step": 339557, "epoch": 2806} {"train_loss": -41.08185958862305, "global_step": 339558, "epoch": 2806} {"train_loss": -43.43437957763672, "global_step": 339559, "epoch": 2806} {"train_loss": -41.16950225830078, "global_step": 339560, "epoch": 2806} {"train_loss": -42.98099899291992, "global_step": 339561, "epoch": 2806} {"train_loss": -42.040096282958984, "global_step": 339562, "epoch": 2806} {"train_loss": -43.27628707885742, "global_step": 339563, "epoch": 2806} {"train_loss": -41.44694519042969, "global_step": 339564, "epoch": 2806} {"train_loss": -43.07489013671875, "global_step": 339565, "epoch": 2806} {"train_loss": -43.056854248046875, "global_step": 339566, "epoch": 2806} {"train_loss": -42.48810577392578, "global_step": 339567, "epoch": 2806} {"train_loss": -42.70478057861328, "global_step": 339568, "epoch": 2806} {"train_loss": -42.63591384887695, "global_step": 339569, "epoch": 2806} {"train_loss": -43.76436996459961, "global_step": 339570, "epoch": 2806} {"train_loss": -43.307315826416016, "global_step": 339571, "epoch": 2806} {"train_loss": -43.78704833984375, "global_step": 339572, "epoch": 2806} {"train_loss": -43.951454162597656, "global_step": 339573, "epoch": 2806} {"train_loss": -43.578651428222656, "global_step": 339574, "epoch": 2806} {"train_loss": -43.834346771240234, "global_step": 339575, "epoch": 2806} {"train_loss": -43.43476486206055, "global_step": 339576, "epoch": 2806} {"train_loss": -43.908565521240234, "global_step": 339577, "epoch": 2806} {"train_loss": -43.76462936401367, "global_step": 339578, "epoch": 2806} {"train_loss": -43.249446868896484, "global_step": 339579, "epoch": 2806} {"train_loss": -43.50216293334961, "global_step": 339580, "epoch": 2806} {"train_loss": -43.80025100708008, "global_step": 339581, "epoch": 2806} {"train_loss": -44.29929733276367, "global_step": 339582, "epoch": 2806} {"train_loss": -44.21723556518555, "global_step": 339583, "epoch": 2806} {"train_loss": -44.47724533081055, "global_step": 339584, "epoch": 2806} {"train_loss": -43.643409729003906, "global_step": 339585, "epoch": 2806} {"train_loss": -44.398681640625, "global_step": 339586, "epoch": 2806} {"train_loss": -44.302085876464844, "global_step": 339587, "epoch": 2806} {"train_loss": -44.22966003417969, "global_step": 339588, "epoch": 2806} {"train_loss": -44.394752502441406, "global_step": 339589, "epoch": 2806} {"train_loss": -44.07355880737305, "global_step": 339590, "epoch": 2806} {"train_loss": -44.70103073120117, "global_step": 339591, "epoch": 2806} {"train_loss": -44.51079177856445, "global_step": 339592, "epoch": 2806} {"train_loss": -44.57404708862305, "global_step": 339593, "epoch": 2806} {"train_loss": -44.61946487426758, "global_step": 339594, "epoch": 2806} {"train_loss": -44.48709487915039, "global_step": 339595, "epoch": 2806} {"train_loss": -44.21221923828125, "global_step": 339596, "epoch": 2806} {"train_loss": -44.19599533081055, "global_step": 339597, "epoch": 2806} {"train_loss": -45.00165939331055, "global_step": 339598, "epoch": 2806} {"train_loss": -44.820465087890625, "global_step": 339599, "epoch": 2806} {"train_loss": -44.9564094543457, "global_step": 339600, "epoch": 2806} {"train_loss": -44.80760192871094, "global_step": 339601, "epoch": 2806} {"train_loss": -44.804439544677734, "global_step": 339602, "epoch": 2806} {"train_loss": -44.79423141479492, "global_step": 339603, "epoch": 2806} {"train_loss": -44.686641693115234, "global_step": 339604, "epoch": 2806} {"train_loss": -44.75320053100586, "global_step": 339605, "epoch": 2806} {"train_loss": -44.60136795043945, "global_step": 339606, "epoch": 2806} {"train_loss": -44.47623825073242, "global_step": 339607, "epoch": 2806} {"train_loss": -44.9656867980957, "global_step": 339608, "epoch": 2806} {"train_loss": -44.775787353515625, "global_step": 339609, "epoch": 2806} {"train_loss": -44.844505310058594, "global_step": 339610, "epoch": 2806} {"train_loss": -44.99933624267578, "global_step": 339611, "epoch": 2806} {"train_loss": -45.13873291015625, "global_step": 339612, "epoch": 2806} {"train_loss": -45.33889389038086, "global_step": 339613, "epoch": 2806} {"train_loss": -45.075286865234375, "global_step": 339614, "epoch": 2806} {"train_loss": -44.86592483520508, "global_step": 339615, "epoch": 2806} {"train_loss": -44.38666534423828, "global_step": 339616, "epoch": 2806} {"train_loss": -44.95962142944336, "global_step": 339617, "epoch": 2806} {"train_loss": -45.16128158569336, "global_step": 339618, "epoch": 2806} {"train_loss": -44.79274368286133, "global_step": 339619, "epoch": 2806} {"train_loss": -44.80622482299805, "global_step": 339620, "epoch": 2806} {"train_loss": -44.970436096191406, "global_step": 339621, "epoch": 2806} {"train_loss": -44.93813705444336, "global_step": 339622, "epoch": 2806} {"train_loss": -44.82320022583008, "global_step": 339623, "epoch": 2806} {"train_loss": -44.67228317260742, "global_step": 339624, "epoch": 2806} {"train_loss": -44.691402435302734, "global_step": 339625, "epoch": 2806} {"train_loss": -43.289485931396484, "global_step": 339626, "epoch": 2806} {"train_loss": -41.31307601928711, "global_step": 339627, "epoch": 2806} {"train_loss": -41.96977615356445, "global_step": 339628, "epoch": 2806} {"train_loss": -40.864173889160156, "global_step": 339629, "epoch": 2806} {"train_loss": -41.23896408081055, "global_step": 339630, "epoch": 2806} {"train_loss": -37.782711029052734, "global_step": 339631, "epoch": 2806} {"train_loss": -40.343074798583984, "global_step": 339632, "epoch": 2806} {"train_loss": -43.625057220458984, "global_step": 339633, "epoch": 2806} {"train_loss": -39.050716400146484, "global_step": 339634, "epoch": 2806} {"train_loss": -40.75342559814453, "global_step": 339635, "epoch": 2806} {"train_loss": -40.68111801147461, "global_step": 339636, "epoch": 2806} {"train_loss": -37.960304260253906, "global_step": 339637, "epoch": 2806} {"train_loss": -42.013431549072266, "global_step": 339638, "epoch": 2806} {"train_loss": -40.962364196777344, "global_step": 339639, "epoch": 2806} {"train_loss": -42.71623611450195, "global_step": 339640, "epoch": 2806} {"train_loss": -41.44367599487305, "global_step": 339641, "epoch": 2806} {"train_loss": -42.131221771240234, "global_step": 339642, "epoch": 2806} {"train_loss": -40.228084564208984, "global_step": 339643, "epoch": 2806} {"train_loss": -40.26238250732422, "global_step": 339644, "epoch": 2806} {"train_loss": -41.13433074951172, "global_step": 339645, "epoch": 2806} {"train_loss": -42.57845397823113, "global_step": 339646, "epoch": 2806, "val_loss": 2655235.25} {"train_loss": -41.228633880615234, "global_step": 339647, "epoch": 2807} {"train_loss": -42.24252700805664, "global_step": 339648, "epoch": 2807} {"train_loss": -41.41740417480469, "global_step": 339649, "epoch": 2807} {"train_loss": -40.99184799194336, "global_step": 339650, "epoch": 2807} {"train_loss": -41.346038818359375, "global_step": 339651, "epoch": 2807} {"train_loss": -41.28300857543945, "global_step": 339652, "epoch": 2807} {"train_loss": -42.76865768432617, "global_step": 339653, "epoch": 2807} {"train_loss": -42.1351432800293, "global_step": 339654, "epoch": 2807} {"train_loss": -41.939903259277344, "global_step": 339655, "epoch": 2807} {"train_loss": -41.97706985473633, "global_step": 339656, "epoch": 2807} {"train_loss": -43.233619689941406, "global_step": 339657, "epoch": 2807} {"train_loss": -42.7558708190918, "global_step": 339658, "epoch": 2807} {"train_loss": -42.8006477355957, "global_step": 339659, "epoch": 2807} {"train_loss": -42.42782974243164, "global_step": 339660, "epoch": 2807} {"train_loss": -43.769466400146484, "global_step": 339661, "epoch": 2807} {"train_loss": -43.123321533203125, "global_step": 339662, "epoch": 2807} {"train_loss": -42.4722900390625, "global_step": 339663, "epoch": 2807} {"train_loss": -43.718170166015625, "global_step": 339664, "epoch": 2807} {"train_loss": -43.043209075927734, "global_step": 339665, "epoch": 2807} {"train_loss": -43.5603141784668, "global_step": 339666, "epoch": 2807} {"train_loss": -42.99728012084961, "global_step": 339667, "epoch": 2807} {"train_loss": -43.40167999267578, "global_step": 339668, "epoch": 2807} {"train_loss": -43.249305725097656, "global_step": 339669, "epoch": 2807} {"train_loss": -43.14866638183594, "global_step": 339670, "epoch": 2807} {"train_loss": -43.69858932495117, "global_step": 339671, "epoch": 2807} {"train_loss": -43.708621978759766, "global_step": 339672, "epoch": 2807} {"train_loss": -44.27729034423828, "global_step": 339673, "epoch": 2807} {"train_loss": -43.94337844848633, "global_step": 339674, "epoch": 2807} {"train_loss": -43.97643280029297, "global_step": 339675, "epoch": 2807} {"train_loss": -43.96790313720703, "global_step": 339676, "epoch": 2807} {"train_loss": -43.5474967956543, "global_step": 339677, "epoch": 2807} {"train_loss": -44.64535140991211, "global_step": 339678, "epoch": 2807} {"train_loss": -43.6651725769043, "global_step": 339679, "epoch": 2807} {"train_loss": -44.133182525634766, "global_step": 339680, "epoch": 2807} {"train_loss": -43.841732025146484, "global_step": 339681, "epoch": 2807} {"train_loss": -43.614463806152344, "global_step": 339682, "epoch": 2807} {"train_loss": -44.16875076293945, "global_step": 339683, "epoch": 2807} {"train_loss": -43.67531967163086, "global_step": 339684, "epoch": 2807} {"train_loss": -43.95524215698242, "global_step": 339685, "epoch": 2807} {"train_loss": -43.852027893066406, "global_step": 339686, "epoch": 2807} {"train_loss": -44.512611389160156, "global_step": 339687, "epoch": 2807} {"train_loss": -44.628204345703125, "global_step": 339688, "epoch": 2807} {"train_loss": -43.74947738647461, "global_step": 339689, "epoch": 2807} {"train_loss": -44.85749435424805, "global_step": 339690, "epoch": 2807} {"train_loss": -44.64498519897461, "global_step": 339691, "epoch": 2807} {"train_loss": -44.3245964050293, "global_step": 339692, "epoch": 2807} {"train_loss": -45.01669692993164, "global_step": 339693, "epoch": 2807} {"train_loss": -44.53642654418945, "global_step": 339694, "epoch": 2807} {"train_loss": -44.68427658081055, "global_step": 339695, "epoch": 2807} {"train_loss": -44.77601623535156, "global_step": 339696, "epoch": 2807} {"train_loss": -44.79050064086914, "global_step": 339697, "epoch": 2807} {"train_loss": -45.024688720703125, "global_step": 339698, "epoch": 2807} {"train_loss": -45.053871154785156, "global_step": 339699, "epoch": 2807} {"train_loss": -45.01556396484375, "global_step": 339700, "epoch": 2807} {"train_loss": -44.570125579833984, "global_step": 339701, "epoch": 2807} {"train_loss": -44.832210540771484, "global_step": 339702, "epoch": 2807} {"train_loss": -44.72739791870117, "global_step": 339703, "epoch": 2807} {"train_loss": -44.68164825439453, "global_step": 339704, "epoch": 2807} {"train_loss": -44.79582595825195, "global_step": 339705, "epoch": 2807} {"train_loss": -44.69524002075195, "global_step": 339706, "epoch": 2807} {"train_loss": -45.38344955444336, "global_step": 339707, "epoch": 2807} {"train_loss": -44.90217208862305, "global_step": 339708, "epoch": 2807} {"train_loss": -44.790409088134766, "global_step": 339709, "epoch": 2807} {"train_loss": -45.087379455566406, "global_step": 339710, "epoch": 2807} {"train_loss": -45.05103302001953, "global_step": 339711, "epoch": 2807} {"train_loss": -45.05750274658203, "global_step": 339712, "epoch": 2807} {"train_loss": -45.36806869506836, "global_step": 339713, "epoch": 2807} {"train_loss": -44.865997314453125, "global_step": 339714, "epoch": 2807} {"train_loss": -45.0670280456543, "global_step": 339715, "epoch": 2807} {"train_loss": -45.14950180053711, "global_step": 339716, "epoch": 2807} {"train_loss": -45.19453811645508, "global_step": 339717, "epoch": 2807} {"train_loss": -45.40658950805664, "global_step": 339718, "epoch": 2807} {"train_loss": -45.06229782104492, "global_step": 339719, "epoch": 2807} {"train_loss": -45.08558654785156, "global_step": 339720, "epoch": 2807} {"train_loss": -45.101444244384766, "global_step": 339721, "epoch": 2807} {"train_loss": -45.10857009887695, "global_step": 339722, "epoch": 2807} {"train_loss": -45.005977630615234, "global_step": 339723, "epoch": 2807} {"train_loss": -45.186012268066406, "global_step": 339724, "epoch": 2807} {"train_loss": -45.5374641418457, "global_step": 339725, "epoch": 2807} {"train_loss": -45.141902923583984, "global_step": 339726, "epoch": 2807} {"train_loss": -44.7450065612793, "global_step": 339727, "epoch": 2807} {"train_loss": -45.328041076660156, "global_step": 339728, "epoch": 2807} {"train_loss": -44.408973693847656, "global_step": 339729, "epoch": 2807} {"train_loss": -44.147552490234375, "global_step": 339730, "epoch": 2807} {"train_loss": -42.163543701171875, "global_step": 339731, "epoch": 2807} {"train_loss": -43.504154205322266, "global_step": 339732, "epoch": 2807} {"train_loss": -43.35087585449219, "global_step": 339733, "epoch": 2807} {"train_loss": -41.78910446166992, "global_step": 339734, "epoch": 2807} {"train_loss": -41.923316955566406, "global_step": 339735, "epoch": 2807} {"train_loss": -40.495357513427734, "global_step": 339736, "epoch": 2807} {"train_loss": -43.70981216430664, "global_step": 339737, "epoch": 2807} {"train_loss": -40.75405502319336, "global_step": 339738, "epoch": 2807} {"train_loss": -42.74428939819336, "global_step": 339739, "epoch": 2807} {"train_loss": -43.02190017700195, "global_step": 339740, "epoch": 2807} {"train_loss": -39.24601364135742, "global_step": 339741, "epoch": 2807} {"train_loss": -43.685455322265625, "global_step": 339742, "epoch": 2807} {"train_loss": -40.25464630126953, "global_step": 339743, "epoch": 2807} {"train_loss": -40.990150451660156, "global_step": 339744, "epoch": 2807} {"train_loss": -43.08134841918945, "global_step": 339745, "epoch": 2807} {"train_loss": -37.76255416870117, "global_step": 339746, "epoch": 2807} {"train_loss": -42.1942024230957, "global_step": 339747, "epoch": 2807} {"train_loss": -35.2012825012207, "global_step": 339748, "epoch": 2807} {"train_loss": -39.012237548828125, "global_step": 339749, "epoch": 2807} {"train_loss": -41.11906051635742, "global_step": 339750, "epoch": 2807} {"train_loss": -35.900753021240234, "global_step": 339751, "epoch": 2807} {"train_loss": -39.32998275756836, "global_step": 339752, "epoch": 2807} {"train_loss": -41.40053939819336, "global_step": 339753, "epoch": 2807} {"train_loss": -38.852699279785156, "global_step": 339754, "epoch": 2807} {"train_loss": -42.58549118041992, "global_step": 339755, "epoch": 2807} {"train_loss": -38.55842208862305, "global_step": 339756, "epoch": 2807} {"train_loss": -42.72791290283203, "global_step": 339757, "epoch": 2807} {"train_loss": -40.8989143371582, "global_step": 339758, "epoch": 2807} {"train_loss": -41.390933990478516, "global_step": 339759, "epoch": 2807} {"train_loss": -42.05852127075195, "global_step": 339760, "epoch": 2807} {"train_loss": -40.64335632324219, "global_step": 339761, "epoch": 2807} {"train_loss": -41.42845916748047, "global_step": 339762, "epoch": 2807} {"train_loss": -40.860347747802734, "global_step": 339763, "epoch": 2807} {"train_loss": -42.877437591552734, "global_step": 339764, "epoch": 2807} {"train_loss": -40.437862396240234, "global_step": 339765, "epoch": 2807} {"train_loss": -42.76215744018555, "global_step": 339766, "epoch": 2807} {"train_loss": -43.131998960636864, "global_step": 339767, "epoch": 2807, "val_loss": 2614293.75} {"train_loss": -42.06039047241211, "global_step": 339768, "epoch": 2808} {"train_loss": -42.59342575073242, "global_step": 339769, "epoch": 2808} {"train_loss": -42.20905685424805, "global_step": 339770, "epoch": 2808} {"train_loss": -41.9044303894043, "global_step": 339771, "epoch": 2808} {"train_loss": -43.161529541015625, "global_step": 339772, "epoch": 2808} {"train_loss": -42.454872131347656, "global_step": 339773, "epoch": 2808} {"train_loss": -42.21055221557617, "global_step": 339774, "epoch": 2808} {"train_loss": -42.33293151855469, "global_step": 339775, "epoch": 2808} {"train_loss": -42.361690521240234, "global_step": 339776, "epoch": 2808} {"train_loss": -43.34840393066406, "global_step": 339777, "epoch": 2808} {"train_loss": -41.99809646606445, "global_step": 339778, "epoch": 2808} {"train_loss": -43.4749641418457, "global_step": 339779, "epoch": 2808} {"train_loss": -42.751277923583984, "global_step": 339780, "epoch": 2808} {"train_loss": -42.83660888671875, "global_step": 339781, "epoch": 2808} {"train_loss": -42.73326873779297, "global_step": 339782, "epoch": 2808} {"train_loss": -43.00904083251953, "global_step": 339783, "epoch": 2808} {"train_loss": -43.57001876831055, "global_step": 339784, "epoch": 2808} {"train_loss": -43.15212631225586, "global_step": 339785, "epoch": 2808} {"train_loss": -43.905914306640625, "global_step": 339786, "epoch": 2808} {"train_loss": -43.8513069152832, "global_step": 339787, "epoch": 2808} {"train_loss": -43.92079162597656, "global_step": 339788, "epoch": 2808} {"train_loss": -43.78211212158203, "global_step": 339789, "epoch": 2808} {"train_loss": -43.714115142822266, "global_step": 339790, "epoch": 2808} {"train_loss": -44.031436920166016, "global_step": 339791, "epoch": 2808} {"train_loss": -43.338863372802734, "global_step": 339792, "epoch": 2808} {"train_loss": -44.19315719604492, "global_step": 339793, "epoch": 2808} {"train_loss": -43.95985412597656, "global_step": 339794, "epoch": 2808} {"train_loss": -43.624366760253906, "global_step": 339795, "epoch": 2808} {"train_loss": -43.855777740478516, "global_step": 339796, "epoch": 2808} {"train_loss": -43.91661834716797, "global_step": 339797, "epoch": 2808} {"train_loss": -44.38559341430664, "global_step": 339798, "epoch": 2808} {"train_loss": -43.99414825439453, "global_step": 339799, "epoch": 2808} {"train_loss": -44.42177200317383, "global_step": 339800, "epoch": 2808} {"train_loss": -44.748191833496094, "global_step": 339801, "epoch": 2808} {"train_loss": -44.333953857421875, "global_step": 339802, "epoch": 2808} {"train_loss": -44.50803756713867, "global_step": 339803, "epoch": 2808} {"train_loss": -44.49243927001953, "global_step": 339804, "epoch": 2808} {"train_loss": -44.64851379394531, "global_step": 339805, "epoch": 2808} {"train_loss": -44.71369934082031, "global_step": 339806, "epoch": 2808} {"train_loss": -45.1123161315918, "global_step": 339807, "epoch": 2808} {"train_loss": -44.68735885620117, "global_step": 339808, "epoch": 2808} {"train_loss": -44.63151168823242, "global_step": 339809, "epoch": 2808} {"train_loss": -44.82683181762695, "global_step": 339810, "epoch": 2808} {"train_loss": -44.61460494995117, "global_step": 339811, "epoch": 2808} {"train_loss": -45.0207405090332, "global_step": 339812, "epoch": 2808} {"train_loss": -45.04107666015625, "global_step": 339813, "epoch": 2808} {"train_loss": -44.81247329711914, "global_step": 339814, "epoch": 2808} {"train_loss": -44.76337814331055, "global_step": 339815, "epoch": 2808} {"train_loss": -45.32596969604492, "global_step": 339816, "epoch": 2808} {"train_loss": -45.06879425048828, "global_step": 339817, "epoch": 2808} {"train_loss": -44.725189208984375, "global_step": 339818, "epoch": 2808} {"train_loss": -45.250911712646484, "global_step": 339819, "epoch": 2808} {"train_loss": -44.690792083740234, "global_step": 339820, "epoch": 2808} {"train_loss": -44.915584564208984, "global_step": 339821, "epoch": 2808} {"train_loss": -45.0977668762207, "global_step": 339822, "epoch": 2808} {"train_loss": -45.232826232910156, "global_step": 339823, "epoch": 2808} {"train_loss": -44.869075775146484, "global_step": 339824, "epoch": 2808} {"train_loss": -44.500770568847656, "global_step": 339825, "epoch": 2808} {"train_loss": -45.16262435913086, "global_step": 339826, "epoch": 2808} {"train_loss": -45.19122314453125, "global_step": 339827, "epoch": 2808} {"train_loss": -45.220191955566406, "global_step": 339828, "epoch": 2808} {"train_loss": -45.18779754638672, "global_step": 339829, "epoch": 2808} {"train_loss": -44.452388763427734, "global_step": 339830, "epoch": 2808} {"train_loss": -44.212554931640625, "global_step": 339831, "epoch": 2808} {"train_loss": -44.30079650878906, "global_step": 339832, "epoch": 2808} {"train_loss": -45.11487579345703, "global_step": 339833, "epoch": 2808} {"train_loss": -44.495906829833984, "global_step": 339834, "epoch": 2808} {"train_loss": -44.410888671875, "global_step": 339835, "epoch": 2808} {"train_loss": -44.486690521240234, "global_step": 339836, "epoch": 2808} {"train_loss": -44.52361297607422, "global_step": 339837, "epoch": 2808} {"train_loss": -43.74248504638672, "global_step": 339838, "epoch": 2808} {"train_loss": -44.1277961730957, "global_step": 339839, "epoch": 2808} {"train_loss": -44.701446533203125, "global_step": 339840, "epoch": 2808} {"train_loss": -44.509273529052734, "global_step": 339841, "epoch": 2808} {"train_loss": -43.301246643066406, "global_step": 339842, "epoch": 2808} {"train_loss": -42.8557243347168, "global_step": 339843, "epoch": 2808} {"train_loss": -42.76530075073242, "global_step": 339844, "epoch": 2808} {"train_loss": -43.2363166809082, "global_step": 339845, "epoch": 2808} {"train_loss": -43.07674789428711, "global_step": 339846, "epoch": 2808} {"train_loss": -43.683502197265625, "global_step": 339847, "epoch": 2808} {"train_loss": -43.95144271850586, "global_step": 339848, "epoch": 2808} {"train_loss": -43.63458251953125, "global_step": 339849, "epoch": 2808} {"train_loss": -43.268653869628906, "global_step": 339850, "epoch": 2808} {"train_loss": -44.171688079833984, "global_step": 339851, "epoch": 2808} {"train_loss": -40.88701248168945, "global_step": 339852, "epoch": 2808} {"train_loss": -39.39099884033203, "global_step": 339853, "epoch": 2808} {"train_loss": -44.33927536010742, "global_step": 339854, "epoch": 2808} {"train_loss": -40.98451614379883, "global_step": 339855, "epoch": 2808} {"train_loss": -38.789546966552734, "global_step": 339856, "epoch": 2808} {"train_loss": -41.078617095947266, "global_step": 339857, "epoch": 2808} {"train_loss": -42.70591354370117, "global_step": 339858, "epoch": 2808} {"train_loss": -41.98202896118164, "global_step": 339859, "epoch": 2808} {"train_loss": -41.73634338378906, "global_step": 339860, "epoch": 2808} {"train_loss": -39.84449768066406, "global_step": 339861, "epoch": 2808} {"train_loss": -42.867958068847656, "global_step": 339862, "epoch": 2808} {"train_loss": -44.57758331298828, "global_step": 339863, "epoch": 2808} {"train_loss": -40.99058151245117, "global_step": 339864, "epoch": 2808} {"train_loss": -41.93356704711914, "global_step": 339865, "epoch": 2808} {"train_loss": -43.848384857177734, "global_step": 339866, "epoch": 2808} {"train_loss": -41.670467376708984, "global_step": 339867, "epoch": 2808} {"train_loss": -40.918067932128906, "global_step": 339868, "epoch": 2808} {"train_loss": -44.13705062866211, "global_step": 339869, "epoch": 2808} {"train_loss": -39.746246337890625, "global_step": 339870, "epoch": 2808} {"train_loss": -42.59138870239258, "global_step": 339871, "epoch": 2808} {"train_loss": -43.30337142944336, "global_step": 339872, "epoch": 2808} {"train_loss": -41.707035064697266, "global_step": 339873, "epoch": 2808} {"train_loss": -43.495113372802734, "global_step": 339874, "epoch": 2808} {"train_loss": -42.71328353881836, "global_step": 339875, "epoch": 2808} {"train_loss": -44.25703811645508, "global_step": 339876, "epoch": 2808} {"train_loss": -43.071929931640625, "global_step": 339877, "epoch": 2808} {"train_loss": -41.984439849853516, "global_step": 339878, "epoch": 2808} {"train_loss": -44.40899658203125, "global_step": 339879, "epoch": 2808} {"train_loss": -43.34548568725586, "global_step": 339880, "epoch": 2808} {"train_loss": -42.984249114990234, "global_step": 339881, "epoch": 2808} {"train_loss": -44.218563079833984, "global_step": 339882, "epoch": 2808} {"train_loss": -43.80880355834961, "global_step": 339883, "epoch": 2808} {"train_loss": -44.05299758911133, "global_step": 339884, "epoch": 2808} {"train_loss": -43.6302375793457, "global_step": 339885, "epoch": 2808} {"train_loss": -44.17485427856445, "global_step": 339886, "epoch": 2808} {"train_loss": -44.46046447753906, "global_step": 339887, "epoch": 2808} {"train_loss": -43.55470565922004, "global_step": 339888, "epoch": 2808, "val_loss": 2649705.75} {"train_loss": -43.7060661315918, "global_step": 339889, "epoch": 2809} {"train_loss": -44.18402862548828, "global_step": 339890, "epoch": 2809} {"train_loss": -44.20026779174805, "global_step": 339891, "epoch": 2809} {"train_loss": -43.82843017578125, "global_step": 339892, "epoch": 2809} {"train_loss": -44.43921661376953, "global_step": 339893, "epoch": 2809} {"train_loss": -41.43787384033203, "global_step": 339894, "epoch": 2809} {"train_loss": -44.2307014465332, "global_step": 339895, "epoch": 2809} {"train_loss": -44.22727584838867, "global_step": 339896, "epoch": 2809} {"train_loss": -44.25927734375, "global_step": 339897, "epoch": 2809} {"train_loss": -44.15930938720703, "global_step": 339898, "epoch": 2809} {"train_loss": -44.2480583190918, "global_step": 339899, "epoch": 2809} {"train_loss": -44.164302825927734, "global_step": 339900, "epoch": 2809} {"train_loss": -44.11946487426758, "global_step": 339901, "epoch": 2809} {"train_loss": -43.92875289916992, "global_step": 339902, "epoch": 2809} {"train_loss": -43.63296127319336, "global_step": 339903, "epoch": 2809} {"train_loss": -43.63604736328125, "global_step": 339904, "epoch": 2809} {"train_loss": -44.93486785888672, "global_step": 339905, "epoch": 2809} {"train_loss": -44.755470275878906, "global_step": 339906, "epoch": 2809} {"train_loss": -44.52574157714844, "global_step": 339907, "epoch": 2809} {"train_loss": -43.83892822265625, "global_step": 339908, "epoch": 2809} {"train_loss": -42.91636657714844, "global_step": 339909, "epoch": 2809} {"train_loss": -44.0188102722168, "global_step": 339910, "epoch": 2809} {"train_loss": -44.70720672607422, "global_step": 339911, "epoch": 2809} {"train_loss": -41.82381057739258, "global_step": 339912, "epoch": 2809} {"train_loss": -42.30282211303711, "global_step": 339913, "epoch": 2809} {"train_loss": -44.260860443115234, "global_step": 339914, "epoch": 2809} {"train_loss": -44.52684783935547, "global_step": 339915, "epoch": 2809} {"train_loss": -41.78926467895508, "global_step": 339916, "epoch": 2809} {"train_loss": -44.276458740234375, "global_step": 339917, "epoch": 2809} {"train_loss": -44.9283447265625, "global_step": 339918, "epoch": 2809} {"train_loss": -42.63308334350586, "global_step": 339919, "epoch": 2809} {"train_loss": -43.444332122802734, "global_step": 339920, "epoch": 2809} {"train_loss": -41.90705108642578, "global_step": 339921, "epoch": 2809} {"train_loss": -43.0533561706543, "global_step": 339922, "epoch": 2809} {"train_loss": -43.54026412963867, "global_step": 339923, "epoch": 2809} {"train_loss": -43.89616775512695, "global_step": 339924, "epoch": 2809} {"train_loss": -43.023494720458984, "global_step": 339925, "epoch": 2809} {"train_loss": -43.620079040527344, "global_step": 339926, "epoch": 2809} {"train_loss": -44.345401763916016, "global_step": 339927, "epoch": 2809} {"train_loss": -43.664405822753906, "global_step": 339928, "epoch": 2809} {"train_loss": -43.997379302978516, "global_step": 339929, "epoch": 2809} {"train_loss": -43.417396545410156, "global_step": 339930, "epoch": 2809} {"train_loss": -43.07250213623047, "global_step": 339931, "epoch": 2809} {"train_loss": -44.5036506652832, "global_step": 339932, "epoch": 2809} {"train_loss": -44.74888229370117, "global_step": 339933, "epoch": 2809} {"train_loss": -44.27042770385742, "global_step": 339934, "epoch": 2809} {"train_loss": -44.091888427734375, "global_step": 339935, "epoch": 2809} {"train_loss": -41.91139221191406, "global_step": 339936, "epoch": 2809} {"train_loss": -43.71244812011719, "global_step": 339937, "epoch": 2809} {"train_loss": -44.4940185546875, "global_step": 339938, "epoch": 2809} {"train_loss": -43.906681060791016, "global_step": 339939, "epoch": 2809} {"train_loss": -43.89179229736328, "global_step": 339940, "epoch": 2809} {"train_loss": -42.46123123168945, "global_step": 339941, "epoch": 2809} {"train_loss": -44.719444274902344, "global_step": 339942, "epoch": 2809} {"train_loss": -44.74073028564453, "global_step": 339943, "epoch": 2809} {"train_loss": -44.68061065673828, "global_step": 339944, "epoch": 2809} {"train_loss": -38.817813873291016, "global_step": 339945, "epoch": 2809} {"train_loss": -42.9031867980957, "global_step": 339946, "epoch": 2809} {"train_loss": -44.229103088378906, "global_step": 339947, "epoch": 2809} {"train_loss": -44.538578033447266, "global_step": 339948, "epoch": 2809} {"train_loss": -44.30306625366211, "global_step": 339949, "epoch": 2809} {"train_loss": -43.47414016723633, "global_step": 339950, "epoch": 2809} {"train_loss": -44.168426513671875, "global_step": 339951, "epoch": 2809} {"train_loss": -41.34718704223633, "global_step": 339952, "epoch": 2809} {"train_loss": -42.9208869934082, "global_step": 339953, "epoch": 2809} {"train_loss": -43.884639739990234, "global_step": 339954, "epoch": 2809} {"train_loss": -44.57161331176758, "global_step": 339955, "epoch": 2809} {"train_loss": -42.7231559753418, "global_step": 339956, "epoch": 2809} {"train_loss": -44.12042999267578, "global_step": 339957, "epoch": 2809} {"train_loss": -44.73035430908203, "global_step": 339958, "epoch": 2809} {"train_loss": -43.54269027709961, "global_step": 339959, "epoch": 2809} {"train_loss": -43.71828842163086, "global_step": 339960, "epoch": 2809} {"train_loss": -44.45126724243164, "global_step": 339961, "epoch": 2809} {"train_loss": -44.00124740600586, "global_step": 339962, "epoch": 2809} {"train_loss": -44.11977005004883, "global_step": 339963, "epoch": 2809} {"train_loss": -44.74528121948242, "global_step": 339964, "epoch": 2809} {"train_loss": -44.52518081665039, "global_step": 339965, "epoch": 2809} {"train_loss": -44.70188522338867, "global_step": 339966, "epoch": 2809} {"train_loss": -44.2667350769043, "global_step": 339967, "epoch": 2809} {"train_loss": -44.789161682128906, "global_step": 339968, "epoch": 2809} {"train_loss": -45.1844596862793, "global_step": 339969, "epoch": 2809} {"train_loss": -44.25471115112305, "global_step": 339970, "epoch": 2809} {"train_loss": -44.938018798828125, "global_step": 339971, "epoch": 2809} {"train_loss": -44.72918701171875, "global_step": 339972, "epoch": 2809} {"train_loss": -44.79777908325195, "global_step": 339973, "epoch": 2809} {"train_loss": -44.02535629272461, "global_step": 339974, "epoch": 2809} {"train_loss": -45.068603515625, "global_step": 339975, "epoch": 2809} {"train_loss": -44.210750579833984, "global_step": 339976, "epoch": 2809} {"train_loss": -44.640438079833984, "global_step": 339977, "epoch": 2809} {"train_loss": -44.007381439208984, "global_step": 339978, "epoch": 2809} {"train_loss": -44.26557540893555, "global_step": 339979, "epoch": 2809} {"train_loss": -44.65296173095703, "global_step": 339980, "epoch": 2809} {"train_loss": -44.2102165222168, "global_step": 339981, "epoch": 2809} {"train_loss": -44.77423858642578, "global_step": 339982, "epoch": 2809} {"train_loss": -44.5244255065918, "global_step": 339983, "epoch": 2809} {"train_loss": -44.188507080078125, "global_step": 339984, "epoch": 2809} {"train_loss": -43.9344596862793, "global_step": 339985, "epoch": 2809} {"train_loss": -42.62418746948242, "global_step": 339986, "epoch": 2809} {"train_loss": -42.145957946777344, "global_step": 339987, "epoch": 2809} {"train_loss": -41.24597930908203, "global_step": 339988, "epoch": 2809} {"train_loss": -42.40031051635742, "global_step": 339989, "epoch": 2809} {"train_loss": -42.50946807861328, "global_step": 339990, "epoch": 2809} {"train_loss": -42.87755584716797, "global_step": 339991, "epoch": 2809} {"train_loss": -44.7353630065918, "global_step": 339992, "epoch": 2809} {"train_loss": -43.1212043762207, "global_step": 339993, "epoch": 2809} {"train_loss": -43.7320442199707, "global_step": 339994, "epoch": 2809} {"train_loss": -43.58535385131836, "global_step": 339995, "epoch": 2809} {"train_loss": -44.65504837036133, "global_step": 339996, "epoch": 2809} {"train_loss": -43.166542053222656, "global_step": 339997, "epoch": 2809} {"train_loss": -41.49251937866211, "global_step": 339998, "epoch": 2809} {"train_loss": -38.258148193359375, "global_step": 339999, "epoch": 2809} {"train_loss": -39.712257385253906, "global_step": 340000, "epoch": 2809} {"train_loss": -43.40559005737305, "global_step": 340001, "epoch": 2809} {"train_loss": -39.41755294799805, "global_step": 340002, "epoch": 2809} {"train_loss": -40.11174392700195, "global_step": 340003, "epoch": 2809} {"train_loss": -41.266937255859375, "global_step": 340004, "epoch": 2809} {"train_loss": -32.1118049621582, "global_step": 340005, "epoch": 2809} {"train_loss": -41.482295989990234, "global_step": 340006, "epoch": 2809} {"train_loss": -37.507415771484375, "global_step": 340007, "epoch": 2809} {"train_loss": -41.09264373779297, "global_step": 340008, "epoch": 2809} {"train_loss": -43.38986202902045, "global_step": 340009, "epoch": 2809, "val_loss": 2562280.25} {"train_loss": -40.8605842590332, "global_step": 340010, "epoch": 2810} {"train_loss": -41.7106819152832, "global_step": 340011, "epoch": 2810} {"train_loss": -40.8428840637207, "global_step": 340012, "epoch": 2810} {"train_loss": -41.5620231628418, "global_step": 340013, "epoch": 2810} {"train_loss": -41.873043060302734, "global_step": 340014, "epoch": 2810} {"train_loss": -41.21322250366211, "global_step": 340015, "epoch": 2810} {"train_loss": -42.735877990722656, "global_step": 340016, "epoch": 2810} {"train_loss": -41.901771545410156, "global_step": 340017, "epoch": 2810} {"train_loss": -41.87963104248047, "global_step": 340018, "epoch": 2810} {"train_loss": -42.78640365600586, "global_step": 340019, "epoch": 2810} {"train_loss": -42.55651092529297, "global_step": 340020, "epoch": 2810} {"train_loss": -41.47602844238281, "global_step": 340021, "epoch": 2810} {"train_loss": -43.11143493652344, "global_step": 340022, "epoch": 2810} {"train_loss": -41.91862487792969, "global_step": 340023, "epoch": 2810} {"train_loss": -43.086605072021484, "global_step": 340024, "epoch": 2810} {"train_loss": -43.258399963378906, "global_step": 340025, "epoch": 2810} {"train_loss": -42.083499908447266, "global_step": 340026, "epoch": 2810} {"train_loss": -42.851375579833984, "global_step": 340027, "epoch": 2810} {"train_loss": -42.292564392089844, "global_step": 340028, "epoch": 2810} {"train_loss": -43.39324951171875, "global_step": 340029, "epoch": 2810} {"train_loss": -42.937896728515625, "global_step": 340030, "epoch": 2810} {"train_loss": -43.505218505859375, "global_step": 340031, "epoch": 2810} {"train_loss": -42.731658935546875, "global_step": 340032, "epoch": 2810} {"train_loss": -43.57929229736328, "global_step": 340033, "epoch": 2810} {"train_loss": -43.152099609375, "global_step": 340034, "epoch": 2810} {"train_loss": -43.92460250854492, "global_step": 340035, "epoch": 2810} {"train_loss": -43.94325637817383, "global_step": 340036, "epoch": 2810} {"train_loss": -44.00434112548828, "global_step": 340037, "epoch": 2810} {"train_loss": -44.064369201660156, "global_step": 340038, "epoch": 2810} {"train_loss": -43.1597900390625, "global_step": 340039, "epoch": 2810} {"train_loss": -43.723201751708984, "global_step": 340040, "epoch": 2810} {"train_loss": -43.93207931518555, "global_step": 340041, "epoch": 2810} {"train_loss": -43.74436950683594, "global_step": 340042, "epoch": 2810} {"train_loss": -43.80007553100586, "global_step": 340043, "epoch": 2810} {"train_loss": -44.2268180847168, "global_step": 340044, "epoch": 2810} {"train_loss": -43.97930908203125, "global_step": 340045, "epoch": 2810} {"train_loss": -44.286598205566406, "global_step": 340046, "epoch": 2810} {"train_loss": -44.52560043334961, "global_step": 340047, "epoch": 2810} {"train_loss": -44.11036682128906, "global_step": 340048, "epoch": 2810} {"train_loss": -43.852779388427734, "global_step": 340049, "epoch": 2810} {"train_loss": -44.668304443359375, "global_step": 340050, "epoch": 2810} {"train_loss": -44.13347244262695, "global_step": 340051, "epoch": 2810} {"train_loss": -44.54827880859375, "global_step": 340052, "epoch": 2810} {"train_loss": -44.19923782348633, "global_step": 340053, "epoch": 2810} {"train_loss": -44.76542663574219, "global_step": 340054, "epoch": 2810} {"train_loss": -44.21763229370117, "global_step": 340055, "epoch": 2810} {"train_loss": -44.743404388427734, "global_step": 340056, "epoch": 2810} {"train_loss": -44.70600509643555, "global_step": 340057, "epoch": 2810} {"train_loss": -44.65159606933594, "global_step": 340058, "epoch": 2810} {"train_loss": -44.31616973876953, "global_step": 340059, "epoch": 2810} {"train_loss": -44.001495361328125, "global_step": 340060, "epoch": 2810} {"train_loss": -44.6320915222168, "global_step": 340061, "epoch": 2810} {"train_loss": -44.8281364440918, "global_step": 340062, "epoch": 2810} {"train_loss": -44.185142517089844, "global_step": 340063, "epoch": 2810} {"train_loss": -44.2630615234375, "global_step": 340064, "epoch": 2810} {"train_loss": -45.19837951660156, "global_step": 340065, "epoch": 2810} {"train_loss": -44.621002197265625, "global_step": 340066, "epoch": 2810} {"train_loss": -45.01572799682617, "global_step": 340067, "epoch": 2810} {"train_loss": -44.35502243041992, "global_step": 340068, "epoch": 2810} {"train_loss": -45.06718063354492, "global_step": 340069, "epoch": 2810} {"train_loss": -45.409175872802734, "global_step": 340070, "epoch": 2810} {"train_loss": -44.79134750366211, "global_step": 340071, "epoch": 2810} {"train_loss": -44.4592399597168, "global_step": 340072, "epoch": 2810} {"train_loss": -45.47810363769531, "global_step": 340073, "epoch": 2810} {"train_loss": -45.69331359863281, "global_step": 340074, "epoch": 2810} {"train_loss": -45.1059684753418, "global_step": 340075, "epoch": 2810} {"train_loss": -45.62368392944336, "global_step": 340076, "epoch": 2810} {"train_loss": -44.94588851928711, "global_step": 340077, "epoch": 2810} {"train_loss": -45.38823699951172, "global_step": 340078, "epoch": 2810} {"train_loss": -45.1789665222168, "global_step": 340079, "epoch": 2810} {"train_loss": -45.41990280151367, "global_step": 340080, "epoch": 2810} {"train_loss": -45.29901885986328, "global_step": 340081, "epoch": 2810} {"train_loss": -44.200191497802734, "global_step": 340082, "epoch": 2810} {"train_loss": -44.8415641784668, "global_step": 340083, "epoch": 2810} {"train_loss": -45.199493408203125, "global_step": 340084, "epoch": 2810} {"train_loss": -44.954864501953125, "global_step": 340085, "epoch": 2810} {"train_loss": -45.20119094848633, "global_step": 340086, "epoch": 2810} {"train_loss": -45.51911163330078, "global_step": 340087, "epoch": 2810} {"train_loss": -45.08705520629883, "global_step": 340088, "epoch": 2810} {"train_loss": -44.95758819580078, "global_step": 340089, "epoch": 2810} {"train_loss": -45.96656799316406, "global_step": 340090, "epoch": 2810} {"train_loss": -44.743873596191406, "global_step": 340091, "epoch": 2810} {"train_loss": -44.2264289855957, "global_step": 340092, "epoch": 2810} {"train_loss": -43.987037658691406, "global_step": 340093, "epoch": 2810} {"train_loss": -43.679744720458984, "global_step": 340094, "epoch": 2810} {"train_loss": -43.622276306152344, "global_step": 340095, "epoch": 2810} {"train_loss": -43.4969482421875, "global_step": 340096, "epoch": 2810} {"train_loss": -42.7683219909668, "global_step": 340097, "epoch": 2810} {"train_loss": -43.4647216796875, "global_step": 340098, "epoch": 2810} {"train_loss": -44.7545280456543, "global_step": 340099, "epoch": 2810} {"train_loss": -43.96376419067383, "global_step": 340100, "epoch": 2810} {"train_loss": -43.6755485534668, "global_step": 340101, "epoch": 2810} {"train_loss": -43.864871978759766, "global_step": 340102, "epoch": 2810} {"train_loss": -42.61354446411133, "global_step": 340103, "epoch": 2810} {"train_loss": -41.59552764892578, "global_step": 340104, "epoch": 2810} {"train_loss": -40.6246223449707, "global_step": 340105, "epoch": 2810} {"train_loss": -43.43622970581055, "global_step": 340106, "epoch": 2810} {"train_loss": -44.51076889038086, "global_step": 340107, "epoch": 2810} {"train_loss": -42.528316497802734, "global_step": 340108, "epoch": 2810} {"train_loss": -42.656463623046875, "global_step": 340109, "epoch": 2810} {"train_loss": -42.09410095214844, "global_step": 340110, "epoch": 2810} {"train_loss": -44.29559326171875, "global_step": 340111, "epoch": 2810} {"train_loss": -41.691768646240234, "global_step": 340112, "epoch": 2810} {"train_loss": -43.13930130004883, "global_step": 340113, "epoch": 2810} {"train_loss": -44.35722732543945, "global_step": 340114, "epoch": 2810} {"train_loss": -41.32172775268555, "global_step": 340115, "epoch": 2810} {"train_loss": -42.84263610839844, "global_step": 340116, "epoch": 2810} {"train_loss": -44.06098556518555, "global_step": 340117, "epoch": 2810} {"train_loss": -43.467323303222656, "global_step": 340118, "epoch": 2810} {"train_loss": -42.84377670288086, "global_step": 340119, "epoch": 2810} {"train_loss": -43.463741302490234, "global_step": 340120, "epoch": 2810} {"train_loss": -43.03436279296875, "global_step": 340121, "epoch": 2810} {"train_loss": -43.83381271362305, "global_step": 340122, "epoch": 2810} {"train_loss": -44.13642501831055, "global_step": 340123, "epoch": 2810} {"train_loss": -43.53852462768555, "global_step": 340124, "epoch": 2810} {"train_loss": -43.370426177978516, "global_step": 340125, "epoch": 2810} {"train_loss": -43.886260986328125, "global_step": 340126, "epoch": 2810} {"train_loss": -43.69277572631836, "global_step": 340127, "epoch": 2810} {"train_loss": -42.79948425292969, "global_step": 340128, "epoch": 2810} {"train_loss": -43.619720458984375, "global_step": 340129, "epoch": 2810} {"train_loss": -43.73204803466797, "global_step": 340130, "epoch": 2810, "val_loss": 2625820.0} {"train_loss": -43.37080001831055, "global_step": 340131, "epoch": 2811} {"train_loss": -44.01579666137695, "global_step": 340132, "epoch": 2811} {"train_loss": -42.417415618896484, "global_step": 340133, "epoch": 2811} {"train_loss": -43.8441276550293, "global_step": 340134, "epoch": 2811} {"train_loss": -43.20862579345703, "global_step": 340135, "epoch": 2811} {"train_loss": -42.368446350097656, "global_step": 340136, "epoch": 2811} {"train_loss": -43.992210388183594, "global_step": 340137, "epoch": 2811} {"train_loss": -41.814735412597656, "global_step": 340138, "epoch": 2811} {"train_loss": -43.3729133605957, "global_step": 340139, "epoch": 2811} {"train_loss": -42.49636459350586, "global_step": 340140, "epoch": 2811} {"train_loss": -43.08888626098633, "global_step": 340141, "epoch": 2811} {"train_loss": -42.64399337768555, "global_step": 340142, "epoch": 2811} {"train_loss": -43.61591720581055, "global_step": 340143, "epoch": 2811} {"train_loss": -42.5124626159668, "global_step": 340144, "epoch": 2811} {"train_loss": -43.01474380493164, "global_step": 340145, "epoch": 2811} {"train_loss": -42.66575241088867, "global_step": 340146, "epoch": 2811} {"train_loss": -42.205020904541016, "global_step": 340147, "epoch": 2811} {"train_loss": -43.49420928955078, "global_step": 340148, "epoch": 2811} {"train_loss": -42.4083251953125, "global_step": 340149, "epoch": 2811} {"train_loss": -44.39337158203125, "global_step": 340150, "epoch": 2811} {"train_loss": -43.06355667114258, "global_step": 340151, "epoch": 2811} {"train_loss": -43.7541618347168, "global_step": 340152, "epoch": 2811} {"train_loss": -43.92224884033203, "global_step": 340153, "epoch": 2811} {"train_loss": -43.844703674316406, "global_step": 340154, "epoch": 2811} {"train_loss": -43.99369430541992, "global_step": 340155, "epoch": 2811} {"train_loss": -43.15017318725586, "global_step": 340156, "epoch": 2811} {"train_loss": -44.480072021484375, "global_step": 340157, "epoch": 2811} {"train_loss": -43.759578704833984, "global_step": 340158, "epoch": 2811} {"train_loss": -44.33055877685547, "global_step": 340159, "epoch": 2811} {"train_loss": -43.95072555541992, "global_step": 340160, "epoch": 2811} {"train_loss": -44.2032585144043, "global_step": 340161, "epoch": 2811} {"train_loss": -44.90876770019531, "global_step": 340162, "epoch": 2811} {"train_loss": -43.90468978881836, "global_step": 340163, "epoch": 2811} {"train_loss": -44.19180679321289, "global_step": 340164, "epoch": 2811} {"train_loss": -44.500797271728516, "global_step": 340165, "epoch": 2811} {"train_loss": -44.581031799316406, "global_step": 340166, "epoch": 2811} {"train_loss": -44.54695510864258, "global_step": 340167, "epoch": 2811} {"train_loss": -45.59402084350586, "global_step": 340168, "epoch": 2811} {"train_loss": -44.559696197509766, "global_step": 340169, "epoch": 2811} {"train_loss": -45.16109848022461, "global_step": 340170, "epoch": 2811} {"train_loss": -44.851802825927734, "global_step": 340171, "epoch": 2811} {"train_loss": -44.22194290161133, "global_step": 340172, "epoch": 2811} {"train_loss": -45.49658203125, "global_step": 340173, "epoch": 2811} {"train_loss": -45.22816467285156, "global_step": 340174, "epoch": 2811} {"train_loss": -45.097694396972656, "global_step": 340175, "epoch": 2811} {"train_loss": -45.02384567260742, "global_step": 340176, "epoch": 2811} {"train_loss": -44.99311065673828, "global_step": 340177, "epoch": 2811} {"train_loss": -45.14254379272461, "global_step": 340178, "epoch": 2811} {"train_loss": -44.62053298950195, "global_step": 340179, "epoch": 2811} {"train_loss": -44.90937423706055, "global_step": 340180, "epoch": 2811} {"train_loss": -45.4171142578125, "global_step": 340181, "epoch": 2811} {"train_loss": -45.63066482543945, "global_step": 340182, "epoch": 2811} {"train_loss": -45.36300277709961, "global_step": 340183, "epoch": 2811} {"train_loss": -44.89199447631836, "global_step": 340184, "epoch": 2811} {"train_loss": -45.14300537109375, "global_step": 340185, "epoch": 2811} {"train_loss": -44.979957580566406, "global_step": 340186, "epoch": 2811} {"train_loss": -45.5135498046875, "global_step": 340187, "epoch": 2811} {"train_loss": -44.56380844116211, "global_step": 340188, "epoch": 2811} {"train_loss": -44.22518539428711, "global_step": 340189, "epoch": 2811} {"train_loss": -45.6773796081543, "global_step": 340190, "epoch": 2811} {"train_loss": -45.17359161376953, "global_step": 340191, "epoch": 2811} {"train_loss": -43.32295608520508, "global_step": 340192, "epoch": 2811} {"train_loss": -44.61639404296875, "global_step": 340193, "epoch": 2811} {"train_loss": -45.62069320678711, "global_step": 340194, "epoch": 2811} {"train_loss": -45.02656173706055, "global_step": 340195, "epoch": 2811} {"train_loss": -45.10908889770508, "global_step": 340196, "epoch": 2811} {"train_loss": -44.77497482299805, "global_step": 340197, "epoch": 2811} {"train_loss": -44.59273910522461, "global_step": 340198, "epoch": 2811} {"train_loss": -45.183616638183594, "global_step": 340199, "epoch": 2811} {"train_loss": -44.93349838256836, "global_step": 340200, "epoch": 2811} {"train_loss": -44.298397064208984, "global_step": 340201, "epoch": 2811} {"train_loss": -45.10356521606445, "global_step": 340202, "epoch": 2811} {"train_loss": -45.58643341064453, "global_step": 340203, "epoch": 2811} {"train_loss": -45.36812210083008, "global_step": 340204, "epoch": 2811} {"train_loss": -44.149131774902344, "global_step": 340205, "epoch": 2811} {"train_loss": -43.76396179199219, "global_step": 340206, "epoch": 2811} {"train_loss": -42.32259750366211, "global_step": 340207, "epoch": 2811} {"train_loss": -42.53181838989258, "global_step": 340208, "epoch": 2811} {"train_loss": -44.92289352416992, "global_step": 340209, "epoch": 2811} {"train_loss": -44.14156723022461, "global_step": 340210, "epoch": 2811} {"train_loss": -42.22238540649414, "global_step": 340211, "epoch": 2811} {"train_loss": -43.90021896362305, "global_step": 340212, "epoch": 2811} {"train_loss": -44.31436538696289, "global_step": 340213, "epoch": 2811} {"train_loss": -43.12772750854492, "global_step": 340214, "epoch": 2811} {"train_loss": -42.805877685546875, "global_step": 340215, "epoch": 2811} {"train_loss": -42.5072021484375, "global_step": 340216, "epoch": 2811} {"train_loss": -43.706581115722656, "global_step": 340217, "epoch": 2811} {"train_loss": -45.319522857666016, "global_step": 340218, "epoch": 2811} {"train_loss": -43.877620697021484, "global_step": 340219, "epoch": 2811} {"train_loss": -41.992958068847656, "global_step": 340220, "epoch": 2811} {"train_loss": -44.78627395629883, "global_step": 340221, "epoch": 2811} {"train_loss": -42.09437942504883, "global_step": 340222, "epoch": 2811} {"train_loss": -42.72974395751953, "global_step": 340223, "epoch": 2811} {"train_loss": -44.65731430053711, "global_step": 340224, "epoch": 2811} {"train_loss": -44.0699348449707, "global_step": 340225, "epoch": 2811} {"train_loss": -42.70144271850586, "global_step": 340226, "epoch": 2811} {"train_loss": -43.165706634521484, "global_step": 340227, "epoch": 2811} {"train_loss": -43.7566032409668, "global_step": 340228, "epoch": 2811} {"train_loss": -44.13636016845703, "global_step": 340229, "epoch": 2811} {"train_loss": -43.30888748168945, "global_step": 340230, "epoch": 2811} {"train_loss": -44.162837982177734, "global_step": 340231, "epoch": 2811} {"train_loss": -45.03336715698242, "global_step": 340232, "epoch": 2811} {"train_loss": -42.838382720947266, "global_step": 340233, "epoch": 2811} {"train_loss": -45.087677001953125, "global_step": 340234, "epoch": 2811} {"train_loss": -43.575355529785156, "global_step": 340235, "epoch": 2811} {"train_loss": -42.394710540771484, "global_step": 340236, "epoch": 2811} {"train_loss": -44.20863723754883, "global_step": 340237, "epoch": 2811} {"train_loss": -43.5247802734375, "global_step": 340238, "epoch": 2811} {"train_loss": -43.95170211791992, "global_step": 340239, "epoch": 2811} {"train_loss": -44.080989837646484, "global_step": 340240, "epoch": 2811} {"train_loss": -44.275909423828125, "global_step": 340241, "epoch": 2811} {"train_loss": -44.26343536376953, "global_step": 340242, "epoch": 2811} {"train_loss": -44.64638900756836, "global_step": 340243, "epoch": 2811} {"train_loss": -44.48257064819336, "global_step": 340244, "epoch": 2811} {"train_loss": -44.566688537597656, "global_step": 340245, "epoch": 2811} {"train_loss": -44.01601791381836, "global_step": 340246, "epoch": 2811} {"train_loss": -44.990806579589844, "global_step": 340247, "epoch": 2811} {"train_loss": -44.7609977722168, "global_step": 340248, "epoch": 2811} {"train_loss": -44.17702865600586, "global_step": 340249, "epoch": 2811} {"train_loss": -44.025794982910156, "global_step": 340250, "epoch": 2811} {"train_loss": -44.0764997498063, "global_step": 340251, "epoch": 2811, "val_loss": 2590330.75} {"train_loss": -44.70078659057617, "global_step": 340252, "epoch": 2812} {"train_loss": -44.833831787109375, "global_step": 340253, "epoch": 2812} {"train_loss": -44.64016342163086, "global_step": 340254, "epoch": 2812} {"train_loss": -45.090797424316406, "global_step": 340255, "epoch": 2812} {"train_loss": -45.25419235229492, "global_step": 340256, "epoch": 2812} {"train_loss": -45.39590072631836, "global_step": 340257, "epoch": 2812} {"train_loss": -45.499412536621094, "global_step": 340258, "epoch": 2812} {"train_loss": -44.44865417480469, "global_step": 340259, "epoch": 2812} {"train_loss": -44.98046875, "global_step": 340260, "epoch": 2812} {"train_loss": -44.22391891479492, "global_step": 340261, "epoch": 2812} {"train_loss": -44.32326126098633, "global_step": 340262, "epoch": 2812} {"train_loss": -45.061485290527344, "global_step": 340263, "epoch": 2812} {"train_loss": -44.32804489135742, "global_step": 340264, "epoch": 2812} {"train_loss": -43.77998733520508, "global_step": 340265, "epoch": 2812} {"train_loss": -44.92313003540039, "global_step": 340266, "epoch": 2812} {"train_loss": -43.91015625, "global_step": 340267, "epoch": 2812} {"train_loss": -43.098045349121094, "global_step": 340268, "epoch": 2812} {"train_loss": -44.19643020629883, "global_step": 340269, "epoch": 2812} {"train_loss": -43.73987579345703, "global_step": 340270, "epoch": 2812} {"train_loss": -42.72929000854492, "global_step": 340271, "epoch": 2812} {"train_loss": -44.76005935668945, "global_step": 340272, "epoch": 2812} {"train_loss": -44.11773681640625, "global_step": 340273, "epoch": 2812} {"train_loss": -44.309974670410156, "global_step": 340274, "epoch": 2812} {"train_loss": -43.86201095581055, "global_step": 340275, "epoch": 2812} {"train_loss": -44.27490997314453, "global_step": 340276, "epoch": 2812} {"train_loss": -44.20144271850586, "global_step": 340277, "epoch": 2812} {"train_loss": -44.463314056396484, "global_step": 340278, "epoch": 2812} {"train_loss": -44.2588005065918, "global_step": 340279, "epoch": 2812} {"train_loss": -44.66936111450195, "global_step": 340280, "epoch": 2812} {"train_loss": -45.11365509033203, "global_step": 340281, "epoch": 2812} {"train_loss": -44.464237213134766, "global_step": 340282, "epoch": 2812} {"train_loss": -44.22037887573242, "global_step": 340283, "epoch": 2812} {"train_loss": -44.68404769897461, "global_step": 340284, "epoch": 2812} {"train_loss": -44.89645004272461, "global_step": 340285, "epoch": 2812} {"train_loss": -44.52696990966797, "global_step": 340286, "epoch": 2812} {"train_loss": -44.895320892333984, "global_step": 340287, "epoch": 2812} {"train_loss": -44.589271545410156, "global_step": 340288, "epoch": 2812} {"train_loss": -44.93788146972656, "global_step": 340289, "epoch": 2812} {"train_loss": -44.45747756958008, "global_step": 340290, "epoch": 2812} {"train_loss": -44.349639892578125, "global_step": 340291, "epoch": 2812} {"train_loss": -45.53558349609375, "global_step": 340292, "epoch": 2812} {"train_loss": -45.4298095703125, "global_step": 340293, "epoch": 2812} {"train_loss": -44.38943862915039, "global_step": 340294, "epoch": 2812} {"train_loss": -45.28782272338867, "global_step": 340295, "epoch": 2812} {"train_loss": -44.86883544921875, "global_step": 340296, "epoch": 2812} {"train_loss": -45.28279495239258, "global_step": 340297, "epoch": 2812} {"train_loss": -44.98966598510742, "global_step": 340298, "epoch": 2812} {"train_loss": -45.33833694458008, "global_step": 340299, "epoch": 2812} {"train_loss": -45.18375778198242, "global_step": 340300, "epoch": 2812} {"train_loss": -44.68161392211914, "global_step": 340301, "epoch": 2812} {"train_loss": -44.74861526489258, "global_step": 340302, "epoch": 2812} {"train_loss": -44.79496383666992, "global_step": 340303, "epoch": 2812} {"train_loss": -45.337005615234375, "global_step": 340304, "epoch": 2812} {"train_loss": -44.921852111816406, "global_step": 340305, "epoch": 2812} {"train_loss": -44.69016647338867, "global_step": 340306, "epoch": 2812} {"train_loss": -45.20734786987305, "global_step": 340307, "epoch": 2812} {"train_loss": -45.504554748535156, "global_step": 340308, "epoch": 2812} {"train_loss": -45.30426788330078, "global_step": 340309, "epoch": 2812} {"train_loss": -44.353050231933594, "global_step": 340310, "epoch": 2812} {"train_loss": -44.24333572387695, "global_step": 340311, "epoch": 2812} {"train_loss": -45.1624755859375, "global_step": 340312, "epoch": 2812} {"train_loss": -44.74298858642578, "global_step": 340313, "epoch": 2812} {"train_loss": -44.003108978271484, "global_step": 340314, "epoch": 2812} {"train_loss": -44.179176330566406, "global_step": 340315, "epoch": 2812} {"train_loss": -41.511688232421875, "global_step": 340316, "epoch": 2812} {"train_loss": -43.04498291015625, "global_step": 340317, "epoch": 2812} {"train_loss": -43.96491622924805, "global_step": 340318, "epoch": 2812} {"train_loss": -43.68099594116211, "global_step": 340319, "epoch": 2812} {"train_loss": -44.40773010253906, "global_step": 340320, "epoch": 2812} {"train_loss": -44.32102584838867, "global_step": 340321, "epoch": 2812} {"train_loss": -43.935760498046875, "global_step": 340322, "epoch": 2812} {"train_loss": -41.7255859375, "global_step": 340323, "epoch": 2812} {"train_loss": -43.24534225463867, "global_step": 340324, "epoch": 2812} {"train_loss": -44.46782302856445, "global_step": 340325, "epoch": 2812} {"train_loss": -43.96407699584961, "global_step": 340326, "epoch": 2812} {"train_loss": -43.690467834472656, "global_step": 340327, "epoch": 2812} {"train_loss": -44.194515228271484, "global_step": 340328, "epoch": 2812} {"train_loss": -44.12638473510742, "global_step": 340329, "epoch": 2812} {"train_loss": -42.7110710144043, "global_step": 340330, "epoch": 2812} {"train_loss": -43.010353088378906, "global_step": 340331, "epoch": 2812} {"train_loss": -43.25337600708008, "global_step": 340332, "epoch": 2812} {"train_loss": -43.751922607421875, "global_step": 340333, "epoch": 2812} {"train_loss": -43.959144592285156, "global_step": 340334, "epoch": 2812} {"train_loss": -41.58597183227539, "global_step": 340335, "epoch": 2812} {"train_loss": -43.905860900878906, "global_step": 340336, "epoch": 2812} {"train_loss": -43.33753204345703, "global_step": 340337, "epoch": 2812} {"train_loss": -42.462581634521484, "global_step": 340338, "epoch": 2812} {"train_loss": -43.88349533081055, "global_step": 340339, "epoch": 2812} {"train_loss": -42.43256378173828, "global_step": 340340, "epoch": 2812} {"train_loss": -44.38235092163086, "global_step": 340341, "epoch": 2812} {"train_loss": -44.10651779174805, "global_step": 340342, "epoch": 2812} {"train_loss": -43.171287536621094, "global_step": 340343, "epoch": 2812} {"train_loss": -43.40938949584961, "global_step": 340344, "epoch": 2812} {"train_loss": -44.486263275146484, "global_step": 340345, "epoch": 2812} {"train_loss": -43.74786376953125, "global_step": 340346, "epoch": 2812} {"train_loss": -43.86634063720703, "global_step": 340347, "epoch": 2812} {"train_loss": -42.65473937988281, "global_step": 340348, "epoch": 2812} {"train_loss": -44.501399993896484, "global_step": 340349, "epoch": 2812} {"train_loss": -43.72034454345703, "global_step": 340350, "epoch": 2812} {"train_loss": -43.571044921875, "global_step": 340351, "epoch": 2812} {"train_loss": -44.9041633605957, "global_step": 340352, "epoch": 2812} {"train_loss": -43.80624008178711, "global_step": 340353, "epoch": 2812} {"train_loss": -43.90768051147461, "global_step": 340354, "epoch": 2812} {"train_loss": -44.39683151245117, "global_step": 340355, "epoch": 2812} {"train_loss": -44.41193389892578, "global_step": 340356, "epoch": 2812} {"train_loss": -44.898136138916016, "global_step": 340357, "epoch": 2812} {"train_loss": -44.633724212646484, "global_step": 340358, "epoch": 2812} {"train_loss": -44.320438385009766, "global_step": 340359, "epoch": 2812} {"train_loss": -45.102783203125, "global_step": 340360, "epoch": 2812} {"train_loss": -44.35310745239258, "global_step": 340361, "epoch": 2812} {"train_loss": -44.5751953125, "global_step": 340362, "epoch": 2812} {"train_loss": -45.25796127319336, "global_step": 340363, "epoch": 2812} {"train_loss": -44.70823287963867, "global_step": 340364, "epoch": 2812} {"train_loss": -45.09624099731445, "global_step": 340365, "epoch": 2812} {"train_loss": -44.477691650390625, "global_step": 340366, "epoch": 2812} {"train_loss": -44.46102523803711, "global_step": 340367, "epoch": 2812} {"train_loss": -44.845455169677734, "global_step": 340368, "epoch": 2812} {"train_loss": -43.972747802734375, "global_step": 340369, "epoch": 2812} {"train_loss": -44.550537109375, "global_step": 340370, "epoch": 2812} {"train_loss": -44.21639633178711, "global_step": 340371, "epoch": 2812} {"train_loss": -44.28942590508579, "global_step": 340372, "epoch": 2812, "val_loss": 2642490.5} {"train_loss": -45.61084747314453, "global_step": 340373, "epoch": 2813} {"train_loss": -43.81806564331055, "global_step": 340374, "epoch": 2813} {"train_loss": -43.08820724487305, "global_step": 340375, "epoch": 2813} {"train_loss": -44.154457092285156, "global_step": 340376, "epoch": 2813} {"train_loss": -44.072731018066406, "global_step": 340377, "epoch": 2813} {"train_loss": -42.672950744628906, "global_step": 340378, "epoch": 2813} {"train_loss": -43.89398193359375, "global_step": 340379, "epoch": 2813} {"train_loss": -44.254817962646484, "global_step": 340380, "epoch": 2813} {"train_loss": -43.39405059814453, "global_step": 340381, "epoch": 2813} {"train_loss": -43.730735778808594, "global_step": 340382, "epoch": 2813} {"train_loss": -43.311004638671875, "global_step": 340383, "epoch": 2813} {"train_loss": -43.30134201049805, "global_step": 340384, "epoch": 2813} {"train_loss": -43.59535217285156, "global_step": 340385, "epoch": 2813} {"train_loss": -44.17904281616211, "global_step": 340386, "epoch": 2813} {"train_loss": -42.945613861083984, "global_step": 340387, "epoch": 2813} {"train_loss": -43.61722946166992, "global_step": 340388, "epoch": 2813} {"train_loss": -45.56820297241211, "global_step": 340389, "epoch": 2813} {"train_loss": -43.79217529296875, "global_step": 340390, "epoch": 2813} {"train_loss": -43.097984313964844, "global_step": 340391, "epoch": 2813} {"train_loss": -44.00635528564453, "global_step": 340392, "epoch": 2813} {"train_loss": -43.415401458740234, "global_step": 340393, "epoch": 2813} {"train_loss": -42.45420455932617, "global_step": 340394, "epoch": 2813} {"train_loss": -44.65829086303711, "global_step": 340395, "epoch": 2813} {"train_loss": -43.89802169799805, "global_step": 340396, "epoch": 2813} {"train_loss": -42.9925651550293, "global_step": 340397, "epoch": 2813} {"train_loss": -44.342742919921875, "global_step": 340398, "epoch": 2813} {"train_loss": -44.2906494140625, "global_step": 340399, "epoch": 2813} {"train_loss": -43.670989990234375, "global_step": 340400, "epoch": 2813} {"train_loss": -44.863895416259766, "global_step": 340401, "epoch": 2813} {"train_loss": -45.41486358642578, "global_step": 340402, "epoch": 2813} {"train_loss": -45.06636428833008, "global_step": 340403, "epoch": 2813} {"train_loss": -44.10382080078125, "global_step": 340404, "epoch": 2813} {"train_loss": -44.678985595703125, "global_step": 340405, "epoch": 2813} {"train_loss": -43.262996673583984, "global_step": 340406, "epoch": 2813} {"train_loss": -41.983604431152344, "global_step": 340407, "epoch": 2813} {"train_loss": -41.97724533081055, "global_step": 340408, "epoch": 2813} {"train_loss": -42.62208938598633, "global_step": 340409, "epoch": 2813} {"train_loss": -44.80421447753906, "global_step": 340410, "epoch": 2813} {"train_loss": -42.49441909790039, "global_step": 340411, "epoch": 2813} {"train_loss": -44.27894973754883, "global_step": 340412, "epoch": 2813} {"train_loss": -44.594295501708984, "global_step": 340413, "epoch": 2813} {"train_loss": -42.585899353027344, "global_step": 340414, "epoch": 2813} {"train_loss": -43.056129455566406, "global_step": 340415, "epoch": 2813} {"train_loss": -44.306575775146484, "global_step": 340416, "epoch": 2813} {"train_loss": -43.98757553100586, "global_step": 340417, "epoch": 2813} {"train_loss": -41.1949577331543, "global_step": 340418, "epoch": 2813} {"train_loss": -42.95248031616211, "global_step": 340419, "epoch": 2813} {"train_loss": -43.77587127685547, "global_step": 340420, "epoch": 2813} {"train_loss": -42.79561996459961, "global_step": 340421, "epoch": 2813} {"train_loss": -39.617462158203125, "global_step": 340422, "epoch": 2813} {"train_loss": -44.18892288208008, "global_step": 340423, "epoch": 2813} {"train_loss": -36.64988327026367, "global_step": 340424, "epoch": 2813} {"train_loss": -43.70684051513672, "global_step": 340425, "epoch": 2813} {"train_loss": -39.49027633666992, "global_step": 340426, "epoch": 2813} {"train_loss": -41.75140380859375, "global_step": 340427, "epoch": 2813} {"train_loss": -42.766414642333984, "global_step": 340428, "epoch": 2813} {"train_loss": -41.32720947265625, "global_step": 340429, "epoch": 2813} {"train_loss": -42.79623031616211, "global_step": 340430, "epoch": 2813} {"train_loss": -42.123779296875, "global_step": 340431, "epoch": 2813} {"train_loss": -41.75617599487305, "global_step": 340432, "epoch": 2813} {"train_loss": -42.67136764526367, "global_step": 340433, "epoch": 2813} {"train_loss": -41.50858688354492, "global_step": 340434, "epoch": 2813} {"train_loss": -43.274452209472656, "global_step": 340435, "epoch": 2813} {"train_loss": -44.62152862548828, "global_step": 340436, "epoch": 2813} {"train_loss": -43.76205062866211, "global_step": 340437, "epoch": 2813} {"train_loss": -42.042842864990234, "global_step": 340438, "epoch": 2813} {"train_loss": -43.80512619018555, "global_step": 340439, "epoch": 2813} {"train_loss": -43.37664794921875, "global_step": 340440, "epoch": 2813} {"train_loss": -42.9867057800293, "global_step": 340441, "epoch": 2813} {"train_loss": -43.420677185058594, "global_step": 340442, "epoch": 2813} {"train_loss": -43.04050064086914, "global_step": 340443, "epoch": 2813} {"train_loss": -43.44789505004883, "global_step": 340444, "epoch": 2813} {"train_loss": -43.493595123291016, "global_step": 340445, "epoch": 2813} {"train_loss": -44.25048828125, "global_step": 340446, "epoch": 2813} {"train_loss": -43.76044845581055, "global_step": 340447, "epoch": 2813} {"train_loss": -44.22293472290039, "global_step": 340448, "epoch": 2813} {"train_loss": -44.58964157104492, "global_step": 340449, "epoch": 2813} {"train_loss": -43.876434326171875, "global_step": 340450, "epoch": 2813} {"train_loss": -44.409034729003906, "global_step": 340451, "epoch": 2813} {"train_loss": -43.83164978027344, "global_step": 340452, "epoch": 2813} {"train_loss": -44.019020080566406, "global_step": 340453, "epoch": 2813} {"train_loss": -44.33477783203125, "global_step": 340454, "epoch": 2813} {"train_loss": -44.177406311035156, "global_step": 340455, "epoch": 2813} {"train_loss": -44.46566390991211, "global_step": 340456, "epoch": 2813} {"train_loss": -44.31814193725586, "global_step": 340457, "epoch": 2813} {"train_loss": -42.81874465942383, "global_step": 340458, "epoch": 2813} {"train_loss": -44.41084671020508, "global_step": 340459, "epoch": 2813} {"train_loss": -45.299747467041016, "global_step": 340460, "epoch": 2813} {"train_loss": -44.423988342285156, "global_step": 340461, "epoch": 2813} {"train_loss": -44.86500930786133, "global_step": 340462, "epoch": 2813} {"train_loss": -44.00592041015625, "global_step": 340463, "epoch": 2813} {"train_loss": -44.54289627075195, "global_step": 340464, "epoch": 2813} {"train_loss": -44.45503616333008, "global_step": 340465, "epoch": 2813} {"train_loss": -44.694541931152344, "global_step": 340466, "epoch": 2813} {"train_loss": -45.141380310058594, "global_step": 340467, "epoch": 2813} {"train_loss": -44.89654541015625, "global_step": 340468, "epoch": 2813} {"train_loss": -44.98749923706055, "global_step": 340469, "epoch": 2813} {"train_loss": -45.07365036010742, "global_step": 340470, "epoch": 2813} {"train_loss": -44.777069091796875, "global_step": 340471, "epoch": 2813} {"train_loss": -44.59101486206055, "global_step": 340472, "epoch": 2813} {"train_loss": -45.027889251708984, "global_step": 340473, "epoch": 2813} {"train_loss": -44.44480514526367, "global_step": 340474, "epoch": 2813} {"train_loss": -44.94570541381836, "global_step": 340475, "epoch": 2813} {"train_loss": -44.877567291259766, "global_step": 340476, "epoch": 2813} {"train_loss": -44.67660903930664, "global_step": 340477, "epoch": 2813} {"train_loss": -45.06630325317383, "global_step": 340478, "epoch": 2813} {"train_loss": -45.160858154296875, "global_step": 340479, "epoch": 2813} {"train_loss": -44.381690979003906, "global_step": 340480, "epoch": 2813} {"train_loss": -45.03175735473633, "global_step": 340481, "epoch": 2813} {"train_loss": -44.71151351928711, "global_step": 340482, "epoch": 2813} {"train_loss": -44.44071578979492, "global_step": 340483, "epoch": 2813} {"train_loss": -44.573143005371094, "global_step": 340484, "epoch": 2813} {"train_loss": -45.65932083129883, "global_step": 340485, "epoch": 2813} {"train_loss": -45.1848030090332, "global_step": 340486, "epoch": 2813} {"train_loss": -44.61147689819336, "global_step": 340487, "epoch": 2813} {"train_loss": -45.29004669189453, "global_step": 340488, "epoch": 2813} {"train_loss": -45.5596809387207, "global_step": 340489, "epoch": 2813} {"train_loss": -44.20817184448242, "global_step": 340490, "epoch": 2813} {"train_loss": -45.0203742980957, "global_step": 340491, "epoch": 2813} {"train_loss": -43.942283630371094, "global_step": 340492, "epoch": 2813} {"train_loss": -43.78860457869601, "global_step": 340493, "epoch": 2813, "val_loss": 2648166.75} {"train_loss": -44.195064544677734, "global_step": 340494, "epoch": 2814} {"train_loss": -44.75791549682617, "global_step": 340495, "epoch": 2814} {"train_loss": -44.64119338989258, "global_step": 340496, "epoch": 2814} {"train_loss": -43.9593620300293, "global_step": 340497, "epoch": 2814} {"train_loss": -44.39094543457031, "global_step": 340498, "epoch": 2814} {"train_loss": -44.13389205932617, "global_step": 340499, "epoch": 2814} {"train_loss": -44.40364456176758, "global_step": 340500, "epoch": 2814} {"train_loss": -44.63511276245117, "global_step": 340501, "epoch": 2814} {"train_loss": -44.15642166137695, "global_step": 340502, "epoch": 2814} {"train_loss": -44.419010162353516, "global_step": 340503, "epoch": 2814} {"train_loss": -43.28652572631836, "global_step": 340504, "epoch": 2814} {"train_loss": -43.690975189208984, "global_step": 340505, "epoch": 2814} {"train_loss": -44.22273254394531, "global_step": 340506, "epoch": 2814} {"train_loss": -44.73440170288086, "global_step": 340507, "epoch": 2814} {"train_loss": -44.06332778930664, "global_step": 340508, "epoch": 2814} {"train_loss": -44.614990234375, "global_step": 340509, "epoch": 2814} {"train_loss": -41.81904220581055, "global_step": 340510, "epoch": 2814} {"train_loss": -43.54545974731445, "global_step": 340511, "epoch": 2814} {"train_loss": -44.79872512817383, "global_step": 340512, "epoch": 2814} {"train_loss": -43.597137451171875, "global_step": 340513, "epoch": 2814} {"train_loss": -43.34761428833008, "global_step": 340514, "epoch": 2814} {"train_loss": -44.17317581176758, "global_step": 340515, "epoch": 2814} {"train_loss": -42.856101989746094, "global_step": 340516, "epoch": 2814} {"train_loss": -43.51552963256836, "global_step": 340517, "epoch": 2814} {"train_loss": -44.659812927246094, "global_step": 340518, "epoch": 2814} {"train_loss": -43.395057678222656, "global_step": 340519, "epoch": 2814} {"train_loss": -44.56559371948242, "global_step": 340520, "epoch": 2814} {"train_loss": -44.01405715942383, "global_step": 340521, "epoch": 2814} {"train_loss": -44.262359619140625, "global_step": 340522, "epoch": 2814} {"train_loss": -43.478965759277344, "global_step": 340523, "epoch": 2814} {"train_loss": -44.840187072753906, "global_step": 340524, "epoch": 2814} {"train_loss": -44.71255111694336, "global_step": 340525, "epoch": 2814} {"train_loss": -44.67601013183594, "global_step": 340526, "epoch": 2814} {"train_loss": -45.12473678588867, "global_step": 340527, "epoch": 2814} {"train_loss": -45.58997344970703, "global_step": 340528, "epoch": 2814} {"train_loss": -45.555030822753906, "global_step": 340529, "epoch": 2814} {"train_loss": -45.118560791015625, "global_step": 340530, "epoch": 2814} {"train_loss": -44.6467170715332, "global_step": 340531, "epoch": 2814} {"train_loss": -44.49984359741211, "global_step": 340532, "epoch": 2814} {"train_loss": -45.07892608642578, "global_step": 340533, "epoch": 2814} {"train_loss": -44.693389892578125, "global_step": 340534, "epoch": 2814} {"train_loss": -45.16366195678711, "global_step": 340535, "epoch": 2814} {"train_loss": -44.62922286987305, "global_step": 340536, "epoch": 2814} {"train_loss": -44.05240249633789, "global_step": 340537, "epoch": 2814} {"train_loss": -44.270992279052734, "global_step": 340538, "epoch": 2814} {"train_loss": -44.40144729614258, "global_step": 340539, "epoch": 2814} {"train_loss": -44.63808059692383, "global_step": 340540, "epoch": 2814} {"train_loss": -44.51568603515625, "global_step": 340541, "epoch": 2814} {"train_loss": -45.03553771972656, "global_step": 340542, "epoch": 2814} {"train_loss": -45.38519287109375, "global_step": 340543, "epoch": 2814} {"train_loss": -44.504234313964844, "global_step": 340544, "epoch": 2814} {"train_loss": -45.273555755615234, "global_step": 340545, "epoch": 2814} {"train_loss": -44.8939323425293, "global_step": 340546, "epoch": 2814} {"train_loss": -45.04069137573242, "global_step": 340547, "epoch": 2814} {"train_loss": -45.5083122253418, "global_step": 340548, "epoch": 2814} {"train_loss": -44.705970764160156, "global_step": 340549, "epoch": 2814} {"train_loss": -44.49055099487305, "global_step": 340550, "epoch": 2814} {"train_loss": -45.61311340332031, "global_step": 340551, "epoch": 2814} {"train_loss": -44.233924865722656, "global_step": 340552, "epoch": 2814} {"train_loss": -43.038055419921875, "global_step": 340553, "epoch": 2814} {"train_loss": -45.00837707519531, "global_step": 340554, "epoch": 2814} {"train_loss": -43.401424407958984, "global_step": 340555, "epoch": 2814} {"train_loss": -43.87818908691406, "global_step": 340556, "epoch": 2814} {"train_loss": -45.05808639526367, "global_step": 340557, "epoch": 2814} {"train_loss": -42.05088424682617, "global_step": 340558, "epoch": 2814} {"train_loss": -41.256385803222656, "global_step": 340559, "epoch": 2814} {"train_loss": -43.788490295410156, "global_step": 340560, "epoch": 2814} {"train_loss": -40.54994583129883, "global_step": 340561, "epoch": 2814} {"train_loss": -42.828163146972656, "global_step": 340562, "epoch": 2814} {"train_loss": -43.167476654052734, "global_step": 340563, "epoch": 2814} {"train_loss": -42.23382568359375, "global_step": 340564, "epoch": 2814} {"train_loss": -43.73085021972656, "global_step": 340565, "epoch": 2814} {"train_loss": -43.30669021606445, "global_step": 340566, "epoch": 2814} {"train_loss": -41.76952362060547, "global_step": 340567, "epoch": 2814} {"train_loss": -44.00783157348633, "global_step": 340568, "epoch": 2814} {"train_loss": -42.24544143676758, "global_step": 340569, "epoch": 2814} {"train_loss": -43.763282775878906, "global_step": 340570, "epoch": 2814} {"train_loss": -43.37971878051758, "global_step": 340571, "epoch": 2814} {"train_loss": -43.69906234741211, "global_step": 340572, "epoch": 2814} {"train_loss": -44.57344436645508, "global_step": 340573, "epoch": 2814} {"train_loss": -43.95565414428711, "global_step": 340574, "epoch": 2814} {"train_loss": -42.88410568237305, "global_step": 340575, "epoch": 2814} {"train_loss": -42.98582077026367, "global_step": 340576, "epoch": 2814} {"train_loss": -43.57821273803711, "global_step": 340577, "epoch": 2814} {"train_loss": -42.7557373046875, "global_step": 340578, "epoch": 2814} {"train_loss": -42.97270584106445, "global_step": 340579, "epoch": 2814} {"train_loss": -43.34583282470703, "global_step": 340580, "epoch": 2814} {"train_loss": -43.48763656616211, "global_step": 340581, "epoch": 2814} {"train_loss": -43.731075286865234, "global_step": 340582, "epoch": 2814} {"train_loss": -44.54703140258789, "global_step": 340583, "epoch": 2814} {"train_loss": -43.766841888427734, "global_step": 340584, "epoch": 2814} {"train_loss": -44.94466781616211, "global_step": 340585, "epoch": 2814} {"train_loss": -44.11144256591797, "global_step": 340586, "epoch": 2814} {"train_loss": -44.21197509765625, "global_step": 340587, "epoch": 2814} {"train_loss": -44.54901123046875, "global_step": 340588, "epoch": 2814} {"train_loss": -43.92312240600586, "global_step": 340589, "epoch": 2814} {"train_loss": -44.90681076049805, "global_step": 340590, "epoch": 2814} {"train_loss": -44.283565521240234, "global_step": 340591, "epoch": 2814} {"train_loss": -44.33012008666992, "global_step": 340592, "epoch": 2814} {"train_loss": -44.60590744018555, "global_step": 340593, "epoch": 2814} {"train_loss": -44.065773010253906, "global_step": 340594, "epoch": 2814} {"train_loss": -44.844783782958984, "global_step": 340595, "epoch": 2814} {"train_loss": -44.181583404541016, "global_step": 340596, "epoch": 2814} {"train_loss": -44.6619987487793, "global_step": 340597, "epoch": 2814} {"train_loss": -44.92194366455078, "global_step": 340598, "epoch": 2814} {"train_loss": -44.06183624267578, "global_step": 340599, "epoch": 2814} {"train_loss": -43.979225158691406, "global_step": 340600, "epoch": 2814} {"train_loss": -43.68525695800781, "global_step": 340601, "epoch": 2814} {"train_loss": -44.106842041015625, "global_step": 340602, "epoch": 2814} {"train_loss": -43.864044189453125, "global_step": 340603, "epoch": 2814} {"train_loss": -43.6038932800293, "global_step": 340604, "epoch": 2814} {"train_loss": -43.05988311767578, "global_step": 340605, "epoch": 2814} {"train_loss": -43.32421875, "global_step": 340606, "epoch": 2814} {"train_loss": -44.39604568481445, "global_step": 340607, "epoch": 2814} {"train_loss": -44.51020431518555, "global_step": 340608, "epoch": 2814} {"train_loss": -43.009944915771484, "global_step": 340609, "epoch": 2814} {"train_loss": -43.7401008605957, "global_step": 340610, "epoch": 2814} {"train_loss": -44.1474723815918, "global_step": 340611, "epoch": 2814} {"train_loss": -44.3036994934082, "global_step": 340612, "epoch": 2814} {"train_loss": -43.65688705444336, "global_step": 340613, "epoch": 2814} {"train_loss": -44.05493718927557, "global_step": 340614, "epoch": 2814, "val_loss": 2708726.25} {"train_loss": -44.27357864379883, "global_step": 340615, "epoch": 2815} {"train_loss": -44.56383514404297, "global_step": 340616, "epoch": 2815} {"train_loss": -44.93848419189453, "global_step": 340617, "epoch": 2815} {"train_loss": -44.07966232299805, "global_step": 340618, "epoch": 2815} {"train_loss": -44.96462631225586, "global_step": 340619, "epoch": 2815} {"train_loss": -44.481788635253906, "global_step": 340620, "epoch": 2815} {"train_loss": -44.93897247314453, "global_step": 340621, "epoch": 2815} {"train_loss": -44.7918815612793, "global_step": 340622, "epoch": 2815} {"train_loss": -44.84641647338867, "global_step": 340623, "epoch": 2815} {"train_loss": -44.716068267822266, "global_step": 340624, "epoch": 2815} {"train_loss": -44.98342514038086, "global_step": 340625, "epoch": 2815} {"train_loss": -44.48672866821289, "global_step": 340626, "epoch": 2815} {"train_loss": -44.5644645690918, "global_step": 340627, "epoch": 2815} {"train_loss": -45.2253532409668, "global_step": 340628, "epoch": 2815} {"train_loss": -44.5637092590332, "global_step": 340629, "epoch": 2815} {"train_loss": -45.052730560302734, "global_step": 340630, "epoch": 2815} {"train_loss": -44.533409118652344, "global_step": 340631, "epoch": 2815} {"train_loss": -45.002254486083984, "global_step": 340632, "epoch": 2815} {"train_loss": -44.960105895996094, "global_step": 340633, "epoch": 2815} {"train_loss": -45.118656158447266, "global_step": 340634, "epoch": 2815} {"train_loss": -45.119903564453125, "global_step": 340635, "epoch": 2815} {"train_loss": -44.81013107299805, "global_step": 340636, "epoch": 2815} {"train_loss": -44.90183639526367, "global_step": 340637, "epoch": 2815} {"train_loss": -45.2589225769043, "global_step": 340638, "epoch": 2815} {"train_loss": -45.11785888671875, "global_step": 340639, "epoch": 2815} {"train_loss": -44.82293701171875, "global_step": 340640, "epoch": 2815} {"train_loss": -45.39396286010742, "global_step": 340641, "epoch": 2815} {"train_loss": -45.31842041015625, "global_step": 340642, "epoch": 2815} {"train_loss": -44.01912307739258, "global_step": 340643, "epoch": 2815} {"train_loss": -44.616668701171875, "global_step": 340644, "epoch": 2815} {"train_loss": -44.25800323486328, "global_step": 340645, "epoch": 2815} {"train_loss": -42.60719680786133, "global_step": 340646, "epoch": 2815} {"train_loss": -43.46525192260742, "global_step": 340647, "epoch": 2815} {"train_loss": -43.24082565307617, "global_step": 340648, "epoch": 2815} {"train_loss": -41.88698959350586, "global_step": 340649, "epoch": 2815} {"train_loss": -44.26986312866211, "global_step": 340650, "epoch": 2815} {"train_loss": -44.12662887573242, "global_step": 340651, "epoch": 2815} {"train_loss": -42.50728988647461, "global_step": 340652, "epoch": 2815} {"train_loss": -44.554359436035156, "global_step": 340653, "epoch": 2815} {"train_loss": -43.35139846801758, "global_step": 340654, "epoch": 2815} {"train_loss": -43.47788619995117, "global_step": 340655, "epoch": 2815} {"train_loss": -44.84381103515625, "global_step": 340656, "epoch": 2815} {"train_loss": -41.809730529785156, "global_step": 340657, "epoch": 2815} {"train_loss": -42.3946418762207, "global_step": 340658, "epoch": 2815} {"train_loss": -44.24689483642578, "global_step": 340659, "epoch": 2815} {"train_loss": -42.87014389038086, "global_step": 340660, "epoch": 2815} {"train_loss": -42.821815490722656, "global_step": 340661, "epoch": 2815} {"train_loss": -44.18569564819336, "global_step": 340662, "epoch": 2815} {"train_loss": -42.155860900878906, "global_step": 340663, "epoch": 2815} {"train_loss": -41.1511116027832, "global_step": 340664, "epoch": 2815} {"train_loss": -43.77976989746094, "global_step": 340665, "epoch": 2815} {"train_loss": -42.636268615722656, "global_step": 340666, "epoch": 2815} {"train_loss": -42.180641174316406, "global_step": 340667, "epoch": 2815} {"train_loss": -42.471248626708984, "global_step": 340668, "epoch": 2815} {"train_loss": -43.98202896118164, "global_step": 340669, "epoch": 2815} {"train_loss": -43.4393310546875, "global_step": 340670, "epoch": 2815} {"train_loss": -43.67573165893555, "global_step": 340671, "epoch": 2815} {"train_loss": -42.8651237487793, "global_step": 340672, "epoch": 2815} {"train_loss": -44.4553337097168, "global_step": 340673, "epoch": 2815} {"train_loss": -42.05792999267578, "global_step": 340674, "epoch": 2815} {"train_loss": -42.31901168823242, "global_step": 340675, "epoch": 2815} {"train_loss": -44.518348693847656, "global_step": 340676, "epoch": 2815} {"train_loss": -43.17959213256836, "global_step": 340677, "epoch": 2815} {"train_loss": -44.085872650146484, "global_step": 340678, "epoch": 2815} {"train_loss": -42.885841369628906, "global_step": 340679, "epoch": 2815} {"train_loss": -44.047821044921875, "global_step": 340680, "epoch": 2815} {"train_loss": -43.552242279052734, "global_step": 340681, "epoch": 2815} {"train_loss": -42.87465286254883, "global_step": 340682, "epoch": 2815} {"train_loss": -44.2337646484375, "global_step": 340683, "epoch": 2815} {"train_loss": -42.6345329284668, "global_step": 340684, "epoch": 2815} {"train_loss": -43.849403381347656, "global_step": 340685, "epoch": 2815} {"train_loss": -43.582794189453125, "global_step": 340686, "epoch": 2815} {"train_loss": -44.035762786865234, "global_step": 340687, "epoch": 2815} {"train_loss": -43.23895263671875, "global_step": 340688, "epoch": 2815} {"train_loss": -43.52623748779297, "global_step": 340689, "epoch": 2815} {"train_loss": -44.225040435791016, "global_step": 340690, "epoch": 2815} {"train_loss": -44.14594650268555, "global_step": 340691, "epoch": 2815} {"train_loss": -44.84528350830078, "global_step": 340692, "epoch": 2815} {"train_loss": -44.3199577331543, "global_step": 340693, "epoch": 2815} {"train_loss": -43.917633056640625, "global_step": 340694, "epoch": 2815} {"train_loss": -44.377769470214844, "global_step": 340695, "epoch": 2815} {"train_loss": -45.249473571777344, "global_step": 340696, "epoch": 2815} {"train_loss": -44.478546142578125, "global_step": 340697, "epoch": 2815} {"train_loss": -44.398345947265625, "global_step": 340698, "epoch": 2815} {"train_loss": -44.90189743041992, "global_step": 340699, "epoch": 2815} {"train_loss": -44.315059661865234, "global_step": 340700, "epoch": 2815} {"train_loss": -44.86640167236328, "global_step": 340701, "epoch": 2815} {"train_loss": -44.584102630615234, "global_step": 340702, "epoch": 2815} {"train_loss": -44.772823333740234, "global_step": 340703, "epoch": 2815} {"train_loss": -45.314430236816406, "global_step": 340704, "epoch": 2815} {"train_loss": -44.854434967041016, "global_step": 340705, "epoch": 2815} {"train_loss": -45.261409759521484, "global_step": 340706, "epoch": 2815} {"train_loss": -44.96638488769531, "global_step": 340707, "epoch": 2815} {"train_loss": -44.61418914794922, "global_step": 340708, "epoch": 2815} {"train_loss": -44.77923583984375, "global_step": 340709, "epoch": 2815} {"train_loss": -45.534664154052734, "global_step": 340710, "epoch": 2815} {"train_loss": -44.9941520690918, "global_step": 340711, "epoch": 2815} {"train_loss": -44.905635833740234, "global_step": 340712, "epoch": 2815} {"train_loss": -44.606937408447266, "global_step": 340713, "epoch": 2815} {"train_loss": -45.30060577392578, "global_step": 340714, "epoch": 2815} {"train_loss": -45.17924118041992, "global_step": 340715, "epoch": 2815} {"train_loss": -45.130550384521484, "global_step": 340716, "epoch": 2815} {"train_loss": -45.46506118774414, "global_step": 340717, "epoch": 2815} {"train_loss": -45.520782470703125, "global_step": 340718, "epoch": 2815} {"train_loss": -45.77907180786133, "global_step": 340719, "epoch": 2815} {"train_loss": -44.75196075439453, "global_step": 340720, "epoch": 2815} {"train_loss": -45.7198371887207, "global_step": 340721, "epoch": 2815} {"train_loss": -45.118568420410156, "global_step": 340722, "epoch": 2815} {"train_loss": -45.21561813354492, "global_step": 340723, "epoch": 2815} {"train_loss": -45.125038146972656, "global_step": 340724, "epoch": 2815} {"train_loss": -45.07960891723633, "global_step": 340725, "epoch": 2815} {"train_loss": -45.51715087890625, "global_step": 340726, "epoch": 2815} {"train_loss": -45.03506088256836, "global_step": 340727, "epoch": 2815} {"train_loss": -45.059078216552734, "global_step": 340728, "epoch": 2815} {"train_loss": -44.84615707397461, "global_step": 340729, "epoch": 2815} {"train_loss": -44.217098236083984, "global_step": 340730, "epoch": 2815} {"train_loss": -43.80786895751953, "global_step": 340731, "epoch": 2815} {"train_loss": -44.141578674316406, "global_step": 340732, "epoch": 2815} {"train_loss": -43.813720703125, "global_step": 340733, "epoch": 2815} {"train_loss": -43.73081588745117, "global_step": 340734, "epoch": 2815} {"train_loss": -44.250662685425816, "global_step": 340735, "epoch": 2815, "val_loss": 2647984.25} {"train_loss": -44.34070587158203, "global_step": 340736, "epoch": 2816} {"train_loss": -43.79928207397461, "global_step": 340737, "epoch": 2816} {"train_loss": -44.2767448425293, "global_step": 340738, "epoch": 2816} {"train_loss": -44.084861755371094, "global_step": 340739, "epoch": 2816} {"train_loss": -44.8197021484375, "global_step": 340740, "epoch": 2816} {"train_loss": -44.64017105102539, "global_step": 340741, "epoch": 2816} {"train_loss": -44.36491394042969, "global_step": 340742, "epoch": 2816} {"train_loss": -42.43675994873047, "global_step": 340743, "epoch": 2816} {"train_loss": -43.40017318725586, "global_step": 340744, "epoch": 2816} {"train_loss": -43.80533218383789, "global_step": 340745, "epoch": 2816} {"train_loss": -41.453792572021484, "global_step": 340746, "epoch": 2816} {"train_loss": -44.2067756652832, "global_step": 340747, "epoch": 2816} {"train_loss": -42.33647918701172, "global_step": 340748, "epoch": 2816} {"train_loss": -43.02542495727539, "global_step": 340749, "epoch": 2816} {"train_loss": -42.923580169677734, "global_step": 340750, "epoch": 2816} {"train_loss": -42.2651481628418, "global_step": 340751, "epoch": 2816} {"train_loss": -43.322200775146484, "global_step": 340752, "epoch": 2816} {"train_loss": -43.303001403808594, "global_step": 340753, "epoch": 2816} {"train_loss": -41.602149963378906, "global_step": 340754, "epoch": 2816} {"train_loss": -43.78438186645508, "global_step": 340755, "epoch": 2816} {"train_loss": -42.71851348876953, "global_step": 340756, "epoch": 2816} {"train_loss": -44.227264404296875, "global_step": 340757, "epoch": 2816} {"train_loss": -43.404815673828125, "global_step": 340758, "epoch": 2816} {"train_loss": -42.38282775878906, "global_step": 340759, "epoch": 2816} {"train_loss": -42.45698165893555, "global_step": 340760, "epoch": 2816} {"train_loss": -43.30093002319336, "global_step": 340761, "epoch": 2816} {"train_loss": -43.23762130737305, "global_step": 340762, "epoch": 2816} {"train_loss": -43.26448059082031, "global_step": 340763, "epoch": 2816} {"train_loss": -43.31515121459961, "global_step": 340764, "epoch": 2816} {"train_loss": -43.48389434814453, "global_step": 340765, "epoch": 2816} {"train_loss": -44.32883834838867, "global_step": 340766, "epoch": 2816} {"train_loss": -43.343536376953125, "global_step": 340767, "epoch": 2816} {"train_loss": -43.255104064941406, "global_step": 340768, "epoch": 2816} {"train_loss": -44.48883819580078, "global_step": 340769, "epoch": 2816} {"train_loss": -43.85524368286133, "global_step": 340770, "epoch": 2816} {"train_loss": -44.09576416015625, "global_step": 340771, "epoch": 2816} {"train_loss": -43.43121337890625, "global_step": 340772, "epoch": 2816} {"train_loss": -44.07558822631836, "global_step": 340773, "epoch": 2816} {"train_loss": -43.90632247924805, "global_step": 340774, "epoch": 2816} {"train_loss": -43.43618392944336, "global_step": 340775, "epoch": 2816} {"train_loss": -43.72507858276367, "global_step": 340776, "epoch": 2816} {"train_loss": -43.799537658691406, "global_step": 340777, "epoch": 2816} {"train_loss": -43.438289642333984, "global_step": 340778, "epoch": 2816} {"train_loss": -44.51546096801758, "global_step": 340779, "epoch": 2816} {"train_loss": -44.03123092651367, "global_step": 340780, "epoch": 2816} {"train_loss": -43.370941162109375, "global_step": 340781, "epoch": 2816} {"train_loss": -44.244903564453125, "global_step": 340782, "epoch": 2816} {"train_loss": -42.986366271972656, "global_step": 340783, "epoch": 2816} {"train_loss": -44.374916076660156, "global_step": 340784, "epoch": 2816} {"train_loss": -44.059242248535156, "global_step": 340785, "epoch": 2816} {"train_loss": -44.22235107421875, "global_step": 340786, "epoch": 2816} {"train_loss": -43.2512321472168, "global_step": 340787, "epoch": 2816} {"train_loss": -43.861976623535156, "global_step": 340788, "epoch": 2816} {"train_loss": -43.448604583740234, "global_step": 340789, "epoch": 2816} {"train_loss": -43.81538772583008, "global_step": 340790, "epoch": 2816} {"train_loss": -44.73603439331055, "global_step": 340791, "epoch": 2816} {"train_loss": -43.25685119628906, "global_step": 340792, "epoch": 2816} {"train_loss": -44.57383346557617, "global_step": 340793, "epoch": 2816} {"train_loss": -43.26633834838867, "global_step": 340794, "epoch": 2816} {"train_loss": -44.36564636230469, "global_step": 340795, "epoch": 2816} {"train_loss": -43.874210357666016, "global_step": 340796, "epoch": 2816} {"train_loss": -44.513763427734375, "global_step": 340797, "epoch": 2816} {"train_loss": -44.12953567504883, "global_step": 340798, "epoch": 2816} {"train_loss": -44.476600646972656, "global_step": 340799, "epoch": 2816} {"train_loss": -43.94240951538086, "global_step": 340800, "epoch": 2816} {"train_loss": -44.852596282958984, "global_step": 340801, "epoch": 2816} {"train_loss": -44.61005783081055, "global_step": 340802, "epoch": 2816} {"train_loss": -44.8784294128418, "global_step": 340803, "epoch": 2816} {"train_loss": -44.611202239990234, "global_step": 340804, "epoch": 2816} {"train_loss": -44.33602523803711, "global_step": 340805, "epoch": 2816} {"train_loss": -45.03885269165039, "global_step": 340806, "epoch": 2816} {"train_loss": -44.4431037902832, "global_step": 340807, "epoch": 2816} {"train_loss": -44.96284103393555, "global_step": 340808, "epoch": 2816} {"train_loss": -45.32177734375, "global_step": 340809, "epoch": 2816} {"train_loss": -45.43824768066406, "global_step": 340810, "epoch": 2816} {"train_loss": -45.20135498046875, "global_step": 340811, "epoch": 2816} {"train_loss": -45.315711975097656, "global_step": 340812, "epoch": 2816} {"train_loss": -45.29102325439453, "global_step": 340813, "epoch": 2816} {"train_loss": -45.46940612792969, "global_step": 340814, "epoch": 2816} {"train_loss": -45.546119689941406, "global_step": 340815, "epoch": 2816} {"train_loss": -45.3846549987793, "global_step": 340816, "epoch": 2816} {"train_loss": -45.38836669921875, "global_step": 340817, "epoch": 2816} {"train_loss": -44.81177520751953, "global_step": 340818, "epoch": 2816} {"train_loss": -45.62905502319336, "global_step": 340819, "epoch": 2816} {"train_loss": -45.44382858276367, "global_step": 340820, "epoch": 2816} {"train_loss": -45.45313262939453, "global_step": 340821, "epoch": 2816} {"train_loss": -45.88203811645508, "global_step": 340822, "epoch": 2816} {"train_loss": -45.938716888427734, "global_step": 340823, "epoch": 2816} {"train_loss": -45.5538215637207, "global_step": 340824, "epoch": 2816} {"train_loss": -44.36669921875, "global_step": 340825, "epoch": 2816} {"train_loss": -44.63420486450195, "global_step": 340826, "epoch": 2816} {"train_loss": -44.574302673339844, "global_step": 340827, "epoch": 2816} {"train_loss": -44.96799850463867, "global_step": 340828, "epoch": 2816} {"train_loss": -45.3602294921875, "global_step": 340829, "epoch": 2816} {"train_loss": -44.316795349121094, "global_step": 340830, "epoch": 2816} {"train_loss": -45.391998291015625, "global_step": 340831, "epoch": 2816} {"train_loss": -44.99656295776367, "global_step": 340832, "epoch": 2816} {"train_loss": -44.926551818847656, "global_step": 340833, "epoch": 2816} {"train_loss": -44.73359680175781, "global_step": 340834, "epoch": 2816} {"train_loss": -43.65439987182617, "global_step": 340835, "epoch": 2816} {"train_loss": -44.297462463378906, "global_step": 340836, "epoch": 2816} {"train_loss": -44.898223876953125, "global_step": 340837, "epoch": 2816} {"train_loss": -43.49634552001953, "global_step": 340838, "epoch": 2816} {"train_loss": -43.31008529663086, "global_step": 340839, "epoch": 2816} {"train_loss": -43.7474365234375, "global_step": 340840, "epoch": 2816} {"train_loss": -43.694156646728516, "global_step": 340841, "epoch": 2816} {"train_loss": -43.30396270751953, "global_step": 340842, "epoch": 2816} {"train_loss": -41.76763916015625, "global_step": 340843, "epoch": 2816} {"train_loss": -41.98833084106445, "global_step": 340844, "epoch": 2816} {"train_loss": -43.2773551940918, "global_step": 340845, "epoch": 2816} {"train_loss": -44.13208770751953, "global_step": 340846, "epoch": 2816} {"train_loss": -43.93939208984375, "global_step": 340847, "epoch": 2816} {"train_loss": -44.68837356567383, "global_step": 340848, "epoch": 2816} {"train_loss": -42.32099533081055, "global_step": 340849, "epoch": 2816} {"train_loss": -43.31892395019531, "global_step": 340850, "epoch": 2816} {"train_loss": -42.751220703125, "global_step": 340851, "epoch": 2816} {"train_loss": -44.02782440185547, "global_step": 340852, "epoch": 2816} {"train_loss": -43.14904022216797, "global_step": 340853, "epoch": 2816} {"train_loss": -43.69712448120117, "global_step": 340854, "epoch": 2816} {"train_loss": -44.15676498413086, "global_step": 340855, "epoch": 2816} {"train_loss": -44.01989815451882, "global_step": 340856, "epoch": 2816, "val_loss": 2644252.75} {"train_loss": -43.197628021240234, "global_step": 340857, "epoch": 2817} {"train_loss": -43.20085906982422, "global_step": 340858, "epoch": 2817} {"train_loss": -43.68769073486328, "global_step": 340859, "epoch": 2817} {"train_loss": -43.485748291015625, "global_step": 340860, "epoch": 2817} {"train_loss": -44.996551513671875, "global_step": 340861, "epoch": 2817} {"train_loss": -44.35979080200195, "global_step": 340862, "epoch": 2817} {"train_loss": -43.934852600097656, "global_step": 340863, "epoch": 2817} {"train_loss": -44.67428207397461, "global_step": 340864, "epoch": 2817} {"train_loss": -43.92142868041992, "global_step": 340865, "epoch": 2817} {"train_loss": -43.867340087890625, "global_step": 340866, "epoch": 2817} {"train_loss": -44.62726974487305, "global_step": 340867, "epoch": 2817} {"train_loss": -43.55073928833008, "global_step": 340868, "epoch": 2817} {"train_loss": -44.12296676635742, "global_step": 340869, "epoch": 2817} {"train_loss": -44.13261032104492, "global_step": 340870, "epoch": 2817} {"train_loss": -43.39894485473633, "global_step": 340871, "epoch": 2817} {"train_loss": -43.51799392700195, "global_step": 340872, "epoch": 2817} {"train_loss": -43.60079574584961, "global_step": 340873, "epoch": 2817} {"train_loss": -44.276527404785156, "global_step": 340874, "epoch": 2817} {"train_loss": -44.503883361816406, "global_step": 340875, "epoch": 2817} {"train_loss": -44.317604064941406, "global_step": 340876, "epoch": 2817} {"train_loss": -43.9831657409668, "global_step": 340877, "epoch": 2817} {"train_loss": -44.55790328979492, "global_step": 340878, "epoch": 2817} {"train_loss": -43.473995208740234, "global_step": 340879, "epoch": 2817} {"train_loss": -43.325645446777344, "global_step": 340880, "epoch": 2817} {"train_loss": -43.486995697021484, "global_step": 340881, "epoch": 2817} {"train_loss": -43.691593170166016, "global_step": 340882, "epoch": 2817} {"train_loss": -42.35719680786133, "global_step": 340883, "epoch": 2817} {"train_loss": -43.49523162841797, "global_step": 340884, "epoch": 2817} {"train_loss": -43.2918586730957, "global_step": 340885, "epoch": 2817} {"train_loss": -42.96725082397461, "global_step": 340886, "epoch": 2817} {"train_loss": -41.4194450378418, "global_step": 340887, "epoch": 2817} {"train_loss": -44.275142669677734, "global_step": 340888, "epoch": 2817} {"train_loss": -41.37618637084961, "global_step": 340889, "epoch": 2817} {"train_loss": -43.623531341552734, "global_step": 340890, "epoch": 2817} {"train_loss": -42.15155792236328, "global_step": 340891, "epoch": 2817} {"train_loss": -43.85357666015625, "global_step": 340892, "epoch": 2817} {"train_loss": -41.23691940307617, "global_step": 340893, "epoch": 2817} {"train_loss": -43.966827392578125, "global_step": 340894, "epoch": 2817} {"train_loss": -43.84634017944336, "global_step": 340895, "epoch": 2817} {"train_loss": -42.725013732910156, "global_step": 340896, "epoch": 2817} {"train_loss": -44.07854461669922, "global_step": 340897, "epoch": 2817} {"train_loss": -43.813453674316406, "global_step": 340898, "epoch": 2817} {"train_loss": -43.62677001953125, "global_step": 340899, "epoch": 2817} {"train_loss": -43.18910217285156, "global_step": 340900, "epoch": 2817} {"train_loss": -44.49176788330078, "global_step": 340901, "epoch": 2817} {"train_loss": -43.72837448120117, "global_step": 340902, "epoch": 2817} {"train_loss": -43.62348556518555, "global_step": 340903, "epoch": 2817} {"train_loss": -44.742488861083984, "global_step": 340904, "epoch": 2817} {"train_loss": -44.388404846191406, "global_step": 340905, "epoch": 2817} {"train_loss": -44.2120246887207, "global_step": 340906, "epoch": 2817} {"train_loss": -43.744869232177734, "global_step": 340907, "epoch": 2817} {"train_loss": -45.135841369628906, "global_step": 340908, "epoch": 2817} {"train_loss": -43.65340042114258, "global_step": 340909, "epoch": 2817} {"train_loss": -44.033050537109375, "global_step": 340910, "epoch": 2817} {"train_loss": -44.254249572753906, "global_step": 340911, "epoch": 2817} {"train_loss": -44.6543083190918, "global_step": 340912, "epoch": 2817} {"train_loss": -44.56278991699219, "global_step": 340913, "epoch": 2817} {"train_loss": -44.70452880859375, "global_step": 340914, "epoch": 2817} {"train_loss": -44.95799255371094, "global_step": 340915, "epoch": 2817} {"train_loss": -44.45322036743164, "global_step": 340916, "epoch": 2817} {"train_loss": -45.084808349609375, "global_step": 340917, "epoch": 2817} {"train_loss": -44.897037506103516, "global_step": 340918, "epoch": 2817} {"train_loss": -45.051082611083984, "global_step": 340919, "epoch": 2817} {"train_loss": -44.97684860229492, "global_step": 340920, "epoch": 2817} {"train_loss": -44.91016387939453, "global_step": 340921, "epoch": 2817} {"train_loss": -45.113624572753906, "global_step": 340922, "epoch": 2817} {"train_loss": -45.022884368896484, "global_step": 340923, "epoch": 2817} {"train_loss": -45.24098587036133, "global_step": 340924, "epoch": 2817} {"train_loss": -44.665138244628906, "global_step": 340925, "epoch": 2817} {"train_loss": -45.4952507019043, "global_step": 340926, "epoch": 2817} {"train_loss": -45.173622131347656, "global_step": 340927, "epoch": 2817} {"train_loss": -45.36287307739258, "global_step": 340928, "epoch": 2817} {"train_loss": -45.49113845825195, "global_step": 340929, "epoch": 2817} {"train_loss": -45.59161376953125, "global_step": 340930, "epoch": 2817} {"train_loss": -45.82304000854492, "global_step": 340931, "epoch": 2817} {"train_loss": -45.4975471496582, "global_step": 340932, "epoch": 2817} {"train_loss": -45.283138275146484, "global_step": 340933, "epoch": 2817} {"train_loss": -44.844146728515625, "global_step": 340934, "epoch": 2817} {"train_loss": -45.720497131347656, "global_step": 340935, "epoch": 2817} {"train_loss": -45.26940155029297, "global_step": 340936, "epoch": 2817} {"train_loss": -44.55356979370117, "global_step": 340937, "epoch": 2817} {"train_loss": -44.7034912109375, "global_step": 340938, "epoch": 2817} {"train_loss": -45.21009826660156, "global_step": 340939, "epoch": 2817} {"train_loss": -44.9334831237793, "global_step": 340940, "epoch": 2817} {"train_loss": -45.1451530456543, "global_step": 340941, "epoch": 2817} {"train_loss": -45.0001106262207, "global_step": 340942, "epoch": 2817} {"train_loss": -45.4293212890625, "global_step": 340943, "epoch": 2817} {"train_loss": -45.31873321533203, "global_step": 340944, "epoch": 2817} {"train_loss": -44.532554626464844, "global_step": 340945, "epoch": 2817} {"train_loss": -44.93326187133789, "global_step": 340946, "epoch": 2817} {"train_loss": -45.497920989990234, "global_step": 340947, "epoch": 2817} {"train_loss": -44.878902435302734, "global_step": 340948, "epoch": 2817} {"train_loss": -44.62234115600586, "global_step": 340949, "epoch": 2817} {"train_loss": -45.39177703857422, "global_step": 340950, "epoch": 2817} {"train_loss": -44.60918045043945, "global_step": 340951, "epoch": 2817} {"train_loss": -45.327205657958984, "global_step": 340952, "epoch": 2817} {"train_loss": -45.316497802734375, "global_step": 340953, "epoch": 2817} {"train_loss": -44.432430267333984, "global_step": 340954, "epoch": 2817} {"train_loss": -44.13124084472656, "global_step": 340955, "epoch": 2817} {"train_loss": -45.231563568115234, "global_step": 340956, "epoch": 2817} {"train_loss": -45.63481521606445, "global_step": 340957, "epoch": 2817} {"train_loss": -45.14944076538086, "global_step": 340958, "epoch": 2817} {"train_loss": -45.32814407348633, "global_step": 340959, "epoch": 2817} {"train_loss": -45.396549224853516, "global_step": 340960, "epoch": 2817} {"train_loss": -44.624481201171875, "global_step": 340961, "epoch": 2817} {"train_loss": -45.25949478149414, "global_step": 340962, "epoch": 2817} {"train_loss": -44.40996170043945, "global_step": 340963, "epoch": 2817} {"train_loss": -44.62987518310547, "global_step": 340964, "epoch": 2817} {"train_loss": -45.00143051147461, "global_step": 340965, "epoch": 2817} {"train_loss": -45.58041000366211, "global_step": 340966, "epoch": 2817} {"train_loss": -44.058135986328125, "global_step": 340967, "epoch": 2817} {"train_loss": -44.35517120361328, "global_step": 340968, "epoch": 2817} {"train_loss": -45.24628448486328, "global_step": 340969, "epoch": 2817} {"train_loss": -45.75454330444336, "global_step": 340970, "epoch": 2817} {"train_loss": -44.08056640625, "global_step": 340971, "epoch": 2817} {"train_loss": -43.64528274536133, "global_step": 340972, "epoch": 2817} {"train_loss": -45.15484619140625, "global_step": 340973, "epoch": 2817} {"train_loss": -44.02080535888672, "global_step": 340974, "epoch": 2817} {"train_loss": -43.72747039794922, "global_step": 340975, "epoch": 2817} {"train_loss": -44.610008239746094, "global_step": 340976, "epoch": 2817} {"train_loss": -44.381154178587856, "global_step": 340977, "epoch": 2817, "val_loss": 2659348.25} {"train_loss": -43.163055419921875, "global_step": 340978, "epoch": 2818} {"train_loss": -45.07461929321289, "global_step": 340979, "epoch": 2818} {"train_loss": -43.10694122314453, "global_step": 340980, "epoch": 2818} {"train_loss": -42.602474212646484, "global_step": 340981, "epoch": 2818} {"train_loss": -44.53401565551758, "global_step": 340982, "epoch": 2818} {"train_loss": -43.07148361206055, "global_step": 340983, "epoch": 2818} {"train_loss": -42.74174499511719, "global_step": 340984, "epoch": 2818} {"train_loss": -42.8055534362793, "global_step": 340985, "epoch": 2818} {"train_loss": -44.249237060546875, "global_step": 340986, "epoch": 2818} {"train_loss": -44.07326126098633, "global_step": 340987, "epoch": 2818} {"train_loss": -43.281856536865234, "global_step": 340988, "epoch": 2818} {"train_loss": -43.77925491333008, "global_step": 340989, "epoch": 2818} {"train_loss": -44.057594299316406, "global_step": 340990, "epoch": 2818} {"train_loss": -44.59707260131836, "global_step": 340991, "epoch": 2818} {"train_loss": -44.611732482910156, "global_step": 340992, "epoch": 2818} {"train_loss": -43.470703125, "global_step": 340993, "epoch": 2818} {"train_loss": -43.96908187866211, "global_step": 340994, "epoch": 2818} {"train_loss": -44.472389221191406, "global_step": 340995, "epoch": 2818} {"train_loss": -43.547847747802734, "global_step": 340996, "epoch": 2818} {"train_loss": -43.99934005737305, "global_step": 340997, "epoch": 2818} {"train_loss": -43.88376998901367, "global_step": 340998, "epoch": 2818} {"train_loss": -44.41419982910156, "global_step": 340999, "epoch": 2818} {"train_loss": -44.294246673583984, "global_step": 341000, "epoch": 2818} {"train_loss": -42.68887710571289, "global_step": 341001, "epoch": 2818} {"train_loss": -42.19924545288086, "global_step": 341002, "epoch": 2818} {"train_loss": -44.374568939208984, "global_step": 341003, "epoch": 2818} {"train_loss": -43.936641693115234, "global_step": 341004, "epoch": 2818} {"train_loss": -44.43186569213867, "global_step": 341005, "epoch": 2818} {"train_loss": -44.7825813293457, "global_step": 341006, "epoch": 2818} {"train_loss": -44.73506164550781, "global_step": 341007, "epoch": 2818} {"train_loss": -44.259315490722656, "global_step": 341008, "epoch": 2818} {"train_loss": -44.9270133972168, "global_step": 341009, "epoch": 2818} {"train_loss": -42.726036071777344, "global_step": 341010, "epoch": 2818} {"train_loss": -44.67637252807617, "global_step": 341011, "epoch": 2818} {"train_loss": -43.77724838256836, "global_step": 341012, "epoch": 2818} {"train_loss": -43.73228073120117, "global_step": 341013, "epoch": 2818} {"train_loss": -45.26035690307617, "global_step": 341014, "epoch": 2818} {"train_loss": -44.7224235534668, "global_step": 341015, "epoch": 2818} {"train_loss": -44.576011657714844, "global_step": 341016, "epoch": 2818} {"train_loss": -44.6824836730957, "global_step": 341017, "epoch": 2818} {"train_loss": -44.713218688964844, "global_step": 341018, "epoch": 2818} {"train_loss": -44.979042053222656, "global_step": 341019, "epoch": 2818} {"train_loss": -45.08649826049805, "global_step": 341020, "epoch": 2818} {"train_loss": -44.657989501953125, "global_step": 341021, "epoch": 2818} {"train_loss": -44.71059799194336, "global_step": 341022, "epoch": 2818} {"train_loss": -44.81182861328125, "global_step": 341023, "epoch": 2818} {"train_loss": -44.652015686035156, "global_step": 341024, "epoch": 2818} {"train_loss": -44.504310607910156, "global_step": 341025, "epoch": 2818} {"train_loss": -44.75849151611328, "global_step": 341026, "epoch": 2818} {"train_loss": -44.62915802001953, "global_step": 341027, "epoch": 2818} {"train_loss": -44.371158599853516, "global_step": 341028, "epoch": 2818} {"train_loss": -45.265594482421875, "global_step": 341029, "epoch": 2818} {"train_loss": -45.18452072143555, "global_step": 341030, "epoch": 2818} {"train_loss": -44.566497802734375, "global_step": 341031, "epoch": 2818} {"train_loss": -44.38332748413086, "global_step": 341032, "epoch": 2818} {"train_loss": -44.63043212890625, "global_step": 341033, "epoch": 2818} {"train_loss": -44.05788803100586, "global_step": 341034, "epoch": 2818} {"train_loss": -44.17817687988281, "global_step": 341035, "epoch": 2818} {"train_loss": -44.666015625, "global_step": 341036, "epoch": 2818} {"train_loss": -43.9622802734375, "global_step": 341037, "epoch": 2818} {"train_loss": -45.25165939331055, "global_step": 341038, "epoch": 2818} {"train_loss": -44.464054107666016, "global_step": 341039, "epoch": 2818} {"train_loss": -44.898170471191406, "global_step": 341040, "epoch": 2818} {"train_loss": -45.50429916381836, "global_step": 341041, "epoch": 2818} {"train_loss": -45.03498458862305, "global_step": 341042, "epoch": 2818} {"train_loss": -44.246395111083984, "global_step": 341043, "epoch": 2818} {"train_loss": -45.47810363769531, "global_step": 341044, "epoch": 2818} {"train_loss": -44.45051574707031, "global_step": 341045, "epoch": 2818} {"train_loss": -44.87782287597656, "global_step": 341046, "epoch": 2818} {"train_loss": -44.98268508911133, "global_step": 341047, "epoch": 2818} {"train_loss": -44.71479415893555, "global_step": 341048, "epoch": 2818} {"train_loss": -45.30105209350586, "global_step": 341049, "epoch": 2818} {"train_loss": -44.90210723876953, "global_step": 341050, "epoch": 2818} {"train_loss": -44.14325714111328, "global_step": 341051, "epoch": 2818} {"train_loss": -44.78895950317383, "global_step": 341052, "epoch": 2818} {"train_loss": -44.98249435424805, "global_step": 341053, "epoch": 2818} {"train_loss": -44.00117111206055, "global_step": 341054, "epoch": 2818} {"train_loss": -44.005638122558594, "global_step": 341055, "epoch": 2818} {"train_loss": -44.14629364013672, "global_step": 341056, "epoch": 2818} {"train_loss": -44.70827865600586, "global_step": 341057, "epoch": 2818} {"train_loss": -45.47854232788086, "global_step": 341058, "epoch": 2818} {"train_loss": -44.83074951171875, "global_step": 341059, "epoch": 2818} {"train_loss": -44.456703186035156, "global_step": 341060, "epoch": 2818} {"train_loss": -45.4651985168457, "global_step": 341061, "epoch": 2818} {"train_loss": -45.33036422729492, "global_step": 341062, "epoch": 2818} {"train_loss": -45.3310546875, "global_step": 341063, "epoch": 2818} {"train_loss": -44.44192123413086, "global_step": 341064, "epoch": 2818} {"train_loss": -43.7731819152832, "global_step": 341065, "epoch": 2818} {"train_loss": -45.0347900390625, "global_step": 341066, "epoch": 2818} {"train_loss": -44.915061950683594, "global_step": 341067, "epoch": 2818} {"train_loss": -45.353084564208984, "global_step": 341068, "epoch": 2818} {"train_loss": -44.592891693115234, "global_step": 341069, "epoch": 2818} {"train_loss": -44.36753463745117, "global_step": 341070, "epoch": 2818} {"train_loss": -44.624549865722656, "global_step": 341071, "epoch": 2818} {"train_loss": -44.8079948425293, "global_step": 341072, "epoch": 2818} {"train_loss": -44.19880294799805, "global_step": 341073, "epoch": 2818} {"train_loss": -43.10520553588867, "global_step": 341074, "epoch": 2818} {"train_loss": -44.66215515136719, "global_step": 341075, "epoch": 2818} {"train_loss": -45.63859558105469, "global_step": 341076, "epoch": 2818} {"train_loss": -45.29104232788086, "global_step": 341077, "epoch": 2818} {"train_loss": -45.34315872192383, "global_step": 341078, "epoch": 2818} {"train_loss": -45.39302444458008, "global_step": 341079, "epoch": 2818} {"train_loss": -44.8277702331543, "global_step": 341080, "epoch": 2818} {"train_loss": -43.791542053222656, "global_step": 341081, "epoch": 2818} {"train_loss": -44.96023941040039, "global_step": 341082, "epoch": 2818} {"train_loss": -44.73008346557617, "global_step": 341083, "epoch": 2818} {"train_loss": -44.617000579833984, "global_step": 341084, "epoch": 2818} {"train_loss": -44.96480941772461, "global_step": 341085, "epoch": 2818} {"train_loss": -44.561641693115234, "global_step": 341086, "epoch": 2818} {"train_loss": -45.052833557128906, "global_step": 341087, "epoch": 2818} {"train_loss": -44.13693618774414, "global_step": 341088, "epoch": 2818} {"train_loss": -45.20246124267578, "global_step": 341089, "epoch": 2818} {"train_loss": -45.21395492553711, "global_step": 341090, "epoch": 2818} {"train_loss": -43.17951583862305, "global_step": 341091, "epoch": 2818} {"train_loss": -43.925106048583984, "global_step": 341092, "epoch": 2818} {"train_loss": -44.600215911865234, "global_step": 341093, "epoch": 2818} {"train_loss": -41.25291442871094, "global_step": 341094, "epoch": 2818} {"train_loss": -43.32259750366211, "global_step": 341095, "epoch": 2818} {"train_loss": -42.11371612548828, "global_step": 341096, "epoch": 2818} {"train_loss": -42.058223724365234, "global_step": 341097, "epoch": 2818} {"train_loss": -44.355243209964975, "global_step": 341098, "epoch": 2818, "val_loss": 2612932.75} {"train_loss": -43.8411750793457, "global_step": 341099, "epoch": 2819} {"train_loss": -43.430816650390625, "global_step": 341100, "epoch": 2819} {"train_loss": -40.94586181640625, "global_step": 341101, "epoch": 2819} {"train_loss": -43.195159912109375, "global_step": 341102, "epoch": 2819} {"train_loss": -43.22214126586914, "global_step": 341103, "epoch": 2819} {"train_loss": -41.9548454284668, "global_step": 341104, "epoch": 2819} {"train_loss": -43.89724349975586, "global_step": 341105, "epoch": 2819} {"train_loss": -43.54636764526367, "global_step": 341106, "epoch": 2819} {"train_loss": -43.70304489135742, "global_step": 341107, "epoch": 2819} {"train_loss": -41.30355453491211, "global_step": 341108, "epoch": 2819} {"train_loss": -43.83457565307617, "global_step": 341109, "epoch": 2819} {"train_loss": -40.234920501708984, "global_step": 341110, "epoch": 2819} {"train_loss": -42.2356071472168, "global_step": 341111, "epoch": 2819} {"train_loss": -39.67086410522461, "global_step": 341112, "epoch": 2819} {"train_loss": -41.109283447265625, "global_step": 341113, "epoch": 2819} {"train_loss": -42.037933349609375, "global_step": 341114, "epoch": 2819} {"train_loss": -41.47555160522461, "global_step": 341115, "epoch": 2819} {"train_loss": -43.27178955078125, "global_step": 341116, "epoch": 2819} {"train_loss": -42.87092971801758, "global_step": 341117, "epoch": 2819} {"train_loss": -43.043270111083984, "global_step": 341118, "epoch": 2819} {"train_loss": -43.60719680786133, "global_step": 341119, "epoch": 2819} {"train_loss": -43.116207122802734, "global_step": 341120, "epoch": 2819} {"train_loss": -43.984920501708984, "global_step": 341121, "epoch": 2819} {"train_loss": -42.43289566040039, "global_step": 341122, "epoch": 2819} {"train_loss": -43.560394287109375, "global_step": 341123, "epoch": 2819} {"train_loss": -42.06452560424805, "global_step": 341124, "epoch": 2819} {"train_loss": -43.76287841796875, "global_step": 341125, "epoch": 2819} {"train_loss": -42.750404357910156, "global_step": 341126, "epoch": 2819} {"train_loss": -43.196781158447266, "global_step": 341127, "epoch": 2819} {"train_loss": -43.066463470458984, "global_step": 341128, "epoch": 2819} {"train_loss": -43.93596649169922, "global_step": 341129, "epoch": 2819} {"train_loss": -44.1140251159668, "global_step": 341130, "epoch": 2819} {"train_loss": -42.83189010620117, "global_step": 341131, "epoch": 2819} {"train_loss": -43.96062088012695, "global_step": 341132, "epoch": 2819} {"train_loss": -43.814208984375, "global_step": 341133, "epoch": 2819} {"train_loss": -43.95920944213867, "global_step": 341134, "epoch": 2819} {"train_loss": -43.864990234375, "global_step": 341135, "epoch": 2819} {"train_loss": -43.88789749145508, "global_step": 341136, "epoch": 2819} {"train_loss": -43.542598724365234, "global_step": 341137, "epoch": 2819} {"train_loss": -43.081607818603516, "global_step": 341138, "epoch": 2819} {"train_loss": -44.16538619995117, "global_step": 341139, "epoch": 2819} {"train_loss": -43.752227783203125, "global_step": 341140, "epoch": 2819} {"train_loss": -43.143917083740234, "global_step": 341141, "epoch": 2819} {"train_loss": -44.308067321777344, "global_step": 341142, "epoch": 2819} {"train_loss": -43.69987106323242, "global_step": 341143, "epoch": 2819} {"train_loss": -43.755287170410156, "global_step": 341144, "epoch": 2819} {"train_loss": -43.90095520019531, "global_step": 341145, "epoch": 2819} {"train_loss": -44.21271514892578, "global_step": 341146, "epoch": 2819} {"train_loss": -44.06700134277344, "global_step": 341147, "epoch": 2819} {"train_loss": -44.475677490234375, "global_step": 341148, "epoch": 2819} {"train_loss": -44.47874069213867, "global_step": 341149, "epoch": 2819} {"train_loss": -44.30548858642578, "global_step": 341150, "epoch": 2819} {"train_loss": -44.43024826049805, "global_step": 341151, "epoch": 2819} {"train_loss": -44.80876541137695, "global_step": 341152, "epoch": 2819} {"train_loss": -44.42452621459961, "global_step": 341153, "epoch": 2819} {"train_loss": -44.48221969604492, "global_step": 341154, "epoch": 2819} {"train_loss": -43.89539337158203, "global_step": 341155, "epoch": 2819} {"train_loss": -44.29874801635742, "global_step": 341156, "epoch": 2819} {"train_loss": -44.4174690246582, "global_step": 341157, "epoch": 2819} {"train_loss": -44.7119140625, "global_step": 341158, "epoch": 2819} {"train_loss": -44.237667083740234, "global_step": 341159, "epoch": 2819} {"train_loss": -44.42707824707031, "global_step": 341160, "epoch": 2819} {"train_loss": -44.52333450317383, "global_step": 341161, "epoch": 2819} {"train_loss": -44.7760009765625, "global_step": 341162, "epoch": 2819} {"train_loss": -44.81968307495117, "global_step": 341163, "epoch": 2819} {"train_loss": -44.707576751708984, "global_step": 341164, "epoch": 2819} {"train_loss": -44.83232498168945, "global_step": 341165, "epoch": 2819} {"train_loss": -45.1965446472168, "global_step": 341166, "epoch": 2819} {"train_loss": -45.00643539428711, "global_step": 341167, "epoch": 2819} {"train_loss": -44.929237365722656, "global_step": 341168, "epoch": 2819} {"train_loss": -44.482601165771484, "global_step": 341169, "epoch": 2819} {"train_loss": -45.143890380859375, "global_step": 341170, "epoch": 2819} {"train_loss": -45.6490592956543, "global_step": 341171, "epoch": 2819} {"train_loss": -44.786537170410156, "global_step": 341172, "epoch": 2819} {"train_loss": -45.14735412597656, "global_step": 341173, "epoch": 2819} {"train_loss": -45.52314376831055, "global_step": 341174, "epoch": 2819} {"train_loss": -44.88418197631836, "global_step": 341175, "epoch": 2819} {"train_loss": -45.20591354370117, "global_step": 341176, "epoch": 2819} {"train_loss": -45.1303825378418, "global_step": 341177, "epoch": 2819} {"train_loss": -44.9075927734375, "global_step": 341178, "epoch": 2819} {"train_loss": -44.98706817626953, "global_step": 341179, "epoch": 2819} {"train_loss": -45.149810791015625, "global_step": 341180, "epoch": 2819} {"train_loss": -45.45813751220703, "global_step": 341181, "epoch": 2819} {"train_loss": -44.643638610839844, "global_step": 341182, "epoch": 2819} {"train_loss": -45.32088088989258, "global_step": 341183, "epoch": 2819} {"train_loss": -45.33502197265625, "global_step": 341184, "epoch": 2819} {"train_loss": -45.069461822509766, "global_step": 341185, "epoch": 2819} {"train_loss": -45.181007385253906, "global_step": 341186, "epoch": 2819} {"train_loss": -45.56505584716797, "global_step": 341187, "epoch": 2819} {"train_loss": -45.50886917114258, "global_step": 341188, "epoch": 2819} {"train_loss": -45.45442199707031, "global_step": 341189, "epoch": 2819} {"train_loss": -45.5792236328125, "global_step": 341190, "epoch": 2819} {"train_loss": -45.39044952392578, "global_step": 341191, "epoch": 2819} {"train_loss": -45.77961349487305, "global_step": 341192, "epoch": 2819} {"train_loss": -45.59822082519531, "global_step": 341193, "epoch": 2819} {"train_loss": -45.7276496887207, "global_step": 341194, "epoch": 2819} {"train_loss": -45.54427719116211, "global_step": 341195, "epoch": 2819} {"train_loss": -45.781734466552734, "global_step": 341196, "epoch": 2819} {"train_loss": -45.35096740722656, "global_step": 341197, "epoch": 2819} {"train_loss": -45.46857833862305, "global_step": 341198, "epoch": 2819} {"train_loss": -45.45549392700195, "global_step": 341199, "epoch": 2819} {"train_loss": -46.04758071899414, "global_step": 341200, "epoch": 2819} {"train_loss": -46.06207275390625, "global_step": 341201, "epoch": 2819} {"train_loss": -45.711761474609375, "global_step": 341202, "epoch": 2819} {"train_loss": -45.538082122802734, "global_step": 341203, "epoch": 2819} {"train_loss": -45.37850570678711, "global_step": 341204, "epoch": 2819} {"train_loss": -44.86925506591797, "global_step": 341205, "epoch": 2819} {"train_loss": -45.83487319946289, "global_step": 341206, "epoch": 2819} {"train_loss": -45.92990493774414, "global_step": 341207, "epoch": 2819} {"train_loss": -45.581756591796875, "global_step": 341208, "epoch": 2819} {"train_loss": -45.039527893066406, "global_step": 341209, "epoch": 2819} {"train_loss": -45.70310592651367, "global_step": 341210, "epoch": 2819} {"train_loss": -45.9091796875, "global_step": 341211, "epoch": 2819} {"train_loss": -45.49941635131836, "global_step": 341212, "epoch": 2819} {"train_loss": -45.118221282958984, "global_step": 341213, "epoch": 2819} {"train_loss": -43.94647216796875, "global_step": 341214, "epoch": 2819} {"train_loss": -42.8183479309082, "global_step": 341215, "epoch": 2819} {"train_loss": -44.24081039428711, "global_step": 341216, "epoch": 2819} {"train_loss": -45.07627868652344, "global_step": 341217, "epoch": 2819} {"train_loss": -44.76536178588867, "global_step": 341218, "epoch": 2819} {"train_loss": -44.26258796502736, "global_step": 341219, "epoch": 2819, "val_loss": 2663146.5} {"train_loss": -42.781028747558594, "global_step": 341220, "epoch": 2820} {"train_loss": -44.32353591918945, "global_step": 341221, "epoch": 2820} {"train_loss": -45.306949615478516, "global_step": 341222, "epoch": 2820} {"train_loss": -44.0588264465332, "global_step": 341223, "epoch": 2820} {"train_loss": -44.294918060302734, "global_step": 341224, "epoch": 2820} {"train_loss": -45.177406311035156, "global_step": 341225, "epoch": 2820} {"train_loss": -44.289276123046875, "global_step": 341226, "epoch": 2820} {"train_loss": -44.54864501953125, "global_step": 341227, "epoch": 2820} {"train_loss": -44.9322624206543, "global_step": 341228, "epoch": 2820} {"train_loss": -42.814510345458984, "global_step": 341229, "epoch": 2820} {"train_loss": -41.7855339050293, "global_step": 341230, "epoch": 2820} {"train_loss": -44.65009689331055, "global_step": 341231, "epoch": 2820} {"train_loss": -39.98649215698242, "global_step": 341232, "epoch": 2820} {"train_loss": -44.49994659423828, "global_step": 341233, "epoch": 2820} {"train_loss": -42.07719039916992, "global_step": 341234, "epoch": 2820} {"train_loss": -44.529518127441406, "global_step": 341235, "epoch": 2820} {"train_loss": -44.55121994018555, "global_step": 341236, "epoch": 2820} {"train_loss": -43.9604377746582, "global_step": 341237, "epoch": 2820} {"train_loss": -44.261260986328125, "global_step": 341238, "epoch": 2820} {"train_loss": -44.21357345581055, "global_step": 341239, "epoch": 2820} {"train_loss": -43.9774169921875, "global_step": 341240, "epoch": 2820} {"train_loss": -43.002227783203125, "global_step": 341241, "epoch": 2820} {"train_loss": -44.59626770019531, "global_step": 341242, "epoch": 2820} {"train_loss": -43.82270050048828, "global_step": 341243, "epoch": 2820} {"train_loss": -44.204673767089844, "global_step": 341244, "epoch": 2820} {"train_loss": -44.5798225402832, "global_step": 341245, "epoch": 2820} {"train_loss": -43.721282958984375, "global_step": 341246, "epoch": 2820} {"train_loss": -43.48029327392578, "global_step": 341247, "epoch": 2820} {"train_loss": -44.18902587890625, "global_step": 341248, "epoch": 2820} {"train_loss": -42.916015625, "global_step": 341249, "epoch": 2820} {"train_loss": -42.57846450805664, "global_step": 341250, "epoch": 2820} {"train_loss": -44.3203125, "global_step": 341251, "epoch": 2820} {"train_loss": -43.70014572143555, "global_step": 341252, "epoch": 2820} {"train_loss": -42.59973907470703, "global_step": 341253, "epoch": 2820} {"train_loss": -44.167381286621094, "global_step": 341254, "epoch": 2820} {"train_loss": -44.226802825927734, "global_step": 341255, "epoch": 2820} {"train_loss": -43.910858154296875, "global_step": 341256, "epoch": 2820} {"train_loss": -43.94337844848633, "global_step": 341257, "epoch": 2820} {"train_loss": -44.51864242553711, "global_step": 341258, "epoch": 2820} {"train_loss": -43.56669998168945, "global_step": 341259, "epoch": 2820} {"train_loss": -43.81549835205078, "global_step": 341260, "epoch": 2820} {"train_loss": -44.04534912109375, "global_step": 341261, "epoch": 2820} {"train_loss": -44.393768310546875, "global_step": 341262, "epoch": 2820} {"train_loss": -44.45812225341797, "global_step": 341263, "epoch": 2820} {"train_loss": -44.62087631225586, "global_step": 341264, "epoch": 2820} {"train_loss": -44.54443359375, "global_step": 341265, "epoch": 2820} {"train_loss": -44.88410949707031, "global_step": 341266, "epoch": 2820} {"train_loss": -43.69611358642578, "global_step": 341267, "epoch": 2820} {"train_loss": -44.24802017211914, "global_step": 341268, "epoch": 2820} {"train_loss": -44.66614532470703, "global_step": 341269, "epoch": 2820} {"train_loss": -43.777523040771484, "global_step": 341270, "epoch": 2820} {"train_loss": -43.4527587890625, "global_step": 341271, "epoch": 2820} {"train_loss": -45.28586959838867, "global_step": 341272, "epoch": 2820} {"train_loss": -43.88199234008789, "global_step": 341273, "epoch": 2820} {"train_loss": -44.48752975463867, "global_step": 341274, "epoch": 2820} {"train_loss": -44.46205520629883, "global_step": 341275, "epoch": 2820} {"train_loss": -44.73334503173828, "global_step": 341276, "epoch": 2820} {"train_loss": -44.8932991027832, "global_step": 341277, "epoch": 2820} {"train_loss": -44.28921127319336, "global_step": 341278, "epoch": 2820} {"train_loss": -44.2899284362793, "global_step": 341279, "epoch": 2820} {"train_loss": -45.045040130615234, "global_step": 341280, "epoch": 2820} {"train_loss": -45.30085372924805, "global_step": 341281, "epoch": 2820} {"train_loss": -44.964576721191406, "global_step": 341282, "epoch": 2820} {"train_loss": -44.82041549682617, "global_step": 341283, "epoch": 2820} {"train_loss": -44.327392578125, "global_step": 341284, "epoch": 2820} {"train_loss": -44.53580856323242, "global_step": 341285, "epoch": 2820} {"train_loss": -45.24416732788086, "global_step": 341286, "epoch": 2820} {"train_loss": -43.785457611083984, "global_step": 341287, "epoch": 2820} {"train_loss": -43.897216796875, "global_step": 341288, "epoch": 2820} {"train_loss": -44.783504486083984, "global_step": 341289, "epoch": 2820} {"train_loss": -44.503265380859375, "global_step": 341290, "epoch": 2820} {"train_loss": -44.626060485839844, "global_step": 341291, "epoch": 2820} {"train_loss": -45.063209533691406, "global_step": 341292, "epoch": 2820} {"train_loss": -44.57354736328125, "global_step": 341293, "epoch": 2820} {"train_loss": -44.50109100341797, "global_step": 341294, "epoch": 2820} {"train_loss": -44.876373291015625, "global_step": 341295, "epoch": 2820} {"train_loss": -44.23336410522461, "global_step": 341296, "epoch": 2820} {"train_loss": -44.723052978515625, "global_step": 341297, "epoch": 2820} {"train_loss": -43.72593307495117, "global_step": 341298, "epoch": 2820} {"train_loss": -42.32378005981445, "global_step": 341299, "epoch": 2820} {"train_loss": -43.300045013427734, "global_step": 341300, "epoch": 2820} {"train_loss": -44.52880859375, "global_step": 341301, "epoch": 2820} {"train_loss": -45.07392501831055, "global_step": 341302, "epoch": 2820} {"train_loss": -44.634605407714844, "global_step": 341303, "epoch": 2820} {"train_loss": -44.43781280517578, "global_step": 341304, "epoch": 2820} {"train_loss": -44.933753967285156, "global_step": 341305, "epoch": 2820} {"train_loss": -45.26863098144531, "global_step": 341306, "epoch": 2820} {"train_loss": -44.53641891479492, "global_step": 341307, "epoch": 2820} {"train_loss": -44.18899154663086, "global_step": 341308, "epoch": 2820} {"train_loss": -44.89583969116211, "global_step": 341309, "epoch": 2820} {"train_loss": -44.11819076538086, "global_step": 341310, "epoch": 2820} {"train_loss": -43.557884216308594, "global_step": 341311, "epoch": 2820} {"train_loss": -44.56525802612305, "global_step": 341312, "epoch": 2820} {"train_loss": -45.179718017578125, "global_step": 341313, "epoch": 2820} {"train_loss": -44.935184478759766, "global_step": 341314, "epoch": 2820} {"train_loss": -45.17684555053711, "global_step": 341315, "epoch": 2820} {"train_loss": -44.53980255126953, "global_step": 341316, "epoch": 2820} {"train_loss": -44.721187591552734, "global_step": 341317, "epoch": 2820} {"train_loss": -43.984375, "global_step": 341318, "epoch": 2820} {"train_loss": -44.2575798034668, "global_step": 341319, "epoch": 2820} {"train_loss": -44.53602981567383, "global_step": 341320, "epoch": 2820} {"train_loss": -43.298858642578125, "global_step": 341321, "epoch": 2820} {"train_loss": -44.560882568359375, "global_step": 341322, "epoch": 2820} {"train_loss": -44.747596740722656, "global_step": 341323, "epoch": 2820} {"train_loss": -44.60683822631836, "global_step": 341324, "epoch": 2820} {"train_loss": -45.233642578125, "global_step": 341325, "epoch": 2820} {"train_loss": -44.727718353271484, "global_step": 341326, "epoch": 2820} {"train_loss": -44.5228157043457, "global_step": 341327, "epoch": 2820} {"train_loss": -44.617183685302734, "global_step": 341328, "epoch": 2820} {"train_loss": -44.412628173828125, "global_step": 341329, "epoch": 2820} {"train_loss": -44.83856964111328, "global_step": 341330, "epoch": 2820} {"train_loss": -44.93365478515625, "global_step": 341331, "epoch": 2820} {"train_loss": -44.491512298583984, "global_step": 341332, "epoch": 2820} {"train_loss": -43.292694091796875, "global_step": 341333, "epoch": 2820} {"train_loss": -44.9173469543457, "global_step": 341334, "epoch": 2820} {"train_loss": -43.063568115234375, "global_step": 341335, "epoch": 2820} {"train_loss": -44.325584411621094, "global_step": 341336, "epoch": 2820} {"train_loss": -44.79957962036133, "global_step": 341337, "epoch": 2820} {"train_loss": -44.942848205566406, "global_step": 341338, "epoch": 2820} {"train_loss": -45.16020202636719, "global_step": 341339, "epoch": 2820} {"train_loss": -44.25439055892062, "global_step": 341340, "epoch": 2820, "val_loss": 2584340.25} {"train_loss": -45.04486083984375, "global_step": 341341, "epoch": 2821} {"train_loss": -44.181297302246094, "global_step": 341342, "epoch": 2821} {"train_loss": -44.360206604003906, "global_step": 341343, "epoch": 2821} {"train_loss": -45.06269454956055, "global_step": 341344, "epoch": 2821} {"train_loss": -43.091609954833984, "global_step": 341345, "epoch": 2821} {"train_loss": -44.374385833740234, "global_step": 341346, "epoch": 2821} {"train_loss": -45.200931549072266, "global_step": 341347, "epoch": 2821} {"train_loss": -44.0330924987793, "global_step": 341348, "epoch": 2821} {"train_loss": -44.571998596191406, "global_step": 341349, "epoch": 2821} {"train_loss": -44.32350540161133, "global_step": 341350, "epoch": 2821} {"train_loss": -45.19790267944336, "global_step": 341351, "epoch": 2821} {"train_loss": -45.198150634765625, "global_step": 341352, "epoch": 2821} {"train_loss": -44.691890716552734, "global_step": 341353, "epoch": 2821} {"train_loss": -45.12822341918945, "global_step": 341354, "epoch": 2821} {"train_loss": -44.64480209350586, "global_step": 341355, "epoch": 2821} {"train_loss": -44.82358169555664, "global_step": 341356, "epoch": 2821} {"train_loss": -45.31427001953125, "global_step": 341357, "epoch": 2821} {"train_loss": -45.1809196472168, "global_step": 341358, "epoch": 2821} {"train_loss": -44.98775100708008, "global_step": 341359, "epoch": 2821} {"train_loss": -44.75711441040039, "global_step": 341360, "epoch": 2821} {"train_loss": -44.46828842163086, "global_step": 341361, "epoch": 2821} {"train_loss": -43.82114791870117, "global_step": 341362, "epoch": 2821} {"train_loss": -44.01479721069336, "global_step": 341363, "epoch": 2821} {"train_loss": -44.44501495361328, "global_step": 341364, "epoch": 2821} {"train_loss": -45.34572982788086, "global_step": 341365, "epoch": 2821} {"train_loss": -43.5904426574707, "global_step": 341366, "epoch": 2821} {"train_loss": -43.80125045776367, "global_step": 341367, "epoch": 2821} {"train_loss": -42.884639739990234, "global_step": 341368, "epoch": 2821} {"train_loss": -44.81892013549805, "global_step": 341369, "epoch": 2821} {"train_loss": -44.17262649536133, "global_step": 341370, "epoch": 2821} {"train_loss": -44.22516632080078, "global_step": 341371, "epoch": 2821} {"train_loss": -43.48277282714844, "global_step": 341372, "epoch": 2821} {"train_loss": -44.61452102661133, "global_step": 341373, "epoch": 2821} {"train_loss": -43.945228576660156, "global_step": 341374, "epoch": 2821} {"train_loss": -42.639930725097656, "global_step": 341375, "epoch": 2821} {"train_loss": -44.18045425415039, "global_step": 341376, "epoch": 2821} {"train_loss": -43.36322021484375, "global_step": 341377, "epoch": 2821} {"train_loss": -44.4610595703125, "global_step": 341378, "epoch": 2821} {"train_loss": -43.26231002807617, "global_step": 341379, "epoch": 2821} {"train_loss": -43.55077362060547, "global_step": 341380, "epoch": 2821} {"train_loss": -44.68337631225586, "global_step": 341381, "epoch": 2821} {"train_loss": -41.96196365356445, "global_step": 341382, "epoch": 2821} {"train_loss": -43.207454681396484, "global_step": 341383, "epoch": 2821} {"train_loss": -42.953792572021484, "global_step": 341384, "epoch": 2821} {"train_loss": -43.212730407714844, "global_step": 341385, "epoch": 2821} {"train_loss": -42.55884552001953, "global_step": 341386, "epoch": 2821} {"train_loss": -43.58303451538086, "global_step": 341387, "epoch": 2821} {"train_loss": -43.58955764770508, "global_step": 341388, "epoch": 2821} {"train_loss": -43.62388229370117, "global_step": 341389, "epoch": 2821} {"train_loss": -42.763511657714844, "global_step": 341390, "epoch": 2821} {"train_loss": -43.83005905151367, "global_step": 341391, "epoch": 2821} {"train_loss": -43.681739807128906, "global_step": 341392, "epoch": 2821} {"train_loss": -43.72418212890625, "global_step": 341393, "epoch": 2821} {"train_loss": -43.2662467956543, "global_step": 341394, "epoch": 2821} {"train_loss": -42.964141845703125, "global_step": 341395, "epoch": 2821} {"train_loss": -43.0286750793457, "global_step": 341396, "epoch": 2821} {"train_loss": -43.708980560302734, "global_step": 341397, "epoch": 2821} {"train_loss": -42.563140869140625, "global_step": 341398, "epoch": 2821} {"train_loss": -43.645423889160156, "global_step": 341399, "epoch": 2821} {"train_loss": -43.10075759887695, "global_step": 341400, "epoch": 2821} {"train_loss": -44.173580169677734, "global_step": 341401, "epoch": 2821} {"train_loss": -44.25521469116211, "global_step": 341402, "epoch": 2821} {"train_loss": -42.68272018432617, "global_step": 341403, "epoch": 2821} {"train_loss": -44.4096794128418, "global_step": 341404, "epoch": 2821} {"train_loss": -44.23065948486328, "global_step": 341405, "epoch": 2821} {"train_loss": -42.93207550048828, "global_step": 341406, "epoch": 2821} {"train_loss": -44.39166259765625, "global_step": 341407, "epoch": 2821} {"train_loss": -43.165992736816406, "global_step": 341408, "epoch": 2821} {"train_loss": -43.10932159423828, "global_step": 341409, "epoch": 2821} {"train_loss": -44.447147369384766, "global_step": 341410, "epoch": 2821} {"train_loss": -43.640724182128906, "global_step": 341411, "epoch": 2821} {"train_loss": -44.920265197753906, "global_step": 341412, "epoch": 2821} {"train_loss": -44.227394104003906, "global_step": 341413, "epoch": 2821} {"train_loss": -44.50809860229492, "global_step": 341414, "epoch": 2821} {"train_loss": -44.53504180908203, "global_step": 341415, "epoch": 2821} {"train_loss": -44.64797592163086, "global_step": 341416, "epoch": 2821} {"train_loss": -44.95558166503906, "global_step": 341417, "epoch": 2821} {"train_loss": -44.38212585449219, "global_step": 341418, "epoch": 2821} {"train_loss": -44.821163177490234, "global_step": 341419, "epoch": 2821} {"train_loss": -44.34141540527344, "global_step": 341420, "epoch": 2821} {"train_loss": -44.76011657714844, "global_step": 341421, "epoch": 2821} {"train_loss": -45.20967102050781, "global_step": 341422, "epoch": 2821} {"train_loss": -44.38987350463867, "global_step": 341423, "epoch": 2821} {"train_loss": -44.84947204589844, "global_step": 341424, "epoch": 2821} {"train_loss": -44.80294418334961, "global_step": 341425, "epoch": 2821} {"train_loss": -44.65082931518555, "global_step": 341426, "epoch": 2821} {"train_loss": -45.3489875793457, "global_step": 341427, "epoch": 2821} {"train_loss": -44.74109649658203, "global_step": 341428, "epoch": 2821} {"train_loss": -44.61099624633789, "global_step": 341429, "epoch": 2821} {"train_loss": -45.38312911987305, "global_step": 341430, "epoch": 2821} {"train_loss": -44.450294494628906, "global_step": 341431, "epoch": 2821} {"train_loss": -45.15951156616211, "global_step": 341432, "epoch": 2821} {"train_loss": -44.605384826660156, "global_step": 341433, "epoch": 2821} {"train_loss": -44.25506591796875, "global_step": 341434, "epoch": 2821} {"train_loss": -45.35112380981445, "global_step": 341435, "epoch": 2821} {"train_loss": -44.59922409057617, "global_step": 341436, "epoch": 2821} {"train_loss": -44.74250030517578, "global_step": 341437, "epoch": 2821} {"train_loss": -45.1290397644043, "global_step": 341438, "epoch": 2821} {"train_loss": -44.02571105957031, "global_step": 341439, "epoch": 2821} {"train_loss": -45.32121276855469, "global_step": 341440, "epoch": 2821} {"train_loss": -44.477935791015625, "global_step": 341441, "epoch": 2821} {"train_loss": -43.96391296386719, "global_step": 341442, "epoch": 2821} {"train_loss": -45.228363037109375, "global_step": 341443, "epoch": 2821} {"train_loss": -45.26072311401367, "global_step": 341444, "epoch": 2821} {"train_loss": -45.10885238647461, "global_step": 341445, "epoch": 2821} {"train_loss": -44.872894287109375, "global_step": 341446, "epoch": 2821} {"train_loss": -45.035491943359375, "global_step": 341447, "epoch": 2821} {"train_loss": -45.42383575439453, "global_step": 341448, "epoch": 2821} {"train_loss": -45.51218795776367, "global_step": 341449, "epoch": 2821} {"train_loss": -45.041839599609375, "global_step": 341450, "epoch": 2821} {"train_loss": -45.65327835083008, "global_step": 341451, "epoch": 2821} {"train_loss": -44.95917892456055, "global_step": 341452, "epoch": 2821} {"train_loss": -45.5048713684082, "global_step": 341453, "epoch": 2821} {"train_loss": -45.86914825439453, "global_step": 341454, "epoch": 2821} {"train_loss": -45.088253021240234, "global_step": 341455, "epoch": 2821} {"train_loss": -45.22158432006836, "global_step": 341456, "epoch": 2821} {"train_loss": -45.07318878173828, "global_step": 341457, "epoch": 2821} {"train_loss": -44.14911651611328, "global_step": 341458, "epoch": 2821} {"train_loss": -44.292598724365234, "global_step": 341459, "epoch": 2821} {"train_loss": -44.83356475830078, "global_step": 341460, "epoch": 2821} {"train_loss": -44.325036545430336, "global_step": 341461, "epoch": 2821, "val_loss": 2626765.25} {"train_loss": -45.08953857421875, "global_step": 341462, "epoch": 2822} {"train_loss": -43.96645736694336, "global_step": 341463, "epoch": 2822} {"train_loss": -43.97939682006836, "global_step": 341464, "epoch": 2822} {"train_loss": -43.92106246948242, "global_step": 341465, "epoch": 2822} {"train_loss": -44.7938117980957, "global_step": 341466, "epoch": 2822} {"train_loss": -43.8986701965332, "global_step": 341467, "epoch": 2822} {"train_loss": -42.96107482910156, "global_step": 341468, "epoch": 2822} {"train_loss": -43.92619705200195, "global_step": 341469, "epoch": 2822} {"train_loss": -44.831085205078125, "global_step": 341470, "epoch": 2822} {"train_loss": -44.572566986083984, "global_step": 341471, "epoch": 2822} {"train_loss": -44.21824264526367, "global_step": 341472, "epoch": 2822} {"train_loss": -42.81791305541992, "global_step": 341473, "epoch": 2822} {"train_loss": -45.352752685546875, "global_step": 341474, "epoch": 2822} {"train_loss": -42.948299407958984, "global_step": 341475, "epoch": 2822} {"train_loss": -44.210445404052734, "global_step": 341476, "epoch": 2822} {"train_loss": -44.821414947509766, "global_step": 341477, "epoch": 2822} {"train_loss": -43.20808029174805, "global_step": 341478, "epoch": 2822} {"train_loss": -44.2384147644043, "global_step": 341479, "epoch": 2822} {"train_loss": -43.4177131652832, "global_step": 341480, "epoch": 2822} {"train_loss": -44.39339828491211, "global_step": 341481, "epoch": 2822} {"train_loss": -44.601112365722656, "global_step": 341482, "epoch": 2822} {"train_loss": -43.97688674926758, "global_step": 341483, "epoch": 2822} {"train_loss": -45.03276062011719, "global_step": 341484, "epoch": 2822} {"train_loss": -44.9499397277832, "global_step": 341485, "epoch": 2822} {"train_loss": -44.76171875, "global_step": 341486, "epoch": 2822} {"train_loss": -44.57595443725586, "global_step": 341487, "epoch": 2822} {"train_loss": -44.72080993652344, "global_step": 341488, "epoch": 2822} {"train_loss": -44.966827392578125, "global_step": 341489, "epoch": 2822} {"train_loss": -44.6279182434082, "global_step": 341490, "epoch": 2822} {"train_loss": -44.896175384521484, "global_step": 341491, "epoch": 2822} {"train_loss": -44.43212127685547, "global_step": 341492, "epoch": 2822} {"train_loss": -45.13532638549805, "global_step": 341493, "epoch": 2822} {"train_loss": -45.3017463684082, "global_step": 341494, "epoch": 2822} {"train_loss": -45.39167404174805, "global_step": 341495, "epoch": 2822} {"train_loss": -44.795711517333984, "global_step": 341496, "epoch": 2822} {"train_loss": -45.36953353881836, "global_step": 341497, "epoch": 2822} {"train_loss": -45.11996841430664, "global_step": 341498, "epoch": 2822} {"train_loss": -45.446956634521484, "global_step": 341499, "epoch": 2822} {"train_loss": -45.60209274291992, "global_step": 341500, "epoch": 2822} {"train_loss": -45.021331787109375, "global_step": 341501, "epoch": 2822} {"train_loss": -45.333984375, "global_step": 341502, "epoch": 2822} {"train_loss": -44.842872619628906, "global_step": 341503, "epoch": 2822} {"train_loss": -45.06153869628906, "global_step": 341504, "epoch": 2822} {"train_loss": -45.655757904052734, "global_step": 341505, "epoch": 2822} {"train_loss": -44.85960006713867, "global_step": 341506, "epoch": 2822} {"train_loss": -44.14570236206055, "global_step": 341507, "epoch": 2822} {"train_loss": -44.57856369018555, "global_step": 341508, "epoch": 2822} {"train_loss": -45.296138763427734, "global_step": 341509, "epoch": 2822} {"train_loss": -43.751853942871094, "global_step": 341510, "epoch": 2822} {"train_loss": -42.950130462646484, "global_step": 341511, "epoch": 2822} {"train_loss": -44.82001495361328, "global_step": 341512, "epoch": 2822} {"train_loss": -44.01710891723633, "global_step": 341513, "epoch": 2822} {"train_loss": -44.62221908569336, "global_step": 341514, "epoch": 2822} {"train_loss": -44.705482482910156, "global_step": 341515, "epoch": 2822} {"train_loss": -44.786190032958984, "global_step": 341516, "epoch": 2822} {"train_loss": -44.92644119262695, "global_step": 341517, "epoch": 2822} {"train_loss": -44.91949462890625, "global_step": 341518, "epoch": 2822} {"train_loss": -44.14082717895508, "global_step": 341519, "epoch": 2822} {"train_loss": -44.17892074584961, "global_step": 341520, "epoch": 2822} {"train_loss": -45.080780029296875, "global_step": 341521, "epoch": 2822} {"train_loss": -44.68437576293945, "global_step": 341522, "epoch": 2822} {"train_loss": -44.408111572265625, "global_step": 341523, "epoch": 2822} {"train_loss": -44.86656951904297, "global_step": 341524, "epoch": 2822} {"train_loss": -44.3832893371582, "global_step": 341525, "epoch": 2822} {"train_loss": -44.939598083496094, "global_step": 341526, "epoch": 2822} {"train_loss": -44.742454528808594, "global_step": 341527, "epoch": 2822} {"train_loss": -44.738616943359375, "global_step": 341528, "epoch": 2822} {"train_loss": -44.86042785644531, "global_step": 341529, "epoch": 2822} {"train_loss": -45.078433990478516, "global_step": 341530, "epoch": 2822} {"train_loss": -44.50666427612305, "global_step": 341531, "epoch": 2822} {"train_loss": -44.63969802856445, "global_step": 341532, "epoch": 2822} {"train_loss": -44.50698471069336, "global_step": 341533, "epoch": 2822} {"train_loss": -44.29289245605469, "global_step": 341534, "epoch": 2822} {"train_loss": -44.61576461791992, "global_step": 341535, "epoch": 2822} {"train_loss": -45.02242660522461, "global_step": 341536, "epoch": 2822} {"train_loss": -44.41790771484375, "global_step": 341537, "epoch": 2822} {"train_loss": -44.892066955566406, "global_step": 341538, "epoch": 2822} {"train_loss": -44.73792266845703, "global_step": 341539, "epoch": 2822} {"train_loss": -43.32404327392578, "global_step": 341540, "epoch": 2822} {"train_loss": -44.42097091674805, "global_step": 341541, "epoch": 2822} {"train_loss": -43.47746658325195, "global_step": 341542, "epoch": 2822} {"train_loss": -44.4051513671875, "global_step": 341543, "epoch": 2822} {"train_loss": -44.72388458251953, "global_step": 341544, "epoch": 2822} {"train_loss": -43.28676986694336, "global_step": 341545, "epoch": 2822} {"train_loss": -43.92800521850586, "global_step": 341546, "epoch": 2822} {"train_loss": -44.455074310302734, "global_step": 341547, "epoch": 2822} {"train_loss": -44.15412139892578, "global_step": 341548, "epoch": 2822} {"train_loss": -45.431888580322266, "global_step": 341549, "epoch": 2822} {"train_loss": -44.572322845458984, "global_step": 341550, "epoch": 2822} {"train_loss": -44.35206985473633, "global_step": 341551, "epoch": 2822} {"train_loss": -43.90510940551758, "global_step": 341552, "epoch": 2822} {"train_loss": -44.7843017578125, "global_step": 341553, "epoch": 2822} {"train_loss": -45.04813003540039, "global_step": 341554, "epoch": 2822} {"train_loss": -44.84443283081055, "global_step": 341555, "epoch": 2822} {"train_loss": -44.3730583190918, "global_step": 341556, "epoch": 2822} {"train_loss": -44.78994369506836, "global_step": 341557, "epoch": 2822} {"train_loss": -45.10938262939453, "global_step": 341558, "epoch": 2822} {"train_loss": -43.7415771484375, "global_step": 341559, "epoch": 2822} {"train_loss": -45.02736282348633, "global_step": 341560, "epoch": 2822} {"train_loss": -45.18649673461914, "global_step": 341561, "epoch": 2822} {"train_loss": -44.0180549621582, "global_step": 341562, "epoch": 2822} {"train_loss": -44.0789794921875, "global_step": 341563, "epoch": 2822} {"train_loss": -44.75635528564453, "global_step": 341564, "epoch": 2822} {"train_loss": -44.76871109008789, "global_step": 341565, "epoch": 2822} {"train_loss": -44.55795669555664, "global_step": 341566, "epoch": 2822} {"train_loss": -43.8125114440918, "global_step": 341567, "epoch": 2822} {"train_loss": -44.49530792236328, "global_step": 341568, "epoch": 2822} {"train_loss": -45.173004150390625, "global_step": 341569, "epoch": 2822} {"train_loss": -44.307106018066406, "global_step": 341570, "epoch": 2822} {"train_loss": -44.645263671875, "global_step": 341571, "epoch": 2822} {"train_loss": -44.66727066040039, "global_step": 341572, "epoch": 2822} {"train_loss": -45.03119659423828, "global_step": 341573, "epoch": 2822} {"train_loss": -44.642459869384766, "global_step": 341574, "epoch": 2822} {"train_loss": -44.54204559326172, "global_step": 341575, "epoch": 2822} {"train_loss": -44.52382278442383, "global_step": 341576, "epoch": 2822} {"train_loss": -43.07393264770508, "global_step": 341577, "epoch": 2822} {"train_loss": -45.1778678894043, "global_step": 341578, "epoch": 2822} {"train_loss": -44.7321891784668, "global_step": 341579, "epoch": 2822} {"train_loss": -45.11233139038086, "global_step": 341580, "epoch": 2822} {"train_loss": -45.403934478759766, "global_step": 341581, "epoch": 2822} {"train_loss": -44.54645115876001, "global_step": 341582, "epoch": 2822, "val_loss": 2675305.25} {"train_loss": -44.050086975097656, "global_step": 341583, "epoch": 2823} {"train_loss": -44.383636474609375, "global_step": 341584, "epoch": 2823} {"train_loss": -43.98610305786133, "global_step": 341585, "epoch": 2823} {"train_loss": -45.31684494018555, "global_step": 341586, "epoch": 2823} {"train_loss": -45.75480270385742, "global_step": 341587, "epoch": 2823} {"train_loss": -44.154945373535156, "global_step": 341588, "epoch": 2823} {"train_loss": -44.888946533203125, "global_step": 341589, "epoch": 2823} {"train_loss": -45.07672119140625, "global_step": 341590, "epoch": 2823} {"train_loss": -45.49518585205078, "global_step": 341591, "epoch": 2823} {"train_loss": -44.48466873168945, "global_step": 341592, "epoch": 2823} {"train_loss": -44.17216873168945, "global_step": 341593, "epoch": 2823} {"train_loss": -44.8211669921875, "global_step": 341594, "epoch": 2823} {"train_loss": -44.0281982421875, "global_step": 341595, "epoch": 2823} {"train_loss": -44.19503402709961, "global_step": 341596, "epoch": 2823} {"train_loss": -44.79193115234375, "global_step": 341597, "epoch": 2823} {"train_loss": -44.48995590209961, "global_step": 341598, "epoch": 2823} {"train_loss": -45.43027877807617, "global_step": 341599, "epoch": 2823} {"train_loss": -44.448219299316406, "global_step": 341600, "epoch": 2823} {"train_loss": -45.07844161987305, "global_step": 341601, "epoch": 2823} {"train_loss": -44.07145309448242, "global_step": 341602, "epoch": 2823} {"train_loss": -44.644683837890625, "global_step": 341603, "epoch": 2823} {"train_loss": -45.27540969848633, "global_step": 341604, "epoch": 2823} {"train_loss": -43.923797607421875, "global_step": 341605, "epoch": 2823} {"train_loss": -43.09507369995117, "global_step": 341606, "epoch": 2823} {"train_loss": -45.149635314941406, "global_step": 341607, "epoch": 2823} {"train_loss": -44.13358688354492, "global_step": 341608, "epoch": 2823} {"train_loss": -43.01845932006836, "global_step": 341609, "epoch": 2823} {"train_loss": -44.264129638671875, "global_step": 341610, "epoch": 2823} {"train_loss": -42.89457321166992, "global_step": 341611, "epoch": 2823} {"train_loss": -44.287593841552734, "global_step": 341612, "epoch": 2823} {"train_loss": -45.03182601928711, "global_step": 341613, "epoch": 2823} {"train_loss": -44.06801986694336, "global_step": 341614, "epoch": 2823} {"train_loss": -44.19871139526367, "global_step": 341615, "epoch": 2823} {"train_loss": -43.9420280456543, "global_step": 341616, "epoch": 2823} {"train_loss": -44.219696044921875, "global_step": 341617, "epoch": 2823} {"train_loss": -44.12268829345703, "global_step": 341618, "epoch": 2823} {"train_loss": -44.13235855102539, "global_step": 341619, "epoch": 2823} {"train_loss": -44.30983352661133, "global_step": 341620, "epoch": 2823} {"train_loss": -44.383766174316406, "global_step": 341621, "epoch": 2823} {"train_loss": -44.55243682861328, "global_step": 341622, "epoch": 2823} {"train_loss": -44.68357467651367, "global_step": 341623, "epoch": 2823} {"train_loss": -44.509864807128906, "global_step": 341624, "epoch": 2823} {"train_loss": -44.455684661865234, "global_step": 341625, "epoch": 2823} {"train_loss": -43.43136215209961, "global_step": 341626, "epoch": 2823} {"train_loss": -43.27621078491211, "global_step": 341627, "epoch": 2823} {"train_loss": -43.14309310913086, "global_step": 341628, "epoch": 2823} {"train_loss": -42.54165267944336, "global_step": 341629, "epoch": 2823} {"train_loss": -43.2872200012207, "global_step": 341630, "epoch": 2823} {"train_loss": -43.46046829223633, "global_step": 341631, "epoch": 2823} {"train_loss": -43.639068603515625, "global_step": 341632, "epoch": 2823} {"train_loss": -43.62742233276367, "global_step": 341633, "epoch": 2823} {"train_loss": -44.47979736328125, "global_step": 341634, "epoch": 2823} {"train_loss": -44.42692947387695, "global_step": 341635, "epoch": 2823} {"train_loss": -44.6143798828125, "global_step": 341636, "epoch": 2823} {"train_loss": -44.21381378173828, "global_step": 341637, "epoch": 2823} {"train_loss": -44.472103118896484, "global_step": 341638, "epoch": 2823} {"train_loss": -44.791439056396484, "global_step": 341639, "epoch": 2823} {"train_loss": -45.10555648803711, "global_step": 341640, "epoch": 2823} {"train_loss": -44.13474655151367, "global_step": 341641, "epoch": 2823} {"train_loss": -45.335140228271484, "global_step": 341642, "epoch": 2823} {"train_loss": -45.227535247802734, "global_step": 341643, "epoch": 2823} {"train_loss": -43.855804443359375, "global_step": 341644, "epoch": 2823} {"train_loss": -44.81087875366211, "global_step": 341645, "epoch": 2823} {"train_loss": -44.636714935302734, "global_step": 341646, "epoch": 2823} {"train_loss": -44.44590377807617, "global_step": 341647, "epoch": 2823} {"train_loss": -44.68455505371094, "global_step": 341648, "epoch": 2823} {"train_loss": -44.91614532470703, "global_step": 341649, "epoch": 2823} {"train_loss": -45.00426483154297, "global_step": 341650, "epoch": 2823} {"train_loss": -44.91131591796875, "global_step": 341651, "epoch": 2823} {"train_loss": -45.178165435791016, "global_step": 341652, "epoch": 2823} {"train_loss": -45.20561599731445, "global_step": 341653, "epoch": 2823} {"train_loss": -45.241050720214844, "global_step": 341654, "epoch": 2823} {"train_loss": -45.27256393432617, "global_step": 341655, "epoch": 2823} {"train_loss": -45.366573333740234, "global_step": 341656, "epoch": 2823} {"train_loss": -45.23294448852539, "global_step": 341657, "epoch": 2823} {"train_loss": -45.97108459472656, "global_step": 341658, "epoch": 2823} {"train_loss": -45.484703063964844, "global_step": 341659, "epoch": 2823} {"train_loss": -45.8509635925293, "global_step": 341660, "epoch": 2823} {"train_loss": -45.5385856628418, "global_step": 341661, "epoch": 2823} {"train_loss": -45.706336975097656, "global_step": 341662, "epoch": 2823} {"train_loss": -45.7597541809082, "global_step": 341663, "epoch": 2823} {"train_loss": -45.781124114990234, "global_step": 341664, "epoch": 2823} {"train_loss": -45.40243911743164, "global_step": 341665, "epoch": 2823} {"train_loss": -45.775386810302734, "global_step": 341666, "epoch": 2823} {"train_loss": -45.25319290161133, "global_step": 341667, "epoch": 2823} {"train_loss": -45.654701232910156, "global_step": 341668, "epoch": 2823} {"train_loss": -44.86537551879883, "global_step": 341669, "epoch": 2823} {"train_loss": -45.21952819824219, "global_step": 341670, "epoch": 2823} {"train_loss": -44.93034744262695, "global_step": 341671, "epoch": 2823} {"train_loss": -43.89619064331055, "global_step": 341672, "epoch": 2823} {"train_loss": -42.92507553100586, "global_step": 341673, "epoch": 2823} {"train_loss": -44.0054931640625, "global_step": 341674, "epoch": 2823} {"train_loss": -44.59889221191406, "global_step": 341675, "epoch": 2823} {"train_loss": -42.884307861328125, "global_step": 341676, "epoch": 2823} {"train_loss": -44.72968292236328, "global_step": 341677, "epoch": 2823} {"train_loss": -44.309226989746094, "global_step": 341678, "epoch": 2823} {"train_loss": -43.38767623901367, "global_step": 341679, "epoch": 2823} {"train_loss": -42.9109001159668, "global_step": 341680, "epoch": 2823} {"train_loss": -42.941158294677734, "global_step": 341681, "epoch": 2823} {"train_loss": -45.08243942260742, "global_step": 341682, "epoch": 2823} {"train_loss": -44.27711868286133, "global_step": 341683, "epoch": 2823} {"train_loss": -43.2960319519043, "global_step": 341684, "epoch": 2823} {"train_loss": -43.71139144897461, "global_step": 341685, "epoch": 2823} {"train_loss": -44.9621467590332, "global_step": 341686, "epoch": 2823} {"train_loss": -44.04044723510742, "global_step": 341687, "epoch": 2823} {"train_loss": -44.06620407104492, "global_step": 341688, "epoch": 2823} {"train_loss": -43.993438720703125, "global_step": 341689, "epoch": 2823} {"train_loss": -44.258514404296875, "global_step": 341690, "epoch": 2823} {"train_loss": -43.53873062133789, "global_step": 341691, "epoch": 2823} {"train_loss": -44.98048782348633, "global_step": 341692, "epoch": 2823} {"train_loss": -44.280208587646484, "global_step": 341693, "epoch": 2823} {"train_loss": -43.997764587402344, "global_step": 341694, "epoch": 2823} {"train_loss": -44.36098861694336, "global_step": 341695, "epoch": 2823} {"train_loss": -44.81718826293945, "global_step": 341696, "epoch": 2823} {"train_loss": -44.89973831176758, "global_step": 341697, "epoch": 2823} {"train_loss": -44.090240478515625, "global_step": 341698, "epoch": 2823} {"train_loss": -44.67776107788086, "global_step": 341699, "epoch": 2823} {"train_loss": -44.92856216430664, "global_step": 341700, "epoch": 2823} {"train_loss": -44.608985900878906, "global_step": 341701, "epoch": 2823} {"train_loss": -44.31852722167969, "global_step": 341702, "epoch": 2823} {"train_loss": -44.46955288343193, "global_step": 341703, "epoch": 2823, "val_loss": 2649851.0} {"train_loss": -44.28933334350586, "global_step": 341704, "epoch": 2824} {"train_loss": -45.124412536621094, "global_step": 341705, "epoch": 2824} {"train_loss": -44.10383224487305, "global_step": 341706, "epoch": 2824} {"train_loss": -44.56361770629883, "global_step": 341707, "epoch": 2824} {"train_loss": -42.81244659423828, "global_step": 341708, "epoch": 2824} {"train_loss": -44.26671600341797, "global_step": 341709, "epoch": 2824} {"train_loss": -43.80934524536133, "global_step": 341710, "epoch": 2824} {"train_loss": -42.46371841430664, "global_step": 341711, "epoch": 2824} {"train_loss": -43.34925079345703, "global_step": 341712, "epoch": 2824} {"train_loss": -43.42985153198242, "global_step": 341713, "epoch": 2824} {"train_loss": -42.989227294921875, "global_step": 341714, "epoch": 2824} {"train_loss": -43.68421173095703, "global_step": 341715, "epoch": 2824} {"train_loss": -42.030059814453125, "global_step": 341716, "epoch": 2824} {"train_loss": -44.29591751098633, "global_step": 341717, "epoch": 2824} {"train_loss": -43.71037292480469, "global_step": 341718, "epoch": 2824} {"train_loss": -44.00934600830078, "global_step": 341719, "epoch": 2824} {"train_loss": -44.11090850830078, "global_step": 341720, "epoch": 2824} {"train_loss": -42.49936294555664, "global_step": 341721, "epoch": 2824} {"train_loss": -43.800716400146484, "global_step": 341722, "epoch": 2824} {"train_loss": -44.284950256347656, "global_step": 341723, "epoch": 2824} {"train_loss": -42.442840576171875, "global_step": 341724, "epoch": 2824} {"train_loss": -44.34547805786133, "global_step": 341725, "epoch": 2824} {"train_loss": -43.09751510620117, "global_step": 341726, "epoch": 2824} {"train_loss": -44.92300033569336, "global_step": 341727, "epoch": 2824} {"train_loss": -42.48786544799805, "global_step": 341728, "epoch": 2824} {"train_loss": -44.23495101928711, "global_step": 341729, "epoch": 2824} {"train_loss": -44.751953125, "global_step": 341730, "epoch": 2824} {"train_loss": -43.83522415161133, "global_step": 341731, "epoch": 2824} {"train_loss": -44.33134460449219, "global_step": 341732, "epoch": 2824} {"train_loss": -44.9718132019043, "global_step": 341733, "epoch": 2824} {"train_loss": -44.29106521606445, "global_step": 341734, "epoch": 2824} {"train_loss": -44.463966369628906, "global_step": 341735, "epoch": 2824} {"train_loss": -45.49763870239258, "global_step": 341736, "epoch": 2824} {"train_loss": -44.38092803955078, "global_step": 341737, "epoch": 2824} {"train_loss": -45.34920883178711, "global_step": 341738, "epoch": 2824} {"train_loss": -45.04708480834961, "global_step": 341739, "epoch": 2824} {"train_loss": -44.76535415649414, "global_step": 341740, "epoch": 2824} {"train_loss": -45.35050582885742, "global_step": 341741, "epoch": 2824} {"train_loss": -44.86707305908203, "global_step": 341742, "epoch": 2824} {"train_loss": -44.706363677978516, "global_step": 341743, "epoch": 2824} {"train_loss": -45.1411247253418, "global_step": 341744, "epoch": 2824} {"train_loss": -45.07222366333008, "global_step": 341745, "epoch": 2824} {"train_loss": -45.03544235229492, "global_step": 341746, "epoch": 2824} {"train_loss": -45.4015007019043, "global_step": 341747, "epoch": 2824} {"train_loss": -45.87423324584961, "global_step": 341748, "epoch": 2824} {"train_loss": -45.26266860961914, "global_step": 341749, "epoch": 2824} {"train_loss": -45.0832633972168, "global_step": 341750, "epoch": 2824} {"train_loss": -45.472137451171875, "global_step": 341751, "epoch": 2824} {"train_loss": -45.54975509643555, "global_step": 341752, "epoch": 2824} {"train_loss": -45.627742767333984, "global_step": 341753, "epoch": 2824} {"train_loss": -45.179595947265625, "global_step": 341754, "epoch": 2824} {"train_loss": -45.87028884887695, "global_step": 341755, "epoch": 2824} {"train_loss": -45.56596374511719, "global_step": 341756, "epoch": 2824} {"train_loss": -45.58492660522461, "global_step": 341757, "epoch": 2824} {"train_loss": -45.60934066772461, "global_step": 341758, "epoch": 2824} {"train_loss": -45.537471771240234, "global_step": 341759, "epoch": 2824} {"train_loss": -45.48055648803711, "global_step": 341760, "epoch": 2824} {"train_loss": -45.39585876464844, "global_step": 341761, "epoch": 2824} {"train_loss": -44.450477600097656, "global_step": 341762, "epoch": 2824} {"train_loss": -45.407752990722656, "global_step": 341763, "epoch": 2824} {"train_loss": -45.46482849121094, "global_step": 341764, "epoch": 2824} {"train_loss": -45.22036361694336, "global_step": 341765, "epoch": 2824} {"train_loss": -45.03330612182617, "global_step": 341766, "epoch": 2824} {"train_loss": -45.61317825317383, "global_step": 341767, "epoch": 2824} {"train_loss": -45.33629608154297, "global_step": 341768, "epoch": 2824} {"train_loss": -45.17060470581055, "global_step": 341769, "epoch": 2824} {"train_loss": -45.82448959350586, "global_step": 341770, "epoch": 2824} {"train_loss": -45.09391784667969, "global_step": 341771, "epoch": 2824} {"train_loss": -45.46759033203125, "global_step": 341772, "epoch": 2824} {"train_loss": -44.480953216552734, "global_step": 341773, "epoch": 2824} {"train_loss": -45.20053482055664, "global_step": 341774, "epoch": 2824} {"train_loss": -45.00645446777344, "global_step": 341775, "epoch": 2824} {"train_loss": -44.56766128540039, "global_step": 341776, "epoch": 2824} {"train_loss": -44.992950439453125, "global_step": 341777, "epoch": 2824} {"train_loss": -45.836822509765625, "global_step": 341778, "epoch": 2824} {"train_loss": -45.62559127807617, "global_step": 341779, "epoch": 2824} {"train_loss": -45.3203010559082, "global_step": 341780, "epoch": 2824} {"train_loss": -45.09011459350586, "global_step": 341781, "epoch": 2824} {"train_loss": -45.67350769042969, "global_step": 341782, "epoch": 2824} {"train_loss": -45.78391647338867, "global_step": 341783, "epoch": 2824} {"train_loss": -45.83281707763672, "global_step": 341784, "epoch": 2824} {"train_loss": -45.54354476928711, "global_step": 341785, "epoch": 2824} {"train_loss": -45.447933197021484, "global_step": 341786, "epoch": 2824} {"train_loss": -45.069454193115234, "global_step": 341787, "epoch": 2824} {"train_loss": -45.53430938720703, "global_step": 341788, "epoch": 2824} {"train_loss": -46.15232467651367, "global_step": 341789, "epoch": 2824} {"train_loss": -45.96967697143555, "global_step": 341790, "epoch": 2824} {"train_loss": -45.84830856323242, "global_step": 341791, "epoch": 2824} {"train_loss": -45.905853271484375, "global_step": 341792, "epoch": 2824} {"train_loss": -45.13541793823242, "global_step": 341793, "epoch": 2824} {"train_loss": -45.69650650024414, "global_step": 341794, "epoch": 2824} {"train_loss": -45.61090850830078, "global_step": 341795, "epoch": 2824} {"train_loss": -44.77907943725586, "global_step": 341796, "epoch": 2824} {"train_loss": -45.36367416381836, "global_step": 341797, "epoch": 2824} {"train_loss": -44.15177917480469, "global_step": 341798, "epoch": 2824} {"train_loss": -42.92568588256836, "global_step": 341799, "epoch": 2824} {"train_loss": -42.08469009399414, "global_step": 341800, "epoch": 2824} {"train_loss": -43.8524055480957, "global_step": 341801, "epoch": 2824} {"train_loss": -26.39288330078125, "global_step": 341802, "epoch": 2824} {"train_loss": -41.64167785644531, "global_step": 341803, "epoch": 2824} {"train_loss": -41.51362228393555, "global_step": 341804, "epoch": 2824} {"train_loss": -27.86480712890625, "global_step": 341805, "epoch": 2824} {"train_loss": -22.372079849243164, "global_step": 341806, "epoch": 2824} {"train_loss": -27.255279541015625, "global_step": 341807, "epoch": 2824} {"train_loss": -33.33366012573242, "global_step": 341808, "epoch": 2824} {"train_loss": -28.063434600830078, "global_step": 341809, "epoch": 2824} {"train_loss": -37.809139251708984, "global_step": 341810, "epoch": 2824} {"train_loss": -35.0201416015625, "global_step": 341811, "epoch": 2824} {"train_loss": -37.19523239135742, "global_step": 341812, "epoch": 2824} {"train_loss": -19.990041732788086, "global_step": 341813, "epoch": 2824} {"train_loss": -36.80552291870117, "global_step": 341814, "epoch": 2824} {"train_loss": -37.23967361450195, "global_step": 341815, "epoch": 2824} {"train_loss": -28.090238571166992, "global_step": 341816, "epoch": 2824} {"train_loss": -34.25358963012695, "global_step": 341817, "epoch": 2824} {"train_loss": -17.866851806640625, "global_step": 341818, "epoch": 2824} {"train_loss": -33.67290496826172, "global_step": 341819, "epoch": 2824} {"train_loss": -26.059009552001953, "global_step": 341820, "epoch": 2824} {"train_loss": -36.48458480834961, "global_step": 341821, "epoch": 2824} {"train_loss": -33.531558990478516, "global_step": 341822, "epoch": 2824} {"train_loss": -34.205421447753906, "global_step": 341823, "epoch": 2824} {"train_loss": -42.298020055471376, "global_step": 341824, "epoch": 2824, "val_loss": 3518055.0} {"train_loss": -32.53409957885742, "global_step": 341825, "epoch": 2825} {"train_loss": -38.07658004760742, "global_step": 341826, "epoch": 2825} {"train_loss": -38.927547454833984, "global_step": 341827, "epoch": 2825} {"train_loss": -38.12886428833008, "global_step": 341828, "epoch": 2825} {"train_loss": -37.08794403076172, "global_step": 341829, "epoch": 2825} {"train_loss": -35.93845748901367, "global_step": 341830, "epoch": 2825} {"train_loss": -33.63797378540039, "global_step": 341831, "epoch": 2825} {"train_loss": -38.73418045043945, "global_step": 341832, "epoch": 2825} {"train_loss": -39.42971420288086, "global_step": 341833, "epoch": 2825} {"train_loss": -35.81719970703125, "global_step": 341834, "epoch": 2825} {"train_loss": -35.79679489135742, "global_step": 341835, "epoch": 2825} {"train_loss": -36.613502502441406, "global_step": 341836, "epoch": 2825} {"train_loss": -33.97186279296875, "global_step": 341837, "epoch": 2825} {"train_loss": -38.255062103271484, "global_step": 341838, "epoch": 2825} {"train_loss": -39.20912551879883, "global_step": 341839, "epoch": 2825} {"train_loss": -39.107845306396484, "global_step": 341840, "epoch": 2825} {"train_loss": -38.91891098022461, "global_step": 341841, "epoch": 2825} {"train_loss": -38.8105583190918, "global_step": 341842, "epoch": 2825} {"train_loss": -39.27198028564453, "global_step": 341843, "epoch": 2825} {"train_loss": -39.032264709472656, "global_step": 341844, "epoch": 2825} {"train_loss": -39.46262741088867, "global_step": 341845, "epoch": 2825} {"train_loss": -39.32767868041992, "global_step": 341846, "epoch": 2825} {"train_loss": -39.31818771362305, "global_step": 341847, "epoch": 2825} {"train_loss": -39.49699020385742, "global_step": 341848, "epoch": 2825} {"train_loss": -39.895599365234375, "global_step": 341849, "epoch": 2825} {"train_loss": -39.97429275512695, "global_step": 341850, "epoch": 2825} {"train_loss": -41.311920166015625, "global_step": 341851, "epoch": 2825} {"train_loss": -40.82883834838867, "global_step": 341852, "epoch": 2825} {"train_loss": -40.019996643066406, "global_step": 341853, "epoch": 2825} {"train_loss": -40.60030746459961, "global_step": 341854, "epoch": 2825} {"train_loss": -41.27424240112305, "global_step": 341855, "epoch": 2825} {"train_loss": -41.27975082397461, "global_step": 341856, "epoch": 2825} {"train_loss": -41.05826187133789, "global_step": 341857, "epoch": 2825} {"train_loss": -41.42611312866211, "global_step": 341858, "epoch": 2825} {"train_loss": -41.28834915161133, "global_step": 341859, "epoch": 2825} {"train_loss": -41.27838897705078, "global_step": 341860, "epoch": 2825} {"train_loss": -39.23249816894531, "global_step": 341861, "epoch": 2825} {"train_loss": -41.44254684448242, "global_step": 341862, "epoch": 2825} {"train_loss": -41.40127182006836, "global_step": 341863, "epoch": 2825} {"train_loss": -41.3625602722168, "global_step": 341864, "epoch": 2825} {"train_loss": -40.666255950927734, "global_step": 341865, "epoch": 2825} {"train_loss": -41.71699142456055, "global_step": 341866, "epoch": 2825} {"train_loss": -39.9489860534668, "global_step": 341867, "epoch": 2825} {"train_loss": -41.86268997192383, "global_step": 341868, "epoch": 2825} {"train_loss": -41.42485809326172, "global_step": 341869, "epoch": 2825} {"train_loss": -41.8631591796875, "global_step": 341870, "epoch": 2825} {"train_loss": -41.63828659057617, "global_step": 341871, "epoch": 2825} {"train_loss": -41.452362060546875, "global_step": 341872, "epoch": 2825} {"train_loss": -41.80498123168945, "global_step": 341873, "epoch": 2825} {"train_loss": -42.1012077331543, "global_step": 341874, "epoch": 2825} {"train_loss": -42.51598358154297, "global_step": 341875, "epoch": 2825} {"train_loss": -42.94203186035156, "global_step": 341876, "epoch": 2825} {"train_loss": -42.5875129699707, "global_step": 341877, "epoch": 2825} {"train_loss": -41.330936431884766, "global_step": 341878, "epoch": 2825} {"train_loss": -42.423641204833984, "global_step": 341879, "epoch": 2825} {"train_loss": -42.8552360534668, "global_step": 341880, "epoch": 2825} {"train_loss": -42.55438232421875, "global_step": 341881, "epoch": 2825} {"train_loss": -42.72394943237305, "global_step": 341882, "epoch": 2825} {"train_loss": -42.303401947021484, "global_step": 341883, "epoch": 2825} {"train_loss": -42.7584114074707, "global_step": 341884, "epoch": 2825} {"train_loss": -41.420345306396484, "global_step": 341885, "epoch": 2825} {"train_loss": -42.59329605102539, "global_step": 341886, "epoch": 2825} {"train_loss": -42.09054183959961, "global_step": 341887, "epoch": 2825} {"train_loss": -42.74483108520508, "global_step": 341888, "epoch": 2825} {"train_loss": -43.03501510620117, "global_step": 341889, "epoch": 2825} {"train_loss": -42.35585403442383, "global_step": 341890, "epoch": 2825} {"train_loss": -42.770965576171875, "global_step": 341891, "epoch": 2825} {"train_loss": -41.24057388305664, "global_step": 341892, "epoch": 2825} {"train_loss": -42.62992858886719, "global_step": 341893, "epoch": 2825} {"train_loss": -42.909423828125, "global_step": 341894, "epoch": 2825} {"train_loss": -43.16775894165039, "global_step": 341895, "epoch": 2825} {"train_loss": -42.032894134521484, "global_step": 341896, "epoch": 2825} {"train_loss": -43.32720947265625, "global_step": 341897, "epoch": 2825} {"train_loss": -43.4381217956543, "global_step": 341898, "epoch": 2825} {"train_loss": -43.539119720458984, "global_step": 341899, "epoch": 2825} {"train_loss": -42.29575729370117, "global_step": 341900, "epoch": 2825} {"train_loss": -43.45962142944336, "global_step": 341901, "epoch": 2825} {"train_loss": -42.48383331298828, "global_step": 341902, "epoch": 2825} {"train_loss": -42.7293586730957, "global_step": 341903, "epoch": 2825} {"train_loss": -43.60398483276367, "global_step": 341904, "epoch": 2825} {"train_loss": -43.305843353271484, "global_step": 341905, "epoch": 2825} {"train_loss": -42.888431549072266, "global_step": 341906, "epoch": 2825} {"train_loss": -43.46067810058594, "global_step": 341907, "epoch": 2825} {"train_loss": -43.853050231933594, "global_step": 341908, "epoch": 2825} {"train_loss": -43.857391357421875, "global_step": 341909, "epoch": 2825} {"train_loss": -44.05134201049805, "global_step": 341910, "epoch": 2825} {"train_loss": -42.04658889770508, "global_step": 341911, "epoch": 2825} {"train_loss": -43.85476303100586, "global_step": 341912, "epoch": 2825} {"train_loss": -43.66089630126953, "global_step": 341913, "epoch": 2825} {"train_loss": -43.67300033569336, "global_step": 341914, "epoch": 2825} {"train_loss": -44.45258712768555, "global_step": 341915, "epoch": 2825} {"train_loss": -44.20509338378906, "global_step": 341916, "epoch": 2825} {"train_loss": -44.33613967895508, "global_step": 341917, "epoch": 2825} {"train_loss": -44.198116302490234, "global_step": 341918, "epoch": 2825} {"train_loss": -43.86566925048828, "global_step": 341919, "epoch": 2825} {"train_loss": -43.52625274658203, "global_step": 341920, "epoch": 2825} {"train_loss": -44.654354095458984, "global_step": 341921, "epoch": 2825} {"train_loss": -44.554256439208984, "global_step": 341922, "epoch": 2825} {"train_loss": -44.437259674072266, "global_step": 341923, "epoch": 2825} {"train_loss": -43.76413345336914, "global_step": 341924, "epoch": 2825} {"train_loss": -43.15537643432617, "global_step": 341925, "epoch": 2825} {"train_loss": -44.57766342163086, "global_step": 341926, "epoch": 2825} {"train_loss": -44.43276596069336, "global_step": 341927, "epoch": 2825} {"train_loss": -43.8676643371582, "global_step": 341928, "epoch": 2825} {"train_loss": -44.36469650268555, "global_step": 341929, "epoch": 2825} {"train_loss": -43.22005081176758, "global_step": 341930, "epoch": 2825} {"train_loss": -43.71217727661133, "global_step": 341931, "epoch": 2825} {"train_loss": -43.96794509887695, "global_step": 341932, "epoch": 2825} {"train_loss": -44.4614372253418, "global_step": 341933, "epoch": 2825} {"train_loss": -44.18583297729492, "global_step": 341934, "epoch": 2825} {"train_loss": -44.58400344848633, "global_step": 341935, "epoch": 2825} {"train_loss": -44.003257751464844, "global_step": 341936, "epoch": 2825} {"train_loss": -44.933101654052734, "global_step": 341937, "epoch": 2825} {"train_loss": -43.67231750488281, "global_step": 341938, "epoch": 2825} {"train_loss": -44.21113204956055, "global_step": 341939, "epoch": 2825} {"train_loss": -44.59565353393555, "global_step": 341940, "epoch": 2825} {"train_loss": -44.923866271972656, "global_step": 341941, "epoch": 2825} {"train_loss": -44.67619705200195, "global_step": 341942, "epoch": 2825} {"train_loss": -44.71656036376953, "global_step": 341943, "epoch": 2825} {"train_loss": -44.684791564941406, "global_step": 341944, "epoch": 2825} {"train_loss": -41.80245719468298, "global_step": 341945, "epoch": 2825, "val_loss": 2605438.0} {"train_loss": -44.56209945678711, "global_step": 341946, "epoch": 2826} {"train_loss": -45.02607727050781, "global_step": 341947, "epoch": 2826} {"train_loss": -44.824031829833984, "global_step": 341948, "epoch": 2826} {"train_loss": -44.78631591796875, "global_step": 341949, "epoch": 2826} {"train_loss": -44.4074821472168, "global_step": 341950, "epoch": 2826} {"train_loss": -44.71984100341797, "global_step": 341951, "epoch": 2826} {"train_loss": -45.45375061035156, "global_step": 341952, "epoch": 2826} {"train_loss": -44.38503646850586, "global_step": 341953, "epoch": 2826} {"train_loss": -45.11053466796875, "global_step": 341954, "epoch": 2826} {"train_loss": -44.48358917236328, "global_step": 341955, "epoch": 2826} {"train_loss": -44.54975509643555, "global_step": 341956, "epoch": 2826} {"train_loss": -45.2546501159668, "global_step": 341957, "epoch": 2826} {"train_loss": -44.928199768066406, "global_step": 341958, "epoch": 2826} {"train_loss": -44.69721603393555, "global_step": 341959, "epoch": 2826} {"train_loss": -44.25739669799805, "global_step": 341960, "epoch": 2826} {"train_loss": -44.20156478881836, "global_step": 341961, "epoch": 2826} {"train_loss": -44.339332580566406, "global_step": 341962, "epoch": 2826} {"train_loss": -45.37080764770508, "global_step": 341963, "epoch": 2826} {"train_loss": -45.173423767089844, "global_step": 341964, "epoch": 2826} {"train_loss": -44.41636276245117, "global_step": 341965, "epoch": 2826} {"train_loss": -45.05742645263672, "global_step": 341966, "epoch": 2826} {"train_loss": -45.03662109375, "global_step": 341967, "epoch": 2826} {"train_loss": -44.97459030151367, "global_step": 341968, "epoch": 2826} {"train_loss": -45.3216552734375, "global_step": 341969, "epoch": 2826} {"train_loss": -44.44878005981445, "global_step": 341970, "epoch": 2826} {"train_loss": -44.9571418762207, "global_step": 341971, "epoch": 2826} {"train_loss": -44.552398681640625, "global_step": 341972, "epoch": 2826} {"train_loss": -44.55080795288086, "global_step": 341973, "epoch": 2826} {"train_loss": -43.22988510131836, "global_step": 341974, "epoch": 2826} {"train_loss": -42.6186637878418, "global_step": 341975, "epoch": 2826} {"train_loss": -43.229949951171875, "global_step": 341976, "epoch": 2826} {"train_loss": -41.47848129272461, "global_step": 341977, "epoch": 2826} {"train_loss": -42.25754928588867, "global_step": 341978, "epoch": 2826} {"train_loss": -43.47209930419922, "global_step": 341979, "epoch": 2826} {"train_loss": -44.08262634277344, "global_step": 341980, "epoch": 2826} {"train_loss": -42.86537551879883, "global_step": 341981, "epoch": 2826} {"train_loss": -42.2859992980957, "global_step": 341982, "epoch": 2826} {"train_loss": -43.41386032104492, "global_step": 341983, "epoch": 2826} {"train_loss": -43.30286407470703, "global_step": 341984, "epoch": 2826} {"train_loss": -43.39048385620117, "global_step": 341985, "epoch": 2826} {"train_loss": -43.71311569213867, "global_step": 341986, "epoch": 2826} {"train_loss": -43.310752868652344, "global_step": 341987, "epoch": 2826} {"train_loss": -42.63383102416992, "global_step": 341988, "epoch": 2826} {"train_loss": -42.62865447998047, "global_step": 341989, "epoch": 2826} {"train_loss": -43.86804962158203, "global_step": 341990, "epoch": 2826} {"train_loss": -42.26516342163086, "global_step": 341991, "epoch": 2826} {"train_loss": -43.536842346191406, "global_step": 341992, "epoch": 2826} {"train_loss": -43.34200668334961, "global_step": 341993, "epoch": 2826} {"train_loss": -42.6624870300293, "global_step": 341994, "epoch": 2826} {"train_loss": -42.964683532714844, "global_step": 341995, "epoch": 2826} {"train_loss": -43.35506820678711, "global_step": 341996, "epoch": 2826} {"train_loss": -43.501407623291016, "global_step": 341997, "epoch": 2826} {"train_loss": -43.76609420776367, "global_step": 341998, "epoch": 2826} {"train_loss": -44.08033752441406, "global_step": 341999, "epoch": 2826} {"train_loss": -43.851680755615234, "global_step": 342000, "epoch": 2826} {"train_loss": -42.65995407104492, "global_step": 342001, "epoch": 2826} {"train_loss": -42.966487884521484, "global_step": 342002, "epoch": 2826} {"train_loss": -43.49128723144531, "global_step": 342003, "epoch": 2826} {"train_loss": -42.863887786865234, "global_step": 342004, "epoch": 2826} {"train_loss": -42.44800567626953, "global_step": 342005, "epoch": 2826} {"train_loss": -43.45218276977539, "global_step": 342006, "epoch": 2826} {"train_loss": -41.8988151550293, "global_step": 342007, "epoch": 2826} {"train_loss": -43.027767181396484, "global_step": 342008, "epoch": 2826} {"train_loss": -42.4972038269043, "global_step": 342009, "epoch": 2826} {"train_loss": -43.291988372802734, "global_step": 342010, "epoch": 2826} {"train_loss": -44.01183319091797, "global_step": 342011, "epoch": 2826} {"train_loss": -43.727447509765625, "global_step": 342012, "epoch": 2826} {"train_loss": -44.33909225463867, "global_step": 342013, "epoch": 2826} {"train_loss": -43.65095901489258, "global_step": 342014, "epoch": 2826} {"train_loss": -43.68844223022461, "global_step": 342015, "epoch": 2826} {"train_loss": -43.609188079833984, "global_step": 342016, "epoch": 2826} {"train_loss": -44.51206588745117, "global_step": 342017, "epoch": 2826} {"train_loss": -43.42665481567383, "global_step": 342018, "epoch": 2826} {"train_loss": -43.823822021484375, "global_step": 342019, "epoch": 2826} {"train_loss": -43.488773345947266, "global_step": 342020, "epoch": 2826} {"train_loss": -44.07122039794922, "global_step": 342021, "epoch": 2826} {"train_loss": -44.24063491821289, "global_step": 342022, "epoch": 2826} {"train_loss": -44.20111846923828, "global_step": 342023, "epoch": 2826} {"train_loss": -44.56812286376953, "global_step": 342024, "epoch": 2826} {"train_loss": -43.816139221191406, "global_step": 342025, "epoch": 2826} {"train_loss": -43.62407684326172, "global_step": 342026, "epoch": 2826} {"train_loss": -44.029022216796875, "global_step": 342027, "epoch": 2826} {"train_loss": -44.02811050415039, "global_step": 342028, "epoch": 2826} {"train_loss": -42.326961517333984, "global_step": 342029, "epoch": 2826} {"train_loss": -41.78396224975586, "global_step": 342030, "epoch": 2826} {"train_loss": -43.48760223388672, "global_step": 342031, "epoch": 2826} {"train_loss": -44.397010803222656, "global_step": 342032, "epoch": 2826} {"train_loss": -43.631526947021484, "global_step": 342033, "epoch": 2826} {"train_loss": -43.5752067565918, "global_step": 342034, "epoch": 2826} {"train_loss": -44.565799713134766, "global_step": 342035, "epoch": 2826} {"train_loss": -43.99142837524414, "global_step": 342036, "epoch": 2826} {"train_loss": -43.076595306396484, "global_step": 342037, "epoch": 2826} {"train_loss": -40.60456466674805, "global_step": 342038, "epoch": 2826} {"train_loss": -39.58736801147461, "global_step": 342039, "epoch": 2826} {"train_loss": -43.312660217285156, "global_step": 342040, "epoch": 2826} {"train_loss": -40.28749084472656, "global_step": 342041, "epoch": 2826} {"train_loss": -43.457332611083984, "global_step": 342042, "epoch": 2826} {"train_loss": -44.130855560302734, "global_step": 342043, "epoch": 2826} {"train_loss": -42.78675079345703, "global_step": 342044, "epoch": 2826} {"train_loss": -41.977298736572266, "global_step": 342045, "epoch": 2826} {"train_loss": -43.854766845703125, "global_step": 342046, "epoch": 2826} {"train_loss": -43.131160736083984, "global_step": 342047, "epoch": 2826} {"train_loss": -41.62882995605469, "global_step": 342048, "epoch": 2826} {"train_loss": -43.20127868652344, "global_step": 342049, "epoch": 2826} {"train_loss": -43.78025436401367, "global_step": 342050, "epoch": 2826} {"train_loss": -42.855628967285156, "global_step": 342051, "epoch": 2826} {"train_loss": -40.960269927978516, "global_step": 342052, "epoch": 2826} {"train_loss": -43.653419494628906, "global_step": 342053, "epoch": 2826} {"train_loss": -43.70159912109375, "global_step": 342054, "epoch": 2826} {"train_loss": -43.94210433959961, "global_step": 342055, "epoch": 2826} {"train_loss": -44.2261962890625, "global_step": 342056, "epoch": 2826} {"train_loss": -43.47227096557617, "global_step": 342057, "epoch": 2826} {"train_loss": -44.40971374511719, "global_step": 342058, "epoch": 2826} {"train_loss": -44.0675163269043, "global_step": 342059, "epoch": 2826} {"train_loss": -43.035736083984375, "global_step": 342060, "epoch": 2826} {"train_loss": -44.04903793334961, "global_step": 342061, "epoch": 2826} {"train_loss": -44.25604248046875, "global_step": 342062, "epoch": 2826} {"train_loss": -42.771942138671875, "global_step": 342063, "epoch": 2826} {"train_loss": -44.16950607299805, "global_step": 342064, "epoch": 2826} {"train_loss": -44.660552978515625, "global_step": 342065, "epoch": 2826} {"train_loss": -43.628966150204995, "global_step": 342066, "epoch": 2826, "val_loss": 2773162.0} {"train_loss": -43.71277618408203, "global_step": 342067, "epoch": 2827} {"train_loss": -44.61429214477539, "global_step": 342068, "epoch": 2827} {"train_loss": -44.05877685546875, "global_step": 342069, "epoch": 2827} {"train_loss": -44.60676193237305, "global_step": 342070, "epoch": 2827} {"train_loss": -44.688655853271484, "global_step": 342071, "epoch": 2827} {"train_loss": -44.60498809814453, "global_step": 342072, "epoch": 2827} {"train_loss": -43.65150833129883, "global_step": 342073, "epoch": 2827} {"train_loss": -44.05371856689453, "global_step": 342074, "epoch": 2827} {"train_loss": -44.41251754760742, "global_step": 342075, "epoch": 2827} {"train_loss": -44.43511199951172, "global_step": 342076, "epoch": 2827} {"train_loss": -44.10024642944336, "global_step": 342077, "epoch": 2827} {"train_loss": -43.614654541015625, "global_step": 342078, "epoch": 2827} {"train_loss": -44.97772979736328, "global_step": 342079, "epoch": 2827} {"train_loss": -44.02383041381836, "global_step": 342080, "epoch": 2827} {"train_loss": -44.38471603393555, "global_step": 342081, "epoch": 2827} {"train_loss": -44.6101188659668, "global_step": 342082, "epoch": 2827} {"train_loss": -44.518062591552734, "global_step": 342083, "epoch": 2827} {"train_loss": -43.51811599731445, "global_step": 342084, "epoch": 2827} {"train_loss": -44.17179489135742, "global_step": 342085, "epoch": 2827} {"train_loss": -43.69263458251953, "global_step": 342086, "epoch": 2827} {"train_loss": -41.38093185424805, "global_step": 342087, "epoch": 2827} {"train_loss": -43.326080322265625, "global_step": 342088, "epoch": 2827} {"train_loss": -43.90182113647461, "global_step": 342089, "epoch": 2827} {"train_loss": -41.94365692138672, "global_step": 342090, "epoch": 2827} {"train_loss": -44.23554229736328, "global_step": 342091, "epoch": 2827} {"train_loss": -43.945335388183594, "global_step": 342092, "epoch": 2827} {"train_loss": -33.19504928588867, "global_step": 342093, "epoch": 2827} {"train_loss": -44.286434173583984, "global_step": 342094, "epoch": 2827} {"train_loss": -42.92916488647461, "global_step": 342095, "epoch": 2827} {"train_loss": -43.590538024902344, "global_step": 342096, "epoch": 2827} {"train_loss": -31.6763858795166, "global_step": 342097, "epoch": 2827} {"train_loss": -40.75509262084961, "global_step": 342098, "epoch": 2827} {"train_loss": -43.77882385253906, "global_step": 342099, "epoch": 2827} {"train_loss": -40.080238342285156, "global_step": 342100, "epoch": 2827} {"train_loss": -42.69043731689453, "global_step": 342101, "epoch": 2827} {"train_loss": -39.169776916503906, "global_step": 342102, "epoch": 2827} {"train_loss": -42.26087951660156, "global_step": 342103, "epoch": 2827} {"train_loss": -43.43461227416992, "global_step": 342104, "epoch": 2827} {"train_loss": -41.739295959472656, "global_step": 342105, "epoch": 2827} {"train_loss": -42.236305236816406, "global_step": 342106, "epoch": 2827} {"train_loss": -43.90669250488281, "global_step": 342107, "epoch": 2827} {"train_loss": -42.278446197509766, "global_step": 342108, "epoch": 2827} {"train_loss": -43.406490325927734, "global_step": 342109, "epoch": 2827} {"train_loss": -43.621429443359375, "global_step": 342110, "epoch": 2827} {"train_loss": -42.90314483642578, "global_step": 342111, "epoch": 2827} {"train_loss": -43.11674118041992, "global_step": 342112, "epoch": 2827} {"train_loss": -43.00830841064453, "global_step": 342113, "epoch": 2827} {"train_loss": -41.94004440307617, "global_step": 342114, "epoch": 2827} {"train_loss": -43.57444763183594, "global_step": 342115, "epoch": 2827} {"train_loss": -43.98358917236328, "global_step": 342116, "epoch": 2827} {"train_loss": -43.52490997314453, "global_step": 342117, "epoch": 2827} {"train_loss": -43.03969192504883, "global_step": 342118, "epoch": 2827} {"train_loss": -43.94393539428711, "global_step": 342119, "epoch": 2827} {"train_loss": -43.92507553100586, "global_step": 342120, "epoch": 2827} {"train_loss": -43.04706573486328, "global_step": 342121, "epoch": 2827} {"train_loss": -43.73762130737305, "global_step": 342122, "epoch": 2827} {"train_loss": -42.746925354003906, "global_step": 342123, "epoch": 2827} {"train_loss": -42.16059875488281, "global_step": 342124, "epoch": 2827} {"train_loss": -44.407161712646484, "global_step": 342125, "epoch": 2827} {"train_loss": -43.289974212646484, "global_step": 342126, "epoch": 2827} {"train_loss": -42.5489387512207, "global_step": 342127, "epoch": 2827} {"train_loss": -42.743080139160156, "global_step": 342128, "epoch": 2827} {"train_loss": -44.30011749267578, "global_step": 342129, "epoch": 2827} {"train_loss": -44.11143112182617, "global_step": 342130, "epoch": 2827} {"train_loss": -44.28096389770508, "global_step": 342131, "epoch": 2827} {"train_loss": -43.74171447753906, "global_step": 342132, "epoch": 2827} {"train_loss": -44.419185638427734, "global_step": 342133, "epoch": 2827} {"train_loss": -44.23191452026367, "global_step": 342134, "epoch": 2827} {"train_loss": -44.539642333984375, "global_step": 342135, "epoch": 2827} {"train_loss": -42.832576751708984, "global_step": 342136, "epoch": 2827} {"train_loss": -44.532318115234375, "global_step": 342137, "epoch": 2827} {"train_loss": -44.18368148803711, "global_step": 342138, "epoch": 2827} {"train_loss": -42.39697265625, "global_step": 342139, "epoch": 2827} {"train_loss": -44.58051300048828, "global_step": 342140, "epoch": 2827} {"train_loss": -44.32438278198242, "global_step": 342141, "epoch": 2827} {"train_loss": -43.90198516845703, "global_step": 342142, "epoch": 2827} {"train_loss": -43.94179153442383, "global_step": 342143, "epoch": 2827} {"train_loss": -43.5931396484375, "global_step": 342144, "epoch": 2827} {"train_loss": -44.85090255737305, "global_step": 342145, "epoch": 2827} {"train_loss": -44.934932708740234, "global_step": 342146, "epoch": 2827} {"train_loss": -44.699058532714844, "global_step": 342147, "epoch": 2827} {"train_loss": -45.041351318359375, "global_step": 342148, "epoch": 2827} {"train_loss": -44.89335250854492, "global_step": 342149, "epoch": 2827} {"train_loss": -44.92620849609375, "global_step": 342150, "epoch": 2827} {"train_loss": -45.062889099121094, "global_step": 342151, "epoch": 2827} {"train_loss": -44.70186996459961, "global_step": 342152, "epoch": 2827} {"train_loss": -44.879329681396484, "global_step": 342153, "epoch": 2827} {"train_loss": -44.19297409057617, "global_step": 342154, "epoch": 2827} {"train_loss": -44.5804443359375, "global_step": 342155, "epoch": 2827} {"train_loss": -45.098445892333984, "global_step": 342156, "epoch": 2827} {"train_loss": -44.656837463378906, "global_step": 342157, "epoch": 2827} {"train_loss": -44.709815979003906, "global_step": 342158, "epoch": 2827} {"train_loss": -44.57984161376953, "global_step": 342159, "epoch": 2827} {"train_loss": -44.51285934448242, "global_step": 342160, "epoch": 2827} {"train_loss": -44.18977737426758, "global_step": 342161, "epoch": 2827} {"train_loss": -44.913516998291016, "global_step": 342162, "epoch": 2827} {"train_loss": -44.92074203491211, "global_step": 342163, "epoch": 2827} {"train_loss": -44.90534210205078, "global_step": 342164, "epoch": 2827} {"train_loss": -45.075679779052734, "global_step": 342165, "epoch": 2827} {"train_loss": -43.358821868896484, "global_step": 342166, "epoch": 2827} {"train_loss": -44.47850799560547, "global_step": 342167, "epoch": 2827} {"train_loss": -44.69868087768555, "global_step": 342168, "epoch": 2827} {"train_loss": -45.180580139160156, "global_step": 342169, "epoch": 2827} {"train_loss": -44.43132019042969, "global_step": 342170, "epoch": 2827} {"train_loss": -44.48366928100586, "global_step": 342171, "epoch": 2827} {"train_loss": -44.90571975708008, "global_step": 342172, "epoch": 2827} {"train_loss": -43.49115753173828, "global_step": 342173, "epoch": 2827} {"train_loss": -45.21175765991211, "global_step": 342174, "epoch": 2827} {"train_loss": -45.083980560302734, "global_step": 342175, "epoch": 2827} {"train_loss": -44.280120849609375, "global_step": 342176, "epoch": 2827} {"train_loss": -43.28133010864258, "global_step": 342177, "epoch": 2827} {"train_loss": -43.345855712890625, "global_step": 342178, "epoch": 2827} {"train_loss": -43.25991439819336, "global_step": 342179, "epoch": 2827} {"train_loss": -44.2732048034668, "global_step": 342180, "epoch": 2827} {"train_loss": -44.080421447753906, "global_step": 342181, "epoch": 2827} {"train_loss": -44.158729553222656, "global_step": 342182, "epoch": 2827} {"train_loss": -44.179744720458984, "global_step": 342183, "epoch": 2827} {"train_loss": -41.54865646362305, "global_step": 342184, "epoch": 2827} {"train_loss": -44.30780029296875, "global_step": 342185, "epoch": 2827} {"train_loss": -44.7899169921875, "global_step": 342186, "epoch": 2827} {"train_loss": -43.64758113199029, "global_step": 342187, "epoch": 2827, "val_loss": 2598430.25} {"train_loss": -43.07878112792969, "global_step": 342188, "epoch": 2828} {"train_loss": -44.545345306396484, "global_step": 342189, "epoch": 2828} {"train_loss": -43.88616180419922, "global_step": 342190, "epoch": 2828} {"train_loss": -43.188812255859375, "global_step": 342191, "epoch": 2828} {"train_loss": -44.19146728515625, "global_step": 342192, "epoch": 2828} {"train_loss": -43.787818908691406, "global_step": 342193, "epoch": 2828} {"train_loss": -44.21589279174805, "global_step": 342194, "epoch": 2828} {"train_loss": -42.67449951171875, "global_step": 342195, "epoch": 2828} {"train_loss": -43.430606842041016, "global_step": 342196, "epoch": 2828} {"train_loss": -42.81574630737305, "global_step": 342197, "epoch": 2828} {"train_loss": -43.28915023803711, "global_step": 342198, "epoch": 2828} {"train_loss": -43.26453399658203, "global_step": 342199, "epoch": 2828} {"train_loss": -43.89384460449219, "global_step": 342200, "epoch": 2828} {"train_loss": -44.50569534301758, "global_step": 342201, "epoch": 2828} {"train_loss": -44.173377990722656, "global_step": 342202, "epoch": 2828} {"train_loss": -43.42670440673828, "global_step": 342203, "epoch": 2828} {"train_loss": -44.586421966552734, "global_step": 342204, "epoch": 2828} {"train_loss": -44.24807357788086, "global_step": 342205, "epoch": 2828} {"train_loss": -42.539459228515625, "global_step": 342206, "epoch": 2828} {"train_loss": -44.000667572021484, "global_step": 342207, "epoch": 2828} {"train_loss": -44.16611862182617, "global_step": 342208, "epoch": 2828} {"train_loss": -43.365657806396484, "global_step": 342209, "epoch": 2828} {"train_loss": -44.1613655090332, "global_step": 342210, "epoch": 2828} {"train_loss": -44.2567253112793, "global_step": 342211, "epoch": 2828} {"train_loss": -43.54557418823242, "global_step": 342212, "epoch": 2828} {"train_loss": -43.89301681518555, "global_step": 342213, "epoch": 2828} {"train_loss": -44.50314712524414, "global_step": 342214, "epoch": 2828} {"train_loss": -44.79944610595703, "global_step": 342215, "epoch": 2828} {"train_loss": -44.47046661376953, "global_step": 342216, "epoch": 2828} {"train_loss": -44.975494384765625, "global_step": 342217, "epoch": 2828} {"train_loss": -44.8883056640625, "global_step": 342218, "epoch": 2828} {"train_loss": -44.48563766479492, "global_step": 342219, "epoch": 2828} {"train_loss": -44.24832534790039, "global_step": 342220, "epoch": 2828} {"train_loss": -44.465911865234375, "global_step": 342221, "epoch": 2828} {"train_loss": -44.02317428588867, "global_step": 342222, "epoch": 2828} {"train_loss": -44.290687561035156, "global_step": 342223, "epoch": 2828} {"train_loss": -45.24068832397461, "global_step": 342224, "epoch": 2828} {"train_loss": -43.32015609741211, "global_step": 342225, "epoch": 2828} {"train_loss": -44.866024017333984, "global_step": 342226, "epoch": 2828} {"train_loss": -44.445533752441406, "global_step": 342227, "epoch": 2828} {"train_loss": -43.82790756225586, "global_step": 342228, "epoch": 2828} {"train_loss": -45.259033203125, "global_step": 342229, "epoch": 2828} {"train_loss": -42.56660461425781, "global_step": 342230, "epoch": 2828} {"train_loss": -43.37678909301758, "global_step": 342231, "epoch": 2828} {"train_loss": -44.24079513549805, "global_step": 342232, "epoch": 2828} {"train_loss": -44.24498748779297, "global_step": 342233, "epoch": 2828} {"train_loss": -43.92152786254883, "global_step": 342234, "epoch": 2828} {"train_loss": -44.251338958740234, "global_step": 342235, "epoch": 2828} {"train_loss": -44.24861526489258, "global_step": 342236, "epoch": 2828} {"train_loss": -44.42753219604492, "global_step": 342237, "epoch": 2828} {"train_loss": -44.69064712524414, "global_step": 342238, "epoch": 2828} {"train_loss": -44.27671432495117, "global_step": 342239, "epoch": 2828} {"train_loss": -45.13508224487305, "global_step": 342240, "epoch": 2828} {"train_loss": -44.11305618286133, "global_step": 342241, "epoch": 2828} {"train_loss": -44.057533264160156, "global_step": 342242, "epoch": 2828} {"train_loss": -44.472930908203125, "global_step": 342243, "epoch": 2828} {"train_loss": -44.95915222167969, "global_step": 342244, "epoch": 2828} {"train_loss": -43.841007232666016, "global_step": 342245, "epoch": 2828} {"train_loss": -44.84968948364258, "global_step": 342246, "epoch": 2828} {"train_loss": -45.09933090209961, "global_step": 342247, "epoch": 2828} {"train_loss": -43.79446029663086, "global_step": 342248, "epoch": 2828} {"train_loss": -44.59397506713867, "global_step": 342249, "epoch": 2828} {"train_loss": -44.28314971923828, "global_step": 342250, "epoch": 2828} {"train_loss": -45.0933837890625, "global_step": 342251, "epoch": 2828} {"train_loss": -42.73362731933594, "global_step": 342252, "epoch": 2828} {"train_loss": -44.16926193237305, "global_step": 342253, "epoch": 2828} {"train_loss": -43.53007125854492, "global_step": 342254, "epoch": 2828} {"train_loss": -44.226688385009766, "global_step": 342255, "epoch": 2828} {"train_loss": -43.542510986328125, "global_step": 342256, "epoch": 2828} {"train_loss": -44.12027359008789, "global_step": 342257, "epoch": 2828} {"train_loss": -44.965389251708984, "global_step": 342258, "epoch": 2828} {"train_loss": -43.607845306396484, "global_step": 342259, "epoch": 2828} {"train_loss": -42.70712661743164, "global_step": 342260, "epoch": 2828} {"train_loss": -41.88764572143555, "global_step": 342261, "epoch": 2828} {"train_loss": -44.011104583740234, "global_step": 342262, "epoch": 2828} {"train_loss": -44.334712982177734, "global_step": 342263, "epoch": 2828} {"train_loss": -43.4868278503418, "global_step": 342264, "epoch": 2828} {"train_loss": -43.92034149169922, "global_step": 342265, "epoch": 2828} {"train_loss": -43.32263946533203, "global_step": 342266, "epoch": 2828} {"train_loss": -43.64362716674805, "global_step": 342267, "epoch": 2828} {"train_loss": -43.32099914550781, "global_step": 342268, "epoch": 2828} {"train_loss": -43.508544921875, "global_step": 342269, "epoch": 2828} {"train_loss": -44.43263626098633, "global_step": 342270, "epoch": 2828} {"train_loss": -43.105133056640625, "global_step": 342271, "epoch": 2828} {"train_loss": -42.05986404418945, "global_step": 342272, "epoch": 2828} {"train_loss": -43.8015251159668, "global_step": 342273, "epoch": 2828} {"train_loss": -41.42866134643555, "global_step": 342274, "epoch": 2828} {"train_loss": -43.466854095458984, "global_step": 342275, "epoch": 2828} {"train_loss": -43.38652420043945, "global_step": 342276, "epoch": 2828} {"train_loss": -41.6348991394043, "global_step": 342277, "epoch": 2828} {"train_loss": -43.47513961791992, "global_step": 342278, "epoch": 2828} {"train_loss": -43.89897537231445, "global_step": 342279, "epoch": 2828} {"train_loss": -42.771026611328125, "global_step": 342280, "epoch": 2828} {"train_loss": -44.08966827392578, "global_step": 342281, "epoch": 2828} {"train_loss": -43.5196418762207, "global_step": 342282, "epoch": 2828} {"train_loss": -42.53150939941406, "global_step": 342283, "epoch": 2828} {"train_loss": -44.57157516479492, "global_step": 342284, "epoch": 2828} {"train_loss": -42.08296585083008, "global_step": 342285, "epoch": 2828} {"train_loss": -43.05329513549805, "global_step": 342286, "epoch": 2828} {"train_loss": -44.246089935302734, "global_step": 342287, "epoch": 2828} {"train_loss": -43.10763168334961, "global_step": 342288, "epoch": 2828} {"train_loss": -42.548519134521484, "global_step": 342289, "epoch": 2828} {"train_loss": -44.17933654785156, "global_step": 342290, "epoch": 2828} {"train_loss": -41.47803497314453, "global_step": 342291, "epoch": 2828} {"train_loss": -41.761138916015625, "global_step": 342292, "epoch": 2828} {"train_loss": -44.25105667114258, "global_step": 342293, "epoch": 2828} {"train_loss": -42.35818099975586, "global_step": 342294, "epoch": 2828} {"train_loss": -43.741146087646484, "global_step": 342295, "epoch": 2828} {"train_loss": -43.24168395996094, "global_step": 342296, "epoch": 2828} {"train_loss": -42.29682159423828, "global_step": 342297, "epoch": 2828} {"train_loss": -44.00266647338867, "global_step": 342298, "epoch": 2828} {"train_loss": -43.02482223510742, "global_step": 342299, "epoch": 2828} {"train_loss": -43.670135498046875, "global_step": 342300, "epoch": 2828} {"train_loss": -43.39609146118164, "global_step": 342301, "epoch": 2828} {"train_loss": -43.58646774291992, "global_step": 342302, "epoch": 2828} {"train_loss": -43.23069763183594, "global_step": 342303, "epoch": 2828} {"train_loss": -40.73375701904297, "global_step": 342304, "epoch": 2828} {"train_loss": -43.77927780151367, "global_step": 342305, "epoch": 2828} {"train_loss": -42.785030364990234, "global_step": 342306, "epoch": 2828} {"train_loss": -43.187740325927734, "global_step": 342307, "epoch": 2828} {"train_loss": -43.71846228985747, "global_step": 342308, "epoch": 2828, "val_loss": 2884640.75} {"train_loss": -42.151729583740234, "global_step": 342309, "epoch": 2829} {"train_loss": -43.94757080078125, "global_step": 342310, "epoch": 2829} {"train_loss": -42.292964935302734, "global_step": 342311, "epoch": 2829} {"train_loss": -44.14069747924805, "global_step": 342312, "epoch": 2829} {"train_loss": -42.630828857421875, "global_step": 342313, "epoch": 2829} {"train_loss": -43.30015563964844, "global_step": 342314, "epoch": 2829} {"train_loss": -43.710975646972656, "global_step": 342315, "epoch": 2829} {"train_loss": -43.1830940246582, "global_step": 342316, "epoch": 2829} {"train_loss": -43.8358039855957, "global_step": 342317, "epoch": 2829} {"train_loss": -42.66032409667969, "global_step": 342318, "epoch": 2829} {"train_loss": -43.96456527709961, "global_step": 342319, "epoch": 2829} {"train_loss": -43.236202239990234, "global_step": 342320, "epoch": 2829} {"train_loss": -44.47385787963867, "global_step": 342321, "epoch": 2829} {"train_loss": -43.53447341918945, "global_step": 342322, "epoch": 2829} {"train_loss": -43.474422454833984, "global_step": 342323, "epoch": 2829} {"train_loss": -43.99334716796875, "global_step": 342324, "epoch": 2829} {"train_loss": -43.93095779418945, "global_step": 342325, "epoch": 2829} {"train_loss": -43.369625091552734, "global_step": 342326, "epoch": 2829} {"train_loss": -44.65934753417969, "global_step": 342327, "epoch": 2829} {"train_loss": -43.53217697143555, "global_step": 342328, "epoch": 2829} {"train_loss": -44.46084213256836, "global_step": 342329, "epoch": 2829} {"train_loss": -43.650917053222656, "global_step": 342330, "epoch": 2829} {"train_loss": -44.55198287963867, "global_step": 342331, "epoch": 2829} {"train_loss": -44.31435012817383, "global_step": 342332, "epoch": 2829} {"train_loss": -44.694252014160156, "global_step": 342333, "epoch": 2829} {"train_loss": -44.27762222290039, "global_step": 342334, "epoch": 2829} {"train_loss": -44.50143051147461, "global_step": 342335, "epoch": 2829} {"train_loss": -43.94422149658203, "global_step": 342336, "epoch": 2829} {"train_loss": -45.31776809692383, "global_step": 342337, "epoch": 2829} {"train_loss": -44.065826416015625, "global_step": 342338, "epoch": 2829} {"train_loss": -44.9190788269043, "global_step": 342339, "epoch": 2829} {"train_loss": -44.29246139526367, "global_step": 342340, "epoch": 2829} {"train_loss": -44.95051956176758, "global_step": 342341, "epoch": 2829} {"train_loss": -44.33987045288086, "global_step": 342342, "epoch": 2829} {"train_loss": -44.51595687866211, "global_step": 342343, "epoch": 2829} {"train_loss": -44.379150390625, "global_step": 342344, "epoch": 2829} {"train_loss": -44.76262283325195, "global_step": 342345, "epoch": 2829} {"train_loss": -45.27435302734375, "global_step": 342346, "epoch": 2829} {"train_loss": -45.30475997924805, "global_step": 342347, "epoch": 2829} {"train_loss": -45.018253326416016, "global_step": 342348, "epoch": 2829} {"train_loss": -44.82849884033203, "global_step": 342349, "epoch": 2829} {"train_loss": -44.86878204345703, "global_step": 342350, "epoch": 2829} {"train_loss": -44.19352340698242, "global_step": 342351, "epoch": 2829} {"train_loss": -45.06092071533203, "global_step": 342352, "epoch": 2829} {"train_loss": -44.89035415649414, "global_step": 342353, "epoch": 2829} {"train_loss": -44.94755172729492, "global_step": 342354, "epoch": 2829} {"train_loss": -44.6526985168457, "global_step": 342355, "epoch": 2829} {"train_loss": -44.776954650878906, "global_step": 342356, "epoch": 2829} {"train_loss": -45.12242889404297, "global_step": 342357, "epoch": 2829} {"train_loss": -44.33918380737305, "global_step": 342358, "epoch": 2829} {"train_loss": -44.23371124267578, "global_step": 342359, "epoch": 2829} {"train_loss": -44.37700271606445, "global_step": 342360, "epoch": 2829} {"train_loss": -44.98441696166992, "global_step": 342361, "epoch": 2829} {"train_loss": -44.548667907714844, "global_step": 342362, "epoch": 2829} {"train_loss": -45.02578353881836, "global_step": 342363, "epoch": 2829} {"train_loss": -44.97898483276367, "global_step": 342364, "epoch": 2829} {"train_loss": -45.2867431640625, "global_step": 342365, "epoch": 2829} {"train_loss": -44.714481353759766, "global_step": 342366, "epoch": 2829} {"train_loss": -44.90694808959961, "global_step": 342367, "epoch": 2829} {"train_loss": -44.83358383178711, "global_step": 342368, "epoch": 2829} {"train_loss": -45.8128547668457, "global_step": 342369, "epoch": 2829} {"train_loss": -44.60832977294922, "global_step": 342370, "epoch": 2829} {"train_loss": -44.71759033203125, "global_step": 342371, "epoch": 2829} {"train_loss": -45.270633697509766, "global_step": 342372, "epoch": 2829} {"train_loss": -45.1651725769043, "global_step": 342373, "epoch": 2829} {"train_loss": -43.930110931396484, "global_step": 342374, "epoch": 2829} {"train_loss": -42.92283248901367, "global_step": 342375, "epoch": 2829} {"train_loss": -45.3498420715332, "global_step": 342376, "epoch": 2829} {"train_loss": -44.520423889160156, "global_step": 342377, "epoch": 2829} {"train_loss": -42.312068939208984, "global_step": 342378, "epoch": 2829} {"train_loss": -43.9725341796875, "global_step": 342379, "epoch": 2829} {"train_loss": -45.047115325927734, "global_step": 342380, "epoch": 2829} {"train_loss": -44.192176818847656, "global_step": 342381, "epoch": 2829} {"train_loss": -44.185977935791016, "global_step": 342382, "epoch": 2829} {"train_loss": -44.84333801269531, "global_step": 342383, "epoch": 2829} {"train_loss": -44.47829818725586, "global_step": 342384, "epoch": 2829} {"train_loss": -44.7783203125, "global_step": 342385, "epoch": 2829} {"train_loss": -44.064178466796875, "global_step": 342386, "epoch": 2829} {"train_loss": -44.944129943847656, "global_step": 342387, "epoch": 2829} {"train_loss": -43.62771224975586, "global_step": 342388, "epoch": 2829} {"train_loss": -44.60905075073242, "global_step": 342389, "epoch": 2829} {"train_loss": -43.052818298339844, "global_step": 342390, "epoch": 2829} {"train_loss": -43.17011260986328, "global_step": 342391, "epoch": 2829} {"train_loss": -43.357994079589844, "global_step": 342392, "epoch": 2829} {"train_loss": -42.570980072021484, "global_step": 342393, "epoch": 2829} {"train_loss": -43.536922454833984, "global_step": 342394, "epoch": 2829} {"train_loss": -43.1430778503418, "global_step": 342395, "epoch": 2829} {"train_loss": -44.23200225830078, "global_step": 342396, "epoch": 2829} {"train_loss": -43.39779281616211, "global_step": 342397, "epoch": 2829} {"train_loss": -43.172462463378906, "global_step": 342398, "epoch": 2829} {"train_loss": -43.71692657470703, "global_step": 342399, "epoch": 2829} {"train_loss": -43.126930236816406, "global_step": 342400, "epoch": 2829} {"train_loss": -43.41677474975586, "global_step": 342401, "epoch": 2829} {"train_loss": -43.0308723449707, "global_step": 342402, "epoch": 2829} {"train_loss": -42.886348724365234, "global_step": 342403, "epoch": 2829} {"train_loss": -43.30363464355469, "global_step": 342404, "epoch": 2829} {"train_loss": -44.90040969848633, "global_step": 342405, "epoch": 2829} {"train_loss": -43.395294189453125, "global_step": 342406, "epoch": 2829} {"train_loss": -44.63009262084961, "global_step": 342407, "epoch": 2829} {"train_loss": -43.82916259765625, "global_step": 342408, "epoch": 2829} {"train_loss": -44.32574462890625, "global_step": 342409, "epoch": 2829} {"train_loss": -43.522071838378906, "global_step": 342410, "epoch": 2829} {"train_loss": -44.6591682434082, "global_step": 342411, "epoch": 2829} {"train_loss": -44.31267166137695, "global_step": 342412, "epoch": 2829} {"train_loss": -44.2944221496582, "global_step": 342413, "epoch": 2829} {"train_loss": -43.731319427490234, "global_step": 342414, "epoch": 2829} {"train_loss": -44.22161102294922, "global_step": 342415, "epoch": 2829} {"train_loss": -44.460391998291016, "global_step": 342416, "epoch": 2829} {"train_loss": -44.71828079223633, "global_step": 342417, "epoch": 2829} {"train_loss": -44.68795394897461, "global_step": 342418, "epoch": 2829} {"train_loss": -44.683258056640625, "global_step": 342419, "epoch": 2829} {"train_loss": -44.5594482421875, "global_step": 342420, "epoch": 2829} {"train_loss": -43.92547607421875, "global_step": 342421, "epoch": 2829} {"train_loss": -45.07514572143555, "global_step": 342422, "epoch": 2829} {"train_loss": -44.46614074707031, "global_step": 342423, "epoch": 2829} {"train_loss": -44.853790283203125, "global_step": 342424, "epoch": 2829} {"train_loss": -44.79690170288086, "global_step": 342425, "epoch": 2829} {"train_loss": -45.19955062866211, "global_step": 342426, "epoch": 2829} {"train_loss": -44.370155334472656, "global_step": 342427, "epoch": 2829} {"train_loss": -44.8536376953125, "global_step": 342428, "epoch": 2829} {"train_loss": -44.22048789410552, "global_step": 342429, "epoch": 2829, "val_loss": 2689587.0} {"train_loss": -43.589412689208984, "global_step": 342430, "epoch": 2830} {"train_loss": -44.535499572753906, "global_step": 342431, "epoch": 2830} {"train_loss": -44.67306137084961, "global_step": 342432, "epoch": 2830} {"train_loss": -43.745933532714844, "global_step": 342433, "epoch": 2830} {"train_loss": -44.33167266845703, "global_step": 342434, "epoch": 2830} {"train_loss": -43.669376373291016, "global_step": 342435, "epoch": 2830} {"train_loss": -44.36417770385742, "global_step": 342436, "epoch": 2830} {"train_loss": -44.05194091796875, "global_step": 342437, "epoch": 2830} {"train_loss": -44.25696563720703, "global_step": 342438, "epoch": 2830} {"train_loss": -44.14346694946289, "global_step": 342439, "epoch": 2830} {"train_loss": -43.1932373046875, "global_step": 342440, "epoch": 2830} {"train_loss": -43.34861373901367, "global_step": 342441, "epoch": 2830} {"train_loss": -44.213680267333984, "global_step": 342442, "epoch": 2830} {"train_loss": -42.804542541503906, "global_step": 342443, "epoch": 2830} {"train_loss": -44.554386138916016, "global_step": 342444, "epoch": 2830} {"train_loss": -43.263370513916016, "global_step": 342445, "epoch": 2830} {"train_loss": -43.575531005859375, "global_step": 342446, "epoch": 2830} {"train_loss": -44.39455795288086, "global_step": 342447, "epoch": 2830} {"train_loss": -43.75502395629883, "global_step": 342448, "epoch": 2830} {"train_loss": -44.15888595581055, "global_step": 342449, "epoch": 2830} {"train_loss": -44.46917724609375, "global_step": 342450, "epoch": 2830} {"train_loss": -43.876548767089844, "global_step": 342451, "epoch": 2830} {"train_loss": -44.1106071472168, "global_step": 342452, "epoch": 2830} {"train_loss": -44.48555374145508, "global_step": 342453, "epoch": 2830} {"train_loss": -44.86136245727539, "global_step": 342454, "epoch": 2830} {"train_loss": -44.75851058959961, "global_step": 342455, "epoch": 2830} {"train_loss": -44.90510177612305, "global_step": 342456, "epoch": 2830} {"train_loss": -44.66672897338867, "global_step": 342457, "epoch": 2830} {"train_loss": -45.2750129699707, "global_step": 342458, "epoch": 2830} {"train_loss": -44.6715087890625, "global_step": 342459, "epoch": 2830} {"train_loss": -45.14434051513672, "global_step": 342460, "epoch": 2830} {"train_loss": -44.868804931640625, "global_step": 342461, "epoch": 2830} {"train_loss": -44.635108947753906, "global_step": 342462, "epoch": 2830} {"train_loss": -44.65623092651367, "global_step": 342463, "epoch": 2830} {"train_loss": -45.42584228515625, "global_step": 342464, "epoch": 2830} {"train_loss": -45.553829193115234, "global_step": 342465, "epoch": 2830} {"train_loss": -44.830135345458984, "global_step": 342466, "epoch": 2830} {"train_loss": -45.39506149291992, "global_step": 342467, "epoch": 2830} {"train_loss": -45.417877197265625, "global_step": 342468, "epoch": 2830} {"train_loss": -44.727291107177734, "global_step": 342469, "epoch": 2830} {"train_loss": -45.39276123046875, "global_step": 342470, "epoch": 2830} {"train_loss": -45.35761260986328, "global_step": 342471, "epoch": 2830} {"train_loss": -45.0087776184082, "global_step": 342472, "epoch": 2830} {"train_loss": -45.066036224365234, "global_step": 342473, "epoch": 2830} {"train_loss": -44.97990417480469, "global_step": 342474, "epoch": 2830} {"train_loss": -44.54643630981445, "global_step": 342475, "epoch": 2830} {"train_loss": -44.09343338012695, "global_step": 342476, "epoch": 2830} {"train_loss": -44.96832275390625, "global_step": 342477, "epoch": 2830} {"train_loss": -44.426971435546875, "global_step": 342478, "epoch": 2830} {"train_loss": -44.43867874145508, "global_step": 342479, "epoch": 2830} {"train_loss": -44.066925048828125, "global_step": 342480, "epoch": 2830} {"train_loss": -43.3599967956543, "global_step": 342481, "epoch": 2830} {"train_loss": -45.06325149536133, "global_step": 342482, "epoch": 2830} {"train_loss": -44.43733215332031, "global_step": 342483, "epoch": 2830} {"train_loss": -44.89885330200195, "global_step": 342484, "epoch": 2830} {"train_loss": -44.76722717285156, "global_step": 342485, "epoch": 2830} {"train_loss": -44.37128829956055, "global_step": 342486, "epoch": 2830} {"train_loss": -43.092315673828125, "global_step": 342487, "epoch": 2830} {"train_loss": -43.92019271850586, "global_step": 342488, "epoch": 2830} {"train_loss": -44.08384704589844, "global_step": 342489, "epoch": 2830} {"train_loss": -43.13853073120117, "global_step": 342490, "epoch": 2830} {"train_loss": -41.93308639526367, "global_step": 342491, "epoch": 2830} {"train_loss": -42.99654769897461, "global_step": 342492, "epoch": 2830} {"train_loss": -42.62553024291992, "global_step": 342493, "epoch": 2830} {"train_loss": -40.91753005981445, "global_step": 342494, "epoch": 2830} {"train_loss": -44.6419792175293, "global_step": 342495, "epoch": 2830} {"train_loss": -41.683345794677734, "global_step": 342496, "epoch": 2830} {"train_loss": -42.449546813964844, "global_step": 342497, "epoch": 2830} {"train_loss": -43.547725677490234, "global_step": 342498, "epoch": 2830} {"train_loss": -42.710662841796875, "global_step": 342499, "epoch": 2830} {"train_loss": -43.3586311340332, "global_step": 342500, "epoch": 2830} {"train_loss": -43.8482666015625, "global_step": 342501, "epoch": 2830} {"train_loss": -43.82725524902344, "global_step": 342502, "epoch": 2830} {"train_loss": -41.58732604980469, "global_step": 342503, "epoch": 2830} {"train_loss": -44.10107421875, "global_step": 342504, "epoch": 2830} {"train_loss": -43.89999771118164, "global_step": 342505, "epoch": 2830} {"train_loss": -43.937103271484375, "global_step": 342506, "epoch": 2830} {"train_loss": -44.15346908569336, "global_step": 342507, "epoch": 2830} {"train_loss": -43.95419692993164, "global_step": 342508, "epoch": 2830} {"train_loss": -43.881591796875, "global_step": 342509, "epoch": 2830} {"train_loss": -43.889068603515625, "global_step": 342510, "epoch": 2830} {"train_loss": -43.300079345703125, "global_step": 342511, "epoch": 2830} {"train_loss": -43.601654052734375, "global_step": 342512, "epoch": 2830} {"train_loss": -44.331600189208984, "global_step": 342513, "epoch": 2830} {"train_loss": -44.05945587158203, "global_step": 342514, "epoch": 2830} {"train_loss": -43.5193977355957, "global_step": 342515, "epoch": 2830} {"train_loss": -44.21381759643555, "global_step": 342516, "epoch": 2830} {"train_loss": -44.91192626953125, "global_step": 342517, "epoch": 2830} {"train_loss": -43.470088958740234, "global_step": 342518, "epoch": 2830} {"train_loss": -44.842498779296875, "global_step": 342519, "epoch": 2830} {"train_loss": -44.47772979736328, "global_step": 342520, "epoch": 2830} {"train_loss": -43.95332336425781, "global_step": 342521, "epoch": 2830} {"train_loss": -45.125606536865234, "global_step": 342522, "epoch": 2830} {"train_loss": -44.87617111206055, "global_step": 342523, "epoch": 2830} {"train_loss": -43.944515228271484, "global_step": 342524, "epoch": 2830} {"train_loss": -45.11225128173828, "global_step": 342525, "epoch": 2830} {"train_loss": -44.11684799194336, "global_step": 342526, "epoch": 2830} {"train_loss": -44.3657112121582, "global_step": 342527, "epoch": 2830} {"train_loss": -44.7918815612793, "global_step": 342528, "epoch": 2830} {"train_loss": -44.119956970214844, "global_step": 342529, "epoch": 2830} {"train_loss": -44.3851318359375, "global_step": 342530, "epoch": 2830} {"train_loss": -44.84759521484375, "global_step": 342531, "epoch": 2830} {"train_loss": -44.63943099975586, "global_step": 342532, "epoch": 2830} {"train_loss": -45.177452087402344, "global_step": 342533, "epoch": 2830} {"train_loss": -44.62998962402344, "global_step": 342534, "epoch": 2830} {"train_loss": -44.90398406982422, "global_step": 342535, "epoch": 2830} {"train_loss": -44.76839828491211, "global_step": 342536, "epoch": 2830} {"train_loss": -45.00419998168945, "global_step": 342537, "epoch": 2830} {"train_loss": -45.01357650756836, "global_step": 342538, "epoch": 2830} {"train_loss": -44.102783203125, "global_step": 342539, "epoch": 2830} {"train_loss": -44.731109619140625, "global_step": 342540, "epoch": 2830} {"train_loss": -45.038818359375, "global_step": 342541, "epoch": 2830} {"train_loss": -45.186187744140625, "global_step": 342542, "epoch": 2830} {"train_loss": -45.00272750854492, "global_step": 342543, "epoch": 2830} {"train_loss": -45.16044235229492, "global_step": 342544, "epoch": 2830} {"train_loss": -45.589962005615234, "global_step": 342545, "epoch": 2830} {"train_loss": -45.24250030517578, "global_step": 342546, "epoch": 2830} {"train_loss": -45.387908935546875, "global_step": 342547, "epoch": 2830} {"train_loss": -45.61058807373047, "global_step": 342548, "epoch": 2830} {"train_loss": -45.62107467651367, "global_step": 342549, "epoch": 2830} {"train_loss": -44.28766099283518, "global_step": 342550, "epoch": 2830, "val_loss": 2667107.75} {"train_loss": -44.2341194152832, "global_step": 342551, "epoch": 2831} {"train_loss": -44.15519332885742, "global_step": 342552, "epoch": 2831} {"train_loss": -44.645301818847656, "global_step": 342553, "epoch": 2831} {"train_loss": -44.996726989746094, "global_step": 342554, "epoch": 2831} {"train_loss": -45.38076400756836, "global_step": 342555, "epoch": 2831} {"train_loss": -45.4901237487793, "global_step": 342556, "epoch": 2831} {"train_loss": -45.328590393066406, "global_step": 342557, "epoch": 2831} {"train_loss": -44.87038040161133, "global_step": 342558, "epoch": 2831} {"train_loss": -43.53541564941406, "global_step": 342559, "epoch": 2831} {"train_loss": -45.362300872802734, "global_step": 342560, "epoch": 2831} {"train_loss": -45.15035629272461, "global_step": 342561, "epoch": 2831} {"train_loss": -44.937347412109375, "global_step": 342562, "epoch": 2831} {"train_loss": -44.71273422241211, "global_step": 342563, "epoch": 2831} {"train_loss": -45.00141906738281, "global_step": 342564, "epoch": 2831} {"train_loss": -45.17409133911133, "global_step": 342565, "epoch": 2831} {"train_loss": -44.453033447265625, "global_step": 342566, "epoch": 2831} {"train_loss": -44.20783615112305, "global_step": 342567, "epoch": 2831} {"train_loss": -45.06740951538086, "global_step": 342568, "epoch": 2831} {"train_loss": -44.72719192504883, "global_step": 342569, "epoch": 2831} {"train_loss": -43.620967864990234, "global_step": 342570, "epoch": 2831} {"train_loss": -45.45113754272461, "global_step": 342571, "epoch": 2831} {"train_loss": -45.30432891845703, "global_step": 342572, "epoch": 2831} {"train_loss": -44.604061126708984, "global_step": 342573, "epoch": 2831} {"train_loss": -44.16600799560547, "global_step": 342574, "epoch": 2831} {"train_loss": -43.988311767578125, "global_step": 342575, "epoch": 2831} {"train_loss": -44.39528274536133, "global_step": 342576, "epoch": 2831} {"train_loss": -44.353485107421875, "global_step": 342577, "epoch": 2831} {"train_loss": -44.71290969848633, "global_step": 342578, "epoch": 2831} {"train_loss": -45.23276901245117, "global_step": 342579, "epoch": 2831} {"train_loss": -44.495662689208984, "global_step": 342580, "epoch": 2831} {"train_loss": -44.72516632080078, "global_step": 342581, "epoch": 2831} {"train_loss": -43.87111282348633, "global_step": 342582, "epoch": 2831} {"train_loss": -44.3961067199707, "global_step": 342583, "epoch": 2831} {"train_loss": -44.616737365722656, "global_step": 342584, "epoch": 2831} {"train_loss": -43.8818473815918, "global_step": 342585, "epoch": 2831} {"train_loss": -44.70831298828125, "global_step": 342586, "epoch": 2831} {"train_loss": -43.957584381103516, "global_step": 342587, "epoch": 2831} {"train_loss": -42.98888397216797, "global_step": 342588, "epoch": 2831} {"train_loss": -43.788291931152344, "global_step": 342589, "epoch": 2831} {"train_loss": -44.2513542175293, "global_step": 342590, "epoch": 2831} {"train_loss": -43.40185546875, "global_step": 342591, "epoch": 2831} {"train_loss": -43.898284912109375, "global_step": 342592, "epoch": 2831} {"train_loss": -43.45366287231445, "global_step": 342593, "epoch": 2831} {"train_loss": -41.60396194458008, "global_step": 342594, "epoch": 2831} {"train_loss": -44.62361145019531, "global_step": 342595, "epoch": 2831} {"train_loss": -41.30118179321289, "global_step": 342596, "epoch": 2831} {"train_loss": -44.462196350097656, "global_step": 342597, "epoch": 2831} {"train_loss": -42.767120361328125, "global_step": 342598, "epoch": 2831} {"train_loss": -42.40421676635742, "global_step": 342599, "epoch": 2831} {"train_loss": -42.63711166381836, "global_step": 342600, "epoch": 2831} {"train_loss": -43.73007583618164, "global_step": 342601, "epoch": 2831} {"train_loss": -44.13941192626953, "global_step": 342602, "epoch": 2831} {"train_loss": -43.39757537841797, "global_step": 342603, "epoch": 2831} {"train_loss": -44.650909423828125, "global_step": 342604, "epoch": 2831} {"train_loss": -43.19274139404297, "global_step": 342605, "epoch": 2831} {"train_loss": -43.869991302490234, "global_step": 342606, "epoch": 2831} {"train_loss": -42.627750396728516, "global_step": 342607, "epoch": 2831} {"train_loss": -44.13496398925781, "global_step": 342608, "epoch": 2831} {"train_loss": -42.87211990356445, "global_step": 342609, "epoch": 2831} {"train_loss": -43.2874755859375, "global_step": 342610, "epoch": 2831} {"train_loss": -43.19766616821289, "global_step": 342611, "epoch": 2831} {"train_loss": -43.4586296081543, "global_step": 342612, "epoch": 2831} {"train_loss": -44.038509368896484, "global_step": 342613, "epoch": 2831} {"train_loss": -40.86396408081055, "global_step": 342614, "epoch": 2831} {"train_loss": -43.765254974365234, "global_step": 342615, "epoch": 2831} {"train_loss": -43.61130905151367, "global_step": 342616, "epoch": 2831} {"train_loss": -42.17629623413086, "global_step": 342617, "epoch": 2831} {"train_loss": -42.53778076171875, "global_step": 342618, "epoch": 2831} {"train_loss": -44.13187789916992, "global_step": 342619, "epoch": 2831} {"train_loss": -43.39697265625, "global_step": 342620, "epoch": 2831} {"train_loss": -43.05278396606445, "global_step": 342621, "epoch": 2831} {"train_loss": -44.6334342956543, "global_step": 342622, "epoch": 2831} {"train_loss": -42.65633010864258, "global_step": 342623, "epoch": 2831} {"train_loss": -43.618080139160156, "global_step": 342624, "epoch": 2831} {"train_loss": -44.36695098876953, "global_step": 342625, "epoch": 2831} {"train_loss": -42.017791748046875, "global_step": 342626, "epoch": 2831} {"train_loss": -44.60958480834961, "global_step": 342627, "epoch": 2831} {"train_loss": -43.30813217163086, "global_step": 342628, "epoch": 2831} {"train_loss": -43.986637115478516, "global_step": 342629, "epoch": 2831} {"train_loss": -43.67030715942383, "global_step": 342630, "epoch": 2831} {"train_loss": -43.134830474853516, "global_step": 342631, "epoch": 2831} {"train_loss": -43.96204376220703, "global_step": 342632, "epoch": 2831} {"train_loss": -43.7518424987793, "global_step": 342633, "epoch": 2831} {"train_loss": -42.62104415893555, "global_step": 342634, "epoch": 2831} {"train_loss": -44.57380676269531, "global_step": 342635, "epoch": 2831} {"train_loss": -42.82400131225586, "global_step": 342636, "epoch": 2831} {"train_loss": -44.546077728271484, "global_step": 342637, "epoch": 2831} {"train_loss": -44.44963455200195, "global_step": 342638, "epoch": 2831} {"train_loss": -42.00377655029297, "global_step": 342639, "epoch": 2831} {"train_loss": -44.792076110839844, "global_step": 342640, "epoch": 2831} {"train_loss": -44.23312759399414, "global_step": 342641, "epoch": 2831} {"train_loss": -44.84865951538086, "global_step": 342642, "epoch": 2831} {"train_loss": -44.562374114990234, "global_step": 342643, "epoch": 2831} {"train_loss": -44.99160385131836, "global_step": 342644, "epoch": 2831} {"train_loss": -43.48430252075195, "global_step": 342645, "epoch": 2831} {"train_loss": -43.694339752197266, "global_step": 342646, "epoch": 2831} {"train_loss": -44.582340240478516, "global_step": 342647, "epoch": 2831} {"train_loss": -44.54487228393555, "global_step": 342648, "epoch": 2831} {"train_loss": -44.80598068237305, "global_step": 342649, "epoch": 2831} {"train_loss": -45.418949127197266, "global_step": 342650, "epoch": 2831} {"train_loss": -45.02920913696289, "global_step": 342651, "epoch": 2831} {"train_loss": -44.37895584106445, "global_step": 342652, "epoch": 2831} {"train_loss": -45.19903564453125, "global_step": 342653, "epoch": 2831} {"train_loss": -44.74484634399414, "global_step": 342654, "epoch": 2831} {"train_loss": -44.778907775878906, "global_step": 342655, "epoch": 2831} {"train_loss": -45.06673812866211, "global_step": 342656, "epoch": 2831} {"train_loss": -43.4157829284668, "global_step": 342657, "epoch": 2831} {"train_loss": -45.149070739746094, "global_step": 342658, "epoch": 2831} {"train_loss": -44.555946350097656, "global_step": 342659, "epoch": 2831} {"train_loss": -44.522682189941406, "global_step": 342660, "epoch": 2831} {"train_loss": -44.99171447753906, "global_step": 342661, "epoch": 2831} {"train_loss": -44.5222282409668, "global_step": 342662, "epoch": 2831} {"train_loss": -44.70516586303711, "global_step": 342663, "epoch": 2831} {"train_loss": -44.08034896850586, "global_step": 342664, "epoch": 2831} {"train_loss": -45.01619338989258, "global_step": 342665, "epoch": 2831} {"train_loss": -44.97063446044922, "global_step": 342666, "epoch": 2831} {"train_loss": -43.33549118041992, "global_step": 342667, "epoch": 2831} {"train_loss": -44.83906173706055, "global_step": 342668, "epoch": 2831} {"train_loss": -45.17660903930664, "global_step": 342669, "epoch": 2831} {"train_loss": -44.172508239746094, "global_step": 342670, "epoch": 2831} {"train_loss": -44.100856308109506, "global_step": 342671, "epoch": 2831, "val_loss": 2604797.25} {"train_loss": -44.03510665893555, "global_step": 342672, "epoch": 2832} {"train_loss": -44.42510986328125, "global_step": 342673, "epoch": 2832} {"train_loss": -44.81254577636719, "global_step": 342674, "epoch": 2832} {"train_loss": -44.89594650268555, "global_step": 342675, "epoch": 2832} {"train_loss": -44.414154052734375, "global_step": 342676, "epoch": 2832} {"train_loss": -44.83028030395508, "global_step": 342677, "epoch": 2832} {"train_loss": -44.82401657104492, "global_step": 342678, "epoch": 2832} {"train_loss": -45.01110076904297, "global_step": 342679, "epoch": 2832} {"train_loss": -45.37970733642578, "global_step": 342680, "epoch": 2832} {"train_loss": -45.49001693725586, "global_step": 342681, "epoch": 2832} {"train_loss": -45.5728645324707, "global_step": 342682, "epoch": 2832} {"train_loss": -45.06226348876953, "global_step": 342683, "epoch": 2832} {"train_loss": -45.36477279663086, "global_step": 342684, "epoch": 2832} {"train_loss": -45.32478713989258, "global_step": 342685, "epoch": 2832} {"train_loss": -45.79679870605469, "global_step": 342686, "epoch": 2832} {"train_loss": -45.43430709838867, "global_step": 342687, "epoch": 2832} {"train_loss": -45.49406814575195, "global_step": 342688, "epoch": 2832} {"train_loss": -44.641090393066406, "global_step": 342689, "epoch": 2832} {"train_loss": -44.91413116455078, "global_step": 342690, "epoch": 2832} {"train_loss": -45.41667938232422, "global_step": 342691, "epoch": 2832} {"train_loss": -45.337860107421875, "global_step": 342692, "epoch": 2832} {"train_loss": -45.88761520385742, "global_step": 342693, "epoch": 2832} {"train_loss": -45.445796966552734, "global_step": 342694, "epoch": 2832} {"train_loss": -45.53611373901367, "global_step": 342695, "epoch": 2832} {"train_loss": -45.25182342529297, "global_step": 342696, "epoch": 2832} {"train_loss": -45.74993896484375, "global_step": 342697, "epoch": 2832} {"train_loss": -45.105506896972656, "global_step": 342698, "epoch": 2832} {"train_loss": -45.24178695678711, "global_step": 342699, "epoch": 2832} {"train_loss": -44.014198303222656, "global_step": 342700, "epoch": 2832} {"train_loss": -44.82734298706055, "global_step": 342701, "epoch": 2832} {"train_loss": -43.707881927490234, "global_step": 342702, "epoch": 2832} {"train_loss": -43.23439407348633, "global_step": 342703, "epoch": 2832} {"train_loss": -42.8062858581543, "global_step": 342704, "epoch": 2832} {"train_loss": -39.74101638793945, "global_step": 342705, "epoch": 2832} {"train_loss": -42.00492477416992, "global_step": 342706, "epoch": 2832} {"train_loss": -37.4061164855957, "global_step": 342707, "epoch": 2832} {"train_loss": -38.637943267822266, "global_step": 342708, "epoch": 2832} {"train_loss": -38.10538864135742, "global_step": 342709, "epoch": 2832} {"train_loss": -36.59440994262695, "global_step": 342710, "epoch": 2832} {"train_loss": -37.8876838684082, "global_step": 342711, "epoch": 2832} {"train_loss": -37.592220306396484, "global_step": 342712, "epoch": 2832} {"train_loss": -38.37897491455078, "global_step": 342713, "epoch": 2832} {"train_loss": -39.82941818237305, "global_step": 342714, "epoch": 2832} {"train_loss": -38.42525100708008, "global_step": 342715, "epoch": 2832} {"train_loss": -39.93290328979492, "global_step": 342716, "epoch": 2832} {"train_loss": -39.87540054321289, "global_step": 342717, "epoch": 2832} {"train_loss": -40.051971435546875, "global_step": 342718, "epoch": 2832} {"train_loss": -39.76918411254883, "global_step": 342719, "epoch": 2832} {"train_loss": -40.18840408325195, "global_step": 342720, "epoch": 2832} {"train_loss": -41.21290969848633, "global_step": 342721, "epoch": 2832} {"train_loss": -41.0281867980957, "global_step": 342722, "epoch": 2832} {"train_loss": -42.09606170654297, "global_step": 342723, "epoch": 2832} {"train_loss": -41.44001770019531, "global_step": 342724, "epoch": 2832} {"train_loss": -43.02804946899414, "global_step": 342725, "epoch": 2832} {"train_loss": -41.45941925048828, "global_step": 342726, "epoch": 2832} {"train_loss": -42.819393157958984, "global_step": 342727, "epoch": 2832} {"train_loss": -40.293434143066406, "global_step": 342728, "epoch": 2832} {"train_loss": -40.51997375488281, "global_step": 342729, "epoch": 2832} {"train_loss": -42.89168167114258, "global_step": 342730, "epoch": 2832} {"train_loss": -42.69839096069336, "global_step": 342731, "epoch": 2832} {"train_loss": -38.03377914428711, "global_step": 342732, "epoch": 2832} {"train_loss": -43.904693603515625, "global_step": 342733, "epoch": 2832} {"train_loss": -43.41824722290039, "global_step": 342734, "epoch": 2832} {"train_loss": -43.152156829833984, "global_step": 342735, "epoch": 2832} {"train_loss": -43.904541015625, "global_step": 342736, "epoch": 2832} {"train_loss": -44.17656326293945, "global_step": 342737, "epoch": 2832} {"train_loss": -43.69919967651367, "global_step": 342738, "epoch": 2832} {"train_loss": -43.561492919921875, "global_step": 342739, "epoch": 2832} {"train_loss": -44.40436553955078, "global_step": 342740, "epoch": 2832} {"train_loss": -43.340423583984375, "global_step": 342741, "epoch": 2832} {"train_loss": -43.53676223754883, "global_step": 342742, "epoch": 2832} {"train_loss": -43.399940490722656, "global_step": 342743, "epoch": 2832} {"train_loss": -43.50221252441406, "global_step": 342744, "epoch": 2832} {"train_loss": -44.34592819213867, "global_step": 342745, "epoch": 2832} {"train_loss": -43.97092056274414, "global_step": 342746, "epoch": 2832} {"train_loss": -43.5787467956543, "global_step": 342747, "epoch": 2832} {"train_loss": -44.85915756225586, "global_step": 342748, "epoch": 2832} {"train_loss": -44.242637634277344, "global_step": 342749, "epoch": 2832} {"train_loss": -44.5207633972168, "global_step": 342750, "epoch": 2832} {"train_loss": -44.70670700073242, "global_step": 342751, "epoch": 2832} {"train_loss": -44.476158142089844, "global_step": 342752, "epoch": 2832} {"train_loss": -43.730079650878906, "global_step": 342753, "epoch": 2832} {"train_loss": -37.06489944458008, "global_step": 342754, "epoch": 2832} {"train_loss": -43.6670036315918, "global_step": 342755, "epoch": 2832} {"train_loss": -43.87006378173828, "global_step": 342756, "epoch": 2832} {"train_loss": -44.50489044189453, "global_step": 342757, "epoch": 2832} {"train_loss": -43.415767669677734, "global_step": 342758, "epoch": 2832} {"train_loss": -42.14398956298828, "global_step": 342759, "epoch": 2832} {"train_loss": -40.17965316772461, "global_step": 342760, "epoch": 2832} {"train_loss": -43.657901763916016, "global_step": 342761, "epoch": 2832} {"train_loss": -44.39021682739258, "global_step": 342762, "epoch": 2832} {"train_loss": -43.65926742553711, "global_step": 342763, "epoch": 2832} {"train_loss": -43.7014274597168, "global_step": 342764, "epoch": 2832} {"train_loss": -44.49306106567383, "global_step": 342765, "epoch": 2832} {"train_loss": -43.10073471069336, "global_step": 342766, "epoch": 2832} {"train_loss": -44.80356979370117, "global_step": 342767, "epoch": 2832} {"train_loss": -44.13637924194336, "global_step": 342768, "epoch": 2832} {"train_loss": -39.52767562866211, "global_step": 342769, "epoch": 2832} {"train_loss": -44.30511474609375, "global_step": 342770, "epoch": 2832} {"train_loss": -41.87990951538086, "global_step": 342771, "epoch": 2832} {"train_loss": -42.89616012573242, "global_step": 342772, "epoch": 2832} {"train_loss": -44.1240119934082, "global_step": 342773, "epoch": 2832} {"train_loss": -44.25939178466797, "global_step": 342774, "epoch": 2832} {"train_loss": -44.16373062133789, "global_step": 342775, "epoch": 2832} {"train_loss": -43.549556732177734, "global_step": 342776, "epoch": 2832} {"train_loss": -44.54054641723633, "global_step": 342777, "epoch": 2832} {"train_loss": -44.2961311340332, "global_step": 342778, "epoch": 2832} {"train_loss": -42.85750961303711, "global_step": 342779, "epoch": 2832} {"train_loss": -44.53647994995117, "global_step": 342780, "epoch": 2832} {"train_loss": -43.6912956237793, "global_step": 342781, "epoch": 2832} {"train_loss": -43.939510345458984, "global_step": 342782, "epoch": 2832} {"train_loss": -43.70377731323242, "global_step": 342783, "epoch": 2832} {"train_loss": -44.73115158081055, "global_step": 342784, "epoch": 2832} {"train_loss": -44.51435470581055, "global_step": 342785, "epoch": 2832} {"train_loss": -42.96751022338867, "global_step": 342786, "epoch": 2832} {"train_loss": -44.13613510131836, "global_step": 342787, "epoch": 2832} {"train_loss": -44.90751266479492, "global_step": 342788, "epoch": 2832} {"train_loss": -44.574031829833984, "global_step": 342789, "epoch": 2832} {"train_loss": -44.644264221191406, "global_step": 342790, "epoch": 2832} {"train_loss": -43.529205322265625, "global_step": 342791, "epoch": 2832} {"train_loss": -43.181752796015466, "global_step": 342792, "epoch": 2832, "val_loss": 2915502.75} {"train_loss": -44.811424255371094, "global_step": 342793, "epoch": 2833} {"train_loss": -45.144325256347656, "global_step": 342794, "epoch": 2833} {"train_loss": -43.89121627807617, "global_step": 342795, "epoch": 2833} {"train_loss": -44.72420120239258, "global_step": 342796, "epoch": 2833} {"train_loss": -44.37757873535156, "global_step": 342797, "epoch": 2833} {"train_loss": -44.51723098754883, "global_step": 342798, "epoch": 2833} {"train_loss": -43.71139144897461, "global_step": 342799, "epoch": 2833} {"train_loss": -45.42509841918945, "global_step": 342800, "epoch": 2833} {"train_loss": -44.69404983520508, "global_step": 342801, "epoch": 2833} {"train_loss": -44.86829376220703, "global_step": 342802, "epoch": 2833} {"train_loss": -45.18505859375, "global_step": 342803, "epoch": 2833} {"train_loss": -44.85981369018555, "global_step": 342804, "epoch": 2833} {"train_loss": -45.309635162353516, "global_step": 342805, "epoch": 2833} {"train_loss": -44.61452865600586, "global_step": 342806, "epoch": 2833} {"train_loss": -44.562591552734375, "global_step": 342807, "epoch": 2833} {"train_loss": -45.31586837768555, "global_step": 342808, "epoch": 2833} {"train_loss": -45.243038177490234, "global_step": 342809, "epoch": 2833} {"train_loss": -44.83627700805664, "global_step": 342810, "epoch": 2833} {"train_loss": -44.918025970458984, "global_step": 342811, "epoch": 2833} {"train_loss": -44.47003936767578, "global_step": 342812, "epoch": 2833} {"train_loss": -45.12799072265625, "global_step": 342813, "epoch": 2833} {"train_loss": -44.98106002807617, "global_step": 342814, "epoch": 2833} {"train_loss": -44.61836624145508, "global_step": 342815, "epoch": 2833} {"train_loss": -44.88177490234375, "global_step": 342816, "epoch": 2833} {"train_loss": -44.34188461303711, "global_step": 342817, "epoch": 2833} {"train_loss": -44.967655181884766, "global_step": 342818, "epoch": 2833} {"train_loss": -44.87362289428711, "global_step": 342819, "epoch": 2833} {"train_loss": -45.26896286010742, "global_step": 342820, "epoch": 2833} {"train_loss": -45.15242004394531, "global_step": 342821, "epoch": 2833} {"train_loss": -44.312381744384766, "global_step": 342822, "epoch": 2833} {"train_loss": -45.1926383972168, "global_step": 342823, "epoch": 2833} {"train_loss": -44.49836349487305, "global_step": 342824, "epoch": 2833} {"train_loss": -43.74909591674805, "global_step": 342825, "epoch": 2833} {"train_loss": -44.481231689453125, "global_step": 342826, "epoch": 2833} {"train_loss": -44.531673431396484, "global_step": 342827, "epoch": 2833} {"train_loss": -45.04242706298828, "global_step": 342828, "epoch": 2833} {"train_loss": -45.17746353149414, "global_step": 342829, "epoch": 2833} {"train_loss": -44.55025100708008, "global_step": 342830, "epoch": 2833} {"train_loss": -45.512569427490234, "global_step": 342831, "epoch": 2833} {"train_loss": -44.70539474487305, "global_step": 342832, "epoch": 2833} {"train_loss": -44.79883575439453, "global_step": 342833, "epoch": 2833} {"train_loss": -44.24453353881836, "global_step": 342834, "epoch": 2833} {"train_loss": -44.76374053955078, "global_step": 342835, "epoch": 2833} {"train_loss": -42.93592071533203, "global_step": 342836, "epoch": 2833} {"train_loss": -45.18809127807617, "global_step": 342837, "epoch": 2833} {"train_loss": -44.47406005859375, "global_step": 342838, "epoch": 2833} {"train_loss": -43.039398193359375, "global_step": 342839, "epoch": 2833} {"train_loss": -42.825828552246094, "global_step": 342840, "epoch": 2833} {"train_loss": -41.35100555419922, "global_step": 342841, "epoch": 2833} {"train_loss": -42.570274353027344, "global_step": 342842, "epoch": 2833} {"train_loss": -42.941009521484375, "global_step": 342843, "epoch": 2833} {"train_loss": -44.05850601196289, "global_step": 342844, "epoch": 2833} {"train_loss": -44.222408294677734, "global_step": 342845, "epoch": 2833} {"train_loss": -43.290252685546875, "global_step": 342846, "epoch": 2833} {"train_loss": -42.71905517578125, "global_step": 342847, "epoch": 2833} {"train_loss": -44.38671875, "global_step": 342848, "epoch": 2833} {"train_loss": -43.70885467529297, "global_step": 342849, "epoch": 2833} {"train_loss": -44.61973190307617, "global_step": 342850, "epoch": 2833} {"train_loss": -44.412879943847656, "global_step": 342851, "epoch": 2833} {"train_loss": -44.48896026611328, "global_step": 342852, "epoch": 2833} {"train_loss": -44.80766677856445, "global_step": 342853, "epoch": 2833} {"train_loss": -43.516780853271484, "global_step": 342854, "epoch": 2833} {"train_loss": -43.1803092956543, "global_step": 342855, "epoch": 2833} {"train_loss": -43.61484909057617, "global_step": 342856, "epoch": 2833} {"train_loss": -44.18597412109375, "global_step": 342857, "epoch": 2833} {"train_loss": -44.7656364440918, "global_step": 342858, "epoch": 2833} {"train_loss": -44.41794967651367, "global_step": 342859, "epoch": 2833} {"train_loss": -44.46548080444336, "global_step": 342860, "epoch": 2833} {"train_loss": -45.00997543334961, "global_step": 342861, "epoch": 2833} {"train_loss": -43.8665657043457, "global_step": 342862, "epoch": 2833} {"train_loss": -44.58327865600586, "global_step": 342863, "epoch": 2833} {"train_loss": -44.73582077026367, "global_step": 342864, "epoch": 2833} {"train_loss": -43.913448333740234, "global_step": 342865, "epoch": 2833} {"train_loss": -44.32689666748047, "global_step": 342866, "epoch": 2833} {"train_loss": -44.45859909057617, "global_step": 342867, "epoch": 2833} {"train_loss": -45.1677360534668, "global_step": 342868, "epoch": 2833} {"train_loss": -43.909854888916016, "global_step": 342869, "epoch": 2833} {"train_loss": -43.22664260864258, "global_step": 342870, "epoch": 2833} {"train_loss": -44.186546325683594, "global_step": 342871, "epoch": 2833} {"train_loss": -44.83351516723633, "global_step": 342872, "epoch": 2833} {"train_loss": -44.50260543823242, "global_step": 342873, "epoch": 2833} {"train_loss": -45.08840560913086, "global_step": 342874, "epoch": 2833} {"train_loss": -45.57168197631836, "global_step": 342875, "epoch": 2833} {"train_loss": -45.338111877441406, "global_step": 342876, "epoch": 2833} {"train_loss": -45.23551940917969, "global_step": 342877, "epoch": 2833} {"train_loss": -45.24215316772461, "global_step": 342878, "epoch": 2833} {"train_loss": -44.439308166503906, "global_step": 342879, "epoch": 2833} {"train_loss": -45.06856155395508, "global_step": 342880, "epoch": 2833} {"train_loss": -44.70942306518555, "global_step": 342881, "epoch": 2833} {"train_loss": -44.75638961791992, "global_step": 342882, "epoch": 2833} {"train_loss": -44.541133880615234, "global_step": 342883, "epoch": 2833} {"train_loss": -44.821834564208984, "global_step": 342884, "epoch": 2833} {"train_loss": -44.462711334228516, "global_step": 342885, "epoch": 2833} {"train_loss": -43.4681396484375, "global_step": 342886, "epoch": 2833} {"train_loss": -42.82659912109375, "global_step": 342887, "epoch": 2833} {"train_loss": -45.3165168762207, "global_step": 342888, "epoch": 2833} {"train_loss": -44.97818374633789, "global_step": 342889, "epoch": 2833} {"train_loss": -42.72089385986328, "global_step": 342890, "epoch": 2833} {"train_loss": -43.81399154663086, "global_step": 342891, "epoch": 2833} {"train_loss": -44.70003128051758, "global_step": 342892, "epoch": 2833} {"train_loss": -43.71759796142578, "global_step": 342893, "epoch": 2833} {"train_loss": -44.99583053588867, "global_step": 342894, "epoch": 2833} {"train_loss": -44.07669448852539, "global_step": 342895, "epoch": 2833} {"train_loss": -43.05888748168945, "global_step": 342896, "epoch": 2833} {"train_loss": -43.17057418823242, "global_step": 342897, "epoch": 2833} {"train_loss": -42.95138168334961, "global_step": 342898, "epoch": 2833} {"train_loss": -42.81436538696289, "global_step": 342899, "epoch": 2833} {"train_loss": -42.453277587890625, "global_step": 342900, "epoch": 2833} {"train_loss": -42.99897003173828, "global_step": 342901, "epoch": 2833} {"train_loss": -42.18781280517578, "global_step": 342902, "epoch": 2833} {"train_loss": -44.62812042236328, "global_step": 342903, "epoch": 2833} {"train_loss": -43.20302200317383, "global_step": 342904, "epoch": 2833} {"train_loss": -40.54435348510742, "global_step": 342905, "epoch": 2833} {"train_loss": -41.851566314697266, "global_step": 342906, "epoch": 2833} {"train_loss": -39.19228744506836, "global_step": 342907, "epoch": 2833} {"train_loss": -40.53953552246094, "global_step": 342908, "epoch": 2833} {"train_loss": -42.07725143432617, "global_step": 342909, "epoch": 2833} {"train_loss": -39.6677131652832, "global_step": 342910, "epoch": 2833} {"train_loss": -42.933162689208984, "global_step": 342911, "epoch": 2833} {"train_loss": -41.994171142578125, "global_step": 342912, "epoch": 2833} {"train_loss": -44.08463400848641, "global_step": 342913, "epoch": 2833, "val_loss": 2512289.75} {"train_loss": -43.831398010253906, "global_step": 342914, "epoch": 2834} {"train_loss": -42.40378952026367, "global_step": 342915, "epoch": 2834} {"train_loss": -43.60514831542969, "global_step": 342916, "epoch": 2834} {"train_loss": -43.73389434814453, "global_step": 342917, "epoch": 2834} {"train_loss": -43.604122161865234, "global_step": 342918, "epoch": 2834} {"train_loss": -43.27277374267578, "global_step": 342919, "epoch": 2834} {"train_loss": -43.19535446166992, "global_step": 342920, "epoch": 2834} {"train_loss": -44.129737854003906, "global_step": 342921, "epoch": 2834} {"train_loss": -42.944068908691406, "global_step": 342922, "epoch": 2834} {"train_loss": -43.888118743896484, "global_step": 342923, "epoch": 2834} {"train_loss": -42.87488555908203, "global_step": 342924, "epoch": 2834} {"train_loss": -43.80595016479492, "global_step": 342925, "epoch": 2834} {"train_loss": -44.21857833862305, "global_step": 342926, "epoch": 2834} {"train_loss": -43.34871292114258, "global_step": 342927, "epoch": 2834} {"train_loss": -43.966705322265625, "global_step": 342928, "epoch": 2834} {"train_loss": -44.08802795410156, "global_step": 342929, "epoch": 2834} {"train_loss": -45.06745529174805, "global_step": 342930, "epoch": 2834} {"train_loss": -44.26166915893555, "global_step": 342931, "epoch": 2834} {"train_loss": -44.51244354248047, "global_step": 342932, "epoch": 2834} {"train_loss": -43.85783004760742, "global_step": 342933, "epoch": 2834} {"train_loss": -44.34273910522461, "global_step": 342934, "epoch": 2834} {"train_loss": -44.87099838256836, "global_step": 342935, "epoch": 2834} {"train_loss": -43.8563232421875, "global_step": 342936, "epoch": 2834} {"train_loss": -44.8563346862793, "global_step": 342937, "epoch": 2834} {"train_loss": -43.41877365112305, "global_step": 342938, "epoch": 2834} {"train_loss": -44.1680908203125, "global_step": 342939, "epoch": 2834} {"train_loss": -44.671363830566406, "global_step": 342940, "epoch": 2834} {"train_loss": -43.57725524902344, "global_step": 342941, "epoch": 2834} {"train_loss": -45.037349700927734, "global_step": 342942, "epoch": 2834} {"train_loss": -44.0910530090332, "global_step": 342943, "epoch": 2834} {"train_loss": -45.032745361328125, "global_step": 342944, "epoch": 2834} {"train_loss": -44.968807220458984, "global_step": 342945, "epoch": 2834} {"train_loss": -43.73054885864258, "global_step": 342946, "epoch": 2834} {"train_loss": -45.13290023803711, "global_step": 342947, "epoch": 2834} {"train_loss": -44.2186279296875, "global_step": 342948, "epoch": 2834} {"train_loss": -44.392635345458984, "global_step": 342949, "epoch": 2834} {"train_loss": -44.569576263427734, "global_step": 342950, "epoch": 2834} {"train_loss": -44.95582962036133, "global_step": 342951, "epoch": 2834} {"train_loss": -45.034820556640625, "global_step": 342952, "epoch": 2834} {"train_loss": -44.4735107421875, "global_step": 342953, "epoch": 2834} {"train_loss": -45.29096603393555, "global_step": 342954, "epoch": 2834} {"train_loss": -44.58539962768555, "global_step": 342955, "epoch": 2834} {"train_loss": -45.786293029785156, "global_step": 342956, "epoch": 2834} {"train_loss": -44.880859375, "global_step": 342957, "epoch": 2834} {"train_loss": -44.944393157958984, "global_step": 342958, "epoch": 2834} {"train_loss": -45.246917724609375, "global_step": 342959, "epoch": 2834} {"train_loss": -45.158390045166016, "global_step": 342960, "epoch": 2834} {"train_loss": -45.152889251708984, "global_step": 342961, "epoch": 2834} {"train_loss": -45.245059967041016, "global_step": 342962, "epoch": 2834} {"train_loss": -45.358699798583984, "global_step": 342963, "epoch": 2834} {"train_loss": -45.140228271484375, "global_step": 342964, "epoch": 2834} {"train_loss": -45.25769805908203, "global_step": 342965, "epoch": 2834} {"train_loss": -44.61705017089844, "global_step": 342966, "epoch": 2834} {"train_loss": -45.45044708251953, "global_step": 342967, "epoch": 2834} {"train_loss": -44.35445022583008, "global_step": 342968, "epoch": 2834} {"train_loss": -44.96780014038086, "global_step": 342969, "epoch": 2834} {"train_loss": -44.90497970581055, "global_step": 342970, "epoch": 2834} {"train_loss": -45.36075210571289, "global_step": 342971, "epoch": 2834} {"train_loss": -43.100276947021484, "global_step": 342972, "epoch": 2834} {"train_loss": -43.90781784057617, "global_step": 342973, "epoch": 2834} {"train_loss": -45.04603958129883, "global_step": 342974, "epoch": 2834} {"train_loss": -43.11526107788086, "global_step": 342975, "epoch": 2834} {"train_loss": -45.05512619018555, "global_step": 342976, "epoch": 2834} {"train_loss": -43.958709716796875, "global_step": 342977, "epoch": 2834} {"train_loss": -43.77579879760742, "global_step": 342978, "epoch": 2834} {"train_loss": -43.178321838378906, "global_step": 342979, "epoch": 2834} {"train_loss": -29.757678985595703, "global_step": 342980, "epoch": 2834} {"train_loss": -35.52839279174805, "global_step": 342981, "epoch": 2834} {"train_loss": -44.0653076171875, "global_step": 342982, "epoch": 2834} {"train_loss": -41.46297073364258, "global_step": 342983, "epoch": 2834} {"train_loss": -44.2523193359375, "global_step": 342984, "epoch": 2834} {"train_loss": -44.04087829589844, "global_step": 342985, "epoch": 2834} {"train_loss": -41.96335983276367, "global_step": 342986, "epoch": 2834} {"train_loss": -42.29671859741211, "global_step": 342987, "epoch": 2834} {"train_loss": -39.89292907714844, "global_step": 342988, "epoch": 2834} {"train_loss": -40.43798065185547, "global_step": 342989, "epoch": 2834} {"train_loss": -42.10692596435547, "global_step": 342990, "epoch": 2834} {"train_loss": -37.48957061767578, "global_step": 342991, "epoch": 2834} {"train_loss": -42.851078033447266, "global_step": 342992, "epoch": 2834} {"train_loss": -40.692630767822266, "global_step": 342993, "epoch": 2834} {"train_loss": -41.950740814208984, "global_step": 342994, "epoch": 2834} {"train_loss": -39.52248764038086, "global_step": 342995, "epoch": 2834} {"train_loss": -41.167266845703125, "global_step": 342996, "epoch": 2834} {"train_loss": -40.8889274597168, "global_step": 342997, "epoch": 2834} {"train_loss": -42.061588287353516, "global_step": 342998, "epoch": 2834} {"train_loss": -39.163604736328125, "global_step": 342999, "epoch": 2834} {"train_loss": -41.10346603393555, "global_step": 343000, "epoch": 2834} {"train_loss": -35.40431594848633, "global_step": 343001, "epoch": 2834} {"train_loss": -40.978607177734375, "global_step": 343002, "epoch": 2834} {"train_loss": -40.18378829956055, "global_step": 343003, "epoch": 2834} {"train_loss": -42.3995475769043, "global_step": 343004, "epoch": 2834} {"train_loss": -39.234222412109375, "global_step": 343005, "epoch": 2834} {"train_loss": -40.541934967041016, "global_step": 343006, "epoch": 2834} {"train_loss": -39.83443069458008, "global_step": 343007, "epoch": 2834} {"train_loss": -40.56868362426758, "global_step": 343008, "epoch": 2834} {"train_loss": -41.53721237182617, "global_step": 343009, "epoch": 2834} {"train_loss": -38.242427825927734, "global_step": 343010, "epoch": 2834} {"train_loss": -41.289981842041016, "global_step": 343011, "epoch": 2834} {"train_loss": -41.848323822021484, "global_step": 343012, "epoch": 2834} {"train_loss": -41.40022277832031, "global_step": 343013, "epoch": 2834} {"train_loss": -41.980220794677734, "global_step": 343014, "epoch": 2834} {"train_loss": -41.78202819824219, "global_step": 343015, "epoch": 2834} {"train_loss": -40.26673126220703, "global_step": 343016, "epoch": 2834} {"train_loss": -42.298152923583984, "global_step": 343017, "epoch": 2834} {"train_loss": -40.56787872314453, "global_step": 343018, "epoch": 2834} {"train_loss": -40.83512496948242, "global_step": 343019, "epoch": 2834} {"train_loss": -43.00000762939453, "global_step": 343020, "epoch": 2834} {"train_loss": -41.02983856201172, "global_step": 343021, "epoch": 2834} {"train_loss": -41.99688720703125, "global_step": 343022, "epoch": 2834} {"train_loss": -40.5995979309082, "global_step": 343023, "epoch": 2834} {"train_loss": -43.01417922973633, "global_step": 343024, "epoch": 2834} {"train_loss": -41.73371505737305, "global_step": 343025, "epoch": 2834} {"train_loss": -43.32771682739258, "global_step": 343026, "epoch": 2834} {"train_loss": -42.47895050048828, "global_step": 343027, "epoch": 2834} {"train_loss": -43.00046157836914, "global_step": 343028, "epoch": 2834} {"train_loss": -43.265621185302734, "global_step": 343029, "epoch": 2834} {"train_loss": -42.72392654418945, "global_step": 343030, "epoch": 2834} {"train_loss": -42.91950225830078, "global_step": 343031, "epoch": 2834} {"train_loss": -42.682186126708984, "global_step": 343032, "epoch": 2834} {"train_loss": -43.70064163208008, "global_step": 343033, "epoch": 2834} {"train_loss": -42.88663410155241, "global_step": 343034, "epoch": 2834, "val_loss": 2517695.0} {"train_loss": -43.440006256103516, "global_step": 343035, "epoch": 2835} {"train_loss": -43.46261215209961, "global_step": 343036, "epoch": 2835} {"train_loss": -43.24636459350586, "global_step": 343037, "epoch": 2835} {"train_loss": -43.71952438354492, "global_step": 343038, "epoch": 2835} {"train_loss": -43.25696563720703, "global_step": 343039, "epoch": 2835} {"train_loss": -44.18368148803711, "global_step": 343040, "epoch": 2835} {"train_loss": -43.98347854614258, "global_step": 343041, "epoch": 2835} {"train_loss": -44.0414924621582, "global_step": 343042, "epoch": 2835} {"train_loss": -43.90951156616211, "global_step": 343043, "epoch": 2835} {"train_loss": -43.479225158691406, "global_step": 343044, "epoch": 2835} {"train_loss": -43.518680572509766, "global_step": 343045, "epoch": 2835} {"train_loss": -44.07683181762695, "global_step": 343046, "epoch": 2835} {"train_loss": -43.027183532714844, "global_step": 343047, "epoch": 2835} {"train_loss": -43.80522537231445, "global_step": 343048, "epoch": 2835} {"train_loss": -43.6508674621582, "global_step": 343049, "epoch": 2835} {"train_loss": -43.863258361816406, "global_step": 343050, "epoch": 2835} {"train_loss": -43.73952865600586, "global_step": 343051, "epoch": 2835} {"train_loss": -44.20728302001953, "global_step": 343052, "epoch": 2835} {"train_loss": -43.719120025634766, "global_step": 343053, "epoch": 2835} {"train_loss": -44.366886138916016, "global_step": 343054, "epoch": 2835} {"train_loss": -44.73912811279297, "global_step": 343055, "epoch": 2835} {"train_loss": -44.33726119995117, "global_step": 343056, "epoch": 2835} {"train_loss": -44.55756759643555, "global_step": 343057, "epoch": 2835} {"train_loss": -44.451515197753906, "global_step": 343058, "epoch": 2835} {"train_loss": -44.53592300415039, "global_step": 343059, "epoch": 2835} {"train_loss": -45.122013092041016, "global_step": 343060, "epoch": 2835} {"train_loss": -44.82273483276367, "global_step": 343061, "epoch": 2835} {"train_loss": -44.71171569824219, "global_step": 343062, "epoch": 2835} {"train_loss": -44.65031814575195, "global_step": 343063, "epoch": 2835} {"train_loss": -44.679466247558594, "global_step": 343064, "epoch": 2835} {"train_loss": -44.457881927490234, "global_step": 343065, "epoch": 2835} {"train_loss": -44.6170654296875, "global_step": 343066, "epoch": 2835} {"train_loss": -44.14386749267578, "global_step": 343067, "epoch": 2835} {"train_loss": -44.93501281738281, "global_step": 343068, "epoch": 2835} {"train_loss": -45.15982437133789, "global_step": 343069, "epoch": 2835} {"train_loss": -45.187721252441406, "global_step": 343070, "epoch": 2835} {"train_loss": -45.13019561767578, "global_step": 343071, "epoch": 2835} {"train_loss": -44.53375244140625, "global_step": 343072, "epoch": 2835} {"train_loss": -45.14811325073242, "global_step": 343073, "epoch": 2835} {"train_loss": -45.01405334472656, "global_step": 343074, "epoch": 2835} {"train_loss": -44.95319366455078, "global_step": 343075, "epoch": 2835} {"train_loss": -45.259918212890625, "global_step": 343076, "epoch": 2835} {"train_loss": -44.501319885253906, "global_step": 343077, "epoch": 2835} {"train_loss": -45.31398391723633, "global_step": 343078, "epoch": 2835} {"train_loss": -44.903839111328125, "global_step": 343079, "epoch": 2835} {"train_loss": -45.29247283935547, "global_step": 343080, "epoch": 2835} {"train_loss": -44.883914947509766, "global_step": 343081, "epoch": 2835} {"train_loss": -45.64878463745117, "global_step": 343082, "epoch": 2835} {"train_loss": -45.48643112182617, "global_step": 343083, "epoch": 2835} {"train_loss": -44.742366790771484, "global_step": 343084, "epoch": 2835} {"train_loss": -44.66500473022461, "global_step": 343085, "epoch": 2835} {"train_loss": -44.18415832519531, "global_step": 343086, "epoch": 2835} {"train_loss": -44.65944290161133, "global_step": 343087, "epoch": 2835} {"train_loss": -45.287174224853516, "global_step": 343088, "epoch": 2835} {"train_loss": -44.46147537231445, "global_step": 343089, "epoch": 2835} {"train_loss": -43.983028411865234, "global_step": 343090, "epoch": 2835} {"train_loss": -43.35200119018555, "global_step": 343091, "epoch": 2835} {"train_loss": -45.030189514160156, "global_step": 343092, "epoch": 2835} {"train_loss": -44.73247146606445, "global_step": 343093, "epoch": 2835} {"train_loss": -45.334991455078125, "global_step": 343094, "epoch": 2835} {"train_loss": -45.04395294189453, "global_step": 343095, "epoch": 2835} {"train_loss": -45.637184143066406, "global_step": 343096, "epoch": 2835} {"train_loss": -44.805599212646484, "global_step": 343097, "epoch": 2835} {"train_loss": -45.15296936035156, "global_step": 343098, "epoch": 2835} {"train_loss": -45.16656494140625, "global_step": 343099, "epoch": 2835} {"train_loss": -44.388057708740234, "global_step": 343100, "epoch": 2835} {"train_loss": -45.342037200927734, "global_step": 343101, "epoch": 2835} {"train_loss": -45.444580078125, "global_step": 343102, "epoch": 2835} {"train_loss": -44.777652740478516, "global_step": 343103, "epoch": 2835} {"train_loss": -45.09416961669922, "global_step": 343104, "epoch": 2835} {"train_loss": -45.68561935424805, "global_step": 343105, "epoch": 2835} {"train_loss": -45.864070892333984, "global_step": 343106, "epoch": 2835} {"train_loss": -45.79142379760742, "global_step": 343107, "epoch": 2835} {"train_loss": -44.99924087524414, "global_step": 343108, "epoch": 2835} {"train_loss": -44.985042572021484, "global_step": 343109, "epoch": 2835} {"train_loss": -44.720767974853516, "global_step": 343110, "epoch": 2835} {"train_loss": -44.749691009521484, "global_step": 343111, "epoch": 2835} {"train_loss": -44.75677490234375, "global_step": 343112, "epoch": 2835} {"train_loss": -43.3205451965332, "global_step": 343113, "epoch": 2835} {"train_loss": -42.77499008178711, "global_step": 343114, "epoch": 2835} {"train_loss": -44.310020446777344, "global_step": 343115, "epoch": 2835} {"train_loss": -43.80816650390625, "global_step": 343116, "epoch": 2835} {"train_loss": -42.94346618652344, "global_step": 343117, "epoch": 2835} {"train_loss": -43.486080169677734, "global_step": 343118, "epoch": 2835} {"train_loss": -43.871673583984375, "global_step": 343119, "epoch": 2835} {"train_loss": -42.323299407958984, "global_step": 343120, "epoch": 2835} {"train_loss": -41.72842025756836, "global_step": 343121, "epoch": 2835} {"train_loss": -42.738914489746094, "global_step": 343122, "epoch": 2835} {"train_loss": -42.419979095458984, "global_step": 343123, "epoch": 2835} {"train_loss": -41.589080810546875, "global_step": 343124, "epoch": 2835} {"train_loss": -42.87483215332031, "global_step": 343125, "epoch": 2835} {"train_loss": -41.6127815246582, "global_step": 343126, "epoch": 2835} {"train_loss": -43.92557907104492, "global_step": 343127, "epoch": 2835} {"train_loss": -42.01701354980469, "global_step": 343128, "epoch": 2835} {"train_loss": -44.21969223022461, "global_step": 343129, "epoch": 2835} {"train_loss": -42.0114860534668, "global_step": 343130, "epoch": 2835} {"train_loss": -43.25775146484375, "global_step": 343131, "epoch": 2835} {"train_loss": -43.81598663330078, "global_step": 343132, "epoch": 2835} {"train_loss": -42.3919792175293, "global_step": 343133, "epoch": 2835} {"train_loss": -43.25417709350586, "global_step": 343134, "epoch": 2835} {"train_loss": -43.38542556762695, "global_step": 343135, "epoch": 2835} {"train_loss": -43.482662200927734, "global_step": 343136, "epoch": 2835} {"train_loss": -42.17475891113281, "global_step": 343137, "epoch": 2835} {"train_loss": -44.14130783081055, "global_step": 343138, "epoch": 2835} {"train_loss": -42.46747970581055, "global_step": 343139, "epoch": 2835} {"train_loss": -43.72966384887695, "global_step": 343140, "epoch": 2835} {"train_loss": -44.05277633666992, "global_step": 343141, "epoch": 2835} {"train_loss": -42.975460052490234, "global_step": 343142, "epoch": 2835} {"train_loss": -43.69725036621094, "global_step": 343143, "epoch": 2835} {"train_loss": -44.1770133972168, "global_step": 343144, "epoch": 2835} {"train_loss": -43.515010833740234, "global_step": 343145, "epoch": 2835} {"train_loss": -43.881343841552734, "global_step": 343146, "epoch": 2835} {"train_loss": -43.24940872192383, "global_step": 343147, "epoch": 2835} {"train_loss": -43.37022018432617, "global_step": 343148, "epoch": 2835} {"train_loss": -44.27847671508789, "global_step": 343149, "epoch": 2835} {"train_loss": -43.066688537597656, "global_step": 343150, "epoch": 2835} {"train_loss": -44.75983428955078, "global_step": 343151, "epoch": 2835} {"train_loss": -44.042171478271484, "global_step": 343152, "epoch": 2835} {"train_loss": -44.31494140625, "global_step": 343153, "epoch": 2835} {"train_loss": -44.43513870239258, "global_step": 343154, "epoch": 2835} {"train_loss": -44.14131356861966, "global_step": 343155, "epoch": 2835, "val_loss": 2523148.75} {"train_loss": -44.83516311645508, "global_step": 343156, "epoch": 2836} {"train_loss": -44.505489349365234, "global_step": 343157, "epoch": 2836} {"train_loss": -44.860687255859375, "global_step": 343158, "epoch": 2836} {"train_loss": -44.318233489990234, "global_step": 343159, "epoch": 2836} {"train_loss": -44.621089935302734, "global_step": 343160, "epoch": 2836} {"train_loss": -44.580657958984375, "global_step": 343161, "epoch": 2836} {"train_loss": -45.085105895996094, "global_step": 343162, "epoch": 2836} {"train_loss": -44.37677764892578, "global_step": 343163, "epoch": 2836} {"train_loss": -45.12092971801758, "global_step": 343164, "epoch": 2836} {"train_loss": -44.676639556884766, "global_step": 343165, "epoch": 2836} {"train_loss": -44.883033752441406, "global_step": 343166, "epoch": 2836} {"train_loss": -44.93635940551758, "global_step": 343167, "epoch": 2836} {"train_loss": -43.51768112182617, "global_step": 343168, "epoch": 2836} {"train_loss": -44.731544494628906, "global_step": 343169, "epoch": 2836} {"train_loss": -45.04042053222656, "global_step": 343170, "epoch": 2836} {"train_loss": -44.19987106323242, "global_step": 343171, "epoch": 2836} {"train_loss": -44.18233871459961, "global_step": 343172, "epoch": 2836} {"train_loss": -45.05313491821289, "global_step": 343173, "epoch": 2836} {"train_loss": -44.48820114135742, "global_step": 343174, "epoch": 2836} {"train_loss": -44.17948913574219, "global_step": 343175, "epoch": 2836} {"train_loss": -45.22111129760742, "global_step": 343176, "epoch": 2836} {"train_loss": -44.515899658203125, "global_step": 343177, "epoch": 2836} {"train_loss": -45.10555648803711, "global_step": 343178, "epoch": 2836} {"train_loss": -45.00428009033203, "global_step": 343179, "epoch": 2836} {"train_loss": -44.4874153137207, "global_step": 343180, "epoch": 2836} {"train_loss": -44.535369873046875, "global_step": 343181, "epoch": 2836} {"train_loss": -43.99277114868164, "global_step": 343182, "epoch": 2836} {"train_loss": -42.16434860229492, "global_step": 343183, "epoch": 2836} {"train_loss": -44.89490509033203, "global_step": 343184, "epoch": 2836} {"train_loss": -43.359004974365234, "global_step": 343185, "epoch": 2836} {"train_loss": -44.101314544677734, "global_step": 343186, "epoch": 2836} {"train_loss": -43.56711196899414, "global_step": 343187, "epoch": 2836} {"train_loss": -43.25264358520508, "global_step": 343188, "epoch": 2836} {"train_loss": -42.9332275390625, "global_step": 343189, "epoch": 2836} {"train_loss": -42.94770050048828, "global_step": 343190, "epoch": 2836} {"train_loss": -43.33234786987305, "global_step": 343191, "epoch": 2836} {"train_loss": -44.07619857788086, "global_step": 343192, "epoch": 2836} {"train_loss": -44.630470275878906, "global_step": 343193, "epoch": 2836} {"train_loss": -42.23365020751953, "global_step": 343194, "epoch": 2836} {"train_loss": -44.03165054321289, "global_step": 343195, "epoch": 2836} {"train_loss": -44.12042999267578, "global_step": 343196, "epoch": 2836} {"train_loss": -42.938148498535156, "global_step": 343197, "epoch": 2836} {"train_loss": -43.69449234008789, "global_step": 343198, "epoch": 2836} {"train_loss": -43.605438232421875, "global_step": 343199, "epoch": 2836} {"train_loss": -43.739112854003906, "global_step": 343200, "epoch": 2836} {"train_loss": -43.58693313598633, "global_step": 343201, "epoch": 2836} {"train_loss": -43.98699951171875, "global_step": 343202, "epoch": 2836} {"train_loss": -43.8619384765625, "global_step": 343203, "epoch": 2836} {"train_loss": -44.12940216064453, "global_step": 343204, "epoch": 2836} {"train_loss": -43.720664978027344, "global_step": 343205, "epoch": 2836} {"train_loss": -42.92727279663086, "global_step": 343206, "epoch": 2836} {"train_loss": -44.468379974365234, "global_step": 343207, "epoch": 2836} {"train_loss": -42.536285400390625, "global_step": 343208, "epoch": 2836} {"train_loss": -43.50288391113281, "global_step": 343209, "epoch": 2836} {"train_loss": -44.385250091552734, "global_step": 343210, "epoch": 2836} {"train_loss": -43.68751907348633, "global_step": 343211, "epoch": 2836} {"train_loss": -44.0723876953125, "global_step": 343212, "epoch": 2836} {"train_loss": -43.99468994140625, "global_step": 343213, "epoch": 2836} {"train_loss": -43.94202423095703, "global_step": 343214, "epoch": 2836} {"train_loss": -44.35688400268555, "global_step": 343215, "epoch": 2836} {"train_loss": -44.036922454833984, "global_step": 343216, "epoch": 2836} {"train_loss": -44.87910842895508, "global_step": 343217, "epoch": 2836} {"train_loss": -44.62944030761719, "global_step": 343218, "epoch": 2836} {"train_loss": -44.057708740234375, "global_step": 343219, "epoch": 2836} {"train_loss": -44.33454513549805, "global_step": 343220, "epoch": 2836} {"train_loss": -44.997737884521484, "global_step": 343221, "epoch": 2836} {"train_loss": -44.607826232910156, "global_step": 343222, "epoch": 2836} {"train_loss": -44.76255798339844, "global_step": 343223, "epoch": 2836} {"train_loss": -45.28107833862305, "global_step": 343224, "epoch": 2836} {"train_loss": -44.907798767089844, "global_step": 343225, "epoch": 2836} {"train_loss": -44.936519622802734, "global_step": 343226, "epoch": 2836} {"train_loss": -44.34528350830078, "global_step": 343227, "epoch": 2836} {"train_loss": -45.340816497802734, "global_step": 343228, "epoch": 2836} {"train_loss": -44.246944427490234, "global_step": 343229, "epoch": 2836} {"train_loss": -44.77900314331055, "global_step": 343230, "epoch": 2836} {"train_loss": -44.8616828918457, "global_step": 343231, "epoch": 2836} {"train_loss": -45.16677474975586, "global_step": 343232, "epoch": 2836} {"train_loss": -44.58396530151367, "global_step": 343233, "epoch": 2836} {"train_loss": -45.03328323364258, "global_step": 343234, "epoch": 2836} {"train_loss": -45.050804138183594, "global_step": 343235, "epoch": 2836} {"train_loss": -45.43586349487305, "global_step": 343236, "epoch": 2836} {"train_loss": -45.138404846191406, "global_step": 343237, "epoch": 2836} {"train_loss": -45.34941482543945, "global_step": 343238, "epoch": 2836} {"train_loss": -45.13043212890625, "global_step": 343239, "epoch": 2836} {"train_loss": -45.09855270385742, "global_step": 343240, "epoch": 2836} {"train_loss": -44.28680419921875, "global_step": 343241, "epoch": 2836} {"train_loss": -44.2719841003418, "global_step": 343242, "epoch": 2836} {"train_loss": -45.14736557006836, "global_step": 343243, "epoch": 2836} {"train_loss": -45.20327377319336, "global_step": 343244, "epoch": 2836} {"train_loss": -44.71432113647461, "global_step": 343245, "epoch": 2836} {"train_loss": -44.53772735595703, "global_step": 343246, "epoch": 2836} {"train_loss": -45.1504020690918, "global_step": 343247, "epoch": 2836} {"train_loss": -45.489864349365234, "global_step": 343248, "epoch": 2836} {"train_loss": -44.405120849609375, "global_step": 343249, "epoch": 2836} {"train_loss": -45.6356315612793, "global_step": 343250, "epoch": 2836} {"train_loss": -45.0892333984375, "global_step": 343251, "epoch": 2836} {"train_loss": -45.365943908691406, "global_step": 343252, "epoch": 2836} {"train_loss": -45.36064529418945, "global_step": 343253, "epoch": 2836} {"train_loss": -45.43986129760742, "global_step": 343254, "epoch": 2836} {"train_loss": -44.819580078125, "global_step": 343255, "epoch": 2836} {"train_loss": -45.421077728271484, "global_step": 343256, "epoch": 2836} {"train_loss": -45.01719665527344, "global_step": 343257, "epoch": 2836} {"train_loss": -44.7182731628418, "global_step": 343258, "epoch": 2836} {"train_loss": -45.63862609863281, "global_step": 343259, "epoch": 2836} {"train_loss": -45.04338073730469, "global_step": 343260, "epoch": 2836} {"train_loss": -44.50947189331055, "global_step": 343261, "epoch": 2836} {"train_loss": -45.032527923583984, "global_step": 343262, "epoch": 2836} {"train_loss": -45.62135696411133, "global_step": 343263, "epoch": 2836} {"train_loss": -44.54359817504883, "global_step": 343264, "epoch": 2836} {"train_loss": -44.79335403442383, "global_step": 343265, "epoch": 2836} {"train_loss": -44.89433670043945, "global_step": 343266, "epoch": 2836} {"train_loss": -44.93368148803711, "global_step": 343267, "epoch": 2836} {"train_loss": -44.42301940917969, "global_step": 343268, "epoch": 2836} {"train_loss": -44.845130920410156, "global_step": 343269, "epoch": 2836} {"train_loss": -44.9564094543457, "global_step": 343270, "epoch": 2836} {"train_loss": -43.84528732299805, "global_step": 343271, "epoch": 2836} {"train_loss": -44.264156341552734, "global_step": 343272, "epoch": 2836} {"train_loss": -43.85807800292969, "global_step": 343273, "epoch": 2836} {"train_loss": -44.251739501953125, "global_step": 343274, "epoch": 2836} {"train_loss": -44.824092864990234, "global_step": 343275, "epoch": 2836} {"train_loss": -44.47288686578924, "global_step": 343276, "epoch": 2836, "val_loss": 2595169.25} {"train_loss": -41.373756408691406, "global_step": 343277, "epoch": 2837} {"train_loss": -43.476402282714844, "global_step": 343278, "epoch": 2837} {"train_loss": -43.8136100769043, "global_step": 343279, "epoch": 2837} {"train_loss": -44.69839096069336, "global_step": 343280, "epoch": 2837} {"train_loss": -39.780181884765625, "global_step": 343281, "epoch": 2837} {"train_loss": -44.265342712402344, "global_step": 343282, "epoch": 2837} {"train_loss": -41.627784729003906, "global_step": 343283, "epoch": 2837} {"train_loss": -42.00761032104492, "global_step": 343284, "epoch": 2837} {"train_loss": -43.28609848022461, "global_step": 343285, "epoch": 2837} {"train_loss": -42.274959564208984, "global_step": 343286, "epoch": 2837} {"train_loss": -41.31209182739258, "global_step": 343287, "epoch": 2837} {"train_loss": -44.91084289550781, "global_step": 343288, "epoch": 2837} {"train_loss": -40.46511459350586, "global_step": 343289, "epoch": 2837} {"train_loss": -44.19149398803711, "global_step": 343290, "epoch": 2837} {"train_loss": -43.99746322631836, "global_step": 343291, "epoch": 2837} {"train_loss": -43.65943145751953, "global_step": 343292, "epoch": 2837} {"train_loss": -44.425758361816406, "global_step": 343293, "epoch": 2837} {"train_loss": -44.081417083740234, "global_step": 343294, "epoch": 2837} {"train_loss": -44.1057014465332, "global_step": 343295, "epoch": 2837} {"train_loss": -44.63902282714844, "global_step": 343296, "epoch": 2837} {"train_loss": -44.35073471069336, "global_step": 343297, "epoch": 2837} {"train_loss": -45.12751007080078, "global_step": 343298, "epoch": 2837} {"train_loss": -43.281375885009766, "global_step": 343299, "epoch": 2837} {"train_loss": -43.433895111083984, "global_step": 343300, "epoch": 2837} {"train_loss": -44.75924301147461, "global_step": 343301, "epoch": 2837} {"train_loss": -42.587623596191406, "global_step": 343302, "epoch": 2837} {"train_loss": -42.4794807434082, "global_step": 343303, "epoch": 2837} {"train_loss": -43.954158782958984, "global_step": 343304, "epoch": 2837} {"train_loss": -42.653751373291016, "global_step": 343305, "epoch": 2837} {"train_loss": -44.76948165893555, "global_step": 343306, "epoch": 2837} {"train_loss": -43.64558029174805, "global_step": 343307, "epoch": 2837} {"train_loss": -42.350032806396484, "global_step": 343308, "epoch": 2837} {"train_loss": -44.34976577758789, "global_step": 343309, "epoch": 2837} {"train_loss": -44.077301025390625, "global_step": 343310, "epoch": 2837} {"train_loss": -43.10789108276367, "global_step": 343311, "epoch": 2837} {"train_loss": -44.35060501098633, "global_step": 343312, "epoch": 2837} {"train_loss": -44.047298431396484, "global_step": 343313, "epoch": 2837} {"train_loss": -44.19015121459961, "global_step": 343314, "epoch": 2837} {"train_loss": -43.53309631347656, "global_step": 343315, "epoch": 2837} {"train_loss": -42.853790283203125, "global_step": 343316, "epoch": 2837} {"train_loss": -44.65302658081055, "global_step": 343317, "epoch": 2837} {"train_loss": -43.72097396850586, "global_step": 343318, "epoch": 2837} {"train_loss": -42.528594970703125, "global_step": 343319, "epoch": 2837} {"train_loss": -44.49693298339844, "global_step": 343320, "epoch": 2837} {"train_loss": -42.38523864746094, "global_step": 343321, "epoch": 2837} {"train_loss": -44.021488189697266, "global_step": 343322, "epoch": 2837} {"train_loss": -43.93566131591797, "global_step": 343323, "epoch": 2837} {"train_loss": -43.07705307006836, "global_step": 343324, "epoch": 2837} {"train_loss": -44.879390716552734, "global_step": 343325, "epoch": 2837} {"train_loss": -43.79185104370117, "global_step": 343326, "epoch": 2837} {"train_loss": -44.39130783081055, "global_step": 343327, "epoch": 2837} {"train_loss": -44.6685905456543, "global_step": 343328, "epoch": 2837} {"train_loss": -44.451202392578125, "global_step": 343329, "epoch": 2837} {"train_loss": -44.56291580200195, "global_step": 343330, "epoch": 2837} {"train_loss": -44.59489822387695, "global_step": 343331, "epoch": 2837} {"train_loss": -45.19739532470703, "global_step": 343332, "epoch": 2837} {"train_loss": -43.921173095703125, "global_step": 343333, "epoch": 2837} {"train_loss": -44.1863899230957, "global_step": 343334, "epoch": 2837} {"train_loss": -44.773983001708984, "global_step": 343335, "epoch": 2837} {"train_loss": -44.5565299987793, "global_step": 343336, "epoch": 2837} {"train_loss": -44.164859771728516, "global_step": 343337, "epoch": 2837} {"train_loss": -44.7360954284668, "global_step": 343338, "epoch": 2837} {"train_loss": -43.89166259765625, "global_step": 343339, "epoch": 2837} {"train_loss": -44.42583465576172, "global_step": 343340, "epoch": 2837} {"train_loss": -44.447425842285156, "global_step": 343341, "epoch": 2837} {"train_loss": -44.38675308227539, "global_step": 343342, "epoch": 2837} {"train_loss": -44.46662139892578, "global_step": 343343, "epoch": 2837} {"train_loss": -44.27681350708008, "global_step": 343344, "epoch": 2837} {"train_loss": -44.864986419677734, "global_step": 343345, "epoch": 2837} {"train_loss": -45.131797790527344, "global_step": 343346, "epoch": 2837} {"train_loss": -44.912696838378906, "global_step": 343347, "epoch": 2837} {"train_loss": -45.12030029296875, "global_step": 343348, "epoch": 2837} {"train_loss": -44.02737808227539, "global_step": 343349, "epoch": 2837} {"train_loss": -45.62909698486328, "global_step": 343350, "epoch": 2837} {"train_loss": -44.489845275878906, "global_step": 343351, "epoch": 2837} {"train_loss": -45.41866683959961, "global_step": 343352, "epoch": 2837} {"train_loss": -44.47700881958008, "global_step": 343353, "epoch": 2837} {"train_loss": -43.91268539428711, "global_step": 343354, "epoch": 2837} {"train_loss": -45.453399658203125, "global_step": 343355, "epoch": 2837} {"train_loss": -43.94305419921875, "global_step": 343356, "epoch": 2837} {"train_loss": -44.06520462036133, "global_step": 343357, "epoch": 2837} {"train_loss": -44.78749084472656, "global_step": 343358, "epoch": 2837} {"train_loss": -44.88581085205078, "global_step": 343359, "epoch": 2837} {"train_loss": -44.66988754272461, "global_step": 343360, "epoch": 2837} {"train_loss": -44.3072624206543, "global_step": 343361, "epoch": 2837} {"train_loss": -43.805908203125, "global_step": 343362, "epoch": 2837} {"train_loss": -44.829776763916016, "global_step": 343363, "epoch": 2837} {"train_loss": -45.181640625, "global_step": 343364, "epoch": 2837} {"train_loss": -43.993934631347656, "global_step": 343365, "epoch": 2837} {"train_loss": -44.68930435180664, "global_step": 343366, "epoch": 2837} {"train_loss": -44.6446533203125, "global_step": 343367, "epoch": 2837} {"train_loss": -44.17636489868164, "global_step": 343368, "epoch": 2837} {"train_loss": -43.95560073852539, "global_step": 343369, "epoch": 2837} {"train_loss": -44.59780502319336, "global_step": 343370, "epoch": 2837} {"train_loss": -44.05170440673828, "global_step": 343371, "epoch": 2837} {"train_loss": -42.56899642944336, "global_step": 343372, "epoch": 2837} {"train_loss": -42.13048553466797, "global_step": 343373, "epoch": 2837} {"train_loss": -44.471588134765625, "global_step": 343374, "epoch": 2837} {"train_loss": -43.58041763305664, "global_step": 343375, "epoch": 2837} {"train_loss": -43.61005783081055, "global_step": 343376, "epoch": 2837} {"train_loss": -44.79598617553711, "global_step": 343377, "epoch": 2837} {"train_loss": -44.020477294921875, "global_step": 343378, "epoch": 2837} {"train_loss": -44.2330322265625, "global_step": 343379, "epoch": 2837} {"train_loss": -44.85457229614258, "global_step": 343380, "epoch": 2837} {"train_loss": -43.7150993347168, "global_step": 343381, "epoch": 2837} {"train_loss": -44.377716064453125, "global_step": 343382, "epoch": 2837} {"train_loss": -44.74764633178711, "global_step": 343383, "epoch": 2837} {"train_loss": -42.989349365234375, "global_step": 343384, "epoch": 2837} {"train_loss": -44.72702407836914, "global_step": 343385, "epoch": 2837} {"train_loss": -44.996768951416016, "global_step": 343386, "epoch": 2837} {"train_loss": -44.484493255615234, "global_step": 343387, "epoch": 2837} {"train_loss": -44.458797454833984, "global_step": 343388, "epoch": 2837} {"train_loss": -45.08720779418945, "global_step": 343389, "epoch": 2837} {"train_loss": -45.37736892700195, "global_step": 343390, "epoch": 2837} {"train_loss": -43.61442947387695, "global_step": 343391, "epoch": 2837} {"train_loss": -44.004329681396484, "global_step": 343392, "epoch": 2837} {"train_loss": -44.70967483520508, "global_step": 343393, "epoch": 2837} {"train_loss": -44.41722869873047, "global_step": 343394, "epoch": 2837} {"train_loss": -44.43490219116211, "global_step": 343395, "epoch": 2837} {"train_loss": -44.37678909301758, "global_step": 343396, "epoch": 2837} {"train_loss": -44.012546602359485, "global_step": 343397, "epoch": 2837, "val_loss": 2434111.0} {"train_loss": -43.728275299072266, "global_step": 343398, "epoch": 2838} {"train_loss": -44.5245246887207, "global_step": 343399, "epoch": 2838} {"train_loss": -44.06120300292969, "global_step": 343400, "epoch": 2838} {"train_loss": -44.42353057861328, "global_step": 343401, "epoch": 2838} {"train_loss": -44.47524642944336, "global_step": 343402, "epoch": 2838} {"train_loss": -45.021339416503906, "global_step": 343403, "epoch": 2838} {"train_loss": -44.17348098754883, "global_step": 343404, "epoch": 2838} {"train_loss": -44.58118438720703, "global_step": 343405, "epoch": 2838} {"train_loss": -45.452674865722656, "global_step": 343406, "epoch": 2838} {"train_loss": -45.24009704589844, "global_step": 343407, "epoch": 2838} {"train_loss": -44.892391204833984, "global_step": 343408, "epoch": 2838} {"train_loss": -45.13918685913086, "global_step": 343409, "epoch": 2838} {"train_loss": -44.29933166503906, "global_step": 343410, "epoch": 2838} {"train_loss": -44.23020553588867, "global_step": 343411, "epoch": 2838} {"train_loss": -44.76994705200195, "global_step": 343412, "epoch": 2838} {"train_loss": -44.03306579589844, "global_step": 343413, "epoch": 2838} {"train_loss": -43.65035629272461, "global_step": 343414, "epoch": 2838} {"train_loss": -44.637325286865234, "global_step": 343415, "epoch": 2838} {"train_loss": -43.9305305480957, "global_step": 343416, "epoch": 2838} {"train_loss": -44.14039993286133, "global_step": 343417, "epoch": 2838} {"train_loss": -44.32524108886719, "global_step": 343418, "epoch": 2838} {"train_loss": -43.70828628540039, "global_step": 343419, "epoch": 2838} {"train_loss": -41.81626510620117, "global_step": 343420, "epoch": 2838} {"train_loss": -43.18876647949219, "global_step": 343421, "epoch": 2838} {"train_loss": -42.27909469604492, "global_step": 343422, "epoch": 2838} {"train_loss": -44.016639709472656, "global_step": 343423, "epoch": 2838} {"train_loss": -42.137359619140625, "global_step": 343424, "epoch": 2838} {"train_loss": -43.316192626953125, "global_step": 343425, "epoch": 2838} {"train_loss": -41.64820098876953, "global_step": 343426, "epoch": 2838} {"train_loss": -44.70684814453125, "global_step": 343427, "epoch": 2838} {"train_loss": -43.421627044677734, "global_step": 343428, "epoch": 2838} {"train_loss": -43.199337005615234, "global_step": 343429, "epoch": 2838} {"train_loss": -44.64663314819336, "global_step": 343430, "epoch": 2838} {"train_loss": -43.3513069152832, "global_step": 343431, "epoch": 2838} {"train_loss": -44.82349395751953, "global_step": 343432, "epoch": 2838} {"train_loss": -44.31001663208008, "global_step": 343433, "epoch": 2838} {"train_loss": -44.449283599853516, "global_step": 343434, "epoch": 2838} {"train_loss": -43.92622756958008, "global_step": 343435, "epoch": 2838} {"train_loss": -42.95682144165039, "global_step": 343436, "epoch": 2838} {"train_loss": -43.9671630859375, "global_step": 343437, "epoch": 2838} {"train_loss": -44.56232833862305, "global_step": 343438, "epoch": 2838} {"train_loss": -44.003875732421875, "global_step": 343439, "epoch": 2838} {"train_loss": -43.438533782958984, "global_step": 343440, "epoch": 2838} {"train_loss": -43.874149322509766, "global_step": 343441, "epoch": 2838} {"train_loss": -44.85445022583008, "global_step": 343442, "epoch": 2838} {"train_loss": -43.66714096069336, "global_step": 343443, "epoch": 2838} {"train_loss": -44.64786911010742, "global_step": 343444, "epoch": 2838} {"train_loss": -44.68793869018555, "global_step": 343445, "epoch": 2838} {"train_loss": -44.10978317260742, "global_step": 343446, "epoch": 2838} {"train_loss": -44.55231475830078, "global_step": 343447, "epoch": 2838} {"train_loss": -43.96479415893555, "global_step": 343448, "epoch": 2838} {"train_loss": -44.958099365234375, "global_step": 343449, "epoch": 2838} {"train_loss": -45.06272506713867, "global_step": 343450, "epoch": 2838} {"train_loss": -44.379920959472656, "global_step": 343451, "epoch": 2838} {"train_loss": -45.17806625366211, "global_step": 343452, "epoch": 2838} {"train_loss": -44.34314727783203, "global_step": 343453, "epoch": 2838} {"train_loss": -44.566741943359375, "global_step": 343454, "epoch": 2838} {"train_loss": -44.60124588012695, "global_step": 343455, "epoch": 2838} {"train_loss": -44.53326416015625, "global_step": 343456, "epoch": 2838} {"train_loss": -45.16041564941406, "global_step": 343457, "epoch": 2838} {"train_loss": -44.4577751159668, "global_step": 343458, "epoch": 2838} {"train_loss": -44.960750579833984, "global_step": 343459, "epoch": 2838} {"train_loss": -44.804622650146484, "global_step": 343460, "epoch": 2838} {"train_loss": -44.03276062011719, "global_step": 343461, "epoch": 2838} {"train_loss": -44.99747848510742, "global_step": 343462, "epoch": 2838} {"train_loss": -44.294158935546875, "global_step": 343463, "epoch": 2838} {"train_loss": -43.808353424072266, "global_step": 343464, "epoch": 2838} {"train_loss": -44.767826080322266, "global_step": 343465, "epoch": 2838} {"train_loss": -43.94740295410156, "global_step": 343466, "epoch": 2838} {"train_loss": -45.36494064331055, "global_step": 343467, "epoch": 2838} {"train_loss": -44.353450775146484, "global_step": 343468, "epoch": 2838} {"train_loss": -44.73423385620117, "global_step": 343469, "epoch": 2838} {"train_loss": -44.676422119140625, "global_step": 343470, "epoch": 2838} {"train_loss": -44.559852600097656, "global_step": 343471, "epoch": 2838} {"train_loss": -44.59367752075195, "global_step": 343472, "epoch": 2838} {"train_loss": -43.94369125366211, "global_step": 343473, "epoch": 2838} {"train_loss": -44.37543487548828, "global_step": 343474, "epoch": 2838} {"train_loss": -44.279659271240234, "global_step": 343475, "epoch": 2838} {"train_loss": -44.612525939941406, "global_step": 343476, "epoch": 2838} {"train_loss": -44.68708801269531, "global_step": 343477, "epoch": 2838} {"train_loss": -44.6203498840332, "global_step": 343478, "epoch": 2838} {"train_loss": -44.79629135131836, "global_step": 343479, "epoch": 2838} {"train_loss": -44.80149459838867, "global_step": 343480, "epoch": 2838} {"train_loss": -43.53936767578125, "global_step": 343481, "epoch": 2838} {"train_loss": -42.76387405395508, "global_step": 343482, "epoch": 2838} {"train_loss": -40.844966888427734, "global_step": 343483, "epoch": 2838} {"train_loss": -41.20542526245117, "global_step": 343484, "epoch": 2838} {"train_loss": -43.975982666015625, "global_step": 343485, "epoch": 2838} {"train_loss": -40.214012145996094, "global_step": 343486, "epoch": 2838} {"train_loss": -42.60095977783203, "global_step": 343487, "epoch": 2838} {"train_loss": -40.2835807800293, "global_step": 343488, "epoch": 2838} {"train_loss": -37.97701644897461, "global_step": 343489, "epoch": 2838} {"train_loss": -38.54285430908203, "global_step": 343490, "epoch": 2838} {"train_loss": -38.738277435302734, "global_step": 343491, "epoch": 2838} {"train_loss": -39.03799057006836, "global_step": 343492, "epoch": 2838} {"train_loss": -41.06361389160156, "global_step": 343493, "epoch": 2838} {"train_loss": -42.29890441894531, "global_step": 343494, "epoch": 2838} {"train_loss": -42.348819732666016, "global_step": 343495, "epoch": 2838} {"train_loss": -40.9463996887207, "global_step": 343496, "epoch": 2838} {"train_loss": -39.42770004272461, "global_step": 343497, "epoch": 2838} {"train_loss": -42.72651290893555, "global_step": 343498, "epoch": 2838} {"train_loss": -39.68773651123047, "global_step": 343499, "epoch": 2838} {"train_loss": -40.37375259399414, "global_step": 343500, "epoch": 2838} {"train_loss": -39.96449279785156, "global_step": 343501, "epoch": 2838} {"train_loss": -41.318233489990234, "global_step": 343502, "epoch": 2838} {"train_loss": -41.73145294189453, "global_step": 343503, "epoch": 2838} {"train_loss": -39.4508171081543, "global_step": 343504, "epoch": 2838} {"train_loss": -41.5465087890625, "global_step": 343505, "epoch": 2838} {"train_loss": -40.8602294921875, "global_step": 343506, "epoch": 2838} {"train_loss": -42.686397552490234, "global_step": 343507, "epoch": 2838} {"train_loss": -41.75417709350586, "global_step": 343508, "epoch": 2838} {"train_loss": -42.144439697265625, "global_step": 343509, "epoch": 2838} {"train_loss": -43.00113296508789, "global_step": 343510, "epoch": 2838} {"train_loss": -39.27449417114258, "global_step": 343511, "epoch": 2838} {"train_loss": -40.37911605834961, "global_step": 343512, "epoch": 2838} {"train_loss": -41.65011215209961, "global_step": 343513, "epoch": 2838} {"train_loss": -40.87054443359375, "global_step": 343514, "epoch": 2838} {"train_loss": -40.154563903808594, "global_step": 343515, "epoch": 2838} {"train_loss": -41.993072509765625, "global_step": 343516, "epoch": 2838} {"train_loss": -39.43217849731445, "global_step": 343517, "epoch": 2838} {"train_loss": -43.24119079211527, "global_step": 343518, "epoch": 2838, "val_loss": 2460508.25} {"train_loss": -38.68595504760742, "global_step": 343519, "epoch": 2839} {"train_loss": -40.311439514160156, "global_step": 343520, "epoch": 2839} {"train_loss": -39.82544708251953, "global_step": 343521, "epoch": 2839} {"train_loss": -40.09549331665039, "global_step": 343522, "epoch": 2839} {"train_loss": -39.588436126708984, "global_step": 343523, "epoch": 2839} {"train_loss": -40.0674934387207, "global_step": 343524, "epoch": 2839} {"train_loss": -41.894439697265625, "global_step": 343525, "epoch": 2839} {"train_loss": -42.28363037109375, "global_step": 343526, "epoch": 2839} {"train_loss": -42.4195671081543, "global_step": 343527, "epoch": 2839} {"train_loss": -41.508460998535156, "global_step": 343528, "epoch": 2839} {"train_loss": -38.83606719970703, "global_step": 343529, "epoch": 2839} {"train_loss": -41.48982620239258, "global_step": 343530, "epoch": 2839} {"train_loss": -42.161251068115234, "global_step": 343531, "epoch": 2839} {"train_loss": -42.14468765258789, "global_step": 343532, "epoch": 2839} {"train_loss": -42.72802734375, "global_step": 343533, "epoch": 2839} {"train_loss": -42.495094299316406, "global_step": 343534, "epoch": 2839} {"train_loss": -41.28017044067383, "global_step": 343535, "epoch": 2839} {"train_loss": -42.746063232421875, "global_step": 343536, "epoch": 2839} {"train_loss": -42.24772262573242, "global_step": 343537, "epoch": 2839} {"train_loss": -42.016109466552734, "global_step": 343538, "epoch": 2839} {"train_loss": -43.024593353271484, "global_step": 343539, "epoch": 2839} {"train_loss": -43.6272087097168, "global_step": 343540, "epoch": 2839} {"train_loss": -42.7371826171875, "global_step": 343541, "epoch": 2839} {"train_loss": -42.25560760498047, "global_step": 343542, "epoch": 2839} {"train_loss": -43.621437072753906, "global_step": 343543, "epoch": 2839} {"train_loss": -43.83818435668945, "global_step": 343544, "epoch": 2839} {"train_loss": -43.576412200927734, "global_step": 343545, "epoch": 2839} {"train_loss": -43.19306564331055, "global_step": 343546, "epoch": 2839} {"train_loss": -43.33297348022461, "global_step": 343547, "epoch": 2839} {"train_loss": -43.90644073486328, "global_step": 343548, "epoch": 2839} {"train_loss": -43.4581298828125, "global_step": 343549, "epoch": 2839} {"train_loss": -43.40412521362305, "global_step": 343550, "epoch": 2839} {"train_loss": -44.0432243347168, "global_step": 343551, "epoch": 2839} {"train_loss": -44.04828643798828, "global_step": 343552, "epoch": 2839} {"train_loss": -43.70613098144531, "global_step": 343553, "epoch": 2839} {"train_loss": -43.45866775512695, "global_step": 343554, "epoch": 2839} {"train_loss": -43.73579025268555, "global_step": 343555, "epoch": 2839} {"train_loss": -43.938228607177734, "global_step": 343556, "epoch": 2839} {"train_loss": -44.33723831176758, "global_step": 343557, "epoch": 2839} {"train_loss": -44.29648208618164, "global_step": 343558, "epoch": 2839} {"train_loss": -44.34819030761719, "global_step": 343559, "epoch": 2839} {"train_loss": -43.96677780151367, "global_step": 343560, "epoch": 2839} {"train_loss": -44.0440559387207, "global_step": 343561, "epoch": 2839} {"train_loss": -44.11861801147461, "global_step": 343562, "epoch": 2839} {"train_loss": -44.170772552490234, "global_step": 343563, "epoch": 2839} {"train_loss": -44.375762939453125, "global_step": 343564, "epoch": 2839} {"train_loss": -44.588619232177734, "global_step": 343565, "epoch": 2839} {"train_loss": -44.13557052612305, "global_step": 343566, "epoch": 2839} {"train_loss": -44.090816497802734, "global_step": 343567, "epoch": 2839} {"train_loss": -44.40244674682617, "global_step": 343568, "epoch": 2839} {"train_loss": -44.203712463378906, "global_step": 343569, "epoch": 2839} {"train_loss": -44.5819091796875, "global_step": 343570, "epoch": 2839} {"train_loss": -44.66298294067383, "global_step": 343571, "epoch": 2839} {"train_loss": -44.439422607421875, "global_step": 343572, "epoch": 2839} {"train_loss": -44.53377914428711, "global_step": 343573, "epoch": 2839} {"train_loss": -44.165889739990234, "global_step": 343574, "epoch": 2839} {"train_loss": -44.05317306518555, "global_step": 343575, "epoch": 2839} {"train_loss": -44.845672607421875, "global_step": 343576, "epoch": 2839} {"train_loss": -44.0900993347168, "global_step": 343577, "epoch": 2839} {"train_loss": -45.02341842651367, "global_step": 343578, "epoch": 2839} {"train_loss": -45.35336685180664, "global_step": 343579, "epoch": 2839} {"train_loss": -45.087223052978516, "global_step": 343580, "epoch": 2839} {"train_loss": -45.348236083984375, "global_step": 343581, "epoch": 2839} {"train_loss": -44.78139114379883, "global_step": 343582, "epoch": 2839} {"train_loss": -44.83736038208008, "global_step": 343583, "epoch": 2839} {"train_loss": -44.34919357299805, "global_step": 343584, "epoch": 2839} {"train_loss": -44.738582611083984, "global_step": 343585, "epoch": 2839} {"train_loss": -45.38351058959961, "global_step": 343586, "epoch": 2839} {"train_loss": -45.27213668823242, "global_step": 343587, "epoch": 2839} {"train_loss": -45.2359733581543, "global_step": 343588, "epoch": 2839} {"train_loss": -44.45479202270508, "global_step": 343589, "epoch": 2839} {"train_loss": -44.94197082519531, "global_step": 343590, "epoch": 2839} {"train_loss": -44.492069244384766, "global_step": 343591, "epoch": 2839} {"train_loss": -44.17653274536133, "global_step": 343592, "epoch": 2839} {"train_loss": -43.3056755065918, "global_step": 343593, "epoch": 2839} {"train_loss": -43.5064811706543, "global_step": 343594, "epoch": 2839} {"train_loss": -43.7924690246582, "global_step": 343595, "epoch": 2839} {"train_loss": -44.344207763671875, "global_step": 343596, "epoch": 2839} {"train_loss": -44.17182540893555, "global_step": 343597, "epoch": 2839} {"train_loss": -42.79498291015625, "global_step": 343598, "epoch": 2839} {"train_loss": -41.83960723876953, "global_step": 343599, "epoch": 2839} {"train_loss": -43.304439544677734, "global_step": 343600, "epoch": 2839} {"train_loss": -42.294898986816406, "global_step": 343601, "epoch": 2839} {"train_loss": -44.264556884765625, "global_step": 343602, "epoch": 2839} {"train_loss": -43.97970199584961, "global_step": 343603, "epoch": 2839} {"train_loss": -41.46158218383789, "global_step": 343604, "epoch": 2839} {"train_loss": -42.32985305786133, "global_step": 343605, "epoch": 2839} {"train_loss": -43.48622131347656, "global_step": 343606, "epoch": 2839} {"train_loss": -43.35213851928711, "global_step": 343607, "epoch": 2839} {"train_loss": -44.20732116699219, "global_step": 343608, "epoch": 2839} {"train_loss": -43.63581466674805, "global_step": 343609, "epoch": 2839} {"train_loss": -41.88663864135742, "global_step": 343610, "epoch": 2839} {"train_loss": -44.084083557128906, "global_step": 343611, "epoch": 2839} {"train_loss": -42.478485107421875, "global_step": 343612, "epoch": 2839} {"train_loss": -43.419189453125, "global_step": 343613, "epoch": 2839} {"train_loss": -43.425750732421875, "global_step": 343614, "epoch": 2839} {"train_loss": -43.13336944580078, "global_step": 343615, "epoch": 2839} {"train_loss": -44.057254791259766, "global_step": 343616, "epoch": 2839} {"train_loss": -44.2425651550293, "global_step": 343617, "epoch": 2839} {"train_loss": -44.35313415527344, "global_step": 343618, "epoch": 2839} {"train_loss": -44.0076789855957, "global_step": 343619, "epoch": 2839} {"train_loss": -43.5054817199707, "global_step": 343620, "epoch": 2839} {"train_loss": -43.82246017456055, "global_step": 343621, "epoch": 2839} {"train_loss": -44.1384391784668, "global_step": 343622, "epoch": 2839} {"train_loss": -44.161739349365234, "global_step": 343623, "epoch": 2839} {"train_loss": -44.99882507324219, "global_step": 343624, "epoch": 2839} {"train_loss": -44.00550079345703, "global_step": 343625, "epoch": 2839} {"train_loss": -44.652339935302734, "global_step": 343626, "epoch": 2839} {"train_loss": -44.26420211791992, "global_step": 343627, "epoch": 2839} {"train_loss": -44.7276611328125, "global_step": 343628, "epoch": 2839} {"train_loss": -45.11293411254883, "global_step": 343629, "epoch": 2839} {"train_loss": -44.65081787109375, "global_step": 343630, "epoch": 2839} {"train_loss": -44.5073356628418, "global_step": 343631, "epoch": 2839} {"train_loss": -44.91658401489258, "global_step": 343632, "epoch": 2839} {"train_loss": -44.33260726928711, "global_step": 343633, "epoch": 2839} {"train_loss": -44.811065673828125, "global_step": 343634, "epoch": 2839} {"train_loss": -44.31853103637695, "global_step": 343635, "epoch": 2839} {"train_loss": -44.741798400878906, "global_step": 343636, "epoch": 2839} {"train_loss": -44.620819091796875, "global_step": 343637, "epoch": 2839} {"train_loss": -44.50863265991211, "global_step": 343638, "epoch": 2839} {"train_loss": -43.57724667383619, "global_step": 343639, "epoch": 2839, "val_loss": 2622345.5} {"train_loss": -42.97105026245117, "global_step": 343640, "epoch": 2840} {"train_loss": -43.67446517944336, "global_step": 343641, "epoch": 2840} {"train_loss": -43.196041107177734, "global_step": 343642, "epoch": 2840} {"train_loss": -40.91620635986328, "global_step": 343643, "epoch": 2840} {"train_loss": -44.29731369018555, "global_step": 343644, "epoch": 2840} {"train_loss": -42.42107009887695, "global_step": 343645, "epoch": 2840} {"train_loss": -43.521141052246094, "global_step": 343646, "epoch": 2840} {"train_loss": -42.557952880859375, "global_step": 343647, "epoch": 2840} {"train_loss": -42.723968505859375, "global_step": 343648, "epoch": 2840} {"train_loss": -43.44923782348633, "global_step": 343649, "epoch": 2840} {"train_loss": -42.8648796081543, "global_step": 343650, "epoch": 2840} {"train_loss": -43.272857666015625, "global_step": 343651, "epoch": 2840} {"train_loss": -44.080474853515625, "global_step": 343652, "epoch": 2840} {"train_loss": -43.62363815307617, "global_step": 343653, "epoch": 2840} {"train_loss": -44.084529876708984, "global_step": 343654, "epoch": 2840} {"train_loss": -43.15946578979492, "global_step": 343655, "epoch": 2840} {"train_loss": -44.43393325805664, "global_step": 343656, "epoch": 2840} {"train_loss": -43.563045501708984, "global_step": 343657, "epoch": 2840} {"train_loss": -44.36349105834961, "global_step": 343658, "epoch": 2840} {"train_loss": -42.52640914916992, "global_step": 343659, "epoch": 2840} {"train_loss": -43.69124984741211, "global_step": 343660, "epoch": 2840} {"train_loss": -42.256927490234375, "global_step": 343661, "epoch": 2840} {"train_loss": -44.46880340576172, "global_step": 343662, "epoch": 2840} {"train_loss": -43.43756866455078, "global_step": 343663, "epoch": 2840} {"train_loss": -42.66102981567383, "global_step": 343664, "epoch": 2840} {"train_loss": -44.15890121459961, "global_step": 343665, "epoch": 2840} {"train_loss": -42.48440170288086, "global_step": 343666, "epoch": 2840} {"train_loss": -42.37130355834961, "global_step": 343667, "epoch": 2840} {"train_loss": -43.499900817871094, "global_step": 343668, "epoch": 2840} {"train_loss": -42.02810287475586, "global_step": 343669, "epoch": 2840} {"train_loss": -43.78995895385742, "global_step": 343670, "epoch": 2840} {"train_loss": -42.54608154296875, "global_step": 343671, "epoch": 2840} {"train_loss": -44.325050354003906, "global_step": 343672, "epoch": 2840} {"train_loss": -42.80014419555664, "global_step": 343673, "epoch": 2840} {"train_loss": -44.40800857543945, "global_step": 343674, "epoch": 2840} {"train_loss": -44.2697868347168, "global_step": 343675, "epoch": 2840} {"train_loss": -43.78644943237305, "global_step": 343676, "epoch": 2840} {"train_loss": -43.875511169433594, "global_step": 343677, "epoch": 2840} {"train_loss": -44.514156341552734, "global_step": 343678, "epoch": 2840} {"train_loss": -44.11434555053711, "global_step": 343679, "epoch": 2840} {"train_loss": -44.5023307800293, "global_step": 343680, "epoch": 2840} {"train_loss": -44.575748443603516, "global_step": 343681, "epoch": 2840} {"train_loss": -45.02107238769531, "global_step": 343682, "epoch": 2840} {"train_loss": -44.659881591796875, "global_step": 343683, "epoch": 2840} {"train_loss": -44.79229736328125, "global_step": 343684, "epoch": 2840} {"train_loss": -44.45551681518555, "global_step": 343685, "epoch": 2840} {"train_loss": -44.83478546142578, "global_step": 343686, "epoch": 2840} {"train_loss": -44.811256408691406, "global_step": 343687, "epoch": 2840} {"train_loss": -44.47766876220703, "global_step": 343688, "epoch": 2840} {"train_loss": -44.85667419433594, "global_step": 343689, "epoch": 2840} {"train_loss": -44.745269775390625, "global_step": 343690, "epoch": 2840} {"train_loss": -44.556861877441406, "global_step": 343691, "epoch": 2840} {"train_loss": -43.84652328491211, "global_step": 343692, "epoch": 2840} {"train_loss": -45.13722610473633, "global_step": 343693, "epoch": 2840} {"train_loss": -44.705055236816406, "global_step": 343694, "epoch": 2840} {"train_loss": -45.07609939575195, "global_step": 343695, "epoch": 2840} {"train_loss": -44.60090255737305, "global_step": 343696, "epoch": 2840} {"train_loss": -44.88933181762695, "global_step": 343697, "epoch": 2840} {"train_loss": -45.2018928527832, "global_step": 343698, "epoch": 2840} {"train_loss": -44.96588134765625, "global_step": 343699, "epoch": 2840} {"train_loss": -44.47471237182617, "global_step": 343700, "epoch": 2840} {"train_loss": -44.04938888549805, "global_step": 343701, "epoch": 2840} {"train_loss": -45.48918533325195, "global_step": 343702, "epoch": 2840} {"train_loss": -45.37847900390625, "global_step": 343703, "epoch": 2840} {"train_loss": -45.102943420410156, "global_step": 343704, "epoch": 2840} {"train_loss": -44.526275634765625, "global_step": 343705, "epoch": 2840} {"train_loss": -45.04212188720703, "global_step": 343706, "epoch": 2840} {"train_loss": -45.59675216674805, "global_step": 343707, "epoch": 2840} {"train_loss": -44.8953857421875, "global_step": 343708, "epoch": 2840} {"train_loss": -44.80268478393555, "global_step": 343709, "epoch": 2840} {"train_loss": -45.00299835205078, "global_step": 343710, "epoch": 2840} {"train_loss": -45.345272064208984, "global_step": 343711, "epoch": 2840} {"train_loss": -45.1339111328125, "global_step": 343712, "epoch": 2840} {"train_loss": -44.845523834228516, "global_step": 343713, "epoch": 2840} {"train_loss": -45.067161560058594, "global_step": 343714, "epoch": 2840} {"train_loss": -45.24673080444336, "global_step": 343715, "epoch": 2840} {"train_loss": -45.20671463012695, "global_step": 343716, "epoch": 2840} {"train_loss": -44.98836135864258, "global_step": 343717, "epoch": 2840} {"train_loss": -43.50892639160156, "global_step": 343718, "epoch": 2840} {"train_loss": -44.526832580566406, "global_step": 343719, "epoch": 2840} {"train_loss": -44.10826110839844, "global_step": 343720, "epoch": 2840} {"train_loss": -45.2743034362793, "global_step": 343721, "epoch": 2840} {"train_loss": -45.544830322265625, "global_step": 343722, "epoch": 2840} {"train_loss": -45.25938034057617, "global_step": 343723, "epoch": 2840} {"train_loss": -44.741607666015625, "global_step": 343724, "epoch": 2840} {"train_loss": -44.95759963989258, "global_step": 343725, "epoch": 2840} {"train_loss": -45.23112869262695, "global_step": 343726, "epoch": 2840} {"train_loss": -45.57598876953125, "global_step": 343727, "epoch": 2840} {"train_loss": -45.0606803894043, "global_step": 343728, "epoch": 2840} {"train_loss": -44.299468994140625, "global_step": 343729, "epoch": 2840} {"train_loss": -45.104217529296875, "global_step": 343730, "epoch": 2840} {"train_loss": -44.54066848754883, "global_step": 343731, "epoch": 2840} {"train_loss": -42.011924743652344, "global_step": 343732, "epoch": 2840} {"train_loss": -42.498451232910156, "global_step": 343733, "epoch": 2840} {"train_loss": -45.245059967041016, "global_step": 343734, "epoch": 2840} {"train_loss": -43.19529724121094, "global_step": 343735, "epoch": 2840} {"train_loss": -41.79690170288086, "global_step": 343736, "epoch": 2840} {"train_loss": -44.433441162109375, "global_step": 343737, "epoch": 2840} {"train_loss": -42.90607833862305, "global_step": 343738, "epoch": 2840} {"train_loss": -42.07045364379883, "global_step": 343739, "epoch": 2840} {"train_loss": -44.76025390625, "global_step": 343740, "epoch": 2840} {"train_loss": -41.3901481628418, "global_step": 343741, "epoch": 2840} {"train_loss": -44.59899139404297, "global_step": 343742, "epoch": 2840} {"train_loss": -42.37981033325195, "global_step": 343743, "epoch": 2840} {"train_loss": -39.789363861083984, "global_step": 343744, "epoch": 2840} {"train_loss": -41.119728088378906, "global_step": 343745, "epoch": 2840} {"train_loss": -41.043617248535156, "global_step": 343746, "epoch": 2840} {"train_loss": -40.46725082397461, "global_step": 343747, "epoch": 2840} {"train_loss": -41.33050537109375, "global_step": 343748, "epoch": 2840} {"train_loss": -43.37232208251953, "global_step": 343749, "epoch": 2840} {"train_loss": -43.80189895629883, "global_step": 343750, "epoch": 2840} {"train_loss": -41.09560012817383, "global_step": 343751, "epoch": 2840} {"train_loss": -43.16242218017578, "global_step": 343752, "epoch": 2840} {"train_loss": -41.11480712890625, "global_step": 343753, "epoch": 2840} {"train_loss": -42.753692626953125, "global_step": 343754, "epoch": 2840} {"train_loss": -42.252357482910156, "global_step": 343755, "epoch": 2840} {"train_loss": -42.801143646240234, "global_step": 343756, "epoch": 2840} {"train_loss": -43.2064094543457, "global_step": 343757, "epoch": 2840} {"train_loss": -42.03510284423828, "global_step": 343758, "epoch": 2840} {"train_loss": -42.924434661865234, "global_step": 343759, "epoch": 2840} {"train_loss": -43.8048712044708, "global_step": 343760, "epoch": 2840, "val_loss": 2634903.25} {"train_loss": -43.224761962890625, "global_step": 343761, "epoch": 2841} {"train_loss": -43.45036315917969, "global_step": 343762, "epoch": 2841} {"train_loss": -42.89344024658203, "global_step": 343763, "epoch": 2841} {"train_loss": -43.457313537597656, "global_step": 343764, "epoch": 2841} {"train_loss": -43.6740837097168, "global_step": 343765, "epoch": 2841} {"train_loss": -43.39944076538086, "global_step": 343766, "epoch": 2841} {"train_loss": -43.944725036621094, "global_step": 343767, "epoch": 2841} {"train_loss": -43.869136810302734, "global_step": 343768, "epoch": 2841} {"train_loss": -44.18238067626953, "global_step": 343769, "epoch": 2841} {"train_loss": -43.907920837402344, "global_step": 343770, "epoch": 2841} {"train_loss": -44.21963119506836, "global_step": 343771, "epoch": 2841} {"train_loss": -43.95429611206055, "global_step": 343772, "epoch": 2841} {"train_loss": -43.052337646484375, "global_step": 343773, "epoch": 2841} {"train_loss": -44.8897705078125, "global_step": 343774, "epoch": 2841} {"train_loss": -44.2329216003418, "global_step": 343775, "epoch": 2841} {"train_loss": -44.0473518371582, "global_step": 343776, "epoch": 2841} {"train_loss": -43.99873733520508, "global_step": 343777, "epoch": 2841} {"train_loss": -44.342037200927734, "global_step": 343778, "epoch": 2841} {"train_loss": -44.57981491088867, "global_step": 343779, "epoch": 2841} {"train_loss": -43.99917984008789, "global_step": 343780, "epoch": 2841} {"train_loss": -43.79688262939453, "global_step": 343781, "epoch": 2841} {"train_loss": -45.0181999206543, "global_step": 343782, "epoch": 2841} {"train_loss": -45.16853713989258, "global_step": 343783, "epoch": 2841} {"train_loss": -44.370758056640625, "global_step": 343784, "epoch": 2841} {"train_loss": -45.10612869262695, "global_step": 343785, "epoch": 2841} {"train_loss": -44.62172317504883, "global_step": 343786, "epoch": 2841} {"train_loss": -43.81092071533203, "global_step": 343787, "epoch": 2841} {"train_loss": -44.41622543334961, "global_step": 343788, "epoch": 2841} {"train_loss": -44.65536117553711, "global_step": 343789, "epoch": 2841} {"train_loss": -44.437923431396484, "global_step": 343790, "epoch": 2841} {"train_loss": -44.47802734375, "global_step": 343791, "epoch": 2841} {"train_loss": -43.39540481567383, "global_step": 343792, "epoch": 2841} {"train_loss": -44.89594650268555, "global_step": 343793, "epoch": 2841} {"train_loss": -44.991065979003906, "global_step": 343794, "epoch": 2841} {"train_loss": -44.772491455078125, "global_step": 343795, "epoch": 2841} {"train_loss": -44.96296310424805, "global_step": 343796, "epoch": 2841} {"train_loss": -45.44432067871094, "global_step": 343797, "epoch": 2841} {"train_loss": -45.270790100097656, "global_step": 343798, "epoch": 2841} {"train_loss": -44.55825424194336, "global_step": 343799, "epoch": 2841} {"train_loss": -44.779991149902344, "global_step": 343800, "epoch": 2841} {"train_loss": -44.73850631713867, "global_step": 343801, "epoch": 2841} {"train_loss": -44.16473388671875, "global_step": 343802, "epoch": 2841} {"train_loss": -44.58369064331055, "global_step": 343803, "epoch": 2841} {"train_loss": -44.33661651611328, "global_step": 343804, "epoch": 2841} {"train_loss": -43.805870056152344, "global_step": 343805, "epoch": 2841} {"train_loss": -43.75620651245117, "global_step": 343806, "epoch": 2841} {"train_loss": -43.485328674316406, "global_step": 343807, "epoch": 2841} {"train_loss": -43.49418640136719, "global_step": 343808, "epoch": 2841} {"train_loss": -44.5215950012207, "global_step": 343809, "epoch": 2841} {"train_loss": -43.928401947021484, "global_step": 343810, "epoch": 2841} {"train_loss": -43.13742446899414, "global_step": 343811, "epoch": 2841} {"train_loss": -44.57987594604492, "global_step": 343812, "epoch": 2841} {"train_loss": -44.58061599731445, "global_step": 343813, "epoch": 2841} {"train_loss": -43.83308029174805, "global_step": 343814, "epoch": 2841} {"train_loss": -44.53457260131836, "global_step": 343815, "epoch": 2841} {"train_loss": -42.619319915771484, "global_step": 343816, "epoch": 2841} {"train_loss": -43.8718147277832, "global_step": 343817, "epoch": 2841} {"train_loss": -44.845489501953125, "global_step": 343818, "epoch": 2841} {"train_loss": -43.50413131713867, "global_step": 343819, "epoch": 2841} {"train_loss": -44.06718063354492, "global_step": 343820, "epoch": 2841} {"train_loss": -44.927791595458984, "global_step": 343821, "epoch": 2841} {"train_loss": -43.35002136230469, "global_step": 343822, "epoch": 2841} {"train_loss": -44.32416915893555, "global_step": 343823, "epoch": 2841} {"train_loss": -43.777671813964844, "global_step": 343824, "epoch": 2841} {"train_loss": -43.903594970703125, "global_step": 343825, "epoch": 2841} {"train_loss": -45.35246276855469, "global_step": 343826, "epoch": 2841} {"train_loss": -43.58535385131836, "global_step": 343827, "epoch": 2841} {"train_loss": -43.38924026489258, "global_step": 343828, "epoch": 2841} {"train_loss": -45.192298889160156, "global_step": 343829, "epoch": 2841} {"train_loss": -44.09288787841797, "global_step": 343830, "epoch": 2841} {"train_loss": -44.02621078491211, "global_step": 343831, "epoch": 2841} {"train_loss": -44.31465148925781, "global_step": 343832, "epoch": 2841} {"train_loss": -43.435428619384766, "global_step": 343833, "epoch": 2841} {"train_loss": -43.61930465698242, "global_step": 343834, "epoch": 2841} {"train_loss": -44.03681564331055, "global_step": 343835, "epoch": 2841} {"train_loss": -43.99951171875, "global_step": 343836, "epoch": 2841} {"train_loss": -43.52507400512695, "global_step": 343837, "epoch": 2841} {"train_loss": -43.86179733276367, "global_step": 343838, "epoch": 2841} {"train_loss": -44.69163131713867, "global_step": 343839, "epoch": 2841} {"train_loss": -43.84284973144531, "global_step": 343840, "epoch": 2841} {"train_loss": -44.38898849487305, "global_step": 343841, "epoch": 2841} {"train_loss": -44.00761032104492, "global_step": 343842, "epoch": 2841} {"train_loss": -42.157230377197266, "global_step": 343843, "epoch": 2841} {"train_loss": -44.03588104248047, "global_step": 343844, "epoch": 2841} {"train_loss": -43.27979278564453, "global_step": 343845, "epoch": 2841} {"train_loss": -43.90256881713867, "global_step": 343846, "epoch": 2841} {"train_loss": -44.25967788696289, "global_step": 343847, "epoch": 2841} {"train_loss": -43.42934799194336, "global_step": 343848, "epoch": 2841} {"train_loss": -43.17222213745117, "global_step": 343849, "epoch": 2841} {"train_loss": -44.82200622558594, "global_step": 343850, "epoch": 2841} {"train_loss": -43.0999641418457, "global_step": 343851, "epoch": 2841} {"train_loss": -43.30092239379883, "global_step": 343852, "epoch": 2841} {"train_loss": -43.92980194091797, "global_step": 343853, "epoch": 2841} {"train_loss": -44.43893051147461, "global_step": 343854, "epoch": 2841} {"train_loss": -43.608741760253906, "global_step": 343855, "epoch": 2841} {"train_loss": -44.97123718261719, "global_step": 343856, "epoch": 2841} {"train_loss": -44.792823791503906, "global_step": 343857, "epoch": 2841} {"train_loss": -44.1172981262207, "global_step": 343858, "epoch": 2841} {"train_loss": -44.66203689575195, "global_step": 343859, "epoch": 2841} {"train_loss": -44.05677032470703, "global_step": 343860, "epoch": 2841} {"train_loss": -44.2795524597168, "global_step": 343861, "epoch": 2841} {"train_loss": -44.9061393737793, "global_step": 343862, "epoch": 2841} {"train_loss": -43.896827697753906, "global_step": 343863, "epoch": 2841} {"train_loss": -44.23876953125, "global_step": 343864, "epoch": 2841} {"train_loss": -44.337562561035156, "global_step": 343865, "epoch": 2841} {"train_loss": -44.336421966552734, "global_step": 343866, "epoch": 2841} {"train_loss": -43.935543060302734, "global_step": 343867, "epoch": 2841} {"train_loss": -45.14716720581055, "global_step": 343868, "epoch": 2841} {"train_loss": -44.72763442993164, "global_step": 343869, "epoch": 2841} {"train_loss": -42.94865417480469, "global_step": 343870, "epoch": 2841} {"train_loss": -44.439300537109375, "global_step": 343871, "epoch": 2841} {"train_loss": -44.20132827758789, "global_step": 343872, "epoch": 2841} {"train_loss": -43.53445053100586, "global_step": 343873, "epoch": 2841} {"train_loss": -44.31022262573242, "global_step": 343874, "epoch": 2841} {"train_loss": -44.28539276123047, "global_step": 343875, "epoch": 2841} {"train_loss": -43.66229248046875, "global_step": 343876, "epoch": 2841} {"train_loss": -44.944820404052734, "global_step": 343877, "epoch": 2841} {"train_loss": -44.74951171875, "global_step": 343878, "epoch": 2841} {"train_loss": -44.646419525146484, "global_step": 343879, "epoch": 2841} {"train_loss": -42.94729232788086, "global_step": 343880, "epoch": 2841} {"train_loss": -44.12099245560071, "global_step": 343881, "epoch": 2841, "val_loss": 2658091.75} {"train_loss": -44.37672805786133, "global_step": 343882, "epoch": 2842} {"train_loss": -43.75873565673828, "global_step": 343883, "epoch": 2842} {"train_loss": -43.08888244628906, "global_step": 343884, "epoch": 2842} {"train_loss": -44.481197357177734, "global_step": 343885, "epoch": 2842} {"train_loss": -45.09645462036133, "global_step": 343886, "epoch": 2842} {"train_loss": -42.83949661254883, "global_step": 343887, "epoch": 2842} {"train_loss": -44.53776168823242, "global_step": 343888, "epoch": 2842} {"train_loss": -44.96392059326172, "global_step": 343889, "epoch": 2842} {"train_loss": -43.27755355834961, "global_step": 343890, "epoch": 2842} {"train_loss": -42.80058670043945, "global_step": 343891, "epoch": 2842} {"train_loss": -44.403907775878906, "global_step": 343892, "epoch": 2842} {"train_loss": -44.54419708251953, "global_step": 343893, "epoch": 2842} {"train_loss": -42.81638717651367, "global_step": 343894, "epoch": 2842} {"train_loss": -44.546241760253906, "global_step": 343895, "epoch": 2842} {"train_loss": -45.14376449584961, "global_step": 343896, "epoch": 2842} {"train_loss": -43.578041076660156, "global_step": 343897, "epoch": 2842} {"train_loss": -44.359222412109375, "global_step": 343898, "epoch": 2842} {"train_loss": -43.37824630737305, "global_step": 343899, "epoch": 2842} {"train_loss": -42.06201934814453, "global_step": 343900, "epoch": 2842} {"train_loss": -43.836910247802734, "global_step": 343901, "epoch": 2842} {"train_loss": -42.14474105834961, "global_step": 343902, "epoch": 2842} {"train_loss": -43.619319915771484, "global_step": 343903, "epoch": 2842} {"train_loss": -43.92387390136719, "global_step": 343904, "epoch": 2842} {"train_loss": -41.67544937133789, "global_step": 343905, "epoch": 2842} {"train_loss": -43.321346282958984, "global_step": 343906, "epoch": 2842} {"train_loss": -42.65015411376953, "global_step": 343907, "epoch": 2842} {"train_loss": -44.534793853759766, "global_step": 343908, "epoch": 2842} {"train_loss": -43.900184631347656, "global_step": 343909, "epoch": 2842} {"train_loss": -44.630470275878906, "global_step": 343910, "epoch": 2842} {"train_loss": -44.33320999145508, "global_step": 343911, "epoch": 2842} {"train_loss": -44.567291259765625, "global_step": 343912, "epoch": 2842} {"train_loss": -43.856597900390625, "global_step": 343913, "epoch": 2842} {"train_loss": -44.57914352416992, "global_step": 343914, "epoch": 2842} {"train_loss": -44.03164291381836, "global_step": 343915, "epoch": 2842} {"train_loss": -44.501991271972656, "global_step": 343916, "epoch": 2842} {"train_loss": -44.9976692199707, "global_step": 343917, "epoch": 2842} {"train_loss": -44.14678955078125, "global_step": 343918, "epoch": 2842} {"train_loss": -44.93125534057617, "global_step": 343919, "epoch": 2842} {"train_loss": -44.509857177734375, "global_step": 343920, "epoch": 2842} {"train_loss": -44.920021057128906, "global_step": 343921, "epoch": 2842} {"train_loss": -44.88899230957031, "global_step": 343922, "epoch": 2842} {"train_loss": -44.607574462890625, "global_step": 343923, "epoch": 2842} {"train_loss": -44.8273811340332, "global_step": 343924, "epoch": 2842} {"train_loss": -44.96206283569336, "global_step": 343925, "epoch": 2842} {"train_loss": -44.537235260009766, "global_step": 343926, "epoch": 2842} {"train_loss": -44.12040328979492, "global_step": 343927, "epoch": 2842} {"train_loss": -44.16001510620117, "global_step": 343928, "epoch": 2842} {"train_loss": -44.50222396850586, "global_step": 343929, "epoch": 2842} {"train_loss": -44.654449462890625, "global_step": 343930, "epoch": 2842} {"train_loss": -44.07432174682617, "global_step": 343931, "epoch": 2842} {"train_loss": -44.29502868652344, "global_step": 343932, "epoch": 2842} {"train_loss": -44.85380172729492, "global_step": 343933, "epoch": 2842} {"train_loss": -44.99755859375, "global_step": 343934, "epoch": 2842} {"train_loss": -45.1884651184082, "global_step": 343935, "epoch": 2842} {"train_loss": -44.5732536315918, "global_step": 343936, "epoch": 2842} {"train_loss": -44.84486389160156, "global_step": 343937, "epoch": 2842} {"train_loss": -45.389129638671875, "global_step": 343938, "epoch": 2842} {"train_loss": -45.42670822143555, "global_step": 343939, "epoch": 2842} {"train_loss": -45.16781234741211, "global_step": 343940, "epoch": 2842} {"train_loss": -45.07706832885742, "global_step": 343941, "epoch": 2842} {"train_loss": -44.991249084472656, "global_step": 343942, "epoch": 2842} {"train_loss": -45.770084381103516, "global_step": 343943, "epoch": 2842} {"train_loss": -45.06271743774414, "global_step": 343944, "epoch": 2842} {"train_loss": -45.71949768066406, "global_step": 343945, "epoch": 2842} {"train_loss": -45.433292388916016, "global_step": 343946, "epoch": 2842} {"train_loss": -45.60061264038086, "global_step": 343947, "epoch": 2842} {"train_loss": -45.1026725769043, "global_step": 343948, "epoch": 2842} {"train_loss": -45.52294921875, "global_step": 343949, "epoch": 2842} {"train_loss": -45.32148361206055, "global_step": 343950, "epoch": 2842} {"train_loss": -45.65745162963867, "global_step": 343951, "epoch": 2842} {"train_loss": -45.38605880737305, "global_step": 343952, "epoch": 2842} {"train_loss": -45.11886215209961, "global_step": 343953, "epoch": 2842} {"train_loss": -45.60661697387695, "global_step": 343954, "epoch": 2842} {"train_loss": -45.49260330200195, "global_step": 343955, "epoch": 2842} {"train_loss": -45.50003433227539, "global_step": 343956, "epoch": 2842} {"train_loss": -45.6281623840332, "global_step": 343957, "epoch": 2842} {"train_loss": -45.44829177856445, "global_step": 343958, "epoch": 2842} {"train_loss": -44.94893264770508, "global_step": 343959, "epoch": 2842} {"train_loss": -45.556640625, "global_step": 343960, "epoch": 2842} {"train_loss": -45.13277816772461, "global_step": 343961, "epoch": 2842} {"train_loss": -45.22507858276367, "global_step": 343962, "epoch": 2842} {"train_loss": -45.61823654174805, "global_step": 343963, "epoch": 2842} {"train_loss": -45.94480895996094, "global_step": 343964, "epoch": 2842} {"train_loss": -45.5119743347168, "global_step": 343965, "epoch": 2842} {"train_loss": -45.877052307128906, "global_step": 343966, "epoch": 2842} {"train_loss": -45.59889602661133, "global_step": 343967, "epoch": 2842} {"train_loss": -45.879451751708984, "global_step": 343968, "epoch": 2842} {"train_loss": -45.62632751464844, "global_step": 343969, "epoch": 2842} {"train_loss": -46.047325134277344, "global_step": 343970, "epoch": 2842} {"train_loss": -45.39257049560547, "global_step": 343971, "epoch": 2842} {"train_loss": -44.4136962890625, "global_step": 343972, "epoch": 2842} {"train_loss": -44.15753936767578, "global_step": 343973, "epoch": 2842} {"train_loss": -44.508724212646484, "global_step": 343974, "epoch": 2842} {"train_loss": -45.51830291748047, "global_step": 343975, "epoch": 2842} {"train_loss": -44.90543746948242, "global_step": 343976, "epoch": 2842} {"train_loss": -43.51488494873047, "global_step": 343977, "epoch": 2842} {"train_loss": -43.421142578125, "global_step": 343978, "epoch": 2842} {"train_loss": -45.38975143432617, "global_step": 343979, "epoch": 2842} {"train_loss": -44.562774658203125, "global_step": 343980, "epoch": 2842} {"train_loss": -41.29978942871094, "global_step": 343981, "epoch": 2842} {"train_loss": -44.29998779296875, "global_step": 343982, "epoch": 2842} {"train_loss": -44.00786209106445, "global_step": 343983, "epoch": 2842} {"train_loss": -41.89944839477539, "global_step": 343984, "epoch": 2842} {"train_loss": -44.900516510009766, "global_step": 343985, "epoch": 2842} {"train_loss": -42.052520751953125, "global_step": 343986, "epoch": 2842} {"train_loss": -43.580753326416016, "global_step": 343987, "epoch": 2842} {"train_loss": -41.17977523803711, "global_step": 343988, "epoch": 2842} {"train_loss": -44.033935546875, "global_step": 343989, "epoch": 2842} {"train_loss": -42.15998458862305, "global_step": 343990, "epoch": 2842} {"train_loss": -41.787445068359375, "global_step": 343991, "epoch": 2842} {"train_loss": -44.246742248535156, "global_step": 343992, "epoch": 2842} {"train_loss": -40.06262969970703, "global_step": 343993, "epoch": 2842} {"train_loss": -43.361358642578125, "global_step": 343994, "epoch": 2842} {"train_loss": -38.60152816772461, "global_step": 343995, "epoch": 2842} {"train_loss": -39.83522415161133, "global_step": 343996, "epoch": 2842} {"train_loss": -41.841766357421875, "global_step": 343997, "epoch": 2842} {"train_loss": -42.228187561035156, "global_step": 343998, "epoch": 2842} {"train_loss": -42.02900314331055, "global_step": 343999, "epoch": 2842} {"train_loss": -41.55072784423828, "global_step": 344000, "epoch": 2842} {"train_loss": -39.77492904663086, "global_step": 344001, "epoch": 2842} {"train_loss": -44.16875445153102, "global_step": 344002, "epoch": 2842, "val_loss": 2660199.0} {"train_loss": -40.56702423095703, "global_step": 344003, "epoch": 2843} {"train_loss": -43.57852554321289, "global_step": 344004, "epoch": 2843} {"train_loss": -41.049068450927734, "global_step": 344005, "epoch": 2843} {"train_loss": -42.201446533203125, "global_step": 344006, "epoch": 2843} {"train_loss": -42.9472770690918, "global_step": 344007, "epoch": 2843} {"train_loss": -43.291385650634766, "global_step": 344008, "epoch": 2843} {"train_loss": -42.49696731567383, "global_step": 344009, "epoch": 2843} {"train_loss": -44.26140594482422, "global_step": 344010, "epoch": 2843} {"train_loss": -42.77363204956055, "global_step": 344011, "epoch": 2843} {"train_loss": -43.178550720214844, "global_step": 344012, "epoch": 2843} {"train_loss": -43.157161712646484, "global_step": 344013, "epoch": 2843} {"train_loss": -42.480560302734375, "global_step": 344014, "epoch": 2843} {"train_loss": -42.73038864135742, "global_step": 344015, "epoch": 2843} {"train_loss": -44.39008331298828, "global_step": 344016, "epoch": 2843} {"train_loss": -41.93849563598633, "global_step": 344017, "epoch": 2843} {"train_loss": -43.44194412231445, "global_step": 344018, "epoch": 2843} {"train_loss": -44.420814514160156, "global_step": 344019, "epoch": 2843} {"train_loss": -44.11789321899414, "global_step": 344020, "epoch": 2843} {"train_loss": -44.314205169677734, "global_step": 344021, "epoch": 2843} {"train_loss": -44.12638473510742, "global_step": 344022, "epoch": 2843} {"train_loss": -44.13973617553711, "global_step": 344023, "epoch": 2843} {"train_loss": -44.009002685546875, "global_step": 344024, "epoch": 2843} {"train_loss": -44.53840255737305, "global_step": 344025, "epoch": 2843} {"train_loss": -43.831974029541016, "global_step": 344026, "epoch": 2843} {"train_loss": -44.25983810424805, "global_step": 344027, "epoch": 2843} {"train_loss": -44.85436248779297, "global_step": 344028, "epoch": 2843} {"train_loss": -44.560176849365234, "global_step": 344029, "epoch": 2843} {"train_loss": -44.40191650390625, "global_step": 344030, "epoch": 2843} {"train_loss": -44.823150634765625, "global_step": 344031, "epoch": 2843} {"train_loss": -44.630348205566406, "global_step": 344032, "epoch": 2843} {"train_loss": -44.854366302490234, "global_step": 344033, "epoch": 2843} {"train_loss": -44.82915115356445, "global_step": 344034, "epoch": 2843} {"train_loss": -44.86053466796875, "global_step": 344035, "epoch": 2843} {"train_loss": -44.95829772949219, "global_step": 344036, "epoch": 2843} {"train_loss": -44.51050567626953, "global_step": 344037, "epoch": 2843} {"train_loss": -45.36788558959961, "global_step": 344038, "epoch": 2843} {"train_loss": -44.943878173828125, "global_step": 344039, "epoch": 2843} {"train_loss": -45.19802474975586, "global_step": 344040, "epoch": 2843} {"train_loss": -44.73527145385742, "global_step": 344041, "epoch": 2843} {"train_loss": -44.04664993286133, "global_step": 344042, "epoch": 2843} {"train_loss": -45.127288818359375, "global_step": 344043, "epoch": 2843} {"train_loss": -44.363555908203125, "global_step": 344044, "epoch": 2843} {"train_loss": -44.765682220458984, "global_step": 344045, "epoch": 2843} {"train_loss": -45.50883102416992, "global_step": 344046, "epoch": 2843} {"train_loss": -44.594947814941406, "global_step": 344047, "epoch": 2843} {"train_loss": -45.273292541503906, "global_step": 344048, "epoch": 2843} {"train_loss": -44.76909637451172, "global_step": 344049, "epoch": 2843} {"train_loss": -45.22239303588867, "global_step": 344050, "epoch": 2843} {"train_loss": -45.37265396118164, "global_step": 344051, "epoch": 2843} {"train_loss": -44.81673812866211, "global_step": 344052, "epoch": 2843} {"train_loss": -45.75838851928711, "global_step": 344053, "epoch": 2843} {"train_loss": -45.18167495727539, "global_step": 344054, "epoch": 2843} {"train_loss": -45.13953399658203, "global_step": 344055, "epoch": 2843} {"train_loss": -45.6119499206543, "global_step": 344056, "epoch": 2843} {"train_loss": -45.34402847290039, "global_step": 344057, "epoch": 2843} {"train_loss": -44.78670883178711, "global_step": 344058, "epoch": 2843} {"train_loss": -46.01219940185547, "global_step": 344059, "epoch": 2843} {"train_loss": -45.0889892578125, "global_step": 344060, "epoch": 2843} {"train_loss": -45.5428352355957, "global_step": 344061, "epoch": 2843} {"train_loss": -45.82872772216797, "global_step": 344062, "epoch": 2843} {"train_loss": -46.06541442871094, "global_step": 344063, "epoch": 2843} {"train_loss": -45.54412841796875, "global_step": 344064, "epoch": 2843} {"train_loss": -45.68845748901367, "global_step": 344065, "epoch": 2843} {"train_loss": -45.452083587646484, "global_step": 344066, "epoch": 2843} {"train_loss": -45.891109466552734, "global_step": 344067, "epoch": 2843} {"train_loss": -45.25067138671875, "global_step": 344068, "epoch": 2843} {"train_loss": -45.844112396240234, "global_step": 344069, "epoch": 2843} {"train_loss": -45.801109313964844, "global_step": 344070, "epoch": 2843} {"train_loss": -45.5741081237793, "global_step": 344071, "epoch": 2843} {"train_loss": -45.15034484863281, "global_step": 344072, "epoch": 2843} {"train_loss": -45.53922653198242, "global_step": 344073, "epoch": 2843} {"train_loss": -45.5609130859375, "global_step": 344074, "epoch": 2843} {"train_loss": -45.89580154418945, "global_step": 344075, "epoch": 2843} {"train_loss": -45.67975997924805, "global_step": 344076, "epoch": 2843} {"train_loss": -45.92976379394531, "global_step": 344077, "epoch": 2843} {"train_loss": -45.844024658203125, "global_step": 344078, "epoch": 2843} {"train_loss": -45.757850646972656, "global_step": 344079, "epoch": 2843} {"train_loss": -46.42644119262695, "global_step": 344080, "epoch": 2843} {"train_loss": -46.0552864074707, "global_step": 344081, "epoch": 2843} {"train_loss": -45.6038932800293, "global_step": 344082, "epoch": 2843} {"train_loss": -46.01129913330078, "global_step": 344083, "epoch": 2843} {"train_loss": -46.0093994140625, "global_step": 344084, "epoch": 2843} {"train_loss": -45.51802062988281, "global_step": 344085, "epoch": 2843} {"train_loss": -45.991878509521484, "global_step": 344086, "epoch": 2843} {"train_loss": -45.53431701660156, "global_step": 344087, "epoch": 2843} {"train_loss": -45.034366607666016, "global_step": 344088, "epoch": 2843} {"train_loss": -45.165618896484375, "global_step": 344089, "epoch": 2843} {"train_loss": -45.329559326171875, "global_step": 344090, "epoch": 2843} {"train_loss": -44.46259689331055, "global_step": 344091, "epoch": 2843} {"train_loss": -44.594112396240234, "global_step": 344092, "epoch": 2843} {"train_loss": -45.29810333251953, "global_step": 344093, "epoch": 2843} {"train_loss": -41.84397506713867, "global_step": 344094, "epoch": 2843} {"train_loss": -38.77519989013672, "global_step": 344095, "epoch": 2843} {"train_loss": -41.952903747558594, "global_step": 344096, "epoch": 2843} {"train_loss": -43.66547393798828, "global_step": 344097, "epoch": 2843} {"train_loss": -42.917030334472656, "global_step": 344098, "epoch": 2843} {"train_loss": -40.51192855834961, "global_step": 344099, "epoch": 2843} {"train_loss": -36.776058197021484, "global_step": 344100, "epoch": 2843} {"train_loss": -40.91246795654297, "global_step": 344101, "epoch": 2843} {"train_loss": -42.003700256347656, "global_step": 344102, "epoch": 2843} {"train_loss": -38.29566192626953, "global_step": 344103, "epoch": 2843} {"train_loss": -42.930755615234375, "global_step": 344104, "epoch": 2843} {"train_loss": -40.799034118652344, "global_step": 344105, "epoch": 2843} {"train_loss": -35.08279037475586, "global_step": 344106, "epoch": 2843} {"train_loss": -39.8034553527832, "global_step": 344107, "epoch": 2843} {"train_loss": -40.94529342651367, "global_step": 344108, "epoch": 2843} {"train_loss": -38.346900939941406, "global_step": 344109, "epoch": 2843} {"train_loss": -38.76285171508789, "global_step": 344110, "epoch": 2843} {"train_loss": -41.17769241333008, "global_step": 344111, "epoch": 2843} {"train_loss": -38.50766372680664, "global_step": 344112, "epoch": 2843} {"train_loss": -40.56291198730469, "global_step": 344113, "epoch": 2843} {"train_loss": -40.20896530151367, "global_step": 344114, "epoch": 2843} {"train_loss": -42.23934555053711, "global_step": 344115, "epoch": 2843} {"train_loss": -39.91781997680664, "global_step": 344116, "epoch": 2843} {"train_loss": -41.41675567626953, "global_step": 344117, "epoch": 2843} {"train_loss": -41.101531982421875, "global_step": 344118, "epoch": 2843} {"train_loss": -40.506736755371094, "global_step": 344119, "epoch": 2843} {"train_loss": -40.652706146240234, "global_step": 344120, "epoch": 2843} {"train_loss": -41.19055938720703, "global_step": 344121, "epoch": 2843} {"train_loss": -40.99675750732422, "global_step": 344122, "epoch": 2843} {"train_loss": -43.687457691539414, "global_step": 344123, "epoch": 2843, "val_loss": 2617158.0} {"train_loss": -41.093788146972656, "global_step": 344124, "epoch": 2844} {"train_loss": -42.15694046020508, "global_step": 344125, "epoch": 2844} {"train_loss": -41.537418365478516, "global_step": 344126, "epoch": 2844} {"train_loss": -42.95308303833008, "global_step": 344127, "epoch": 2844} {"train_loss": -41.793251037597656, "global_step": 344128, "epoch": 2844} {"train_loss": -43.30485534667969, "global_step": 344129, "epoch": 2844} {"train_loss": -42.395931243896484, "global_step": 344130, "epoch": 2844} {"train_loss": -42.90877151489258, "global_step": 344131, "epoch": 2844} {"train_loss": -42.18321228027344, "global_step": 344132, "epoch": 2844} {"train_loss": -43.974239349365234, "global_step": 344133, "epoch": 2844} {"train_loss": -42.53977584838867, "global_step": 344134, "epoch": 2844} {"train_loss": -43.28629684448242, "global_step": 344135, "epoch": 2844} {"train_loss": -42.90841293334961, "global_step": 344136, "epoch": 2844} {"train_loss": -43.759239196777344, "global_step": 344137, "epoch": 2844} {"train_loss": -42.71353530883789, "global_step": 344138, "epoch": 2844} {"train_loss": -43.53761672973633, "global_step": 344139, "epoch": 2844} {"train_loss": -43.12092590332031, "global_step": 344140, "epoch": 2844} {"train_loss": -43.477516174316406, "global_step": 344141, "epoch": 2844} {"train_loss": -43.18974685668945, "global_step": 344142, "epoch": 2844} {"train_loss": -42.83979415893555, "global_step": 344143, "epoch": 2844} {"train_loss": -44.157257080078125, "global_step": 344144, "epoch": 2844} {"train_loss": -43.399383544921875, "global_step": 344145, "epoch": 2844} {"train_loss": -44.042633056640625, "global_step": 344146, "epoch": 2844} {"train_loss": -43.55167007446289, "global_step": 344147, "epoch": 2844} {"train_loss": -44.24453353881836, "global_step": 344148, "epoch": 2844} {"train_loss": -43.84955596923828, "global_step": 344149, "epoch": 2844} {"train_loss": -44.40502166748047, "global_step": 344150, "epoch": 2844} {"train_loss": -44.02106475830078, "global_step": 344151, "epoch": 2844} {"train_loss": -44.63001251220703, "global_step": 344152, "epoch": 2844} {"train_loss": -44.752418518066406, "global_step": 344153, "epoch": 2844} {"train_loss": -44.422515869140625, "global_step": 344154, "epoch": 2844} {"train_loss": -45.056488037109375, "global_step": 344155, "epoch": 2844} {"train_loss": -44.78218460083008, "global_step": 344156, "epoch": 2844} {"train_loss": -45.41998291015625, "global_step": 344157, "epoch": 2844} {"train_loss": -45.21626281738281, "global_step": 344158, "epoch": 2844} {"train_loss": -45.165653228759766, "global_step": 344159, "epoch": 2844} {"train_loss": -45.07504653930664, "global_step": 344160, "epoch": 2844} {"train_loss": -45.25364303588867, "global_step": 344161, "epoch": 2844} {"train_loss": -45.43026351928711, "global_step": 344162, "epoch": 2844} {"train_loss": -45.18209457397461, "global_step": 344163, "epoch": 2844} {"train_loss": -44.995479583740234, "global_step": 344164, "epoch": 2844} {"train_loss": -45.83692932128906, "global_step": 344165, "epoch": 2844} {"train_loss": -45.131832122802734, "global_step": 344166, "epoch": 2844} {"train_loss": -45.30657958984375, "global_step": 344167, "epoch": 2844} {"train_loss": -44.89936065673828, "global_step": 344168, "epoch": 2844} {"train_loss": -45.86723327636719, "global_step": 344169, "epoch": 2844} {"train_loss": -45.313289642333984, "global_step": 344170, "epoch": 2844} {"train_loss": -45.62788772583008, "global_step": 344171, "epoch": 2844} {"train_loss": -45.52254104614258, "global_step": 344172, "epoch": 2844} {"train_loss": -45.998817443847656, "global_step": 344173, "epoch": 2844} {"train_loss": -45.4378547668457, "global_step": 344174, "epoch": 2844} {"train_loss": -45.22761154174805, "global_step": 344175, "epoch": 2844} {"train_loss": -45.57174301147461, "global_step": 344176, "epoch": 2844} {"train_loss": -45.69944381713867, "global_step": 344177, "epoch": 2844} {"train_loss": -45.16473388671875, "global_step": 344178, "epoch": 2844} {"train_loss": -45.53736114501953, "global_step": 344179, "epoch": 2844} {"train_loss": -45.739013671875, "global_step": 344180, "epoch": 2844} {"train_loss": -45.616878509521484, "global_step": 344181, "epoch": 2844} {"train_loss": -45.60750198364258, "global_step": 344182, "epoch": 2844} {"train_loss": -45.70882797241211, "global_step": 344183, "epoch": 2844} {"train_loss": -45.84309768676758, "global_step": 344184, "epoch": 2844} {"train_loss": -46.239463806152344, "global_step": 344185, "epoch": 2844} {"train_loss": -46.042171478271484, "global_step": 344186, "epoch": 2844} {"train_loss": -46.366756439208984, "global_step": 344187, "epoch": 2844} {"train_loss": -45.885929107666016, "global_step": 344188, "epoch": 2844} {"train_loss": -46.00871658325195, "global_step": 344189, "epoch": 2844} {"train_loss": -45.5188102722168, "global_step": 344190, "epoch": 2844} {"train_loss": -46.03662109375, "global_step": 344191, "epoch": 2844} {"train_loss": -46.18780517578125, "global_step": 344192, "epoch": 2844} {"train_loss": -45.86397933959961, "global_step": 344193, "epoch": 2844} {"train_loss": -45.64186477661133, "global_step": 344194, "epoch": 2844} {"train_loss": -45.233428955078125, "global_step": 344195, "epoch": 2844} {"train_loss": -45.481056213378906, "global_step": 344196, "epoch": 2844} {"train_loss": -45.00984573364258, "global_step": 344197, "epoch": 2844} {"train_loss": -44.29063034057617, "global_step": 344198, "epoch": 2844} {"train_loss": -44.84113693237305, "global_step": 344199, "epoch": 2844} {"train_loss": -44.81769561767578, "global_step": 344200, "epoch": 2844} {"train_loss": -44.946834564208984, "global_step": 344201, "epoch": 2844} {"train_loss": -44.66352462768555, "global_step": 344202, "epoch": 2844} {"train_loss": -45.80218505859375, "global_step": 344203, "epoch": 2844} {"train_loss": -44.87130355834961, "global_step": 344204, "epoch": 2844} {"train_loss": -42.20534133911133, "global_step": 344205, "epoch": 2844} {"train_loss": -41.9733772277832, "global_step": 344206, "epoch": 2844} {"train_loss": -42.494300842285156, "global_step": 344207, "epoch": 2844} {"train_loss": -43.02958297729492, "global_step": 344208, "epoch": 2844} {"train_loss": -42.73133850097656, "global_step": 344209, "epoch": 2844} {"train_loss": -44.6986083984375, "global_step": 344210, "epoch": 2844} {"train_loss": -44.65263366699219, "global_step": 344211, "epoch": 2844} {"train_loss": -42.38782501220703, "global_step": 344212, "epoch": 2844} {"train_loss": -41.0230827331543, "global_step": 344213, "epoch": 2844} {"train_loss": -44.76144027709961, "global_step": 344214, "epoch": 2844} {"train_loss": -42.720703125, "global_step": 344215, "epoch": 2844} {"train_loss": -43.15046310424805, "global_step": 344216, "epoch": 2844} {"train_loss": -44.91847229003906, "global_step": 344217, "epoch": 2844} {"train_loss": -44.06708908081055, "global_step": 344218, "epoch": 2844} {"train_loss": -44.013710021972656, "global_step": 344219, "epoch": 2844} {"train_loss": -44.452449798583984, "global_step": 344220, "epoch": 2844} {"train_loss": -44.71552276611328, "global_step": 344221, "epoch": 2844} {"train_loss": -44.859432220458984, "global_step": 344222, "epoch": 2844} {"train_loss": -44.522300720214844, "global_step": 344223, "epoch": 2844} {"train_loss": -44.61171340942383, "global_step": 344224, "epoch": 2844} {"train_loss": -44.79435348510742, "global_step": 344225, "epoch": 2844} {"train_loss": -44.51935577392578, "global_step": 344226, "epoch": 2844} {"train_loss": -44.91682434082031, "global_step": 344227, "epoch": 2844} {"train_loss": -45.6221923828125, "global_step": 344228, "epoch": 2844} {"train_loss": -45.293670654296875, "global_step": 344229, "epoch": 2844} {"train_loss": -45.16724395751953, "global_step": 344230, "epoch": 2844} {"train_loss": -45.29256820678711, "global_step": 344231, "epoch": 2844} {"train_loss": -45.69167709350586, "global_step": 344232, "epoch": 2844} {"train_loss": -45.313167572021484, "global_step": 344233, "epoch": 2844} {"train_loss": -44.52976989746094, "global_step": 344234, "epoch": 2844} {"train_loss": -45.12054443359375, "global_step": 344235, "epoch": 2844} {"train_loss": -45.25925827026367, "global_step": 344236, "epoch": 2844} {"train_loss": -44.394344329833984, "global_step": 344237, "epoch": 2844} {"train_loss": -45.53829574584961, "global_step": 344238, "epoch": 2844} {"train_loss": -44.814453125, "global_step": 344239, "epoch": 2844} {"train_loss": -45.16301727294922, "global_step": 344240, "epoch": 2844} {"train_loss": -45.270545959472656, "global_step": 344241, "epoch": 2844} {"train_loss": -45.28547286987305, "global_step": 344242, "epoch": 2844} {"train_loss": -44.13731002807617, "global_step": 344243, "epoch": 2844} {"train_loss": -44.517797202118174, "global_step": 344244, "epoch": 2844, "val_loss": 2635476.75} {"train_loss": -44.9677734375, "global_step": 344245, "epoch": 2845} {"train_loss": -44.00464630126953, "global_step": 344246, "epoch": 2845} {"train_loss": -45.00054168701172, "global_step": 344247, "epoch": 2845} {"train_loss": -45.3508415222168, "global_step": 344248, "epoch": 2845} {"train_loss": -45.556941986083984, "global_step": 344249, "epoch": 2845} {"train_loss": -45.687801361083984, "global_step": 344250, "epoch": 2845} {"train_loss": -44.72805404663086, "global_step": 344251, "epoch": 2845} {"train_loss": -45.15176773071289, "global_step": 344252, "epoch": 2845} {"train_loss": -45.42621612548828, "global_step": 344253, "epoch": 2845} {"train_loss": -45.70261764526367, "global_step": 344254, "epoch": 2845} {"train_loss": -45.4240608215332, "global_step": 344255, "epoch": 2845} {"train_loss": -45.11881637573242, "global_step": 344256, "epoch": 2845} {"train_loss": -44.87909698486328, "global_step": 344257, "epoch": 2845} {"train_loss": -45.812496185302734, "global_step": 344258, "epoch": 2845} {"train_loss": -45.36178207397461, "global_step": 344259, "epoch": 2845} {"train_loss": -45.977718353271484, "global_step": 344260, "epoch": 2845} {"train_loss": -45.58903884887695, "global_step": 344261, "epoch": 2845} {"train_loss": -44.961456298828125, "global_step": 344262, "epoch": 2845} {"train_loss": -45.59542465209961, "global_step": 344263, "epoch": 2845} {"train_loss": -45.06205368041992, "global_step": 344264, "epoch": 2845} {"train_loss": -45.903053283691406, "global_step": 344265, "epoch": 2845} {"train_loss": -45.95041275024414, "global_step": 344266, "epoch": 2845} {"train_loss": -45.49827575683594, "global_step": 344267, "epoch": 2845} {"train_loss": -45.93037796020508, "global_step": 344268, "epoch": 2845} {"train_loss": -45.49312210083008, "global_step": 344269, "epoch": 2845} {"train_loss": -45.570770263671875, "global_step": 344270, "epoch": 2845} {"train_loss": -45.62008285522461, "global_step": 344271, "epoch": 2845} {"train_loss": -45.79620361328125, "global_step": 344272, "epoch": 2845} {"train_loss": -45.45036697387695, "global_step": 344273, "epoch": 2845} {"train_loss": -45.186885833740234, "global_step": 344274, "epoch": 2845} {"train_loss": -44.794857025146484, "global_step": 344275, "epoch": 2845} {"train_loss": -45.79006576538086, "global_step": 344276, "epoch": 2845} {"train_loss": -45.81853103637695, "global_step": 344277, "epoch": 2845} {"train_loss": -44.831634521484375, "global_step": 344278, "epoch": 2845} {"train_loss": -44.06637191772461, "global_step": 344279, "epoch": 2845} {"train_loss": -44.14411163330078, "global_step": 344280, "epoch": 2845} {"train_loss": -44.568782806396484, "global_step": 344281, "epoch": 2845} {"train_loss": -44.044063568115234, "global_step": 344282, "epoch": 2845} {"train_loss": -45.42879104614258, "global_step": 344283, "epoch": 2845} {"train_loss": -45.60646057128906, "global_step": 344284, "epoch": 2845} {"train_loss": -45.291141510009766, "global_step": 344285, "epoch": 2845} {"train_loss": -45.42890167236328, "global_step": 344286, "epoch": 2845} {"train_loss": -44.52378463745117, "global_step": 344287, "epoch": 2845} {"train_loss": -43.07423782348633, "global_step": 344288, "epoch": 2845} {"train_loss": -42.99580764770508, "global_step": 344289, "epoch": 2845} {"train_loss": -45.292694091796875, "global_step": 344290, "epoch": 2845} {"train_loss": -45.01812744140625, "global_step": 344291, "epoch": 2845} {"train_loss": -44.868614196777344, "global_step": 344292, "epoch": 2845} {"train_loss": -45.119483947753906, "global_step": 344293, "epoch": 2845} {"train_loss": -45.5403938293457, "global_step": 344294, "epoch": 2845} {"train_loss": -44.71012878417969, "global_step": 344295, "epoch": 2845} {"train_loss": -43.67963409423828, "global_step": 344296, "epoch": 2845} {"train_loss": -44.42933654785156, "global_step": 344297, "epoch": 2845} {"train_loss": -44.845977783203125, "global_step": 344298, "epoch": 2845} {"train_loss": -44.65578842163086, "global_step": 344299, "epoch": 2845} {"train_loss": -45.048213958740234, "global_step": 344300, "epoch": 2845} {"train_loss": -43.867034912109375, "global_step": 344301, "epoch": 2845} {"train_loss": -44.17713165283203, "global_step": 344302, "epoch": 2845} {"train_loss": -44.46223068237305, "global_step": 344303, "epoch": 2845} {"train_loss": -44.4168586730957, "global_step": 344304, "epoch": 2845} {"train_loss": -41.541664123535156, "global_step": 344305, "epoch": 2845} {"train_loss": -43.213993072509766, "global_step": 344306, "epoch": 2845} {"train_loss": -45.05677032470703, "global_step": 344307, "epoch": 2845} {"train_loss": -42.74138259887695, "global_step": 344308, "epoch": 2845} {"train_loss": -42.790828704833984, "global_step": 344309, "epoch": 2845} {"train_loss": -43.54560470581055, "global_step": 344310, "epoch": 2845} {"train_loss": -45.127891540527344, "global_step": 344311, "epoch": 2845} {"train_loss": -42.4854850769043, "global_step": 344312, "epoch": 2845} {"train_loss": -41.730831146240234, "global_step": 344313, "epoch": 2845} {"train_loss": -44.460445404052734, "global_step": 344314, "epoch": 2845} {"train_loss": -42.585914611816406, "global_step": 344315, "epoch": 2845} {"train_loss": -42.23002624511719, "global_step": 344316, "epoch": 2845} {"train_loss": -44.60213851928711, "global_step": 344317, "epoch": 2845} {"train_loss": -43.03965377807617, "global_step": 344318, "epoch": 2845} {"train_loss": -42.9009895324707, "global_step": 344319, "epoch": 2845} {"train_loss": -43.81336975097656, "global_step": 344320, "epoch": 2845} {"train_loss": -41.50129318237305, "global_step": 344321, "epoch": 2845} {"train_loss": -43.28021240234375, "global_step": 344322, "epoch": 2845} {"train_loss": -42.693092346191406, "global_step": 344323, "epoch": 2845} {"train_loss": -42.684207916259766, "global_step": 344324, "epoch": 2845} {"train_loss": -42.54767990112305, "global_step": 344325, "epoch": 2845} {"train_loss": -40.02448654174805, "global_step": 344326, "epoch": 2845} {"train_loss": -43.81676483154297, "global_step": 344327, "epoch": 2845} {"train_loss": -43.10776138305664, "global_step": 344328, "epoch": 2845} {"train_loss": -40.20406723022461, "global_step": 344329, "epoch": 2845} {"train_loss": -44.040321350097656, "global_step": 344330, "epoch": 2845} {"train_loss": -40.02118682861328, "global_step": 344331, "epoch": 2845} {"train_loss": -35.176605224609375, "global_step": 344332, "epoch": 2845} {"train_loss": -36.911861419677734, "global_step": 344333, "epoch": 2845} {"train_loss": -38.0410270690918, "global_step": 344334, "epoch": 2845} {"train_loss": -42.764957427978516, "global_step": 344335, "epoch": 2845} {"train_loss": -38.77360153198242, "global_step": 344336, "epoch": 2845} {"train_loss": -42.764251708984375, "global_step": 344337, "epoch": 2845} {"train_loss": -38.82057189941406, "global_step": 344338, "epoch": 2845} {"train_loss": -37.11576461791992, "global_step": 344339, "epoch": 2845} {"train_loss": -39.84304428100586, "global_step": 344340, "epoch": 2845} {"train_loss": -36.8972053527832, "global_step": 344341, "epoch": 2845} {"train_loss": -25.34931755065918, "global_step": 344342, "epoch": 2845} {"train_loss": -33.602699279785156, "global_step": 344343, "epoch": 2845} {"train_loss": -39.53036880493164, "global_step": 344344, "epoch": 2845} {"train_loss": -37.22999954223633, "global_step": 344345, "epoch": 2845} {"train_loss": -33.96572494506836, "global_step": 344346, "epoch": 2845} {"train_loss": -29.900985717773438, "global_step": 344347, "epoch": 2845} {"train_loss": -37.02338409423828, "global_step": 344348, "epoch": 2845} {"train_loss": -35.46405792236328, "global_step": 344349, "epoch": 2845} {"train_loss": -39.556575775146484, "global_step": 344350, "epoch": 2845} {"train_loss": -38.94035720825195, "global_step": 344351, "epoch": 2845} {"train_loss": -40.201690673828125, "global_step": 344352, "epoch": 2845} {"train_loss": -40.941322326660156, "global_step": 344353, "epoch": 2845} {"train_loss": -41.05794906616211, "global_step": 344354, "epoch": 2845} {"train_loss": -42.36236572265625, "global_step": 344355, "epoch": 2845} {"train_loss": -39.18980026245117, "global_step": 344356, "epoch": 2845} {"train_loss": -40.832054138183594, "global_step": 344357, "epoch": 2845} {"train_loss": -41.34003829956055, "global_step": 344358, "epoch": 2845} {"train_loss": -42.14764404296875, "global_step": 344359, "epoch": 2845} {"train_loss": -39.31911087036133, "global_step": 344360, "epoch": 2845} {"train_loss": -41.887203216552734, "global_step": 344361, "epoch": 2845} {"train_loss": -40.43766403198242, "global_step": 344362, "epoch": 2845} {"train_loss": -39.11301803588867, "global_step": 344363, "epoch": 2845} {"train_loss": -38.701454162597656, "global_step": 344364, "epoch": 2845} {"train_loss": -42.68732381458125, "global_step": 344365, "epoch": 2845, "val_loss": 3869225.0} {"train_loss": -40.638458251953125, "global_step": 344366, "epoch": 2846} {"train_loss": -40.6241340637207, "global_step": 344367, "epoch": 2846} {"train_loss": -42.33495330810547, "global_step": 344368, "epoch": 2846} {"train_loss": -41.519203186035156, "global_step": 344369, "epoch": 2846} {"train_loss": -41.95518112182617, "global_step": 344370, "epoch": 2846} {"train_loss": -42.36981201171875, "global_step": 344371, "epoch": 2846} {"train_loss": -41.39679718017578, "global_step": 344372, "epoch": 2846} {"train_loss": -42.0605583190918, "global_step": 344373, "epoch": 2846} {"train_loss": -42.38462448120117, "global_step": 344374, "epoch": 2846} {"train_loss": -42.23554611206055, "global_step": 344375, "epoch": 2846} {"train_loss": -41.593360900878906, "global_step": 344376, "epoch": 2846} {"train_loss": -42.207637786865234, "global_step": 344377, "epoch": 2846} {"train_loss": -43.1449089050293, "global_step": 344378, "epoch": 2846} {"train_loss": -43.78558349609375, "global_step": 344379, "epoch": 2846} {"train_loss": -42.247859954833984, "global_step": 344380, "epoch": 2846} {"train_loss": -43.495765686035156, "global_step": 344381, "epoch": 2846} {"train_loss": -42.94378662109375, "global_step": 344382, "epoch": 2846} {"train_loss": -42.894405364990234, "global_step": 344383, "epoch": 2846} {"train_loss": -42.264766693115234, "global_step": 344384, "epoch": 2846} {"train_loss": -42.36402893066406, "global_step": 344385, "epoch": 2846} {"train_loss": -42.824623107910156, "global_step": 344386, "epoch": 2846} {"train_loss": -43.018218994140625, "global_step": 344387, "epoch": 2846} {"train_loss": -43.09332275390625, "global_step": 344388, "epoch": 2846} {"train_loss": -43.44932174682617, "global_step": 344389, "epoch": 2846} {"train_loss": -43.18587112426758, "global_step": 344390, "epoch": 2846} {"train_loss": -42.75459289550781, "global_step": 344391, "epoch": 2846} {"train_loss": -43.84988021850586, "global_step": 344392, "epoch": 2846} {"train_loss": -43.72240447998047, "global_step": 344393, "epoch": 2846} {"train_loss": -43.5985221862793, "global_step": 344394, "epoch": 2846} {"train_loss": -43.904422760009766, "global_step": 344395, "epoch": 2846} {"train_loss": -43.7191276550293, "global_step": 344396, "epoch": 2846} {"train_loss": -43.980499267578125, "global_step": 344397, "epoch": 2846} {"train_loss": -44.08980941772461, "global_step": 344398, "epoch": 2846} {"train_loss": -43.86290740966797, "global_step": 344399, "epoch": 2846} {"train_loss": -43.36334991455078, "global_step": 344400, "epoch": 2846} {"train_loss": -44.54952621459961, "global_step": 344401, "epoch": 2846} {"train_loss": -43.869178771972656, "global_step": 344402, "epoch": 2846} {"train_loss": -44.18841552734375, "global_step": 344403, "epoch": 2846} {"train_loss": -44.311607360839844, "global_step": 344404, "epoch": 2846} {"train_loss": -44.283992767333984, "global_step": 344405, "epoch": 2846} {"train_loss": -43.81502914428711, "global_step": 344406, "epoch": 2846} {"train_loss": -44.73733139038086, "global_step": 344407, "epoch": 2846} {"train_loss": -44.22702407836914, "global_step": 344408, "epoch": 2846} {"train_loss": -45.4200325012207, "global_step": 344409, "epoch": 2846} {"train_loss": -44.68488693237305, "global_step": 344410, "epoch": 2846} {"train_loss": -44.67983627319336, "global_step": 344411, "epoch": 2846} {"train_loss": -44.030269622802734, "global_step": 344412, "epoch": 2846} {"train_loss": -44.87507247924805, "global_step": 344413, "epoch": 2846} {"train_loss": -44.12065505981445, "global_step": 344414, "epoch": 2846} {"train_loss": -44.785945892333984, "global_step": 344415, "epoch": 2846} {"train_loss": -44.61468505859375, "global_step": 344416, "epoch": 2846} {"train_loss": -43.46974563598633, "global_step": 344417, "epoch": 2846} {"train_loss": -45.00535202026367, "global_step": 344418, "epoch": 2846} {"train_loss": -44.50653839111328, "global_step": 344419, "epoch": 2846} {"train_loss": -45.07218551635742, "global_step": 344420, "epoch": 2846} {"train_loss": -44.58933639526367, "global_step": 344421, "epoch": 2846} {"train_loss": -44.81560134887695, "global_step": 344422, "epoch": 2846} {"train_loss": -44.72886276245117, "global_step": 344423, "epoch": 2846} {"train_loss": -44.29557418823242, "global_step": 344424, "epoch": 2846} {"train_loss": -44.31850814819336, "global_step": 344425, "epoch": 2846} {"train_loss": -43.833065032958984, "global_step": 344426, "epoch": 2846} {"train_loss": -43.85087966918945, "global_step": 344427, "epoch": 2846} {"train_loss": -44.17619705200195, "global_step": 344428, "epoch": 2846} {"train_loss": -43.383296966552734, "global_step": 344429, "epoch": 2846} {"train_loss": -44.355403900146484, "global_step": 344430, "epoch": 2846} {"train_loss": -44.68815612792969, "global_step": 344431, "epoch": 2846} {"train_loss": -44.442935943603516, "global_step": 344432, "epoch": 2846} {"train_loss": -44.75248718261719, "global_step": 344433, "epoch": 2846} {"train_loss": -44.57722091674805, "global_step": 344434, "epoch": 2846} {"train_loss": -43.478511810302734, "global_step": 344435, "epoch": 2846} {"train_loss": -44.238746643066406, "global_step": 344436, "epoch": 2846} {"train_loss": -44.57838821411133, "global_step": 344437, "epoch": 2846} {"train_loss": -44.918636322021484, "global_step": 344438, "epoch": 2846} {"train_loss": -45.04024887084961, "global_step": 344439, "epoch": 2846} {"train_loss": -44.11085891723633, "global_step": 344440, "epoch": 2846} {"train_loss": -45.113277435302734, "global_step": 344441, "epoch": 2846} {"train_loss": -44.84383773803711, "global_step": 344442, "epoch": 2846} {"train_loss": -44.799739837646484, "global_step": 344443, "epoch": 2846} {"train_loss": -45.08148956298828, "global_step": 344444, "epoch": 2846} {"train_loss": -44.77259063720703, "global_step": 344445, "epoch": 2846} {"train_loss": -45.00663375854492, "global_step": 344446, "epoch": 2846} {"train_loss": -45.42516326904297, "global_step": 344447, "epoch": 2846} {"train_loss": -45.1181526184082, "global_step": 344448, "epoch": 2846} {"train_loss": -44.26493835449219, "global_step": 344449, "epoch": 2846} {"train_loss": -44.67313766479492, "global_step": 344450, "epoch": 2846} {"train_loss": -44.6014518737793, "global_step": 344451, "epoch": 2846} {"train_loss": -44.39699935913086, "global_step": 344452, "epoch": 2846} {"train_loss": -44.33903121948242, "global_step": 344453, "epoch": 2846} {"train_loss": -42.34174346923828, "global_step": 344454, "epoch": 2846} {"train_loss": -41.47723388671875, "global_step": 344455, "epoch": 2846} {"train_loss": -44.21409606933594, "global_step": 344456, "epoch": 2846} {"train_loss": -43.820674896240234, "global_step": 344457, "epoch": 2846} {"train_loss": -40.2992057800293, "global_step": 344458, "epoch": 2846} {"train_loss": -43.0261116027832, "global_step": 344459, "epoch": 2846} {"train_loss": -42.22397994995117, "global_step": 344460, "epoch": 2846} {"train_loss": -41.067909240722656, "global_step": 344461, "epoch": 2846} {"train_loss": -43.892311096191406, "global_step": 344462, "epoch": 2846} {"train_loss": -44.70841598510742, "global_step": 344463, "epoch": 2846} {"train_loss": -42.957618713378906, "global_step": 344464, "epoch": 2846} {"train_loss": -42.61551284790039, "global_step": 344465, "epoch": 2846} {"train_loss": -44.49109649658203, "global_step": 344466, "epoch": 2846} {"train_loss": -43.078067779541016, "global_step": 344467, "epoch": 2846} {"train_loss": -43.32373046875, "global_step": 344468, "epoch": 2846} {"train_loss": -44.27933120727539, "global_step": 344469, "epoch": 2846} {"train_loss": -43.42998123168945, "global_step": 344470, "epoch": 2846} {"train_loss": -43.200439453125, "global_step": 344471, "epoch": 2846} {"train_loss": -44.2081298828125, "global_step": 344472, "epoch": 2846} {"train_loss": -43.75212478637695, "global_step": 344473, "epoch": 2846} {"train_loss": -43.60820007324219, "global_step": 344474, "epoch": 2846} {"train_loss": -42.86790466308594, "global_step": 344475, "epoch": 2846} {"train_loss": -44.53506088256836, "global_step": 344476, "epoch": 2846} {"train_loss": -43.887027740478516, "global_step": 344477, "epoch": 2846} {"train_loss": -44.153114318847656, "global_step": 344478, "epoch": 2846} {"train_loss": -44.638397216796875, "global_step": 344479, "epoch": 2846} {"train_loss": -44.29834747314453, "global_step": 344480, "epoch": 2846} {"train_loss": -44.393314361572266, "global_step": 344481, "epoch": 2846} {"train_loss": -43.36315155029297, "global_step": 344482, "epoch": 2846} {"train_loss": -44.272945404052734, "global_step": 344483, "epoch": 2846} {"train_loss": -44.86654281616211, "global_step": 344484, "epoch": 2846} {"train_loss": -43.50223159790039, "global_step": 344485, "epoch": 2846} {"train_loss": -43.72703835983907, "global_step": 344486, "epoch": 2846, "val_loss": 2532746.25} {"train_loss": -44.58005905151367, "global_step": 344487, "epoch": 2847} {"train_loss": -44.783111572265625, "global_step": 344488, "epoch": 2847} {"train_loss": -44.29354476928711, "global_step": 344489, "epoch": 2847} {"train_loss": -43.47176742553711, "global_step": 344490, "epoch": 2847} {"train_loss": -43.75016403198242, "global_step": 344491, "epoch": 2847} {"train_loss": -44.073646545410156, "global_step": 344492, "epoch": 2847} {"train_loss": -44.48310470581055, "global_step": 344493, "epoch": 2847} {"train_loss": -43.40036392211914, "global_step": 344494, "epoch": 2847} {"train_loss": -43.97297286987305, "global_step": 344495, "epoch": 2847} {"train_loss": -44.08155059814453, "global_step": 344496, "epoch": 2847} {"train_loss": -42.55504608154297, "global_step": 344497, "epoch": 2847} {"train_loss": -43.72676467895508, "global_step": 344498, "epoch": 2847} {"train_loss": -42.214935302734375, "global_step": 344499, "epoch": 2847} {"train_loss": -44.054073333740234, "global_step": 344500, "epoch": 2847} {"train_loss": -43.31545639038086, "global_step": 344501, "epoch": 2847} {"train_loss": -39.80990219116211, "global_step": 344502, "epoch": 2847} {"train_loss": -42.8275146484375, "global_step": 344503, "epoch": 2847} {"train_loss": -42.60427474975586, "global_step": 344504, "epoch": 2847} {"train_loss": -40.89289474487305, "global_step": 344505, "epoch": 2847} {"train_loss": -40.4983024597168, "global_step": 344506, "epoch": 2847} {"train_loss": -43.17920684814453, "global_step": 344507, "epoch": 2847} {"train_loss": -43.17521286010742, "global_step": 344508, "epoch": 2847} {"train_loss": -40.30260467529297, "global_step": 344509, "epoch": 2847} {"train_loss": -42.662628173828125, "global_step": 344510, "epoch": 2847} {"train_loss": -42.32467269897461, "global_step": 344511, "epoch": 2847} {"train_loss": -40.47428512573242, "global_step": 344512, "epoch": 2847} {"train_loss": -43.54783248901367, "global_step": 344513, "epoch": 2847} {"train_loss": -41.49732208251953, "global_step": 344514, "epoch": 2847} {"train_loss": -41.59098815917969, "global_step": 344515, "epoch": 2847} {"train_loss": -43.928077697753906, "global_step": 344516, "epoch": 2847} {"train_loss": -42.175045013427734, "global_step": 344517, "epoch": 2847} {"train_loss": -43.362457275390625, "global_step": 344518, "epoch": 2847} {"train_loss": -44.27702713012695, "global_step": 344519, "epoch": 2847} {"train_loss": -42.90509796142578, "global_step": 344520, "epoch": 2847} {"train_loss": -43.583038330078125, "global_step": 344521, "epoch": 2847} {"train_loss": -44.28303146362305, "global_step": 344522, "epoch": 2847} {"train_loss": -41.992034912109375, "global_step": 344523, "epoch": 2847} {"train_loss": -44.338321685791016, "global_step": 344524, "epoch": 2847} {"train_loss": -42.70829772949219, "global_step": 344525, "epoch": 2847} {"train_loss": -42.51886749267578, "global_step": 344526, "epoch": 2847} {"train_loss": -43.556522369384766, "global_step": 344527, "epoch": 2847} {"train_loss": -43.08931350708008, "global_step": 344528, "epoch": 2847} {"train_loss": -43.925872802734375, "global_step": 344529, "epoch": 2847} {"train_loss": -44.71350860595703, "global_step": 344530, "epoch": 2847} {"train_loss": -44.0482292175293, "global_step": 344531, "epoch": 2847} {"train_loss": -44.28064727783203, "global_step": 344532, "epoch": 2847} {"train_loss": -43.990047454833984, "global_step": 344533, "epoch": 2847} {"train_loss": -44.35491180419922, "global_step": 344534, "epoch": 2847} {"train_loss": -44.082454681396484, "global_step": 344535, "epoch": 2847} {"train_loss": -43.576351165771484, "global_step": 344536, "epoch": 2847} {"train_loss": -44.72968673706055, "global_step": 344537, "epoch": 2847} {"train_loss": -44.13975143432617, "global_step": 344538, "epoch": 2847} {"train_loss": -43.1489372253418, "global_step": 344539, "epoch": 2847} {"train_loss": -44.90354537963867, "global_step": 344540, "epoch": 2847} {"train_loss": -43.8869514465332, "global_step": 344541, "epoch": 2847} {"train_loss": -44.7297477722168, "global_step": 344542, "epoch": 2847} {"train_loss": -44.12173080444336, "global_step": 344543, "epoch": 2847} {"train_loss": -45.258358001708984, "global_step": 344544, "epoch": 2847} {"train_loss": -44.76064682006836, "global_step": 344545, "epoch": 2847} {"train_loss": -44.53216552734375, "global_step": 344546, "epoch": 2847} {"train_loss": -43.72694778442383, "global_step": 344547, "epoch": 2847} {"train_loss": -44.867916107177734, "global_step": 344548, "epoch": 2847} {"train_loss": -44.94963073730469, "global_step": 344549, "epoch": 2847} {"train_loss": -45.183956146240234, "global_step": 344550, "epoch": 2847} {"train_loss": -44.94419479370117, "global_step": 344551, "epoch": 2847} {"train_loss": -44.6826286315918, "global_step": 344552, "epoch": 2847} {"train_loss": -45.03052520751953, "global_step": 344553, "epoch": 2847} {"train_loss": -45.296180725097656, "global_step": 344554, "epoch": 2847} {"train_loss": -45.20974349975586, "global_step": 344555, "epoch": 2847} {"train_loss": -44.75710678100586, "global_step": 344556, "epoch": 2847} {"train_loss": -45.28218078613281, "global_step": 344557, "epoch": 2847} {"train_loss": -44.58203887939453, "global_step": 344558, "epoch": 2847} {"train_loss": -45.170257568359375, "global_step": 344559, "epoch": 2847} {"train_loss": -45.46320724487305, "global_step": 344560, "epoch": 2847} {"train_loss": -45.61906051635742, "global_step": 344561, "epoch": 2847} {"train_loss": -44.89308547973633, "global_step": 344562, "epoch": 2847} {"train_loss": -45.43511962890625, "global_step": 344563, "epoch": 2847} {"train_loss": -45.319671630859375, "global_step": 344564, "epoch": 2847} {"train_loss": -45.289024353027344, "global_step": 344565, "epoch": 2847} {"train_loss": -44.998104095458984, "global_step": 344566, "epoch": 2847} {"train_loss": -45.23476028442383, "global_step": 344567, "epoch": 2847} {"train_loss": -45.291969299316406, "global_step": 344568, "epoch": 2847} {"train_loss": -46.05176544189453, "global_step": 344569, "epoch": 2847} {"train_loss": -45.10732650756836, "global_step": 344570, "epoch": 2847} {"train_loss": -44.09315872192383, "global_step": 344571, "epoch": 2847} {"train_loss": -42.65473175048828, "global_step": 344572, "epoch": 2847} {"train_loss": -41.8254508972168, "global_step": 344573, "epoch": 2847} {"train_loss": -42.507591247558594, "global_step": 344574, "epoch": 2847} {"train_loss": -43.95294952392578, "global_step": 344575, "epoch": 2847} {"train_loss": -45.17509841918945, "global_step": 344576, "epoch": 2847} {"train_loss": -45.181739807128906, "global_step": 344577, "epoch": 2847} {"train_loss": -44.50704574584961, "global_step": 344578, "epoch": 2847} {"train_loss": -44.276588439941406, "global_step": 344579, "epoch": 2847} {"train_loss": -44.988948822021484, "global_step": 344580, "epoch": 2847} {"train_loss": -44.11858367919922, "global_step": 344581, "epoch": 2847} {"train_loss": -43.24959182739258, "global_step": 344582, "epoch": 2847} {"train_loss": -42.43229293823242, "global_step": 344583, "epoch": 2847} {"train_loss": -44.745296478271484, "global_step": 344584, "epoch": 2847} {"train_loss": -43.128787994384766, "global_step": 344585, "epoch": 2847} {"train_loss": -39.1765251159668, "global_step": 344586, "epoch": 2847} {"train_loss": -44.8189697265625, "global_step": 344587, "epoch": 2847} {"train_loss": -42.977230072021484, "global_step": 344588, "epoch": 2847} {"train_loss": -41.05376052856445, "global_step": 344589, "epoch": 2847} {"train_loss": -44.47282028198242, "global_step": 344590, "epoch": 2847} {"train_loss": -43.15556716918945, "global_step": 344591, "epoch": 2847} {"train_loss": -44.38143539428711, "global_step": 344592, "epoch": 2847} {"train_loss": -44.155792236328125, "global_step": 344593, "epoch": 2847} {"train_loss": -43.7564811706543, "global_step": 344594, "epoch": 2847} {"train_loss": -44.237030029296875, "global_step": 344595, "epoch": 2847} {"train_loss": -42.65239334106445, "global_step": 344596, "epoch": 2847} {"train_loss": -44.30799102783203, "global_step": 344597, "epoch": 2847} {"train_loss": -44.189266204833984, "global_step": 344598, "epoch": 2847} {"train_loss": -42.06775665283203, "global_step": 344599, "epoch": 2847} {"train_loss": -42.637733459472656, "global_step": 344600, "epoch": 2847} {"train_loss": -42.57522201538086, "global_step": 344601, "epoch": 2847} {"train_loss": -43.69182205200195, "global_step": 344602, "epoch": 2847} {"train_loss": -44.071529388427734, "global_step": 344603, "epoch": 2847} {"train_loss": -42.256561279296875, "global_step": 344604, "epoch": 2847} {"train_loss": -42.185020446777344, "global_step": 344605, "epoch": 2847} {"train_loss": -43.339447021484375, "global_step": 344606, "epoch": 2847} {"train_loss": -43.7170565896783, "global_step": 344607, "epoch": 2847, "val_loss": 2651258.5} {"train_loss": -39.40349197387695, "global_step": 344608, "epoch": 2848} {"train_loss": -42.15859603881836, "global_step": 344609, "epoch": 2848} {"train_loss": -36.54120635986328, "global_step": 344610, "epoch": 2848} {"train_loss": -38.62205123901367, "global_step": 344611, "epoch": 2848} {"train_loss": -40.097511291503906, "global_step": 344612, "epoch": 2848} {"train_loss": -38.43099594116211, "global_step": 344613, "epoch": 2848} {"train_loss": -38.11355209350586, "global_step": 344614, "epoch": 2848} {"train_loss": -38.0076789855957, "global_step": 344615, "epoch": 2848} {"train_loss": -39.274208068847656, "global_step": 344616, "epoch": 2848} {"train_loss": -39.81862258911133, "global_step": 344617, "epoch": 2848} {"train_loss": -40.853511810302734, "global_step": 344618, "epoch": 2848} {"train_loss": -41.507320404052734, "global_step": 344619, "epoch": 2848} {"train_loss": -42.14236068725586, "global_step": 344620, "epoch": 2848} {"train_loss": -42.06691360473633, "global_step": 344621, "epoch": 2848} {"train_loss": -41.2403678894043, "global_step": 344622, "epoch": 2848} {"train_loss": -42.36628723144531, "global_step": 344623, "epoch": 2848} {"train_loss": -42.32729721069336, "global_step": 344624, "epoch": 2848} {"train_loss": -43.277950286865234, "global_step": 344625, "epoch": 2848} {"train_loss": -42.03704833984375, "global_step": 344626, "epoch": 2848} {"train_loss": -43.13728713989258, "global_step": 344627, "epoch": 2848} {"train_loss": -42.72749710083008, "global_step": 344628, "epoch": 2848} {"train_loss": -42.86096954345703, "global_step": 344629, "epoch": 2848} {"train_loss": -42.55413055419922, "global_step": 344630, "epoch": 2848} {"train_loss": -43.22406005859375, "global_step": 344631, "epoch": 2848} {"train_loss": -43.791969299316406, "global_step": 344632, "epoch": 2848} {"train_loss": -42.632381439208984, "global_step": 344633, "epoch": 2848} {"train_loss": -43.52796173095703, "global_step": 344634, "epoch": 2848} {"train_loss": -43.25728988647461, "global_step": 344635, "epoch": 2848} {"train_loss": -43.88011932373047, "global_step": 344636, "epoch": 2848} {"train_loss": -43.6956672668457, "global_step": 344637, "epoch": 2848} {"train_loss": -43.209651947021484, "global_step": 344638, "epoch": 2848} {"train_loss": -43.42722702026367, "global_step": 344639, "epoch": 2848} {"train_loss": -43.301090240478516, "global_step": 344640, "epoch": 2848} {"train_loss": -43.96397018432617, "global_step": 344641, "epoch": 2848} {"train_loss": -43.525550842285156, "global_step": 344642, "epoch": 2848} {"train_loss": -43.993404388427734, "global_step": 344643, "epoch": 2848} {"train_loss": -43.8248405456543, "global_step": 344644, "epoch": 2848} {"train_loss": -44.26496505737305, "global_step": 344645, "epoch": 2848} {"train_loss": -44.168216705322266, "global_step": 344646, "epoch": 2848} {"train_loss": -43.732757568359375, "global_step": 344647, "epoch": 2848} {"train_loss": -44.6285514831543, "global_step": 344648, "epoch": 2848} {"train_loss": -43.940711975097656, "global_step": 344649, "epoch": 2848} {"train_loss": -44.66402816772461, "global_step": 344650, "epoch": 2848} {"train_loss": -43.682350158691406, "global_step": 344651, "epoch": 2848} {"train_loss": -44.46944808959961, "global_step": 344652, "epoch": 2848} {"train_loss": -44.007720947265625, "global_step": 344653, "epoch": 2848} {"train_loss": -44.608123779296875, "global_step": 344654, "epoch": 2848} {"train_loss": -44.37480545043945, "global_step": 344655, "epoch": 2848} {"train_loss": -44.435455322265625, "global_step": 344656, "epoch": 2848} {"train_loss": -44.424381256103516, "global_step": 344657, "epoch": 2848} {"train_loss": -44.72149658203125, "global_step": 344658, "epoch": 2848} {"train_loss": -44.38412094116211, "global_step": 344659, "epoch": 2848} {"train_loss": -45.01413345336914, "global_step": 344660, "epoch": 2848} {"train_loss": -44.68020248413086, "global_step": 344661, "epoch": 2848} {"train_loss": -44.8908576965332, "global_step": 344662, "epoch": 2848} {"train_loss": -44.280433654785156, "global_step": 344663, "epoch": 2848} {"train_loss": -45.086463928222656, "global_step": 344664, "epoch": 2848} {"train_loss": -45.17202377319336, "global_step": 344665, "epoch": 2848} {"train_loss": -44.93229293823242, "global_step": 344666, "epoch": 2848} {"train_loss": -45.41387939453125, "global_step": 344667, "epoch": 2848} {"train_loss": -44.438167572021484, "global_step": 344668, "epoch": 2848} {"train_loss": -44.985801696777344, "global_step": 344669, "epoch": 2848} {"train_loss": -45.44039535522461, "global_step": 344670, "epoch": 2848} {"train_loss": -45.26142501831055, "global_step": 344671, "epoch": 2848} {"train_loss": -45.32948684692383, "global_step": 344672, "epoch": 2848} {"train_loss": -45.2075309753418, "global_step": 344673, "epoch": 2848} {"train_loss": -45.27357482910156, "global_step": 344674, "epoch": 2848} {"train_loss": -45.53615188598633, "global_step": 344675, "epoch": 2848} {"train_loss": -44.97211456298828, "global_step": 344676, "epoch": 2848} {"train_loss": -45.55215072631836, "global_step": 344677, "epoch": 2848} {"train_loss": -45.60722732543945, "global_step": 344678, "epoch": 2848} {"train_loss": -45.19794464111328, "global_step": 344679, "epoch": 2848} {"train_loss": -45.43601608276367, "global_step": 344680, "epoch": 2848} {"train_loss": -45.56184768676758, "global_step": 344681, "epoch": 2848} {"train_loss": -45.172054290771484, "global_step": 344682, "epoch": 2848} {"train_loss": -45.59843826293945, "global_step": 344683, "epoch": 2848} {"train_loss": -45.23759841918945, "global_step": 344684, "epoch": 2848} {"train_loss": -44.87229537963867, "global_step": 344685, "epoch": 2848} {"train_loss": -45.14781951904297, "global_step": 344686, "epoch": 2848} {"train_loss": -45.14701461791992, "global_step": 344687, "epoch": 2848} {"train_loss": -45.24025344848633, "global_step": 344688, "epoch": 2848} {"train_loss": -45.270904541015625, "global_step": 344689, "epoch": 2848} {"train_loss": -45.56355285644531, "global_step": 344690, "epoch": 2848} {"train_loss": -44.46073913574219, "global_step": 344691, "epoch": 2848} {"train_loss": -45.075927734375, "global_step": 344692, "epoch": 2848} {"train_loss": -45.25082015991211, "global_step": 344693, "epoch": 2848} {"train_loss": -45.56638717651367, "global_step": 344694, "epoch": 2848} {"train_loss": -44.817420959472656, "global_step": 344695, "epoch": 2848} {"train_loss": -45.27443313598633, "global_step": 344696, "epoch": 2848} {"train_loss": -45.529685974121094, "global_step": 344697, "epoch": 2848} {"train_loss": -45.23115539550781, "global_step": 344698, "epoch": 2848} {"train_loss": -45.47529220581055, "global_step": 344699, "epoch": 2848} {"train_loss": -44.88106155395508, "global_step": 344700, "epoch": 2848} {"train_loss": -43.54058837890625, "global_step": 344701, "epoch": 2848} {"train_loss": -44.072444915771484, "global_step": 344702, "epoch": 2848} {"train_loss": -44.65792465209961, "global_step": 344703, "epoch": 2848} {"train_loss": -44.17533493041992, "global_step": 344704, "epoch": 2848} {"train_loss": -43.94889450073242, "global_step": 344705, "epoch": 2848} {"train_loss": -43.628631591796875, "global_step": 344706, "epoch": 2848} {"train_loss": -43.34709548950195, "global_step": 344707, "epoch": 2848} {"train_loss": -43.06791305541992, "global_step": 344708, "epoch": 2848} {"train_loss": -44.81573486328125, "global_step": 344709, "epoch": 2848} {"train_loss": -44.241180419921875, "global_step": 344710, "epoch": 2848} {"train_loss": -44.41658401489258, "global_step": 344711, "epoch": 2848} {"train_loss": -44.28645706176758, "global_step": 344712, "epoch": 2848} {"train_loss": -43.21889114379883, "global_step": 344713, "epoch": 2848} {"train_loss": -44.95931625366211, "global_step": 344714, "epoch": 2848} {"train_loss": -45.10921096801758, "global_step": 344715, "epoch": 2848} {"train_loss": -43.7195930480957, "global_step": 344716, "epoch": 2848} {"train_loss": -44.13410186767578, "global_step": 344717, "epoch": 2848} {"train_loss": -43.945274353027344, "global_step": 344718, "epoch": 2848} {"train_loss": -44.55398178100586, "global_step": 344719, "epoch": 2848} {"train_loss": -44.90888214111328, "global_step": 344720, "epoch": 2848} {"train_loss": -43.62284469604492, "global_step": 344721, "epoch": 2848} {"train_loss": -43.715396881103516, "global_step": 344722, "epoch": 2848} {"train_loss": -44.17112350463867, "global_step": 344723, "epoch": 2848} {"train_loss": -44.27067184448242, "global_step": 344724, "epoch": 2848} {"train_loss": -41.9036750793457, "global_step": 344725, "epoch": 2848} {"train_loss": -41.57146072387695, "global_step": 344726, "epoch": 2848} {"train_loss": -44.30998229980469, "global_step": 344727, "epoch": 2848} {"train_loss": -43.740867898483906, "global_step": 344728, "epoch": 2848, "val_loss": 2555118.0} {"train_loss": -42.33616638183594, "global_step": 344729, "epoch": 2849} {"train_loss": -44.10590362548828, "global_step": 344730, "epoch": 2849} {"train_loss": -43.4411735534668, "global_step": 344731, "epoch": 2849} {"train_loss": -44.35198211669922, "global_step": 344732, "epoch": 2849} {"train_loss": -43.77163314819336, "global_step": 344733, "epoch": 2849} {"train_loss": -41.970680236816406, "global_step": 344734, "epoch": 2849} {"train_loss": -44.367347717285156, "global_step": 344735, "epoch": 2849} {"train_loss": -42.21693801879883, "global_step": 344736, "epoch": 2849} {"train_loss": -43.22993087768555, "global_step": 344737, "epoch": 2849} {"train_loss": -44.00559997558594, "global_step": 344738, "epoch": 2849} {"train_loss": -42.921607971191406, "global_step": 344739, "epoch": 2849} {"train_loss": -43.9057502746582, "global_step": 344740, "epoch": 2849} {"train_loss": -42.1905403137207, "global_step": 344741, "epoch": 2849} {"train_loss": -44.72262191772461, "global_step": 344742, "epoch": 2849} {"train_loss": -42.775360107421875, "global_step": 344743, "epoch": 2849} {"train_loss": -43.036930084228516, "global_step": 344744, "epoch": 2849} {"train_loss": -44.39161682128906, "global_step": 344745, "epoch": 2849} {"train_loss": -41.822242736816406, "global_step": 344746, "epoch": 2849} {"train_loss": -44.24883270263672, "global_step": 344747, "epoch": 2849} {"train_loss": -41.83555221557617, "global_step": 344748, "epoch": 2849} {"train_loss": -44.08870315551758, "global_step": 344749, "epoch": 2849} {"train_loss": -41.544490814208984, "global_step": 344750, "epoch": 2849} {"train_loss": -44.10392761230469, "global_step": 344751, "epoch": 2849} {"train_loss": -42.56026840209961, "global_step": 344752, "epoch": 2849} {"train_loss": -43.84999465942383, "global_step": 344753, "epoch": 2849} {"train_loss": -43.13560485839844, "global_step": 344754, "epoch": 2849} {"train_loss": -44.38459396362305, "global_step": 344755, "epoch": 2849} {"train_loss": -44.28804016113281, "global_step": 344756, "epoch": 2849} {"train_loss": -44.476417541503906, "global_step": 344757, "epoch": 2849} {"train_loss": -44.411865234375, "global_step": 344758, "epoch": 2849} {"train_loss": -44.3582649230957, "global_step": 344759, "epoch": 2849} {"train_loss": -44.32212448120117, "global_step": 344760, "epoch": 2849} {"train_loss": -44.33872604370117, "global_step": 344761, "epoch": 2849} {"train_loss": -44.4112663269043, "global_step": 344762, "epoch": 2849} {"train_loss": -44.59904479980469, "global_step": 344763, "epoch": 2849} {"train_loss": -44.98030090332031, "global_step": 344764, "epoch": 2849} {"train_loss": -44.85805130004883, "global_step": 344765, "epoch": 2849} {"train_loss": -45.04353332519531, "global_step": 344766, "epoch": 2849} {"train_loss": -45.18952941894531, "global_step": 344767, "epoch": 2849} {"train_loss": -44.48305892944336, "global_step": 344768, "epoch": 2849} {"train_loss": -44.77897644042969, "global_step": 344769, "epoch": 2849} {"train_loss": -43.878257751464844, "global_step": 344770, "epoch": 2849} {"train_loss": -45.250484466552734, "global_step": 344771, "epoch": 2849} {"train_loss": -44.44166946411133, "global_step": 344772, "epoch": 2849} {"train_loss": -44.29700469970703, "global_step": 344773, "epoch": 2849} {"train_loss": -44.800724029541016, "global_step": 344774, "epoch": 2849} {"train_loss": -44.14788818359375, "global_step": 344775, "epoch": 2849} {"train_loss": -45.095951080322266, "global_step": 344776, "epoch": 2849} {"train_loss": -44.54704666137695, "global_step": 344777, "epoch": 2849} {"train_loss": -44.79697799682617, "global_step": 344778, "epoch": 2849} {"train_loss": -45.22428512573242, "global_step": 344779, "epoch": 2849} {"train_loss": -45.149574279785156, "global_step": 344780, "epoch": 2849} {"train_loss": -45.53656768798828, "global_step": 344781, "epoch": 2849} {"train_loss": -45.1374626159668, "global_step": 344782, "epoch": 2849} {"train_loss": -45.506324768066406, "global_step": 344783, "epoch": 2849} {"train_loss": -44.92003631591797, "global_step": 344784, "epoch": 2849} {"train_loss": -45.021541595458984, "global_step": 344785, "epoch": 2849} {"train_loss": -45.272396087646484, "global_step": 344786, "epoch": 2849} {"train_loss": -45.00131607055664, "global_step": 344787, "epoch": 2849} {"train_loss": -45.1199951171875, "global_step": 344788, "epoch": 2849} {"train_loss": -44.643150329589844, "global_step": 344789, "epoch": 2849} {"train_loss": -45.80332565307617, "global_step": 344790, "epoch": 2849} {"train_loss": -44.66231918334961, "global_step": 344791, "epoch": 2849} {"train_loss": -44.90271759033203, "global_step": 344792, "epoch": 2849} {"train_loss": -44.863563537597656, "global_step": 344793, "epoch": 2849} {"train_loss": -45.48686599731445, "global_step": 344794, "epoch": 2849} {"train_loss": -45.34193801879883, "global_step": 344795, "epoch": 2849} {"train_loss": -45.4347038269043, "global_step": 344796, "epoch": 2849} {"train_loss": -45.163970947265625, "global_step": 344797, "epoch": 2849} {"train_loss": -46.0434684753418, "global_step": 344798, "epoch": 2849} {"train_loss": -45.108673095703125, "global_step": 344799, "epoch": 2849} {"train_loss": -44.75910568237305, "global_step": 344800, "epoch": 2849} {"train_loss": -45.300289154052734, "global_step": 344801, "epoch": 2849} {"train_loss": -45.517879486083984, "global_step": 344802, "epoch": 2849} {"train_loss": -45.641910552978516, "global_step": 344803, "epoch": 2849} {"train_loss": -44.38353729248047, "global_step": 344804, "epoch": 2849} {"train_loss": -44.28554916381836, "global_step": 344805, "epoch": 2849} {"train_loss": -44.98834991455078, "global_step": 344806, "epoch": 2849} {"train_loss": -44.56514358520508, "global_step": 344807, "epoch": 2849} {"train_loss": -44.712581634521484, "global_step": 344808, "epoch": 2849} {"train_loss": -45.16992950439453, "global_step": 344809, "epoch": 2849} {"train_loss": -44.20906448364258, "global_step": 344810, "epoch": 2849} {"train_loss": -45.2083740234375, "global_step": 344811, "epoch": 2849} {"train_loss": -45.221435546875, "global_step": 344812, "epoch": 2849} {"train_loss": -45.7205924987793, "global_step": 344813, "epoch": 2849} {"train_loss": -45.211669921875, "global_step": 344814, "epoch": 2849} {"train_loss": -44.94427490234375, "global_step": 344815, "epoch": 2849} {"train_loss": -44.87148666381836, "global_step": 344816, "epoch": 2849} {"train_loss": -45.314292907714844, "global_step": 344817, "epoch": 2849} {"train_loss": -44.63979721069336, "global_step": 344818, "epoch": 2849} {"train_loss": -45.44956588745117, "global_step": 344819, "epoch": 2849} {"train_loss": -44.380741119384766, "global_step": 344820, "epoch": 2849} {"train_loss": -44.162757873535156, "global_step": 344821, "epoch": 2849} {"train_loss": -44.7186393737793, "global_step": 344822, "epoch": 2849} {"train_loss": -44.93584060668945, "global_step": 344823, "epoch": 2849} {"train_loss": -43.73805236816406, "global_step": 344824, "epoch": 2849} {"train_loss": -42.215553283691406, "global_step": 344825, "epoch": 2849} {"train_loss": -44.01119613647461, "global_step": 344826, "epoch": 2849} {"train_loss": -43.81344985961914, "global_step": 344827, "epoch": 2849} {"train_loss": -41.44435501098633, "global_step": 344828, "epoch": 2849} {"train_loss": -43.31754684448242, "global_step": 344829, "epoch": 2849} {"train_loss": -44.10340118408203, "global_step": 344830, "epoch": 2849} {"train_loss": -43.431270599365234, "global_step": 344831, "epoch": 2849} {"train_loss": -43.605796813964844, "global_step": 344832, "epoch": 2849} {"train_loss": -43.939369201660156, "global_step": 344833, "epoch": 2849} {"train_loss": -42.49203109741211, "global_step": 344834, "epoch": 2849} {"train_loss": -42.85838317871094, "global_step": 344835, "epoch": 2849} {"train_loss": -44.470272064208984, "global_step": 344836, "epoch": 2849} {"train_loss": -44.18800735473633, "global_step": 344837, "epoch": 2849} {"train_loss": -43.00403594970703, "global_step": 344838, "epoch": 2849} {"train_loss": -44.134437561035156, "global_step": 344839, "epoch": 2849} {"train_loss": -43.66209411621094, "global_step": 344840, "epoch": 2849} {"train_loss": -43.98919677734375, "global_step": 344841, "epoch": 2849} {"train_loss": -44.45732498168945, "global_step": 344842, "epoch": 2849} {"train_loss": -44.38386917114258, "global_step": 344843, "epoch": 2849} {"train_loss": -44.14742660522461, "global_step": 344844, "epoch": 2849} {"train_loss": -44.023433685302734, "global_step": 344845, "epoch": 2849} {"train_loss": -43.441768646240234, "global_step": 344846, "epoch": 2849} {"train_loss": -43.1925163269043, "global_step": 344847, "epoch": 2849} {"train_loss": -44.08526611328125, "global_step": 344848, "epoch": 2849} {"train_loss": -44.256782878528945, "global_step": 344849, "epoch": 2849, "val_loss": 2558648.5} {"train_loss": -42.63765335083008, "global_step": 344850, "epoch": 2850} {"train_loss": -44.52836990356445, "global_step": 344851, "epoch": 2850} {"train_loss": -44.28731155395508, "global_step": 344852, "epoch": 2850} {"train_loss": -43.20911407470703, "global_step": 344853, "epoch": 2850} {"train_loss": -44.38698959350586, "global_step": 344854, "epoch": 2850} {"train_loss": -43.0250129699707, "global_step": 344855, "epoch": 2850} {"train_loss": -44.56167984008789, "global_step": 344856, "epoch": 2850} {"train_loss": -44.068992614746094, "global_step": 344857, "epoch": 2850} {"train_loss": -43.55049514770508, "global_step": 344858, "epoch": 2850} {"train_loss": -44.65212631225586, "global_step": 344859, "epoch": 2850} {"train_loss": -43.89278030395508, "global_step": 344860, "epoch": 2850} {"train_loss": -44.01074981689453, "global_step": 344861, "epoch": 2850} {"train_loss": -44.803096771240234, "global_step": 344862, "epoch": 2850} {"train_loss": -43.254024505615234, "global_step": 344863, "epoch": 2850} {"train_loss": -44.10568618774414, "global_step": 344864, "epoch": 2850} {"train_loss": -44.1639404296875, "global_step": 344865, "epoch": 2850} {"train_loss": -44.455810546875, "global_step": 344866, "epoch": 2850} {"train_loss": -44.58967971801758, "global_step": 344867, "epoch": 2850} {"train_loss": -44.36827850341797, "global_step": 344868, "epoch": 2850} {"train_loss": -44.74174118041992, "global_step": 344869, "epoch": 2850} {"train_loss": -44.57269287109375, "global_step": 344870, "epoch": 2850} {"train_loss": -44.37062454223633, "global_step": 344871, "epoch": 2850} {"train_loss": -45.35378646850586, "global_step": 344872, "epoch": 2850} {"train_loss": -43.97429275512695, "global_step": 344873, "epoch": 2850} {"train_loss": -44.583553314208984, "global_step": 344874, "epoch": 2850} {"train_loss": -44.36405563354492, "global_step": 344875, "epoch": 2850} {"train_loss": -44.487648010253906, "global_step": 344876, "epoch": 2850} {"train_loss": -43.47853469848633, "global_step": 344877, "epoch": 2850} {"train_loss": -44.56372833251953, "global_step": 344878, "epoch": 2850} {"train_loss": -44.31985092163086, "global_step": 344879, "epoch": 2850} {"train_loss": -44.31084442138672, "global_step": 344880, "epoch": 2850} {"train_loss": -44.98708724975586, "global_step": 344881, "epoch": 2850} {"train_loss": -44.32080841064453, "global_step": 344882, "epoch": 2850} {"train_loss": -44.76498794555664, "global_step": 344883, "epoch": 2850} {"train_loss": -44.731353759765625, "global_step": 344884, "epoch": 2850} {"train_loss": -45.20054626464844, "global_step": 344885, "epoch": 2850} {"train_loss": -44.09553909301758, "global_step": 344886, "epoch": 2850} {"train_loss": -44.36481857299805, "global_step": 344887, "epoch": 2850} {"train_loss": -44.691402435302734, "global_step": 344888, "epoch": 2850} {"train_loss": -44.60999298095703, "global_step": 344889, "epoch": 2850} {"train_loss": -44.41141891479492, "global_step": 344890, "epoch": 2850} {"train_loss": -44.76534652709961, "global_step": 344891, "epoch": 2850} {"train_loss": -43.8277473449707, "global_step": 344892, "epoch": 2850} {"train_loss": -43.454830169677734, "global_step": 344893, "epoch": 2850} {"train_loss": -44.96620559692383, "global_step": 344894, "epoch": 2850} {"train_loss": -43.485023498535156, "global_step": 344895, "epoch": 2850} {"train_loss": -45.51548385620117, "global_step": 344896, "epoch": 2850} {"train_loss": -43.66901779174805, "global_step": 344897, "epoch": 2850} {"train_loss": -44.76754379272461, "global_step": 344898, "epoch": 2850} {"train_loss": -44.53318405151367, "global_step": 344899, "epoch": 2850} {"train_loss": -44.662139892578125, "global_step": 344900, "epoch": 2850} {"train_loss": -44.787330627441406, "global_step": 344901, "epoch": 2850} {"train_loss": -44.3685188293457, "global_step": 344902, "epoch": 2850} {"train_loss": -44.93178939819336, "global_step": 344903, "epoch": 2850} {"train_loss": -44.299312591552734, "global_step": 344904, "epoch": 2850} {"train_loss": -45.23977279663086, "global_step": 344905, "epoch": 2850} {"train_loss": -43.40511703491211, "global_step": 344906, "epoch": 2850} {"train_loss": -44.84272384643555, "global_step": 344907, "epoch": 2850} {"train_loss": -44.783721923828125, "global_step": 344908, "epoch": 2850} {"train_loss": -44.62191390991211, "global_step": 344909, "epoch": 2850} {"train_loss": -44.62385940551758, "global_step": 344910, "epoch": 2850} {"train_loss": -44.9069709777832, "global_step": 344911, "epoch": 2850} {"train_loss": -44.77994918823242, "global_step": 344912, "epoch": 2850} {"train_loss": -44.921974182128906, "global_step": 344913, "epoch": 2850} {"train_loss": -44.0471076965332, "global_step": 344914, "epoch": 2850} {"train_loss": -45.10882568359375, "global_step": 344915, "epoch": 2850} {"train_loss": -44.206336975097656, "global_step": 344916, "epoch": 2850} {"train_loss": -43.792396545410156, "global_step": 344917, "epoch": 2850} {"train_loss": -45.13749313354492, "global_step": 344918, "epoch": 2850} {"train_loss": -43.905879974365234, "global_step": 344919, "epoch": 2850} {"train_loss": -44.58628463745117, "global_step": 344920, "epoch": 2850} {"train_loss": -43.94253921508789, "global_step": 344921, "epoch": 2850} {"train_loss": -45.0966682434082, "global_step": 344922, "epoch": 2850} {"train_loss": -44.535316467285156, "global_step": 344923, "epoch": 2850} {"train_loss": -43.880348205566406, "global_step": 344924, "epoch": 2850} {"train_loss": -43.18169021606445, "global_step": 344925, "epoch": 2850} {"train_loss": -44.208187103271484, "global_step": 344926, "epoch": 2850} {"train_loss": -44.52345657348633, "global_step": 344927, "epoch": 2850} {"train_loss": -44.553070068359375, "global_step": 344928, "epoch": 2850} {"train_loss": -44.25883102416992, "global_step": 344929, "epoch": 2850} {"train_loss": -42.954227447509766, "global_step": 344930, "epoch": 2850} {"train_loss": -44.20315170288086, "global_step": 344931, "epoch": 2850} {"train_loss": -44.694000244140625, "global_step": 344932, "epoch": 2850} {"train_loss": -44.37681579589844, "global_step": 344933, "epoch": 2850} {"train_loss": -44.91306686401367, "global_step": 344934, "epoch": 2850} {"train_loss": -44.956214904785156, "global_step": 344935, "epoch": 2850} {"train_loss": -44.98894119262695, "global_step": 344936, "epoch": 2850} {"train_loss": -45.31715774536133, "global_step": 344937, "epoch": 2850} {"train_loss": -43.896888732910156, "global_step": 344938, "epoch": 2850} {"train_loss": -45.144344329833984, "global_step": 344939, "epoch": 2850} {"train_loss": -44.57190704345703, "global_step": 344940, "epoch": 2850} {"train_loss": -45.038612365722656, "global_step": 344941, "epoch": 2850} {"train_loss": -45.612056732177734, "global_step": 344942, "epoch": 2850} {"train_loss": -45.02521896362305, "global_step": 344943, "epoch": 2850} {"train_loss": -44.48573303222656, "global_step": 344944, "epoch": 2850} {"train_loss": -44.751731872558594, "global_step": 344945, "epoch": 2850} {"train_loss": -43.9726676940918, "global_step": 344946, "epoch": 2850} {"train_loss": -45.172203063964844, "global_step": 344947, "epoch": 2850} {"train_loss": -44.90245056152344, "global_step": 344948, "epoch": 2850} {"train_loss": -44.38692092895508, "global_step": 344949, "epoch": 2850} {"train_loss": -44.270809173583984, "global_step": 344950, "epoch": 2850} {"train_loss": -44.17586135864258, "global_step": 344951, "epoch": 2850} {"train_loss": -44.730133056640625, "global_step": 344952, "epoch": 2850} {"train_loss": -45.63446807861328, "global_step": 344953, "epoch": 2850} {"train_loss": -44.032039642333984, "global_step": 344954, "epoch": 2850} {"train_loss": -43.48549270629883, "global_step": 344955, "epoch": 2850} {"train_loss": -42.69862365722656, "global_step": 344956, "epoch": 2850} {"train_loss": -40.04487991333008, "global_step": 344957, "epoch": 2850} {"train_loss": -43.763832092285156, "global_step": 344958, "epoch": 2850} {"train_loss": -44.998870849609375, "global_step": 344959, "epoch": 2850} {"train_loss": -43.807735443115234, "global_step": 344960, "epoch": 2850} {"train_loss": -45.08747482299805, "global_step": 344961, "epoch": 2850} {"train_loss": -45.29080581665039, "global_step": 344962, "epoch": 2850} {"train_loss": -44.77161407470703, "global_step": 344963, "epoch": 2850} {"train_loss": -43.06425094604492, "global_step": 344964, "epoch": 2850} {"train_loss": -43.42798614501953, "global_step": 344965, "epoch": 2850} {"train_loss": -44.98554229736328, "global_step": 344966, "epoch": 2850} {"train_loss": -42.81351852416992, "global_step": 344967, "epoch": 2850} {"train_loss": -44.19207000732422, "global_step": 344968, "epoch": 2850} {"train_loss": -44.09937286376953, "global_step": 344969, "epoch": 2850} {"train_loss": -44.34181188157768, "global_step": 344970, "epoch": 2850, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 0.8333333333333334, "test/mean_score": 1.0, "val_loss": 2650866.75} {"train_loss": -37.413814544677734, "global_step": 344971, "epoch": 2851} {"train_loss": -44.59440231323242, "global_step": 344972, "epoch": 2851} {"train_loss": -41.77421951293945, "global_step": 344973, "epoch": 2851} {"train_loss": -43.25407409667969, "global_step": 344974, "epoch": 2851} {"train_loss": -43.18671798706055, "global_step": 344975, "epoch": 2851} {"train_loss": -42.916683197021484, "global_step": 344976, "epoch": 2851} {"train_loss": -44.11017990112305, "global_step": 344977, "epoch": 2851} {"train_loss": -41.84102249145508, "global_step": 344978, "epoch": 2851} {"train_loss": -42.61190414428711, "global_step": 344979, "epoch": 2851} {"train_loss": -43.38764953613281, "global_step": 344980, "epoch": 2851} {"train_loss": -42.25374984741211, "global_step": 344981, "epoch": 2851} {"train_loss": -43.357051849365234, "global_step": 344982, "epoch": 2851} {"train_loss": -43.01820755004883, "global_step": 344983, "epoch": 2851} {"train_loss": -43.04077911376953, "global_step": 344984, "epoch": 2851} {"train_loss": -44.4035758972168, "global_step": 344985, "epoch": 2851} {"train_loss": -44.3878288269043, "global_step": 344986, "epoch": 2851} {"train_loss": -42.98346710205078, "global_step": 344987, "epoch": 2851} {"train_loss": -43.81684112548828, "global_step": 344988, "epoch": 2851} {"train_loss": -44.433372497558594, "global_step": 344989, "epoch": 2851} {"train_loss": -43.634700775146484, "global_step": 344990, "epoch": 2851} {"train_loss": -44.15401077270508, "global_step": 344991, "epoch": 2851} {"train_loss": -43.542964935302734, "global_step": 344992, "epoch": 2851} {"train_loss": -44.328189849853516, "global_step": 344993, "epoch": 2851} {"train_loss": -43.39185333251953, "global_step": 344994, "epoch": 2851} {"train_loss": -44.88100051879883, "global_step": 344995, "epoch": 2851} {"train_loss": -44.00470733642578, "global_step": 344996, "epoch": 2851} {"train_loss": -41.86077880859375, "global_step": 344997, "epoch": 2851} {"train_loss": -43.91880798339844, "global_step": 344998, "epoch": 2851} {"train_loss": -44.20681381225586, "global_step": 344999, "epoch": 2851} {"train_loss": -44.72214889526367, "global_step": 345000, "epoch": 2851} {"train_loss": -43.97048568725586, "global_step": 345001, "epoch": 2851} {"train_loss": -44.191986083984375, "global_step": 345002, "epoch": 2851} {"train_loss": -43.779693603515625, "global_step": 345003, "epoch": 2851} {"train_loss": -44.12853240966797, "global_step": 345004, "epoch": 2851} {"train_loss": -44.15047073364258, "global_step": 345005, "epoch": 2851} {"train_loss": -43.823543548583984, "global_step": 345006, "epoch": 2851} {"train_loss": -43.971282958984375, "global_step": 345007, "epoch": 2851} {"train_loss": -43.963523864746094, "global_step": 345008, "epoch": 2851} {"train_loss": -44.24528503417969, "global_step": 345009, "epoch": 2851} {"train_loss": -44.82417678833008, "global_step": 345010, "epoch": 2851} {"train_loss": -44.52888107299805, "global_step": 345011, "epoch": 2851} {"train_loss": -44.30367660522461, "global_step": 345012, "epoch": 2851} {"train_loss": -44.64289093017578, "global_step": 345013, "epoch": 2851} {"train_loss": -44.804351806640625, "global_step": 345014, "epoch": 2851} {"train_loss": -44.70234298706055, "global_step": 345015, "epoch": 2851} {"train_loss": -44.15279006958008, "global_step": 345016, "epoch": 2851} {"train_loss": -44.575279235839844, "global_step": 345017, "epoch": 2851} {"train_loss": -45.19945526123047, "global_step": 345018, "epoch": 2851} {"train_loss": -45.06461715698242, "global_step": 345019, "epoch": 2851} {"train_loss": -45.34761428833008, "global_step": 345020, "epoch": 2851} {"train_loss": -44.12881088256836, "global_step": 345021, "epoch": 2851} {"train_loss": -44.95089340209961, "global_step": 345022, "epoch": 2851} {"train_loss": -44.5811882019043, "global_step": 345023, "epoch": 2851} {"train_loss": -44.99372100830078, "global_step": 345024, "epoch": 2851} {"train_loss": -45.25015640258789, "global_step": 345025, "epoch": 2851} {"train_loss": -44.73268508911133, "global_step": 345026, "epoch": 2851} {"train_loss": -45.22988510131836, "global_step": 345027, "epoch": 2851} {"train_loss": -44.893245697021484, "global_step": 345028, "epoch": 2851} {"train_loss": -44.67755889892578, "global_step": 345029, "epoch": 2851} {"train_loss": -45.1829948425293, "global_step": 345030, "epoch": 2851} {"train_loss": -45.75654983520508, "global_step": 345031, "epoch": 2851} {"train_loss": -45.33436965942383, "global_step": 345032, "epoch": 2851} {"train_loss": -44.86393356323242, "global_step": 345033, "epoch": 2851} {"train_loss": -45.15138626098633, "global_step": 345034, "epoch": 2851} {"train_loss": -45.55531311035156, "global_step": 345035, "epoch": 2851} {"train_loss": -44.78719711303711, "global_step": 345036, "epoch": 2851} {"train_loss": -44.9438591003418, "global_step": 345037, "epoch": 2851} {"train_loss": -44.67464065551758, "global_step": 345038, "epoch": 2851} {"train_loss": -45.035552978515625, "global_step": 345039, "epoch": 2851} {"train_loss": -42.96429443359375, "global_step": 345040, "epoch": 2851} {"train_loss": -44.56281661987305, "global_step": 345041, "epoch": 2851} {"train_loss": -44.374366760253906, "global_step": 345042, "epoch": 2851} {"train_loss": -44.35129928588867, "global_step": 345043, "epoch": 2851} {"train_loss": -44.21944046020508, "global_step": 345044, "epoch": 2851} {"train_loss": -44.944313049316406, "global_step": 345045, "epoch": 2851} {"train_loss": -45.06336212158203, "global_step": 345046, "epoch": 2851} {"train_loss": -44.81150436401367, "global_step": 345047, "epoch": 2851} {"train_loss": -45.046382904052734, "global_step": 345048, "epoch": 2851} {"train_loss": -43.7323112487793, "global_step": 345049, "epoch": 2851} {"train_loss": -42.770484924316406, "global_step": 345050, "epoch": 2851} {"train_loss": -44.31480026245117, "global_step": 345051, "epoch": 2851} {"train_loss": -45.509647369384766, "global_step": 345052, "epoch": 2851} {"train_loss": -43.55091857910156, "global_step": 345053, "epoch": 2851} {"train_loss": -42.91367721557617, "global_step": 345054, "epoch": 2851} {"train_loss": -44.62043762207031, "global_step": 345055, "epoch": 2851} {"train_loss": -45.78754806518555, "global_step": 345056, "epoch": 2851} {"train_loss": -44.05064010620117, "global_step": 345057, "epoch": 2851} {"train_loss": -44.582881927490234, "global_step": 345058, "epoch": 2851} {"train_loss": -45.042236328125, "global_step": 345059, "epoch": 2851} {"train_loss": -43.91646194458008, "global_step": 345060, "epoch": 2851} {"train_loss": -43.245113372802734, "global_step": 345061, "epoch": 2851} {"train_loss": -44.61262130737305, "global_step": 345062, "epoch": 2851} {"train_loss": -44.7125358581543, "global_step": 345063, "epoch": 2851} {"train_loss": -44.60503387451172, "global_step": 345064, "epoch": 2851} {"train_loss": -44.22983932495117, "global_step": 345065, "epoch": 2851} {"train_loss": -43.53129196166992, "global_step": 345066, "epoch": 2851} {"train_loss": -44.922245025634766, "global_step": 345067, "epoch": 2851} {"train_loss": -45.29642868041992, "global_step": 345068, "epoch": 2851} {"train_loss": -44.950077056884766, "global_step": 345069, "epoch": 2851} {"train_loss": -45.03481674194336, "global_step": 345070, "epoch": 2851} {"train_loss": -45.132869720458984, "global_step": 345071, "epoch": 2851} {"train_loss": -44.715858459472656, "global_step": 345072, "epoch": 2851} {"train_loss": -44.229217529296875, "global_step": 345073, "epoch": 2851} {"train_loss": -45.1998405456543, "global_step": 345074, "epoch": 2851} {"train_loss": -45.01329803466797, "global_step": 345075, "epoch": 2851} {"train_loss": -45.09418487548828, "global_step": 345076, "epoch": 2851} {"train_loss": -42.72420120239258, "global_step": 345077, "epoch": 2851} {"train_loss": -43.81142807006836, "global_step": 345078, "epoch": 2851} {"train_loss": -45.01092529296875, "global_step": 345079, "epoch": 2851} {"train_loss": -45.07319259643555, "global_step": 345080, "epoch": 2851} {"train_loss": -43.896949768066406, "global_step": 345081, "epoch": 2851} {"train_loss": -42.898719787597656, "global_step": 345082, "epoch": 2851} {"train_loss": -43.67103958129883, "global_step": 345083, "epoch": 2851} {"train_loss": -43.88866424560547, "global_step": 345084, "epoch": 2851} {"train_loss": -43.18428421020508, "global_step": 345085, "epoch": 2851} {"train_loss": -44.82651901245117, "global_step": 345086, "epoch": 2851} {"train_loss": -43.76735305786133, "global_step": 345087, "epoch": 2851} {"train_loss": -43.97871017456055, "global_step": 345088, "epoch": 2851} {"train_loss": -45.385093688964844, "global_step": 345089, "epoch": 2851} {"train_loss": -43.769405364990234, "global_step": 345090, "epoch": 2851} {"train_loss": -44.19498985858003, "global_step": 345091, "epoch": 2851, "val_loss": 2519898.75} {"train_loss": -43.928558349609375, "global_step": 345092, "epoch": 2852} {"train_loss": -44.44173812866211, "global_step": 345093, "epoch": 2852} {"train_loss": -44.468387603759766, "global_step": 345094, "epoch": 2852} {"train_loss": -44.70644760131836, "global_step": 345095, "epoch": 2852} {"train_loss": -44.23247146606445, "global_step": 345096, "epoch": 2852} {"train_loss": -43.36648178100586, "global_step": 345097, "epoch": 2852} {"train_loss": -44.242862701416016, "global_step": 345098, "epoch": 2852} {"train_loss": -43.84736251831055, "global_step": 345099, "epoch": 2852} {"train_loss": -44.628265380859375, "global_step": 345100, "epoch": 2852} {"train_loss": -44.386009216308594, "global_step": 345101, "epoch": 2852} {"train_loss": -43.44454574584961, "global_step": 345102, "epoch": 2852} {"train_loss": -44.98991012573242, "global_step": 345103, "epoch": 2852} {"train_loss": -44.8953971862793, "global_step": 345104, "epoch": 2852} {"train_loss": -43.993228912353516, "global_step": 345105, "epoch": 2852} {"train_loss": -44.47817611694336, "global_step": 345106, "epoch": 2852} {"train_loss": -44.33972930908203, "global_step": 345107, "epoch": 2852} {"train_loss": -44.7495002746582, "global_step": 345108, "epoch": 2852} {"train_loss": -44.0504264831543, "global_step": 345109, "epoch": 2852} {"train_loss": -44.94409942626953, "global_step": 345110, "epoch": 2852} {"train_loss": -44.199363708496094, "global_step": 345111, "epoch": 2852} {"train_loss": -43.6673583984375, "global_step": 345112, "epoch": 2852} {"train_loss": -44.953609466552734, "global_step": 345113, "epoch": 2852} {"train_loss": -44.18110275268555, "global_step": 345114, "epoch": 2852} {"train_loss": -44.374847412109375, "global_step": 345115, "epoch": 2852} {"train_loss": -44.62240219116211, "global_step": 345116, "epoch": 2852} {"train_loss": -44.490718841552734, "global_step": 345117, "epoch": 2852} {"train_loss": -44.783447265625, "global_step": 345118, "epoch": 2852} {"train_loss": -45.07590866088867, "global_step": 345119, "epoch": 2852} {"train_loss": -44.50580978393555, "global_step": 345120, "epoch": 2852} {"train_loss": -45.14970016479492, "global_step": 345121, "epoch": 2852} {"train_loss": -44.86639404296875, "global_step": 345122, "epoch": 2852} {"train_loss": -44.268836975097656, "global_step": 345123, "epoch": 2852} {"train_loss": -44.48665237426758, "global_step": 345124, "epoch": 2852} {"train_loss": -44.24355697631836, "global_step": 345125, "epoch": 2852} {"train_loss": -45.12099075317383, "global_step": 345126, "epoch": 2852} {"train_loss": -44.33467102050781, "global_step": 345127, "epoch": 2852} {"train_loss": -43.58487319946289, "global_step": 345128, "epoch": 2852} {"train_loss": -45.15810775756836, "global_step": 345129, "epoch": 2852} {"train_loss": -44.50892639160156, "global_step": 345130, "epoch": 2852} {"train_loss": -44.653358459472656, "global_step": 345131, "epoch": 2852} {"train_loss": -44.44816207885742, "global_step": 345132, "epoch": 2852} {"train_loss": -44.90266799926758, "global_step": 345133, "epoch": 2852} {"train_loss": -44.81332015991211, "global_step": 345134, "epoch": 2852} {"train_loss": -44.65788269042969, "global_step": 345135, "epoch": 2852} {"train_loss": -44.682777404785156, "global_step": 345136, "epoch": 2852} {"train_loss": -45.46334457397461, "global_step": 345137, "epoch": 2852} {"train_loss": -44.02267074584961, "global_step": 345138, "epoch": 2852} {"train_loss": -45.21780014038086, "global_step": 345139, "epoch": 2852} {"train_loss": -45.51890563964844, "global_step": 345140, "epoch": 2852} {"train_loss": -45.12626266479492, "global_step": 345141, "epoch": 2852} {"train_loss": -44.786956787109375, "global_step": 345142, "epoch": 2852} {"train_loss": -44.58651351928711, "global_step": 345143, "epoch": 2852} {"train_loss": -45.630218505859375, "global_step": 345144, "epoch": 2852} {"train_loss": -44.69392776489258, "global_step": 345145, "epoch": 2852} {"train_loss": -45.34780502319336, "global_step": 345146, "epoch": 2852} {"train_loss": -45.091732025146484, "global_step": 345147, "epoch": 2852} {"train_loss": -45.1745719909668, "global_step": 345148, "epoch": 2852} {"train_loss": -45.134521484375, "global_step": 345149, "epoch": 2852} {"train_loss": -44.675506591796875, "global_step": 345150, "epoch": 2852} {"train_loss": -44.915164947509766, "global_step": 345151, "epoch": 2852} {"train_loss": -45.22339630126953, "global_step": 345152, "epoch": 2852} {"train_loss": -44.711036682128906, "global_step": 345153, "epoch": 2852} {"train_loss": -44.78820037841797, "global_step": 345154, "epoch": 2852} {"train_loss": -45.10372543334961, "global_step": 345155, "epoch": 2852} {"train_loss": -44.64352035522461, "global_step": 345156, "epoch": 2852} {"train_loss": -45.25690460205078, "global_step": 345157, "epoch": 2852} {"train_loss": -44.93964767456055, "global_step": 345158, "epoch": 2852} {"train_loss": -44.996822357177734, "global_step": 345159, "epoch": 2852} {"train_loss": -44.04353332519531, "global_step": 345160, "epoch": 2852} {"train_loss": -44.45907211303711, "global_step": 345161, "epoch": 2852} {"train_loss": -45.567169189453125, "global_step": 345162, "epoch": 2852} {"train_loss": -44.700843811035156, "global_step": 345163, "epoch": 2852} {"train_loss": -44.9438591003418, "global_step": 345164, "epoch": 2852} {"train_loss": -44.647701263427734, "global_step": 345165, "epoch": 2852} {"train_loss": -44.44887924194336, "global_step": 345166, "epoch": 2852} {"train_loss": -45.065887451171875, "global_step": 345167, "epoch": 2852} {"train_loss": -43.008949279785156, "global_step": 345168, "epoch": 2852} {"train_loss": -42.530799865722656, "global_step": 345169, "epoch": 2852} {"train_loss": -44.75938034057617, "global_step": 345170, "epoch": 2852} {"train_loss": -43.088661193847656, "global_step": 345171, "epoch": 2852} {"train_loss": -42.5303955078125, "global_step": 345172, "epoch": 2852} {"train_loss": -43.5377197265625, "global_step": 345173, "epoch": 2852} {"train_loss": -43.422454833984375, "global_step": 345174, "epoch": 2852} {"train_loss": -44.377052307128906, "global_step": 345175, "epoch": 2852} {"train_loss": -42.65797424316406, "global_step": 345176, "epoch": 2852} {"train_loss": -43.06199264526367, "global_step": 345177, "epoch": 2852} {"train_loss": -42.41097640991211, "global_step": 345178, "epoch": 2852} {"train_loss": -42.85676193237305, "global_step": 345179, "epoch": 2852} {"train_loss": -43.890968322753906, "global_step": 345180, "epoch": 2852} {"train_loss": -44.093849182128906, "global_step": 345181, "epoch": 2852} {"train_loss": -43.42628479003906, "global_step": 345182, "epoch": 2852} {"train_loss": -43.8328857421875, "global_step": 345183, "epoch": 2852} {"train_loss": -43.36325454711914, "global_step": 345184, "epoch": 2852} {"train_loss": -42.98512649536133, "global_step": 345185, "epoch": 2852} {"train_loss": -44.432037353515625, "global_step": 345186, "epoch": 2852} {"train_loss": -43.87066650390625, "global_step": 345187, "epoch": 2852} {"train_loss": -44.02725601196289, "global_step": 345188, "epoch": 2852} {"train_loss": -43.57191848754883, "global_step": 345189, "epoch": 2852} {"train_loss": -43.62015151977539, "global_step": 345190, "epoch": 2852} {"train_loss": -43.72036361694336, "global_step": 345191, "epoch": 2852} {"train_loss": -43.950164794921875, "global_step": 345192, "epoch": 2852} {"train_loss": -42.18263244628906, "global_step": 345193, "epoch": 2852} {"train_loss": -43.25044631958008, "global_step": 345194, "epoch": 2852} {"train_loss": -45.06343078613281, "global_step": 345195, "epoch": 2852} {"train_loss": -42.92118835449219, "global_step": 345196, "epoch": 2852} {"train_loss": -44.3077278137207, "global_step": 345197, "epoch": 2852} {"train_loss": -44.24939727783203, "global_step": 345198, "epoch": 2852} {"train_loss": -43.600521087646484, "global_step": 345199, "epoch": 2852} {"train_loss": -44.215126037597656, "global_step": 345200, "epoch": 2852} {"train_loss": -44.32830810546875, "global_step": 345201, "epoch": 2852} {"train_loss": -44.80924606323242, "global_step": 345202, "epoch": 2852} {"train_loss": -45.12165451049805, "global_step": 345203, "epoch": 2852} {"train_loss": -42.56536865234375, "global_step": 345204, "epoch": 2852} {"train_loss": -44.545467376708984, "global_step": 345205, "epoch": 2852} {"train_loss": -42.992950439453125, "global_step": 345206, "epoch": 2852} {"train_loss": -45.0486946105957, "global_step": 345207, "epoch": 2852} {"train_loss": -43.22892379760742, "global_step": 345208, "epoch": 2852} {"train_loss": -44.058040618896484, "global_step": 345209, "epoch": 2852} {"train_loss": -43.653602600097656, "global_step": 345210, "epoch": 2852} {"train_loss": -44.93206787109375, "global_step": 345211, "epoch": 2852} {"train_loss": -44.297120464734796, "global_step": 345212, "epoch": 2852, "val_loss": 2485084.75} {"train_loss": -45.45486831665039, "global_step": 345213, "epoch": 2853} {"train_loss": -44.28072738647461, "global_step": 345214, "epoch": 2853} {"train_loss": -44.961631774902344, "global_step": 345215, "epoch": 2853} {"train_loss": -45.72503662109375, "global_step": 345216, "epoch": 2853} {"train_loss": -44.80075454711914, "global_step": 345217, "epoch": 2853} {"train_loss": -44.67359161376953, "global_step": 345218, "epoch": 2853} {"train_loss": -44.64316940307617, "global_step": 345219, "epoch": 2853} {"train_loss": -44.95450973510742, "global_step": 345220, "epoch": 2853} {"train_loss": -44.784332275390625, "global_step": 345221, "epoch": 2853} {"train_loss": -45.515621185302734, "global_step": 345222, "epoch": 2853} {"train_loss": -45.39067840576172, "global_step": 345223, "epoch": 2853} {"train_loss": -45.328121185302734, "global_step": 345224, "epoch": 2853} {"train_loss": -45.969032287597656, "global_step": 345225, "epoch": 2853} {"train_loss": -45.5430793762207, "global_step": 345226, "epoch": 2853} {"train_loss": -45.728755950927734, "global_step": 345227, "epoch": 2853} {"train_loss": -45.82764434814453, "global_step": 345228, "epoch": 2853} {"train_loss": -45.64693069458008, "global_step": 345229, "epoch": 2853} {"train_loss": -45.24642562866211, "global_step": 345230, "epoch": 2853} {"train_loss": -45.85958480834961, "global_step": 345231, "epoch": 2853} {"train_loss": -46.01009750366211, "global_step": 345232, "epoch": 2853} {"train_loss": -45.77500534057617, "global_step": 345233, "epoch": 2853} {"train_loss": -45.91206741333008, "global_step": 345234, "epoch": 2853} {"train_loss": -46.10994338989258, "global_step": 345235, "epoch": 2853} {"train_loss": -45.81020736694336, "global_step": 345236, "epoch": 2853} {"train_loss": -45.8222770690918, "global_step": 345237, "epoch": 2853} {"train_loss": -45.65809631347656, "global_step": 345238, "epoch": 2853} {"train_loss": -45.66941452026367, "global_step": 345239, "epoch": 2853} {"train_loss": -45.41066360473633, "global_step": 345240, "epoch": 2853} {"train_loss": -45.18276596069336, "global_step": 345241, "epoch": 2853} {"train_loss": -45.7365837097168, "global_step": 345242, "epoch": 2853} {"train_loss": -45.605403900146484, "global_step": 345243, "epoch": 2853} {"train_loss": -46.0542106628418, "global_step": 345244, "epoch": 2853} {"train_loss": -45.65751266479492, "global_step": 345245, "epoch": 2853} {"train_loss": -45.012203216552734, "global_step": 345246, "epoch": 2853} {"train_loss": -44.58846664428711, "global_step": 345247, "epoch": 2853} {"train_loss": -45.922279357910156, "global_step": 345248, "epoch": 2853} {"train_loss": -45.75008773803711, "global_step": 345249, "epoch": 2853} {"train_loss": -45.45433044433594, "global_step": 345250, "epoch": 2853} {"train_loss": -44.822044372558594, "global_step": 345251, "epoch": 2853} {"train_loss": -42.63436508178711, "global_step": 345252, "epoch": 2853} {"train_loss": -44.95956039428711, "global_step": 345253, "epoch": 2853} {"train_loss": -44.60321044921875, "global_step": 345254, "epoch": 2853} {"train_loss": -43.294376373291016, "global_step": 345255, "epoch": 2853} {"train_loss": -39.51005554199219, "global_step": 345256, "epoch": 2853} {"train_loss": -45.491329193115234, "global_step": 345257, "epoch": 2853} {"train_loss": -40.376861572265625, "global_step": 345258, "epoch": 2853} {"train_loss": -39.60306930541992, "global_step": 345259, "epoch": 2853} {"train_loss": -41.8784065246582, "global_step": 345260, "epoch": 2853} {"train_loss": -36.236610412597656, "global_step": 345261, "epoch": 2853} {"train_loss": -42.70204544067383, "global_step": 345262, "epoch": 2853} {"train_loss": -40.26179122924805, "global_step": 345263, "epoch": 2853} {"train_loss": -43.702308654785156, "global_step": 345264, "epoch": 2853} {"train_loss": -40.57769012451172, "global_step": 345265, "epoch": 2853} {"train_loss": -40.6383171081543, "global_step": 345266, "epoch": 2853} {"train_loss": -43.102508544921875, "global_step": 345267, "epoch": 2853} {"train_loss": -40.606773376464844, "global_step": 345268, "epoch": 2853} {"train_loss": -41.524436950683594, "global_step": 345269, "epoch": 2853} {"train_loss": -42.39823532104492, "global_step": 345270, "epoch": 2853} {"train_loss": -39.27450180053711, "global_step": 345271, "epoch": 2853} {"train_loss": -42.94300842285156, "global_step": 345272, "epoch": 2853} {"train_loss": -43.129024505615234, "global_step": 345273, "epoch": 2853} {"train_loss": -42.02517318725586, "global_step": 345274, "epoch": 2853} {"train_loss": -42.66811752319336, "global_step": 345275, "epoch": 2853} {"train_loss": -42.39667892456055, "global_step": 345276, "epoch": 2853} {"train_loss": -43.322364807128906, "global_step": 345277, "epoch": 2853} {"train_loss": -43.927486419677734, "global_step": 345278, "epoch": 2853} {"train_loss": -43.51088333129883, "global_step": 345279, "epoch": 2853} {"train_loss": -43.537513732910156, "global_step": 345280, "epoch": 2853} {"train_loss": -43.645233154296875, "global_step": 345281, "epoch": 2853} {"train_loss": -43.38363265991211, "global_step": 345282, "epoch": 2853} {"train_loss": -42.74172592163086, "global_step": 345283, "epoch": 2853} {"train_loss": -43.663612365722656, "global_step": 345284, "epoch": 2853} {"train_loss": -43.638038635253906, "global_step": 345285, "epoch": 2853} {"train_loss": -43.5551643371582, "global_step": 345286, "epoch": 2853} {"train_loss": -43.02727508544922, "global_step": 345287, "epoch": 2853} {"train_loss": -42.52168273925781, "global_step": 345288, "epoch": 2853} {"train_loss": -44.545711517333984, "global_step": 345289, "epoch": 2853} {"train_loss": -43.5054931640625, "global_step": 345290, "epoch": 2853} {"train_loss": -44.1221923828125, "global_step": 345291, "epoch": 2853} {"train_loss": -43.879852294921875, "global_step": 345292, "epoch": 2853} {"train_loss": -42.77827835083008, "global_step": 345293, "epoch": 2853} {"train_loss": -44.306331634521484, "global_step": 345294, "epoch": 2853} {"train_loss": -43.982749938964844, "global_step": 345295, "epoch": 2853} {"train_loss": -44.007686614990234, "global_step": 345296, "epoch": 2853} {"train_loss": -44.44544219970703, "global_step": 345297, "epoch": 2853} {"train_loss": -43.541500091552734, "global_step": 345298, "epoch": 2853} {"train_loss": -44.4034538269043, "global_step": 345299, "epoch": 2853} {"train_loss": -44.211997985839844, "global_step": 345300, "epoch": 2853} {"train_loss": -43.9145622253418, "global_step": 345301, "epoch": 2853} {"train_loss": -44.49165725708008, "global_step": 345302, "epoch": 2853} {"train_loss": -44.4829216003418, "global_step": 345303, "epoch": 2853} {"train_loss": -44.07121658325195, "global_step": 345304, "epoch": 2853} {"train_loss": -44.04459762573242, "global_step": 345305, "epoch": 2853} {"train_loss": -44.540870666503906, "global_step": 345306, "epoch": 2853} {"train_loss": -43.57493209838867, "global_step": 345307, "epoch": 2853} {"train_loss": -44.39532470703125, "global_step": 345308, "epoch": 2853} {"train_loss": -44.79246520996094, "global_step": 345309, "epoch": 2853} {"train_loss": -43.549373626708984, "global_step": 345310, "epoch": 2853} {"train_loss": -44.65501022338867, "global_step": 345311, "epoch": 2853} {"train_loss": -43.7866325378418, "global_step": 345312, "epoch": 2853} {"train_loss": -44.00774002075195, "global_step": 345313, "epoch": 2853} {"train_loss": -43.970191955566406, "global_step": 345314, "epoch": 2853} {"train_loss": -44.05355453491211, "global_step": 345315, "epoch": 2853} {"train_loss": -44.20296859741211, "global_step": 345316, "epoch": 2853} {"train_loss": -44.127803802490234, "global_step": 345317, "epoch": 2853} {"train_loss": -44.35242462158203, "global_step": 345318, "epoch": 2853} {"train_loss": -44.11793899536133, "global_step": 345319, "epoch": 2853} {"train_loss": -45.33644485473633, "global_step": 345320, "epoch": 2853} {"train_loss": -43.36104202270508, "global_step": 345321, "epoch": 2853} {"train_loss": -44.986297607421875, "global_step": 345322, "epoch": 2853} {"train_loss": -44.647769927978516, "global_step": 345323, "epoch": 2853} {"train_loss": -44.49077224731445, "global_step": 345324, "epoch": 2853} {"train_loss": -45.276973724365234, "global_step": 345325, "epoch": 2853} {"train_loss": -44.24993133544922, "global_step": 345326, "epoch": 2853} {"train_loss": -45.01947784423828, "global_step": 345327, "epoch": 2853} {"train_loss": -44.57497787475586, "global_step": 345328, "epoch": 2853} {"train_loss": -44.84141540527344, "global_step": 345329, "epoch": 2853} {"train_loss": -44.817073822021484, "global_step": 345330, "epoch": 2853} {"train_loss": -45.264381408691406, "global_step": 345331, "epoch": 2853} {"train_loss": -44.98904800415039, "global_step": 345332, "epoch": 2853} {"train_loss": -44.07510952910116, "global_step": 345333, "epoch": 2853, "val_loss": 2562767.75} {"train_loss": -45.45486068725586, "global_step": 345334, "epoch": 2854} {"train_loss": -45.21247482299805, "global_step": 345335, "epoch": 2854} {"train_loss": -45.41877365112305, "global_step": 345336, "epoch": 2854} {"train_loss": -45.13386917114258, "global_step": 345337, "epoch": 2854} {"train_loss": -45.377716064453125, "global_step": 345338, "epoch": 2854} {"train_loss": -45.6463508605957, "global_step": 345339, "epoch": 2854} {"train_loss": -45.421875, "global_step": 345340, "epoch": 2854} {"train_loss": -45.62805938720703, "global_step": 345341, "epoch": 2854} {"train_loss": -45.34843826293945, "global_step": 345342, "epoch": 2854} {"train_loss": -45.39907455444336, "global_step": 345343, "epoch": 2854} {"train_loss": -45.437965393066406, "global_step": 345344, "epoch": 2854} {"train_loss": -45.45608139038086, "global_step": 345345, "epoch": 2854} {"train_loss": -45.488861083984375, "global_step": 345346, "epoch": 2854} {"train_loss": -46.19499969482422, "global_step": 345347, "epoch": 2854} {"train_loss": -45.6108512878418, "global_step": 345348, "epoch": 2854} {"train_loss": -46.00824737548828, "global_step": 345349, "epoch": 2854} {"train_loss": -45.799739837646484, "global_step": 345350, "epoch": 2854} {"train_loss": -45.73407745361328, "global_step": 345351, "epoch": 2854} {"train_loss": -45.781314849853516, "global_step": 345352, "epoch": 2854} {"train_loss": -45.841129302978516, "global_step": 345353, "epoch": 2854} {"train_loss": -46.3756217956543, "global_step": 345354, "epoch": 2854} {"train_loss": -45.69303894042969, "global_step": 345355, "epoch": 2854} {"train_loss": -45.143089294433594, "global_step": 345356, "epoch": 2854} {"train_loss": -45.87986373901367, "global_step": 345357, "epoch": 2854} {"train_loss": -45.18158721923828, "global_step": 345358, "epoch": 2854} {"train_loss": -46.443634033203125, "global_step": 345359, "epoch": 2854} {"train_loss": -46.09543991088867, "global_step": 345360, "epoch": 2854} {"train_loss": -45.11365509033203, "global_step": 345361, "epoch": 2854} {"train_loss": -45.085845947265625, "global_step": 345362, "epoch": 2854} {"train_loss": -44.904747009277344, "global_step": 345363, "epoch": 2854} {"train_loss": -44.37091827392578, "global_step": 345364, "epoch": 2854} {"train_loss": -43.70211410522461, "global_step": 345365, "epoch": 2854} {"train_loss": -45.02090072631836, "global_step": 345366, "epoch": 2854} {"train_loss": -45.24909591674805, "global_step": 345367, "epoch": 2854} {"train_loss": -44.005523681640625, "global_step": 345368, "epoch": 2854} {"train_loss": -43.59554672241211, "global_step": 345369, "epoch": 2854} {"train_loss": -44.80831527709961, "global_step": 345370, "epoch": 2854} {"train_loss": -43.466854095458984, "global_step": 345371, "epoch": 2854} {"train_loss": -41.275184631347656, "global_step": 345372, "epoch": 2854} {"train_loss": -45.18303298950195, "global_step": 345373, "epoch": 2854} {"train_loss": -43.25413131713867, "global_step": 345374, "epoch": 2854} {"train_loss": -43.5326042175293, "global_step": 345375, "epoch": 2854} {"train_loss": -45.050594329833984, "global_step": 345376, "epoch": 2854} {"train_loss": -43.44289779663086, "global_step": 345377, "epoch": 2854} {"train_loss": -42.734249114990234, "global_step": 345378, "epoch": 2854} {"train_loss": -44.35420608520508, "global_step": 345379, "epoch": 2854} {"train_loss": -43.6265983581543, "global_step": 345380, "epoch": 2854} {"train_loss": -44.19844436645508, "global_step": 345381, "epoch": 2854} {"train_loss": -43.42615509033203, "global_step": 345382, "epoch": 2854} {"train_loss": -43.52864456176758, "global_step": 345383, "epoch": 2854} {"train_loss": -43.288414001464844, "global_step": 345384, "epoch": 2854} {"train_loss": -43.634735107421875, "global_step": 345385, "epoch": 2854} {"train_loss": -44.01642990112305, "global_step": 345386, "epoch": 2854} {"train_loss": -43.75706100463867, "global_step": 345387, "epoch": 2854} {"train_loss": -44.20848083496094, "global_step": 345388, "epoch": 2854} {"train_loss": -43.7957763671875, "global_step": 345389, "epoch": 2854} {"train_loss": -44.14752960205078, "global_step": 345390, "epoch": 2854} {"train_loss": -43.12812042236328, "global_step": 345391, "epoch": 2854} {"train_loss": -43.993812561035156, "global_step": 345392, "epoch": 2854} {"train_loss": -43.10679244995117, "global_step": 345393, "epoch": 2854} {"train_loss": -43.79322052001953, "global_step": 345394, "epoch": 2854} {"train_loss": -43.72682571411133, "global_step": 345395, "epoch": 2854} {"train_loss": -44.62425994873047, "global_step": 345396, "epoch": 2854} {"train_loss": -44.00430679321289, "global_step": 345397, "epoch": 2854} {"train_loss": -43.61863327026367, "global_step": 345398, "epoch": 2854} {"train_loss": -44.062164306640625, "global_step": 345399, "epoch": 2854} {"train_loss": -44.2929573059082, "global_step": 345400, "epoch": 2854} {"train_loss": -44.890628814697266, "global_step": 345401, "epoch": 2854} {"train_loss": -44.389892578125, "global_step": 345402, "epoch": 2854} {"train_loss": -43.83878707885742, "global_step": 345403, "epoch": 2854} {"train_loss": -43.829593658447266, "global_step": 345404, "epoch": 2854} {"train_loss": -44.57612991333008, "global_step": 345405, "epoch": 2854} {"train_loss": -43.92243576049805, "global_step": 345406, "epoch": 2854} {"train_loss": -42.97187042236328, "global_step": 345407, "epoch": 2854} {"train_loss": -42.42399215698242, "global_step": 345408, "epoch": 2854} {"train_loss": -43.88631057739258, "global_step": 345409, "epoch": 2854} {"train_loss": -42.29087448120117, "global_step": 345410, "epoch": 2854} {"train_loss": -42.21112823486328, "global_step": 345411, "epoch": 2854} {"train_loss": -44.036678314208984, "global_step": 345412, "epoch": 2854} {"train_loss": -44.740234375, "global_step": 345413, "epoch": 2854} {"train_loss": -44.44071960449219, "global_step": 345414, "epoch": 2854} {"train_loss": -44.106380462646484, "global_step": 345415, "epoch": 2854} {"train_loss": -44.79848861694336, "global_step": 345416, "epoch": 2854} {"train_loss": -44.31447982788086, "global_step": 345417, "epoch": 2854} {"train_loss": -44.501953125, "global_step": 345418, "epoch": 2854} {"train_loss": -44.4202766418457, "global_step": 345419, "epoch": 2854} {"train_loss": -45.0828742980957, "global_step": 345420, "epoch": 2854} {"train_loss": -43.392601013183594, "global_step": 345421, "epoch": 2854} {"train_loss": -43.0085334777832, "global_step": 345422, "epoch": 2854} {"train_loss": -45.0253791809082, "global_step": 345423, "epoch": 2854} {"train_loss": -44.1126823425293, "global_step": 345424, "epoch": 2854} {"train_loss": -41.773292541503906, "global_step": 345425, "epoch": 2854} {"train_loss": -44.994205474853516, "global_step": 345426, "epoch": 2854} {"train_loss": -45.06036376953125, "global_step": 345427, "epoch": 2854} {"train_loss": -44.96165084838867, "global_step": 345428, "epoch": 2854} {"train_loss": -44.916114807128906, "global_step": 345429, "epoch": 2854} {"train_loss": -43.924861907958984, "global_step": 345430, "epoch": 2854} {"train_loss": -44.319786071777344, "global_step": 345431, "epoch": 2854} {"train_loss": -44.95697784423828, "global_step": 345432, "epoch": 2854} {"train_loss": -43.207210540771484, "global_step": 345433, "epoch": 2854} {"train_loss": -44.280818939208984, "global_step": 345434, "epoch": 2854} {"train_loss": -44.24076843261719, "global_step": 345435, "epoch": 2854} {"train_loss": -44.303619384765625, "global_step": 345436, "epoch": 2854} {"train_loss": -45.15058517456055, "global_step": 345437, "epoch": 2854} {"train_loss": -44.6545524597168, "global_step": 345438, "epoch": 2854} {"train_loss": -45.102081298828125, "global_step": 345439, "epoch": 2854} {"train_loss": -44.40488815307617, "global_step": 345440, "epoch": 2854} {"train_loss": -44.56140899658203, "global_step": 345441, "epoch": 2854} {"train_loss": -45.046566009521484, "global_step": 345442, "epoch": 2854} {"train_loss": -44.879364013671875, "global_step": 345443, "epoch": 2854} {"train_loss": -44.70133590698242, "global_step": 345444, "epoch": 2854} {"train_loss": -45.43837356567383, "global_step": 345445, "epoch": 2854} {"train_loss": -45.381752014160156, "global_step": 345446, "epoch": 2854} {"train_loss": -44.4986686706543, "global_step": 345447, "epoch": 2854} {"train_loss": -45.41987991333008, "global_step": 345448, "epoch": 2854} {"train_loss": -45.17709732055664, "global_step": 345449, "epoch": 2854} {"train_loss": -45.53520584106445, "global_step": 345450, "epoch": 2854} {"train_loss": -45.11678695678711, "global_step": 345451, "epoch": 2854} {"train_loss": -45.2481575012207, "global_step": 345452, "epoch": 2854} {"train_loss": -46.05257034301758, "global_step": 345453, "epoch": 2854} {"train_loss": -44.524925421092135, "global_step": 345454, "epoch": 2854, "val_loss": 2594093.75} {"train_loss": -45.33492660522461, "global_step": 345455, "epoch": 2855} {"train_loss": -45.4324836730957, "global_step": 345456, "epoch": 2855} {"train_loss": -44.89205551147461, "global_step": 345457, "epoch": 2855} {"train_loss": -45.19503402709961, "global_step": 345458, "epoch": 2855} {"train_loss": -45.89498519897461, "global_step": 345459, "epoch": 2855} {"train_loss": -45.21474075317383, "global_step": 345460, "epoch": 2855} {"train_loss": -45.52927780151367, "global_step": 345461, "epoch": 2855} {"train_loss": -45.557254791259766, "global_step": 345462, "epoch": 2855} {"train_loss": -45.48486328125, "global_step": 345463, "epoch": 2855} {"train_loss": -44.809547424316406, "global_step": 345464, "epoch": 2855} {"train_loss": -45.91094970703125, "global_step": 345465, "epoch": 2855} {"train_loss": -45.508155822753906, "global_step": 345466, "epoch": 2855} {"train_loss": -45.6168327331543, "global_step": 345467, "epoch": 2855} {"train_loss": -45.377689361572266, "global_step": 345468, "epoch": 2855} {"train_loss": -45.36524200439453, "global_step": 345469, "epoch": 2855} {"train_loss": -45.331703186035156, "global_step": 345470, "epoch": 2855} {"train_loss": -45.389869689941406, "global_step": 345471, "epoch": 2855} {"train_loss": -45.154823303222656, "global_step": 345472, "epoch": 2855} {"train_loss": -45.62582015991211, "global_step": 345473, "epoch": 2855} {"train_loss": -45.90315628051758, "global_step": 345474, "epoch": 2855} {"train_loss": -44.36696243286133, "global_step": 345475, "epoch": 2855} {"train_loss": -45.58165740966797, "global_step": 345476, "epoch": 2855} {"train_loss": -45.06173324584961, "global_step": 345477, "epoch": 2855} {"train_loss": -45.53956985473633, "global_step": 345478, "epoch": 2855} {"train_loss": -45.01517105102539, "global_step": 345479, "epoch": 2855} {"train_loss": -44.420528411865234, "global_step": 345480, "epoch": 2855} {"train_loss": -43.71828079223633, "global_step": 345481, "epoch": 2855} {"train_loss": -45.34550857543945, "global_step": 345482, "epoch": 2855} {"train_loss": -45.5850715637207, "global_step": 345483, "epoch": 2855} {"train_loss": -44.86054611206055, "global_step": 345484, "epoch": 2855} {"train_loss": -45.460296630859375, "global_step": 345485, "epoch": 2855} {"train_loss": -44.933956146240234, "global_step": 345486, "epoch": 2855} {"train_loss": -43.65629196166992, "global_step": 345487, "epoch": 2855} {"train_loss": -44.99172592163086, "global_step": 345488, "epoch": 2855} {"train_loss": -44.909603118896484, "global_step": 345489, "epoch": 2855} {"train_loss": -43.5352668762207, "global_step": 345490, "epoch": 2855} {"train_loss": -43.97063064575195, "global_step": 345491, "epoch": 2855} {"train_loss": -44.61530303955078, "global_step": 345492, "epoch": 2855} {"train_loss": -43.3065185546875, "global_step": 345493, "epoch": 2855} {"train_loss": -43.40723419189453, "global_step": 345494, "epoch": 2855} {"train_loss": -44.11054229736328, "global_step": 345495, "epoch": 2855} {"train_loss": -42.897666931152344, "global_step": 345496, "epoch": 2855} {"train_loss": -44.38625717163086, "global_step": 345497, "epoch": 2855} {"train_loss": -43.39950180053711, "global_step": 345498, "epoch": 2855} {"train_loss": -41.84629440307617, "global_step": 345499, "epoch": 2855} {"train_loss": -43.81650924682617, "global_step": 345500, "epoch": 2855} {"train_loss": -43.53591537475586, "global_step": 345501, "epoch": 2855} {"train_loss": -43.9544792175293, "global_step": 345502, "epoch": 2855} {"train_loss": -44.301509857177734, "global_step": 345503, "epoch": 2855} {"train_loss": -44.12836837768555, "global_step": 345504, "epoch": 2855} {"train_loss": -44.26283264160156, "global_step": 345505, "epoch": 2855} {"train_loss": -44.0749626159668, "global_step": 345506, "epoch": 2855} {"train_loss": -44.67531967163086, "global_step": 345507, "epoch": 2855} {"train_loss": -44.15546417236328, "global_step": 345508, "epoch": 2855} {"train_loss": -43.869197845458984, "global_step": 345509, "epoch": 2855} {"train_loss": -45.07560348510742, "global_step": 345510, "epoch": 2855} {"train_loss": -44.61098861694336, "global_step": 345511, "epoch": 2855} {"train_loss": -45.17729568481445, "global_step": 345512, "epoch": 2855} {"train_loss": -43.81702423095703, "global_step": 345513, "epoch": 2855} {"train_loss": -43.970855712890625, "global_step": 345514, "epoch": 2855} {"train_loss": -44.742095947265625, "global_step": 345515, "epoch": 2855} {"train_loss": -44.281978607177734, "global_step": 345516, "epoch": 2855} {"train_loss": -45.11820602416992, "global_step": 345517, "epoch": 2855} {"train_loss": -44.659297943115234, "global_step": 345518, "epoch": 2855} {"train_loss": -44.61467361450195, "global_step": 345519, "epoch": 2855} {"train_loss": -45.33137893676758, "global_step": 345520, "epoch": 2855} {"train_loss": -44.830875396728516, "global_step": 345521, "epoch": 2855} {"train_loss": -43.68339920043945, "global_step": 345522, "epoch": 2855} {"train_loss": -44.32676315307617, "global_step": 345523, "epoch": 2855} {"train_loss": -45.186378479003906, "global_step": 345524, "epoch": 2855} {"train_loss": -45.0610466003418, "global_step": 345525, "epoch": 2855} {"train_loss": -44.83333969116211, "global_step": 345526, "epoch": 2855} {"train_loss": -44.40140914916992, "global_step": 345527, "epoch": 2855} {"train_loss": -44.91666793823242, "global_step": 345528, "epoch": 2855} {"train_loss": -45.44050216674805, "global_step": 345529, "epoch": 2855} {"train_loss": -45.58888626098633, "global_step": 345530, "epoch": 2855} {"train_loss": -45.33667755126953, "global_step": 345531, "epoch": 2855} {"train_loss": -45.26362228393555, "global_step": 345532, "epoch": 2855} {"train_loss": -45.2753791809082, "global_step": 345533, "epoch": 2855} {"train_loss": -40.52378463745117, "global_step": 345534, "epoch": 2855} {"train_loss": -44.959110260009766, "global_step": 345535, "epoch": 2855} {"train_loss": -44.286102294921875, "global_step": 345536, "epoch": 2855} {"train_loss": -45.486507415771484, "global_step": 345537, "epoch": 2855} {"train_loss": -44.66596603393555, "global_step": 345538, "epoch": 2855} {"train_loss": -32.703758239746094, "global_step": 345539, "epoch": 2855} {"train_loss": -44.0543212890625, "global_step": 345540, "epoch": 2855} {"train_loss": -42.28237533569336, "global_step": 345541, "epoch": 2855} {"train_loss": -44.100379943847656, "global_step": 345542, "epoch": 2855} {"train_loss": -41.92267990112305, "global_step": 345543, "epoch": 2855} {"train_loss": -35.35921859741211, "global_step": 345544, "epoch": 2855} {"train_loss": -42.11674499511719, "global_step": 345545, "epoch": 2855} {"train_loss": -41.74049758911133, "global_step": 345546, "epoch": 2855} {"train_loss": -42.57477951049805, "global_step": 345547, "epoch": 2855} {"train_loss": -33.879032135009766, "global_step": 345548, "epoch": 2855} {"train_loss": -36.67053985595703, "global_step": 345549, "epoch": 2855} {"train_loss": -41.3571662902832, "global_step": 345550, "epoch": 2855} {"train_loss": -33.12580490112305, "global_step": 345551, "epoch": 2855} {"train_loss": -42.066532135009766, "global_step": 345552, "epoch": 2855} {"train_loss": -35.96451950073242, "global_step": 345553, "epoch": 2855} {"train_loss": -41.59626007080078, "global_step": 345554, "epoch": 2855} {"train_loss": -36.8896598815918, "global_step": 345555, "epoch": 2855} {"train_loss": -40.929996490478516, "global_step": 345556, "epoch": 2855} {"train_loss": -34.64042282104492, "global_step": 345557, "epoch": 2855} {"train_loss": -40.021461486816406, "global_step": 345558, "epoch": 2855} {"train_loss": -41.92962646484375, "global_step": 345559, "epoch": 2855} {"train_loss": -39.90800094604492, "global_step": 345560, "epoch": 2855} {"train_loss": -39.68549728393555, "global_step": 345561, "epoch": 2855} {"train_loss": -42.21098709106445, "global_step": 345562, "epoch": 2855} {"train_loss": -42.01252365112305, "global_step": 345563, "epoch": 2855} {"train_loss": -41.95480728149414, "global_step": 345564, "epoch": 2855} {"train_loss": -42.160308837890625, "global_step": 345565, "epoch": 2855} {"train_loss": -40.0451774597168, "global_step": 345566, "epoch": 2855} {"train_loss": -42.88100051879883, "global_step": 345567, "epoch": 2855} {"train_loss": -41.54771423339844, "global_step": 345568, "epoch": 2855} {"train_loss": -41.84223175048828, "global_step": 345569, "epoch": 2855} {"train_loss": -41.98323440551758, "global_step": 345570, "epoch": 2855} {"train_loss": -42.849281311035156, "global_step": 345571, "epoch": 2855} {"train_loss": -43.23369216918945, "global_step": 345572, "epoch": 2855} {"train_loss": -41.764129638671875, "global_step": 345573, "epoch": 2855} {"train_loss": -42.59907150268555, "global_step": 345574, "epoch": 2855} {"train_loss": -43.38423150432997, "global_step": 345575, "epoch": 2855, "val_loss": 2584072.75} {"train_loss": -42.25822830200195, "global_step": 345576, "epoch": 2856} {"train_loss": -43.90925216674805, "global_step": 345577, "epoch": 2856} {"train_loss": -42.29425811767578, "global_step": 345578, "epoch": 2856} {"train_loss": -43.7833251953125, "global_step": 345579, "epoch": 2856} {"train_loss": -43.36882019042969, "global_step": 345580, "epoch": 2856} {"train_loss": -42.48527908325195, "global_step": 345581, "epoch": 2856} {"train_loss": -43.25834274291992, "global_step": 345582, "epoch": 2856} {"train_loss": -43.21799087524414, "global_step": 345583, "epoch": 2856} {"train_loss": -43.92070388793945, "global_step": 345584, "epoch": 2856} {"train_loss": -43.35500717163086, "global_step": 345585, "epoch": 2856} {"train_loss": -43.23810577392578, "global_step": 345586, "epoch": 2856} {"train_loss": -44.10322189331055, "global_step": 345587, "epoch": 2856} {"train_loss": -44.29970932006836, "global_step": 345588, "epoch": 2856} {"train_loss": -42.80022430419922, "global_step": 345589, "epoch": 2856} {"train_loss": -44.20783233642578, "global_step": 345590, "epoch": 2856} {"train_loss": -44.36488723754883, "global_step": 345591, "epoch": 2856} {"train_loss": -43.8156852722168, "global_step": 345592, "epoch": 2856} {"train_loss": -44.53145980834961, "global_step": 345593, "epoch": 2856} {"train_loss": -44.2135124206543, "global_step": 345594, "epoch": 2856} {"train_loss": -44.71104049682617, "global_step": 345595, "epoch": 2856} {"train_loss": -44.64622116088867, "global_step": 345596, "epoch": 2856} {"train_loss": -44.62211608886719, "global_step": 345597, "epoch": 2856} {"train_loss": -44.82997131347656, "global_step": 345598, "epoch": 2856} {"train_loss": -43.837303161621094, "global_step": 345599, "epoch": 2856} {"train_loss": -44.5704231262207, "global_step": 345600, "epoch": 2856} {"train_loss": -44.39860153198242, "global_step": 345601, "epoch": 2856} {"train_loss": -44.881099700927734, "global_step": 345602, "epoch": 2856} {"train_loss": -44.88724899291992, "global_step": 345603, "epoch": 2856} {"train_loss": -45.125667572021484, "global_step": 345604, "epoch": 2856} {"train_loss": -44.741798400878906, "global_step": 345605, "epoch": 2856} {"train_loss": -44.21428298950195, "global_step": 345606, "epoch": 2856} {"train_loss": -44.91659164428711, "global_step": 345607, "epoch": 2856} {"train_loss": -45.19086837768555, "global_step": 345608, "epoch": 2856} {"train_loss": -45.072200775146484, "global_step": 345609, "epoch": 2856} {"train_loss": -44.54383087158203, "global_step": 345610, "epoch": 2856} {"train_loss": -45.30720138549805, "global_step": 345611, "epoch": 2856} {"train_loss": -45.46918487548828, "global_step": 345612, "epoch": 2856} {"train_loss": -45.52875900268555, "global_step": 345613, "epoch": 2856} {"train_loss": -44.93576431274414, "global_step": 345614, "epoch": 2856} {"train_loss": -45.54710388183594, "global_step": 345615, "epoch": 2856} {"train_loss": -45.375274658203125, "global_step": 345616, "epoch": 2856} {"train_loss": -45.95224380493164, "global_step": 345617, "epoch": 2856} {"train_loss": -45.364501953125, "global_step": 345618, "epoch": 2856} {"train_loss": -45.43525314331055, "global_step": 345619, "epoch": 2856} {"train_loss": -45.54752731323242, "global_step": 345620, "epoch": 2856} {"train_loss": -44.678138732910156, "global_step": 345621, "epoch": 2856} {"train_loss": -44.95292282104492, "global_step": 345622, "epoch": 2856} {"train_loss": -45.64463806152344, "global_step": 345623, "epoch": 2856} {"train_loss": -45.82399368286133, "global_step": 345624, "epoch": 2856} {"train_loss": -45.735023498535156, "global_step": 345625, "epoch": 2856} {"train_loss": -45.63618087768555, "global_step": 345626, "epoch": 2856} {"train_loss": -44.78080368041992, "global_step": 345627, "epoch": 2856} {"train_loss": -45.52960968017578, "global_step": 345628, "epoch": 2856} {"train_loss": -45.89540481567383, "global_step": 345629, "epoch": 2856} {"train_loss": -45.31266403198242, "global_step": 345630, "epoch": 2856} {"train_loss": -45.950740814208984, "global_step": 345631, "epoch": 2856} {"train_loss": -45.98527145385742, "global_step": 345632, "epoch": 2856} {"train_loss": -45.231597900390625, "global_step": 345633, "epoch": 2856} {"train_loss": -45.38869857788086, "global_step": 345634, "epoch": 2856} {"train_loss": -46.03664779663086, "global_step": 345635, "epoch": 2856} {"train_loss": -45.34003829956055, "global_step": 345636, "epoch": 2856} {"train_loss": -45.10757064819336, "global_step": 345637, "epoch": 2856} {"train_loss": -45.24285125732422, "global_step": 345638, "epoch": 2856} {"train_loss": -45.121315002441406, "global_step": 345639, "epoch": 2856} {"train_loss": -44.934722900390625, "global_step": 345640, "epoch": 2856} {"train_loss": -45.462772369384766, "global_step": 345641, "epoch": 2856} {"train_loss": -44.83698654174805, "global_step": 345642, "epoch": 2856} {"train_loss": -45.307247161865234, "global_step": 345643, "epoch": 2856} {"train_loss": -45.312171936035156, "global_step": 345644, "epoch": 2856} {"train_loss": -44.094112396240234, "global_step": 345645, "epoch": 2856} {"train_loss": -42.3717041015625, "global_step": 345646, "epoch": 2856} {"train_loss": -43.25442123413086, "global_step": 345647, "epoch": 2856} {"train_loss": -40.45801544189453, "global_step": 345648, "epoch": 2856} {"train_loss": -42.376556396484375, "global_step": 345649, "epoch": 2856} {"train_loss": -43.93265914916992, "global_step": 345650, "epoch": 2856} {"train_loss": -42.23212814331055, "global_step": 345651, "epoch": 2856} {"train_loss": -43.278282165527344, "global_step": 345652, "epoch": 2856} {"train_loss": -42.37949752807617, "global_step": 345653, "epoch": 2856} {"train_loss": -43.06631088256836, "global_step": 345654, "epoch": 2856} {"train_loss": -44.90634536743164, "global_step": 345655, "epoch": 2856} {"train_loss": -43.99892044067383, "global_step": 345656, "epoch": 2856} {"train_loss": -44.37273025512695, "global_step": 345657, "epoch": 2856} {"train_loss": -44.234928131103516, "global_step": 345658, "epoch": 2856} {"train_loss": -44.789466857910156, "global_step": 345659, "epoch": 2856} {"train_loss": -44.6069221496582, "global_step": 345660, "epoch": 2856} {"train_loss": -44.44292068481445, "global_step": 345661, "epoch": 2856} {"train_loss": -44.401206970214844, "global_step": 345662, "epoch": 2856} {"train_loss": -44.24769973754883, "global_step": 345663, "epoch": 2856} {"train_loss": -45.20978546142578, "global_step": 345664, "epoch": 2856} {"train_loss": -44.549285888671875, "global_step": 345665, "epoch": 2856} {"train_loss": -45.193721771240234, "global_step": 345666, "epoch": 2856} {"train_loss": -45.47536849975586, "global_step": 345667, "epoch": 2856} {"train_loss": -44.95962142944336, "global_step": 345668, "epoch": 2856} {"train_loss": -44.02608108520508, "global_step": 345669, "epoch": 2856} {"train_loss": -44.5411262512207, "global_step": 345670, "epoch": 2856} {"train_loss": -45.53883743286133, "global_step": 345671, "epoch": 2856} {"train_loss": -44.46846389770508, "global_step": 345672, "epoch": 2856} {"train_loss": -44.40908432006836, "global_step": 345673, "epoch": 2856} {"train_loss": -44.3083610534668, "global_step": 345674, "epoch": 2856} {"train_loss": -44.3177375793457, "global_step": 345675, "epoch": 2856} {"train_loss": -43.73690414428711, "global_step": 345676, "epoch": 2856} {"train_loss": -43.9287109375, "global_step": 345677, "epoch": 2856} {"train_loss": -44.3924674987793, "global_step": 345678, "epoch": 2856} {"train_loss": -44.6999397277832, "global_step": 345679, "epoch": 2856} {"train_loss": -43.725608825683594, "global_step": 345680, "epoch": 2856} {"train_loss": -44.722625732421875, "global_step": 345681, "epoch": 2856} {"train_loss": -43.929054260253906, "global_step": 345682, "epoch": 2856} {"train_loss": -43.7242546081543, "global_step": 345683, "epoch": 2856} {"train_loss": -44.06667709350586, "global_step": 345684, "epoch": 2856} {"train_loss": -43.05186462402344, "global_step": 345685, "epoch": 2856} {"train_loss": -43.4033317565918, "global_step": 345686, "epoch": 2856} {"train_loss": -43.7718620300293, "global_step": 345687, "epoch": 2856} {"train_loss": -42.717132568359375, "global_step": 345688, "epoch": 2856} {"train_loss": -43.351192474365234, "global_step": 345689, "epoch": 2856} {"train_loss": -44.794105529785156, "global_step": 345690, "epoch": 2856} {"train_loss": -43.20022201538086, "global_step": 345691, "epoch": 2856} {"train_loss": -43.816864013671875, "global_step": 345692, "epoch": 2856} {"train_loss": -44.26575469970703, "global_step": 345693, "epoch": 2856} {"train_loss": -41.876190185546875, "global_step": 345694, "epoch": 2856} {"train_loss": -43.91359329223633, "global_step": 345695, "epoch": 2856} {"train_loss": -44.38436032129713, "global_step": 345696, "epoch": 2856, "val_loss": 2577145.0} {"train_loss": -43.971466064453125, "global_step": 345697, "epoch": 2857} {"train_loss": -43.8258171081543, "global_step": 345698, "epoch": 2857} {"train_loss": -42.56452178955078, "global_step": 345699, "epoch": 2857} {"train_loss": -43.97749328613281, "global_step": 345700, "epoch": 2857} {"train_loss": -43.12546920776367, "global_step": 345701, "epoch": 2857} {"train_loss": -43.48460388183594, "global_step": 345702, "epoch": 2857} {"train_loss": -43.383846282958984, "global_step": 345703, "epoch": 2857} {"train_loss": -43.62004852294922, "global_step": 345704, "epoch": 2857} {"train_loss": -41.40876388549805, "global_step": 345705, "epoch": 2857} {"train_loss": -44.294647216796875, "global_step": 345706, "epoch": 2857} {"train_loss": -41.254329681396484, "global_step": 345707, "epoch": 2857} {"train_loss": -43.70322799682617, "global_step": 345708, "epoch": 2857} {"train_loss": -40.886024475097656, "global_step": 345709, "epoch": 2857} {"train_loss": -44.58684539794922, "global_step": 345710, "epoch": 2857} {"train_loss": -42.101226806640625, "global_step": 345711, "epoch": 2857} {"train_loss": -44.5057487487793, "global_step": 345712, "epoch": 2857} {"train_loss": -43.097145080566406, "global_step": 345713, "epoch": 2857} {"train_loss": -44.177974700927734, "global_step": 345714, "epoch": 2857} {"train_loss": -42.509368896484375, "global_step": 345715, "epoch": 2857} {"train_loss": -44.34163284301758, "global_step": 345716, "epoch": 2857} {"train_loss": -43.23655319213867, "global_step": 345717, "epoch": 2857} {"train_loss": -43.79903030395508, "global_step": 345718, "epoch": 2857} {"train_loss": -43.87160110473633, "global_step": 345719, "epoch": 2857} {"train_loss": -43.76115036010742, "global_step": 345720, "epoch": 2857} {"train_loss": -44.003353118896484, "global_step": 345721, "epoch": 2857} {"train_loss": -44.39982223510742, "global_step": 345722, "epoch": 2857} {"train_loss": -44.26945877075195, "global_step": 345723, "epoch": 2857} {"train_loss": -43.68679428100586, "global_step": 345724, "epoch": 2857} {"train_loss": -45.004638671875, "global_step": 345725, "epoch": 2857} {"train_loss": -43.6336784362793, "global_step": 345726, "epoch": 2857} {"train_loss": -44.155128479003906, "global_step": 345727, "epoch": 2857} {"train_loss": -44.38108444213867, "global_step": 345728, "epoch": 2857} {"train_loss": -44.678680419921875, "global_step": 345729, "epoch": 2857} {"train_loss": -44.319149017333984, "global_step": 345730, "epoch": 2857} {"train_loss": -45.267242431640625, "global_step": 345731, "epoch": 2857} {"train_loss": -44.610511779785156, "global_step": 345732, "epoch": 2857} {"train_loss": -44.9778938293457, "global_step": 345733, "epoch": 2857} {"train_loss": -44.78388977050781, "global_step": 345734, "epoch": 2857} {"train_loss": -45.007320404052734, "global_step": 345735, "epoch": 2857} {"train_loss": -44.796199798583984, "global_step": 345736, "epoch": 2857} {"train_loss": -44.35468673706055, "global_step": 345737, "epoch": 2857} {"train_loss": -44.85932159423828, "global_step": 345738, "epoch": 2857} {"train_loss": -44.8315315246582, "global_step": 345739, "epoch": 2857} {"train_loss": -44.6455192565918, "global_step": 345740, "epoch": 2857} {"train_loss": -45.05772018432617, "global_step": 345741, "epoch": 2857} {"train_loss": -44.230751037597656, "global_step": 345742, "epoch": 2857} {"train_loss": -45.55485916137695, "global_step": 345743, "epoch": 2857} {"train_loss": -44.51465606689453, "global_step": 345744, "epoch": 2857} {"train_loss": -44.834651947021484, "global_step": 345745, "epoch": 2857} {"train_loss": -45.17496871948242, "global_step": 345746, "epoch": 2857} {"train_loss": -45.2894401550293, "global_step": 345747, "epoch": 2857} {"train_loss": -44.98383712768555, "global_step": 345748, "epoch": 2857} {"train_loss": -45.15337371826172, "global_step": 345749, "epoch": 2857} {"train_loss": -45.35314178466797, "global_step": 345750, "epoch": 2857} {"train_loss": -45.3315315246582, "global_step": 345751, "epoch": 2857} {"train_loss": -44.340797424316406, "global_step": 345752, "epoch": 2857} {"train_loss": -45.24994659423828, "global_step": 345753, "epoch": 2857} {"train_loss": -44.94202423095703, "global_step": 345754, "epoch": 2857} {"train_loss": -45.11445236206055, "global_step": 345755, "epoch": 2857} {"train_loss": -45.48057174682617, "global_step": 345756, "epoch": 2857} {"train_loss": -44.680633544921875, "global_step": 345757, "epoch": 2857} {"train_loss": -44.95518112182617, "global_step": 345758, "epoch": 2857} {"train_loss": -44.62030029296875, "global_step": 345759, "epoch": 2857} {"train_loss": -45.0653076171875, "global_step": 345760, "epoch": 2857} {"train_loss": -45.13349533081055, "global_step": 345761, "epoch": 2857} {"train_loss": -44.50508117675781, "global_step": 345762, "epoch": 2857} {"train_loss": -44.6489372253418, "global_step": 345763, "epoch": 2857} {"train_loss": -44.899864196777344, "global_step": 345764, "epoch": 2857} {"train_loss": -45.033138275146484, "global_step": 345765, "epoch": 2857} {"train_loss": -45.0272216796875, "global_step": 345766, "epoch": 2857} {"train_loss": -42.63405227661133, "global_step": 345767, "epoch": 2857} {"train_loss": -43.09053421020508, "global_step": 345768, "epoch": 2857} {"train_loss": -44.123199462890625, "global_step": 345769, "epoch": 2857} {"train_loss": -44.476043701171875, "global_step": 345770, "epoch": 2857} {"train_loss": -44.09113311767578, "global_step": 345771, "epoch": 2857} {"train_loss": -39.4273796081543, "global_step": 345772, "epoch": 2857} {"train_loss": -44.523101806640625, "global_step": 345773, "epoch": 2857} {"train_loss": -44.070674896240234, "global_step": 345774, "epoch": 2857} {"train_loss": -45.02053451538086, "global_step": 345775, "epoch": 2857} {"train_loss": -42.85172653198242, "global_step": 345776, "epoch": 2857} {"train_loss": -43.990718841552734, "global_step": 345777, "epoch": 2857} {"train_loss": -40.50510787963867, "global_step": 345778, "epoch": 2857} {"train_loss": -44.15645980834961, "global_step": 345779, "epoch": 2857} {"train_loss": -40.3253288269043, "global_step": 345780, "epoch": 2857} {"train_loss": -44.388221740722656, "global_step": 345781, "epoch": 2857} {"train_loss": -42.27883529663086, "global_step": 345782, "epoch": 2857} {"train_loss": -38.59444046020508, "global_step": 345783, "epoch": 2857} {"train_loss": -41.68532943725586, "global_step": 345784, "epoch": 2857} {"train_loss": -43.99995803833008, "global_step": 345785, "epoch": 2857} {"train_loss": -42.1528205871582, "global_step": 345786, "epoch": 2857} {"train_loss": -41.28581619262695, "global_step": 345787, "epoch": 2857} {"train_loss": -42.218875885009766, "global_step": 345788, "epoch": 2857} {"train_loss": -39.49821853637695, "global_step": 345789, "epoch": 2857} {"train_loss": -39.44710922241211, "global_step": 345790, "epoch": 2857} {"train_loss": -42.85795211791992, "global_step": 345791, "epoch": 2857} {"train_loss": -40.2742805480957, "global_step": 345792, "epoch": 2857} {"train_loss": -42.822086334228516, "global_step": 345793, "epoch": 2857} {"train_loss": -40.91912841796875, "global_step": 345794, "epoch": 2857} {"train_loss": -39.6231803894043, "global_step": 345795, "epoch": 2857} {"train_loss": -43.45425796508789, "global_step": 345796, "epoch": 2857} {"train_loss": -40.11254119873047, "global_step": 345797, "epoch": 2857} {"train_loss": -42.70524978637695, "global_step": 345798, "epoch": 2857} {"train_loss": -41.13291549682617, "global_step": 345799, "epoch": 2857} {"train_loss": -42.09212875366211, "global_step": 345800, "epoch": 2857} {"train_loss": -43.3400993347168, "global_step": 345801, "epoch": 2857} {"train_loss": -43.9656867980957, "global_step": 345802, "epoch": 2857} {"train_loss": -42.95917510986328, "global_step": 345803, "epoch": 2857} {"train_loss": -42.28203201293945, "global_step": 345804, "epoch": 2857} {"train_loss": -43.3155632019043, "global_step": 345805, "epoch": 2857} {"train_loss": -43.5117301940918, "global_step": 345806, "epoch": 2857} {"train_loss": -42.273948669433594, "global_step": 345807, "epoch": 2857} {"train_loss": -42.72925567626953, "global_step": 345808, "epoch": 2857} {"train_loss": -43.89985275268555, "global_step": 345809, "epoch": 2857} {"train_loss": -44.36945343017578, "global_step": 345810, "epoch": 2857} {"train_loss": -44.497745513916016, "global_step": 345811, "epoch": 2857} {"train_loss": -41.68555450439453, "global_step": 345812, "epoch": 2857} {"train_loss": -43.85602569580078, "global_step": 345813, "epoch": 2857} {"train_loss": -44.34815979003906, "global_step": 345814, "epoch": 2857} {"train_loss": -44.426815032958984, "global_step": 345815, "epoch": 2857} {"train_loss": -43.814056396484375, "global_step": 345816, "epoch": 2857} {"train_loss": -43.572713552427686, "global_step": 345817, "epoch": 2857, "val_loss": 2755170.75} {"train_loss": -44.6198844909668, "global_step": 345818, "epoch": 2858} {"train_loss": -44.22196578979492, "global_step": 345819, "epoch": 2858} {"train_loss": -44.46622848510742, "global_step": 345820, "epoch": 2858} {"train_loss": -44.88917541503906, "global_step": 345821, "epoch": 2858} {"train_loss": -43.4273796081543, "global_step": 345822, "epoch": 2858} {"train_loss": -43.814449310302734, "global_step": 345823, "epoch": 2858} {"train_loss": -44.501251220703125, "global_step": 345824, "epoch": 2858} {"train_loss": -43.20155715942383, "global_step": 345825, "epoch": 2858} {"train_loss": -44.91733932495117, "global_step": 345826, "epoch": 2858} {"train_loss": -43.47294616699219, "global_step": 345827, "epoch": 2858} {"train_loss": -44.733680725097656, "global_step": 345828, "epoch": 2858} {"train_loss": -44.44783401489258, "global_step": 345829, "epoch": 2858} {"train_loss": -43.69300842285156, "global_step": 345830, "epoch": 2858} {"train_loss": -44.642574310302734, "global_step": 345831, "epoch": 2858} {"train_loss": -44.55560302734375, "global_step": 345832, "epoch": 2858} {"train_loss": -43.60456466674805, "global_step": 345833, "epoch": 2858} {"train_loss": -44.059200286865234, "global_step": 345834, "epoch": 2858} {"train_loss": -43.639915466308594, "global_step": 345835, "epoch": 2858} {"train_loss": -44.72185134887695, "global_step": 345836, "epoch": 2858} {"train_loss": -44.16946029663086, "global_step": 345837, "epoch": 2858} {"train_loss": -44.66480255126953, "global_step": 345838, "epoch": 2858} {"train_loss": -44.61808395385742, "global_step": 345839, "epoch": 2858} {"train_loss": -45.44968795776367, "global_step": 345840, "epoch": 2858} {"train_loss": -43.81888961791992, "global_step": 345841, "epoch": 2858} {"train_loss": -44.0958137512207, "global_step": 345842, "epoch": 2858} {"train_loss": -45.05400466918945, "global_step": 345843, "epoch": 2858} {"train_loss": -45.31283187866211, "global_step": 345844, "epoch": 2858} {"train_loss": -45.012298583984375, "global_step": 345845, "epoch": 2858} {"train_loss": -45.108314514160156, "global_step": 345846, "epoch": 2858} {"train_loss": -44.40050506591797, "global_step": 345847, "epoch": 2858} {"train_loss": -45.12067794799805, "global_step": 345848, "epoch": 2858} {"train_loss": -44.95552444458008, "global_step": 345849, "epoch": 2858} {"train_loss": -44.8751220703125, "global_step": 345850, "epoch": 2858} {"train_loss": -44.792236328125, "global_step": 345851, "epoch": 2858} {"train_loss": -44.7236328125, "global_step": 345852, "epoch": 2858} {"train_loss": -44.483184814453125, "global_step": 345853, "epoch": 2858} {"train_loss": -45.29923629760742, "global_step": 345854, "epoch": 2858} {"train_loss": -44.749786376953125, "global_step": 345855, "epoch": 2858} {"train_loss": -44.814083099365234, "global_step": 345856, "epoch": 2858} {"train_loss": -45.13827133178711, "global_step": 345857, "epoch": 2858} {"train_loss": -44.96745681762695, "global_step": 345858, "epoch": 2858} {"train_loss": -44.25717544555664, "global_step": 345859, "epoch": 2858} {"train_loss": -44.09943771362305, "global_step": 345860, "epoch": 2858} {"train_loss": -44.327125549316406, "global_step": 345861, "epoch": 2858} {"train_loss": -43.7919921875, "global_step": 345862, "epoch": 2858} {"train_loss": -44.95327377319336, "global_step": 345863, "epoch": 2858} {"train_loss": -44.5012321472168, "global_step": 345864, "epoch": 2858} {"train_loss": -42.5477409362793, "global_step": 345865, "epoch": 2858} {"train_loss": -42.51310348510742, "global_step": 345866, "epoch": 2858} {"train_loss": -43.604679107666016, "global_step": 345867, "epoch": 2858} {"train_loss": -45.028568267822266, "global_step": 345868, "epoch": 2858} {"train_loss": -43.504329681396484, "global_step": 345869, "epoch": 2858} {"train_loss": -44.73800277709961, "global_step": 345870, "epoch": 2858} {"train_loss": -44.91042709350586, "global_step": 345871, "epoch": 2858} {"train_loss": -44.45565414428711, "global_step": 345872, "epoch": 2858} {"train_loss": -44.61906051635742, "global_step": 345873, "epoch": 2858} {"train_loss": -44.98372268676758, "global_step": 345874, "epoch": 2858} {"train_loss": -44.80678939819336, "global_step": 345875, "epoch": 2858} {"train_loss": -44.84645462036133, "global_step": 345876, "epoch": 2858} {"train_loss": -44.31391525268555, "global_step": 345877, "epoch": 2858} {"train_loss": -45.067405700683594, "global_step": 345878, "epoch": 2858} {"train_loss": -44.14255905151367, "global_step": 345879, "epoch": 2858} {"train_loss": -44.4887580871582, "global_step": 345880, "epoch": 2858} {"train_loss": -45.06639862060547, "global_step": 345881, "epoch": 2858} {"train_loss": -43.74629592895508, "global_step": 345882, "epoch": 2858} {"train_loss": -44.5844841003418, "global_step": 345883, "epoch": 2858} {"train_loss": -44.604488372802734, "global_step": 345884, "epoch": 2858} {"train_loss": -42.962852478027344, "global_step": 345885, "epoch": 2858} {"train_loss": -44.44097900390625, "global_step": 345886, "epoch": 2858} {"train_loss": -45.342830657958984, "global_step": 345887, "epoch": 2858} {"train_loss": -43.830543518066406, "global_step": 345888, "epoch": 2858} {"train_loss": -44.50460433959961, "global_step": 345889, "epoch": 2858} {"train_loss": -44.789119720458984, "global_step": 345890, "epoch": 2858} {"train_loss": -44.502357482910156, "global_step": 345891, "epoch": 2858} {"train_loss": -44.387229919433594, "global_step": 345892, "epoch": 2858} {"train_loss": -44.13420867919922, "global_step": 345893, "epoch": 2858} {"train_loss": -44.424774169921875, "global_step": 345894, "epoch": 2858} {"train_loss": -44.00261306762695, "global_step": 345895, "epoch": 2858} {"train_loss": -44.16902542114258, "global_step": 345896, "epoch": 2858} {"train_loss": -45.51212692260742, "global_step": 345897, "epoch": 2858} {"train_loss": -44.877098083496094, "global_step": 345898, "epoch": 2858} {"train_loss": -44.79802322387695, "global_step": 345899, "epoch": 2858} {"train_loss": -44.743892669677734, "global_step": 345900, "epoch": 2858} {"train_loss": -45.194068908691406, "global_step": 345901, "epoch": 2858} {"train_loss": -44.63764190673828, "global_step": 345902, "epoch": 2858} {"train_loss": -44.86143112182617, "global_step": 345903, "epoch": 2858} {"train_loss": -44.83880615234375, "global_step": 345904, "epoch": 2858} {"train_loss": -44.68258285522461, "global_step": 345905, "epoch": 2858} {"train_loss": -44.65601348876953, "global_step": 345906, "epoch": 2858} {"train_loss": -45.14310836791992, "global_step": 345907, "epoch": 2858} {"train_loss": -44.5889778137207, "global_step": 345908, "epoch": 2858} {"train_loss": -44.501014709472656, "global_step": 345909, "epoch": 2858} {"train_loss": -44.341575622558594, "global_step": 345910, "epoch": 2858} {"train_loss": -45.52510070800781, "global_step": 345911, "epoch": 2858} {"train_loss": -45.076171875, "global_step": 345912, "epoch": 2858} {"train_loss": -45.31535720825195, "global_step": 345913, "epoch": 2858} {"train_loss": -45.35126876831055, "global_step": 345914, "epoch": 2858} {"train_loss": -44.011653900146484, "global_step": 345915, "epoch": 2858} {"train_loss": -44.44099807739258, "global_step": 345916, "epoch": 2858} {"train_loss": -45.42987823486328, "global_step": 345917, "epoch": 2858} {"train_loss": -45.246070861816406, "global_step": 345918, "epoch": 2858} {"train_loss": -45.081809997558594, "global_step": 345919, "epoch": 2858} {"train_loss": -44.83466339111328, "global_step": 345920, "epoch": 2858} {"train_loss": -45.04132843017578, "global_step": 345921, "epoch": 2858} {"train_loss": -45.3222541809082, "global_step": 345922, "epoch": 2858} {"train_loss": -44.566375732421875, "global_step": 345923, "epoch": 2858} {"train_loss": -44.221927642822266, "global_step": 345924, "epoch": 2858} {"train_loss": -42.61184310913086, "global_step": 345925, "epoch": 2858} {"train_loss": -44.27849197387695, "global_step": 345926, "epoch": 2858} {"train_loss": -45.5012321472168, "global_step": 345927, "epoch": 2858} {"train_loss": -44.37257385253906, "global_step": 345928, "epoch": 2858} {"train_loss": -39.92214584350586, "global_step": 345929, "epoch": 2858} {"train_loss": -43.336585998535156, "global_step": 345930, "epoch": 2858} {"train_loss": -34.87363815307617, "global_step": 345931, "epoch": 2858} {"train_loss": -33.98160934448242, "global_step": 345932, "epoch": 2858} {"train_loss": -40.21942138671875, "global_step": 345933, "epoch": 2858} {"train_loss": -38.51504135131836, "global_step": 345934, "epoch": 2858} {"train_loss": -34.74028778076172, "global_step": 345935, "epoch": 2858} {"train_loss": -38.27359390258789, "global_step": 345936, "epoch": 2858} {"train_loss": -37.62765121459961, "global_step": 345937, "epoch": 2858} {"train_loss": -43.988034681840375, "global_step": 345938, "epoch": 2858, "val_loss": 2540611.0} {"train_loss": -38.376163482666016, "global_step": 345939, "epoch": 2859} {"train_loss": -37.49928283691406, "global_step": 345940, "epoch": 2859} {"train_loss": -37.89337158203125, "global_step": 345941, "epoch": 2859} {"train_loss": -37.90981674194336, "global_step": 345942, "epoch": 2859} {"train_loss": -39.29063034057617, "global_step": 345943, "epoch": 2859} {"train_loss": -39.24392318725586, "global_step": 345944, "epoch": 2859} {"train_loss": -39.54916000366211, "global_step": 345945, "epoch": 2859} {"train_loss": -39.543609619140625, "global_step": 345946, "epoch": 2859} {"train_loss": -40.93650436401367, "global_step": 345947, "epoch": 2859} {"train_loss": -41.601402282714844, "global_step": 345948, "epoch": 2859} {"train_loss": -41.5961799621582, "global_step": 345949, "epoch": 2859} {"train_loss": -41.915870666503906, "global_step": 345950, "epoch": 2859} {"train_loss": -40.355979919433594, "global_step": 345951, "epoch": 2859} {"train_loss": -42.729427337646484, "global_step": 345952, "epoch": 2859} {"train_loss": -41.901466369628906, "global_step": 345953, "epoch": 2859} {"train_loss": -43.48891830444336, "global_step": 345954, "epoch": 2859} {"train_loss": -42.642879486083984, "global_step": 345955, "epoch": 2859} {"train_loss": -43.408138275146484, "global_step": 345956, "epoch": 2859} {"train_loss": -43.1258430480957, "global_step": 345957, "epoch": 2859} {"train_loss": -42.16646957397461, "global_step": 345958, "epoch": 2859} {"train_loss": -42.90864562988281, "global_step": 345959, "epoch": 2859} {"train_loss": -42.878692626953125, "global_step": 345960, "epoch": 2859} {"train_loss": -43.88978958129883, "global_step": 345961, "epoch": 2859} {"train_loss": -43.30691909790039, "global_step": 345962, "epoch": 2859} {"train_loss": -44.15884017944336, "global_step": 345963, "epoch": 2859} {"train_loss": -43.729557037353516, "global_step": 345964, "epoch": 2859} {"train_loss": -43.80672836303711, "global_step": 345965, "epoch": 2859} {"train_loss": -44.4040412902832, "global_step": 345966, "epoch": 2859} {"train_loss": -43.50995635986328, "global_step": 345967, "epoch": 2859} {"train_loss": -44.351505279541016, "global_step": 345968, "epoch": 2859} {"train_loss": -42.760353088378906, "global_step": 345969, "epoch": 2859} {"train_loss": -44.28762435913086, "global_step": 345970, "epoch": 2859} {"train_loss": -43.57050323486328, "global_step": 345971, "epoch": 2859} {"train_loss": -43.69584274291992, "global_step": 345972, "epoch": 2859} {"train_loss": -44.06940460205078, "global_step": 345973, "epoch": 2859} {"train_loss": -42.96590805053711, "global_step": 345974, "epoch": 2859} {"train_loss": -45.08364486694336, "global_step": 345975, "epoch": 2859} {"train_loss": -43.15260314941406, "global_step": 345976, "epoch": 2859} {"train_loss": -43.411651611328125, "global_step": 345977, "epoch": 2859} {"train_loss": -44.484580993652344, "global_step": 345978, "epoch": 2859} {"train_loss": -44.1280403137207, "global_step": 345979, "epoch": 2859} {"train_loss": -44.673683166503906, "global_step": 345980, "epoch": 2859} {"train_loss": -43.585994720458984, "global_step": 345981, "epoch": 2859} {"train_loss": -44.8154296875, "global_step": 345982, "epoch": 2859} {"train_loss": -43.97642135620117, "global_step": 345983, "epoch": 2859} {"train_loss": -44.275047302246094, "global_step": 345984, "epoch": 2859} {"train_loss": -44.75764083862305, "global_step": 345985, "epoch": 2859} {"train_loss": -44.65256881713867, "global_step": 345986, "epoch": 2859} {"train_loss": -44.65478515625, "global_step": 345987, "epoch": 2859} {"train_loss": -44.446712493896484, "global_step": 345988, "epoch": 2859} {"train_loss": -44.9358024597168, "global_step": 345989, "epoch": 2859} {"train_loss": -44.746395111083984, "global_step": 345990, "epoch": 2859} {"train_loss": -44.34064865112305, "global_step": 345991, "epoch": 2859} {"train_loss": -45.2380256652832, "global_step": 345992, "epoch": 2859} {"train_loss": -45.11573791503906, "global_step": 345993, "epoch": 2859} {"train_loss": -44.830177307128906, "global_step": 345994, "epoch": 2859} {"train_loss": -44.78737258911133, "global_step": 345995, "epoch": 2859} {"train_loss": -45.04197311401367, "global_step": 345996, "epoch": 2859} {"train_loss": -44.720184326171875, "global_step": 345997, "epoch": 2859} {"train_loss": -45.159297943115234, "global_step": 345998, "epoch": 2859} {"train_loss": -44.14935302734375, "global_step": 345999, "epoch": 2859} {"train_loss": -45.334938049316406, "global_step": 346000, "epoch": 2859} {"train_loss": -45.629791259765625, "global_step": 346001, "epoch": 2859} {"train_loss": -45.264366149902344, "global_step": 346002, "epoch": 2859} {"train_loss": -44.75688552856445, "global_step": 346003, "epoch": 2859} {"train_loss": -44.89467239379883, "global_step": 346004, "epoch": 2859} {"train_loss": -44.53924560546875, "global_step": 346005, "epoch": 2859} {"train_loss": -45.41816329956055, "global_step": 346006, "epoch": 2859} {"train_loss": -45.62215042114258, "global_step": 346007, "epoch": 2859} {"train_loss": -45.94197082519531, "global_step": 346008, "epoch": 2859} {"train_loss": -44.99384307861328, "global_step": 346009, "epoch": 2859} {"train_loss": -44.54666519165039, "global_step": 346010, "epoch": 2859} {"train_loss": -45.19902801513672, "global_step": 346011, "epoch": 2859} {"train_loss": -45.41475296020508, "global_step": 346012, "epoch": 2859} {"train_loss": -44.85960006713867, "global_step": 346013, "epoch": 2859} {"train_loss": -44.61396789550781, "global_step": 346014, "epoch": 2859} {"train_loss": -44.98747634887695, "global_step": 346015, "epoch": 2859} {"train_loss": -45.33779525756836, "global_step": 346016, "epoch": 2859} {"train_loss": -44.69397735595703, "global_step": 346017, "epoch": 2859} {"train_loss": -44.7530517578125, "global_step": 346018, "epoch": 2859} {"train_loss": -44.98885726928711, "global_step": 346019, "epoch": 2859} {"train_loss": -45.371158599853516, "global_step": 346020, "epoch": 2859} {"train_loss": -44.82515335083008, "global_step": 346021, "epoch": 2859} {"train_loss": -45.07897186279297, "global_step": 346022, "epoch": 2859} {"train_loss": -45.11837387084961, "global_step": 346023, "epoch": 2859} {"train_loss": -45.78829574584961, "global_step": 346024, "epoch": 2859} {"train_loss": -43.585479736328125, "global_step": 346025, "epoch": 2859} {"train_loss": -42.778907775878906, "global_step": 346026, "epoch": 2859} {"train_loss": -42.614891052246094, "global_step": 346027, "epoch": 2859} {"train_loss": -44.614532470703125, "global_step": 346028, "epoch": 2859} {"train_loss": -44.430084228515625, "global_step": 346029, "epoch": 2859} {"train_loss": -42.03662872314453, "global_step": 346030, "epoch": 2859} {"train_loss": -41.77105712890625, "global_step": 346031, "epoch": 2859} {"train_loss": -43.40748596191406, "global_step": 346032, "epoch": 2859} {"train_loss": -41.95335388183594, "global_step": 346033, "epoch": 2859} {"train_loss": -44.31025314331055, "global_step": 346034, "epoch": 2859} {"train_loss": -43.55908966064453, "global_step": 346035, "epoch": 2859} {"train_loss": -44.19898223876953, "global_step": 346036, "epoch": 2859} {"train_loss": -44.13703536987305, "global_step": 346037, "epoch": 2859} {"train_loss": -44.01350021362305, "global_step": 346038, "epoch": 2859} {"train_loss": -44.427101135253906, "global_step": 346039, "epoch": 2859} {"train_loss": -45.167030334472656, "global_step": 346040, "epoch": 2859} {"train_loss": -44.3800163269043, "global_step": 346041, "epoch": 2859} {"train_loss": -43.79423141479492, "global_step": 346042, "epoch": 2859} {"train_loss": -44.18696212768555, "global_step": 346043, "epoch": 2859} {"train_loss": -44.42966842651367, "global_step": 346044, "epoch": 2859} {"train_loss": -44.530704498291016, "global_step": 346045, "epoch": 2859} {"train_loss": -44.496097564697266, "global_step": 346046, "epoch": 2859} {"train_loss": -44.771705627441406, "global_step": 346047, "epoch": 2859} {"train_loss": -44.58100509643555, "global_step": 346048, "epoch": 2859} {"train_loss": -44.70954513549805, "global_step": 346049, "epoch": 2859} {"train_loss": -45.133941650390625, "global_step": 346050, "epoch": 2859} {"train_loss": -45.00155258178711, "global_step": 346051, "epoch": 2859} {"train_loss": -44.67623519897461, "global_step": 346052, "epoch": 2859} {"train_loss": -45.42580795288086, "global_step": 346053, "epoch": 2859} {"train_loss": -45.56377029418945, "global_step": 346054, "epoch": 2859} {"train_loss": -45.45600128173828, "global_step": 346055, "epoch": 2859} {"train_loss": -45.610321044921875, "global_step": 346056, "epoch": 2859} {"train_loss": -45.4398078918457, "global_step": 346057, "epoch": 2859} {"train_loss": -45.52667236328125, "global_step": 346058, "epoch": 2859} {"train_loss": -43.83873080419115, "global_step": 346059, "epoch": 2859, "val_loss": 2535312.75} {"train_loss": -45.418888092041016, "global_step": 346060, "epoch": 2860} {"train_loss": -44.667991638183594, "global_step": 346061, "epoch": 2860} {"train_loss": -44.80615234375, "global_step": 346062, "epoch": 2860} {"train_loss": -45.628360748291016, "global_step": 346063, "epoch": 2860} {"train_loss": -45.97138214111328, "global_step": 346064, "epoch": 2860} {"train_loss": -45.29392623901367, "global_step": 346065, "epoch": 2860} {"train_loss": -45.801513671875, "global_step": 346066, "epoch": 2860} {"train_loss": -45.046485900878906, "global_step": 346067, "epoch": 2860} {"train_loss": -44.83089828491211, "global_step": 346068, "epoch": 2860} {"train_loss": -45.276241302490234, "global_step": 346069, "epoch": 2860} {"train_loss": -45.8747673034668, "global_step": 346070, "epoch": 2860} {"train_loss": -45.17132568359375, "global_step": 346071, "epoch": 2860} {"train_loss": -45.02473068237305, "global_step": 346072, "epoch": 2860} {"train_loss": -45.622344970703125, "global_step": 346073, "epoch": 2860} {"train_loss": -45.61867904663086, "global_step": 346074, "epoch": 2860} {"train_loss": -45.28179168701172, "global_step": 346075, "epoch": 2860} {"train_loss": -45.04110336303711, "global_step": 346076, "epoch": 2860} {"train_loss": -45.66752243041992, "global_step": 346077, "epoch": 2860} {"train_loss": -45.053653717041016, "global_step": 346078, "epoch": 2860} {"train_loss": -44.376365661621094, "global_step": 346079, "epoch": 2860} {"train_loss": -43.0997314453125, "global_step": 346080, "epoch": 2860} {"train_loss": -43.46598434448242, "global_step": 346081, "epoch": 2860} {"train_loss": -42.38959884643555, "global_step": 346082, "epoch": 2860} {"train_loss": -40.90763473510742, "global_step": 346083, "epoch": 2860} {"train_loss": -43.27226638793945, "global_step": 346084, "epoch": 2860} {"train_loss": -44.56962966918945, "global_step": 346085, "epoch": 2860} {"train_loss": -43.688594818115234, "global_step": 346086, "epoch": 2860} {"train_loss": -44.103843688964844, "global_step": 346087, "epoch": 2860} {"train_loss": -44.408077239990234, "global_step": 346088, "epoch": 2860} {"train_loss": -44.35883331298828, "global_step": 346089, "epoch": 2860} {"train_loss": -43.450660705566406, "global_step": 346090, "epoch": 2860} {"train_loss": -44.02267837524414, "global_step": 346091, "epoch": 2860} {"train_loss": -43.77643966674805, "global_step": 346092, "epoch": 2860} {"train_loss": -44.42643737792969, "global_step": 346093, "epoch": 2860} {"train_loss": -42.56363296508789, "global_step": 346094, "epoch": 2860} {"train_loss": -44.11914825439453, "global_step": 346095, "epoch": 2860} {"train_loss": -42.26539611816406, "global_step": 346096, "epoch": 2860} {"train_loss": -44.77285385131836, "global_step": 346097, "epoch": 2860} {"train_loss": -42.732295989990234, "global_step": 346098, "epoch": 2860} {"train_loss": -42.76918411254883, "global_step": 346099, "epoch": 2860} {"train_loss": -41.982704162597656, "global_step": 346100, "epoch": 2860} {"train_loss": -41.39170455932617, "global_step": 346101, "epoch": 2860} {"train_loss": -43.16895294189453, "global_step": 346102, "epoch": 2860} {"train_loss": -43.78007125854492, "global_step": 346103, "epoch": 2860} {"train_loss": -44.69209671020508, "global_step": 346104, "epoch": 2860} {"train_loss": -43.73342514038086, "global_step": 346105, "epoch": 2860} {"train_loss": -43.82141876220703, "global_step": 346106, "epoch": 2860} {"train_loss": -44.83725357055664, "global_step": 346107, "epoch": 2860} {"train_loss": -44.02109909057617, "global_step": 346108, "epoch": 2860} {"train_loss": -44.91924285888672, "global_step": 346109, "epoch": 2860} {"train_loss": -44.56093978881836, "global_step": 346110, "epoch": 2860} {"train_loss": -44.58413314819336, "global_step": 346111, "epoch": 2860} {"train_loss": -44.12456512451172, "global_step": 346112, "epoch": 2860} {"train_loss": -44.05231475830078, "global_step": 346113, "epoch": 2860} {"train_loss": -44.527259826660156, "global_step": 346114, "epoch": 2860} {"train_loss": -44.20521926879883, "global_step": 346115, "epoch": 2860} {"train_loss": -44.77968215942383, "global_step": 346116, "epoch": 2860} {"train_loss": -43.217403411865234, "global_step": 346117, "epoch": 2860} {"train_loss": -44.60634994506836, "global_step": 346118, "epoch": 2860} {"train_loss": -44.280540466308594, "global_step": 346119, "epoch": 2860} {"train_loss": -43.2878303527832, "global_step": 346120, "epoch": 2860} {"train_loss": -44.04128646850586, "global_step": 346121, "epoch": 2860} {"train_loss": -44.57719039916992, "global_step": 346122, "epoch": 2860} {"train_loss": -42.7745246887207, "global_step": 346123, "epoch": 2860} {"train_loss": -44.341796875, "global_step": 346124, "epoch": 2860} {"train_loss": -45.21611404418945, "global_step": 346125, "epoch": 2860} {"train_loss": -43.701045989990234, "global_step": 346126, "epoch": 2860} {"train_loss": -43.70882034301758, "global_step": 346127, "epoch": 2860} {"train_loss": -44.822147369384766, "global_step": 346128, "epoch": 2860} {"train_loss": -44.1430549621582, "global_step": 346129, "epoch": 2860} {"train_loss": -44.3762321472168, "global_step": 346130, "epoch": 2860} {"train_loss": -44.64068603515625, "global_step": 346131, "epoch": 2860} {"train_loss": -44.83091354370117, "global_step": 346132, "epoch": 2860} {"train_loss": -45.307952880859375, "global_step": 346133, "epoch": 2860} {"train_loss": -45.20844650268555, "global_step": 346134, "epoch": 2860} {"train_loss": -45.02181625366211, "global_step": 346135, "epoch": 2860} {"train_loss": -44.683204650878906, "global_step": 346136, "epoch": 2860} {"train_loss": -43.20444869995117, "global_step": 346137, "epoch": 2860} {"train_loss": -44.16933822631836, "global_step": 346138, "epoch": 2860} {"train_loss": -45.74821853637695, "global_step": 346139, "epoch": 2860} {"train_loss": -43.870880126953125, "global_step": 346140, "epoch": 2860} {"train_loss": -43.663814544677734, "global_step": 346141, "epoch": 2860} {"train_loss": -45.134708404541016, "global_step": 346142, "epoch": 2860} {"train_loss": -44.08614730834961, "global_step": 346143, "epoch": 2860} {"train_loss": -44.327064514160156, "global_step": 346144, "epoch": 2860} {"train_loss": -45.17340087890625, "global_step": 346145, "epoch": 2860} {"train_loss": -45.08785629272461, "global_step": 346146, "epoch": 2860} {"train_loss": -45.154781341552734, "global_step": 346147, "epoch": 2860} {"train_loss": -45.25160217285156, "global_step": 346148, "epoch": 2860} {"train_loss": -45.0123405456543, "global_step": 346149, "epoch": 2860} {"train_loss": -44.95249557495117, "global_step": 346150, "epoch": 2860} {"train_loss": -45.28400421142578, "global_step": 346151, "epoch": 2860} {"train_loss": -45.13600540161133, "global_step": 346152, "epoch": 2860} {"train_loss": -45.12115478515625, "global_step": 346153, "epoch": 2860} {"train_loss": -45.06707763671875, "global_step": 346154, "epoch": 2860} {"train_loss": -45.174312591552734, "global_step": 346155, "epoch": 2860} {"train_loss": -44.753170013427734, "global_step": 346156, "epoch": 2860} {"train_loss": -45.543495178222656, "global_step": 346157, "epoch": 2860} {"train_loss": -45.281410217285156, "global_step": 346158, "epoch": 2860} {"train_loss": -45.493751525878906, "global_step": 346159, "epoch": 2860} {"train_loss": -45.07465362548828, "global_step": 346160, "epoch": 2860} {"train_loss": -45.63970947265625, "global_step": 346161, "epoch": 2860} {"train_loss": -45.278072357177734, "global_step": 346162, "epoch": 2860} {"train_loss": -45.27425003051758, "global_step": 346163, "epoch": 2860} {"train_loss": -45.81362533569336, "global_step": 346164, "epoch": 2860} {"train_loss": -45.144927978515625, "global_step": 346165, "epoch": 2860} {"train_loss": -44.9697380065918, "global_step": 346166, "epoch": 2860} {"train_loss": -45.585567474365234, "global_step": 346167, "epoch": 2860} {"train_loss": -45.509559631347656, "global_step": 346168, "epoch": 2860} {"train_loss": -45.685577392578125, "global_step": 346169, "epoch": 2860} {"train_loss": -45.01038360595703, "global_step": 346170, "epoch": 2860} {"train_loss": -45.13644027709961, "global_step": 346171, "epoch": 2860} {"train_loss": -45.95930099487305, "global_step": 346172, "epoch": 2860} {"train_loss": -44.53620147705078, "global_step": 346173, "epoch": 2860} {"train_loss": -44.56913375854492, "global_step": 346174, "epoch": 2860} {"train_loss": -44.99701690673828, "global_step": 346175, "epoch": 2860} {"train_loss": -44.300811767578125, "global_step": 346176, "epoch": 2860} {"train_loss": -45.26908493041992, "global_step": 346177, "epoch": 2860} {"train_loss": -46.00094223022461, "global_step": 346178, "epoch": 2860} {"train_loss": -45.28209686279297, "global_step": 346179, "epoch": 2860} {"train_loss": -44.54207702510613, "global_step": 346180, "epoch": 2860, "val_loss": 2524031.5} {"train_loss": -44.914913177490234, "global_step": 346181, "epoch": 2861} {"train_loss": -44.56689453125, "global_step": 346182, "epoch": 2861} {"train_loss": -43.862152099609375, "global_step": 346183, "epoch": 2861} {"train_loss": -43.852027893066406, "global_step": 346184, "epoch": 2861} {"train_loss": -43.61687088012695, "global_step": 346185, "epoch": 2861} {"train_loss": -44.862457275390625, "global_step": 346186, "epoch": 2861} {"train_loss": -44.88203048706055, "global_step": 346187, "epoch": 2861} {"train_loss": -44.65642166137695, "global_step": 346188, "epoch": 2861} {"train_loss": -43.725990295410156, "global_step": 346189, "epoch": 2861} {"train_loss": -45.245880126953125, "global_step": 346190, "epoch": 2861} {"train_loss": -44.819427490234375, "global_step": 346191, "epoch": 2861} {"train_loss": -45.30422592163086, "global_step": 346192, "epoch": 2861} {"train_loss": -44.71320343017578, "global_step": 346193, "epoch": 2861} {"train_loss": -44.52400588989258, "global_step": 346194, "epoch": 2861} {"train_loss": -44.93451690673828, "global_step": 346195, "epoch": 2861} {"train_loss": -44.775665283203125, "global_step": 346196, "epoch": 2861} {"train_loss": -44.82843017578125, "global_step": 346197, "epoch": 2861} {"train_loss": -44.85030746459961, "global_step": 346198, "epoch": 2861} {"train_loss": -45.15243148803711, "global_step": 346199, "epoch": 2861} {"train_loss": -45.10551071166992, "global_step": 346200, "epoch": 2861} {"train_loss": -45.3476676940918, "global_step": 346201, "epoch": 2861} {"train_loss": -45.483184814453125, "global_step": 346202, "epoch": 2861} {"train_loss": -45.32497787475586, "global_step": 346203, "epoch": 2861} {"train_loss": -44.588619232177734, "global_step": 346204, "epoch": 2861} {"train_loss": -45.200191497802734, "global_step": 346205, "epoch": 2861} {"train_loss": -44.95132064819336, "global_step": 346206, "epoch": 2861} {"train_loss": -45.23149871826172, "global_step": 346207, "epoch": 2861} {"train_loss": -45.197444915771484, "global_step": 346208, "epoch": 2861} {"train_loss": -44.1195182800293, "global_step": 346209, "epoch": 2861} {"train_loss": -43.509490966796875, "global_step": 346210, "epoch": 2861} {"train_loss": -45.341407775878906, "global_step": 346211, "epoch": 2861} {"train_loss": -43.1722526550293, "global_step": 346212, "epoch": 2861} {"train_loss": -43.24149703979492, "global_step": 346213, "epoch": 2861} {"train_loss": -44.95011520385742, "global_step": 346214, "epoch": 2861} {"train_loss": -43.078582763671875, "global_step": 346215, "epoch": 2861} {"train_loss": -44.18752670288086, "global_step": 346216, "epoch": 2861} {"train_loss": -44.76619338989258, "global_step": 346217, "epoch": 2861} {"train_loss": -44.47956466674805, "global_step": 346218, "epoch": 2861} {"train_loss": -44.483680725097656, "global_step": 346219, "epoch": 2861} {"train_loss": -44.79072570800781, "global_step": 346220, "epoch": 2861} {"train_loss": -44.91898727416992, "global_step": 346221, "epoch": 2861} {"train_loss": -44.391963958740234, "global_step": 346222, "epoch": 2861} {"train_loss": -43.28578567504883, "global_step": 346223, "epoch": 2861} {"train_loss": -42.43912887573242, "global_step": 346224, "epoch": 2861} {"train_loss": -44.30564880371094, "global_step": 346225, "epoch": 2861} {"train_loss": -41.97564697265625, "global_step": 346226, "epoch": 2861} {"train_loss": -43.02144241333008, "global_step": 346227, "epoch": 2861} {"train_loss": -42.93160629272461, "global_step": 346228, "epoch": 2861} {"train_loss": -40.90897750854492, "global_step": 346229, "epoch": 2861} {"train_loss": -41.22041320800781, "global_step": 346230, "epoch": 2861} {"train_loss": -43.074092864990234, "global_step": 346231, "epoch": 2861} {"train_loss": -39.10178756713867, "global_step": 346232, "epoch": 2861} {"train_loss": -43.446868896484375, "global_step": 346233, "epoch": 2861} {"train_loss": -37.35890579223633, "global_step": 346234, "epoch": 2861} {"train_loss": -37.9991340637207, "global_step": 346235, "epoch": 2861} {"train_loss": -36.34143829345703, "global_step": 346236, "epoch": 2861} {"train_loss": -41.0797119140625, "global_step": 346237, "epoch": 2861} {"train_loss": -42.36033248901367, "global_step": 346238, "epoch": 2861} {"train_loss": -40.65141296386719, "global_step": 346239, "epoch": 2861} {"train_loss": -41.88169479370117, "global_step": 346240, "epoch": 2861} {"train_loss": -40.734222412109375, "global_step": 346241, "epoch": 2861} {"train_loss": -43.91606521606445, "global_step": 346242, "epoch": 2861} {"train_loss": -42.448482513427734, "global_step": 346243, "epoch": 2861} {"train_loss": -43.0136833190918, "global_step": 346244, "epoch": 2861} {"train_loss": -41.03512191772461, "global_step": 346245, "epoch": 2861} {"train_loss": -42.02930450439453, "global_step": 346246, "epoch": 2861} {"train_loss": -42.011226654052734, "global_step": 346247, "epoch": 2861} {"train_loss": -41.694026947021484, "global_step": 346248, "epoch": 2861} {"train_loss": -42.967864990234375, "global_step": 346249, "epoch": 2861} {"train_loss": -42.24956130981445, "global_step": 346250, "epoch": 2861} {"train_loss": -42.9342041015625, "global_step": 346251, "epoch": 2861} {"train_loss": -42.901466369628906, "global_step": 346252, "epoch": 2861} {"train_loss": -42.63134002685547, "global_step": 346253, "epoch": 2861} {"train_loss": -43.03321075439453, "global_step": 346254, "epoch": 2861} {"train_loss": -43.41282272338867, "global_step": 346255, "epoch": 2861} {"train_loss": -43.18483352661133, "global_step": 346256, "epoch": 2861} {"train_loss": -43.247840881347656, "global_step": 346257, "epoch": 2861} {"train_loss": -43.520172119140625, "global_step": 346258, "epoch": 2861} {"train_loss": -43.030452728271484, "global_step": 346259, "epoch": 2861} {"train_loss": -42.598628997802734, "global_step": 346260, "epoch": 2861} {"train_loss": -43.40805435180664, "global_step": 346261, "epoch": 2861} {"train_loss": -42.90827941894531, "global_step": 346262, "epoch": 2861} {"train_loss": -43.87226486206055, "global_step": 346263, "epoch": 2861} {"train_loss": -43.9074592590332, "global_step": 346264, "epoch": 2861} {"train_loss": -43.69891357421875, "global_step": 346265, "epoch": 2861} {"train_loss": -43.316627502441406, "global_step": 346266, "epoch": 2861} {"train_loss": -44.11781692504883, "global_step": 346267, "epoch": 2861} {"train_loss": -44.02328872680664, "global_step": 346268, "epoch": 2861} {"train_loss": -43.59048843383789, "global_step": 346269, "epoch": 2861} {"train_loss": -43.95335006713867, "global_step": 346270, "epoch": 2861} {"train_loss": -44.194000244140625, "global_step": 346271, "epoch": 2861} {"train_loss": -44.40716552734375, "global_step": 346272, "epoch": 2861} {"train_loss": -44.15290451049805, "global_step": 346273, "epoch": 2861} {"train_loss": -43.834930419921875, "global_step": 346274, "epoch": 2861} {"train_loss": -43.884033203125, "global_step": 346275, "epoch": 2861} {"train_loss": -43.9226188659668, "global_step": 346276, "epoch": 2861} {"train_loss": -44.37089920043945, "global_step": 346277, "epoch": 2861} {"train_loss": -44.43238067626953, "global_step": 346278, "epoch": 2861} {"train_loss": -44.24220657348633, "global_step": 346279, "epoch": 2861} {"train_loss": -44.81728744506836, "global_step": 346280, "epoch": 2861} {"train_loss": -44.431739807128906, "global_step": 346281, "epoch": 2861} {"train_loss": -44.65249252319336, "global_step": 346282, "epoch": 2861} {"train_loss": -44.1161994934082, "global_step": 346283, "epoch": 2861} {"train_loss": -44.531429290771484, "global_step": 346284, "epoch": 2861} {"train_loss": -43.778987884521484, "global_step": 346285, "epoch": 2861} {"train_loss": -44.760047912597656, "global_step": 346286, "epoch": 2861} {"train_loss": -44.31338119506836, "global_step": 346287, "epoch": 2861} {"train_loss": -44.826786041259766, "global_step": 346288, "epoch": 2861} {"train_loss": -44.21302032470703, "global_step": 346289, "epoch": 2861} {"train_loss": -44.099327087402344, "global_step": 346290, "epoch": 2861} {"train_loss": -44.83302688598633, "global_step": 346291, "epoch": 2861} {"train_loss": -44.80011749267578, "global_step": 346292, "epoch": 2861} {"train_loss": -44.80876541137695, "global_step": 346293, "epoch": 2861} {"train_loss": -45.116817474365234, "global_step": 346294, "epoch": 2861} {"train_loss": -44.30552291870117, "global_step": 346295, "epoch": 2861} {"train_loss": -44.95735168457031, "global_step": 346296, "epoch": 2861} {"train_loss": -45.12124252319336, "global_step": 346297, "epoch": 2861} {"train_loss": -44.93387222290039, "global_step": 346298, "epoch": 2861} {"train_loss": -45.6041145324707, "global_step": 346299, "epoch": 2861} {"train_loss": -44.362060546875, "global_step": 346300, "epoch": 2861} {"train_loss": -43.689335878230324, "global_step": 346301, "epoch": 2861, "val_loss": 2505277.25} {"train_loss": -44.801570892333984, "global_step": 346302, "epoch": 2862} {"train_loss": -45.40281295776367, "global_step": 346303, "epoch": 2862} {"train_loss": -44.64579772949219, "global_step": 346304, "epoch": 2862} {"train_loss": -45.18558883666992, "global_step": 346305, "epoch": 2862} {"train_loss": -45.161712646484375, "global_step": 346306, "epoch": 2862} {"train_loss": -44.77606964111328, "global_step": 346307, "epoch": 2862} {"train_loss": -45.399356842041016, "global_step": 346308, "epoch": 2862} {"train_loss": -45.123958587646484, "global_step": 346309, "epoch": 2862} {"train_loss": -45.95539474487305, "global_step": 346310, "epoch": 2862} {"train_loss": -45.50164794921875, "global_step": 346311, "epoch": 2862} {"train_loss": -45.26426315307617, "global_step": 346312, "epoch": 2862} {"train_loss": -45.5026741027832, "global_step": 346313, "epoch": 2862} {"train_loss": -45.21537399291992, "global_step": 346314, "epoch": 2862} {"train_loss": -45.96027755737305, "global_step": 346315, "epoch": 2862} {"train_loss": -45.466163635253906, "global_step": 346316, "epoch": 2862} {"train_loss": -45.48966598510742, "global_step": 346317, "epoch": 2862} {"train_loss": -45.62083053588867, "global_step": 346318, "epoch": 2862} {"train_loss": -45.508731842041016, "global_step": 346319, "epoch": 2862} {"train_loss": -44.92354202270508, "global_step": 346320, "epoch": 2862} {"train_loss": -45.94801712036133, "global_step": 346321, "epoch": 2862} {"train_loss": -45.58734893798828, "global_step": 346322, "epoch": 2862} {"train_loss": -45.632564544677734, "global_step": 346323, "epoch": 2862} {"train_loss": -45.26829147338867, "global_step": 346324, "epoch": 2862} {"train_loss": -45.38001251220703, "global_step": 346325, "epoch": 2862} {"train_loss": -45.38672637939453, "global_step": 346326, "epoch": 2862} {"train_loss": -45.72404098510742, "global_step": 346327, "epoch": 2862} {"train_loss": -45.719947814941406, "global_step": 346328, "epoch": 2862} {"train_loss": -46.12691879272461, "global_step": 346329, "epoch": 2862} {"train_loss": -45.65909957885742, "global_step": 346330, "epoch": 2862} {"train_loss": -44.829708099365234, "global_step": 346331, "epoch": 2862} {"train_loss": -44.610137939453125, "global_step": 346332, "epoch": 2862} {"train_loss": -45.27186584472656, "global_step": 346333, "epoch": 2862} {"train_loss": -45.5714225769043, "global_step": 346334, "epoch": 2862} {"train_loss": -44.26730728149414, "global_step": 346335, "epoch": 2862} {"train_loss": -45.13337326049805, "global_step": 346336, "epoch": 2862} {"train_loss": -45.881160736083984, "global_step": 346337, "epoch": 2862} {"train_loss": -44.74843978881836, "global_step": 346338, "epoch": 2862} {"train_loss": -43.66590118408203, "global_step": 346339, "epoch": 2862} {"train_loss": -44.942501068115234, "global_step": 346340, "epoch": 2862} {"train_loss": -45.55890655517578, "global_step": 346341, "epoch": 2862} {"train_loss": -44.77892303466797, "global_step": 346342, "epoch": 2862} {"train_loss": -42.75374984741211, "global_step": 346343, "epoch": 2862} {"train_loss": -45.005226135253906, "global_step": 346344, "epoch": 2862} {"train_loss": -45.12146759033203, "global_step": 346345, "epoch": 2862} {"train_loss": -44.86910629272461, "global_step": 346346, "epoch": 2862} {"train_loss": -44.2086067199707, "global_step": 346347, "epoch": 2862} {"train_loss": -45.2947998046875, "global_step": 346348, "epoch": 2862} {"train_loss": -45.422969818115234, "global_step": 346349, "epoch": 2862} {"train_loss": -44.43778991699219, "global_step": 346350, "epoch": 2862} {"train_loss": -45.10414505004883, "global_step": 346351, "epoch": 2862} {"train_loss": -43.7927360534668, "global_step": 346352, "epoch": 2862} {"train_loss": -43.95707702636719, "global_step": 346353, "epoch": 2862} {"train_loss": -45.029541015625, "global_step": 346354, "epoch": 2862} {"train_loss": -44.85268783569336, "global_step": 346355, "epoch": 2862} {"train_loss": -44.05136489868164, "global_step": 346356, "epoch": 2862} {"train_loss": -45.1593017578125, "global_step": 346357, "epoch": 2862} {"train_loss": -44.295711517333984, "global_step": 346358, "epoch": 2862} {"train_loss": -44.17202377319336, "global_step": 346359, "epoch": 2862} {"train_loss": -44.994789123535156, "global_step": 346360, "epoch": 2862} {"train_loss": -43.02256393432617, "global_step": 346361, "epoch": 2862} {"train_loss": -45.13174057006836, "global_step": 346362, "epoch": 2862} {"train_loss": -44.97700881958008, "global_step": 346363, "epoch": 2862} {"train_loss": -44.475154876708984, "global_step": 346364, "epoch": 2862} {"train_loss": -44.99930953979492, "global_step": 346365, "epoch": 2862} {"train_loss": -44.8254280090332, "global_step": 346366, "epoch": 2862} {"train_loss": -45.04404067993164, "global_step": 346367, "epoch": 2862} {"train_loss": -44.4835319519043, "global_step": 346368, "epoch": 2862} {"train_loss": -43.55238723754883, "global_step": 346369, "epoch": 2862} {"train_loss": -44.5338249206543, "global_step": 346370, "epoch": 2862} {"train_loss": -44.430294036865234, "global_step": 346371, "epoch": 2862} {"train_loss": -44.389583587646484, "global_step": 346372, "epoch": 2862} {"train_loss": -45.04677200317383, "global_step": 346373, "epoch": 2862} {"train_loss": -44.014461517333984, "global_step": 346374, "epoch": 2862} {"train_loss": -44.18476486206055, "global_step": 346375, "epoch": 2862} {"train_loss": -45.31097412109375, "global_step": 346376, "epoch": 2862} {"train_loss": -43.9265251159668, "global_step": 346377, "epoch": 2862} {"train_loss": -44.809471130371094, "global_step": 346378, "epoch": 2862} {"train_loss": -44.767799377441406, "global_step": 346379, "epoch": 2862} {"train_loss": -45.09788131713867, "global_step": 346380, "epoch": 2862} {"train_loss": -44.58262252807617, "global_step": 346381, "epoch": 2862} {"train_loss": -44.17079162597656, "global_step": 346382, "epoch": 2862} {"train_loss": -44.78095626831055, "global_step": 346383, "epoch": 2862} {"train_loss": -45.17557907104492, "global_step": 346384, "epoch": 2862} {"train_loss": -45.36738204956055, "global_step": 346385, "epoch": 2862} {"train_loss": -45.243316650390625, "global_step": 346386, "epoch": 2862} {"train_loss": -44.843849182128906, "global_step": 346387, "epoch": 2862} {"train_loss": -44.85175704956055, "global_step": 346388, "epoch": 2862} {"train_loss": -44.44035720825195, "global_step": 346389, "epoch": 2862} {"train_loss": -45.1129264831543, "global_step": 346390, "epoch": 2862} {"train_loss": -45.3253059387207, "global_step": 346391, "epoch": 2862} {"train_loss": -45.10061264038086, "global_step": 346392, "epoch": 2862} {"train_loss": -43.10445785522461, "global_step": 346393, "epoch": 2862} {"train_loss": -43.47837448120117, "global_step": 346394, "epoch": 2862} {"train_loss": -44.49459457397461, "global_step": 346395, "epoch": 2862} {"train_loss": -45.912742614746094, "global_step": 346396, "epoch": 2862} {"train_loss": -44.0610466003418, "global_step": 346397, "epoch": 2862} {"train_loss": -40.39305877685547, "global_step": 346398, "epoch": 2862} {"train_loss": -45.50822067260742, "global_step": 346399, "epoch": 2862} {"train_loss": -42.716007232666016, "global_step": 346400, "epoch": 2862} {"train_loss": -41.719722747802734, "global_step": 346401, "epoch": 2862} {"train_loss": -44.87553405761719, "global_step": 346402, "epoch": 2862} {"train_loss": -42.47335433959961, "global_step": 346403, "epoch": 2862} {"train_loss": -42.40572738647461, "global_step": 346404, "epoch": 2862} {"train_loss": -44.3430290222168, "global_step": 346405, "epoch": 2862} {"train_loss": -39.028419494628906, "global_step": 346406, "epoch": 2862} {"train_loss": -43.15191650390625, "global_step": 346407, "epoch": 2862} {"train_loss": -30.306747436523438, "global_step": 346408, "epoch": 2862} {"train_loss": -43.24531173706055, "global_step": 346409, "epoch": 2862} {"train_loss": -35.455692291259766, "global_step": 346410, "epoch": 2862} {"train_loss": -41.89628219604492, "global_step": 346411, "epoch": 2862} {"train_loss": -40.933162689208984, "global_step": 346412, "epoch": 2862} {"train_loss": -39.87824249267578, "global_step": 346413, "epoch": 2862} {"train_loss": -43.31056213378906, "global_step": 346414, "epoch": 2862} {"train_loss": -42.54665756225586, "global_step": 346415, "epoch": 2862} {"train_loss": -42.21127700805664, "global_step": 346416, "epoch": 2862} {"train_loss": -42.8274040222168, "global_step": 346417, "epoch": 2862} {"train_loss": -41.96381378173828, "global_step": 346418, "epoch": 2862} {"train_loss": -44.12138748168945, "global_step": 346419, "epoch": 2862} {"train_loss": -42.303131103515625, "global_step": 346420, "epoch": 2862} {"train_loss": -44.65769577026367, "global_step": 346421, "epoch": 2862} {"train_loss": -44.269721764178314, "global_step": 346422, "epoch": 2862, "val_loss": 2550897.25} {"train_loss": -43.86329650878906, "global_step": 346423, "epoch": 2863} {"train_loss": -43.791351318359375, "global_step": 346424, "epoch": 2863} {"train_loss": -43.97072982788086, "global_step": 346425, "epoch": 2863} {"train_loss": -42.92816162109375, "global_step": 346426, "epoch": 2863} {"train_loss": -44.571502685546875, "global_step": 346427, "epoch": 2863} {"train_loss": -42.98240280151367, "global_step": 346428, "epoch": 2863} {"train_loss": -43.933292388916016, "global_step": 346429, "epoch": 2863} {"train_loss": -44.315792083740234, "global_step": 346430, "epoch": 2863} {"train_loss": -44.21914291381836, "global_step": 346431, "epoch": 2863} {"train_loss": -44.683135986328125, "global_step": 346432, "epoch": 2863} {"train_loss": -44.80363464355469, "global_step": 346433, "epoch": 2863} {"train_loss": -44.619136810302734, "global_step": 346434, "epoch": 2863} {"train_loss": -44.77065658569336, "global_step": 346435, "epoch": 2863} {"train_loss": -44.69001007080078, "global_step": 346436, "epoch": 2863} {"train_loss": -44.492000579833984, "global_step": 346437, "epoch": 2863} {"train_loss": -44.380714416503906, "global_step": 346438, "epoch": 2863} {"train_loss": -45.17464065551758, "global_step": 346439, "epoch": 2863} {"train_loss": -44.78738021850586, "global_step": 346440, "epoch": 2863} {"train_loss": -45.0335693359375, "global_step": 346441, "epoch": 2863} {"train_loss": -45.29914474487305, "global_step": 346442, "epoch": 2863} {"train_loss": -45.10713577270508, "global_step": 346443, "epoch": 2863} {"train_loss": -45.48785400390625, "global_step": 346444, "epoch": 2863} {"train_loss": -44.81007766723633, "global_step": 346445, "epoch": 2863} {"train_loss": -45.578155517578125, "global_step": 346446, "epoch": 2863} {"train_loss": -45.29094314575195, "global_step": 346447, "epoch": 2863} {"train_loss": -45.628726959228516, "global_step": 346448, "epoch": 2863} {"train_loss": -44.9412841796875, "global_step": 346449, "epoch": 2863} {"train_loss": -45.1860466003418, "global_step": 346450, "epoch": 2863} {"train_loss": -45.571197509765625, "global_step": 346451, "epoch": 2863} {"train_loss": -45.2658576965332, "global_step": 346452, "epoch": 2863} {"train_loss": -45.01287841796875, "global_step": 346453, "epoch": 2863} {"train_loss": -45.439754486083984, "global_step": 346454, "epoch": 2863} {"train_loss": -45.521610260009766, "global_step": 346455, "epoch": 2863} {"train_loss": -44.99467849731445, "global_step": 346456, "epoch": 2863} {"train_loss": -44.701416015625, "global_step": 346457, "epoch": 2863} {"train_loss": -44.602535247802734, "global_step": 346458, "epoch": 2863} {"train_loss": -45.735931396484375, "global_step": 346459, "epoch": 2863} {"train_loss": -44.31916046142578, "global_step": 346460, "epoch": 2863} {"train_loss": -45.24418258666992, "global_step": 346461, "epoch": 2863} {"train_loss": -45.66129684448242, "global_step": 346462, "epoch": 2863} {"train_loss": -44.53833770751953, "global_step": 346463, "epoch": 2863} {"train_loss": -45.62670135498047, "global_step": 346464, "epoch": 2863} {"train_loss": -45.40529251098633, "global_step": 346465, "epoch": 2863} {"train_loss": -45.39570999145508, "global_step": 346466, "epoch": 2863} {"train_loss": -45.050750732421875, "global_step": 346467, "epoch": 2863} {"train_loss": -44.90037536621094, "global_step": 346468, "epoch": 2863} {"train_loss": -46.1188850402832, "global_step": 346469, "epoch": 2863} {"train_loss": -44.3896369934082, "global_step": 346470, "epoch": 2863} {"train_loss": -44.046730041503906, "global_step": 346471, "epoch": 2863} {"train_loss": -44.55002975463867, "global_step": 346472, "epoch": 2863} {"train_loss": -44.94365692138672, "global_step": 346473, "epoch": 2863} {"train_loss": -45.52705383300781, "global_step": 346474, "epoch": 2863} {"train_loss": -44.98800277709961, "global_step": 346475, "epoch": 2863} {"train_loss": -44.88016891479492, "global_step": 346476, "epoch": 2863} {"train_loss": -45.25368118286133, "global_step": 346477, "epoch": 2863} {"train_loss": -44.987857818603516, "global_step": 346478, "epoch": 2863} {"train_loss": -45.084075927734375, "global_step": 346479, "epoch": 2863} {"train_loss": -45.010684967041016, "global_step": 346480, "epoch": 2863} {"train_loss": -44.82069778442383, "global_step": 346481, "epoch": 2863} {"train_loss": -45.25874710083008, "global_step": 346482, "epoch": 2863} {"train_loss": -44.91677474975586, "global_step": 346483, "epoch": 2863} {"train_loss": -44.76150131225586, "global_step": 346484, "epoch": 2863} {"train_loss": -45.021270751953125, "global_step": 346485, "epoch": 2863} {"train_loss": -45.0186882019043, "global_step": 346486, "epoch": 2863} {"train_loss": -45.45612716674805, "global_step": 346487, "epoch": 2863} {"train_loss": -44.851539611816406, "global_step": 346488, "epoch": 2863} {"train_loss": -44.19169998168945, "global_step": 346489, "epoch": 2863} {"train_loss": -42.78013229370117, "global_step": 346490, "epoch": 2863} {"train_loss": -44.80624008178711, "global_step": 346491, "epoch": 2863} {"train_loss": -45.038726806640625, "global_step": 346492, "epoch": 2863} {"train_loss": -43.87531661987305, "global_step": 346493, "epoch": 2863} {"train_loss": -44.26267623901367, "global_step": 346494, "epoch": 2863} {"train_loss": -42.47599411010742, "global_step": 346495, "epoch": 2863} {"train_loss": -43.80453109741211, "global_step": 346496, "epoch": 2863} {"train_loss": -41.6812858581543, "global_step": 346497, "epoch": 2863} {"train_loss": -41.96071243286133, "global_step": 346498, "epoch": 2863} {"train_loss": -45.30463409423828, "global_step": 346499, "epoch": 2863} {"train_loss": -43.633827209472656, "global_step": 346500, "epoch": 2863} {"train_loss": -43.3850212097168, "global_step": 346501, "epoch": 2863} {"train_loss": -44.151153564453125, "global_step": 346502, "epoch": 2863} {"train_loss": -43.16558074951172, "global_step": 346503, "epoch": 2863} {"train_loss": -44.39813995361328, "global_step": 346504, "epoch": 2863} {"train_loss": -44.67354202270508, "global_step": 346505, "epoch": 2863} {"train_loss": -45.308387756347656, "global_step": 346506, "epoch": 2863} {"train_loss": -44.711360931396484, "global_step": 346507, "epoch": 2863} {"train_loss": -44.86941146850586, "global_step": 346508, "epoch": 2863} {"train_loss": -45.32896423339844, "global_step": 346509, "epoch": 2863} {"train_loss": -44.80439376831055, "global_step": 346510, "epoch": 2863} {"train_loss": -42.91815948486328, "global_step": 346511, "epoch": 2863} {"train_loss": -43.01272201538086, "global_step": 346512, "epoch": 2863} {"train_loss": -42.68932342529297, "global_step": 346513, "epoch": 2863} {"train_loss": -44.36452865600586, "global_step": 346514, "epoch": 2863} {"train_loss": -43.673038482666016, "global_step": 346515, "epoch": 2863} {"train_loss": -44.911861419677734, "global_step": 346516, "epoch": 2863} {"train_loss": -43.41547775268555, "global_step": 346517, "epoch": 2863} {"train_loss": -42.404762268066406, "global_step": 346518, "epoch": 2863} {"train_loss": -42.55992126464844, "global_step": 346519, "epoch": 2863} {"train_loss": -44.674346923828125, "global_step": 346520, "epoch": 2863} {"train_loss": -44.23814010620117, "global_step": 346521, "epoch": 2863} {"train_loss": -44.648475646972656, "global_step": 346522, "epoch": 2863} {"train_loss": -44.16030502319336, "global_step": 346523, "epoch": 2863} {"train_loss": -44.27029037475586, "global_step": 346524, "epoch": 2863} {"train_loss": -44.817134857177734, "global_step": 346525, "epoch": 2863} {"train_loss": -44.01450729370117, "global_step": 346526, "epoch": 2863} {"train_loss": -44.134151458740234, "global_step": 346527, "epoch": 2863} {"train_loss": -45.0904541015625, "global_step": 346528, "epoch": 2863} {"train_loss": -44.16713333129883, "global_step": 346529, "epoch": 2863} {"train_loss": -45.077510833740234, "global_step": 346530, "epoch": 2863} {"train_loss": -45.28092575073242, "global_step": 346531, "epoch": 2863} {"train_loss": -44.10808181762695, "global_step": 346532, "epoch": 2863} {"train_loss": -44.72886276245117, "global_step": 346533, "epoch": 2863} {"train_loss": -44.864227294921875, "global_step": 346534, "epoch": 2863} {"train_loss": -44.254600524902344, "global_step": 346535, "epoch": 2863} {"train_loss": -45.17033004760742, "global_step": 346536, "epoch": 2863} {"train_loss": -43.622901916503906, "global_step": 346537, "epoch": 2863} {"train_loss": -44.94277572631836, "global_step": 346538, "epoch": 2863} {"train_loss": -44.81898880004883, "global_step": 346539, "epoch": 2863} {"train_loss": -44.79058837890625, "global_step": 346540, "epoch": 2863} {"train_loss": -45.03470230102539, "global_step": 346541, "epoch": 2863} {"train_loss": -44.21902084350586, "global_step": 346542, "epoch": 2863} {"train_loss": -44.553721530378354, "global_step": 346543, "epoch": 2863, "val_loss": 2527631.5} {"train_loss": -44.93120574951172, "global_step": 346544, "epoch": 2864} {"train_loss": -45.087921142578125, "global_step": 346545, "epoch": 2864} {"train_loss": -44.693153381347656, "global_step": 346546, "epoch": 2864} {"train_loss": -45.631080627441406, "global_step": 346547, "epoch": 2864} {"train_loss": -44.66746520996094, "global_step": 346548, "epoch": 2864} {"train_loss": -45.1307487487793, "global_step": 346549, "epoch": 2864} {"train_loss": -44.84367752075195, "global_step": 346550, "epoch": 2864} {"train_loss": -45.314815521240234, "global_step": 346551, "epoch": 2864} {"train_loss": -43.89536666870117, "global_step": 346552, "epoch": 2864} {"train_loss": -43.92455291748047, "global_step": 346553, "epoch": 2864} {"train_loss": -44.77457809448242, "global_step": 346554, "epoch": 2864} {"train_loss": -44.813209533691406, "global_step": 346555, "epoch": 2864} {"train_loss": -44.62826156616211, "global_step": 346556, "epoch": 2864} {"train_loss": -44.50481033325195, "global_step": 346557, "epoch": 2864} {"train_loss": -45.153419494628906, "global_step": 346558, "epoch": 2864} {"train_loss": -45.38581848144531, "global_step": 346559, "epoch": 2864} {"train_loss": -45.44684600830078, "global_step": 346560, "epoch": 2864} {"train_loss": -45.4093132019043, "global_step": 346561, "epoch": 2864} {"train_loss": -45.224605560302734, "global_step": 346562, "epoch": 2864} {"train_loss": -44.99740219116211, "global_step": 346563, "epoch": 2864} {"train_loss": -45.46132278442383, "global_step": 346564, "epoch": 2864} {"train_loss": -45.433082580566406, "global_step": 346565, "epoch": 2864} {"train_loss": -45.751190185546875, "global_step": 346566, "epoch": 2864} {"train_loss": -45.198055267333984, "global_step": 346567, "epoch": 2864} {"train_loss": -45.56684875488281, "global_step": 346568, "epoch": 2864} {"train_loss": -45.79155731201172, "global_step": 346569, "epoch": 2864} {"train_loss": -45.34952926635742, "global_step": 346570, "epoch": 2864} {"train_loss": -45.68046188354492, "global_step": 346571, "epoch": 2864} {"train_loss": -45.5623664855957, "global_step": 346572, "epoch": 2864} {"train_loss": -45.495635986328125, "global_step": 346573, "epoch": 2864} {"train_loss": -45.3504753112793, "global_step": 346574, "epoch": 2864} {"train_loss": -45.60415267944336, "global_step": 346575, "epoch": 2864} {"train_loss": -45.86458969116211, "global_step": 346576, "epoch": 2864} {"train_loss": -46.02458953857422, "global_step": 346577, "epoch": 2864} {"train_loss": -45.69306564331055, "global_step": 346578, "epoch": 2864} {"train_loss": -45.640594482421875, "global_step": 346579, "epoch": 2864} {"train_loss": -46.27792739868164, "global_step": 346580, "epoch": 2864} {"train_loss": -44.96091079711914, "global_step": 346581, "epoch": 2864} {"train_loss": -45.47898864746094, "global_step": 346582, "epoch": 2864} {"train_loss": -45.2507438659668, "global_step": 346583, "epoch": 2864} {"train_loss": -45.18959045410156, "global_step": 346584, "epoch": 2864} {"train_loss": -46.13435363769531, "global_step": 346585, "epoch": 2864} {"train_loss": -45.97066116333008, "global_step": 346586, "epoch": 2864} {"train_loss": -45.854400634765625, "global_step": 346587, "epoch": 2864} {"train_loss": -45.90591049194336, "global_step": 346588, "epoch": 2864} {"train_loss": -45.5733528137207, "global_step": 346589, "epoch": 2864} {"train_loss": -45.7078742980957, "global_step": 346590, "epoch": 2864} {"train_loss": -45.3909912109375, "global_step": 346591, "epoch": 2864} {"train_loss": -45.77242660522461, "global_step": 346592, "epoch": 2864} {"train_loss": -45.84445571899414, "global_step": 346593, "epoch": 2864} {"train_loss": -46.14076232910156, "global_step": 346594, "epoch": 2864} {"train_loss": -45.45225524902344, "global_step": 346595, "epoch": 2864} {"train_loss": -45.47483444213867, "global_step": 346596, "epoch": 2864} {"train_loss": -44.52946090698242, "global_step": 346597, "epoch": 2864} {"train_loss": -44.73910903930664, "global_step": 346598, "epoch": 2864} {"train_loss": -45.22694778442383, "global_step": 346599, "epoch": 2864} {"train_loss": -45.862586975097656, "global_step": 346600, "epoch": 2864} {"train_loss": -45.667640686035156, "global_step": 346601, "epoch": 2864} {"train_loss": -44.737632751464844, "global_step": 346602, "epoch": 2864} {"train_loss": -44.78642654418945, "global_step": 346603, "epoch": 2864} {"train_loss": -44.21998977661133, "global_step": 346604, "epoch": 2864} {"train_loss": -43.5978889465332, "global_step": 346605, "epoch": 2864} {"train_loss": -44.72740936279297, "global_step": 346606, "epoch": 2864} {"train_loss": -44.12652587890625, "global_step": 346607, "epoch": 2864} {"train_loss": -42.52290344238281, "global_step": 346608, "epoch": 2864} {"train_loss": -38.05031967163086, "global_step": 346609, "epoch": 2864} {"train_loss": -44.74463653564453, "global_step": 346610, "epoch": 2864} {"train_loss": -34.67992401123047, "global_step": 346611, "epoch": 2864} {"train_loss": -42.31980514526367, "global_step": 346612, "epoch": 2864} {"train_loss": -40.30801010131836, "global_step": 346613, "epoch": 2864} {"train_loss": -38.66103744506836, "global_step": 346614, "epoch": 2864} {"train_loss": -41.29203414916992, "global_step": 346615, "epoch": 2864} {"train_loss": -39.953800201416016, "global_step": 346616, "epoch": 2864} {"train_loss": -40.61029815673828, "global_step": 346617, "epoch": 2864} {"train_loss": -40.74396514892578, "global_step": 346618, "epoch": 2864} {"train_loss": -39.46333694458008, "global_step": 346619, "epoch": 2864} {"train_loss": -39.02783966064453, "global_step": 346620, "epoch": 2864} {"train_loss": -39.97871017456055, "global_step": 346621, "epoch": 2864} {"train_loss": -41.19118118286133, "global_step": 346622, "epoch": 2864} {"train_loss": -38.93682861328125, "global_step": 346623, "epoch": 2864} {"train_loss": -37.756690979003906, "global_step": 346624, "epoch": 2864} {"train_loss": -40.67898178100586, "global_step": 346625, "epoch": 2864} {"train_loss": -37.478248596191406, "global_step": 346626, "epoch": 2864} {"train_loss": -40.14112091064453, "global_step": 346627, "epoch": 2864} {"train_loss": -39.69107437133789, "global_step": 346628, "epoch": 2864} {"train_loss": -39.3040885925293, "global_step": 346629, "epoch": 2864} {"train_loss": -41.714508056640625, "global_step": 346630, "epoch": 2864} {"train_loss": -39.712581634521484, "global_step": 346631, "epoch": 2864} {"train_loss": -42.0946044921875, "global_step": 346632, "epoch": 2864} {"train_loss": -40.484622955322266, "global_step": 346633, "epoch": 2864} {"train_loss": -43.22407150268555, "global_step": 346634, "epoch": 2864} {"train_loss": -39.22385025024414, "global_step": 346635, "epoch": 2864} {"train_loss": -42.36762619018555, "global_step": 346636, "epoch": 2864} {"train_loss": -37.82992172241211, "global_step": 346637, "epoch": 2864} {"train_loss": -42.60121536254883, "global_step": 346638, "epoch": 2864} {"train_loss": -39.59086227416992, "global_step": 346639, "epoch": 2864} {"train_loss": -39.658355712890625, "global_step": 346640, "epoch": 2864} {"train_loss": -42.53483581542969, "global_step": 346641, "epoch": 2864} {"train_loss": -40.73702621459961, "global_step": 346642, "epoch": 2864} {"train_loss": -42.46450424194336, "global_step": 346643, "epoch": 2864} {"train_loss": -42.639705657958984, "global_step": 346644, "epoch": 2864} {"train_loss": -43.06612777709961, "global_step": 346645, "epoch": 2864} {"train_loss": -41.34011459350586, "global_step": 346646, "epoch": 2864} {"train_loss": -43.18416213989258, "global_step": 346647, "epoch": 2864} {"train_loss": -41.37477111816406, "global_step": 346648, "epoch": 2864} {"train_loss": -43.18868637084961, "global_step": 346649, "epoch": 2864} {"train_loss": -42.45072937011719, "global_step": 346650, "epoch": 2864} {"train_loss": -42.73276138305664, "global_step": 346651, "epoch": 2864} {"train_loss": -43.07941818237305, "global_step": 346652, "epoch": 2864} {"train_loss": -44.23712158203125, "global_step": 346653, "epoch": 2864} {"train_loss": -42.7231559753418, "global_step": 346654, "epoch": 2864} {"train_loss": -44.476070404052734, "global_step": 346655, "epoch": 2864} {"train_loss": -43.223785400390625, "global_step": 346656, "epoch": 2864} {"train_loss": -44.45895004272461, "global_step": 346657, "epoch": 2864} {"train_loss": -43.617374420166016, "global_step": 346658, "epoch": 2864} {"train_loss": -43.900753021240234, "global_step": 346659, "epoch": 2864} {"train_loss": -43.49195861816406, "global_step": 346660, "epoch": 2864} {"train_loss": -44.637054443359375, "global_step": 346661, "epoch": 2864} {"train_loss": -43.888824462890625, "global_step": 346662, "epoch": 2864} {"train_loss": -44.6038703918457, "global_step": 346663, "epoch": 2864} {"train_loss": -43.458634999172745, "global_step": 346664, "epoch": 2864, "val_loss": 2544431.75} {"train_loss": -44.55971908569336, "global_step": 346665, "epoch": 2865} {"train_loss": -44.01781463623047, "global_step": 346666, "epoch": 2865} {"train_loss": -44.56515121459961, "global_step": 346667, "epoch": 2865} {"train_loss": -44.292449951171875, "global_step": 346668, "epoch": 2865} {"train_loss": -44.62099075317383, "global_step": 346669, "epoch": 2865} {"train_loss": -44.699649810791016, "global_step": 346670, "epoch": 2865} {"train_loss": -45.3432731628418, "global_step": 346671, "epoch": 2865} {"train_loss": -44.8880500793457, "global_step": 346672, "epoch": 2865} {"train_loss": -44.96627426147461, "global_step": 346673, "epoch": 2865} {"train_loss": -44.682533264160156, "global_step": 346674, "epoch": 2865} {"train_loss": -45.051631927490234, "global_step": 346675, "epoch": 2865} {"train_loss": -44.81086349487305, "global_step": 346676, "epoch": 2865} {"train_loss": -45.195350646972656, "global_step": 346677, "epoch": 2865} {"train_loss": -44.8304557800293, "global_step": 346678, "epoch": 2865} {"train_loss": -45.47209548950195, "global_step": 346679, "epoch": 2865} {"train_loss": -44.97553634643555, "global_step": 346680, "epoch": 2865} {"train_loss": -45.03996658325195, "global_step": 346681, "epoch": 2865} {"train_loss": -45.27885818481445, "global_step": 346682, "epoch": 2865} {"train_loss": -45.815547943115234, "global_step": 346683, "epoch": 2865} {"train_loss": -45.283973693847656, "global_step": 346684, "epoch": 2865} {"train_loss": -45.687713623046875, "global_step": 346685, "epoch": 2865} {"train_loss": -45.58143997192383, "global_step": 346686, "epoch": 2865} {"train_loss": -45.32309341430664, "global_step": 346687, "epoch": 2865} {"train_loss": -45.477447509765625, "global_step": 346688, "epoch": 2865} {"train_loss": -45.57233810424805, "global_step": 346689, "epoch": 2865} {"train_loss": -45.75930404663086, "global_step": 346690, "epoch": 2865} {"train_loss": -45.81075668334961, "global_step": 346691, "epoch": 2865} {"train_loss": -45.66154098510742, "global_step": 346692, "epoch": 2865} {"train_loss": -45.3775634765625, "global_step": 346693, "epoch": 2865} {"train_loss": -45.943511962890625, "global_step": 346694, "epoch": 2865} {"train_loss": -45.75528335571289, "global_step": 346695, "epoch": 2865} {"train_loss": -45.42593002319336, "global_step": 346696, "epoch": 2865} {"train_loss": -45.687103271484375, "global_step": 346697, "epoch": 2865} {"train_loss": -45.91279220581055, "global_step": 346698, "epoch": 2865} {"train_loss": -45.673370361328125, "global_step": 346699, "epoch": 2865} {"train_loss": -45.654293060302734, "global_step": 346700, "epoch": 2865} {"train_loss": -45.56569290161133, "global_step": 346701, "epoch": 2865} {"train_loss": -45.71737289428711, "global_step": 346702, "epoch": 2865} {"train_loss": -45.6971435546875, "global_step": 346703, "epoch": 2865} {"train_loss": -46.1259651184082, "global_step": 346704, "epoch": 2865} {"train_loss": -45.954463958740234, "global_step": 346705, "epoch": 2865} {"train_loss": -45.7192497253418, "global_step": 346706, "epoch": 2865} {"train_loss": -46.32365798950195, "global_step": 346707, "epoch": 2865} {"train_loss": -46.05751419067383, "global_step": 346708, "epoch": 2865} {"train_loss": -45.8648796081543, "global_step": 346709, "epoch": 2865} {"train_loss": -46.16990280151367, "global_step": 346710, "epoch": 2865} {"train_loss": -45.7888069152832, "global_step": 346711, "epoch": 2865} {"train_loss": -46.650794982910156, "global_step": 346712, "epoch": 2865} {"train_loss": -46.77376174926758, "global_step": 346713, "epoch": 2865} {"train_loss": -46.270233154296875, "global_step": 346714, "epoch": 2865} {"train_loss": -46.37038040161133, "global_step": 346715, "epoch": 2865} {"train_loss": -46.20771789550781, "global_step": 346716, "epoch": 2865} {"train_loss": -46.51198196411133, "global_step": 346717, "epoch": 2865} {"train_loss": -46.107826232910156, "global_step": 346718, "epoch": 2865} {"train_loss": -46.35081100463867, "global_step": 346719, "epoch": 2865} {"train_loss": -46.28752899169922, "global_step": 346720, "epoch": 2865} {"train_loss": -46.53390121459961, "global_step": 346721, "epoch": 2865} {"train_loss": -46.17955017089844, "global_step": 346722, "epoch": 2865} {"train_loss": -46.56034469604492, "global_step": 346723, "epoch": 2865} {"train_loss": -46.0814094543457, "global_step": 346724, "epoch": 2865} {"train_loss": -46.692344665527344, "global_step": 346725, "epoch": 2865} {"train_loss": -46.209991455078125, "global_step": 346726, "epoch": 2865} {"train_loss": -46.57208251953125, "global_step": 346727, "epoch": 2865} {"train_loss": -45.730953216552734, "global_step": 346728, "epoch": 2865} {"train_loss": -44.43466567993164, "global_step": 346729, "epoch": 2865} {"train_loss": -44.28078842163086, "global_step": 346730, "epoch": 2865} {"train_loss": -44.6759147644043, "global_step": 346731, "epoch": 2865} {"train_loss": -45.551658630371094, "global_step": 346732, "epoch": 2865} {"train_loss": -45.64194869995117, "global_step": 346733, "epoch": 2865} {"train_loss": -43.76170349121094, "global_step": 346734, "epoch": 2865} {"train_loss": -42.91289520263672, "global_step": 346735, "epoch": 2865} {"train_loss": -43.356197357177734, "global_step": 346736, "epoch": 2865} {"train_loss": -43.75497817993164, "global_step": 346737, "epoch": 2865} {"train_loss": -43.712646484375, "global_step": 346738, "epoch": 2865} {"train_loss": -42.82230758666992, "global_step": 346739, "epoch": 2865} {"train_loss": -42.54117965698242, "global_step": 346740, "epoch": 2865} {"train_loss": -43.5548210144043, "global_step": 346741, "epoch": 2865} {"train_loss": -44.267921447753906, "global_step": 346742, "epoch": 2865} {"train_loss": -44.638179779052734, "global_step": 346743, "epoch": 2865} {"train_loss": -45.37163543701172, "global_step": 346744, "epoch": 2865} {"train_loss": -45.74154281616211, "global_step": 346745, "epoch": 2865} {"train_loss": -44.321529388427734, "global_step": 346746, "epoch": 2865} {"train_loss": -43.90724563598633, "global_step": 346747, "epoch": 2865} {"train_loss": -40.57759475708008, "global_step": 346748, "epoch": 2865} {"train_loss": -43.193294525146484, "global_step": 346749, "epoch": 2865} {"train_loss": -41.464664459228516, "global_step": 346750, "epoch": 2865} {"train_loss": -42.598995208740234, "global_step": 346751, "epoch": 2865} {"train_loss": -43.65006637573242, "global_step": 346752, "epoch": 2865} {"train_loss": -41.740447998046875, "global_step": 346753, "epoch": 2865} {"train_loss": -44.2467155456543, "global_step": 346754, "epoch": 2865} {"train_loss": -40.778099060058594, "global_step": 346755, "epoch": 2865} {"train_loss": -42.16822052001953, "global_step": 346756, "epoch": 2865} {"train_loss": -43.71488571166992, "global_step": 346757, "epoch": 2865} {"train_loss": -42.16915512084961, "global_step": 346758, "epoch": 2865} {"train_loss": -42.72378158569336, "global_step": 346759, "epoch": 2865} {"train_loss": -43.057899475097656, "global_step": 346760, "epoch": 2865} {"train_loss": -41.640987396240234, "global_step": 346761, "epoch": 2865} {"train_loss": -43.2888298034668, "global_step": 346762, "epoch": 2865} {"train_loss": -42.95254135131836, "global_step": 346763, "epoch": 2865} {"train_loss": -43.851356506347656, "global_step": 346764, "epoch": 2865} {"train_loss": -43.896270751953125, "global_step": 346765, "epoch": 2865} {"train_loss": -43.42438507080078, "global_step": 346766, "epoch": 2865} {"train_loss": -43.97044372558594, "global_step": 346767, "epoch": 2865} {"train_loss": -43.92729949951172, "global_step": 346768, "epoch": 2865} {"train_loss": -43.5115852355957, "global_step": 346769, "epoch": 2865} {"train_loss": -44.09477615356445, "global_step": 346770, "epoch": 2865} {"train_loss": -42.911373138427734, "global_step": 346771, "epoch": 2865} {"train_loss": -43.86702346801758, "global_step": 346772, "epoch": 2865} {"train_loss": -43.0010986328125, "global_step": 346773, "epoch": 2865} {"train_loss": -43.849727630615234, "global_step": 346774, "epoch": 2865} {"train_loss": -44.21664047241211, "global_step": 346775, "epoch": 2865} {"train_loss": -44.013851165771484, "global_step": 346776, "epoch": 2865} {"train_loss": -43.698795318603516, "global_step": 346777, "epoch": 2865} {"train_loss": -44.474708557128906, "global_step": 346778, "epoch": 2865} {"train_loss": -44.00057601928711, "global_step": 346779, "epoch": 2865} {"train_loss": -43.72145080566406, "global_step": 346780, "epoch": 2865} {"train_loss": -44.606502532958984, "global_step": 346781, "epoch": 2865} {"train_loss": -44.345516204833984, "global_step": 346782, "epoch": 2865} {"train_loss": -44.11275100708008, "global_step": 346783, "epoch": 2865} {"train_loss": -44.012001037597656, "global_step": 346784, "epoch": 2865} {"train_loss": -44.68556632680341, "global_step": 346785, "epoch": 2865, "val_loss": 2561746.75} {"train_loss": -44.326690673828125, "global_step": 346786, "epoch": 2866} {"train_loss": -44.8199348449707, "global_step": 346787, "epoch": 2866} {"train_loss": -44.679378509521484, "global_step": 346788, "epoch": 2866} {"train_loss": -44.71714401245117, "global_step": 346789, "epoch": 2866} {"train_loss": -44.94142150878906, "global_step": 346790, "epoch": 2866} {"train_loss": -43.72023391723633, "global_step": 346791, "epoch": 2866} {"train_loss": -45.555458068847656, "global_step": 346792, "epoch": 2866} {"train_loss": -44.02898025512695, "global_step": 346793, "epoch": 2866} {"train_loss": -44.29969024658203, "global_step": 346794, "epoch": 2866} {"train_loss": -44.93062210083008, "global_step": 346795, "epoch": 2866} {"train_loss": -44.23134994506836, "global_step": 346796, "epoch": 2866} {"train_loss": -44.81399917602539, "global_step": 346797, "epoch": 2866} {"train_loss": -44.2857551574707, "global_step": 346798, "epoch": 2866} {"train_loss": -45.305419921875, "global_step": 346799, "epoch": 2866} {"train_loss": -45.05550003051758, "global_step": 346800, "epoch": 2866} {"train_loss": -44.949588775634766, "global_step": 346801, "epoch": 2866} {"train_loss": -45.40452194213867, "global_step": 346802, "epoch": 2866} {"train_loss": -44.97270965576172, "global_step": 346803, "epoch": 2866} {"train_loss": -45.17287826538086, "global_step": 346804, "epoch": 2866} {"train_loss": -44.9835090637207, "global_step": 346805, "epoch": 2866} {"train_loss": -44.29897689819336, "global_step": 346806, "epoch": 2866} {"train_loss": -45.46923828125, "global_step": 346807, "epoch": 2866} {"train_loss": -44.66709518432617, "global_step": 346808, "epoch": 2866} {"train_loss": -45.44857406616211, "global_step": 346809, "epoch": 2866} {"train_loss": -45.44660568237305, "global_step": 346810, "epoch": 2866} {"train_loss": -45.49457550048828, "global_step": 346811, "epoch": 2866} {"train_loss": -45.731441497802734, "global_step": 346812, "epoch": 2866} {"train_loss": -45.746238708496094, "global_step": 346813, "epoch": 2866} {"train_loss": -45.79094314575195, "global_step": 346814, "epoch": 2866} {"train_loss": -45.193050384521484, "global_step": 346815, "epoch": 2866} {"train_loss": -45.37673568725586, "global_step": 346816, "epoch": 2866} {"train_loss": -45.18986892700195, "global_step": 346817, "epoch": 2866} {"train_loss": -45.27326202392578, "global_step": 346818, "epoch": 2866} {"train_loss": -45.906864166259766, "global_step": 346819, "epoch": 2866} {"train_loss": -45.73521041870117, "global_step": 346820, "epoch": 2866} {"train_loss": -45.05729293823242, "global_step": 346821, "epoch": 2866} {"train_loss": -45.86792755126953, "global_step": 346822, "epoch": 2866} {"train_loss": -44.02779006958008, "global_step": 346823, "epoch": 2866} {"train_loss": -45.3989143371582, "global_step": 346824, "epoch": 2866} {"train_loss": -43.939334869384766, "global_step": 346825, "epoch": 2866} {"train_loss": -45.32988357543945, "global_step": 346826, "epoch": 2866} {"train_loss": -45.50608825683594, "global_step": 346827, "epoch": 2866} {"train_loss": -44.124881744384766, "global_step": 346828, "epoch": 2866} {"train_loss": -45.028411865234375, "global_step": 346829, "epoch": 2866} {"train_loss": -45.00459671020508, "global_step": 346830, "epoch": 2866} {"train_loss": -44.91852569580078, "global_step": 346831, "epoch": 2866} {"train_loss": -44.957454681396484, "global_step": 346832, "epoch": 2866} {"train_loss": -44.39044189453125, "global_step": 346833, "epoch": 2866} {"train_loss": -44.801002502441406, "global_step": 346834, "epoch": 2866} {"train_loss": -44.78104782104492, "global_step": 346835, "epoch": 2866} {"train_loss": -44.88103485107422, "global_step": 346836, "epoch": 2866} {"train_loss": -45.19802474975586, "global_step": 346837, "epoch": 2866} {"train_loss": -44.678184509277344, "global_step": 346838, "epoch": 2866} {"train_loss": -44.72517395019531, "global_step": 346839, "epoch": 2866} {"train_loss": -45.4967155456543, "global_step": 346840, "epoch": 2866} {"train_loss": -45.401912689208984, "global_step": 346841, "epoch": 2866} {"train_loss": -44.94170379638672, "global_step": 346842, "epoch": 2866} {"train_loss": -45.51774978637695, "global_step": 346843, "epoch": 2866} {"train_loss": -45.66176986694336, "global_step": 346844, "epoch": 2866} {"train_loss": -44.1041145324707, "global_step": 346845, "epoch": 2866} {"train_loss": -43.39509963989258, "global_step": 346846, "epoch": 2866} {"train_loss": -44.825775146484375, "global_step": 346847, "epoch": 2866} {"train_loss": -45.139495849609375, "global_step": 346848, "epoch": 2866} {"train_loss": -43.42387771606445, "global_step": 346849, "epoch": 2866} {"train_loss": -43.31201171875, "global_step": 346850, "epoch": 2866} {"train_loss": -45.7436637878418, "global_step": 346851, "epoch": 2866} {"train_loss": -44.6143684387207, "global_step": 346852, "epoch": 2866} {"train_loss": -44.80580520629883, "global_step": 346853, "epoch": 2866} {"train_loss": -45.222206115722656, "global_step": 346854, "epoch": 2866} {"train_loss": -44.49479293823242, "global_step": 346855, "epoch": 2866} {"train_loss": -44.07401657104492, "global_step": 346856, "epoch": 2866} {"train_loss": -45.84771728515625, "global_step": 346857, "epoch": 2866} {"train_loss": -44.93830871582031, "global_step": 346858, "epoch": 2866} {"train_loss": -44.824424743652344, "global_step": 346859, "epoch": 2866} {"train_loss": -45.25519943237305, "global_step": 346860, "epoch": 2866} {"train_loss": -45.34877395629883, "global_step": 346861, "epoch": 2866} {"train_loss": -45.320186614990234, "global_step": 346862, "epoch": 2866} {"train_loss": -45.428462982177734, "global_step": 346863, "epoch": 2866} {"train_loss": -45.209686279296875, "global_step": 346864, "epoch": 2866} {"train_loss": -45.05085754394531, "global_step": 346865, "epoch": 2866} {"train_loss": -45.381263732910156, "global_step": 346866, "epoch": 2866} {"train_loss": -45.73004150390625, "global_step": 346867, "epoch": 2866} {"train_loss": -45.76188659667969, "global_step": 346868, "epoch": 2866} {"train_loss": -45.86549758911133, "global_step": 346869, "epoch": 2866} {"train_loss": -45.5894889831543, "global_step": 346870, "epoch": 2866} {"train_loss": -45.25814437866211, "global_step": 346871, "epoch": 2866} {"train_loss": -45.49723434448242, "global_step": 346872, "epoch": 2866} {"train_loss": -45.68488693237305, "global_step": 346873, "epoch": 2866} {"train_loss": -45.558589935302734, "global_step": 346874, "epoch": 2866} {"train_loss": -45.56637954711914, "global_step": 346875, "epoch": 2866} {"train_loss": -45.06245040893555, "global_step": 346876, "epoch": 2866} {"train_loss": -45.783504486083984, "global_step": 346877, "epoch": 2866} {"train_loss": -46.05009841918945, "global_step": 346878, "epoch": 2866} {"train_loss": -46.055938720703125, "global_step": 346879, "epoch": 2866} {"train_loss": -45.571773529052734, "global_step": 346880, "epoch": 2866} {"train_loss": -46.25927734375, "global_step": 346881, "epoch": 2866} {"train_loss": -45.32353591918945, "global_step": 346882, "epoch": 2866} {"train_loss": -45.66132354736328, "global_step": 346883, "epoch": 2866} {"train_loss": -45.57511901855469, "global_step": 346884, "epoch": 2866} {"train_loss": -45.88154983520508, "global_step": 346885, "epoch": 2866} {"train_loss": -45.250118255615234, "global_step": 346886, "epoch": 2866} {"train_loss": -45.52753829956055, "global_step": 346887, "epoch": 2866} {"train_loss": -45.860652923583984, "global_step": 346888, "epoch": 2866} {"train_loss": -45.908878326416016, "global_step": 346889, "epoch": 2866} {"train_loss": -45.774574279785156, "global_step": 346890, "epoch": 2866} {"train_loss": -45.95683670043945, "global_step": 346891, "epoch": 2866} {"train_loss": -46.13149642944336, "global_step": 346892, "epoch": 2866} {"train_loss": -45.835819244384766, "global_step": 346893, "epoch": 2866} {"train_loss": -45.89150619506836, "global_step": 346894, "epoch": 2866} {"train_loss": -45.808074951171875, "global_step": 346895, "epoch": 2866} {"train_loss": -45.53396224975586, "global_step": 346896, "epoch": 2866} {"train_loss": -44.82180404663086, "global_step": 346897, "epoch": 2866} {"train_loss": -44.69498825073242, "global_step": 346898, "epoch": 2866} {"train_loss": -45.290557861328125, "global_step": 346899, "epoch": 2866} {"train_loss": -45.43508529663086, "global_step": 346900, "epoch": 2866} {"train_loss": -45.717803955078125, "global_step": 346901, "epoch": 2866} {"train_loss": -46.12055969238281, "global_step": 346902, "epoch": 2866} {"train_loss": -44.85478591918945, "global_step": 346903, "epoch": 2866} {"train_loss": -44.92253494262695, "global_step": 346904, "epoch": 2866} {"train_loss": -45.26267623901367, "global_step": 346905, "epoch": 2866} {"train_loss": -45.15974300163837, "global_step": 346906, "epoch": 2866, "val_loss": 2567067.25} {"train_loss": -45.25563049316406, "global_step": 346907, "epoch": 2867} {"train_loss": -43.5185661315918, "global_step": 346908, "epoch": 2867} {"train_loss": -44.10239028930664, "global_step": 346909, "epoch": 2867} {"train_loss": -45.33625411987305, "global_step": 346910, "epoch": 2867} {"train_loss": -44.93031311035156, "global_step": 346911, "epoch": 2867} {"train_loss": -45.21891784667969, "global_step": 346912, "epoch": 2867} {"train_loss": -45.63349151611328, "global_step": 346913, "epoch": 2867} {"train_loss": -44.57666015625, "global_step": 346914, "epoch": 2867} {"train_loss": -39.8607177734375, "global_step": 346915, "epoch": 2867} {"train_loss": -44.00614929199219, "global_step": 346916, "epoch": 2867} {"train_loss": -43.62217330932617, "global_step": 346917, "epoch": 2867} {"train_loss": -45.05900955200195, "global_step": 346918, "epoch": 2867} {"train_loss": -44.39303970336914, "global_step": 346919, "epoch": 2867} {"train_loss": -43.4969482421875, "global_step": 346920, "epoch": 2867} {"train_loss": -43.81745529174805, "global_step": 346921, "epoch": 2867} {"train_loss": -45.16386413574219, "global_step": 346922, "epoch": 2867} {"train_loss": -43.173892974853516, "global_step": 346923, "epoch": 2867} {"train_loss": -43.649715423583984, "global_step": 346924, "epoch": 2867} {"train_loss": -42.82823181152344, "global_step": 346925, "epoch": 2867} {"train_loss": -42.938480377197266, "global_step": 346926, "epoch": 2867} {"train_loss": -43.95810317993164, "global_step": 346927, "epoch": 2867} {"train_loss": -41.63964080810547, "global_step": 346928, "epoch": 2867} {"train_loss": -42.69629669189453, "global_step": 346929, "epoch": 2867} {"train_loss": -36.63690948486328, "global_step": 346930, "epoch": 2867} {"train_loss": -42.0296630859375, "global_step": 346931, "epoch": 2867} {"train_loss": -41.479652404785156, "global_step": 346932, "epoch": 2867} {"train_loss": -35.68256378173828, "global_step": 346933, "epoch": 2867} {"train_loss": -42.800628662109375, "global_step": 346934, "epoch": 2867} {"train_loss": -27.38563346862793, "global_step": 346935, "epoch": 2867} {"train_loss": -37.159584045410156, "global_step": 346936, "epoch": 2867} {"train_loss": -34.941558837890625, "global_step": 346937, "epoch": 2867} {"train_loss": -39.92502212524414, "global_step": 346938, "epoch": 2867} {"train_loss": -36.71503829956055, "global_step": 346939, "epoch": 2867} {"train_loss": -36.78459930419922, "global_step": 346940, "epoch": 2867} {"train_loss": -37.495941162109375, "global_step": 346941, "epoch": 2867} {"train_loss": -38.48666763305664, "global_step": 346942, "epoch": 2867} {"train_loss": -36.45376968383789, "global_step": 346943, "epoch": 2867} {"train_loss": -37.055755615234375, "global_step": 346944, "epoch": 2867} {"train_loss": -34.09408187866211, "global_step": 346945, "epoch": 2867} {"train_loss": -37.160133361816406, "global_step": 346946, "epoch": 2867} {"train_loss": -39.16361618041992, "global_step": 346947, "epoch": 2867} {"train_loss": -37.71565628051758, "global_step": 346948, "epoch": 2867} {"train_loss": -38.29130554199219, "global_step": 346949, "epoch": 2867} {"train_loss": -40.707984924316406, "global_step": 346950, "epoch": 2867} {"train_loss": -38.57284164428711, "global_step": 346951, "epoch": 2867} {"train_loss": -40.00725173950195, "global_step": 346952, "epoch": 2867} {"train_loss": -40.11281204223633, "global_step": 346953, "epoch": 2867} {"train_loss": -40.121238708496094, "global_step": 346954, "epoch": 2867} {"train_loss": -40.77879333496094, "global_step": 346955, "epoch": 2867} {"train_loss": -40.81581497192383, "global_step": 346956, "epoch": 2867} {"train_loss": -39.192779541015625, "global_step": 346957, "epoch": 2867} {"train_loss": -41.57745361328125, "global_step": 346958, "epoch": 2867} {"train_loss": -40.98285675048828, "global_step": 346959, "epoch": 2867} {"train_loss": -41.551612854003906, "global_step": 346960, "epoch": 2867} {"train_loss": -41.35179138183594, "global_step": 346961, "epoch": 2867} {"train_loss": -43.17731857299805, "global_step": 346962, "epoch": 2867} {"train_loss": -42.06660842895508, "global_step": 346963, "epoch": 2867} {"train_loss": -42.392147064208984, "global_step": 346964, "epoch": 2867} {"train_loss": -42.55695724487305, "global_step": 346965, "epoch": 2867} {"train_loss": -42.06227493286133, "global_step": 346966, "epoch": 2867} {"train_loss": -42.946319580078125, "global_step": 346967, "epoch": 2867} {"train_loss": -41.55369186401367, "global_step": 346968, "epoch": 2867} {"train_loss": -42.5979118347168, "global_step": 346969, "epoch": 2867} {"train_loss": -42.81047439575195, "global_step": 346970, "epoch": 2867} {"train_loss": -42.82978439331055, "global_step": 346971, "epoch": 2867} {"train_loss": -43.249298095703125, "global_step": 346972, "epoch": 2867} {"train_loss": -42.1278190612793, "global_step": 346973, "epoch": 2867} {"train_loss": -43.67896270751953, "global_step": 346974, "epoch": 2867} {"train_loss": -43.88010787963867, "global_step": 346975, "epoch": 2867} {"train_loss": -42.55526351928711, "global_step": 346976, "epoch": 2867} {"train_loss": -42.8823356628418, "global_step": 346977, "epoch": 2867} {"train_loss": -42.73405075073242, "global_step": 346978, "epoch": 2867} {"train_loss": -43.30756759643555, "global_step": 346979, "epoch": 2867} {"train_loss": -42.85464096069336, "global_step": 346980, "epoch": 2867} {"train_loss": -44.03257369995117, "global_step": 346981, "epoch": 2867} {"train_loss": -43.656803131103516, "global_step": 346982, "epoch": 2867} {"train_loss": -43.09388732910156, "global_step": 346983, "epoch": 2867} {"train_loss": -43.151241302490234, "global_step": 346984, "epoch": 2867} {"train_loss": -43.690120697021484, "global_step": 346985, "epoch": 2867} {"train_loss": -43.92905044555664, "global_step": 346986, "epoch": 2867} {"train_loss": -43.554073333740234, "global_step": 346987, "epoch": 2867} {"train_loss": -43.93195343017578, "global_step": 346988, "epoch": 2867} {"train_loss": -43.3790283203125, "global_step": 346989, "epoch": 2867} {"train_loss": -43.43905258178711, "global_step": 346990, "epoch": 2867} {"train_loss": -44.260040283203125, "global_step": 346991, "epoch": 2867} {"train_loss": -42.994056701660156, "global_step": 346992, "epoch": 2867} {"train_loss": -44.056983947753906, "global_step": 346993, "epoch": 2867} {"train_loss": -44.03693771362305, "global_step": 346994, "epoch": 2867} {"train_loss": -44.53548812866211, "global_step": 346995, "epoch": 2867} {"train_loss": -44.007667541503906, "global_step": 346996, "epoch": 2867} {"train_loss": -44.318660736083984, "global_step": 346997, "epoch": 2867} {"train_loss": -43.93185043334961, "global_step": 346998, "epoch": 2867} {"train_loss": -44.08688735961914, "global_step": 346999, "epoch": 2867} {"train_loss": -44.55491256713867, "global_step": 347000, "epoch": 2867} {"train_loss": -44.57969284057617, "global_step": 347001, "epoch": 2867} {"train_loss": -44.7514762878418, "global_step": 347002, "epoch": 2867} {"train_loss": -44.42823028564453, "global_step": 347003, "epoch": 2867} {"train_loss": -44.17515182495117, "global_step": 347004, "epoch": 2867} {"train_loss": -44.8298454284668, "global_step": 347005, "epoch": 2867} {"train_loss": -44.29903793334961, "global_step": 347006, "epoch": 2867} {"train_loss": -44.54899215698242, "global_step": 347007, "epoch": 2867} {"train_loss": -43.98134231567383, "global_step": 347008, "epoch": 2867} {"train_loss": -44.077030181884766, "global_step": 347009, "epoch": 2867} {"train_loss": -44.9649772644043, "global_step": 347010, "epoch": 2867} {"train_loss": -44.508445739746094, "global_step": 347011, "epoch": 2867} {"train_loss": -44.625179290771484, "global_step": 347012, "epoch": 2867} {"train_loss": -44.98948287963867, "global_step": 347013, "epoch": 2867} {"train_loss": -44.93891525268555, "global_step": 347014, "epoch": 2867} {"train_loss": -44.97364044189453, "global_step": 347015, "epoch": 2867} {"train_loss": -45.42298126220703, "global_step": 347016, "epoch": 2867} {"train_loss": -45.45576858520508, "global_step": 347017, "epoch": 2867} {"train_loss": -45.28977966308594, "global_step": 347018, "epoch": 2867} {"train_loss": -45.04315948486328, "global_step": 347019, "epoch": 2867} {"train_loss": -44.247108459472656, "global_step": 347020, "epoch": 2867} {"train_loss": -45.089263916015625, "global_step": 347021, "epoch": 2867} {"train_loss": -45.44314193725586, "global_step": 347022, "epoch": 2867} {"train_loss": -45.21380615234375, "global_step": 347023, "epoch": 2867} {"train_loss": -45.314205169677734, "global_step": 347024, "epoch": 2867} {"train_loss": -44.53156280517578, "global_step": 347025, "epoch": 2867} {"train_loss": -45.897518157958984, "global_step": 347026, "epoch": 2867} {"train_loss": -42.49403635135367, "global_step": 347027, "epoch": 2867, "val_loss": 2564452.0} {"train_loss": -44.70799255371094, "global_step": 347028, "epoch": 2868} {"train_loss": -45.07071304321289, "global_step": 347029, "epoch": 2868} {"train_loss": -45.13037872314453, "global_step": 347030, "epoch": 2868} {"train_loss": -44.9289665222168, "global_step": 347031, "epoch": 2868} {"train_loss": -45.37989044189453, "global_step": 347032, "epoch": 2868} {"train_loss": -44.4909553527832, "global_step": 347033, "epoch": 2868} {"train_loss": -45.8980712890625, "global_step": 347034, "epoch": 2868} {"train_loss": -45.79020690917969, "global_step": 347035, "epoch": 2868} {"train_loss": -45.56211853027344, "global_step": 347036, "epoch": 2868} {"train_loss": -45.07682418823242, "global_step": 347037, "epoch": 2868} {"train_loss": -45.29500198364258, "global_step": 347038, "epoch": 2868} {"train_loss": -45.302364349365234, "global_step": 347039, "epoch": 2868} {"train_loss": -45.252723693847656, "global_step": 347040, "epoch": 2868} {"train_loss": -45.90864944458008, "global_step": 347041, "epoch": 2868} {"train_loss": -44.84710693359375, "global_step": 347042, "epoch": 2868} {"train_loss": -43.185482025146484, "global_step": 347043, "epoch": 2868} {"train_loss": -40.24489212036133, "global_step": 347044, "epoch": 2868} {"train_loss": -43.000457763671875, "global_step": 347045, "epoch": 2868} {"train_loss": -43.4979133605957, "global_step": 347046, "epoch": 2868} {"train_loss": -42.109840393066406, "global_step": 347047, "epoch": 2868} {"train_loss": -42.30794906616211, "global_step": 347048, "epoch": 2868} {"train_loss": -42.19831085205078, "global_step": 347049, "epoch": 2868} {"train_loss": -44.419281005859375, "global_step": 347050, "epoch": 2868} {"train_loss": -43.412532806396484, "global_step": 347051, "epoch": 2868} {"train_loss": -40.200660705566406, "global_step": 347052, "epoch": 2868} {"train_loss": -43.76997756958008, "global_step": 347053, "epoch": 2868} {"train_loss": -42.80167770385742, "global_step": 347054, "epoch": 2868} {"train_loss": -40.50323486328125, "global_step": 347055, "epoch": 2868} {"train_loss": -44.29813766479492, "global_step": 347056, "epoch": 2868} {"train_loss": -39.18972396850586, "global_step": 347057, "epoch": 2868} {"train_loss": -43.6207389831543, "global_step": 347058, "epoch": 2868} {"train_loss": -39.763832092285156, "global_step": 347059, "epoch": 2868} {"train_loss": -42.19613265991211, "global_step": 347060, "epoch": 2868} {"train_loss": -44.11638641357422, "global_step": 347061, "epoch": 2868} {"train_loss": -41.809505462646484, "global_step": 347062, "epoch": 2868} {"train_loss": -44.40922927856445, "global_step": 347063, "epoch": 2868} {"train_loss": -43.33696365356445, "global_step": 347064, "epoch": 2868} {"train_loss": -43.88811111450195, "global_step": 347065, "epoch": 2868} {"train_loss": -42.91651153564453, "global_step": 347066, "epoch": 2868} {"train_loss": -41.22782516479492, "global_step": 347067, "epoch": 2868} {"train_loss": -43.43733596801758, "global_step": 347068, "epoch": 2868} {"train_loss": -44.037471771240234, "global_step": 347069, "epoch": 2868} {"train_loss": -41.91939163208008, "global_step": 347070, "epoch": 2868} {"train_loss": -43.8506965637207, "global_step": 347071, "epoch": 2868} {"train_loss": -44.10194778442383, "global_step": 347072, "epoch": 2868} {"train_loss": -44.191375732421875, "global_step": 347073, "epoch": 2868} {"train_loss": -44.08142852783203, "global_step": 347074, "epoch": 2868} {"train_loss": -44.062652587890625, "global_step": 347075, "epoch": 2868} {"train_loss": -44.970733642578125, "global_step": 347076, "epoch": 2868} {"train_loss": -43.5373420715332, "global_step": 347077, "epoch": 2868} {"train_loss": -44.927791595458984, "global_step": 347078, "epoch": 2868} {"train_loss": -43.85622787475586, "global_step": 347079, "epoch": 2868} {"train_loss": -43.99418258666992, "global_step": 347080, "epoch": 2868} {"train_loss": -44.336700439453125, "global_step": 347081, "epoch": 2868} {"train_loss": -44.243404388427734, "global_step": 347082, "epoch": 2868} {"train_loss": -44.82021713256836, "global_step": 347083, "epoch": 2868} {"train_loss": -44.64599609375, "global_step": 347084, "epoch": 2868} {"train_loss": -44.69818878173828, "global_step": 347085, "epoch": 2868} {"train_loss": -43.4350471496582, "global_step": 347086, "epoch": 2868} {"train_loss": -43.38064193725586, "global_step": 347087, "epoch": 2868} {"train_loss": -44.160621643066406, "global_step": 347088, "epoch": 2868} {"train_loss": -44.18870544433594, "global_step": 347089, "epoch": 2868} {"train_loss": -42.71866989135742, "global_step": 347090, "epoch": 2868} {"train_loss": -42.11294174194336, "global_step": 347091, "epoch": 2868} {"train_loss": -44.403499603271484, "global_step": 347092, "epoch": 2868} {"train_loss": -44.19044876098633, "global_step": 347093, "epoch": 2868} {"train_loss": -43.87009811401367, "global_step": 347094, "epoch": 2868} {"train_loss": -43.608272552490234, "global_step": 347095, "epoch": 2868} {"train_loss": -44.27170944213867, "global_step": 347096, "epoch": 2868} {"train_loss": -44.35504913330078, "global_step": 347097, "epoch": 2868} {"train_loss": -42.8308219909668, "global_step": 347098, "epoch": 2868} {"train_loss": -43.93357849121094, "global_step": 347099, "epoch": 2868} {"train_loss": -44.70581817626953, "global_step": 347100, "epoch": 2868} {"train_loss": -43.14567565917969, "global_step": 347101, "epoch": 2868} {"train_loss": -43.19830322265625, "global_step": 347102, "epoch": 2868} {"train_loss": -44.30502700805664, "global_step": 347103, "epoch": 2868} {"train_loss": -44.637020111083984, "global_step": 347104, "epoch": 2868} {"train_loss": -44.307281494140625, "global_step": 347105, "epoch": 2868} {"train_loss": -44.57084655761719, "global_step": 347106, "epoch": 2868} {"train_loss": -44.82485580444336, "global_step": 347107, "epoch": 2868} {"train_loss": -44.79948806762695, "global_step": 347108, "epoch": 2868} {"train_loss": -44.332916259765625, "global_step": 347109, "epoch": 2868} {"train_loss": -45.08449172973633, "global_step": 347110, "epoch": 2868} {"train_loss": -44.91045379638672, "global_step": 347111, "epoch": 2868} {"train_loss": -44.38336181640625, "global_step": 347112, "epoch": 2868} {"train_loss": -44.23982620239258, "global_step": 347113, "epoch": 2868} {"train_loss": -44.16416549682617, "global_step": 347114, "epoch": 2868} {"train_loss": -43.74665451049805, "global_step": 347115, "epoch": 2868} {"train_loss": -44.58822250366211, "global_step": 347116, "epoch": 2868} {"train_loss": -44.77080535888672, "global_step": 347117, "epoch": 2868} {"train_loss": -44.10419845581055, "global_step": 347118, "epoch": 2868} {"train_loss": -45.1478271484375, "global_step": 347119, "epoch": 2868} {"train_loss": -44.77663803100586, "global_step": 347120, "epoch": 2868} {"train_loss": -44.429931640625, "global_step": 347121, "epoch": 2868} {"train_loss": -45.266563415527344, "global_step": 347122, "epoch": 2868} {"train_loss": -43.723304748535156, "global_step": 347123, "epoch": 2868} {"train_loss": -45.07809066772461, "global_step": 347124, "epoch": 2868} {"train_loss": -44.800716400146484, "global_step": 347125, "epoch": 2868} {"train_loss": -44.96305465698242, "global_step": 347126, "epoch": 2868} {"train_loss": -45.580196380615234, "global_step": 347127, "epoch": 2868} {"train_loss": -44.126007080078125, "global_step": 347128, "epoch": 2868} {"train_loss": -45.15238571166992, "global_step": 347129, "epoch": 2868} {"train_loss": -45.2608757019043, "global_step": 347130, "epoch": 2868} {"train_loss": -45.01557159423828, "global_step": 347131, "epoch": 2868} {"train_loss": -45.34334182739258, "global_step": 347132, "epoch": 2868} {"train_loss": -45.55714797973633, "global_step": 347133, "epoch": 2868} {"train_loss": -45.10764694213867, "global_step": 347134, "epoch": 2868} {"train_loss": -44.776329040527344, "global_step": 347135, "epoch": 2868} {"train_loss": -45.27268600463867, "global_step": 347136, "epoch": 2868} {"train_loss": -45.42859649658203, "global_step": 347137, "epoch": 2868} {"train_loss": -44.783302307128906, "global_step": 347138, "epoch": 2868} {"train_loss": -44.40642166137695, "global_step": 347139, "epoch": 2868} {"train_loss": -46.064266204833984, "global_step": 347140, "epoch": 2868} {"train_loss": -44.42988967895508, "global_step": 347141, "epoch": 2868} {"train_loss": -44.293556213378906, "global_step": 347142, "epoch": 2868} {"train_loss": -44.92042541503906, "global_step": 347143, "epoch": 2868} {"train_loss": -44.96916580200195, "global_step": 347144, "epoch": 2868} {"train_loss": -43.316524505615234, "global_step": 347145, "epoch": 2868} {"train_loss": -43.64444351196289, "global_step": 347146, "epoch": 2868} {"train_loss": -44.749732971191406, "global_step": 347147, "epoch": 2868} {"train_loss": -44.0632257697996, "global_step": 347148, "epoch": 2868, "val_loss": 2493885.0} {"train_loss": -41.97993087768555, "global_step": 347149, "epoch": 2869} {"train_loss": -45.26323318481445, "global_step": 347150, "epoch": 2869} {"train_loss": -42.24298095703125, "global_step": 347151, "epoch": 2869} {"train_loss": -43.56319808959961, "global_step": 347152, "epoch": 2869} {"train_loss": -42.553585052490234, "global_step": 347153, "epoch": 2869} {"train_loss": -40.38796615600586, "global_step": 347154, "epoch": 2869} {"train_loss": -42.90575408935547, "global_step": 347155, "epoch": 2869} {"train_loss": -37.3319206237793, "global_step": 347156, "epoch": 2869} {"train_loss": -37.768165588378906, "global_step": 347157, "epoch": 2869} {"train_loss": -37.088016510009766, "global_step": 347158, "epoch": 2869} {"train_loss": -36.08759689331055, "global_step": 347159, "epoch": 2869} {"train_loss": -36.60200881958008, "global_step": 347160, "epoch": 2869} {"train_loss": -36.737518310546875, "global_step": 347161, "epoch": 2869} {"train_loss": -36.6576042175293, "global_step": 347162, "epoch": 2869} {"train_loss": -37.06137466430664, "global_step": 347163, "epoch": 2869} {"train_loss": -36.86989974975586, "global_step": 347164, "epoch": 2869} {"train_loss": -37.36799621582031, "global_step": 347165, "epoch": 2869} {"train_loss": -38.31218338012695, "global_step": 347166, "epoch": 2869} {"train_loss": -38.36765670776367, "global_step": 347167, "epoch": 2869} {"train_loss": -37.56338119506836, "global_step": 347168, "epoch": 2869} {"train_loss": -37.50650405883789, "global_step": 347169, "epoch": 2869} {"train_loss": -37.50386047363281, "global_step": 347170, "epoch": 2869} {"train_loss": -38.262596130371094, "global_step": 347171, "epoch": 2869} {"train_loss": -39.191001892089844, "global_step": 347172, "epoch": 2869} {"train_loss": -38.954097747802734, "global_step": 347173, "epoch": 2869} {"train_loss": -38.80324172973633, "global_step": 347174, "epoch": 2869} {"train_loss": -38.94028854370117, "global_step": 347175, "epoch": 2869} {"train_loss": -38.5404167175293, "global_step": 347176, "epoch": 2869} {"train_loss": -38.70901107788086, "global_step": 347177, "epoch": 2869} {"train_loss": -38.42853546142578, "global_step": 347178, "epoch": 2869} {"train_loss": -39.42963790893555, "global_step": 347179, "epoch": 2869} {"train_loss": -39.64778518676758, "global_step": 347180, "epoch": 2869} {"train_loss": -40.280517578125, "global_step": 347181, "epoch": 2869} {"train_loss": -40.92353439331055, "global_step": 347182, "epoch": 2869} {"train_loss": -40.60599899291992, "global_step": 347183, "epoch": 2869} {"train_loss": -41.17829132080078, "global_step": 347184, "epoch": 2869} {"train_loss": -39.79291915893555, "global_step": 347185, "epoch": 2869} {"train_loss": -40.5555419921875, "global_step": 347186, "epoch": 2869} {"train_loss": -41.36814498901367, "global_step": 347187, "epoch": 2869} {"train_loss": -41.651611328125, "global_step": 347188, "epoch": 2869} {"train_loss": -41.421974182128906, "global_step": 347189, "epoch": 2869} {"train_loss": -42.01240158081055, "global_step": 347190, "epoch": 2869} {"train_loss": -42.83469009399414, "global_step": 347191, "epoch": 2869} {"train_loss": -42.241737365722656, "global_step": 347192, "epoch": 2869} {"train_loss": -43.11157989501953, "global_step": 347193, "epoch": 2869} {"train_loss": -43.89558029174805, "global_step": 347194, "epoch": 2869} {"train_loss": -43.346832275390625, "global_step": 347195, "epoch": 2869} {"train_loss": -43.46244812011719, "global_step": 347196, "epoch": 2869} {"train_loss": -43.55542755126953, "global_step": 347197, "epoch": 2869} {"train_loss": -44.006893157958984, "global_step": 347198, "epoch": 2869} {"train_loss": -44.0791015625, "global_step": 347199, "epoch": 2869} {"train_loss": -44.4836540222168, "global_step": 347200, "epoch": 2869} {"train_loss": -44.25725173950195, "global_step": 347201, "epoch": 2869} {"train_loss": -44.09775924682617, "global_step": 347202, "epoch": 2869} {"train_loss": -44.4858512878418, "global_step": 347203, "epoch": 2869} {"train_loss": -44.803157806396484, "global_step": 347204, "epoch": 2869} {"train_loss": -44.026519775390625, "global_step": 347205, "epoch": 2869} {"train_loss": -44.54825973510742, "global_step": 347206, "epoch": 2869} {"train_loss": -44.003231048583984, "global_step": 347207, "epoch": 2869} {"train_loss": -44.025325775146484, "global_step": 347208, "epoch": 2869} {"train_loss": -43.640663146972656, "global_step": 347209, "epoch": 2869} {"train_loss": -43.6170768737793, "global_step": 347210, "epoch": 2869} {"train_loss": -44.6782341003418, "global_step": 347211, "epoch": 2869} {"train_loss": -43.795101165771484, "global_step": 347212, "epoch": 2869} {"train_loss": -44.34480667114258, "global_step": 347213, "epoch": 2869} {"train_loss": -44.44614791870117, "global_step": 347214, "epoch": 2869} {"train_loss": -44.36402893066406, "global_step": 347215, "epoch": 2869} {"train_loss": -42.25897979736328, "global_step": 347216, "epoch": 2869} {"train_loss": -43.97258377075195, "global_step": 347217, "epoch": 2869} {"train_loss": -44.12694549560547, "global_step": 347218, "epoch": 2869} {"train_loss": -43.20089340209961, "global_step": 347219, "epoch": 2869} {"train_loss": -44.215965270996094, "global_step": 347220, "epoch": 2869} {"train_loss": -44.2934684753418, "global_step": 347221, "epoch": 2869} {"train_loss": -42.92446517944336, "global_step": 347222, "epoch": 2869} {"train_loss": -44.45014190673828, "global_step": 347223, "epoch": 2869} {"train_loss": -43.822696685791016, "global_step": 347224, "epoch": 2869} {"train_loss": -43.22815704345703, "global_step": 347225, "epoch": 2869} {"train_loss": -44.608280181884766, "global_step": 347226, "epoch": 2869} {"train_loss": -43.14689254760742, "global_step": 347227, "epoch": 2869} {"train_loss": -43.604740142822266, "global_step": 347228, "epoch": 2869} {"train_loss": -44.618377685546875, "global_step": 347229, "epoch": 2869} {"train_loss": -44.899070739746094, "global_step": 347230, "epoch": 2869} {"train_loss": -42.89377975463867, "global_step": 347231, "epoch": 2869} {"train_loss": -43.3570556640625, "global_step": 347232, "epoch": 2869} {"train_loss": -44.6961555480957, "global_step": 347233, "epoch": 2869} {"train_loss": -44.33940124511719, "global_step": 347234, "epoch": 2869} {"train_loss": -43.94364929199219, "global_step": 347235, "epoch": 2869} {"train_loss": -43.781681060791016, "global_step": 347236, "epoch": 2869} {"train_loss": -43.10359573364258, "global_step": 347237, "epoch": 2869} {"train_loss": -44.95998764038086, "global_step": 347238, "epoch": 2869} {"train_loss": -43.03414535522461, "global_step": 347239, "epoch": 2869} {"train_loss": -44.09578323364258, "global_step": 347240, "epoch": 2869} {"train_loss": -43.95792770385742, "global_step": 347241, "epoch": 2869} {"train_loss": -44.679840087890625, "global_step": 347242, "epoch": 2869} {"train_loss": -44.461402893066406, "global_step": 347243, "epoch": 2869} {"train_loss": -43.46715545654297, "global_step": 347244, "epoch": 2869} {"train_loss": -44.302833557128906, "global_step": 347245, "epoch": 2869} {"train_loss": -44.6166877746582, "global_step": 347246, "epoch": 2869} {"train_loss": -44.94255828857422, "global_step": 347247, "epoch": 2869} {"train_loss": -43.5964469909668, "global_step": 347248, "epoch": 2869} {"train_loss": -44.73228073120117, "global_step": 347249, "epoch": 2869} {"train_loss": -43.68867111206055, "global_step": 347250, "epoch": 2869} {"train_loss": -44.156070709228516, "global_step": 347251, "epoch": 2869} {"train_loss": -42.058448791503906, "global_step": 347252, "epoch": 2869} {"train_loss": -43.12061309814453, "global_step": 347253, "epoch": 2869} {"train_loss": -43.61259841918945, "global_step": 347254, "epoch": 2869} {"train_loss": -44.48579025268555, "global_step": 347255, "epoch": 2869} {"train_loss": -44.46139144897461, "global_step": 347256, "epoch": 2869} {"train_loss": -43.985939025878906, "global_step": 347257, "epoch": 2869} {"train_loss": -44.475563049316406, "global_step": 347258, "epoch": 2869} {"train_loss": -44.59740447998047, "global_step": 347259, "epoch": 2869} {"train_loss": -43.803016662597656, "global_step": 347260, "epoch": 2869} {"train_loss": -42.571533203125, "global_step": 347261, "epoch": 2869} {"train_loss": -44.614158630371094, "global_step": 347262, "epoch": 2869} {"train_loss": -44.03310012817383, "global_step": 347263, "epoch": 2869} {"train_loss": -44.062984466552734, "global_step": 347264, "epoch": 2869} {"train_loss": -42.79148483276367, "global_step": 347265, "epoch": 2869} {"train_loss": -45.11329650878906, "global_step": 347266, "epoch": 2869} {"train_loss": -44.21206283569336, "global_step": 347267, "epoch": 2869} {"train_loss": -43.57606887817383, "global_step": 347268, "epoch": 2869} {"train_loss": -42.37197913808271, "global_step": 347269, "epoch": 2869, "val_loss": 2436358.0} {"train_loss": -43.593318939208984, "global_step": 347270, "epoch": 2870} {"train_loss": -45.02058029174805, "global_step": 347271, "epoch": 2870} {"train_loss": -44.340362548828125, "global_step": 347272, "epoch": 2870} {"train_loss": -43.68935775756836, "global_step": 347273, "epoch": 2870} {"train_loss": -44.099430084228516, "global_step": 347274, "epoch": 2870} {"train_loss": -44.79615020751953, "global_step": 347275, "epoch": 2870} {"train_loss": -44.68709945678711, "global_step": 347276, "epoch": 2870} {"train_loss": -44.30540084838867, "global_step": 347277, "epoch": 2870} {"train_loss": -43.723331451416016, "global_step": 347278, "epoch": 2870} {"train_loss": -44.460140228271484, "global_step": 347279, "epoch": 2870} {"train_loss": -44.40424728393555, "global_step": 347280, "epoch": 2870} {"train_loss": -44.89859390258789, "global_step": 347281, "epoch": 2870} {"train_loss": -44.621437072753906, "global_step": 347282, "epoch": 2870} {"train_loss": -44.99078369140625, "global_step": 347283, "epoch": 2870} {"train_loss": -45.479469299316406, "global_step": 347284, "epoch": 2870} {"train_loss": -44.87124252319336, "global_step": 347285, "epoch": 2870} {"train_loss": -45.394893646240234, "global_step": 347286, "epoch": 2870} {"train_loss": -44.08454513549805, "global_step": 347287, "epoch": 2870} {"train_loss": -44.026180267333984, "global_step": 347288, "epoch": 2870} {"train_loss": -44.56591796875, "global_step": 347289, "epoch": 2870} {"train_loss": -45.550994873046875, "global_step": 347290, "epoch": 2870} {"train_loss": -44.896820068359375, "global_step": 347291, "epoch": 2870} {"train_loss": -44.47446823120117, "global_step": 347292, "epoch": 2870} {"train_loss": -43.4398078918457, "global_step": 347293, "epoch": 2870} {"train_loss": -43.63035202026367, "global_step": 347294, "epoch": 2870} {"train_loss": -43.25104904174805, "global_step": 347295, "epoch": 2870} {"train_loss": -42.66608810424805, "global_step": 347296, "epoch": 2870} {"train_loss": -43.5735969543457, "global_step": 347297, "epoch": 2870} {"train_loss": -44.8946647644043, "global_step": 347298, "epoch": 2870} {"train_loss": -44.456809997558594, "global_step": 347299, "epoch": 2870} {"train_loss": -41.48518371582031, "global_step": 347300, "epoch": 2870} {"train_loss": -42.2447509765625, "global_step": 347301, "epoch": 2870} {"train_loss": -30.411462783813477, "global_step": 347302, "epoch": 2870} {"train_loss": -33.138153076171875, "global_step": 347303, "epoch": 2870} {"train_loss": -28.068389892578125, "global_step": 347304, "epoch": 2870} {"train_loss": -38.887916564941406, "global_step": 347305, "epoch": 2870} {"train_loss": -32.56650924682617, "global_step": 347306, "epoch": 2870} {"train_loss": -27.9614200592041, "global_step": 347307, "epoch": 2870} {"train_loss": -36.535247802734375, "global_step": 347308, "epoch": 2870} {"train_loss": -35.76910400390625, "global_step": 347309, "epoch": 2870} {"train_loss": -36.4721794128418, "global_step": 347310, "epoch": 2870} {"train_loss": -39.97455978393555, "global_step": 347311, "epoch": 2870} {"train_loss": -37.8592529296875, "global_step": 347312, "epoch": 2870} {"train_loss": -38.41884994506836, "global_step": 347313, "epoch": 2870} {"train_loss": -39.66191101074219, "global_step": 347314, "epoch": 2870} {"train_loss": -37.35261154174805, "global_step": 347315, "epoch": 2870} {"train_loss": -34.801239013671875, "global_step": 347316, "epoch": 2870} {"train_loss": -32.23332595825195, "global_step": 347317, "epoch": 2870} {"train_loss": -35.80495834350586, "global_step": 347318, "epoch": 2870} {"train_loss": -37.60244369506836, "global_step": 347319, "epoch": 2870} {"train_loss": -39.21104049682617, "global_step": 347320, "epoch": 2870} {"train_loss": -36.762020111083984, "global_step": 347321, "epoch": 2870} {"train_loss": -37.72906494140625, "global_step": 347322, "epoch": 2870} {"train_loss": -32.916748046875, "global_step": 347323, "epoch": 2870} {"train_loss": -36.270263671875, "global_step": 347324, "epoch": 2870} {"train_loss": -40.302955627441406, "global_step": 347325, "epoch": 2870} {"train_loss": -37.57988357543945, "global_step": 347326, "epoch": 2870} {"train_loss": -38.5734748840332, "global_step": 347327, "epoch": 2870} {"train_loss": -40.134727478027344, "global_step": 347328, "epoch": 2870} {"train_loss": -39.943519592285156, "global_step": 347329, "epoch": 2870} {"train_loss": -41.08754348754883, "global_step": 347330, "epoch": 2870} {"train_loss": -40.337738037109375, "global_step": 347331, "epoch": 2870} {"train_loss": -39.705604553222656, "global_step": 347332, "epoch": 2870} {"train_loss": -40.25619125366211, "global_step": 347333, "epoch": 2870} {"train_loss": -40.144649505615234, "global_step": 347334, "epoch": 2870} {"train_loss": -40.334815979003906, "global_step": 347335, "epoch": 2870} {"train_loss": -39.82328796386719, "global_step": 347336, "epoch": 2870} {"train_loss": -40.223384857177734, "global_step": 347337, "epoch": 2870} {"train_loss": -41.63197708129883, "global_step": 347338, "epoch": 2870} {"train_loss": -40.76166915893555, "global_step": 347339, "epoch": 2870} {"train_loss": -41.60398483276367, "global_step": 347340, "epoch": 2870} {"train_loss": -39.911376953125, "global_step": 347341, "epoch": 2870} {"train_loss": -42.12124252319336, "global_step": 347342, "epoch": 2870} {"train_loss": -38.0761833190918, "global_step": 347343, "epoch": 2870} {"train_loss": -40.550025939941406, "global_step": 347344, "epoch": 2870} {"train_loss": -41.7159538269043, "global_step": 347345, "epoch": 2870} {"train_loss": -40.24551010131836, "global_step": 347346, "epoch": 2870} {"train_loss": -40.26327133178711, "global_step": 347347, "epoch": 2870} {"train_loss": -39.07826614379883, "global_step": 347348, "epoch": 2870} {"train_loss": -40.4467887878418, "global_step": 347349, "epoch": 2870} {"train_loss": -41.29780197143555, "global_step": 347350, "epoch": 2870} {"train_loss": -41.1990966796875, "global_step": 347351, "epoch": 2870} {"train_loss": -41.3082389831543, "global_step": 347352, "epoch": 2870} {"train_loss": -42.361690521240234, "global_step": 347353, "epoch": 2870} {"train_loss": -42.3531608581543, "global_step": 347354, "epoch": 2870} {"train_loss": -41.72500991821289, "global_step": 347355, "epoch": 2870} {"train_loss": -42.47233200073242, "global_step": 347356, "epoch": 2870} {"train_loss": -42.972434997558594, "global_step": 347357, "epoch": 2870} {"train_loss": -41.83554458618164, "global_step": 347358, "epoch": 2870} {"train_loss": -42.913482666015625, "global_step": 347359, "epoch": 2870} {"train_loss": -42.28739547729492, "global_step": 347360, "epoch": 2870} {"train_loss": -43.03278350830078, "global_step": 347361, "epoch": 2870} {"train_loss": -41.18449020385742, "global_step": 347362, "epoch": 2870} {"train_loss": -42.21510696411133, "global_step": 347363, "epoch": 2870} {"train_loss": -41.278621673583984, "global_step": 347364, "epoch": 2870} {"train_loss": -42.387142181396484, "global_step": 347365, "epoch": 2870} {"train_loss": -42.48451614379883, "global_step": 347366, "epoch": 2870} {"train_loss": -43.03365707397461, "global_step": 347367, "epoch": 2870} {"train_loss": -42.20457077026367, "global_step": 347368, "epoch": 2870} {"train_loss": -43.08198928833008, "global_step": 347369, "epoch": 2870} {"train_loss": -43.11599349975586, "global_step": 347370, "epoch": 2870} {"train_loss": -42.639015197753906, "global_step": 347371, "epoch": 2870} {"train_loss": -42.940914154052734, "global_step": 347372, "epoch": 2870} {"train_loss": -41.30086135864258, "global_step": 347373, "epoch": 2870} {"train_loss": -41.99481964111328, "global_step": 347374, "epoch": 2870} {"train_loss": -41.21409606933594, "global_step": 347375, "epoch": 2870} {"train_loss": -41.6033821105957, "global_step": 347376, "epoch": 2870} {"train_loss": -41.815425872802734, "global_step": 347377, "epoch": 2870} {"train_loss": -39.397193908691406, "global_step": 347378, "epoch": 2870} {"train_loss": -42.88765335083008, "global_step": 347379, "epoch": 2870} {"train_loss": -42.07044219970703, "global_step": 347380, "epoch": 2870} {"train_loss": -41.867408752441406, "global_step": 347381, "epoch": 2870} {"train_loss": -42.80948257446289, "global_step": 347382, "epoch": 2870} {"train_loss": -40.52656555175781, "global_step": 347383, "epoch": 2870} {"train_loss": -43.092498779296875, "global_step": 347384, "epoch": 2870} {"train_loss": -43.452510833740234, "global_step": 347385, "epoch": 2870} {"train_loss": -42.56570053100586, "global_step": 347386, "epoch": 2870} {"train_loss": -43.40098571777344, "global_step": 347387, "epoch": 2870} {"train_loss": -41.01957321166992, "global_step": 347388, "epoch": 2870} {"train_loss": -43.15031814575195, "global_step": 347389, "epoch": 2870} {"train_loss": -41.030856550232436, "global_step": 347390, "epoch": 2870, "val_loss": 2585138.75} {"train_loss": -42.322933197021484, "global_step": 347391, "epoch": 2871} {"train_loss": -41.60493850708008, "global_step": 347392, "epoch": 2871} {"train_loss": -40.174781799316406, "global_step": 347393, "epoch": 2871} {"train_loss": -43.57093048095703, "global_step": 347394, "epoch": 2871} {"train_loss": -42.4771842956543, "global_step": 347395, "epoch": 2871} {"train_loss": -41.80817794799805, "global_step": 347396, "epoch": 2871} {"train_loss": -42.72140884399414, "global_step": 347397, "epoch": 2871} {"train_loss": -41.20390701293945, "global_step": 347398, "epoch": 2871} {"train_loss": -42.72888946533203, "global_step": 347399, "epoch": 2871} {"train_loss": -42.615474700927734, "global_step": 347400, "epoch": 2871} {"train_loss": -41.191505432128906, "global_step": 347401, "epoch": 2871} {"train_loss": -42.53091049194336, "global_step": 347402, "epoch": 2871} {"train_loss": -42.81121826171875, "global_step": 347403, "epoch": 2871} {"train_loss": -42.52351760864258, "global_step": 347404, "epoch": 2871} {"train_loss": -43.60478591918945, "global_step": 347405, "epoch": 2871} {"train_loss": -43.36750411987305, "global_step": 347406, "epoch": 2871} {"train_loss": -43.201107025146484, "global_step": 347407, "epoch": 2871} {"train_loss": -42.21773147583008, "global_step": 347408, "epoch": 2871} {"train_loss": -42.5927734375, "global_step": 347409, "epoch": 2871} {"train_loss": -43.10538864135742, "global_step": 347410, "epoch": 2871} {"train_loss": -43.69862747192383, "global_step": 347411, "epoch": 2871} {"train_loss": -43.18550109863281, "global_step": 347412, "epoch": 2871} {"train_loss": -42.788238525390625, "global_step": 347413, "epoch": 2871} {"train_loss": -43.9489631652832, "global_step": 347414, "epoch": 2871} {"train_loss": -43.218929290771484, "global_step": 347415, "epoch": 2871} {"train_loss": -42.47847366333008, "global_step": 347416, "epoch": 2871} {"train_loss": -43.16240692138672, "global_step": 347417, "epoch": 2871} {"train_loss": -43.13715362548828, "global_step": 347418, "epoch": 2871} {"train_loss": -43.446861267089844, "global_step": 347419, "epoch": 2871} {"train_loss": -42.66402816772461, "global_step": 347420, "epoch": 2871} {"train_loss": -43.04837417602539, "global_step": 347421, "epoch": 2871} {"train_loss": -43.556495666503906, "global_step": 347422, "epoch": 2871} {"train_loss": -43.7675666809082, "global_step": 347423, "epoch": 2871} {"train_loss": -43.397151947021484, "global_step": 347424, "epoch": 2871} {"train_loss": -43.76808547973633, "global_step": 347425, "epoch": 2871} {"train_loss": -43.84186553955078, "global_step": 347426, "epoch": 2871} {"train_loss": -44.122623443603516, "global_step": 347427, "epoch": 2871} {"train_loss": -43.385414123535156, "global_step": 347428, "epoch": 2871} {"train_loss": -43.906436920166016, "global_step": 347429, "epoch": 2871} {"train_loss": -44.04372787475586, "global_step": 347430, "epoch": 2871} {"train_loss": -43.80965805053711, "global_step": 347431, "epoch": 2871} {"train_loss": -43.620155334472656, "global_step": 347432, "epoch": 2871} {"train_loss": -43.99251937866211, "global_step": 347433, "epoch": 2871} {"train_loss": -44.416664123535156, "global_step": 347434, "epoch": 2871} {"train_loss": -44.03895950317383, "global_step": 347435, "epoch": 2871} {"train_loss": -43.703182220458984, "global_step": 347436, "epoch": 2871} {"train_loss": -44.17572021484375, "global_step": 347437, "epoch": 2871} {"train_loss": -44.252479553222656, "global_step": 347438, "epoch": 2871} {"train_loss": -43.69804763793945, "global_step": 347439, "epoch": 2871} {"train_loss": -44.134639739990234, "global_step": 347440, "epoch": 2871} {"train_loss": -44.28530502319336, "global_step": 347441, "epoch": 2871} {"train_loss": -44.31282424926758, "global_step": 347442, "epoch": 2871} {"train_loss": -44.113643646240234, "global_step": 347443, "epoch": 2871} {"train_loss": -44.32722473144531, "global_step": 347444, "epoch": 2871} {"train_loss": -44.76612854003906, "global_step": 347445, "epoch": 2871} {"train_loss": -44.77437973022461, "global_step": 347446, "epoch": 2871} {"train_loss": -44.983253479003906, "global_step": 347447, "epoch": 2871} {"train_loss": -44.15877151489258, "global_step": 347448, "epoch": 2871} {"train_loss": -44.78045654296875, "global_step": 347449, "epoch": 2871} {"train_loss": -44.75718307495117, "global_step": 347450, "epoch": 2871} {"train_loss": -45.035377502441406, "global_step": 347451, "epoch": 2871} {"train_loss": -45.23419189453125, "global_step": 347452, "epoch": 2871} {"train_loss": -44.70574951171875, "global_step": 347453, "epoch": 2871} {"train_loss": -45.1338005065918, "global_step": 347454, "epoch": 2871} {"train_loss": -44.37847137451172, "global_step": 347455, "epoch": 2871} {"train_loss": -45.176727294921875, "global_step": 347456, "epoch": 2871} {"train_loss": -45.09164810180664, "global_step": 347457, "epoch": 2871} {"train_loss": -45.157833099365234, "global_step": 347458, "epoch": 2871} {"train_loss": -45.07255172729492, "global_step": 347459, "epoch": 2871} {"train_loss": -45.25913619995117, "global_step": 347460, "epoch": 2871} {"train_loss": -44.89506530761719, "global_step": 347461, "epoch": 2871} {"train_loss": -45.014686584472656, "global_step": 347462, "epoch": 2871} {"train_loss": -44.58344650268555, "global_step": 347463, "epoch": 2871} {"train_loss": -45.043087005615234, "global_step": 347464, "epoch": 2871} {"train_loss": -45.22825241088867, "global_step": 347465, "epoch": 2871} {"train_loss": -44.84920120239258, "global_step": 347466, "epoch": 2871} {"train_loss": -44.9763298034668, "global_step": 347467, "epoch": 2871} {"train_loss": -45.2891960144043, "global_step": 347468, "epoch": 2871} {"train_loss": -45.649513244628906, "global_step": 347469, "epoch": 2871} {"train_loss": -45.03498458862305, "global_step": 347470, "epoch": 2871} {"train_loss": -45.28276062011719, "global_step": 347471, "epoch": 2871} {"train_loss": -45.34414291381836, "global_step": 347472, "epoch": 2871} {"train_loss": -45.080848693847656, "global_step": 347473, "epoch": 2871} {"train_loss": -44.82933807373047, "global_step": 347474, "epoch": 2871} {"train_loss": -45.669776916503906, "global_step": 347475, "epoch": 2871} {"train_loss": -45.02527618408203, "global_step": 347476, "epoch": 2871} {"train_loss": -45.46445846557617, "global_step": 347477, "epoch": 2871} {"train_loss": -45.2077522277832, "global_step": 347478, "epoch": 2871} {"train_loss": -45.248897552490234, "global_step": 347479, "epoch": 2871} {"train_loss": -45.443843841552734, "global_step": 347480, "epoch": 2871} {"train_loss": -44.4939079284668, "global_step": 347481, "epoch": 2871} {"train_loss": -45.236854553222656, "global_step": 347482, "epoch": 2871} {"train_loss": -44.939693450927734, "global_step": 347483, "epoch": 2871} {"train_loss": -44.599945068359375, "global_step": 347484, "epoch": 2871} {"train_loss": -45.24634552001953, "global_step": 347485, "epoch": 2871} {"train_loss": -45.40269088745117, "global_step": 347486, "epoch": 2871} {"train_loss": -45.25817108154297, "global_step": 347487, "epoch": 2871} {"train_loss": -45.890132904052734, "global_step": 347488, "epoch": 2871} {"train_loss": -45.10167694091797, "global_step": 347489, "epoch": 2871} {"train_loss": -45.10737228393555, "global_step": 347490, "epoch": 2871} {"train_loss": -45.40666198730469, "global_step": 347491, "epoch": 2871} {"train_loss": -45.85271453857422, "global_step": 347492, "epoch": 2871} {"train_loss": -45.54256057739258, "global_step": 347493, "epoch": 2871} {"train_loss": -45.2230110168457, "global_step": 347494, "epoch": 2871} {"train_loss": -45.37257385253906, "global_step": 347495, "epoch": 2871} {"train_loss": -45.5314826965332, "global_step": 347496, "epoch": 2871} {"train_loss": -45.575843811035156, "global_step": 347497, "epoch": 2871} {"train_loss": -45.179115295410156, "global_step": 347498, "epoch": 2871} {"train_loss": -45.633548736572266, "global_step": 347499, "epoch": 2871} {"train_loss": -45.59672927856445, "global_step": 347500, "epoch": 2871} {"train_loss": -45.20329666137695, "global_step": 347501, "epoch": 2871} {"train_loss": -45.547882080078125, "global_step": 347502, "epoch": 2871} {"train_loss": -44.94560623168945, "global_step": 347503, "epoch": 2871} {"train_loss": -45.64213943481445, "global_step": 347504, "epoch": 2871} {"train_loss": -44.999202728271484, "global_step": 347505, "epoch": 2871} {"train_loss": -44.680397033691406, "global_step": 347506, "epoch": 2871} {"train_loss": -44.95576858520508, "global_step": 347507, "epoch": 2871} {"train_loss": -44.58413314819336, "global_step": 347508, "epoch": 2871} {"train_loss": -42.48787307739258, "global_step": 347509, "epoch": 2871} {"train_loss": -41.08187484741211, "global_step": 347510, "epoch": 2871} {"train_loss": -44.175110210071914, "global_step": 347511, "epoch": 2871, "val_loss": 2598283.25} {"train_loss": -43.98438262939453, "global_step": 347512, "epoch": 2872} {"train_loss": -44.695068359375, "global_step": 347513, "epoch": 2872} {"train_loss": -42.944759368896484, "global_step": 347514, "epoch": 2872} {"train_loss": -43.00575256347656, "global_step": 347515, "epoch": 2872} {"train_loss": -43.450862884521484, "global_step": 347516, "epoch": 2872} {"train_loss": -44.28763961791992, "global_step": 347517, "epoch": 2872} {"train_loss": -40.032657623291016, "global_step": 347518, "epoch": 2872} {"train_loss": -42.79449462890625, "global_step": 347519, "epoch": 2872} {"train_loss": -41.4350700378418, "global_step": 347520, "epoch": 2872} {"train_loss": -41.09364700317383, "global_step": 347521, "epoch": 2872} {"train_loss": -44.0796012878418, "global_step": 347522, "epoch": 2872} {"train_loss": -38.22651290893555, "global_step": 347523, "epoch": 2872} {"train_loss": -43.34969711303711, "global_step": 347524, "epoch": 2872} {"train_loss": -37.488155364990234, "global_step": 347525, "epoch": 2872} {"train_loss": -37.59972381591797, "global_step": 347526, "epoch": 2872} {"train_loss": -39.289947509765625, "global_step": 347527, "epoch": 2872} {"train_loss": -41.5416374206543, "global_step": 347528, "epoch": 2872} {"train_loss": -38.75726318359375, "global_step": 347529, "epoch": 2872} {"train_loss": -42.4510498046875, "global_step": 347530, "epoch": 2872} {"train_loss": -39.8424072265625, "global_step": 347531, "epoch": 2872} {"train_loss": -42.876922607421875, "global_step": 347532, "epoch": 2872} {"train_loss": -41.8112907409668, "global_step": 347533, "epoch": 2872} {"train_loss": -41.70847702026367, "global_step": 347534, "epoch": 2872} {"train_loss": -42.004798889160156, "global_step": 347535, "epoch": 2872} {"train_loss": -42.15570831298828, "global_step": 347536, "epoch": 2872} {"train_loss": -42.27191162109375, "global_step": 347537, "epoch": 2872} {"train_loss": -42.60081100463867, "global_step": 347538, "epoch": 2872} {"train_loss": -43.7224235534668, "global_step": 347539, "epoch": 2872} {"train_loss": -42.2780876159668, "global_step": 347540, "epoch": 2872} {"train_loss": -43.5570068359375, "global_step": 347541, "epoch": 2872} {"train_loss": -43.36155319213867, "global_step": 347542, "epoch": 2872} {"train_loss": -42.54327392578125, "global_step": 347543, "epoch": 2872} {"train_loss": -43.71914291381836, "global_step": 347544, "epoch": 2872} {"train_loss": -42.63991165161133, "global_step": 347545, "epoch": 2872} {"train_loss": -43.99052429199219, "global_step": 347546, "epoch": 2872} {"train_loss": -42.7187385559082, "global_step": 347547, "epoch": 2872} {"train_loss": -44.105255126953125, "global_step": 347548, "epoch": 2872} {"train_loss": -43.35615921020508, "global_step": 347549, "epoch": 2872} {"train_loss": -43.6692008972168, "global_step": 347550, "epoch": 2872} {"train_loss": -43.012664794921875, "global_step": 347551, "epoch": 2872} {"train_loss": -42.67987823486328, "global_step": 347552, "epoch": 2872} {"train_loss": -43.9503059387207, "global_step": 347553, "epoch": 2872} {"train_loss": -43.70988082885742, "global_step": 347554, "epoch": 2872} {"train_loss": -44.259403228759766, "global_step": 347555, "epoch": 2872} {"train_loss": -43.00614547729492, "global_step": 347556, "epoch": 2872} {"train_loss": -43.374088287353516, "global_step": 347557, "epoch": 2872} {"train_loss": -44.112911224365234, "global_step": 347558, "epoch": 2872} {"train_loss": -43.14815902709961, "global_step": 347559, "epoch": 2872} {"train_loss": -43.76590347290039, "global_step": 347560, "epoch": 2872} {"train_loss": -44.11488342285156, "global_step": 347561, "epoch": 2872} {"train_loss": -43.59696578979492, "global_step": 347562, "epoch": 2872} {"train_loss": -44.18425369262695, "global_step": 347563, "epoch": 2872} {"train_loss": -44.553741455078125, "global_step": 347564, "epoch": 2872} {"train_loss": -43.732582092285156, "global_step": 347565, "epoch": 2872} {"train_loss": -44.130252838134766, "global_step": 347566, "epoch": 2872} {"train_loss": -44.55556106567383, "global_step": 347567, "epoch": 2872} {"train_loss": -44.06645965576172, "global_step": 347568, "epoch": 2872} {"train_loss": -44.270084381103516, "global_step": 347569, "epoch": 2872} {"train_loss": -45.21471405029297, "global_step": 347570, "epoch": 2872} {"train_loss": -44.51971435546875, "global_step": 347571, "epoch": 2872} {"train_loss": -44.25413513183594, "global_step": 347572, "epoch": 2872} {"train_loss": -45.12235641479492, "global_step": 347573, "epoch": 2872} {"train_loss": -44.58724594116211, "global_step": 347574, "epoch": 2872} {"train_loss": -44.902156829833984, "global_step": 347575, "epoch": 2872} {"train_loss": -44.89887619018555, "global_step": 347576, "epoch": 2872} {"train_loss": -44.91315841674805, "global_step": 347577, "epoch": 2872} {"train_loss": -44.662925720214844, "global_step": 347578, "epoch": 2872} {"train_loss": -45.297607421875, "global_step": 347579, "epoch": 2872} {"train_loss": -45.213111877441406, "global_step": 347580, "epoch": 2872} {"train_loss": -45.22001647949219, "global_step": 347581, "epoch": 2872} {"train_loss": -45.184017181396484, "global_step": 347582, "epoch": 2872} {"train_loss": -44.55361557006836, "global_step": 347583, "epoch": 2872} {"train_loss": -45.27667999267578, "global_step": 347584, "epoch": 2872} {"train_loss": -44.9902229309082, "global_step": 347585, "epoch": 2872} {"train_loss": -45.14432144165039, "global_step": 347586, "epoch": 2872} {"train_loss": -45.00373840332031, "global_step": 347587, "epoch": 2872} {"train_loss": -45.704864501953125, "global_step": 347588, "epoch": 2872} {"train_loss": -45.67008972167969, "global_step": 347589, "epoch": 2872} {"train_loss": -45.14336013793945, "global_step": 347590, "epoch": 2872} {"train_loss": -44.77565383911133, "global_step": 347591, "epoch": 2872} {"train_loss": -45.633148193359375, "global_step": 347592, "epoch": 2872} {"train_loss": -44.85746383666992, "global_step": 347593, "epoch": 2872} {"train_loss": -43.88254928588867, "global_step": 347594, "epoch": 2872} {"train_loss": -45.31644821166992, "global_step": 347595, "epoch": 2872} {"train_loss": -45.37730026245117, "global_step": 347596, "epoch": 2872} {"train_loss": -44.436500549316406, "global_step": 347597, "epoch": 2872} {"train_loss": -44.3736572265625, "global_step": 347598, "epoch": 2872} {"train_loss": -45.01739501953125, "global_step": 347599, "epoch": 2872} {"train_loss": -45.3205451965332, "global_step": 347600, "epoch": 2872} {"train_loss": -44.83396911621094, "global_step": 347601, "epoch": 2872} {"train_loss": -44.0971565246582, "global_step": 347602, "epoch": 2872} {"train_loss": -44.28692626953125, "global_step": 347603, "epoch": 2872} {"train_loss": -44.83774948120117, "global_step": 347604, "epoch": 2872} {"train_loss": -43.327613830566406, "global_step": 347605, "epoch": 2872} {"train_loss": -42.54413986206055, "global_step": 347606, "epoch": 2872} {"train_loss": -44.494712829589844, "global_step": 347607, "epoch": 2872} {"train_loss": -44.550071716308594, "global_step": 347608, "epoch": 2872} {"train_loss": -42.26484680175781, "global_step": 347609, "epoch": 2872} {"train_loss": -44.940975189208984, "global_step": 347610, "epoch": 2872} {"train_loss": -44.7070198059082, "global_step": 347611, "epoch": 2872} {"train_loss": -45.03778076171875, "global_step": 347612, "epoch": 2872} {"train_loss": -44.68193435668945, "global_step": 347613, "epoch": 2872} {"train_loss": -44.47887420654297, "global_step": 347614, "epoch": 2872} {"train_loss": -44.02064514160156, "global_step": 347615, "epoch": 2872} {"train_loss": -45.06276321411133, "global_step": 347616, "epoch": 2872} {"train_loss": -44.9422607421875, "global_step": 347617, "epoch": 2872} {"train_loss": -44.6546745300293, "global_step": 347618, "epoch": 2872} {"train_loss": -45.18189239501953, "global_step": 347619, "epoch": 2872} {"train_loss": -45.07525634765625, "global_step": 347620, "epoch": 2872} {"train_loss": -45.42924499511719, "global_step": 347621, "epoch": 2872} {"train_loss": -45.00455093383789, "global_step": 347622, "epoch": 2872} {"train_loss": -44.740928649902344, "global_step": 347623, "epoch": 2872} {"train_loss": -43.83906173706055, "global_step": 347624, "epoch": 2872} {"train_loss": -44.710697174072266, "global_step": 347625, "epoch": 2872} {"train_loss": -45.84855270385742, "global_step": 347626, "epoch": 2872} {"train_loss": -44.76335525512695, "global_step": 347627, "epoch": 2872} {"train_loss": -43.32931900024414, "global_step": 347628, "epoch": 2872} {"train_loss": -43.9796028137207, "global_step": 347629, "epoch": 2872} {"train_loss": -45.15876388549805, "global_step": 347630, "epoch": 2872} {"train_loss": -44.429412841796875, "global_step": 347631, "epoch": 2872} {"train_loss": -43.75595121147219, "global_step": 347632, "epoch": 2872, "val_loss": 2637055.25} {"train_loss": -44.082008361816406, "global_step": 347633, "epoch": 2873} {"train_loss": -44.44782257080078, "global_step": 347634, "epoch": 2873} {"train_loss": -43.84174728393555, "global_step": 347635, "epoch": 2873} {"train_loss": -43.54539108276367, "global_step": 347636, "epoch": 2873} {"train_loss": -43.692176818847656, "global_step": 347637, "epoch": 2873} {"train_loss": -43.922943115234375, "global_step": 347638, "epoch": 2873} {"train_loss": -44.0286979675293, "global_step": 347639, "epoch": 2873} {"train_loss": -44.1381950378418, "global_step": 347640, "epoch": 2873} {"train_loss": -43.53388595581055, "global_step": 347641, "epoch": 2873} {"train_loss": -44.483299255371094, "global_step": 347642, "epoch": 2873} {"train_loss": -43.20319366455078, "global_step": 347643, "epoch": 2873} {"train_loss": -42.2612419128418, "global_step": 347644, "epoch": 2873} {"train_loss": -44.087955474853516, "global_step": 347645, "epoch": 2873} {"train_loss": -43.43110656738281, "global_step": 347646, "epoch": 2873} {"train_loss": -43.57273483276367, "global_step": 347647, "epoch": 2873} {"train_loss": -43.481910705566406, "global_step": 347648, "epoch": 2873} {"train_loss": -44.47682189941406, "global_step": 347649, "epoch": 2873} {"train_loss": -44.69013595581055, "global_step": 347650, "epoch": 2873} {"train_loss": -44.090633392333984, "global_step": 347651, "epoch": 2873} {"train_loss": -44.076560974121094, "global_step": 347652, "epoch": 2873} {"train_loss": -44.5877799987793, "global_step": 347653, "epoch": 2873} {"train_loss": -43.97628402709961, "global_step": 347654, "epoch": 2873} {"train_loss": -43.752864837646484, "global_step": 347655, "epoch": 2873} {"train_loss": -44.44181442260742, "global_step": 347656, "epoch": 2873} {"train_loss": -43.941978454589844, "global_step": 347657, "epoch": 2873} {"train_loss": -43.96522521972656, "global_step": 347658, "epoch": 2873} {"train_loss": -44.51239776611328, "global_step": 347659, "epoch": 2873} {"train_loss": -44.41265869140625, "global_step": 347660, "epoch": 2873} {"train_loss": -44.361915588378906, "global_step": 347661, "epoch": 2873} {"train_loss": -44.51378631591797, "global_step": 347662, "epoch": 2873} {"train_loss": -44.662086486816406, "global_step": 347663, "epoch": 2873} {"train_loss": -45.10301971435547, "global_step": 347664, "epoch": 2873} {"train_loss": -44.57615661621094, "global_step": 347665, "epoch": 2873} {"train_loss": -45.409175872802734, "global_step": 347666, "epoch": 2873} {"train_loss": -44.479000091552734, "global_step": 347667, "epoch": 2873} {"train_loss": -44.752838134765625, "global_step": 347668, "epoch": 2873} {"train_loss": -44.93819808959961, "global_step": 347669, "epoch": 2873} {"train_loss": -45.059959411621094, "global_step": 347670, "epoch": 2873} {"train_loss": -44.206207275390625, "global_step": 347671, "epoch": 2873} {"train_loss": -45.05064010620117, "global_step": 347672, "epoch": 2873} {"train_loss": -45.23037338256836, "global_step": 347673, "epoch": 2873} {"train_loss": -44.085899353027344, "global_step": 347674, "epoch": 2873} {"train_loss": -44.70637512207031, "global_step": 347675, "epoch": 2873} {"train_loss": -45.0495719909668, "global_step": 347676, "epoch": 2873} {"train_loss": -43.971656799316406, "global_step": 347677, "epoch": 2873} {"train_loss": -44.46055603027344, "global_step": 347678, "epoch": 2873} {"train_loss": -43.29011154174805, "global_step": 347679, "epoch": 2873} {"train_loss": -45.08443832397461, "global_step": 347680, "epoch": 2873} {"train_loss": -44.560420989990234, "global_step": 347681, "epoch": 2873} {"train_loss": -43.282012939453125, "global_step": 347682, "epoch": 2873} {"train_loss": -45.472503662109375, "global_step": 347683, "epoch": 2873} {"train_loss": -43.994728088378906, "global_step": 347684, "epoch": 2873} {"train_loss": -45.15180206298828, "global_step": 347685, "epoch": 2873} {"train_loss": -44.82363510131836, "global_step": 347686, "epoch": 2873} {"train_loss": -44.353126525878906, "global_step": 347687, "epoch": 2873} {"train_loss": -45.67523956298828, "global_step": 347688, "epoch": 2873} {"train_loss": -44.88239669799805, "global_step": 347689, "epoch": 2873} {"train_loss": -45.30195617675781, "global_step": 347690, "epoch": 2873} {"train_loss": -45.08970260620117, "global_step": 347691, "epoch": 2873} {"train_loss": -44.47117233276367, "global_step": 347692, "epoch": 2873} {"train_loss": -45.67594528198242, "global_step": 347693, "epoch": 2873} {"train_loss": -45.373165130615234, "global_step": 347694, "epoch": 2873} {"train_loss": -45.02500915527344, "global_step": 347695, "epoch": 2873} {"train_loss": -45.39039993286133, "global_step": 347696, "epoch": 2873} {"train_loss": -45.281349182128906, "global_step": 347697, "epoch": 2873} {"train_loss": -45.04994201660156, "global_step": 347698, "epoch": 2873} {"train_loss": -45.556026458740234, "global_step": 347699, "epoch": 2873} {"train_loss": -45.10940170288086, "global_step": 347700, "epoch": 2873} {"train_loss": -44.41518783569336, "global_step": 347701, "epoch": 2873} {"train_loss": -45.297969818115234, "global_step": 347702, "epoch": 2873} {"train_loss": -44.99103927612305, "global_step": 347703, "epoch": 2873} {"train_loss": -43.4323616027832, "global_step": 347704, "epoch": 2873} {"train_loss": -44.48856735229492, "global_step": 347705, "epoch": 2873} {"train_loss": -45.34762954711914, "global_step": 347706, "epoch": 2873} {"train_loss": -44.22811508178711, "global_step": 347707, "epoch": 2873} {"train_loss": -43.14678955078125, "global_step": 347708, "epoch": 2873} {"train_loss": -42.61008071899414, "global_step": 347709, "epoch": 2873} {"train_loss": -44.50065231323242, "global_step": 347710, "epoch": 2873} {"train_loss": -42.28538131713867, "global_step": 347711, "epoch": 2873} {"train_loss": -42.73267364501953, "global_step": 347712, "epoch": 2873} {"train_loss": -44.54841995239258, "global_step": 347713, "epoch": 2873} {"train_loss": -41.604454040527344, "global_step": 347714, "epoch": 2873} {"train_loss": -41.592586517333984, "global_step": 347715, "epoch": 2873} {"train_loss": -44.28740692138672, "global_step": 347716, "epoch": 2873} {"train_loss": -43.69984436035156, "global_step": 347717, "epoch": 2873} {"train_loss": -42.56280517578125, "global_step": 347718, "epoch": 2873} {"train_loss": -45.5534553527832, "global_step": 347719, "epoch": 2873} {"train_loss": -43.648048400878906, "global_step": 347720, "epoch": 2873} {"train_loss": -44.283687591552734, "global_step": 347721, "epoch": 2873} {"train_loss": -44.68944549560547, "global_step": 347722, "epoch": 2873} {"train_loss": -44.59061813354492, "global_step": 347723, "epoch": 2873} {"train_loss": -44.64535140991211, "global_step": 347724, "epoch": 2873} {"train_loss": -45.5073356628418, "global_step": 347725, "epoch": 2873} {"train_loss": -45.19061279296875, "global_step": 347726, "epoch": 2873} {"train_loss": -44.69717025756836, "global_step": 347727, "epoch": 2873} {"train_loss": -45.463356018066406, "global_step": 347728, "epoch": 2873} {"train_loss": -45.22056579589844, "global_step": 347729, "epoch": 2873} {"train_loss": -44.50956344604492, "global_step": 347730, "epoch": 2873} {"train_loss": -45.26930236816406, "global_step": 347731, "epoch": 2873} {"train_loss": -44.562095642089844, "global_step": 347732, "epoch": 2873} {"train_loss": -45.999629974365234, "global_step": 347733, "epoch": 2873} {"train_loss": -45.13421630859375, "global_step": 347734, "epoch": 2873} {"train_loss": -44.33057403564453, "global_step": 347735, "epoch": 2873} {"train_loss": -44.603694915771484, "global_step": 347736, "epoch": 2873} {"train_loss": -45.03776168823242, "global_step": 347737, "epoch": 2873} {"train_loss": -43.754058837890625, "global_step": 347738, "epoch": 2873} {"train_loss": -44.75175094604492, "global_step": 347739, "epoch": 2873} {"train_loss": -45.13045120239258, "global_step": 347740, "epoch": 2873} {"train_loss": -44.2515983581543, "global_step": 347741, "epoch": 2873} {"train_loss": -44.79372787475586, "global_step": 347742, "epoch": 2873} {"train_loss": -43.44731521606445, "global_step": 347743, "epoch": 2873} {"train_loss": -44.38800048828125, "global_step": 347744, "epoch": 2873} {"train_loss": -44.71368408203125, "global_step": 347745, "epoch": 2873} {"train_loss": -45.07988739013672, "global_step": 347746, "epoch": 2873} {"train_loss": -44.2728157043457, "global_step": 347747, "epoch": 2873} {"train_loss": -45.18290328979492, "global_step": 347748, "epoch": 2873} {"train_loss": -43.273468017578125, "global_step": 347749, "epoch": 2873} {"train_loss": -44.49439239501953, "global_step": 347750, "epoch": 2873} {"train_loss": -44.36819076538086, "global_step": 347751, "epoch": 2873} {"train_loss": -43.695526123046875, "global_step": 347752, "epoch": 2873} {"train_loss": -44.40499036174175, "global_step": 347753, "epoch": 2873, "val_loss": 2545168.0} {"train_loss": -44.249446868896484, "global_step": 347754, "epoch": 2874} {"train_loss": -45.20882034301758, "global_step": 347755, "epoch": 2874} {"train_loss": -44.78512191772461, "global_step": 347756, "epoch": 2874} {"train_loss": -44.997772216796875, "global_step": 347757, "epoch": 2874} {"train_loss": -44.89772033691406, "global_step": 347758, "epoch": 2874} {"train_loss": -44.9578857421875, "global_step": 347759, "epoch": 2874} {"train_loss": -45.0627555847168, "global_step": 347760, "epoch": 2874} {"train_loss": -45.527099609375, "global_step": 347761, "epoch": 2874} {"train_loss": -44.852821350097656, "global_step": 347762, "epoch": 2874} {"train_loss": -45.36591720581055, "global_step": 347763, "epoch": 2874} {"train_loss": -45.293792724609375, "global_step": 347764, "epoch": 2874} {"train_loss": -45.892242431640625, "global_step": 347765, "epoch": 2874} {"train_loss": -44.786041259765625, "global_step": 347766, "epoch": 2874} {"train_loss": -43.36721420288086, "global_step": 347767, "epoch": 2874} {"train_loss": -45.26432418823242, "global_step": 347768, "epoch": 2874} {"train_loss": -45.30184555053711, "global_step": 347769, "epoch": 2874} {"train_loss": -45.70383834838867, "global_step": 347770, "epoch": 2874} {"train_loss": -44.903499603271484, "global_step": 347771, "epoch": 2874} {"train_loss": -43.99988555908203, "global_step": 347772, "epoch": 2874} {"train_loss": -44.828670501708984, "global_step": 347773, "epoch": 2874} {"train_loss": -44.564170837402344, "global_step": 347774, "epoch": 2874} {"train_loss": -45.37173080444336, "global_step": 347775, "epoch": 2874} {"train_loss": -45.24176025390625, "global_step": 347776, "epoch": 2874} {"train_loss": -45.27291488647461, "global_step": 347777, "epoch": 2874} {"train_loss": -45.72047424316406, "global_step": 347778, "epoch": 2874} {"train_loss": -45.663719177246094, "global_step": 347779, "epoch": 2874} {"train_loss": -44.96067810058594, "global_step": 347780, "epoch": 2874} {"train_loss": -45.75337600708008, "global_step": 347781, "epoch": 2874} {"train_loss": -45.43687057495117, "global_step": 347782, "epoch": 2874} {"train_loss": -45.03609085083008, "global_step": 347783, "epoch": 2874} {"train_loss": -45.52167892456055, "global_step": 347784, "epoch": 2874} {"train_loss": -44.7601432800293, "global_step": 347785, "epoch": 2874} {"train_loss": -45.20124435424805, "global_step": 347786, "epoch": 2874} {"train_loss": -44.67854309082031, "global_step": 347787, "epoch": 2874} {"train_loss": -44.8064079284668, "global_step": 347788, "epoch": 2874} {"train_loss": -45.31610107421875, "global_step": 347789, "epoch": 2874} {"train_loss": -45.01350021362305, "global_step": 347790, "epoch": 2874} {"train_loss": -45.393917083740234, "global_step": 347791, "epoch": 2874} {"train_loss": -45.27644729614258, "global_step": 347792, "epoch": 2874} {"train_loss": -45.4644775390625, "global_step": 347793, "epoch": 2874} {"train_loss": -44.289451599121094, "global_step": 347794, "epoch": 2874} {"train_loss": -45.36931228637695, "global_step": 347795, "epoch": 2874} {"train_loss": -45.0767822265625, "global_step": 347796, "epoch": 2874} {"train_loss": -44.025386810302734, "global_step": 347797, "epoch": 2874} {"train_loss": -42.0193977355957, "global_step": 347798, "epoch": 2874} {"train_loss": -41.0194091796875, "global_step": 347799, "epoch": 2874} {"train_loss": -44.62663650512695, "global_step": 347800, "epoch": 2874} {"train_loss": -45.2165641784668, "global_step": 347801, "epoch": 2874} {"train_loss": -44.8199462890625, "global_step": 347802, "epoch": 2874} {"train_loss": -44.63547897338867, "global_step": 347803, "epoch": 2874} {"train_loss": -43.746700286865234, "global_step": 347804, "epoch": 2874} {"train_loss": -44.27704620361328, "global_step": 347805, "epoch": 2874} {"train_loss": -45.07143783569336, "global_step": 347806, "epoch": 2874} {"train_loss": -44.50222396850586, "global_step": 347807, "epoch": 2874} {"train_loss": -43.46870040893555, "global_step": 347808, "epoch": 2874} {"train_loss": -43.3428955078125, "global_step": 347809, "epoch": 2874} {"train_loss": -44.323341369628906, "global_step": 347810, "epoch": 2874} {"train_loss": -45.00956344604492, "global_step": 347811, "epoch": 2874} {"train_loss": -45.30931854248047, "global_step": 347812, "epoch": 2874} {"train_loss": -45.145408630371094, "global_step": 347813, "epoch": 2874} {"train_loss": -43.47272872924805, "global_step": 347814, "epoch": 2874} {"train_loss": -44.457820892333984, "global_step": 347815, "epoch": 2874} {"train_loss": -45.51643753051758, "global_step": 347816, "epoch": 2874} {"train_loss": -45.141048431396484, "global_step": 347817, "epoch": 2874} {"train_loss": -44.0406608581543, "global_step": 347818, "epoch": 2874} {"train_loss": -44.623329162597656, "global_step": 347819, "epoch": 2874} {"train_loss": -44.804935455322266, "global_step": 347820, "epoch": 2874} {"train_loss": -44.32732009887695, "global_step": 347821, "epoch": 2874} {"train_loss": -45.06706619262695, "global_step": 347822, "epoch": 2874} {"train_loss": -43.53163528442383, "global_step": 347823, "epoch": 2874} {"train_loss": -42.23299789428711, "global_step": 347824, "epoch": 2874} {"train_loss": -43.90096664428711, "global_step": 347825, "epoch": 2874} {"train_loss": -43.93659210205078, "global_step": 347826, "epoch": 2874} {"train_loss": -44.99921798706055, "global_step": 347827, "epoch": 2874} {"train_loss": -44.974098205566406, "global_step": 347828, "epoch": 2874} {"train_loss": -44.55589294433594, "global_step": 347829, "epoch": 2874} {"train_loss": -45.12733840942383, "global_step": 347830, "epoch": 2874} {"train_loss": -44.98273849487305, "global_step": 347831, "epoch": 2874} {"train_loss": -39.821807861328125, "global_step": 347832, "epoch": 2874} {"train_loss": -40.88465881347656, "global_step": 347833, "epoch": 2874} {"train_loss": -43.19600296020508, "global_step": 347834, "epoch": 2874} {"train_loss": -39.92216110229492, "global_step": 347835, "epoch": 2874} {"train_loss": -42.13914108276367, "global_step": 347836, "epoch": 2874} {"train_loss": -41.52720260620117, "global_step": 347837, "epoch": 2874} {"train_loss": -42.15122604370117, "global_step": 347838, "epoch": 2874} {"train_loss": -42.914588928222656, "global_step": 347839, "epoch": 2874} {"train_loss": -43.81795883178711, "global_step": 347840, "epoch": 2874} {"train_loss": -43.151344299316406, "global_step": 347841, "epoch": 2874} {"train_loss": -43.382022857666016, "global_step": 347842, "epoch": 2874} {"train_loss": -43.890201568603516, "global_step": 347843, "epoch": 2874} {"train_loss": -42.10528564453125, "global_step": 347844, "epoch": 2874} {"train_loss": -44.18025588989258, "global_step": 347845, "epoch": 2874} {"train_loss": -42.60100173950195, "global_step": 347846, "epoch": 2874} {"train_loss": -41.135719299316406, "global_step": 347847, "epoch": 2874} {"train_loss": -44.6595344543457, "global_step": 347848, "epoch": 2874} {"train_loss": -41.01579284667969, "global_step": 347849, "epoch": 2874} {"train_loss": -43.05519485473633, "global_step": 347850, "epoch": 2874} {"train_loss": -42.63604736328125, "global_step": 347851, "epoch": 2874} {"train_loss": -41.71364974975586, "global_step": 347852, "epoch": 2874} {"train_loss": -43.8659782409668, "global_step": 347853, "epoch": 2874} {"train_loss": -43.10844039916992, "global_step": 347854, "epoch": 2874} {"train_loss": -42.08842849731445, "global_step": 347855, "epoch": 2874} {"train_loss": -43.55088424682617, "global_step": 347856, "epoch": 2874} {"train_loss": -40.51512908935547, "global_step": 347857, "epoch": 2874} {"train_loss": -44.43114471435547, "global_step": 347858, "epoch": 2874} {"train_loss": -42.214019775390625, "global_step": 347859, "epoch": 2874} {"train_loss": -42.49341583251953, "global_step": 347860, "epoch": 2874} {"train_loss": -42.897151947021484, "global_step": 347861, "epoch": 2874} {"train_loss": -42.007301330566406, "global_step": 347862, "epoch": 2874} {"train_loss": -43.427703857421875, "global_step": 347863, "epoch": 2874} {"train_loss": -41.188533782958984, "global_step": 347864, "epoch": 2874} {"train_loss": -44.27224349975586, "global_step": 347865, "epoch": 2874} {"train_loss": -41.47903823852539, "global_step": 347866, "epoch": 2874} {"train_loss": -44.02595901489258, "global_step": 347867, "epoch": 2874} {"train_loss": -40.68189239501953, "global_step": 347868, "epoch": 2874} {"train_loss": -43.3935546875, "global_step": 347869, "epoch": 2874} {"train_loss": -41.49868392944336, "global_step": 347870, "epoch": 2874} {"train_loss": -44.03498840332031, "global_step": 347871, "epoch": 2874} {"train_loss": -41.89619827270508, "global_step": 347872, "epoch": 2874} {"train_loss": -44.17866134643555, "global_step": 347873, "epoch": 2874} {"train_loss": -43.94379935776892, "global_step": 347874, "epoch": 2874, "val_loss": 2540806.0} {"train_loss": -44.57631301879883, "global_step": 347875, "epoch": 2875} {"train_loss": -42.48765182495117, "global_step": 347876, "epoch": 2875} {"train_loss": -44.23533630371094, "global_step": 347877, "epoch": 2875} {"train_loss": -43.00926971435547, "global_step": 347878, "epoch": 2875} {"train_loss": -43.406558990478516, "global_step": 347879, "epoch": 2875} {"train_loss": -42.63512420654297, "global_step": 347880, "epoch": 2875} {"train_loss": -43.6174201965332, "global_step": 347881, "epoch": 2875} {"train_loss": -42.78679275512695, "global_step": 347882, "epoch": 2875} {"train_loss": -44.35671615600586, "global_step": 347883, "epoch": 2875} {"train_loss": -41.88196563720703, "global_step": 347884, "epoch": 2875} {"train_loss": -43.96029281616211, "global_step": 347885, "epoch": 2875} {"train_loss": -43.088802337646484, "global_step": 347886, "epoch": 2875} {"train_loss": -42.539058685302734, "global_step": 347887, "epoch": 2875} {"train_loss": -42.395965576171875, "global_step": 347888, "epoch": 2875} {"train_loss": -43.6127815246582, "global_step": 347889, "epoch": 2875} {"train_loss": -42.77684020996094, "global_step": 347890, "epoch": 2875} {"train_loss": -43.48726272583008, "global_step": 347891, "epoch": 2875} {"train_loss": -43.77033615112305, "global_step": 347892, "epoch": 2875} {"train_loss": -43.646705627441406, "global_step": 347893, "epoch": 2875} {"train_loss": -43.384071350097656, "global_step": 347894, "epoch": 2875} {"train_loss": -39.78782272338867, "global_step": 347895, "epoch": 2875} {"train_loss": -43.07618713378906, "global_step": 347896, "epoch": 2875} {"train_loss": -41.09369659423828, "global_step": 347897, "epoch": 2875} {"train_loss": -42.67259216308594, "global_step": 347898, "epoch": 2875} {"train_loss": -42.85874557495117, "global_step": 347899, "epoch": 2875} {"train_loss": -42.60081100463867, "global_step": 347900, "epoch": 2875} {"train_loss": -43.724422454833984, "global_step": 347901, "epoch": 2875} {"train_loss": -41.4461784362793, "global_step": 347902, "epoch": 2875} {"train_loss": -42.77998733520508, "global_step": 347903, "epoch": 2875} {"train_loss": -40.424922943115234, "global_step": 347904, "epoch": 2875} {"train_loss": -43.35661697387695, "global_step": 347905, "epoch": 2875} {"train_loss": -38.04375076293945, "global_step": 347906, "epoch": 2875} {"train_loss": -43.91958999633789, "global_step": 347907, "epoch": 2875} {"train_loss": -43.35368347167969, "global_step": 347908, "epoch": 2875} {"train_loss": -42.405738830566406, "global_step": 347909, "epoch": 2875} {"train_loss": -43.36044692993164, "global_step": 347910, "epoch": 2875} {"train_loss": -42.235923767089844, "global_step": 347911, "epoch": 2875} {"train_loss": -44.088356018066406, "global_step": 347912, "epoch": 2875} {"train_loss": -43.35746383666992, "global_step": 347913, "epoch": 2875} {"train_loss": -44.118019104003906, "global_step": 347914, "epoch": 2875} {"train_loss": -43.70315170288086, "global_step": 347915, "epoch": 2875} {"train_loss": -42.554439544677734, "global_step": 347916, "epoch": 2875} {"train_loss": -42.986019134521484, "global_step": 347917, "epoch": 2875} {"train_loss": -42.16939926147461, "global_step": 347918, "epoch": 2875} {"train_loss": -43.51387023925781, "global_step": 347919, "epoch": 2875} {"train_loss": -42.72821807861328, "global_step": 347920, "epoch": 2875} {"train_loss": -43.8486328125, "global_step": 347921, "epoch": 2875} {"train_loss": -44.33890151977539, "global_step": 347922, "epoch": 2875} {"train_loss": -43.669063568115234, "global_step": 347923, "epoch": 2875} {"train_loss": -44.36186981201172, "global_step": 347924, "epoch": 2875} {"train_loss": -44.03728485107422, "global_step": 347925, "epoch": 2875} {"train_loss": -43.66856002807617, "global_step": 347926, "epoch": 2875} {"train_loss": -44.10539627075195, "global_step": 347927, "epoch": 2875} {"train_loss": -44.40366744995117, "global_step": 347928, "epoch": 2875} {"train_loss": -44.36454391479492, "global_step": 347929, "epoch": 2875} {"train_loss": -44.6949348449707, "global_step": 347930, "epoch": 2875} {"train_loss": -44.02335739135742, "global_step": 347931, "epoch": 2875} {"train_loss": -42.7574577331543, "global_step": 347932, "epoch": 2875} {"train_loss": -43.72199630737305, "global_step": 347933, "epoch": 2875} {"train_loss": -43.7086296081543, "global_step": 347934, "epoch": 2875} {"train_loss": -43.98384475708008, "global_step": 347935, "epoch": 2875} {"train_loss": -44.180809020996094, "global_step": 347936, "epoch": 2875} {"train_loss": -42.37495803833008, "global_step": 347937, "epoch": 2875} {"train_loss": -44.183834075927734, "global_step": 347938, "epoch": 2875} {"train_loss": -44.37986373901367, "global_step": 347939, "epoch": 2875} {"train_loss": -44.2747802734375, "global_step": 347940, "epoch": 2875} {"train_loss": -44.904396057128906, "global_step": 347941, "epoch": 2875} {"train_loss": -44.654296875, "global_step": 347942, "epoch": 2875} {"train_loss": -44.743282318115234, "global_step": 347943, "epoch": 2875} {"train_loss": -44.613037109375, "global_step": 347944, "epoch": 2875} {"train_loss": -44.34885787963867, "global_step": 347945, "epoch": 2875} {"train_loss": -44.19753646850586, "global_step": 347946, "epoch": 2875} {"train_loss": -45.06943893432617, "global_step": 347947, "epoch": 2875} {"train_loss": -44.526676177978516, "global_step": 347948, "epoch": 2875} {"train_loss": -45.217491149902344, "global_step": 347949, "epoch": 2875} {"train_loss": -44.82209396362305, "global_step": 347950, "epoch": 2875} {"train_loss": -44.16385269165039, "global_step": 347951, "epoch": 2875} {"train_loss": -44.78407287597656, "global_step": 347952, "epoch": 2875} {"train_loss": -45.00784683227539, "global_step": 347953, "epoch": 2875} {"train_loss": -45.04465866088867, "global_step": 347954, "epoch": 2875} {"train_loss": -44.89984130859375, "global_step": 347955, "epoch": 2875} {"train_loss": -45.574886322021484, "global_step": 347956, "epoch": 2875} {"train_loss": -45.621517181396484, "global_step": 347957, "epoch": 2875} {"train_loss": -45.08372497558594, "global_step": 347958, "epoch": 2875} {"train_loss": -44.995853424072266, "global_step": 347959, "epoch": 2875} {"train_loss": -45.37163543701172, "global_step": 347960, "epoch": 2875} {"train_loss": -45.223609924316406, "global_step": 347961, "epoch": 2875} {"train_loss": -43.69076919555664, "global_step": 347962, "epoch": 2875} {"train_loss": -44.97888946533203, "global_step": 347963, "epoch": 2875} {"train_loss": -45.122310638427734, "global_step": 347964, "epoch": 2875} {"train_loss": -45.55002975463867, "global_step": 347965, "epoch": 2875} {"train_loss": -45.040714263916016, "global_step": 347966, "epoch": 2875} {"train_loss": -45.19308853149414, "global_step": 347967, "epoch": 2875} {"train_loss": -44.69012451171875, "global_step": 347968, "epoch": 2875} {"train_loss": -42.531307220458984, "global_step": 347969, "epoch": 2875} {"train_loss": -44.64988327026367, "global_step": 347970, "epoch": 2875} {"train_loss": -43.5812873840332, "global_step": 347971, "epoch": 2875} {"train_loss": -28.8987979888916, "global_step": 347972, "epoch": 2875} {"train_loss": -43.99041748046875, "global_step": 347973, "epoch": 2875} {"train_loss": -44.8412971496582, "global_step": 347974, "epoch": 2875} {"train_loss": -45.06757736206055, "global_step": 347975, "epoch": 2875} {"train_loss": -45.274784088134766, "global_step": 347976, "epoch": 2875} {"train_loss": -45.20112228393555, "global_step": 347977, "epoch": 2875} {"train_loss": -44.150516510009766, "global_step": 347978, "epoch": 2875} {"train_loss": -43.605037689208984, "global_step": 347979, "epoch": 2875} {"train_loss": -44.55028533935547, "global_step": 347980, "epoch": 2875} {"train_loss": -44.62045669555664, "global_step": 347981, "epoch": 2875} {"train_loss": -44.08878707885742, "global_step": 347982, "epoch": 2875} {"train_loss": -44.04731369018555, "global_step": 347983, "epoch": 2875} {"train_loss": -44.17472457885742, "global_step": 347984, "epoch": 2875} {"train_loss": -43.81240463256836, "global_step": 347985, "epoch": 2875} {"train_loss": -44.73899459838867, "global_step": 347986, "epoch": 2875} {"train_loss": -36.24412536621094, "global_step": 347987, "epoch": 2875} {"train_loss": -43.54415512084961, "global_step": 347988, "epoch": 2875} {"train_loss": -44.46340560913086, "global_step": 347989, "epoch": 2875} {"train_loss": -41.1715087890625, "global_step": 347990, "epoch": 2875} {"train_loss": -42.44474792480469, "global_step": 347991, "epoch": 2875} {"train_loss": -39.88747787475586, "global_step": 347992, "epoch": 2875} {"train_loss": -43.374900817871094, "global_step": 347993, "epoch": 2875} {"train_loss": -40.91987228393555, "global_step": 347994, "epoch": 2875} {"train_loss": -43.51847752657804, "global_step": 347995, "epoch": 2875, "val_loss": 2583167.5} {"train_loss": -40.112518310546875, "global_step": 347996, "epoch": 2876} {"train_loss": -42.322998046875, "global_step": 347997, "epoch": 2876} {"train_loss": -39.90340042114258, "global_step": 347998, "epoch": 2876} {"train_loss": -43.260616302490234, "global_step": 347999, "epoch": 2876} {"train_loss": -42.4485969543457, "global_step": 348000, "epoch": 2876} {"train_loss": -41.40584182739258, "global_step": 348001, "epoch": 2876} {"train_loss": -44.194488525390625, "global_step": 348002, "epoch": 2876} {"train_loss": -41.259822845458984, "global_step": 348003, "epoch": 2876} {"train_loss": -43.14604568481445, "global_step": 348004, "epoch": 2876} {"train_loss": -43.40678024291992, "global_step": 348005, "epoch": 2876} {"train_loss": -43.77157211303711, "global_step": 348006, "epoch": 2876} {"train_loss": -42.60305404663086, "global_step": 348007, "epoch": 2876} {"train_loss": -43.595848083496094, "global_step": 348008, "epoch": 2876} {"train_loss": -43.99370193481445, "global_step": 348009, "epoch": 2876} {"train_loss": -42.837303161621094, "global_step": 348010, "epoch": 2876} {"train_loss": -43.34817123413086, "global_step": 348011, "epoch": 2876} {"train_loss": -40.620758056640625, "global_step": 348012, "epoch": 2876} {"train_loss": -43.30204391479492, "global_step": 348013, "epoch": 2876} {"train_loss": -44.1512336730957, "global_step": 348014, "epoch": 2876} {"train_loss": -43.365562438964844, "global_step": 348015, "epoch": 2876} {"train_loss": -44.84933090209961, "global_step": 348016, "epoch": 2876} {"train_loss": -43.00449752807617, "global_step": 348017, "epoch": 2876} {"train_loss": -43.95036315917969, "global_step": 348018, "epoch": 2876} {"train_loss": -44.05986785888672, "global_step": 348019, "epoch": 2876} {"train_loss": -44.265228271484375, "global_step": 348020, "epoch": 2876} {"train_loss": -41.16744613647461, "global_step": 348021, "epoch": 2876} {"train_loss": -43.76724624633789, "global_step": 348022, "epoch": 2876} {"train_loss": -44.45320129394531, "global_step": 348023, "epoch": 2876} {"train_loss": -43.95107650756836, "global_step": 348024, "epoch": 2876} {"train_loss": -44.3498649597168, "global_step": 348025, "epoch": 2876} {"train_loss": -44.24759292602539, "global_step": 348026, "epoch": 2876} {"train_loss": -44.06696319580078, "global_step": 348027, "epoch": 2876} {"train_loss": -43.299964904785156, "global_step": 348028, "epoch": 2876} {"train_loss": -44.06047821044922, "global_step": 348029, "epoch": 2876} {"train_loss": -44.52301025390625, "global_step": 348030, "epoch": 2876} {"train_loss": -45.02524948120117, "global_step": 348031, "epoch": 2876} {"train_loss": -44.476566314697266, "global_step": 348032, "epoch": 2876} {"train_loss": -44.44866943359375, "global_step": 348033, "epoch": 2876} {"train_loss": -44.33213424682617, "global_step": 348034, "epoch": 2876} {"train_loss": -45.057186126708984, "global_step": 348035, "epoch": 2876} {"train_loss": -44.6408576965332, "global_step": 348036, "epoch": 2876} {"train_loss": -45.29436111450195, "global_step": 348037, "epoch": 2876} {"train_loss": -44.70974349975586, "global_step": 348038, "epoch": 2876} {"train_loss": -44.17041015625, "global_step": 348039, "epoch": 2876} {"train_loss": -44.70826721191406, "global_step": 348040, "epoch": 2876} {"train_loss": -44.7894172668457, "global_step": 348041, "epoch": 2876} {"train_loss": -45.1942253112793, "global_step": 348042, "epoch": 2876} {"train_loss": -43.99658203125, "global_step": 348043, "epoch": 2876} {"train_loss": -44.69745635986328, "global_step": 348044, "epoch": 2876} {"train_loss": -44.67694091796875, "global_step": 348045, "epoch": 2876} {"train_loss": -44.91727828979492, "global_step": 348046, "epoch": 2876} {"train_loss": -45.09280014038086, "global_step": 348047, "epoch": 2876} {"train_loss": -44.95346450805664, "global_step": 348048, "epoch": 2876} {"train_loss": -45.26789474487305, "global_step": 348049, "epoch": 2876} {"train_loss": -45.73820114135742, "global_step": 348050, "epoch": 2876} {"train_loss": -44.7339973449707, "global_step": 348051, "epoch": 2876} {"train_loss": -44.963966369628906, "global_step": 348052, "epoch": 2876} {"train_loss": -45.8138542175293, "global_step": 348053, "epoch": 2876} {"train_loss": -45.58438491821289, "global_step": 348054, "epoch": 2876} {"train_loss": -45.202423095703125, "global_step": 348055, "epoch": 2876} {"train_loss": -45.60823440551758, "global_step": 348056, "epoch": 2876} {"train_loss": -45.450260162353516, "global_step": 348057, "epoch": 2876} {"train_loss": -45.79599380493164, "global_step": 348058, "epoch": 2876} {"train_loss": -45.391849517822266, "global_step": 348059, "epoch": 2876} {"train_loss": -44.08863067626953, "global_step": 348060, "epoch": 2876} {"train_loss": -45.51112365722656, "global_step": 348061, "epoch": 2876} {"train_loss": -45.25760269165039, "global_step": 348062, "epoch": 2876} {"train_loss": -45.933528900146484, "global_step": 348063, "epoch": 2876} {"train_loss": -45.38928985595703, "global_step": 348064, "epoch": 2876} {"train_loss": -45.4461784362793, "global_step": 348065, "epoch": 2876} {"train_loss": -45.79359817504883, "global_step": 348066, "epoch": 2876} {"train_loss": -45.1309928894043, "global_step": 348067, "epoch": 2876} {"train_loss": -44.83757781982422, "global_step": 348068, "epoch": 2876} {"train_loss": -45.28438949584961, "global_step": 348069, "epoch": 2876} {"train_loss": -45.454994201660156, "global_step": 348070, "epoch": 2876} {"train_loss": -45.0353889465332, "global_step": 348071, "epoch": 2876} {"train_loss": -44.8096809387207, "global_step": 348072, "epoch": 2876} {"train_loss": -45.894432067871094, "global_step": 348073, "epoch": 2876} {"train_loss": -46.00440216064453, "global_step": 348074, "epoch": 2876} {"train_loss": -45.38385772705078, "global_step": 348075, "epoch": 2876} {"train_loss": -43.78408432006836, "global_step": 348076, "epoch": 2876} {"train_loss": -41.79102325439453, "global_step": 348077, "epoch": 2876} {"train_loss": -41.345211029052734, "global_step": 348078, "epoch": 2876} {"train_loss": -43.73080062866211, "global_step": 348079, "epoch": 2876} {"train_loss": -44.911476135253906, "global_step": 348080, "epoch": 2876} {"train_loss": -44.00696563720703, "global_step": 348081, "epoch": 2876} {"train_loss": -40.3243522644043, "global_step": 348082, "epoch": 2876} {"train_loss": -44.430049896240234, "global_step": 348083, "epoch": 2876} {"train_loss": -41.39836883544922, "global_step": 348084, "epoch": 2876} {"train_loss": -39.22547149658203, "global_step": 348085, "epoch": 2876} {"train_loss": -41.7150764465332, "global_step": 348086, "epoch": 2876} {"train_loss": -37.22523880004883, "global_step": 348087, "epoch": 2876} {"train_loss": -36.9403190612793, "global_step": 348088, "epoch": 2876} {"train_loss": -37.67447280883789, "global_step": 348089, "epoch": 2876} {"train_loss": -37.48076248168945, "global_step": 348090, "epoch": 2876} {"train_loss": -37.09865951538086, "global_step": 348091, "epoch": 2876} {"train_loss": -36.814727783203125, "global_step": 348092, "epoch": 2876} {"train_loss": -37.70620346069336, "global_step": 348093, "epoch": 2876} {"train_loss": -37.14421081542969, "global_step": 348094, "epoch": 2876} {"train_loss": -37.41642379760742, "global_step": 348095, "epoch": 2876} {"train_loss": -37.21741485595703, "global_step": 348096, "epoch": 2876} {"train_loss": -37.143672943115234, "global_step": 348097, "epoch": 2876} {"train_loss": -37.27891159057617, "global_step": 348098, "epoch": 2876} {"train_loss": -36.67287063598633, "global_step": 348099, "epoch": 2876} {"train_loss": -37.24570846557617, "global_step": 348100, "epoch": 2876} {"train_loss": -38.114105224609375, "global_step": 348101, "epoch": 2876} {"train_loss": -37.4350471496582, "global_step": 348102, "epoch": 2876} {"train_loss": -37.97382736206055, "global_step": 348103, "epoch": 2876} {"train_loss": -38.30775833129883, "global_step": 348104, "epoch": 2876} {"train_loss": -38.03253173828125, "global_step": 348105, "epoch": 2876} {"train_loss": -37.60634994506836, "global_step": 348106, "epoch": 2876} {"train_loss": -38.81116485595703, "global_step": 348107, "epoch": 2876} {"train_loss": -38.37141418457031, "global_step": 348108, "epoch": 2876} {"train_loss": -38.204227447509766, "global_step": 348109, "epoch": 2876} {"train_loss": -39.153785705566406, "global_step": 348110, "epoch": 2876} {"train_loss": -39.18149948120117, "global_step": 348111, "epoch": 2876} {"train_loss": -38.993446350097656, "global_step": 348112, "epoch": 2876} {"train_loss": -39.150611877441406, "global_step": 348113, "epoch": 2876} {"train_loss": -37.81755447387695, "global_step": 348114, "epoch": 2876} {"train_loss": -36.94365310668945, "global_step": 348115, "epoch": 2876} {"train_loss": -42.486089186234906, "global_step": 348116, "epoch": 2876, "val_loss": 2593934.0} {"train_loss": -40.12356185913086, "global_step": 348117, "epoch": 2877} {"train_loss": -38.24861526489258, "global_step": 348118, "epoch": 2877} {"train_loss": -39.35563278198242, "global_step": 348119, "epoch": 2877} {"train_loss": -38.122169494628906, "global_step": 348120, "epoch": 2877} {"train_loss": -40.03458786010742, "global_step": 348121, "epoch": 2877} {"train_loss": -38.59049987792969, "global_step": 348122, "epoch": 2877} {"train_loss": -39.16228103637695, "global_step": 348123, "epoch": 2877} {"train_loss": -38.87482833862305, "global_step": 348124, "epoch": 2877} {"train_loss": -39.96175765991211, "global_step": 348125, "epoch": 2877} {"train_loss": -39.0423469543457, "global_step": 348126, "epoch": 2877} {"train_loss": -40.801002502441406, "global_step": 348127, "epoch": 2877} {"train_loss": -39.604061126708984, "global_step": 348128, "epoch": 2877} {"train_loss": -40.83087921142578, "global_step": 348129, "epoch": 2877} {"train_loss": -40.05922317504883, "global_step": 348130, "epoch": 2877} {"train_loss": -40.79024887084961, "global_step": 348131, "epoch": 2877} {"train_loss": -40.76814270019531, "global_step": 348132, "epoch": 2877} {"train_loss": -41.04707717895508, "global_step": 348133, "epoch": 2877} {"train_loss": -40.49700164794922, "global_step": 348134, "epoch": 2877} {"train_loss": -41.03981399536133, "global_step": 348135, "epoch": 2877} {"train_loss": -40.05788803100586, "global_step": 348136, "epoch": 2877} {"train_loss": -39.950618743896484, "global_step": 348137, "epoch": 2877} {"train_loss": -41.00419235229492, "global_step": 348138, "epoch": 2877} {"train_loss": -41.06129837036133, "global_step": 348139, "epoch": 2877} {"train_loss": -40.590370178222656, "global_step": 348140, "epoch": 2877} {"train_loss": -41.79995346069336, "global_step": 348141, "epoch": 2877} {"train_loss": -41.065547943115234, "global_step": 348142, "epoch": 2877} {"train_loss": -40.07654571533203, "global_step": 348143, "epoch": 2877} {"train_loss": -38.35078811645508, "global_step": 348144, "epoch": 2877} {"train_loss": -38.75211715698242, "global_step": 348145, "epoch": 2877} {"train_loss": -39.57896041870117, "global_step": 348146, "epoch": 2877} {"train_loss": -40.76542282104492, "global_step": 348147, "epoch": 2877} {"train_loss": -41.05556869506836, "global_step": 348148, "epoch": 2877} {"train_loss": -41.38913345336914, "global_step": 348149, "epoch": 2877} {"train_loss": -41.01772689819336, "global_step": 348150, "epoch": 2877} {"train_loss": -38.94826889038086, "global_step": 348151, "epoch": 2877} {"train_loss": -42.688777923583984, "global_step": 348152, "epoch": 2877} {"train_loss": -38.807861328125, "global_step": 348153, "epoch": 2877} {"train_loss": -39.80952835083008, "global_step": 348154, "epoch": 2877} {"train_loss": -40.18085861206055, "global_step": 348155, "epoch": 2877} {"train_loss": -39.47544479370117, "global_step": 348156, "epoch": 2877} {"train_loss": -42.47277069091797, "global_step": 348157, "epoch": 2877} {"train_loss": -39.7494010925293, "global_step": 348158, "epoch": 2877} {"train_loss": -42.65651321411133, "global_step": 348159, "epoch": 2877} {"train_loss": -40.99856185913086, "global_step": 348160, "epoch": 2877} {"train_loss": -42.81782150268555, "global_step": 348161, "epoch": 2877} {"train_loss": -41.244651794433594, "global_step": 348162, "epoch": 2877} {"train_loss": -42.074676513671875, "global_step": 348163, "epoch": 2877} {"train_loss": -41.44865798950195, "global_step": 348164, "epoch": 2877} {"train_loss": -42.24116897583008, "global_step": 348165, "epoch": 2877} {"train_loss": -41.73439025878906, "global_step": 348166, "epoch": 2877} {"train_loss": -42.44450759887695, "global_step": 348167, "epoch": 2877} {"train_loss": -41.944671630859375, "global_step": 348168, "epoch": 2877} {"train_loss": -42.27789306640625, "global_step": 348169, "epoch": 2877} {"train_loss": -41.942440032958984, "global_step": 348170, "epoch": 2877} {"train_loss": -42.6093864440918, "global_step": 348171, "epoch": 2877} {"train_loss": -42.464439392089844, "global_step": 348172, "epoch": 2877} {"train_loss": -43.056854248046875, "global_step": 348173, "epoch": 2877} {"train_loss": -41.82271957397461, "global_step": 348174, "epoch": 2877} {"train_loss": -41.41555404663086, "global_step": 348175, "epoch": 2877} {"train_loss": -42.26027297973633, "global_step": 348176, "epoch": 2877} {"train_loss": -42.0393180847168, "global_step": 348177, "epoch": 2877} {"train_loss": -42.5903205871582, "global_step": 348178, "epoch": 2877} {"train_loss": -43.19649887084961, "global_step": 348179, "epoch": 2877} {"train_loss": -41.054317474365234, "global_step": 348180, "epoch": 2877} {"train_loss": -42.39537811279297, "global_step": 348181, "epoch": 2877} {"train_loss": -42.77969741821289, "global_step": 348182, "epoch": 2877} {"train_loss": -40.409481048583984, "global_step": 348183, "epoch": 2877} {"train_loss": -40.908042907714844, "global_step": 348184, "epoch": 2877} {"train_loss": -41.79023742675781, "global_step": 348185, "epoch": 2877} {"train_loss": -41.7745475769043, "global_step": 348186, "epoch": 2877} {"train_loss": -42.050384521484375, "global_step": 348187, "epoch": 2877} {"train_loss": -41.43347930908203, "global_step": 348188, "epoch": 2877} {"train_loss": -42.02643585205078, "global_step": 348189, "epoch": 2877} {"train_loss": -41.936851501464844, "global_step": 348190, "epoch": 2877} {"train_loss": -42.587257385253906, "global_step": 348191, "epoch": 2877} {"train_loss": -42.49034881591797, "global_step": 348192, "epoch": 2877} {"train_loss": -41.99919891357422, "global_step": 348193, "epoch": 2877} {"train_loss": -42.93207931518555, "global_step": 348194, "epoch": 2877} {"train_loss": -41.9460563659668, "global_step": 348195, "epoch": 2877} {"train_loss": -42.14448547363281, "global_step": 348196, "epoch": 2877} {"train_loss": -42.93253707885742, "global_step": 348197, "epoch": 2877} {"train_loss": -42.86227035522461, "global_step": 348198, "epoch": 2877} {"train_loss": -42.56270980834961, "global_step": 348199, "epoch": 2877} {"train_loss": -42.1335563659668, "global_step": 348200, "epoch": 2877} {"train_loss": -42.74848556518555, "global_step": 348201, "epoch": 2877} {"train_loss": -43.01084899902344, "global_step": 348202, "epoch": 2877} {"train_loss": -42.97475814819336, "global_step": 348203, "epoch": 2877} {"train_loss": -42.54940414428711, "global_step": 348204, "epoch": 2877} {"train_loss": -41.9744758605957, "global_step": 348205, "epoch": 2877} {"train_loss": -42.6854362487793, "global_step": 348206, "epoch": 2877} {"train_loss": -41.982791900634766, "global_step": 348207, "epoch": 2877} {"train_loss": -42.823760986328125, "global_step": 348208, "epoch": 2877} {"train_loss": -42.916725158691406, "global_step": 348209, "epoch": 2877} {"train_loss": -42.956077575683594, "global_step": 348210, "epoch": 2877} {"train_loss": -43.01571273803711, "global_step": 348211, "epoch": 2877} {"train_loss": -43.36567687988281, "global_step": 348212, "epoch": 2877} {"train_loss": -43.254730224609375, "global_step": 348213, "epoch": 2877} {"train_loss": -43.30634307861328, "global_step": 348214, "epoch": 2877} {"train_loss": -43.76955032348633, "global_step": 348215, "epoch": 2877} {"train_loss": -43.650264739990234, "global_step": 348216, "epoch": 2877} {"train_loss": -43.27431106567383, "global_step": 348217, "epoch": 2877} {"train_loss": -42.099021911621094, "global_step": 348218, "epoch": 2877} {"train_loss": -43.502777099609375, "global_step": 348219, "epoch": 2877} {"train_loss": -43.52788162231445, "global_step": 348220, "epoch": 2877} {"train_loss": -42.50041580200195, "global_step": 348221, "epoch": 2877} {"train_loss": -44.2547721862793, "global_step": 348222, "epoch": 2877} {"train_loss": -43.66428756713867, "global_step": 348223, "epoch": 2877} {"train_loss": -43.27176284790039, "global_step": 348224, "epoch": 2877} {"train_loss": -42.922245025634766, "global_step": 348225, "epoch": 2877} {"train_loss": -42.7667350769043, "global_step": 348226, "epoch": 2877} {"train_loss": -42.69407272338867, "global_step": 348227, "epoch": 2877} {"train_loss": -43.89382553100586, "global_step": 348228, "epoch": 2877} {"train_loss": -43.55268478393555, "global_step": 348229, "epoch": 2877} {"train_loss": -44.33016586303711, "global_step": 348230, "epoch": 2877} {"train_loss": -42.04026412963867, "global_step": 348231, "epoch": 2877} {"train_loss": -41.89875030517578, "global_step": 348232, "epoch": 2877} {"train_loss": -41.135215759277344, "global_step": 348233, "epoch": 2877} {"train_loss": -37.7435417175293, "global_step": 348234, "epoch": 2877} {"train_loss": -42.632503509521484, "global_step": 348235, "epoch": 2877} {"train_loss": -42.64009475708008, "global_step": 348236, "epoch": 2877} {"train_loss": -41.6377689266993, "global_step": 348237, "epoch": 2877, "val_loss": 2826519.25} {"train_loss": -40.99209213256836, "global_step": 348238, "epoch": 2878} {"train_loss": -41.24147415161133, "global_step": 348239, "epoch": 2878} {"train_loss": -43.00453567504883, "global_step": 348240, "epoch": 2878} {"train_loss": -43.50629425048828, "global_step": 348241, "epoch": 2878} {"train_loss": -41.59186935424805, "global_step": 348242, "epoch": 2878} {"train_loss": -36.992218017578125, "global_step": 348243, "epoch": 2878} {"train_loss": -43.597801208496094, "global_step": 348244, "epoch": 2878} {"train_loss": -42.25974655151367, "global_step": 348245, "epoch": 2878} {"train_loss": -42.84709167480469, "global_step": 348246, "epoch": 2878} {"train_loss": -42.47670364379883, "global_step": 348247, "epoch": 2878} {"train_loss": -42.2307014465332, "global_step": 348248, "epoch": 2878} {"train_loss": -42.75205612182617, "global_step": 348249, "epoch": 2878} {"train_loss": -41.99349594116211, "global_step": 348250, "epoch": 2878} {"train_loss": -41.46455383300781, "global_step": 348251, "epoch": 2878} {"train_loss": -42.80705642700195, "global_step": 348252, "epoch": 2878} {"train_loss": -42.623146057128906, "global_step": 348253, "epoch": 2878} {"train_loss": -42.86335754394531, "global_step": 348254, "epoch": 2878} {"train_loss": -42.32426071166992, "global_step": 348255, "epoch": 2878} {"train_loss": -42.235321044921875, "global_step": 348256, "epoch": 2878} {"train_loss": -43.35972213745117, "global_step": 348257, "epoch": 2878} {"train_loss": -39.1296272277832, "global_step": 348258, "epoch": 2878} {"train_loss": -42.141780853271484, "global_step": 348259, "epoch": 2878} {"train_loss": -43.02588653564453, "global_step": 348260, "epoch": 2878} {"train_loss": -31.907262802124023, "global_step": 348261, "epoch": 2878} {"train_loss": -34.33835983276367, "global_step": 348262, "epoch": 2878} {"train_loss": -40.88552474975586, "global_step": 348263, "epoch": 2878} {"train_loss": -42.21305465698242, "global_step": 348264, "epoch": 2878} {"train_loss": -39.93092727661133, "global_step": 348265, "epoch": 2878} {"train_loss": -39.33575439453125, "global_step": 348266, "epoch": 2878} {"train_loss": -40.7860107421875, "global_step": 348267, "epoch": 2878} {"train_loss": -32.77021408081055, "global_step": 348268, "epoch": 2878} {"train_loss": -41.436912536621094, "global_step": 348269, "epoch": 2878} {"train_loss": -41.40035629272461, "global_step": 348270, "epoch": 2878} {"train_loss": -42.12099838256836, "global_step": 348271, "epoch": 2878} {"train_loss": -41.390254974365234, "global_step": 348272, "epoch": 2878} {"train_loss": -40.3179817199707, "global_step": 348273, "epoch": 2878} {"train_loss": -39.99376678466797, "global_step": 348274, "epoch": 2878} {"train_loss": -39.0908317565918, "global_step": 348275, "epoch": 2878} {"train_loss": -40.64704132080078, "global_step": 348276, "epoch": 2878} {"train_loss": -40.40377426147461, "global_step": 348277, "epoch": 2878} {"train_loss": -39.257423400878906, "global_step": 348278, "epoch": 2878} {"train_loss": -41.92243576049805, "global_step": 348279, "epoch": 2878} {"train_loss": -41.68478012084961, "global_step": 348280, "epoch": 2878} {"train_loss": -37.659698486328125, "global_step": 348281, "epoch": 2878} {"train_loss": -36.32232666015625, "global_step": 348282, "epoch": 2878} {"train_loss": -34.056087493896484, "global_step": 348283, "epoch": 2878} {"train_loss": -39.34592819213867, "global_step": 348284, "epoch": 2878} {"train_loss": -42.295711517333984, "global_step": 348285, "epoch": 2878} {"train_loss": -35.29535675048828, "global_step": 348286, "epoch": 2878} {"train_loss": -41.28898620605469, "global_step": 348287, "epoch": 2878} {"train_loss": -36.52781295776367, "global_step": 348288, "epoch": 2878} {"train_loss": -37.314327239990234, "global_step": 348289, "epoch": 2878} {"train_loss": -40.65235137939453, "global_step": 348290, "epoch": 2878} {"train_loss": -40.53002166748047, "global_step": 348291, "epoch": 2878} {"train_loss": -38.40079879760742, "global_step": 348292, "epoch": 2878} {"train_loss": -39.04446029663086, "global_step": 348293, "epoch": 2878} {"train_loss": -41.69846725463867, "global_step": 348294, "epoch": 2878} {"train_loss": -41.30459213256836, "global_step": 348295, "epoch": 2878} {"train_loss": -38.10737228393555, "global_step": 348296, "epoch": 2878} {"train_loss": -41.04243087768555, "global_step": 348297, "epoch": 2878} {"train_loss": -40.80678176879883, "global_step": 348298, "epoch": 2878} {"train_loss": -41.962215423583984, "global_step": 348299, "epoch": 2878} {"train_loss": -41.24931716918945, "global_step": 348300, "epoch": 2878} {"train_loss": -40.60586166381836, "global_step": 348301, "epoch": 2878} {"train_loss": -40.551509857177734, "global_step": 348302, "epoch": 2878} {"train_loss": -40.25773239135742, "global_step": 348303, "epoch": 2878} {"train_loss": -41.411094665527344, "global_step": 348304, "epoch": 2878} {"train_loss": -41.49460983276367, "global_step": 348305, "epoch": 2878} {"train_loss": -40.8199348449707, "global_step": 348306, "epoch": 2878} {"train_loss": -40.76106643676758, "global_step": 348307, "epoch": 2878} {"train_loss": -40.702266693115234, "global_step": 348308, "epoch": 2878} {"train_loss": -41.03459548950195, "global_step": 348309, "epoch": 2878} {"train_loss": -42.07088851928711, "global_step": 348310, "epoch": 2878} {"train_loss": -42.09090805053711, "global_step": 348311, "epoch": 2878} {"train_loss": -41.194210052490234, "global_step": 348312, "epoch": 2878} {"train_loss": -41.547908782958984, "global_step": 348313, "epoch": 2878} {"train_loss": -42.43552780151367, "global_step": 348314, "epoch": 2878} {"train_loss": -42.19687271118164, "global_step": 348315, "epoch": 2878} {"train_loss": -40.75587844848633, "global_step": 348316, "epoch": 2878} {"train_loss": -41.33600997924805, "global_step": 348317, "epoch": 2878} {"train_loss": -39.18959426879883, "global_step": 348318, "epoch": 2878} {"train_loss": -42.225589752197266, "global_step": 348319, "epoch": 2878} {"train_loss": -41.69597625732422, "global_step": 348320, "epoch": 2878} {"train_loss": -42.46875762939453, "global_step": 348321, "epoch": 2878} {"train_loss": -42.03738021850586, "global_step": 348322, "epoch": 2878} {"train_loss": -41.857059478759766, "global_step": 348323, "epoch": 2878} {"train_loss": -42.47744369506836, "global_step": 348324, "epoch": 2878} {"train_loss": -42.30861282348633, "global_step": 348325, "epoch": 2878} {"train_loss": -41.825557708740234, "global_step": 348326, "epoch": 2878} {"train_loss": -41.36459732055664, "global_step": 348327, "epoch": 2878} {"train_loss": -41.51306915283203, "global_step": 348328, "epoch": 2878} {"train_loss": -40.88564682006836, "global_step": 348329, "epoch": 2878} {"train_loss": -40.41590118408203, "global_step": 348330, "epoch": 2878} {"train_loss": -34.84172439575195, "global_step": 348331, "epoch": 2878} {"train_loss": -41.53676986694336, "global_step": 348332, "epoch": 2878} {"train_loss": -42.021602630615234, "global_step": 348333, "epoch": 2878} {"train_loss": -41.811248779296875, "global_step": 348334, "epoch": 2878} {"train_loss": -41.033084869384766, "global_step": 348335, "epoch": 2878} {"train_loss": -41.293190002441406, "global_step": 348336, "epoch": 2878} {"train_loss": -42.58000564575195, "global_step": 348337, "epoch": 2878} {"train_loss": -39.73757553100586, "global_step": 348338, "epoch": 2878} {"train_loss": -42.1967658996582, "global_step": 348339, "epoch": 2878} {"train_loss": -41.158103942871094, "global_step": 348340, "epoch": 2878} {"train_loss": -42.18634033203125, "global_step": 348341, "epoch": 2878} {"train_loss": -42.02354049682617, "global_step": 348342, "epoch": 2878} {"train_loss": -39.679256439208984, "global_step": 348343, "epoch": 2878} {"train_loss": -41.04071807861328, "global_step": 348344, "epoch": 2878} {"train_loss": -37.8899040222168, "global_step": 348345, "epoch": 2878} {"train_loss": -41.80451583862305, "global_step": 348346, "epoch": 2878} {"train_loss": -40.4175910949707, "global_step": 348347, "epoch": 2878} {"train_loss": -40.9416389465332, "global_step": 348348, "epoch": 2878} {"train_loss": -41.33008575439453, "global_step": 348349, "epoch": 2878} {"train_loss": -41.90534591674805, "global_step": 348350, "epoch": 2878} {"train_loss": -41.603248596191406, "global_step": 348351, "epoch": 2878} {"train_loss": -41.80594253540039, "global_step": 348352, "epoch": 2878} {"train_loss": -41.57977294921875, "global_step": 348353, "epoch": 2878} {"train_loss": -40.86147689819336, "global_step": 348354, "epoch": 2878} {"train_loss": -37.396148681640625, "global_step": 348355, "epoch": 2878} {"train_loss": -41.50028610229492, "global_step": 348356, "epoch": 2878} {"train_loss": -31.734756469726562, "global_step": 348357, "epoch": 2878} {"train_loss": -40.654718871944205, "global_step": 348358, "epoch": 2878, "val_loss": 2742538.0} {"train_loss": -42.05311965942383, "global_step": 348359, "epoch": 2879} {"train_loss": -39.22431182861328, "global_step": 348360, "epoch": 2879} {"train_loss": -40.58683395385742, "global_step": 348361, "epoch": 2879} {"train_loss": -38.65201950073242, "global_step": 348362, "epoch": 2879} {"train_loss": -41.638587951660156, "global_step": 348363, "epoch": 2879} {"train_loss": -41.44716262817383, "global_step": 348364, "epoch": 2879} {"train_loss": -40.34282302856445, "global_step": 348365, "epoch": 2879} {"train_loss": -41.210365295410156, "global_step": 348366, "epoch": 2879} {"train_loss": -40.044593811035156, "global_step": 348367, "epoch": 2879} {"train_loss": -38.86286163330078, "global_step": 348368, "epoch": 2879} {"train_loss": -34.46649932861328, "global_step": 348369, "epoch": 2879} {"train_loss": -37.38724899291992, "global_step": 348370, "epoch": 2879} {"train_loss": -36.721805572509766, "global_step": 348371, "epoch": 2879} {"train_loss": -41.07280731201172, "global_step": 348372, "epoch": 2879} {"train_loss": -40.948604583740234, "global_step": 348373, "epoch": 2879} {"train_loss": -41.26445007324219, "global_step": 348374, "epoch": 2879} {"train_loss": -40.39201736450195, "global_step": 348375, "epoch": 2879} {"train_loss": -41.02692413330078, "global_step": 348376, "epoch": 2879} {"train_loss": -41.31882858276367, "global_step": 348377, "epoch": 2879} {"train_loss": -40.73381805419922, "global_step": 348378, "epoch": 2879} {"train_loss": -40.812252044677734, "global_step": 348379, "epoch": 2879} {"train_loss": -40.45081329345703, "global_step": 348380, "epoch": 2879} {"train_loss": -38.9202995300293, "global_step": 348381, "epoch": 2879} {"train_loss": -40.34652328491211, "global_step": 348382, "epoch": 2879} {"train_loss": -39.912540435791016, "global_step": 348383, "epoch": 2879} {"train_loss": -40.35332107543945, "global_step": 348384, "epoch": 2879} {"train_loss": -40.89759826660156, "global_step": 348385, "epoch": 2879} {"train_loss": -37.687808990478516, "global_step": 348386, "epoch": 2879} {"train_loss": -39.76258850097656, "global_step": 348387, "epoch": 2879} {"train_loss": -40.42158126831055, "global_step": 348388, "epoch": 2879} {"train_loss": -41.378719329833984, "global_step": 348389, "epoch": 2879} {"train_loss": -39.490234375, "global_step": 348390, "epoch": 2879} {"train_loss": -41.32017135620117, "global_step": 348391, "epoch": 2879} {"train_loss": -42.044307708740234, "global_step": 348392, "epoch": 2879} {"train_loss": -39.67140579223633, "global_step": 348393, "epoch": 2879} {"train_loss": -41.602664947509766, "global_step": 348394, "epoch": 2879} {"train_loss": -41.82769775390625, "global_step": 348395, "epoch": 2879} {"train_loss": -40.33747100830078, "global_step": 348396, "epoch": 2879} {"train_loss": -39.089778900146484, "global_step": 348397, "epoch": 2879} {"train_loss": -40.67490768432617, "global_step": 348398, "epoch": 2879} {"train_loss": -38.7779655456543, "global_step": 348399, "epoch": 2879} {"train_loss": -42.521026611328125, "global_step": 348400, "epoch": 2879} {"train_loss": -42.104820251464844, "global_step": 348401, "epoch": 2879} {"train_loss": -41.62898635864258, "global_step": 348402, "epoch": 2879} {"train_loss": -39.80241775512695, "global_step": 348403, "epoch": 2879} {"train_loss": -40.323646545410156, "global_step": 348404, "epoch": 2879} {"train_loss": -40.30605697631836, "global_step": 348405, "epoch": 2879} {"train_loss": -42.02381896972656, "global_step": 348406, "epoch": 2879} {"train_loss": -42.56474685668945, "global_step": 348407, "epoch": 2879} {"train_loss": -42.1639289855957, "global_step": 348408, "epoch": 2879} {"train_loss": -41.175960540771484, "global_step": 348409, "epoch": 2879} {"train_loss": -41.32992172241211, "global_step": 348410, "epoch": 2879} {"train_loss": -42.185203552246094, "global_step": 348411, "epoch": 2879} {"train_loss": -40.36345291137695, "global_step": 348412, "epoch": 2879} {"train_loss": -40.5348014831543, "global_step": 348413, "epoch": 2879} {"train_loss": -42.851436614990234, "global_step": 348414, "epoch": 2879} {"train_loss": -41.979061126708984, "global_step": 348415, "epoch": 2879} {"train_loss": -41.761680603027344, "global_step": 348416, "epoch": 2879} {"train_loss": -41.659847259521484, "global_step": 348417, "epoch": 2879} {"train_loss": -42.48670959472656, "global_step": 348418, "epoch": 2879} {"train_loss": -42.48936462402344, "global_step": 348419, "epoch": 2879} {"train_loss": -42.340736389160156, "global_step": 348420, "epoch": 2879} {"train_loss": -40.71519470214844, "global_step": 348421, "epoch": 2879} {"train_loss": -42.013729095458984, "global_step": 348422, "epoch": 2879} {"train_loss": -42.83077621459961, "global_step": 348423, "epoch": 2879} {"train_loss": -42.32551193237305, "global_step": 348424, "epoch": 2879} {"train_loss": -42.30157470703125, "global_step": 348425, "epoch": 2879} {"train_loss": -42.0896110534668, "global_step": 348426, "epoch": 2879} {"train_loss": -42.044960021972656, "global_step": 348427, "epoch": 2879} {"train_loss": -43.324466705322266, "global_step": 348428, "epoch": 2879} {"train_loss": -40.62612533569336, "global_step": 348429, "epoch": 2879} {"train_loss": -43.104835510253906, "global_step": 348430, "epoch": 2879} {"train_loss": -42.80733871459961, "global_step": 348431, "epoch": 2879} {"train_loss": -41.113426208496094, "global_step": 348432, "epoch": 2879} {"train_loss": -42.53471755981445, "global_step": 348433, "epoch": 2879} {"train_loss": -42.28760528564453, "global_step": 348434, "epoch": 2879} {"train_loss": -42.93821334838867, "global_step": 348435, "epoch": 2879} {"train_loss": -39.960060119628906, "global_step": 348436, "epoch": 2879} {"train_loss": -40.48184585571289, "global_step": 348437, "epoch": 2879} {"train_loss": -41.612056732177734, "global_step": 348438, "epoch": 2879} {"train_loss": -42.94743728637695, "global_step": 348439, "epoch": 2879} {"train_loss": -41.874244689941406, "global_step": 348440, "epoch": 2879} {"train_loss": -42.63651657104492, "global_step": 348441, "epoch": 2879} {"train_loss": -41.405616760253906, "global_step": 348442, "epoch": 2879} {"train_loss": -40.686702728271484, "global_step": 348443, "epoch": 2879} {"train_loss": -41.09718704223633, "global_step": 348444, "epoch": 2879} {"train_loss": -42.75434494018555, "global_step": 348445, "epoch": 2879} {"train_loss": -42.73250961303711, "global_step": 348446, "epoch": 2879} {"train_loss": -42.619964599609375, "global_step": 348447, "epoch": 2879} {"train_loss": -39.9017333984375, "global_step": 348448, "epoch": 2879} {"train_loss": -42.80055618286133, "global_step": 348449, "epoch": 2879} {"train_loss": -41.68691635131836, "global_step": 348450, "epoch": 2879} {"train_loss": -42.286399841308594, "global_step": 348451, "epoch": 2879} {"train_loss": -42.7346305847168, "global_step": 348452, "epoch": 2879} {"train_loss": -42.72753143310547, "global_step": 348453, "epoch": 2879} {"train_loss": -42.72480392456055, "global_step": 348454, "epoch": 2879} {"train_loss": -43.38151168823242, "global_step": 348455, "epoch": 2879} {"train_loss": -42.61738204956055, "global_step": 348456, "epoch": 2879} {"train_loss": -42.36161422729492, "global_step": 348457, "epoch": 2879} {"train_loss": -41.28948974609375, "global_step": 348458, "epoch": 2879} {"train_loss": -41.35992431640625, "global_step": 348459, "epoch": 2879} {"train_loss": -42.182106018066406, "global_step": 348460, "epoch": 2879} {"train_loss": -41.94771957397461, "global_step": 348461, "epoch": 2879} {"train_loss": -37.988609313964844, "global_step": 348462, "epoch": 2879} {"train_loss": -31.810089111328125, "global_step": 348463, "epoch": 2879} {"train_loss": -32.18048858642578, "global_step": 348464, "epoch": 2879} {"train_loss": -33.44074630737305, "global_step": 348465, "epoch": 2879} {"train_loss": -39.82246017456055, "global_step": 348466, "epoch": 2879} {"train_loss": -38.05341720581055, "global_step": 348467, "epoch": 2879} {"train_loss": -34.69944763183594, "global_step": 348468, "epoch": 2879} {"train_loss": -36.47386932373047, "global_step": 348469, "epoch": 2879} {"train_loss": -38.51575469970703, "global_step": 348470, "epoch": 2879} {"train_loss": -39.36792755126953, "global_step": 348471, "epoch": 2879} {"train_loss": -38.718841552734375, "global_step": 348472, "epoch": 2879} {"train_loss": -39.50215530395508, "global_step": 348473, "epoch": 2879} {"train_loss": -37.06298828125, "global_step": 348474, "epoch": 2879} {"train_loss": -40.1503791809082, "global_step": 348475, "epoch": 2879} {"train_loss": -38.1890869140625, "global_step": 348476, "epoch": 2879} {"train_loss": -40.03989028930664, "global_step": 348477, "epoch": 2879} {"train_loss": -39.916988372802734, "global_step": 348478, "epoch": 2879} {"train_loss": -40.65077764337713, "global_step": 348479, "epoch": 2879, "val_loss": 2447615.25} {"train_loss": -41.87441635131836, "global_step": 348480, "epoch": 2880} {"train_loss": -39.99724578857422, "global_step": 348481, "epoch": 2880} {"train_loss": -39.11216354370117, "global_step": 348482, "epoch": 2880} {"train_loss": -40.413719177246094, "global_step": 348483, "epoch": 2880} {"train_loss": -40.22166061401367, "global_step": 348484, "epoch": 2880} {"train_loss": -40.84477996826172, "global_step": 348485, "epoch": 2880} {"train_loss": -41.0255012512207, "global_step": 348486, "epoch": 2880} {"train_loss": -41.128456115722656, "global_step": 348487, "epoch": 2880} {"train_loss": -39.479461669921875, "global_step": 348488, "epoch": 2880} {"train_loss": -40.5131950378418, "global_step": 348489, "epoch": 2880} {"train_loss": -39.97177505493164, "global_step": 348490, "epoch": 2880} {"train_loss": -37.535926818847656, "global_step": 348491, "epoch": 2880} {"train_loss": -41.45908737182617, "global_step": 348492, "epoch": 2880} {"train_loss": -40.871639251708984, "global_step": 348493, "epoch": 2880} {"train_loss": -41.981964111328125, "global_step": 348494, "epoch": 2880} {"train_loss": -41.25154495239258, "global_step": 348495, "epoch": 2880} {"train_loss": -41.0660285949707, "global_step": 348496, "epoch": 2880} {"train_loss": -40.055057525634766, "global_step": 348497, "epoch": 2880} {"train_loss": -41.80497741699219, "global_step": 348498, "epoch": 2880} {"train_loss": -41.459651947021484, "global_step": 348499, "epoch": 2880} {"train_loss": -41.42110824584961, "global_step": 348500, "epoch": 2880} {"train_loss": -40.97018051147461, "global_step": 348501, "epoch": 2880} {"train_loss": -41.732086181640625, "global_step": 348502, "epoch": 2880} {"train_loss": -42.1378288269043, "global_step": 348503, "epoch": 2880} {"train_loss": -41.47401428222656, "global_step": 348504, "epoch": 2880} {"train_loss": -42.35799026489258, "global_step": 348505, "epoch": 2880} {"train_loss": -42.119781494140625, "global_step": 348506, "epoch": 2880} {"train_loss": -40.597286224365234, "global_step": 348507, "epoch": 2880} {"train_loss": -41.135066986083984, "global_step": 348508, "epoch": 2880} {"train_loss": -41.6014518737793, "global_step": 348509, "epoch": 2880} {"train_loss": -41.97920608520508, "global_step": 348510, "epoch": 2880} {"train_loss": -42.105628967285156, "global_step": 348511, "epoch": 2880} {"train_loss": -42.50716781616211, "global_step": 348512, "epoch": 2880} {"train_loss": -42.607051849365234, "global_step": 348513, "epoch": 2880} {"train_loss": -42.80742645263672, "global_step": 348514, "epoch": 2880} {"train_loss": -42.86375427246094, "global_step": 348515, "epoch": 2880} {"train_loss": -42.6242561340332, "global_step": 348516, "epoch": 2880} {"train_loss": -42.39303970336914, "global_step": 348517, "epoch": 2880} {"train_loss": -40.514678955078125, "global_step": 348518, "epoch": 2880} {"train_loss": -42.799617767333984, "global_step": 348519, "epoch": 2880} {"train_loss": -39.590518951416016, "global_step": 348520, "epoch": 2880} {"train_loss": -42.94429397583008, "global_step": 348521, "epoch": 2880} {"train_loss": -41.3906364440918, "global_step": 348522, "epoch": 2880} {"train_loss": -43.26412582397461, "global_step": 348523, "epoch": 2880} {"train_loss": -42.696067810058594, "global_step": 348524, "epoch": 2880} {"train_loss": -40.475948333740234, "global_step": 348525, "epoch": 2880} {"train_loss": -41.957618713378906, "global_step": 348526, "epoch": 2880} {"train_loss": -42.726776123046875, "global_step": 348527, "epoch": 2880} {"train_loss": -41.329830169677734, "global_step": 348528, "epoch": 2880} {"train_loss": -41.7099494934082, "global_step": 348529, "epoch": 2880} {"train_loss": -42.83437728881836, "global_step": 348530, "epoch": 2880} {"train_loss": -42.62370681762695, "global_step": 348531, "epoch": 2880} {"train_loss": -42.52333450317383, "global_step": 348532, "epoch": 2880} {"train_loss": -42.09634017944336, "global_step": 348533, "epoch": 2880} {"train_loss": -43.1251106262207, "global_step": 348534, "epoch": 2880} {"train_loss": -39.96284866333008, "global_step": 348535, "epoch": 2880} {"train_loss": -41.88967514038086, "global_step": 348536, "epoch": 2880} {"train_loss": -42.522274017333984, "global_step": 348537, "epoch": 2880} {"train_loss": -43.05028533935547, "global_step": 348538, "epoch": 2880} {"train_loss": -43.546234130859375, "global_step": 348539, "epoch": 2880} {"train_loss": -43.0014762878418, "global_step": 348540, "epoch": 2880} {"train_loss": -41.987300872802734, "global_step": 348541, "epoch": 2880} {"train_loss": -43.06686019897461, "global_step": 348542, "epoch": 2880} {"train_loss": -43.055110931396484, "global_step": 348543, "epoch": 2880} {"train_loss": -41.50798797607422, "global_step": 348544, "epoch": 2880} {"train_loss": -43.02027130126953, "global_step": 348545, "epoch": 2880} {"train_loss": -43.732601165771484, "global_step": 348546, "epoch": 2880} {"train_loss": -43.63752365112305, "global_step": 348547, "epoch": 2880} {"train_loss": -43.707576751708984, "global_step": 348548, "epoch": 2880} {"train_loss": -42.71529769897461, "global_step": 348549, "epoch": 2880} {"train_loss": -43.81736373901367, "global_step": 348550, "epoch": 2880} {"train_loss": -42.93232345581055, "global_step": 348551, "epoch": 2880} {"train_loss": -43.754249572753906, "global_step": 348552, "epoch": 2880} {"train_loss": -42.09872055053711, "global_step": 348553, "epoch": 2880} {"train_loss": -43.51310348510742, "global_step": 348554, "epoch": 2880} {"train_loss": -43.32853317260742, "global_step": 348555, "epoch": 2880} {"train_loss": -43.73027038574219, "global_step": 348556, "epoch": 2880} {"train_loss": -43.812923431396484, "global_step": 348557, "epoch": 2880} {"train_loss": -43.6762809753418, "global_step": 348558, "epoch": 2880} {"train_loss": -42.90165328979492, "global_step": 348559, "epoch": 2880} {"train_loss": -44.166202545166016, "global_step": 348560, "epoch": 2880} {"train_loss": -44.2608757019043, "global_step": 348561, "epoch": 2880} {"train_loss": -44.17934799194336, "global_step": 348562, "epoch": 2880} {"train_loss": -41.983978271484375, "global_step": 348563, "epoch": 2880} {"train_loss": -43.38510513305664, "global_step": 348564, "epoch": 2880} {"train_loss": -44.36080551147461, "global_step": 348565, "epoch": 2880} {"train_loss": -44.27933120727539, "global_step": 348566, "epoch": 2880} {"train_loss": -43.82661056518555, "global_step": 348567, "epoch": 2880} {"train_loss": -41.104225158691406, "global_step": 348568, "epoch": 2880} {"train_loss": -41.01987075805664, "global_step": 348569, "epoch": 2880} {"train_loss": -37.21530532836914, "global_step": 348570, "epoch": 2880} {"train_loss": -41.1091423034668, "global_step": 348571, "epoch": 2880} {"train_loss": -42.9947509765625, "global_step": 348572, "epoch": 2880} {"train_loss": -43.27787399291992, "global_step": 348573, "epoch": 2880} {"train_loss": -43.54692840576172, "global_step": 348574, "epoch": 2880} {"train_loss": -42.677791595458984, "global_step": 348575, "epoch": 2880} {"train_loss": -43.00678634643555, "global_step": 348576, "epoch": 2880} {"train_loss": -42.45632553100586, "global_step": 348577, "epoch": 2880} {"train_loss": -43.071434020996094, "global_step": 348578, "epoch": 2880} {"train_loss": -43.06267166137695, "global_step": 348579, "epoch": 2880} {"train_loss": -42.48490524291992, "global_step": 348580, "epoch": 2880} {"train_loss": -44.01290512084961, "global_step": 348581, "epoch": 2880} {"train_loss": -40.976417541503906, "global_step": 348582, "epoch": 2880} {"train_loss": -43.013885498046875, "global_step": 348583, "epoch": 2880} {"train_loss": -41.61103820800781, "global_step": 348584, "epoch": 2880} {"train_loss": -42.933650970458984, "global_step": 348585, "epoch": 2880} {"train_loss": -40.63273620605469, "global_step": 348586, "epoch": 2880} {"train_loss": -41.50015640258789, "global_step": 348587, "epoch": 2880} {"train_loss": -43.479766845703125, "global_step": 348588, "epoch": 2880} {"train_loss": -40.453643798828125, "global_step": 348589, "epoch": 2880} {"train_loss": -40.81869125366211, "global_step": 348590, "epoch": 2880} {"train_loss": -41.01039505004883, "global_step": 348591, "epoch": 2880} {"train_loss": -42.8745231628418, "global_step": 348592, "epoch": 2880} {"train_loss": -39.428009033203125, "global_step": 348593, "epoch": 2880} {"train_loss": -41.05805969238281, "global_step": 348594, "epoch": 2880} {"train_loss": -43.05465316772461, "global_step": 348595, "epoch": 2880} {"train_loss": -41.79133605957031, "global_step": 348596, "epoch": 2880} {"train_loss": -40.89276885986328, "global_step": 348597, "epoch": 2880} {"train_loss": -42.67045211791992, "global_step": 348598, "epoch": 2880} {"train_loss": -38.836856842041016, "global_step": 348599, "epoch": 2880} {"train_loss": -42.03567353555979, "global_step": 348600, "epoch": 2880, "val_loss": 2651251.75} {"train_loss": -40.19842529296875, "global_step": 348601, "epoch": 2881} {"train_loss": -42.460357666015625, "global_step": 348602, "epoch": 2881} {"train_loss": -41.003082275390625, "global_step": 348603, "epoch": 2881} {"train_loss": -40.88734436035156, "global_step": 348604, "epoch": 2881} {"train_loss": -40.95757293701172, "global_step": 348605, "epoch": 2881} {"train_loss": -40.680908203125, "global_step": 348606, "epoch": 2881} {"train_loss": -42.13145065307617, "global_step": 348607, "epoch": 2881} {"train_loss": -41.28544998168945, "global_step": 348608, "epoch": 2881} {"train_loss": -41.389034271240234, "global_step": 348609, "epoch": 2881} {"train_loss": -39.56475067138672, "global_step": 348610, "epoch": 2881} {"train_loss": -27.792322158813477, "global_step": 348611, "epoch": 2881} {"train_loss": -41.46521759033203, "global_step": 348612, "epoch": 2881} {"train_loss": -40.6806640625, "global_step": 348613, "epoch": 2881} {"train_loss": -37.095455169677734, "global_step": 348614, "epoch": 2881} {"train_loss": -36.91450881958008, "global_step": 348615, "epoch": 2881} {"train_loss": -32.20835494995117, "global_step": 348616, "epoch": 2881} {"train_loss": -36.66552734375, "global_step": 348617, "epoch": 2881} {"train_loss": -38.18407440185547, "global_step": 348618, "epoch": 2881} {"train_loss": -33.82148361206055, "global_step": 348619, "epoch": 2881} {"train_loss": -41.3082389831543, "global_step": 348620, "epoch": 2881} {"train_loss": -40.74676513671875, "global_step": 348621, "epoch": 2881} {"train_loss": -41.73467254638672, "global_step": 348622, "epoch": 2881} {"train_loss": -39.12297439575195, "global_step": 348623, "epoch": 2881} {"train_loss": -37.43549728393555, "global_step": 348624, "epoch": 2881} {"train_loss": -38.1654167175293, "global_step": 348625, "epoch": 2881} {"train_loss": -38.56726837158203, "global_step": 348626, "epoch": 2881} {"train_loss": -40.33066940307617, "global_step": 348627, "epoch": 2881} {"train_loss": -40.34980392456055, "global_step": 348628, "epoch": 2881} {"train_loss": -39.36571502685547, "global_step": 348629, "epoch": 2881} {"train_loss": -40.52703857421875, "global_step": 348630, "epoch": 2881} {"train_loss": -40.47397994995117, "global_step": 348631, "epoch": 2881} {"train_loss": -38.7309455871582, "global_step": 348632, "epoch": 2881} {"train_loss": -40.3344841003418, "global_step": 348633, "epoch": 2881} {"train_loss": -39.34347152709961, "global_step": 348634, "epoch": 2881} {"train_loss": -41.98098373413086, "global_step": 348635, "epoch": 2881} {"train_loss": -41.445770263671875, "global_step": 348636, "epoch": 2881} {"train_loss": -40.16826629638672, "global_step": 348637, "epoch": 2881} {"train_loss": -37.64984130859375, "global_step": 348638, "epoch": 2881} {"train_loss": -41.280818939208984, "global_step": 348639, "epoch": 2881} {"train_loss": -41.53303909301758, "global_step": 348640, "epoch": 2881} {"train_loss": -41.2484130859375, "global_step": 348641, "epoch": 2881} {"train_loss": -41.4065055847168, "global_step": 348642, "epoch": 2881} {"train_loss": -41.41081237792969, "global_step": 348643, "epoch": 2881} {"train_loss": -40.287818908691406, "global_step": 348644, "epoch": 2881} {"train_loss": -41.6866569519043, "global_step": 348645, "epoch": 2881} {"train_loss": -41.33216094970703, "global_step": 348646, "epoch": 2881} {"train_loss": -41.391292572021484, "global_step": 348647, "epoch": 2881} {"train_loss": -41.36115264892578, "global_step": 348648, "epoch": 2881} {"train_loss": -41.07852554321289, "global_step": 348649, "epoch": 2881} {"train_loss": -41.23832321166992, "global_step": 348650, "epoch": 2881} {"train_loss": -42.2619743347168, "global_step": 348651, "epoch": 2881} {"train_loss": -41.2043571472168, "global_step": 348652, "epoch": 2881} {"train_loss": -42.18658447265625, "global_step": 348653, "epoch": 2881} {"train_loss": -40.931087493896484, "global_step": 348654, "epoch": 2881} {"train_loss": -41.32216262817383, "global_step": 348655, "epoch": 2881} {"train_loss": -42.025115966796875, "global_step": 348656, "epoch": 2881} {"train_loss": -41.1959342956543, "global_step": 348657, "epoch": 2881} {"train_loss": -42.065582275390625, "global_step": 348658, "epoch": 2881} {"train_loss": -42.53879928588867, "global_step": 348659, "epoch": 2881} {"train_loss": -41.101043701171875, "global_step": 348660, "epoch": 2881} {"train_loss": -42.78106689453125, "global_step": 348661, "epoch": 2881} {"train_loss": -42.25096130371094, "global_step": 348662, "epoch": 2881} {"train_loss": -42.339454650878906, "global_step": 348663, "epoch": 2881} {"train_loss": -41.53334426879883, "global_step": 348664, "epoch": 2881} {"train_loss": -42.769813537597656, "global_step": 348665, "epoch": 2881} {"train_loss": -41.01969528198242, "global_step": 348666, "epoch": 2881} {"train_loss": -42.60084915161133, "global_step": 348667, "epoch": 2881} {"train_loss": -42.217018127441406, "global_step": 348668, "epoch": 2881} {"train_loss": -41.404701232910156, "global_step": 348669, "epoch": 2881} {"train_loss": -42.46863555908203, "global_step": 348670, "epoch": 2881} {"train_loss": -42.45481491088867, "global_step": 348671, "epoch": 2881} {"train_loss": -42.32796859741211, "global_step": 348672, "epoch": 2881} {"train_loss": -42.201778411865234, "global_step": 348673, "epoch": 2881} {"train_loss": -41.344051361083984, "global_step": 348674, "epoch": 2881} {"train_loss": -41.807796478271484, "global_step": 348675, "epoch": 2881} {"train_loss": -42.488807678222656, "global_step": 348676, "epoch": 2881} {"train_loss": -43.1336669921875, "global_step": 348677, "epoch": 2881} {"train_loss": -42.758705139160156, "global_step": 348678, "epoch": 2881} {"train_loss": -41.3259391784668, "global_step": 348679, "epoch": 2881} {"train_loss": -42.61509323120117, "global_step": 348680, "epoch": 2881} {"train_loss": -41.8193359375, "global_step": 348681, "epoch": 2881} {"train_loss": -42.288028717041016, "global_step": 348682, "epoch": 2881} {"train_loss": -42.26283645629883, "global_step": 348683, "epoch": 2881} {"train_loss": -42.6323356628418, "global_step": 348684, "epoch": 2881} {"train_loss": -42.73427200317383, "global_step": 348685, "epoch": 2881} {"train_loss": -42.7828483581543, "global_step": 348686, "epoch": 2881} {"train_loss": -42.87772750854492, "global_step": 348687, "epoch": 2881} {"train_loss": -40.94926834106445, "global_step": 348688, "epoch": 2881} {"train_loss": -42.04270553588867, "global_step": 348689, "epoch": 2881} {"train_loss": -42.632347106933594, "global_step": 348690, "epoch": 2881} {"train_loss": -42.73410415649414, "global_step": 348691, "epoch": 2881} {"train_loss": -42.75164794921875, "global_step": 348692, "epoch": 2881} {"train_loss": -42.329341888427734, "global_step": 348693, "epoch": 2881} {"train_loss": -41.25489044189453, "global_step": 348694, "epoch": 2881} {"train_loss": -42.049495697021484, "global_step": 348695, "epoch": 2881} {"train_loss": -42.044185638427734, "global_step": 348696, "epoch": 2881} {"train_loss": -42.05593490600586, "global_step": 348697, "epoch": 2881} {"train_loss": -41.96894454956055, "global_step": 348698, "epoch": 2881} {"train_loss": -42.982505798339844, "global_step": 348699, "epoch": 2881} {"train_loss": -41.72480392456055, "global_step": 348700, "epoch": 2881} {"train_loss": -41.83639144897461, "global_step": 348701, "epoch": 2881} {"train_loss": -43.49810028076172, "global_step": 348702, "epoch": 2881} {"train_loss": -42.7735710144043, "global_step": 348703, "epoch": 2881} {"train_loss": -41.513301849365234, "global_step": 348704, "epoch": 2881} {"train_loss": -41.69194793701172, "global_step": 348705, "epoch": 2881} {"train_loss": -42.89974594116211, "global_step": 348706, "epoch": 2881} {"train_loss": -43.17647933959961, "global_step": 348707, "epoch": 2881} {"train_loss": -42.978397369384766, "global_step": 348708, "epoch": 2881} {"train_loss": -42.37076950073242, "global_step": 348709, "epoch": 2881} {"train_loss": -42.24870300292969, "global_step": 348710, "epoch": 2881} {"train_loss": -43.592708587646484, "global_step": 348711, "epoch": 2881} {"train_loss": -43.04774475097656, "global_step": 348712, "epoch": 2881} {"train_loss": -43.66532516479492, "global_step": 348713, "epoch": 2881} {"train_loss": -42.0456657409668, "global_step": 348714, "epoch": 2881} {"train_loss": -42.3872184753418, "global_step": 348715, "epoch": 2881} {"train_loss": -43.40208053588867, "global_step": 348716, "epoch": 2881} {"train_loss": -43.41044235229492, "global_step": 348717, "epoch": 2881} {"train_loss": -43.090370178222656, "global_step": 348718, "epoch": 2881} {"train_loss": -43.2527961730957, "global_step": 348719, "epoch": 2881} {"train_loss": -43.12930679321289, "global_step": 348720, "epoch": 2881} {"train_loss": -41.26464709762699, "global_step": 348721, "epoch": 2881, "val_loss": 2600557.25} {"train_loss": -43.3947639465332, "global_step": 348722, "epoch": 2882} {"train_loss": -42.438575744628906, "global_step": 348723, "epoch": 2882} {"train_loss": -43.98579788208008, "global_step": 348724, "epoch": 2882} {"train_loss": -42.7427978515625, "global_step": 348725, "epoch": 2882} {"train_loss": -42.5885009765625, "global_step": 348726, "epoch": 2882} {"train_loss": -41.598106384277344, "global_step": 348727, "epoch": 2882} {"train_loss": -43.22548294067383, "global_step": 348728, "epoch": 2882} {"train_loss": -42.102294921875, "global_step": 348729, "epoch": 2882} {"train_loss": -39.66754913330078, "global_step": 348730, "epoch": 2882} {"train_loss": -38.5782470703125, "global_step": 348731, "epoch": 2882} {"train_loss": -37.611568450927734, "global_step": 348732, "epoch": 2882} {"train_loss": -37.024837493896484, "global_step": 348733, "epoch": 2882} {"train_loss": -41.49404525756836, "global_step": 348734, "epoch": 2882} {"train_loss": -38.7708854675293, "global_step": 348735, "epoch": 2882} {"train_loss": -37.407562255859375, "global_step": 348736, "epoch": 2882} {"train_loss": -40.98573684692383, "global_step": 348737, "epoch": 2882} {"train_loss": -37.191192626953125, "global_step": 348738, "epoch": 2882} {"train_loss": -39.1731071472168, "global_step": 348739, "epoch": 2882} {"train_loss": -39.56061935424805, "global_step": 348740, "epoch": 2882} {"train_loss": -35.779109954833984, "global_step": 348741, "epoch": 2882} {"train_loss": -40.83018112182617, "global_step": 348742, "epoch": 2882} {"train_loss": -38.48101806640625, "global_step": 348743, "epoch": 2882} {"train_loss": -38.608158111572266, "global_step": 348744, "epoch": 2882} {"train_loss": -39.59884262084961, "global_step": 348745, "epoch": 2882} {"train_loss": -40.3643798828125, "global_step": 348746, "epoch": 2882} {"train_loss": -41.39482116699219, "global_step": 348747, "epoch": 2882} {"train_loss": -39.554443359375, "global_step": 348748, "epoch": 2882} {"train_loss": -41.40108871459961, "global_step": 348749, "epoch": 2882} {"train_loss": -40.26128005981445, "global_step": 348750, "epoch": 2882} {"train_loss": -42.456520080566406, "global_step": 348751, "epoch": 2882} {"train_loss": -39.07888412475586, "global_step": 348752, "epoch": 2882} {"train_loss": -42.3570442199707, "global_step": 348753, "epoch": 2882} {"train_loss": -41.1470947265625, "global_step": 348754, "epoch": 2882} {"train_loss": -41.752071380615234, "global_step": 348755, "epoch": 2882} {"train_loss": -42.20586395263672, "global_step": 348756, "epoch": 2882} {"train_loss": -40.11994171142578, "global_step": 348757, "epoch": 2882} {"train_loss": -42.4847526550293, "global_step": 348758, "epoch": 2882} {"train_loss": -39.72351837158203, "global_step": 348759, "epoch": 2882} {"train_loss": -41.0501594543457, "global_step": 348760, "epoch": 2882} {"train_loss": -42.424903869628906, "global_step": 348761, "epoch": 2882} {"train_loss": -41.0898551940918, "global_step": 348762, "epoch": 2882} {"train_loss": -41.73261260986328, "global_step": 348763, "epoch": 2882} {"train_loss": -42.44050979614258, "global_step": 348764, "epoch": 2882} {"train_loss": -41.84507369995117, "global_step": 348765, "epoch": 2882} {"train_loss": -41.904109954833984, "global_step": 348766, "epoch": 2882} {"train_loss": -41.02789306640625, "global_step": 348767, "epoch": 2882} {"train_loss": -42.83737564086914, "global_step": 348768, "epoch": 2882} {"train_loss": -42.285377502441406, "global_step": 348769, "epoch": 2882} {"train_loss": -42.874114990234375, "global_step": 348770, "epoch": 2882} {"train_loss": -42.80324935913086, "global_step": 348771, "epoch": 2882} {"train_loss": -42.648048400878906, "global_step": 348772, "epoch": 2882} {"train_loss": -43.281490325927734, "global_step": 348773, "epoch": 2882} {"train_loss": -42.360626220703125, "global_step": 348774, "epoch": 2882} {"train_loss": -43.26713180541992, "global_step": 348775, "epoch": 2882} {"train_loss": -43.05963897705078, "global_step": 348776, "epoch": 2882} {"train_loss": -42.71047592163086, "global_step": 348777, "epoch": 2882} {"train_loss": -43.342193603515625, "global_step": 348778, "epoch": 2882} {"train_loss": -43.0728645324707, "global_step": 348779, "epoch": 2882} {"train_loss": -42.18107986450195, "global_step": 348780, "epoch": 2882} {"train_loss": -43.498512268066406, "global_step": 348781, "epoch": 2882} {"train_loss": -43.69259262084961, "global_step": 348782, "epoch": 2882} {"train_loss": -43.136226654052734, "global_step": 348783, "epoch": 2882} {"train_loss": -43.54119110107422, "global_step": 348784, "epoch": 2882} {"train_loss": -43.04549789428711, "global_step": 348785, "epoch": 2882} {"train_loss": -42.22053909301758, "global_step": 348786, "epoch": 2882} {"train_loss": -42.79292678833008, "global_step": 348787, "epoch": 2882} {"train_loss": -43.10658645629883, "global_step": 348788, "epoch": 2882} {"train_loss": -42.88509750366211, "global_step": 348789, "epoch": 2882} {"train_loss": -43.6084098815918, "global_step": 348790, "epoch": 2882} {"train_loss": -42.80042266845703, "global_step": 348791, "epoch": 2882} {"train_loss": -43.53104782104492, "global_step": 348792, "epoch": 2882} {"train_loss": -43.311622619628906, "global_step": 348793, "epoch": 2882} {"train_loss": -43.484779357910156, "global_step": 348794, "epoch": 2882} {"train_loss": -43.794002532958984, "global_step": 348795, "epoch": 2882} {"train_loss": -42.5123405456543, "global_step": 348796, "epoch": 2882} {"train_loss": -43.76742172241211, "global_step": 348797, "epoch": 2882} {"train_loss": -43.45083999633789, "global_step": 348798, "epoch": 2882} {"train_loss": -43.72726058959961, "global_step": 348799, "epoch": 2882} {"train_loss": -43.3112678527832, "global_step": 348800, "epoch": 2882} {"train_loss": -43.48426055908203, "global_step": 348801, "epoch": 2882} {"train_loss": -43.08454513549805, "global_step": 348802, "epoch": 2882} {"train_loss": -43.242122650146484, "global_step": 348803, "epoch": 2882} {"train_loss": -42.91117477416992, "global_step": 348804, "epoch": 2882} {"train_loss": -43.46309280395508, "global_step": 348805, "epoch": 2882} {"train_loss": -42.95418930053711, "global_step": 348806, "epoch": 2882} {"train_loss": -43.253170013427734, "global_step": 348807, "epoch": 2882} {"train_loss": -42.93095016479492, "global_step": 348808, "epoch": 2882} {"train_loss": -43.42410659790039, "global_step": 348809, "epoch": 2882} {"train_loss": -43.78717041015625, "global_step": 348810, "epoch": 2882} {"train_loss": -43.17019271850586, "global_step": 348811, "epoch": 2882} {"train_loss": -43.76561737060547, "global_step": 348812, "epoch": 2882} {"train_loss": -43.73667526245117, "global_step": 348813, "epoch": 2882} {"train_loss": -43.528133392333984, "global_step": 348814, "epoch": 2882} {"train_loss": -41.486328125, "global_step": 348815, "epoch": 2882} {"train_loss": -43.47760772705078, "global_step": 348816, "epoch": 2882} {"train_loss": -43.613983154296875, "global_step": 348817, "epoch": 2882} {"train_loss": -42.78761672973633, "global_step": 348818, "epoch": 2882} {"train_loss": -43.16884231567383, "global_step": 348819, "epoch": 2882} {"train_loss": -43.06293487548828, "global_step": 348820, "epoch": 2882} {"train_loss": -42.05703353881836, "global_step": 348821, "epoch": 2882} {"train_loss": -43.77293014526367, "global_step": 348822, "epoch": 2882} {"train_loss": -43.7545051574707, "global_step": 348823, "epoch": 2882} {"train_loss": -43.42537307739258, "global_step": 348824, "epoch": 2882} {"train_loss": -44.123836517333984, "global_step": 348825, "epoch": 2882} {"train_loss": -43.86513900756836, "global_step": 348826, "epoch": 2882} {"train_loss": -43.60954666137695, "global_step": 348827, "epoch": 2882} {"train_loss": -43.40044021606445, "global_step": 348828, "epoch": 2882} {"train_loss": -42.881935119628906, "global_step": 348829, "epoch": 2882} {"train_loss": -40.467140197753906, "global_step": 348830, "epoch": 2882} {"train_loss": -37.029090881347656, "global_step": 348831, "epoch": 2882} {"train_loss": -28.010541915893555, "global_step": 348832, "epoch": 2882} {"train_loss": -26.228551864624023, "global_step": 348833, "epoch": 2882} {"train_loss": -39.27992630004883, "global_step": 348834, "epoch": 2882} {"train_loss": -37.362060546875, "global_step": 348835, "epoch": 2882} {"train_loss": -30.434919357299805, "global_step": 348836, "epoch": 2882} {"train_loss": -39.24951171875, "global_step": 348837, "epoch": 2882} {"train_loss": -37.24229431152344, "global_step": 348838, "epoch": 2882} {"train_loss": -39.27273178100586, "global_step": 348839, "epoch": 2882} {"train_loss": -37.859046936035156, "global_step": 348840, "epoch": 2882} {"train_loss": -37.99795913696289, "global_step": 348841, "epoch": 2882} {"train_loss": -41.3873816876372, "global_step": 348842, "epoch": 2882, "val_loss": 2698842.0} {"train_loss": -34.50149154663086, "global_step": 348843, "epoch": 2883} {"train_loss": -32.019466400146484, "global_step": 348844, "epoch": 2883} {"train_loss": -34.63801193237305, "global_step": 348845, "epoch": 2883} {"train_loss": -39.26325607299805, "global_step": 348846, "epoch": 2883} {"train_loss": -28.633148193359375, "global_step": 348847, "epoch": 2883} {"train_loss": -35.906227111816406, "global_step": 348848, "epoch": 2883} {"train_loss": -39.93013381958008, "global_step": 348849, "epoch": 2883} {"train_loss": -34.51729202270508, "global_step": 348850, "epoch": 2883} {"train_loss": -33.1596794128418, "global_step": 348851, "epoch": 2883} {"train_loss": -40.630619049072266, "global_step": 348852, "epoch": 2883} {"train_loss": -40.63348388671875, "global_step": 348853, "epoch": 2883} {"train_loss": -36.57204055786133, "global_step": 348854, "epoch": 2883} {"train_loss": -38.39500045776367, "global_step": 348855, "epoch": 2883} {"train_loss": -41.25600051879883, "global_step": 348856, "epoch": 2883} {"train_loss": -39.3148307800293, "global_step": 348857, "epoch": 2883} {"train_loss": -38.0303955078125, "global_step": 348858, "epoch": 2883} {"train_loss": -38.7064094543457, "global_step": 348859, "epoch": 2883} {"train_loss": -40.95361328125, "global_step": 348860, "epoch": 2883} {"train_loss": -41.11788558959961, "global_step": 348861, "epoch": 2883} {"train_loss": -41.284976959228516, "global_step": 348862, "epoch": 2883} {"train_loss": -37.81519317626953, "global_step": 348863, "epoch": 2883} {"train_loss": -40.03983688354492, "global_step": 348864, "epoch": 2883} {"train_loss": -40.678131103515625, "global_step": 348865, "epoch": 2883} {"train_loss": -41.65182113647461, "global_step": 348866, "epoch": 2883} {"train_loss": -41.707393646240234, "global_step": 348867, "epoch": 2883} {"train_loss": -41.23784637451172, "global_step": 348868, "epoch": 2883} {"train_loss": -41.592342376708984, "global_step": 348869, "epoch": 2883} {"train_loss": -41.64333724975586, "global_step": 348870, "epoch": 2883} {"train_loss": -41.32149887084961, "global_step": 348871, "epoch": 2883} {"train_loss": -41.27412414550781, "global_step": 348872, "epoch": 2883} {"train_loss": -41.47347640991211, "global_step": 348873, "epoch": 2883} {"train_loss": -42.048492431640625, "global_step": 348874, "epoch": 2883} {"train_loss": -41.66378402709961, "global_step": 348875, "epoch": 2883} {"train_loss": -42.198081970214844, "global_step": 348876, "epoch": 2883} {"train_loss": -41.21066665649414, "global_step": 348877, "epoch": 2883} {"train_loss": -41.996337890625, "global_step": 348878, "epoch": 2883} {"train_loss": -42.30379867553711, "global_step": 348879, "epoch": 2883} {"train_loss": -41.75502395629883, "global_step": 348880, "epoch": 2883} {"train_loss": -42.34320068359375, "global_step": 348881, "epoch": 2883} {"train_loss": -42.6080322265625, "global_step": 348882, "epoch": 2883} {"train_loss": -42.04082107543945, "global_step": 348883, "epoch": 2883} {"train_loss": -42.08561325073242, "global_step": 348884, "epoch": 2883} {"train_loss": -42.515621185302734, "global_step": 348885, "epoch": 2883} {"train_loss": -42.09469223022461, "global_step": 348886, "epoch": 2883} {"train_loss": -42.7253303527832, "global_step": 348887, "epoch": 2883} {"train_loss": -42.12520217895508, "global_step": 348888, "epoch": 2883} {"train_loss": -42.93980407714844, "global_step": 348889, "epoch": 2883} {"train_loss": -41.90119934082031, "global_step": 348890, "epoch": 2883} {"train_loss": -42.775630950927734, "global_step": 348891, "epoch": 2883} {"train_loss": -43.34833526611328, "global_step": 348892, "epoch": 2883} {"train_loss": -42.735618591308594, "global_step": 348893, "epoch": 2883} {"train_loss": -42.67906188964844, "global_step": 348894, "epoch": 2883} {"train_loss": -42.64164733886719, "global_step": 348895, "epoch": 2883} {"train_loss": -43.205039978027344, "global_step": 348896, "epoch": 2883} {"train_loss": -42.51167678833008, "global_step": 348897, "epoch": 2883} {"train_loss": -42.81435012817383, "global_step": 348898, "epoch": 2883} {"train_loss": -42.534542083740234, "global_step": 348899, "epoch": 2883} {"train_loss": -42.87907028198242, "global_step": 348900, "epoch": 2883} {"train_loss": -42.84480285644531, "global_step": 348901, "epoch": 2883} {"train_loss": -43.564117431640625, "global_step": 348902, "epoch": 2883} {"train_loss": -43.48491287231445, "global_step": 348903, "epoch": 2883} {"train_loss": -43.35197067260742, "global_step": 348904, "epoch": 2883} {"train_loss": -43.38847732543945, "global_step": 348905, "epoch": 2883} {"train_loss": -43.49245834350586, "global_step": 348906, "epoch": 2883} {"train_loss": -43.3656005859375, "global_step": 348907, "epoch": 2883} {"train_loss": -43.66396713256836, "global_step": 348908, "epoch": 2883} {"train_loss": -43.63543701171875, "global_step": 348909, "epoch": 2883} {"train_loss": -43.71998977661133, "global_step": 348910, "epoch": 2883} {"train_loss": -42.50206756591797, "global_step": 348911, "epoch": 2883} {"train_loss": -43.58230209350586, "global_step": 348912, "epoch": 2883} {"train_loss": -43.350276947021484, "global_step": 348913, "epoch": 2883} {"train_loss": -43.90656280517578, "global_step": 348914, "epoch": 2883} {"train_loss": -43.67097473144531, "global_step": 348915, "epoch": 2883} {"train_loss": -43.99984359741211, "global_step": 348916, "epoch": 2883} {"train_loss": -43.6866455078125, "global_step": 348917, "epoch": 2883} {"train_loss": -44.09333419799805, "global_step": 348918, "epoch": 2883} {"train_loss": -43.32859802246094, "global_step": 348919, "epoch": 2883} {"train_loss": -43.24383544921875, "global_step": 348920, "epoch": 2883} {"train_loss": -43.882965087890625, "global_step": 348921, "epoch": 2883} {"train_loss": -43.55363082885742, "global_step": 348922, "epoch": 2883} {"train_loss": -44.26897048950195, "global_step": 348923, "epoch": 2883} {"train_loss": -44.017066955566406, "global_step": 348924, "epoch": 2883} {"train_loss": -44.187686920166016, "global_step": 348925, "epoch": 2883} {"train_loss": -44.238582611083984, "global_step": 348926, "epoch": 2883} {"train_loss": -44.0515251159668, "global_step": 348927, "epoch": 2883} {"train_loss": -43.72201156616211, "global_step": 348928, "epoch": 2883} {"train_loss": -44.27033996582031, "global_step": 348929, "epoch": 2883} {"train_loss": -44.677001953125, "global_step": 348930, "epoch": 2883} {"train_loss": -43.03816604614258, "global_step": 348931, "epoch": 2883} {"train_loss": -43.57042694091797, "global_step": 348932, "epoch": 2883} {"train_loss": -43.04526138305664, "global_step": 348933, "epoch": 2883} {"train_loss": -42.2474479675293, "global_step": 348934, "epoch": 2883} {"train_loss": -40.34815216064453, "global_step": 348935, "epoch": 2883} {"train_loss": -38.105220794677734, "global_step": 348936, "epoch": 2883} {"train_loss": -33.23708724975586, "global_step": 348937, "epoch": 2883} {"train_loss": -35.526912689208984, "global_step": 348938, "epoch": 2883} {"train_loss": -43.54459762573242, "global_step": 348939, "epoch": 2883} {"train_loss": -40.262413024902344, "global_step": 348940, "epoch": 2883} {"train_loss": -37.352046966552734, "global_step": 348941, "epoch": 2883} {"train_loss": -43.33087158203125, "global_step": 348942, "epoch": 2883} {"train_loss": -40.807552337646484, "global_step": 348943, "epoch": 2883} {"train_loss": -39.90603256225586, "global_step": 348944, "epoch": 2883} {"train_loss": -43.18323516845703, "global_step": 348945, "epoch": 2883} {"train_loss": -39.21189498901367, "global_step": 348946, "epoch": 2883} {"train_loss": -43.15279769897461, "global_step": 348947, "epoch": 2883} {"train_loss": -40.64447021484375, "global_step": 348948, "epoch": 2883} {"train_loss": -40.54274368286133, "global_step": 348949, "epoch": 2883} {"train_loss": -42.38750076293945, "global_step": 348950, "epoch": 2883} {"train_loss": -41.0005989074707, "global_step": 348951, "epoch": 2883} {"train_loss": -43.121063232421875, "global_step": 348952, "epoch": 2883} {"train_loss": -41.41933822631836, "global_step": 348953, "epoch": 2883} {"train_loss": -42.881378173828125, "global_step": 348954, "epoch": 2883} {"train_loss": -42.10757064819336, "global_step": 348955, "epoch": 2883} {"train_loss": -43.37156295776367, "global_step": 348956, "epoch": 2883} {"train_loss": -40.302223205566406, "global_step": 348957, "epoch": 2883} {"train_loss": -43.16488265991211, "global_step": 348958, "epoch": 2883} {"train_loss": -42.054622650146484, "global_step": 348959, "epoch": 2883} {"train_loss": -43.56898498535156, "global_step": 348960, "epoch": 2883} {"train_loss": -41.57503128051758, "global_step": 348961, "epoch": 2883} {"train_loss": -43.67324447631836, "global_step": 348962, "epoch": 2883} {"train_loss": -41.48321085527909, "global_step": 348963, "epoch": 2883, "val_loss": 2531820.0} {"train_loss": -43.06029510498047, "global_step": 348964, "epoch": 2884} {"train_loss": -42.13117980957031, "global_step": 348965, "epoch": 2884} {"train_loss": -43.36175537109375, "global_step": 348966, "epoch": 2884} {"train_loss": -42.243350982666016, "global_step": 348967, "epoch": 2884} {"train_loss": -43.432003021240234, "global_step": 348968, "epoch": 2884} {"train_loss": -42.671993255615234, "global_step": 348969, "epoch": 2884} {"train_loss": -43.3560791015625, "global_step": 348970, "epoch": 2884} {"train_loss": -43.31439208984375, "global_step": 348971, "epoch": 2884} {"train_loss": -43.32354736328125, "global_step": 348972, "epoch": 2884} {"train_loss": -43.76884460449219, "global_step": 348973, "epoch": 2884} {"train_loss": -43.54946517944336, "global_step": 348974, "epoch": 2884} {"train_loss": -43.448822021484375, "global_step": 348975, "epoch": 2884} {"train_loss": -43.82624435424805, "global_step": 348976, "epoch": 2884} {"train_loss": -43.63747024536133, "global_step": 348977, "epoch": 2884} {"train_loss": -42.74378204345703, "global_step": 348978, "epoch": 2884} {"train_loss": -43.806053161621094, "global_step": 348979, "epoch": 2884} {"train_loss": -44.232173919677734, "global_step": 348980, "epoch": 2884} {"train_loss": -44.144020080566406, "global_step": 348981, "epoch": 2884} {"train_loss": -43.526527404785156, "global_step": 348982, "epoch": 2884} {"train_loss": -42.95685958862305, "global_step": 348983, "epoch": 2884} {"train_loss": -43.40572738647461, "global_step": 348984, "epoch": 2884} {"train_loss": -44.12278366088867, "global_step": 348985, "epoch": 2884} {"train_loss": -43.46586608886719, "global_step": 348986, "epoch": 2884} {"train_loss": -43.89992904663086, "global_step": 348987, "epoch": 2884} {"train_loss": -43.46052169799805, "global_step": 348988, "epoch": 2884} {"train_loss": -43.978843688964844, "global_step": 348989, "epoch": 2884} {"train_loss": -43.92143630981445, "global_step": 348990, "epoch": 2884} {"train_loss": -43.471229553222656, "global_step": 348991, "epoch": 2884} {"train_loss": -43.42987823486328, "global_step": 348992, "epoch": 2884} {"train_loss": -44.10022735595703, "global_step": 348993, "epoch": 2884} {"train_loss": -43.31528854370117, "global_step": 348994, "epoch": 2884} {"train_loss": -43.09564971923828, "global_step": 348995, "epoch": 2884} {"train_loss": -43.199134826660156, "global_step": 348996, "epoch": 2884} {"train_loss": -44.15764236450195, "global_step": 348997, "epoch": 2884} {"train_loss": -43.9450798034668, "global_step": 348998, "epoch": 2884} {"train_loss": -43.55583572387695, "global_step": 348999, "epoch": 2884} {"train_loss": -43.176204681396484, "global_step": 349000, "epoch": 2884} {"train_loss": -44.148597717285156, "global_step": 349001, "epoch": 2884} {"train_loss": -44.284820556640625, "global_step": 349002, "epoch": 2884} {"train_loss": -43.692291259765625, "global_step": 349003, "epoch": 2884} {"train_loss": -43.885189056396484, "global_step": 349004, "epoch": 2884} {"train_loss": -44.290584564208984, "global_step": 349005, "epoch": 2884} {"train_loss": -44.634521484375, "global_step": 349006, "epoch": 2884} {"train_loss": -44.054298400878906, "global_step": 349007, "epoch": 2884} {"train_loss": -44.509456634521484, "global_step": 349008, "epoch": 2884} {"train_loss": -43.95469284057617, "global_step": 349009, "epoch": 2884} {"train_loss": -43.37091827392578, "global_step": 349010, "epoch": 2884} {"train_loss": -42.83001708984375, "global_step": 349011, "epoch": 2884} {"train_loss": -44.4759521484375, "global_step": 349012, "epoch": 2884} {"train_loss": -44.04072189331055, "global_step": 349013, "epoch": 2884} {"train_loss": -43.55990219116211, "global_step": 349014, "epoch": 2884} {"train_loss": -44.62715530395508, "global_step": 349015, "epoch": 2884} {"train_loss": -44.4414176940918, "global_step": 349016, "epoch": 2884} {"train_loss": -44.30352783203125, "global_step": 349017, "epoch": 2884} {"train_loss": -43.643978118896484, "global_step": 349018, "epoch": 2884} {"train_loss": -44.725337982177734, "global_step": 349019, "epoch": 2884} {"train_loss": -44.35670852661133, "global_step": 349020, "epoch": 2884} {"train_loss": -44.505916595458984, "global_step": 349021, "epoch": 2884} {"train_loss": -43.588924407958984, "global_step": 349022, "epoch": 2884} {"train_loss": -43.22285079956055, "global_step": 349023, "epoch": 2884} {"train_loss": -43.46815872192383, "global_step": 349024, "epoch": 2884} {"train_loss": -44.490108489990234, "global_step": 349025, "epoch": 2884} {"train_loss": -43.4821891784668, "global_step": 349026, "epoch": 2884} {"train_loss": -43.82889938354492, "global_step": 349027, "epoch": 2884} {"train_loss": -44.356605529785156, "global_step": 349028, "epoch": 2884} {"train_loss": -44.02292251586914, "global_step": 349029, "epoch": 2884} {"train_loss": -44.03803634643555, "global_step": 349030, "epoch": 2884} {"train_loss": -44.31510543823242, "global_step": 349031, "epoch": 2884} {"train_loss": -44.082275390625, "global_step": 349032, "epoch": 2884} {"train_loss": -44.38031005859375, "global_step": 349033, "epoch": 2884} {"train_loss": -44.58175277709961, "global_step": 349034, "epoch": 2884} {"train_loss": -43.70466995239258, "global_step": 349035, "epoch": 2884} {"train_loss": -44.63179016113281, "global_step": 349036, "epoch": 2884} {"train_loss": -42.56088638305664, "global_step": 349037, "epoch": 2884} {"train_loss": -43.76879119873047, "global_step": 349038, "epoch": 2884} {"train_loss": -44.102909088134766, "global_step": 349039, "epoch": 2884} {"train_loss": -43.962154388427734, "global_step": 349040, "epoch": 2884} {"train_loss": -43.97041320800781, "global_step": 349041, "epoch": 2884} {"train_loss": -43.05259323120117, "global_step": 349042, "epoch": 2884} {"train_loss": -40.91392135620117, "global_step": 349043, "epoch": 2884} {"train_loss": -40.672630310058594, "global_step": 349044, "epoch": 2884} {"train_loss": -42.01924514770508, "global_step": 349045, "epoch": 2884} {"train_loss": -42.25031280517578, "global_step": 349046, "epoch": 2884} {"train_loss": -42.3006706237793, "global_step": 349047, "epoch": 2884} {"train_loss": -42.613094329833984, "global_step": 349048, "epoch": 2884} {"train_loss": -42.05754852294922, "global_step": 349049, "epoch": 2884} {"train_loss": -41.81393051147461, "global_step": 349050, "epoch": 2884} {"train_loss": -40.9272575378418, "global_step": 349051, "epoch": 2884} {"train_loss": -43.172691345214844, "global_step": 349052, "epoch": 2884} {"train_loss": -42.77587890625, "global_step": 349053, "epoch": 2884} {"train_loss": -40.25879669189453, "global_step": 349054, "epoch": 2884} {"train_loss": -37.780967712402344, "global_step": 349055, "epoch": 2884} {"train_loss": -41.65320587158203, "global_step": 349056, "epoch": 2884} {"train_loss": -42.6800537109375, "global_step": 349057, "epoch": 2884} {"train_loss": -39.344337463378906, "global_step": 349058, "epoch": 2884} {"train_loss": -42.3576545715332, "global_step": 349059, "epoch": 2884} {"train_loss": -43.252716064453125, "global_step": 349060, "epoch": 2884} {"train_loss": -41.85734176635742, "global_step": 349061, "epoch": 2884} {"train_loss": -42.419166564941406, "global_step": 349062, "epoch": 2884} {"train_loss": -42.02096176147461, "global_step": 349063, "epoch": 2884} {"train_loss": -42.7081298828125, "global_step": 349064, "epoch": 2884} {"train_loss": -41.04490280151367, "global_step": 349065, "epoch": 2884} {"train_loss": -42.5174560546875, "global_step": 349066, "epoch": 2884} {"train_loss": -42.9572639465332, "global_step": 349067, "epoch": 2884} {"train_loss": -42.501708984375, "global_step": 349068, "epoch": 2884} {"train_loss": -43.437278747558594, "global_step": 349069, "epoch": 2884} {"train_loss": -43.077239990234375, "global_step": 349070, "epoch": 2884} {"train_loss": -43.56187057495117, "global_step": 349071, "epoch": 2884} {"train_loss": -42.03957748413086, "global_step": 349072, "epoch": 2884} {"train_loss": -43.35934829711914, "global_step": 349073, "epoch": 2884} {"train_loss": -43.48441696166992, "global_step": 349074, "epoch": 2884} {"train_loss": -41.987762451171875, "global_step": 349075, "epoch": 2884} {"train_loss": -43.52301025390625, "global_step": 349076, "epoch": 2884} {"train_loss": -43.4415283203125, "global_step": 349077, "epoch": 2884} {"train_loss": -43.81144714355469, "global_step": 349078, "epoch": 2884} {"train_loss": -42.44847869873047, "global_step": 349079, "epoch": 2884} {"train_loss": -42.467350006103516, "global_step": 349080, "epoch": 2884} {"train_loss": -44.141788482666016, "global_step": 349081, "epoch": 2884} {"train_loss": -44.22057342529297, "global_step": 349082, "epoch": 2884} {"train_loss": -43.95476531982422, "global_step": 349083, "epoch": 2884} {"train_loss": -43.27413079758321, "global_step": 349084, "epoch": 2884, "val_loss": 2517537.75} {"train_loss": -43.22745895385742, "global_step": 349085, "epoch": 2885} {"train_loss": -44.083805084228516, "global_step": 349086, "epoch": 2885} {"train_loss": -37.886070251464844, "global_step": 349087, "epoch": 2885} {"train_loss": -42.34384536743164, "global_step": 349088, "epoch": 2885} {"train_loss": -44.17741012573242, "global_step": 349089, "epoch": 2885} {"train_loss": -39.53046798706055, "global_step": 349090, "epoch": 2885} {"train_loss": -43.525184631347656, "global_step": 349091, "epoch": 2885} {"train_loss": -43.14205551147461, "global_step": 349092, "epoch": 2885} {"train_loss": -42.26829147338867, "global_step": 349093, "epoch": 2885} {"train_loss": -29.548852920532227, "global_step": 349094, "epoch": 2885} {"train_loss": -43.46536636352539, "global_step": 349095, "epoch": 2885} {"train_loss": -43.57661056518555, "global_step": 349096, "epoch": 2885} {"train_loss": -37.90428924560547, "global_step": 349097, "epoch": 2885} {"train_loss": -41.96190643310547, "global_step": 349098, "epoch": 2885} {"train_loss": -21.64417839050293, "global_step": 349099, "epoch": 2885} {"train_loss": -33.85820007324219, "global_step": 349100, "epoch": 2885} {"train_loss": -35.19609069824219, "global_step": 349101, "epoch": 2885} {"train_loss": -40.090240478515625, "global_step": 349102, "epoch": 2885} {"train_loss": -42.7282600402832, "global_step": 349103, "epoch": 2885} {"train_loss": -40.751590728759766, "global_step": 349104, "epoch": 2885} {"train_loss": -37.29953384399414, "global_step": 349105, "epoch": 2885} {"train_loss": -40.9661750793457, "global_step": 349106, "epoch": 2885} {"train_loss": -39.216243743896484, "global_step": 349107, "epoch": 2885} {"train_loss": -32.2692756652832, "global_step": 349108, "epoch": 2885} {"train_loss": -37.08170700073242, "global_step": 349109, "epoch": 2885} {"train_loss": -39.883853912353516, "global_step": 349110, "epoch": 2885} {"train_loss": -41.3638801574707, "global_step": 349111, "epoch": 2885} {"train_loss": -41.59717559814453, "global_step": 349112, "epoch": 2885} {"train_loss": -37.627750396728516, "global_step": 349113, "epoch": 2885} {"train_loss": -41.616798400878906, "global_step": 349114, "epoch": 2885} {"train_loss": -41.03160858154297, "global_step": 349115, "epoch": 2885} {"train_loss": -41.6213264465332, "global_step": 349116, "epoch": 2885} {"train_loss": -41.50715255737305, "global_step": 349117, "epoch": 2885} {"train_loss": -41.204444885253906, "global_step": 349118, "epoch": 2885} {"train_loss": -40.754493713378906, "global_step": 349119, "epoch": 2885} {"train_loss": -38.80759811401367, "global_step": 349120, "epoch": 2885} {"train_loss": -40.987911224365234, "global_step": 349121, "epoch": 2885} {"train_loss": -41.68416976928711, "global_step": 349122, "epoch": 2885} {"train_loss": -41.96046447753906, "global_step": 349123, "epoch": 2885} {"train_loss": -42.07958221435547, "global_step": 349124, "epoch": 2885} {"train_loss": -41.95982360839844, "global_step": 349125, "epoch": 2885} {"train_loss": -41.476863861083984, "global_step": 349126, "epoch": 2885} {"train_loss": -42.552371978759766, "global_step": 349127, "epoch": 2885} {"train_loss": -37.423553466796875, "global_step": 349128, "epoch": 2885} {"train_loss": -38.93239974975586, "global_step": 349129, "epoch": 2885} {"train_loss": -41.006103515625, "global_step": 349130, "epoch": 2885} {"train_loss": -42.564308166503906, "global_step": 349131, "epoch": 2885} {"train_loss": -41.76241683959961, "global_step": 349132, "epoch": 2885} {"train_loss": -41.61159896850586, "global_step": 349133, "epoch": 2885} {"train_loss": -40.77771759033203, "global_step": 349134, "epoch": 2885} {"train_loss": -42.34988021850586, "global_step": 349135, "epoch": 2885} {"train_loss": -41.23992156982422, "global_step": 349136, "epoch": 2885} {"train_loss": -39.30257797241211, "global_step": 349137, "epoch": 2885} {"train_loss": -42.81209182739258, "global_step": 349138, "epoch": 2885} {"train_loss": -42.04273223876953, "global_step": 349139, "epoch": 2885} {"train_loss": -41.484981536865234, "global_step": 349140, "epoch": 2885} {"train_loss": -42.874969482421875, "global_step": 349141, "epoch": 2885} {"train_loss": -42.77451705932617, "global_step": 349142, "epoch": 2885} {"train_loss": -39.708404541015625, "global_step": 349143, "epoch": 2885} {"train_loss": -41.63116455078125, "global_step": 349144, "epoch": 2885} {"train_loss": -41.40482711791992, "global_step": 349145, "epoch": 2885} {"train_loss": -41.694400787353516, "global_step": 349146, "epoch": 2885} {"train_loss": -40.60190200805664, "global_step": 349147, "epoch": 2885} {"train_loss": -40.006103515625, "global_step": 349148, "epoch": 2885} {"train_loss": -41.66908645629883, "global_step": 349149, "epoch": 2885} {"train_loss": -42.29863357543945, "global_step": 349150, "epoch": 2885} {"train_loss": -42.804443359375, "global_step": 349151, "epoch": 2885} {"train_loss": -41.68189239501953, "global_step": 349152, "epoch": 2885} {"train_loss": -43.26997756958008, "global_step": 349153, "epoch": 2885} {"train_loss": -42.658447265625, "global_step": 349154, "epoch": 2885} {"train_loss": -42.7192497253418, "global_step": 349155, "epoch": 2885} {"train_loss": -42.42139434814453, "global_step": 349156, "epoch": 2885} {"train_loss": -42.241058349609375, "global_step": 349157, "epoch": 2885} {"train_loss": -42.08392333984375, "global_step": 349158, "epoch": 2885} {"train_loss": -41.08572006225586, "global_step": 349159, "epoch": 2885} {"train_loss": -42.733802795410156, "global_step": 349160, "epoch": 2885} {"train_loss": -43.02817916870117, "global_step": 349161, "epoch": 2885} {"train_loss": -42.73933029174805, "global_step": 349162, "epoch": 2885} {"train_loss": -42.8464241027832, "global_step": 349163, "epoch": 2885} {"train_loss": -43.69084930419922, "global_step": 349164, "epoch": 2885} {"train_loss": -43.26833724975586, "global_step": 349165, "epoch": 2885} {"train_loss": -42.30940246582031, "global_step": 349166, "epoch": 2885} {"train_loss": -43.343231201171875, "global_step": 349167, "epoch": 2885} {"train_loss": -43.30772018432617, "global_step": 349168, "epoch": 2885} {"train_loss": -40.72176742553711, "global_step": 349169, "epoch": 2885} {"train_loss": -42.07966232299805, "global_step": 349170, "epoch": 2885} {"train_loss": -43.01974868774414, "global_step": 349171, "epoch": 2885} {"train_loss": -39.515228271484375, "global_step": 349172, "epoch": 2885} {"train_loss": -42.8728141784668, "global_step": 349173, "epoch": 2885} {"train_loss": -43.059906005859375, "global_step": 349174, "epoch": 2885} {"train_loss": -42.367244720458984, "global_step": 349175, "epoch": 2885} {"train_loss": -43.02859115600586, "global_step": 349176, "epoch": 2885} {"train_loss": -43.40500259399414, "global_step": 349177, "epoch": 2885} {"train_loss": -43.91962814331055, "global_step": 349178, "epoch": 2885} {"train_loss": -43.840057373046875, "global_step": 349179, "epoch": 2885} {"train_loss": -43.221134185791016, "global_step": 349180, "epoch": 2885} {"train_loss": -43.189144134521484, "global_step": 349181, "epoch": 2885} {"train_loss": -43.5050163269043, "global_step": 349182, "epoch": 2885} {"train_loss": -41.917633056640625, "global_step": 349183, "epoch": 2885} {"train_loss": -42.533748626708984, "global_step": 349184, "epoch": 2885} {"train_loss": -42.76907730102539, "global_step": 349185, "epoch": 2885} {"train_loss": -43.335693359375, "global_step": 349186, "epoch": 2885} {"train_loss": -42.998958587646484, "global_step": 349187, "epoch": 2885} {"train_loss": -43.450531005859375, "global_step": 349188, "epoch": 2885} {"train_loss": -42.066646575927734, "global_step": 349189, "epoch": 2885} {"train_loss": -40.94999694824219, "global_step": 349190, "epoch": 2885} {"train_loss": -43.063846588134766, "global_step": 349191, "epoch": 2885} {"train_loss": -42.6921501159668, "global_step": 349192, "epoch": 2885} {"train_loss": -43.6525993347168, "global_step": 349193, "epoch": 2885} {"train_loss": -43.241973876953125, "global_step": 349194, "epoch": 2885} {"train_loss": -43.342140197753906, "global_step": 349195, "epoch": 2885} {"train_loss": -43.542564392089844, "global_step": 349196, "epoch": 2885} {"train_loss": -43.026241302490234, "global_step": 349197, "epoch": 2885} {"train_loss": -43.387325286865234, "global_step": 349198, "epoch": 2885} {"train_loss": -43.34641647338867, "global_step": 349199, "epoch": 2885} {"train_loss": -44.08701705932617, "global_step": 349200, "epoch": 2885} {"train_loss": -43.7735481262207, "global_step": 349201, "epoch": 2885} {"train_loss": -42.61021041870117, "global_step": 349202, "epoch": 2885} {"train_loss": -44.115257263183594, "global_step": 349203, "epoch": 2885} {"train_loss": -44.29594802856445, "global_step": 349204, "epoch": 2885} {"train_loss": -41.51551626536472, "global_step": 349205, "epoch": 2885, "val_loss": 2681699.0} {"train_loss": -44.206947326660156, "global_step": 349206, "epoch": 2886} {"train_loss": -42.2061767578125, "global_step": 349207, "epoch": 2886} {"train_loss": -43.17270278930664, "global_step": 349208, "epoch": 2886} {"train_loss": -43.658138275146484, "global_step": 349209, "epoch": 2886} {"train_loss": -44.25632858276367, "global_step": 349210, "epoch": 2886} {"train_loss": -44.19874954223633, "global_step": 349211, "epoch": 2886} {"train_loss": -43.72431564331055, "global_step": 349212, "epoch": 2886} {"train_loss": -43.900726318359375, "global_step": 349213, "epoch": 2886} {"train_loss": -44.225284576416016, "global_step": 349214, "epoch": 2886} {"train_loss": -44.04018783569336, "global_step": 349215, "epoch": 2886} {"train_loss": -44.43140411376953, "global_step": 349216, "epoch": 2886} {"train_loss": -44.0203971862793, "global_step": 349217, "epoch": 2886} {"train_loss": -44.335323333740234, "global_step": 349218, "epoch": 2886} {"train_loss": -44.1864128112793, "global_step": 349219, "epoch": 2886} {"train_loss": -44.544219970703125, "global_step": 349220, "epoch": 2886} {"train_loss": -44.18251419067383, "global_step": 349221, "epoch": 2886} {"train_loss": -44.126983642578125, "global_step": 349222, "epoch": 2886} {"train_loss": -43.354530334472656, "global_step": 349223, "epoch": 2886} {"train_loss": -43.76292419433594, "global_step": 349224, "epoch": 2886} {"train_loss": -44.2779426574707, "global_step": 349225, "epoch": 2886} {"train_loss": -44.45382308959961, "global_step": 349226, "epoch": 2886} {"train_loss": -44.262855529785156, "global_step": 349227, "epoch": 2886} {"train_loss": -44.14890670776367, "global_step": 349228, "epoch": 2886} {"train_loss": -43.68339920043945, "global_step": 349229, "epoch": 2886} {"train_loss": -44.47223663330078, "global_step": 349230, "epoch": 2886} {"train_loss": -43.9327507019043, "global_step": 349231, "epoch": 2886} {"train_loss": -43.30071258544922, "global_step": 349232, "epoch": 2886} {"train_loss": -43.47915267944336, "global_step": 349233, "epoch": 2886} {"train_loss": -42.050479888916016, "global_step": 349234, "epoch": 2886} {"train_loss": -44.44689178466797, "global_step": 349235, "epoch": 2886} {"train_loss": -44.010406494140625, "global_step": 349236, "epoch": 2886} {"train_loss": -43.95626449584961, "global_step": 349237, "epoch": 2886} {"train_loss": -43.88358688354492, "global_step": 349238, "epoch": 2886} {"train_loss": -41.937835693359375, "global_step": 349239, "epoch": 2886} {"train_loss": -44.47247314453125, "global_step": 349240, "epoch": 2886} {"train_loss": -41.41238021850586, "global_step": 349241, "epoch": 2886} {"train_loss": -44.25118637084961, "global_step": 349242, "epoch": 2886} {"train_loss": -43.379241943359375, "global_step": 349243, "epoch": 2886} {"train_loss": -44.74924087524414, "global_step": 349244, "epoch": 2886} {"train_loss": -43.98869705200195, "global_step": 349245, "epoch": 2886} {"train_loss": -43.91634750366211, "global_step": 349246, "epoch": 2886} {"train_loss": -43.4109992980957, "global_step": 349247, "epoch": 2886} {"train_loss": -41.836219787597656, "global_step": 349248, "epoch": 2886} {"train_loss": -42.87871170043945, "global_step": 349249, "epoch": 2886} {"train_loss": -42.82094192504883, "global_step": 349250, "epoch": 2886} {"train_loss": -43.700111389160156, "global_step": 349251, "epoch": 2886} {"train_loss": -44.12540054321289, "global_step": 349252, "epoch": 2886} {"train_loss": -42.63193893432617, "global_step": 349253, "epoch": 2886} {"train_loss": -44.58631134033203, "global_step": 349254, "epoch": 2886} {"train_loss": -44.07979202270508, "global_step": 349255, "epoch": 2886} {"train_loss": -44.0626335144043, "global_step": 349256, "epoch": 2886} {"train_loss": -44.014835357666016, "global_step": 349257, "epoch": 2886} {"train_loss": -43.29924392700195, "global_step": 349258, "epoch": 2886} {"train_loss": -43.52964401245117, "global_step": 349259, "epoch": 2886} {"train_loss": -43.6047477722168, "global_step": 349260, "epoch": 2886} {"train_loss": -43.3307991027832, "global_step": 349261, "epoch": 2886} {"train_loss": -43.5914421081543, "global_step": 349262, "epoch": 2886} {"train_loss": -44.46570587158203, "global_step": 349263, "epoch": 2886} {"train_loss": -43.79085159301758, "global_step": 349264, "epoch": 2886} {"train_loss": -43.648006439208984, "global_step": 349265, "epoch": 2886} {"train_loss": -43.896461486816406, "global_step": 349266, "epoch": 2886} {"train_loss": -44.5858039855957, "global_step": 349267, "epoch": 2886} {"train_loss": -44.19894027709961, "global_step": 349268, "epoch": 2886} {"train_loss": -42.867652893066406, "global_step": 349269, "epoch": 2886} {"train_loss": -43.193599700927734, "global_step": 349270, "epoch": 2886} {"train_loss": -42.71430587768555, "global_step": 349271, "epoch": 2886} {"train_loss": -41.82395553588867, "global_step": 349272, "epoch": 2886} {"train_loss": -43.815155029296875, "global_step": 349273, "epoch": 2886} {"train_loss": -43.33333969116211, "global_step": 349274, "epoch": 2886} {"train_loss": -40.92692184448242, "global_step": 349275, "epoch": 2886} {"train_loss": -42.0208740234375, "global_step": 349276, "epoch": 2886} {"train_loss": -43.228336334228516, "global_step": 349277, "epoch": 2886} {"train_loss": -43.558387756347656, "global_step": 349278, "epoch": 2886} {"train_loss": -42.994712829589844, "global_step": 349279, "epoch": 2886} {"train_loss": -43.610107421875, "global_step": 349280, "epoch": 2886} {"train_loss": -42.5002326965332, "global_step": 349281, "epoch": 2886} {"train_loss": -42.216712951660156, "global_step": 349282, "epoch": 2886} {"train_loss": -42.536441802978516, "global_step": 349283, "epoch": 2886} {"train_loss": -43.584991455078125, "global_step": 349284, "epoch": 2886} {"train_loss": -42.54396438598633, "global_step": 349285, "epoch": 2886} {"train_loss": -41.50272750854492, "global_step": 349286, "epoch": 2886} {"train_loss": -42.772064208984375, "global_step": 349287, "epoch": 2886} {"train_loss": -43.785884857177734, "global_step": 349288, "epoch": 2886} {"train_loss": -42.10370635986328, "global_step": 349289, "epoch": 2886} {"train_loss": -42.55927658081055, "global_step": 349290, "epoch": 2886} {"train_loss": -41.04488754272461, "global_step": 349291, "epoch": 2886} {"train_loss": -42.05040740966797, "global_step": 349292, "epoch": 2886} {"train_loss": -42.95212936401367, "global_step": 349293, "epoch": 2886} {"train_loss": -42.59174728393555, "global_step": 349294, "epoch": 2886} {"train_loss": -41.61149978637695, "global_step": 349295, "epoch": 2886} {"train_loss": -41.389705657958984, "global_step": 349296, "epoch": 2886} {"train_loss": -42.779754638671875, "global_step": 349297, "epoch": 2886} {"train_loss": -41.80091857910156, "global_step": 349298, "epoch": 2886} {"train_loss": -42.871376037597656, "global_step": 349299, "epoch": 2886} {"train_loss": -42.25554275512695, "global_step": 349300, "epoch": 2886} {"train_loss": -41.09177780151367, "global_step": 349301, "epoch": 2886} {"train_loss": -40.78532028198242, "global_step": 349302, "epoch": 2886} {"train_loss": -43.31211471557617, "global_step": 349303, "epoch": 2886} {"train_loss": -41.45368194580078, "global_step": 349304, "epoch": 2886} {"train_loss": -41.82109451293945, "global_step": 349305, "epoch": 2886} {"train_loss": -43.438106536865234, "global_step": 349306, "epoch": 2886} {"train_loss": -40.742713928222656, "global_step": 349307, "epoch": 2886} {"train_loss": -41.42749786376953, "global_step": 349308, "epoch": 2886} {"train_loss": -43.15784454345703, "global_step": 349309, "epoch": 2886} {"train_loss": -40.89687728881836, "global_step": 349310, "epoch": 2886} {"train_loss": -43.00007247924805, "global_step": 349311, "epoch": 2886} {"train_loss": -43.16461944580078, "global_step": 349312, "epoch": 2886} {"train_loss": -39.823951721191406, "global_step": 349313, "epoch": 2886} {"train_loss": -43.38079071044922, "global_step": 349314, "epoch": 2886} {"train_loss": -42.45515060424805, "global_step": 349315, "epoch": 2886} {"train_loss": -43.11054229736328, "global_step": 349316, "epoch": 2886} {"train_loss": -43.40339660644531, "global_step": 349317, "epoch": 2886} {"train_loss": -42.98952102661133, "global_step": 349318, "epoch": 2886} {"train_loss": -43.08821487426758, "global_step": 349319, "epoch": 2886} {"train_loss": -43.35127639770508, "global_step": 349320, "epoch": 2886} {"train_loss": -43.40391159057617, "global_step": 349321, "epoch": 2886} {"train_loss": -42.6743278503418, "global_step": 349322, "epoch": 2886} {"train_loss": -42.517486572265625, "global_step": 349323, "epoch": 2886} {"train_loss": -42.48210525512695, "global_step": 349324, "epoch": 2886} {"train_loss": -40.57275390625, "global_step": 349325, "epoch": 2886} {"train_loss": -43.14182483263252, "global_step": 349326, "epoch": 2886, "val_loss": 2744360.75} {"train_loss": -41.814781188964844, "global_step": 349327, "epoch": 2887} {"train_loss": -41.98397445678711, "global_step": 349328, "epoch": 2887} {"train_loss": -36.23980712890625, "global_step": 349329, "epoch": 2887} {"train_loss": -42.334957122802734, "global_step": 349330, "epoch": 2887} {"train_loss": -37.4969596862793, "global_step": 349331, "epoch": 2887} {"train_loss": -43.339473724365234, "global_step": 349332, "epoch": 2887} {"train_loss": -41.755184173583984, "global_step": 349333, "epoch": 2887} {"train_loss": -40.987953186035156, "global_step": 349334, "epoch": 2887} {"train_loss": -43.615753173828125, "global_step": 349335, "epoch": 2887} {"train_loss": -42.08464050292969, "global_step": 349336, "epoch": 2887} {"train_loss": -41.316829681396484, "global_step": 349337, "epoch": 2887} {"train_loss": -42.250850677490234, "global_step": 349338, "epoch": 2887} {"train_loss": -40.1285514831543, "global_step": 349339, "epoch": 2887} {"train_loss": -42.17794418334961, "global_step": 349340, "epoch": 2887} {"train_loss": -40.567081451416016, "global_step": 349341, "epoch": 2887} {"train_loss": -39.23654556274414, "global_step": 349342, "epoch": 2887} {"train_loss": -40.65765380859375, "global_step": 349343, "epoch": 2887} {"train_loss": -41.01778793334961, "global_step": 349344, "epoch": 2887} {"train_loss": -39.6030387878418, "global_step": 349345, "epoch": 2887} {"train_loss": -38.57232666015625, "global_step": 349346, "epoch": 2887} {"train_loss": -39.16682052612305, "global_step": 349347, "epoch": 2887} {"train_loss": -41.74850082397461, "global_step": 349348, "epoch": 2887} {"train_loss": -39.8018913269043, "global_step": 349349, "epoch": 2887} {"train_loss": -38.66847229003906, "global_step": 349350, "epoch": 2887} {"train_loss": -41.52743148803711, "global_step": 349351, "epoch": 2887} {"train_loss": -42.078582763671875, "global_step": 349352, "epoch": 2887} {"train_loss": -41.55788803100586, "global_step": 349353, "epoch": 2887} {"train_loss": -41.61466598510742, "global_step": 349354, "epoch": 2887} {"train_loss": -42.25218200683594, "global_step": 349355, "epoch": 2887} {"train_loss": -39.808441162109375, "global_step": 349356, "epoch": 2887} {"train_loss": -42.176509857177734, "global_step": 349357, "epoch": 2887} {"train_loss": -40.35712432861328, "global_step": 349358, "epoch": 2887} {"train_loss": -41.91559982299805, "global_step": 349359, "epoch": 2887} {"train_loss": -41.143089294433594, "global_step": 349360, "epoch": 2887} {"train_loss": -42.08323287963867, "global_step": 349361, "epoch": 2887} {"train_loss": -41.45261001586914, "global_step": 349362, "epoch": 2887} {"train_loss": -42.644893646240234, "global_step": 349363, "epoch": 2887} {"train_loss": -41.42373275756836, "global_step": 349364, "epoch": 2887} {"train_loss": -39.06195068359375, "global_step": 349365, "epoch": 2887} {"train_loss": -41.31663131713867, "global_step": 349366, "epoch": 2887} {"train_loss": -40.78155517578125, "global_step": 349367, "epoch": 2887} {"train_loss": -41.5484619140625, "global_step": 349368, "epoch": 2887} {"train_loss": -41.08637619018555, "global_step": 349369, "epoch": 2887} {"train_loss": -40.00912094116211, "global_step": 349370, "epoch": 2887} {"train_loss": -42.1724739074707, "global_step": 349371, "epoch": 2887} {"train_loss": -39.56952667236328, "global_step": 349372, "epoch": 2887} {"train_loss": -41.13517761230469, "global_step": 349373, "epoch": 2887} {"train_loss": -39.27386474609375, "global_step": 349374, "epoch": 2887} {"train_loss": -39.48772048950195, "global_step": 349375, "epoch": 2887} {"train_loss": -41.45749282836914, "global_step": 349376, "epoch": 2887} {"train_loss": -39.377235412597656, "global_step": 349377, "epoch": 2887} {"train_loss": -40.98225784301758, "global_step": 349378, "epoch": 2887} {"train_loss": -39.63159942626953, "global_step": 349379, "epoch": 2887} {"train_loss": -40.95956039428711, "global_step": 349380, "epoch": 2887} {"train_loss": -39.82808303833008, "global_step": 349381, "epoch": 2887} {"train_loss": -40.832435607910156, "global_step": 349382, "epoch": 2887} {"train_loss": -40.67237091064453, "global_step": 349383, "epoch": 2887} {"train_loss": -39.68495559692383, "global_step": 349384, "epoch": 2887} {"train_loss": -41.332035064697266, "global_step": 349385, "epoch": 2887} {"train_loss": -41.58488082885742, "global_step": 349386, "epoch": 2887} {"train_loss": -40.426246643066406, "global_step": 349387, "epoch": 2887} {"train_loss": -41.10422897338867, "global_step": 349388, "epoch": 2887} {"train_loss": -38.75185775756836, "global_step": 349389, "epoch": 2887} {"train_loss": -42.20579147338867, "global_step": 349390, "epoch": 2887} {"train_loss": -40.32197570800781, "global_step": 349391, "epoch": 2887} {"train_loss": -40.95417785644531, "global_step": 349392, "epoch": 2887} {"train_loss": -40.59406280517578, "global_step": 349393, "epoch": 2887} {"train_loss": -41.15314865112305, "global_step": 349394, "epoch": 2887} {"train_loss": -42.34223556518555, "global_step": 349395, "epoch": 2887} {"train_loss": -40.7280158996582, "global_step": 349396, "epoch": 2887} {"train_loss": -41.8963623046875, "global_step": 349397, "epoch": 2887} {"train_loss": -37.95309829711914, "global_step": 349398, "epoch": 2887} {"train_loss": -40.43690872192383, "global_step": 349399, "epoch": 2887} {"train_loss": -41.6067008972168, "global_step": 349400, "epoch": 2887} {"train_loss": -36.70102310180664, "global_step": 349401, "epoch": 2887} {"train_loss": -40.18503952026367, "global_step": 349402, "epoch": 2887} {"train_loss": -40.46769332885742, "global_step": 349403, "epoch": 2887} {"train_loss": -41.53532028198242, "global_step": 349404, "epoch": 2887} {"train_loss": -41.57642364501953, "global_step": 349405, "epoch": 2887} {"train_loss": -39.10102462768555, "global_step": 349406, "epoch": 2887} {"train_loss": -41.173824310302734, "global_step": 349407, "epoch": 2887} {"train_loss": -41.38209915161133, "global_step": 349408, "epoch": 2887} {"train_loss": -40.89264678955078, "global_step": 349409, "epoch": 2887} {"train_loss": -38.31877899169922, "global_step": 349410, "epoch": 2887} {"train_loss": -40.8257942199707, "global_step": 349411, "epoch": 2887} {"train_loss": -40.46674728393555, "global_step": 349412, "epoch": 2887} {"train_loss": -39.48154830932617, "global_step": 349413, "epoch": 2887} {"train_loss": -39.6258430480957, "global_step": 349414, "epoch": 2887} {"train_loss": -28.297468185424805, "global_step": 349415, "epoch": 2887} {"train_loss": -38.0822639465332, "global_step": 349416, "epoch": 2887} {"train_loss": -39.37554168701172, "global_step": 349417, "epoch": 2887} {"train_loss": -41.95564651489258, "global_step": 349418, "epoch": 2887} {"train_loss": -36.01659393310547, "global_step": 349419, "epoch": 2887} {"train_loss": -36.010719299316406, "global_step": 349420, "epoch": 2887} {"train_loss": -39.232418060302734, "global_step": 349421, "epoch": 2887} {"train_loss": -38.68903350830078, "global_step": 349422, "epoch": 2887} {"train_loss": -39.60218048095703, "global_step": 349423, "epoch": 2887} {"train_loss": -39.4871711730957, "global_step": 349424, "epoch": 2887} {"train_loss": -33.9986572265625, "global_step": 349425, "epoch": 2887} {"train_loss": -39.461578369140625, "global_step": 349426, "epoch": 2887} {"train_loss": -41.17572021484375, "global_step": 349427, "epoch": 2887} {"train_loss": -38.964447021484375, "global_step": 349428, "epoch": 2887} {"train_loss": -36.49114227294922, "global_step": 349429, "epoch": 2887} {"train_loss": -25.6031436920166, "global_step": 349430, "epoch": 2887} {"train_loss": -38.61199951171875, "global_step": 349431, "epoch": 2887} {"train_loss": -32.04390335083008, "global_step": 349432, "epoch": 2887} {"train_loss": -36.55497360229492, "global_step": 349433, "epoch": 2887} {"train_loss": -33.4696159362793, "global_step": 349434, "epoch": 2887} {"train_loss": -35.015380859375, "global_step": 349435, "epoch": 2887} {"train_loss": -31.87771987915039, "global_step": 349436, "epoch": 2887} {"train_loss": -37.01290512084961, "global_step": 349437, "epoch": 2887} {"train_loss": -30.978132247924805, "global_step": 349438, "epoch": 2887} {"train_loss": -39.135501861572266, "global_step": 349439, "epoch": 2887} {"train_loss": -39.61170196533203, "global_step": 349440, "epoch": 2887} {"train_loss": -37.251155853271484, "global_step": 349441, "epoch": 2887} {"train_loss": -34.851806640625, "global_step": 349442, "epoch": 2887} {"train_loss": -37.824153900146484, "global_step": 349443, "epoch": 2887} {"train_loss": -38.573974609375, "global_step": 349444, "epoch": 2887} {"train_loss": -35.41936111450195, "global_step": 349445, "epoch": 2887} {"train_loss": -39.47140121459961, "global_step": 349446, "epoch": 2887} {"train_loss": -39.592604818422934, "global_step": 349447, "epoch": 2887, "val_loss": 2626542.0} {"train_loss": -39.975765228271484, "global_step": 349448, "epoch": 2888} {"train_loss": -39.284584045410156, "global_step": 349449, "epoch": 2888} {"train_loss": -37.89310836791992, "global_step": 349450, "epoch": 2888} {"train_loss": -39.62501907348633, "global_step": 349451, "epoch": 2888} {"train_loss": -39.17852783203125, "global_step": 349452, "epoch": 2888} {"train_loss": -39.76667022705078, "global_step": 349453, "epoch": 2888} {"train_loss": -39.74106979370117, "global_step": 349454, "epoch": 2888} {"train_loss": -40.030311584472656, "global_step": 349455, "epoch": 2888} {"train_loss": -39.346614837646484, "global_step": 349456, "epoch": 2888} {"train_loss": -40.142024993896484, "global_step": 349457, "epoch": 2888} {"train_loss": -39.43186569213867, "global_step": 349458, "epoch": 2888} {"train_loss": -39.329402923583984, "global_step": 349459, "epoch": 2888} {"train_loss": -39.96467208862305, "global_step": 349460, "epoch": 2888} {"train_loss": -40.33952713012695, "global_step": 349461, "epoch": 2888} {"train_loss": -39.82557678222656, "global_step": 349462, "epoch": 2888} {"train_loss": -39.76042175292969, "global_step": 349463, "epoch": 2888} {"train_loss": -39.95047378540039, "global_step": 349464, "epoch": 2888} {"train_loss": -41.09228515625, "global_step": 349465, "epoch": 2888} {"train_loss": -40.908199310302734, "global_step": 349466, "epoch": 2888} {"train_loss": -40.69962692260742, "global_step": 349467, "epoch": 2888} {"train_loss": -39.9209098815918, "global_step": 349468, "epoch": 2888} {"train_loss": -40.69541931152344, "global_step": 349469, "epoch": 2888} {"train_loss": -40.538387298583984, "global_step": 349470, "epoch": 2888} {"train_loss": -40.896549224853516, "global_step": 349471, "epoch": 2888} {"train_loss": -40.52533721923828, "global_step": 349472, "epoch": 2888} {"train_loss": -41.237037658691406, "global_step": 349473, "epoch": 2888} {"train_loss": -40.672569274902344, "global_step": 349474, "epoch": 2888} {"train_loss": -40.93478012084961, "global_step": 349475, "epoch": 2888} {"train_loss": -39.843807220458984, "global_step": 349476, "epoch": 2888} {"train_loss": -40.985347747802734, "global_step": 349477, "epoch": 2888} {"train_loss": -40.483070373535156, "global_step": 349478, "epoch": 2888} {"train_loss": -40.74531173706055, "global_step": 349479, "epoch": 2888} {"train_loss": -41.10892868041992, "global_step": 349480, "epoch": 2888} {"train_loss": -41.288333892822266, "global_step": 349481, "epoch": 2888} {"train_loss": -41.242916107177734, "global_step": 349482, "epoch": 2888} {"train_loss": -41.809051513671875, "global_step": 349483, "epoch": 2888} {"train_loss": -41.269874572753906, "global_step": 349484, "epoch": 2888} {"train_loss": -40.98786544799805, "global_step": 349485, "epoch": 2888} {"train_loss": -41.812896728515625, "global_step": 349486, "epoch": 2888} {"train_loss": -41.70392990112305, "global_step": 349487, "epoch": 2888} {"train_loss": -41.7540168762207, "global_step": 349488, "epoch": 2888} {"train_loss": -42.09165954589844, "global_step": 349489, "epoch": 2888} {"train_loss": -41.654640197753906, "global_step": 349490, "epoch": 2888} {"train_loss": -41.70278549194336, "global_step": 349491, "epoch": 2888} {"train_loss": -42.196346282958984, "global_step": 349492, "epoch": 2888} {"train_loss": -41.9427604675293, "global_step": 349493, "epoch": 2888} {"train_loss": -41.74162292480469, "global_step": 349494, "epoch": 2888} {"train_loss": -41.23727035522461, "global_step": 349495, "epoch": 2888} {"train_loss": -42.28695297241211, "global_step": 349496, "epoch": 2888} {"train_loss": -41.30585861206055, "global_step": 349497, "epoch": 2888} {"train_loss": -41.17377853393555, "global_step": 349498, "epoch": 2888} {"train_loss": -42.53682327270508, "global_step": 349499, "epoch": 2888} {"train_loss": -41.8541259765625, "global_step": 349500, "epoch": 2888} {"train_loss": -41.92369079589844, "global_step": 349501, "epoch": 2888} {"train_loss": -42.256649017333984, "global_step": 349502, "epoch": 2888} {"train_loss": -42.02762985229492, "global_step": 349503, "epoch": 2888} {"train_loss": -42.32571792602539, "global_step": 349504, "epoch": 2888} {"train_loss": -42.265777587890625, "global_step": 349505, "epoch": 2888} {"train_loss": -42.0513801574707, "global_step": 349506, "epoch": 2888} {"train_loss": -42.3399772644043, "global_step": 349507, "epoch": 2888} {"train_loss": -41.822959899902344, "global_step": 349508, "epoch": 2888} {"train_loss": -41.72178649902344, "global_step": 349509, "epoch": 2888} {"train_loss": -42.03157424926758, "global_step": 349510, "epoch": 2888} {"train_loss": -42.364620208740234, "global_step": 349511, "epoch": 2888} {"train_loss": -42.20927047729492, "global_step": 349512, "epoch": 2888} {"train_loss": -41.266815185546875, "global_step": 349513, "epoch": 2888} {"train_loss": -42.59457015991211, "global_step": 349514, "epoch": 2888} {"train_loss": -42.02999496459961, "global_step": 349515, "epoch": 2888} {"train_loss": -42.63063430786133, "global_step": 349516, "epoch": 2888} {"train_loss": -42.571388244628906, "global_step": 349517, "epoch": 2888} {"train_loss": -42.58597183227539, "global_step": 349518, "epoch": 2888} {"train_loss": -42.34214782714844, "global_step": 349519, "epoch": 2888} {"train_loss": -42.712860107421875, "global_step": 349520, "epoch": 2888} {"train_loss": -43.091392517089844, "global_step": 349521, "epoch": 2888} {"train_loss": -42.89049530029297, "global_step": 349522, "epoch": 2888} {"train_loss": -42.750404357910156, "global_step": 349523, "epoch": 2888} {"train_loss": -43.190853118896484, "global_step": 349524, "epoch": 2888} {"train_loss": -42.5706672668457, "global_step": 349525, "epoch": 2888} {"train_loss": -42.92097091674805, "global_step": 349526, "epoch": 2888} {"train_loss": -43.09657669067383, "global_step": 349527, "epoch": 2888} {"train_loss": -42.513336181640625, "global_step": 349528, "epoch": 2888} {"train_loss": -43.2015495300293, "global_step": 349529, "epoch": 2888} {"train_loss": -42.70963668823242, "global_step": 349530, "epoch": 2888} {"train_loss": -42.58472442626953, "global_step": 349531, "epoch": 2888} {"train_loss": -42.926788330078125, "global_step": 349532, "epoch": 2888} {"train_loss": -43.40230941772461, "global_step": 349533, "epoch": 2888} {"train_loss": -43.347774505615234, "global_step": 349534, "epoch": 2888} {"train_loss": -42.20701217651367, "global_step": 349535, "epoch": 2888} {"train_loss": -42.88916778564453, "global_step": 349536, "epoch": 2888} {"train_loss": -42.601905822753906, "global_step": 349537, "epoch": 2888} {"train_loss": -43.474159240722656, "global_step": 349538, "epoch": 2888} {"train_loss": -43.41543197631836, "global_step": 349539, "epoch": 2888} {"train_loss": -42.91135025024414, "global_step": 349540, "epoch": 2888} {"train_loss": -43.40682601928711, "global_step": 349541, "epoch": 2888} {"train_loss": -42.87068176269531, "global_step": 349542, "epoch": 2888} {"train_loss": -42.53335952758789, "global_step": 349543, "epoch": 2888} {"train_loss": -42.941349029541016, "global_step": 349544, "epoch": 2888} {"train_loss": -43.47161865234375, "global_step": 349545, "epoch": 2888} {"train_loss": -43.59449768066406, "global_step": 349546, "epoch": 2888} {"train_loss": -43.402618408203125, "global_step": 349547, "epoch": 2888} {"train_loss": -42.62723922729492, "global_step": 349548, "epoch": 2888} {"train_loss": -43.81471633911133, "global_step": 349549, "epoch": 2888} {"train_loss": -43.1736946105957, "global_step": 349550, "epoch": 2888} {"train_loss": -43.468841552734375, "global_step": 349551, "epoch": 2888} {"train_loss": -43.09981918334961, "global_step": 349552, "epoch": 2888} {"train_loss": -43.33885192871094, "global_step": 349553, "epoch": 2888} {"train_loss": -42.847225189208984, "global_step": 349554, "epoch": 2888} {"train_loss": -43.60787582397461, "global_step": 349555, "epoch": 2888} {"train_loss": -43.17135238647461, "global_step": 349556, "epoch": 2888} {"train_loss": -43.472957611083984, "global_step": 349557, "epoch": 2888} {"train_loss": -43.51272201538086, "global_step": 349558, "epoch": 2888} {"train_loss": -43.34450912475586, "global_step": 349559, "epoch": 2888} {"train_loss": -43.5421142578125, "global_step": 349560, "epoch": 2888} {"train_loss": -43.482460021972656, "global_step": 349561, "epoch": 2888} {"train_loss": -43.63346481323242, "global_step": 349562, "epoch": 2888} {"train_loss": -43.19891357421875, "global_step": 349563, "epoch": 2888} {"train_loss": -42.41984176635742, "global_step": 349564, "epoch": 2888} {"train_loss": -43.53664016723633, "global_step": 349565, "epoch": 2888} {"train_loss": -43.78477096557617, "global_step": 349566, "epoch": 2888} {"train_loss": -42.822731018066406, "global_step": 349567, "epoch": 2888} {"train_loss": -41.91296415092531, "global_step": 349568, "epoch": 2888, "val_loss": 2600913.75} {"train_loss": -42.788875579833984, "global_step": 349569, "epoch": 2889} {"train_loss": -43.21685791015625, "global_step": 349570, "epoch": 2889} {"train_loss": -41.95724105834961, "global_step": 349571, "epoch": 2889} {"train_loss": -40.286678314208984, "global_step": 349572, "epoch": 2889} {"train_loss": -39.822322845458984, "global_step": 349573, "epoch": 2889} {"train_loss": -43.176795959472656, "global_step": 349574, "epoch": 2889} {"train_loss": -41.858829498291016, "global_step": 349575, "epoch": 2889} {"train_loss": -41.64944076538086, "global_step": 349576, "epoch": 2889} {"train_loss": -42.725067138671875, "global_step": 349577, "epoch": 2889} {"train_loss": -41.602317810058594, "global_step": 349578, "epoch": 2889} {"train_loss": -42.491695404052734, "global_step": 349579, "epoch": 2889} {"train_loss": -42.9517822265625, "global_step": 349580, "epoch": 2889} {"train_loss": -41.65614700317383, "global_step": 349581, "epoch": 2889} {"train_loss": -40.45103073120117, "global_step": 349582, "epoch": 2889} {"train_loss": -42.685951232910156, "global_step": 349583, "epoch": 2889} {"train_loss": -42.985347747802734, "global_step": 349584, "epoch": 2889} {"train_loss": -42.34954833984375, "global_step": 349585, "epoch": 2889} {"train_loss": -43.77971649169922, "global_step": 349586, "epoch": 2889} {"train_loss": -43.045833587646484, "global_step": 349587, "epoch": 2889} {"train_loss": -43.56427001953125, "global_step": 349588, "epoch": 2889} {"train_loss": -42.704071044921875, "global_step": 349589, "epoch": 2889} {"train_loss": -42.47608947753906, "global_step": 349590, "epoch": 2889} {"train_loss": -43.03360366821289, "global_step": 349591, "epoch": 2889} {"train_loss": -42.754451751708984, "global_step": 349592, "epoch": 2889} {"train_loss": -42.50584030151367, "global_step": 349593, "epoch": 2889} {"train_loss": -43.26630783081055, "global_step": 349594, "epoch": 2889} {"train_loss": -43.26093673706055, "global_step": 349595, "epoch": 2889} {"train_loss": -43.25141525268555, "global_step": 349596, "epoch": 2889} {"train_loss": -42.35852813720703, "global_step": 349597, "epoch": 2889} {"train_loss": -43.84612274169922, "global_step": 349598, "epoch": 2889} {"train_loss": -43.22688293457031, "global_step": 349599, "epoch": 2889} {"train_loss": -42.9251708984375, "global_step": 349600, "epoch": 2889} {"train_loss": -42.3448371887207, "global_step": 349601, "epoch": 2889} {"train_loss": -43.69292068481445, "global_step": 349602, "epoch": 2889} {"train_loss": -42.18941879272461, "global_step": 349603, "epoch": 2889} {"train_loss": -43.009437561035156, "global_step": 349604, "epoch": 2889} {"train_loss": -41.98591232299805, "global_step": 349605, "epoch": 2889} {"train_loss": -42.3122673034668, "global_step": 349606, "epoch": 2889} {"train_loss": -43.47951889038086, "global_step": 349607, "epoch": 2889} {"train_loss": -43.280731201171875, "global_step": 349608, "epoch": 2889} {"train_loss": -43.263309478759766, "global_step": 349609, "epoch": 2889} {"train_loss": -43.389278411865234, "global_step": 349610, "epoch": 2889} {"train_loss": -42.26197052001953, "global_step": 349611, "epoch": 2889} {"train_loss": -43.49581527709961, "global_step": 349612, "epoch": 2889} {"train_loss": -43.134559631347656, "global_step": 349613, "epoch": 2889} {"train_loss": -42.109928131103516, "global_step": 349614, "epoch": 2889} {"train_loss": -43.424339294433594, "global_step": 349615, "epoch": 2889} {"train_loss": -42.97660827636719, "global_step": 349616, "epoch": 2889} {"train_loss": -42.47301483154297, "global_step": 349617, "epoch": 2889} {"train_loss": -42.273990631103516, "global_step": 349618, "epoch": 2889} {"train_loss": -43.22817611694336, "global_step": 349619, "epoch": 2889} {"train_loss": -42.315399169921875, "global_step": 349620, "epoch": 2889} {"train_loss": -42.29657745361328, "global_step": 349621, "epoch": 2889} {"train_loss": -41.191566467285156, "global_step": 349622, "epoch": 2889} {"train_loss": -42.821346282958984, "global_step": 349623, "epoch": 2889} {"train_loss": -42.2783317565918, "global_step": 349624, "epoch": 2889} {"train_loss": -40.971534729003906, "global_step": 349625, "epoch": 2889} {"train_loss": -43.341217041015625, "global_step": 349626, "epoch": 2889} {"train_loss": -42.19791793823242, "global_step": 349627, "epoch": 2889} {"train_loss": -41.432254791259766, "global_step": 349628, "epoch": 2889} {"train_loss": -41.600746154785156, "global_step": 349629, "epoch": 2889} {"train_loss": -40.609310150146484, "global_step": 349630, "epoch": 2889} {"train_loss": -42.60372543334961, "global_step": 349631, "epoch": 2889} {"train_loss": -41.856788635253906, "global_step": 349632, "epoch": 2889} {"train_loss": -42.540496826171875, "global_step": 349633, "epoch": 2889} {"train_loss": -42.538570404052734, "global_step": 349634, "epoch": 2889} {"train_loss": -41.5428466796875, "global_step": 349635, "epoch": 2889} {"train_loss": -43.12851333618164, "global_step": 349636, "epoch": 2889} {"train_loss": -43.21990966796875, "global_step": 349637, "epoch": 2889} {"train_loss": -43.3474006652832, "global_step": 349638, "epoch": 2889} {"train_loss": -43.15298843383789, "global_step": 349639, "epoch": 2889} {"train_loss": -43.0794563293457, "global_step": 349640, "epoch": 2889} {"train_loss": -43.28255844116211, "global_step": 349641, "epoch": 2889} {"train_loss": -42.46992874145508, "global_step": 349642, "epoch": 2889} {"train_loss": -43.64817428588867, "global_step": 349643, "epoch": 2889} {"train_loss": -43.45314025878906, "global_step": 349644, "epoch": 2889} {"train_loss": -43.61025619506836, "global_step": 349645, "epoch": 2889} {"train_loss": -43.78350067138672, "global_step": 349646, "epoch": 2889} {"train_loss": -42.15205001831055, "global_step": 349647, "epoch": 2889} {"train_loss": -43.23539352416992, "global_step": 349648, "epoch": 2889} {"train_loss": -43.33673858642578, "global_step": 349649, "epoch": 2889} {"train_loss": -43.14126205444336, "global_step": 349650, "epoch": 2889} {"train_loss": -43.22675704956055, "global_step": 349651, "epoch": 2889} {"train_loss": -43.78935623168945, "global_step": 349652, "epoch": 2889} {"train_loss": -42.89133071899414, "global_step": 349653, "epoch": 2889} {"train_loss": -43.5102653503418, "global_step": 349654, "epoch": 2889} {"train_loss": -41.25230026245117, "global_step": 349655, "epoch": 2889} {"train_loss": -43.01314926147461, "global_step": 349656, "epoch": 2889} {"train_loss": -41.61131286621094, "global_step": 349657, "epoch": 2889} {"train_loss": -43.74724197387695, "global_step": 349658, "epoch": 2889} {"train_loss": -43.004432678222656, "global_step": 349659, "epoch": 2889} {"train_loss": -42.157039642333984, "global_step": 349660, "epoch": 2889} {"train_loss": -42.3099250793457, "global_step": 349661, "epoch": 2889} {"train_loss": -43.67934799194336, "global_step": 349662, "epoch": 2889} {"train_loss": -42.57847213745117, "global_step": 349663, "epoch": 2889} {"train_loss": -42.960567474365234, "global_step": 349664, "epoch": 2889} {"train_loss": -43.23844528198242, "global_step": 349665, "epoch": 2889} {"train_loss": -43.31415939331055, "global_step": 349666, "epoch": 2889} {"train_loss": -42.48140335083008, "global_step": 349667, "epoch": 2889} {"train_loss": -42.77670669555664, "global_step": 349668, "epoch": 2889} {"train_loss": -42.58110427856445, "global_step": 349669, "epoch": 2889} {"train_loss": -41.43798828125, "global_step": 349670, "epoch": 2889} {"train_loss": -42.06330871582031, "global_step": 349671, "epoch": 2889} {"train_loss": -43.43381881713867, "global_step": 349672, "epoch": 2889} {"train_loss": -42.92193603515625, "global_step": 349673, "epoch": 2889} {"train_loss": -42.391536712646484, "global_step": 349674, "epoch": 2889} {"train_loss": -42.4746208190918, "global_step": 349675, "epoch": 2889} {"train_loss": -44.01397705078125, "global_step": 349676, "epoch": 2889} {"train_loss": -43.905738830566406, "global_step": 349677, "epoch": 2889} {"train_loss": -42.663143157958984, "global_step": 349678, "epoch": 2889} {"train_loss": -43.170692443847656, "global_step": 349679, "epoch": 2889} {"train_loss": -43.7185173034668, "global_step": 349680, "epoch": 2889} {"train_loss": -43.34971237182617, "global_step": 349681, "epoch": 2889} {"train_loss": -42.780513763427734, "global_step": 349682, "epoch": 2889} {"train_loss": -43.63508224487305, "global_step": 349683, "epoch": 2889} {"train_loss": -42.7425537109375, "global_step": 349684, "epoch": 2889} {"train_loss": -43.883480072021484, "global_step": 349685, "epoch": 2889} {"train_loss": -43.069091796875, "global_step": 349686, "epoch": 2889} {"train_loss": -43.15814208984375, "global_step": 349687, "epoch": 2889} {"train_loss": -43.203983306884766, "global_step": 349688, "epoch": 2889} {"train_loss": -42.73228438826632, "global_step": 349689, "epoch": 2889, "val_loss": 2642055.25} {"train_loss": -44.09944534301758, "global_step": 349690, "epoch": 2890} {"train_loss": -42.51331329345703, "global_step": 349691, "epoch": 2890} {"train_loss": -42.39101028442383, "global_step": 349692, "epoch": 2890} {"train_loss": -43.51518630981445, "global_step": 349693, "epoch": 2890} {"train_loss": -44.09144973754883, "global_step": 349694, "epoch": 2890} {"train_loss": -41.94876480102539, "global_step": 349695, "epoch": 2890} {"train_loss": -43.57427978515625, "global_step": 349696, "epoch": 2890} {"train_loss": -44.097877502441406, "global_step": 349697, "epoch": 2890} {"train_loss": -42.19103240966797, "global_step": 349698, "epoch": 2890} {"train_loss": -42.78264617919922, "global_step": 349699, "epoch": 2890} {"train_loss": -42.84890365600586, "global_step": 349700, "epoch": 2890} {"train_loss": -42.56742477416992, "global_step": 349701, "epoch": 2890} {"train_loss": -42.552520751953125, "global_step": 349702, "epoch": 2890} {"train_loss": -43.6754150390625, "global_step": 349703, "epoch": 2890} {"train_loss": -43.31866455078125, "global_step": 349704, "epoch": 2890} {"train_loss": -43.271514892578125, "global_step": 349705, "epoch": 2890} {"train_loss": -42.83180618286133, "global_step": 349706, "epoch": 2890} {"train_loss": -42.16794967651367, "global_step": 349707, "epoch": 2890} {"train_loss": -43.1644287109375, "global_step": 349708, "epoch": 2890} {"train_loss": -43.18861770629883, "global_step": 349709, "epoch": 2890} {"train_loss": -41.51677322387695, "global_step": 349710, "epoch": 2890} {"train_loss": -40.12074661254883, "global_step": 349711, "epoch": 2890} {"train_loss": -43.51729965209961, "global_step": 349712, "epoch": 2890} {"train_loss": -41.019935607910156, "global_step": 349713, "epoch": 2890} {"train_loss": -38.987701416015625, "global_step": 349714, "epoch": 2890} {"train_loss": -42.44416427612305, "global_step": 349715, "epoch": 2890} {"train_loss": -41.305850982666016, "global_step": 349716, "epoch": 2890} {"train_loss": -42.93141174316406, "global_step": 349717, "epoch": 2890} {"train_loss": -40.31149673461914, "global_step": 349718, "epoch": 2890} {"train_loss": -41.22463607788086, "global_step": 349719, "epoch": 2890} {"train_loss": -42.000572204589844, "global_step": 349720, "epoch": 2890} {"train_loss": -37.9090576171875, "global_step": 349721, "epoch": 2890} {"train_loss": -40.126625061035156, "global_step": 349722, "epoch": 2890} {"train_loss": -41.99587631225586, "global_step": 349723, "epoch": 2890} {"train_loss": -41.20010757446289, "global_step": 349724, "epoch": 2890} {"train_loss": -39.99208450317383, "global_step": 349725, "epoch": 2890} {"train_loss": -40.972389221191406, "global_step": 349726, "epoch": 2890} {"train_loss": -34.02870178222656, "global_step": 349727, "epoch": 2890} {"train_loss": -39.479122161865234, "global_step": 349728, "epoch": 2890} {"train_loss": -37.03744125366211, "global_step": 349729, "epoch": 2890} {"train_loss": -39.07883834838867, "global_step": 349730, "epoch": 2890} {"train_loss": -41.52376174926758, "global_step": 349731, "epoch": 2890} {"train_loss": -39.64022445678711, "global_step": 349732, "epoch": 2890} {"train_loss": -38.13607406616211, "global_step": 349733, "epoch": 2890} {"train_loss": -41.228729248046875, "global_step": 349734, "epoch": 2890} {"train_loss": -39.74220657348633, "global_step": 349735, "epoch": 2890} {"train_loss": -42.09879684448242, "global_step": 349736, "epoch": 2890} {"train_loss": -40.66877365112305, "global_step": 349737, "epoch": 2890} {"train_loss": -42.25410461425781, "global_step": 349738, "epoch": 2890} {"train_loss": -39.37443161010742, "global_step": 349739, "epoch": 2890} {"train_loss": -40.659420013427734, "global_step": 349740, "epoch": 2890} {"train_loss": -41.19179153442383, "global_step": 349741, "epoch": 2890} {"train_loss": -41.62132263183594, "global_step": 349742, "epoch": 2890} {"train_loss": -41.42051315307617, "global_step": 349743, "epoch": 2890} {"train_loss": -42.655670166015625, "global_step": 349744, "epoch": 2890} {"train_loss": -41.6489372253418, "global_step": 349745, "epoch": 2890} {"train_loss": -39.84273147583008, "global_step": 349746, "epoch": 2890} {"train_loss": -41.478389739990234, "global_step": 349747, "epoch": 2890} {"train_loss": -42.89263916015625, "global_step": 349748, "epoch": 2890} {"train_loss": -41.406856536865234, "global_step": 349749, "epoch": 2890} {"train_loss": -25.860715866088867, "global_step": 349750, "epoch": 2890} {"train_loss": -40.91183853149414, "global_step": 349751, "epoch": 2890} {"train_loss": -41.97883224487305, "global_step": 349752, "epoch": 2890} {"train_loss": -40.49114990234375, "global_step": 349753, "epoch": 2890} {"train_loss": -42.052467346191406, "global_step": 349754, "epoch": 2890} {"train_loss": -35.001285552978516, "global_step": 349755, "epoch": 2890} {"train_loss": -38.96733474731445, "global_step": 349756, "epoch": 2890} {"train_loss": 12.02708625793457, "global_step": 349757, "epoch": 2890} {"train_loss": -40.890968322753906, "global_step": 349758, "epoch": 2890} {"train_loss": -39.80426025390625, "global_step": 349759, "epoch": 2890} {"train_loss": -36.300392150878906, "global_step": 349760, "epoch": 2890} {"train_loss": -36.981746673583984, "global_step": 349761, "epoch": 2890} {"train_loss": -31.276691436767578, "global_step": 349762, "epoch": 2890} {"train_loss": -24.719146728515625, "global_step": 349763, "epoch": 2890} {"train_loss": -38.6463623046875, "global_step": 349764, "epoch": 2890} {"train_loss": -36.92829513549805, "global_step": 349765, "epoch": 2890} {"train_loss": -38.00710678100586, "global_step": 349766, "epoch": 2890} {"train_loss": -38.14742660522461, "global_step": 349767, "epoch": 2890} {"train_loss": -39.34817123413086, "global_step": 349768, "epoch": 2890} {"train_loss": -39.763702392578125, "global_step": 349769, "epoch": 2890} {"train_loss": -39.58903121948242, "global_step": 349770, "epoch": 2890} {"train_loss": -39.567596435546875, "global_step": 349771, "epoch": 2890} {"train_loss": -40.427608489990234, "global_step": 349772, "epoch": 2890} {"train_loss": -39.39107131958008, "global_step": 349773, "epoch": 2890} {"train_loss": -39.67213821411133, "global_step": 349774, "epoch": 2890} {"train_loss": -37.79297637939453, "global_step": 349775, "epoch": 2890} {"train_loss": -39.51102828979492, "global_step": 349776, "epoch": 2890} {"train_loss": -41.200599670410156, "global_step": 349777, "epoch": 2890} {"train_loss": -40.8349494934082, "global_step": 349778, "epoch": 2890} {"train_loss": -39.245845794677734, "global_step": 349779, "epoch": 2890} {"train_loss": -40.59412384033203, "global_step": 349780, "epoch": 2890} {"train_loss": -40.420433044433594, "global_step": 349781, "epoch": 2890} {"train_loss": -40.349891662597656, "global_step": 349782, "epoch": 2890} {"train_loss": -40.78877639770508, "global_step": 349783, "epoch": 2890} {"train_loss": -40.56119918823242, "global_step": 349784, "epoch": 2890} {"train_loss": -41.456172943115234, "global_step": 349785, "epoch": 2890} {"train_loss": -41.3106689453125, "global_step": 349786, "epoch": 2890} {"train_loss": -41.20412063598633, "global_step": 349787, "epoch": 2890} {"train_loss": -40.3059196472168, "global_step": 349788, "epoch": 2890} {"train_loss": -40.46773910522461, "global_step": 349789, "epoch": 2890} {"train_loss": -40.936309814453125, "global_step": 349790, "epoch": 2890} {"train_loss": -41.221412658691406, "global_step": 349791, "epoch": 2890} {"train_loss": -41.09112548828125, "global_step": 349792, "epoch": 2890} {"train_loss": -41.368438720703125, "global_step": 349793, "epoch": 2890} {"train_loss": -41.70733642578125, "global_step": 349794, "epoch": 2890} {"train_loss": -41.72761917114258, "global_step": 349795, "epoch": 2890} {"train_loss": -41.65663528442383, "global_step": 349796, "epoch": 2890} {"train_loss": -41.31243896484375, "global_step": 349797, "epoch": 2890} {"train_loss": -41.999202728271484, "global_step": 349798, "epoch": 2890} {"train_loss": -41.6887092590332, "global_step": 349799, "epoch": 2890} {"train_loss": -41.36921310424805, "global_step": 349800, "epoch": 2890} {"train_loss": -40.919837951660156, "global_step": 349801, "epoch": 2890} {"train_loss": -41.50914001464844, "global_step": 349802, "epoch": 2890} {"train_loss": -41.28975296020508, "global_step": 349803, "epoch": 2890} {"train_loss": -42.16786575317383, "global_step": 349804, "epoch": 2890} {"train_loss": -42.529998779296875, "global_step": 349805, "epoch": 2890} {"train_loss": -42.41886520385742, "global_step": 349806, "epoch": 2890} {"train_loss": -41.72395706176758, "global_step": 349807, "epoch": 2890} {"train_loss": -41.63094711303711, "global_step": 349808, "epoch": 2890} {"train_loss": -42.002315521240234, "global_step": 349809, "epoch": 2890} {"train_loss": -40.173756118648306, "global_step": 349810, "epoch": 2890, "val_loss": 2665082.0} {"train_loss": -42.37921905517578, "global_step": 349811, "epoch": 2891} {"train_loss": -42.40336990356445, "global_step": 349812, "epoch": 2891} {"train_loss": -42.111358642578125, "global_step": 349813, "epoch": 2891} {"train_loss": -42.6546745300293, "global_step": 349814, "epoch": 2891} {"train_loss": -42.11269760131836, "global_step": 349815, "epoch": 2891} {"train_loss": -42.408912658691406, "global_step": 349816, "epoch": 2891} {"train_loss": -42.748252868652344, "global_step": 349817, "epoch": 2891} {"train_loss": -42.91229248046875, "global_step": 349818, "epoch": 2891} {"train_loss": -41.93051528930664, "global_step": 349819, "epoch": 2891} {"train_loss": -42.411434173583984, "global_step": 349820, "epoch": 2891} {"train_loss": -43.03641891479492, "global_step": 349821, "epoch": 2891} {"train_loss": -42.617164611816406, "global_step": 349822, "epoch": 2891} {"train_loss": -43.472198486328125, "global_step": 349823, "epoch": 2891} {"train_loss": -42.30192947387695, "global_step": 349824, "epoch": 2891} {"train_loss": -42.580413818359375, "global_step": 349825, "epoch": 2891} {"train_loss": -42.23781204223633, "global_step": 349826, "epoch": 2891} {"train_loss": -43.456298828125, "global_step": 349827, "epoch": 2891} {"train_loss": -41.1929817199707, "global_step": 349828, "epoch": 2891} {"train_loss": -42.96259689331055, "global_step": 349829, "epoch": 2891} {"train_loss": -42.69563674926758, "global_step": 349830, "epoch": 2891} {"train_loss": -43.45463180541992, "global_step": 349831, "epoch": 2891} {"train_loss": -42.725196838378906, "global_step": 349832, "epoch": 2891} {"train_loss": -43.936256408691406, "global_step": 349833, "epoch": 2891} {"train_loss": -42.97867965698242, "global_step": 349834, "epoch": 2891} {"train_loss": -43.651222229003906, "global_step": 349835, "epoch": 2891} {"train_loss": -43.65166473388672, "global_step": 349836, "epoch": 2891} {"train_loss": -43.2745246887207, "global_step": 349837, "epoch": 2891} {"train_loss": -43.6859130859375, "global_step": 349838, "epoch": 2891} {"train_loss": -42.99335861206055, "global_step": 349839, "epoch": 2891} {"train_loss": -43.34890365600586, "global_step": 349840, "epoch": 2891} {"train_loss": -43.63570785522461, "global_step": 349841, "epoch": 2891} {"train_loss": -42.29610061645508, "global_step": 349842, "epoch": 2891} {"train_loss": -43.91842269897461, "global_step": 349843, "epoch": 2891} {"train_loss": -43.01233673095703, "global_step": 349844, "epoch": 2891} {"train_loss": -42.976802825927734, "global_step": 349845, "epoch": 2891} {"train_loss": -42.59233856201172, "global_step": 349846, "epoch": 2891} {"train_loss": -43.5162467956543, "global_step": 349847, "epoch": 2891} {"train_loss": -43.41310501098633, "global_step": 349848, "epoch": 2891} {"train_loss": -42.98219299316406, "global_step": 349849, "epoch": 2891} {"train_loss": -43.64870834350586, "global_step": 349850, "epoch": 2891} {"train_loss": -43.51923751831055, "global_step": 349851, "epoch": 2891} {"train_loss": -42.670143127441406, "global_step": 349852, "epoch": 2891} {"train_loss": -43.12107467651367, "global_step": 349853, "epoch": 2891} {"train_loss": -43.42461013793945, "global_step": 349854, "epoch": 2891} {"train_loss": -43.32300567626953, "global_step": 349855, "epoch": 2891} {"train_loss": -43.417724609375, "global_step": 349856, "epoch": 2891} {"train_loss": -43.87238693237305, "global_step": 349857, "epoch": 2891} {"train_loss": -43.4127311706543, "global_step": 349858, "epoch": 2891} {"train_loss": -43.565208435058594, "global_step": 349859, "epoch": 2891} {"train_loss": -42.34519577026367, "global_step": 349860, "epoch": 2891} {"train_loss": -42.8638916015625, "global_step": 349861, "epoch": 2891} {"train_loss": -43.07011795043945, "global_step": 349862, "epoch": 2891} {"train_loss": -42.834800720214844, "global_step": 349863, "epoch": 2891} {"train_loss": -42.86199951171875, "global_step": 349864, "epoch": 2891} {"train_loss": -42.807533264160156, "global_step": 349865, "epoch": 2891} {"train_loss": -43.655128479003906, "global_step": 349866, "epoch": 2891} {"train_loss": -43.504539489746094, "global_step": 349867, "epoch": 2891} {"train_loss": -43.766578674316406, "global_step": 349868, "epoch": 2891} {"train_loss": -42.559242248535156, "global_step": 349869, "epoch": 2891} {"train_loss": -43.14613723754883, "global_step": 349870, "epoch": 2891} {"train_loss": -43.215248107910156, "global_step": 349871, "epoch": 2891} {"train_loss": -43.25883102416992, "global_step": 349872, "epoch": 2891} {"train_loss": -43.649417877197266, "global_step": 349873, "epoch": 2891} {"train_loss": -43.279659271240234, "global_step": 349874, "epoch": 2891} {"train_loss": -42.47304916381836, "global_step": 349875, "epoch": 2891} {"train_loss": -44.456382751464844, "global_step": 349876, "epoch": 2891} {"train_loss": -43.328372955322266, "global_step": 349877, "epoch": 2891} {"train_loss": -42.82857131958008, "global_step": 349878, "epoch": 2891} {"train_loss": -43.71240997314453, "global_step": 349879, "epoch": 2891} {"train_loss": -43.24131393432617, "global_step": 349880, "epoch": 2891} {"train_loss": -42.946044921875, "global_step": 349881, "epoch": 2891} {"train_loss": -43.3936882019043, "global_step": 349882, "epoch": 2891} {"train_loss": -43.903541564941406, "global_step": 349883, "epoch": 2891} {"train_loss": -43.65419387817383, "global_step": 349884, "epoch": 2891} {"train_loss": -43.148414611816406, "global_step": 349885, "epoch": 2891} {"train_loss": -42.01774978637695, "global_step": 349886, "epoch": 2891} {"train_loss": -43.45054244995117, "global_step": 349887, "epoch": 2891} {"train_loss": -42.60721969604492, "global_step": 349888, "epoch": 2891} {"train_loss": -42.547203063964844, "global_step": 349889, "epoch": 2891} {"train_loss": -43.36886978149414, "global_step": 349890, "epoch": 2891} {"train_loss": -44.09202575683594, "global_step": 349891, "epoch": 2891} {"train_loss": -43.61348342895508, "global_step": 349892, "epoch": 2891} {"train_loss": -43.28664779663086, "global_step": 349893, "epoch": 2891} {"train_loss": -43.3798828125, "global_step": 349894, "epoch": 2891} {"train_loss": -43.22822189331055, "global_step": 349895, "epoch": 2891} {"train_loss": -43.98268508911133, "global_step": 349896, "epoch": 2891} {"train_loss": -42.38957595825195, "global_step": 349897, "epoch": 2891} {"train_loss": -42.0160026550293, "global_step": 349898, "epoch": 2891} {"train_loss": -42.490535736083984, "global_step": 349899, "epoch": 2891} {"train_loss": -42.520729064941406, "global_step": 349900, "epoch": 2891} {"train_loss": -36.823970794677734, "global_step": 349901, "epoch": 2891} {"train_loss": -35.258968353271484, "global_step": 349902, "epoch": 2891} {"train_loss": -32.55758285522461, "global_step": 349903, "epoch": 2891} {"train_loss": -38.29204177856445, "global_step": 349904, "epoch": 2891} {"train_loss": -43.74351119995117, "global_step": 349905, "epoch": 2891} {"train_loss": -39.379249572753906, "global_step": 349906, "epoch": 2891} {"train_loss": -37.19880676269531, "global_step": 349907, "epoch": 2891} {"train_loss": -41.30741500854492, "global_step": 349908, "epoch": 2891} {"train_loss": -42.064693450927734, "global_step": 349909, "epoch": 2891} {"train_loss": -39.03398132324219, "global_step": 349910, "epoch": 2891} {"train_loss": -42.38669967651367, "global_step": 349911, "epoch": 2891} {"train_loss": -41.77524948120117, "global_step": 349912, "epoch": 2891} {"train_loss": -40.38228988647461, "global_step": 349913, "epoch": 2891} {"train_loss": -40.45566940307617, "global_step": 349914, "epoch": 2891} {"train_loss": -40.60315704345703, "global_step": 349915, "epoch": 2891} {"train_loss": -42.17045974731445, "global_step": 349916, "epoch": 2891} {"train_loss": -40.75596618652344, "global_step": 349917, "epoch": 2891} {"train_loss": -40.7956428527832, "global_step": 349918, "epoch": 2891} {"train_loss": -40.98394775390625, "global_step": 349919, "epoch": 2891} {"train_loss": -40.392578125, "global_step": 349920, "epoch": 2891} {"train_loss": -42.9455680847168, "global_step": 349921, "epoch": 2891} {"train_loss": -41.437801361083984, "global_step": 349922, "epoch": 2891} {"train_loss": -42.57353210449219, "global_step": 349923, "epoch": 2891} {"train_loss": -41.74922561645508, "global_step": 349924, "epoch": 2891} {"train_loss": -41.566062927246094, "global_step": 349925, "epoch": 2891} {"train_loss": -40.24611282348633, "global_step": 349926, "epoch": 2891} {"train_loss": -42.177364349365234, "global_step": 349927, "epoch": 2891} {"train_loss": -41.682106018066406, "global_step": 349928, "epoch": 2891} {"train_loss": -42.671627044677734, "global_step": 349929, "epoch": 2891} {"train_loss": -42.2305908203125, "global_step": 349930, "epoch": 2891} {"train_loss": -42.42383840261412, "global_step": 349931, "epoch": 2891, "val_loss": 2655522.5} {"train_loss": -42.17695999145508, "global_step": 349932, "epoch": 2892} {"train_loss": -39.47803497314453, "global_step": 349933, "epoch": 2892} {"train_loss": -39.565330505371094, "global_step": 349934, "epoch": 2892} {"train_loss": -41.33893585205078, "global_step": 349935, "epoch": 2892} {"train_loss": -42.702205657958984, "global_step": 349936, "epoch": 2892} {"train_loss": -43.22132873535156, "global_step": 349937, "epoch": 2892} {"train_loss": -31.713397979736328, "global_step": 349938, "epoch": 2892} {"train_loss": -37.54207992553711, "global_step": 349939, "epoch": 2892} {"train_loss": -39.19217300415039, "global_step": 349940, "epoch": 2892} {"train_loss": -41.16492462158203, "global_step": 349941, "epoch": 2892} {"train_loss": -42.30585861206055, "global_step": 349942, "epoch": 2892} {"train_loss": -42.36433029174805, "global_step": 349943, "epoch": 2892} {"train_loss": -42.001094818115234, "global_step": 349944, "epoch": 2892} {"train_loss": -41.48269271850586, "global_step": 349945, "epoch": 2892} {"train_loss": -39.956787109375, "global_step": 349946, "epoch": 2892} {"train_loss": -29.162799835205078, "global_step": 349947, "epoch": 2892} {"train_loss": -24.82553482055664, "global_step": 349948, "epoch": 2892} {"train_loss": -38.5683708190918, "global_step": 349949, "epoch": 2892} {"train_loss": -40.19594192504883, "global_step": 349950, "epoch": 2892} {"train_loss": -38.39498519897461, "global_step": 349951, "epoch": 2892} {"train_loss": -40.63434982299805, "global_step": 349952, "epoch": 2892} {"train_loss": -40.36128616333008, "global_step": 349953, "epoch": 2892} {"train_loss": -39.595245361328125, "global_step": 349954, "epoch": 2892} {"train_loss": -40.62109375, "global_step": 349955, "epoch": 2892} {"train_loss": -40.82584762573242, "global_step": 349956, "epoch": 2892} {"train_loss": -38.70960235595703, "global_step": 349957, "epoch": 2892} {"train_loss": -41.32182312011719, "global_step": 349958, "epoch": 2892} {"train_loss": -40.6832160949707, "global_step": 349959, "epoch": 2892} {"train_loss": -36.318206787109375, "global_step": 349960, "epoch": 2892} {"train_loss": -41.99746322631836, "global_step": 349961, "epoch": 2892} {"train_loss": -41.963531494140625, "global_step": 349962, "epoch": 2892} {"train_loss": -42.0368766784668, "global_step": 349963, "epoch": 2892} {"train_loss": -42.373897552490234, "global_step": 349964, "epoch": 2892} {"train_loss": -35.6170768737793, "global_step": 349965, "epoch": 2892} {"train_loss": -39.937191009521484, "global_step": 349966, "epoch": 2892} {"train_loss": -39.514381408691406, "global_step": 349967, "epoch": 2892} {"train_loss": -40.198097229003906, "global_step": 349968, "epoch": 2892} {"train_loss": -41.4844970703125, "global_step": 349969, "epoch": 2892} {"train_loss": -34.88180160522461, "global_step": 349970, "epoch": 2892} {"train_loss": -40.27762985229492, "global_step": 349971, "epoch": 2892} {"train_loss": -41.42983627319336, "global_step": 349972, "epoch": 2892} {"train_loss": -41.773193359375, "global_step": 349973, "epoch": 2892} {"train_loss": -40.66376876831055, "global_step": 349974, "epoch": 2892} {"train_loss": -40.231937408447266, "global_step": 349975, "epoch": 2892} {"train_loss": -42.10799026489258, "global_step": 349976, "epoch": 2892} {"train_loss": -41.402503967285156, "global_step": 349977, "epoch": 2892} {"train_loss": -42.39902114868164, "global_step": 349978, "epoch": 2892} {"train_loss": -41.349143981933594, "global_step": 349979, "epoch": 2892} {"train_loss": -39.01327896118164, "global_step": 349980, "epoch": 2892} {"train_loss": -40.95249938964844, "global_step": 349981, "epoch": 2892} {"train_loss": -41.55263900756836, "global_step": 349982, "epoch": 2892} {"train_loss": -41.796592712402344, "global_step": 349983, "epoch": 2892} {"train_loss": -40.26820373535156, "global_step": 349984, "epoch": 2892} {"train_loss": -41.07073974609375, "global_step": 349985, "epoch": 2892} {"train_loss": -41.063255310058594, "global_step": 349986, "epoch": 2892} {"train_loss": -42.359169006347656, "global_step": 349987, "epoch": 2892} {"train_loss": -42.00564193725586, "global_step": 349988, "epoch": 2892} {"train_loss": -42.03443145751953, "global_step": 349989, "epoch": 2892} {"train_loss": -39.353981018066406, "global_step": 349990, "epoch": 2892} {"train_loss": -42.154388427734375, "global_step": 349991, "epoch": 2892} {"train_loss": -41.51013946533203, "global_step": 349992, "epoch": 2892} {"train_loss": -41.93916702270508, "global_step": 349993, "epoch": 2892} {"train_loss": -42.187007904052734, "global_step": 349994, "epoch": 2892} {"train_loss": -42.92385482788086, "global_step": 349995, "epoch": 2892} {"train_loss": -42.86003494262695, "global_step": 349996, "epoch": 2892} {"train_loss": -42.25185775756836, "global_step": 349997, "epoch": 2892} {"train_loss": -41.964847564697266, "global_step": 349998, "epoch": 2892} {"train_loss": -42.5501594543457, "global_step": 349999, "epoch": 2892} {"train_loss": -43.05096435546875, "global_step": 350000, "epoch": 2892} {"train_loss": -42.53737258911133, "global_step": 350001, "epoch": 2892} {"train_loss": -42.32646560668945, "global_step": 350002, "epoch": 2892} {"train_loss": -42.76578140258789, "global_step": 350003, "epoch": 2892} {"train_loss": -42.7879753112793, "global_step": 350004, "epoch": 2892} {"train_loss": -43.23664855957031, "global_step": 350005, "epoch": 2892} {"train_loss": -43.199989318847656, "global_step": 350006, "epoch": 2892} {"train_loss": -43.423500061035156, "global_step": 350007, "epoch": 2892} {"train_loss": -43.07156753540039, "global_step": 350008, "epoch": 2892} {"train_loss": -43.20405197143555, "global_step": 350009, "epoch": 2892} {"train_loss": -42.93510055541992, "global_step": 350010, "epoch": 2892} {"train_loss": -42.81460189819336, "global_step": 350011, "epoch": 2892} {"train_loss": -42.870357513427734, "global_step": 350012, "epoch": 2892} {"train_loss": -43.16459274291992, "global_step": 350013, "epoch": 2892} {"train_loss": -43.19342041015625, "global_step": 350014, "epoch": 2892} {"train_loss": -42.53963851928711, "global_step": 350015, "epoch": 2892} {"train_loss": -43.30851745605469, "global_step": 350016, "epoch": 2892} {"train_loss": -42.51817321777344, "global_step": 350017, "epoch": 2892} {"train_loss": -43.61076354980469, "global_step": 350018, "epoch": 2892} {"train_loss": -43.785804748535156, "global_step": 350019, "epoch": 2892} {"train_loss": -43.2342529296875, "global_step": 350020, "epoch": 2892} {"train_loss": -42.119136810302734, "global_step": 350021, "epoch": 2892} {"train_loss": -43.587135314941406, "global_step": 350022, "epoch": 2892} {"train_loss": -43.29021072387695, "global_step": 350023, "epoch": 2892} {"train_loss": -43.617584228515625, "global_step": 350024, "epoch": 2892} {"train_loss": -43.566261291503906, "global_step": 350025, "epoch": 2892} {"train_loss": -43.95886993408203, "global_step": 350026, "epoch": 2892} {"train_loss": -42.34470748901367, "global_step": 350027, "epoch": 2892} {"train_loss": -42.765419006347656, "global_step": 350028, "epoch": 2892} {"train_loss": -43.68804168701172, "global_step": 350029, "epoch": 2892} {"train_loss": -43.19645309448242, "global_step": 350030, "epoch": 2892} {"train_loss": -42.148719787597656, "global_step": 350031, "epoch": 2892} {"train_loss": -41.43416976928711, "global_step": 350032, "epoch": 2892} {"train_loss": -43.80845260620117, "global_step": 350033, "epoch": 2892} {"train_loss": -43.21864700317383, "global_step": 350034, "epoch": 2892} {"train_loss": -43.375579833984375, "global_step": 350035, "epoch": 2892} {"train_loss": -43.023250579833984, "global_step": 350036, "epoch": 2892} {"train_loss": -43.90946960449219, "global_step": 350037, "epoch": 2892} {"train_loss": -43.193092346191406, "global_step": 350038, "epoch": 2892} {"train_loss": -43.869239807128906, "global_step": 350039, "epoch": 2892} {"train_loss": -43.774505615234375, "global_step": 350040, "epoch": 2892} {"train_loss": -41.789371490478516, "global_step": 350041, "epoch": 2892} {"train_loss": -43.31623458862305, "global_step": 350042, "epoch": 2892} {"train_loss": -44.22301483154297, "global_step": 350043, "epoch": 2892} {"train_loss": -43.58822250366211, "global_step": 350044, "epoch": 2892} {"train_loss": -43.676021575927734, "global_step": 350045, "epoch": 2892} {"train_loss": -44.010860443115234, "global_step": 350046, "epoch": 2892} {"train_loss": -43.07032012939453, "global_step": 350047, "epoch": 2892} {"train_loss": -42.93293762207031, "global_step": 350048, "epoch": 2892} {"train_loss": -41.97230911254883, "global_step": 350049, "epoch": 2892} {"train_loss": -41.78933334350586, "global_step": 350050, "epoch": 2892} {"train_loss": -43.00373458862305, "global_step": 350051, "epoch": 2892} {"train_loss": -41.523322302447866, "global_step": 350052, "epoch": 2892, "val_loss": 2638355.75} {"train_loss": -41.276397705078125, "global_step": 350053, "epoch": 2893} {"train_loss": -43.36381149291992, "global_step": 350054, "epoch": 2893} {"train_loss": -41.17092514038086, "global_step": 350055, "epoch": 2893} {"train_loss": -43.82841491699219, "global_step": 350056, "epoch": 2893} {"train_loss": -43.07274627685547, "global_step": 350057, "epoch": 2893} {"train_loss": -42.38564682006836, "global_step": 350058, "epoch": 2893} {"train_loss": -41.06296920776367, "global_step": 350059, "epoch": 2893} {"train_loss": -43.58662033081055, "global_step": 350060, "epoch": 2893} {"train_loss": -42.19916915893555, "global_step": 350061, "epoch": 2893} {"train_loss": -41.235321044921875, "global_step": 350062, "epoch": 2893} {"train_loss": -41.99805450439453, "global_step": 350063, "epoch": 2893} {"train_loss": -42.22731399536133, "global_step": 350064, "epoch": 2893} {"train_loss": -43.319541931152344, "global_step": 350065, "epoch": 2893} {"train_loss": -42.08405685424805, "global_step": 350066, "epoch": 2893} {"train_loss": -42.426605224609375, "global_step": 350067, "epoch": 2893} {"train_loss": -42.89117431640625, "global_step": 350068, "epoch": 2893} {"train_loss": -42.17435836791992, "global_step": 350069, "epoch": 2893} {"train_loss": -42.09427261352539, "global_step": 350070, "epoch": 2893} {"train_loss": -40.44242477416992, "global_step": 350071, "epoch": 2893} {"train_loss": -41.62203598022461, "global_step": 350072, "epoch": 2893} {"train_loss": -43.004878997802734, "global_step": 350073, "epoch": 2893} {"train_loss": -41.166709899902344, "global_step": 350074, "epoch": 2893} {"train_loss": -41.35585403442383, "global_step": 350075, "epoch": 2893} {"train_loss": -41.8397102355957, "global_step": 350076, "epoch": 2893} {"train_loss": -41.71200180053711, "global_step": 350077, "epoch": 2893} {"train_loss": -40.78233337402344, "global_step": 350078, "epoch": 2893} {"train_loss": -41.67426681518555, "global_step": 350079, "epoch": 2893} {"train_loss": -39.79679489135742, "global_step": 350080, "epoch": 2893} {"train_loss": -38.98308181762695, "global_step": 350081, "epoch": 2893} {"train_loss": -40.745887756347656, "global_step": 350082, "epoch": 2893} {"train_loss": -41.292964935302734, "global_step": 350083, "epoch": 2893} {"train_loss": -36.859554290771484, "global_step": 350084, "epoch": 2893} {"train_loss": -36.22499465942383, "global_step": 350085, "epoch": 2893} {"train_loss": -40.8511848449707, "global_step": 350086, "epoch": 2893} {"train_loss": -39.793724060058594, "global_step": 350087, "epoch": 2893} {"train_loss": -41.34911346435547, "global_step": 350088, "epoch": 2893} {"train_loss": -39.567359924316406, "global_step": 350089, "epoch": 2893} {"train_loss": -41.86440658569336, "global_step": 350090, "epoch": 2893} {"train_loss": -40.543094635009766, "global_step": 350091, "epoch": 2893} {"train_loss": -41.54383850097656, "global_step": 350092, "epoch": 2893} {"train_loss": -41.95392990112305, "global_step": 350093, "epoch": 2893} {"train_loss": -41.44279861450195, "global_step": 350094, "epoch": 2893} {"train_loss": -42.61537170410156, "global_step": 350095, "epoch": 2893} {"train_loss": -39.815345764160156, "global_step": 350096, "epoch": 2893} {"train_loss": -42.818328857421875, "global_step": 350097, "epoch": 2893} {"train_loss": -41.40662384033203, "global_step": 350098, "epoch": 2893} {"train_loss": -42.2371940612793, "global_step": 350099, "epoch": 2893} {"train_loss": -40.51041030883789, "global_step": 350100, "epoch": 2893} {"train_loss": -42.12029266357422, "global_step": 350101, "epoch": 2893} {"train_loss": -42.76077651977539, "global_step": 350102, "epoch": 2893} {"train_loss": -41.606998443603516, "global_step": 350103, "epoch": 2893} {"train_loss": -42.09218215942383, "global_step": 350104, "epoch": 2893} {"train_loss": -42.58790969848633, "global_step": 350105, "epoch": 2893} {"train_loss": -42.547306060791016, "global_step": 350106, "epoch": 2893} {"train_loss": -43.24918746948242, "global_step": 350107, "epoch": 2893} {"train_loss": -42.21110916137695, "global_step": 350108, "epoch": 2893} {"train_loss": -42.584259033203125, "global_step": 350109, "epoch": 2893} {"train_loss": -42.924861907958984, "global_step": 350110, "epoch": 2893} {"train_loss": -42.16838073730469, "global_step": 350111, "epoch": 2893} {"train_loss": -43.383018493652344, "global_step": 350112, "epoch": 2893} {"train_loss": -42.72969436645508, "global_step": 350113, "epoch": 2893} {"train_loss": -43.24382400512695, "global_step": 350114, "epoch": 2893} {"train_loss": -43.15843200683594, "global_step": 350115, "epoch": 2893} {"train_loss": -42.81411361694336, "global_step": 350116, "epoch": 2893} {"train_loss": -43.10305404663086, "global_step": 350117, "epoch": 2893} {"train_loss": -43.38227462768555, "global_step": 350118, "epoch": 2893} {"train_loss": -42.361942291259766, "global_step": 350119, "epoch": 2893} {"train_loss": -42.249671936035156, "global_step": 350120, "epoch": 2893} {"train_loss": -43.758636474609375, "global_step": 350121, "epoch": 2893} {"train_loss": -43.67702102661133, "global_step": 350122, "epoch": 2893} {"train_loss": -41.52839279174805, "global_step": 350123, "epoch": 2893} {"train_loss": -43.95252227783203, "global_step": 350124, "epoch": 2893} {"train_loss": -43.41112518310547, "global_step": 350125, "epoch": 2893} {"train_loss": -41.6595573425293, "global_step": 350126, "epoch": 2893} {"train_loss": -43.76107406616211, "global_step": 350127, "epoch": 2893} {"train_loss": -44.0594482421875, "global_step": 350128, "epoch": 2893} {"train_loss": -43.133785247802734, "global_step": 350129, "epoch": 2893} {"train_loss": -43.5280647277832, "global_step": 350130, "epoch": 2893} {"train_loss": -43.51641845703125, "global_step": 350131, "epoch": 2893} {"train_loss": -43.8045539855957, "global_step": 350132, "epoch": 2893} {"train_loss": -43.8346061706543, "global_step": 350133, "epoch": 2893} {"train_loss": -42.02309799194336, "global_step": 350134, "epoch": 2893} {"train_loss": -43.454097747802734, "global_step": 350135, "epoch": 2893} {"train_loss": -44.043636322021484, "global_step": 350136, "epoch": 2893} {"train_loss": -43.1258659362793, "global_step": 350137, "epoch": 2893} {"train_loss": -43.666900634765625, "global_step": 350138, "epoch": 2893} {"train_loss": -44.26828384399414, "global_step": 350139, "epoch": 2893} {"train_loss": -43.018978118896484, "global_step": 350140, "epoch": 2893} {"train_loss": -44.08071517944336, "global_step": 350141, "epoch": 2893} {"train_loss": -43.52634811401367, "global_step": 350142, "epoch": 2893} {"train_loss": -43.6962776184082, "global_step": 350143, "epoch": 2893} {"train_loss": -44.48460006713867, "global_step": 350144, "epoch": 2893} {"train_loss": -42.311927795410156, "global_step": 350145, "epoch": 2893} {"train_loss": -43.84150314331055, "global_step": 350146, "epoch": 2893} {"train_loss": -42.837615966796875, "global_step": 350147, "epoch": 2893} {"train_loss": -43.06807327270508, "global_step": 350148, "epoch": 2893} {"train_loss": -44.43757247924805, "global_step": 350149, "epoch": 2893} {"train_loss": -44.40456771850586, "global_step": 350150, "epoch": 2893} {"train_loss": -43.65220260620117, "global_step": 350151, "epoch": 2893} {"train_loss": -43.65108108520508, "global_step": 350152, "epoch": 2893} {"train_loss": -43.830360412597656, "global_step": 350153, "epoch": 2893} {"train_loss": -44.41391372680664, "global_step": 350154, "epoch": 2893} {"train_loss": -42.983665466308594, "global_step": 350155, "epoch": 2893} {"train_loss": -44.4041633605957, "global_step": 350156, "epoch": 2893} {"train_loss": -42.80373764038086, "global_step": 350157, "epoch": 2893} {"train_loss": -43.83160400390625, "global_step": 350158, "epoch": 2893} {"train_loss": -44.60450744628906, "global_step": 350159, "epoch": 2893} {"train_loss": -42.874290466308594, "global_step": 350160, "epoch": 2893} {"train_loss": -43.97800064086914, "global_step": 350161, "epoch": 2893} {"train_loss": -42.45888900756836, "global_step": 350162, "epoch": 2893} {"train_loss": -43.46211624145508, "global_step": 350163, "epoch": 2893} {"train_loss": -44.488555908203125, "global_step": 350164, "epoch": 2893} {"train_loss": -43.396976470947266, "global_step": 350165, "epoch": 2893} {"train_loss": -43.47978591918945, "global_step": 350166, "epoch": 2893} {"train_loss": -43.00563430786133, "global_step": 350167, "epoch": 2893} {"train_loss": -44.031795501708984, "global_step": 350168, "epoch": 2893} {"train_loss": -43.53547668457031, "global_step": 350169, "epoch": 2893} {"train_loss": -42.27703857421875, "global_step": 350170, "epoch": 2893} {"train_loss": -42.375091552734375, "global_step": 350171, "epoch": 2893} {"train_loss": -43.66764450073242, "global_step": 350172, "epoch": 2893} {"train_loss": -42.51293973686281, "global_step": 350173, "epoch": 2893, "val_loss": 2797406.0} {"train_loss": -36.33808135986328, "global_step": 350174, "epoch": 2894} {"train_loss": -41.18948745727539, "global_step": 350175, "epoch": 2894} {"train_loss": -41.65978240966797, "global_step": 350176, "epoch": 2894} {"train_loss": -43.14167404174805, "global_step": 350177, "epoch": 2894} {"train_loss": -39.16897201538086, "global_step": 350178, "epoch": 2894} {"train_loss": -43.136566162109375, "global_step": 350179, "epoch": 2894} {"train_loss": -42.5345458984375, "global_step": 350180, "epoch": 2894} {"train_loss": -42.543766021728516, "global_step": 350181, "epoch": 2894} {"train_loss": -41.343231201171875, "global_step": 350182, "epoch": 2894} {"train_loss": -43.7606201171875, "global_step": 350183, "epoch": 2894} {"train_loss": -43.06372833251953, "global_step": 350184, "epoch": 2894} {"train_loss": -42.459651947021484, "global_step": 350185, "epoch": 2894} {"train_loss": -42.49738311767578, "global_step": 350186, "epoch": 2894} {"train_loss": -43.39619064331055, "global_step": 350187, "epoch": 2894} {"train_loss": -40.20357894897461, "global_step": 350188, "epoch": 2894} {"train_loss": -41.557708740234375, "global_step": 350189, "epoch": 2894} {"train_loss": -42.87569808959961, "global_step": 350190, "epoch": 2894} {"train_loss": -40.826995849609375, "global_step": 350191, "epoch": 2894} {"train_loss": -36.91932678222656, "global_step": 350192, "epoch": 2894} {"train_loss": -42.9697380065918, "global_step": 350193, "epoch": 2894} {"train_loss": -41.0554313659668, "global_step": 350194, "epoch": 2894} {"train_loss": -43.18131637573242, "global_step": 350195, "epoch": 2894} {"train_loss": -41.9435920715332, "global_step": 350196, "epoch": 2894} {"train_loss": -43.659481048583984, "global_step": 350197, "epoch": 2894} {"train_loss": -42.157371520996094, "global_step": 350198, "epoch": 2894} {"train_loss": -41.8104248046875, "global_step": 350199, "epoch": 2894} {"train_loss": -42.325836181640625, "global_step": 350200, "epoch": 2894} {"train_loss": -42.834224700927734, "global_step": 350201, "epoch": 2894} {"train_loss": -42.93169403076172, "global_step": 350202, "epoch": 2894} {"train_loss": -42.56062698364258, "global_step": 350203, "epoch": 2894} {"train_loss": -41.874359130859375, "global_step": 350204, "epoch": 2894} {"train_loss": -39.99186706542969, "global_step": 350205, "epoch": 2894} {"train_loss": -42.63950729370117, "global_step": 350206, "epoch": 2894} {"train_loss": -41.51654052734375, "global_step": 350207, "epoch": 2894} {"train_loss": -42.96794509887695, "global_step": 350208, "epoch": 2894} {"train_loss": -42.44257354736328, "global_step": 350209, "epoch": 2894} {"train_loss": -42.706539154052734, "global_step": 350210, "epoch": 2894} {"train_loss": -42.516231536865234, "global_step": 350211, "epoch": 2894} {"train_loss": -42.8411865234375, "global_step": 350212, "epoch": 2894} {"train_loss": -42.99573516845703, "global_step": 350213, "epoch": 2894} {"train_loss": -42.73635482788086, "global_step": 350214, "epoch": 2894} {"train_loss": -40.48594665527344, "global_step": 350215, "epoch": 2894} {"train_loss": -43.09565353393555, "global_step": 350216, "epoch": 2894} {"train_loss": -40.3242073059082, "global_step": 350217, "epoch": 2894} {"train_loss": -41.76575469970703, "global_step": 350218, "epoch": 2894} {"train_loss": -43.096988677978516, "global_step": 350219, "epoch": 2894} {"train_loss": -43.22153091430664, "global_step": 350220, "epoch": 2894} {"train_loss": -24.44057273864746, "global_step": 350221, "epoch": 2894} {"train_loss": -42.19875717163086, "global_step": 350222, "epoch": 2894} {"train_loss": -42.17193603515625, "global_step": 350223, "epoch": 2894} {"train_loss": -42.33170700073242, "global_step": 350224, "epoch": 2894} {"train_loss": -42.016334533691406, "global_step": 350225, "epoch": 2894} {"train_loss": -42.65774154663086, "global_step": 350226, "epoch": 2894} {"train_loss": -40.62663650512695, "global_step": 350227, "epoch": 2894} {"train_loss": -41.29939651489258, "global_step": 350228, "epoch": 2894} {"train_loss": -40.80489730834961, "global_step": 350229, "epoch": 2894} {"train_loss": -42.11181640625, "global_step": 350230, "epoch": 2894} {"train_loss": -38.8219108581543, "global_step": 350231, "epoch": 2894} {"train_loss": -42.62296676635742, "global_step": 350232, "epoch": 2894} {"train_loss": -41.2489128112793, "global_step": 350233, "epoch": 2894} {"train_loss": -42.27848434448242, "global_step": 350234, "epoch": 2894} {"train_loss": -41.58456802368164, "global_step": 350235, "epoch": 2894} {"train_loss": -43.122554779052734, "global_step": 350236, "epoch": 2894} {"train_loss": -40.455501556396484, "global_step": 350237, "epoch": 2894} {"train_loss": -41.391563415527344, "global_step": 350238, "epoch": 2894} {"train_loss": -40.38985061645508, "global_step": 350239, "epoch": 2894} {"train_loss": -37.84989547729492, "global_step": 350240, "epoch": 2894} {"train_loss": -41.87813949584961, "global_step": 350241, "epoch": 2894} {"train_loss": -40.796424865722656, "global_step": 350242, "epoch": 2894} {"train_loss": -41.216487884521484, "global_step": 350243, "epoch": 2894} {"train_loss": -42.19931411743164, "global_step": 350244, "epoch": 2894} {"train_loss": -41.950260162353516, "global_step": 350245, "epoch": 2894} {"train_loss": -41.09710693359375, "global_step": 350246, "epoch": 2894} {"train_loss": -42.55542755126953, "global_step": 350247, "epoch": 2894} {"train_loss": -42.538169860839844, "global_step": 350248, "epoch": 2894} {"train_loss": -41.705501556396484, "global_step": 350249, "epoch": 2894} {"train_loss": -43.355438232421875, "global_step": 350250, "epoch": 2894} {"train_loss": -42.2166862487793, "global_step": 350251, "epoch": 2894} {"train_loss": -42.65971755981445, "global_step": 350252, "epoch": 2894} {"train_loss": -38.54524612426758, "global_step": 350253, "epoch": 2894} {"train_loss": -43.09737014770508, "global_step": 350254, "epoch": 2894} {"train_loss": -35.8874626159668, "global_step": 350255, "epoch": 2894} {"train_loss": -37.19413375854492, "global_step": 350256, "epoch": 2894} {"train_loss": -43.30683898925781, "global_step": 350257, "epoch": 2894} {"train_loss": -40.94074249267578, "global_step": 350258, "epoch": 2894} {"train_loss": -42.270782470703125, "global_step": 350259, "epoch": 2894} {"train_loss": -42.346778869628906, "global_step": 350260, "epoch": 2894} {"train_loss": -43.106536865234375, "global_step": 350261, "epoch": 2894} {"train_loss": -41.508541107177734, "global_step": 350262, "epoch": 2894} {"train_loss": -42.32175827026367, "global_step": 350263, "epoch": 2894} {"train_loss": -42.746456146240234, "global_step": 350264, "epoch": 2894} {"train_loss": -43.11091232299805, "global_step": 350265, "epoch": 2894} {"train_loss": -41.27080154418945, "global_step": 350266, "epoch": 2894} {"train_loss": -42.80598449707031, "global_step": 350267, "epoch": 2894} {"train_loss": -43.295753479003906, "global_step": 350268, "epoch": 2894} {"train_loss": -40.303123474121094, "global_step": 350269, "epoch": 2894} {"train_loss": -42.71912384033203, "global_step": 350270, "epoch": 2894} {"train_loss": -41.34916305541992, "global_step": 350271, "epoch": 2894} {"train_loss": -43.43634033203125, "global_step": 350272, "epoch": 2894} {"train_loss": -42.11906051635742, "global_step": 350273, "epoch": 2894} {"train_loss": -43.19010543823242, "global_step": 350274, "epoch": 2894} {"train_loss": -42.3829460144043, "global_step": 350275, "epoch": 2894} {"train_loss": -42.52490997314453, "global_step": 350276, "epoch": 2894} {"train_loss": -43.661983489990234, "global_step": 350277, "epoch": 2894} {"train_loss": -41.82976150512695, "global_step": 350278, "epoch": 2894} {"train_loss": -39.74200439453125, "global_step": 350279, "epoch": 2894} {"train_loss": -43.364418029785156, "global_step": 350280, "epoch": 2894} {"train_loss": -41.601539611816406, "global_step": 350281, "epoch": 2894} {"train_loss": -43.01011657714844, "global_step": 350282, "epoch": 2894} {"train_loss": -42.92951965332031, "global_step": 350283, "epoch": 2894} {"train_loss": -43.056453704833984, "global_step": 350284, "epoch": 2894} {"train_loss": -42.062255859375, "global_step": 350285, "epoch": 2894} {"train_loss": -43.38778305053711, "global_step": 350286, "epoch": 2894} {"train_loss": -43.5810661315918, "global_step": 350287, "epoch": 2894} {"train_loss": -42.46418380737305, "global_step": 350288, "epoch": 2894} {"train_loss": -43.93949508666992, "global_step": 350289, "epoch": 2894} {"train_loss": -43.15633773803711, "global_step": 350290, "epoch": 2894} {"train_loss": -43.30441665649414, "global_step": 350291, "epoch": 2894} {"train_loss": -43.3515625, "global_step": 350292, "epoch": 2894} {"train_loss": -43.92534255981445, "global_step": 350293, "epoch": 2894} {"train_loss": -41.83338548329251, "global_step": 350294, "epoch": 2894, "val_loss": 2707919.0} {"train_loss": -43.45351028442383, "global_step": 350295, "epoch": 2895} {"train_loss": -42.73775863647461, "global_step": 350296, "epoch": 2895} {"train_loss": -44.14117431640625, "global_step": 350297, "epoch": 2895} {"train_loss": -43.1744384765625, "global_step": 350298, "epoch": 2895} {"train_loss": -43.89162826538086, "global_step": 350299, "epoch": 2895} {"train_loss": -43.78712844848633, "global_step": 350300, "epoch": 2895} {"train_loss": -43.679141998291016, "global_step": 350301, "epoch": 2895} {"train_loss": -43.820831298828125, "global_step": 350302, "epoch": 2895} {"train_loss": -44.30831527709961, "global_step": 350303, "epoch": 2895} {"train_loss": -44.11732864379883, "global_step": 350304, "epoch": 2895} {"train_loss": -42.52735137939453, "global_step": 350305, "epoch": 2895} {"train_loss": -44.48249816894531, "global_step": 350306, "epoch": 2895} {"train_loss": -43.199920654296875, "global_step": 350307, "epoch": 2895} {"train_loss": -44.054237365722656, "global_step": 350308, "epoch": 2895} {"train_loss": -44.24776077270508, "global_step": 350309, "epoch": 2895} {"train_loss": -43.58648681640625, "global_step": 350310, "epoch": 2895} {"train_loss": -43.59907150268555, "global_step": 350311, "epoch": 2895} {"train_loss": -42.91270065307617, "global_step": 350312, "epoch": 2895} {"train_loss": -43.205604553222656, "global_step": 350313, "epoch": 2895} {"train_loss": -43.88797378540039, "global_step": 350314, "epoch": 2895} {"train_loss": -43.986732482910156, "global_step": 350315, "epoch": 2895} {"train_loss": -43.65277099609375, "global_step": 350316, "epoch": 2895} {"train_loss": -43.445003509521484, "global_step": 350317, "epoch": 2895} {"train_loss": -43.564815521240234, "global_step": 350318, "epoch": 2895} {"train_loss": -41.7020263671875, "global_step": 350319, "epoch": 2895} {"train_loss": -43.863712310791016, "global_step": 350320, "epoch": 2895} {"train_loss": -41.8986701965332, "global_step": 350321, "epoch": 2895} {"train_loss": -43.043060302734375, "global_step": 350322, "epoch": 2895} {"train_loss": -44.58944320678711, "global_step": 350323, "epoch": 2895} {"train_loss": -43.53996658325195, "global_step": 350324, "epoch": 2895} {"train_loss": -44.48489761352539, "global_step": 350325, "epoch": 2895} {"train_loss": -43.6261100769043, "global_step": 350326, "epoch": 2895} {"train_loss": -44.20595932006836, "global_step": 350327, "epoch": 2895} {"train_loss": -43.03036117553711, "global_step": 350328, "epoch": 2895} {"train_loss": -43.91706466674805, "global_step": 350329, "epoch": 2895} {"train_loss": -42.49540328979492, "global_step": 350330, "epoch": 2895} {"train_loss": -44.28778839111328, "global_step": 350331, "epoch": 2895} {"train_loss": -42.74823760986328, "global_step": 350332, "epoch": 2895} {"train_loss": -43.28763961791992, "global_step": 350333, "epoch": 2895} {"train_loss": -43.63374710083008, "global_step": 350334, "epoch": 2895} {"train_loss": -44.66086959838867, "global_step": 350335, "epoch": 2895} {"train_loss": -42.88629913330078, "global_step": 350336, "epoch": 2895} {"train_loss": -43.855899810791016, "global_step": 350337, "epoch": 2895} {"train_loss": -43.888179779052734, "global_step": 350338, "epoch": 2895} {"train_loss": -43.81475067138672, "global_step": 350339, "epoch": 2895} {"train_loss": -44.699981689453125, "global_step": 350340, "epoch": 2895} {"train_loss": -44.23918914794922, "global_step": 350341, "epoch": 2895} {"train_loss": -44.661800384521484, "global_step": 350342, "epoch": 2895} {"train_loss": -44.151058197021484, "global_step": 350343, "epoch": 2895} {"train_loss": -44.03131866455078, "global_step": 350344, "epoch": 2895} {"train_loss": -44.23000717163086, "global_step": 350345, "epoch": 2895} {"train_loss": -43.54294204711914, "global_step": 350346, "epoch": 2895} {"train_loss": -43.11745834350586, "global_step": 350347, "epoch": 2895} {"train_loss": -44.57577133178711, "global_step": 350348, "epoch": 2895} {"train_loss": -43.429447174072266, "global_step": 350349, "epoch": 2895} {"train_loss": -43.43039321899414, "global_step": 350350, "epoch": 2895} {"train_loss": -41.62363815307617, "global_step": 350351, "epoch": 2895} {"train_loss": -41.45920944213867, "global_step": 350352, "epoch": 2895} {"train_loss": -40.75550842285156, "global_step": 350353, "epoch": 2895} {"train_loss": -41.61606979370117, "global_step": 350354, "epoch": 2895} {"train_loss": -43.13821029663086, "global_step": 350355, "epoch": 2895} {"train_loss": -43.1638069152832, "global_step": 350356, "epoch": 2895} {"train_loss": -43.845428466796875, "global_step": 350357, "epoch": 2895} {"train_loss": -43.1058464050293, "global_step": 350358, "epoch": 2895} {"train_loss": -42.16389083862305, "global_step": 350359, "epoch": 2895} {"train_loss": -41.2647590637207, "global_step": 350360, "epoch": 2895} {"train_loss": -39.620628356933594, "global_step": 350361, "epoch": 2895} {"train_loss": -42.60239791870117, "global_step": 350362, "epoch": 2895} {"train_loss": -42.410396575927734, "global_step": 350363, "epoch": 2895} {"train_loss": -39.17194747924805, "global_step": 350364, "epoch": 2895} {"train_loss": -39.350826263427734, "global_step": 350365, "epoch": 2895} {"train_loss": -41.176475524902344, "global_step": 350366, "epoch": 2895} {"train_loss": -42.9361686706543, "global_step": 350367, "epoch": 2895} {"train_loss": -43.333099365234375, "global_step": 350368, "epoch": 2895} {"train_loss": -42.76123809814453, "global_step": 350369, "epoch": 2895} {"train_loss": -42.35287094116211, "global_step": 350370, "epoch": 2895} {"train_loss": -42.16774368286133, "global_step": 350371, "epoch": 2895} {"train_loss": -42.76008987426758, "global_step": 350372, "epoch": 2895} {"train_loss": -41.7647819519043, "global_step": 350373, "epoch": 2895} {"train_loss": -40.26528549194336, "global_step": 350374, "epoch": 2895} {"train_loss": -41.26102828979492, "global_step": 350375, "epoch": 2895} {"train_loss": -42.4102897644043, "global_step": 350376, "epoch": 2895} {"train_loss": -41.5626335144043, "global_step": 350377, "epoch": 2895} {"train_loss": -41.385982513427734, "global_step": 350378, "epoch": 2895} {"train_loss": -40.76371765136719, "global_step": 350379, "epoch": 2895} {"train_loss": -40.11573028564453, "global_step": 350380, "epoch": 2895} {"train_loss": -42.236083984375, "global_step": 350381, "epoch": 2895} {"train_loss": -40.395233154296875, "global_step": 350382, "epoch": 2895} {"train_loss": -41.80825424194336, "global_step": 350383, "epoch": 2895} {"train_loss": -42.558448791503906, "global_step": 350384, "epoch": 2895} {"train_loss": -41.1893424987793, "global_step": 350385, "epoch": 2895} {"train_loss": -41.92914962768555, "global_step": 350386, "epoch": 2895} {"train_loss": -41.03763961791992, "global_step": 350387, "epoch": 2895} {"train_loss": -42.69077682495117, "global_step": 350388, "epoch": 2895} {"train_loss": -42.042354583740234, "global_step": 350389, "epoch": 2895} {"train_loss": -42.067012786865234, "global_step": 350390, "epoch": 2895} {"train_loss": -43.05320358276367, "global_step": 350391, "epoch": 2895} {"train_loss": -42.63792419433594, "global_step": 350392, "epoch": 2895} {"train_loss": -42.61445236206055, "global_step": 350393, "epoch": 2895} {"train_loss": -41.72079849243164, "global_step": 350394, "epoch": 2895} {"train_loss": -42.9731559753418, "global_step": 350395, "epoch": 2895} {"train_loss": -42.005889892578125, "global_step": 350396, "epoch": 2895} {"train_loss": -42.23307418823242, "global_step": 350397, "epoch": 2895} {"train_loss": -42.22269058227539, "global_step": 350398, "epoch": 2895} {"train_loss": -41.92878341674805, "global_step": 350399, "epoch": 2895} {"train_loss": -42.452266693115234, "global_step": 350400, "epoch": 2895} {"train_loss": -42.7614631652832, "global_step": 350401, "epoch": 2895} {"train_loss": -42.414939880371094, "global_step": 350402, "epoch": 2895} {"train_loss": -42.64168930053711, "global_step": 350403, "epoch": 2895} {"train_loss": -41.5925178527832, "global_step": 350404, "epoch": 2895} {"train_loss": -43.287445068359375, "global_step": 350405, "epoch": 2895} {"train_loss": -41.177730560302734, "global_step": 350406, "epoch": 2895} {"train_loss": -42.51810073852539, "global_step": 350407, "epoch": 2895} {"train_loss": -43.45600891113281, "global_step": 350408, "epoch": 2895} {"train_loss": -42.6161994934082, "global_step": 350409, "epoch": 2895} {"train_loss": -41.81136703491211, "global_step": 350410, "epoch": 2895} {"train_loss": -43.31489181518555, "global_step": 350411, "epoch": 2895} {"train_loss": -42.98454284667969, "global_step": 350412, "epoch": 2895} {"train_loss": -42.87125778198242, "global_step": 350413, "epoch": 2895} {"train_loss": -43.05610656738281, "global_step": 350414, "epoch": 2895} {"train_loss": -42.79362487792969, "global_step": 350415, "epoch": 2895, "val_loss": 2693516.75} {"train_loss": -43.34743881225586, "global_step": 350416, "epoch": 2896} {"train_loss": -43.504756927490234, "global_step": 350417, "epoch": 2896} {"train_loss": -42.64772415161133, "global_step": 350418, "epoch": 2896} {"train_loss": -43.03096008300781, "global_step": 350419, "epoch": 2896} {"train_loss": -42.39393615722656, "global_step": 350420, "epoch": 2896} {"train_loss": -43.6234016418457, "global_step": 350421, "epoch": 2896} {"train_loss": -42.10145568847656, "global_step": 350422, "epoch": 2896} {"train_loss": -43.109962463378906, "global_step": 350423, "epoch": 2896} {"train_loss": -43.33800506591797, "global_step": 350424, "epoch": 2896} {"train_loss": -43.6604118347168, "global_step": 350425, "epoch": 2896} {"train_loss": -42.47705078125, "global_step": 350426, "epoch": 2896} {"train_loss": -42.651283264160156, "global_step": 350427, "epoch": 2896} {"train_loss": -35.1585693359375, "global_step": 350428, "epoch": 2896} {"train_loss": -42.611690521240234, "global_step": 350429, "epoch": 2896} {"train_loss": -37.687740325927734, "global_step": 350430, "epoch": 2896} {"train_loss": -43.142127990722656, "global_step": 350431, "epoch": 2896} {"train_loss": -40.2669677734375, "global_step": 350432, "epoch": 2896} {"train_loss": -42.925453186035156, "global_step": 350433, "epoch": 2896} {"train_loss": -43.51995086669922, "global_step": 350434, "epoch": 2896} {"train_loss": -43.49883270263672, "global_step": 350435, "epoch": 2896} {"train_loss": -43.46852111816406, "global_step": 350436, "epoch": 2896} {"train_loss": -43.680877685546875, "global_step": 350437, "epoch": 2896} {"train_loss": -41.66896438598633, "global_step": 350438, "epoch": 2896} {"train_loss": -43.40771484375, "global_step": 350439, "epoch": 2896} {"train_loss": -43.78426742553711, "global_step": 350440, "epoch": 2896} {"train_loss": -42.56059646606445, "global_step": 350441, "epoch": 2896} {"train_loss": -42.613311767578125, "global_step": 350442, "epoch": 2896} {"train_loss": -43.34780502319336, "global_step": 350443, "epoch": 2896} {"train_loss": -43.79385757446289, "global_step": 350444, "epoch": 2896} {"train_loss": -43.6937141418457, "global_step": 350445, "epoch": 2896} {"train_loss": -34.3524055480957, "global_step": 350446, "epoch": 2896} {"train_loss": -43.221683502197266, "global_step": 350447, "epoch": 2896} {"train_loss": -44.19450378417969, "global_step": 350448, "epoch": 2896} {"train_loss": -44.13334274291992, "global_step": 350449, "epoch": 2896} {"train_loss": -42.21117401123047, "global_step": 350450, "epoch": 2896} {"train_loss": -44.06250762939453, "global_step": 350451, "epoch": 2896} {"train_loss": -43.62627029418945, "global_step": 350452, "epoch": 2896} {"train_loss": -43.774715423583984, "global_step": 350453, "epoch": 2896} {"train_loss": -44.17418670654297, "global_step": 350454, "epoch": 2896} {"train_loss": -43.223114013671875, "global_step": 350455, "epoch": 2896} {"train_loss": -42.51362228393555, "global_step": 350456, "epoch": 2896} {"train_loss": -43.77681350708008, "global_step": 350457, "epoch": 2896} {"train_loss": -42.898468017578125, "global_step": 350458, "epoch": 2896} {"train_loss": -44.29267501831055, "global_step": 350459, "epoch": 2896} {"train_loss": -44.403106689453125, "global_step": 350460, "epoch": 2896} {"train_loss": -43.905235290527344, "global_step": 350461, "epoch": 2896} {"train_loss": -44.19259262084961, "global_step": 350462, "epoch": 2896} {"train_loss": -43.0384521484375, "global_step": 350463, "epoch": 2896} {"train_loss": -44.41650390625, "global_step": 350464, "epoch": 2896} {"train_loss": -43.774139404296875, "global_step": 350465, "epoch": 2896} {"train_loss": -43.818294525146484, "global_step": 350466, "epoch": 2896} {"train_loss": -44.532466888427734, "global_step": 350467, "epoch": 2896} {"train_loss": -43.94132614135742, "global_step": 350468, "epoch": 2896} {"train_loss": -44.750099182128906, "global_step": 350469, "epoch": 2896} {"train_loss": -44.48260498046875, "global_step": 350470, "epoch": 2896} {"train_loss": -44.27328872680664, "global_step": 350471, "epoch": 2896} {"train_loss": -43.996009826660156, "global_step": 350472, "epoch": 2896} {"train_loss": -44.313377380371094, "global_step": 350473, "epoch": 2896} {"train_loss": -43.673072814941406, "global_step": 350474, "epoch": 2896} {"train_loss": -43.94233322143555, "global_step": 350475, "epoch": 2896} {"train_loss": -44.24753952026367, "global_step": 350476, "epoch": 2896} {"train_loss": -43.10207748413086, "global_step": 350477, "epoch": 2896} {"train_loss": -44.355220794677734, "global_step": 350478, "epoch": 2896} {"train_loss": -43.69340896606445, "global_step": 350479, "epoch": 2896} {"train_loss": -44.217567443847656, "global_step": 350480, "epoch": 2896} {"train_loss": -43.092960357666016, "global_step": 350481, "epoch": 2896} {"train_loss": -43.86119842529297, "global_step": 350482, "epoch": 2896} {"train_loss": -44.493648529052734, "global_step": 350483, "epoch": 2896} {"train_loss": -43.02594757080078, "global_step": 350484, "epoch": 2896} {"train_loss": -42.90788650512695, "global_step": 350485, "epoch": 2896} {"train_loss": -43.7450065612793, "global_step": 350486, "epoch": 2896} {"train_loss": -42.49495315551758, "global_step": 350487, "epoch": 2896} {"train_loss": -43.850440979003906, "global_step": 350488, "epoch": 2896} {"train_loss": -43.57766342163086, "global_step": 350489, "epoch": 2896} {"train_loss": -44.165130615234375, "global_step": 350490, "epoch": 2896} {"train_loss": -44.08928298950195, "global_step": 350491, "epoch": 2896} {"train_loss": -43.37636947631836, "global_step": 350492, "epoch": 2896} {"train_loss": -42.48825454711914, "global_step": 350493, "epoch": 2896} {"train_loss": -43.6415901184082, "global_step": 350494, "epoch": 2896} {"train_loss": -43.47697067260742, "global_step": 350495, "epoch": 2896} {"train_loss": -43.838558197021484, "global_step": 350496, "epoch": 2896} {"train_loss": -44.03058624267578, "global_step": 350497, "epoch": 2896} {"train_loss": -43.27745056152344, "global_step": 350498, "epoch": 2896} {"train_loss": -43.474666595458984, "global_step": 350499, "epoch": 2896} {"train_loss": -43.601470947265625, "global_step": 350500, "epoch": 2896} {"train_loss": -42.7004280090332, "global_step": 350501, "epoch": 2896} {"train_loss": -44.00423049926758, "global_step": 350502, "epoch": 2896} {"train_loss": -43.78497314453125, "global_step": 350503, "epoch": 2896} {"train_loss": -43.119956970214844, "global_step": 350504, "epoch": 2896} {"train_loss": -42.5900993347168, "global_step": 350505, "epoch": 2896} {"train_loss": -43.0832633972168, "global_step": 350506, "epoch": 2896} {"train_loss": -43.924346923828125, "global_step": 350507, "epoch": 2896} {"train_loss": -43.94293212890625, "global_step": 350508, "epoch": 2896} {"train_loss": -42.26826095581055, "global_step": 350509, "epoch": 2896} {"train_loss": -40.92415237426758, "global_step": 350510, "epoch": 2896} {"train_loss": -40.44795608520508, "global_step": 350511, "epoch": 2896} {"train_loss": -41.44234848022461, "global_step": 350512, "epoch": 2896} {"train_loss": -42.07444763183594, "global_step": 350513, "epoch": 2896} {"train_loss": -42.22150802612305, "global_step": 350514, "epoch": 2896} {"train_loss": -41.997047424316406, "global_step": 350515, "epoch": 2896} {"train_loss": -42.85841751098633, "global_step": 350516, "epoch": 2896} {"train_loss": -38.81650161743164, "global_step": 350517, "epoch": 2896} {"train_loss": -40.44889450073242, "global_step": 350518, "epoch": 2896} {"train_loss": -43.3433723449707, "global_step": 350519, "epoch": 2896} {"train_loss": -40.29912185668945, "global_step": 350520, "epoch": 2896} {"train_loss": -40.6648063659668, "global_step": 350521, "epoch": 2896} {"train_loss": -42.573883056640625, "global_step": 350522, "epoch": 2896} {"train_loss": -40.85963821411133, "global_step": 350523, "epoch": 2896} {"train_loss": -40.815948486328125, "global_step": 350524, "epoch": 2896} {"train_loss": -43.30601119995117, "global_step": 350525, "epoch": 2896} {"train_loss": -41.81545639038086, "global_step": 350526, "epoch": 2896} {"train_loss": -40.73734664916992, "global_step": 350527, "epoch": 2896} {"train_loss": -43.194183349609375, "global_step": 350528, "epoch": 2896} {"train_loss": -42.077125549316406, "global_step": 350529, "epoch": 2896} {"train_loss": -43.31633377075195, "global_step": 350530, "epoch": 2896} {"train_loss": -42.14994812011719, "global_step": 350531, "epoch": 2896} {"train_loss": -42.994300842285156, "global_step": 350532, "epoch": 2896} {"train_loss": -42.8680534362793, "global_step": 350533, "epoch": 2896} {"train_loss": -43.28219223022461, "global_step": 350534, "epoch": 2896} {"train_loss": -42.87299728393555, "global_step": 350535, "epoch": 2896} {"train_loss": -42.91924175546189, "global_step": 350536, "epoch": 2896, "val_loss": 2744715.0} {"train_loss": -43.26789093017578, "global_step": 350537, "epoch": 2897} {"train_loss": -43.409786224365234, "global_step": 350538, "epoch": 2897} {"train_loss": -41.949928283691406, "global_step": 350539, "epoch": 2897} {"train_loss": -42.87778854370117, "global_step": 350540, "epoch": 2897} {"train_loss": -43.323360443115234, "global_step": 350541, "epoch": 2897} {"train_loss": -43.29671096801758, "global_step": 350542, "epoch": 2897} {"train_loss": -42.85987091064453, "global_step": 350543, "epoch": 2897} {"train_loss": -43.189796447753906, "global_step": 350544, "epoch": 2897} {"train_loss": -43.04677963256836, "global_step": 350545, "epoch": 2897} {"train_loss": -43.968502044677734, "global_step": 350546, "epoch": 2897} {"train_loss": -43.46014404296875, "global_step": 350547, "epoch": 2897} {"train_loss": -43.410640716552734, "global_step": 350548, "epoch": 2897} {"train_loss": -43.5639762878418, "global_step": 350549, "epoch": 2897} {"train_loss": -43.76774215698242, "global_step": 350550, "epoch": 2897} {"train_loss": -43.95101547241211, "global_step": 350551, "epoch": 2897} {"train_loss": -43.85913848876953, "global_step": 350552, "epoch": 2897} {"train_loss": -43.084617614746094, "global_step": 350553, "epoch": 2897} {"train_loss": -44.25020217895508, "global_step": 350554, "epoch": 2897} {"train_loss": -43.94474411010742, "global_step": 350555, "epoch": 2897} {"train_loss": -44.25627517700195, "global_step": 350556, "epoch": 2897} {"train_loss": -43.27474594116211, "global_step": 350557, "epoch": 2897} {"train_loss": -44.107826232910156, "global_step": 350558, "epoch": 2897} {"train_loss": -44.16059112548828, "global_step": 350559, "epoch": 2897} {"train_loss": -44.10445022583008, "global_step": 350560, "epoch": 2897} {"train_loss": -44.45624923706055, "global_step": 350561, "epoch": 2897} {"train_loss": -43.901641845703125, "global_step": 350562, "epoch": 2897} {"train_loss": -44.110347747802734, "global_step": 350563, "epoch": 2897} {"train_loss": -44.24592590332031, "global_step": 350564, "epoch": 2897} {"train_loss": -44.09880447387695, "global_step": 350565, "epoch": 2897} {"train_loss": -43.27632522583008, "global_step": 350566, "epoch": 2897} {"train_loss": -44.17377853393555, "global_step": 350567, "epoch": 2897} {"train_loss": -43.478126525878906, "global_step": 350568, "epoch": 2897} {"train_loss": -43.378299713134766, "global_step": 350569, "epoch": 2897} {"train_loss": -44.2074089050293, "global_step": 350570, "epoch": 2897} {"train_loss": -43.58967971801758, "global_step": 350571, "epoch": 2897} {"train_loss": -43.26933670043945, "global_step": 350572, "epoch": 2897} {"train_loss": -43.97343826293945, "global_step": 350573, "epoch": 2897} {"train_loss": -43.65055465698242, "global_step": 350574, "epoch": 2897} {"train_loss": -43.34022903442383, "global_step": 350575, "epoch": 2897} {"train_loss": -44.059139251708984, "global_step": 350576, "epoch": 2897} {"train_loss": -43.145721435546875, "global_step": 350577, "epoch": 2897} {"train_loss": -43.47539138793945, "global_step": 350578, "epoch": 2897} {"train_loss": -43.317176818847656, "global_step": 350579, "epoch": 2897} {"train_loss": -42.97974395751953, "global_step": 350580, "epoch": 2897} {"train_loss": -41.82113265991211, "global_step": 350581, "epoch": 2897} {"train_loss": -42.089290618896484, "global_step": 350582, "epoch": 2897} {"train_loss": -41.07487487792969, "global_step": 350583, "epoch": 2897} {"train_loss": -41.40486526489258, "global_step": 350584, "epoch": 2897} {"train_loss": -41.35138702392578, "global_step": 350585, "epoch": 2897} {"train_loss": -41.07611083984375, "global_step": 350586, "epoch": 2897} {"train_loss": -39.95280838012695, "global_step": 350587, "epoch": 2897} {"train_loss": -43.159034729003906, "global_step": 350588, "epoch": 2897} {"train_loss": -40.46428680419922, "global_step": 350589, "epoch": 2897} {"train_loss": -41.395259857177734, "global_step": 350590, "epoch": 2897} {"train_loss": -43.51678466796875, "global_step": 350591, "epoch": 2897} {"train_loss": -40.48390579223633, "global_step": 350592, "epoch": 2897} {"train_loss": -43.0604362487793, "global_step": 350593, "epoch": 2897} {"train_loss": -42.493499755859375, "global_step": 350594, "epoch": 2897} {"train_loss": -42.9062614440918, "global_step": 350595, "epoch": 2897} {"train_loss": -42.77485275268555, "global_step": 350596, "epoch": 2897} {"train_loss": -43.75132369995117, "global_step": 350597, "epoch": 2897} {"train_loss": -42.89852523803711, "global_step": 350598, "epoch": 2897} {"train_loss": -42.306819915771484, "global_step": 350599, "epoch": 2897} {"train_loss": -43.418148040771484, "global_step": 350600, "epoch": 2897} {"train_loss": -42.22274398803711, "global_step": 350601, "epoch": 2897} {"train_loss": -43.116737365722656, "global_step": 350602, "epoch": 2897} {"train_loss": -43.04679870605469, "global_step": 350603, "epoch": 2897} {"train_loss": -43.1533317565918, "global_step": 350604, "epoch": 2897} {"train_loss": -43.31562805175781, "global_step": 350605, "epoch": 2897} {"train_loss": -43.60533142089844, "global_step": 350606, "epoch": 2897} {"train_loss": -44.093475341796875, "global_step": 350607, "epoch": 2897} {"train_loss": -43.52155685424805, "global_step": 350608, "epoch": 2897} {"train_loss": -44.0131721496582, "global_step": 350609, "epoch": 2897} {"train_loss": -43.445777893066406, "global_step": 350610, "epoch": 2897} {"train_loss": -43.81414794921875, "global_step": 350611, "epoch": 2897} {"train_loss": -43.801639556884766, "global_step": 350612, "epoch": 2897} {"train_loss": -43.48752975463867, "global_step": 350613, "epoch": 2897} {"train_loss": -43.84457015991211, "global_step": 350614, "epoch": 2897} {"train_loss": -44.29269027709961, "global_step": 350615, "epoch": 2897} {"train_loss": -43.49920654296875, "global_step": 350616, "epoch": 2897} {"train_loss": -44.29175567626953, "global_step": 350617, "epoch": 2897} {"train_loss": -42.30754852294922, "global_step": 350618, "epoch": 2897} {"train_loss": -44.36628723144531, "global_step": 350619, "epoch": 2897} {"train_loss": -43.53193283081055, "global_step": 350620, "epoch": 2897} {"train_loss": -43.9795036315918, "global_step": 350621, "epoch": 2897} {"train_loss": -43.85792541503906, "global_step": 350622, "epoch": 2897} {"train_loss": -43.4072265625, "global_step": 350623, "epoch": 2897} {"train_loss": -44.33949661254883, "global_step": 350624, "epoch": 2897} {"train_loss": -42.99727249145508, "global_step": 350625, "epoch": 2897} {"train_loss": -42.555686950683594, "global_step": 350626, "epoch": 2897} {"train_loss": -43.58995819091797, "global_step": 350627, "epoch": 2897} {"train_loss": -42.52810287475586, "global_step": 350628, "epoch": 2897} {"train_loss": -44.239349365234375, "global_step": 350629, "epoch": 2897} {"train_loss": -43.44805908203125, "global_step": 350630, "epoch": 2897} {"train_loss": -42.57191848754883, "global_step": 350631, "epoch": 2897} {"train_loss": -44.030635833740234, "global_step": 350632, "epoch": 2897} {"train_loss": -41.190948486328125, "global_step": 350633, "epoch": 2897} {"train_loss": -44.50420379638672, "global_step": 350634, "epoch": 2897} {"train_loss": -43.923622131347656, "global_step": 350635, "epoch": 2897} {"train_loss": -45.14426803588867, "global_step": 350636, "epoch": 2897} {"train_loss": -42.952266693115234, "global_step": 350637, "epoch": 2897} {"train_loss": -43.962398529052734, "global_step": 350638, "epoch": 2897} {"train_loss": -43.896480560302734, "global_step": 350639, "epoch": 2897} {"train_loss": -43.78019332885742, "global_step": 350640, "epoch": 2897} {"train_loss": -44.40812683105469, "global_step": 350641, "epoch": 2897} {"train_loss": -44.00006866455078, "global_step": 350642, "epoch": 2897} {"train_loss": -43.82453155517578, "global_step": 350643, "epoch": 2897} {"train_loss": -43.24323654174805, "global_step": 350644, "epoch": 2897} {"train_loss": -42.57894515991211, "global_step": 350645, "epoch": 2897} {"train_loss": -43.78181076049805, "global_step": 350646, "epoch": 2897} {"train_loss": -44.29401779174805, "global_step": 350647, "epoch": 2897} {"train_loss": -44.364437103271484, "global_step": 350648, "epoch": 2897} {"train_loss": -43.95272445678711, "global_step": 350649, "epoch": 2897} {"train_loss": -43.67047119140625, "global_step": 350650, "epoch": 2897} {"train_loss": -44.08486557006836, "global_step": 350651, "epoch": 2897} {"train_loss": -42.26948547363281, "global_step": 350652, "epoch": 2897} {"train_loss": -44.202877044677734, "global_step": 350653, "epoch": 2897} {"train_loss": -44.03950881958008, "global_step": 350654, "epoch": 2897} {"train_loss": -43.563072204589844, "global_step": 350655, "epoch": 2897} {"train_loss": -43.18020248413086, "global_step": 350656, "epoch": 2897} {"train_loss": -43.33576728883854, "global_step": 350657, "epoch": 2897, "val_loss": 2677080.0} {"train_loss": -43.38600540161133, "global_step": 350658, "epoch": 2898} {"train_loss": -44.35813522338867, "global_step": 350659, "epoch": 2898} {"train_loss": -43.89765930175781, "global_step": 350660, "epoch": 2898} {"train_loss": -43.7728157043457, "global_step": 350661, "epoch": 2898} {"train_loss": -42.61310577392578, "global_step": 350662, "epoch": 2898} {"train_loss": -44.208805084228516, "global_step": 350663, "epoch": 2898} {"train_loss": -42.169769287109375, "global_step": 350664, "epoch": 2898} {"train_loss": -44.1849479675293, "global_step": 350665, "epoch": 2898} {"train_loss": -44.32014846801758, "global_step": 350666, "epoch": 2898} {"train_loss": -44.21847152709961, "global_step": 350667, "epoch": 2898} {"train_loss": -43.764434814453125, "global_step": 350668, "epoch": 2898} {"train_loss": -43.833187103271484, "global_step": 350669, "epoch": 2898} {"train_loss": -38.8410758972168, "global_step": 350670, "epoch": 2898} {"train_loss": -43.0277099609375, "global_step": 350671, "epoch": 2898} {"train_loss": -42.83878707885742, "global_step": 350672, "epoch": 2898} {"train_loss": -43.63839340209961, "global_step": 350673, "epoch": 2898} {"train_loss": -43.566158294677734, "global_step": 350674, "epoch": 2898} {"train_loss": -38.7171630859375, "global_step": 350675, "epoch": 2898} {"train_loss": -43.91229248046875, "global_step": 350676, "epoch": 2898} {"train_loss": -44.374813079833984, "global_step": 350677, "epoch": 2898} {"train_loss": -44.41432571411133, "global_step": 350678, "epoch": 2898} {"train_loss": -43.42512893676758, "global_step": 350679, "epoch": 2898} {"train_loss": -42.14130401611328, "global_step": 350680, "epoch": 2898} {"train_loss": -42.07020568847656, "global_step": 350681, "epoch": 2898} {"train_loss": -34.123897552490234, "global_step": 350682, "epoch": 2898} {"train_loss": -42.20064926147461, "global_step": 350683, "epoch": 2898} {"train_loss": -42.19427490234375, "global_step": 350684, "epoch": 2898} {"train_loss": -36.536842346191406, "global_step": 350685, "epoch": 2898} {"train_loss": -40.98945999145508, "global_step": 350686, "epoch": 2898} {"train_loss": -43.402889251708984, "global_step": 350687, "epoch": 2898} {"train_loss": -43.19643020629883, "global_step": 350688, "epoch": 2898} {"train_loss": -41.93913269042969, "global_step": 350689, "epoch": 2898} {"train_loss": -42.65106964111328, "global_step": 350690, "epoch": 2898} {"train_loss": -34.98392868041992, "global_step": 350691, "epoch": 2898} {"train_loss": -40.08063888549805, "global_step": 350692, "epoch": 2898} {"train_loss": -41.32526779174805, "global_step": 350693, "epoch": 2898} {"train_loss": -38.69879913330078, "global_step": 350694, "epoch": 2898} {"train_loss": -38.07680130004883, "global_step": 350695, "epoch": 2898} {"train_loss": -42.96896743774414, "global_step": 350696, "epoch": 2898} {"train_loss": -38.00973129272461, "global_step": 350697, "epoch": 2898} {"train_loss": -40.09528732299805, "global_step": 350698, "epoch": 2898} {"train_loss": -42.92832565307617, "global_step": 350699, "epoch": 2898} {"train_loss": -39.934303283691406, "global_step": 350700, "epoch": 2898} {"train_loss": -42.69331741333008, "global_step": 350701, "epoch": 2898} {"train_loss": -39.55683898925781, "global_step": 350702, "epoch": 2898} {"train_loss": -41.5278205871582, "global_step": 350703, "epoch": 2898} {"train_loss": -41.03713607788086, "global_step": 350704, "epoch": 2898} {"train_loss": -42.32217025756836, "global_step": 350705, "epoch": 2898} {"train_loss": -41.802490234375, "global_step": 350706, "epoch": 2898} {"train_loss": -43.16425704956055, "global_step": 350707, "epoch": 2898} {"train_loss": -42.08443069458008, "global_step": 350708, "epoch": 2898} {"train_loss": -42.15925598144531, "global_step": 350709, "epoch": 2898} {"train_loss": -36.19463348388672, "global_step": 350710, "epoch": 2898} {"train_loss": -42.77387237548828, "global_step": 350711, "epoch": 2898} {"train_loss": -42.500465393066406, "global_step": 350712, "epoch": 2898} {"train_loss": -41.51983642578125, "global_step": 350713, "epoch": 2898} {"train_loss": -42.592105865478516, "global_step": 350714, "epoch": 2898} {"train_loss": -42.69091033935547, "global_step": 350715, "epoch": 2898} {"train_loss": -43.43851089477539, "global_step": 350716, "epoch": 2898} {"train_loss": -40.88055419921875, "global_step": 350717, "epoch": 2898} {"train_loss": -41.74053955078125, "global_step": 350718, "epoch": 2898} {"train_loss": -41.04350662231445, "global_step": 350719, "epoch": 2898} {"train_loss": -42.33161926269531, "global_step": 350720, "epoch": 2898} {"train_loss": -42.012939453125, "global_step": 350721, "epoch": 2898} {"train_loss": -43.19828414916992, "global_step": 350722, "epoch": 2898} {"train_loss": -42.79964065551758, "global_step": 350723, "epoch": 2898} {"train_loss": -42.6135139465332, "global_step": 350724, "epoch": 2898} {"train_loss": -43.49404525756836, "global_step": 350725, "epoch": 2898} {"train_loss": -43.720855712890625, "global_step": 350726, "epoch": 2898} {"train_loss": -43.55869674682617, "global_step": 350727, "epoch": 2898} {"train_loss": -40.5598030090332, "global_step": 350728, "epoch": 2898} {"train_loss": -43.2592887878418, "global_step": 350729, "epoch": 2898} {"train_loss": -42.77539825439453, "global_step": 350730, "epoch": 2898} {"train_loss": -41.1807861328125, "global_step": 350731, "epoch": 2898} {"train_loss": -40.190834045410156, "global_step": 350732, "epoch": 2898} {"train_loss": -42.6098518371582, "global_step": 350733, "epoch": 2898} {"train_loss": -43.1259880065918, "global_step": 350734, "epoch": 2898} {"train_loss": -42.77583694458008, "global_step": 350735, "epoch": 2898} {"train_loss": -43.073341369628906, "global_step": 350736, "epoch": 2898} {"train_loss": -43.43972396850586, "global_step": 350737, "epoch": 2898} {"train_loss": -38.12053298950195, "global_step": 350738, "epoch": 2898} {"train_loss": -42.86159896850586, "global_step": 350739, "epoch": 2898} {"train_loss": -40.85190963745117, "global_step": 350740, "epoch": 2898} {"train_loss": -38.31220626831055, "global_step": 350741, "epoch": 2898} {"train_loss": -42.6594123840332, "global_step": 350742, "epoch": 2898} {"train_loss": -39.391231536865234, "global_step": 350743, "epoch": 2898} {"train_loss": -42.89345932006836, "global_step": 350744, "epoch": 2898} {"train_loss": -42.69755554199219, "global_step": 350745, "epoch": 2898} {"train_loss": -43.05171585083008, "global_step": 350746, "epoch": 2898} {"train_loss": -41.869136810302734, "global_step": 350747, "epoch": 2898} {"train_loss": -43.14439010620117, "global_step": 350748, "epoch": 2898} {"train_loss": -42.733551025390625, "global_step": 350749, "epoch": 2898} {"train_loss": -42.996795654296875, "global_step": 350750, "epoch": 2898} {"train_loss": -43.08466720581055, "global_step": 350751, "epoch": 2898} {"train_loss": -42.958465576171875, "global_step": 350752, "epoch": 2898} {"train_loss": -37.862281799316406, "global_step": 350753, "epoch": 2898} {"train_loss": -42.42641830444336, "global_step": 350754, "epoch": 2898} {"train_loss": -41.006160736083984, "global_step": 350755, "epoch": 2898} {"train_loss": -41.44458770751953, "global_step": 350756, "epoch": 2898} {"train_loss": -39.191036224365234, "global_step": 350757, "epoch": 2898} {"train_loss": -42.10079574584961, "global_step": 350758, "epoch": 2898} {"train_loss": -41.2061653137207, "global_step": 350759, "epoch": 2898} {"train_loss": -42.02360153198242, "global_step": 350760, "epoch": 2898} {"train_loss": -43.4141960144043, "global_step": 350761, "epoch": 2898} {"train_loss": -43.4288330078125, "global_step": 350762, "epoch": 2898} {"train_loss": -42.918800354003906, "global_step": 350763, "epoch": 2898} {"train_loss": -43.33674240112305, "global_step": 350764, "epoch": 2898} {"train_loss": -41.85828399658203, "global_step": 350765, "epoch": 2898} {"train_loss": -43.455482482910156, "global_step": 350766, "epoch": 2898} {"train_loss": -41.4594612121582, "global_step": 350767, "epoch": 2898} {"train_loss": -42.88991928100586, "global_step": 350768, "epoch": 2898} {"train_loss": -43.44108200073242, "global_step": 350769, "epoch": 2898} {"train_loss": -42.06324768066406, "global_step": 350770, "epoch": 2898} {"train_loss": -42.7702751159668, "global_step": 350771, "epoch": 2898} {"train_loss": -43.72676086425781, "global_step": 350772, "epoch": 2898} {"train_loss": -43.7751579284668, "global_step": 350773, "epoch": 2898} {"train_loss": -42.46103286743164, "global_step": 350774, "epoch": 2898} {"train_loss": -43.60956573486328, "global_step": 350775, "epoch": 2898} {"train_loss": -43.802284240722656, "global_step": 350776, "epoch": 2898} {"train_loss": -42.94771194458008, "global_step": 350777, "epoch": 2898} {"train_loss": -42.05051939152489, "global_step": 350778, "epoch": 2898, "val_loss": 2656064.75} {"train_loss": -43.141029357910156, "global_step": 350779, "epoch": 2899} {"train_loss": -43.674312591552734, "global_step": 350780, "epoch": 2899} {"train_loss": -43.5594367980957, "global_step": 350781, "epoch": 2899} {"train_loss": -41.98038864135742, "global_step": 350782, "epoch": 2899} {"train_loss": -43.447994232177734, "global_step": 350783, "epoch": 2899} {"train_loss": -43.98989486694336, "global_step": 350784, "epoch": 2899} {"train_loss": -44.074771881103516, "global_step": 350785, "epoch": 2899} {"train_loss": -43.05423355102539, "global_step": 350786, "epoch": 2899} {"train_loss": -44.05955123901367, "global_step": 350787, "epoch": 2899} {"train_loss": -43.201332092285156, "global_step": 350788, "epoch": 2899} {"train_loss": -43.2243766784668, "global_step": 350789, "epoch": 2899} {"train_loss": -43.597450256347656, "global_step": 350790, "epoch": 2899} {"train_loss": -43.9735221862793, "global_step": 350791, "epoch": 2899} {"train_loss": -42.21049118041992, "global_step": 350792, "epoch": 2899} {"train_loss": -44.08443832397461, "global_step": 350793, "epoch": 2899} {"train_loss": -43.386409759521484, "global_step": 350794, "epoch": 2899} {"train_loss": -44.6473503112793, "global_step": 350795, "epoch": 2899} {"train_loss": -43.9992790222168, "global_step": 350796, "epoch": 2899} {"train_loss": -42.84601593017578, "global_step": 350797, "epoch": 2899} {"train_loss": -43.54450988769531, "global_step": 350798, "epoch": 2899} {"train_loss": -43.85677719116211, "global_step": 350799, "epoch": 2899} {"train_loss": -44.0340576171875, "global_step": 350800, "epoch": 2899} {"train_loss": -44.19108963012695, "global_step": 350801, "epoch": 2899} {"train_loss": -44.05894470214844, "global_step": 350802, "epoch": 2899} {"train_loss": -44.33815383911133, "global_step": 350803, "epoch": 2899} {"train_loss": -43.92341613769531, "global_step": 350804, "epoch": 2899} {"train_loss": -43.387367248535156, "global_step": 350805, "epoch": 2899} {"train_loss": -43.76832962036133, "global_step": 350806, "epoch": 2899} {"train_loss": -44.0829963684082, "global_step": 350807, "epoch": 2899} {"train_loss": -43.757301330566406, "global_step": 350808, "epoch": 2899} {"train_loss": -43.50735092163086, "global_step": 350809, "epoch": 2899} {"train_loss": -43.41643142700195, "global_step": 350810, "epoch": 2899} {"train_loss": -44.514347076416016, "global_step": 350811, "epoch": 2899} {"train_loss": -43.62675094604492, "global_step": 350812, "epoch": 2899} {"train_loss": -44.413082122802734, "global_step": 350813, "epoch": 2899} {"train_loss": -43.32786560058594, "global_step": 350814, "epoch": 2899} {"train_loss": -43.689212799072266, "global_step": 350815, "epoch": 2899} {"train_loss": -43.533912658691406, "global_step": 350816, "epoch": 2899} {"train_loss": -44.44850540161133, "global_step": 350817, "epoch": 2899} {"train_loss": -42.531795501708984, "global_step": 350818, "epoch": 2899} {"train_loss": -43.92042922973633, "global_step": 350819, "epoch": 2899} {"train_loss": -44.52804183959961, "global_step": 350820, "epoch": 2899} {"train_loss": -44.4677734375, "global_step": 350821, "epoch": 2899} {"train_loss": -43.983741760253906, "global_step": 350822, "epoch": 2899} {"train_loss": -44.7191047668457, "global_step": 350823, "epoch": 2899} {"train_loss": -44.19081497192383, "global_step": 350824, "epoch": 2899} {"train_loss": -43.536502838134766, "global_step": 350825, "epoch": 2899} {"train_loss": -44.14133834838867, "global_step": 350826, "epoch": 2899} {"train_loss": -44.16688537597656, "global_step": 350827, "epoch": 2899} {"train_loss": -43.306453704833984, "global_step": 350828, "epoch": 2899} {"train_loss": -44.08726119995117, "global_step": 350829, "epoch": 2899} {"train_loss": -43.62010192871094, "global_step": 350830, "epoch": 2899} {"train_loss": -43.15568161010742, "global_step": 350831, "epoch": 2899} {"train_loss": -42.430389404296875, "global_step": 350832, "epoch": 2899} {"train_loss": -42.82929992675781, "global_step": 350833, "epoch": 2899} {"train_loss": -41.20074462890625, "global_step": 350834, "epoch": 2899} {"train_loss": -40.98574447631836, "global_step": 350835, "epoch": 2899} {"train_loss": -40.923744201660156, "global_step": 350836, "epoch": 2899} {"train_loss": -43.3775749206543, "global_step": 350837, "epoch": 2899} {"train_loss": -42.22489547729492, "global_step": 350838, "epoch": 2899} {"train_loss": -41.82992172241211, "global_step": 350839, "epoch": 2899} {"train_loss": -40.13974380493164, "global_step": 350840, "epoch": 2899} {"train_loss": -41.475677490234375, "global_step": 350841, "epoch": 2899} {"train_loss": -39.65839767456055, "global_step": 350842, "epoch": 2899} {"train_loss": -41.58685302734375, "global_step": 350843, "epoch": 2899} {"train_loss": -42.27371597290039, "global_step": 350844, "epoch": 2899} {"train_loss": -40.70401382446289, "global_step": 350845, "epoch": 2899} {"train_loss": -41.787132263183594, "global_step": 350846, "epoch": 2899} {"train_loss": -43.15190124511719, "global_step": 350847, "epoch": 2899} {"train_loss": -42.1801643371582, "global_step": 350848, "epoch": 2899} {"train_loss": -42.30397415161133, "global_step": 350849, "epoch": 2899} {"train_loss": -43.357421875, "global_step": 350850, "epoch": 2899} {"train_loss": -42.78202438354492, "global_step": 350851, "epoch": 2899} {"train_loss": -41.4061393737793, "global_step": 350852, "epoch": 2899} {"train_loss": -43.52055740356445, "global_step": 350853, "epoch": 2899} {"train_loss": -42.138336181640625, "global_step": 350854, "epoch": 2899} {"train_loss": -41.58731460571289, "global_step": 350855, "epoch": 2899} {"train_loss": -43.39723587036133, "global_step": 350856, "epoch": 2899} {"train_loss": -42.40289306640625, "global_step": 350857, "epoch": 2899} {"train_loss": -41.378578186035156, "global_step": 350858, "epoch": 2899} {"train_loss": -43.019840240478516, "global_step": 350859, "epoch": 2899} {"train_loss": -42.600250244140625, "global_step": 350860, "epoch": 2899} {"train_loss": -43.43204116821289, "global_step": 350861, "epoch": 2899} {"train_loss": -43.31229019165039, "global_step": 350862, "epoch": 2899} {"train_loss": -43.89218521118164, "global_step": 350863, "epoch": 2899} {"train_loss": -43.47193145751953, "global_step": 350864, "epoch": 2899} {"train_loss": -43.24412536621094, "global_step": 350865, "epoch": 2899} {"train_loss": -43.09736251831055, "global_step": 350866, "epoch": 2899} {"train_loss": -44.11991882324219, "global_step": 350867, "epoch": 2899} {"train_loss": -43.1668701171875, "global_step": 350868, "epoch": 2899} {"train_loss": -43.4362907409668, "global_step": 350869, "epoch": 2899} {"train_loss": -43.24593734741211, "global_step": 350870, "epoch": 2899} {"train_loss": -43.65339279174805, "global_step": 350871, "epoch": 2899} {"train_loss": -43.644771575927734, "global_step": 350872, "epoch": 2899} {"train_loss": -44.31592559814453, "global_step": 350873, "epoch": 2899} {"train_loss": -44.35015106201172, "global_step": 350874, "epoch": 2899} {"train_loss": -44.119869232177734, "global_step": 350875, "epoch": 2899} {"train_loss": -44.20060348510742, "global_step": 350876, "epoch": 2899} {"train_loss": -43.718414306640625, "global_step": 350877, "epoch": 2899} {"train_loss": -44.114990234375, "global_step": 350878, "epoch": 2899} {"train_loss": -43.45124053955078, "global_step": 350879, "epoch": 2899} {"train_loss": -44.040897369384766, "global_step": 350880, "epoch": 2899} {"train_loss": -44.16007614135742, "global_step": 350881, "epoch": 2899} {"train_loss": -43.509918212890625, "global_step": 350882, "epoch": 2899} {"train_loss": -43.99554443359375, "global_step": 350883, "epoch": 2899} {"train_loss": -44.25655746459961, "global_step": 350884, "epoch": 2899} {"train_loss": -43.91493606567383, "global_step": 350885, "epoch": 2899} {"train_loss": -44.11587142944336, "global_step": 350886, "epoch": 2899} {"train_loss": -44.02684020996094, "global_step": 350887, "epoch": 2899} {"train_loss": -43.66597366333008, "global_step": 350888, "epoch": 2899} {"train_loss": -43.25439453125, "global_step": 350889, "epoch": 2899} {"train_loss": -44.2313346862793, "global_step": 350890, "epoch": 2899} {"train_loss": -44.37343215942383, "global_step": 350891, "epoch": 2899} {"train_loss": -44.021846771240234, "global_step": 350892, "epoch": 2899} {"train_loss": -43.53913497924805, "global_step": 350893, "epoch": 2899} {"train_loss": -43.74031448364258, "global_step": 350894, "epoch": 2899} {"train_loss": -44.05878829956055, "global_step": 350895, "epoch": 2899} {"train_loss": -44.43232727050781, "global_step": 350896, "epoch": 2899} {"train_loss": -43.73398971557617, "global_step": 350897, "epoch": 2899} {"train_loss": -43.66776657104492, "global_step": 350898, "epoch": 2899} {"train_loss": -43.34720747135887, "global_step": 350899, "epoch": 2899, "val_loss": 2558001.25} {"train_loss": -43.936134338378906, "global_step": 350900, "epoch": 2900} {"train_loss": -43.305328369140625, "global_step": 350901, "epoch": 2900} {"train_loss": -42.54195785522461, "global_step": 350902, "epoch": 2900} {"train_loss": -42.28826904296875, "global_step": 350903, "epoch": 2900} {"train_loss": -44.03596496582031, "global_step": 350904, "epoch": 2900} {"train_loss": -43.6421012878418, "global_step": 350905, "epoch": 2900} {"train_loss": -44.27004623413086, "global_step": 350906, "epoch": 2900} {"train_loss": -44.459991455078125, "global_step": 350907, "epoch": 2900} {"train_loss": -42.05111312866211, "global_step": 350908, "epoch": 2900} {"train_loss": -41.880157470703125, "global_step": 350909, "epoch": 2900} {"train_loss": -43.528160095214844, "global_step": 350910, "epoch": 2900} {"train_loss": -44.098262786865234, "global_step": 350911, "epoch": 2900} {"train_loss": -43.88905715942383, "global_step": 350912, "epoch": 2900} {"train_loss": -43.38320541381836, "global_step": 350913, "epoch": 2900} {"train_loss": -43.9239387512207, "global_step": 350914, "epoch": 2900} {"train_loss": -43.918453216552734, "global_step": 350915, "epoch": 2900} {"train_loss": -43.238895416259766, "global_step": 350916, "epoch": 2900} {"train_loss": -42.5528678894043, "global_step": 350917, "epoch": 2900} {"train_loss": -40.79981994628906, "global_step": 350918, "epoch": 2900} {"train_loss": -42.197669982910156, "global_step": 350919, "epoch": 2900} {"train_loss": -41.61368942260742, "global_step": 350920, "epoch": 2900} {"train_loss": -41.4991455078125, "global_step": 350921, "epoch": 2900} {"train_loss": -43.18746566772461, "global_step": 350922, "epoch": 2900} {"train_loss": -43.306251525878906, "global_step": 350923, "epoch": 2900} {"train_loss": -41.13204574584961, "global_step": 350924, "epoch": 2900} {"train_loss": -41.430076599121094, "global_step": 350925, "epoch": 2900} {"train_loss": -43.21987533569336, "global_step": 350926, "epoch": 2900} {"train_loss": -42.87150573730469, "global_step": 350927, "epoch": 2900} {"train_loss": -42.55794906616211, "global_step": 350928, "epoch": 2900} {"train_loss": -42.5464973449707, "global_step": 350929, "epoch": 2900} {"train_loss": -43.591400146484375, "global_step": 350930, "epoch": 2900} {"train_loss": -40.81828689575195, "global_step": 350931, "epoch": 2900} {"train_loss": -40.954925537109375, "global_step": 350932, "epoch": 2900} {"train_loss": -43.32340621948242, "global_step": 350933, "epoch": 2900} {"train_loss": -42.347991943359375, "global_step": 350934, "epoch": 2900} {"train_loss": -42.737815856933594, "global_step": 350935, "epoch": 2900} {"train_loss": -43.41162109375, "global_step": 350936, "epoch": 2900} {"train_loss": -42.744590759277344, "global_step": 350937, "epoch": 2900} {"train_loss": -42.807559967041016, "global_step": 350938, "epoch": 2900} {"train_loss": -43.46733093261719, "global_step": 350939, "epoch": 2900} {"train_loss": -43.76494216918945, "global_step": 350940, "epoch": 2900} {"train_loss": -43.441993713378906, "global_step": 350941, "epoch": 2900} {"train_loss": -42.42226791381836, "global_step": 350942, "epoch": 2900} {"train_loss": -42.925899505615234, "global_step": 350943, "epoch": 2900} {"train_loss": -44.04024124145508, "global_step": 350944, "epoch": 2900} {"train_loss": -41.93353271484375, "global_step": 350945, "epoch": 2900} {"train_loss": -42.93742752075195, "global_step": 350946, "epoch": 2900} {"train_loss": -43.563228607177734, "global_step": 350947, "epoch": 2900} {"train_loss": -43.62435531616211, "global_step": 350948, "epoch": 2900} {"train_loss": -43.41585922241211, "global_step": 350949, "epoch": 2900} {"train_loss": -43.85530471801758, "global_step": 350950, "epoch": 2900} {"train_loss": -43.522457122802734, "global_step": 350951, "epoch": 2900} {"train_loss": -43.91228103637695, "global_step": 350952, "epoch": 2900} {"train_loss": -41.8102912902832, "global_step": 350953, "epoch": 2900} {"train_loss": -43.02116012573242, "global_step": 350954, "epoch": 2900} {"train_loss": -43.82249069213867, "global_step": 350955, "epoch": 2900} {"train_loss": -43.41691970825195, "global_step": 350956, "epoch": 2900} {"train_loss": -42.70154571533203, "global_step": 350957, "epoch": 2900} {"train_loss": -43.85970687866211, "global_step": 350958, "epoch": 2900} {"train_loss": -42.19734191894531, "global_step": 350959, "epoch": 2900} {"train_loss": -37.898136138916016, "global_step": 350960, "epoch": 2900} {"train_loss": -43.2933235168457, "global_step": 350961, "epoch": 2900} {"train_loss": -43.61344528198242, "global_step": 350962, "epoch": 2900} {"train_loss": -42.79855728149414, "global_step": 350963, "epoch": 2900} {"train_loss": -42.11989974975586, "global_step": 350964, "epoch": 2900} {"train_loss": -43.013343811035156, "global_step": 350965, "epoch": 2900} {"train_loss": -42.66035842895508, "global_step": 350966, "epoch": 2900} {"train_loss": -43.698795318603516, "global_step": 350967, "epoch": 2900} {"train_loss": -43.537696838378906, "global_step": 350968, "epoch": 2900} {"train_loss": -43.40570068359375, "global_step": 350969, "epoch": 2900} {"train_loss": -43.40350341796875, "global_step": 350970, "epoch": 2900} {"train_loss": -37.7577018737793, "global_step": 350971, "epoch": 2900} {"train_loss": -43.963623046875, "global_step": 350972, "epoch": 2900} {"train_loss": -42.69574737548828, "global_step": 350973, "epoch": 2900} {"train_loss": -43.73362350463867, "global_step": 350974, "epoch": 2900} {"train_loss": -43.3452262878418, "global_step": 350975, "epoch": 2900} {"train_loss": -43.519371032714844, "global_step": 350976, "epoch": 2900} {"train_loss": -43.89598083496094, "global_step": 350977, "epoch": 2900} {"train_loss": -43.35860824584961, "global_step": 350978, "epoch": 2900} {"train_loss": -43.94773864746094, "global_step": 350979, "epoch": 2900} {"train_loss": -44.35317611694336, "global_step": 350980, "epoch": 2900} {"train_loss": -44.329341888427734, "global_step": 350981, "epoch": 2900} {"train_loss": -39.68888473510742, "global_step": 350982, "epoch": 2900} {"train_loss": -44.036067962646484, "global_step": 350983, "epoch": 2900} {"train_loss": -41.913734436035156, "global_step": 350984, "epoch": 2900} {"train_loss": -44.381072998046875, "global_step": 350985, "epoch": 2900} {"train_loss": -43.83008575439453, "global_step": 350986, "epoch": 2900} {"train_loss": -44.234981536865234, "global_step": 350987, "epoch": 2900} {"train_loss": -44.3443603515625, "global_step": 350988, "epoch": 2900} {"train_loss": -43.29728317260742, "global_step": 350989, "epoch": 2900} {"train_loss": -44.18391418457031, "global_step": 350990, "epoch": 2900} {"train_loss": -44.06472396850586, "global_step": 350991, "epoch": 2900} {"train_loss": -44.33673858642578, "global_step": 350992, "epoch": 2900} {"train_loss": -44.339752197265625, "global_step": 350993, "epoch": 2900} {"train_loss": -44.23273849487305, "global_step": 350994, "epoch": 2900} {"train_loss": -43.73747253417969, "global_step": 350995, "epoch": 2900} {"train_loss": -44.68428039550781, "global_step": 350996, "epoch": 2900} {"train_loss": -38.60863494873047, "global_step": 350997, "epoch": 2900} {"train_loss": -44.382503509521484, "global_step": 350998, "epoch": 2900} {"train_loss": -43.79598617553711, "global_step": 350999, "epoch": 2900} {"train_loss": -44.16156005859375, "global_step": 351000, "epoch": 2900} {"train_loss": -44.736202239990234, "global_step": 351001, "epoch": 2900} {"train_loss": -40.28042221069336, "global_step": 351002, "epoch": 2900} {"train_loss": -44.22686767578125, "global_step": 351003, "epoch": 2900} {"train_loss": -44.88875961303711, "global_step": 351004, "epoch": 2900} {"train_loss": -43.986507415771484, "global_step": 351005, "epoch": 2900} {"train_loss": -43.77784729003906, "global_step": 351006, "epoch": 2900} {"train_loss": -43.58922576904297, "global_step": 351007, "epoch": 2900} {"train_loss": -43.76892852783203, "global_step": 351008, "epoch": 2900} {"train_loss": -44.241241455078125, "global_step": 351009, "epoch": 2900} {"train_loss": -44.106624603271484, "global_step": 351010, "epoch": 2900} {"train_loss": -43.37606430053711, "global_step": 351011, "epoch": 2900} {"train_loss": -43.455440521240234, "global_step": 351012, "epoch": 2900} {"train_loss": -44.48200607299805, "global_step": 351013, "epoch": 2900} {"train_loss": -44.7834358215332, "global_step": 351014, "epoch": 2900} {"train_loss": -44.3231086730957, "global_step": 351015, "epoch": 2900} {"train_loss": -43.944889068603516, "global_step": 351016, "epoch": 2900} {"train_loss": -45.07099533081055, "global_step": 351017, "epoch": 2900} {"train_loss": -44.40092849731445, "global_step": 351018, "epoch": 2900} {"train_loss": -44.37104415893555, "global_step": 351019, "epoch": 2900} {"train_loss": -43.213046207900874, "global_step": 351020, "epoch": 2900, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 1.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 1.0, "val_loss": 2605171.25} {"train_loss": -44.253135681152344, "global_step": 351021, "epoch": 2901} {"train_loss": -44.595497131347656, "global_step": 351022, "epoch": 2901} {"train_loss": -44.62577438354492, "global_step": 351023, "epoch": 2901} {"train_loss": -42.990108489990234, "global_step": 351024, "epoch": 2901} {"train_loss": -44.91109848022461, "global_step": 351025, "epoch": 2901} {"train_loss": -44.14813995361328, "global_step": 351026, "epoch": 2901} {"train_loss": -42.793514251708984, "global_step": 351027, "epoch": 2901} {"train_loss": -44.045021057128906, "global_step": 351028, "epoch": 2901} {"train_loss": -44.392547607421875, "global_step": 351029, "epoch": 2901} {"train_loss": -42.60935592651367, "global_step": 351030, "epoch": 2901} {"train_loss": -42.37703323364258, "global_step": 351031, "epoch": 2901} {"train_loss": -44.095726013183594, "global_step": 351032, "epoch": 2901} {"train_loss": -42.90837860107422, "global_step": 351033, "epoch": 2901} {"train_loss": -43.7385368347168, "global_step": 351034, "epoch": 2901} {"train_loss": -43.87481689453125, "global_step": 351035, "epoch": 2901} {"train_loss": -37.243309020996094, "global_step": 351036, "epoch": 2901} {"train_loss": -43.608642578125, "global_step": 351037, "epoch": 2901} {"train_loss": -42.74894332885742, "global_step": 351038, "epoch": 2901} {"train_loss": -43.96533203125, "global_step": 351039, "epoch": 2901} {"train_loss": -42.6244010925293, "global_step": 351040, "epoch": 2901} {"train_loss": -43.42599105834961, "global_step": 351041, "epoch": 2901} {"train_loss": -35.64815139770508, "global_step": 351042, "epoch": 2901} {"train_loss": -40.641963958740234, "global_step": 351043, "epoch": 2901} {"train_loss": -39.66988754272461, "global_step": 351044, "epoch": 2901} {"train_loss": -42.77802658081055, "global_step": 351045, "epoch": 2901} {"train_loss": -39.064449310302734, "global_step": 351046, "epoch": 2901} {"train_loss": -41.5135612487793, "global_step": 351047, "epoch": 2901} {"train_loss": -32.78483200073242, "global_step": 351048, "epoch": 2901} {"train_loss": -32.430294036865234, "global_step": 351049, "epoch": 2901} {"train_loss": -42.3039665222168, "global_step": 351050, "epoch": 2901} {"train_loss": -41.54800033569336, "global_step": 351051, "epoch": 2901} {"train_loss": -42.1122932434082, "global_step": 351052, "epoch": 2901} {"train_loss": -34.57101058959961, "global_step": 351053, "epoch": 2901} {"train_loss": -39.170433044433594, "global_step": 351054, "epoch": 2901} {"train_loss": -40.29478073120117, "global_step": 351055, "epoch": 2901} {"train_loss": -39.1163330078125, "global_step": 351056, "epoch": 2901} {"train_loss": -36.423545837402344, "global_step": 351057, "epoch": 2901} {"train_loss": -39.327510833740234, "global_step": 351058, "epoch": 2901} {"train_loss": -34.36088943481445, "global_step": 351059, "epoch": 2901} {"train_loss": -37.5643424987793, "global_step": 351060, "epoch": 2901} {"train_loss": -39.53672409057617, "global_step": 351061, "epoch": 2901} {"train_loss": -35.71364212036133, "global_step": 351062, "epoch": 2901} {"train_loss": -37.58942794799805, "global_step": 351063, "epoch": 2901} {"train_loss": -33.603302001953125, "global_step": 351064, "epoch": 2901} {"train_loss": -32.91497802734375, "global_step": 351065, "epoch": 2901} {"train_loss": -36.60715866088867, "global_step": 351066, "epoch": 2901} {"train_loss": -38.87307357788086, "global_step": 351067, "epoch": 2901} {"train_loss": -36.18832778930664, "global_step": 351068, "epoch": 2901} {"train_loss": -33.108253479003906, "global_step": 351069, "epoch": 2901} {"train_loss": -34.42814636230469, "global_step": 351070, "epoch": 2901} {"train_loss": -38.24665451049805, "global_step": 351071, "epoch": 2901} {"train_loss": -34.988826751708984, "global_step": 351072, "epoch": 2901} {"train_loss": -33.241920471191406, "global_step": 351073, "epoch": 2901} {"train_loss": -37.83076095581055, "global_step": 351074, "epoch": 2901} {"train_loss": -38.88206481933594, "global_step": 351075, "epoch": 2901} {"train_loss": -37.74982833862305, "global_step": 351076, "epoch": 2901} {"train_loss": -35.83451461791992, "global_step": 351077, "epoch": 2901} {"train_loss": -38.96250534057617, "global_step": 351078, "epoch": 2901} {"train_loss": -38.99495315551758, "global_step": 351079, "epoch": 2901} {"train_loss": -40.925506591796875, "global_step": 351080, "epoch": 2901} {"train_loss": -39.91090774536133, "global_step": 351081, "epoch": 2901} {"train_loss": -40.85312271118164, "global_step": 351082, "epoch": 2901} {"train_loss": -39.6253776550293, "global_step": 351083, "epoch": 2901} {"train_loss": -40.01518630981445, "global_step": 351084, "epoch": 2901} {"train_loss": -39.828426361083984, "global_step": 351085, "epoch": 2901} {"train_loss": -40.130794525146484, "global_step": 351086, "epoch": 2901} {"train_loss": -37.666961669921875, "global_step": 351087, "epoch": 2901} {"train_loss": -39.08751678466797, "global_step": 351088, "epoch": 2901} {"train_loss": -40.48258590698242, "global_step": 351089, "epoch": 2901} {"train_loss": -40.23231506347656, "global_step": 351090, "epoch": 2901} {"train_loss": -39.445186614990234, "global_step": 351091, "epoch": 2901} {"train_loss": -40.155155181884766, "global_step": 351092, "epoch": 2901} {"train_loss": -40.017887115478516, "global_step": 351093, "epoch": 2901} {"train_loss": -40.7265510559082, "global_step": 351094, "epoch": 2901} {"train_loss": -39.38820266723633, "global_step": 351095, "epoch": 2901} {"train_loss": -40.40317153930664, "global_step": 351096, "epoch": 2901} {"train_loss": -41.39601135253906, "global_step": 351097, "epoch": 2901} {"train_loss": -40.50396728515625, "global_step": 351098, "epoch": 2901} {"train_loss": -41.40224838256836, "global_step": 351099, "epoch": 2901} {"train_loss": -40.253257751464844, "global_step": 351100, "epoch": 2901} {"train_loss": -40.45341110229492, "global_step": 351101, "epoch": 2901} {"train_loss": -41.2164306640625, "global_step": 351102, "epoch": 2901} {"train_loss": -40.24336242675781, "global_step": 351103, "epoch": 2901} {"train_loss": -41.074127197265625, "global_step": 351104, "epoch": 2901} {"train_loss": -41.10162353515625, "global_step": 351105, "epoch": 2901} {"train_loss": -41.60952377319336, "global_step": 351106, "epoch": 2901} {"train_loss": -41.6483268737793, "global_step": 351107, "epoch": 2901} {"train_loss": -41.75654602050781, "global_step": 351108, "epoch": 2901} {"train_loss": -41.63605499267578, "global_step": 351109, "epoch": 2901} {"train_loss": -41.88248825073242, "global_step": 351110, "epoch": 2901} {"train_loss": -41.49949264526367, "global_step": 351111, "epoch": 2901} {"train_loss": -41.77482986450195, "global_step": 351112, "epoch": 2901} {"train_loss": -41.74806213378906, "global_step": 351113, "epoch": 2901} {"train_loss": -42.09761047363281, "global_step": 351114, "epoch": 2901} {"train_loss": -41.60163116455078, "global_step": 351115, "epoch": 2901} {"train_loss": -41.873104095458984, "global_step": 351116, "epoch": 2901} {"train_loss": -41.876625061035156, "global_step": 351117, "epoch": 2901} {"train_loss": -41.69035720825195, "global_step": 351118, "epoch": 2901} {"train_loss": -41.574642181396484, "global_step": 351119, "epoch": 2901} {"train_loss": -42.41127395629883, "global_step": 351120, "epoch": 2901} {"train_loss": -41.64762496948242, "global_step": 351121, "epoch": 2901} {"train_loss": -42.66045379638672, "global_step": 351122, "epoch": 2901} {"train_loss": -42.669097900390625, "global_step": 351123, "epoch": 2901} {"train_loss": -42.52362823486328, "global_step": 351124, "epoch": 2901} {"train_loss": -43.08720016479492, "global_step": 351125, "epoch": 2901} {"train_loss": -42.54267883300781, "global_step": 351126, "epoch": 2901} {"train_loss": -42.357696533203125, "global_step": 351127, "epoch": 2901} {"train_loss": -41.572845458984375, "global_step": 351128, "epoch": 2901} {"train_loss": -41.535011291503906, "global_step": 351129, "epoch": 2901} {"train_loss": -41.753231048583984, "global_step": 351130, "epoch": 2901} {"train_loss": -42.809818267822266, "global_step": 351131, "epoch": 2901} {"train_loss": -42.615726470947266, "global_step": 351132, "epoch": 2901} {"train_loss": -41.704986572265625, "global_step": 351133, "epoch": 2901} {"train_loss": -43.14730453491211, "global_step": 351134, "epoch": 2901} {"train_loss": -42.325927734375, "global_step": 351135, "epoch": 2901} {"train_loss": -42.633365631103516, "global_step": 351136, "epoch": 2901} {"train_loss": -41.70011520385742, "global_step": 351137, "epoch": 2901} {"train_loss": -42.92873001098633, "global_step": 351138, "epoch": 2901} {"train_loss": -42.612709045410156, "global_step": 351139, "epoch": 2901} {"train_loss": -41.55931854248047, "global_step": 351140, "epoch": 2901} {"train_loss": -40.475707976286074, "global_step": 351141, "epoch": 2901, "val_loss": 2663396.25} {"train_loss": -39.43729782104492, "global_step": 351142, "epoch": 2902} {"train_loss": -42.93654251098633, "global_step": 351143, "epoch": 2902} {"train_loss": -43.0755500793457, "global_step": 351144, "epoch": 2902} {"train_loss": -42.886924743652344, "global_step": 351145, "epoch": 2902} {"train_loss": -43.31007766723633, "global_step": 351146, "epoch": 2902} {"train_loss": -44.065650939941406, "global_step": 351147, "epoch": 2902} {"train_loss": -42.75631332397461, "global_step": 351148, "epoch": 2902} {"train_loss": -43.418907165527344, "global_step": 351149, "epoch": 2902} {"train_loss": -43.03273391723633, "global_step": 351150, "epoch": 2902} {"train_loss": -43.32587814331055, "global_step": 351151, "epoch": 2902} {"train_loss": -43.7170524597168, "global_step": 351152, "epoch": 2902} {"train_loss": -43.10737991333008, "global_step": 351153, "epoch": 2902} {"train_loss": -42.71607208251953, "global_step": 351154, "epoch": 2902} {"train_loss": -42.93471145629883, "global_step": 351155, "epoch": 2902} {"train_loss": -42.70170974731445, "global_step": 351156, "epoch": 2902} {"train_loss": -43.720211029052734, "global_step": 351157, "epoch": 2902} {"train_loss": -42.689674377441406, "global_step": 351158, "epoch": 2902} {"train_loss": -43.210384368896484, "global_step": 351159, "epoch": 2902} {"train_loss": -43.584293365478516, "global_step": 351160, "epoch": 2902} {"train_loss": -42.13203430175781, "global_step": 351161, "epoch": 2902} {"train_loss": -42.82257843017578, "global_step": 351162, "epoch": 2902} {"train_loss": -44.039695739746094, "global_step": 351163, "epoch": 2902} {"train_loss": -43.66096878051758, "global_step": 351164, "epoch": 2902} {"train_loss": -43.89434814453125, "global_step": 351165, "epoch": 2902} {"train_loss": -44.03225326538086, "global_step": 351166, "epoch": 2902} {"train_loss": -42.979896545410156, "global_step": 351167, "epoch": 2902} {"train_loss": -43.34975051879883, "global_step": 351168, "epoch": 2902} {"train_loss": -44.34878158569336, "global_step": 351169, "epoch": 2902} {"train_loss": -42.612770080566406, "global_step": 351170, "epoch": 2902} {"train_loss": -42.99576950073242, "global_step": 351171, "epoch": 2902} {"train_loss": -44.08027267456055, "global_step": 351172, "epoch": 2902} {"train_loss": -41.58610153198242, "global_step": 351173, "epoch": 2902} {"train_loss": -43.483680725097656, "global_step": 351174, "epoch": 2902} {"train_loss": -43.93160629272461, "global_step": 351175, "epoch": 2902} {"train_loss": -43.95132064819336, "global_step": 351176, "epoch": 2902} {"train_loss": -43.36172103881836, "global_step": 351177, "epoch": 2902} {"train_loss": -42.77256774902344, "global_step": 351178, "epoch": 2902} {"train_loss": -43.27448272705078, "global_step": 351179, "epoch": 2902} {"train_loss": -43.8026008605957, "global_step": 351180, "epoch": 2902} {"train_loss": -42.56284713745117, "global_step": 351181, "epoch": 2902} {"train_loss": -42.34910202026367, "global_step": 351182, "epoch": 2902} {"train_loss": -43.10990524291992, "global_step": 351183, "epoch": 2902} {"train_loss": -42.478614807128906, "global_step": 351184, "epoch": 2902} {"train_loss": -43.334938049316406, "global_step": 351185, "epoch": 2902} {"train_loss": -43.25389862060547, "global_step": 351186, "epoch": 2902} {"train_loss": -43.720523834228516, "global_step": 351187, "epoch": 2902} {"train_loss": -43.68547439575195, "global_step": 351188, "epoch": 2902} {"train_loss": -43.761409759521484, "global_step": 351189, "epoch": 2902} {"train_loss": -42.88348388671875, "global_step": 351190, "epoch": 2902} {"train_loss": -43.508968353271484, "global_step": 351191, "epoch": 2902} {"train_loss": -42.933570861816406, "global_step": 351192, "epoch": 2902} {"train_loss": -42.897613525390625, "global_step": 351193, "epoch": 2902} {"train_loss": -43.39928436279297, "global_step": 351194, "epoch": 2902} {"train_loss": -43.20844650268555, "global_step": 351195, "epoch": 2902} {"train_loss": -43.481258392333984, "global_step": 351196, "epoch": 2902} {"train_loss": -44.28083038330078, "global_step": 351197, "epoch": 2902} {"train_loss": -43.21134567260742, "global_step": 351198, "epoch": 2902} {"train_loss": -43.52994918823242, "global_step": 351199, "epoch": 2902} {"train_loss": -42.84772872924805, "global_step": 351200, "epoch": 2902} {"train_loss": -42.386993408203125, "global_step": 351201, "epoch": 2902} {"train_loss": -42.98672103881836, "global_step": 351202, "epoch": 2902} {"train_loss": -43.40265655517578, "global_step": 351203, "epoch": 2902} {"train_loss": -42.5301628112793, "global_step": 351204, "epoch": 2902} {"train_loss": -42.79207992553711, "global_step": 351205, "epoch": 2902} {"train_loss": -43.5092887878418, "global_step": 351206, "epoch": 2902} {"train_loss": -42.321956634521484, "global_step": 351207, "epoch": 2902} {"train_loss": -42.46879196166992, "global_step": 351208, "epoch": 2902} {"train_loss": -43.988365173339844, "global_step": 351209, "epoch": 2902} {"train_loss": -43.3611946105957, "global_step": 351210, "epoch": 2902} {"train_loss": -43.21952819824219, "global_step": 351211, "epoch": 2902} {"train_loss": -42.80859375, "global_step": 351212, "epoch": 2902} {"train_loss": -43.87114334106445, "global_step": 351213, "epoch": 2902} {"train_loss": -43.38563919067383, "global_step": 351214, "epoch": 2902} {"train_loss": -43.50310516357422, "global_step": 351215, "epoch": 2902} {"train_loss": -43.39276123046875, "global_step": 351216, "epoch": 2902} {"train_loss": -43.302398681640625, "global_step": 351217, "epoch": 2902} {"train_loss": -43.23793411254883, "global_step": 351218, "epoch": 2902} {"train_loss": -42.67416000366211, "global_step": 351219, "epoch": 2902} {"train_loss": -42.69181442260742, "global_step": 351220, "epoch": 2902} {"train_loss": -43.45881271362305, "global_step": 351221, "epoch": 2902} {"train_loss": -42.964717864990234, "global_step": 351222, "epoch": 2902} {"train_loss": -43.474403381347656, "global_step": 351223, "epoch": 2902} {"train_loss": -44.030487060546875, "global_step": 351224, "epoch": 2902} {"train_loss": -42.659889221191406, "global_step": 351225, "epoch": 2902} {"train_loss": -43.55062484741211, "global_step": 351226, "epoch": 2902} {"train_loss": -43.665321350097656, "global_step": 351227, "epoch": 2902} {"train_loss": -43.24024200439453, "global_step": 351228, "epoch": 2902} {"train_loss": -42.97359085083008, "global_step": 351229, "epoch": 2902} {"train_loss": -43.525306701660156, "global_step": 351230, "epoch": 2902} {"train_loss": -43.65765380859375, "global_step": 351231, "epoch": 2902} {"train_loss": -42.66845703125, "global_step": 351232, "epoch": 2902} {"train_loss": -42.02851867675781, "global_step": 351233, "epoch": 2902} {"train_loss": -42.84713363647461, "global_step": 351234, "epoch": 2902} {"train_loss": -43.10408401489258, "global_step": 351235, "epoch": 2902} {"train_loss": -42.5415153503418, "global_step": 351236, "epoch": 2902} {"train_loss": -42.698421478271484, "global_step": 351237, "epoch": 2902} {"train_loss": -42.767330169677734, "global_step": 351238, "epoch": 2902} {"train_loss": -43.0727653503418, "global_step": 351239, "epoch": 2902} {"train_loss": -43.13335037231445, "global_step": 351240, "epoch": 2902} {"train_loss": -42.55281448364258, "global_step": 351241, "epoch": 2902} {"train_loss": -43.07920455932617, "global_step": 351242, "epoch": 2902} {"train_loss": -43.2022819519043, "global_step": 351243, "epoch": 2902} {"train_loss": -41.94924545288086, "global_step": 351244, "epoch": 2902} {"train_loss": -42.691654205322266, "global_step": 351245, "epoch": 2902} {"train_loss": -43.700592041015625, "global_step": 351246, "epoch": 2902} {"train_loss": -43.267696380615234, "global_step": 351247, "epoch": 2902} {"train_loss": -42.80154037475586, "global_step": 351248, "epoch": 2902} {"train_loss": -42.173187255859375, "global_step": 351249, "epoch": 2902} {"train_loss": -43.525123596191406, "global_step": 351250, "epoch": 2902} {"train_loss": -41.5988655090332, "global_step": 351251, "epoch": 2902} {"train_loss": -42.291507720947266, "global_step": 351252, "epoch": 2902} {"train_loss": -42.657257080078125, "global_step": 351253, "epoch": 2902} {"train_loss": -41.77506637573242, "global_step": 351254, "epoch": 2902} {"train_loss": -42.9479866027832, "global_step": 351255, "epoch": 2902} {"train_loss": -41.67127227783203, "global_step": 351256, "epoch": 2902} {"train_loss": -43.529327392578125, "global_step": 351257, "epoch": 2902} {"train_loss": -43.23737335205078, "global_step": 351258, "epoch": 2902} {"train_loss": -43.284339904785156, "global_step": 351259, "epoch": 2902} {"train_loss": -43.717735290527344, "global_step": 351260, "epoch": 2902} {"train_loss": -42.379005432128906, "global_step": 351261, "epoch": 2902} {"train_loss": -43.0840472071624, "global_step": 351262, "epoch": 2902, "val_loss": 2635627.0} {"train_loss": -42.67787170410156, "global_step": 351263, "epoch": 2903} {"train_loss": -42.973289489746094, "global_step": 351264, "epoch": 2903} {"train_loss": -41.945289611816406, "global_step": 351265, "epoch": 2903} {"train_loss": -41.659725189208984, "global_step": 351266, "epoch": 2903} {"train_loss": -41.02161407470703, "global_step": 351267, "epoch": 2903} {"train_loss": -43.1575813293457, "global_step": 351268, "epoch": 2903} {"train_loss": -43.256290435791016, "global_step": 351269, "epoch": 2903} {"train_loss": -43.18977737426758, "global_step": 351270, "epoch": 2903} {"train_loss": -43.64284896850586, "global_step": 351271, "epoch": 2903} {"train_loss": -41.560821533203125, "global_step": 351272, "epoch": 2903} {"train_loss": -42.19548416137695, "global_step": 351273, "epoch": 2903} {"train_loss": -41.65937423706055, "global_step": 351274, "epoch": 2903} {"train_loss": -42.09748458862305, "global_step": 351275, "epoch": 2903} {"train_loss": -42.5523567199707, "global_step": 351276, "epoch": 2903} {"train_loss": -43.403228759765625, "global_step": 351277, "epoch": 2903} {"train_loss": -41.9117546081543, "global_step": 351278, "epoch": 2903} {"train_loss": -41.86593246459961, "global_step": 351279, "epoch": 2903} {"train_loss": -42.23460006713867, "global_step": 351280, "epoch": 2903} {"train_loss": -38.59702682495117, "global_step": 351281, "epoch": 2903} {"train_loss": -41.60187911987305, "global_step": 351282, "epoch": 2903} {"train_loss": -43.58810043334961, "global_step": 351283, "epoch": 2903} {"train_loss": -41.60676193237305, "global_step": 351284, "epoch": 2903} {"train_loss": -42.16059112548828, "global_step": 351285, "epoch": 2903} {"train_loss": -42.5245361328125, "global_step": 351286, "epoch": 2903} {"train_loss": -41.78802490234375, "global_step": 351287, "epoch": 2903} {"train_loss": -43.15092849731445, "global_step": 351288, "epoch": 2903} {"train_loss": -42.1995849609375, "global_step": 351289, "epoch": 2903} {"train_loss": -41.337406158447266, "global_step": 351290, "epoch": 2903} {"train_loss": -41.222801208496094, "global_step": 351291, "epoch": 2903} {"train_loss": -41.69053268432617, "global_step": 351292, "epoch": 2903} {"train_loss": -40.69422149658203, "global_step": 351293, "epoch": 2903} {"train_loss": -42.6073112487793, "global_step": 351294, "epoch": 2903} {"train_loss": -41.72262191772461, "global_step": 351295, "epoch": 2903} {"train_loss": -39.904579162597656, "global_step": 351296, "epoch": 2903} {"train_loss": -42.6683235168457, "global_step": 351297, "epoch": 2903} {"train_loss": -41.10978698730469, "global_step": 351298, "epoch": 2903} {"train_loss": -41.76393508911133, "global_step": 351299, "epoch": 2903} {"train_loss": -41.55860137939453, "global_step": 351300, "epoch": 2903} {"train_loss": -40.34253692626953, "global_step": 351301, "epoch": 2903} {"train_loss": -41.664207458496094, "global_step": 351302, "epoch": 2903} {"train_loss": -39.996849060058594, "global_step": 351303, "epoch": 2903} {"train_loss": -42.469303131103516, "global_step": 351304, "epoch": 2903} {"train_loss": -41.07063674926758, "global_step": 351305, "epoch": 2903} {"train_loss": -41.346099853515625, "global_step": 351306, "epoch": 2903} {"train_loss": -42.95396041870117, "global_step": 351307, "epoch": 2903} {"train_loss": -42.35307693481445, "global_step": 351308, "epoch": 2903} {"train_loss": -41.3563117980957, "global_step": 351309, "epoch": 2903} {"train_loss": -42.944766998291016, "global_step": 351310, "epoch": 2903} {"train_loss": -42.545162200927734, "global_step": 351311, "epoch": 2903} {"train_loss": -42.0750732421875, "global_step": 351312, "epoch": 2903} {"train_loss": -43.28779220581055, "global_step": 351313, "epoch": 2903} {"train_loss": -42.617488861083984, "global_step": 351314, "epoch": 2903} {"train_loss": -42.940059661865234, "global_step": 351315, "epoch": 2903} {"train_loss": -43.46356964111328, "global_step": 351316, "epoch": 2903} {"train_loss": -43.11252975463867, "global_step": 351317, "epoch": 2903} {"train_loss": -43.1313362121582, "global_step": 351318, "epoch": 2903} {"train_loss": -43.55256652832031, "global_step": 351319, "epoch": 2903} {"train_loss": -43.57892990112305, "global_step": 351320, "epoch": 2903} {"train_loss": -41.97109603881836, "global_step": 351321, "epoch": 2903} {"train_loss": -42.61859893798828, "global_step": 351322, "epoch": 2903} {"train_loss": -43.433685302734375, "global_step": 351323, "epoch": 2903} {"train_loss": -43.24592971801758, "global_step": 351324, "epoch": 2903} {"train_loss": -41.5479621887207, "global_step": 351325, "epoch": 2903} {"train_loss": -42.66913986206055, "global_step": 351326, "epoch": 2903} {"train_loss": -43.50397491455078, "global_step": 351327, "epoch": 2903} {"train_loss": -42.83854293823242, "global_step": 351328, "epoch": 2903} {"train_loss": -42.400638580322266, "global_step": 351329, "epoch": 2903} {"train_loss": -43.497161865234375, "global_step": 351330, "epoch": 2903} {"train_loss": -42.88224792480469, "global_step": 351331, "epoch": 2903} {"train_loss": -43.01545333862305, "global_step": 351332, "epoch": 2903} {"train_loss": -43.77635192871094, "global_step": 351333, "epoch": 2903} {"train_loss": -43.81085205078125, "global_step": 351334, "epoch": 2903} {"train_loss": -43.34869384765625, "global_step": 351335, "epoch": 2903} {"train_loss": -43.7894172668457, "global_step": 351336, "epoch": 2903} {"train_loss": -43.48087692260742, "global_step": 351337, "epoch": 2903} {"train_loss": -44.30804443359375, "global_step": 351338, "epoch": 2903} {"train_loss": -43.904327392578125, "global_step": 351339, "epoch": 2903} {"train_loss": -43.320167541503906, "global_step": 351340, "epoch": 2903} {"train_loss": -43.63737487792969, "global_step": 351341, "epoch": 2903} {"train_loss": -43.748748779296875, "global_step": 351342, "epoch": 2903} {"train_loss": -43.41709518432617, "global_step": 351343, "epoch": 2903} {"train_loss": -42.7346076965332, "global_step": 351344, "epoch": 2903} {"train_loss": -44.05289077758789, "global_step": 351345, "epoch": 2903} {"train_loss": -42.94735336303711, "global_step": 351346, "epoch": 2903} {"train_loss": -43.252567291259766, "global_step": 351347, "epoch": 2903} {"train_loss": -43.89881896972656, "global_step": 351348, "epoch": 2903} {"train_loss": -43.683448791503906, "global_step": 351349, "epoch": 2903} {"train_loss": -43.65835189819336, "global_step": 351350, "epoch": 2903} {"train_loss": -43.04592514038086, "global_step": 351351, "epoch": 2903} {"train_loss": -44.275856018066406, "global_step": 351352, "epoch": 2903} {"train_loss": -43.8883056640625, "global_step": 351353, "epoch": 2903} {"train_loss": -43.07326126098633, "global_step": 351354, "epoch": 2903} {"train_loss": -44.204227447509766, "global_step": 351355, "epoch": 2903} {"train_loss": -43.8408317565918, "global_step": 351356, "epoch": 2903} {"train_loss": -44.21865463256836, "global_step": 351357, "epoch": 2903} {"train_loss": -44.24591827392578, "global_step": 351358, "epoch": 2903} {"train_loss": -44.01218795776367, "global_step": 351359, "epoch": 2903} {"train_loss": -44.31410598754883, "global_step": 351360, "epoch": 2903} {"train_loss": -43.90743637084961, "global_step": 351361, "epoch": 2903} {"train_loss": -44.541168212890625, "global_step": 351362, "epoch": 2903} {"train_loss": -42.8492317199707, "global_step": 351363, "epoch": 2903} {"train_loss": -42.204647064208984, "global_step": 351364, "epoch": 2903} {"train_loss": -44.24210739135742, "global_step": 351365, "epoch": 2903} {"train_loss": -43.067298889160156, "global_step": 351366, "epoch": 2903} {"train_loss": -41.929378509521484, "global_step": 351367, "epoch": 2903} {"train_loss": -43.482666015625, "global_step": 351368, "epoch": 2903} {"train_loss": -43.04669189453125, "global_step": 351369, "epoch": 2903} {"train_loss": -42.185691833496094, "global_step": 351370, "epoch": 2903} {"train_loss": -42.31584548950195, "global_step": 351371, "epoch": 2903} {"train_loss": -42.80534744262695, "global_step": 351372, "epoch": 2903} {"train_loss": -43.60240936279297, "global_step": 351373, "epoch": 2903} {"train_loss": -40.77304458618164, "global_step": 351374, "epoch": 2903} {"train_loss": -40.7723503112793, "global_step": 351375, "epoch": 2903} {"train_loss": -43.970306396484375, "global_step": 351376, "epoch": 2903} {"train_loss": -40.99982833862305, "global_step": 351377, "epoch": 2903} {"train_loss": -39.97798538208008, "global_step": 351378, "epoch": 2903} {"train_loss": -42.423160552978516, "global_step": 351379, "epoch": 2903} {"train_loss": -42.2750129699707, "global_step": 351380, "epoch": 2903} {"train_loss": -37.764564514160156, "global_step": 351381, "epoch": 2903} {"train_loss": -41.39191436767578, "global_step": 351382, "epoch": 2903} {"train_loss": -42.589108900590375, "global_step": 351383, "epoch": 2903, "val_loss": 2568198.75} {"train_loss": -36.521175384521484, "global_step": 351384, "epoch": 2904} {"train_loss": -42.00026321411133, "global_step": 351385, "epoch": 2904} {"train_loss": -41.31987380981445, "global_step": 351386, "epoch": 2904} {"train_loss": -39.7259635925293, "global_step": 351387, "epoch": 2904} {"train_loss": -42.58793640136719, "global_step": 351388, "epoch": 2904} {"train_loss": -39.979061126708984, "global_step": 351389, "epoch": 2904} {"train_loss": -43.41809844970703, "global_step": 351390, "epoch": 2904} {"train_loss": -41.6756706237793, "global_step": 351391, "epoch": 2904} {"train_loss": -41.890132904052734, "global_step": 351392, "epoch": 2904} {"train_loss": -41.8795280456543, "global_step": 351393, "epoch": 2904} {"train_loss": -43.03316116333008, "global_step": 351394, "epoch": 2904} {"train_loss": -41.53277587890625, "global_step": 351395, "epoch": 2904} {"train_loss": -42.00767517089844, "global_step": 351396, "epoch": 2904} {"train_loss": -42.135231018066406, "global_step": 351397, "epoch": 2904} {"train_loss": -42.5134391784668, "global_step": 351398, "epoch": 2904} {"train_loss": -42.05086898803711, "global_step": 351399, "epoch": 2904} {"train_loss": -42.28550338745117, "global_step": 351400, "epoch": 2904} {"train_loss": -42.290130615234375, "global_step": 351401, "epoch": 2904} {"train_loss": -42.785377502441406, "global_step": 351402, "epoch": 2904} {"train_loss": -42.70145797729492, "global_step": 351403, "epoch": 2904} {"train_loss": -43.0557975769043, "global_step": 351404, "epoch": 2904} {"train_loss": -42.36007308959961, "global_step": 351405, "epoch": 2904} {"train_loss": -43.13568115234375, "global_step": 351406, "epoch": 2904} {"train_loss": -42.529998779296875, "global_step": 351407, "epoch": 2904} {"train_loss": -43.31195831298828, "global_step": 351408, "epoch": 2904} {"train_loss": -43.06288528442383, "global_step": 351409, "epoch": 2904} {"train_loss": -42.93123245239258, "global_step": 351410, "epoch": 2904} {"train_loss": -42.91120529174805, "global_step": 351411, "epoch": 2904} {"train_loss": -43.52031326293945, "global_step": 351412, "epoch": 2904} {"train_loss": -42.752620697021484, "global_step": 351413, "epoch": 2904} {"train_loss": -43.39779281616211, "global_step": 351414, "epoch": 2904} {"train_loss": -43.03054428100586, "global_step": 351415, "epoch": 2904} {"train_loss": -43.15473175048828, "global_step": 351416, "epoch": 2904} {"train_loss": -42.1563606262207, "global_step": 351417, "epoch": 2904} {"train_loss": -43.98318862915039, "global_step": 351418, "epoch": 2904} {"train_loss": -42.93434524536133, "global_step": 351419, "epoch": 2904} {"train_loss": -42.79377365112305, "global_step": 351420, "epoch": 2904} {"train_loss": -43.757686614990234, "global_step": 351421, "epoch": 2904} {"train_loss": -43.10860824584961, "global_step": 351422, "epoch": 2904} {"train_loss": -43.58640670776367, "global_step": 351423, "epoch": 2904} {"train_loss": -43.8908576965332, "global_step": 351424, "epoch": 2904} {"train_loss": -43.41069412231445, "global_step": 351425, "epoch": 2904} {"train_loss": -43.65576171875, "global_step": 351426, "epoch": 2904} {"train_loss": -43.61711502075195, "global_step": 351427, "epoch": 2904} {"train_loss": -44.27653884887695, "global_step": 351428, "epoch": 2904} {"train_loss": -43.318565368652344, "global_step": 351429, "epoch": 2904} {"train_loss": -44.28302001953125, "global_step": 351430, "epoch": 2904} {"train_loss": -44.2051887512207, "global_step": 351431, "epoch": 2904} {"train_loss": -43.49475860595703, "global_step": 351432, "epoch": 2904} {"train_loss": -43.68793869018555, "global_step": 351433, "epoch": 2904} {"train_loss": -43.887142181396484, "global_step": 351434, "epoch": 2904} {"train_loss": -43.00954818725586, "global_step": 351435, "epoch": 2904} {"train_loss": -43.47469711303711, "global_step": 351436, "epoch": 2904} {"train_loss": -44.15517807006836, "global_step": 351437, "epoch": 2904} {"train_loss": -44.18021011352539, "global_step": 351438, "epoch": 2904} {"train_loss": -44.28155517578125, "global_step": 351439, "epoch": 2904} {"train_loss": -43.7744255065918, "global_step": 351440, "epoch": 2904} {"train_loss": -44.2095947265625, "global_step": 351441, "epoch": 2904} {"train_loss": -44.18669509887695, "global_step": 351442, "epoch": 2904} {"train_loss": -44.1627082824707, "global_step": 351443, "epoch": 2904} {"train_loss": -43.76569366455078, "global_step": 351444, "epoch": 2904} {"train_loss": -44.07818603515625, "global_step": 351445, "epoch": 2904} {"train_loss": -44.042903900146484, "global_step": 351446, "epoch": 2904} {"train_loss": -44.39900588989258, "global_step": 351447, "epoch": 2904} {"train_loss": -44.40826416015625, "global_step": 351448, "epoch": 2904} {"train_loss": -43.66054916381836, "global_step": 351449, "epoch": 2904} {"train_loss": -44.589271545410156, "global_step": 351450, "epoch": 2904} {"train_loss": -43.94393539428711, "global_step": 351451, "epoch": 2904} {"train_loss": -44.05634689331055, "global_step": 351452, "epoch": 2904} {"train_loss": -43.78227996826172, "global_step": 351453, "epoch": 2904} {"train_loss": -43.78389358520508, "global_step": 351454, "epoch": 2904} {"train_loss": -43.69437789916992, "global_step": 351455, "epoch": 2904} {"train_loss": -44.22748947143555, "global_step": 351456, "epoch": 2904} {"train_loss": -44.224239349365234, "global_step": 351457, "epoch": 2904} {"train_loss": -44.38686752319336, "global_step": 351458, "epoch": 2904} {"train_loss": -43.59181213378906, "global_step": 351459, "epoch": 2904} {"train_loss": -42.6546516418457, "global_step": 351460, "epoch": 2904} {"train_loss": -42.69740676879883, "global_step": 351461, "epoch": 2904} {"train_loss": -43.32889938354492, "global_step": 351462, "epoch": 2904} {"train_loss": -43.92991256713867, "global_step": 351463, "epoch": 2904} {"train_loss": -43.9512825012207, "global_step": 351464, "epoch": 2904} {"train_loss": -43.7633171081543, "global_step": 351465, "epoch": 2904} {"train_loss": -43.492183685302734, "global_step": 351466, "epoch": 2904} {"train_loss": -42.863136291503906, "global_step": 351467, "epoch": 2904} {"train_loss": -43.74343490600586, "global_step": 351468, "epoch": 2904} {"train_loss": -43.49287033081055, "global_step": 351469, "epoch": 2904} {"train_loss": -42.759498596191406, "global_step": 351470, "epoch": 2904} {"train_loss": -42.394569396972656, "global_step": 351471, "epoch": 2904} {"train_loss": -43.14643478393555, "global_step": 351472, "epoch": 2904} {"train_loss": -43.221832275390625, "global_step": 351473, "epoch": 2904} {"train_loss": -43.30321502685547, "global_step": 351474, "epoch": 2904} {"train_loss": -42.35293197631836, "global_step": 351475, "epoch": 2904} {"train_loss": -42.682220458984375, "global_step": 351476, "epoch": 2904} {"train_loss": -43.8540153503418, "global_step": 351477, "epoch": 2904} {"train_loss": -43.373077392578125, "global_step": 351478, "epoch": 2904} {"train_loss": -44.00825500488281, "global_step": 351479, "epoch": 2904} {"train_loss": -43.683189392089844, "global_step": 351480, "epoch": 2904} {"train_loss": -43.79172897338867, "global_step": 351481, "epoch": 2904} {"train_loss": -44.29458236694336, "global_step": 351482, "epoch": 2904} {"train_loss": -43.30771255493164, "global_step": 351483, "epoch": 2904} {"train_loss": -43.45293426513672, "global_step": 351484, "epoch": 2904} {"train_loss": -43.947261810302734, "global_step": 351485, "epoch": 2904} {"train_loss": -42.9107551574707, "global_step": 351486, "epoch": 2904} {"train_loss": -43.63447570800781, "global_step": 351487, "epoch": 2904} {"train_loss": -43.245174407958984, "global_step": 351488, "epoch": 2904} {"train_loss": -42.652679443359375, "global_step": 351489, "epoch": 2904} {"train_loss": -42.64387130737305, "global_step": 351490, "epoch": 2904} {"train_loss": -43.17774200439453, "global_step": 351491, "epoch": 2904} {"train_loss": -41.69993209838867, "global_step": 351492, "epoch": 2904} {"train_loss": -43.139617919921875, "global_step": 351493, "epoch": 2904} {"train_loss": -43.19115447998047, "global_step": 351494, "epoch": 2904} {"train_loss": -41.831275939941406, "global_step": 351495, "epoch": 2904} {"train_loss": -40.59980773925781, "global_step": 351496, "epoch": 2904} {"train_loss": -40.848365783691406, "global_step": 351497, "epoch": 2904} {"train_loss": -43.00374984741211, "global_step": 351498, "epoch": 2904} {"train_loss": -43.081478118896484, "global_step": 351499, "epoch": 2904} {"train_loss": -42.3953971862793, "global_step": 351500, "epoch": 2904} {"train_loss": -42.8005485534668, "global_step": 351501, "epoch": 2904} {"train_loss": -43.9519157409668, "global_step": 351502, "epoch": 2904} {"train_loss": -43.1991081237793, "global_step": 351503, "epoch": 2904} {"train_loss": -43.103157516353384, "global_step": 351504, "epoch": 2904, "val_loss": 2629912.75} {"train_loss": -43.90290451049805, "global_step": 351505, "epoch": 2905} {"train_loss": -42.4708137512207, "global_step": 351506, "epoch": 2905} {"train_loss": -42.619110107421875, "global_step": 351507, "epoch": 2905} {"train_loss": -43.24705505371094, "global_step": 351508, "epoch": 2905} {"train_loss": -43.62623977661133, "global_step": 351509, "epoch": 2905} {"train_loss": -43.303138732910156, "global_step": 351510, "epoch": 2905} {"train_loss": -43.80123519897461, "global_step": 351511, "epoch": 2905} {"train_loss": -43.77792739868164, "global_step": 351512, "epoch": 2905} {"train_loss": -43.8416862487793, "global_step": 351513, "epoch": 2905} {"train_loss": -44.046382904052734, "global_step": 351514, "epoch": 2905} {"train_loss": -43.95827102661133, "global_step": 351515, "epoch": 2905} {"train_loss": -43.60065460205078, "global_step": 351516, "epoch": 2905} {"train_loss": -44.3250846862793, "global_step": 351517, "epoch": 2905} {"train_loss": -43.62440490722656, "global_step": 351518, "epoch": 2905} {"train_loss": -43.14362335205078, "global_step": 351519, "epoch": 2905} {"train_loss": -44.06646728515625, "global_step": 351520, "epoch": 2905} {"train_loss": -44.25602340698242, "global_step": 351521, "epoch": 2905} {"train_loss": -44.18666458129883, "global_step": 351522, "epoch": 2905} {"train_loss": -44.106929779052734, "global_step": 351523, "epoch": 2905} {"train_loss": -44.168399810791016, "global_step": 351524, "epoch": 2905} {"train_loss": -43.595252990722656, "global_step": 351525, "epoch": 2905} {"train_loss": -44.6712532043457, "global_step": 351526, "epoch": 2905} {"train_loss": -44.01910400390625, "global_step": 351527, "epoch": 2905} {"train_loss": -43.50288009643555, "global_step": 351528, "epoch": 2905} {"train_loss": -43.85270690917969, "global_step": 351529, "epoch": 2905} {"train_loss": -43.74141311645508, "global_step": 351530, "epoch": 2905} {"train_loss": -43.59482955932617, "global_step": 351531, "epoch": 2905} {"train_loss": -43.94399642944336, "global_step": 351532, "epoch": 2905} {"train_loss": -44.29421615600586, "global_step": 351533, "epoch": 2905} {"train_loss": -43.910133361816406, "global_step": 351534, "epoch": 2905} {"train_loss": -44.07133865356445, "global_step": 351535, "epoch": 2905} {"train_loss": -44.512386322021484, "global_step": 351536, "epoch": 2905} {"train_loss": -44.43430709838867, "global_step": 351537, "epoch": 2905} {"train_loss": -44.4459228515625, "global_step": 351538, "epoch": 2905} {"train_loss": -44.43982696533203, "global_step": 351539, "epoch": 2905} {"train_loss": -44.366817474365234, "global_step": 351540, "epoch": 2905} {"train_loss": -44.41961669921875, "global_step": 351541, "epoch": 2905} {"train_loss": -44.22010803222656, "global_step": 351542, "epoch": 2905} {"train_loss": -44.04902267456055, "global_step": 351543, "epoch": 2905} {"train_loss": -44.35844802856445, "global_step": 351544, "epoch": 2905} {"train_loss": -44.62130355834961, "global_step": 351545, "epoch": 2905} {"train_loss": -44.5125846862793, "global_step": 351546, "epoch": 2905} {"train_loss": -43.329383850097656, "global_step": 351547, "epoch": 2905} {"train_loss": -44.3781623840332, "global_step": 351548, "epoch": 2905} {"train_loss": -44.3599739074707, "global_step": 351549, "epoch": 2905} {"train_loss": -44.421241760253906, "global_step": 351550, "epoch": 2905} {"train_loss": -44.65431594848633, "global_step": 351551, "epoch": 2905} {"train_loss": -44.7723388671875, "global_step": 351552, "epoch": 2905} {"train_loss": -44.833492279052734, "global_step": 351553, "epoch": 2905} {"train_loss": -45.000099182128906, "global_step": 351554, "epoch": 2905} {"train_loss": -44.746917724609375, "global_step": 351555, "epoch": 2905} {"train_loss": -44.279659271240234, "global_step": 351556, "epoch": 2905} {"train_loss": -44.48456954956055, "global_step": 351557, "epoch": 2905} {"train_loss": -44.492942810058594, "global_step": 351558, "epoch": 2905} {"train_loss": -45.08046340942383, "global_step": 351559, "epoch": 2905} {"train_loss": -44.942596435546875, "global_step": 351560, "epoch": 2905} {"train_loss": -44.51045227050781, "global_step": 351561, "epoch": 2905} {"train_loss": -43.0724983215332, "global_step": 351562, "epoch": 2905} {"train_loss": -42.92021942138672, "global_step": 351563, "epoch": 2905} {"train_loss": -43.98280715942383, "global_step": 351564, "epoch": 2905} {"train_loss": -44.4421501159668, "global_step": 351565, "epoch": 2905} {"train_loss": -44.0128288269043, "global_step": 351566, "epoch": 2905} {"train_loss": -44.59928894042969, "global_step": 351567, "epoch": 2905} {"train_loss": -44.29975891113281, "global_step": 351568, "epoch": 2905} {"train_loss": -42.012203216552734, "global_step": 351569, "epoch": 2905} {"train_loss": -41.52216339111328, "global_step": 351570, "epoch": 2905} {"train_loss": -40.842681884765625, "global_step": 351571, "epoch": 2905} {"train_loss": -42.310577392578125, "global_step": 351572, "epoch": 2905} {"train_loss": -41.930599212646484, "global_step": 351573, "epoch": 2905} {"train_loss": -41.868526458740234, "global_step": 351574, "epoch": 2905} {"train_loss": -41.583702087402344, "global_step": 351575, "epoch": 2905} {"train_loss": -42.626136779785156, "global_step": 351576, "epoch": 2905} {"train_loss": -43.97158432006836, "global_step": 351577, "epoch": 2905} {"train_loss": -43.02706527709961, "global_step": 351578, "epoch": 2905} {"train_loss": -42.502899169921875, "global_step": 351579, "epoch": 2905} {"train_loss": -42.97944259643555, "global_step": 351580, "epoch": 2905} {"train_loss": -42.60755157470703, "global_step": 351581, "epoch": 2905} {"train_loss": -43.250465393066406, "global_step": 351582, "epoch": 2905} {"train_loss": -43.33012771606445, "global_step": 351583, "epoch": 2905} {"train_loss": -42.66754150390625, "global_step": 351584, "epoch": 2905} {"train_loss": -40.618072509765625, "global_step": 351585, "epoch": 2905} {"train_loss": -42.11996841430664, "global_step": 351586, "epoch": 2905} {"train_loss": -42.118438720703125, "global_step": 351587, "epoch": 2905} {"train_loss": -41.53553009033203, "global_step": 351588, "epoch": 2905} {"train_loss": -41.452693939208984, "global_step": 351589, "epoch": 2905} {"train_loss": -43.024478912353516, "global_step": 351590, "epoch": 2905} {"train_loss": -41.106929779052734, "global_step": 351591, "epoch": 2905} {"train_loss": -40.96156692504883, "global_step": 351592, "epoch": 2905} {"train_loss": -42.941261291503906, "global_step": 351593, "epoch": 2905} {"train_loss": -42.74413299560547, "global_step": 351594, "epoch": 2905} {"train_loss": -42.06550598144531, "global_step": 351595, "epoch": 2905} {"train_loss": -43.04041290283203, "global_step": 351596, "epoch": 2905} {"train_loss": -43.60591125488281, "global_step": 351597, "epoch": 2905} {"train_loss": -43.296146392822266, "global_step": 351598, "epoch": 2905} {"train_loss": -43.412044525146484, "global_step": 351599, "epoch": 2905} {"train_loss": -43.46546173095703, "global_step": 351600, "epoch": 2905} {"train_loss": -43.24837112426758, "global_step": 351601, "epoch": 2905} {"train_loss": -44.01292419433594, "global_step": 351602, "epoch": 2905} {"train_loss": -43.67662048339844, "global_step": 351603, "epoch": 2905} {"train_loss": -43.57197189331055, "global_step": 351604, "epoch": 2905} {"train_loss": -43.95648956298828, "global_step": 351605, "epoch": 2905} {"train_loss": -43.874542236328125, "global_step": 351606, "epoch": 2905} {"train_loss": -44.04035949707031, "global_step": 351607, "epoch": 2905} {"train_loss": -43.73898696899414, "global_step": 351608, "epoch": 2905} {"train_loss": -43.978004455566406, "global_step": 351609, "epoch": 2905} {"train_loss": -43.37085723876953, "global_step": 351610, "epoch": 2905} {"train_loss": -44.11249923706055, "global_step": 351611, "epoch": 2905} {"train_loss": -44.77472686767578, "global_step": 351612, "epoch": 2905} {"train_loss": -43.779476165771484, "global_step": 351613, "epoch": 2905} {"train_loss": -42.646541595458984, "global_step": 351614, "epoch": 2905} {"train_loss": -43.799556732177734, "global_step": 351615, "epoch": 2905} {"train_loss": -44.291412353515625, "global_step": 351616, "epoch": 2905} {"train_loss": -44.3477897644043, "global_step": 351617, "epoch": 2905} {"train_loss": -44.10211944580078, "global_step": 351618, "epoch": 2905} {"train_loss": -43.84867477416992, "global_step": 351619, "epoch": 2905} {"train_loss": -43.88349151611328, "global_step": 351620, "epoch": 2905} {"train_loss": -44.28407669067383, "global_step": 351621, "epoch": 2905} {"train_loss": -44.717193603515625, "global_step": 351622, "epoch": 2905} {"train_loss": -44.146751403808594, "global_step": 351623, "epoch": 2905} {"train_loss": -44.378135681152344, "global_step": 351624, "epoch": 2905} {"train_loss": -43.60647431680979, "global_step": 351625, "epoch": 2905, "val_loss": 2553633.0} {"train_loss": -44.6067008972168, "global_step": 351626, "epoch": 2906} {"train_loss": -44.527320861816406, "global_step": 351627, "epoch": 2906} {"train_loss": -44.28589630126953, "global_step": 351628, "epoch": 2906} {"train_loss": -42.828704833984375, "global_step": 351629, "epoch": 2906} {"train_loss": -44.18476867675781, "global_step": 351630, "epoch": 2906} {"train_loss": -44.19796371459961, "global_step": 351631, "epoch": 2906} {"train_loss": -43.88456344604492, "global_step": 351632, "epoch": 2906} {"train_loss": -44.09237289428711, "global_step": 351633, "epoch": 2906} {"train_loss": -45.25104522705078, "global_step": 351634, "epoch": 2906} {"train_loss": -44.65754318237305, "global_step": 351635, "epoch": 2906} {"train_loss": -44.54160690307617, "global_step": 351636, "epoch": 2906} {"train_loss": -44.63642501831055, "global_step": 351637, "epoch": 2906} {"train_loss": -44.29693603515625, "global_step": 351638, "epoch": 2906} {"train_loss": -44.652809143066406, "global_step": 351639, "epoch": 2906} {"train_loss": -45.251319885253906, "global_step": 351640, "epoch": 2906} {"train_loss": -43.53464126586914, "global_step": 351641, "epoch": 2906} {"train_loss": -44.24888229370117, "global_step": 351642, "epoch": 2906} {"train_loss": -44.71232986450195, "global_step": 351643, "epoch": 2906} {"train_loss": -44.73501205444336, "global_step": 351644, "epoch": 2906} {"train_loss": -44.65299606323242, "global_step": 351645, "epoch": 2906} {"train_loss": -44.82427215576172, "global_step": 351646, "epoch": 2906} {"train_loss": -44.89516067504883, "global_step": 351647, "epoch": 2906} {"train_loss": -44.316890716552734, "global_step": 351648, "epoch": 2906} {"train_loss": -45.405609130859375, "global_step": 351649, "epoch": 2906} {"train_loss": -44.32590866088867, "global_step": 351650, "epoch": 2906} {"train_loss": -43.906341552734375, "global_step": 351651, "epoch": 2906} {"train_loss": -44.03013229370117, "global_step": 351652, "epoch": 2906} {"train_loss": -44.79533386230469, "global_step": 351653, "epoch": 2906} {"train_loss": -44.07991409301758, "global_step": 351654, "epoch": 2906} {"train_loss": -43.98719787597656, "global_step": 351655, "epoch": 2906} {"train_loss": -43.68962097167969, "global_step": 351656, "epoch": 2906} {"train_loss": -43.54883575439453, "global_step": 351657, "epoch": 2906} {"train_loss": -43.055999755859375, "global_step": 351658, "epoch": 2906} {"train_loss": -42.03411102294922, "global_step": 351659, "epoch": 2906} {"train_loss": -43.457908630371094, "global_step": 351660, "epoch": 2906} {"train_loss": -43.756492614746094, "global_step": 351661, "epoch": 2906} {"train_loss": -43.817466735839844, "global_step": 351662, "epoch": 2906} {"train_loss": -42.3034782409668, "global_step": 351663, "epoch": 2906} {"train_loss": -42.855045318603516, "global_step": 351664, "epoch": 2906} {"train_loss": -41.86284637451172, "global_step": 351665, "epoch": 2906} {"train_loss": -43.127197265625, "global_step": 351666, "epoch": 2906} {"train_loss": -42.73591995239258, "global_step": 351667, "epoch": 2906} {"train_loss": -42.63578414916992, "global_step": 351668, "epoch": 2906} {"train_loss": -41.519012451171875, "global_step": 351669, "epoch": 2906} {"train_loss": -42.69514846801758, "global_step": 351670, "epoch": 2906} {"train_loss": -43.55733871459961, "global_step": 351671, "epoch": 2906} {"train_loss": -41.32421875, "global_step": 351672, "epoch": 2906} {"train_loss": -42.205142974853516, "global_step": 351673, "epoch": 2906} {"train_loss": -43.84513473510742, "global_step": 351674, "epoch": 2906} {"train_loss": -42.74991989135742, "global_step": 351675, "epoch": 2906} {"train_loss": -43.32538986206055, "global_step": 351676, "epoch": 2906} {"train_loss": -43.25823211669922, "global_step": 351677, "epoch": 2906} {"train_loss": -43.56584548950195, "global_step": 351678, "epoch": 2906} {"train_loss": -43.40348434448242, "global_step": 351679, "epoch": 2906} {"train_loss": -43.64113998413086, "global_step": 351680, "epoch": 2906} {"train_loss": -43.745216369628906, "global_step": 351681, "epoch": 2906} {"train_loss": -43.9953727722168, "global_step": 351682, "epoch": 2906} {"train_loss": -43.499351501464844, "global_step": 351683, "epoch": 2906} {"train_loss": -43.826271057128906, "global_step": 351684, "epoch": 2906} {"train_loss": -44.5205192565918, "global_step": 351685, "epoch": 2906} {"train_loss": -43.78169631958008, "global_step": 351686, "epoch": 2906} {"train_loss": -44.11204147338867, "global_step": 351687, "epoch": 2906} {"train_loss": -43.83631134033203, "global_step": 351688, "epoch": 2906} {"train_loss": -43.21997833251953, "global_step": 351689, "epoch": 2906} {"train_loss": -44.11516571044922, "global_step": 351690, "epoch": 2906} {"train_loss": -44.114864349365234, "global_step": 351691, "epoch": 2906} {"train_loss": -43.75802993774414, "global_step": 351692, "epoch": 2906} {"train_loss": -44.215972900390625, "global_step": 351693, "epoch": 2906} {"train_loss": -44.158966064453125, "global_step": 351694, "epoch": 2906} {"train_loss": -44.42814254760742, "global_step": 351695, "epoch": 2906} {"train_loss": -44.26383590698242, "global_step": 351696, "epoch": 2906} {"train_loss": -43.92512893676758, "global_step": 351697, "epoch": 2906} {"train_loss": -44.515830993652344, "global_step": 351698, "epoch": 2906} {"train_loss": -44.203094482421875, "global_step": 351699, "epoch": 2906} {"train_loss": -43.628692626953125, "global_step": 351700, "epoch": 2906} {"train_loss": -44.36558151245117, "global_step": 351701, "epoch": 2906} {"train_loss": -44.088226318359375, "global_step": 351702, "epoch": 2906} {"train_loss": -44.942230224609375, "global_step": 351703, "epoch": 2906} {"train_loss": -44.52984619140625, "global_step": 351704, "epoch": 2906} {"train_loss": -44.514129638671875, "global_step": 351705, "epoch": 2906} {"train_loss": -44.216888427734375, "global_step": 351706, "epoch": 2906} {"train_loss": -44.62602615356445, "global_step": 351707, "epoch": 2906} {"train_loss": -44.479305267333984, "global_step": 351708, "epoch": 2906} {"train_loss": -44.29448318481445, "global_step": 351709, "epoch": 2906} {"train_loss": -44.64039993286133, "global_step": 351710, "epoch": 2906} {"train_loss": -44.91862869262695, "global_step": 351711, "epoch": 2906} {"train_loss": -44.29718017578125, "global_step": 351712, "epoch": 2906} {"train_loss": -44.90963363647461, "global_step": 351713, "epoch": 2906} {"train_loss": -44.374359130859375, "global_step": 351714, "epoch": 2906} {"train_loss": -44.832305908203125, "global_step": 351715, "epoch": 2906} {"train_loss": -44.23242950439453, "global_step": 351716, "epoch": 2906} {"train_loss": -44.334407806396484, "global_step": 351717, "epoch": 2906} {"train_loss": -44.550628662109375, "global_step": 351718, "epoch": 2906} {"train_loss": -44.57048034667969, "global_step": 351719, "epoch": 2906} {"train_loss": -43.979286193847656, "global_step": 351720, "epoch": 2906} {"train_loss": -44.28498458862305, "global_step": 351721, "epoch": 2906} {"train_loss": -44.539581298828125, "global_step": 351722, "epoch": 2906} {"train_loss": -44.73762893676758, "global_step": 351723, "epoch": 2906} {"train_loss": -44.81370162963867, "global_step": 351724, "epoch": 2906} {"train_loss": -43.92837142944336, "global_step": 351725, "epoch": 2906} {"train_loss": -44.389869689941406, "global_step": 351726, "epoch": 2906} {"train_loss": -44.65498733520508, "global_step": 351727, "epoch": 2906} {"train_loss": -43.67734909057617, "global_step": 351728, "epoch": 2906} {"train_loss": -43.97844696044922, "global_step": 351729, "epoch": 2906} {"train_loss": -44.951393127441406, "global_step": 351730, "epoch": 2906} {"train_loss": -44.367462158203125, "global_step": 351731, "epoch": 2906} {"train_loss": -44.26694107055664, "global_step": 351732, "epoch": 2906} {"train_loss": -44.1878547668457, "global_step": 351733, "epoch": 2906} {"train_loss": -43.35659408569336, "global_step": 351734, "epoch": 2906} {"train_loss": -44.19236373901367, "global_step": 351735, "epoch": 2906} {"train_loss": -44.15073013305664, "global_step": 351736, "epoch": 2906} {"train_loss": -43.28931427001953, "global_step": 351737, "epoch": 2906} {"train_loss": -43.98662185668945, "global_step": 351738, "epoch": 2906} {"train_loss": -43.67598342895508, "global_step": 351739, "epoch": 2906} {"train_loss": -44.52427291870117, "global_step": 351740, "epoch": 2906} {"train_loss": -44.07362747192383, "global_step": 351741, "epoch": 2906} {"train_loss": -44.650325775146484, "global_step": 351742, "epoch": 2906} {"train_loss": -44.92721176147461, "global_step": 351743, "epoch": 2906} {"train_loss": -43.705299377441406, "global_step": 351744, "epoch": 2906} {"train_loss": -43.8853759765625, "global_step": 351745, "epoch": 2906} {"train_loss": -44.00241085714545, "global_step": 351746, "epoch": 2906, "val_loss": 2625148.75} {"train_loss": -43.2537727355957, "global_step": 351747, "epoch": 2907} {"train_loss": -43.855960845947266, "global_step": 351748, "epoch": 2907} {"train_loss": -43.95663070678711, "global_step": 351749, "epoch": 2907} {"train_loss": -43.62811279296875, "global_step": 351750, "epoch": 2907} {"train_loss": -44.085750579833984, "global_step": 351751, "epoch": 2907} {"train_loss": -43.59370803833008, "global_step": 351752, "epoch": 2907} {"train_loss": -42.85626983642578, "global_step": 351753, "epoch": 2907} {"train_loss": -41.92066192626953, "global_step": 351754, "epoch": 2907} {"train_loss": -42.49848175048828, "global_step": 351755, "epoch": 2907} {"train_loss": -43.76152801513672, "global_step": 351756, "epoch": 2907} {"train_loss": -43.410980224609375, "global_step": 351757, "epoch": 2907} {"train_loss": -41.67971420288086, "global_step": 351758, "epoch": 2907} {"train_loss": -43.40965270996094, "global_step": 351759, "epoch": 2907} {"train_loss": -44.03718948364258, "global_step": 351760, "epoch": 2907} {"train_loss": -43.6309814453125, "global_step": 351761, "epoch": 2907} {"train_loss": -42.48836898803711, "global_step": 351762, "epoch": 2907} {"train_loss": -42.76729965209961, "global_step": 351763, "epoch": 2907} {"train_loss": -43.28887939453125, "global_step": 351764, "epoch": 2907} {"train_loss": -43.23682403564453, "global_step": 351765, "epoch": 2907} {"train_loss": -39.61627960205078, "global_step": 351766, "epoch": 2907} {"train_loss": -39.35630798339844, "global_step": 351767, "epoch": 2907} {"train_loss": -43.63766098022461, "global_step": 351768, "epoch": 2907} {"train_loss": -41.533348083496094, "global_step": 351769, "epoch": 2907} {"train_loss": -34.143463134765625, "global_step": 351770, "epoch": 2907} {"train_loss": -36.79154586791992, "global_step": 351771, "epoch": 2907} {"train_loss": -42.49824905395508, "global_step": 351772, "epoch": 2907} {"train_loss": -40.46919631958008, "global_step": 351773, "epoch": 2907} {"train_loss": -37.755653381347656, "global_step": 351774, "epoch": 2907} {"train_loss": -43.26824951171875, "global_step": 351775, "epoch": 2907} {"train_loss": -40.14875030517578, "global_step": 351776, "epoch": 2907} {"train_loss": -39.814205169677734, "global_step": 351777, "epoch": 2907} {"train_loss": -44.201541900634766, "global_step": 351778, "epoch": 2907} {"train_loss": -39.92626953125, "global_step": 351779, "epoch": 2907} {"train_loss": -42.88203048706055, "global_step": 351780, "epoch": 2907} {"train_loss": -42.482234954833984, "global_step": 351781, "epoch": 2907} {"train_loss": -42.126197814941406, "global_step": 351782, "epoch": 2907} {"train_loss": -43.11861801147461, "global_step": 351783, "epoch": 2907} {"train_loss": -43.112152099609375, "global_step": 351784, "epoch": 2907} {"train_loss": -42.340431213378906, "global_step": 351785, "epoch": 2907} {"train_loss": -43.68703842163086, "global_step": 351786, "epoch": 2907} {"train_loss": -42.09682083129883, "global_step": 351787, "epoch": 2907} {"train_loss": -43.308860778808594, "global_step": 351788, "epoch": 2907} {"train_loss": -43.6450309753418, "global_step": 351789, "epoch": 2907} {"train_loss": -42.8386116027832, "global_step": 351790, "epoch": 2907} {"train_loss": -43.851619720458984, "global_step": 351791, "epoch": 2907} {"train_loss": -43.78173065185547, "global_step": 351792, "epoch": 2907} {"train_loss": -42.816627502441406, "global_step": 351793, "epoch": 2907} {"train_loss": -43.346275329589844, "global_step": 351794, "epoch": 2907} {"train_loss": -43.04256057739258, "global_step": 351795, "epoch": 2907} {"train_loss": -44.46590042114258, "global_step": 351796, "epoch": 2907} {"train_loss": -42.53101348876953, "global_step": 351797, "epoch": 2907} {"train_loss": -43.61665725708008, "global_step": 351798, "epoch": 2907} {"train_loss": -43.65412521362305, "global_step": 351799, "epoch": 2907} {"train_loss": -44.017982482910156, "global_step": 351800, "epoch": 2907} {"train_loss": -44.283206939697266, "global_step": 351801, "epoch": 2907} {"train_loss": -44.05267333984375, "global_step": 351802, "epoch": 2907} {"train_loss": -44.03501510620117, "global_step": 351803, "epoch": 2907} {"train_loss": -44.110137939453125, "global_step": 351804, "epoch": 2907} {"train_loss": -44.69286346435547, "global_step": 351805, "epoch": 2907} {"train_loss": -44.15483474731445, "global_step": 351806, "epoch": 2907} {"train_loss": -44.91352462768555, "global_step": 351807, "epoch": 2907} {"train_loss": -44.604331970214844, "global_step": 351808, "epoch": 2907} {"train_loss": -44.44303512573242, "global_step": 351809, "epoch": 2907} {"train_loss": -44.362117767333984, "global_step": 351810, "epoch": 2907} {"train_loss": -44.68600082397461, "global_step": 351811, "epoch": 2907} {"train_loss": -45.0413703918457, "global_step": 351812, "epoch": 2907} {"train_loss": -44.33854675292969, "global_step": 351813, "epoch": 2907} {"train_loss": -44.830379486083984, "global_step": 351814, "epoch": 2907} {"train_loss": -44.76572799682617, "global_step": 351815, "epoch": 2907} {"train_loss": -44.63123321533203, "global_step": 351816, "epoch": 2907} {"train_loss": -44.51435470581055, "global_step": 351817, "epoch": 2907} {"train_loss": -44.56998825073242, "global_step": 351818, "epoch": 2907} {"train_loss": -44.904541015625, "global_step": 351819, "epoch": 2907} {"train_loss": -44.80070114135742, "global_step": 351820, "epoch": 2907} {"train_loss": -45.13599395751953, "global_step": 351821, "epoch": 2907} {"train_loss": -44.912776947021484, "global_step": 351822, "epoch": 2907} {"train_loss": -43.292823791503906, "global_step": 351823, "epoch": 2907} {"train_loss": -44.92340850830078, "global_step": 351824, "epoch": 2907} {"train_loss": -44.42448043823242, "global_step": 351825, "epoch": 2907} {"train_loss": -44.66835021972656, "global_step": 351826, "epoch": 2907} {"train_loss": -44.80024337768555, "global_step": 351827, "epoch": 2907} {"train_loss": -44.71467208862305, "global_step": 351828, "epoch": 2907} {"train_loss": -44.76076889038086, "global_step": 351829, "epoch": 2907} {"train_loss": -43.57661819458008, "global_step": 351830, "epoch": 2907} {"train_loss": -44.878177642822266, "global_step": 351831, "epoch": 2907} {"train_loss": -44.97809600830078, "global_step": 351832, "epoch": 2907} {"train_loss": -44.73807907104492, "global_step": 351833, "epoch": 2907} {"train_loss": -45.1695556640625, "global_step": 351834, "epoch": 2907} {"train_loss": -44.642269134521484, "global_step": 351835, "epoch": 2907} {"train_loss": -44.12929153442383, "global_step": 351836, "epoch": 2907} {"train_loss": -45.07594680786133, "global_step": 351837, "epoch": 2907} {"train_loss": -45.323429107666016, "global_step": 351838, "epoch": 2907} {"train_loss": -45.2161979675293, "global_step": 351839, "epoch": 2907} {"train_loss": -39.974483489990234, "global_step": 351840, "epoch": 2907} {"train_loss": -44.64508056640625, "global_step": 351841, "epoch": 2907} {"train_loss": -44.36861801147461, "global_step": 351842, "epoch": 2907} {"train_loss": -40.531124114990234, "global_step": 351843, "epoch": 2907} {"train_loss": -44.3093376159668, "global_step": 351844, "epoch": 2907} {"train_loss": -44.645992279052734, "global_step": 351845, "epoch": 2907} {"train_loss": -44.65675735473633, "global_step": 351846, "epoch": 2907} {"train_loss": -44.351165771484375, "global_step": 351847, "epoch": 2907} {"train_loss": -38.36122512817383, "global_step": 351848, "epoch": 2907} {"train_loss": -36.71360397338867, "global_step": 351849, "epoch": 2907} {"train_loss": -43.98411560058594, "global_step": 351850, "epoch": 2907} {"train_loss": -41.187435150146484, "global_step": 351851, "epoch": 2907} {"train_loss": -44.291236877441406, "global_step": 351852, "epoch": 2907} {"train_loss": -44.048221588134766, "global_step": 351853, "epoch": 2907} {"train_loss": -42.31951904296875, "global_step": 351854, "epoch": 2907} {"train_loss": -37.50788497924805, "global_step": 351855, "epoch": 2907} {"train_loss": -43.855743408203125, "global_step": 351856, "epoch": 2907} {"train_loss": -40.724002838134766, "global_step": 351857, "epoch": 2907} {"train_loss": -34.35378646850586, "global_step": 351858, "epoch": 2907} {"train_loss": -43.23796463012695, "global_step": 351859, "epoch": 2907} {"train_loss": -42.057071685791016, "global_step": 351860, "epoch": 2907} {"train_loss": -42.57521438598633, "global_step": 351861, "epoch": 2907} {"train_loss": -41.24374771118164, "global_step": 351862, "epoch": 2907} {"train_loss": -41.76899337768555, "global_step": 351863, "epoch": 2907} {"train_loss": -37.2998161315918, "global_step": 351864, "epoch": 2907} {"train_loss": -43.4790153503418, "global_step": 351865, "epoch": 2907} {"train_loss": -41.35277557373047, "global_step": 351866, "epoch": 2907} {"train_loss": -42.992188634951255, "global_step": 351867, "epoch": 2907, "val_loss": 2654719.25} {"train_loss": -38.843177795410156, "global_step": 351868, "epoch": 2908} {"train_loss": -41.91011047363281, "global_step": 351869, "epoch": 2908} {"train_loss": -41.167823791503906, "global_step": 351870, "epoch": 2908} {"train_loss": -42.09318923950195, "global_step": 351871, "epoch": 2908} {"train_loss": -37.0601692199707, "global_step": 351872, "epoch": 2908} {"train_loss": -41.95969772338867, "global_step": 351873, "epoch": 2908} {"train_loss": -39.80266571044922, "global_step": 351874, "epoch": 2908} {"train_loss": -42.03288650512695, "global_step": 351875, "epoch": 2908} {"train_loss": -41.24795150756836, "global_step": 351876, "epoch": 2908} {"train_loss": -42.36943054199219, "global_step": 351877, "epoch": 2908} {"train_loss": -41.42020797729492, "global_step": 351878, "epoch": 2908} {"train_loss": -41.564449310302734, "global_step": 351879, "epoch": 2908} {"train_loss": -43.11220932006836, "global_step": 351880, "epoch": 2908} {"train_loss": -42.17766189575195, "global_step": 351881, "epoch": 2908} {"train_loss": -42.79982376098633, "global_step": 351882, "epoch": 2908} {"train_loss": -42.09052276611328, "global_step": 351883, "epoch": 2908} {"train_loss": -41.62885665893555, "global_step": 351884, "epoch": 2908} {"train_loss": -43.212162017822266, "global_step": 351885, "epoch": 2908} {"train_loss": -42.929622650146484, "global_step": 351886, "epoch": 2908} {"train_loss": -42.85063171386719, "global_step": 351887, "epoch": 2908} {"train_loss": -42.53234100341797, "global_step": 351888, "epoch": 2908} {"train_loss": -42.974788665771484, "global_step": 351889, "epoch": 2908} {"train_loss": -42.50506591796875, "global_step": 351890, "epoch": 2908} {"train_loss": -43.651885986328125, "global_step": 351891, "epoch": 2908} {"train_loss": -42.793392181396484, "global_step": 351892, "epoch": 2908} {"train_loss": -43.86931610107422, "global_step": 351893, "epoch": 2908} {"train_loss": -43.546688079833984, "global_step": 351894, "epoch": 2908} {"train_loss": -43.488037109375, "global_step": 351895, "epoch": 2908} {"train_loss": -42.01029586791992, "global_step": 351896, "epoch": 2908} {"train_loss": -43.42424011230469, "global_step": 351897, "epoch": 2908} {"train_loss": -43.05057907104492, "global_step": 351898, "epoch": 2908} {"train_loss": -39.3934211730957, "global_step": 351899, "epoch": 2908} {"train_loss": -43.97404098510742, "global_step": 351900, "epoch": 2908} {"train_loss": -42.69428634643555, "global_step": 351901, "epoch": 2908} {"train_loss": -42.2892951965332, "global_step": 351902, "epoch": 2908} {"train_loss": -41.72922134399414, "global_step": 351903, "epoch": 2908} {"train_loss": -43.96601486206055, "global_step": 351904, "epoch": 2908} {"train_loss": -43.60980224609375, "global_step": 351905, "epoch": 2908} {"train_loss": -41.446556091308594, "global_step": 351906, "epoch": 2908} {"train_loss": -42.216400146484375, "global_step": 351907, "epoch": 2908} {"train_loss": -41.48223876953125, "global_step": 351908, "epoch": 2908} {"train_loss": -42.860260009765625, "global_step": 351909, "epoch": 2908} {"train_loss": -41.25529098510742, "global_step": 351910, "epoch": 2908} {"train_loss": -43.41169357299805, "global_step": 351911, "epoch": 2908} {"train_loss": -43.20127487182617, "global_step": 351912, "epoch": 2908} {"train_loss": -42.31111145019531, "global_step": 351913, "epoch": 2908} {"train_loss": -43.60340118408203, "global_step": 351914, "epoch": 2908} {"train_loss": -42.62187194824219, "global_step": 351915, "epoch": 2908} {"train_loss": -43.187862396240234, "global_step": 351916, "epoch": 2908} {"train_loss": -43.08631134033203, "global_step": 351917, "epoch": 2908} {"train_loss": -42.76945877075195, "global_step": 351918, "epoch": 2908} {"train_loss": -43.3787841796875, "global_step": 351919, "epoch": 2908} {"train_loss": -44.134029388427734, "global_step": 351920, "epoch": 2908} {"train_loss": -42.45870590209961, "global_step": 351921, "epoch": 2908} {"train_loss": -42.764041900634766, "global_step": 351922, "epoch": 2908} {"train_loss": -43.22396469116211, "global_step": 351923, "epoch": 2908} {"train_loss": -43.16621780395508, "global_step": 351924, "epoch": 2908} {"train_loss": -44.260807037353516, "global_step": 351925, "epoch": 2908} {"train_loss": -40.915931701660156, "global_step": 351926, "epoch": 2908} {"train_loss": -43.96199417114258, "global_step": 351927, "epoch": 2908} {"train_loss": -43.85236740112305, "global_step": 351928, "epoch": 2908} {"train_loss": -43.08618927001953, "global_step": 351929, "epoch": 2908} {"train_loss": -22.79437255859375, "global_step": 351930, "epoch": 2908} {"train_loss": -42.38959884643555, "global_step": 351931, "epoch": 2908} {"train_loss": -42.19565963745117, "global_step": 351932, "epoch": 2908} {"train_loss": -36.8430290222168, "global_step": 351933, "epoch": 2908} {"train_loss": -37.902191162109375, "global_step": 351934, "epoch": 2908} {"train_loss": -37.387386322021484, "global_step": 351935, "epoch": 2908} {"train_loss": -41.593074798583984, "global_step": 351936, "epoch": 2908} {"train_loss": -41.871700286865234, "global_step": 351937, "epoch": 2908} {"train_loss": -30.760568618774414, "global_step": 351938, "epoch": 2908} {"train_loss": -28.9151554107666, "global_step": 351939, "epoch": 2908} {"train_loss": -39.508705139160156, "global_step": 351940, "epoch": 2908} {"train_loss": -35.978057861328125, "global_step": 351941, "epoch": 2908} {"train_loss": -39.17635726928711, "global_step": 351942, "epoch": 2908} {"train_loss": -32.64690017700195, "global_step": 351943, "epoch": 2908} {"train_loss": -41.01016616821289, "global_step": 351944, "epoch": 2908} {"train_loss": -38.77350997924805, "global_step": 351945, "epoch": 2908} {"train_loss": -37.578399658203125, "global_step": 351946, "epoch": 2908} {"train_loss": -31.633380889892578, "global_step": 351947, "epoch": 2908} {"train_loss": -40.056312561035156, "global_step": 351948, "epoch": 2908} {"train_loss": -33.70249557495117, "global_step": 351949, "epoch": 2908} {"train_loss": -32.92539596557617, "global_step": 351950, "epoch": 2908} {"train_loss": -15.929234504699707, "global_step": 351951, "epoch": 2908} {"train_loss": -37.29499816894531, "global_step": 351952, "epoch": 2908} {"train_loss": -37.34656524658203, "global_step": 351953, "epoch": 2908} {"train_loss": -36.51079177856445, "global_step": 351954, "epoch": 2908} {"train_loss": -33.51691436767578, "global_step": 351955, "epoch": 2908} {"train_loss": -34.30158615112305, "global_step": 351956, "epoch": 2908} {"train_loss": -36.643001556396484, "global_step": 351957, "epoch": 2908} {"train_loss": -36.59492874145508, "global_step": 351958, "epoch": 2908} {"train_loss": -21.69551658630371, "global_step": 351959, "epoch": 2908} {"train_loss": -33.35824203491211, "global_step": 351960, "epoch": 2908} {"train_loss": -39.97870635986328, "global_step": 351961, "epoch": 2908} {"train_loss": -37.00990676879883, "global_step": 351962, "epoch": 2908} {"train_loss": -38.84307861328125, "global_step": 351963, "epoch": 2908} {"train_loss": -38.519771575927734, "global_step": 351964, "epoch": 2908} {"train_loss": -35.83808517456055, "global_step": 351965, "epoch": 2908} {"train_loss": -36.37496566772461, "global_step": 351966, "epoch": 2908} {"train_loss": -36.57973861694336, "global_step": 351967, "epoch": 2908} {"train_loss": -38.21024703979492, "global_step": 351968, "epoch": 2908} {"train_loss": -38.823856353759766, "global_step": 351969, "epoch": 2908} {"train_loss": -39.321746826171875, "global_step": 351970, "epoch": 2908} {"train_loss": -36.78334426879883, "global_step": 351971, "epoch": 2908} {"train_loss": -39.944942474365234, "global_step": 351972, "epoch": 2908} {"train_loss": -38.875282287597656, "global_step": 351973, "epoch": 2908} {"train_loss": -38.30305862426758, "global_step": 351974, "epoch": 2908} {"train_loss": -39.07865905761719, "global_step": 351975, "epoch": 2908} {"train_loss": -37.58224105834961, "global_step": 351976, "epoch": 2908} {"train_loss": -40.337181091308594, "global_step": 351977, "epoch": 2908} {"train_loss": -39.606300354003906, "global_step": 351978, "epoch": 2908} {"train_loss": -39.89116287231445, "global_step": 351979, "epoch": 2908} {"train_loss": -39.682464599609375, "global_step": 351980, "epoch": 2908} {"train_loss": -39.714717864990234, "global_step": 351981, "epoch": 2908} {"train_loss": -39.95713424682617, "global_step": 351982, "epoch": 2908} {"train_loss": -40.02620315551758, "global_step": 351983, "epoch": 2908} {"train_loss": -40.63823318481445, "global_step": 351984, "epoch": 2908} {"train_loss": -39.5141487121582, "global_step": 351985, "epoch": 2908} {"train_loss": -39.787715911865234, "global_step": 351986, "epoch": 2908} {"train_loss": -40.5689582824707, "global_step": 351987, "epoch": 2908} {"train_loss": -39.766699727901745, "global_step": 351988, "epoch": 2908, "val_loss": 2537199.75} {"train_loss": -40.21177291870117, "global_step": 351989, "epoch": 2909} {"train_loss": -40.60905838012695, "global_step": 351990, "epoch": 2909} {"train_loss": -39.049224853515625, "global_step": 351991, "epoch": 2909} {"train_loss": -41.119686126708984, "global_step": 351992, "epoch": 2909} {"train_loss": -40.873104095458984, "global_step": 351993, "epoch": 2909} {"train_loss": -41.1917839050293, "global_step": 351994, "epoch": 2909} {"train_loss": -40.94338607788086, "global_step": 351995, "epoch": 2909} {"train_loss": -40.21126937866211, "global_step": 351996, "epoch": 2909} {"train_loss": -40.55392074584961, "global_step": 351997, "epoch": 2909} {"train_loss": -40.8436393737793, "global_step": 351998, "epoch": 2909} {"train_loss": -40.9314079284668, "global_step": 351999, "epoch": 2909} {"train_loss": -41.18937301635742, "global_step": 352000, "epoch": 2909} {"train_loss": -41.04771041870117, "global_step": 352001, "epoch": 2909} {"train_loss": -41.302330017089844, "global_step": 352002, "epoch": 2909} {"train_loss": -41.22623825073242, "global_step": 352003, "epoch": 2909} {"train_loss": -41.06834030151367, "global_step": 352004, "epoch": 2909} {"train_loss": -41.56035232543945, "global_step": 352005, "epoch": 2909} {"train_loss": -41.3729248046875, "global_step": 352006, "epoch": 2909} {"train_loss": -41.755550384521484, "global_step": 352007, "epoch": 2909} {"train_loss": -41.58301544189453, "global_step": 352008, "epoch": 2909} {"train_loss": -41.257591247558594, "global_step": 352009, "epoch": 2909} {"train_loss": -41.78730010986328, "global_step": 352010, "epoch": 2909} {"train_loss": -42.07656478881836, "global_step": 352011, "epoch": 2909} {"train_loss": -41.57761764526367, "global_step": 352012, "epoch": 2909} {"train_loss": -41.85127639770508, "global_step": 352013, "epoch": 2909} {"train_loss": -41.23014450073242, "global_step": 352014, "epoch": 2909} {"train_loss": -42.432029724121094, "global_step": 352015, "epoch": 2909} {"train_loss": -42.53326416015625, "global_step": 352016, "epoch": 2909} {"train_loss": -41.49013137817383, "global_step": 352017, "epoch": 2909} {"train_loss": -41.87380599975586, "global_step": 352018, "epoch": 2909} {"train_loss": -41.66851806640625, "global_step": 352019, "epoch": 2909} {"train_loss": -42.65314865112305, "global_step": 352020, "epoch": 2909} {"train_loss": -41.7750358581543, "global_step": 352021, "epoch": 2909} {"train_loss": -42.12342071533203, "global_step": 352022, "epoch": 2909} {"train_loss": -41.919776916503906, "global_step": 352023, "epoch": 2909} {"train_loss": -42.7706184387207, "global_step": 352024, "epoch": 2909} {"train_loss": -41.70790481567383, "global_step": 352025, "epoch": 2909} {"train_loss": -42.600650787353516, "global_step": 352026, "epoch": 2909} {"train_loss": -41.62481689453125, "global_step": 352027, "epoch": 2909} {"train_loss": -42.5321159362793, "global_step": 352028, "epoch": 2909} {"train_loss": -41.6688346862793, "global_step": 352029, "epoch": 2909} {"train_loss": -42.26024627685547, "global_step": 352030, "epoch": 2909} {"train_loss": -42.763118743896484, "global_step": 352031, "epoch": 2909} {"train_loss": -42.55868148803711, "global_step": 352032, "epoch": 2909} {"train_loss": -42.10761260986328, "global_step": 352033, "epoch": 2909} {"train_loss": -42.169490814208984, "global_step": 352034, "epoch": 2909} {"train_loss": -41.59734344482422, "global_step": 352035, "epoch": 2909} {"train_loss": -42.944854736328125, "global_step": 352036, "epoch": 2909} {"train_loss": -42.84261703491211, "global_step": 352037, "epoch": 2909} {"train_loss": -42.30682373046875, "global_step": 352038, "epoch": 2909} {"train_loss": -42.035423278808594, "global_step": 352039, "epoch": 2909} {"train_loss": -41.86519241333008, "global_step": 352040, "epoch": 2909} {"train_loss": -42.484432220458984, "global_step": 352041, "epoch": 2909} {"train_loss": -41.92097091674805, "global_step": 352042, "epoch": 2909} {"train_loss": -42.7581672668457, "global_step": 352043, "epoch": 2909} {"train_loss": -41.66851043701172, "global_step": 352044, "epoch": 2909} {"train_loss": 3.7399704456329346, "global_step": 352045, "epoch": 2909} {"train_loss": -37.67552947998047, "global_step": 352046, "epoch": 2909} {"train_loss": -40.47064208984375, "global_step": 352047, "epoch": 2909} {"train_loss": -36.41436767578125, "global_step": 352048, "epoch": 2909} {"train_loss": -34.945980072021484, "global_step": 352049, "epoch": 2909} {"train_loss": -21.55946922302246, "global_step": 352050, "epoch": 2909} {"train_loss": 4.7512526512146, "global_step": 352051, "epoch": 2909} {"train_loss": -35.01043701171875, "global_step": 352052, "epoch": 2909} {"train_loss": -37.20222091674805, "global_step": 352053, "epoch": 2909} {"train_loss": -37.97843551635742, "global_step": 352054, "epoch": 2909} {"train_loss": -35.91618728637695, "global_step": 352055, "epoch": 2909} {"train_loss": -32.9628791809082, "global_step": 352056, "epoch": 2909} {"train_loss": -35.396724700927734, "global_step": 352057, "epoch": 2909} {"train_loss": -37.96963119506836, "global_step": 352058, "epoch": 2909} {"train_loss": -36.84846496582031, "global_step": 352059, "epoch": 2909} {"train_loss": -36.81705856323242, "global_step": 352060, "epoch": 2909} {"train_loss": -39.14019775390625, "global_step": 352061, "epoch": 2909} {"train_loss": -37.74306106567383, "global_step": 352062, "epoch": 2909} {"train_loss": -39.8048095703125, "global_step": 352063, "epoch": 2909} {"train_loss": -38.99702072143555, "global_step": 352064, "epoch": 2909} {"train_loss": -38.70319747924805, "global_step": 352065, "epoch": 2909} {"train_loss": -32.7607536315918, "global_step": 352066, "epoch": 2909} {"train_loss": -38.858673095703125, "global_step": 352067, "epoch": 2909} {"train_loss": -39.318267822265625, "global_step": 352068, "epoch": 2909} {"train_loss": -39.463619232177734, "global_step": 352069, "epoch": 2909} {"train_loss": -35.185951232910156, "global_step": 352070, "epoch": 2909} {"train_loss": -34.49929428100586, "global_step": 352071, "epoch": 2909} {"train_loss": -36.71970748901367, "global_step": 352072, "epoch": 2909} {"train_loss": -38.04694747924805, "global_step": 352073, "epoch": 2909} {"train_loss": -39.73187255859375, "global_step": 352074, "epoch": 2909} {"train_loss": -39.281551361083984, "global_step": 352075, "epoch": 2909} {"train_loss": -39.83866500854492, "global_step": 352076, "epoch": 2909} {"train_loss": -39.76725387573242, "global_step": 352077, "epoch": 2909} {"train_loss": -39.583003997802734, "global_step": 352078, "epoch": 2909} {"train_loss": -39.47526168823242, "global_step": 352079, "epoch": 2909} {"train_loss": -37.941226959228516, "global_step": 352080, "epoch": 2909} {"train_loss": -38.74923324584961, "global_step": 352081, "epoch": 2909} {"train_loss": -40.151329040527344, "global_step": 352082, "epoch": 2909} {"train_loss": -39.77579879760742, "global_step": 352083, "epoch": 2909} {"train_loss": -39.61317443847656, "global_step": 352084, "epoch": 2909} {"train_loss": -40.36690902709961, "global_step": 352085, "epoch": 2909} {"train_loss": -40.260799407958984, "global_step": 352086, "epoch": 2909} {"train_loss": -40.31986618041992, "global_step": 352087, "epoch": 2909} {"train_loss": -39.449684143066406, "global_step": 352088, "epoch": 2909} {"train_loss": -40.589759826660156, "global_step": 352089, "epoch": 2909} {"train_loss": -39.86714553833008, "global_step": 352090, "epoch": 2909} {"train_loss": -40.64780807495117, "global_step": 352091, "epoch": 2909} {"train_loss": -40.535118103027344, "global_step": 352092, "epoch": 2909} {"train_loss": -40.560272216796875, "global_step": 352093, "epoch": 2909} {"train_loss": -40.661895751953125, "global_step": 352094, "epoch": 2909} {"train_loss": -40.7311897277832, "global_step": 352095, "epoch": 2909} {"train_loss": -40.716529846191406, "global_step": 352096, "epoch": 2909} {"train_loss": -40.8924674987793, "global_step": 352097, "epoch": 2909} {"train_loss": -40.812400817871094, "global_step": 352098, "epoch": 2909} {"train_loss": -40.896202087402344, "global_step": 352099, "epoch": 2909} {"train_loss": -39.97015380859375, "global_step": 352100, "epoch": 2909} {"train_loss": -40.60773468017578, "global_step": 352101, "epoch": 2909} {"train_loss": -41.47026062011719, "global_step": 352102, "epoch": 2909} {"train_loss": -41.110748291015625, "global_step": 352103, "epoch": 2909} {"train_loss": -40.469818115234375, "global_step": 352104, "epoch": 2909} {"train_loss": -40.76041793823242, "global_step": 352105, "epoch": 2909} {"train_loss": -40.85432052612305, "global_step": 352106, "epoch": 2909} {"train_loss": -41.336727142333984, "global_step": 352107, "epoch": 2909} {"train_loss": -40.623165130615234, "global_step": 352108, "epoch": 2909} {"train_loss": -39.350454009268894, "global_step": 352109, "epoch": 2909, "val_loss": 2437543.75} {"train_loss": -41.54352569580078, "global_step": 352110, "epoch": 2910} {"train_loss": -41.23920822143555, "global_step": 352111, "epoch": 2910} {"train_loss": -41.92499542236328, "global_step": 352112, "epoch": 2910} {"train_loss": -41.72943878173828, "global_step": 352113, "epoch": 2910} {"train_loss": -41.487449645996094, "global_step": 352114, "epoch": 2910} {"train_loss": -41.644412994384766, "global_step": 352115, "epoch": 2910} {"train_loss": -42.0656852722168, "global_step": 352116, "epoch": 2910} {"train_loss": -41.60237121582031, "global_step": 352117, "epoch": 2910} {"train_loss": -42.00625228881836, "global_step": 352118, "epoch": 2910} {"train_loss": -40.96315383911133, "global_step": 352119, "epoch": 2910} {"train_loss": -42.08988571166992, "global_step": 352120, "epoch": 2910} {"train_loss": -41.613563537597656, "global_step": 352121, "epoch": 2910} {"train_loss": -42.4692497253418, "global_step": 352122, "epoch": 2910} {"train_loss": -42.0810661315918, "global_step": 352123, "epoch": 2910} {"train_loss": -42.01869583129883, "global_step": 352124, "epoch": 2910} {"train_loss": -42.04560852050781, "global_step": 352125, "epoch": 2910} {"train_loss": -42.09859848022461, "global_step": 352126, "epoch": 2910} {"train_loss": -41.994991302490234, "global_step": 352127, "epoch": 2910} {"train_loss": -41.36357498168945, "global_step": 352128, "epoch": 2910} {"train_loss": -42.61731719970703, "global_step": 352129, "epoch": 2910} {"train_loss": -41.36164855957031, "global_step": 352130, "epoch": 2910} {"train_loss": -42.8712043762207, "global_step": 352131, "epoch": 2910} {"train_loss": -42.355735778808594, "global_step": 352132, "epoch": 2910} {"train_loss": -42.41645431518555, "global_step": 352133, "epoch": 2910} {"train_loss": -42.45392990112305, "global_step": 352134, "epoch": 2910} {"train_loss": -42.80648422241211, "global_step": 352135, "epoch": 2910} {"train_loss": -42.075801849365234, "global_step": 352136, "epoch": 2910} {"train_loss": -42.83875274658203, "global_step": 352137, "epoch": 2910} {"train_loss": -41.869197845458984, "global_step": 352138, "epoch": 2910} {"train_loss": -42.45364761352539, "global_step": 352139, "epoch": 2910} {"train_loss": -42.01594924926758, "global_step": 352140, "epoch": 2910} {"train_loss": -42.8614501953125, "global_step": 352141, "epoch": 2910} {"train_loss": -42.768367767333984, "global_step": 352142, "epoch": 2910} {"train_loss": -43.196292877197266, "global_step": 352143, "epoch": 2910} {"train_loss": -42.68212890625, "global_step": 352144, "epoch": 2910} {"train_loss": -42.356929779052734, "global_step": 352145, "epoch": 2910} {"train_loss": -42.49901580810547, "global_step": 352146, "epoch": 2910} {"train_loss": -43.133399963378906, "global_step": 352147, "epoch": 2910} {"train_loss": -42.603633880615234, "global_step": 352148, "epoch": 2910} {"train_loss": -43.4275016784668, "global_step": 352149, "epoch": 2910} {"train_loss": -42.838050842285156, "global_step": 352150, "epoch": 2910} {"train_loss": -43.16150665283203, "global_step": 352151, "epoch": 2910} {"train_loss": -43.46863555908203, "global_step": 352152, "epoch": 2910} {"train_loss": -42.78778076171875, "global_step": 352153, "epoch": 2910} {"train_loss": -43.09116744995117, "global_step": 352154, "epoch": 2910} {"train_loss": -43.27002716064453, "global_step": 352155, "epoch": 2910} {"train_loss": -43.554439544677734, "global_step": 352156, "epoch": 2910} {"train_loss": -43.0205192565918, "global_step": 352157, "epoch": 2910} {"train_loss": -43.55770492553711, "global_step": 352158, "epoch": 2910} {"train_loss": -43.36492156982422, "global_step": 352159, "epoch": 2910} {"train_loss": -43.45573425292969, "global_step": 352160, "epoch": 2910} {"train_loss": -43.38855743408203, "global_step": 352161, "epoch": 2910} {"train_loss": -43.14036178588867, "global_step": 352162, "epoch": 2910} {"train_loss": -43.16064453125, "global_step": 352163, "epoch": 2910} {"train_loss": -43.16960525512695, "global_step": 352164, "epoch": 2910} {"train_loss": -43.10560989379883, "global_step": 352165, "epoch": 2910} {"train_loss": -43.27669906616211, "global_step": 352166, "epoch": 2910} {"train_loss": -43.86025619506836, "global_step": 352167, "epoch": 2910} {"train_loss": -43.74440383911133, "global_step": 352168, "epoch": 2910} {"train_loss": -43.63316345214844, "global_step": 352169, "epoch": 2910} {"train_loss": -43.77267074584961, "global_step": 352170, "epoch": 2910} {"train_loss": -44.1341667175293, "global_step": 352171, "epoch": 2910} {"train_loss": -43.83181381225586, "global_step": 352172, "epoch": 2910} {"train_loss": -43.80645751953125, "global_step": 352173, "epoch": 2910} {"train_loss": -42.79673385620117, "global_step": 352174, "epoch": 2910} {"train_loss": -42.020450592041016, "global_step": 352175, "epoch": 2910} {"train_loss": -43.80546951293945, "global_step": 352176, "epoch": 2910} {"train_loss": -44.003273010253906, "global_step": 352177, "epoch": 2910} {"train_loss": -43.42420959472656, "global_step": 352178, "epoch": 2910} {"train_loss": -44.089599609375, "global_step": 352179, "epoch": 2910} {"train_loss": -44.268795013427734, "global_step": 352180, "epoch": 2910} {"train_loss": -43.5964469909668, "global_step": 352181, "epoch": 2910} {"train_loss": -44.317378997802734, "global_step": 352182, "epoch": 2910} {"train_loss": -44.0472297668457, "global_step": 352183, "epoch": 2910} {"train_loss": -44.131988525390625, "global_step": 352184, "epoch": 2910} {"train_loss": -43.734649658203125, "global_step": 352185, "epoch": 2910} {"train_loss": -43.2019157409668, "global_step": 352186, "epoch": 2910} {"train_loss": -44.28609848022461, "global_step": 352187, "epoch": 2910} {"train_loss": -44.22304153442383, "global_step": 352188, "epoch": 2910} {"train_loss": -44.344581604003906, "global_step": 352189, "epoch": 2910} {"train_loss": -43.14693069458008, "global_step": 352190, "epoch": 2910} {"train_loss": -43.84282302856445, "global_step": 352191, "epoch": 2910} {"train_loss": -41.52574157714844, "global_step": 352192, "epoch": 2910} {"train_loss": -43.781124114990234, "global_step": 352193, "epoch": 2910} {"train_loss": -43.88465881347656, "global_step": 352194, "epoch": 2910} {"train_loss": -43.36848068237305, "global_step": 352195, "epoch": 2910} {"train_loss": -43.06603240966797, "global_step": 352196, "epoch": 2910} {"train_loss": -43.90669631958008, "global_step": 352197, "epoch": 2910} {"train_loss": -43.02398681640625, "global_step": 352198, "epoch": 2910} {"train_loss": -43.55727767944336, "global_step": 352199, "epoch": 2910} {"train_loss": -43.39879608154297, "global_step": 352200, "epoch": 2910} {"train_loss": -42.81718063354492, "global_step": 352201, "epoch": 2910} {"train_loss": -43.828487396240234, "global_step": 352202, "epoch": 2910} {"train_loss": -44.138118743896484, "global_step": 352203, "epoch": 2910} {"train_loss": -44.18978500366211, "global_step": 352204, "epoch": 2910} {"train_loss": -43.791587829589844, "global_step": 352205, "epoch": 2910} {"train_loss": -43.62866973876953, "global_step": 352206, "epoch": 2910} {"train_loss": -44.07622146606445, "global_step": 352207, "epoch": 2910} {"train_loss": -44.10218048095703, "global_step": 352208, "epoch": 2910} {"train_loss": -44.18708419799805, "global_step": 352209, "epoch": 2910} {"train_loss": -43.76286697387695, "global_step": 352210, "epoch": 2910} {"train_loss": -44.00344467163086, "global_step": 352211, "epoch": 2910} {"train_loss": -44.4827880859375, "global_step": 352212, "epoch": 2910} {"train_loss": -44.146453857421875, "global_step": 352213, "epoch": 2910} {"train_loss": -44.357051849365234, "global_step": 352214, "epoch": 2910} {"train_loss": -44.16492462158203, "global_step": 352215, "epoch": 2910} {"train_loss": -43.4240837097168, "global_step": 352216, "epoch": 2910} {"train_loss": -43.19245529174805, "global_step": 352217, "epoch": 2910} {"train_loss": -43.52116012573242, "global_step": 352218, "epoch": 2910} {"train_loss": -43.08969497680664, "global_step": 352219, "epoch": 2910} {"train_loss": -42.013160705566406, "global_step": 352220, "epoch": 2910} {"train_loss": -40.80598831176758, "global_step": 352221, "epoch": 2910} {"train_loss": -40.82301712036133, "global_step": 352222, "epoch": 2910} {"train_loss": -42.63703536987305, "global_step": 352223, "epoch": 2910} {"train_loss": -43.18404769897461, "global_step": 352224, "epoch": 2910} {"train_loss": -42.10451889038086, "global_step": 352225, "epoch": 2910} {"train_loss": -33.041046142578125, "global_step": 352226, "epoch": 2910} {"train_loss": -26.254364013671875, "global_step": 352227, "epoch": 2910} {"train_loss": -29.930524826049805, "global_step": 352228, "epoch": 2910} {"train_loss": -36.461463928222656, "global_step": 352229, "epoch": 2910} {"train_loss": -42.59718053202984, "global_step": 352230, "epoch": 2910, "val_loss": 2545804.5} {"train_loss": -38.860599517822266, "global_step": 352231, "epoch": 2911} {"train_loss": -37.24263000488281, "global_step": 352232, "epoch": 2911} {"train_loss": -39.25165557861328, "global_step": 352233, "epoch": 2911} {"train_loss": -37.05405807495117, "global_step": 352234, "epoch": 2911} {"train_loss": -39.94448471069336, "global_step": 352235, "epoch": 2911} {"train_loss": -39.35741424560547, "global_step": 352236, "epoch": 2911} {"train_loss": -40.845333099365234, "global_step": 352237, "epoch": 2911} {"train_loss": -39.75470733642578, "global_step": 352238, "epoch": 2911} {"train_loss": -38.77897262573242, "global_step": 352239, "epoch": 2911} {"train_loss": -41.807167053222656, "global_step": 352240, "epoch": 2911} {"train_loss": -37.85503005981445, "global_step": 352241, "epoch": 2911} {"train_loss": -42.147605895996094, "global_step": 352242, "epoch": 2911} {"train_loss": -40.73440170288086, "global_step": 352243, "epoch": 2911} {"train_loss": -42.28800964355469, "global_step": 352244, "epoch": 2911} {"train_loss": -40.93691635131836, "global_step": 352245, "epoch": 2911} {"train_loss": -41.37150955200195, "global_step": 352246, "epoch": 2911} {"train_loss": -41.7230339050293, "global_step": 352247, "epoch": 2911} {"train_loss": -40.95225143432617, "global_step": 352248, "epoch": 2911} {"train_loss": -42.26948165893555, "global_step": 352249, "epoch": 2911} {"train_loss": -41.667205810546875, "global_step": 352250, "epoch": 2911} {"train_loss": -42.89853286743164, "global_step": 352251, "epoch": 2911} {"train_loss": -42.335960388183594, "global_step": 352252, "epoch": 2911} {"train_loss": -42.53989028930664, "global_step": 352253, "epoch": 2911} {"train_loss": -42.182701110839844, "global_step": 352254, "epoch": 2911} {"train_loss": -42.528541564941406, "global_step": 352255, "epoch": 2911} {"train_loss": -43.25625228881836, "global_step": 352256, "epoch": 2911} {"train_loss": -42.41996383666992, "global_step": 352257, "epoch": 2911} {"train_loss": -42.482879638671875, "global_step": 352258, "epoch": 2911} {"train_loss": -42.876708984375, "global_step": 352259, "epoch": 2911} {"train_loss": -43.03347396850586, "global_step": 352260, "epoch": 2911} {"train_loss": -42.625850677490234, "global_step": 352261, "epoch": 2911} {"train_loss": -43.2264518737793, "global_step": 352262, "epoch": 2911} {"train_loss": -43.58103561401367, "global_step": 352263, "epoch": 2911} {"train_loss": -43.35598373413086, "global_step": 352264, "epoch": 2911} {"train_loss": -43.16066360473633, "global_step": 352265, "epoch": 2911} {"train_loss": -43.30708694458008, "global_step": 352266, "epoch": 2911} {"train_loss": -43.2415657043457, "global_step": 352267, "epoch": 2911} {"train_loss": -43.52292251586914, "global_step": 352268, "epoch": 2911} {"train_loss": -43.24235916137695, "global_step": 352269, "epoch": 2911} {"train_loss": -43.5825309753418, "global_step": 352270, "epoch": 2911} {"train_loss": -43.25513458251953, "global_step": 352271, "epoch": 2911} {"train_loss": -43.094482421875, "global_step": 352272, "epoch": 2911} {"train_loss": -43.76949691772461, "global_step": 352273, "epoch": 2911} {"train_loss": -43.587677001953125, "global_step": 352274, "epoch": 2911} {"train_loss": -43.23028564453125, "global_step": 352275, "epoch": 2911} {"train_loss": -43.64713668823242, "global_step": 352276, "epoch": 2911} {"train_loss": -43.44853210449219, "global_step": 352277, "epoch": 2911} {"train_loss": -43.88246536254883, "global_step": 352278, "epoch": 2911} {"train_loss": -43.68059539794922, "global_step": 352279, "epoch": 2911} {"train_loss": -42.979549407958984, "global_step": 352280, "epoch": 2911} {"train_loss": -44.00593948364258, "global_step": 352281, "epoch": 2911} {"train_loss": -44.1361198425293, "global_step": 352282, "epoch": 2911} {"train_loss": -43.66668701171875, "global_step": 352283, "epoch": 2911} {"train_loss": -43.85019302368164, "global_step": 352284, "epoch": 2911} {"train_loss": -44.29643630981445, "global_step": 352285, "epoch": 2911} {"train_loss": -43.90440368652344, "global_step": 352286, "epoch": 2911} {"train_loss": -43.7141227722168, "global_step": 352287, "epoch": 2911} {"train_loss": -44.37504959106445, "global_step": 352288, "epoch": 2911} {"train_loss": -44.199703216552734, "global_step": 352289, "epoch": 2911} {"train_loss": -44.03474426269531, "global_step": 352290, "epoch": 2911} {"train_loss": -43.867977142333984, "global_step": 352291, "epoch": 2911} {"train_loss": -43.741512298583984, "global_step": 352292, "epoch": 2911} {"train_loss": -44.18267822265625, "global_step": 352293, "epoch": 2911} {"train_loss": -44.1717529296875, "global_step": 352294, "epoch": 2911} {"train_loss": -43.568782806396484, "global_step": 352295, "epoch": 2911} {"train_loss": -43.23615264892578, "global_step": 352296, "epoch": 2911} {"train_loss": -44.186370849609375, "global_step": 352297, "epoch": 2911} {"train_loss": -44.72822952270508, "global_step": 352298, "epoch": 2911} {"train_loss": -44.55584716796875, "global_step": 352299, "epoch": 2911} {"train_loss": -44.4306526184082, "global_step": 352300, "epoch": 2911} {"train_loss": -44.09968948364258, "global_step": 352301, "epoch": 2911} {"train_loss": -44.53571319580078, "global_step": 352302, "epoch": 2911} {"train_loss": -44.693603515625, "global_step": 352303, "epoch": 2911} {"train_loss": -42.73598098754883, "global_step": 352304, "epoch": 2911} {"train_loss": -44.6761474609375, "global_step": 352305, "epoch": 2911} {"train_loss": -43.430660247802734, "global_step": 352306, "epoch": 2911} {"train_loss": -44.33335494995117, "global_step": 352307, "epoch": 2911} {"train_loss": -44.45429611206055, "global_step": 352308, "epoch": 2911} {"train_loss": -44.35067367553711, "global_step": 352309, "epoch": 2911} {"train_loss": -44.527687072753906, "global_step": 352310, "epoch": 2911} {"train_loss": -44.568809509277344, "global_step": 352311, "epoch": 2911} {"train_loss": -44.74659729003906, "global_step": 352312, "epoch": 2911} {"train_loss": -44.49898910522461, "global_step": 352313, "epoch": 2911} {"train_loss": -44.91401290893555, "global_step": 352314, "epoch": 2911} {"train_loss": -43.54951095581055, "global_step": 352315, "epoch": 2911} {"train_loss": -44.554840087890625, "global_step": 352316, "epoch": 2911} {"train_loss": -43.85819625854492, "global_step": 352317, "epoch": 2911} {"train_loss": -43.6439208984375, "global_step": 352318, "epoch": 2911} {"train_loss": -44.16389083862305, "global_step": 352319, "epoch": 2911} {"train_loss": -44.97847366333008, "global_step": 352320, "epoch": 2911} {"train_loss": -43.99155807495117, "global_step": 352321, "epoch": 2911} {"train_loss": -44.99468994140625, "global_step": 352322, "epoch": 2911} {"train_loss": -45.067718505859375, "global_step": 352323, "epoch": 2911} {"train_loss": -44.26306915283203, "global_step": 352324, "epoch": 2911} {"train_loss": -44.46795654296875, "global_step": 352325, "epoch": 2911} {"train_loss": -44.658912658691406, "global_step": 352326, "epoch": 2911} {"train_loss": -45.12150573730469, "global_step": 352327, "epoch": 2911} {"train_loss": -45.105709075927734, "global_step": 352328, "epoch": 2911} {"train_loss": -44.16127395629883, "global_step": 352329, "epoch": 2911} {"train_loss": -44.53347396850586, "global_step": 352330, "epoch": 2911} {"train_loss": -44.27477264404297, "global_step": 352331, "epoch": 2911} {"train_loss": -43.88029861450195, "global_step": 352332, "epoch": 2911} {"train_loss": -44.90214157104492, "global_step": 352333, "epoch": 2911} {"train_loss": -44.254432678222656, "global_step": 352334, "epoch": 2911} {"train_loss": -43.901885986328125, "global_step": 352335, "epoch": 2911} {"train_loss": -43.90041732788086, "global_step": 352336, "epoch": 2911} {"train_loss": -43.05491256713867, "global_step": 352337, "epoch": 2911} {"train_loss": -43.034175872802734, "global_step": 352338, "epoch": 2911} {"train_loss": -43.956966400146484, "global_step": 352339, "epoch": 2911} {"train_loss": -45.08284378051758, "global_step": 352340, "epoch": 2911} {"train_loss": -43.91182327270508, "global_step": 352341, "epoch": 2911} {"train_loss": -44.147071838378906, "global_step": 352342, "epoch": 2911} {"train_loss": -42.94809341430664, "global_step": 352343, "epoch": 2911} {"train_loss": -42.6718864440918, "global_step": 352344, "epoch": 2911} {"train_loss": -41.35390853881836, "global_step": 352345, "epoch": 2911} {"train_loss": -39.762306213378906, "global_step": 352346, "epoch": 2911} {"train_loss": -41.884281158447266, "global_step": 352347, "epoch": 2911} {"train_loss": -44.11848831176758, "global_step": 352348, "epoch": 2911} {"train_loss": -43.82668685913086, "global_step": 352349, "epoch": 2911} {"train_loss": -43.098812103271484, "global_step": 352350, "epoch": 2911} {"train_loss": -43.167692389369996, "global_step": 352351, "epoch": 2911, "val_loss": 2474820.75} {"train_loss": -44.390464782714844, "global_step": 352352, "epoch": 2912} {"train_loss": -42.43821334838867, "global_step": 352353, "epoch": 2912} {"train_loss": -42.64795684814453, "global_step": 352354, "epoch": 2912} {"train_loss": -43.28720474243164, "global_step": 352355, "epoch": 2912} {"train_loss": -43.80437088012695, "global_step": 352356, "epoch": 2912} {"train_loss": -43.862754821777344, "global_step": 352357, "epoch": 2912} {"train_loss": -43.49773025512695, "global_step": 352358, "epoch": 2912} {"train_loss": -43.214107513427734, "global_step": 352359, "epoch": 2912} {"train_loss": -43.83005142211914, "global_step": 352360, "epoch": 2912} {"train_loss": -43.519954681396484, "global_step": 352361, "epoch": 2912} {"train_loss": -43.68807601928711, "global_step": 352362, "epoch": 2912} {"train_loss": -43.547996520996094, "global_step": 352363, "epoch": 2912} {"train_loss": -43.49320602416992, "global_step": 352364, "epoch": 2912} {"train_loss": -44.0414924621582, "global_step": 352365, "epoch": 2912} {"train_loss": -44.83205795288086, "global_step": 352366, "epoch": 2912} {"train_loss": -44.1079216003418, "global_step": 352367, "epoch": 2912} {"train_loss": -43.86090087890625, "global_step": 352368, "epoch": 2912} {"train_loss": -44.50556182861328, "global_step": 352369, "epoch": 2912} {"train_loss": -44.46981430053711, "global_step": 352370, "epoch": 2912} {"train_loss": -44.27886962890625, "global_step": 352371, "epoch": 2912} {"train_loss": -43.31538772583008, "global_step": 352372, "epoch": 2912} {"train_loss": -44.89547348022461, "global_step": 352373, "epoch": 2912} {"train_loss": -43.55183792114258, "global_step": 352374, "epoch": 2912} {"train_loss": -44.38269805908203, "global_step": 352375, "epoch": 2912} {"train_loss": -44.097713470458984, "global_step": 352376, "epoch": 2912} {"train_loss": -44.659793853759766, "global_step": 352377, "epoch": 2912} {"train_loss": -43.385677337646484, "global_step": 352378, "epoch": 2912} {"train_loss": -44.43662643432617, "global_step": 352379, "epoch": 2912} {"train_loss": -44.592041015625, "global_step": 352380, "epoch": 2912} {"train_loss": -43.31473922729492, "global_step": 352381, "epoch": 2912} {"train_loss": -44.580440521240234, "global_step": 352382, "epoch": 2912} {"train_loss": -44.17337417602539, "global_step": 352383, "epoch": 2912} {"train_loss": -44.423805236816406, "global_step": 352384, "epoch": 2912} {"train_loss": -44.693519592285156, "global_step": 352385, "epoch": 2912} {"train_loss": -44.6616096496582, "global_step": 352386, "epoch": 2912} {"train_loss": -44.60166931152344, "global_step": 352387, "epoch": 2912} {"train_loss": -43.913665771484375, "global_step": 352388, "epoch": 2912} {"train_loss": -43.00433349609375, "global_step": 352389, "epoch": 2912} {"train_loss": -44.59189987182617, "global_step": 352390, "epoch": 2912} {"train_loss": -44.505916595458984, "global_step": 352391, "epoch": 2912} {"train_loss": -43.958473205566406, "global_step": 352392, "epoch": 2912} {"train_loss": -43.81805419921875, "global_step": 352393, "epoch": 2912} {"train_loss": -44.54108810424805, "global_step": 352394, "epoch": 2912} {"train_loss": -44.753231048583984, "global_step": 352395, "epoch": 2912} {"train_loss": -44.2347412109375, "global_step": 352396, "epoch": 2912} {"train_loss": -44.84440994262695, "global_step": 352397, "epoch": 2912} {"train_loss": -44.17594528198242, "global_step": 352398, "epoch": 2912} {"train_loss": -44.8696403503418, "global_step": 352399, "epoch": 2912} {"train_loss": -44.59823226928711, "global_step": 352400, "epoch": 2912} {"train_loss": -44.5752067565918, "global_step": 352401, "epoch": 2912} {"train_loss": -43.236289978027344, "global_step": 352402, "epoch": 2912} {"train_loss": -43.784095764160156, "global_step": 352403, "epoch": 2912} {"train_loss": -43.94355010986328, "global_step": 352404, "epoch": 2912} {"train_loss": -43.57182693481445, "global_step": 352405, "epoch": 2912} {"train_loss": -42.30110168457031, "global_step": 352406, "epoch": 2912} {"train_loss": -43.326961517333984, "global_step": 352407, "epoch": 2912} {"train_loss": -44.3847770690918, "global_step": 352408, "epoch": 2912} {"train_loss": -42.36990737915039, "global_step": 352409, "epoch": 2912} {"train_loss": -43.24909591674805, "global_step": 352410, "epoch": 2912} {"train_loss": -42.56520462036133, "global_step": 352411, "epoch": 2912} {"train_loss": -42.927825927734375, "global_step": 352412, "epoch": 2912} {"train_loss": -42.65264892578125, "global_step": 352413, "epoch": 2912} {"train_loss": -42.1225700378418, "global_step": 352414, "epoch": 2912} {"train_loss": -42.84144973754883, "global_step": 352415, "epoch": 2912} {"train_loss": -43.12635040283203, "global_step": 352416, "epoch": 2912} {"train_loss": -43.27919387817383, "global_step": 352417, "epoch": 2912} {"train_loss": -41.74445724487305, "global_step": 352418, "epoch": 2912} {"train_loss": -43.20730209350586, "global_step": 352419, "epoch": 2912} {"train_loss": -42.725555419921875, "global_step": 352420, "epoch": 2912} {"train_loss": -42.32160186767578, "global_step": 352421, "epoch": 2912} {"train_loss": -41.48247146606445, "global_step": 352422, "epoch": 2912} {"train_loss": -42.8150520324707, "global_step": 352423, "epoch": 2912} {"train_loss": -42.457210540771484, "global_step": 352424, "epoch": 2912} {"train_loss": -42.90186309814453, "global_step": 352425, "epoch": 2912} {"train_loss": -43.32192611694336, "global_step": 352426, "epoch": 2912} {"train_loss": -43.706092834472656, "global_step": 352427, "epoch": 2912} {"train_loss": -43.61557388305664, "global_step": 352428, "epoch": 2912} {"train_loss": -44.0140495300293, "global_step": 352429, "epoch": 2912} {"train_loss": -43.38568878173828, "global_step": 352430, "epoch": 2912} {"train_loss": -43.487022399902344, "global_step": 352431, "epoch": 2912} {"train_loss": -42.59827423095703, "global_step": 352432, "epoch": 2912} {"train_loss": -44.0505485534668, "global_step": 352433, "epoch": 2912} {"train_loss": -43.96733093261719, "global_step": 352434, "epoch": 2912} {"train_loss": -43.22712326049805, "global_step": 352435, "epoch": 2912} {"train_loss": -43.035526275634766, "global_step": 352436, "epoch": 2912} {"train_loss": -44.051673889160156, "global_step": 352437, "epoch": 2912} {"train_loss": -42.646392822265625, "global_step": 352438, "epoch": 2912} {"train_loss": -43.02762985229492, "global_step": 352439, "epoch": 2912} {"train_loss": -43.69254684448242, "global_step": 352440, "epoch": 2912} {"train_loss": -42.83696365356445, "global_step": 352441, "epoch": 2912} {"train_loss": -42.06237030029297, "global_step": 352442, "epoch": 2912} {"train_loss": -43.60917282104492, "global_step": 352443, "epoch": 2912} {"train_loss": -43.05788803100586, "global_step": 352444, "epoch": 2912} {"train_loss": -40.2988166809082, "global_step": 352445, "epoch": 2912} {"train_loss": -39.57401657104492, "global_step": 352446, "epoch": 2912} {"train_loss": -42.80052185058594, "global_step": 352447, "epoch": 2912} {"train_loss": -42.24848175048828, "global_step": 352448, "epoch": 2912} {"train_loss": -40.26367950439453, "global_step": 352449, "epoch": 2912} {"train_loss": -43.16158676147461, "global_step": 352450, "epoch": 2912} {"train_loss": -40.59164047241211, "global_step": 352451, "epoch": 2912} {"train_loss": -39.57148361206055, "global_step": 352452, "epoch": 2912} {"train_loss": -42.888065338134766, "global_step": 352453, "epoch": 2912} {"train_loss": -42.15807342529297, "global_step": 352454, "epoch": 2912} {"train_loss": -42.23165512084961, "global_step": 352455, "epoch": 2912} {"train_loss": -43.39863204956055, "global_step": 352456, "epoch": 2912} {"train_loss": -41.7874870300293, "global_step": 352457, "epoch": 2912} {"train_loss": -42.63155746459961, "global_step": 352458, "epoch": 2912} {"train_loss": -42.563987731933594, "global_step": 352459, "epoch": 2912} {"train_loss": -41.8076286315918, "global_step": 352460, "epoch": 2912} {"train_loss": -43.06726837158203, "global_step": 352461, "epoch": 2912} {"train_loss": -43.2440299987793, "global_step": 352462, "epoch": 2912} {"train_loss": -42.865116119384766, "global_step": 352463, "epoch": 2912} {"train_loss": -43.13192367553711, "global_step": 352464, "epoch": 2912} {"train_loss": -43.3004035949707, "global_step": 352465, "epoch": 2912} {"train_loss": -43.65262222290039, "global_step": 352466, "epoch": 2912} {"train_loss": -43.613216400146484, "global_step": 352467, "epoch": 2912} {"train_loss": -44.17717361450195, "global_step": 352468, "epoch": 2912} {"train_loss": -43.216461181640625, "global_step": 352469, "epoch": 2912} {"train_loss": -42.888160705566406, "global_step": 352470, "epoch": 2912} {"train_loss": -43.80081558227539, "global_step": 352471, "epoch": 2912} {"train_loss": -43.35303109539442, "global_step": 352472, "epoch": 2912, "val_loss": 2546783.0} {"train_loss": -43.784400939941406, "global_step": 352473, "epoch": 2913} {"train_loss": -43.543819427490234, "global_step": 352474, "epoch": 2913} {"train_loss": -44.21974563598633, "global_step": 352475, "epoch": 2913} {"train_loss": -43.89280319213867, "global_step": 352476, "epoch": 2913} {"train_loss": -44.40938186645508, "global_step": 352477, "epoch": 2913} {"train_loss": -44.57251739501953, "global_step": 352478, "epoch": 2913} {"train_loss": -44.376708984375, "global_step": 352479, "epoch": 2913} {"train_loss": -44.175392150878906, "global_step": 352480, "epoch": 2913} {"train_loss": -44.252220153808594, "global_step": 352481, "epoch": 2913} {"train_loss": -44.189971923828125, "global_step": 352482, "epoch": 2913} {"train_loss": -43.703216552734375, "global_step": 352483, "epoch": 2913} {"train_loss": -44.729671478271484, "global_step": 352484, "epoch": 2913} {"train_loss": -44.348785400390625, "global_step": 352485, "epoch": 2913} {"train_loss": -43.83755111694336, "global_step": 352486, "epoch": 2913} {"train_loss": -44.17610168457031, "global_step": 352487, "epoch": 2913} {"train_loss": -44.47125244140625, "global_step": 352488, "epoch": 2913} {"train_loss": -44.499637603759766, "global_step": 352489, "epoch": 2913} {"train_loss": -44.16813278198242, "global_step": 352490, "epoch": 2913} {"train_loss": -44.79436111450195, "global_step": 352491, "epoch": 2913} {"train_loss": -44.8924674987793, "global_step": 352492, "epoch": 2913} {"train_loss": -44.555477142333984, "global_step": 352493, "epoch": 2913} {"train_loss": -44.39320755004883, "global_step": 352494, "epoch": 2913} {"train_loss": -45.10300827026367, "global_step": 352495, "epoch": 2913} {"train_loss": -45.114906311035156, "global_step": 352496, "epoch": 2913} {"train_loss": -44.14229202270508, "global_step": 352497, "epoch": 2913} {"train_loss": -44.78965377807617, "global_step": 352498, "epoch": 2913} {"train_loss": -44.90818405151367, "global_step": 352499, "epoch": 2913} {"train_loss": -44.176876068115234, "global_step": 352500, "epoch": 2913} {"train_loss": -43.435455322265625, "global_step": 352501, "epoch": 2913} {"train_loss": -43.35347366333008, "global_step": 352502, "epoch": 2913} {"train_loss": -43.751220703125, "global_step": 352503, "epoch": 2913} {"train_loss": -44.418819427490234, "global_step": 352504, "epoch": 2913} {"train_loss": -44.163631439208984, "global_step": 352505, "epoch": 2913} {"train_loss": -44.07093048095703, "global_step": 352506, "epoch": 2913} {"train_loss": -44.439754486083984, "global_step": 352507, "epoch": 2913} {"train_loss": -45.3101921081543, "global_step": 352508, "epoch": 2913} {"train_loss": -44.030303955078125, "global_step": 352509, "epoch": 2913} {"train_loss": -44.65983963012695, "global_step": 352510, "epoch": 2913} {"train_loss": -45.169464111328125, "global_step": 352511, "epoch": 2913} {"train_loss": -44.755470275878906, "global_step": 352512, "epoch": 2913} {"train_loss": -43.813899993896484, "global_step": 352513, "epoch": 2913} {"train_loss": -44.325801849365234, "global_step": 352514, "epoch": 2913} {"train_loss": -44.290321350097656, "global_step": 352515, "epoch": 2913} {"train_loss": -44.475955963134766, "global_step": 352516, "epoch": 2913} {"train_loss": -44.52812957763672, "global_step": 352517, "epoch": 2913} {"train_loss": -44.7773551940918, "global_step": 352518, "epoch": 2913} {"train_loss": -43.86054229736328, "global_step": 352519, "epoch": 2913} {"train_loss": -44.785213470458984, "global_step": 352520, "epoch": 2913} {"train_loss": -44.61418914794922, "global_step": 352521, "epoch": 2913} {"train_loss": -44.647850036621094, "global_step": 352522, "epoch": 2913} {"train_loss": -44.75624465942383, "global_step": 352523, "epoch": 2913} {"train_loss": -44.70111846923828, "global_step": 352524, "epoch": 2913} {"train_loss": -44.74408721923828, "global_step": 352525, "epoch": 2913} {"train_loss": -43.90034103393555, "global_step": 352526, "epoch": 2913} {"train_loss": -42.937007904052734, "global_step": 352527, "epoch": 2913} {"train_loss": -44.05220413208008, "global_step": 352528, "epoch": 2913} {"train_loss": -43.945621490478516, "global_step": 352529, "epoch": 2913} {"train_loss": -44.73643493652344, "global_step": 352530, "epoch": 2913} {"train_loss": -44.47322463989258, "global_step": 352531, "epoch": 2913} {"train_loss": -44.53580856323242, "global_step": 352532, "epoch": 2913} {"train_loss": -45.06732940673828, "global_step": 352533, "epoch": 2913} {"train_loss": -44.06449508666992, "global_step": 352534, "epoch": 2913} {"train_loss": -44.05536651611328, "global_step": 352535, "epoch": 2913} {"train_loss": -44.51311111450195, "global_step": 352536, "epoch": 2913} {"train_loss": -44.230464935302734, "global_step": 352537, "epoch": 2913} {"train_loss": -43.59467315673828, "global_step": 352538, "epoch": 2913} {"train_loss": -42.83727264404297, "global_step": 352539, "epoch": 2913} {"train_loss": -43.54596710205078, "global_step": 352540, "epoch": 2913} {"train_loss": -42.82638931274414, "global_step": 352541, "epoch": 2913} {"train_loss": -41.48523712158203, "global_step": 352542, "epoch": 2913} {"train_loss": -43.14716720581055, "global_step": 352543, "epoch": 2913} {"train_loss": -44.10647964477539, "global_step": 352544, "epoch": 2913} {"train_loss": -43.696773529052734, "global_step": 352545, "epoch": 2913} {"train_loss": -42.36421203613281, "global_step": 352546, "epoch": 2913} {"train_loss": -42.02279281616211, "global_step": 352547, "epoch": 2913} {"train_loss": -41.086891174316406, "global_step": 352548, "epoch": 2913} {"train_loss": -39.68178939819336, "global_step": 352549, "epoch": 2913} {"train_loss": -40.1192626953125, "global_step": 352550, "epoch": 2913} {"train_loss": -42.856319427490234, "global_step": 352551, "epoch": 2913} {"train_loss": -41.39768600463867, "global_step": 352552, "epoch": 2913} {"train_loss": -39.24557113647461, "global_step": 352553, "epoch": 2913} {"train_loss": -42.07261276245117, "global_step": 352554, "epoch": 2913} {"train_loss": -43.160579681396484, "global_step": 352555, "epoch": 2913} {"train_loss": -42.32050323486328, "global_step": 352556, "epoch": 2913} {"train_loss": -43.258705139160156, "global_step": 352557, "epoch": 2913} {"train_loss": -42.9775390625, "global_step": 352558, "epoch": 2913} {"train_loss": -42.68889236450195, "global_step": 352559, "epoch": 2913} {"train_loss": -41.532989501953125, "global_step": 352560, "epoch": 2913} {"train_loss": -43.37950897216797, "global_step": 352561, "epoch": 2913} {"train_loss": -41.41792297363281, "global_step": 352562, "epoch": 2913} {"train_loss": -42.746761322021484, "global_step": 352563, "epoch": 2913} {"train_loss": -42.63728713989258, "global_step": 352564, "epoch": 2913} {"train_loss": -42.876094818115234, "global_step": 352565, "epoch": 2913} {"train_loss": -42.339149475097656, "global_step": 352566, "epoch": 2913} {"train_loss": -42.577964782714844, "global_step": 352567, "epoch": 2913} {"train_loss": -42.98488998413086, "global_step": 352568, "epoch": 2913} {"train_loss": -43.27049255371094, "global_step": 352569, "epoch": 2913} {"train_loss": -42.23531723022461, "global_step": 352570, "epoch": 2913} {"train_loss": -43.60091781616211, "global_step": 352571, "epoch": 2913} {"train_loss": -43.70768356323242, "global_step": 352572, "epoch": 2913} {"train_loss": -43.33148193359375, "global_step": 352573, "epoch": 2913} {"train_loss": -43.348114013671875, "global_step": 352574, "epoch": 2913} {"train_loss": -43.69212341308594, "global_step": 352575, "epoch": 2913} {"train_loss": -43.750186920166016, "global_step": 352576, "epoch": 2913} {"train_loss": -43.64054489135742, "global_step": 352577, "epoch": 2913} {"train_loss": -44.0388298034668, "global_step": 352578, "epoch": 2913} {"train_loss": -43.148597717285156, "global_step": 352579, "epoch": 2913} {"train_loss": -44.23348617553711, "global_step": 352580, "epoch": 2913} {"train_loss": -43.333213806152344, "global_step": 352581, "epoch": 2913} {"train_loss": -42.41970443725586, "global_step": 352582, "epoch": 2913} {"train_loss": -44.27418518066406, "global_step": 352583, "epoch": 2913} {"train_loss": -43.1908073425293, "global_step": 352584, "epoch": 2913} {"train_loss": -43.360713958740234, "global_step": 352585, "epoch": 2913} {"train_loss": -44.28589630126953, "global_step": 352586, "epoch": 2913} {"train_loss": -43.546138763427734, "global_step": 352587, "epoch": 2913} {"train_loss": -43.79006576538086, "global_step": 352588, "epoch": 2913} {"train_loss": -44.34504699707031, "global_step": 352589, "epoch": 2913} {"train_loss": -44.28464889526367, "global_step": 352590, "epoch": 2913} {"train_loss": -43.298095703125, "global_step": 352591, "epoch": 2913} {"train_loss": -44.57770538330078, "global_step": 352592, "epoch": 2913} {"train_loss": -43.68577525241316, "global_step": 352593, "epoch": 2913, "val_loss": 2538699.0} {"train_loss": -44.18696212768555, "global_step": 352594, "epoch": 2914} {"train_loss": -44.1778564453125, "global_step": 352595, "epoch": 2914} {"train_loss": -44.279396057128906, "global_step": 352596, "epoch": 2914} {"train_loss": -43.9866828918457, "global_step": 352597, "epoch": 2914} {"train_loss": -44.970027923583984, "global_step": 352598, "epoch": 2914} {"train_loss": -43.830204010009766, "global_step": 352599, "epoch": 2914} {"train_loss": -43.94340515136719, "global_step": 352600, "epoch": 2914} {"train_loss": -44.31707763671875, "global_step": 352601, "epoch": 2914} {"train_loss": -44.67828369140625, "global_step": 352602, "epoch": 2914} {"train_loss": -43.936458587646484, "global_step": 352603, "epoch": 2914} {"train_loss": -44.39870834350586, "global_step": 352604, "epoch": 2914} {"train_loss": -44.35280990600586, "global_step": 352605, "epoch": 2914} {"train_loss": -44.61149215698242, "global_step": 352606, "epoch": 2914} {"train_loss": -44.9091911315918, "global_step": 352607, "epoch": 2914} {"train_loss": -44.30503463745117, "global_step": 352608, "epoch": 2914} {"train_loss": -44.9166145324707, "global_step": 352609, "epoch": 2914} {"train_loss": -44.277442932128906, "global_step": 352610, "epoch": 2914} {"train_loss": -44.64262771606445, "global_step": 352611, "epoch": 2914} {"train_loss": -44.79609298706055, "global_step": 352612, "epoch": 2914} {"train_loss": -44.35843276977539, "global_step": 352613, "epoch": 2914} {"train_loss": -44.75825881958008, "global_step": 352614, "epoch": 2914} {"train_loss": -44.94675064086914, "global_step": 352615, "epoch": 2914} {"train_loss": -44.01936721801758, "global_step": 352616, "epoch": 2914} {"train_loss": -44.4595832824707, "global_step": 352617, "epoch": 2914} {"train_loss": -44.6971321105957, "global_step": 352618, "epoch": 2914} {"train_loss": -44.674072265625, "global_step": 352619, "epoch": 2914} {"train_loss": -44.55733108520508, "global_step": 352620, "epoch": 2914} {"train_loss": -44.85400390625, "global_step": 352621, "epoch": 2914} {"train_loss": -45.26231002807617, "global_step": 352622, "epoch": 2914} {"train_loss": -45.19132614135742, "global_step": 352623, "epoch": 2914} {"train_loss": -45.41931915283203, "global_step": 352624, "epoch": 2914} {"train_loss": -44.940975189208984, "global_step": 352625, "epoch": 2914} {"train_loss": -45.38203430175781, "global_step": 352626, "epoch": 2914} {"train_loss": -45.32939529418945, "global_step": 352627, "epoch": 2914} {"train_loss": -45.17033386230469, "global_step": 352628, "epoch": 2914} {"train_loss": -45.550148010253906, "global_step": 352629, "epoch": 2914} {"train_loss": -45.221717834472656, "global_step": 352630, "epoch": 2914} {"train_loss": -45.244476318359375, "global_step": 352631, "epoch": 2914} {"train_loss": -45.316009521484375, "global_step": 352632, "epoch": 2914} {"train_loss": -45.036922454833984, "global_step": 352633, "epoch": 2914} {"train_loss": -45.27353286743164, "global_step": 352634, "epoch": 2914} {"train_loss": -44.53070831298828, "global_step": 352635, "epoch": 2914} {"train_loss": -44.257259368896484, "global_step": 352636, "epoch": 2914} {"train_loss": -43.89472579956055, "global_step": 352637, "epoch": 2914} {"train_loss": -44.22612380981445, "global_step": 352638, "epoch": 2914} {"train_loss": -45.41266632080078, "global_step": 352639, "epoch": 2914} {"train_loss": -44.575477600097656, "global_step": 352640, "epoch": 2914} {"train_loss": -43.1319465637207, "global_step": 352641, "epoch": 2914} {"train_loss": -39.73645782470703, "global_step": 352642, "epoch": 2914} {"train_loss": -36.495487213134766, "global_step": 352643, "epoch": 2914} {"train_loss": -38.170745849609375, "global_step": 352644, "epoch": 2914} {"train_loss": -42.28919219970703, "global_step": 352645, "epoch": 2914} {"train_loss": -43.752315521240234, "global_step": 352646, "epoch": 2914} {"train_loss": -41.92000198364258, "global_step": 352647, "epoch": 2914} {"train_loss": -41.98041915893555, "global_step": 352648, "epoch": 2914} {"train_loss": -43.33680725097656, "global_step": 352649, "epoch": 2914} {"train_loss": -43.21379470825195, "global_step": 352650, "epoch": 2914} {"train_loss": -42.04241943359375, "global_step": 352651, "epoch": 2914} {"train_loss": -42.599334716796875, "global_step": 352652, "epoch": 2914} {"train_loss": -44.463680267333984, "global_step": 352653, "epoch": 2914} {"train_loss": -42.65814208984375, "global_step": 352654, "epoch": 2914} {"train_loss": -40.94572067260742, "global_step": 352655, "epoch": 2914} {"train_loss": -43.952693939208984, "global_step": 352656, "epoch": 2914} {"train_loss": -42.4376106262207, "global_step": 352657, "epoch": 2914} {"train_loss": -42.12736511230469, "global_step": 352658, "epoch": 2914} {"train_loss": -42.91794967651367, "global_step": 352659, "epoch": 2914} {"train_loss": -43.72032165527344, "global_step": 352660, "epoch": 2914} {"train_loss": -43.09816360473633, "global_step": 352661, "epoch": 2914} {"train_loss": -43.74666213989258, "global_step": 352662, "epoch": 2914} {"train_loss": -43.585906982421875, "global_step": 352663, "epoch": 2914} {"train_loss": -43.74310302734375, "global_step": 352664, "epoch": 2914} {"train_loss": -43.44075393676758, "global_step": 352665, "epoch": 2914} {"train_loss": -43.238216400146484, "global_step": 352666, "epoch": 2914} {"train_loss": -43.7536735534668, "global_step": 352667, "epoch": 2914} {"train_loss": -43.942806243896484, "global_step": 352668, "epoch": 2914} {"train_loss": -44.28111267089844, "global_step": 352669, "epoch": 2914} {"train_loss": -41.595340728759766, "global_step": 352670, "epoch": 2914} {"train_loss": -44.24842071533203, "global_step": 352671, "epoch": 2914} {"train_loss": -44.063018798828125, "global_step": 352672, "epoch": 2914} {"train_loss": -43.47576141357422, "global_step": 352673, "epoch": 2914} {"train_loss": -44.24855041503906, "global_step": 352674, "epoch": 2914} {"train_loss": -43.34579086303711, "global_step": 352675, "epoch": 2914} {"train_loss": -44.464202880859375, "global_step": 352676, "epoch": 2914} {"train_loss": -43.59077453613281, "global_step": 352677, "epoch": 2914} {"train_loss": -44.20624923706055, "global_step": 352678, "epoch": 2914} {"train_loss": -44.262657165527344, "global_step": 352679, "epoch": 2914} {"train_loss": -44.40196228027344, "global_step": 352680, "epoch": 2914} {"train_loss": -43.907691955566406, "global_step": 352681, "epoch": 2914} {"train_loss": -43.0667724609375, "global_step": 352682, "epoch": 2914} {"train_loss": -44.74209213256836, "global_step": 352683, "epoch": 2914} {"train_loss": -43.285701751708984, "global_step": 352684, "epoch": 2914} {"train_loss": -44.06703567504883, "global_step": 352685, "epoch": 2914} {"train_loss": -43.121124267578125, "global_step": 352686, "epoch": 2914} {"train_loss": -43.68623733520508, "global_step": 352687, "epoch": 2914} {"train_loss": -43.22896957397461, "global_step": 352688, "epoch": 2914} {"train_loss": -44.15452194213867, "global_step": 352689, "epoch": 2914} {"train_loss": -43.47538375854492, "global_step": 352690, "epoch": 2914} {"train_loss": -43.835960388183594, "global_step": 352691, "epoch": 2914} {"train_loss": -44.78267288208008, "global_step": 352692, "epoch": 2914} {"train_loss": -43.94122314453125, "global_step": 352693, "epoch": 2914} {"train_loss": -44.19722366333008, "global_step": 352694, "epoch": 2914} {"train_loss": -44.60209274291992, "global_step": 352695, "epoch": 2914} {"train_loss": -36.85854721069336, "global_step": 352696, "epoch": 2914} {"train_loss": -44.05720520019531, "global_step": 352697, "epoch": 2914} {"train_loss": -43.65182113647461, "global_step": 352698, "epoch": 2914} {"train_loss": -44.75994110107422, "global_step": 352699, "epoch": 2914} {"train_loss": -43.2037467956543, "global_step": 352700, "epoch": 2914} {"train_loss": -43.90621566772461, "global_step": 352701, "epoch": 2914} {"train_loss": -43.931617736816406, "global_step": 352702, "epoch": 2914} {"train_loss": -41.23772048950195, "global_step": 352703, "epoch": 2914} {"train_loss": -43.072052001953125, "global_step": 352704, "epoch": 2914} {"train_loss": -43.415950775146484, "global_step": 352705, "epoch": 2914} {"train_loss": -43.4943962097168, "global_step": 352706, "epoch": 2914} {"train_loss": -42.87675857543945, "global_step": 352707, "epoch": 2914} {"train_loss": -44.00959014892578, "global_step": 352708, "epoch": 2914} {"train_loss": -42.7745361328125, "global_step": 352709, "epoch": 2914} {"train_loss": -43.881019592285156, "global_step": 352710, "epoch": 2914} {"train_loss": -41.51734161376953, "global_step": 352711, "epoch": 2914} {"train_loss": -42.72037124633789, "global_step": 352712, "epoch": 2914} {"train_loss": -43.65273666381836, "global_step": 352713, "epoch": 2914} {"train_loss": -43.59423006861663, "global_step": 352714, "epoch": 2914, "val_loss": 2493569.75} {"train_loss": -43.6105842590332, "global_step": 352715, "epoch": 2915} {"train_loss": -44.34273910522461, "global_step": 352716, "epoch": 2915} {"train_loss": -38.21206283569336, "global_step": 352717, "epoch": 2915} {"train_loss": -42.98774337768555, "global_step": 352718, "epoch": 2915} {"train_loss": -44.399688720703125, "global_step": 352719, "epoch": 2915} {"train_loss": -43.75470733642578, "global_step": 352720, "epoch": 2915} {"train_loss": -43.4283447265625, "global_step": 352721, "epoch": 2915} {"train_loss": -42.193233489990234, "global_step": 352722, "epoch": 2915} {"train_loss": -36.897579193115234, "global_step": 352723, "epoch": 2915} {"train_loss": -43.702980041503906, "global_step": 352724, "epoch": 2915} {"train_loss": -43.274410247802734, "global_step": 352725, "epoch": 2915} {"train_loss": -43.04807662963867, "global_step": 352726, "epoch": 2915} {"train_loss": -43.74414825439453, "global_step": 352727, "epoch": 2915} {"train_loss": -42.498809814453125, "global_step": 352728, "epoch": 2915} {"train_loss": -43.1929817199707, "global_step": 352729, "epoch": 2915} {"train_loss": -44.319091796875, "global_step": 352730, "epoch": 2915} {"train_loss": -42.90165328979492, "global_step": 352731, "epoch": 2915} {"train_loss": -41.867759704589844, "global_step": 352732, "epoch": 2915} {"train_loss": -43.09988021850586, "global_step": 352733, "epoch": 2915} {"train_loss": -43.610233306884766, "global_step": 352734, "epoch": 2915} {"train_loss": -43.91120529174805, "global_step": 352735, "epoch": 2915} {"train_loss": -43.0993766784668, "global_step": 352736, "epoch": 2915} {"train_loss": -43.44907760620117, "global_step": 352737, "epoch": 2915} {"train_loss": -43.7058219909668, "global_step": 352738, "epoch": 2915} {"train_loss": -43.97704315185547, "global_step": 352739, "epoch": 2915} {"train_loss": -44.05440902709961, "global_step": 352740, "epoch": 2915} {"train_loss": -43.13780975341797, "global_step": 352741, "epoch": 2915} {"train_loss": -44.398563385009766, "global_step": 352742, "epoch": 2915} {"train_loss": -44.1840705871582, "global_step": 352743, "epoch": 2915} {"train_loss": -44.06816482543945, "global_step": 352744, "epoch": 2915} {"train_loss": -44.03203201293945, "global_step": 352745, "epoch": 2915} {"train_loss": -43.4766731262207, "global_step": 352746, "epoch": 2915} {"train_loss": -42.44840621948242, "global_step": 352747, "epoch": 2915} {"train_loss": -44.2762565612793, "global_step": 352748, "epoch": 2915} {"train_loss": -42.896270751953125, "global_step": 352749, "epoch": 2915} {"train_loss": -43.799556732177734, "global_step": 352750, "epoch": 2915} {"train_loss": -44.539283752441406, "global_step": 352751, "epoch": 2915} {"train_loss": -43.724605560302734, "global_step": 352752, "epoch": 2915} {"train_loss": -44.217708587646484, "global_step": 352753, "epoch": 2915} {"train_loss": -43.882137298583984, "global_step": 352754, "epoch": 2915} {"train_loss": -43.550933837890625, "global_step": 352755, "epoch": 2915} {"train_loss": -42.96038055419922, "global_step": 352756, "epoch": 2915} {"train_loss": -44.74355697631836, "global_step": 352757, "epoch": 2915} {"train_loss": -43.50965881347656, "global_step": 352758, "epoch": 2915} {"train_loss": -44.055885314941406, "global_step": 352759, "epoch": 2915} {"train_loss": -44.47823715209961, "global_step": 352760, "epoch": 2915} {"train_loss": -44.59551239013672, "global_step": 352761, "epoch": 2915} {"train_loss": -42.63615036010742, "global_step": 352762, "epoch": 2915} {"train_loss": -44.73014450073242, "global_step": 352763, "epoch": 2915} {"train_loss": -44.081722259521484, "global_step": 352764, "epoch": 2915} {"train_loss": -43.930206298828125, "global_step": 352765, "epoch": 2915} {"train_loss": -43.97279357910156, "global_step": 352766, "epoch": 2915} {"train_loss": -43.77122497558594, "global_step": 352767, "epoch": 2915} {"train_loss": -43.86635971069336, "global_step": 352768, "epoch": 2915} {"train_loss": -43.781494140625, "global_step": 352769, "epoch": 2915} {"train_loss": -43.283119201660156, "global_step": 352770, "epoch": 2915} {"train_loss": -43.4679069519043, "global_step": 352771, "epoch": 2915} {"train_loss": -44.20921325683594, "global_step": 352772, "epoch": 2915} {"train_loss": -43.821224212646484, "global_step": 352773, "epoch": 2915} {"train_loss": -44.01332473754883, "global_step": 352774, "epoch": 2915} {"train_loss": -44.05495071411133, "global_step": 352775, "epoch": 2915} {"train_loss": -42.63817596435547, "global_step": 352776, "epoch": 2915} {"train_loss": -44.148616790771484, "global_step": 352777, "epoch": 2915} {"train_loss": -43.715538024902344, "global_step": 352778, "epoch": 2915} {"train_loss": -43.983985900878906, "global_step": 352779, "epoch": 2915} {"train_loss": -44.186134338378906, "global_step": 352780, "epoch": 2915} {"train_loss": -42.92405319213867, "global_step": 352781, "epoch": 2915} {"train_loss": -43.70559310913086, "global_step": 352782, "epoch": 2915} {"train_loss": -44.12227249145508, "global_step": 352783, "epoch": 2915} {"train_loss": -43.6836051940918, "global_step": 352784, "epoch": 2915} {"train_loss": -44.05294418334961, "global_step": 352785, "epoch": 2915} {"train_loss": -43.86277389526367, "global_step": 352786, "epoch": 2915} {"train_loss": -43.5457649230957, "global_step": 352787, "epoch": 2915} {"train_loss": -44.12815475463867, "global_step": 352788, "epoch": 2915} {"train_loss": -43.48833465576172, "global_step": 352789, "epoch": 2915} {"train_loss": -44.37917709350586, "global_step": 352790, "epoch": 2915} {"train_loss": -43.900691986083984, "global_step": 352791, "epoch": 2915} {"train_loss": -44.0719108581543, "global_step": 352792, "epoch": 2915} {"train_loss": -42.55414962768555, "global_step": 352793, "epoch": 2915} {"train_loss": -43.83523178100586, "global_step": 352794, "epoch": 2915} {"train_loss": -42.06695556640625, "global_step": 352795, "epoch": 2915} {"train_loss": -43.758270263671875, "global_step": 352796, "epoch": 2915} {"train_loss": -44.41274642944336, "global_step": 352797, "epoch": 2915} {"train_loss": -43.05583953857422, "global_step": 352798, "epoch": 2915} {"train_loss": -43.29193878173828, "global_step": 352799, "epoch": 2915} {"train_loss": -44.02676010131836, "global_step": 352800, "epoch": 2915} {"train_loss": -43.1754150390625, "global_step": 352801, "epoch": 2915} {"train_loss": -42.659542083740234, "global_step": 352802, "epoch": 2915} {"train_loss": -42.03225326538086, "global_step": 352803, "epoch": 2915} {"train_loss": -42.820980072021484, "global_step": 352804, "epoch": 2915} {"train_loss": -44.557525634765625, "global_step": 352805, "epoch": 2915} {"train_loss": -44.46444320678711, "global_step": 352806, "epoch": 2915} {"train_loss": -43.56972122192383, "global_step": 352807, "epoch": 2915} {"train_loss": -43.533878326416016, "global_step": 352808, "epoch": 2915} {"train_loss": -43.338539123535156, "global_step": 352809, "epoch": 2915} {"train_loss": -43.78902816772461, "global_step": 352810, "epoch": 2915} {"train_loss": -41.95852279663086, "global_step": 352811, "epoch": 2915} {"train_loss": -40.89620590209961, "global_step": 352812, "epoch": 2915} {"train_loss": -41.68609619140625, "global_step": 352813, "epoch": 2915} {"train_loss": -41.972896575927734, "global_step": 352814, "epoch": 2915} {"train_loss": -44.47156524658203, "global_step": 352815, "epoch": 2915} {"train_loss": -44.058448791503906, "global_step": 352816, "epoch": 2915} {"train_loss": -42.5883903503418, "global_step": 352817, "epoch": 2915} {"train_loss": -44.75251007080078, "global_step": 352818, "epoch": 2915} {"train_loss": -43.10773849487305, "global_step": 352819, "epoch": 2915} {"train_loss": -43.34530258178711, "global_step": 352820, "epoch": 2915} {"train_loss": -44.770118713378906, "global_step": 352821, "epoch": 2915} {"train_loss": -42.764801025390625, "global_step": 352822, "epoch": 2915} {"train_loss": -42.37608337402344, "global_step": 352823, "epoch": 2915} {"train_loss": -44.02849197387695, "global_step": 352824, "epoch": 2915} {"train_loss": -44.397621154785156, "global_step": 352825, "epoch": 2915} {"train_loss": -43.57353210449219, "global_step": 352826, "epoch": 2915} {"train_loss": -44.48218536376953, "global_step": 352827, "epoch": 2915} {"train_loss": -43.47564697265625, "global_step": 352828, "epoch": 2915} {"train_loss": -42.31916046142578, "global_step": 352829, "epoch": 2915} {"train_loss": -44.01784133911133, "global_step": 352830, "epoch": 2915} {"train_loss": -43.730506896972656, "global_step": 352831, "epoch": 2915} {"train_loss": -42.77406311035156, "global_step": 352832, "epoch": 2915} {"train_loss": -44.7678337097168, "global_step": 352833, "epoch": 2915} {"train_loss": -44.21289825439453, "global_step": 352834, "epoch": 2915} {"train_loss": -43.48704642303719, "global_step": 352835, "epoch": 2915, "val_loss": 2443705.75} {"train_loss": -44.327816009521484, "global_step": 352836, "epoch": 2916} {"train_loss": -44.538822174072266, "global_step": 352837, "epoch": 2916} {"train_loss": -44.592342376708984, "global_step": 352838, "epoch": 2916} {"train_loss": -44.57379913330078, "global_step": 352839, "epoch": 2916} {"train_loss": -44.99757766723633, "global_step": 352840, "epoch": 2916} {"train_loss": -44.904781341552734, "global_step": 352841, "epoch": 2916} {"train_loss": -44.1247444152832, "global_step": 352842, "epoch": 2916} {"train_loss": -44.2185173034668, "global_step": 352843, "epoch": 2916} {"train_loss": -43.76215744018555, "global_step": 352844, "epoch": 2916} {"train_loss": -44.76035690307617, "global_step": 352845, "epoch": 2916} {"train_loss": -44.7733268737793, "global_step": 352846, "epoch": 2916} {"train_loss": -44.55338668823242, "global_step": 352847, "epoch": 2916} {"train_loss": -44.858917236328125, "global_step": 352848, "epoch": 2916} {"train_loss": -45.082298278808594, "global_step": 352849, "epoch": 2916} {"train_loss": -44.977535247802734, "global_step": 352850, "epoch": 2916} {"train_loss": -44.75580596923828, "global_step": 352851, "epoch": 2916} {"train_loss": -44.80535888671875, "global_step": 352852, "epoch": 2916} {"train_loss": -45.01616287231445, "global_step": 352853, "epoch": 2916} {"train_loss": -44.288246154785156, "global_step": 352854, "epoch": 2916} {"train_loss": -44.51738739013672, "global_step": 352855, "epoch": 2916} {"train_loss": -44.895111083984375, "global_step": 352856, "epoch": 2916} {"train_loss": -44.80332565307617, "global_step": 352857, "epoch": 2916} {"train_loss": -44.807220458984375, "global_step": 352858, "epoch": 2916} {"train_loss": -44.92017364501953, "global_step": 352859, "epoch": 2916} {"train_loss": -44.092857360839844, "global_step": 352860, "epoch": 2916} {"train_loss": -44.379337310791016, "global_step": 352861, "epoch": 2916} {"train_loss": -44.91858673095703, "global_step": 352862, "epoch": 2916} {"train_loss": -43.84408187866211, "global_step": 352863, "epoch": 2916} {"train_loss": -44.928348541259766, "global_step": 352864, "epoch": 2916} {"train_loss": -45.01715850830078, "global_step": 352865, "epoch": 2916} {"train_loss": -44.78921890258789, "global_step": 352866, "epoch": 2916} {"train_loss": -45.0251579284668, "global_step": 352867, "epoch": 2916} {"train_loss": -45.01694869995117, "global_step": 352868, "epoch": 2916} {"train_loss": -44.40640640258789, "global_step": 352869, "epoch": 2916} {"train_loss": -44.75429916381836, "global_step": 352870, "epoch": 2916} {"train_loss": -44.99795150756836, "global_step": 352871, "epoch": 2916} {"train_loss": -44.74612045288086, "global_step": 352872, "epoch": 2916} {"train_loss": -44.4224853515625, "global_step": 352873, "epoch": 2916} {"train_loss": -43.8947639465332, "global_step": 352874, "epoch": 2916} {"train_loss": -43.271766662597656, "global_step": 352875, "epoch": 2916} {"train_loss": -42.99668502807617, "global_step": 352876, "epoch": 2916} {"train_loss": -43.627140045166016, "global_step": 352877, "epoch": 2916} {"train_loss": -44.47930145263672, "global_step": 352878, "epoch": 2916} {"train_loss": -44.555267333984375, "global_step": 352879, "epoch": 2916} {"train_loss": -44.367897033691406, "global_step": 352880, "epoch": 2916} {"train_loss": -45.57638931274414, "global_step": 352881, "epoch": 2916} {"train_loss": -44.24823760986328, "global_step": 352882, "epoch": 2916} {"train_loss": -44.290679931640625, "global_step": 352883, "epoch": 2916} {"train_loss": -43.511165618896484, "global_step": 352884, "epoch": 2916} {"train_loss": -42.8062858581543, "global_step": 352885, "epoch": 2916} {"train_loss": -41.492000579833984, "global_step": 352886, "epoch": 2916} {"train_loss": -40.03900909423828, "global_step": 352887, "epoch": 2916} {"train_loss": -43.47830581665039, "global_step": 352888, "epoch": 2916} {"train_loss": -41.95597457885742, "global_step": 352889, "epoch": 2916} {"train_loss": -38.92006301879883, "global_step": 352890, "epoch": 2916} {"train_loss": -42.0208854675293, "global_step": 352891, "epoch": 2916} {"train_loss": -38.21940231323242, "global_step": 352892, "epoch": 2916} {"train_loss": -35.553932189941406, "global_step": 352893, "epoch": 2916} {"train_loss": -35.50576400756836, "global_step": 352894, "epoch": 2916} {"train_loss": -35.993404388427734, "global_step": 352895, "epoch": 2916} {"train_loss": -38.307552337646484, "global_step": 352896, "epoch": 2916} {"train_loss": -38.615966796875, "global_step": 352897, "epoch": 2916} {"train_loss": -36.263187408447266, "global_step": 352898, "epoch": 2916} {"train_loss": -39.192481994628906, "global_step": 352899, "epoch": 2916} {"train_loss": -37.47983932495117, "global_step": 352900, "epoch": 2916} {"train_loss": -38.30860137939453, "global_step": 352901, "epoch": 2916} {"train_loss": -39.412147521972656, "global_step": 352902, "epoch": 2916} {"train_loss": -36.868953704833984, "global_step": 352903, "epoch": 2916} {"train_loss": -37.30461502075195, "global_step": 352904, "epoch": 2916} {"train_loss": -41.561946868896484, "global_step": 352905, "epoch": 2916} {"train_loss": -40.067413330078125, "global_step": 352906, "epoch": 2916} {"train_loss": -39.38465118408203, "global_step": 352907, "epoch": 2916} {"train_loss": -41.03831100463867, "global_step": 352908, "epoch": 2916} {"train_loss": -40.98875427246094, "global_step": 352909, "epoch": 2916} {"train_loss": -42.38097381591797, "global_step": 352910, "epoch": 2916} {"train_loss": -41.522823333740234, "global_step": 352911, "epoch": 2916} {"train_loss": -41.17384338378906, "global_step": 352912, "epoch": 2916} {"train_loss": -41.15274429321289, "global_step": 352913, "epoch": 2916} {"train_loss": -40.59246826171875, "global_step": 352914, "epoch": 2916} {"train_loss": -43.155006408691406, "global_step": 352915, "epoch": 2916} {"train_loss": -41.621429443359375, "global_step": 352916, "epoch": 2916} {"train_loss": -42.675048828125, "global_step": 352917, "epoch": 2916} {"train_loss": -41.83121871948242, "global_step": 352918, "epoch": 2916} {"train_loss": -42.46488571166992, "global_step": 352919, "epoch": 2916} {"train_loss": -42.791378021240234, "global_step": 352920, "epoch": 2916} {"train_loss": -42.27278518676758, "global_step": 352921, "epoch": 2916} {"train_loss": -42.922027587890625, "global_step": 352922, "epoch": 2916} {"train_loss": -42.18851852416992, "global_step": 352923, "epoch": 2916} {"train_loss": -43.103939056396484, "global_step": 352924, "epoch": 2916} {"train_loss": -43.003150939941406, "global_step": 352925, "epoch": 2916} {"train_loss": -43.20842742919922, "global_step": 352926, "epoch": 2916} {"train_loss": -42.797855377197266, "global_step": 352927, "epoch": 2916} {"train_loss": -43.435543060302734, "global_step": 352928, "epoch": 2916} {"train_loss": -43.46379470825195, "global_step": 352929, "epoch": 2916} {"train_loss": -43.43593215942383, "global_step": 352930, "epoch": 2916} {"train_loss": -43.7684326171875, "global_step": 352931, "epoch": 2916} {"train_loss": -43.83781433105469, "global_step": 352932, "epoch": 2916} {"train_loss": -43.865413665771484, "global_step": 352933, "epoch": 2916} {"train_loss": -43.742088317871094, "global_step": 352934, "epoch": 2916} {"train_loss": -43.645259857177734, "global_step": 352935, "epoch": 2916} {"train_loss": -42.6842041015625, "global_step": 352936, "epoch": 2916} {"train_loss": -44.22629928588867, "global_step": 352937, "epoch": 2916} {"train_loss": -42.99057388305664, "global_step": 352938, "epoch": 2916} {"train_loss": -44.32072448730469, "global_step": 352939, "epoch": 2916} {"train_loss": -42.86320877075195, "global_step": 352940, "epoch": 2916} {"train_loss": -44.21643829345703, "global_step": 352941, "epoch": 2916} {"train_loss": -43.675662994384766, "global_step": 352942, "epoch": 2916} {"train_loss": -43.64999008178711, "global_step": 352943, "epoch": 2916} {"train_loss": -43.995540618896484, "global_step": 352944, "epoch": 2916} {"train_loss": -44.36281967163086, "global_step": 352945, "epoch": 2916} {"train_loss": -44.527462005615234, "global_step": 352946, "epoch": 2916} {"train_loss": -44.433895111083984, "global_step": 352947, "epoch": 2916} {"train_loss": -44.182735443115234, "global_step": 352948, "epoch": 2916} {"train_loss": -44.4277229309082, "global_step": 352949, "epoch": 2916} {"train_loss": -44.18081283569336, "global_step": 352950, "epoch": 2916} {"train_loss": -44.4240608215332, "global_step": 352951, "epoch": 2916} {"train_loss": -44.34214401245117, "global_step": 352952, "epoch": 2916} {"train_loss": -44.80540084838867, "global_step": 352953, "epoch": 2916} {"train_loss": -44.605220794677734, "global_step": 352954, "epoch": 2916} {"train_loss": -44.616943359375, "global_step": 352955, "epoch": 2916} {"train_loss": -42.96836266635863, "global_step": 352956, "epoch": 2916, "val_loss": 2484439.0} {"train_loss": -44.514068603515625, "global_step": 352957, "epoch": 2917} {"train_loss": -45.148494720458984, "global_step": 352958, "epoch": 2917} {"train_loss": -44.914276123046875, "global_step": 352959, "epoch": 2917} {"train_loss": -44.7297248840332, "global_step": 352960, "epoch": 2917} {"train_loss": -45.19242858886719, "global_step": 352961, "epoch": 2917} {"train_loss": -45.162635803222656, "global_step": 352962, "epoch": 2917} {"train_loss": -45.217620849609375, "global_step": 352963, "epoch": 2917} {"train_loss": -44.70288848876953, "global_step": 352964, "epoch": 2917} {"train_loss": -45.3049430847168, "global_step": 352965, "epoch": 2917} {"train_loss": -44.61438751220703, "global_step": 352966, "epoch": 2917} {"train_loss": -45.00669479370117, "global_step": 352967, "epoch": 2917} {"train_loss": -45.16019821166992, "global_step": 352968, "epoch": 2917} {"train_loss": -44.56510543823242, "global_step": 352969, "epoch": 2917} {"train_loss": -45.56415557861328, "global_step": 352970, "epoch": 2917} {"train_loss": -44.881717681884766, "global_step": 352971, "epoch": 2917} {"train_loss": -44.55036926269531, "global_step": 352972, "epoch": 2917} {"train_loss": -45.05840301513672, "global_step": 352973, "epoch": 2917} {"train_loss": -44.98722457885742, "global_step": 352974, "epoch": 2917} {"train_loss": -44.86921310424805, "global_step": 352975, "epoch": 2917} {"train_loss": -45.06622314453125, "global_step": 352976, "epoch": 2917} {"train_loss": -45.40186309814453, "global_step": 352977, "epoch": 2917} {"train_loss": -45.491065979003906, "global_step": 352978, "epoch": 2917} {"train_loss": -45.45064926147461, "global_step": 352979, "epoch": 2917} {"train_loss": -45.24436569213867, "global_step": 352980, "epoch": 2917} {"train_loss": -44.77617263793945, "global_step": 352981, "epoch": 2917} {"train_loss": -45.40592575073242, "global_step": 352982, "epoch": 2917} {"train_loss": -45.6197509765625, "global_step": 352983, "epoch": 2917} {"train_loss": -44.89463424682617, "global_step": 352984, "epoch": 2917} {"train_loss": -45.498939514160156, "global_step": 352985, "epoch": 2917} {"train_loss": -45.29302215576172, "global_step": 352986, "epoch": 2917} {"train_loss": -44.89739990234375, "global_step": 352987, "epoch": 2917} {"train_loss": -44.79938888549805, "global_step": 352988, "epoch": 2917} {"train_loss": -45.09334945678711, "global_step": 352989, "epoch": 2917} {"train_loss": -45.64662170410156, "global_step": 352990, "epoch": 2917} {"train_loss": -45.000240325927734, "global_step": 352991, "epoch": 2917} {"train_loss": -45.1919059753418, "global_step": 352992, "epoch": 2917} {"train_loss": -45.227359771728516, "global_step": 352993, "epoch": 2917} {"train_loss": -45.10012435913086, "global_step": 352994, "epoch": 2917} {"train_loss": -45.6193962097168, "global_step": 352995, "epoch": 2917} {"train_loss": -44.93758010864258, "global_step": 352996, "epoch": 2917} {"train_loss": -45.2632942199707, "global_step": 352997, "epoch": 2917} {"train_loss": -44.725093841552734, "global_step": 352998, "epoch": 2917} {"train_loss": -44.75787353515625, "global_step": 352999, "epoch": 2917} {"train_loss": -44.33249282836914, "global_step": 353000, "epoch": 2917} {"train_loss": -43.602333068847656, "global_step": 353001, "epoch": 2917} {"train_loss": -44.30509948730469, "global_step": 353002, "epoch": 2917} {"train_loss": -44.304359436035156, "global_step": 353003, "epoch": 2917} {"train_loss": -41.767921447753906, "global_step": 353004, "epoch": 2917} {"train_loss": -39.67422866821289, "global_step": 353005, "epoch": 2917} {"train_loss": -43.45497512817383, "global_step": 353006, "epoch": 2917} {"train_loss": -41.76992416381836, "global_step": 353007, "epoch": 2917} {"train_loss": -39.64866256713867, "global_step": 353008, "epoch": 2917} {"train_loss": -43.3092155456543, "global_step": 353009, "epoch": 2917} {"train_loss": -34.09615707397461, "global_step": 353010, "epoch": 2917} {"train_loss": -42.662330627441406, "global_step": 353011, "epoch": 2917} {"train_loss": -28.574438095092773, "global_step": 353012, "epoch": 2917} {"train_loss": -38.09385299682617, "global_step": 353013, "epoch": 2917} {"train_loss": -35.19967269897461, "global_step": 353014, "epoch": 2917} {"train_loss": -39.94866943359375, "global_step": 353015, "epoch": 2917} {"train_loss": -33.90507888793945, "global_step": 353016, "epoch": 2917} {"train_loss": -39.945228576660156, "global_step": 353017, "epoch": 2917} {"train_loss": -32.4763069152832, "global_step": 353018, "epoch": 2917} {"train_loss": -35.676204681396484, "global_step": 353019, "epoch": 2917} {"train_loss": -35.86005783081055, "global_step": 353020, "epoch": 2917} {"train_loss": -35.34270095825195, "global_step": 353021, "epoch": 2917} {"train_loss": -34.609310150146484, "global_step": 353022, "epoch": 2917} {"train_loss": -37.849239349365234, "global_step": 353023, "epoch": 2917} {"train_loss": -38.0266227722168, "global_step": 353024, "epoch": 2917} {"train_loss": -37.72931671142578, "global_step": 353025, "epoch": 2917} {"train_loss": -38.587989807128906, "global_step": 353026, "epoch": 2917} {"train_loss": -38.22370529174805, "global_step": 353027, "epoch": 2917} {"train_loss": -38.91914367675781, "global_step": 353028, "epoch": 2917} {"train_loss": -38.50667953491211, "global_step": 353029, "epoch": 2917} {"train_loss": -38.4271240234375, "global_step": 353030, "epoch": 2917} {"train_loss": -39.5091667175293, "global_step": 353031, "epoch": 2917} {"train_loss": -40.56685256958008, "global_step": 353032, "epoch": 2917} {"train_loss": -39.84387969970703, "global_step": 353033, "epoch": 2917} {"train_loss": -41.552005767822266, "global_step": 353034, "epoch": 2917} {"train_loss": -40.60323715209961, "global_step": 353035, "epoch": 2917} {"train_loss": -41.80564498901367, "global_step": 353036, "epoch": 2917} {"train_loss": -41.324703216552734, "global_step": 353037, "epoch": 2917} {"train_loss": -41.92539978027344, "global_step": 353038, "epoch": 2917} {"train_loss": -41.90120315551758, "global_step": 353039, "epoch": 2917} {"train_loss": -43.01340866088867, "global_step": 353040, "epoch": 2917} {"train_loss": -42.1427001953125, "global_step": 353041, "epoch": 2917} {"train_loss": -42.91024398803711, "global_step": 353042, "epoch": 2917} {"train_loss": -42.997833251953125, "global_step": 353043, "epoch": 2917} {"train_loss": -43.27549743652344, "global_step": 353044, "epoch": 2917} {"train_loss": -43.124332427978516, "global_step": 353045, "epoch": 2917} {"train_loss": -43.4387321472168, "global_step": 353046, "epoch": 2917} {"train_loss": -42.95563888549805, "global_step": 353047, "epoch": 2917} {"train_loss": -43.2034912109375, "global_step": 353048, "epoch": 2917} {"train_loss": -43.93220901489258, "global_step": 353049, "epoch": 2917} {"train_loss": -43.782928466796875, "global_step": 353050, "epoch": 2917} {"train_loss": -44.008609771728516, "global_step": 353051, "epoch": 2917} {"train_loss": -43.20404815673828, "global_step": 353052, "epoch": 2917} {"train_loss": -43.64641189575195, "global_step": 353053, "epoch": 2917} {"train_loss": -43.684505462646484, "global_step": 353054, "epoch": 2917} {"train_loss": -43.73957443237305, "global_step": 353055, "epoch": 2917} {"train_loss": -43.84906768798828, "global_step": 353056, "epoch": 2917} {"train_loss": -43.88536834716797, "global_step": 353057, "epoch": 2917} {"train_loss": -43.5930290222168, "global_step": 353058, "epoch": 2917} {"train_loss": -44.28425216674805, "global_step": 353059, "epoch": 2917} {"train_loss": -44.03452682495117, "global_step": 353060, "epoch": 2917} {"train_loss": -44.554603576660156, "global_step": 353061, "epoch": 2917} {"train_loss": -43.651973724365234, "global_step": 353062, "epoch": 2917} {"train_loss": -43.809383392333984, "global_step": 353063, "epoch": 2917} {"train_loss": -44.65237045288086, "global_step": 353064, "epoch": 2917} {"train_loss": -44.1083869934082, "global_step": 353065, "epoch": 2917} {"train_loss": -44.04560089111328, "global_step": 353066, "epoch": 2917} {"train_loss": -44.55887222290039, "global_step": 353067, "epoch": 2917} {"train_loss": -44.40633010864258, "global_step": 353068, "epoch": 2917} {"train_loss": -43.875545501708984, "global_step": 353069, "epoch": 2917} {"train_loss": -44.64521026611328, "global_step": 353070, "epoch": 2917} {"train_loss": -44.63930130004883, "global_step": 353071, "epoch": 2917} {"train_loss": -44.72468948364258, "global_step": 353072, "epoch": 2917} {"train_loss": -44.3397102355957, "global_step": 353073, "epoch": 2917} {"train_loss": -44.514896392822266, "global_step": 353074, "epoch": 2917} {"train_loss": -44.89862060546875, "global_step": 353075, "epoch": 2917} {"train_loss": -44.615718841552734, "global_step": 353076, "epoch": 2917} {"train_loss": -42.75761973168239, "global_step": 353077, "epoch": 2917, "val_loss": 2494383.25} {"train_loss": -45.05984115600586, "global_step": 353078, "epoch": 2918} {"train_loss": -44.86471176147461, "global_step": 353079, "epoch": 2918} {"train_loss": -44.75751876831055, "global_step": 353080, "epoch": 2918} {"train_loss": -44.8192138671875, "global_step": 353081, "epoch": 2918} {"train_loss": -45.12968444824219, "global_step": 353082, "epoch": 2918} {"train_loss": -45.2027473449707, "global_step": 353083, "epoch": 2918} {"train_loss": -45.23052978515625, "global_step": 353084, "epoch": 2918} {"train_loss": -45.572471618652344, "global_step": 353085, "epoch": 2918} {"train_loss": -44.78998947143555, "global_step": 353086, "epoch": 2918} {"train_loss": -44.956180572509766, "global_step": 353087, "epoch": 2918} {"train_loss": -45.275604248046875, "global_step": 353088, "epoch": 2918} {"train_loss": -45.0852165222168, "global_step": 353089, "epoch": 2918} {"train_loss": -44.582740783691406, "global_step": 353090, "epoch": 2918} {"train_loss": -45.097328186035156, "global_step": 353091, "epoch": 2918} {"train_loss": -44.47257614135742, "global_step": 353092, "epoch": 2918} {"train_loss": -45.312931060791016, "global_step": 353093, "epoch": 2918} {"train_loss": -45.038143157958984, "global_step": 353094, "epoch": 2918} {"train_loss": -45.379722595214844, "global_step": 353095, "epoch": 2918} {"train_loss": -45.08112716674805, "global_step": 353096, "epoch": 2918} {"train_loss": -45.122920989990234, "global_step": 353097, "epoch": 2918} {"train_loss": -45.330352783203125, "global_step": 353098, "epoch": 2918} {"train_loss": -44.65193557739258, "global_step": 353099, "epoch": 2918} {"train_loss": -45.04741287231445, "global_step": 353100, "epoch": 2918} {"train_loss": -45.176490783691406, "global_step": 353101, "epoch": 2918} {"train_loss": -45.3491325378418, "global_step": 353102, "epoch": 2918} {"train_loss": -45.64179611206055, "global_step": 353103, "epoch": 2918} {"train_loss": -45.1307487487793, "global_step": 353104, "epoch": 2918} {"train_loss": -45.4552116394043, "global_step": 353105, "epoch": 2918} {"train_loss": -45.267913818359375, "global_step": 353106, "epoch": 2918} {"train_loss": -44.99713134765625, "global_step": 353107, "epoch": 2918} {"train_loss": -45.39334487915039, "global_step": 353108, "epoch": 2918} {"train_loss": -44.64924621582031, "global_step": 353109, "epoch": 2918} {"train_loss": -44.56321334838867, "global_step": 353110, "epoch": 2918} {"train_loss": -44.35661315917969, "global_step": 353111, "epoch": 2918} {"train_loss": -43.54480743408203, "global_step": 353112, "epoch": 2918} {"train_loss": -44.619869232177734, "global_step": 353113, "epoch": 2918} {"train_loss": -44.444801330566406, "global_step": 353114, "epoch": 2918} {"train_loss": -42.18183517456055, "global_step": 353115, "epoch": 2918} {"train_loss": -40.97758102416992, "global_step": 353116, "epoch": 2918} {"train_loss": -42.966285705566406, "global_step": 353117, "epoch": 2918} {"train_loss": -44.336421966552734, "global_step": 353118, "epoch": 2918} {"train_loss": -43.40947341918945, "global_step": 353119, "epoch": 2918} {"train_loss": -41.905269622802734, "global_step": 353120, "epoch": 2918} {"train_loss": -44.95509719848633, "global_step": 353121, "epoch": 2918} {"train_loss": -43.678382873535156, "global_step": 353122, "epoch": 2918} {"train_loss": -41.787574768066406, "global_step": 353123, "epoch": 2918} {"train_loss": -44.70676040649414, "global_step": 353124, "epoch": 2918} {"train_loss": -43.15813446044922, "global_step": 353125, "epoch": 2918} {"train_loss": -41.300662994384766, "global_step": 353126, "epoch": 2918} {"train_loss": -44.2019157409668, "global_step": 353127, "epoch": 2918} {"train_loss": -42.93734359741211, "global_step": 353128, "epoch": 2918} {"train_loss": -41.28945541381836, "global_step": 353129, "epoch": 2918} {"train_loss": -42.18947219848633, "global_step": 353130, "epoch": 2918} {"train_loss": -41.76060485839844, "global_step": 353131, "epoch": 2918} {"train_loss": -41.84092330932617, "global_step": 353132, "epoch": 2918} {"train_loss": -39.916969299316406, "global_step": 353133, "epoch": 2918} {"train_loss": -42.730072021484375, "global_step": 353134, "epoch": 2918} {"train_loss": -39.9178581237793, "global_step": 353135, "epoch": 2918} {"train_loss": -42.04096603393555, "global_step": 353136, "epoch": 2918} {"train_loss": -39.202308654785156, "global_step": 353137, "epoch": 2918} {"train_loss": -42.23507308959961, "global_step": 353138, "epoch": 2918} {"train_loss": -41.78609848022461, "global_step": 353139, "epoch": 2918} {"train_loss": -41.91376876831055, "global_step": 353140, "epoch": 2918} {"train_loss": -42.16832733154297, "global_step": 353141, "epoch": 2918} {"train_loss": -43.01888656616211, "global_step": 353142, "epoch": 2918} {"train_loss": -42.4531364440918, "global_step": 353143, "epoch": 2918} {"train_loss": -42.12186813354492, "global_step": 353144, "epoch": 2918} {"train_loss": -42.850948333740234, "global_step": 353145, "epoch": 2918} {"train_loss": -41.808467864990234, "global_step": 353146, "epoch": 2918} {"train_loss": -43.88811111450195, "global_step": 353147, "epoch": 2918} {"train_loss": -42.03111267089844, "global_step": 353148, "epoch": 2918} {"train_loss": -42.25838851928711, "global_step": 353149, "epoch": 2918} {"train_loss": -42.61896896362305, "global_step": 353150, "epoch": 2918} {"train_loss": -41.986263275146484, "global_step": 353151, "epoch": 2918} {"train_loss": -43.726985931396484, "global_step": 353152, "epoch": 2918} {"train_loss": -43.286964416503906, "global_step": 353153, "epoch": 2918} {"train_loss": -43.44478225708008, "global_step": 353154, "epoch": 2918} {"train_loss": -42.8873176574707, "global_step": 353155, "epoch": 2918} {"train_loss": -43.98556137084961, "global_step": 353156, "epoch": 2918} {"train_loss": -43.7845458984375, "global_step": 353157, "epoch": 2918} {"train_loss": -43.883785247802734, "global_step": 353158, "epoch": 2918} {"train_loss": -43.60847091674805, "global_step": 353159, "epoch": 2918} {"train_loss": -44.24988555908203, "global_step": 353160, "epoch": 2918} {"train_loss": -43.88653564453125, "global_step": 353161, "epoch": 2918} {"train_loss": -44.390716552734375, "global_step": 353162, "epoch": 2918} {"train_loss": -44.15256881713867, "global_step": 353163, "epoch": 2918} {"train_loss": -44.329986572265625, "global_step": 353164, "epoch": 2918} {"train_loss": -44.2227668762207, "global_step": 353165, "epoch": 2918} {"train_loss": -43.99392318725586, "global_step": 353166, "epoch": 2918} {"train_loss": -44.102596282958984, "global_step": 353167, "epoch": 2918} {"train_loss": -44.62246322631836, "global_step": 353168, "epoch": 2918} {"train_loss": -44.66764450073242, "global_step": 353169, "epoch": 2918} {"train_loss": -44.43593215942383, "global_step": 353170, "epoch": 2918} {"train_loss": -44.51205062866211, "global_step": 353171, "epoch": 2918} {"train_loss": -44.38458251953125, "global_step": 353172, "epoch": 2918} {"train_loss": -44.98017120361328, "global_step": 353173, "epoch": 2918} {"train_loss": -43.92184066772461, "global_step": 353174, "epoch": 2918} {"train_loss": -44.70808792114258, "global_step": 353175, "epoch": 2918} {"train_loss": -44.218971252441406, "global_step": 353176, "epoch": 2918} {"train_loss": -45.04917526245117, "global_step": 353177, "epoch": 2918} {"train_loss": -44.544677734375, "global_step": 353178, "epoch": 2918} {"train_loss": -45.265472412109375, "global_step": 353179, "epoch": 2918} {"train_loss": -44.650325775146484, "global_step": 353180, "epoch": 2918} {"train_loss": -45.124996185302734, "global_step": 353181, "epoch": 2918} {"train_loss": -45.33771896362305, "global_step": 353182, "epoch": 2918} {"train_loss": -44.94425582885742, "global_step": 353183, "epoch": 2918} {"train_loss": -45.13473129272461, "global_step": 353184, "epoch": 2918} {"train_loss": -45.251827239990234, "global_step": 353185, "epoch": 2918} {"train_loss": -45.22005081176758, "global_step": 353186, "epoch": 2918} {"train_loss": -45.229103088378906, "global_step": 353187, "epoch": 2918} {"train_loss": -45.40822219848633, "global_step": 353188, "epoch": 2918} {"train_loss": -45.00721740722656, "global_step": 353189, "epoch": 2918} {"train_loss": -45.0882568359375, "global_step": 353190, "epoch": 2918} {"train_loss": -45.37095260620117, "global_step": 353191, "epoch": 2918} {"train_loss": -45.10065841674805, "global_step": 353192, "epoch": 2918} {"train_loss": -45.40814208984375, "global_step": 353193, "epoch": 2918} {"train_loss": -45.21842575073242, "global_step": 353194, "epoch": 2918} {"train_loss": -45.420040130615234, "global_step": 353195, "epoch": 2918} {"train_loss": -45.70002365112305, "global_step": 353196, "epoch": 2918} {"train_loss": -45.367122650146484, "global_step": 353197, "epoch": 2918} {"train_loss": -44.03024878383668, "global_step": 353198, "epoch": 2918, "val_loss": 2491871.75} {"train_loss": -45.23579406738281, "global_step": 353199, "epoch": 2919} {"train_loss": -45.26997756958008, "global_step": 353200, "epoch": 2919} {"train_loss": -45.42582321166992, "global_step": 353201, "epoch": 2919} {"train_loss": -44.95193099975586, "global_step": 353202, "epoch": 2919} {"train_loss": -44.980037689208984, "global_step": 353203, "epoch": 2919} {"train_loss": -45.673797607421875, "global_step": 353204, "epoch": 2919} {"train_loss": -45.41025924682617, "global_step": 353205, "epoch": 2919} {"train_loss": -45.02466583251953, "global_step": 353206, "epoch": 2919} {"train_loss": -45.908809661865234, "global_step": 353207, "epoch": 2919} {"train_loss": -45.30327606201172, "global_step": 353208, "epoch": 2919} {"train_loss": -45.309669494628906, "global_step": 353209, "epoch": 2919} {"train_loss": -45.25599670410156, "global_step": 353210, "epoch": 2919} {"train_loss": -45.64692306518555, "global_step": 353211, "epoch": 2919} {"train_loss": -45.34943389892578, "global_step": 353212, "epoch": 2919} {"train_loss": -45.2520751953125, "global_step": 353213, "epoch": 2919} {"train_loss": -45.938201904296875, "global_step": 353214, "epoch": 2919} {"train_loss": -45.512969970703125, "global_step": 353215, "epoch": 2919} {"train_loss": -45.11762619018555, "global_step": 353216, "epoch": 2919} {"train_loss": -45.503326416015625, "global_step": 353217, "epoch": 2919} {"train_loss": -45.57088851928711, "global_step": 353218, "epoch": 2919} {"train_loss": -45.13373565673828, "global_step": 353219, "epoch": 2919} {"train_loss": -45.10528564453125, "global_step": 353220, "epoch": 2919} {"train_loss": -43.57141876220703, "global_step": 353221, "epoch": 2919} {"train_loss": -41.286617279052734, "global_step": 353222, "epoch": 2919} {"train_loss": -43.328243255615234, "global_step": 353223, "epoch": 2919} {"train_loss": -44.498714447021484, "global_step": 353224, "epoch": 2919} {"train_loss": -45.4112548828125, "global_step": 353225, "epoch": 2919} {"train_loss": -43.469112396240234, "global_step": 353226, "epoch": 2919} {"train_loss": -42.52396011352539, "global_step": 353227, "epoch": 2919} {"train_loss": -44.51937484741211, "global_step": 353228, "epoch": 2919} {"train_loss": -41.9038200378418, "global_step": 353229, "epoch": 2919} {"train_loss": -41.898738861083984, "global_step": 353230, "epoch": 2919} {"train_loss": -44.928157806396484, "global_step": 353231, "epoch": 2919} {"train_loss": -42.27703857421875, "global_step": 353232, "epoch": 2919} {"train_loss": -43.10150909423828, "global_step": 353233, "epoch": 2919} {"train_loss": -43.22694778442383, "global_step": 353234, "epoch": 2919} {"train_loss": -42.924072265625, "global_step": 353235, "epoch": 2919} {"train_loss": -44.43498611450195, "global_step": 353236, "epoch": 2919} {"train_loss": -43.30295944213867, "global_step": 353237, "epoch": 2919} {"train_loss": -43.24961471557617, "global_step": 353238, "epoch": 2919} {"train_loss": -44.06110763549805, "global_step": 353239, "epoch": 2919} {"train_loss": -44.696922302246094, "global_step": 353240, "epoch": 2919} {"train_loss": -43.817169189453125, "global_step": 353241, "epoch": 2919} {"train_loss": -42.3005485534668, "global_step": 353242, "epoch": 2919} {"train_loss": -44.8912467956543, "global_step": 353243, "epoch": 2919} {"train_loss": -42.381832122802734, "global_step": 353244, "epoch": 2919} {"train_loss": -41.18910598754883, "global_step": 353245, "epoch": 2919} {"train_loss": -41.9974250793457, "global_step": 353246, "epoch": 2919} {"train_loss": -37.535743713378906, "global_step": 353247, "epoch": 2919} {"train_loss": -40.011165618896484, "global_step": 353248, "epoch": 2919} {"train_loss": -38.35969161987305, "global_step": 353249, "epoch": 2919} {"train_loss": -36.91663360595703, "global_step": 353250, "epoch": 2919} {"train_loss": -38.89408493041992, "global_step": 353251, "epoch": 2919} {"train_loss": -39.5205078125, "global_step": 353252, "epoch": 2919} {"train_loss": -39.894805908203125, "global_step": 353253, "epoch": 2919} {"train_loss": -38.894222259521484, "global_step": 353254, "epoch": 2919} {"train_loss": -35.47758102416992, "global_step": 353255, "epoch": 2919} {"train_loss": -40.51679611206055, "global_step": 353256, "epoch": 2919} {"train_loss": -35.041236877441406, "global_step": 353257, "epoch": 2919} {"train_loss": -38.85776901245117, "global_step": 353258, "epoch": 2919} {"train_loss": -39.54752731323242, "global_step": 353259, "epoch": 2919} {"train_loss": -34.9769401550293, "global_step": 353260, "epoch": 2919} {"train_loss": -38.394657135009766, "global_step": 353261, "epoch": 2919} {"train_loss": -37.32189178466797, "global_step": 353262, "epoch": 2919} {"train_loss": -37.707244873046875, "global_step": 353263, "epoch": 2919} {"train_loss": -40.220069885253906, "global_step": 353264, "epoch": 2919} {"train_loss": -39.30609893798828, "global_step": 353265, "epoch": 2919} {"train_loss": -40.59762191772461, "global_step": 353266, "epoch": 2919} {"train_loss": -38.7156982421875, "global_step": 353267, "epoch": 2919} {"train_loss": -40.33021926879883, "global_step": 353268, "epoch": 2919} {"train_loss": -40.6417121887207, "global_step": 353269, "epoch": 2919} {"train_loss": -40.514076232910156, "global_step": 353270, "epoch": 2919} {"train_loss": -41.46588897705078, "global_step": 353271, "epoch": 2919} {"train_loss": -40.29209518432617, "global_step": 353272, "epoch": 2919} {"train_loss": -40.72054672241211, "global_step": 353273, "epoch": 2919} {"train_loss": -42.046669006347656, "global_step": 353274, "epoch": 2919} {"train_loss": -40.48688888549805, "global_step": 353275, "epoch": 2919} {"train_loss": -41.73638916015625, "global_step": 353276, "epoch": 2919} {"train_loss": -40.94403839111328, "global_step": 353277, "epoch": 2919} {"train_loss": -42.782073974609375, "global_step": 353278, "epoch": 2919} {"train_loss": -41.819976806640625, "global_step": 353279, "epoch": 2919} {"train_loss": -41.73508834838867, "global_step": 353280, "epoch": 2919} {"train_loss": -42.54694366455078, "global_step": 353281, "epoch": 2919} {"train_loss": -42.3886604309082, "global_step": 353282, "epoch": 2919} {"train_loss": -42.79092025756836, "global_step": 353283, "epoch": 2919} {"train_loss": -43.365570068359375, "global_step": 353284, "epoch": 2919} {"train_loss": -42.91731262207031, "global_step": 353285, "epoch": 2919} {"train_loss": -43.243560791015625, "global_step": 353286, "epoch": 2919} {"train_loss": -43.177093505859375, "global_step": 353287, "epoch": 2919} {"train_loss": -43.616817474365234, "global_step": 353288, "epoch": 2919} {"train_loss": -43.54545211791992, "global_step": 353289, "epoch": 2919} {"train_loss": -43.65151596069336, "global_step": 353290, "epoch": 2919} {"train_loss": -43.530128479003906, "global_step": 353291, "epoch": 2919} {"train_loss": -43.386104583740234, "global_step": 353292, "epoch": 2919} {"train_loss": -43.67525100708008, "global_step": 353293, "epoch": 2919} {"train_loss": -43.59139633178711, "global_step": 353294, "epoch": 2919} {"train_loss": -43.91233444213867, "global_step": 353295, "epoch": 2919} {"train_loss": -43.83155059814453, "global_step": 353296, "epoch": 2919} {"train_loss": -44.0311279296875, "global_step": 353297, "epoch": 2919} {"train_loss": -44.1272087097168, "global_step": 353298, "epoch": 2919} {"train_loss": -44.132450103759766, "global_step": 353299, "epoch": 2919} {"train_loss": -44.031551361083984, "global_step": 353300, "epoch": 2919} {"train_loss": -43.93437957763672, "global_step": 353301, "epoch": 2919} {"train_loss": -44.07712936401367, "global_step": 353302, "epoch": 2919} {"train_loss": -43.930145263671875, "global_step": 353303, "epoch": 2919} {"train_loss": -44.006874084472656, "global_step": 353304, "epoch": 2919} {"train_loss": -44.66846466064453, "global_step": 353305, "epoch": 2919} {"train_loss": -44.35071563720703, "global_step": 353306, "epoch": 2919} {"train_loss": -44.28980255126953, "global_step": 353307, "epoch": 2919} {"train_loss": -44.37406539916992, "global_step": 353308, "epoch": 2919} {"train_loss": -44.681392669677734, "global_step": 353309, "epoch": 2919} {"train_loss": -44.632530212402344, "global_step": 353310, "epoch": 2919} {"train_loss": -44.82528305053711, "global_step": 353311, "epoch": 2919} {"train_loss": -44.581886291503906, "global_step": 353312, "epoch": 2919} {"train_loss": -44.391517639160156, "global_step": 353313, "epoch": 2919} {"train_loss": -45.031063079833984, "global_step": 353314, "epoch": 2919} {"train_loss": -44.60139083862305, "global_step": 353315, "epoch": 2919} {"train_loss": -44.83979415893555, "global_step": 353316, "epoch": 2919} {"train_loss": -44.87941360473633, "global_step": 353317, "epoch": 2919} {"train_loss": -44.896305084228516, "global_step": 353318, "epoch": 2919} {"train_loss": -42.814512426202946, "global_step": 353319, "epoch": 2919, "val_loss": 2502786.0} {"train_loss": -45.305049896240234, "global_step": 353320, "epoch": 2920} {"train_loss": -44.81675338745117, "global_step": 353321, "epoch": 2920} {"train_loss": -45.090065002441406, "global_step": 353322, "epoch": 2920} {"train_loss": -44.85439682006836, "global_step": 353323, "epoch": 2920} {"train_loss": -45.169734954833984, "global_step": 353324, "epoch": 2920} {"train_loss": -44.9967041015625, "global_step": 353325, "epoch": 2920} {"train_loss": -45.35265350341797, "global_step": 353326, "epoch": 2920} {"train_loss": -45.26565170288086, "global_step": 353327, "epoch": 2920} {"train_loss": -45.481109619140625, "global_step": 353328, "epoch": 2920} {"train_loss": -44.96665573120117, "global_step": 353329, "epoch": 2920} {"train_loss": -45.30470657348633, "global_step": 353330, "epoch": 2920} {"train_loss": -45.23035430908203, "global_step": 353331, "epoch": 2920} {"train_loss": -45.602378845214844, "global_step": 353332, "epoch": 2920} {"train_loss": -45.16612243652344, "global_step": 353333, "epoch": 2920} {"train_loss": -45.408042907714844, "global_step": 353334, "epoch": 2920} {"train_loss": -45.60316848754883, "global_step": 353335, "epoch": 2920} {"train_loss": -45.358856201171875, "global_step": 353336, "epoch": 2920} {"train_loss": -45.356483459472656, "global_step": 353337, "epoch": 2920} {"train_loss": -45.81231689453125, "global_step": 353338, "epoch": 2920} {"train_loss": -45.36676788330078, "global_step": 353339, "epoch": 2920} {"train_loss": -45.21399688720703, "global_step": 353340, "epoch": 2920} {"train_loss": -45.63972091674805, "global_step": 353341, "epoch": 2920} {"train_loss": -45.181087493896484, "global_step": 353342, "epoch": 2920} {"train_loss": -45.46712875366211, "global_step": 353343, "epoch": 2920} {"train_loss": -45.890350341796875, "global_step": 353344, "epoch": 2920} {"train_loss": -45.639583587646484, "global_step": 353345, "epoch": 2920} {"train_loss": -44.93830490112305, "global_step": 353346, "epoch": 2920} {"train_loss": -45.29704284667969, "global_step": 353347, "epoch": 2920} {"train_loss": -45.632057189941406, "global_step": 353348, "epoch": 2920} {"train_loss": -45.492042541503906, "global_step": 353349, "epoch": 2920} {"train_loss": -45.18526077270508, "global_step": 353350, "epoch": 2920} {"train_loss": -45.44934844970703, "global_step": 353351, "epoch": 2920} {"train_loss": -45.795928955078125, "global_step": 353352, "epoch": 2920} {"train_loss": -45.9645881652832, "global_step": 353353, "epoch": 2920} {"train_loss": -44.92390823364258, "global_step": 353354, "epoch": 2920} {"train_loss": -45.7280158996582, "global_step": 353355, "epoch": 2920} {"train_loss": -45.5986328125, "global_step": 353356, "epoch": 2920} {"train_loss": -45.440338134765625, "global_step": 353357, "epoch": 2920} {"train_loss": -43.343719482421875, "global_step": 353358, "epoch": 2920} {"train_loss": -43.350826263427734, "global_step": 353359, "epoch": 2920} {"train_loss": -45.09147644042969, "global_step": 353360, "epoch": 2920} {"train_loss": -44.5816535949707, "global_step": 353361, "epoch": 2920} {"train_loss": -42.37747573852539, "global_step": 353362, "epoch": 2920} {"train_loss": -44.24272537231445, "global_step": 353363, "epoch": 2920} {"train_loss": -44.82905197143555, "global_step": 353364, "epoch": 2920} {"train_loss": -43.96980667114258, "global_step": 353365, "epoch": 2920} {"train_loss": -42.58777618408203, "global_step": 353366, "epoch": 2920} {"train_loss": -44.488399505615234, "global_step": 353367, "epoch": 2920} {"train_loss": -44.51863479614258, "global_step": 353368, "epoch": 2920} {"train_loss": -43.911163330078125, "global_step": 353369, "epoch": 2920} {"train_loss": -42.75249099731445, "global_step": 353370, "epoch": 2920} {"train_loss": -43.52155303955078, "global_step": 353371, "epoch": 2920} {"train_loss": -42.77761459350586, "global_step": 353372, "epoch": 2920} {"train_loss": -42.216854095458984, "global_step": 353373, "epoch": 2920} {"train_loss": -44.204689025878906, "global_step": 353374, "epoch": 2920} {"train_loss": -42.90229034423828, "global_step": 353375, "epoch": 2920} {"train_loss": -43.6700553894043, "global_step": 353376, "epoch": 2920} {"train_loss": -44.36450958251953, "global_step": 353377, "epoch": 2920} {"train_loss": -42.30863571166992, "global_step": 353378, "epoch": 2920} {"train_loss": -43.98539352416992, "global_step": 353379, "epoch": 2920} {"train_loss": -42.92184066772461, "global_step": 353380, "epoch": 2920} {"train_loss": -45.03709030151367, "global_step": 353381, "epoch": 2920} {"train_loss": -45.004371643066406, "global_step": 353382, "epoch": 2920} {"train_loss": -44.41385269165039, "global_step": 353383, "epoch": 2920} {"train_loss": -44.642208099365234, "global_step": 353384, "epoch": 2920} {"train_loss": -44.930999755859375, "global_step": 353385, "epoch": 2920} {"train_loss": -45.026607513427734, "global_step": 353386, "epoch": 2920} {"train_loss": -44.50554275512695, "global_step": 353387, "epoch": 2920} {"train_loss": -43.670291900634766, "global_step": 353388, "epoch": 2920} {"train_loss": -44.0527458190918, "global_step": 353389, "epoch": 2920} {"train_loss": -43.66535186767578, "global_step": 353390, "epoch": 2920} {"train_loss": -45.04850387573242, "global_step": 353391, "epoch": 2920} {"train_loss": -44.905094146728516, "global_step": 353392, "epoch": 2920} {"train_loss": -45.06003952026367, "global_step": 353393, "epoch": 2920} {"train_loss": -44.8086051940918, "global_step": 353394, "epoch": 2920} {"train_loss": -44.62929916381836, "global_step": 353395, "epoch": 2920} {"train_loss": -45.392879486083984, "global_step": 353396, "epoch": 2920} {"train_loss": -44.659786224365234, "global_step": 353397, "epoch": 2920} {"train_loss": -44.9417724609375, "global_step": 353398, "epoch": 2920} {"train_loss": -45.1446647644043, "global_step": 353399, "epoch": 2920} {"train_loss": -45.06195068359375, "global_step": 353400, "epoch": 2920} {"train_loss": -44.86750030517578, "global_step": 353401, "epoch": 2920} {"train_loss": -44.91530990600586, "global_step": 353402, "epoch": 2920} {"train_loss": -45.554012298583984, "global_step": 353403, "epoch": 2920} {"train_loss": -45.41634750366211, "global_step": 353404, "epoch": 2920} {"train_loss": -45.36040115356445, "global_step": 353405, "epoch": 2920} {"train_loss": -45.42904281616211, "global_step": 353406, "epoch": 2920} {"train_loss": -45.14899826049805, "global_step": 353407, "epoch": 2920} {"train_loss": -45.663814544677734, "global_step": 353408, "epoch": 2920} {"train_loss": -45.42507553100586, "global_step": 353409, "epoch": 2920} {"train_loss": -44.966896057128906, "global_step": 353410, "epoch": 2920} {"train_loss": -45.428646087646484, "global_step": 353411, "epoch": 2920} {"train_loss": -45.55989456176758, "global_step": 353412, "epoch": 2920} {"train_loss": -45.221763610839844, "global_step": 353413, "epoch": 2920} {"train_loss": -45.299251556396484, "global_step": 353414, "epoch": 2920} {"train_loss": -45.32428741455078, "global_step": 353415, "epoch": 2920} {"train_loss": -45.05955123901367, "global_step": 353416, "epoch": 2920} {"train_loss": -45.37750244140625, "global_step": 353417, "epoch": 2920} {"train_loss": -44.801761627197266, "global_step": 353418, "epoch": 2920} {"train_loss": -44.256103515625, "global_step": 353419, "epoch": 2920} {"train_loss": -45.08256149291992, "global_step": 353420, "epoch": 2920} {"train_loss": -45.186767578125, "global_step": 353421, "epoch": 2920} {"train_loss": -44.6773796081543, "global_step": 353422, "epoch": 2920} {"train_loss": -44.94655227661133, "global_step": 353423, "epoch": 2920} {"train_loss": -44.960968017578125, "global_step": 353424, "epoch": 2920} {"train_loss": -45.173316955566406, "global_step": 353425, "epoch": 2920} {"train_loss": -45.20182418823242, "global_step": 353426, "epoch": 2920} {"train_loss": -44.9253044128418, "global_step": 353427, "epoch": 2920} {"train_loss": -45.41257858276367, "global_step": 353428, "epoch": 2920} {"train_loss": -44.00780487060547, "global_step": 353429, "epoch": 2920} {"train_loss": -44.612281799316406, "global_step": 353430, "epoch": 2920} {"train_loss": -45.30653762817383, "global_step": 353431, "epoch": 2920} {"train_loss": -43.904781341552734, "global_step": 353432, "epoch": 2920} {"train_loss": -45.12621307373047, "global_step": 353433, "epoch": 2920} {"train_loss": -44.78078842163086, "global_step": 353434, "epoch": 2920} {"train_loss": -43.97297286987305, "global_step": 353435, "epoch": 2920} {"train_loss": -44.86317443847656, "global_step": 353436, "epoch": 2920} {"train_loss": -44.18708419799805, "global_step": 353437, "epoch": 2920} {"train_loss": -42.74359893798828, "global_step": 353438, "epoch": 2920} {"train_loss": -44.80402755737305, "global_step": 353439, "epoch": 2920} {"train_loss": -44.77187599623499, "global_step": 353440, "epoch": 2920, "val_loss": 2487874.0} {"train_loss": -44.53892135620117, "global_step": 353441, "epoch": 2921} {"train_loss": -43.465511322021484, "global_step": 353442, "epoch": 2921} {"train_loss": -42.92572784423828, "global_step": 353443, "epoch": 2921} {"train_loss": -44.570068359375, "global_step": 353444, "epoch": 2921} {"train_loss": -42.50810623168945, "global_step": 353445, "epoch": 2921} {"train_loss": -43.78389358520508, "global_step": 353446, "epoch": 2921} {"train_loss": -44.024105072021484, "global_step": 353447, "epoch": 2921} {"train_loss": -42.82678985595703, "global_step": 353448, "epoch": 2921} {"train_loss": -43.414154052734375, "global_step": 353449, "epoch": 2921} {"train_loss": -43.548587799072266, "global_step": 353450, "epoch": 2921} {"train_loss": -45.09967803955078, "global_step": 353451, "epoch": 2921} {"train_loss": -44.474586486816406, "global_step": 353452, "epoch": 2921} {"train_loss": -44.46893310546875, "global_step": 353453, "epoch": 2921} {"train_loss": -43.152687072753906, "global_step": 353454, "epoch": 2921} {"train_loss": -44.35528564453125, "global_step": 353455, "epoch": 2921} {"train_loss": -42.69844436645508, "global_step": 353456, "epoch": 2921} {"train_loss": -42.6024169921875, "global_step": 353457, "epoch": 2921} {"train_loss": -44.5741081237793, "global_step": 353458, "epoch": 2921} {"train_loss": -43.377105712890625, "global_step": 353459, "epoch": 2921} {"train_loss": -43.230037689208984, "global_step": 353460, "epoch": 2921} {"train_loss": -43.8867073059082, "global_step": 353461, "epoch": 2921} {"train_loss": -43.076725006103516, "global_step": 353462, "epoch": 2921} {"train_loss": -40.88721466064453, "global_step": 353463, "epoch": 2921} {"train_loss": -43.7097053527832, "global_step": 353464, "epoch": 2921} {"train_loss": -43.15048599243164, "global_step": 353465, "epoch": 2921} {"train_loss": -42.636322021484375, "global_step": 353466, "epoch": 2921} {"train_loss": -44.0185661315918, "global_step": 353467, "epoch": 2921} {"train_loss": -42.854095458984375, "global_step": 353468, "epoch": 2921} {"train_loss": -40.4885368347168, "global_step": 353469, "epoch": 2921} {"train_loss": -43.512245178222656, "global_step": 353470, "epoch": 2921} {"train_loss": -39.984867095947266, "global_step": 353471, "epoch": 2921} {"train_loss": -44.728477478027344, "global_step": 353472, "epoch": 2921} {"train_loss": -41.229644775390625, "global_step": 353473, "epoch": 2921} {"train_loss": -43.63441467285156, "global_step": 353474, "epoch": 2921} {"train_loss": -43.15773391723633, "global_step": 353475, "epoch": 2921} {"train_loss": -42.873104095458984, "global_step": 353476, "epoch": 2921} {"train_loss": -42.925682067871094, "global_step": 353477, "epoch": 2921} {"train_loss": -42.04591751098633, "global_step": 353478, "epoch": 2921} {"train_loss": -44.16412353515625, "global_step": 353479, "epoch": 2921} {"train_loss": -42.57744216918945, "global_step": 353480, "epoch": 2921} {"train_loss": -44.44134521484375, "global_step": 353481, "epoch": 2921} {"train_loss": -43.57337188720703, "global_step": 353482, "epoch": 2921} {"train_loss": -42.473289489746094, "global_step": 353483, "epoch": 2921} {"train_loss": -42.97724533081055, "global_step": 353484, "epoch": 2921} {"train_loss": -42.80469512939453, "global_step": 353485, "epoch": 2921} {"train_loss": -43.96487045288086, "global_step": 353486, "epoch": 2921} {"train_loss": -44.050682067871094, "global_step": 353487, "epoch": 2921} {"train_loss": -43.94102096557617, "global_step": 353488, "epoch": 2921} {"train_loss": -43.244102478027344, "global_step": 353489, "epoch": 2921} {"train_loss": -44.4183235168457, "global_step": 353490, "epoch": 2921} {"train_loss": -43.531394958496094, "global_step": 353491, "epoch": 2921} {"train_loss": -44.80449295043945, "global_step": 353492, "epoch": 2921} {"train_loss": -44.013427734375, "global_step": 353493, "epoch": 2921} {"train_loss": -44.76750946044922, "global_step": 353494, "epoch": 2921} {"train_loss": -44.31665802001953, "global_step": 353495, "epoch": 2921} {"train_loss": -44.55227279663086, "global_step": 353496, "epoch": 2921} {"train_loss": -44.16563415527344, "global_step": 353497, "epoch": 2921} {"train_loss": -44.73210906982422, "global_step": 353498, "epoch": 2921} {"train_loss": -44.071693420410156, "global_step": 353499, "epoch": 2921} {"train_loss": -44.28902053833008, "global_step": 353500, "epoch": 2921} {"train_loss": -44.49296951293945, "global_step": 353501, "epoch": 2921} {"train_loss": -44.483150482177734, "global_step": 353502, "epoch": 2921} {"train_loss": -43.36893844604492, "global_step": 353503, "epoch": 2921} {"train_loss": -44.72243881225586, "global_step": 353504, "epoch": 2921} {"train_loss": -44.198604583740234, "global_step": 353505, "epoch": 2921} {"train_loss": -43.14533233642578, "global_step": 353506, "epoch": 2921} {"train_loss": -44.0894660949707, "global_step": 353507, "epoch": 2921} {"train_loss": -44.42351531982422, "global_step": 353508, "epoch": 2921} {"train_loss": -44.02078628540039, "global_step": 353509, "epoch": 2921} {"train_loss": -44.64790725708008, "global_step": 353510, "epoch": 2921} {"train_loss": -44.7985954284668, "global_step": 353511, "epoch": 2921} {"train_loss": -44.45515823364258, "global_step": 353512, "epoch": 2921} {"train_loss": -44.75834655761719, "global_step": 353513, "epoch": 2921} {"train_loss": -45.01559829711914, "global_step": 353514, "epoch": 2921} {"train_loss": -45.028831481933594, "global_step": 353515, "epoch": 2921} {"train_loss": -45.14508819580078, "global_step": 353516, "epoch": 2921} {"train_loss": -44.6413688659668, "global_step": 353517, "epoch": 2921} {"train_loss": -44.55393600463867, "global_step": 353518, "epoch": 2921} {"train_loss": -45.50590133666992, "global_step": 353519, "epoch": 2921} {"train_loss": -44.69435119628906, "global_step": 353520, "epoch": 2921} {"train_loss": -44.684852600097656, "global_step": 353521, "epoch": 2921} {"train_loss": -45.15384292602539, "global_step": 353522, "epoch": 2921} {"train_loss": -44.74675369262695, "global_step": 353523, "epoch": 2921} {"train_loss": -45.2966194152832, "global_step": 353524, "epoch": 2921} {"train_loss": -44.73152542114258, "global_step": 353525, "epoch": 2921} {"train_loss": -44.851341247558594, "global_step": 353526, "epoch": 2921} {"train_loss": -45.00770950317383, "global_step": 353527, "epoch": 2921} {"train_loss": -45.03377914428711, "global_step": 353528, "epoch": 2921} {"train_loss": -45.0111083984375, "global_step": 353529, "epoch": 2921} {"train_loss": -45.03936767578125, "global_step": 353530, "epoch": 2921} {"train_loss": -45.2977409362793, "global_step": 353531, "epoch": 2921} {"train_loss": -45.2492790222168, "global_step": 353532, "epoch": 2921} {"train_loss": -45.3995475769043, "global_step": 353533, "epoch": 2921} {"train_loss": -44.864376068115234, "global_step": 353534, "epoch": 2921} {"train_loss": -44.8476676940918, "global_step": 353535, "epoch": 2921} {"train_loss": -45.097145080566406, "global_step": 353536, "epoch": 2921} {"train_loss": -45.251564025878906, "global_step": 353537, "epoch": 2921} {"train_loss": -44.64776611328125, "global_step": 353538, "epoch": 2921} {"train_loss": -45.463172912597656, "global_step": 353539, "epoch": 2921} {"train_loss": -44.679443359375, "global_step": 353540, "epoch": 2921} {"train_loss": -44.84597396850586, "global_step": 353541, "epoch": 2921} {"train_loss": -44.9256706237793, "global_step": 353542, "epoch": 2921} {"train_loss": -44.923072814941406, "global_step": 353543, "epoch": 2921} {"train_loss": -44.896236419677734, "global_step": 353544, "epoch": 2921} {"train_loss": -44.994571685791016, "global_step": 353545, "epoch": 2921} {"train_loss": -43.60268783569336, "global_step": 353546, "epoch": 2921} {"train_loss": -43.497352600097656, "global_step": 353547, "epoch": 2921} {"train_loss": -43.76334762573242, "global_step": 353548, "epoch": 2921} {"train_loss": -43.00162887573242, "global_step": 353549, "epoch": 2921} {"train_loss": -43.45060348510742, "global_step": 353550, "epoch": 2921} {"train_loss": -40.96990966796875, "global_step": 353551, "epoch": 2921} {"train_loss": -43.88326644897461, "global_step": 353552, "epoch": 2921} {"train_loss": -44.31325149536133, "global_step": 353553, "epoch": 2921} {"train_loss": -43.46664047241211, "global_step": 353554, "epoch": 2921} {"train_loss": -43.45185089111328, "global_step": 353555, "epoch": 2921} {"train_loss": -43.64826202392578, "global_step": 353556, "epoch": 2921} {"train_loss": -41.5295524597168, "global_step": 353557, "epoch": 2921} {"train_loss": -42.19044876098633, "global_step": 353558, "epoch": 2921} {"train_loss": -44.47674560546875, "global_step": 353559, "epoch": 2921} {"train_loss": -43.53162384033203, "global_step": 353560, "epoch": 2921} {"train_loss": -43.924500047667955, "global_step": 353561, "epoch": 2921, "val_loss": 2529020.5} {"train_loss": -42.281288146972656, "global_step": 353562, "epoch": 2922} {"train_loss": -44.144378662109375, "global_step": 353563, "epoch": 2922} {"train_loss": -43.577239990234375, "global_step": 353564, "epoch": 2922} {"train_loss": -43.65793991088867, "global_step": 353565, "epoch": 2922} {"train_loss": -43.0595817565918, "global_step": 353566, "epoch": 2922} {"train_loss": -44.438297271728516, "global_step": 353567, "epoch": 2922} {"train_loss": -44.721595764160156, "global_step": 353568, "epoch": 2922} {"train_loss": -43.092716217041016, "global_step": 353569, "epoch": 2922} {"train_loss": -42.3294792175293, "global_step": 353570, "epoch": 2922} {"train_loss": -43.93174362182617, "global_step": 353571, "epoch": 2922} {"train_loss": -44.774925231933594, "global_step": 353572, "epoch": 2922} {"train_loss": -42.80916976928711, "global_step": 353573, "epoch": 2922} {"train_loss": -43.33656311035156, "global_step": 353574, "epoch": 2922} {"train_loss": -44.851829528808594, "global_step": 353575, "epoch": 2922} {"train_loss": -43.7004280090332, "global_step": 353576, "epoch": 2922} {"train_loss": -43.46798324584961, "global_step": 353577, "epoch": 2922} {"train_loss": -44.34099197387695, "global_step": 353578, "epoch": 2922} {"train_loss": -44.262184143066406, "global_step": 353579, "epoch": 2922} {"train_loss": -44.6490364074707, "global_step": 353580, "epoch": 2922} {"train_loss": -44.289241790771484, "global_step": 353581, "epoch": 2922} {"train_loss": -43.8634147644043, "global_step": 353582, "epoch": 2922} {"train_loss": -44.05669403076172, "global_step": 353583, "epoch": 2922} {"train_loss": -44.3502082824707, "global_step": 353584, "epoch": 2922} {"train_loss": -43.757781982421875, "global_step": 353585, "epoch": 2922} {"train_loss": -43.64027404785156, "global_step": 353586, "epoch": 2922} {"train_loss": -44.74992370605469, "global_step": 353587, "epoch": 2922} {"train_loss": -44.33977127075195, "global_step": 353588, "epoch": 2922} {"train_loss": -43.07972717285156, "global_step": 353589, "epoch": 2922} {"train_loss": -44.24079895019531, "global_step": 353590, "epoch": 2922} {"train_loss": -44.42420959472656, "global_step": 353591, "epoch": 2922} {"train_loss": -44.76951599121094, "global_step": 353592, "epoch": 2922} {"train_loss": -44.7611198425293, "global_step": 353593, "epoch": 2922} {"train_loss": -45.39990234375, "global_step": 353594, "epoch": 2922} {"train_loss": -44.50626754760742, "global_step": 353595, "epoch": 2922} {"train_loss": -44.16569137573242, "global_step": 353596, "epoch": 2922} {"train_loss": -44.798763275146484, "global_step": 353597, "epoch": 2922} {"train_loss": -45.38901901245117, "global_step": 353598, "epoch": 2922} {"train_loss": -44.96299362182617, "global_step": 353599, "epoch": 2922} {"train_loss": -45.32810592651367, "global_step": 353600, "epoch": 2922} {"train_loss": -45.23755645751953, "global_step": 353601, "epoch": 2922} {"train_loss": -44.697509765625, "global_step": 353602, "epoch": 2922} {"train_loss": -44.901851654052734, "global_step": 353603, "epoch": 2922} {"train_loss": -45.1741828918457, "global_step": 353604, "epoch": 2922} {"train_loss": -44.52021026611328, "global_step": 353605, "epoch": 2922} {"train_loss": -44.71366882324219, "global_step": 353606, "epoch": 2922} {"train_loss": -44.921112060546875, "global_step": 353607, "epoch": 2922} {"train_loss": -44.48391342163086, "global_step": 353608, "epoch": 2922} {"train_loss": -43.96262741088867, "global_step": 353609, "epoch": 2922} {"train_loss": -44.78849411010742, "global_step": 353610, "epoch": 2922} {"train_loss": -44.91982650756836, "global_step": 353611, "epoch": 2922} {"train_loss": -43.934139251708984, "global_step": 353612, "epoch": 2922} {"train_loss": -43.65530014038086, "global_step": 353613, "epoch": 2922} {"train_loss": -45.00236511230469, "global_step": 353614, "epoch": 2922} {"train_loss": -44.487483978271484, "global_step": 353615, "epoch": 2922} {"train_loss": -43.36286544799805, "global_step": 353616, "epoch": 2922} {"train_loss": -44.40387725830078, "global_step": 353617, "epoch": 2922} {"train_loss": -44.68494415283203, "global_step": 353618, "epoch": 2922} {"train_loss": -44.544708251953125, "global_step": 353619, "epoch": 2922} {"train_loss": -44.4379997253418, "global_step": 353620, "epoch": 2922} {"train_loss": -44.747291564941406, "global_step": 353621, "epoch": 2922} {"train_loss": -44.6768913269043, "global_step": 353622, "epoch": 2922} {"train_loss": -45.58095932006836, "global_step": 353623, "epoch": 2922} {"train_loss": -44.65859603881836, "global_step": 353624, "epoch": 2922} {"train_loss": -42.781158447265625, "global_step": 353625, "epoch": 2922} {"train_loss": -44.35039138793945, "global_step": 353626, "epoch": 2922} {"train_loss": -44.98496627807617, "global_step": 353627, "epoch": 2922} {"train_loss": -44.710391998291016, "global_step": 353628, "epoch": 2922} {"train_loss": -43.1866569519043, "global_step": 353629, "epoch": 2922} {"train_loss": -41.782081604003906, "global_step": 353630, "epoch": 2922} {"train_loss": -44.46003341674805, "global_step": 353631, "epoch": 2922} {"train_loss": -44.307613372802734, "global_step": 353632, "epoch": 2922} {"train_loss": -42.97105026245117, "global_step": 353633, "epoch": 2922} {"train_loss": -44.541473388671875, "global_step": 353634, "epoch": 2922} {"train_loss": -40.44894790649414, "global_step": 353635, "epoch": 2922} {"train_loss": -43.11452865600586, "global_step": 353636, "epoch": 2922} {"train_loss": -43.200252532958984, "global_step": 353637, "epoch": 2922} {"train_loss": -42.98464584350586, "global_step": 353638, "epoch": 2922} {"train_loss": -42.86616897583008, "global_step": 353639, "epoch": 2922} {"train_loss": -42.62208557128906, "global_step": 353640, "epoch": 2922} {"train_loss": -43.78017807006836, "global_step": 353641, "epoch": 2922} {"train_loss": -42.75199508666992, "global_step": 353642, "epoch": 2922} {"train_loss": -44.1832389831543, "global_step": 353643, "epoch": 2922} {"train_loss": -43.2347412109375, "global_step": 353644, "epoch": 2922} {"train_loss": -42.81273651123047, "global_step": 353645, "epoch": 2922} {"train_loss": -45.00616455078125, "global_step": 353646, "epoch": 2922} {"train_loss": -43.065223693847656, "global_step": 353647, "epoch": 2922} {"train_loss": -43.30696105957031, "global_step": 353648, "epoch": 2922} {"train_loss": -43.672664642333984, "global_step": 353649, "epoch": 2922} {"train_loss": -44.292293548583984, "global_step": 353650, "epoch": 2922} {"train_loss": -43.991912841796875, "global_step": 353651, "epoch": 2922} {"train_loss": -43.214263916015625, "global_step": 353652, "epoch": 2922} {"train_loss": -44.49190139770508, "global_step": 353653, "epoch": 2922} {"train_loss": -42.72431564331055, "global_step": 353654, "epoch": 2922} {"train_loss": -44.57011795043945, "global_step": 353655, "epoch": 2922} {"train_loss": -44.517330169677734, "global_step": 353656, "epoch": 2922} {"train_loss": -42.520931243896484, "global_step": 353657, "epoch": 2922} {"train_loss": -43.8027229309082, "global_step": 353658, "epoch": 2922} {"train_loss": -44.2169303894043, "global_step": 353659, "epoch": 2922} {"train_loss": -43.59682083129883, "global_step": 353660, "epoch": 2922} {"train_loss": -44.679744720458984, "global_step": 353661, "epoch": 2922} {"train_loss": -43.20106887817383, "global_step": 353662, "epoch": 2922} {"train_loss": -44.4644660949707, "global_step": 353663, "epoch": 2922} {"train_loss": -44.3109016418457, "global_step": 353664, "epoch": 2922} {"train_loss": -43.96804428100586, "global_step": 353665, "epoch": 2922} {"train_loss": -44.95066452026367, "global_step": 353666, "epoch": 2922} {"train_loss": -44.24595642089844, "global_step": 353667, "epoch": 2922} {"train_loss": -44.144020080566406, "global_step": 353668, "epoch": 2922} {"train_loss": -44.55242156982422, "global_step": 353669, "epoch": 2922} {"train_loss": -44.83559036254883, "global_step": 353670, "epoch": 2922} {"train_loss": -45.29868698120117, "global_step": 353671, "epoch": 2922} {"train_loss": -44.3609504699707, "global_step": 353672, "epoch": 2922} {"train_loss": -44.203224182128906, "global_step": 353673, "epoch": 2922} {"train_loss": -44.880577087402344, "global_step": 353674, "epoch": 2922} {"train_loss": -44.98093795776367, "global_step": 353675, "epoch": 2922} {"train_loss": -44.98889923095703, "global_step": 353676, "epoch": 2922} {"train_loss": -44.64171600341797, "global_step": 353677, "epoch": 2922} {"train_loss": -45.040138244628906, "global_step": 353678, "epoch": 2922} {"train_loss": -45.02566146850586, "global_step": 353679, "epoch": 2922} {"train_loss": -44.5114860534668, "global_step": 353680, "epoch": 2922} {"train_loss": -45.26324462890625, "global_step": 353681, "epoch": 2922} {"train_loss": -44.134041179310195, "global_step": 353682, "epoch": 2922, "val_loss": 2448225.25} {"train_loss": -44.91489791870117, "global_step": 353683, "epoch": 2923} {"train_loss": -44.01591491699219, "global_step": 353684, "epoch": 2923} {"train_loss": -44.93437576293945, "global_step": 353685, "epoch": 2923} {"train_loss": -45.466522216796875, "global_step": 353686, "epoch": 2923} {"train_loss": -43.91917037963867, "global_step": 353687, "epoch": 2923} {"train_loss": -44.20381546020508, "global_step": 353688, "epoch": 2923} {"train_loss": -44.884464263916016, "global_step": 353689, "epoch": 2923} {"train_loss": -43.729671478271484, "global_step": 353690, "epoch": 2923} {"train_loss": -42.9840202331543, "global_step": 353691, "epoch": 2923} {"train_loss": -44.260597229003906, "global_step": 353692, "epoch": 2923} {"train_loss": -44.679039001464844, "global_step": 353693, "epoch": 2923} {"train_loss": -44.27488327026367, "global_step": 353694, "epoch": 2923} {"train_loss": -44.50000762939453, "global_step": 353695, "epoch": 2923} {"train_loss": -43.28961181640625, "global_step": 353696, "epoch": 2923} {"train_loss": -44.10030746459961, "global_step": 353697, "epoch": 2923} {"train_loss": -44.484859466552734, "global_step": 353698, "epoch": 2923} {"train_loss": -45.157249450683594, "global_step": 353699, "epoch": 2923} {"train_loss": -44.12636184692383, "global_step": 353700, "epoch": 2923} {"train_loss": -42.962890625, "global_step": 353701, "epoch": 2923} {"train_loss": -44.001670837402344, "global_step": 353702, "epoch": 2923} {"train_loss": -44.94832992553711, "global_step": 353703, "epoch": 2923} {"train_loss": -44.9250373840332, "global_step": 353704, "epoch": 2923} {"train_loss": -44.692222595214844, "global_step": 353705, "epoch": 2923} {"train_loss": -44.24623489379883, "global_step": 353706, "epoch": 2923} {"train_loss": -44.569698333740234, "global_step": 353707, "epoch": 2923} {"train_loss": -44.9522819519043, "global_step": 353708, "epoch": 2923} {"train_loss": -44.4448356628418, "global_step": 353709, "epoch": 2923} {"train_loss": -45.009613037109375, "global_step": 353710, "epoch": 2923} {"train_loss": -44.94510269165039, "global_step": 353711, "epoch": 2923} {"train_loss": -44.6047477722168, "global_step": 353712, "epoch": 2923} {"train_loss": -45.501949310302734, "global_step": 353713, "epoch": 2923} {"train_loss": -44.630096435546875, "global_step": 353714, "epoch": 2923} {"train_loss": -44.5040168762207, "global_step": 353715, "epoch": 2923} {"train_loss": -44.42488479614258, "global_step": 353716, "epoch": 2923} {"train_loss": -45.38295364379883, "global_step": 353717, "epoch": 2923} {"train_loss": -44.52730941772461, "global_step": 353718, "epoch": 2923} {"train_loss": -44.431297302246094, "global_step": 353719, "epoch": 2923} {"train_loss": -45.00376510620117, "global_step": 353720, "epoch": 2923} {"train_loss": -43.8026237487793, "global_step": 353721, "epoch": 2923} {"train_loss": -45.29517364501953, "global_step": 353722, "epoch": 2923} {"train_loss": -44.0047492980957, "global_step": 353723, "epoch": 2923} {"train_loss": -44.680782318115234, "global_step": 353724, "epoch": 2923} {"train_loss": -43.942909240722656, "global_step": 353725, "epoch": 2923} {"train_loss": -42.96232986450195, "global_step": 353726, "epoch": 2923} {"train_loss": -43.53895950317383, "global_step": 353727, "epoch": 2923} {"train_loss": -44.740692138671875, "global_step": 353728, "epoch": 2923} {"train_loss": -40.25588607788086, "global_step": 353729, "epoch": 2923} {"train_loss": -42.46627426147461, "global_step": 353730, "epoch": 2923} {"train_loss": -41.3422966003418, "global_step": 353731, "epoch": 2923} {"train_loss": -42.30198669433594, "global_step": 353732, "epoch": 2923} {"train_loss": -42.96662139892578, "global_step": 353733, "epoch": 2923} {"train_loss": -39.65167236328125, "global_step": 353734, "epoch": 2923} {"train_loss": -44.48850631713867, "global_step": 353735, "epoch": 2923} {"train_loss": -41.56728744506836, "global_step": 353736, "epoch": 2923} {"train_loss": -43.58948516845703, "global_step": 353737, "epoch": 2923} {"train_loss": -42.24591827392578, "global_step": 353738, "epoch": 2923} {"train_loss": -44.387516021728516, "global_step": 353739, "epoch": 2923} {"train_loss": -43.86985778808594, "global_step": 353740, "epoch": 2923} {"train_loss": -41.60828399658203, "global_step": 353741, "epoch": 2923} {"train_loss": -44.06740188598633, "global_step": 353742, "epoch": 2923} {"train_loss": -43.20325469970703, "global_step": 353743, "epoch": 2923} {"train_loss": -42.429080963134766, "global_step": 353744, "epoch": 2923} {"train_loss": -41.83553695678711, "global_step": 353745, "epoch": 2923} {"train_loss": -43.57624053955078, "global_step": 353746, "epoch": 2923} {"train_loss": -43.27106475830078, "global_step": 353747, "epoch": 2923} {"train_loss": -43.245670318603516, "global_step": 353748, "epoch": 2923} {"train_loss": -43.865638732910156, "global_step": 353749, "epoch": 2923} {"train_loss": -44.17469024658203, "global_step": 353750, "epoch": 2923} {"train_loss": -43.651206970214844, "global_step": 353751, "epoch": 2923} {"train_loss": -43.55336380004883, "global_step": 353752, "epoch": 2923} {"train_loss": -44.28824996948242, "global_step": 353753, "epoch": 2923} {"train_loss": -43.50154495239258, "global_step": 353754, "epoch": 2923} {"train_loss": -43.0411491394043, "global_step": 353755, "epoch": 2923} {"train_loss": -45.0980339050293, "global_step": 353756, "epoch": 2923} {"train_loss": -43.883644104003906, "global_step": 353757, "epoch": 2923} {"train_loss": -44.64170837402344, "global_step": 353758, "epoch": 2923} {"train_loss": -43.735923767089844, "global_step": 353759, "epoch": 2923} {"train_loss": -45.10804748535156, "global_step": 353760, "epoch": 2923} {"train_loss": -44.30497360229492, "global_step": 353761, "epoch": 2923} {"train_loss": -44.66788101196289, "global_step": 353762, "epoch": 2923} {"train_loss": -44.030906677246094, "global_step": 353763, "epoch": 2923} {"train_loss": -44.70406723022461, "global_step": 353764, "epoch": 2923} {"train_loss": -44.32508850097656, "global_step": 353765, "epoch": 2923} {"train_loss": -43.97430419921875, "global_step": 353766, "epoch": 2923} {"train_loss": -44.56979751586914, "global_step": 353767, "epoch": 2923} {"train_loss": -44.91461181640625, "global_step": 353768, "epoch": 2923} {"train_loss": -44.55308151245117, "global_step": 353769, "epoch": 2923} {"train_loss": -44.94377899169922, "global_step": 353770, "epoch": 2923} {"train_loss": -44.78889083862305, "global_step": 353771, "epoch": 2923} {"train_loss": -44.451988220214844, "global_step": 353772, "epoch": 2923} {"train_loss": -44.72337341308594, "global_step": 353773, "epoch": 2923} {"train_loss": -44.9283561706543, "global_step": 353774, "epoch": 2923} {"train_loss": -44.63556671142578, "global_step": 353775, "epoch": 2923} {"train_loss": -45.10465621948242, "global_step": 353776, "epoch": 2923} {"train_loss": -44.367340087890625, "global_step": 353777, "epoch": 2923} {"train_loss": -45.516845703125, "global_step": 353778, "epoch": 2923} {"train_loss": -45.311519622802734, "global_step": 353779, "epoch": 2923} {"train_loss": -45.47674560546875, "global_step": 353780, "epoch": 2923} {"train_loss": -45.5169563293457, "global_step": 353781, "epoch": 2923} {"train_loss": -45.070438385009766, "global_step": 353782, "epoch": 2923} {"train_loss": -45.332881927490234, "global_step": 353783, "epoch": 2923} {"train_loss": -45.023109436035156, "global_step": 353784, "epoch": 2923} {"train_loss": -45.41181945800781, "global_step": 353785, "epoch": 2923} {"train_loss": -45.433250427246094, "global_step": 353786, "epoch": 2923} {"train_loss": -45.07908248901367, "global_step": 353787, "epoch": 2923} {"train_loss": -45.35575866699219, "global_step": 353788, "epoch": 2923} {"train_loss": -45.696327209472656, "global_step": 353789, "epoch": 2923} {"train_loss": -45.09596633911133, "global_step": 353790, "epoch": 2923} {"train_loss": -45.866214752197266, "global_step": 353791, "epoch": 2923} {"train_loss": -45.14662170410156, "global_step": 353792, "epoch": 2923} {"train_loss": -45.35544967651367, "global_step": 353793, "epoch": 2923} {"train_loss": -45.69124984741211, "global_step": 353794, "epoch": 2923} {"train_loss": -44.89588165283203, "global_step": 353795, "epoch": 2923} {"train_loss": -45.14922332763672, "global_step": 353796, "epoch": 2923} {"train_loss": -45.86445236206055, "global_step": 353797, "epoch": 2923} {"train_loss": -44.95948028564453, "global_step": 353798, "epoch": 2923} {"train_loss": -44.88678741455078, "global_step": 353799, "epoch": 2923} {"train_loss": -45.22015380859375, "global_step": 353800, "epoch": 2923} {"train_loss": -44.87202835083008, "global_step": 353801, "epoch": 2923} {"train_loss": -45.1809196472168, "global_step": 353802, "epoch": 2923} {"train_loss": -44.2995533588504, "global_step": 353803, "epoch": 2923, "val_loss": 2546050.0} {"train_loss": -44.7830696105957, "global_step": 353804, "epoch": 2924} {"train_loss": -45.28491973876953, "global_step": 353805, "epoch": 2924} {"train_loss": -44.86812973022461, "global_step": 353806, "epoch": 2924} {"train_loss": -43.67934799194336, "global_step": 353807, "epoch": 2924} {"train_loss": -43.648162841796875, "global_step": 353808, "epoch": 2924} {"train_loss": -44.54819107055664, "global_step": 353809, "epoch": 2924} {"train_loss": -45.407386779785156, "global_step": 353810, "epoch": 2924} {"train_loss": -45.50967025756836, "global_step": 353811, "epoch": 2924} {"train_loss": -43.837032318115234, "global_step": 353812, "epoch": 2924} {"train_loss": -44.40496826171875, "global_step": 353813, "epoch": 2924} {"train_loss": -45.1459846496582, "global_step": 353814, "epoch": 2924} {"train_loss": -45.17425537109375, "global_step": 353815, "epoch": 2924} {"train_loss": -45.5316162109375, "global_step": 353816, "epoch": 2924} {"train_loss": -45.36637496948242, "global_step": 353817, "epoch": 2924} {"train_loss": -44.7960205078125, "global_step": 353818, "epoch": 2924} {"train_loss": -45.29315948486328, "global_step": 353819, "epoch": 2924} {"train_loss": -44.85615158081055, "global_step": 353820, "epoch": 2924} {"train_loss": -43.95394515991211, "global_step": 353821, "epoch": 2924} {"train_loss": -43.561458587646484, "global_step": 353822, "epoch": 2924} {"train_loss": -42.891632080078125, "global_step": 353823, "epoch": 2924} {"train_loss": -43.54941940307617, "global_step": 353824, "epoch": 2924} {"train_loss": -44.84049606323242, "global_step": 353825, "epoch": 2924} {"train_loss": -43.25876998901367, "global_step": 353826, "epoch": 2924} {"train_loss": -42.408241271972656, "global_step": 353827, "epoch": 2924} {"train_loss": -44.706146240234375, "global_step": 353828, "epoch": 2924} {"train_loss": -44.83598709106445, "global_step": 353829, "epoch": 2924} {"train_loss": -44.0868034362793, "global_step": 353830, "epoch": 2924} {"train_loss": -45.22125244140625, "global_step": 353831, "epoch": 2924} {"train_loss": -45.57328414916992, "global_step": 353832, "epoch": 2924} {"train_loss": -45.020172119140625, "global_step": 353833, "epoch": 2924} {"train_loss": -45.38576126098633, "global_step": 353834, "epoch": 2924} {"train_loss": -45.10071563720703, "global_step": 353835, "epoch": 2924} {"train_loss": -45.1155891418457, "global_step": 353836, "epoch": 2924} {"train_loss": -44.736690521240234, "global_step": 353837, "epoch": 2924} {"train_loss": -45.28581619262695, "global_step": 353838, "epoch": 2924} {"train_loss": -45.71213912963867, "global_step": 353839, "epoch": 2924} {"train_loss": -45.048004150390625, "global_step": 353840, "epoch": 2924} {"train_loss": -45.12261199951172, "global_step": 353841, "epoch": 2924} {"train_loss": -44.79656982421875, "global_step": 353842, "epoch": 2924} {"train_loss": -44.918636322021484, "global_step": 353843, "epoch": 2924} {"train_loss": -45.220027923583984, "global_step": 353844, "epoch": 2924} {"train_loss": -45.36491012573242, "global_step": 353845, "epoch": 2924} {"train_loss": -44.70109176635742, "global_step": 353846, "epoch": 2924} {"train_loss": -44.79398727416992, "global_step": 353847, "epoch": 2924} {"train_loss": -45.82147216796875, "global_step": 353848, "epoch": 2924} {"train_loss": -44.92641830444336, "global_step": 353849, "epoch": 2924} {"train_loss": -45.13936233520508, "global_step": 353850, "epoch": 2924} {"train_loss": -44.4427375793457, "global_step": 353851, "epoch": 2924} {"train_loss": -44.92304611206055, "global_step": 353852, "epoch": 2924} {"train_loss": -44.02631759643555, "global_step": 353853, "epoch": 2924} {"train_loss": -44.252471923828125, "global_step": 353854, "epoch": 2924} {"train_loss": -44.35431671142578, "global_step": 353855, "epoch": 2924} {"train_loss": -44.195518493652344, "global_step": 353856, "epoch": 2924} {"train_loss": -43.8016357421875, "global_step": 353857, "epoch": 2924} {"train_loss": -43.818782806396484, "global_step": 353858, "epoch": 2924} {"train_loss": -43.77925491333008, "global_step": 353859, "epoch": 2924} {"train_loss": -44.35089874267578, "global_step": 353860, "epoch": 2924} {"train_loss": -44.26682662963867, "global_step": 353861, "epoch": 2924} {"train_loss": -43.87763595581055, "global_step": 353862, "epoch": 2924} {"train_loss": -41.52494430541992, "global_step": 353863, "epoch": 2924} {"train_loss": -43.976558685302734, "global_step": 353864, "epoch": 2924} {"train_loss": -42.7005500793457, "global_step": 353865, "epoch": 2924} {"train_loss": -42.804931640625, "global_step": 353866, "epoch": 2924} {"train_loss": -41.596099853515625, "global_step": 353867, "epoch": 2924} {"train_loss": -43.35512161254883, "global_step": 353868, "epoch": 2924} {"train_loss": -41.38556671142578, "global_step": 353869, "epoch": 2924} {"train_loss": -40.826656341552734, "global_step": 353870, "epoch": 2924} {"train_loss": -44.53529739379883, "global_step": 353871, "epoch": 2924} {"train_loss": -43.613128662109375, "global_step": 353872, "epoch": 2924} {"train_loss": -42.608184814453125, "global_step": 353873, "epoch": 2924} {"train_loss": -42.02638626098633, "global_step": 353874, "epoch": 2924} {"train_loss": -43.32416534423828, "global_step": 353875, "epoch": 2924} {"train_loss": -44.14617919921875, "global_step": 353876, "epoch": 2924} {"train_loss": -43.146705627441406, "global_step": 353877, "epoch": 2924} {"train_loss": -43.89901351928711, "global_step": 353878, "epoch": 2924} {"train_loss": -44.80160140991211, "global_step": 353879, "epoch": 2924} {"train_loss": -43.33890914916992, "global_step": 353880, "epoch": 2924} {"train_loss": -44.16510009765625, "global_step": 353881, "epoch": 2924} {"train_loss": -43.516475677490234, "global_step": 353882, "epoch": 2924} {"train_loss": -43.713645935058594, "global_step": 353883, "epoch": 2924} {"train_loss": -42.45945358276367, "global_step": 353884, "epoch": 2924} {"train_loss": -44.202659606933594, "global_step": 353885, "epoch": 2924} {"train_loss": -42.8646125793457, "global_step": 353886, "epoch": 2924} {"train_loss": -42.962825775146484, "global_step": 353887, "epoch": 2924} {"train_loss": -44.30481719970703, "global_step": 353888, "epoch": 2924} {"train_loss": -44.067909240722656, "global_step": 353889, "epoch": 2924} {"train_loss": -44.53225326538086, "global_step": 353890, "epoch": 2924} {"train_loss": -44.52254867553711, "global_step": 353891, "epoch": 2924} {"train_loss": -43.66763687133789, "global_step": 353892, "epoch": 2924} {"train_loss": -44.5252571105957, "global_step": 353893, "epoch": 2924} {"train_loss": -44.50908660888672, "global_step": 353894, "epoch": 2924} {"train_loss": -44.58662033081055, "global_step": 353895, "epoch": 2924} {"train_loss": -44.466548919677734, "global_step": 353896, "epoch": 2924} {"train_loss": -44.87026596069336, "global_step": 353897, "epoch": 2924} {"train_loss": -44.491493225097656, "global_step": 353898, "epoch": 2924} {"train_loss": -44.24026107788086, "global_step": 353899, "epoch": 2924} {"train_loss": -44.75434875488281, "global_step": 353900, "epoch": 2924} {"train_loss": -44.63241958618164, "global_step": 353901, "epoch": 2924} {"train_loss": -44.690147399902344, "global_step": 353902, "epoch": 2924} {"train_loss": -45.06266403198242, "global_step": 353903, "epoch": 2924} {"train_loss": -45.02134323120117, "global_step": 353904, "epoch": 2924} {"train_loss": -45.427852630615234, "global_step": 353905, "epoch": 2924} {"train_loss": -44.788734436035156, "global_step": 353906, "epoch": 2924} {"train_loss": -45.32957077026367, "global_step": 353907, "epoch": 2924} {"train_loss": -44.8953857421875, "global_step": 353908, "epoch": 2924} {"train_loss": -45.1038932800293, "global_step": 353909, "epoch": 2924} {"train_loss": -44.343467712402344, "global_step": 353910, "epoch": 2924} {"train_loss": -44.99055862426758, "global_step": 353911, "epoch": 2924} {"train_loss": -45.00576400756836, "global_step": 353912, "epoch": 2924} {"train_loss": -45.30070114135742, "global_step": 353913, "epoch": 2924} {"train_loss": -44.71711349487305, "global_step": 353914, "epoch": 2924} {"train_loss": -44.718597412109375, "global_step": 353915, "epoch": 2924} {"train_loss": -45.44822311401367, "global_step": 353916, "epoch": 2924} {"train_loss": -45.0725212097168, "global_step": 353917, "epoch": 2924} {"train_loss": -44.74839401245117, "global_step": 353918, "epoch": 2924} {"train_loss": -44.98249435424805, "global_step": 353919, "epoch": 2924} {"train_loss": -45.530452728271484, "global_step": 353920, "epoch": 2924} {"train_loss": -44.79530715942383, "global_step": 353921, "epoch": 2924} {"train_loss": -45.33179473876953, "global_step": 353922, "epoch": 2924} {"train_loss": -45.73464584350586, "global_step": 353923, "epoch": 2924} {"train_loss": -44.37452464458371, "global_step": 353924, "epoch": 2924, "val_loss": 2497595.25} {"train_loss": -44.9711799621582, "global_step": 353925, "epoch": 2925} {"train_loss": -45.280460357666016, "global_step": 353926, "epoch": 2925} {"train_loss": -45.7007942199707, "global_step": 353927, "epoch": 2925} {"train_loss": -45.34114074707031, "global_step": 353928, "epoch": 2925} {"train_loss": -45.459510803222656, "global_step": 353929, "epoch": 2925} {"train_loss": -44.98952865600586, "global_step": 353930, "epoch": 2925} {"train_loss": -44.59495544433594, "global_step": 353931, "epoch": 2925} {"train_loss": -45.37720489501953, "global_step": 353932, "epoch": 2925} {"train_loss": -44.12306594848633, "global_step": 353933, "epoch": 2925} {"train_loss": -43.90924835205078, "global_step": 353934, "epoch": 2925} {"train_loss": -45.66891098022461, "global_step": 353935, "epoch": 2925} {"train_loss": -45.18608856201172, "global_step": 353936, "epoch": 2925} {"train_loss": -44.769344329833984, "global_step": 353937, "epoch": 2925} {"train_loss": -45.81574249267578, "global_step": 353938, "epoch": 2925} {"train_loss": -45.05814743041992, "global_step": 353939, "epoch": 2925} {"train_loss": -45.2291374206543, "global_step": 353940, "epoch": 2925} {"train_loss": -44.92332458496094, "global_step": 353941, "epoch": 2925} {"train_loss": -44.731868743896484, "global_step": 353942, "epoch": 2925} {"train_loss": -43.20884323120117, "global_step": 353943, "epoch": 2925} {"train_loss": -44.38050079345703, "global_step": 353944, "epoch": 2925} {"train_loss": -44.64751434326172, "global_step": 353945, "epoch": 2925} {"train_loss": -44.608943939208984, "global_step": 353946, "epoch": 2925} {"train_loss": -44.688899993896484, "global_step": 353947, "epoch": 2925} {"train_loss": -44.467529296875, "global_step": 353948, "epoch": 2925} {"train_loss": -43.9107551574707, "global_step": 353949, "epoch": 2925} {"train_loss": -44.9648323059082, "global_step": 353950, "epoch": 2925} {"train_loss": -44.73866653442383, "global_step": 353951, "epoch": 2925} {"train_loss": -44.066200256347656, "global_step": 353952, "epoch": 2925} {"train_loss": -44.87465286254883, "global_step": 353953, "epoch": 2925} {"train_loss": -44.77034378051758, "global_step": 353954, "epoch": 2925} {"train_loss": -44.522579193115234, "global_step": 353955, "epoch": 2925} {"train_loss": -44.23090744018555, "global_step": 353956, "epoch": 2925} {"train_loss": -43.8245735168457, "global_step": 353957, "epoch": 2925} {"train_loss": -44.479835510253906, "global_step": 353958, "epoch": 2925} {"train_loss": -45.21992492675781, "global_step": 353959, "epoch": 2925} {"train_loss": -44.499122619628906, "global_step": 353960, "epoch": 2925} {"train_loss": -45.04798889160156, "global_step": 353961, "epoch": 2925} {"train_loss": -44.83742904663086, "global_step": 353962, "epoch": 2925} {"train_loss": -43.68334197998047, "global_step": 353963, "epoch": 2925} {"train_loss": -44.22852325439453, "global_step": 353964, "epoch": 2925} {"train_loss": -44.61731719970703, "global_step": 353965, "epoch": 2925} {"train_loss": -45.74949264526367, "global_step": 353966, "epoch": 2925} {"train_loss": -45.46234893798828, "global_step": 353967, "epoch": 2925} {"train_loss": -44.77974319458008, "global_step": 353968, "epoch": 2925} {"train_loss": -45.104766845703125, "global_step": 353969, "epoch": 2925} {"train_loss": -45.22056198120117, "global_step": 353970, "epoch": 2925} {"train_loss": -44.316036224365234, "global_step": 353971, "epoch": 2925} {"train_loss": -44.742977142333984, "global_step": 353972, "epoch": 2925} {"train_loss": -44.42118453979492, "global_step": 353973, "epoch": 2925} {"train_loss": -43.95951461791992, "global_step": 353974, "epoch": 2925} {"train_loss": -45.01093673706055, "global_step": 353975, "epoch": 2925} {"train_loss": -44.18723678588867, "global_step": 353976, "epoch": 2925} {"train_loss": -43.399654388427734, "global_step": 353977, "epoch": 2925} {"train_loss": -45.17348098754883, "global_step": 353978, "epoch": 2925} {"train_loss": -44.72216033935547, "global_step": 353979, "epoch": 2925} {"train_loss": -42.8846435546875, "global_step": 353980, "epoch": 2925} {"train_loss": -44.23076248168945, "global_step": 353981, "epoch": 2925} {"train_loss": -44.088253021240234, "global_step": 353982, "epoch": 2925} {"train_loss": -42.505218505859375, "global_step": 353983, "epoch": 2925} {"train_loss": -44.37238693237305, "global_step": 353984, "epoch": 2925} {"train_loss": -43.6220703125, "global_step": 353985, "epoch": 2925} {"train_loss": -44.358455657958984, "global_step": 353986, "epoch": 2925} {"train_loss": -43.9110221862793, "global_step": 353987, "epoch": 2925} {"train_loss": -42.17119598388672, "global_step": 353988, "epoch": 2925} {"train_loss": -43.624839782714844, "global_step": 353989, "epoch": 2925} {"train_loss": -43.58197021484375, "global_step": 353990, "epoch": 2925} {"train_loss": -42.06121826171875, "global_step": 353991, "epoch": 2925} {"train_loss": -43.22346115112305, "global_step": 353992, "epoch": 2925} {"train_loss": -44.14669418334961, "global_step": 353993, "epoch": 2925} {"train_loss": -43.01375961303711, "global_step": 353994, "epoch": 2925} {"train_loss": -42.959808349609375, "global_step": 353995, "epoch": 2925} {"train_loss": -43.50640869140625, "global_step": 353996, "epoch": 2925} {"train_loss": -42.37302780151367, "global_step": 353997, "epoch": 2925} {"train_loss": -43.01153564453125, "global_step": 353998, "epoch": 2925} {"train_loss": -43.63825607299805, "global_step": 353999, "epoch": 2925} {"train_loss": -41.9957160949707, "global_step": 354000, "epoch": 2925} {"train_loss": -44.092567443847656, "global_step": 354001, "epoch": 2925} {"train_loss": -43.56528854370117, "global_step": 354002, "epoch": 2925} {"train_loss": -42.60776901245117, "global_step": 354003, "epoch": 2925} {"train_loss": -44.257686614990234, "global_step": 354004, "epoch": 2925} {"train_loss": -43.36052322387695, "global_step": 354005, "epoch": 2925} {"train_loss": -44.061256408691406, "global_step": 354006, "epoch": 2925} {"train_loss": -43.57353210449219, "global_step": 354007, "epoch": 2925} {"train_loss": -44.087928771972656, "global_step": 354008, "epoch": 2925} {"train_loss": -43.678646087646484, "global_step": 354009, "epoch": 2925} {"train_loss": -44.60502243041992, "global_step": 354010, "epoch": 2925} {"train_loss": -44.025901794433594, "global_step": 354011, "epoch": 2925} {"train_loss": -44.12955093383789, "global_step": 354012, "epoch": 2925} {"train_loss": -44.30690002441406, "global_step": 354013, "epoch": 2925} {"train_loss": -43.14156723022461, "global_step": 354014, "epoch": 2925} {"train_loss": -45.122982025146484, "global_step": 354015, "epoch": 2925} {"train_loss": -43.92327880859375, "global_step": 354016, "epoch": 2925} {"train_loss": -44.99715042114258, "global_step": 354017, "epoch": 2925} {"train_loss": -43.960960388183594, "global_step": 354018, "epoch": 2925} {"train_loss": -44.296173095703125, "global_step": 354019, "epoch": 2925} {"train_loss": -44.55739974975586, "global_step": 354020, "epoch": 2925} {"train_loss": -44.954078674316406, "global_step": 354021, "epoch": 2925} {"train_loss": -44.6899299621582, "global_step": 354022, "epoch": 2925} {"train_loss": -44.74309539794922, "global_step": 354023, "epoch": 2925} {"train_loss": -44.416847229003906, "global_step": 354024, "epoch": 2925} {"train_loss": -43.75751876831055, "global_step": 354025, "epoch": 2925} {"train_loss": -45.139312744140625, "global_step": 354026, "epoch": 2925} {"train_loss": -43.890838623046875, "global_step": 354027, "epoch": 2925} {"train_loss": -45.31443405151367, "global_step": 354028, "epoch": 2925} {"train_loss": -45.22053527832031, "global_step": 354029, "epoch": 2925} {"train_loss": -45.372901916503906, "global_step": 354030, "epoch": 2925} {"train_loss": -45.08575439453125, "global_step": 354031, "epoch": 2925} {"train_loss": -44.84761047363281, "global_step": 354032, "epoch": 2925} {"train_loss": -45.2544059753418, "global_step": 354033, "epoch": 2925} {"train_loss": -44.70451354980469, "global_step": 354034, "epoch": 2925} {"train_loss": -45.25341033935547, "global_step": 354035, "epoch": 2925} {"train_loss": -45.496002197265625, "global_step": 354036, "epoch": 2925} {"train_loss": -44.92631912231445, "global_step": 354037, "epoch": 2925} {"train_loss": -45.22483444213867, "global_step": 354038, "epoch": 2925} {"train_loss": -43.812374114990234, "global_step": 354039, "epoch": 2925} {"train_loss": -45.39008331298828, "global_step": 354040, "epoch": 2925} {"train_loss": -44.31902313232422, "global_step": 354041, "epoch": 2925} {"train_loss": -44.388980865478516, "global_step": 354042, "epoch": 2925} {"train_loss": -45.15590286254883, "global_step": 354043, "epoch": 2925} {"train_loss": -43.50335693359375, "global_step": 354044, "epoch": 2925} {"train_loss": -44.37795040036036, "global_step": 354045, "epoch": 2925, "val_loss": 2485469.75} {"train_loss": -44.95588302612305, "global_step": 354046, "epoch": 2926} {"train_loss": -44.67547607421875, "global_step": 354047, "epoch": 2926} {"train_loss": -45.358131408691406, "global_step": 354048, "epoch": 2926} {"train_loss": -44.91791534423828, "global_step": 354049, "epoch": 2926} {"train_loss": -45.309356689453125, "global_step": 354050, "epoch": 2926} {"train_loss": -44.40560531616211, "global_step": 354051, "epoch": 2926} {"train_loss": -44.454463958740234, "global_step": 354052, "epoch": 2926} {"train_loss": -45.79347610473633, "global_step": 354053, "epoch": 2926} {"train_loss": -44.717933654785156, "global_step": 354054, "epoch": 2926} {"train_loss": -44.47121047973633, "global_step": 354055, "epoch": 2926} {"train_loss": -45.81940460205078, "global_step": 354056, "epoch": 2926} {"train_loss": -44.960235595703125, "global_step": 354057, "epoch": 2926} {"train_loss": -45.53255844116211, "global_step": 354058, "epoch": 2926} {"train_loss": -45.41579818725586, "global_step": 354059, "epoch": 2926} {"train_loss": -44.78743362426758, "global_step": 354060, "epoch": 2926} {"train_loss": -45.546241760253906, "global_step": 354061, "epoch": 2926} {"train_loss": -44.997589111328125, "global_step": 354062, "epoch": 2926} {"train_loss": -45.72972869873047, "global_step": 354063, "epoch": 2926} {"train_loss": -45.34357452392578, "global_step": 354064, "epoch": 2926} {"train_loss": -45.46598434448242, "global_step": 354065, "epoch": 2926} {"train_loss": -45.68043899536133, "global_step": 354066, "epoch": 2926} {"train_loss": -45.22453689575195, "global_step": 354067, "epoch": 2926} {"train_loss": -44.874061584472656, "global_step": 354068, "epoch": 2926} {"train_loss": -45.2926139831543, "global_step": 354069, "epoch": 2926} {"train_loss": -44.7808837890625, "global_step": 354070, "epoch": 2926} {"train_loss": -45.24430465698242, "global_step": 354071, "epoch": 2926} {"train_loss": -43.60020065307617, "global_step": 354072, "epoch": 2926} {"train_loss": -44.110084533691406, "global_step": 354073, "epoch": 2926} {"train_loss": -44.892791748046875, "global_step": 354074, "epoch": 2926} {"train_loss": -43.76718521118164, "global_step": 354075, "epoch": 2926} {"train_loss": -44.6124382019043, "global_step": 354076, "epoch": 2926} {"train_loss": -44.13965606689453, "global_step": 354077, "epoch": 2926} {"train_loss": -43.74224853515625, "global_step": 354078, "epoch": 2926} {"train_loss": -44.527008056640625, "global_step": 354079, "epoch": 2926} {"train_loss": -45.118587493896484, "global_step": 354080, "epoch": 2926} {"train_loss": -43.430599212646484, "global_step": 354081, "epoch": 2926} {"train_loss": -43.75193405151367, "global_step": 354082, "epoch": 2926} {"train_loss": -44.572994232177734, "global_step": 354083, "epoch": 2926} {"train_loss": -45.211029052734375, "global_step": 354084, "epoch": 2926} {"train_loss": -44.93082809448242, "global_step": 354085, "epoch": 2926} {"train_loss": -45.14162826538086, "global_step": 354086, "epoch": 2926} {"train_loss": -45.65835189819336, "global_step": 354087, "epoch": 2926} {"train_loss": -44.78274917602539, "global_step": 354088, "epoch": 2926} {"train_loss": -45.27181625366211, "global_step": 354089, "epoch": 2926} {"train_loss": -44.68270492553711, "global_step": 354090, "epoch": 2926} {"train_loss": -44.88063430786133, "global_step": 354091, "epoch": 2926} {"train_loss": -45.01411819458008, "global_step": 354092, "epoch": 2926} {"train_loss": -45.21135711669922, "global_step": 354093, "epoch": 2926} {"train_loss": -45.27375030517578, "global_step": 354094, "epoch": 2926} {"train_loss": -45.326839447021484, "global_step": 354095, "epoch": 2926} {"train_loss": -43.75425720214844, "global_step": 354096, "epoch": 2926} {"train_loss": -44.031982421875, "global_step": 354097, "epoch": 2926} {"train_loss": -43.3069953918457, "global_step": 354098, "epoch": 2926} {"train_loss": -44.1682243347168, "global_step": 354099, "epoch": 2926} {"train_loss": -45.30241012573242, "global_step": 354100, "epoch": 2926} {"train_loss": -44.00261306762695, "global_step": 354101, "epoch": 2926} {"train_loss": -43.628936767578125, "global_step": 354102, "epoch": 2926} {"train_loss": -43.8227653503418, "global_step": 354103, "epoch": 2926} {"train_loss": -44.2503776550293, "global_step": 354104, "epoch": 2926} {"train_loss": -44.70634078979492, "global_step": 354105, "epoch": 2926} {"train_loss": -42.69416046142578, "global_step": 354106, "epoch": 2926} {"train_loss": -42.818511962890625, "global_step": 354107, "epoch": 2926} {"train_loss": -43.687129974365234, "global_step": 354108, "epoch": 2926} {"train_loss": -44.37502670288086, "global_step": 354109, "epoch": 2926} {"train_loss": -43.98456954956055, "global_step": 354110, "epoch": 2926} {"train_loss": -44.006752014160156, "global_step": 354111, "epoch": 2926} {"train_loss": -44.200408935546875, "global_step": 354112, "epoch": 2926} {"train_loss": -44.348976135253906, "global_step": 354113, "epoch": 2926} {"train_loss": -45.56969451904297, "global_step": 354114, "epoch": 2926} {"train_loss": -45.49411392211914, "global_step": 354115, "epoch": 2926} {"train_loss": -43.73232650756836, "global_step": 354116, "epoch": 2926} {"train_loss": -43.67867660522461, "global_step": 354117, "epoch": 2926} {"train_loss": -45.06317138671875, "global_step": 354118, "epoch": 2926} {"train_loss": -44.43636703491211, "global_step": 354119, "epoch": 2926} {"train_loss": -44.732906341552734, "global_step": 354120, "epoch": 2926} {"train_loss": -44.4297981262207, "global_step": 354121, "epoch": 2926} {"train_loss": -44.618560791015625, "global_step": 354122, "epoch": 2926} {"train_loss": -45.56031036376953, "global_step": 354123, "epoch": 2926} {"train_loss": -44.19462966918945, "global_step": 354124, "epoch": 2926} {"train_loss": -45.20195388793945, "global_step": 354125, "epoch": 2926} {"train_loss": -45.12921905517578, "global_step": 354126, "epoch": 2926} {"train_loss": -44.942806243896484, "global_step": 354127, "epoch": 2926} {"train_loss": -45.293067932128906, "global_step": 354128, "epoch": 2926} {"train_loss": -44.4415283203125, "global_step": 354129, "epoch": 2926} {"train_loss": -45.17629623413086, "global_step": 354130, "epoch": 2926} {"train_loss": -44.957881927490234, "global_step": 354131, "epoch": 2926} {"train_loss": -45.261817932128906, "global_step": 354132, "epoch": 2926} {"train_loss": -45.48274612426758, "global_step": 354133, "epoch": 2926} {"train_loss": -45.23188018798828, "global_step": 354134, "epoch": 2926} {"train_loss": -45.351837158203125, "global_step": 354135, "epoch": 2926} {"train_loss": -45.174076080322266, "global_step": 354136, "epoch": 2926} {"train_loss": -45.29874801635742, "global_step": 354137, "epoch": 2926} {"train_loss": -45.55658721923828, "global_step": 354138, "epoch": 2926} {"train_loss": -45.41126251220703, "global_step": 354139, "epoch": 2926} {"train_loss": -44.87773895263672, "global_step": 354140, "epoch": 2926} {"train_loss": -45.100215911865234, "global_step": 354141, "epoch": 2926} {"train_loss": -45.33696365356445, "global_step": 354142, "epoch": 2926} {"train_loss": -44.62370681762695, "global_step": 354143, "epoch": 2926} {"train_loss": -45.44183349609375, "global_step": 354144, "epoch": 2926} {"train_loss": -44.599220275878906, "global_step": 354145, "epoch": 2926} {"train_loss": -45.71696853637695, "global_step": 354146, "epoch": 2926} {"train_loss": -43.693660736083984, "global_step": 354147, "epoch": 2926} {"train_loss": -44.01384353637695, "global_step": 354148, "epoch": 2926} {"train_loss": -44.687740325927734, "global_step": 354149, "epoch": 2926} {"train_loss": -43.788909912109375, "global_step": 354150, "epoch": 2926} {"train_loss": -43.86741256713867, "global_step": 354151, "epoch": 2926} {"train_loss": -45.651180267333984, "global_step": 354152, "epoch": 2926} {"train_loss": -44.56147384643555, "global_step": 354153, "epoch": 2926} {"train_loss": -44.86511993408203, "global_step": 354154, "epoch": 2926} {"train_loss": -44.634315490722656, "global_step": 354155, "epoch": 2926} {"train_loss": -44.49013900756836, "global_step": 354156, "epoch": 2926} {"train_loss": -44.56272506713867, "global_step": 354157, "epoch": 2926} {"train_loss": -44.585052490234375, "global_step": 354158, "epoch": 2926} {"train_loss": -45.6480598449707, "global_step": 354159, "epoch": 2926} {"train_loss": -44.724876403808594, "global_step": 354160, "epoch": 2926} {"train_loss": -44.85536575317383, "global_step": 354161, "epoch": 2926} {"train_loss": -45.3243293762207, "global_step": 354162, "epoch": 2926} {"train_loss": -45.523162841796875, "global_step": 354163, "epoch": 2926} {"train_loss": -45.09339904785156, "global_step": 354164, "epoch": 2926} {"train_loss": -44.859554290771484, "global_step": 354165, "epoch": 2926} {"train_loss": -44.75861869370642, "global_step": 354166, "epoch": 2926, "val_loss": 2504695.75} {"train_loss": -44.903709411621094, "global_step": 354167, "epoch": 2927} {"train_loss": -45.68269729614258, "global_step": 354168, "epoch": 2927} {"train_loss": -45.09461212158203, "global_step": 354169, "epoch": 2927} {"train_loss": -43.958656311035156, "global_step": 354170, "epoch": 2927} {"train_loss": -44.94112777709961, "global_step": 354171, "epoch": 2927} {"train_loss": -45.405494689941406, "global_step": 354172, "epoch": 2927} {"train_loss": -45.55247116088867, "global_step": 354173, "epoch": 2927} {"train_loss": -44.21442413330078, "global_step": 354174, "epoch": 2927} {"train_loss": -45.39924621582031, "global_step": 354175, "epoch": 2927} {"train_loss": -44.539093017578125, "global_step": 354176, "epoch": 2927} {"train_loss": -45.37778854370117, "global_step": 354177, "epoch": 2927} {"train_loss": -45.02696990966797, "global_step": 354178, "epoch": 2927} {"train_loss": -44.98847579956055, "global_step": 354179, "epoch": 2927} {"train_loss": -43.14280319213867, "global_step": 354180, "epoch": 2927} {"train_loss": -43.79044723510742, "global_step": 354181, "epoch": 2927} {"train_loss": -43.44731903076172, "global_step": 354182, "epoch": 2927} {"train_loss": -44.59983825683594, "global_step": 354183, "epoch": 2927} {"train_loss": -44.7829704284668, "global_step": 354184, "epoch": 2927} {"train_loss": -45.4444580078125, "global_step": 354185, "epoch": 2927} {"train_loss": -45.057708740234375, "global_step": 354186, "epoch": 2927} {"train_loss": -45.6389274597168, "global_step": 354187, "epoch": 2927} {"train_loss": -44.963958740234375, "global_step": 354188, "epoch": 2927} {"train_loss": -45.30525588989258, "global_step": 354189, "epoch": 2927} {"train_loss": -45.64237594604492, "global_step": 354190, "epoch": 2927} {"train_loss": -44.8935661315918, "global_step": 354191, "epoch": 2927} {"train_loss": -44.88322448730469, "global_step": 354192, "epoch": 2927} {"train_loss": -44.78004455566406, "global_step": 354193, "epoch": 2927} {"train_loss": -45.5169563293457, "global_step": 354194, "epoch": 2927} {"train_loss": -45.42228698730469, "global_step": 354195, "epoch": 2927} {"train_loss": -45.25698471069336, "global_step": 354196, "epoch": 2927} {"train_loss": -46.03109359741211, "global_step": 354197, "epoch": 2927} {"train_loss": -45.757293701171875, "global_step": 354198, "epoch": 2927} {"train_loss": -46.12068557739258, "global_step": 354199, "epoch": 2927} {"train_loss": -45.28813552856445, "global_step": 354200, "epoch": 2927} {"train_loss": -45.01795196533203, "global_step": 354201, "epoch": 2927} {"train_loss": -45.00912094116211, "global_step": 354202, "epoch": 2927} {"train_loss": -45.44865036010742, "global_step": 354203, "epoch": 2927} {"train_loss": -45.341896057128906, "global_step": 354204, "epoch": 2927} {"train_loss": -44.61826705932617, "global_step": 354205, "epoch": 2927} {"train_loss": -45.32001876831055, "global_step": 354206, "epoch": 2927} {"train_loss": -45.25736618041992, "global_step": 354207, "epoch": 2927} {"train_loss": -42.91202163696289, "global_step": 354208, "epoch": 2927} {"train_loss": -43.75004196166992, "global_step": 354209, "epoch": 2927} {"train_loss": -44.40058517456055, "global_step": 354210, "epoch": 2927} {"train_loss": -44.86701965332031, "global_step": 354211, "epoch": 2927} {"train_loss": -44.109375, "global_step": 354212, "epoch": 2927} {"train_loss": -42.13459396362305, "global_step": 354213, "epoch": 2927} {"train_loss": -43.69466781616211, "global_step": 354214, "epoch": 2927} {"train_loss": -43.31478500366211, "global_step": 354215, "epoch": 2927} {"train_loss": -42.15645217895508, "global_step": 354216, "epoch": 2927} {"train_loss": -42.32374954223633, "global_step": 354217, "epoch": 2927} {"train_loss": -42.24463653564453, "global_step": 354218, "epoch": 2927} {"train_loss": -41.943603515625, "global_step": 354219, "epoch": 2927} {"train_loss": -43.16913986206055, "global_step": 354220, "epoch": 2927} {"train_loss": -40.76365280151367, "global_step": 354221, "epoch": 2927} {"train_loss": -42.695011138916016, "global_step": 354222, "epoch": 2927} {"train_loss": -37.94199752807617, "global_step": 354223, "epoch": 2927} {"train_loss": -42.286720275878906, "global_step": 354224, "epoch": 2927} {"train_loss": -31.76123046875, "global_step": 354225, "epoch": 2927} {"train_loss": -33.86125564575195, "global_step": 354226, "epoch": 2927} {"train_loss": -32.05022430419922, "global_step": 354227, "epoch": 2927} {"train_loss": -37.20039749145508, "global_step": 354228, "epoch": 2927} {"train_loss": -35.462005615234375, "global_step": 354229, "epoch": 2927} {"train_loss": -36.21122360229492, "global_step": 354230, "epoch": 2927} {"train_loss": -41.88572311401367, "global_step": 354231, "epoch": 2927} {"train_loss": -37.96369552612305, "global_step": 354232, "epoch": 2927} {"train_loss": -38.84377670288086, "global_step": 354233, "epoch": 2927} {"train_loss": -41.28944396972656, "global_step": 354234, "epoch": 2927} {"train_loss": -36.77720260620117, "global_step": 354235, "epoch": 2927} {"train_loss": -38.17832565307617, "global_step": 354236, "epoch": 2927} {"train_loss": -40.74763107299805, "global_step": 354237, "epoch": 2927} {"train_loss": -37.593868255615234, "global_step": 354238, "epoch": 2927} {"train_loss": -40.976016998291016, "global_step": 354239, "epoch": 2927} {"train_loss": -40.55013656616211, "global_step": 354240, "epoch": 2927} {"train_loss": -39.36875534057617, "global_step": 354241, "epoch": 2927} {"train_loss": -41.4433479309082, "global_step": 354242, "epoch": 2927} {"train_loss": -41.58510208129883, "global_step": 354243, "epoch": 2927} {"train_loss": -41.560546875, "global_step": 354244, "epoch": 2927} {"train_loss": -39.77947235107422, "global_step": 354245, "epoch": 2927} {"train_loss": -41.38015365600586, "global_step": 354246, "epoch": 2927} {"train_loss": -42.158363342285156, "global_step": 354247, "epoch": 2927} {"train_loss": -41.1505241394043, "global_step": 354248, "epoch": 2927} {"train_loss": -42.26021194458008, "global_step": 354249, "epoch": 2927} {"train_loss": -42.98820877075195, "global_step": 354250, "epoch": 2927} {"train_loss": -42.93507766723633, "global_step": 354251, "epoch": 2927} {"train_loss": -42.040504455566406, "global_step": 354252, "epoch": 2927} {"train_loss": -43.06459426879883, "global_step": 354253, "epoch": 2927} {"train_loss": -42.600372314453125, "global_step": 354254, "epoch": 2927} {"train_loss": -42.454437255859375, "global_step": 354255, "epoch": 2927} {"train_loss": -43.40496826171875, "global_step": 354256, "epoch": 2927} {"train_loss": -44.1451530456543, "global_step": 354257, "epoch": 2927} {"train_loss": -43.545249938964844, "global_step": 354258, "epoch": 2927} {"train_loss": -43.269710540771484, "global_step": 354259, "epoch": 2927} {"train_loss": -43.532100677490234, "global_step": 354260, "epoch": 2927} {"train_loss": -44.1953239440918, "global_step": 354261, "epoch": 2927} {"train_loss": -43.9538688659668, "global_step": 354262, "epoch": 2927} {"train_loss": -44.310665130615234, "global_step": 354263, "epoch": 2927} {"train_loss": -42.39540481567383, "global_step": 354264, "epoch": 2927} {"train_loss": -44.41252517700195, "global_step": 354265, "epoch": 2927} {"train_loss": -43.78761672973633, "global_step": 354266, "epoch": 2927} {"train_loss": -44.35405731201172, "global_step": 354267, "epoch": 2927} {"train_loss": -44.47407150268555, "global_step": 354268, "epoch": 2927} {"train_loss": -44.30192947387695, "global_step": 354269, "epoch": 2927} {"train_loss": -44.68584060668945, "global_step": 354270, "epoch": 2927} {"train_loss": -44.084449768066406, "global_step": 354271, "epoch": 2927} {"train_loss": -44.769439697265625, "global_step": 354272, "epoch": 2927} {"train_loss": -43.87693405151367, "global_step": 354273, "epoch": 2927} {"train_loss": -44.732513427734375, "global_step": 354274, "epoch": 2927} {"train_loss": -44.873512268066406, "global_step": 354275, "epoch": 2927} {"train_loss": -44.747589111328125, "global_step": 354276, "epoch": 2927} {"train_loss": -44.05133056640625, "global_step": 354277, "epoch": 2927} {"train_loss": -42.43144607543945, "global_step": 354278, "epoch": 2927} {"train_loss": -44.468772888183594, "global_step": 354279, "epoch": 2927} {"train_loss": -44.50990676879883, "global_step": 354280, "epoch": 2927} {"train_loss": -44.3004264831543, "global_step": 354281, "epoch": 2927} {"train_loss": -44.79935836791992, "global_step": 354282, "epoch": 2927} {"train_loss": -45.2180290222168, "global_step": 354283, "epoch": 2927} {"train_loss": -43.88077926635742, "global_step": 354284, "epoch": 2927} {"train_loss": -44.95646286010742, "global_step": 354285, "epoch": 2927} {"train_loss": -43.970699310302734, "global_step": 354286, "epoch": 2927} {"train_loss": -43.081480609483954, "global_step": 354287, "epoch": 2927, "val_loss": 2529294.5} {"train_loss": -44.87309646606445, "global_step": 354288, "epoch": 2928} {"train_loss": -45.01705551147461, "global_step": 354289, "epoch": 2928} {"train_loss": -44.88380813598633, "global_step": 354290, "epoch": 2928} {"train_loss": -45.12206268310547, "global_step": 354291, "epoch": 2928} {"train_loss": -45.13859176635742, "global_step": 354292, "epoch": 2928} {"train_loss": -44.80597686767578, "global_step": 354293, "epoch": 2928} {"train_loss": -45.08173751831055, "global_step": 354294, "epoch": 2928} {"train_loss": -43.87823486328125, "global_step": 354295, "epoch": 2928} {"train_loss": -42.857093811035156, "global_step": 354296, "epoch": 2928} {"train_loss": -42.86751174926758, "global_step": 354297, "epoch": 2928} {"train_loss": -44.04426956176758, "global_step": 354298, "epoch": 2928} {"train_loss": -43.087581634521484, "global_step": 354299, "epoch": 2928} {"train_loss": -44.3944206237793, "global_step": 354300, "epoch": 2928} {"train_loss": -44.4004020690918, "global_step": 354301, "epoch": 2928} {"train_loss": -42.2657585144043, "global_step": 354302, "epoch": 2928} {"train_loss": -44.65732192993164, "global_step": 354303, "epoch": 2928} {"train_loss": -44.67338943481445, "global_step": 354304, "epoch": 2928} {"train_loss": -44.579925537109375, "global_step": 354305, "epoch": 2928} {"train_loss": -45.03639602661133, "global_step": 354306, "epoch": 2928} {"train_loss": -44.73910140991211, "global_step": 354307, "epoch": 2928} {"train_loss": -44.41582489013672, "global_step": 354308, "epoch": 2928} {"train_loss": -43.502723693847656, "global_step": 354309, "epoch": 2928} {"train_loss": -43.93125534057617, "global_step": 354310, "epoch": 2928} {"train_loss": -43.912391662597656, "global_step": 354311, "epoch": 2928} {"train_loss": -43.488155364990234, "global_step": 354312, "epoch": 2928} {"train_loss": -43.97883987426758, "global_step": 354313, "epoch": 2928} {"train_loss": -45.455543518066406, "global_step": 354314, "epoch": 2928} {"train_loss": -44.567508697509766, "global_step": 354315, "epoch": 2928} {"train_loss": -44.30499267578125, "global_step": 354316, "epoch": 2928} {"train_loss": -43.78795623779297, "global_step": 354317, "epoch": 2928} {"train_loss": -43.5340690612793, "global_step": 354318, "epoch": 2928} {"train_loss": -44.48810958862305, "global_step": 354319, "epoch": 2928} {"train_loss": -44.48256301879883, "global_step": 354320, "epoch": 2928} {"train_loss": -44.2951774597168, "global_step": 354321, "epoch": 2928} {"train_loss": -43.879127502441406, "global_step": 354322, "epoch": 2928} {"train_loss": -44.94379425048828, "global_step": 354323, "epoch": 2928} {"train_loss": -44.52749252319336, "global_step": 354324, "epoch": 2928} {"train_loss": -44.76115036010742, "global_step": 354325, "epoch": 2928} {"train_loss": -44.88458251953125, "global_step": 354326, "epoch": 2928} {"train_loss": -44.57244873046875, "global_step": 354327, "epoch": 2928} {"train_loss": -44.40420150756836, "global_step": 354328, "epoch": 2928} {"train_loss": -43.18990707397461, "global_step": 354329, "epoch": 2928} {"train_loss": -44.126068115234375, "global_step": 354330, "epoch": 2928} {"train_loss": -43.839656829833984, "global_step": 354331, "epoch": 2928} {"train_loss": -44.19424057006836, "global_step": 354332, "epoch": 2928} {"train_loss": -44.60036849975586, "global_step": 354333, "epoch": 2928} {"train_loss": -45.106483459472656, "global_step": 354334, "epoch": 2928} {"train_loss": -45.194278717041016, "global_step": 354335, "epoch": 2928} {"train_loss": -44.34035110473633, "global_step": 354336, "epoch": 2928} {"train_loss": -42.81826400756836, "global_step": 354337, "epoch": 2928} {"train_loss": -45.3861198425293, "global_step": 354338, "epoch": 2928} {"train_loss": -43.538490295410156, "global_step": 354339, "epoch": 2928} {"train_loss": -43.0085334777832, "global_step": 354340, "epoch": 2928} {"train_loss": -45.1314697265625, "global_step": 354341, "epoch": 2928} {"train_loss": -45.16244125366211, "global_step": 354342, "epoch": 2928} {"train_loss": -44.16485595703125, "global_step": 354343, "epoch": 2928} {"train_loss": -44.51158142089844, "global_step": 354344, "epoch": 2928} {"train_loss": -44.276737213134766, "global_step": 354345, "epoch": 2928} {"train_loss": -43.113441467285156, "global_step": 354346, "epoch": 2928} {"train_loss": -44.22081756591797, "global_step": 354347, "epoch": 2928} {"train_loss": -44.37091064453125, "global_step": 354348, "epoch": 2928} {"train_loss": -44.3036003112793, "global_step": 354349, "epoch": 2928} {"train_loss": -41.838539123535156, "global_step": 354350, "epoch": 2928} {"train_loss": -42.446998596191406, "global_step": 354351, "epoch": 2928} {"train_loss": -44.010623931884766, "global_step": 354352, "epoch": 2928} {"train_loss": -42.54818344116211, "global_step": 354353, "epoch": 2928} {"train_loss": -43.44923400878906, "global_step": 354354, "epoch": 2928} {"train_loss": -42.00944900512695, "global_step": 354355, "epoch": 2928} {"train_loss": -42.14571762084961, "global_step": 354356, "epoch": 2928} {"train_loss": -43.85088348388672, "global_step": 354357, "epoch": 2928} {"train_loss": -43.016143798828125, "global_step": 354358, "epoch": 2928} {"train_loss": -44.7336311340332, "global_step": 354359, "epoch": 2928} {"train_loss": -43.72449493408203, "global_step": 354360, "epoch": 2928} {"train_loss": -43.03404998779297, "global_step": 354361, "epoch": 2928} {"train_loss": -44.37150955200195, "global_step": 354362, "epoch": 2928} {"train_loss": -42.7433967590332, "global_step": 354363, "epoch": 2928} {"train_loss": -44.280548095703125, "global_step": 354364, "epoch": 2928} {"train_loss": -44.76667785644531, "global_step": 354365, "epoch": 2928} {"train_loss": -43.080291748046875, "global_step": 354366, "epoch": 2928} {"train_loss": -44.31195068359375, "global_step": 354367, "epoch": 2928} {"train_loss": -44.76247787475586, "global_step": 354368, "epoch": 2928} {"train_loss": -43.935096740722656, "global_step": 354369, "epoch": 2928} {"train_loss": -44.43183517456055, "global_step": 354370, "epoch": 2928} {"train_loss": -44.961238861083984, "global_step": 354371, "epoch": 2928} {"train_loss": -44.156856536865234, "global_step": 354372, "epoch": 2928} {"train_loss": -44.97856521606445, "global_step": 354373, "epoch": 2928} {"train_loss": -44.00503158569336, "global_step": 354374, "epoch": 2928} {"train_loss": -44.40766525268555, "global_step": 354375, "epoch": 2928} {"train_loss": -44.47768020629883, "global_step": 354376, "epoch": 2928} {"train_loss": -42.990840911865234, "global_step": 354377, "epoch": 2928} {"train_loss": -44.35970687866211, "global_step": 354378, "epoch": 2928} {"train_loss": -43.9498291015625, "global_step": 354379, "epoch": 2928} {"train_loss": -43.29624938964844, "global_step": 354380, "epoch": 2928} {"train_loss": -44.60927200317383, "global_step": 354381, "epoch": 2928} {"train_loss": -44.171321868896484, "global_step": 354382, "epoch": 2928} {"train_loss": -44.54238510131836, "global_step": 354383, "epoch": 2928} {"train_loss": -43.26357650756836, "global_step": 354384, "epoch": 2928} {"train_loss": -43.94436264038086, "global_step": 354385, "epoch": 2928} {"train_loss": -44.3083381652832, "global_step": 354386, "epoch": 2928} {"train_loss": -44.6580810546875, "global_step": 354387, "epoch": 2928} {"train_loss": -44.53467559814453, "global_step": 354388, "epoch": 2928} {"train_loss": -44.747989654541016, "global_step": 354389, "epoch": 2928} {"train_loss": -44.3423957824707, "global_step": 354390, "epoch": 2928} {"train_loss": -45.2884407043457, "global_step": 354391, "epoch": 2928} {"train_loss": -44.893798828125, "global_step": 354392, "epoch": 2928} {"train_loss": -45.00482177734375, "global_step": 354393, "epoch": 2928} {"train_loss": -45.6251106262207, "global_step": 354394, "epoch": 2928} {"train_loss": -44.4706916809082, "global_step": 354395, "epoch": 2928} {"train_loss": -43.38629150390625, "global_step": 354396, "epoch": 2928} {"train_loss": -44.87750244140625, "global_step": 354397, "epoch": 2928} {"train_loss": -44.49773025512695, "global_step": 354398, "epoch": 2928} {"train_loss": -45.02973556518555, "global_step": 354399, "epoch": 2928} {"train_loss": -44.946144104003906, "global_step": 354400, "epoch": 2928} {"train_loss": -44.57804870605469, "global_step": 354401, "epoch": 2928} {"train_loss": -45.71574020385742, "global_step": 354402, "epoch": 2928} {"train_loss": -45.367515563964844, "global_step": 354403, "epoch": 2928} {"train_loss": -44.8839225769043, "global_step": 354404, "epoch": 2928} {"train_loss": -43.73154830932617, "global_step": 354405, "epoch": 2928} {"train_loss": -44.84817886352539, "global_step": 354406, "epoch": 2928} {"train_loss": -45.19098663330078, "global_step": 354407, "epoch": 2928} {"train_loss": -44.2216145854351, "global_step": 354408, "epoch": 2928, "val_loss": 2499271.5} {"train_loss": -44.73012924194336, "global_step": 354409, "epoch": 2929} {"train_loss": -44.34096145629883, "global_step": 354410, "epoch": 2929} {"train_loss": -45.156028747558594, "global_step": 354411, "epoch": 2929} {"train_loss": -43.37150192260742, "global_step": 354412, "epoch": 2929} {"train_loss": -44.570526123046875, "global_step": 354413, "epoch": 2929} {"train_loss": -44.18715286254883, "global_step": 354414, "epoch": 2929} {"train_loss": -44.395057678222656, "global_step": 354415, "epoch": 2929} {"train_loss": -45.07589340209961, "global_step": 354416, "epoch": 2929} {"train_loss": -44.713233947753906, "global_step": 354417, "epoch": 2929} {"train_loss": -45.09014892578125, "global_step": 354418, "epoch": 2929} {"train_loss": -41.34282302856445, "global_step": 354419, "epoch": 2929} {"train_loss": -45.19611740112305, "global_step": 354420, "epoch": 2929} {"train_loss": -44.16415023803711, "global_step": 354421, "epoch": 2929} {"train_loss": -43.55330276489258, "global_step": 354422, "epoch": 2929} {"train_loss": -44.71931076049805, "global_step": 354423, "epoch": 2929} {"train_loss": -43.35641098022461, "global_step": 354424, "epoch": 2929} {"train_loss": -44.38754653930664, "global_step": 354425, "epoch": 2929} {"train_loss": -44.58466720581055, "global_step": 354426, "epoch": 2929} {"train_loss": -44.94993209838867, "global_step": 354427, "epoch": 2929} {"train_loss": -44.941497802734375, "global_step": 354428, "epoch": 2929} {"train_loss": -44.90242385864258, "global_step": 354429, "epoch": 2929} {"train_loss": -45.15987777709961, "global_step": 354430, "epoch": 2929} {"train_loss": -45.23173904418945, "global_step": 354431, "epoch": 2929} {"train_loss": -45.2772331237793, "global_step": 354432, "epoch": 2929} {"train_loss": -44.16691970825195, "global_step": 354433, "epoch": 2929} {"train_loss": -45.348087310791016, "global_step": 354434, "epoch": 2929} {"train_loss": -42.587371826171875, "global_step": 354435, "epoch": 2929} {"train_loss": -44.21665573120117, "global_step": 354436, "epoch": 2929} {"train_loss": -44.88190841674805, "global_step": 354437, "epoch": 2929} {"train_loss": -45.15740966796875, "global_step": 354438, "epoch": 2929} {"train_loss": -45.3079719543457, "global_step": 354439, "epoch": 2929} {"train_loss": -45.335479736328125, "global_step": 354440, "epoch": 2929} {"train_loss": -44.35559844970703, "global_step": 354441, "epoch": 2929} {"train_loss": -45.16361618041992, "global_step": 354442, "epoch": 2929} {"train_loss": -43.952491760253906, "global_step": 354443, "epoch": 2929} {"train_loss": -45.51594161987305, "global_step": 354444, "epoch": 2929} {"train_loss": -45.155799865722656, "global_step": 354445, "epoch": 2929} {"train_loss": -44.9178466796875, "global_step": 354446, "epoch": 2929} {"train_loss": -44.208492279052734, "global_step": 354447, "epoch": 2929} {"train_loss": -43.91432189941406, "global_step": 354448, "epoch": 2929} {"train_loss": -43.51255416870117, "global_step": 354449, "epoch": 2929} {"train_loss": -44.837303161621094, "global_step": 354450, "epoch": 2929} {"train_loss": -43.24794387817383, "global_step": 354451, "epoch": 2929} {"train_loss": -42.79716110229492, "global_step": 354452, "epoch": 2929} {"train_loss": -44.987342834472656, "global_step": 354453, "epoch": 2929} {"train_loss": -44.27578353881836, "global_step": 354454, "epoch": 2929} {"train_loss": -43.9382438659668, "global_step": 354455, "epoch": 2929} {"train_loss": -43.38886642456055, "global_step": 354456, "epoch": 2929} {"train_loss": -44.104488372802734, "global_step": 354457, "epoch": 2929} {"train_loss": -44.833404541015625, "global_step": 354458, "epoch": 2929} {"train_loss": -45.559505462646484, "global_step": 354459, "epoch": 2929} {"train_loss": -44.59772491455078, "global_step": 354460, "epoch": 2929} {"train_loss": -42.92593002319336, "global_step": 354461, "epoch": 2929} {"train_loss": -44.137298583984375, "global_step": 354462, "epoch": 2929} {"train_loss": -43.962982177734375, "global_step": 354463, "epoch": 2929} {"train_loss": -43.483516693115234, "global_step": 354464, "epoch": 2929} {"train_loss": -44.93356704711914, "global_step": 354465, "epoch": 2929} {"train_loss": -43.26883316040039, "global_step": 354466, "epoch": 2929} {"train_loss": -43.67747116088867, "global_step": 354467, "epoch": 2929} {"train_loss": -44.64588165283203, "global_step": 354468, "epoch": 2929} {"train_loss": -44.12594223022461, "global_step": 354469, "epoch": 2929} {"train_loss": -43.37944412231445, "global_step": 354470, "epoch": 2929} {"train_loss": -44.7385368347168, "global_step": 354471, "epoch": 2929} {"train_loss": -44.22056198120117, "global_step": 354472, "epoch": 2929} {"train_loss": -42.92123794555664, "global_step": 354473, "epoch": 2929} {"train_loss": -44.50921630859375, "global_step": 354474, "epoch": 2929} {"train_loss": -44.08195877075195, "global_step": 354475, "epoch": 2929} {"train_loss": -43.00030517578125, "global_step": 354476, "epoch": 2929} {"train_loss": -42.79902267456055, "global_step": 354477, "epoch": 2929} {"train_loss": -41.65752029418945, "global_step": 354478, "epoch": 2929} {"train_loss": -43.773216247558594, "global_step": 354479, "epoch": 2929} {"train_loss": -40.82719039916992, "global_step": 354480, "epoch": 2929} {"train_loss": -41.62723922729492, "global_step": 354481, "epoch": 2929} {"train_loss": -42.952064514160156, "global_step": 354482, "epoch": 2929} {"train_loss": -43.37630081176758, "global_step": 354483, "epoch": 2929} {"train_loss": -42.960201263427734, "global_step": 354484, "epoch": 2929} {"train_loss": -42.843379974365234, "global_step": 354485, "epoch": 2929} {"train_loss": -43.26286697387695, "global_step": 354486, "epoch": 2929} {"train_loss": -39.8126220703125, "global_step": 354487, "epoch": 2929} {"train_loss": -43.0589714050293, "global_step": 354488, "epoch": 2929} {"train_loss": -41.933658599853516, "global_step": 354489, "epoch": 2929} {"train_loss": -41.437339782714844, "global_step": 354490, "epoch": 2929} {"train_loss": -43.94838333129883, "global_step": 354491, "epoch": 2929} {"train_loss": -41.67780685424805, "global_step": 354492, "epoch": 2929} {"train_loss": -41.59499740600586, "global_step": 354493, "epoch": 2929} {"train_loss": -42.09629821777344, "global_step": 354494, "epoch": 2929} {"train_loss": -42.663387298583984, "global_step": 354495, "epoch": 2929} {"train_loss": -41.66412353515625, "global_step": 354496, "epoch": 2929} {"train_loss": -42.72357177734375, "global_step": 354497, "epoch": 2929} {"train_loss": -43.20176315307617, "global_step": 354498, "epoch": 2929} {"train_loss": -37.6785774230957, "global_step": 354499, "epoch": 2929} {"train_loss": -43.418853759765625, "global_step": 354500, "epoch": 2929} {"train_loss": -41.49538803100586, "global_step": 354501, "epoch": 2929} {"train_loss": -43.32682418823242, "global_step": 354502, "epoch": 2929} {"train_loss": -42.0960807800293, "global_step": 354503, "epoch": 2929} {"train_loss": -43.372337341308594, "global_step": 354504, "epoch": 2929} {"train_loss": -43.47064971923828, "global_step": 354505, "epoch": 2929} {"train_loss": -40.997283935546875, "global_step": 354506, "epoch": 2929} {"train_loss": -44.038883209228516, "global_step": 354507, "epoch": 2929} {"train_loss": -43.395965576171875, "global_step": 354508, "epoch": 2929} {"train_loss": -44.1455192565918, "global_step": 354509, "epoch": 2929} {"train_loss": -44.30671310424805, "global_step": 354510, "epoch": 2929} {"train_loss": -41.08918762207031, "global_step": 354511, "epoch": 2929} {"train_loss": -43.433692932128906, "global_step": 354512, "epoch": 2929} {"train_loss": -43.03141403198242, "global_step": 354513, "epoch": 2929} {"train_loss": -44.741004943847656, "global_step": 354514, "epoch": 2929} {"train_loss": -44.2066764831543, "global_step": 354515, "epoch": 2929} {"train_loss": -43.46023941040039, "global_step": 354516, "epoch": 2929} {"train_loss": -44.965049743652344, "global_step": 354517, "epoch": 2929} {"train_loss": -44.45113754272461, "global_step": 354518, "epoch": 2929} {"train_loss": -43.50239181518555, "global_step": 354519, "epoch": 2929} {"train_loss": -41.99338912963867, "global_step": 354520, "epoch": 2929} {"train_loss": -44.23432159423828, "global_step": 354521, "epoch": 2929} {"train_loss": -43.79079818725586, "global_step": 354522, "epoch": 2929} {"train_loss": -44.037906646728516, "global_step": 354523, "epoch": 2929} {"train_loss": -44.06364059448242, "global_step": 354524, "epoch": 2929} {"train_loss": -44.47199630737305, "global_step": 354525, "epoch": 2929} {"train_loss": -44.48807144165039, "global_step": 354526, "epoch": 2929} {"train_loss": -43.892452239990234, "global_step": 354527, "epoch": 2929} {"train_loss": -44.39967727661133, "global_step": 354528, "epoch": 2929} {"train_loss": -43.72329538518732, "global_step": 354529, "epoch": 2929, "val_loss": 2571868.25} {"train_loss": -43.544185638427734, "global_step": 354530, "epoch": 2930} {"train_loss": -44.76351547241211, "global_step": 354531, "epoch": 2930} {"train_loss": -43.623348236083984, "global_step": 354532, "epoch": 2930} {"train_loss": -45.217323303222656, "global_step": 354533, "epoch": 2930} {"train_loss": -44.307186126708984, "global_step": 354534, "epoch": 2930} {"train_loss": -45.27479934692383, "global_step": 354535, "epoch": 2930} {"train_loss": -45.16691207885742, "global_step": 354536, "epoch": 2930} {"train_loss": -44.84577560424805, "global_step": 354537, "epoch": 2930} {"train_loss": -45.044151306152344, "global_step": 354538, "epoch": 2930} {"train_loss": -44.84785079956055, "global_step": 354539, "epoch": 2930} {"train_loss": -44.736873626708984, "global_step": 354540, "epoch": 2930} {"train_loss": -45.08821487426758, "global_step": 354541, "epoch": 2930} {"train_loss": -45.0732307434082, "global_step": 354542, "epoch": 2930} {"train_loss": -44.99361801147461, "global_step": 354543, "epoch": 2930} {"train_loss": -45.18059158325195, "global_step": 354544, "epoch": 2930} {"train_loss": -45.12821578979492, "global_step": 354545, "epoch": 2930} {"train_loss": -45.56723403930664, "global_step": 354546, "epoch": 2930} {"train_loss": -45.4438591003418, "global_step": 354547, "epoch": 2930} {"train_loss": -45.16836166381836, "global_step": 354548, "epoch": 2930} {"train_loss": -45.56663131713867, "global_step": 354549, "epoch": 2930} {"train_loss": -44.7166748046875, "global_step": 354550, "epoch": 2930} {"train_loss": -45.057491302490234, "global_step": 354551, "epoch": 2930} {"train_loss": -45.163818359375, "global_step": 354552, "epoch": 2930} {"train_loss": -45.7242317199707, "global_step": 354553, "epoch": 2930} {"train_loss": -45.057891845703125, "global_step": 354554, "epoch": 2930} {"train_loss": -45.618743896484375, "global_step": 354555, "epoch": 2930} {"train_loss": -45.14990997314453, "global_step": 354556, "epoch": 2930} {"train_loss": -44.39632797241211, "global_step": 354557, "epoch": 2930} {"train_loss": -44.83083724975586, "global_step": 354558, "epoch": 2930} {"train_loss": -44.323936462402344, "global_step": 354559, "epoch": 2930} {"train_loss": -45.740089416503906, "global_step": 354560, "epoch": 2930} {"train_loss": -44.6555290222168, "global_step": 354561, "epoch": 2930} {"train_loss": -44.39181900024414, "global_step": 354562, "epoch": 2930} {"train_loss": -43.24387741088867, "global_step": 354563, "epoch": 2930} {"train_loss": -45.7254638671875, "global_step": 354564, "epoch": 2930} {"train_loss": -45.2351188659668, "global_step": 354565, "epoch": 2930} {"train_loss": -45.02553939819336, "global_step": 354566, "epoch": 2930} {"train_loss": -44.21883773803711, "global_step": 354567, "epoch": 2930} {"train_loss": -44.45111083984375, "global_step": 354568, "epoch": 2930} {"train_loss": -44.78803634643555, "global_step": 354569, "epoch": 2930} {"train_loss": -44.79755401611328, "global_step": 354570, "epoch": 2930} {"train_loss": -41.77349090576172, "global_step": 354571, "epoch": 2930} {"train_loss": -42.237892150878906, "global_step": 354572, "epoch": 2930} {"train_loss": -43.91707229614258, "global_step": 354573, "epoch": 2930} {"train_loss": -43.61839294433594, "global_step": 354574, "epoch": 2930} {"train_loss": -39.557247161865234, "global_step": 354575, "epoch": 2930} {"train_loss": -43.283416748046875, "global_step": 354576, "epoch": 2930} {"train_loss": -35.86180114746094, "global_step": 354577, "epoch": 2930} {"train_loss": -32.049652099609375, "global_step": 354578, "epoch": 2930} {"train_loss": -34.74635314941406, "global_step": 354579, "epoch": 2930} {"train_loss": -35.576141357421875, "global_step": 354580, "epoch": 2930} {"train_loss": -33.69031524658203, "global_step": 354581, "epoch": 2930} {"train_loss": -38.820465087890625, "global_step": 354582, "epoch": 2930} {"train_loss": -33.8656005859375, "global_step": 354583, "epoch": 2930} {"train_loss": -36.49662780761719, "global_step": 354584, "epoch": 2930} {"train_loss": -33.94868087768555, "global_step": 354585, "epoch": 2930} {"train_loss": -35.40216064453125, "global_step": 354586, "epoch": 2930} {"train_loss": -32.56010055541992, "global_step": 354587, "epoch": 2930} {"train_loss": -35.9478874206543, "global_step": 354588, "epoch": 2930} {"train_loss": -34.4749870300293, "global_step": 354589, "epoch": 2930} {"train_loss": -36.00706100463867, "global_step": 354590, "epoch": 2930} {"train_loss": -36.64256286621094, "global_step": 354591, "epoch": 2930} {"train_loss": -35.92702865600586, "global_step": 354592, "epoch": 2930} {"train_loss": -38.286712646484375, "global_step": 354593, "epoch": 2930} {"train_loss": -37.23115158081055, "global_step": 354594, "epoch": 2930} {"train_loss": -36.371803283691406, "global_step": 354595, "epoch": 2930} {"train_loss": -38.33932113647461, "global_step": 354596, "epoch": 2930} {"train_loss": -37.895057678222656, "global_step": 354597, "epoch": 2930} {"train_loss": -37.347625732421875, "global_step": 354598, "epoch": 2930} {"train_loss": -37.59719467163086, "global_step": 354599, "epoch": 2930} {"train_loss": -37.988590240478516, "global_step": 354600, "epoch": 2930} {"train_loss": -38.970340728759766, "global_step": 354601, "epoch": 2930} {"train_loss": -38.08829116821289, "global_step": 354602, "epoch": 2930} {"train_loss": -38.22618103027344, "global_step": 354603, "epoch": 2930} {"train_loss": -38.18242263793945, "global_step": 354604, "epoch": 2930} {"train_loss": -39.1193733215332, "global_step": 354605, "epoch": 2930} {"train_loss": -39.17941665649414, "global_step": 354606, "epoch": 2930} {"train_loss": -38.89248275756836, "global_step": 354607, "epoch": 2930} {"train_loss": -39.94855499267578, "global_step": 354608, "epoch": 2930} {"train_loss": -38.31914138793945, "global_step": 354609, "epoch": 2930} {"train_loss": -39.69395065307617, "global_step": 354610, "epoch": 2930} {"train_loss": -39.982017517089844, "global_step": 354611, "epoch": 2930} {"train_loss": -40.299293518066406, "global_step": 354612, "epoch": 2930} {"train_loss": -38.63069152832031, "global_step": 354613, "epoch": 2930} {"train_loss": -40.23423385620117, "global_step": 354614, "epoch": 2930} {"train_loss": -40.49564743041992, "global_step": 354615, "epoch": 2930} {"train_loss": -40.64113235473633, "global_step": 354616, "epoch": 2930} {"train_loss": -39.50160598754883, "global_step": 354617, "epoch": 2930} {"train_loss": -40.76295852661133, "global_step": 354618, "epoch": 2930} {"train_loss": -40.66140365600586, "global_step": 354619, "epoch": 2930} {"train_loss": -40.694271087646484, "global_step": 354620, "epoch": 2930} {"train_loss": -40.9549446105957, "global_step": 354621, "epoch": 2930} {"train_loss": -41.149818420410156, "global_step": 354622, "epoch": 2930} {"train_loss": -41.40373611450195, "global_step": 354623, "epoch": 2930} {"train_loss": -41.06836700439453, "global_step": 354624, "epoch": 2930} {"train_loss": -41.34519577026367, "global_step": 354625, "epoch": 2930} {"train_loss": -41.742794036865234, "global_step": 354626, "epoch": 2930} {"train_loss": -40.24885177612305, "global_step": 354627, "epoch": 2930} {"train_loss": -41.51346969604492, "global_step": 354628, "epoch": 2930} {"train_loss": -41.63471603393555, "global_step": 354629, "epoch": 2930} {"train_loss": -41.57023239135742, "global_step": 354630, "epoch": 2930} {"train_loss": -42.60685348510742, "global_step": 354631, "epoch": 2930} {"train_loss": -42.2906379699707, "global_step": 354632, "epoch": 2930} {"train_loss": -42.891845703125, "global_step": 354633, "epoch": 2930} {"train_loss": -42.6563720703125, "global_step": 354634, "epoch": 2930} {"train_loss": -42.51544189453125, "global_step": 354635, "epoch": 2930} {"train_loss": -42.72220993041992, "global_step": 354636, "epoch": 2930} {"train_loss": -42.498992919921875, "global_step": 354637, "epoch": 2930} {"train_loss": -42.68423843383789, "global_step": 354638, "epoch": 2930} {"train_loss": -43.44807815551758, "global_step": 354639, "epoch": 2930} {"train_loss": -43.474117279052734, "global_step": 354640, "epoch": 2930} {"train_loss": -43.6345100402832, "global_step": 354641, "epoch": 2930} {"train_loss": -44.1263313293457, "global_step": 354642, "epoch": 2930} {"train_loss": -44.37248229980469, "global_step": 354643, "epoch": 2930} {"train_loss": -43.905616760253906, "global_step": 354644, "epoch": 2930} {"train_loss": -44.156734466552734, "global_step": 354645, "epoch": 2930} {"train_loss": -43.286800384521484, "global_step": 354646, "epoch": 2930} {"train_loss": -44.240596771240234, "global_step": 354647, "epoch": 2930} {"train_loss": -44.812007904052734, "global_step": 354648, "epoch": 2930} {"train_loss": -44.102081298828125, "global_step": 354649, "epoch": 2930} {"train_loss": -41.56363047450042, "global_step": 354650, "epoch": 2930, "val_loss": 2523857.75} {"train_loss": -45.32197570800781, "global_step": 354651, "epoch": 2931} {"train_loss": -44.377437591552734, "global_step": 354652, "epoch": 2931} {"train_loss": -43.19218063354492, "global_step": 354653, "epoch": 2931} {"train_loss": -43.49074935913086, "global_step": 354654, "epoch": 2931} {"train_loss": -44.7680778503418, "global_step": 354655, "epoch": 2931} {"train_loss": -44.32316970825195, "global_step": 354656, "epoch": 2931} {"train_loss": -44.211612701416016, "global_step": 354657, "epoch": 2931} {"train_loss": -44.46061325073242, "global_step": 354658, "epoch": 2931} {"train_loss": -44.089263916015625, "global_step": 354659, "epoch": 2931} {"train_loss": -44.815555572509766, "global_step": 354660, "epoch": 2931} {"train_loss": -44.47057342529297, "global_step": 354661, "epoch": 2931} {"train_loss": -44.925148010253906, "global_step": 354662, "epoch": 2931} {"train_loss": -44.79600143432617, "global_step": 354663, "epoch": 2931} {"train_loss": -44.7543830871582, "global_step": 354664, "epoch": 2931} {"train_loss": -44.519161224365234, "global_step": 354665, "epoch": 2931} {"train_loss": -45.01406478881836, "global_step": 354666, "epoch": 2931} {"train_loss": -44.98774337768555, "global_step": 354667, "epoch": 2931} {"train_loss": -44.61802291870117, "global_step": 354668, "epoch": 2931} {"train_loss": -45.07802963256836, "global_step": 354669, "epoch": 2931} {"train_loss": -44.408050537109375, "global_step": 354670, "epoch": 2931} {"train_loss": -44.91262435913086, "global_step": 354671, "epoch": 2931} {"train_loss": -44.77871322631836, "global_step": 354672, "epoch": 2931} {"train_loss": -44.8057861328125, "global_step": 354673, "epoch": 2931} {"train_loss": -44.69763946533203, "global_step": 354674, "epoch": 2931} {"train_loss": -44.49411392211914, "global_step": 354675, "epoch": 2931} {"train_loss": -43.8540153503418, "global_step": 354676, "epoch": 2931} {"train_loss": -44.145572662353516, "global_step": 354677, "epoch": 2931} {"train_loss": -45.55855178833008, "global_step": 354678, "epoch": 2931} {"train_loss": -43.28324508666992, "global_step": 354679, "epoch": 2931} {"train_loss": -44.4870719909668, "global_step": 354680, "epoch": 2931} {"train_loss": -45.13282012939453, "global_step": 354681, "epoch": 2931} {"train_loss": -44.20005798339844, "global_step": 354682, "epoch": 2931} {"train_loss": -44.50421142578125, "global_step": 354683, "epoch": 2931} {"train_loss": -45.06853103637695, "global_step": 354684, "epoch": 2931} {"train_loss": -44.52729415893555, "global_step": 354685, "epoch": 2931} {"train_loss": -43.61997604370117, "global_step": 354686, "epoch": 2931} {"train_loss": -43.93922424316406, "global_step": 354687, "epoch": 2931} {"train_loss": -43.99738693237305, "global_step": 354688, "epoch": 2931} {"train_loss": -45.35296630859375, "global_step": 354689, "epoch": 2931} {"train_loss": -45.48234176635742, "global_step": 354690, "epoch": 2931} {"train_loss": -44.037513732910156, "global_step": 354691, "epoch": 2931} {"train_loss": -45.26252365112305, "global_step": 354692, "epoch": 2931} {"train_loss": -45.09564208984375, "global_step": 354693, "epoch": 2931} {"train_loss": -43.5828742980957, "global_step": 354694, "epoch": 2931} {"train_loss": -45.378150939941406, "global_step": 354695, "epoch": 2931} {"train_loss": -45.3381462097168, "global_step": 354696, "epoch": 2931} {"train_loss": -45.39707565307617, "global_step": 354697, "epoch": 2931} {"train_loss": -43.96343994140625, "global_step": 354698, "epoch": 2931} {"train_loss": -44.63606643676758, "global_step": 354699, "epoch": 2931} {"train_loss": -44.533599853515625, "global_step": 354700, "epoch": 2931} {"train_loss": -44.2128791809082, "global_step": 354701, "epoch": 2931} {"train_loss": -45.01730728149414, "global_step": 354702, "epoch": 2931} {"train_loss": -45.35246658325195, "global_step": 354703, "epoch": 2931} {"train_loss": -44.5776481628418, "global_step": 354704, "epoch": 2931} {"train_loss": -44.087276458740234, "global_step": 354705, "epoch": 2931} {"train_loss": -43.97957992553711, "global_step": 354706, "epoch": 2931} {"train_loss": -44.48694610595703, "global_step": 354707, "epoch": 2931} {"train_loss": -45.38517379760742, "global_step": 354708, "epoch": 2931} {"train_loss": -44.92675018310547, "global_step": 354709, "epoch": 2931} {"train_loss": -44.554683685302734, "global_step": 354710, "epoch": 2931} {"train_loss": -45.02381134033203, "global_step": 354711, "epoch": 2931} {"train_loss": -45.4832878112793, "global_step": 354712, "epoch": 2931} {"train_loss": -45.19550704956055, "global_step": 354713, "epoch": 2931} {"train_loss": -45.09803009033203, "global_step": 354714, "epoch": 2931} {"train_loss": -45.28550720214844, "global_step": 354715, "epoch": 2931} {"train_loss": -45.82125473022461, "global_step": 354716, "epoch": 2931} {"train_loss": -44.54368591308594, "global_step": 354717, "epoch": 2931} {"train_loss": -45.04414367675781, "global_step": 354718, "epoch": 2931} {"train_loss": -44.76121139526367, "global_step": 354719, "epoch": 2931} {"train_loss": -45.345001220703125, "global_step": 354720, "epoch": 2931} {"train_loss": -45.57353591918945, "global_step": 354721, "epoch": 2931} {"train_loss": -45.32709884643555, "global_step": 354722, "epoch": 2931} {"train_loss": -45.759498596191406, "global_step": 354723, "epoch": 2931} {"train_loss": -44.987220764160156, "global_step": 354724, "epoch": 2931} {"train_loss": -44.8692626953125, "global_step": 354725, "epoch": 2931} {"train_loss": -45.15916061401367, "global_step": 354726, "epoch": 2931} {"train_loss": -44.270233154296875, "global_step": 354727, "epoch": 2931} {"train_loss": -43.59536361694336, "global_step": 354728, "epoch": 2931} {"train_loss": -44.513404846191406, "global_step": 354729, "epoch": 2931} {"train_loss": -45.36335754394531, "global_step": 354730, "epoch": 2931} {"train_loss": -44.264217376708984, "global_step": 354731, "epoch": 2931} {"train_loss": -42.49078369140625, "global_step": 354732, "epoch": 2931} {"train_loss": -43.6275749206543, "global_step": 354733, "epoch": 2931} {"train_loss": -44.77031326293945, "global_step": 354734, "epoch": 2931} {"train_loss": -43.93805694580078, "global_step": 354735, "epoch": 2931} {"train_loss": -43.089595794677734, "global_step": 354736, "epoch": 2931} {"train_loss": -44.23922348022461, "global_step": 354737, "epoch": 2931} {"train_loss": -43.617713928222656, "global_step": 354738, "epoch": 2931} {"train_loss": -43.029884338378906, "global_step": 354739, "epoch": 2931} {"train_loss": -44.66769027709961, "global_step": 354740, "epoch": 2931} {"train_loss": -44.80295181274414, "global_step": 354741, "epoch": 2931} {"train_loss": -44.86659240722656, "global_step": 354742, "epoch": 2931} {"train_loss": -44.301212310791016, "global_step": 354743, "epoch": 2931} {"train_loss": -43.6618537902832, "global_step": 354744, "epoch": 2931} {"train_loss": -43.391658782958984, "global_step": 354745, "epoch": 2931} {"train_loss": -44.8466911315918, "global_step": 354746, "epoch": 2931} {"train_loss": -45.061153411865234, "global_step": 354747, "epoch": 2931} {"train_loss": -44.58356475830078, "global_step": 354748, "epoch": 2931} {"train_loss": -44.55656051635742, "global_step": 354749, "epoch": 2931} {"train_loss": -44.461402893066406, "global_step": 354750, "epoch": 2931} {"train_loss": -45.40087890625, "global_step": 354751, "epoch": 2931} {"train_loss": -44.76374816894531, "global_step": 354752, "epoch": 2931} {"train_loss": -43.89116287231445, "global_step": 354753, "epoch": 2931} {"train_loss": -45.247493743896484, "global_step": 354754, "epoch": 2931} {"train_loss": -44.05162048339844, "global_step": 354755, "epoch": 2931} {"train_loss": -43.6119384765625, "global_step": 354756, "epoch": 2931} {"train_loss": -43.73081970214844, "global_step": 354757, "epoch": 2931} {"train_loss": -43.768131256103516, "global_step": 354758, "epoch": 2931} {"train_loss": -42.926170349121094, "global_step": 354759, "epoch": 2931} {"train_loss": -44.27014923095703, "global_step": 354760, "epoch": 2931} {"train_loss": -44.20207595825195, "global_step": 354761, "epoch": 2931} {"train_loss": -42.94883346557617, "global_step": 354762, "epoch": 2931} {"train_loss": -45.23057174682617, "global_step": 354763, "epoch": 2931} {"train_loss": -42.999019622802734, "global_step": 354764, "epoch": 2931} {"train_loss": -44.07184982299805, "global_step": 354765, "epoch": 2931} {"train_loss": -44.614620208740234, "global_step": 354766, "epoch": 2931} {"train_loss": -42.31549835205078, "global_step": 354767, "epoch": 2931} {"train_loss": -45.25368881225586, "global_step": 354768, "epoch": 2931} {"train_loss": -44.177669525146484, "global_step": 354769, "epoch": 2931} {"train_loss": -43.95974349975586, "global_step": 354770, "epoch": 2931} {"train_loss": -44.50206655707241, "global_step": 354771, "epoch": 2931, "val_loss": 2485589.25} {"train_loss": -44.48747634887695, "global_step": 354772, "epoch": 2932} {"train_loss": -44.16413879394531, "global_step": 354773, "epoch": 2932} {"train_loss": -43.27027130126953, "global_step": 354774, "epoch": 2932} {"train_loss": -44.97050476074219, "global_step": 354775, "epoch": 2932} {"train_loss": -44.3677978515625, "global_step": 354776, "epoch": 2932} {"train_loss": -42.78874969482422, "global_step": 354777, "epoch": 2932} {"train_loss": -45.07743453979492, "global_step": 354778, "epoch": 2932} {"train_loss": -43.866493225097656, "global_step": 354779, "epoch": 2932} {"train_loss": -43.54929733276367, "global_step": 354780, "epoch": 2932} {"train_loss": -44.155975341796875, "global_step": 354781, "epoch": 2932} {"train_loss": -44.37675857543945, "global_step": 354782, "epoch": 2932} {"train_loss": -44.933258056640625, "global_step": 354783, "epoch": 2932} {"train_loss": -42.714820861816406, "global_step": 354784, "epoch": 2932} {"train_loss": -44.5719108581543, "global_step": 354785, "epoch": 2932} {"train_loss": -45.192806243896484, "global_step": 354786, "epoch": 2932} {"train_loss": -44.607784271240234, "global_step": 354787, "epoch": 2932} {"train_loss": -44.50643539428711, "global_step": 354788, "epoch": 2932} {"train_loss": -44.83286666870117, "global_step": 354789, "epoch": 2932} {"train_loss": -43.99869918823242, "global_step": 354790, "epoch": 2932} {"train_loss": -44.405059814453125, "global_step": 354791, "epoch": 2932} {"train_loss": -44.30983352661133, "global_step": 354792, "epoch": 2932} {"train_loss": -43.17646408081055, "global_step": 354793, "epoch": 2932} {"train_loss": -45.066368103027344, "global_step": 354794, "epoch": 2932} {"train_loss": -43.82548904418945, "global_step": 354795, "epoch": 2932} {"train_loss": -44.38971710205078, "global_step": 354796, "epoch": 2932} {"train_loss": -44.84852981567383, "global_step": 354797, "epoch": 2932} {"train_loss": -43.92667770385742, "global_step": 354798, "epoch": 2932} {"train_loss": -44.346031188964844, "global_step": 354799, "epoch": 2932} {"train_loss": -43.8799934387207, "global_step": 354800, "epoch": 2932} {"train_loss": -45.40873336791992, "global_step": 354801, "epoch": 2932} {"train_loss": -42.153865814208984, "global_step": 354802, "epoch": 2932} {"train_loss": -43.25285339355469, "global_step": 354803, "epoch": 2932} {"train_loss": -44.2241096496582, "global_step": 354804, "epoch": 2932} {"train_loss": -42.90132522583008, "global_step": 354805, "epoch": 2932} {"train_loss": -44.70361328125, "global_step": 354806, "epoch": 2932} {"train_loss": -41.53314971923828, "global_step": 354807, "epoch": 2932} {"train_loss": -44.15690994262695, "global_step": 354808, "epoch": 2932} {"train_loss": -41.07510757446289, "global_step": 354809, "epoch": 2932} {"train_loss": -43.425655364990234, "global_step": 354810, "epoch": 2932} {"train_loss": -40.086055755615234, "global_step": 354811, "epoch": 2932} {"train_loss": -42.584075927734375, "global_step": 354812, "epoch": 2932} {"train_loss": -41.92478942871094, "global_step": 354813, "epoch": 2932} {"train_loss": -42.2921257019043, "global_step": 354814, "epoch": 2932} {"train_loss": -42.265541076660156, "global_step": 354815, "epoch": 2932} {"train_loss": -41.787254333496094, "global_step": 354816, "epoch": 2932} {"train_loss": -43.73103713989258, "global_step": 354817, "epoch": 2932} {"train_loss": -42.46455383300781, "global_step": 354818, "epoch": 2932} {"train_loss": -44.161903381347656, "global_step": 354819, "epoch": 2932} {"train_loss": -43.74922561645508, "global_step": 354820, "epoch": 2932} {"train_loss": -43.85443878173828, "global_step": 354821, "epoch": 2932} {"train_loss": -43.349971771240234, "global_step": 354822, "epoch": 2932} {"train_loss": -44.03254318237305, "global_step": 354823, "epoch": 2932} {"train_loss": -43.318946838378906, "global_step": 354824, "epoch": 2932} {"train_loss": -43.84440231323242, "global_step": 354825, "epoch": 2932} {"train_loss": -43.872779846191406, "global_step": 354826, "epoch": 2932} {"train_loss": -44.94824981689453, "global_step": 354827, "epoch": 2932} {"train_loss": -44.26841354370117, "global_step": 354828, "epoch": 2932} {"train_loss": -44.69519805908203, "global_step": 354829, "epoch": 2932} {"train_loss": -44.69245910644531, "global_step": 354830, "epoch": 2932} {"train_loss": -44.80996322631836, "global_step": 354831, "epoch": 2932} {"train_loss": -44.75532913208008, "global_step": 354832, "epoch": 2932} {"train_loss": -45.31000900268555, "global_step": 354833, "epoch": 2932} {"train_loss": -44.86884689331055, "global_step": 354834, "epoch": 2932} {"train_loss": -44.29979705810547, "global_step": 354835, "epoch": 2932} {"train_loss": -45.05984878540039, "global_step": 354836, "epoch": 2932} {"train_loss": -45.58528518676758, "global_step": 354837, "epoch": 2932} {"train_loss": -45.07296371459961, "global_step": 354838, "epoch": 2932} {"train_loss": -44.995845794677734, "global_step": 354839, "epoch": 2932} {"train_loss": -45.28373336791992, "global_step": 354840, "epoch": 2932} {"train_loss": -44.57074737548828, "global_step": 354841, "epoch": 2932} {"train_loss": -43.5821418762207, "global_step": 354842, "epoch": 2932} {"train_loss": -44.962013244628906, "global_step": 354843, "epoch": 2932} {"train_loss": -44.596866607666016, "global_step": 354844, "epoch": 2932} {"train_loss": -43.79220962524414, "global_step": 354845, "epoch": 2932} {"train_loss": -42.751312255859375, "global_step": 354846, "epoch": 2932} {"train_loss": -44.3521614074707, "global_step": 354847, "epoch": 2932} {"train_loss": -40.33551025390625, "global_step": 354848, "epoch": 2932} {"train_loss": -44.57402420043945, "global_step": 354849, "epoch": 2932} {"train_loss": -41.91886901855469, "global_step": 354850, "epoch": 2932} {"train_loss": -41.49079513549805, "global_step": 354851, "epoch": 2932} {"train_loss": -43.85903549194336, "global_step": 354852, "epoch": 2932} {"train_loss": -44.081478118896484, "global_step": 354853, "epoch": 2932} {"train_loss": -42.10805892944336, "global_step": 354854, "epoch": 2932} {"train_loss": -41.799137115478516, "global_step": 354855, "epoch": 2932} {"train_loss": -44.635860443115234, "global_step": 354856, "epoch": 2932} {"train_loss": -44.97115707397461, "global_step": 354857, "epoch": 2932} {"train_loss": -43.47927474975586, "global_step": 354858, "epoch": 2932} {"train_loss": -44.28142166137695, "global_step": 354859, "epoch": 2932} {"train_loss": -42.67608642578125, "global_step": 354860, "epoch": 2932} {"train_loss": -41.227821350097656, "global_step": 354861, "epoch": 2932} {"train_loss": -42.35720443725586, "global_step": 354862, "epoch": 2932} {"train_loss": -43.38326644897461, "global_step": 354863, "epoch": 2932} {"train_loss": -43.730072021484375, "global_step": 354864, "epoch": 2932} {"train_loss": -44.63041305541992, "global_step": 354865, "epoch": 2932} {"train_loss": -43.45526885986328, "global_step": 354866, "epoch": 2932} {"train_loss": -43.96310043334961, "global_step": 354867, "epoch": 2932} {"train_loss": -43.3689079284668, "global_step": 354868, "epoch": 2932} {"train_loss": -44.18711471557617, "global_step": 354869, "epoch": 2932} {"train_loss": -43.7222785949707, "global_step": 354870, "epoch": 2932} {"train_loss": -43.44715118408203, "global_step": 354871, "epoch": 2932} {"train_loss": -44.40874099731445, "global_step": 354872, "epoch": 2932} {"train_loss": -44.80817413330078, "global_step": 354873, "epoch": 2932} {"train_loss": -44.67088317871094, "global_step": 354874, "epoch": 2932} {"train_loss": -44.63590621948242, "global_step": 354875, "epoch": 2932} {"train_loss": -44.014747619628906, "global_step": 354876, "epoch": 2932} {"train_loss": -44.640621185302734, "global_step": 354877, "epoch": 2932} {"train_loss": -44.83253479003906, "global_step": 354878, "epoch": 2932} {"train_loss": -43.36824417114258, "global_step": 354879, "epoch": 2932} {"train_loss": -42.59552001953125, "global_step": 354880, "epoch": 2932} {"train_loss": -43.15813064575195, "global_step": 354881, "epoch": 2932} {"train_loss": -44.369415283203125, "global_step": 354882, "epoch": 2932} {"train_loss": -43.8273811340332, "global_step": 354883, "epoch": 2932} {"train_loss": -44.550987243652344, "global_step": 354884, "epoch": 2932} {"train_loss": -44.3192253112793, "global_step": 354885, "epoch": 2932} {"train_loss": -44.127838134765625, "global_step": 354886, "epoch": 2932} {"train_loss": -44.4183349609375, "global_step": 354887, "epoch": 2932} {"train_loss": -45.180519104003906, "global_step": 354888, "epoch": 2932} {"train_loss": -44.139137268066406, "global_step": 354889, "epoch": 2932} {"train_loss": -43.44321823120117, "global_step": 354890, "epoch": 2932} {"train_loss": -44.9554443359375, "global_step": 354891, "epoch": 2932} {"train_loss": -43.85845666680454, "global_step": 354892, "epoch": 2932, "val_loss": 2527477.75} {"train_loss": -44.3790168762207, "global_step": 354893, "epoch": 2933} {"train_loss": -44.74090576171875, "global_step": 354894, "epoch": 2933} {"train_loss": -44.16096115112305, "global_step": 354895, "epoch": 2933} {"train_loss": -43.59317398071289, "global_step": 354896, "epoch": 2933} {"train_loss": -44.664241790771484, "global_step": 354897, "epoch": 2933} {"train_loss": -44.67525100708008, "global_step": 354898, "epoch": 2933} {"train_loss": -43.95121765136719, "global_step": 354899, "epoch": 2933} {"train_loss": -43.03722381591797, "global_step": 354900, "epoch": 2933} {"train_loss": -43.799198150634766, "global_step": 354901, "epoch": 2933} {"train_loss": -44.254981994628906, "global_step": 354902, "epoch": 2933} {"train_loss": -45.11334991455078, "global_step": 354903, "epoch": 2933} {"train_loss": -45.615352630615234, "global_step": 354904, "epoch": 2933} {"train_loss": -44.74701690673828, "global_step": 354905, "epoch": 2933} {"train_loss": -44.50554656982422, "global_step": 354906, "epoch": 2933} {"train_loss": -45.60562515258789, "global_step": 354907, "epoch": 2933} {"train_loss": -44.067413330078125, "global_step": 354908, "epoch": 2933} {"train_loss": -45.321956634521484, "global_step": 354909, "epoch": 2933} {"train_loss": -44.875953674316406, "global_step": 354910, "epoch": 2933} {"train_loss": -44.9604606628418, "global_step": 354911, "epoch": 2933} {"train_loss": -45.19830322265625, "global_step": 354912, "epoch": 2933} {"train_loss": -42.1481819152832, "global_step": 354913, "epoch": 2933} {"train_loss": -44.399085998535156, "global_step": 354914, "epoch": 2933} {"train_loss": -44.25858688354492, "global_step": 354915, "epoch": 2933} {"train_loss": -42.439510345458984, "global_step": 354916, "epoch": 2933} {"train_loss": -43.85599899291992, "global_step": 354917, "epoch": 2933} {"train_loss": -44.595802307128906, "global_step": 354918, "epoch": 2933} {"train_loss": -42.986778259277344, "global_step": 354919, "epoch": 2933} {"train_loss": -44.54148483276367, "global_step": 354920, "epoch": 2933} {"train_loss": -44.588008880615234, "global_step": 354921, "epoch": 2933} {"train_loss": -43.58534622192383, "global_step": 354922, "epoch": 2933} {"train_loss": -43.94743728637695, "global_step": 354923, "epoch": 2933} {"train_loss": -43.67678451538086, "global_step": 354924, "epoch": 2933} {"train_loss": -44.495914459228516, "global_step": 354925, "epoch": 2933} {"train_loss": -45.24068832397461, "global_step": 354926, "epoch": 2933} {"train_loss": -44.2486457824707, "global_step": 354927, "epoch": 2933} {"train_loss": -44.307472229003906, "global_step": 354928, "epoch": 2933} {"train_loss": -44.945281982421875, "global_step": 354929, "epoch": 2933} {"train_loss": -44.82656478881836, "global_step": 354930, "epoch": 2933} {"train_loss": -44.9210090637207, "global_step": 354931, "epoch": 2933} {"train_loss": -44.50611114501953, "global_step": 354932, "epoch": 2933} {"train_loss": -41.80123519897461, "global_step": 354933, "epoch": 2933} {"train_loss": -45.01604461669922, "global_step": 354934, "epoch": 2933} {"train_loss": -45.36444091796875, "global_step": 354935, "epoch": 2933} {"train_loss": -45.532466888427734, "global_step": 354936, "epoch": 2933} {"train_loss": -45.28487777709961, "global_step": 354937, "epoch": 2933} {"train_loss": -45.45998001098633, "global_step": 354938, "epoch": 2933} {"train_loss": -45.20005416870117, "global_step": 354939, "epoch": 2933} {"train_loss": -45.31568145751953, "global_step": 354940, "epoch": 2933} {"train_loss": -45.66704177856445, "global_step": 354941, "epoch": 2933} {"train_loss": -45.26405334472656, "global_step": 354942, "epoch": 2933} {"train_loss": -45.08614730834961, "global_step": 354943, "epoch": 2933} {"train_loss": -45.04772186279297, "global_step": 354944, "epoch": 2933} {"train_loss": -45.18388748168945, "global_step": 354945, "epoch": 2933} {"train_loss": -45.22526168823242, "global_step": 354946, "epoch": 2933} {"train_loss": -45.509117126464844, "global_step": 354947, "epoch": 2933} {"train_loss": -45.80502700805664, "global_step": 354948, "epoch": 2933} {"train_loss": -44.97529983520508, "global_step": 354949, "epoch": 2933} {"train_loss": -44.38633728027344, "global_step": 354950, "epoch": 2933} {"train_loss": -44.77003860473633, "global_step": 354951, "epoch": 2933} {"train_loss": -44.155887603759766, "global_step": 354952, "epoch": 2933} {"train_loss": -39.88899612426758, "global_step": 354953, "epoch": 2933} {"train_loss": -44.55479049682617, "global_step": 354954, "epoch": 2933} {"train_loss": -40.97873306274414, "global_step": 354955, "epoch": 2933} {"train_loss": -44.300926208496094, "global_step": 354956, "epoch": 2933} {"train_loss": -43.97132873535156, "global_step": 354957, "epoch": 2933} {"train_loss": -42.9663200378418, "global_step": 354958, "epoch": 2933} {"train_loss": -44.63593673706055, "global_step": 354959, "epoch": 2933} {"train_loss": -44.15471267700195, "global_step": 354960, "epoch": 2933} {"train_loss": -44.260494232177734, "global_step": 354961, "epoch": 2933} {"train_loss": -44.61173629760742, "global_step": 354962, "epoch": 2933} {"train_loss": -44.86456298828125, "global_step": 354963, "epoch": 2933} {"train_loss": -42.9100341796875, "global_step": 354964, "epoch": 2933} {"train_loss": -43.61255645751953, "global_step": 354965, "epoch": 2933} {"train_loss": -43.8778190612793, "global_step": 354966, "epoch": 2933} {"train_loss": -42.022804260253906, "global_step": 354967, "epoch": 2933} {"train_loss": -45.02088165283203, "global_step": 354968, "epoch": 2933} {"train_loss": -41.29859161376953, "global_step": 354969, "epoch": 2933} {"train_loss": -43.8246955871582, "global_step": 354970, "epoch": 2933} {"train_loss": -40.160621643066406, "global_step": 354971, "epoch": 2933} {"train_loss": -41.65129852294922, "global_step": 354972, "epoch": 2933} {"train_loss": -41.59918212890625, "global_step": 354973, "epoch": 2933} {"train_loss": -37.17966079711914, "global_step": 354974, "epoch": 2933} {"train_loss": -38.43921661376953, "global_step": 354975, "epoch": 2933} {"train_loss": -43.01014709472656, "global_step": 354976, "epoch": 2933} {"train_loss": -40.11600112915039, "global_step": 354977, "epoch": 2933} {"train_loss": -40.00631332397461, "global_step": 354978, "epoch": 2933} {"train_loss": -41.3271598815918, "global_step": 354979, "epoch": 2933} {"train_loss": -43.357421875, "global_step": 354980, "epoch": 2933} {"train_loss": -41.888465881347656, "global_step": 354981, "epoch": 2933} {"train_loss": -42.87556076049805, "global_step": 354982, "epoch": 2933} {"train_loss": -42.39851760864258, "global_step": 354983, "epoch": 2933} {"train_loss": -43.601348876953125, "global_step": 354984, "epoch": 2933} {"train_loss": -42.52183151245117, "global_step": 354985, "epoch": 2933} {"train_loss": -43.484806060791016, "global_step": 354986, "epoch": 2933} {"train_loss": -43.398494720458984, "global_step": 354987, "epoch": 2933} {"train_loss": -42.65739822387695, "global_step": 354988, "epoch": 2933} {"train_loss": -44.183048248291016, "global_step": 354989, "epoch": 2933} {"train_loss": -42.77587890625, "global_step": 354990, "epoch": 2933} {"train_loss": -43.15693283081055, "global_step": 354991, "epoch": 2933} {"train_loss": -43.135108947753906, "global_step": 354992, "epoch": 2933} {"train_loss": -41.86517333984375, "global_step": 354993, "epoch": 2933} {"train_loss": -43.37314987182617, "global_step": 354994, "epoch": 2933} {"train_loss": -44.65304946899414, "global_step": 354995, "epoch": 2933} {"train_loss": -42.20032501220703, "global_step": 354996, "epoch": 2933} {"train_loss": -44.2650260925293, "global_step": 354997, "epoch": 2933} {"train_loss": -42.49766159057617, "global_step": 354998, "epoch": 2933} {"train_loss": -44.16579818725586, "global_step": 354999, "epoch": 2933} {"train_loss": -43.8240852355957, "global_step": 355000, "epoch": 2933} {"train_loss": -43.60213851928711, "global_step": 355001, "epoch": 2933} {"train_loss": -44.09002685546875, "global_step": 355002, "epoch": 2933} {"train_loss": -42.664405822753906, "global_step": 355003, "epoch": 2933} {"train_loss": -43.337860107421875, "global_step": 355004, "epoch": 2933} {"train_loss": -44.27801513671875, "global_step": 355005, "epoch": 2933} {"train_loss": -44.05944061279297, "global_step": 355006, "epoch": 2933} {"train_loss": -43.50529098510742, "global_step": 355007, "epoch": 2933} {"train_loss": -44.2689208984375, "global_step": 355008, "epoch": 2933} {"train_loss": -44.57660675048828, "global_step": 355009, "epoch": 2933} {"train_loss": -42.74150466918945, "global_step": 355010, "epoch": 2933} {"train_loss": -43.3385124206543, "global_step": 355011, "epoch": 2933} {"train_loss": -43.45134353637695, "global_step": 355012, "epoch": 2933} {"train_loss": -43.741902721814874, "global_step": 355013, "epoch": 2933, "val_loss": 2702701.0} {"train_loss": -42.82206344604492, "global_step": 355014, "epoch": 2934} {"train_loss": -44.09395980834961, "global_step": 355015, "epoch": 2934} {"train_loss": -44.5401496887207, "global_step": 355016, "epoch": 2934} {"train_loss": -44.76925277709961, "global_step": 355017, "epoch": 2934} {"train_loss": -44.57939147949219, "global_step": 355018, "epoch": 2934} {"train_loss": -42.36050033569336, "global_step": 355019, "epoch": 2934} {"train_loss": -44.81877517700195, "global_step": 355020, "epoch": 2934} {"train_loss": -43.463993072509766, "global_step": 355021, "epoch": 2934} {"train_loss": -45.020965576171875, "global_step": 355022, "epoch": 2934} {"train_loss": -44.913917541503906, "global_step": 355023, "epoch": 2934} {"train_loss": -44.82332229614258, "global_step": 355024, "epoch": 2934} {"train_loss": -44.74680709838867, "global_step": 355025, "epoch": 2934} {"train_loss": -43.656646728515625, "global_step": 355026, "epoch": 2934} {"train_loss": -45.030487060546875, "global_step": 355027, "epoch": 2934} {"train_loss": -45.18709945678711, "global_step": 355028, "epoch": 2934} {"train_loss": -43.03165817260742, "global_step": 355029, "epoch": 2934} {"train_loss": -44.745582580566406, "global_step": 355030, "epoch": 2934} {"train_loss": -45.501197814941406, "global_step": 355031, "epoch": 2934} {"train_loss": -44.68862533569336, "global_step": 355032, "epoch": 2934} {"train_loss": -44.673744201660156, "global_step": 355033, "epoch": 2934} {"train_loss": -43.52287673950195, "global_step": 355034, "epoch": 2934} {"train_loss": -45.264583587646484, "global_step": 355035, "epoch": 2934} {"train_loss": -44.92621994018555, "global_step": 355036, "epoch": 2934} {"train_loss": -44.61444854736328, "global_step": 355037, "epoch": 2934} {"train_loss": -44.64985275268555, "global_step": 355038, "epoch": 2934} {"train_loss": -45.4652099609375, "global_step": 355039, "epoch": 2934} {"train_loss": -44.80305099487305, "global_step": 355040, "epoch": 2934} {"train_loss": -43.85641098022461, "global_step": 355041, "epoch": 2934} {"train_loss": -45.0810546875, "global_step": 355042, "epoch": 2934} {"train_loss": -43.93672180175781, "global_step": 355043, "epoch": 2934} {"train_loss": -45.48916244506836, "global_step": 355044, "epoch": 2934} {"train_loss": -44.837974548339844, "global_step": 355045, "epoch": 2934} {"train_loss": -45.10707473754883, "global_step": 355046, "epoch": 2934} {"train_loss": -45.070396423339844, "global_step": 355047, "epoch": 2934} {"train_loss": -44.80522155761719, "global_step": 355048, "epoch": 2934} {"train_loss": -44.95878219604492, "global_step": 355049, "epoch": 2934} {"train_loss": -45.311683654785156, "global_step": 355050, "epoch": 2934} {"train_loss": -44.59894943237305, "global_step": 355051, "epoch": 2934} {"train_loss": -44.36773681640625, "global_step": 355052, "epoch": 2934} {"train_loss": -44.862545013427734, "global_step": 355053, "epoch": 2934} {"train_loss": -45.30403137207031, "global_step": 355054, "epoch": 2934} {"train_loss": -44.8903923034668, "global_step": 355055, "epoch": 2934} {"train_loss": -44.855037689208984, "global_step": 355056, "epoch": 2934} {"train_loss": -43.350608825683594, "global_step": 355057, "epoch": 2934} {"train_loss": -44.01736068725586, "global_step": 355058, "epoch": 2934} {"train_loss": -45.38026428222656, "global_step": 355059, "epoch": 2934} {"train_loss": -43.82440185546875, "global_step": 355060, "epoch": 2934} {"train_loss": -45.3665771484375, "global_step": 355061, "epoch": 2934} {"train_loss": -44.68844223022461, "global_step": 355062, "epoch": 2934} {"train_loss": -45.55946731567383, "global_step": 355063, "epoch": 2934} {"train_loss": -44.62385177612305, "global_step": 355064, "epoch": 2934} {"train_loss": -44.40766143798828, "global_step": 355065, "epoch": 2934} {"train_loss": -45.040565490722656, "global_step": 355066, "epoch": 2934} {"train_loss": -45.662715911865234, "global_step": 355067, "epoch": 2934} {"train_loss": -44.90044403076172, "global_step": 355068, "epoch": 2934} {"train_loss": -42.64802932739258, "global_step": 355069, "epoch": 2934} {"train_loss": -38.341373443603516, "global_step": 355070, "epoch": 2934} {"train_loss": -41.22633743286133, "global_step": 355071, "epoch": 2934} {"train_loss": -41.62471008300781, "global_step": 355072, "epoch": 2934} {"train_loss": -38.650184631347656, "global_step": 355073, "epoch": 2934} {"train_loss": -40.23681640625, "global_step": 355074, "epoch": 2934} {"train_loss": -40.960296630859375, "global_step": 355075, "epoch": 2934} {"train_loss": -42.403228759765625, "global_step": 355076, "epoch": 2934} {"train_loss": -41.82761001586914, "global_step": 355077, "epoch": 2934} {"train_loss": -42.296119689941406, "global_step": 355078, "epoch": 2934} {"train_loss": -43.244110107421875, "global_step": 355079, "epoch": 2934} {"train_loss": -43.50984573364258, "global_step": 355080, "epoch": 2934} {"train_loss": -41.77608108520508, "global_step": 355081, "epoch": 2934} {"train_loss": -43.58501052856445, "global_step": 355082, "epoch": 2934} {"train_loss": -42.272151947021484, "global_step": 355083, "epoch": 2934} {"train_loss": -41.88496780395508, "global_step": 355084, "epoch": 2934} {"train_loss": -43.28280258178711, "global_step": 355085, "epoch": 2934} {"train_loss": -42.27239990234375, "global_step": 355086, "epoch": 2934} {"train_loss": -40.6427116394043, "global_step": 355087, "epoch": 2934} {"train_loss": -43.07925033569336, "global_step": 355088, "epoch": 2934} {"train_loss": -41.94559097290039, "global_step": 355089, "epoch": 2934} {"train_loss": -41.95512771606445, "global_step": 355090, "epoch": 2934} {"train_loss": -42.16592025756836, "global_step": 355091, "epoch": 2934} {"train_loss": -43.54817581176758, "global_step": 355092, "epoch": 2934} {"train_loss": -40.43974685668945, "global_step": 355093, "epoch": 2934} {"train_loss": -41.765899658203125, "global_step": 355094, "epoch": 2934} {"train_loss": -42.74325180053711, "global_step": 355095, "epoch": 2934} {"train_loss": -43.42646408081055, "global_step": 355096, "epoch": 2934} {"train_loss": -41.98470687866211, "global_step": 355097, "epoch": 2934} {"train_loss": -42.35517501831055, "global_step": 355098, "epoch": 2934} {"train_loss": -44.11361312866211, "global_step": 355099, "epoch": 2934} {"train_loss": -41.84539031982422, "global_step": 355100, "epoch": 2934} {"train_loss": -42.21369552612305, "global_step": 355101, "epoch": 2934} {"train_loss": -42.994102478027344, "global_step": 355102, "epoch": 2934} {"train_loss": -43.6421012878418, "global_step": 355103, "epoch": 2934} {"train_loss": -41.79842758178711, "global_step": 355104, "epoch": 2934} {"train_loss": -43.161773681640625, "global_step": 355105, "epoch": 2934} {"train_loss": -43.10064697265625, "global_step": 355106, "epoch": 2934} {"train_loss": -41.58451461791992, "global_step": 355107, "epoch": 2934} {"train_loss": -42.65156555175781, "global_step": 355108, "epoch": 2934} {"train_loss": -40.579254150390625, "global_step": 355109, "epoch": 2934} {"train_loss": -43.66941452026367, "global_step": 355110, "epoch": 2934} {"train_loss": -38.87362289428711, "global_step": 355111, "epoch": 2934} {"train_loss": -40.44147872924805, "global_step": 355112, "epoch": 2934} {"train_loss": -41.38189697265625, "global_step": 355113, "epoch": 2934} {"train_loss": -40.41630554199219, "global_step": 355114, "epoch": 2934} {"train_loss": -42.43296432495117, "global_step": 355115, "epoch": 2934} {"train_loss": -40.8846435546875, "global_step": 355116, "epoch": 2934} {"train_loss": -43.26999282836914, "global_step": 355117, "epoch": 2934} {"train_loss": -40.75153350830078, "global_step": 355118, "epoch": 2934} {"train_loss": -42.56278610229492, "global_step": 355119, "epoch": 2934} {"train_loss": -41.371673583984375, "global_step": 355120, "epoch": 2934} {"train_loss": -41.58160400390625, "global_step": 355121, "epoch": 2934} {"train_loss": -41.60868453979492, "global_step": 355122, "epoch": 2934} {"train_loss": -43.2724494934082, "global_step": 355123, "epoch": 2934} {"train_loss": -42.16219711303711, "global_step": 355124, "epoch": 2934} {"train_loss": -42.59359359741211, "global_step": 355125, "epoch": 2934} {"train_loss": -43.625247955322266, "global_step": 355126, "epoch": 2934} {"train_loss": -43.252418518066406, "global_step": 355127, "epoch": 2934} {"train_loss": -43.538543701171875, "global_step": 355128, "epoch": 2934} {"train_loss": -43.915279388427734, "global_step": 355129, "epoch": 2934} {"train_loss": -43.86617660522461, "global_step": 355130, "epoch": 2934} {"train_loss": -43.41062545776367, "global_step": 355131, "epoch": 2934} {"train_loss": -43.6269416809082, "global_step": 355132, "epoch": 2934} {"train_loss": -43.320491790771484, "global_step": 355133, "epoch": 2934} {"train_loss": -43.308966360801506, "global_step": 355134, "epoch": 2934, "val_loss": 2656423.5} {"train_loss": -43.907142639160156, "global_step": 355135, "epoch": 2935} {"train_loss": -44.208160400390625, "global_step": 355136, "epoch": 2935} {"train_loss": -44.2150993347168, "global_step": 355137, "epoch": 2935} {"train_loss": -44.53601837158203, "global_step": 355138, "epoch": 2935} {"train_loss": -44.50162887573242, "global_step": 355139, "epoch": 2935} {"train_loss": -44.6048583984375, "global_step": 355140, "epoch": 2935} {"train_loss": -44.690773010253906, "global_step": 355141, "epoch": 2935} {"train_loss": -43.985504150390625, "global_step": 355142, "epoch": 2935} {"train_loss": -44.89890670776367, "global_step": 355143, "epoch": 2935} {"train_loss": -44.61564254760742, "global_step": 355144, "epoch": 2935} {"train_loss": -44.703304290771484, "global_step": 355145, "epoch": 2935} {"train_loss": -44.19525146484375, "global_step": 355146, "epoch": 2935} {"train_loss": -44.467403411865234, "global_step": 355147, "epoch": 2935} {"train_loss": -44.20402145385742, "global_step": 355148, "epoch": 2935} {"train_loss": -44.76338577270508, "global_step": 355149, "epoch": 2935} {"train_loss": -45.258296966552734, "global_step": 355150, "epoch": 2935} {"train_loss": -43.436153411865234, "global_step": 355151, "epoch": 2935} {"train_loss": -45.30175018310547, "global_step": 355152, "epoch": 2935} {"train_loss": -44.38866424560547, "global_step": 355153, "epoch": 2935} {"train_loss": -44.51304626464844, "global_step": 355154, "epoch": 2935} {"train_loss": -44.77082443237305, "global_step": 355155, "epoch": 2935} {"train_loss": -44.848087310791016, "global_step": 355156, "epoch": 2935} {"train_loss": -44.89802169799805, "global_step": 355157, "epoch": 2935} {"train_loss": -45.17134475708008, "global_step": 355158, "epoch": 2935} {"train_loss": -44.74074935913086, "global_step": 355159, "epoch": 2935} {"train_loss": -44.97983169555664, "global_step": 355160, "epoch": 2935} {"train_loss": -45.11897659301758, "global_step": 355161, "epoch": 2935} {"train_loss": -45.211822509765625, "global_step": 355162, "epoch": 2935} {"train_loss": -44.46429443359375, "global_step": 355163, "epoch": 2935} {"train_loss": -44.96228790283203, "global_step": 355164, "epoch": 2935} {"train_loss": -44.6541633605957, "global_step": 355165, "epoch": 2935} {"train_loss": -45.44738006591797, "global_step": 355166, "epoch": 2935} {"train_loss": -45.15412521362305, "global_step": 355167, "epoch": 2935} {"train_loss": -45.112457275390625, "global_step": 355168, "epoch": 2935} {"train_loss": -44.92666244506836, "global_step": 355169, "epoch": 2935} {"train_loss": -45.27261734008789, "global_step": 355170, "epoch": 2935} {"train_loss": -45.26112747192383, "global_step": 355171, "epoch": 2935} {"train_loss": -45.261085510253906, "global_step": 355172, "epoch": 2935} {"train_loss": -45.591590881347656, "global_step": 355173, "epoch": 2935} {"train_loss": -45.67339324951172, "global_step": 355174, "epoch": 2935} {"train_loss": -45.203453063964844, "global_step": 355175, "epoch": 2935} {"train_loss": -44.77967071533203, "global_step": 355176, "epoch": 2935} {"train_loss": -44.761295318603516, "global_step": 355177, "epoch": 2935} {"train_loss": -45.59577178955078, "global_step": 355178, "epoch": 2935} {"train_loss": -45.55720901489258, "global_step": 355179, "epoch": 2935} {"train_loss": -44.88630294799805, "global_step": 355180, "epoch": 2935} {"train_loss": -45.467891693115234, "global_step": 355181, "epoch": 2935} {"train_loss": -45.19186019897461, "global_step": 355182, "epoch": 2935} {"train_loss": -44.564292907714844, "global_step": 355183, "epoch": 2935} {"train_loss": -43.88077926635742, "global_step": 355184, "epoch": 2935} {"train_loss": -43.85732650756836, "global_step": 355185, "epoch": 2935} {"train_loss": -44.06252670288086, "global_step": 355186, "epoch": 2935} {"train_loss": -45.04215621948242, "global_step": 355187, "epoch": 2935} {"train_loss": -45.093502044677734, "global_step": 355188, "epoch": 2935} {"train_loss": -44.173614501953125, "global_step": 355189, "epoch": 2935} {"train_loss": -43.67684555053711, "global_step": 355190, "epoch": 2935} {"train_loss": -45.41331100463867, "global_step": 355191, "epoch": 2935} {"train_loss": -44.22809600830078, "global_step": 355192, "epoch": 2935} {"train_loss": -44.661128997802734, "global_step": 355193, "epoch": 2935} {"train_loss": -44.58226013183594, "global_step": 355194, "epoch": 2935} {"train_loss": -44.71829605102539, "global_step": 355195, "epoch": 2935} {"train_loss": -44.45689010620117, "global_step": 355196, "epoch": 2935} {"train_loss": -43.612300872802734, "global_step": 355197, "epoch": 2935} {"train_loss": -42.73501968383789, "global_step": 355198, "epoch": 2935} {"train_loss": -44.27549743652344, "global_step": 355199, "epoch": 2935} {"train_loss": -44.65378952026367, "global_step": 355200, "epoch": 2935} {"train_loss": -42.93740463256836, "global_step": 355201, "epoch": 2935} {"train_loss": -43.58254623413086, "global_step": 355202, "epoch": 2935} {"train_loss": -44.607540130615234, "global_step": 355203, "epoch": 2935} {"train_loss": -43.567623138427734, "global_step": 355204, "epoch": 2935} {"train_loss": -44.211727142333984, "global_step": 355205, "epoch": 2935} {"train_loss": -43.09080123901367, "global_step": 355206, "epoch": 2935} {"train_loss": -43.942012786865234, "global_step": 355207, "epoch": 2935} {"train_loss": -44.34005355834961, "global_step": 355208, "epoch": 2935} {"train_loss": -42.73297119140625, "global_step": 355209, "epoch": 2935} {"train_loss": -44.10195541381836, "global_step": 355210, "epoch": 2935} {"train_loss": -44.726478576660156, "global_step": 355211, "epoch": 2935} {"train_loss": -40.66701126098633, "global_step": 355212, "epoch": 2935} {"train_loss": -43.72315216064453, "global_step": 355213, "epoch": 2935} {"train_loss": -40.275569915771484, "global_step": 355214, "epoch": 2935} {"train_loss": -40.06075668334961, "global_step": 355215, "epoch": 2935} {"train_loss": -42.00513458251953, "global_step": 355216, "epoch": 2935} {"train_loss": -40.38277053833008, "global_step": 355217, "epoch": 2935} {"train_loss": -40.90071487426758, "global_step": 355218, "epoch": 2935} {"train_loss": -40.63161849975586, "global_step": 355219, "epoch": 2935} {"train_loss": -39.58552551269531, "global_step": 355220, "epoch": 2935} {"train_loss": -42.54884719848633, "global_step": 355221, "epoch": 2935} {"train_loss": -43.7876091003418, "global_step": 355222, "epoch": 2935} {"train_loss": -41.928279876708984, "global_step": 355223, "epoch": 2935} {"train_loss": -43.196773529052734, "global_step": 355224, "epoch": 2935} {"train_loss": -41.142127990722656, "global_step": 355225, "epoch": 2935} {"train_loss": -37.35743713378906, "global_step": 355226, "epoch": 2935} {"train_loss": -39.36351776123047, "global_step": 355227, "epoch": 2935} {"train_loss": -41.71976089477539, "global_step": 355228, "epoch": 2935} {"train_loss": -37.39883804321289, "global_step": 355229, "epoch": 2935} {"train_loss": -40.75591278076172, "global_step": 355230, "epoch": 2935} {"train_loss": -40.6395263671875, "global_step": 355231, "epoch": 2935} {"train_loss": -40.212398529052734, "global_step": 355232, "epoch": 2935} {"train_loss": -43.052330017089844, "global_step": 355233, "epoch": 2935} {"train_loss": -40.69692611694336, "global_step": 355234, "epoch": 2935} {"train_loss": -42.149322509765625, "global_step": 355235, "epoch": 2935} {"train_loss": -40.576290130615234, "global_step": 355236, "epoch": 2935} {"train_loss": -38.88755416870117, "global_step": 355237, "epoch": 2935} {"train_loss": -42.68387985229492, "global_step": 355238, "epoch": 2935} {"train_loss": -36.08702087402344, "global_step": 355239, "epoch": 2935} {"train_loss": -42.70608139038086, "global_step": 355240, "epoch": 2935} {"train_loss": -41.32293701171875, "global_step": 355241, "epoch": 2935} {"train_loss": -42.67160415649414, "global_step": 355242, "epoch": 2935} {"train_loss": -41.11676788330078, "global_step": 355243, "epoch": 2935} {"train_loss": -42.34123611450195, "global_step": 355244, "epoch": 2935} {"train_loss": -40.47303009033203, "global_step": 355245, "epoch": 2935} {"train_loss": -42.450904846191406, "global_step": 355246, "epoch": 2935} {"train_loss": -41.62563705444336, "global_step": 355247, "epoch": 2935} {"train_loss": -43.073455810546875, "global_step": 355248, "epoch": 2935} {"train_loss": -42.290985107421875, "global_step": 355249, "epoch": 2935} {"train_loss": -43.49934005737305, "global_step": 355250, "epoch": 2935} {"train_loss": -42.626705169677734, "global_step": 355251, "epoch": 2935} {"train_loss": -42.496742248535156, "global_step": 355252, "epoch": 2935} {"train_loss": -42.458370208740234, "global_step": 355253, "epoch": 2935} {"train_loss": -43.7194938659668, "global_step": 355254, "epoch": 2935} {"train_loss": -43.40242080057948, "global_step": 355255, "epoch": 2935, "val_loss": 2534239.75} {"train_loss": -43.26911544799805, "global_step": 355256, "epoch": 2936} {"train_loss": -43.127479553222656, "global_step": 355257, "epoch": 2936} {"train_loss": -43.46533966064453, "global_step": 355258, "epoch": 2936} {"train_loss": -42.4058723449707, "global_step": 355259, "epoch": 2936} {"train_loss": -43.96693801879883, "global_step": 355260, "epoch": 2936} {"train_loss": -44.13678741455078, "global_step": 355261, "epoch": 2936} {"train_loss": -43.52617263793945, "global_step": 355262, "epoch": 2936} {"train_loss": -41.515560150146484, "global_step": 355263, "epoch": 2936} {"train_loss": -43.4549674987793, "global_step": 355264, "epoch": 2936} {"train_loss": -44.02861404418945, "global_step": 355265, "epoch": 2936} {"train_loss": -44.4736328125, "global_step": 355266, "epoch": 2936} {"train_loss": -44.0698356628418, "global_step": 355267, "epoch": 2936} {"train_loss": -44.403621673583984, "global_step": 355268, "epoch": 2936} {"train_loss": -44.27727127075195, "global_step": 355269, "epoch": 2936} {"train_loss": -44.437801361083984, "global_step": 355270, "epoch": 2936} {"train_loss": -44.097774505615234, "global_step": 355271, "epoch": 2936} {"train_loss": -44.22224044799805, "global_step": 355272, "epoch": 2936} {"train_loss": -44.017696380615234, "global_step": 355273, "epoch": 2936} {"train_loss": -43.83808517456055, "global_step": 355274, "epoch": 2936} {"train_loss": -39.459228515625, "global_step": 355275, "epoch": 2936} {"train_loss": -44.76102828979492, "global_step": 355276, "epoch": 2936} {"train_loss": -43.63909912109375, "global_step": 355277, "epoch": 2936} {"train_loss": -44.910614013671875, "global_step": 355278, "epoch": 2936} {"train_loss": -43.62173843383789, "global_step": 355279, "epoch": 2936} {"train_loss": -44.28202819824219, "global_step": 355280, "epoch": 2936} {"train_loss": -43.82902145385742, "global_step": 355281, "epoch": 2936} {"train_loss": -44.661006927490234, "global_step": 355282, "epoch": 2936} {"train_loss": -43.949989318847656, "global_step": 355283, "epoch": 2936} {"train_loss": -43.7660026550293, "global_step": 355284, "epoch": 2936} {"train_loss": -42.93527603149414, "global_step": 355285, "epoch": 2936} {"train_loss": -40.07119369506836, "global_step": 355286, "epoch": 2936} {"train_loss": -44.07497024536133, "global_step": 355287, "epoch": 2936} {"train_loss": -43.519500732421875, "global_step": 355288, "epoch": 2936} {"train_loss": -44.00642776489258, "global_step": 355289, "epoch": 2936} {"train_loss": -44.91945266723633, "global_step": 355290, "epoch": 2936} {"train_loss": -43.71893310546875, "global_step": 355291, "epoch": 2936} {"train_loss": -44.22742462158203, "global_step": 355292, "epoch": 2936} {"train_loss": -43.062679290771484, "global_step": 355293, "epoch": 2936} {"train_loss": -43.76581954956055, "global_step": 355294, "epoch": 2936} {"train_loss": -44.19152069091797, "global_step": 355295, "epoch": 2936} {"train_loss": -44.70014190673828, "global_step": 355296, "epoch": 2936} {"train_loss": -44.698577880859375, "global_step": 355297, "epoch": 2936} {"train_loss": -44.0761833190918, "global_step": 355298, "epoch": 2936} {"train_loss": -44.561981201171875, "global_step": 355299, "epoch": 2936} {"train_loss": -43.897090911865234, "global_step": 355300, "epoch": 2936} {"train_loss": -45.00069046020508, "global_step": 355301, "epoch": 2936} {"train_loss": -44.823341369628906, "global_step": 355302, "epoch": 2936} {"train_loss": -42.56199645996094, "global_step": 355303, "epoch": 2936} {"train_loss": -45.063411712646484, "global_step": 355304, "epoch": 2936} {"train_loss": -45.04311752319336, "global_step": 355305, "epoch": 2936} {"train_loss": -44.60163497924805, "global_step": 355306, "epoch": 2936} {"train_loss": -44.67019271850586, "global_step": 355307, "epoch": 2936} {"train_loss": -44.8173713684082, "global_step": 355308, "epoch": 2936} {"train_loss": -44.24515151977539, "global_step": 355309, "epoch": 2936} {"train_loss": -45.130401611328125, "global_step": 355310, "epoch": 2936} {"train_loss": -44.952022552490234, "global_step": 355311, "epoch": 2936} {"train_loss": -45.616432189941406, "global_step": 355312, "epoch": 2936} {"train_loss": -45.0303955078125, "global_step": 355313, "epoch": 2936} {"train_loss": -45.00082778930664, "global_step": 355314, "epoch": 2936} {"train_loss": -44.89089584350586, "global_step": 355315, "epoch": 2936} {"train_loss": -44.8170280456543, "global_step": 355316, "epoch": 2936} {"train_loss": -44.85282516479492, "global_step": 355317, "epoch": 2936} {"train_loss": -44.476776123046875, "global_step": 355318, "epoch": 2936} {"train_loss": -44.97050857543945, "global_step": 355319, "epoch": 2936} {"train_loss": -44.844356536865234, "global_step": 355320, "epoch": 2936} {"train_loss": -44.783729553222656, "global_step": 355321, "epoch": 2936} {"train_loss": -44.99849319458008, "global_step": 355322, "epoch": 2936} {"train_loss": -44.2900390625, "global_step": 355323, "epoch": 2936} {"train_loss": -44.38287353515625, "global_step": 355324, "epoch": 2936} {"train_loss": -43.49354934692383, "global_step": 355325, "epoch": 2936} {"train_loss": -44.4885368347168, "global_step": 355326, "epoch": 2936} {"train_loss": -45.437347412109375, "global_step": 355327, "epoch": 2936} {"train_loss": -45.08179473876953, "global_step": 355328, "epoch": 2936} {"train_loss": -44.757930755615234, "global_step": 355329, "epoch": 2936} {"train_loss": -44.50197219848633, "global_step": 355330, "epoch": 2936} {"train_loss": -45.05427169799805, "global_step": 355331, "epoch": 2936} {"train_loss": -44.948822021484375, "global_step": 355332, "epoch": 2936} {"train_loss": -44.98976516723633, "global_step": 355333, "epoch": 2936} {"train_loss": -45.74659729003906, "global_step": 355334, "epoch": 2936} {"train_loss": -45.36379623413086, "global_step": 355335, "epoch": 2936} {"train_loss": -45.14365768432617, "global_step": 355336, "epoch": 2936} {"train_loss": -45.50493240356445, "global_step": 355337, "epoch": 2936} {"train_loss": -44.56170654296875, "global_step": 355338, "epoch": 2936} {"train_loss": -45.076847076416016, "global_step": 355339, "epoch": 2936} {"train_loss": -45.187435150146484, "global_step": 355340, "epoch": 2936} {"train_loss": -45.15565872192383, "global_step": 355341, "epoch": 2936} {"train_loss": -45.10270690917969, "global_step": 355342, "epoch": 2936} {"train_loss": -44.82483673095703, "global_step": 355343, "epoch": 2936} {"train_loss": -43.383968353271484, "global_step": 355344, "epoch": 2936} {"train_loss": -42.7348518371582, "global_step": 355345, "epoch": 2936} {"train_loss": -42.64598083496094, "global_step": 355346, "epoch": 2936} {"train_loss": -44.493587493896484, "global_step": 355347, "epoch": 2936} {"train_loss": -44.66047668457031, "global_step": 355348, "epoch": 2936} {"train_loss": -43.27385330200195, "global_step": 355349, "epoch": 2936} {"train_loss": -43.252410888671875, "global_step": 355350, "epoch": 2936} {"train_loss": -44.3817138671875, "global_step": 355351, "epoch": 2936} {"train_loss": -44.44784164428711, "global_step": 355352, "epoch": 2936} {"train_loss": -42.2085075378418, "global_step": 355353, "epoch": 2936} {"train_loss": -43.20331954956055, "global_step": 355354, "epoch": 2936} {"train_loss": -45.112403869628906, "global_step": 355355, "epoch": 2936} {"train_loss": -43.77162551879883, "global_step": 355356, "epoch": 2936} {"train_loss": -43.172706604003906, "global_step": 355357, "epoch": 2936} {"train_loss": -43.90366744995117, "global_step": 355358, "epoch": 2936} {"train_loss": -45.566253662109375, "global_step": 355359, "epoch": 2936} {"train_loss": -42.935420989990234, "global_step": 355360, "epoch": 2936} {"train_loss": -43.03071212768555, "global_step": 355361, "epoch": 2936} {"train_loss": -44.66111373901367, "global_step": 355362, "epoch": 2936} {"train_loss": -44.3024787902832, "global_step": 355363, "epoch": 2936} {"train_loss": -43.11574172973633, "global_step": 355364, "epoch": 2936} {"train_loss": -42.9595832824707, "global_step": 355365, "epoch": 2936} {"train_loss": -44.987548828125, "global_step": 355366, "epoch": 2936} {"train_loss": -44.14739227294922, "global_step": 355367, "epoch": 2936} {"train_loss": -43.832889556884766, "global_step": 355368, "epoch": 2936} {"train_loss": -44.7388801574707, "global_step": 355369, "epoch": 2936} {"train_loss": -44.58201217651367, "global_step": 355370, "epoch": 2936} {"train_loss": -45.42991256713867, "global_step": 355371, "epoch": 2936} {"train_loss": -44.03921127319336, "global_step": 355372, "epoch": 2936} {"train_loss": -44.498077392578125, "global_step": 355373, "epoch": 2936} {"train_loss": -44.90025329589844, "global_step": 355374, "epoch": 2936} {"train_loss": -43.97887420654297, "global_step": 355375, "epoch": 2936} {"train_loss": -44.191543768260104, "global_step": 355376, "epoch": 2936, "val_loss": 2467269.75} {"train_loss": -44.67525863647461, "global_step": 355377, "epoch": 2937} {"train_loss": -43.975830078125, "global_step": 355378, "epoch": 2937} {"train_loss": -44.61103439331055, "global_step": 355379, "epoch": 2937} {"train_loss": -44.76081466674805, "global_step": 355380, "epoch": 2937} {"train_loss": -45.04535675048828, "global_step": 355381, "epoch": 2937} {"train_loss": -44.76263427734375, "global_step": 355382, "epoch": 2937} {"train_loss": -44.547786712646484, "global_step": 355383, "epoch": 2937} {"train_loss": -44.89608383178711, "global_step": 355384, "epoch": 2937} {"train_loss": -45.25300979614258, "global_step": 355385, "epoch": 2937} {"train_loss": -44.80509948730469, "global_step": 355386, "epoch": 2937} {"train_loss": -44.59309768676758, "global_step": 355387, "epoch": 2937} {"train_loss": -44.75722885131836, "global_step": 355388, "epoch": 2937} {"train_loss": -44.56053924560547, "global_step": 355389, "epoch": 2937} {"train_loss": -44.91791534423828, "global_step": 355390, "epoch": 2937} {"train_loss": -45.03034210205078, "global_step": 355391, "epoch": 2937} {"train_loss": -43.53788757324219, "global_step": 355392, "epoch": 2937} {"train_loss": -44.23744583129883, "global_step": 355393, "epoch": 2937} {"train_loss": -44.735984802246094, "global_step": 355394, "epoch": 2937} {"train_loss": -43.85072708129883, "global_step": 355395, "epoch": 2937} {"train_loss": -44.54154586791992, "global_step": 355396, "epoch": 2937} {"train_loss": -45.4849967956543, "global_step": 355397, "epoch": 2937} {"train_loss": -44.55208969116211, "global_step": 355398, "epoch": 2937} {"train_loss": -44.857444763183594, "global_step": 355399, "epoch": 2937} {"train_loss": -44.71025085449219, "global_step": 355400, "epoch": 2937} {"train_loss": -44.7926139831543, "global_step": 355401, "epoch": 2937} {"train_loss": -44.46458053588867, "global_step": 355402, "epoch": 2937} {"train_loss": -43.956695556640625, "global_step": 355403, "epoch": 2937} {"train_loss": -43.776458740234375, "global_step": 355404, "epoch": 2937} {"train_loss": -44.6375617980957, "global_step": 355405, "epoch": 2937} {"train_loss": -44.28507995605469, "global_step": 355406, "epoch": 2937} {"train_loss": -44.349910736083984, "global_step": 355407, "epoch": 2937} {"train_loss": -44.4434814453125, "global_step": 355408, "epoch": 2937} {"train_loss": -44.6198844909668, "global_step": 355409, "epoch": 2937} {"train_loss": -43.639007568359375, "global_step": 355410, "epoch": 2937} {"train_loss": -42.30398178100586, "global_step": 355411, "epoch": 2937} {"train_loss": -43.95433044433594, "global_step": 355412, "epoch": 2937} {"train_loss": -43.464237213134766, "global_step": 355413, "epoch": 2937} {"train_loss": -43.577186584472656, "global_step": 355414, "epoch": 2937} {"train_loss": -44.19670104980469, "global_step": 355415, "epoch": 2937} {"train_loss": -45.24768829345703, "global_step": 355416, "epoch": 2937} {"train_loss": -41.81684494018555, "global_step": 355417, "epoch": 2937} {"train_loss": -43.83367919921875, "global_step": 355418, "epoch": 2937} {"train_loss": -42.76394271850586, "global_step": 355419, "epoch": 2937} {"train_loss": -42.18001937866211, "global_step": 355420, "epoch": 2937} {"train_loss": -43.81954574584961, "global_step": 355421, "epoch": 2937} {"train_loss": -42.40267562866211, "global_step": 355422, "epoch": 2937} {"train_loss": -43.1605339050293, "global_step": 355423, "epoch": 2937} {"train_loss": -44.28522491455078, "global_step": 355424, "epoch": 2937} {"train_loss": -43.38928985595703, "global_step": 355425, "epoch": 2937} {"train_loss": -43.90829086303711, "global_step": 355426, "epoch": 2937} {"train_loss": -43.17435836791992, "global_step": 355427, "epoch": 2937} {"train_loss": -44.87359619140625, "global_step": 355428, "epoch": 2937} {"train_loss": -42.967811584472656, "global_step": 355429, "epoch": 2937} {"train_loss": -43.55355453491211, "global_step": 355430, "epoch": 2937} {"train_loss": -41.8311767578125, "global_step": 355431, "epoch": 2937} {"train_loss": -42.981407165527344, "global_step": 355432, "epoch": 2937} {"train_loss": -44.32847595214844, "global_step": 355433, "epoch": 2937} {"train_loss": -43.58695602416992, "global_step": 355434, "epoch": 2937} {"train_loss": -43.49769592285156, "global_step": 355435, "epoch": 2937} {"train_loss": -44.12567138671875, "global_step": 355436, "epoch": 2937} {"train_loss": -43.83406448364258, "global_step": 355437, "epoch": 2937} {"train_loss": -43.93284606933594, "global_step": 355438, "epoch": 2937} {"train_loss": -43.8319206237793, "global_step": 355439, "epoch": 2937} {"train_loss": -43.844295501708984, "global_step": 355440, "epoch": 2937} {"train_loss": -44.68915939331055, "global_step": 355441, "epoch": 2937} {"train_loss": -43.2440071105957, "global_step": 355442, "epoch": 2937} {"train_loss": -41.118587493896484, "global_step": 355443, "epoch": 2937} {"train_loss": -44.401214599609375, "global_step": 355444, "epoch": 2937} {"train_loss": -44.227108001708984, "global_step": 355445, "epoch": 2937} {"train_loss": -42.0863151550293, "global_step": 355446, "epoch": 2937} {"train_loss": -43.94173049926758, "global_step": 355447, "epoch": 2937} {"train_loss": -43.94948959350586, "global_step": 355448, "epoch": 2937} {"train_loss": -43.00344467163086, "global_step": 355449, "epoch": 2937} {"train_loss": -44.908409118652344, "global_step": 355450, "epoch": 2937} {"train_loss": -43.550636291503906, "global_step": 355451, "epoch": 2937} {"train_loss": -44.35091781616211, "global_step": 355452, "epoch": 2937} {"train_loss": -43.86867904663086, "global_step": 355453, "epoch": 2937} {"train_loss": -44.45503616333008, "global_step": 355454, "epoch": 2937} {"train_loss": -44.119144439697266, "global_step": 355455, "epoch": 2937} {"train_loss": -44.626590728759766, "global_step": 355456, "epoch": 2937} {"train_loss": -44.63059997558594, "global_step": 355457, "epoch": 2937} {"train_loss": -44.645565032958984, "global_step": 355458, "epoch": 2937} {"train_loss": -43.633846282958984, "global_step": 355459, "epoch": 2937} {"train_loss": -44.68442153930664, "global_step": 355460, "epoch": 2937} {"train_loss": -44.81423568725586, "global_step": 355461, "epoch": 2937} {"train_loss": -44.415565490722656, "global_step": 355462, "epoch": 2937} {"train_loss": -44.0991096496582, "global_step": 355463, "epoch": 2937} {"train_loss": -44.52434158325195, "global_step": 355464, "epoch": 2937} {"train_loss": -44.80427169799805, "global_step": 355465, "epoch": 2937} {"train_loss": -45.06463623046875, "global_step": 355466, "epoch": 2937} {"train_loss": -44.663299560546875, "global_step": 355467, "epoch": 2937} {"train_loss": -44.428768157958984, "global_step": 355468, "epoch": 2937} {"train_loss": -44.85234069824219, "global_step": 355469, "epoch": 2937} {"train_loss": -44.81512451171875, "global_step": 355470, "epoch": 2937} {"train_loss": -43.81476974487305, "global_step": 355471, "epoch": 2937} {"train_loss": -44.74402618408203, "global_step": 355472, "epoch": 2937} {"train_loss": -44.21378707885742, "global_step": 355473, "epoch": 2937} {"train_loss": -44.424007415771484, "global_step": 355474, "epoch": 2937} {"train_loss": -44.47943878173828, "global_step": 355475, "epoch": 2937} {"train_loss": -44.472023010253906, "global_step": 355476, "epoch": 2937} {"train_loss": -43.917755126953125, "global_step": 355477, "epoch": 2937} {"train_loss": -45.38418960571289, "global_step": 355478, "epoch": 2937} {"train_loss": -45.271095275878906, "global_step": 355479, "epoch": 2937} {"train_loss": -44.906070709228516, "global_step": 355480, "epoch": 2937} {"train_loss": -45.754547119140625, "global_step": 355481, "epoch": 2937} {"train_loss": -44.54576873779297, "global_step": 355482, "epoch": 2937} {"train_loss": -45.71662521362305, "global_step": 355483, "epoch": 2937} {"train_loss": -44.943214416503906, "global_step": 355484, "epoch": 2937} {"train_loss": -45.3387451171875, "global_step": 355485, "epoch": 2937} {"train_loss": -45.251495361328125, "global_step": 355486, "epoch": 2937} {"train_loss": -43.939430236816406, "global_step": 355487, "epoch": 2937} {"train_loss": -44.95783233642578, "global_step": 355488, "epoch": 2937} {"train_loss": -44.850013732910156, "global_step": 355489, "epoch": 2937} {"train_loss": -43.90096664428711, "global_step": 355490, "epoch": 2937} {"train_loss": -44.807708740234375, "global_step": 355491, "epoch": 2937} {"train_loss": -44.28570556640625, "global_step": 355492, "epoch": 2937} {"train_loss": -44.489383697509766, "global_step": 355493, "epoch": 2937} {"train_loss": -43.65633773803711, "global_step": 355494, "epoch": 2937} {"train_loss": -43.9987907409668, "global_step": 355495, "epoch": 2937} {"train_loss": -43.99265670776367, "global_step": 355496, "epoch": 2937} {"train_loss": -44.19171798327738, "global_step": 355497, "epoch": 2937, "val_loss": 2515563.75} {"train_loss": -44.30905532836914, "global_step": 355498, "epoch": 2938} {"train_loss": -42.893951416015625, "global_step": 355499, "epoch": 2938} {"train_loss": -44.38752365112305, "global_step": 355500, "epoch": 2938} {"train_loss": -42.816219329833984, "global_step": 355501, "epoch": 2938} {"train_loss": -44.900997161865234, "global_step": 355502, "epoch": 2938} {"train_loss": -43.6272087097168, "global_step": 355503, "epoch": 2938} {"train_loss": -44.6308708190918, "global_step": 355504, "epoch": 2938} {"train_loss": -43.275169372558594, "global_step": 355505, "epoch": 2938} {"train_loss": -42.18855667114258, "global_step": 355506, "epoch": 2938} {"train_loss": -41.9889030456543, "global_step": 355507, "epoch": 2938} {"train_loss": -42.50399398803711, "global_step": 355508, "epoch": 2938} {"train_loss": -43.0378532409668, "global_step": 355509, "epoch": 2938} {"train_loss": -42.212398529052734, "global_step": 355510, "epoch": 2938} {"train_loss": -40.600624084472656, "global_step": 355511, "epoch": 2938} {"train_loss": -42.65548324584961, "global_step": 355512, "epoch": 2938} {"train_loss": -43.07575225830078, "global_step": 355513, "epoch": 2938} {"train_loss": -43.530906677246094, "global_step": 355514, "epoch": 2938} {"train_loss": -42.05670166015625, "global_step": 355515, "epoch": 2938} {"train_loss": -43.597599029541016, "global_step": 355516, "epoch": 2938} {"train_loss": -44.12227249145508, "global_step": 355517, "epoch": 2938} {"train_loss": -43.19388198852539, "global_step": 355518, "epoch": 2938} {"train_loss": -43.59756088256836, "global_step": 355519, "epoch": 2938} {"train_loss": -43.614051818847656, "global_step": 355520, "epoch": 2938} {"train_loss": -43.11568069458008, "global_step": 355521, "epoch": 2938} {"train_loss": -43.30363845825195, "global_step": 355522, "epoch": 2938} {"train_loss": -43.15607833862305, "global_step": 355523, "epoch": 2938} {"train_loss": -44.56745910644531, "global_step": 355524, "epoch": 2938} {"train_loss": -43.6954460144043, "global_step": 355525, "epoch": 2938} {"train_loss": -44.21366500854492, "global_step": 355526, "epoch": 2938} {"train_loss": -44.16621398925781, "global_step": 355527, "epoch": 2938} {"train_loss": -42.10150909423828, "global_step": 355528, "epoch": 2938} {"train_loss": -44.71913146972656, "global_step": 355529, "epoch": 2938} {"train_loss": -44.31343460083008, "global_step": 355530, "epoch": 2938} {"train_loss": -44.01498031616211, "global_step": 355531, "epoch": 2938} {"train_loss": -45.055110931396484, "global_step": 355532, "epoch": 2938} {"train_loss": -43.930721282958984, "global_step": 355533, "epoch": 2938} {"train_loss": -43.98439407348633, "global_step": 355534, "epoch": 2938} {"train_loss": -45.03353500366211, "global_step": 355535, "epoch": 2938} {"train_loss": -44.04537582397461, "global_step": 355536, "epoch": 2938} {"train_loss": -44.84299850463867, "global_step": 355537, "epoch": 2938} {"train_loss": -45.2564811706543, "global_step": 355538, "epoch": 2938} {"train_loss": -44.723594665527344, "global_step": 355539, "epoch": 2938} {"train_loss": -44.14273452758789, "global_step": 355540, "epoch": 2938} {"train_loss": -45.05984115600586, "global_step": 355541, "epoch": 2938} {"train_loss": -44.600948333740234, "global_step": 355542, "epoch": 2938} {"train_loss": -43.54732894897461, "global_step": 355543, "epoch": 2938} {"train_loss": -44.445899963378906, "global_step": 355544, "epoch": 2938} {"train_loss": -44.49003982543945, "global_step": 355545, "epoch": 2938} {"train_loss": -44.36316680908203, "global_step": 355546, "epoch": 2938} {"train_loss": -44.405120849609375, "global_step": 355547, "epoch": 2938} {"train_loss": -43.9892692565918, "global_step": 355548, "epoch": 2938} {"train_loss": -44.81099319458008, "global_step": 355549, "epoch": 2938} {"train_loss": -43.31364059448242, "global_step": 355550, "epoch": 2938} {"train_loss": -44.32656478881836, "global_step": 355551, "epoch": 2938} {"train_loss": -45.15973663330078, "global_step": 355552, "epoch": 2938} {"train_loss": -44.18487548828125, "global_step": 355553, "epoch": 2938} {"train_loss": -44.846961975097656, "global_step": 355554, "epoch": 2938} {"train_loss": -44.22970199584961, "global_step": 355555, "epoch": 2938} {"train_loss": -44.917091369628906, "global_step": 355556, "epoch": 2938} {"train_loss": -44.92810821533203, "global_step": 355557, "epoch": 2938} {"train_loss": -44.42558288574219, "global_step": 355558, "epoch": 2938} {"train_loss": -45.000057220458984, "global_step": 355559, "epoch": 2938} {"train_loss": -44.648460388183594, "global_step": 355560, "epoch": 2938} {"train_loss": -43.88645553588867, "global_step": 355561, "epoch": 2938} {"train_loss": -44.12506866455078, "global_step": 355562, "epoch": 2938} {"train_loss": -45.042720794677734, "global_step": 355563, "epoch": 2938} {"train_loss": -44.14133834838867, "global_step": 355564, "epoch": 2938} {"train_loss": -43.6914176940918, "global_step": 355565, "epoch": 2938} {"train_loss": -42.17971420288086, "global_step": 355566, "epoch": 2938} {"train_loss": -43.86668014526367, "global_step": 355567, "epoch": 2938} {"train_loss": -44.16205596923828, "global_step": 355568, "epoch": 2938} {"train_loss": -42.26445007324219, "global_step": 355569, "epoch": 2938} {"train_loss": -43.87565994262695, "global_step": 355570, "epoch": 2938} {"train_loss": -43.2820930480957, "global_step": 355571, "epoch": 2938} {"train_loss": -43.651859283447266, "global_step": 355572, "epoch": 2938} {"train_loss": -44.42474365234375, "global_step": 355573, "epoch": 2938} {"train_loss": -44.73213577270508, "global_step": 355574, "epoch": 2938} {"train_loss": -43.790462493896484, "global_step": 355575, "epoch": 2938} {"train_loss": -43.82011032104492, "global_step": 355576, "epoch": 2938} {"train_loss": -44.69350051879883, "global_step": 355577, "epoch": 2938} {"train_loss": -43.34539031982422, "global_step": 355578, "epoch": 2938} {"train_loss": -43.08210372924805, "global_step": 355579, "epoch": 2938} {"train_loss": -43.62229537963867, "global_step": 355580, "epoch": 2938} {"train_loss": -43.71171188354492, "global_step": 355581, "epoch": 2938} {"train_loss": -43.691612243652344, "global_step": 355582, "epoch": 2938} {"train_loss": -44.654293060302734, "global_step": 355583, "epoch": 2938} {"train_loss": -42.255672454833984, "global_step": 355584, "epoch": 2938} {"train_loss": -42.85736083984375, "global_step": 355585, "epoch": 2938} {"train_loss": -44.9647331237793, "global_step": 355586, "epoch": 2938} {"train_loss": -44.94269561767578, "global_step": 355587, "epoch": 2938} {"train_loss": -44.5873908996582, "global_step": 355588, "epoch": 2938} {"train_loss": -45.438838958740234, "global_step": 355589, "epoch": 2938} {"train_loss": -44.4348030090332, "global_step": 355590, "epoch": 2938} {"train_loss": -45.260963439941406, "global_step": 355591, "epoch": 2938} {"train_loss": -45.15906524658203, "global_step": 355592, "epoch": 2938} {"train_loss": -44.7352409362793, "global_step": 355593, "epoch": 2938} {"train_loss": -44.673892974853516, "global_step": 355594, "epoch": 2938} {"train_loss": -45.19484329223633, "global_step": 355595, "epoch": 2938} {"train_loss": -44.8670654296875, "global_step": 355596, "epoch": 2938} {"train_loss": -45.2164421081543, "global_step": 355597, "epoch": 2938} {"train_loss": -44.813838958740234, "global_step": 355598, "epoch": 2938} {"train_loss": -43.824378967285156, "global_step": 355599, "epoch": 2938} {"train_loss": -44.18880844116211, "global_step": 355600, "epoch": 2938} {"train_loss": -45.57065963745117, "global_step": 355601, "epoch": 2938} {"train_loss": -44.443397521972656, "global_step": 355602, "epoch": 2938} {"train_loss": -44.17206954956055, "global_step": 355603, "epoch": 2938} {"train_loss": -44.71425247192383, "global_step": 355604, "epoch": 2938} {"train_loss": -45.418190002441406, "global_step": 355605, "epoch": 2938} {"train_loss": -45.468231201171875, "global_step": 355606, "epoch": 2938} {"train_loss": -45.319190979003906, "global_step": 355607, "epoch": 2938} {"train_loss": -44.9548225402832, "global_step": 355608, "epoch": 2938} {"train_loss": -45.50150680541992, "global_step": 355609, "epoch": 2938} {"train_loss": -45.074859619140625, "global_step": 355610, "epoch": 2938} {"train_loss": -45.851924896240234, "global_step": 355611, "epoch": 2938} {"train_loss": -45.52070236206055, "global_step": 355612, "epoch": 2938} {"train_loss": -44.87092208862305, "global_step": 355613, "epoch": 2938} {"train_loss": -43.69367218017578, "global_step": 355614, "epoch": 2938} {"train_loss": -44.95851516723633, "global_step": 355615, "epoch": 2938} {"train_loss": -45.29456329345703, "global_step": 355616, "epoch": 2938} {"train_loss": -45.40278244018555, "global_step": 355617, "epoch": 2938} {"train_loss": -44.14455000822209, "global_step": 355618, "epoch": 2938, "val_loss": 2551390.75} {"train_loss": -46.022762298583984, "global_step": 355619, "epoch": 2939} {"train_loss": -45.534400939941406, "global_step": 355620, "epoch": 2939} {"train_loss": -45.57497787475586, "global_step": 355621, "epoch": 2939} {"train_loss": -45.58123016357422, "global_step": 355622, "epoch": 2939} {"train_loss": -45.50005340576172, "global_step": 355623, "epoch": 2939} {"train_loss": -45.4763069152832, "global_step": 355624, "epoch": 2939} {"train_loss": -45.1153564453125, "global_step": 355625, "epoch": 2939} {"train_loss": -45.612884521484375, "global_step": 355626, "epoch": 2939} {"train_loss": -45.11482620239258, "global_step": 355627, "epoch": 2939} {"train_loss": -44.024105072021484, "global_step": 355628, "epoch": 2939} {"train_loss": -43.15271759033203, "global_step": 355629, "epoch": 2939} {"train_loss": -45.39089584350586, "global_step": 355630, "epoch": 2939} {"train_loss": -43.912017822265625, "global_step": 355631, "epoch": 2939} {"train_loss": -43.41572189331055, "global_step": 355632, "epoch": 2939} {"train_loss": -43.31454086303711, "global_step": 355633, "epoch": 2939} {"train_loss": -43.61548614501953, "global_step": 355634, "epoch": 2939} {"train_loss": -44.626033782958984, "global_step": 355635, "epoch": 2939} {"train_loss": -43.93008041381836, "global_step": 355636, "epoch": 2939} {"train_loss": -43.90593338012695, "global_step": 355637, "epoch": 2939} {"train_loss": -44.44797897338867, "global_step": 355638, "epoch": 2939} {"train_loss": -43.85494613647461, "global_step": 355639, "epoch": 2939} {"train_loss": -42.74062728881836, "global_step": 355640, "epoch": 2939} {"train_loss": -45.08053207397461, "global_step": 355641, "epoch": 2939} {"train_loss": -44.24333953857422, "global_step": 355642, "epoch": 2939} {"train_loss": -43.71232986450195, "global_step": 355643, "epoch": 2939} {"train_loss": -44.47919464111328, "global_step": 355644, "epoch": 2939} {"train_loss": -45.0332145690918, "global_step": 355645, "epoch": 2939} {"train_loss": -44.026702880859375, "global_step": 355646, "epoch": 2939} {"train_loss": -43.26140213012695, "global_step": 355647, "epoch": 2939} {"train_loss": -43.9034309387207, "global_step": 355648, "epoch": 2939} {"train_loss": -44.33323287963867, "global_step": 355649, "epoch": 2939} {"train_loss": -43.2891960144043, "global_step": 355650, "epoch": 2939} {"train_loss": -43.60866165161133, "global_step": 355651, "epoch": 2939} {"train_loss": -44.03082275390625, "global_step": 355652, "epoch": 2939} {"train_loss": -44.98844528198242, "global_step": 355653, "epoch": 2939} {"train_loss": -44.416969299316406, "global_step": 355654, "epoch": 2939} {"train_loss": -43.66895294189453, "global_step": 355655, "epoch": 2939} {"train_loss": -45.39717483520508, "global_step": 355656, "epoch": 2939} {"train_loss": -43.21699523925781, "global_step": 355657, "epoch": 2939} {"train_loss": -43.69770812988281, "global_step": 355658, "epoch": 2939} {"train_loss": -44.61404037475586, "global_step": 355659, "epoch": 2939} {"train_loss": -43.83388137817383, "global_step": 355660, "epoch": 2939} {"train_loss": -44.81185531616211, "global_step": 355661, "epoch": 2939} {"train_loss": -44.35871887207031, "global_step": 355662, "epoch": 2939} {"train_loss": -43.902008056640625, "global_step": 355663, "epoch": 2939} {"train_loss": -44.50829315185547, "global_step": 355664, "epoch": 2939} {"train_loss": -44.010162353515625, "global_step": 355665, "epoch": 2939} {"train_loss": -44.26171875, "global_step": 355666, "epoch": 2939} {"train_loss": -45.13427734375, "global_step": 355667, "epoch": 2939} {"train_loss": -44.35684585571289, "global_step": 355668, "epoch": 2939} {"train_loss": -44.722572326660156, "global_step": 355669, "epoch": 2939} {"train_loss": -45.0325813293457, "global_step": 355670, "epoch": 2939} {"train_loss": -44.79890441894531, "global_step": 355671, "epoch": 2939} {"train_loss": -44.46453857421875, "global_step": 355672, "epoch": 2939} {"train_loss": -45.15676498413086, "global_step": 355673, "epoch": 2939} {"train_loss": -44.99321746826172, "global_step": 355674, "epoch": 2939} {"train_loss": -44.307369232177734, "global_step": 355675, "epoch": 2939} {"train_loss": -45.281246185302734, "global_step": 355676, "epoch": 2939} {"train_loss": -44.91693878173828, "global_step": 355677, "epoch": 2939} {"train_loss": -44.509639739990234, "global_step": 355678, "epoch": 2939} {"train_loss": -44.63843536376953, "global_step": 355679, "epoch": 2939} {"train_loss": -45.273372650146484, "global_step": 355680, "epoch": 2939} {"train_loss": -44.01762008666992, "global_step": 355681, "epoch": 2939} {"train_loss": -44.53852462768555, "global_step": 355682, "epoch": 2939} {"train_loss": -45.076961517333984, "global_step": 355683, "epoch": 2939} {"train_loss": -45.38996887207031, "global_step": 355684, "epoch": 2939} {"train_loss": -44.79120635986328, "global_step": 355685, "epoch": 2939} {"train_loss": -45.11710739135742, "global_step": 355686, "epoch": 2939} {"train_loss": -44.68865966796875, "global_step": 355687, "epoch": 2939} {"train_loss": -44.12428665161133, "global_step": 355688, "epoch": 2939} {"train_loss": -44.463558197021484, "global_step": 355689, "epoch": 2939} {"train_loss": -44.11663818359375, "global_step": 355690, "epoch": 2939} {"train_loss": -44.5142707824707, "global_step": 355691, "epoch": 2939} {"train_loss": -44.93095779418945, "global_step": 355692, "epoch": 2939} {"train_loss": -44.31728744506836, "global_step": 355693, "epoch": 2939} {"train_loss": -44.90829086303711, "global_step": 355694, "epoch": 2939} {"train_loss": -44.645057678222656, "global_step": 355695, "epoch": 2939} {"train_loss": -44.853919982910156, "global_step": 355696, "epoch": 2939} {"train_loss": -45.1734733581543, "global_step": 355697, "epoch": 2939} {"train_loss": -45.31545639038086, "global_step": 355698, "epoch": 2939} {"train_loss": -45.134151458740234, "global_step": 355699, "epoch": 2939} {"train_loss": -45.348262786865234, "global_step": 355700, "epoch": 2939} {"train_loss": -44.73571014404297, "global_step": 355701, "epoch": 2939} {"train_loss": -44.026546478271484, "global_step": 355702, "epoch": 2939} {"train_loss": -44.08219909667969, "global_step": 355703, "epoch": 2939} {"train_loss": -45.1353874206543, "global_step": 355704, "epoch": 2939} {"train_loss": -45.29713439941406, "global_step": 355705, "epoch": 2939} {"train_loss": -44.834163665771484, "global_step": 355706, "epoch": 2939} {"train_loss": -44.61051559448242, "global_step": 355707, "epoch": 2939} {"train_loss": -44.58648681640625, "global_step": 355708, "epoch": 2939} {"train_loss": -43.89657211303711, "global_step": 355709, "epoch": 2939} {"train_loss": -41.15673065185547, "global_step": 355710, "epoch": 2939} {"train_loss": -44.08179473876953, "global_step": 355711, "epoch": 2939} {"train_loss": -45.19331359863281, "global_step": 355712, "epoch": 2939} {"train_loss": -45.28399658203125, "global_step": 355713, "epoch": 2939} {"train_loss": -44.61733627319336, "global_step": 355714, "epoch": 2939} {"train_loss": -44.136775970458984, "global_step": 355715, "epoch": 2939} {"train_loss": -43.729740142822266, "global_step": 355716, "epoch": 2939} {"train_loss": -44.77300262451172, "global_step": 355717, "epoch": 2939} {"train_loss": -44.47144317626953, "global_step": 355718, "epoch": 2939} {"train_loss": -43.168182373046875, "global_step": 355719, "epoch": 2939} {"train_loss": -43.17702865600586, "global_step": 355720, "epoch": 2939} {"train_loss": -43.995697021484375, "global_step": 355721, "epoch": 2939} {"train_loss": -45.0587043762207, "global_step": 355722, "epoch": 2939} {"train_loss": -43.40033721923828, "global_step": 355723, "epoch": 2939} {"train_loss": -43.34304428100586, "global_step": 355724, "epoch": 2939} {"train_loss": -43.667510986328125, "global_step": 355725, "epoch": 2939} {"train_loss": -43.56577682495117, "global_step": 355726, "epoch": 2939} {"train_loss": -43.26386642456055, "global_step": 355727, "epoch": 2939} {"train_loss": -43.51497268676758, "global_step": 355728, "epoch": 2939} {"train_loss": -44.14484786987305, "global_step": 355729, "epoch": 2939} {"train_loss": -42.6607551574707, "global_step": 355730, "epoch": 2939} {"train_loss": -42.6960563659668, "global_step": 355731, "epoch": 2939} {"train_loss": -44.67277145385742, "global_step": 355732, "epoch": 2939} {"train_loss": -44.57041931152344, "global_step": 355733, "epoch": 2939} {"train_loss": -42.629051208496094, "global_step": 355734, "epoch": 2939} {"train_loss": -44.782447814941406, "global_step": 355735, "epoch": 2939} {"train_loss": -43.15476608276367, "global_step": 355736, "epoch": 2939} {"train_loss": -44.43567657470703, "global_step": 355737, "epoch": 2939} {"train_loss": -44.916744232177734, "global_step": 355738, "epoch": 2939} {"train_loss": -44.367044054772244, "global_step": 355739, "epoch": 2939, "val_loss": 2613028.25} {"train_loss": -44.592891693115234, "global_step": 355740, "epoch": 2940} {"train_loss": -45.2798957824707, "global_step": 355741, "epoch": 2940} {"train_loss": -44.59357833862305, "global_step": 355742, "epoch": 2940} {"train_loss": -44.890625, "global_step": 355743, "epoch": 2940} {"train_loss": -45.36860275268555, "global_step": 355744, "epoch": 2940} {"train_loss": -44.37604522705078, "global_step": 355745, "epoch": 2940} {"train_loss": -45.040740966796875, "global_step": 355746, "epoch": 2940} {"train_loss": -45.079769134521484, "global_step": 355747, "epoch": 2940} {"train_loss": -45.038429260253906, "global_step": 355748, "epoch": 2940} {"train_loss": -45.19633102416992, "global_step": 355749, "epoch": 2940} {"train_loss": -44.465938568115234, "global_step": 355750, "epoch": 2940} {"train_loss": -44.00014877319336, "global_step": 355751, "epoch": 2940} {"train_loss": -44.74134063720703, "global_step": 355752, "epoch": 2940} {"train_loss": -45.39259719848633, "global_step": 355753, "epoch": 2940} {"train_loss": -44.51848220825195, "global_step": 355754, "epoch": 2940} {"train_loss": -45.0194206237793, "global_step": 355755, "epoch": 2940} {"train_loss": -45.116943359375, "global_step": 355756, "epoch": 2940} {"train_loss": -43.93359375, "global_step": 355757, "epoch": 2940} {"train_loss": -45.53581237792969, "global_step": 355758, "epoch": 2940} {"train_loss": -45.49966049194336, "global_step": 355759, "epoch": 2940} {"train_loss": -44.92498016357422, "global_step": 355760, "epoch": 2940} {"train_loss": -45.48672866821289, "global_step": 355761, "epoch": 2940} {"train_loss": -45.48286056518555, "global_step": 355762, "epoch": 2940} {"train_loss": -45.18000411987305, "global_step": 355763, "epoch": 2940} {"train_loss": -45.01096725463867, "global_step": 355764, "epoch": 2940} {"train_loss": -45.32265853881836, "global_step": 355765, "epoch": 2940} {"train_loss": -45.53626251220703, "global_step": 355766, "epoch": 2940} {"train_loss": -44.23342514038086, "global_step": 355767, "epoch": 2940} {"train_loss": -45.01853942871094, "global_step": 355768, "epoch": 2940} {"train_loss": -45.47393798828125, "global_step": 355769, "epoch": 2940} {"train_loss": -44.84465408325195, "global_step": 355770, "epoch": 2940} {"train_loss": -44.99311447143555, "global_step": 355771, "epoch": 2940} {"train_loss": -45.04266357421875, "global_step": 355772, "epoch": 2940} {"train_loss": -44.63615036010742, "global_step": 355773, "epoch": 2940} {"train_loss": -44.407955169677734, "global_step": 355774, "epoch": 2940} {"train_loss": -44.54121017456055, "global_step": 355775, "epoch": 2940} {"train_loss": -44.25208282470703, "global_step": 355776, "epoch": 2940} {"train_loss": -44.41831588745117, "global_step": 355777, "epoch": 2940} {"train_loss": -44.64765548706055, "global_step": 355778, "epoch": 2940} {"train_loss": -45.11585235595703, "global_step": 355779, "epoch": 2940} {"train_loss": -43.79645538330078, "global_step": 355780, "epoch": 2940} {"train_loss": -44.52639389038086, "global_step": 355781, "epoch": 2940} {"train_loss": -44.097225189208984, "global_step": 355782, "epoch": 2940} {"train_loss": -45.37150573730469, "global_step": 355783, "epoch": 2940} {"train_loss": -45.2011833190918, "global_step": 355784, "epoch": 2940} {"train_loss": -44.342159271240234, "global_step": 355785, "epoch": 2940} {"train_loss": -44.628692626953125, "global_step": 355786, "epoch": 2940} {"train_loss": -44.25476837158203, "global_step": 355787, "epoch": 2940} {"train_loss": -44.975250244140625, "global_step": 355788, "epoch": 2940} {"train_loss": -44.53853988647461, "global_step": 355789, "epoch": 2940} {"train_loss": -43.113765716552734, "global_step": 355790, "epoch": 2940} {"train_loss": -43.93153762817383, "global_step": 355791, "epoch": 2940} {"train_loss": -44.8040657043457, "global_step": 355792, "epoch": 2940} {"train_loss": -44.65676498413086, "global_step": 355793, "epoch": 2940} {"train_loss": -43.14347839355469, "global_step": 355794, "epoch": 2940} {"train_loss": -42.755672454833984, "global_step": 355795, "epoch": 2940} {"train_loss": -44.56159210205078, "global_step": 355796, "epoch": 2940} {"train_loss": -44.581295013427734, "global_step": 355797, "epoch": 2940} {"train_loss": -44.73441696166992, "global_step": 355798, "epoch": 2940} {"train_loss": -44.8698844909668, "global_step": 355799, "epoch": 2940} {"train_loss": -44.278255462646484, "global_step": 355800, "epoch": 2940} {"train_loss": -45.080047607421875, "global_step": 355801, "epoch": 2940} {"train_loss": -43.70076370239258, "global_step": 355802, "epoch": 2940} {"train_loss": -44.322418212890625, "global_step": 355803, "epoch": 2940} {"train_loss": -45.5050048828125, "global_step": 355804, "epoch": 2940} {"train_loss": -44.02375793457031, "global_step": 355805, "epoch": 2940} {"train_loss": -42.92104721069336, "global_step": 355806, "epoch": 2940} {"train_loss": -44.52295684814453, "global_step": 355807, "epoch": 2940} {"train_loss": -44.701255798339844, "global_step": 355808, "epoch": 2940} {"train_loss": -44.668060302734375, "global_step": 355809, "epoch": 2940} {"train_loss": -44.74737548828125, "global_step": 355810, "epoch": 2940} {"train_loss": -44.43687057495117, "global_step": 355811, "epoch": 2940} {"train_loss": -45.17106246948242, "global_step": 355812, "epoch": 2940} {"train_loss": -44.62319564819336, "global_step": 355813, "epoch": 2940} {"train_loss": -45.104347229003906, "global_step": 355814, "epoch": 2940} {"train_loss": -44.73884201049805, "global_step": 355815, "epoch": 2940} {"train_loss": -44.361385345458984, "global_step": 355816, "epoch": 2940} {"train_loss": -45.278358459472656, "global_step": 355817, "epoch": 2940} {"train_loss": -44.7437858581543, "global_step": 355818, "epoch": 2940} {"train_loss": -44.10232162475586, "global_step": 355819, "epoch": 2940} {"train_loss": -45.18541717529297, "global_step": 355820, "epoch": 2940} {"train_loss": -44.56437301635742, "global_step": 355821, "epoch": 2940} {"train_loss": -43.96505355834961, "global_step": 355822, "epoch": 2940} {"train_loss": -45.09212112426758, "global_step": 355823, "epoch": 2940} {"train_loss": -45.352325439453125, "global_step": 355824, "epoch": 2940} {"train_loss": -44.93174362182617, "global_step": 355825, "epoch": 2940} {"train_loss": -44.590736389160156, "global_step": 355826, "epoch": 2940} {"train_loss": -44.7941780090332, "global_step": 355827, "epoch": 2940} {"train_loss": -44.85984802246094, "global_step": 355828, "epoch": 2940} {"train_loss": -44.7656364440918, "global_step": 355829, "epoch": 2940} {"train_loss": -45.08199691772461, "global_step": 355830, "epoch": 2940} {"train_loss": -45.11898422241211, "global_step": 355831, "epoch": 2940} {"train_loss": -44.760528564453125, "global_step": 355832, "epoch": 2940} {"train_loss": -45.27992630004883, "global_step": 355833, "epoch": 2940} {"train_loss": -45.236812591552734, "global_step": 355834, "epoch": 2940} {"train_loss": -44.857826232910156, "global_step": 355835, "epoch": 2940} {"train_loss": -44.93464279174805, "global_step": 355836, "epoch": 2940} {"train_loss": -45.291316986083984, "global_step": 355837, "epoch": 2940} {"train_loss": -44.73054122924805, "global_step": 355838, "epoch": 2940} {"train_loss": -44.748348236083984, "global_step": 355839, "epoch": 2940} {"train_loss": -44.627403259277344, "global_step": 355840, "epoch": 2940} {"train_loss": -45.11837387084961, "global_step": 355841, "epoch": 2940} {"train_loss": -44.458473205566406, "global_step": 355842, "epoch": 2940} {"train_loss": -43.62632751464844, "global_step": 355843, "epoch": 2940} {"train_loss": -43.753318786621094, "global_step": 355844, "epoch": 2940} {"train_loss": -45.011573791503906, "global_step": 355845, "epoch": 2940} {"train_loss": -43.79036331176758, "global_step": 355846, "epoch": 2940} {"train_loss": -41.460697174072266, "global_step": 355847, "epoch": 2940} {"train_loss": -43.76332092285156, "global_step": 355848, "epoch": 2940} {"train_loss": -44.772308349609375, "global_step": 355849, "epoch": 2940} {"train_loss": -43.27849197387695, "global_step": 355850, "epoch": 2940} {"train_loss": -42.9010124206543, "global_step": 355851, "epoch": 2940} {"train_loss": -44.804141998291016, "global_step": 355852, "epoch": 2940} {"train_loss": -43.802162170410156, "global_step": 355853, "epoch": 2940} {"train_loss": -43.209590911865234, "global_step": 355854, "epoch": 2940} {"train_loss": -44.24675369262695, "global_step": 355855, "epoch": 2940} {"train_loss": -42.76200485229492, "global_step": 355856, "epoch": 2940} {"train_loss": -43.28544616699219, "global_step": 355857, "epoch": 2940} {"train_loss": -43.4305305480957, "global_step": 355858, "epoch": 2940} {"train_loss": -41.316856384277344, "global_step": 355859, "epoch": 2940} {"train_loss": -44.54276912468524, "global_step": 355860, "epoch": 2940, "val_loss": 2491634.0} {"train_loss": -39.9902458190918, "global_step": 355861, "epoch": 2941} {"train_loss": -42.799739837646484, "global_step": 355862, "epoch": 2941} {"train_loss": -38.0919303894043, "global_step": 355863, "epoch": 2941} {"train_loss": -40.925716400146484, "global_step": 355864, "epoch": 2941} {"train_loss": -41.74281692504883, "global_step": 355865, "epoch": 2941} {"train_loss": -39.13218688964844, "global_step": 355866, "epoch": 2941} {"train_loss": -39.7835693359375, "global_step": 355867, "epoch": 2941} {"train_loss": -37.4857292175293, "global_step": 355868, "epoch": 2941} {"train_loss": -40.79384231567383, "global_step": 355869, "epoch": 2941} {"train_loss": -40.05160140991211, "global_step": 355870, "epoch": 2941} {"train_loss": -36.51376724243164, "global_step": 355871, "epoch": 2941} {"train_loss": -37.790870666503906, "global_step": 355872, "epoch": 2941} {"train_loss": -38.83417892456055, "global_step": 355873, "epoch": 2941} {"train_loss": -33.74917221069336, "global_step": 355874, "epoch": 2941} {"train_loss": -38.20892333984375, "global_step": 355875, "epoch": 2941} {"train_loss": -34.75319290161133, "global_step": 355876, "epoch": 2941} {"train_loss": -37.12510681152344, "global_step": 355877, "epoch": 2941} {"train_loss": -40.07687759399414, "global_step": 355878, "epoch": 2941} {"train_loss": -38.11597442626953, "global_step": 355879, "epoch": 2941} {"train_loss": -41.20144271850586, "global_step": 355880, "epoch": 2941} {"train_loss": -41.06245040893555, "global_step": 355881, "epoch": 2941} {"train_loss": -40.75050735473633, "global_step": 355882, "epoch": 2941} {"train_loss": -42.51560592651367, "global_step": 355883, "epoch": 2941} {"train_loss": -41.654205322265625, "global_step": 355884, "epoch": 2941} {"train_loss": -42.15956115722656, "global_step": 355885, "epoch": 2941} {"train_loss": -43.04963302612305, "global_step": 355886, "epoch": 2941} {"train_loss": -42.60404586791992, "global_step": 355887, "epoch": 2941} {"train_loss": -42.59419631958008, "global_step": 355888, "epoch": 2941} {"train_loss": -42.19526672363281, "global_step": 355889, "epoch": 2941} {"train_loss": -43.033660888671875, "global_step": 355890, "epoch": 2941} {"train_loss": -43.1338005065918, "global_step": 355891, "epoch": 2941} {"train_loss": -43.024810791015625, "global_step": 355892, "epoch": 2941} {"train_loss": -43.45270538330078, "global_step": 355893, "epoch": 2941} {"train_loss": -43.711769104003906, "global_step": 355894, "epoch": 2941} {"train_loss": -43.49271774291992, "global_step": 355895, "epoch": 2941} {"train_loss": -43.41257095336914, "global_step": 355896, "epoch": 2941} {"train_loss": -43.68883514404297, "global_step": 355897, "epoch": 2941} {"train_loss": -43.60587692260742, "global_step": 355898, "epoch": 2941} {"train_loss": -43.3360710144043, "global_step": 355899, "epoch": 2941} {"train_loss": -43.504241943359375, "global_step": 355900, "epoch": 2941} {"train_loss": -43.97400665283203, "global_step": 355901, "epoch": 2941} {"train_loss": -43.32734298706055, "global_step": 355902, "epoch": 2941} {"train_loss": -44.201168060302734, "global_step": 355903, "epoch": 2941} {"train_loss": -43.1656379699707, "global_step": 355904, "epoch": 2941} {"train_loss": -43.737083435058594, "global_step": 355905, "epoch": 2941} {"train_loss": -43.78862380981445, "global_step": 355906, "epoch": 2941} {"train_loss": -44.155452728271484, "global_step": 355907, "epoch": 2941} {"train_loss": -44.351131439208984, "global_step": 355908, "epoch": 2941} {"train_loss": -44.42253494262695, "global_step": 355909, "epoch": 2941} {"train_loss": -44.607601165771484, "global_step": 355910, "epoch": 2941} {"train_loss": -44.8499870300293, "global_step": 355911, "epoch": 2941} {"train_loss": -44.79839324951172, "global_step": 355912, "epoch": 2941} {"train_loss": -44.73411178588867, "global_step": 355913, "epoch": 2941} {"train_loss": -44.41278839111328, "global_step": 355914, "epoch": 2941} {"train_loss": -44.523284912109375, "global_step": 355915, "epoch": 2941} {"train_loss": -44.613704681396484, "global_step": 355916, "epoch": 2941} {"train_loss": -44.975223541259766, "global_step": 355917, "epoch": 2941} {"train_loss": -45.159873962402344, "global_step": 355918, "epoch": 2941} {"train_loss": -44.80080032348633, "global_step": 355919, "epoch": 2941} {"train_loss": -44.81241989135742, "global_step": 355920, "epoch": 2941} {"train_loss": -44.59416580200195, "global_step": 355921, "epoch": 2941} {"train_loss": -45.00566101074219, "global_step": 355922, "epoch": 2941} {"train_loss": -45.10753631591797, "global_step": 355923, "epoch": 2941} {"train_loss": -45.0584716796875, "global_step": 355924, "epoch": 2941} {"train_loss": -44.68006134033203, "global_step": 355925, "epoch": 2941} {"train_loss": -44.941429138183594, "global_step": 355926, "epoch": 2941} {"train_loss": -45.334754943847656, "global_step": 355927, "epoch": 2941} {"train_loss": -44.82075881958008, "global_step": 355928, "epoch": 2941} {"train_loss": -45.1350212097168, "global_step": 355929, "epoch": 2941} {"train_loss": -45.32387924194336, "global_step": 355930, "epoch": 2941} {"train_loss": -45.71672439575195, "global_step": 355931, "epoch": 2941} {"train_loss": -45.292816162109375, "global_step": 355932, "epoch": 2941} {"train_loss": -45.523475646972656, "global_step": 355933, "epoch": 2941} {"train_loss": -45.3518180847168, "global_step": 355934, "epoch": 2941} {"train_loss": -44.487525939941406, "global_step": 355935, "epoch": 2941} {"train_loss": -45.534549713134766, "global_step": 355936, "epoch": 2941} {"train_loss": -45.1088752746582, "global_step": 355937, "epoch": 2941} {"train_loss": -45.46070098876953, "global_step": 355938, "epoch": 2941} {"train_loss": -45.429561614990234, "global_step": 355939, "epoch": 2941} {"train_loss": -45.23114013671875, "global_step": 355940, "epoch": 2941} {"train_loss": -45.857913970947266, "global_step": 355941, "epoch": 2941} {"train_loss": -45.700984954833984, "global_step": 355942, "epoch": 2941} {"train_loss": -45.53121566772461, "global_step": 355943, "epoch": 2941} {"train_loss": -45.583953857421875, "global_step": 355944, "epoch": 2941} {"train_loss": -45.45216751098633, "global_step": 355945, "epoch": 2941} {"train_loss": -45.53322219848633, "global_step": 355946, "epoch": 2941} {"train_loss": -44.80992126464844, "global_step": 355947, "epoch": 2941} {"train_loss": -45.4645881652832, "global_step": 355948, "epoch": 2941} {"train_loss": -45.550636291503906, "global_step": 355949, "epoch": 2941} {"train_loss": -45.805171966552734, "global_step": 355950, "epoch": 2941} {"train_loss": -45.633235931396484, "global_step": 355951, "epoch": 2941} {"train_loss": -46.02943801879883, "global_step": 355952, "epoch": 2941} {"train_loss": -45.37175369262695, "global_step": 355953, "epoch": 2941} {"train_loss": -45.29964065551758, "global_step": 355954, "epoch": 2941} {"train_loss": -44.65488815307617, "global_step": 355955, "epoch": 2941} {"train_loss": -44.645320892333984, "global_step": 355956, "epoch": 2941} {"train_loss": -45.376434326171875, "global_step": 355957, "epoch": 2941} {"train_loss": -45.60484313964844, "global_step": 355958, "epoch": 2941} {"train_loss": -44.35491943359375, "global_step": 355959, "epoch": 2941} {"train_loss": -45.65328598022461, "global_step": 355960, "epoch": 2941} {"train_loss": -45.12962341308594, "global_step": 355961, "epoch": 2941} {"train_loss": -44.63472366333008, "global_step": 355962, "epoch": 2941} {"train_loss": -45.7404899597168, "global_step": 355963, "epoch": 2941} {"train_loss": -45.022151947021484, "global_step": 355964, "epoch": 2941} {"train_loss": -44.60187911987305, "global_step": 355965, "epoch": 2941} {"train_loss": -45.4488525390625, "global_step": 355966, "epoch": 2941} {"train_loss": -44.644256591796875, "global_step": 355967, "epoch": 2941} {"train_loss": -45.472808837890625, "global_step": 355968, "epoch": 2941} {"train_loss": -45.72047424316406, "global_step": 355969, "epoch": 2941} {"train_loss": -44.96043014526367, "global_step": 355970, "epoch": 2941} {"train_loss": -42.98197555541992, "global_step": 355971, "epoch": 2941} {"train_loss": -44.97616195678711, "global_step": 355972, "epoch": 2941} {"train_loss": -44.74071502685547, "global_step": 355973, "epoch": 2941} {"train_loss": -44.1766357421875, "global_step": 355974, "epoch": 2941} {"train_loss": -44.62960433959961, "global_step": 355975, "epoch": 2941} {"train_loss": -45.1397590637207, "global_step": 355976, "epoch": 2941} {"train_loss": -45.58113098144531, "global_step": 355977, "epoch": 2941} {"train_loss": -45.752742767333984, "global_step": 355978, "epoch": 2941} {"train_loss": -45.60272979736328, "global_step": 355979, "epoch": 2941} {"train_loss": -45.83454513549805, "global_step": 355980, "epoch": 2941} {"train_loss": -43.62075228730509, "global_step": 355981, "epoch": 2941, "val_loss": 2573840.0} {"train_loss": -45.162681579589844, "global_step": 355982, "epoch": 2942} {"train_loss": -44.70020294189453, "global_step": 355983, "epoch": 2942} {"train_loss": -45.523040771484375, "global_step": 355984, "epoch": 2942} {"train_loss": -45.20671081542969, "global_step": 355985, "epoch": 2942} {"train_loss": -44.766822814941406, "global_step": 355986, "epoch": 2942} {"train_loss": -44.945106506347656, "global_step": 355987, "epoch": 2942} {"train_loss": -45.504234313964844, "global_step": 355988, "epoch": 2942} {"train_loss": -45.29999923706055, "global_step": 355989, "epoch": 2942} {"train_loss": -45.32009506225586, "global_step": 355990, "epoch": 2942} {"train_loss": -44.081275939941406, "global_step": 355991, "epoch": 2942} {"train_loss": -45.24334716796875, "global_step": 355992, "epoch": 2942} {"train_loss": -45.17653274536133, "global_step": 355993, "epoch": 2942} {"train_loss": -44.23862838745117, "global_step": 355994, "epoch": 2942} {"train_loss": -43.122039794921875, "global_step": 355995, "epoch": 2942} {"train_loss": -45.28866195678711, "global_step": 355996, "epoch": 2942} {"train_loss": -43.83684158325195, "global_step": 355997, "epoch": 2942} {"train_loss": -41.57401657104492, "global_step": 355998, "epoch": 2942} {"train_loss": -44.64280700683594, "global_step": 355999, "epoch": 2942} {"train_loss": -44.627593994140625, "global_step": 356000, "epoch": 2942} {"train_loss": -41.53733444213867, "global_step": 356001, "epoch": 2942} {"train_loss": -42.94137191772461, "global_step": 356002, "epoch": 2942} {"train_loss": -44.15731430053711, "global_step": 356003, "epoch": 2942} {"train_loss": -44.063961029052734, "global_step": 356004, "epoch": 2942} {"train_loss": -42.542118072509766, "global_step": 356005, "epoch": 2942} {"train_loss": -41.210330963134766, "global_step": 356006, "epoch": 2942} {"train_loss": -44.608062744140625, "global_step": 356007, "epoch": 2942} {"train_loss": -43.42470932006836, "global_step": 356008, "epoch": 2942} {"train_loss": -43.16765213012695, "global_step": 356009, "epoch": 2942} {"train_loss": -44.4115104675293, "global_step": 356010, "epoch": 2942} {"train_loss": -42.78202438354492, "global_step": 356011, "epoch": 2942} {"train_loss": -43.37908935546875, "global_step": 356012, "epoch": 2942} {"train_loss": -43.09784698486328, "global_step": 356013, "epoch": 2942} {"train_loss": -43.473140716552734, "global_step": 356014, "epoch": 2942} {"train_loss": -43.92112731933594, "global_step": 356015, "epoch": 2942} {"train_loss": -43.777191162109375, "global_step": 356016, "epoch": 2942} {"train_loss": -43.7491340637207, "global_step": 356017, "epoch": 2942} {"train_loss": -45.035682678222656, "global_step": 356018, "epoch": 2942} {"train_loss": -44.500240325927734, "global_step": 356019, "epoch": 2942} {"train_loss": -44.24027633666992, "global_step": 356020, "epoch": 2942} {"train_loss": -44.169342041015625, "global_step": 356021, "epoch": 2942} {"train_loss": -44.56589889526367, "global_step": 356022, "epoch": 2942} {"train_loss": -43.83182144165039, "global_step": 356023, "epoch": 2942} {"train_loss": -44.816097259521484, "global_step": 356024, "epoch": 2942} {"train_loss": -43.905757904052734, "global_step": 356025, "epoch": 2942} {"train_loss": -44.97769546508789, "global_step": 356026, "epoch": 2942} {"train_loss": -44.48569107055664, "global_step": 356027, "epoch": 2942} {"train_loss": -45.0977668762207, "global_step": 356028, "epoch": 2942} {"train_loss": -44.62811279296875, "global_step": 356029, "epoch": 2942} {"train_loss": -44.56447219848633, "global_step": 356030, "epoch": 2942} {"train_loss": -45.506568908691406, "global_step": 356031, "epoch": 2942} {"train_loss": -44.02375411987305, "global_step": 356032, "epoch": 2942} {"train_loss": -44.98650360107422, "global_step": 356033, "epoch": 2942} {"train_loss": -45.08803939819336, "global_step": 356034, "epoch": 2942} {"train_loss": -44.68507385253906, "global_step": 356035, "epoch": 2942} {"train_loss": -45.3861083984375, "global_step": 356036, "epoch": 2942} {"train_loss": -45.021976470947266, "global_step": 356037, "epoch": 2942} {"train_loss": -45.20760726928711, "global_step": 356038, "epoch": 2942} {"train_loss": -45.23707962036133, "global_step": 356039, "epoch": 2942} {"train_loss": -44.88496017456055, "global_step": 356040, "epoch": 2942} {"train_loss": -45.653411865234375, "global_step": 356041, "epoch": 2942} {"train_loss": -45.42252731323242, "global_step": 356042, "epoch": 2942} {"train_loss": -45.62818908691406, "global_step": 356043, "epoch": 2942} {"train_loss": -45.35523223876953, "global_step": 356044, "epoch": 2942} {"train_loss": -45.171295166015625, "global_step": 356045, "epoch": 2942} {"train_loss": -45.730403900146484, "global_step": 356046, "epoch": 2942} {"train_loss": -44.767616271972656, "global_step": 356047, "epoch": 2942} {"train_loss": -45.03474044799805, "global_step": 356048, "epoch": 2942} {"train_loss": -45.881282806396484, "global_step": 356049, "epoch": 2942} {"train_loss": -45.85232925415039, "global_step": 356050, "epoch": 2942} {"train_loss": -45.55585479736328, "global_step": 356051, "epoch": 2942} {"train_loss": -45.23736572265625, "global_step": 356052, "epoch": 2942} {"train_loss": -45.732784271240234, "global_step": 356053, "epoch": 2942} {"train_loss": -45.907806396484375, "global_step": 356054, "epoch": 2942} {"train_loss": -46.030517578125, "global_step": 356055, "epoch": 2942} {"train_loss": -45.42560958862305, "global_step": 356056, "epoch": 2942} {"train_loss": -45.21979904174805, "global_step": 356057, "epoch": 2942} {"train_loss": -45.28620147705078, "global_step": 356058, "epoch": 2942} {"train_loss": -45.693756103515625, "global_step": 356059, "epoch": 2942} {"train_loss": -45.426475524902344, "global_step": 356060, "epoch": 2942} {"train_loss": -44.641056060791016, "global_step": 356061, "epoch": 2942} {"train_loss": -46.02235794067383, "global_step": 356062, "epoch": 2942} {"train_loss": -44.74125289916992, "global_step": 356063, "epoch": 2942} {"train_loss": -45.43876266479492, "global_step": 356064, "epoch": 2942} {"train_loss": -45.57832717895508, "global_step": 356065, "epoch": 2942} {"train_loss": -45.14262771606445, "global_step": 356066, "epoch": 2942} {"train_loss": -44.674537658691406, "global_step": 356067, "epoch": 2942} {"train_loss": -45.19356155395508, "global_step": 356068, "epoch": 2942} {"train_loss": -44.3586540222168, "global_step": 356069, "epoch": 2942} {"train_loss": -44.23556137084961, "global_step": 356070, "epoch": 2942} {"train_loss": -45.750343322753906, "global_step": 356071, "epoch": 2942} {"train_loss": -44.99934768676758, "global_step": 356072, "epoch": 2942} {"train_loss": -42.917720794677734, "global_step": 356073, "epoch": 2942} {"train_loss": -43.53511428833008, "global_step": 356074, "epoch": 2942} {"train_loss": -44.6439323425293, "global_step": 356075, "epoch": 2942} {"train_loss": -44.29146194458008, "global_step": 356076, "epoch": 2942} {"train_loss": -42.33264923095703, "global_step": 356077, "epoch": 2942} {"train_loss": -42.222782135009766, "global_step": 356078, "epoch": 2942} {"train_loss": -43.486324310302734, "global_step": 356079, "epoch": 2942} {"train_loss": -43.696170806884766, "global_step": 356080, "epoch": 2942} {"train_loss": -43.4194221496582, "global_step": 356081, "epoch": 2942} {"train_loss": -42.80479049682617, "global_step": 356082, "epoch": 2942} {"train_loss": -42.43473434448242, "global_step": 356083, "epoch": 2942} {"train_loss": -42.62929916381836, "global_step": 356084, "epoch": 2942} {"train_loss": -43.81332015991211, "global_step": 356085, "epoch": 2942} {"train_loss": -40.03807067871094, "global_step": 356086, "epoch": 2942} {"train_loss": -43.67110061645508, "global_step": 356087, "epoch": 2942} {"train_loss": -40.6174201965332, "global_step": 356088, "epoch": 2942} {"train_loss": -38.809959411621094, "global_step": 356089, "epoch": 2942} {"train_loss": -42.89085006713867, "global_step": 356090, "epoch": 2942} {"train_loss": -38.373756408691406, "global_step": 356091, "epoch": 2942} {"train_loss": -38.63669967651367, "global_step": 356092, "epoch": 2942} {"train_loss": -42.84944534301758, "global_step": 356093, "epoch": 2942} {"train_loss": -39.39628982543945, "global_step": 356094, "epoch": 2942} {"train_loss": -40.420406341552734, "global_step": 356095, "epoch": 2942} {"train_loss": -38.122676849365234, "global_step": 356096, "epoch": 2942} {"train_loss": -43.54026412963867, "global_step": 356097, "epoch": 2942} {"train_loss": -38.37531280517578, "global_step": 356098, "epoch": 2942} {"train_loss": -39.07499313354492, "global_step": 356099, "epoch": 2942} {"train_loss": -39.37827682495117, "global_step": 356100, "epoch": 2942} {"train_loss": -41.988216400146484, "global_step": 356101, "epoch": 2942} {"train_loss": -43.88944326353467, "global_step": 356102, "epoch": 2942, "val_loss": 2557340.75} {"train_loss": -39.51811981201172, "global_step": 356103, "epoch": 2943} {"train_loss": -41.30305862426758, "global_step": 356104, "epoch": 2943} {"train_loss": -39.13359451293945, "global_step": 356105, "epoch": 2943} {"train_loss": -37.200897216796875, "global_step": 356106, "epoch": 2943} {"train_loss": -21.516521453857422, "global_step": 356107, "epoch": 2943} {"train_loss": -39.017391204833984, "global_step": 356108, "epoch": 2943} {"train_loss": -38.529232025146484, "global_step": 356109, "epoch": 2943} {"train_loss": -37.12925338745117, "global_step": 356110, "epoch": 2943} {"train_loss": -39.35640335083008, "global_step": 356111, "epoch": 2943} {"train_loss": -38.57895278930664, "global_step": 356112, "epoch": 2943} {"train_loss": -37.43842697143555, "global_step": 356113, "epoch": 2943} {"train_loss": -37.005550384521484, "global_step": 356114, "epoch": 2943} {"train_loss": -39.098907470703125, "global_step": 356115, "epoch": 2943} {"train_loss": -41.09120559692383, "global_step": 356116, "epoch": 2943} {"train_loss": -36.60820770263672, "global_step": 356117, "epoch": 2943} {"train_loss": -31.754058837890625, "global_step": 356118, "epoch": 2943} {"train_loss": -39.663448333740234, "global_step": 356119, "epoch": 2943} {"train_loss": -40.07736587524414, "global_step": 356120, "epoch": 2943} {"train_loss": -41.075050354003906, "global_step": 356121, "epoch": 2943} {"train_loss": -34.473121643066406, "global_step": 356122, "epoch": 2943} {"train_loss": -41.91260528564453, "global_step": 356123, "epoch": 2943} {"train_loss": -40.0468864440918, "global_step": 356124, "epoch": 2943} {"train_loss": -39.9523811340332, "global_step": 356125, "epoch": 2943} {"train_loss": -41.629329681396484, "global_step": 356126, "epoch": 2943} {"train_loss": -41.28300857543945, "global_step": 356127, "epoch": 2943} {"train_loss": -40.38220977783203, "global_step": 356128, "epoch": 2943} {"train_loss": -42.20357131958008, "global_step": 356129, "epoch": 2943} {"train_loss": -41.175411224365234, "global_step": 356130, "epoch": 2943} {"train_loss": -42.059383392333984, "global_step": 356131, "epoch": 2943} {"train_loss": -42.04274368286133, "global_step": 356132, "epoch": 2943} {"train_loss": -42.2149772644043, "global_step": 356133, "epoch": 2943} {"train_loss": -41.89419174194336, "global_step": 356134, "epoch": 2943} {"train_loss": -41.942867279052734, "global_step": 356135, "epoch": 2943} {"train_loss": -42.5655517578125, "global_step": 356136, "epoch": 2943} {"train_loss": -42.865840911865234, "global_step": 356137, "epoch": 2943} {"train_loss": -41.081295013427734, "global_step": 356138, "epoch": 2943} {"train_loss": -41.9703254699707, "global_step": 356139, "epoch": 2943} {"train_loss": -43.121368408203125, "global_step": 356140, "epoch": 2943} {"train_loss": -42.51142501831055, "global_step": 356141, "epoch": 2943} {"train_loss": -43.25756072998047, "global_step": 356142, "epoch": 2943} {"train_loss": -41.86594772338867, "global_step": 356143, "epoch": 2943} {"train_loss": -42.65118408203125, "global_step": 356144, "epoch": 2943} {"train_loss": -43.394222259521484, "global_step": 356145, "epoch": 2943} {"train_loss": -43.6735725402832, "global_step": 356146, "epoch": 2943} {"train_loss": -43.31423568725586, "global_step": 356147, "epoch": 2943} {"train_loss": -42.984893798828125, "global_step": 356148, "epoch": 2943} {"train_loss": -42.87594985961914, "global_step": 356149, "epoch": 2943} {"train_loss": -42.80454635620117, "global_step": 356150, "epoch": 2943} {"train_loss": -43.78546142578125, "global_step": 356151, "epoch": 2943} {"train_loss": -43.50706100463867, "global_step": 356152, "epoch": 2943} {"train_loss": -43.08460998535156, "global_step": 356153, "epoch": 2943} {"train_loss": -40.45192337036133, "global_step": 356154, "epoch": 2943} {"train_loss": -43.450862884521484, "global_step": 356155, "epoch": 2943} {"train_loss": -43.872154235839844, "global_step": 356156, "epoch": 2943} {"train_loss": -43.84891891479492, "global_step": 356157, "epoch": 2943} {"train_loss": -42.95893478393555, "global_step": 356158, "epoch": 2943} {"train_loss": -43.80308151245117, "global_step": 356159, "epoch": 2943} {"train_loss": -43.6647834777832, "global_step": 356160, "epoch": 2943} {"train_loss": -44.177581787109375, "global_step": 356161, "epoch": 2943} {"train_loss": -43.29835891723633, "global_step": 356162, "epoch": 2943} {"train_loss": -42.802886962890625, "global_step": 356163, "epoch": 2943} {"train_loss": -43.084957122802734, "global_step": 356164, "epoch": 2943} {"train_loss": -44.34761428833008, "global_step": 356165, "epoch": 2943} {"train_loss": -43.78369140625, "global_step": 356166, "epoch": 2943} {"train_loss": -44.336456298828125, "global_step": 356167, "epoch": 2943} {"train_loss": -44.07027053833008, "global_step": 356168, "epoch": 2943} {"train_loss": -43.72792434692383, "global_step": 356169, "epoch": 2943} {"train_loss": -43.2889518737793, "global_step": 356170, "epoch": 2943} {"train_loss": -41.922603607177734, "global_step": 356171, "epoch": 2943} {"train_loss": -44.67600631713867, "global_step": 356172, "epoch": 2943} {"train_loss": -44.477630615234375, "global_step": 356173, "epoch": 2943} {"train_loss": -44.07080841064453, "global_step": 356174, "epoch": 2943} {"train_loss": -44.41010665893555, "global_step": 356175, "epoch": 2943} {"train_loss": -45.14631271362305, "global_step": 356176, "epoch": 2943} {"train_loss": -44.34878158569336, "global_step": 356177, "epoch": 2943} {"train_loss": -44.294132232666016, "global_step": 356178, "epoch": 2943} {"train_loss": -44.30939483642578, "global_step": 356179, "epoch": 2943} {"train_loss": -44.38578796386719, "global_step": 356180, "epoch": 2943} {"train_loss": -44.50916290283203, "global_step": 356181, "epoch": 2943} {"train_loss": -45.31959915161133, "global_step": 356182, "epoch": 2943} {"train_loss": -45.0550537109375, "global_step": 356183, "epoch": 2943} {"train_loss": -44.55233383178711, "global_step": 356184, "epoch": 2943} {"train_loss": -44.325469970703125, "global_step": 356185, "epoch": 2943} {"train_loss": -45.2999267578125, "global_step": 356186, "epoch": 2943} {"train_loss": -44.61151885986328, "global_step": 356187, "epoch": 2943} {"train_loss": -44.97007751464844, "global_step": 356188, "epoch": 2943} {"train_loss": -43.358489990234375, "global_step": 356189, "epoch": 2943} {"train_loss": -45.003421783447266, "global_step": 356190, "epoch": 2943} {"train_loss": -45.00556182861328, "global_step": 356191, "epoch": 2943} {"train_loss": -43.8878059387207, "global_step": 356192, "epoch": 2943} {"train_loss": -45.11812210083008, "global_step": 356193, "epoch": 2943} {"train_loss": -45.42414093017578, "global_step": 356194, "epoch": 2943} {"train_loss": -44.738136291503906, "global_step": 356195, "epoch": 2943} {"train_loss": -44.975894927978516, "global_step": 356196, "epoch": 2943} {"train_loss": -44.67290496826172, "global_step": 356197, "epoch": 2943} {"train_loss": -45.21904754638672, "global_step": 356198, "epoch": 2943} {"train_loss": -44.56178665161133, "global_step": 356199, "epoch": 2943} {"train_loss": -44.090023040771484, "global_step": 356200, "epoch": 2943} {"train_loss": -44.872249603271484, "global_step": 356201, "epoch": 2943} {"train_loss": -44.654781341552734, "global_step": 356202, "epoch": 2943} {"train_loss": -45.25724792480469, "global_step": 356203, "epoch": 2943} {"train_loss": -45.07379150390625, "global_step": 356204, "epoch": 2943} {"train_loss": -43.90985870361328, "global_step": 356205, "epoch": 2943} {"train_loss": -43.77278518676758, "global_step": 356206, "epoch": 2943} {"train_loss": -43.58616256713867, "global_step": 356207, "epoch": 2943} {"train_loss": -43.684200286865234, "global_step": 356208, "epoch": 2943} {"train_loss": -45.12636184692383, "global_step": 356209, "epoch": 2943} {"train_loss": -44.754852294921875, "global_step": 356210, "epoch": 2943} {"train_loss": -43.046165466308594, "global_step": 356211, "epoch": 2943} {"train_loss": -45.17918014526367, "global_step": 356212, "epoch": 2943} {"train_loss": -44.450984954833984, "global_step": 356213, "epoch": 2943} {"train_loss": -44.68772888183594, "global_step": 356214, "epoch": 2943} {"train_loss": -44.469146728515625, "global_step": 356215, "epoch": 2943} {"train_loss": -43.86776351928711, "global_step": 356216, "epoch": 2943} {"train_loss": -44.5053825378418, "global_step": 356217, "epoch": 2943} {"train_loss": -45.21693420410156, "global_step": 356218, "epoch": 2943} {"train_loss": -44.189208984375, "global_step": 356219, "epoch": 2943} {"train_loss": -44.11924362182617, "global_step": 356220, "epoch": 2943} {"train_loss": -44.204769134521484, "global_step": 356221, "epoch": 2943} {"train_loss": -44.7334098815918, "global_step": 356222, "epoch": 2943} {"train_loss": -42.613910706575254, "global_step": 356223, "epoch": 2943, "val_loss": 2450853.75} {"train_loss": -45.07981491088867, "global_step": 356224, "epoch": 2944} {"train_loss": -44.022491455078125, "global_step": 356225, "epoch": 2944} {"train_loss": -43.17570114135742, "global_step": 356226, "epoch": 2944} {"train_loss": -43.14531707763672, "global_step": 356227, "epoch": 2944} {"train_loss": -42.5561637878418, "global_step": 356228, "epoch": 2944} {"train_loss": -44.37553024291992, "global_step": 356229, "epoch": 2944} {"train_loss": -44.08511734008789, "global_step": 356230, "epoch": 2944} {"train_loss": -45.497901916503906, "global_step": 356231, "epoch": 2944} {"train_loss": -45.090232849121094, "global_step": 356232, "epoch": 2944} {"train_loss": -44.34830856323242, "global_step": 356233, "epoch": 2944} {"train_loss": -44.29632568359375, "global_step": 356234, "epoch": 2944} {"train_loss": -44.93208694458008, "global_step": 356235, "epoch": 2944} {"train_loss": -43.80747985839844, "global_step": 356236, "epoch": 2944} {"train_loss": -45.53701400756836, "global_step": 356237, "epoch": 2944} {"train_loss": -44.3548698425293, "global_step": 356238, "epoch": 2944} {"train_loss": -42.97370529174805, "global_step": 356239, "epoch": 2944} {"train_loss": -41.75350570678711, "global_step": 356240, "epoch": 2944} {"train_loss": -43.80725860595703, "global_step": 356241, "epoch": 2944} {"train_loss": -44.90829086303711, "global_step": 356242, "epoch": 2944} {"train_loss": -43.84674835205078, "global_step": 356243, "epoch": 2944} {"train_loss": -45.31742477416992, "global_step": 356244, "epoch": 2944} {"train_loss": -44.059268951416016, "global_step": 356245, "epoch": 2944} {"train_loss": -41.799678802490234, "global_step": 356246, "epoch": 2944} {"train_loss": -43.25608444213867, "global_step": 356247, "epoch": 2944} {"train_loss": -43.7085075378418, "global_step": 356248, "epoch": 2944} {"train_loss": -42.1678466796875, "global_step": 356249, "epoch": 2944} {"train_loss": -44.710933685302734, "global_step": 356250, "epoch": 2944} {"train_loss": -42.063838958740234, "global_step": 356251, "epoch": 2944} {"train_loss": -42.985565185546875, "global_step": 356252, "epoch": 2944} {"train_loss": -44.10061264038086, "global_step": 356253, "epoch": 2944} {"train_loss": -41.3470573425293, "global_step": 356254, "epoch": 2944} {"train_loss": -44.156185150146484, "global_step": 356255, "epoch": 2944} {"train_loss": -39.10234451293945, "global_step": 356256, "epoch": 2944} {"train_loss": -43.65589904785156, "global_step": 356257, "epoch": 2944} {"train_loss": -38.376068115234375, "global_step": 356258, "epoch": 2944} {"train_loss": -38.49235916137695, "global_step": 356259, "epoch": 2944} {"train_loss": -37.685638427734375, "global_step": 356260, "epoch": 2944} {"train_loss": -39.13639831542969, "global_step": 356261, "epoch": 2944} {"train_loss": -39.494476318359375, "global_step": 356262, "epoch": 2944} {"train_loss": -41.34941482543945, "global_step": 356263, "epoch": 2944} {"train_loss": -40.54743194580078, "global_step": 356264, "epoch": 2944} {"train_loss": -39.415016174316406, "global_step": 356265, "epoch": 2944} {"train_loss": -40.659645080566406, "global_step": 356266, "epoch": 2944} {"train_loss": -41.711036682128906, "global_step": 356267, "epoch": 2944} {"train_loss": -40.95393371582031, "global_step": 356268, "epoch": 2944} {"train_loss": -42.5748405456543, "global_step": 356269, "epoch": 2944} {"train_loss": -43.38630294799805, "global_step": 356270, "epoch": 2944} {"train_loss": -43.166656494140625, "global_step": 356271, "epoch": 2944} {"train_loss": -43.415138244628906, "global_step": 356272, "epoch": 2944} {"train_loss": -42.40261459350586, "global_step": 356273, "epoch": 2944} {"train_loss": -42.84065628051758, "global_step": 356274, "epoch": 2944} {"train_loss": -42.84397506713867, "global_step": 356275, "epoch": 2944} {"train_loss": -42.95756149291992, "global_step": 356276, "epoch": 2944} {"train_loss": -41.14887619018555, "global_step": 356277, "epoch": 2944} {"train_loss": -43.62751388549805, "global_step": 356278, "epoch": 2944} {"train_loss": -43.69926071166992, "global_step": 356279, "epoch": 2944} {"train_loss": -42.95671463012695, "global_step": 356280, "epoch": 2944} {"train_loss": -41.4615364074707, "global_step": 356281, "epoch": 2944} {"train_loss": -42.162418365478516, "global_step": 356282, "epoch": 2944} {"train_loss": -43.60394287109375, "global_step": 356283, "epoch": 2944} {"train_loss": -42.98971176147461, "global_step": 356284, "epoch": 2944} {"train_loss": -42.540870666503906, "global_step": 356285, "epoch": 2944} {"train_loss": -44.03517532348633, "global_step": 356286, "epoch": 2944} {"train_loss": -43.139991760253906, "global_step": 356287, "epoch": 2944} {"train_loss": -42.6336555480957, "global_step": 356288, "epoch": 2944} {"train_loss": -43.54235076904297, "global_step": 356289, "epoch": 2944} {"train_loss": -44.4537353515625, "global_step": 356290, "epoch": 2944} {"train_loss": -43.203369140625, "global_step": 356291, "epoch": 2944} {"train_loss": -43.7155876159668, "global_step": 356292, "epoch": 2944} {"train_loss": -44.24358367919922, "global_step": 356293, "epoch": 2944} {"train_loss": -44.08677291870117, "global_step": 356294, "epoch": 2944} {"train_loss": -43.731075286865234, "global_step": 356295, "epoch": 2944} {"train_loss": -44.08589172363281, "global_step": 356296, "epoch": 2944} {"train_loss": -44.17790985107422, "global_step": 356297, "epoch": 2944} {"train_loss": -43.281288146972656, "global_step": 356298, "epoch": 2944} {"train_loss": -44.51667404174805, "global_step": 356299, "epoch": 2944} {"train_loss": -43.30062484741211, "global_step": 356300, "epoch": 2944} {"train_loss": -44.4290657043457, "global_step": 356301, "epoch": 2944} {"train_loss": -43.94807052612305, "global_step": 356302, "epoch": 2944} {"train_loss": -43.40974044799805, "global_step": 356303, "epoch": 2944} {"train_loss": -44.34954833984375, "global_step": 356304, "epoch": 2944} {"train_loss": -44.40757369995117, "global_step": 356305, "epoch": 2944} {"train_loss": -44.56136703491211, "global_step": 356306, "epoch": 2944} {"train_loss": -44.499027252197266, "global_step": 356307, "epoch": 2944} {"train_loss": -42.50138473510742, "global_step": 356308, "epoch": 2944} {"train_loss": -44.31366729736328, "global_step": 356309, "epoch": 2944} {"train_loss": -44.155826568603516, "global_step": 356310, "epoch": 2944} {"train_loss": -43.57198715209961, "global_step": 356311, "epoch": 2944} {"train_loss": -44.43367004394531, "global_step": 356312, "epoch": 2944} {"train_loss": -43.38267135620117, "global_step": 356313, "epoch": 2944} {"train_loss": -44.13519287109375, "global_step": 356314, "epoch": 2944} {"train_loss": -45.224735260009766, "global_step": 356315, "epoch": 2944} {"train_loss": -43.03569030761719, "global_step": 356316, "epoch": 2944} {"train_loss": -44.62346267700195, "global_step": 356317, "epoch": 2944} {"train_loss": -44.299190521240234, "global_step": 356318, "epoch": 2944} {"train_loss": -44.76548385620117, "global_step": 356319, "epoch": 2944} {"train_loss": -44.529903411865234, "global_step": 356320, "epoch": 2944} {"train_loss": -44.79865264892578, "global_step": 356321, "epoch": 2944} {"train_loss": -44.835113525390625, "global_step": 356322, "epoch": 2944} {"train_loss": -44.23917770385742, "global_step": 356323, "epoch": 2944} {"train_loss": -44.993412017822266, "global_step": 356324, "epoch": 2944} {"train_loss": -44.327449798583984, "global_step": 356325, "epoch": 2944} {"train_loss": -44.24663162231445, "global_step": 356326, "epoch": 2944} {"train_loss": -45.30141830444336, "global_step": 356327, "epoch": 2944} {"train_loss": -45.23298263549805, "global_step": 356328, "epoch": 2944} {"train_loss": -44.90932083129883, "global_step": 356329, "epoch": 2944} {"train_loss": -45.129493713378906, "global_step": 356330, "epoch": 2944} {"train_loss": -45.05097579956055, "global_step": 356331, "epoch": 2944} {"train_loss": -44.25860595703125, "global_step": 356332, "epoch": 2944} {"train_loss": -44.44465255737305, "global_step": 356333, "epoch": 2944} {"train_loss": -45.3434944152832, "global_step": 356334, "epoch": 2944} {"train_loss": -44.54801940917969, "global_step": 356335, "epoch": 2944} {"train_loss": -44.810302734375, "global_step": 356336, "epoch": 2944} {"train_loss": -44.944400787353516, "global_step": 356337, "epoch": 2944} {"train_loss": -45.02607727050781, "global_step": 356338, "epoch": 2944} {"train_loss": -44.41462326049805, "global_step": 356339, "epoch": 2944} {"train_loss": -43.699745178222656, "global_step": 356340, "epoch": 2944} {"train_loss": -44.98444747924805, "global_step": 356341, "epoch": 2944} {"train_loss": -43.119380950927734, "global_step": 356342, "epoch": 2944} {"train_loss": -43.99613571166992, "global_step": 356343, "epoch": 2944} {"train_loss": -43.47327574422537, "global_step": 356344, "epoch": 2944, "val_loss": 2442458.0} {"train_loss": -42.825374603271484, "global_step": 356345, "epoch": 2945} {"train_loss": -44.449378967285156, "global_step": 356346, "epoch": 2945} {"train_loss": -41.8487548828125, "global_step": 356347, "epoch": 2945} {"train_loss": -44.34907150268555, "global_step": 356348, "epoch": 2945} {"train_loss": -44.24695587158203, "global_step": 356349, "epoch": 2945} {"train_loss": -43.369544982910156, "global_step": 356350, "epoch": 2945} {"train_loss": -43.88935852050781, "global_step": 356351, "epoch": 2945} {"train_loss": -43.678497314453125, "global_step": 356352, "epoch": 2945} {"train_loss": -44.953426361083984, "global_step": 356353, "epoch": 2945} {"train_loss": -43.99245071411133, "global_step": 356354, "epoch": 2945} {"train_loss": -45.48274230957031, "global_step": 356355, "epoch": 2945} {"train_loss": -44.20600509643555, "global_step": 356356, "epoch": 2945} {"train_loss": -42.95405960083008, "global_step": 356357, "epoch": 2945} {"train_loss": -44.571529388427734, "global_step": 356358, "epoch": 2945} {"train_loss": -44.739925384521484, "global_step": 356359, "epoch": 2945} {"train_loss": -44.369232177734375, "global_step": 356360, "epoch": 2945} {"train_loss": -44.92470169067383, "global_step": 356361, "epoch": 2945} {"train_loss": -44.30466079711914, "global_step": 356362, "epoch": 2945} {"train_loss": -44.9561653137207, "global_step": 356363, "epoch": 2945} {"train_loss": -44.74127197265625, "global_step": 356364, "epoch": 2945} {"train_loss": -45.03736114501953, "global_step": 356365, "epoch": 2945} {"train_loss": -45.312400817871094, "global_step": 356366, "epoch": 2945} {"train_loss": -44.50052261352539, "global_step": 356367, "epoch": 2945} {"train_loss": -44.77785110473633, "global_step": 356368, "epoch": 2945} {"train_loss": -44.92620086669922, "global_step": 356369, "epoch": 2945} {"train_loss": -44.95458984375, "global_step": 356370, "epoch": 2945} {"train_loss": -45.57442092895508, "global_step": 356371, "epoch": 2945} {"train_loss": -44.448097229003906, "global_step": 356372, "epoch": 2945} {"train_loss": -45.22587585449219, "global_step": 356373, "epoch": 2945} {"train_loss": -45.26227951049805, "global_step": 356374, "epoch": 2945} {"train_loss": -44.8783073425293, "global_step": 356375, "epoch": 2945} {"train_loss": -45.62746810913086, "global_step": 356376, "epoch": 2945} {"train_loss": -45.01792907714844, "global_step": 356377, "epoch": 2945} {"train_loss": -45.34495544433594, "global_step": 356378, "epoch": 2945} {"train_loss": -45.19880294799805, "global_step": 356379, "epoch": 2945} {"train_loss": -45.43853759765625, "global_step": 356380, "epoch": 2945} {"train_loss": -45.43050003051758, "global_step": 356381, "epoch": 2945} {"train_loss": -45.895294189453125, "global_step": 356382, "epoch": 2945} {"train_loss": -45.76094436645508, "global_step": 356383, "epoch": 2945} {"train_loss": -44.9824104309082, "global_step": 356384, "epoch": 2945} {"train_loss": -44.945274353027344, "global_step": 356385, "epoch": 2945} {"train_loss": -45.72014236450195, "global_step": 356386, "epoch": 2945} {"train_loss": -44.36721420288086, "global_step": 356387, "epoch": 2945} {"train_loss": -44.433013916015625, "global_step": 356388, "epoch": 2945} {"train_loss": -45.11574172973633, "global_step": 356389, "epoch": 2945} {"train_loss": -45.62757110595703, "global_step": 356390, "epoch": 2945} {"train_loss": -45.40325927734375, "global_step": 356391, "epoch": 2945} {"train_loss": -45.023155212402344, "global_step": 356392, "epoch": 2945} {"train_loss": -45.44916534423828, "global_step": 356393, "epoch": 2945} {"train_loss": -45.2710075378418, "global_step": 356394, "epoch": 2945} {"train_loss": -45.021541595458984, "global_step": 356395, "epoch": 2945} {"train_loss": -45.442115783691406, "global_step": 356396, "epoch": 2945} {"train_loss": -45.53045654296875, "global_step": 356397, "epoch": 2945} {"train_loss": -44.21266174316406, "global_step": 356398, "epoch": 2945} {"train_loss": -43.41217803955078, "global_step": 356399, "epoch": 2945} {"train_loss": -44.8287239074707, "global_step": 356400, "epoch": 2945} {"train_loss": -42.79011917114258, "global_step": 356401, "epoch": 2945} {"train_loss": -40.22251510620117, "global_step": 356402, "epoch": 2945} {"train_loss": -41.73911666870117, "global_step": 356403, "epoch": 2945} {"train_loss": -43.11799240112305, "global_step": 356404, "epoch": 2945} {"train_loss": -41.104129791259766, "global_step": 356405, "epoch": 2945} {"train_loss": -42.36906814575195, "global_step": 356406, "epoch": 2945} {"train_loss": -40.67271041870117, "global_step": 356407, "epoch": 2945} {"train_loss": -43.13495635986328, "global_step": 356408, "epoch": 2945} {"train_loss": -40.20955276489258, "global_step": 356409, "epoch": 2945} {"train_loss": -42.10171127319336, "global_step": 356410, "epoch": 2945} {"train_loss": -39.044227600097656, "global_step": 356411, "epoch": 2945} {"train_loss": -44.04852294921875, "global_step": 356412, "epoch": 2945} {"train_loss": -41.956722259521484, "global_step": 356413, "epoch": 2945} {"train_loss": -43.41242599487305, "global_step": 356414, "epoch": 2945} {"train_loss": -39.5626106262207, "global_step": 356415, "epoch": 2945} {"train_loss": -39.47884750366211, "global_step": 356416, "epoch": 2945} {"train_loss": -40.21358871459961, "global_step": 356417, "epoch": 2945} {"train_loss": -41.63065719604492, "global_step": 356418, "epoch": 2945} {"train_loss": -39.447120666503906, "global_step": 356419, "epoch": 2945} {"train_loss": -41.9154052734375, "global_step": 356420, "epoch": 2945} {"train_loss": -40.41054153442383, "global_step": 356421, "epoch": 2945} {"train_loss": -42.16747283935547, "global_step": 356422, "epoch": 2945} {"train_loss": -41.55261993408203, "global_step": 356423, "epoch": 2945} {"train_loss": -40.90583419799805, "global_step": 356424, "epoch": 2945} {"train_loss": -42.3116340637207, "global_step": 356425, "epoch": 2945} {"train_loss": -41.42011642456055, "global_step": 356426, "epoch": 2945} {"train_loss": -42.66538619995117, "global_step": 356427, "epoch": 2945} {"train_loss": -41.918701171875, "global_step": 356428, "epoch": 2945} {"train_loss": -41.81610870361328, "global_step": 356429, "epoch": 2945} {"train_loss": -43.01130294799805, "global_step": 356430, "epoch": 2945} {"train_loss": -42.12042236328125, "global_step": 356431, "epoch": 2945} {"train_loss": -43.01857376098633, "global_step": 356432, "epoch": 2945} {"train_loss": -42.24983215332031, "global_step": 356433, "epoch": 2945} {"train_loss": -42.93395233154297, "global_step": 356434, "epoch": 2945} {"train_loss": -42.02470016479492, "global_step": 356435, "epoch": 2945} {"train_loss": -43.173980712890625, "global_step": 356436, "epoch": 2945} {"train_loss": -43.055477142333984, "global_step": 356437, "epoch": 2945} {"train_loss": -42.80745315551758, "global_step": 356438, "epoch": 2945} {"train_loss": -43.101837158203125, "global_step": 356439, "epoch": 2945} {"train_loss": -44.00810623168945, "global_step": 356440, "epoch": 2945} {"train_loss": -43.13008499145508, "global_step": 356441, "epoch": 2945} {"train_loss": -43.84971237182617, "global_step": 356442, "epoch": 2945} {"train_loss": -43.25785827636719, "global_step": 356443, "epoch": 2945} {"train_loss": -41.703407287597656, "global_step": 356444, "epoch": 2945} {"train_loss": -43.3435173034668, "global_step": 356445, "epoch": 2945} {"train_loss": -43.152748107910156, "global_step": 356446, "epoch": 2945} {"train_loss": -42.49274826049805, "global_step": 356447, "epoch": 2945} {"train_loss": -43.8348388671875, "global_step": 356448, "epoch": 2945} {"train_loss": -43.50809860229492, "global_step": 356449, "epoch": 2945} {"train_loss": -41.04659652709961, "global_step": 356450, "epoch": 2945} {"train_loss": -43.90098190307617, "global_step": 356451, "epoch": 2945} {"train_loss": -40.7301139831543, "global_step": 356452, "epoch": 2945} {"train_loss": -43.97541809082031, "global_step": 356453, "epoch": 2945} {"train_loss": -42.63859558105469, "global_step": 356454, "epoch": 2945} {"train_loss": -43.16627883911133, "global_step": 356455, "epoch": 2945} {"train_loss": -43.9032096862793, "global_step": 356456, "epoch": 2945} {"train_loss": -43.452945709228516, "global_step": 356457, "epoch": 2945} {"train_loss": -43.91978073120117, "global_step": 356458, "epoch": 2945} {"train_loss": -43.433467864990234, "global_step": 356459, "epoch": 2945} {"train_loss": -43.62589645385742, "global_step": 356460, "epoch": 2945} {"train_loss": -43.13218307495117, "global_step": 356461, "epoch": 2945} {"train_loss": -44.40454864501953, "global_step": 356462, "epoch": 2945} {"train_loss": -43.14205551147461, "global_step": 356463, "epoch": 2945} {"train_loss": -43.77768325805664, "global_step": 356464, "epoch": 2945} {"train_loss": -43.48714052941188, "global_step": 356465, "epoch": 2945, "val_loss": 2484195.75} {"train_loss": -43.892578125, "global_step": 356466, "epoch": 2946} {"train_loss": -45.00717544555664, "global_step": 356467, "epoch": 2946} {"train_loss": -43.00315475463867, "global_step": 356468, "epoch": 2946} {"train_loss": -44.2796630859375, "global_step": 356469, "epoch": 2946} {"train_loss": -44.18337631225586, "global_step": 356470, "epoch": 2946} {"train_loss": -44.03642272949219, "global_step": 356471, "epoch": 2946} {"train_loss": -45.04932403564453, "global_step": 356472, "epoch": 2946} {"train_loss": -44.17522048950195, "global_step": 356473, "epoch": 2946} {"train_loss": -44.649593353271484, "global_step": 356474, "epoch": 2946} {"train_loss": -44.546897888183594, "global_step": 356475, "epoch": 2946} {"train_loss": -44.57562255859375, "global_step": 356476, "epoch": 2946} {"train_loss": -44.87229537963867, "global_step": 356477, "epoch": 2946} {"train_loss": -44.69573211669922, "global_step": 356478, "epoch": 2946} {"train_loss": -44.84736251831055, "global_step": 356479, "epoch": 2946} {"train_loss": -44.6783561706543, "global_step": 356480, "epoch": 2946} {"train_loss": -45.48979949951172, "global_step": 356481, "epoch": 2946} {"train_loss": -44.54350662231445, "global_step": 356482, "epoch": 2946} {"train_loss": -45.554019927978516, "global_step": 356483, "epoch": 2946} {"train_loss": -45.47589111328125, "global_step": 356484, "epoch": 2946} {"train_loss": -45.266883850097656, "global_step": 356485, "epoch": 2946} {"train_loss": -45.41250228881836, "global_step": 356486, "epoch": 2946} {"train_loss": -45.45386505126953, "global_step": 356487, "epoch": 2946} {"train_loss": -44.90428161621094, "global_step": 356488, "epoch": 2946} {"train_loss": -45.0072021484375, "global_step": 356489, "epoch": 2946} {"train_loss": -44.95624542236328, "global_step": 356490, "epoch": 2946} {"train_loss": -44.91462707519531, "global_step": 356491, "epoch": 2946} {"train_loss": -45.63909149169922, "global_step": 356492, "epoch": 2946} {"train_loss": -45.503841400146484, "global_step": 356493, "epoch": 2946} {"train_loss": -45.518157958984375, "global_step": 356494, "epoch": 2946} {"train_loss": -45.385475158691406, "global_step": 356495, "epoch": 2946} {"train_loss": -46.069549560546875, "global_step": 356496, "epoch": 2946} {"train_loss": -45.24638366699219, "global_step": 356497, "epoch": 2946} {"train_loss": -45.36914825439453, "global_step": 356498, "epoch": 2946} {"train_loss": -46.031917572021484, "global_step": 356499, "epoch": 2946} {"train_loss": -45.302978515625, "global_step": 356500, "epoch": 2946} {"train_loss": -45.34164047241211, "global_step": 356501, "epoch": 2946} {"train_loss": -45.5890007019043, "global_step": 356502, "epoch": 2946} {"train_loss": -45.65260696411133, "global_step": 356503, "epoch": 2946} {"train_loss": -45.67253112792969, "global_step": 356504, "epoch": 2946} {"train_loss": -46.05919647216797, "global_step": 356505, "epoch": 2946} {"train_loss": -45.484779357910156, "global_step": 356506, "epoch": 2946} {"train_loss": -45.521358489990234, "global_step": 356507, "epoch": 2946} {"train_loss": -45.71454620361328, "global_step": 356508, "epoch": 2946} {"train_loss": -45.81447219848633, "global_step": 356509, "epoch": 2946} {"train_loss": -45.88068771362305, "global_step": 356510, "epoch": 2946} {"train_loss": -45.23553466796875, "global_step": 356511, "epoch": 2946} {"train_loss": -44.84025192260742, "global_step": 356512, "epoch": 2946} {"train_loss": -46.05469512939453, "global_step": 356513, "epoch": 2946} {"train_loss": -45.815216064453125, "global_step": 356514, "epoch": 2946} {"train_loss": -44.21260452270508, "global_step": 356515, "epoch": 2946} {"train_loss": -45.427520751953125, "global_step": 356516, "epoch": 2946} {"train_loss": -45.5134162902832, "global_step": 356517, "epoch": 2946} {"train_loss": -45.19464111328125, "global_step": 356518, "epoch": 2946} {"train_loss": -44.597354888916016, "global_step": 356519, "epoch": 2946} {"train_loss": -45.95426940917969, "global_step": 356520, "epoch": 2946} {"train_loss": -44.52706527709961, "global_step": 356521, "epoch": 2946} {"train_loss": -44.58845138549805, "global_step": 356522, "epoch": 2946} {"train_loss": -45.68618392944336, "global_step": 356523, "epoch": 2946} {"train_loss": -45.137611389160156, "global_step": 356524, "epoch": 2946} {"train_loss": -45.335201263427734, "global_step": 356525, "epoch": 2946} {"train_loss": -45.45209884643555, "global_step": 356526, "epoch": 2946} {"train_loss": -45.419525146484375, "global_step": 356527, "epoch": 2946} {"train_loss": -44.73348617553711, "global_step": 356528, "epoch": 2946} {"train_loss": -44.148040771484375, "global_step": 356529, "epoch": 2946} {"train_loss": -45.43482208251953, "global_step": 356530, "epoch": 2946} {"train_loss": -45.4534912109375, "global_step": 356531, "epoch": 2946} {"train_loss": -44.06180953979492, "global_step": 356532, "epoch": 2946} {"train_loss": -43.767372131347656, "global_step": 356533, "epoch": 2946} {"train_loss": -44.186161041259766, "global_step": 356534, "epoch": 2946} {"train_loss": -45.50693893432617, "global_step": 356535, "epoch": 2946} {"train_loss": -44.740478515625, "global_step": 356536, "epoch": 2946} {"train_loss": -43.905696868896484, "global_step": 356537, "epoch": 2946} {"train_loss": -45.14602279663086, "global_step": 356538, "epoch": 2946} {"train_loss": -44.733760833740234, "global_step": 356539, "epoch": 2946} {"train_loss": -44.660133361816406, "global_step": 356540, "epoch": 2946} {"train_loss": -44.45795440673828, "global_step": 356541, "epoch": 2946} {"train_loss": -45.39362335205078, "global_step": 356542, "epoch": 2946} {"train_loss": -43.91294479370117, "global_step": 356543, "epoch": 2946} {"train_loss": -44.806846618652344, "global_step": 356544, "epoch": 2946} {"train_loss": -44.82770538330078, "global_step": 356545, "epoch": 2946} {"train_loss": -44.54218673706055, "global_step": 356546, "epoch": 2946} {"train_loss": -43.50309371948242, "global_step": 356547, "epoch": 2946} {"train_loss": -42.42185592651367, "global_step": 356548, "epoch": 2946} {"train_loss": -42.89889144897461, "global_step": 356549, "epoch": 2946} {"train_loss": -44.29524612426758, "global_step": 356550, "epoch": 2946} {"train_loss": -42.23655319213867, "global_step": 356551, "epoch": 2946} {"train_loss": -43.745113372802734, "global_step": 356552, "epoch": 2946} {"train_loss": -42.86392593383789, "global_step": 356553, "epoch": 2946} {"train_loss": -43.949501037597656, "global_step": 356554, "epoch": 2946} {"train_loss": -44.3305549621582, "global_step": 356555, "epoch": 2946} {"train_loss": -44.036109924316406, "global_step": 356556, "epoch": 2946} {"train_loss": -43.31836700439453, "global_step": 356557, "epoch": 2946} {"train_loss": -44.854949951171875, "global_step": 356558, "epoch": 2946} {"train_loss": -43.89628219604492, "global_step": 356559, "epoch": 2946} {"train_loss": -43.30288314819336, "global_step": 356560, "epoch": 2946} {"train_loss": -42.40194320678711, "global_step": 356561, "epoch": 2946} {"train_loss": -42.45610427856445, "global_step": 356562, "epoch": 2946} {"train_loss": -44.18612289428711, "global_step": 356563, "epoch": 2946} {"train_loss": -40.32102966308594, "global_step": 356564, "epoch": 2946} {"train_loss": -44.3521728515625, "global_step": 356565, "epoch": 2946} {"train_loss": -40.02924346923828, "global_step": 356566, "epoch": 2946} {"train_loss": -43.82527542114258, "global_step": 356567, "epoch": 2946} {"train_loss": -39.579978942871094, "global_step": 356568, "epoch": 2946} {"train_loss": -40.64750289916992, "global_step": 356569, "epoch": 2946} {"train_loss": -42.420650482177734, "global_step": 356570, "epoch": 2946} {"train_loss": -37.18212890625, "global_step": 356571, "epoch": 2946} {"train_loss": -40.26698303222656, "global_step": 356572, "epoch": 2946} {"train_loss": -38.225955963134766, "global_step": 356573, "epoch": 2946} {"train_loss": -35.787296295166016, "global_step": 356574, "epoch": 2946} {"train_loss": -36.26377487182617, "global_step": 356575, "epoch": 2946} {"train_loss": -38.45246124267578, "global_step": 356576, "epoch": 2946} {"train_loss": -36.715858459472656, "global_step": 356577, "epoch": 2946} {"train_loss": -36.940223693847656, "global_step": 356578, "epoch": 2946} {"train_loss": -38.7521858215332, "global_step": 356579, "epoch": 2946} {"train_loss": -37.79929733276367, "global_step": 356580, "epoch": 2946} {"train_loss": -37.878883361816406, "global_step": 356581, "epoch": 2946} {"train_loss": -37.804500579833984, "global_step": 356582, "epoch": 2946} {"train_loss": -39.34640121459961, "global_step": 356583, "epoch": 2946} {"train_loss": -37.876243591308594, "global_step": 356584, "epoch": 2946} {"train_loss": -39.47736740112305, "global_step": 356585, "epoch": 2946} {"train_loss": -43.684626492587, "global_step": 356586, "epoch": 2946, "val_loss": 2586218.25} {"train_loss": -40.73971176147461, "global_step": 356587, "epoch": 2947} {"train_loss": -40.14347839355469, "global_step": 356588, "epoch": 2947} {"train_loss": -41.478729248046875, "global_step": 356589, "epoch": 2947} {"train_loss": -41.12047576904297, "global_step": 356590, "epoch": 2947} {"train_loss": -40.91941452026367, "global_step": 356591, "epoch": 2947} {"train_loss": -41.8991813659668, "global_step": 356592, "epoch": 2947} {"train_loss": -40.07444381713867, "global_step": 356593, "epoch": 2947} {"train_loss": -41.74311447143555, "global_step": 356594, "epoch": 2947} {"train_loss": -41.2235107421875, "global_step": 356595, "epoch": 2947} {"train_loss": -41.79311752319336, "global_step": 356596, "epoch": 2947} {"train_loss": -42.19643020629883, "global_step": 356597, "epoch": 2947} {"train_loss": -41.24579620361328, "global_step": 356598, "epoch": 2947} {"train_loss": -42.11713409423828, "global_step": 356599, "epoch": 2947} {"train_loss": -40.85419845581055, "global_step": 356600, "epoch": 2947} {"train_loss": -42.73557662963867, "global_step": 356601, "epoch": 2947} {"train_loss": -40.688812255859375, "global_step": 356602, "epoch": 2947} {"train_loss": -42.54133224487305, "global_step": 356603, "epoch": 2947} {"train_loss": -40.838382720947266, "global_step": 356604, "epoch": 2947} {"train_loss": -42.304866790771484, "global_step": 356605, "epoch": 2947} {"train_loss": -42.03755569458008, "global_step": 356606, "epoch": 2947} {"train_loss": -41.737098693847656, "global_step": 356607, "epoch": 2947} {"train_loss": -43.039955139160156, "global_step": 356608, "epoch": 2947} {"train_loss": -42.009281158447266, "global_step": 356609, "epoch": 2947} {"train_loss": -43.39259719848633, "global_step": 356610, "epoch": 2947} {"train_loss": -42.3853874206543, "global_step": 356611, "epoch": 2947} {"train_loss": -43.5427360534668, "global_step": 356612, "epoch": 2947} {"train_loss": -42.0782585144043, "global_step": 356613, "epoch": 2947} {"train_loss": -43.97368240356445, "global_step": 356614, "epoch": 2947} {"train_loss": -43.80572509765625, "global_step": 356615, "epoch": 2947} {"train_loss": -43.872039794921875, "global_step": 356616, "epoch": 2947} {"train_loss": -43.39661407470703, "global_step": 356617, "epoch": 2947} {"train_loss": -44.18699645996094, "global_step": 356618, "epoch": 2947} {"train_loss": -43.67066192626953, "global_step": 356619, "epoch": 2947} {"train_loss": -44.31827926635742, "global_step": 356620, "epoch": 2947} {"train_loss": -43.54911422729492, "global_step": 356621, "epoch": 2947} {"train_loss": -44.66134262084961, "global_step": 356622, "epoch": 2947} {"train_loss": -44.14663314819336, "global_step": 356623, "epoch": 2947} {"train_loss": -43.91130828857422, "global_step": 356624, "epoch": 2947} {"train_loss": -43.85696029663086, "global_step": 356625, "epoch": 2947} {"train_loss": -44.0350227355957, "global_step": 356626, "epoch": 2947} {"train_loss": -44.09357452392578, "global_step": 356627, "epoch": 2947} {"train_loss": -44.76179122924805, "global_step": 356628, "epoch": 2947} {"train_loss": -44.611331939697266, "global_step": 356629, "epoch": 2947} {"train_loss": -44.80401611328125, "global_step": 356630, "epoch": 2947} {"train_loss": -44.49250030517578, "global_step": 356631, "epoch": 2947} {"train_loss": -44.42754364013672, "global_step": 356632, "epoch": 2947} {"train_loss": -44.458248138427734, "global_step": 356633, "epoch": 2947} {"train_loss": -44.8161506652832, "global_step": 356634, "epoch": 2947} {"train_loss": -44.97758483886719, "global_step": 356635, "epoch": 2947} {"train_loss": -44.97700881958008, "global_step": 356636, "epoch": 2947} {"train_loss": -44.869808197021484, "global_step": 356637, "epoch": 2947} {"train_loss": -44.98215103149414, "global_step": 356638, "epoch": 2947} {"train_loss": -44.77710723876953, "global_step": 356639, "epoch": 2947} {"train_loss": -45.51772689819336, "global_step": 356640, "epoch": 2947} {"train_loss": -45.059139251708984, "global_step": 356641, "epoch": 2947} {"train_loss": -45.388431549072266, "global_step": 356642, "epoch": 2947} {"train_loss": -45.318599700927734, "global_step": 356643, "epoch": 2947} {"train_loss": -45.282310485839844, "global_step": 356644, "epoch": 2947} {"train_loss": -45.828372955322266, "global_step": 356645, "epoch": 2947} {"train_loss": -45.134334564208984, "global_step": 356646, "epoch": 2947} {"train_loss": -45.088653564453125, "global_step": 356647, "epoch": 2947} {"train_loss": -45.34157180786133, "global_step": 356648, "epoch": 2947} {"train_loss": -44.684791564941406, "global_step": 356649, "epoch": 2947} {"train_loss": -45.6274299621582, "global_step": 356650, "epoch": 2947} {"train_loss": -45.612060546875, "global_step": 356651, "epoch": 2947} {"train_loss": -45.97505569458008, "global_step": 356652, "epoch": 2947} {"train_loss": -45.67683792114258, "global_step": 356653, "epoch": 2947} {"train_loss": -45.43721389770508, "global_step": 356654, "epoch": 2947} {"train_loss": -45.46149444580078, "global_step": 356655, "epoch": 2947} {"train_loss": -45.67632293701172, "global_step": 356656, "epoch": 2947} {"train_loss": -45.8330192565918, "global_step": 356657, "epoch": 2947} {"train_loss": -45.92017364501953, "global_step": 356658, "epoch": 2947} {"train_loss": -46.06862258911133, "global_step": 356659, "epoch": 2947} {"train_loss": -46.280418395996094, "global_step": 356660, "epoch": 2947} {"train_loss": -45.849544525146484, "global_step": 356661, "epoch": 2947} {"train_loss": -46.08026123046875, "global_step": 356662, "epoch": 2947} {"train_loss": -45.70111846923828, "global_step": 356663, "epoch": 2947} {"train_loss": -46.071834564208984, "global_step": 356664, "epoch": 2947} {"train_loss": -46.343780517578125, "global_step": 356665, "epoch": 2947} {"train_loss": -45.90052795410156, "global_step": 356666, "epoch": 2947} {"train_loss": -46.167091369628906, "global_step": 356667, "epoch": 2947} {"train_loss": -45.8781623840332, "global_step": 356668, "epoch": 2947} {"train_loss": -46.25477981567383, "global_step": 356669, "epoch": 2947} {"train_loss": -46.39432144165039, "global_step": 356670, "epoch": 2947} {"train_loss": -46.2618408203125, "global_step": 356671, "epoch": 2947} {"train_loss": -46.417884826660156, "global_step": 356672, "epoch": 2947} {"train_loss": -46.36366271972656, "global_step": 356673, "epoch": 2947} {"train_loss": -46.60404586791992, "global_step": 356674, "epoch": 2947} {"train_loss": -45.744712829589844, "global_step": 356675, "epoch": 2947} {"train_loss": -46.38395309448242, "global_step": 356676, "epoch": 2947} {"train_loss": -45.6075553894043, "global_step": 356677, "epoch": 2947} {"train_loss": -45.85626983642578, "global_step": 356678, "epoch": 2947} {"train_loss": -46.28866195678711, "global_step": 356679, "epoch": 2947} {"train_loss": -45.4437370300293, "global_step": 356680, "epoch": 2947} {"train_loss": -46.318050384521484, "global_step": 356681, "epoch": 2947} {"train_loss": -46.43624496459961, "global_step": 356682, "epoch": 2947} {"train_loss": -45.99281692504883, "global_step": 356683, "epoch": 2947} {"train_loss": -45.342506408691406, "global_step": 356684, "epoch": 2947} {"train_loss": -45.247314453125, "global_step": 356685, "epoch": 2947} {"train_loss": -42.979949951171875, "global_step": 356686, "epoch": 2947} {"train_loss": -42.5624885559082, "global_step": 356687, "epoch": 2947} {"train_loss": -44.964935302734375, "global_step": 356688, "epoch": 2947} {"train_loss": -44.925453186035156, "global_step": 356689, "epoch": 2947} {"train_loss": -39.972957611083984, "global_step": 356690, "epoch": 2947} {"train_loss": -39.62250900268555, "global_step": 356691, "epoch": 2947} {"train_loss": -41.690792083740234, "global_step": 356692, "epoch": 2947} {"train_loss": -41.11583709716797, "global_step": 356693, "epoch": 2947} {"train_loss": -41.00560760498047, "global_step": 356694, "epoch": 2947} {"train_loss": -41.23527908325195, "global_step": 356695, "epoch": 2947} {"train_loss": -41.47895431518555, "global_step": 356696, "epoch": 2947} {"train_loss": -41.95162582397461, "global_step": 356697, "epoch": 2947} {"train_loss": -43.89149475097656, "global_step": 356698, "epoch": 2947} {"train_loss": -43.38001251220703, "global_step": 356699, "epoch": 2947} {"train_loss": -43.44350051879883, "global_step": 356700, "epoch": 2947} {"train_loss": -42.18653106689453, "global_step": 356701, "epoch": 2947} {"train_loss": -41.611785888671875, "global_step": 356702, "epoch": 2947} {"train_loss": -43.24882125854492, "global_step": 356703, "epoch": 2947} {"train_loss": -42.925926208496094, "global_step": 356704, "epoch": 2947} {"train_loss": -42.918983459472656, "global_step": 356705, "epoch": 2947} {"train_loss": -43.14323806762695, "global_step": 356706, "epoch": 2947} {"train_loss": -43.96488722493826, "global_step": 356707, "epoch": 2947, "val_loss": 2495206.25} {"train_loss": -41.431190490722656, "global_step": 356708, "epoch": 2948} {"train_loss": -43.88481140136719, "global_step": 356709, "epoch": 2948} {"train_loss": -41.64565658569336, "global_step": 356710, "epoch": 2948} {"train_loss": -42.900760650634766, "global_step": 356711, "epoch": 2948} {"train_loss": -42.12742233276367, "global_step": 356712, "epoch": 2948} {"train_loss": -42.505306243896484, "global_step": 356713, "epoch": 2948} {"train_loss": -41.96744918823242, "global_step": 356714, "epoch": 2948} {"train_loss": -41.68504333496094, "global_step": 356715, "epoch": 2948} {"train_loss": -39.95956802368164, "global_step": 356716, "epoch": 2948} {"train_loss": -41.868831634521484, "global_step": 356717, "epoch": 2948} {"train_loss": -40.123836517333984, "global_step": 356718, "epoch": 2948} {"train_loss": -40.728111267089844, "global_step": 356719, "epoch": 2948} {"train_loss": -42.328792572021484, "global_step": 356720, "epoch": 2948} {"train_loss": -37.892269134521484, "global_step": 356721, "epoch": 2948} {"train_loss": -38.17183303833008, "global_step": 356722, "epoch": 2948} {"train_loss": -39.251319885253906, "global_step": 356723, "epoch": 2948} {"train_loss": -41.925323486328125, "global_step": 356724, "epoch": 2948} {"train_loss": -35.6270866394043, "global_step": 356725, "epoch": 2948} {"train_loss": -40.8060302734375, "global_step": 356726, "epoch": 2948} {"train_loss": -35.817718505859375, "global_step": 356727, "epoch": 2948} {"train_loss": -39.693241119384766, "global_step": 356728, "epoch": 2948} {"train_loss": -41.20136642456055, "global_step": 356729, "epoch": 2948} {"train_loss": -37.30860137939453, "global_step": 356730, "epoch": 2948} {"train_loss": -34.60710906982422, "global_step": 356731, "epoch": 2948} {"train_loss": -37.70024490356445, "global_step": 356732, "epoch": 2948} {"train_loss": -40.40199661254883, "global_step": 356733, "epoch": 2948} {"train_loss": -41.6848030090332, "global_step": 356734, "epoch": 2948} {"train_loss": -41.28308868408203, "global_step": 356735, "epoch": 2948} {"train_loss": -42.81003952026367, "global_step": 356736, "epoch": 2948} {"train_loss": -42.57297897338867, "global_step": 356737, "epoch": 2948} {"train_loss": -41.126529693603516, "global_step": 356738, "epoch": 2948} {"train_loss": -43.14826965332031, "global_step": 356739, "epoch": 2948} {"train_loss": -42.84033203125, "global_step": 356740, "epoch": 2948} {"train_loss": -42.73358917236328, "global_step": 356741, "epoch": 2948} {"train_loss": -42.12957763671875, "global_step": 356742, "epoch": 2948} {"train_loss": -43.0128288269043, "global_step": 356743, "epoch": 2948} {"train_loss": -42.945655822753906, "global_step": 356744, "epoch": 2948} {"train_loss": -42.50020980834961, "global_step": 356745, "epoch": 2948} {"train_loss": -43.48260498046875, "global_step": 356746, "epoch": 2948} {"train_loss": -42.512115478515625, "global_step": 356747, "epoch": 2948} {"train_loss": -43.074520111083984, "global_step": 356748, "epoch": 2948} {"train_loss": -43.18817138671875, "global_step": 356749, "epoch": 2948} {"train_loss": -42.92964172363281, "global_step": 356750, "epoch": 2948} {"train_loss": -43.22536849975586, "global_step": 356751, "epoch": 2948} {"train_loss": -43.45414733886719, "global_step": 356752, "epoch": 2948} {"train_loss": -36.8595085144043, "global_step": 356753, "epoch": 2948} {"train_loss": -43.262664794921875, "global_step": 356754, "epoch": 2948} {"train_loss": -43.20619583129883, "global_step": 356755, "epoch": 2948} {"train_loss": -43.866600036621094, "global_step": 356756, "epoch": 2948} {"train_loss": -43.63247299194336, "global_step": 356757, "epoch": 2948} {"train_loss": -44.27499008178711, "global_step": 356758, "epoch": 2948} {"train_loss": -43.34626007080078, "global_step": 356759, "epoch": 2948} {"train_loss": -43.6033935546875, "global_step": 356760, "epoch": 2948} {"train_loss": -43.7381477355957, "global_step": 356761, "epoch": 2948} {"train_loss": -38.836524963378906, "global_step": 356762, "epoch": 2948} {"train_loss": -43.989898681640625, "global_step": 356763, "epoch": 2948} {"train_loss": -44.4570426940918, "global_step": 356764, "epoch": 2948} {"train_loss": -44.29536437988281, "global_step": 356765, "epoch": 2948} {"train_loss": -43.9370002746582, "global_step": 356766, "epoch": 2948} {"train_loss": -43.64745330810547, "global_step": 356767, "epoch": 2948} {"train_loss": -40.57347869873047, "global_step": 356768, "epoch": 2948} {"train_loss": -43.65007400512695, "global_step": 356769, "epoch": 2948} {"train_loss": -43.74214553833008, "global_step": 356770, "epoch": 2948} {"train_loss": -43.555511474609375, "global_step": 356771, "epoch": 2948} {"train_loss": -43.95574188232422, "global_step": 356772, "epoch": 2948} {"train_loss": -43.196746826171875, "global_step": 356773, "epoch": 2948} {"train_loss": -43.75703048706055, "global_step": 356774, "epoch": 2948} {"train_loss": -43.883216857910156, "global_step": 356775, "epoch": 2948} {"train_loss": -43.95198059082031, "global_step": 356776, "epoch": 2948} {"train_loss": -44.19843673706055, "global_step": 356777, "epoch": 2948} {"train_loss": -43.414756774902344, "global_step": 356778, "epoch": 2948} {"train_loss": -44.257808685302734, "global_step": 356779, "epoch": 2948} {"train_loss": -44.474666595458984, "global_step": 356780, "epoch": 2948} {"train_loss": -44.719825744628906, "global_step": 356781, "epoch": 2948} {"train_loss": -44.34980010986328, "global_step": 356782, "epoch": 2948} {"train_loss": -43.97120666503906, "global_step": 356783, "epoch": 2948} {"train_loss": -44.15993881225586, "global_step": 356784, "epoch": 2948} {"train_loss": -44.58332061767578, "global_step": 356785, "epoch": 2948} {"train_loss": -44.55186462402344, "global_step": 356786, "epoch": 2948} {"train_loss": -44.40520095825195, "global_step": 356787, "epoch": 2948} {"train_loss": -44.92644119262695, "global_step": 356788, "epoch": 2948} {"train_loss": -44.48793411254883, "global_step": 356789, "epoch": 2948} {"train_loss": -45.21165466308594, "global_step": 356790, "epoch": 2948} {"train_loss": -45.065311431884766, "global_step": 356791, "epoch": 2948} {"train_loss": -45.1149787902832, "global_step": 356792, "epoch": 2948} {"train_loss": -44.2059211730957, "global_step": 356793, "epoch": 2948} {"train_loss": -44.57179260253906, "global_step": 356794, "epoch": 2948} {"train_loss": -45.18912887573242, "global_step": 356795, "epoch": 2948} {"train_loss": -43.755958557128906, "global_step": 356796, "epoch": 2948} {"train_loss": -44.16669845581055, "global_step": 356797, "epoch": 2948} {"train_loss": -44.58181381225586, "global_step": 356798, "epoch": 2948} {"train_loss": -44.62412643432617, "global_step": 356799, "epoch": 2948} {"train_loss": -44.50867462158203, "global_step": 356800, "epoch": 2948} {"train_loss": -45.400421142578125, "global_step": 356801, "epoch": 2948} {"train_loss": -45.51264953613281, "global_step": 356802, "epoch": 2948} {"train_loss": -45.42293167114258, "global_step": 356803, "epoch": 2948} {"train_loss": -44.53175735473633, "global_step": 356804, "epoch": 2948} {"train_loss": -44.68183898925781, "global_step": 356805, "epoch": 2948} {"train_loss": -42.0107536315918, "global_step": 356806, "epoch": 2948} {"train_loss": -44.454280853271484, "global_step": 356807, "epoch": 2948} {"train_loss": -44.84029769897461, "global_step": 356808, "epoch": 2948} {"train_loss": -42.58847427368164, "global_step": 356809, "epoch": 2948} {"train_loss": -45.19538116455078, "global_step": 356810, "epoch": 2948} {"train_loss": -45.58320617675781, "global_step": 356811, "epoch": 2948} {"train_loss": -45.4795036315918, "global_step": 356812, "epoch": 2948} {"train_loss": -44.85679244995117, "global_step": 356813, "epoch": 2948} {"train_loss": -44.11616134643555, "global_step": 356814, "epoch": 2948} {"train_loss": -43.234737396240234, "global_step": 356815, "epoch": 2948} {"train_loss": -45.132057189941406, "global_step": 356816, "epoch": 2948} {"train_loss": -45.193416595458984, "global_step": 356817, "epoch": 2948} {"train_loss": -44.99677658081055, "global_step": 356818, "epoch": 2948} {"train_loss": -45.22206497192383, "global_step": 356819, "epoch": 2948} {"train_loss": -44.96908187866211, "global_step": 356820, "epoch": 2948} {"train_loss": -44.9165153503418, "global_step": 356821, "epoch": 2948} {"train_loss": -44.8901252746582, "global_step": 356822, "epoch": 2948} {"train_loss": -45.63821029663086, "global_step": 356823, "epoch": 2948} {"train_loss": -45.362831115722656, "global_step": 356824, "epoch": 2948} {"train_loss": -45.82853317260742, "global_step": 356825, "epoch": 2948} {"train_loss": -45.195621490478516, "global_step": 356826, "epoch": 2948} {"train_loss": -45.21482467651367, "global_step": 356827, "epoch": 2948} {"train_loss": -43.07847834815664, "global_step": 356828, "epoch": 2948, "val_loss": 2510677.75} {"train_loss": -44.822444915771484, "global_step": 356829, "epoch": 2949} {"train_loss": -45.0211296081543, "global_step": 356830, "epoch": 2949} {"train_loss": -44.94497299194336, "global_step": 356831, "epoch": 2949} {"train_loss": -42.43727493286133, "global_step": 356832, "epoch": 2949} {"train_loss": -44.25059127807617, "global_step": 356833, "epoch": 2949} {"train_loss": -42.22275924682617, "global_step": 356834, "epoch": 2949} {"train_loss": -45.59796142578125, "global_step": 356835, "epoch": 2949} {"train_loss": -44.95951461791992, "global_step": 356836, "epoch": 2949} {"train_loss": -44.36979293823242, "global_step": 356837, "epoch": 2949} {"train_loss": -43.9052619934082, "global_step": 356838, "epoch": 2949} {"train_loss": -43.29656219482422, "global_step": 356839, "epoch": 2949} {"train_loss": -43.823753356933594, "global_step": 356840, "epoch": 2949} {"train_loss": -43.8204345703125, "global_step": 356841, "epoch": 2949} {"train_loss": -44.69984436035156, "global_step": 356842, "epoch": 2949} {"train_loss": -44.871620178222656, "global_step": 356843, "epoch": 2949} {"train_loss": -44.98289108276367, "global_step": 356844, "epoch": 2949} {"train_loss": -45.178932189941406, "global_step": 356845, "epoch": 2949} {"train_loss": -44.022823333740234, "global_step": 356846, "epoch": 2949} {"train_loss": -44.4284782409668, "global_step": 356847, "epoch": 2949} {"train_loss": -45.39067840576172, "global_step": 356848, "epoch": 2949} {"train_loss": -43.9927864074707, "global_step": 356849, "epoch": 2949} {"train_loss": -44.025238037109375, "global_step": 356850, "epoch": 2949} {"train_loss": -44.857383728027344, "global_step": 356851, "epoch": 2949} {"train_loss": -44.856685638427734, "global_step": 356852, "epoch": 2949} {"train_loss": -45.0904655456543, "global_step": 356853, "epoch": 2949} {"train_loss": -44.93886947631836, "global_step": 356854, "epoch": 2949} {"train_loss": -44.743553161621094, "global_step": 356855, "epoch": 2949} {"train_loss": -44.524227142333984, "global_step": 356856, "epoch": 2949} {"train_loss": -44.67582321166992, "global_step": 356857, "epoch": 2949} {"train_loss": -45.06726837158203, "global_step": 356858, "epoch": 2949} {"train_loss": -44.897186279296875, "global_step": 356859, "epoch": 2949} {"train_loss": -44.23804473876953, "global_step": 356860, "epoch": 2949} {"train_loss": -44.141597747802734, "global_step": 356861, "epoch": 2949} {"train_loss": -43.946659088134766, "global_step": 356862, "epoch": 2949} {"train_loss": -44.602108001708984, "global_step": 356863, "epoch": 2949} {"train_loss": -44.68983840942383, "global_step": 356864, "epoch": 2949} {"train_loss": -44.422943115234375, "global_step": 356865, "epoch": 2949} {"train_loss": -41.94236373901367, "global_step": 356866, "epoch": 2949} {"train_loss": -44.83024215698242, "global_step": 356867, "epoch": 2949} {"train_loss": -44.99665069580078, "global_step": 356868, "epoch": 2949} {"train_loss": -43.653743743896484, "global_step": 356869, "epoch": 2949} {"train_loss": -43.95983123779297, "global_step": 356870, "epoch": 2949} {"train_loss": -43.33661651611328, "global_step": 356871, "epoch": 2949} {"train_loss": -44.54119873046875, "global_step": 356872, "epoch": 2949} {"train_loss": -45.25315856933594, "global_step": 356873, "epoch": 2949} {"train_loss": -44.997867584228516, "global_step": 356874, "epoch": 2949} {"train_loss": -43.6986198425293, "global_step": 356875, "epoch": 2949} {"train_loss": -45.03092575073242, "global_step": 356876, "epoch": 2949} {"train_loss": -44.65395736694336, "global_step": 356877, "epoch": 2949} {"train_loss": -44.171363830566406, "global_step": 356878, "epoch": 2949} {"train_loss": -40.292171478271484, "global_step": 356879, "epoch": 2949} {"train_loss": -42.7799186706543, "global_step": 356880, "epoch": 2949} {"train_loss": -44.13429641723633, "global_step": 356881, "epoch": 2949} {"train_loss": -42.53941345214844, "global_step": 356882, "epoch": 2949} {"train_loss": -42.9506950378418, "global_step": 356883, "epoch": 2949} {"train_loss": -43.117916107177734, "global_step": 356884, "epoch": 2949} {"train_loss": -42.9619026184082, "global_step": 356885, "epoch": 2949} {"train_loss": -41.479732513427734, "global_step": 356886, "epoch": 2949} {"train_loss": -43.78547668457031, "global_step": 356887, "epoch": 2949} {"train_loss": -41.0811882019043, "global_step": 356888, "epoch": 2949} {"train_loss": -44.24623489379883, "global_step": 356889, "epoch": 2949} {"train_loss": -40.54879379272461, "global_step": 356890, "epoch": 2949} {"train_loss": -43.2847900390625, "global_step": 356891, "epoch": 2949} {"train_loss": -41.36476135253906, "global_step": 356892, "epoch": 2949} {"train_loss": -43.94659423828125, "global_step": 356893, "epoch": 2949} {"train_loss": -43.4732551574707, "global_step": 356894, "epoch": 2949} {"train_loss": -41.3614387512207, "global_step": 356895, "epoch": 2949} {"train_loss": -44.43645095825195, "global_step": 356896, "epoch": 2949} {"train_loss": -42.8109245300293, "global_step": 356897, "epoch": 2949} {"train_loss": -44.0759391784668, "global_step": 356898, "epoch": 2949} {"train_loss": -44.13176345825195, "global_step": 356899, "epoch": 2949} {"train_loss": -44.02858352661133, "global_step": 356900, "epoch": 2949} {"train_loss": -44.3224983215332, "global_step": 356901, "epoch": 2949} {"train_loss": -44.17165756225586, "global_step": 356902, "epoch": 2949} {"train_loss": -43.69950866699219, "global_step": 356903, "epoch": 2949} {"train_loss": -43.171783447265625, "global_step": 356904, "epoch": 2949} {"train_loss": -44.367347717285156, "global_step": 356905, "epoch": 2949} {"train_loss": -44.223758697509766, "global_step": 356906, "epoch": 2949} {"train_loss": -43.5757942199707, "global_step": 356907, "epoch": 2949} {"train_loss": -44.1399040222168, "global_step": 356908, "epoch": 2949} {"train_loss": -44.09116744995117, "global_step": 356909, "epoch": 2949} {"train_loss": -44.36676025390625, "global_step": 356910, "epoch": 2949} {"train_loss": -45.126304626464844, "global_step": 356911, "epoch": 2949} {"train_loss": -44.32927322387695, "global_step": 356912, "epoch": 2949} {"train_loss": -43.362213134765625, "global_step": 356913, "epoch": 2949} {"train_loss": -44.891571044921875, "global_step": 356914, "epoch": 2949} {"train_loss": -44.53995132446289, "global_step": 356915, "epoch": 2949} {"train_loss": -45.07805252075195, "global_step": 356916, "epoch": 2949} {"train_loss": -44.42022705078125, "global_step": 356917, "epoch": 2949} {"train_loss": -44.23524475097656, "global_step": 356918, "epoch": 2949} {"train_loss": -45.25015640258789, "global_step": 356919, "epoch": 2949} {"train_loss": -43.788551330566406, "global_step": 356920, "epoch": 2949} {"train_loss": -45.04740524291992, "global_step": 356921, "epoch": 2949} {"train_loss": -40.676021575927734, "global_step": 356922, "epoch": 2949} {"train_loss": -44.55918502807617, "global_step": 356923, "epoch": 2949} {"train_loss": -44.91386032104492, "global_step": 356924, "epoch": 2949} {"train_loss": -44.174190521240234, "global_step": 356925, "epoch": 2949} {"train_loss": -39.601036071777344, "global_step": 356926, "epoch": 2949} {"train_loss": -44.260162353515625, "global_step": 356927, "epoch": 2949} {"train_loss": -43.883216857910156, "global_step": 356928, "epoch": 2949} {"train_loss": -42.33024215698242, "global_step": 356929, "epoch": 2949} {"train_loss": -41.05733108520508, "global_step": 356930, "epoch": 2949} {"train_loss": -42.07820510864258, "global_step": 356931, "epoch": 2949} {"train_loss": -41.28352737426758, "global_step": 356932, "epoch": 2949} {"train_loss": -43.86538314819336, "global_step": 356933, "epoch": 2949} {"train_loss": -41.76177978515625, "global_step": 356934, "epoch": 2949} {"train_loss": -42.94499206542969, "global_step": 356935, "epoch": 2949} {"train_loss": -43.26618957519531, "global_step": 356936, "epoch": 2949} {"train_loss": -42.144771575927734, "global_step": 356937, "epoch": 2949} {"train_loss": -43.665016174316406, "global_step": 356938, "epoch": 2949} {"train_loss": -42.59165573120117, "global_step": 356939, "epoch": 2949} {"train_loss": -41.97574996948242, "global_step": 356940, "epoch": 2949} {"train_loss": -40.79420852661133, "global_step": 356941, "epoch": 2949} {"train_loss": -41.83949661254883, "global_step": 356942, "epoch": 2949} {"train_loss": -43.71088790893555, "global_step": 356943, "epoch": 2949} {"train_loss": -42.72121047973633, "global_step": 356944, "epoch": 2949} {"train_loss": -44.1552619934082, "global_step": 356945, "epoch": 2949} {"train_loss": -43.28240966796875, "global_step": 356946, "epoch": 2949} {"train_loss": -42.087135314941406, "global_step": 356947, "epoch": 2949} {"train_loss": -44.046443939208984, "global_step": 356948, "epoch": 2949} {"train_loss": -43.70750058386937, "global_step": 356949, "epoch": 2949, "val_loss": 2646244.5} {"train_loss": -44.09628677368164, "global_step": 356950, "epoch": 2950} {"train_loss": -42.458839416503906, "global_step": 356951, "epoch": 2950} {"train_loss": -44.22976303100586, "global_step": 356952, "epoch": 2950} {"train_loss": -43.11644744873047, "global_step": 356953, "epoch": 2950} {"train_loss": -43.15633010864258, "global_step": 356954, "epoch": 2950} {"train_loss": -43.298728942871094, "global_step": 356955, "epoch": 2950} {"train_loss": -43.34556198120117, "global_step": 356956, "epoch": 2950} {"train_loss": -44.137237548828125, "global_step": 356957, "epoch": 2950} {"train_loss": -43.78548812866211, "global_step": 356958, "epoch": 2950} {"train_loss": -44.10810470581055, "global_step": 356959, "epoch": 2950} {"train_loss": -44.13387680053711, "global_step": 356960, "epoch": 2950} {"train_loss": -44.28193283081055, "global_step": 356961, "epoch": 2950} {"train_loss": -43.34772872924805, "global_step": 356962, "epoch": 2950} {"train_loss": -44.7734260559082, "global_step": 356963, "epoch": 2950} {"train_loss": -42.952552795410156, "global_step": 356964, "epoch": 2950} {"train_loss": -41.206356048583984, "global_step": 356965, "epoch": 2950} {"train_loss": -42.88843536376953, "global_step": 356966, "epoch": 2950} {"train_loss": -43.04610824584961, "global_step": 356967, "epoch": 2950} {"train_loss": -44.342708587646484, "global_step": 356968, "epoch": 2950} {"train_loss": -44.244850158691406, "global_step": 356969, "epoch": 2950} {"train_loss": -43.03493881225586, "global_step": 356970, "epoch": 2950} {"train_loss": -44.4552116394043, "global_step": 356971, "epoch": 2950} {"train_loss": -43.610816955566406, "global_step": 356972, "epoch": 2950} {"train_loss": -44.53294372558594, "global_step": 356973, "epoch": 2950} {"train_loss": -44.921302795410156, "global_step": 356974, "epoch": 2950} {"train_loss": -44.30880355834961, "global_step": 356975, "epoch": 2950} {"train_loss": -44.54423141479492, "global_step": 356976, "epoch": 2950} {"train_loss": -44.0889778137207, "global_step": 356977, "epoch": 2950} {"train_loss": -44.677364349365234, "global_step": 356978, "epoch": 2950} {"train_loss": -44.573307037353516, "global_step": 356979, "epoch": 2950} {"train_loss": -44.2072868347168, "global_step": 356980, "epoch": 2950} {"train_loss": -44.509605407714844, "global_step": 356981, "epoch": 2950} {"train_loss": -44.97115707397461, "global_step": 356982, "epoch": 2950} {"train_loss": -44.343223571777344, "global_step": 356983, "epoch": 2950} {"train_loss": -45.071475982666016, "global_step": 356984, "epoch": 2950} {"train_loss": -44.83155059814453, "global_step": 356985, "epoch": 2950} {"train_loss": -43.515472412109375, "global_step": 356986, "epoch": 2950} {"train_loss": -45.0087776184082, "global_step": 356987, "epoch": 2950} {"train_loss": -45.368343353271484, "global_step": 356988, "epoch": 2950} {"train_loss": -45.3651123046875, "global_step": 356989, "epoch": 2950} {"train_loss": -45.066619873046875, "global_step": 356990, "epoch": 2950} {"train_loss": -45.436729431152344, "global_step": 356991, "epoch": 2950} {"train_loss": -44.900203704833984, "global_step": 356992, "epoch": 2950} {"train_loss": -45.37235641479492, "global_step": 356993, "epoch": 2950} {"train_loss": -44.99764633178711, "global_step": 356994, "epoch": 2950} {"train_loss": -45.50456237792969, "global_step": 356995, "epoch": 2950} {"train_loss": -45.15386199951172, "global_step": 356996, "epoch": 2950} {"train_loss": -45.162227630615234, "global_step": 356997, "epoch": 2950} {"train_loss": -44.847999572753906, "global_step": 356998, "epoch": 2950} {"train_loss": -45.65024948120117, "global_step": 356999, "epoch": 2950} {"train_loss": -45.041690826416016, "global_step": 357000, "epoch": 2950} {"train_loss": -44.1546630859375, "global_step": 357001, "epoch": 2950} {"train_loss": -45.382232666015625, "global_step": 357002, "epoch": 2950} {"train_loss": -45.3530158996582, "global_step": 357003, "epoch": 2950} {"train_loss": -45.41316223144531, "global_step": 357004, "epoch": 2950} {"train_loss": -45.0520133972168, "global_step": 357005, "epoch": 2950} {"train_loss": -45.257869720458984, "global_step": 357006, "epoch": 2950} {"train_loss": -44.8001823425293, "global_step": 357007, "epoch": 2950} {"train_loss": -45.4543571472168, "global_step": 357008, "epoch": 2950} {"train_loss": -44.98746871948242, "global_step": 357009, "epoch": 2950} {"train_loss": -44.44080352783203, "global_step": 357010, "epoch": 2950} {"train_loss": -45.675533294677734, "global_step": 357011, "epoch": 2950} {"train_loss": -45.11405563354492, "global_step": 357012, "epoch": 2950} {"train_loss": -44.651451110839844, "global_step": 357013, "epoch": 2950} {"train_loss": -45.64460372924805, "global_step": 357014, "epoch": 2950} {"train_loss": -43.210811614990234, "global_step": 357015, "epoch": 2950} {"train_loss": -44.85236740112305, "global_step": 357016, "epoch": 2950} {"train_loss": -45.11260986328125, "global_step": 357017, "epoch": 2950} {"train_loss": -43.26197052001953, "global_step": 357018, "epoch": 2950} {"train_loss": -43.919219970703125, "global_step": 357019, "epoch": 2950} {"train_loss": -44.13190841674805, "global_step": 357020, "epoch": 2950} {"train_loss": -44.25266647338867, "global_step": 357021, "epoch": 2950} {"train_loss": -44.666778564453125, "global_step": 357022, "epoch": 2950} {"train_loss": -41.97918701171875, "global_step": 357023, "epoch": 2950} {"train_loss": -40.400142669677734, "global_step": 357024, "epoch": 2950} {"train_loss": -44.77390670776367, "global_step": 357025, "epoch": 2950} {"train_loss": -38.45337677001953, "global_step": 357026, "epoch": 2950} {"train_loss": -40.9816780090332, "global_step": 357027, "epoch": 2950} {"train_loss": -32.841670989990234, "global_step": 357028, "epoch": 2950} {"train_loss": -38.3509635925293, "global_step": 357029, "epoch": 2950} {"train_loss": -41.4078254699707, "global_step": 357030, "epoch": 2950} {"train_loss": -33.02987289428711, "global_step": 357031, "epoch": 2950} {"train_loss": -38.191951751708984, "global_step": 357032, "epoch": 2950} {"train_loss": -38.25958251953125, "global_step": 357033, "epoch": 2950} {"train_loss": -37.42225646972656, "global_step": 357034, "epoch": 2950} {"train_loss": -37.22835922241211, "global_step": 357035, "epoch": 2950} {"train_loss": -40.64860153198242, "global_step": 357036, "epoch": 2950} {"train_loss": -41.10306930541992, "global_step": 357037, "epoch": 2950} {"train_loss": -39.84390640258789, "global_step": 357038, "epoch": 2950} {"train_loss": -41.42058563232422, "global_step": 357039, "epoch": 2950} {"train_loss": -41.7381706237793, "global_step": 357040, "epoch": 2950} {"train_loss": -42.144832611083984, "global_step": 357041, "epoch": 2950} {"train_loss": -42.415992736816406, "global_step": 357042, "epoch": 2950} {"train_loss": -42.09589767456055, "global_step": 357043, "epoch": 2950} {"train_loss": -42.472816467285156, "global_step": 357044, "epoch": 2950} {"train_loss": -42.830745697021484, "global_step": 357045, "epoch": 2950} {"train_loss": -42.51080322265625, "global_step": 357046, "epoch": 2950} {"train_loss": -42.64387130737305, "global_step": 357047, "epoch": 2950} {"train_loss": -43.0506591796875, "global_step": 357048, "epoch": 2950} {"train_loss": -42.753028869628906, "global_step": 357049, "epoch": 2950} {"train_loss": -43.25325393676758, "global_step": 357050, "epoch": 2950} {"train_loss": -43.37579345703125, "global_step": 357051, "epoch": 2950} {"train_loss": -43.37074279785156, "global_step": 357052, "epoch": 2950} {"train_loss": -43.90314865112305, "global_step": 357053, "epoch": 2950} {"train_loss": -43.29607009887695, "global_step": 357054, "epoch": 2950} {"train_loss": -44.47801208496094, "global_step": 357055, "epoch": 2950} {"train_loss": -43.875816345214844, "global_step": 357056, "epoch": 2950} {"train_loss": -43.3797721862793, "global_step": 357057, "epoch": 2950} {"train_loss": -43.9332160949707, "global_step": 357058, "epoch": 2950} {"train_loss": -43.29469680786133, "global_step": 357059, "epoch": 2950} {"train_loss": -43.95731735229492, "global_step": 357060, "epoch": 2950} {"train_loss": -44.228328704833984, "global_step": 357061, "epoch": 2950} {"train_loss": -43.78814697265625, "global_step": 357062, "epoch": 2950} {"train_loss": -43.96737289428711, "global_step": 357063, "epoch": 2950} {"train_loss": -44.030311584472656, "global_step": 357064, "epoch": 2950} {"train_loss": -44.6526985168457, "global_step": 357065, "epoch": 2950} {"train_loss": -44.10808181762695, "global_step": 357066, "epoch": 2950} {"train_loss": -44.20476150512695, "global_step": 357067, "epoch": 2950} {"train_loss": -44.727996826171875, "global_step": 357068, "epoch": 2950} {"train_loss": -44.03535842895508, "global_step": 357069, "epoch": 2950} {"train_loss": -43.43858759856421, "global_step": 357070, "epoch": 2950, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 1.0, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4400000": 1.0, "test/sim_max_reward_4400001": 1.0, "test/sim_max_reward_4400002": 1.0, "test/sim_max_reward_4400003": 0.0, "test/sim_max_reward_4400004": 1.0, "test/sim_max_reward_4400005": 1.0, "test/sim_max_reward_4400006": 1.0, "test/sim_max_reward_4400007": 1.0, "test/sim_max_reward_4400008": 1.0, "test/sim_max_reward_4400009": 1.0, "test/sim_max_reward_4400010": 1.0, "test/sim_max_reward_4400011": 1.0, "test/sim_max_reward_4400012": 1.0, "test/sim_max_reward_4400013": 1.0, "test/sim_max_reward_4400014": 1.0, "test/sim_max_reward_4400015": 1.0, "test/sim_max_reward_4400016": 1.0, "test/sim_max_reward_4400017": 1.0, "test/sim_max_reward_4400018": 1.0, "test/sim_max_reward_4400019": 1.0, "test/sim_max_reward_4400020": 1.0, "test/sim_max_reward_4400021": 1.0, "train/mean_score": 1.0, "test/mean_score": 0.9545454545454546, "val_loss": 2529907.25} {"train_loss": -44.45075607299805, "global_step": 357071, "epoch": 2951} {"train_loss": -44.706783294677734, "global_step": 357072, "epoch": 2951} {"train_loss": -44.4698371887207, "global_step": 357073, "epoch": 2951} {"train_loss": -45.07216262817383, "global_step": 357074, "epoch": 2951} {"train_loss": -44.37808609008789, "global_step": 357075, "epoch": 2951} {"train_loss": -44.60744094848633, "global_step": 357076, "epoch": 2951} {"train_loss": -44.97517013549805, "global_step": 357077, "epoch": 2951} {"train_loss": -45.09931564331055, "global_step": 357078, "epoch": 2951} {"train_loss": -44.588619232177734, "global_step": 357079, "epoch": 2951} {"train_loss": -45.01841354370117, "global_step": 357080, "epoch": 2951} {"train_loss": -45.00234603881836, "global_step": 357081, "epoch": 2951} {"train_loss": -45.59136962890625, "global_step": 357082, "epoch": 2951} {"train_loss": -44.74908447265625, "global_step": 357083, "epoch": 2951} {"train_loss": -44.80214309692383, "global_step": 357084, "epoch": 2951} {"train_loss": -45.11668014526367, "global_step": 357085, "epoch": 2951} {"train_loss": -44.58175277709961, "global_step": 357086, "epoch": 2951} {"train_loss": -44.42946243286133, "global_step": 357087, "epoch": 2951} {"train_loss": -45.38103103637695, "global_step": 357088, "epoch": 2951} {"train_loss": -44.27893829345703, "global_step": 357089, "epoch": 2951} {"train_loss": -44.05047607421875, "global_step": 357090, "epoch": 2951} {"train_loss": -42.96039962768555, "global_step": 357091, "epoch": 2951} {"train_loss": -44.767311096191406, "global_step": 357092, "epoch": 2951} {"train_loss": -44.12063980102539, "global_step": 357093, "epoch": 2951} {"train_loss": -42.7064208984375, "global_step": 357094, "epoch": 2951} {"train_loss": -41.597145080566406, "global_step": 357095, "epoch": 2951} {"train_loss": -43.02463912963867, "global_step": 357096, "epoch": 2951} {"train_loss": -44.494537353515625, "global_step": 357097, "epoch": 2951} {"train_loss": -44.11731719970703, "global_step": 357098, "epoch": 2951} {"train_loss": -43.84847640991211, "global_step": 357099, "epoch": 2951} {"train_loss": -44.36853790283203, "global_step": 357100, "epoch": 2951} {"train_loss": -44.93568801879883, "global_step": 357101, "epoch": 2951} {"train_loss": -44.236148834228516, "global_step": 357102, "epoch": 2951} {"train_loss": -43.97477340698242, "global_step": 357103, "epoch": 2951} {"train_loss": -44.29232406616211, "global_step": 357104, "epoch": 2951} {"train_loss": -44.02962875366211, "global_step": 357105, "epoch": 2951} {"train_loss": -43.67132568359375, "global_step": 357106, "epoch": 2951} {"train_loss": -44.52256393432617, "global_step": 357107, "epoch": 2951} {"train_loss": -44.196895599365234, "global_step": 357108, "epoch": 2951} {"train_loss": -45.23816680908203, "global_step": 357109, "epoch": 2951} {"train_loss": -44.571197509765625, "global_step": 357110, "epoch": 2951} {"train_loss": -44.243770599365234, "global_step": 357111, "epoch": 2951} {"train_loss": -44.07505416870117, "global_step": 357112, "epoch": 2951} {"train_loss": -44.47133255004883, "global_step": 357113, "epoch": 2951} {"train_loss": -44.74264144897461, "global_step": 357114, "epoch": 2951} {"train_loss": -44.88578414916992, "global_step": 357115, "epoch": 2951} {"train_loss": -44.40299606323242, "global_step": 357116, "epoch": 2951} {"train_loss": -44.58601760864258, "global_step": 357117, "epoch": 2951} {"train_loss": -45.043128967285156, "global_step": 357118, "epoch": 2951} {"train_loss": -45.34513473510742, "global_step": 357119, "epoch": 2951} {"train_loss": -44.81268310546875, "global_step": 357120, "epoch": 2951} {"train_loss": -45.21657180786133, "global_step": 357121, "epoch": 2951} {"train_loss": -44.86115264892578, "global_step": 357122, "epoch": 2951} {"train_loss": -44.83466720581055, "global_step": 357123, "epoch": 2951} {"train_loss": -44.59878158569336, "global_step": 357124, "epoch": 2951} {"train_loss": -44.164642333984375, "global_step": 357125, "epoch": 2951} {"train_loss": -44.76789855957031, "global_step": 357126, "epoch": 2951} {"train_loss": -45.292049407958984, "global_step": 357127, "epoch": 2951} {"train_loss": -44.155364990234375, "global_step": 357128, "epoch": 2951} {"train_loss": -45.10580062866211, "global_step": 357129, "epoch": 2951} {"train_loss": -45.17112350463867, "global_step": 357130, "epoch": 2951} {"train_loss": -44.46303939819336, "global_step": 357131, "epoch": 2951} {"train_loss": -45.059688568115234, "global_step": 357132, "epoch": 2951} {"train_loss": -45.14453125, "global_step": 357133, "epoch": 2951} {"train_loss": -45.25931167602539, "global_step": 357134, "epoch": 2951} {"train_loss": -45.65242385864258, "global_step": 357135, "epoch": 2951} {"train_loss": -45.597808837890625, "global_step": 357136, "epoch": 2951} {"train_loss": -45.642784118652344, "global_step": 357137, "epoch": 2951} {"train_loss": -45.990726470947266, "global_step": 357138, "epoch": 2951} {"train_loss": -45.77852249145508, "global_step": 357139, "epoch": 2951} {"train_loss": -45.2617073059082, "global_step": 357140, "epoch": 2951} {"train_loss": -45.467098236083984, "global_step": 357141, "epoch": 2951} {"train_loss": -45.34422302246094, "global_step": 357142, "epoch": 2951} {"train_loss": -45.49540328979492, "global_step": 357143, "epoch": 2951} {"train_loss": -45.29195022583008, "global_step": 357144, "epoch": 2951} {"train_loss": -45.678688049316406, "global_step": 357145, "epoch": 2951} {"train_loss": -45.430419921875, "global_step": 357146, "epoch": 2951} {"train_loss": -45.33381271362305, "global_step": 357147, "epoch": 2951} {"train_loss": -45.3331413269043, "global_step": 357148, "epoch": 2951} {"train_loss": -45.19057846069336, "global_step": 357149, "epoch": 2951} {"train_loss": -45.07875061035156, "global_step": 357150, "epoch": 2951} {"train_loss": -45.99239730834961, "global_step": 357151, "epoch": 2951} {"train_loss": -45.407508850097656, "global_step": 357152, "epoch": 2951} {"train_loss": -45.18949508666992, "global_step": 357153, "epoch": 2951} {"train_loss": -45.60780715942383, "global_step": 357154, "epoch": 2951} {"train_loss": -45.49207305908203, "global_step": 357155, "epoch": 2951} {"train_loss": -45.3822135925293, "global_step": 357156, "epoch": 2951} {"train_loss": -45.450191497802734, "global_step": 357157, "epoch": 2951} {"train_loss": -45.94077682495117, "global_step": 357158, "epoch": 2951} {"train_loss": -45.74031448364258, "global_step": 357159, "epoch": 2951} {"train_loss": -45.89229965209961, "global_step": 357160, "epoch": 2951} {"train_loss": -45.45186233520508, "global_step": 357161, "epoch": 2951} {"train_loss": -44.59812545776367, "global_step": 357162, "epoch": 2951} {"train_loss": -43.87635803222656, "global_step": 357163, "epoch": 2951} {"train_loss": -40.24647521972656, "global_step": 357164, "epoch": 2951} {"train_loss": -42.463539123535156, "global_step": 357165, "epoch": 2951} {"train_loss": -37.04934310913086, "global_step": 357166, "epoch": 2951} {"train_loss": -40.37887954711914, "global_step": 357167, "epoch": 2951} {"train_loss": -41.3073616027832, "global_step": 357168, "epoch": 2951} {"train_loss": -40.475990295410156, "global_step": 357169, "epoch": 2951} {"train_loss": -41.264930725097656, "global_step": 357170, "epoch": 2951} {"train_loss": -41.24729537963867, "global_step": 357171, "epoch": 2951} {"train_loss": -41.56157302856445, "global_step": 357172, "epoch": 2951} {"train_loss": -40.007625579833984, "global_step": 357173, "epoch": 2951} {"train_loss": -41.29463577270508, "global_step": 357174, "epoch": 2951} {"train_loss": -42.30035400390625, "global_step": 357175, "epoch": 2951} {"train_loss": -42.25141906738281, "global_step": 357176, "epoch": 2951} {"train_loss": -41.869232177734375, "global_step": 357177, "epoch": 2951} {"train_loss": -40.87380599975586, "global_step": 357178, "epoch": 2951} {"train_loss": -42.16725540161133, "global_step": 357179, "epoch": 2951} {"train_loss": -42.43711853027344, "global_step": 357180, "epoch": 2951} {"train_loss": -41.01641082763672, "global_step": 357181, "epoch": 2951} {"train_loss": -42.48200607299805, "global_step": 357182, "epoch": 2951} {"train_loss": -41.308563232421875, "global_step": 357183, "epoch": 2951} {"train_loss": -43.10468673706055, "global_step": 357184, "epoch": 2951} {"train_loss": -43.66377639770508, "global_step": 357185, "epoch": 2951} {"train_loss": -41.41450881958008, "global_step": 357186, "epoch": 2951} {"train_loss": -42.19437026977539, "global_step": 357187, "epoch": 2951} {"train_loss": -42.51708221435547, "global_step": 357188, "epoch": 2951} {"train_loss": -42.70709991455078, "global_step": 357189, "epoch": 2951} {"train_loss": -42.86892318725586, "global_step": 357190, "epoch": 2951} {"train_loss": -44.06688305563178, "global_step": 357191, "epoch": 2951, "val_loss": 2450889.0} {"train_loss": -44.050697326660156, "global_step": 357192, "epoch": 2952} {"train_loss": -43.17856979370117, "global_step": 357193, "epoch": 2952} {"train_loss": -43.86531448364258, "global_step": 357194, "epoch": 2952} {"train_loss": -42.81637191772461, "global_step": 357195, "epoch": 2952} {"train_loss": -43.68152618408203, "global_step": 357196, "epoch": 2952} {"train_loss": -44.0318603515625, "global_step": 357197, "epoch": 2952} {"train_loss": -44.08352279663086, "global_step": 357198, "epoch": 2952} {"train_loss": -44.22962951660156, "global_step": 357199, "epoch": 2952} {"train_loss": -43.07451248168945, "global_step": 357200, "epoch": 2952} {"train_loss": -44.01325225830078, "global_step": 357201, "epoch": 2952} {"train_loss": -44.039764404296875, "global_step": 357202, "epoch": 2952} {"train_loss": -44.43076705932617, "global_step": 357203, "epoch": 2952} {"train_loss": -44.52204132080078, "global_step": 357204, "epoch": 2952} {"train_loss": -44.8765869140625, "global_step": 357205, "epoch": 2952} {"train_loss": -44.42034912109375, "global_step": 357206, "epoch": 2952} {"train_loss": -44.518672943115234, "global_step": 357207, "epoch": 2952} {"train_loss": -44.834957122802734, "global_step": 357208, "epoch": 2952} {"train_loss": -44.47493362426758, "global_step": 357209, "epoch": 2952} {"train_loss": -45.10064697265625, "global_step": 357210, "epoch": 2952} {"train_loss": -44.366127014160156, "global_step": 357211, "epoch": 2952} {"train_loss": -44.76578903198242, "global_step": 357212, "epoch": 2952} {"train_loss": -44.827266693115234, "global_step": 357213, "epoch": 2952} {"train_loss": -44.522613525390625, "global_step": 357214, "epoch": 2952} {"train_loss": -45.05404281616211, "global_step": 357215, "epoch": 2952} {"train_loss": -45.322147369384766, "global_step": 357216, "epoch": 2952} {"train_loss": -44.788326263427734, "global_step": 357217, "epoch": 2952} {"train_loss": -45.0612907409668, "global_step": 357218, "epoch": 2952} {"train_loss": -45.002174377441406, "global_step": 357219, "epoch": 2952} {"train_loss": -45.18479919433594, "global_step": 357220, "epoch": 2952} {"train_loss": -45.17851638793945, "global_step": 357221, "epoch": 2952} {"train_loss": -45.414833068847656, "global_step": 357222, "epoch": 2952} {"train_loss": -45.59355163574219, "global_step": 357223, "epoch": 2952} {"train_loss": -45.77505111694336, "global_step": 357224, "epoch": 2952} {"train_loss": -45.282161712646484, "global_step": 357225, "epoch": 2952} {"train_loss": -44.948829650878906, "global_step": 357226, "epoch": 2952} {"train_loss": -45.437286376953125, "global_step": 357227, "epoch": 2952} {"train_loss": -45.42010498046875, "global_step": 357228, "epoch": 2952} {"train_loss": -45.64675521850586, "global_step": 357229, "epoch": 2952} {"train_loss": -45.170230865478516, "global_step": 357230, "epoch": 2952} {"train_loss": -45.17938995361328, "global_step": 357231, "epoch": 2952} {"train_loss": -45.78317642211914, "global_step": 357232, "epoch": 2952} {"train_loss": -45.00568389892578, "global_step": 357233, "epoch": 2952} {"train_loss": -45.74712371826172, "global_step": 357234, "epoch": 2952} {"train_loss": -45.22229766845703, "global_step": 357235, "epoch": 2952} {"train_loss": -45.11333084106445, "global_step": 357236, "epoch": 2952} {"train_loss": -45.38318634033203, "global_step": 357237, "epoch": 2952} {"train_loss": -45.41504669189453, "global_step": 357238, "epoch": 2952} {"train_loss": -45.58323287963867, "global_step": 357239, "epoch": 2952} {"train_loss": -45.62526321411133, "global_step": 357240, "epoch": 2952} {"train_loss": -45.50054168701172, "global_step": 357241, "epoch": 2952} {"train_loss": -45.47523880004883, "global_step": 357242, "epoch": 2952} {"train_loss": -45.77500534057617, "global_step": 357243, "epoch": 2952} {"train_loss": -44.743370056152344, "global_step": 357244, "epoch": 2952} {"train_loss": -45.293601989746094, "global_step": 357245, "epoch": 2952} {"train_loss": -45.16181564331055, "global_step": 357246, "epoch": 2952} {"train_loss": -46.0103645324707, "global_step": 357247, "epoch": 2952} {"train_loss": -45.089962005615234, "global_step": 357248, "epoch": 2952} {"train_loss": -44.910499572753906, "global_step": 357249, "epoch": 2952} {"train_loss": -45.27117919921875, "global_step": 357250, "epoch": 2952} {"train_loss": -45.490394592285156, "global_step": 357251, "epoch": 2952} {"train_loss": -45.63222885131836, "global_step": 357252, "epoch": 2952} {"train_loss": -45.50995635986328, "global_step": 357253, "epoch": 2952} {"train_loss": -44.65517807006836, "global_step": 357254, "epoch": 2952} {"train_loss": -43.93185043334961, "global_step": 357255, "epoch": 2952} {"train_loss": -45.19677734375, "global_step": 357256, "epoch": 2952} {"train_loss": -45.15403366088867, "global_step": 357257, "epoch": 2952} {"train_loss": -45.23136520385742, "global_step": 357258, "epoch": 2952} {"train_loss": -43.86077880859375, "global_step": 357259, "epoch": 2952} {"train_loss": -42.94783401489258, "global_step": 357260, "epoch": 2952} {"train_loss": -44.63212585449219, "global_step": 357261, "epoch": 2952} {"train_loss": -45.385284423828125, "global_step": 357262, "epoch": 2952} {"train_loss": -44.09934616088867, "global_step": 357263, "epoch": 2952} {"train_loss": -42.42058181762695, "global_step": 357264, "epoch": 2952} {"train_loss": -43.37520980834961, "global_step": 357265, "epoch": 2952} {"train_loss": -43.34674835205078, "global_step": 357266, "epoch": 2952} {"train_loss": -45.293235778808594, "global_step": 357267, "epoch": 2952} {"train_loss": -45.102352142333984, "global_step": 357268, "epoch": 2952} {"train_loss": -43.995479583740234, "global_step": 357269, "epoch": 2952} {"train_loss": -43.086769104003906, "global_step": 357270, "epoch": 2952} {"train_loss": -43.77210235595703, "global_step": 357271, "epoch": 2952} {"train_loss": -44.1943359375, "global_step": 357272, "epoch": 2952} {"train_loss": -44.1058349609375, "global_step": 357273, "epoch": 2952} {"train_loss": -44.704261779785156, "global_step": 357274, "epoch": 2952} {"train_loss": -44.82878875732422, "global_step": 357275, "epoch": 2952} {"train_loss": -43.96751022338867, "global_step": 357276, "epoch": 2952} {"train_loss": -45.370216369628906, "global_step": 357277, "epoch": 2952} {"train_loss": -43.90292739868164, "global_step": 357278, "epoch": 2952} {"train_loss": -43.91070556640625, "global_step": 357279, "epoch": 2952} {"train_loss": -45.430721282958984, "global_step": 357280, "epoch": 2952} {"train_loss": -45.113609313964844, "global_step": 357281, "epoch": 2952} {"train_loss": -44.55377197265625, "global_step": 357282, "epoch": 2952} {"train_loss": -44.53218460083008, "global_step": 357283, "epoch": 2952} {"train_loss": -44.476070404052734, "global_step": 357284, "epoch": 2952} {"train_loss": -44.72352600097656, "global_step": 357285, "epoch": 2952} {"train_loss": -43.533573150634766, "global_step": 357286, "epoch": 2952} {"train_loss": -41.799171447753906, "global_step": 357287, "epoch": 2952} {"train_loss": -45.2186279296875, "global_step": 357288, "epoch": 2952} {"train_loss": -44.53813552856445, "global_step": 357289, "epoch": 2952} {"train_loss": -43.37135696411133, "global_step": 357290, "epoch": 2952} {"train_loss": -44.201717376708984, "global_step": 357291, "epoch": 2952} {"train_loss": -44.49871826171875, "global_step": 357292, "epoch": 2952} {"train_loss": -44.08744430541992, "global_step": 357293, "epoch": 2952} {"train_loss": -44.54372024536133, "global_step": 357294, "epoch": 2952} {"train_loss": -44.65366744995117, "global_step": 357295, "epoch": 2952} {"train_loss": -45.1449089050293, "global_step": 357296, "epoch": 2952} {"train_loss": -45.38155746459961, "global_step": 357297, "epoch": 2952} {"train_loss": -44.8923454284668, "global_step": 357298, "epoch": 2952} {"train_loss": -45.540199279785156, "global_step": 357299, "epoch": 2952} {"train_loss": -44.17155075073242, "global_step": 357300, "epoch": 2952} {"train_loss": -44.93967819213867, "global_step": 357301, "epoch": 2952} {"train_loss": -45.01681137084961, "global_step": 357302, "epoch": 2952} {"train_loss": -45.35940933227539, "global_step": 357303, "epoch": 2952} {"train_loss": -45.01910400390625, "global_step": 357304, "epoch": 2952} {"train_loss": -45.04926300048828, "global_step": 357305, "epoch": 2952} {"train_loss": -42.233436584472656, "global_step": 357306, "epoch": 2952} {"train_loss": -45.59614181518555, "global_step": 357307, "epoch": 2952} {"train_loss": -44.97086715698242, "global_step": 357308, "epoch": 2952} {"train_loss": -45.262203216552734, "global_step": 357309, "epoch": 2952} {"train_loss": -45.12470626831055, "global_step": 357310, "epoch": 2952} {"train_loss": -44.79883575439453, "global_step": 357311, "epoch": 2952} {"train_loss": -44.695055402014866, "global_step": 357312, "epoch": 2952, "val_loss": 2559850.75} {"train_loss": -44.044158935546875, "global_step": 357313, "epoch": 2953} {"train_loss": -44.77132034301758, "global_step": 357314, "epoch": 2953} {"train_loss": -45.451087951660156, "global_step": 357315, "epoch": 2953} {"train_loss": -45.56240463256836, "global_step": 357316, "epoch": 2953} {"train_loss": -44.79668045043945, "global_step": 357317, "epoch": 2953} {"train_loss": -43.25794219970703, "global_step": 357318, "epoch": 2953} {"train_loss": -45.40730667114258, "global_step": 357319, "epoch": 2953} {"train_loss": -43.60332489013672, "global_step": 357320, "epoch": 2953} {"train_loss": -43.48377990722656, "global_step": 357321, "epoch": 2953} {"train_loss": -44.84649658203125, "global_step": 357322, "epoch": 2953} {"train_loss": -45.626529693603516, "global_step": 357323, "epoch": 2953} {"train_loss": -43.97580337524414, "global_step": 357324, "epoch": 2953} {"train_loss": -44.897735595703125, "global_step": 357325, "epoch": 2953} {"train_loss": -45.3853645324707, "global_step": 357326, "epoch": 2953} {"train_loss": -44.59273147583008, "global_step": 357327, "epoch": 2953} {"train_loss": -45.44144821166992, "global_step": 357328, "epoch": 2953} {"train_loss": -45.17655563354492, "global_step": 357329, "epoch": 2953} {"train_loss": -43.80180740356445, "global_step": 357330, "epoch": 2953} {"train_loss": -44.49789047241211, "global_step": 357331, "epoch": 2953} {"train_loss": -45.2598991394043, "global_step": 357332, "epoch": 2953} {"train_loss": -26.337751388549805, "global_step": 357333, "epoch": 2953} {"train_loss": -42.41355514526367, "global_step": 357334, "epoch": 2953} {"train_loss": -43.582576751708984, "global_step": 357335, "epoch": 2953} {"train_loss": -42.448543548583984, "global_step": 357336, "epoch": 2953} {"train_loss": -42.45696258544922, "global_step": 357337, "epoch": 2953} {"train_loss": -41.677146911621094, "global_step": 357338, "epoch": 2953} {"train_loss": -42.43342590332031, "global_step": 357339, "epoch": 2953} {"train_loss": -41.209716796875, "global_step": 357340, "epoch": 2953} {"train_loss": -41.92530059814453, "global_step": 357341, "epoch": 2953} {"train_loss": -42.03969192504883, "global_step": 357342, "epoch": 2953} {"train_loss": -43.68208694458008, "global_step": 357343, "epoch": 2953} {"train_loss": -43.814903259277344, "global_step": 357344, "epoch": 2953} {"train_loss": -43.039852142333984, "global_step": 357345, "epoch": 2953} {"train_loss": -41.81919479370117, "global_step": 357346, "epoch": 2953} {"train_loss": -42.200439453125, "global_step": 357347, "epoch": 2953} {"train_loss": -41.64847946166992, "global_step": 357348, "epoch": 2953} {"train_loss": -40.66943359375, "global_step": 357349, "epoch": 2953} {"train_loss": -43.66056823730469, "global_step": 357350, "epoch": 2953} {"train_loss": -43.214515686035156, "global_step": 357351, "epoch": 2953} {"train_loss": -41.1873664855957, "global_step": 357352, "epoch": 2953} {"train_loss": -42.271575927734375, "global_step": 357353, "epoch": 2953} {"train_loss": -40.26363754272461, "global_step": 357354, "epoch": 2953} {"train_loss": -41.0439338684082, "global_step": 357355, "epoch": 2953} {"train_loss": -43.0692138671875, "global_step": 357356, "epoch": 2953} {"train_loss": -40.6743049621582, "global_step": 357357, "epoch": 2953} {"train_loss": -41.777000427246094, "global_step": 357358, "epoch": 2953} {"train_loss": -39.67621994018555, "global_step": 357359, "epoch": 2953} {"train_loss": -43.930763244628906, "global_step": 357360, "epoch": 2953} {"train_loss": -38.549644470214844, "global_step": 357361, "epoch": 2953} {"train_loss": -43.601192474365234, "global_step": 357362, "epoch": 2953} {"train_loss": -39.002960205078125, "global_step": 357363, "epoch": 2953} {"train_loss": -37.676570892333984, "global_step": 357364, "epoch": 2953} {"train_loss": -37.590084075927734, "global_step": 357365, "epoch": 2953} {"train_loss": -39.796878814697266, "global_step": 357366, "epoch": 2953} {"train_loss": -39.74580383300781, "global_step": 357367, "epoch": 2953} {"train_loss": -40.8517951965332, "global_step": 357368, "epoch": 2953} {"train_loss": -41.78948974609375, "global_step": 357369, "epoch": 2953} {"train_loss": -39.32601547241211, "global_step": 357370, "epoch": 2953} {"train_loss": -42.350154876708984, "global_step": 357371, "epoch": 2953} {"train_loss": -40.33643341064453, "global_step": 357372, "epoch": 2953} {"train_loss": -43.092933654785156, "global_step": 357373, "epoch": 2953} {"train_loss": -40.21952438354492, "global_step": 357374, "epoch": 2953} {"train_loss": -42.88751220703125, "global_step": 357375, "epoch": 2953} {"train_loss": -41.89334487915039, "global_step": 357376, "epoch": 2953} {"train_loss": -43.127357482910156, "global_step": 357377, "epoch": 2953} {"train_loss": -41.39468765258789, "global_step": 357378, "epoch": 2953} {"train_loss": -42.731746673583984, "global_step": 357379, "epoch": 2953} {"train_loss": -43.5037956237793, "global_step": 357380, "epoch": 2953} {"train_loss": -43.65336227416992, "global_step": 357381, "epoch": 2953} {"train_loss": -43.60737228393555, "global_step": 357382, "epoch": 2953} {"train_loss": -43.69927978515625, "global_step": 357383, "epoch": 2953} {"train_loss": -43.92803192138672, "global_step": 357384, "epoch": 2953} {"train_loss": -44.01491165161133, "global_step": 357385, "epoch": 2953} {"train_loss": -43.81303024291992, "global_step": 357386, "epoch": 2953} {"train_loss": -43.55929946899414, "global_step": 357387, "epoch": 2953} {"train_loss": -44.52117919921875, "global_step": 357388, "epoch": 2953} {"train_loss": -43.395931243896484, "global_step": 357389, "epoch": 2953} {"train_loss": -44.194881439208984, "global_step": 357390, "epoch": 2953} {"train_loss": -44.079620361328125, "global_step": 357391, "epoch": 2953} {"train_loss": -43.84688949584961, "global_step": 357392, "epoch": 2953} {"train_loss": -43.948326110839844, "global_step": 357393, "epoch": 2953} {"train_loss": -43.65275192260742, "global_step": 357394, "epoch": 2953} {"train_loss": -44.49875259399414, "global_step": 357395, "epoch": 2953} {"train_loss": -44.77492141723633, "global_step": 357396, "epoch": 2953} {"train_loss": -44.60828399658203, "global_step": 357397, "epoch": 2953} {"train_loss": -44.42070770263672, "global_step": 357398, "epoch": 2953} {"train_loss": -43.59739303588867, "global_step": 357399, "epoch": 2953} {"train_loss": -44.36198043823242, "global_step": 357400, "epoch": 2953} {"train_loss": -44.4642448425293, "global_step": 357401, "epoch": 2953} {"train_loss": -44.13861846923828, "global_step": 357402, "epoch": 2953} {"train_loss": -44.25111770629883, "global_step": 357403, "epoch": 2953} {"train_loss": -44.6492805480957, "global_step": 357404, "epoch": 2953} {"train_loss": -44.20954513549805, "global_step": 357405, "epoch": 2953} {"train_loss": -43.767024993896484, "global_step": 357406, "epoch": 2953} {"train_loss": -44.74809646606445, "global_step": 357407, "epoch": 2953} {"train_loss": -44.86283874511719, "global_step": 357408, "epoch": 2953} {"train_loss": -44.54045486450195, "global_step": 357409, "epoch": 2953} {"train_loss": -44.8924674987793, "global_step": 357410, "epoch": 2953} {"train_loss": -44.85333251953125, "global_step": 357411, "epoch": 2953} {"train_loss": -44.9192008972168, "global_step": 357412, "epoch": 2953} {"train_loss": -44.59474182128906, "global_step": 357413, "epoch": 2953} {"train_loss": -45.05235290527344, "global_step": 357414, "epoch": 2953} {"train_loss": -45.21134567260742, "global_step": 357415, "epoch": 2953} {"train_loss": -44.36152267456055, "global_step": 357416, "epoch": 2953} {"train_loss": -45.13421630859375, "global_step": 357417, "epoch": 2953} {"train_loss": -44.34790802001953, "global_step": 357418, "epoch": 2953} {"train_loss": -44.928688049316406, "global_step": 357419, "epoch": 2953} {"train_loss": -43.2408447265625, "global_step": 357420, "epoch": 2953} {"train_loss": -45.11922073364258, "global_step": 357421, "epoch": 2953} {"train_loss": -44.34571075439453, "global_step": 357422, "epoch": 2953} {"train_loss": -43.98086166381836, "global_step": 357423, "epoch": 2953} {"train_loss": -44.54372787475586, "global_step": 357424, "epoch": 2953} {"train_loss": -42.96283721923828, "global_step": 357425, "epoch": 2953} {"train_loss": -41.11747360229492, "global_step": 357426, "epoch": 2953} {"train_loss": -44.015953063964844, "global_step": 357427, "epoch": 2953} {"train_loss": -43.8460807800293, "global_step": 357428, "epoch": 2953} {"train_loss": -43.0501823425293, "global_step": 357429, "epoch": 2953} {"train_loss": -42.87807083129883, "global_step": 357430, "epoch": 2953} {"train_loss": -41.960975646972656, "global_step": 357431, "epoch": 2953} {"train_loss": -43.89238739013672, "global_step": 357432, "epoch": 2953} {"train_loss": -43.08289222086756, "global_step": 357433, "epoch": 2953, "val_loss": 2375380.75} {"train_loss": -43.684085845947266, "global_step": 357434, "epoch": 2954} {"train_loss": -41.65696334838867, "global_step": 357435, "epoch": 2954} {"train_loss": -43.88509750366211, "global_step": 357436, "epoch": 2954} {"train_loss": -41.93000030517578, "global_step": 357437, "epoch": 2954} {"train_loss": -44.26158905029297, "global_step": 357438, "epoch": 2954} {"train_loss": -41.127864837646484, "global_step": 357439, "epoch": 2954} {"train_loss": -43.4093132019043, "global_step": 357440, "epoch": 2954} {"train_loss": -41.19684982299805, "global_step": 357441, "epoch": 2954} {"train_loss": -44.686527252197266, "global_step": 357442, "epoch": 2954} {"train_loss": -41.05542755126953, "global_step": 357443, "epoch": 2954} {"train_loss": -44.43647003173828, "global_step": 357444, "epoch": 2954} {"train_loss": -40.39147186279297, "global_step": 357445, "epoch": 2954} {"train_loss": -44.73431396484375, "global_step": 357446, "epoch": 2954} {"train_loss": -41.185237884521484, "global_step": 357447, "epoch": 2954} {"train_loss": -44.452972412109375, "global_step": 357448, "epoch": 2954} {"train_loss": -42.105655670166016, "global_step": 357449, "epoch": 2954} {"train_loss": -43.721832275390625, "global_step": 357450, "epoch": 2954} {"train_loss": -42.654781341552734, "global_step": 357451, "epoch": 2954} {"train_loss": -43.79352951049805, "global_step": 357452, "epoch": 2954} {"train_loss": -43.10870361328125, "global_step": 357453, "epoch": 2954} {"train_loss": -44.105594635009766, "global_step": 357454, "epoch": 2954} {"train_loss": -43.79193115234375, "global_step": 357455, "epoch": 2954} {"train_loss": -43.881378173828125, "global_step": 357456, "epoch": 2954} {"train_loss": -44.0338134765625, "global_step": 357457, "epoch": 2954} {"train_loss": -44.229427337646484, "global_step": 357458, "epoch": 2954} {"train_loss": -44.33318328857422, "global_step": 357459, "epoch": 2954} {"train_loss": -43.33612060546875, "global_step": 357460, "epoch": 2954} {"train_loss": -44.69009780883789, "global_step": 357461, "epoch": 2954} {"train_loss": -44.276485443115234, "global_step": 357462, "epoch": 2954} {"train_loss": -44.28476333618164, "global_step": 357463, "epoch": 2954} {"train_loss": -44.35181427001953, "global_step": 357464, "epoch": 2954} {"train_loss": -44.87303161621094, "global_step": 357465, "epoch": 2954} {"train_loss": -44.115570068359375, "global_step": 357466, "epoch": 2954} {"train_loss": -45.17647933959961, "global_step": 357467, "epoch": 2954} {"train_loss": -44.05873489379883, "global_step": 357468, "epoch": 2954} {"train_loss": -45.12112045288086, "global_step": 357469, "epoch": 2954} {"train_loss": -43.99637985229492, "global_step": 357470, "epoch": 2954} {"train_loss": -45.1519660949707, "global_step": 357471, "epoch": 2954} {"train_loss": -44.99692916870117, "global_step": 357472, "epoch": 2954} {"train_loss": -45.039161682128906, "global_step": 357473, "epoch": 2954} {"train_loss": -45.28163528442383, "global_step": 357474, "epoch": 2954} {"train_loss": -44.860511779785156, "global_step": 357475, "epoch": 2954} {"train_loss": -45.1429328918457, "global_step": 357476, "epoch": 2954} {"train_loss": -45.061641693115234, "global_step": 357477, "epoch": 2954} {"train_loss": -45.1187629699707, "global_step": 357478, "epoch": 2954} {"train_loss": -45.22834777832031, "global_step": 357479, "epoch": 2954} {"train_loss": -44.725215911865234, "global_step": 357480, "epoch": 2954} {"train_loss": -45.004852294921875, "global_step": 357481, "epoch": 2954} {"train_loss": -45.4679069519043, "global_step": 357482, "epoch": 2954} {"train_loss": -44.54058837890625, "global_step": 357483, "epoch": 2954} {"train_loss": -45.26551055908203, "global_step": 357484, "epoch": 2954} {"train_loss": -44.85987091064453, "global_step": 357485, "epoch": 2954} {"train_loss": -45.25416946411133, "global_step": 357486, "epoch": 2954} {"train_loss": -45.558834075927734, "global_step": 357487, "epoch": 2954} {"train_loss": -44.593929290771484, "global_step": 357488, "epoch": 2954} {"train_loss": -44.99801254272461, "global_step": 357489, "epoch": 2954} {"train_loss": -45.255104064941406, "global_step": 357490, "epoch": 2954} {"train_loss": -44.78546905517578, "global_step": 357491, "epoch": 2954} {"train_loss": -45.09903335571289, "global_step": 357492, "epoch": 2954} {"train_loss": -45.275413513183594, "global_step": 357493, "epoch": 2954} {"train_loss": -44.65321350097656, "global_step": 357494, "epoch": 2954} {"train_loss": -45.10182571411133, "global_step": 357495, "epoch": 2954} {"train_loss": -45.50371551513672, "global_step": 357496, "epoch": 2954} {"train_loss": -45.681114196777344, "global_step": 357497, "epoch": 2954} {"train_loss": -44.807960510253906, "global_step": 357498, "epoch": 2954} {"train_loss": -45.67730712890625, "global_step": 357499, "epoch": 2954} {"train_loss": -45.0184440612793, "global_step": 357500, "epoch": 2954} {"train_loss": -44.60595703125, "global_step": 357501, "epoch": 2954} {"train_loss": -44.083011627197266, "global_step": 357502, "epoch": 2954} {"train_loss": -44.425716400146484, "global_step": 357503, "epoch": 2954} {"train_loss": -44.79357147216797, "global_step": 357504, "epoch": 2954} {"train_loss": -45.21455001831055, "global_step": 357505, "epoch": 2954} {"train_loss": -44.86591720581055, "global_step": 357506, "epoch": 2954} {"train_loss": -44.699623107910156, "global_step": 357507, "epoch": 2954} {"train_loss": -44.96340560913086, "global_step": 357508, "epoch": 2954} {"train_loss": -45.95076370239258, "global_step": 357509, "epoch": 2954} {"train_loss": -45.519344329833984, "global_step": 357510, "epoch": 2954} {"train_loss": -45.649574279785156, "global_step": 357511, "epoch": 2954} {"train_loss": -44.702003479003906, "global_step": 357512, "epoch": 2954} {"train_loss": -44.8863639831543, "global_step": 357513, "epoch": 2954} {"train_loss": -45.02043151855469, "global_step": 357514, "epoch": 2954} {"train_loss": -45.31382369995117, "global_step": 357515, "epoch": 2954} {"train_loss": -44.97901153564453, "global_step": 357516, "epoch": 2954} {"train_loss": -45.8639030456543, "global_step": 357517, "epoch": 2954} {"train_loss": -45.063533782958984, "global_step": 357518, "epoch": 2954} {"train_loss": -45.22887420654297, "global_step": 357519, "epoch": 2954} {"train_loss": -45.243072509765625, "global_step": 357520, "epoch": 2954} {"train_loss": -45.90335464477539, "global_step": 357521, "epoch": 2954} {"train_loss": -45.204063415527344, "global_step": 357522, "epoch": 2954} {"train_loss": -45.63435363769531, "global_step": 357523, "epoch": 2954} {"train_loss": -45.53887939453125, "global_step": 357524, "epoch": 2954} {"train_loss": -44.89736557006836, "global_step": 357525, "epoch": 2954} {"train_loss": -44.15678787231445, "global_step": 357526, "epoch": 2954} {"train_loss": -45.254669189453125, "global_step": 357527, "epoch": 2954} {"train_loss": -45.413265228271484, "global_step": 357528, "epoch": 2954} {"train_loss": -45.4336051940918, "global_step": 357529, "epoch": 2954} {"train_loss": -45.248634338378906, "global_step": 357530, "epoch": 2954} {"train_loss": -45.56570053100586, "global_step": 357531, "epoch": 2954} {"train_loss": -45.47701644897461, "global_step": 357532, "epoch": 2954} {"train_loss": -44.9318733215332, "global_step": 357533, "epoch": 2954} {"train_loss": -45.33140563964844, "global_step": 357534, "epoch": 2954} {"train_loss": -45.76185989379883, "global_step": 357535, "epoch": 2954} {"train_loss": -45.84709167480469, "global_step": 357536, "epoch": 2954} {"train_loss": -45.60707473754883, "global_step": 357537, "epoch": 2954} {"train_loss": -45.51420974731445, "global_step": 357538, "epoch": 2954} {"train_loss": -45.68547439575195, "global_step": 357539, "epoch": 2954} {"train_loss": -45.71894454956055, "global_step": 357540, "epoch": 2954} {"train_loss": -45.09603500366211, "global_step": 357541, "epoch": 2954} {"train_loss": -44.39530944824219, "global_step": 357542, "epoch": 2954} {"train_loss": -45.48824691772461, "global_step": 357543, "epoch": 2954} {"train_loss": -45.73484802246094, "global_step": 357544, "epoch": 2954} {"train_loss": -45.01072692871094, "global_step": 357545, "epoch": 2954} {"train_loss": -44.71079635620117, "global_step": 357546, "epoch": 2954} {"train_loss": -45.589500427246094, "global_step": 357547, "epoch": 2954} {"train_loss": -45.97364044189453, "global_step": 357548, "epoch": 2954} {"train_loss": -45.20263671875, "global_step": 357549, "epoch": 2954} {"train_loss": -44.52323913574219, "global_step": 357550, "epoch": 2954} {"train_loss": -44.59457015991211, "global_step": 357551, "epoch": 2954} {"train_loss": -45.7192268371582, "global_step": 357552, "epoch": 2954} {"train_loss": -44.79836654663086, "global_step": 357553, "epoch": 2954} {"train_loss": -44.664814815048345, "global_step": 357554, "epoch": 2954, "val_loss": 2485846.0} {"train_loss": -44.98910140991211, "global_step": 357555, "epoch": 2955} {"train_loss": -44.60551071166992, "global_step": 357556, "epoch": 2955} {"train_loss": -44.752437591552734, "global_step": 357557, "epoch": 2955} {"train_loss": -44.4211540222168, "global_step": 357558, "epoch": 2955} {"train_loss": -43.841461181640625, "global_step": 357559, "epoch": 2955} {"train_loss": -43.204402923583984, "global_step": 357560, "epoch": 2955} {"train_loss": -44.57707977294922, "global_step": 357561, "epoch": 2955} {"train_loss": -45.08448028564453, "global_step": 357562, "epoch": 2955} {"train_loss": -44.4076042175293, "global_step": 357563, "epoch": 2955} {"train_loss": -40.703285217285156, "global_step": 357564, "epoch": 2955} {"train_loss": -44.62732696533203, "global_step": 357565, "epoch": 2955} {"train_loss": -38.70125198364258, "global_step": 357566, "epoch": 2955} {"train_loss": -44.26823806762695, "global_step": 357567, "epoch": 2955} {"train_loss": -35.52915954589844, "global_step": 357568, "epoch": 2955} {"train_loss": -38.54573059082031, "global_step": 357569, "epoch": 2955} {"train_loss": -36.84000015258789, "global_step": 357570, "epoch": 2955} {"train_loss": -43.487335205078125, "global_step": 357571, "epoch": 2955} {"train_loss": -38.640960693359375, "global_step": 357572, "epoch": 2955} {"train_loss": -41.302284240722656, "global_step": 357573, "epoch": 2955} {"train_loss": -37.88263702392578, "global_step": 357574, "epoch": 2955} {"train_loss": -37.98456573486328, "global_step": 357575, "epoch": 2955} {"train_loss": -42.15797805786133, "global_step": 357576, "epoch": 2955} {"train_loss": -38.20185089111328, "global_step": 357577, "epoch": 2955} {"train_loss": -40.72501754760742, "global_step": 357578, "epoch": 2955} {"train_loss": -42.488914489746094, "global_step": 357579, "epoch": 2955} {"train_loss": -39.15461349487305, "global_step": 357580, "epoch": 2955} {"train_loss": -41.16120147705078, "global_step": 357581, "epoch": 2955} {"train_loss": -39.88810729980469, "global_step": 357582, "epoch": 2955} {"train_loss": -40.73828125, "global_step": 357583, "epoch": 2955} {"train_loss": -37.53920364379883, "global_step": 357584, "epoch": 2955} {"train_loss": -39.46333694458008, "global_step": 357585, "epoch": 2955} {"train_loss": -42.112911224365234, "global_step": 357586, "epoch": 2955} {"train_loss": -39.449462890625, "global_step": 357587, "epoch": 2955} {"train_loss": -39.095882415771484, "global_step": 357588, "epoch": 2955} {"train_loss": -42.26365280151367, "global_step": 357589, "epoch": 2955} {"train_loss": -38.00679397583008, "global_step": 357590, "epoch": 2955} {"train_loss": -42.45808029174805, "global_step": 357591, "epoch": 2955} {"train_loss": -38.708518981933594, "global_step": 357592, "epoch": 2955} {"train_loss": -41.91643524169922, "global_step": 357593, "epoch": 2955} {"train_loss": -41.81264877319336, "global_step": 357594, "epoch": 2955} {"train_loss": -38.84150314331055, "global_step": 357595, "epoch": 2955} {"train_loss": -43.55584716796875, "global_step": 357596, "epoch": 2955} {"train_loss": -40.16704177856445, "global_step": 357597, "epoch": 2955} {"train_loss": -41.72667694091797, "global_step": 357598, "epoch": 2955} {"train_loss": -42.447669982910156, "global_step": 357599, "epoch": 2955} {"train_loss": -41.93052673339844, "global_step": 357600, "epoch": 2955} {"train_loss": -42.16414260864258, "global_step": 357601, "epoch": 2955} {"train_loss": -43.23624801635742, "global_step": 357602, "epoch": 2955} {"train_loss": -42.894222259521484, "global_step": 357603, "epoch": 2955} {"train_loss": -43.803287506103516, "global_step": 357604, "epoch": 2955} {"train_loss": -43.42954635620117, "global_step": 357605, "epoch": 2955} {"train_loss": -43.2310791015625, "global_step": 357606, "epoch": 2955} {"train_loss": -43.55561065673828, "global_step": 357607, "epoch": 2955} {"train_loss": -43.3588752746582, "global_step": 357608, "epoch": 2955} {"train_loss": -44.30366897583008, "global_step": 357609, "epoch": 2955} {"train_loss": -43.26911163330078, "global_step": 357610, "epoch": 2955} {"train_loss": -43.687957763671875, "global_step": 357611, "epoch": 2955} {"train_loss": -43.984981536865234, "global_step": 357612, "epoch": 2955} {"train_loss": -44.545860290527344, "global_step": 357613, "epoch": 2955} {"train_loss": -44.32196807861328, "global_step": 357614, "epoch": 2955} {"train_loss": -44.49821853637695, "global_step": 357615, "epoch": 2955} {"train_loss": -44.284488677978516, "global_step": 357616, "epoch": 2955} {"train_loss": -44.77016830444336, "global_step": 357617, "epoch": 2955} {"train_loss": -45.074546813964844, "global_step": 357618, "epoch": 2955} {"train_loss": -44.83628463745117, "global_step": 357619, "epoch": 2955} {"train_loss": -44.970516204833984, "global_step": 357620, "epoch": 2955} {"train_loss": -44.914154052734375, "global_step": 357621, "epoch": 2955} {"train_loss": -45.14929962158203, "global_step": 357622, "epoch": 2955} {"train_loss": -44.49607467651367, "global_step": 357623, "epoch": 2955} {"train_loss": -45.217689514160156, "global_step": 357624, "epoch": 2955} {"train_loss": -45.08445739746094, "global_step": 357625, "epoch": 2955} {"train_loss": -45.04972839355469, "global_step": 357626, "epoch": 2955} {"train_loss": -45.28478240966797, "global_step": 357627, "epoch": 2955} {"train_loss": -45.341552734375, "global_step": 357628, "epoch": 2955} {"train_loss": -44.92634201049805, "global_step": 357629, "epoch": 2955} {"train_loss": -44.873836517333984, "global_step": 357630, "epoch": 2955} {"train_loss": -45.26326370239258, "global_step": 357631, "epoch": 2955} {"train_loss": -45.4285888671875, "global_step": 357632, "epoch": 2955} {"train_loss": -45.74679183959961, "global_step": 357633, "epoch": 2955} {"train_loss": -45.451995849609375, "global_step": 357634, "epoch": 2955} {"train_loss": -45.272579193115234, "global_step": 357635, "epoch": 2955} {"train_loss": -45.47222137451172, "global_step": 357636, "epoch": 2955} {"train_loss": -45.719642639160156, "global_step": 357637, "epoch": 2955} {"train_loss": -45.61557388305664, "global_step": 357638, "epoch": 2955} {"train_loss": -44.91510772705078, "global_step": 357639, "epoch": 2955} {"train_loss": -45.29795455932617, "global_step": 357640, "epoch": 2955} {"train_loss": -45.640682220458984, "global_step": 357641, "epoch": 2955} {"train_loss": -45.03795623779297, "global_step": 357642, "epoch": 2955} {"train_loss": -43.029502868652344, "global_step": 357643, "epoch": 2955} {"train_loss": -45.82088088989258, "global_step": 357644, "epoch": 2955} {"train_loss": -44.7205810546875, "global_step": 357645, "epoch": 2955} {"train_loss": -45.71350860595703, "global_step": 357646, "epoch": 2955} {"train_loss": -45.41560745239258, "global_step": 357647, "epoch": 2955} {"train_loss": -45.17466354370117, "global_step": 357648, "epoch": 2955} {"train_loss": -45.43459701538086, "global_step": 357649, "epoch": 2955} {"train_loss": -45.83454513549805, "global_step": 357650, "epoch": 2955} {"train_loss": -45.94599533081055, "global_step": 357651, "epoch": 2955} {"train_loss": -44.50026321411133, "global_step": 357652, "epoch": 2955} {"train_loss": -43.89056396484375, "global_step": 357653, "epoch": 2955} {"train_loss": -44.808223724365234, "global_step": 357654, "epoch": 2955} {"train_loss": -44.013370513916016, "global_step": 357655, "epoch": 2955} {"train_loss": -42.446041107177734, "global_step": 357656, "epoch": 2955} {"train_loss": -45.19289779663086, "global_step": 357657, "epoch": 2955} {"train_loss": -44.414974212646484, "global_step": 357658, "epoch": 2955} {"train_loss": -44.01904296875, "global_step": 357659, "epoch": 2955} {"train_loss": -45.36146545410156, "global_step": 357660, "epoch": 2955} {"train_loss": -43.587825775146484, "global_step": 357661, "epoch": 2955} {"train_loss": -43.88179397583008, "global_step": 357662, "epoch": 2955} {"train_loss": -44.5037956237793, "global_step": 357663, "epoch": 2955} {"train_loss": -42.42091751098633, "global_step": 357664, "epoch": 2955} {"train_loss": -44.98555374145508, "global_step": 357665, "epoch": 2955} {"train_loss": -43.20278549194336, "global_step": 357666, "epoch": 2955} {"train_loss": -44.557987213134766, "global_step": 357667, "epoch": 2955} {"train_loss": -44.53725051879883, "global_step": 357668, "epoch": 2955} {"train_loss": -43.64530563354492, "global_step": 357669, "epoch": 2955} {"train_loss": -44.938533782958984, "global_step": 357670, "epoch": 2955} {"train_loss": -44.717552185058594, "global_step": 357671, "epoch": 2955} {"train_loss": -43.85667419433594, "global_step": 357672, "epoch": 2955} {"train_loss": -45.08689498901367, "global_step": 357673, "epoch": 2955} {"train_loss": -44.56733703613281, "global_step": 357674, "epoch": 2955} {"train_loss": -43.27444442244601, "global_step": 357675, "epoch": 2955, "val_loss": 2416947.0} {"train_loss": -44.90399932861328, "global_step": 357676, "epoch": 2956} {"train_loss": -44.093727111816406, "global_step": 357677, "epoch": 2956} {"train_loss": -43.14875411987305, "global_step": 357678, "epoch": 2956} {"train_loss": -44.1733512878418, "global_step": 357679, "epoch": 2956} {"train_loss": -44.60618209838867, "global_step": 357680, "epoch": 2956} {"train_loss": -43.52640914916992, "global_step": 357681, "epoch": 2956} {"train_loss": -44.4726676940918, "global_step": 357682, "epoch": 2956} {"train_loss": -45.134517669677734, "global_step": 357683, "epoch": 2956} {"train_loss": -42.15151596069336, "global_step": 357684, "epoch": 2956} {"train_loss": -44.71393966674805, "global_step": 357685, "epoch": 2956} {"train_loss": -44.0296516418457, "global_step": 357686, "epoch": 2956} {"train_loss": -45.336368560791016, "global_step": 357687, "epoch": 2956} {"train_loss": -44.65969467163086, "global_step": 357688, "epoch": 2956} {"train_loss": -44.92076873779297, "global_step": 357689, "epoch": 2956} {"train_loss": -45.02734375, "global_step": 357690, "epoch": 2956} {"train_loss": -44.53666305541992, "global_step": 357691, "epoch": 2956} {"train_loss": -44.61518478393555, "global_step": 357692, "epoch": 2956} {"train_loss": -45.6717414855957, "global_step": 357693, "epoch": 2956} {"train_loss": -45.095245361328125, "global_step": 357694, "epoch": 2956} {"train_loss": -44.51485824584961, "global_step": 357695, "epoch": 2956} {"train_loss": -45.721038818359375, "global_step": 357696, "epoch": 2956} {"train_loss": -45.530033111572266, "global_step": 357697, "epoch": 2956} {"train_loss": -45.49782943725586, "global_step": 357698, "epoch": 2956} {"train_loss": -45.69147872924805, "global_step": 357699, "epoch": 2956} {"train_loss": -45.200103759765625, "global_step": 357700, "epoch": 2956} {"train_loss": -45.4095458984375, "global_step": 357701, "epoch": 2956} {"train_loss": -45.64907455444336, "global_step": 357702, "epoch": 2956} {"train_loss": -45.28559112548828, "global_step": 357703, "epoch": 2956} {"train_loss": -44.58780288696289, "global_step": 357704, "epoch": 2956} {"train_loss": -44.30246353149414, "global_step": 357705, "epoch": 2956} {"train_loss": -44.39040756225586, "global_step": 357706, "epoch": 2956} {"train_loss": -43.25492477416992, "global_step": 357707, "epoch": 2956} {"train_loss": -44.447906494140625, "global_step": 357708, "epoch": 2956} {"train_loss": -43.464744567871094, "global_step": 357709, "epoch": 2956} {"train_loss": -44.116539001464844, "global_step": 357710, "epoch": 2956} {"train_loss": -44.78451156616211, "global_step": 357711, "epoch": 2956} {"train_loss": -45.25012969970703, "global_step": 357712, "epoch": 2956} {"train_loss": -44.307857513427734, "global_step": 357713, "epoch": 2956} {"train_loss": -45.150489807128906, "global_step": 357714, "epoch": 2956} {"train_loss": -44.7740364074707, "global_step": 357715, "epoch": 2956} {"train_loss": -45.0910758972168, "global_step": 357716, "epoch": 2956} {"train_loss": -44.50456237792969, "global_step": 357717, "epoch": 2956} {"train_loss": -44.85926055908203, "global_step": 357718, "epoch": 2956} {"train_loss": -44.87153244018555, "global_step": 357719, "epoch": 2956} {"train_loss": -44.58195114135742, "global_step": 357720, "epoch": 2956} {"train_loss": -45.19651412963867, "global_step": 357721, "epoch": 2956} {"train_loss": -44.77033615112305, "global_step": 357722, "epoch": 2956} {"train_loss": -44.41862106323242, "global_step": 357723, "epoch": 2956} {"train_loss": -44.14495849609375, "global_step": 357724, "epoch": 2956} {"train_loss": -45.26880645751953, "global_step": 357725, "epoch": 2956} {"train_loss": -44.343048095703125, "global_step": 357726, "epoch": 2956} {"train_loss": -42.948394775390625, "global_step": 357727, "epoch": 2956} {"train_loss": -44.45363998413086, "global_step": 357728, "epoch": 2956} {"train_loss": -43.67042922973633, "global_step": 357729, "epoch": 2956} {"train_loss": -43.79568099975586, "global_step": 357730, "epoch": 2956} {"train_loss": -44.78324508666992, "global_step": 357731, "epoch": 2956} {"train_loss": -45.11863327026367, "global_step": 357732, "epoch": 2956} {"train_loss": -43.548831939697266, "global_step": 357733, "epoch": 2956} {"train_loss": -45.224422454833984, "global_step": 357734, "epoch": 2956} {"train_loss": -44.72261428833008, "global_step": 357735, "epoch": 2956} {"train_loss": -45.207454681396484, "global_step": 357736, "epoch": 2956} {"train_loss": -44.48746109008789, "global_step": 357737, "epoch": 2956} {"train_loss": -44.711849212646484, "global_step": 357738, "epoch": 2956} {"train_loss": -44.73994064331055, "global_step": 357739, "epoch": 2956} {"train_loss": -45.25043487548828, "global_step": 357740, "epoch": 2956} {"train_loss": -44.7176628112793, "global_step": 357741, "epoch": 2956} {"train_loss": -43.7552490234375, "global_step": 357742, "epoch": 2956} {"train_loss": -44.56574249267578, "global_step": 357743, "epoch": 2956} {"train_loss": -44.31233215332031, "global_step": 357744, "epoch": 2956} {"train_loss": -42.03067398071289, "global_step": 357745, "epoch": 2956} {"train_loss": -44.1506233215332, "global_step": 357746, "epoch": 2956} {"train_loss": -44.73858642578125, "global_step": 357747, "epoch": 2956} {"train_loss": -44.22699737548828, "global_step": 357748, "epoch": 2956} {"train_loss": -41.54874801635742, "global_step": 357749, "epoch": 2956} {"train_loss": -45.36066436767578, "global_step": 357750, "epoch": 2956} {"train_loss": -42.28212356567383, "global_step": 357751, "epoch": 2956} {"train_loss": -44.48202896118164, "global_step": 357752, "epoch": 2956} {"train_loss": -43.920318603515625, "global_step": 357753, "epoch": 2956} {"train_loss": -43.023773193359375, "global_step": 357754, "epoch": 2956} {"train_loss": -44.02543258666992, "global_step": 357755, "epoch": 2956} {"train_loss": -42.924217224121094, "global_step": 357756, "epoch": 2956} {"train_loss": -44.17726516723633, "global_step": 357757, "epoch": 2956} {"train_loss": -44.4978141784668, "global_step": 357758, "epoch": 2956} {"train_loss": -43.013919830322266, "global_step": 357759, "epoch": 2956} {"train_loss": -42.57487869262695, "global_step": 357760, "epoch": 2956} {"train_loss": -44.687801361083984, "global_step": 357761, "epoch": 2956} {"train_loss": -43.202125549316406, "global_step": 357762, "epoch": 2956} {"train_loss": -44.31557083129883, "global_step": 357763, "epoch": 2956} {"train_loss": -43.90072250366211, "global_step": 357764, "epoch": 2956} {"train_loss": -44.5881233215332, "global_step": 357765, "epoch": 2956} {"train_loss": -44.290138244628906, "global_step": 357766, "epoch": 2956} {"train_loss": -43.709083557128906, "global_step": 357767, "epoch": 2956} {"train_loss": -44.45342254638672, "global_step": 357768, "epoch": 2956} {"train_loss": -44.22320556640625, "global_step": 357769, "epoch": 2956} {"train_loss": -42.76456832885742, "global_step": 357770, "epoch": 2956} {"train_loss": -45.130516052246094, "global_step": 357771, "epoch": 2956} {"train_loss": -43.99232864379883, "global_step": 357772, "epoch": 2956} {"train_loss": -44.452125549316406, "global_step": 357773, "epoch": 2956} {"train_loss": -45.2977294921875, "global_step": 357774, "epoch": 2956} {"train_loss": -43.79720687866211, "global_step": 357775, "epoch": 2956} {"train_loss": -44.6827278137207, "global_step": 357776, "epoch": 2956} {"train_loss": -44.46851348876953, "global_step": 357777, "epoch": 2956} {"train_loss": -44.31880569458008, "global_step": 357778, "epoch": 2956} {"train_loss": -45.393192291259766, "global_step": 357779, "epoch": 2956} {"train_loss": -44.4747428894043, "global_step": 357780, "epoch": 2956} {"train_loss": -45.27948760986328, "global_step": 357781, "epoch": 2956} {"train_loss": -44.84077072143555, "global_step": 357782, "epoch": 2956} {"train_loss": -44.652347564697266, "global_step": 357783, "epoch": 2956} {"train_loss": -44.97114562988281, "global_step": 357784, "epoch": 2956} {"train_loss": -44.82829666137695, "global_step": 357785, "epoch": 2956} {"train_loss": -44.742286682128906, "global_step": 357786, "epoch": 2956} {"train_loss": -44.96354675292969, "global_step": 357787, "epoch": 2956} {"train_loss": -45.2542839050293, "global_step": 357788, "epoch": 2956} {"train_loss": -45.17271041870117, "global_step": 357789, "epoch": 2956} {"train_loss": -44.99945068359375, "global_step": 357790, "epoch": 2956} {"train_loss": -44.59086227416992, "global_step": 357791, "epoch": 2956} {"train_loss": -45.324405670166016, "global_step": 357792, "epoch": 2956} {"train_loss": -45.018280029296875, "global_step": 357793, "epoch": 2956} {"train_loss": -45.55363845825195, "global_step": 357794, "epoch": 2956} {"train_loss": -45.72214889526367, "global_step": 357795, "epoch": 2956} {"train_loss": -44.48463670084299, "global_step": 357796, "epoch": 2956, "val_loss": 2424008.0} {"train_loss": -45.576019287109375, "global_step": 357797, "epoch": 2957} {"train_loss": -45.95037841796875, "global_step": 357798, "epoch": 2957} {"train_loss": -44.9951286315918, "global_step": 357799, "epoch": 2957} {"train_loss": -44.22815704345703, "global_step": 357800, "epoch": 2957} {"train_loss": -44.834388732910156, "global_step": 357801, "epoch": 2957} {"train_loss": -45.506927490234375, "global_step": 357802, "epoch": 2957} {"train_loss": -44.83000564575195, "global_step": 357803, "epoch": 2957} {"train_loss": -43.93374252319336, "global_step": 357804, "epoch": 2957} {"train_loss": -44.5043830871582, "global_step": 357805, "epoch": 2957} {"train_loss": -45.21771240234375, "global_step": 357806, "epoch": 2957} {"train_loss": -45.009090423583984, "global_step": 357807, "epoch": 2957} {"train_loss": -43.933135986328125, "global_step": 357808, "epoch": 2957} {"train_loss": -44.69709396362305, "global_step": 357809, "epoch": 2957} {"train_loss": -44.39118194580078, "global_step": 357810, "epoch": 2957} {"train_loss": -44.72150421142578, "global_step": 357811, "epoch": 2957} {"train_loss": -44.33473587036133, "global_step": 357812, "epoch": 2957} {"train_loss": -44.7586669921875, "global_step": 357813, "epoch": 2957} {"train_loss": -44.71493148803711, "global_step": 357814, "epoch": 2957} {"train_loss": -43.79172134399414, "global_step": 357815, "epoch": 2957} {"train_loss": -44.758583068847656, "global_step": 357816, "epoch": 2957} {"train_loss": -44.89236068725586, "global_step": 357817, "epoch": 2957} {"train_loss": -44.23300552368164, "global_step": 357818, "epoch": 2957} {"train_loss": -44.706787109375, "global_step": 357819, "epoch": 2957} {"train_loss": -44.609230041503906, "global_step": 357820, "epoch": 2957} {"train_loss": -43.77265167236328, "global_step": 357821, "epoch": 2957} {"train_loss": -44.065673828125, "global_step": 357822, "epoch": 2957} {"train_loss": -44.81901931762695, "global_step": 357823, "epoch": 2957} {"train_loss": -44.77654266357422, "global_step": 357824, "epoch": 2957} {"train_loss": -44.78642654418945, "global_step": 357825, "epoch": 2957} {"train_loss": -44.555049896240234, "global_step": 357826, "epoch": 2957} {"train_loss": -45.32943344116211, "global_step": 357827, "epoch": 2957} {"train_loss": -44.79153823852539, "global_step": 357828, "epoch": 2957} {"train_loss": -44.51543426513672, "global_step": 357829, "epoch": 2957} {"train_loss": -45.18862533569336, "global_step": 357830, "epoch": 2957} {"train_loss": -43.87145233154297, "global_step": 357831, "epoch": 2957} {"train_loss": -43.55131149291992, "global_step": 357832, "epoch": 2957} {"train_loss": -44.39128494262695, "global_step": 357833, "epoch": 2957} {"train_loss": -43.75602340698242, "global_step": 357834, "epoch": 2957} {"train_loss": -44.68410873413086, "global_step": 357835, "epoch": 2957} {"train_loss": -43.550533294677734, "global_step": 357836, "epoch": 2957} {"train_loss": -42.90562057495117, "global_step": 357837, "epoch": 2957} {"train_loss": -44.900047302246094, "global_step": 357838, "epoch": 2957} {"train_loss": -44.36796951293945, "global_step": 357839, "epoch": 2957} {"train_loss": -43.81792449951172, "global_step": 357840, "epoch": 2957} {"train_loss": -45.03407669067383, "global_step": 357841, "epoch": 2957} {"train_loss": -43.570594787597656, "global_step": 357842, "epoch": 2957} {"train_loss": -44.306312561035156, "global_step": 357843, "epoch": 2957} {"train_loss": -44.32395553588867, "global_step": 357844, "epoch": 2957} {"train_loss": -43.05400466918945, "global_step": 357845, "epoch": 2957} {"train_loss": -42.491207122802734, "global_step": 357846, "epoch": 2957} {"train_loss": -44.65056228637695, "global_step": 357847, "epoch": 2957} {"train_loss": -42.7520637512207, "global_step": 357848, "epoch": 2957} {"train_loss": -44.283748626708984, "global_step": 357849, "epoch": 2957} {"train_loss": -43.35873031616211, "global_step": 357850, "epoch": 2957} {"train_loss": -43.73459243774414, "global_step": 357851, "epoch": 2957} {"train_loss": -44.029823303222656, "global_step": 357852, "epoch": 2957} {"train_loss": -43.4849967956543, "global_step": 357853, "epoch": 2957} {"train_loss": -43.66243362426758, "global_step": 357854, "epoch": 2957} {"train_loss": -43.180259704589844, "global_step": 357855, "epoch": 2957} {"train_loss": -44.64683151245117, "global_step": 357856, "epoch": 2957} {"train_loss": -43.467872619628906, "global_step": 357857, "epoch": 2957} {"train_loss": -43.868106842041016, "global_step": 357858, "epoch": 2957} {"train_loss": -43.820674896240234, "global_step": 357859, "epoch": 2957} {"train_loss": -44.99677658081055, "global_step": 357860, "epoch": 2957} {"train_loss": -43.40850830078125, "global_step": 357861, "epoch": 2957} {"train_loss": -44.0390625, "global_step": 357862, "epoch": 2957} {"train_loss": -45.468109130859375, "global_step": 357863, "epoch": 2957} {"train_loss": -43.48358917236328, "global_step": 357864, "epoch": 2957} {"train_loss": -44.755863189697266, "global_step": 357865, "epoch": 2957} {"train_loss": -43.583065032958984, "global_step": 357866, "epoch": 2957} {"train_loss": -44.58355712890625, "global_step": 357867, "epoch": 2957} {"train_loss": -44.22758865356445, "global_step": 357868, "epoch": 2957} {"train_loss": -44.81632614135742, "global_step": 357869, "epoch": 2957} {"train_loss": -44.8091926574707, "global_step": 357870, "epoch": 2957} {"train_loss": -44.817176818847656, "global_step": 357871, "epoch": 2957} {"train_loss": -45.48902130126953, "global_step": 357872, "epoch": 2957} {"train_loss": -44.70582962036133, "global_step": 357873, "epoch": 2957} {"train_loss": -44.75461959838867, "global_step": 357874, "epoch": 2957} {"train_loss": -44.73108673095703, "global_step": 357875, "epoch": 2957} {"train_loss": -45.763526916503906, "global_step": 357876, "epoch": 2957} {"train_loss": -45.4095344543457, "global_step": 357877, "epoch": 2957} {"train_loss": -45.3087043762207, "global_step": 357878, "epoch": 2957} {"train_loss": -44.61042404174805, "global_step": 357879, "epoch": 2957} {"train_loss": -45.05967330932617, "global_step": 357880, "epoch": 2957} {"train_loss": -44.476314544677734, "global_step": 357881, "epoch": 2957} {"train_loss": -43.982666015625, "global_step": 357882, "epoch": 2957} {"train_loss": -44.8934211730957, "global_step": 357883, "epoch": 2957} {"train_loss": -44.853946685791016, "global_step": 357884, "epoch": 2957} {"train_loss": -43.9898796081543, "global_step": 357885, "epoch": 2957} {"train_loss": -45.07352828979492, "global_step": 357886, "epoch": 2957} {"train_loss": -44.95730209350586, "global_step": 357887, "epoch": 2957} {"train_loss": -43.0741081237793, "global_step": 357888, "epoch": 2957} {"train_loss": -45.33395004272461, "global_step": 357889, "epoch": 2957} {"train_loss": -44.98478317260742, "global_step": 357890, "epoch": 2957} {"train_loss": -43.6770133972168, "global_step": 357891, "epoch": 2957} {"train_loss": -45.13996887207031, "global_step": 357892, "epoch": 2957} {"train_loss": -45.18925857543945, "global_step": 357893, "epoch": 2957} {"train_loss": -44.398006439208984, "global_step": 357894, "epoch": 2957} {"train_loss": -44.3546028137207, "global_step": 357895, "epoch": 2957} {"train_loss": -43.703792572021484, "global_step": 357896, "epoch": 2957} {"train_loss": -44.040992736816406, "global_step": 357897, "epoch": 2957} {"train_loss": -44.67377471923828, "global_step": 357898, "epoch": 2957} {"train_loss": -44.38018035888672, "global_step": 357899, "epoch": 2957} {"train_loss": -44.38239669799805, "global_step": 357900, "epoch": 2957} {"train_loss": -43.30337142944336, "global_step": 357901, "epoch": 2957} {"train_loss": -44.231353759765625, "global_step": 357902, "epoch": 2957} {"train_loss": -44.4380989074707, "global_step": 357903, "epoch": 2957} {"train_loss": -43.388206481933594, "global_step": 357904, "epoch": 2957} {"train_loss": -44.23151779174805, "global_step": 357905, "epoch": 2957} {"train_loss": -44.179500579833984, "global_step": 357906, "epoch": 2957} {"train_loss": -44.03276443481445, "global_step": 357907, "epoch": 2957} {"train_loss": -45.1070671081543, "global_step": 357908, "epoch": 2957} {"train_loss": -44.402591705322266, "global_step": 357909, "epoch": 2957} {"train_loss": -44.34919738769531, "global_step": 357910, "epoch": 2957} {"train_loss": -44.81375503540039, "global_step": 357911, "epoch": 2957} {"train_loss": -43.54586410522461, "global_step": 357912, "epoch": 2957} {"train_loss": -44.19585418701172, "global_step": 357913, "epoch": 2957} {"train_loss": -44.47042465209961, "global_step": 357914, "epoch": 2957} {"train_loss": -44.513824462890625, "global_step": 357915, "epoch": 2957} {"train_loss": -43.99916458129883, "global_step": 357916, "epoch": 2957} {"train_loss": -44.38893679153821, "global_step": 357917, "epoch": 2957, "val_loss": 2384448.25} {"train_loss": -45.21623229980469, "global_step": 357918, "epoch": 2958} {"train_loss": -44.0527458190918, "global_step": 357919, "epoch": 2958} {"train_loss": -44.37179946899414, "global_step": 357920, "epoch": 2958} {"train_loss": -45.16667175292969, "global_step": 357921, "epoch": 2958} {"train_loss": -44.14858627319336, "global_step": 357922, "epoch": 2958} {"train_loss": -45.6224479675293, "global_step": 357923, "epoch": 2958} {"train_loss": -45.02032470703125, "global_step": 357924, "epoch": 2958} {"train_loss": -45.241878509521484, "global_step": 357925, "epoch": 2958} {"train_loss": -44.7279167175293, "global_step": 357926, "epoch": 2958} {"train_loss": -45.061012268066406, "global_step": 357927, "epoch": 2958} {"train_loss": -45.53420639038086, "global_step": 357928, "epoch": 2958} {"train_loss": -44.905635833740234, "global_step": 357929, "epoch": 2958} {"train_loss": -45.389923095703125, "global_step": 357930, "epoch": 2958} {"train_loss": -45.17851638793945, "global_step": 357931, "epoch": 2958} {"train_loss": -45.17953109741211, "global_step": 357932, "epoch": 2958} {"train_loss": -45.30308151245117, "global_step": 357933, "epoch": 2958} {"train_loss": -45.668209075927734, "global_step": 357934, "epoch": 2958} {"train_loss": -45.199363708496094, "global_step": 357935, "epoch": 2958} {"train_loss": -45.63193893432617, "global_step": 357936, "epoch": 2958} {"train_loss": -45.755653381347656, "global_step": 357937, "epoch": 2958} {"train_loss": -45.513427734375, "global_step": 357938, "epoch": 2958} {"train_loss": -45.224788665771484, "global_step": 357939, "epoch": 2958} {"train_loss": -45.40316390991211, "global_step": 357940, "epoch": 2958} {"train_loss": -45.01383590698242, "global_step": 357941, "epoch": 2958} {"train_loss": -45.08372116088867, "global_step": 357942, "epoch": 2958} {"train_loss": -44.3869514465332, "global_step": 357943, "epoch": 2958} {"train_loss": -45.149627685546875, "global_step": 357944, "epoch": 2958} {"train_loss": -44.72388458251953, "global_step": 357945, "epoch": 2958} {"train_loss": -45.65669631958008, "global_step": 357946, "epoch": 2958} {"train_loss": -45.44514083862305, "global_step": 357947, "epoch": 2958} {"train_loss": -44.31574630737305, "global_step": 357948, "epoch": 2958} {"train_loss": -44.504669189453125, "global_step": 357949, "epoch": 2958} {"train_loss": -45.04387283325195, "global_step": 357950, "epoch": 2958} {"train_loss": -45.36493682861328, "global_step": 357951, "epoch": 2958} {"train_loss": -45.52771759033203, "global_step": 357952, "epoch": 2958} {"train_loss": -45.04924392700195, "global_step": 357953, "epoch": 2958} {"train_loss": -45.218990325927734, "global_step": 357954, "epoch": 2958} {"train_loss": -45.33888626098633, "global_step": 357955, "epoch": 2958} {"train_loss": -45.54970169067383, "global_step": 357956, "epoch": 2958} {"train_loss": -44.7998046875, "global_step": 357957, "epoch": 2958} {"train_loss": -44.829193115234375, "global_step": 357958, "epoch": 2958} {"train_loss": -44.84296798706055, "global_step": 357959, "epoch": 2958} {"train_loss": -45.350555419921875, "global_step": 357960, "epoch": 2958} {"train_loss": -45.12843704223633, "global_step": 357961, "epoch": 2958} {"train_loss": -44.911903381347656, "global_step": 357962, "epoch": 2958} {"train_loss": -43.5464973449707, "global_step": 357963, "epoch": 2958} {"train_loss": -43.324920654296875, "global_step": 357964, "epoch": 2958} {"train_loss": -44.678035736083984, "global_step": 357965, "epoch": 2958} {"train_loss": -42.75307846069336, "global_step": 357966, "epoch": 2958} {"train_loss": -42.502498626708984, "global_step": 357967, "epoch": 2958} {"train_loss": -45.05556106567383, "global_step": 357968, "epoch": 2958} {"train_loss": -42.516685485839844, "global_step": 357969, "epoch": 2958} {"train_loss": -44.81825637817383, "global_step": 357970, "epoch": 2958} {"train_loss": -43.738136291503906, "global_step": 357971, "epoch": 2958} {"train_loss": -43.28481674194336, "global_step": 357972, "epoch": 2958} {"train_loss": -43.425994873046875, "global_step": 357973, "epoch": 2958} {"train_loss": -44.96166229248047, "global_step": 357974, "epoch": 2958} {"train_loss": -42.818538665771484, "global_step": 357975, "epoch": 2958} {"train_loss": -44.767391204833984, "global_step": 357976, "epoch": 2958} {"train_loss": -42.18708419799805, "global_step": 357977, "epoch": 2958} {"train_loss": -44.80621337890625, "global_step": 357978, "epoch": 2958} {"train_loss": -43.7064208984375, "global_step": 357979, "epoch": 2958} {"train_loss": -43.66358947753906, "global_step": 357980, "epoch": 2958} {"train_loss": -44.53245162963867, "global_step": 357981, "epoch": 2958} {"train_loss": -43.23273849487305, "global_step": 357982, "epoch": 2958} {"train_loss": -44.4470329284668, "global_step": 357983, "epoch": 2958} {"train_loss": -44.40234375, "global_step": 357984, "epoch": 2958} {"train_loss": -43.19891357421875, "global_step": 357985, "epoch": 2958} {"train_loss": -43.6212043762207, "global_step": 357986, "epoch": 2958} {"train_loss": -44.35755920410156, "global_step": 357987, "epoch": 2958} {"train_loss": -43.894039154052734, "global_step": 357988, "epoch": 2958} {"train_loss": -43.98740768432617, "global_step": 357989, "epoch": 2958} {"train_loss": -43.31939697265625, "global_step": 357990, "epoch": 2958} {"train_loss": -44.048011779785156, "global_step": 357991, "epoch": 2958} {"train_loss": -44.52029037475586, "global_step": 357992, "epoch": 2958} {"train_loss": -44.4007568359375, "global_step": 357993, "epoch": 2958} {"train_loss": -44.1567268371582, "global_step": 357994, "epoch": 2958} {"train_loss": -44.626827239990234, "global_step": 357995, "epoch": 2958} {"train_loss": -44.37258529663086, "global_step": 357996, "epoch": 2958} {"train_loss": -45.050804138183594, "global_step": 357997, "epoch": 2958} {"train_loss": -43.854801177978516, "global_step": 357998, "epoch": 2958} {"train_loss": -44.97922134399414, "global_step": 357999, "epoch": 2958} {"train_loss": -44.89506149291992, "global_step": 358000, "epoch": 2958} {"train_loss": -44.95484161376953, "global_step": 358001, "epoch": 2958} {"train_loss": -45.13335037231445, "global_step": 358002, "epoch": 2958} {"train_loss": -44.96297836303711, "global_step": 358003, "epoch": 2958} {"train_loss": -44.891170501708984, "global_step": 358004, "epoch": 2958} {"train_loss": -44.72518539428711, "global_step": 358005, "epoch": 2958} {"train_loss": -44.747291564941406, "global_step": 358006, "epoch": 2958} {"train_loss": -44.615753173828125, "global_step": 358007, "epoch": 2958} {"train_loss": -43.130340576171875, "global_step": 358008, "epoch": 2958} {"train_loss": -43.73486328125, "global_step": 358009, "epoch": 2958} {"train_loss": -43.19510269165039, "global_step": 358010, "epoch": 2958} {"train_loss": -43.88983154296875, "global_step": 358011, "epoch": 2958} {"train_loss": -44.53192138671875, "global_step": 358012, "epoch": 2958} {"train_loss": -42.91819381713867, "global_step": 358013, "epoch": 2958} {"train_loss": -44.02383041381836, "global_step": 358014, "epoch": 2958} {"train_loss": -44.41505432128906, "global_step": 358015, "epoch": 2958} {"train_loss": -43.888545989990234, "global_step": 358016, "epoch": 2958} {"train_loss": -43.99161911010742, "global_step": 358017, "epoch": 2958} {"train_loss": -44.258888244628906, "global_step": 358018, "epoch": 2958} {"train_loss": -43.58403396606445, "global_step": 358019, "epoch": 2958} {"train_loss": -45.32781982421875, "global_step": 358020, "epoch": 2958} {"train_loss": -43.98575973510742, "global_step": 358021, "epoch": 2958} {"train_loss": -44.239009857177734, "global_step": 358022, "epoch": 2958} {"train_loss": -44.65498733520508, "global_step": 358023, "epoch": 2958} {"train_loss": -44.07072067260742, "global_step": 358024, "epoch": 2958} {"train_loss": -42.8358154296875, "global_step": 358025, "epoch": 2958} {"train_loss": -44.2714958190918, "global_step": 358026, "epoch": 2958} {"train_loss": -43.59519577026367, "global_step": 358027, "epoch": 2958} {"train_loss": -44.580257415771484, "global_step": 358028, "epoch": 2958} {"train_loss": -43.61562728881836, "global_step": 358029, "epoch": 2958} {"train_loss": -43.649688720703125, "global_step": 358030, "epoch": 2958} {"train_loss": -44.77888870239258, "global_step": 358031, "epoch": 2958} {"train_loss": -44.634342193603516, "global_step": 358032, "epoch": 2958} {"train_loss": -44.421241760253906, "global_step": 358033, "epoch": 2958} {"train_loss": -43.84601593017578, "global_step": 358034, "epoch": 2958} {"train_loss": -44.36404037475586, "global_step": 358035, "epoch": 2958} {"train_loss": -44.38180923461914, "global_step": 358036, "epoch": 2958} {"train_loss": -44.40309524536133, "global_step": 358037, "epoch": 2958} {"train_loss": -44.461836318339195, "global_step": 358038, "epoch": 2958, "val_loss": 2453056.0} {"train_loss": -44.604347229003906, "global_step": 358039, "epoch": 2959} {"train_loss": -44.0901985168457, "global_step": 358040, "epoch": 2959} {"train_loss": -44.39308166503906, "global_step": 358041, "epoch": 2959} {"train_loss": -44.488075256347656, "global_step": 358042, "epoch": 2959} {"train_loss": -44.2069091796875, "global_step": 358043, "epoch": 2959} {"train_loss": -44.5022087097168, "global_step": 358044, "epoch": 2959} {"train_loss": -44.7196044921875, "global_step": 358045, "epoch": 2959} {"train_loss": -43.71780014038086, "global_step": 358046, "epoch": 2959} {"train_loss": -44.596405029296875, "global_step": 358047, "epoch": 2959} {"train_loss": -44.8370475769043, "global_step": 358048, "epoch": 2959} {"train_loss": -44.270870208740234, "global_step": 358049, "epoch": 2959} {"train_loss": -45.33372116088867, "global_step": 358050, "epoch": 2959} {"train_loss": -44.25979232788086, "global_step": 358051, "epoch": 2959} {"train_loss": -44.820335388183594, "global_step": 358052, "epoch": 2959} {"train_loss": -45.00210189819336, "global_step": 358053, "epoch": 2959} {"train_loss": -45.127586364746094, "global_step": 358054, "epoch": 2959} {"train_loss": -45.089847564697266, "global_step": 358055, "epoch": 2959} {"train_loss": -44.53842544555664, "global_step": 358056, "epoch": 2959} {"train_loss": -44.478939056396484, "global_step": 358057, "epoch": 2959} {"train_loss": -45.158363342285156, "global_step": 358058, "epoch": 2959} {"train_loss": -45.64107894897461, "global_step": 358059, "epoch": 2959} {"train_loss": -45.395599365234375, "global_step": 358060, "epoch": 2959} {"train_loss": -44.46781539916992, "global_step": 358061, "epoch": 2959} {"train_loss": -44.30131912231445, "global_step": 358062, "epoch": 2959} {"train_loss": -44.938114166259766, "global_step": 358063, "epoch": 2959} {"train_loss": -44.981876373291016, "global_step": 358064, "epoch": 2959} {"train_loss": -44.88547134399414, "global_step": 358065, "epoch": 2959} {"train_loss": -44.78982162475586, "global_step": 358066, "epoch": 2959} {"train_loss": -44.54267120361328, "global_step": 358067, "epoch": 2959} {"train_loss": -44.45560836791992, "global_step": 358068, "epoch": 2959} {"train_loss": -45.150203704833984, "global_step": 358069, "epoch": 2959} {"train_loss": -44.60498809814453, "global_step": 358070, "epoch": 2959} {"train_loss": -43.959808349609375, "global_step": 358071, "epoch": 2959} {"train_loss": -45.72526168823242, "global_step": 358072, "epoch": 2959} {"train_loss": -45.37494659423828, "global_step": 358073, "epoch": 2959} {"train_loss": -45.131649017333984, "global_step": 358074, "epoch": 2959} {"train_loss": -45.0274543762207, "global_step": 358075, "epoch": 2959} {"train_loss": -45.30161666870117, "global_step": 358076, "epoch": 2959} {"train_loss": -44.99201965332031, "global_step": 358077, "epoch": 2959} {"train_loss": -44.13625717163086, "global_step": 358078, "epoch": 2959} {"train_loss": -44.7877311706543, "global_step": 358079, "epoch": 2959} {"train_loss": -45.25985336303711, "global_step": 358080, "epoch": 2959} {"train_loss": -44.20490646362305, "global_step": 358081, "epoch": 2959} {"train_loss": -45.27474594116211, "global_step": 358082, "epoch": 2959} {"train_loss": -45.107032775878906, "global_step": 358083, "epoch": 2959} {"train_loss": -45.63920211791992, "global_step": 358084, "epoch": 2959} {"train_loss": -44.933895111083984, "global_step": 358085, "epoch": 2959} {"train_loss": -45.51020431518555, "global_step": 358086, "epoch": 2959} {"train_loss": -45.63759994506836, "global_step": 358087, "epoch": 2959} {"train_loss": -45.37186813354492, "global_step": 358088, "epoch": 2959} {"train_loss": -45.9246940612793, "global_step": 358089, "epoch": 2959} {"train_loss": -45.94352340698242, "global_step": 358090, "epoch": 2959} {"train_loss": -45.9832649230957, "global_step": 358091, "epoch": 2959} {"train_loss": -45.70471954345703, "global_step": 358092, "epoch": 2959} {"train_loss": -45.44861602783203, "global_step": 358093, "epoch": 2959} {"train_loss": -45.996891021728516, "global_step": 358094, "epoch": 2959} {"train_loss": -46.23087692260742, "global_step": 358095, "epoch": 2959} {"train_loss": -46.249542236328125, "global_step": 358096, "epoch": 2959} {"train_loss": -45.71204376220703, "global_step": 358097, "epoch": 2959} {"train_loss": -45.80640411376953, "global_step": 358098, "epoch": 2959} {"train_loss": -46.109378814697266, "global_step": 358099, "epoch": 2959} {"train_loss": -45.576534271240234, "global_step": 358100, "epoch": 2959} {"train_loss": -45.24222183227539, "global_step": 358101, "epoch": 2959} {"train_loss": -45.35542678833008, "global_step": 358102, "epoch": 2959} {"train_loss": -45.1124382019043, "global_step": 358103, "epoch": 2959} {"train_loss": -44.833675384521484, "global_step": 358104, "epoch": 2959} {"train_loss": -44.84535598754883, "global_step": 358105, "epoch": 2959} {"train_loss": -45.468894958496094, "global_step": 358106, "epoch": 2959} {"train_loss": -45.172332763671875, "global_step": 358107, "epoch": 2959} {"train_loss": -44.118011474609375, "global_step": 358108, "epoch": 2959} {"train_loss": -43.7209587097168, "global_step": 358109, "epoch": 2959} {"train_loss": -45.61074447631836, "global_step": 358110, "epoch": 2959} {"train_loss": -45.01374435424805, "global_step": 358111, "epoch": 2959} {"train_loss": -44.187984466552734, "global_step": 358112, "epoch": 2959} {"train_loss": -45.24897384643555, "global_step": 358113, "epoch": 2959} {"train_loss": -41.43709945678711, "global_step": 358114, "epoch": 2959} {"train_loss": -41.93260955810547, "global_step": 358115, "epoch": 2959} {"train_loss": -45.37858581542969, "global_step": 358116, "epoch": 2959} {"train_loss": -44.45512008666992, "global_step": 358117, "epoch": 2959} {"train_loss": -45.58998489379883, "global_step": 358118, "epoch": 2959} {"train_loss": -44.612117767333984, "global_step": 358119, "epoch": 2959} {"train_loss": -42.975860595703125, "global_step": 358120, "epoch": 2959} {"train_loss": -45.02265167236328, "global_step": 358121, "epoch": 2959} {"train_loss": -44.45400619506836, "global_step": 358122, "epoch": 2959} {"train_loss": -43.45741653442383, "global_step": 358123, "epoch": 2959} {"train_loss": -42.84833908081055, "global_step": 358124, "epoch": 2959} {"train_loss": -44.97018814086914, "global_step": 358125, "epoch": 2959} {"train_loss": -44.318782806396484, "global_step": 358126, "epoch": 2959} {"train_loss": -43.832786560058594, "global_step": 358127, "epoch": 2959} {"train_loss": -44.14936828613281, "global_step": 358128, "epoch": 2959} {"train_loss": -44.20367431640625, "global_step": 358129, "epoch": 2959} {"train_loss": -44.179771423339844, "global_step": 358130, "epoch": 2959} {"train_loss": -44.049110412597656, "global_step": 358131, "epoch": 2959} {"train_loss": -43.188812255859375, "global_step": 358132, "epoch": 2959} {"train_loss": -44.23303985595703, "global_step": 358133, "epoch": 2959} {"train_loss": -43.09490966796875, "global_step": 358134, "epoch": 2959} {"train_loss": -43.59844970703125, "global_step": 358135, "epoch": 2959} {"train_loss": -45.66341018676758, "global_step": 358136, "epoch": 2959} {"train_loss": -44.053680419921875, "global_step": 358137, "epoch": 2959} {"train_loss": -45.064571380615234, "global_step": 358138, "epoch": 2959} {"train_loss": -43.98077392578125, "global_step": 358139, "epoch": 2959} {"train_loss": -44.38220977783203, "global_step": 358140, "epoch": 2959} {"train_loss": -44.88294982910156, "global_step": 358141, "epoch": 2959} {"train_loss": -44.45448684692383, "global_step": 358142, "epoch": 2959} {"train_loss": -44.36356735229492, "global_step": 358143, "epoch": 2959} {"train_loss": -45.074520111083984, "global_step": 358144, "epoch": 2959} {"train_loss": -44.47603988647461, "global_step": 358145, "epoch": 2959} {"train_loss": -44.949989318847656, "global_step": 358146, "epoch": 2959} {"train_loss": -45.208980560302734, "global_step": 358147, "epoch": 2959} {"train_loss": -44.75577926635742, "global_step": 358148, "epoch": 2959} {"train_loss": -45.18526077270508, "global_step": 358149, "epoch": 2959} {"train_loss": -44.7282600402832, "global_step": 358150, "epoch": 2959} {"train_loss": -44.2567024230957, "global_step": 358151, "epoch": 2959} {"train_loss": -45.214351654052734, "global_step": 358152, "epoch": 2959} {"train_loss": -44.60615921020508, "global_step": 358153, "epoch": 2959} {"train_loss": -44.064640045166016, "global_step": 358154, "epoch": 2959} {"train_loss": -43.26040267944336, "global_step": 358155, "epoch": 2959} {"train_loss": -43.97631072998047, "global_step": 358156, "epoch": 2959} {"train_loss": -45.1985969543457, "global_step": 358157, "epoch": 2959} {"train_loss": -44.07680892944336, "global_step": 358158, "epoch": 2959} {"train_loss": -44.72454405225013, "global_step": 358159, "epoch": 2959, "val_loss": 2429015.75} {"train_loss": -44.165283203125, "global_step": 358160, "epoch": 2960} {"train_loss": -43.61445999145508, "global_step": 358161, "epoch": 2960} {"train_loss": -43.484107971191406, "global_step": 358162, "epoch": 2960} {"train_loss": -43.74430465698242, "global_step": 358163, "epoch": 2960} {"train_loss": -43.4510612487793, "global_step": 358164, "epoch": 2960} {"train_loss": -44.5527458190918, "global_step": 358165, "epoch": 2960} {"train_loss": -43.17477798461914, "global_step": 358166, "epoch": 2960} {"train_loss": -44.56365203857422, "global_step": 358167, "epoch": 2960} {"train_loss": -43.85464096069336, "global_step": 358168, "epoch": 2960} {"train_loss": -43.582801818847656, "global_step": 358169, "epoch": 2960} {"train_loss": -44.299251556396484, "global_step": 358170, "epoch": 2960} {"train_loss": -43.5337028503418, "global_step": 358171, "epoch": 2960} {"train_loss": -44.433040618896484, "global_step": 358172, "epoch": 2960} {"train_loss": -41.98476791381836, "global_step": 358173, "epoch": 2960} {"train_loss": -44.111263275146484, "global_step": 358174, "epoch": 2960} {"train_loss": -44.353824615478516, "global_step": 358175, "epoch": 2960} {"train_loss": -44.16822814941406, "global_step": 358176, "epoch": 2960} {"train_loss": -44.60969924926758, "global_step": 358177, "epoch": 2960} {"train_loss": -44.501678466796875, "global_step": 358178, "epoch": 2960} {"train_loss": -44.440956115722656, "global_step": 358179, "epoch": 2960} {"train_loss": -44.587982177734375, "global_step": 358180, "epoch": 2960} {"train_loss": -44.643104553222656, "global_step": 358181, "epoch": 2960} {"train_loss": -44.117916107177734, "global_step": 358182, "epoch": 2960} {"train_loss": -44.7937126159668, "global_step": 358183, "epoch": 2960} {"train_loss": -43.85382080078125, "global_step": 358184, "epoch": 2960} {"train_loss": -44.75407791137695, "global_step": 358185, "epoch": 2960} {"train_loss": -44.79190444946289, "global_step": 358186, "epoch": 2960} {"train_loss": -44.52922058105469, "global_step": 358187, "epoch": 2960} {"train_loss": -45.231109619140625, "global_step": 358188, "epoch": 2960} {"train_loss": -44.61397171020508, "global_step": 358189, "epoch": 2960} {"train_loss": -43.68886184692383, "global_step": 358190, "epoch": 2960} {"train_loss": -44.73377227783203, "global_step": 358191, "epoch": 2960} {"train_loss": -44.40859603881836, "global_step": 358192, "epoch": 2960} {"train_loss": -44.18973922729492, "global_step": 358193, "epoch": 2960} {"train_loss": -44.74038314819336, "global_step": 358194, "epoch": 2960} {"train_loss": -45.111873626708984, "global_step": 358195, "epoch": 2960} {"train_loss": -44.7209587097168, "global_step": 358196, "epoch": 2960} {"train_loss": -45.25236129760742, "global_step": 358197, "epoch": 2960} {"train_loss": -44.78622817993164, "global_step": 358198, "epoch": 2960} {"train_loss": -43.84595489501953, "global_step": 358199, "epoch": 2960} {"train_loss": -45.0025749206543, "global_step": 358200, "epoch": 2960} {"train_loss": -44.6972541809082, "global_step": 358201, "epoch": 2960} {"train_loss": -44.939125061035156, "global_step": 358202, "epoch": 2960} {"train_loss": -45.623268127441406, "global_step": 358203, "epoch": 2960} {"train_loss": -44.93767166137695, "global_step": 358204, "epoch": 2960} {"train_loss": -44.59522247314453, "global_step": 358205, "epoch": 2960} {"train_loss": -45.656532287597656, "global_step": 358206, "epoch": 2960} {"train_loss": -45.05062484741211, "global_step": 358207, "epoch": 2960} {"train_loss": -44.939453125, "global_step": 358208, "epoch": 2960} {"train_loss": -45.61980438232422, "global_step": 358209, "epoch": 2960} {"train_loss": -44.9060173034668, "global_step": 358210, "epoch": 2960} {"train_loss": -45.260711669921875, "global_step": 358211, "epoch": 2960} {"train_loss": -44.297706604003906, "global_step": 358212, "epoch": 2960} {"train_loss": -45.143165588378906, "global_step": 358213, "epoch": 2960} {"train_loss": -45.74675369262695, "global_step": 358214, "epoch": 2960} {"train_loss": -44.28571319580078, "global_step": 358215, "epoch": 2960} {"train_loss": -45.2867546081543, "global_step": 358216, "epoch": 2960} {"train_loss": -45.203773498535156, "global_step": 358217, "epoch": 2960} {"train_loss": -43.4311637878418, "global_step": 358218, "epoch": 2960} {"train_loss": -43.111663818359375, "global_step": 358219, "epoch": 2960} {"train_loss": -44.741050720214844, "global_step": 358220, "epoch": 2960} {"train_loss": -45.0440788269043, "global_step": 358221, "epoch": 2960} {"train_loss": -45.5091438293457, "global_step": 358222, "epoch": 2960} {"train_loss": -45.12085723876953, "global_step": 358223, "epoch": 2960} {"train_loss": -45.261539459228516, "global_step": 358224, "epoch": 2960} {"train_loss": -45.08810806274414, "global_step": 358225, "epoch": 2960} {"train_loss": -44.743675231933594, "global_step": 358226, "epoch": 2960} {"train_loss": -46.04917526245117, "global_step": 358227, "epoch": 2960} {"train_loss": -45.37820816040039, "global_step": 358228, "epoch": 2960} {"train_loss": -45.53114700317383, "global_step": 358229, "epoch": 2960} {"train_loss": -45.400390625, "global_step": 358230, "epoch": 2960} {"train_loss": -45.36484909057617, "global_step": 358231, "epoch": 2960} {"train_loss": -45.375152587890625, "global_step": 358232, "epoch": 2960} {"train_loss": -45.18013381958008, "global_step": 358233, "epoch": 2960} {"train_loss": -45.18134689331055, "global_step": 358234, "epoch": 2960} {"train_loss": -44.66421890258789, "global_step": 358235, "epoch": 2960} {"train_loss": -43.16255569458008, "global_step": 358236, "epoch": 2960} {"train_loss": -43.13473129272461, "global_step": 358237, "epoch": 2960} {"train_loss": -43.184326171875, "global_step": 358238, "epoch": 2960} {"train_loss": -45.07354736328125, "global_step": 358239, "epoch": 2960} {"train_loss": -44.50197219848633, "global_step": 358240, "epoch": 2960} {"train_loss": -42.95418167114258, "global_step": 358241, "epoch": 2960} {"train_loss": -43.63983917236328, "global_step": 358242, "epoch": 2960} {"train_loss": -45.71620559692383, "global_step": 358243, "epoch": 2960} {"train_loss": -44.3885383605957, "global_step": 358244, "epoch": 2960} {"train_loss": -42.58773422241211, "global_step": 358245, "epoch": 2960} {"train_loss": -41.091278076171875, "global_step": 358246, "epoch": 2960} {"train_loss": -44.58347702026367, "global_step": 358247, "epoch": 2960} {"train_loss": -38.87543487548828, "global_step": 358248, "epoch": 2960} {"train_loss": -42.759521484375, "global_step": 358249, "epoch": 2960} {"train_loss": -32.036861419677734, "global_step": 358250, "epoch": 2960} {"train_loss": -33.10687255859375, "global_step": 358251, "epoch": 2960} {"train_loss": -43.291805267333984, "global_step": 358252, "epoch": 2960} {"train_loss": -31.651752471923828, "global_step": 358253, "epoch": 2960} {"train_loss": -37.15130615234375, "global_step": 358254, "epoch": 2960} {"train_loss": -36.737464904785156, "global_step": 358255, "epoch": 2960} {"train_loss": -34.78974533081055, "global_step": 358256, "epoch": 2960} {"train_loss": -40.276180267333984, "global_step": 358257, "epoch": 2960} {"train_loss": -37.48249435424805, "global_step": 358258, "epoch": 2960} {"train_loss": -40.25691604614258, "global_step": 358259, "epoch": 2960} {"train_loss": -38.324859619140625, "global_step": 358260, "epoch": 2960} {"train_loss": -38.749446868896484, "global_step": 358261, "epoch": 2960} {"train_loss": -39.50849914550781, "global_step": 358262, "epoch": 2960} {"train_loss": -40.52802276611328, "global_step": 358263, "epoch": 2960} {"train_loss": -41.218360900878906, "global_step": 358264, "epoch": 2960} {"train_loss": -40.41001510620117, "global_step": 358265, "epoch": 2960} {"train_loss": -42.158058166503906, "global_step": 358266, "epoch": 2960} {"train_loss": -41.622432708740234, "global_step": 358267, "epoch": 2960} {"train_loss": -43.083431243896484, "global_step": 358268, "epoch": 2960} {"train_loss": -41.778560638427734, "global_step": 358269, "epoch": 2960} {"train_loss": -43.61820602416992, "global_step": 358270, "epoch": 2960} {"train_loss": -41.938133239746094, "global_step": 358271, "epoch": 2960} {"train_loss": -43.14254379272461, "global_step": 358272, "epoch": 2960} {"train_loss": -43.30971145629883, "global_step": 358273, "epoch": 2960} {"train_loss": -42.73322677612305, "global_step": 358274, "epoch": 2960} {"train_loss": -42.25939178466797, "global_step": 358275, "epoch": 2960} {"train_loss": -43.72768020629883, "global_step": 358276, "epoch": 2960} {"train_loss": -42.41314697265625, "global_step": 358277, "epoch": 2960} {"train_loss": -42.998836517333984, "global_step": 358278, "epoch": 2960} {"train_loss": -42.92692184448242, "global_step": 358279, "epoch": 2960} {"train_loss": -43.33439500666847, "global_step": 358280, "epoch": 2960, "val_loss": 2381253.25} {"train_loss": -43.17744064331055, "global_step": 358281, "epoch": 2961} {"train_loss": -44.3231315612793, "global_step": 358282, "epoch": 2961} {"train_loss": -43.52275085449219, "global_step": 358283, "epoch": 2961} {"train_loss": -43.84170150756836, "global_step": 358284, "epoch": 2961} {"train_loss": -44.05027770996094, "global_step": 358285, "epoch": 2961} {"train_loss": -44.20144271850586, "global_step": 358286, "epoch": 2961} {"train_loss": -43.47905349731445, "global_step": 358287, "epoch": 2961} {"train_loss": -44.53886795043945, "global_step": 358288, "epoch": 2961} {"train_loss": -44.17005157470703, "global_step": 358289, "epoch": 2961} {"train_loss": -43.839111328125, "global_step": 358290, "epoch": 2961} {"train_loss": -44.785858154296875, "global_step": 358291, "epoch": 2961} {"train_loss": -44.58256912231445, "global_step": 358292, "epoch": 2961} {"train_loss": -44.6657829284668, "global_step": 358293, "epoch": 2961} {"train_loss": -44.28522491455078, "global_step": 358294, "epoch": 2961} {"train_loss": -44.82631301879883, "global_step": 358295, "epoch": 2961} {"train_loss": -44.775211334228516, "global_step": 358296, "epoch": 2961} {"train_loss": -44.32194519042969, "global_step": 358297, "epoch": 2961} {"train_loss": -45.349700927734375, "global_step": 358298, "epoch": 2961} {"train_loss": -44.542396545410156, "global_step": 358299, "epoch": 2961} {"train_loss": -45.229915618896484, "global_step": 358300, "epoch": 2961} {"train_loss": -44.92951583862305, "global_step": 358301, "epoch": 2961} {"train_loss": -45.00704574584961, "global_step": 358302, "epoch": 2961} {"train_loss": -44.84555435180664, "global_step": 358303, "epoch": 2961} {"train_loss": -45.43256378173828, "global_step": 358304, "epoch": 2961} {"train_loss": -45.07588577270508, "global_step": 358305, "epoch": 2961} {"train_loss": -45.327396392822266, "global_step": 358306, "epoch": 2961} {"train_loss": -45.263763427734375, "global_step": 358307, "epoch": 2961} {"train_loss": -45.128517150878906, "global_step": 358308, "epoch": 2961} {"train_loss": -45.159278869628906, "global_step": 358309, "epoch": 2961} {"train_loss": -45.48366165161133, "global_step": 358310, "epoch": 2961} {"train_loss": -45.24735641479492, "global_step": 358311, "epoch": 2961} {"train_loss": -45.459835052490234, "global_step": 358312, "epoch": 2961} {"train_loss": -45.63323974609375, "global_step": 358313, "epoch": 2961} {"train_loss": -45.65953826904297, "global_step": 358314, "epoch": 2961} {"train_loss": -45.686866760253906, "global_step": 358315, "epoch": 2961} {"train_loss": -45.764156341552734, "global_step": 358316, "epoch": 2961} {"train_loss": -45.872013092041016, "global_step": 358317, "epoch": 2961} {"train_loss": -45.76436996459961, "global_step": 358318, "epoch": 2961} {"train_loss": -45.41122055053711, "global_step": 358319, "epoch": 2961} {"train_loss": -45.75443649291992, "global_step": 358320, "epoch": 2961} {"train_loss": -45.61367416381836, "global_step": 358321, "epoch": 2961} {"train_loss": -46.0560302734375, "global_step": 358322, "epoch": 2961} {"train_loss": -46.04533767700195, "global_step": 358323, "epoch": 2961} {"train_loss": -45.422237396240234, "global_step": 358324, "epoch": 2961} {"train_loss": -45.25309753417969, "global_step": 358325, "epoch": 2961} {"train_loss": -46.297271728515625, "global_step": 358326, "epoch": 2961} {"train_loss": -45.80996322631836, "global_step": 358327, "epoch": 2961} {"train_loss": -46.09025192260742, "global_step": 358328, "epoch": 2961} {"train_loss": -45.901214599609375, "global_step": 358329, "epoch": 2961} {"train_loss": -45.61137008666992, "global_step": 358330, "epoch": 2961} {"train_loss": -46.0112419128418, "global_step": 358331, "epoch": 2961} {"train_loss": -45.943843841552734, "global_step": 358332, "epoch": 2961} {"train_loss": -45.38572311401367, "global_step": 358333, "epoch": 2961} {"train_loss": -42.96087646484375, "global_step": 358334, "epoch": 2961} {"train_loss": -45.690677642822266, "global_step": 358335, "epoch": 2961} {"train_loss": -45.71182632446289, "global_step": 358336, "epoch": 2961} {"train_loss": -46.30596160888672, "global_step": 358337, "epoch": 2961} {"train_loss": -45.918392181396484, "global_step": 358338, "epoch": 2961} {"train_loss": -45.8343620300293, "global_step": 358339, "epoch": 2961} {"train_loss": -45.35236740112305, "global_step": 358340, "epoch": 2961} {"train_loss": -44.76703643798828, "global_step": 358341, "epoch": 2961} {"train_loss": -45.96564865112305, "global_step": 358342, "epoch": 2961} {"train_loss": -45.95414352416992, "global_step": 358343, "epoch": 2961} {"train_loss": -45.22422409057617, "global_step": 358344, "epoch": 2961} {"train_loss": -44.371246337890625, "global_step": 358345, "epoch": 2961} {"train_loss": -45.400146484375, "global_step": 358346, "epoch": 2961} {"train_loss": -46.04392623901367, "global_step": 358347, "epoch": 2961} {"train_loss": -44.4348030090332, "global_step": 358348, "epoch": 2961} {"train_loss": -44.04500961303711, "global_step": 358349, "epoch": 2961} {"train_loss": -45.309425354003906, "global_step": 358350, "epoch": 2961} {"train_loss": -45.820045471191406, "global_step": 358351, "epoch": 2961} {"train_loss": -45.01777267456055, "global_step": 358352, "epoch": 2961} {"train_loss": -44.472755432128906, "global_step": 358353, "epoch": 2961} {"train_loss": -45.30038070678711, "global_step": 358354, "epoch": 2961} {"train_loss": -45.62104034423828, "global_step": 358355, "epoch": 2961} {"train_loss": -42.20896530151367, "global_step": 358356, "epoch": 2961} {"train_loss": -43.81578063964844, "global_step": 358357, "epoch": 2961} {"train_loss": -45.290653228759766, "global_step": 358358, "epoch": 2961} {"train_loss": -44.27177810668945, "global_step": 358359, "epoch": 2961} {"train_loss": -42.608436584472656, "global_step": 358360, "epoch": 2961} {"train_loss": -45.02656173706055, "global_step": 358361, "epoch": 2961} {"train_loss": -42.290374755859375, "global_step": 358362, "epoch": 2961} {"train_loss": -41.55337142944336, "global_step": 358363, "epoch": 2961} {"train_loss": -39.02996063232422, "global_step": 358364, "epoch": 2961} {"train_loss": -42.438392639160156, "global_step": 358365, "epoch": 2961} {"train_loss": -40.670204162597656, "global_step": 358366, "epoch": 2961} {"train_loss": -42.56647491455078, "global_step": 358367, "epoch": 2961} {"train_loss": -42.59365463256836, "global_step": 358368, "epoch": 2961} {"train_loss": -41.88967514038086, "global_step": 358369, "epoch": 2961} {"train_loss": -44.55939865112305, "global_step": 358370, "epoch": 2961} {"train_loss": -42.89061737060547, "global_step": 358371, "epoch": 2961} {"train_loss": -43.40011215209961, "global_step": 358372, "epoch": 2961} {"train_loss": -38.770755767822266, "global_step": 358373, "epoch": 2961} {"train_loss": -27.796472549438477, "global_step": 358374, "epoch": 2961} {"train_loss": -36.88959503173828, "global_step": 358375, "epoch": 2961} {"train_loss": -41.61884689331055, "global_step": 358376, "epoch": 2961} {"train_loss": -39.53304672241211, "global_step": 358377, "epoch": 2961} {"train_loss": -27.351654052734375, "global_step": 358378, "epoch": 2961} {"train_loss": -34.169761657714844, "global_step": 358379, "epoch": 2961} {"train_loss": -24.828052520751953, "global_step": 358380, "epoch": 2961} {"train_loss": -37.40473556518555, "global_step": 358381, "epoch": 2961} {"train_loss": -38.7074089050293, "global_step": 358382, "epoch": 2961} {"train_loss": -34.1103515625, "global_step": 358383, "epoch": 2961} {"train_loss": -31.60743522644043, "global_step": 358384, "epoch": 2961} {"train_loss": -30.409826278686523, "global_step": 358385, "epoch": 2961} {"train_loss": -34.20759201049805, "global_step": 358386, "epoch": 2961} {"train_loss": -35.67804718017578, "global_step": 358387, "epoch": 2961} {"train_loss": -32.659698486328125, "global_step": 358388, "epoch": 2961} {"train_loss": -37.658260345458984, "global_step": 358389, "epoch": 2961} {"train_loss": -37.97284698486328, "global_step": 358390, "epoch": 2961} {"train_loss": -33.76868438720703, "global_step": 358391, "epoch": 2961} {"train_loss": -37.597904205322266, "global_step": 358392, "epoch": 2961} {"train_loss": -36.78742980957031, "global_step": 358393, "epoch": 2961} {"train_loss": -38.00421142578125, "global_step": 358394, "epoch": 2961} {"train_loss": -39.127540588378906, "global_step": 358395, "epoch": 2961} {"train_loss": -40.17719650268555, "global_step": 358396, "epoch": 2961} {"train_loss": -38.50559616088867, "global_step": 358397, "epoch": 2961} {"train_loss": -38.01968002319336, "global_step": 358398, "epoch": 2961} {"train_loss": -37.098636627197266, "global_step": 358399, "epoch": 2961} {"train_loss": -38.40625762939453, "global_step": 358400, "epoch": 2961} {"train_loss": -42.56315327478834, "global_step": 358401, "epoch": 2961, "val_loss": 2845350.75} {"train_loss": -39.65793991088867, "global_step": 358402, "epoch": 2962} {"train_loss": -40.89251708984375, "global_step": 358403, "epoch": 2962} {"train_loss": -41.04414749145508, "global_step": 358404, "epoch": 2962} {"train_loss": -40.482608795166016, "global_step": 358405, "epoch": 2962} {"train_loss": -41.4399299621582, "global_step": 358406, "epoch": 2962} {"train_loss": -40.71574020385742, "global_step": 358407, "epoch": 2962} {"train_loss": -39.4101676940918, "global_step": 358408, "epoch": 2962} {"train_loss": -39.68088912963867, "global_step": 358409, "epoch": 2962} {"train_loss": -41.372833251953125, "global_step": 358410, "epoch": 2962} {"train_loss": -41.24604034423828, "global_step": 358411, "epoch": 2962} {"train_loss": -41.69428634643555, "global_step": 358412, "epoch": 2962} {"train_loss": -42.40745544433594, "global_step": 358413, "epoch": 2962} {"train_loss": -41.36578369140625, "global_step": 358414, "epoch": 2962} {"train_loss": -40.27291488647461, "global_step": 358415, "epoch": 2962} {"train_loss": -42.17538070678711, "global_step": 358416, "epoch": 2962} {"train_loss": -41.923831939697266, "global_step": 358417, "epoch": 2962} {"train_loss": -41.704002380371094, "global_step": 358418, "epoch": 2962} {"train_loss": -42.25932693481445, "global_step": 358419, "epoch": 2962} {"train_loss": -41.9094352722168, "global_step": 358420, "epoch": 2962} {"train_loss": -40.64130401611328, "global_step": 358421, "epoch": 2962} {"train_loss": -42.0652961730957, "global_step": 358422, "epoch": 2962} {"train_loss": -41.37000274658203, "global_step": 358423, "epoch": 2962} {"train_loss": -41.51737594604492, "global_step": 358424, "epoch": 2962} {"train_loss": -42.14650344848633, "global_step": 358425, "epoch": 2962} {"train_loss": -41.17647933959961, "global_step": 358426, "epoch": 2962} {"train_loss": -42.29671859741211, "global_step": 358427, "epoch": 2962} {"train_loss": -42.75602340698242, "global_step": 358428, "epoch": 2962} {"train_loss": -42.224647521972656, "global_step": 358429, "epoch": 2962} {"train_loss": -42.3740119934082, "global_step": 358430, "epoch": 2962} {"train_loss": -42.15945053100586, "global_step": 358431, "epoch": 2962} {"train_loss": -41.881507873535156, "global_step": 358432, "epoch": 2962} {"train_loss": -42.871009826660156, "global_step": 358433, "epoch": 2962} {"train_loss": -42.419410705566406, "global_step": 358434, "epoch": 2962} {"train_loss": -43.05244445800781, "global_step": 358435, "epoch": 2962} {"train_loss": -42.28093719482422, "global_step": 358436, "epoch": 2962} {"train_loss": -43.96687698364258, "global_step": 358437, "epoch": 2962} {"train_loss": -43.303192138671875, "global_step": 358438, "epoch": 2962} {"train_loss": -43.126216888427734, "global_step": 358439, "epoch": 2962} {"train_loss": -43.13847732543945, "global_step": 358440, "epoch": 2962} {"train_loss": -43.846858978271484, "global_step": 358441, "epoch": 2962} {"train_loss": -44.03129196166992, "global_step": 358442, "epoch": 2962} {"train_loss": -43.712623596191406, "global_step": 358443, "epoch": 2962} {"train_loss": -43.48920440673828, "global_step": 358444, "epoch": 2962} {"train_loss": -43.955440521240234, "global_step": 358445, "epoch": 2962} {"train_loss": -43.977840423583984, "global_step": 358446, "epoch": 2962} {"train_loss": -43.28988265991211, "global_step": 358447, "epoch": 2962} {"train_loss": -44.30672836303711, "global_step": 358448, "epoch": 2962} {"train_loss": -43.950069427490234, "global_step": 358449, "epoch": 2962} {"train_loss": -43.82634735107422, "global_step": 358450, "epoch": 2962} {"train_loss": -42.7059211730957, "global_step": 358451, "epoch": 2962} {"train_loss": -44.05963134765625, "global_step": 358452, "epoch": 2962} {"train_loss": -43.18624496459961, "global_step": 358453, "epoch": 2962} {"train_loss": -44.36553192138672, "global_step": 358454, "epoch": 2962} {"train_loss": -43.67429733276367, "global_step": 358455, "epoch": 2962} {"train_loss": -43.56844711303711, "global_step": 358456, "epoch": 2962} {"train_loss": -43.637847900390625, "global_step": 358457, "epoch": 2962} {"train_loss": -44.39670944213867, "global_step": 358458, "epoch": 2962} {"train_loss": -44.13883590698242, "global_step": 358459, "epoch": 2962} {"train_loss": -43.58539962768555, "global_step": 358460, "epoch": 2962} {"train_loss": -44.12358474731445, "global_step": 358461, "epoch": 2962} {"train_loss": -43.93134689331055, "global_step": 358462, "epoch": 2962} {"train_loss": -44.72831344604492, "global_step": 358463, "epoch": 2962} {"train_loss": -43.70254135131836, "global_step": 358464, "epoch": 2962} {"train_loss": -43.798492431640625, "global_step": 358465, "epoch": 2962} {"train_loss": -43.73975372314453, "global_step": 358466, "epoch": 2962} {"train_loss": -44.228660583496094, "global_step": 358467, "epoch": 2962} {"train_loss": -44.58977127075195, "global_step": 358468, "epoch": 2962} {"train_loss": -43.2530632019043, "global_step": 358469, "epoch": 2962} {"train_loss": -44.56346130371094, "global_step": 358470, "epoch": 2962} {"train_loss": -44.38088607788086, "global_step": 358471, "epoch": 2962} {"train_loss": -44.3200569152832, "global_step": 358472, "epoch": 2962} {"train_loss": -44.17411804199219, "global_step": 358473, "epoch": 2962} {"train_loss": -43.57378005981445, "global_step": 358474, "epoch": 2962} {"train_loss": -44.6396598815918, "global_step": 358475, "epoch": 2962} {"train_loss": -44.611488342285156, "global_step": 358476, "epoch": 2962} {"train_loss": -44.84413528442383, "global_step": 358477, "epoch": 2962} {"train_loss": -45.24691390991211, "global_step": 358478, "epoch": 2962} {"train_loss": -45.00188064575195, "global_step": 358479, "epoch": 2962} {"train_loss": -45.38227844238281, "global_step": 358480, "epoch": 2962} {"train_loss": -44.51123809814453, "global_step": 358481, "epoch": 2962} {"train_loss": -43.20808029174805, "global_step": 358482, "epoch": 2962} {"train_loss": -45.436378479003906, "global_step": 358483, "epoch": 2962} {"train_loss": -45.31354904174805, "global_step": 358484, "epoch": 2962} {"train_loss": -44.47184371948242, "global_step": 358485, "epoch": 2962} {"train_loss": -44.73749923706055, "global_step": 358486, "epoch": 2962} {"train_loss": -43.661624908447266, "global_step": 358487, "epoch": 2962} {"train_loss": -43.84650802612305, "global_step": 358488, "epoch": 2962} {"train_loss": -44.4505500793457, "global_step": 358489, "epoch": 2962} {"train_loss": -44.29557418823242, "global_step": 358490, "epoch": 2962} {"train_loss": -44.78443145751953, "global_step": 358491, "epoch": 2962} {"train_loss": -43.97725296020508, "global_step": 358492, "epoch": 2962} {"train_loss": -45.166316986083984, "global_step": 358493, "epoch": 2962} {"train_loss": -44.50922393798828, "global_step": 358494, "epoch": 2962} {"train_loss": -45.74343490600586, "global_step": 358495, "epoch": 2962} {"train_loss": -44.91305160522461, "global_step": 358496, "epoch": 2962} {"train_loss": -45.05686950683594, "global_step": 358497, "epoch": 2962} {"train_loss": -45.12691879272461, "global_step": 358498, "epoch": 2962} {"train_loss": -45.13749313354492, "global_step": 358499, "epoch": 2962} {"train_loss": -44.5814208984375, "global_step": 358500, "epoch": 2962} {"train_loss": -45.041561126708984, "global_step": 358501, "epoch": 2962} {"train_loss": -44.81797790527344, "global_step": 358502, "epoch": 2962} {"train_loss": -44.46311569213867, "global_step": 358503, "epoch": 2962} {"train_loss": -45.048187255859375, "global_step": 358504, "epoch": 2962} {"train_loss": -45.06450271606445, "global_step": 358505, "epoch": 2962} {"train_loss": -44.00617599487305, "global_step": 358506, "epoch": 2962} {"train_loss": -43.7342529296875, "global_step": 358507, "epoch": 2962} {"train_loss": -45.36161422729492, "global_step": 358508, "epoch": 2962} {"train_loss": -43.453834533691406, "global_step": 358509, "epoch": 2962} {"train_loss": -42.50252151489258, "global_step": 358510, "epoch": 2962} {"train_loss": -43.28383255004883, "global_step": 358511, "epoch": 2962} {"train_loss": -43.13534164428711, "global_step": 358512, "epoch": 2962} {"train_loss": -41.7054557800293, "global_step": 358513, "epoch": 2962} {"train_loss": -41.23006057739258, "global_step": 358514, "epoch": 2962} {"train_loss": -44.90138626098633, "global_step": 358515, "epoch": 2962} {"train_loss": -43.8041877746582, "global_step": 358516, "epoch": 2962} {"train_loss": -44.32499313354492, "global_step": 358517, "epoch": 2962} {"train_loss": -44.09554672241211, "global_step": 358518, "epoch": 2962} {"train_loss": -42.957942962646484, "global_step": 358519, "epoch": 2962} {"train_loss": -43.95529556274414, "global_step": 358520, "epoch": 2962} {"train_loss": -44.313026428222656, "global_step": 358521, "epoch": 2962} {"train_loss": -43.38358180779071, "global_step": 358522, "epoch": 2962, "val_loss": 2380081.0} {"train_loss": -44.69331741333008, "global_step": 358523, "epoch": 2963} {"train_loss": -44.535057067871094, "global_step": 358524, "epoch": 2963} {"train_loss": -44.00956344604492, "global_step": 358525, "epoch": 2963} {"train_loss": -44.16283416748047, "global_step": 358526, "epoch": 2963} {"train_loss": -41.9451904296875, "global_step": 358527, "epoch": 2963} {"train_loss": -42.55082321166992, "global_step": 358528, "epoch": 2963} {"train_loss": -44.349239349365234, "global_step": 358529, "epoch": 2963} {"train_loss": -42.30084228515625, "global_step": 358530, "epoch": 2963} {"train_loss": -41.293949127197266, "global_step": 358531, "epoch": 2963} {"train_loss": -43.01386642456055, "global_step": 358532, "epoch": 2963} {"train_loss": -40.48191452026367, "global_step": 358533, "epoch": 2963} {"train_loss": -43.500328063964844, "global_step": 358534, "epoch": 2963} {"train_loss": -40.90302658081055, "global_step": 358535, "epoch": 2963} {"train_loss": -41.48429870605469, "global_step": 358536, "epoch": 2963} {"train_loss": -43.9071044921875, "global_step": 358537, "epoch": 2963} {"train_loss": -40.926204681396484, "global_step": 358538, "epoch": 2963} {"train_loss": -42.67589569091797, "global_step": 358539, "epoch": 2963} {"train_loss": -43.8505973815918, "global_step": 358540, "epoch": 2963} {"train_loss": -43.902137756347656, "global_step": 358541, "epoch": 2963} {"train_loss": -43.85097122192383, "global_step": 358542, "epoch": 2963} {"train_loss": -43.95768356323242, "global_step": 358543, "epoch": 2963} {"train_loss": -44.150543212890625, "global_step": 358544, "epoch": 2963} {"train_loss": -43.985164642333984, "global_step": 358545, "epoch": 2963} {"train_loss": -44.2859992980957, "global_step": 358546, "epoch": 2963} {"train_loss": -43.413116455078125, "global_step": 358547, "epoch": 2963} {"train_loss": -43.723697662353516, "global_step": 358548, "epoch": 2963} {"train_loss": -44.09823226928711, "global_step": 358549, "epoch": 2963} {"train_loss": -42.715511322021484, "global_step": 358550, "epoch": 2963} {"train_loss": -43.22611618041992, "global_step": 358551, "epoch": 2963} {"train_loss": -43.61509323120117, "global_step": 358552, "epoch": 2963} {"train_loss": -44.62881088256836, "global_step": 358553, "epoch": 2963} {"train_loss": -44.53792953491211, "global_step": 358554, "epoch": 2963} {"train_loss": -44.0557746887207, "global_step": 358555, "epoch": 2963} {"train_loss": -43.33766555786133, "global_step": 358556, "epoch": 2963} {"train_loss": -45.04505157470703, "global_step": 358557, "epoch": 2963} {"train_loss": -44.53472900390625, "global_step": 358558, "epoch": 2963} {"train_loss": -44.63064956665039, "global_step": 358559, "epoch": 2963} {"train_loss": -44.86656188964844, "global_step": 358560, "epoch": 2963} {"train_loss": -44.642189025878906, "global_step": 358561, "epoch": 2963} {"train_loss": -44.60080337524414, "global_step": 358562, "epoch": 2963} {"train_loss": -43.998409271240234, "global_step": 358563, "epoch": 2963} {"train_loss": -44.426788330078125, "global_step": 358564, "epoch": 2963} {"train_loss": -44.57245635986328, "global_step": 358565, "epoch": 2963} {"train_loss": -44.252193450927734, "global_step": 358566, "epoch": 2963} {"train_loss": -43.55617904663086, "global_step": 358567, "epoch": 2963} {"train_loss": -44.74763870239258, "global_step": 358568, "epoch": 2963} {"train_loss": -43.2924919128418, "global_step": 358569, "epoch": 2963} {"train_loss": -43.278106689453125, "global_step": 358570, "epoch": 2963} {"train_loss": -43.9745979309082, "global_step": 358571, "epoch": 2963} {"train_loss": -43.54589080810547, "global_step": 358572, "epoch": 2963} {"train_loss": -43.24597930908203, "global_step": 358573, "epoch": 2963} {"train_loss": -44.7366828918457, "global_step": 358574, "epoch": 2963} {"train_loss": -44.260963439941406, "global_step": 358575, "epoch": 2963} {"train_loss": -44.63129806518555, "global_step": 358576, "epoch": 2963} {"train_loss": -44.3893928527832, "global_step": 358577, "epoch": 2963} {"train_loss": -44.321136474609375, "global_step": 358578, "epoch": 2963} {"train_loss": -44.40237808227539, "global_step": 358579, "epoch": 2963} {"train_loss": -44.789791107177734, "global_step": 358580, "epoch": 2963} {"train_loss": -44.342872619628906, "global_step": 358581, "epoch": 2963} {"train_loss": -44.24802780151367, "global_step": 358582, "epoch": 2963} {"train_loss": -43.24636459350586, "global_step": 358583, "epoch": 2963} {"train_loss": -43.69206237792969, "global_step": 358584, "epoch": 2963} {"train_loss": -44.57957077026367, "global_step": 358585, "epoch": 2963} {"train_loss": -42.6057014465332, "global_step": 358586, "epoch": 2963} {"train_loss": -43.44097137451172, "global_step": 358587, "epoch": 2963} {"train_loss": -43.93828201293945, "global_step": 358588, "epoch": 2963} {"train_loss": -41.80971908569336, "global_step": 358589, "epoch": 2963} {"train_loss": -44.07072067260742, "global_step": 358590, "epoch": 2963} {"train_loss": -42.84003448486328, "global_step": 358591, "epoch": 2963} {"train_loss": -42.77897644042969, "global_step": 358592, "epoch": 2963} {"train_loss": -43.68996047973633, "global_step": 358593, "epoch": 2963} {"train_loss": -41.821712493896484, "global_step": 358594, "epoch": 2963} {"train_loss": -43.88383102416992, "global_step": 358595, "epoch": 2963} {"train_loss": -43.597408294677734, "global_step": 358596, "epoch": 2963} {"train_loss": -44.28623580932617, "global_step": 358597, "epoch": 2963} {"train_loss": -43.21912384033203, "global_step": 358598, "epoch": 2963} {"train_loss": -43.58402633666992, "global_step": 358599, "epoch": 2963} {"train_loss": -44.3062858581543, "global_step": 358600, "epoch": 2963} {"train_loss": -44.32444381713867, "global_step": 358601, "epoch": 2963} {"train_loss": -43.97479248046875, "global_step": 358602, "epoch": 2963} {"train_loss": -42.88063430786133, "global_step": 358603, "epoch": 2963} {"train_loss": -44.196868896484375, "global_step": 358604, "epoch": 2963} {"train_loss": -43.323612213134766, "global_step": 358605, "epoch": 2963} {"train_loss": -43.473175048828125, "global_step": 358606, "epoch": 2963} {"train_loss": -44.18910217285156, "global_step": 358607, "epoch": 2963} {"train_loss": -44.25309371948242, "global_step": 358608, "epoch": 2963} {"train_loss": -44.528621673583984, "global_step": 358609, "epoch": 2963} {"train_loss": -44.11325454711914, "global_step": 358610, "epoch": 2963} {"train_loss": -44.40473556518555, "global_step": 358611, "epoch": 2963} {"train_loss": -43.68149948120117, "global_step": 358612, "epoch": 2963} {"train_loss": -44.38602066040039, "global_step": 358613, "epoch": 2963} {"train_loss": -43.59058380126953, "global_step": 358614, "epoch": 2963} {"train_loss": -44.242401123046875, "global_step": 358615, "epoch": 2963} {"train_loss": -44.313114166259766, "global_step": 358616, "epoch": 2963} {"train_loss": -44.156959533691406, "global_step": 358617, "epoch": 2963} {"train_loss": -44.47477340698242, "global_step": 358618, "epoch": 2963} {"train_loss": -42.98828125, "global_step": 358619, "epoch": 2963} {"train_loss": -44.145565032958984, "global_step": 358620, "epoch": 2963} {"train_loss": -43.69035339355469, "global_step": 358621, "epoch": 2963} {"train_loss": -44.150691986083984, "global_step": 358622, "epoch": 2963} {"train_loss": -42.44169616699219, "global_step": 358623, "epoch": 2963} {"train_loss": -42.99690246582031, "global_step": 358624, "epoch": 2963} {"train_loss": -43.058536529541016, "global_step": 358625, "epoch": 2963} {"train_loss": -44.542999267578125, "global_step": 358626, "epoch": 2963} {"train_loss": -43.84498596191406, "global_step": 358627, "epoch": 2963} {"train_loss": -43.93955612182617, "global_step": 358628, "epoch": 2963} {"train_loss": -43.27301025390625, "global_step": 358629, "epoch": 2963} {"train_loss": -44.64370346069336, "global_step": 358630, "epoch": 2963} {"train_loss": -44.29179000854492, "global_step": 358631, "epoch": 2963} {"train_loss": -44.33232116699219, "global_step": 358632, "epoch": 2963} {"train_loss": -44.693111419677734, "global_step": 358633, "epoch": 2963} {"train_loss": -44.123653411865234, "global_step": 358634, "epoch": 2963} {"train_loss": -44.56007766723633, "global_step": 358635, "epoch": 2963} {"train_loss": -43.595027923583984, "global_step": 358636, "epoch": 2963} {"train_loss": -43.76096725463867, "global_step": 358637, "epoch": 2963} {"train_loss": -43.964683532714844, "global_step": 358638, "epoch": 2963} {"train_loss": -44.42332458496094, "global_step": 358639, "epoch": 2963} {"train_loss": -43.800506591796875, "global_step": 358640, "epoch": 2963} {"train_loss": -44.7406005859375, "global_step": 358641, "epoch": 2963} {"train_loss": -43.5972900390625, "global_step": 358642, "epoch": 2963} {"train_loss": -43.7438617422561, "global_step": 358643, "epoch": 2963, "val_loss": 2425377.5} {"train_loss": -42.85873794555664, "global_step": 358644, "epoch": 2964} {"train_loss": -43.25676727294922, "global_step": 358645, "epoch": 2964} {"train_loss": -43.93385696411133, "global_step": 358646, "epoch": 2964} {"train_loss": -43.6439323425293, "global_step": 358647, "epoch": 2964} {"train_loss": -42.764373779296875, "global_step": 358648, "epoch": 2964} {"train_loss": -42.65040969848633, "global_step": 358649, "epoch": 2964} {"train_loss": -44.267921447753906, "global_step": 358650, "epoch": 2964} {"train_loss": -44.2960319519043, "global_step": 358651, "epoch": 2964} {"train_loss": -44.012969970703125, "global_step": 358652, "epoch": 2964} {"train_loss": -41.86831283569336, "global_step": 358653, "epoch": 2964} {"train_loss": -44.20876693725586, "global_step": 358654, "epoch": 2964} {"train_loss": -43.52704620361328, "global_step": 358655, "epoch": 2964} {"train_loss": -43.47378921508789, "global_step": 358656, "epoch": 2964} {"train_loss": -44.156959533691406, "global_step": 358657, "epoch": 2964} {"train_loss": -44.28181457519531, "global_step": 358658, "epoch": 2964} {"train_loss": -44.303466796875, "global_step": 358659, "epoch": 2964} {"train_loss": -43.5505485534668, "global_step": 358660, "epoch": 2964} {"train_loss": -44.56476593017578, "global_step": 358661, "epoch": 2964} {"train_loss": -44.4444465637207, "global_step": 358662, "epoch": 2964} {"train_loss": -44.3841667175293, "global_step": 358663, "epoch": 2964} {"train_loss": -44.98736572265625, "global_step": 358664, "epoch": 2964} {"train_loss": -44.78741455078125, "global_step": 358665, "epoch": 2964} {"train_loss": -44.83205032348633, "global_step": 358666, "epoch": 2964} {"train_loss": -44.742767333984375, "global_step": 358667, "epoch": 2964} {"train_loss": -44.35478591918945, "global_step": 358668, "epoch": 2964} {"train_loss": -45.19697952270508, "global_step": 358669, "epoch": 2964} {"train_loss": -44.881591796875, "global_step": 358670, "epoch": 2964} {"train_loss": -43.709991455078125, "global_step": 358671, "epoch": 2964} {"train_loss": -43.78272247314453, "global_step": 358672, "epoch": 2964} {"train_loss": -44.48197937011719, "global_step": 358673, "epoch": 2964} {"train_loss": -44.90590286254883, "global_step": 358674, "epoch": 2964} {"train_loss": -45.230926513671875, "global_step": 358675, "epoch": 2964} {"train_loss": -44.785804748535156, "global_step": 358676, "epoch": 2964} {"train_loss": -44.89767074584961, "global_step": 358677, "epoch": 2964} {"train_loss": -45.132080078125, "global_step": 358678, "epoch": 2964} {"train_loss": -44.79248809814453, "global_step": 358679, "epoch": 2964} {"train_loss": -44.91171646118164, "global_step": 358680, "epoch": 2964} {"train_loss": -45.25254821777344, "global_step": 358681, "epoch": 2964} {"train_loss": -44.78154754638672, "global_step": 358682, "epoch": 2964} {"train_loss": -44.94980239868164, "global_step": 358683, "epoch": 2964} {"train_loss": -44.003944396972656, "global_step": 358684, "epoch": 2964} {"train_loss": -45.13514709472656, "global_step": 358685, "epoch": 2964} {"train_loss": -44.89529037475586, "global_step": 358686, "epoch": 2964} {"train_loss": -44.05005645751953, "global_step": 358687, "epoch": 2964} {"train_loss": -43.19623947143555, "global_step": 358688, "epoch": 2964} {"train_loss": -44.76137924194336, "global_step": 358689, "epoch": 2964} {"train_loss": -44.21084213256836, "global_step": 358690, "epoch": 2964} {"train_loss": -43.18455123901367, "global_step": 358691, "epoch": 2964} {"train_loss": -42.91380310058594, "global_step": 358692, "epoch": 2964} {"train_loss": -44.404964447021484, "global_step": 358693, "epoch": 2964} {"train_loss": -44.691864013671875, "global_step": 358694, "epoch": 2964} {"train_loss": -43.500736236572266, "global_step": 358695, "epoch": 2964} {"train_loss": -43.57017135620117, "global_step": 358696, "epoch": 2964} {"train_loss": -44.83557891845703, "global_step": 358697, "epoch": 2964} {"train_loss": -44.31280517578125, "global_step": 358698, "epoch": 2964} {"train_loss": -44.80289840698242, "global_step": 358699, "epoch": 2964} {"train_loss": -44.368072509765625, "global_step": 358700, "epoch": 2964} {"train_loss": -44.54378890991211, "global_step": 358701, "epoch": 2964} {"train_loss": -44.71689987182617, "global_step": 358702, "epoch": 2964} {"train_loss": -44.71368408203125, "global_step": 358703, "epoch": 2964} {"train_loss": -44.60274124145508, "global_step": 358704, "epoch": 2964} {"train_loss": -43.45792770385742, "global_step": 358705, "epoch": 2964} {"train_loss": -44.29396057128906, "global_step": 358706, "epoch": 2964} {"train_loss": -44.013092041015625, "global_step": 358707, "epoch": 2964} {"train_loss": -45.04429244995117, "global_step": 358708, "epoch": 2964} {"train_loss": -42.92142868041992, "global_step": 358709, "epoch": 2964} {"train_loss": -43.651668548583984, "global_step": 358710, "epoch": 2964} {"train_loss": -44.238887786865234, "global_step": 358711, "epoch": 2964} {"train_loss": -43.99555587768555, "global_step": 358712, "epoch": 2964} {"train_loss": -43.45620346069336, "global_step": 358713, "epoch": 2964} {"train_loss": -44.086605072021484, "global_step": 358714, "epoch": 2964} {"train_loss": -43.91757583618164, "global_step": 358715, "epoch": 2964} {"train_loss": -43.49560546875, "global_step": 358716, "epoch": 2964} {"train_loss": -43.781612396240234, "global_step": 358717, "epoch": 2964} {"train_loss": -43.033729553222656, "global_step": 358718, "epoch": 2964} {"train_loss": -41.89221954345703, "global_step": 358719, "epoch": 2964} {"train_loss": -44.924442291259766, "global_step": 358720, "epoch": 2964} {"train_loss": -43.60128402709961, "global_step": 358721, "epoch": 2964} {"train_loss": -43.079463958740234, "global_step": 358722, "epoch": 2964} {"train_loss": -44.82497787475586, "global_step": 358723, "epoch": 2964} {"train_loss": -44.10395431518555, "global_step": 358724, "epoch": 2964} {"train_loss": -43.556087493896484, "global_step": 358725, "epoch": 2964} {"train_loss": -44.98301315307617, "global_step": 358726, "epoch": 2964} {"train_loss": -44.50547409057617, "global_step": 358727, "epoch": 2964} {"train_loss": -43.80086898803711, "global_step": 358728, "epoch": 2964} {"train_loss": -44.61862564086914, "global_step": 358729, "epoch": 2964} {"train_loss": -43.13193893432617, "global_step": 358730, "epoch": 2964} {"train_loss": -44.34186935424805, "global_step": 358731, "epoch": 2964} {"train_loss": -44.66064453125, "global_step": 358732, "epoch": 2964} {"train_loss": -44.076351165771484, "global_step": 358733, "epoch": 2964} {"train_loss": -45.224910736083984, "global_step": 358734, "epoch": 2964} {"train_loss": -44.509063720703125, "global_step": 358735, "epoch": 2964} {"train_loss": -44.96311569213867, "global_step": 358736, "epoch": 2964} {"train_loss": -45.09059524536133, "global_step": 358737, "epoch": 2964} {"train_loss": -45.142127990722656, "global_step": 358738, "epoch": 2964} {"train_loss": -44.849281311035156, "global_step": 358739, "epoch": 2964} {"train_loss": -45.35963439941406, "global_step": 358740, "epoch": 2964} {"train_loss": -44.37362289428711, "global_step": 358741, "epoch": 2964} {"train_loss": -45.32164764404297, "global_step": 358742, "epoch": 2964} {"train_loss": -45.31736373901367, "global_step": 358743, "epoch": 2964} {"train_loss": -44.043846130371094, "global_step": 358744, "epoch": 2964} {"train_loss": -45.431114196777344, "global_step": 358745, "epoch": 2964} {"train_loss": -44.837493896484375, "global_step": 358746, "epoch": 2964} {"train_loss": -44.117557525634766, "global_step": 358747, "epoch": 2964} {"train_loss": -45.49203109741211, "global_step": 358748, "epoch": 2964} {"train_loss": -45.02106475830078, "global_step": 358749, "epoch": 2964} {"train_loss": -45.42279052734375, "global_step": 358750, "epoch": 2964} {"train_loss": -44.9708251953125, "global_step": 358751, "epoch": 2964} {"train_loss": -45.57107925415039, "global_step": 358752, "epoch": 2964} {"train_loss": -44.75252914428711, "global_step": 358753, "epoch": 2964} {"train_loss": -43.85710144042969, "global_step": 358754, "epoch": 2964} {"train_loss": -43.84412384033203, "global_step": 358755, "epoch": 2964} {"train_loss": -44.93135452270508, "global_step": 358756, "epoch": 2964} {"train_loss": -43.67340850830078, "global_step": 358757, "epoch": 2964} {"train_loss": -43.42201614379883, "global_step": 358758, "epoch": 2964} {"train_loss": -44.712345123291016, "global_step": 358759, "epoch": 2964} {"train_loss": -43.9261474609375, "global_step": 358760, "epoch": 2964} {"train_loss": -41.822628021240234, "global_step": 358761, "epoch": 2964} {"train_loss": -43.638641357421875, "global_step": 358762, "epoch": 2964} {"train_loss": -44.89226531982422, "global_step": 358763, "epoch": 2964} {"train_loss": -44.25549228132264, "global_step": 358764, "epoch": 2964, "val_loss": 2414756.75} {"train_loss": -43.34278106689453, "global_step": 358765, "epoch": 2965} {"train_loss": -45.20904541015625, "global_step": 358766, "epoch": 2965} {"train_loss": -43.849849700927734, "global_step": 358767, "epoch": 2965} {"train_loss": -44.29353713989258, "global_step": 358768, "epoch": 2965} {"train_loss": -42.36075210571289, "global_step": 358769, "epoch": 2965} {"train_loss": -43.67951583862305, "global_step": 358770, "epoch": 2965} {"train_loss": -40.26544952392578, "global_step": 358771, "epoch": 2965} {"train_loss": -44.83879470825195, "global_step": 358772, "epoch": 2965} {"train_loss": -39.86676788330078, "global_step": 358773, "epoch": 2965} {"train_loss": -44.54011154174805, "global_step": 358774, "epoch": 2965} {"train_loss": -39.23818588256836, "global_step": 358775, "epoch": 2965} {"train_loss": -44.53651428222656, "global_step": 358776, "epoch": 2965} {"train_loss": -41.19533157348633, "global_step": 358777, "epoch": 2965} {"train_loss": -44.06585693359375, "global_step": 358778, "epoch": 2965} {"train_loss": -39.551456451416016, "global_step": 358779, "epoch": 2965} {"train_loss": -42.8812141418457, "global_step": 358780, "epoch": 2965} {"train_loss": -40.6481819152832, "global_step": 358781, "epoch": 2965} {"train_loss": -42.89705276489258, "global_step": 358782, "epoch": 2965} {"train_loss": -41.73259735107422, "global_step": 358783, "epoch": 2965} {"train_loss": -44.378623962402344, "global_step": 358784, "epoch": 2965} {"train_loss": -42.628536224365234, "global_step": 358785, "epoch": 2965} {"train_loss": -44.1387825012207, "global_step": 358786, "epoch": 2965} {"train_loss": -43.6594123840332, "global_step": 358787, "epoch": 2965} {"train_loss": -43.63869094848633, "global_step": 358788, "epoch": 2965} {"train_loss": -44.24654006958008, "global_step": 358789, "epoch": 2965} {"train_loss": -44.306640625, "global_step": 358790, "epoch": 2965} {"train_loss": -44.51240921020508, "global_step": 358791, "epoch": 2965} {"train_loss": -43.45018768310547, "global_step": 358792, "epoch": 2965} {"train_loss": -44.800106048583984, "global_step": 358793, "epoch": 2965} {"train_loss": -42.66217803955078, "global_step": 358794, "epoch": 2965} {"train_loss": -44.896419525146484, "global_step": 358795, "epoch": 2965} {"train_loss": -43.38093948364258, "global_step": 358796, "epoch": 2965} {"train_loss": -44.67689895629883, "global_step": 358797, "epoch": 2965} {"train_loss": -43.826210021972656, "global_step": 358798, "epoch": 2965} {"train_loss": -44.97935485839844, "global_step": 358799, "epoch": 2965} {"train_loss": -44.62203598022461, "global_step": 358800, "epoch": 2965} {"train_loss": -44.58290481567383, "global_step": 358801, "epoch": 2965} {"train_loss": -44.62863540649414, "global_step": 358802, "epoch": 2965} {"train_loss": -44.94610595703125, "global_step": 358803, "epoch": 2965} {"train_loss": -44.6876220703125, "global_step": 358804, "epoch": 2965} {"train_loss": -44.61262130737305, "global_step": 358805, "epoch": 2965} {"train_loss": -45.269264221191406, "global_step": 358806, "epoch": 2965} {"train_loss": -44.732826232910156, "global_step": 358807, "epoch": 2965} {"train_loss": -45.13930892944336, "global_step": 358808, "epoch": 2965} {"train_loss": -44.78208923339844, "global_step": 358809, "epoch": 2965} {"train_loss": -44.6640510559082, "global_step": 358810, "epoch": 2965} {"train_loss": -45.020240783691406, "global_step": 358811, "epoch": 2965} {"train_loss": -45.56927490234375, "global_step": 358812, "epoch": 2965} {"train_loss": -45.04243087768555, "global_step": 358813, "epoch": 2965} {"train_loss": -44.78651809692383, "global_step": 358814, "epoch": 2965} {"train_loss": -43.7736930847168, "global_step": 358815, "epoch": 2965} {"train_loss": -44.82795333862305, "global_step": 358816, "epoch": 2965} {"train_loss": -44.526466369628906, "global_step": 358817, "epoch": 2965} {"train_loss": -45.45746994018555, "global_step": 358818, "epoch": 2965} {"train_loss": -44.90534210205078, "global_step": 358819, "epoch": 2965} {"train_loss": -45.227027893066406, "global_step": 358820, "epoch": 2965} {"train_loss": -44.68257522583008, "global_step": 358821, "epoch": 2965} {"train_loss": -45.081539154052734, "global_step": 358822, "epoch": 2965} {"train_loss": -45.184505462646484, "global_step": 358823, "epoch": 2965} {"train_loss": -45.6632194519043, "global_step": 358824, "epoch": 2965} {"train_loss": -45.43296432495117, "global_step": 358825, "epoch": 2965} {"train_loss": -45.09828567504883, "global_step": 358826, "epoch": 2965} {"train_loss": -44.67890167236328, "global_step": 358827, "epoch": 2965} {"train_loss": -44.4101676940918, "global_step": 358828, "epoch": 2965} {"train_loss": -45.117401123046875, "global_step": 358829, "epoch": 2965} {"train_loss": -45.36635971069336, "global_step": 358830, "epoch": 2965} {"train_loss": -45.18465042114258, "global_step": 358831, "epoch": 2965} {"train_loss": -44.62495422363281, "global_step": 358832, "epoch": 2965} {"train_loss": -43.930782318115234, "global_step": 358833, "epoch": 2965} {"train_loss": -44.30367660522461, "global_step": 358834, "epoch": 2965} {"train_loss": -44.32613754272461, "global_step": 358835, "epoch": 2965} {"train_loss": -44.997291564941406, "global_step": 358836, "epoch": 2965} {"train_loss": -45.01033020019531, "global_step": 358837, "epoch": 2965} {"train_loss": -45.25962448120117, "global_step": 358838, "epoch": 2965} {"train_loss": -44.8899040222168, "global_step": 358839, "epoch": 2965} {"train_loss": -44.23226547241211, "global_step": 358840, "epoch": 2965} {"train_loss": -44.10752487182617, "global_step": 358841, "epoch": 2965} {"train_loss": -45.06220245361328, "global_step": 358842, "epoch": 2965} {"train_loss": -45.389434814453125, "global_step": 358843, "epoch": 2965} {"train_loss": -44.88334274291992, "global_step": 358844, "epoch": 2965} {"train_loss": -44.99415969848633, "global_step": 358845, "epoch": 2965} {"train_loss": -45.31035614013672, "global_step": 358846, "epoch": 2965} {"train_loss": -45.31304931640625, "global_step": 358847, "epoch": 2965} {"train_loss": -44.730506896972656, "global_step": 358848, "epoch": 2965} {"train_loss": -44.475128173828125, "global_step": 358849, "epoch": 2965} {"train_loss": -44.336151123046875, "global_step": 358850, "epoch": 2965} {"train_loss": -44.72109603881836, "global_step": 358851, "epoch": 2965} {"train_loss": -43.952274322509766, "global_step": 358852, "epoch": 2965} {"train_loss": -44.740108489990234, "global_step": 358853, "epoch": 2965} {"train_loss": -45.35851287841797, "global_step": 358854, "epoch": 2965} {"train_loss": -44.43219757080078, "global_step": 358855, "epoch": 2965} {"train_loss": -44.59447479248047, "global_step": 358856, "epoch": 2965} {"train_loss": -44.57938766479492, "global_step": 358857, "epoch": 2965} {"train_loss": -44.92604446411133, "global_step": 358858, "epoch": 2965} {"train_loss": -44.73230743408203, "global_step": 358859, "epoch": 2965} {"train_loss": -44.8755989074707, "global_step": 358860, "epoch": 2965} {"train_loss": -44.132965087890625, "global_step": 358861, "epoch": 2965} {"train_loss": -44.59064865112305, "global_step": 358862, "epoch": 2965} {"train_loss": -44.57194519042969, "global_step": 358863, "epoch": 2965} {"train_loss": -44.306068420410156, "global_step": 358864, "epoch": 2965} {"train_loss": -45.21366882324219, "global_step": 358865, "epoch": 2965} {"train_loss": -44.764686584472656, "global_step": 358866, "epoch": 2965} {"train_loss": -43.413604736328125, "global_step": 358867, "epoch": 2965} {"train_loss": -43.858062744140625, "global_step": 358868, "epoch": 2965} {"train_loss": -44.755706787109375, "global_step": 358869, "epoch": 2965} {"train_loss": -43.59196853637695, "global_step": 358870, "epoch": 2965} {"train_loss": -43.98674011230469, "global_step": 358871, "epoch": 2965} {"train_loss": -42.71320343017578, "global_step": 358872, "epoch": 2965} {"train_loss": -42.15719223022461, "global_step": 358873, "epoch": 2965} {"train_loss": -44.804359436035156, "global_step": 358874, "epoch": 2965} {"train_loss": -43.16331100463867, "global_step": 358875, "epoch": 2965} {"train_loss": -42.65420913696289, "global_step": 358876, "epoch": 2965} {"train_loss": -44.05125045776367, "global_step": 358877, "epoch": 2965} {"train_loss": -44.315704345703125, "global_step": 358878, "epoch": 2965} {"train_loss": -42.65275192260742, "global_step": 358879, "epoch": 2965} {"train_loss": -44.80827713012695, "global_step": 358880, "epoch": 2965} {"train_loss": -42.600242614746094, "global_step": 358881, "epoch": 2965} {"train_loss": -42.031795501708984, "global_step": 358882, "epoch": 2965} {"train_loss": -43.76861572265625, "global_step": 358883, "epoch": 2965} {"train_loss": -42.0333137512207, "global_step": 358884, "epoch": 2965} {"train_loss": -44.13275077126243, "global_step": 358885, "epoch": 2965, "val_loss": 2519845.25} {"train_loss": -43.87691116333008, "global_step": 358886, "epoch": 2966} {"train_loss": -43.31748580932617, "global_step": 358887, "epoch": 2966} {"train_loss": -41.88191604614258, "global_step": 358888, "epoch": 2966} {"train_loss": -41.8773193359375, "global_step": 358889, "epoch": 2966} {"train_loss": -41.93924331665039, "global_step": 358890, "epoch": 2966} {"train_loss": -42.875911712646484, "global_step": 358891, "epoch": 2966} {"train_loss": -43.03291320800781, "global_step": 358892, "epoch": 2966} {"train_loss": -42.731300354003906, "global_step": 358893, "epoch": 2966} {"train_loss": -41.86787796020508, "global_step": 358894, "epoch": 2966} {"train_loss": -42.70273208618164, "global_step": 358895, "epoch": 2966} {"train_loss": -42.87866973876953, "global_step": 358896, "epoch": 2966} {"train_loss": -42.28373336791992, "global_step": 358897, "epoch": 2966} {"train_loss": -41.896644592285156, "global_step": 358898, "epoch": 2966} {"train_loss": -43.38283920288086, "global_step": 358899, "epoch": 2966} {"train_loss": -43.234771728515625, "global_step": 358900, "epoch": 2966} {"train_loss": -43.58855056762695, "global_step": 358901, "epoch": 2966} {"train_loss": -42.06366729736328, "global_step": 358902, "epoch": 2966} {"train_loss": -43.39728546142578, "global_step": 358903, "epoch": 2966} {"train_loss": -43.26621627807617, "global_step": 358904, "epoch": 2966} {"train_loss": -43.381019592285156, "global_step": 358905, "epoch": 2966} {"train_loss": -42.89344787597656, "global_step": 358906, "epoch": 2966} {"train_loss": -43.59821319580078, "global_step": 358907, "epoch": 2966} {"train_loss": -43.393775939941406, "global_step": 358908, "epoch": 2966} {"train_loss": -43.28715133666992, "global_step": 358909, "epoch": 2966} {"train_loss": -44.32257843017578, "global_step": 358910, "epoch": 2966} {"train_loss": -43.26687240600586, "global_step": 358911, "epoch": 2966} {"train_loss": -43.56650924682617, "global_step": 358912, "epoch": 2966} {"train_loss": -44.568477630615234, "global_step": 358913, "epoch": 2966} {"train_loss": -43.44736862182617, "global_step": 358914, "epoch": 2966} {"train_loss": -43.44328308105469, "global_step": 358915, "epoch": 2966} {"train_loss": -44.78018569946289, "global_step": 358916, "epoch": 2966} {"train_loss": -43.59880828857422, "global_step": 358917, "epoch": 2966} {"train_loss": -43.276100158691406, "global_step": 358918, "epoch": 2966} {"train_loss": -44.60431671142578, "global_step": 358919, "epoch": 2966} {"train_loss": -42.680328369140625, "global_step": 358920, "epoch": 2966} {"train_loss": -44.49424362182617, "global_step": 358921, "epoch": 2966} {"train_loss": -43.7558479309082, "global_step": 358922, "epoch": 2966} {"train_loss": -43.11494064331055, "global_step": 358923, "epoch": 2966} {"train_loss": -44.96601486206055, "global_step": 358924, "epoch": 2966} {"train_loss": -44.12784957885742, "global_step": 358925, "epoch": 2966} {"train_loss": -43.064327239990234, "global_step": 358926, "epoch": 2966} {"train_loss": -44.88985824584961, "global_step": 358927, "epoch": 2966} {"train_loss": -43.426063537597656, "global_step": 358928, "epoch": 2966} {"train_loss": -44.9837532043457, "global_step": 358929, "epoch": 2966} {"train_loss": -44.841773986816406, "global_step": 358930, "epoch": 2966} {"train_loss": -43.79311752319336, "global_step": 358931, "epoch": 2966} {"train_loss": -44.459598541259766, "global_step": 358932, "epoch": 2966} {"train_loss": -44.96857452392578, "global_step": 358933, "epoch": 2966} {"train_loss": -44.39909362792969, "global_step": 358934, "epoch": 2966} {"train_loss": -44.81740188598633, "global_step": 358935, "epoch": 2966} {"train_loss": -44.49705505371094, "global_step": 358936, "epoch": 2966} {"train_loss": -44.95944595336914, "global_step": 358937, "epoch": 2966} {"train_loss": -44.9136962890625, "global_step": 358938, "epoch": 2966} {"train_loss": -44.985931396484375, "global_step": 358939, "epoch": 2966} {"train_loss": -45.22182846069336, "global_step": 358940, "epoch": 2966} {"train_loss": -44.82046127319336, "global_step": 358941, "epoch": 2966} {"train_loss": -45.298919677734375, "global_step": 358942, "epoch": 2966} {"train_loss": -45.79775619506836, "global_step": 358943, "epoch": 2966} {"train_loss": -45.075016021728516, "global_step": 358944, "epoch": 2966} {"train_loss": -45.32497024536133, "global_step": 358945, "epoch": 2966} {"train_loss": -45.798561096191406, "global_step": 358946, "epoch": 2966} {"train_loss": -44.90501022338867, "global_step": 358947, "epoch": 2966} {"train_loss": -45.40855026245117, "global_step": 358948, "epoch": 2966} {"train_loss": -45.23965835571289, "global_step": 358949, "epoch": 2966} {"train_loss": -45.83999252319336, "global_step": 358950, "epoch": 2966} {"train_loss": -44.996864318847656, "global_step": 358951, "epoch": 2966} {"train_loss": -44.667076110839844, "global_step": 358952, "epoch": 2966} {"train_loss": -45.381507873535156, "global_step": 358953, "epoch": 2966} {"train_loss": -45.3227653503418, "global_step": 358954, "epoch": 2966} {"train_loss": -45.4062385559082, "global_step": 358955, "epoch": 2966} {"train_loss": -45.509674072265625, "global_step": 358956, "epoch": 2966} {"train_loss": -45.39760208129883, "global_step": 358957, "epoch": 2966} {"train_loss": -45.55352783203125, "global_step": 358958, "epoch": 2966} {"train_loss": -45.64466094970703, "global_step": 358959, "epoch": 2966} {"train_loss": -45.983638763427734, "global_step": 358960, "epoch": 2966} {"train_loss": -45.105316162109375, "global_step": 358961, "epoch": 2966} {"train_loss": -45.76569747924805, "global_step": 358962, "epoch": 2966} {"train_loss": -45.13218688964844, "global_step": 358963, "epoch": 2966} {"train_loss": -45.687068939208984, "global_step": 358964, "epoch": 2966} {"train_loss": -45.75334548950195, "global_step": 358965, "epoch": 2966} {"train_loss": -45.728511810302734, "global_step": 358966, "epoch": 2966} {"train_loss": -45.60128402709961, "global_step": 358967, "epoch": 2966} {"train_loss": -45.60811996459961, "global_step": 358968, "epoch": 2966} {"train_loss": -45.733402252197266, "global_step": 358969, "epoch": 2966} {"train_loss": -45.81659698486328, "global_step": 358970, "epoch": 2966} {"train_loss": -46.003238677978516, "global_step": 358971, "epoch": 2966} {"train_loss": -45.5768928527832, "global_step": 358972, "epoch": 2966} {"train_loss": -45.49729537963867, "global_step": 358973, "epoch": 2966} {"train_loss": -46.054622650146484, "global_step": 358974, "epoch": 2966} {"train_loss": -45.90049362182617, "global_step": 358975, "epoch": 2966} {"train_loss": -45.201820373535156, "global_step": 358976, "epoch": 2966} {"train_loss": -44.794185638427734, "global_step": 358977, "epoch": 2966} {"train_loss": -44.953487396240234, "global_step": 358978, "epoch": 2966} {"train_loss": -45.64275360107422, "global_step": 358979, "epoch": 2966} {"train_loss": -45.880516052246094, "global_step": 358980, "epoch": 2966} {"train_loss": -45.70207595825195, "global_step": 358981, "epoch": 2966} {"train_loss": -45.073665618896484, "global_step": 358982, "epoch": 2966} {"train_loss": -45.476078033447266, "global_step": 358983, "epoch": 2966} {"train_loss": -44.28282928466797, "global_step": 358984, "epoch": 2966} {"train_loss": -45.53998947143555, "global_step": 358985, "epoch": 2966} {"train_loss": -45.03290939331055, "global_step": 358986, "epoch": 2966} {"train_loss": -43.985660552978516, "global_step": 358987, "epoch": 2966} {"train_loss": -43.46755599975586, "global_step": 358988, "epoch": 2966} {"train_loss": -44.37274932861328, "global_step": 358989, "epoch": 2966} {"train_loss": -42.77172088623047, "global_step": 358990, "epoch": 2966} {"train_loss": -42.77608871459961, "global_step": 358991, "epoch": 2966} {"train_loss": -44.98859786987305, "global_step": 358992, "epoch": 2966} {"train_loss": -44.61471176147461, "global_step": 358993, "epoch": 2966} {"train_loss": -44.845577239990234, "global_step": 358994, "epoch": 2966} {"train_loss": -43.873756408691406, "global_step": 358995, "epoch": 2966} {"train_loss": -44.169044494628906, "global_step": 358996, "epoch": 2966} {"train_loss": -45.15631103515625, "global_step": 358997, "epoch": 2966} {"train_loss": -44.98579788208008, "global_step": 358998, "epoch": 2966} {"train_loss": -44.65285110473633, "global_step": 358999, "epoch": 2966} {"train_loss": -42.76225662231445, "global_step": 359000, "epoch": 2966} {"train_loss": -42.08732986450195, "global_step": 359001, "epoch": 2966} {"train_loss": -43.62310791015625, "global_step": 359002, "epoch": 2966} {"train_loss": -42.2242317199707, "global_step": 359003, "epoch": 2966} {"train_loss": -43.76544189453125, "global_step": 359004, "epoch": 2966} {"train_loss": -43.10915756225586, "global_step": 359005, "epoch": 2966} {"train_loss": -44.33370564988822, "global_step": 359006, "epoch": 2966, "val_loss": 2483081.25} {"train_loss": -42.12388229370117, "global_step": 359007, "epoch": 2967} {"train_loss": -40.05405807495117, "global_step": 359008, "epoch": 2967} {"train_loss": -44.1572380065918, "global_step": 359009, "epoch": 2967} {"train_loss": -39.51597213745117, "global_step": 359010, "epoch": 2967} {"train_loss": -43.97774124145508, "global_step": 359011, "epoch": 2967} {"train_loss": -39.9189567565918, "global_step": 359012, "epoch": 2967} {"train_loss": -43.89557647705078, "global_step": 359013, "epoch": 2967} {"train_loss": -42.30500411987305, "global_step": 359014, "epoch": 2967} {"train_loss": -43.80116653442383, "global_step": 359015, "epoch": 2967} {"train_loss": -43.20550537109375, "global_step": 359016, "epoch": 2967} {"train_loss": -43.882354736328125, "global_step": 359017, "epoch": 2967} {"train_loss": -43.63823318481445, "global_step": 359018, "epoch": 2967} {"train_loss": -44.06828308105469, "global_step": 359019, "epoch": 2967} {"train_loss": -44.07307052612305, "global_step": 359020, "epoch": 2967} {"train_loss": -44.6044807434082, "global_step": 359021, "epoch": 2967} {"train_loss": -44.2302360534668, "global_step": 359022, "epoch": 2967} {"train_loss": -44.8500862121582, "global_step": 359023, "epoch": 2967} {"train_loss": -44.31591033935547, "global_step": 359024, "epoch": 2967} {"train_loss": -43.98006820678711, "global_step": 359025, "epoch": 2967} {"train_loss": -43.78034591674805, "global_step": 359026, "epoch": 2967} {"train_loss": -44.892799377441406, "global_step": 359027, "epoch": 2967} {"train_loss": -44.70392990112305, "global_step": 359028, "epoch": 2967} {"train_loss": -44.74673080444336, "global_step": 359029, "epoch": 2967} {"train_loss": -44.80861282348633, "global_step": 359030, "epoch": 2967} {"train_loss": -44.83454132080078, "global_step": 359031, "epoch": 2967} {"train_loss": -45.02912139892578, "global_step": 359032, "epoch": 2967} {"train_loss": -45.00077438354492, "global_step": 359033, "epoch": 2967} {"train_loss": -44.6166877746582, "global_step": 359034, "epoch": 2967} {"train_loss": -45.37840270996094, "global_step": 359035, "epoch": 2967} {"train_loss": -44.762081146240234, "global_step": 359036, "epoch": 2967} {"train_loss": -45.35325241088867, "global_step": 359037, "epoch": 2967} {"train_loss": -45.66139221191406, "global_step": 359038, "epoch": 2967} {"train_loss": -44.627113342285156, "global_step": 359039, "epoch": 2967} {"train_loss": -44.71574401855469, "global_step": 359040, "epoch": 2967} {"train_loss": -45.14420700073242, "global_step": 359041, "epoch": 2967} {"train_loss": -45.50437927246094, "global_step": 359042, "epoch": 2967} {"train_loss": -44.44187545776367, "global_step": 359043, "epoch": 2967} {"train_loss": -45.1668586730957, "global_step": 359044, "epoch": 2967} {"train_loss": -44.944087982177734, "global_step": 359045, "epoch": 2967} {"train_loss": -45.12194061279297, "global_step": 359046, "epoch": 2967} {"train_loss": -44.54293441772461, "global_step": 359047, "epoch": 2967} {"train_loss": -45.21097946166992, "global_step": 359048, "epoch": 2967} {"train_loss": -45.20226287841797, "global_step": 359049, "epoch": 2967} {"train_loss": -43.92267990112305, "global_step": 359050, "epoch": 2967} {"train_loss": -44.41169357299805, "global_step": 359051, "epoch": 2967} {"train_loss": -45.4179801940918, "global_step": 359052, "epoch": 2967} {"train_loss": -44.77582931518555, "global_step": 359053, "epoch": 2967} {"train_loss": -44.18277359008789, "global_step": 359054, "epoch": 2967} {"train_loss": -45.70501708984375, "global_step": 359055, "epoch": 2967} {"train_loss": -45.1274299621582, "global_step": 359056, "epoch": 2967} {"train_loss": -45.5799560546875, "global_step": 359057, "epoch": 2967} {"train_loss": -45.18379592895508, "global_step": 359058, "epoch": 2967} {"train_loss": -45.37913513183594, "global_step": 359059, "epoch": 2967} {"train_loss": -45.284732818603516, "global_step": 359060, "epoch": 2967} {"train_loss": -44.937557220458984, "global_step": 359061, "epoch": 2967} {"train_loss": -45.23758316040039, "global_step": 359062, "epoch": 2967} {"train_loss": -44.74755096435547, "global_step": 359063, "epoch": 2967} {"train_loss": -45.315399169921875, "global_step": 359064, "epoch": 2967} {"train_loss": -45.06316375732422, "global_step": 359065, "epoch": 2967} {"train_loss": -45.71369552612305, "global_step": 359066, "epoch": 2967} {"train_loss": -45.70499801635742, "global_step": 359067, "epoch": 2967} {"train_loss": -46.01705551147461, "global_step": 359068, "epoch": 2967} {"train_loss": -45.2337532043457, "global_step": 359069, "epoch": 2967} {"train_loss": -46.00173568725586, "global_step": 359070, "epoch": 2967} {"train_loss": -45.53986740112305, "global_step": 359071, "epoch": 2967} {"train_loss": -45.51968002319336, "global_step": 359072, "epoch": 2967} {"train_loss": -45.193992614746094, "global_step": 359073, "epoch": 2967} {"train_loss": -45.80264663696289, "global_step": 359074, "epoch": 2967} {"train_loss": -45.62643051147461, "global_step": 359075, "epoch": 2967} {"train_loss": -45.67130661010742, "global_step": 359076, "epoch": 2967} {"train_loss": -45.63117218017578, "global_step": 359077, "epoch": 2967} {"train_loss": -46.29365158081055, "global_step": 359078, "epoch": 2967} {"train_loss": -45.87763595581055, "global_step": 359079, "epoch": 2967} {"train_loss": -46.03718185424805, "global_step": 359080, "epoch": 2967} {"train_loss": -45.16988754272461, "global_step": 359081, "epoch": 2967} {"train_loss": -46.3337516784668, "global_step": 359082, "epoch": 2967} {"train_loss": -45.59210968017578, "global_step": 359083, "epoch": 2967} {"train_loss": -45.66530227661133, "global_step": 359084, "epoch": 2967} {"train_loss": -45.523555755615234, "global_step": 359085, "epoch": 2967} {"train_loss": -45.428096771240234, "global_step": 359086, "epoch": 2967} {"train_loss": -46.08539581298828, "global_step": 359087, "epoch": 2967} {"train_loss": -45.27848434448242, "global_step": 359088, "epoch": 2967} {"train_loss": -45.140438079833984, "global_step": 359089, "epoch": 2967} {"train_loss": -45.00851058959961, "global_step": 359090, "epoch": 2967} {"train_loss": -45.754268646240234, "global_step": 359091, "epoch": 2967} {"train_loss": -45.15816879272461, "global_step": 359092, "epoch": 2967} {"train_loss": -45.58979415893555, "global_step": 359093, "epoch": 2967} {"train_loss": -44.67381286621094, "global_step": 359094, "epoch": 2967} {"train_loss": -45.62730026245117, "global_step": 359095, "epoch": 2967} {"train_loss": -44.87073516845703, "global_step": 359096, "epoch": 2967} {"train_loss": -44.36435317993164, "global_step": 359097, "epoch": 2967} {"train_loss": -42.76052474975586, "global_step": 359098, "epoch": 2967} {"train_loss": -44.25173568725586, "global_step": 359099, "epoch": 2967} {"train_loss": -42.89524459838867, "global_step": 359100, "epoch": 2967} {"train_loss": -43.894405364990234, "global_step": 359101, "epoch": 2967} {"train_loss": -43.965511322021484, "global_step": 359102, "epoch": 2967} {"train_loss": -45.284706115722656, "global_step": 359103, "epoch": 2967} {"train_loss": -43.78809356689453, "global_step": 359104, "epoch": 2967} {"train_loss": -44.910762786865234, "global_step": 359105, "epoch": 2967} {"train_loss": -45.21136474609375, "global_step": 359106, "epoch": 2967} {"train_loss": -44.53586959838867, "global_step": 359107, "epoch": 2967} {"train_loss": -44.308292388916016, "global_step": 359108, "epoch": 2967} {"train_loss": -43.751895904541016, "global_step": 359109, "epoch": 2967} {"train_loss": -43.881465911865234, "global_step": 359110, "epoch": 2967} {"train_loss": -44.68367004394531, "global_step": 359111, "epoch": 2967} {"train_loss": -43.5866584777832, "global_step": 359112, "epoch": 2967} {"train_loss": -42.656063079833984, "global_step": 359113, "epoch": 2967} {"train_loss": -44.7240104675293, "global_step": 359114, "epoch": 2967} {"train_loss": -44.755130767822266, "global_step": 359115, "epoch": 2967} {"train_loss": -44.380062103271484, "global_step": 359116, "epoch": 2967} {"train_loss": -43.63804626464844, "global_step": 359117, "epoch": 2967} {"train_loss": -43.05536651611328, "global_step": 359118, "epoch": 2967} {"train_loss": -42.268951416015625, "global_step": 359119, "epoch": 2967} {"train_loss": -43.02676010131836, "global_step": 359120, "epoch": 2967} {"train_loss": -42.91270065307617, "global_step": 359121, "epoch": 2967} {"train_loss": -42.19704818725586, "global_step": 359122, "epoch": 2967} {"train_loss": -44.04768371582031, "global_step": 359123, "epoch": 2967} {"train_loss": -42.153499603271484, "global_step": 359124, "epoch": 2967} {"train_loss": -41.43268966674805, "global_step": 359125, "epoch": 2967} {"train_loss": -44.02423095703125, "global_step": 359126, "epoch": 2967} {"train_loss": -44.50659375151327, "global_step": 359127, "epoch": 2967, "val_loss": 2480318.25} {"train_loss": -42.163543701171875, "global_step": 359128, "epoch": 2968} {"train_loss": -42.29832077026367, "global_step": 359129, "epoch": 2968} {"train_loss": -43.984283447265625, "global_step": 359130, "epoch": 2968} {"train_loss": -41.87922668457031, "global_step": 359131, "epoch": 2968} {"train_loss": -41.56044387817383, "global_step": 359132, "epoch": 2968} {"train_loss": -43.72102737426758, "global_step": 359133, "epoch": 2968} {"train_loss": -42.532955169677734, "global_step": 359134, "epoch": 2968} {"train_loss": -43.89104080200195, "global_step": 359135, "epoch": 2968} {"train_loss": -40.356239318847656, "global_step": 359136, "epoch": 2968} {"train_loss": -45.09544372558594, "global_step": 359137, "epoch": 2968} {"train_loss": -41.05824279785156, "global_step": 359138, "epoch": 2968} {"train_loss": -44.00325393676758, "global_step": 359139, "epoch": 2968} {"train_loss": -42.47553634643555, "global_step": 359140, "epoch": 2968} {"train_loss": -43.439453125, "global_step": 359141, "epoch": 2968} {"train_loss": -43.922821044921875, "global_step": 359142, "epoch": 2968} {"train_loss": -43.381103515625, "global_step": 359143, "epoch": 2968} {"train_loss": -43.488948822021484, "global_step": 359144, "epoch": 2968} {"train_loss": -42.99749755859375, "global_step": 359145, "epoch": 2968} {"train_loss": -44.2013053894043, "global_step": 359146, "epoch": 2968} {"train_loss": -43.544437408447266, "global_step": 359147, "epoch": 2968} {"train_loss": -43.819942474365234, "global_step": 359148, "epoch": 2968} {"train_loss": -44.67800521850586, "global_step": 359149, "epoch": 2968} {"train_loss": -43.116798400878906, "global_step": 359150, "epoch": 2968} {"train_loss": -43.54745101928711, "global_step": 359151, "epoch": 2968} {"train_loss": -43.966339111328125, "global_step": 359152, "epoch": 2968} {"train_loss": -42.83625030517578, "global_step": 359153, "epoch": 2968} {"train_loss": -44.4666862487793, "global_step": 359154, "epoch": 2968} {"train_loss": -40.96074676513672, "global_step": 359155, "epoch": 2968} {"train_loss": -44.48097610473633, "global_step": 359156, "epoch": 2968} {"train_loss": -41.52849197387695, "global_step": 359157, "epoch": 2968} {"train_loss": -44.124267578125, "global_step": 359158, "epoch": 2968} {"train_loss": -40.28675842285156, "global_step": 359159, "epoch": 2968} {"train_loss": -41.5157470703125, "global_step": 359160, "epoch": 2968} {"train_loss": -42.9148063659668, "global_step": 359161, "epoch": 2968} {"train_loss": -41.95229721069336, "global_step": 359162, "epoch": 2968} {"train_loss": -41.65928649902344, "global_step": 359163, "epoch": 2968} {"train_loss": -42.691688537597656, "global_step": 359164, "epoch": 2968} {"train_loss": -41.94485092163086, "global_step": 359165, "epoch": 2968} {"train_loss": -43.23773956298828, "global_step": 359166, "epoch": 2968} {"train_loss": -42.88962936401367, "global_step": 359167, "epoch": 2968} {"train_loss": -43.780670166015625, "global_step": 359168, "epoch": 2968} {"train_loss": -43.810516357421875, "global_step": 359169, "epoch": 2968} {"train_loss": -43.27685546875, "global_step": 359170, "epoch": 2968} {"train_loss": -43.327003479003906, "global_step": 359171, "epoch": 2968} {"train_loss": -43.62085723876953, "global_step": 359172, "epoch": 2968} {"train_loss": -44.44327163696289, "global_step": 359173, "epoch": 2968} {"train_loss": -44.210609436035156, "global_step": 359174, "epoch": 2968} {"train_loss": -44.0275764465332, "global_step": 359175, "epoch": 2968} {"train_loss": -44.881980895996094, "global_step": 359176, "epoch": 2968} {"train_loss": -44.66280746459961, "global_step": 359177, "epoch": 2968} {"train_loss": -44.62788772583008, "global_step": 359178, "epoch": 2968} {"train_loss": -44.68349075317383, "global_step": 359179, "epoch": 2968} {"train_loss": -45.004615783691406, "global_step": 359180, "epoch": 2968} {"train_loss": -44.81672286987305, "global_step": 359181, "epoch": 2968} {"train_loss": -44.9969367980957, "global_step": 359182, "epoch": 2968} {"train_loss": -44.57721710205078, "global_step": 359183, "epoch": 2968} {"train_loss": -43.65379333496094, "global_step": 359184, "epoch": 2968} {"train_loss": -44.844486236572266, "global_step": 359185, "epoch": 2968} {"train_loss": -44.6851921081543, "global_step": 359186, "epoch": 2968} {"train_loss": -45.04988479614258, "global_step": 359187, "epoch": 2968} {"train_loss": -44.9210319519043, "global_step": 359188, "epoch": 2968} {"train_loss": -45.15385818481445, "global_step": 359189, "epoch": 2968} {"train_loss": -45.042144775390625, "global_step": 359190, "epoch": 2968} {"train_loss": -44.90643310546875, "global_step": 359191, "epoch": 2968} {"train_loss": -45.7049674987793, "global_step": 359192, "epoch": 2968} {"train_loss": -44.80643844604492, "global_step": 359193, "epoch": 2968} {"train_loss": -45.17768478393555, "global_step": 359194, "epoch": 2968} {"train_loss": -45.021514892578125, "global_step": 359195, "epoch": 2968} {"train_loss": -45.50153350830078, "global_step": 359196, "epoch": 2968} {"train_loss": -44.88215255737305, "global_step": 359197, "epoch": 2968} {"train_loss": -45.05294418334961, "global_step": 359198, "epoch": 2968} {"train_loss": -45.390377044677734, "global_step": 359199, "epoch": 2968} {"train_loss": -45.49300003051758, "global_step": 359200, "epoch": 2968} {"train_loss": -45.50808334350586, "global_step": 359201, "epoch": 2968} {"train_loss": -44.79949951171875, "global_step": 359202, "epoch": 2968} {"train_loss": -45.4423828125, "global_step": 359203, "epoch": 2968} {"train_loss": -45.139976501464844, "global_step": 359204, "epoch": 2968} {"train_loss": -45.12586212158203, "global_step": 359205, "epoch": 2968} {"train_loss": -45.43654251098633, "global_step": 359206, "epoch": 2968} {"train_loss": -44.20390319824219, "global_step": 359207, "epoch": 2968} {"train_loss": -45.09265899658203, "global_step": 359208, "epoch": 2968} {"train_loss": -45.12443161010742, "global_step": 359209, "epoch": 2968} {"train_loss": -45.5592041015625, "global_step": 359210, "epoch": 2968} {"train_loss": -44.50558090209961, "global_step": 359211, "epoch": 2968} {"train_loss": -45.61112594604492, "global_step": 359212, "epoch": 2968} {"train_loss": -45.502471923828125, "global_step": 359213, "epoch": 2968} {"train_loss": -45.59579086303711, "global_step": 359214, "epoch": 2968} {"train_loss": -45.514190673828125, "global_step": 359215, "epoch": 2968} {"train_loss": -45.529701232910156, "global_step": 359216, "epoch": 2968} {"train_loss": -45.17013168334961, "global_step": 359217, "epoch": 2968} {"train_loss": -45.527809143066406, "global_step": 359218, "epoch": 2968} {"train_loss": -45.37556076049805, "global_step": 359219, "epoch": 2968} {"train_loss": -45.346534729003906, "global_step": 359220, "epoch": 2968} {"train_loss": -45.76548385620117, "global_step": 359221, "epoch": 2968} {"train_loss": -45.2273063659668, "global_step": 359222, "epoch": 2968} {"train_loss": -45.5035400390625, "global_step": 359223, "epoch": 2968} {"train_loss": -44.4168815612793, "global_step": 359224, "epoch": 2968} {"train_loss": -45.595333099365234, "global_step": 359225, "epoch": 2968} {"train_loss": -45.38105773925781, "global_step": 359226, "epoch": 2968} {"train_loss": -45.15570831298828, "global_step": 359227, "epoch": 2968} {"train_loss": -46.06064987182617, "global_step": 359228, "epoch": 2968} {"train_loss": -44.89827346801758, "global_step": 359229, "epoch": 2968} {"train_loss": -45.86020278930664, "global_step": 359230, "epoch": 2968} {"train_loss": -45.706756591796875, "global_step": 359231, "epoch": 2968} {"train_loss": -45.17680740356445, "global_step": 359232, "epoch": 2968} {"train_loss": -46.01988983154297, "global_step": 359233, "epoch": 2968} {"train_loss": -44.23565673828125, "global_step": 359234, "epoch": 2968} {"train_loss": -45.1849250793457, "global_step": 359235, "epoch": 2968} {"train_loss": -45.40435028076172, "global_step": 359236, "epoch": 2968} {"train_loss": -44.21358871459961, "global_step": 359237, "epoch": 2968} {"train_loss": -45.03011703491211, "global_step": 359238, "epoch": 2968} {"train_loss": -43.66804885864258, "global_step": 359239, "epoch": 2968} {"train_loss": -43.97517776489258, "global_step": 359240, "epoch": 2968} {"train_loss": -44.19147872924805, "global_step": 359241, "epoch": 2968} {"train_loss": -43.251129150390625, "global_step": 359242, "epoch": 2968} {"train_loss": -45.1909065246582, "global_step": 359243, "epoch": 2968} {"train_loss": -44.094482421875, "global_step": 359244, "epoch": 2968} {"train_loss": -40.5238151550293, "global_step": 359245, "epoch": 2968} {"train_loss": -44.169158935546875, "global_step": 359246, "epoch": 2968} {"train_loss": -44.11273956298828, "global_step": 359247, "epoch": 2968} {"train_loss": -44.201966088665415, "global_step": 359248, "epoch": 2968, "val_loss": 2439870.5} {"train_loss": -44.65586471557617, "global_step": 359249, "epoch": 2969} {"train_loss": -42.87961959838867, "global_step": 359250, "epoch": 2969} {"train_loss": -43.71143341064453, "global_step": 359251, "epoch": 2969} {"train_loss": -43.92361068725586, "global_step": 359252, "epoch": 2969} {"train_loss": -45.26472091674805, "global_step": 359253, "epoch": 2969} {"train_loss": -44.22434616088867, "global_step": 359254, "epoch": 2969} {"train_loss": -43.5181770324707, "global_step": 359255, "epoch": 2969} {"train_loss": -44.961063385009766, "global_step": 359256, "epoch": 2969} {"train_loss": -44.13798904418945, "global_step": 359257, "epoch": 2969} {"train_loss": -42.52352523803711, "global_step": 359258, "epoch": 2969} {"train_loss": -42.494659423828125, "global_step": 359259, "epoch": 2969} {"train_loss": -43.82636642456055, "global_step": 359260, "epoch": 2969} {"train_loss": -40.49622344970703, "global_step": 359261, "epoch": 2969} {"train_loss": -45.14460372924805, "global_step": 359262, "epoch": 2969} {"train_loss": -41.72381591796875, "global_step": 359263, "epoch": 2969} {"train_loss": -43.053192138671875, "global_step": 359264, "epoch": 2969} {"train_loss": -44.44607162475586, "global_step": 359265, "epoch": 2969} {"train_loss": -42.61619186401367, "global_step": 359266, "epoch": 2969} {"train_loss": -44.56533432006836, "global_step": 359267, "epoch": 2969} {"train_loss": -43.317298889160156, "global_step": 359268, "epoch": 2969} {"train_loss": -41.88419723510742, "global_step": 359269, "epoch": 2969} {"train_loss": -44.11817169189453, "global_step": 359270, "epoch": 2969} {"train_loss": -42.57998275756836, "global_step": 359271, "epoch": 2969} {"train_loss": -43.2347526550293, "global_step": 359272, "epoch": 2969} {"train_loss": -44.69546127319336, "global_step": 359273, "epoch": 2969} {"train_loss": -42.129234313964844, "global_step": 359274, "epoch": 2969} {"train_loss": -44.082435607910156, "global_step": 359275, "epoch": 2969} {"train_loss": -44.673946380615234, "global_step": 359276, "epoch": 2969} {"train_loss": -44.186859130859375, "global_step": 359277, "epoch": 2969} {"train_loss": -44.666419982910156, "global_step": 359278, "epoch": 2969} {"train_loss": -45.07620620727539, "global_step": 359279, "epoch": 2969} {"train_loss": -44.73667526245117, "global_step": 359280, "epoch": 2969} {"train_loss": -45.62385940551758, "global_step": 359281, "epoch": 2969} {"train_loss": -44.6883430480957, "global_step": 359282, "epoch": 2969} {"train_loss": -44.9601936340332, "global_step": 359283, "epoch": 2969} {"train_loss": -44.767974853515625, "global_step": 359284, "epoch": 2969} {"train_loss": -44.74137496948242, "global_step": 359285, "epoch": 2969} {"train_loss": -45.45736312866211, "global_step": 359286, "epoch": 2969} {"train_loss": -44.56673812866211, "global_step": 359287, "epoch": 2969} {"train_loss": -45.10685729980469, "global_step": 359288, "epoch": 2969} {"train_loss": -44.252784729003906, "global_step": 359289, "epoch": 2969} {"train_loss": -44.59771728515625, "global_step": 359290, "epoch": 2969} {"train_loss": -44.392799377441406, "global_step": 359291, "epoch": 2969} {"train_loss": -44.20623779296875, "global_step": 359292, "epoch": 2969} {"train_loss": -44.90052032470703, "global_step": 359293, "epoch": 2969} {"train_loss": -43.780582427978516, "global_step": 359294, "epoch": 2969} {"train_loss": -45.15810775756836, "global_step": 359295, "epoch": 2969} {"train_loss": -44.26154708862305, "global_step": 359296, "epoch": 2969} {"train_loss": -45.070919036865234, "global_step": 359297, "epoch": 2969} {"train_loss": -45.05085372924805, "global_step": 359298, "epoch": 2969} {"train_loss": -44.0504264831543, "global_step": 359299, "epoch": 2969} {"train_loss": -44.92677307128906, "global_step": 359300, "epoch": 2969} {"train_loss": -44.88528060913086, "global_step": 359301, "epoch": 2969} {"train_loss": -43.78194046020508, "global_step": 359302, "epoch": 2969} {"train_loss": -45.25891876220703, "global_step": 359303, "epoch": 2969} {"train_loss": -45.107845306396484, "global_step": 359304, "epoch": 2969} {"train_loss": -45.510616302490234, "global_step": 359305, "epoch": 2969} {"train_loss": -45.08830261230469, "global_step": 359306, "epoch": 2969} {"train_loss": -45.62821578979492, "global_step": 359307, "epoch": 2969} {"train_loss": -44.80991744995117, "global_step": 359308, "epoch": 2969} {"train_loss": -44.57459259033203, "global_step": 359309, "epoch": 2969} {"train_loss": -45.371124267578125, "global_step": 359310, "epoch": 2969} {"train_loss": -45.105892181396484, "global_step": 359311, "epoch": 2969} {"train_loss": -45.324310302734375, "global_step": 359312, "epoch": 2969} {"train_loss": -44.005367279052734, "global_step": 359313, "epoch": 2969} {"train_loss": -44.21226119995117, "global_step": 359314, "epoch": 2969} {"train_loss": -45.69532012939453, "global_step": 359315, "epoch": 2969} {"train_loss": -45.591068267822266, "global_step": 359316, "epoch": 2969} {"train_loss": -45.784420013427734, "global_step": 359317, "epoch": 2969} {"train_loss": -45.34918212890625, "global_step": 359318, "epoch": 2969} {"train_loss": -45.64651107788086, "global_step": 359319, "epoch": 2969} {"train_loss": -45.60374069213867, "global_step": 359320, "epoch": 2969} {"train_loss": -45.61201858520508, "global_step": 359321, "epoch": 2969} {"train_loss": -45.9017448425293, "global_step": 359322, "epoch": 2969} {"train_loss": -45.71928024291992, "global_step": 359323, "epoch": 2969} {"train_loss": -45.34013366699219, "global_step": 359324, "epoch": 2969} {"train_loss": -45.73359298706055, "global_step": 359325, "epoch": 2969} {"train_loss": -45.662025451660156, "global_step": 359326, "epoch": 2969} {"train_loss": -45.626461029052734, "global_step": 359327, "epoch": 2969} {"train_loss": -45.53763961791992, "global_step": 359328, "epoch": 2969} {"train_loss": -45.913204193115234, "global_step": 359329, "epoch": 2969} {"train_loss": -45.22833251953125, "global_step": 359330, "epoch": 2969} {"train_loss": -46.21531295776367, "global_step": 359331, "epoch": 2969} {"train_loss": -45.72251510620117, "global_step": 359332, "epoch": 2969} {"train_loss": -45.3809928894043, "global_step": 359333, "epoch": 2969} {"train_loss": -46.01020812988281, "global_step": 359334, "epoch": 2969} {"train_loss": -45.74416732788086, "global_step": 359335, "epoch": 2969} {"train_loss": -45.16199493408203, "global_step": 359336, "epoch": 2969} {"train_loss": -45.317298889160156, "global_step": 359337, "epoch": 2969} {"train_loss": -45.370418548583984, "global_step": 359338, "epoch": 2969} {"train_loss": -45.93109893798828, "global_step": 359339, "epoch": 2969} {"train_loss": -45.796485900878906, "global_step": 359340, "epoch": 2969} {"train_loss": -46.08187484741211, "global_step": 359341, "epoch": 2969} {"train_loss": -45.857635498046875, "global_step": 359342, "epoch": 2969} {"train_loss": -46.00252151489258, "global_step": 359343, "epoch": 2969} {"train_loss": -45.954620361328125, "global_step": 359344, "epoch": 2969} {"train_loss": -45.649837493896484, "global_step": 359345, "epoch": 2969} {"train_loss": -45.62784194946289, "global_step": 359346, "epoch": 2969} {"train_loss": -45.42041015625, "global_step": 359347, "epoch": 2969} {"train_loss": -44.99117660522461, "global_step": 359348, "epoch": 2969} {"train_loss": -44.849239349365234, "global_step": 359349, "epoch": 2969} {"train_loss": -42.205562591552734, "global_step": 359350, "epoch": 2969} {"train_loss": -44.966182708740234, "global_step": 359351, "epoch": 2969} {"train_loss": -45.742549896240234, "global_step": 359352, "epoch": 2969} {"train_loss": -44.67745590209961, "global_step": 359353, "epoch": 2969} {"train_loss": -40.5711784362793, "global_step": 359354, "epoch": 2969} {"train_loss": -44.94178009033203, "global_step": 359355, "epoch": 2969} {"train_loss": -36.48823928833008, "global_step": 359356, "epoch": 2969} {"train_loss": -43.933162689208984, "global_step": 359357, "epoch": 2969} {"train_loss": -41.86851119995117, "global_step": 359358, "epoch": 2969} {"train_loss": -36.64805221557617, "global_step": 359359, "epoch": 2969} {"train_loss": -30.597558975219727, "global_step": 359360, "epoch": 2969} {"train_loss": -26.58643913269043, "global_step": 359361, "epoch": 2969} {"train_loss": -32.96018600463867, "global_step": 359362, "epoch": 2969} {"train_loss": -41.18892288208008, "global_step": 359363, "epoch": 2969} {"train_loss": -38.116207122802734, "global_step": 359364, "epoch": 2969} {"train_loss": -35.278236389160156, "global_step": 359365, "epoch": 2969} {"train_loss": -40.109710693359375, "global_step": 359366, "epoch": 2969} {"train_loss": -37.7329216003418, "global_step": 359367, "epoch": 2969} {"train_loss": -35.62506103515625, "global_step": 359368, "epoch": 2969} {"train_loss": -43.788174211486314, "global_step": 359369, "epoch": 2969, "val_loss": 2471268.75} {"train_loss": -39.50943374633789, "global_step": 359370, "epoch": 2970} {"train_loss": -39.013545989990234, "global_step": 359371, "epoch": 2970} {"train_loss": -38.29522705078125, "global_step": 359372, "epoch": 2970} {"train_loss": -35.72002410888672, "global_step": 359373, "epoch": 2970} {"train_loss": -41.87287902832031, "global_step": 359374, "epoch": 2970} {"train_loss": -33.29181671142578, "global_step": 359375, "epoch": 2970} {"train_loss": -42.01850509643555, "global_step": 359376, "epoch": 2970} {"train_loss": -36.68577194213867, "global_step": 359377, "epoch": 2970} {"train_loss": -42.43184280395508, "global_step": 359378, "epoch": 2970} {"train_loss": -38.122222900390625, "global_step": 359379, "epoch": 2970} {"train_loss": -41.6364860534668, "global_step": 359380, "epoch": 2970} {"train_loss": -39.581356048583984, "global_step": 359381, "epoch": 2970} {"train_loss": -41.95815658569336, "global_step": 359382, "epoch": 2970} {"train_loss": -40.25738525390625, "global_step": 359383, "epoch": 2970} {"train_loss": -39.872711181640625, "global_step": 359384, "epoch": 2970} {"train_loss": -40.68873596191406, "global_step": 359385, "epoch": 2970} {"train_loss": -40.65696334838867, "global_step": 359386, "epoch": 2970} {"train_loss": -41.7171745300293, "global_step": 359387, "epoch": 2970} {"train_loss": -41.504859924316406, "global_step": 359388, "epoch": 2970} {"train_loss": -42.0694465637207, "global_step": 359389, "epoch": 2970} {"train_loss": -42.206886291503906, "global_step": 359390, "epoch": 2970} {"train_loss": -42.51828384399414, "global_step": 359391, "epoch": 2970} {"train_loss": -42.39946365356445, "global_step": 359392, "epoch": 2970} {"train_loss": -41.7180290222168, "global_step": 359393, "epoch": 2970} {"train_loss": -42.581947326660156, "global_step": 359394, "epoch": 2970} {"train_loss": -43.38669967651367, "global_step": 359395, "epoch": 2970} {"train_loss": -43.01599884033203, "global_step": 359396, "epoch": 2970} {"train_loss": -43.42910385131836, "global_step": 359397, "epoch": 2970} {"train_loss": -42.99760437011719, "global_step": 359398, "epoch": 2970} {"train_loss": -43.89306640625, "global_step": 359399, "epoch": 2970} {"train_loss": -42.62843704223633, "global_step": 359400, "epoch": 2970} {"train_loss": -43.23759078979492, "global_step": 359401, "epoch": 2970} {"train_loss": -43.94263458251953, "global_step": 359402, "epoch": 2970} {"train_loss": -43.6596794128418, "global_step": 359403, "epoch": 2970} {"train_loss": -44.155452728271484, "global_step": 359404, "epoch": 2970} {"train_loss": -43.9664306640625, "global_step": 359405, "epoch": 2970} {"train_loss": -43.931339263916016, "global_step": 359406, "epoch": 2970} {"train_loss": -44.16038513183594, "global_step": 359407, "epoch": 2970} {"train_loss": -44.38039779663086, "global_step": 359408, "epoch": 2970} {"train_loss": -43.40996170043945, "global_step": 359409, "epoch": 2970} {"train_loss": -44.07331466674805, "global_step": 359410, "epoch": 2970} {"train_loss": -44.31956481933594, "global_step": 359411, "epoch": 2970} {"train_loss": -44.589290618896484, "global_step": 359412, "epoch": 2970} {"train_loss": -44.672664642333984, "global_step": 359413, "epoch": 2970} {"train_loss": -44.251888275146484, "global_step": 359414, "epoch": 2970} {"train_loss": -44.47031784057617, "global_step": 359415, "epoch": 2970} {"train_loss": -44.730831146240234, "global_step": 359416, "epoch": 2970} {"train_loss": -44.73607635498047, "global_step": 359417, "epoch": 2970} {"train_loss": -44.720943450927734, "global_step": 359418, "epoch": 2970} {"train_loss": -44.96064376831055, "global_step": 359419, "epoch": 2970} {"train_loss": -44.19155502319336, "global_step": 359420, "epoch": 2970} {"train_loss": -43.90792465209961, "global_step": 359421, "epoch": 2970} {"train_loss": -44.53103256225586, "global_step": 359422, "epoch": 2970} {"train_loss": -44.69285202026367, "global_step": 359423, "epoch": 2970} {"train_loss": -44.64569854736328, "global_step": 359424, "epoch": 2970} {"train_loss": -44.68500518798828, "global_step": 359425, "epoch": 2970} {"train_loss": -45.05004119873047, "global_step": 359426, "epoch": 2970} {"train_loss": -44.532867431640625, "global_step": 359427, "epoch": 2970} {"train_loss": -44.83419418334961, "global_step": 359428, "epoch": 2970} {"train_loss": -44.81714630126953, "global_step": 359429, "epoch": 2970} {"train_loss": -44.25932693481445, "global_step": 359430, "epoch": 2970} {"train_loss": -44.94477462768555, "global_step": 359431, "epoch": 2970} {"train_loss": -44.52437973022461, "global_step": 359432, "epoch": 2970} {"train_loss": -45.370208740234375, "global_step": 359433, "epoch": 2970} {"train_loss": -45.01365280151367, "global_step": 359434, "epoch": 2970} {"train_loss": -43.4775505065918, "global_step": 359435, "epoch": 2970} {"train_loss": -45.10250473022461, "global_step": 359436, "epoch": 2970} {"train_loss": -44.804344177246094, "global_step": 359437, "epoch": 2970} {"train_loss": -42.65266799926758, "global_step": 359438, "epoch": 2970} {"train_loss": -45.35577392578125, "global_step": 359439, "epoch": 2970} {"train_loss": -42.9473991394043, "global_step": 359440, "epoch": 2970} {"train_loss": -44.95941925048828, "global_step": 359441, "epoch": 2970} {"train_loss": -45.88683319091797, "global_step": 359442, "epoch": 2970} {"train_loss": -45.31084060668945, "global_step": 359443, "epoch": 2970} {"train_loss": -45.35121536254883, "global_step": 359444, "epoch": 2970} {"train_loss": -45.283966064453125, "global_step": 359445, "epoch": 2970} {"train_loss": -45.36576843261719, "global_step": 359446, "epoch": 2970} {"train_loss": -44.9937858581543, "global_step": 359447, "epoch": 2970} {"train_loss": -45.60451126098633, "global_step": 359448, "epoch": 2970} {"train_loss": -45.310848236083984, "global_step": 359449, "epoch": 2970} {"train_loss": -44.30994415283203, "global_step": 359450, "epoch": 2970} {"train_loss": -45.52799606323242, "global_step": 359451, "epoch": 2970} {"train_loss": -45.31815719604492, "global_step": 359452, "epoch": 2970} {"train_loss": -45.20054626464844, "global_step": 359453, "epoch": 2970} {"train_loss": -40.735313415527344, "global_step": 359454, "epoch": 2970} {"train_loss": -45.6189079284668, "global_step": 359455, "epoch": 2970} {"train_loss": -35.79916000366211, "global_step": 359456, "epoch": 2970} {"train_loss": -45.54182815551758, "global_step": 359457, "epoch": 2970} {"train_loss": -45.217384338378906, "global_step": 359458, "epoch": 2970} {"train_loss": -45.52362060546875, "global_step": 359459, "epoch": 2970} {"train_loss": -43.95081329345703, "global_step": 359460, "epoch": 2970} {"train_loss": -44.75654220581055, "global_step": 359461, "epoch": 2970} {"train_loss": -42.42144775390625, "global_step": 359462, "epoch": 2970} {"train_loss": -43.413875579833984, "global_step": 359463, "epoch": 2970} {"train_loss": -44.34091567993164, "global_step": 359464, "epoch": 2970} {"train_loss": -42.52617645263672, "global_step": 359465, "epoch": 2970} {"train_loss": -42.77544021606445, "global_step": 359466, "epoch": 2970} {"train_loss": -43.23794174194336, "global_step": 359467, "epoch": 2970} {"train_loss": -41.61186218261719, "global_step": 359468, "epoch": 2970} {"train_loss": -44.566932678222656, "global_step": 359469, "epoch": 2970} {"train_loss": -39.863277435302734, "global_step": 359470, "epoch": 2970} {"train_loss": -37.91448974609375, "global_step": 359471, "epoch": 2970} {"train_loss": -40.58793258666992, "global_step": 359472, "epoch": 2970} {"train_loss": -43.80088424682617, "global_step": 359473, "epoch": 2970} {"train_loss": -40.09135818481445, "global_step": 359474, "epoch": 2970} {"train_loss": -34.06191635131836, "global_step": 359475, "epoch": 2970} {"train_loss": -32.01530838012695, "global_step": 359476, "epoch": 2970} {"train_loss": -36.52811813354492, "global_step": 359477, "epoch": 2970} {"train_loss": -40.39064407348633, "global_step": 359478, "epoch": 2970} {"train_loss": -43.297149658203125, "global_step": 359479, "epoch": 2970} {"train_loss": -42.6349983215332, "global_step": 359480, "epoch": 2970} {"train_loss": -38.333045959472656, "global_step": 359481, "epoch": 2970} {"train_loss": -40.2364387512207, "global_step": 359482, "epoch": 2970} {"train_loss": -41.4439811706543, "global_step": 359483, "epoch": 2970} {"train_loss": -40.85573959350586, "global_step": 359484, "epoch": 2970} {"train_loss": -40.76620101928711, "global_step": 359485, "epoch": 2970} {"train_loss": -40.49031066894531, "global_step": 359486, "epoch": 2970} {"train_loss": -41.18851852416992, "global_step": 359487, "epoch": 2970} {"train_loss": -41.941650390625, "global_step": 359488, "epoch": 2970} {"train_loss": -37.653995513916016, "global_step": 359489, "epoch": 2970} {"train_loss": -42.635211471683725, "global_step": 359490, "epoch": 2970, "val_loss": 2861835.25} {"train_loss": -42.37076187133789, "global_step": 359491, "epoch": 2971} {"train_loss": -43.491363525390625, "global_step": 359492, "epoch": 2971} {"train_loss": -42.84857940673828, "global_step": 359493, "epoch": 2971} {"train_loss": -41.708580017089844, "global_step": 359494, "epoch": 2971} {"train_loss": -42.846981048583984, "global_step": 359495, "epoch": 2971} {"train_loss": -43.02743148803711, "global_step": 359496, "epoch": 2971} {"train_loss": -41.560916900634766, "global_step": 359497, "epoch": 2971} {"train_loss": -42.99546432495117, "global_step": 359498, "epoch": 2971} {"train_loss": -43.6770133972168, "global_step": 359499, "epoch": 2971} {"train_loss": -43.367366790771484, "global_step": 359500, "epoch": 2971} {"train_loss": -43.314517974853516, "global_step": 359501, "epoch": 2971} {"train_loss": -43.20168685913086, "global_step": 359502, "epoch": 2971} {"train_loss": -43.37348556518555, "global_step": 359503, "epoch": 2971} {"train_loss": -41.92566680908203, "global_step": 359504, "epoch": 2971} {"train_loss": -43.619014739990234, "global_step": 359505, "epoch": 2971} {"train_loss": -43.745216369628906, "global_step": 359506, "epoch": 2971} {"train_loss": -44.38688278198242, "global_step": 359507, "epoch": 2971} {"train_loss": -42.85578536987305, "global_step": 359508, "epoch": 2971} {"train_loss": -43.63780975341797, "global_step": 359509, "epoch": 2971} {"train_loss": -43.43227767944336, "global_step": 359510, "epoch": 2971} {"train_loss": -42.371334075927734, "global_step": 359511, "epoch": 2971} {"train_loss": -44.4034309387207, "global_step": 359512, "epoch": 2971} {"train_loss": -44.63129806518555, "global_step": 359513, "epoch": 2971} {"train_loss": -44.042457580566406, "global_step": 359514, "epoch": 2971} {"train_loss": -43.22126388549805, "global_step": 359515, "epoch": 2971} {"train_loss": -44.48420333862305, "global_step": 359516, "epoch": 2971} {"train_loss": -44.47174835205078, "global_step": 359517, "epoch": 2971} {"train_loss": -44.62911605834961, "global_step": 359518, "epoch": 2971} {"train_loss": -44.69270706176758, "global_step": 359519, "epoch": 2971} {"train_loss": -44.89823532104492, "global_step": 359520, "epoch": 2971} {"train_loss": -44.519588470458984, "global_step": 359521, "epoch": 2971} {"train_loss": -44.38261795043945, "global_step": 359522, "epoch": 2971} {"train_loss": -44.273406982421875, "global_step": 359523, "epoch": 2971} {"train_loss": -44.44306182861328, "global_step": 359524, "epoch": 2971} {"train_loss": -43.801666259765625, "global_step": 359525, "epoch": 2971} {"train_loss": -45.142333984375, "global_step": 359526, "epoch": 2971} {"train_loss": -44.563323974609375, "global_step": 359527, "epoch": 2971} {"train_loss": -44.11879348754883, "global_step": 359528, "epoch": 2971} {"train_loss": -45.13674545288086, "global_step": 359529, "epoch": 2971} {"train_loss": -44.88466262817383, "global_step": 359530, "epoch": 2971} {"train_loss": -43.870662689208984, "global_step": 359531, "epoch": 2971} {"train_loss": -44.089317321777344, "global_step": 359532, "epoch": 2971} {"train_loss": -45.21696853637695, "global_step": 359533, "epoch": 2971} {"train_loss": -44.25725173950195, "global_step": 359534, "epoch": 2971} {"train_loss": -45.31711959838867, "global_step": 359535, "epoch": 2971} {"train_loss": -45.14204025268555, "global_step": 359536, "epoch": 2971} {"train_loss": -45.554603576660156, "global_step": 359537, "epoch": 2971} {"train_loss": -44.23638153076172, "global_step": 359538, "epoch": 2971} {"train_loss": -44.69027328491211, "global_step": 359539, "epoch": 2971} {"train_loss": -45.52058029174805, "global_step": 359540, "epoch": 2971} {"train_loss": -45.28646469116211, "global_step": 359541, "epoch": 2971} {"train_loss": -45.480934143066406, "global_step": 359542, "epoch": 2971} {"train_loss": -44.169158935546875, "global_step": 359543, "epoch": 2971} {"train_loss": -39.577701568603516, "global_step": 359544, "epoch": 2971} {"train_loss": -44.54270553588867, "global_step": 359545, "epoch": 2971} {"train_loss": -45.35295104980469, "global_step": 359546, "epoch": 2971} {"train_loss": -43.73418045043945, "global_step": 359547, "epoch": 2971} {"train_loss": -45.06524658203125, "global_step": 359548, "epoch": 2971} {"train_loss": -43.283931732177734, "global_step": 359549, "epoch": 2971} {"train_loss": -44.70756530761719, "global_step": 359550, "epoch": 2971} {"train_loss": -44.59601974487305, "global_step": 359551, "epoch": 2971} {"train_loss": -43.91237258911133, "global_step": 359552, "epoch": 2971} {"train_loss": -44.70109558105469, "global_step": 359553, "epoch": 2971} {"train_loss": -45.355342864990234, "global_step": 359554, "epoch": 2971} {"train_loss": -45.55500411987305, "global_step": 359555, "epoch": 2971} {"train_loss": -45.724029541015625, "global_step": 359556, "epoch": 2971} {"train_loss": -44.383182525634766, "global_step": 359557, "epoch": 2971} {"train_loss": -38.500885009765625, "global_step": 359558, "epoch": 2971} {"train_loss": -43.80042266845703, "global_step": 359559, "epoch": 2971} {"train_loss": -44.6448974609375, "global_step": 359560, "epoch": 2971} {"train_loss": -44.835601806640625, "global_step": 359561, "epoch": 2971} {"train_loss": -45.7249870300293, "global_step": 359562, "epoch": 2971} {"train_loss": -44.90372085571289, "global_step": 359563, "epoch": 2971} {"train_loss": -45.38421630859375, "global_step": 359564, "epoch": 2971} {"train_loss": -44.41695022583008, "global_step": 359565, "epoch": 2971} {"train_loss": -43.141300201416016, "global_step": 359566, "epoch": 2971} {"train_loss": -44.17414093017578, "global_step": 359567, "epoch": 2971} {"train_loss": -45.2325325012207, "global_step": 359568, "epoch": 2971} {"train_loss": -44.843223571777344, "global_step": 359569, "epoch": 2971} {"train_loss": -44.781890869140625, "global_step": 359570, "epoch": 2971} {"train_loss": -45.24032211303711, "global_step": 359571, "epoch": 2971} {"train_loss": -44.28779220581055, "global_step": 359572, "epoch": 2971} {"train_loss": -43.92829513549805, "global_step": 359573, "epoch": 2971} {"train_loss": -44.23295211791992, "global_step": 359574, "epoch": 2971} {"train_loss": -44.42524337768555, "global_step": 359575, "epoch": 2971} {"train_loss": -44.9307861328125, "global_step": 359576, "epoch": 2971} {"train_loss": -44.09645462036133, "global_step": 359577, "epoch": 2971} {"train_loss": -43.8475456237793, "global_step": 359578, "epoch": 2971} {"train_loss": -37.85511016845703, "global_step": 359579, "epoch": 2971} {"train_loss": -44.94502639770508, "global_step": 359580, "epoch": 2971} {"train_loss": -44.56611633300781, "global_step": 359581, "epoch": 2971} {"train_loss": -44.04582595825195, "global_step": 359582, "epoch": 2971} {"train_loss": -43.91913986206055, "global_step": 359583, "epoch": 2971} {"train_loss": -43.05160140991211, "global_step": 359584, "epoch": 2971} {"train_loss": -45.191078186035156, "global_step": 359585, "epoch": 2971} {"train_loss": -44.4883918762207, "global_step": 359586, "epoch": 2971} {"train_loss": -44.54383850097656, "global_step": 359587, "epoch": 2971} {"train_loss": -43.8543815612793, "global_step": 359588, "epoch": 2971} {"train_loss": -45.05079650878906, "global_step": 359589, "epoch": 2971} {"train_loss": -44.34571075439453, "global_step": 359590, "epoch": 2971} {"train_loss": -44.18648910522461, "global_step": 359591, "epoch": 2971} {"train_loss": -44.240516662597656, "global_step": 359592, "epoch": 2971} {"train_loss": -45.14640808105469, "global_step": 359593, "epoch": 2971} {"train_loss": -43.9064826965332, "global_step": 359594, "epoch": 2971} {"train_loss": -44.011417388916016, "global_step": 359595, "epoch": 2971} {"train_loss": -44.739315032958984, "global_step": 359596, "epoch": 2971} {"train_loss": -45.31299591064453, "global_step": 359597, "epoch": 2971} {"train_loss": -44.75997543334961, "global_step": 359598, "epoch": 2971} {"train_loss": -43.15232467651367, "global_step": 359599, "epoch": 2971} {"train_loss": -44.5513916015625, "global_step": 359600, "epoch": 2971} {"train_loss": -44.854148864746094, "global_step": 359601, "epoch": 2971} {"train_loss": -45.22468948364258, "global_step": 359602, "epoch": 2971} {"train_loss": -43.73092269897461, "global_step": 359603, "epoch": 2971} {"train_loss": -44.48978805541992, "global_step": 359604, "epoch": 2971} {"train_loss": -42.50078582763672, "global_step": 359605, "epoch": 2971} {"train_loss": -43.774227142333984, "global_step": 359606, "epoch": 2971} {"train_loss": -43.562374114990234, "global_step": 359607, "epoch": 2971} {"train_loss": -44.2021598815918, "global_step": 359608, "epoch": 2971} {"train_loss": -45.27416229248047, "global_step": 359609, "epoch": 2971} {"train_loss": -43.378639221191406, "global_step": 359610, "epoch": 2971} {"train_loss": -44.10405658690397, "global_step": 359611, "epoch": 2971, "val_loss": 2393357.0} {"train_loss": -44.55183792114258, "global_step": 359612, "epoch": 2972} {"train_loss": -44.789180755615234, "global_step": 359613, "epoch": 2972} {"train_loss": -44.45634078979492, "global_step": 359614, "epoch": 2972} {"train_loss": -44.99345779418945, "global_step": 359615, "epoch": 2972} {"train_loss": -44.2802619934082, "global_step": 359616, "epoch": 2972} {"train_loss": -43.03178787231445, "global_step": 359617, "epoch": 2972} {"train_loss": -43.547664642333984, "global_step": 359618, "epoch": 2972} {"train_loss": -41.92643356323242, "global_step": 359619, "epoch": 2972} {"train_loss": -43.18026351928711, "global_step": 359620, "epoch": 2972} {"train_loss": -44.281307220458984, "global_step": 359621, "epoch": 2972} {"train_loss": -39.951786041259766, "global_step": 359622, "epoch": 2972} {"train_loss": -42.13547134399414, "global_step": 359623, "epoch": 2972} {"train_loss": -41.952999114990234, "global_step": 359624, "epoch": 2972} {"train_loss": -40.98944091796875, "global_step": 359625, "epoch": 2972} {"train_loss": -42.11930465698242, "global_step": 359626, "epoch": 2972} {"train_loss": -41.840667724609375, "global_step": 359627, "epoch": 2972} {"train_loss": -43.79261016845703, "global_step": 359628, "epoch": 2972} {"train_loss": -40.84560775756836, "global_step": 359629, "epoch": 2972} {"train_loss": -41.92711639404297, "global_step": 359630, "epoch": 2972} {"train_loss": -43.083553314208984, "global_step": 359631, "epoch": 2972} {"train_loss": -41.0494384765625, "global_step": 359632, "epoch": 2972} {"train_loss": -41.823455810546875, "global_step": 359633, "epoch": 2972} {"train_loss": -43.13435745239258, "global_step": 359634, "epoch": 2972} {"train_loss": -41.46063232421875, "global_step": 359635, "epoch": 2972} {"train_loss": -43.4216423034668, "global_step": 359636, "epoch": 2972} {"train_loss": -43.331478118896484, "global_step": 359637, "epoch": 2972} {"train_loss": -43.09502029418945, "global_step": 359638, "epoch": 2972} {"train_loss": -41.98956298828125, "global_step": 359639, "epoch": 2972} {"train_loss": -43.414459228515625, "global_step": 359640, "epoch": 2972} {"train_loss": -43.05869674682617, "global_step": 359641, "epoch": 2972} {"train_loss": -43.603370666503906, "global_step": 359642, "epoch": 2972} {"train_loss": -42.368377685546875, "global_step": 359643, "epoch": 2972} {"train_loss": -43.61764144897461, "global_step": 359644, "epoch": 2972} {"train_loss": -43.318809509277344, "global_step": 359645, "epoch": 2972} {"train_loss": -42.407466888427734, "global_step": 359646, "epoch": 2972} {"train_loss": -44.75876235961914, "global_step": 359647, "epoch": 2972} {"train_loss": -42.68148422241211, "global_step": 359648, "epoch": 2972} {"train_loss": -42.842708587646484, "global_step": 359649, "epoch": 2972} {"train_loss": -43.63712692260742, "global_step": 359650, "epoch": 2972} {"train_loss": -43.2712516784668, "global_step": 359651, "epoch": 2972} {"train_loss": -42.253684997558594, "global_step": 359652, "epoch": 2972} {"train_loss": -43.708919525146484, "global_step": 359653, "epoch": 2972} {"train_loss": -43.1777229309082, "global_step": 359654, "epoch": 2972} {"train_loss": -44.558441162109375, "global_step": 359655, "epoch": 2972} {"train_loss": -43.47025680541992, "global_step": 359656, "epoch": 2972} {"train_loss": -44.11259841918945, "global_step": 359657, "epoch": 2972} {"train_loss": -44.11505889892578, "global_step": 359658, "epoch": 2972} {"train_loss": -44.12997055053711, "global_step": 359659, "epoch": 2972} {"train_loss": -44.227237701416016, "global_step": 359660, "epoch": 2972} {"train_loss": -44.070960998535156, "global_step": 359661, "epoch": 2972} {"train_loss": -44.85914993286133, "global_step": 359662, "epoch": 2972} {"train_loss": -44.290279388427734, "global_step": 359663, "epoch": 2972} {"train_loss": -44.61154556274414, "global_step": 359664, "epoch": 2972} {"train_loss": -45.15562438964844, "global_step": 359665, "epoch": 2972} {"train_loss": -45.04469680786133, "global_step": 359666, "epoch": 2972} {"train_loss": -44.437408447265625, "global_step": 359667, "epoch": 2972} {"train_loss": -44.8161735534668, "global_step": 359668, "epoch": 2972} {"train_loss": -45.048004150390625, "global_step": 359669, "epoch": 2972} {"train_loss": -44.54690170288086, "global_step": 359670, "epoch": 2972} {"train_loss": -43.941375732421875, "global_step": 359671, "epoch": 2972} {"train_loss": -44.89833068847656, "global_step": 359672, "epoch": 2972} {"train_loss": -44.24561309814453, "global_step": 359673, "epoch": 2972} {"train_loss": -45.117286682128906, "global_step": 359674, "epoch": 2972} {"train_loss": -44.23896789550781, "global_step": 359675, "epoch": 2972} {"train_loss": -44.75761032104492, "global_step": 359676, "epoch": 2972} {"train_loss": -44.89711380004883, "global_step": 359677, "epoch": 2972} {"train_loss": -44.09975814819336, "global_step": 359678, "epoch": 2972} {"train_loss": -45.05739974975586, "global_step": 359679, "epoch": 2972} {"train_loss": -44.725616455078125, "global_step": 359680, "epoch": 2972} {"train_loss": -45.2694206237793, "global_step": 359681, "epoch": 2972} {"train_loss": -44.66427230834961, "global_step": 359682, "epoch": 2972} {"train_loss": -45.44829559326172, "global_step": 359683, "epoch": 2972} {"train_loss": -45.38591766357422, "global_step": 359684, "epoch": 2972} {"train_loss": -45.2731819152832, "global_step": 359685, "epoch": 2972} {"train_loss": -44.952239990234375, "global_step": 359686, "epoch": 2972} {"train_loss": -44.549232482910156, "global_step": 359687, "epoch": 2972} {"train_loss": -45.81172561645508, "global_step": 359688, "epoch": 2972} {"train_loss": -45.717323303222656, "global_step": 359689, "epoch": 2972} {"train_loss": -45.66555404663086, "global_step": 359690, "epoch": 2972} {"train_loss": -45.7292594909668, "global_step": 359691, "epoch": 2972} {"train_loss": -45.00800323486328, "global_step": 359692, "epoch": 2972} {"train_loss": -45.5597038269043, "global_step": 359693, "epoch": 2972} {"train_loss": -45.75505447387695, "global_step": 359694, "epoch": 2972} {"train_loss": -45.171390533447266, "global_step": 359695, "epoch": 2972} {"train_loss": -45.079402923583984, "global_step": 359696, "epoch": 2972} {"train_loss": -45.01778793334961, "global_step": 359697, "epoch": 2972} {"train_loss": -44.92836380004883, "global_step": 359698, "epoch": 2972} {"train_loss": -44.84137725830078, "global_step": 359699, "epoch": 2972} {"train_loss": -44.2273063659668, "global_step": 359700, "epoch": 2972} {"train_loss": -44.81906509399414, "global_step": 359701, "epoch": 2972} {"train_loss": -44.63180160522461, "global_step": 359702, "epoch": 2972} {"train_loss": -44.40244674682617, "global_step": 359703, "epoch": 2972} {"train_loss": -44.733612060546875, "global_step": 359704, "epoch": 2972} {"train_loss": -44.7661247253418, "global_step": 359705, "epoch": 2972} {"train_loss": -43.898075103759766, "global_step": 359706, "epoch": 2972} {"train_loss": -44.31328201293945, "global_step": 359707, "epoch": 2972} {"train_loss": -44.77759552001953, "global_step": 359708, "epoch": 2972} {"train_loss": -44.063880920410156, "global_step": 359709, "epoch": 2972} {"train_loss": -45.31289291381836, "global_step": 359710, "epoch": 2972} {"train_loss": -44.10274124145508, "global_step": 359711, "epoch": 2972} {"train_loss": -44.6038818359375, "global_step": 359712, "epoch": 2972} {"train_loss": -45.01789474487305, "global_step": 359713, "epoch": 2972} {"train_loss": -44.562557220458984, "global_step": 359714, "epoch": 2972} {"train_loss": -45.30499267578125, "global_step": 359715, "epoch": 2972} {"train_loss": -43.024147033691406, "global_step": 359716, "epoch": 2972} {"train_loss": -44.30179977416992, "global_step": 359717, "epoch": 2972} {"train_loss": -45.292274475097656, "global_step": 359718, "epoch": 2972} {"train_loss": -44.769386291503906, "global_step": 359719, "epoch": 2972} {"train_loss": -44.69666290283203, "global_step": 359720, "epoch": 2972} {"train_loss": -44.63776397705078, "global_step": 359721, "epoch": 2972} {"train_loss": -43.751197814941406, "global_step": 359722, "epoch": 2972} {"train_loss": -45.39364242553711, "global_step": 359723, "epoch": 2972} {"train_loss": -45.40782928466797, "global_step": 359724, "epoch": 2972} {"train_loss": -44.075435638427734, "global_step": 359725, "epoch": 2972} {"train_loss": -44.60435104370117, "global_step": 359726, "epoch": 2972} {"train_loss": -45.33882522583008, "global_step": 359727, "epoch": 2972} {"train_loss": -45.38373947143555, "global_step": 359728, "epoch": 2972} {"train_loss": -45.46310043334961, "global_step": 359729, "epoch": 2972} {"train_loss": -44.63385009765625, "global_step": 359730, "epoch": 2972} {"train_loss": -44.459014892578125, "global_step": 359731, "epoch": 2972} {"train_loss": -44.09923112096865, "global_step": 359732, "epoch": 2972, "val_loss": 2428480.0} {"train_loss": -44.21413803100586, "global_step": 359733, "epoch": 2973} {"train_loss": -44.7769660949707, "global_step": 359734, "epoch": 2973} {"train_loss": -45.64188766479492, "global_step": 359735, "epoch": 2973} {"train_loss": -44.37441635131836, "global_step": 359736, "epoch": 2973} {"train_loss": -44.538265228271484, "global_step": 359737, "epoch": 2973} {"train_loss": -44.87501907348633, "global_step": 359738, "epoch": 2973} {"train_loss": -44.9013786315918, "global_step": 359739, "epoch": 2973} {"train_loss": -45.19904708862305, "global_step": 359740, "epoch": 2973} {"train_loss": -44.34452438354492, "global_step": 359741, "epoch": 2973} {"train_loss": -43.23606491088867, "global_step": 359742, "epoch": 2973} {"train_loss": -44.22454071044922, "global_step": 359743, "epoch": 2973} {"train_loss": -45.50132369995117, "global_step": 359744, "epoch": 2973} {"train_loss": -43.749080657958984, "global_step": 359745, "epoch": 2973} {"train_loss": -42.771697998046875, "global_step": 359746, "epoch": 2973} {"train_loss": -44.03034591674805, "global_step": 359747, "epoch": 2973} {"train_loss": -44.89833068847656, "global_step": 359748, "epoch": 2973} {"train_loss": -43.643470764160156, "global_step": 359749, "epoch": 2973} {"train_loss": -44.06793975830078, "global_step": 359750, "epoch": 2973} {"train_loss": -44.89760971069336, "global_step": 359751, "epoch": 2973} {"train_loss": -43.63410949707031, "global_step": 359752, "epoch": 2973} {"train_loss": -43.90460205078125, "global_step": 359753, "epoch": 2973} {"train_loss": -44.14539337158203, "global_step": 359754, "epoch": 2973} {"train_loss": -44.497344970703125, "global_step": 359755, "epoch": 2973} {"train_loss": -44.631805419921875, "global_step": 359756, "epoch": 2973} {"train_loss": -45.10576248168945, "global_step": 359757, "epoch": 2973} {"train_loss": -45.40753173828125, "global_step": 359758, "epoch": 2973} {"train_loss": -44.84815216064453, "global_step": 359759, "epoch": 2973} {"train_loss": -44.947872161865234, "global_step": 359760, "epoch": 2973} {"train_loss": -45.43475341796875, "global_step": 359761, "epoch": 2973} {"train_loss": -43.18341064453125, "global_step": 359762, "epoch": 2973} {"train_loss": -45.09249496459961, "global_step": 359763, "epoch": 2973} {"train_loss": -44.65432357788086, "global_step": 359764, "epoch": 2973} {"train_loss": -44.70453643798828, "global_step": 359765, "epoch": 2973} {"train_loss": -44.746124267578125, "global_step": 359766, "epoch": 2973} {"train_loss": -45.15793991088867, "global_step": 359767, "epoch": 2973} {"train_loss": -45.05154800415039, "global_step": 359768, "epoch": 2973} {"train_loss": -44.94340133666992, "global_step": 359769, "epoch": 2973} {"train_loss": -45.39308166503906, "global_step": 359770, "epoch": 2973} {"train_loss": -44.42499542236328, "global_step": 359771, "epoch": 2973} {"train_loss": -44.28989028930664, "global_step": 359772, "epoch": 2973} {"train_loss": -44.7641487121582, "global_step": 359773, "epoch": 2973} {"train_loss": -44.79657745361328, "global_step": 359774, "epoch": 2973} {"train_loss": -44.79545593261719, "global_step": 359775, "epoch": 2973} {"train_loss": -45.25262451171875, "global_step": 359776, "epoch": 2973} {"train_loss": -45.4935188293457, "global_step": 359777, "epoch": 2973} {"train_loss": -45.43609619140625, "global_step": 359778, "epoch": 2973} {"train_loss": -45.47100830078125, "global_step": 359779, "epoch": 2973} {"train_loss": -44.917293548583984, "global_step": 359780, "epoch": 2973} {"train_loss": -45.06940841674805, "global_step": 359781, "epoch": 2973} {"train_loss": -44.21087646484375, "global_step": 359782, "epoch": 2973} {"train_loss": -43.174835205078125, "global_step": 359783, "epoch": 2973} {"train_loss": -44.42006301879883, "global_step": 359784, "epoch": 2973} {"train_loss": -44.74365234375, "global_step": 359785, "epoch": 2973} {"train_loss": -43.55256271362305, "global_step": 359786, "epoch": 2973} {"train_loss": -40.92537307739258, "global_step": 359787, "epoch": 2973} {"train_loss": -44.796504974365234, "global_step": 359788, "epoch": 2973} {"train_loss": -43.86375045776367, "global_step": 359789, "epoch": 2973} {"train_loss": -43.71110153198242, "global_step": 359790, "epoch": 2973} {"train_loss": -44.791236877441406, "global_step": 359791, "epoch": 2973} {"train_loss": -45.1049919128418, "global_step": 359792, "epoch": 2973} {"train_loss": -43.36872482299805, "global_step": 359793, "epoch": 2973} {"train_loss": -45.038978576660156, "global_step": 359794, "epoch": 2973} {"train_loss": -44.40315628051758, "global_step": 359795, "epoch": 2973} {"train_loss": -44.16221237182617, "global_step": 359796, "epoch": 2973} {"train_loss": -44.547447204589844, "global_step": 359797, "epoch": 2973} {"train_loss": -43.974090576171875, "global_step": 359798, "epoch": 2973} {"train_loss": -43.92727279663086, "global_step": 359799, "epoch": 2973} {"train_loss": -44.51862335205078, "global_step": 359800, "epoch": 2973} {"train_loss": -44.60980224609375, "global_step": 359801, "epoch": 2973} {"train_loss": -44.32459259033203, "global_step": 359802, "epoch": 2973} {"train_loss": -44.26728057861328, "global_step": 359803, "epoch": 2973} {"train_loss": -44.309322357177734, "global_step": 359804, "epoch": 2973} {"train_loss": -45.5295295715332, "global_step": 359805, "epoch": 2973} {"train_loss": -44.33161163330078, "global_step": 359806, "epoch": 2973} {"train_loss": -45.5120964050293, "global_step": 359807, "epoch": 2973} {"train_loss": -44.64229202270508, "global_step": 359808, "epoch": 2973} {"train_loss": -45.00129318237305, "global_step": 359809, "epoch": 2973} {"train_loss": -45.09979248046875, "global_step": 359810, "epoch": 2973} {"train_loss": -44.317562103271484, "global_step": 359811, "epoch": 2973} {"train_loss": -44.12148666381836, "global_step": 359812, "epoch": 2973} {"train_loss": -44.77167892456055, "global_step": 359813, "epoch": 2973} {"train_loss": -45.4777946472168, "global_step": 359814, "epoch": 2973} {"train_loss": -44.27587127685547, "global_step": 359815, "epoch": 2973} {"train_loss": -44.69544219970703, "global_step": 359816, "epoch": 2973} {"train_loss": -45.382171630859375, "global_step": 359817, "epoch": 2973} {"train_loss": -44.75759506225586, "global_step": 359818, "epoch": 2973} {"train_loss": -44.874446868896484, "global_step": 359819, "epoch": 2973} {"train_loss": -45.282161712646484, "global_step": 359820, "epoch": 2973} {"train_loss": -45.173580169677734, "global_step": 359821, "epoch": 2973} {"train_loss": -45.46296310424805, "global_step": 359822, "epoch": 2973} {"train_loss": -43.99333953857422, "global_step": 359823, "epoch": 2973} {"train_loss": -45.88920211791992, "global_step": 359824, "epoch": 2973} {"train_loss": -45.45746994018555, "global_step": 359825, "epoch": 2973} {"train_loss": -45.18628692626953, "global_step": 359826, "epoch": 2973} {"train_loss": -45.17140579223633, "global_step": 359827, "epoch": 2973} {"train_loss": -45.03244400024414, "global_step": 359828, "epoch": 2973} {"train_loss": -44.979061126708984, "global_step": 359829, "epoch": 2973} {"train_loss": -44.9202766418457, "global_step": 359830, "epoch": 2973} {"train_loss": -44.97111892700195, "global_step": 359831, "epoch": 2973} {"train_loss": -45.079612731933594, "global_step": 359832, "epoch": 2973} {"train_loss": -44.988502502441406, "global_step": 359833, "epoch": 2973} {"train_loss": -44.4356575012207, "global_step": 359834, "epoch": 2973} {"train_loss": -43.6780891418457, "global_step": 359835, "epoch": 2973} {"train_loss": -44.27488708496094, "global_step": 359836, "epoch": 2973} {"train_loss": -44.86615753173828, "global_step": 359837, "epoch": 2973} {"train_loss": -43.5974235534668, "global_step": 359838, "epoch": 2973} {"train_loss": -43.82815170288086, "global_step": 359839, "epoch": 2973} {"train_loss": -44.48757553100586, "global_step": 359840, "epoch": 2973} {"train_loss": -43.50095748901367, "global_step": 359841, "epoch": 2973} {"train_loss": -42.495460510253906, "global_step": 359842, "epoch": 2973} {"train_loss": -43.11259460449219, "global_step": 359843, "epoch": 2973} {"train_loss": -44.15825271606445, "global_step": 359844, "epoch": 2973} {"train_loss": -36.218902587890625, "global_step": 359845, "epoch": 2973} {"train_loss": -43.6442756652832, "global_step": 359846, "epoch": 2973} {"train_loss": -41.709346771240234, "global_step": 359847, "epoch": 2973} {"train_loss": -40.495933532714844, "global_step": 359848, "epoch": 2973} {"train_loss": -42.50847625732422, "global_step": 359849, "epoch": 2973} {"train_loss": -40.50529861450195, "global_step": 359850, "epoch": 2973} {"train_loss": -39.9977912902832, "global_step": 359851, "epoch": 2973} {"train_loss": -43.137672424316406, "global_step": 359852, "epoch": 2973} {"train_loss": -44.267583642124144, "global_step": 359853, "epoch": 2973, "val_loss": 2354370.75} {"train_loss": -38.16752243041992, "global_step": 359854, "epoch": 2974} {"train_loss": -40.34589767456055, "global_step": 359855, "epoch": 2974} {"train_loss": -40.19026565551758, "global_step": 359856, "epoch": 2974} {"train_loss": -20.915775299072266, "global_step": 359857, "epoch": 2974} {"train_loss": -36.810028076171875, "global_step": 359858, "epoch": 2974} {"train_loss": -39.50832748413086, "global_step": 359859, "epoch": 2974} {"train_loss": -40.93270492553711, "global_step": 359860, "epoch": 2974} {"train_loss": -39.8051643371582, "global_step": 359861, "epoch": 2974} {"train_loss": -37.0712890625, "global_step": 359862, "epoch": 2974} {"train_loss": -39.534847259521484, "global_step": 359863, "epoch": 2974} {"train_loss": -40.186885833740234, "global_step": 359864, "epoch": 2974} {"train_loss": -38.61598587036133, "global_step": 359865, "epoch": 2974} {"train_loss": -40.1762809753418, "global_step": 359866, "epoch": 2974} {"train_loss": -40.835140228271484, "global_step": 359867, "epoch": 2974} {"train_loss": -40.734169006347656, "global_step": 359868, "epoch": 2974} {"train_loss": -40.1937370300293, "global_step": 359869, "epoch": 2974} {"train_loss": -37.90060043334961, "global_step": 359870, "epoch": 2974} {"train_loss": -40.44456100463867, "global_step": 359871, "epoch": 2974} {"train_loss": -39.44995880126953, "global_step": 359872, "epoch": 2974} {"train_loss": -37.985225677490234, "global_step": 359873, "epoch": 2974} {"train_loss": -40.7208366394043, "global_step": 359874, "epoch": 2974} {"train_loss": -40.091487884521484, "global_step": 359875, "epoch": 2974} {"train_loss": -42.019344329833984, "global_step": 359876, "epoch": 2974} {"train_loss": -38.67351150512695, "global_step": 359877, "epoch": 2974} {"train_loss": -40.33584213256836, "global_step": 359878, "epoch": 2974} {"train_loss": -41.57896041870117, "global_step": 359879, "epoch": 2974} {"train_loss": -41.66621398925781, "global_step": 359880, "epoch": 2974} {"train_loss": -41.755897521972656, "global_step": 359881, "epoch": 2974} {"train_loss": -41.959678649902344, "global_step": 359882, "epoch": 2974} {"train_loss": -41.1551628112793, "global_step": 359883, "epoch": 2974} {"train_loss": -41.9057502746582, "global_step": 359884, "epoch": 2974} {"train_loss": -41.626319885253906, "global_step": 359885, "epoch": 2974} {"train_loss": -40.874141693115234, "global_step": 359886, "epoch": 2974} {"train_loss": -42.23872756958008, "global_step": 359887, "epoch": 2974} {"train_loss": -40.861915588378906, "global_step": 359888, "epoch": 2974} {"train_loss": -42.8816032409668, "global_step": 359889, "epoch": 2974} {"train_loss": -41.830909729003906, "global_step": 359890, "epoch": 2974} {"train_loss": -41.61996841430664, "global_step": 359891, "epoch": 2974} {"train_loss": -43.53109359741211, "global_step": 359892, "epoch": 2974} {"train_loss": -42.646697998046875, "global_step": 359893, "epoch": 2974} {"train_loss": -42.841617584228516, "global_step": 359894, "epoch": 2974} {"train_loss": -43.38529586791992, "global_step": 359895, "epoch": 2974} {"train_loss": -42.88942337036133, "global_step": 359896, "epoch": 2974} {"train_loss": -43.11750793457031, "global_step": 359897, "epoch": 2974} {"train_loss": -43.54375457763672, "global_step": 359898, "epoch": 2974} {"train_loss": -42.7336311340332, "global_step": 359899, "epoch": 2974} {"train_loss": -43.391822814941406, "global_step": 359900, "epoch": 2974} {"train_loss": -43.39881134033203, "global_step": 359901, "epoch": 2974} {"train_loss": -43.338043212890625, "global_step": 359902, "epoch": 2974} {"train_loss": -43.72304153442383, "global_step": 359903, "epoch": 2974} {"train_loss": -43.62656784057617, "global_step": 359904, "epoch": 2974} {"train_loss": -43.994564056396484, "global_step": 359905, "epoch": 2974} {"train_loss": -43.675777435302734, "global_step": 359906, "epoch": 2974} {"train_loss": -43.445152282714844, "global_step": 359907, "epoch": 2974} {"train_loss": -43.84884262084961, "global_step": 359908, "epoch": 2974} {"train_loss": -43.66140365600586, "global_step": 359909, "epoch": 2974} {"train_loss": -44.2813720703125, "global_step": 359910, "epoch": 2974} {"train_loss": -43.106624603271484, "global_step": 359911, "epoch": 2974} {"train_loss": -43.89332580566406, "global_step": 359912, "epoch": 2974} {"train_loss": -43.09273910522461, "global_step": 359913, "epoch": 2974} {"train_loss": -43.63349151611328, "global_step": 359914, "epoch": 2974} {"train_loss": -44.02531433105469, "global_step": 359915, "epoch": 2974} {"train_loss": -44.09113311767578, "global_step": 359916, "epoch": 2974} {"train_loss": -44.446834564208984, "global_step": 359917, "epoch": 2974} {"train_loss": -44.63850784301758, "global_step": 359918, "epoch": 2974} {"train_loss": -44.31051254272461, "global_step": 359919, "epoch": 2974} {"train_loss": -44.51643371582031, "global_step": 359920, "epoch": 2974} {"train_loss": -43.697139739990234, "global_step": 359921, "epoch": 2974} {"train_loss": -44.238983154296875, "global_step": 359922, "epoch": 2974} {"train_loss": -44.78631591796875, "global_step": 359923, "epoch": 2974} {"train_loss": -43.355072021484375, "global_step": 359924, "epoch": 2974} {"train_loss": -44.14637756347656, "global_step": 359925, "epoch": 2974} {"train_loss": -44.747310638427734, "global_step": 359926, "epoch": 2974} {"train_loss": -44.05901336669922, "global_step": 359927, "epoch": 2974} {"train_loss": -44.58060836791992, "global_step": 359928, "epoch": 2974} {"train_loss": -44.7806282043457, "global_step": 359929, "epoch": 2974} {"train_loss": -44.147159576416016, "global_step": 359930, "epoch": 2974} {"train_loss": -44.95318603515625, "global_step": 359931, "epoch": 2974} {"train_loss": -43.50320816040039, "global_step": 359932, "epoch": 2974} {"train_loss": -44.126380920410156, "global_step": 359933, "epoch": 2974} {"train_loss": -44.32986068725586, "global_step": 359934, "epoch": 2974} {"train_loss": -44.10872268676758, "global_step": 359935, "epoch": 2974} {"train_loss": -44.90902328491211, "global_step": 359936, "epoch": 2974} {"train_loss": -44.84046173095703, "global_step": 359937, "epoch": 2974} {"train_loss": -44.44089126586914, "global_step": 359938, "epoch": 2974} {"train_loss": -44.4068717956543, "global_step": 359939, "epoch": 2974} {"train_loss": -44.4934196472168, "global_step": 359940, "epoch": 2974} {"train_loss": -45.1075325012207, "global_step": 359941, "epoch": 2974} {"train_loss": -44.87739181518555, "global_step": 359942, "epoch": 2974} {"train_loss": -44.836151123046875, "global_step": 359943, "epoch": 2974} {"train_loss": -44.74367141723633, "global_step": 359944, "epoch": 2974} {"train_loss": -44.71571350097656, "global_step": 359945, "epoch": 2974} {"train_loss": -44.29489517211914, "global_step": 359946, "epoch": 2974} {"train_loss": -45.5119514465332, "global_step": 359947, "epoch": 2974} {"train_loss": -44.882781982421875, "global_step": 359948, "epoch": 2974} {"train_loss": -44.74713134765625, "global_step": 359949, "epoch": 2974} {"train_loss": -45.44329833984375, "global_step": 359950, "epoch": 2974} {"train_loss": -44.91039276123047, "global_step": 359951, "epoch": 2974} {"train_loss": -44.652645111083984, "global_step": 359952, "epoch": 2974} {"train_loss": -44.86416244506836, "global_step": 359953, "epoch": 2974} {"train_loss": -45.61827087402344, "global_step": 359954, "epoch": 2974} {"train_loss": -44.97892379760742, "global_step": 359955, "epoch": 2974} {"train_loss": -44.665130615234375, "global_step": 359956, "epoch": 2974} {"train_loss": -45.45852279663086, "global_step": 359957, "epoch": 2974} {"train_loss": -44.782188415527344, "global_step": 359958, "epoch": 2974} {"train_loss": -45.00725173950195, "global_step": 359959, "epoch": 2974} {"train_loss": -45.562068939208984, "global_step": 359960, "epoch": 2974} {"train_loss": -45.30723190307617, "global_step": 359961, "epoch": 2974} {"train_loss": -44.81640625, "global_step": 359962, "epoch": 2974} {"train_loss": -44.983154296875, "global_step": 359963, "epoch": 2974} {"train_loss": -44.58390426635742, "global_step": 359964, "epoch": 2974} {"train_loss": -45.743080139160156, "global_step": 359965, "epoch": 2974} {"train_loss": -44.934593200683594, "global_step": 359966, "epoch": 2974} {"train_loss": -44.28096389770508, "global_step": 359967, "epoch": 2974} {"train_loss": -45.12581253051758, "global_step": 359968, "epoch": 2974} {"train_loss": -45.413936614990234, "global_step": 359969, "epoch": 2974} {"train_loss": -44.52705001831055, "global_step": 359970, "epoch": 2974} {"train_loss": -44.03515625, "global_step": 359971, "epoch": 2974} {"train_loss": -43.3277702331543, "global_step": 359972, "epoch": 2974} {"train_loss": -43.188446044921875, "global_step": 359973, "epoch": 2974} {"train_loss": -42.87549531164248, "global_step": 359974, "epoch": 2974, "val_loss": 2393750.5} {"train_loss": -45.509639739990234, "global_step": 359975, "epoch": 2975} {"train_loss": -45.3681640625, "global_step": 359976, "epoch": 2975} {"train_loss": -45.10874557495117, "global_step": 359977, "epoch": 2975} {"train_loss": -44.52171325683594, "global_step": 359978, "epoch": 2975} {"train_loss": -45.038063049316406, "global_step": 359979, "epoch": 2975} {"train_loss": -45.377838134765625, "global_step": 359980, "epoch": 2975} {"train_loss": -44.85968780517578, "global_step": 359981, "epoch": 2975} {"train_loss": -44.45789337158203, "global_step": 359982, "epoch": 2975} {"train_loss": -44.9169921875, "global_step": 359983, "epoch": 2975} {"train_loss": -44.31965255737305, "global_step": 359984, "epoch": 2975} {"train_loss": -44.55349349975586, "global_step": 359985, "epoch": 2975} {"train_loss": -43.942718505859375, "global_step": 359986, "epoch": 2975} {"train_loss": -43.07989501953125, "global_step": 359987, "epoch": 2975} {"train_loss": -44.8018798828125, "global_step": 359988, "epoch": 2975} {"train_loss": -45.1950798034668, "global_step": 359989, "epoch": 2975} {"train_loss": -43.06834411621094, "global_step": 359990, "epoch": 2975} {"train_loss": -42.063575744628906, "global_step": 359991, "epoch": 2975} {"train_loss": -42.45349884033203, "global_step": 359992, "epoch": 2975} {"train_loss": -44.83625411987305, "global_step": 359993, "epoch": 2975} {"train_loss": -44.94752883911133, "global_step": 359994, "epoch": 2975} {"train_loss": -41.7912483215332, "global_step": 359995, "epoch": 2975} {"train_loss": -40.58431625366211, "global_step": 359996, "epoch": 2975} {"train_loss": -44.232643127441406, "global_step": 359997, "epoch": 2975} {"train_loss": -43.54783248901367, "global_step": 359998, "epoch": 2975} {"train_loss": -42.24637985229492, "global_step": 359999, "epoch": 2975} {"train_loss": -42.53195571899414, "global_step": 360000, "epoch": 2975} {"train_loss": -43.55756759643555, "global_step": 360001, "epoch": 2975} {"train_loss": -43.69232940673828, "global_step": 360002, "epoch": 2975} {"train_loss": -43.10401153564453, "global_step": 360003, "epoch": 2975} {"train_loss": -42.8975715637207, "global_step": 360004, "epoch": 2975} {"train_loss": -43.0376091003418, "global_step": 360005, "epoch": 2975} {"train_loss": -39.379878997802734, "global_step": 360006, "epoch": 2975} {"train_loss": -42.444942474365234, "global_step": 360007, "epoch": 2975} {"train_loss": -42.67470169067383, "global_step": 360008, "epoch": 2975} {"train_loss": -38.85831832885742, "global_step": 360009, "epoch": 2975} {"train_loss": -43.44141387939453, "global_step": 360010, "epoch": 2975} {"train_loss": -38.112693786621094, "global_step": 360011, "epoch": 2975} {"train_loss": -41.00971603393555, "global_step": 360012, "epoch": 2975} {"train_loss": -36.45050048828125, "global_step": 360013, "epoch": 2975} {"train_loss": -36.75216293334961, "global_step": 360014, "epoch": 2975} {"train_loss": -39.10969924926758, "global_step": 360015, "epoch": 2975} {"train_loss": -39.68378829956055, "global_step": 360016, "epoch": 2975} {"train_loss": -37.40656661987305, "global_step": 360017, "epoch": 2975} {"train_loss": -39.93244552612305, "global_step": 360018, "epoch": 2975} {"train_loss": -39.2960090637207, "global_step": 360019, "epoch": 2975} {"train_loss": -37.59769821166992, "global_step": 360020, "epoch": 2975} {"train_loss": -39.765411376953125, "global_step": 360021, "epoch": 2975} {"train_loss": -40.42612838745117, "global_step": 360022, "epoch": 2975} {"train_loss": -40.979801177978516, "global_step": 360023, "epoch": 2975} {"train_loss": -41.33803939819336, "global_step": 360024, "epoch": 2975} {"train_loss": -40.01761245727539, "global_step": 360025, "epoch": 2975} {"train_loss": -42.80464553833008, "global_step": 360026, "epoch": 2975} {"train_loss": -39.41413116455078, "global_step": 360027, "epoch": 2975} {"train_loss": -42.89870834350586, "global_step": 360028, "epoch": 2975} {"train_loss": -41.2235107421875, "global_step": 360029, "epoch": 2975} {"train_loss": -41.47835159301758, "global_step": 360030, "epoch": 2975} {"train_loss": -42.25077438354492, "global_step": 360031, "epoch": 2975} {"train_loss": -41.31319808959961, "global_step": 360032, "epoch": 2975} {"train_loss": -42.744171142578125, "global_step": 360033, "epoch": 2975} {"train_loss": -42.11549758911133, "global_step": 360034, "epoch": 2975} {"train_loss": -43.43472671508789, "global_step": 360035, "epoch": 2975} {"train_loss": -42.73983383178711, "global_step": 360036, "epoch": 2975} {"train_loss": -43.08051681518555, "global_step": 360037, "epoch": 2975} {"train_loss": -42.69489669799805, "global_step": 360038, "epoch": 2975} {"train_loss": -42.109066009521484, "global_step": 360039, "epoch": 2975} {"train_loss": -43.38566207885742, "global_step": 360040, "epoch": 2975} {"train_loss": -43.59782028198242, "global_step": 360041, "epoch": 2975} {"train_loss": -43.10770797729492, "global_step": 360042, "epoch": 2975} {"train_loss": -44.037105560302734, "global_step": 360043, "epoch": 2975} {"train_loss": -43.15888214111328, "global_step": 360044, "epoch": 2975} {"train_loss": -44.0159912109375, "global_step": 360045, "epoch": 2975} {"train_loss": -43.94501876831055, "global_step": 360046, "epoch": 2975} {"train_loss": -43.71914291381836, "global_step": 360047, "epoch": 2975} {"train_loss": -44.383338928222656, "global_step": 360048, "epoch": 2975} {"train_loss": -44.0885124206543, "global_step": 360049, "epoch": 2975} {"train_loss": -44.477638244628906, "global_step": 360050, "epoch": 2975} {"train_loss": -44.062191009521484, "global_step": 360051, "epoch": 2975} {"train_loss": -44.19691848754883, "global_step": 360052, "epoch": 2975} {"train_loss": -44.479915618896484, "global_step": 360053, "epoch": 2975} {"train_loss": -44.36892318725586, "global_step": 360054, "epoch": 2975} {"train_loss": -44.254241943359375, "global_step": 360055, "epoch": 2975} {"train_loss": -44.51197052001953, "global_step": 360056, "epoch": 2975} {"train_loss": -44.3095703125, "global_step": 360057, "epoch": 2975} {"train_loss": -44.584938049316406, "global_step": 360058, "epoch": 2975} {"train_loss": -44.788448333740234, "global_step": 360059, "epoch": 2975} {"train_loss": -44.502803802490234, "global_step": 360060, "epoch": 2975} {"train_loss": -45.317909240722656, "global_step": 360061, "epoch": 2975} {"train_loss": -45.320430755615234, "global_step": 360062, "epoch": 2975} {"train_loss": -44.652339935302734, "global_step": 360063, "epoch": 2975} {"train_loss": -44.657920837402344, "global_step": 360064, "epoch": 2975} {"train_loss": -44.64247131347656, "global_step": 360065, "epoch": 2975} {"train_loss": -44.76142501831055, "global_step": 360066, "epoch": 2975} {"train_loss": -45.045589447021484, "global_step": 360067, "epoch": 2975} {"train_loss": -45.03603744506836, "global_step": 360068, "epoch": 2975} {"train_loss": -45.06277084350586, "global_step": 360069, "epoch": 2975} {"train_loss": -45.1368522644043, "global_step": 360070, "epoch": 2975} {"train_loss": -44.87177658081055, "global_step": 360071, "epoch": 2975} {"train_loss": -45.496429443359375, "global_step": 360072, "epoch": 2975} {"train_loss": -45.134193420410156, "global_step": 360073, "epoch": 2975} {"train_loss": -45.4457893371582, "global_step": 360074, "epoch": 2975} {"train_loss": -45.08280563354492, "global_step": 360075, "epoch": 2975} {"train_loss": -45.77065658569336, "global_step": 360076, "epoch": 2975} {"train_loss": -44.456031799316406, "global_step": 360077, "epoch": 2975} {"train_loss": -45.584224700927734, "global_step": 360078, "epoch": 2975} {"train_loss": -45.20655059814453, "global_step": 360079, "epoch": 2975} {"train_loss": -45.29596710205078, "global_step": 360080, "epoch": 2975} {"train_loss": -45.461177825927734, "global_step": 360081, "epoch": 2975} {"train_loss": -45.16288375854492, "global_step": 360082, "epoch": 2975} {"train_loss": -45.19661331176758, "global_step": 360083, "epoch": 2975} {"train_loss": -45.28152847290039, "global_step": 360084, "epoch": 2975} {"train_loss": -45.800994873046875, "global_step": 360085, "epoch": 2975} {"train_loss": -45.51417922973633, "global_step": 360086, "epoch": 2975} {"train_loss": -45.665008544921875, "global_step": 360087, "epoch": 2975} {"train_loss": -45.62196350097656, "global_step": 360088, "epoch": 2975} {"train_loss": -45.223236083984375, "global_step": 360089, "epoch": 2975} {"train_loss": -45.67697525024414, "global_step": 360090, "epoch": 2975} {"train_loss": -45.21257019042969, "global_step": 360091, "epoch": 2975} {"train_loss": -45.02497482299805, "global_step": 360092, "epoch": 2975} {"train_loss": -45.397029876708984, "global_step": 360093, "epoch": 2975} {"train_loss": -46.140663146972656, "global_step": 360094, "epoch": 2975} {"train_loss": -43.422751781369044, "global_step": 360095, "epoch": 2975, "val_loss": 2458940.25} {"train_loss": -44.77635955810547, "global_step": 360096, "epoch": 2976} {"train_loss": -44.633113861083984, "global_step": 360097, "epoch": 2976} {"train_loss": -45.2531852722168, "global_step": 360098, "epoch": 2976} {"train_loss": -44.80695724487305, "global_step": 360099, "epoch": 2976} {"train_loss": -44.29335403442383, "global_step": 360100, "epoch": 2976} {"train_loss": -44.47296905517578, "global_step": 360101, "epoch": 2976} {"train_loss": -44.29506301879883, "global_step": 360102, "epoch": 2976} {"train_loss": -45.29055404663086, "global_step": 360103, "epoch": 2976} {"train_loss": -44.670494079589844, "global_step": 360104, "epoch": 2976} {"train_loss": -45.630062103271484, "global_step": 360105, "epoch": 2976} {"train_loss": -45.34563446044922, "global_step": 360106, "epoch": 2976} {"train_loss": -44.57103729248047, "global_step": 360107, "epoch": 2976} {"train_loss": -45.28074264526367, "global_step": 360108, "epoch": 2976} {"train_loss": -44.758968353271484, "global_step": 360109, "epoch": 2976} {"train_loss": -44.49940872192383, "global_step": 360110, "epoch": 2976} {"train_loss": -44.70709228515625, "global_step": 360111, "epoch": 2976} {"train_loss": -43.87746047973633, "global_step": 360112, "epoch": 2976} {"train_loss": -43.471981048583984, "global_step": 360113, "epoch": 2976} {"train_loss": -44.25532913208008, "global_step": 360114, "epoch": 2976} {"train_loss": -45.503944396972656, "global_step": 360115, "epoch": 2976} {"train_loss": -45.4948616027832, "global_step": 360116, "epoch": 2976} {"train_loss": -44.03902053833008, "global_step": 360117, "epoch": 2976} {"train_loss": -44.766693115234375, "global_step": 360118, "epoch": 2976} {"train_loss": -45.68623352050781, "global_step": 360119, "epoch": 2976} {"train_loss": -45.36852264404297, "global_step": 360120, "epoch": 2976} {"train_loss": -45.13331985473633, "global_step": 360121, "epoch": 2976} {"train_loss": -44.7745246887207, "global_step": 360122, "epoch": 2976} {"train_loss": -44.49177169799805, "global_step": 360123, "epoch": 2976} {"train_loss": -44.149505615234375, "global_step": 360124, "epoch": 2976} {"train_loss": -44.271217346191406, "global_step": 360125, "epoch": 2976} {"train_loss": -44.08218002319336, "global_step": 360126, "epoch": 2976} {"train_loss": -43.158477783203125, "global_step": 360127, "epoch": 2976} {"train_loss": -43.68227005004883, "global_step": 360128, "epoch": 2976} {"train_loss": -41.329429626464844, "global_step": 360129, "epoch": 2976} {"train_loss": -43.6627311706543, "global_step": 360130, "epoch": 2976} {"train_loss": -43.698822021484375, "global_step": 360131, "epoch": 2976} {"train_loss": -42.7002067565918, "global_step": 360132, "epoch": 2976} {"train_loss": -39.48142623901367, "global_step": 360133, "epoch": 2976} {"train_loss": -41.6370849609375, "global_step": 360134, "epoch": 2976} {"train_loss": -42.14243698120117, "global_step": 360135, "epoch": 2976} {"train_loss": -42.675331115722656, "global_step": 360136, "epoch": 2976} {"train_loss": -44.73903274536133, "global_step": 360137, "epoch": 2976} {"train_loss": -42.33979034423828, "global_step": 360138, "epoch": 2976} {"train_loss": -43.511600494384766, "global_step": 360139, "epoch": 2976} {"train_loss": -43.60171127319336, "global_step": 360140, "epoch": 2976} {"train_loss": -43.36215591430664, "global_step": 360141, "epoch": 2976} {"train_loss": -43.26356887817383, "global_step": 360142, "epoch": 2976} {"train_loss": -44.541683197021484, "global_step": 360143, "epoch": 2976} {"train_loss": -44.325042724609375, "global_step": 360144, "epoch": 2976} {"train_loss": -42.72796630859375, "global_step": 360145, "epoch": 2976} {"train_loss": -43.12041091918945, "global_step": 360146, "epoch": 2976} {"train_loss": -44.985626220703125, "global_step": 360147, "epoch": 2976} {"train_loss": -42.676109313964844, "global_step": 360148, "epoch": 2976} {"train_loss": -44.93682098388672, "global_step": 360149, "epoch": 2976} {"train_loss": -43.58075714111328, "global_step": 360150, "epoch": 2976} {"train_loss": -43.83692169189453, "global_step": 360151, "epoch": 2976} {"train_loss": -44.64276123046875, "global_step": 360152, "epoch": 2976} {"train_loss": -44.2574577331543, "global_step": 360153, "epoch": 2976} {"train_loss": -43.70293426513672, "global_step": 360154, "epoch": 2976} {"train_loss": -44.510650634765625, "global_step": 360155, "epoch": 2976} {"train_loss": -44.2709846496582, "global_step": 360156, "epoch": 2976} {"train_loss": -44.28554916381836, "global_step": 360157, "epoch": 2976} {"train_loss": -43.372276306152344, "global_step": 360158, "epoch": 2976} {"train_loss": -44.51007843017578, "global_step": 360159, "epoch": 2976} {"train_loss": -44.57748031616211, "global_step": 360160, "epoch": 2976} {"train_loss": -44.127925872802734, "global_step": 360161, "epoch": 2976} {"train_loss": -44.43134689331055, "global_step": 360162, "epoch": 2976} {"train_loss": -44.920894622802734, "global_step": 360163, "epoch": 2976} {"train_loss": -44.736427307128906, "global_step": 360164, "epoch": 2976} {"train_loss": -44.34489440917969, "global_step": 360165, "epoch": 2976} {"train_loss": -45.14286422729492, "global_step": 360166, "epoch": 2976} {"train_loss": -44.67070388793945, "global_step": 360167, "epoch": 2976} {"train_loss": -44.67057800292969, "global_step": 360168, "epoch": 2976} {"train_loss": -45.080501556396484, "global_step": 360169, "epoch": 2976} {"train_loss": -43.27498245239258, "global_step": 360170, "epoch": 2976} {"train_loss": -45.03535079956055, "global_step": 360171, "epoch": 2976} {"train_loss": -43.4853401184082, "global_step": 360172, "epoch": 2976} {"train_loss": -44.07322311401367, "global_step": 360173, "epoch": 2976} {"train_loss": -44.22384262084961, "global_step": 360174, "epoch": 2976} {"train_loss": -43.76189041137695, "global_step": 360175, "epoch": 2976} {"train_loss": -44.39118957519531, "global_step": 360176, "epoch": 2976} {"train_loss": -43.63825607299805, "global_step": 360177, "epoch": 2976} {"train_loss": -43.99225997924805, "global_step": 360178, "epoch": 2976} {"train_loss": -45.04901885986328, "global_step": 360179, "epoch": 2976} {"train_loss": -44.43953323364258, "global_step": 360180, "epoch": 2976} {"train_loss": -44.69916534423828, "global_step": 360181, "epoch": 2976} {"train_loss": -44.6740608215332, "global_step": 360182, "epoch": 2976} {"train_loss": -44.45968246459961, "global_step": 360183, "epoch": 2976} {"train_loss": -44.53681564331055, "global_step": 360184, "epoch": 2976} {"train_loss": -44.251441955566406, "global_step": 360185, "epoch": 2976} {"train_loss": -44.85479736328125, "global_step": 360186, "epoch": 2976} {"train_loss": -44.7652702331543, "global_step": 360187, "epoch": 2976} {"train_loss": -44.3865852355957, "global_step": 360188, "epoch": 2976} {"train_loss": -44.25999069213867, "global_step": 360189, "epoch": 2976} {"train_loss": -44.93095016479492, "global_step": 360190, "epoch": 2976} {"train_loss": -43.938140869140625, "global_step": 360191, "epoch": 2976} {"train_loss": -44.62716293334961, "global_step": 360192, "epoch": 2976} {"train_loss": -45.048614501953125, "global_step": 360193, "epoch": 2976} {"train_loss": -44.61527633666992, "global_step": 360194, "epoch": 2976} {"train_loss": -44.613582611083984, "global_step": 360195, "epoch": 2976} {"train_loss": -45.017112731933594, "global_step": 360196, "epoch": 2976} {"train_loss": -44.116172790527344, "global_step": 360197, "epoch": 2976} {"train_loss": -44.47860336303711, "global_step": 360198, "epoch": 2976} {"train_loss": -44.622314453125, "global_step": 360199, "epoch": 2976} {"train_loss": -44.3263053894043, "global_step": 360200, "epoch": 2976} {"train_loss": -44.810638427734375, "global_step": 360201, "epoch": 2976} {"train_loss": -44.4580192565918, "global_step": 360202, "epoch": 2976} {"train_loss": -44.78728103637695, "global_step": 360203, "epoch": 2976} {"train_loss": -45.36275100708008, "global_step": 360204, "epoch": 2976} {"train_loss": -45.01525115966797, "global_step": 360205, "epoch": 2976} {"train_loss": -45.053043365478516, "global_step": 360206, "epoch": 2976} {"train_loss": -45.288330078125, "global_step": 360207, "epoch": 2976} {"train_loss": -43.40512466430664, "global_step": 360208, "epoch": 2976} {"train_loss": -44.702362060546875, "global_step": 360209, "epoch": 2976} {"train_loss": -44.53980255126953, "global_step": 360210, "epoch": 2976} {"train_loss": -44.25593185424805, "global_step": 360211, "epoch": 2976} {"train_loss": -44.37084197998047, "global_step": 360212, "epoch": 2976} {"train_loss": -44.622047424316406, "global_step": 360213, "epoch": 2976} {"train_loss": -44.012306213378906, "global_step": 360214, "epoch": 2976} {"train_loss": -44.86674880981445, "global_step": 360215, "epoch": 2976} {"train_loss": -44.282216442518, "global_step": 360216, "epoch": 2976, "val_loss": 2448484.5} {"train_loss": -44.75122833251953, "global_step": 360217, "epoch": 2977} {"train_loss": -45.50404357910156, "global_step": 360218, "epoch": 2977} {"train_loss": -44.911277770996094, "global_step": 360219, "epoch": 2977} {"train_loss": -45.17124938964844, "global_step": 360220, "epoch": 2977} {"train_loss": -45.332679748535156, "global_step": 360221, "epoch": 2977} {"train_loss": -45.8264274597168, "global_step": 360222, "epoch": 2977} {"train_loss": -44.879478454589844, "global_step": 360223, "epoch": 2977} {"train_loss": -45.52716827392578, "global_step": 360224, "epoch": 2977} {"train_loss": -45.394264221191406, "global_step": 360225, "epoch": 2977} {"train_loss": -45.36592102050781, "global_step": 360226, "epoch": 2977} {"train_loss": -44.420867919921875, "global_step": 360227, "epoch": 2977} {"train_loss": -44.46360397338867, "global_step": 360228, "epoch": 2977} {"train_loss": -45.28573226928711, "global_step": 360229, "epoch": 2977} {"train_loss": -44.4138298034668, "global_step": 360230, "epoch": 2977} {"train_loss": -44.3131217956543, "global_step": 360231, "epoch": 2977} {"train_loss": -43.32728958129883, "global_step": 360232, "epoch": 2977} {"train_loss": -45.19050216674805, "global_step": 360233, "epoch": 2977} {"train_loss": -44.4536018371582, "global_step": 360234, "epoch": 2977} {"train_loss": -44.75300216674805, "global_step": 360235, "epoch": 2977} {"train_loss": -43.94308853149414, "global_step": 360236, "epoch": 2977} {"train_loss": -44.48148727416992, "global_step": 360237, "epoch": 2977} {"train_loss": -45.353328704833984, "global_step": 360238, "epoch": 2977} {"train_loss": -43.90260314941406, "global_step": 360239, "epoch": 2977} {"train_loss": -45.15822219848633, "global_step": 360240, "epoch": 2977} {"train_loss": -44.81046676635742, "global_step": 360241, "epoch": 2977} {"train_loss": -44.654815673828125, "global_step": 360242, "epoch": 2977} {"train_loss": -44.95737075805664, "global_step": 360243, "epoch": 2977} {"train_loss": -45.510040283203125, "global_step": 360244, "epoch": 2977} {"train_loss": -45.223121643066406, "global_step": 360245, "epoch": 2977} {"train_loss": -45.34893798828125, "global_step": 360246, "epoch": 2977} {"train_loss": -45.276737213134766, "global_step": 360247, "epoch": 2977} {"train_loss": -45.459869384765625, "global_step": 360248, "epoch": 2977} {"train_loss": -45.341976165771484, "global_step": 360249, "epoch": 2977} {"train_loss": -45.13889694213867, "global_step": 360250, "epoch": 2977} {"train_loss": -44.3898811340332, "global_step": 360251, "epoch": 2977} {"train_loss": -45.033058166503906, "global_step": 360252, "epoch": 2977} {"train_loss": -45.2005729675293, "global_step": 360253, "epoch": 2977} {"train_loss": -44.323150634765625, "global_step": 360254, "epoch": 2977} {"train_loss": -45.18470001220703, "global_step": 360255, "epoch": 2977} {"train_loss": -45.290061950683594, "global_step": 360256, "epoch": 2977} {"train_loss": -45.69892883300781, "global_step": 360257, "epoch": 2977} {"train_loss": -44.137001037597656, "global_step": 360258, "epoch": 2977} {"train_loss": -45.09040069580078, "global_step": 360259, "epoch": 2977} {"train_loss": -45.13718032836914, "global_step": 360260, "epoch": 2977} {"train_loss": -44.70125961303711, "global_step": 360261, "epoch": 2977} {"train_loss": -45.89436721801758, "global_step": 360262, "epoch": 2977} {"train_loss": -44.11103439331055, "global_step": 360263, "epoch": 2977} {"train_loss": -45.491641998291016, "global_step": 360264, "epoch": 2977} {"train_loss": -45.69220733642578, "global_step": 360265, "epoch": 2977} {"train_loss": -44.20441818237305, "global_step": 360266, "epoch": 2977} {"train_loss": -45.218048095703125, "global_step": 360267, "epoch": 2977} {"train_loss": -45.04215621948242, "global_step": 360268, "epoch": 2977} {"train_loss": -45.81039810180664, "global_step": 360269, "epoch": 2977} {"train_loss": -44.52096176147461, "global_step": 360270, "epoch": 2977} {"train_loss": -43.391876220703125, "global_step": 360271, "epoch": 2977} {"train_loss": -43.90283203125, "global_step": 360272, "epoch": 2977} {"train_loss": -44.861690521240234, "global_step": 360273, "epoch": 2977} {"train_loss": -45.007564544677734, "global_step": 360274, "epoch": 2977} {"train_loss": -44.76737594604492, "global_step": 360275, "epoch": 2977} {"train_loss": -45.01324462890625, "global_step": 360276, "epoch": 2977} {"train_loss": -45.653350830078125, "global_step": 360277, "epoch": 2977} {"train_loss": -44.215553283691406, "global_step": 360278, "epoch": 2977} {"train_loss": -42.498565673828125, "global_step": 360279, "epoch": 2977} {"train_loss": -45.33909225463867, "global_step": 360280, "epoch": 2977} {"train_loss": -43.14568328857422, "global_step": 360281, "epoch": 2977} {"train_loss": -38.40159225463867, "global_step": 360282, "epoch": 2977} {"train_loss": -43.945098876953125, "global_step": 360283, "epoch": 2977} {"train_loss": -39.36791229248047, "global_step": 360284, "epoch": 2977} {"train_loss": -44.03727722167969, "global_step": 360285, "epoch": 2977} {"train_loss": -41.40056610107422, "global_step": 360286, "epoch": 2977} {"train_loss": -40.20267105102539, "global_step": 360287, "epoch": 2977} {"train_loss": -44.11654281616211, "global_step": 360288, "epoch": 2977} {"train_loss": -40.82442855834961, "global_step": 360289, "epoch": 2977} {"train_loss": -43.54307174682617, "global_step": 360290, "epoch": 2977} {"train_loss": -40.03864669799805, "global_step": 360291, "epoch": 2977} {"train_loss": -43.11650466918945, "global_step": 360292, "epoch": 2977} {"train_loss": -42.2280158996582, "global_step": 360293, "epoch": 2977} {"train_loss": -40.45564651489258, "global_step": 360294, "epoch": 2977} {"train_loss": -42.46438217163086, "global_step": 360295, "epoch": 2977} {"train_loss": -39.395145416259766, "global_step": 360296, "epoch": 2977} {"train_loss": -42.7738037109375, "global_step": 360297, "epoch": 2977} {"train_loss": -36.871307373046875, "global_step": 360298, "epoch": 2977} {"train_loss": -39.02616500854492, "global_step": 360299, "epoch": 2977} {"train_loss": -41.99542999267578, "global_step": 360300, "epoch": 2977} {"train_loss": -38.67676544189453, "global_step": 360301, "epoch": 2977} {"train_loss": -42.58100509643555, "global_step": 360302, "epoch": 2977} {"train_loss": -38.764320373535156, "global_step": 360303, "epoch": 2977} {"train_loss": -42.22724151611328, "global_step": 360304, "epoch": 2977} {"train_loss": -41.147857666015625, "global_step": 360305, "epoch": 2977} {"train_loss": -39.756988525390625, "global_step": 360306, "epoch": 2977} {"train_loss": -38.70839309692383, "global_step": 360307, "epoch": 2977} {"train_loss": -40.39423751831055, "global_step": 360308, "epoch": 2977} {"train_loss": -40.908531188964844, "global_step": 360309, "epoch": 2977} {"train_loss": -40.500030517578125, "global_step": 360310, "epoch": 2977} {"train_loss": -42.16907501220703, "global_step": 360311, "epoch": 2977} {"train_loss": -40.76421356201172, "global_step": 360312, "epoch": 2977} {"train_loss": -42.79487228393555, "global_step": 360313, "epoch": 2977} {"train_loss": -41.77022171020508, "global_step": 360314, "epoch": 2977} {"train_loss": -42.469478607177734, "global_step": 360315, "epoch": 2977} {"train_loss": -43.07088088989258, "global_step": 360316, "epoch": 2977} {"train_loss": -42.709571838378906, "global_step": 360317, "epoch": 2977} {"train_loss": -43.71699905395508, "global_step": 360318, "epoch": 2977} {"train_loss": -42.223243713378906, "global_step": 360319, "epoch": 2977} {"train_loss": -41.9022331237793, "global_step": 360320, "epoch": 2977} {"train_loss": -43.18570327758789, "global_step": 360321, "epoch": 2977} {"train_loss": -43.56374740600586, "global_step": 360322, "epoch": 2977} {"train_loss": -42.43598556518555, "global_step": 360323, "epoch": 2977} {"train_loss": -44.240203857421875, "global_step": 360324, "epoch": 2977} {"train_loss": -43.066593170166016, "global_step": 360325, "epoch": 2977} {"train_loss": -43.63770294189453, "global_step": 360326, "epoch": 2977} {"train_loss": -43.81903076171875, "global_step": 360327, "epoch": 2977} {"train_loss": -44.03468704223633, "global_step": 360328, "epoch": 2977} {"train_loss": -44.295860290527344, "global_step": 360329, "epoch": 2977} {"train_loss": -44.312007904052734, "global_step": 360330, "epoch": 2977} {"train_loss": -44.2367057800293, "global_step": 360331, "epoch": 2977} {"train_loss": -44.74348449707031, "global_step": 360332, "epoch": 2977} {"train_loss": -44.474639892578125, "global_step": 360333, "epoch": 2977} {"train_loss": -44.85122299194336, "global_step": 360334, "epoch": 2977} {"train_loss": -44.03507614135742, "global_step": 360335, "epoch": 2977} {"train_loss": -44.39724349975586, "global_step": 360336, "epoch": 2977} {"train_loss": -43.593715037196134, "global_step": 360337, "epoch": 2977, "val_loss": 2459199.25} {"train_loss": -44.599708557128906, "global_step": 360338, "epoch": 2978} {"train_loss": -44.45282745361328, "global_step": 360339, "epoch": 2978} {"train_loss": -44.80234909057617, "global_step": 360340, "epoch": 2978} {"train_loss": -44.89102554321289, "global_step": 360341, "epoch": 2978} {"train_loss": -45.14132308959961, "global_step": 360342, "epoch": 2978} {"train_loss": -45.30037307739258, "global_step": 360343, "epoch": 2978} {"train_loss": -45.43157958984375, "global_step": 360344, "epoch": 2978} {"train_loss": -44.794429779052734, "global_step": 360345, "epoch": 2978} {"train_loss": -45.02134323120117, "global_step": 360346, "epoch": 2978} {"train_loss": -44.99932861328125, "global_step": 360347, "epoch": 2978} {"train_loss": -45.36282730102539, "global_step": 360348, "epoch": 2978} {"train_loss": -45.051631927490234, "global_step": 360349, "epoch": 2978} {"train_loss": -45.5716667175293, "global_step": 360350, "epoch": 2978} {"train_loss": -45.08710861206055, "global_step": 360351, "epoch": 2978} {"train_loss": -45.384613037109375, "global_step": 360352, "epoch": 2978} {"train_loss": -45.469757080078125, "global_step": 360353, "epoch": 2978} {"train_loss": -45.509639739990234, "global_step": 360354, "epoch": 2978} {"train_loss": -45.80881118774414, "global_step": 360355, "epoch": 2978} {"train_loss": -45.233150482177734, "global_step": 360356, "epoch": 2978} {"train_loss": -45.78171157836914, "global_step": 360357, "epoch": 2978} {"train_loss": -45.39093017578125, "global_step": 360358, "epoch": 2978} {"train_loss": -45.5280876159668, "global_step": 360359, "epoch": 2978} {"train_loss": -45.57481002807617, "global_step": 360360, "epoch": 2978} {"train_loss": -45.12730026245117, "global_step": 360361, "epoch": 2978} {"train_loss": -45.57090377807617, "global_step": 360362, "epoch": 2978} {"train_loss": -45.98348617553711, "global_step": 360363, "epoch": 2978} {"train_loss": -45.79512023925781, "global_step": 360364, "epoch": 2978} {"train_loss": -45.689388275146484, "global_step": 360365, "epoch": 2978} {"train_loss": -45.91827392578125, "global_step": 360366, "epoch": 2978} {"train_loss": -45.9464225769043, "global_step": 360367, "epoch": 2978} {"train_loss": -45.869686126708984, "global_step": 360368, "epoch": 2978} {"train_loss": -45.872650146484375, "global_step": 360369, "epoch": 2978} {"train_loss": -45.57752990722656, "global_step": 360370, "epoch": 2978} {"train_loss": -46.2739372253418, "global_step": 360371, "epoch": 2978} {"train_loss": -45.841033935546875, "global_step": 360372, "epoch": 2978} {"train_loss": -46.1140022277832, "global_step": 360373, "epoch": 2978} {"train_loss": -46.013545989990234, "global_step": 360374, "epoch": 2978} {"train_loss": -45.87120056152344, "global_step": 360375, "epoch": 2978} {"train_loss": -46.195125579833984, "global_step": 360376, "epoch": 2978} {"train_loss": -46.41823196411133, "global_step": 360377, "epoch": 2978} {"train_loss": -45.974483489990234, "global_step": 360378, "epoch": 2978} {"train_loss": -45.8409423828125, "global_step": 360379, "epoch": 2978} {"train_loss": -45.946651458740234, "global_step": 360380, "epoch": 2978} {"train_loss": -45.79203414916992, "global_step": 360381, "epoch": 2978} {"train_loss": -45.944210052490234, "global_step": 360382, "epoch": 2978} {"train_loss": -45.754493713378906, "global_step": 360383, "epoch": 2978} {"train_loss": -46.344818115234375, "global_step": 360384, "epoch": 2978} {"train_loss": -46.57365417480469, "global_step": 360385, "epoch": 2978} {"train_loss": -46.374183654785156, "global_step": 360386, "epoch": 2978} {"train_loss": -46.1583251953125, "global_step": 360387, "epoch": 2978} {"train_loss": -46.49740219116211, "global_step": 360388, "epoch": 2978} {"train_loss": -46.053226470947266, "global_step": 360389, "epoch": 2978} {"train_loss": -46.03749465942383, "global_step": 360390, "epoch": 2978} {"train_loss": -46.433650970458984, "global_step": 360391, "epoch": 2978} {"train_loss": -46.21630859375, "global_step": 360392, "epoch": 2978} {"train_loss": -45.78371810913086, "global_step": 360393, "epoch": 2978} {"train_loss": -45.447017669677734, "global_step": 360394, "epoch": 2978} {"train_loss": -45.175941467285156, "global_step": 360395, "epoch": 2978} {"train_loss": -44.16545867919922, "global_step": 360396, "epoch": 2978} {"train_loss": -43.62237548828125, "global_step": 360397, "epoch": 2978} {"train_loss": -44.514015197753906, "global_step": 360398, "epoch": 2978} {"train_loss": -45.73904037475586, "global_step": 360399, "epoch": 2978} {"train_loss": -45.23147201538086, "global_step": 360400, "epoch": 2978} {"train_loss": -43.20290756225586, "global_step": 360401, "epoch": 2978} {"train_loss": -39.0634880065918, "global_step": 360402, "epoch": 2978} {"train_loss": -41.12406921386719, "global_step": 360403, "epoch": 2978} {"train_loss": -42.938201904296875, "global_step": 360404, "epoch": 2978} {"train_loss": -40.76080322265625, "global_step": 360405, "epoch": 2978} {"train_loss": -43.82240295410156, "global_step": 360406, "epoch": 2978} {"train_loss": -41.6430778503418, "global_step": 360407, "epoch": 2978} {"train_loss": -44.9128532409668, "global_step": 360408, "epoch": 2978} {"train_loss": -43.22233200073242, "global_step": 360409, "epoch": 2978} {"train_loss": -43.18518829345703, "global_step": 360410, "epoch": 2978} {"train_loss": -44.59309005737305, "global_step": 360411, "epoch": 2978} {"train_loss": -44.05377197265625, "global_step": 360412, "epoch": 2978} {"train_loss": -43.1109733581543, "global_step": 360413, "epoch": 2978} {"train_loss": -44.55609130859375, "global_step": 360414, "epoch": 2978} {"train_loss": -41.86919021606445, "global_step": 360415, "epoch": 2978} {"train_loss": -44.59622573852539, "global_step": 360416, "epoch": 2978} {"train_loss": -43.74990463256836, "global_step": 360417, "epoch": 2978} {"train_loss": -41.335121154785156, "global_step": 360418, "epoch": 2978} {"train_loss": -43.247230529785156, "global_step": 360419, "epoch": 2978} {"train_loss": -42.39429473876953, "global_step": 360420, "epoch": 2978} {"train_loss": -43.99027633666992, "global_step": 360421, "epoch": 2978} {"train_loss": -44.3343620300293, "global_step": 360422, "epoch": 2978} {"train_loss": -43.040767669677734, "global_step": 360423, "epoch": 2978} {"train_loss": -44.4318962097168, "global_step": 360424, "epoch": 2978} {"train_loss": -43.554039001464844, "global_step": 360425, "epoch": 2978} {"train_loss": -42.74638748168945, "global_step": 360426, "epoch": 2978} {"train_loss": -44.55642318725586, "global_step": 360427, "epoch": 2978} {"train_loss": -44.15425491333008, "global_step": 360428, "epoch": 2978} {"train_loss": -43.95595932006836, "global_step": 360429, "epoch": 2978} {"train_loss": -44.40804672241211, "global_step": 360430, "epoch": 2978} {"train_loss": -42.92612838745117, "global_step": 360431, "epoch": 2978} {"train_loss": -42.0830192565918, "global_step": 360432, "epoch": 2978} {"train_loss": -45.2148551940918, "global_step": 360433, "epoch": 2978} {"train_loss": -43.44501495361328, "global_step": 360434, "epoch": 2978} {"train_loss": -43.29259490966797, "global_step": 360435, "epoch": 2978} {"train_loss": -44.30576705932617, "global_step": 360436, "epoch": 2978} {"train_loss": -41.588417053222656, "global_step": 360437, "epoch": 2978} {"train_loss": -44.91326904296875, "global_step": 360438, "epoch": 2978} {"train_loss": -43.860260009765625, "global_step": 360439, "epoch": 2978} {"train_loss": -43.21576690673828, "global_step": 360440, "epoch": 2978} {"train_loss": -43.9773063659668, "global_step": 360441, "epoch": 2978} {"train_loss": -43.46956253051758, "global_step": 360442, "epoch": 2978} {"train_loss": -44.63117599487305, "global_step": 360443, "epoch": 2978} {"train_loss": -43.93398666381836, "global_step": 360444, "epoch": 2978} {"train_loss": -44.53269577026367, "global_step": 360445, "epoch": 2978} {"train_loss": -44.03388977050781, "global_step": 360446, "epoch": 2978} {"train_loss": -45.018157958984375, "global_step": 360447, "epoch": 2978} {"train_loss": -44.0970573425293, "global_step": 360448, "epoch": 2978} {"train_loss": -44.79933166503906, "global_step": 360449, "epoch": 2978} {"train_loss": -45.184730529785156, "global_step": 360450, "epoch": 2978} {"train_loss": -44.46384811401367, "global_step": 360451, "epoch": 2978} {"train_loss": -44.88232421875, "global_step": 360452, "epoch": 2978} {"train_loss": -45.357112884521484, "global_step": 360453, "epoch": 2978} {"train_loss": -45.06836700439453, "global_step": 360454, "epoch": 2978} {"train_loss": -44.32876205444336, "global_step": 360455, "epoch": 2978} {"train_loss": -45.280338287353516, "global_step": 360456, "epoch": 2978} {"train_loss": -44.82655715942383, "global_step": 360457, "epoch": 2978} {"train_loss": -44.682550036217556, "global_step": 360458, "epoch": 2978, "val_loss": 2435090.75} {"train_loss": -44.05219268798828, "global_step": 360459, "epoch": 2979} {"train_loss": -44.92928695678711, "global_step": 360460, "epoch": 2979} {"train_loss": -45.31048583984375, "global_step": 360461, "epoch": 2979} {"train_loss": -45.7022819519043, "global_step": 360462, "epoch": 2979} {"train_loss": -45.43221664428711, "global_step": 360463, "epoch": 2979} {"train_loss": -45.28086471557617, "global_step": 360464, "epoch": 2979} {"train_loss": -45.379817962646484, "global_step": 360465, "epoch": 2979} {"train_loss": -45.71114730834961, "global_step": 360466, "epoch": 2979} {"train_loss": -46.00543975830078, "global_step": 360467, "epoch": 2979} {"train_loss": -45.69019317626953, "global_step": 360468, "epoch": 2979} {"train_loss": -45.61767578125, "global_step": 360469, "epoch": 2979} {"train_loss": -45.892967224121094, "global_step": 360470, "epoch": 2979} {"train_loss": -46.091060638427734, "global_step": 360471, "epoch": 2979} {"train_loss": -45.942832946777344, "global_step": 360472, "epoch": 2979} {"train_loss": -45.366485595703125, "global_step": 360473, "epoch": 2979} {"train_loss": -45.9356803894043, "global_step": 360474, "epoch": 2979} {"train_loss": -45.7934455871582, "global_step": 360475, "epoch": 2979} {"train_loss": -45.76420974731445, "global_step": 360476, "epoch": 2979} {"train_loss": -45.540283203125, "global_step": 360477, "epoch": 2979} {"train_loss": -45.69877243041992, "global_step": 360478, "epoch": 2979} {"train_loss": -45.88223648071289, "global_step": 360479, "epoch": 2979} {"train_loss": -45.92738723754883, "global_step": 360480, "epoch": 2979} {"train_loss": -45.80135726928711, "global_step": 360481, "epoch": 2979} {"train_loss": -45.838104248046875, "global_step": 360482, "epoch": 2979} {"train_loss": -45.805145263671875, "global_step": 360483, "epoch": 2979} {"train_loss": -45.937435150146484, "global_step": 360484, "epoch": 2979} {"train_loss": -46.0067024230957, "global_step": 360485, "epoch": 2979} {"train_loss": -45.72681427001953, "global_step": 360486, "epoch": 2979} {"train_loss": -46.46995162963867, "global_step": 360487, "epoch": 2979} {"train_loss": -45.811729431152344, "global_step": 360488, "epoch": 2979} {"train_loss": -45.056575775146484, "global_step": 360489, "epoch": 2979} {"train_loss": -44.673397064208984, "global_step": 360490, "epoch": 2979} {"train_loss": -43.46388626098633, "global_step": 360491, "epoch": 2979} {"train_loss": -41.20217514038086, "global_step": 360492, "epoch": 2979} {"train_loss": -41.47095489501953, "global_step": 360493, "epoch": 2979} {"train_loss": -44.829620361328125, "global_step": 360494, "epoch": 2979} {"train_loss": -43.741580963134766, "global_step": 360495, "epoch": 2979} {"train_loss": -44.72209548950195, "global_step": 360496, "epoch": 2979} {"train_loss": -45.580074310302734, "global_step": 360497, "epoch": 2979} {"train_loss": -43.05916213989258, "global_step": 360498, "epoch": 2979} {"train_loss": -39.87908935546875, "global_step": 360499, "epoch": 2979} {"train_loss": -45.3586311340332, "global_step": 360500, "epoch": 2979} {"train_loss": -44.66447830200195, "global_step": 360501, "epoch": 2979} {"train_loss": -42.08450698852539, "global_step": 360502, "epoch": 2979} {"train_loss": -44.07122802734375, "global_step": 360503, "epoch": 2979} {"train_loss": -44.78418731689453, "global_step": 360504, "epoch": 2979} {"train_loss": -44.73842239379883, "global_step": 360505, "epoch": 2979} {"train_loss": -44.29838943481445, "global_step": 360506, "epoch": 2979} {"train_loss": -43.1802978515625, "global_step": 360507, "epoch": 2979} {"train_loss": -43.83758544921875, "global_step": 360508, "epoch": 2979} {"train_loss": -44.83266830444336, "global_step": 360509, "epoch": 2979} {"train_loss": -44.03413009643555, "global_step": 360510, "epoch": 2979} {"train_loss": -44.14815139770508, "global_step": 360511, "epoch": 2979} {"train_loss": -43.59328842163086, "global_step": 360512, "epoch": 2979} {"train_loss": -44.67608642578125, "global_step": 360513, "epoch": 2979} {"train_loss": -44.98360824584961, "global_step": 360514, "epoch": 2979} {"train_loss": -43.06850814819336, "global_step": 360515, "epoch": 2979} {"train_loss": -43.72908401489258, "global_step": 360516, "epoch": 2979} {"train_loss": -44.944984436035156, "global_step": 360517, "epoch": 2979} {"train_loss": -44.29854202270508, "global_step": 360518, "epoch": 2979} {"train_loss": -45.11149978637695, "global_step": 360519, "epoch": 2979} {"train_loss": -45.151432037353516, "global_step": 360520, "epoch": 2979} {"train_loss": -45.00063705444336, "global_step": 360521, "epoch": 2979} {"train_loss": -45.641761779785156, "global_step": 360522, "epoch": 2979} {"train_loss": -45.224449157714844, "global_step": 360523, "epoch": 2979} {"train_loss": -44.21099090576172, "global_step": 360524, "epoch": 2979} {"train_loss": -45.28679275512695, "global_step": 360525, "epoch": 2979} {"train_loss": -44.762718200683594, "global_step": 360526, "epoch": 2979} {"train_loss": -45.513362884521484, "global_step": 360527, "epoch": 2979} {"train_loss": -44.671451568603516, "global_step": 360528, "epoch": 2979} {"train_loss": -44.219661712646484, "global_step": 360529, "epoch": 2979} {"train_loss": -45.09272384643555, "global_step": 360530, "epoch": 2979} {"train_loss": -44.8748893737793, "global_step": 360531, "epoch": 2979} {"train_loss": -44.71277618408203, "global_step": 360532, "epoch": 2979} {"train_loss": -44.11016082763672, "global_step": 360533, "epoch": 2979} {"train_loss": -45.51737976074219, "global_step": 360534, "epoch": 2979} {"train_loss": -45.099788665771484, "global_step": 360535, "epoch": 2979} {"train_loss": -44.42409896850586, "global_step": 360536, "epoch": 2979} {"train_loss": -45.32683563232422, "global_step": 360537, "epoch": 2979} {"train_loss": -43.62948226928711, "global_step": 360538, "epoch": 2979} {"train_loss": -44.28019332885742, "global_step": 360539, "epoch": 2979} {"train_loss": -42.84198760986328, "global_step": 360540, "epoch": 2979} {"train_loss": -44.0499153137207, "global_step": 360541, "epoch": 2979} {"train_loss": -44.497920989990234, "global_step": 360542, "epoch": 2979} {"train_loss": -44.977596282958984, "global_step": 360543, "epoch": 2979} {"train_loss": -44.563716888427734, "global_step": 360544, "epoch": 2979} {"train_loss": -45.37127685546875, "global_step": 360545, "epoch": 2979} {"train_loss": -41.84772872924805, "global_step": 360546, "epoch": 2979} {"train_loss": -45.02457809448242, "global_step": 360547, "epoch": 2979} {"train_loss": -45.02337646484375, "global_step": 360548, "epoch": 2979} {"train_loss": -44.67017364501953, "global_step": 360549, "epoch": 2979} {"train_loss": -43.05704879760742, "global_step": 360550, "epoch": 2979} {"train_loss": -45.24807357788086, "global_step": 360551, "epoch": 2979} {"train_loss": -44.32526779174805, "global_step": 360552, "epoch": 2979} {"train_loss": -43.034664154052734, "global_step": 360553, "epoch": 2979} {"train_loss": -45.81435012817383, "global_step": 360554, "epoch": 2979} {"train_loss": -43.40719985961914, "global_step": 360555, "epoch": 2979} {"train_loss": -42.07109451293945, "global_step": 360556, "epoch": 2979} {"train_loss": -44.83905029296875, "global_step": 360557, "epoch": 2979} {"train_loss": -42.31242370605469, "global_step": 360558, "epoch": 2979} {"train_loss": -44.7475700378418, "global_step": 360559, "epoch": 2979} {"train_loss": -41.6368408203125, "global_step": 360560, "epoch": 2979} {"train_loss": -42.37096405029297, "global_step": 360561, "epoch": 2979} {"train_loss": -43.6848030090332, "global_step": 360562, "epoch": 2979} {"train_loss": -43.276790618896484, "global_step": 360563, "epoch": 2979} {"train_loss": -44.39030075073242, "global_step": 360564, "epoch": 2979} {"train_loss": -45.60142135620117, "global_step": 360565, "epoch": 2979} {"train_loss": -44.65895462036133, "global_step": 360566, "epoch": 2979} {"train_loss": -42.557716369628906, "global_step": 360567, "epoch": 2979} {"train_loss": -42.9347038269043, "global_step": 360568, "epoch": 2979} {"train_loss": -44.5787467956543, "global_step": 360569, "epoch": 2979} {"train_loss": -45.15961456298828, "global_step": 360570, "epoch": 2979} {"train_loss": -44.882041931152344, "global_step": 360571, "epoch": 2979} {"train_loss": -44.86027908325195, "global_step": 360572, "epoch": 2979} {"train_loss": -44.184078216552734, "global_step": 360573, "epoch": 2979} {"train_loss": -41.40690994262695, "global_step": 360574, "epoch": 2979} {"train_loss": -45.20743942260742, "global_step": 360575, "epoch": 2979} {"train_loss": -45.08197784423828, "global_step": 360576, "epoch": 2979} {"train_loss": -44.05290985107422, "global_step": 360577, "epoch": 2979} {"train_loss": -44.940731048583984, "global_step": 360578, "epoch": 2979} {"train_loss": -44.559047257604675, "global_step": 360579, "epoch": 2979, "val_loss": 2513675.25} {"train_loss": -44.54926300048828, "global_step": 360580, "epoch": 2980} {"train_loss": -45.15204620361328, "global_step": 360581, "epoch": 2980} {"train_loss": -45.30628204345703, "global_step": 360582, "epoch": 2980} {"train_loss": -45.671905517578125, "global_step": 360583, "epoch": 2980} {"train_loss": -45.58220672607422, "global_step": 360584, "epoch": 2980} {"train_loss": -45.64695358276367, "global_step": 360585, "epoch": 2980} {"train_loss": -44.66630172729492, "global_step": 360586, "epoch": 2980} {"train_loss": -45.22713088989258, "global_step": 360587, "epoch": 2980} {"train_loss": -42.39216232299805, "global_step": 360588, "epoch": 2980} {"train_loss": -45.273773193359375, "global_step": 360589, "epoch": 2980} {"train_loss": -45.132354736328125, "global_step": 360590, "epoch": 2980} {"train_loss": -42.82732391357422, "global_step": 360591, "epoch": 2980} {"train_loss": -44.50442886352539, "global_step": 360592, "epoch": 2980} {"train_loss": -45.37985610961914, "global_step": 360593, "epoch": 2980} {"train_loss": -45.43830108642578, "global_step": 360594, "epoch": 2980} {"train_loss": -43.757667541503906, "global_step": 360595, "epoch": 2980} {"train_loss": -44.936946868896484, "global_step": 360596, "epoch": 2980} {"train_loss": -45.8958625793457, "global_step": 360597, "epoch": 2980} {"train_loss": -44.63727951049805, "global_step": 360598, "epoch": 2980} {"train_loss": -44.239898681640625, "global_step": 360599, "epoch": 2980} {"train_loss": -45.40613555908203, "global_step": 360600, "epoch": 2980} {"train_loss": -44.686641693115234, "global_step": 360601, "epoch": 2980} {"train_loss": -44.970130920410156, "global_step": 360602, "epoch": 2980} {"train_loss": -44.0847282409668, "global_step": 360603, "epoch": 2980} {"train_loss": -44.03899002075195, "global_step": 360604, "epoch": 2980} {"train_loss": -43.244014739990234, "global_step": 360605, "epoch": 2980} {"train_loss": -44.360774993896484, "global_step": 360606, "epoch": 2980} {"train_loss": -44.47736358642578, "global_step": 360607, "epoch": 2980} {"train_loss": -45.54230499267578, "global_step": 360608, "epoch": 2980} {"train_loss": -44.62224197387695, "global_step": 360609, "epoch": 2980} {"train_loss": -43.670143127441406, "global_step": 360610, "epoch": 2980} {"train_loss": -44.1634407043457, "global_step": 360611, "epoch": 2980} {"train_loss": -44.8230094909668, "global_step": 360612, "epoch": 2980} {"train_loss": -44.438262939453125, "global_step": 360613, "epoch": 2980} {"train_loss": -45.07693099975586, "global_step": 360614, "epoch": 2980} {"train_loss": -44.82863998413086, "global_step": 360615, "epoch": 2980} {"train_loss": -43.355987548828125, "global_step": 360616, "epoch": 2980} {"train_loss": -43.11438751220703, "global_step": 360617, "epoch": 2980} {"train_loss": -44.22492599487305, "global_step": 360618, "epoch": 2980} {"train_loss": -44.20783233642578, "global_step": 360619, "epoch": 2980} {"train_loss": -43.5206413269043, "global_step": 360620, "epoch": 2980} {"train_loss": -44.43232345581055, "global_step": 360621, "epoch": 2980} {"train_loss": -44.38112258911133, "global_step": 360622, "epoch": 2980} {"train_loss": -42.381805419921875, "global_step": 360623, "epoch": 2980} {"train_loss": -43.88972091674805, "global_step": 360624, "epoch": 2980} {"train_loss": -44.52732467651367, "global_step": 360625, "epoch": 2980} {"train_loss": -42.8414192199707, "global_step": 360626, "epoch": 2980} {"train_loss": -45.292659759521484, "global_step": 360627, "epoch": 2980} {"train_loss": -42.56432342529297, "global_step": 360628, "epoch": 2980} {"train_loss": -44.50968551635742, "global_step": 360629, "epoch": 2980} {"train_loss": -44.01515579223633, "global_step": 360630, "epoch": 2980} {"train_loss": -43.59965515136719, "global_step": 360631, "epoch": 2980} {"train_loss": -44.49213790893555, "global_step": 360632, "epoch": 2980} {"train_loss": -43.81381607055664, "global_step": 360633, "epoch": 2980} {"train_loss": -44.753658294677734, "global_step": 360634, "epoch": 2980} {"train_loss": -42.861305236816406, "global_step": 360635, "epoch": 2980} {"train_loss": -39.03327560424805, "global_step": 360636, "epoch": 2980} {"train_loss": -43.33576202392578, "global_step": 360637, "epoch": 2980} {"train_loss": -44.69625473022461, "global_step": 360638, "epoch": 2980} {"train_loss": -43.66265106201172, "global_step": 360639, "epoch": 2980} {"train_loss": -43.47650909423828, "global_step": 360640, "epoch": 2980} {"train_loss": -43.72727584838867, "global_step": 360641, "epoch": 2980} {"train_loss": -44.04512023925781, "global_step": 360642, "epoch": 2980} {"train_loss": -43.50483322143555, "global_step": 360643, "epoch": 2980} {"train_loss": -41.654083251953125, "global_step": 360644, "epoch": 2980} {"train_loss": -43.10775375366211, "global_step": 360645, "epoch": 2980} {"train_loss": -44.67837142944336, "global_step": 360646, "epoch": 2980} {"train_loss": -41.65747833251953, "global_step": 360647, "epoch": 2980} {"train_loss": -43.15745162963867, "global_step": 360648, "epoch": 2980} {"train_loss": -43.03192901611328, "global_step": 360649, "epoch": 2980} {"train_loss": -44.5643424987793, "global_step": 360650, "epoch": 2980} {"train_loss": -44.66688919067383, "global_step": 360651, "epoch": 2980} {"train_loss": -43.23395919799805, "global_step": 360652, "epoch": 2980} {"train_loss": -44.2477912902832, "global_step": 360653, "epoch": 2980} {"train_loss": -43.15773391723633, "global_step": 360654, "epoch": 2980} {"train_loss": -43.5552978515625, "global_step": 360655, "epoch": 2980} {"train_loss": -44.17743682861328, "global_step": 360656, "epoch": 2980} {"train_loss": -40.9418830871582, "global_step": 360657, "epoch": 2980} {"train_loss": -43.59040451049805, "global_step": 360658, "epoch": 2980} {"train_loss": -42.894020080566406, "global_step": 360659, "epoch": 2980} {"train_loss": -44.11649703979492, "global_step": 360660, "epoch": 2980} {"train_loss": -43.625892639160156, "global_step": 360661, "epoch": 2980} {"train_loss": -43.91865158081055, "global_step": 360662, "epoch": 2980} {"train_loss": -44.2666130065918, "global_step": 360663, "epoch": 2980} {"train_loss": -42.5645866394043, "global_step": 360664, "epoch": 2980} {"train_loss": -44.32084655761719, "global_step": 360665, "epoch": 2980} {"train_loss": -42.74416732788086, "global_step": 360666, "epoch": 2980} {"train_loss": -43.71371078491211, "global_step": 360667, "epoch": 2980} {"train_loss": -44.53506088256836, "global_step": 360668, "epoch": 2980} {"train_loss": -40.94466781616211, "global_step": 360669, "epoch": 2980} {"train_loss": -44.251007080078125, "global_step": 360670, "epoch": 2980} {"train_loss": -42.157379150390625, "global_step": 360671, "epoch": 2980} {"train_loss": -41.298274993896484, "global_step": 360672, "epoch": 2980} {"train_loss": -42.930171966552734, "global_step": 360673, "epoch": 2980} {"train_loss": -43.823150634765625, "global_step": 360674, "epoch": 2980} {"train_loss": -44.15993118286133, "global_step": 360675, "epoch": 2980} {"train_loss": -43.461910247802734, "global_step": 360676, "epoch": 2980} {"train_loss": -44.4021110534668, "global_step": 360677, "epoch": 2980} {"train_loss": -44.76161575317383, "global_step": 360678, "epoch": 2980} {"train_loss": -43.71834945678711, "global_step": 360679, "epoch": 2980} {"train_loss": -44.031585693359375, "global_step": 360680, "epoch": 2980} {"train_loss": -44.74732208251953, "global_step": 360681, "epoch": 2980} {"train_loss": -45.12960433959961, "global_step": 360682, "epoch": 2980} {"train_loss": -44.99014663696289, "global_step": 360683, "epoch": 2980} {"train_loss": -44.794158935546875, "global_step": 360684, "epoch": 2980} {"train_loss": -44.942935943603516, "global_step": 360685, "epoch": 2980} {"train_loss": -44.66685104370117, "global_step": 360686, "epoch": 2980} {"train_loss": -44.651214599609375, "global_step": 360687, "epoch": 2980} {"train_loss": -44.571414947509766, "global_step": 360688, "epoch": 2980} {"train_loss": -45.10908889770508, "global_step": 360689, "epoch": 2980} {"train_loss": -44.7314453125, "global_step": 360690, "epoch": 2980} {"train_loss": -44.92469024658203, "global_step": 360691, "epoch": 2980} {"train_loss": -44.9296875, "global_step": 360692, "epoch": 2980} {"train_loss": -44.686214447021484, "global_step": 360693, "epoch": 2980} {"train_loss": -45.129669189453125, "global_step": 360694, "epoch": 2980} {"train_loss": -44.536136627197266, "global_step": 360695, "epoch": 2980} {"train_loss": -45.15259552001953, "global_step": 360696, "epoch": 2980} {"train_loss": -45.28789520263672, "global_step": 360697, "epoch": 2980} {"train_loss": -45.290157318115234, "global_step": 360698, "epoch": 2980} {"train_loss": -44.908958435058594, "global_step": 360699, "epoch": 2980} {"train_loss": -44.09471792425991, "global_step": 360700, "epoch": 2980, "val_loss": 2443330.75} {"train_loss": -45.20223617553711, "global_step": 360701, "epoch": 2981} {"train_loss": -45.866634368896484, "global_step": 360702, "epoch": 2981} {"train_loss": -45.62788009643555, "global_step": 360703, "epoch": 2981} {"train_loss": -45.23092269897461, "global_step": 360704, "epoch": 2981} {"train_loss": -45.53273391723633, "global_step": 360705, "epoch": 2981} {"train_loss": -45.21479415893555, "global_step": 360706, "epoch": 2981} {"train_loss": -45.320518493652344, "global_step": 360707, "epoch": 2981} {"train_loss": -44.119041442871094, "global_step": 360708, "epoch": 2981} {"train_loss": -43.84185028076172, "global_step": 360709, "epoch": 2981} {"train_loss": -44.445579528808594, "global_step": 360710, "epoch": 2981} {"train_loss": -43.8233642578125, "global_step": 360711, "epoch": 2981} {"train_loss": -44.525943756103516, "global_step": 360712, "epoch": 2981} {"train_loss": -45.04091262817383, "global_step": 360713, "epoch": 2981} {"train_loss": -43.072696685791016, "global_step": 360714, "epoch": 2981} {"train_loss": -44.92277145385742, "global_step": 360715, "epoch": 2981} {"train_loss": -45.46516799926758, "global_step": 360716, "epoch": 2981} {"train_loss": -45.536251068115234, "global_step": 360717, "epoch": 2981} {"train_loss": -44.93426513671875, "global_step": 360718, "epoch": 2981} {"train_loss": -44.56132507324219, "global_step": 360719, "epoch": 2981} {"train_loss": -45.308349609375, "global_step": 360720, "epoch": 2981} {"train_loss": -44.5067024230957, "global_step": 360721, "epoch": 2981} {"train_loss": -45.3363151550293, "global_step": 360722, "epoch": 2981} {"train_loss": -44.65602493286133, "global_step": 360723, "epoch": 2981} {"train_loss": -44.783634185791016, "global_step": 360724, "epoch": 2981} {"train_loss": -44.34806442260742, "global_step": 360725, "epoch": 2981} {"train_loss": -43.16438293457031, "global_step": 360726, "epoch": 2981} {"train_loss": -43.90223693847656, "global_step": 360727, "epoch": 2981} {"train_loss": -45.6778564453125, "global_step": 360728, "epoch": 2981} {"train_loss": -45.3774299621582, "global_step": 360729, "epoch": 2981} {"train_loss": -45.892677307128906, "global_step": 360730, "epoch": 2981} {"train_loss": -45.457725524902344, "global_step": 360731, "epoch": 2981} {"train_loss": -45.698883056640625, "global_step": 360732, "epoch": 2981} {"train_loss": -43.8218994140625, "global_step": 360733, "epoch": 2981} {"train_loss": -42.075904846191406, "global_step": 360734, "epoch": 2981} {"train_loss": -41.25230026245117, "global_step": 360735, "epoch": 2981} {"train_loss": -43.65184783935547, "global_step": 360736, "epoch": 2981} {"train_loss": -44.241607666015625, "global_step": 360737, "epoch": 2981} {"train_loss": -41.96073532104492, "global_step": 360738, "epoch": 2981} {"train_loss": -42.789913177490234, "global_step": 360739, "epoch": 2981} {"train_loss": -42.18980026245117, "global_step": 360740, "epoch": 2981} {"train_loss": -44.57353210449219, "global_step": 360741, "epoch": 2981} {"train_loss": -45.02650833129883, "global_step": 360742, "epoch": 2981} {"train_loss": -45.115718841552734, "global_step": 360743, "epoch": 2981} {"train_loss": -43.853519439697266, "global_step": 360744, "epoch": 2981} {"train_loss": -44.983558654785156, "global_step": 360745, "epoch": 2981} {"train_loss": -44.726165771484375, "global_step": 360746, "epoch": 2981} {"train_loss": -43.89426040649414, "global_step": 360747, "epoch": 2981} {"train_loss": -43.4746208190918, "global_step": 360748, "epoch": 2981} {"train_loss": -44.84939193725586, "global_step": 360749, "epoch": 2981} {"train_loss": -44.95637130737305, "global_step": 360750, "epoch": 2981} {"train_loss": -43.921993255615234, "global_step": 360751, "epoch": 2981} {"train_loss": -44.23563766479492, "global_step": 360752, "epoch": 2981} {"train_loss": -44.1676139831543, "global_step": 360753, "epoch": 2981} {"train_loss": -43.58642578125, "global_step": 360754, "epoch": 2981} {"train_loss": -43.15775680541992, "global_step": 360755, "epoch": 2981} {"train_loss": -41.93014144897461, "global_step": 360756, "epoch": 2981} {"train_loss": -43.882598876953125, "global_step": 360757, "epoch": 2981} {"train_loss": -44.445743560791016, "global_step": 360758, "epoch": 2981} {"train_loss": -43.65003204345703, "global_step": 360759, "epoch": 2981} {"train_loss": -42.848758697509766, "global_step": 360760, "epoch": 2981} {"train_loss": -44.56132507324219, "global_step": 360761, "epoch": 2981} {"train_loss": -42.146114349365234, "global_step": 360762, "epoch": 2981} {"train_loss": -43.95542526245117, "global_step": 360763, "epoch": 2981} {"train_loss": -44.23933792114258, "global_step": 360764, "epoch": 2981} {"train_loss": -42.74805450439453, "global_step": 360765, "epoch": 2981} {"train_loss": -42.10709762573242, "global_step": 360766, "epoch": 2981} {"train_loss": -43.72111129760742, "global_step": 360767, "epoch": 2981} {"train_loss": -41.100425720214844, "global_step": 360768, "epoch": 2981} {"train_loss": -43.32233810424805, "global_step": 360769, "epoch": 2981} {"train_loss": -40.8989372253418, "global_step": 360770, "epoch": 2981} {"train_loss": -43.60185623168945, "global_step": 360771, "epoch": 2981} {"train_loss": -41.202205657958984, "global_step": 360772, "epoch": 2981} {"train_loss": -44.09829330444336, "global_step": 360773, "epoch": 2981} {"train_loss": -41.8591194152832, "global_step": 360774, "epoch": 2981} {"train_loss": -43.295040130615234, "global_step": 360775, "epoch": 2981} {"train_loss": -43.476314544677734, "global_step": 360776, "epoch": 2981} {"train_loss": -43.31897735595703, "global_step": 360777, "epoch": 2981} {"train_loss": -44.2288932800293, "global_step": 360778, "epoch": 2981} {"train_loss": -43.847293853759766, "global_step": 360779, "epoch": 2981} {"train_loss": -43.46631622314453, "global_step": 360780, "epoch": 2981} {"train_loss": -43.13002014160156, "global_step": 360781, "epoch": 2981} {"train_loss": -43.76969528198242, "global_step": 360782, "epoch": 2981} {"train_loss": -44.357479095458984, "global_step": 360783, "epoch": 2981} {"train_loss": -43.77190399169922, "global_step": 360784, "epoch": 2981} {"train_loss": -44.412994384765625, "global_step": 360785, "epoch": 2981} {"train_loss": -43.901611328125, "global_step": 360786, "epoch": 2981} {"train_loss": -44.2989616394043, "global_step": 360787, "epoch": 2981} {"train_loss": -44.68559646606445, "global_step": 360788, "epoch": 2981} {"train_loss": -44.37190246582031, "global_step": 360789, "epoch": 2981} {"train_loss": -45.300758361816406, "global_step": 360790, "epoch": 2981} {"train_loss": -44.283287048339844, "global_step": 360791, "epoch": 2981} {"train_loss": -45.2496337890625, "global_step": 360792, "epoch": 2981} {"train_loss": -44.74349594116211, "global_step": 360793, "epoch": 2981} {"train_loss": -45.08781814575195, "global_step": 360794, "epoch": 2981} {"train_loss": -45.098941802978516, "global_step": 360795, "epoch": 2981} {"train_loss": -45.19307327270508, "global_step": 360796, "epoch": 2981} {"train_loss": -45.41969680786133, "global_step": 360797, "epoch": 2981} {"train_loss": -45.30178451538086, "global_step": 360798, "epoch": 2981} {"train_loss": -45.62866973876953, "global_step": 360799, "epoch": 2981} {"train_loss": -44.73263168334961, "global_step": 360800, "epoch": 2981} {"train_loss": -45.33656311035156, "global_step": 360801, "epoch": 2981} {"train_loss": -45.351688385009766, "global_step": 360802, "epoch": 2981} {"train_loss": -45.0076789855957, "global_step": 360803, "epoch": 2981} {"train_loss": -45.007991790771484, "global_step": 360804, "epoch": 2981} {"train_loss": -45.46041488647461, "global_step": 360805, "epoch": 2981} {"train_loss": -45.54203414916992, "global_step": 360806, "epoch": 2981} {"train_loss": -45.603694915771484, "global_step": 360807, "epoch": 2981} {"train_loss": -45.71671676635742, "global_step": 360808, "epoch": 2981} {"train_loss": -46.06549072265625, "global_step": 360809, "epoch": 2981} {"train_loss": -45.77511978149414, "global_step": 360810, "epoch": 2981} {"train_loss": -45.81976318359375, "global_step": 360811, "epoch": 2981} {"train_loss": -45.74274444580078, "global_step": 360812, "epoch": 2981} {"train_loss": -45.60628890991211, "global_step": 360813, "epoch": 2981} {"train_loss": -45.7801513671875, "global_step": 360814, "epoch": 2981} {"train_loss": -45.91367721557617, "global_step": 360815, "epoch": 2981} {"train_loss": -44.45646286010742, "global_step": 360816, "epoch": 2981} {"train_loss": -45.85688400268555, "global_step": 360817, "epoch": 2981} {"train_loss": -45.603790283203125, "global_step": 360818, "epoch": 2981} {"train_loss": -45.8596076965332, "global_step": 360819, "epoch": 2981} {"train_loss": -46.0128288269043, "global_step": 360820, "epoch": 2981} {"train_loss": -44.38823413060717, "global_step": 360821, "epoch": 2981, "val_loss": 2383314.75} {"train_loss": -46.081695556640625, "global_step": 360822, "epoch": 2982} {"train_loss": -45.9356803894043, "global_step": 360823, "epoch": 2982} {"train_loss": -45.85830307006836, "global_step": 360824, "epoch": 2982} {"train_loss": -46.28926467895508, "global_step": 360825, "epoch": 2982} {"train_loss": -45.847774505615234, "global_step": 360826, "epoch": 2982} {"train_loss": -46.302154541015625, "global_step": 360827, "epoch": 2982} {"train_loss": -46.48160934448242, "global_step": 360828, "epoch": 2982} {"train_loss": -45.76066970825195, "global_step": 360829, "epoch": 2982} {"train_loss": -45.84547805786133, "global_step": 360830, "epoch": 2982} {"train_loss": -45.54035949707031, "global_step": 360831, "epoch": 2982} {"train_loss": -46.14406204223633, "global_step": 360832, "epoch": 2982} {"train_loss": -45.4619026184082, "global_step": 360833, "epoch": 2982} {"train_loss": -45.78252029418945, "global_step": 360834, "epoch": 2982} {"train_loss": -45.575355529785156, "global_step": 360835, "epoch": 2982} {"train_loss": -45.30942916870117, "global_step": 360836, "epoch": 2982} {"train_loss": -45.789154052734375, "global_step": 360837, "epoch": 2982} {"train_loss": -46.233394622802734, "global_step": 360838, "epoch": 2982} {"train_loss": -44.75639724731445, "global_step": 360839, "epoch": 2982} {"train_loss": -45.61502456665039, "global_step": 360840, "epoch": 2982} {"train_loss": -45.592491149902344, "global_step": 360841, "epoch": 2982} {"train_loss": -44.24465560913086, "global_step": 360842, "epoch": 2982} {"train_loss": -43.786617279052734, "global_step": 360843, "epoch": 2982} {"train_loss": -43.93314743041992, "global_step": 360844, "epoch": 2982} {"train_loss": -44.941829681396484, "global_step": 360845, "epoch": 2982} {"train_loss": -44.47224807739258, "global_step": 360846, "epoch": 2982} {"train_loss": -44.70707321166992, "global_step": 360847, "epoch": 2982} {"train_loss": -45.41168212890625, "global_step": 360848, "epoch": 2982} {"train_loss": -46.02791213989258, "global_step": 360849, "epoch": 2982} {"train_loss": -45.44081115722656, "global_step": 360850, "epoch": 2982} {"train_loss": -46.36277389526367, "global_step": 360851, "epoch": 2982} {"train_loss": -44.155494689941406, "global_step": 360852, "epoch": 2982} {"train_loss": -43.924861907958984, "global_step": 360853, "epoch": 2982} {"train_loss": -44.6119499206543, "global_step": 360854, "epoch": 2982} {"train_loss": -44.94478225708008, "global_step": 360855, "epoch": 2982} {"train_loss": -45.17755889892578, "global_step": 360856, "epoch": 2982} {"train_loss": -45.20100784301758, "global_step": 360857, "epoch": 2982} {"train_loss": -45.1843147277832, "global_step": 360858, "epoch": 2982} {"train_loss": -43.582218170166016, "global_step": 360859, "epoch": 2982} {"train_loss": -43.95660400390625, "global_step": 360860, "epoch": 2982} {"train_loss": -45.15535354614258, "global_step": 360861, "epoch": 2982} {"train_loss": -45.1651611328125, "global_step": 360862, "epoch": 2982} {"train_loss": -42.52817153930664, "global_step": 360863, "epoch": 2982} {"train_loss": -40.16439437866211, "global_step": 360864, "epoch": 2982} {"train_loss": -43.5710334777832, "global_step": 360865, "epoch": 2982} {"train_loss": -41.21030044555664, "global_step": 360866, "epoch": 2982} {"train_loss": -43.7262077331543, "global_step": 360867, "epoch": 2982} {"train_loss": -41.28150939941406, "global_step": 360868, "epoch": 2982} {"train_loss": -44.439327239990234, "global_step": 360869, "epoch": 2982} {"train_loss": -41.97561264038086, "global_step": 360870, "epoch": 2982} {"train_loss": -40.69392013549805, "global_step": 360871, "epoch": 2982} {"train_loss": -44.234432220458984, "global_step": 360872, "epoch": 2982} {"train_loss": -40.55475997924805, "global_step": 360873, "epoch": 2982} {"train_loss": -44.03603744506836, "global_step": 360874, "epoch": 2982} {"train_loss": -41.61732864379883, "global_step": 360875, "epoch": 2982} {"train_loss": -41.27839660644531, "global_step": 360876, "epoch": 2982} {"train_loss": -43.52642059326172, "global_step": 360877, "epoch": 2982} {"train_loss": -40.62412643432617, "global_step": 360878, "epoch": 2982} {"train_loss": -41.73814010620117, "global_step": 360879, "epoch": 2982} {"train_loss": -40.907047271728516, "global_step": 360880, "epoch": 2982} {"train_loss": -40.78188705444336, "global_step": 360881, "epoch": 2982} {"train_loss": -42.90293502807617, "global_step": 360882, "epoch": 2982} {"train_loss": -39.72551345825195, "global_step": 360883, "epoch": 2982} {"train_loss": -43.49559783935547, "global_step": 360884, "epoch": 2982} {"train_loss": -41.38214874267578, "global_step": 360885, "epoch": 2982} {"train_loss": -43.7943229675293, "global_step": 360886, "epoch": 2982} {"train_loss": -41.6004638671875, "global_step": 360887, "epoch": 2982} {"train_loss": -43.58196258544922, "global_step": 360888, "epoch": 2982} {"train_loss": -42.4716911315918, "global_step": 360889, "epoch": 2982} {"train_loss": -43.25114059448242, "global_step": 360890, "epoch": 2982} {"train_loss": -43.83063888549805, "global_step": 360891, "epoch": 2982} {"train_loss": -41.68159484863281, "global_step": 360892, "epoch": 2982} {"train_loss": -44.01273727416992, "global_step": 360893, "epoch": 2982} {"train_loss": -42.752323150634766, "global_step": 360894, "epoch": 2982} {"train_loss": -44.01504135131836, "global_step": 360895, "epoch": 2982} {"train_loss": -43.867347717285156, "global_step": 360896, "epoch": 2982} {"train_loss": -43.9659309387207, "global_step": 360897, "epoch": 2982} {"train_loss": -44.53977584838867, "global_step": 360898, "epoch": 2982} {"train_loss": -43.83139419555664, "global_step": 360899, "epoch": 2982} {"train_loss": -44.87788009643555, "global_step": 360900, "epoch": 2982} {"train_loss": -44.30569076538086, "global_step": 360901, "epoch": 2982} {"train_loss": -43.968116760253906, "global_step": 360902, "epoch": 2982} {"train_loss": -44.35100173950195, "global_step": 360903, "epoch": 2982} {"train_loss": -44.254859924316406, "global_step": 360904, "epoch": 2982} {"train_loss": -45.37797546386719, "global_step": 360905, "epoch": 2982} {"train_loss": -44.07560348510742, "global_step": 360906, "epoch": 2982} {"train_loss": -45.13991165161133, "global_step": 360907, "epoch": 2982} {"train_loss": -44.67168426513672, "global_step": 360908, "epoch": 2982} {"train_loss": -44.72601318359375, "global_step": 360909, "epoch": 2982} {"train_loss": -45.018280029296875, "global_step": 360910, "epoch": 2982} {"train_loss": -44.47350311279297, "global_step": 360911, "epoch": 2982} {"train_loss": -44.84440994262695, "global_step": 360912, "epoch": 2982} {"train_loss": -44.76551818847656, "global_step": 360913, "epoch": 2982} {"train_loss": -45.22593307495117, "global_step": 360914, "epoch": 2982} {"train_loss": -45.16353988647461, "global_step": 360915, "epoch": 2982} {"train_loss": -45.195674896240234, "global_step": 360916, "epoch": 2982} {"train_loss": -45.36357498168945, "global_step": 360917, "epoch": 2982} {"train_loss": -45.3555793762207, "global_step": 360918, "epoch": 2982} {"train_loss": -45.26426315307617, "global_step": 360919, "epoch": 2982} {"train_loss": -45.33510971069336, "global_step": 360920, "epoch": 2982} {"train_loss": -45.420509338378906, "global_step": 360921, "epoch": 2982} {"train_loss": -45.394290924072266, "global_step": 360922, "epoch": 2982} {"train_loss": -45.463294982910156, "global_step": 360923, "epoch": 2982} {"train_loss": -45.799652099609375, "global_step": 360924, "epoch": 2982} {"train_loss": -45.86790466308594, "global_step": 360925, "epoch": 2982} {"train_loss": -45.481754302978516, "global_step": 360926, "epoch": 2982} {"train_loss": -45.86288070678711, "global_step": 360927, "epoch": 2982} {"train_loss": -45.87197494506836, "global_step": 360928, "epoch": 2982} {"train_loss": -45.93457794189453, "global_step": 360929, "epoch": 2982} {"train_loss": -45.535282135009766, "global_step": 360930, "epoch": 2982} {"train_loss": -45.897705078125, "global_step": 360931, "epoch": 2982} {"train_loss": -45.86834716796875, "global_step": 360932, "epoch": 2982} {"train_loss": -45.2009391784668, "global_step": 360933, "epoch": 2982} {"train_loss": -46.05263900756836, "global_step": 360934, "epoch": 2982} {"train_loss": -46.10639572143555, "global_step": 360935, "epoch": 2982} {"train_loss": -46.124427795410156, "global_step": 360936, "epoch": 2982} {"train_loss": -45.500160217285156, "global_step": 360937, "epoch": 2982} {"train_loss": -46.05221176147461, "global_step": 360938, "epoch": 2982} {"train_loss": -45.899803161621094, "global_step": 360939, "epoch": 2982} {"train_loss": -46.21457290649414, "global_step": 360940, "epoch": 2982} {"train_loss": -45.32869338989258, "global_step": 360941, "epoch": 2982} {"train_loss": -44.451557789952304, "global_step": 360942, "epoch": 2982, "val_loss": 2380738.0} {"train_loss": -45.728981018066406, "global_step": 360943, "epoch": 2983} {"train_loss": -45.26445388793945, "global_step": 360944, "epoch": 2983} {"train_loss": -45.7230110168457, "global_step": 360945, "epoch": 2983} {"train_loss": -45.596839904785156, "global_step": 360946, "epoch": 2983} {"train_loss": -45.25025177001953, "global_step": 360947, "epoch": 2983} {"train_loss": -46.05204391479492, "global_step": 360948, "epoch": 2983} {"train_loss": -46.154823303222656, "global_step": 360949, "epoch": 2983} {"train_loss": -45.88141632080078, "global_step": 360950, "epoch": 2983} {"train_loss": -45.50908279418945, "global_step": 360951, "epoch": 2983} {"train_loss": -45.70244216918945, "global_step": 360952, "epoch": 2983} {"train_loss": -45.74324035644531, "global_step": 360953, "epoch": 2983} {"train_loss": -45.85443115234375, "global_step": 360954, "epoch": 2983} {"train_loss": -45.417659759521484, "global_step": 360955, "epoch": 2983} {"train_loss": -45.854393005371094, "global_step": 360956, "epoch": 2983} {"train_loss": -45.81679916381836, "global_step": 360957, "epoch": 2983} {"train_loss": -45.6326789855957, "global_step": 360958, "epoch": 2983} {"train_loss": -45.119850158691406, "global_step": 360959, "epoch": 2983} {"train_loss": -44.32145690917969, "global_step": 360960, "epoch": 2983} {"train_loss": -43.14658737182617, "global_step": 360961, "epoch": 2983} {"train_loss": -42.03743362426758, "global_step": 360962, "epoch": 2983} {"train_loss": -43.168434143066406, "global_step": 360963, "epoch": 2983} {"train_loss": -45.055397033691406, "global_step": 360964, "epoch": 2983} {"train_loss": -45.27923583984375, "global_step": 360965, "epoch": 2983} {"train_loss": -44.66706466674805, "global_step": 360966, "epoch": 2983} {"train_loss": -45.429649353027344, "global_step": 360967, "epoch": 2983} {"train_loss": -44.97883605957031, "global_step": 360968, "epoch": 2983} {"train_loss": -44.035064697265625, "global_step": 360969, "epoch": 2983} {"train_loss": -44.43821334838867, "global_step": 360970, "epoch": 2983} {"train_loss": -44.23463821411133, "global_step": 360971, "epoch": 2983} {"train_loss": -44.36416244506836, "global_step": 360972, "epoch": 2983} {"train_loss": -44.14476013183594, "global_step": 360973, "epoch": 2983} {"train_loss": -44.86688995361328, "global_step": 360974, "epoch": 2983} {"train_loss": -43.57717514038086, "global_step": 360975, "epoch": 2983} {"train_loss": -42.14640426635742, "global_step": 360976, "epoch": 2983} {"train_loss": -43.55961990356445, "global_step": 360977, "epoch": 2983} {"train_loss": -44.023284912109375, "global_step": 360978, "epoch": 2983} {"train_loss": -42.04030990600586, "global_step": 360979, "epoch": 2983} {"train_loss": -42.322975158691406, "global_step": 360980, "epoch": 2983} {"train_loss": -44.25041198730469, "global_step": 360981, "epoch": 2983} {"train_loss": -43.47150802612305, "global_step": 360982, "epoch": 2983} {"train_loss": -41.733028411865234, "global_step": 360983, "epoch": 2983} {"train_loss": -43.502017974853516, "global_step": 360984, "epoch": 2983} {"train_loss": -40.69755172729492, "global_step": 360985, "epoch": 2983} {"train_loss": -41.95636749267578, "global_step": 360986, "epoch": 2983} {"train_loss": -42.46104049682617, "global_step": 360987, "epoch": 2983} {"train_loss": -44.24600601196289, "global_step": 360988, "epoch": 2983} {"train_loss": -40.2802848815918, "global_step": 360989, "epoch": 2983} {"train_loss": -44.75189208984375, "global_step": 360990, "epoch": 2983} {"train_loss": -41.19269561767578, "global_step": 360991, "epoch": 2983} {"train_loss": -43.47249221801758, "global_step": 360992, "epoch": 2983} {"train_loss": -44.181434631347656, "global_step": 360993, "epoch": 2983} {"train_loss": -43.543575286865234, "global_step": 360994, "epoch": 2983} {"train_loss": -43.676509857177734, "global_step": 360995, "epoch": 2983} {"train_loss": -42.435115814208984, "global_step": 360996, "epoch": 2983} {"train_loss": -42.58940124511719, "global_step": 360997, "epoch": 2983} {"train_loss": -44.63013458251953, "global_step": 360998, "epoch": 2983} {"train_loss": -42.44287872314453, "global_step": 360999, "epoch": 2983} {"train_loss": -44.38773727416992, "global_step": 361000, "epoch": 2983} {"train_loss": -44.374046325683594, "global_step": 361001, "epoch": 2983} {"train_loss": -43.36288070678711, "global_step": 361002, "epoch": 2983} {"train_loss": -44.799800872802734, "global_step": 361003, "epoch": 2983} {"train_loss": -43.62091064453125, "global_step": 361004, "epoch": 2983} {"train_loss": -45.195430755615234, "global_step": 361005, "epoch": 2983} {"train_loss": -44.531829833984375, "global_step": 361006, "epoch": 2983} {"train_loss": -44.93406295776367, "global_step": 361007, "epoch": 2983} {"train_loss": -44.12186813354492, "global_step": 361008, "epoch": 2983} {"train_loss": -44.902469635009766, "global_step": 361009, "epoch": 2983} {"train_loss": -44.632415771484375, "global_step": 361010, "epoch": 2983} {"train_loss": -44.11179733276367, "global_step": 361011, "epoch": 2983} {"train_loss": -45.266578674316406, "global_step": 361012, "epoch": 2983} {"train_loss": -44.92995834350586, "global_step": 361013, "epoch": 2983} {"train_loss": -44.30817413330078, "global_step": 361014, "epoch": 2983} {"train_loss": -45.130279541015625, "global_step": 361015, "epoch": 2983} {"train_loss": -43.62823486328125, "global_step": 361016, "epoch": 2983} {"train_loss": -45.14787673950195, "global_step": 361017, "epoch": 2983} {"train_loss": -44.19156265258789, "global_step": 361018, "epoch": 2983} {"train_loss": -45.68220138549805, "global_step": 361019, "epoch": 2983} {"train_loss": -43.54591751098633, "global_step": 361020, "epoch": 2983} {"train_loss": -44.7334098815918, "global_step": 361021, "epoch": 2983} {"train_loss": -45.04000473022461, "global_step": 361022, "epoch": 2983} {"train_loss": -44.92395782470703, "global_step": 361023, "epoch": 2983} {"train_loss": -43.55873107910156, "global_step": 361024, "epoch": 2983} {"train_loss": -45.546112060546875, "global_step": 361025, "epoch": 2983} {"train_loss": -44.880714416503906, "global_step": 361026, "epoch": 2983} {"train_loss": -44.737548828125, "global_step": 361027, "epoch": 2983} {"train_loss": -44.458438873291016, "global_step": 361028, "epoch": 2983} {"train_loss": -45.140480041503906, "global_step": 361029, "epoch": 2983} {"train_loss": -44.89057159423828, "global_step": 361030, "epoch": 2983} {"train_loss": -44.427391052246094, "global_step": 361031, "epoch": 2983} {"train_loss": -44.38241195678711, "global_step": 361032, "epoch": 2983} {"train_loss": -45.319976806640625, "global_step": 361033, "epoch": 2983} {"train_loss": -44.545616149902344, "global_step": 361034, "epoch": 2983} {"train_loss": -44.77158737182617, "global_step": 361035, "epoch": 2983} {"train_loss": -45.02729415893555, "global_step": 361036, "epoch": 2983} {"train_loss": -44.90031051635742, "global_step": 361037, "epoch": 2983} {"train_loss": -44.65486526489258, "global_step": 361038, "epoch": 2983} {"train_loss": -45.23696517944336, "global_step": 361039, "epoch": 2983} {"train_loss": -45.06403732299805, "global_step": 361040, "epoch": 2983} {"train_loss": -44.31301498413086, "global_step": 361041, "epoch": 2983} {"train_loss": -45.108253479003906, "global_step": 361042, "epoch": 2983} {"train_loss": -44.59625244140625, "global_step": 361043, "epoch": 2983} {"train_loss": -44.93262481689453, "global_step": 361044, "epoch": 2983} {"train_loss": -45.36188888549805, "global_step": 361045, "epoch": 2983} {"train_loss": -45.97600555419922, "global_step": 361046, "epoch": 2983} {"train_loss": -45.12064743041992, "global_step": 361047, "epoch": 2983} {"train_loss": -45.8192253112793, "global_step": 361048, "epoch": 2983} {"train_loss": -44.91884994506836, "global_step": 361049, "epoch": 2983} {"train_loss": -45.758907318115234, "global_step": 361050, "epoch": 2983} {"train_loss": -44.98165512084961, "global_step": 361051, "epoch": 2983} {"train_loss": -45.28851318359375, "global_step": 361052, "epoch": 2983} {"train_loss": -42.552223205566406, "global_step": 361053, "epoch": 2983} {"train_loss": -45.599456787109375, "global_step": 361054, "epoch": 2983} {"train_loss": -43.769500732421875, "global_step": 361055, "epoch": 2983} {"train_loss": -44.95510482788086, "global_step": 361056, "epoch": 2983} {"train_loss": -44.512664794921875, "global_step": 361057, "epoch": 2983} {"train_loss": -43.646053314208984, "global_step": 361058, "epoch": 2983} {"train_loss": -44.3267936706543, "global_step": 361059, "epoch": 2983} {"train_loss": -42.74483871459961, "global_step": 361060, "epoch": 2983} {"train_loss": -43.90719985961914, "global_step": 361061, "epoch": 2983} {"train_loss": -45.428810119628906, "global_step": 361062, "epoch": 2983} {"train_loss": -44.40167989809651, "global_step": 361063, "epoch": 2983, "val_loss": 2285288.25} {"train_loss": -40.37458419799805, "global_step": 361064, "epoch": 2984} {"train_loss": -42.98499298095703, "global_step": 361065, "epoch": 2984} {"train_loss": -44.416439056396484, "global_step": 361066, "epoch": 2984} {"train_loss": -44.38935089111328, "global_step": 361067, "epoch": 2984} {"train_loss": -43.88248825073242, "global_step": 361068, "epoch": 2984} {"train_loss": -43.16305160522461, "global_step": 361069, "epoch": 2984} {"train_loss": -44.74066162109375, "global_step": 361070, "epoch": 2984} {"train_loss": -44.05077362060547, "global_step": 361071, "epoch": 2984} {"train_loss": -44.999908447265625, "global_step": 361072, "epoch": 2984} {"train_loss": -43.73904037475586, "global_step": 361073, "epoch": 2984} {"train_loss": -44.61346435546875, "global_step": 361074, "epoch": 2984} {"train_loss": -44.507205963134766, "global_step": 361075, "epoch": 2984} {"train_loss": -41.997589111328125, "global_step": 361076, "epoch": 2984} {"train_loss": -44.39045333862305, "global_step": 361077, "epoch": 2984} {"train_loss": -44.62453842163086, "global_step": 361078, "epoch": 2984} {"train_loss": -43.204036712646484, "global_step": 361079, "epoch": 2984} {"train_loss": -44.42081832885742, "global_step": 361080, "epoch": 2984} {"train_loss": -43.817264556884766, "global_step": 361081, "epoch": 2984} {"train_loss": -44.06432342529297, "global_step": 361082, "epoch": 2984} {"train_loss": -44.54276657104492, "global_step": 361083, "epoch": 2984} {"train_loss": -43.58456039428711, "global_step": 361084, "epoch": 2984} {"train_loss": -44.2957878112793, "global_step": 361085, "epoch": 2984} {"train_loss": -43.81624984741211, "global_step": 361086, "epoch": 2984} {"train_loss": -43.03670120239258, "global_step": 361087, "epoch": 2984} {"train_loss": -43.46415328979492, "global_step": 361088, "epoch": 2984} {"train_loss": -43.53097915649414, "global_step": 361089, "epoch": 2984} {"train_loss": -41.29548263549805, "global_step": 361090, "epoch": 2984} {"train_loss": -42.367958068847656, "global_step": 361091, "epoch": 2984} {"train_loss": -43.0006103515625, "global_step": 361092, "epoch": 2984} {"train_loss": -41.343040466308594, "global_step": 361093, "epoch": 2984} {"train_loss": -42.80694580078125, "global_step": 361094, "epoch": 2984} {"train_loss": -42.385677337646484, "global_step": 361095, "epoch": 2984} {"train_loss": -43.26567077636719, "global_step": 361096, "epoch": 2984} {"train_loss": -43.3847541809082, "global_step": 361097, "epoch": 2984} {"train_loss": -42.005680084228516, "global_step": 361098, "epoch": 2984} {"train_loss": -43.45608139038086, "global_step": 361099, "epoch": 2984} {"train_loss": -43.86566162109375, "global_step": 361100, "epoch": 2984} {"train_loss": -44.2074089050293, "global_step": 361101, "epoch": 2984} {"train_loss": -43.9065055847168, "global_step": 361102, "epoch": 2984} {"train_loss": -43.32533645629883, "global_step": 361103, "epoch": 2984} {"train_loss": -44.3876838684082, "global_step": 361104, "epoch": 2984} {"train_loss": -43.92073440551758, "global_step": 361105, "epoch": 2984} {"train_loss": -43.50727462768555, "global_step": 361106, "epoch": 2984} {"train_loss": -43.66674041748047, "global_step": 361107, "epoch": 2984} {"train_loss": -43.7269401550293, "global_step": 361108, "epoch": 2984} {"train_loss": -45.070335388183594, "global_step": 361109, "epoch": 2984} {"train_loss": -43.57491683959961, "global_step": 361110, "epoch": 2984} {"train_loss": -43.692562103271484, "global_step": 361111, "epoch": 2984} {"train_loss": -43.77695846557617, "global_step": 361112, "epoch": 2984} {"train_loss": -43.71365737915039, "global_step": 361113, "epoch": 2984} {"train_loss": -42.72142791748047, "global_step": 361114, "epoch": 2984} {"train_loss": -44.38309860229492, "global_step": 361115, "epoch": 2984} {"train_loss": -42.49299240112305, "global_step": 361116, "epoch": 2984} {"train_loss": -44.16648483276367, "global_step": 361117, "epoch": 2984} {"train_loss": -43.657711029052734, "global_step": 361118, "epoch": 2984} {"train_loss": -43.74713897705078, "global_step": 361119, "epoch": 2984} {"train_loss": -44.59571075439453, "global_step": 361120, "epoch": 2984} {"train_loss": -41.911964416503906, "global_step": 361121, "epoch": 2984} {"train_loss": -44.00333023071289, "global_step": 361122, "epoch": 2984} {"train_loss": -44.57369613647461, "global_step": 361123, "epoch": 2984} {"train_loss": -43.99210739135742, "global_step": 361124, "epoch": 2984} {"train_loss": -44.12636184692383, "global_step": 361125, "epoch": 2984} {"train_loss": -43.9029655456543, "global_step": 361126, "epoch": 2984} {"train_loss": -43.62335205078125, "global_step": 361127, "epoch": 2984} {"train_loss": -44.26689529418945, "global_step": 361128, "epoch": 2984} {"train_loss": -44.524085998535156, "global_step": 361129, "epoch": 2984} {"train_loss": -44.32570266723633, "global_step": 361130, "epoch": 2984} {"train_loss": -43.20127487182617, "global_step": 361131, "epoch": 2984} {"train_loss": -42.91225814819336, "global_step": 361132, "epoch": 2984} {"train_loss": -44.0578727722168, "global_step": 361133, "epoch": 2984} {"train_loss": -43.146480560302734, "global_step": 361134, "epoch": 2984} {"train_loss": -44.061527252197266, "global_step": 361135, "epoch": 2984} {"train_loss": -44.85921859741211, "global_step": 361136, "epoch": 2984} {"train_loss": -44.2165641784668, "global_step": 361137, "epoch": 2984} {"train_loss": -44.03513717651367, "global_step": 361138, "epoch": 2984} {"train_loss": -44.525020599365234, "global_step": 361139, "epoch": 2984} {"train_loss": -43.56782150268555, "global_step": 361140, "epoch": 2984} {"train_loss": -44.465999603271484, "global_step": 361141, "epoch": 2984} {"train_loss": -43.5150032043457, "global_step": 361142, "epoch": 2984} {"train_loss": -44.90936279296875, "global_step": 361143, "epoch": 2984} {"train_loss": -44.55807113647461, "global_step": 361144, "epoch": 2984} {"train_loss": -44.09965896606445, "global_step": 361145, "epoch": 2984} {"train_loss": -43.90438461303711, "global_step": 361146, "epoch": 2984} {"train_loss": -44.762752532958984, "global_step": 361147, "epoch": 2984} {"train_loss": -44.386634826660156, "global_step": 361148, "epoch": 2984} {"train_loss": -43.251007080078125, "global_step": 361149, "epoch": 2984} {"train_loss": -45.230403900146484, "global_step": 361150, "epoch": 2984} {"train_loss": -43.94336700439453, "global_step": 361151, "epoch": 2984} {"train_loss": -44.11024856567383, "global_step": 361152, "epoch": 2984} {"train_loss": -43.794803619384766, "global_step": 361153, "epoch": 2984} {"train_loss": -44.31694412231445, "global_step": 361154, "epoch": 2984} {"train_loss": -43.290645599365234, "global_step": 361155, "epoch": 2984} {"train_loss": -44.45697784423828, "global_step": 361156, "epoch": 2984} {"train_loss": -44.5768928527832, "global_step": 361157, "epoch": 2984} {"train_loss": -44.64085006713867, "global_step": 361158, "epoch": 2984} {"train_loss": -45.271484375, "global_step": 361159, "epoch": 2984} {"train_loss": -45.2439079284668, "global_step": 361160, "epoch": 2984} {"train_loss": -44.40986633300781, "global_step": 361161, "epoch": 2984} {"train_loss": -43.88623046875, "global_step": 361162, "epoch": 2984} {"train_loss": -43.60361862182617, "global_step": 361163, "epoch": 2984} {"train_loss": -44.85211181640625, "global_step": 361164, "epoch": 2984} {"train_loss": -44.89188766479492, "global_step": 361165, "epoch": 2984} {"train_loss": -45.2108039855957, "global_step": 361166, "epoch": 2984} {"train_loss": -44.309024810791016, "global_step": 361167, "epoch": 2984} {"train_loss": -44.98221969604492, "global_step": 361168, "epoch": 2984} {"train_loss": -44.76702117919922, "global_step": 361169, "epoch": 2984} {"train_loss": -44.39830017089844, "global_step": 361170, "epoch": 2984} {"train_loss": -45.21832275390625, "global_step": 361171, "epoch": 2984} {"train_loss": -44.81525802612305, "global_step": 361172, "epoch": 2984} {"train_loss": -44.48683547973633, "global_step": 361173, "epoch": 2984} {"train_loss": -45.350311279296875, "global_step": 361174, "epoch": 2984} {"train_loss": -45.2794075012207, "global_step": 361175, "epoch": 2984} {"train_loss": -44.57263946533203, "global_step": 361176, "epoch": 2984} {"train_loss": -45.15981674194336, "global_step": 361177, "epoch": 2984} {"train_loss": -44.44332504272461, "global_step": 361178, "epoch": 2984} {"train_loss": -43.402217864990234, "global_step": 361179, "epoch": 2984} {"train_loss": -44.38180160522461, "global_step": 361180, "epoch": 2984} {"train_loss": -44.800662994384766, "global_step": 361181, "epoch": 2984} {"train_loss": -44.724056243896484, "global_step": 361182, "epoch": 2984} {"train_loss": -44.95936965942383, "global_step": 361183, "epoch": 2984} {"train_loss": -43.966394597833805, "global_step": 361184, "epoch": 2984, "val_loss": 2407770.25} {"train_loss": -45.51319122314453, "global_step": 361185, "epoch": 2985} {"train_loss": -44.16638946533203, "global_step": 361186, "epoch": 2985} {"train_loss": -45.26118087768555, "global_step": 361187, "epoch": 2985} {"train_loss": -45.62767028808594, "global_step": 361188, "epoch": 2985} {"train_loss": -45.61874008178711, "global_step": 361189, "epoch": 2985} {"train_loss": -44.36336898803711, "global_step": 361190, "epoch": 2985} {"train_loss": -45.823848724365234, "global_step": 361191, "epoch": 2985} {"train_loss": -45.24320602416992, "global_step": 361192, "epoch": 2985} {"train_loss": -45.431129455566406, "global_step": 361193, "epoch": 2985} {"train_loss": -45.584007263183594, "global_step": 361194, "epoch": 2985} {"train_loss": -44.79132080078125, "global_step": 361195, "epoch": 2985} {"train_loss": -45.063316345214844, "global_step": 361196, "epoch": 2985} {"train_loss": -45.15726852416992, "global_step": 361197, "epoch": 2985} {"train_loss": -45.57770919799805, "global_step": 361198, "epoch": 2985} {"train_loss": -45.82542037963867, "global_step": 361199, "epoch": 2985} {"train_loss": -45.47432327270508, "global_step": 361200, "epoch": 2985} {"train_loss": -45.598541259765625, "global_step": 361201, "epoch": 2985} {"train_loss": -45.51322555541992, "global_step": 361202, "epoch": 2985} {"train_loss": -44.49715805053711, "global_step": 361203, "epoch": 2985} {"train_loss": -45.49319076538086, "global_step": 361204, "epoch": 2985} {"train_loss": -44.209022521972656, "global_step": 361205, "epoch": 2985} {"train_loss": -45.12746810913086, "global_step": 361206, "epoch": 2985} {"train_loss": -44.73942565917969, "global_step": 361207, "epoch": 2985} {"train_loss": -46.080318450927734, "global_step": 361208, "epoch": 2985} {"train_loss": -44.7603874206543, "global_step": 361209, "epoch": 2985} {"train_loss": -45.15901565551758, "global_step": 361210, "epoch": 2985} {"train_loss": -44.848236083984375, "global_step": 361211, "epoch": 2985} {"train_loss": -43.90892791748047, "global_step": 361212, "epoch": 2985} {"train_loss": -44.77314376831055, "global_step": 361213, "epoch": 2985} {"train_loss": -43.985408782958984, "global_step": 361214, "epoch": 2985} {"train_loss": -45.3356819152832, "global_step": 361215, "epoch": 2985} {"train_loss": -45.54273223876953, "global_step": 361216, "epoch": 2985} {"train_loss": -44.72088623046875, "global_step": 361217, "epoch": 2985} {"train_loss": -44.92826461791992, "global_step": 361218, "epoch": 2985} {"train_loss": -43.798179626464844, "global_step": 361219, "epoch": 2985} {"train_loss": -43.04830551147461, "global_step": 361220, "epoch": 2985} {"train_loss": -43.41645812988281, "global_step": 361221, "epoch": 2985} {"train_loss": -45.37939453125, "global_step": 361222, "epoch": 2985} {"train_loss": -45.013099670410156, "global_step": 361223, "epoch": 2985} {"train_loss": -43.04037094116211, "global_step": 361224, "epoch": 2985} {"train_loss": -43.96151351928711, "global_step": 361225, "epoch": 2985} {"train_loss": -45.20842742919922, "global_step": 361226, "epoch": 2985} {"train_loss": -44.56203079223633, "global_step": 361227, "epoch": 2985} {"train_loss": -44.69036865234375, "global_step": 361228, "epoch": 2985} {"train_loss": -45.38386154174805, "global_step": 361229, "epoch": 2985} {"train_loss": -44.85920333862305, "global_step": 361230, "epoch": 2985} {"train_loss": -44.66463088989258, "global_step": 361231, "epoch": 2985} {"train_loss": -45.27022933959961, "global_step": 361232, "epoch": 2985} {"train_loss": -45.36817169189453, "global_step": 361233, "epoch": 2985} {"train_loss": -43.9554557800293, "global_step": 361234, "epoch": 2985} {"train_loss": -43.22815704345703, "global_step": 361235, "epoch": 2985} {"train_loss": -44.946834564208984, "global_step": 361236, "epoch": 2985} {"train_loss": -45.04110336303711, "global_step": 361237, "epoch": 2985} {"train_loss": -43.4352912902832, "global_step": 361238, "epoch": 2985} {"train_loss": -44.95954513549805, "global_step": 361239, "epoch": 2985} {"train_loss": -45.45351791381836, "global_step": 361240, "epoch": 2985} {"train_loss": -42.172203063964844, "global_step": 361241, "epoch": 2985} {"train_loss": -43.02708053588867, "global_step": 361242, "epoch": 2985} {"train_loss": -45.0214729309082, "global_step": 361243, "epoch": 2985} {"train_loss": -43.62470626831055, "global_step": 361244, "epoch": 2985} {"train_loss": -43.034603118896484, "global_step": 361245, "epoch": 2985} {"train_loss": -43.4840202331543, "global_step": 361246, "epoch": 2985} {"train_loss": -43.76314926147461, "global_step": 361247, "epoch": 2985} {"train_loss": -43.42041778564453, "global_step": 361248, "epoch": 2985} {"train_loss": -43.97547149658203, "global_step": 361249, "epoch": 2985} {"train_loss": -44.31660842895508, "global_step": 361250, "epoch": 2985} {"train_loss": -43.54076385498047, "global_step": 361251, "epoch": 2985} {"train_loss": -43.86517333984375, "global_step": 361252, "epoch": 2985} {"train_loss": -44.38080978393555, "global_step": 361253, "epoch": 2985} {"train_loss": -44.06379318237305, "global_step": 361254, "epoch": 2985} {"train_loss": -44.51152420043945, "global_step": 361255, "epoch": 2985} {"train_loss": -43.879127502441406, "global_step": 361256, "epoch": 2985} {"train_loss": -44.355552673339844, "global_step": 361257, "epoch": 2985} {"train_loss": -44.98615264892578, "global_step": 361258, "epoch": 2985} {"train_loss": -43.679718017578125, "global_step": 361259, "epoch": 2985} {"train_loss": -43.56610107421875, "global_step": 361260, "epoch": 2985} {"train_loss": -45.22038650512695, "global_step": 361261, "epoch": 2985} {"train_loss": -43.90169143676758, "global_step": 361262, "epoch": 2985} {"train_loss": -44.31438446044922, "global_step": 361263, "epoch": 2985} {"train_loss": -45.01923370361328, "global_step": 361264, "epoch": 2985} {"train_loss": -44.49843215942383, "global_step": 361265, "epoch": 2985} {"train_loss": -44.236351013183594, "global_step": 361266, "epoch": 2985} {"train_loss": -44.6279296875, "global_step": 361267, "epoch": 2985} {"train_loss": -45.321197509765625, "global_step": 361268, "epoch": 2985} {"train_loss": -44.255348205566406, "global_step": 361269, "epoch": 2985} {"train_loss": -44.41017150878906, "global_step": 361270, "epoch": 2985} {"train_loss": -45.00848388671875, "global_step": 361271, "epoch": 2985} {"train_loss": -44.824012756347656, "global_step": 361272, "epoch": 2985} {"train_loss": -45.17218780517578, "global_step": 361273, "epoch": 2985} {"train_loss": -44.836204528808594, "global_step": 361274, "epoch": 2985} {"train_loss": -45.38762664794922, "global_step": 361275, "epoch": 2985} {"train_loss": -44.67573928833008, "global_step": 361276, "epoch": 2985} {"train_loss": -45.38808822631836, "global_step": 361277, "epoch": 2985} {"train_loss": -44.567073822021484, "global_step": 361278, "epoch": 2985} {"train_loss": -44.85266876220703, "global_step": 361279, "epoch": 2985} {"train_loss": -45.91792678833008, "global_step": 361280, "epoch": 2985} {"train_loss": -44.77716064453125, "global_step": 361281, "epoch": 2985} {"train_loss": -45.81043243408203, "global_step": 361282, "epoch": 2985} {"train_loss": -45.74281692504883, "global_step": 361283, "epoch": 2985} {"train_loss": -44.6774787902832, "global_step": 361284, "epoch": 2985} {"train_loss": -45.51298141479492, "global_step": 361285, "epoch": 2985} {"train_loss": -45.55924606323242, "global_step": 361286, "epoch": 2985} {"train_loss": -45.10702133178711, "global_step": 361287, "epoch": 2985} {"train_loss": -45.525733947753906, "global_step": 361288, "epoch": 2985} {"train_loss": -45.517311096191406, "global_step": 361289, "epoch": 2985} {"train_loss": -45.07143783569336, "global_step": 361290, "epoch": 2985} {"train_loss": -45.236854553222656, "global_step": 361291, "epoch": 2985} {"train_loss": -45.4146842956543, "global_step": 361292, "epoch": 2985} {"train_loss": -45.38805389404297, "global_step": 361293, "epoch": 2985} {"train_loss": -45.15238952636719, "global_step": 361294, "epoch": 2985} {"train_loss": -45.715614318847656, "global_step": 361295, "epoch": 2985} {"train_loss": -45.355926513671875, "global_step": 361296, "epoch": 2985} {"train_loss": -44.633636474609375, "global_step": 361297, "epoch": 2985} {"train_loss": -44.92078399658203, "global_step": 361298, "epoch": 2985} {"train_loss": -45.44309616088867, "global_step": 361299, "epoch": 2985} {"train_loss": -45.43083572387695, "global_step": 361300, "epoch": 2985} {"train_loss": -44.6563835144043, "global_step": 361301, "epoch": 2985} {"train_loss": -45.658111572265625, "global_step": 361302, "epoch": 2985} {"train_loss": -45.09727096557617, "global_step": 361303, "epoch": 2985} {"train_loss": -45.713409423828125, "global_step": 361304, "epoch": 2985} {"train_loss": -44.77620668647703, "global_step": 361305, "epoch": 2985, "val_loss": 2420383.25} {"train_loss": -45.384918212890625, "global_step": 361306, "epoch": 2986} {"train_loss": -45.510353088378906, "global_step": 361307, "epoch": 2986} {"train_loss": -44.67014694213867, "global_step": 361308, "epoch": 2986} {"train_loss": -45.85127639770508, "global_step": 361309, "epoch": 2986} {"train_loss": -45.176368713378906, "global_step": 361310, "epoch": 2986} {"train_loss": -45.34440231323242, "global_step": 361311, "epoch": 2986} {"train_loss": -45.69353485107422, "global_step": 361312, "epoch": 2986} {"train_loss": -46.197757720947266, "global_step": 361313, "epoch": 2986} {"train_loss": -44.5094108581543, "global_step": 361314, "epoch": 2986} {"train_loss": -44.78642272949219, "global_step": 361315, "epoch": 2986} {"train_loss": -45.524654388427734, "global_step": 361316, "epoch": 2986} {"train_loss": -45.14561080932617, "global_step": 361317, "epoch": 2986} {"train_loss": -45.18234634399414, "global_step": 361318, "epoch": 2986} {"train_loss": -45.61787033081055, "global_step": 361319, "epoch": 2986} {"train_loss": -45.689144134521484, "global_step": 361320, "epoch": 2986} {"train_loss": -45.412715911865234, "global_step": 361321, "epoch": 2986} {"train_loss": -45.799198150634766, "global_step": 361322, "epoch": 2986} {"train_loss": -45.07548904418945, "global_step": 361323, "epoch": 2986} {"train_loss": -44.84528350830078, "global_step": 361324, "epoch": 2986} {"train_loss": -45.91294479370117, "global_step": 361325, "epoch": 2986} {"train_loss": -45.14832305908203, "global_step": 361326, "epoch": 2986} {"train_loss": -45.5506706237793, "global_step": 361327, "epoch": 2986} {"train_loss": -45.91876220703125, "global_step": 361328, "epoch": 2986} {"train_loss": -45.734188079833984, "global_step": 361329, "epoch": 2986} {"train_loss": -45.61769104003906, "global_step": 361330, "epoch": 2986} {"train_loss": -44.62594223022461, "global_step": 361331, "epoch": 2986} {"train_loss": -45.745826721191406, "global_step": 361332, "epoch": 2986} {"train_loss": -45.98186111450195, "global_step": 361333, "epoch": 2986} {"train_loss": -44.93183135986328, "global_step": 361334, "epoch": 2986} {"train_loss": -45.16578674316406, "global_step": 361335, "epoch": 2986} {"train_loss": -45.896751403808594, "global_step": 361336, "epoch": 2986} {"train_loss": -45.34847640991211, "global_step": 361337, "epoch": 2986} {"train_loss": -45.32583236694336, "global_step": 361338, "epoch": 2986} {"train_loss": -45.317779541015625, "global_step": 361339, "epoch": 2986} {"train_loss": -45.357723236083984, "global_step": 361340, "epoch": 2986} {"train_loss": -45.37375259399414, "global_step": 361341, "epoch": 2986} {"train_loss": -45.0909538269043, "global_step": 361342, "epoch": 2986} {"train_loss": -43.29372787475586, "global_step": 361343, "epoch": 2986} {"train_loss": -45.569793701171875, "global_step": 361344, "epoch": 2986} {"train_loss": -45.381500244140625, "global_step": 361345, "epoch": 2986} {"train_loss": -45.8508415222168, "global_step": 361346, "epoch": 2986} {"train_loss": -45.832271575927734, "global_step": 361347, "epoch": 2986} {"train_loss": -45.699256896972656, "global_step": 361348, "epoch": 2986} {"train_loss": -45.839229583740234, "global_step": 361349, "epoch": 2986} {"train_loss": -45.938236236572266, "global_step": 361350, "epoch": 2986} {"train_loss": -45.852272033691406, "global_step": 361351, "epoch": 2986} {"train_loss": -45.17928695678711, "global_step": 361352, "epoch": 2986} {"train_loss": -45.72324752807617, "global_step": 361353, "epoch": 2986} {"train_loss": -46.09246826171875, "global_step": 361354, "epoch": 2986} {"train_loss": -45.41761016845703, "global_step": 361355, "epoch": 2986} {"train_loss": -45.243812561035156, "global_step": 361356, "epoch": 2986} {"train_loss": -44.60921859741211, "global_step": 361357, "epoch": 2986} {"train_loss": -41.38090133666992, "global_step": 361358, "epoch": 2986} {"train_loss": -40.8814582824707, "global_step": 361359, "epoch": 2986} {"train_loss": -38.642250061035156, "global_step": 361360, "epoch": 2986} {"train_loss": -44.12152099609375, "global_step": 361361, "epoch": 2986} {"train_loss": -31.19964599609375, "global_step": 361362, "epoch": 2986} {"train_loss": -43.017574310302734, "global_step": 361363, "epoch": 2986} {"train_loss": -28.456628799438477, "global_step": 361364, "epoch": 2986} {"train_loss": -11.498381614685059, "global_step": 361365, "epoch": 2986} {"train_loss": -34.64585876464844, "global_step": 361366, "epoch": 2986} {"train_loss": -29.437284469604492, "global_step": 361367, "epoch": 2986} {"train_loss": -29.9254093170166, "global_step": 361368, "epoch": 2986} {"train_loss": -35.013328552246094, "global_step": 361369, "epoch": 2986} {"train_loss": -31.556562423706055, "global_step": 361370, "epoch": 2986} {"train_loss": -35.828857421875, "global_step": 361371, "epoch": 2986} {"train_loss": -33.371795654296875, "global_step": 361372, "epoch": 2986} {"train_loss": -39.0730094909668, "global_step": 361373, "epoch": 2986} {"train_loss": -33.908935546875, "global_step": 361374, "epoch": 2986} {"train_loss": -38.599891662597656, "global_step": 361375, "epoch": 2986} {"train_loss": -36.61565399169922, "global_step": 361376, "epoch": 2986} {"train_loss": -40.48649215698242, "global_step": 361377, "epoch": 2986} {"train_loss": -39.146209716796875, "global_step": 361378, "epoch": 2986} {"train_loss": -38.9964714050293, "global_step": 361379, "epoch": 2986} {"train_loss": -41.8929557800293, "global_step": 361380, "epoch": 2986} {"train_loss": -38.33291244506836, "global_step": 361381, "epoch": 2986} {"train_loss": -39.490055084228516, "global_step": 361382, "epoch": 2986} {"train_loss": -40.83909225463867, "global_step": 361383, "epoch": 2986} {"train_loss": -42.3269157409668, "global_step": 361384, "epoch": 2986} {"train_loss": -41.246925354003906, "global_step": 361385, "epoch": 2986} {"train_loss": -42.35847473144531, "global_step": 361386, "epoch": 2986} {"train_loss": -35.5500602722168, "global_step": 361387, "epoch": 2986} {"train_loss": -43.36310577392578, "global_step": 361388, "epoch": 2986} {"train_loss": -40.47050476074219, "global_step": 361389, "epoch": 2986} {"train_loss": -42.487098693847656, "global_step": 361390, "epoch": 2986} {"train_loss": -41.68220138549805, "global_step": 361391, "epoch": 2986} {"train_loss": -40.8761100769043, "global_step": 361392, "epoch": 2986} {"train_loss": -40.32477951049805, "global_step": 361393, "epoch": 2986} {"train_loss": -41.911312103271484, "global_step": 361394, "epoch": 2986} {"train_loss": -42.5940055847168, "global_step": 361395, "epoch": 2986} {"train_loss": -39.474727630615234, "global_step": 361396, "epoch": 2986} {"train_loss": -42.599212646484375, "global_step": 361397, "epoch": 2986} {"train_loss": -42.53451156616211, "global_step": 361398, "epoch": 2986} {"train_loss": -41.48586654663086, "global_step": 361399, "epoch": 2986} {"train_loss": -42.77341079711914, "global_step": 361400, "epoch": 2986} {"train_loss": -42.26736068725586, "global_step": 361401, "epoch": 2986} {"train_loss": -43.02457809448242, "global_step": 361402, "epoch": 2986} {"train_loss": -43.273128509521484, "global_step": 361403, "epoch": 2986} {"train_loss": -43.0119743347168, "global_step": 361404, "epoch": 2986} {"train_loss": -43.9620475769043, "global_step": 361405, "epoch": 2986} {"train_loss": -43.38483428955078, "global_step": 361406, "epoch": 2986} {"train_loss": -43.55678176879883, "global_step": 361407, "epoch": 2986} {"train_loss": -43.1671142578125, "global_step": 361408, "epoch": 2986} {"train_loss": -43.93684005737305, "global_step": 361409, "epoch": 2986} {"train_loss": -44.30520248413086, "global_step": 361410, "epoch": 2986} {"train_loss": -42.7833366394043, "global_step": 361411, "epoch": 2986} {"train_loss": -42.81813430786133, "global_step": 361412, "epoch": 2986} {"train_loss": -43.959266662597656, "global_step": 361413, "epoch": 2986} {"train_loss": -42.1723747253418, "global_step": 361414, "epoch": 2986} {"train_loss": -43.77494812011719, "global_step": 361415, "epoch": 2986} {"train_loss": -43.53812789916992, "global_step": 361416, "epoch": 2986} {"train_loss": -43.54775619506836, "global_step": 361417, "epoch": 2986} {"train_loss": -43.618221282958984, "global_step": 361418, "epoch": 2986} {"train_loss": -44.42723083496094, "global_step": 361419, "epoch": 2986} {"train_loss": -43.644775390625, "global_step": 361420, "epoch": 2986} {"train_loss": -43.86037063598633, "global_step": 361421, "epoch": 2986} {"train_loss": -44.179744720458984, "global_step": 361422, "epoch": 2986} {"train_loss": -44.45454025268555, "global_step": 361423, "epoch": 2986} {"train_loss": -44.570621490478516, "global_step": 361424, "epoch": 2986} {"train_loss": -44.021217346191406, "global_step": 361425, "epoch": 2986} {"train_loss": -42.42254874331892, "global_step": 361426, "epoch": 2986, "val_loss": 2768656.0} {"train_loss": -44.21800231933594, "global_step": 361427, "epoch": 2987} {"train_loss": -44.543243408203125, "global_step": 361428, "epoch": 2987} {"train_loss": -44.88987350463867, "global_step": 361429, "epoch": 2987} {"train_loss": -44.18112564086914, "global_step": 361430, "epoch": 2987} {"train_loss": -44.51981735229492, "global_step": 361431, "epoch": 2987} {"train_loss": -44.63228225708008, "global_step": 361432, "epoch": 2987} {"train_loss": -44.0300407409668, "global_step": 361433, "epoch": 2987} {"train_loss": -44.96192169189453, "global_step": 361434, "epoch": 2987} {"train_loss": -44.93223571777344, "global_step": 361435, "epoch": 2987} {"train_loss": -44.84778594970703, "global_step": 361436, "epoch": 2987} {"train_loss": -44.4805908203125, "global_step": 361437, "epoch": 2987} {"train_loss": -44.145729064941406, "global_step": 361438, "epoch": 2987} {"train_loss": -44.741939544677734, "global_step": 361439, "epoch": 2987} {"train_loss": -45.33019256591797, "global_step": 361440, "epoch": 2987} {"train_loss": -44.98397445678711, "global_step": 361441, "epoch": 2987} {"train_loss": -45.66170883178711, "global_step": 361442, "epoch": 2987} {"train_loss": -45.19562911987305, "global_step": 361443, "epoch": 2987} {"train_loss": -45.399166107177734, "global_step": 361444, "epoch": 2987} {"train_loss": -44.27413558959961, "global_step": 361445, "epoch": 2987} {"train_loss": -44.91774368286133, "global_step": 361446, "epoch": 2987} {"train_loss": -45.59537887573242, "global_step": 361447, "epoch": 2987} {"train_loss": -44.101985931396484, "global_step": 361448, "epoch": 2987} {"train_loss": -44.71641159057617, "global_step": 361449, "epoch": 2987} {"train_loss": -44.85190963745117, "global_step": 361450, "epoch": 2987} {"train_loss": -45.75828170776367, "global_step": 361451, "epoch": 2987} {"train_loss": -45.431610107421875, "global_step": 361452, "epoch": 2987} {"train_loss": -45.25509262084961, "global_step": 361453, "epoch": 2987} {"train_loss": -45.02431106567383, "global_step": 361454, "epoch": 2987} {"train_loss": -45.81646728515625, "global_step": 361455, "epoch": 2987} {"train_loss": -45.779388427734375, "global_step": 361456, "epoch": 2987} {"train_loss": -43.86873245239258, "global_step": 361457, "epoch": 2987} {"train_loss": -45.36082077026367, "global_step": 361458, "epoch": 2987} {"train_loss": -45.922115325927734, "global_step": 361459, "epoch": 2987} {"train_loss": -46.02399826049805, "global_step": 361460, "epoch": 2987} {"train_loss": -45.56721115112305, "global_step": 361461, "epoch": 2987} {"train_loss": -45.906593322753906, "global_step": 361462, "epoch": 2987} {"train_loss": -45.73568344116211, "global_step": 361463, "epoch": 2987} {"train_loss": -45.83536911010742, "global_step": 361464, "epoch": 2987} {"train_loss": -45.73586654663086, "global_step": 361465, "epoch": 2987} {"train_loss": -45.517669677734375, "global_step": 361466, "epoch": 2987} {"train_loss": -45.820735931396484, "global_step": 361467, "epoch": 2987} {"train_loss": -45.45051193237305, "global_step": 361468, "epoch": 2987} {"train_loss": -45.24043655395508, "global_step": 361469, "epoch": 2987} {"train_loss": -45.575233459472656, "global_step": 361470, "epoch": 2987} {"train_loss": -45.89530563354492, "global_step": 361471, "epoch": 2987} {"train_loss": -46.17466354370117, "global_step": 361472, "epoch": 2987} {"train_loss": -45.78635025024414, "global_step": 361473, "epoch": 2987} {"train_loss": -46.092918395996094, "global_step": 361474, "epoch": 2987} {"train_loss": -45.91209411621094, "global_step": 361475, "epoch": 2987} {"train_loss": -45.56404495239258, "global_step": 361476, "epoch": 2987} {"train_loss": -46.556331634521484, "global_step": 361477, "epoch": 2987} {"train_loss": -44.81730270385742, "global_step": 361478, "epoch": 2987} {"train_loss": -44.93482208251953, "global_step": 361479, "epoch": 2987} {"train_loss": -45.870906829833984, "global_step": 361480, "epoch": 2987} {"train_loss": -45.79667282104492, "global_step": 361481, "epoch": 2987} {"train_loss": -45.88745880126953, "global_step": 361482, "epoch": 2987} {"train_loss": -45.408843994140625, "global_step": 361483, "epoch": 2987} {"train_loss": -44.878231048583984, "global_step": 361484, "epoch": 2987} {"train_loss": -43.93665313720703, "global_step": 361485, "epoch": 2987} {"train_loss": -45.46421432495117, "global_step": 361486, "epoch": 2987} {"train_loss": -45.551055908203125, "global_step": 361487, "epoch": 2987} {"train_loss": -45.3110237121582, "global_step": 361488, "epoch": 2987} {"train_loss": -46.28850173950195, "global_step": 361489, "epoch": 2987} {"train_loss": -45.08308029174805, "global_step": 361490, "epoch": 2987} {"train_loss": -45.618080139160156, "global_step": 361491, "epoch": 2987} {"train_loss": -45.0899772644043, "global_step": 361492, "epoch": 2987} {"train_loss": -46.169578552246094, "global_step": 361493, "epoch": 2987} {"train_loss": -45.522003173828125, "global_step": 361494, "epoch": 2987} {"train_loss": -45.1265983581543, "global_step": 361495, "epoch": 2987} {"train_loss": -45.39033126831055, "global_step": 361496, "epoch": 2987} {"train_loss": -46.11468505859375, "global_step": 361497, "epoch": 2987} {"train_loss": -45.69222640991211, "global_step": 361498, "epoch": 2987} {"train_loss": -45.36190414428711, "global_step": 361499, "epoch": 2987} {"train_loss": -46.28323745727539, "global_step": 361500, "epoch": 2987} {"train_loss": -44.81759262084961, "global_step": 361501, "epoch": 2987} {"train_loss": -45.94703674316406, "global_step": 361502, "epoch": 2987} {"train_loss": -44.869998931884766, "global_step": 361503, "epoch": 2987} {"train_loss": -46.162349700927734, "global_step": 361504, "epoch": 2987} {"train_loss": -45.651737213134766, "global_step": 361505, "epoch": 2987} {"train_loss": -46.080970764160156, "global_step": 361506, "epoch": 2987} {"train_loss": -45.34348678588867, "global_step": 361507, "epoch": 2987} {"train_loss": -44.3382568359375, "global_step": 361508, "epoch": 2987} {"train_loss": -44.906368255615234, "global_step": 361509, "epoch": 2987} {"train_loss": -43.09174346923828, "global_step": 361510, "epoch": 2987} {"train_loss": -38.55641555786133, "global_step": 361511, "epoch": 2987} {"train_loss": -44.30245590209961, "global_step": 361512, "epoch": 2987} {"train_loss": -43.41842269897461, "global_step": 361513, "epoch": 2987} {"train_loss": -40.381282806396484, "global_step": 361514, "epoch": 2987} {"train_loss": -42.20859146118164, "global_step": 361515, "epoch": 2987} {"train_loss": -43.56185531616211, "global_step": 361516, "epoch": 2987} {"train_loss": -42.31336212158203, "global_step": 361517, "epoch": 2987} {"train_loss": -44.09934616088867, "global_step": 361518, "epoch": 2987} {"train_loss": -44.62498474121094, "global_step": 361519, "epoch": 2987} {"train_loss": -43.42901611328125, "global_step": 361520, "epoch": 2987} {"train_loss": -40.105262756347656, "global_step": 361521, "epoch": 2987} {"train_loss": -43.11472702026367, "global_step": 361522, "epoch": 2987} {"train_loss": -40.51182174682617, "global_step": 361523, "epoch": 2987} {"train_loss": -39.86479568481445, "global_step": 361524, "epoch": 2987} {"train_loss": -41.8411979675293, "global_step": 361525, "epoch": 2987} {"train_loss": -36.83591079711914, "global_step": 361526, "epoch": 2987} {"train_loss": -38.37711715698242, "global_step": 361527, "epoch": 2987} {"train_loss": -35.41352081298828, "global_step": 361528, "epoch": 2987} {"train_loss": -39.30628204345703, "global_step": 361529, "epoch": 2987} {"train_loss": -38.948768615722656, "global_step": 361530, "epoch": 2987} {"train_loss": -40.81600570678711, "global_step": 361531, "epoch": 2987} {"train_loss": -38.603816986083984, "global_step": 361532, "epoch": 2987} {"train_loss": -42.67289352416992, "global_step": 361533, "epoch": 2987} {"train_loss": -40.324623107910156, "global_step": 361534, "epoch": 2987} {"train_loss": -43.04655075073242, "global_step": 361535, "epoch": 2987} {"train_loss": -43.35172653198242, "global_step": 361536, "epoch": 2987} {"train_loss": -41.89179611206055, "global_step": 361537, "epoch": 2987} {"train_loss": -44.19623565673828, "global_step": 361538, "epoch": 2987} {"train_loss": -42.91078567504883, "global_step": 361539, "epoch": 2987} {"train_loss": -43.40520095825195, "global_step": 361540, "epoch": 2987} {"train_loss": -43.93994903564453, "global_step": 361541, "epoch": 2987} {"train_loss": -43.407814025878906, "global_step": 361542, "epoch": 2987} {"train_loss": -43.18931198120117, "global_step": 361543, "epoch": 2987} {"train_loss": -43.8673095703125, "global_step": 361544, "epoch": 2987} {"train_loss": -43.430030822753906, "global_step": 361545, "epoch": 2987} {"train_loss": -44.62641525268555, "global_step": 361546, "epoch": 2987} {"train_loss": -44.23541934431092, "global_step": 361547, "epoch": 2987, "val_loss": 2563054.0} {"train_loss": -44.00771713256836, "global_step": 361548, "epoch": 2988} {"train_loss": -44.30060577392578, "global_step": 361549, "epoch": 2988} {"train_loss": -44.44090270996094, "global_step": 361550, "epoch": 2988} {"train_loss": -44.177040100097656, "global_step": 361551, "epoch": 2988} {"train_loss": -44.419769287109375, "global_step": 361552, "epoch": 2988} {"train_loss": -44.70245361328125, "global_step": 361553, "epoch": 2988} {"train_loss": -44.69230270385742, "global_step": 361554, "epoch": 2988} {"train_loss": -44.42144775390625, "global_step": 361555, "epoch": 2988} {"train_loss": -44.91488265991211, "global_step": 361556, "epoch": 2988} {"train_loss": -44.57550811767578, "global_step": 361557, "epoch": 2988} {"train_loss": -45.001590728759766, "global_step": 361558, "epoch": 2988} {"train_loss": -44.923404693603516, "global_step": 361559, "epoch": 2988} {"train_loss": -44.6386604309082, "global_step": 361560, "epoch": 2988} {"train_loss": -44.55986022949219, "global_step": 361561, "epoch": 2988} {"train_loss": -44.899627685546875, "global_step": 361562, "epoch": 2988} {"train_loss": -44.90468978881836, "global_step": 361563, "epoch": 2988} {"train_loss": -45.18519592285156, "global_step": 361564, "epoch": 2988} {"train_loss": -45.580265045166016, "global_step": 361565, "epoch": 2988} {"train_loss": -44.960304260253906, "global_step": 361566, "epoch": 2988} {"train_loss": -44.679443359375, "global_step": 361567, "epoch": 2988} {"train_loss": -45.25347900390625, "global_step": 361568, "epoch": 2988} {"train_loss": -45.28132247924805, "global_step": 361569, "epoch": 2988} {"train_loss": -45.91567611694336, "global_step": 361570, "epoch": 2988} {"train_loss": -44.9702262878418, "global_step": 361571, "epoch": 2988} {"train_loss": -44.94995880126953, "global_step": 361572, "epoch": 2988} {"train_loss": -45.30439376831055, "global_step": 361573, "epoch": 2988} {"train_loss": -44.815853118896484, "global_step": 361574, "epoch": 2988} {"train_loss": -44.79380416870117, "global_step": 361575, "epoch": 2988} {"train_loss": -45.217811584472656, "global_step": 361576, "epoch": 2988} {"train_loss": -44.975250244140625, "global_step": 361577, "epoch": 2988} {"train_loss": -45.57625961303711, "global_step": 361578, "epoch": 2988} {"train_loss": -45.535858154296875, "global_step": 361579, "epoch": 2988} {"train_loss": -44.984375, "global_step": 361580, "epoch": 2988} {"train_loss": -45.252986907958984, "global_step": 361581, "epoch": 2988} {"train_loss": -45.85991287231445, "global_step": 361582, "epoch": 2988} {"train_loss": -44.861968994140625, "global_step": 361583, "epoch": 2988} {"train_loss": -44.25175857543945, "global_step": 361584, "epoch": 2988} {"train_loss": -44.941749572753906, "global_step": 361585, "epoch": 2988} {"train_loss": -44.4290657043457, "global_step": 361586, "epoch": 2988} {"train_loss": -43.55224609375, "global_step": 361587, "epoch": 2988} {"train_loss": -45.271461486816406, "global_step": 361588, "epoch": 2988} {"train_loss": -45.860477447509766, "global_step": 361589, "epoch": 2988} {"train_loss": -43.905879974365234, "global_step": 361590, "epoch": 2988} {"train_loss": -42.676082611083984, "global_step": 361591, "epoch": 2988} {"train_loss": -45.740699768066406, "global_step": 361592, "epoch": 2988} {"train_loss": -44.845096588134766, "global_step": 361593, "epoch": 2988} {"train_loss": -43.20222854614258, "global_step": 361594, "epoch": 2988} {"train_loss": -45.33951950073242, "global_step": 361595, "epoch": 2988} {"train_loss": -44.69621276855469, "global_step": 361596, "epoch": 2988} {"train_loss": -44.86076736450195, "global_step": 361597, "epoch": 2988} {"train_loss": -45.09319305419922, "global_step": 361598, "epoch": 2988} {"train_loss": -45.38685607910156, "global_step": 361599, "epoch": 2988} {"train_loss": -44.503173828125, "global_step": 361600, "epoch": 2988} {"train_loss": -42.74959182739258, "global_step": 361601, "epoch": 2988} {"train_loss": -45.13474655151367, "global_step": 361602, "epoch": 2988} {"train_loss": -45.09492492675781, "global_step": 361603, "epoch": 2988} {"train_loss": -44.944515228271484, "global_step": 361604, "epoch": 2988} {"train_loss": -43.42647933959961, "global_step": 361605, "epoch": 2988} {"train_loss": -45.59181594848633, "global_step": 361606, "epoch": 2988} {"train_loss": -45.24466323852539, "global_step": 361607, "epoch": 2988} {"train_loss": -45.379005432128906, "global_step": 361608, "epoch": 2988} {"train_loss": -45.653079986572266, "global_step": 361609, "epoch": 2988} {"train_loss": -45.25856399536133, "global_step": 361610, "epoch": 2988} {"train_loss": -45.4788818359375, "global_step": 361611, "epoch": 2988} {"train_loss": -45.50678253173828, "global_step": 361612, "epoch": 2988} {"train_loss": -45.525001525878906, "global_step": 361613, "epoch": 2988} {"train_loss": -44.491207122802734, "global_step": 361614, "epoch": 2988} {"train_loss": -45.89929962158203, "global_step": 361615, "epoch": 2988} {"train_loss": -45.712589263916016, "global_step": 361616, "epoch": 2988} {"train_loss": -44.672035217285156, "global_step": 361617, "epoch": 2988} {"train_loss": -46.09649658203125, "global_step": 361618, "epoch": 2988} {"train_loss": -45.613521575927734, "global_step": 361619, "epoch": 2988} {"train_loss": -45.22522735595703, "global_step": 361620, "epoch": 2988} {"train_loss": -46.18142318725586, "global_step": 361621, "epoch": 2988} {"train_loss": -45.45127487182617, "global_step": 361622, "epoch": 2988} {"train_loss": -45.6378173828125, "global_step": 361623, "epoch": 2988} {"train_loss": -45.78615951538086, "global_step": 361624, "epoch": 2988} {"train_loss": -45.38935852050781, "global_step": 361625, "epoch": 2988} {"train_loss": -44.398738861083984, "global_step": 361626, "epoch": 2988} {"train_loss": -45.8123893737793, "global_step": 361627, "epoch": 2988} {"train_loss": -44.429473876953125, "global_step": 361628, "epoch": 2988} {"train_loss": -44.15554428100586, "global_step": 361629, "epoch": 2988} {"train_loss": -45.25812911987305, "global_step": 361630, "epoch": 2988} {"train_loss": -45.15950393676758, "global_step": 361631, "epoch": 2988} {"train_loss": -44.24045944213867, "global_step": 361632, "epoch": 2988} {"train_loss": -45.329898834228516, "global_step": 361633, "epoch": 2988} {"train_loss": -44.872676849365234, "global_step": 361634, "epoch": 2988} {"train_loss": -44.972900390625, "global_step": 361635, "epoch": 2988} {"train_loss": -44.87807846069336, "global_step": 361636, "epoch": 2988} {"train_loss": -44.74700164794922, "global_step": 361637, "epoch": 2988} {"train_loss": -46.02252197265625, "global_step": 361638, "epoch": 2988} {"train_loss": -44.53892135620117, "global_step": 361639, "epoch": 2988} {"train_loss": -44.228309631347656, "global_step": 361640, "epoch": 2988} {"train_loss": -44.83677291870117, "global_step": 361641, "epoch": 2988} {"train_loss": -45.196773529052734, "global_step": 361642, "epoch": 2988} {"train_loss": -45.7722053527832, "global_step": 361643, "epoch": 2988} {"train_loss": -44.709041595458984, "global_step": 361644, "epoch": 2988} {"train_loss": -43.799964904785156, "global_step": 361645, "epoch": 2988} {"train_loss": -45.386348724365234, "global_step": 361646, "epoch": 2988} {"train_loss": -44.34232711791992, "global_step": 361647, "epoch": 2988} {"train_loss": -44.63186264038086, "global_step": 361648, "epoch": 2988} {"train_loss": -44.43687438964844, "global_step": 361649, "epoch": 2988} {"train_loss": -44.745201110839844, "global_step": 361650, "epoch": 2988} {"train_loss": -45.45170211791992, "global_step": 361651, "epoch": 2988} {"train_loss": -45.229801177978516, "global_step": 361652, "epoch": 2988} {"train_loss": -44.75629806518555, "global_step": 361653, "epoch": 2988} {"train_loss": -44.69134521484375, "global_step": 361654, "epoch": 2988} {"train_loss": -45.640560150146484, "global_step": 361655, "epoch": 2988} {"train_loss": -44.994171142578125, "global_step": 361656, "epoch": 2988} {"train_loss": -44.43595504760742, "global_step": 361657, "epoch": 2988} {"train_loss": -43.27271270751953, "global_step": 361658, "epoch": 2988} {"train_loss": -44.481658935546875, "global_step": 361659, "epoch": 2988} {"train_loss": -44.731929779052734, "global_step": 361660, "epoch": 2988} {"train_loss": -42.76887893676758, "global_step": 361661, "epoch": 2988} {"train_loss": -41.024261474609375, "global_step": 361662, "epoch": 2988} {"train_loss": -44.54537582397461, "global_step": 361663, "epoch": 2988} {"train_loss": -38.939544677734375, "global_step": 361664, "epoch": 2988} {"train_loss": -44.65908432006836, "global_step": 361665, "epoch": 2988} {"train_loss": -37.87287902832031, "global_step": 361666, "epoch": 2988} {"train_loss": -43.27793502807617, "global_step": 361667, "epoch": 2988} {"train_loss": -44.667184971580824, "global_step": 361668, "epoch": 2988, "val_loss": 2613290.0} {"train_loss": -38.18268966674805, "global_step": 361669, "epoch": 2989} {"train_loss": -40.001434326171875, "global_step": 361670, "epoch": 2989} {"train_loss": -38.12013244628906, "global_step": 361671, "epoch": 2989} {"train_loss": -38.6766242980957, "global_step": 361672, "epoch": 2989} {"train_loss": -40.01231002807617, "global_step": 361673, "epoch": 2989} {"train_loss": -39.43059158325195, "global_step": 361674, "epoch": 2989} {"train_loss": -38.842796325683594, "global_step": 361675, "epoch": 2989} {"train_loss": -42.31870651245117, "global_step": 361676, "epoch": 2989} {"train_loss": -38.9359016418457, "global_step": 361677, "epoch": 2989} {"train_loss": -41.44374084472656, "global_step": 361678, "epoch": 2989} {"train_loss": -39.401485443115234, "global_step": 361679, "epoch": 2989} {"train_loss": -39.152008056640625, "global_step": 361680, "epoch": 2989} {"train_loss": -40.304927825927734, "global_step": 361681, "epoch": 2989} {"train_loss": -39.21928787231445, "global_step": 361682, "epoch": 2989} {"train_loss": -40.73920822143555, "global_step": 361683, "epoch": 2989} {"train_loss": -41.8742790222168, "global_step": 361684, "epoch": 2989} {"train_loss": -41.31172561645508, "global_step": 361685, "epoch": 2989} {"train_loss": -42.08573532104492, "global_step": 361686, "epoch": 2989} {"train_loss": -41.294830322265625, "global_step": 361687, "epoch": 2989} {"train_loss": -43.449947357177734, "global_step": 361688, "epoch": 2989} {"train_loss": -41.09980392456055, "global_step": 361689, "epoch": 2989} {"train_loss": -43.13407516479492, "global_step": 361690, "epoch": 2989} {"train_loss": -42.21256637573242, "global_step": 361691, "epoch": 2989} {"train_loss": -42.95138168334961, "global_step": 361692, "epoch": 2989} {"train_loss": -43.175289154052734, "global_step": 361693, "epoch": 2989} {"train_loss": -42.80141067504883, "global_step": 361694, "epoch": 2989} {"train_loss": -44.45169448852539, "global_step": 361695, "epoch": 2989} {"train_loss": -43.10419845581055, "global_step": 361696, "epoch": 2989} {"train_loss": -43.29801559448242, "global_step": 361697, "epoch": 2989} {"train_loss": -43.61610412597656, "global_step": 361698, "epoch": 2989} {"train_loss": -43.996910095214844, "global_step": 361699, "epoch": 2989} {"train_loss": -44.43470764160156, "global_step": 361700, "epoch": 2989} {"train_loss": -44.360084533691406, "global_step": 361701, "epoch": 2989} {"train_loss": -43.79445266723633, "global_step": 361702, "epoch": 2989} {"train_loss": -44.85198974609375, "global_step": 361703, "epoch": 2989} {"train_loss": -43.931270599365234, "global_step": 361704, "epoch": 2989} {"train_loss": -44.9610481262207, "global_step": 361705, "epoch": 2989} {"train_loss": -44.36009216308594, "global_step": 361706, "epoch": 2989} {"train_loss": -44.274375915527344, "global_step": 361707, "epoch": 2989} {"train_loss": -44.78211975097656, "global_step": 361708, "epoch": 2989} {"train_loss": -44.65239334106445, "global_step": 361709, "epoch": 2989} {"train_loss": -44.74454879760742, "global_step": 361710, "epoch": 2989} {"train_loss": -44.72735595703125, "global_step": 361711, "epoch": 2989} {"train_loss": -44.72762680053711, "global_step": 361712, "epoch": 2989} {"train_loss": -44.98297882080078, "global_step": 361713, "epoch": 2989} {"train_loss": -44.520870208740234, "global_step": 361714, "epoch": 2989} {"train_loss": -44.634979248046875, "global_step": 361715, "epoch": 2989} {"train_loss": -44.656497955322266, "global_step": 361716, "epoch": 2989} {"train_loss": -44.749366760253906, "global_step": 361717, "epoch": 2989} {"train_loss": -44.69193649291992, "global_step": 361718, "epoch": 2989} {"train_loss": -45.00474166870117, "global_step": 361719, "epoch": 2989} {"train_loss": -45.25503158569336, "global_step": 361720, "epoch": 2989} {"train_loss": -45.21892547607422, "global_step": 361721, "epoch": 2989} {"train_loss": -45.21307373046875, "global_step": 361722, "epoch": 2989} {"train_loss": -45.25562286376953, "global_step": 361723, "epoch": 2989} {"train_loss": -45.049224853515625, "global_step": 361724, "epoch": 2989} {"train_loss": -45.22243881225586, "global_step": 361725, "epoch": 2989} {"train_loss": -45.23043441772461, "global_step": 361726, "epoch": 2989} {"train_loss": -44.929378509521484, "global_step": 361727, "epoch": 2989} {"train_loss": -45.34968948364258, "global_step": 361728, "epoch": 2989} {"train_loss": -45.368202209472656, "global_step": 361729, "epoch": 2989} {"train_loss": -43.80453109741211, "global_step": 361730, "epoch": 2989} {"train_loss": -45.7531852722168, "global_step": 361731, "epoch": 2989} {"train_loss": -44.07509994506836, "global_step": 361732, "epoch": 2989} {"train_loss": -44.70664596557617, "global_step": 361733, "epoch": 2989} {"train_loss": -45.41190719604492, "global_step": 361734, "epoch": 2989} {"train_loss": -44.20454025268555, "global_step": 361735, "epoch": 2989} {"train_loss": -45.58277893066406, "global_step": 361736, "epoch": 2989} {"train_loss": -44.41351318359375, "global_step": 361737, "epoch": 2989} {"train_loss": -43.994606018066406, "global_step": 361738, "epoch": 2989} {"train_loss": -45.750606536865234, "global_step": 361739, "epoch": 2989} {"train_loss": -45.15735626220703, "global_step": 361740, "epoch": 2989} {"train_loss": -44.198516845703125, "global_step": 361741, "epoch": 2989} {"train_loss": -45.817813873291016, "global_step": 361742, "epoch": 2989} {"train_loss": -44.149391174316406, "global_step": 361743, "epoch": 2989} {"train_loss": -44.9886360168457, "global_step": 361744, "epoch": 2989} {"train_loss": -45.036617279052734, "global_step": 361745, "epoch": 2989} {"train_loss": -44.07875442504883, "global_step": 361746, "epoch": 2989} {"train_loss": -44.56246566772461, "global_step": 361747, "epoch": 2989} {"train_loss": -45.54839324951172, "global_step": 361748, "epoch": 2989} {"train_loss": -43.79815673828125, "global_step": 361749, "epoch": 2989} {"train_loss": -45.46236038208008, "global_step": 361750, "epoch": 2989} {"train_loss": -45.25117874145508, "global_step": 361751, "epoch": 2989} {"train_loss": -44.68893051147461, "global_step": 361752, "epoch": 2989} {"train_loss": -45.005760192871094, "global_step": 361753, "epoch": 2989} {"train_loss": -45.328125, "global_step": 361754, "epoch": 2989} {"train_loss": -44.989654541015625, "global_step": 361755, "epoch": 2989} {"train_loss": -45.61078643798828, "global_step": 361756, "epoch": 2989} {"train_loss": -45.300994873046875, "global_step": 361757, "epoch": 2989} {"train_loss": -45.63738250732422, "global_step": 361758, "epoch": 2989} {"train_loss": -45.453609466552734, "global_step": 361759, "epoch": 2989} {"train_loss": -45.542572021484375, "global_step": 361760, "epoch": 2989} {"train_loss": -45.27564239501953, "global_step": 361761, "epoch": 2989} {"train_loss": -45.44036102294922, "global_step": 361762, "epoch": 2989} {"train_loss": -45.8158073425293, "global_step": 361763, "epoch": 2989} {"train_loss": -45.09758377075195, "global_step": 361764, "epoch": 2989} {"train_loss": -44.87766647338867, "global_step": 361765, "epoch": 2989} {"train_loss": -45.72315216064453, "global_step": 361766, "epoch": 2989} {"train_loss": -44.98088455200195, "global_step": 361767, "epoch": 2989} {"train_loss": -45.333309173583984, "global_step": 361768, "epoch": 2989} {"train_loss": -45.300140380859375, "global_step": 361769, "epoch": 2989} {"train_loss": -42.299537658691406, "global_step": 361770, "epoch": 2989} {"train_loss": -40.30588912963867, "global_step": 361771, "epoch": 2989} {"train_loss": -44.62382125854492, "global_step": 361772, "epoch": 2989} {"train_loss": -44.374080657958984, "global_step": 361773, "epoch": 2989} {"train_loss": -42.72687911987305, "global_step": 361774, "epoch": 2989} {"train_loss": -41.89579391479492, "global_step": 361775, "epoch": 2989} {"train_loss": -44.11882400512695, "global_step": 361776, "epoch": 2989} {"train_loss": -39.97504806518555, "global_step": 361777, "epoch": 2989} {"train_loss": -43.8791389465332, "global_step": 361778, "epoch": 2989} {"train_loss": -37.63380813598633, "global_step": 361779, "epoch": 2989} {"train_loss": -39.79810333251953, "global_step": 361780, "epoch": 2989} {"train_loss": -42.01571273803711, "global_step": 361781, "epoch": 2989} {"train_loss": -43.653968811035156, "global_step": 361782, "epoch": 2989} {"train_loss": -42.63045120239258, "global_step": 361783, "epoch": 2989} {"train_loss": -43.99660873413086, "global_step": 361784, "epoch": 2989} {"train_loss": -41.81772232055664, "global_step": 361785, "epoch": 2989} {"train_loss": -43.963043212890625, "global_step": 361786, "epoch": 2989} {"train_loss": -43.51446533203125, "global_step": 361787, "epoch": 2989} {"train_loss": -44.06128692626953, "global_step": 361788, "epoch": 2989} {"train_loss": -43.592209871150246, "global_step": 361789, "epoch": 2989, "val_loss": 2546108.75} {"train_loss": -41.62323760986328, "global_step": 361790, "epoch": 2990} {"train_loss": -43.410804748535156, "global_step": 361791, "epoch": 2990} {"train_loss": -41.75361251831055, "global_step": 361792, "epoch": 2990} {"train_loss": -44.83201217651367, "global_step": 361793, "epoch": 2990} {"train_loss": -42.081233978271484, "global_step": 361794, "epoch": 2990} {"train_loss": -44.821449279785156, "global_step": 361795, "epoch": 2990} {"train_loss": -42.97048568725586, "global_step": 361796, "epoch": 2990} {"train_loss": -44.6507568359375, "global_step": 361797, "epoch": 2990} {"train_loss": -44.56907653808594, "global_step": 361798, "epoch": 2990} {"train_loss": -44.300594329833984, "global_step": 361799, "epoch": 2990} {"train_loss": -44.4559440612793, "global_step": 361800, "epoch": 2990} {"train_loss": -44.2963981628418, "global_step": 361801, "epoch": 2990} {"train_loss": -45.05744552612305, "global_step": 361802, "epoch": 2990} {"train_loss": -44.10361862182617, "global_step": 361803, "epoch": 2990} {"train_loss": -44.8656120300293, "global_step": 361804, "epoch": 2990} {"train_loss": -44.583656311035156, "global_step": 361805, "epoch": 2990} {"train_loss": -44.030391693115234, "global_step": 361806, "epoch": 2990} {"train_loss": -45.003143310546875, "global_step": 361807, "epoch": 2990} {"train_loss": -44.31089782714844, "global_step": 361808, "epoch": 2990} {"train_loss": -43.51796340942383, "global_step": 361809, "epoch": 2990} {"train_loss": -45.365840911865234, "global_step": 361810, "epoch": 2990} {"train_loss": -44.354942321777344, "global_step": 361811, "epoch": 2990} {"train_loss": -44.605262756347656, "global_step": 361812, "epoch": 2990} {"train_loss": -44.93424606323242, "global_step": 361813, "epoch": 2990} {"train_loss": -44.50032424926758, "global_step": 361814, "epoch": 2990} {"train_loss": -44.85519027709961, "global_step": 361815, "epoch": 2990} {"train_loss": -44.32763671875, "global_step": 361816, "epoch": 2990} {"train_loss": -44.52189254760742, "global_step": 361817, "epoch": 2990} {"train_loss": -44.60531234741211, "global_step": 361818, "epoch": 2990} {"train_loss": -44.725929260253906, "global_step": 361819, "epoch": 2990} {"train_loss": -45.14077377319336, "global_step": 361820, "epoch": 2990} {"train_loss": -45.227542877197266, "global_step": 361821, "epoch": 2990} {"train_loss": -45.051517486572266, "global_step": 361822, "epoch": 2990} {"train_loss": -45.27460861206055, "global_step": 361823, "epoch": 2990} {"train_loss": -43.865779876708984, "global_step": 361824, "epoch": 2990} {"train_loss": -45.152679443359375, "global_step": 361825, "epoch": 2990} {"train_loss": -44.937923431396484, "global_step": 361826, "epoch": 2990} {"train_loss": -44.713436126708984, "global_step": 361827, "epoch": 2990} {"train_loss": -44.67108154296875, "global_step": 361828, "epoch": 2990} {"train_loss": -45.43379592895508, "global_step": 361829, "epoch": 2990} {"train_loss": -45.00003433227539, "global_step": 361830, "epoch": 2990} {"train_loss": -45.54799270629883, "global_step": 361831, "epoch": 2990} {"train_loss": -44.845245361328125, "global_step": 361832, "epoch": 2990} {"train_loss": -45.54273223876953, "global_step": 361833, "epoch": 2990} {"train_loss": -45.49685287475586, "global_step": 361834, "epoch": 2990} {"train_loss": -45.59394454956055, "global_step": 361835, "epoch": 2990} {"train_loss": -45.40082550048828, "global_step": 361836, "epoch": 2990} {"train_loss": -45.114601135253906, "global_step": 361837, "epoch": 2990} {"train_loss": -45.517189025878906, "global_step": 361838, "epoch": 2990} {"train_loss": -44.96548843383789, "global_step": 361839, "epoch": 2990} {"train_loss": -45.828983306884766, "global_step": 361840, "epoch": 2990} {"train_loss": -45.17926788330078, "global_step": 361841, "epoch": 2990} {"train_loss": -45.77899932861328, "global_step": 361842, "epoch": 2990} {"train_loss": -45.182430267333984, "global_step": 361843, "epoch": 2990} {"train_loss": -45.391483306884766, "global_step": 361844, "epoch": 2990} {"train_loss": -44.74431610107422, "global_step": 361845, "epoch": 2990} {"train_loss": -42.842098236083984, "global_step": 361846, "epoch": 2990} {"train_loss": -45.63775634765625, "global_step": 361847, "epoch": 2990} {"train_loss": -45.51527786254883, "global_step": 361848, "epoch": 2990} {"train_loss": -44.449893951416016, "global_step": 361849, "epoch": 2990} {"train_loss": -44.319889068603516, "global_step": 361850, "epoch": 2990} {"train_loss": -44.732276916503906, "global_step": 361851, "epoch": 2990} {"train_loss": -45.853145599365234, "global_step": 361852, "epoch": 2990} {"train_loss": -43.48072052001953, "global_step": 361853, "epoch": 2990} {"train_loss": -41.64545440673828, "global_step": 361854, "epoch": 2990} {"train_loss": -43.30848693847656, "global_step": 361855, "epoch": 2990} {"train_loss": -45.351341247558594, "global_step": 361856, "epoch": 2990} {"train_loss": -43.46218490600586, "global_step": 361857, "epoch": 2990} {"train_loss": -42.37358474731445, "global_step": 361858, "epoch": 2990} {"train_loss": -44.78034210205078, "global_step": 361859, "epoch": 2990} {"train_loss": -44.40571975708008, "global_step": 361860, "epoch": 2990} {"train_loss": -43.697242736816406, "global_step": 361861, "epoch": 2990} {"train_loss": -45.19111251831055, "global_step": 361862, "epoch": 2990} {"train_loss": -44.3514404296875, "global_step": 361863, "epoch": 2990} {"train_loss": -43.2753791809082, "global_step": 361864, "epoch": 2990} {"train_loss": -43.504207611083984, "global_step": 361865, "epoch": 2990} {"train_loss": -45.29664993286133, "global_step": 361866, "epoch": 2990} {"train_loss": -43.86627197265625, "global_step": 361867, "epoch": 2990} {"train_loss": -43.45894241333008, "global_step": 361868, "epoch": 2990} {"train_loss": -45.3239631652832, "global_step": 361869, "epoch": 2990} {"train_loss": -43.88119125366211, "global_step": 361870, "epoch": 2990} {"train_loss": -45.018836975097656, "global_step": 361871, "epoch": 2990} {"train_loss": -45.09560775756836, "global_step": 361872, "epoch": 2990} {"train_loss": -42.63017272949219, "global_step": 361873, "epoch": 2990} {"train_loss": -43.36934280395508, "global_step": 361874, "epoch": 2990} {"train_loss": -45.909053802490234, "global_step": 361875, "epoch": 2990} {"train_loss": -42.9351921081543, "global_step": 361876, "epoch": 2990} {"train_loss": -43.71366882324219, "global_step": 361877, "epoch": 2990} {"train_loss": -44.29799270629883, "global_step": 361878, "epoch": 2990} {"train_loss": -45.196319580078125, "global_step": 361879, "epoch": 2990} {"train_loss": -44.905887603759766, "global_step": 361880, "epoch": 2990} {"train_loss": -45.0103759765625, "global_step": 361881, "epoch": 2990} {"train_loss": -45.61686325073242, "global_step": 361882, "epoch": 2990} {"train_loss": -45.37592315673828, "global_step": 361883, "epoch": 2990} {"train_loss": -44.866451263427734, "global_step": 361884, "epoch": 2990} {"train_loss": -44.77372360229492, "global_step": 361885, "epoch": 2990} {"train_loss": -45.25269317626953, "global_step": 361886, "epoch": 2990} {"train_loss": -45.013187408447266, "global_step": 361887, "epoch": 2990} {"train_loss": -44.6619987487793, "global_step": 361888, "epoch": 2990} {"train_loss": -44.74040603637695, "global_step": 361889, "epoch": 2990} {"train_loss": -44.39984893798828, "global_step": 361890, "epoch": 2990} {"train_loss": -45.01096725463867, "global_step": 361891, "epoch": 2990} {"train_loss": -43.83725357055664, "global_step": 361892, "epoch": 2990} {"train_loss": -44.9580192565918, "global_step": 361893, "epoch": 2990} {"train_loss": -45.21352005004883, "global_step": 361894, "epoch": 2990} {"train_loss": -44.78850555419922, "global_step": 361895, "epoch": 2990} {"train_loss": -45.00715637207031, "global_step": 361896, "epoch": 2990} {"train_loss": -45.239810943603516, "global_step": 361897, "epoch": 2990} {"train_loss": -43.89793014526367, "global_step": 361898, "epoch": 2990} {"train_loss": -44.191017150878906, "global_step": 361899, "epoch": 2990} {"train_loss": -45.15073776245117, "global_step": 361900, "epoch": 2990} {"train_loss": -44.38418197631836, "global_step": 361901, "epoch": 2990} {"train_loss": -44.400081634521484, "global_step": 361902, "epoch": 2990} {"train_loss": -45.52681350708008, "global_step": 361903, "epoch": 2990} {"train_loss": -44.568721771240234, "global_step": 361904, "epoch": 2990} {"train_loss": -45.1676139831543, "global_step": 361905, "epoch": 2990} {"train_loss": -45.0937614440918, "global_step": 361906, "epoch": 2990} {"train_loss": -45.38241195678711, "global_step": 361907, "epoch": 2990} {"train_loss": -45.18749237060547, "global_step": 361908, "epoch": 2990} {"train_loss": -44.08513641357422, "global_step": 361909, "epoch": 2990} {"train_loss": -44.57884723884015, "global_step": 361910, "epoch": 2990, "val_loss": 2571910.0} {"train_loss": -44.95885467529297, "global_step": 361911, "epoch": 2991} {"train_loss": -44.90987014770508, "global_step": 361912, "epoch": 2991} {"train_loss": -45.4073600769043, "global_step": 361913, "epoch": 2991} {"train_loss": -44.82931137084961, "global_step": 361914, "epoch": 2991} {"train_loss": -45.08781051635742, "global_step": 361915, "epoch": 2991} {"train_loss": -45.396644592285156, "global_step": 361916, "epoch": 2991} {"train_loss": -44.29334259033203, "global_step": 361917, "epoch": 2991} {"train_loss": -45.270198822021484, "global_step": 361918, "epoch": 2991} {"train_loss": -45.58374786376953, "global_step": 361919, "epoch": 2991} {"train_loss": -45.15996551513672, "global_step": 361920, "epoch": 2991} {"train_loss": -45.2796745300293, "global_step": 361921, "epoch": 2991} {"train_loss": -45.0272216796875, "global_step": 361922, "epoch": 2991} {"train_loss": -45.628753662109375, "global_step": 361923, "epoch": 2991} {"train_loss": -45.07760238647461, "global_step": 361924, "epoch": 2991} {"train_loss": -45.254573822021484, "global_step": 361925, "epoch": 2991} {"train_loss": -45.593727111816406, "global_step": 361926, "epoch": 2991} {"train_loss": -44.745784759521484, "global_step": 361927, "epoch": 2991} {"train_loss": -45.13548278808594, "global_step": 361928, "epoch": 2991} {"train_loss": -44.97330093383789, "global_step": 361929, "epoch": 2991} {"train_loss": -45.84873962402344, "global_step": 361930, "epoch": 2991} {"train_loss": -45.80170440673828, "global_step": 361931, "epoch": 2991} {"train_loss": -45.730682373046875, "global_step": 361932, "epoch": 2991} {"train_loss": -45.290260314941406, "global_step": 361933, "epoch": 2991} {"train_loss": -44.910457611083984, "global_step": 361934, "epoch": 2991} {"train_loss": -45.5098876953125, "global_step": 361935, "epoch": 2991} {"train_loss": -45.605865478515625, "global_step": 361936, "epoch": 2991} {"train_loss": -45.374568939208984, "global_step": 361937, "epoch": 2991} {"train_loss": -46.23191452026367, "global_step": 361938, "epoch": 2991} {"train_loss": -45.2636833190918, "global_step": 361939, "epoch": 2991} {"train_loss": -44.75564193725586, "global_step": 361940, "epoch": 2991} {"train_loss": -45.3412971496582, "global_step": 361941, "epoch": 2991} {"train_loss": -45.66933822631836, "global_step": 361942, "epoch": 2991} {"train_loss": -44.85305404663086, "global_step": 361943, "epoch": 2991} {"train_loss": -45.3704948425293, "global_step": 361944, "epoch": 2991} {"train_loss": -46.02479934692383, "global_step": 361945, "epoch": 2991} {"train_loss": -45.28408432006836, "global_step": 361946, "epoch": 2991} {"train_loss": -45.50775909423828, "global_step": 361947, "epoch": 2991} {"train_loss": -46.047576904296875, "global_step": 361948, "epoch": 2991} {"train_loss": -45.387786865234375, "global_step": 361949, "epoch": 2991} {"train_loss": -46.19768142700195, "global_step": 361950, "epoch": 2991} {"train_loss": -45.119564056396484, "global_step": 361951, "epoch": 2991} {"train_loss": -45.804481506347656, "global_step": 361952, "epoch": 2991} {"train_loss": -46.0087776184082, "global_step": 361953, "epoch": 2991} {"train_loss": -44.71547317504883, "global_step": 361954, "epoch": 2991} {"train_loss": -45.62189865112305, "global_step": 361955, "epoch": 2991} {"train_loss": -46.22151565551758, "global_step": 361956, "epoch": 2991} {"train_loss": -45.243621826171875, "global_step": 361957, "epoch": 2991} {"train_loss": -44.70839309692383, "global_step": 361958, "epoch": 2991} {"train_loss": -45.54976272583008, "global_step": 361959, "epoch": 2991} {"train_loss": -46.06414794921875, "global_step": 361960, "epoch": 2991} {"train_loss": -44.71669387817383, "global_step": 361961, "epoch": 2991} {"train_loss": -44.17045211791992, "global_step": 361962, "epoch": 2991} {"train_loss": -46.195030212402344, "global_step": 361963, "epoch": 2991} {"train_loss": -43.89792251586914, "global_step": 361964, "epoch": 2991} {"train_loss": -42.952877044677734, "global_step": 361965, "epoch": 2991} {"train_loss": -45.53611373901367, "global_step": 361966, "epoch": 2991} {"train_loss": -44.851776123046875, "global_step": 361967, "epoch": 2991} {"train_loss": -44.47651672363281, "global_step": 361968, "epoch": 2991} {"train_loss": -44.14469528198242, "global_step": 361969, "epoch": 2991} {"train_loss": -45.25130081176758, "global_step": 361970, "epoch": 2991} {"train_loss": -43.50232696533203, "global_step": 361971, "epoch": 2991} {"train_loss": -44.226348876953125, "global_step": 361972, "epoch": 2991} {"train_loss": -45.01572799682617, "global_step": 361973, "epoch": 2991} {"train_loss": -43.38926696777344, "global_step": 361974, "epoch": 2991} {"train_loss": -43.79917526245117, "global_step": 361975, "epoch": 2991} {"train_loss": -45.03376388549805, "global_step": 361976, "epoch": 2991} {"train_loss": -44.80043029785156, "global_step": 361977, "epoch": 2991} {"train_loss": -44.400474548339844, "global_step": 361978, "epoch": 2991} {"train_loss": -44.5225944519043, "global_step": 361979, "epoch": 2991} {"train_loss": -44.31338119506836, "global_step": 361980, "epoch": 2991} {"train_loss": -43.05536651611328, "global_step": 361981, "epoch": 2991} {"train_loss": -42.50023651123047, "global_step": 361982, "epoch": 2991} {"train_loss": -43.74040985107422, "global_step": 361983, "epoch": 2991} {"train_loss": -43.67399215698242, "global_step": 361984, "epoch": 2991} {"train_loss": -42.87531661987305, "global_step": 361985, "epoch": 2991} {"train_loss": -43.625633239746094, "global_step": 361986, "epoch": 2991} {"train_loss": -44.309913635253906, "global_step": 361987, "epoch": 2991} {"train_loss": -43.91659164428711, "global_step": 361988, "epoch": 2991} {"train_loss": -44.0747184753418, "global_step": 361989, "epoch": 2991} {"train_loss": -42.826759338378906, "global_step": 361990, "epoch": 2991} {"train_loss": -43.46681213378906, "global_step": 361991, "epoch": 2991} {"train_loss": -43.584449768066406, "global_step": 361992, "epoch": 2991} {"train_loss": -43.3138427734375, "global_step": 361993, "epoch": 2991} {"train_loss": -44.04084396362305, "global_step": 361994, "epoch": 2991} {"train_loss": -44.5282096862793, "global_step": 361995, "epoch": 2991} {"train_loss": -44.777069091796875, "global_step": 361996, "epoch": 2991} {"train_loss": -44.14455795288086, "global_step": 361997, "epoch": 2991} {"train_loss": -43.954750061035156, "global_step": 361998, "epoch": 2991} {"train_loss": -43.58528518676758, "global_step": 361999, "epoch": 2991} {"train_loss": -44.0702018737793, "global_step": 362000, "epoch": 2991} {"train_loss": -43.43368148803711, "global_step": 362001, "epoch": 2991} {"train_loss": -43.699642181396484, "global_step": 362002, "epoch": 2991} {"train_loss": -44.084346771240234, "global_step": 362003, "epoch": 2991} {"train_loss": -43.41898727416992, "global_step": 362004, "epoch": 2991} {"train_loss": -43.91305160522461, "global_step": 362005, "epoch": 2991} {"train_loss": -44.0413932800293, "global_step": 362006, "epoch": 2991} {"train_loss": -44.278987884521484, "global_step": 362007, "epoch": 2991} {"train_loss": -43.97404098510742, "global_step": 362008, "epoch": 2991} {"train_loss": -44.761680603027344, "global_step": 362009, "epoch": 2991} {"train_loss": -44.43251037597656, "global_step": 362010, "epoch": 2991} {"train_loss": -44.550453186035156, "global_step": 362011, "epoch": 2991} {"train_loss": -43.95807647705078, "global_step": 362012, "epoch": 2991} {"train_loss": -45.215694427490234, "global_step": 362013, "epoch": 2991} {"train_loss": -44.691890716552734, "global_step": 362014, "epoch": 2991} {"train_loss": -44.8845329284668, "global_step": 362015, "epoch": 2991} {"train_loss": -43.960994720458984, "global_step": 362016, "epoch": 2991} {"train_loss": -45.09636306762695, "global_step": 362017, "epoch": 2991} {"train_loss": -44.688297271728516, "global_step": 362018, "epoch": 2991} {"train_loss": -44.916175842285156, "global_step": 362019, "epoch": 2991} {"train_loss": -45.13943862915039, "global_step": 362020, "epoch": 2991} {"train_loss": -44.661312103271484, "global_step": 362021, "epoch": 2991} {"train_loss": -45.225242614746094, "global_step": 362022, "epoch": 2991} {"train_loss": -44.876399993896484, "global_step": 362023, "epoch": 2991} {"train_loss": -45.051509857177734, "global_step": 362024, "epoch": 2991} {"train_loss": -45.26780319213867, "global_step": 362025, "epoch": 2991} {"train_loss": -44.46096420288086, "global_step": 362026, "epoch": 2991} {"train_loss": -45.383846282958984, "global_step": 362027, "epoch": 2991} {"train_loss": -44.77579879760742, "global_step": 362028, "epoch": 2991} {"train_loss": -43.71376037597656, "global_step": 362029, "epoch": 2991} {"train_loss": -45.381492614746094, "global_step": 362030, "epoch": 2991} {"train_loss": -44.729888317013575, "global_step": 362031, "epoch": 2991, "val_loss": 2557970.75} {"train_loss": -43.17265701293945, "global_step": 362032, "epoch": 2992} {"train_loss": -44.12285614013672, "global_step": 362033, "epoch": 2992} {"train_loss": -43.78237533569336, "global_step": 362034, "epoch": 2992} {"train_loss": -44.55723190307617, "global_step": 362035, "epoch": 2992} {"train_loss": -44.684959411621094, "global_step": 362036, "epoch": 2992} {"train_loss": -44.77675247192383, "global_step": 362037, "epoch": 2992} {"train_loss": -44.65863037109375, "global_step": 362038, "epoch": 2992} {"train_loss": -45.62370300292969, "global_step": 362039, "epoch": 2992} {"train_loss": -44.5539436340332, "global_step": 362040, "epoch": 2992} {"train_loss": -44.517391204833984, "global_step": 362041, "epoch": 2992} {"train_loss": -44.6817741394043, "global_step": 362042, "epoch": 2992} {"train_loss": -44.733821868896484, "global_step": 362043, "epoch": 2992} {"train_loss": -44.538516998291016, "global_step": 362044, "epoch": 2992} {"train_loss": -44.724578857421875, "global_step": 362045, "epoch": 2992} {"train_loss": -44.704681396484375, "global_step": 362046, "epoch": 2992} {"train_loss": -45.11585235595703, "global_step": 362047, "epoch": 2992} {"train_loss": -45.16340637207031, "global_step": 362048, "epoch": 2992} {"train_loss": -45.34635543823242, "global_step": 362049, "epoch": 2992} {"train_loss": -45.421932220458984, "global_step": 362050, "epoch": 2992} {"train_loss": -45.55754852294922, "global_step": 362051, "epoch": 2992} {"train_loss": -44.50208282470703, "global_step": 362052, "epoch": 2992} {"train_loss": -45.936161041259766, "global_step": 362053, "epoch": 2992} {"train_loss": -44.76499557495117, "global_step": 362054, "epoch": 2992} {"train_loss": -45.069671630859375, "global_step": 362055, "epoch": 2992} {"train_loss": -45.79222869873047, "global_step": 362056, "epoch": 2992} {"train_loss": -45.139705657958984, "global_step": 362057, "epoch": 2992} {"train_loss": -45.3365364074707, "global_step": 362058, "epoch": 2992} {"train_loss": -45.73089599609375, "global_step": 362059, "epoch": 2992} {"train_loss": -45.46298599243164, "global_step": 362060, "epoch": 2992} {"train_loss": -45.2936897277832, "global_step": 362061, "epoch": 2992} {"train_loss": -46.02397918701172, "global_step": 362062, "epoch": 2992} {"train_loss": -45.37909698486328, "global_step": 362063, "epoch": 2992} {"train_loss": -45.3160285949707, "global_step": 362064, "epoch": 2992} {"train_loss": -46.18929672241211, "global_step": 362065, "epoch": 2992} {"train_loss": -45.405677795410156, "global_step": 362066, "epoch": 2992} {"train_loss": -45.766334533691406, "global_step": 362067, "epoch": 2992} {"train_loss": -45.18770980834961, "global_step": 362068, "epoch": 2992} {"train_loss": -45.81258010864258, "global_step": 362069, "epoch": 2992} {"train_loss": -44.73198318481445, "global_step": 362070, "epoch": 2992} {"train_loss": -45.7816047668457, "global_step": 362071, "epoch": 2992} {"train_loss": -45.676239013671875, "global_step": 362072, "epoch": 2992} {"train_loss": -43.50590133666992, "global_step": 362073, "epoch": 2992} {"train_loss": -42.78127670288086, "global_step": 362074, "epoch": 2992} {"train_loss": -45.11570739746094, "global_step": 362075, "epoch": 2992} {"train_loss": -45.28857421875, "global_step": 362076, "epoch": 2992} {"train_loss": -42.895782470703125, "global_step": 362077, "epoch": 2992} {"train_loss": -44.54753494262695, "global_step": 362078, "epoch": 2992} {"train_loss": -44.30836868286133, "global_step": 362079, "epoch": 2992} {"train_loss": -44.521575927734375, "global_step": 362080, "epoch": 2992} {"train_loss": -45.02531433105469, "global_step": 362081, "epoch": 2992} {"train_loss": -43.54354476928711, "global_step": 362082, "epoch": 2992} {"train_loss": -42.893157958984375, "global_step": 362083, "epoch": 2992} {"train_loss": -43.782447814941406, "global_step": 362084, "epoch": 2992} {"train_loss": -45.6795654296875, "global_step": 362085, "epoch": 2992} {"train_loss": -44.58498001098633, "global_step": 362086, "epoch": 2992} {"train_loss": -43.42012405395508, "global_step": 362087, "epoch": 2992} {"train_loss": -42.935028076171875, "global_step": 362088, "epoch": 2992} {"train_loss": -43.97664260864258, "global_step": 362089, "epoch": 2992} {"train_loss": -45.46317672729492, "global_step": 362090, "epoch": 2992} {"train_loss": -44.46641540527344, "global_step": 362091, "epoch": 2992} {"train_loss": -44.135353088378906, "global_step": 362092, "epoch": 2992} {"train_loss": -45.33244705200195, "global_step": 362093, "epoch": 2992} {"train_loss": -45.18537902832031, "global_step": 362094, "epoch": 2992} {"train_loss": -44.001461029052734, "global_step": 362095, "epoch": 2992} {"train_loss": -44.8800048828125, "global_step": 362096, "epoch": 2992} {"train_loss": -45.51026153564453, "global_step": 362097, "epoch": 2992} {"train_loss": -44.90682601928711, "global_step": 362098, "epoch": 2992} {"train_loss": -45.95000076293945, "global_step": 362099, "epoch": 2992} {"train_loss": -45.2428092956543, "global_step": 362100, "epoch": 2992} {"train_loss": -45.62788772583008, "global_step": 362101, "epoch": 2992} {"train_loss": -45.223915100097656, "global_step": 362102, "epoch": 2992} {"train_loss": -44.90523910522461, "global_step": 362103, "epoch": 2992} {"train_loss": -45.72200393676758, "global_step": 362104, "epoch": 2992} {"train_loss": -45.877838134765625, "global_step": 362105, "epoch": 2992} {"train_loss": -45.19584274291992, "global_step": 362106, "epoch": 2992} {"train_loss": -45.67876052856445, "global_step": 362107, "epoch": 2992} {"train_loss": -46.01914596557617, "global_step": 362108, "epoch": 2992} {"train_loss": -45.07830810546875, "global_step": 362109, "epoch": 2992} {"train_loss": -45.10411834716797, "global_step": 362110, "epoch": 2992} {"train_loss": -45.327117919921875, "global_step": 362111, "epoch": 2992} {"train_loss": -45.56167221069336, "global_step": 362112, "epoch": 2992} {"train_loss": -44.69610595703125, "global_step": 362113, "epoch": 2992} {"train_loss": -45.576271057128906, "global_step": 362114, "epoch": 2992} {"train_loss": -45.660823822021484, "global_step": 362115, "epoch": 2992} {"train_loss": -45.89594650268555, "global_step": 362116, "epoch": 2992} {"train_loss": -45.037776947021484, "global_step": 362117, "epoch": 2992} {"train_loss": -45.3388557434082, "global_step": 362118, "epoch": 2992} {"train_loss": -45.22738265991211, "global_step": 362119, "epoch": 2992} {"train_loss": -45.185550689697266, "global_step": 362120, "epoch": 2992} {"train_loss": -45.186092376708984, "global_step": 362121, "epoch": 2992} {"train_loss": -45.957000732421875, "global_step": 362122, "epoch": 2992} {"train_loss": -45.27589797973633, "global_step": 362123, "epoch": 2992} {"train_loss": -46.00871658325195, "global_step": 362124, "epoch": 2992} {"train_loss": -45.82666015625, "global_step": 362125, "epoch": 2992} {"train_loss": -45.62807083129883, "global_step": 362126, "epoch": 2992} {"train_loss": -45.98542404174805, "global_step": 362127, "epoch": 2992} {"train_loss": -45.776912689208984, "global_step": 362128, "epoch": 2992} {"train_loss": -45.54545974731445, "global_step": 362129, "epoch": 2992} {"train_loss": -45.900081634521484, "global_step": 362130, "epoch": 2992} {"train_loss": -45.34421157836914, "global_step": 362131, "epoch": 2992} {"train_loss": -46.170204162597656, "global_step": 362132, "epoch": 2992} {"train_loss": -45.92478561401367, "global_step": 362133, "epoch": 2992} {"train_loss": -45.92547607421875, "global_step": 362134, "epoch": 2992} {"train_loss": -45.823394775390625, "global_step": 362135, "epoch": 2992} {"train_loss": -46.11385726928711, "global_step": 362136, "epoch": 2992} {"train_loss": -46.36857604980469, "global_step": 362137, "epoch": 2992} {"train_loss": -45.84012985229492, "global_step": 362138, "epoch": 2992} {"train_loss": -46.4889030456543, "global_step": 362139, "epoch": 2992} {"train_loss": -46.400054931640625, "global_step": 362140, "epoch": 2992} {"train_loss": -46.30442428588867, "global_step": 362141, "epoch": 2992} {"train_loss": -45.8529167175293, "global_step": 362142, "epoch": 2992} {"train_loss": -45.281551361083984, "global_step": 362143, "epoch": 2992} {"train_loss": -46.1934928894043, "global_step": 362144, "epoch": 2992} {"train_loss": -46.39385986328125, "global_step": 362145, "epoch": 2992} {"train_loss": -46.44733810424805, "global_step": 362146, "epoch": 2992} {"train_loss": -45.75285720825195, "global_step": 362147, "epoch": 2992} {"train_loss": -46.41426467895508, "global_step": 362148, "epoch": 2992} {"train_loss": -46.31521224975586, "global_step": 362149, "epoch": 2992} {"train_loss": -45.89875411987305, "global_step": 362150, "epoch": 2992} {"train_loss": -46.297218322753906, "global_step": 362151, "epoch": 2992} {"train_loss": -45.21462262366429, "global_step": 362152, "epoch": 2992, "val_loss": 2495731.5} {"train_loss": -45.812049865722656, "global_step": 362153, "epoch": 2993} {"train_loss": -45.921783447265625, "global_step": 362154, "epoch": 2993} {"train_loss": -45.86543655395508, "global_step": 362155, "epoch": 2993} {"train_loss": -46.5833740234375, "global_step": 362156, "epoch": 2993} {"train_loss": -44.45475769042969, "global_step": 362157, "epoch": 2993} {"train_loss": -44.800941467285156, "global_step": 362158, "epoch": 2993} {"train_loss": -45.76874542236328, "global_step": 362159, "epoch": 2993} {"train_loss": -45.4634895324707, "global_step": 362160, "epoch": 2993} {"train_loss": -44.1944465637207, "global_step": 362161, "epoch": 2993} {"train_loss": -45.08583450317383, "global_step": 362162, "epoch": 2993} {"train_loss": -44.16141128540039, "global_step": 362163, "epoch": 2993} {"train_loss": -45.07646942138672, "global_step": 362164, "epoch": 2993} {"train_loss": -45.42034912109375, "global_step": 362165, "epoch": 2993} {"train_loss": -45.631195068359375, "global_step": 362166, "epoch": 2993} {"train_loss": -45.38349533081055, "global_step": 362167, "epoch": 2993} {"train_loss": -43.16449737548828, "global_step": 362168, "epoch": 2993} {"train_loss": -44.267024993896484, "global_step": 362169, "epoch": 2993} {"train_loss": -42.62559127807617, "global_step": 362170, "epoch": 2993} {"train_loss": -45.82255172729492, "global_step": 362171, "epoch": 2993} {"train_loss": -43.98469161987305, "global_step": 362172, "epoch": 2993} {"train_loss": -44.55613327026367, "global_step": 362173, "epoch": 2993} {"train_loss": -43.8717041015625, "global_step": 362174, "epoch": 2993} {"train_loss": -45.54629898071289, "global_step": 362175, "epoch": 2993} {"train_loss": -44.51076889038086, "global_step": 362176, "epoch": 2993} {"train_loss": -43.586055755615234, "global_step": 362177, "epoch": 2993} {"train_loss": -43.6212272644043, "global_step": 362178, "epoch": 2993} {"train_loss": -44.7117919921875, "global_step": 362179, "epoch": 2993} {"train_loss": -45.06560516357422, "global_step": 362180, "epoch": 2993} {"train_loss": -41.72978591918945, "global_step": 362181, "epoch": 2993} {"train_loss": -43.54534912109375, "global_step": 362182, "epoch": 2993} {"train_loss": -44.079158782958984, "global_step": 362183, "epoch": 2993} {"train_loss": -42.985294342041016, "global_step": 362184, "epoch": 2993} {"train_loss": -43.43476486206055, "global_step": 362185, "epoch": 2993} {"train_loss": -42.60879135131836, "global_step": 362186, "epoch": 2993} {"train_loss": -43.801124572753906, "global_step": 362187, "epoch": 2993} {"train_loss": -42.36882019042969, "global_step": 362188, "epoch": 2993} {"train_loss": -43.93998336791992, "global_step": 362189, "epoch": 2993} {"train_loss": -42.059688568115234, "global_step": 362190, "epoch": 2993} {"train_loss": -44.46634292602539, "global_step": 362191, "epoch": 2993} {"train_loss": -43.79169845581055, "global_step": 362192, "epoch": 2993} {"train_loss": -43.7851676940918, "global_step": 362193, "epoch": 2993} {"train_loss": -43.51925277709961, "global_step": 362194, "epoch": 2993} {"train_loss": -43.7613410949707, "global_step": 362195, "epoch": 2993} {"train_loss": -44.34601593017578, "global_step": 362196, "epoch": 2993} {"train_loss": -42.9124641418457, "global_step": 362197, "epoch": 2993} {"train_loss": -42.182350158691406, "global_step": 362198, "epoch": 2993} {"train_loss": -44.18754196166992, "global_step": 362199, "epoch": 2993} {"train_loss": -44.0147590637207, "global_step": 362200, "epoch": 2993} {"train_loss": -43.087432861328125, "global_step": 362201, "epoch": 2993} {"train_loss": -44.401241302490234, "global_step": 362202, "epoch": 2993} {"train_loss": -42.84736633300781, "global_step": 362203, "epoch": 2993} {"train_loss": -43.66214370727539, "global_step": 362204, "epoch": 2993} {"train_loss": -44.0886344909668, "global_step": 362205, "epoch": 2993} {"train_loss": -44.79011154174805, "global_step": 362206, "epoch": 2993} {"train_loss": -42.37065505981445, "global_step": 362207, "epoch": 2993} {"train_loss": -43.664031982421875, "global_step": 362208, "epoch": 2993} {"train_loss": -44.47425079345703, "global_step": 362209, "epoch": 2993} {"train_loss": -44.496734619140625, "global_step": 362210, "epoch": 2993} {"train_loss": -44.88674545288086, "global_step": 362211, "epoch": 2993} {"train_loss": -44.649173736572266, "global_step": 362212, "epoch": 2993} {"train_loss": -44.90394973754883, "global_step": 362213, "epoch": 2993} {"train_loss": -44.254547119140625, "global_step": 362214, "epoch": 2993} {"train_loss": -45.122772216796875, "global_step": 362215, "epoch": 2993} {"train_loss": -44.987247467041016, "global_step": 362216, "epoch": 2993} {"train_loss": -42.38153076171875, "global_step": 362217, "epoch": 2993} {"train_loss": -44.23615264892578, "global_step": 362218, "epoch": 2993} {"train_loss": -44.082305908203125, "global_step": 362219, "epoch": 2993} {"train_loss": -43.887298583984375, "global_step": 362220, "epoch": 2993} {"train_loss": -44.30717849731445, "global_step": 362221, "epoch": 2993} {"train_loss": -42.77553939819336, "global_step": 362222, "epoch": 2993} {"train_loss": -44.78009796142578, "global_step": 362223, "epoch": 2993} {"train_loss": -44.21751022338867, "global_step": 362224, "epoch": 2993} {"train_loss": -43.77530288696289, "global_step": 362225, "epoch": 2993} {"train_loss": -44.86914825439453, "global_step": 362226, "epoch": 2993} {"train_loss": -42.88471221923828, "global_step": 362227, "epoch": 2993} {"train_loss": -45.542808532714844, "global_step": 362228, "epoch": 2993} {"train_loss": -42.75605392456055, "global_step": 362229, "epoch": 2993} {"train_loss": -43.10295867919922, "global_step": 362230, "epoch": 2993} {"train_loss": -44.25651168823242, "global_step": 362231, "epoch": 2993} {"train_loss": -44.289852142333984, "global_step": 362232, "epoch": 2993} {"train_loss": -44.05653762817383, "global_step": 362233, "epoch": 2993} {"train_loss": -43.46175765991211, "global_step": 362234, "epoch": 2993} {"train_loss": -41.44183349609375, "global_step": 362235, "epoch": 2993} {"train_loss": -43.77608108520508, "global_step": 362236, "epoch": 2993} {"train_loss": -42.72705841064453, "global_step": 362237, "epoch": 2993} {"train_loss": -43.25082015991211, "global_step": 362238, "epoch": 2993} {"train_loss": -42.518978118896484, "global_step": 362239, "epoch": 2993} {"train_loss": -43.499122619628906, "global_step": 362240, "epoch": 2993} {"train_loss": -43.1207160949707, "global_step": 362241, "epoch": 2993} {"train_loss": -43.476531982421875, "global_step": 362242, "epoch": 2993} {"train_loss": -43.168365478515625, "global_step": 362243, "epoch": 2993} {"train_loss": -43.592464447021484, "global_step": 362244, "epoch": 2993} {"train_loss": -41.54145431518555, "global_step": 362245, "epoch": 2993} {"train_loss": -43.471622467041016, "global_step": 362246, "epoch": 2993} {"train_loss": -41.908233642578125, "global_step": 362247, "epoch": 2993} {"train_loss": -44.03229522705078, "global_step": 362248, "epoch": 2993} {"train_loss": -44.72252655029297, "global_step": 362249, "epoch": 2993} {"train_loss": -42.766693115234375, "global_step": 362250, "epoch": 2993} {"train_loss": -43.636871337890625, "global_step": 362251, "epoch": 2993} {"train_loss": -43.651302337646484, "global_step": 362252, "epoch": 2993} {"train_loss": -45.20395278930664, "global_step": 362253, "epoch": 2993} {"train_loss": -44.71277618408203, "global_step": 362254, "epoch": 2993} {"train_loss": -42.94834518432617, "global_step": 362255, "epoch": 2993} {"train_loss": -43.37248611450195, "global_step": 362256, "epoch": 2993} {"train_loss": -44.88114547729492, "global_step": 362257, "epoch": 2993} {"train_loss": -43.27582550048828, "global_step": 362258, "epoch": 2993} {"train_loss": -40.77102279663086, "global_step": 362259, "epoch": 2993} {"train_loss": -44.1264762878418, "global_step": 362260, "epoch": 2993} {"train_loss": -44.42209243774414, "global_step": 362261, "epoch": 2993} {"train_loss": -42.54753494262695, "global_step": 362262, "epoch": 2993} {"train_loss": -44.247867584228516, "global_step": 362263, "epoch": 2993} {"train_loss": -44.42375564575195, "global_step": 362264, "epoch": 2993} {"train_loss": -44.56523513793945, "global_step": 362265, "epoch": 2993} {"train_loss": -44.53703308105469, "global_step": 362266, "epoch": 2993} {"train_loss": -43.780330657958984, "global_step": 362267, "epoch": 2993} {"train_loss": -44.676788330078125, "global_step": 362268, "epoch": 2993} {"train_loss": -44.89306640625, "global_step": 362269, "epoch": 2993} {"train_loss": -43.870574951171875, "global_step": 362270, "epoch": 2993} {"train_loss": -44.75110626220703, "global_step": 362271, "epoch": 2993} {"train_loss": -43.841068267822266, "global_step": 362272, "epoch": 2993} {"train_loss": -43.966029490321134, "global_step": 362273, "epoch": 2993, "val_loss": 2556556.75} {"train_loss": -45.15958786010742, "global_step": 362274, "epoch": 2994} {"train_loss": -44.353240966796875, "global_step": 362275, "epoch": 2994} {"train_loss": -45.43693542480469, "global_step": 362276, "epoch": 2994} {"train_loss": -45.26129913330078, "global_step": 362277, "epoch": 2994} {"train_loss": -44.78296661376953, "global_step": 362278, "epoch": 2994} {"train_loss": -45.119384765625, "global_step": 362279, "epoch": 2994} {"train_loss": -44.7467155456543, "global_step": 362280, "epoch": 2994} {"train_loss": -45.3434944152832, "global_step": 362281, "epoch": 2994} {"train_loss": -44.67511749267578, "global_step": 362282, "epoch": 2994} {"train_loss": -44.91411590576172, "global_step": 362283, "epoch": 2994} {"train_loss": -44.96828842163086, "global_step": 362284, "epoch": 2994} {"train_loss": -45.736148834228516, "global_step": 362285, "epoch": 2994} {"train_loss": -44.304054260253906, "global_step": 362286, "epoch": 2994} {"train_loss": -45.39833450317383, "global_step": 362287, "epoch": 2994} {"train_loss": -44.0393180847168, "global_step": 362288, "epoch": 2994} {"train_loss": -43.674278259277344, "global_step": 362289, "epoch": 2994} {"train_loss": -45.097259521484375, "global_step": 362290, "epoch": 2994} {"train_loss": -45.289146423339844, "global_step": 362291, "epoch": 2994} {"train_loss": -44.63961410522461, "global_step": 362292, "epoch": 2994} {"train_loss": -43.69664001464844, "global_step": 362293, "epoch": 2994} {"train_loss": -43.609493255615234, "global_step": 362294, "epoch": 2994} {"train_loss": -44.43215560913086, "global_step": 362295, "epoch": 2994} {"train_loss": -45.547420501708984, "global_step": 362296, "epoch": 2994} {"train_loss": -44.194976806640625, "global_step": 362297, "epoch": 2994} {"train_loss": -44.72013473510742, "global_step": 362298, "epoch": 2994} {"train_loss": -43.862239837646484, "global_step": 362299, "epoch": 2994} {"train_loss": -44.92444610595703, "global_step": 362300, "epoch": 2994} {"train_loss": -44.990753173828125, "global_step": 362301, "epoch": 2994} {"train_loss": -44.55172348022461, "global_step": 362302, "epoch": 2994} {"train_loss": -44.88973617553711, "global_step": 362303, "epoch": 2994} {"train_loss": -44.94929122924805, "global_step": 362304, "epoch": 2994} {"train_loss": -44.862586975097656, "global_step": 362305, "epoch": 2994} {"train_loss": -44.84278106689453, "global_step": 362306, "epoch": 2994} {"train_loss": -43.213924407958984, "global_step": 362307, "epoch": 2994} {"train_loss": -44.688026428222656, "global_step": 362308, "epoch": 2994} {"train_loss": -45.11410140991211, "global_step": 362309, "epoch": 2994} {"train_loss": -45.318824768066406, "global_step": 362310, "epoch": 2994} {"train_loss": -44.949153900146484, "global_step": 362311, "epoch": 2994} {"train_loss": -45.21663284301758, "global_step": 362312, "epoch": 2994} {"train_loss": -45.431060791015625, "global_step": 362313, "epoch": 2994} {"train_loss": -44.717655181884766, "global_step": 362314, "epoch": 2994} {"train_loss": -45.438331604003906, "global_step": 362315, "epoch": 2994} {"train_loss": -45.0800666809082, "global_step": 362316, "epoch": 2994} {"train_loss": -41.83420181274414, "global_step": 362317, "epoch": 2994} {"train_loss": -44.79487609863281, "global_step": 362318, "epoch": 2994} {"train_loss": -46.00325393676758, "global_step": 362319, "epoch": 2994} {"train_loss": -44.312068939208984, "global_step": 362320, "epoch": 2994} {"train_loss": -45.00455856323242, "global_step": 362321, "epoch": 2994} {"train_loss": -44.58496856689453, "global_step": 362322, "epoch": 2994} {"train_loss": -45.39341354370117, "global_step": 362323, "epoch": 2994} {"train_loss": -44.054725646972656, "global_step": 362324, "epoch": 2994} {"train_loss": -29.775854110717773, "global_step": 362325, "epoch": 2994} {"train_loss": -44.08952713012695, "global_step": 362326, "epoch": 2994} {"train_loss": -43.59964370727539, "global_step": 362327, "epoch": 2994} {"train_loss": -44.56463623046875, "global_step": 362328, "epoch": 2994} {"train_loss": -43.57749938964844, "global_step": 362329, "epoch": 2994} {"train_loss": -43.83819580078125, "global_step": 362330, "epoch": 2994} {"train_loss": -43.04758834838867, "global_step": 362331, "epoch": 2994} {"train_loss": -44.845211029052734, "global_step": 362332, "epoch": 2994} {"train_loss": -41.8722038269043, "global_step": 362333, "epoch": 2994} {"train_loss": -44.91014862060547, "global_step": 362334, "epoch": 2994} {"train_loss": -42.25659942626953, "global_step": 362335, "epoch": 2994} {"train_loss": -36.68564224243164, "global_step": 362336, "epoch": 2994} {"train_loss": -42.47297286987305, "global_step": 362337, "epoch": 2994} {"train_loss": -43.58740234375, "global_step": 362338, "epoch": 2994} {"train_loss": -44.890708923339844, "global_step": 362339, "epoch": 2994} {"train_loss": -43.688846588134766, "global_step": 362340, "epoch": 2994} {"train_loss": -42.7499885559082, "global_step": 362341, "epoch": 2994} {"train_loss": -45.252357482910156, "global_step": 362342, "epoch": 2994} {"train_loss": -42.893978118896484, "global_step": 362343, "epoch": 2994} {"train_loss": -43.31488037109375, "global_step": 362344, "epoch": 2994} {"train_loss": -44.35327911376953, "global_step": 362345, "epoch": 2994} {"train_loss": -40.659324645996094, "global_step": 362346, "epoch": 2994} {"train_loss": -43.646728515625, "global_step": 362347, "epoch": 2994} {"train_loss": -42.14933395385742, "global_step": 362348, "epoch": 2994} {"train_loss": -41.21213912963867, "global_step": 362349, "epoch": 2994} {"train_loss": -44.06681442260742, "global_step": 362350, "epoch": 2994} {"train_loss": -43.98085403442383, "global_step": 362351, "epoch": 2994} {"train_loss": -42.325836181640625, "global_step": 362352, "epoch": 2994} {"train_loss": -44.4153938293457, "global_step": 362353, "epoch": 2994} {"train_loss": -42.39801788330078, "global_step": 362354, "epoch": 2994} {"train_loss": -45.348812103271484, "global_step": 362355, "epoch": 2994} {"train_loss": -44.12958908081055, "global_step": 362356, "epoch": 2994} {"train_loss": -44.8077392578125, "global_step": 362357, "epoch": 2994} {"train_loss": -44.157875061035156, "global_step": 362358, "epoch": 2994} {"train_loss": -44.960384368896484, "global_step": 362359, "epoch": 2994} {"train_loss": -43.87080764770508, "global_step": 362360, "epoch": 2994} {"train_loss": -45.437225341796875, "global_step": 362361, "epoch": 2994} {"train_loss": -45.184688568115234, "global_step": 362362, "epoch": 2994} {"train_loss": -45.1594352722168, "global_step": 362363, "epoch": 2994} {"train_loss": -45.560829162597656, "global_step": 362364, "epoch": 2994} {"train_loss": -44.779640197753906, "global_step": 362365, "epoch": 2994} {"train_loss": -44.63755416870117, "global_step": 362366, "epoch": 2994} {"train_loss": -44.52067184448242, "global_step": 362367, "epoch": 2994} {"train_loss": -44.64457321166992, "global_step": 362368, "epoch": 2994} {"train_loss": -45.13994216918945, "global_step": 362369, "epoch": 2994} {"train_loss": -44.79052734375, "global_step": 362370, "epoch": 2994} {"train_loss": -45.422096252441406, "global_step": 362371, "epoch": 2994} {"train_loss": -44.89711380004883, "global_step": 362372, "epoch": 2994} {"train_loss": -44.76311111450195, "global_step": 362373, "epoch": 2994} {"train_loss": -44.92240905761719, "global_step": 362374, "epoch": 2994} {"train_loss": -45.0616569519043, "global_step": 362375, "epoch": 2994} {"train_loss": -45.28013229370117, "global_step": 362376, "epoch": 2994} {"train_loss": -44.8154296875, "global_step": 362377, "epoch": 2994} {"train_loss": -45.012046813964844, "global_step": 362378, "epoch": 2994} {"train_loss": -44.28509521484375, "global_step": 362379, "epoch": 2994} {"train_loss": -44.13934326171875, "global_step": 362380, "epoch": 2994} {"train_loss": -44.69124221801758, "global_step": 362381, "epoch": 2994} {"train_loss": -45.14815902709961, "global_step": 362382, "epoch": 2994} {"train_loss": -44.0306510925293, "global_step": 362383, "epoch": 2994} {"train_loss": -45.304683685302734, "global_step": 362384, "epoch": 2994} {"train_loss": -44.63587188720703, "global_step": 362385, "epoch": 2994} {"train_loss": -44.44984817504883, "global_step": 362386, "epoch": 2994} {"train_loss": -45.881019592285156, "global_step": 362387, "epoch": 2994} {"train_loss": -44.982540130615234, "global_step": 362388, "epoch": 2994} {"train_loss": -45.20740509033203, "global_step": 362389, "epoch": 2994} {"train_loss": -44.19044876098633, "global_step": 362390, "epoch": 2994} {"train_loss": -44.89645004272461, "global_step": 362391, "epoch": 2994} {"train_loss": -44.014984130859375, "global_step": 362392, "epoch": 2994} {"train_loss": -45.0513916015625, "global_step": 362393, "epoch": 2994} {"train_loss": -44.26751319633043, "global_step": 362394, "epoch": 2994, "val_loss": 2560162.5} {"train_loss": -44.881591796875, "global_step": 362395, "epoch": 2995} {"train_loss": -45.747802734375, "global_step": 362396, "epoch": 2995} {"train_loss": -44.577613830566406, "global_step": 362397, "epoch": 2995} {"train_loss": -44.498863220214844, "global_step": 362398, "epoch": 2995} {"train_loss": -45.743709564208984, "global_step": 362399, "epoch": 2995} {"train_loss": -44.712745666503906, "global_step": 362400, "epoch": 2995} {"train_loss": -44.67352294921875, "global_step": 362401, "epoch": 2995} {"train_loss": -45.13507080078125, "global_step": 362402, "epoch": 2995} {"train_loss": -45.321929931640625, "global_step": 362403, "epoch": 2995} {"train_loss": -45.2138671875, "global_step": 362404, "epoch": 2995} {"train_loss": -44.08354949951172, "global_step": 362405, "epoch": 2995} {"train_loss": -44.9365234375, "global_step": 362406, "epoch": 2995} {"train_loss": -44.382808685302734, "global_step": 362407, "epoch": 2995} {"train_loss": -45.52854919433594, "global_step": 362408, "epoch": 2995} {"train_loss": -44.56462478637695, "global_step": 362409, "epoch": 2995} {"train_loss": -41.09320831298828, "global_step": 362410, "epoch": 2995} {"train_loss": -43.40729904174805, "global_step": 362411, "epoch": 2995} {"train_loss": -43.68853759765625, "global_step": 362412, "epoch": 2995} {"train_loss": -44.8444709777832, "global_step": 362413, "epoch": 2995} {"train_loss": -44.162288665771484, "global_step": 362414, "epoch": 2995} {"train_loss": -42.30082321166992, "global_step": 362415, "epoch": 2995} {"train_loss": -42.47335433959961, "global_step": 362416, "epoch": 2995} {"train_loss": -45.157196044921875, "global_step": 362417, "epoch": 2995} {"train_loss": -41.26314926147461, "global_step": 362418, "epoch": 2995} {"train_loss": -44.24702835083008, "global_step": 362419, "epoch": 2995} {"train_loss": -44.55767822265625, "global_step": 362420, "epoch": 2995} {"train_loss": -42.366004943847656, "global_step": 362421, "epoch": 2995} {"train_loss": -44.53997802734375, "global_step": 362422, "epoch": 2995} {"train_loss": -42.85939407348633, "global_step": 362423, "epoch": 2995} {"train_loss": -42.80472946166992, "global_step": 362424, "epoch": 2995} {"train_loss": -44.09914016723633, "global_step": 362425, "epoch": 2995} {"train_loss": -45.246864318847656, "global_step": 362426, "epoch": 2995} {"train_loss": -44.81315994262695, "global_step": 362427, "epoch": 2995} {"train_loss": -42.26984405517578, "global_step": 362428, "epoch": 2995} {"train_loss": -44.8095588684082, "global_step": 362429, "epoch": 2995} {"train_loss": -43.96974182128906, "global_step": 362430, "epoch": 2995} {"train_loss": -43.007659912109375, "global_step": 362431, "epoch": 2995} {"train_loss": -44.72315216064453, "global_step": 362432, "epoch": 2995} {"train_loss": -44.02766036987305, "global_step": 362433, "epoch": 2995} {"train_loss": -43.475852966308594, "global_step": 362434, "epoch": 2995} {"train_loss": -44.100975036621094, "global_step": 362435, "epoch": 2995} {"train_loss": -44.42203903198242, "global_step": 362436, "epoch": 2995} {"train_loss": -42.25812911987305, "global_step": 362437, "epoch": 2995} {"train_loss": -43.76343536376953, "global_step": 362438, "epoch": 2995} {"train_loss": -43.82734298706055, "global_step": 362439, "epoch": 2995} {"train_loss": -41.67985534667969, "global_step": 362440, "epoch": 2995} {"train_loss": -43.84702682495117, "global_step": 362441, "epoch": 2995} {"train_loss": -43.37600326538086, "global_step": 362442, "epoch": 2995} {"train_loss": -42.796844482421875, "global_step": 362443, "epoch": 2995} {"train_loss": -43.7755126953125, "global_step": 362444, "epoch": 2995} {"train_loss": -44.01094055175781, "global_step": 362445, "epoch": 2995} {"train_loss": -44.449981689453125, "global_step": 362446, "epoch": 2995} {"train_loss": -44.32929611206055, "global_step": 362447, "epoch": 2995} {"train_loss": -44.130001068115234, "global_step": 362448, "epoch": 2995} {"train_loss": -44.65768051147461, "global_step": 362449, "epoch": 2995} {"train_loss": -44.52874755859375, "global_step": 362450, "epoch": 2995} {"train_loss": -44.53300094604492, "global_step": 362451, "epoch": 2995} {"train_loss": -44.339027404785156, "global_step": 362452, "epoch": 2995} {"train_loss": -44.380577087402344, "global_step": 362453, "epoch": 2995} {"train_loss": -44.52690505981445, "global_step": 362454, "epoch": 2995} {"train_loss": -45.24345779418945, "global_step": 362455, "epoch": 2995} {"train_loss": -44.565643310546875, "global_step": 362456, "epoch": 2995} {"train_loss": -44.99095916748047, "global_step": 362457, "epoch": 2995} {"train_loss": -44.520416259765625, "global_step": 362458, "epoch": 2995} {"train_loss": -44.12311553955078, "global_step": 362459, "epoch": 2995} {"train_loss": -45.116878509521484, "global_step": 362460, "epoch": 2995} {"train_loss": -44.024986267089844, "global_step": 362461, "epoch": 2995} {"train_loss": -45.150306701660156, "global_step": 362462, "epoch": 2995} {"train_loss": -45.28873062133789, "global_step": 362463, "epoch": 2995} {"train_loss": -44.45341873168945, "global_step": 362464, "epoch": 2995} {"train_loss": -44.8571891784668, "global_step": 362465, "epoch": 2995} {"train_loss": -45.05256271362305, "global_step": 362466, "epoch": 2995} {"train_loss": -44.44112777709961, "global_step": 362467, "epoch": 2995} {"train_loss": -44.55712127685547, "global_step": 362468, "epoch": 2995} {"train_loss": -44.0579948425293, "global_step": 362469, "epoch": 2995} {"train_loss": -43.85670852661133, "global_step": 362470, "epoch": 2995} {"train_loss": -43.739356994628906, "global_step": 362471, "epoch": 2995} {"train_loss": -44.587913513183594, "global_step": 362472, "epoch": 2995} {"train_loss": -41.81632614135742, "global_step": 362473, "epoch": 2995} {"train_loss": -43.08549118041992, "global_step": 362474, "epoch": 2995} {"train_loss": -45.45956039428711, "global_step": 362475, "epoch": 2995} {"train_loss": -43.189552307128906, "global_step": 362476, "epoch": 2995} {"train_loss": -44.524322509765625, "global_step": 362477, "epoch": 2995} {"train_loss": -42.10778045654297, "global_step": 362478, "epoch": 2995} {"train_loss": -43.53329086303711, "global_step": 362479, "epoch": 2995} {"train_loss": -44.11689376831055, "global_step": 362480, "epoch": 2995} {"train_loss": -44.16853713989258, "global_step": 362481, "epoch": 2995} {"train_loss": -44.49262619018555, "global_step": 362482, "epoch": 2995} {"train_loss": -44.614227294921875, "global_step": 362483, "epoch": 2995} {"train_loss": -45.0085334777832, "global_step": 362484, "epoch": 2995} {"train_loss": -45.01001739501953, "global_step": 362485, "epoch": 2995} {"train_loss": -45.14643478393555, "global_step": 362486, "epoch": 2995} {"train_loss": -44.80335235595703, "global_step": 362487, "epoch": 2995} {"train_loss": -44.92081832885742, "global_step": 362488, "epoch": 2995} {"train_loss": -44.936500549316406, "global_step": 362489, "epoch": 2995} {"train_loss": -45.296607971191406, "global_step": 362490, "epoch": 2995} {"train_loss": -44.671478271484375, "global_step": 362491, "epoch": 2995} {"train_loss": -45.14593505859375, "global_step": 362492, "epoch": 2995} {"train_loss": -45.67133331298828, "global_step": 362493, "epoch": 2995} {"train_loss": -45.22610092163086, "global_step": 362494, "epoch": 2995} {"train_loss": -45.081199645996094, "global_step": 362495, "epoch": 2995} {"train_loss": -45.129940032958984, "global_step": 362496, "epoch": 2995} {"train_loss": -45.58087158203125, "global_step": 362497, "epoch": 2995} {"train_loss": -45.50808334350586, "global_step": 362498, "epoch": 2995} {"train_loss": -45.05965805053711, "global_step": 362499, "epoch": 2995} {"train_loss": -44.73514175415039, "global_step": 362500, "epoch": 2995} {"train_loss": -45.6630859375, "global_step": 362501, "epoch": 2995} {"train_loss": -45.14690399169922, "global_step": 362502, "epoch": 2995} {"train_loss": -45.151554107666016, "global_step": 362503, "epoch": 2995} {"train_loss": -45.807884216308594, "global_step": 362504, "epoch": 2995} {"train_loss": -45.40547561645508, "global_step": 362505, "epoch": 2995} {"train_loss": -45.65771484375, "global_step": 362506, "epoch": 2995} {"train_loss": -44.84617233276367, "global_step": 362507, "epoch": 2995} {"train_loss": -45.04924774169922, "global_step": 362508, "epoch": 2995} {"train_loss": -45.91550827026367, "global_step": 362509, "epoch": 2995} {"train_loss": -44.865966796875, "global_step": 362510, "epoch": 2995} {"train_loss": -45.1705207824707, "global_step": 362511, "epoch": 2995} {"train_loss": -45.84025955200195, "global_step": 362512, "epoch": 2995} {"train_loss": -45.7440071105957, "global_step": 362513, "epoch": 2995} {"train_loss": -44.45831298828125, "global_step": 362514, "epoch": 2995} {"train_loss": -44.4026394048013, "global_step": 362515, "epoch": 2995, "val_loss": 2567975.0} {"train_loss": -45.537078857421875, "global_step": 362516, "epoch": 2996} {"train_loss": -45.46916198730469, "global_step": 362517, "epoch": 2996} {"train_loss": -44.823829650878906, "global_step": 362518, "epoch": 2996} {"train_loss": -44.056495666503906, "global_step": 362519, "epoch": 2996} {"train_loss": -44.09611129760742, "global_step": 362520, "epoch": 2996} {"train_loss": -45.648681640625, "global_step": 362521, "epoch": 2996} {"train_loss": -44.0311393737793, "global_step": 362522, "epoch": 2996} {"train_loss": -40.919124603271484, "global_step": 362523, "epoch": 2996} {"train_loss": -44.43576431274414, "global_step": 362524, "epoch": 2996} {"train_loss": -43.08650588989258, "global_step": 362525, "epoch": 2996} {"train_loss": -43.71745681762695, "global_step": 362526, "epoch": 2996} {"train_loss": -43.917728424072266, "global_step": 362527, "epoch": 2996} {"train_loss": -44.0903205871582, "global_step": 362528, "epoch": 2996} {"train_loss": -44.32862854003906, "global_step": 362529, "epoch": 2996} {"train_loss": -44.34217071533203, "global_step": 362530, "epoch": 2996} {"train_loss": -43.31315231323242, "global_step": 362531, "epoch": 2996} {"train_loss": -42.84578323364258, "global_step": 362532, "epoch": 2996} {"train_loss": -43.27461624145508, "global_step": 362533, "epoch": 2996} {"train_loss": -43.20344161987305, "global_step": 362534, "epoch": 2996} {"train_loss": -41.72030258178711, "global_step": 362535, "epoch": 2996} {"train_loss": -44.11554718017578, "global_step": 362536, "epoch": 2996} {"train_loss": -43.044857025146484, "global_step": 362537, "epoch": 2996} {"train_loss": -43.97994613647461, "global_step": 362538, "epoch": 2996} {"train_loss": -43.691490173339844, "global_step": 362539, "epoch": 2996} {"train_loss": -43.53156661987305, "global_step": 362540, "epoch": 2996} {"train_loss": -43.852901458740234, "global_step": 362541, "epoch": 2996} {"train_loss": -43.36331558227539, "global_step": 362542, "epoch": 2996} {"train_loss": -43.777259826660156, "global_step": 362543, "epoch": 2996} {"train_loss": -41.7882080078125, "global_step": 362544, "epoch": 2996} {"train_loss": -44.532649993896484, "global_step": 362545, "epoch": 2996} {"train_loss": -41.5697021484375, "global_step": 362546, "epoch": 2996} {"train_loss": -41.87751388549805, "global_step": 362547, "epoch": 2996} {"train_loss": -44.79629135131836, "global_step": 362548, "epoch": 2996} {"train_loss": -41.29843521118164, "global_step": 362549, "epoch": 2996} {"train_loss": -43.62411117553711, "global_step": 362550, "epoch": 2996} {"train_loss": -39.647705078125, "global_step": 362551, "epoch": 2996} {"train_loss": -41.178863525390625, "global_step": 362552, "epoch": 2996} {"train_loss": -41.80702590942383, "global_step": 362553, "epoch": 2996} {"train_loss": -42.380916595458984, "global_step": 362554, "epoch": 2996} {"train_loss": -41.94502639770508, "global_step": 362555, "epoch": 2996} {"train_loss": -43.36115264892578, "global_step": 362556, "epoch": 2996} {"train_loss": -41.69952392578125, "global_step": 362557, "epoch": 2996} {"train_loss": -43.754329681396484, "global_step": 362558, "epoch": 2996} {"train_loss": -43.35919952392578, "global_step": 362559, "epoch": 2996} {"train_loss": -42.995967864990234, "global_step": 362560, "epoch": 2996} {"train_loss": -44.534767150878906, "global_step": 362561, "epoch": 2996} {"train_loss": -43.506805419921875, "global_step": 362562, "epoch": 2996} {"train_loss": -44.213966369628906, "global_step": 362563, "epoch": 2996} {"train_loss": -43.684139251708984, "global_step": 362564, "epoch": 2996} {"train_loss": -44.188533782958984, "global_step": 362565, "epoch": 2996} {"train_loss": -44.20423126220703, "global_step": 362566, "epoch": 2996} {"train_loss": -43.86207580566406, "global_step": 362567, "epoch": 2996} {"train_loss": -44.031471252441406, "global_step": 362568, "epoch": 2996} {"train_loss": -45.14190673828125, "global_step": 362569, "epoch": 2996} {"train_loss": -44.11338806152344, "global_step": 362570, "epoch": 2996} {"train_loss": -44.43812942504883, "global_step": 362571, "epoch": 2996} {"train_loss": -44.42830276489258, "global_step": 362572, "epoch": 2996} {"train_loss": -44.55915069580078, "global_step": 362573, "epoch": 2996} {"train_loss": -44.924659729003906, "global_step": 362574, "epoch": 2996} {"train_loss": -44.50777816772461, "global_step": 362575, "epoch": 2996} {"train_loss": -45.41420364379883, "global_step": 362576, "epoch": 2996} {"train_loss": -44.898624420166016, "global_step": 362577, "epoch": 2996} {"train_loss": -45.08237838745117, "global_step": 362578, "epoch": 2996} {"train_loss": -45.11593246459961, "global_step": 362579, "epoch": 2996} {"train_loss": -45.023712158203125, "global_step": 362580, "epoch": 2996} {"train_loss": -45.27144241333008, "global_step": 362581, "epoch": 2996} {"train_loss": -44.48392868041992, "global_step": 362582, "epoch": 2996} {"train_loss": -45.568355560302734, "global_step": 362583, "epoch": 2996} {"train_loss": -45.42100524902344, "global_step": 362584, "epoch": 2996} {"train_loss": -45.128936767578125, "global_step": 362585, "epoch": 2996} {"train_loss": -45.137847900390625, "global_step": 362586, "epoch": 2996} {"train_loss": -45.40110397338867, "global_step": 362587, "epoch": 2996} {"train_loss": -45.00437927246094, "global_step": 362588, "epoch": 2996} {"train_loss": -45.44489669799805, "global_step": 362589, "epoch": 2996} {"train_loss": -45.327518463134766, "global_step": 362590, "epoch": 2996} {"train_loss": -45.623043060302734, "global_step": 362591, "epoch": 2996} {"train_loss": -45.820308685302734, "global_step": 362592, "epoch": 2996} {"train_loss": -45.34105682373047, "global_step": 362593, "epoch": 2996} {"train_loss": -45.40562057495117, "global_step": 362594, "epoch": 2996} {"train_loss": -45.41407012939453, "global_step": 362595, "epoch": 2996} {"train_loss": -45.39154815673828, "global_step": 362596, "epoch": 2996} {"train_loss": -44.43354415893555, "global_step": 362597, "epoch": 2996} {"train_loss": -45.1606330871582, "global_step": 362598, "epoch": 2996} {"train_loss": -45.110572814941406, "global_step": 362599, "epoch": 2996} {"train_loss": -45.0922966003418, "global_step": 362600, "epoch": 2996} {"train_loss": -45.94622802734375, "global_step": 362601, "epoch": 2996} {"train_loss": -45.24190902709961, "global_step": 362602, "epoch": 2996} {"train_loss": -45.08824157714844, "global_step": 362603, "epoch": 2996} {"train_loss": -44.41505432128906, "global_step": 362604, "epoch": 2996} {"train_loss": -45.26864242553711, "global_step": 362605, "epoch": 2996} {"train_loss": -45.63057327270508, "global_step": 362606, "epoch": 2996} {"train_loss": -45.282283782958984, "global_step": 362607, "epoch": 2996} {"train_loss": -45.50091552734375, "global_step": 362608, "epoch": 2996} {"train_loss": -45.82566452026367, "global_step": 362609, "epoch": 2996} {"train_loss": -45.907100677490234, "global_step": 362610, "epoch": 2996} {"train_loss": -46.237037658691406, "global_step": 362611, "epoch": 2996} {"train_loss": -45.32545852661133, "global_step": 362612, "epoch": 2996} {"train_loss": -46.254817962646484, "global_step": 362613, "epoch": 2996} {"train_loss": -45.72650146484375, "global_step": 362614, "epoch": 2996} {"train_loss": -45.83498001098633, "global_step": 362615, "epoch": 2996} {"train_loss": -45.67024612426758, "global_step": 362616, "epoch": 2996} {"train_loss": -43.9193115234375, "global_step": 362617, "epoch": 2996} {"train_loss": -43.54079055786133, "global_step": 362618, "epoch": 2996} {"train_loss": -42.85886001586914, "global_step": 362619, "epoch": 2996} {"train_loss": -42.89207077026367, "global_step": 362620, "epoch": 2996} {"train_loss": -45.555908203125, "global_step": 362621, "epoch": 2996} {"train_loss": -45.675777435302734, "global_step": 362622, "epoch": 2996} {"train_loss": -44.42963790893555, "global_step": 362623, "epoch": 2996} {"train_loss": -43.898197174072266, "global_step": 362624, "epoch": 2996} {"train_loss": -44.32106018066406, "global_step": 362625, "epoch": 2996} {"train_loss": -45.65415954589844, "global_step": 362626, "epoch": 2996} {"train_loss": -45.23643112182617, "global_step": 362627, "epoch": 2996} {"train_loss": -44.59394454956055, "global_step": 362628, "epoch": 2996} {"train_loss": -44.97279357910156, "global_step": 362629, "epoch": 2996} {"train_loss": -45.25679016113281, "global_step": 362630, "epoch": 2996} {"train_loss": -44.90760040283203, "global_step": 362631, "epoch": 2996} {"train_loss": -45.26717758178711, "global_step": 362632, "epoch": 2996} {"train_loss": -45.551025390625, "global_step": 362633, "epoch": 2996} {"train_loss": -45.23739242553711, "global_step": 362634, "epoch": 2996} {"train_loss": -45.5074577331543, "global_step": 362635, "epoch": 2996} {"train_loss": -44.348127727666174, "global_step": 362636, "epoch": 2996, "val_loss": 2596864.0} {"train_loss": -45.47369384765625, "global_step": 362637, "epoch": 2997} {"train_loss": -44.50415802001953, "global_step": 362638, "epoch": 2997} {"train_loss": -45.42803192138672, "global_step": 362639, "epoch": 2997} {"train_loss": -45.232940673828125, "global_step": 362640, "epoch": 2997} {"train_loss": -45.19620895385742, "global_step": 362641, "epoch": 2997} {"train_loss": -45.10706329345703, "global_step": 362642, "epoch": 2997} {"train_loss": -45.15166091918945, "global_step": 362643, "epoch": 2997} {"train_loss": -45.8338737487793, "global_step": 362644, "epoch": 2997} {"train_loss": -45.88237380981445, "global_step": 362645, "epoch": 2997} {"train_loss": -45.214996337890625, "global_step": 362646, "epoch": 2997} {"train_loss": -44.90283966064453, "global_step": 362647, "epoch": 2997} {"train_loss": -44.77433395385742, "global_step": 362648, "epoch": 2997} {"train_loss": -45.761112213134766, "global_step": 362649, "epoch": 2997} {"train_loss": -44.688228607177734, "global_step": 362650, "epoch": 2997} {"train_loss": -44.03148651123047, "global_step": 362651, "epoch": 2997} {"train_loss": -45.12007522583008, "global_step": 362652, "epoch": 2997} {"train_loss": -46.28654861450195, "global_step": 362653, "epoch": 2997} {"train_loss": -43.800025939941406, "global_step": 362654, "epoch": 2997} {"train_loss": -44.2823371887207, "global_step": 362655, "epoch": 2997} {"train_loss": -45.4084587097168, "global_step": 362656, "epoch": 2997} {"train_loss": -44.759132385253906, "global_step": 362657, "epoch": 2997} {"train_loss": -45.16573715209961, "global_step": 362658, "epoch": 2997} {"train_loss": -44.67582702636719, "global_step": 362659, "epoch": 2997} {"train_loss": -45.220558166503906, "global_step": 362660, "epoch": 2997} {"train_loss": -44.91619873046875, "global_step": 362661, "epoch": 2997} {"train_loss": -44.63005447387695, "global_step": 362662, "epoch": 2997} {"train_loss": -44.58417510986328, "global_step": 362663, "epoch": 2997} {"train_loss": -44.951904296875, "global_step": 362664, "epoch": 2997} {"train_loss": -44.74225997924805, "global_step": 362665, "epoch": 2997} {"train_loss": -44.60401153564453, "global_step": 362666, "epoch": 2997} {"train_loss": -44.91432189941406, "global_step": 362667, "epoch": 2997} {"train_loss": -44.88822555541992, "global_step": 362668, "epoch": 2997} {"train_loss": -43.19044876098633, "global_step": 362669, "epoch": 2997} {"train_loss": -43.084197998046875, "global_step": 362670, "epoch": 2997} {"train_loss": -44.267494201660156, "global_step": 362671, "epoch": 2997} {"train_loss": -44.93980026245117, "global_step": 362672, "epoch": 2997} {"train_loss": -43.55105209350586, "global_step": 362673, "epoch": 2997} {"train_loss": -41.4696044921875, "global_step": 362674, "epoch": 2997} {"train_loss": -44.79298400878906, "global_step": 362675, "epoch": 2997} {"train_loss": -44.263038635253906, "global_step": 362676, "epoch": 2997} {"train_loss": -43.8931999206543, "global_step": 362677, "epoch": 2997} {"train_loss": -43.75539779663086, "global_step": 362678, "epoch": 2997} {"train_loss": -42.651702880859375, "global_step": 362679, "epoch": 2997} {"train_loss": -44.11640548706055, "global_step": 362680, "epoch": 2997} {"train_loss": -43.3317756652832, "global_step": 362681, "epoch": 2997} {"train_loss": -40.68258285522461, "global_step": 362682, "epoch": 2997} {"train_loss": -43.80965042114258, "global_step": 362683, "epoch": 2997} {"train_loss": -38.237125396728516, "global_step": 362684, "epoch": 2997} {"train_loss": -37.446022033691406, "global_step": 362685, "epoch": 2997} {"train_loss": -44.442108154296875, "global_step": 362686, "epoch": 2997} {"train_loss": -36.97493362426758, "global_step": 362687, "epoch": 2997} {"train_loss": -42.24083709716797, "global_step": 362688, "epoch": 2997} {"train_loss": -39.21149444580078, "global_step": 362689, "epoch": 2997} {"train_loss": -37.595787048339844, "global_step": 362690, "epoch": 2997} {"train_loss": -42.9649543762207, "global_step": 362691, "epoch": 2997} {"train_loss": -38.91021728515625, "global_step": 362692, "epoch": 2997} {"train_loss": -39.68809509277344, "global_step": 362693, "epoch": 2997} {"train_loss": -40.595096588134766, "global_step": 362694, "epoch": 2997} {"train_loss": -43.840850830078125, "global_step": 362695, "epoch": 2997} {"train_loss": -41.77532958984375, "global_step": 362696, "epoch": 2997} {"train_loss": -43.33852767944336, "global_step": 362697, "epoch": 2997} {"train_loss": -43.776424407958984, "global_step": 362698, "epoch": 2997} {"train_loss": -43.579071044921875, "global_step": 362699, "epoch": 2997} {"train_loss": -43.001502990722656, "global_step": 362700, "epoch": 2997} {"train_loss": -44.44967269897461, "global_step": 362701, "epoch": 2997} {"train_loss": -43.23454284667969, "global_step": 362702, "epoch": 2997} {"train_loss": -44.30167770385742, "global_step": 362703, "epoch": 2997} {"train_loss": -42.841888427734375, "global_step": 362704, "epoch": 2997} {"train_loss": -44.62907028198242, "global_step": 362705, "epoch": 2997} {"train_loss": -43.8648567199707, "global_step": 362706, "epoch": 2997} {"train_loss": -43.77688217163086, "global_step": 362707, "epoch": 2997} {"train_loss": -43.6851921081543, "global_step": 362708, "epoch": 2997} {"train_loss": -44.09661865234375, "global_step": 362709, "epoch": 2997} {"train_loss": -45.261573791503906, "global_step": 362710, "epoch": 2997} {"train_loss": -44.30828857421875, "global_step": 362711, "epoch": 2997} {"train_loss": -44.939762115478516, "global_step": 362712, "epoch": 2997} {"train_loss": -44.3995246887207, "global_step": 362713, "epoch": 2997} {"train_loss": -44.82381820678711, "global_step": 362714, "epoch": 2997} {"train_loss": -44.622650146484375, "global_step": 362715, "epoch": 2997} {"train_loss": -44.55764389038086, "global_step": 362716, "epoch": 2997} {"train_loss": -45.15312194824219, "global_step": 362717, "epoch": 2997} {"train_loss": -45.42151641845703, "global_step": 362718, "epoch": 2997} {"train_loss": -45.373775482177734, "global_step": 362719, "epoch": 2997} {"train_loss": -45.41047286987305, "global_step": 362720, "epoch": 2997} {"train_loss": -44.83449172973633, "global_step": 362721, "epoch": 2997} {"train_loss": -45.368106842041016, "global_step": 362722, "epoch": 2997} {"train_loss": -45.09955978393555, "global_step": 362723, "epoch": 2997} {"train_loss": -44.92835235595703, "global_step": 362724, "epoch": 2997} {"train_loss": -44.943912506103516, "global_step": 362725, "epoch": 2997} {"train_loss": -44.964508056640625, "global_step": 362726, "epoch": 2997} {"train_loss": -44.997920989990234, "global_step": 362727, "epoch": 2997} {"train_loss": -45.51759719848633, "global_step": 362728, "epoch": 2997} {"train_loss": -45.22982406616211, "global_step": 362729, "epoch": 2997} {"train_loss": -45.406978607177734, "global_step": 362730, "epoch": 2997} {"train_loss": -45.3713493347168, "global_step": 362731, "epoch": 2997} {"train_loss": -45.63071823120117, "global_step": 362732, "epoch": 2997} {"train_loss": -45.698638916015625, "global_step": 362733, "epoch": 2997} {"train_loss": -45.972503662109375, "global_step": 362734, "epoch": 2997} {"train_loss": -45.52272415161133, "global_step": 362735, "epoch": 2997} {"train_loss": -46.05742645263672, "global_step": 362736, "epoch": 2997} {"train_loss": -45.954742431640625, "global_step": 362737, "epoch": 2997} {"train_loss": -45.8388786315918, "global_step": 362738, "epoch": 2997} {"train_loss": -46.0870475769043, "global_step": 362739, "epoch": 2997} {"train_loss": -45.80820846557617, "global_step": 362740, "epoch": 2997} {"train_loss": -46.463314056396484, "global_step": 362741, "epoch": 2997} {"train_loss": -45.85803985595703, "global_step": 362742, "epoch": 2997} {"train_loss": -46.43175506591797, "global_step": 362743, "epoch": 2997} {"train_loss": -46.2547721862793, "global_step": 362744, "epoch": 2997} {"train_loss": -46.03213882446289, "global_step": 362745, "epoch": 2997} {"train_loss": -45.9622802734375, "global_step": 362746, "epoch": 2997} {"train_loss": -46.20683288574219, "global_step": 362747, "epoch": 2997} {"train_loss": -46.1889533996582, "global_step": 362748, "epoch": 2997} {"train_loss": -46.46017837524414, "global_step": 362749, "epoch": 2997} {"train_loss": -46.303096771240234, "global_step": 362750, "epoch": 2997} {"train_loss": -46.364471435546875, "global_step": 362751, "epoch": 2997} {"train_loss": -46.324928283691406, "global_step": 362752, "epoch": 2997} {"train_loss": -46.221412658691406, "global_step": 362753, "epoch": 2997} {"train_loss": -45.954986572265625, "global_step": 362754, "epoch": 2997} {"train_loss": -46.47024917602539, "global_step": 362755, "epoch": 2997} {"train_loss": -46.35699462890625, "global_step": 362756, "epoch": 2997} {"train_loss": -44.41189363968274, "global_step": 362757, "epoch": 2997, "val_loss": 2590783.25} {"train_loss": -46.43073654174805, "global_step": 362758, "epoch": 2998} {"train_loss": -46.61359786987305, "global_step": 362759, "epoch": 2998} {"train_loss": -45.51032638549805, "global_step": 362760, "epoch": 2998} {"train_loss": -45.85749816894531, "global_step": 362761, "epoch": 2998} {"train_loss": -46.671417236328125, "global_step": 362762, "epoch": 2998} {"train_loss": -46.270042419433594, "global_step": 362763, "epoch": 2998} {"train_loss": -46.16727828979492, "global_step": 362764, "epoch": 2998} {"train_loss": -45.635990142822266, "global_step": 362765, "epoch": 2998} {"train_loss": -45.28956604003906, "global_step": 362766, "epoch": 2998} {"train_loss": -45.2634162902832, "global_step": 362767, "epoch": 2998} {"train_loss": -46.52334213256836, "global_step": 362768, "epoch": 2998} {"train_loss": -44.45266342163086, "global_step": 362769, "epoch": 2998} {"train_loss": -40.6662712097168, "global_step": 362770, "epoch": 2998} {"train_loss": -40.37742233276367, "global_step": 362771, "epoch": 2998} {"train_loss": -45.47385787963867, "global_step": 362772, "epoch": 2998} {"train_loss": -45.28871536254883, "global_step": 362773, "epoch": 2998} {"train_loss": -38.93088912963867, "global_step": 362774, "epoch": 2998} {"train_loss": -43.835079193115234, "global_step": 362775, "epoch": 2998} {"train_loss": -40.387542724609375, "global_step": 362776, "epoch": 2998} {"train_loss": -39.760826110839844, "global_step": 362777, "epoch": 2998} {"train_loss": -42.580806732177734, "global_step": 362778, "epoch": 2998} {"train_loss": -42.209381103515625, "global_step": 362779, "epoch": 2998} {"train_loss": -42.4941291809082, "global_step": 362780, "epoch": 2998} {"train_loss": -42.1221809387207, "global_step": 362781, "epoch": 2998} {"train_loss": -41.559181213378906, "global_step": 362782, "epoch": 2998} {"train_loss": -42.206302642822266, "global_step": 362783, "epoch": 2998} {"train_loss": -42.88819885253906, "global_step": 362784, "epoch": 2998} {"train_loss": -42.7909049987793, "global_step": 362785, "epoch": 2998} {"train_loss": -43.78214645385742, "global_step": 362786, "epoch": 2998} {"train_loss": -43.4525260925293, "global_step": 362787, "epoch": 2998} {"train_loss": -44.00905990600586, "global_step": 362788, "epoch": 2998} {"train_loss": -43.47314453125, "global_step": 362789, "epoch": 2998} {"train_loss": -44.26632308959961, "global_step": 362790, "epoch": 2998} {"train_loss": -44.194183349609375, "global_step": 362791, "epoch": 2998} {"train_loss": -44.15207290649414, "global_step": 362792, "epoch": 2998} {"train_loss": -44.95083999633789, "global_step": 362793, "epoch": 2998} {"train_loss": -44.57524871826172, "global_step": 362794, "epoch": 2998} {"train_loss": -43.89822006225586, "global_step": 362795, "epoch": 2998} {"train_loss": -44.45325469970703, "global_step": 362796, "epoch": 2998} {"train_loss": -43.864051818847656, "global_step": 362797, "epoch": 2998} {"train_loss": -44.765235900878906, "global_step": 362798, "epoch": 2998} {"train_loss": -43.87353515625, "global_step": 362799, "epoch": 2998} {"train_loss": -45.054317474365234, "global_step": 362800, "epoch": 2998} {"train_loss": -44.384437561035156, "global_step": 362801, "epoch": 2998} {"train_loss": -44.532711029052734, "global_step": 362802, "epoch": 2998} {"train_loss": -45.441036224365234, "global_step": 362803, "epoch": 2998} {"train_loss": -45.113277435302734, "global_step": 362804, "epoch": 2998} {"train_loss": -45.174434661865234, "global_step": 362805, "epoch": 2998} {"train_loss": -45.21689987182617, "global_step": 362806, "epoch": 2998} {"train_loss": -45.67072296142578, "global_step": 362807, "epoch": 2998} {"train_loss": -44.7563591003418, "global_step": 362808, "epoch": 2998} {"train_loss": -44.830963134765625, "global_step": 362809, "epoch": 2998} {"train_loss": -44.94597244262695, "global_step": 362810, "epoch": 2998} {"train_loss": -44.486846923828125, "global_step": 362811, "epoch": 2998} {"train_loss": -45.2269172668457, "global_step": 362812, "epoch": 2998} {"train_loss": -45.326202392578125, "global_step": 362813, "epoch": 2998} {"train_loss": -45.434410095214844, "global_step": 362814, "epoch": 2998} {"train_loss": -44.6562614440918, "global_step": 362815, "epoch": 2998} {"train_loss": -45.461788177490234, "global_step": 362816, "epoch": 2998} {"train_loss": -45.2482795715332, "global_step": 362817, "epoch": 2998} {"train_loss": -45.43731689453125, "global_step": 362818, "epoch": 2998} {"train_loss": -45.231475830078125, "global_step": 362819, "epoch": 2998} {"train_loss": -45.07434844970703, "global_step": 362820, "epoch": 2998} {"train_loss": -45.2584228515625, "global_step": 362821, "epoch": 2998} {"train_loss": -45.85305404663086, "global_step": 362822, "epoch": 2998} {"train_loss": -45.76481628417969, "global_step": 362823, "epoch": 2998} {"train_loss": -45.842769622802734, "global_step": 362824, "epoch": 2998} {"train_loss": -45.9221305847168, "global_step": 362825, "epoch": 2998} {"train_loss": -45.808162689208984, "global_step": 362826, "epoch": 2998} {"train_loss": -45.959716796875, "global_step": 362827, "epoch": 2998} {"train_loss": -46.15346145629883, "global_step": 362828, "epoch": 2998} {"train_loss": -45.024444580078125, "global_step": 362829, "epoch": 2998} {"train_loss": -45.81362533569336, "global_step": 362830, "epoch": 2998} {"train_loss": -45.772369384765625, "global_step": 362831, "epoch": 2998} {"train_loss": -45.434356689453125, "global_step": 362832, "epoch": 2998} {"train_loss": -45.54592514038086, "global_step": 362833, "epoch": 2998} {"train_loss": -45.298614501953125, "global_step": 362834, "epoch": 2998} {"train_loss": -45.0693359375, "global_step": 362835, "epoch": 2998} {"train_loss": -46.105873107910156, "global_step": 362836, "epoch": 2998} {"train_loss": -44.46889114379883, "global_step": 362837, "epoch": 2998} {"train_loss": -45.669586181640625, "global_step": 362838, "epoch": 2998} {"train_loss": -46.12065887451172, "global_step": 362839, "epoch": 2998} {"train_loss": -45.538116455078125, "global_step": 362840, "epoch": 2998} {"train_loss": -45.658447265625, "global_step": 362841, "epoch": 2998} {"train_loss": -46.029571533203125, "global_step": 362842, "epoch": 2998} {"train_loss": -45.91041946411133, "global_step": 362843, "epoch": 2998} {"train_loss": -46.088111877441406, "global_step": 362844, "epoch": 2998} {"train_loss": -46.49855422973633, "global_step": 362845, "epoch": 2998} {"train_loss": -46.27387237548828, "global_step": 362846, "epoch": 2998} {"train_loss": -46.08864974975586, "global_step": 362847, "epoch": 2998} {"train_loss": -45.43671798706055, "global_step": 362848, "epoch": 2998} {"train_loss": -46.43416976928711, "global_step": 362849, "epoch": 2998} {"train_loss": -45.39363479614258, "global_step": 362850, "epoch": 2998} {"train_loss": -45.84770965576172, "global_step": 362851, "epoch": 2998} {"train_loss": -45.894073486328125, "global_step": 362852, "epoch": 2998} {"train_loss": -44.9280891418457, "global_step": 362853, "epoch": 2998} {"train_loss": -45.778812408447266, "global_step": 362854, "epoch": 2998} {"train_loss": -45.99174880981445, "global_step": 362855, "epoch": 2998} {"train_loss": -45.5617790222168, "global_step": 362856, "epoch": 2998} {"train_loss": -44.8873176574707, "global_step": 362857, "epoch": 2998} {"train_loss": -45.09074401855469, "global_step": 362858, "epoch": 2998} {"train_loss": -46.31334686279297, "global_step": 362859, "epoch": 2998} {"train_loss": -46.25613021850586, "global_step": 362860, "epoch": 2998} {"train_loss": -45.54352951049805, "global_step": 362861, "epoch": 2998} {"train_loss": -45.63361740112305, "global_step": 362862, "epoch": 2998} {"train_loss": -46.320369720458984, "global_step": 362863, "epoch": 2998} {"train_loss": -46.02167892456055, "global_step": 362864, "epoch": 2998} {"train_loss": -46.275447845458984, "global_step": 362865, "epoch": 2998} {"train_loss": -45.78973388671875, "global_step": 362866, "epoch": 2998} {"train_loss": -45.783905029296875, "global_step": 362867, "epoch": 2998} {"train_loss": -45.949562072753906, "global_step": 362868, "epoch": 2998} {"train_loss": -46.36891555786133, "global_step": 362869, "epoch": 2998} {"train_loss": -45.56036376953125, "global_step": 362870, "epoch": 2998} {"train_loss": -46.19258117675781, "global_step": 362871, "epoch": 2998} {"train_loss": -45.94094467163086, "global_step": 362872, "epoch": 2998} {"train_loss": -45.12665557861328, "global_step": 362873, "epoch": 2998} {"train_loss": -45.67988204956055, "global_step": 362874, "epoch": 2998} {"train_loss": -45.68918991088867, "global_step": 362875, "epoch": 2998} {"train_loss": -45.45718002319336, "global_step": 362876, "epoch": 2998} {"train_loss": -45.31901168823242, "global_step": 362877, "epoch": 2998} {"train_loss": -44.974118477056834, "global_step": 362878, "epoch": 2998, "val_loss": 2555473.25} {"train_loss": -45.538265228271484, "global_step": 362879, "epoch": 2999} {"train_loss": -46.13199996948242, "global_step": 362880, "epoch": 2999} {"train_loss": -45.5181884765625, "global_step": 362881, "epoch": 2999} {"train_loss": -45.74125289916992, "global_step": 362882, "epoch": 2999} {"train_loss": -45.45475769042969, "global_step": 362883, "epoch": 2999} {"train_loss": -46.14034652709961, "global_step": 362884, "epoch": 2999} {"train_loss": -45.973243713378906, "global_step": 362885, "epoch": 2999} {"train_loss": -44.082862854003906, "global_step": 362886, "epoch": 2999} {"train_loss": -44.76784896850586, "global_step": 362887, "epoch": 2999} {"train_loss": -42.9233512878418, "global_step": 362888, "epoch": 2999} {"train_loss": -40.90346908569336, "global_step": 362889, "epoch": 2999} {"train_loss": -40.66194534301758, "global_step": 362890, "epoch": 2999} {"train_loss": -45.02047348022461, "global_step": 362891, "epoch": 2999} {"train_loss": -44.44948959350586, "global_step": 362892, "epoch": 2999} {"train_loss": -39.39536666870117, "global_step": 362893, "epoch": 2999} {"train_loss": -42.779632568359375, "global_step": 362894, "epoch": 2999} {"train_loss": -39.98208236694336, "global_step": 362895, "epoch": 2999} {"train_loss": -39.41127014160156, "global_step": 362896, "epoch": 2999} {"train_loss": -38.23439407348633, "global_step": 362897, "epoch": 2999} {"train_loss": -40.23773193359375, "global_step": 362898, "epoch": 2999} {"train_loss": -36.22188186645508, "global_step": 362899, "epoch": 2999} {"train_loss": -39.934505462646484, "global_step": 362900, "epoch": 2999} {"train_loss": -33.56108856201172, "global_step": 362901, "epoch": 2999} {"train_loss": -38.52975082397461, "global_step": 362902, "epoch": 2999} {"train_loss": -36.26792907714844, "global_step": 362903, "epoch": 2999} {"train_loss": -36.08721160888672, "global_step": 362904, "epoch": 2999} {"train_loss": -42.55802536010742, "global_step": 362905, "epoch": 2999} {"train_loss": -36.36898422241211, "global_step": 362906, "epoch": 2999} {"train_loss": -40.695037841796875, "global_step": 362907, "epoch": 2999} {"train_loss": -40.249507904052734, "global_step": 362908, "epoch": 2999} {"train_loss": -39.25166702270508, "global_step": 362909, "epoch": 2999} {"train_loss": -40.57780075073242, "global_step": 362910, "epoch": 2999} {"train_loss": -43.34385299682617, "global_step": 362911, "epoch": 2999} {"train_loss": -38.35713577270508, "global_step": 362912, "epoch": 2999} {"train_loss": -39.34455871582031, "global_step": 362913, "epoch": 2999} {"train_loss": -42.83742904663086, "global_step": 362914, "epoch": 2999} {"train_loss": -40.16761016845703, "global_step": 362915, "epoch": 2999} {"train_loss": -40.14728927612305, "global_step": 362916, "epoch": 2999} {"train_loss": -43.338623046875, "global_step": 362917, "epoch": 2999} {"train_loss": -42.46378707885742, "global_step": 362918, "epoch": 2999} {"train_loss": -41.94259262084961, "global_step": 362919, "epoch": 2999} {"train_loss": -39.22847366333008, "global_step": 362920, "epoch": 2999} {"train_loss": -42.929481506347656, "global_step": 362921, "epoch": 2999} {"train_loss": -42.843353271484375, "global_step": 362922, "epoch": 2999} {"train_loss": -41.331947326660156, "global_step": 362923, "epoch": 2999} {"train_loss": -43.63951110839844, "global_step": 362924, "epoch": 2999} {"train_loss": -43.15424346923828, "global_step": 362925, "epoch": 2999} {"train_loss": -43.02437973022461, "global_step": 362926, "epoch": 2999} {"train_loss": -42.943443298339844, "global_step": 362927, "epoch": 2999} {"train_loss": -44.00624465942383, "global_step": 362928, "epoch": 2999} {"train_loss": -44.33224105834961, "global_step": 362929, "epoch": 2999} {"train_loss": -44.418861389160156, "global_step": 362930, "epoch": 2999} {"train_loss": -43.05195999145508, "global_step": 362931, "epoch": 2999} {"train_loss": -42.78071212768555, "global_step": 362932, "epoch": 2999} {"train_loss": -44.88587951660156, "global_step": 362933, "epoch": 2999} {"train_loss": -42.99634552001953, "global_step": 362934, "epoch": 2999} {"train_loss": -44.436134338378906, "global_step": 362935, "epoch": 2999} {"train_loss": -43.670955657958984, "global_step": 362936, "epoch": 2999} {"train_loss": -44.174800872802734, "global_step": 362937, "epoch": 2999} {"train_loss": -44.72549057006836, "global_step": 362938, "epoch": 2999} {"train_loss": -43.858001708984375, "global_step": 362939, "epoch": 2999} {"train_loss": -44.59560012817383, "global_step": 362940, "epoch": 2999} {"train_loss": -44.51096725463867, "global_step": 362941, "epoch": 2999} {"train_loss": -44.39082336425781, "global_step": 362942, "epoch": 2999} {"train_loss": -44.6574592590332, "global_step": 362943, "epoch": 2999} {"train_loss": -44.53582763671875, "global_step": 362944, "epoch": 2999} {"train_loss": -44.77692794799805, "global_step": 362945, "epoch": 2999} {"train_loss": -44.813201904296875, "global_step": 362946, "epoch": 2999} {"train_loss": -45.50608444213867, "global_step": 362947, "epoch": 2999} {"train_loss": -44.85117721557617, "global_step": 362948, "epoch": 2999} {"train_loss": -45.32891845703125, "global_step": 362949, "epoch": 2999} {"train_loss": -45.2799186706543, "global_step": 362950, "epoch": 2999} {"train_loss": -45.601318359375, "global_step": 362951, "epoch": 2999} {"train_loss": -45.19861602783203, "global_step": 362952, "epoch": 2999} {"train_loss": -45.05418014526367, "global_step": 362953, "epoch": 2999} {"train_loss": -45.28460693359375, "global_step": 362954, "epoch": 2999} {"train_loss": -45.48542404174805, "global_step": 362955, "epoch": 2999} {"train_loss": -45.445159912109375, "global_step": 362956, "epoch": 2999} {"train_loss": -45.53630447387695, "global_step": 362957, "epoch": 2999} {"train_loss": -45.54410934448242, "global_step": 362958, "epoch": 2999} {"train_loss": -45.42338562011719, "global_step": 362959, "epoch": 2999} {"train_loss": -45.5284309387207, "global_step": 362960, "epoch": 2999} {"train_loss": -45.66166305541992, "global_step": 362961, "epoch": 2999} {"train_loss": -45.56593704223633, "global_step": 362962, "epoch": 2999} {"train_loss": -45.19322204589844, "global_step": 362963, "epoch": 2999} {"train_loss": -45.559017181396484, "global_step": 362964, "epoch": 2999} {"train_loss": -45.51329040527344, "global_step": 362965, "epoch": 2999} {"train_loss": -45.920814514160156, "global_step": 362966, "epoch": 2999} {"train_loss": -46.471046447753906, "global_step": 362967, "epoch": 2999} {"train_loss": -45.72170639038086, "global_step": 362968, "epoch": 2999} {"train_loss": -45.438987731933594, "global_step": 362969, "epoch": 2999} {"train_loss": -45.323368072509766, "global_step": 362970, "epoch": 2999} {"train_loss": -45.771846771240234, "global_step": 362971, "epoch": 2999} {"train_loss": -45.38718795776367, "global_step": 362972, "epoch": 2999} {"train_loss": -45.72060012817383, "global_step": 362973, "epoch": 2999} {"train_loss": -45.56779098510742, "global_step": 362974, "epoch": 2999} {"train_loss": -46.12656784057617, "global_step": 362975, "epoch": 2999} {"train_loss": -45.605403900146484, "global_step": 362976, "epoch": 2999} {"train_loss": -45.91252899169922, "global_step": 362977, "epoch": 2999} {"train_loss": -45.452064514160156, "global_step": 362978, "epoch": 2999} {"train_loss": -45.7374267578125, "global_step": 362979, "epoch": 2999} {"train_loss": -46.265560150146484, "global_step": 362980, "epoch": 2999} {"train_loss": -45.46772384643555, "global_step": 362981, "epoch": 2999} {"train_loss": -45.675941467285156, "global_step": 362982, "epoch": 2999} {"train_loss": -46.37081527709961, "global_step": 362983, "epoch": 2999} {"train_loss": -45.36750030517578, "global_step": 362984, "epoch": 2999} {"train_loss": -45.74769973754883, "global_step": 362985, "epoch": 2999} {"train_loss": -45.6212158203125, "global_step": 362986, "epoch": 2999} {"train_loss": -45.25637435913086, "global_step": 362987, "epoch": 2999} {"train_loss": -45.75291061401367, "global_step": 362988, "epoch": 2999} {"train_loss": -45.43769073486328, "global_step": 362989, "epoch": 2999} {"train_loss": -44.438697814941406, "global_step": 362990, "epoch": 2999} {"train_loss": -45.061668395996094, "global_step": 362991, "epoch": 2999} {"train_loss": -45.103858947753906, "global_step": 362992, "epoch": 2999} {"train_loss": -43.7182731628418, "global_step": 362993, "epoch": 2999} {"train_loss": -44.961891174316406, "global_step": 362994, "epoch": 2999} {"train_loss": -46.07798385620117, "global_step": 362995, "epoch": 2999} {"train_loss": -44.86955642700195, "global_step": 362996, "epoch": 2999} {"train_loss": -43.855743408203125, "global_step": 362997, "epoch": 2999} {"train_loss": -42.42353439331055, "global_step": 362998, "epoch": 2999} {"train_loss": -43.6236212864395, "global_step": 362999, "epoch": 2999, "val_loss": 2655276.75}